<?xml version="1.0" encoding="UTF-8"?>
<rss version="2.0"
	xmlns:content="http://purl.org/rss/1.0/modules/content/"
	xmlns:wfw="http://wellformedweb.org/CommentAPI/"
	xmlns:dc="http://purl.org/dc/elements/1.1/"
	xmlns:atom="http://www.w3.org/2005/Atom"
	xmlns:sy="http://purl.org/rss/1.0/modules/syndication/"
	xmlns:slash="http://purl.org/rss/1.0/modules/slash/"
	>

<channel>
	<!-- Channel metadata for the "Parsen" tag feed; atom:link (rel="self") points back at this feed's own URL. -->
	<title>MKUHFUSS &#187; Parsen</title>
	<atom:link href="http://www.mkuhfuss.de/tag/parsen/feed/" rel="self" type="application/rss+xml" />
	<link>http://www.mkuhfuss.de</link>
	<description>Webdesign, SEO, SEM, Programmierung</description>
	<lastBuildDate>Fri, 09 Apr 2010 09:59:03 +0000</lastBuildDate>
	<!-- The channel description and the item text are German, so the feed declares "de" rather than "en". -->
	<language>de</language>
	<!-- Syndication hint for aggregators: one update per hourly period. -->
	<sy:updatePeriod>hourly</sy:updatePeriod>
	<sy:updateFrequency>1</sy:updateFrequency>
	<generator>http://wordpress.org/?v=3.1</generator>
		<item>
		<!-- Item metadata: title, permalink, comments anchor, publication date, author and categories. -->
		<title>Text aus Word extrahieren/parsen</title>
		<link>http://www.mkuhfuss.de/2009/02/text-aus-word-extrahierenparsen/</link>
		<comments>http://www.mkuhfuss.de/2009/02/text-aus-word-extrahierenparsen/#comments</comments>
		<pubDate>Wed, 25 Feb 2009 13:33:07 +0000</pubDate>
		<dc:creator>admin</dc:creator>
		<category>Allgemein</category>
		<category>Parsen</category>
		<category>Word</category>
		<!-- isPermaLink="false": the guid is an identifier for the item, not its permalink. -->
		<guid isPermaLink="false">http://www.mkuhfuss.de/?p=68</guid>
		<description><![CDATA[Um Text aus einem Word-Dokument (.doc) heraus zu extrahieren kann man folgende Funktion verwenden: function read_word&#40;$user_doc&#41; &#123; $file = fopen&#40;$user_doc, &#34;r&#34;&#41;; $input = fread&#40;$file, filesize&#40;$user_doc&#41;&#41;; $zeilen = explode&#40;chr&#40;0x0D&#41;, $input&#41;; $ausgabe = &#34;&#34;; foreach&#40;$zeilen as $einzelzeile&#41;&#123; $pos = strpos&#40;$einzelzeile, chr&#40;0x00&#41;&#41;; if&#40;&#40;$pos !== FALSE&#41;&#124;&#124;&#40;strlen&#40;$einzelzeile&#41;==0&#41;&#41; &#123; &#125; else &#123; &#160; $ausgabe .= $einzelzeile.&#34; &#34;; &#125; &#125; $ausgabe = [...]]]></description>
			<content:encoded><![CDATA[<p>Um Text aus einem Word-Dokument (.doc) zu extrahieren, kann man folgende Funktion verwenden:</p>

<div class="wp_syntax"><div class="code"><pre class="php php" style="font-family:monospace;"><span style="color: #000000; font-weight: bold;">function</span> read_word<span style="color: #009900;">&#40;</span><span style="color: #000088;">$user_doc</span><span style="color: #009900;">&#41;</span> <span style="color: #009900;">&#123;</span>
	<span style="color: #000088;">$file</span> <span style="color: #339933;">=</span> <span style="color: #990000;">fopen</span><span style="color: #009900;">&#40;</span><span style="color: #000088;">$user_doc</span><span style="color: #339933;">,</span> <span style="color: #0000ff;">&quot;r&quot;</span><span style="color: #009900;">&#41;</span>;
	<span style="color: #000088;">$input</span> <span style="color: #339933;">=</span> <span style="color: #990000;">fread</span><span style="color: #009900;">&#40;</span><span style="color: #000088;">$file</span><span style="color: #339933;">,</span> <span style="color: #990000;">filesize</span><span style="color: #009900;">&#40;</span><span style="color: #000088;">$user_doc</span><span style="color: #009900;">&#41;</span><span style="color: #009900;">&#41;</span>;
	<span style="color: #000088;">$zeilen</span> <span style="color: #339933;">=</span> <span style="color: #990000;">explode</span><span style="color: #009900;">&#40;</span><span style="color: #990000;">chr</span><span style="color: #009900;">&#40;</span><span style="color: #208080;">0x0D</span><span style="color: #009900;">&#41;</span><span style="color: #339933;">,</span> <span style="color: #000088;">$input</span><span style="color: #009900;">&#41;</span>;
	<span style="color: #000088;">$ausgabe</span> <span style="color: #339933;">=</span> <span style="color: #0000ff;">&quot;&quot;</span>;
		<span style="color: #b1b100;">foreach</span><span style="color: #009900;">&#40;</span><span style="color: #000088;">$zeilen</span> <span style="color: #b1b100;">as</span> <span style="color: #000088;">$einzelzeile</span><span style="color: #009900;">&#41;</span><span style="color: #009900;">&#123;</span>
		<span style="color: #000088;">$pos</span> <span style="color: #339933;">=</span> <span style="color: #990000;">strpos</span><span style="color: #009900;">&#40;</span><span style="color: #000088;">$einzelzeile</span><span style="color: #339933;">,</span> <span style="color: #990000;">chr</span><span style="color: #009900;">&#40;</span><span style="color: #208080;">0x00</span><span style="color: #009900;">&#41;</span><span style="color: #009900;">&#41;</span>;
			<span style="color: #b1b100;">if</span><span style="color: #009900;">&#40;</span><span style="color: #009900;">&#40;</span><span style="color: #000088;">$pos</span> <span style="color: #339933;">!==</span> <span style="color: #000000; font-weight: bold;">FALSE</span><span style="color: #009900;">&#41;</span>||<span style="color: #009900;">&#40;</span><span style="color: #990000;">strlen</span><span style="color: #009900;">&#40;</span><span style="color: #000088;">$einzelzeile</span><span style="color: #009900;">&#41;</span><span style="color: #339933;">==</span><span style="color:#800080;">0</span><span style="color: #009900;">&#41;</span><span style="color: #009900;">&#41;</span> <span style="color: #009900;">&#123;</span>
			<span style="color: #009900;">&#125;</span> <span style="color: #b1b100;">else</span> <span style="color: #009900;">&#123;</span>
&nbsp;
			<span style="color: #000088;">$ausgabe</span> <span style="color: #339933;">.=</span> <span style="color: #000088;">$einzelzeile</span><span style="color: #339933;">.</span><span style="color: #0000ff;">&quot; &quot;</span>;
			<span style="color: #009900;">&#125;</span>
		<span style="color: #009900;">&#125;</span>	
	<span style="color: #000088;">$ausgabe</span> <span style="color: #339933;">=</span> <span style="color: #990000;">preg_replace</span><span style="color: #009900;">&#40;</span><span style="color: #0000ff;">&quot;/[^a-zA-Z0-9<span style="color: #000099; font-weight: bold;">\s</span><span style="color: #000099; font-weight: bold;">\,</span><span style="color: #000099; font-weight: bold;">\.</span><span style="color: #000099; font-weight: bold;">\-</span><span style="color: #000099; font-weight: bold;">\n</span><span style="color: #000099; font-weight: bold;">\r</span><span style="color: #000099; font-weight: bold;">\t</span>@<span style="color: #000099; font-weight: bold;">\/</span><span style="color: #000099; font-weight: bold;">\_</span><span style="color: #000099; font-weight: bold;">\(</span><span style="color: #000099; font-weight: bold;">\)</span>!]/&quot;</span><span style="color: #339933;">,</span> <span style="color: #0000ff;">&quot;&quot;</span><span style="color: #339933;">,</span> <span style="color: #000088;">$ausgabe</span><span style="color: #009900;">&#41;</span>;
	<span style="color: #b1b100;">return</span> <span style="color: #000088;">$ausgabe</span>;
<span style="color: #009900;">&#125;</span></pre></div></div>

<p>
Der Aufruf erfolgt so:</p>

<div class="wp_syntax"><div class="code"><pre class="php php" style="font-family:monospace;"><span style="color: #000088;">$text</span> <span style="color: #339933;">=</span> read_word<span style="color: #009900;">&#40;</span><span style="color: #0000ff;">&quot;testdoc.doc&quot;</span><span style="color: #009900;">&#41;</span>;</pre></div></div>

<p>
Die Funktion liest den Inhalt der Word-Datei ein und trennt den Inhalt nach einem Zeilenende (0x0D), entfernt alle überflüssigen Zeichen (welche das sein sollen, kann man selber noch mit Hilfe des regulären Ausdruckes in Zeile 13 festlegen; dort genannte Zeichen bleiben im Text erhalten). Anschließend führt die Funktion die Textzeilen aus dem Word-Dokument wieder zusammen. Wie dabei Zeilenumbrüche erhalten bleiben, habe ich leider noch nicht herausgefunden.</p>]]></content:encoded>
			<!-- Comment feed URL for this item (wfw module) and its current comment count (slash module). -->
			<wfw:commentRss>http://www.mkuhfuss.de/2009/02/text-aus-word-extrahierenparsen/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
		</item>
	</channel>
</rss>
<!-- NOTE(review): a block of CSS-hidden spam links (a zero-size div appended after the closing rss tag) was removed here. It placed extra elements after the root and used unquoted attributes, so the feed was not well-formed XML. The generating WordPress site should be audited for a compromised theme or plugin. -->

