<?xml version="1.0" encoding="UTF-8"?>
<!-- RSS 1.0 (RDF) feed: recent Pinboard bookmarks from ithkuil. -->
<rdf:RDF xmlns="http://purl.org/rss/1.0/"
         xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#"
         xmlns:content="http://purl.org/rss/1.0/modules/content/"
         xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/"
         xmlns:dc="http://purl.org/dc/elements/1.1/"
         xmlns:cc="http://web.resource.org/cc/"
         xmlns:syn="http://purl.org/rss/1.0/modules/syndication/"
         xmlns:admin="http://webns.net/mvcb/">

  <!-- Channel metadata plus the ordered list of entries. Each rdf:li in the
       rdf:Seq names the rdf:about URI of one item element further down. -->
  <channel rdf:about="http://pinboard.in">
    <title>Pinboard (ithkuil)</title>
    <link>https://pinboard.in/u:ithkuil/public/</link>
    <description>recent bookmarks from ithkuil</description>
    <items>
      <rdf:Seq>
        <rdf:li rdf:resource="http://tomazkovacic.com/blog/14/extracting-article-text-from-html-documents/"/>
        <rdf:li rdf:resource="http://documentcloud.github.com/docsplit/"/>
      </rdf:Seq>
    </items>
  </channel>

  <!-- Bookmark entries. In each item, dc:subject holds the tags as one
       space-separated string and taxo:topics repeats them as one URI per tag. -->

  <!-- This entry carries no description element. -->
  <item rdf:about="http://tomazkovacic.com/blog/14/extracting-article-text-from-html-documents/">
    <title>Overview: Extracting article text from HTML documents | My tech blog.</title>
    <dc:date>2011-03-20T01:37:41+00:00</dc:date>
    <link>http://tomazkovacic.com/blog/14/extracting-article-text-from-html-documents/</link>
    <dc:creator>ithkuil</dc:creator>
    <dc:subject>datamining extraction html text dteam</dc:subject>
    <dc:source>https://pinboard.in/</dc:source>
    <dc:identifier>https://pinboard.in/u:ithkuil/b:ec7f7e0318f1/</dc:identifier>
    <taxo:topics>
      <rdf:Bag>
        <rdf:li rdf:resource="https://pinboard.in/u:ithkuil/t:datamining"/>
        <rdf:li rdf:resource="https://pinboard.in/u:ithkuil/t:extraction"/>
        <rdf:li rdf:resource="https://pinboard.in/u:ithkuil/t:html"/>
        <rdf:li rdf:resource="https://pinboard.in/u:ithkuil/t:text"/>
        <rdf:li rdf:resource="https://pinboard.in/u:ithkuil/t:dteam"/>
      </rdf:Bag>
    </taxo:topics>
  </item>

  <item rdf:about="http://documentcloud.github.com/docsplit/">
    <title>Doc⚡split</title>
    <dc:date>2010-09-16T13:53:48+00:00</dc:date>
    <link>http://documentcloud.github.com/docsplit/</link>
    <dc:creator>ithkuil</dc:creator>
    <description><![CDATA[feature extraction]]></description>
    <dc:subject>pdf ruby extraction</dc:subject>
    <dc:source>https://pinboard.in/</dc:source>
    <dc:identifier>https://pinboard.in/u:ithkuil/b:546a13336ce4/</dc:identifier>
    <taxo:topics>
      <rdf:Bag>
        <rdf:li rdf:resource="https://pinboard.in/u:ithkuil/t:pdf"/>
        <rdf:li rdf:resource="https://pinboard.in/u:ithkuil/t:ruby"/>
        <rdf:li rdf:resource="https://pinboard.in/u:ithkuil/t:extraction"/>
      </rdf:Bag>
    </taxo:topics>
  </item>

</rdf:RDF>