<?xml version="1.0" encoding="UTF-8"?>
 <rdf:RDF xmlns="http://purl.org/rss/1.0/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:cc="http://web.resource.org/cc/" xmlns:syn="http://purl.org/rss/1.0/modules/syndication/" xmlns:admin="http://webns.net/mvcb/">
  <channel rdf:about="http://pinboard.in">
    <title>Pinboard (torsten)</title>
    <link>https://pinboard.in/u:torsten/public/</link>
    <description>recent bookmarks from torsten</description>
    <items>
      <rdf:Seq>	<rdf:li rdf:resource="https://github.com/google/sentencepiece"/>
	<rdf:li rdf:resource="http://spacy.io/"/>
	<rdf:li rdf:resource="https://github.com/explosion/spaCy"/>
	<rdf:li rdf:resource="https://code.google.com/p/word2vec/"/>
	<rdf:li rdf:resource="http://nlp.stanford.edu/projects/glove/"/>
	<rdf:li rdf:resource="http://www.ark.cs.cmu.edu/TweetNLP/"/>
	<rdf:li rdf:resource="http://www.cs.princeton.edu/~blei/topicmodeling.html"/>
	<rdf:li rdf:resource="http://mallet.cs.umass.edu/"/>
	<rdf:li rdf:resource="http://norvig.com/mayzner.html"/>
	<rdf:li rdf:resource="http://en.wikipedia.org/wiki/Tf%E2%80%93idf"/>
	<rdf:li rdf:resource="http://www.commoncrawl.org/"/>
	<rdf:li rdf:resource="http://norvig.com/ngrams/"/>
	<rdf:li rdf:resource="http://www.gutenberg.org/catalog/"/>
	<rdf:li rdf:resource="http://en.wikipedia.org/w/index.php?title=Special:LongPages"/>
      </rdf:Seq>
    </items>
  </channel><item rdf:about="https://github.com/google/sentencepiece">
    <title>sentencepiece – Google</title>
    <dc:date>2021-04-01T01:23:26+00:00</dc:date>
    <link>https://github.com/google/sentencepiece</link>
    <dc:creator>torsten</dc:creator><description><![CDATA[Unsupervised text tokenizer for Neural Network-based text generation.]]></description>
<dc:subject>from:github neural-machine-translation natural-language-processing word-segmentation c++ machine-learning ml nlp google neural networks</dc:subject>
<dc:identifier>https://pinboard.in/u:torsten/b:3e2f0ca30f87/</dc:identifier>
<taxo:topics><rdf:Bag>	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:from:github"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:neural-machine-translation"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:natural-language-processing"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:word-segmentation"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:c++"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:machine-learning"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:ml"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:nlp"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:google"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:neural"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:networks"/>
</rdf:Bag></taxo:topics>
</item>
<item rdf:about="http://spacy.io/">
    <title>spaCy.io | Build Tomorrow's Language Technologies</title>
    <dc:date>2015-09-22T20:36:43+00:00</dc:date>
    <link>http://spacy.io/</link>
    <dc:creator>torsten</dc:creator><dc:subject>language library nlp programming python</dc:subject>
<dc:source>https://pinboard.in/</dc:source>
<dc:identifier>https://pinboard.in/u:torsten/b:2ae584a32e05/</dc:identifier>
<taxo:topics><rdf:Bag>	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:language"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:library"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:nlp"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:programming"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:python"/>
</rdf:Bag></taxo:topics>
</item>
<item rdf:about="https://github.com/explosion/spaCy">
    <title>spaCy – Explosion</title>
    <dc:date>2015-01-26T21:15:14+00:00</dc:date>
    <link>https://github.com/explosion/spaCy</link>
    <dc:creator>torsten</dc:creator><description><![CDATA[💫 Industrial-strength Natural Language Processing (NLP) in Python]]></description>
<dc:subject>from:github natural-language-processing data-science machine-learning python cython nlp artificial-intelligence ai spacy nlp-library</dc:subject>
<dc:identifier>https://pinboard.in/u:torsten/b:a2ea27fdb286/</dc:identifier>
<taxo:topics><rdf:Bag>	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:from:github"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:natural-language-processing"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:data-science"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:machine-learning"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:python"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:cython"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:nlp"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:artificial-intelligence"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:ai"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:spacy"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:nlp-library"/>
</rdf:Bag></taxo:topics>
</item>
<item rdf:about="https://code.google.com/p/word2vec/">
    <title>word2vec - Tool for computing continuous distributed representations of words. - Google Project Hosting</title>
    <dc:date>2015-01-20T17:23:06+00:00</dc:date>
    <link>https://code.google.com/p/word2vec/</link>
    <dc:creator>torsten</dc:creator><dc:subject>google library nlp opensource ml machine learning</dc:subject>
<dc:source>https://pinboard.in/</dc:source>
<dc:identifier>https://pinboard.in/u:torsten/b:f7ae811cd1b7/</dc:identifier>
<taxo:topics><rdf:Bag>	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:google"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:library"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:nlp"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:opensource"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:ml"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:machine"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:learning"/>
</rdf:Bag></taxo:topics>
</item>
<item rdf:about="http://nlp.stanford.edu/projects/glove/">
    <title>GloVe: Global Vectors for Word Representation</title>
    <dc:date>2014-12-23T22:14:25+00:00</dc:date>
    <link>http://nlp.stanford.edu/projects/glove/</link>
    <dc:creator>torsten</dc:creator><dc:subject>ai language ml nlp papers research</dc:subject>
<dc:source>https://pinboard.in/</dc:source>
<dc:identifier>https://pinboard.in/u:torsten/b:77533f6e601e/</dc:identifier>
<taxo:topics><rdf:Bag>	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:ai"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:language"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:ml"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:nlp"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:papers"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:research"/>
</rdf:Bag></taxo:topics>
</item>
<item rdf:about="http://www.ark.cs.cmu.edu/TweetNLP/">
    <title>Twitter Natural Language Processing -- Noah's ARK</title>
    <dc:date>2014-10-23T21:45:15+00:00</dc:date>
    <link>http://www.ark.cs.cmu.edu/TweetNLP/</link>
    <dc:creator>torsten</dc:creator><dc:subject>free java nlp research twitter language speech</dc:subject>
<dc:source>https://pinboard.in/</dc:source>
<dc:identifier>https://pinboard.in/u:torsten/b:bcf7eed87a4d/</dc:identifier>
<taxo:topics><rdf:Bag>	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:free"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:java"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:nlp"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:research"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:twitter"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:language"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:speech"/>
</rdf:Bag></taxo:topics>
</item>
<item rdf:about="http://www.cs.princeton.edu/~blei/topicmodeling.html">
    <title>David M. Blei</title>
    <dc:date>2014-03-26T16:47:06+00:00</dc:date>
    <link>http://www.cs.princeton.edu/~blei/topicmodeling.html</link>
    <dc:creator>torsten</dc:creator><description><![CDATA[Topic modeling
]]></description>
<dc:subject>nlp lda ml machine learning topic modeling models model</dc:subject>
<dc:source>https://pinboard.in/</dc:source>
<dc:identifier>https://pinboard.in/u:torsten/b:2403f21a4bdc/</dc:identifier>
<taxo:topics><rdf:Bag>	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:nlp"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:lda"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:ml"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:machine"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:learning"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:topic"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:modeling"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:models"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:model"/>
</rdf:Bag></taxo:topics>
</item>
<item rdf:about="http://mallet.cs.umass.edu/">
    <title>MALLET homepage</title>
    <dc:date>2014-03-26T14:28:37+00:00</dc:date>
    <link>http://mallet.cs.umass.edu/</link>
    <dc:creator>torsten</dc:creator><dc:subject>datamining java nlp programming machine learning ml</dc:subject>
<dc:source>https://pinboard.in/</dc:source>
<dc:identifier>https://pinboard.in/u:torsten/b:de8ea531bca2/</dc:identifier>
<taxo:topics><rdf:Bag>	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:datamining"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:java"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:nlp"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:programming"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:machine"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:learning"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:ml"/>
</rdf:Bag></taxo:topics>
</item>
<item rdf:about="http://norvig.com/mayzner.html">
    <title>English Letter Frequency Counts: Mayzner Revisited or ETAOIN SRHLDCU</title>
    <dc:date>2013-01-09T19:10:15+00:00</dc:date>
    <link>http://norvig.com/mayzner.html</link>
    <dc:creator>torsten</dc:creator><dc:subject>english nlp statistics data</dc:subject>
<dc:source>https://pinboard.in/</dc:source>
<dc:identifier>https://pinboard.in/u:torsten/b:dde266d6f527/</dc:identifier>
<taxo:topics><rdf:Bag>	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:english"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:nlp"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:statistics"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:data"/>
</rdf:Bag></taxo:topics>
</item>
<item rdf:about="http://en.wikipedia.org/wiki/Tf%E2%80%93idf">
    <title>tf–idf - Wikipedia</title>
    <dc:date>2012-02-05T21:55:48+00:00</dc:date>
    <link>http://en.wikipedia.org/wiki/Tf%E2%80%93idf</link>
    <dc:creator>torsten</dc:creator><description><![CDATA[term frequency–inverse document frequency: how to find relavant terms from a set of overlapping terms]]></description>
<dc:subject>algorithm data datamining nlp wikipedia geo wp</dc:subject>
<dc:source>https://pinboard.in/</dc:source>
<dc:identifier>https://pinboard.in/u:torsten/b:f737fedfbab7/</dc:identifier>
<taxo:topics><rdf:Bag>	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:algorithm"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:data"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:datamining"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:nlp"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:wikipedia"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:geo"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:wp"/>
</rdf:Bag></taxo:topics>
</item>
<item rdf:about="http://www.commoncrawl.org/">
    <title>CommonCrawl | | CommonCrawl</title>
    <dc:date>2011-12-17T18:53:26+00:00</dc:date>
    <link>http://www.commoncrawl.org/</link>
    <dc:creator>torsten</dc:creator><description><![CDATA[a free crawl of the web hosted on amazon s3]]></description>
<dc:subject>open web data crawl nlp opensource ai ml amazon s3</dc:subject>
<dc:source>https://pinboard.in/</dc:source>
<dc:identifier>https://pinboard.in/u:torsten/b:f63d6a73b9f3/</dc:identifier>
<taxo:topics><rdf:Bag>	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:open"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:web"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:data"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:crawl"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:nlp"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:opensource"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:ai"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:ml"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:amazon"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:s3"/>
</rdf:Bag></taxo:topics>
</item>
<item rdf:about="http://norvig.com/ngrams/">
    <title>Natural Language Corpus Data: Beautiful Data</title>
    <dc:date>2011-12-17T17:38:15+00:00</dc:date>
    <link>http://norvig.com/ngrams/</link>
    <dc:creator>torsten</dc:creator><description><![CDATA[contains links to several text corpora for nlp]]></description>
<dc:subject>data language nlp ai ml</dc:subject>
<dc:source>https://pinboard.in/</dc:source>
<dc:identifier>https://pinboard.in/u:torsten/b:dbb03a167a98/</dc:identifier>
<taxo:topics><rdf:Bag>	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:data"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:language"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:nlp"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:ai"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:ml"/>
</rdf:Bag></taxo:topics>
</item>
<item rdf:about="http://www.gutenberg.org/catalog/">
    <title>Online Book Catalog - Overview - Project Gutenberg</title>
    <dc:date>2011-12-17T15:59:08+00:00</dc:date>
    <link>http://www.gutenberg.org/catalog/</link>
    <dc:creator>torsten</dc:creator><dc:subject>data nlp ml ai book books free</dc:subject>
<dc:source>https://pinboard.in/</dc:source>
<dc:identifier>https://pinboard.in/u:torsten/b:33908d4aebc0/</dc:identifier>
<taxo:topics><rdf:Bag>	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:data"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:nlp"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:ml"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:ai"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:book"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:books"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:free"/>
</rdf:Bag></taxo:topics>
</item>
<item rdf:about="http://en.wikipedia.org/w/index.php?title=Special:LongPages">
    <title>Long pages - Wikipedia, the free encyclopedia</title>
    <dc:date>2011-12-17T15:58:29+00:00</dc:date>
    <link>http://en.wikipedia.org/w/index.php?title=Special:LongPages</link>
    <dc:creator>torsten</dc:creator><dc:subject>data wikipedia nlp ml ai</dc:subject>
<dc:source>https://pinboard.in/</dc:source>
<dc:identifier>https://pinboard.in/u:torsten/b:e0896756461b/</dc:identifier>
<taxo:topics><rdf:Bag>	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:data"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:wikipedia"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:nlp"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:ml"/>
	<rdf:li rdf:resource="https://pinboard.in/u:torsten/t:ai"/>
</rdf:Bag></taxo:topics>
</item>
</rdf:RDF>