<?xml version="1.0" encoding="UTF-8"?>
 <rdf:RDF xmlns="http://purl.org/rss/1.0/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:cc="http://web.resource.org/cc/" xmlns:syn="http://purl.org/rss/1.0/modules/syndication/" xmlns:admin="http://webns.net/mvcb/">
  <channel rdf:about="http://pinboard.in">
    <title>Pinboard (duckworth)</title>
    <link>https://pinboard.in/u:duckworth/public/</link>
    <description>recent bookmarks from duckworth</description>
    <!-- Table of contents: each rdf:li below names the rdf:about URI of one item in this feed, in feed order. -->
    <items>
      <rdf:Seq>
        <rdf:li rdf:resource="https://www.crunchydata.com/blog/postgres-full-text-search-a-search-engine-in-a-database"/>
        <rdf:li rdf:resource="https://posthog.com/"/>
        <rdf:li rdf:resource="http://www.opisnet.com/products/retail-fuel-prices-widget.aspx"/>
        <rdf:li rdf:resource="http://multithreaded.stitchfix.com/blog/2016/03/16/engineers-shouldnt-write-etl/"/>
        <rdf:li rdf:resource="http://www.analyticsvidhya.com/blog/2015/12/faster-data-manipulation-7-packages/?platform=hootsuite"/>
        <rdf:li rdf:resource="http://blog.datadive.net/selecting-good-features-part-iii-random-forests/"/>
        <rdf:li rdf:resource="http://chartkick.com/"/>
        <rdf:li rdf:resource="http://engineering.harrys.com/2014/06/09/seed-migrations.html"/>
        <rdf:li rdf:resource="http://www.michael-noll.com/blog/2013/01/18/implementing-real-time-trending-topics-in-storm/"/>
        <rdf:li rdf:resource="https://coderanger.net/2014/02/data-bags/"/>
        <rdf:li rdf:resource="http://www-958.ibm.com/software/analytics/manyeyes/datasets/zip-dma-mapping/versions/1.txt"/>
        <rdf:li rdf:resource="http://beekn.net/"/>
        <rdf:li rdf:resource="http://jeroenjanssens.com/2013/09/19/seven-command-line-tools-for-data-science.html"/>
        <rdf:li rdf:resource="http://type-exit.org/adventures-with-open-source-bi/2010/07/creating-a-basic-mondrian-olap-cube/"/>
        <rdf:li rdf:resource="http://spatialhadoop.cs.umn.edu/"/>
        <rdf:li rdf:resource="http://www.juiceanalytics.com/"/>
        <rdf:li rdf:resource="https://github.com/nathanmarz/storm"/>
        <rdf:li rdf:resource="http://www.slideshare.net/nathanmarz/the-secrets-of-building-realtime-big-data-systems"/>
        <rdf:li rdf:resource="http://persistencejs.org/plugin/sync"/>
        <rdf:li rdf:resource="http://www.cs.usfca.edu/~galles/visualization/Algorithms.html"/>
        <rdf:li rdf:resource="http://www.visual-literacy.org/periodic_table/periodic_table.html#"/>
      </rdf:Seq>
    </items>
  </channel>
<item rdf:about="https://www.crunchydata.com/blog/postgres-full-text-search-a-search-engine-in-a-database">
  <title>Postgres Full-Text Search: A Search Engine in a Database</title>
  <dc:date>2022-07-11T19:59:55+00:00</dc:date>
  <link>https://www.crunchydata.com/blog/postgres-full-text-search-a-search-engine-in-a-database</link>
  <dc:creator>duckworth</dc:creator>
  <dc:subject>data postgres databases search NLP</dc:subject>
  <dc:source>https://pinboard.in/</dc:source>
  <dc:identifier>https://pinboard.in/u:duckworth/b:ac5847006a5c/</dc:identifier>
  <taxo:topics>
    <rdf:Bag>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:data"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:postgres"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:databases"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:search"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:NLP"/>
    </rdf:Bag>
  </taxo:topics>
</item>
<item rdf:about="https://posthog.com/">
  <title>PostHog - Open-Source Product Analytics</title>
  <dc:date>2021-01-22T14:37:59+00:00</dc:date>
  <link>https://posthog.com/</link>
  <dc:creator>duckworth</dc:creator>
  <dc:subject>analytics data api opensource tools</dc:subject>
  <dc:source>https://pinboard.in/</dc:source>
  <dc:identifier>https://pinboard.in/u:duckworth/b:d8191e7d1bf9/</dc:identifier>
  <taxo:topics>
    <rdf:Bag>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:analytics"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:data"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:api"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:opensource"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:tools"/>
    </rdf:Bag>
  </taxo:topics>
</item>
<item rdf:about="http://www.opisnet.com/products/retail-fuel-prices-widget.aspx">
  <title>Retail Fuel Prices Widget | OPIS | Oil Price Information Service</title>
  <dc:date>2016-07-06T20:59:38+00:00</dc:date>
  <link>http://www.opisnet.com/products/retail-fuel-prices-widget.aspx</link>
  <dc:creator>duckworth</dc:creator>
  <dc:subject>feeds data</dc:subject>
  <dc:source>https://pinboard.in/</dc:source>
  <dc:identifier>https://pinboard.in/u:duckworth/b:89bd8cbedbf0/</dc:identifier>
  <taxo:topics>
    <rdf:Bag>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:feeds"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:data"/>
    </rdf:Bag>
  </taxo:topics>
</item>
<item rdf:about="http://multithreaded.stitchfix.com/blog/2016/03/16/engineers-shouldnt-write-etl/">
  <title>Engineers Shouldn’t Write ETL: A Guide to Building a High Functioning Data Science Department | Stitch Fix Technology – Multithreaded</title>
  <dc:date>2016-03-21T19:20:20+00:00</dc:date>
  <link>http://multithreaded.stitchfix.com/blog/2016/03/16/engineers-shouldnt-write-etl/</link>
  <dc:creator>duckworth</dc:creator>
  <dc:subject>culture data etl</dc:subject>
  <dc:source>https://pinboard.in/</dc:source>
  <dc:identifier>https://pinboard.in/u:duckworth/b:092443b615e4/</dc:identifier>
  <taxo:topics>
    <rdf:Bag>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:culture"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:data"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:etl"/>
    </rdf:Bag>
  </taxo:topics>
</item>
<item rdf:about="http://www.analyticsvidhya.com/blog/2015/12/faster-data-manipulation-7-packages/?platform=hootsuite">
  <title>Do Faster Data Manipulation using These 7 R Packages</title>
  <dc:date>2015-12-24T21:34:42+00:00</dc:date>
  <link>http://www.analyticsvidhya.com/blog/2015/12/faster-data-manipulation-7-packages/?platform=hootsuite</link>
  <dc:creator>duckworth</dc:creator>
  <dc:subject>tools R data</dc:subject>
  <dc:identifier>https://pinboard.in/u:duckworth/b:a5cc23858f40/</dc:identifier>
  <taxo:topics>
    <rdf:Bag>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:tools"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:R"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:data"/>
    </rdf:Bag>
  </taxo:topics>
</item>
<item rdf:about="http://blog.datadive.net/selecting-good-features-part-iii-random-forests/">
  <title>Selecting good features – Part III: random forests | Diving into data</title>
  <dc:date>2015-09-10T19:14:14+00:00</dc:date>
  <link>http://blog.datadive.net/selecting-good-features-part-iii-random-forests/</link>
  <dc:creator>duckworth</dc:creator>
  <!-- The description text is kept on one line: whitespace inside the CDATA section is data. -->
  <description><![CDATA[Firstly, feature selection based on impurity reduction is biased towards preferring variables with more categories (see Bias in random forest variable importance measures). Secondly, when the dataset has two (or more) correlated features, then from the point of view of the model, any of these correlated features can be used as the predictor, with no concrete preference of one over the others. But once one of them is used, the importance of others is significantly reduced since effectively the impurity they can remove is already removed by the first feature. As a consequence, they will have a lower reported importance]]></description>
  <dc:subject>python machine-learning data</dc:subject>
  <dc:source>https://pinboard.in/</dc:source>
  <dc:identifier>https://pinboard.in/u:duckworth/b:8e8900fabd69/</dc:identifier>
  <taxo:topics>
    <rdf:Bag>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:python"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:machine-learning"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:data"/>
    </rdf:Bag>
  </taxo:topics>
</item>
<item rdf:about="http://chartkick.com/">
  <title>Chartkick</title>
  <dc:date>2014-07-22T19:28:37+00:00</dc:date>
  <link>http://chartkick.com/</link>
  <dc:creator>duckworth</dc:creator>
  <dc:subject>charts data development javascript ruby</dc:subject>
  <dc:source>https://pinboard.in/</dc:source>
  <dc:identifier>https://pinboard.in/u:duckworth/b:347f9a27e2ca/</dc:identifier>
  <taxo:topics>
    <rdf:Bag>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:charts"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:data"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:development"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:javascript"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:ruby"/>
    </rdf:Bag>
  </taxo:topics>
</item>
<item rdf:about="http://engineering.harrys.com/2014/06/09/seed-migrations.html">
  <title>SeedMigrations. Like schema migrations, but for your data - Harry's Engineering</title>
  <dc:date>2014-06-11T17:38:51+00:00</dc:date>
  <link>http://engineering.harrys.com/2014/06/09/seed-migrations.html</link>
  <dc:creator>duckworth</dc:creator>
  <dc:subject>data migrations rails</dc:subject>
  <dc:source>https://pinboard.in/</dc:source>
  <dc:identifier>https://pinboard.in/u:duckworth/b:51aec1369875/</dc:identifier>
  <taxo:topics>
    <rdf:Bag>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:data"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:migrations"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:rails"/>
    </rdf:Bag>
  </taxo:topics>
</item>
<item rdf:about="http://www.michael-noll.com/blog/2013/01/18/implementing-real-time-trending-topics-in-storm/">
  <title>Implementing Real-Time Trending Topics with a Distributed Rolling Count Algorithm in Storm - Michael G. Noll</title>
  <dc:date>2014-06-09T16:25:39+00:00</dc:date>
  <link>http://www.michael-noll.com/blog/2013/01/18/implementing-real-time-trending-topics-in-storm/</link>
  <dc:creator>duckworth</dc:creator>
  <dc:subject>architecture data development distributed storm</dc:subject>
  <dc:source>https://pinboard.in/</dc:source>
  <dc:identifier>https://pinboard.in/u:duckworth/b:dd293e4b0206/</dc:identifier>
  <taxo:topics>
    <rdf:Bag>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:architecture"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:data"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:development"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:distributed"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:storm"/>
    </rdf:Bag>
  </taxo:topics>
</item>
<item rdf:about="https://coderanger.net/2014/02/data-bags/">
  <title>Data Bags are a Code Smell</title>
  <dc:date>2014-04-30T12:13:35+00:00</dc:date>
  <link>https://coderanger.net/2014/02/data-bags/</link>
  <dc:creator>duckworth</dc:creator>
  <dc:subject>devops data chef api</dc:subject>
  <dc:source>https://pinboard.in/</dc:source>
  <dc:identifier>https://pinboard.in/u:duckworth/b:d17df7efc68d/</dc:identifier>
  <taxo:topics>
    <rdf:Bag>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:devops"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:data"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:chef"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:api"/>
    </rdf:Bag>
  </taxo:topics>
</item>
<item rdf:about="http://www-958.ibm.com/software/analytics/manyeyes/datasets/zip-dma-mapping/versions/1.txt">
  <title>dma to zip mapping</title>
  <dc:date>2014-04-04T19:10:09+00:00</dc:date>
  <link>http://www-958.ibm.com/software/analytics/manyeyes/datasets/zip-dma-mapping/versions/1.txt</link>
  <dc:creator>duckworth</dc:creator>
  <dc:subject>dma zipcode data</dc:subject>
  <dc:source>https://pinboard.in/</dc:source>
  <dc:identifier>https://pinboard.in/u:duckworth/b:85be3e66a8fc/</dc:identifier>
  <taxo:topics>
    <rdf:Bag>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:dma"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:zipcode"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:data"/>
    </rdf:Bag>
  </taxo:topics>
</item>
<item rdf:about="http://beekn.net/">
  <title>BEEKn | Beacons, brands and culture on the Internet of Things</title>
  <dc:date>2014-02-24T23:16:59+00:00</dc:date>
  <link>http://beekn.net/</link>
  <dc:creator>duckworth</dc:creator>
  <dc:subject>bluetooth data ibeacon</dc:subject>
  <dc:source>https://pinboard.in/</dc:source>
  <dc:identifier>https://pinboard.in/u:duckworth/b:e5cf9608a0be/</dc:identifier>
  <taxo:topics>
    <rdf:Bag>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:bluetooth"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:data"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:ibeacon"/>
    </rdf:Bag>
  </taxo:topics>
</item>
<item rdf:about="http://jeroenjanssens.com/2013/09/19/seven-command-line-tools-for-data-science.html">
  <title>7 command-line tools for data science</title>
  <dc:date>2013-09-19T18:31:24+00:00</dc:date>
  <link>http://jeroenjanssens.com/2013/09/19/seven-command-line-tools-for-data-science.html</link>
  <dc:creator>duckworth</dc:creator>
  <dc:subject>json tools data</dc:subject>
  <dc:source>https://pinboard.in/</dc:source>
  <dc:identifier>https://pinboard.in/u:duckworth/b:ea8a2969b03d/</dc:identifier>
  <taxo:topics>
    <rdf:Bag>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:json"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:tools"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:data"/>
    </rdf:Bag>
  </taxo:topics>
</item>
<item rdf:about="http://type-exit.org/adventures-with-open-source-bi/2010/07/creating-a-basic-mondrian-olap-cube/">
  <title>Creating a basic Mondrian OLAP Cube | Adventures with Open Source BI</title>
  <dc:date>2013-06-05T13:47:17+00:00</dc:date>
  <link>http://type-exit.org/adventures-with-open-source-bi/2010/07/creating-a-basic-mondrian-olap-cube/</link>
  <dc:creator>duckworth</dc:creator>
  <dc:subject>data software olap jasper</dc:subject>
  <dc:source>https://pinboard.in/</dc:source>
  <dc:identifier>https://pinboard.in/u:duckworth/b:e74a5e7197c2/</dc:identifier>
  <taxo:topics>
    <rdf:Bag>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:data"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:software"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:olap"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:jasper"/>
    </rdf:Bag>
  </taxo:topics>
</item>
<item rdf:about="http://spatialhadoop.cs.umn.edu/">
  <title>SpatialHadoop</title>
  <dc:date>2013-05-13T17:13:12+00:00</dc:date>
  <link>http://spatialhadoop.cs.umn.edu/</link>
  <dc:creator>duckworth</dc:creator>
  <dc:subject>data hadoop geolocation</dc:subject>
  <dc:source>https://pinboard.in/</dc:source>
  <dc:identifier>https://pinboard.in/u:duckworth/b:0243b8996b87/</dc:identifier>
  <taxo:topics>
    <rdf:Bag>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:data"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:hadoop"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:geolocation"/>
    </rdf:Bag>
  </taxo:topics>
</item>
<item rdf:about="http://www.juiceanalytics.com/">
  <title>Juice Analytics - Your data is meant for action.</title>
  <dc:date>2013-04-05T19:51:12+00:00</dc:date>
  <link>http://www.juiceanalytics.com/</link>
  <dc:creator>duckworth</dc:creator>
  <dc:subject>analytics data design statistics visualization</dc:subject>
  <dc:source>https://pinboard.in/</dc:source>
  <dc:identifier>https://pinboard.in/u:duckworth/b:32c18a08ed0e/</dc:identifier>
  <taxo:topics>
    <rdf:Bag>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:analytics"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:data"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:design"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:statistics"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:visualization"/>
    </rdf:Bag>
  </taxo:topics>
</item>
<item rdf:about="https://github.com/nathanmarz/storm">
  <title>nathanmarz/storm · GitHub</title>
  <dc:date>2012-07-02T14:39:01+00:00</dc:date>
  <link>https://github.com/nathanmarz/storm</link>
  <dc:creator>duckworth</dc:creator>
  <dc:subject>twitter data distributed storm</dc:subject>
  <dc:source>https://pinboard.in/</dc:source>
  <dc:identifier>https://pinboard.in/u:duckworth/b:7ac89844b3fa/</dc:identifier>
  <taxo:topics>
    <rdf:Bag>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:twitter"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:data"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:distributed"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:storm"/>
    </rdf:Bag>
  </taxo:topics>
</item>
<item rdf:about="http://www.slideshare.net/nathanmarz/the-secrets-of-building-realtime-big-data-systems">
  <title>The Secrets of Building Realtime Big Data Systems</title>
  <dc:date>2012-07-02T14:37:36+00:00</dc:date>
  <link>http://www.slideshare.net/nathanmarz/the-secrets-of-building-realtime-big-data-systems</link>
  <dc:creator>duckworth</dc:creator>
  <dc:subject>scaling data scalability</dc:subject>
  <dc:source>https://pinboard.in/</dc:source>
  <dc:identifier>https://pinboard.in/u:duckworth/b:ff276e25a1ac/</dc:identifier>
  <taxo:topics>
    <rdf:Bag>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:scaling"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:data"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:scalability"/>
    </rdf:Bag>
  </taxo:topics>
</item>
<item rdf:about="http://persistencejs.org/plugin/sync">
  <title>plugin:sync [persistence.js]</title>
  <dc:date>2011-11-02T15:09:57+00:00</dc:date>
  <link>http://persistencejs.org/plugin/sync</link>
  <dc:creator>duckworth</dc:creator>
  <dc:subject>javascript data html5 localStorage</dc:subject>
  <dc:source>https://pinboard.in/</dc:source>
  <dc:identifier>https://pinboard.in/u:duckworth/b:7e0fa343784a/</dc:identifier>
  <taxo:topics>
    <rdf:Bag>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:javascript"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:data"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:html5"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:localStorage"/>
    </rdf:Bag>
  </taxo:topics>
</item>
<item rdf:about="http://www.cs.usfca.edu/~galles/visualization/Algorithms.html">
  <title>Data Structure Visualization</title>
  <dc:date>2011-05-02T14:24:40+00:00</dc:date>
  <link>http://www.cs.usfca.edu/~galles/visualization/Algorithms.html</link>
  <dc:creator>duckworth</dc:creator>
  <dc:subject>algorithm algorithms programming visualization data</dc:subject>
  <dc:source>https://pinboard.in/</dc:source>
  <dc:identifier>https://pinboard.in/u:duckworth/b:aae114da42c6/</dc:identifier>
  <taxo:topics>
    <rdf:Bag>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:algorithm"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:algorithms"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:programming"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:visualization"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:data"/>
    </rdf:Bag>
  </taxo:topics>
</item>
<item rdf:about="http://www.visual-literacy.org/periodic_table/periodic_table.html#">
  <title>A Periodic Table of Visualization Methods</title>
  <dc:date>2007-02-02T13:36:03+00:00</dc:date>
  <link>http://www.visual-literacy.org/periodic_table/periodic_table.html#</link>
  <dc:creator>duckworth</dc:creator>
  <dc:subject>data visualization</dc:subject>
  <dc:identifier>https://pinboard.in/u:duckworth/b:9a114f707bfd/</dc:identifier>
  <taxo:topics>
    <rdf:Bag>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:data"/>
      <rdf:li rdf:resource="https://pinboard.in/u:duckworth/t:visualization"/>
    </rdf:Bag>
  </taxo:topics>
</item>
</rdf:RDF>