<?xml version="1.0" encoding="UTF-8"?>
<?xml-stylesheet type="text/xsl" media="screen" href="/~d/styles/rss2full.xsl"?><?xml-stylesheet type="text/css" media="screen" href="http://feeds.feedburner.com/~d/styles/itemcontent.css"?><rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:wfw="http://wellformedweb.org/CommentAPI/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:atom="http://www.w3.org/2005/Atom" xmlns:sy="http://purl.org/rss/1.0/modules/syndication/" xmlns:slash="http://purl.org/rss/1.0/modules/slash/" xmlns:georss="http://www.georss.org/georss" xmlns:geo="http://www.w3.org/2003/01/geo/wgs84_pos#" xmlns:media="http://search.yahoo.com/mrss/" version="2.0">

<channel>
	<title>The Mendicant Bug</title>
	
	<link>http://mendicantbug.com</link>
	<description>Wanderings into computational linguistics, science, social media and life...</description>
	<lastBuildDate>Sat, 24 Jul 2010 05:30:04 +0000</lastBuildDate>
	<language>en</language>
	<sy:updatePeriod>hourly</sy:updatePeriod>
	<sy:updateFrequency>1</sy:updateFrequency>
	<generator>http://wordpress.com/</generator>
<cloud domain="mendicantbug.com" port="80" path="/?rsscloud=notify" registerProcedure="" protocol="http-post" />
<image>
		<url>http://1.gravatar.com/blavatar/3c73bbb145eaa976335be29004da9868?s=96&amp;d=http%3A%2F%2Fs2.wp.com%2Fi%2Fbuttonw-com.png</url>
		<title>The Mendicant Bug</title>
		<link>http://mendicantbug.com</link>
	</image>
	<atom:link rel="search" type="application/opensearchdescription+xml" href="http://mendicantbug.com/osd.xml" title="The Mendicant Bug" />
	
		<atom10:link xmlns:atom10="http://www.w3.org/2005/Atom" rel="self" type="application/rss+xml" href="http://feeds.feedburner.com/TheMendicantBugComputationalLinguistics" /><feedburner:info xmlns:feedburner="http://rssnamespace.org/feedburner/ext/1.0" uri="themendicantbugcomputationallinguistics" /><atom10:link xmlns:atom10="http://www.w3.org/2005/Atom" rel="hub" href="http://pubsubhubbub.appspot.com/" /><atom10:link xmlns:atom10="http://www.w3.org/2005/Atom" rel="hub" href="http://mendicantbug.com/?pushpress=hub" /><item>
		<title>Simple Random Number Generator Gem</title>
		<link>http://mendicantbug.com/2010/07/24/simple-random-number-generator-gem/</link>
		<comments>http://mendicantbug.com/2010/07/24/simple-random-number-generator-gem/#comments</comments>
		<pubDate>Sat, 24 Jul 2010 05:26:23 +0000</pubDate>
		<dc:creator>Jason Adams</dc:creator>
				<category><![CDATA[Uncategorized]]></category>
		<category><![CDATA[code]]></category>
		<category><![CDATA[math]]></category>
		<category><![CDATA[random number generation]]></category>
		<category><![CDATA[ruby]]></category>
		<category><![CDATA[rubygems]]></category>
		<category><![CDATA[statistics]]></category>

		<guid isPermaLink="false">http://mendicantbug.com/?p=1311</guid>
		<description><![CDATA[I just published the simple-random ruby gem, which is ported from C# code by John D. Cook.  You can view the source on github or install the gem via rubygems: gem install simple-random The gem allows you to sample from the following distributions: Beta Cauchy Chi Square Exponential Gamma Inverse Gamma Laplace (double exponential) Normal Student [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mendicantbug.com&amp;blog=1474857&amp;post=1311&amp;subd=ealdent&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>I just published the <strong>simple-random </strong>ruby gem, which is ported from <a href="http://www.codeproject.com/KB/recipes/SimpleRNG.aspx" target="_blank">C# code</a> by <a href="http://www.johndcook.com/blog/2010/05/03/c-random-number-generation-code/" target="_blank">John D. Cook</a>.  You can view the <a href="http://github.com/ealdent/simple-random" target="_blank">source on github</a> or install the gem via rubygems:</p>
<p style="padding-left:30px;"><code>gem install simple-random</code></p>
<p>The gem allows you to sample from the following distributions:</p>
<ul>
<li>Beta</li>
<li>Cauchy</li>
<li>Chi Square</li>
<li>Exponential</li>
<li>Gamma</li>
<li>Inverse Gamma</li>
<li>Laplace (double exponential)</li>
<li>Normal</li>
<li>Student t</li>
<li>Uniform</li>
<li>Weibull</li>
</ul>
<p>Simple examples:</p>
<p style="padding-left:30px;"><code>require 'rubygems'<br />
require 'simple-random'</code></p>
<p style="padding-left:30px;"><code>r = SimpleRandom.new<br />
r.uniform # =&gt; 0.127064087195322<br />
r.normal(5, 1) # =&gt; 5.71972152940515</code></p>
<br />Filed under: <a href='http://mendicantbug.com/category/uncategorized/'>Uncategorized</a>  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/ealdent.wordpress.com/1311/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/ealdent.wordpress.com/1311/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/ealdent.wordpress.com/1311/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/ealdent.wordpress.com/1311/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/ealdent.wordpress.com/1311/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/ealdent.wordpress.com/1311/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/ealdent.wordpress.com/1311/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/ealdent.wordpress.com/1311/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/ealdent.wordpress.com/1311/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/ealdent.wordpress.com/1311/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/ealdent.wordpress.com/1311/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/ealdent.wordpress.com/1311/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/ealdent.wordpress.com/1311/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/ealdent.wordpress.com/1311/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mendicantbug.com&amp;blog=1474857&amp;post=1311&amp;subd=ealdent&amp;ref=&amp;feed=1" width="1" height="1" />
<p><a href="http://feedads.g.doubleclick.net/~a/AGMeXklWXAzTftvl9VPKHUnkhgc/0/da"><img src="http://feedads.g.doubleclick.net/~a/AGMeXklWXAzTftvl9VPKHUnkhgc/0/di" border="0" ismap="true"></img></a><br/>
<a href="http://feedads.g.doubleclick.net/~a/AGMeXklWXAzTftvl9VPKHUnkhgc/1/da"><img src="http://feedads.g.doubleclick.net/~a/AGMeXklWXAzTftvl9VPKHUnkhgc/1/di" border="0" ismap="true"></img></a></p>]]></content:encoded>
			<wfw:commentRss>http://mendicantbug.com/2010/07/24/simple-random-number-generator-gem/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:content url="http://0.gravatar.com/avatar/ebec6abd2b9f1eb4de865aed01242171?s=96&amp;d=monsterid&amp;r=PG" medium="image">
			<media:title type="html">ealdent</media:title>
		</media:content>
	</item>
		<item>
		<title>War on Attention Poverty</title>
		<link>http://mendicantbug.com/2010/07/14/war-on-attention-poverty/</link>
		<comments>http://mendicantbug.com/2010/07/14/war-on-attention-poverty/#comments</comments>
		<pubDate>Wed, 14 Jul 2010 11:39:05 +0000</pubDate>
		<dc:creator>Jason Adams</dc:creator>
				<category><![CDATA[daniel tunkelang]]></category>
		<category><![CDATA[tunkrank]]></category>
		<category><![CDATA[attention scarcity]]></category>

		<guid isPermaLink="false">http://mendicantbug.com/?p=1307</guid>
		<description><![CDATA[Daniel Tunkelang has posted his slides from his talk at AT&#38;T Labs on TunkRank over at the Noisy Channel. Embedded below for your viewing pleasure:<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mendicantbug.com&amp;blog=1474857&amp;post=1307&amp;subd=ealdent&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p><a href="http://twitter.com/dtunkelang" target="new">Daniel Tunkelang</a> has posted his slides from his talk at AT&amp;T Labs on <a href="http://tunkrank.com">TunkRank</a> over at <a href="http://thenoisychannel.com/2010/07/13/the-war-on-attention-poverty-measuring-twitter-authority/" target="new">the Noisy Channel</a>.  Embedded below for your viewing pleasure:</p>
<p><object type='application/x-shockwave-flash' wmode='opaque' data='http://static.slideshare.net/swf/ssplayer2.swf?id=4749609&#038;doc=waronattentionpoverty-100713213804-phpapp01' width='614' height='503'><param name='movie' value='http://static.slideshare.net/swf/ssplayer2.swf?id=4749609&#038;doc=waronattentionpoverty-100713213804-phpapp01' /><param name='allowFullScreen' value='true' /><param name='allowScriptAccess' value='always' /></object></p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/ealdent.wordpress.com/1307/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/ealdent.wordpress.com/1307/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/ealdent.wordpress.com/1307/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/ealdent.wordpress.com/1307/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/ealdent.wordpress.com/1307/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/ealdent.wordpress.com/1307/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/ealdent.wordpress.com/1307/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/ealdent.wordpress.com/1307/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/ealdent.wordpress.com/1307/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/ealdent.wordpress.com/1307/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/ealdent.wordpress.com/1307/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/ealdent.wordpress.com/1307/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/ealdent.wordpress.com/1307/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/ealdent.wordpress.com/1307/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mendicantbug.com&amp;blog=1474857&amp;post=1307&amp;subd=ealdent&amp;ref=&amp;feed=1" width="1" height="1" />
<p><a href="http://feedads.g.doubleclick.net/~a/GJKnMOlZXSC5Qp1kq4wQ8Y5YpMw/0/da"><img src="http://feedads.g.doubleclick.net/~a/GJKnMOlZXSC5Qp1kq4wQ8Y5YpMw/0/di" border="0" ismap="true"></img></a><br/>
<a href="http://feedads.g.doubleclick.net/~a/GJKnMOlZXSC5Qp1kq4wQ8Y5YpMw/1/da"><img src="http://feedads.g.doubleclick.net/~a/GJKnMOlZXSC5Qp1kq4wQ8Y5YpMw/1/di" border="0" ismap="true"></img></a></p>]]></content:encoded>
			<wfw:commentRss>http://mendicantbug.com/2010/07/14/war-on-attention-poverty/feed/</wfw:commentRss>
		<slash:comments>4</slash:comments>
	
		<media:content url="http://0.gravatar.com/avatar/ebec6abd2b9f1eb4de865aed01242171?s=96&amp;d=monsterid&amp;r=PG" medium="image">
			<media:title type="html">ealdent</media:title>
		</media:content>
	</item>
		<item>
		<title>TunkRank, Meet Tickery</title>
		<link>http://mendicantbug.com/2010/05/05/tunkrank-meet-tickery/</link>
		<comments>http://mendicantbug.com/2010/05/05/tunkrank-meet-tickery/#comments</comments>
		<pubDate>Wed, 05 May 2010 22:30:09 +0000</pubDate>
		<dc:creator>Jason Adams</dc:creator>
				<category><![CDATA[fluiddb]]></category>
		<category><![CDATA[tickery]]></category>
		<category><![CDATA[tunkrank]]></category>
		<category><![CDATA[twitter]]></category>

		<guid isPermaLink="false">http://mendicantbug.com/?p=1294</guid>
		<description><![CDATA[Tickery is a rather awesome application of FluidDB that lets you explore Twitter in a number of ways. I mentioned previously in a post on recent TunkRank improvements that TunkRank scores would soon be integrated with Tickery, and thanks to Terry Jones and his crew, the time is now! Full disclosure: I&#8217;m a fan of FluidDB. [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mendicantbug.com&amp;blog=1474857&amp;post=1294&amp;subd=ealdent&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p style="text-align:justify;"><a href="http://ealdent.files.wordpress.com/2010/05/fi-logo-cropped.png"><img class="alignright size-full wp-image-1297" style="margin-left:4px;margin-bottom:4px;" title="fi-logo-cropped" src="http://ealdent.files.wordpress.com/2010/05/fi-logo-cropped.png?w=200&#038;h=245" alt="" width="200" height="245" /></a><br />
<a href="http://tickery.net" target="_blank">Tickery</a> is a rather awesome application of <a href="http://fluidinfo.com" target="_blank">FluidDB</a> that lets you explore Twitter in a number of ways.  I mentioned previously in a <a href="http://mendicantbug.com/2010/02/17/tunkrank-improvements/">post on recent TunkRank improvements</a> that <a href="http://tunkrank.com" target="_blank">TunkRank</a> scores would soon be integrated with Tickery, and thanks to <a href="http://twitter.com/terrycojones" target="_blank">Terry Jones</a> and his crew, the time is now!</p>
<p style="text-align:justify;">Full disclosure: I&#8217;m a fan of FluidDB.  I think it&#8217;s an awesomely useful technology and concept and I&#8217;m happy that TunkRank scores can be a part of it.  One cool thing is that FluidDB&#8217;s permission system is designed so that even though Tickery is using TunkRank&#8217;s data, TunkRank still owns it.  It can be revoked at any time if there was a reason to do so (not that I can imagine such a thing will ever be the case).  Also, the data in FluidDB for Tickery and TunkRank are completely independent.  Anyone else can come along and add a new set of data for mash-ups that would then use all three, without TunkRank or Tickery having to do a thing.</p>
<h3>Playing around with Tickery</h3>
<p style="text-align:justify;">Now when you use the advanced search on Tickery, you can filter your results by TunkRank score, letting you do some interesting combinations on the data.  For example, if I want to see who I&#8217;m following with TunkRank scores greater than 50:</p>
<p style="padding-left:30px;"><code>has twitter.com/friends/ealdent and tunkrank.com/score &gt; 50</code></p>
<p><a href="http://ealdent.files.wordpress.com/2010/05/picture-9.png"><img class="aligncenter size-full wp-image-1295" title="tickery query results 1" src="http://ealdent.files.wordpress.com/2010/05/picture-9.png?w=547&#038;h=78" alt="" width="547" height="78" /></a></p>
<p style="text-align:justify;">There&#8217;s lots to play around with there, especially when you start comparing the friends of various users.  For example, if you wanted to know who <a href="http://thenoisychannel.com" target="_blank">Daniel Tunkelang</a> (<a href="http://twitter.com/dtunkelang" target="_blank">@dtunkelang</a>) and <a href="http://twitter.com/ealdent">I</a> both follow who have TunkRank scores less than 20:</p>
<p style="padding-left:30px;"><code>has twitter.com/friends/ealdent and<br />
has twitter.com/friends/dtunkelang and<br />
tunkrank.com/score &lt; 20</code></p>
<p><a href="http://ealdent.files.wordpress.com/2010/05/picture-10.png"><img class="aligncenter size-full wp-image-1296" title="tickery query results 2" src="http://ealdent.files.wordpress.com/2010/05/picture-10.png?w=280&#038;h=87" alt="" width="280" height="87" /></a></p>
<p style="text-align:justify;">Those people have something clearly in common, and it tells you something about the interests that Daniel and I share.  I hope you check it out and let me know what you think.</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/ealdent.wordpress.com/1294/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/ealdent.wordpress.com/1294/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/ealdent.wordpress.com/1294/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/ealdent.wordpress.com/1294/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/ealdent.wordpress.com/1294/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/ealdent.wordpress.com/1294/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/ealdent.wordpress.com/1294/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/ealdent.wordpress.com/1294/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/ealdent.wordpress.com/1294/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/ealdent.wordpress.com/1294/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/ealdent.wordpress.com/1294/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/ealdent.wordpress.com/1294/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/ealdent.wordpress.com/1294/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/ealdent.wordpress.com/1294/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mendicantbug.com&amp;blog=1474857&amp;post=1294&amp;subd=ealdent&amp;ref=&amp;feed=1" width="1" height="1" />
<p><a href="http://feedads.g.doubleclick.net/~a/VYUbC5NwTmzRxSsoWM-kHXrPXN0/0/da"><img src="http://feedads.g.doubleclick.net/~a/VYUbC5NwTmzRxSsoWM-kHXrPXN0/0/di" border="0" ismap="true"></img></a><br/>
<a href="http://feedads.g.doubleclick.net/~a/VYUbC5NwTmzRxSsoWM-kHXrPXN0/1/da"><img src="http://feedads.g.doubleclick.net/~a/VYUbC5NwTmzRxSsoWM-kHXrPXN0/1/di" border="0" ismap="true"></img></a></p>]]></content:encoded>
			<wfw:commentRss>http://mendicantbug.com/2010/05/05/tunkrank-meet-tickery/feed/</wfw:commentRss>
		<slash:comments>7</slash:comments>
	
		<media:content url="http://0.gravatar.com/avatar/ebec6abd2b9f1eb4de865aed01242171?s=96&amp;d=monsterid&amp;r=PG" medium="image">
			<media:title type="html">ealdent</media:title>
		</media:content>

		<media:content url="http://ealdent.files.wordpress.com/2010/05/fi-logo-cropped.png" medium="image">
			<media:title type="html">fi-logo-cropped</media:title>
		</media:content>

		<media:content url="http://ealdent.files.wordpress.com/2010/05/picture-9.png" medium="image">
			<media:title type="html">tickery query results 1</media:title>
		</media:content>

		<media:content url="http://ealdent.files.wordpress.com/2010/05/picture-10.png" medium="image">
			<media:title type="html">tickery query results 2</media:title>
		</media:content>
	</item>
		<item>
		<title>Wordnik Gem</title>
		<link>http://mendicantbug.com/2010/03/12/wordnik-gem/</link>
		<comments>http://mendicantbug.com/2010/03/12/wordnik-gem/#comments</comments>
		<pubDate>Sat, 13 Mar 2010 03:49:45 +0000</pubDate>
		<dc:creator>Jason Adams</dc:creator>
				<category><![CDATA[api]]></category>
		<category><![CDATA[dictionaries]]></category>
		<category><![CDATA[erin mckean]]></category>
		<category><![CDATA[ruby]]></category>
		<category><![CDATA[rubygems]]></category>
		<category><![CDATA[wordnik]]></category>

		<guid isPermaLink="false">http://mendicantbug.com/?p=1287</guid>
		<description><![CDATA[I&#8217;ve had my eye on Wordnik for a while, since finding out the excellent lexicographer Erin McKean co-founded it.  Wordnik is the most comprehensive dictionary in the known universe.  Srsly! They released an API a few months ago and I quickly threw together a gem wrapping it, based on HTTParty.  Tonight I updated the gem [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mendicantbug.com&amp;blog=1474857&amp;post=1287&amp;subd=ealdent&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p style="text-align:justify;">
<div id="attachment_1291" class="wp-caption alignright" style="width: 110px"><a href="http://ealdent.files.wordpress.com/2010/03/erin_mckean.jpg"><img class="size-full wp-image-1291" title="Erin_McKean" src="http://ealdent.files.wordpress.com/2010/03/erin_mckean.jpg?w=100&#038;h=155" alt="" width="100" height="155" /></a><p class="wp-caption-text">Erin McKean</p></div>
<p style="text-align:justify;">I&#8217;ve had my eye on <a href="http://wordnik.com" target="_blank">Wordnik</a> for a while, since finding out the excellent lexicographer <a href="http://www.dictionaryevangelist.com/" target="_blank">Erin McKean</a> co-founded it.  Wordnik is the most comprehensive dictionary in the known universe.  Srsly!</p>
<p style="text-align:justify;">They released an API a few months ago and I quickly threw together a gem wrapping it, based on <a href="http://github.com/jnunemaker/httparty" target="_blank">HTTParty</a>.  Tonight I updated the gem for version 3 of the API and simplified it to just a single class with the bare essentials.  You can perform pretty much all of the API calls and get a hash of the results.  It&#8217;s nothing major, but will give you a chance to play around with the Wordnik API with almost no work on your part (aside from getting yourself a key).  This change breaks backwards compatibility completely, sorry.</p>
<p>Example usage:</p>
<p style="padding-left:30px;"><code>w = Wordnik.new("YOUR_API_KEY")<br />
w.define('gem') # =&gt; big hash with all the definitions<br />
w.examples('gem') # =&gt; example sentences using "gem"</code></p>
<p style="text-align:justify;">You can grab the gem off of <a href="http://rubygems.org/gems/wordnik" target="_blank">RubyGems</a> or you can take a look at the source on <a href="http://github.com/ealdent/wordnik" target="_blank">github</a>.  As always, please let me know if you encounter any problems.</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/ealdent.wordpress.com/1287/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/ealdent.wordpress.com/1287/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/ealdent.wordpress.com/1287/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/ealdent.wordpress.com/1287/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/ealdent.wordpress.com/1287/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/ealdent.wordpress.com/1287/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/ealdent.wordpress.com/1287/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/ealdent.wordpress.com/1287/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/ealdent.wordpress.com/1287/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/ealdent.wordpress.com/1287/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/ealdent.wordpress.com/1287/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/ealdent.wordpress.com/1287/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/ealdent.wordpress.com/1287/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/ealdent.wordpress.com/1287/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mendicantbug.com&amp;blog=1474857&amp;post=1287&amp;subd=ealdent&amp;ref=&amp;feed=1" width="1" height="1" />
<p><a href="http://feedads.g.doubleclick.net/~a/jh_GAaTpxq06OhpMIRdATMlYSYo/0/da"><img src="http://feedads.g.doubleclick.net/~a/jh_GAaTpxq06OhpMIRdATMlYSYo/0/di" border="0" ismap="true"></img></a><br/>
<a href="http://feedads.g.doubleclick.net/~a/jh_GAaTpxq06OhpMIRdATMlYSYo/1/da"><img src="http://feedads.g.doubleclick.net/~a/jh_GAaTpxq06OhpMIRdATMlYSYo/1/di" border="0" ismap="true"></img></a></p>]]></content:encoded>
			<wfw:commentRss>http://mendicantbug.com/2010/03/12/wordnik-gem/feed/</wfw:commentRss>
		<slash:comments>1</slash:comments>
	
		<media:content url="http://0.gravatar.com/avatar/ebec6abd2b9f1eb4de865aed01242171?s=96&amp;d=monsterid&amp;r=PG" medium="image">
			<media:title type="html">ealdent</media:title>
		</media:content>

		<media:content url="http://ealdent.files.wordpress.com/2010/03/erin_mckean.jpg" medium="image">
			<media:title type="html">Erin_McKean</media:title>
		</media:content>
	</item>
		<item>
		<title>TunkRank Improvements</title>
		<link>http://mendicantbug.com/2010/02/17/tunkrank-improvements/</link>
		<comments>http://mendicantbug.com/2010/02/17/tunkrank-improvements/#comments</comments>
		<pubDate>Thu, 18 Feb 2010 03:41:51 +0000</pubDate>
		<dc:creator>Jason Adams</dc:creator>
				<category><![CDATA[influence ranking]]></category>
		<category><![CDATA[merb]]></category>
		<category><![CDATA[mysql]]></category>
		<category><![CDATA[postgresql]]></category>
		<category><![CDATA[rails]]></category>
		<category><![CDATA[redis]]></category>
		<category><![CDATA[resque]]></category>
		<category><![CDATA[ruby]]></category>
		<category><![CDATA[tunkrank]]></category>
		<category><![CDATA[twitter]]></category>

		<guid isPermaLink="false">http://mendicantbug.com/?p=1281</guid>
		<description><![CDATA[Over the past few weeks, I&#8217;ve been working on a number of improvements to TunkRank that I will be rolling out tonight. First, I&#8217;ve secured a server to host it on, rather than my old Dell laptop, so reliability should improve and TunkRank is no longer a slave to dynamic DNS problems. Also, my cable [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mendicantbug.com&amp;blog=1474857&amp;post=1281&amp;subd=ealdent&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>Over the past few weeks, I&#8217;ve been working on a number of improvements to <a href="http://tunkrank.com" target="_blank">TunkRank</a> that I will be rolling out tonight.  First, I&#8217;ve secured a server to host it on, rather than my old Dell laptop, so reliability should improve and TunkRank is no longer a slave to dynamic DNS problems.  Also, my cable company is less likely to hunt me down.  TunkRank has gotten some increased attention over the past few weeks, including from <a href="http://twitter.com/cdixon" target="_blank">Chris Dixon</a>, CEO of the wonderful website <a href="http://hunch.com" target="_blank">hunch</a>:</p>
<blockquote><p>Twitter could fix the whole follower obsession by highlighting a more meaningful metric like TunkRank.</p></blockquote>
<p>Awesome!  So with this new version, there are a few changes that will immediately impact you, the end-user.  I&#8217;ll go into the ones that affect you the most first, followed by some technical points of interest for those who care.  Then I&#8217;ll conclude with a couple of hints at the future.</p>
<h3>Changes to TunkRank</h3>
<p>First and foremost, I have changed the main score that is reported.  Previously I was using a percentile in the range (1-100).  This got a lot of objections and created confusion, partially because I consider the 100th percentile to be the &#8220;top-tier&#8221; of users, while standardized testing often reports the 99th percentile to mean you performed better than 99% of the population.  Also, most people who actually care about their scores enough to use TunkRank are in the 95-100 percentile range, making more fine-grained comparisons difficult.  <a href="http://twitter.com/nealrichter" target="_blank">Neal Richter</a> even posted on <a href="http://aicoder.blogspot.com/2009/02/tunkrank-scoring-improvement.html" target="_blank">his blog</a> some suggestions for improving it (quite a while ago, now).</p>
<p>I took a page out of Neal&#8217;s book with the log scores, but I also put it in a range where the most influential twitter user (let&#8217;s call her MAX) will always have a score of 100.  Your TunkRank Score™ is the ratio of the log of your raw score to the log of MAX&#8217;s score.  So formulas aside, this means your TunkRank score is directly comparable to other users and is always in perspective of the maximum influence exerted by any user in the Twitterverse.  Incidentally, comparing users with a difference of seven TunkRank score points means the user with the higher score is about twice as influential.</p>
<p>Accessing the API has also changed slightly, and I apologize to anyone actually using it at the moment.  Basically, I am matching the API calls to more closely conform to the URLs used on the web side, and I&#8217;m returning more information with each call.  TunkRank also supports XML responses in addition to JSON.  You can find all of the documentation <a href="http://tunkrank.com/api" target="_blank">here</a>.</p>
<h3>Some Technical Notes</h3>
<p>As part of the move, I&#8217;ve decided to transition from using <a href="http://merbivore.com" target="_blank">Merb</a> to <a href="http://rubyonrails.org/" target="_blank">Rails</a>.  My original decision to use Merb was partially as a learning exercise, but also because Merb appealed to me with its being lightweight.  However, I often ran into roadblocks because some useful plugin wasn&#8217;t supported (or I couldn&#8217;t figure out how to make it work in the limited time I had).  Sometimes the documentation for Merb was very good and sometimes it was absent altogether.  Rails, on the other hand, has a substantial amount of documentation and people are always blogging about the best way to do things &#8212; which makes life as a developer much easier.  Rails is my day job, so I knew I could transition quickly and easily.</p>
<p>I also migrated from MySQL to PostgreSQL.  The main reason is that I love PostgreSQL &#8212; plain and simple.  They both have their advantages, but MySQL gives me a sense of uneasiness I don&#8217;t have with PostgreSQL.  I&#8217;ve managed to achieve some nice speed improvements as part of the redesign, though that is not to say that the same speed improvements wouldn&#8217;t have been possible with MySQL.</p>
<p>I&#8217;ve also adopted <a href="http://github.com/defunkt/resque" target="_blank">Resque</a> as my background job-processing library.  It is backed by <a href="http://code.google.com/p/redis/" target="_blank">Redis</a>, an advanced key-value store that you can think of as a &#8220;data structures server.&#8221;  The important thing for me is that Resque is fast, has a kick-ass web interface, and integrating with Rails is brain-dead easy.</p>
<h3>The Road Ahead</h3>
<p>I wrote before about the <a href="http://mendicantbug.com/2009/03/06/the-road-ahead-for-tunkrank/" target="_self">road ahead for TunkRank</a>, and I have mostly held to it.  I have many more ideas I want to expand on, including topic-sensitive influence rankings.  I like the ideas in the recent WSDM <a href="http://www.mysmu.edu/staff/jsweng/papers/TwitterRank_WSDM.pdf" target="_blank">paper</a> (pdf) by Weng et al., but I have a few new ideas I&#8217;m eager to try out.  TunkRank scores may also be integrated into <a href="http://tickery.net" target="_blank">Tickery</a> in the near future, thanks to some discussions with <a href="http://twitter.com/terrycojones" target="_blank">Terry Jones</a> of <a href="http://fluidinfo.com" target="_blank">FluidDB</a>.  I&#8217;m excited!</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/ealdent.wordpress.com/1281/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/ealdent.wordpress.com/1281/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/ealdent.wordpress.com/1281/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/ealdent.wordpress.com/1281/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/ealdent.wordpress.com/1281/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/ealdent.wordpress.com/1281/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/ealdent.wordpress.com/1281/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/ealdent.wordpress.com/1281/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/ealdent.wordpress.com/1281/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/ealdent.wordpress.com/1281/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/ealdent.wordpress.com/1281/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/ealdent.wordpress.com/1281/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/ealdent.wordpress.com/1281/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/ealdent.wordpress.com/1281/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mendicantbug.com&amp;blog=1474857&amp;post=1281&amp;subd=ealdent&amp;ref=&amp;feed=1" width="1" height="1" />
<p><a href="http://feedads.g.doubleclick.net/~a/-AC4su6L3bbhFVjMPKtf31QcGW0/0/da"><img src="http://feedads.g.doubleclick.net/~a/-AC4su6L3bbhFVjMPKtf31QcGW0/0/di" border="0" ismap="true"></img></a><br/>
<a href="http://feedads.g.doubleclick.net/~a/-AC4su6L3bbhFVjMPKtf31QcGW0/1/da"><img src="http://feedads.g.doubleclick.net/~a/-AC4su6L3bbhFVjMPKtf31QcGW0/1/di" border="0" ismap="true"></img></a></p>]]></content:encoded>
			<wfw:commentRss>http://mendicantbug.com/2010/02/17/tunkrank-improvements/feed/</wfw:commentRss>
		<slash:comments>5</slash:comments>
	
		<media:content url="http://0.gravatar.com/avatar/ebec6abd2b9f1eb4de865aed01242171?s=96&amp;d=monsterid&amp;r=PG" medium="image">
			<media:title type="html">ealdent</media:title>
		</media:content>
	</item>
		<item>
		<title>Semantifi and the Deep Web</title>
		<link>http://mendicantbug.com/2010/02/06/semantifi-and-the-deep-web/</link>
		<comments>http://mendicantbug.com/2010/02/06/semantifi-and-the-deep-web/#comments</comments>
		<pubDate>Sat, 06 Feb 2010 05:09:22 +0000</pubDate>
		<dc:creator>Jason Adams</dc:creator>
				<category><![CDATA[computational linguistics]]></category>
		<category><![CDATA[natural language processing]]></category>
		<category><![CDATA[search engines]]></category>
		<category><![CDATA[search interfaces]]></category>
		<category><![CDATA[semantic search engine]]></category>
		<category><![CDATA[semantic web]]></category>
		<category><![CDATA[wolfram alpha]]></category>

		<guid isPermaLink="false">http://mendicantbug.com/?p=1277</guid>
		<description><![CDATA[At the Atlanta Semantic Web Meetup tonight, Vishy Dasari gave us a quick description and demo of a new search engine called Semantifi.  They purportedly are a search engine for the deep web, meaning the web that is not indexed by traditional search engines because the content is dynamic.  They are just in the very [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mendicantbug.com&amp;blog=1474857&amp;post=1277&amp;subd=ealdent&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>At the <a href="http://www.meetup.com/The-Atlanta-Semantic-Web-Meetup/" target="_blank">Atlanta Semantic Web Meetup</a> tonight, Vishy Dasari gave us a quick description and demo of a new search engine called <a href="http://semantifi.com" target="_blank">Semantifi</a>.  They purportedly are a search engine for the deep web, meaning the web that is not indexed by traditional search engines because the content is dynamic.  They are just in the very early stages, but have opened the site for people to play with and add data to via &#8220;Apps.&#8221;  These apps are sort of like agents that respond to queries, returning results to some marshal process that decides which App will get the right to answer.  Results are ranked by some method I wasn&#8217;t able to ascertain, but it reminded me of how <a href="http://blog.amyiris.com/2009/06/extending-amy-iris-python.html" target="_blank">Amy Iris</a> works.  These apps form the backbone of the Semantifi system, it seems, and they are crowdsourcing their creation.  You can create a very simple app to return answers on your own data set in a few short minutes.</p>
<p>Perhaps more interesting is that they use a natural language interface in addition to the standard query sort of interface we&#8217;re all used to.  Given the small amount of data currently available, I couldn&#8217;t really determine just how well this interface performs.  It is based on a cognitive theory by John Hawks (sp?) that apparently states we think in terms of patterns.  That&#8217;s very general and I haven&#8217;t been able to chase down that reference &#8212; and I forgot to ask Vishy for more info at the meetup.  If someone can clear that up for me, I&#8217;d be grateful.  The only seemingly relevant <a href="http://johnhawks.net/weblog" target="_blank">John Hawks</a> I could find is a paleoanthropologist, so not sure.  Anyhow, these patterns are what Vishy says the system uses to interpret natural language input.  That may be a grandiose way of saying n-gram matching.</p>
<p>While Wolfram|Alpha is a computational knowledge engine™, Semantifi does not make that claim.  Apps may compute certain things like mortgage values, but it&#8217;s not a general purpose calculator.  However, Semantifi is looking at bringing in unstructured data from blogs and the like, that W|A ignores.  It remains to be seen what that will look like, though.  Also, users can contribute to Semantifi while W|A is a black box.  In any case, they are making interesting claims and I look forward to seeing how they play out with more data.</p>
<p><em>Note: All of my observations are based on notes and memories of tonight&#8217;s presentation, so if I made any mistakes please post corrections in the comments or email me.</em></p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/ealdent.wordpress.com/1277/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/ealdent.wordpress.com/1277/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/ealdent.wordpress.com/1277/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/ealdent.wordpress.com/1277/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/ealdent.wordpress.com/1277/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/ealdent.wordpress.com/1277/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/ealdent.wordpress.com/1277/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/ealdent.wordpress.com/1277/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/ealdent.wordpress.com/1277/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/ealdent.wordpress.com/1277/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/ealdent.wordpress.com/1277/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/ealdent.wordpress.com/1277/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/ealdent.wordpress.com/1277/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/ealdent.wordpress.com/1277/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mendicantbug.com&amp;blog=1474857&amp;post=1277&amp;subd=ealdent&amp;ref=&amp;feed=1" width="1" height="1" />
<p><a href="http://feedads.g.doubleclick.net/~a/sXIQtFBlFhKYBUS8_dh0InTzVdc/0/da"><img src="http://feedads.g.doubleclick.net/~a/sXIQtFBlFhKYBUS8_dh0InTzVdc/0/di" border="0" ismap="true"></img></a><br/>
<a href="http://feedads.g.doubleclick.net/~a/sXIQtFBlFhKYBUS8_dh0InTzVdc/1/da"><img src="http://feedads.g.doubleclick.net/~a/sXIQtFBlFhKYBUS8_dh0InTzVdc/1/di" border="0" ismap="true"></img></a></p>]]></content:encoded>
			<wfw:commentRss>http://mendicantbug.com/2010/02/06/semantifi-and-the-deep-web/feed/</wfw:commentRss>
		<slash:comments>1</slash:comments>
	
		<media:content url="http://0.gravatar.com/avatar/ebec6abd2b9f1eb4de865aed01242171?s=96&amp;d=monsterid&amp;r=PG" medium="image">
			<media:title type="html">ealdent</media:title>
		</media:content>
	</item>
		<item>
		<title>Unintentional HCIR commercial</title>
		<link>http://mendicantbug.com/2009/11/07/unintentional-hcir-commercial/</link>
		<comments>http://mendicantbug.com/2009/11/07/unintentional-hcir-commercial/#comments</comments>
		<pubDate>Sun, 08 Nov 2009 02:54:50 +0000</pubDate>
		<dc:creator>Jason Adams</dc:creator>
				<category><![CDATA[advertising]]></category>
		<category><![CDATA[commercials]]></category>
		<category><![CDATA[faceted search]]></category>
		<category><![CDATA[hcir]]></category>

		<guid isPermaLink="false">http://mendicantbug.com/?p=1275</guid>
		<description><![CDATA[This commercial just caught my eye and made me think about faceted search.<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mendicantbug.com&amp;blog=1474857&amp;post=1275&amp;subd=ealdent&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p style="text-align:justify;">This commercial just caught my eye and made me think about faceted search.</p>
<p><span style="text-align:center; display: block;"><a href="http://mendicantbug.com/2009/11/07/unintentional-hcir-commercial/"><img src="http://img.youtube.com/vi/N8yWjJXbaPA/2.jpg" alt="" /></a></span></p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/ealdent.wordpress.com/1275/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/ealdent.wordpress.com/1275/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/ealdent.wordpress.com/1275/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/ealdent.wordpress.com/1275/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/ealdent.wordpress.com/1275/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/ealdent.wordpress.com/1275/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/ealdent.wordpress.com/1275/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/ealdent.wordpress.com/1275/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/ealdent.wordpress.com/1275/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/ealdent.wordpress.com/1275/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/ealdent.wordpress.com/1275/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/ealdent.wordpress.com/1275/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/ealdent.wordpress.com/1275/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/ealdent.wordpress.com/1275/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mendicantbug.com&amp;blog=1474857&amp;post=1275&amp;subd=ealdent&amp;ref=&amp;feed=1" width="1" height="1" />
<p><a href="http://feedads.g.doubleclick.net/~a/dtV6Ar9sSoK_5WeQrhuYPrdDi08/0/da"><img src="http://feedads.g.doubleclick.net/~a/dtV6Ar9sSoK_5WeQrhuYPrdDi08/0/di" border="0" ismap="true"></img></a><br/>
<a href="http://feedads.g.doubleclick.net/~a/dtV6Ar9sSoK_5WeQrhuYPrdDi08/1/da"><img src="http://feedads.g.doubleclick.net/~a/dtV6Ar9sSoK_5WeQrhuYPrdDi08/1/di" border="0" ismap="true"></img></a></p>]]></content:encoded>
			<wfw:commentRss>http://mendicantbug.com/2009/11/07/unintentional-hcir-commercial/feed/</wfw:commentRss>
		<slash:comments>1</slash:comments>
	
		<media:content url="http://0.gravatar.com/avatar/ebec6abd2b9f1eb4de865aed01242171?s=96&amp;d=monsterid&amp;r=PG" medium="image">
			<media:title type="html">ealdent</media:title>
		</media:content>

		<media:content url="http://img.youtube.com/vi/N8yWjJXbaPA/2.jpg" medium="image" />
	</item>
		<item>
		<title>Daedalpumpkin</title>
		<link>http://mendicantbug.com/2009/10/31/daedalpumpkin/</link>
		<comments>http://mendicantbug.com/2009/10/31/daedalpumpkin/#comments</comments>
		<pubDate>Sat, 31 Oct 2009 20:08:40 +0000</pubDate>
		<dc:creator>Jason Adams</dc:creator>
				<category><![CDATA[beagles]]></category>
		<category><![CDATA[halloween]]></category>
		<category><![CDATA[pumpkins]]></category>

		<guid isPermaLink="false">http://mendicantbug.com/?p=1271</guid>
		<description><![CDATA[We decided to do a complicated pumpkin design this year and it turned out surprisingly well!  I present, the Daedalpumpkin: &#160; &#160; &#160;<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mendicantbug.com&amp;blog=1474857&amp;post=1271&amp;subd=ealdent&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p style="text-align:justify;">We decided to do a complicated pumpkin design this year and it turned out surprisingly well!  I present, the Daedalpumpkin:</p>
<p>&nbsp;</p>
<div id="attachment_1272" class="wp-caption aligncenter" style="width: 580px"><a href="http://ealdent.files.wordpress.com/2009/10/s1052134.jpg"><img class="size-full wp-image-1272" title="The Daedalpumpkin" src="http://ealdent.files.wordpress.com/2009/10/s1052134.jpg?w=570&#038;h=427" alt="The Daedalpumpkin" width="570" height="427" /></a><p class="wp-caption-text">The Daedalpumpkin</p></div>
<p>&nbsp;</p>
<p>&nbsp;</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/ealdent.wordpress.com/1271/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/ealdent.wordpress.com/1271/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/ealdent.wordpress.com/1271/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/ealdent.wordpress.com/1271/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/ealdent.wordpress.com/1271/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/ealdent.wordpress.com/1271/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/ealdent.wordpress.com/1271/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/ealdent.wordpress.com/1271/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/ealdent.wordpress.com/1271/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/ealdent.wordpress.com/1271/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/ealdent.wordpress.com/1271/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/ealdent.wordpress.com/1271/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/ealdent.wordpress.com/1271/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/ealdent.wordpress.com/1271/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mendicantbug.com&amp;blog=1474857&amp;post=1271&amp;subd=ealdent&amp;ref=&amp;feed=1" width="1" height="1" />
<p><a href="http://feedads.g.doubleclick.net/~a/NJSUfianGBk_xhd6X7Rcm6gOaQQ/0/da"><img src="http://feedads.g.doubleclick.net/~a/NJSUfianGBk_xhd6X7Rcm6gOaQQ/0/di" border="0" ismap="true"></img></a><br/>
<a href="http://feedads.g.doubleclick.net/~a/NJSUfianGBk_xhd6X7Rcm6gOaQQ/1/da"><img src="http://feedads.g.doubleclick.net/~a/NJSUfianGBk_xhd6X7Rcm6gOaQQ/1/di" border="0" ismap="true"></img></a></p>]]></content:encoded>
			<wfw:commentRss>http://mendicantbug.com/2009/10/31/daedalpumpkin/feed/</wfw:commentRss>
		<slash:comments>1</slash:comments>
	
		<media:content url="http://0.gravatar.com/avatar/ebec6abd2b9f1eb4de865aed01242171?s=96&amp;d=monsterid&amp;r=PG" medium="image">
			<media:title type="html">ealdent</media:title>
		</media:content>

		<media:content url="http://ealdent.files.wordpress.com/2009/10/s1052134.jpg" medium="image">
			<media:title type="html">The Daedalpumpkin</media:title>
		</media:content>
	</item>
		<item>
		<title>NLP Resources for Ruby</title>
		<link>http://mendicantbug.com/2009/09/13/nlp-resources-for-ruby/</link>
		<comments>http://mendicantbug.com/2009/09/13/nlp-resources-for-ruby/#comments</comments>
		<pubDate>Sun, 13 Sep 2009 06:28:02 +0000</pubDate>
		<dc:creator>Jason Adams</dc:creator>
				<category><![CDATA[python]]></category>
		<category><![CDATA[computational linguistics]]></category>
		<category><![CDATA[java]]></category>
		<category><![CDATA[natural language processing]]></category>
		<category><![CDATA[nlp]]></category>
		<category><![CDATA[ruby]]></category>
		<category><![CDATA[stemmers]]></category>
		<category><![CDATA[wordnet]]></category>
		<category><![CDATA[parsers]]></category>

		<guid isPermaLink="false">http://mendicantbug.com/?p=1268</guid>
		<description><![CDATA[There are quite a few well-known libraries for doing various NLP tasks in Java and Python, such as the Stanford Parser (Java) and the Natural Language Toolkit (Python).  For Ruby, there are a few resources out there, but they are usually derivative or not as mature.  By derivative, I mean they are ports from other [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mendicantbug.com&amp;blog=1474857&amp;post=1268&amp;subd=ealdent&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p style="text-align:justify;">There are quite a few well-known libraries for doing various NLP tasks in Java and Python, such as the Stanford Parser (Java) and the Natural Language Toolkit (Python).  For Ruby, there are a few resources out there, but they are usually derivative or not as mature.  By derivative, I mean they are ports from other languages or extensions using code from another language.  And I&#8217;m responsible for two of them! :)</p>
<ul>
<li><span style="background-color:#ffffff;"><a href="http://www.deveiate.org/projects/Linguistics/" target="_blank">Ruby Linguistics</a> &#8211; this is one of the more ambitious projects, but is not as mature as NLTK</span>
<ul>
<li><span style="background-color:#ffffff;">interface for WordNet</span></li>
<li><span style="background-color:#ffffff;">Link grammar parser</span></li>
<li><span style="background-color:#ffffff;">some inflection stuff</span></li>
</ul>
</li>
<li><a href="http://rubyforge.org/projects/stanfordparser/" target="_blank">Stanford Parser</a> interface &#8211; uses a Java bridge to access the Stanford Parser library</li>
<li><a href="http://www.markwatson.com/" target="_blank">Mark Watson</a> has a <a href="http://www.markwatson.com/opensource/rubytagger_0.1.1.zip" target="_blank">part of speech tagger</a> [zip], a <a href="http://www.markwatson.com/opensource/rubyreuters_0.1.zip" target="_blank">text categorizer</a> [zip], and <a href="http://www.markwatson.com/opensource/ruby_read_docs.zip" target="_blank">some text extraction utilities</a> [zip], but I haven&#8217;t tried to use them yet</li>
<li><a href="http://github.com/ealdent/lda-ruby" target="_blank">LDA Ruby Gem</a> &#8211; Ruby port of David Blei&#8217;s lda-c library by yours truly
<ul>
<li>Uses Blei&#8217;s c-code for the actual LDA but I include some wrappers to make using it a bit easier</li>
</ul>
</li>
<li><a href="http://github.com/ealdent/uea-stemmer" target="_blank">UEA Stemmer</a> &#8211; Ruby port (again by yours truly) of a conservative stemmer based on Jenkins and Smith&#8217;s <a href="http://www.uea.ac.uk/cmp/research/graphicsvisionspeech/speech/WordStemming" target="_blank">UEA Stemmer</a></li>
<li><a href="http://rubyforge.org/projects/stemmer/" target="_blank">Stemmer gem</a> &#8211; <a href="http://tartarus.org/~martin/PorterStemmer/" target="_blank">Porter stemmer</a></li>
<li><a href="http://www.locknet.ro/projects/ann-ruby-stemmer" target="_blank">Lingua Stemmer</a> &#8211; another stemming library, Porter stemmer</li>
<li><a href="http://www.deveiate.org/projects/Ruby-WordNet/" target="_blank">Ruby WordNet</a> &#8211; basically what&#8217;s included in Ruby Linguistics</li>
<li><a href="http://sourceforge.net/projects/raspell/" target="_blank">Raspell</a> &#8211; Ruby interface to Aspell spell checker</li>
</ul>
<p style="text-align:justify;">There are also a number of fledgling or orphaned projects out there purporting to be ports or interfaces for various other libraries like the Stanford POS Tagger and Named Entity Recognizer.  Ruby (straight Ruby, not just JRuby) can interface with just about any Java library using the <a href="http://rjb.rubyforge.org/" target="_blank">Ruby Java Bridge</a> (RJB).  RJB can be a pain, and I could only initialize it once per run (a second attempt never succeeds), so there are some limitations.  But using it, I was able to easily interface with the Stanford POS tagger.</p>
<p style="text-align:justify;">So while there aren&#8217;t terribly many libraries for NLP tasks in Ruby, the availability of interfacing with Java directly widens the scope quite a bit.  You can also incorporate a c library using extensions.</p>
<p style="text-align:justify;">Naturally, if I missed anything, no matter how small, please let me know.</p>
<p style="text-align:justify;"><em>Update:</em> Here is a great list of <a href="http://web.media.mit.edu/~dustin/papers/ai_ruby_plugins/" target="_blank">AI-related ruby libraries</a> from Dustin Smith.</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/ealdent.wordpress.com/1268/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/ealdent.wordpress.com/1268/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/ealdent.wordpress.com/1268/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/ealdent.wordpress.com/1268/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/ealdent.wordpress.com/1268/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/ealdent.wordpress.com/1268/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/ealdent.wordpress.com/1268/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/ealdent.wordpress.com/1268/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/ealdent.wordpress.com/1268/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/ealdent.wordpress.com/1268/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/ealdent.wordpress.com/1268/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/ealdent.wordpress.com/1268/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/ealdent.wordpress.com/1268/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/ealdent.wordpress.com/1268/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mendicantbug.com&amp;blog=1474857&amp;post=1268&amp;subd=ealdent&amp;ref=&amp;feed=1" width="1" height="1" />
<p><a href="http://feedads.g.doubleclick.net/~a/jRGWGvgVf3axzTlBbfSaadPAqJQ/0/da"><img src="http://feedads.g.doubleclick.net/~a/jRGWGvgVf3axzTlBbfSaadPAqJQ/0/di" border="0" ismap="true"></img></a><br/>
<a href="http://feedads.g.doubleclick.net/~a/jRGWGvgVf3axzTlBbfSaadPAqJQ/1/da"><img src="http://feedads.g.doubleclick.net/~a/jRGWGvgVf3axzTlBbfSaadPAqJQ/1/di" border="0" ismap="true"></img></a></p>]]></content:encoded>
			<wfw:commentRss>http://mendicantbug.com/2009/09/13/nlp-resources-for-ruby/feed/</wfw:commentRss>
		<slash:comments>6</slash:comments>
	
		<media:content url="http://0.gravatar.com/avatar/ebec6abd2b9f1eb4de865aed01242171?s=96&amp;d=monsterid&amp;r=PG" medium="image">
			<media:title type="html">ealdent</media:title>
		</media:content>
	</item>
		<item>
		<title>Books and movies</title>
		<link>http://mendicantbug.com/2009/08/16/books-and-movies/</link>
		<comments>http://mendicantbug.com/2009/08/16/books-and-movies/#comments</comments>
		<pubDate>Mon, 17 Aug 2009 04:02:13 +0000</pubDate>
		<dc:creator>Jason Adams</dc:creator>
				<category><![CDATA[adaptations]]></category>
		<category><![CDATA[books]]></category>
		<category><![CDATA[douglas adams]]></category>
		<category><![CDATA[movies]]></category>
		<category><![CDATA[time traveler's wife]]></category>

		<guid isPermaLink="false">http://mendicantbug.com/?p=1264</guid>
		<description><![CDATA[This post contains NO spoilers. I saw The Time Traveler&#8217;s Wife with my wife today.  I had read the book about a year ago, and had been looking forward to the movie.  I wasn&#8217;t disappointed &#8212; I thought the movie was very moving and captured the spirit of the book, even if it didn&#8217;t capture [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mendicantbug.com&amp;blog=1474857&amp;post=1264&amp;subd=ealdent&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p style="text-align:justify;"><em>This post contains NO spoilers.</em></p>
<p style="text-align:justify;">I saw <em><a href="http://www.imdb.com/title/tt0452694/" target="_blank">The Time Traveler&#8217;s Wife</a></em> with my wife today.  I had read <a onclick="return mugicPopWin(this,event);" oncontextmenu="mugicRightClick(this);" href="http://www.amazon.com/gp/product/015602943X?ie=UTF8&amp;tag=themenbug-20&amp;linkCode=as2&amp;camp=1789&amp;creative=390957&amp;creativeASIN=015602943X" target="_blank">the book</a> about a year ago, and had been looking forward to the movie.  I wasn&#8217;t disappointed &#8212; I thought the movie was very moving and captured the spirit of the book, even if it didn&#8217;t capture everything.  It ignored some dynamics that the book elaborated on and some scenes and details were slightly different.</p>
<p style="text-align:justify;">One thing I was concerned about while watching the movie was just how much I was liking it because I knew all the background in the book, or how much came from the movie.  If the former was true, then the movie wasn&#8217;t going to be that great an experience for someone who hadn&#8217;t read the book.  If the latter was true, then it was a damn good movie.  I don&#8217;t have the answer to that.</p>
<p style="text-align:justify;">Another concern is how it&#8217;s a cultural norm in our society to bash movies based on books, and yet to relentlessly watch them to the point that Hollywood feels compelled to turn every book that sells a few copies <a href="http://www.imdb.com/title/tt1001508/" target="_blank">into one</a>.  Douglas Adams once made the point that he changed the story of the Hitchhiker&#8217;s Guide to the Galaxy to match the medium he was writing it for.  A story that plays well on the radio can take advantage of completely different things when it is translated to book or movie form.  I don&#8217;t have the exact quote and searching for that kind of thing is damn near impossible on Google (let me know if you find it).</p>
<p style="text-align:justify;">But that&#8217;s an observation I have long taken to heart when watching movies translated from books.  Obviously you can&#8217;t fit an entire book into 2 hours and still have a story that tells like anything worth watching.  You can&#8217;t capture the full power of every scene, every nuance, nor every subtlety that a book can.  That&#8217;s not what the silver screen does well.  What it does well (when it is done right) is making you feel in touch with characters and the story.  Books do that too, but movies actually put the images before your eyes.</p>
<p style="text-align:justify;">That said, I have never been able to bring myself to read a book based on a movie.  I just can&#8217;t do it.</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/ealdent.wordpress.com/1264/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/ealdent.wordpress.com/1264/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/ealdent.wordpress.com/1264/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/ealdent.wordpress.com/1264/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/ealdent.wordpress.com/1264/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/ealdent.wordpress.com/1264/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/ealdent.wordpress.com/1264/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/ealdent.wordpress.com/1264/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/ealdent.wordpress.com/1264/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/ealdent.wordpress.com/1264/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/ealdent.wordpress.com/1264/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/ealdent.wordpress.com/1264/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/ealdent.wordpress.com/1264/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/ealdent.wordpress.com/1264/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mendicantbug.com&amp;blog=1474857&amp;post=1264&amp;subd=ealdent&amp;ref=&amp;feed=1" width="1" height="1" />
<p><a href="http://feedads.g.doubleclick.net/~a/KCUlaUeNFu4-R6egpOUILJoC5WQ/0/da"><img src="http://feedads.g.doubleclick.net/~a/KCUlaUeNFu4-R6egpOUILJoC5WQ/0/di" border="0" ismap="true"></img></a><br/>
<a href="http://feedads.g.doubleclick.net/~a/KCUlaUeNFu4-R6egpOUILJoC5WQ/1/da"><img src="http://feedads.g.doubleclick.net/~a/KCUlaUeNFu4-R6egpOUILJoC5WQ/1/di" border="0" ismap="true"></img></a></p>]]></content:encoded>
			<wfw:commentRss>http://mendicantbug.com/2009/08/16/books-and-movies/feed/</wfw:commentRss>
		<slash:comments>2</slash:comments>
	
		<media:content url="http://0.gravatar.com/avatar/ebec6abd2b9f1eb4de865aed01242171?s=96&amp;d=monsterid&amp;r=PG" medium="image">
			<media:title type="html">ealdent</media:title>
		</media:content>
	</item>
		<item>
		<title>Next total solar eclipse in Atlanta</title>
		<link>http://mendicantbug.com/2009/08/04/next-total-solar-eclipse-in-atlanta/</link>
		<comments>http://mendicantbug.com/2009/08/04/next-total-solar-eclipse-in-atlanta/#comments</comments>
		<pubDate>Wed, 05 Aug 2009 00:10:09 +0000</pubDate>
		<dc:creator>Jason Adams</dc:creator>
				<category><![CDATA[astronomy]]></category>
		<category><![CDATA[futureme]]></category>
		<category><![CDATA[solar eclipse]]></category>
		<category><![CDATA[wolfram alpha]]></category>

		<guid isPermaLink="false">http://mendicantbug.com/?p=1259</guid>
		<description><![CDATA[I already knew Wolfram&#124;Alpha could do some cool astronomy calculations, like comparing the escape velocities of the Galilean moons.  A recent W&#124;A blog post also pointed out that you can calculate the next lunar eclipse.  So I tried to see when the next solar eclipse would be for my area and it came up with [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mendicantbug.com&amp;blog=1474857&amp;post=1259&amp;subd=ealdent&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p style="text-align:justify;">I already knew <a href="http://wolframalpha.com" target="_blank">Wolfram|Alpha</a> could do some cool astronomy calculations, like comparing the <a href="http://www83.wolframalpha.com/input/?i=galilean+moons+escape+velocity" target="_blank">escape velocities of the Galilean moons</a>.  A recent <a href="http://blog.wolframalpha.com/2009/08/03/exploring-our-solar-system-with-wolframalpha/" target="_blank">W|A blog post</a> also pointed out that you can calculate the next lunar eclipse.  So I tried to see when the next <em>solar</em> eclipse would be for my area and it came up with a partial solar eclipse in 2014.  Skip that and go to the next and it turns out there&#8217;s going to be <a href="http://www67.wolframalpha.com/input/?i=solar+eclipse+in+alpharetta,+ga+after+2015" target="_blank">a decent one</a> in 2017.  As a reminder, I sent an email to myself via <a href="http://www.futureme.org/" target="_blank">FutureMe</a>.  It&#8217;ll be interesting to see if a) I&#8217;m still using Gmail in 8 years, b) FutureMe is still around sending emails, and c) we can still see the sun.  Man, I love W|A.</p>
<div id="attachment_1260" class="wp-caption aligncenter" style="width: 509px"><a href="http://ealdent.files.wordpress.com/2009/08/picture-3.png"><img class="size-full wp-image-1260" title="Picture 3" src="http://ealdent.files.wordpress.com/2009/08/picture-3.png?w=499&#038;h=423" alt="Total solar eclipse in 2017" width="499" height="423" /></a><p class="wp-caption-text">Total solar eclipse in 2017</p></div>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/ealdent.wordpress.com/1259/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/ealdent.wordpress.com/1259/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/ealdent.wordpress.com/1259/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/ealdent.wordpress.com/1259/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/ealdent.wordpress.com/1259/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/ealdent.wordpress.com/1259/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/ealdent.wordpress.com/1259/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/ealdent.wordpress.com/1259/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/ealdent.wordpress.com/1259/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/ealdent.wordpress.com/1259/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/ealdent.wordpress.com/1259/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/ealdent.wordpress.com/1259/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/ealdent.wordpress.com/1259/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/ealdent.wordpress.com/1259/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mendicantbug.com&amp;blog=1474857&amp;post=1259&amp;subd=ealdent&amp;ref=&amp;feed=1" width="1" height="1" />
<p><a href="http://feedads.g.doubleclick.net/~a/LC9qc8WKWbVgbvci07RShE1Jxd0/0/da"><img src="http://feedads.g.doubleclick.net/~a/LC9qc8WKWbVgbvci07RShE1Jxd0/0/di" border="0" ismap="true"></img></a><br/>
<a href="http://feedads.g.doubleclick.net/~a/LC9qc8WKWbVgbvci07RShE1Jxd0/1/da"><img src="http://feedads.g.doubleclick.net/~a/LC9qc8WKWbVgbvci07RShE1Jxd0/1/di" border="0" ismap="true"></img></a></p>]]></content:encoded>
			<wfw:commentRss>http://mendicantbug.com/2009/08/04/next-total-solar-eclipse-in-atlanta/feed/</wfw:commentRss>
		<slash:comments>1</slash:comments>
	
		<media:content url="http://0.gravatar.com/avatar/ebec6abd2b9f1eb4de865aed01242171?s=96&amp;d=monsterid&amp;r=PG" medium="image">
			<media:title type="html">ealdent</media:title>
		</media:content>

		<media:content url="http://ealdent.files.wordpress.com/2009/08/picture-3.png" medium="image">
			<media:title type="html">Picture 3</media:title>
		</media:content>
	</item>
		<item>
		<title>Java maps and sorting</title>
		<link>http://mendicantbug.com/2009/08/01/java-maps-and-sorting/</link>
		<comments>http://mendicantbug.com/2009/08/01/java-maps-and-sorting/#comments</comments>
		<pubDate>Sun, 02 Aug 2009 03:42:49 +0000</pubDate>
		<dc:creator>Jason Adams</dc:creator>
				<category><![CDATA[algorithms]]></category>
		<category><![CDATA[code]]></category>
		<category><![CDATA[collections]]></category>
		<category><![CDATA[java]]></category>
		<category><![CDATA[programming]]></category>
		<category><![CDATA[sorting]]></category>

		<guid isPermaLink="false">http://mendicantbug.com/?p=1250</guid>
		<description><![CDATA[I&#8217;m always a little annoyed I have to implement sorting Map keys by their values myself in Java.  It seems like they should be a part of the standard Collections library or something.  Maybe they are and I just haven&#8217;t seen it?  My solution (gist) is based on feedback from Josh in the comments to [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mendicantbug.com&amp;blog=1474857&amp;post=1250&amp;subd=ealdent&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p style="text-align:justify;">I&#8217;m always a little annoyed I have to implement sorting <code>Map</code> keys by their values myself in Java.  It seems like they should be a part of the standard <code>Collections</code> library or something.  Maybe they are and I just haven&#8217;t seen it?  <a href="http://gist.github.com/159913" target="_blank">My solution</a> (gist) is based on feedback from <a href="http://www.humphrelia.bluegosling.com/author/josh" target="_blank">Josh</a> in the comments to <a href="http://mendicantbug.com/2007/09/18/merge-sort-fun/" target="_self">a previous post</a>. <span style="font-family:Georgia, 'Times New Roman', 'Bitstream Charter', Times, serif;line-height:19px;white-space:normal;font-size:13px;">How does that look to you?</span></p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/ealdent.wordpress.com/1250/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/ealdent.wordpress.com/1250/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/ealdent.wordpress.com/1250/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/ealdent.wordpress.com/1250/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/ealdent.wordpress.com/1250/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/ealdent.wordpress.com/1250/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/ealdent.wordpress.com/1250/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/ealdent.wordpress.com/1250/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/ealdent.wordpress.com/1250/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/ealdent.wordpress.com/1250/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/ealdent.wordpress.com/1250/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/ealdent.wordpress.com/1250/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/ealdent.wordpress.com/1250/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/ealdent.wordpress.com/1250/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mendicantbug.com&amp;blog=1474857&amp;post=1250&amp;subd=ealdent&amp;ref=&amp;feed=1" width="1" height="1" />
<p><a href="http://feedads.g.doubleclick.net/~a/R-e3K5z3NjK8hIMRoJoo48MTU6g/0/da"><img src="http://feedads.g.doubleclick.net/~a/R-e3K5z3NjK8hIMRoJoo48MTU6g/0/di" border="0" ismap="true"></img></a><br/>
<a href="http://feedads.g.doubleclick.net/~a/R-e3K5z3NjK8hIMRoJoo48MTU6g/1/da"><img src="http://feedads.g.doubleclick.net/~a/R-e3K5z3NjK8hIMRoJoo48MTU6g/1/di" border="0" ismap="true"></img></a></p>]]></content:encoded>
			<wfw:commentRss>http://mendicantbug.com/2009/08/01/java-maps-and-sorting/feed/</wfw:commentRss>
		<slash:comments>6</slash:comments>
	
		<media:content url="http://0.gravatar.com/avatar/ebec6abd2b9f1eb4de865aed01242171?s=96&amp;d=monsterid&amp;r=PG" medium="image">
			<media:title type="html">ealdent</media:title>
		</media:content>
	</item>
		<item>
		<title>Lazyfeed: the missing link in the evolution of RSS?</title>
		<link>http://mendicantbug.com/2009/08/01/lazyfeed-the-missing-link-in-the-evolution-of-rss/</link>
		<comments>http://mendicantbug.com/2009/08/01/lazyfeed-the-missing-link-in-the-evolution-of-rss/#comments</comments>
		<pubDate>Sat, 01 Aug 2009 13:00:09 +0000</pubDate>
		<dc:creator>Jason Adams</dc:creator>
				<category><![CDATA[computational linguistics]]></category>
		<category><![CDATA[exploratory search]]></category>
		<category><![CDATA[google alerts]]></category>
		<category><![CDATA[information trapping]]></category>
		<category><![CDATA[invites]]></category>
		<category><![CDATA[lazyfeed]]></category>
		<category><![CDATA[recommender system]]></category>
		<category><![CDATA[rss]]></category>
		<category><![CDATA[topic detection]]></category>

		<guid isPermaLink="false">http://mendicantbug.com/?p=1240</guid>
		<description><![CDATA[When Lazyfeed announced a limited round of beta invites on TechCrunch, I admit, I lusted after them.  Only 250?  I wanted to be one!  But alas, I was put on the waiting list.  It&#8217;s a decent marketing strategy for building up some hype.  When I finally did get my invite, I tried them out for [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mendicantbug.com&amp;blog=1474857&amp;post=1240&amp;subd=ealdent&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p style="text-align:justify;">When <a href="http://www.lazyfeed.com" target="_blank">Lazyfeed</a> announced a limited round of beta invites on <a href="http://www.techcrunch.com/2009/07/10/lazyfeed-wakes-up-%E2%80%94-and-we-have-invites/" target="_blank">TechCrunch</a>, I admit, I lusted after them.  Only 250?  I wanted to be one!  But alas, I was put on the waiting list.  It&#8217;s a decent marketing strategy for building up some hype.  When I finally did get my invite, I tried them out for about 5 minutes and fell prey to the distractions of the internet.  That was a bad sign, though.  Usually a new service can hold my attention for a little while longer.  So what happened?</p>
<h3>Lazy-wha?</h3>
<p style="text-align:justify;">Lazyfeed is a service that lets you enter topics, blogs, twitter, delicious and flickr accounts to form a live streaming <em>lazyfeed</em>.  You then get live updates in the form of your tags being updated.  Your main screen consists of a bunch of boxes with your topics and then things it guesses are related.</p>
<h3>The hook</h3>
<p style="text-align:justify;">Lazyfeed&#8217;s marketing strategy succeeded again by giving me three invites to hand out to friends.  I offered them on <a class="zem_slink" title="Twitter" rel="homepage" href="http://twitter.com">Twitter</a>, having only one person bite.  So here are the other two invites for the adventurous.  Get em while they&#8217;re hot.  If you manage to take one, please comment that you did so, so that I can at least know who you were and we can save someone else the wasted time.  I&#8217;m just throwing them into the ether like this because I don&#8217;t feel like pushing them on Twitter again.</p>
<blockquote><p><span style="text-decoration:line-through;">NTI1MzMxMjc5ZVhmUTl5cDBiek1R<br />
</span><span style="text-decoration:line-through;"> OTk5MTUwNjczN3JCLklmZHhjMDdV</span></p></blockquote>
<h3>The rub</h3>
<p style="text-align:justify;">Lazyfeed is a lovely service in terms of appearance and ajaxy goodness, but my initial impression is that it ends up being streaming <a class="zem_slink" title="Information overload" rel="wikipedia" href="http://en.wikipedia.org/wiki/Information_overload">information overload</a>.  For one, the topic suggestion feature appears to be fairly naive.  Someone correct me if I&#8217;m wrong, but it looks a bit like document similarity for topics is done purely by one-for-one matching on tags.  Whatever the method, the result of their suggested topics (&#8220;Stuff for Lazy Jason&#8221;) is stuff like the following:</p>
<div id="attachment_1241" class="wp-caption aligncenter" style="width: 510px"><a href="http://ealdent.files.wordpress.com/2009/08/picture-1.png"><img class="size-full wp-image-1241" title="Lazyfeed sample results" src="http://ealdent.files.wordpress.com/2009/08/picture-1.png?w=500&#038;h=287" alt="Lazyfeed sample results" width="500" height="287" /></a><p class="wp-caption-text">Lazyfeed sample suggested topics</p></div>
<p style="text-align:justify;">Granted, it&#8217;s a hard problem, but those results are pretty bad.  So as I started to write this post lambasting this service, I considered that maybe I was just seeing cold-start problems, and I was being unfair.  So I trained it with some additional feeds and topics that are straight-to-the-point of stuff I&#8217;m interested in, like <em>sigir2009</em>, <em>topicmodeling</em>, <em>recommendersystems</em>, etc.  Tags can contain no spaces, btw, which is why those don&#8217;t.  When I tried using dashes, like I often do on delicious, it gives no results.  I also removed some things that were too general or contained too many spurious results.</p>
<h3>The light</h3>
<p style="text-align:justify;">Things started improving here, and I actually began to understand what the point of Lazyfeed is.  My initial confusion was that &#8220;Stuff for Lazy Jason&#8221; is stuff that I would want to read right now.  Being lazy, I didn&#8217;t expect to have to do work to get those things.  But &#8220;Stuff for Lazy Jason&#8221; is a list of topics it thinks I might be interested in.  Saving any one of those puts it into my lazyfeed, which is in the bar on the left.</p>
<div id="attachment_1242" class="wp-caption aligncenter" style="width: 510px"><a href="http://ealdent.files.wordpress.com/2009/08/picture-2.png"><img class="size-full wp-image-1242" title="My lazyfeed topics" src="http://ealdent.files.wordpress.com/2009/08/picture-2.png?w=500&#038;h=375" alt="My lazyfeed topics" width="500" height="375" /></a><p class="wp-caption-text">My lazyfeed topics</p></div>
<p style="text-align:justify;">So now what happens is that occasionally it discovers something new related to my interests and it bumps that category to the top of the list and turns it bold again (grayed out topics have been read).  Most of my topics are low traffic, so add something like <em>mariahcarey</em> if you want to see this functionality in action.  Now we&#8217;re getting somewhere.  It has actually started being helpful and has found me some stuff that my Google alerts haven&#8217;t.  Which is weird, and is making me think I need to double check to make sure my Google alerts are working&#8230;</p>
<h3>The end</h3>
<p style="text-align:justify;">My takeaway after using Lazyfeed for nigh on two hours is that it&#8217;s an interesting alternative (or even extension) to <a class="zem_slink" title="RSS" rel="wikipedia" href="http://en.wikipedia.org/wiki/RSS">RSS</a>, but one that still hasn&#8217;t crossed the bridge to the next stage in evolution.  The idea is solid.  Automatically discover stuff in the sea of human knowledge (or human idiocy) and serve it up fresh.  The implementation lacks robust topic detection which is unfortunately going to be necessary unless it is to become another source of information overload rather than a useful stream of relevant information. Relevance is an ephemeral thing, given that your information needs change from day to day.  Lazyfeed makes it pretty easy to get rid of old topics and add new ones, even if some of their suggestions are still wonky.  It&#8217;s an interesting recommender system problem with a lot of potential.</p>
<div class="zemanta-pixie" style="margin-top:10px;height:15px;"><a class="zemanta-pixie-a" title="Reblog this post [with Zemanta]" href="http://reblog.zemanta.com/zemified/403d8746-534f-461c-8872-df09ca6433c9/"><img class="zemanta-pixie-img" style="border:medium none;float:right;" src="http://img.zemanta.com/reblog_c.png?x-id=403d8746-534f-461c-8872-df09ca6433c9" alt="Reblog this post [with Zemanta]" /></a></div>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/ealdent.wordpress.com/1240/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/ealdent.wordpress.com/1240/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/ealdent.wordpress.com/1240/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/ealdent.wordpress.com/1240/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/ealdent.wordpress.com/1240/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/ealdent.wordpress.com/1240/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/ealdent.wordpress.com/1240/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/ealdent.wordpress.com/1240/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/ealdent.wordpress.com/1240/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/ealdent.wordpress.com/1240/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/ealdent.wordpress.com/1240/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/ealdent.wordpress.com/1240/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/ealdent.wordpress.com/1240/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/ealdent.wordpress.com/1240/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mendicantbug.com&amp;blog=1474857&amp;post=1240&amp;subd=ealdent&amp;ref=&amp;feed=1" width="1" height="1" />
<p><a href="http://feedads.g.doubleclick.net/~a/S2xclZ5JpFeYAvZ8FdrTHuH3g10/0/da"><img src="http://feedads.g.doubleclick.net/~a/S2xclZ5JpFeYAvZ8FdrTHuH3g10/0/di" border="0" ismap="true"></img></a><br/>
<a href="http://feedads.g.doubleclick.net/~a/S2xclZ5JpFeYAvZ8FdrTHuH3g10/1/da"><img src="http://feedads.g.doubleclick.net/~a/S2xclZ5JpFeYAvZ8FdrTHuH3g10/1/di" border="0" ismap="true"></img></a></p>]]></content:encoded>
			<wfw:commentRss>http://mendicantbug.com/2009/08/01/lazyfeed-the-missing-link-in-the-evolution-of-rss/feed/</wfw:commentRss>
		<slash:comments>5</slash:comments>
	
		<media:content url="http://0.gravatar.com/avatar/ebec6abd2b9f1eb4de865aed01242171?s=96&amp;d=monsterid&amp;r=PG" medium="image">
			<media:title type="html">ealdent</media:title>
		</media:content>

		<media:content url="http://ealdent.files.wordpress.com/2009/08/picture-1.png" medium="image">
			<media:title type="html">Lazyfeed sample results</media:title>
		</media:content>

		<media:content url="http://ealdent.files.wordpress.com/2009/08/picture-2.png" medium="image">
			<media:title type="html">My lazyfeed topics</media:title>
		</media:content>

		<media:content url="http://img.zemanta.com/reblog_c.png?x-id=403d8746-534f-461c-8872-df09ca6433c9" medium="image">
			<media:title type="html">Reblog this post [with Zemanta]</media:title>
		</media:content>
	</item>
		<item>
		<title>Github announces recommender system contest</title>
		<link>http://mendicantbug.com/2009/07/30/github-announces-recommender-system-contest/</link>
		<comments>http://mendicantbug.com/2009/07/30/github-announces-recommender-system-contest/#comments</comments>
		<pubDate>Fri, 31 Jul 2009 03:28:39 +0000</pubDate>
		<dc:creator>Jason Adams</dc:creator>
				<category><![CDATA[contests]]></category>
		<category><![CDATA[recommender systems]]></category>
		<category><![CDATA[netflix prize]]></category>
		<category><![CDATA[github]]></category>

		<guid isPermaLink="false">http://mendicantbug.com/?p=1237</guid>
		<description><![CDATA[Github just announced their own version of the Netflix Prize.  Instead of predicting movie ratings, Github wants you to suggest repositories for users to watch.  This is different from the Netflix Prize in a number of ways: a user watching a repo is similar to a user visiting a page from a search engine &#8211; [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mendicantbug.com&amp;blog=1474857&amp;post=1237&amp;subd=ealdent&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p style="text-align:justify;"><a href="http://github.com" target="_blank">Github</a> just announced <a href="http://contest.github.com/" target="_blank">their own version</a> of the <a href="http://netflixprize.com" target="_blank">Netflix Prize</a>.  Instead of predicting movie ratings, Github wants you to suggest repositories for users to watch.  This is different from the Netflix Prize in a number of ways:</p>
<ol>
<li>a user watching a repo is similar to a user visiting a page from a search engine &#8211; they are implicit endorsements (we assume that doing so means the user actually likes the repo)</li>
<li>we are predicting the likelihood of a user wanting to watch a repo (binary event), rather than how much a user likes a movie</li>
<li>the data set is a lot smaller, and <a href="http://en.wikipedia.org/wiki/Sparse_matrix" target="_blank">sparsity</a> is a LOT greater (the matrix is 0.006% filled vs. Netflix 1% filled)</li>
<li>you get multiple tries!  they let you pick 10 repos that user may watch and as long as one of them matches, you get credit for it</li>
</ol>
<p style="text-align:justify;">Already there have been many submissions.  The number one place is currently held by Daniel Haran with 46.9% guessed correctly.  Happy hunting, if you decide to compete.</p>
<p>The prizes are a bottle of Pappy van Winkle bourbon and a large Github account for life.  The bottle of Pappy is making me consider competing.</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/ealdent.wordpress.com/1237/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/ealdent.wordpress.com/1237/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/ealdent.wordpress.com/1237/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/ealdent.wordpress.com/1237/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/ealdent.wordpress.com/1237/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/ealdent.wordpress.com/1237/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/ealdent.wordpress.com/1237/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/ealdent.wordpress.com/1237/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/ealdent.wordpress.com/1237/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/ealdent.wordpress.com/1237/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/ealdent.wordpress.com/1237/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/ealdent.wordpress.com/1237/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/ealdent.wordpress.com/1237/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/ealdent.wordpress.com/1237/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mendicantbug.com&amp;blog=1474857&amp;post=1237&amp;subd=ealdent&amp;ref=&amp;feed=1" width="1" height="1" />
<p><a href="http://feedads.g.doubleclick.net/~a/lKKQHt7GB_Ayn7dxNiN4XIE9gBY/0/da"><img src="http://feedads.g.doubleclick.net/~a/lKKQHt7GB_Ayn7dxNiN4XIE9gBY/0/di" border="0" ismap="true"></img></a><br/>
<a href="http://feedads.g.doubleclick.net/~a/lKKQHt7GB_Ayn7dxNiN4XIE9gBY/1/da"><img src="http://feedads.g.doubleclick.net/~a/lKKQHt7GB_Ayn7dxNiN4XIE9gBY/1/di" border="0" ismap="true"></img></a></p>]]></content:encoded>
			<wfw:commentRss>http://mendicantbug.com/2009/07/30/github-announces-recommender-system-contest/feed/</wfw:commentRss>
		<slash:comments>1</slash:comments>
	
		<media:content url="http://0.gravatar.com/avatar/ebec6abd2b9f1eb4de865aed01242171?s=96&amp;d=monsterid&amp;r=PG" medium="image">
			<media:title type="html">ealdent</media:title>
		</media:content>
	</item>
		<item>
		<title>Updates to lda-ruby gem</title>
		<link>http://mendicantbug.com/2009/07/30/updates-to-lda-ruby-gem/</link>
		<comments>http://mendicantbug.com/2009/07/30/updates-to-lda-ruby-gem/#comments</comments>
		<pubDate>Fri, 31 Jul 2009 02:20:25 +0000</pubDate>
		<dc:creator>Jason Adams</dc:creator>
				<category><![CDATA[c]]></category>
		<category><![CDATA[computational linguistics]]></category>
		<category><![CDATA[latent dirichlet allocation]]></category>
		<category><![CDATA[lda]]></category>
		<category><![CDATA[machine learning]]></category>
		<category><![CDATA[nlp]]></category>
		<category><![CDATA[ruby]]></category>
		<category><![CDATA[rubygems]]></category>
		<category><![CDATA[topic modeling]]></category>

		<guid isPermaLink="false">http://mendicantbug.com/?p=1230</guid>
		<description><![CDATA[A while back I ported David Blei&#8217;s lda-c code for performing Latent Dirichlet Allocation to Ruby.  Basically I just wrapped the C methods in a Ruby class, turned it into a gem, and called it a day.  The result was a bit ugly and unwieldy, like most research code.  A few months later, Todd Fisher [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mendicantbug.com&amp;blog=1474857&amp;post=1230&amp;subd=ealdent&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p style="text-align:justify;"><a href="http://ealdent.files.wordpress.com/2009/07/works-on-my-machine-starburst.jpg"><img class="alignright size-full wp-image-1232" style="margin:3px 4px;" title="works-on-my-machine-starburst" src="http://ealdent.files.wordpress.com/2009/07/works-on-my-machine-starburst.jpg?w=150&#038;h=145" alt="works-on-my-machine-starburst" width="150" height="145" /></a>A while back <a href="http://mendicantbug.com/2008/11/17/lda-in-ruby/" target="_self">I ported</a> David Blei&#8217;s <a href="http://www.cs.princeton.edu/~blei/lda-c/" target="_blank">lda-c</a> code for performing <a class="zem_slink" title="Latent Dirichlet allocation" rel="wikipedia" href="http://en.wikipedia.org/wiki/Latent_Dirichlet_allocation">Latent Dirichlet Allocation</a> to <a class="zem_slink" title="Ruby (programming language)" rel="homepage" href="http://www.ruby-lang.org/">Ruby</a>.  Basically I just wrapped the C methods in a Ruby class, turned it into <a href="http://github.com/ealdent/lda-ruby" target="_blank">a gem</a>, and called it a day.  The result was a bit ugly and unwieldy, like most research code.  A few months later, <a href="http://github.com/taf2" target="_blank">Todd Fisher</a> came along and discovered a couple bugs and memory leaks in the C code, for which I am very grateful.  I had been toying with the idea of improving the Ruby code, and embarked on a mission to do so.  The result is a hopefully much cleaner <a class="zem_slink" title="RubyGems" rel="homepage" href="http://docs.rubygems.org">gem</a> that can be used right out of the box with little screwing around.</p>
<p style="text-align:justify;">Unfortunately, I did something I&#8217;m ashamed of.  Ruby gems are notorious for breaking backwards compatibility, and I have done just that.  The good news is, your code will almost work, assuming you didn&#8217;t start diving into the Document and Corpus classes too heavily.  If you did, then you will probably experience a lot of breakage.  The result, I hope, is a more sensible implementation, however, so maybe you won&#8217;t hate me.  Of course, I could be wrong and my implementation is still crap.  If that&#8217;s the case, please let me know what needs to be improved.</p>
<p>To install the gem:</p>
<p style="padding-left:30px;"><code>gem sources -a http://gems.github.com<br />
sudo gem install ealdent-lda-ruby</code></p>
<p>Enjoy!</p>
<div class="zemanta-pixie" style="margin-top:10px;height:15px;"><a class="zemanta-pixie-a" title="Reblog this post [with Zemanta]" href="http://reblog.zemanta.com/zemified/f6bb550a-b4f1-4af6-bcde-fabdba98ad7a/"><img class="zemanta-pixie-img" style="border:medium none;float:right;" src="http://img.zemanta.com/reblog_c.png?x-id=f6bb550a-b4f1-4af6-bcde-fabdba98ad7a" alt="Reblog this post [with Zemanta]" /></a></div>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/ealdent.wordpress.com/1230/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/ealdent.wordpress.com/1230/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/ealdent.wordpress.com/1230/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/ealdent.wordpress.com/1230/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/ealdent.wordpress.com/1230/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/ealdent.wordpress.com/1230/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/ealdent.wordpress.com/1230/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/ealdent.wordpress.com/1230/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/ealdent.wordpress.com/1230/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/ealdent.wordpress.com/1230/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/ealdent.wordpress.com/1230/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/ealdent.wordpress.com/1230/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/ealdent.wordpress.com/1230/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/ealdent.wordpress.com/1230/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mendicantbug.com&amp;blog=1474857&amp;post=1230&amp;subd=ealdent&amp;ref=&amp;feed=1" width="1" height="1" />
<p><a href="http://feedads.g.doubleclick.net/~a/JQ3l7IYHc0zfWaE_jPfeWSN8E6A/0/da"><img src="http://feedads.g.doubleclick.net/~a/JQ3l7IYHc0zfWaE_jPfeWSN8E6A/0/di" border="0" ismap="true"></img></a><br/>
<a href="http://feedads.g.doubleclick.net/~a/JQ3l7IYHc0zfWaE_jPfeWSN8E6A/1/da"><img src="http://feedads.g.doubleclick.net/~a/JQ3l7IYHc0zfWaE_jPfeWSN8E6A/1/di" border="0" ismap="true"></img></a></p>]]></content:encoded>
			<wfw:commentRss>http://mendicantbug.com/2009/07/30/updates-to-lda-ruby-gem/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:content url="http://0.gravatar.com/avatar/ebec6abd2b9f1eb4de865aed01242171?s=96&amp;d=monsterid&amp;r=PG" medium="image">
			<media:title type="html">ealdent</media:title>
		</media:content>

		<media:content url="http://ealdent.files.wordpress.com/2009/07/works-on-my-machine-starburst.jpg" medium="image">
			<media:title type="html">works-on-my-machine-starburst</media:title>
		</media:content>

		<media:content url="http://img.zemanta.com/reblog_c.png?x-id=f6bb550a-b4f1-4af6-bcde-fabdba98ad7a" medium="image">
			<media:title type="html">Reblog this post [with Zemanta]</media:title>
		</media:content>
	</item>
	</channel>
</rss>

