<?xml version="1.0" encoding="UTF-8"?>
<?xml-stylesheet type="text/xsl" media="screen" href="/~d/styles/rss2full.xsl"?><?xml-stylesheet type="text/css" media="screen" href="http://feeds.feedburner.com/~d/styles/itemcontent.css"?><rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:wfw="http://wellformedweb.org/CommentAPI/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:atom="http://www.w3.org/2005/Atom" xmlns:sy="http://purl.org/rss/1.0/modules/syndication/" xmlns:slash="http://purl.org/rss/1.0/modules/slash/" xmlns:feedburner="http://rssnamespace.org/feedburner/ext/1.0" version="2.0">

<channel>
	<title>Michael G. Noll</title>
	
	<link>http://www.michael-noll.com/blog</link>
	<description>My digital moleskine</description>
	<lastBuildDate>Tue, 20 Jul 2010 20:07:54 +0000</lastBuildDate>
	<generator>http://wordpress.org/?v=2.9.2</generator>
	<language>en</language>
	<sy:updatePeriod>hourly</sy:updatePeriod>
	<sy:updateFrequency>1</sy:updateFrequency>
			<feedburner:info uri="michael-noll" /><atom10:link xmlns:atom10="http://www.w3.org/2005/Atom" rel="hub" href="http://pubsubhubbub.appspot.com/" /><atom10:link xmlns:atom10="http://www.w3.org/2005/Atom" rel="self" type="application/rss+xml" href="http://www.michael-noll.com/feed/" /><feedburner:feedFlare href="http://add.my.yahoo.com/rss?url=http%3A%2F%2Fwww.michael-noll.com%2Ffeed%2F" src="http://us.i1.yimg.com/us.yimg.com/i/us/my/addtomyyahoo4.gif">Subscribe with My Yahoo!</feedburner:feedFlare><feedburner:feedFlare href="http://www.newsgator.com/ngs/subscriber/subext.aspx?url=http%3A%2F%2Fwww.michael-noll.com%2Ffeed%2F" src="http://www.newsgator.com/images/ngsub1.gif">Subscribe with NewsGator</feedburner:feedFlare><feedburner:feedFlare href="http://feeds.my.aol.com/add.jsp?url=http%3A%2F%2Fwww.michael-noll.com%2Ffeed%2F" src="http://o.aolcdn.com/favorites.my.aol.com/webmaster/ffclient/webroot/locale/en-US/images/myAOLButtonSmall.gif">Subscribe with My AOL</feedburner:feedFlare><feedburner:feedFlare href="http://www.bloglines.com/sub/http://www.michael-noll.com/feed/" src="http://www.bloglines.com/images/sub_modern11.gif">Subscribe with Bloglines</feedburner:feedFlare><feedburner:feedFlare href="http://www.netvibes.com/subscribe.php?url=http%3A%2F%2Fwww.michael-noll.com%2Ffeed%2F" src="http://www.netvibes.com/img/add2netvibes.gif">Subscribe with Netvibes</feedburner:feedFlare><feedburner:feedFlare href="http://fusion.google.com/add?feedurl=http%3A%2F%2Fwww.michael-noll.com%2Ffeed%2F" src="http://buttons.googlesyndication.com/fusion/add.gif">Subscribe with Google</feedburner:feedFlare><feedburner:feedFlare href="http://www.pageflakes.com/subscribe.aspx?url=http%3A%2F%2Fwww.michael-noll.com%2Ffeed%2F" src="http://www.pageflakes.com/ImageFile.ashx?instanceId=Static_4&amp;fileName=ATP_blu_91x17.gif">Subscribe with Pageflakes</feedburner:feedFlare><item>
		<title>Reference implementation of SPEAR algorithm released</title>
		<link>http://feedproxy.google.com/~r/michael-noll/~3/RhSdOc4bb3I/</link>
		<comments>http://www.michael-noll.com/blog/2010/07/10/reference-implementation-of-spear-algorithm-released/#comments</comments>
		<pubDate>Sat, 10 Jul 2010 17:24:25 +0000</pubDate>
		<dc:creator>Michael G. Noll</dc:creator>
				<category><![CDATA[Development & Programming]]></category>
		<category><![CDATA[Publications]]></category>
		<category><![CDATA[Research]]></category>
		<category><![CDATA[algorithm]]></category>
		<category><![CDATA[expertise]]></category>
		<category><![CDATA[experts]]></category>
		<category><![CDATA[foss]]></category>
		<category><![CDATA[gpl]]></category>
		<category><![CDATA[hits]]></category>
		<category><![CDATA[implementation]]></category>
		<category><![CDATA[information retrieval]]></category>
		<category><![CDATA[library]]></category>
		<category><![CDATA[license:gplv2]]></category>
		<category><![CDATA[module]]></category>
		<category><![CDATA[open source]]></category>
		<category><![CDATA[python]]></category>
		<category><![CDATA[ranking]]></category>
		<category><![CDATA[sigir]]></category>
		<category><![CDATA[spam]]></category>
		<category><![CDATA[spammers]]></category>
		<category><![CDATA[spear]]></category>

		<guid isPermaLink="false">http://www.michael-noll.com/blog/?p=322</guid>
		<description><![CDATA[I have just released the &#8220;reference&#8221; implementation of our SPEAR algorithm. The library is written in the Python programming language, and should be straight-forward to use. You can install the library via Python&#8217;s setuptools/easy_install or download it from GitHub.
Here&#8217;s a quick example on how to use it:




&#62;&#62;&#62; import spear


&#62;&#62;&#62; activities = &#91;


&#8230; &#40;datetime.datetime&#40;2010,7,1,9,0,0&#41;, &#34;alice&#34;, &#34;http://www.quuxlabs.com/&#34;&#41;,


&#8230; [...]]]></description>
			<content:encoded><![CDATA[<p>I have just released the <a href="http://github.com/quuxlabs/Spear">&#8220;reference&#8221; implementation</a> of our <a href="http://www.spear-algorithm.org/">SPEAR algorithm</a>. The <a href="http://github.com/quuxlabs/Spear">library</a> is written in the Python programming language, and should be straight-forward to use. You can install the library via Python&#8217;s setuptools/easy_install or download it from <a href="http://github.com/quuxlabs/Spear">GitHub</a>.</p>
<p>Here&#8217;s a quick example on how to use it:</p>
<div class="codesnip-container" >
<div class="python codesnip" style="font-family:monospace;">
<ol>
<li class="li1">
<div class="de1"><span class="sy0">&gt;&gt;&gt;</span> <span class="kw1">import</span> spear</div>
</li>
<li class="li1">
<div class="de1"><span class="sy0">&gt;&gt;&gt;</span> activities = <span class="br0">&#91;</span></div>
</li>
<li class="li1">
<div class="de1">&#8230; <span class="br0">&#40;</span><span class="kw3">datetime</span>.<span class="kw3">datetime</span><span class="br0">&#40;</span><span class="nu0">2010</span>,<span class="nu0">7</span>,<span class="nu0">1</span>,<span class="nu0">9</span>,<span class="nu0">0</span>,<span class="nu0">0</span><span class="br0">&#41;</span>, <span class="st0">&quot;alice&quot;</span>, <span class="st0">&quot;http://www.quuxlabs.com/&quot;</span><span class="br0">&#41;</span>,</div>
</li>
<li class="li1">
<div class="de1">&#8230; <span class="br0">&#40;</span><span class="kw3">datetime</span>.<span class="kw3">datetime</span><span class="br0">&#40;</span><span class="nu0">2010</span>,<span class="nu0">8</span>,<span class="nu0">1</span>,<span class="nu0">12</span>,<span class="nu0">45</span>,<span class="nu0">0</span><span class="br0">&#41;</span>, <span class="st0">&quot;bob&quot;</span>, <span class="st0">&quot;http://www.quuxlabs.com/&quot;</span><span class="br0">&#41;</span>,</div>
</li>
<li class="li1">
<div class="de1">&#8230; <span class="br0">&#93;</span></div>
</li>
<li class="li1">
<div class="de1"><span class="sy0">&gt;&gt;&gt;</span> spear_algorithm = spear.<span class="me1">Spear</span><span class="br0">&#40;</span>activities<span class="br0">&#41;</span></div>
</li>
<li class="li1">
<div class="de1"><span class="sy0">&gt;&gt;&gt;</span> expertise_results, quality_results = spear_algorithm.<span class="me1">run</span><span class="br0">&#40;</span><span class="br0">&#41;</span></div>
</li>
</ol>
</div>
</div>
<p><span id="more-322"></span><br />
Get the top user and his expertise score:</p>
<div class="codesnip-container" >
<div class="python codesnip" style="font-family:monospace;">
<ol>
<li class="li1">
<div class="de1"><span class="sy0">&gt;&gt;&gt;</span> expertise_score, <span class="kw3">user</span> = expertise_results<span class="br0">&#91;</span>0<span class="br0">&#93;</span></div>
</li>
<li class="li1">
<div class="de1"><span class="sy0">&gt;&gt;&gt;</span> <span class="kw1">print</span> <span class="st0">&quot;%s =&gt; %.4f&quot;</span> <span class="sy0">%</span> <span class="br0">&#40;</span><span class="kw3">user</span>, expertise_score<span class="br0">&#41;</span></div>
</li>
<li class="li1">
<div class="de1">alice =<span class="sy0">&gt;</span> <span class="nu0">0.5858</span></div>
</li>
</ol>
</div>
</div>
<p>Get the top resource and its quality score:</p>
<div class="codesnip-container" >
<div class="python codesnip" style="font-family:monospace;">
<ol>
<li class="li1">
<div class="de1"><span class="sy0">&gt;&gt;&gt;</span> quality_score, <span class="kw3">resource</span> = quality_results<span class="br0">&#91;</span>0<span class="br0">&#93;</span></div>
</li>
<li class="li1">
<div class="de1"><span class="sy0">&gt;&gt;&gt;</span> <span class="kw1">print</span> <span class="st0">&quot;%s =&gt; %.4f&quot;</span> <span class="sy0">%</span> <span class="br0">&#40;</span><span class="kw3">resource</span>, quality_score<span class="br0">&#41;</span></div>
</li>
<li class="li1">
<div class="de1">http://www.<span class="me1">quuxlabs</span>.<span class="me1">com</span>/ =<span class="sy0">&gt;</span> <span class="nu0">1.0000</span></div>
</li>
</ol>
</div>
</div>
<p>You can also use the library to simulate the <a href="http://en.wikipedia.org/wiki/HITS_algorithm">HITS algorithm</a> of Jon Kleinberg. Simply supply a credit score function C(x) = 1 to the SPEAR algorithm (see the documentation of the Spear.run() method).</p>
<p>Feel free to play around with it and send me feedback!</p>
<p>PS: The SPEAR Python library requires <a href="http://www.scipy.org/">SciPy/NumPy</a>. If you don&#8217;t have these installed already, here are <a href="http://www.scipy.org/Installing_SciPy">some installation instructions</a> to get you started.</p>
<div class="feedflare">
<a href="http://feeds.feedburner.com/~ff/michael-noll?a=RhSdOc4bb3I:KDDTyOyPhWg:yIl2AUoC8zA"><img src="http://feeds.feedburner.com/~ff/michael-noll?d=yIl2AUoC8zA" border="0"></img></a> <a href="http://feeds.feedburner.com/~ff/michael-noll?a=RhSdOc4bb3I:KDDTyOyPhWg:F7zBnMyn0Lo"><img src="http://feeds.feedburner.com/~ff/michael-noll?i=RhSdOc4bb3I:KDDTyOyPhWg:F7zBnMyn0Lo" border="0"></img></a> <a href="http://feeds.feedburner.com/~ff/michael-noll?a=RhSdOc4bb3I:KDDTyOyPhWg:V_sGLiPBpWU"><img src="http://feeds.feedburner.com/~ff/michael-noll?i=RhSdOc4bb3I:KDDTyOyPhWg:V_sGLiPBpWU" border="0"></img></a> <a href="http://feeds.feedburner.com/~ff/michael-noll?a=RhSdOc4bb3I:KDDTyOyPhWg:qj6IDK7rITs"><img src="http://feeds.feedburner.com/~ff/michael-noll?d=qj6IDK7rITs" border="0"></img></a>
</div><img src="http://feeds.feedburner.com/~r/michael-noll/~4/RhSdOc4bb3I" height="1" width="1"/>]]></content:encoded>
			<wfw:commentRss>http://www.michael-noll.com/blog/2010/07/10/reference-implementation-of-spear-algorithm-released/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
		<feedburner:origLink>http://www.michael-noll.com/blog/2010/07/10/reference-implementation-of-spear-algorithm-released/</feedburner:origLink></item>
		<item>
		<title>Publication at Journal of Computational Intelligence</title>
		<link>http://feedproxy.google.com/~r/michael-noll/~3/Uoka30WVtTk/</link>
		<comments>http://www.michael-noll.com/blog/2010/01/04/publication-at-journal-of-computational-intelligence/#comments</comments>
		<pubDate>Mon, 04 Jan 2010 18:46:53 +0000</pubDate>
		<dc:creator>Michael G. Noll</dc:creator>
				<category><![CDATA[Publications]]></category>
		<category><![CDATA[Research]]></category>
		<category><![CDATA[article]]></category>
		<category><![CDATA[collaborative tagging]]></category>
		<category><![CDATA[del.icio.us]]></category>
		<category><![CDATA[delicious.com]]></category>
		<category><![CDATA[expert]]></category>
		<category><![CDATA[expertise]]></category>
		<category><![CDATA[experts]]></category>
		<category><![CDATA[folksonomies]]></category>
		<category><![CDATA[folksonomy]]></category>
		<category><![CDATA[hits]]></category>
		<category><![CDATA[journal]]></category>
		<category><![CDATA[publication]]></category>
		<category><![CDATA[social annotation]]></category>
		<category><![CDATA[social-annotations]]></category>
		<category><![CDATA[social-bookmarking]]></category>
		<category><![CDATA[social-tagging]]></category>
		<category><![CDATA[social-web]]></category>
		<category><![CDATA[spam]]></category>
		<category><![CDATA[spammer]]></category>
		<category><![CDATA[spammers]]></category>
		<category><![CDATA[spear]]></category>
		<category><![CDATA[tagging]]></category>
		<category><![CDATA[web]]></category>
		<category><![CDATA[web 2.0]]></category>
		<category><![CDATA[yahoo]]></category>

		<guid isPermaLink="false">http://www.michael-noll.com/blog/?p=313</guid>
		<description><![CDATA[I&#8217;ve just received the notification that the joint paper of Ching-man Au Yeung and me, titled &#8220;SPEAR: Spamming-resistant Expertise Analysis and Ranking in Collaborative Tagging Systems&#8221;, has been accepted for publication by the renowned Journal of Computational Intelligence. Seems like the new year 2010 is starting well!
]]></description>
			<content:encoded><![CDATA[<p>I&#8217;ve just received the notification that the joint paper of <a href="http://www.albertauyeung.com/">Ching-man Au Yeung</a> and me, titled &#8220;SPEAR: Spamming-resistant Expertise Analysis and Ranking in Collaborative Tagging Systems&#8221;, has been accepted for publication by the renowned <a href="http://www.wiley.com/bw/journal.asp?ref=0824-7935">Journal of Computational Intelligence</a>. Seems like the new year 2010 is starting well!</p>
<div class="feedflare">
<a href="http://feeds.feedburner.com/~ff/michael-noll?a=Uoka30WVtTk:QZ5gMRWgBXg:yIl2AUoC8zA"><img src="http://feeds.feedburner.com/~ff/michael-noll?d=yIl2AUoC8zA" border="0"></img></a> <a href="http://feeds.feedburner.com/~ff/michael-noll?a=Uoka30WVtTk:QZ5gMRWgBXg:F7zBnMyn0Lo"><img src="http://feeds.feedburner.com/~ff/michael-noll?i=Uoka30WVtTk:QZ5gMRWgBXg:F7zBnMyn0Lo" border="0"></img></a> <a href="http://feeds.feedburner.com/~ff/michael-noll?a=Uoka30WVtTk:QZ5gMRWgBXg:V_sGLiPBpWU"><img src="http://feeds.feedburner.com/~ff/michael-noll?i=Uoka30WVtTk:QZ5gMRWgBXg:V_sGLiPBpWU" border="0"></img></a> <a href="http://feeds.feedburner.com/~ff/michael-noll?a=Uoka30WVtTk:QZ5gMRWgBXg:qj6IDK7rITs"><img src="http://feeds.feedburner.com/~ff/michael-noll?d=qj6IDK7rITs" border="0"></img></a>
</div><img src="http://feeds.feedburner.com/~r/michael-noll/~4/Uoka30WVtTk" height="1" width="1"/>]]></content:encoded>
			<wfw:commentRss>http://www.michael-noll.com/blog/2010/01/04/publication-at-journal-of-computational-intelligence/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
		<feedburner:origLink>http://www.michael-noll.com/blog/2010/01/04/publication-at-journal-of-computational-intelligence/</feedburner:origLink></item>
		<item>
		<title>Article about SPEAR on Communications of the ACM</title>
		<link>http://feedproxy.google.com/~r/michael-noll/~3/3cYqhV2c-TA/</link>
		<comments>http://www.michael-noll.com/blog/2009/09/29/article-about-spear-on-communications-of-the-acm/#comments</comments>
		<pubDate>Tue, 29 Sep 2009 11:21:30 +0000</pubDate>
		<dc:creator>Michael G. Noll</dc:creator>
				<category><![CDATA[Publications]]></category>
		<category><![CDATA[Research]]></category>
		<category><![CDATA[acm]]></category>
		<category><![CDATA[article]]></category>
		<category><![CDATA[cacm]]></category>
		<category><![CDATA[collaborative tagging]]></category>
		<category><![CDATA[del.icio.us]]></category>
		<category><![CDATA[delicious.com]]></category>
		<category><![CDATA[expert]]></category>
		<category><![CDATA[expertise]]></category>
		<category><![CDATA[experts]]></category>
		<category><![CDATA[folksonomies]]></category>
		<category><![CDATA[folksonomy]]></category>
		<category><![CDATA[hits]]></category>
		<category><![CDATA[publication]]></category>
		<category><![CDATA[social annotation]]></category>
		<category><![CDATA[social-annotations]]></category>
		<category><![CDATA[social-bookmarking]]></category>
		<category><![CDATA[social-tagging]]></category>
		<category><![CDATA[social-web]]></category>
		<category><![CDATA[spam]]></category>
		<category><![CDATA[spammer]]></category>
		<category><![CDATA[spammers]]></category>
		<category><![CDATA[spear]]></category>
		<category><![CDATA[tagging]]></category>
		<category><![CDATA[web]]></category>
		<category><![CDATA[web 2.0]]></category>
		<category><![CDATA[yahoo]]></category>

		<guid isPermaLink="false">http://www.michael-noll.com/blog/?p=308</guid>
		<description><![CDATA[I&#8217;m happy to announce that the Communications of the ACM (CACM) magazine has published an article about our work on the SPEAR algorithm: New Ranking Algorithm Separates Digital Wheat from Chaff
]]></description>
			<content:encoded><![CDATA[<p>I&#8217;m happy to announce that the <a href="http://cacm.acm.org/">Communications of the ACM (CACM)</a> magazine has published an <a href="http://cacm.acm.org/news/42206-new-ranking-algorithm-separates-digital-wheat-from-chaff">article</a> about our work on the <a href="http://www.spear-algorithm.org/">SPEAR algorithm</a>: <a href="http://cacm.acm.org/news/42206-new-ranking-algorithm-separates-digital-wheat-from-chaff">New Ranking Algorithm Separates Digital Wheat from Chaff</a></p>
<div class="feedflare">
<a href="http://feeds.feedburner.com/~ff/michael-noll?a=3cYqhV2c-TA:GiQ2FMfxEGU:yIl2AUoC8zA"><img src="http://feeds.feedburner.com/~ff/michael-noll?d=yIl2AUoC8zA" border="0"></img></a> <a href="http://feeds.feedburner.com/~ff/michael-noll?a=3cYqhV2c-TA:GiQ2FMfxEGU:F7zBnMyn0Lo"><img src="http://feeds.feedburner.com/~ff/michael-noll?i=3cYqhV2c-TA:GiQ2FMfxEGU:F7zBnMyn0Lo" border="0"></img></a> <a href="http://feeds.feedburner.com/~ff/michael-noll?a=3cYqhV2c-TA:GiQ2FMfxEGU:V_sGLiPBpWU"><img src="http://feeds.feedburner.com/~ff/michael-noll?i=3cYqhV2c-TA:GiQ2FMfxEGU:V_sGLiPBpWU" border="0"></img></a> <a href="http://feeds.feedburner.com/~ff/michael-noll?a=3cYqhV2c-TA:GiQ2FMfxEGU:qj6IDK7rITs"><img src="http://feeds.feedburner.com/~ff/michael-noll?d=qj6IDK7rITs" border="0"></img></a>
</div><img src="http://feeds.feedburner.com/~r/michael-noll/~4/3cYqhV2c-TA" height="1" width="1"/>]]></content:encoded>
			<wfw:commentRss>http://www.michael-noll.com/blog/2009/09/29/article-about-spear-on-communications-of-the-acm/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
		<feedburner:origLink>http://www.michael-noll.com/blog/2009/09/29/article-about-spear-on-communications-of-the-acm/</feedburner:origLink></item>
		<item>
		<title>Invited article for Yahoo! on SPEAR algorithm</title>
		<link>http://feedproxy.google.com/~r/michael-noll/~3/YrRx17dj500/</link>
		<comments>http://www.michael-noll.com/blog/2009/09/03/invited-article-for-yahoo-on-spear-algorithm/#comments</comments>
		<pubDate>Thu, 03 Sep 2009 19:24:18 +0000</pubDate>
		<dc:creator>Michael G. Noll</dc:creator>
				<category><![CDATA[Development & Programming]]></category>
		<category><![CDATA[Publications]]></category>
		<category><![CDATA[Research]]></category>
		<category><![CDATA[article]]></category>
		<category><![CDATA[collaborative tagging]]></category>
		<category><![CDATA[del.icio.us]]></category>
		<category><![CDATA[delicious.com]]></category>
		<category><![CDATA[expert]]></category>
		<category><![CDATA[expertise]]></category>
		<category><![CDATA[experts]]></category>
		<category><![CDATA[folksonomies]]></category>
		<category><![CDATA[folksonomy]]></category>
		<category><![CDATA[hits]]></category>
		<category><![CDATA[publication]]></category>
		<category><![CDATA[social annotation]]></category>
		<category><![CDATA[social-annotations]]></category>
		<category><![CDATA[social-bookmarking]]></category>
		<category><![CDATA[social-tagging]]></category>
		<category><![CDATA[social-web]]></category>
		<category><![CDATA[spam]]></category>
		<category><![CDATA[spammer]]></category>
		<category><![CDATA[spammers]]></category>
		<category><![CDATA[spear]]></category>
		<category><![CDATA[tagging]]></category>
		<category><![CDATA[web]]></category>
		<category><![CDATA[web 2.0]]></category>
		<category><![CDATA[yahoo]]></category>

		<guid isPermaLink="false">http://www.michael-noll.com/blog/?p=299</guid>
		<description><![CDATA[A couple of days ago, my co-worker Ching-man Au Yeung and I were approached by Yahoo! to write a guest article about our work on the SPEAR algorithm for the Delicious.com blog. Well, I&#8217;m happy to announce that the article is published now: How SPEAR Identifies Domain Experts within Delicious. Check it out while it&#8217;s [...]]]></description>
			<content:encoded><![CDATA[<p>A couple of days ago, my co-worker Ching-man Au Yeung and I were approached by <a href="http://www.yahoo.com/">Yahoo!</a> to write a guest article about our work on the <a href="http://www.spear-algorithm.org/">SPEAR algorithm</a> for the <a href="http://blog.delicious.com/blog/2009/08/how-spear-identifies-domain-experts-within-delicious.html">Delicious.com blog</a>. Well, I&#8217;m happy to announce that the article is published now: <strong><a href="http://blog.delicious.com/blog/2009/08/how-spear-identifies-domain-experts-within-delicious.html">How SPEAR Identifies Domain Experts within Delicious</a></strong>. Check it out while it&#8217;s still hot <img src='http://www.michael-noll.com/blog/wp-includes/images/smilies/icon_wink.gif' alt=';-)' class='wp-smiley' /> </p>
<p>Thanks again to <a href="http://zooie.wordpress.com/bio/">Vik Singh</a> and <a href="http://aseidman.com/about/">Ariel Seidman</a> from Yahoo! for this great opportunity and for their support!</p>
<p><span id="more-299"></span></p>
<div class="feedflare">
<a href="http://feeds.feedburner.com/~ff/michael-noll?a=YrRx17dj500:omEUmObaacI:yIl2AUoC8zA"><img src="http://feeds.feedburner.com/~ff/michael-noll?d=yIl2AUoC8zA" border="0"></img></a> <a href="http://feeds.feedburner.com/~ff/michael-noll?a=YrRx17dj500:omEUmObaacI:F7zBnMyn0Lo"><img src="http://feeds.feedburner.com/~ff/michael-noll?i=YrRx17dj500:omEUmObaacI:F7zBnMyn0Lo" border="0"></img></a> <a href="http://feeds.feedburner.com/~ff/michael-noll?a=YrRx17dj500:omEUmObaacI:V_sGLiPBpWU"><img src="http://feeds.feedburner.com/~ff/michael-noll?i=YrRx17dj500:omEUmObaacI:V_sGLiPBpWU" border="0"></img></a> <a href="http://feeds.feedburner.com/~ff/michael-noll?a=YrRx17dj500:omEUmObaacI:qj6IDK7rITs"><img src="http://feeds.feedburner.com/~ff/michael-noll?d=qj6IDK7rITs" border="0"></img></a>
</div><img src="http://feeds.feedburner.com/~r/michael-noll/~4/YrRx17dj500" height="1" width="1"/>]]></content:encoded>
			<wfw:commentRss>http://www.michael-noll.com/blog/2009/09/03/invited-article-for-yahoo-on-spear-algorithm/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
		<feedburner:origLink>http://www.michael-noll.com/blog/2009/09/03/invited-article-for-yahoo-on-spear-algorithm/</feedburner:origLink></item>
		<item>
		<title>Technology Review article on our expertise ranking approach from SIGIR ’09</title>
		<link>http://feedproxy.google.com/~r/michael-noll/~3/Gp3GNRqJP6Q/</link>
		<comments>http://www.michael-noll.com/blog/2009/07/31/technology-review-article-on-our-expertise-ranking-approach-from-sigir-09/#comments</comments>
		<pubDate>Fri, 31 Jul 2009 15:06:25 +0000</pubDate>
		<dc:creator>Michael G. Noll</dc:creator>
				<category><![CDATA[Publications]]></category>
		<category><![CDATA[Research]]></category>
		<category><![CDATA[acm]]></category>
		<category><![CDATA[article]]></category>
		<category><![CDATA[collaborative tagging]]></category>
		<category><![CDATA[del.icio.us]]></category>
		<category><![CDATA[evaluation]]></category>
		<category><![CDATA[expert]]></category>
		<category><![CDATA[expertise]]></category>
		<category><![CDATA[experts]]></category>
		<category><![CDATA[folksonomies]]></category>
		<category><![CDATA[folksonomy]]></category>
		<category><![CDATA[hits]]></category>
		<category><![CDATA[magazine]]></category>
		<category><![CDATA[publication]]></category>
		<category><![CDATA[reputation]]></category>
		<category><![CDATA[social annotation]]></category>
		<category><![CDATA[social-annotations]]></category>
		<category><![CDATA[social-bookmarking]]></category>
		<category><![CDATA[social-tagging]]></category>
		<category><![CDATA[social-web]]></category>
		<category><![CDATA[spam]]></category>
		<category><![CDATA[spammer]]></category>
		<category><![CDATA[spammers]]></category>
		<category><![CDATA[spear]]></category>
		<category><![CDATA[tagging]]></category>
		<category><![CDATA[technology review]]></category>
		<category><![CDATA[web]]></category>
		<category><![CDATA[web 2.0]]></category>

		<guid isPermaLink="false">http://www.michael-noll.com/blog/?p=288</guid>
		<description><![CDATA[The US magazine Technology Review has published an article about our SPEAR algorithm for expertise ranking in the Social Web. My co-worker Ching-man Au Yeung from University of Southampton and I just returned from this year&#8217;s ACM SIGIR conference where we presented this joint work.
The TR article A Better Way to Rank Expertise Online summarizes [...]]]></description>
			<content:encoded><![CDATA[<p>The US magazine <a href="http://www.technologyreview.com/web/23100/">Technology Review</a> has <a href="http://www.technologyreview.com/web/23100/">published an article</a> about our <a href="http://www.michael-noll.com/blog/2009/06/05/telling-experts-from-spammers-expertise-ranking-in-folksonomies/">SPEAR algorithm</a> for expertise ranking in the Social Web. My co-worker <a href="http://www.ecs.soton.ac.uk/people/cmay06r">Ching-man Au Yeung</a> from University of Southampton and I just returned from this year&#8217;s <a href="http://www.sigir2009.org/">ACM SIGIR conference</a> where we presented this joint work.</p>
<p>The TR article <a href="http://www.technologyreview.com/web/23100/">A Better Way to Rank Expertise Online</a> summarizes our approach quite well, and we&#8217;re really happy about the very positive feedback therein from researchers like <a href="http://en.wikipedia.org/wiki/Jon_Kleinberg">Professor Jon Kleinberg</a> (the inventor of the <a href="http://en.wikipedia.org/wiki/HITS_algorithm">HITS algorithm</a> on which our SPEAR algorithm is based), <a href="http://www.redlog.net/">Scott Golder</a> (his publication together with Huberman on usage patterns in collaborative tagging systems is one of the earliest and currently most cited works in the area of the Social Web) and <a href="http://isiosf.isi.it/~cattuto/">Ciro Cattuto</a> (very nice work on social dynamics and network characteristics of folksonomies). Thanks!</p>
<p><span id="more-288"></span></p>
<div class="feedflare">
<a href="http://feeds.feedburner.com/~ff/michael-noll?a=Gp3GNRqJP6Q:wt-EJ3L9LBQ:yIl2AUoC8zA"><img src="http://feeds.feedburner.com/~ff/michael-noll?d=yIl2AUoC8zA" border="0"></img></a> <a href="http://feeds.feedburner.com/~ff/michael-noll?a=Gp3GNRqJP6Q:wt-EJ3L9LBQ:F7zBnMyn0Lo"><img src="http://feeds.feedburner.com/~ff/michael-noll?i=Gp3GNRqJP6Q:wt-EJ3L9LBQ:F7zBnMyn0Lo" border="0"></img></a> <a href="http://feeds.feedburner.com/~ff/michael-noll?a=Gp3GNRqJP6Q:wt-EJ3L9LBQ:V_sGLiPBpWU"><img src="http://feeds.feedburner.com/~ff/michael-noll?i=Gp3GNRqJP6Q:wt-EJ3L9LBQ:V_sGLiPBpWU" border="0"></img></a> <a href="http://feeds.feedburner.com/~ff/michael-noll?a=Gp3GNRqJP6Q:wt-EJ3L9LBQ:qj6IDK7rITs"><img src="http://feeds.feedburner.com/~ff/michael-noll?d=qj6IDK7rITs" border="0"></img></a>
</div><img src="http://feeds.feedburner.com/~r/michael-noll/~4/Gp3GNRqJP6Q" height="1" width="1"/>]]></content:encoded>
			<wfw:commentRss>http://www.michael-noll.com/blog/2009/07/31/technology-review-article-on-our-expertise-ranking-approach-from-sigir-09/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
		<feedburner:origLink>http://www.michael-noll.com/blog/2009/07/31/technology-review-article-on-our-expertise-ranking-approach-from-sigir-09/</feedburner:origLink></item>
		<item>
		<title>Telling Experts from Spammers: Expertise Ranking in Folksonomies</title>
		<link>http://feedproxy.google.com/~r/michael-noll/~3/dPQexTICDX0/</link>
		<comments>http://www.michael-noll.com/blog/2009/06/05/telling-experts-from-spammers-expertise-ranking-in-folksonomies/#comments</comments>
		<pubDate>Fri, 05 Jun 2009 13:13:17 +0000</pubDate>
		<dc:creator>Michael G. Noll</dc:creator>
				<category><![CDATA[Publications]]></category>
		<category><![CDATA[Research]]></category>
		<category><![CDATA[acm]]></category>
		<category><![CDATA[collaborative tagging]]></category>
		<category><![CDATA[del.icio.us]]></category>
		<category><![CDATA[evaluation]]></category>
		<category><![CDATA[expert]]></category>
		<category><![CDATA[expertise]]></category>
		<category><![CDATA[experts]]></category>
		<category><![CDATA[folksonomies]]></category>
		<category><![CDATA[folksonomy]]></category>
		<category><![CDATA[hits]]></category>
		<category><![CDATA[publication]]></category>
		<category><![CDATA[reputation]]></category>
		<category><![CDATA[social annotation]]></category>
		<category><![CDATA[social-annotations]]></category>
		<category><![CDATA[social-bookmarking]]></category>
		<category><![CDATA[social-tagging]]></category>
		<category><![CDATA[social-web]]></category>
		<category><![CDATA[spam]]></category>
		<category><![CDATA[spammer]]></category>
		<category><![CDATA[spammers]]></category>
		<category><![CDATA[spear]]></category>
		<category><![CDATA[tagging]]></category>
		<category><![CDATA[web]]></category>
		<category><![CDATA[web 2.0]]></category>

		<guid isPermaLink="false">http://www.michael-noll.com/blog/?p=278</guid>
		<description><![CDATA[My paper Telling Experts from Spammers: Expertise Ranking in Folksonomies, a joint work written together with fellow Ph.D. candidate Ching-Man Au Yeung from University of Southampton, has been accepted for publication and presentation at this year’s International ACM SIGIR Conference which will be held in Boston, USA, from July 19 &#8211; 23, 2009.

Update: Head over [...]]]></description>
			<content:encoded><![CDATA[<p>My paper <em>Telling Experts from Spammers: Expertise Ranking in Folksonomies</em>, a joint work written together with fellow Ph.D. candidate Ching-Man Au Yeung from University of Southampton, has been accepted for publication and presentation at this year’s <a href="http://www.sigir2009.org/">International ACM SIGIR Conference</a> which will be held in Boston, USA, from July 19 &#8211; 23, 2009.<span id="more-278"></span></p>
<p></p>
<div style="border:2px solid red; padding: 10px 5px;"><strong>Update:</strong> Head over to the dedicated <a href="http://www.spear-algorithm.org/">SPEAR algorithm website</a> for more information!</div>
<h1>Abstract</h1>
<p>With a suitable algorithm for ranking the expertise of a user in a collaborative tagging system, we will be able to identify experts and discover useful and relevant resources through them. We propose that the level of expertise of a user with respect to a particular topic is mainly determined by two factors. Firstly, an expert should possess a high quality collection of resources, while the quality of a Web resource depends on the expertise of the users who have assigned tags to it. Secondly, an expert should be one who tends to identify interesting or useful resources before other users do.</p>
<p>We propose a graph-based algorithm, <em>SPEAR (SPamming-resistant Expertise Analysis and Ranking)</em>, which implements these ideas for ranking users in a folksonomy. We evaluate our method with experiments on data sets collected from Delicious.com comprising over 71,000 Web documents, 0.5 million users and 2 million shared bookmarks. We also show that the algorithm is more resistant to spammers than other methods such as the original HITS algorithm and simple statistical measures.</p>
<h1>Full Paper &amp; Presentation</h1>
<ul>
<li>M. G. Noll, C.-M. Au Yeung, N. Gibbins, C. Meinel, N. Shadbolt<br />
<a href="/blog/uploads/Michael-Noll_Telling-Experts-from-Spammers_SIGIR_2009.pdf">Telling Experts from Spammers: Expertise Ranking in Folksonomies</a><br />
Proceedings of 32nd ACM SIGIR Conference, Boston, USA, July 2009, pp. 612-619, <a href="http://www.michael-noll.com/wiki/Special:BookSources/9781605584836">ISBN 978-1-60558-483-6</a> (<a title="http://portal.acm.org/citation.cfm?id=1571941.1572046" href="http://portal.acm.org/citation.cfm?id=1571941.1572046">ACM Link</a>, <a href="/uploads/sigir2009.bib">BibTeX</a>)</li>
<li>Presentation: <a href="/blog/uploads/Michael-Noll_Talk_Telling-Experts-from-Spammers_SIGIR_2009.pdf">Telling Experts from Spammers (Talk)</a>, our talk at SIGIR 2009</li>
</ul>
<h1>Related Links</h1>
<ul>
<li><a href="http://www.spear-algorithm.org/">The Spear Algorithm</a> &#8211; website dedicated to SPEAR</li>
<li><a href="http://www.michael-noll.com/wiki/Publications">List of my publications</a></li>
<li><a href="http://www.technologyreview.com/web/23100/">Article on Technology Review</a> about this work: <a href="http://www.technologyreview.com/web/23100/" target="_blank">A Better Way to Rank Expertise Online</a>, July 2009</li>
<li><a href="http://www.sigir2009.org/" target="_blank">32nd Annual ACM SIGIR Conference</a>, Boston, USA, July 2009</li>
</ul>
<div class="feedflare">
<a href="http://feeds.feedburner.com/~ff/michael-noll?a=dPQexTICDX0:60hBosaih7g:yIl2AUoC8zA"><img src="http://feeds.feedburner.com/~ff/michael-noll?d=yIl2AUoC8zA" border="0"></img></a> <a href="http://feeds.feedburner.com/~ff/michael-noll?a=dPQexTICDX0:60hBosaih7g:F7zBnMyn0Lo"><img src="http://feeds.feedburner.com/~ff/michael-noll?i=dPQexTICDX0:60hBosaih7g:F7zBnMyn0Lo" border="0"></img></a> <a href="http://feeds.feedburner.com/~ff/michael-noll?a=dPQexTICDX0:60hBosaih7g:V_sGLiPBpWU"><img src="http://feeds.feedburner.com/~ff/michael-noll?i=dPQexTICDX0:60hBosaih7g:V_sGLiPBpWU" border="0"></img></a> <a href="http://feeds.feedburner.com/~ff/michael-noll?a=dPQexTICDX0:60hBosaih7g:qj6IDK7rITs"><img src="http://feeds.feedburner.com/~ff/michael-noll?d=qj6IDK7rITs" border="0"></img></a>
</div><img src="http://feeds.feedburner.com/~r/michael-noll/~4/dPQexTICDX0" height="1" width="1"/>]]></content:encoded>
			<wfw:commentRss>http://www.michael-noll.com/blog/2009/06/05/telling-experts-from-spammers-expertise-ranking-in-folksonomies/feed/</wfw:commentRss>
		<slash:comments>3</slash:comments>
		<feedburner:origLink>http://www.michael-noll.com/blog/2009/06/05/telling-experts-from-spammers-expertise-ranking-in-folksonomies/</feedburner:origLink></item>
		<item>
		<title>Article published in Python Magazine</title>
		<link>http://feedproxy.google.com/~r/michael-noll/~3/OaDrfzSgm6k/</link>
		<comments>http://www.michael-noll.com/blog/2009/03/13/article-published-in-python-magazine/#comments</comments>
		<pubDate>Fri, 13 Mar 2009 13:35:06 +0000</pubDate>
		<dc:creator>Michael G. Noll</dc:creator>
				<category><![CDATA[Development & Programming]]></category>
		<category><![CDATA[Publications]]></category>
		<category><![CDATA[Research]]></category>
		<category><![CDATA[article]]></category>
		<category><![CDATA[articles]]></category>
		<category><![CDATA[beautifulsoup]]></category>
		<category><![CDATA[del.icio.us]]></category>
		<category><![CDATA[DeliciousAPI]]></category>
		<category><![CDATA[feedparser]]></category>
		<category><![CDATA[json]]></category>
		<category><![CDATA[link recommendation]]></category>
		<category><![CDATA[magazine]]></category>
		<category><![CDATA[publication]]></category>
		<category><![CDATA[python]]></category>
		<category><![CDATA[rss]]></category>

		<guid isPermaLink="false">http://www.michael-noll.com/blog/?p=269</guid>
		<description><![CDATA[A couple of months ago Doug Hellmann, the chief editor of Python Magazine, invited me to write a featured article. I&#8217;m happy to share the good news that my article Writing a Personal Link Recommendation Engine has eventually been published in this year&#8217;s February issue.

Here&#8217;s a brief teaser:
Writing a Personal Link Recommendation Engine
There is so [...]]]></description>
			<content:encoded><![CDATA[<p>A couple of months ago Doug Hellmann, the chief editor of <a href="http://pythonmagazine.com/c/issue/view/92">Python Magazine</a>, invited me to write a featured article. I&#8217;m happy to share the good news that my article <a href="http://pythonmagazine.com/c/issue/view/92"><em>Writing a Personal Link Recommendation Engine</em></a> has eventually been published in this year&#8217;s February issue.</p>
<p><span id="more-269"></span><img class="size-full wp-image-270" title="Cover of Python Magazine, February 2009" src="http://www.michael-noll.com/blog/uploads/pymag_february2009.jpg" alt="Cover of Python Magazine, Volume 3(2), February 2009" width="200" height="258" /></p>
<p>Here&#8217;s a brief teaser:</p>
<blockquote><p><strong>Writing a Personal Link Recommendation Engine</strong></p>
<p>There is so much going on in the Internet today that it’s hard to keep track of it all. Whether you need to stay up to date with job-related information, the current state of research, or the latest developments in the Open Source world, finding relevant information quickly on the Internet is difficult. So-called “social” services such as Delicious.com or Digg.com try to support users by allowing them to collaboratively share their knowledge about interesting web sites. In this article, we will design and implement a simple, yet powerful link recommender whose analysis is based solely on Delicious.com social bookmarks information.</p></blockquote>
<p>Interested? <a href="http://pythonmagazine.com/c/issue/view/92">Head over to PyMag</a> and have a look!</p>
<div class="feedflare">
<a href="http://feeds.feedburner.com/~ff/michael-noll?a=OaDrfzSgm6k:XyGRAFqNfpg:yIl2AUoC8zA"><img src="http://feeds.feedburner.com/~ff/michael-noll?d=yIl2AUoC8zA" border="0"></img></a> <a href="http://feeds.feedburner.com/~ff/michael-noll?a=OaDrfzSgm6k:XyGRAFqNfpg:F7zBnMyn0Lo"><img src="http://feeds.feedburner.com/~ff/michael-noll?i=OaDrfzSgm6k:XyGRAFqNfpg:F7zBnMyn0Lo" border="0"></img></a> <a href="http://feeds.feedburner.com/~ff/michael-noll?a=OaDrfzSgm6k:XyGRAFqNfpg:V_sGLiPBpWU"><img src="http://feeds.feedburner.com/~ff/michael-noll?i=OaDrfzSgm6k:XyGRAFqNfpg:V_sGLiPBpWU" border="0"></img></a> <a href="http://feeds.feedburner.com/~ff/michael-noll?a=OaDrfzSgm6k:XyGRAFqNfpg:qj6IDK7rITs"><img src="http://feeds.feedburner.com/~ff/michael-noll?d=qj6IDK7rITs" border="0"></img></a>
</div><img src="http://feeds.feedburner.com/~r/michael-noll/~4/OaDrfzSgm6k" height="1" width="1"/>]]></content:encoded>
			<wfw:commentRss>http://www.michael-noll.com/blog/2009/03/13/article-published-in-python-magazine/feed/</wfw:commentRss>
		<slash:comments>6</slash:comments>
		<feedburner:origLink>http://www.michael-noll.com/blog/2009/03/13/article-published-in-python-magazine/</feedburner:origLink></item>
		<item>
		<title>WI 2008 and SITIS 2008 papers available for download</title>
		<link>http://feedproxy.google.com/~r/michael-noll/~3/K51TK6MsaAo/</link>
		<comments>http://www.michael-noll.com/blog/2009/01/06/wi-2008-and-sitis-2008-papers-available-for-download/#comments</comments>
		<pubDate>Tue, 06 Jan 2009 16:05:30 +0000</pubDate>
		<dc:creator>Michael G. Noll</dc:creator>
				<category><![CDATA[Publications]]></category>
		<category><![CDATA[Research]]></category>
		<category><![CDATA[acm]]></category>
		<category><![CDATA[add-on]]></category>
		<category><![CDATA[anchor texts]]></category>
		<category><![CDATA[backlinks]]></category>
		<category><![CDATA[bookmarks]]></category>
		<category><![CDATA[cabs120k08]]></category>
		<category><![CDATA[categories]]></category>
		<category><![CDATA[categorization]]></category>
		<category><![CDATA[corpus]]></category>
		<category><![CDATA[data set]]></category>
		<category><![CDATA[del.icio.us]]></category>
		<category><![CDATA[dmoz]]></category>
		<category><![CDATA[download]]></category>
		<category><![CDATA[extension]]></category>
		<category><![CDATA[firefox]]></category>
		<category><![CDATA[folksonomy]]></category>
		<category><![CDATA[google]]></category>
		<category><![CDATA[hadoop]]></category>
		<category><![CDATA[ieee]]></category>
		<category><![CDATA[inlinks]]></category>
		<category><![CDATA[metadata]]></category>
		<category><![CDATA[mysql]]></category>
		<category><![CDATA[open directory project]]></category>
		<category><![CDATA[pagerank]]></category>
		<category><![CDATA[paper]]></category>
		<category><![CDATA[papers]]></category>
		<category><![CDATA[pdf]]></category>
		<category><![CDATA[publication]]></category>
		<category><![CDATA[pylog]]></category>
		<category><![CDATA[pylons]]></category>
		<category><![CDATA[search queries]]></category>
		<category><![CDATA[sitis]]></category>
		<category><![CDATA[social-bookmarking]]></category>
		<category><![CDATA[social-tagging]]></category>
		<category><![CDATA[study]]></category>
		<category><![CDATA[tagging]]></category>
		<category><![CDATA[tokyo cabinet]]></category>
		<category><![CDATA[tokyo tyrant]]></category>
		<category><![CDATA[triumvirate]]></category>
		<category><![CDATA[twisted]]></category>
		<category><![CDATA[web2.0]]></category>

		<guid isPermaLink="false">http://www.michael-noll.com/blog/?p=260</guid>
		<description><![CDATA[As promised, my papers The Metadata Triumvirate: Social Annotations, Anchor Texts and Search Queries (IEEE/WIC/ACM WI 2008) and Building a Scalable Collaborative Web Filter with Free and Open Source Software (IEEE SITIS 2008) are available for download. Enjoy!
]]></description>
			<content:encoded><![CDATA[<p>As promised, my papers <a href="http://www.michael-noll.com/blog/2008/09/05/the-metadata-triumvirate-social-annotations-anchor-texts-and-search-queries/">The Metadata Triumvirate: Social Annotations, Anchor Texts and Search Queries</a> (IEEE/WIC/ACM WI 2008) and <a href="http://www.michael-noll.com/blog/2008/09/17/building-a-scalable-collaborative-web-filter-with-free-and-open-source-software/">Building a Scalable Collaborative Web Filter with Free and Open Source Software</a> (IEEE SITIS 2008) are available for download. Enjoy!</p>
<div class="feedflare">
<a href="http://feeds.feedburner.com/~f/michael-noll?a=BSS5UtNu"><img src="http://feeds.feedburner.com/~f/michael-noll?d=41" border="0"></img></a> <a href="http://feeds.feedburner.com/~f/michael-noll?a=g5I2f8uT"><img src="http://feeds.feedburner.com/~f/michael-noll?i=g5I2f8uT" border="0"></img></a> <a href="http://feeds.feedburner.com/~f/michael-noll?a=JIgjolPp"><img src="http://feeds.feedburner.com/~f/michael-noll?i=JIgjolPp" border="0"></img></a> <a href="http://feeds.feedburner.com/~f/michael-noll?a=jaSaWhRe"><img src="http://feeds.feedburner.com/~f/michael-noll?d=52" border="0"></img></a>
</div><img src="http://feeds.feedburner.com/~r/michael-noll/~4/K51TK6MsaAo" height="1" width="1"/>]]></content:encoded>
			<wfw:commentRss>http://www.michael-noll.com/blog/2009/01/06/wi-2008-and-sitis-2008-papers-available-for-download/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
		<feedburner:origLink>http://www.michael-noll.com/blog/2009/01/06/wi-2008-and-sitis-2008-papers-available-for-download/</feedburner:origLink></item>
		<item>
		<title>CABS120k08: Data Corpus for Research in the Web 2.0, November 2008</title>
		<link>http://feedproxy.google.com/~r/michael-noll/~3/ToCiU24y7rs/</link>
		<comments>http://www.michael-noll.com/blog/2008/12/02/cabs120k08-data-corpus-for-research-in-the-web-20-november-2008/#comments</comments>
		<pubDate>Tue, 02 Dec 2008 03:34:16 +0000</pubDate>
		<dc:creator>Michael G. Noll</dc:creator>
				<category><![CDATA[Publications]]></category>
		<category><![CDATA[Research]]></category>
		<category><![CDATA[acm]]></category>
		<category><![CDATA[anchor texts]]></category>
		<category><![CDATA[aol500k]]></category>
		<category><![CDATA[backlinks]]></category>
		<category><![CDATA[bookmarks]]></category>
		<category><![CDATA[cabs120k078]]></category>
		<category><![CDATA[cabs120k08]]></category>
		<category><![CDATA[categories]]></category>
		<category><![CDATA[categorization]]></category>
		<category><![CDATA[corpus]]></category>
		<category><![CDATA[del.icio.us]]></category>
		<category><![CDATA[dmoz]]></category>
		<category><![CDATA[doceng]]></category>
		<category><![CDATA[google]]></category>
		<category><![CDATA[incoming hyperlinks]]></category>
		<category><![CDATA[inlinks]]></category>
		<category><![CDATA[metadata]]></category>
		<category><![CDATA[open directory project]]></category>
		<category><![CDATA[pagerank]]></category>
		<category><![CDATA[paper]]></category>
		<category><![CDATA[papers]]></category>
		<category><![CDATA[publication]]></category>
		<category><![CDATA[random-sample]]></category>
		<category><![CDATA[search queries]]></category>
		<category><![CDATA[social-bookmarking]]></category>
		<category><![CDATA[social-tagging]]></category>
		<category><![CDATA[study]]></category>
		<category><![CDATA[tagging]]></category>
		<category><![CDATA[web2.0]]></category>

		<guid isPermaLink="false">http://www.michael-noll.com/blog/?p=249</guid>
		<description><![CDATA[My CABS120k08 research data set is now available for download.
CABS120k08 is a large research data set about Web metadata based on a sample of 120,000 web documents in 2008 (=120k08) with data retrieved from the Open Directory Project, the AOL Search query log corpus AOL500k, Google PageRank, Delicious.com, and anchor text from incoming hyperlinks.
The data [...]]]></description>
			<content:encoded><![CDATA[<p>My <a href="http://www.michael-noll.com/wiki/CABS120k08">CABS120k08</a> research data set is now available for <a href="http://www.michael-noll.com/wiki/CABS120k08#Download">download</a>.</p>
<p><a href="http://www.michael-noll.com/wiki/CABS120k08">CABS120k08</a> is a large research data set about Web metadata based on a sample of 120,000 web documents in 2008 (=120k08) with data retrieved from the Open Directory Project, the AOL Search query log corpus AOL500k, Google PageRank, Delicious.com, and anchor text from incoming hyperlinks.</p>
<p>The data corpus is described in detail in my paper <a href="http://www.michael-noll.com/blog/2008/09/05/the-metadata-triumvirate-social-annotations-anchor-texts-and-search-queries/">The Metadata Triumvirate: Social Annotations, Anchor Texts and Search Queries</a>, for which the corpus was built. Enjoy!</p>
<p><span id="more-249"></span></p>
<div class="feedflare">
<a href="http://feeds.feedburner.com/~f/michael-noll?a=JHkcMU6Y"><img src="http://feeds.feedburner.com/~f/michael-noll?d=41" border="0"></img></a> <a href="http://feeds.feedburner.com/~f/michael-noll?a=cbw6xtuG"><img src="http://feeds.feedburner.com/~f/michael-noll?i=cbw6xtuG" border="0"></img></a> <a href="http://feeds.feedburner.com/~f/michael-noll?a=E5kJ2J0Y"><img src="http://feeds.feedburner.com/~f/michael-noll?i=E5kJ2J0Y" border="0"></img></a> <a href="http://feeds.feedburner.com/~f/michael-noll?a=TILv9awC"><img src="http://feeds.feedburner.com/~f/michael-noll?d=52" border="0"></img></a>
</div><img src="http://feeds.feedburner.com/~r/michael-noll/~4/ToCiU24y7rs" height="1" width="1"/>]]></content:encoded>
			<wfw:commentRss>http://www.michael-noll.com/blog/2008/12/02/cabs120k08-data-corpus-for-research-in-the-web-20-november-2008/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
		<feedburner:origLink>http://www.michael-noll.com/blog/2008/12/02/cabs120k08-data-corpus-for-research-in-the-web-20-november-2008/</feedburner:origLink></item>
		<item>
		<title>Building a Scalable Collaborative Web Filter with Free and Open Source Software</title>
		<link>http://feedproxy.google.com/~r/michael-noll/~3/qFqJb88EYW0/</link>
		<comments>http://www.michael-noll.com/blog/2008/09/17/building-a-scalable-collaborative-web-filter-with-free-and-open-source-software/#comments</comments>
		<pubDate>Wed, 17 Sep 2008 14:53:04 +0000</pubDate>
		<dc:creator>Michael G. Noll</dc:creator>
				<category><![CDATA[Development & Programming]]></category>
		<category><![CDATA[Publications]]></category>
		<category><![CDATA[Research]]></category>
		<category><![CDATA[Safer Internet]]></category>
		<category><![CDATA[Uncategorized]]></category>
		<category><![CDATA[add-on]]></category>
		<category><![CDATA[browser]]></category>
		<category><![CDATA[case study]]></category>
		<category><![CDATA[categorization]]></category>
		<category><![CDATA[classification]]></category>
		<category><![CDATA[content filtering]]></category>
		<category><![CDATA[content-filter]]></category>
		<category><![CDATA[filter]]></category>
		<category><![CDATA[filtering]]></category>
		<category><![CDATA[firefox]]></category>
		<category><![CDATA[floss]]></category>
		<category><![CDATA[foss]]></category>
		<category><![CDATA[free software]]></category>
		<category><![CDATA[hadoop]]></category>
		<category><![CDATA[ieee]]></category>
		<category><![CDATA[internet security]]></category>
		<category><![CDATA[mysql]]></category>
		<category><![CDATA[open source]]></category>
		<category><![CDATA[paper]]></category>
		<category><![CDATA[papers]]></category>
		<category><![CDATA[publication]]></category>
		<category><![CDATA[pylog]]></category>
		<category><![CDATA[pylons]]></category>
		<category><![CDATA[python]]></category>
		<category><![CDATA[security]]></category>
		<category><![CDATA[social-annotations]]></category>
		<category><![CDATA[social-bookmarking]]></category>
		<category><![CDATA[social-tagging]]></category>
		<category><![CDATA[tagging]]></category>
		<category><![CDATA[tags]]></category>
		<category><![CDATA[tokyo cabinet]]></category>
		<category><![CDATA[tokyo tyrant]]></category>
		<category><![CDATA[twisted]]></category>
		<category><![CDATA[web democracy]]></category>
		<category><![CDATA[web filter]]></category>
		<category><![CDATA[web2.0]]></category>

		<guid isPermaLink="false">http://www.michael-noll.com/blog/?p=208</guid>
		<description><![CDATA[My paper “Building a Scalable Collaborative Web Filter with Free and Open Source Software” has been accepted for publication and presentation at this year’s IEEE International Conference on Signal-Image Technology &#38; Internet-based Systems (SITIS) which will be held in Bali, Indonesia, from November 30 &#8211; December 03, 2008.


Abstract
In this case study, we describe the design [...]]]></description>
			<content:encoded><![CDATA[<p>My paper <em>“Building a Scalable Collaborative Web Filter with Free and Open Source Software”</em> has been accepted for publication and presentation at this year’s <a href="http://www.u-bourgogne.fr/SITIS/08/" target="_blank">IEEE International Conference on Signal-Image Technology &amp; Internet-based Systems (SITIS)</a> which will be held in Bali, Indonesia, from November 30 &#8211; December 03, 2008.</p>
<p><span id="more-208"></span></p>
<p><a href="http://www.u-bourgogne.fr/SITIS/08/" target="_blank"><img class="size-full wp-image-214" title="IEEE SITIS 2008 Conference Logo" src="http://www.michael-noll.com/blog/uploads/sitis2008-logo.png" alt="IEEE SITIS 2008 Conference Logo" width="201" height="152" /></a></p>
<h1>Abstract</h1>
<p>In this case study, we describe the design and architecture of a scalable collaborative web filtering service, TaggyBear, which is powered by free and open source software. We will introduce the reader to the ideas and concepts behind TaggyBear, and discuss why we picked the software components that form the basis of the service. We will talk about how we combined or extended their functionality to build the TaggyBear service, and provide some initial benchmarking results and performance figures.</p>
<p><em>Note for fellow developers: The described system components include <a title="Pylons" href="http://www.pylonshq.com/" target="_blank">Pylons</a>, <a title="MySQL Community Server" href="http://www.mysql.com/" target="_blank">MySQL</a>, <a href="http://tokyocabinet.sourceforge.net/" target="_blank">Tokyo Cabinet/Tokyo Tyrant</a>, Pylog (custom app based on <a title="Twisted" href="http://twistedmatrix.com/" target="_blank">Twisted</a>), <a title="Hadoop" href="http://hadoop.apache.org/core/" target="_blank">Hadoop</a>, and on the client side a <a href="http://www.mozilla.com/firefox/" target="_blank">Firefox Add-On</a>.</em></p>
<h1>Full Paper &amp; Presentation</h1>
<ul>
<li>M. G. Noll, C. Meinel<br />
<a title="Building a Scalable Collaborative Web Filter with Free and Open Source Software" href="/blog/uploads/Michael-Noll_TaggyBear_SITIS_2008.pdf">Building a Scalable Collaborative Web Filter with Free and Open Source Software</a> (PDF)<br />
Proceedings of 4th IEEE Signal-Image Technology &amp; Internet-based Systems (SITIS), IEEE CS Press, Bali, Indonesia, November 2008, pp. 563-571, ISBN 978-0-7695-3493-0 (<a href="http://ieeexplore.ieee.org/xpl/freeabs_all.jsp?isnumber=4725761&amp;arnumber=4725855">IEEE Link</a>, <a href="http://www.michael-noll.com/uploads/sitis2008.bib">BibTeX</a>)</li>
</ul>
<h1>Related Links</h1>
<ul>
<li><a href="/wiki/Publications">List of my publications</a></li>
<li><a href="/blog/2006/09/25/design-and-anatomy-of-a-social-web-filtering-service/">Design and Anatomy of a Social Web Filtering Service</a>, Proceedings of 4th International Conference on Cooperative Internet Computing (CIC), Hong Kong, October 2006, pp. 35-44, ISBN 978-981-281-109-7</li>
<li><a href="http://www.u-bourgogne.fr/SITIS/08/" target="_blank">4th IEEE International Conference on Signal-Image Technology &amp; Internet-based Systems (SITIS)</a>, Bali, Indonesia, November 2008</li>
</ul>
<div class="feedflare">
<a href="http://feeds.feedburner.com/~f/michael-noll?a=9MMiln0Z"><img src="http://feeds.feedburner.com/~f/michael-noll?d=41" border="0"></img></a> <a href="http://feeds.feedburner.com/~f/michael-noll?a=XGpQ1lNA"><img src="http://feeds.feedburner.com/~f/michael-noll?i=XGpQ1lNA" border="0"></img></a> <a href="http://feeds.feedburner.com/~f/michael-noll?a=9XeqQL2F"><img src="http://feeds.feedburner.com/~f/michael-noll?i=9XeqQL2F" border="0"></img></a> <a href="http://feeds.feedburner.com/~f/michael-noll?a=gdGugg6i"><img src="http://feeds.feedburner.com/~f/michael-noll?d=52" border="0"></img></a>
</div><img src="http://feeds.feedburner.com/~r/michael-noll/~4/qFqJb88EYW0" height="1" width="1"/>]]></content:encoded>
			<wfw:commentRss>http://www.michael-noll.com/blog/2008/09/17/building-a-scalable-collaborative-web-filter-with-free-and-open-source-software/feed/</wfw:commentRss>
		<slash:comments>2</slash:comments>
		<feedburner:origLink>http://www.michael-noll.com/blog/2008/09/17/building-a-scalable-collaborative-web-filter-with-free-and-open-source-software/</feedburner:origLink></item>
	</channel>
</rss>
