<?xml version="1.0" encoding="UTF-8"?>
<?xml-stylesheet type="text/xsl" media="screen" href="/~d/styles/atom10full.xsl"?><?xml-stylesheet type="text/css" media="screen" href="http://feeds.feedburner.com/~d/styles/itemcontent.css"?><feed xmlns="http://www.w3.org/2005/Atom" xmlns:feedburner="http://rssnamespace.org/feedburner/ext/1.0">
 
 <title>Born to be geek!</title>
 
 <link href="http://herraiz.org/blog/" />
 <updated>2013-05-17T18:07:47-07:00</updated>
 <id>http://herraiz.org/blog</id>
 <author>
   <name>Israel Herraiz</name>
   <email>isra@herraiz.org</email>
 </author>

 
 <atom10:link xmlns:atom10="http://www.w3.org/2005/Atom" rel="self" type="application/atom+xml" href="http://feeds.feedburner.com/herraiz/btbg" /><feedburner:info uri="herraiz/btbg" /><atom10:link xmlns:atom10="http://www.w3.org/2005/Atom" rel="hub" href="http://pubsubhubbub.appspot.com/" /><link rel="license" type="text/html" href="http://creativecommons.org/licenses/by-sa/3.0/" /><feedburner:emailServiceId>herraiz/btbg</feedburner:emailServiceId><feedburner:feedburnerHostname>http://feedburner.google.com</feedburner:feedburnerHostname><feedburner:feedFlare href="http://add.my.yahoo.com/rss?url=http%3A%2F%2Ffeeds.feedburner.com%2Fherraiz%2Fbtbg" src="http://us.i1.yimg.com/us.yimg.com/i/us/my/addtomyyahoo4.gif">Subscribe with My Yahoo!</feedburner:feedFlare><feedburner:feedFlare href="http://www.newsgator.com/ngs/subscriber/subext.aspx?url=http%3A%2F%2Ffeeds.feedburner.com%2Fherraiz%2Fbtbg" src="http://www.newsgator.com/images/ngsub1.gif">Subscribe with NewsGator</feedburner:feedFlare><feedburner:feedFlare href="http://feeds.my.aol.com/add.jsp?url=http%3A%2F%2Ffeeds.feedburner.com%2Fherraiz%2Fbtbg" src="http://o.aolcdn.com/favorites.my.aol.com/webmaster/ffclient/webroot/locale/en-US/images/myAOLButtonSmall.gif">Subscribe with My AOL</feedburner:feedFlare><feedburner:feedFlare href="http://www.bloglines.com/sub/http://feeds.feedburner.com/herraiz/btbg" src="http://www.bloglines.com/images/sub_modern11.gif">Subscribe with Bloglines</feedburner:feedFlare><feedburner:feedFlare href="http://www.netvibes.com/subscribe.php?url=http%3A%2F%2Ffeeds.feedburner.com%2Fherraiz%2Fbtbg" src="http://www.netvibes.com/img/add2netvibes.gif">Subscribe with Netvibes</feedburner:feedFlare><feedburner:feedFlare href="http://fusion.google.com/add?feedurl=http%3A%2F%2Ffeeds.feedburner.com%2Fherraiz%2Fbtbg" src="http://buttons.googlesyndication.com/fusion/add.gif">Subscribe with Google</feedburner:feedFlare><feedburner:feedFlare href="http://www.pageflakes.com/subscribe.aspx?url=http%3A%2F%2Ffeeds.feedburner.com%2Fherraiz%2Fbtbg" src="http://www.pageflakes.com/ImageFile.ashx?instanceId=Static_4&amp;fileName=ATP_blu_91x17.gif">Subscribe with Pageflakes</feedburner:feedFlare><feedburner:feedFlare href="http://www.plusmo.com/add?url=http%3A%2F%2Ffeeds.feedburner.com%2Fherraiz%2Fbtbg" src="http://plusmo.com/res/graphics/fbplusmo.gif">Subscribe with Plusmo</feedburner:feedFlare><feedburner:feedFlare href="http://www.thefreedictionary.com/_/hp/AddRSS.aspx?http%3A%2F%2Ffeeds.feedburner.com%2Fherraiz%2Fbtbg" src="http://img.tfd.com/hp/addToTheFreeDictionary.gif">Subscribe with The Free Dictionary</feedburner:feedFlare><feedburner:feedFlare href="http://www.bitty.com/manual/?contenttype=rssfeed&amp;contentvalue=http%3A%2F%2Ffeeds.feedburner.com%2Fherraiz%2Fbtbg" src="http://www.bitty.com/img/bittychicklet_91x17.gif">Subscribe with Bitty Browser</feedburner:feedFlare><feedburner:feedFlare href="http://www.newsalloy.com/?rss=http%3A%2F%2Ffeeds.feedburner.com%2Fherraiz%2Fbtbg" src="http://www.newsalloy.com/subrss3.gif">Subscribe with NewsAlloy</feedburner:feedFlare><feedburner:feedFlare href="http://www.live.com/?add=http%3A%2F%2Ffeeds.feedburner.com%2Fherraiz%2Fbtbg" src="http://tkfiles.storage.msn.com/x1piYkpqHC_35nIp1gLE68-wvzLZO8iXl_JMledmJQXP-XTBOLfmQv4zhj4MhcWEJh_GtoBIiAl1Mjh-ndp9k47If7hTaFno0mxW9_i3p_5qQw">Subscribe with Live.com</feedburner:feedFlare><feedburner:feedFlare href="http://mix.excite.eu/add?feedurl=http%3A%2F%2Ffeeds.feedburner.com%2Fherraiz%2Fbtbg" src="http://image.excite.co.uk/mix/addtomix.gif">Subscribe with Excite MIX</feedburner:feedFlare><feedburner:feedFlare href="http://download.attensa.com/app/get_attensa.html?feedurl=http%3A%2F%2Ffeeds.feedburner.com%2Fherraiz%2Fbtbg" src="http://www.attensa.com/blogs/attensa/WindowsLiveWriter/BadgeredintoBadges_10C02/attensa_feed_button5.gif">Subscribe with Attensa for Outlook</feedburner:feedFlare><feedburner:feedFlare href="http://www.webwag.com/wwgthis.php?url=http%3A%2F%2Ffeeds.feedburner.com%2Fherraiz%2Fbtbg" src="http://www.webwag.com/images/wwgthis.gif">Subscribe with Webwag</feedburner:feedFlare><feedburner:feedFlare href="http://www.podcastready.com/oneclick_bookmark.php?url=http%3A%2F%2Ffeeds.feedburner.com%2Fherraiz%2Fbtbg" src="http://www.podcastready.com/images/podcastready_button.gif">Subscribe with Podcast Ready</feedburner:feedFlare><feedburner:feedFlare href="http://www.flurry.com/pushRssFeed.do?r=fb&amp;url=http%3A%2F%2Ffeeds.feedburner.com%2Fherraiz%2Fbtbg" src="http://www.flurry.com/images/flurry_rss_logo2.gif">Subscribe with Flurry</feedburner:feedFlare><feedburner:feedFlare href="http://www.wikio.com/subscribe?url=http%3A%2F%2Ffeeds.feedburner.com%2Fherraiz%2Fbtbg" src="http://www.wikio.com/shared/img/add2wikio.gif">Subscribe with Wikio</feedburner:feedFlare><feedburner:feedFlare href="http://www.dailyrotation.com/index.php?feed=http%3A%2F%2Ffeeds.feedburner.com%2Fherraiz%2Fbtbg" src="http://www.dailyrotation.com/rss-dr2.gif">Subscribe with Daily Rotation</feedburner:feedFlare><entry>
   <title>Intensive Metrics for Software Evolution</title>
   <link href="http://feedproxy.google.com/~r/herraiz/btbg/~3/pJtJoDTzouI/" />
   <updated>2013-05-17T00:00:00-07:00</updated>
   <id>http://herraiz.org/blog/2013/05/17/intensive-metrics-for-software-evolution</id>
   <content type="html">&lt;p&gt;
In natural sciences, intensive metrics do not depend on the size of
the system (or amount of material) being measured. For instance, the
temperature of an object or the hardness of a material are intensive
properties.
&lt;/p&gt;
&lt;p&gt;
In the case of software projects, many of the metrics used to study
them are extensive, that is, the metrics depend on the size of the
system. Thus, it is hard to compare different software projects using
these metrics.
&lt;/p&gt;
&lt;p&gt;
For the case of the Apache Software Foundation, we have found some
ratios that are intensive properties, and we show how to use them to
study the evolution of different projects, comparing them regardless
their size, intended audience, technology used or maturity
state. The metrics are obtained from the ratios between communication
and development activies in the project. Interested? See a tag cloud
of the keywords of this paper: 
&lt;/p&gt;


&lt;!--
begin tag cloud : generated by TagCrowd.com
Feel free to modify as long as you keep this notice.

EMBEDDING INSTRUCTIONS:
1. Customize your cloud's style by editing the CSS where it says CUSTOMIZE below.
2. Insert this code in its entirety into your webpage or blog post.

This code and its rendered image are released under the Creative Commons Attribution-Noncommercial 3.0 Unported License. (http://creativecommons.org/licenses/by-nc/3.0/)

For COMMERCIAL USE LICENSING, visit http://tagcrowd.com/licensing.html
--&gt;
&lt;style type="text/css"&gt;&lt;!-- #htmltagcloud{

/******************************************
 * CUSTOMIZE CLOUD CSS BELOW (optional)
 */
 font-size: 100%;
 width: auto;/* auto or fixed width, e.g. 500px   */
 font-family:'lucida grande','trebuchet ms',arial,helvetica,sans-serif;
 background-color:#fff;
 margin:1em 1em 0 1em;
 border:2px dotted #ddd;
 padding:2em; 
/******************************************
 * END CUSTOMIZE
 */

}#htmltagcloud{line-height:2.4em;word-spacing:normal;letter-spacing:normal;text-transform:none;text-align:justify;text-indent:0}#htmltagcloud a:link{text-decoration:none}#htmltagcloud a:visited{text-decoration:none}#htmltagcloud a:hover{color:white;background-color:#05f}#htmltagcloud a:active{color:white;background-color:#03d}.wrd{padding:0;position:relative}.wrd a{text-decoration:none}.tagcloud0{font-size:1.0em;color:#ACC1F3;z-index:10}.tagcloud0 a{color:#ACC1F3}.tagcloud1{font-size:1.4em;color:#ACC1F3;z-index:9}.tagcloud1 a{color:#ACC1F3}.tagcloud2{font-size:1.8em;color:#86A0DC;z-index:8}.tagcloud2 a{color:#86A0DC}.tagcloud3{font-size:2.2em;color:#86A0DC;z-index:7}.tagcloud3 a{color:#86A0DC}.tagcloud4{font-size:2.6em;color:#607EC5;z-index:6}.tagcloud4 a{color:#607EC5}.tagcloud5{font-size:3.0em;color:#607EC5;z-index:5}.tagcloud5 a{color:#607EC5}.tagcloud6{font-size:3.3em;color:#4C6DB9;z-index:4}.tagcloud6 a{color:#4C6DB9}.tagcloud7{font-size:3.6em;color:#395CAE;z-index:3}.tagcloud7 a{color:#395CAE}.tagcloud8{font-size:3.9em;color:#264CA2;z-index:2}.tagcloud8 a{color:#264CA2}.tagcloud9{font-size:4.2em;color:#133B97;z-index:1}.tagcloud9 a{color:#133B97}.tagcloud10{font-size:4.5em;color:#002A8B;z-index:0}.tagcloud10 a{color:#002A8B}.freq{font-size:10pt !important;color:#bbb}#credit{text-align:center;color:#333;margin-bottom:0.6em;font:0.7em 'lucida grande',trebuchet,'trebuchet ms',verdana,arial,helvetica,sans-serif}#credit a:link{color:#777;text-decoration:none}#credit a:visited{color:#777;text-decoration:none}#credit a:hover{color:white;background-color:#05f}#credit a:active{text-decoration:underline}// --&gt;
&lt;/style&gt;

&lt;div id="htmltagcloud"&gt; &lt;span id="0" class="wrd tagcloud4"&gt;&lt;a href="#tagcloud"&gt;activity&lt;/a&gt;&lt;/span&gt; &lt;span id="1" class="wrd tagcloud0"&gt;&lt;a href="#tagcloud"&gt;annotated&lt;/a&gt;&lt;/span&gt; &lt;span id="2" class="wrd tagcloud5"&gt;&lt;a href="#tagcloud"&gt;apache&lt;/a&gt;&lt;/span&gt; &lt;span id="3" class="wrd tagcloud0"&gt;&lt;a href="#tagcloud"&gt;around&lt;/a&gt;&lt;/span&gt; &lt;span id="4" class="wrd tagcloud3"&gt;&lt;a href="#tagcloud"&gt;asf&lt;/a&gt;&lt;/span&gt; &lt;span id="5" class="wrd tagcloud1"&gt;&lt;a href="#tagcloud"&gt;code&lt;/a&gt;&lt;/span&gt; &lt;span id="6" class="wrd tagcloud5"&gt;&lt;a href="#tagcloud"&gt;commits&lt;/a&gt;&lt;/span&gt; &lt;span id="7" class="wrd tagcloud3"&gt;&lt;a href="#tagcloud"&gt;community&lt;/a&gt;&lt;/span&gt; &lt;span id="8" class="wrd tagcloud1"&gt;&lt;a href="#tagcloud"&gt;data&lt;/a&gt;&lt;/span&gt; &lt;span id="9" class="wrd tagcloud6"&gt;&lt;a href="#tagcloud"&gt;developer&lt;/a&gt;&lt;/span&gt; &lt;span id="10" class="wrd tagcloud0"&gt;&lt;a href="#tagcloud"&gt;different&lt;/a&gt;&lt;/span&gt; &lt;span id="11" class="wrd tagcloud0"&gt;&lt;a href="#tagcloud"&gt;discussion&lt;/a&gt;&lt;/span&gt; &lt;span id="12" class="wrd tagcloud1"&gt;&lt;a href="#tagcloud"&gt;email&lt;/a&gt;&lt;/span&gt; &lt;span id="13" class="wrd tagcloud2"&gt;&lt;a href="#tagcloud"&gt;evolution&lt;/a&gt;&lt;/span&gt; &lt;span id="14" class="wrd tagcloud1"&gt;&lt;a href="#tagcloud"&gt;fig&lt;/a&gt;&lt;/span&gt; &lt;span id="15" class="wrd tagcloud2"&gt;&lt;a href="#tagcloud"&gt;figure&lt;/a&gt;&lt;/span&gt; &lt;span id="16" class="wrd tagcloud0"&gt;&lt;a href="#tagcloud"&gt;found&lt;/a&gt;&lt;/span&gt; &lt;span id="17" class="wrd tagcloud0"&gt;&lt;a href="#tagcloud"&gt;hadoop&lt;/a&gt;&lt;/span&gt; &lt;span id="18" class="wrd tagcloud0"&gt;&lt;a href="#tagcloud"&gt;httpd&lt;/a&gt;&lt;/span&gt; &lt;span id="19" class="wrd tagcloud3"&gt;&lt;a href="#tagcloud"&gt;information&lt;/a&gt;&lt;/span&gt; &lt;span id="20" class="wrd tagcloud0"&gt;&lt;a href="#tagcloud"&gt;intensive&lt;/a&gt;&lt;/span&gt; &lt;span id="21" class="wrd tagcloud1"&gt;&lt;a href="#tagcloud"&gt;international&lt;/a&gt;&lt;/span&gt; &lt;span id="22" class="wrd tagcloud0"&gt;&lt;a href="#tagcloud"&gt;issue&lt;/a&gt;&lt;/span&gt; &lt;span id="23" class="wrd tagcloud0"&gt;&lt;a href="#tagcloud"&gt;lines&lt;/a&gt;&lt;/span&gt; &lt;span id="24" class="wrd tagcloud4"&gt;&lt;a href="#tagcloud"&gt;list&lt;/a&gt;&lt;/span&gt; &lt;span id="25" class="wrd tagcloud2"&gt;&lt;a href="#tagcloud"&gt;mailing&lt;/a&gt;&lt;/span&gt; &lt;span id="26" class="wrd tagcloud1"&gt;&lt;a href="#tagcloud"&gt;main&lt;/a&gt;&lt;/span&gt; &lt;span id="27" class="wrd tagcloud1"&gt;&lt;a href="#tagcloud"&gt;measures&lt;/a&gt;&lt;/span&gt; &lt;span id="28" class="wrd tagcloud4"&gt;&lt;a href="#tagcloud"&gt;messages&lt;/a&gt;&lt;/span&gt; &lt;span id="29" class="wrd tagcloud5"&gt;&lt;a href="#tagcloud"&gt;metric&lt;/a&gt;&lt;/span&gt; &lt;span id="30" class="wrd tagcloud3"&gt;&lt;a href="#tagcloud"&gt;number&lt;/a&gt;&lt;/span&gt; &lt;span id="31" class="wrd tagcloud1"&gt;&lt;a href="#tagcloud"&gt;open&lt;/a&gt;&lt;/span&gt; &lt;span id="32" class="wrd tagcloud1"&gt;&lt;a href="#tagcloud"&gt;paper&lt;/a&gt;&lt;/span&gt; &lt;span id="33" class="wrd tagcloud2"&gt;&lt;a href="#tagcloud"&gt;pp&lt;/a&gt;&lt;/span&gt; &lt;span id="34" class="wrd tagcloud10"&gt;&lt;a href="#tagcloud"&gt;projects&lt;/a&gt;&lt;/span&gt; &lt;span id="35" class="wrd tagcloud5"&gt;&lt;a href="#tagcloud"&gt;ratio&lt;/a&gt;&lt;/span&gt; &lt;span id="36" class="wrd tagcloud1"&gt;&lt;a href="#tagcloud"&gt;related&lt;/a&gt;&lt;/span&gt; &lt;span id="37" class="wrd tagcloud4"&gt;&lt;a href="#tagcloud"&gt;releases&lt;/a&gt;&lt;/span&gt; &lt;span id="38" class="wrd tagcloud1"&gt;&lt;a href="#tagcloud"&gt;results&lt;/a&gt;&lt;/span&gt; &lt;span id="39" class="wrd tagcloud1"&gt;&lt;a href="#tagcloud"&gt;shows&lt;/a&gt;&lt;/span&gt; &lt;span id="40" class="wrd tagcloud2"&gt;&lt;a href="#tagcloud"&gt;size&lt;/a&gt;&lt;/span&gt; &lt;span id="41" class="wrd tagcloud7"&gt;&lt;a href="#tagcloud"&gt;software&lt;/a&gt;&lt;/span&gt; &lt;span id="42" class="wrd tagcloud2"&gt;&lt;a href="#tagcloud"&gt;source&lt;/a&gt;&lt;/span&gt; &lt;span id="43" class="wrd tagcloud4"&gt;&lt;a href="#tagcloud"&gt;study&lt;/a&gt;&lt;/span&gt; &lt;span id="44" class="wrd tagcloud3"&gt;&lt;a href="#tagcloud"&gt;system&lt;/a&gt;&lt;/span&gt; &lt;span id="45" class="wrd tagcloud3"&gt;&lt;a href="#tagcloud"&gt;total&lt;/a&gt;&lt;/span&gt; &lt;span id="46" class="wrd tagcloud4"&gt;&lt;a href="#tagcloud"&gt;traffic&lt;/a&gt;&lt;/span&gt; &lt;span id="47" class="wrd tagcloud1"&gt;&lt;a href="#tagcloud"&gt;used&lt;/a&gt;&lt;/span&gt; &lt;span id="48" class="wrd tagcloud0"&gt;&lt;a href="#tagcloud"&gt;vertical&lt;/a&gt;&lt;/span&gt; &lt;span id="49" class="wrd tagcloud0"&gt;&lt;a href="#tagcloud"&gt;web&lt;/a&gt;&lt;/span&gt; &lt;/div&gt;&lt;div id="credit"&gt;created at &lt;a href="http://tagcrowd.com"&gt;TagCrowd.com&lt;/a&gt;&lt;/div&gt;

&lt;!-- end tag cloud : generated by TagCrowd.com : please keep this notice --&gt;

&lt;p&gt;
The paper is &lt;a href="http://oa.upm.es/14698/1/paper.pdf"&gt;available in PDF&lt;/a&gt;, and it can be cited using this BibTeX
code (also available as a &lt;a href="http://herraiz.org/bibtex/english/msr2013.txt"&gt;text file for your convenience&lt;/a&gt;):
&lt;/p&gt;



&lt;pre class="src src-bibtex"&gt;&lt;span style="font-weight: bold;"&gt;@InProceedings&lt;/span&gt;{&lt;span style="font-weight: bold; text-decoration: underline;"&gt;gala2013:apache&lt;/span&gt;,
  &lt;span style="font-weight: bold; font-style: italic;"&gt;author&lt;/span&gt;    =    {Santiago Gala-Perez
                  and Gregorio Robles
                  and Jesus M. Gonzalez-Barahona 
                  and Israel Herraiz},
  &lt;span style="font-weight: bold; font-style: italic;"&gt;title&lt;/span&gt;     =    {Intensive Metrics for the Study of the Evolution of Open Source Projects},
  &lt;span style="font-weight: bold; font-style: italic;"&gt;booktitle&lt;/span&gt; =    {10th IEEE Working Conference on Mining Software Repositories},
  &lt;span style="font-weight: bold; font-style: italic;"&gt;year&lt;/span&gt;      =    {2013},
  &lt;span style="font-weight: bold; font-style: italic;"&gt;address&lt;/span&gt;   =    {San Francisco, California, USA},
}
&lt;/pre&gt;


&lt;p&gt;
We are presenting this paper at the &lt;a href="http://2013.msrconf.org/"&gt;10th IEEE Working Conference on Mining Software Repositories&lt;/a&gt;, with the following slides (see &lt;a href="http://www.slideshare.net/herraiz/intensive-metrics-software-evolution"&gt;the slides at SlideShare.net&lt;/a&gt;):
&lt;/p&gt;


&lt;iframe src="http://www.slideshare.net/slideshow/embed_code/21354695" width="427" height="356" frameborder="0" marginwidth="0" marginheight="0" scrolling="no" style="border:1px solid #CCC;border-width:1px 1px 0;margin-bottom:5px" allowfullscreen webkitallowfullscreen mozallowfullscreen&gt; &lt;/iframe&gt; 

&lt;p&gt;
Finally, this work is derived from &lt;a href="http://eciencia.urjc.es/handle/10115/11518"&gt;Santiago Gala's master thesis&lt;/a&gt;,
available in PDF format and including full details about the study of
intensive metrics for software evolution. There is also a &lt;a href="http://gsyc.es/~grex/repro/2013-apache-intensive/"&gt;replication package&lt;/a&gt; that you can use to verify and extend our empirical study.
&lt;/p&gt;&lt;div class="feedflare"&gt;
&lt;a href="http://feeds.feedburner.com/~ff/herraiz/btbg?a=pJtJoDTzouI:1WTAZT_1zNs:I9og5sOYxJI"&gt;&lt;img src="http://feeds.feedburner.com/~ff/herraiz/btbg?d=I9og5sOYxJI" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/herraiz/btbg?a=pJtJoDTzouI:1WTAZT_1zNs:qj6IDK7rITs"&gt;&lt;img src="http://feeds.feedburner.com/~ff/herraiz/btbg?d=qj6IDK7rITs" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/herraiz/btbg?a=pJtJoDTzouI:1WTAZT_1zNs:ecdYMiMMAMM"&gt;&lt;img src="http://feeds.feedburner.com/~ff/herraiz/btbg?d=ecdYMiMMAMM" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/herraiz/btbg?a=pJtJoDTzouI:1WTAZT_1zNs:yIl2AUoC8zA"&gt;&lt;img src="http://feeds.feedburner.com/~ff/herraiz/btbg?d=yIl2AUoC8zA" border="0"&gt;&lt;/img&gt;&lt;/a&gt;
&lt;/div&gt;&lt;img src="http://feeds.feedburner.com/~r/herraiz/btbg/~4/pJtJoDTzouI" height="1" width="1"/&gt;</content>
 <feedburner:origLink>http://herraiz.org/blog/2013/05/17/intensive-metrics-for-software-evolution/</feedburner:origLink></entry>
 
 <entry>
   <title>Don't do empirical software engineering with Excel</title>
   <link href="http://feedproxy.google.com/~r/herraiz/btbg/~3/QJosNJWt5C8/" />
   <updated>2012-11-23T00:00:00-08:00</updated>
   <id>http://herraiz.org/blog/2012/11/23/dont-do-empirical-software-engineering-with-excel</id>
   <content type="html">&lt;p&gt;
Or any other statistical analysis. From time to time, I see papers
published in Empirical Software Engineering conferences and journals
that have used Excel for the statistical analyses (although I would
not point here to any of those papers :). I have not liked this much,
but it was mostly because of personal taste, and probably also a sort
of prejudice.
&lt;/p&gt;
&lt;p&gt;
But I found &lt;a href="http://www.pages.drexel.edu/%7Ebdm25/excel2007.pdf"&gt;this paper&lt;/a&gt; today:
&lt;/p&gt;
&lt;blockquote&gt;

&lt;p&gt;On the accuracy of statistical procedures in Microsoft Excel 2007 &lt;br/&gt;
B.D. McCullough , David A. Heiser &lt;br/&gt;
&lt;i&gt;Computational Statistics and Data Analysis&lt;/i&gt; 52 (2008) 4570–4578
&lt;/p&gt;
&lt;/blockquote&gt;


&lt;p&gt;
The paper remarks some of the flaws of Excel 2007 in standard
statistical methods. Two of the flaws are related to the least squares
fitting of exponential models, and to the normality plot of a sample
against the deciles of the Normal distribution. Apparently, this
situation has repeated since years ago with every new release of
Excel. Some of the problems have even been claimed to be fixed, while
the truth is that they remain providing wrong results.
&lt;/p&gt;
&lt;p&gt;
If you use Excel in your research, I think you would better consider
switching to &lt;a href="http://www.r-project.org/"&gt;GNU R&lt;/a&gt;, and its superb IDE &lt;a href="http://www.rstudio.com/ide/"&gt;R Studio&lt;/a&gt;.
&lt;/p&gt;&lt;div class="feedflare"&gt;
&lt;a href="http://feeds.feedburner.com/~ff/herraiz/btbg?a=QJosNJWt5C8:IrnShH26OY8:I9og5sOYxJI"&gt;&lt;img src="http://feeds.feedburner.com/~ff/herraiz/btbg?d=I9og5sOYxJI" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/herraiz/btbg?a=QJosNJWt5C8:IrnShH26OY8:qj6IDK7rITs"&gt;&lt;img src="http://feeds.feedburner.com/~ff/herraiz/btbg?d=qj6IDK7rITs" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/herraiz/btbg?a=QJosNJWt5C8:IrnShH26OY8:ecdYMiMMAMM"&gt;&lt;img src="http://feeds.feedburner.com/~ff/herraiz/btbg?d=ecdYMiMMAMM" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/herraiz/btbg?a=QJosNJWt5C8:IrnShH26OY8:yIl2AUoC8zA"&gt;&lt;img src="http://feeds.feedburner.com/~ff/herraiz/btbg?d=yIl2AUoC8zA" border="0"&gt;&lt;/img&gt;&lt;/a&gt;
&lt;/div&gt;&lt;img src="http://feeds.feedburner.com/~r/herraiz/btbg/~4/QJosNJWt5C8" height="1" width="1"/&gt;</content>
 <feedburner:origLink>http://herraiz.org/blog/2012/11/23/dont-do-empirical-software-engineering-with-excel/</feedburner:origLink></entry>
 
 <entry>
   <title>The impact of bias in bug-fix datasets for defects prediction</title>
   <link href="http://feedproxy.google.com/~r/herraiz/btbg/~3/n3SFur8NoBE/" />
   <updated>2012-04-15T00:00:00-07:00</updated>
   <id>http://herraiz.org/blog/2012/04/15/the-impact-of-bias-in-bugfix-datasets</id>
   <content type="html">&lt;p&gt;
Last week I gave &lt;a href="http://seminars.cs.ucdavis.edu/?type=1&amp;amp;when=past&amp;amp;talkid=263"&gt;a talk at UC Davis&lt;/a&gt; about the research work I will be
doing &lt;a href="http://herraiz.org/blog/2012/04/02/visiting-uc-davis/"&gt;during these months&lt;/a&gt;. It contains some preliminary results about
the impact of bias in bug-fix datasets.
&lt;/p&gt;
&lt;p&gt;
In projects with bug tracking systems and version control
repositories, when a commit corresponds to a bug fix, it is usually
marked accordingly (for instance, with a message like "Fixes
bug #123"). This information can be used to recover the relation
between commits and bugs, which is useful for defects prediction. The
preliminary results I have obtained so far, show that the impact of
bias is negligible for defects prediction if the model is based on a
binary classifier (that is, only predicts whether an entity will
contain or not defects, not how many defects it will
contain). However, it is true that a non-biased dataset can provide a
better accuracy, but just because, by definition, &lt;i&gt;non-biased datasets contain more data&lt;/i&gt;. If we reduce the size of a non-biased dataset, by
extracting a random sub-sample, it is as good as a biased dataset of
the same size. Well, at least for the two cases I have studied so far.
&lt;/p&gt;
&lt;p&gt;
More details in the slides. You can also &lt;a href="http://www.slideshare.net/herraiz/evaluating-the-presence-and-impact-of-bias-in-bugfix-datasets"&gt;see the slides at Slideshare.net, and get a PDF copy&lt;/a&gt;.
&lt;div style="width:425px" id="__ss_12494328"&gt; 
&lt;iframe src="http://www.slideshare.net/slideshow/embed_code/12494328" width="425" height="355" frameborder="0" marginwidth="0" marginheight="0" scrolling="no"&gt;&lt;/iframe&gt; 
&lt;/div&gt;
&lt;/p&gt;&lt;div class="feedflare"&gt;
&lt;a href="http://feeds.feedburner.com/~ff/herraiz/btbg?a=n3SFur8NoBE:XLlof0PS538:I9og5sOYxJI"&gt;&lt;img src="http://feeds.feedburner.com/~ff/herraiz/btbg?d=I9og5sOYxJI" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/herraiz/btbg?a=n3SFur8NoBE:XLlof0PS538:qj6IDK7rITs"&gt;&lt;img src="http://feeds.feedburner.com/~ff/herraiz/btbg?d=qj6IDK7rITs" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/herraiz/btbg?a=n3SFur8NoBE:XLlof0PS538:ecdYMiMMAMM"&gt;&lt;img src="http://feeds.feedburner.com/~ff/herraiz/btbg?d=ecdYMiMMAMM" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/herraiz/btbg?a=n3SFur8NoBE:XLlof0PS538:yIl2AUoC8zA"&gt;&lt;img src="http://feeds.feedburner.com/~ff/herraiz/btbg?d=yIl2AUoC8zA" border="0"&gt;&lt;/img&gt;&lt;/a&gt;
&lt;/div&gt;&lt;img src="http://feeds.feedburner.com/~r/herraiz/btbg/~4/n3SFur8NoBE" height="1" width="1"/&gt;</content>
 <feedburner:origLink>http://herraiz.org/blog/2012/04/15/the-impact-of-bias-in-bugfix-datasets/</feedburner:origLink></entry>
 
 <entry>
   <title>Visiting UC Davis</title>
   <link href="http://feedproxy.google.com/~r/herraiz/btbg/~3/xguDHjvA4XM/" />
   <updated>2012-04-02T00:00:00-07:00</updated>
   <id>http://herraiz.org/blog/2012/04/02/visiting-uc-davis</id>
   <content type="html">&lt;p&gt;
Since a couple of days ago, I am in Davis, California, for a 4-months
visit to &lt;a href="http://ucdavis.edu/"&gt;UC Davis&lt;/a&gt;, hosted by &lt;a href="http://www.cs.ucdavis.edu/~devanbu/"&gt;Prof. Prem Devanbu&lt;/a&gt;. This visit is
possible thanks to a &lt;a href="http://www.educacion.gob.es/educacion/universidades/convocatorias/titulados-doctores-profesores/estancias-profesores-centros-extranjeros/modalidad-b.html"&gt;"José Castillejo" grant&lt;/a&gt; awarded by the Spanish
Ministry of Education and Science.
&lt;/p&gt;
&lt;p&gt;
The main goal of this visit is to work on finding an automated method
to evaluate the bias in bugs datasets. This bias is introduced when
the bug-fix reports are linked with commits in the version control
system. When a developer accepts and/or fix a bug report, she decides
and accordingly marks the report with a severity level. In Bugzilla,
one of the most used bug tracking systems, a developer can mark
severity using a seven levels scale. In a &lt;a href="http://dl.acm.org/citation.cfm?id=1370786"&gt;previous paper&lt;/a&gt; (&lt;a href="http://herraiz.org/papers/english/msr84cp-herraiz.pdf"&gt;PDF available&lt;/a&gt;), I have shown that not all developers use the same criteria
to select the severity, and it should be enough with only three
levels. This difference in the developers criteria to mark and
classify bug reports is &lt;a href="http://dl.acm.org/citation.cfm?id=1595716"&gt;one of the sources of bias in the bug-fix datasets&lt;/a&gt; (&lt;a href="http://macbeth.cs.ucdavis.edu/biasbusters.pdf"&gt;PDF of the paper available&lt;/a&gt;). Another source of bias is
developer confidence; not all developers mark commits or bug reports
with commit ids when they are starting in a project, because they are
afraid of exposing themselves. However, those commits do correspond to
bug fixes, and should be accounted for in a bug-fix dataset.
&lt;/p&gt;
&lt;p&gt;
This bias disease affects the &lt;a href="http://www.st.cs.uni-saarland.de/softevo/bug-data/eclipse/"&gt;Eclipse Bug Data&lt;/a&gt; from &lt;a href="http://www.st.cs.uni-saarland.de/?lang=en"&gt;Software Engineering Chair at Saarland University&lt;/a&gt;, which is one of the main
data sources used for empirical software engineering. As an example, &lt;a href="http://ieeexplore.ieee.org/xpls/abs_all.jsp?arnumber=4407730"&gt;a paper studying the distribution of software bugs&lt;/a&gt; which was based on
that Eclipse data has generated &lt;a href="http://ieeexplore.ieee.org/xpls/abs_all.jsp?arnumber=5928349&amp;amp;tag=1"&gt;a response&lt;/a&gt; which has found other
better distribution fits, and that does not reuse the same dataset but
gathers the data directly from the original sources.
&lt;/p&gt;
&lt;p&gt;
Clearly, reusing datasets for empirical software engineering is a good
idea, which fosters reproducibility and verifiability, essential
properties of any empirical research discipline. However, if we can
not assure the quality of the reusable datasets, &lt;a href="http://www.springerlink.com/content/190151j3380051uj/"&gt;reusable datasets can cause more harm than benefits&lt;/a&gt;. 
&lt;/p&gt;
&lt;p&gt;
My goal with this visit is to apply statistical methods to evaluate
the bias in a bug-fix dataset. The two papers about the distribution
of bugs in Eclipse are an example of the kind of work I want to do. If
we can be sure of the quality and lack of bias of a dataset, carefully
built to act as a "canonical" dataset, we can compare other datasets
against that canonical dataset, to find out if there is any bias. The
two papers about Eclipse mentioned above show that the distribution of
bugs can vary in the presence of bias. The first paper used a biased
dataset, and the second paper repeated the data gathering process from
scratch, avoiding the use of the biased dataset. Although it can also
be due to methodological differences, they found different
distributions for software bugs.
&lt;/p&gt;
&lt;p&gt;
So my goal is to measure this difference in the distribution using a
statistical technique, to detect the presence of bias, and develop a
statistical test to find bias in reusable datasets. I am assuming here
that the distribution cannot change due to other factors (and &lt;a href="http://herraiz.org/blog/2011/11/01/popularity-bias-in-bug-datasets/"&gt;we already know that there are other sources of bias in bug reports&lt;/a&gt;), and
that the shape of the distribution is unique. The second assumption is
quite fair, but the first assumption is more complicated, and it will
require to find more than one dataset that is known to be
unbiased.
&lt;/p&gt;
&lt;p&gt;
I hope this work will provide a tool to assess the quality of a
bug-fix dataset, and to avoid the problems of bias, which are a threat
to the validity of all the empirical studies using these bug-fix
datasets.
&lt;/p&gt;&lt;div class="feedflare"&gt;
&lt;a href="http://feeds.feedburner.com/~ff/herraiz/btbg?a=xguDHjvA4XM:gv9EY9Xc5e8:I9og5sOYxJI"&gt;&lt;img src="http://feeds.feedburner.com/~ff/herraiz/btbg?d=I9og5sOYxJI" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/herraiz/btbg?a=xguDHjvA4XM:gv9EY9Xc5e8:qj6IDK7rITs"&gt;&lt;img src="http://feeds.feedburner.com/~ff/herraiz/btbg?d=qj6IDK7rITs" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/herraiz/btbg?a=xguDHjvA4XM:gv9EY9Xc5e8:ecdYMiMMAMM"&gt;&lt;img src="http://feeds.feedburner.com/~ff/herraiz/btbg?d=ecdYMiMMAMM" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/herraiz/btbg?a=xguDHjvA4XM:gv9EY9Xc5e8:yIl2AUoC8zA"&gt;&lt;img src="http://feeds.feedburner.com/~ff/herraiz/btbg?d=yIl2AUoC8zA" border="0"&gt;&lt;/img&gt;&lt;/a&gt;
&lt;/div&gt;&lt;img src="http://feeds.feedburner.com/~r/herraiz/btbg/~4/xguDHjvA4XM" height="1" width="1"/&gt;</content>
 <feedburner:origLink>http://herraiz.org/blog/2012/04/02/visiting-uc-davis/</feedburner:origLink></entry>
 
 <entry>
   <title>Popularity bias in bug datasets</title>
   <link href="http://feedproxy.google.com/~r/herraiz/btbg/~3/hMhb-mgDbxA/" />
   <updated>2011-11-01T00:00:00-07:00</updated>
   <id>http://herraiz.org/blog/2011/11/01/popularity-bias-in-bug-datasets</id>
   <content type="html">&lt;p&gt;
In recent times, the replicability of Software Engineering empirical
studies has become a main concern in the research community. One way
to achieve replicability is by reusing datasets, so everybody base
their results on the same data. However, if these datasets contain any
kind of problem, &lt;a href="http://www.springerlink.com/content/190151j3380051uj/"&gt;they could cause more harm than benefits&lt;/a&gt;.
&lt;/p&gt;
&lt;p&gt;
In the case of software defects, there are datasets that are known to
contain bias, mainly &lt;a href="http://ieeexplore.ieee.org/xpl/freeabs_all.jsp?arnumber=5645567"&gt;when referencing a fix to a particular bug report&lt;/a&gt;.
&lt;/p&gt;
&lt;p&gt;
We have studied a different kind of bias: &lt;i&gt;popularity bias&lt;/i&gt;. A
software project with less bugs is of higher quality. However, in open
source software development, more bugs may mean more quality. Why?
Because more &lt;i&gt;found&lt;/i&gt; bugs imply more people looking for those
bugs. This is, if you have no bugs it is because nobody is using your
software and reporting them. If you have more bugs, it is because your
software is popular; should your software be less popular, the number
of bugs would be lower. We have studied this effect in the case of
Debian, using the &lt;a href="http://udd.debian.org/"&gt;Ultimate Debian Database&lt;/a&gt;, and we indeed find that
only very popular Debian packages will present a very high number of
bugs, and that non-popular packages get very few bug reports.
&lt;/p&gt;
&lt;p&gt;
If you want to know more, &lt;a href="http://oa.upm.es/9585/1/paper.pdf"&gt;read our WCRE 2011 paper&lt;/a&gt;, entitled "Impact
of Installation Counts on Perceived Quality: A Case Study on
Debian". A tag cloud of the contents of the paper:
&lt;/p&gt;


&lt;!--
begin tag cloud : generated by TagCrowd.com
Feel free to modify as long as you keep this notice.

EMBEDDING INSTRUCTIONS:
1. Customize your cloud's style by editing the CSS where it says CUSTOMIZE below.
2. Insert this code in its entirety into your webpage or blog post.

This code and its rendered image are released under the Creative Commons Attribution-Noncommercial 3.0 Unported License. (http://creativecommons.org/licenses/by-nc/3.0/)

For COMMERCIAL USE LICENSING, visit http://tagcrowd.com/licensing.html
--&gt;
&lt;style type="text/css"&gt;&lt;!-- #htmltagcloud{

/******************************************
 * CUSTOMIZE CLOUD CSS BELOW (optional)
 */
font-size: 80%;
width: auto;/* auto or fixed width, e.g. 500px   */
font-family:'lucida grande','trebuchet ms',arial,helvetica,sans-serif;
background-color:#fff;
margin:1em 1em 0 1em;
border:2px dotted #ddd;
padding:2em; 
/******************************************
 * END CUSTOMIZE
 */

}#htmltagcloud{line-height:2.4em;word-spacing:normal;letter-spacing:normal;text-transform:none;text-align:justify;text-indent:0}#htmltagcloud a:link{text-decoration:none}#htmltagcloud a:visited{text-decoration:none}#htmltagcloud a:hover{color:white;background-color:#05f}#htmltagcloud a:active{color:white;background-color:#03d}.wrd{padding:0;position:relative}.wrd a{text-decoration:none}.tagcloud0{font-size:1.0em;color:#ACC1F3;z-index:10}.tagcloud0 a{color:#ACC1F3}.tagcloud1{font-size:1.4em;color:#ACC1F3;z-index:9}.tagcloud1 a{color:#ACC1F3}.tagcloud2{font-size:1.8em;color:#86A0DC;z-index:8}.tagcloud2 a{color:#86A0DC}.tagcloud3{font-size:2.2em;color:#86A0DC;z-index:7}.tagcloud3 a{color:#86A0DC}.tagcloud4{font-size:2.6em;color:#607EC5;z-index:6}.tagcloud4 a{color:#607EC5}.tagcloud5{font-size:3.0em;color:#607EC5;z-index:5}.tagcloud5 a{color:#607EC5}.tagcloud6{font-size:3.3em;color:#4C6DB9;z-index:4}.tagcloud6 a{color:#4C6DB9}.tagcloud7{font-size:3.6em;color:#395CAE;z-index:3}.tagcloud7 a{color:#395CAE}.tagcloud8{font-size:3.9em;color:#264CA2;z-index:2}.tagcloud8 a{color:#264CA2}.tagcloud9{font-size:4.2em;color:#133B97;z-index:1}.tagcloud9 a{color:#133B97}.tagcloud10{font-size:4.5em;color:#002A8B;z-index:0}.tagcloud10 a{color:#002A8B}.freq{font-size:10pt !important;color:#bbb}#credit{text-align:center;color:#333;margin-bottom:0.6em;font:0.7em 'lucida grande',trebuchet,'trebuchet ms',verdana,arial,helvetica,sans-serif}#credit a:link{color:#777;text-decoration:none}#credit a:visited{color:#777;text-decoration:none}#credit a:hover{color:white;background-color:#05f}#credit a:active{text-decoration:underline}// --&gt;
&lt;/style&gt;

&lt;div id="htmltagcloud"&gt; &lt;span id="0" class="wrd tagcloud1"&gt;&lt;a href="#tagcloud"&gt;age&lt;/a&gt;&lt;/span&gt; &lt;span id="1" class="wrd tagcloud1"&gt;&lt;a href="#tagcloud"&gt;analysis&lt;/a&gt;&lt;/span&gt; &lt;span id="2" class="wrd tagcloud0"&gt;&lt;a href="#tagcloud"&gt;binary&lt;/a&gt;&lt;/span&gt; &lt;span id="3" class="wrd tagcloud0"&gt;&lt;a href="#tagcloud"&gt;case&lt;/a&gt;&lt;/span&gt; &lt;span id="4" class="wrd tagcloud3"&gt;&lt;a href="#tagcloud"&gt;data&lt;/a&gt;&lt;/span&gt; &lt;span id="5" class="wrd tagcloud2"&gt;&lt;a href="#tagcloud"&gt;days&lt;/a&gt;&lt;/span&gt; &lt;span id="6" class="wrd tagcloud6"&gt;&lt;a href="#tagcloud"&gt;debian&lt;/a&gt;&lt;/span&gt; &lt;span id="7" class="wrd tagcloud10"&gt;&lt;a href="#tagcloud"&gt;defects&lt;/a&gt;&lt;/span&gt; &lt;span id="8" class="wrd tagcloud1"&gt;&lt;a href="#tagcloud"&gt;developers&lt;/a&gt;&lt;/span&gt; &lt;span id="9" class="wrd tagcloud2"&gt;&lt;a href="#tagcloud"&gt;different&lt;/a&gt;&lt;/span&gt; &lt;span id="10" class="wrd tagcloud0"&gt;&lt;a href="#tagcloud"&gt;distribution&lt;/a&gt;&lt;/span&gt; &lt;span id="11" class="wrd tagcloud0"&gt;&lt;a href="#tagcloud"&gt;engineering&lt;/a&gt;&lt;/span&gt; &lt;span id="12" class="wrd tagcloud3"&gt;&lt;a href="#tagcloud"&gt;fixed&lt;/a&gt;&lt;/span&gt; &lt;span id="13" class="wrd tagcloud3"&gt;&lt;a href="#tagcloud"&gt;groups&lt;/a&gt;&lt;/span&gt; &lt;span id="14" class="wrd tagcloud0"&gt;&lt;a href="#tagcloud"&gt;higher&lt;/a&gt;&lt;/span&gt; &lt;span id="15" class="wrd tagcloud1"&gt;&lt;a href="#tagcloud"&gt;installations&lt;/a&gt;&lt;/span&gt; &lt;span id="16" class="wrd tagcloud5"&gt;&lt;a href="#tagcloud"&gt;number&lt;/a&gt;&lt;/span&gt; &lt;span id="17" class="wrd tagcloud0"&gt;&lt;a href="#tagcloud"&gt;open&lt;/a&gt;&lt;/span&gt; &lt;span id="18" class="wrd tagcloud7"&gt;&lt;a href="#tagcloud"&gt;packages&lt;/a&gt;&lt;/span&gt; &lt;span id="19" class="wrd tagcloud7"&gt;&lt;a href="#tagcloud"&gt;popularity&lt;/a&gt;&lt;/span&gt; &lt;span id="20" class="wrd tagcloud1"&gt;&lt;a href="#tagcloud"&gt;quality&lt;/a&gt;&lt;/span&gt; &lt;span id="21" class="wrd tagcloud1"&gt;&lt;a href="#tagcloud"&gt;recent&lt;/a&gt;&lt;/span&gt; &lt;span id="22" class="wrd tagcloud1"&gt;&lt;a href="#tagcloud"&gt;relationship&lt;/a&gt;&lt;/span&gt; &lt;span id="23" class="wrd tagcloud4"&gt;&lt;a href="#tagcloud"&gt;reported&lt;/a&gt;&lt;/span&gt; &lt;span id="24" class="wrd tagcloud1"&gt;&lt;a href="#tagcloud"&gt;shows&lt;/a&gt;&lt;/span&gt; &lt;span id="25" class="wrd tagcloud6"&gt;&lt;a href="#tagcloud"&gt;software&lt;/a&gt;&lt;/span&gt; &lt;span id="26" class="wrd tagcloud4"&gt;&lt;a href="#tagcloud"&gt;source&lt;/a&gt;&lt;/span&gt; &lt;span id="27" class="wrd tagcloud1"&gt;&lt;a href="#tagcloud"&gt;study&lt;/a&gt;&lt;/span&gt; &lt;span id="28" class="wrd tagcloud1"&gt;&lt;a href="#tagcloud"&gt;system&lt;/a&gt;&lt;/span&gt; &lt;span id="29" class="wrd tagcloud2"&gt;&lt;a href="#tagcloud"&gt;users&lt;/a&gt;&lt;/span&gt; &lt;/div&gt;&lt;div id="credit"&gt;created at &lt;a href="http://tagcrowd.com"&gt;TagCrowd.com&lt;/a&gt;&lt;/div&gt;

&lt;!-- end tag cloud : generated by TagCrowd.com : please keep this notice --&gt;

&lt;p&gt;
To cite this paper, there is a &lt;a href="http://herraiz.org/bibtex/english/wcre2011.txt"&gt;BibTeX file available&lt;/a&gt;, or you can copy
from below
&lt;/p&gt;



&lt;pre class="src src-bibtex"&gt;&lt;span style="font-weight: bold;"&gt;@InProceedings&lt;/span&gt;{&lt;span style="font-weight: bold; text-decoration: underline;"&gt;debian_wcre2011&lt;/span&gt;,
  &lt;span style="font-weight: bold; font-style: italic;"&gt;author&lt;/span&gt; =       {Israel Herraiz and Emad Shihab and Thanh H.D. Nguyen and Ahmed E. Hassan},
  &lt;span style="font-weight: bold; font-style: italic;"&gt;title&lt;/span&gt; =        {Impact of Installation Counts on Perceived Quality: A Case Study on {D}ebian},
  &lt;span style="font-weight: bold; font-style: italic;"&gt;booktitle&lt;/span&gt; = {Proceedings of the 18th Working Conference on Reverse Engineering},
  &lt;span style="font-weight: bold; font-style: italic;"&gt;year&lt;/span&gt; =         {2011},
  &lt;span style="font-weight: bold; font-style: italic;"&gt;publisher&lt;/span&gt; = {IEEE Computer Society},
}
&lt;/pre&gt;

&lt;div class="feedflare"&gt;
&lt;a href="http://feeds.feedburner.com/~ff/herraiz/btbg?a=hMhb-mgDbxA:vCgMP54yuKY:I9og5sOYxJI"&gt;&lt;img src="http://feeds.feedburner.com/~ff/herraiz/btbg?d=I9og5sOYxJI" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/herraiz/btbg?a=hMhb-mgDbxA:vCgMP54yuKY:qj6IDK7rITs"&gt;&lt;img src="http://feeds.feedburner.com/~ff/herraiz/btbg?d=qj6IDK7rITs" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/herraiz/btbg?a=hMhb-mgDbxA:vCgMP54yuKY:ecdYMiMMAMM"&gt;&lt;img src="http://feeds.feedburner.com/~ff/herraiz/btbg?d=ecdYMiMMAMM" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/herraiz/btbg?a=hMhb-mgDbxA:vCgMP54yuKY:yIl2AUoC8zA"&gt;&lt;img src="http://feeds.feedburner.com/~ff/herraiz/btbg?d=yIl2AUoC8zA" border="0"&gt;&lt;/img&gt;&lt;/a&gt;
&lt;/div&gt;&lt;img src="http://feeds.feedburner.com/~r/herraiz/btbg/~4/hMhb-mgDbxA" height="1" width="1"/&gt;</content>
 <feedburner:origLink>http://herraiz.org/blog/2011/11/01/popularity-bias-in-bug-datasets/</feedburner:origLink></entry>
 
 
</feed>
