<?xml version="1.0" encoding="UTF-8"?>
<?xml-stylesheet type="text/xsl" media="screen" href="/~d/styles/atom10full.xsl"?><?xml-stylesheet type="text/css" media="screen" href="http://feeds.feedburner.com/~d/styles/itemcontent.css"?><feed xmlns="http://www.w3.org/2005/Atom" xmlns:openSearch="http://a9.com/-/spec/opensearch/1.1/" xmlns:georss="http://www.georss.org/georss" xmlns:gd="http://schemas.google.com/g/2005" xmlns:thr="http://purl.org/syndication/thread/1.0" xmlns:feedburner="http://rssnamespace.org/feedburner/ext/1.0" gd:etag="W/&quot;CkAERngzfCp7ImA9WhRaEkw.&quot;"><id>tag:blogger.com,1999:blog-8959227089815463704</id><updated>2012-02-14T17:11:47.684+08:00</updated><category term="pipelines" /><category term="clustering" /><category term="no_reference" /><category term="jokes" /><category term="tools" /><category term="FAQ" /><category term="sms" /><category term="news" /><category term="free" /><category term="Contrail" /><category term="privacy" /><category term="assembler" /><category term="poll" /><category term="NCBI" /><category term="genome" /><category term="bioinformatics" /><category term="samtools" /><category term="sed" /><category term="next-next" /><category term="chrome" /><category term="casper-rw" /><category term="transcriptome" /><category term="tab behaviour" /><category term="real-time PCR" /><category term="awk" /><category term="fasta" /><category term="qc" /><category term="de novo" /><category term="apps" /><category term="qual" /><category term="Life Technologies" /><category term="oral" /><category term="open access" /><category term="RNA-seq" /><category term="Nature" /><category term="tmap" /><category term="workshop" /><category term="rna seq" /><category term="talk" /><category term="boycott" /><category term="webinar" /><category term="small rna sequencing" /><category term="SureSelect" /><category term="humour" /><category term="HPC" /><category term="quality check" /><category term="snp" /><category term="convertors" /><category term="pdf" /><category term="316" /><category term="interview" /><category term="NFS" /><category term="Roche" /><category term="problems" /><category term="Pacific Biosciences" /><category term="pyrosequencing" /><category term="drivers" /><category term="De Brujin" /><category term="Agilent" /><category term="aegilops_tauschii" /><category term="SAET" /><category term="disease" /><category term="statistics" /><category term="framework" /><category term="life science" /><category term="ubuntu" /><category term="Broad Institute" /><category term="conferences" /><category term="google" /><category term="tophat" /><category term="NTFS" /><category term="bam" /><category term="SOLiD" /><category term="slides" /><category term="cluster" /><category term="mpileup" /><category term="magic" /><category term="solid_system" /><category term="perl" /><category term="#OpenAccess" /><category term="Bioconductor" /><category term="protocols" /><category term="flock" /><category term="IDE" /><category term="gut" /><category term="visualisation" /><category term="VM" /><category term="opensource" /><category term="survey" /><category term="shell" /><category term="ray" /><category term="solid 4 hq" /><category term="ABySS" /><category term="file format" /><category term="base_space" /><category term="depth" /><category term="virtual machine" /><category term="Personal Genomics" /><category term="DNAstar" /><category term="pendrive" /><category term="Sanger" /><category term="scripts" /><category term="1000 Genomes" /><category term="NGS" /><category term="paper" /><category term="plant" /><category term="experiment design" /><category term="coverage" /><category term="bmc_genomics" /><category term="boot" /><category term="cloud computing" /><category term="Molecular Diagnostics" /><category term="howto" /><category term="miRNA-seq" /><category term="colorspace" /><category term="multicore" /><category term="wheat_genome" /><category term="publishing" /><category term="AWS" /><category term="uniquely mapped" /><category term="torrent_server" /><category term="transcriptomics" /><category term="sequencing" /><category term="ATI" /><category term="mathematics" /><category term="index" /><category term="adaptor" /><category term="tea" /><category term="Partek" /><category term="human" /><category term="install" /><category term="cancer" /><category term="resequencing" /><category term="galaxy" /><category term="16s rRNA" /><category term="structural variation" /><category term="EST" /><category term="PGx" /><category term="Applied Biosystems" /><category term="ChIP-seq" /><category term="singleton" /><category term="whole transcriptome" /><category term="funding" /><category term="storage" /><category term="infectious disease" /><category term="alignment" /><category term="thumbdrive" /><category term="library" /><category term="big data" /><category term="trends" /><category term="troubleshooting" /><category term="bacterial" /><category term="firefox" /><category term="applications" /><category term="cost" /><category term="yum" /><category term="next-generation_sequencing" /><category term="microRNA" /><category term="tips" /><category term="journal" /><category term="fastq" /><category term="color_space" /><category term="Biomarkers" /><category term="PGM" /><category term="5500xl" /><category term="review" /><category term="future" /><category term="JCVI" /><category term="virtualbox" /><category term="LIMS" /><category term="bwa" /><category term="CentOS" /><category term="metagenomics" /><category term="hilbert curve" /><category term="cloud" /><category term="Paired end" /><category term="bash" /><category term="Bioethics" /><category term="filter" /><category term="3rd gen seq" /><category term="android" /><category term="intel" /><category term="whole genome" /><category term="software" /><category term="trimming" /><category term="AGBT" /><category term="microbial" /><category term="GS Junior" /><category term="methods" /><category term="crowdsourcing" /><category term="microarray" /><category term="microbiome" /><category term="differential expression" /><category term="cheat sheet" /><category term="url" /><category term="Illumina" /><category term="personalized medicine" /><category term="snv" /><category term="workflow" /><category term="usegalaxy" /><category term="9.10" /><category term="alt" /><category term="frank_you" /><category term="clinical" /><category term="uniq" /><category term="HiSeq" /><category term="benchmark" /><category term="youtube" /><category term="assembly" /><category term="Homo sapiens" /><category term="Amazon Web Services" /><category term="compression" /><category term="E. coli" /><category term="GWAS" /><category term="agile" /><category term="python" /><category term="Ion Torrent" /><category term="analysis" /><category term="comparison" /><category term="mirna" /><category term="browser" /><category term="Hadoop" /><category term="ABI" /><category term="bioperl" /><category term="parallel" /><category term="right" /><category term="BGI" /><category term="genomics" /><category term="Genetic Testing" /><category term="Next Generation Sequencing" /><category term="single cell" /><category term="single molecule sequencing" /><category term="reivew" /><category term="linux" /><category term="evolution." /><category term="bedtools" /><category term="454" /><category term="convert" /><category term="programming" /><category term="geospiza" /><category term="splitter" /><category term="tutorial" /><category term="velvet" /><category term="mapping" /><category term="variation" /><category term="samsung" /><category term="pubmed" /><category term="bioscope" /><category term="Nature Publishing Group" /><category term="Solexa" /><category term="bowtie" /><category term="5500" /><category term="exome" /><category term="data" /><category term="R" /><title>My Weblog on Bioinformatics, Genome Science, Next Generation Sequencing</title><subtitle type="html" /><link rel="http://schemas.google.com/g/2005#feed" type="application/atom+xml" href="http://kevin-gattaca.blogspot.com/feeds/posts/default" /><link rel="alternate" type="text/html" href="http://kevin-gattaca.blogspot.com/" /><link rel="next" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default?start-index=26&amp;max-results=25&amp;redirect=false&amp;v=2" /><author><name>Kevin</name><email>noreply@blogger.com</email><gd:image rel="http://schemas.google.com/g/2005#thumbnail" width="16" height="16" src="http://img2.blogblog.com/img/b16-rounded.gif" /></author><generator version="7.00" uri="http://www.blogger.com">Blogger</generator><openSearch:totalResults>574</openSearch:totalResults><openSearch:startIndex>1</openSearch:startIndex><openSearch:itemsPerPage>25</openSearch:itemsPerPage><atom10:link xmlns:atom10="http://www.w3.org/2005/Atom" rel="self" type="application/atom+xml" href="http://feeds.feedburner.com/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing" /><feedburner:info uri="myweblogonbioinformaticsgenomesciencenextgenerationsequencing" /><atom10:link xmlns:atom10="http://www.w3.org/2005/Atom" rel="hub" href="http://pubsubhubbub.appspot.com/" /><entry gd:etag="W/&quot;CkAERnk-fip7ImA9WhRaEkw.&quot;"><id>tag:blogger.com,1999:blog-8959227089815463704.post-8776469784801338804</id><published>2012-02-14T17:11:00.001+08:00</published><updated>2012-02-14T17:11:47.756+08:00</updated><app:edited xmlns:app="http://www.w3.org/2007/app">2012-02-14T17:11:47.756+08:00</app:edited><title>FAQ Admin/Data Libraries/Uploading Library Files local instance - Galaxy Wiki</title><content type="html">This is a FAQ that&amp;#39;s best answered in the Wiki page &lt;br&gt;the most intuitive is to use the web GUI to upload but this creates unnecessary overhead and slowdown when you can point to the files &lt;br&gt;&lt;br&gt;&lt;b&gt;Options for Uploading Files from the Admin Perspective&lt;/b&gt;&lt;br&gt;  &lt;br&gt;There are currently four options available to a Galaxy admin user for uploading files to a data library. Some of these same options are available to all regular users that have been granted permission to add items to a Data Library or folder, but &lt;b&gt;&lt;i&gt;this section describes the features from the Galaxy admin perspective which is accessed by clicking on the &amp;quot;Admin&amp;quot; link in the top Galaxy menu bar.&lt;/i&gt;&lt;/b&gt;&lt;br&gt;  &lt;a href="http://wiki.g2.bx.psu.edu/Admin/Data%20Libraries/Uploading%20Library%20Files"&gt;http://wiki.g2.bx.psu.edu/Admin/Data%20Libraries/Uploading%20Library%20Files&lt;/a&gt; &lt;div class="blogger-post-footer"&gt;&lt;img width='1' height='1' src='https://blogger.googleusercontent.com/tracker/8959227089815463704-8776469784801338804?l=kevin-gattaca.blogspot.com' alt='' /&gt;&lt;/div&gt;
&lt;p&gt;&lt;a href="http://feedads.g.doubleclick.net/~a/7cccblZsELOdkbToEFa7BXDhEQk/0/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/7cccblZsELOdkbToEFa7BXDhEQk/0/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;br/&gt;
&lt;a href="http://feedads.g.doubleclick.net/~a/7cccblZsELOdkbToEFa7BXDhEQk/1/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/7cccblZsELOdkbToEFa7BXDhEQk/1/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;/p&gt;&lt;img src="http://feeds.feedburner.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~4/Tozc8YEyl4o" height="1" width="1"/&gt;</content><link rel="replies" type="application/atom+xml" href="http://kevin-gattaca.blogspot.com/feeds/8776469784801338804/comments/default" title="Post Comments" /><link rel="replies" type="text/html" href="http://kevin-gattaca.blogspot.com/2012/02/faq-admindata-librariesuploading.html#comment-form" title="0 Comments" /><link rel="edit" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/8776469784801338804?v=2" /><link rel="self" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/8776469784801338804?v=2" /><link rel="alternate" type="text/html" href="http://feedproxy.google.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~3/Tozc8YEyl4o/faq-admindata-librariesuploading.html" title="FAQ Admin/Data Libraries/Uploading Library Files local instance - Galaxy Wiki" /><author><name>Kevin</name><email>noreply@blogger.com</email><gd:image rel="http://schemas.google.com/g/2005#thumbnail" width="16" height="16" src="http://img2.blogblog.com/img/b16-rounded.gif" /></author><thr:total>0</thr:total><feedburner:origLink>http://kevin-gattaca.blogspot.com/2012/02/faq-admindata-librariesuploading.html</feedburner:origLink></entry><entry gd:etag="W/&quot;CkEASHYzcSp7ImA9WhRaEU8.&quot;"><id>tag:blogger.com,1999:blog-8959227089815463704.post-2792251498708100090</id><published>2012-02-13T16:07:00.000+08:00</published><updated>2012-02-13T16:10:49.889+08:00</updated><app:edited xmlns:app="http://www.w3.org/2007/app">2012-02-13T16:10:49.889+08:00</app:edited><title>Get to Know Btrfs | Linux.com</title><content type="html">&lt;div dir="ltr" style="text-align: left;" trbidi="on"&gt;
&lt;a href="https://www.linux.com/learn/tutorials/533112-weekend-project-get-to-know-btrfs"&gt;https://www.linux.com/learn/tutorials/533112-weekend-project-get-to-know-btrfs&lt;/a&gt;&lt;br /&gt;
&lt;br /&gt;
As expected, Storage Spaces will indeed be a feature of both desktop and server editions of the operating system.  &lt;br /&gt;
If the feature does indeed ship in desktop Windows, it will overnight  obsolete a range of SOHO-oriented storage systems; products like Drobo  and ReadyNAS will find it hard to survive in a Windows 8 world.&lt;br /&gt;
&lt;br /&gt;
&lt;h3&gt;
  Btrfs Features&lt;/h3&gt;
&lt;ul&gt;
&lt;li&gt;   RAID 0, 1, 10&lt;/li&gt;
&lt;li&gt;   COW&lt;/li&gt;
&lt;li&gt;   Incremental backup&lt;/li&gt;
&lt;li&gt;   Online defrag&lt;/li&gt;
&lt;li&gt;   gzip and LZO compression&lt;/li&gt;
&lt;li&gt;   Space-efficient packing of small files&lt;/li&gt;
&lt;li&gt;   Dynamic inode allocation&lt;/li&gt;
&lt;li&gt;   Checksums on data and metadata&lt;/li&gt;
&lt;li&gt;   Shrink and grow storage volumes&lt;/li&gt;
&lt;li&gt;   Extents&lt;/li&gt;
&lt;li&gt;   Snapshots&lt;/li&gt;
&lt;li&gt;   16 EiB maximum file size&lt;/li&gt;
&lt;/ul&gt;
Planned features include RAID 5 and 6, &lt;a href="http://en.wikipedia.org/wiki/Data_deduplication"&gt;deduplication&lt;/a&gt;,  and a ready-for-primetime filesystem checker, btrfsck. You can try out  btrfsck now because it is included in btrfsprogs. (Which of course  Debian/Ubuntu/Mint etc. changes to btrfs-tools, and Fedora calls it  btrfs-progs.) But it is not ready for production systems yet.&lt;br /&gt;
Putting the finishing touches on btrfsck is the last big step before  Oracle makes it the default filesystem in their next Unbreakable Linux  release. Fedora 16 Linux was supposed to default to Btrfs, but now  they're aiming for Fedora 17 in May 2012.&lt;br /&gt;
&lt;br /&gt;
&lt;br /&gt;
also see&amp;nbsp;&lt;a href="https://btrfs.wiki.kernel.org/"&gt;https://btrfs.wiki.kernel.org/&lt;/a&gt;&lt;/div&gt;&lt;div class="blogger-post-footer"&gt;&lt;img width='1' height='1' src='https://blogger.googleusercontent.com/tracker/8959227089815463704-2792251498708100090?l=kevin-gattaca.blogspot.com' alt='' /&gt;&lt;/div&gt;
&lt;p&gt;&lt;a href="http://feedads.g.doubleclick.net/~a/19VWbyjm0CVbVZV0Hm91_IToQUI/0/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/19VWbyjm0CVbVZV0Hm91_IToQUI/0/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;br/&gt;
&lt;a href="http://feedads.g.doubleclick.net/~a/19VWbyjm0CVbVZV0Hm91_IToQUI/1/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/19VWbyjm0CVbVZV0Hm91_IToQUI/1/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;/p&gt;&lt;img src="http://feeds.feedburner.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~4/d2WaD5R4k7o" height="1" width="1"/&gt;</content><link rel="replies" type="application/atom+xml" href="http://kevin-gattaca.blogspot.com/feeds/2792251498708100090/comments/default" title="Post Comments" /><link rel="replies" type="text/html" href="http://kevin-gattaca.blogspot.com/2012/02/weekend-project-get-to-know-btrfs.html#comment-form" title="0 Comments" /><link rel="edit" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/2792251498708100090?v=2" /><link rel="self" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/2792251498708100090?v=2" /><link rel="alternate" type="text/html" href="http://feedproxy.google.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~3/d2WaD5R4k7o/weekend-project-get-to-know-btrfs.html" title="Get to Know Btrfs | Linux.com" /><author><name>Kevin</name><email>noreply@blogger.com</email><gd:image rel="http://schemas.google.com/g/2005#thumbnail" width="16" height="16" src="http://img2.blogblog.com/img/b16-rounded.gif" /></author><thr:total>0</thr:total><feedburner:origLink>http://kevin-gattaca.blogspot.com/2012/02/weekend-project-get-to-know-btrfs.html</feedburner:origLink></entry><entry gd:etag="W/&quot;Ck4BRXgzfip7ImA9WhRaEU8.&quot;"><id>tag:blogger.com,1999:blog-8959227089815463704.post-5881236921327062736</id><published>2012-02-13T16:01:00.000+08:00</published><updated>2012-02-13T16:15:54.686+08:00</updated><app:edited xmlns:app="http://www.w3.org/2007/app">2012-02-13T16:15:54.686+08:00</app:edited><title>Windows 8 Storage Spaces detailed: pooling redundant disk space for all</title><content type="html">&lt;div dir="ltr" style="text-align: left;" trbidi="on"&gt;
This will definitely change mainstream consumer ideas on backup and data storage .. maybe it will ripple down to labs who currently do not backup their data .. &lt;br /&gt;
&lt;br /&gt;
&lt;br /&gt;
&lt;div class="gmail_quote"&gt;
&lt;div bgcolor="#FFFFFF"&gt;
&lt;div&gt;
&lt;b&gt;Windows 8 Storage Spaces detailed: pooling redundant disk space for all&lt;/b&gt;&lt;br /&gt;
&lt;a href="http://arstechnica.com/microsoft/news/2012/01/windows-8-storage-spaces-detailed-pooling-redundant-disk-space-for-all.ars" target="_blank"&gt;&lt;/a&gt;&lt;a href="http://arstechnica.com/microsoft/news/2012/01/windows-8-storage-spaces-detailed-pooling-redundant-disk-space-for-all.ars" target="_blank"&gt;http://arstechnica.com/microsoft/news/2012/01/windows-8-storage-spaces-detailed-pooling-redundant-disk-space-for-all.ars&lt;/a&gt;&lt;br /&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;/div&gt;
&lt;/div&gt;
Unlike RAID systems of old, but in common with other modern storage  technologies such as Solaris' ZFS and Linux's btrfs, pools can use disks  of different interface technologies—USB, SATA, Serial Attached SCSI—and  different, mismatched sizes. New disks can be added to a pool at any  time. Pools can also include one or more hot spares: drives allocated to  a pool but kept in standby until another disk in the pool fails, at  which point they spring into life.&lt;br /&gt;
&lt;br /&gt;
As expected, Storage Spaces will indeed be a feature of both desktop and server editions of the operating system.  &lt;br /&gt;
If the feature does indeed ship in desktop Windows, it will overnight  obsolete a range of SOHO-oriented storage systems; products like Drobo  and ReadyNAS will find it hard to survive in a Windows 8 world.&lt;br /&gt;
&lt;br /&gt;&lt;/div&gt;&lt;div class="blogger-post-footer"&gt;&lt;img width='1' height='1' src='https://blogger.googleusercontent.com/tracker/8959227089815463704-5881236921327062736?l=kevin-gattaca.blogspot.com' alt='' /&gt;&lt;/div&gt;
&lt;p&gt;&lt;a href="http://feedads.g.doubleclick.net/~a/N1FjnRJRiAGzg4Sp8zmlGgpyBO0/0/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/N1FjnRJRiAGzg4Sp8zmlGgpyBO0/0/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;br/&gt;
&lt;a href="http://feedads.g.doubleclick.net/~a/N1FjnRJRiAGzg4Sp8zmlGgpyBO0/1/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/N1FjnRJRiAGzg4Sp8zmlGgpyBO0/1/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;/p&gt;&lt;img src="http://feeds.feedburner.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~4/CovIZm6ca8U" height="1" width="1"/&gt;</content><link rel="replies" type="application/atom+xml" href="http://kevin-gattaca.blogspot.com/feeds/5881236921327062736/comments/default" title="Post Comments" /><link rel="replies" type="text/html" href="http://kevin-gattaca.blogspot.com/2012/02/fwd-article-windows-8-storage-spaces.html#comment-form" title="0 Comments" /><link rel="edit" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/5881236921327062736?v=2" /><link rel="self" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/5881236921327062736?v=2" /><link rel="alternate" type="text/html" href="http://feedproxy.google.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~3/CovIZm6ca8U/fwd-article-windows-8-storage-spaces.html" title="Windows 8 Storage Spaces detailed: pooling redundant disk space for all" /><author><name>Kevin</name><email>noreply@blogger.com</email><gd:image rel="http://schemas.google.com/g/2005#thumbnail" width="16" height="16" src="http://img2.blogblog.com/img/b16-rounded.gif" /></author><thr:total>0</thr:total><feedburner:origLink>http://kevin-gattaca.blogspot.com/2012/02/fwd-article-windows-8-storage-spaces.html</feedburner:origLink></entry><entry gd:etag="W/&quot;CkYAQH0_eSp7ImA9WhRbGEk.&quot;"><id>tag:blogger.com,1999:blog-8959227089815463704.post-3500089100881411057</id><published>2012-02-10T10:15:00.001+08:00</published><updated>2012-02-10T10:15:41.341+08:00</updated><app:edited xmlns:app="http://www.w3.org/2007/app">2012-02-10T10:15:41.341+08:00</app:edited><title>Article: Running Python and R inside Emacs</title><content type="html">&lt;table class="moz-email-headers-table" border="0" cellpadding="0"       cellspacing="0"&gt;       &lt;tbody&gt;         &lt;tr&gt;           &lt;th align="RIGHT" nowrap="nowrap" valign="BASELINE"&gt;&lt;br&gt;           &lt;/th&gt;           &lt;td&gt;&lt;br&gt;           &lt;/td&gt;         &lt;/tr&gt;         &lt;tr&gt;           &lt;th align="RIGHT" nowrap="nowrap" valign="BASELINE"&gt;&lt;br&gt;           &lt;/th&gt;           &lt;td&gt;&lt;br&gt;           &lt;/td&gt;         &lt;/tr&gt;         &lt;tr&gt;           &lt;th align="RIGHT" nowrap="nowrap" valign="BASELINE"&gt;&lt;br&gt;           &lt;/th&gt;           &lt;td&gt;&lt;br&gt;           &lt;/td&gt;         &lt;/tr&gt;         &lt;tr&gt;           &lt;th align="RIGHT" nowrap="nowrap" valign="BASELINE"&gt;&lt;br&gt;           &lt;/th&gt;           &lt;td&gt;&lt;br&gt;           &lt;/td&gt;         &lt;/tr&gt;       &lt;/tbody&gt;     &lt;/table&gt;     &lt;div&gt;&lt;br&gt;       &lt;strong&gt;Running Python and R inside Emacs&lt;/strong&gt;&lt;br&gt;       &lt;a moz-do-not-send="true"         href="http://www.johndcook.com/blog/2012/02/09/python-org-mode/"&gt;http://www.johndcook.com/blog/2012/02/09/python-org-mode/&lt;/a&gt;&lt;br&gt;     &lt;/div&gt;     &lt;br&gt;   &lt;div class="blogger-post-footer"&gt;&lt;img width='1' height='1' src='https://blogger.googleusercontent.com/tracker/8959227089815463704-3500089100881411057?l=kevin-gattaca.blogspot.com' alt='' /&gt;&lt;/div&gt;
&lt;p&gt;&lt;a href="http://feedads.g.doubleclick.net/~a/_bGV-JqtVPo1SFjqlvVqOPomoII/0/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/_bGV-JqtVPo1SFjqlvVqOPomoII/0/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;br/&gt;
&lt;a href="http://feedads.g.doubleclick.net/~a/_bGV-JqtVPo1SFjqlvVqOPomoII/1/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/_bGV-JqtVPo1SFjqlvVqOPomoII/1/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;/p&gt;&lt;img src="http://feeds.feedburner.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~4/LW-wUmGl-jU" height="1" width="1"/&gt;</content><link rel="replies" type="application/atom+xml" href="http://kevin-gattaca.blogspot.com/feeds/3500089100881411057/comments/default" title="Post Comments" /><link rel="replies" type="text/html" href="http://kevin-gattaca.blogspot.com/2012/02/article-running-python-and-r-inside.html#comment-form" title="0 Comments" /><link rel="edit" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/3500089100881411057?v=2" /><link rel="self" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/3500089100881411057?v=2" /><link rel="alternate" type="text/html" href="http://feedproxy.google.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~3/LW-wUmGl-jU/article-running-python-and-r-inside.html" title="Article: Running Python and R inside Emacs" /><author><name>Kevin</name><email>noreply@blogger.com</email><gd:image rel="http://schemas.google.com/g/2005#thumbnail" width="16" height="16" src="http://img2.blogblog.com/img/b16-rounded.gif" /></author><thr:total>0</thr:total><feedburner:origLink>http://kevin-gattaca.blogspot.com/2012/02/article-running-python-and-r-inside.html</feedburner:origLink></entry><entry gd:etag="W/&quot;C04NSHs8cSp7ImA9WhRbGE0.&quot;"><id>tag:blogger.com,1999:blog-8959227089815463704.post-4047012398751842118</id><published>2012-02-09T23:39:00.001+08:00</published><updated>2012-02-09T23:39:59.579+08:00</updated><app:edited xmlns:app="http://www.w3.org/2007/app">2012-02-09T23:39:59.579+08:00</app:edited><title>Unix join on more than two files - Stack Overflow</title><content type="html">&lt;p&gt;&lt;a href="http://stackoverflow.com/questions/9212893/unix-join-on-more-than-two-files"&gt;http://stackoverflow.com/questions/9212893/unix-join-on-more-than-two-files&lt;/a&gt;&lt;br&gt;&lt;/p&gt; &lt;p&gt;This has to be useful someday ... &lt;/p&gt; &lt;div class="blogger-post-footer"&gt;&lt;img width='1' height='1' src='https://blogger.googleusercontent.com/tracker/8959227089815463704-4047012398751842118?l=kevin-gattaca.blogspot.com' alt='' /&gt;&lt;/div&gt;
&lt;p&gt;&lt;a href="http://feedads.g.doubleclick.net/~a/H8XPVHdMfGPpB9adsXuIoGE_PyE/0/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/H8XPVHdMfGPpB9adsXuIoGE_PyE/0/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;br/&gt;
&lt;a href="http://feedads.g.doubleclick.net/~a/H8XPVHdMfGPpB9adsXuIoGE_PyE/1/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/H8XPVHdMfGPpB9adsXuIoGE_PyE/1/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;/p&gt;&lt;img src="http://feeds.feedburner.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~4/y40_QiLGDkc" height="1" width="1"/&gt;</content><link rel="replies" type="application/atom+xml" href="http://kevin-gattaca.blogspot.com/feeds/4047012398751842118/comments/default" title="Post Comments" /><link rel="replies" type="text/html" href="http://kevin-gattaca.blogspot.com/2012/02/unix-join-on-more-than-two-files-stack.html#comment-form" title="0 Comments" /><link rel="edit" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/4047012398751842118?v=2" /><link rel="self" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/4047012398751842118?v=2" /><link rel="alternate" type="text/html" href="http://feedproxy.google.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~3/y40_QiLGDkc/unix-join-on-more-than-two-files-stack.html" title="Unix join on more than two files - Stack Overflow" /><author><name>Kevin</name><email>noreply@blogger.com</email><gd:image rel="http://schemas.google.com/g/2005#thumbnail" width="16" height="16" src="http://img2.blogblog.com/img/b16-rounded.gif" /></author><thr:total>0</thr:total><feedburner:origLink>http://kevin-gattaca.blogspot.com/2012/02/unix-join-on-more-than-two-files-stack.html</feedburner:origLink></entry><entry gd:etag="W/&quot;CUMERXw7eip7ImA9WhRbF0o.&quot;"><id>tag:blogger.com,1999:blog-8959227089815463704.post-7370584689850391094</id><published>2012-02-09T15:42:00.000+08:00</published><updated>2012-02-09T15:43:24.202+08:00</updated><app:edited xmlns:app="http://www.w3.org/2007/app">2012-02-09T15:43:24.202+08:00</app:edited><title>ea-utils - FASTQ processing utilities - Google Project Hosting</title><content type="html">didn&amp;#39;t cc Rick cos he&amp;#39;s away, heh share with him later .. &lt;br&gt;&lt;br&gt;&lt;a href="http://code.google.com/p/ea-utils/"&gt;http://code.google.com/p/ea-utils/&lt;/a&gt;&lt;br&gt;&lt;br&gt;&lt;p&gt;Suite of processing tools for sequencing output.  Barcode demultiplexing, adapter trimming, etc. &lt;/p&gt;  &lt;p&gt;Primarily written to support an Illumina based pipeline - but should work with any FASTQs. &lt;/p&gt;&lt;h3&gt;&lt;a name="Overview:"&gt;&lt;/a&gt;Overview:&lt;/h3&gt;&lt;ul&gt;&lt;li&gt;&lt;a href="http://code.google.com/p/ea-utils/wiki/FastqMcf"&gt;fastq-mcf&lt;/a&gt; &lt;/li&gt;  &lt;blockquote&gt;Scans  a sequence file for adapters, and, based on a log-scaled threshold,  determines a set of clipping parameters and performs clipping.  Also  does skewing detection and quality filtering.  &lt;/blockquote&gt;&lt;li&gt;&lt;a href="http://code.google.com/p/ea-utils/wiki/FastqMultx"&gt;fastq-multx&lt;/a&gt; &lt;/li&gt;&lt;blockquote&gt;Demultiplexes  a fastq.  Capable of auto-determining barcode id&amp;#39;s based on a master  set fields.  Keeps multiple reads in-sync during demultiplexing.  Can  verify that the reads are in-sync as well, and fail if they&amp;#39;re not.  &lt;/blockquote&gt;&lt;li&gt;&lt;a href="http://code.google.com/p/ea-utils/wiki/FastqJoin"&gt;fastq-join&lt;/a&gt; &lt;/li&gt;&lt;blockquote&gt;Similar  to audy&amp;#39;s stitch program, but in C, more efficient and supports some  automatic benchmarking and tuning. It uses the same &amp;quot;squared distance  for anchored alignment&amp;quot; as other tools.  &lt;/blockquote&gt;&lt;/ul&gt;&lt;h3&gt;&lt;a name="Other_Stuff:"&gt;&lt;/a&gt;Other Stuff:&lt;/h3&gt;&lt;ul&gt;&lt;li&gt;&lt;a href="http://code.google.com/p/ea-utils/wiki/SamStats"&gt;sam-stats&lt;/a&gt;  - Basic sam/bam stats.  Like other tools, but produces what I want to  look at, in a format suitable for passing to other programs.  (&lt;a href="http://ea-utils.googlecode.com/svn/trunk/clipper/sam-stats" rel="nofollow"&gt;Click for source&lt;/a&gt;) &lt;/li&gt;&lt;/ul&gt;&lt;ul&gt;&lt;li&gt;fastq-stats - Basic fastq stats.  Counts duplicates. Option for per-cycle stats, or not (irrelevant for many sequencers).    (&lt;a href="http://ea-utils.googlecode.com/svn/trunk/clipper/fastq-stats" rel="nofollow"&gt;Click for source&lt;/a&gt;) &lt;/li&gt;  &lt;/ul&gt;&lt;ul&gt;&lt;li&gt;determine-phred - Returns the phred scale of the input file. Works with sams, fastq&amp;#39;s or pileups and gzipped files. &lt;/li&gt;&lt;/ul&gt;&lt;ul&gt;&lt;li&gt;Chrdex.pm  - indexes a delimited file by chromosome start/stop.  There are lots of  tools for this.   This one works pretty well if you&amp;#39;re a perl user.  It  handles overlapping regions reasonably well.  It uses RAM comparable to  the size of the annotation file. &lt;/li&gt;&lt;/ul&gt;&lt;ul&gt;&lt;li&gt;Sqldex.pm - just like Chrdex.pm, except uses a disk-based btree.  Not as fast, but close, and uses very little RAM. &lt;/li&gt;&lt;/ul&gt;&lt;ul&gt;&lt;li&gt;qsh  - Runs a bash script file like a &amp;quot;cluster aware makefile&amp;quot;...only  processing newer things, die&amp;#39;ing if things go wrong, and sending jobs to  a queue manager if they&amp;#39;re big.  That way you don&amp;#39;t have to write  makefiles, or wrap things in &amp;quot;qsub&amp;quot; calls for every little program.  Not  really ready yet. &lt;/li&gt;&lt;/ul&gt;&lt;ul&gt;&lt;li&gt;grun - Fast, lightweight grid queue software.  Keeps the job queue on disk at all times.  Very fast.   Works well by now &lt;/li&gt;&lt;/ul&gt;&lt;ul&gt;&lt;li&gt;gwrap  - Bash wrapper shell that downloads all dependencies that are not the  local system.... good for EC2 nodes.  Linux only.   Will use it if we  ever go to EC2. &lt;/li&gt;&lt;/ul&gt;&lt;br&gt; &lt;div class="blogger-post-footer"&gt;&lt;img width='1' height='1' src='https://blogger.googleusercontent.com/tracker/8959227089815463704-7370584689850391094?l=kevin-gattaca.blogspot.com' alt='' /&gt;&lt;/div&gt;
&lt;p&gt;&lt;a href="http://feedads.g.doubleclick.net/~a/WhJCHTVG8-ObyHFAqXfeaXsxsfQ/0/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/WhJCHTVG8-ObyHFAqXfeaXsxsfQ/0/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;br/&gt;
&lt;a href="http://feedads.g.doubleclick.net/~a/WhJCHTVG8-ObyHFAqXfeaXsxsfQ/1/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/WhJCHTVG8-ObyHFAqXfeaXsxsfQ/1/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;/p&gt;&lt;img src="http://feeds.feedburner.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~4/_S9eqIyhe34" height="1" width="1"/&gt;</content><link rel="replies" type="application/atom+xml" href="http://kevin-gattaca.blogspot.com/feeds/7370584689850391094/comments/default" title="Post Comments" /><link rel="replies" type="text/html" href="http://kevin-gattaca.blogspot.com/2012/02/ea-utils-fastq-processing-utilities.html#comment-form" title="0 Comments" /><link rel="edit" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/7370584689850391094?v=2" /><link rel="self" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/7370584689850391094?v=2" /><link rel="alternate" type="text/html" href="http://feedproxy.google.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~3/_S9eqIyhe34/ea-utils-fastq-processing-utilities.html" title="ea-utils - FASTQ processing utilities - Google Project Hosting" /><author><name>Kevin</name><email>noreply@blogger.com</email><gd:image rel="http://schemas.google.com/g/2005#thumbnail" width="16" height="16" src="http://img2.blogblog.com/img/b16-rounded.gif" /></author><thr:total>0</thr:total><feedburner:origLink>http://kevin-gattaca.blogspot.com/2012/02/ea-utils-fastq-processing-utilities.html</feedburner:origLink></entry><entry gd:etag="W/&quot;AkYMR3Y9fip7ImA9WhRbFk8.&quot;"><id>tag:blogger.com,1999:blog-8959227089815463704.post-6824568162845164730</id><published>2012-02-07T23:23:00.001+08:00</published><updated>2012-02-07T23:23:06.866+08:00</updated><app:edited xmlns:app="http://www.w3.org/2007/app">2012-02-07T23:23:06.866+08:00</app:edited><title>Amazon S3 Lowers Standard Storage Prices</title><content type="html">&lt;p&gt;&lt;/p&gt; &lt;p&gt;Dear Amazon S3 Customer,&lt;/p&gt; &lt;p&gt;We are excited to announce that we have reduced the Amazon S3 standard storage prices in all regions. With this price change, all Amazon S3 standard storage customers will see a reduction in their storage costs. For instance, if you store 50 TB of data on average, you'll see a 12% reduction in costs. If you store 500 TB of data on average, you'll see a 13.5% reduction in costs. The price reduction applies to all of your standard storage- both existing storage and all new storage you add. Here is a summary of price changes for the US Standard region:&lt;/p&gt;  &lt;p&gt;                          Old         New&lt;br&gt; First 1TB           $0.140    $0.125&lt;br&gt; Next 49TB         $0.125    $0.110&lt;br&gt; Next 450TB       $0.110    $0.095 &lt;br&gt; Next 500TB       $0.095    $0.090&lt;br&gt; Next 4000TB     $0.080    $0.080 (no change)&lt;br&gt; Over 5000TB     $0.055    $0.055 (no change)&lt;/p&gt; &lt;p&gt;The new lower prices for all regions can be found on the Amazon S3 Detail Page. New prices are effective February 1st and will be applied to your bill for all storage on or after this date.&lt;/p&gt; &lt;p&gt;We are happy to pass along these savings to you as we continue to innovate and drive down our costs.&lt;/p&gt; &lt;p&gt;Sincerely,&lt;br&gt; The Amazon S3 Team&lt;/p&gt; &lt;p&gt;We hope you enjoyed receiving this message. If you wish to remove yourself from receiving future product announcements and the monthly AWS Newsletter, please update your communication preferences.&lt;/p&gt; &lt;p&gt;Amazon Web Services LLC is a subsidiary of Amazon.com, Inc. Amazon.com is a registered trademark of Amazon.com, Inc. This message produced and distributed by Amazon Web Services, LLC, 1918 8th Avenue, Seattle, WA 98101.&lt;/p&gt;  &lt;div class="blogger-post-footer"&gt;&lt;img width='1' height='1' src='https://blogger.googleusercontent.com/tracker/8959227089815463704-6824568162845164730?l=kevin-gattaca.blogspot.com' alt='' /&gt;&lt;/div&gt;
&lt;p&gt;&lt;a href="http://feedads.g.doubleclick.net/~a/HrYiauIfymo6Y-WBdPsUP-uFMNo/0/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/HrYiauIfymo6Y-WBdPsUP-uFMNo/0/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;br/&gt;
&lt;a href="http://feedads.g.doubleclick.net/~a/HrYiauIfymo6Y-WBdPsUP-uFMNo/1/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/HrYiauIfymo6Y-WBdPsUP-uFMNo/1/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;/p&gt;&lt;img src="http://feeds.feedburner.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~4/t9ABfMW2VfY" height="1" width="1"/&gt;</content><link rel="replies" type="application/atom+xml" href="http://kevin-gattaca.blogspot.com/feeds/6824568162845164730/comments/default" title="Post Comments" /><link rel="replies" type="text/html" href="http://kevin-gattaca.blogspot.com/2012/02/amazon-s3-lowers-standard-storage.html#comment-form" title="0 Comments" /><link rel="edit" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/6824568162845164730?v=2" /><link rel="self" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/6824568162845164730?v=2" /><link rel="alternate" type="text/html" href="http://feedproxy.google.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~3/t9ABfMW2VfY/amazon-s3-lowers-standard-storage.html" title="Amazon S3 Lowers Standard Storage Prices" /><author><name>Kevin</name><email>noreply@blogger.com</email><gd:image rel="http://schemas.google.com/g/2005#thumbnail" width="16" height="16" src="http://img2.blogblog.com/img/b16-rounded.gif" /></author><thr:total>0</thr:total><feedburner:origLink>http://kevin-gattaca.blogspot.com/2012/02/amazon-s3-lowers-standard-storage.html</feedburner:origLink></entry><entry gd:etag="W/&quot;AkMFRHc7eCp7ImA9WhRbFk0.&quot;"><id>tag:blogger.com,1999:blog-8959227089815463704.post-7892051686369847345</id><published>2012-02-07T17:52:00.000+08:00</published><updated>2012-02-07T17:53:35.900+08:00</updated><app:edited xmlns:app="http://www.w3.org/2007/app">2012-02-07T17:53:35.900+08:00</app:edited><title>Google Refine is a power tool for working with messy data sets</title><content type="html">&lt;a href="http://google-refine.blogspot.com/"&gt;http://google-refine.blogspot.com/&lt;/a&gt;&lt;br&gt;&lt;br&gt;&lt;a href="http://code.google.com/p/google-refine/"&gt;Google Refine&lt;/a&gt; is a  power tool for working with messy data sets, including cleaning up  inconsistencies, transforming them from one format into another, and  extending them with new data from external web services or other  databases.  Version 2.0 introduces a new extensions architecture, a  reconciliation framework for linking records to other databases (like &lt;a href="http://www.freebase.com/"&gt;Freebase&lt;/a&gt;), and a ton of &lt;a href="http://code.google.com/p/google-refine/wiki/ChangesFor2p0"&gt;new transformation commands and expressions&lt;/a&gt;.&lt;br&gt;  &lt;div class="blogger-post-footer"&gt;&lt;img width='1' height='1' src='https://blogger.googleusercontent.com/tracker/8959227089815463704-7892051686369847345?l=kevin-gattaca.blogspot.com' alt='' /&gt;&lt;/div&gt;
&lt;p&gt;&lt;a href="http://feedads.g.doubleclick.net/~a/0SYC3W14TyBas3RiEn77C-VCa0A/0/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/0SYC3W14TyBas3RiEn77C-VCa0A/0/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;br/&gt;
&lt;a href="http://feedads.g.doubleclick.net/~a/0SYC3W14TyBas3RiEn77C-VCa0A/1/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/0SYC3W14TyBas3RiEn77C-VCa0A/1/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;/p&gt;&lt;img src="http://feeds.feedburner.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~4/xBNm3MLSCAI" height="1" width="1"/&gt;</content><link rel="replies" type="application/atom+xml" href="http://kevin-gattaca.blogspot.com/feeds/7892051686369847345/comments/default" title="Post Comments" /><link rel="replies" type="text/html" href="http://kevin-gattaca.blogspot.com/2012/02/google-refine-is-power-tool-for-working.html#comment-form" title="0 Comments" /><link rel="edit" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/7892051686369847345?v=2" /><link rel="self" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/7892051686369847345?v=2" /><link rel="alternate" type="text/html" href="http://feedproxy.google.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~3/xBNm3MLSCAI/google-refine-is-power-tool-for-working.html" title="Google Refine is a power tool for working with messy data sets" /><author><name>Kevin</name><email>noreply@blogger.com</email><gd:image rel="http://schemas.google.com/g/2005#thumbnail" width="16" height="16" src="http://img2.blogblog.com/img/b16-rounded.gif" /></author><thr:total>0</thr:total><feedburner:origLink>http://kevin-gattaca.blogspot.com/2012/02/google-refine-is-power-tool-for-working.html</feedburner:origLink></entry><entry gd:etag="W/&quot;CkUFRn05fCp7ImA9WhRbFUw.&quot;"><id>tag:blogger.com,1999:blog-8959227089815463704.post-5377210573102088942</id><published>2012-02-06T14:34:00.002+08:00</published><updated>2012-02-06T14:36:57.324+08:00</updated><app:edited xmlns:app="http://www.w3.org/2007/app">2012-02-06T14:36:57.324+08:00</app:edited><category scheme="http://www.blogger.com/atom/ns#" term="poll" /><category scheme="http://www.blogger.com/atom/ns#" term="NGS" /><category scheme="http://www.blogger.com/atom/ns#" term="big data" /><category scheme="http://www.blogger.com/atom/ns#" term="storage" /><category scheme="http://www.blogger.com/atom/ns#" term="parallel" /><category scheme="http://www.blogger.com/atom/ns#" term="life science" /><title>Public Poll: What data storage solutions are you using now?</title><content type="html">&lt;div dir="ltr" style="text-align: left;" trbidi="on"&gt;&lt;a href="http://booroo.com/app/showpoll.asp?sid=f1ff2qn2fxe3vex22992&amp;amp;qid=22992#.Ty90KYydyHA.blogger"&gt;BooRoo&lt;/a&gt;&lt;br /&gt;
&lt;div&gt;&lt;br /&gt;
&lt;/div&gt;&lt;div&gt;Just a public poll created curious as to what systems are out there and what is being used day to day. Results are immediately viewable. Order of choices is randomized.&amp;nbsp;&lt;/div&gt;&lt;div&gt;&lt;script type="text/javascript"&gt;
var cookie_booroo=0, random_booroo=1, enddate_booroo=0, maxchecked_booroo=0, jsonurl_booroo='http://booroo.com/app/vote.asp', customurl_booroo='';
&lt;/script&gt;&lt;br /&gt;
&lt;link href="http://booroo.com/app_content/theme_poll/2/set3/css/default.css" media="screen" rel="stylesheet" type="text/css"&gt;&lt;/link&gt;  &lt;br /&gt;
&lt;div class="poll_booroo cleanslate" style="width: 300px;"&gt;&lt;div class="theme_booroo"&gt;Which data storage platform are you using?&lt;br /&gt;
&lt;div class="content_booroo"&gt;&lt;div class="options_booroo"&gt;&lt;form class="form_booroo"&gt;&lt;fieldset&gt;&lt;div class="padded_booroo"&gt;&lt;input name="qid" type="hidden" value="22992" /&gt;&lt;input name="sid" type="hidden" value="f1ff2qn2fxe3vex22992" /&gt;&lt;input name="pqid" type="hidden" value="15135" /&gt;&lt;br /&gt;
&lt;div class="items_booroo"&gt;&lt;div class="row_booroo"&gt;&lt;label&gt;&lt;input class="checkbox_booroo" id="ans-72222" name="ans-72222" type="checkbox" value="1" /&gt;http://www.bluearc.com/ BlueArc is your Life Sciences Solution&lt;/label&gt;&lt;/div&gt;&lt;div class="row_booroo"&gt;&lt;label&gt;&lt;input class="checkbox_booroo" id="ans-72223" name="ans-72223" type="checkbox" value="1" /&gt;http://www.isilon.com/ Isilon scale-out NAS, BIG data is no longer a challenge, it’s an opportunity.&lt;/label&gt;&lt;/div&gt;&lt;div class="row_booroo"&gt;&lt;label&gt;&lt;input class="checkbox_booroo" id="ans-72224" name="ans-72224" type="checkbox" value="1" /&gt;http://www.panasas.com/ PANASAS SOLVES BIG DATA PROBLEMS&lt;/label&gt;&lt;/div&gt;&lt;div class="row_booroo"&gt;&lt;label&gt;&lt;input class="checkbox_booroo" id="ans-72225" name="ans-72225" type="checkbox" value="1" /&gt;http://www.ddn.com/ DataDirect Networks’ (DDN) Big Data Storage Technology Powers More&lt;/label&gt;&lt;/div&gt;&lt;div class="row_booroo"&gt;&lt;label&gt;&lt;input class="checkbox_booroo" id="ans-72226" name="ans-72226" type="checkbox" value="1" /&gt;http://aws.amazon.com/ Store data and build dependable backup solutions using AWS’s highly reliable, inexpensive data storage services.&lt;/label&gt;&lt;/div&gt;&lt;div class="row_booroo"&gt;&lt;label&gt;&lt;input class="checkbox_booroo" id="ans-72227" name="ans-72227" type="checkbox" value="1" /&gt;Inhouse solutions using commodity hardware&lt;/label&gt;&lt;/div&gt;&lt;div class="row_booroo"&gt;&lt;label&gt;&lt;input class="checkbox_booroo" id="ans-72228" name="ans-72228" type="checkbox" value="1" /&gt;http://www-03.ibm.com/systems/software/gpfs/ IBM GPFS&lt;/label&gt;&lt;/div&gt;&lt;/div&gt;&lt;div&gt;&lt;input class="text_booroo" id="ans-other" name="ans-other" type="text" value="Other: (Please specify)" /&gt;&lt;/div&gt;&lt;div class="submit_booroo"&gt;&lt;a class="viewresults" href=""&gt;View results&lt;/a&gt;&lt;a class="vote_booroo" href=""&gt;Vote Now&lt;/a&gt;&lt;/div&gt;&lt;/div&gt;&lt;a href="http://booroo.com/"&gt;Create an online survey&lt;/a&gt; &lt;a href="http://booroo.com/quizzes"&gt;quiz&lt;/a&gt; or &lt;a href="http://booroo.com/polls"&gt;web poll&lt;/a&gt;&lt;/fieldset&gt;&lt;/form&gt;&lt;/div&gt;&lt;div class="results_booroo"&gt;&lt;div class="padded_booroo"&gt;&lt;div class="row_booroo"&gt;&lt;strong&gt;http://www.bluearc.com/ BlueArc is your Life Sciences Solution&lt;/strong&gt;&lt;img class="result_booroo" id="res-72222" src="http://booroo.com/app_content/theme_poll/2/set3/images/graph.gif" style="width: 0%;" /&gt;0%&lt;/div&gt;&lt;div class="row_booroo"&gt;&lt;strong&gt;http://www.isilon.com/ Isilon scale-out NAS, BIG data is no longer a challenge, it’s an opportunity.&lt;/strong&gt;&lt;img class="result_booroo" id="res-72223" src="http://booroo.com/app_content/theme_poll/2/set3/images/graph.gif" style="width: 0%;" /&gt;0%&lt;/div&gt;&lt;div class="row_booroo"&gt;&lt;strong&gt;http://www.panasas.com/ PANASAS SOLVES BIG DATA PROBLEMS&lt;/strong&gt;&lt;img class="result_booroo" id="res-72224" src="http://booroo.com/app_content/theme_poll/2/set3/images/graph.gif" style="width: 0%;" /&gt;0%&lt;/div&gt;&lt;div class="row_booroo"&gt;&lt;strong&gt;http://www.ddn.com/ DataDirect Networks’ (DDN) Big Data Storage Technology Powers More&lt;/strong&gt;&lt;img class="result_booroo" id="res-72225" src="http://booroo.com/app_content/theme_poll/2/set3/images/graph.gif" style="width: 0%;" /&gt;0%&lt;/div&gt;&lt;div class="row_booroo"&gt;&lt;strong&gt;http://aws.amazon.com/ Store data and build dependable backup solutions using AWS’s highly reliable, inexpensive data storage services.&lt;/strong&gt;&lt;img class="result_booroo" id="res-72226" src="http://booroo.com/app_content/theme_poll/2/set3/images/graph.gif" style="width: 0%;" /&gt;0%&lt;/div&gt;&lt;div class="row_booroo"&gt;&lt;strong&gt;Inhouse solutions using commodity hardware&lt;/strong&gt;&lt;img class="result_booroo" id="res-72227" src="http://booroo.com/app_content/theme_poll/2/set3/images/graph.gif" style="width: 0%;" /&gt;0%&lt;/div&gt;&lt;div class="row_booroo"&gt;&lt;strong&gt;http://www-03.ibm.com/systems/software/gpfs/ IBM GPFS&lt;/strong&gt;&lt;img class="result_booroo" id="res-72228" src="http://booroo.com/app_content/theme_poll/2/set3/images/graph.gif" style="width: 0%;" /&gt;0%&lt;/div&gt;&lt;div class="row_booroo"&gt;&lt;strong&gt;Other: (Please specify)&lt;/strong&gt;&lt;img class="result_booroo" id="res-999999" src="http://booroo.com/app_content/theme_poll/2/set3/images/graph.gif" style="width: 0%;" /&gt;0%&lt;/div&gt;&lt;/div&gt;&lt;a href="http://booroo.com/"&gt;Create an online survey&lt;/a&gt; &lt;a href="http://booroo.com/quizzes"&gt;quiz&lt;/a&gt; or &lt;a href="http://booroo.com/polls"&gt;web poll&lt;/a&gt;&lt;/div&gt;&lt;/div&gt;&lt;/div&gt;&lt;/div&gt;&lt;script src="http://ajax.googleapis.com/ajax/libs/jquery/1.6.1/jquery.min.js" type="text/javascript"&gt;
&lt;/script&gt;&lt;script src="http://booroo.com/app/polltheme/2/poll.js" type="text/javascript"&gt;
&lt;/script&gt;&lt;/div&gt;&lt;div&gt;&lt;br /&gt;
&lt;/div&gt;&lt;/div&gt;&lt;div class="blogger-post-footer"&gt;&lt;img width='1' height='1' src='https://blogger.googleusercontent.com/tracker/8959227089815463704-5377210573102088942?l=kevin-gattaca.blogspot.com' alt='' /&gt;&lt;/div&gt;
&lt;p&gt;&lt;a href="http://feedads.g.doubleclick.net/~a/SkW3STa1v7u9g69TlJbzchRLFQs/0/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/SkW3STa1v7u9g69TlJbzchRLFQs/0/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;br/&gt;
&lt;a href="http://feedads.g.doubleclick.net/~a/SkW3STa1v7u9g69TlJbzchRLFQs/1/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/SkW3STa1v7u9g69TlJbzchRLFQs/1/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;/p&gt;&lt;img src="http://feeds.feedburner.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~4/22NYN2i6uBs" height="1" width="1"/&gt;</content><link rel="related" href="http://booroo.com/app/showpoll.asp?sid=f1ff2qn2fxe3vex22992&amp;qid=22992#.Ty90KYydyHA.blogger" title="Public Poll: What data storage solutions are you using now?" /><link rel="replies" type="application/atom+xml" href="http://kevin-gattaca.blogspot.com/feeds/5377210573102088942/comments/default" title="Post Comments" /><link rel="replies" type="text/html" href="http://kevin-gattaca.blogspot.com/2012/02/public-poll-what-data-storage-solutions.html#comment-form" title="0 Comments" /><link rel="edit" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/5377210573102088942?v=2" /><link rel="self" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/5377210573102088942?v=2" /><link rel="alternate" type="text/html" href="http://feedproxy.google.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~3/22NYN2i6uBs/public-poll-what-data-storage-solutions.html" title="Public Poll: What data storage solutions are you using now?" /><author><name>Kevin</name><email>noreply@blogger.com</email><gd:image rel="http://schemas.google.com/g/2005#thumbnail" width="16" height="16" src="http://img2.blogblog.com/img/b16-rounded.gif" /></author><thr:total>0</thr:total><feedburner:origLink>http://kevin-gattaca.blogspot.com/2012/02/public-poll-what-data-storage-solutions.html</feedburner:origLink></entry><entry gd:etag="W/&quot;CUcAQ3k7fyp7ImA9WhRbFU0.&quot;"><id>tag:blogger.com,1999:blog-8959227089815463704.post-1417435315212831387</id><published>2012-02-06T12:37:00.001+08:00</published><updated>2012-02-06T12:37:22.707+08:00</updated><app:edited xmlns:app="http://www.w3.org/2007/app">2012-02-06T12:37:22.707+08:00</app:edited><title>[circos] Circos v0.56 released</title><content type="html">&lt;p&gt;&lt;br&gt; ---------- Forwarded message ----------&lt;br&gt; From: &amp;quot;Martin&amp;quot; &lt;br&gt; Date: Feb 6, 2012 9:56 am&lt;br&gt; Subject: [circos] Circos v0.56 released&lt;br&gt;&lt;/p&gt; &lt;p&gt;Dear Circos users!&lt;/p&gt; &lt;p&gt;I have made v0.56 available.&lt;/p&gt; &lt;p&gt;&lt;a href="http://circos.ca/software/download/"&gt;http://circos.ca/software/download/&lt;/a&gt;&lt;/p&gt; &lt;p&gt;Thank you to everyone who submitted bug reports and patiently waited&lt;br&gt; for me to respond.&lt;/p&gt; &lt;p&gt;Remember that now tutorials and the core code are kept separate. The&lt;br&gt; core circos-0.56.tgz archive contains an example directory (example/)&lt;br&gt; that creates a relatively complex image. Use this to ensure that&lt;br&gt; everything is working.&lt;/p&gt; &lt;p&gt;Most of the changes are bug fixes. Error handling is improved - many&lt;br&gt; errors have a gentler format and should be more explanatory.&lt;/p&gt; &lt;p&gt;*** IMPORTANT CHANGES AND REMINDERS ***&lt;/p&gt; &lt;p&gt;1. Import colors/fonts/patterns all at once&lt;/p&gt; &lt;p&gt;Use a single line to add color, font and pattern definitions in&lt;br&gt; circos.conf:&lt;/p&gt; &lt;p&gt;&amp;lt;&amp;lt;include etc/colors_fonts_patterns.conf&amp;gt;&amp;gt;&lt;/p&gt; &lt;p&gt;instead of&lt;/p&gt; &lt;p&gt;&amp;lt;colors&amp;gt;&lt;br&gt; &amp;lt;&amp;lt;include etc/colors.conf&amp;gt;&amp;gt;&lt;br&gt; ...&lt;/p&gt; &lt;p&gt;Note that colors.conf now imports brewer.conf automatically.&lt;/p&gt; &lt;p&gt;Please see example/etc/circos.conf for ideas of how to make your&lt;br&gt; configuration more modular.&lt;/p&gt; &lt;p&gt;2. Make sure you&amp;#39;re using etc/housekeeping.conf&lt;/p&gt; &lt;p&gt;A while back, I had centralized system parameters that used to appear&lt;br&gt; at the bottom of circos.conf into a separate file. For those of you&lt;br&gt; who still have these parameters in their circos.conf file, please&lt;br&gt; remove them.&lt;/p&gt; &lt;p&gt;&amp;lt;&amp;lt;include etc/housekeeping.conf&amp;gt;&amp;gt;&lt;/p&gt; &lt;p&gt;instead of&lt;/p&gt; &lt;p&gt;anglestep       = 0.5&lt;br&gt; minslicestep    = 10&lt;br&gt; beziersamples   = 40&lt;br&gt; debug           = no&lt;br&gt; warnings        = no&lt;br&gt; imagemap        = no&lt;br&gt; units_ok = bupr&lt;br&gt; units_nounit = n&lt;/p&gt; &lt;p&gt;3. Use debug_group&lt;/p&gt; &lt;p&gt;You&amp;#39;ll notice that Circos&amp;#39; default debug output contains more text. By&lt;br&gt; default debugging that falls into the &amp;#39;summary&amp;#39; category is created. A&lt;br&gt; complete list of debug categories is listed here&lt;/p&gt; &lt;p&gt;&lt;a href="http://mkweb.bcgsc.ca/dev/circos/documentation/tutorials/configuration/debugging/"&gt;http://mkweb.bcgsc.ca/dev/circos/documentation/tutorials/configuration/debugging/&lt;/a&gt;&lt;/p&gt; &lt;p&gt;In particular, the following are very useful&lt;/p&gt; &lt;p&gt;  timer - show code timings&lt;br&gt;   io - loading and locating files&lt;br&gt;   textplace - reports whether a text in a text track has been&lt;br&gt; successfully placed&lt;/p&gt; &lt;p&gt;4. SVG text handling improved&lt;/p&gt; &lt;p&gt;I&amp;#39;ve revamped how SVG text labels are placed. You&amp;#39;ll notice that fonts&lt;br&gt; now have font family definitions in etc/fonts.conf. This string is&lt;br&gt; used in the SVG file to specify the font. Once you have the font&lt;br&gt; installed on your system, labels won&amp;#39;t all appear in the SVG app or&lt;br&gt; viewer default (e.g. Arial) font.&lt;/p&gt; &lt;p&gt;There&amp;#39;s still more to do here, but it&amp;#39;s getting better.&lt;/p&gt; &lt;p&gt;0.56 CHANGELOG&lt;/p&gt; &lt;p&gt;Parallel ideogram labels are now centered with respect to the&lt;br&gt; ideogram.&lt;/p&gt; &lt;p&gt;restrict_parameter_names now controls whether parameters are&lt;br&gt; restricted to a pre-defined list (e.g. color, thickness, etc). If you&lt;br&gt; have custom parameters (e.g. &amp;#39;myspecialcode&amp;#39;) then set&lt;br&gt; restrict_parameter_names=no. By default, this is always set to &amp;#39;yes&amp;#39;.&lt;/p&gt; &lt;p&gt;Added link_orientation for text tracks. When set to &amp;quot;out&amp;quot; links from&lt;br&gt; text labels face out, rather than in.&lt;/p&gt; &lt;p&gt;Added font names to SVG files via font-family tag.&lt;/p&gt; &lt;p&gt;Removed -verbose. The -v flag now reports version.&lt;/p&gt; &lt;p&gt;Removed dependence on Graphics::ColorObject.&lt;/p&gt; &lt;p&gt;Added error handling framework.&lt;/p&gt; &lt;p&gt;Circos now requires Text::Format&lt;/p&gt; &lt;p&gt;Bug fix to heat map color mapping of last color.&lt;/p&gt; &lt;p&gt;Fixed bug which was causing line links to be drawn with a thickness&lt;br&gt; half of what was requested.&lt;/p&gt; &lt;p&gt;Fixed bug that prevented parameters made acceptable by the&lt;br&gt; restrict_parameter_names=no setting from being parsed.&lt;/p&gt; &lt;p&gt;Configuration file location is now guessed if guess_conf_location=yes&lt;br&gt; (see etc/housekeeping.conf)&lt;/p&gt; &lt;p&gt;Color file cache can now be static (color_cache_static) and dir/file&lt;br&gt; can be changed (color_cache_{file,dir})&lt;/p&gt; &lt;p&gt;Added &amp;#39;placed&amp;#39; and &amp;#39;not_placed&amp;#39; output for labels in text tracks to.&lt;br&gt; Use -debug_group text to see this.&lt;/p&gt; &lt;p&gt;  # create data file of labels that were not placed&lt;br&gt;   circos -conf ... -debug_group text | grep not_placed &amp;gt;&lt;br&gt; text.notplaced.txt&lt;/p&gt; &lt;p&gt;Parts of the code were made faster (unit checking) through Memoize.&lt;/p&gt; &lt;p&gt;Fixed a bug which prevented links with thickness=1 from being shown&lt;br&gt; with correct transparency.&lt;/p&gt; &lt;p&gt;Fixed bug in which color errors were produced when PNG file was not&lt;br&gt; asked for.&lt;/p&gt; &lt;p&gt;Fixed bug in which opacity of links in SVG files was missing in some&lt;br&gt; cases.&lt;/p&gt; &lt;p&gt;Fixed but which was assigning the wrong color to transparent links in&lt;br&gt; PNG files in some cases.&lt;/p&gt; &lt;p&gt;Centralized color configuration files colors.conf now includes&lt;br&gt; brewer.conf - no need to include brewer.conf separately.&lt;/p&gt; &lt;p&gt;Added -paranoid flag to exit on warnings.&lt;/p&gt; &lt;p&gt;Made error messages friendlier. Revamped internal error handling&lt;br&gt; mechanism.&lt;/p&gt; &lt;p&gt;Added data_path to allow adding to locations where files are searched&lt;br&gt; for.&lt;/p&gt; &lt;p&gt;Added data/ to prefix path of locations where files are searched for.&lt;br&gt; Now the default search locations are&lt;/p&gt; &lt;p&gt; { CWD | CIRCOS_PATH } + { . | .. | ../.. } + { . | etc | data }&lt;/p&gt; &lt;p&gt;--&lt;br&gt; You received this message because you are subscribed to the Google Groups &amp;quot;Circos&amp;quot; group.&lt;/p&gt; &lt;div class="blogger-post-footer"&gt;&lt;img width='1' height='1' src='https://blogger.googleusercontent.com/tracker/8959227089815463704-1417435315212831387?l=kevin-gattaca.blogspot.com' alt='' /&gt;&lt;/div&gt;
&lt;p&gt;&lt;a href="http://feedads.g.doubleclick.net/~a/3CCuSW85sU6IPLs5GyvJ59vQOTE/0/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/3CCuSW85sU6IPLs5GyvJ59vQOTE/0/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;br/&gt;
&lt;a href="http://feedads.g.doubleclick.net/~a/3CCuSW85sU6IPLs5GyvJ59vQOTE/1/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/3CCuSW85sU6IPLs5GyvJ59vQOTE/1/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;/p&gt;&lt;img src="http://feeds.feedburner.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~4/h84346UB2PI" height="1" width="1"/&gt;</content><link rel="replies" type="application/atom+xml" href="http://kevin-gattaca.blogspot.com/feeds/1417435315212831387/comments/default" title="Post Comments" /><link rel="replies" type="text/html" href="http://kevin-gattaca.blogspot.com/2012/02/circos-circos-v056-released.html#comment-form" title="0 Comments" /><link rel="edit" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/1417435315212831387?v=2" /><link rel="self" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/1417435315212831387?v=2" /><link rel="alternate" type="text/html" href="http://feedproxy.google.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~3/h84346UB2PI/circos-circos-v056-released.html" title="[circos] Circos v0.56 released" /><author><name>Kevin</name><email>noreply@blogger.com</email><gd:image rel="http://schemas.google.com/g/2005#thumbnail" width="16" height="16" src="http://img2.blogblog.com/img/b16-rounded.gif" /></author><thr:total>0</thr:total><feedburner:origLink>http://kevin-gattaca.blogspot.com/2012/02/circos-circos-v056-released.html</feedburner:origLink></entry><entry gd:etag="W/&quot;C0IFQn0zfip7ImA9WhRbFEk.&quot;"><id>tag:blogger.com,1999:blog-8959227089815463704.post-1747312544067897540</id><published>2012-02-05T19:31:00.001+08:00</published><updated>2012-02-05T19:31:53.386+08:00</updated><app:edited xmlns:app="http://www.w3.org/2007/app">2012-02-05T19:31:53.386+08:00</app:edited><title>Hive Plots - Linear Layout for Network Visualization - Visually Interpreting Network Structure and Content Made Possible</title><content type="html">&lt;a href="http://mkweb.bcgsc.ca/linnet/"&gt;http://mkweb.bcgsc.ca/linnet/&lt;/a&gt;&lt;div&gt;&lt;span style="font-family:&amp;#39;Times New Roman&amp;#39;;font-size:medium"&gt;Krzywinski M, Birol I, Jones S, Marra M (2011). &lt;/span&gt;&lt;a href="http://bib.oxfordjournals.org/content/early/2011/12/09/bib.bbr069.short?rss=1" style="font-family:&amp;#39;Times New Roman&amp;#39;;font-size:medium"&gt;Hive Plots — Rational Approach to Visualizing Networks&lt;/a&gt;&lt;span style="font-family:&amp;#39;Times New Roman&amp;#39;;font-size:medium"&gt;. Briefings in Bioinformatics (early access 9 December 2011, doi: 10.1093/bib/bbr069). (&lt;/span&gt;&lt;a href="http://mkweb.bcgsc.ca/linnet/hiveplot.enw" style="font-family:&amp;#39;Times New Roman&amp;#39;;font-size:medium"&gt;download citation&lt;/a&gt;&lt;span style="font-family:&amp;#39;Times New Roman&amp;#39;;font-size:medium"&gt;)&lt;/span&gt;&lt;/div&gt;  &lt;div&gt;&lt;span style="font-family:&amp;#39;Times New Roman&amp;#39;;font-size:medium"&gt;&lt;br&gt;&lt;/span&gt;&lt;/div&gt;&lt;div&gt;&lt;div id="title" style="font-family:&amp;#39;Times New Roman&amp;#39;;font-size:medium"&gt;&lt;div class="content"&gt;&lt;div id="badge"&gt;&lt;img src="http://mkweb.bcgsc.ca/linnet/gfx/hiveplot-useful-geeky-simple.png" alt="Hive plots are useful, geeky and simple to implement. Go nuts.  [ Hive Plots - Rational Network Visualization - A Simple, Informative and Pretty Linear Layout for Network Analytics - Martin Krzywinski ]"&gt;&lt;/div&gt;  &lt;div id="logo"&gt;&lt;a href="http://www.hiveplot.com/"&gt;&lt;img src="http://mkweb.bcgsc.ca/linnet/gfx/hiveplot-logo.png" alt="Linear layout for network visualization.  [ Hive Plots - Rational Network Visualization - A Simple, Informative and Pretty Linear Layout for Network Analytics - Martin Krzywinski ]"&gt;&lt;/a&gt;&lt;/div&gt;  &lt;/div&gt;&lt;/div&gt;&lt;div id="masthead" style="font-family:&amp;#39;Times New Roman&amp;#39;;font-size:medium"&gt;&lt;div class="content"&gt;&lt;div class="caption"&gt;&lt;p&gt;&lt;em&gt;the hive plot is a perceptually uniform and scalable linear layout visualization for network visual analytics&lt;/em&gt; &lt;/p&gt;  &lt;p&gt;&lt;br&gt;&lt;/p&gt;&lt;p&gt;&lt;/p&gt;&lt;p&gt;UNDERSTANDING NETWORK STRUCTURE WITH HIVE PLOTS.&lt;/p&gt;&lt;p&gt;(A) Normalized (top) and absolute (bottom) connectivity of &lt;i&gt;E. coli&lt;/i&gt; gene regulatory network and Linux function call network (&lt;a href="http://www.pnas.org/content/early/2010/04/28/0914771107.short"&gt;Yan &lt;i&gt;et al.&lt;/i&gt;&lt;/a&gt;)&lt;/p&gt;  &lt;p&gt;(B) Gene co-regulation networks in neuroblastoma samples.&lt;/p&gt;&lt;p&gt;(C) Network edges shown as ribbons creating circularly composited stacked bar plots (a periodic steamgraph).&lt;/p&gt;&lt;p&gt;(D) Syntenic network of three modern crucifer species to ancestral genome.&lt;/p&gt;  &lt;p&gt;(E) Layered network correlation matrix. In each cell two layers &lt;i&gt;u&lt;/i&gt;,&lt;i&gt;v&lt;/i&gt; are depicted with &lt;i&gt;u&lt;/i&gt; used to order axes and nodes while links for &lt;i&gt;v&lt;/i&gt; are shown.&lt;/p&gt;&lt;p&gt;&lt;br&gt;&lt;/p&gt;&lt;p&gt;&lt;/p&gt;&lt;h1&gt;Hive plots — for the impatient&lt;/h1&gt;  &lt;p&gt;The &lt;i&gt;hive plot&lt;/i&gt; is a rational visualization method for drawing networks. Nodes are mapped to and positioned on radially distributed linear axes — this mapping is based on network structural properties. Edges are drawn as curved links. Simple and interpretable.&lt;/p&gt;  &lt;p&gt;The purpose of the hive plot is to establish a new baseline for visualization of large networks — a method that is both general and tunable and useful as a starting point in visually exploring network structure.&lt;/p&gt;&lt;p&gt;  &lt;a href="http://mkweb.bcgsc.ca/linnet/conference/ismb2011/netbiosig/hivepanel-human-dip-poster.png"&gt;&lt;img src="http://mkweb.bcgsc.ca/linnet/img/hiveplot-thisisuseful.png" alt=" [ Hive Plots - Rational Network Visualization - A Simple, Informative and Pretty Linear Layout for Network Analytics - Martin Krzywinski ]"&gt;&lt;/a&gt;&lt;/p&gt;  &lt;p&gt;Hive plots give the reader a passing chance to &lt;i&gt;quantitatively&lt;/i&gt; understand important aspects of a network&amp;#39;s structure. Unlike hairballs, hive plots are excellent at managing the visual complexity arising from large number of edges and exposing both trends and outlier patterns in network structure.&lt;/p&gt;  &lt;p&gt;&lt;br&gt;&lt;/p&gt;&lt;p&gt;&lt;br&gt;&lt;/p&gt;&lt;p&gt;&lt;/p&gt;&lt;h1&gt;only for networks?&lt;/h1&gt;&lt;p&gt;No.&lt;/p&gt;&lt;p&gt;Hive plots can be applied to data structures other than networks. The method requires that your data be mappable onto a set of pairwise relationships. For networks, this pairwise relationship is the edge between two nodes. In other circumstances, it can relate two spatial positions (where the axis corresponds to an object with a physical length scale) or two intervals (two axis segments are related, thereby creating a ratio comparison).&lt;/p&gt;  &lt;p&gt;&lt;br&gt;&lt;/p&gt;&lt;p&gt;&lt;/p&gt;&lt;p&gt;&lt;a href="http://mkweb.bcgsc.ca/linnet/img/assembly-quality.png"&gt;&lt;img src="http://mkweb.bcgsc.ca/linnet/img/assembly-quality-small-black.png" alt=" [ Hive Plots - Rational Network Visualization - A Simple, Informative and Pretty Linear Layout for Network Analytics - Martin Krzywinski ] - Assessing genome assembly quality with a hive plot, which compares reads, assembly and reference."&gt;&lt;/a&gt;&lt;/p&gt;  &lt;p&gt;This hive plot provides a visual recipe for assessing the quality of a genomic assembly. An assembly is composed of reads (bottom axis), which are assembled into contigs (right axis). Independently, a reference assembly (left axis) may exist and act as a comparator. Among others, this hive plot answers the following questions&lt;/p&gt;  &lt;ul&gt;&lt;li&gt;what fraction of reads are unassembled? 20%&lt;/li&gt;&lt;li&gt;what fraction of reads are unaligned to reference? 30%&lt;/li&gt;&lt;li&gt;what fraction of reference has no read coverage? 2%&lt;/li&gt;&lt;li&gt;what fraction of reference has no contig coverage? 15%&lt;/li&gt;  &lt;li&gt;what fraction of reference is constructed by contigs &amp;lt; 200kb? 60%&lt;/li&gt;&lt;li&gt;are there contigs &amp;gt; 200kb? no.&lt;/li&gt;&lt;li&gt;what fraction of contigs are unaligned to the reference? 20%&lt;/li&gt;&lt;li&gt;what fraction of the overall assembly is derived from k=27 assembly? 80%&lt;/li&gt;  &lt;/ul&gt;&lt;p&gt;The benefit of this stacked bar plot layout is that the circular layout is both periodic and has visual weight. This approach is similar to a &lt;a href="http://en.wikipedia.org/wiki/Parallel_coordinates"&gt;parallel coordinate plot&lt;/a&gt;, except here the plot wraps around.&lt;/p&gt;  &lt;p&gt;Multiple panels can be combined to display a very large number of ratios. Below are shown 3 x 3 x 3 (27) comparisons, each with 3 x 8 ratios, for a total of &lt;i&gt;648 ratios&lt;/i&gt;. By categorizing each ratio using a spectral color scheme, patterns can be quickly spotted and interpreted. The image below was created for the &lt;a href="http://mkweb.bcgsc.ca/embo/hiveplot/"&gt;EMBO Journal 2011 cover contest&lt;/a&gt;.&lt;/p&gt;  &lt;p&gt;&lt;/p&gt;&lt;p&gt;&lt;/p&gt;&lt;p&gt;&lt;/p&gt;&lt;p&gt;&lt;/p&gt;&lt;/div&gt;&lt;/div&gt;&lt;/div&gt;&lt;/div&gt; &lt;div class="blogger-post-footer"&gt;&lt;img width='1' height='1' src='https://blogger.googleusercontent.com/tracker/8959227089815463704-1747312544067897540?l=kevin-gattaca.blogspot.com' alt='' /&gt;&lt;/div&gt;
&lt;p&gt;&lt;a href="http://feedads.g.doubleclick.net/~a/gGZrNOTPL32Qhgj67s7N0ZxADsg/0/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/gGZrNOTPL32Qhgj67s7N0ZxADsg/0/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;br/&gt;
&lt;a href="http://feedads.g.doubleclick.net/~a/gGZrNOTPL32Qhgj67s7N0ZxADsg/1/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/gGZrNOTPL32Qhgj67s7N0ZxADsg/1/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;/p&gt;&lt;img src="http://feeds.feedburner.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~4/2t9oCrQtmxU" height="1" width="1"/&gt;</content><link rel="replies" type="application/atom+xml" href="http://kevin-gattaca.blogspot.com/feeds/1747312544067897540/comments/default" title="Post Comments" /><link rel="replies" type="text/html" href="http://kevin-gattaca.blogspot.com/2012/02/hive-plots-linear-layout-for-network.html#comment-form" title="0 Comments" /><link rel="edit" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/1747312544067897540?v=2" /><link rel="self" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/1747312544067897540?v=2" /><link rel="alternate" type="text/html" href="http://feedproxy.google.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~3/2t9oCrQtmxU/hive-plots-linear-layout-for-network.html" title="Hive Plots - Linear Layout for Network Visualization - Visually Interpreting Network Structure and Content Made Possible" /><author><name>Kevin</name><email>noreply@blogger.com</email><gd:image rel="http://schemas.google.com/g/2005#thumbnail" width="16" height="16" src="http://img2.blogblog.com/img/b16-rounded.gif" /></author><thr:total>0</thr:total><feedburner:origLink>http://kevin-gattaca.blogspot.com/2012/02/hive-plots-linear-layout-for-network.html</feedburner:origLink></entry><entry gd:etag="W/&quot;DEYNQ3s8eSp7ImA9WhRbEk0.&quot;"><id>tag:blogger.com,1999:blog-8959227089815463704.post-8696191712958554427</id><published>2012-02-03T02:06:00.001+08:00</published><updated>2012-02-03T02:09:52.571+08:00</updated><app:edited xmlns:app="http://www.w3.org/2007/app">2012-02-03T02:09:52.571+08:00</app:edited><title>R-SAP: a multi-threading computational pipeline for the characterization of high-throughput RNA-sequencing data</title><content type="html">&lt;div dir="ltr" style="text-align: left;" trbidi="on"&gt;
&lt;a href="http://nar.oxfordjournals.org/content/early/2012/01/28/nar.gks047.long"&gt;http://nar.oxfordjournals.org/content/early/2012/01/28/nar.gks047.long&lt;/a&gt;&lt;br /&gt;
&lt;div id="p-2"&gt;
The rapid expansion in the quantity and  quality of RNA-Seq data requires the development of sophisticated  high-performance                      bioinformatics tools capable of rapidly  transforming this data into meaningful information that is easily  interpretable by                      biologists. Currently available analysis tools are  often not easily installed by the general biologist and most of them  lack                      inherent parallel processing capabilities widely  recognized as an essential feature of next-generation bioinformatics  tools.                      We present here a user-friendly and fully automated  &lt;span class="underline"&gt;R&lt;/span&gt;NA-&lt;span class="underline"&gt;S&lt;/span&gt;eq &lt;span class="underline"&gt;a&lt;/span&gt;nalysis &lt;span class="underline"&gt;p&lt;/span&gt;ipeline  (R-SAP) with built-in multi-threading capability to analyze and  quantitate high-throughput RNA-Seq datasets. R-SAP                      follows a hierarchical decision making procedure to  accurately characterize various classes of transcripts and achieves a                      near linear decrease in data processing time as a  result of increased multi-threading. In addition, RNA expression level  estimates                      obtained using R-SAP display high concordance with  levels measured by microarrays.                   &lt;/div&gt;
&lt;br /&gt;
&lt;div id="p-10"&gt;
To initiate analyses using R-SAP, the user provides two 
required inputs for the pipeline: the sequence alignment file and
                        known transcripts’ coordinate file. Currently 
R-SAP accepts alignment files only in psl format that are generated by 
mapping
                        RNA-Seq reads to the reference genome using BLAT
 (Blast like alignment tool) (&lt;a class="xref-bibr" href="http://nar.oxfordjournals.org/content/early/2012/01/28/nar.gks047.long#ref-21" id="xref-ref-21-1"&gt;21&lt;/a&gt;) or SSAHA2 (Sequence search and alignment by hashing algorithm) (&lt;a class="xref-bibr" href="http://nar.oxfordjournals.org/content/early/2012/01/28/nar.gks047.long#ref-22" id="xref-ref-22-1"&gt;22&lt;/a&gt;).
 RNA-Seq reads mapping to the genome may result in the alignments 
scattered across multiple exons separated by introns.
                        We chose psl as the alignment format for the 
pipeline because the scattered alignments are precisely stitched 
together and
                        reported as a large single alignment. As a 
result, for each sequencing read the most likely alignment and 
corresponding genomic
                        locus can be readily found in the alignment 
files. Moreover, the psl format preserves the orientation of alignment 
blocks
                        originating from the contiguous genomic loci 
enabling their accurate re-mapping to the annotated exons and 
determination of
                        associated reference structural variants.
                     &lt;/div&gt;
&lt;div id="p-11"&gt;
R-SAP is also configured to work with two of the currently available transcript assemblers: Cufflinks (&lt;a class="xref-bibr" href="http://nar.oxfordjournals.org/content/early/2012/01/28/nar.gks047.long#ref-23" id="xref-ref-23-1"&gt;23&lt;/a&gt;) and Scripture (&lt;a class="xref-bibr" href="http://nar.oxfordjournals.org/content/early/2012/01/28/nar.gks047.long#ref-24" id="xref-ref-24-1"&gt;24&lt;/a&gt;). Assembled transcripts can be supplied to R-SAP either in GTF (Gene Transfer Format) or in BED (Browser Extensible Data)
                        format. GTF and BED are default output formats from Cufflinks and Scripture respectively.&amp;nbsp;&lt;/div&gt;
&lt;div class="separator" style="clear: both; text-align: center;"&gt;
&lt;a href="http://nar.oxfordjournals.org/content/early/2012/01/28/nar.gks047/F1.large.jpg" imageanchor="1" style="margin-left: 1em; margin-right: 1em;"&gt;&lt;img border="0" height="177" src="http://nar.oxfordjournals.org/content/early/2012/01/28/nar.gks047/F1.large.jpg" width="640" /&gt;&lt;/a&gt;&lt;/div&gt;
&lt;div id="p-11"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div class="cb-section cb-slug"&gt;
&lt;ol id="docked-slug"&gt;
&lt;li&gt;&lt;div id="slugline"&gt;
&lt;cite&gt;                                  &lt;abbr class="slug-jnl-abbrev" title="Nucleic Acids Research"&gt;                                     Nucl. Acids Res.&lt;/abbr&gt;&lt;span class="slug-pub-date"&gt;                                     (2012)                                      &lt;/span&gt;                                                                                                      &lt;span class="slug-doi-wrapper"&gt;                                                                          doi:                                                                          &lt;span class="slug-doi" title="10.1093/nar/gks047"&gt;10.1093/nar/gks047&lt;/span&gt;                                     &lt;/span&gt;                                  &lt;/cite&gt;                                                                                             &lt;span class="slug-metadata-note ahead-of-print"&gt;                                                                    First published online:                                                                    &lt;span class="slug-ahead-of-print-date"&gt;January 28, 2012&lt;/span&gt;                                  &lt;/span&gt;                                                                                                                                                                                                                                                     &lt;/div&gt;
&lt;/li&gt;
&lt;/ol&gt;
&lt;/div&gt;
&lt;span class="creative-commons-article"&gt;This article is Open Access&lt;/span&gt;&lt;/div&gt;&lt;div class="blogger-post-footer"&gt;&lt;img width='1' height='1' src='https://blogger.googleusercontent.com/tracker/8959227089815463704-8696191712958554427?l=kevin-gattaca.blogspot.com' alt='' /&gt;&lt;/div&gt;
&lt;p&gt;&lt;a href="http://feedads.g.doubleclick.net/~a/dUkf5cpCtHcPrplu5cpVMecqu08/0/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/dUkf5cpCtHcPrplu5cpVMecqu08/0/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;br/&gt;
&lt;a href="http://feedads.g.doubleclick.net/~a/dUkf5cpCtHcPrplu5cpVMecqu08/1/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/dUkf5cpCtHcPrplu5cpVMecqu08/1/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;/p&gt;&lt;img src="http://feeds.feedburner.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~4/TJjULRlK6fw" height="1" width="1"/&gt;</content><link rel="replies" type="application/atom+xml" href="http://kevin-gattaca.blogspot.com/feeds/8696191712958554427/comments/default" title="Post Comments" /><link rel="replies" type="text/html" href="http://kevin-gattaca.blogspot.com/2012/02/r-sap-multi-threading-computational.html#comment-form" title="0 Comments" /><link rel="edit" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/8696191712958554427?v=2" /><link rel="self" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/8696191712958554427?v=2" /><link rel="alternate" type="text/html" href="http://feedproxy.google.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~3/TJjULRlK6fw/r-sap-multi-threading-computational.html" title="R-SAP: a multi-threading computational pipeline for the characterization of high-throughput RNA-sequencing data" /><author><name>Kevin</name><email>noreply@blogger.com</email><gd:image rel="http://schemas.google.com/g/2005#thumbnail" width="16" height="16" src="http://img2.blogblog.com/img/b16-rounded.gif" /></author><thr:total>0</thr:total><feedburner:origLink>http://kevin-gattaca.blogspot.com/2012/02/r-sap-multi-threading-computational.html</feedburner:origLink></entry><entry gd:etag="W/&quot;D0AMRXY5fip7ImA9WhRbEk0.&quot;"><id>tag:blogger.com,1999:blog-8959227089815463704.post-3912321030654340442</id><published>2012-02-03T02:02:00.000+08:00</published><updated>2012-02-03T02:03:04.826+08:00</updated><app:edited xmlns:app="http://www.w3.org/2007/app">2012-02-03T02:03:04.826+08:00</app:edited><title>Performance comparison and evaluation of software tools for microRNA deep-sequencing data analysis</title><content type="html">&lt;a href="http://nar.oxfordjournals.org/content/early/2012/01/28/nar.gks043.long"&gt;http://nar.oxfordjournals.org/content/early/2012/01/28/nar.gks043.long&lt;/a&gt;&lt;br&gt;                                      &lt;p id="p-2"&gt;With the development of next-generation  sequencing (NGS) techniques, many software tools have emerged for the  discovery of                      novel microRNAs (miRNAs) and for analyzing the  miRNAs expression profiles. An overall evaluation of these diverse  software                      tools is lacking. In this study, we evaluated eight  software tools based on their common feature and key algorithms. Three                      deep-sequencing data sets were collected from  different species and used to assess the computational time, sensitivity  and                      accuracy of detecting known miRNAs as well as their  capacity for predicting novel miRNAs. Our results provide useful  information                      for researchers to facilitate their selection of  the optimal software tools for miRNA analysis depending on their  specific                      requirements, i.e. novel miRNAs discovery or miRNA  expression profile analysis of sequencing data sets.                   &lt;/p&gt;&lt;br&gt; &lt;div class="blogger-post-footer"&gt;&lt;img width='1' height='1' src='https://blogger.googleusercontent.com/tracker/8959227089815463704-3912321030654340442?l=kevin-gattaca.blogspot.com' alt='' /&gt;&lt;/div&gt;
&lt;p&gt;&lt;a href="http://feedads.g.doubleclick.net/~a/FAJtAGgs9TOOWA5Gi4hn6UyVawI/0/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/FAJtAGgs9TOOWA5Gi4hn6UyVawI/0/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;br/&gt;
&lt;a href="http://feedads.g.doubleclick.net/~a/FAJtAGgs9TOOWA5Gi4hn6UyVawI/1/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/FAJtAGgs9TOOWA5Gi4hn6UyVawI/1/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;/p&gt;&lt;img src="http://feeds.feedburner.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~4/VK2U1qFFKLI" height="1" width="1"/&gt;</content><link rel="replies" type="application/atom+xml" href="http://kevin-gattaca.blogspot.com/feeds/3912321030654340442/comments/default" title="Post Comments" /><link rel="replies" type="text/html" href="http://kevin-gattaca.blogspot.com/2012/02/performance-comparison-and-evaluation.html#comment-form" title="0 Comments" /><link rel="edit" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/3912321030654340442?v=2" /><link rel="self" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/3912321030654340442?v=2" /><link rel="alternate" type="text/html" href="http://feedproxy.google.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~3/VK2U1qFFKLI/performance-comparison-and-evaluation.html" title="Performance comparison and evaluation of software tools for microRNA deep-sequencing data analysis" /><author><name>Kevin</name><email>noreply@blogger.com</email><gd:image rel="http://schemas.google.com/g/2005#thumbnail" width="16" height="16" src="http://img2.blogblog.com/img/b16-rounded.gif" /></author><thr:total>0</thr:total><feedburner:origLink>http://kevin-gattaca.blogspot.com/2012/02/performance-comparison-and-evaluation.html</feedburner:origLink></entry><entry gd:etag="W/&quot;DE8CSXk6fyp7ImA9WhRbEk0.&quot;"><id>tag:blogger.com,1999:blog-8959227089815463704.post-8083324362472672025</id><published>2012-02-03T00:50:00.001+08:00</published><updated>2012-02-03T02:21:08.717+08:00</updated><app:edited xmlns:app="http://www.w3.org/2007/app">2012-02-03T02:21:08.717+08:00</app:edited><category scheme="http://www.blogger.com/atom/ns#" term="open access" /><category scheme="http://www.blogger.com/atom/ns#" term="#OpenAccess" /><title>Are we slaves to the scientific publishing industry?</title><content type="html">&lt;div dir="ltr" style="text-align: left;" trbidi="on"&gt;
Found this fascinating analogy in the post &lt;a href="http://conservationbytes.com/2012/01/29/knowledge-slavery/"&gt;http://conservationbytes.com/2012/01/29/knowledge-slavery/&lt;/a&gt; &lt;br /&gt;
&lt;br /&gt;
&lt;i&gt;...our slavery to the scientific publishing industry.&lt;/i&gt; &lt;br /&gt;
&lt;div style="text-align: left;"&gt;
&lt;i&gt;And 'slavery' is definitely the most  appropriate term here, for how else would you describe a business where  the product is produced by others for free&lt;sup&gt;1&lt;/sup&gt; (scientific  results), is assessed for quality by others for free (reviewing), is  commissioned, overviewed and selected by yet others for free (editing),  and then sold back to the very same scientists and the rest of the  world's consumers at exorbitant prices.&lt;/i&gt;&lt;/div&gt;
&lt;i&gt;This isn't just a whinge about a specialised  and economically irrelevant sector of the economy, we're talking about  an industry worth hundreds of billions of dollars annually. In fact, &lt;a href="http://www.elsevier.com/"&gt;Elsevier&lt;/a&gt; (agreed by many to be the leader in the greed-pack – see how some scientists are &lt;a href="http://gowers.wordpress.com/2012/01/21/elsevier-my-part-in-its-downfall/"&gt;staging their protest&lt;/a&gt;; &lt;a href="http://johncarlosbaez.wordpress.com/2012/01/26/ban-elsevier/"&gt;also here&lt;/a&gt;) made &lt;a href="http://www.guardian.co.uk/commentisfree/2011/aug/29/academic-publishers-murdoch-socialist"&gt;US$1.1 billion&lt;/a&gt; in 2010!&lt;br /&gt;  &lt;br /&gt;&lt;/i&gt;what are your thoughts? I don't think that making money is necessarily bad, but apparently rich is even a derogatory term now, with rich ppl (oops) preferring to be called high net worth individuals. But when it's larger entities, corporations, it might be easy to mud sling them. &lt;br /&gt;
However, I think the author has a point when making the analogy, my 1st shock was discovering that I have to read lengthy copyright info on what I can or cannot do with something that I researched / wrote&amp;nbsp; (see &lt;a href="http://www.elsevier.com/wps/find/authorsview.authors/rights"&gt;http://www.elsevier.com/wps/find/authorsview.authors/rights&lt;/a&gt; ) &lt;br /&gt;
&lt;br /&gt;
It's so much easier to understand from a photographer's point of view &lt;br /&gt;
&lt;a href="http://www.photosecrets.com/photography-law-copyright"&gt;http://www.photosecrets.com/photography-law-copyright&lt;/a&gt;&lt;br /&gt;
&lt;i&gt;&lt;br /&gt;"Copyright" is "the right to copy." This right is a legal construct,  designed for you — the artist — to support your artistic endeavors.  Without copyright, people would be free to use your artistic work &lt;br /&gt;You can negotiate a "license" to copy, and perhaps even get paid in real  money. Hopefully this will give you more incentive to create art, and  the world will be a better place.&lt;/i&gt;&lt;br /&gt;
&lt;h3&gt;
&lt;i&gt;Will People Steal My Work?&lt;/i&gt;&lt;/h3&gt;
&lt;i&gt;Generally no, as publishers live by copyright law and usually have  established rates which they gladly pay. A more likely problem is that  publishers may not know that you are the copyright owner, which goes  back to that "©" symbol and digital watermark.&lt;/i&gt;&lt;br /&gt;
&lt;br /&gt;
Hey wait a minute .. "&lt;i&gt;the world will be a better place "&lt;/i&gt;&amp;nbsp; hmmm I thought scientists are the ones trying to help the world with advancing human knowledge where our incentive to churn out more scientific results? &lt;br /&gt;
&lt;br /&gt;
hmmm food for thought .. &lt;br /&gt;
Post comments!&lt;br /&gt;
&lt;br /&gt;&lt;/div&gt;&lt;div class="blogger-post-footer"&gt;&lt;img width='1' height='1' src='https://blogger.googleusercontent.com/tracker/8959227089815463704-8083324362472672025?l=kevin-gattaca.blogspot.com' alt='' /&gt;&lt;/div&gt;
&lt;p&gt;&lt;a href="http://feedads.g.doubleclick.net/~a/C2dF0hPD7qjAyfgt2Zz5yxhzIYc/0/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/C2dF0hPD7qjAyfgt2Zz5yxhzIYc/0/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;br/&gt;
&lt;a href="http://feedads.g.doubleclick.net/~a/C2dF0hPD7qjAyfgt2Zz5yxhzIYc/1/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/C2dF0hPD7qjAyfgt2Zz5yxhzIYc/1/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;/p&gt;&lt;img src="http://feeds.feedburner.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~4/WMNfrkDRHuo" height="1" width="1"/&gt;</content><link rel="replies" type="application/atom+xml" href="http://kevin-gattaca.blogspot.com/feeds/8083324362472672025/comments/default" title="Post Comments" /><link rel="replies" type="text/html" href="http://kevin-gattaca.blogspot.com/2012/02/are-we-slaves-to-scientific-publishing.html#comment-form" title="0 Comments" /><link rel="edit" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/8083324362472672025?v=2" /><link rel="self" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/8083324362472672025?v=2" /><link rel="alternate" type="text/html" href="http://feedproxy.google.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~3/WMNfrkDRHuo/are-we-slaves-to-scientific-publishing.html" title="Are we slaves to the scientific publishing industry?" /><author><name>Kevin</name><email>noreply@blogger.com</email><gd:image rel="http://schemas.google.com/g/2005#thumbnail" width="16" height="16" src="http://img2.blogblog.com/img/b16-rounded.gif" /></author><thr:total>0</thr:total><feedburner:origLink>http://kevin-gattaca.blogspot.com/2012/02/are-we-slaves-to-scientific-publishing.html</feedburner:origLink></entry><entry gd:etag="W/&quot;DkUARns9fyp7ImA9WhRbEE8.&quot;"><id>tag:blogger.com,1999:blog-8959227089815463704.post-7758963311801109742</id><published>2012-01-31T23:37:00.001+08:00</published><updated>2012-01-31T23:37:27.567+08:00</updated><app:edited xmlns:app="http://www.w3.org/2007/app">2012-01-31T23:37:27.567+08:00</app:edited><title>How do u share ur results from genome studies?</title><content type="html">&lt;p&gt;RT @emblebi: A new @sangerinstitute project is exploring how researchers share results from genome studies. Take the questionnaire: &lt;a href="http://bit.ly/xw8Y0k"&gt;http://bit.ly/xw8Y0k&lt;/a&gt;&lt;/p&gt; &lt;div class="blogger-post-footer"&gt;&lt;img width='1' height='1' src='https://blogger.googleusercontent.com/tracker/8959227089815463704-7758963311801109742?l=kevin-gattaca.blogspot.com' alt='' /&gt;&lt;/div&gt;
&lt;p&gt;&lt;a href="http://feedads.g.doubleclick.net/~a/nbbbAB9udRRop4KjZn7LTkc672Y/0/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/nbbbAB9udRRop4KjZn7LTkc672Y/0/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;br/&gt;
&lt;a href="http://feedads.g.doubleclick.net/~a/nbbbAB9udRRop4KjZn7LTkc672Y/1/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/nbbbAB9udRRop4KjZn7LTkc672Y/1/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;/p&gt;&lt;img src="http://feeds.feedburner.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~4/-yYcCEkPyOk" height="1" width="1"/&gt;</content><link rel="replies" type="application/atom+xml" href="http://kevin-gattaca.blogspot.com/feeds/7758963311801109742/comments/default" title="Post Comments" /><link rel="replies" type="text/html" href="http://kevin-gattaca.blogspot.com/2012/01/how-do-u-share-ur-results-from-genome.html#comment-form" title="0 Comments" /><link rel="edit" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/7758963311801109742?v=2" /><link rel="self" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/7758963311801109742?v=2" /><link rel="alternate" type="text/html" href="http://feedproxy.google.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~3/-yYcCEkPyOk/how-do-u-share-ur-results-from-genome.html" title="How do u share ur results from genome studies?" /><author><name>Kevin</name><email>noreply@blogger.com</email><gd:image rel="http://schemas.google.com/g/2005#thumbnail" width="16" height="16" src="http://img2.blogblog.com/img/b16-rounded.gif" /></author><thr:total>0</thr:total><feedburner:origLink>http://kevin-gattaca.blogspot.com/2012/01/how-do-u-share-ur-results-from-genome.html</feedburner:origLink></entry><entry gd:etag="W/&quot;DEEHR3kyeSp7ImA9WhRUGUs.&quot;"><id>tag:blogger.com,1999:blog-8959227089815463704.post-6986509622567829550</id><published>2012-01-31T07:37:00.001+08:00</published><updated>2012-01-31T07:37:16.791+08:00</updated><app:edited xmlns:app="http://www.w3.org/2007/app">2012-01-31T07:37:16.791+08:00</app:edited><title>[Samtools-help] Picard release 1.61</title><content type="html">&lt;p&gt;&lt;br&gt; Picard release 1.61&lt;br&gt; 30 January 2012&lt;/p&gt; &lt;p&gt;- PicardException used to extend SAMException, which extends RuntimeException.  Now PicardException extends RuntimeException directly.  If you have code that catches SAMException, you may want to add a catch clause for PicardException if you use the net.sf.picard classes.  If you only use classes in net.sf.samtools, you should never see PicardException thrown.&lt;/p&gt;  &lt;p&gt;- IlluminaDataProviderFactory.java: Ensure position data type is in set of data types in ctors rather than in makeDataProvider(), in order to avoid ConcurrentModificationException.&lt;/p&gt; &lt;p&gt;-Alec&lt;/p&gt; &lt;p&gt;------------------------------------------------------------------------------&lt;br&gt; _______________________________________________&lt;br&gt; Samtools-help mailing list&lt;br&gt; &lt;a href="https://lists.sourceforge.net/lists/listinfo/samtools-help"&gt;https://lists.sourceforge.net/lists/listinfo/samtools-help&lt;/a&gt;&lt;/p&gt; &lt;div class="blogger-post-footer"&gt;&lt;img width='1' height='1' src='https://blogger.googleusercontent.com/tracker/8959227089815463704-6986509622567829550?l=kevin-gattaca.blogspot.com' alt='' /&gt;&lt;/div&gt;
&lt;p&gt;&lt;a href="http://feedads.g.doubleclick.net/~a/i4RuYswVGyuhEPrZWqhqhxazlnQ/0/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/i4RuYswVGyuhEPrZWqhqhxazlnQ/0/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;br/&gt;
&lt;a href="http://feedads.g.doubleclick.net/~a/i4RuYswVGyuhEPrZWqhqhxazlnQ/1/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/i4RuYswVGyuhEPrZWqhqhxazlnQ/1/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;/p&gt;&lt;img src="http://feeds.feedburner.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~4/Su7b8CsFSfA" height="1" width="1"/&gt;</content><link rel="replies" type="application/atom+xml" href="http://kevin-gattaca.blogspot.com/feeds/6986509622567829550/comments/default" title="Post Comments" /><link rel="replies" type="text/html" href="http://kevin-gattaca.blogspot.com/2012/01/samtools-help-picard-release-161.html#comment-form" title="0 Comments" /><link rel="edit" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/6986509622567829550?v=2" /><link rel="self" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/6986509622567829550?v=2" /><link rel="alternate" type="text/html" href="http://feedproxy.google.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~3/Su7b8CsFSfA/samtools-help-picard-release-161.html" title="[Samtools-help] Picard release 1.61" /><author><name>Kevin</name><email>noreply@blogger.com</email><gd:image rel="http://schemas.google.com/g/2005#thumbnail" width="16" height="16" src="http://img2.blogblog.com/img/b16-rounded.gif" /></author><thr:total>0</thr:total><feedburner:origLink>http://kevin-gattaca.blogspot.com/2012/01/samtools-help-picard-release-161.html</feedburner:origLink></entry><entry gd:etag="W/&quot;DU8NRHk4eyp7ImA9WhRUF04.&quot;"><id>tag:blogger.com,1999:blog-8959227089815463704.post-9026958176691494018</id><published>2012-01-28T16:04:00.001+08:00</published><updated>2012-01-28T16:04:55.733+08:00</updated><app:edited xmlns:app="http://www.w3.org/2007/app">2012-01-28T16:04:55.733+08:00</app:edited><title>galaxy-user] January 27, 2012 Galaxy Distribution &amp; News Brief</title><content type="html">&lt;br&gt;&lt;br&gt;---------- Forwarded message ----------&lt;br&gt;From: Jennifer Jackson&lt;br&gt;Date: Saturday, 28 January 2012&lt;br&gt;Subject: [galaxy-user] January 27, 2012 Galaxy Distribution &amp;amp; News Brief&lt;br&gt;&lt;br&gt;&lt;br&gt;&lt;br&gt;January 27, 2012 Galaxy Distribution &amp;amp;  News Brief&lt;br&gt; &lt;br&gt;&lt;br&gt;Complete News Brief&lt;br&gt;* &lt;a href="http://wiki.g2.bx.psu.edu/DevNewsBriefs/2012_01_27"&gt;http://wiki.g2.bx.psu.edu/DevNewsBriefs/2012_01_27&lt;/a&gt;&lt;br&gt;&lt;br&gt;&lt;br&gt;Highlights:&lt;br&gt;&lt;br&gt;* Important metadata and Python 2.5 support corrections&lt;br&gt; * SAMtools upgraded for version 0.1.18. Mpileup added.&lt;br&gt;* Dynamic filtering, easy color options, and quicker&lt;br&gt; indexing enhance Trackster&lt;br&gt;* Set up your Galaxy instance to run cluster jobs as&lt;br&gt; the real user, not the Galaxy owner&lt;br&gt; * Improvements to metadata handling and searching in&lt;br&gt; the Tool Shed&lt;br&gt;* Improved solutions for schema access, jobs management,&lt;br&gt; &amp;amp; workflow imports and inputs.&lt;br&gt;* New datatypes (Eland, XML), multiple tool enhancements,&lt;br&gt;  and bug fixes.&lt;br&gt;&lt;br&gt;&lt;br&gt;Get Galaxy!&lt;br&gt;* &lt;a href="http://getgalaxy.org"&gt;http://getgalaxy.org&lt;/a&gt;&lt;br&gt;&lt;br&gt;new:     % hg clone &lt;a href="http://www.bx.psu.edu/hg/galaxy"&gt;http://www.bx.psu.edu/hg/galaxy&lt;/a&gt; galaxy-dist&lt;br&gt;upgrade: % hg pull -u -r 26920e20157f&lt;br&gt; &lt;br&gt;&lt;br&gt;Read the release announcement and see the prior release history&lt;br&gt;* &lt;a href="http://wiki.g2.bx.psu.edu/DevNewsBriefs/"&gt;http://wiki.g2.bx.psu.edu/DevNewsBriefs/&lt;/a&gt;&lt;br&gt;&lt;br&gt;&lt;br&gt;Need help with a local instance?&lt;br&gt;&lt;br&gt; Search with our custom google tools!&lt;br&gt;* &lt;a href="http://wiki.g2.bx.psu.edu/Mailing%20Lists#Searching"&gt;http://wiki.g2.bx.psu.edu/Mailing%20Lists#Searching&lt;/a&gt;&lt;br&gt;&lt;br&gt;And consider subscribing to the galaxy-dev mailing list!&lt;br&gt; * &lt;a href="http://wiki.g2.bx.psu.edu/Mailing%20Lists#Subscribing_and_Unsubscribing"&gt;http://wiki.g2.bx.psu.edu/Mailing%20Lists#Subscribing_and_Unsubscribing&lt;/a&gt;&lt;br&gt;&lt;br&gt;&lt;br&gt;&lt;br&gt;&lt;br&gt;--&lt;br&gt;Jennifer Jackson&lt;br&gt;Galaxy Team&lt;br&gt;&lt;br&gt; &lt;a href="http://usegalaxy.org"&gt;http://usegalaxy.org&lt;/a&gt;&lt;br&gt;&lt;a href="http://galaxyproject.org"&gt;http://galaxyproject.org&lt;/a&gt;&lt;br&gt;&lt;a href="http://galaxyproject.org/wiki/Support"&gt;http://galaxyproject.org/wiki/Support&lt;/a&gt;&lt;br&gt;&lt;br&gt; &lt;br&gt;&lt;br&gt;___________________________________________________________&lt;br&gt;The Galaxy User list should be used for the discussion of&lt;br&gt;Galaxy analysis and other features on the public server&lt;br&gt;at &lt;a href="http://usegalaxy.org"&gt;usegalaxy.org&lt;/a&gt;.  Please keep all replies on the list by&lt;br&gt; using &amp;quot;reply all&amp;quot; in your mail client.  For discussion of&lt;br&gt;local Galaxy instances and the Galaxy source code, please&lt;br&gt;use the Galaxy Development list:&lt;br&gt;&lt;br&gt; &lt;a href="http://lists.bx.psu.edu/listinfo/galaxy-dev"&gt;http://lists.bx.psu.edu/listinfo/galaxy-dev&lt;/a&gt;&lt;br&gt; &lt;br&gt;To manage your subscriptions to this and other Galaxy lists,&lt;br&gt;please use the interface at:&lt;br&gt;&lt;br&gt; &lt;a href="http://lists.bx.psu.edu/"&gt;http://lists.bx.psu.edu/&lt;/a&gt;&lt;br&gt;&lt;br&gt; &lt;div class="blogger-post-footer"&gt;&lt;img width='1' height='1' src='https://blogger.googleusercontent.com/tracker/8959227089815463704-9026958176691494018?l=kevin-gattaca.blogspot.com' alt='' /&gt;&lt;/div&gt;
&lt;p&gt;&lt;a href="http://feedads.g.doubleclick.net/~a/EsIaFFcrvUcboFotfCnISGDymJo/0/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/EsIaFFcrvUcboFotfCnISGDymJo/0/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;br/&gt;
&lt;a href="http://feedads.g.doubleclick.net/~a/EsIaFFcrvUcboFotfCnISGDymJo/1/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/EsIaFFcrvUcboFotfCnISGDymJo/1/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;/p&gt;&lt;img src="http://feeds.feedburner.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~4/DCX9H-KuGCw" height="1" width="1"/&gt;</content><link rel="replies" type="application/atom+xml" href="http://kevin-gattaca.blogspot.com/feeds/9026958176691494018/comments/default" title="Post Comments" /><link rel="replies" type="text/html" href="http://kevin-gattaca.blogspot.com/2012/01/galaxy-user-january-27-2012-galaxy.html#comment-form" title="0 Comments" /><link rel="edit" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/9026958176691494018?v=2" /><link rel="self" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/9026958176691494018?v=2" /><link rel="alternate" type="text/html" href="http://feedproxy.google.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~3/DCX9H-KuGCw/galaxy-user-january-27-2012-galaxy.html" title="galaxy-user] January 27, 2012 Galaxy Distribution &amp; News Brief" /><author><name>Kevin</name><email>noreply@blogger.com</email><gd:image rel="http://schemas.google.com/g/2005#thumbnail" width="16" height="16" src="http://img2.blogblog.com/img/b16-rounded.gif" /></author><thr:total>0</thr:total><feedburner:origLink>http://kevin-gattaca.blogspot.com/2012/01/galaxy-user-january-27-2012-galaxy.html</feedburner:origLink></entry><entry gd:etag="W/&quot;DUAGQHw5fip7ImA9WhRUF04.&quot;"><id>tag:blogger.com,1999:blog-8959227089815463704.post-6027030732807780355</id><published>2012-01-28T16:02:00.001+08:00</published><updated>2012-01-28T16:02:01.226+08:00</updated><app:edited xmlns:app="http://www.w3.org/2007/app">2012-01-28T16:02:01.226+08:00</app:edited><title>Changes to Google Privacy Policy and Terms of Service</title><content type="html">hmmm unsure if this is for better or worse&lt;br&gt;&lt;br&gt;---------- Forwarded message ----------&lt;br&gt;From: Google&lt;br&gt;Date: Saturday, 28 January 2012&lt;br&gt;Subject: Changes to Google Privacy Policy and Terms of Service&lt;br&gt;&lt;br&gt;&lt;br&gt;Is this email not displaying properly?&lt;br&gt; View it in your browser.&lt;br&gt;&lt;br&gt;Dear Google user,&lt;br&gt;&lt;br&gt;We're getting rid of over 60 different privacy policies across Google and replacing them with one that's a lot shorter and easier to read. Our new policy covers multiple products and features, reflecting our desire to create one beautifully simple and intuitive experience across Google.&lt;br&gt; &lt;br&gt;We believe that this stuff matters so please take a few minutes to read our updated Privacy Policy and Terms of Service at &lt;a href="http://www.google.com/policies"&gt;http://www.google.com/policies&lt;/a&gt;. These changes will take effect on 1 March, 2012.&lt;br&gt; &lt;br&gt;One policy, one Google experience&lt;br&gt;________________________________&lt;br&gt;Easy to work across Google&lt;br&gt;&lt;br&gt;Our new policy reflects a single product experience that does what you need, when you want it to. Whether you&amp;#39;re reading an email that reminds you to schedule a family get-together or finding a favourite video that you want to share, we want to ensure that you can move across Gmail, Calendar, Search, YouTube or whatever your life calls for, with ease.&lt;br&gt; &lt;br&gt;Tailored for you&lt;br&gt;&lt;br&gt;If you're signed in to Google, we can do things like suggest search queries – or tailor your search results – based on the interests that you've expressed in Google+, Gmail and YouTube. We'll better understand which version of Pink or Jaguar you're searching for and get you those results faster.&lt;br&gt; &lt;br&gt;Easy to share and collaborate&lt;br&gt;&lt;br&gt;When you post or create a document online, you often want others to see and contribute. By remembering the contact information of the people you want to share with, we make it easy for you to share in any Google product or service with minimal clicks and errors.&lt;br&gt; &lt;br&gt;________________________________&lt;br&gt;Protecting your privacy hasn't changed&lt;br&gt;&lt;br&gt;Our goal is to provide you with as much transparency and choice as possible through products like Google Dashboard and Ad Preferences Manager, alongside other tools. Our privacy principles remain unchanged. And we'll never sell your personal information or share it without your permission (other than rare circumstances like valid legal requests).&lt;br&gt; &lt;br&gt;Have questions?&lt;br&gt;We have answers.&lt;br&gt;&lt;br&gt;Visit our FAQ at &lt;a href="http://www.google.com/policies/faq"&gt;http://www.google.com/policies/faq&lt;/a&gt; to read more about the changes. (We reckoned our users might have a question or twenty-two.)&lt;br&gt; &lt;br&gt;________________________________&lt;br&gt;Notice of Change&lt;br&gt;&lt;br&gt;1 March, 2012 is when the new Privacy Policy and Terms will come into effect. If you choose to keep using Google once the change occurs, you will be doing so under the new Privacy Policy and Terms of Service.&lt;br&gt; &lt;br&gt;Please do not reply to this email. Mail sent to this address cannot be answered. Also, never enter your Google Account password after following a link in an email or chat to an untrusted site. Instead, go directly to the site, such as &lt;a href="http://mail.google.com"&gt;mail.google.com&lt;/a&gt; or &lt;a href="http://www.google.com/accounts"&gt;www.google.com/accounts&lt;/a&gt;. Google will never email you to ask for your password or other sensitive information.&lt;br&gt; &lt;div class="blogger-post-footer"&gt;&lt;img width='1' height='1' src='https://blogger.googleusercontent.com/tracker/8959227089815463704-6027030732807780355?l=kevin-gattaca.blogspot.com' alt='' /&gt;&lt;/div&gt;
&lt;p&gt;&lt;a href="http://feedads.g.doubleclick.net/~a/0-InkTtUXrNZRHnf0GR1xyy9pHY/0/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/0-InkTtUXrNZRHnf0GR1xyy9pHY/0/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;br/&gt;
&lt;a href="http://feedads.g.doubleclick.net/~a/0-InkTtUXrNZRHnf0GR1xyy9pHY/1/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/0-InkTtUXrNZRHnf0GR1xyy9pHY/1/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;/p&gt;&lt;img src="http://feeds.feedburner.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~4/rTob1Q6Ubk4" height="1" width="1"/&gt;</content><link rel="replies" type="application/atom+xml" href="http://kevin-gattaca.blogspot.com/feeds/6027030732807780355/comments/default" title="Post Comments" /><link rel="replies" type="text/html" href="http://kevin-gattaca.blogspot.com/2012/01/changes-to-google-privacy-policy-and.html#comment-form" title="0 Comments" /><link rel="edit" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/6027030732807780355?v=2" /><link rel="self" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/6027030732807780355?v=2" /><link rel="alternate" type="text/html" href="http://feedproxy.google.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~3/rTob1Q6Ubk4/changes-to-google-privacy-policy-and.html" title="Changes to Google Privacy Policy and Terms of Service" /><author><name>Kevin</name><email>noreply@blogger.com</email><gd:image rel="http://schemas.google.com/g/2005#thumbnail" width="16" height="16" src="http://img2.blogblog.com/img/b16-rounded.gif" /></author><thr:total>0</thr:total><feedburner:origLink>http://kevin-gattaca.blogspot.com/2012/01/changes-to-google-privacy-policy-and.html</feedburner:origLink></entry><entry gd:etag="W/&quot;DEcCQ3c_fSp7ImA9WhRUFkg.&quot;"><id>tag:blogger.com,1999:blog-8959227089815463704.post-4624793832742476223</id><published>2012-01-27T17:21:00.001+08:00</published><updated>2012-01-27T17:21:02.945+08:00</updated><app:edited xmlns:app="http://www.w3.org/2007/app">2012-01-27T17:21:02.945+08:00</app:edited><title>Manuel's Personal Exome Now Publicly Released | Manuel Corpas' Blog</title><content type="html">&lt;p&gt;After 5 months of having performed the sequencing of my personal exome, I now make it available to the community for public use. I release it under a CC BY-SA 3.0 license, giving you permission to use this data in any way, as long as it provides attribution to the source and it is shared under a similar license.&lt;/p&gt;  &lt;p&gt;&lt;a href="http://manuelcorpas.com/2012/01/23/my-personal-exome-now-publicly-released/"&gt;http://manuelcorpas.com/2012/01/23/my-personal-exome-now-publicly-released/&lt;/a&gt;&lt;/p&gt; &lt;div class="blogger-post-footer"&gt;&lt;img width='1' height='1' src='https://blogger.googleusercontent.com/tracker/8959227089815463704-4624793832742476223?l=kevin-gattaca.blogspot.com' alt='' /&gt;&lt;/div&gt;
&lt;p&gt;&lt;a href="http://feedads.g.doubleclick.net/~a/9CTxfmrrdOnTOpNHTml0jz3OWCo/0/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/9CTxfmrrdOnTOpNHTml0jz3OWCo/0/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;br/&gt;
&lt;a href="http://feedads.g.doubleclick.net/~a/9CTxfmrrdOnTOpNHTml0jz3OWCo/1/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/9CTxfmrrdOnTOpNHTml0jz3OWCo/1/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;/p&gt;&lt;img src="http://feeds.feedburner.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~4/1PXui3L0EUk" height="1" width="1"/&gt;</content><link rel="replies" type="application/atom+xml" href="http://kevin-gattaca.blogspot.com/feeds/4624793832742476223/comments/default" title="Post Comments" /><link rel="replies" type="text/html" href="http://kevin-gattaca.blogspot.com/2012/01/manuels-personal-exome-now-publicly.html#comment-form" title="0 Comments" /><link rel="edit" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/4624793832742476223?v=2" /><link rel="self" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/4624793832742476223?v=2" /><link rel="alternate" type="text/html" href="http://feedproxy.google.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~3/1PXui3L0EUk/manuels-personal-exome-now-publicly.html" title="Manuel's Personal Exome Now Publicly Released | Manuel Corpas' Blog" /><author><name>Kevin</name><email>noreply@blogger.com</email><gd:image rel="http://schemas.google.com/g/2005#thumbnail" width="16" height="16" src="http://img2.blogblog.com/img/b16-rounded.gif" /></author><thr:total>0</thr:total><feedburner:origLink>http://kevin-gattaca.blogspot.com/2012/01/manuels-personal-exome-now-publicly.html</feedburner:origLink></entry><entry gd:etag="W/&quot;Dk8DSX4_fyp7ImA9WhRUFU8.&quot;"><id>tag:blogger.com,1999:blog-8959227089815463704.post-6701141134025012804</id><published>2012-01-26T04:54:00.001+08:00</published><updated>2012-01-26T04:54:38.047+08:00</updated><app:edited xmlns:app="http://www.w3.org/2007/app">2012-01-26T04:54:38.047+08:00</app:edited><title>Roche in $5.7 billion bid for Illumina</title><content type="html">&lt;p&gt;Wow ... Things are going to be interesting now .... &lt;/p&gt; &lt;p&gt;ZURICH/LONDON (Reuters) -Swiss drugmaker Roche Holding AG (ROG.VX) has offered $5.7 billion in cash in a hostile bid to take over Illumina Inc (ILMN.O), and investors are already betting that the U.S. gene sequencing company will command a significantly higher price.&lt;/p&gt;  &lt;p&gt;&lt;a href="http://mobile.reuters.com/article/innovationNews/idUSTRE80O0FR20120125?irpc=932"&gt;http://mobile.reuters.com/article/innovationNews/idUSTRE80O0FR20120125?irpc=932&lt;/a&gt;&lt;/p&gt; &lt;p&gt;Cheers&lt;br&gt; Kevin&lt;br&gt; Sent from an Android&lt;/p&gt; &lt;div class="blogger-post-footer"&gt;&lt;img width='1' height='1' src='https://blogger.googleusercontent.com/tracker/8959227089815463704-6701141134025012804?l=kevin-gattaca.blogspot.com' alt='' /&gt;&lt;/div&gt;
&lt;p&gt;&lt;a href="http://feedads.g.doubleclick.net/~a/KXjnSzCpjGrVRlxGua7LYEFZino/0/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/KXjnSzCpjGrVRlxGua7LYEFZino/0/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;br/&gt;
&lt;a href="http://feedads.g.doubleclick.net/~a/KXjnSzCpjGrVRlxGua7LYEFZino/1/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/KXjnSzCpjGrVRlxGua7LYEFZino/1/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;/p&gt;&lt;img src="http://feeds.feedburner.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~4/-0qWUWgnFHk" height="1" width="1"/&gt;</content><link rel="replies" type="application/atom+xml" href="http://kevin-gattaca.blogspot.com/feeds/6701141134025012804/comments/default" title="Post Comments" /><link rel="replies" type="text/html" href="http://kevin-gattaca.blogspot.com/2012/01/roche-in-57-billion-bid-for-illumina.html#comment-form" title="0 Comments" /><link rel="edit" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/6701141134025012804?v=2" /><link rel="self" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/6701141134025012804?v=2" /><link rel="alternate" type="text/html" href="http://feedproxy.google.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~3/-0qWUWgnFHk/roche-in-57-billion-bid-for-illumina.html" title="Roche in $5.7 billion bid for Illumina" /><author><name>Kevin</name><email>noreply@blogger.com</email><gd:image rel="http://schemas.google.com/g/2005#thumbnail" width="16" height="16" src="http://img2.blogblog.com/img/b16-rounded.gif" /></author><thr:total>0</thr:total><feedburner:origLink>http://kevin-gattaca.blogspot.com/2012/01/roche-in-57-billion-bid-for-illumina.html</feedburner:origLink></entry><entry gd:etag="W/&quot;CE4NRX06eyp7ImA9WhRUFEw.&quot;"><id>tag:blogger.com,1999:blog-8959227089815463704.post-3421894556086390433</id><published>2012-01-24T21:49:00.001+08:00</published><updated>2012-01-24T21:49:54.313+08:00</updated><app:edited xmlns:app="http://www.w3.org/2007/app">2012-01-24T21:49:54.313+08:00</app:edited><title>Why we need the Assemblathon - The Assemblathon</title><content type="html">&lt;div class="gmail_quote"&gt;&lt;br&gt;Why we need the Assemblathon - The Assemblathon&lt;br&gt; excerpted &lt;/div&gt;&lt;div class="gmail_quote"&gt;&lt;span style="color:rgb(68,68,68);font-family:Helvetica;background-color:rgb(254,254,254);font-size:medium"&gt;If you want the best genome assembly possible, you may have to accept some trade-offs. The assemblers that may perform well in one area may not perform as well in other areas. Everybody wants to be told &amp;#39;genome assembler X will give you the best assembly&amp;#39; but at the moment it doesn&amp;#39;t seem fair to make such bold assertions. What we did find out from Assemblathon 1 was that a number of genome assemblers performed admirably across many, but not all, of the different metrics. For example, the assembler that did the best job at increasing &lt;/span&gt;&lt;em style="margin-top:0px;margin-right:0px;margin-bottom:0px;margin-left:0px;padding-top:0px;padding-right:0px;padding-bottom:0px;padding-left:0px;border-top-width:0px;border-right-width:0px;border-bottom-width:0px;border-left-width:0px;border-style:initial;border-color:initial;font-size:medium;font-family:Helvetica;vertical-align:baseline;color:rgb(68,68,68);background-color:rgb(254,254,254)"&gt;coverage&lt;/em&gt;&lt;span style="color:rgb(68,68,68);font-family:Helvetica;background-color:rgb(254,254,254);font-size:medium"&gt; (the amount of the known genome present in the assembly), ranked 9th when considering the number of substitution errors present in the assembly. Conversely, the assembler that did the best job at minimizing substitution errors ranked 8th in terms of coverage. You pays your money and you takes your choice. We should mention, however, that these two assemblers (&lt;/span&gt;&lt;a href="http://soap.genomics.org.cn/soapdenovo.html" style="margin-top:0px;margin-right:0px;margin-bottom:0px;margin-left:0px;padding-top:0px;padding-right:0px;padding-bottom:0px;padding-left:0px;border-top-width:0px;border-right-width:0px;border-bottom-width:0px;border-left-width:0px;border-style:initial;border-color:initial;font-size:medium;font-family:Helvetica;vertical-align:baseline;color:rgb(0,102,153);text-decoration:none;background-color:rgb(254,254,254)"&gt;&lt;span style="margin-top:0px;margin-right:0px;margin-bottom:0px;margin-left:0px;padding-top:0px;padding-right:0px;padding-bottom:0px;padding-left:0px;border-top-width:0px;border-right-width:0px;border-bottom-width:0px;border-left-width:0px;border-style:initial;border-color:initial;font-style:inherit;font-size:16px;font-family:inherit;vertical-align:baseline;text-decoration:underline;letter-spacing:0px;color:rgb(1,38,167)"&gt;SOAPdenovo&lt;/span&gt;&lt;/a&gt;&lt;span style="color:rgb(68,68,68);font-family:Helvetica;background-color:rgb(254,254,254);font-size:medium"&gt; and &lt;/span&gt;&lt;a href="https://github.com/jts/sga" style="margin-top:0px;margin-right:0px;margin-bottom:0px;margin-left:0px;padding-top:0px;padding-right:0px;padding-bottom:0px;padding-left:0px;border-top-width:0px;border-right-width:0px;border-bottom-width:0px;border-left-width:0px;border-style:initial;border-color:initial;font-size:medium;font-family:Helvetica;vertical-align:baseline;color:rgb(0,102,153);text-decoration:none;background-color:rgb(254,254,254)"&gt;&lt;span style="margin-top:0px;margin-right:0px;margin-bottom:0px;margin-left:0px;padding-top:0px;padding-right:0px;padding-bottom:0px;padding-left:0px;border-top-width:0px;border-right-width:0px;border-bottom-width:0px;border-left-width:0px;border-style:initial;border-color:initial;font-style:inherit;font-size:16px;font-family:inherit;vertical-align:baseline;text-decoration:underline;letter-spacing:0px;color:rgb(1,38,167)"&gt;SGA&lt;/span&gt;&lt;/a&gt;&lt;span style="color:rgb(68,68,68);font-family:Helvetica;background-color:rgb(254,254,254);font-size:medium"&gt;), along with &lt;/span&gt;&lt;a href="https://www.broadinstitute.org/scientific-community/science/programs/genome-sequencing-and-analysis/computational-rd/computational-" style="margin-top:0px;margin-right:0px;margin-bottom:0px;margin-left:0px;padding-top:0px;padding-right:0px;padding-bottom:0px;padding-left:0px;border-top-width:0px;border-right-width:0px;border-bottom-width:0px;border-left-width:0px;border-style:initial;border-color:initial;font-size:medium;font-family:Helvetica;vertical-align:baseline;color:rgb(0,102,153);text-decoration:none;background-color:rgb(254,254,254)"&gt;&lt;span style="margin-top:0px;margin-right:0px;margin-bottom:0px;margin-left:0px;padding-top:0px;padding-right:0px;padding-bottom:0px;padding-left:0px;border-top-width:0px;border-right-width:0px;border-bottom-width:0px;border-left-width:0px;border-style:initial;border-color:initial;font-style:inherit;font-size:16px;font-family:inherit;vertical-align:baseline;text-decoration:underline;letter-spacing:0px;color:rgb(1,38,167)"&gt;ALLPATHS&lt;/span&gt;&lt;/a&gt;&lt;span style="color:rgb(68,68,68);font-family:Helvetica;background-color:rgb(254,254,254);font-size:medium"&gt; were consistently ranked among the best assemblers for the vast majority of metrics and were the three best overall assemblers in Assemblathon 1. &lt;/span&gt; &lt;/div&gt;  &lt;div class="gmail_quote"&gt;&lt;br&gt; Read it online: &lt;a href="http://assemblathon.org/why-we-need-the-assemblathon" target="_blank"&gt;http://assemblathon.org/why-we-need-the-assemblathon&lt;/a&gt;&lt;br&gt;&lt;br&gt;&lt;/div&gt; &lt;div class="blogger-post-footer"&gt;&lt;img width='1' height='1' src='https://blogger.googleusercontent.com/tracker/8959227089815463704-3421894556086390433?l=kevin-gattaca.blogspot.com' alt='' /&gt;&lt;/div&gt;
&lt;p&gt;&lt;a href="http://feedads.g.doubleclick.net/~a/W1C-qyULsPzKvXMBUxQEFzVXh6c/0/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/W1C-qyULsPzKvXMBUxQEFzVXh6c/0/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;br/&gt;
&lt;a href="http://feedads.g.doubleclick.net/~a/W1C-qyULsPzKvXMBUxQEFzVXh6c/1/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/W1C-qyULsPzKvXMBUxQEFzVXh6c/1/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;/p&gt;&lt;img src="http://feeds.feedburner.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~4/FK4VY5p3KfY" height="1" width="1"/&gt;</content><link rel="replies" type="application/atom+xml" href="http://kevin-gattaca.blogspot.com/feeds/3421894556086390433/comments/default" title="Post Comments" /><link rel="replies" type="text/html" href="http://kevin-gattaca.blogspot.com/2012/01/why-we-need-assemblathon-assemblathon.html#comment-form" title="0 Comments" /><link rel="edit" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/3421894556086390433?v=2" /><link rel="self" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/3421894556086390433?v=2" /><link rel="alternate" type="text/html" href="http://feedproxy.google.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~3/FK4VY5p3KfY/why-we-need-assemblathon-assemblathon.html" title="Why we need the Assemblathon - The Assemblathon" /><author><name>Kevin</name><email>noreply@blogger.com</email><gd:image rel="http://schemas.google.com/g/2005#thumbnail" width="16" height="16" src="http://img2.blogblog.com/img/b16-rounded.gif" /></author><thr:total>0</thr:total><feedburner:origLink>http://kevin-gattaca.blogspot.com/2012/01/why-we-need-assemblathon-assemblathon.html</feedburner:origLink></entry><entry gd:etag="W/&quot;DE8NSXc4eCp7ImA9WhRUEUs.&quot;"><id>tag:blogger.com,1999:blog-8959227089815463704.post-418430000881825729</id><published>2012-01-22T01:28:00.001+08:00</published><updated>2012-01-22T01:28:18.930+08:00</updated><app:edited xmlns:app="http://www.w3.org/2007/app">2012-01-22T01:28:18.930+08:00</app:edited><title>Free Science, One Paper at a Time | Wired Science | Wired.com</title><content type="html">&lt;div&gt;&lt;a href="http://m.wired.com/wiredscience/2011/05/free-science-one-paper-at-a-time-2/all/1"&gt;http://m.wired.com/wiredscience/2011/05/free-science-one-paper-at-a-time-2/all/1&lt;/a&gt;&lt;/div&gt;&lt;div&gt;&lt;/div&gt;&lt;div&gt;&lt;br&gt;&lt;span class="Apple-style-span" style="font-family: Helvetica, Arial, sans-serif; -webkit-tap-highlight-color: rgba(26, 26, 26, 0.296875); -webkit-composition-fill-color: rgba(175, 192, 227, 0.230469); -webkit-composition-frame-color: rgba(77, 128, 180, 0.230469); font-size: 14px; line-height: 20px; -webkit-text-size-adjust: none; "&gt;&lt;p style="margin-top: 0px; margin-right: 0px; margin-bottom: 1em; margin-left: 0px; padding-top: 0px; padding-right: 0px; padding-bottom: 0px; padding-left: 0px; border-top-width: 0px; border-right-width: 0px; border-bottom-width: 0px; border-left-width: 0px; border-style: initial; border-color: initial; outline-width: 0px; outline-style: initial; outline-color: initial; font-weight: inherit; font-style: inherit; font-size: 15px; font-family: inherit; vertical-align: baseline; line-height: 1.5; "&gt;Part of the answer, strangely, is the very thing at the center of science: the paper. Once science's main conduit, the paper has become its choke point.&lt;/p&gt;&lt;p style="margin-top: 0px; margin-right: 0px; margin-bottom: 1em; margin-left: 0px; padding-top: 0px; padding-right: 0px; padding-bottom: 0px; padding-left: 0px; border-top-width: 0px; border-right-width: 0px; border-bottom-width: 0px; border-left-width: 0px; border-style: initial; border-color: initial; outline-width: 0px; outline-style: initial; outline-color: initial; font-weight: inherit; font-style: inherit; font-size: 15px; font-family: inherit; vertical-align: baseline; line-height: 1.5; "&gt;It's not just that the paper is slow, though that is a huge problem. A researcher who submits a paper to a traditional journal right now, for instance, won't see the published piece for about a year. She must wait while the paper gets passed around among editors, then goes through rounds of peer review by experts in her field, who might and often do object not just to her methods or data but to her findings and interpretations. Finally, she must wait while it moves through an editing, layout, and publishing pipeline that itself might run anywhere from 2 to 12 weeks.&lt;/p&gt;&lt;p style="margin-top: 0px; margin-right: 0px; margin-bottom: 1em; margin-left: 0px; padding-top: 0px; padding-right: 0px; padding-bottom: 0px; padding-left: 0px; border-top-width: 0px; border-right-width: 0px; border-bottom-width: 0px; border-left-width: 0px; border-style: initial; border-color: initial; outline-width: 0px; outline-style: initial; outline-color: initial; font-weight: inherit; font-style: inherit; font-size: 15px; font-family: inherit; vertical-align: baseline; line-height: 1.5; "&gt;Yet the paper is not simply slow; it's heavy. Even as increasingly data-rich science has outgrown the paper's ability to deliver and describe all that science has to offer — its deep databases, its often elaborate methods — we've loaded it up needlessly with reputational weight and vital functions other than carrying data.&lt;/p&gt;&lt;p style="margin-top: 0px; margin-right: 0px; margin-bottom: 1em; margin-left: 0px; padding-top: 0px; padding-right: 0px; padding-bottom: 0px; padding-left: 0px; border-top-width: 0px; border-right-width: 0px; border-bottom-width: 0px; border-left-width: 0px; border-style: initial; border-color: initial; outline-width: 0px; outline-style: initial; outline-color: initial; font-weight: inherit; font-style: inherit; font-size: 15px; font-family: inherit; vertical-align: baseline; line-height: 1.5; "&gt;The paper is meant to be a conduit for the real content and currency of the science: the ideas, methods, data, and findings of the people who do science. But the tremendous publishing and commercial infrastructure built around the academic paper over the last half-century has concentrated so many functions and so much value in the journal that the paper itself, rather than the information in it, has become science's main currency. It is the paper you must buy; the paper you must publish; the paper you must cite; the paper on which not just citations but tenure, reputation, status, and even school rankings are built&lt;/p&gt;&lt;/span&gt;&lt;/div&gt;&lt;div class="blogger-post-footer"&gt;&lt;img width='1' height='1' src='https://blogger.googleusercontent.com/tracker/8959227089815463704-418430000881825729?l=kevin-gattaca.blogspot.com' alt='' /&gt;&lt;/div&gt;
&lt;p&gt;&lt;a href="http://feedads.g.doubleclick.net/~a/t9BcH4Fh3rkvyaCjS4kvFGvIuLs/0/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/t9BcH4Fh3rkvyaCjS4kvFGvIuLs/0/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;br/&gt;
&lt;a href="http://feedads.g.doubleclick.net/~a/t9BcH4Fh3rkvyaCjS4kvFGvIuLs/1/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/t9BcH4Fh3rkvyaCjS4kvFGvIuLs/1/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;/p&gt;&lt;img src="http://feeds.feedburner.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~4/ts2DyiuesAk" height="1" width="1"/&gt;</content><link rel="replies" type="application/atom+xml" href="http://kevin-gattaca.blogspot.com/feeds/418430000881825729/comments/default" title="Post Comments" /><link rel="replies" type="text/html" href="http://kevin-gattaca.blogspot.com/2012/01/free-science-one-paper-at-time-wired.html#comment-form" title="0 Comments" /><link rel="edit" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/418430000881825729?v=2" /><link rel="self" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/418430000881825729?v=2" /><link rel="alternate" type="text/html" href="http://feedproxy.google.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~3/ts2DyiuesAk/free-science-one-paper-at-time-wired.html" title="Free Science, One Paper at a Time | Wired Science | Wired.com" /><author><name>Kevin</name><email>noreply@blogger.com</email><gd:image rel="http://schemas.google.com/g/2005#thumbnail" width="16" height="16" src="http://img2.blogblog.com/img/b16-rounded.gif" /></author><thr:total>0</thr:total><feedburner:origLink>http://kevin-gattaca.blogspot.com/2012/01/free-science-one-paper-at-time-wired.html</feedburner:origLink></entry><entry gd:etag="W/&quot;CUYDQno6fSp7ImA9WhRUEU8.&quot;"><id>tag:blogger.com,1999:blog-8959227089815463704.post-6604326226730849916</id><published>2012-01-21T13:19:00.001+08:00</published><updated>2012-01-21T13:19:33.415+08:00</updated><app:edited xmlns:app="http://www.w3.org/2007/app">2012-01-21T13:19:33.415+08:00</app:edited><title>SGA uses less memory for de novo assembly</title><content type="html">&lt;div dir="ltr" style="text-align: left;" trbidi="on"&gt;
&lt;div style="font-family: Arial,Helvetica,sans-serif;"&gt;
excerpted from Genomeweb&lt;/div&gt;
&lt;div style="font-family: Arial,Helvetica,sans-serif;"&gt;
According to a &lt;a href="http://genome.cshlp.org/content/early/2011/12/07/gr.126953.111.full.pdf+html" target="_blank"&gt;&lt;em&gt;Genome Research&lt;/em&gt;&lt;/a&gt; paper describing the method, the secret to the &lt;a href="https://github.com/jts/sga" target="_blank"&gt;String Graph Assembler&lt;/a&gt;'s
 reduced memory footprint is that it uses compressed data structures to 
"exploit the redundancy" in sequence reads and to "substantially lower 
the amount of memory required to perform &lt;em&gt;de novo&lt;/em&gt; assembly."&lt;/div&gt;
&lt;div style="font-family: Arial,Helvetica,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: Arial,Helvetica,sans-serif;"&gt;
SGA relies on an algorithm its developers published in 2010 that 
constructs an assembly string graph from a so-called “full-text 
minute-space” index, or FM-index, which enables searching over a 
compressed representation of a text. Unlike other short-read assemblers 
that rely on the de Bruijn graph model, which breaks reads up into 
k-mers, the string graph model “keeps all reads intact and creates a 
graph from overlaps between reads,” the Sanger team wrote.&amp;nbsp;&amp;nbsp;&lt;/div&gt;
&lt;div style="font-family: Arial,Helvetica,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: Arial,Helvetica,sans-serif;"&gt;
his approach makes even more sense now that sequencing instruments like the Pacific Biosciences RS are generating longer reads.
&lt;/div&gt;
&lt;div style="font-family: Arial,Helvetica,sans-serif;"&gt;
In the paper, Durbin and co-developer Jared Simpson report that SGA 
successfully assembled 1.2 billion human genome sequence reads using &lt;b&gt;54 
GB of memory. This was compared with SOAPdenovo, which required 118 GB 
for the same task.&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: Arial,Helvetica,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: Arial,Helvetica,sans-serif;"&gt;
Results from comparisons of SGA with Velvet, &lt;a href="http://www.bcgsc.ca/platform/bioinfo/software/abyss" target="_blank"&gt;ABySS&lt;/a&gt;, and SOAPdenovo using a &lt;em&gt;C. elegans&lt;/em&gt;
 dataset showed that its assembled contigs covered 95.9 percent of the 
reference genome while the other three programs covered 94.5 percent, 
95.6 percent, and 94.8 percent respectively. &lt;/div&gt;
&lt;span style="font-family: Arial,Helvetica,sans-serif;"&gt;
&lt;/span&gt;&lt;div style="font-family: Arial,Helvetica,sans-serif;"&gt;
Furthermore, SGA required only 4.5 gigabytes of memory to assemble the &lt;em&gt;C. elegans&lt;/em&gt; dataset compared to 14.1 GB, 23 GB, and 38.8 GB required for ABySS, Velvet, and SOAPdenovo respectively.&lt;/div&gt;
&lt;div style="font-family: Arial,Helvetica,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: Arial,Helvetica,sans-serif;"&gt;
SGA is slower that its counterparts, however. SGA took 1,427 CPU 
hours to complete a human genome assembly, while SOAPdenovo required 479
 CPU hours.&lt;/div&gt;
&lt;span style="font-family: Arial,Helvetica,sans-serif;"&gt;
&lt;/span&gt;&lt;div style="font-family: Arial,Helvetica,sans-serif;"&gt;
"We explicitly trade off a bit longer CPU time for lower memory usage," Simpson, a doctoral student in Durbin's lab, told &lt;em&gt;BioInform&lt;/em&gt;. "We feel that fits better into most of the clusters that are available right now."&lt;/div&gt;
&lt;span style="font-family: Arial,Helvetica,sans-serif;"&gt;
&lt;/span&gt;&lt;div style="font-family: Arial,Helvetica,sans-serif;"&gt;
On the other hand, SGA is parallelizable, so its most 
compute-intensive activities — error-correcting reads and building the 
FM-index of corrected reads — can be distributed across a compute 
cluster to reduce run time, the researchers explain in the paper.&lt;/div&gt;
&lt;div style="font-family: Arial,Helvetica,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: Arial,Helvetica,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: Arial,Helvetica,sans-serif;"&gt;
He explained that while de bruijn assemblers like Velvet require a 
separate processing step after completing the genome assembly, SGA 
doesn’t and potentially avoids "some of the errors or incomplete 
analysis" that can occur in the extra processing step.&lt;/div&gt;
&lt;span style="font-family: Arial,Helvetica,sans-serif;"&gt;
&lt;/span&gt;&lt;div style="font-family: Arial,Helvetica,sans-serif;"&gt;
This reduced error risk plus its lower memory requirement ensures that tools like SGA have a "future," Durbin said.&lt;/div&gt;
&lt;span style="font-family: Arial,Helvetica,sans-serif;"&gt;
&lt;/span&gt;&lt;div style="font-family: Arial,Helvetica,sans-serif;"&gt;
For their next steps, Durbin and Simpson are adapting SGA to work 
with longer read data from the Roche 454 sequencer and the Life 
Technologies Ion Torrent Personal Genome Machine. They are also 
exploring ways of discovering variants using the program.&lt;/div&gt;
&lt;span style="font-family: Arial,Helvetica,sans-serif;"&gt;
&lt;/span&gt;&lt;div style="font-family: Arial,Helvetica,sans-serif;"&gt;
The approach could also be used to analyze metagenomic data, the researchers  said in the paper.&lt;/div&gt;
&lt;div style="font-family: Arial,Helvetica,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: Arial,Helvetica,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;br /&gt;
&lt;b&gt;&lt;i&gt;&amp;nbsp;Read the full article here http://www.genomeweb.com/informatics/sanger-teams-de-novo-assembler-adopts-compressed-approach-reduce-memory-footprin&lt;/i&gt;&lt;/b&gt;&lt;br /&gt;
&lt;br /&gt;
&lt;br /&gt;
&lt;b&gt;&lt;i&gt;1427 CPU hours is ALOT more than 479 CPU hours (~ 3x) but of course when you can parallelize it, it's definitely a worthwhile tradeoff especially when it's more likely that one has a lot of lower memory clusters then one single cluster with a lot of memory and is likely to be hogged by a 479 CPU hour job. I wonder if this might encourage investigators to relook at existing data by de novo assembly. Of course it would be great if the NGS data is made public, then I guess other groups can actually do the de novo assembly comparison for them.&amp;nbsp;&lt;/i&gt;&lt;/b&gt;&lt;br /&gt;
&lt;b&gt;&lt;i&gt;&amp;nbsp; &lt;/i&gt;&lt;/b&gt;&lt;br /&gt;
&lt;/div&gt;&lt;div class="blogger-post-footer"&gt;&lt;img width='1' height='1' src='https://blogger.googleusercontent.com/tracker/8959227089815463704-6604326226730849916?l=kevin-gattaca.blogspot.com' alt='' /&gt;&lt;/div&gt;
&lt;p&gt;&lt;a href="http://feedads.g.doubleclick.net/~a/bFPWlP37qHU34Ys5lqj2BWX7dwU/0/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/bFPWlP37qHU34Ys5lqj2BWX7dwU/0/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;br/&gt;
&lt;a href="http://feedads.g.doubleclick.net/~a/bFPWlP37qHU34Ys5lqj2BWX7dwU/1/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/bFPWlP37qHU34Ys5lqj2BWX7dwU/1/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;/p&gt;&lt;img src="http://feeds.feedburner.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~4/FDPmPaePRHk" height="1" width="1"/&gt;</content><link rel="replies" type="application/atom+xml" href="http://kevin-gattaca.blogspot.com/feeds/6604326226730849916/comments/default" title="Post Comments" /><link rel="replies" type="text/html" href="http://kevin-gattaca.blogspot.com/2012/01/sga-uses-less-memory-for-de-novo.html#comment-form" title="1 Comments" /><link rel="edit" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/6604326226730849916?v=2" /><link rel="self" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/6604326226730849916?v=2" /><link rel="alternate" type="text/html" href="http://feedproxy.google.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~3/FDPmPaePRHk/sga-uses-less-memory-for-de-novo.html" title="SGA uses less memory for de novo assembly" /><author><name>Kevin</name><email>noreply@blogger.com</email><gd:image rel="http://schemas.google.com/g/2005#thumbnail" width="16" height="16" src="http://img2.blogblog.com/img/b16-rounded.gif" /></author><thr:total>1</thr:total><feedburner:origLink>http://kevin-gattaca.blogspot.com/2012/01/sga-uses-less-memory-for-de-novo.html</feedburner:origLink></entry><entry gd:etag="W/&quot;CE8HQXkzfip7ImA9WhRVGUQ.&quot;"><id>tag:blogger.com,1999:blog-8959227089815463704.post-2641596609672811555</id><published>2012-01-20T01:06:00.000+08:00</published><updated>2012-01-20T01:07:10.786+08:00</updated><app:edited xmlns:app="http://www.w3.org/2007/app">2012-01-20T01:07:10.786+08:00</app:edited><title>What's the difference between an accession number (AC) and the entry name (ID)?</title><content type="html">&lt;br&gt;&lt;div class="gmail_quote"&gt;RT @pride_ebi: .@uniprot 101: What&amp;#39;s the difference between an accession number (AC) and the entry name (ID)? &lt;a href="http://bit.ly/Ahh2AM" target="_blank"&gt;http://www.uniprot.org/faq/6&lt;/a&gt;&lt;br&gt;   &lt;br&gt; Read it online: &lt;a href="http://twitter.com/emblebi/status/154584407729119233" target="_blank"&gt;http://twitter.com/emblebi/status/154584407729119233&lt;/a&gt;&lt;br&gt;&lt;/div&gt;&lt;br&gt; &lt;div class="blogger-post-footer"&gt;&lt;img width='1' height='1' src='https://blogger.googleusercontent.com/tracker/8959227089815463704-2641596609672811555?l=kevin-gattaca.blogspot.com' alt='' /&gt;&lt;/div&gt;
&lt;p&gt;&lt;a href="http://feedads.g.doubleclick.net/~a/lN1DyyaYJ_Rsv44vq_AE32K9V5g/0/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/lN1DyyaYJ_Rsv44vq_AE32K9V5g/0/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;br/&gt;
&lt;a href="http://feedads.g.doubleclick.net/~a/lN1DyyaYJ_Rsv44vq_AE32K9V5g/1/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/lN1DyyaYJ_Rsv44vq_AE32K9V5g/1/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;/p&gt;&lt;img src="http://feeds.feedburner.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~4/PgHtdiv2dyg" height="1" width="1"/&gt;</content><link rel="replies" type="application/atom+xml" href="http://kevin-gattaca.blogspot.com/feeds/2641596609672811555/comments/default" title="Post Comments" /><link rel="replies" type="text/html" href="http://kevin-gattaca.blogspot.com/2012/01/whats-difference-between-accession.html#comment-form" title="0 Comments" /><link rel="edit" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/2641596609672811555?v=2" /><link rel="self" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/2641596609672811555?v=2" /><link rel="alternate" type="text/html" href="http://feedproxy.google.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~3/PgHtdiv2dyg/whats-difference-between-accession.html" title="What's the difference between an accession number (AC) and the entry name (ID)?" /><author><name>Kevin</name><email>noreply@blogger.com</email><gd:image rel="http://schemas.google.com/g/2005#thumbnail" width="16" height="16" src="http://img2.blogblog.com/img/b16-rounded.gif" /></author><thr:total>0</thr:total><feedburner:origLink>http://kevin-gattaca.blogspot.com/2012/01/whats-difference-between-accession.html</feedburner:origLink></entry><entry gd:etag="W/&quot;Ck8ER3g9fip7ImA9WhRVGUQ.&quot;"><id>tag:blogger.com,1999:blog-8959227089815463704.post-5943900875353496053</id><published>2012-01-20T00:32:00.000+08:00</published><updated>2012-01-20T00:33:26.666+08:00</updated><app:edited xmlns:app="http://www.w3.org/2007/app">2012-01-20T00:33:26.666+08:00</app:edited><title>Cancer Commons is a non-profit open science initiative dedicated to improving outcomes for today's cancer patients.</title><content type="html">&lt;div&gt;This should be interesting to watch out for ... &lt;/div&gt;&lt;div&gt;&lt;br&gt;&lt;/div&gt;&lt;a href="http://cancercommons.org/about/"&gt;http://cancercommons.org/about/&lt;/a&gt;&lt;div&gt;&lt;br&gt;&lt;/div&gt;&lt;div&gt;&lt;div class="f kv" style="color:rgb(102,102,102);margin-bottom:1px;font-family:arial,sans-serif;line-height:13px;background-color:rgb(255,255,255)"&gt;  &lt;cite style="color:rgb(0,153,51);font-style:normal;display:inline-block;margin-bottom:1px"&gt;&lt;b&gt;cancercommons&lt;/b&gt;.org/&lt;/cite&gt;&lt;/div&gt;&lt;span class="st" style="line-height:1.24;color:rgb(34,34,34);font-family:arial,sans-serif;background-color:rgb(255,255,255)"&gt;&lt;em style="font-weight:bold;font-style:normal;color:rgb(0,0,0)"&gt;Cancer Commons&lt;/em&gt; is a non-profit open science initiative dedicated to improving outcomes for today&amp;#39;s cancer patients. Our goals are to: 1) give each patient the &lt;b&gt;.&lt;/b&gt;&lt;/span&gt; &lt;/div&gt; &lt;div class="blogger-post-footer"&gt;&lt;img width='1' height='1' src='https://blogger.googleusercontent.com/tracker/8959227089815463704-5943900875353496053?l=kevin-gattaca.blogspot.com' alt='' /&gt;&lt;/div&gt;
&lt;p&gt;&lt;a href="http://feedads.g.doubleclick.net/~a/025dhw8l5ftE7QZucBAl4ll96Lc/0/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/025dhw8l5ftE7QZucBAl4ll96Lc/0/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;br/&gt;
&lt;a href="http://feedads.g.doubleclick.net/~a/025dhw8l5ftE7QZucBAl4ll96Lc/1/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/025dhw8l5ftE7QZucBAl4ll96Lc/1/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;/p&gt;&lt;img src="http://feeds.feedburner.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~4/38HwW7YLFo0" height="1" width="1"/&gt;</content><link rel="replies" type="application/atom+xml" href="http://kevin-gattaca.blogspot.com/feeds/5943900875353496053/comments/default" title="Post Comments" /><link rel="replies" type="text/html" href="http://kevin-gattaca.blogspot.com/2012/01/cancer-commons-is-non-profit-open.html#comment-form" title="0 Comments" /><link rel="edit" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/5943900875353496053?v=2" /><link rel="self" type="application/atom+xml" href="http://www.blogger.com/feeds/8959227089815463704/posts/default/5943900875353496053?v=2" /><link rel="alternate" type="text/html" href="http://feedproxy.google.com/~r/MyWeblogOnBioinformaticsGenomeScienceNextGenerationSequencing/~3/38HwW7YLFo0/cancer-commons-is-non-profit-open.html" title="Cancer Commons is a non-profit open science initiative dedicated to improving outcomes for today's cancer patients." /><author><name>Kevin</name><email>noreply@blogger.com</email><gd:image rel="http://schemas.google.com/g/2005#thumbnail" width="16" height="16" src="http://img2.blogblog.com/img/b16-rounded.gif" /></author><thr:total>0</thr:total><feedburner:origLink>http://kevin-gattaca.blogspot.com/2012/01/cancer-commons-is-non-profit-open.html</feedburner:origLink></entry></feed>

