<?xml version="1.0" encoding="UTF-8"?>
<rss version="2.0"
	xmlns:content="http://purl.org/rss/1.0/modules/content/"
	xmlns:wfw="http://wellformedweb.org/CommentAPI/"
	xmlns:dc="http://purl.org/dc/elements/1.1/"
	xmlns:atom="http://www.w3.org/2005/Atom"
	xmlns:sy="http://purl.org/rss/1.0/modules/syndication/"
	xmlns:slash="http://purl.org/rss/1.0/modules/slash/"
	xmlns:georss="http://www.georss.org/georss" xmlns:geo="http://www.w3.org/2003/01/geo/wgs84_pos#" xmlns:media="http://search.yahoo.com/mrss/"
	>

<channel>
	<title>Manuel Corpas&#039; Blog</title>
	<atom:link href="http://manuelcorpas.com/feed/" rel="self" type="application/rss+xml" />
	<link>http://manuelcorpas.com</link>
	<description>Genomes, Web 2.0 and Bioethics</description>
	<lastBuildDate>Wed, 23 May 2012 15:51:10 +0000</lastBuildDate>
	<language>en</language>
	<sy:updatePeriod>hourly</sy:updatePeriod>
	<sy:updateFrequency>1</sy:updateFrequency>
	<generator>http://wordpress.com/</generator>
<cloud domain='manuelcorpas.com' port='80' path='/?rsscloud=notify' registerProcedure='' protocol='http-post' />
<image>
		<url>http://1.gravatar.com/blavatar/30b9f4f8115fc52af0bb4d7d67d33f7d?s=96&#038;d=http%3A%2F%2Fs2.wp.com%2Fi%2Fbuttonw-com.png</url>
		<title>Manuel Corpas&#039; Blog</title>
		<link>http://manuelcorpas.com</link>
	</image>
	<atom:link rel="search" type="application/opensearchdescription+xml" href="http://manuelcorpas.com/osd.xml" title="Manuel Corpas&#039; Blog" />
	<atom:link rel='hub' href='http://manuelcorpas.com/?pushpress=hub'/>
		<item>
		<title>Converting FASTQ to FASTA</title>
		<link>http://manuelcorpas.com/2012/05/21/converting-fastq-to-fasta/</link>
		<comments>http://manuelcorpas.com/2012/05/21/converting-fastq-to-fasta/#comments</comments>
		<pubDate>Mon, 21 May 2012 15:17:57 +0000</pubDate>
		<dc:creator>admin</dc:creator>
				<category><![CDATA[Genomics]]></category>
		<category><![CDATA[Tutorials]]></category>
		<category><![CDATA[code]]></category>
		<category><![CDATA[fasta]]></category>
		<category><![CDATA[fastq]]></category>
		<category><![CDATA[perl]]></category>

		<guid isPermaLink="false">http://manuelcorpas.com/?p=1559</guid>
		<description><![CDATA[A little Perl one liner I borrowed from The Edwards Lab that converts FASTQ to FASTA. Please note I had to truncate the line to make it show properly in this blog entry. $ cat file_to_covert.fq &#124; perl -e \ '$i=0;while(&#60;&#62;){if(/^\@/&#38;&#38;$i==0){s/^\@/\&#62;/;print;}elsif($i==1){print;$i=-3}$i++;}' \ &#62; output.fasta Thanks Edwards Lab!<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=manuelcorpas.com&#038;blog=5424602&#038;post=1559&#038;subd=corpasfoo&#038;ref=&#038;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>A little Perl one liner I borrowed from <a href="http://edwards.sdsu.edu/labsite/index.php/robert/289-how-to-convert-fastq-to-fasta" target="_blank">The Edwards Lab</a> that converts FASTQ to FASTA. Please note I had to truncate the line to make it show properly in this blog entry.</p>
<pre>$ cat file_to_covert.fq | perl -e \
'$i=0;while(&lt;&gt;){if(/^\@/&amp;&amp;$i==0){s/^\@/\&gt;/;print;}elsif($i==1){print;$i=-3}$i++;}' \
&gt; output.fasta</pre>
<p>Thanks Edwards Lab!</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/corpasfoo.wordpress.com/1559/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/corpasfoo.wordpress.com/1559/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/corpasfoo.wordpress.com/1559/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/corpasfoo.wordpress.com/1559/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/corpasfoo.wordpress.com/1559/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/corpasfoo.wordpress.com/1559/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/corpasfoo.wordpress.com/1559/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/corpasfoo.wordpress.com/1559/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/corpasfoo.wordpress.com/1559/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/corpasfoo.wordpress.com/1559/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/corpasfoo.wordpress.com/1559/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/corpasfoo.wordpress.com/1559/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/corpasfoo.wordpress.com/1559/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/corpasfoo.wordpress.com/1559/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=manuelcorpas.com&#038;blog=5424602&#038;post=1559&#038;subd=corpasfoo&#038;ref=&#038;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://manuelcorpas.com/2012/05/21/converting-fastq-to-fasta/feed/</wfw:commentRss>
		<slash:comments>2</slash:comments>
	
		<media:content url="http://0.gravatar.com/avatar/ad7b9d282ec00a53fee5c0d293f3f425?s=96&#38;d=wavatar" medium="image">
			<media:title type="html">manuelcorpas</media:title>
		</media:content>
	</item>
		<item>
		<title>My Personal Exome Now Publicly Released</title>
		<link>http://manuelcorpas.com/2012/05/10/1548/</link>
		<comments>http://manuelcorpas.com/2012/05/10/1548/#comments</comments>
		<pubDate>Thu, 10 May 2012 08:27:48 +0000</pubDate>
		<dc:creator>admin</dc:creator>
				<category><![CDATA[Uncategorized]]></category>

		<guid isPermaLink="false">http://manuelcorpas.com/2012/05/10/1548/</guid>
		<description><![CDATA[Reblogged from Manuel Corpas&#039; Blog: After many months of having performed the sequencing of my personal exome, I now make it available to the community for public use. I release it under a public domain license (CC0 1.0 Universal), giving you permission to use this data in any way. What is an exome? An exome is [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=manuelcorpas.com&#038;blog=5424602&#038;post=1548&#038;subd=corpasfoo&#038;ref=&#038;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<div class="reblog-post"><p class="reblog-from"><img alt='' src='http://0.gravatar.com/avatar/ad7b9d282ec00a53fee5c0d293f3f425?s=25&amp;d=wavatar' class='avatar avatar-25' height='25' width='25' /> <a href="http://manuelcorpas.com/2012/01/23/my-personal-exome-now-publicly-released/">Reblogged from Manuel Corpas&#039; Blog:</a></p><div class="wpcom-enhanced-excerpt">
<p>After many months of having performed the sequencing of my personal exome, I now make it available to the community for public use. I release it under a public domain license (<a href="http://creativecommons.org/publicdomain/zero/1.0/">CC0 1.0 Universal</a>), giving you permission to use this data in any way.</p>
What is an exome?
<p>An exome is the ~1% of my genome that encodes for proteins.</p>
 <p class="read-more"><a href="http://manuelcorpas.com/2012/01/23/my-personal-exome-now-publicly-released/" target="_self"><span>Read more&hellip;</span> 337 more words</a></p></div></div> ]]></content:encoded>
			<wfw:commentRss>http://manuelcorpas.com/2012/05/10/1548/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:content url="http://0.gravatar.com/avatar/ad7b9d282ec00a53fee5c0d293f3f425?s=96&#38;d=wavatar" medium="image">
			<media:title type="html">manuelcorpas</media:title>
		</media:content>
	</item>
		<item>
		<title>Nightmare Naming Conventions</title>
		<link>http://manuelcorpas.com/2012/03/22/nightmare-naming-conventions/</link>
		<comments>http://manuelcorpas.com/2012/03/22/nightmare-naming-conventions/#comments</comments>
		<pubDate>Thu, 22 Mar 2012 13:28:24 +0000</pubDate>
		<dc:creator>admin</dc:creator>
				<category><![CDATA[Lectures]]></category>
		<category><![CDATA[Tutorials]]></category>
		<category><![CDATA[computer science]]></category>
		<category><![CDATA[Data Analysis]]></category>
		<category><![CDATA[directory]]></category>
		<category><![CDATA[file]]></category>
		<category><![CDATA[next generation sequencing]]></category>
		<category><![CDATA[pipeline]]></category>

		<guid isPermaLink="false">http://manuelcorpas.com/?p=1486</guid>
		<description><![CDATA[One of the tasks I seem to be spending a lot time thinking about these days is how to name files and structure them in the appropriate directories so that they follow a consistent logic. This is because my current research involves development of analysis pipelines of Next Generation Sequencing Data where the output file(s) [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=manuelcorpas.com&#038;blog=5424602&#038;post=1486&#038;subd=corpasfoo&#038;ref=&#038;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>One of the tasks I seem to be spending a lot time thinking about these days is how to name files and structure them in the appropriate directories so that they follow a consistent logic. This is because my current research involves development of analysis pipelines of Next Generation Sequencing Data where the output file(s) of a program(s) is the input to the next. These processing steps allow raw data straight out of the machine to help answer the biological questions for which the experiments were run on the first place.</p>
<p>File and directory naming conventions may sound like a trivial thing to do but I have found that their complexity increases exponentially when many components are run. To illustrate my current approach to tackling this problem, I present here a simple example. Suppose a project (&#8216;project_name&#8217;) that runs two programs, &#8216;program_1&#8242; and &#8216;program_2&#8242;. Each time the pipeline is run, input files may vary and so I create a new &#8216;job_name&#8217; for each run. I have come up with this directory architecture:</p>
<pre>/project_name
/project_name/data
/project_name/data/job_name_1
/project_name/data/job_name_1/input_data_type_1
/project_name/data/job_name_1/input_data_type_2
/project_name/data/job_name_1/input_data_type_3
/project_name/results
/project_name/results/job_name_1/program_1
/project_name/results/job_name_1/program_1/output_1
/project_name/results/job_name_1/program_1/output_2
...
/project_name/results/job_name/program_2/output_1
/project_name/results/job_name/program_2/output_1
...</pre>
<p>What would happen if instead of running 2 programs as I did above I run 5 or 6? And what if for each input data file I had replicates? What about maximising the number steps taken in parallel? You can start to see that the thing really gets complicated.</p>
<p>File and directory naming conventions is something that I am teaching myself, but any directives or systematic methods taught during my computer science student years would have come in handy now. In future bioinformatics lectures I teach I will definitively challenge my students to think about this issue very carefully.</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/corpasfoo.wordpress.com/1486/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/corpasfoo.wordpress.com/1486/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/corpasfoo.wordpress.com/1486/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/corpasfoo.wordpress.com/1486/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/corpasfoo.wordpress.com/1486/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/corpasfoo.wordpress.com/1486/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/corpasfoo.wordpress.com/1486/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/corpasfoo.wordpress.com/1486/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/corpasfoo.wordpress.com/1486/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/corpasfoo.wordpress.com/1486/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/corpasfoo.wordpress.com/1486/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/corpasfoo.wordpress.com/1486/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/corpasfoo.wordpress.com/1486/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/corpasfoo.wordpress.com/1486/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=manuelcorpas.com&#038;blog=5424602&#038;post=1486&#038;subd=corpasfoo&#038;ref=&#038;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://manuelcorpas.com/2012/03/22/nightmare-naming-conventions/feed/</wfw:commentRss>
		<slash:comments>9</slash:comments>
	
		<media:content url="http://0.gravatar.com/avatar/ad7b9d282ec00a53fee5c0d293f3f425?s=96&#38;d=wavatar" medium="image">
			<media:title type="html">manuelcorpas</media:title>
		</media:content>
	</item>
		<item>
		<title>From Life in the Server to Life in the Cluster</title>
		<link>http://manuelcorpas.com/2012/03/12/from-life-in-the-server-to-life-in-the-cluster/</link>
		<comments>http://manuelcorpas.com/2012/03/12/from-life-in-the-server-to-life-in-the-cluster/#comments</comments>
		<pubDate>Mon, 12 Mar 2012 16:42:07 +0000</pubDate>
		<dc:creator>admin</dc:creator>
				<category><![CDATA[Opinion]]></category>
		<category><![CDATA[Cloud Computing]]></category>
		<category><![CDATA[computational biology]]></category>
		<category><![CDATA[databases]]></category>
		<category><![CDATA[next generation sequencing]]></category>

		<guid isPermaLink="false">http://manuelcorpas.com/?p=1462</guid>
		<description><![CDATA[Life in early 2011: Work around a server, one process, Gigabyte datasets. Life in early 2012: Work around a cluster, many processes, Terabyte datasets. I remember the old days, when I had to pipette to run an experiment. Today I do not have to pipette, I run a command or pipeline in a computer terminal connecting remotely [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=manuelcorpas.com&#038;blog=5424602&#038;post=1462&#038;subd=corpasfoo&#038;ref=&#038;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<h3>Life in early <strong>2011:</strong></h3>
<ul>
<li>Work around a server, one process, Gigabyte datasets.</li>
</ul>
<h3>Life in early <strong>2012:</strong></h3>
<ul>
<li>Work around a cluster, many processes, Terabyte datasets.</li>
</ul>
<p>I remember the old days, when I had to pipette to run an experiment. Today I do not have to pipette, I run a command or pipeline in a computer terminal connecting remotely to a cluster of a few thousand nodes. Sometimes it might be quicker to run a PCR than running my workflow script.</p>
<p>I consider a privilege being &#8220;drown&#8221; in data. Why? Because this is the future. More data brings more hypotheses and more hypotheses bring more knowledge. One either learns to surf the waves or a tsunami ends up catching one soon enough.</p>
<p>How does it feel from the inside? It feels exciting, overwhelmingly exhilarating! It feels like wanting to surf in a sea of data yet happy to be able to barely keep afloat: this is the inevitable fate of those genome bioinformaticians dealing with <a href="http://en.wikipedia.org/wiki/DNA_sequencing#High-throughput_sequencing" target="_blank">Next Generation Sequencing </a>data.</p>
<h3>What next in my todo list?</h3>
<p><a href="http://en.wikipedia.org/wiki/Cloud_computing" target="_blank">Cloud computing</a>. I am counting the days when my experiments will be run in the cloud, not the cluster.</p>
<div class="wp-caption aligncenter" style="width: 434px"><img class="  " src="http://upload.wikimedia.org/wikipedia/commons/b/b5/Cloud_computing.svg" alt="" width="424" height="383" /><p class="wp-caption-text">By Sam Johnston (CC BY-SA 3.0 license)</p></div>
<p>I look forward to welcoming you to the data feast. Will you join?</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/corpasfoo.wordpress.com/1462/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/corpasfoo.wordpress.com/1462/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/corpasfoo.wordpress.com/1462/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/corpasfoo.wordpress.com/1462/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/corpasfoo.wordpress.com/1462/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/corpasfoo.wordpress.com/1462/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/corpasfoo.wordpress.com/1462/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/corpasfoo.wordpress.com/1462/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/corpasfoo.wordpress.com/1462/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/corpasfoo.wordpress.com/1462/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/corpasfoo.wordpress.com/1462/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/corpasfoo.wordpress.com/1462/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/corpasfoo.wordpress.com/1462/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/corpasfoo.wordpress.com/1462/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=manuelcorpas.com&#038;blog=5424602&#038;post=1462&#038;subd=corpasfoo&#038;ref=&#038;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://manuelcorpas.com/2012/03/12/from-life-in-the-server-to-life-in-the-cluster/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:content url="http://0.gravatar.com/avatar/ad7b9d282ec00a53fee5c0d293f3f425?s=96&#38;d=wavatar" medium="image">
			<media:title type="html">manuelcorpas</media:title>
		</media:content>

		<media:content url="http://upload.wikimedia.org/wikipedia/commons/b/b5/Cloud_computing.svg" medium="image" />
	</item>
		<item>
		<title>Visualizing Your DNA Genotype Profile in a Blanket</title>
		<link>http://manuelcorpas.com/2012/03/06/visualizing-your-dna-genotype-profile-in-a-blanket/</link>
		<comments>http://manuelcorpas.com/2012/03/06/visualizing-your-dna-genotype-profile-in-a-blanket/#comments</comments>
		<pubDate>Tue, 06 Mar 2012 09:16:31 +0000</pubDate>
		<dc:creator>admin</dc:creator>
				<category><![CDATA[Personal Genomes]]></category>
		<category><![CDATA[Technology]]></category>
		<category><![CDATA[23andMe]]></category>
		<category><![CDATA[art]]></category>
		<category><![CDATA[blanket]]></category>
		<category><![CDATA[Corpas family]]></category>
		<category><![CDATA[ingenuity]]></category>
		<category><![CDATA[textile]]></category>

		<guid isPermaLink="false">http://manuelcorpas.com/?p=1450</guid>
		<description><![CDATA[I have encountered a rather ingenious idea in Ben Landau&#8217;s blog. You may have read that Mike Cariaso, founder of SNPedia, created a visualization graph with the genotype of my family where my family member genotypes were compared against each other. Visualization patterns were created that compared each chromosome against every other. To show how [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=manuelcorpas.com&#038;blog=5424602&#038;post=1450&#038;subd=corpasfoo&#038;ref=&#038;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>I have encountered a rather <a href="http://benlandau.com/?p=1300" target="_blank">ingenious idea in Ben Landau&#8217;s blog</a>. You may have read that Mike Cariaso, founder of <a href="http://www.snpedia.com/index.php/SNPedia" target="_blank">SNPedia</a>, created a <a href="http://files.snpedia.org/reports/promethease_data/promethease_corpas_family_comparison_newfamily.html" target="_blank">visualization graph with the genotype of my family</a> where my family member genotypes were compared against each other. Visualization patterns were created that compared each chromosome against every other. To show how this actually looks, I have taken from Mike&#8217;s tool an image that shows the comparison of 23andMe genotypes from my mom and dad (x and y axis respectively), each pixel being a SNP and different colors representing match (light blue), half match (dark blue) and conflict (red).</p>
<div id="attachment_1451" class="wp-caption aligncenter" style="width: 416px"><a href="http://files.snpedia.org/reports/promethease_data/promethease_corpas_family_comparison_newfamily.html"><img class="size-full wp-image-1451 " title="chr1-mom-dad" src="http://corpasfoo.files.wordpress.com/2012/03/chr1-mom-dad.png?w=480" alt=""   /></a><p class="wp-caption-text">Chromosome 1. Comparison of Corpas mum and dad 23andMe genotypes using SNPedia's visualization tool.</p></div>
<p>It seems that Ben has taken this idea further and designed a blanket that incorporates chromosomal patterns for a complete 23andMe genotype. I quote here the description for this blanket from the Ben&#8217;s blog:</p>
<blockquote><p>First Gift is a precious blanket which compares the digital DNA data of a child with their parents. If the child’s genes are edited, these changes will mask the parent’s DNA with synthesized DNA. The blanket itself represents a sacred and fragile heirloom, where tampering with it could potentially lead to frayed edges and uncertain outcomes. This first genetic gift will be with the child for life, and will also be inherited by future generations.</p></blockquote>
<p>Although technically speaking this visualization shows comparisons between any two individuals, and not between the two parents and child as it is mentioned in the blog, I am still amazed at the craftiness and ingenuity of this idea. And since it uses data from the Corpas family dataset, I hereby report it in <em>Manuel Corpas&#8217; Blog</em>. Here is <a href="http://manuelcorpas.com/2011/06/06/benefits-for-publishing-family-genomes-on-the-internet/" target="_blank">another unpredicted</a> and surprising effect from publishing our family genomes on the Internet.</p>
<p>To finish this blog entry, I borrow from Ben a complete profile view of my sister&#8217;s genotype patterned in his &#8216;First Gift&#8217; blanket. According to him, the weaving of the blanket was done at the <a href="http://www.textielmuseum.nl/" target="_blank">Tilburg Textile Museum</a> in Amsterdam.</p>
<div id="attachment_1452" class="wp-caption aligncenter" style="width: 397px"><img class="size-full wp-image-1452" title="blanket-ben-landau" src="http://corpasfoo.files.wordpress.com/2012/03/blanket-ben-landau.png?w=480" alt=""   /><p class="wp-caption-text">Blanket showing genotype pattern comparisons in my sister's 23andMe genotype. Each shape in theory corresponds to a chromosome comparison, although I still need to understand which chromosome represents each of the 25 shapes above (Humans have 22 autosomes + 1 sexual pair + mitochondrial).</p></div>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/corpasfoo.wordpress.com/1450/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/corpasfoo.wordpress.com/1450/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/corpasfoo.wordpress.com/1450/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/corpasfoo.wordpress.com/1450/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/corpasfoo.wordpress.com/1450/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/corpasfoo.wordpress.com/1450/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/corpasfoo.wordpress.com/1450/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/corpasfoo.wordpress.com/1450/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/corpasfoo.wordpress.com/1450/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/corpasfoo.wordpress.com/1450/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/corpasfoo.wordpress.com/1450/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/corpasfoo.wordpress.com/1450/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/corpasfoo.wordpress.com/1450/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/corpasfoo.wordpress.com/1450/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=manuelcorpas.com&#038;blog=5424602&#038;post=1450&#038;subd=corpasfoo&#038;ref=&#038;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://manuelcorpas.com/2012/03/06/visualizing-your-dna-genotype-profile-in-a-blanket/feed/</wfw:commentRss>
		<slash:comments>1</slash:comments>
	
		<media:content url="http://0.gravatar.com/avatar/ad7b9d282ec00a53fee5c0d293f3f425?s=96&#38;d=wavatar" medium="image">
			<media:title type="html">manuelcorpas</media:title>
		</media:content>

		<media:content url="http://corpasfoo.files.wordpress.com/2012/03/chr1-mom-dad.png" medium="image">
			<media:title type="html">chr1-mom-dad</media:title>
		</media:content>

		<media:content url="http://corpasfoo.files.wordpress.com/2012/03/blanket-ben-landau.png" medium="image">
			<media:title type="html">blanket-ben-landau</media:title>
		</media:content>
	</item>
		<item>
		<title>Bye Sanger, Hello TGAC</title>
		<link>http://manuelcorpas.com/2012/02/14/bye-sanger-hello-tgac/</link>
		<comments>http://manuelcorpas.com/2012/02/14/bye-sanger-hello-tgac/#comments</comments>
		<pubDate>Tue, 14 Feb 2012 12:10:21 +0000</pubDate>
		<dc:creator>admin</dc:creator>
				<category><![CDATA[Bioinformatics]]></category>
		<category><![CDATA[Opinion]]></category>
		<category><![CDATA[Personal]]></category>
		<category><![CDATA[Bisulfite-seq]]></category>
		<category><![CDATA[ChIP-seq]]></category>
		<category><![CDATA[epigenomics]]></category>
		<category><![CDATA[gene regulation]]></category>
		<category><![CDATA[job openings]]></category>
		<category><![CDATA[opportunities]]></category>
		<category><![CDATA[RNA-seq]]></category>
		<category><![CDATA[Sanger]]></category>
		<category><![CDATA[TGAC]]></category>
		<category><![CDATA[transcriptomics]]></category>

		<guid isPermaLink="false">http://manuelcorpas.com/2012/02/14/bye-sanger-hello-tgac/</guid>
		<description><![CDATA[After 3.5 exciting years at the Wellcome Trust Sanger Institute, working as senior developer for the DECIPHER database, it was time to start a new venture. As of February 13th, I am the Project Leader of Plant and Animal Genomes at The Genome Analysis Centre (TGAC). TGAC is specialized in the study of plants, microbes [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=manuelcorpas.com&#038;blog=5424602&#038;post=1432&#038;subd=corpasfoo&#038;ref=&#038;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>After 3.5 exciting years at the <a href="http://www.sanger.ac.uk" target="_blank">Wellcome Trust Sanger Institute</a>, working as senior developer for the <a href="https://decipher.sanger.ac.uk" target="_blank">DECIPHER database</a>, it was time to start a new venture. As of February 13th, I am the Project Leader of Plant and Animal Genomes at The Genome Analysis Centre (<a href="http://www.tgac.ac.uk/" target="_blank">TGAC</a>). TGAC is specialized in the study of plants, microbes and animal genomes with the view to facilitate the development of new genomics-based biology in academic and commercial sectors.</p>
<p>In my new role at TGAC I will be leading the group of computational biologists working on plant and animal genome analyses within the Genome Analysis Team. Our aims will include the organization of the analysis of sequence generated at TGAC, engaging with internal and external collaborators, nationally and internationally. A lot of the work will focus on (but will not solely be restricted to) the analysis of <a href="http://en.wikipedia.org/wiki/RNA-Seq" target="_blank">RNA-seq</a>, <a href="http://en.wikipedia.org/wiki/Chip-sequencing" target="_blank">ChIP-seq</a> and <a href="http://en.wikipedia.org/wiki/Bisulfite_sequencing" target="_blank">Bisulphite sequencing</a> data for the purposes of understanding how genes are regulated.</p>
<h3>Coming Opportunities</h3>
<p>I will be expecting to have openings in my group in the near future for student projects (Masters and PhD) as well as research associates and technicians. Meanwhile, if you are interested in joining or simply discussing ideas or potential projects in the the broad areas of transcriptomics, epigenomics and gene regulation, you are always welcome to drop me a line.</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/corpasfoo.wordpress.com/1432/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/corpasfoo.wordpress.com/1432/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/corpasfoo.wordpress.com/1432/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/corpasfoo.wordpress.com/1432/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/corpasfoo.wordpress.com/1432/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/corpasfoo.wordpress.com/1432/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/corpasfoo.wordpress.com/1432/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/corpasfoo.wordpress.com/1432/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/corpasfoo.wordpress.com/1432/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/corpasfoo.wordpress.com/1432/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/corpasfoo.wordpress.com/1432/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/corpasfoo.wordpress.com/1432/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/corpasfoo.wordpress.com/1432/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/corpasfoo.wordpress.com/1432/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=manuelcorpas.com&#038;blog=5424602&#038;post=1432&#038;subd=corpasfoo&#038;ref=&#038;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://manuelcorpas.com/2012/02/14/bye-sanger-hello-tgac/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:content url="http://0.gravatar.com/avatar/ad7b9d282ec00a53fee5c0d293f3f425?s=96&#38;d=wavatar" medium="image">
			<media:title type="html">manuelcorpas</media:title>
		</media:content>
	</item>
		<item>
		<title>My Personal Exome Analysis (Part I): First Findings</title>
		<link>http://manuelcorpas.com/2012/02/06/my-personal-exome-analysis-part-i-first-findings/</link>
		<comments>http://manuelcorpas.com/2012/02/06/my-personal-exome-analysis-part-i-first-findings/#comments</comments>
		<pubDate>Mon, 06 Feb 2012 09:57:41 +0000</pubDate>
		<dc:creator>admin</dc:creator>
				<category><![CDATA[Personal Genomes]]></category>
		<category><![CDATA[BAM]]></category>
		<category><![CDATA[Data Analysis]]></category>
		<category><![CDATA[Exome]]></category>
		<category><![CDATA[public license]]></category>
		<category><![CDATA[VCF]]></category>

		<guid isPermaLink="false">http://manuelcorpas.com/?p=1309</guid>
		<description><![CDATA[You may have read about the release of my raw personal exome data in a previous entry. Although users were not required to report back any finding derived from this data, my hope was that some of them would return with interesting results. The response to this call has been overwhelmingly positive and in less than [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=manuelcorpas.com&#038;blog=5424602&#038;post=1309&#038;subd=corpasfoo&#038;ref=&#038;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>You may have read about the <a href="http://manuelcorpas.com/2012/01/23/my-personal-exome-now-publicly-released/" target="_blank">release of my raw personal exome data</a> in a previous entry. Although users were not required to report back any finding derived from this data, my hope was that some of them would return with interesting results. The response to this call has been overwhelmingly positive and in less than a week <a href="http://www.ogt.co.uk/" target="_blank">Oxford Gene Technology</a> (OGT) has kindly provided me with a report to facilitate the analysis of my personal exome. OGT’s donation has allowed the start of the “My Personal Exome Analysis” series in this blog. In Part I, I will be sharing some data and preliminary metrics gathered from OGT’s exome analysis services. I will continue to report further findings and insights as I keep exploring my personal exome at the deepest level that technology (and budget) currently allows.</p>
<p>In addition, I release under a <a href="http://creativecommons.org/publicdomain/zero/1.0/" target="_blank">CC0</a> license the following sequence-derived data from OGT’s services: a) the aligned and processed <a href="http://23andus.org/manuel.bam" target="_blank">BAM file</a>, b) the <a href="http://23andus.org/manuel.bam.bai" target="_blank">BAM file index</a> and c) the compressed <a href="http://23andus.org/manuel_BOTH_SNPINDELfilter_PASSED.vcf.gz" target="_blank">VCF file</a>. The <em>BAM file</em> (.bam) is the binary version of a tab-delimited text file that contains sequence alignment data. The <em>BAM file index</em> (.bai) provides fast random access to the BAM file. The compressed <em>VCF file</em> (.vcf.gz) describes variant calls in text format. These format types are industry standard and can be used in a variety of research contexts involving genome visualization and analysis.</p>
<p>Looking at the summary metrics in OGT’s report, my personal exome produces:</p>
<ul>
<li><strong>30,702</strong> variations to the reference genome (GRCh37)</li>
<li><strong>5,565</strong> non synonymous coding variations with consequences</li>
<li>A minimum of <strong>61.42%</strong> of the on-target regions, covered with a depth of at least 20x (remember that this data was sequenced by the BGI).</li>
<li>A total of <strong>2.54</strong> Gigabases of sequence data read and aligned at high quality.</li>
</ul>
<p>Figure 1 is a screenshot of the OGT report showing the summary of all variants identified, including those in dbSNP release 132.</p>
<p><a href="http://corpasfoo.files.wordpress.com/2012/02/fig1.png"><img class="aligncenter size-full wp-image-1310" title="fig1" src="http://corpasfoo.files.wordpress.com/2012/02/fig1.png?w=480" alt=""   /></a></p>
<p>Figure 2 summarizes all novel variants identified by OGT, filtering those in dbSNP release 132.</p>
<p><a href="http://corpasfoo.files.wordpress.com/2012/02/fig2.png"><img class="aligncenter size-full wp-image-1311" title="fig2" src="http://corpasfoo.files.wordpress.com/2012/02/fig2.png?w=480" alt=""   /></a></p>
<h2>Download of BAM and VCF Files</h2>
<p>You are allowed to use my personal exome’s BAM and VCF files under a completely free license <a href="http://creativecommons.org/publicdomain/zero/1.0/" target="_blank">CC0</a>. You can add this data to any database or resource with no need for attribution. Any usage or finding derived from this data communicated back to me will be shared (if considered noteworthy) through this blog or publication, with due attribution or request for coathorship in papers.</p>
<ul>
<li><a href="http://23andus.org/manuel.bam" target="_blank">Aligned BAM file download</a></li>
<li><a href="http://23andus.org/manuel.bam.bai" target="_blank">Index BAM file download</a></li>
<li><a href="http://23andus.org/manuel_BOTH_SNPINDELfilter_PASSED.vcf.gz" target="_blank">VCF file download</a></li>
</ul>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/corpasfoo.wordpress.com/1309/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/corpasfoo.wordpress.com/1309/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/corpasfoo.wordpress.com/1309/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/corpasfoo.wordpress.com/1309/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/corpasfoo.wordpress.com/1309/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/corpasfoo.wordpress.com/1309/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/corpasfoo.wordpress.com/1309/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/corpasfoo.wordpress.com/1309/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/corpasfoo.wordpress.com/1309/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/corpasfoo.wordpress.com/1309/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/corpasfoo.wordpress.com/1309/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/corpasfoo.wordpress.com/1309/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/corpasfoo.wordpress.com/1309/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/corpasfoo.wordpress.com/1309/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=manuelcorpas.com&#038;blog=5424602&#038;post=1309&#038;subd=corpasfoo&#038;ref=&#038;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://manuelcorpas.com/2012/02/06/my-personal-exome-analysis-part-i-first-findings/feed/</wfw:commentRss>
		<slash:comments>4</slash:comments>
	
		<media:content url="http://0.gravatar.com/avatar/ad7b9d282ec00a53fee5c0d293f3f425?s=96&#38;d=wavatar" medium="image">
			<media:title type="html">manuelcorpas</media:title>
		</media:content>

		<media:content url="http://corpasfoo.files.wordpress.com/2012/02/fig1.png" medium="image">
			<media:title type="html">fig1</media:title>
		</media:content>

		<media:content url="http://corpasfoo.files.wordpress.com/2012/02/fig2.png" medium="image">
			<media:title type="html">fig2</media:title>
		</media:content>
	</item>
		<item>
		<title>A Personal View of Personal Genomics</title>
		<link>http://manuelcorpas.com/2012/01/30/a-personal-view-of-personal-genomics/</link>
		<comments>http://manuelcorpas.com/2012/01/30/a-personal-view-of-personal-genomics/#comments</comments>
		<pubDate>Mon, 30 Jan 2012 10:54:44 +0000</pubDate>
		<dc:creator>admin</dc:creator>
				<category><![CDATA[Opinion]]></category>
		<category><![CDATA[Personal]]></category>
		<category><![CDATA[DTC]]></category>
		<category><![CDATA[Exome]]></category>
		<category><![CDATA[Human Genome]]></category>
		<category><![CDATA[personal genomes]]></category>
		<category><![CDATA[recreational genomics]]></category>

		<guid isPermaLink="false">http://manuelcorpas.com/?p=1305</guid>
		<description><![CDATA[In this interview I talk about my experiences in analyzing my genome and the genomes of my family. Here I also introduce the motivation and future plans for the analysis of my personal exome (i.e. all coding regions in my genome). Some further information regarding my family experience of personal genomics can be found in a recent [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=manuelcorpas.com&#038;blog=5424602&#038;post=1305&#038;subd=corpasfoo&#038;ref=&#038;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p><span style="text-align:center; display: block;"><a href="http://manuelcorpas.com/2012/01/30/a-personal-view-of-personal-genomics/"><img src="http://img.youtube.com/vi/MkW_MqYz7a0/2.jpg" alt="" /></a></span></p>
<p>In this interview I talk about my experiences in analyzing my genome and the genomes of my family. Here I also introduce the motivation and future plans for the analysis of my personal <a href="http://en.wikipedia.org/wiki/Exome" target="_blank">exome</a> (i.e. all coding regions in my genome).</p>
<p>Some further information regarding my family experience of personal genomics can be found in <a href="http://www.springerlink.com/content/481v7507kv336n07/fulltext.pdf" target="_blank">a recent publication</a>.</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/corpasfoo.wordpress.com/1305/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/corpasfoo.wordpress.com/1305/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/corpasfoo.wordpress.com/1305/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/corpasfoo.wordpress.com/1305/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/corpasfoo.wordpress.com/1305/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/corpasfoo.wordpress.com/1305/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/corpasfoo.wordpress.com/1305/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/corpasfoo.wordpress.com/1305/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/corpasfoo.wordpress.com/1305/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/corpasfoo.wordpress.com/1305/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/corpasfoo.wordpress.com/1305/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/corpasfoo.wordpress.com/1305/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/corpasfoo.wordpress.com/1305/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/corpasfoo.wordpress.com/1305/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=manuelcorpas.com&#038;blog=5424602&#038;post=1305&#038;subd=corpasfoo&#038;ref=&#038;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://manuelcorpas.com/2012/01/30/a-personal-view-of-personal-genomics/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:content url="http://0.gravatar.com/avatar/ad7b9d282ec00a53fee5c0d293f3f425?s=96&#38;d=wavatar" medium="image">
			<media:title type="html">manuelcorpas</media:title>
		</media:content>
	</item>
		<item>
		<title>My Personal Exome Now Publicly Released</title>
		<link>http://manuelcorpas.com/2012/01/23/my-personal-exome-now-publicly-released/</link>
		<comments>http://manuelcorpas.com/2012/01/23/my-personal-exome-now-publicly-released/#comments</comments>
		<pubDate>Mon, 23 Jan 2012 11:34:51 +0000</pubDate>
		<dc:creator>admin</dc:creator>
				<category><![CDATA[Genomics]]></category>
		<category><![CDATA[Personal]]></category>
		<category><![CDATA[Personal Genomes]]></category>
		<category><![CDATA[Exome]]></category>
		<category><![CDATA[fastq]]></category>
		<category><![CDATA[personal genomes]]></category>

		<guid isPermaLink="false">http://manuelcorpas.com/?p=1284</guid>
		<description><![CDATA[After many months of having performed the sequencing of my personal exome, I now make it available to the community for public use. I release it under a public domain license (CC0 1.0 Universal), giving you permission to use this data in any way. What is an exome? An exome is the ~1% of my genome [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=manuelcorpas.com&#038;blog=5424602&#038;post=1284&#038;subd=corpasfoo&#038;ref=&#038;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>After many months of having performed the sequencing of my personal exome, I now make it available to the community for public use. I release it under a public domain license (<a href="http://creativecommons.org/publicdomain/zero/1.0/" rel="license">CC0 1.0 Universal</a>), giving you permission to use this data in any way.</p>
<h4>What is an exome?</h4>
<p>An exome is the ~1% of my genome that encodes for proteins.</p>
<h4>Why do I release my personal exome?</h4>
<p>When my family and myself made our genotypes available through the Internet, we immediately received results from researchers around the world who took our data for analysis and came back with interesting results. As a result of this, we have been able to learn much about ourselves. I have reported this in a previous entry on this blog entitled &#8220;<a href="http://manuelcorpas.com/2011/06/06/benefits-for-publishing-family-genomes-on-the-internet/" target="_blank">Benefits for Publishing Family Genomes on the Internet</a>&#8220;. I now follow the same principle: if I make my exome available for people to analyse it, I can expect that some researchers may come back with interesting results.</p>
<h4>What data do I actually release?</h4>
<p>I release my 4 FastQ files that were given to me by my sequencing provider. This is the same kind of information that 23andMe gives in their current exome analysis offer. This information basically consists of raw reads that need to be aligned to a reference assembly. Once aligned, interesting variation data can be inferred.</p>
<h4>What do I ask in return?</h4>
<p>Nothing. I do appeal though to the good will of potential users to report back to me anything interesting they might find.</p>
<h4>How big are the files?</h4>
<p>They are huge. On average they are about 0.6 Gb per file and I have 4 of these. That means that it can take several hours for each file to be downloaded. Be patient!</p>
<h4>Where can I get them?</h4>
<p>Here:</p>
<ol>
<li><a href="http://23andus.org/exome-file1.fq.gz">File 1</a></li>
<li><a href="http://23andus.org/exome-file2.fq.gz">File 2</a></li>
<li><a href="http://23andus.org/exome-file3.fq.gz">File 3</a></li>
<li><a href="http://23andus.org/exome-file4.fq.gz">File 4</a></li>
</ol>
<h4><span id="more-1284"></span></h4>
<h4>How did I get my personal exome sequenced?</h4>
<p>Completely independently. If you want to know the story on how I did it, please refer to my blog entries &#8220;Getting My Genome Sequencing Done&#8221; <a href="http://manuelcorpas.com/2011/07/12/getting-my-genome-sequencing-done-part-i/" target="_blank">Part I</a> and <a href="http://manuelcorpas.com/2011/09/12/getting-my-genome-sequencing-done-part-ii/" target="_blank">Part II</a>. As it is implied there, I managed to get my personal genome sequenced by knocking on quite a few doors and then finding someone who would sponsor me to do so. In fact, part of this exercise&#8217;s aim was to prove that it is possible now a days for ordinary citizens to get their genomes sequenced if they so wish.</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/corpasfoo.wordpress.com/1284/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/corpasfoo.wordpress.com/1284/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/corpasfoo.wordpress.com/1284/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/corpasfoo.wordpress.com/1284/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/corpasfoo.wordpress.com/1284/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/corpasfoo.wordpress.com/1284/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/corpasfoo.wordpress.com/1284/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/corpasfoo.wordpress.com/1284/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/corpasfoo.wordpress.com/1284/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/corpasfoo.wordpress.com/1284/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/corpasfoo.wordpress.com/1284/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/corpasfoo.wordpress.com/1284/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/corpasfoo.wordpress.com/1284/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/corpasfoo.wordpress.com/1284/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=manuelcorpas.com&#038;blog=5424602&#038;post=1284&#038;subd=corpasfoo&#038;ref=&#038;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://manuelcorpas.com/2012/01/23/my-personal-exome-now-publicly-released/feed/</wfw:commentRss>
		<slash:comments>14</slash:comments>
	
		<media:content url="http://0.gravatar.com/avatar/ad7b9d282ec00a53fee5c0d293f3f425?s=96&#38;d=wavatar" medium="image">
			<media:title type="html">manuelcorpas</media:title>
		</media:content>
	</item>
		<item>
		<title>Converting Genes and Genomic Features From NCBI36 to GRCh37</title>
		<link>http://manuelcorpas.com/2012/01/10/converting-genes-and-genomic-features-between-ncbi36-to-grch37/</link>
		<comments>http://manuelcorpas.com/2012/01/10/converting-genes-and-genomic-features-between-ncbi36-to-grch37/#comments</comments>
		<pubDate>Tue, 10 Jan 2012 15:00:12 +0000</pubDate>
		<dc:creator>admin</dc:creator>
				<category><![CDATA[Bioinformatics]]></category>
		<category><![CDATA[Genomics]]></category>
		<category><![CDATA[Tutorials]]></category>
		<category><![CDATA[gene]]></category>
		<category><![CDATA[GRCh37]]></category>
		<category><![CDATA[ncbi36]]></category>
		<category><![CDATA[remap]]></category>

		<guid isPermaLink="false">http://manuelcorpas.com/?p=1273</guid>
		<description><![CDATA[The Human Genome is a like map where features and genes are mapped to. As techniques improve, our fine-grained resolution for that map increases and new versions are released every few years. When a new coordinate reference map (or assembly) for the Human Genome is released, it produces lots of headaches for those who work [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=manuelcorpas.com&#038;blog=5424602&#038;post=1273&#038;subd=corpasfoo&#038;ref=&#038;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>The Human Genome is a like map where features and genes are mapped to. As techniques improve, our fine-grained resolution for that map increases and new versions are released every few years. When a new coordinate reference map (or assembly) for the Human Genome is released, it produces lots of headaches for those who work in the field as it means that the locations of genes, chromosomal bands and other features like Single Nucleotide Polymorphisms (SNPs) or Copy Number Variation (CNVs) change.</p>
<p>In order to have the most up-to-date version for the Human Genome set of genes and features sometimes it is necessary to convert from one assembly to another. In the past I have written a tutorial on how to <a href="http://manuelcorpas.com/2011/02/02/838/" target="_blank">remap from NCBI36 to GRCh37 human assemblies using liftOver</a>. In this tutorial I present a simple step-by-step guide for feature remapping using NCBI&#8217;s remapping tool.</p>
<p><strong>Important:</strong></p>
<p>Please make sure you know in advance the assembly to which your aberration data is currently mapped to. If by mistake you remap an aberration already in GRCh37 to GRCh37 you will get new coordinates for the region mapped to the wrong coordinates.</p>
<p>The NCBI provides a web facility to convert coordinates from one assembly into another. To convert coordinates using their genome remapping service do the following:</p>
<ol>
<li>Make sure that your data is in BED format,  e.g. “chr3            100000 999990 myId0000123” -&gt; CNV aberration in NCBI36/hg18</li>
</ol>
<ul>
<li>Please note that each field is separated by a tab and each line by a character return. Please follow this strictly or the remapping tool may throw an error.</li>
<li>Add as many lines as aberrations you would like to remap</li>
</ul>
<ol>
<li>Go to the NCBI Remap page:</li>
</ol>
<ul>
<li><a href="http://www.ncbi.nlm.nih.gov/genome/tools/remap/" rel="nofollow">http://www.ncbi.nlm.nih.gov/genome/tools/remap/</a></li>
</ul>
<ol>
<li>Select “Organism for source data” Homo Sapiens, “Source Assembly” NCBI36 (hg18) and “Target Assembly” GRCh37 (hg19)</li>
<li>Please leave all “Remapping Options” (Minimum ratio of bases that must remap, etc) with default values</li>
<li>Select for “Input format” BED, “Output format” Same as input</li>
<li>Paste your aberration in the input box where it says “Paste data here” and hit submit at the bottom of the page</li>
<li>Wait until results are returned</li>
<li>To retrieve results download “Mapping Report”, which is in excel format or alternatively Mapping report Sample in the results page</li>
</ol>
<p><a href="http://corpasfoo.files.wordpress.com/2012/01/screen-shot-2012-01-10-at-11-02-50-am.png"><img class="aligncenter size-full wp-image-1274" title="result remapping tool" src="http://corpasfoo.files.wordpress.com/2012/01/screen-shot-2012-01-10-at-11-02-50-am.png?w=480" alt=""   /></a></p>
<p>Please note that your aberration may remap to more than one location. I recommend that you manually check the coordinates and select the most appropriate of the doubly remapped aberration in the new assembly. Please also note that your aberration may not remap because the region is partially or entirely deleted in the new assembly or split in GRCh37. In this case I recommend that you use another start or end point position, maybe use the start/end of alternative probes until you find a region where it maps.</p>
<p>Another possibility could be to look at the genes for the region in the old assembly and select a region in GRCh37 that includes the same genes as in NCBI36. Each of these solutions requires careful deliberation and may not be applicable to your particular case (e.g. genes in different chromosomes would not allow remapping based on genes).</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/corpasfoo.wordpress.com/1273/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/corpasfoo.wordpress.com/1273/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/corpasfoo.wordpress.com/1273/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/corpasfoo.wordpress.com/1273/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/corpasfoo.wordpress.com/1273/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/corpasfoo.wordpress.com/1273/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/corpasfoo.wordpress.com/1273/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/corpasfoo.wordpress.com/1273/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/corpasfoo.wordpress.com/1273/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/corpasfoo.wordpress.com/1273/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/corpasfoo.wordpress.com/1273/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/corpasfoo.wordpress.com/1273/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/corpasfoo.wordpress.com/1273/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/corpasfoo.wordpress.com/1273/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=manuelcorpas.com&#038;blog=5424602&#038;post=1273&#038;subd=corpasfoo&#038;ref=&#038;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://manuelcorpas.com/2012/01/10/converting-genes-and-genomic-features-between-ncbi36-to-grch37/feed/</wfw:commentRss>
		<slash:comments>2</slash:comments>
	
		<media:content url="http://0.gravatar.com/avatar/ad7b9d282ec00a53fee5c0d293f3f425?s=96&#38;d=wavatar" medium="image">
			<media:title type="html">manuelcorpas</media:title>
		</media:content>

		<media:content url="http://corpasfoo.files.wordpress.com/2012/01/screen-shot-2012-01-10-at-11-02-50-am.png" medium="image">
			<media:title type="html">result remapping tool</media:title>
		</media:content>
	</item>
	</channel>
</rss>
