1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288
|
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" lang="en">
<!-- Version: Multiflex-5.4 / About -->
<!-- Type: Design with sidebar -->
<!-- Date: March 13, 2008 -->
<!-- Design: www.1234.info -->
<!-- License: Fully open source without restrictions. -->
<!-- Please keep footer credits with the words -->
<!-- "Design by 1234.info". Thank you! -->
<head>
<script type="text/javascript">
var _gaq = _gaq || [];
_gaq.push(['_setAccount', 'UA-25486066-1']);
_gaq.push(['_trackPageview']);
(function() {
})();
</script>
<meta http-equiv="content-type" content="text/html; charset=utf-8" />
<meta http-equiv="cache-control" content="no-cache" />
<meta http-equiv="expires" content="3600" />
<meta name="revisit-after" content="2 days" />
<meta name="robots" content="index,follow" />
<meta name="publisher" content="Your publisher infos here" />
<meta name="copyright" content="Copyright (c) 2011 Adam Roberts" />
<meta name="author" content="Designed by www.1234.info / Modified: Adam Roberts" />
<meta name="distribution" content="global" />
<meta name="image" content="http://bio.math.berkeley.edu/eXpress/img/logo.png" />
<meta name="description" content="eXpress is a general quantification tool for target DNA/RNA sequences. While its primary use currently is RNA-Seq it has the potential for applications in many other areas including as allele-specific expression and metgenomics. What makes eXpress different is that it is an online (or streaming) algorithm, meaning it only makes one pass through the data. This allows it to be very light-weight and efficient using a constant amount of memory and time linear in the number of sequenced fragments being processed. Furthermore, it accepts piped SAM/BAM input, allowing users to avoid storing extremely large alignment files. eXpress models fragment biases, fragment lengths, and errors, allowing it to also be one of the most accurate quantification methods available." />
<meta name="keywords" content="RNA-Seq, Genomics, transcript,quantification" />
<link rel="stylesheet" type="text/css" media="screen,projection,print" href="./css/mf54_reset.css" />
<link rel="stylesheet" type="text/css" media="screen,projection,print" href="./css/mf54_grid.css" />
<link rel="stylesheet" type="text/css" media="screen,projection,print" href="./css/mf54_content.css" />
<link rel="icon" type="image/x-icon" href="./img/favicon.ico" />
<title>eXpress • About</title>
<script language="Javascript">
logo1=new Image
logo1.src="img/logo.png"
logo2=new Image
logo2.src="img/logo_yellow.png"
</script>
<title>eXpress • About</title>
</head>
<!-- Global IE fix to avoid layout crash when single word size wider than column width -->
<!-- Following line MUST remain as a comment to have the proper effect -->
<!--[if IE]><style type="text/css"> body {word-wrap: break-word;}</style><![endif]-->
<body>
<!-- CONTAINER FOR ENTIRE PAGE -->
<div class="container">
<!-- A. HEADER -->
<div class="corner-page-top"></div>
<div class="header">
<div class="header-top">
<!-- A.1 SITENAME -->
<div class="sitelogo">
<ul>
<li><a href="#" onMouseOver="document.logo.src=logo2.src" onMouseOut="document.logo.src=logo1.src"><img name="logo" src="img/logo.png"/></a></li>
</ul>
</div>
<div class="sitename">
<h1><a href="#">eXpress</a></h1>
<h2><i>Streaming</i> quantification for high-throughput sequencing</h2>
</div>
<!-- A.2 BUTTON NAVIGATION -->
<div class="navbutton">
<ul>
<li><a href="http://www.berkeley.edu"><img src="img/berkeley_seal.gif"/></a></li>
</ul>
</div>
</div>
<!-- A.4 BREADCRUMB and SEARCHFORM -->
<div class="header-bottom">
<!-- Search form -->
<div class="searchform" id="cse-search-form" style="padding-top:4px; width:30%;">Loading</div>
<script type="text/javascript">
}, true);
</script>
<link rel="stylesheet" href="css/googlesearch.css" type="text/css" />
</div>
</div>
<div class="corner-page-bottom"></div>
<!-- B. NAVIGATION BAR -->
<div class="corner-page-top"></div>
<div class="navbar">
<!-- Navigation item -->
<ul>
<li><a href="index.html">Home</a></li>
</ul>
<!-- Navigation item -->
<ul>
<li><a href="overview.html">About</a></li>
</ul>
<!-- Navigation item -->
<ul>
<li><a href="#">Download<!--[if IE 7]><!--></a><!--<![endif]-->
<!--[if lte IE 6]><table><tr><td><![endif]-->
<ul>
<li><a href=downloads/express-1.5.1/express-1.5.1-macosx_x86_64.tgz onClick="_gaq.push(['_trackEvent', 'Downloads', 'Mac', 'About']);" target="_blank">Mac OS X (64-bit)</a></li>
<li><a href=downloads/express-1.5.1/express-1.5.1-linux_x86_64.tgz onClick="_gaq.push(['_trackEvent', 'Downloads', 'Linux', 'About']);" target="_blank">Linux (64-bit)</a></li>
<li><a href=downloads/express-1.5.1/express-1.5.1-win32_x86_64.zip onClick="_gaq.push(['_trackEvent', 'Downloads', 'Windows', 'About']);" target="_blank">Windows (64-bit)</a></li>
<li><a href=downloads onClick="_gaq.push(['_trackEvent', 'Downloads', 'Previous','About']);">Previous Versions</a></li>
<li><a href=downloads/express-1.5.1/express-1.5.1-src.tgz onClick="_gaq.push(['_trackEvent', 'Downloads', 'Source', 'About']);" target="_blank">Source Code</a></li>
</ul>
<!--[if lte IE 6]></td></tr></table></a><![endif]-->
</li>
</ul>
<ul>
<li><a href="tutorial.html">Getting Started</a></li>
</ul>
<ul>
<li><a href="https://github.com/adarob/eXpress">Source</a></li>
</ul>
<ul>
<li><a href="manual.html">Manual</a></li>
</ul>
<ul>
<li><a href="faq.html">FAQ</a></li>
</ul>
</div>
<!-- C. MAIN SECTION -->
<div class="main">
<h1 class="pagetitle">About</h1>
<!-- C.1 CONTENT -->
<div class="content">
<!-- CONTENT CELL -->
<div class="corner-content-1col-top"></div>
<div class="content-1col-nobox">
<h1 id="description">Description</h1>
<p>eXpress is a streaming tool for quantifying the abundances of a set of target sequences from sampled subsequences. Example applications include transcript-level RNA-Seq quantification, allele-specific/haplotype expression analysis (from RNA-Seq), transcription factor binding quantification in ChIP-Seq, and analysis of metagenomic data. It is based on an online-EM
algorithm [<a href="#ref1">1</a>] that results in space (memory) requirements
proportional to the total size of the target sequences and time
requirements that are proportional to the number of sampled
fragments. Thus, in applications such as RNA-Seq, eXpress can accurately quantify much larger
samples than other currently available
tools greatly reducing computing infrastructure requirements. eXpress can be used to build lightweight
high-throughput sequencing processing pipelines when coupled with
a streaming aligner (such as Bowtie), as
output can be piped directly into eXpress, effectively eliminating the need to store read alignments in memory or on disk.</p>
<p>In an analysis of the performance of eXpress for RNA-Seq data, we have observed that this efficiency does not come
at a cost of accuracy. eXpress is more accurate
than other available tools, even when limited
to smaller datasets that do not require such
efficiency [<a href="#ref2">2</a>]. Moreover, like the <a href=http://cufflinks.cbcb.umd.edu>Cufflinks</a>
program [<a href="#ref3">3</a>], eXpress can be used to
estimate transcript abundances in
multi-isoform genes. eXpress is also able
to resolve multi-mappings of reads across gene
families, and does not require a reference
genome so that it can be used in conjunction
with <i>de novo</i> assemblers such as <a href=http://trinityrnaseq.sourceforge.net/>Trinity</a>, <a
href=http://www.ebi.ac.uk/~zerbino/oases/>Oases</a>, or <a
href=http://www.bcgsc.ca/platform/bioinfo/software/trans-abyss>Trans-ABySS</a>. The underlying model is based on previously described probabilistic
models developed for RNA-Seq [<a href="#ref4">4</a>] but is applicable to other settings where target sequences are sampled, and includes
parameters for fragment length distributions,
errors in reads, and sequence-specific fragment bias [<a href="#ref5">5</a>].
</p>
<p>eXpress can be used to resolve ambiguous mappings in other high-throughput sequencing based applications. The only required inputs to eXpress are a set of target sequences and a set of sequenced fragments multiply-aligned to them. While these target sequences will often be gene isoforms, they need not be. Haplotypes can be used as the reference for allele-specific expression analysis, binding regions for ChIP-Seq, or target genomes in metagenomics experiments. eXpress is useful in any analysis where reads multi-map to sequences that differ in abundance.</p>
<p>→ <a href="#top">Back to top.</a></p>
</div>
<div class="corner-content-1col-bottom"></div>
<!-- CONTENT CELL -->
<div class="corner-content-1col-top"></div>
<div class="content-1col-nobox">
<h1 id="features">Features</h1>
<ul>
<li>Time proportional to number of reads, memory proportional to transcriptome size.</li>
<li>Maximum of 3 free processor cores required (2 without bias
correction). Try it on your laptop!</li>
<li>Outputs <a href="http://cufflinks.cbcb.umd.edu/howitworks.html#hqua">FPKM</a>, estimated counts, and posterior count distributions for differential analysis.</li>
<li>Supports alignments with unlimited multi-mappings and errors.</li>
<li>Transcript-level abundance estimation when used for RNA-Seq.</li>
<li>Can be used for allele-specific expression estimates in RNA-Seq.</li>
<li>Corrects for sequence-specific fragment biases.</li>
<li>Learns first-order Markov model for sequencing errors for use in probablistic read assignment.</li>
<li>Models indels in reads.</li>
<li>Learns fragment length distribution for use in probablistic assignment of paired-end reads.</li>
<li>Supports both directional and non-directional sequencing.</li>
<li>Written in C++ and runs on Mac, Linux, and Windows.</li>
</ul>
<p>→ <a href="#top">Back to top.</a></p>
</div>
<div class="corner-content-1col-bottom"></div>
<!-- CONTENT CELL -->
<div class="corner-content-1col-top"></div>
<div class="content-1col-nobox">
<h1 id="methods">Methods</h1>
<p>A complete description of the eXpress method can be found in the manuscript [<a href="ref1">2</a>].
<p>→ <a href="#top">Back to top.</a></p>
</div>
<div class="corner-content-1col-bottom"></div>
<!-- CONTENT CELL -->
<div class="corner-content-1col-top"></div>
<div class="content-1col-nobox">
<h1 id="references">References</h1>
<ol>
<li id="ref1">CappeĚ O and Moulines E. (2009).
<b>On-line expectationâmaximization algorithm for latent data models.</b>
<i>Journal of the Royal Statistical Society.</i>
<br />→<a href=http://http://onlinelibrary.wiley.com/doi/10.1111/j.1467-9868.2009.00698.x/abstract>doi:10.1111/j.1467-9868.2009.00698.x</a></li>
<li id="ref2">Roberts A and Pachter L (2012).
<b>Streaming fragment assignment for real-time analysis of sequencing experiments.</b>
<i>Nature Methods.</i>
<br />→<a href=http://dx.doi.org/10.1038/nmeth.2251>doi:10.1038/nmeth.2251</a></li>
<li id="ref3">Trapnell C, Williams BA, Pertea G, Mortazavi AM, Kwan G, van Baren MJ, Salzberg SL, Wold B, Pachter L (2010).
<b>Transcript assembly and quantification by RNA-Seq reveals unannotated transcripts and isoform switching during cell differentiation.</b>
<i>Nature Biotechnology.</i>
<br />→<a href=http://dx.doi.org/10.1038/nbt.1621>doi:10.1038/nbt.162</a></li>
<li id="ref4">Pachter, L (2011).
<b>Models for transcript quantification from RNA-Seq.</b>
<i>Submitted.</i>
<br />→<a href="http://arxiv.org/abs/1104.3889">arXiv:1104.3889v2</a></font></li>
</li>
<li id="ref5">Roberts A, Trapnell C, Donaghey J, Rinn JL, Pachter L (2011).
<b>Improving RNA-Seq expression estimates by correcting for fragment bias.</b>
<i>Genome Biology.</i>
<br />→<a href="http://genomebiology.com/2011/12/3/R22/abstract">doi:10.1186/gb-2011-12-3-r22</a></font></li>
</ol>
<p>→ <a href="#top">Back to top.</a></p>
</div>
<div class="corner-content-1col-bottom"></div>
</div>
<!-- C.2 SUBCONTENT -->
<div class="subcontent">
<!-- SUBCONTENT CELL -->
<div class="corner-subcontent-top"></div>
<div class="subcontent-box">
<h1 class="menu">Outline</h1>
<div class="sidemenu1">
<!-- CONTENT CELL -->
<ul>
<li><a href="#description">Description</a></li>
<li><a href="#features">Features</a></li>
<li><a href="#method">Method</a></li>
<li><a href="#references">References</a></li>
</ul>
</div>
</div>
<div class="corner-subcontent-bottom"></div>
</div>
</div>
<!-- D. FOOTER -->
<div class="footer">
<p>Copyright © 2011 Adam Roberts | All Rights Reserved</p>
<p class="credits">Design by <a href="http://1234.info/" title="Designer Homepage">1234.info</a> | Modified by <a href="http://cs.berkeley.edu/~adarob/">Adam Roberts</a> | <a href="http://validator.w3.org/check?uri=referer" title="Validate XHTML code">XHTML 1.0</a> | <a href="http://jigsaw.w3.org/css-validator/" title="Validate CSS code">CSS 2.0</a></p>
<br />
<p>The eXpress project was funded in part by an NSF graduate fellowship to Adam Roberts and NIH grant 1R01HG006129-01</p>
</div>
<div class="corner-page-bottom"></div>
</div>
</body>
</html>
|