File: overview.html

package info (click to toggle)
berkeley-express 1.5.3%2Bdfsg-3
  • links: PTS, VCS
  • area: main
  • in suites: bookworm, forky, trixie
  • size: 3,764 kB
  • sloc: cpp: 4,785; sh: 65; makefile: 11
file content (288 lines) | stat: -rw-r--r-- 15,471 bytes parent folder | download | duplicates (4)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" lang="en">

<!--  Version: Multiflex-5.4 / About                     -->
<!--  Type:    Design with sidebar                          -->
<!--  Date:    March 13, 2008                               -->
<!--  Design:  www.1234.info                                -->
<!--  License: Fully open source without restrictions.      -->
<!--           Please keep footer credits with the words    -->
<!--           "Design by 1234.info". Thank you!            -->

<head> 
<script type="text/javascript">

  var _gaq = _gaq || [];
  _gaq.push(['_setAccount', 'UA-25486066-1']);
  _gaq.push(['_trackPageview']);

  (function() {
  })();

</script>
  <meta http-equiv="content-type" content="text/html; charset=utf-8" />
  <meta http-equiv="cache-control" content="no-cache" />
  <meta http-equiv="expires" content="3600" />
  <meta name="revisit-after" content="2 days" />
  <meta name="robots" content="index,follow" />
  <meta name="publisher" content="Your publisher infos here" />
  <meta name="copyright" content="Copyright (c) 2011 Adam Roberts" />
  <meta name="author" content="Designed by www.1234.info / Modified: Adam Roberts" />
  <meta name="distribution" content="global" />
  <meta name="image" content="http://bio.math.berkeley.edu/eXpress/img/logo.png" />
  <meta name="description" content="eXpress is a general quantification tool for target DNA/RNA sequences. While its primary use currently is RNA-Seq it has the potential for applications in many other areas including as allele-specific expression and metgenomics. What makes eXpress different is that it is an online (or streaming) algorithm, meaning it only makes one pass through the data. This allows it to be very light-weight and efficient using a constant amount of memory and time linear in the number of sequenced fragments being processed. Furthermore, it accepts piped SAM/BAM input, allowing users to avoid storing extremely large alignment files. eXpress models fragment biases, fragment lengths, and errors, allowing it to also be one of the most accurate quantification methods available." />
  <meta name="keywords" content="RNA-Seq, Genomics, transcript,quantification" />
  <link rel="stylesheet" type="text/css" media="screen,projection,print" href="./css/mf54_reset.css" />
  <link rel="stylesheet" type="text/css" media="screen,projection,print" href="./css/mf54_grid.css" />
  <link rel="stylesheet" type="text/css" media="screen,projection,print" href="./css/mf54_content.css" />
  <link rel="icon" type="image/x-icon" href="./img/favicon.ico" />
  <title>eXpress &bull; About</title>
   <script language="Javascript">
        logo1=new Image
        logo1.src="img/logo.png"
        logo2=new Image
        logo2.src="img/logo_yellow.png"
 </script>
  <title>eXpress &bull; About</title>
</head>

<!-- Global IE fix to avoid layout crash when single word size wider than column width -->
<!-- Following line MUST remain as a comment to have the proper effect -->
<!--[if IE]><style type="text/css"> body {word-wrap: break-word;}</style><![endif]-->



<body>
  <!-- CONTAINER FOR ENTIRE PAGE -->
  <div class="container">

    <!-- A. HEADER -->         
    <div class="corner-page-top"></div>        
    <div class="header">
      <div class="header-top">
        
        <!-- A.1 SITENAME -->    
        <div class="sitelogo">
        <ul>
            <li><a href="#" onMouseOver="document.logo.src=logo2.src" onMouseOut="document.logo.src=logo1.src"><img name="logo" src="img/logo.png"/></a></li>
        </ul>
        </div>
        <div class="sitename">
          <h1><a href="#">eXpress</a></h1> 
          &nbsp;
          <h2><i>Streaming</i> quantification for high-throughput sequencing</h2>
        </div>
    
        <!-- A.2 BUTTON NAVIGATION -->
        <div class="navbutton">
          <ul>
            <li><a href="http://www.berkeley.edu"><img src="img/berkeley_seal.gif"/></a></li>
          </ul>
        </div>
      </div>

      <!-- A.4 BREADCRUMB and SEARCHFORM -->
      <div class="header-bottom">

		

        <!-- Search form -->    
<div class="searchform" id="cse-search-form" style="padding-top:4px; width:30%;">Loading</div>
<script type="text/javascript"> 
  }, true);
</script>
<link rel="stylesheet" href="css/googlesearch.css" type="text/css" />

   </div>
    </div>      
    <div class="corner-page-bottom"></div>    
    
    <!-- B. NAVIGATION BAR -->
    <div class="corner-page-top"></div>        
    <div class="navbar">
	
      <!-- Navigation item -->
      <ul>
        <li><a href="index.html">Home</a></li>
      </ul>
      <!-- Navigation item -->
      <ul>
        <li><a href="overview.html">About</a></li>
      </ul>            
      <!-- Navigation item -->
      <ul>
        <li><a href="#">Download<!--[if IE 7]><!--></a><!--<![endif]-->
          <!--[if lte IE 6]><table><tr><td><![endif]-->
            <ul>
              <li><a href=downloads/express-1.5.1/express-1.5.1-macosx_x86_64.tgz onClick="_gaq.push(['_trackEvent', 'Downloads', 'Mac', 'About']);" target="_blank">Mac OS X (64-bit)</a></li>
              <li><a href=downloads/express-1.5.1/express-1.5.1-linux_x86_64.tgz onClick="_gaq.push(['_trackEvent', 'Downloads', 'Linux', 'About']);" target="_blank">Linux (64-bit)</a></li>
              <li><a href=downloads/express-1.5.1/express-1.5.1-win32_x86_64.zip onClick="_gaq.push(['_trackEvent', 'Downloads', 'Windows', 'About']);" target="_blank">Windows (64-bit)</a></li>
              <li><a href=downloads onClick="_gaq.push(['_trackEvent', 'Downloads', 'Previous','About']);">Previous Versions</a></li>
              <li><a href=downloads/express-1.5.1/express-1.5.1-src.tgz onClick="_gaq.push(['_trackEvent', 'Downloads', 'Source', 'About']);" target="_blank">Source Code</a></li>
            </ul>
          <!--[if lte IE 6]></td></tr></table></a><![endif]-->
        </li>
      </ul>                  
      <ul>
        <li><a href="tutorial.html">Getting Started</a></li>
      </ul>
      <ul>
        <li><a href="https://github.com/adarob/eXpress">Source</a></li>
      </ul>
      <ul>
        <li><a href="manual.html">Manual</a></li>
      </ul>
      <ul>
        <li><a href="faq.html">FAQ</a></li>
      </ul>
      </div>
  
    <!-- C. MAIN SECTION -->      
    <div class="main">
    	<h1 class="pagetitle">About</h1>

      <!-- C.1 CONTENT -->
      <div class="content">

        <!-- CONTENT CELL -->                
        <div class="corner-content-1col-top"></div>                        
        <div class="content-1col-nobox">
        <h1 id="description">Description</h1>
			<p>eXpress is a streaming tool for quantifying the abundances of a set of target sequences from sampled subsequences. Example applications include transcript-level RNA-Seq quantification, allele-specific/haplotype expression analysis (from RNA-Seq), transcription factor binding quantification in ChIP-Seq, and analysis of metagenomic data. It is based on an online-EM
        algorithm [<a href="#ref1">1</a>] that results in space (memory) requirements
        proportional to the total size of the target sequences  and time
        requirements that are proportional to the number of sampled
        fragments. Thus, in applications such as RNA-Seq, eXpress can accurately quantify much larger
        samples than other currently available
        tools greatly reducing computing infrastructure requirements. eXpress can be used to build lightweight
			high-throughput sequencing  processing pipelines when coupled with
			a streaming aligner (such as Bowtie), as
			output can be piped directly into eXpress, effectively eliminating the need to store read alignments in memory or on disk.</p>

	  <p>In an analysis of the performance of eXpress for RNA-Seq data, we have observed that this efficiency does not come
			at a cost of accuracy. eXpress is more accurate
			than other available tools, even when limited
			to smaller datasets that do not require such
			efficiency [<a href="#ref2">2</a>]. Moreover, like the <a href=http://cufflinks.cbcb.umd.edu>Cufflinks</a>
			program [<a href="#ref3">3</a>], eXpress can be used to
			estimate transcript abundances in
			multi-isoform genes. eXpress is also able
			to resolve multi-mappings of reads across gene
			families, and does not require a reference
			genome so that it can be used in conjunction
			with <i>de novo</i> assemblers such as <a href=http://trinityrnaseq.sourceforge.net/>Trinity</a>, <a
        href=http://www.ebi.ac.uk/~zerbino/oases/>Oases</a>, or <a
        href=http://www.bcgsc.ca/platform/bioinfo/software/trans-abyss>Trans-ABySS</a>. The underlying model is based on previously described probabilistic
			models developed for RNA-Seq [<a href="#ref4">4</a>] but is applicable to other settings where target sequences are sampled, and includes
			parameters for fragment length distributions,
			errors in reads, and sequence-specific fragment bias [<a href="#ref5">5</a>].
	  </p>

			<p>eXpress can be used to resolve ambiguous mappings in other high-throughput sequencing based applications. The only required inputs to eXpress are a set of target sequences and a set of sequenced fragments multiply-aligned to them. While these target sequences will often be gene isoforms, they need not be. Haplotypes can be used as the reference for allele-specific expression analysis, binding regions for ChIP-Seq, or target genomes in metagenomics experiments. eXpress is useful in any analysis where reads multi-map to sequences that differ in abundance.</p>
      			<p>&rarr; <a href="#top">Back to top.</a></p>
      	</div>      

        <div class="corner-content-1col-bottom"></div>                               
        <!-- CONTENT CELL -->                
        <div class="corner-content-1col-top"></div>                        
        <div class="content-1col-nobox">
		  	<h1 id="features">Features</h1>
		  	<ul>
		  	<li>Time proportional to number of reads, memory proportional to transcriptome size.</li>
		  	<li>Maximum of 3 free processor cores required (2 without bias
		  	correction). Try it on your laptop!</li>
		  	<li>Outputs <a href="http://cufflinks.cbcb.umd.edu/howitworks.html#hqua">FPKM</a>, estimated counts, and posterior count distributions for differential analysis.</li>
		  	<li>Supports alignments with unlimited multi-mappings and errors.</li>
		  	<li>Transcript-level abundance estimation when used for RNA-Seq.</li>
			<li>Can be used for allele-specific expression estimates in RNA-Seq.</li>
		    <li>Corrects for sequence-specific fragment biases.</li>
   		    <li>Learns first-order Markov model for sequencing errors for use in probablistic read assignment.</li>
	       	<li>Models indels in reads.</li>
   		    <li>Learns fragment length distribution for use in probablistic assignment of paired-end reads.</li>
   		    <li>Supports both directional and non-directional sequencing.</li>
		  	<li>Written in C++ and runs on Mac, Linux, and Windows.</li>
		  	</ul>
      			<p>&rarr; <a href="#top">Back to top.</a></p>
      	</div>      

        <div class="corner-content-1col-bottom"></div>                               
        <!-- CONTENT CELL -->                
        <div class="corner-content-1col-top"></div>                        
        <div class="content-1col-nobox">

			<h1 id="methods">Methods</h1>
			<p>A complete description of the eXpress method can be found in the manuscript [<a href="ref1">2</a>].
			      		<p>&rarr; <a href="#top">Back to top.</a></p>	
			      </div>      

        <div class="corner-content-1col-bottom"></div>                               
        <!-- CONTENT CELL -->                
        <div class="corner-content-1col-top"></div>                        
        <div class="content-1col-nobox">
			<h1 id="references">References</h1>
	  		<ol>
	  	  <li id="ref1">Cappé O and Moulines E. (2009).
	  	  <b>On-line expectation–maximization algorithm for latent data models.</b>
	  	  <i>Journal of the Royal Statistical Society.</i>
	  	  <br />&rarr;<a href=http://http://onlinelibrary.wiley.com/doi/10.1111/j.1467-9868.2009.00698.x/abstract>doi:10.1111/j.1467-9868.2009.00698.x</a></li>
	  		<li id="ref2">Roberts A and Pachter L (2012).
	  		<b>Streaming fragment assignment for real-time analysis of sequencing experiments.</b>
	  		<i>Nature Methods.</i>
	  		<br />&rarr;<a href=http://dx.doi.org/10.1038/nmeth.2251>doi:10.1038/nmeth.2251</a></li>
	  	  <li id="ref3">Trapnell C, Williams BA, Pertea G, Mortazavi AM, Kwan G, van Baren MJ, Salzberg SL, Wold B,&nbsp; Pachter L (2010).
	  	  <b>Transcript assembly and quantification by RNA-Seq reveals unannotated transcripts and isoform switching during cell differentiation.</b>
	  	  <i>Nature Biotechnology.</i>
	  	  <br />&rarr;<a href=http://dx.doi.org/10.1038/nbt.1621>doi:10.1038/nbt.162</a></li>
	  	  <li id="ref4">Pachter, L (2011).
	  	  <b>Models for transcript quantification from RNA-Seq.</b>
	  	  <i>Submitted.</i>
          <br />&rarr;<a href="http://arxiv.org/abs/1104.3889">arXiv:1104.3889v2</a></font></li>
	  	  </li>
         <li id="ref5">Roberts A, Trapnell C, Donaghey J, Rinn JL, Pachter L (2011).
          <b>Improving RNA-Seq expression estimates by correcting for fragment bias.</b>
          <i>Genome Biology.</i>
          <br />&rarr;<a href="http://genomebiology.com/2011/12/3/R22/abstract">doi:10.1186/gb-2011-12-3-r22</a></font></li>
      	</ol>
      		<p>&rarr; <a href="#top">Back to top.</a></p>
      </div>      

        <div class="corner-content-1col-bottom"></div>                               
      </div>
                
       <!-- C.2 SUBCONTENT -->
      <div class="subcontent">
      
         <!-- SUBCONTENT CELL -->
        <div class="corner-subcontent-top"></div>                        
        <div class="subcontent-box">
          <h1 class="menu">Outline</h1> 
          <div class="sidemenu1">
          <!-- CONTENT CELL -->                
 		  <ul>
			  <li><a href="#description">Description</a></li>
			  <li><a href="#features">Features</a></li>
			  <li><a href="#method">Method</a></li>
			  <li><a href="#references">References</a></li>

		  </ul>
          </div> 
          </div>
        <div class="corner-subcontent-bottom"></div> 
	</div>
 	 </div>
      
    <!-- D. FOOTER -->      
    <div class="footer">
      <p>Copyright &copy; 2011 Adam Roberts&nbsp;&nbsp;|&nbsp;&nbsp;All Rights Reserved</p>
      <p class="credits">Design by <a href="http://1234.info/" title="Designer Homepage">1234.info</a> | Modified by <a href="http://cs.berkeley.edu/~adarob/">Adam Roberts</a> | <a href="http://validator.w3.org/check?uri=referer" title="Validate XHTML code">XHTML 1.0</a> | <a href="http://jigsaw.w3.org/css-validator/" title="Validate CSS code">CSS 2.0</a></p>
      <br />
      <p>The eXpress project was funded in part by an NSF graduate fellowship to Adam Roberts and NIH grant 1R01HG006129-01</p>
    </div>
    <div class="corner-page-bottom"></div>        
  </div> 
  
</body>
</html>