/* * Copyright 2014 Brian Tjaden * * This file is part of Rockhopper. * * Rockhopper is free software: you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation, either version 3 of the License, or * any later version. * * Rockhopper is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * (in the file gpl.txt) along with Rockhopper. * If not, see www.gnu.org/licenses/. */ import java.util.ArrayList; import java.util.Random; import java.util.concurrent.atomic.AtomicIntegerArray; /** * An instance of the DeNovoTranscripts class represents * a collection of de novo assembled transcripts. * * NOTE(review): in this copy of the file the line breaks have been collapsed and * text that sat between angle brackets (generic type arguments, parts of loop * conditions, and in places whole statements and method headers) is missing, * so several members below are incomplete as shown. Restore the missing text * from the original Rockhopper source before compiling or changing behavior. */ public class DeNovoTranscripts { /******************************************** ********** Instance Variables ********** ********************************************/ /* Transcripts held by this collection; assigned by both constructors. */ private ArrayList transcripts; /* NOTE(review): the element type of this list was lost (a stray closing bracket remains); presumably a nested list - confirm against the original source. */ private ArrayList> upperQuartiles; private ArrayList minDiffExpressionLevels; // Min diff expression level per condition /***************************************** ********** Class Variables ********** *****************************************/ public static int[] avgLengthOfReads; // Avg length of mapping reads in each file public static int[] numReads; // Total reads in each file public static int[] numMappingReads; // Reads mapping to transcripts in each file public static ArrayList> totalReads; // Total number of nt reads in each replicate private static Random rand = new Random(); // Random number generator /************************************** ********** CONSTRUCTORS ********** **************************************/ /** * Builds the transcript collection from an index. * Copies the index's average read lengths, read counts, mapping-read counts * and total reads into the class-level static fields (replacing whatever they * held before), derives the transcripts from the index's sequence and read * counts via determineTranscripts, and then calls computeExpression. * * @param bwtIndex index supplying the read statistics, sequence and read counts */ public DeNovoTranscripts(DeNovoIndex bwtIndex) { DeNovoTranscripts.avgLengthOfReads = bwtIndex.getAvgLengthOfReads(); DeNovoTranscripts.numReads = 
bwtIndex.getNumReads(); DeNovoTranscripts.numMappingReads = bwtIndex.getNumMappingReads(); DeNovoTranscripts.totalReads = bwtIndex.getTotalReads(); transcripts = determineTranscripts(bwtIndex.sequence, bwtIndex.readCounts); computeExpression(); } /** * Used when reading transcripts in from compressed file. * The supplied list is stored by reference (it is not copied). This constructor * does not set the static read statistics and does not call computeExpression. * * @param transcripts list of transcripts to wrap */ public DeNovoTranscripts(ArrayList transcripts) { this.transcripts = transcripts; } /************************************************* ********** Public Instance Methods ********** *************************************************/ /** * Returns the number of transcripts in this collection. */ public int getNumTranscripts() { return transcripts.size(); } /** * Returns the transcript stored at index i of the internal list. * * @param i index into the internal transcript list */ public DeNovoTranscript getTranscript(int i) { return transcripts.get(i); } /** * Returns the average transcript length. * The lengths are summed in a long and divided with integer division, so the * result is truncated rather than rounded. Returns 0 when the collection is empty. */ public int getAverageTranscriptLength() { long length = 0; if (transcripts.size() == 0) return 0; for (DeNovoTranscript transcript : transcripts) length += transcript.length(); return (int)(length/transcripts.size()); } /** * Returns the median transcript length. * Copies every transcript length into a new list and passes it to * Misc.select_Long together with size/2 (presumably the rank to select - * confirm against Misc), then narrows the result to int. * NOTE(review): unlike getAverageTranscriptLength there is no guard for an * empty collection here - confirm how Misc.select_Long behaves on an empty list. */ public int getMedianTranscriptLength() { ArrayList a = new ArrayList(transcripts.size()); for (DeNovoTranscript transcript : transcripts) a.add((long)transcript.length()); return (int)Misc.select_Long(a, a.size()/2); } /** * Returns the sum of all transcript lengths. 
*/ public long getTotalAssembledBases() { long sum = 0; for (DeNovoTranscript transcript : transcripts) sum += transcript.length(); return sum; } /** * NOTE(review): only the opening of this method survives (it creates a * StringBuilder and starts a loop over z). The rest of its body is missing, and * the text that follows the loop header is the tail of different code that * fills minDiffExpressionLevels - restore both from the original source. */ public String getTranscriptSequences() { StringBuilder sb = new StringBuilder(); for (int z=0; z(Assembler.conditionFiles.size()); for (int i=0; i= THRESHOLD) foundThreshold = false; } if (foundThreshold) break; minDiffExpressionLevel++; } minDiffExpressionLevels.add(minDiffExpressionLevel); } } /** * Builds a text table in a StringBuilder; the header begins with the columns * "Sequence" and "Length" separated by a tab. * NOTE(review): the rest of the header loop and the remainder of the method * are missing from this copy. * * @param labels presumably one label per additional column - confirm, the code using it is not visible */ public String toString(String[] labels) { // Include Header StringBuilder sb = new StringBuilder(); sb.append("Sequence" + "\t" + "Length"); for (int i=0; i /* NOTE(review): text is missing at this point; what follows is the tail of the declaration of determineTranscripts. In the visible code start and end track the current candidate region (-1 means none, end is inclusive), and a region is added as a new DeNovoTranscript only when start is set and end-start+1 is at least Assembler.minTranscriptLength. The loop conditions and the comparisons against Assembler.MIN_READS_MAPPING are partly lost. */ determineTranscripts(String allSequences, AtomicIntegerArray[] readCounts) { ArrayList transcripts = new ArrayList(); int start = -1; // -1 is sentinel indicating no transcript int end = -1; // inclusive long[] readCounts_nts = new long[readCounts.length]; for (int i=0; i= 0) && (end-start+1 >= Assembler.minTranscriptLength)) transcripts.add(new DeNovoTranscript(allSequences.substring(start, end+1), readCounts_nts)); start = -1; end = -1; for (int j=0; j= Assembler.MIN_READS_MAPPING)) { // Start of new expressed transcript start = i; for (int j=0; j= Assembler.MIN_READS_MAPPING) { // Within expressed transcript end = i; for (int j=0; j= 0) && (end-start+1 >= Assembler.minTranscriptLength)) transcripts.add(new DeNovoTranscript(allSequences.substring(start, end+1), readCounts_nts)); start = -1; end = -1; for (int j=0; j>(Assembler.conditionFiles.size()); for (int i=0; i(files.length)); for (int j=0; j expressions = new ArrayList(transcripts.size()); for (int k=0; k 0) && (files.length > 1)) { // We have replicates for (DeNovoTranscript transcript : transcripts) transcript.lowess[x][y] = transcript.lowess[0][y]; continue; } */ /* (x,y) lowess is NOT the same as (y,x) lowess String[] files2 = Assembler.conditionFiles.get(y).split(","); if ((x > y) && (files.length == 1) && (files2.length == 1)) { // Already computed lowess[y][x], which is same as lowess[x][y] for (DeNovoTranscript 
transcript : transcripts) transcript.lowess[x][y] = transcript.lowess[y][x]; continue; } */ /* NOTE(review): the statements from here through the Lowess call are a fragment; the loops that declare x and y are not visible in this copy. The visible part collects each transcript's getMean(x) and variances[x][y] into two lists and passes them to Lowess.lowess. */ double b = 0.0; // Bias correction term for (int j=0; j expression = new ArrayList(); ArrayList variance = new ArrayList(); for (DeNovoTranscript transcript : transcripts) { expression.add(transcript.getMean(x)); variance.add(transcript.variances[x][y]); } // Perform Lowess computation ArrayList lowessVariance = Lowess.lowess(expression, variance); // Uncomment to output data for Lowess graph to StdOut //System.out.println("Mean" + "\t" + "Variance" + "\t" + "Lowess"); //for (int k=0; k /* NOTE(review): text is missing at this point; what follows is the tail of a merge step whose header is not visible. For each output slot k it takes the next element of a2 when a1 is exhausted, of a1 when a2 is exhausted, and otherwise the smaller of a1[i] and a2[j] (a1 wins ties), copying the matching b1 or b2 element into b alongside. */ = a1.length) { a[k] = a2[j]; b[k] = b2[j]; j++; } else if (j >= a2.length) { a[k] = a1[i]; b[k] = b1[i]; i++; } else if (a1[i] <= a2[j]) { a[k] = a1[i]; b[k] = b1[i]; i++; } else { a[k] = a2[j]; b[k] = b2[j]; j++; } } } }