1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43
|
#include "Transcriptome.h"
#include "serviceFuns.cpp"
#include "ReadAnnotations.h"
void Transcriptome::geneFullAlignOverlap_ExonOverIntron(uint nA, Transcript **aAll, int32 strandType, ReadAnnotFeature &annFeat, ReadAnnotFeature &annFeatGeneConcordant)
{
// annFeat.ovType = 0;
if (annFeatGeneConcordant.fSet.size()>0) {//if concordant genes were found for this read, prioritize them over intronic overlap
annFeat = annFeatGeneConcordant;
annFeat.ovType = ReadAnnotFeature::overlapTypes::exonic;
return;
};
//calculate overlap with introns
// annFeat.fSet={};
// annFeat.fAlign = {};
annFeat.fAlign.resize(nA);
for (uint32 iA=0; iA<nA; iA++) {//only includes aligns that are entirely inside genes (?)
Transcript &a = *aAll[iA];
uint64 aS = a.exons[0][EX_G]; //align start
uint64 aE = a.exons[a.nExons-1][EX_G] + a.exons[a.nExons-1][EX_L]-1; //align end
//TODO: for paired end, need to look fo max min
int64 gi1=binarySearch1a<uint64>(aS, geneFull.s, (int32) nGe); //search align-start against gene-starts. Find last gene which still starts to the left of align-start
while (gi1>=0 && geneFull.eMax[gi1]>=aE) {//these genes may overlap this block
if (geneFull.e[gi1]>=aE) {//this gene contains the block: gene-end is to the right of block start
int32 str1 = geneFull.str[gi1]==1 ? a.Str : 1-a.Str;
if (strandType==-1 || strandType==str1) {
annFeat.fSet.insert(geneFull.g[gi1]);
annFeat.fAlign[iA].insert(geneFull.g[gi1]);
};
};
--gi1;// go to the previous gene
};
};
if (annFeat.fSet.size()>0)
annFeat.ovType = ReadAnnotFeature::overlapTypes::intronic;
};
|