File: LookupAnchorDistribution.cpp

package info (click to toggle)
pbseqlib 0~20161219-1
  • links: PTS, VCS
  • area: main
  • in suites: stretch
  • size: 5,924 kB
  • ctags: 5,123
  • sloc: cpp: 82,727; makefile: 305; python: 239; sh: 8
file content (57 lines) | stat: -rw-r--r-- 2,939 bytes parent folder | download | duplicates (2)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
#include "LookupAnchorDistribution.hpp"

int LookupAnchorDistribution(int readLength, int minMatchLength, 
    int accuracy, float &mn, float &sdn, float &mnab, 
    float &sdnab) {

    int kIndex, accIndex, lengthIndex;
    int returnValue = 0;

    // Major index is by accuracy
    if (accuracy < PacBio::AnchorDistributionTable::anchorReadAccuracies[0]) {
        returnValue = -2;
        accuracy    = PacBio::AnchorDistributionTable::anchorReadAccuracies[0];
    }
    else if (accuracy >= PacBio::AnchorDistributionTable::anchorReadAccuracies[1]) {
        returnValue = 2;
        accuracy    = PacBio::AnchorDistributionTable::anchorReadAccuracies[1] - PacBio::AnchorDistributionTable::anchorReadAccuracies[2];
    }

    accIndex = ( ((int)accuracy) - PacBio::AnchorDistributionTable::anchorReadAccuracies[0]) / PacBio::AnchorDistributionTable::anchorReadAccuracies[2];

    // middle index is by k 
    if (minMatchLength < PacBio::AnchorDistributionTable::anchorMinKValues[0]) {
        returnValue = -1; // signal too low
        minMatchLength = PacBio::AnchorDistributionTable::anchorMinKValues[0];
    }
    else if (minMatchLength >= PacBio::AnchorDistributionTable::anchorMinKValues[1]) {
        returnValue = 1; // signal too high
        minMatchLength = PacBio::AnchorDistributionTable::anchorMinKValues[1] - PacBio::AnchorDistributionTable::anchorMinKValues[2]; // max match length
    }

    kIndex = (minMatchLength - PacBio::AnchorDistributionTable::anchorMinKValues[0])/ PacBio::AnchorDistributionTable::anchorMinKValues[2];

    // last index is by read length
    if (readLength < PacBio::AnchorDistributionTable::anchorReadLengths[0]){ 
        returnValue = -3;
        readLength = PacBio::AnchorDistributionTable::anchorReadLengths[0];
    }
    else if (readLength >= PacBio::AnchorDistributionTable::anchorReadLengths[1]) {
        returnValue = 3;
        readLength = PacBio::AnchorDistributionTable::anchorReadLengths[1] - PacBio::AnchorDistributionTable::anchorReadLengths[2]; // max read length
    }

    lengthIndex = (readLength - PacBio::AnchorDistributionTable::anchorReadLengths[0]) / PacBio::AnchorDistributionTable::anchorReadLengths[2];


    int nLengths = (PacBio::AnchorDistributionTable::anchorReadLengths[1] - PacBio::AnchorDistributionTable::anchorReadLengths[0]) / PacBio::AnchorDistributionTable::anchorReadLengths[2];
    int nAnchors = (PacBio::AnchorDistributionTable::anchorMinKValues[1] - PacBio::AnchorDistributionTable::anchorMinKValues[0]) / PacBio::AnchorDistributionTable::anchorMinKValues[2];
    int index = accIndex*(nLengths*nAnchors) + kIndex*nLengths + lengthIndex;

    mn = PacBio::AnchorDistributionTable::meanNumAnchors[index];
    sdn = PacBio::AnchorDistributionTable::sdNumAnchors[index];
    mnab = PacBio::AnchorDistributionTable::meanNumAnchorBases[index];
    sdnab = PacBio::AnchorDistributionTable::sdNumAnchorBases[index];

    return returnValue;
}