File: LookupAnchorDistribution.cpp

package info (click to toggle)
pbseqlib 5.3.1%2Bdfsg-2.1
  • links: PTS, VCS
  • area: main
  • in suites: buster
  • size: 7,136 kB
  • sloc: cpp: 77,246; python: 570; makefile: 312; sh: 111; ansic: 9
file content (63 lines) | stat: -rw-r--r-- 3,158 bytes parent folder | download | duplicates (4)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
#include <alignment/statistics/LookupAnchorDistribution.hpp>

int LookupAnchorDistribution(int readLength, int minMatchLength, int accuracy, float &mn,
                             float &sdn, float &mnab, float &sdnab)
{

    int kIndex, accIndex, lengthIndex;
    int returnValue = 0;

    // Major index is by accuracy
    if (accuracy < PacBio::AnchorDistributionTable::anchorReadAccuracies[0]) {
        returnValue = -2;
        accuracy = PacBio::AnchorDistributionTable::anchorReadAccuracies[0];
    } else if (accuracy >= PacBio::AnchorDistributionTable::anchorReadAccuracies[1]) {
        returnValue = 2;
        accuracy = PacBio::AnchorDistributionTable::anchorReadAccuracies[1] -
                   PacBio::AnchorDistributionTable::anchorReadAccuracies[2];
    }

    accIndex = (((int)accuracy) - PacBio::AnchorDistributionTable::anchorReadAccuracies[0]) /
               PacBio::AnchorDistributionTable::anchorReadAccuracies[2];

    // middle index is by k
    if (minMatchLength < PacBio::AnchorDistributionTable::anchorMinKValues[0]) {
        returnValue = -1;  // signal too low
        minMatchLength = PacBio::AnchorDistributionTable::anchorMinKValues[0];
    } else if (minMatchLength >= PacBio::AnchorDistributionTable::anchorMinKValues[1]) {
        returnValue = 1;  // signal too high
        minMatchLength = PacBio::AnchorDistributionTable::anchorMinKValues[1] -
                         PacBio::AnchorDistributionTable::anchorMinKValues[2];  // max match length
    }

    kIndex = (minMatchLength - PacBio::AnchorDistributionTable::anchorMinKValues[0]) /
             PacBio::AnchorDistributionTable::anchorMinKValues[2];

    // last index is by read length
    if (readLength < PacBio::AnchorDistributionTable::anchorReadLengths[0]) {
        returnValue = -3;
        readLength = PacBio::AnchorDistributionTable::anchorReadLengths[0];
    } else if (readLength >= PacBio::AnchorDistributionTable::anchorReadLengths[1]) {
        returnValue = 3;
        readLength = PacBio::AnchorDistributionTable::anchorReadLengths[1] -
                     PacBio::AnchorDistributionTable::anchorReadLengths[2];  // max read length
    }

    lengthIndex = (readLength - PacBio::AnchorDistributionTable::anchorReadLengths[0]) /
                  PacBio::AnchorDistributionTable::anchorReadLengths[2];

    int nLengths = (PacBio::AnchorDistributionTable::anchorReadLengths[1] -
                    PacBio::AnchorDistributionTable::anchorReadLengths[0]) /
                   PacBio::AnchorDistributionTable::anchorReadLengths[2];
    int nAnchors = (PacBio::AnchorDistributionTable::anchorMinKValues[1] -
                    PacBio::AnchorDistributionTable::anchorMinKValues[0]) /
                   PacBio::AnchorDistributionTable::anchorMinKValues[2];
    int index = accIndex * (nLengths * nAnchors) + kIndex * nLengths + lengthIndex;

    mn = PacBio::AnchorDistributionTable::meanNumAnchors[index];
    sdn = PacBio::AnchorDistributionTable::sdNumAnchors[index];
    mnab = PacBio::AnchorDistributionTable::meanNumAnchorBases[index];
    sdnab = PacBio::AnchorDistributionTable::sdNumAnchorBases[index];

    return returnValue;
}