File: SeqUtilsImpl.hpp

package info (click to toggle)
pbseqlib 5.3.4%2Bdfsg-3
  • links: PTS, VCS
  • area: main
  • in suites: bullseye
  • size: 7,020 kB
  • sloc: cpp: 77,246; python: 331; sh: 103; makefile: 42
file content (44 lines) | stat: -rw-r--r-- 975 bytes parent folder | download | duplicates (3)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
#include <cstdint>
#include <iostream>
#include <vector>

#include <pbdata/DNASequence.hpp>
#include <pbdata/NucConversion.hpp>
#include <pbdata/SeqUtils.hpp>
#include <pbdata/utils.hpp>

template <typename T_Sequence>
int OnlyACTG(T_Sequence &seq)
{
    DNALength p;
    for (p = 0; p < seq.length; p++) {
        if (ThreeBit[seq.seq[p]] > 3) return 0;
    }
    return 1;
}

// Counts the positions of a sequence that hold a masked symbol.
//
// A position counts as masked when its character lies in the range
// 'a'..'z' or is exactly the upper-case 'N'.
//
// seq      object exposing an indexable `seq` member and a `length` member.
// returns  number of masked positions among the first `seq.length` entries.
template <typename T_Sequence>
DNALength CountMasked(T_Sequence &seq)
{
    DNALength maskedTotal = 0;
    DNALength pos = 0;
    while (pos < seq.length) {
        const auto symbol = seq.seq[pos];
        // Lower-case means: not below 'a' and not above 'z'.
        const bool isLowerCase = not(symbol < 'a' or symbol > 'z');
        if (isLowerCase or symbol == 'N') {
            ++maskedTotal;
        }
        ++pos;
    }
    return maskedTotal;
}

// Counts the positions of a sequence that hold an upper-case A, C, G or T.
//
// Every other character (lower-case letters, 'N', anything else) is ignored.
//
// seq      object exposing an indexable `seq` member and a `length` member.
// returns  number of matching positions among the first `seq.length` entries.
template <typename T_Sequence>
int CountNotMasked(T_Sequence &seq)
{
    int unmaskedTotal = 0;
    unsigned pos = 0;
    while (pos < seq.length) {
        const auto symbol = seq.seq[pos];
        const bool isUpperBase =
            symbol == 'A' or symbol == 'C' or symbol == 'G' or symbol == 'T';
        unmaskedTotal += isUpperBase ? 1 : 0;
        ++pos;
    }
    return unmaskedTotal;
}