1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122
|
#ifndef SEQEXT_H
#define SEQEXT_H 1
#include "Common/Options.h" // for opt::colourSpace
#include "Common/Sequence.h" // for codeToBase
#include <cassert>
#include <ostream>
#include <stdint.h>
/** The number of distinct base codes; SeqExt::NUM is defined from this. */
static const unsigned NUM_BASES = 4;
/** Complement a single base code.
 * Reversing one base changes nothing, so only the complement is taken.
 * When opt::colourSpace is set, the base is returned unchanged.
 */
static inline uint8_t reverseComplement(uint8_t base)
{
	if (opt::colourSpace)
		return base;

	// Flip every bit, then keep only the low two bits of the result.
	const int lowTwoBits = 0x3;
	const int flipped = ~base;
	return flipped & lowTwoBits;
}
/** The adjacent vertices of a Kmer.
 * The adjacency is stored as a bit set in a single byte: bit i is set
 * when the symbol with code i is an extension.
 */
class SeqExt
{
public:
	typedef uint8_t Symbol;

	/** The number of symbols. */
	static const unsigned NUM = NUM_BASES;

	/** Construct an empty set of extensions. */
	SeqExt() : m_record(0) { }

	/** Construct a set containing only the specified base. */
	explicit SeqExt(uint8_t base) : m_record(1<<base) { }

	/** Return a SeqExt with the specified bits set. */
	static SeqExt mask(uint8_t bits)
	{
		SeqExt ext;
		ext.m_record = bits;
		return ext;
	}

	/** Return the out degree, i.e. the number of bits set. */
	unsigned outDegree() const
	{
		assert(m_record < 16);
		// Number of set bits for every 4-bit value.
		static const uint8_t popcount[16] = {
			0, 1, 1, 2, 1, 2, 2, 3, 1, 2, 2, 3, 2, 3, 3, 4
		};
		return popcount[m_record];
	}

	/** Set the specified adjacency. */
	void setBase(uint8_t base)
	{
		m_record |= 1 << base;
	}

	/** Clear the specified adjacency. */
	void clearBase(uint8_t base)
	{
		m_record &= ~(1 << base);
	}

	/** Remove the specified edges. */
	void clear(SeqExt ext)
	{
		m_record &= ~ext.m_record;
	}

	/** Return whether the specified base is adjacent. */
	bool checkBase(uint8_t base) const
	{
		return m_record & (1 << base);
	}

	/** Clear all adjacency. */
	void clear()
	{
		m_record = 0;
	}

	/** Return whether this kmer has any adjacent kmer. */
	bool hasExtension() const
	{
		return m_record > 0;
	}

	/** Return whether this kmer has more than one adjacent kmer.
	 */
	bool isAmbiguous() const
	{
		// x & (x - 1) clears the lowest set bit, so a non-zero result
		// means at least two bits are set. An empty record yields zero.
		return (m_record & (m_record - 1)) != 0;
	}

	/** Return the complementary adjacency.
	 * If the assembly is in colour space, this is a no-op.
	 */
	SeqExt complement() const
	{
		// Maps each 4-bit value to the same value with its bit order
		// reversed, so that bit i moves to bit 3 - i.
		static const uint8_t complements[16] = {
			0x0, 0x8, 0x4, 0xc, 0x2, 0xa, 0x6, 0xe,
			0x1, 0x9, 0x5, 0xd, 0x3, 0xb, 0x7, 0xf
		};
		assert(m_record < 1 << NUM);
		return opt::colourSpace ? *this : mask(complements[m_record]);
	}

	/** Print the character given by codeToBase for each adjacent
	 * base, in increasing order of base code.
	 */
	friend std::ostream& operator <<(std::ostream& out,
			const SeqExt& o)
	{
		assert(o.m_record < 1 << NUM);
		// The bound must be a comparison: `i << NUM` is zero for
		// i == 0, which would skip the loop entirely.
		for (unsigned i = 0; i < NUM; ++i)
			if (o.checkBase(i))
				out << codeToBase(i);
		return out;
	}

private:
	/** The set of adjacent symbols, one bit per symbol code. */
	uint8_t m_record;
};
#endif
|