File: Tabix.h

package info (click to toggle)
libstatgen 1.0.15-8
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid, trixie
  • size: 4,588 kB
  • sloc: cpp: 49,624; ansic: 1,408; makefile: 320; sh: 60
file content (86 lines) | stat: -rw-r--r-- 2,446 bytes parent folder | download | duplicates (4)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
/*
 *  Copyright (C) 2012-2013  Regents of the University of Michigan
 *
 *   This program is free software: you can redistribute it and/or modify
 *   it under the terms of the GNU General Public License as published by
 *   the Free Software Foundation, either version 3 of the License, or
 *   (at your option) any later version.
 *
 *   This program is distributed in the hope that it will be useful,
 *   but WITHOUT ANY WARRANTY; without even the implied warranty of
 *   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 *   GNU General Public License for more details.
 *
 *   You should have received a copy of the GNU General Public License
 *   along with this program.  If not, see <http://www.gnu.org/licenses/>.
 */

#ifndef __TABIX_H__
#define __TABIX_H__

#include <stdint.h>
#include <vector>
#include <map>
#include <stdlib.h>

#include "IndexBase.h"

#include "InputFile.h"
#include "StatGenStatus.h"

/// Index support for tabix files, layered on top of IndexBase.
///
/// Typical use is readIndex() followed by getStartPos() / getRefName()
/// queries; resetIndex() clears the state before another index is loaded.
class Tabix : public IndexBase
{
public:

    /// Format identifiers (presumably the values reported by getFormat() --
    /// confirm against the implementation).
    enum Format { FORMAT_GENERIC = 0, FORMAT_SAM = 1, FORMAT_VCF = 2 };

    Tabix();
    virtual ~Tabix();

    /// Reset the member data so that a new index file can be read.
    void resetIndex();

    /// Read and parse the specified index file.
    /// \param filename name of the index file to be read.
    /// \return the status of the read.
    StatGenStatus::Status readIndex(const char* filename);

    /// Get the starting file offset at which to look for the specified
    /// start position.
    /// \param refName name of the reference to look up.
    /// \param start start position; use -1 for an entire reference ID, and
    /// 0/-1 to start at the beginning of the region.
    /// \param fileStartPos receives the file offset (passed by reference;
    /// presumably only meaningful when the call succeeds -- confirm).
    /// \return presumably true when an offset was found -- confirm against
    /// the implementation.
    bool getStartPos(const char* refName,
                     int32_t start,
                     uint64_t& fileStartPos) const;

    /// Return the reference name stored at the specified index.
    /// Throws an exception if indexNum is out of range.
    /// \param indexNum position of the reference name to return.
    const char* getRefName(unsigned int indexNum) const;

    /// Get the format of this tabix file.
    /// \return the format field of the stored format description.
    int32_t getFormat() const
    {
        return myFormat.format;
    }

private:
    /// Format description kept for the index.
    /// NOTE(review): col_seq / col_beg / col_end look like the sequence,
    /// begin and end column numbers from the tabix header -- confirm.
    struct TabixFormat
    {
        int32_t format;
        int32_t col_seq;
        int32_t col_beg;
        int32_t col_end;
        int32_t meta; ///< character that starts header lines
        int32_t skip; ///< number of lines to skip from putting into the index
    };

    /// Format description for the current index.
    TabixFormat myFormat;

    /// Buffer for the chromosome names.
    /// NOTE(review): raw pointer whose allocation and release are not visible
    /// in this header. If the destructor frees it, copying a Tabix object
    /// would be unsafe -- confirm, and consider prohibiting copies.
    char* myChromNamesBuffer;

    /// Vector pointing to the chromosome names.
    std::vector<const char*> myChromNamesVector;
};


#endif