File: BaseSequenceIO.cpp

package info (click to toggle)
pbseqlib 5.3.5+dfsg-11
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid
  • size: 7,152 kB
  • sloc: cpp: 77,259; python: 331; sh: 103; makefile: 41
file content (67 lines) | stat: -rw-r--r-- 2,457 bytes parent folder | download | duplicates (5)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
#include <alignment/files/BaseSequenceIO.hpp>

#include <cstdlib>

// Records the file type and file name this object should work with.
//
// pFileType  type to copy into the fileType member.
// pFileName  name to copy into the fileName member.
void BaseSequenceIO::SetFiles(FileType &pFileType, std::string &pFileName)
{
    // Both arguments are copied; the caller's objects are not modified.
    this->fileType = pFileType;
    this->fileName = pFileName;
}

// Returns (by value) the file type currently stored in fileType.
FileType BaseSequenceIO::GetFileType()
{
    return fileType;
}

// Infers the sequence file type from the extension of a file name.
//
// The extension is the text after the last '.' in fileName:
//   fasta, fa, fas, fsta, screen -> FileType::Fasta
//   fastq, fq                    -> FileType::Fastq
//   4bit, fourbit                -> FileType::Fourbit (asserts: not implemented)
//   bam                          -> FileType::PBBAM
//   xml                          -> FileType::PBDATASET
//   h5                           -> decided by the two-part suffix:
//       pls.h5, plx.h5 -> FileType::HDFPulse
//       bas.h5, bax.h5 -> FileType::HDFBase
//       ccs.h5         -> FileType::HDFCCSONLY
//
// fileName       name (or path) whose extension is inspected; not modified.
// type           output; set to the detected type, or to FileType::None on
//                every failure path (including a name without any '.').
// exitOnFailure  when true, an unrecognised extension other than "h5" prints
//                an error to standard output and terminates the process with
//                std::exit(EXIT_FAILURE). It is not consulted for names that
//                have no '.' or for unknown "*.h5" suffixes; those return 0.
//
// Returns 1 when the type was recognised, 0 otherwise.
int BaseSequenceIO::DetermineFileTypeByExtension(std::string &fileName, FileType &type,
                                                 bool exitOnFailure)
{
    const std::string::size_type dotPos = fileName.rfind(".");
    if (dotPos == std::string::npos) {
        // No extension at all. Report the failure through `type` as well, as
        // all other failure paths do, rather than leaving the caller's value
        // untouched.
        type = FileType::None;
        return 0;
    }

    const std::string extension = fileName.substr(dotPos + 1);

    if (extension == "fasta" || extension == "fa" || extension == "fas" ||
        extension == "fsta" || extension == "screen") {
        type = FileType::Fasta;
        return 1;
    }

    if (extension == "h5") {
        // HDF flavours are told apart by the two-part suffix (e.g. "bas.h5").
        // Find the dot preceding ".h5"; when there is none, the whole name is
        // compared, so a file literally named "bas.h5" is still recognised.
        std::string::size_type suffixStart = 0;
        if (dotPos > 0) {
            const std::string::size_type prevDot = fileName.rfind(".", dotPos - 1);
            if (prevDot != std::string::npos) {
                suffixStart = prevDot + 1;
            }
        }
        const std::string hdfSuffix = fileName.substr(suffixStart);

        if (hdfSuffix == "pls.h5" || hdfSuffix == "plx.h5") {
            type = FileType::HDFPulse;
            return 1;
        }
        if (hdfSuffix == "bas.h5" || hdfSuffix == "bax.h5") {
            type = FileType::HDFBase;
            return 1;
        }
        if (hdfSuffix == "ccs.h5") {
            type = FileType::HDFCCSONLY;
            return 1;
        }
        // Unknown HDF flavour: fails quietly, exitOnFailure is not applied.
        type = FileType::None;
        return 0;
    }

    if (extension == "fastq" || extension == "fq") {
        type = FileType::Fastq;
        return 1;
    }

    if (extension == "4bit" || extension == "fourbit") {
        type = FileType::Fourbit;
        // Comparing a string literal's address with 0 is always false, so
        // this aborts whenever assertions are enabled; with NDEBUG the
        // function falls through and reports success.
        assert("Four bit reading is not yet implemented for the reader agglomerate!" == 0);
        return 1;
    }

    if (extension == "bam") {
        type = FileType::PBBAM;
        return 1;
    }

    if (extension == "xml") {
        type = FileType::PBDATASET;
        return 1;
    }

    // Extension present but not recognised.
    type = FileType::None;
    if (exitOnFailure) {
        std::cout << "ERROR, file type '." << extension
                  << "' is not understood to be one of pls.h5, fasta, fastq, nor bam. "
                  << std::endl;
        std::exit(EXIT_FAILURE);
    }
    return 0;
}