File: ColorSpaceLoader.cpp

package info (click to toggle)
ray 2.3.1-9
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid, trixie
  • size: 6,008 kB
  • sloc: cpp: 49,973; sh: 339; makefile: 281; python: 168
file content (105 lines) | stat: -rw-r--r-- 2,781 bytes parent folder | download | duplicates (5)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
/*
    Ray -- Parallel genome assemblies for parallel DNA sequencing
    Copyright (C) 2011, 2012, 2013 Sébastien Boisvert

	http://DeNovoAssembler.SourceForge.Net/

    This program is free software: you can redistribute it and/or modify
    it under the terms of the GNU General Public License as published by
    the Free Software Foundation, version 3 of the License.

    This program is distributed in the hope that it will be useful,
    but WITHOUT ANY WARRANTY; without even the implied warranty of
    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
    GNU General Public License for more details.

    You have received a copy of the GNU General Public License
    along with this program (gpl-3.0.txt).
	see <http://www.gnu.org/licenses/>

*/

#include "ColorSpaceLoader.h"

#include <code/Mock/common_functions.h>

#include <stdlib.h>
#include <fstream>
#include <iostream>
#include <string.h>
#include <assert.h>
using namespace std;

/*
 * Builds a loader and registers, through addExtension(), the two file
 * name extensions used for color-space FASTA input.
 */
ColorSpaceLoader::ColorSpaceLoader()
{
	// long form of the extension
	addExtension(".csfasta");

	// short form of the extension
	addExtension(".csfa");
}

/*
 * Opens a color-space FASTA file and counts the sequences it contains.
 *
 * The file is scanned once: lines starting with '#' are skipped, and every
 * line starting with '>' that is followed by another line counts as one
 * sequence. The total is stored in m_size and m_loaded is reset to 0.
 * The file is then reopened so that load() reads from the beginning.
 *
 * file: path of the file to read.
 *
 * Returns EXIT_SUCCESS when the file was scanned and reopened, and
 * EXIT_FAILURE when it could not be opened (m_f is NULL and m_size is 0
 * in that case).
 */
int ColorSpaceLoader::open(string file){
	m_size=0;
	m_loaded=0;

	m_f=fopen(file.c_str(),"r");
	if(m_f==NULL){
		// never hand a NULL stream to fgets/fclose
		return EXIT_FAILURE;
	}

	char bufferForLine[RAY_MAXIMUM_READ_LENGTH];
	while(NULL!=fgets(bufferForLine,RAY_MAXIMUM_READ_LENGTH,m_f)){
		if(bufferForLine[0]=='#'){
			continue;// skip csfasta comment
		}

		if(bufferForLine[0]=='>'){
			// A header is counted only when its sequence line is really there.
			// This check must not rely on assert(): with NDEBUG a trailing
			// header would be counted and load() would wait for a sequence
			// that does not exist.
			if(NULL==fgets(bufferForLine,RAY_MAXIMUM_READ_LENGTH,m_f)){
				break;
			}

			m_size++;
		}
	}
	fclose(m_f);

	// reopen so that load() starts at the first line
	m_f=fopen(file.c_str(),"r");
	if(m_f==NULL){
		// nothing can be loaded without a stream
		m_size=0;
		return EXIT_FAILURE;
	}

	return EXIT_SUCCESS;
}

/*
 * Reads up to maxToLoad sequences from the stream opened by open() and
 * appends them to reads.
 *
 * maxToLoad: maximum number of sequences to append during this call.
 * reads: container receiving the sequences through push_back().
 * seqMyAllocator: allocator forwarded to Read::constructor().
 *
 * Lines starting with '#' are skipped. For each line starting with '>',
 * the next line is taken as the sequence: double-encoding color symbols
 * are replaced by the matching SYMBOL_* characters and the first two
 * characters are dropped before the Read is built.
 *
 * The stream is closed, and m_f set to NULL, once m_loaded reaches m_size
 * or when the end of the file is reached early. Calling load() again after
 * that does nothing.
 */
void ColorSpaceLoader::load(int maxToLoad,ArrayOfReads*reads,MyAllocator*seqMyAllocator){
	if(m_f==NULL){
		// stream already closed (or never opened successfully)
		return;
	}

	char bufferForLine[RAY_MAXIMUM_READ_LENGTH];
	int loadedSequences=0;
	bool endOfInput=false;

	while(m_loaded<m_size&& loadedSequences<maxToLoad){
		if(NULL==fgets(bufferForLine,RAY_MAXIMUM_READ_LENGTH,m_f)){
			// end of file or read error: retrying would loop forever
			endOfInput=true;
			break;
		}

		if(bufferForLine[0]=='#'){
			continue;// skip csfasta comment
		}

		if(bufferForLine[0]!='>'){
			continue;// not a header line
		}

		// read two lines: the header was read above, the sequence is next
		if(NULL==fgets(bufferForLine,RAY_MAXIMUM_READ_LENGTH,m_f)){
			// header without a sequence line: the file is truncated
			endOfInput=true;
			break;
		}

		// the substitutions below never change the length, so compute it once
		const int length=(int)strlen(bufferForLine);
		for(int j=0;j<length;j++){
			if(bufferForLine[j]==DOUBLE_ENCODING_A_COLOR){
				bufferForLine[j]=SYMBOL_A;
			}else if(bufferForLine[j]==DOUBLE_ENCODING_T_COLOR){
				bufferForLine[j]=SYMBOL_T;
			}else if(bufferForLine[j]==DOUBLE_ENCODING_C_COLOR){
				bufferForLine[j]=SYMBOL_C;
			}else if(bufferForLine[j]==DOUBLE_ENCODING_G_COLOR){
				bufferForLine[j]=SYMBOL_G;
			}
		}

		// remove the leading T & first color;
		// for a line shorter than 2 characters, stop at its terminator
		// instead of pointing past the end of the string
		char*sequence=bufferForLine+(length<2?length:2);

		Read t;
		t.constructor(sequence,seqMyAllocator,true);
		// NOTE(review): t is a local; presumably push_back copies it -- confirm
		reads->push_back(&t);
		loadedSequences++;
		m_loaded++;
	}

	if(m_loaded==m_size||endOfInput){
		fclose(m_f);
		// prevents a second fclose on the same stream in a later call
		m_f=NULL;
	}
}

/*
 * Returns m_size, the number of sequences counted by open().
 */
int ColorSpaceLoader::getSize()
{
	const int sequenceCount=m_size;
	return sequenceCount;
}

/*
 * Does nothing: this method releases no resource.
 * The stream m_f is closed inside load().
 */
void ColorSpaceLoader::close(){
}