File: kff_writer.h

package info (click to toggle)
kmc 3.2.4%2Bdfsg-1
  • links: PTS, VCS
  • area: main
  • in suites: sid, trixie
  • size: 3,716 kB
  • sloc: cpp: 38,308; python: 664; makefile: 216; perl: 179; sh: 34
file content (54 lines) | stat: -rw-r--r-- 1,179 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
#pragma once

#include <cstdint>
#include <string>
#include <vector>
#include <cstdint>

template<typename T>
void StoreBigEndian(uint8_t* buff, const T& data)
{
	using unsigned_T = typename std::make_unsigned<T>::type;
	unsigned_T _data = static_cast<unsigned_T>(data);

	for (int32_t b = sizeof(_data) - 1; b >= 0; --b)
		*buff++ = _data >> (8 * b);
}

class CKFFWriter
{
	static constexpr uint8_t VER_MAJOR = 1;
	static constexpr uint8_t VER_MINOR = 0;
	FILE* file;

	uint64_t k;

	uint64_t counter_size;
	uint64_t min_count;
	uint64_t max_count;

	std::vector<int64_t> index;
	uint64_t cur_file_size = 0;

	void storeIndexPair(const char* type, int64_t val, std::vector<uint8_t>& tmp);



	struct SectionPartState
	{
		uint64_t where_to_store_nb_recs;
		uint64_t nb_recs;
	};
	SectionPartState section_part_state;

public:
	explicit CKFFWriter(const std::string& path, uint8_t canonical, uint64_t k, uint64_t counter_size, uint64_t min_count, uint64_t max_count, uint8_t encoding = 0b00011011);

	void StoreWholeSection(uint8_t* data, uint64_t n_kmers);

	void InitSection();
	void StoreSectionPart(uint8_t* data, uint64_t n_recs);
	void FinishSection();

	~CKFFWriter();
};