forked from statgen/demuxlet
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathtsv_reader.cpp
87 lines (74 loc) · 2.14 KB
/
tsv_reader.cpp
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
#include "tsv_reader.h"
/*
htsFile* hp;
kstring_t str;
int32_t lstr;
int32_t nfields;
int32_t* fields;
int32_t nlines;
*/
bool tsv_reader::open(const char* filename) {
this->filename = filename;
hp = hts_open(filename, "r");
if ( hp == NULL ) return false;
return true;
//error("[E:%s:%s %s] Cannot open file %s for reading", __FILE__, __LINE__, __FUNCTION__, filename);
}
int32_t tsv_reader::read_line() {
if ( itr == NULL ) {
lstr = hts_getline(hp, KS_SEP_LINE, &str);
}
else {
lstr = tbx_itr_next(hp, tbx, itr, &str);
}
if ( lstr <= 0 ) {
nfields = 0;
return lstr;
}
fields = ksplit(&str, 0, &nfields);
++nlines;
return nfields;
}
bool tsv_reader::jump_to(const char* chr, int32_t beg, int32_t end) {
char buf[65536];
sprintf(buf, "%s:%d-%d", chr, beg, end);
return jump_to(buf);
}
bool tsv_reader::jump_to(const char* reg) {
if ( tbx == NULL ) {
tbx = tbx_index_load(filename.c_str());
if ( !tbx ) error("[E:%s] Could not load .tbi/.csi index of %s\n", __PRETTY_FUNCTION__, filename.c_str());
}
if ( itr != NULL )
tbx_itr_destroy(itr);
itr = tbx_itr_querys(tbx, reg);
if ( itr == NULL ) {
notice("Failed jumping to %s, tbx = %x, itr = %x", reg, tbx, itr);
return false;
}
else return true;
}
const char* tsv_reader::str_field_at(int32_t idx) {
if ( idx >= nfields ) {
error("[E:%s:%s %s] Cannot access field at %d >= %d", __FILE__, __LINE__, __FUNCTION__, idx, nfields);
//return NULL;
}
return ( &str.s[fields[idx]] );
}
int32_t tsv_reader::int_field_at(int32_t idx) {
if ( idx >= nfields )
error("[E:%s:%s %s] Cannot access field at %d >= %d", __FILE__, __LINE__, __FUNCTION__, idx, nfields);
return ( atoi(&str.s[fields[idx]]) );
}
double tsv_reader::double_field_at(int32_t idx) {
if ( idx >= nfields )
error("[E:%s:%s %s] Cannot access field at %d >= %d", __FILE__, __LINE__, __FUNCTION__, idx, nfields);
return ( atof(&str.s[fields[idx]]) );
}
int32_t tsv_reader::store_to_vector(std::vector<std::string>& v) {
v.resize(nfields);
for(int32_t i=0; i < nfields; ++i) {
v[i].assign(&str.s[fields[i]]);
}
return nfields;
}