-
Notifications
You must be signed in to change notification settings - Fork 3
/
Copy pathEgt.h
99 lines (90 loc) · 3.02 KB
/
Egt.h
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
//
// Egt.h
//
// Author: Iain Bancarz <[email protected]>
//
// Copyright (c) 2014 Genome Research Ltd.
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are met:
// 1. Redistributions of source code must retain the above copyright notice,
// this list of conditions and the following disclaimer.
// 2. Redistributions in binary form must reproduce the above copyright
// notice, this list of conditions and the following disclaimer in the
// documentation and/or other materials provided with the distribution.
// 3. Neither the name of Genome Research Ltd nor the names of the
// contributors may be used to endorse or promote products derived from
// software without specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
// IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
// OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
// IN NO EVENT SHALL GENOME RESEARCH LTD. BE LIABLE FOR ANY DIRECT, INDIRECT,
// INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
// BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF
// USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
// THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
//
#ifndef _EGT_H
#define _EGT_H
#include <string>
#include <iostream>
#include <fstream>
using namespace std;
// Union overlaying a float, an int and a byte buffer of sizeof(int) chars
// on the same storage.
// NOTE(review): presumably used to turn raw bytes read from a file into
// numeric values (see Egt::getNextConverter) -- confirm in the implementation.
// NOTE(review): the byte buffer is sized from int only; the float view relies
// on sizeof(float) <= sizeof(int) to be fully covered by ncChar.
union numericConverter {
    float ncFloat;             // storage viewed as a float
    int ncInt;                 // storage viewed as an int
    char ncChar[sizeof(int)];  // storage viewed as raw bytes
};
// Interface for opening an EGT file and holding its header fields, file
// preface fields, numerical arrays and SNP names.
// Only declarations appear here; every member function is defined outside
// this header.
class Egt {
public:
    // Constructs an Egt object; the verbose argument defaults to false.
    // NOTE(review): not declared explicit, so a bool converts implicitly.
    Egt(bool verbose = false);
    //~Egt();
    // NOTE(review): no destructor is declared (the line above is commented
    // out) although the class holds raw pointers (counts, params, snpNames).
    // Who allocates and releases them is not visible here -- confirm.

    // Per-index accessors that write into a caller-supplied float array.
    // NOTE(review): the required length of each output array is not stated in
    // this header; presumably related to the *_PER_SNP / GENOTYPES_PER_SNP
    // members below -- verify against the implementation.
    void getClusters(long index, float params[]);
    void getMeanR(long index, float means[]);
    void getMeanTheta(long index, float means[]);

    // Two overloads of open(), taking the file name as a C string or as a
    // std::string.
    // NOTE(review): the C-string overload takes a non-const char*, so it
    // cannot be called with a string literal in standard C++11 and later.
    void open(char *filename);
    void open(std::string filename);

    // Print routines for the header and the preface; the output destination
    // is not visible in this header.
    void printHeader();
    void printPreface();

    std::string filename;
    bool verbose;

    // constants
    // NOTE(review): these are ordinary (non-const) int members; their values
    // are presumably assigned in the constructor -- confirm.
    int NUMERIC_BYTES;
    int ENTRIES_IN_RECORD;
    int BYTES_IN_RECORD;
    int GENOTYPES_PER_SNP;
    int ENTRIES_TO_USE;
    int PARAMS_PER_SNP;

    // EGT header fields
    long fileVersion;
    std::string gcVersion;
    std::string clusterVersion;
    std::string callVersion;
    std::string normalizationVersion;
    std::string dateCreated;
    char mode;
    std::string manifest;

    // EGT 'file preface' fields
    long dataVersion;
    std::string opa;
    long snpTotal;

    // arrays for numerical data
    int *counts;
    float *params;

    // array for SNP names
    std::string *snpNames;

private:
    // Convert a range of a byte block into ints / floats.
    // NOTE(review): both return a raw pointer; whether the caller must
    // delete[] the result, and whether `end` is inclusive, cannot be told
    // from this declaration -- confirm in the implementation.
    int* bytesToInts(char block[], int start, int end);
    float* bytesToFloats(char block[], int start, int end);

    // Helpers that read successive items from an input file stream.
    numericConverter getNextConverter(std::ifstream &file);
    void readHeader(std::ifstream &file);
    int readInteger(std::ifstream &file);
    float readFloat(std::ifstream &file);
    void readPreface(std::ifstream &file);
    void readSNPNames(std::ifstream &file, std::string names[]);
    // `name` defaults to "UNKNOWN_NAME"; presumably a label for diagnostics.
    std::string readString(std::ifstream &file, std::string name = "UNKNOWN_NAME");
};
#endif // _EGT_H