-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathReliefFSeq.h
80 lines (74 loc) · 2.81 KB
/
ReliefFSeq.h
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
/**
* \class ReliefFSeq
*
* \brief ReliefFSeq attribute ranking algorithm.
*
* Designed to handle digital gene expression (DGE) data sets, particularly
* RNA-Seq high-throughput count data, by accounting for variable-specific
* variance in counts. Data is known to follow a Poisson or negative binomial
* distribution. This algorithm is a more computationally practical approach
* than others that use more sophisticated statistical methods and models.
* Our approach keeps the ReliefF algorithm general while addressing the
* variance "dispersion" problem as a special case.
*
* \sa ReliefF
*
* \author Bill White
* \version 1.0
*
* Contact: [email protected]
* Created on: 7/23/12
*/
#ifndef RELIEFFSEQ_H
#define RELIEFFSEQ_H
#include <vector>
#include <map>
#include <string>
#include <fstream>
#include "ReliefF.h"
#include "Dataset.h"
#include "DatasetInstance.h"
#include "Insilico.h"
#include <boost/program_options.hpp>
namespace po = boost::program_options;
class ReliefFSeq : public ReliefF
{
public:
/*************************************************************************//**
* Construct an ReliefFSeq algorithm object.
* \param [in] ds pointer to a Dataset object
****************************************************************************/
ReliefFSeq(Dataset* ds);
/*************************************************************************//**
* Construct an ReliefFSeq algorithm object.
* \param [in] ds pointer to a Dataset object
* \param [in] vm reference to a Boost map of command line options
****************************************************************************/
ReliefFSeq(Dataset* ds, po::variables_map& vm);
/*************************************************************************//**
* Construct an ReliefFSeq algorithm object.
* \param [in] ds pointer to a Dataset object
* \param [in] configMap reference to a ConfigMap (map<string, string>)
****************************************************************************/
ReliefFSeq(Dataset* ds, ConfigMap& configMap);
bool ComputeAttributeScores();
AttributeScores GetScores();
// average hit and miss diffs for gene alpha
std::pair<double, double> MuDeltaAlphas(unsigned int alpha);
/// standard deviations of hit and miss diffs for gene alpha
std::pair<double, double> SigmaDeltaAlphas(unsigned int alpha,
double muDeltaHit, double muDeltaMiss);
virtual ~ReliefFSeq();
private:
/// ReliefSeq mode: signal-to-noise ratio (snr) or t-statistic (tstat)
std::string mode;
/// ReliefSeq signal-to-noise ratio mode: signal-to-noise ratio (snr) or
/// ReliefF (relieff)
std::string snrMode;
/// ReliefFSeq t-statistic mode: 1-pvalue (pval) or the absolute value
/// of the t-statistic (abst)
std::string tstatMode;
/// variance denominator adjustment s0
double s0;
};
#endif /* SNReliefF_H */