-
Notifications
You must be signed in to change notification settings - Fork 4
/
Sim.h
108 lines (95 loc) · 3.59 KB
/
Sim.h
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
//
// Sim.h
//
// Header file for Sim.cpp
//
// Author: Jennifer Liddle (js10)
//
// $Id: Sim.h 1354 2010-11-11 16:20:09Z js10 $
//
// Author: Jennifer Liddle <[email protected], [email protected]>
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are met:
// 1. Redistributions of source code must retain the above copyright notice,
// this list of conditions and the following disclaimer.
// 2. Redistributions in binary form must reproduce the above copyright
// notice, this list of conditions and the following disclaimer in the
// documentation and/or other materials provided with the distribution.
// 3. Neither the name of Genome Research Ltd nor the names of the
// contributors may be used to endorse or promote products derived from
// software without specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
// IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
// OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
// IN NO EVENT SHALL GENOME RESEARCH LTD. BE LIABLE FOR ANY DIRECT, INDIRECT,
// INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
// BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF
// USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
// THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
//
#ifndef _SIM_H
#define _SIM_H
#include <stdint.h>
#include <cstdio>
#include <fstream>
#include <map>
#include <string>
#include <vector>
using namespace std;
//
// Sim: access to a "sim" intensity file.
//
// The class exposes the header fields of the file as public members and
// declares routines to open a file for input or output, write a header,
// write raw data and fetch sample records. All non-inline members are
// implemented in Sim.cpp.
//
class Sim {
public:
    // Number formats (see the _numberFormat argument of writeHeader())
    static const int FLOAT = 0;
    static const int INTEGER = 1;
    static const int SCALED_INTEGER = 2;

    static const int VERSION = 1;            // matches the expected value of 'version' below
    static const int SAMPLE_NAME_SIZE = 255;
    static const int HEADER_LENGTH = 16;     // presumably the header size in bytes - confirm in Sim.cpp

public:
    Sim();

    void openInput(std::string filename);
    void openLowLevel(char *f);
    void close(void);

    // Returns a textual dump of the object (format defined in Sim.cpp).
    std::string dump(void);

    // C-string flavour of dump().
    //
    // The text is kept in dumpBuffer so that the returned pointer refers to
    // storage owned by this object. Returning dump().c_str() directly would
    // hand back a pointer into a temporary that is destroyed before the
    // caller can read it. The pointer stays valid until the next call to
    // dumpc() on this object, or until the object is destroyed.
    const char *dumpc(void) {
        dumpBuffer = dump();
        return dumpBuffer.c_str();
    }

    void openOutput(std::string filename);
    void reportNonNumeric(void);
    void reset(void);

    // Writes the file header; defaults are two channels and INTEGER format.
    void writeHeader(uint32_t _numSamples, uint32_t _numProbes,
                     uint8_t _numChannels=2, uint8_t _numberFormat=INTEGER);

    // Writes 'length' bytes from 'buffer' (presumably to the open output).
    void write(void *buffer, int length);

    std::string errorMsg;
    std::string filename;
    std::string magic;          // expected to be "sim"
    uint8_t version;            // file version (expected to be 1)
    uint16_t sampleNameSize;
    uint32_t numSamples;
    uint32_t numProbes;
    uint8_t numChannels;
    uint8_t numberFormat;       // one of FLOAT, INTEGER, SCALED_INTEGER
    long nanCount;              // count NaN entries in input
    long infCount;              // count +/- INF entries in input
    bool cleanInput;
    int recordLength;           // calculated when file opened and header read
    int numericBytes;           // record size of each number in file
    int sampleIntensityTotal;   // number of intensities for each sample

    // These inline functions are for the use of SWIG and Perl.
    // The returned pointers refer to the corresponding string members and
    // are only valid while those members are left unmodified.
    const char *getFilename(void) const { return filename.c_str(); }
    const char *getErrorMsg(void) const { return errorMsg.c_str(); }
    int getVersion(void) const { return version; }
    const char *getMagic(void) const { return magic.c_str(); }

    // Fetch the next sample record into caller-supplied buffers.
    // NOTE(review): the required buffer sizes are not visible from this
    // header - presumably sampleNameSize bytes for the name and
    // sampleIntensityTotal entries for the intensities; confirm in Sim.cpp.
    void getNextRecord(char *sampleName, uint16_t *intensity);
    void getNextRecord(char *sampleName, float *intensity,
                       bool cleanup=false);

private:
    std::ostream *outfile;
    std::ofstream fout;
    std::string inPath;
    FILE *inFile;               // low-level file access for greater speed
    std::map<std::string,long> sampleIndex;
    std::string dumpBuffer;     // backing storage for the pointer returned by dumpc()

    // NOTE(review): identifiers containing a double underscore are reserved
    // for the implementation; the name is kept because Sim.cpp defines it.
    void __openout(std::ostream &f);
    void _openOut(std::string fname);
};
#endif // _SIM_H