-
Notifications
You must be signed in to change notification settings - Fork 17
/
IO.cpp
111 lines (102 loc) · 2.96 KB
/
IO.cpp
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
#include "IO.h"
#include <algorithm>
/**
 * Static factory: create the reader matching the detected type of @p fileName.
 *
 * @param fileName path of the file to read.
 * @return a reader allocated with new (PlainFileReader, GzipFileReader or
 *         Bzip2FileReader), or NULL after printing a message to stderr when
 *         the name is NULL/empty or the file type cannot be detected.
 */
AbstractFileReader* AbstractFileReader::open(const char* fileName) {
  // Reject a missing or empty name before touching the file system.
  if (!fileName || fileName[0] == '\0') {
    fprintf(stderr, "Empty file name.\n");
    return NULL;
  }

  const FileType detected = AbstractFileReader::checkFileType(fileName);
  if (detected == IO_PLAIN) {
    return new PlainFileReader(fileName);
  }
  if (detected == IO_GZIP) {
    return new GzipFileReader(fileName);
  }
  if (detected == IO_BZIP2) {
    return new Bzip2FileReader(fileName);
  }

  // Any other detection result yields no reader.
  fprintf(stderr, "Cannot detect file type (does it exist?!)\n");
  return NULL;
}
/**
 * Static helper: close and destroy the reader that @p f points to, then reset
 * the caller's pointer to NULL.
 *
 * @param f address of a reader pointer; both @p f and *f are asserted non-NULL.
 */
void AbstractFileReader::close(AbstractFileReader** f) {
  assert(f && *f);
  AbstractFileReader* reader = *f;
  reader->close();  // instance-level close before the object is destroyed
  delete reader;
  *f = NULL;
}
/**
 * Detect a file's type by comparing its first two bytes against known magic
 * numbers.
 *
 * @param fileName path to probe; the exact name "-" denotes stdin.
 * @return IO_PLAIN for "-", for files shorter than two bytes, and for files
 *         whose header matches no known magic number; IO_GZIP or IO_BZIP2
 *         when the header matches the respective magic number; IO_UNKNOWN
 *         when @p fileName is NULL or the file cannot be opened.
 */
FileType AbstractFileReader::checkFileType(const char* fileName) {
  if (!fileName) {
    return IO_UNKNOWN;
  }
  // Treat stdin as a plain text file. Only the exact name "-" qualifies: a
  // prefix comparison would also classify real files such as "-x.gz" as plain
  // without ever looking at their header.
  if (fileName[0] == '-' && fileName[1] == '\0') {
    return IO_PLAIN;
  }

  // magic numbers
  const unsigned char gz_magic[2] = {0x1f, 0x8b};  /* gzip magic header */
  const unsigned char bzip2_magic[2] = {'B', 'Z'}; /* bzip2 magic header */

  // read file header
  FILE* fp = fopen(fileName, "rb");
  if (!fp) {
    return IO_UNKNOWN;
  }
  unsigned char header[2] = {0, 0};
  const size_t n = fread(header, sizeof(char), 2, fp);
  fclose(fp);

  // Too short to carry a magic number: fall back to plain text.
  if (n < 2) {
    return IO_PLAIN;
  }

  // check file types
  if (header[0] == gz_magic[0] && header[1] == gz_magic[1]) {
    return IO_GZIP;
  }
  if (header[0] == bzip2_magic[0] && header[1] == bzip2_magic[1]) {
    return IO_BZIP2;
  }

  // Everything else is treated as plain text. No check that the header bytes
  // are visible ASCII is performed, so arbitrary binary content is also
  // reported as IO_PLAIN.
  return IO_PLAIN;
}
/**
 * Remove every empty string from @p fields, preserving the order of the
 * remaining elements.
 *
 * @param fields vector to filter in place; a NULL pointer is treated as
 *        "nothing to do".
 * @return number of empty elements filtered out
 */
int removeEmptyField(std::vector<std::string>* fields) {
  if (!fields) {
    return 0;
  }
  const std::vector<std::string>::size_type before = fields->size();
  // std::remove only shifts the kept elements forward and returns the new
  // logical end; the erase is what actually shrinks the container.
  fields->erase(std::remove(fields->begin(), fields->end(), std::string()),
                fields->end());
  return static_cast<int>(before - fields->size());
}
// Destructor. Performs no cleanup of its own; builds that define IO_DEBUG
// additionally print a trace line to stderr.
AbstractFileWriter::~AbstractFileWriter() {
#if defined(IO_DEBUG)
  fprintf(stderr, "AbstractFileWriter desc()\n");
#endif
}
/**
 * Open @p fn for writing through bgzf_open.
 *
 * @param fn     path of the output file.
 * @param append when true, a warning is printed to stderr; the file is still
 *               opened in "w" mode.
 * @return 0 on success, -1 (after an error message on stderr) if bgzf_open
 *         returns NULL.
 */
int BGZipFileWriter::open(const char* fn, bool append) {
  if (append) {
    fprintf(stderr, "Gzip does not support appending.\n");
  }

  this->fp = bgzf_open(fn, "w");
  if (this->fp) {
    return 0;
  }

  fprintf(stderr, "ERROR: Cannot open %s for write\n", fn);
  return -1;
}
// Close the underlying handle if one is set and reset it to NULL, so calling
// close() again is a no-op.
void BGZipFileWriter::close() {
  if (!this->fp) {
    return;
  }
  bgzf_close(this->fp);
  this->fp = NULL;
}
/**
 * Write the NUL-terminated string @p s (without its terminator) via bgzf_write.
 *
 * @return whatever bgzf_write returns for the call.
 */
int BGZipFileWriter::write(const char* s) {
  const size_t len = strlen(s);
  return bgzf_write(this->fp, s, len);
}
/**
 * Write the NUL-terminated string @p s followed by a single '\n' via
 * bgzf_write.
 *
 * @return the sum of the two bgzf_write results when both are non-negative;
 *         otherwise the first negative result. A negative result from the
 *         first write also skips the newline write.
 *         NOTE(review): assumes bgzf_write signals failure with a negative
 *         value, as documented for the BGZF API - confirm against the bundled
 *         version.
 */
int BGZipFileWriter::writeLine(const char* s) {
  const int body = bgzf_write(this->fp, s, strlen(s));
  if (body < 0) {
    // Summing unconditionally would let the newline's +1 turn a -1 into 0 and
    // hide the failure from the caller.
    return body;
  }
  const int eol = bgzf_write(this->fp, "\n", 1);
  if (eol < 0) {
    return eol;
  }
  return body + eol;
}