-
Notifications
You must be signed in to change notification settings - Fork 5
/
Copy pathQualityScore.cpp
91 lines (83 loc) · 2.97 KB
/
QualityScore.cpp
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
/*
* Part of SMITHLAB software
*
* Copyright (C) 2009 University of Southern California and
* Andrew D. Smith
*
* Authors: Andrew D. Smith
*
* This program is free software: you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program. If not, see <http://www.gnu.org/licenses/>.
*/
#include "QualityScore.hpp"
#include "smithlab_utils.hpp"
#include <fstream>
#include <string>
using std::runtime_error;
using std::string;
// Update the two "still possible" flags with one more quality character.
//
// A flag that is already false stays false; a flag that is still true is
// replaced by the verdict of its validator (valid_solexa_score /
// valid_phred_score, declared outside this file) for the character c.
//
// Returns true only while BOTH encodings remain possible, i.e. while the
// caller has not yet seen enough to tell them apart.
static bool check_formats(char c, bool &solexa, bool &phred) {
  // Each validator is consulted only while its flag is still set.
  if (solexa && !valid_solexa_score(c))
    solexa = false;
  if (phred && !valid_phred_score(c))
    phred = false;
  return solexa && phred;
}
// Guess the quality-score encoding of a FASTQ file.
//
// Every fourth line of the file (0-based line index 3, 7, 11, ...) is
// treated as a quality string and its characters are fed to check_formats
// one at a time. As soon as the two encodings can be told apart (or both
// have been ruled out) the scan stops.
//
// Parameters:
//   filename  path of the FASTQ file to inspect.
//
// Returns FASTQ_Phred if the Phred encoding is still consistent with every
// character examined (this includes the case where the file gives no
// evidence either way), and FASTQ_Solexa otherwise.
//
// Throws std::runtime_error if the file cannot be opened.
FASTQScoreType fastq_score_type(const string filename) {
  std::ifstream f(filename.c_str());
  if (!f)
    throw runtime_error("cannot open input file " + filename);
  bool solexa = true, phred = true;
  // Read into a std::string so that lines of any length are handled; a
  // fixed-size buffer makes the stream fail (and the scan end silently) on
  // the first over-long line.
  string line;
  size_t line_count = 0;
  while (std::getline(f, line)) {
    if (line_count % 4 == 3) {
      // A trailing carriage return belongs to a CRLF line ending, not to
      // the quality string.
      size_t n_scores = line.size();
      if (n_scores > 0 && line[n_scores - 1] == '\r')
        --n_scores;
      // Only genuine score characters are tested: the end of the line is
      // never handed to check_formats, so a line that is valid under both
      // encodings leaves the decision open for later lines.
      for (size_t i = 0; i < n_scores; ++i)
        if (!check_formats(line[i], solexa, phred))
          return (phred) ? FASTQ_Phred : FASTQ_Solexa;
    }
    ++line_count;
  }
  return (phred) ? FASTQ_Phred : FASTQ_Solexa;
}
// Guess the quality-score encoding used in a mapped-reads file.
//
// Each non-blank line is split on whitespace; the first seven fields are
// skipped and the characters of the eighth field are fed to check_formats
// one at a time. As soon as the two encodings can be told apart (or both
// have been ruled out) the scan stops. A line with exactly seven fields
// contributes no evidence and is passed over.
//
// Parameters:
//   filename  path of the mapped-reads file to inspect.
//
// Returns FASTQ_Phred if the Phred encoding is still consistent with every
// character examined (this includes the case where the file gives no
// evidence either way), and FASTQ_Solexa otherwise.
//
// Throws std::runtime_error if the file cannot be opened, or if a
// non-blank line has fewer than seven fields.
FASTQScoreType mapped_reads_score_type(const string filename) {
  // Number of whitespace-delimited fields that precede the score field.
  static const size_t FIELDS_BEFORE_SCORES = 7;
  std::ifstream f(filename.c_str());
  if (!f)
    throw runtime_error("cannot open input file " + filename);
  bool solexa = true, phred = true;
  // Read into a std::string so that lines of any length are handled and
  // every scan below is bounded by the real length of the current line.
  string line;
  while (std::getline(f, line)) {
    const size_t length = line.size();
    size_t position = 0;
    // isspace() is only defined for values representable as unsigned char
    // (or EOF), hence the casts.
    while (position < length &&
           isspace(static_cast<unsigned char>(line[position])))
      ++position;
    if (position == length)
      continue; // blank line: nothing to inspect
    size_t field_count = 0;
    while (field_count < FIELDS_BEFORE_SCORES && position < length) {
      // step over one field ...
      while (position < length &&
             !isspace(static_cast<unsigned char>(line[position])))
        ++position;
      ++field_count;
      // ... and over the whitespace that follows it
      while (position < length &&
             isspace(static_cast<unsigned char>(line[position])))
        ++position;
    }
    if (field_count < FIELDS_BEFORE_SCORES)
      throw runtime_error("malformed line in file: " + filename);
    // Only genuine score characters are tested: the delimiter or end of
    // line that terminates the field is never handed to check_formats, so
    // a field that is valid under both encodings leaves the decision open
    // for later lines.
    for (; position < length &&
           !isspace(static_cast<unsigned char>(line[position]));
         ++position)
      if (!check_formats(line[position], solexa, phred))
        return (phred) ? FASTQ_Phred : FASTQ_Solexa;
  }
  return (phred) ? FASTQ_Phred : FASTQ_Solexa;
}