-
Notifications
You must be signed in to change notification settings - Fork 0
/
data_set.cpp
62 lines (53 loc) · 1.54 KB
/
data_set.cpp
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
// Implementation of data set class
//
// Copyright (C) 2012 Heidelberg University
//
// Author: Sascha Fendrich
//
// This file is part of Sol.
//
// Sol is free software: you can redistribute it and/or modify
// it under the terms of the GNU Lesser General Public License as published by
// the Free Software Foundation, either version 3 of the License, or
// (at your option) any later version.
//
// Sol is distributed in the hope that it will be useful,
// but WITHOUT ANY WARRANTY; without even the implied warranty of
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
// GNU Lesser General Public License for more details.
//
// You should have received a copy of the GNU Lesser General Public License
// along with Sol. If not, see <http://www.gnu.org/licenses/>.
#include <fstream>
#include <string>
#include "tiny_log.h"
#include "data_set.h"
#include "sparse_data_format.h"
// Construct a data set, optionally reserving storage in advance.
//
// num_instances: expected number of instances.  A positive value is passed
// to data_set_.reserve (); zero or a negative value reserves nothing.
DataSet::DataSet (int num_instances)
{
  // Nothing to pre-allocate without a positive size hint.
  if (num_instances <= 0)
    return;

  data_set_.reserve (num_instances);
}
// Read instances from a text file, one instance per line.
//
// Each line is handed to sdf_parse_line (), which fills a SparseVector and
// returns a pointer to the position in the line where it stopped.  A line is
// accepted when that position is the end of the line or a '#' character
// (presumably the start of a trailing comment -- confirm against the sparse
// data format).  Accepted vectors are appended to data_set_ in file order.
//
// file_name: path of the file to read.
//
// Returns the largest max_id () among the vectors read.  Returns 0 when
// file_name is null, when the file cannot be opened, when the file contains
// no lines, or when a line fails to parse.  After a parse failure the
// vectors from the preceding lines remain in data_set_.
id_t DataSet::Read (const char *file_name)
{
  // A null name must not reach the ifstream constructor or the log stream.
  if (!file_name)
    {
      FATAL << "No input file name given" << std::endl;
      return 0;
    }

  std::ifstream ifs (file_name);
  // Report an unreadable file instead of silently treating it as empty.
  if (!ifs)
    {
      FATAL << "Cannot open input file: " << file_name << std::endl;
      return 0;
    }

  std::string line;
  id_t max_id = 0;
  int line_count = 0;
  while (std::getline (ifs, line))
    {
      ++line_count;
      SparseVector temp;
      const char *const begin = line.c_str ();
      const char *pos = sdf_parse_line (begin, temp);
      // Anything left over that is neither end-of-line nor '#' is an error.
      if (*pos && (*pos != '#'))
        {
          // Reported as line:column, with the column counted from 1.
          FATAL << "Error in input:" << line_count << ':'
                << pos - begin + 1 << std::endl;
          return 0;
        }
      data_set_.push_back (temp);
      if (temp.max_id () > max_id)
        max_id = temp.max_id ();
    }
  return max_id;
}