-
Notifications
You must be signed in to change notification settings - Fork 1
/
Dataset.cpp
123 lines (92 loc) · 2.87 KB
/
Dataset.cpp
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
#include "Dataset.h"

#include <cmath>
/**
 * Generates a flat in-memory dataset of dataset_size * data_size floats drawn
 * from a normal distribution and prints how long the generation took.
 *
 * The random engine is default-constructed on every call and is never seeded
 * here, so each call starts from the engine's default state.
 *
 * @param mean      Mean of the normal distribution.
 * @param variance  Variance of the normal distribution (must be positive).
 * @return The generated values as one contiguous vector.
 */
vector<float> Dataset::generateInMemoryInLine(float mean, float variance) {
    default_random_engine generator;
    // std::normal_distribution takes (mean, standard deviation), not variance,
    // so the variance has to be converted before it is handed over.
    normal_distribution<float> distribution(mean, std::sqrt(variance));

    vector<float> dataset;
    dataset.resize(this->dataset_size * this->data_size);

    // Only the fill loop is timed; the allocation above is excluded.
    double start = omp_get_wtime();
    for (float& value : dataset)
        value = distribution(generator);
    printf_s("GenerateInMemory Dataset = %.16g", omp_get_wtime() - start);
    cout << endl;

    return dataset;
}
/**
 * Reads dataset_size * data_size whitespace-separated floats from the file
 * named by `name` into one flat vector and prints how long the read took.
 *
 * If the file cannot be opened a message is printed and the returned vector
 * keeps its zero-initialised contents.
 *
 * @param COALESCED  false: values are stored in the order they appear in the
 *                   file. true: values are stored transposed, i.e. field `f`
 *                   of record `r` lands at index f * dataset_size + r (the
 *                   same layout generateCPUCUDAdataset writes to its second
 *                   vector).
 * @return A vector of dataset_size * data_size floats.
 */
vector<float> Dataset::readInLineDataset(bool COALESCED) {
    ifstream inFile;
    inFile.open(this->name.c_str());

    vector<float> dataset;
    dataset.resize(this->dataset_size * this->data_size);

    cout << "=========================== ... READING ... ============================" << endl << endl;

    if (inFile.is_open())
    {
        double start = omp_get_wtime();
        if (!COALESCED) {
            for (int a = 0; a < this->dataset_size * this->data_size; a++)
                inFile >> dataset[a];
        }
        else {
            // NOTE(review): assumes the file stores the records one after
            // another (data_size values each), exactly as the non-coalesced
            // branch consumes it -- confirm against the file format.
            // The record index must be the outer loop and the field index the
            // inner one, otherwise field * dataset_size + record can run past
            // the end of the buffer whenever dataset_size > data_size.
            for (int record = 0; record < this->dataset_size; record++) {
                for (int field = 0; field < this->data_size; field++) {
                    inFile >> dataset[field * this->dataset_size + record];
                }
            }
        }
        printf_s("Read Dataset = %.16g", omp_get_wtime() - start);
        cout << endl;
        inFile.close();
    }
    else {
        std::cout << "Can't find input file " << endl;
    }

    return dataset;
}
/**
 * Flattens a vector of float rows into one contiguous row-major vector:
 * element j of row i ends up at index i * row_length + j.
 *
 * The row length is taken from the first row; every row is expected to have
 * at least that many elements. An empty input yields an empty result.
 *
 * @param v  Rows to flatten.
 * @return The flattened values.
 */
vector<float> Dataset::readInLine(vector<vector<float>> v) {
    const std::size_t row_count = v.size();
    // An empty input has no first row to measure, so treat it as zero columns
    // instead of dereferencing v[0].
    const std::size_t row_length = v.empty() ? 0 : v[0].size();

    vector<float> inLine(row_length * row_count);
    cout << "=========================== ... READING ... ============================" << endl << endl;
    for (std::size_t i = 0; i < row_count; i++) {
        for (std::size_t j = 0; j < row_length; j++) {
            inLine[i * row_length + j] = v[i][j];
        }
    }
    cout << endl;
    return inLine;
}
/**
 * Flattens a vector of int rows into one contiguous row-major vector:
 * element j of row i ends up at index i * row_length + j.
 *
 * The row length is taken from the first row; every row is expected to have
 * at least that many elements. An empty input yields an empty result.
 *
 * @param v  Rows to flatten.
 * @return The flattened values.
 */
vector<int> Dataset::readInLine(vector<vector<int>> v) {
    const std::size_t row_count = v.size();
    // An empty input has no first row to measure, so treat it as zero columns
    // instead of dereferencing v[0].
    const std::size_t row_length = v.empty() ? 0 : v[0].size();

    vector<int> inLine(row_length * row_count);
    cout << "=========================== ... READING ... ============================" << endl << endl;
    for (std::size_t i = 0; i < row_count; i++) {
        for (std::size_t j = 0; j < row_length; j++) {
            inLine[i * row_length + j] = v[i][j];
        }
    }
    cout << endl;
    return inLine;
}
/**
 * Produces two flat copies of a row-based dataset.
 *
 * result[0] holds the rows back to back (row-major): element j of row i is at
 * index i * row_length + j.
 * result[1] holds the transposed layout (column-major): element j of row i is
 * at index j * row_count + i.
 *
 * The row length is taken from the first row; every row is expected to have
 * at least that many elements. An empty input yields two empty vectors.
 *
 * @param tmpDataset  Rows to convert.
 * @return A vector of exactly two flat vectors, as described above.
 */
vector<vector<float>> Dataset::generateCPUCUDAdataset( vector<vector<float>> tmpDataset) {
    const std::size_t row_count = tmpDataset.size();
    // Guard the first-row lookup so an empty input does not dereference
    // tmpDataset[0].
    const std::size_t row_length = tmpDataset.empty() ? 0 : tmpDataset[0].size();

    vector<vector<float>> dataset(2);
    dataset[0].resize(row_count * row_length);
    dataset[1].resize(row_count * row_length);

    for (std::size_t i = 0; i < row_count; i++) {
        for (std::size_t j = 0; j < row_length; j++) {
            const float value = tmpDataset[i][j];
            dataset[0][i * row_length + j] = value;  // row-major copy
            dataset[1][j * row_count + i] = value;   // transposed copy
        }
    }

    return dataset;
}
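/*
Layout example for generateCPUCUDAdataset, given four input rows of three values:
[ 1 2 3]
[ 4 5 6]
[ 7 8 9]
[ 1 1 1]
The second (transposed) output vector stores them column by column:
[ 1 4 7 1 ][ 2 5 8 1 ]...
*/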
/**
 * Destructor. Performs no explicit work of its own; members are destroyed by
 * their own destructors.
 */
Dataset::~Dataset() = default;