-
Notifications
You must be signed in to change notification settings - Fork 0
/
format_mnist.cc
54 lines (42 loc) · 1.27 KB
/
format_mnist.cc
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
#include <cstdlib>
#include <fstream>
#include <iostream>
#include <string>
// Splits an MNIST feature/label file pair into one CSV file per digit.
//
// Usage: <program> <feature_file> <label_file> <num_examples>
//
// For each of the first num_examples examples, one row is appended to
// mnist_digit_<label>.csv in the current directory. A row holds a binary class
// (1 if the digit is < 5, otherwise 0) followed by the 28*28 pixel values,
// with every field terminated by a comma.
//
// Returns 0 on success, and 1 on a wrong argument count, a file that cannot be
// opened, or input that ends early or contains a label outside 0-9.
int main(int argc, char** argv) {
  constexpr int kNumDigits = 10;
  constexpr int kFeaturePreambleBytes = 16;
  constexpr int kLabelPreambleBytes = 8;
  constexpr int kPixelsPerImage = 28 * 28;

  if (argc != 4) {
    std::cerr << "Must provide features, labels, and number of examples\n";
    return 1;
  }
  const int num_examples = std::atoi(argv[3]);

  // The inputs are raw bytes, so open them in binary mode to keep the
  // platform from translating any byte values while reading.
  std::ifstream feature_file(argv[1], std::ios::binary);
  if (!feature_file) {
    std::cerr << "Could not open feature file " << argv[1] << "\n";
    return 1;
  }
  std::ifstream label_file(argv[2], std::ios::binary);
  if (!label_file) {
    std::cerr << "Could not open label file " << argv[2] << "\n";
    return 1;
  }

  // One output file for every digit 0-9 (all ten, including digit 9).
  std::ofstream digit_files[kNumDigits];
  for (int digit = 0; digit < kNumDigits; ++digit) {
    const std::string path = "mnist_digit_" + std::to_string(digit) + ".csv";
    digit_files[digit].open(path);
    if (!digit_files[digit]) {
      std::cerr << "Could not open output file " << path << "\n";
      return 1;
    }
  }

  // read over the preamble of the feature file
  feature_file.ignore(kFeaturePreambleBytes);
  // read over the preamble of the label file
  label_file.ignore(kLabelPreambleBytes);

  unsigned char pixels[kPixelsPerImage];
  for (int i = 0; i < num_examples; ++i) {
    // get() returns a negative value at end of file; both that and any byte
    // above 9 must be rejected before the label is used as an array index.
    const int label = label_file.get();
    if (label < 0 || label >= kNumDigits) {
      std::cerr << "Label file ended early or holds an invalid label at example "
                << i << "\n";
      return 1;
    }

    // Read the whole image before writing anything so that a truncated
    // feature file never leaves a partial row in the output.
    if (!feature_file.read(reinterpret_cast<char*>(pixels), kPixelsPerImage)) {
      std::cerr << "Feature file ended early at example " << i << "\n";
      return 1;
    }

    std::ofstream& out = digit_files[label];
    // first output the label. Divide into < 5 and >= 5.
    out << static_cast<int>(label < 5) << ",";
    // each image is 28*28
    for (int j = 0; j < kPixelsPerImage; ++j) {
      out << static_cast<int>(pixels[j]) << ",";
    }
    // '\n' rather than std::endl: no need to flush after every row.
    out << '\n';
  }
  return 0;
}