forked from btgraham/SparseConvNet-archived
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathSpatiallySparseDataset.cpp
More file actions
89 lines (83 loc) · 2.73 KB
/
SpatiallySparseDataset.cpp
File metadata and controls
89 lines (83 loc) · 2.73 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
#include "SpatiallySparseDataset.h"
#include <algorithm>
#include <iostream>
#include <chrono>
// Print a short human-readable description of the dataset to std::cout:
// its name, the number of pictures held, the class and feature counts, and
// the batch-type name looked up in batchTypeNames. Each line is terminated
// with std::endl, so the stream is flushed after every field.
void SpatiallySparseDataset::summary() {
  std::cout << "Name: " << name << std::endl
            << "nPictures: " << pictures.size() << std::endl
            << "nClasses: " << nClasses << std::endl
            << "nFeatures: " << nFeatures << std::endl
            << "Type: " << batchTypeNames[type] << std::endl;
}
// Split off a validation set.
//
// Shuffles this dataset's pictures with a fixed-seed generator (seed 123, so
// the split is reproducible), then moves a fraction p of them from the back
// of this dataset into a new dataset, which is returned. The new dataset
// copies nClasses/nFeatures from this one and has type TESTBATCH.
//
// Side effects on *this: the pictures are reordered, the moved entries are
// removed, and " minus Validation set" is appended to the name.
//
// p is the fraction of pictures to move. The resulting count is truncated
// towards zero and clamped to [0, pictures.size()]: a non-positive or NaN p
// moves nothing, and p >= 1 moves everything (previously p > 1 popped from an
// empty vector).
SpatiallySparseDataset SpatiallySparseDataset::extractValidationSet(float p) {
  SpatiallySparseDataset val;
  val.name = name + std::string(" Validation set");
  name = name + std::string(" minus Validation set");
  val.nClasses = nClasses;
  val.nFeatures = nFeatures;
  val.type = TESTBATCH;

  std::mt19937 gen(123);
  std::shuffle(pictures.begin(), pictures.end(), gen);

  // Number of pictures to move; the comparison p > 0 is false for NaN.
  std::size_t size = 0;
  if (p > 0) {
    size = (p >= 1) ? pictures.size()
                    : static_cast<std::size_t>(pictures.size() * p);
  }
  // Guard against float rounding pushing the count past the end.
  size = std::min<std::size_t>(size, pictures.size());

  val.pictures.reserve(size);
  // Take from the back so each removal is O(1).
  for (; size > 0; --size) {
    val.pictures.push_back(pictures.back());
    pictures.pop_back();
  }
  return val;
}
void SpatiallySparseDataset::subsetOfClasses(std::vector<int> activeClasses) {
nClasses=activeClasses.size();
std::vector<Picture*> p=pictures;
pictures.clear();
for (int i=0;i<p.size();++i) {
std::vector<int>::iterator it;
it = find (activeClasses.begin(), activeClasses.end(), p[i]->label);
if (it != activeClasses.end()) {
p[i]->label=it-activeClasses.begin();
pictures.push_back(p[i]);
//std::cout << pictures.size() << " " << p[i]->identify() << std::endl;
} else
delete p[i];
}
}
// Build a class-balanced subset holding up to n pictures of each class.
//
// Assumes there are at least n pictures of each class in the dataset; if a
// class has fewer, the scan simply runs to the end and that class stays short.
// Picture labels are used directly as indices into a per-class counter of
// length nClasses.
//
// Side effect: this dataset's own pictures are shuffled first. The returned
// dataset copies the picture entries (no deep copy is made here) and inherits
// nFeatures, nClasses and type, with " subset" appended to the name.
SpatiallySparseDataset SpatiallySparseDataset::balencedSubset(int n) {
  SpatiallySparseDataset bs;
  bs.type = type;
  bs.nClasses = nClasses;
  bs.nFeatures = nFeatures;
  bs.name = name + std::string(" subset");

  shuffle();
  auto visitOrder = rng.permutation(pictures.size());

  std::vector<int> seenPerClass(nClasses);
  int fullClasses = 0;
  // Stop early once every class has reached its quota of n.
  for (int k = 0; k < pictures.size() and fullClasses < nClasses; k++) {
    auto candidate = pictures[visitOrder[k]];
    int &tally = seenPerClass[candidate->label];
    const int before = tally;
    ++tally;  // counted even when the picture is not taken
    if (before >= n)
      continue;  // this class already has its n pictures
    if (tally == n)
      ++fullClasses;
    bs.pictures.push_back(candidate);
  }
  return bs;
}
// Build a new dataset from a selection of this dataset's pictures.
//
// The indices come from rng.NchooseM(pictures.size(), n) -- presumably n
// distinct indices into `pictures`; confirm against the RNG class. The picture
// entries are copied into the result (no deep copy is made here), which also
// inherits nFeatures, nClasses and type, with " subset" appended to the name.
// This dataset itself is not modified.
SpatiallySparseDataset SpatiallySparseDataset::subset(int n) {
  SpatiallySparseDataset sample;
  sample.type = type;
  sample.nClasses = nClasses;
  sample.nFeatures = nFeatures;
  sample.name = name + std::string(" subset");

  auto chosen = rng.NchooseM(pictures.size(), n);
  for (auto index : chosen)
    sample.pictures.push_back(pictures[index]);
  return sample;
}
// Randomly reorder the pictures in place, drawing randomness from the
// dataset's own generator (rng.gen).
void SpatiallySparseDataset::shuffle() {
  auto first = pictures.begin();
  auto last = pictures.end();
  std::shuffle(first, last, rng.gen);
}
// Grow the dataset so that each original picture entry appears `reps` times.
//
// The original block of entries is appended (reps - 1) more times, in order,
// so reps <= 1 leaves the dataset unchanged. Entries are copied as stored in
// `pictures`; no new pictures are created here.
void SpatiallySparseDataset::repeatSamples(int reps) {
  // Fix the count up front: the vector grows while we append to it.
  const int originalCount = pictures.size();
  int pass = 1;
  while (pass < reps) {
    for (int idx = 0; idx < originalCount; ++idx) {
      auto entry = pictures[idx];
      pictures.push_back(entry);
    }
    ++pass;
  }
}