From edbccdfcaf46f11e631afe98796f3e6e170da5d0 Mon Sep 17 00:00:00 2001
From: Joseph Redmon <pjreddie@gmail.com>
Date: Sun, 26 Oct 2014 05:04:34 +0000
Subject: [PATCH] Maybe something changed?
---
src/data.c | 73 ++++++++++++++++++++++++++++++++++++
1 files changed, 72 insertions(+), 1 deletions(-)
diff --git a/src/data.c b/src/data.c
index 30ee9ec..734fffa 100644
--- a/src/data.c
+++ b/src/data.c
@@ -41,9 +41,11 @@
d.y = make_matrix(n, k);
for(i = 0; i < n; ++i){
- image im = load_image(paths[i], h, w);
+ image im = load_image_color(paths[i], h, w);
d.X.vals[i] = im.data;
d.X.cols = im.h*im.w*im.c;
+ }
+ for(i = 0; i < n; ++i){
fill_truth(paths[i], labels, k, d.y.vals[i]);
}
return d;
@@ -60,6 +62,14 @@
return d;
}
+char **get_labels(char *filename)
+{   /* Reads the entries of filename with get_paths() and returns them converted by list_to_array(). */
+    list *entries = get_paths(filename);
+    char **names = (char **)list_to_array(entries);
+    free_list(entries); /* the list is dropped here; the array is what the caller receives */
+    return names;
+}
+
void free_data(data d)
{
if(!d.shallow){
@@ -84,6 +94,20 @@
return d;
}
+data load_data_random(int n, char **paths, int m, char **labels, int k, int h, int w)
+{
+    /* Loads n images picked at random, with replacement, from the first m entries of paths. */
+    char **random_paths = calloc(n, sizeof(char*));
+    int i;
+    /* rand()%m is undefined for m == 0, and a failed calloc must not be written through. */
+    if(n > 0 && (m <= 0 || !random_paths)){ fprintf(stderr, "load_data_random: no paths to sample or out of memory\n"); exit(1); }
+    for(i = 0; i < n; ++i) random_paths[i] = paths[rand()%m];
+    if(n > 0) printf("%s\n", random_paths[0]); /* echoes the first pick, exactly as before */
+    data d = load_data_image_paths(random_paths, n, labels, k, h, w);
+    free(random_paths); /* releases only the pointer table; the strings still belong to paths */
+    return d;
+}
+
data load_data_image_pathfile_random(char *filename, int n, char **labels, int k, int h, int w)
{
int i;
@@ -131,6 +155,7 @@
d.y = y;
FILE *fp = fopen(filename, "rb");
+ if(!fp) file_error(filename);
for(i = 0; i < 10000; ++i){
unsigned char bytes[3073];
fread(bytes, 1, 3073, fp);
@@ -140,10 +165,56 @@
X.vals[i][j] = (double)bytes[j+1];
}
}
+ translate_data_rows(d, -144);
+ scale_data_rows(d, 1./128);
+ //normalize_data_rows(d);
fclose(fp);
return d;
}
+void get_batch(data d, int n, float *X, float *y)
+{
+    /* Copies n rows of d.X and d.y, each chosen with rand() (repeats possible), back to back into X and y. */
+    for(; n > 0; --n, X += d.X.cols, y += d.y.cols){
+        int row = rand()%d.X.rows;
+        memcpy(X, d.X.vals[row], d.X.cols*sizeof(float));
+        memcpy(y, d.y.vals[row], d.y.cols*sizeof(float));
+    }
+}
+
+data load_all_cifar10()
+{
+    /* Reads data/cifar10/data_batch_1.bin .. data_batch_5.bin, 10000 records each, into one 50000-row data. */
+    data d;
+    d.shallow = 0;
+    int i,j,b;
+    matrix X = make_matrix(50000, 3072);
+    matrix y = make_matrix(50000, 10);
+    d.X = X;
+    d.y = y;
+    for(b = 0; b < 5; ++b){
+        char buff[256];
+        snprintf(buff, sizeof(buff), "data/cifar10/data_batch_%d.bin", b+1);
+        FILE *fp = fopen(buff, "rb");
+        if(!fp) file_error(buff);
+        for(i = 0; i < 10000; ++i){
+            unsigned char bytes[3073]; /* one record: a label byte followed by 3072 value bytes */
+            /* A short read leaves bytes[] uninitialised and a label >= y.cols would index past the */
+            /* end of the row, so both are reported through the same path as a failed fopen. */
+            if(fread(bytes, 1, 3073, fp) != 3073 || bytes[0] >= y.cols) file_error(buff);
+            int class = bytes[0];
+            y.vals[i+b*10000][class] = 1; /* mark the label's column for this row */
+            for(j = 0; j < X.cols; ++j){
+                X.vals[i+b*10000][j] = (double)bytes[j+1];
+            }
+        }
+        fclose(fp);
+    }
+    translate_data_rows(d, -144); /* NOTE(review): presumably shifts every value by -144 - confirm */
+    scale_data_rows(d, 1./128); /* NOTE(review): presumably multiplies every value by 1/128 - confirm */
+    return d;
+}
+
void randomize_data(data d)
{
int i;
--
Gitblit v1.10.0