| | |
| | | for(y = 0; y < b.h; ++y){ |
| | | for(x = 0; x < b.w; ++x){ |
| | | float val = get_pixel_extend(a, x - border, y - border, k); |
| | | if(x - border < 0 || x - border >= a.w || y - border < 0 || y - border >= a.h) val = 1; |
| | | set_pixel(b, x, y, k, val); |
| | | } |
| | | } |
| | |
| | | return c; |
| | | } |
| | | |
| | | image get_label(image *characters, char *string) |
| | | image get_label(image **characters, char *string, int size) |
| | | { |
| | | if(size > 7) size = 7; |
| | | image label = make_empty_image(0,0,0); |
| | | while(*string){ |
| | | image l = characters[(int)*string]; |
| | | image n = tile_images(label, l, -4); |
| | | image l = characters[size][(int)*string]; |
| | | image n = tile_images(label, l, -size - 1 + (size+1)/2); |
| | | free_image(label); |
| | | label = n; |
| | | ++string; |
| | |
| | | |
| | | void draw_label(image a, int r, int c, image label, const float *rgb) |
| | | { |
| | | float ratio = (float) label.w / label.h; |
| | | int h = a.h * .04; |
| | | h = label.h; |
| | | h = a.h * .06; |
| | | int w = ratio * h; |
| | | image rl = resize_image(label, w, h); |
| | | int w = label.w; |
| | | int h = label.h; |
| | | if (r - h >= 0) r = r - h; |
| | | |
| | | int i, j, k; |
| | | for(j = 0; j < h && j + r < a.h; ++j){ |
| | | for(i = 0; i < w && i + c < a.w; ++i){ |
| | | for(k = 0; k < label.c; ++k){ |
| | | float val = get_pixel(rl, i, j, k); |
| | | float val = get_pixel(label, i, j, k); |
| | | set_pixel(a, i+c, j+r, k, rgb[k] * val); |
| | | } |
| | | } |
| | | } |
| | | free_image(rl); |
| | | } |
| | | |
| | | void draw_box(image a, int x1, int y1, int x2, int y2, float r, float g, float b) |
| | |
| | | } |
| | | } |
| | | |
| | | image *load_alphabet() |
| | | image **load_alphabet() |
| | | { |
| | | int i; |
| | | image *alphabet = calloc(128, sizeof(image)); |
| | | for(i = 32; i < 127; ++i){ |
| | | char buff[256]; |
| | | sprintf(buff, "data/labels/%d.png", i); |
| | | alphabet[i] = load_image_color(buff, 0, 0); |
| | | int i, j; |
| | | const int nsize = 8; |
| | | image **alphabets = calloc(nsize, sizeof(image)); |
| | | for(j = 0; j < nsize; ++j){ |
| | | alphabets[j] = calloc(128, sizeof(image)); |
| | | for(i = 32; i < 127; ++i){ |
| | | char buff[256]; |
| | | sprintf(buff, "data/labels/%d_%d.png", i, j); |
| | | alphabets[j][i] = load_image_color(buff, 0, 0); |
| | | } |
| | | } |
| | | return alphabet; |
| | | return alphabets; |
| | | } |
| | | |
| | | void draw_detections(image im, int num, float thresh, box *boxes, float **probs, char **names, image *alphabet, int classes) |
| | | void draw_detections(image im, int num, float thresh, box *boxes, float **probs, char **names, image **alphabet, int classes) |
| | | { |
| | | int i; |
| | | |
| | |
| | | int class = max_index(probs[i], classes); |
| | | float prob = probs[i][class]; |
| | | if(prob > thresh){ |
| | | //int width = pow(prob, 1./2.)*30+1; |
| | | |
| | | int width = im.h * .012; |
| | | |
| | | if(0){ |
| | | width = pow(prob, 1./2.)*10+1; |
| | | alphabet = 0; |
| | | } |
| | | |
| | | printf("%s: %.0f%%\n", names[class], prob*100); |
| | | int offset = class*1 % classes; |
| | | int offset = class*123457 % classes; |
| | | float red = get_color(2,offset,classes); |
| | | float green = get_color(1,offset,classes); |
| | | float blue = get_color(0,offset,classes); |
| | |
| | | |
| | | draw_box_width(im, left, top, right, bot, width, red, green, blue); |
| | | if (alphabet) { |
| | | image label = get_label(alphabet, names[class]); |
| | | image label = get_label(alphabet, names[class], (im.h*.03)/10); |
| | | draw_label(im, top + width, left, label, rgb); |
| | | } |
| | | } |
| | | } |
| | | } |
| | | |
| | | #ifdef OPENCV |
| | | void draw_detections_cv(IplImage* show_img, int num, float thresh, box *boxes, float **probs, char **names, image **alphabet, int classes) |
| | | { |
| | | int i; |
| | | |
| | | for (i = 0; i < num; ++i) { |
| | | int class = max_index(probs[i], classes); |
| | | float prob = probs[i][class]; |
| | | if (prob > thresh) { |
| | | |
| | | int width = show_img->height * .012; |
| | | |
| | | if (0) { |
| | | width = pow(prob, 1. / 2.) * 10 + 1; |
| | | alphabet = 0; |
| | | } |
| | | |
| | | printf("%s: %.0f%%\n", names[class], prob * 100); |
| | | int offset = class * 123457 % classes; |
| | | float red = get_color(2, offset, classes); |
| | | float green = get_color(1, offset, classes); |
| | | float blue = get_color(0, offset, classes); |
| | | float rgb[3]; |
| | | |
| | | //width = prob*20+2; |
| | | |
| | | rgb[0] = red; |
| | | rgb[1] = green; |
| | | rgb[2] = blue; |
| | | box b = boxes[i]; |
| | | |
| | | int left = (b.x - b.w / 2.)*show_img->width; |
| | | int right = (b.x + b.w / 2.)*show_img->width; |
| | | int top = (b.y - b.h / 2.)*show_img->height; |
| | | int bot = (b.y + b.h / 2.)*show_img->height; |
| | | |
| | | if (left < 0) left = 0; |
| | | if (right > show_img->width - 1) right = show_img->width - 1; |
| | | if (top < 0) top = 0; |
| | | if (bot > show_img->height - 1) bot = show_img->height - 1; |
| | | |
| | | float const font_size = show_img->height / 1000.F; |
| | | CvPoint pt1, pt2, pt_text, pt_text_bg1, pt_text_bg2; |
| | | pt1.x = left; |
| | | pt1.y = top; |
| | | pt2.x = right; |
| | | pt2.y = bot; |
| | | pt_text.x = left; |
| | | pt_text.y = top - 12; |
| | | pt_text_bg1.x = left; |
| | | pt_text_bg1.y = top - (10+25*font_size); |
| | | pt_text_bg2.x = right; |
| | | pt_text_bg2.y = top; |
| | | CvScalar color; |
| | | color.val[0] = red * 256; |
| | | color.val[1] = green * 256; |
| | | color.val[2] = blue * 256; |
| | | |
| | | cvRectangle(show_img, pt1, pt2, color, width, 8, 0); |
| | | |
| | | cvRectangle(show_img, pt_text_bg1, pt_text_bg2, color, width, 8, 0); |
| | | cvRectangle(show_img, pt_text_bg1, pt_text_bg2, color, CV_FILLED, 8, 0); // filled |
| | | CvScalar black_color; |
| | | black_color.val[0] = 0; |
| | | CvFont font; |
| | | cvInitFont(&font, CV_FONT_HERSHEY_COMPLEX, font_size, font_size, 0, font_size*3, 8); |
| | | cvPutText(show_img, names[class], pt_text, &font, black_color); |
| | | } |
| | | } |
| | | } |
| | | #endif |
| | | |
| | | void transpose_image(image im) |
| | | { |
| | | assert(im.w == im.h); |
| | |
| | | cvReleaseImage(&buffer); |
| | | } |
| | | cvShowImage(buff, disp); |
| | | |
| | | cvReleaseImage(&disp); |
| | | } |
| | | |
| | | |
| | | void show_image_cv_ipl(IplImage *disp, const char *name) |
| | | { |
| | | if (disp == NULL) return; |
| | | char buff[256]; |
| | | //sprintf(buff, "%s (%d)", name, windows); |
| | | sprintf(buff, "%s", name); |
| | | cvNamedWindow(buff, CV_WINDOW_NORMAL); |
| | | //cvMoveWindow(buff, 100*(windows%10) + 200*(windows/10), 100*(windows%10)); |
| | | ++windows; |
| | | cvShowImage(buff, disp); |
| | | |
| | | |
| | | { |
| | | CvSize size; |
| | | { |
| | | size.width = disp->width, size.height = disp->height; |
| | | } |
| | | |
| | | static CvVideoWriter* output_video = NULL; // cv::VideoWriter output_video; |
| | | if (output_video == NULL) |
| | | { |
| | | //printf("\n SRC output_video = %p \n", output_video); |
| | | const char* output_name = "test_dnn_out.avi"; |
| | | //output_video = cvCreateVideoWriter(output_name, CV_FOURCC('H', '2', '6', '4'), 25, size, 1); |
| | | output_video = cvCreateVideoWriter(output_name, CV_FOURCC('D', 'I', 'V', 'X'), 25, size, 1); |
| | | //output_video = cvCreateVideoWriter(output_name, CV_FOURCC('M', 'J', 'P', 'G'), 25, size, 1); |
| | | //printf("\n cvCreateVideoWriter, DST output_video = %p \n", output_video); |
| | | } |
| | | |
| | | cvWriteFrame(output_video, disp); // comment this line to improve FPS !!! |
| | | printf("\n cvWriteFrame \n"); |
| | | } |
| | | |
| | | cvReleaseImage(&disp); |
| | | } |
| | | #endif |
| | | |
| | | void show_image(image p, const char *name) |
| | |
| | | return im; |
| | | } |
| | | |
| | | image get_image_from_stream_resize(CvCapture *cap, int w, int h, IplImage** in_img) |
| | | { |
| | | IplImage* src = cvQueryFrame(cap); |
| | | if (!src) return make_empty_image(0, 0, 0); |
| | | IplImage* new_img = cvCreateImage(cvSize(w, h), IPL_DEPTH_8U, 3); |
| | | *in_img = cvCreateImage(cvSize(src->width, src->height), IPL_DEPTH_8U, 3); |
| | | cvResize(src, *in_img, CV_INTER_LINEAR); |
| | | cvResize(src, new_img, CV_INTER_LINEAR); |
| | | image im = ipl_to_image(new_img); |
| | | cvReleaseImage(&new_img); |
| | | rgbgr_image(im); |
| | | return im; |
| | | } |
| | | |
| | | void save_image_jpg(image p, const char *name) |
| | | { |
| | | image copy = copy_image(p); |
| | |
| | | } |
| | | #endif |
| | | |
| | | void save_image(image im, const char *name) |
| | | void save_image_png(image im, const char *name) |
| | | { |
| | | #ifdef OPENCV |
| | | save_image_jpg(im, name); |
| | | #else |
| | | char buff[256]; |
| | | //sprintf(buff, "%s (%d)", name, windows); |
| | | sprintf(buff, "%s.png", name); |
| | |
| | | int success = stbi_write_png(buff, im.w, im.h, im.c, data, im.w*im.c); |
| | | free(data); |
| | | if(!success) fprintf(stderr, "Failed to write image %s\n", buff); |
| | | } |
| | | |
| | | void save_image(image im, const char *name) |
| | | { |
| | | #ifdef OPENCV |
| | | save_image_jpg(im, name); |
| | | #else |
| | | save_image_png(im, name); |
| | | #endif |
| | | } |
| | | |
| | |
| | | #endif |
| | | } |
| | | |
| | | image resize_max(image im, int max) |
| | | { |
| | | int w = im.w; |
| | | int h = im.h; |
| | | if(w > h){ |
| | | h = (h * max) / w; |
| | | w = max; |
| | | } else { |
| | | w = (w * max) / h; |
| | | h = max; |
| | | } |
| | | if(w == im.w && h == im.h) return im; |
| | | image resized = resize_image(im, w, h); |
| | | return resized; |
| | | } |
| | | |
| | | image resize_min(image im, int min) |
| | | { |
| | | int w = im.w; |
| | |
| | | show_image(c4, "C4"); |
| | | #ifdef OPENCV |
| | | while(1){ |
| | | image aug = random_augment_image(im, 0, 320, 448, 320, .75); |
| | | image aug = random_augment_image(im, 0, .75, 320, 448, 320); |
| | | show_image(aug, "aug"); |
| | | free_image(aug); |
| | | |