Improve training performance - batch-norm using cuDNN.

2023-08-10 21:13:14 +03:00 · 2018-03-20 02:16:51 +03:00
parent 2f52cfeb07
commit 537d135feb
12 changed files with 193 additions and 42 deletions
--- a/src/detector.c
+++ b/src/detector.c
@@ -91,7 +91,7 @@ void train_detector(char *datacfg, char *cfgfile, char *weightfile, int *gpus, i
 	args.small_object = l.small_object;
    args.d = &buffer;
    args.type = DETECTION_DATA;
-	args.threads = 8;	// 64
+	args.threads = 64;	// 8

    args.angle = net.angle;
    args.exposure = net.exposure;
@@ -1031,6 +1031,7 @@ void test_detector(char *datacfg, char *cfgfile, char *weightfile, char *filenam
        }
        image im = load_image_color(input,0,0);
        image sized = resize_image(im, net.w, net.h);
+		//image sized = letterbox_image(im, net.w, net.h);
        layer l = net.layers[net.n-1];

        box *boxes = calloc(l.w*l.h*l.n, sizeof(box));