darknet/src/region_layer.c

#include "region_layer.h"
#include "activations.h"
#include "blas.h"
#include "box.h"
#include "cuda.h"
#include "utils.h"
#include <stdio.h>
#include <assert.h>
#include <string.h>
#include <stdlib.h>

/*
 * Construct a REGION layer for a w x h grid with n predictors per cell.
 *
 * Each predictor emits (classes + coords + 1) values, so one image produces
 * h*w*n*(classes + coords + 1) outputs; the layer has as many inputs as
 * outputs. Host buffers for output/delta are zero-initialised and sized for
 * the whole batch. Every bias (two per predictor) starts at .5.
 *
 * Side effects: prints "Region Layer" to stderr and reseeds rand() with 0.
 */
region_layer make_region_layer(int batch, int w, int h, int n, int classes, int coords)
{
    region_layer l = {0};
    int num_biases = n*2;
    int k;

    l.type = REGION;

    /* Grid geometry and per-predictor layout. */
    l.batch = batch;
    l.w = w;
    l.h = h;
    l.n = n;
    l.classes = classes;
    l.coords = coords;

    /* Sizes: the layer is shape preserving (inputs == outputs). */
    l.outputs = h*w*n*(classes + coords + 1);
    l.inputs = l.outputs;
    /* 30 ground-truth slots of 5 floats each per image. */
    l.truths = 30*(5);

    /* Host-side storage. */
    l.cost = calloc(1, sizeof(float));
    l.biases = calloc(num_biases, sizeof(float));
    l.bias_updates = calloc(num_biases, sizeof(float));
    l.delta = calloc(batch*l.outputs, sizeof(float));
    l.output = calloc(batch*l.outputs, sizeof(float));

    for(k = 0; k < num_biases; ++k){
        l.biases[k] = .5;
    }

    /* Entry points used by the network driver. */
    l.forward = forward_region_layer;
    l.backward = backward_region_layer;
#ifdef GPU
    l.forward_gpu = forward_region_layer_gpu;
    l.backward_gpu = backward_region_layer_gpu;
    /* Device mirrors are created from the (zeroed) host buffers. */
    l.output_gpu = cuda_make_array(l.output, batch*l.outputs);
    l.delta_gpu = cuda_make_array(l.delta, batch*l.outputs);
#endif

    fprintf(stderr, "Region Layer\n");
    srand(0);

    return l;
}

#define DOABS 1
/*
 * Decode the box stored at x[index .. index+3] for predictor n of grid cell
 * (column i, row j) on a w x h grid.
 *
 * Centre: cell offset plus the logistic of the raw value, divided by the grid
 * size. Size: exp(raw) times the predictor's bias pair (biases[2n],
 * biases[2n+1]); when DOABS is set the size is additionally divided by the
 * grid dimensions.
 */
box get_region_box(float *x, float *biases, int n, int index, int i, int j, int w, int h)
{
    box b;
    float *raw = x + index;
    float *prior = biases + 2*n;

    b.x = (i + logistic_activate(raw[0])) / w;
    b.y = (j + logistic_activate(raw[1])) / h;

    if(DOABS){
        b.w = exp(raw[2]) * prior[0] / w;
        b.h = exp(raw[3]) * prior[1] / h;
    } else {
        b.w = exp(raw[2]) * prior[0];
        b.h = exp(raw[3]) * prior[1];
    }
    return b;
}

/*
 * Write the four box-coordinate gradients for one predictor into
 * delta[index .. index+3] and return the IOU between the current prediction
 * and `truth`.
 *
 * Targets are expressed in the same parameterisation get_region_box decodes:
 * x/y as an offset inside cell (i, j), w/h as the log of the ratio between the
 * truth size and the predictor's bias (truth size multiplied by the grid size
 * first when DOABS is set). The x/y terms are multiplied by the logistic
 * gradient of the activated value; the w/h terms are plain differences.
 * All four terms are multiplied by `scale`.
 */
float delta_region_box(box truth, float *x, float *biases, int n, int index, int i, int j, int w, int h, float *delta, float scale)
{
    box pred = get_region_box(x, biases, n, index, i, j, w, h);
    float overlap = box_iou(pred, truth);

    float prior_w = biases[2*n];
    float prior_h = biases[2*n + 1];

    float tx = (truth.x*w - i);
    float ty = (truth.y*h - j);
    float tw;
    float th;
    if(DOABS){
        tw = log(truth.w*w / prior_w);
        th = log(truth.h*h / prior_h);
    } else {
        tw = log(truth.w / prior_w);
        th = log(truth.h / prior_h);
    }

    float sx = logistic_activate(x[index + 0]);
    delta[index + 0] = scale * (tx - sx) * logistic_gradient(sx);

    float sy = logistic_activate(x[index + 1]);
    delta[index + 1] = scale * (ty - sy) * logistic_gradient(sy);

    delta[index + 2] = scale * (tw - x[index + 2]);
    delta[index + 3] = scale * (th - x[index + 3]);
    return overlap;
}

/*
 * Fill the class-score gradients starting at delta[index] for a prediction
 * whose true class is `class`, and add the probability assigned to that class
 * to *avg_cat.
 *
 * Without a hierarchy: target is 1 for `class` and 0 for every other of the
 * `classes` entries; *avg_cat gains output[index + class].
 * With a hierarchy: walk from `class` up through hier->parent until a negative
 * id is reached. At each node every member of the node's group gets target 0,
 * then the node itself gets target 1; *avg_cat gains the product of the
 * outputs along the walked path.
 */
void delta_region_class(float *output, float *delta, int index, int class, int classes, tree *hier, float scale, float *avg_cat)
{
    if(!hier){
        int c;
        for(c = 0; c < classes; ++c){
            float target = (c == class) ? 1 : 0;
            delta[index + c] = scale * (target - output[index + c]);
            if(c == class) *avg_cat += output[index + c];
        }
        return;
    }

    float path_prob = 1;
    int node;
    for(node = class; node >= 0; node = hier->parent[node]){
        int group = hier->group[node];
        int first = hier->group_offset[group];
        int members = hier->group_size[group];
        int m;

        path_prob *= output[index + node];
        /* Push the whole sibling group towards 0 ... */
        for(m = 0; m < members; ++m){
            delta[index + first + m] = scale * (0 - output[index + first + m]);
        }
        /* ... then overwrite the node on the true path with a target of 1. */
        delta[index + node] = scale * (1 - output[index + node]);
    }
    *avg_cat += path_prob;
}

float logit(float x)
{
    return log(x/(1.-x));
}

/* Returns 1 when x compares unequal to itself (true only for NaN), else 0. */
float tisnan(float x)
{
    return (x == x) ? 0 : 1;
}

/* Forward declaration; softmax_tree is defined outside this file. */
void softmax_tree(float *input, int batch, int inputs, float temp, tree *hierarchy, float *output);
/*
 * CPU forward pass of the region layer.
 *
 * Inference part (always runs):
 *   - copies state.input into l.output and passes it through reorg();
 *   - applies the logistic function to the value at offset 4 of every
 *     prediction (the confidence/objectness slot);
 *   - normalises the class scores starting at offset 5 with softmax_tree
 *     (when l.softmax_tree is set) or softmax (when l.softmax is set).
 *
 * Training part (only when state.train is non-zero):
 *   - clears l.delta, then fills it with objectness, box and class gradients
 *     computed against state.truth (up to 30 boxes of 5 floats per image);
 *   - passes l.delta back through reorg(), stores the squared magnitude of
 *     l.delta in *l.cost and prints running statistics to stdout.
 *
 * NOTE(review): the fixed offsets 4 and 5 agree with `size` only when
 * l.coords == 4 -- confirm that callers never use another value.
 */
void forward_region_layer(const region_layer l, network_state state)
{
    int i,j,b,t,n;
    /* Number of floats per predictor. */
    int size = l.coords + l.classes + 1;
    memcpy(l.output, state.input, l.outputs*l.batch*sizeof(float));
    /* presumably rearranges the buffer so each predictor's `size` values are
     * contiguous -- TODO confirm against reorg()'s definition */
    reorg(l.output, l.w*l.h, size*l.n, l.batch, 1);
    for (b = 0; b < l.batch; ++b){
        for(i = 0; i < l.h*l.w*l.n; ++i){
            int index = size*i + b*l.outputs;
            /* Squash the objectness slot in place. */
            l.output[index + 4] = logistic_activate(l.output[index + 4]);
        }
    }


    if (l.softmax_tree){
#ifdef GPU
        /* GPU build: round-trip through the device so each hierarchy group can
         * be normalised with softmax_gpu; `count` is the offset of the current
         * group inside a prediction (class scores start at 5). */
        cuda_push_array(l.output_gpu, l.output, l.batch*l.outputs);
        int i;
        int count = 5;
        for (i = 0; i < l.softmax_tree->groups; ++i) {
            int group_size = l.softmax_tree->group_size[i];
            softmax_gpu(l.output_gpu+count, group_size, l.classes + 5, l.w*l.h*l.n*l.batch, 1, l.output_gpu + count);
            count += group_size;
        }
        cuda_pull_array(l.output_gpu, l.output, l.batch*l.outputs);
#else
        /* CPU build: normalise each prediction's class scores in place. */
        for (b = 0; b < l.batch; ++b){
            for(i = 0; i < l.h*l.w*l.n; ++i){
                int index = size*i + b*l.outputs;
                softmax_tree(l.output + index + 5, 1, 0, 1, l.softmax_tree, l.output + index + 5);
            }
        }
#endif
    } else if (l.softmax){
        /* Flat softmax over the l.classes scores of each prediction. */
        for (b = 0; b < l.batch; ++b){
            for(i = 0; i < l.h*l.w*l.n; ++i){
                int index = size*i + b*l.outputs;
                softmax(l.output + index + 5, l.classes, 1, l.output + index + 5);
            }
        }
    }
    /* Everything below only produces gradients and statistics. */
    if(!state.train) return;
    memset(l.delta, 0, l.outputs * l.batch * sizeof(float));
    /* Running sums for the statistics line printed at the end. */
    float avg_iou = 0;
    float recall = 0;
    float avg_cat = 0;
    float avg_obj = 0;
    float avg_anyobj = 0;
    int count = 0;
    int class_count = 0;
    *(l.cost) = 0;
    for (b = 0; b < l.batch; ++b) {
        /* Pass 1: visit every predictor of every cell and set its default
         * objectness gradient. */
        for (j = 0; j < l.h; ++j) {
            for (i = 0; i < l.w; ++i) {
                for (n = 0; n < l.n; ++n) {
                    int index = size*(j*l.w*l.n + i*l.n + n) + b*l.outputs;
                    box pred = get_region_box(l.output, l.biases, n, index, i, j, l.w, l.h);
                    float best_iou = 0;
                    int best_class = -1;
                    /* Best overlap of this prediction with any truth box of
                     * image b; a truth entry with x == 0 ends the list. */
                    for(t = 0; t < 30; ++t){
                        box truth = float_to_box(state.truth + t*5 + b*l.truths);
                        if(!truth.x) break;
                        float iou = box_iou(pred, truth);
                        if (iou > best_iou) {
                            best_class = state.truth[t*5 + b*l.truths + 4];
                            best_iou = iou;
                        }
                    }
                    avg_anyobj += l.output[index + 4];
                    /* Default: push objectness towards 0. */
                    l.delta[index + 4] = l.noobject_scale * ((0 - l.output[index + 4]) * logistic_gradient(l.output[index + 4]));
                    /* classfix == -1: push objectness towards the best IOU instead. */
                    if(l.classfix == -1) l.delta[index + 4] = l.noobject_scale * ((best_iou - l.output[index + 4]) * logistic_gradient(l.output[index + 4]));
                    else{
                        /* Overlap above l.thresh: no objectness penalty; with
                         * classfix > 0 also emit a class gradient towards the
                         * best-overlapping truth's class (weighted by the
                         * objectness output when classfix == 2). */
                        if (best_iou > l.thresh) {
                            l.delta[index + 4] = 0;
                            if(l.classfix > 0){
                                delta_region_class(l.output, l.delta, index + 5, best_class, l.classes, l.softmax_tree, l.class_scale*(l.classfix == 2 ? l.output[index + 4] : 1), &avg_cat);
                                ++class_count;
                            }
                        }
                    }

                    /* While *state.net.seen is below 12800, pull every box
                     * towards a cell-centred box with the predictor's bias
                     * size, using a small scale of .01. (seen is presumably
                     * the number of training images processed -- confirm.) */
                    if(*(state.net.seen) < 12800){
                        box truth = {0};
                        truth.x = (i + .5)/l.w;
                        truth.y = (j + .5)/l.h;
                        truth.w = l.biases[2*n];
                        truth.h = l.biases[2*n+1];
                        if(DOABS){
                            truth.w = l.biases[2*n]/l.w;
                            truth.h = l.biases[2*n+1]/l.h;
                        }
                        delta_region_box(truth, l.output, l.biases, n, index, i, j, l.w, l.h, l.delta, .01);
                    }
                }
            }
        }
        /* Pass 2: for every truth box of image b, pick one predictor in the
         * cell containing the box centre and overwrite its gradients. */
        for(t = 0; t < 30; ++t){
            box truth = float_to_box(state.truth + t*5 + b*l.truths);

            if(!truth.x) break;
            float best_iou = 0;
            int best_index = 0;
            int best_n = 0;
            /* Cell containing the truth centre (float -> int truncation).
             * NOTE(review): truth.x or truth.y equal to 1 would yield
             * i == l.w / j == l.h; confirm the data loader excludes that. */
            i = (truth.x * l.w);
            j = (truth.y * l.h);
            //printf("%d %f %d %f\n", i, truth.x*l.w, j, truth.y*l.h);
            /* Compare shapes only: both boxes are moved to the origin. */
            box truth_shift = truth;
            truth_shift.x = 0;
            truth_shift.y = 0;
            //printf("index %d %d\n",i, j);
            for(n = 0; n < l.n; ++n){
                int index = size*(j*l.w*l.n + i*l.n + n) + b*l.outputs;
                box pred = get_region_box(l.output, l.biases, n, index, i, j, l.w, l.h);
                /* bias_match: match against the bias shape rather than the
                 * currently predicted shape. */
                if(l.bias_match){
                    pred.w = l.biases[2*n];
                    pred.h = l.biases[2*n+1];
                    if(DOABS){
                        pred.w = l.biases[2*n]/l.w;
                        pred.h = l.biases[2*n+1]/l.h;
                    }
                }
                //printf("pred: (%f, %f) %f x %f\n", pred.x, pred.y, pred.w, pred.h);
                pred.x = 0;
                pred.y = 0;
                float iou = box_iou(pred, truth_shift);
                if (iou > best_iou){
                    best_index = index;
                    best_iou = iou;
                    best_n = n;
                }
            }
            //printf("%d %f (%f, %f) %f x %f\n", best_n, best_iou, truth.x, truth.y, truth.w, truth.h);

            /* If no predictor had a positive IOU, best_index/best_n keep their
             * initial value 0. */
            float iou = delta_region_box(truth, l.output, l.biases, best_n, best_index, i, j, l.w, l.h, l.delta, l.coord_scale);
            if(iou > .5) recall += 1;
            avg_iou += iou;

            //l.delta[best_index + 4] = iou - l.output[best_index + 4];
            avg_obj += l.output[best_index + 4];
            /* Objectness target is 1, or the actual IOU when l.rescore is set. */
            l.delta[best_index + 4] = l.object_scale * (1 - l.output[best_index + 4]) * logistic_gradient(l.output[best_index + 4]);
            if (l.rescore) {
                l.delta[best_index + 4] = l.object_scale * (iou - l.output[best_index + 4]) * logistic_gradient(l.output[best_index + 4]);
            }


            /* Truth class id, optionally remapped through l.map. */
            int class = state.truth[t*5 + b*l.truths + 4];
            if (l.map) class = l.map[class];
            delta_region_class(l.output, l.delta, best_index + 5, class, l.classes, l.softmax_tree, l.class_scale, &avg_cat);
            ++count;
            ++class_count;
        }
    }
    //printf("\n");
    /* Undo the layout change applied to the output at the top (flag 0 vs 1). */
    reorg(l.delta, l.w*l.h, size*l.n, l.batch, 0);
    *(l.cost) = pow(mag_array(l.delta, l.outputs * l.batch), 2);
    /* NOTE(review): when the batch has no truth boxes, count (and possibly
     * class_count) is 0 and these float divisions print nan/inf. */
    printf("Region Avg IOU: %f, Class: %f, Obj: %f, No Obj: %f, Avg Recall: %f,  count: %d\n", avg_iou/count, avg_cat/class_count, avg_obj/count, avg_anyobj/(l.w*l.h*l.n*l.batch), recall/count, count);
}

/*
 * CPU backward pass: hands the gradients stored in l.delta to the previous
 * layer by calling axpy_cpu with coefficient 1 and unit strides on
 * (l.delta, state.delta) over batch*inputs elements (presumably
 * state.delta += l.delta, as in BLAS axpy -- confirm against blas.h).
 */
void backward_region_layer(const region_layer l, network_state state)
{
    int total = l.batch*l.inputs;
    axpy_cpu(total, 1, l.delta, 1, state.delta, 1);
}

/*
 * Convert the layer's raw output into boxes and per-class probabilities.
 *
 * For every predictor (l.w*l.h cells times l.n predictors):
 *   - boxes[index] receives the decoded box scaled by (w, h);
 *   - probs[index][c] receives the class probability, or 0 when it does not
 *     pass `thresh`.
 * Without a hierarchy the probability is objectness * class score and is
 * itself compared against thresh. With l.softmax_tree the scores are first
 * passed through hierarchy_predictions, then scanning from the last class
 * down only the first score above .5 is kept (all others are zeroed in
 * l.output itself) and it is reported when objectness exceeds thresh.
 * When only_objectness is non-zero probs[index][0] is overwritten with the
 * objectness value.
 *
 * Only the first image of l.output is read (no batch offset is applied).
 */
void get_region_boxes(layer l, int w, int h, float thresh, float **probs, box *boxes, int only_objectness)
{
    float *predictions = l.output;
    int stride = l.classes + 5;
    int cells = l.w*l.h;
    int cell, a, c;

    for (cell = 0; cell < cells; ++cell){
        int row = cell / l.w;
        int col = cell % l.w;
        for(a = 0; a < l.n; ++a){
            int index = cell*l.n + a;
            int box_index = index * stride;
            int class_index = box_index + 5;

            /* Objectness lives right after the four box values. */
            float scale = predictions[box_index + 4];
            if(l.classfix == -1 && scale < .5) scale = 0;

            box decoded = get_region_box(predictions, l.biases, a, box_index, col, row, l.w, l.h);
            decoded.x *= w;
            decoded.y *= h;
            decoded.w *= w;
            decoded.h *= h;
            boxes[index] = decoded;

            if(l.softmax_tree){
                float *scores = predictions + class_index;
                int found = 0;

                hierarchy_predictions(scores, l.classes, l.softmax_tree, 0);
                for(c = l.classes - 1; c >= 0; --c){
                    if(!found && scores[c] > .5){
                        found = 1;
                    } else {
                        scores[c] = 0;
                    }
                    probs[index][c] = (scale > thresh) ? scores[c] : 0;
                }
            } else {
                for(c = 0; c < l.classes; ++c){
                    float prob = scale*predictions[class_index + c];
                    probs[index][c] = (prob > thresh) ? prob : 0;
                }
            }

            if(only_objectness){
                probs[index][0] = scale;
            }
        }
    }
}

#ifdef GPU

/*
 * GPU entry point for the forward pass.
 *
 * The computation itself runs on the host: the input (and the truth buffer,
 * when present) are pulled into temporary host arrays, forward_region_layer
 * is run on a copy of `state` that points at those arrays, and the resulting
 * l.output and l.delta are pushed to l.output_gpu / l.delta_gpu. The
 * temporary host arrays are released before returning.
 */
void forward_region_layer_gpu(const region_layer l, network_state state)
{
    /*
       if(!state.train){
       copy_ongpu(l.batch*l.inputs, state.input, 1, l.output_gpu, 1);
       return;
       }
     */

    int num_inputs = l.batch*l.inputs;
    float *host_input = calloc(num_inputs, sizeof(float));
    float *host_truth = 0;

    if(state.truth){
        int num_truth = l.batch*l.truths;
        host_truth = calloc(num_truth, sizeof(float));
        cuda_pull_array(state.truth, host_truth, num_truth);
    }
    cuda_pull_array(state.input, host_input, num_inputs);

    /* Same state (including the train flag), but with host pointers. */
    network_state cpu_state = state;
    cpu_state.truth = host_truth;
    cpu_state.input = host_input;
    forward_region_layer(l, cpu_state);

    cuda_push_array(l.output_gpu, l.output, l.batch*l.outputs);
    cuda_push_array(l.delta_gpu, l.delta, l.batch*l.outputs);

    free(host_input);
    /* free() on a null pointer is a no-op, so no guard is needed. */
    free(host_truth);
}

/*
 * GPU backward pass: calls axpy_ongpu with coefficient 1 and unit strides on
 * (l.delta_gpu, state.delta) over batch*outputs elements (presumably
 * state.delta += l.delta_gpu on the device -- confirm against blas.h).
 */
void backward_region_layer_gpu(region_layer l, network_state state)
{
    int total = l.batch*l.outputs;
    axpy_ongpu(total, 1, l.delta_gpu, 1, state.delta, 1);
    //copy_ongpu(l.batch*l.inputs, l.delta_gpu, 1, state.delta, 1);
}
#endif
some more stuff 2016-08-06 01:27:07 +03:00			`#include "region_layer.h"`
			`#include "activations.h"`
			`#include "blas.h"`
			`#include "box.h"`
			`#include "cuda.h"`
			`#include "utils.h"`
			`#include <stdio.h>`
			`#include <assert.h>`
			`#include <string.h>`
			`#include <stdlib.h>`

			`region_layer make_region_layer(int batch, int w, int h, int n, int classes, int coords)`
			`{`
			`region_layer l = {0};`
			`l.type = REGION;`

			`l.n = n;`
			`l.batch = batch;`
			`l.h = h;`
			`l.w = w;`
			`l.classes = classes;`
			`l.coords = coords;`
			`l.cost = calloc(1, sizeof(float));`
good chance I didn't break anything 2016-09-12 23:55:20 +03:00			`l.biases = calloc(n*2, sizeof(float));`
			`l.bias_updates = calloc(n*2, sizeof(float));`
some more stuff 2016-08-06 01:27:07 +03:00			`l.outputs = h*w*n*(classes + coords + 1);`
			`l.inputs = l.outputs;`
			`l.truths = 30*(5);`
			`l.delta = calloc(batch*l.outputs, sizeof(float));`
			`l.output = calloc(batch*l.outputs, sizeof(float));`
good chance I didn't break anything 2016-09-12 23:55:20 +03:00			`int i;`
			`for(i = 0; i < n*2; ++i){`
			`l.biases[i] = .5;`
			`}`

So I have this new programming paradigm....... 2016-09-25 09:12:54 +03:00			`l.forward = forward_region_layer;`
			`l.backward = backward_region_layer;`
some more stuff 2016-08-06 01:27:07 +03:00			`#ifdef GPU`
So I have this new programming paradigm....... 2016-09-25 09:12:54 +03:00			`l.forward_gpu = forward_region_layer_gpu;`
			`l.backward_gpu = backward_region_layer_gpu;`
some more stuff 2016-08-06 01:27:07 +03:00			`l.output_gpu = cuda_make_array(l.output, batch*l.outputs);`
			`l.delta_gpu = cuda_make_array(l.delta, batch*l.outputs);`
			`#endif`

			`fprintf(stderr, "Region Layer\n");`
			`srand(0);`

			`return l;`
			`}`

:fire: crush. crush. admit. :fire: 2016-11-11 19:48:40 +03:00			`#define DOABS 1`
good chance I didn't break anything 2016-09-12 23:55:20 +03:00			`box get_region_box(float *x, float *biases, int n, int index, int i, int j, int w, int h)`
some more stuff 2016-08-06 01:27:07 +03:00			`{`
			`box b;`
:fire: crush. crush. admit. :fire: 2016-11-11 19:48:40 +03:00			`b.x = (i + logistic_activate(x[index + 0])) / w;`
			`b.y = (j + logistic_activate(x[index + 1])) / h;`
good chance I didn't break anything 2016-09-12 23:55:20 +03:00			`b.w = exp(x[index + 2]) * biases[2*n];`
			`b.h = exp(x[index + 3]) * biases[2*n+1];`
:fire: crush. crush. admit. :fire: 2016-11-11 19:48:40 +03:00			`if(DOABS){`
			`b.w = exp(x[index + 2]) * biases[2*n] / w;`
			`b.h = exp(x[index + 3]) * biases[2*n+1] / h;`
			`}`
some more stuff 2016-08-06 01:27:07 +03:00			`return b;`
			`}`

good chance I didn't break anything 2016-09-12 23:55:20 +03:00			`float delta_region_box(box truth, float *x, float *biases, int n, int index, int i, int j, int w, int h, float *delta, float scale)`
some more stuff 2016-08-06 01:27:07 +03:00			`{`
good chance I didn't break anything 2016-09-12 23:55:20 +03:00			`box pred = get_region_box(x, biases, n, index, i, j, w, h);`
some more stuff 2016-08-06 01:27:07 +03:00			`float iou = box_iou(pred, truth);`

:fire: crush. crush. admit. :fire: 2016-11-11 19:48:40 +03:00			`float tx = (truth.x*w - i);`
			`float ty = (truth.y*h - j);`
good chance I didn't break anything 2016-09-12 23:55:20 +03:00			`float tw = log(truth.w / biases[2*n]);`
			`float th = log(truth.h / biases[2*n + 1]);`
:fire: crush. crush. admit. :fire: 2016-11-11 19:48:40 +03:00			`if(DOABS){`
			`tw = log(truth.w*w / biases[2*n]);`
			`th = log(truth.h*h / biases[2*n + 1]);`
new font strategy 2016-11-06 00:09:21 +03:00			`}`
:fire: crush. crush. admit. :fire: 2016-11-11 19:48:40 +03:00
			`delta[index + 0] = scale * (tx - logistic_activate(x[index + 0])) * logistic_gradient(logistic_activate(x[index + 0]));`
			`delta[index + 1] = scale * (ty - logistic_activate(x[index + 1])) * logistic_gradient(logistic_activate(x[index + 1]));`
good chance I didn't break anything 2016-09-12 23:55:20 +03:00			`delta[index + 2] = scale * (tw - x[index + 2]);`
			`delta[index + 3] = scale * (th - x[index + 3]);`
some more stuff 2016-08-06 01:27:07 +03:00			`return iou;`
			`}`

stuff and things 2016-11-08 10:42:19 +03:00			`void delta_region_class(float *output, float *delta, int index, int class, int classes, tree *hier, float scale, float *avg_cat)`
			`{`
			`int i, n;`
			`if(hier){`
			`float pred = 1;`
			`while(class >= 0){`
			`pred *= output[index + class];`
			`int g = hier->group[class];`
			`int offset = hier->group_offset[g];`
			`for(i = 0; i < hier->group_size[g]; ++i){`
			`delta[index + offset + i] = scale * (0 - output[index + offset + i]);`
			`}`
			`delta[index + class] = scale * (1 - output[index + class]);`

			`class = hier->parent[class];`
			`}`
			`*avg_cat += pred;`
			`} else {`
			`for(n = 0; n < classes; ++n){`
			`delta[index + n] = scale * (((n == class)?1 : 0) - output[index + n]);`
			`if(n == class) *avg_cat += output[index + n];`
			`}`
			`}`
			`}`

some more stuff 2016-08-06 01:27:07 +03:00			`float logit(float x)`
			`{`
			`return log(x/(1.-x));`
			`}`

			`float tisnan(float x)`
			`{`
			`return (x != x);`
			`}`

new font strategy 2016-11-06 00:09:21 +03:00			`void softmax_tree(float *input, int batch, int inputs, float temp, tree *hierarchy, float *output);`
some more stuff 2016-08-06 01:27:07 +03:00			`void forward_region_layer(const region_layer l, network_state state)`
			`{`
			`int i,j,b,t,n;`
			`int size = l.coords + l.classes + 1;`
			`memcpy(l.output, state.input, l.outputs*l.batch*sizeof(float));`
			`reorg(l.output, l.w*l.h, size*l.n, l.batch, 1);`
			`for (b = 0; b < l.batch; ++b){`
			`for(i = 0; i < l.h*l.w*l.n; ++i){`
			`int index = size*i + b*l.outputs;`
			`l.output[index + 4] = logistic_activate(l.output[index + 4]);`
:fire: crush. crush. admit. :fire: 2016-11-11 19:48:40 +03:00			`}`
			`}`


			`if (l.softmax_tree){`
			`#ifdef GPU`
			`cuda_push_array(l.output_gpu, l.output, l.batch*l.outputs);`
			`int i;`
			`int count = 5;`
			`for (i = 0; i < l.softmax_tree->groups; ++i) {`
			`int group_size = l.softmax_tree->group_size[i];`
			`softmax_gpu(l.output_gpu+count, group_size, l.classes + 5, l.w*l.h*l.n*l.batch, 1, l.output_gpu + count);`
			`count += group_size;`
			`}`
			`cuda_pull_array(l.output_gpu, l.output, l.batch*l.outputs);`
			`#else`
			`for (b = 0; b < l.batch; ++b){`
			`for(i = 0; i < l.h*l.w*l.n; ++i){`
			`int index = size*i + b*l.outputs;`
new font strategy 2016-11-06 00:09:21 +03:00			`softmax_tree(l.output + index + 5, 1, 0, 1, l.softmax_tree, l.output + index + 5);`
:fire: crush. crush. admit. :fire: 2016-11-11 19:48:40 +03:00			`}`
			`}`
			`#endif`
			`} else if (l.softmax){`
			`for (b = 0; b < l.batch; ++b){`
			`for(i = 0; i < l.h*l.w*l.n; ++i){`
			`int index = size*i + b*l.outputs;`
tree stuff 2016-10-21 23:16:43 +03:00			`softmax(l.output + index + 5, l.classes, 1, l.output + index + 5);`
some more stuff 2016-08-06 01:27:07 +03:00			`}`
			`}`
			`}`
			`if(!state.train) return;`
			`memset(l.delta, 0, l.outputs * l.batch * sizeof(float));`
			`float avg_iou = 0;`
good chance I didn't break anything 2016-09-12 23:55:20 +03:00			`float recall = 0;`
some more stuff 2016-08-06 01:27:07 +03:00			`float avg_cat = 0;`
			`float avg_obj = 0;`
			`float avg_anyobj = 0;`
			`int count = 0;`
stuff and things 2016-11-08 10:42:19 +03:00			`int class_count = 0;`
some more stuff 2016-08-06 01:27:07 +03:00			`*(l.cost) = 0;`
			`for (b = 0; b < l.batch; ++b) {`
			`for (j = 0; j < l.h; ++j) {`
			`for (i = 0; i < l.w; ++i) {`
			`for (n = 0; n < l.n; ++n) {`
			`int index = size*(j*l.w*l.n + i*l.n + n) + b*l.outputs;`
good chance I didn't break anything 2016-09-12 23:55:20 +03:00			`box pred = get_region_box(l.output, l.biases, n, index, i, j, l.w, l.h);`
some more stuff 2016-08-06 01:27:07 +03:00			`float best_iou = 0;`
stuff and things 2016-11-08 10:42:19 +03:00			`int best_class = -1;`
some more stuff 2016-08-06 01:27:07 +03:00			`for(t = 0; t < 30; ++t){`
			`box truth = float_to_box(state.truth + t*5 + b*l.truths);`
			`if(!truth.x) break;`
			`float iou = box_iou(pred, truth);`
stuff and things 2016-11-08 10:42:19 +03:00			`if (iou > best_iou) {`
			`best_class = state.truth[t*5 + b*l.truths + 4];`
			`best_iou = iou;`
			`}`
some more stuff 2016-08-06 01:27:07 +03:00			`}`
			`avg_anyobj += l.output[index + 4];`
			`l.delta[index + 4] = l.noobject_scale * ((0 - l.output[index + 4]) * logistic_gradient(l.output[index + 4]));`
stuff and things 2016-11-08 10:42:19 +03:00			`if(l.classfix == -1) l.delta[index + 4] = l.noobject_scale * ((best_iou - l.output[index + 4]) * logistic_gradient(l.output[index + 4]));`
			`else{`
			`if (best_iou > l.thresh) {`
			`l.delta[index + 4] = 0;`
			`if(l.classfix > 0){`
			`delta_region_class(l.output, l.delta, index + 5, best_class, l.classes, l.softmax_tree, l.class_scale*(l.classfix == 2 ? l.output[index + 4] : 1), &avg_cat);`
			`++class_count;`
			`}`
			`}`
			`}`
some more stuff 2016-08-06 01:27:07 +03:00
new font strategy 2016-11-06 00:09:21 +03:00			`if(*(state.net.seen) < 12800){`
some more stuff 2016-08-06 01:27:07 +03:00			`box truth = {0};`
			`truth.x = (i + .5)/l.w;`
			`truth.y = (j + .5)/l.h;`
new font strategy 2016-11-06 00:09:21 +03:00			`truth.w = l.biases[2*n];`
			`truth.h = l.biases[2*n+1];`
:fire: crush. crush. admit. :fire: 2016-11-11 19:48:40 +03:00			`if(DOABS){`
			`truth.w = l.biases[2*n]/l.w;`
			`truth.h = l.biases[2*n+1]/l.h;`
			`}`
good chance I didn't break anything 2016-09-12 23:55:20 +03:00			`delta_region_box(truth, l.output, l.biases, n, index, i, j, l.w, l.h, l.delta, .01);`
some more stuff 2016-08-06 01:27:07 +03:00			`}`
			`}`
			`}`
			`}`
			`for(t = 0; t < 30; ++t){`
			`box truth = float_to_box(state.truth + t*5 + b*l.truths);`
new font strategy 2016-11-06 00:09:21 +03:00
some more stuff 2016-08-06 01:27:07 +03:00			`if(!truth.x) break;`
			`float best_iou = 0;`
			`int best_index = 0;`
			`int best_n = 0;`
			`i = (truth.x * l.w);`
			`j = (truth.y * l.h);`
			`//printf("%d %f %d %f\n", i, truth.x*l.w, j, truth.y*l.h);`
			`box truth_shift = truth;`
			`truth_shift.x = 0;`
			`truth_shift.y = 0;`
:charizard: :charizard: :charizard: 2016-11-06 03:27:31 +03:00			`//printf("index %d %d\n",i, j);`
some more stuff 2016-08-06 01:27:07 +03:00			`for(n = 0; n < l.n; ++n){`
			`int index = size*(j*l.w*l.n + i*l.n + n) + b*l.outputs;`
good chance I didn't break anything 2016-09-12 23:55:20 +03:00			`box pred = get_region_box(l.output, l.biases, n, index, i, j, l.w, l.h);`
new font strategy 2016-11-06 00:09:21 +03:00			`if(l.bias_match){`
			`pred.w = l.biases[2*n];`
			`pred.h = l.biases[2*n+1];`
:fire: crush. crush. admit. :fire: 2016-11-11 19:48:40 +03:00			`if(DOABS){`
			`pred.w = l.biases[2*n]/l.w;`
			`pred.h = l.biases[2*n+1]/l.h;`
			`}`
new font strategy 2016-11-06 00:09:21 +03:00			`}`
:charizard: :charizard: :charizard: 2016-11-06 03:27:31 +03:00			`//printf("pred: (%f, %f) %f x %f\n", pred.x, pred.y, pred.w, pred.h);`
some more stuff 2016-08-06 01:27:07 +03:00			`pred.x = 0;`
			`pred.y = 0;`
			`float iou = box_iou(pred, truth_shift);`
			`if (iou > best_iou){`
			`best_index = index;`
			`best_iou = iou;`
			`best_n = n;`
			`}`
			`}`
:charizard: :charizard: :charizard: 2016-11-06 03:27:31 +03:00			`//printf("%d %f (%f, %f) %f x %f\n", best_n, best_iou, truth.x, truth.y, truth.w, truth.h);`
some more stuff 2016-08-06 01:27:07 +03:00
good chance I didn't break anything 2016-09-12 23:55:20 +03:00			`float iou = delta_region_box(truth, l.output, l.biases, best_n, best_index, i, j, l.w, l.h, l.delta, l.coord_scale);`
			`if(iou > .5) recall += 1;`
some more stuff 2016-08-06 01:27:07 +03:00			`avg_iou += iou;`

			`//l.delta[best_index + 4] = iou - l.output[best_index + 4];`
			`avg_obj += l.output[best_index + 4];`
			`l.delta[best_index + 4] = l.object_scale * (1 - l.output[best_index + 4]) * logistic_gradient(l.output[best_index + 4]);`
			`if (l.rescore) {`
			`l.delta[best_index + 4] = l.object_scale * (iou - l.output[best_index + 4]) * logistic_gradient(l.output[best_index + 4]);`
			`}`

new font strategy 2016-11-06 00:09:21 +03:00
			`int class = state.truth[t*5 + b*l.truths + 4];`
			`if (l.map) class = l.map[class];`
stuff and things 2016-11-08 10:42:19 +03:00			`delta_region_class(l.output, l.delta, best_index + 5, class, l.classes, l.softmax_tree, l.class_scale, &avg_cat);`
some more stuff 2016-08-06 01:27:07 +03:00			`++count;`
stuff and things 2016-11-08 10:42:19 +03:00			`++class_count;`
some more stuff 2016-08-06 01:27:07 +03:00			`}`
			`}`
:charizard: :charizard: :charizard: 2016-11-06 03:27:31 +03:00			`//printf("\n");`
some more stuff 2016-08-06 01:27:07 +03:00			`reorg(l.delta, l.w*l.h, size*l.n, l.batch, 0);`
			`*(l.cost) = pow(mag_array(l.delta, l.outputs * l.batch), 2);`
stuff and things 2016-11-08 10:42:19 +03:00			`printf("Region Avg IOU: %f, Class: %f, Obj: %f, No Obj: %f, Avg Recall: %f,  count: %d\n", avg_iou/count, avg_cat/class_count, avg_obj/count, avg_anyobj/(l.w*l.h*l.n*l.batch), recall/count, count);`
some more stuff 2016-08-06 01:27:07 +03:00			`}`

			`void backward_region_layer(const region_layer l, network_state state)`
			`{`
			`axpy_cpu(l.batch*l.inputs, 1, l.delta, 1, state.delta, 1);`
			`}`

So I have this new programming paradigm....... 2016-09-25 09:12:54 +03:00			`void get_region_boxes(layer l, int w, int h, float thresh, float **probs, box *boxes, int only_objectness)`
			`{`
			`int i,j,n;`
			`float *predictions = l.output;`
			`for (i = 0; i < l.w*l.h; ++i){`
			`int row = i / l.w;`
			`int col = i % l.w;`
			`for(n = 0; n < l.n; ++n){`
			`int index = i*l.n + n;`
			`int p_index = index * (l.classes + 5) + 4;`
			`float scale = predictions[p_index];`
stuff and things 2016-11-08 10:42:19 +03:00			`if(l.classfix == -1 && scale < .5) scale = 0;`
So I have this new programming paradigm....... 2016-09-25 09:12:54 +03:00			`int box_index = index * (l.classes + 5);`
new font strategy 2016-11-06 00:09:21 +03:00			`boxes[index] = get_region_box(predictions, l.biases, n, box_index, col, row, l.w, l.h);`
			`boxes[index].x *= w;`
			`boxes[index].y *= h;`
			`boxes[index].w *= w;`
			`boxes[index].h *= h;`

			`int class_index = index * (l.classes + 5) + 5;`
			`if(l.softmax_tree){`
stuff and things 2016-11-08 10:42:19 +03:00
new font strategy 2016-11-06 00:09:21 +03:00			`hierarchy_predictions(predictions + class_index, l.classes, l.softmax_tree, 0);`
			`int found = 0;`
			`for(j = l.classes - 1; j >= 0; --j){`
			`if(!found && predictions[class_index + j] > .5){`
			`found = 1;`
			`} else {`
			`predictions[class_index + j] = 0;`
			`}`
			`float prob = predictions[class_index+j];`
			`probs[index][j] = (scale > thresh) ? prob : 0;`
			`}`
			`}else{`
			`for(j = 0; j < l.classes; ++j){`
			`float prob = scale*predictions[class_index+j];`
			`probs[index][j] = (prob > thresh) ? prob : 0;`
			`}`
So I have this new programming paradigm....... 2016-09-25 09:12:54 +03:00			`}`
			`if(only_objectness){`
			`probs[index][0] = scale;`
			`}`
			`}`
			`}`
			`}`

some more stuff 2016-08-06 01:27:07 +03:00			`#ifdef GPU`

			`void forward_region_layer_gpu(const region_layer l, network_state state)`
			`{`
			`/*`
			`if(!state.train){`
			`copy_ongpu(l.batch*l.inputs, state.input, 1, l.output_gpu, 1);`
			`return;`
			`}`
			`*/`

			`float *in_cpu = calloc(l.batch*l.inputs, sizeof(float));`
			`float *truth_cpu = 0;`
			`if(state.truth){`
			`int num_truth = l.batch*l.truths;`
			`truth_cpu = calloc(num_truth, sizeof(float));`
			`cuda_pull_array(state.truth, truth_cpu, num_truth);`
			`}`
			`cuda_pull_array(state.input, in_cpu, l.batch*l.inputs);`
			`network_state cpu_state = state;`
			`cpu_state.train = state.train;`
			`cpu_state.truth = truth_cpu;`
			`cpu_state.input = in_cpu;`
			`forward_region_layer(l, cpu_state);`
			`cuda_push_array(l.output_gpu, l.output, l.batch*l.outputs);`
			`cuda_push_array(l.delta_gpu, l.delta, l.batch*l.outputs);`
			`free(cpu_state.input);`
			`if(cpu_state.truth) free(cpu_state.truth);`
			`}`

			`void backward_region_layer_gpu(region_layer l, network_state state)`
			`{`
			`axpy_ongpu(l.batch*l.outputs, 1, l.delta_gpu, 1, state.delta, 1);`
			`//copy_ongpu(l.batch*l.inputs, l.delta_gpu, 1, state.delta, 1);`
			`}`
			`#endif`