// darknet/src/dropout_layer_kernels.cu (42 lines, 1.2 KiB)

2015-11-16 06:51:26 +03:00
#include "cuda_runtime.h"
#include "curand.h"
#include "cublas_v2.h"
2015-01-23 03:38:24 +03:00
extern "C" {
2017-06-02 06:31:13 +03:00
#include "dropout_layer.h"
#include "cuda.h"
#include "utils.h"
2015-01-23 03:38:24 +03:00
}
2015-03-12 08:20:15 +03:00
/*
 * In-place dropout mask kernel.
 *
 * Each thread handles at most one element. The flat element index is built
 * from a two-dimensional grid (blockIdx.x, blockIdx.y) of one-dimensional
 * blocks (threadIdx.x), so the launch must use a 1D block shape.
 *
 *   input : buffer modified in place, at least `size` floats
 *   size  : number of elements to process; threads past the end do nothing
 *   rand  : per-element values compared against `prob`, at least `size` floats
 *           (presumably uniform samples in [0,1) -- confirm against the
 *           generator that fills this buffer)
 *   prob  : threshold; an element is zeroed when rand[id] < prob
 *   scale : multiplier applied to every element that is kept
 */
__global__ void yoloswag420blazeit360noscope(float *input, int size, float *rand, float prob, float scale)
{
    /* Linearise the 2D grid first, then offset by the thread within its block. */
    const unsigned int block_linear = blockIdx.x + blockIdx.y*gridDim.x;
    const int id = block_linear * blockDim.x + threadIdx.x;

    /* The grid may be larger than the data; surplus threads exit here. */
    if(id >= size) return;

    if(rand[id] < prob){
        input[id] = 0.0f;
    } else {
        input[id] = input[id]*scale;
    }
}
/*
 * Forward pass of the dropout layer on the GPU.
 *
 * Does nothing unless net.train is set. Otherwise it calls cuda_random on
 * layer.rand_gpu for layer.inputs*layer.batch elements (presumably refilling
 * it with fresh random values -- confirm in cuda_random) and then launches the
 * dropout kernel over net.input_gpu, which is modified in place using
 * layer.probability as the threshold and layer.scale as the multiplier.
 *
 * A disabled alternative used to fill layer.rand on the host with
 * rand_uniform() per element and upload it with cuda_push_array; it is no
 * longer part of this function.
 *
 * Launch errors are reported through check_error(cudaPeekAtLastError()).
 */
void forward_dropout_layer_gpu(dropout_layer layer, network net)
{
    if(net.train){
        const int count = layer.inputs*layer.batch;

        /* Regenerate the per-element values the kernel compares to probability. */
        cuda_random(layer.rand_gpu, count);

        float *activations = net.input_gpu;
        yoloswag420blazeit360noscope<<<cuda_gridsize(count), BLOCK>>>(
                activations, count, layer.rand_gpu, layer.probability, layer.scale);
        check_error(cudaPeekAtLastError());
    }
}
/*
 * Backward pass of the dropout layer on the GPU.
 *
 * Returns immediately when net.delta_gpu is null. Otherwise it launches the
 * same dropout kernel over net.delta_gpu (in place) for
 * layer.inputs*layer.batch elements. layer.rand_gpu is NOT regenerated here,
 * so the elements zeroed are those selected by whatever values the buffer
 * currently holds -- the ones written by the last forward call, provided
 * nothing else has touched it since.
 *
 * Launch errors are reported through check_error(cudaPeekAtLastError()).
 */
void backward_dropout_layer_gpu(dropout_layer layer, network net)
{
    float *gradients = net.delta_gpu;
    if(gradients){
        const int count = layer.inputs*layer.batch;
        yoloswag420blazeit360noscope<<<cuda_gridsize(count), BLOCK>>>(
                gradients, count, layer.rand_gpu, layer.probability, layer.scale);
        check_error(cudaPeekAtLastError());
    }
}