darknet/src/activations.c

132 lines
3.1 KiB
C
Raw Normal View History

#include "activations.h"
#include <math.h>
#include <stdio.h>
2014-05-10 02:14:52 +04:00
#include <stdlib.h>
#include <string.h>
2014-02-14 22:26:31 +04:00
/*
 * Map an ACTIVATION value to its textual name.
 *
 * Returns a pointer to a string literal, so the caller must neither
 * modify nor free the result.  RELU and any value not listed below
 * both yield "relu".
 */
char *get_activation_string(ACTIVATION a)
{
    if (a == SIGMOID) return "sigmoid";
    if (a == RAMP)    return "ramp";
    if (a == LINEAR)  return "linear";
    if (a == TANH)    return "tanh";

    /* RELU, and the fallback for anything unrecognised. */
    return "relu";
}
ACTIVATION get_activation(char *s)
{
if (strcmp(s, "sigmoid")==0) return SIGMOID;
if (strcmp(s, "relu")==0) return RELU;
2013-12-06 01:17:16 +04:00
if (strcmp(s, "linear")==0) return LINEAR;
2013-12-03 04:41:40 +04:00
if (strcmp(s, "ramp")==0) return RAMP;
2013-12-06 01:17:16 +04:00
if (strcmp(s, "tanh")==0) return TANH;
fprintf(stderr, "Couldn't find activation function %s, going with ReLU\n", s);
return RELU;
}
2014-05-01 03:17:40 +04:00
/* Identity activation: hands the input back unchanged. */
float linear_activate(float x)
{
    return x;
}
float sigmoid_activate(float x){return 1./(1. + exp(-x));}
/*
 * Rectified linear unit: x for x >= 0, otherwise 0.
 *
 * Written as a comparison rather than x*(x>0) so that negative
 * infinity maps to 0 (the product form yields -inf*0 = NaN) and
 * negative inputs give +0 instead of -0.  NaN inputs still propagate
 * because the comparison is false for NaN.
 */
float relu_activate(float x)
{
    return (x < 0) ? 0.0f : x;
}
/*
 * Ramp activation: x + 0.1*x for x > 0, and 0.1*x otherwise.
 *
 * The branch replaces the x*(x>0) product, which turned negative
 * infinity into NaN (-inf*0) instead of -inf.  For every finite input
 * the result is the same as the product form; the sum is evaluated in
 * double precision and narrowed to float on return.
 */
float ramp_activate(float x)
{
    const double leak = .1*x;

    if (x > 0) {
        return x + leak;
    }
    return leak;
}
float tanh_activate(float x){return (exp(2*x)-1)/(exp(2*x)+1);}
2014-05-10 02:14:52 +04:00
/*
 * Apply activation `a` to a single value, with random dropout.
 *
 * One rand() draw is made on every call.  When the draw, scaled by
 * RAND_MAX, is below `dropout` the result is 0.  Otherwise the
 * activation value is divided by (1 - dropout) before being returned.
 * An activation kind not handled here yields 0.
 */
float activate(float x, ACTIVATION a, float dropout)
{
    float y;

    if ((float)rand()/RAND_MAX < dropout) {
        return 0;
    }

    switch (a) {
        case LINEAR:
            y = linear_activate(x);
            break;
        case SIGMOID:
            y = sigmoid_activate(x);
            break;
        case RELU:
            y = relu_activate(x);
            break;
        case RAMP:
            y = ramp_activate(x);
            break;
        case TANH:
            y = tanh_activate(x);
            break;
        default:
            /* Unknown kind: plain zero, no rescaling. */
            return 0;
    }

    return y/(1-dropout);
}
2014-05-01 03:17:40 +04:00
2014-05-10 02:14:52 +04:00
/*
 * Apply activate() in place to the first n elements of x, in index
 * order, passing the same activation kind and dropout value for each.
 * Nothing happens when n <= 0.
 */
void activate_array(float *x, const int n, const ACTIVATION a, float dropout)
{
    int idx = 0;

    while (idx < n) {
        x[idx] = activate(x[idx], a, dropout);
        ++idx;
    }
}
/*
 * Per-element gradient factor for activation kind `a`.
 *
 * NOTE(review): x is presumably the activation's output rather than
 * its input; the sigmoid and tanh formulas below only match their
 * derivatives under that reading.  Confirm against callers.
 *
 * Returns 0 for an activation kind that is not handled here.
 */
float gradient(float x, ACTIVATION a)
{
    if (a == LINEAR) {
        return 1;
    }
    if (a == SIGMOID) {
        return x*(1.-x);
    }
    if (a == RELU) {
        return (x > 0) ? 1.0f : 0.0f;
    }
    if (a == RAMP) {
        /* Step at zero plus a constant .1 slope. */
        return .1 + (x > 0);
    }
    if (a == TANH) {
        return 1 - x*x;
    }
    return 0;
}
2014-05-01 03:17:40 +04:00
/*
 * Scale each of the first n entries of delta by gradient(x[i], a).
 * x is only read; delta is updated in place.  Nothing happens when
 * n <= 0.
 */
void gradient_array(const float *x, const int n, const ACTIVATION a, float *delta)
{
    const float *in = x;
    float *out = delta;
    int remaining;

    for (remaining = n; remaining > 0; --remaining) {
        *out = *out * gradient(*in, a);
        ++in;
        ++out;
    }
}
2014-05-10 02:14:52 +04:00
#ifdef GPU
#include "opencl.h"
#include <math.h>
/*
 * Return the "activate_array" kernel from src/activations.cl.
 *
 * get_kernel() is called on the first invocation only; the handle is
 * kept in a function-local static and handed back on later calls.
 */
cl_kernel get_activation_kernel()
{
    static cl_kernel cached;
    static int ready = 0;

    if (ready) {
        return cached;
    }
    cached = get_kernel("src/activations.cl", "activate_array", 0);
    ready = 1;
    return cached;
}
/*
 * Enqueue the activation kernel over n elements of the device buffer x.
 *
 * Kernel arguments are bound in the order (x, n, a, dropout), then a
 * one-dimensional range of n work-items is enqueued on cl.queue.
 *
 * Every OpenCL status is stored in cl.error and passed to check_error()
 * straight away.  Previously each clSetKernelArg result was overwritten
 * by the next one before being checked, and the enqueue status was
 * never stored, so the final check looked at a stale value.
 * NOTE(review): check_error() is defined elsewhere; it is assumed to
 * report or abort on a non-success cl.error.  Confirm.
 */
void activate_array_ongpu(cl_mem x, int n, ACTIVATION a, float dropout)
{
    cl_setup();
    cl_kernel kernel = get_activation_kernel();
    cl_command_queue queue = cl.queue;

    cl_uint i = 0;
    cl.error = clSetKernelArg(kernel, i++, sizeof(x), (void*) &x);
    check_error(cl);
    cl.error = clSetKernelArg(kernel, i++, sizeof(n), (void*) &n);
    check_error(cl);
    cl.error = clSetKernelArg(kernel, i++, sizeof(a), (void*) &a);
    check_error(cl);
    cl.error = clSetKernelArg(kernel, i++, sizeof(dropout),
            (void*) &dropout);
    check_error(cl);

    /*
     * A non-positive n has nothing to process.  A zero global size can
     * be rejected by clEnqueueNDRangeKernel, and a negative n would
     * wrap to a huge size_t, so skip the launch to keep this a no-op
     * now that the launch status is checked.
     */
    if (n <= 0) {
        return;
    }

    size_t gsize = n;
    cl.error = clEnqueueNDRangeKernel(queue, kernel, 1, 0, &gsize, 0, 0, 0, 0);
    check_error(cl);
}
#endif