mirror of https://github.com/AlexeyAB/darknet.git
parent
176d65b765
commit
76ee68f96d
18 changed files with 550 additions and 200 deletions
@ -0,0 +1,41 @@ |
||||
/*
 * index - placeholder helper taking a (row, col) pair.
 *
 * No index computation has been implemented here yet. The function is
 * declared to return int, so it must return a defined value on every path;
 * falling off the end of a non-void function leaves the result
 * indeterminate for any caller that reads it.
 *
 * NOTE(review): the intended mapping from (row, col) to a flat index cannot
 * be determined from this file (no width/stride is passed in). Returning 0
 * is a stand-in only. TODO: implement the real computation or remove the
 * function.
 *
 * Returns: always 0.
 */
int index(int row, int col)
{
    (void)row;
    (void)col;
    return 0;
}
||||
|
||||
/*
 * col2im - gather column-matrix values back into one image element.
 *
 * Each work-item handles one element of data_im. The flat id from
 * get_global_id(0) is decomposed into (b, c, h, w) with w varying fastest,
 * then h, then c, then b.
 *
 * The column buffer is addressed as
 *     b*cols*rows + ((c*ksize + i)*ksize + j)*cols + h_col*width_col + w_col
 * where (i, j) is the position inside the ksize x ksize window and
 * (h_col, w_col) is the window position. This is the same layout the
 * im2col kernel uses for its col_index.
 *
 * Parameters:
 *   data_col  column buffer that is read.
 *   batch, channels, height, width  image dimensions used to decode the id.
 *   ksize     window side length.
 *   stride    step between window positions (must be non-zero).
 *   pad       if non-zero, output size becomes 1 + (dim-1)/stride and the
 *             effective padding is ksize/2.
 *   data_im   image buffer that is written.
 *
 * NOTE(review): the result is stored with '=' (overwrite). If the caller
 * expects accumulation into an existing data_im, this should be '+='.
 * Confirm against the host code.
 *
 * NOTE(review): there is no guard for work-items beyond
 * batch*channels*height*width; the launch is assumed to use exactly that
 * many work-items. Confirm against the host code.
 */
__kernel void col2im(__global float *data_col, int batch,
        int channels, int height, int width,
        int ksize, int stride, int pad, __global float *data_im)
{
    int id = get_global_id(0);
    int index = id;

    /* Peel the coordinates off the flat id, innermost dimension first. */
    int w = id % width;
    id /= width;
    int h = id % height;
    id /= height;
    int c = id % channels;
    id /= channels;
    int b = id % batch;

    int height_col = (height - ksize) / stride + 1;
    int width_col = (width - ksize) / stride + 1;
    int rows = channels * ksize * ksize;
    if (pad) {
        height_col = 1 + (height - 1) / stride;
        width_col = 1 + (width - 1) / stride;
        pad = ksize / 2;
    }
    int cols = height_col * width_col;
    int batch_offset = b * cols * rows;
    int channel_offset = c * cols * ksize * ksize;

    float sum = 0;
    int i, j;
    for (i = 0; i < ksize; ++i) {
        /*
         * A window at row h_col covers image row h through its i-th row
         * only when h + pad - i == h_col * stride.
         */
        int h_shift = h + pad - i;
        if (h_shift < 0 || h_shift % stride != 0) {
            continue;
        }
        int h_col = h_shift / stride;
        if (h_col >= height_col) {
            continue;
        }

        for (j = 0; j < ksize; ++j) {
            int w_shift = w + pad - j;
            if (w_shift < 0 || w_shift % stride != 0) {
                continue;
            }
            int w_col = w_shift / stride;
            if (w_col >= width_col) {
                continue;
            }

            int row_offset = (i * ksize + j) * cols;
            int col_offset = h_col * width_col + w_col;
            sum += data_col[batch_offset + channel_offset + row_offset + col_offset];
        }
    }

    data_im[index] = sum;
}
@ -0,0 +1,25 @@ |
||||
|
||||
/*
 * bias - initialise the output buffer with per-filter bias values.
 *
 * Work-item dimension 0 selects the batch item and dimension 1 is a flat
 * index `id` within that item. The filter is id / size, and the element
 * written is output[batch*n*size + id]. The value is assigned, not added,
 * so previous contents of output are overwritten.
 *
 * Parameters:
 *   n       number of entries per batch item along the filter axis
 *           (presumably the filter count; confirm against the host code).
 *   size    number of output elements per filter.
 *   biases  one value per filter; read at biases[id / size].
 *   output  destination buffer.
 */
__kernel void bias(int n, int size, __global float *biases, __global float *output)
{
    int batch = get_global_id(0);
    int id = get_global_id(1);
    int filter = id/size;

    output[batch*n*size + id] = biases[filter];
}
||||
|
||||
/*
 * learn_bias - accumulate the bias gradient for one filter.
 *
 * The work-item's filter is get_global_id(0). For every batch item it adds
 * the `size` consecutive delta values starting at
 * size*(filter + n*batch_item), then adds the total to
 * bias_updates[filter].
 *
 * Parameters:
 *   batch         number of batch items to sum over.
 *   n             per-item stride in units of `size` (used as filter + n*b).
 *   size          number of delta elements per filter.
 *   delta         source values.
 *   bias_updates  accumulator; incremented, not overwritten.
 */
__kernel void learn_bias(int batch, int n, int size, __global float *delta, __global float *bias_updates)
{
    int filter = get_global_id(0);
    float total = 0;
    int item = 0;

    while (item < batch) {
        /* Start of this filter's slice inside the current batch item. */
        int base = size*(filter + n*item);
        int k;
        for (k = 0; k < size; ++k) {
            total += delta[base + k];
        }
        ++item;
    }

    bias_updates[filter] += total;
}
||||
|
@ -1,26 +1,43 @@ |
||||
|
||||
/*
 * im2col_get_pixel - bounds-checked read of one image element.
 *
 * The requested (row, col) is given in padded coordinates; `pad` is
 * subtracted from both before the lookup. Positions that fall outside
 * [0, height) x [0, width) after the shift yield 0 instead of touching
 * memory.
 *
 * Parameters:
 *   im        image buffer, indexed as
 *             col + width*(row + height*(channel + batch*channels)).
 *   height, width, channels  image dimensions used in that index.
 *   batch     batch item to read from.
 *   row, col  position in padded coordinates.
 *   channel   channel to read from.
 *   pad       offset removed from row and col.
 *
 * Returns: the image value, or 0 when the shifted position is out of range.
 */
float im2col_get_pixel(__global float *im, int height, int width, int channels,
        int batch, int row, int col, int channel, int pad)
{
    row -= pad;
    col -= pad;

    if (row < 0 || col < 0 || row >= height || col >= width) {
        return 0;
    }

    int index = col + width*(row + height*(channel + batch*channels));
    return im[index];
}
||||
|
||||
/*
 * im2col - copy one image element into its slot in the column buffer.
 *
 * Work-item dimension 0 encodes (b, c): b = gid % batch is the batch item
 * and c = gid / batch is the column-matrix channel, which in turn encodes
 * the window offsets (w_offset, h_offset) and the image channel c_im.
 * Work-item dimension 1 encodes the window position:
 * h = gid % height_col, w = gid / height_col.
 *
 * The value is fetched through im2col_get_pixel, so reads that land in the
 * padding region produce 0 rather than accessing data_im out of range.
 *
 * Parameters:
 *   data_im   source image buffer.
 *   batch, channels, height, width  image dimensions.
 *   ksize     window side length.
 *   stride    step between window positions (must be non-zero).
 *   pad       if non-zero, output size becomes 1 + (dim-1)/stride and the
 *             effective padding is ksize/2.
 *   data_col  destination, written at
 *             (c*height_col + h)*width_col + w + b*col_size.
 */
__kernel void im2col(__global float *data_im, int batch,
        int channels, int height, int width,
        int ksize, int stride, int pad, __global float *data_col)
{
    int height_col = (height - ksize) / stride + 1;
    int width_col = (width - ksize) / stride + 1;
    int channels_col = channels * ksize * ksize;
    if (pad) {
        height_col = 1 + (height - 1) / stride;
        width_col = 1 + (width - 1) / stride;
        pad = ksize / 2;
    }

    int gid1 = get_global_id(0);
    int b = gid1 % batch;
    int c = gid1 / batch;

    int gid2 = get_global_id(1);
    int h = gid2 % height_col;
    int w = gid2 / height_col;

    /* Number of column-buffer elements belonging to one batch item. */
    int col_size = height_col * width_col * channels_col;

    /* Unpack the column channel into window offsets and image channel. */
    int w_offset = c % ksize;
    int h_offset = (c / ksize) % ksize;
    int c_im = c / ksize / ksize;

    int im_row = h_offset + h * stride;
    int im_col = w_offset + w * stride;
    int col_index = (c * height_col + h) * width_col + w + b * col_size;

    data_col[col_index] = im2col_get_pixel(data_im, height, width, channels,
                                           b, im_row, im_col, c_im, pad);
}
||||
|
Loading…
Reference in new issue