|
|
@ -8,19 +8,16 @@ |
|
|
|
void frame_init(ModelFrame* frame, int width, int height, |
|
|
|
void frame_init(ModelFrame* frame, int width, int height, |
|
|
|
cl_device_id device_id, cl_context context) { |
|
|
|
cl_device_id device_id, cl_context context) { |
|
|
|
transform_init(&frame->transform, context, device_id); |
|
|
|
transform_init(&frame->transform, context, device_id); |
|
|
|
frame->transformed_width = width; |
|
|
|
frame->width = width; |
|
|
|
frame->transformed_height = height; |
|
|
|
frame->height = height; |
|
|
|
|
|
|
|
|
|
|
|
frame->transformed_y_cl = CL_CHECK_ERR(clCreateBuffer(context, CL_MEM_READ_WRITE, |
|
|
|
frame->y_cl = CL_CHECK_ERR(clCreateBuffer(context, CL_MEM_READ_WRITE, (size_t)width*height, NULL, &err)); |
|
|
|
(size_t)frame->transformed_width*frame->transformed_height, NULL, &err)); |
|
|
|
frame->u_cl = CL_CHECK_ERR(clCreateBuffer(context, CL_MEM_READ_WRITE, (size_t)(width/2)*(height/2), NULL, &err)); |
|
|
|
frame->transformed_u_cl = CL_CHECK_ERR(clCreateBuffer(context, CL_MEM_READ_WRITE, |
|
|
|
frame->v_cl = CL_CHECK_ERR(clCreateBuffer(context, CL_MEM_READ_WRITE, (size_t)(width/2)*(height/2), NULL, &err)); |
|
|
|
(size_t)(frame->transformed_width/2)*(frame->transformed_height/2), NULL, &err)); |
|
|
|
|
|
|
|
frame->transformed_v_cl = CL_CHECK_ERR(clCreateBuffer(context, CL_MEM_READ_WRITE, |
|
|
|
|
|
|
|
(size_t)(frame->transformed_width/2)*(frame->transformed_height/2), NULL, &err)); |
|
|
|
|
|
|
|
frame->net_input_size = ((width*height*3)/2)*sizeof(float); |
|
|
|
frame->net_input_size = ((width*height*3)/2)*sizeof(float); |
|
|
|
frame->net_input = CL_CHECK_ERR(clCreateBuffer(context, CL_MEM_READ_WRITE, |
|
|
|
frame->net_input = CL_CHECK_ERR(clCreateBuffer(context, CL_MEM_READ_WRITE, |
|
|
|
frame->net_input_size, (void*)NULL, &err)); |
|
|
|
frame->net_input_size, (void*)NULL, &err)); |
|
|
|
loadyuv_init(&frame->loadyuv, context, device_id, frame->transformed_width, frame->transformed_height); |
|
|
|
loadyuv_init(&frame->loadyuv, context, device_id, width, height); |
|
|
|
} |
|
|
|
} |
|
|
|
|
|
|
|
|
|
|
|
float *frame_prepare(ModelFrame* frame, cl_command_queue q, |
|
|
|
float *frame_prepare(ModelFrame* frame, cl_command_queue q, |
|
|
@ -28,11 +25,11 @@ float *frame_prepare(ModelFrame* frame, cl_command_queue q, |
|
|
|
const mat3 &transform) { |
|
|
|
const mat3 &transform) { |
|
|
|
transform_queue(&frame->transform, q, |
|
|
|
transform_queue(&frame->transform, q, |
|
|
|
yuv_cl, width, height, |
|
|
|
yuv_cl, width, height, |
|
|
|
frame->transformed_y_cl, frame->transformed_u_cl, frame->transformed_v_cl, |
|
|
|
frame->y_cl, frame->u_cl, frame->v_cl, |
|
|
|
frame->transformed_width, frame->transformed_height, |
|
|
|
frame->width, frame->height, |
|
|
|
transform); |
|
|
|
transform); |
|
|
|
loadyuv_queue(&frame->loadyuv, q, |
|
|
|
loadyuv_queue(&frame->loadyuv, q, |
|
|
|
frame->transformed_y_cl, frame->transformed_u_cl, frame->transformed_v_cl, |
|
|
|
frame->y_cl, frame->u_cl, frame->v_cl, |
|
|
|
frame->net_input); |
|
|
|
frame->net_input); |
|
|
|
float *net_input_buf = (float *)CL_CHECK_ERR(clEnqueueMapBuffer(q, frame->net_input, CL_TRUE, |
|
|
|
float *net_input_buf = (float *)CL_CHECK_ERR(clEnqueueMapBuffer(q, frame->net_input, CL_TRUE, |
|
|
|
CL_MAP_READ, 0, frame->net_input_size, |
|
|
|
CL_MAP_READ, 0, frame->net_input_size, |
|
|
@ -45,9 +42,9 @@ void frame_free(ModelFrame* frame) { |
|
|
|
transform_destroy(&frame->transform); |
|
|
|
transform_destroy(&frame->transform); |
|
|
|
loadyuv_destroy(&frame->loadyuv); |
|
|
|
loadyuv_destroy(&frame->loadyuv); |
|
|
|
CL_CHECK(clReleaseMemObject(frame->net_input)); |
|
|
|
CL_CHECK(clReleaseMemObject(frame->net_input)); |
|
|
|
CL_CHECK(clReleaseMemObject(frame->transformed_v_cl)); |
|
|
|
CL_CHECK(clReleaseMemObject(frame->v_cl)); |
|
|
|
CL_CHECK(clReleaseMemObject(frame->transformed_u_cl)); |
|
|
|
CL_CHECK(clReleaseMemObject(frame->u_cl)); |
|
|
|
CL_CHECK(clReleaseMemObject(frame->transformed_y_cl)); |
|
|
|
CL_CHECK(clReleaseMemObject(frame->y_cl)); |
|
|
|
} |
|
|
|
} |
|
|
|
|
|
|
|
|
|
|
|
void softmax(const float* input, float* output, size_t len) { |
|
|
|
void softmax(const float* input, float* output, size_t len) { |
|
|
|