#include "commonmodel.h" #include #include "cereal/gen/c/log.capnp.h" #include "common/mat.h" #include "common/timing.h" void model_input_init(ModelInput* s, int width, int height, cl_device_id device_id, cl_context context) { int err; s->device_id = device_id; s->context = context; transform_init(&s->transform, context, device_id); s->transformed_width = width; s->transformed_height = height; s->transformed_y_cl = clCreateBuffer(s->context, CL_MEM_READ_WRITE, s->transformed_width*s->transformed_height, NULL, &err); assert(err == 0); s->transformed_u_cl = clCreateBuffer(s->context, CL_MEM_READ_WRITE, (s->transformed_width/2)*(s->transformed_height/2), NULL, &err); assert(err == 0); s->transformed_v_cl = clCreateBuffer(s->context, CL_MEM_READ_WRITE, (s->transformed_width/2)*(s->transformed_height/2), NULL, &err); assert(err == 0); s->net_input_size = ((width*height*3)/2)*sizeof(float); s->net_input = clCreateBuffer(s->context, CL_MEM_READ_WRITE, s->net_input_size, (void*)NULL, &err); assert(err == 0); loadyuv_init(&s->loadyuv, context, device_id, s->transformed_width, s->transformed_height); } float *model_input_prepare(ModelInput* s, cl_command_queue q, cl_mem yuv_cl, int width, int height, mat3 transform) { int err; int i = 0; transform_queue(&s->transform, q, yuv_cl, width, height, s->transformed_y_cl, s->transformed_u_cl, s->transformed_v_cl, s->transformed_width, s->transformed_height, transform); loadyuv_queue(&s->loadyuv, q, s->transformed_y_cl, s->transformed_u_cl, s->transformed_v_cl, s->net_input); float *net_input_buf = (float *)clEnqueueMapBuffer(q, s->net_input, CL_TRUE, CL_MAP_READ, 0, s->net_input_size, 0, NULL, NULL, &err); clFinish(q); return net_input_buf; } void model_input_free(ModelInput* s) { transform_destroy(&s->transform); loadyuv_destroy(&s->loadyuv); } void softmax(const float* input, float* output, size_t len) { float max_val = -FLT_MAX; for(int i = 0; i < len; i++) { const float v = input[i]; if( v > max_val ) { max_val = v; } } float denominator = 0; for(int i = 0; i < len; i++) { float const v = input[i]; float const v_exp = expf(v - max_val); denominator += v_exp; output[i] = v_exp; } const float inv_denominator = 1. / denominator; for(int i = 0; i < len; i++) { output[i] *= inv_denominator; } } static cereal_ModelData_PathData_ptr path_to_cereal(struct capn_segment *cs, const PathData data) { capn_list32 points_ptr = capn_new_list32(cs, MODEL_PATH_DISTANCE); for (int i=0; i