You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
117 lines
2.9 KiB
117 lines
2.9 KiB
#include "visionbuf.h"
|
|
|
|
#include <stdio.h>
|
|
#include <fcntl.h>
|
|
#include <assert.h>
|
|
#include <stdlib.h>
|
|
#include <unistd.h>
|
|
#include <sys/mman.h>
|
|
#include <sys/types.h>
|
|
|
|
#define CL_USE_DEPRECATED_OPENCL_1_2_APIS
|
|
#ifdef __APPLE__
|
|
#include <OpenCL/cl.h>
|
|
#else
|
|
#include <CL/cl.h>
|
|
#endif
|
|
|
|
int offset = 0;
|
|
void *malloc_with_fd(size_t len, int *fd) {
|
|
char full_path[0x100];
|
|
#ifdef __APPLE__
|
|
snprintf(full_path, sizeof(full_path)-1, "/tmp/visionbuf_%d_%d", getpid(), offset++);
|
|
#else
|
|
snprintf(full_path, sizeof(full_path)-1, "/dev/shm/visionbuf_%d_%d", getpid(), offset++);
|
|
#endif
|
|
*fd = open(full_path, O_RDWR | O_CREAT, 0777);
|
|
assert(*fd >= 0);
|
|
unlink(full_path);
|
|
ftruncate(*fd, len);
|
|
void *addr = mmap(NULL, len, PROT_READ | PROT_WRITE, MAP_SHARED, *fd, 0);
|
|
assert(addr != MAP_FAILED);
|
|
return addr;
|
|
}
|
|
|
|
VisionBuf visionbuf_allocate(size_t len) {
|
|
// const size_t alignment = 4096;
|
|
// void* addr = aligned_alloc(alignment, alignment * ((len - 1) / alignment + 1));
|
|
//void* addr = calloc(1, len);
|
|
|
|
int fd;
|
|
void *addr = malloc_with_fd(len, &fd);
|
|
|
|
return (VisionBuf){
|
|
.len = len, .addr = addr, .handle = 1, .fd = fd,
|
|
};
|
|
}
|
|
|
|
cl_mem visionbuf_to_cl(const VisionBuf* buf, cl_device_id device_id, cl_context ctx) {
|
|
// HACK because this platform is just for convenience
|
|
VisionBuf *w_buf = (VisionBuf*)buf;
|
|
cl_mem ret;
|
|
*w_buf = visionbuf_allocate_cl(buf->len, device_id, ctx, &ret);
|
|
return ret;
|
|
}
|
|
|
|
VisionBuf visionbuf_allocate_cl(size_t len, cl_device_id device_id, cl_context ctx, cl_mem *out_mem) {
|
|
int err;
|
|
assert(out_mem);
|
|
|
|
#if __OPENCL_VERSION__ >= 200
|
|
void* host_ptr =
|
|
clSVMAlloc(ctx, CL_MEM_READ_WRITE | CL_MEM_SVM_FINE_GRAIN_BUFFER, len, 0);
|
|
assert(host_ptr);
|
|
#else
|
|
int fd;
|
|
void* host_ptr = malloc_with_fd(len, &fd);
|
|
|
|
cl_command_queue q = clCreateCommandQueue(ctx, device_id, 0, &err);
|
|
assert(err == 0);
|
|
#endif
|
|
|
|
cl_mem mem = clCreateBuffer(ctx, CL_MEM_READ_WRITE | CL_MEM_USE_HOST_PTR, len, host_ptr, &err);
|
|
assert(err == 0);
|
|
|
|
*out_mem = mem;
|
|
|
|
return (VisionBuf){
|
|
.len = len, .addr = host_ptr, .handle = 0, .fd = fd,
|
|
.device_id = device_id, .ctx = ctx, .buf_cl = mem,
|
|
|
|
#if __OPENCL_VERSION__ < 200
|
|
.copy_q = q,
|
|
#endif
|
|
|
|
};
|
|
}
|
|
|
|
void visionbuf_sync(const VisionBuf* buf, int dir) {
|
|
int err = 0;
|
|
if (!buf->buf_cl) return;
|
|
|
|
#if __OPENCL_VERSION__ < 200
|
|
if (dir == VISIONBUF_SYNC_FROM_DEVICE) {
|
|
err = clEnqueueReadBuffer(buf->copy_q, buf->buf_cl, CL_FALSE, 0, buf->len, buf->addr, 0, NULL, NULL);
|
|
} else {
|
|
err = clEnqueueWriteBuffer(buf->copy_q, buf->buf_cl, CL_FALSE, 0, buf->len, buf->addr, 0, NULL, NULL);
|
|
}
|
|
assert(err == 0);
|
|
clFinish(buf->copy_q);
|
|
#endif
|
|
}
|
|
|
|
void visionbuf_free(const VisionBuf* buf) {
|
|
if (buf->handle) {
|
|
munmap(buf->addr, buf->len);
|
|
close(buf->fd);
|
|
} else {
|
|
int err = clReleaseMemObject(buf->buf_cl);
|
|
assert(err == 0);
|
|
#if __OPENCL_VERSION__ >= 200
|
|
clSVMFree(buf->ctx, buf->addr);
|
|
#else
|
|
munmap(buf->addr, buf->len);
|
|
close(buf->fd);
|
|
#endif
|
|
}
|
|
}
|
|
|