You can not select more than 25 topics
			Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
		
		
		
		
		
			
		
			
				
					
					
						
							111 lines
						
					
					
						
							2.8 KiB
						
					
					
				
			
		
		
	
	
							111 lines
						
					
					
						
							2.8 KiB
						
					
					
				| #include "visionbuf.h"
 | |
| 
 | |
| #include <stdio.h>
 | |
| #include <fcntl.h>
 | |
| #include <assert.h>
 | |
| #include <stdlib.h>
 | |
| #include <unistd.h>
 | |
| #include <sys/mman.h>
 | |
| #include <sys/types.h>
 | |
| 
 | |
| #define CL_USE_DEPRECATED_OPENCL_1_2_APIS
 | |
| #ifdef __APPLE__
 | |
| #include <OpenCL/cl.h>
 | |
| #else
 | |
| #include <CL/cl.h>
 | |
| #endif
 | |
| 
 | |
| int offset = 0;
 | |
| void *malloc_with_fd(size_t len, int *fd) {
 | |
|   char full_path[0x100];
 | |
|   snprintf(full_path, sizeof(full_path)-1, "/dev/shm/visionbuf_%d_%d", getpid(), offset++);
 | |
|   *fd = open(full_path, O_RDWR | O_CREAT, 0777);
 | |
|   unlink(full_path);
 | |
|   ftruncate(*fd, len);
 | |
|   void *addr = mmap(NULL, len, PROT_READ | PROT_WRITE, MAP_SHARED, *fd, 0);
 | |
|   return addr;
 | |
| }
 | |
| 
 | |
| VisionBuf visionbuf_allocate(size_t len) {
 | |
|   // const size_t alignment = 4096;
 | |
|   // void* addr = aligned_alloc(alignment, alignment * ((len - 1) / alignment + 1));
 | |
|   //void* addr = calloc(1, len);
 | |
| 
 | |
|   int fd;
 | |
|   void *addr = malloc_with_fd(len, &fd);
 | |
| 
 | |
|   return (VisionBuf){
 | |
|       .len = len, .addr = addr, .handle = 1, .fd = fd,
 | |
|   };
 | |
| }
 | |
| 
 | |
| cl_mem visionbuf_to_cl(const VisionBuf* buf, cl_device_id device_id, cl_context ctx) {
 | |
|   // HACK because this platform is just for convenience
 | |
|   VisionBuf *w_buf = (VisionBuf*)buf;
 | |
|   cl_mem ret;
 | |
|   *w_buf = visionbuf_allocate_cl(buf->len, device_id, ctx, &ret);
 | |
|   return ret;
 | |
| }
 | |
| 
 | |
| VisionBuf visionbuf_allocate_cl(size_t len, cl_device_id device_id, cl_context ctx, cl_mem *out_mem) {
 | |
|   int err;
 | |
|   assert(out_mem);
 | |
| 
 | |
| #if __OPENCL_VERSION__ >= 200
 | |
|   void* host_ptr =
 | |
|       clSVMAlloc(ctx, CL_MEM_READ_WRITE | CL_MEM_SVM_FINE_GRAIN_BUFFER, len, 0);
 | |
|   assert(host_ptr);
 | |
| #else
 | |
|   int fd;
 | |
|   void* host_ptr = malloc_with_fd(len, &fd);
 | |
| 
 | |
|   cl_command_queue q = clCreateCommandQueue(ctx, device_id, 0, &err);
 | |
|   assert(err == 0);
 | |
| #endif
 | |
| 
 | |
|   cl_mem mem = clCreateBuffer(ctx, CL_MEM_READ_WRITE | CL_MEM_USE_HOST_PTR, len, host_ptr, &err);
 | |
|   assert(err == 0);
 | |
| 
 | |
|   *out_mem = mem;
 | |
| 
 | |
|   return (VisionBuf){
 | |
|       .len = len, .addr = host_ptr, .handle = 0, .fd = fd,
 | |
|       .device_id = device_id, .ctx = ctx, .buf_cl = mem,
 | |
| 
 | |
| #if __OPENCL_VERSION__ < 200
 | |
|       .copy_q = q,
 | |
| #endif
 | |
| 
 | |
|   };
 | |
| }
 | |
| 
 | |
| void visionbuf_sync(const VisionBuf* buf, int dir) {
 | |
|   int err = 0;
 | |
|   if (!buf->buf_cl) return;
 | |
| 
 | |
| #if __OPENCL_VERSION__ < 200
 | |
|   if (dir == VISIONBUF_SYNC_FROM_DEVICE) {
 | |
|     err = clEnqueueReadBuffer(buf->copy_q, buf->buf_cl, CL_FALSE, 0, buf->len, buf->addr, 0, NULL, NULL);
 | |
|   } else {
 | |
|     err = clEnqueueWriteBuffer(buf->copy_q, buf->buf_cl, CL_FALSE, 0, buf->len, buf->addr, 0, NULL, NULL);
 | |
|   }
 | |
|   assert(err == 0);
 | |
|   clFinish(buf->copy_q);
 | |
| #endif
 | |
| }
 | |
| 
 | |
| void visionbuf_free(const VisionBuf* buf) {
 | |
|   if (buf->handle) {
 | |
|     munmap(buf->addr, buf->len);
 | |
|     close(buf->fd);
 | |
|   } else {
 | |
|     int err = clReleaseMemObject(buf->buf_cl);
 | |
|     assert(err == 0);
 | |
| #if __OPENCL_VERSION__ >= 200
 | |
|     clSVMFree(buf->ctx, buf->addr);
 | |
| #else
 | |
|     munmap(buf->addr, buf->len);
 | |
|     close(buf->fd);
 | |
| #endif
 | |
|   }
 | |
| }
 | |
| 
 |