|  |  | @ -6,6 +6,14 @@ | 
			
		
	
		
		
			
				
					
					|  |  |  | 
 |  |  |  | 
 | 
			
		
	
		
		
			
				
					
					|  |  |  | #include "cereal/visionipc/visionbuf.h" |  |  |  | #include "cereal/visionipc/visionbuf.h" | 
			
		
	
		
		
			
				
					
					|  |  |  | 
 |  |  |  | 
 | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  | #ifdef __APPLE__ | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  | #define HW_DEVICE_TYPE AV_HWDEVICE_TYPE_VIDEOTOOLBOX | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  | #define HW_PIX_FMT AV_PIX_FMT_VIDEOTOOLBOX | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  | #else | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  | #define HW_DEVICE_TYPE AV_HWDEVICE_TYPE_CUDA | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  | #define HW_PIX_FMT AV_PIX_FMT_CUDA | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  | #endif | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  | 
 | 
			
		
	
		
		
			
				
					
					|  |  |  | namespace { |  |  |  | namespace { | 
			
		
	
		
		
			
				
					
					|  |  |  | 
 |  |  |  | 
 | 
			
		
	
		
		
			
				
					
					|  |  |  | struct buffer_data { |  |  |  | struct buffer_data { | 
			
		
	
	
		
		
			
				
					|  |  | @ -30,7 +38,7 @@ enum AVPixelFormat get_hw_format(AVCodecContext *ctx, const enum AVPixelFormat * | 
			
		
	
		
		
			
				
					
					|  |  |  |   for (const enum AVPixelFormat *p = pix_fmts; *p != -1; p++) { |  |  |  |   for (const enum AVPixelFormat *p = pix_fmts; *p != -1; p++) { | 
			
		
	
		
		
			
				
					
					|  |  |  |     if (*p == *hw_pix_fmt) return *p; |  |  |  |     if (*p == *hw_pix_fmt) return *p; | 
			
		
	
		
		
			
				
					
					|  |  |  |   } |  |  |  |   } | 
			
		
	
		
		
			
				
					
					|  |  |  |   rWarning("Please run replay with the --no-cuda flag!"); |  |  |  |   rWarning("Please run replay with the --no-hw-decoder flag!"); | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  |   // fallback to YUV420p
 |  |  |  |   // fallback to YUV420p
 | 
			
		
	
		
		
			
				
					
					|  |  |  |   *hw_pix_fmt = AV_PIX_FMT_NONE; |  |  |  |   *hw_pix_fmt = AV_PIX_FMT_NONE; | 
			
		
	
		
		
			
				
					
					|  |  |  |   return AV_PIX_FMT_YUV420P; |  |  |  |   return AV_PIX_FMT_YUV420P; | 
			
		
	
	
		
		
			
				
					|  |  | @ -57,15 +65,15 @@ FrameReader::~FrameReader() { | 
			
		
	
		
		
			
				
					
					|  |  |  |   } |  |  |  |   } | 
			
		
	
		
		
			
				
					
					|  |  |  | } |  |  |  | } | 
			
		
	
		
		
			
				
					
					|  |  |  | 
 |  |  |  | 
 | 
			
		
	
		
		
			
				
					
					|  |  |  | bool FrameReader::load(const std::string &url, bool no_cuda, std::atomic<bool> *abort, bool local_cache, int chunk_size, int retries) { |  |  |  | bool FrameReader::load(const std::string &url, bool no_hw_decoder, std::atomic<bool> *abort, bool local_cache, int chunk_size, int retries) { | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  |   FileReader f(local_cache, chunk_size, retries); |  |  |  |   FileReader f(local_cache, chunk_size, retries); | 
			
		
	
		
		
			
				
					
					|  |  |  |   std::string data = f.read(url, abort); |  |  |  |   std::string data = f.read(url, abort); | 
			
		
	
		
		
			
				
					
					|  |  |  |   if (data.empty()) return false; |  |  |  |   if (data.empty()) return false; | 
			
		
	
		
		
			
				
					
					|  |  |  | 
 |  |  |  | 
 | 
			
		
	
		
		
			
				
					
					|  |  |  |   return load((std::byte *)data.data(), data.size(), no_cuda, abort); |  |  |  |   return load((std::byte *)data.data(), data.size(), no_hw_decoder, abort); | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  | } |  |  |  | } | 
			
		
	
		
		
			
				
					
					|  |  |  | 
 |  |  |  | 
 | 
			
		
	
		
		
			
				
					
					|  |  |  | bool FrameReader::load(const std::byte *data, size_t size, bool no_cuda, std::atomic<bool> *abort) { |  |  |  | bool FrameReader::load(const std::byte *data, size_t size, bool no_hw_decoder, std::atomic<bool> *abort) { | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  |   input_ctx = avformat_alloc_context(); |  |  |  |   input_ctx = avformat_alloc_context(); | 
			
		
	
		
		
			
				
					
					|  |  |  |   if (!input_ctx) return false; |  |  |  |   if (!input_ctx) return false; | 
			
		
	
		
		
			
				
					
					|  |  |  | 
 |  |  |  | 
 | 
			
		
	
	
		
		
			
				
					|  |  | @ -106,9 +114,9 @@ bool FrameReader::load(const std::byte *data, size_t size, bool no_cuda, std::at | 
			
		
	
		
		
			
				
					
					|  |  |  |   height = decoder_ctx->height; |  |  |  |   height = decoder_ctx->height; | 
			
		
	
		
		
			
				
					
					|  |  |  |   visionbuf_compute_aligned_width_and_height(width, height, &aligned_width, &aligned_height); |  |  |  |   visionbuf_compute_aligned_width_and_height(width, height, &aligned_width, &aligned_height); | 
			
		
	
		
		
			
				
					
					|  |  |  | 
 |  |  |  | 
 | 
			
		
	
		
		
			
				
					
					|  |  |  |   if (has_cuda_device && !no_cuda) { |  |  |  |   if (has_hw_decoder && !no_hw_decoder) { | 
			
				
				
			
		
	
		
		
			
				
					
					|  |  |  |     if (!initHardwareDecoder(AV_HWDEVICE_TYPE_CUDA)) { |  |  |  |     if (!initHardwareDecoder(HW_DEVICE_TYPE)) { | 
			
				
				
			
		
	
		
		
			
				
					
					|  |  |  |       rWarning("No CUDA capable device was found. fallback to CPU decoding."); |  |  |  |       rWarning("No device with hardware decoder found. fallback to CPU decoding."); | 
			
				
				
			
		
	
		
		
	
		
		
	
		
		
	
		
		
			
				
					
					|  |  |  |     } else { |  |  |  |     } else { | 
			
		
	
		
		
			
				
					
					|  |  |  |       nv12toyuv_buffer.resize(getYUVSize()); |  |  |  |       nv12toyuv_buffer.resize(getYUVSize()); | 
			
		
	
		
		
			
				
					
					|  |  |  |     } |  |  |  |     } | 
			
		
	
	
		
		
			
				
					|  |  | @ -151,7 +159,7 @@ bool FrameReader::initHardwareDecoder(AVHWDeviceType hw_device_type) { | 
			
		
	
		
		
			
				
					
					|  |  |  |   int ret = av_hwdevice_ctx_create(&hw_device_ctx, hw_device_type, nullptr, nullptr, 0); |  |  |  |   int ret = av_hwdevice_ctx_create(&hw_device_ctx, hw_device_type, nullptr, nullptr, 0); | 
			
		
	
		
		
			
				
					
					|  |  |  |   if (ret < 0) { |  |  |  |   if (ret < 0) { | 
			
		
	
		
		
			
				
					
					|  |  |  |     hw_pix_fmt = AV_PIX_FMT_NONE; |  |  |  |     hw_pix_fmt = AV_PIX_FMT_NONE; | 
			
		
	
		
		
			
				
					
					|  |  |  |     has_cuda_device = false; |  |  |  |     has_hw_decoder = false; | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  |     rWarning("Failed to create specified HW device %d.", ret); |  |  |  |     rWarning("Failed to create specified HW device %d.", ret); | 
			
		
	
		
		
			
				
					
					|  |  |  |     return false; |  |  |  |     return false; | 
			
		
	
		
		
			
				
					
					|  |  |  |   } |  |  |  |   } | 
			
		
	
	
		
		
			
				
					|  |  | @ -219,7 +227,7 @@ AVFrame *FrameReader::decodeFrame(AVPacket *pkt) { | 
			
		
	
		
		
			
				
					
					|  |  |  | } |  |  |  | } | 
			
		
	
		
		
			
				
					
					|  |  |  | 
 |  |  |  | 
 | 
			
		
	
		
		
			
				
					
					|  |  |  | bool FrameReader::copyBuffers(AVFrame *f, uint8_t *rgb, uint8_t *yuv) { |  |  |  | bool FrameReader::copyBuffers(AVFrame *f, uint8_t *rgb, uint8_t *yuv) { | 
			
		
	
		
		
			
				
					
					|  |  |  |   if (hw_pix_fmt == AV_PIX_FMT_CUDA) { |  |  |  |   if (hw_pix_fmt == HW_PIX_FMT) { | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  |     uint8_t *y = yuv ? yuv : nv12toyuv_buffer.data(); |  |  |  |     uint8_t *y = yuv ? yuv : nv12toyuv_buffer.data(); | 
			
		
	
		
		
			
				
					
					|  |  |  |     uint8_t *u = y + width * height; |  |  |  |     uint8_t *u = y + width * height; | 
			
		
	
		
		
			
				
					
					|  |  |  |     uint8_t *v = u + (width / 2) * (height / 2); |  |  |  |     uint8_t *v = u + (width / 2) * (height / 2); | 
			
		
	
	
		
		
			
				
					|  |  | 
 |