You can not select more than 25 topics
			Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
		
		
		
		
		
			
		
			
				
					
					
						
							284 lines
						
					
					
						
							9.1 KiB
						
					
					
				
			
		
		
	
	
							284 lines
						
					
					
						
							9.1 KiB
						
					
					
				| import os
 | |
| import struct
 | |
| import bisect
 | |
| import numpy as np
 | |
| import _io
 | |
| 
 | |
| import capnp
 | |
| from cereal import log as capnp_log
 | |
| 
 | |
| class RawData():
 | |
|   def __init__(self, f):
 | |
|     self.f = _io.FileIO(f, 'rb')
 | |
|     self.lenn = struct.unpack("I", self.f.read(4))[0]
 | |
|     self.count = os.path.getsize(f) / (self.lenn+4)
 | |
| 
 | |
|   def read(self, i):
 | |
|     self.f.seek((self.lenn+4)*i + 4)
 | |
|     return self.f.read(self.lenn)
 | |
| 
 | |
| def yuv420_to_rgb(raw, image_dim=None, swizzled=False):
 | |
|   def expand(x):
 | |
|     x = np.repeat(x, 2, axis=0)
 | |
|     return np.repeat(x, 2, axis=1)
 | |
| 
 | |
|   if image_dim is None:
 | |
|     image_dim = (raw.shape[1]*2, raw.shape[2]*2)
 | |
|     swizzled = True
 | |
| 
 | |
|   if not swizzled:
 | |
|     img_data = np.array(raw, copy=False, dtype=np.uint8)
 | |
|     uv_len = (image_dim[0]/2)*(image_dim[1]/2)
 | |
|     img_data_u = expand(img_data[image_dim[0]*image_dim[1]: \
 | |
|                                  image_dim[0]*image_dim[1]+uv_len]. \
 | |
|                                  reshape(image_dim[0]/2, image_dim[1]/2))
 | |
| 
 | |
|     img_data_v = expand(img_data[image_dim[0]*image_dim[1]+uv_len: \
 | |
|                                  image_dim[0]*image_dim[1]+2*uv_len]. \
 | |
|                                  reshape(image_dim[0]/2, image_dim[1]/2))
 | |
|     img_data_y = img_data[0:image_dim[0]*image_dim[1]].reshape(image_dim)
 | |
|   else:
 | |
|     img_data_y = np.zeros(image_dim, dtype=np.uint8)
 | |
|     img_data_y[0::2, 0::2] = raw[0]
 | |
|     img_data_y[1::2, 0::2] = raw[1]
 | |
|     img_data_y[0::2, 1::2] = raw[2]
 | |
|     img_data_y[1::2, 1::2] = raw[3]
 | |
|     img_data_u = expand(raw[4])
 | |
|     img_data_v = expand(raw[5])
 | |
| 
 | |
|   yuv = np.stack((img_data_y, img_data_u, img_data_v)).swapaxes(0,2).swapaxes(0,1)
 | |
|   yuv = yuv.astype(np.int16)
 | |
| 
 | |
|   # http://maxsharabayko.blogspot.com/2016/01/fast-yuv-to-rgb-conversion-in-python-3.html
 | |
|   # according to ITU-R BT.709
 | |
|   yuv[:,:, 0] = yuv[:,:, 0].clip(16, 235).astype(yuv.dtype) - 16
 | |
|   yuv[:,:,1:] = yuv[:,:,1:].clip(16, 240).astype(yuv.dtype) - 128
 | |
| 
 | |
|   A = np.array([[1.164,  0.000,  1.793],
 | |
|                 [1.164, -0.213, -0.533],
 | |
|                 [1.164,  2.112,  0.000]])
 | |
| 
 | |
|   # our result
 | |
|   img = np.dot(yuv, A.T).clip(0, 255).astype('uint8')
 | |
|   return img
 | |
| 
 | |
| 
 | |
| class YuvData():
 | |
|   def __init__(self, f, dim=(160,320)):
 | |
|     self.f = _io.FileIO(f, 'rb')
 | |
|     self.image_dim = dim
 | |
|     self.image_size = self.image_dim[0]/2 * self.image_dim[1]/2 * 6
 | |
|     self.count = os.path.getsize(f) / self.image_size
 | |
| 
 | |
|   def read_frame(self, frame):
 | |
|     self.f.seek(self.image_size*frame)
 | |
|     raw = self.f.read(self.image_size)
 | |
|     return raw
 | |
| 
 | |
|   def read_frames(self, range_start, range_len):
 | |
|     self.f.seek(self.image_size*range_start)
 | |
|     raw = self.f.read(self.image_size*range_len)
 | |
|     return raw
 | |
| 
 | |
|   def read_frames_into(self, range_start, buf):
 | |
|     self.f.seek(self.image_size*range_start)
 | |
|     return self.f.readinto(buf)
 | |
| 
 | |
|   def read(self, frame):
 | |
|     return yuv420_to_rgb(self.read_frame(frame), self.image_dim)
 | |
| 
 | |
|   def close(self):
 | |
|     self.f.close()
 | |
| 
 | |
|   def __enter__(self):
 | |
|     return self
 | |
| 
 | |
|   def __exit__(self, type, value, traceback):
 | |
|     self.close()
 | |
| 
 | |
| 
 | |
| 
 | |
| class OneReader():
 | |
|   def __init__(self, base_path, goofy=False, segment_range=None):
 | |
|     self.base_path = base_path
 | |
| 
 | |
|     route_name = os.path.basename(base_path)
 | |
| 
 | |
|     self.rcamera_size = (304, 560)
 | |
| 
 | |
|     if segment_range is None:
 | |
|       parent_path = os.path.dirname(base_path)
 | |
|       self.segment_nums = []
 | |
|       for p in os.listdir(parent_path):
 | |
|         if not p.startswith(route_name+"--"):
 | |
|           continue
 | |
|         self.segment_nums.append(int(p.rsplit("--", 1)[-1]))
 | |
|       if not self.segment_nums:
 | |
|         raise Exception("no route segments found")
 | |
|       self.segment_nums.sort()
 | |
|       self.segment_range = (self.segment_nums[0], self.segment_nums[-1])
 | |
|     else:
 | |
|       self.segment_range = segment_range
 | |
|       self.segment_nums = range(segment_range[0], segment_range[1]+1)
 | |
|       for i in self.segment_nums:
 | |
|         if not os.path.exists(base_path+"--"+str(i)):
 | |
|           raise Exception("missing segment in provided range")
 | |
| 
 | |
|     # goofy data is broken with discontinuous logs
 | |
|     if goofy and (self.segment_range[0] != 0
 | |
|         or self.segment_nums != range(self.segment_range[0], self.segment_range[1]+1)):
 | |
|       raise Exception("goofy data needs all the segments for a route")
 | |
| 
 | |
|     self.cur_seg = None
 | |
|     self.cur_seg_f = None
 | |
| 
 | |
|     # index the frames
 | |
|     print("indexing frames {}...".format(self.segment_nums))
 | |
| 
 | |
|     self.rcamera_encode_map = {} # frame_id -> (segment num, segment id, frame_time)
 | |
|     last_frame_id = -1
 | |
| 
 | |
|     if goofy:
 | |
|       # goofy is goofy
 | |
| 
 | |
|       frame_size = self.rcamera_size[0]*self.rcamera_size[1]*3/2
 | |
| 
 | |
|       # find the encode id ranges for each segment by using the rcamera file size
 | |
|       segment_encode_ids = []
 | |
|       cur_encode_id = 0
 | |
|       for n in self.segment_nums:
 | |
|         camera_path = os.path.join(self.seg_path(n), "rcamera")
 | |
|         if not os.path.exists(camera_path):
 | |
|           # for goofy, missing camera files means a bad route
 | |
|           raise Exception("Missing camera file {}".format(camera_path))
 | |
|         camera_size = os.path.getsize(camera_path)
 | |
|         assert (camera_size % frame_size) == 0
 | |
| 
 | |
|         num_frames = camera_size / frame_size
 | |
|         segment_encode_ids.append(cur_encode_id)
 | |
|         cur_encode_id += num_frames
 | |
| 
 | |
|       last_encode_id = -1
 | |
|       # use the segment encode id map and frame events to build the frame index
 | |
|       for n in self.segment_nums:
 | |
|         log_path = os.path.join(self.seg_path(n), "rlog")
 | |
|         if os.path.exists(log_path):
 | |
|           with open(log_path, "rb") as f:
 | |
|             for evt in capnp_log.Event.read_multiple(f):
 | |
|               if evt.which() == 'frame':
 | |
| 
 | |
|                 if evt.frame.frameId < last_frame_id:
 | |
|                   # a non-increasing frame id is bad route (eg visiond was restarted)
 | |
|                   raise Exception("non-increasing frame id")
 | |
|                 last_frame_id = evt.frame.frameId
 | |
| 
 | |
|                 seg_i = bisect.bisect_right(segment_encode_ids, evt.frame.encodeId)-1
 | |
|                 assert seg_i >= 0
 | |
|                 seg_num = self.segment_nums[seg_i]
 | |
|                 seg_id = evt.frame.encodeId-segment_encode_ids[seg_i]
 | |
|                 frame_time = evt.logMonoTime / 1.0e9
 | |
| 
 | |
|                 self.rcamera_encode_map[evt.frame.frameId] = (seg_num, seg_id,
 | |
|                                                               frame_time)
 | |
| 
 | |
|                 last_encode_id = evt.frame.encodeId
 | |
| 
 | |
|       if last_encode_id-cur_encode_id > 10:
 | |
|         # too many missing frames is a bad route (eg route from before encoder rotating worked)
 | |
|         raise Exception("goofy route is missing frames: {}, {}".format(
 | |
|           last_encode_id, cur_encode_id))
 | |
| 
 | |
|     else:
 | |
|       # for harry data, build the index from encodeIdx events
 | |
|       for n in self.segment_nums:
 | |
|         log_path = os.path.join(self.seg_path(n), "rlog")
 | |
|         if os.path.exists(log_path):
 | |
|           with open(log_path, "rb") as f:
 | |
|             for evt in capnp_log.Event.read_multiple(f):
 | |
|               if evt.which() == 'encodeIdx' and evt.encodeIdx.type == 'bigBoxLossless':
 | |
|                 frame_time = evt.logMonoTime / 1.0e9
 | |
|                 self.rcamera_encode_map[evt.encodeIdx.frameId] = (
 | |
|                   evt.encodeIdx.segmentNum, evt.encodeIdx.segmentId,
 | |
|                   frame_time)
 | |
| 
 | |
|     print("done")
 | |
| 
 | |
|     # read the first event to find the start time
 | |
|     self.reset_to_seg(self.segment_range[0])
 | |
|     for evt in self.events():
 | |
|       if evt.which() != 'initData':
 | |
|         self.start_mono = evt.logMonoTime
 | |
|         break
 | |
|     self.reset_to_seg(self.segment_range[0])
 | |
| 
 | |
| 
 | |
|   def seg_path(self, num):
 | |
|     return self.base_path+"--"+str(num)
 | |
| 
 | |
|   def reset_to_seg(self, seg):
 | |
|     self.cur_seg = seg
 | |
|     if self.cur_seg_f:
 | |
|       self.cur_seg_f.close()
 | |
|       self.cur_seg_f = None
 | |
| 
 | |
|   def seek_ts(self, ts):
 | |
|     seek_seg = int(ts/60)
 | |
|     if seek_seg < self.segment_range[0] or seek_seg > self.segment_range[1]:
 | |
|       raise ValueError
 | |
| 
 | |
|     self.reset_to_seg(seek_seg)
 | |
|     target_mono = self.start_mono + int(ts*1e9)
 | |
|     for evt in self.events():
 | |
|       if evt.logMonoTime >= target_mono:
 | |
|         break
 | |
| 
 | |
|   def read_event(self):
 | |
|     while True:
 | |
|       if self.cur_seg > self.segment_range[1]:
 | |
|         return None
 | |
|       if self.cur_seg_f is None:
 | |
|         log_path = os.path.join(self.seg_path(self.cur_seg), "rlog")
 | |
|         if not os.path.exists(log_path):
 | |
|           print("missing log file!", log_path)
 | |
|           self.cur_seg += 1
 | |
|           continue
 | |
|         self.cur_seg_f = open(log_path, "rb")
 | |
| 
 | |
|       try:
 | |
|         return capnp_log.Event.read(self.cur_seg_f)
 | |
|       except capnp.lib.capnp.KjException as e:
 | |
|         if 'EOF' in str(e): # dumb, but pycapnp does this too
 | |
|           self.cur_seg_f.close()
 | |
|           self.cur_seg_f = None
 | |
|           self.cur_seg += 1
 | |
|         else:
 | |
|           raise
 | |
| 
 | |
|   def events(self):
 | |
|     while True:
 | |
|       r = self.read_event()
 | |
|       if r is None:
 | |
|         break
 | |
|       yield r
 | |
| 
 | |
|   def read_frame(self, frame_id):
 | |
|     encode_idx = self.rcamera_encode_map.get(frame_id)
 | |
|     if encode_idx is None:
 | |
|       return None
 | |
| 
 | |
|     seg_num, seg_id, _ = encode_idx
 | |
|     camera_path = os.path.join(self.seg_path(seg_num), "rcamera")
 | |
|     if not os.path.exists(camera_path):
 | |
|       return None
 | |
|     with YuvData(camera_path, self.rcamera_size) as data:
 | |
|       return data.read_frame(seg_id)
 | |
| 
 | |
|   def close(self):
 | |
|     if self.cur_seg_f is not None:
 | |
|       self.cur_seg_f.close()
 | |
| 
 | |
|   def __enter__(self):
 | |
|     return self
 | |
| 
 | |
|   def __exit__(self, type, value, traceback):
 | |
|     self.close()
 | |
| 
 |