You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
285 lines
9.1 KiB
285 lines
9.1 KiB
5 years ago
|
import os
|
||
|
import struct
|
||
|
import bisect
|
||
|
import numpy as np
|
||
|
import _io
|
||
|
|
||
|
import capnp
|
||
|
from cereal import log as capnp_log
|
||
|
|
||
|
class RawData():
|
||
|
def __init__(self, f):
|
||
|
self.f = _io.FileIO(f, 'rb')
|
||
|
self.lenn = struct.unpack("I", self.f.read(4))[0]
|
||
|
self.count = os.path.getsize(f) / (self.lenn+4)
|
||
|
|
||
|
def read(self, i):
|
||
|
self.f.seek((self.lenn+4)*i + 4)
|
||
|
return self.f.read(self.lenn)
|
||
|
|
||
|
def yuv420_to_rgb(raw, image_dim=None, swizzled=False):
|
||
|
def expand(x):
|
||
|
x = np.repeat(x, 2, axis=0)
|
||
|
return np.repeat(x, 2, axis=1)
|
||
|
|
||
|
if image_dim is None:
|
||
|
image_dim = (raw.shape[1]*2, raw.shape[2]*2)
|
||
|
swizzled = True
|
||
|
|
||
|
if not swizzled:
|
||
|
img_data = np.array(raw, copy=False, dtype=np.uint8)
|
||
|
uv_len = (image_dim[0]/2)*(image_dim[1]/2)
|
||
|
img_data_u = expand(img_data[image_dim[0]*image_dim[1]: \
|
||
|
image_dim[0]*image_dim[1]+uv_len]. \
|
||
|
reshape(image_dim[0]/2, image_dim[1]/2))
|
||
|
|
||
|
img_data_v = expand(img_data[image_dim[0]*image_dim[1]+uv_len: \
|
||
|
image_dim[0]*image_dim[1]+2*uv_len]. \
|
||
|
reshape(image_dim[0]/2, image_dim[1]/2))
|
||
|
img_data_y = img_data[0:image_dim[0]*image_dim[1]].reshape(image_dim)
|
||
|
else:
|
||
|
img_data_y = np.zeros(image_dim, dtype=np.uint8)
|
||
|
img_data_y[0::2, 0::2] = raw[0]
|
||
|
img_data_y[1::2, 0::2] = raw[1]
|
||
|
img_data_y[0::2, 1::2] = raw[2]
|
||
|
img_data_y[1::2, 1::2] = raw[3]
|
||
|
img_data_u = expand(raw[4])
|
||
|
img_data_v = expand(raw[5])
|
||
|
|
||
|
yuv = np.stack((img_data_y, img_data_u, img_data_v)).swapaxes(0,2).swapaxes(0,1)
|
||
|
yuv = yuv.astype(np.int16)
|
||
|
|
||
|
# http://maxsharabayko.blogspot.com/2016/01/fast-yuv-to-rgb-conversion-in-python-3.html
|
||
|
# according to ITU-R BT.709
|
||
|
yuv[:,:, 0] = yuv[:,:, 0].clip(16, 235).astype(yuv.dtype) - 16
|
||
|
yuv[:,:,1:] = yuv[:,:,1:].clip(16, 240).astype(yuv.dtype) - 128
|
||
|
|
||
|
A = np.array([[1.164, 0.000, 1.793],
|
||
|
[1.164, -0.213, -0.533],
|
||
|
[1.164, 2.112, 0.000]])
|
||
|
|
||
|
# our result
|
||
|
img = np.dot(yuv, A.T).clip(0, 255).astype('uint8')
|
||
|
return img
|
||
|
|
||
|
|
||
|
class YuvData():
|
||
|
def __init__(self, f, dim=(160,320)):
|
||
|
self.f = _io.FileIO(f, 'rb')
|
||
|
self.image_dim = dim
|
||
|
self.image_size = self.image_dim[0]/2 * self.image_dim[1]/2 * 6
|
||
|
self.count = os.path.getsize(f) / self.image_size
|
||
|
|
||
|
def read_frame(self, frame):
|
||
|
self.f.seek(self.image_size*frame)
|
||
|
raw = self.f.read(self.image_size)
|
||
|
return raw
|
||
|
|
||
|
def read_frames(self, range_start, range_len):
|
||
|
self.f.seek(self.image_size*range_start)
|
||
|
raw = self.f.read(self.image_size*range_len)
|
||
|
return raw
|
||
|
|
||
|
def read_frames_into(self, range_start, buf):
|
||
|
self.f.seek(self.image_size*range_start)
|
||
|
return self.f.readinto(buf)
|
||
|
|
||
|
def read(self, frame):
|
||
|
return yuv420_to_rgb(self.read_frame(frame), self.image_dim)
|
||
|
|
||
|
def close(self):
|
||
|
self.f.close()
|
||
|
|
||
|
def __enter__(self):
|
||
|
return self
|
||
|
|
||
|
def __exit__(self, type, value, traceback):
|
||
|
self.close()
|
||
|
|
||
|
|
||
|
|
||
|
class OneReader():
|
||
|
def __init__(self, base_path, goofy=False, segment_range=None):
|
||
|
self.base_path = base_path
|
||
|
|
||
|
route_name = os.path.basename(base_path)
|
||
|
|
||
|
self.rcamera_size = (304, 560)
|
||
|
|
||
|
if segment_range is None:
|
||
|
parent_path = os.path.dirname(base_path)
|
||
|
self.segment_nums = []
|
||
|
for p in os.listdir(parent_path):
|
||
|
if not p.startswith(route_name+"--"):
|
||
|
continue
|
||
|
self.segment_nums.append(int(p.rsplit("--", 1)[-1]))
|
||
|
if not self.segment_nums:
|
||
|
raise Exception("no route segments found")
|
||
|
self.segment_nums.sort()
|
||
|
self.segment_range = (self.segment_nums[0], self.segment_nums[-1])
|
||
|
else:
|
||
|
self.segment_range = segment_range
|
||
|
self.segment_nums = range(segment_range[0], segment_range[1]+1)
|
||
|
for i in self.segment_nums:
|
||
|
if not os.path.exists(base_path+"--"+str(i)):
|
||
|
raise Exception("missing segment in provided range")
|
||
|
|
||
|
# goofy data is broken with discontinuous logs
|
||
|
if goofy and (self.segment_range[0] != 0
|
||
|
or self.segment_nums != range(self.segment_range[0], self.segment_range[1]+1)):
|
||
|
raise Exception("goofy data needs all the segments for a route")
|
||
|
|
||
|
self.cur_seg = None
|
||
|
self.cur_seg_f = None
|
||
|
|
||
|
# index the frames
|
||
|
print("indexing frames {}...".format(self.segment_nums))
|
||
|
|
||
|
self.rcamera_encode_map = {} # frame_id -> (segment num, segment id, frame_time)
|
||
|
last_frame_id = -1
|
||
|
|
||
|
if goofy:
|
||
|
# goofy is goofy
|
||
|
|
||
|
frame_size = self.rcamera_size[0]*self.rcamera_size[1]*3/2
|
||
|
|
||
|
# find the encode id ranges for each segment by using the rcamera file size
|
||
|
segment_encode_ids = []
|
||
|
cur_encode_id = 0
|
||
|
for n in self.segment_nums:
|
||
|
camera_path = os.path.join(self.seg_path(n), "rcamera")
|
||
|
if not os.path.exists(camera_path):
|
||
|
# for goofy, missing camera files means a bad route
|
||
|
raise Exception("Missing camera file {}".format(camera_path))
|
||
|
camera_size = os.path.getsize(camera_path)
|
||
|
assert (camera_size % frame_size) == 0
|
||
|
|
||
|
num_frames = camera_size / frame_size
|
||
|
segment_encode_ids.append(cur_encode_id)
|
||
|
cur_encode_id += num_frames
|
||
|
|
||
|
last_encode_id = -1
|
||
|
# use the segment encode id map and frame events to build the frame index
|
||
|
for n in self.segment_nums:
|
||
|
log_path = os.path.join(self.seg_path(n), "rlog")
|
||
|
if os.path.exists(log_path):
|
||
|
with open(log_path, "rb") as f:
|
||
|
for evt in capnp_log.Event.read_multiple(f):
|
||
|
if evt.which() == 'frame':
|
||
|
|
||
|
if evt.frame.frameId < last_frame_id:
|
||
|
# a non-increasing frame id is bad route (eg visiond was restarted)
|
||
|
raise Exception("non-increasing frame id")
|
||
|
last_frame_id = evt.frame.frameId
|
||
|
|
||
|
seg_i = bisect.bisect_right(segment_encode_ids, evt.frame.encodeId)-1
|
||
|
assert seg_i >= 0
|
||
|
seg_num = self.segment_nums[seg_i]
|
||
|
seg_id = evt.frame.encodeId-segment_encode_ids[seg_i]
|
||
|
frame_time = evt.logMonoTime / 1.0e9
|
||
|
|
||
|
self.rcamera_encode_map[evt.frame.frameId] = (seg_num, seg_id,
|
||
|
frame_time)
|
||
|
|
||
|
last_encode_id = evt.frame.encodeId
|
||
|
|
||
|
if last_encode_id-cur_encode_id > 10:
|
||
|
# too many missing frames is a bad route (eg route from before encoder rotating worked)
|
||
|
raise Exception("goofy route is missing frames: {}, {}".format(
|
||
|
last_encode_id, cur_encode_id))
|
||
|
|
||
|
else:
|
||
|
# for harry data, build the index from encodeIdx events
|
||
|
for n in self.segment_nums:
|
||
|
log_path = os.path.join(self.seg_path(n), "rlog")
|
||
|
if os.path.exists(log_path):
|
||
|
with open(log_path, "rb") as f:
|
||
|
for evt in capnp_log.Event.read_multiple(f):
|
||
|
if evt.which() == 'encodeIdx' and evt.encodeIdx.type == 'bigBoxLossless':
|
||
|
frame_time = evt.logMonoTime / 1.0e9
|
||
|
self.rcamera_encode_map[evt.encodeIdx.frameId] = (
|
||
|
evt.encodeIdx.segmentNum, evt.encodeIdx.segmentId,
|
||
|
frame_time)
|
||
|
|
||
|
print("done")
|
||
|
|
||
|
# read the first event to find the start time
|
||
|
self.reset_to_seg(self.segment_range[0])
|
||
|
for evt in self.events():
|
||
|
if evt.which() != 'initData':
|
||
|
self.start_mono = evt.logMonoTime
|
||
|
break
|
||
|
self.reset_to_seg(self.segment_range[0])
|
||
|
|
||
|
|
||
|
def seg_path(self, num):
|
||
|
return self.base_path+"--"+str(num)
|
||
|
|
||
|
def reset_to_seg(self, seg):
|
||
|
self.cur_seg = seg
|
||
|
if self.cur_seg_f:
|
||
|
self.cur_seg_f.close()
|
||
|
self.cur_seg_f = None
|
||
|
|
||
|
def seek_ts(self, ts):
|
||
|
seek_seg = int(ts/60)
|
||
|
if seek_seg < self.segment_range[0] or seek_seg > self.segment_range[1]:
|
||
|
raise ValueError
|
||
|
|
||
|
self.reset_to_seg(seek_seg)
|
||
|
target_mono = self.start_mono + int(ts*1e9)
|
||
|
for evt in self.events():
|
||
|
if evt.logMonoTime >= target_mono:
|
||
|
break
|
||
|
|
||
|
def read_event(self):
|
||
|
while True:
|
||
|
if self.cur_seg > self.segment_range[1]:
|
||
|
return None
|
||
|
if self.cur_seg_f is None:
|
||
|
log_path = os.path.join(self.seg_path(self.cur_seg), "rlog")
|
||
|
if not os.path.exists(log_path):
|
||
|
print("missing log file!", log_path)
|
||
|
self.cur_seg += 1
|
||
|
continue
|
||
|
self.cur_seg_f = open(log_path, "rb")
|
||
|
|
||
|
try:
|
||
|
return capnp_log.Event.read(self.cur_seg_f)
|
||
|
except capnp.lib.capnp.KjException as e:
|
||
|
if 'EOF' in str(e): # dumb, but pycapnp does this too
|
||
|
self.cur_seg_f.close()
|
||
|
self.cur_seg_f = None
|
||
|
self.cur_seg += 1
|
||
|
else:
|
||
|
raise
|
||
|
|
||
|
def events(self):
|
||
|
while True:
|
||
|
r = self.read_event()
|
||
|
if r is None:
|
||
|
break
|
||
|
yield r
|
||
|
|
||
|
def read_frame(self, frame_id):
|
||
|
encode_idx = self.rcamera_encode_map.get(frame_id)
|
||
|
if encode_idx is None:
|
||
|
return None
|
||
|
|
||
|
seg_num, seg_id, _ = encode_idx
|
||
|
camera_path = os.path.join(self.seg_path(seg_num), "rcamera")
|
||
|
if not os.path.exists(camera_path):
|
||
|
return None
|
||
|
with YuvData(camera_path, self.rcamera_size) as data:
|
||
|
return data.read_frame(seg_id)
|
||
|
|
||
|
def close(self):
|
||
|
if self.cur_seg_f is not None:
|
||
|
self.cur_seg_f.close()
|
||
|
|
||
|
def __enter__(self):
|
||
|
return self
|
||
|
|
||
|
def __exit__(self, type, value, traceback):
|
||
|
self.close()
|