|
|
|
|
|
|
|
# Dataset-level constants shared by the pipelines and dataloaders below.
# Registry name of the dataset class to instantiate.
dataset_type = 'WaymoDataset'
# Root directory that `ann_file` and `data_prefix` entries are joined to.
data_root = 'data/waymo/kitti_format/'
# Detection categories; also exported to the datasets through `metainfo`.
class_names = ['Car', 'Pedestrian', 'Cyclist']
# Camera-only setup: LiDAR input is disabled.
input_modality = dict(use_lidar=False, use_camera=True)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
# File-backend settings forwarded to every loader, dataset and evaluator in
# this config. `None` leaves the choice to each component's own default.
backend_args = None

# Training-time transforms, applied in order to each sample.
train_pipeline = [
    dict(type='LoadImageFromFileMono3D', backend_args=backend_args),
    dict(
        type='LoadAnnotations3D',
        with_bbox=True,
        with_label=True,
        with_attr_label=False,
        with_bbox_3d=True,
        with_label_3d=True,
        with_bbox_depth=True),
    # Base shape (1248, 832), jittered by a random ratio in [0.95, 1.05].
    # The base shape must match the one used by test_pipeline/eval_pipeline;
    # the previous value (1284, 832) had two digits transposed.
    dict(
        type='RandomResize3D',
        scale=(1248, 832),
        ratio_range=(0.95, 1.05),
        keep_ratio=True,
    ),
    dict(type='RandomFlip3D', flip_ratio_bev_horizontal=0.5),
    # Collect the image and the 2D/3D targets into the packed model input.
    dict(
        type='Pack3DDetInputs',
        keys=[
            'img', 'gt_bboxes', 'gt_bboxes_labels', 'gt_bboxes_3d',
            'gt_labels_3d', 'centers_2d', 'depths'
        ]),
]
|
|
|
# Inference-time transforms: load the image, resize it to the fixed base
# shape and pack only the image (no annotations are loaded).
test_pipeline = [
    dict(type='LoadImageFromFileMono3D', backend_args=backend_args),
    # ratio_range=(1., 1.) pins the resize ratio, so no random jitter is
    # applied even though the transform is the "random" resize.
    dict(
        type='RandomResize3D',
        scale=(1248, 832),
        ratio_range=(1., 1.),
        keep_ratio=True),
    dict(type='Pack3DDetInputs', keys=['img']),
]
|
|
|
|
|
# Evaluation-time transforms used by the val and test dataloaders in this
# file: load the image, resize it to the fixed base shape, pack the image.
eval_pipeline = [
    dict(type='LoadImageFromFileMono3D', backend_args=backend_args),
    # ratio_range=(1., 1.) pins the resize ratio, so the output size is
    # deterministic.
    dict(
        type='RandomResize3D',
        scale=(1248, 832),
        ratio_range=(1., 1.),
        keep_ratio=True),
    dict(type='Pack3DDetInputs', keys=['img']),
]
|
|
|
# Dataset meta information handed to every dataset below; carries the class
# list declared in `class_names`.
metainfo = dict(classes=class_names)
|
|
|
# Training dataloader: shuffled sampling over the train annotation file.
train_dataloader = dict(
    batch_size=3,
    num_workers=3,
    persistent_workers=True,
    sampler=dict(type='DefaultSampler', shuffle=True),
    dataset=dict(
        type=dataset_type,
        data_root=data_root,
        ann_file='waymo_infos_train.pkl',
        # Sub-directories (relative to data_root) for the point clouds and
        # each of the five cameras.
        data_prefix=dict(
            pts='training/velodyne',
            CAM_FRONT='training/image_0',
            CAM_FRONT_LEFT='training/image_1',
            CAM_FRONT_RIGHT='training/image_2',
            CAM_SIDE_LEFT='training/image_3',
            CAM_SIDE_RIGHT='training/image_4'),
        pipeline=train_pipeline,
        modality=input_modality,
        test_mode=False,
        metainfo=metainfo,
        # 3D boxes are expressed in the camera coordinate system.
        box_type_3d='Camera',
        load_type='mv_image_based',
        # NOTE(review): presumably subsamples the training infos to every
        # 5th entry - confirm against WaymoDataset.
        load_interval=5,
        backend_args=backend_args))
|
|
|
# Validation dataloader: one sample per batch, fixed order, nothing dropped.
val_dataloader = dict(
    batch_size=1,
    num_workers=1,
    persistent_workers=True,
    drop_last=False,
    sampler=dict(type='DefaultSampler', shuffle=False),
    dataset=dict(
        type=dataset_type,
        data_root=data_root,
        # The validation split reuses the `training/` sub-directories; only
        # the annotation file differs from the training dataset.
        data_prefix=dict(
            pts='training/velodyne',
            CAM_FRONT='training/image_0',
            CAM_FRONT_LEFT='training/image_1',
            CAM_FRONT_RIGHT='training/image_2',
            CAM_SIDE_LEFT='training/image_3',
            CAM_SIDE_RIGHT='training/image_4'),
        ann_file='waymo_infos_val.pkl',
        pipeline=eval_pipeline,
        modality=input_modality,
        test_mode=True,
        metainfo=metainfo,
        # 3D boxes are expressed in the camera coordinate system.
        box_type_3d='Camera',
        load_type='mv_image_based',
        backend_args=backend_args))
|
|
|
# Test dataloader: configured identically to the validation dataloader (same
# annotation file, same eval_pipeline), one sample per batch in fixed order.
test_dataloader = dict(
    batch_size=1,
    num_workers=1,
    persistent_workers=True,
    drop_last=False,
    sampler=dict(type='DefaultSampler', shuffle=False),
    dataset=dict(
        type=dataset_type,
        data_root=data_root,
        # Sub-directories (relative to data_root) for the point clouds and
        # each of the five cameras.
        data_prefix=dict(
            pts='training/velodyne',
            CAM_FRONT='training/image_0',
            CAM_FRONT_LEFT='training/image_1',
            CAM_FRONT_RIGHT='training/image_2',
            CAM_SIDE_LEFT='training/image_3',
            CAM_SIDE_RIGHT='training/image_4'),
        ann_file='waymo_infos_val.pkl',
        pipeline=eval_pipeline,
        modality=input_modality,
        test_mode=True,
        metainfo=metainfo,
        # 3D boxes are expressed in the camera coordinate system.
        box_type_3d='Camera',
        load_type='mv_image_based',
        backend_args=backend_args))
|
|
|
# Validation metric configuration. The paths are spelled out in full here
# rather than derived from `data_root`, because the ground-truth bin file
# and the evaluator's data_root live under waymo_format/, not kitti_format/.
val_evaluator = dict(
    type='WaymoMetric',
    ann_file='./data/waymo/kitti_format/waymo_infos_val.pkl',
    waymo_bin_file='./data/waymo/waymo_format/cam_gt.bin',
    data_root='./data/waymo/waymo_format',
    metric='LET_mAP',
    load_type='mv_image_based',
    backend_args=backend_args)
# Testing reuses the validation evaluator; both names refer to the same
# dict object.
test_evaluator = val_evaluator
|
|