Skip to content

Commit 5e9e7f1

Browse files
author
David Josef Emmerichs
committed
add config refactor example
1 parent cfd4b98 commit 5e9e7f1

File tree

7 files changed

+667
-0
lines changed

7 files changed

+667
-0
lines changed
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,64 @@
1+
SEQUENCE_CONFIG:
2+
ENABLED: True
3+
SAMPLE_OFFSET: [-3, 0]
4+
5+
TRAIN_WITH_SPEED: True
6+
7+
8+
DATA_AUGMENTOR:
9+
AUG_CONFIG_LIST:
10+
- NAME: gt_sampling
11+
USE_ROAD_PLANE: False
12+
DB_INFO_PATH:
13+
- waymo_processed_data_v0_5_0_waymo_dbinfos_train_sampled_1_multiframe_-4_to_0.pkl
14+
15+
USE_SHARED_MEMORY: False # set it to True to speed up (it costs about 50GB? shared memory)
16+
DB_DATA_PATH:
17+
- waymo_processed_data_v0_5_0_gt_database_train_sampled_1_multiframe_-4_to_0_global.npy
18+
19+
PREPARE: {
20+
filter_by_min_points: ['Vehicle:5', 'Pedestrian:5', 'Cyclist:5'],
21+
filter_by_difficulty: [-1],
22+
}
23+
24+
SAMPLE_GROUPS: ['Vehicle:15', 'Pedestrian:10', 'Cyclist:10']
25+
NUM_POINT_FEATURES: 6
26+
REMOVE_EXTRA_WIDTH: [0.0, 0.0, 0.0]
27+
LIMIT_WHOLE_SCENE: True
28+
29+
FILTER_OBJ_POINTS_BY_TIMESTAMP: True
30+
TIME_RANGE: [0.3, 0.0] # 0.3s-0.0s indicates 4 frames
31+
32+
- NAME: random_world_flip
33+
ALONG_AXIS_LIST: ['x', 'y']
34+
35+
- NAME: random_world_rotation
36+
WORLD_ROT_ANGLE: [-0.78539816, 0.78539816]
37+
38+
- NAME: random_world_scaling
39+
WORLD_SCALE_RANGE: [0.95, 1.05]
40+
41+
42+
POINT_FEATURE_ENCODING:
43+
used_feature_list: ['x', 'y', 'z', 'intensity', 'elongation', 'timestamp']
44+
src_feature_list: ['x', 'y', 'z', 'intensity', 'elongation', 'timestamp']
45+
46+
47+
DATA_PROCESSOR:
48+
- NAME: mask_points_and_boxes_outside_range
49+
REMOVE_OUTSIDE_BOXES: True
50+
USE_CENTER_TO_FILTER: True
51+
52+
- NAME: shuffle_points
53+
SHUFFLE_ENABLED: {
54+
'train': True,
55+
'test': True
56+
}
57+
58+
- NAME: transform_points_to_voxels
59+
VOXEL_SIZE: [0.1, 0.1, 0.15]
60+
MAX_POINTS_PER_VOXEL: 5
61+
MAX_NUMBER_OF_VOXELS: {
62+
'train': 180000,
63+
'test': 400000
64+
}
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,16 @@
1+
DATA_CONFIG:
2+
SEQUENCE_CONFIG:
3+
SAMPLE_OFFSET: [-15,0]
4+
5+
MODEL:
6+
ROI_HEAD:
7+
TRANS_INPUT: 64
8+
9+
ROI_GRID_POOL:
10+
MLPS: [[64,64]]
11+
POOL_RADIUS: [0.8]
12+
NSAMPLE: [16]
13+
14+
Transformer:
15+
num_frames: 16
16+
sequence_stride: 4
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,15 @@
1+
DATA_CONFIG:
2+
SEQUENCE_CONFIG:
3+
SAMPLE_OFFSET: [-3,0]
4+
5+
MODEL:
6+
ROI_HEAD:
7+
TRANS_INPUT: 256
8+
9+
ROI_GRID_POOL:
10+
MLPS: [[128,128], [128,128]]
11+
POOL_RADIUS: [0.8, 1.6]
12+
NSAMPLE: [16, 16]
13+
14+
Transformer:
15+
num_frames: 4
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,93 @@
1+
DATA_CONFIG:
2+
_BASE_CONFIG_: cfgs/dataset_configs/modifiers/waymo/multiframe.yaml
3+
_TRANSFORM:
4+
- name: remove_element
5+
target: ROI_BOXES_PATH
6+
- name: remove_element
7+
target: USE_PREDBOX
8+
9+
SAMPLED_INTERVAL: {
10+
'train': 5,
11+
'test': 1
12+
}
13+
14+
POINT_FEATURE_ENCODING:
15+
encoding_type: absolute_coordinates_encoding
16+
used_feature_list: ['x', 'y', 'z', 'intensity', 'elongation', 'time']
17+
src_feature_list: ['x', 'y', 'z', 'intensity', 'elongation', 'time']
18+
19+
MODEL:
20+
NAME: MPPNetE2E
21+
22+
VFE:
23+
NAME: DynMeanVFE
24+
25+
BACKBONE_3D:
26+
NAME: VoxelResBackBone8x
27+
28+
MAP_TO_BEV:
29+
NAME: HeightCompression
30+
NUM_BEV_FEATURES: 256
31+
32+
BACKBONE_2D:
33+
NAME: BaseBEVBackbone
34+
NUM_FRAME: 2
35+
LAYER_NUMS: [5, 5]
36+
LAYER_STRIDES: [1, 2]
37+
NUM_FILTERS: [128, 256]
38+
UPSAMPLE_STRIDES: [1, 2]
39+
NUM_UPSAMPLE_FILTERS: [256, 256]
40+
41+
DENSE_HEAD:
42+
NAME: CenterHead
43+
CLASS_AGNOSTIC: False
44+
45+
CLASS_NAMES_EACH_HEAD: [
46+
['Vehicle', 'Pedestrian', 'Cyclist']
47+
]
48+
49+
SHARED_CONV_CHANNEL: 64
50+
USE_BIAS_BEFORE_NORM: True
51+
NUM_HM_CONV: 2
52+
SEPARATE_HEAD_CFG:
53+
HEAD_ORDER: ['center', 'center_z', 'dim', 'rot','vel']
54+
HEAD_DICT: {
55+
'center': {'out_channels': 2, 'num_conv': 2},
56+
'center_z': {'out_channels': 1, 'num_conv': 2},
57+
'dim': {'out_channels': 3, 'num_conv': 2},
58+
'rot': {'out_channels': 2, 'num_conv': 2},
59+
'vel': {'out_channels': 2, 'num_conv': 2},
60+
61+
}
62+
63+
TARGET_ASSIGNER_CONFIG:
64+
FEATURE_MAP_STRIDE: 8
65+
NUM_MAX_OBJS: 500
66+
GAUSSIAN_OVERLAP: 0.1
67+
MIN_RADIUS: 2
68+
69+
LOSS_CONFIG:
70+
LOSS_WEIGHTS: {
71+
'cls_weight': 1.0,
72+
'loc_weight': 2.0,
73+
'code_weights': [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.2, 0.2]
74+
}
75+
76+
POST_PROCESSING:
77+
SCORE_THRESH: 0.1
78+
POST_CENTER_LIMIT_RANGE: [-75.2, -75.2, -2, 75.2, 75.2, 4]
79+
MAX_OBJ_PER_SAMPLE: 500
80+
NMS_CONFIG:
81+
NMS_TYPE: nms_gpu
82+
NMS_THRESH: 0.7
83+
NMS_PRE_MAXSIZE: 4096
84+
NMS_POST_MAXSIZE: 500
85+
86+
ROI_HEAD:
87+
NAME: MPPNetHeadE2E
88+
USE_BOX_ENCODING:
89+
NORM_T0: True
90+
ALL_YAW_T0: True
91+
92+
Transformer:
93+
sequence_stride: 1 #16frame using 4

tools/cfgs/waymo_models/mppnet.yaml

+170
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,170 @@
1+
CLASS_NAMES: ['Vehicle', 'Pedestrian', 'Cyclist']
2+
3+
DATA_CONFIG:
4+
_BASE_CONFIG_: cfgs/dataset_configs/waymo_dataset.yaml
5+
PROCESSED_DATA_TAG: 'waymo_processed_data_v0_5_0'
6+
7+
SAMPLED_INTERVAL: {
8+
'train': 1,
9+
'test': 1
10+
}
11+
FILTER_EMPTY_BOXES_FOR_TRAIN: True
12+
DISABLE_NLZ_FLAG_ON_POINTS: True
13+
14+
SEQUENCE_CONFIG:
15+
ENABLED: True
16+
SAMPLE_OFFSET: [-3,0]
17+
18+
USE_PREDBOX: True
19+
ROI_BOXES_PATH: {
20+
'train': '../output/xxxxx/train/result.pkl', # example: predicted boxes of RPN in training set
21+
'test': '../output/xxxxx/val/result.pkl', # example: predicted boxes of RPN in evalulation set
22+
}
23+
24+
DATA_AUGMENTOR:
25+
DISABLE_AUG_LIST: [ 'placeholder' ]
26+
AUG_CONFIG_LIST:
27+
28+
- NAME: random_world_flip
29+
ALONG_AXIS_LIST: [ 'x', 'y' ]
30+
31+
- NAME: random_world_rotation
32+
WORLD_ROT_ANGLE: [ -0.78539816, 0.78539816 ]
33+
34+
- NAME: random_world_scaling
35+
WORLD_SCALE_RANGE: [ 0.95, 1.05 ]
36+
37+
DATA_PROCESSOR:
38+
- NAME: mask_points_and_boxes_outside_range
39+
REMOVE_OUTSIDE_BOXES: True
40+
41+
- NAME: shuffle_points
42+
SHUFFLE_ENABLED: {
43+
'train': True,
44+
'test': True
45+
}
46+
47+
POINT_FEATURE_ENCODING: {
48+
encoding_type: absolute_coordinates_encoding,
49+
used_feature_list: ['x', 'y', 'z', 'intensity', 'elongation', 'time'],
50+
src_feature_list: ['x', 'y', 'z', 'intensity', 'elongation', 'time'],
51+
}
52+
53+
54+
MODEL:
55+
NAME: MPPNet
56+
57+
ROI_HEAD:
58+
NAME: MPPNetHead
59+
TRANS_INPUT: 256
60+
CLASS_AGNOSTIC: True
61+
USE_BOX_ENCODING:
62+
ENABLED: True
63+
AVG_STAGE1_SCORE: True
64+
USE_TRAJ_EMPTY_MASK: True
65+
USE_AUX_LOSS: True
66+
IOU_WEIGHT: [0.5,0.4]
67+
68+
69+
70+
ROI_GRID_POOL:
71+
GRID_SIZE: 4
72+
MLPS: [[128,128], [128,128]]
73+
POOL_RADIUS: [0.8, 1.6]
74+
NSAMPLE: [16, 16]
75+
POOL_METHOD: max_pool
76+
77+
78+
_TRANSFORM:
79+
name: copy
80+
src: TRANS_INPUT
81+
dest: Transformer.hidden_dim
82+
Transformer:
83+
num_lidar_points: 128
84+
num_proxy_points: 64 # GRID_SIZE*GRID_SIZE*GRID_SIZE
85+
pos_hidden_dim: 64
86+
enc_layers: 3
87+
dim_feedforward: 512
88+
dropout: 0.1
89+
nheads: 4
90+
pre_norm: False
91+
num_frames: 4
92+
num_groups: 4
93+
use_grid_pos:
94+
enabled: True
95+
init_type: index
96+
97+
use_mlp_mixer:
98+
enabled: True
99+
hidden_dim: 16
100+
101+
TARGET_CONFIG:
102+
BOX_CODER: ResidualCoder
103+
ROI_PER_IMAGE: 96
104+
FG_RATIO: 0.5
105+
REG_AUG_METHOD: single
106+
ROI_FG_AUG_TIMES: 10
107+
RATIO: 0.2
108+
USE_ROI_AUG: True
109+
USE_TRAJ_AUG:
110+
ENABLED: True
111+
THRESHOD: 0.8
112+
SAMPLE_ROI_BY_EACH_CLASS: True
113+
CLS_SCORE_TYPE: roi_iou
114+
115+
CLS_FG_THRESH: 0.75
116+
CLS_BG_THRESH: 0.25
117+
CLS_BG_THRESH_LO: 0.1
118+
HARD_BG_RATIO: 0.8
119+
120+
REG_FG_THRESH: 0.55
121+
122+
LOSS_CONFIG:
123+
CLS_LOSS: BinaryCrossEntropy
124+
REG_LOSS: smooth-l1
125+
CORNER_LOSS_REGULARIZATION: True
126+
LOSS_WEIGHTS: {
127+
'rcnn_cls_weight': 1.0,
128+
'rcnn_reg_weight': 1.0,
129+
'rcnn_corner_weight': 2.0,
130+
'traj_reg_weight': [2.0, 2.0, 2.0],
131+
'code_weights': [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0]
132+
}
133+
134+
POST_PROCESSING:
135+
RECALL_THRESH_LIST: [0.3, 0.5, 0.7]
136+
SCORE_THRESH: 0.1
137+
OUTPUT_RAW_SCORE: False
138+
SAVE_BBOX: False
139+
EVAL_METRIC: waymo
140+
NOT_APPLY_NMS_FOR_VEL: True
141+
142+
NMS_CONFIG:
143+
MULTI_CLASSES_NMS: False
144+
NMS_TYPE: nms_gpu
145+
NMS_THRESH: 0.7
146+
NMS_PRE_MAXSIZE: 4096
147+
NMS_POST_MAXSIZE: 500
148+
149+
150+
OPTIMIZATION:
151+
BATCH_SIZE_PER_GPU: 2
152+
NUM_EPOCHS: 6
153+
154+
OPTIMIZER: adam_onecycle
155+
LR: 0.003
156+
WEIGHT_DECAY: 0.01
157+
MOMENTUM: 0.9
158+
159+
MOMS: [0.95, 0.85]
160+
PCT_START: 0.4
161+
DIV_FACTOR: 10
162+
DECAY_STEP_LIST: [35, 45]
163+
LR_DECAY: 0.1
164+
LR_CLIP: 0.0000001
165+
166+
LR_WARMUP: False
167+
WARMUP_EPOCH: 1
168+
169+
GRAD_NORM_CLIP: 10
170+

0 commit comments

Comments
 (0)