# NOTE(review): the leading "2" looks like a line number carried over from the
# listing this excerpt was taken from, not part of the config itself. The same
# applies to the numeric prefix on the other lines of this excerpt; the
# prefixes are not contiguous, so some original lines are not visible here.
# Sets `type` to the string 'ActionRecognitionRunner'.
2 type=
'ActionRecognitionRunner',
# Fragment of a settings group that ends with
# input_key = 'pose_heatmap_for_action'. The enclosing container is not
# visible in this excerpt.
# stage_blocks, spatial_strides, temporal_strides and dilations each have three
# entries -- presumably one per stage; TODO confirm against the consumer.
8 stage_blocks = (4, 6, 3),
10 spatial_strides = (2, 2, 2),
11 temporal_strides = (1, 1, 2),
12 dilations = (1, 1, 1),
# NOTE(review): (1, 7, 7) is presumably (time, height, width) -- confirm.
13 conv1_kernel = (1, 7, 7),
19 inflate_style =
'3x1x1',
20 input_key =
'pose_heatmap_for_action'
# Fragment of a second settings group. Every visible value matches the group
# whose input_key is 'pose_heatmap_for_action'; only the input_key differs
# ('pose_heatmap_for_pose').
# NOTE(review): if the two groups are meant to stay identical, a shared base
# definition would avoid drift -- confirm whether the hidden lines differ.
26 stage_blocks = (4, 6, 3),
28 spatial_strides = (2, 2, 2),
29 temporal_strides = (1, 1, 2),
30 dilations = (1, 1, 1),
31 conv1_kernel = (1, 7, 7),
37 inflate_style =
'3x1x1',
38 input_key =
'pose_heatmap_for_pose'
# Fragment of a third settings group, reading from 'image_feature'.
# Unlike the two groups above it in the file, stage_blocks here is a list with
# four entries rather than a tuple with three.
43 stage_blocks = [2, 2, 2, 2],
44 input_key =
'image_feature',
# Two parallel three-entry lists: feature names and a type tag for each.
# NOTE(review): presumably paired by position ('action_feat' -> '3d',
# 'pose_feat' -> '3d', 'img_feat' -> '2d'); keep both lists the same length.
49 input_key = [
'action_feat',
'pose_feat',
'img_feat'],
50 input_type = [
'3d',
'3d',
'2d'],
# Five fragments that each set in_channels to the same expression,
# 1024+512+768, which evaluates to 2304. The last three also set
# layer_channels=[2048]. The groups these lines belong to are not visible.
# NOTE(review): the three terms presumably correspond to the three fused
# features (action_feat, pose_feat, img_feat) -- confirm. The expression is
# repeated verbatim five times; a single named constant would keep them in sync.
55 in_channels=1024+512+768,
62 in_channels=1024+512+768,
69 in_channels=1024+512+768,
71 layer_channels=[2048],
77 in_channels=1024+512+768,
79 layer_channels=[2048],
85 in_channels=1024+512+768,
87 layer_channels=[2048],
# Opening lines of two dict(...) groups, aux_action_upper and aux_action_lower.
# Both read from 'action_feat'. Their remaining keys and closing parentheses
# are not visible in this excerpt.
91 aux_action_upper = dict(
96 input_key =
'action_feat',
98 aux_action_lower = dict(
103 input_key =
'action_feat',
# Three fragments with identical visible settings: layer_channels=[1024] and
# input_key 'pose_feat'. The names of the groups they belong to are not visible.
# NOTE(review): presumably the aux_pose / aux_hand / aux_foot groups, going by
# the 'aux_*' entries in score_keys -- confirm against the full file.
109 layer_channels=[1024],
111 input_key =
'pose_feat',
118 layer_channels=[1024],
120 input_key =
'pose_feat',
127 layer_channels=[1024],
129 input_key =
'pose_feat',
# Maps the names pred_action_upper / pred_action_lower to the strings
# 'action_upper' / 'action_lower'. Both strings also appear in score_keys.
# The enclosing container is not visible in this excerpt.
135 pred_action_upper =
'action_upper',
136 pred_action_lower =
'action_lower',
# Ten names: five base names followed by the same five with an 'aux_' prefix.
# This list is passed as pred_keys to the MutiTaskSigmoidFocalLoss settings.
# NOTE(review): the "143" fused to the name looks like a line number from the
# original listing, not part of the identifier.
143score_keys = [
'action_upper',
'action_lower',
'pose',
'hand',
'foot',
'aux_action_upper',
'aux_action_lower',
'aux_pose',
'aux_hand',
'aux_foot']
# Five 'pred_*' names, one per base task and in the same order as the first
# five entries of score_keys. Passed as pred_key in metric_args.
144pred_keys = [
'pred_action_upper',
'pred_action_lower',
'pred_pose',
'pred_hand',
'pred_foot']
# Ten entries: the five 'gt_*' names listed twice in the same order.
# NOTE(review): presumably the repetition lines each entry up by position with
# the ten score_keys (base tasks, then their 'aux_' counterparts) -- confirm.
145gt_keys = [
'gt_action_upper',
'gt_action_lower',
'gt_pose',
'gt_hand',
'gt_foot',
'gt_action_upper',
'gt_action_lower',
'gt_pose',
'gt_hand',
'gt_foot']
# Ten entries: the five task names listed twice in the same order.
# The full list is passed to the loss settings; metric_args uses only the
# first five via target_tasks[:5].
146target_tasks = [
'action_upper',
'action_lower',
'pose',
'hand',
'foot',
'action_upper',
'action_lower',
'pose',
'hand',
'foot']
# The five task names, each once. Same names and order as the first five
# entries of target_tasks.
147train_tasks = [
'action_upper',
'action_lower',
'pose',
'hand',
'foot']
# Opening of the loss settings group; its closing parenthesis and any other
# keys are not visible in this excerpt.
# NOTE(review): "Muti" looks like a misspelling of "Multi". The name is
# presumably looked up at runtime, so it is left unchanged here -- rename only
# together with whatever defines it.
151 MutiTaskSigmoidFocalLoss = dict(
153 task_key =
'category',
# pred_keys receives the ten-entry score_keys list and target_tasks the
# ten-entry target_tasks list.
154 pred_keys = score_keys,
156 target_tasks = target_tasks,
# Ten weights: 1.0 for the first five positions, 0.25 for the last five.
# NOTE(review): presumably matched by position to score_keys, which would give
# the 'aux_*' entries the 0.25 weights -- confirm against the loss code.
157 weights = [1.0, 1.0, 1.0, 1.0, 1.0, 0.25, 0.25, 0.25, 0.25, 0.25],
# Opening of the metric settings; the closing parenthesis is not visible here.
# pred_key gets the five-entry pred_keys list. target_tasks[:5] takes the first
# five entries of target_tasks, i.e. each task name once.
162metric_args = dict(pred_key=pred_keys,
164 target_tasks=target_tasks[:5],
# Eight keys: the three input_key strings used by the settings groups earlier
# in the file ('pose_heatmap_for_action', 'pose_heatmap_for_pose',
# 'image_feature'), followed by the five 'gt_*' names.
167collect_keys = [
'pose_heatmap_for_action',
'pose_heatmap_for_pose',
'image_feature',
'gt_action_upper',
'gt_action_lower',
'gt_pose',
'gt_hand',
'gt_foot']
# Fragment of the dataset loader settings; the enclosing container is not
# visible in this excerpt.
170 type =
'ActionDatasetLoader_mtml',
# NOTE(review): hard-coded absolute path to a specific mounted drive; it will
# need to change on any other machine.
171 data_folder =
'/media/safemotion/HDD5/pjm_test/action_train_dataset_2023/action_kp_imf_split',
# category_info is opened here with action_upper = 6; its remaining entries
# and closing parenthesis are not visible in this excerpt.
172 category_info = dict(action_upper = 6,
# NOTE(review): unit of clip_len_action is presumably frames -- confirm.
177 clip_len_action = 20,
# Fragment of the optimisation settings; the enclosing container and the
# optimizer name are not visible in this excerpt.
187 optimizer_args = dict(momentum=0.9, nesterov=
True, weight_decay=0.0001),
188 scheduler =
'CosineAnnealingLR',
# ep_mul is not defined in the visible lines; it scales T_max and every entry
# of adjust_lr_epoch.
190 scheduler_args = dict(T_max=30*ep_mul, eta_min=0),
# adjust_lr_epoch and adjust_lr_rate both have four entries.
# NOTE(review): presumably paired by position (epoch -> rate). How these
# interact with the 'CosineAnnealingLR' scheduler is not visible here -- confirm.
191 adjust_lr_epoch = [10*ep_mul, 50*ep_mul, 100*ep_mul, 130*ep_mul],
192 adjust_lr_rate = [0.5, 0.1, 0.1, 0.1],
# NOTE(review): update_loss_weight is False, so update_loss_weight_interval is
# presumably unused in this configuration -- confirm.
196 update_loss_weight =
False,
197 update_loss_weight_interval = 20,
# NOTE(review): hard-coded absolute path to a specific mounted drive; it will
# need to change on any other machine.
201 save_root =
'/media/safemotion/HDD5/pjm_test/action_train_result/action_kp_img',