|
config = { |
|
"data": { |
|
"use_cache": True, |
|
"data_dir": "./data", |
|
"trainset_humandata": [ |
|
'SynHand'], |
|
"testset": 'EHF', |
|
"BEDLAM_train_sample_interval": 5, |
|
"SynBody_train_sample_interval": 10, |
|
"EgoBody_Kinect_train_sample_interval": 10, |
|
"UBody_train_sample_interval": 10, |
|
"MPI_INF_3DHP_train_sample_interval": 5, |
|
"InstaVariety_train_sample_interval": 10, |
|
"RenBody_HiRes_train_sample_interval": 5, |
|
"ARCTIC_train_sample_interval": 10, |
|
"RenBody_train_sample_interval": 10, |
|
"Talkshow_train_sample_interval": 10, |
|
"bbox_ratio": 1.2, |
|
"no_aug": False, |
|
"data_strategy": "balance", |
|
"total_data_len": 7500000, |
|
}, |
|
|
|
"train": { |
|
"num_gpus": 1, |
|
"continue_train": True, |
|
"start_over": True, |
|
"end_epoch": 20, |
|
"train_batch_size": 16, |
|
"num_thread": 1, |
|
"lr": 1e-5, |
|
"min_lr": 1e-6, |
|
"save_epoch": 1, |
|
"remove_checkpoint": False, |
|
"print_iters": 100, |
|
"smplx_kps_3d_weight": 100.0, |
|
"smplx_kps_2d_weight": 1.0, |
|
"smplx_pose_weight": 10.0, |
|
"smplx_shape_weight": 1.0, |
|
"smplx_orient_weight": 1.0, |
|
"hand_root_weight": 1.0, |
|
"hand_consist_weight": 1.0, |
|
}, |
|
|
|
"inference":{ |
|
"num_gpus": 1, |
|
"detection":{ |
|
"model_type": "yolo", |
|
"model_path": "./pretrained_models/yolov8x.pt", |
|
"conf": 0.5, |
|
"save": False, |
|
"verbose": False, |
|
"iou_thr": 0.5, |
|
}, |
|
|
|
}, |
|
|
|
"test": { |
|
"test_batch_size": 1 |
|
}, |
|
|
|
"model": { |
|
'model_type': 'vit_huge', |
|
"pretrained_model_path": './outputs/train_annot_xtp20_20241108_203832/model_dump/snapshot_7.pth.tar', |
|
"human_model_path": './human_models/human_model_files', |
|
'encoder_pretrained_model_path': './pretrained_models/vitpose_huge.pth', |
|
'encoder_config': { |
|
'num_classes': 80, |
|
'task_tokens_num': 80, |
|
'img_size': (256, 192), |
|
'patch_size': 16, |
|
'embed_dim': 1280, |
|
'depth': 32, |
|
'num_heads': 16, |
|
'ratio': 1, |
|
'use_checkpoint': False, |
|
'mlp_ratio': 4, |
|
'qkv_bias': True, |
|
'drop_path_rate': 0.55 |
|
}, |
|
'decoder_config': { |
|
'feat_dim': 1280, |
|
"dim_out": 512, |
|
'task_tokens_num': 80, |
|
}, |
|
'input_img_shape': (512, 384), |
|
'input_body_shape': (256, 192), |
|
'output_hm_shape': (16, 16, 12), |
|
'focal': (5000, 5000), |
|
'princpt': (192 / 2, 256 / 2), |
|
'body_3d_size': 2, |
|
'hand_3d_size': 0.3, |
|
'face_3d_size': 0.3, |
|
'camera_3d_size': 2.5, |
|
|
|
}, |
|
"log":{ |
|
'exp_name': None, |
|
'output_dir': None, |
|
'model_dir': None, |
|
'log_dir': None, |
|
'result_dir': None, |
|
} |
|
} |