brjathu committed on
Commit
3987f44
1 Parent(s): 29a229f

Upload folder using huggingface_hub

Browse files
train/multiruns/hmr2/0/checkpoints/epoch=35-step=1000000.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c9ea09c834161468638c9de7a782c614e300c622709bf52967274c543ec72fcf
3
+ size 2709521501
train/multiruns/hmr2/0/dataset_config.yaml ADDED
@@ -0,0 +1,112 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 3DPW-TEST:
2
+ KEYPOINT_LIST:
3
+ - 25
4
+ - 26
5
+ - 27
6
+ - 28
7
+ - 29
8
+ - 30
9
+ - 31
10
+ - 32
11
+ - 33
12
+ - 34
13
+ - 35
14
+ - 36
15
+ - 37
16
+ - 43
17
+ TYPE: ImageDataset
18
+ URLS: /fsx/shubham/data/hmr2023_data_shuffled_new/3dpw-test/{000000..000012}.tar
19
+ USE_HIPS: false
20
+ AIC-TRAIN:
21
+ TYPE: ImageDataset
22
+ URLS: /fsx/shubham/data/hmr2023_data_shuffled/aic-train/{000000..000104}.tar
23
+ epoch_size: 200000
24
+ AIC-TRAIN-WMASK:
25
+ TYPE: ImageDataset
26
+ URLS: /fsx/shubham/data/hmr2023_data_shuffled_wmasks/aic-train-vitpose/{000000..000104}.tar
27
+ epoch_size: 200000
28
+ AVA-TRAIN-MIDFRAMES-1FPS:
29
+ TYPE: ImageDataset
30
+ URLS: /fsx/shubham/data/hmr2023_data_shuffled/ava-train-midframes-1fps/{000000..000092}.tar
31
+ epoch_size: 200000
32
+ AVA-TRAIN-MIDFRAMES-1FPS-WMASK:
33
+ TYPE: ImageDataset
34
+ URLS: /fsx/shubham/data/hmr2023_data_shuffled_wmasks/ava-train-midframes-1fps-vitpose/{000000..000092}.tar
35
+ epoch_size: 200000
36
+ CMU-MOCAP:
37
+ DATASET_FILE: /fsx/shubham/code/hmr2023/data/datasets/cmu_mocap.npz
38
+ COCO-TRAIN-2014:
39
+ TYPE: ImageDataset
40
+ URLS: /fsx/shubham/data/hmr2023_data_shuffled/coco-train-2014/{000000..000017}.tar
41
+ epoch_size: 360000
42
+ COCO-TRAIN-2014-VITPOSE-REPLICATE-PRUNED12:
43
+ TYPE: ImageDataset
44
+ URLS: /fsx/shubham/data/hmr2023_data_shuffled_wmasks/coco-train-2014-vitpose-replicate-pruned12/{000000..000044}.tar
45
+ epoch_size: 45000
46
+ COCO-TRAIN-2014-WMASK:
47
+ TYPE: ImageDataset
48
+ URLS: /fsx/shubham/data/hmr2023_data_shuffled_wmasks/coco-train-2014/{000000..000034}.tar
49
+ epoch_size: 35000
50
+ COCO-TRAIN-2014-WMASK-PRUNED:
51
+ TYPE: ImageDataset
52
+ URLS: /fsx/shubham/data/hmr2023_data_shuffled_wmasks/coco-train-2014-pruned/{000000..000017}.tar
53
+ epoch_size: 18000
54
+ COCO-VAL:
55
+ KEYPOINT_LIST:
56
+ - 0
57
+ TYPE: ImageDataset
58
+ URLS: /fsx/shubham/data/hmr2023_data_shuffled/coco-val/{000000..000000}.tar
59
+ H36M-TRAIN:
60
+ TYPE: ImageDataset
61
+ URLS: /fsx/shubham/data/hmr2023_data_shuffled/h36m-train/{000000..000156}.tar
62
+ epoch_size: 314000
63
+ H36M-TRAIN-WMASK:
64
+ TYPE: ImageDataset
65
+ URLS: /fsx/shubham/data/hmr2023_data_shuffled_wmasks/h36m-train/{000000..000312}.tar
66
+ epoch_size: 314000
67
+ H36M-VAL-P2:
68
+ KEYPOINT_LIST:
69
+ - 25
70
+ - 26
71
+ - 27
72
+ - 28
73
+ - 29
74
+ - 30
75
+ - 31
76
+ - 32
77
+ - 33
78
+ - 34
79
+ - 35
80
+ - 36
81
+ - 37
82
+ - 43
83
+ TYPE: ImageDataset
84
+ URLS: /fsx/shubham/data/hmr2023_data_shuffled_new/h36m-val-p2/{000000..000013}.tar
85
+ USE_HIPS: true
86
+ H36M-VAL-P2-OPENPOSE:
87
+ TYPE: ImageDataset
88
+ URLS: /fsx/shubham/data/hmr2023_data_shuffled_new/h36m-val-p2-openpose/{000000..000013}.tar
89
+ INSTA-TRAIN:
90
+ TYPE: ImageDataset
91
+ URLS: /fsx/shubham/data/hmr2023_data_shuffled/insta-train/{000000..001828}.tar
92
+ epoch_size: 4000000
93
+ INSTA-TRAIN-WMASK:
94
+ TYPE: ImageDataset
95
+ URLS: /fsx/shubham/data/hmr2023_data_shuffled_wmasks/insta-train-vitpose/{000000..001828}.tar
96
+ epoch_size: 4000000
97
+ MPI-INF-TRAIN:
98
+ TYPE: ImageDataset
99
+ URLS: /fsx/shubham/data/hmr2023_data_shuffled/mpi-inf-train/{000000..000048}.tar
100
+ epoch_size: 100000
101
+ MPI-INF-TRAIN-PRUNED:
102
+ TYPE: ImageDataset
103
+ URLS: /fsx/shubham/data/hmr2023_data_shuffled_new/mpi-inf-train-pruned/{000000..00006}.tar
104
+ epoch_size: 12000
105
+ MPII-TRAIN:
106
+ TYPE: ImageDataset
107
+ URLS: /fsx/shubham/data/hmr2023_data_shuffled/mpii-train/{000000..000004}.tar
108
+ epoch_size: 100000
109
+ MPII-TRAIN-WMASK:
110
+ TYPE: ImageDataset
111
+ URLS: /fsx/shubham/data/hmr2023_data_shuffled_wmasks/mpii-train/{000000..000009}.tar
112
+ epoch_size: 100000
train/multiruns/hmr2/0/model_config.yaml ADDED
@@ -0,0 +1,148 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ task_name: train
2
+ tags:
3
+ - dev
4
+ train: true
5
+ test: false
6
+ ckpt_path: null
7
+ seed: null
8
+ DATASETS:
9
+ SUPPRESS_KP_CONF_THRESH: 0.3
10
+ FILTER_NUM_KP: 4
11
+ FILTER_NUM_KP_THRESH: 0.0
12
+ FILTER_REPROJ_THRESH: 31000
13
+ SUPPRESS_BETAS_THRESH: 3.0
14
+ SUPPRESS_BAD_POSES: true
15
+ POSES_BETAS_SIMULTANEOUS: true
16
+ FILTER_NO_POSES: false
17
+ TRAIN:
18
+ H36M-TRAIN-WMASK:
19
+ WEIGHT: 0.1
20
+ MPII-TRAIN-WMASK:
21
+ WEIGHT: 0.1
22
+ COCO-TRAIN-2014-WMASK-PRUNED:
23
+ WEIGHT: 0.1
24
+ COCO-TRAIN-2014-VITPOSE-REPLICATE-PRUNED12:
25
+ WEIGHT: 0.1
26
+ MPI-INF-TRAIN-PRUNED:
27
+ WEIGHT: 0.02
28
+ AVA-TRAIN-MIDFRAMES-1FPS-WMASK:
29
+ WEIGHT: 0.19
30
+ AIC-TRAIN-WMASK:
31
+ WEIGHT: 0.19
32
+ INSTA-TRAIN-WMASK:
33
+ WEIGHT: 0.2
34
+ VAL:
35
+ COCO-VAL:
36
+ WEIGHT: 1.0
37
+ MOCAP: CMU-MOCAP
38
+ CONFIG:
39
+ SCALE_FACTOR: 0.3
40
+ ROT_FACTOR: 30
41
+ TRANS_FACTOR: 0.02
42
+ COLOR_SCALE: 0.2
43
+ ROT_AUG_RATE: 0.6
44
+ TRANS_AUG_RATE: 0.5
45
+ DO_FLIP: true
46
+ FLIP_AUG_RATE: 0.5
47
+ EXTREME_CROP_AUG_RATE: 0.1
48
+ EXTREME_CROP_AUG_LEVEL: 1
49
+ BETAS_REG: true
50
+ trainer:
51
+ _target_: pytorch_lightning.Trainer
52
+ default_root_dir: ${paths.output_dir}
53
+ accelerator: gpu
54
+ devices: 8
55
+ deterministic: false
56
+ num_sanity_val_steps: 0
57
+ log_every_n_steps: ${GENERAL.LOG_STEPS}
58
+ val_check_interval: ${GENERAL.VAL_STEPS}
59
+ precision: 16
60
+ max_steps: ${GENERAL.TOTAL_STEPS}
61
+ move_metrics_to_cpu: true
62
+ limit_val_batches: 1
63
+ track_grad_norm: -1
64
+ strategy: ddp
65
+ num_nodes: 1
66
+ sync_batchnorm: true
67
+ paths:
68
+ root_dir: ${oc.env:PROJECT_ROOT}
69
+ data_dir: ${paths.root_dir}/data/
70
+ log_dir: /fsx/shubham/code/hmr2023/logs_hydra/
71
+ output_dir: ${hydra:runtime.output_dir}
72
+ work_dir: ${hydra:runtime.cwd}
73
+ extras:
74
+ ignore_warnings: false
75
+ enforce_tags: true
76
+ print_config: true
77
+ exp_name: hmr2
78
+ SMPL:
79
+ MODEL_PATH: data/smpl
80
+ GENDER: neutral
81
+ NUM_BODY_JOINTS: 23
82
+ JOINT_REGRESSOR_EXTRA: data/SMPL_to_J19.pkl
83
+ MEAN_PARAMS: data/smpl_mean_params.npz
84
+ EXTRA:
85
+ FOCAL_LENGTH: 5000
86
+ NUM_LOG_IMAGES: 4
87
+ NUM_LOG_SAMPLES_PER_IMAGE: 8
88
+ PELVIS_IND: 39
89
+ MODEL:
90
+ IMAGE_SIZE: 256
91
+ IMAGE_MEAN:
92
+ - 0.485
93
+ - 0.456
94
+ - 0.406
95
+ IMAGE_STD:
96
+ - 0.229
97
+ - 0.224
98
+ - 0.225
99
+ BACKBONE:
100
+ TYPE: vit
101
+ NUM_LAYERS: 50
102
+ OUT_CHANNELS: 2048
103
+ ADD_NECK: false
104
+ FLOW:
105
+ DIM: 144
106
+ NUM_LAYERS: 4
107
+ CONTEXT_FEATURES: 2048
108
+ LAYER_HIDDEN_FEATURES: 1024
109
+ LAYER_DEPTH: 2
110
+ FC_HEAD:
111
+ NUM_FEATURES: 1024
112
+ SMPL_HEAD:
113
+ TYPE: transformer_decoder
114
+ IN_CHANNELS: 2048
115
+ TRANSFORMER_DECODER:
116
+ depth: 6
117
+ heads: 8
118
+ mlp_dim: 1024
119
+ dim_head: 64
120
+ dropout: 0.0
121
+ emb_dropout: 0.0
122
+ norm: layer
123
+ context_dim: 1280
124
+ GENERAL:
125
+ TOTAL_STEPS: 1000000
126
+ LOG_STEPS: 1000
127
+ VAL_STEPS: 1000
128
+ CHECKPOINT_STEPS: 10000
129
+ CHECKPOINT_SAVE_TOP_K: 1
130
+ NUM_WORKERS: 6
131
+ PREFETCH_FACTOR: 2
132
+ TRAIN:
133
+ LR: 1.0e-05
134
+ WEIGHT_DECAY: 0.0001
135
+ BATCH_SIZE: 48
136
+ LOSS_REDUCTION: mean
137
+ NUM_TRAIN_SAMPLES: 2
138
+ NUM_TEST_SAMPLES: 64
139
+ POSE_2D_NOISE_RATIO: 0.01
140
+ SMPL_PARAM_NOISE_RATIO: 0.005
141
+ LOSS_WEIGHTS:
142
+ KEYPOINTS_3D: 0.05
143
+ KEYPOINTS_2D: 0.01
144
+ GLOBAL_ORIENT: 0.001
145
+ BODY_POSE: 0.001
146
+ BETAS: 0.0005
147
+ ADVERSARIAL: 0.0005
148
+ local: {}