SeunghoEum committed on
Commit
1d5132b
·
verified ·
1 Parent(s): 0e292bc

Upload 16 files

Browse files
checkpoints/epoch=119.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:790f0cababdc401ca0455ddff64ef7ddb7082f5706e30f29e9bd87189c6c4f67
3
+ size 1130308662
checkpoints/epoch=149.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f70cc12964dff35aa733c92d1e1d1f9edec52a1f348f5bd754904b5708b76e96
3
+ size 1130309045
checkpoints/epoch=179.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e781b61aac30c5569790f9c09d43a5bd635f069b85ce199abecbaf27568c6bc
3
+ size 1130309428
checkpoints/epoch=209.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bbe35341bb9434977a93a9dc4c176ee0bd9144b8e0788b272491aeecf774d4f9
3
+ size 1130309811
checkpoints/epoch=239.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bdb38ceae6149b94d3c5f171251c6719953dcd4468ce9018d93919fa2ae80d36
3
+ size 1130310194
checkpoints/epoch=269.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:486846f0f378342ba43c68bf0ff95c37a561b479585ccd8446072ec119636015
3
+ size 1130310577
checkpoints/epoch=299.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:091bae9ef1807cd69f3a2a9773b93f2e909e69fea75b6bfb9985987b0ff78736
3
+ size 1130310960
checkpoints/epoch=329.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31d2f4447924b8d3ea89228d028d3f676e741b4a292eb8e1a59c24b210148e74
3
+ size 1130311343
checkpoints/epoch=359.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:11c4eab8e78db60b9ef9f8f99e950eefcd8f9b335e36c0686c10b92e078f39fc
3
+ size 1130311790
checkpoints/epoch=389.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b23d0d1aa700ca5e8cca573dbae90aa96da6bd1603536ef3efa6146d2fb69d3
3
+ size 1130312173
checkpoints/epoch=49.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ec566353eec79dd9fa60cf721177acf2251840d9591726d329dd5039d2350ed
3
+ size 1130308662
checkpoints/epoch=99.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cdf355a4970e4ab3979a238dfc37dcbf04dfef8c1fd2c20a2c860b312c0f398c
3
+ size 1130309045
configs/data/assets.yaml ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ FOLDER: './checkpoints' # Experiment files saving path
2
+
3
+ TEST:
4
+ FOLDER: './outputs' # Testing files saving path
5
+
6
+ DATASET:
7
+ SMPL_PATH: '/data2/lrh/smpl_model/smpl'
8
+ SMPLH_PATH: '/data2/lrh/smpl_model/smplh'
9
+ SMPLX_PATH: '/data2/lrh/smpl_model/smplx'
10
+ FINEDANCE_139CUT:
11
+ ROOT: data/finedance
12
+ MOTION: data/finedance/mofea319
13
+ MUSIC: data/finedance/music_npynew
14
+ normalizer: data/Normalizer.pth
15
+ LABEL: data/finedance/label_json/
16
+
17
+
18
+
configs/lodge/coarse_finedance_fea139.yaml ADDED
@@ -0,0 +1,158 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ NAME: FineDance_Coarse_v2_relative_noNorm_128len_139_diff_bc800 # Experiment name
2
+ ACCELERATOR: 'gpu' # Devices optional: “cpu”, “gpu”, “tpu”, “ipu”, “hpu”, “mps”, “auto”
3
+ DEVICE: [0,1,2,3]
4
+
5
+ FOLDER: ./checkpoints
6
+ SEED_VALUE: 1234
7
+ Norm: True
8
+ DEBUG: False
9
+ Discriminator: False
10
+ FineTune: False
11
+ TRAIN:
12
+ STAGE: diffusion # diffusion
13
+ SPLIT: 'train'
14
+ NUM_WORKERS: 16 # Number of workers
15
+ BATCH_SIZE: 190 # Size of batches
16
+ START_EPOCH: 1 # Start epoch
17
+ END_EPOCH: 3001 # End epoch
18
+ RESUME: '/home/seungho/research/lodge/experiments/Global_Module/debug--FineDance_Coarse_v2_relative_noNorm_128len_139_diff_bc800/' # Experiment path to be resumed training
19
+ PRETRAINED_VAE: ''
20
+ PRETRAINED: 'checkpoints/exp/Local_Module/FineDance_FineTuneV2_Local/checkpoints/epoch=299.ckpt' # Attention! Set your Pretrained model path
21
+ DATASETS: ['FINEDANCE_139CUT'] # Training datasets
22
+
23
+ # OPTIM:
24
+ # TYPE: 'AdamW' # Optimizer type
25
+ # LR: 1e-4 # Learning rate
26
+ OPTIM:
27
+ TYPE: 'Adan' # Optimizer type
28
+ LR: 4e-4 # Learning rate
29
+
30
+ ABLATION:
31
+ VAE_TYPE: 'no' # vae ablation: actor or mcross
32
+ VAE_ARCH: 'encoder_decoder' # mdiffusion vae architecture
33
+ PE_TYPE: 'actor' # mdiffusion mld or actor
34
+ DIFF_PE_TYPE: 'actor' # mdiffusion mld or actor
35
+ SKIP_CONNECT: False # skip connection for denoiser va
36
+ # use linear to expand mean and std rather expand token nums
37
+ MLP_DIST: False
38
+ IS_DIST: False # Mcross distribution kl
39
+ PREDICT_EPSILON: False # noise or motion
40
+
41
+ EVAL:
42
+ SPLIT: 'gtest'
43
+ BATCH_SIZE: 32 # Evaluating Batch size
44
+ NUM_WORKERS: 16 # Number of workers for evaluation
45
+
46
+ TEST:
47
+ TEST_DIR: ''
48
+ CHECKPOINTS: ''
49
+ SPLIT: 'gtest'
50
+ BATCH_SIZE: 32 # Testing Batch size
51
+ NUM_WORKERS: 12 # Number of workers for testing
52
+ SAVE_PREDICTIONS: True # Whether to save predictions
53
+ COUNT_TIME: False # Whether to count time during test
54
+ REPLICATION_TIMES: 2 # Number of times to replicate the test
55
+ MM_NUM_SAMPLES: 100 # Number of samples for multimodal test
56
+ MM_NUM_REPEATS: 30 # Number of repeats for multimodal test
57
+ MM_NUM_TIMES: 10 # Number of times to repeat the multimodal test
58
+ DIVERSITY_TIMES: 300 # Number of times to repeat the diversity test
59
+ REP_I: 0
60
+ DATASETS: ['FINEDANCE_139CUT']
61
+
62
+ model:
63
+ target: 'modules'
64
+ vae_type: 'no'
65
+
66
+ vae: true # whether vae model
67
+ model_type: Global_Module # model type
68
+ condition: 'music'
69
+ latent_dim: [1, 256] #[512, 135] # [${FINEDANCE.full_seq_len}, ${DATASET.NFEATS}] # # latent dimension
70
+ ff_size: 1024 #
71
+ num_layers: 9 # number of layers
72
+ num_head: 4 # number of head layers
73
+ droupout: 0.1 # dropout rate
74
+ activation: gelu # activation type
75
+ guidance_scale: 7.5 # 7.5 #
76
+ guidance_uncondp: 0.1 # 0.1 0.25
77
+
78
+ diffusion:
79
+ target: dld.models.architectures.diffusion.GaussianDiffusion
80
+ params:
81
+ horizon: ${FINEDANCE.full_seq_len}
82
+ repr_dim: ${FINEDANCE.nfeats}
83
+ schedule: "cosine"
84
+ n_timestep: 1000
85
+ predict_epsilon: False
86
+ loss_type: "l2"
87
+ use_p2: False
88
+ cond_drop_prob: 0.25
89
+ guidance_weight: 2
90
+
91
+ DanceDecoder:
92
+ target: dld.models.architectures.model.DanceDecoderv2
93
+ params:
94
+ nfeats: ${FINEDANCE.nfeats}
95
+ seq_len: ${FINEDANCE.full_seq_len}
96
+ latent_dim: 512
97
+ ff_size: 1024
98
+ num_layers: 8
99
+ num_heads: 8
100
+ dropout: 0.1
101
+ cond_feature_dim: 35
102
+ activation: gelu
103
+
104
+
105
+ LOSS:
106
+ TYPE: smpl_loss # Losses type
107
+ LAMBDA_MSE: 0.636
108
+ LAMBDA_V: 2.964
109
+ LAMBDA_FK: 0.636
110
+ LAMBDA_FOOT: 10.942 # Lambda for reconstruction losses
111
+ DIST_SYNC_ON_STEP: True # Sync Losses on step when distributed trained
112
+ METRIC:
113
+ FORCE_IN_METER: True
114
+ DIST_SYNC_ON_STEP: True # # Sync Losses on step when distributed trained
115
+ TYPE: ['DanceDiffuse_Metric'] # DanceAE_Metric
116
+ LOGGER:
117
+ SACE_CHECKPOINT_EPOCH: 30
118
+ LOG_EVERY_STEPS: 30
119
+ VAL_EVERY_STEPS: 30
120
+ TENSORBOARD: true
121
+ WANDB:
122
+ OFFLINE: false
123
+ PROJECT: null
124
+ RESUME_ID: null
125
+ RENDER:
126
+ JOINT_TYPE: mmm
127
+ INPUT_MODE: npy
128
+ DIR: ''
129
+ NPY: ''
130
+ DENOISING: true
131
+ OLDRENDER: true
132
+ RES: high
133
+ DOWNSAMPLE: true
134
+ FPS: 12.5
135
+ CANONICALIZE: true
136
+ EXACT_FRAME: 0.5
137
+ NUM: 7
138
+ MODE: sequence
139
+ VID_EXT: mp4
140
+ ALWAYS_ON_FLOOR: false
141
+ GT: false
142
+ DEMO:
143
+ MusicDir: /data2/lrh/dataset/fine_dance/origin/music
144
+ RENDER: false
145
+ EXAMPLE: null
146
+ use_cached_features: false
147
+
148
+ FINEDANCE:
149
+ mix: False # whether to apply mix data augmentation
150
+ full_seq_len: 256 # 150
151
+ length_fi: 128
152
+ windows: 10 # 16 #40 #
153
+ is_mirror: False # whether to apply mirror data augmentation
154
+ nfeats: 139
155
+ njoints: 22
156
+ mode: single # "single" , "double_react", "double"
157
+ partial: full # "full" , "morden", "tradition"
158
+ GENRE_NUM: 16
configs/lodge/finedance_fea139.yaml ADDED
@@ -0,0 +1,170 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ NAME: FineDance_relative_Norm_GenreDis_bc190 # Experiment name
2
+ ACCELERATOR: 'gpu' # Devices optional: “cpu”, “gpu”, “tpu”, “ipu”, “hpu”, “mps”, “auto”
3
+ DEVICE: [0] #, # # Index of gpus eg. [0] or [0,1,2,3]
4
+
5
+ # FOLDER: ./experiments
6
+ SEED_VALUE: 7777
7
+ Norm: True
8
+ Discriminator: True
9
+ DEBUG: False
10
+ FineTune: false
11
+ TRAIN:
12
+ STAGE: diffusion # diffusion
13
+ SPLIT: 'train'
14
+ NUM_WORKERS: 16 # Number of workers
15
+ BATCH_SIZE: 64 # Size of batches
16
+ START_EPOCH: 1 # Start epoch
17
+ END_EPOCH: 3001 # End epoch
18
+ RESUME: '' # Experiment path to be resumed training
19
+ # PRETRAINED_VAE: ''
20
+ PRETRAINED: '' # Pretrained model path
21
+ DATASETS: ['FINEDANCE_139CUT'] # Training datasets
22
+
23
+ OPTIM:
24
+ TYPE: 'Adan' # Optimizer type
25
+ LR: 4e-4 # Learning rate
26
+
27
+ ABLATION:
28
+ VAE_TYPE: 'no' # vae ablation: actor or mcross
29
+ VAE_ARCH: 'encoder_decoder' # mdiffusion vae architecture
30
+ PE_TYPE: 'actor' # mdiffusion mld or actor
31
+ DIFF_PE_TYPE: 'actor' # mdiffusion mld or actor
32
+ SKIP_CONNECT: False # skip connection for denoiser va
33
+ # use linear to expand mean and std rather expand token nums
34
+ MLP_DIST: False
35
+ IS_DIST: False # Mcross distribution kl
36
+ PREDICT_EPSILON: False # noise or motion
37
+
38
+ EVAL:
39
+ SPLIT: 'gtest'
40
+ BATCH_SIZE: 32 # Evaluating Batch size
41
+ NUM_WORKERS: 16 # Number of workers for evaluation
42
+
43
+ TEST:
44
+ TEST_DIR: ''
45
+ CHECKPOINTS: '' #/data2/lrh/project/dance/Lodge/lodge_pylight/experiments/Edge_Module/0115_newNorm_256len_263_diff_bc768/checkpoints/epoch=3899.ckpt
46
+ SPLIT: 'gtest'
47
+ BATCH_SIZE: 32 # Testing Batch size
48
+ NUM_WORKERS: 12 # Number of workers for testing
49
+ SAVE_PREDICTIONS: True # Whether to save predictions
50
+ COUNT_TIME: False # Whether to count time during test
51
+ REPLICATION_TIMES: 2 # Number of times to replicate the test
52
+ MM_NUM_SAMPLES: 100 # Number of samples for multimodal test
53
+ MM_NUM_REPEATS: 30 # Number of repeats for multimodal test
54
+ MM_NUM_TIMES: 10 # Number of times to repeat the multimodal test
55
+ DIVERSITY_TIMES: 300 # Number of times to repeat the diversity test
56
+ REP_I: 0
57
+ DATASETS: ['FINEDANCE_139CUT']
58
+
59
+ model:
60
+ target: 'modules'
61
+ vae_type: 'no'
62
+
63
+ vae: true # whether vae model
64
+ model_type: Local_Module # model type
65
+ condition: 'music'
66
+ latent_dim: [1, 256] #[512, 135] # [${FINEDANCE.full_seq_len}, ${DATASET.NFEATS}] # # latent dimension
67
+ ff_size: 1024 #
68
+ num_layers: 9 # number of layers
69
+ num_head: 4 # number of head layers
70
+ droupout: 0.1 # dropout rate
71
+ activation: gelu # activation type
72
+ guidance_scale: 7.5 # 7.5 #
73
+ guidance_uncondp: 0.1 # 0.1 0.25
74
+
75
+
76
+ diffusion:
77
+ target: dld.models.architectures.diffusion.GaussianDiffusion
78
+ params:
79
+ horizon: ${FINEDANCE.full_seq_len}
80
+ repr_dim: ${FINEDANCE.nfeats}
81
+ schedule: "cosine"
82
+ n_timestep: 1000
83
+ predict_epsilon: False
84
+ loss_type: "l2"
85
+ use_p2: False
86
+ cond_drop_prob: 0.25
87
+ guidance_weight: 2
88
+
89
+ DanceDecoder:
90
+ target: dld.models.architectures.model.Refine_DanceDecoder
91
+ params:
92
+ nfeats: ${FINEDANCE.nfeats}
93
+ seq_len: ${FINEDANCE.full_seq_len}
94
+ latent_dim: 512
95
+ ff_size: 1024
96
+ num_layers: 8
97
+ num_heads: 8
98
+ dropout: 0.1
99
+ cond_feature_dim: 35
100
+ activation: gelu
101
+
102
+ DanceDiscriminator:
103
+ target: dld.models.architectures.model.DanceDiscriminator
104
+ params:
105
+ nfeats: ${FINEDANCE.nfeats}
106
+ seq_len: ${FINEDANCE.full_seq_len}
107
+ latent_dim: 512
108
+ ff_size: 1024
109
+ num_layers: 8
110
+ num_heads: 8
111
+ dropout: 0.1
112
+ cond_feature_dim: 35
113
+ activation: gelu
114
+
115
+ LOSS:
116
+ TYPE: smpl_loss_relative # Losses type
117
+ LAMBDA_MSE: 0.636
118
+ LAMBDA_V: 2.964
119
+ LAMBDA_FK: 1
120
+ LAMBDA_FOOT: 20 # Lambda for reconstruction losses
121
+ LAMBDA_FC: 0
122
+ LAMBDA_TRANS: 0
123
+ LAMBDA_DIS: 0.1
124
+ DIST_SYNC_ON_STEP: True # Sync Losses on step when distributed trained
125
+ METRIC:
126
+ FORCE_IN_METER: True
127
+ DIST_SYNC_ON_STEP: True # # Sync Losses on step when distributed trained
128
+ TYPE: ['DanceDiffuse_Metric'] # DanceAE_Metric
129
+ LOGGER:
130
+ SACE_CHECKPOINT_EPOCH: 100 # save interval
131
+ LOG_EVERY_STEPS: 100
132
+ VAL_EVERY_STEPS: 100
133
+ TENSORBOARD: true
134
+ WANDB:
135
+ OFFLINE: false
136
+ PROJECT: null
137
+ RESUME_ID: null
138
+ RENDER:
139
+ JOINT_TYPE: mmm
140
+ INPUT_MODE: npy
141
+ DIR: ''
142
+ NPY: ''
143
+ DENOISING: true
144
+ OLDRENDER: true
145
+ RES: high
146
+ DOWNSAMPLE: true
147
+ FPS: 12.5
148
+ CANONICALIZE: true
149
+ EXACT_FRAME: 0.5
150
+ NUM: 7
151
+ MODE: sequence
152
+ VID_EXT: mp4
153
+ ALWAYS_ON_FLOOR: false
154
+ GT: false
155
+ DEMO:
156
+ MusicDir: /data2/lrh/dataset/fine_dance/origin/music
157
+ RENDER: false
158
+ EXAMPLE: null
159
+ use_cached_features: false
160
+
161
+ FINEDANCE:
162
+ mix: False # whether to apply mix data augmentation
163
+ full_seq_len: 256 # 150
164
+ windows: 8 # 16 #40 #
165
+ is_mirror: False # whether to apply mirror data augmentation
166
+ nfeats: 139
167
+ njoints: 22
168
+ mode: single # "single" , "double_react", "double"
169
+ partial: full # "full" , "morden", "tradition"
170
+ GENRE_NUM: 16
configs/lodge/finedance_fea139_finetune_v2.yaml ADDED
@@ -0,0 +1,169 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ NAME: Debug_FineDance_FineTuneV2_Local # Experiment name
2
+ ACCELERATOR: 'gpu' # Devices optional: “cpu”, “gpu”, “tpu”, “ipu”, “hpu”, “mps”, “auto”
3
+ DEVICE: [0,1,2,3] #, # # Index of gpus eg. [0] or [0,1,2,3]
4
+
5
+ # FOLDER: ./experiments
6
+ SEED_VALUE: 1233
7
+ Norm: True
8
+ Discriminator: True
9
+ DEBUG: False
10
+ FineTune: True
11
+ TRAIN:
12
+ STAGE: diffusion # diffusion
13
+ SPLIT: 'train'
14
+ NUM_WORKERS: 16 # Number of workers
15
+ BATCH_SIZE: 190 # Size of batches
16
+ START_EPOCH: 1 # Start epoch
17
+ END_EPOCH: 1601 # End epoch
18
+ RESUME: '' # Experiment path to be resumed training
19
+ PRETRAINED: '/data2/lrh/project/dance/Lodge/lodge302/experiments/Local_Module/FineDance_relative_Norm_GenreDis_bc190/checkpoints/epoch=1399.ckpt' # Pretrained model path
20
+ DATASETS: ['FINEDANCE_139CUT'] # Training datasets
21
+
22
+ OPTIM:
23
+ TYPE: 'Adan' # Optimizer type
24
+ LR: 4e-4 # Learning rate
25
+
26
+ ABLATION:
27
+ VAE_TYPE: 'no' # vae ablation: actor or mcross
28
+ VAE_ARCH: 'encoder_decoder' # mdiffusion vae architecture
29
+ PE_TYPE: 'actor' # mdiffusion mld or actor
30
+ DIFF_PE_TYPE: 'actor' # mdiffusion mld or actor
31
+ SKIP_CONNECT: False # skip connection for denoiser va
32
+ # use linear to expand mean and std rather expand token nums
33
+ MLP_DIST: False
34
+ IS_DIST: False # Mcross distribution kl
35
+ PREDICT_EPSILON: False # noise or motion
36
+
37
+ EVAL:
38
+ SPLIT: 'gtest'
39
+ BATCH_SIZE: 256 # Evaluating Batch size
40
+ NUM_WORKERS: 16 # Number of workers for evaluation
41
+ TEST:
42
+ TEST_DIR: ''
43
+ CHECKPOINTS: ''
44
+ SPLIT: 'gtest'
45
+ BATCH_SIZE: 256 # Testing Batch size
46
+ NUM_WORKERS: 12 # Number of workers for testing
47
+ SAVE_PREDICTIONS: True # Whether to save predictions
48
+ COUNT_TIME: False # Whether to count time during test
49
+ REPLICATION_TIMES: 2 # Number of times to replicate the test
50
+ MM_NUM_SAMPLES: 100 # Number of samples for multimodal test
51
+ MM_NUM_REPEATS: 30 # Number of repeats for multimodal test
52
+ MM_NUM_TIMES: 10 # Number of times to repeat the multimodal test
53
+ DIVERSITY_TIMES: 300 # Number of times to repeat the diversity test
54
+ REP_I: 0
55
+ DATASETS: ['FINEDANCE_139CUT']
56
+
57
+ model:
58
+ target: 'modules'
59
+ vae_type: 'no'
60
+
61
+ vae: true # whether vae model
62
+ model_type: Local_Module # model type
63
+ condition: 'music'
64
+ latent_dim: [1, 256] #[512, 135] # [${FINEDANCE.full_seq_len}, ${DATASET.NFEATS}] # # latent dimension
65
+ ff_size: 1024 #
66
+ num_layers: 9 # number of layers
67
+ num_head: 4 # number of head layers
68
+ droupout: 0.1 # dropout rate
69
+ activation: gelu # activation type
70
+ guidance_scale: 7.5 # 7.5 #
71
+ guidance_uncondp: 0.1 # 0.1 0.25
72
+
73
+ diffusion:
74
+ target: dld.models.architectures.diffusion.GaussianDiffusion
75
+ params:
76
+ horizon: ${FINEDANCE.full_seq_len}
77
+ repr_dim: ${FINEDANCE.nfeats}
78
+ schedule: "cosine"
79
+ n_timestep: 1000
80
+ predict_epsilon: False
81
+ loss_type: "l2"
82
+ use_p2: False
83
+ cond_drop_prob: 0.25
84
+ guidance_weight: 2
85
+
86
+ DanceDecoder:
87
+ target: dld.models.architectures.model.Refine_DanceDecoder
88
+ params:
89
+ nfeats: ${FINEDANCE.nfeats}
90
+ seq_len: ${FINEDANCE.full_seq_len}
91
+ latent_dim: 512
92
+ ff_size: 1024
93
+ num_layers: 8
94
+ num_heads: 8
95
+ dropout: 0.1
96
+ cond_feature_dim: 35
97
+ activation: gelu
98
+
99
+ DanceDiscriminator:
100
+ target: dld.models.architectures.model.DanceDiscriminator
101
+ params:
102
+ nfeats: ${FINEDANCE.nfeats}
103
+ seq_len: ${FINEDANCE.full_seq_len}
104
+ latent_dim: 512
105
+ ff_size: 1024
106
+ num_layers: 8
107
+ num_heads: 8
108
+ dropout: 0.1
109
+ cond_feature_dim: 35
110
+ activation: gelu
111
+
112
+ LOSS:
113
+ TYPE: smpl_loss_relative # Losses type
114
+ LAMBDA_MSE: 0.636
115
+ LAMBDA_V: 2.964
116
+ LAMBDA_FK: 1
117
+ LAMBDA_FK_V: 0
118
+ LAMBDA_FK_A: 0
119
+ LAMBDA_FOOT: 10 # Lambda for reconstruction losses
120
+ LAMBDA_FC: 0
121
+ LAMBDA_TRANS: 0.5
122
+ LAMBDA_DIS: 0.1
123
+ DIST_SYNC_ON_STEP: True # Sync Losses on step when distributed trained
124
+ METRIC:
125
+ FORCE_IN_METER: True
126
+ DIST_SYNC_ON_STEP: True # # Sync Losses on step when distributed trained
127
+ TYPE: ['DanceDiffuse_Metric'] # DanceAE_Metric
128
+ LOGGER:
129
+ SACE_CHECKPOINT_EPOCH: 50 # save interval
130
+ LOG_EVERY_STEPS: 50
131
+ VAL_EVERY_STEPS: 50
132
+ TENSORBOARD: true
133
+ WANDB:
134
+ OFFLINE: false
135
+ PROJECT: null
136
+ RESUME_ID: null
137
+ RENDER:
138
+ JOINT_TYPE: mmm
139
+ INPUT_MODE: npy
140
+ DIR: ''
141
+ NPY: ''
142
+ DENOISING: true
143
+ OLDRENDER: true
144
+ RES: high
145
+ DOWNSAMPLE: true
146
+ FPS: 12.5
147
+ CANONICALIZE: true
148
+ EXACT_FRAME: 0.5
149
+ NUM: 7
150
+ MODE: sequence
151
+ VID_EXT: mp4
152
+ ALWAYS_ON_FLOOR: false
153
+ GT: false
154
+ DEMO:
155
+ MusicDir: /data2/lrh/dataset/fine_dance/origin/music
156
+ RENDER: false
157
+ EXAMPLE: null
158
+ use_cached_features: false
159
+
160
+ FINEDANCE:
161
+ mix: False # whether to apply mix data augmentation
162
+ full_seq_len: 256 # 150
163
+ windows: 8 # 16 #40 #
164
+ is_mirror: False # whether to apply mirror data augmentation
165
+ nfeats: 139
166
+ njoints: 22
167
+ mode: single # "single" , "double_react", "double"
168
+ partial: full # "full" , "morden", "tradition"
169
+ GENRE_NUM: 16