Upload 16 files
Browse files
- checkpoints/epoch=119.ckpt +3 -0
- checkpoints/epoch=149.ckpt +3 -0
- checkpoints/epoch=179.ckpt +3 -0
- checkpoints/epoch=209.ckpt +3 -0
- checkpoints/epoch=239.ckpt +3 -0
- checkpoints/epoch=269.ckpt +3 -0
- checkpoints/epoch=299.ckpt +3 -0
- checkpoints/epoch=329.ckpt +3 -0
- checkpoints/epoch=359.ckpt +3 -0
- checkpoints/epoch=389.ckpt +3 -0
- checkpoints/epoch=49.ckpt +3 -0
- checkpoints/epoch=99.ckpt +3 -0
- configs/data/assets.yaml +18 -0
- configs/lodge/coarse_finedance_fea139.yaml +158 -0
- configs/lodge/finedance_fea139.yaml +170 -0
- configs/lodge/finedance_fea139_finetune_v2.yaml +169 -0
checkpoints/epoch=119.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:790f0cababdc401ca0455ddff64ef7ddb7082f5706e30f29e9bd87189c6c4f67
|
3 |
+
size 1130308662
|
checkpoints/epoch=149.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f70cc12964dff35aa733c92d1e1d1f9edec52a1f348f5bd754904b5708b76e96
|
3 |
+
size 1130309045
|
checkpoints/epoch=179.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0e781b61aac30c5569790f9c09d43a5bd635f069b85ce199abecbaf27568c6bc
|
3 |
+
size 1130309428
|
checkpoints/epoch=209.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bbe35341bb9434977a93a9dc4c176ee0bd9144b8e0788b272491aeecf774d4f9
|
3 |
+
size 1130309811
|
checkpoints/epoch=239.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bdb38ceae6149b94d3c5f171251c6719953dcd4468ce9018d93919fa2ae80d36
|
3 |
+
size 1130310194
|
checkpoints/epoch=269.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:486846f0f378342ba43c68bf0ff95c37a561b479585ccd8446072ec119636015
|
3 |
+
size 1130310577
|
checkpoints/epoch=299.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:091bae9ef1807cd69f3a2a9773b93f2e909e69fea75b6bfb9985987b0ff78736
|
3 |
+
size 1130310960
|
checkpoints/epoch=329.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:31d2f4447924b8d3ea89228d028d3f676e741b4a292eb8e1a59c24b210148e74
|
3 |
+
size 1130311343
|
checkpoints/epoch=359.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:11c4eab8e78db60b9ef9f8f99e950eefcd8f9b335e36c0686c10b92e078f39fc
|
3 |
+
size 1130311790
|
checkpoints/epoch=389.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6b23d0d1aa700ca5e8cca573dbae90aa96da6bd1603536ef3efa6146d2fb69d3
|
3 |
+
size 1130312173
|
checkpoints/epoch=49.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ec566353eec79dd9fa60cf721177acf2251840d9591726d329dd5039d2350ed
|
3 |
+
size 1130308662
|
checkpoints/epoch=99.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cdf355a4970e4ab3979a238dfc37dcbf04dfef8c1fd2c20a2c860b312c0f398c
|
3 |
+
size 1130309045
|
configs/data/assets.yaml
ADDED
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
FOLDER: './checkpoints' # Experiment files saving path
|
2 |
+
|
3 |
+
TEST:
|
4 |
+
FOLDER: './outputs' # Testing files saving path
|
5 |
+
|
6 |
+
DATASET:
|
7 |
+
SMPL_PATH: '/data2/lrh/smpl_model/smpl'
|
8 |
+
SMPLH_PATH: '/data2/lrh/smpl_model/smplh'
|
9 |
+
SMPLX_PATH: '/data2/lrh/smpl_model/smplx'
|
10 |
+
FINEDANCE_139CUT:
|
11 |
+
ROOT: data/finedance
|
12 |
+
MOTION: data/finedance/mofea319
|
13 |
+
MUSIC: data/finedance/music_npynew
|
14 |
+
normalizer: data/Normalizer.pth
|
15 |
+
LABEL: data/finedance/label_json/
|
16 |
+
|
17 |
+
|
18 |
+
|
configs/lodge/coarse_finedance_fea139.yaml
ADDED
@@ -0,0 +1,158 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
NAME: FineDance_Coarse_v2_relative_noNorm_128len_139_diff_bc800 # Experiment name
|
2 |
+
ACCELERATOR: 'gpu' # Devices optional: “cpu”, “gpu”, “tpu”, “ipu”, “hpu”, “mps”, “auto”
|
3 |
+
DEVICE: [0,1,2,3]
|
4 |
+
|
5 |
+
FOLDER: ./checkpoints
|
6 |
+
SEED_VALUE: 1234
|
7 |
+
Norm: True
|
8 |
+
DEBUG: False
|
9 |
+
Discriminator: False
|
10 |
+
FineTune: False
|
11 |
+
TRAIN:
|
12 |
+
STAGE: diffusion # diffusion
|
13 |
+
SPLIT: 'train'
|
14 |
+
NUM_WORKERS: 16 # Number of workers
|
15 |
+
BATCH_SIZE: 190 # Size of batches
|
16 |
+
START_EPOCH: 1 # Start epoch
|
17 |
+
END_EPOCH: 3001 # End epoch
|
18 |
+
RESUME: '/home/seungho/research/lodge/experiments/Global_Module/debug--FineDance_Coarse_v2_relative_noNorm_128len_139_diff_bc800/' # Experiment path to be resumed training
|
19 |
+
PRETRAINED_VAE: ''
|
20 |
+
PRETRAINED: 'checkpoints/exp/Local_Module/FineDance_FineTuneV2_Local/checkpoints/epoch=299.ckpt' # Attention! Set your Pretrained model path
|
21 |
+
DATASETS: ['FINEDANCE_139CUT'] # Training datasets
|
22 |
+
|
23 |
+
# OPTIM:
|
24 |
+
# TYPE: 'AdamW' # Optimizer type
|
25 |
+
# LR: 1e-4 # Learning rate
|
26 |
+
OPTIM:
|
27 |
+
TYPE: 'Adan' # Optimizer type
|
28 |
+
LR: 4e-4 # Learning rate
|
29 |
+
|
30 |
+
ABLATION:
|
31 |
+
VAE_TYPE: 'no' # vae ablation: actor or mcross
|
32 |
+
VAE_ARCH: 'encoder_decoder' # mdiffusion vae architecture
|
33 |
+
PE_TYPE: 'actor' # mdiffusion mld or actor
|
34 |
+
DIFF_PE_TYPE: 'actor' # mdiffusion mld or actor
|
35 |
+
SKIP_CONNECT: False # skip connection for denoiser va
|
36 |
+
# use a linear layer to expand mean and std rather than expanding token nums
|
37 |
+
MLP_DIST: False
|
38 |
+
IS_DIST: False # Mcross distribution kl
|
39 |
+
PREDICT_EPSILON: False # noise or motion
|
40 |
+
|
41 |
+
EVAL:
|
42 |
+
SPLIT: 'gtest'
|
43 |
+
BATCH_SIZE: 32 # Evaluating Batch size
|
44 |
+
NUM_WORKERS: 16 # Number of workers for evaluation
|
45 |
+
|
46 |
+
TEST:
|
47 |
+
TEST_DIR: ''
|
48 |
+
CHECKPOINTS: ''
|
49 |
+
SPLIT: 'gtest'
|
50 |
+
BATCH_SIZE: 32 # Testing Batch size
|
51 |
+
NUM_WORKERS: 12 # Number of workers for testing
|
52 |
+
SAVE_PREDICTIONS: True # Whether to save predictions
|
53 |
+
COUNT_TIME: False # Whether to count time during test
|
54 |
+
REPLICATION_TIMES: 2 # Number of times to replicate the test
|
55 |
+
MM_NUM_SAMPLES: 100 # Number of samples for multimodal test
|
56 |
+
MM_NUM_REPEATS: 30 # Number of repeats for multimodal test
|
57 |
+
MM_NUM_TIMES: 10 # Number of times to repeat the multimodal test
|
58 |
+
DIVERSITY_TIMES: 300 # Number of times to repeat the diversity test
|
59 |
+
REP_I: 0
|
60 |
+
DATASETS: ['FINEDANCE_139CUT']
|
61 |
+
|
62 |
+
model:
|
63 |
+
target: 'modules'
|
64 |
+
vae_type: 'no'
|
65 |
+
|
66 |
+
vae: true # whether vae model
|
67 |
+
model_type: Global_Module # model type
|
68 |
+
condition: 'music'
|
69 |
+
latent_dim: [1, 256] #[512, 135] # [${FINEDANCE.full_seq_len}, ${DATASET.NFEATS}] # # latent dimension
|
70 |
+
ff_size: 1024 #
|
71 |
+
num_layers: 9 # number of layers
|
72 |
+
num_head: 4 # number of head layers
|
73 |
+
droupout: 0.1 # dropout rate
|
74 |
+
activation: gelu # activation type
|
75 |
+
guidance_scale: 7.5 # 7.5 #
|
76 |
+
guidance_uncondp: 0.1 # 0.1 0.25
|
77 |
+
|
78 |
+
diffusion:
|
79 |
+
target: dld.models.architectures.diffusion.GaussianDiffusion
|
80 |
+
params:
|
81 |
+
horizon: ${FINEDANCE.full_seq_len}
|
82 |
+
repr_dim: ${FINEDANCE.nfeats}
|
83 |
+
schedule: "cosine"
|
84 |
+
n_timestep: 1000
|
85 |
+
predict_epsilon: False
|
86 |
+
loss_type: "l2"
|
87 |
+
use_p2: False
|
88 |
+
cond_drop_prob: 0.25
|
89 |
+
guidance_weight: 2
|
90 |
+
|
91 |
+
DanceDecoder:
|
92 |
+
target: dld.models.architectures.model.DanceDecoderv2
|
93 |
+
params:
|
94 |
+
nfeats: ${FINEDANCE.nfeats}
|
95 |
+
seq_len: ${FINEDANCE.full_seq_len}
|
96 |
+
latent_dim: 512
|
97 |
+
ff_size: 1024
|
98 |
+
num_layers: 8
|
99 |
+
num_heads: 8
|
100 |
+
dropout: 0.1
|
101 |
+
cond_feature_dim: 35
|
102 |
+
activation: gelu
|
103 |
+
|
104 |
+
|
105 |
+
LOSS:
|
106 |
+
TYPE: smpl_loss # Losses type
|
107 |
+
LAMBDA_MSE: 0.636
|
108 |
+
LAMBDA_V: 2.964
|
109 |
+
LAMBDA_FK: 0.636
|
110 |
+
LAMBDA_FOOT: 10.942 # Lambda for reconstruction losses
|
111 |
+
DIST_SYNC_ON_STEP: True # Sync Losses on step when distributed trained
|
112 |
+
METRIC:
|
113 |
+
FORCE_IN_METER: True
|
114 |
+
DIST_SYNC_ON_STEP: True # # Sync Losses on step when distributed trained
|
115 |
+
TYPE: ['DanceDiffuse_Metric'] # DanceAE_Metric
|
116 |
+
LOGGER:
|
117 |
+
SACE_CHECKPOINT_EPOCH: 30
|
118 |
+
LOG_EVERY_STEPS: 30
|
119 |
+
VAL_EVERY_STEPS: 30
|
120 |
+
TENSORBOARD: true
|
121 |
+
WANDB:
|
122 |
+
OFFLINE: false
|
123 |
+
PROJECT: null
|
124 |
+
RESUME_ID: null
|
125 |
+
RENDER:
|
126 |
+
JOINT_TYPE: mmm
|
127 |
+
INPUT_MODE: npy
|
128 |
+
DIR: ''
|
129 |
+
NPY: ''
|
130 |
+
DENOISING: true
|
131 |
+
OLDRENDER: true
|
132 |
+
RES: high
|
133 |
+
DOWNSAMPLE: true
|
134 |
+
FPS: 12.5
|
135 |
+
CANONICALIZE: true
|
136 |
+
EXACT_FRAME: 0.5
|
137 |
+
NUM: 7
|
138 |
+
MODE: sequence
|
139 |
+
VID_EXT: mp4
|
140 |
+
ALWAYS_ON_FLOOR: false
|
141 |
+
GT: false
|
142 |
+
DEMO:
|
143 |
+
MusicDir: /data2/lrh/dataset/fine_dance/origin/music
|
144 |
+
RENDER: false
|
145 |
+
EXAMPLE: null
|
146 |
+
use_cached_features: false
|
147 |
+
|
148 |
+
FINEDANCE:
|
149 |
+
mix: False # whether to apply mix data augmentation
|
150 |
+
full_seq_len: 256 # 150
|
151 |
+
length_fi: 128
|
152 |
+
windows: 10 # 16 #40 #
|
153 |
+
is_mirror: False # whether to apply mirror data augmentation
|
154 |
+
nfeats: 139
|
155 |
+
njoints: 22
|
156 |
+
mode: single # "single" , "double_react", "double"
|
157 |
+
partial: full # "full" , "morden", "tradition"
|
158 |
+
GENRE_NUM: 16
|
configs/lodge/finedance_fea139.yaml
ADDED
@@ -0,0 +1,170 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
NAME: FineDance_relative_Norm_GenreDis_bc190 # Experiment name
|
2 |
+
ACCELERATOR: 'gpu' # Devices optional: “cpu”, “gpu”, “tpu”, “ipu”, “hpu”, “mps”, “auto”
|
3 |
+
DEVICE: [0] # Index of GPUs, e.g. [0] or [0,1,2,3]
|
4 |
+
|
5 |
+
# FOLDER: ./experiments
|
6 |
+
SEED_VALUE: 7777
|
7 |
+
Norm: True
|
8 |
+
Discriminator: True
|
9 |
+
DEBUG: False
|
10 |
+
FineTune: false
|
11 |
+
TRAIN:
|
12 |
+
STAGE: diffusion # diffusion
|
13 |
+
SPLIT: 'train'
|
14 |
+
NUM_WORKERS: 16 # Number of workers
|
15 |
+
BATCH_SIZE: 64 # Size of batches
|
16 |
+
START_EPOCH: 1 # Start epoch
|
17 |
+
END_EPOCH: 3001 # End epoch
|
18 |
+
RESUME: '' # Experiment path to be resumed training
|
19 |
+
# PRETRAINED_VAE: ''
|
20 |
+
PRETRAINED: '' # Pretrained model path
|
21 |
+
DATASETS: ['FINEDANCE_139CUT'] # Training datasets
|
22 |
+
|
23 |
+
OPTIM:
|
24 |
+
TYPE: 'Adan' # Optimizer type
|
25 |
+
LR: 4e-4 # Learning rate
|
26 |
+
|
27 |
+
ABLATION:
|
28 |
+
VAE_TYPE: 'no' # vae ablation: actor or mcross
|
29 |
+
VAE_ARCH: 'encoder_decoder' # mdiffusion vae architecture
|
30 |
+
PE_TYPE: 'actor' # mdiffusion mld or actor
|
31 |
+
DIFF_PE_TYPE: 'actor' # mdiffusion mld or actor
|
32 |
+
SKIP_CONNECT: False # skip connection for denoiser va
|
33 |
+
# use a linear layer to expand mean and std rather than expanding token nums
|
34 |
+
MLP_DIST: False
|
35 |
+
IS_DIST: False # Mcross distribution kl
|
36 |
+
PREDICT_EPSILON: False # noise or motion
|
37 |
+
|
38 |
+
EVAL:
|
39 |
+
SPLIT: 'gtest'
|
40 |
+
BATCH_SIZE: 32 # Evaluating Batch size
|
41 |
+
NUM_WORKERS: 16 # Number of workers for evaluation
|
42 |
+
|
43 |
+
TEST:
|
44 |
+
TEST_DIR: ''
|
45 |
+
CHECKPOINTS: '' #/data2/lrh/project/dance/Lodge/lodge_pylight/experiments/Edge_Module/0115_newNorm_256len_263_diff_bc768/checkpoints/epoch=3899.ckpt
|
46 |
+
SPLIT: 'gtest'
|
47 |
+
BATCH_SIZE: 32 # Testing Batch size
|
48 |
+
NUM_WORKERS: 12 # Number of workers for testing
|
49 |
+
SAVE_PREDICTIONS: True # Whether to save predictions
|
50 |
+
COUNT_TIME: False # Whether to count time during test
|
51 |
+
REPLICATION_TIMES: 2 # Number of times to replicate the test
|
52 |
+
MM_NUM_SAMPLES: 100 # Number of samples for multimodal test
|
53 |
+
MM_NUM_REPEATS: 30 # Number of repeats for multimodal test
|
54 |
+
MM_NUM_TIMES: 10 # Number of times to repeat the multimodal test
|
55 |
+
DIVERSITY_TIMES: 300 # Number of times to repeat the diversity test
|
56 |
+
REP_I: 0
|
57 |
+
DATASETS: ['FINEDANCE_139CUT']
|
58 |
+
|
59 |
+
model:
|
60 |
+
target: 'modules'
|
61 |
+
vae_type: 'no'
|
62 |
+
|
63 |
+
vae: true # whether vae model
|
64 |
+
model_type: Local_Module # model type
|
65 |
+
condition: 'music'
|
66 |
+
latent_dim: [1, 256] #[512, 135] # [${FINEDANCE.full_seq_len}, ${DATASET.NFEATS}] # # latent dimension
|
67 |
+
ff_size: 1024 #
|
68 |
+
num_layers: 9 # number of layers
|
69 |
+
num_head: 4 # number of head layers
|
70 |
+
droupout: 0.1 # dropout rate
|
71 |
+
activation: gelu # activation type
|
72 |
+
guidance_scale: 7.5 # 7.5 #
|
73 |
+
guidance_uncondp: 0.1 # 0.1 0.25
|
74 |
+
|
75 |
+
|
76 |
+
diffusion:
|
77 |
+
target: dld.models.architectures.diffusion.GaussianDiffusion
|
78 |
+
params:
|
79 |
+
horizon: ${FINEDANCE.full_seq_len}
|
80 |
+
repr_dim: ${FINEDANCE.nfeats}
|
81 |
+
schedule: "cosine"
|
82 |
+
n_timestep: 1000
|
83 |
+
predict_epsilon: False
|
84 |
+
loss_type: "l2"
|
85 |
+
use_p2: False
|
86 |
+
cond_drop_prob: 0.25
|
87 |
+
guidance_weight: 2
|
88 |
+
|
89 |
+
DanceDecoder:
|
90 |
+
target: dld.models.architectures.model.Refine_DanceDecoder
|
91 |
+
params:
|
92 |
+
nfeats: ${FINEDANCE.nfeats}
|
93 |
+
seq_len: ${FINEDANCE.full_seq_len}
|
94 |
+
latent_dim: 512
|
95 |
+
ff_size: 1024
|
96 |
+
num_layers: 8
|
97 |
+
num_heads: 8
|
98 |
+
dropout: 0.1
|
99 |
+
cond_feature_dim: 35
|
100 |
+
activation: gelu
|
101 |
+
|
102 |
+
DanceDiscriminator:
|
103 |
+
target: dld.models.architectures.model.DanceDiscriminator
|
104 |
+
params:
|
105 |
+
nfeats: ${FINEDANCE.nfeats}
|
106 |
+
seq_len: ${FINEDANCE.full_seq_len}
|
107 |
+
latent_dim: 512
|
108 |
+
ff_size: 1024
|
109 |
+
num_layers: 8
|
110 |
+
num_heads: 8
|
111 |
+
dropout: 0.1
|
112 |
+
cond_feature_dim: 35
|
113 |
+
activation: gelu
|
114 |
+
|
115 |
+
LOSS:
|
116 |
+
TYPE: smpl_loss_relative # Losses type
|
117 |
+
LAMBDA_MSE: 0.636
|
118 |
+
LAMBDA_V: 2.964
|
119 |
+
LAMBDA_FK: 1
|
120 |
+
LAMBDA_FOOT: 20 # Lambda for reconstruction losses
|
121 |
+
LAMBDA_FC: 0
|
122 |
+
LAMBDA_TRANS: 0
|
123 |
+
LAMBDA_DIS: 0.1
|
124 |
+
DIST_SYNC_ON_STEP: True # Sync Losses on step when distributed trained
|
125 |
+
METRIC:
|
126 |
+
FORCE_IN_METER: True
|
127 |
+
DIST_SYNC_ON_STEP: True # # Sync Losses on step when distributed trained
|
128 |
+
TYPE: ['DanceDiffuse_Metric'] # DanceAE_Metric
|
129 |
+
LOGGER:
|
130 |
+
SACE_CHECKPOINT_EPOCH: 100 # Save interval
|
131 |
+
LOG_EVERY_STEPS: 100
|
132 |
+
VAL_EVERY_STEPS: 100
|
133 |
+
TENSORBOARD: true
|
134 |
+
WANDB:
|
135 |
+
OFFLINE: false
|
136 |
+
PROJECT: null
|
137 |
+
RESUME_ID: null
|
138 |
+
RENDER:
|
139 |
+
JOINT_TYPE: mmm
|
140 |
+
INPUT_MODE: npy
|
141 |
+
DIR: ''
|
142 |
+
NPY: ''
|
143 |
+
DENOISING: true
|
144 |
+
OLDRENDER: true
|
145 |
+
RES: high
|
146 |
+
DOWNSAMPLE: true
|
147 |
+
FPS: 12.5
|
148 |
+
CANONICALIZE: true
|
149 |
+
EXACT_FRAME: 0.5
|
150 |
+
NUM: 7
|
151 |
+
MODE: sequence
|
152 |
+
VID_EXT: mp4
|
153 |
+
ALWAYS_ON_FLOOR: false
|
154 |
+
GT: false
|
155 |
+
DEMO:
|
156 |
+
MusicDir: /data2/lrh/dataset/fine_dance/origin/music
|
157 |
+
RENDER: false
|
158 |
+
EXAMPLE: null
|
159 |
+
use_cached_features: false
|
160 |
+
|
161 |
+
FINEDANCE:
|
162 |
+
mix: False # whether to apply mix data augmentation
|
163 |
+
full_seq_len: 256 # 150
|
164 |
+
windows: 8 # 16 #40 #
|
165 |
+
is_mirror: False # whether to apply mirror data augmentation
|
166 |
+
nfeats: 139
|
167 |
+
njoints: 22
|
168 |
+
mode: single # "single" , "double_react", "double"
|
169 |
+
partial: full # "full" , "morden", "tradition"
|
170 |
+
GENRE_NUM: 16
|
configs/lodge/finedance_fea139_finetune_v2.yaml
ADDED
@@ -0,0 +1,169 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
NAME: Debug_FineDance_FineTuneV2_Local # Experiment name
|
2 |
+
ACCELERATOR: 'gpu' # Devices optional: “cpu”, “gpu”, “tpu”, “ipu”, “hpu”, “mps”, “auto”
|
3 |
+
DEVICE: [0,1,2,3] # Index of GPUs, e.g. [0] or [0,1,2,3]
|
4 |
+
|
5 |
+
# FOLDER: ./experiments
|
6 |
+
SEED_VALUE: 1233
|
7 |
+
Norm: True
|
8 |
+
Discriminator: True
|
9 |
+
DEBUG: False
|
10 |
+
FineTune: True
|
11 |
+
TRAIN:
|
12 |
+
STAGE: diffusion # diffusion
|
13 |
+
SPLIT: 'train'
|
14 |
+
NUM_WORKERS: 16 # Number of workers
|
15 |
+
BATCH_SIZE: 190 # Size of batches
|
16 |
+
START_EPOCH: 1 # Start epoch
|
17 |
+
END_EPOCH: 1601 # End epoch
|
18 |
+
RESUME: '' # Experiment path to be resumed training
|
19 |
+
PRETRAINED: '/data2/lrh/project/dance/Lodge/lodge302/experiments/Local_Module/FineDance_relative_Norm_GenreDis_bc190/checkpoints/epoch=1399.ckpt' # Pretrained model path
|
20 |
+
DATASETS: ['FINEDANCE_139CUT'] # Training datasets
|
21 |
+
|
22 |
+
OPTIM:
|
23 |
+
TYPE: 'Adan' # Optimizer type
|
24 |
+
LR: 4e-4 # Learning rate
|
25 |
+
|
26 |
+
ABLATION:
|
27 |
+
VAE_TYPE: 'no' # vae ablation: actor or mcross
|
28 |
+
VAE_ARCH: 'encoder_decoder' # mdiffusion vae architecture
|
29 |
+
PE_TYPE: 'actor' # mdiffusion mld or actor
|
30 |
+
DIFF_PE_TYPE: 'actor' # mdiffusion mld or actor
|
31 |
+
SKIP_CONNECT: False # skip connection for denoiser va
|
32 |
+
# use a linear layer to expand mean and std rather than expanding token nums
|
33 |
+
MLP_DIST: False
|
34 |
+
IS_DIST: False # Mcross distribution kl
|
35 |
+
PREDICT_EPSILON: False # noise or motion
|
36 |
+
|
37 |
+
EVAL:
|
38 |
+
SPLIT: 'gtest'
|
39 |
+
BATCH_SIZE: 256 # Evaluating Batch size
|
40 |
+
NUM_WORKERS: 16 # Number of workers for evaluation
|
41 |
+
TEST:
|
42 |
+
TEST_DIR: ''
|
43 |
+
CHECKPOINTS: ''
|
44 |
+
SPLIT: 'gtest'
|
45 |
+
BATCH_SIZE: 256 # Testing Batch size
|
46 |
+
NUM_WORKERS: 12 # Number of workers for testing
|
47 |
+
SAVE_PREDICTIONS: True # Whether to save predictions
|
48 |
+
COUNT_TIME: False # Whether to count time during test
|
49 |
+
REPLICATION_TIMES: 2 # Number of times to replicate the test
|
50 |
+
MM_NUM_SAMPLES: 100 # Number of samples for multimodal test
|
51 |
+
MM_NUM_REPEATS: 30 # Number of repeats for multimodal test
|
52 |
+
MM_NUM_TIMES: 10 # Number of times to repeat the multimodal test
|
53 |
+
DIVERSITY_TIMES: 300 # Number of times to repeat the diversity test
|
54 |
+
REP_I: 0
|
55 |
+
DATASETS: ['FINEDANCE_139CUT']
|
56 |
+
|
57 |
+
model:
|
58 |
+
target: 'modules'
|
59 |
+
vae_type: 'no'
|
60 |
+
|
61 |
+
vae: true # whether vae model
|
62 |
+
model_type: Local_Module # model type
|
63 |
+
condition: 'music'
|
64 |
+
latent_dim: [1, 256] #[512, 135] # [${FINEDANCE.full_seq_len}, ${DATASET.NFEATS}] # # latent dimension
|
65 |
+
ff_size: 1024 #
|
66 |
+
num_layers: 9 # number of layers
|
67 |
+
num_head: 4 # number of head layers
|
68 |
+
droupout: 0.1 # dropout rate
|
69 |
+
activation: gelu # activation type
|
70 |
+
guidance_scale: 7.5 # 7.5 #
|
71 |
+
guidance_uncondp: 0.1 # 0.1 0.25
|
72 |
+
|
73 |
+
diffusion:
|
74 |
+
target: dld.models.architectures.diffusion.GaussianDiffusion
|
75 |
+
params:
|
76 |
+
horizon: ${FINEDANCE.full_seq_len}
|
77 |
+
repr_dim: ${FINEDANCE.nfeats}
|
78 |
+
schedule: "cosine"
|
79 |
+
n_timestep: 1000
|
80 |
+
predict_epsilon: False
|
81 |
+
loss_type: "l2"
|
82 |
+
use_p2: False
|
83 |
+
cond_drop_prob: 0.25
|
84 |
+
guidance_weight: 2
|
85 |
+
|
86 |
+
DanceDecoder:
|
87 |
+
target: dld.models.architectures.model.Refine_DanceDecoder
|
88 |
+
params:
|
89 |
+
nfeats: ${FINEDANCE.nfeats}
|
90 |
+
seq_len: ${FINEDANCE.full_seq_len}
|
91 |
+
latent_dim: 512
|
92 |
+
ff_size: 1024
|
93 |
+
num_layers: 8
|
94 |
+
num_heads: 8
|
95 |
+
dropout: 0.1
|
96 |
+
cond_feature_dim: 35
|
97 |
+
activation: gelu
|
98 |
+
|
99 |
+
DanceDiscriminator:
|
100 |
+
target: dld.models.architectures.model.DanceDiscriminator
|
101 |
+
params:
|
102 |
+
nfeats: ${FINEDANCE.nfeats}
|
103 |
+
seq_len: ${FINEDANCE.full_seq_len}
|
104 |
+
latent_dim: 512
|
105 |
+
ff_size: 1024
|
106 |
+
num_layers: 8
|
107 |
+
num_heads: 8
|
108 |
+
dropout: 0.1
|
109 |
+
cond_feature_dim: 35
|
110 |
+
activation: gelu
|
111 |
+
|
112 |
+
LOSS:
|
113 |
+
TYPE: smpl_loss_relative # Losses type
|
114 |
+
LAMBDA_MSE: 0.636
|
115 |
+
LAMBDA_V: 2.964
|
116 |
+
LAMBDA_FK: 1
|
117 |
+
LAMBDA_FK_V: 0
|
118 |
+
LAMBDA_FK_A: 0
|
119 |
+
LAMBDA_FOOT: 10 # Lambda for reconstruction losses
|
120 |
+
LAMBDA_FC: 0
|
121 |
+
LAMBDA_TRANS: 0.5
|
122 |
+
LAMBDA_DIS: 0.1
|
123 |
+
DIST_SYNC_ON_STEP: True # Sync Losses on step when distributed trained
|
124 |
+
METRIC:
|
125 |
+
FORCE_IN_METER: True
|
126 |
+
DIST_SYNC_ON_STEP: True # # Sync Losses on step when distributed trained
|
127 |
+
TYPE: ['DanceDiffuse_Metric'] # DanceAE_Metric
|
128 |
+
LOGGER:
|
129 |
+
SACE_CHECKPOINT_EPOCH: 50 # Save interval
|
130 |
+
LOG_EVERY_STEPS: 50
|
131 |
+
VAL_EVERY_STEPS: 50
|
132 |
+
TENSORBOARD: true
|
133 |
+
WANDB:
|
134 |
+
OFFLINE: false
|
135 |
+
PROJECT: null
|
136 |
+
RESUME_ID: null
|
137 |
+
RENDER:
|
138 |
+
JOINT_TYPE: mmm
|
139 |
+
INPUT_MODE: npy
|
140 |
+
DIR: ''
|
141 |
+
NPY: ''
|
142 |
+
DENOISING: true
|
143 |
+
OLDRENDER: true
|
144 |
+
RES: high
|
145 |
+
DOWNSAMPLE: true
|
146 |
+
FPS: 12.5
|
147 |
+
CANONICALIZE: true
|
148 |
+
EXACT_FRAME: 0.5
|
149 |
+
NUM: 7
|
150 |
+
MODE: sequence
|
151 |
+
VID_EXT: mp4
|
152 |
+
ALWAYS_ON_FLOOR: false
|
153 |
+
GT: false
|
154 |
+
DEMO:
|
155 |
+
MusicDir: /data2/lrh/dataset/fine_dance/origin/music
|
156 |
+
RENDER: false
|
157 |
+
EXAMPLE: null
|
158 |
+
use_cached_features: false
|
159 |
+
|
160 |
+
FINEDANCE:
|
161 |
+
mix: False # whether to apply mix data augmentation
|
162 |
+
full_seq_len: 256 # 150
|
163 |
+
windows: 8 # 16 #40 #
|
164 |
+
is_mirror: False # whether to apply mirror data augmentation
|
165 |
+
nfeats: 139
|
166 |
+
njoints: 22
|
167 |
+
mode: single # "single" , "double_react", "double"
|
168 |
+
partial: full # "full" , "morden", "tradition"
|
169 |
+
GENRE_NUM: 16
|