|
is_train: True |
|
ddp: False |
|
stat: ts |
|
root_path: ./ |
|
out_path: ./outputs/audio2pose/ |
|
project: s2g |
|
data_path: ./EMAGE/test_sequences/ |
|
e_path: weights/AESKConv_240_100.bin |
|
eval_model: motion_representation |
|
e_name: VAESKConv |
|
test_ckpt: ./EMAGE/emage_audio_175.bin |
|
data_path_1: ./EMAGE/ |
|
vae_test_len: 32 |
|
vae_test_dim: 330 |
|
vae_test_stride: 20 |
|
vae_length: 240 |
|
vae_codebook_size: 256 |
|
vae_layer: 4 |
|
vae_grow: [1,1,2,1] |
|
variational: False |
|
|
|
|
|
training_speakers: [2] |
|
additional_data: False |
|
cache_path: ./datasets/beat_cache/beat_smplx_en_emage_test/ |
|
dataset: beat_testonly_hf |
|
new_cache: True |
|
|
|
|
|
ori_joints: beat_smplx_joints |
|
tar_joints: beat_smplx_full |
|
pose_rep: smplxflame_30 |
|
pose_norm: False |
|
pose_fps: 30 |
|
rot6d: True |
|
pre_frames: 4 |
|
pose_dims: 330 |
|
pose_length: 64 |
|
stride: 20 |
|
test_length: 64 |
|
motion_f: 256 |
|
m_pre_encoder: null |
|
m_encoder: null |
|
m_fix_pre: False |
|
|
|
|
|
audio_rep: wave16k |
|
audio_sr: 16000 |
|
audio_fps: 16000 |
|
audio_norm: False |
|
audio_f: 256 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
facial_rep: smplxflame_30 |
|
facial_dims: 100 |
|
facial_norm: False |
|
facial_f: 0 |
|
f_pre_encoder: null |
|
f_encoder: null |
|
f_fix_pre: False |
|
|
|
|
|
id_rep: onehot |
|
speaker_f: 0 |
|
|
|
|
|
batch_size: 64 |
|
|
|
|
|
lr_base: 5e-4 |
|
model: emage_audio |
|
g_name: MAGE_Transformer |
|
trainer: emage |
|
hidden_size: 768 |
|
n_layer: 1 |
|
|
|
rec_weight: 1 |
|
grad_norm: 0.99 |
|
epochs: 400 |
|
test_period: 20 |
|
ll: 3 |
|
lf: 3 |
|
lu: 3 |
|
lh: 3 |
|
cl: 1 |
|
cf: 0 |
|
cu: 1 |
|
ch: 1 |
|
|