| is_train: True |
| ddp: False |
| stat: ts |
| root_path: ./ |
| out_path: ./outputs/audio2pose/ |
| project: s2g |
| data_path: ./EMAGE/test_sequences/ |
| e_path: weights/AESKConv_240_100.bin |
| eval_model: motion_representation |
| e_name: VAESKConv |
| test_ckpt: ./EMAGE/emage_240.bin |
| data_path_1: ./EMAGE/ |
| vae_test_len: 32 |
| vae_test_dim: 330 |
| vae_test_stride: 20 |
| vae_length: 240 |
| vae_codebook_size: 256 |
| vae_layer: 4 |
| vae_grow: [1,1,2,1] |
| variational: False |
|
|
| |
| training_speakers: [2] |
| additional_data: False |
| cache_path: ./datasets/beat_cache/beat_smplx_en_emage_test/ |
| dataset: beat_testonly |
| new_cache: True |
|
|
| |
| ori_joints: beat_smplx_joints |
| tar_joints: beat_smplx_full |
| pose_rep: smplxflame_30 |
| pose_norm: False |
| pose_fps: 30 |
| rot6d: True |
| pre_frames: 4 |
| pose_dims: 330 |
| pose_length: 64 |
| stride: 20 |
| test_length: 64 |
| motion_f: 256 |
| m_pre_encoder: null |
| m_encoder: null |
| m_fix_pre: False |
|
|
| |
| audio_rep: onset+amplitude |
| audio_sr: 16000 |
| audio_fps: 16000 |
| audio_norm: False |
| audio_f: 256 |
| |
| |
| |
|
|
| |
| word_rep: textgrid |
| word_index_num: 11195 |
| word_dims: 300 |
| freeze_wordembed: False |
| word_f: 256 |
| t_pre_encoder: fasttext |
| t_encoder: null |
| t_fix_pre: False |
|
|
| |
| facial_rep: smplxflame_30 |
| facial_dims: 100 |
| facial_norm: False |
| facial_f: 0 |
| f_pre_encoder: null |
| f_encoder: null |
| f_fix_pre: False |
|
|
| |
| id_rep: onehot |
| speaker_f: 0 |
|
|
| |
| batch_size: 64 |
| |
| |
| lr_base: 5e-4 |
| model: emage |
| g_name: MAGE_Transformer |
| trainer: emage |
| hidden_size: 768 |
| n_layer: 1 |
| |
| rec_weight: 1 |
| grad_norm: 0.99 |
| epochs: 400 |
| test_period: 20 |
| ll: 3 |
| lf: 3 |
| lu: 3 |
| lh: 3 |
| cl: 1 |
| cf: 0 |
| cu: 1 |
| ch: 1 |
|
|