camenduru
/

EMAGE

Model card Files Files and versions

EMAGE / configs /emage_test.yaml

camenduru's picture

thanks to H-Liu1997 ❤

bb82d2f verified about 2 years ago

history blame contribute delete

1.74 kB

	# Run-level switches, file locations and VAE settings.
	# NOTE(review): is_train is True although the `dataset` key further down is
	# beat_testonly and the paths point at test sequences — confirm this is intended.
	is_train: True
	ddp: False
	stat: ts
	root_path: ./
	out_path: ./outputs/audio2pose/
	project: s2g
	# data_path, test_ckpt and data_path_1 all live under ./EMAGE/.
	data_path: ./EMAGE/test_sequences/
	# NOTE(review): the e_path file name starts with "AESKConv" while e_name is
	# "VAESKConv" — confirm the checkpoint matches the named model.
	e_path: weights/AESKConv_240_100.bin
	eval_model: motion_representation
	e_name: VAESKConv
	test_ckpt: ./EMAGE/emage_240.bin
	data_path_1: ./EMAGE/
	vae_test_len: 32
	# Same value as pose_dims (330) in the motion config.
	vae_test_dim: 330
	# Same value as stride (20) in the motion config.
	vae_test_stride: 20
	# 240 also appears in the e_path and test_ckpt file names.
	vae_length: 240
	vae_codebook_size: 256
	# vae_grow has four entries, matching vae_layer: 4
	# (presumably one entry per layer — TODO confirm).
	vae_layer: 4
	vae_grow: [1,1,2,1]
	variational: False

	# data config
	# Only speaker 2 is selected; the trailing comment keeps the full 1..30 list
	# as a ready-made alternative value.
	training_speakers: [2] #[1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30]
	additional_data: False
	cache_path: ./datasets/beat_cache/beat_smplx_en_emage_test/
	dataset: beat_testonly
	# NOTE(review): presumably forces the cache under cache_path to be rebuilt —
	# verify against the dataset loader.
	new_cache: True

	# motion config
	ori_joints: beat_smplx_joints
	tar_joints: beat_smplx_full
	# The "_30" suffix matches pose_fps: 30 below; facial_rep uses the same value.
	pose_rep: smplxflame_30
	pose_norm: False
	pose_fps: 30
	rot6d: True
	pre_frames: 4
	# Same value as vae_test_dim (330).
	# NOTE(review): presumably 55 joints x 6 values with rot6d enabled — TODO confirm.
	pose_dims: 330
	# pose_length and test_length are both 64.
	pose_length: 64
	# Same value as vae_test_stride (20).
	stride: 20
	test_length: 64
	# motion_f, audio_f and word_f are all 256; facial_f and speaker_f are 0.
	motion_f: 256
	# No motion pre-encoder or encoder is configured (both null).
	m_pre_encoder: null
	m_encoder: null
	m_fix_pre: False

	# audio config
	audio_rep: onset+amplitude
	# audio_sr and audio_fps carry the same value (16000).
	audio_sr: 16000
	audio_fps: 16000
	audio_norm: False
	audio_f: 256
	# The three audio encoder keys below are commented out, unlike their
	# m_*/t_*/f_* counterparts in the other sections, so they are not set by this file.
	# a_pre_encoder: tcn_camn
	# a_encoder: none
	# a_fix_pre: False

	# text config
	word_rep: textgrid
	# NOTE(review): presumably the vocabulary size of the word index — TODO confirm.
	word_index_num: 11195
	word_dims: 300
	freeze_wordembed: False
	word_f: 256
	# Text is the only modality in this file with a non-null pre-encoder.
	t_pre_encoder: fasttext
	t_encoder: null
	t_fix_pre: False

	# facial config
	# Same representation name as pose_rep in the motion config.
	facial_rep: smplxflame_30
	facial_dims: 100
	facial_norm: False
	# facial_f is 0, whereas motion_f, audio_f and word_f are 256.
	facial_f: 0
	# No facial pre-encoder or encoder is configured (both null).
	f_pre_encoder: null
	f_encoder: null
	f_fix_pre: False

	# speaker config
	id_rep: onehot
	# speaker_f is 0, like facial_f.
	speaker_f: 0

	# model config
	batch_size: 64
	# The warmup keys are commented out, so this file sets no warmup values.
	# warmup_epochs: 1
	# warmup_lr: 1e-6
	lr_base: 5e-4
	# model and trainer both name "emage"; g_name names MAGE_Transformer.
	model: emage
	g_name: MAGE_Transformer
	trainer: emage
	hidden_size: 768
	n_layer: 1

	rec_weight: 1
	grad_norm: 0.99
	epochs: 400
	test_period: 20
	# Two parallel key groups with suffixes l/f/u/h: the l* keys are all 3, the
	# c* keys are 1 except cf, which is 0.
	# NOTE(review): the suffixes presumably stand for lower/face/upper/hands —
	# TODO confirm against the model code.
	ll: 3
	lf: 3
	lu: 3
	lh: 3
	cl: 1
	cf: 0
	cu: 1
	ch: 1