| name: synth-u_text2motion | |
| description: '' | |
| seed: 1 | |
| device: cuda:0 | |
| train: | |
| stages: | |
| - name: pretrain | |
| epochs: 200 | |
| lr: 0.001 | |
| use_condition: false | |
| freeze_modules: [] | |
| early_stopping_patience: 50 | |
| - name: finetune | |
| epochs: 500 | |
| lr: 0.001 | |
| use_condition: true | |
| freeze_modules: [] | |
| load_from_stage: pretrain | |
| early_stopping_patience: 50 | |
| epochs: 700 | |
| batch_size: 256 | |
| lr: 0.001 | |
| weight_decay: 0.0001 | |
| scheduler: cosine | |
| scheduler_params: {} | |
| early_stopping_patience: 5 | |
| gradient_clip_val: 1.0 | |
| accumulate_grad_batches: 1 | |
| val_check_interval: 1.0 | |
| num_workers: 4 | |
| pin_memory: true | |
| limit_train_batches: 1.0 | |
| limit_val_batches: 1.0 | |
| limit_test_batches: 1.0 | |
| num_sanity_val_steps: 2 | |
| data: | |
| name: synth-u | |
| data_folder: __DATA_ROOT__/datasets/synth-u | |
| n_var: 1 | |
| seq_length: 128 | |
| normalize: false | |
| train_split: 0.8 | |
| val_split: 0.1 | |
| model: | |
| name: text2motion | |
| channels: 64 | |
| layers: 3 | |
| nheads: 8 | |
| dropout: 0.1 | |
| unit_length: 4 | |
| dim_movement_latent: 512 | |
| dim_movement_enc_hidden: 512 | |
| dim_movement_dec_hidden: 512 | |
| text_latent_dim: 1024 | |
| dim_att_vec: 512 | |
| dim_z: 128 | |
| n_layers_pri: 1 | |
| n_layers_pos: 1 | |
| n_layers_dec: 1 | |
| dim_pri_hidden: 1024 | |
| dim_pos_hidden: 1024 | |
| dim_dec_hidden: 1024 | |
| lambda_rec_ts: 1.0 | |
| lambda_rec_mov: 1.0 | |
| lambda_kld: 0.01 | |
| teacher_forcing_ratio: 0.9 | |
| detach_movement_latents: true | |
| condition: | |
| text: | |
| enabled: true | |
| input_dim: 1024 | |
| embedding_key: cap_emb | |
| dropout: 0.0 | |
| cfg_scale: 1.0 | |
| attribute: | |
| enabled: false | |
| continuous_dim: 0 | |
| discrete_configs: [] | |
| output_dim: 128 | |
| dropout: 0.0 | |
| label: | |
| enabled: false | |
| num_classes: 10 | |
| output_dim: 64 | |
| fusion: concat | |
| condition_dropout: 0.0 | |
| eval: | |
| n_samples: 10 | |
| metrics: | |
| - dtw | |
| - wape | |
| - ed | |
| - crps | |
| - acd | |
| - sd | |
| - kd | |
| - mdd | |
| - fid | |
| - sfd | |
| - jftsd | |
| - prdc_f1 | |
| - joint_prdc_f1 | |
| - cttp | |
| - disc_auc | |
| batch_size: 128 | |
| save_samples: true | |
| sampler: ddim | |
| display_interval: 10 | |
| clip_config_path: __RELEASE_ROOT__/resources/cttp/synth-u/model_configs.yaml | |
| clip_model_path: __RELEASE_ROOT__/resources/cttp/synth-u/clip_model_best.pth | |
| cache_folder: __CACHE_ROOT__/text2motion/synth-u/seed1 | |
| use_longalign: false | |
| reference_split: train | |
| disc_auc: | |
| k_folds: 5 | |
| epochs: 5 | |
| batch_size: 128 | |
| lr: 0.001 | |
| weight_decay: 0.0001 | |
| hidden_channels: 128 | |
| num_layers: 3 | |
| dropout: 0.1 | |
| seed: 42 | |
| num_workers: 0 | |
| prdc: | |
| k: 5 | |
| max_samples: 5000 | |
| seed: 0 | |
| metric: euclidean | |
| backend: auto | |
| knn_chunk_size: 4096 | |
| joint_enable: true | |
| joint_weights: | |
| ts: 1.0 | |
| text: 1.0 | |
| joint_normalize: standard | |
| segment_classifier: | |
| enable: false | |
| segment_len: 128 | |
| n_segments: 3 | |
| seed: 42 | |
| acd_max_lag: 50 | |
| mdd_bins: 32 | |
| use_cache: false | |
| cache_file: predictions_cache.pkl | |
| output_dir: '' | |
| created_at: '2025-12-22T21:35:41.926282' | |