File size: 3,126 Bytes
09154c8 | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 | {
"allow_non_vq_stats": false,
"amp": true,
"amp_dtype": "bf16",
"batch_size": 64,
"best_checkpoint_limit": 3,
"betas": [
0.9,
0.95
],
"clean_loss_weight": 0.0,
"clip_path": "checkpoints/clip/ViT-B-32.pt",
"clip_version": "ViT-B/32",
"code_ce_gamma": 2.0,
"code_ce_normalize": true,
"code_ce_t_max": 0.9,
"code_ce_t_min": 0.35,
"code_dim": 128,
"cond_drop_prob": 0.1,
"coupling_mode": "frame_grouped",
"data_root": "dataset/HumanML3D",
"dataset_name": "t2m",
"dataset_opt_path": "",
"decode_mode": "nearest",
"denoiser_p_mean": -1.5,
"denoiser_p_std": 0.8,
"depth_double": 6,
"depth_single": 12,
"disable_full_eval_ema": false,
"disable_grad_health_check": false,
"disable_self_condition": true,
"disable_vq_contract_check": false,
"dropout": 0.05,
"eta_min_ratio": 0.01,
"flow_loss_weight": 1.0,
"full_eval_batch_size": 32,
"full_eval_cond_scale": 6.0,
"full_eval_every_epoch": 10,
"full_eval_num_workers": 4,
"full_eval_repeat_times": 1,
"full_eval_seed": 42,
"full_eval_start_epoch": 0,
"full_eval_steps": 96,
"gamma": 0.5,
"geometry_severe_quantile": 0.75,
"gpu_id": -1,
"grad_clip": 1.0,
"grad_health_check_steps": 20,
"grad_health_min_abs": 0.0,
"hidden_size": 1152,
"holder_depth": 2,
"holder_mlp_ratio": 4.0,
"iters_per_epoch": 383,
"kv_root": ".",
"latent_norm_eps": 1e-06,
"latent_norm_mode": "codebook",
"latent_offset": 0.0,
"log_every": 50,
"lr": 0.0001,
"lr_scheduler": "half_cosine",
"max_epoch": 600,
"max_steps": 0,
"mean_path": "stats/mean.npy",
"milestone_unit": "auto",
"milestones": [
0.8,
0.9,
0.95
],
"mlp_ratio": 4.0,
"motion_length": 196,
"name": "codeflow_hml3d_best_top3_release",
"noise_scale": 1.0,
"num_codes": 128,
"num_heads": 12,
"num_parts": 6,
"num_workers": 4,
"output_dir": "checkpoints/t2m/codeflow_hml3d_best_top3_release",
"part_hidden_dim": 192,
"reachable_milestones": [],
"release_source_run": "codeflow_part_structured_newvqtop3_w150_p192_h1152_d6s12_drop005_w0_b64_lr1e4_e600_eval10from0_seed42_test_h200_blossom_g1_20260601",
"representation": "part_structured",
"resolved_milestone_epochs": [],
"resolved_milestones": [],
"resume": "checkpoints/t2m/codeflow_part_structured_newvqtop3_w150_p192_h1152_d6s12_drop005_w0_b64_lr1e4_e600_eval10from0_seed42_test_h200_blossom_g1_20260601/model/latest.pt",
"sampling_method": "ode",
"sampling_schedule": "uniform",
"save_every": 0,
"sde_gamma": 0.0,
"seed": 42,
"self_cond_prob": 0.5,
"std_path": "stats/std.npy",
"terminal_loss_weight": 0.0,
"terminal_mode": "tied_logits",
"terminal_tau": 1.0,
"terminal_tau_floor": 1e-06,
"terminal_tau_mode": "codebook_nn",
"time_patch": 1,
"time_schedule": "uniform",
"total_train_steps": 229800,
"unit_length": 4,
"vq_backend": "kv_part",
"vq_checkpoint": "rvq/part_vq_hml3d_overlap_best_top3.pth",
"vq_contract_samples": 2,
"vq_opt_path": "",
"vq_partition": "rvq/skeleton_partition.json",
"warmup_epochs": 5.221932114882507,
"warmup_steps": 2000,
"weight_decay": 0.01
}
|