Delete train_config.json
Browse files- train_config.json +0 -59
train_config.json
DELETED
|
@@ -1,59 +0,0 @@
|
|
| 1 |
-
{
|
| 2 |
-
"dataset_type": "short_metaworld",
|
| 3 |
-
"data_root": "data/short-metaworld-vla",
|
| 4 |
-
"train_jsonl": "",
|
| 5 |
-
"val_jsonl": "",
|
| 6 |
-
"val_ratio": 0.15,
|
| 7 |
-
"vision_model_name": "google/siglip2-base-patch16-224",
|
| 8 |
-
"text_model_name": "google/siglip2-base-patch16-224",
|
| 9 |
-
"separate_backbones": false,
|
| 10 |
-
"image_size": 224,
|
| 11 |
-
"freeze_vision": true,
|
| 12 |
-
"freeze_text": true,
|
| 13 |
-
"unfreeze_vision_last_n_layers": 2,
|
| 14 |
-
"unfreeze_text_last_n_layers": 2,
|
| 15 |
-
"fusion_type": "cross_attn",
|
| 16 |
-
"proj_dim": 512,
|
| 17 |
-
"fusion_hidden_dim": 1024,
|
| 18 |
-
"fusion_out_dim": 512,
|
| 19 |
-
"fusion_num_layers": 3,
|
| 20 |
-
"fusion_num_heads": 8,
|
| 21 |
-
"fusion_dropout": 0.1,
|
| 22 |
-
"normalize_embeddings": true,
|
| 23 |
-
"action_head_type": "moe",
|
| 24 |
-
"action_mlp_hidden_dim": 256,
|
| 25 |
-
"action_mlp_layers": 2,
|
| 26 |
-
"action_mlp_dropout": 0.1,
|
| 27 |
-
"moe_num_experts": 4,
|
| 28 |
-
"moe_hidden_dim": 512,
|
| 29 |
-
"moe_load_balance_weight": 0.001,
|
| 30 |
-
"router_condition": "action_input",
|
| 31 |
-
"act_chunk_size": 8,
|
| 32 |
-
"act_hidden_dim": 512,
|
| 33 |
-
"act_num_layers": 2,
|
| 34 |
-
"act_dropout": 0.1,
|
| 35 |
-
"use_geometry_features": true,
|
| 36 |
-
"geometry_dim": 6,
|
| 37 |
-
"temporal_context": 4,
|
| 38 |
-
"action_dim": 4,
|
| 39 |
-
"num_workers": 8,
|
| 40 |
-
"normalize_action_targets": true,
|
| 41 |
-
"action_norm_eps": 1e-06,
|
| 42 |
-
"learnable_action_scale": true,
|
| 43 |
-
"action_scale_init": 1.0,
|
| 44 |
-
"loss_type": "huber",
|
| 45 |
-
"huber_delta": 0.5,
|
| 46 |
-
"epochs": 80,
|
| 47 |
-
"batch_size": 32,
|
| 48 |
-
"grad_accum_steps": 2,
|
| 49 |
-
"learning_rate": 5e-05,
|
| 50 |
-
"weight_decay": 0.01,
|
| 51 |
-
"grad_clip_norm": 1.0,
|
| 52 |
-
"use_fp16": true,
|
| 53 |
-
"early_stopping_patience": 8,
|
| 54 |
-
"early_stopping_min_delta": 0.0005,
|
| 55 |
-
"seed": 42,
|
| 56 |
-
"device": "cuda",
|
| 57 |
-
"out_dir": "checkpoints_stage2_moe_full_peg_only",
|
| 58 |
-
"save_best_by_val": true
|
| 59 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|