Tr0612 committed on
Commit
889a15d
·
verified ·
1 Parent(s): dcbc5a2

Delete train_config.json

Browse files
Files changed (1) hide show
  1. train_config.json +0 -59
train_config.json DELETED
@@ -1,59 +0,0 @@
1
- {
2
- "dataset_type": "short_metaworld",
3
- "data_root": "data/short-metaworld-vla",
4
- "train_jsonl": "",
5
- "val_jsonl": "",
6
- "val_ratio": 0.15,
7
- "vision_model_name": "google/siglip2-base-patch16-224",
8
- "text_model_name": "google/siglip2-base-patch16-224",
9
- "separate_backbones": false,
10
- "image_size": 224,
11
- "freeze_vision": true,
12
- "freeze_text": true,
13
- "unfreeze_vision_last_n_layers": 2,
14
- "unfreeze_text_last_n_layers": 2,
15
- "fusion_type": "cross_attn",
16
- "proj_dim": 512,
17
- "fusion_hidden_dim": 1024,
18
- "fusion_out_dim": 512,
19
- "fusion_num_layers": 3,
20
- "fusion_num_heads": 8,
21
- "fusion_dropout": 0.1,
22
- "normalize_embeddings": true,
23
- "action_head_type": "moe",
24
- "action_mlp_hidden_dim": 256,
25
- "action_mlp_layers": 2,
26
- "action_mlp_dropout": 0.1,
27
- "moe_num_experts": 4,
28
- "moe_hidden_dim": 512,
29
- "moe_load_balance_weight": 0.001,
30
- "router_condition": "action_input",
31
- "act_chunk_size": 8,
32
- "act_hidden_dim": 512,
33
- "act_num_layers": 2,
34
- "act_dropout": 0.1,
35
- "use_geometry_features": true,
36
- "geometry_dim": 6,
37
- "temporal_context": 4,
38
- "action_dim": 4,
39
- "num_workers": 8,
40
- "normalize_action_targets": true,
41
- "action_norm_eps": 1e-06,
42
- "learnable_action_scale": true,
43
- "action_scale_init": 1.0,
44
- "loss_type": "huber",
45
- "huber_delta": 0.5,
46
- "epochs": 80,
47
- "batch_size": 32,
48
- "grad_accum_steps": 2,
49
- "learning_rate": 5e-05,
50
- "weight_decay": 0.01,
51
- "grad_clip_norm": 1.0,
52
- "use_fp16": true,
53
- "early_stopping_patience": 8,
54
- "early_stopping_min_delta": 0.0005,
55
- "seed": 42,
56
- "device": "cuda",
57
- "out_dir": "checkpoints_stage2_moe_full_peg_only",
58
- "save_best_by_val": true
59
- }