hywslxh committed on
Commit
540ee9b
·
verified ·
1 Parent(s): ae9d8b9

Update configs/kosmos_ph_calvin_abc.json

Browse files
Files changed (1) hide show
  1. configs/kosmos_ph_calvin_abc.json +16 -41
configs/kosmos_ph_calvin_abc.json CHANGED
@@ -6,16 +6,8 @@
6
  "model_url": "https://huggingface.co/microsoft/kosmos-2-patch14-224",
7
  "seq_len": 1,
8
  "image_size": 224,
9
- "image_mean": [
10
- 0.48145466,
11
- 0.4578275,
12
- 0.40821073
13
- ],
14
- "image_std": [
15
- 0.26862954,
16
- 0.26130258,
17
- 0.27577711
18
- ],
19
  "window_size": 16,
20
  "fwd_pred_next_n": 10,
21
  "arm_gripper_loss_ratio": 0.01,
@@ -26,8 +18,8 @@
26
  "num_workers": 16,
27
  "data_scale": 1,
28
  "optimizer": "adam",
29
- "learning_rate": 0.0001,
30
- "min_lr_scale": 0.01,
31
  "weight_decay": 0,
32
  "warmup_epochs": 0.25,
33
  "warmup_steps": 0,
@@ -40,16 +32,16 @@
40
  "use_vision_resampler": false,
41
  "vision_masked_ratio": 0.9,
42
  "use_tube_mask": false,
43
- "output_root": "checkpoints/kosmos/calvin_finetune",
44
- "log_root": "logs/kosmos/calvin_finetune",
45
- "cache_root": "cache/kosmos",
46
  "model_load_path": null,
47
  "model_load_source": "torch",
48
  "resume": null,
49
  "model_path": ".vlms/kosmos-2-patch14-224",
50
  "model_config": ".vlms/kosmos-2-patch14-224/config.json",
51
  "train_setup": {
52
- "precision": "16",
53
  "predict_action": true,
54
  "predict_forward": false,
55
  "predict_forward_hand": false,
@@ -64,7 +56,7 @@
64
  "mm_use_im_patch_token": false,
65
  "gradient_checkpointing": false,
66
  "lora_enable": false,
67
- "mm_projector_lr": 0.0001,
68
  "lora_r": 64,
69
  "lora_alpha": 16,
70
  "lora_dropout": 0.05,
@@ -99,13 +91,16 @@
99
  "max_text_len": 256,
100
  "additional_special_tokens": null
101
  },
 
 
 
 
 
102
  "trainer": {
103
  "accelerator": "gpu",
104
  "strategy": "deepspeed_stage_2",
105
  "precision": "16",
106
- "logger": [
107
- "tensorboard"
108
- ],
109
  "gradient_clip_val": 1.0,
110
  "use_distributed_sampler": false,
111
  "log_every_n_steps": 10,
@@ -130,25 +125,5 @@
130
  },
131
  "norm_action": true,
132
  "norm_min": -0.65,
133
- "norm_max": 0.65,
134
- "raw_config_path": "configs/kosmos/finetune_kosmos_cont-lstm-post_full-ft_text_vision_wd=0_hist=16_act=10_use-hand_aug-shift_act-norm_lr-1e-4_abc.json",
135
- "config": "configs/kosmos/finetune_kosmos_cont-lstm-post_full-ft_text_vision_wd=0_hist=16_act=10_use-hand_aug-shift_act-norm_lr-1e-4_abc.json",
136
- "gpus": 8,
137
- "num_nodes": 4,
138
- "log_dir": "logs/kosmos/calvin_finetune/2024-11-20/04-00",
139
- "output_dir": "checkpoints/kosmos/calvin_finetune/2024-11-20/04-00",
140
- "data_dir": null,
141
- "annotation_file": null,
142
- "data_subfolder": null,
143
- "task_num": null,
144
- "exp_name": "04-00",
145
- "use_multi_modal_emb": false,
146
- "no_video_pretrained_model": false,
147
- "finetune": false,
148
- "llm": {
149
- "type": null,
150
- "n_embd": null,
151
- "n_layer": null,
152
- "n_head": null
153
- }
154
  }
 
6
  "model_url": "https://huggingface.co/microsoft/kosmos-2-patch14-224",
7
  "seq_len": 1,
8
  "image_size": 224,
9
+ "image_mean": [0.48145466, 0.4578275, 0.40821073],
10
+ "image_std": [0.26862954, 0.26130258, 0.27577711],
 
 
 
 
 
 
 
 
11
  "window_size": 16,
12
  "fwd_pred_next_n": 10,
13
  "arm_gripper_loss_ratio": 0.01,
 
18
  "num_workers": 16,
19
  "data_scale": 1,
20
  "optimizer": "adam",
21
+ "learning_rate": 2e-5,
22
+ "min_lr_scale": 1e-2,
23
  "weight_decay": 0,
24
  "warmup_epochs": 0.25,
25
  "warmup_steps": 0,
 
32
  "use_vision_resampler": false,
33
  "vision_masked_ratio": 0.9,
34
  "use_tube_mask": false,
35
+ "output_root": "runs/checkpoints",
36
+ "log_root": "runs/logs",
37
+ "cache_root": "runs/cache",
38
  "model_load_path": null,
39
  "model_load_source": "torch",
40
  "resume": null,
41
  "model_path": ".vlms/kosmos-2-patch14-224",
42
  "model_config": ".vlms/kosmos-2-patch14-224/config.json",
43
  "train_setup": {
44
+ "precision": "bf16",
45
  "predict_action": true,
46
  "predict_forward": false,
47
  "predict_forward_hand": false,
 
56
  "mm_use_im_patch_token": false,
57
  "gradient_checkpointing": false,
58
  "lora_enable": false,
59
+ "mm_projector_lr": 1e-4,
60
  "lora_r": 64,
61
  "lora_alpha": 16,
62
  "lora_dropout": 0.05,
 
91
  "max_text_len": 256,
92
  "additional_special_tokens": null
93
  },
94
+ "vlm": {
95
+ "type": "AutoModelForVision2Seq",
96
+ "name": "kosmos",
97
+ "pretrained_model_name_or_path": ".vlms/kosmos-2-patch14-224"
98
+ },
99
  "trainer": {
100
  "accelerator": "gpu",
101
  "strategy": "deepspeed_stage_2",
102
  "precision": "16",
103
+ "logger": ["tensorboard"],
 
 
104
  "gradient_clip_val": 1.0,
105
  "use_distributed_sampler": false,
106
  "log_every_n_steps": 10,
 
125
  },
126
  "norm_action": true,
127
  "norm_min": -0.65,
128
+ "norm_max": 0.65
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
129
  }