hywslxh committed on
Commit
ae9d8b9
·
verified ·
1 Parent(s): ce462d5

Update configs/kosmos_ph_calvin_abcd.json

Browse files
Files changed (1) hide show
  1. configs/kosmos_ph_calvin_abcd.json +21 -47
configs/kosmos_ph_calvin_abcd.json CHANGED
@@ -6,16 +6,8 @@
6
  "model_url": "https://huggingface.co/microsoft/kosmos-2-patch14-224",
7
  "seq_len": 1,
8
  "image_size": 224,
9
- "image_mean": [
10
- 0.48145466,
11
- 0.4578275,
12
- 0.40821073
13
- ],
14
- "image_std": [
15
- 0.26862954,
16
- 0.26130258,
17
- 0.27577711
18
- ],
19
  "window_size": 16,
20
  "fwd_pred_next_n": 10,
21
  "arm_gripper_loss_ratio": 0.01,
@@ -26,8 +18,8 @@
26
  "num_workers": 16,
27
  "data_scale": 1,
28
  "optimizer": "adam",
29
- "learning_rate": 0.0001,
30
- "min_lr_scale": 0.01,
31
  "weight_decay": 0,
32
  "warmup_epochs": 0.25,
33
  "warmup_steps": 0,
@@ -40,16 +32,16 @@
40
  "use_vision_resampler": false,
41
  "vision_masked_ratio": 0.9,
42
  "use_tube_mask": false,
43
- "output_root": "checkpoints/kosmos/calvin_finetune",
44
- "log_root": "logs/kosmos/calvin_finetune",
45
- "cache_root": "cache/kosmos",
46
  "model_load_path": null,
47
  "model_load_source": "torch",
48
  "resume": null,
49
- "model_path": "/mnt/bn/robotics-data-lxh-lq/LLaVA/kosmos-2-patch14-224",
50
- "model_config": "/mnt/bn/robotics-data-lxh-lq/LLaVA/kosmos-2-patch14-224/config.json",
51
  "train_setup": {
52
- "precision": "16",
53
  "predict_action": true,
54
  "predict_forward": false,
55
  "predict_forward_hand": false,
@@ -64,7 +56,7 @@
64
  "mm_use_im_patch_token": false,
65
  "gradient_checkpointing": false,
66
  "lora_enable": false,
67
- "mm_projector_lr": 0.0001,
68
  "lora_r": 64,
69
  "lora_alpha": 16,
70
  "lora_dropout": 0.05,
@@ -94,18 +86,21 @@
94
  "fwd_head": null,
95
  "tokenizer": {
96
  "type": "AutoProcessor",
97
- "pretrained_model_name_or_path": "/mnt/bn/robotics-data-lxh-lq/LLaVA/kosmos-2-patch14-224",
98
  "tokenizer_type": "kosmos",
99
  "max_text_len": 256,
100
  "additional_special_tokens": null
101
  },
 
 
 
 
 
102
  "trainer": {
103
  "accelerator": "gpu",
104
  "strategy": "deepspeed_stage_2",
105
  "precision": "16",
106
- "logger": [
107
- "tensorboard"
108
- ],
109
  "gradient_clip_val": 1.0,
110
  "use_distributed_sampler": false,
111
  "log_every_n_steps": 10,
@@ -117,7 +112,7 @@
117
  },
118
  "train_dataset": {
119
  "type": "DiskCalvinDataset",
120
- "data_dir": "/mnt/bn/robotics/manipulation_data/calvin_data/task_ABCD_D/training",
121
  "shift_first": false,
122
  "model_name": "kosmos",
123
  "rgb_pad": 10,
@@ -125,31 +120,10 @@
125
  },
126
  "val_dataset": {
127
  "type": "DiskCalvinDataset",
128
- "data_dir": "/mnt/bn/robotics/manipulation_data/calvin_data/task_ABCD_D/validation",
129
  "model_name": "kosmos"
130
  },
131
  "norm_action": true,
132
  "norm_min": -0.65,
133
- "norm_max": 0.65,
134
- "scheduler": "cosine",
135
- "raw_config_path": "configs/kosmos/finetune_kosmos_cont-lstm-post_full-ft_text_vision_wd=0_hist=16_act=10_use-hand_aug-shift_act-norm_lr-1e-4.json",
136
- "config": "configs/kosmos/finetune_kosmos_cont-lstm-post_full-ft_text_vision_wd=0_hist=16_act=10_use-hand_aug-shift_act-norm_lr-1e-4.json",
137
- "gpus": 8,
138
- "num_nodes": 4,
139
- "log_dir": "logs/kosmos/calvin_finetune/2024-11-20/04-00",
140
- "output_dir": "checkpoints/kosmos/calvin_finetune/2024-11-20/04-00",
141
- "data_dir": null,
142
- "annotation_file": null,
143
- "data_subfolder": null,
144
- "task_num": null,
145
- "exp_name": "17-54",
146
- "use_multi_modal_emb": false,
147
- "no_video_pretrained_model": false,
148
- "finetune": false,
149
- "llm": {
150
- "type": null,
151
- "n_embd": null,
152
- "n_layer": null,
153
- "n_head": null
154
- }
155
  }
 
6
  "model_url": "https://huggingface.co/microsoft/kosmos-2-patch14-224",
7
  "seq_len": 1,
8
  "image_size": 224,
9
+ "image_mean": [0.48145466, 0.4578275, 0.40821073],
10
+ "image_std": [0.26862954, 0.26130258, 0.27577711],
 
 
 
 
 
 
 
 
11
  "window_size": 16,
12
  "fwd_pred_next_n": 10,
13
  "arm_gripper_loss_ratio": 0.01,
 
18
  "num_workers": 16,
19
  "data_scale": 1,
20
  "optimizer": "adam",
21
+ "learning_rate": 2e-5,
22
+ "min_lr_scale": 1e-2,
23
  "weight_decay": 0,
24
  "warmup_epochs": 0.25,
25
  "warmup_steps": 0,
 
32
  "use_vision_resampler": false,
33
  "vision_masked_ratio": 0.9,
34
  "use_tube_mask": false,
35
+ "output_root": "runs/checkpoints",
36
+ "log_root": "runs/logs",
37
+ "cache_root": "runs/cache",
38
  "model_load_path": null,
39
  "model_load_source": "torch",
40
  "resume": null,
41
+ "model_path": ".vlms/kosmos-2-patch14-224",
42
+ "model_config": ".vlms/kosmos-2-patch14-224/config.json",
43
  "train_setup": {
44
+ "precision": "bf16",
45
  "predict_action": true,
46
  "predict_forward": false,
47
  "predict_forward_hand": false,
 
56
  "mm_use_im_patch_token": false,
57
  "gradient_checkpointing": false,
58
  "lora_enable": false,
59
+ "mm_projector_lr": 1e-4,
60
  "lora_r": 64,
61
  "lora_alpha": 16,
62
  "lora_dropout": 0.05,
 
86
  "fwd_head": null,
87
  "tokenizer": {
88
  "type": "AutoProcessor",
89
+ "pretrained_model_name_or_path": ".vlms/kosmos-2-patch14-224",
90
  "tokenizer_type": "kosmos",
91
  "max_text_len": 256,
92
  "additional_special_tokens": null
93
  },
94
+ "vlm": {
95
+ "type": "AutoModelForVision2Seq",
96
+ "name": "kosmos",
97
+ "pretrained_model_name_or_path": ".vlms/kosmos-2-patch14-224"
98
+ },
99
  "trainer": {
100
  "accelerator": "gpu",
101
  "strategy": "deepspeed_stage_2",
102
  "precision": "16",
103
+ "logger": ["tensorboard"],
 
 
104
  "gradient_clip_val": 1.0,
105
  "use_distributed_sampler": false,
106
  "log_every_n_steps": 10,
 
112
  },
113
  "train_dataset": {
114
  "type": "DiskCalvinDataset",
115
+ "data_dir": "datasets/calvin_data/task_ABCD_D/training",
116
  "shift_first": false,
117
  "model_name": "kosmos",
118
  "rgb_pad": 10,
 
120
  },
121
  "val_dataset": {
122
  "type": "DiskCalvinDataset",
123
+ "data_dir": "datasets/calvin_data/task_ABCD_D/validation",
124
  "model_name": "kosmos"
125
  },
126
  "norm_action": true,
127
  "norm_min": -0.65,
128
+ "norm_max": 0.65
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
129
  }