upload vlm

Files changed (10) hide show

.gitattributes CHANGED Viewed

@@ -33,3 +33,6 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+LIBERO_checkpoints filter=lfs diff=lfs merge=lfs -text
+Qwen2.5-VLM filter=lfs diff=lfs merge=lfs -text
+README.md filter=lfs diff=lfs merge=lfs -text

Qwen2.5-VLM/qwen25-dinosiglip-224px+0_5b+stage-finetune+x42/checkpoints/latest-checkpoint.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:dc63d956a7e9ee853b2ef74b812454bc71e011cbf65f98c79da5a29e9bf2a61b
+size 3992031074

Qwen2.5-VLM/qwen25-dinosiglip-224px+0_5b+stage-finetune+x42/config.yaml ADDED Viewed

+seed: 42
+hf_token: .hf_token
+run_root_dir: runs
+wandb_project: qwen-vlm
+wandb_entity: null
+model:
+  model_id: qwen25-dinosiglip-224px+0_5b
+  pretrained_checkpoint: null
+  llm_backbone_id: qwen25-0_5b
+  inference_mode: false
+  vision_backbone_id: dinosiglip-vit-so-224px
+  image_resize_strategy: resize-naive
+  default_image_size: 224
+  image_sequence_len: 1
+training:
+  stage: finetune
+  epochs: 2
+  max_steps: null
+  global_batch_size: 32
+  per_device_batch_size: 4
+  learning_rate: 2.0e-05
+  weight_decay: 0.1
+  max_grad_norm: 1.0
+  lr_scheduler_type: linear-warmup+cosine-decay
+  warmup_ratio: 0.03
+  enable_gradient_checkpointing: true
+  enable_mixed_precision_training: true
+  reduce_in_full_precision: false
+  sharding_strategy: full-shard
+dataset:
+  dataset_id: llava-v15
+  dataset_root_dir: dataset/
+  finetune_stage_components:
+  - llava-v1.5-instruct/llava_v1_5_mix665k.json
+  - llava-v1.5-instruct/
+run_id: qwen25-dinosiglip-224px+0_5b+stage-finetune+x42

Qwen2.5-VLM/qwen25-dinosiglip-224px+1_5b+stage-finetune+x42/checkpoints/latest-checkpoint.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:c133f7c5ed5e21469f33dbcb885cdf4533d71f7609cdc4ddab82e3bbe4c28319
+size 8590225842

Qwen2.5-VLM/qwen25-dinosiglip-224px+1_5b+stage-finetune+x42/config.yaml ADDED Viewed

+seed: 42
+hf_token: .hf_token
+run_root_dir: runs
+wandb_project: qwen-vlm
+wandb_entity: null
+model:
+  model_id: qwen25-dinosiglip-224px+1_5b
+  pretrained_checkpoint: null
+  llm_backbone_id: qwen25-1_5b
+  inference_mode: false
+  vision_backbone_id: dinosiglip-vit-so-224px
+  image_resize_strategy: resize-naive
+  default_image_size: 224
+  image_sequence_len: 1
+training:
+  stage: finetune
+  epochs: 2
+  max_steps: null
+  global_batch_size: 32
+  per_device_batch_size: 4
+  learning_rate: 2.0e-05
+  weight_decay: 0.1
+  max_grad_norm: 1.0
+  lr_scheduler_type: linear-warmup+cosine-decay
+  warmup_ratio: 0.03
+  enable_gradient_checkpointing: true
+  enable_mixed_precision_training: true
+  reduce_in_full_precision: false
+  sharding_strategy: full-shard
+dataset:
+  dataset_id: llava-v15
+  dataset_root_dir: dataset/
+  finetune_stage_components:
+  - llava-v1.5-instruct/llava_v1_5_mix665k.json
+  - llava-v1.5-instruct/
+run_id: qwen25-dinosiglip-224px+1_5b+stage-finetune+x42

Qwen2.5-VLM/qwen25-dinosiglip-224px+3b+stage-finetune+x42/checkpoints/latest-checkpoint.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:c29bf8a3f68153dda1289c52f1a3f556e34cb5278f1a3e58645e766534edb70b
+size 15081086078

Qwen2.5-VLM/qwen25-dinosiglip-224px+3b+stage-finetune+x42/config.yaml ADDED Viewed

+seed: 42
+hf_token: .hf_token
+run_root_dir: runs
+wandb_project: qwen-vlm
+wandb_entity: null
+model:
+  model_id: qwen25-dinosiglip-224px+3b
+  pretrained_checkpoint: null
+  llm_backbone_id: qwen25-3b
+  inference_mode: false
+  vision_backbone_id: dinosiglip-vit-so-224px
+  image_resize_strategy: resize-naive
+  default_image_size: 224
+  image_sequence_len: 1
+training:
+  stage: finetune
+  epochs: 2
+  max_steps: null
+  global_batch_size: 32
+  per_device_batch_size: 4
+  learning_rate: 2.0e-05
+  weight_decay: 0.1
+  max_grad_norm: 1.0
+  lr_scheduler_type: linear-warmup+cosine-decay
+  warmup_ratio: 0.03
+  enable_gradient_checkpointing: true
+  enable_mixed_precision_training: true
+  reduce_in_full_precision: false
+  sharding_strategy: full-shard
+dataset:
+  dataset_id: llava-v15
+  dataset_root_dir: dataset/
+  finetune_stage_components:
+  - llava-v1.5-instruct/llava_v1_5_mix665k.json
+  - llava-v1.5-instruct/
+run_id: qwen25-dinosiglip-224px+3b+stage-finetune+x42

Qwen2.5-VLM/qwen25-dinosiglip-224px+7b+stage-finetune+x42/checkpoints/latest-checkpoint.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:6d5bcd68dc1fab956f576ce260a26dad67a662c51639553828a910a975a5925b
+size 31996269478

Qwen2.5-VLM/qwen25-dinosiglip-224px+7b+stage-finetune+x42/config.yaml ADDED Viewed

+seed: 42
+hf_token: .hf_token
+run_root_dir: runs
+wandb_project: qwen-vlm
+wandb_entity: null
+model:
+  model_id: qwen25-dinosiglip-224px+7b
+  pretrained_checkpoint: null
+  llm_backbone_id: qwen25-7b
+  inference_mode: false
+  vision_backbone_id: dinosiglip-vit-so-224px
+  image_resize_strategy: resize-naive
+  default_image_size: 224
+  image_sequence_len: 1
+training:
+  stage: finetune
+  epochs: 2
+  max_steps: null
+  global_batch_size: 32
+  per_device_batch_size: 4
+  learning_rate: 2.0e-05
+  weight_decay: 0.1
+  max_grad_norm: 1.0
+  lr_scheduler_type: linear-warmup+cosine-decay
+  warmup_ratio: 0.03
+  enable_gradient_checkpointing: true
+  enable_mixed_precision_training: true
+  reduce_in_full_precision: false
+  sharding_strategy: full-shard
+dataset:
+  dataset_id: llava-v15
+  dataset_root_dir: dataset/
+  finetune_stage_components:
+  - llava-v1.5-instruct/llava_v1_5_mix665k.json
+  - llava-v1.5-instruct/
+run_id: qwen25-dinosiglip-224px+7b+stage-finetune+x42

README.md CHANGED Viewed

@@ -1,3 +1,3 @@
----
-license: mit
----

+version https://git-lfs.github.com/spec/v1
+oid sha256:d8d7a46d41a1a37fe4f0a5f637bf55c649310185329127d8a2204632e480be17
+size 24