End of training

Files changed (7) hide show

README.md CHANGED Viewed

@@ -3,7 +3,9 @@ library_name: peft
 license: apache-2.0
 base_model: HuggingFaceTB/SmolVLM-Base
 tags:
-- generated_from_trainer
 model-index:
 - name: SmolVLM-Base-vqav2
   results: []
@@ -14,7 +16,7 @@ should probably proofread and complete it, then remove this comment. -->
 # SmolVLM-Base-vqav2
-This model is a fine-tuned version of [HuggingFaceTB/SmolVLM-Base](https://huggingface.co/HuggingFaceTB/SmolVLM-Base) on an unknown dataset.
 ## Model description
@@ -44,14 +46,10 @@ The following hyperparameters were used during training:
 - lr_scheduler_warmup_steps: 50
 - num_epochs: 1
-### Training results
 ### Framework versions
-- PEFT 0.15.2
-- Transformers 4.53.0
 - Pytorch 2.7.1+cu126
 - Datasets 3.6.0
 - Tokenizers 0.21.2

 license: apache-2.0
 base_model: HuggingFaceTB/SmolVLM-Base
 tags:
+- base_model:adapter:HuggingFaceTB/SmolVLM-Base
+- lora
+- transformers
 model-index:
 - name: SmolVLM-Base-vqav2
   results: []
 # SmolVLM-Base-vqav2
+This model is a fine-tuned version of [HuggingFaceTB/SmolVLM-Base](https://huggingface.co/HuggingFaceTB/SmolVLM-Base) on an unspecified dataset.
 ## Model description
 - lr_scheduler_warmup_steps: 50
 - num_epochs: 1
 ### Framework versions
+- PEFT 0.16.0
+- Transformers 4.52.4
 - Pytorch 2.7.1+cu126
 - Datasets 3.6.0
 - Tokenizers 0.21.2

adapter_config.json CHANGED Viewed

@@ -23,20 +23,22 @@
   "megatron_core": "megatron.core",
   "modules_to_save": null,
   "peft_type": "LORA",
   "r": 8,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
     "gate_proj",
-    "q_proj",
-    "down_proj",
     "o_proj",
-    "up_proj",
     "k_proj",
-    "v_proj"
   ],
   "task_type": null,
   "trainable_token_indices": null,
   "use_dora": false,
   "use_rslora": false
 }

   "megatron_core": "megatron.core",
   "modules_to_save": null,
   "peft_type": "LORA",
+  "qalora_group_size": 16,
   "r": 8,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
+    "up_proj",
     "gate_proj",
     "o_proj",
+    "v_proj",
+    "q_proj",
     "k_proj",
+    "down_proj"
   ],
   "task_type": null,
   "trainable_token_indices": null,
   "use_dora": false,
+  "use_qalora": false,
   "use_rslora": false
 }

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:78522da1225fcb0f5455517b8aee0ea48e9b45a3c79ba1727d22488c7f2c5b48
 size 42220792

 version https://git-lfs.github.com/spec/v1
+oid sha256:36627d7ba4ce2125f6cf4aca91d7bd29e52b97beeaebd4c97725c8f53600200b
 size 42220792

runs/Jul04_02-21-12_MemeMachina9000/events.out.tfevents.1751592907.MemeMachina9000.2903879.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:4fa0542c4cbd7c60980c6ca7ca333fbcbb3046292334e977fafa522414822bf1
+size 315

runs/Jul06_00-42-30_MemeMachina9000/events.out.tfevents.1751758957.MemeMachina9000.3841747.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:0a28fe16fc1c01f57f382f602a3db3d052bc8588011403e3d29105072479f294
+size 17388

runs/Jul06_00-46-56_MemeMachina9000/events.out.tfevents.1751759346.MemeMachina9000.3848260.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:c33ec6bccb9afd028e99218e1b99256a8779828192b827ee6c7a426de762df3b
+size 9707

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:835f8226843f7aebbb86873b02b70afd4132ea6b79da0a3da5609514e1e49326
-size 5777

 version https://git-lfs.github.com/spec/v1
+oid sha256:9ee841cc72d15e2bf88bdc9082d59e07c2b0214fa7693264ee646642c7252dc6
+size 5713