Upload 8 files

Files changed (7) hide show

README.md CHANGED Viewed

@@ -1,6 +1,6 @@
 ---
-library_name: transformers
-tags: []
 ---
 # Model Card for Model ID
@@ -15,7 +15,7 @@ tags: []
 <!-- Provide a longer summary of what this model is. -->
-This is the model card of a 🤗 transformers model that has been pushed on the Hub. This model card has been automatically generated.
 - **Developed by:** [More Information Needed]
 - **Funded by [optional]:** [More Information Needed]
@@ -196,4 +196,7 @@ Carbon emissions can be estimated using the [Machine Learning Impact calculator]
 ## Model Card Contact
-[More Information Needed]

 ---
+base_model: google/paligemma2-3b-mix-224
+library_name: peft
 ---
 # Model Card for Model ID
 <!-- Provide a longer summary of what this model is. -->
 - **Developed by:** [More Information Needed]
 - **Funded by [optional]:** [More Information Needed]
 ## Model Card Contact
+[More Information Needed]
+### Framework versions
+- PEFT 0.13.2

adapter_config.json CHANGED Viewed

@@ -3,9 +3,6 @@
   "auto_mapping": null,
   "base_model_name_or_path": "google/paligemma2-3b-mix-224",
   "bias": "none",
-  "corda_config": null,
-  "eva_config": null,
-  "exclude_modules": null,
   "fan_in_fan_out": false,
   "inference_mode": true,
   "init_lora_weights": true,
@@ -14,7 +11,6 @@
   "layers_to_transform": null,
   "loftq_config": {},
   "lora_alpha": 32,
-  "lora_bias": false,
   "lora_dropout": 0.05,
   "megatron_config": null,
   "megatron_core": "megatron.core",
@@ -24,16 +20,15 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "o_proj",
-    "v_proj",
     "k_proj",
-    "down_proj",
     "gate_proj",
     "up_proj",
-    "q_proj"
   ],
   "task_type": "CAUSAL_LM",
-  "trainable_token_indices": null,
   "use_dora": false,
   "use_rslora": false
 }

   "auto_mapping": null,
   "base_model_name_or_path": "google/paligemma2-3b-mix-224",
   "bias": "none",
   "fan_in_fan_out": false,
   "inference_mode": true,
   "init_lora_weights": true,
   "layers_to_transform": null,
   "loftq_config": {},
   "lora_alpha": 32,
   "lora_dropout": 0.05,
   "megatron_config": null,
   "megatron_core": "megatron.core",
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
     "k_proj",
+    "v_proj",
     "gate_proj",
+    "q_proj",
+    "down_proj",
     "up_proj",
+    "o_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_dora": false,
   "use_rslora": false
 }

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:03b453353fe25701748063ab2f641c70987694041fb8e3aff78a575b1b9813d3
-size 47586024

 version https://git-lfs.github.com/spec/v1
+oid sha256:b6539b77bc9aed7dc918910c68ed0a077215a3500748175fdf00df1d37c4fbf6
+size 95091968

optimizer.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:882f5995d607120782db6bd18a91b78a85bf2448ac403711dd16a65fa0c003eb
+size 177067885

rng_state.pth ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:c12bd36d197fececea5785e1700cff3230099e967e819c33c9687e2d513a0427
+size 14645

scheduler.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:2ee3f99a053745d2a79ee8e0484c666a074aa17a6222120eda9b13716fb5e96a
+size 1465

training_args.bin ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:8352e7e8fc5d051fa5fa107f8ef4eccf59cf677bed62f059335768858d425e0b
+size 5713