Upload folder using huggingface_hub

Browse files

Files changed (4) hide show

README.md +2 -3
adapter_config.json +4 -4
adapter_model.safetensors +1 -1
trainer_state.json +29 -29

README.md CHANGED Viewed

@@ -2,10 +2,9 @@
 base_model: Qwen/Qwen3-0.6B
 library_name: peft
 ---
-# Model Card for Model ID
-<!-- Provide a quick summary of what the model is/does. -->

 base_model: Qwen/Qwen3-0.6B
 library_name: peft
 ---
+### Framework versions
+- PEFT 0.15.1

adapter_config.json CHANGED Viewed

@@ -24,13 +24,13 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
     "gate_proj",
     "down_proj",
     "k_proj",
-    "q_proj",
-    "up_proj",
-    "v_proj",
-    "o_proj"
   ],
   "task_type": "CAUSAL_LM",
   "trainable_token_indices": null,

   "rank_pattern": {},
   "revision": null,
   "target_modules": [
+    "v_proj",
     "gate_proj",
+    "q_proj",
     "down_proj",
+    "o_proj",
     "k_proj",
+    "up_proj"
   ],
   "task_type": "CAUSAL_LM",
   "trainable_token_indices": null,

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c213b339d3beff756c65a7624aea9cfacc0f041499406e83f01dbc2c149356e3
 size 161533160

 version https://git-lfs.github.com/spec/v1
+oid sha256:37cca7d0e06ebdcc365613800bb8f220b076275e2298986dbf2e77b3d8c91700
 size 161533160

trainer_state.json CHANGED Viewed

@@ -11,107 +11,107 @@
   "log_history": [
     {
       "epoch": 0.2,
-      "grad_norm": 4.880182266235352,
       "learning_rate": 1e-05,
       "loss": 0.9092,
       "step": 1
     },
     {
       "epoch": 0.4,
-      "grad_norm": 5.186452388763428,
       "learning_rate": 9.890738003669029e-06,
-      "loss": 0.9494,
       "step": 2
     },
     {
       "epoch": 0.6,
-      "grad_norm": 5.036950588226318,
       "learning_rate": 9.567727288213005e-06,
-      "loss": 0.7849,
       "step": 3
     },
     {
       "epoch": 0.8,
-      "grad_norm": 5.341607570648193,
       "learning_rate": 9.045084971874738e-06,
-      "loss": 0.7692,
       "step": 4
     },
     {
       "epoch": 1.0,
-      "grad_norm": 4.708967685699463,
       "learning_rate": 8.345653031794292e-06,
-      "loss": 0.6502,
       "step": 5
     },
     {
       "epoch": 1.2,
-      "grad_norm": 3.691345453262329,
       "learning_rate": 7.500000000000001e-06,
-      "loss": 0.5581,
       "step": 6
     },
     {
       "epoch": 1.4,
-      "grad_norm": 2.7508931159973145,
       "learning_rate": 6.545084971874738e-06,
-      "loss": 0.5363,
       "step": 7
     },
     {
       "epoch": 1.6,
-      "grad_norm": 1.858952283859253,
       "learning_rate": 5.522642316338268e-06,
-      "loss": 0.5077,
       "step": 8
     },
     {
       "epoch": 1.8,
-      "grad_norm": 1.805176019668579,
       "learning_rate": 4.477357683661734e-06,
-      "loss": 0.5521,
       "step": 9
     },
     {
       "epoch": 2.0,
-      "grad_norm": 1.4771124124526978,
       "learning_rate": 3.4549150281252635e-06,
-      "loss": 0.4747,
       "step": 10
     },
     {
       "epoch": 2.2,
-      "grad_norm": 1.5449007749557495,
       "learning_rate": 2.5000000000000015e-06,
-      "loss": 0.5101,
       "step": 11
     },
     {
       "epoch": 2.4,
-      "grad_norm": 1.393797755241394,
       "learning_rate": 1.6543469682057105e-06,
-      "loss": 0.4949,
       "step": 12
     },
     {
       "epoch": 2.6,
-      "grad_norm": 1.2324782609939575,
       "learning_rate": 9.549150281252633e-07,
-      "loss": 0.4521,
       "step": 13
     },
     {
       "epoch": 2.8,
-      "grad_norm": 1.2213858366012573,
       "learning_rate": 4.322727117869951e-07,
-      "loss": 0.432,
       "step": 14
     },
     {
       "epoch": 3.0,
-      "grad_norm": 1.4015122652053833,
       "learning_rate": 1.0926199633097156e-07,
-      "loss": 0.4952,
       "step": 15
     }
   ],

   "log_history": [
     {
       "epoch": 0.2,
+      "grad_norm": 4.834155559539795,
       "learning_rate": 1e-05,
       "loss": 0.9092,
       "step": 1
     },
     {
       "epoch": 0.4,
+      "grad_norm": 5.137935638427734,
       "learning_rate": 9.890738003669029e-06,
+      "loss": 0.9497,
       "step": 2
     },
     {
       "epoch": 0.6,
+      "grad_norm": 4.987179279327393,
       "learning_rate": 9.567727288213005e-06,
+      "loss": 0.7857,
       "step": 3
     },
     {
       "epoch": 0.8,
+      "grad_norm": 5.295909881591797,
       "learning_rate": 9.045084971874738e-06,
+      "loss": 0.7714,
       "step": 4
     },
     {
       "epoch": 1.0,
+      "grad_norm": 4.681474208831787,
       "learning_rate": 8.345653031794292e-06,
+      "loss": 0.6515,
       "step": 5
     },
     {
       "epoch": 1.2,
+      "grad_norm": 3.703080892562866,
       "learning_rate": 7.500000000000001e-06,
+      "loss": 0.56,
       "step": 6
     },
     {
       "epoch": 1.4,
+      "grad_norm": 2.7864272594451904,
       "learning_rate": 6.545084971874738e-06,
+      "loss": 0.5379,
       "step": 7
     },
     {
       "epoch": 1.6,
+      "grad_norm": 1.8693835735321045,
       "learning_rate": 5.522642316338268e-06,
+      "loss": 0.509,
       "step": 8
     },
     {
       "epoch": 1.8,
+      "grad_norm": 1.8035385608673096,
       "learning_rate": 4.477357683661734e-06,
+      "loss": 0.5536,
       "step": 9
     },
     {
       "epoch": 2.0,
+      "grad_norm": 1.4770323038101196,
       "learning_rate": 3.4549150281252635e-06,
+      "loss": 0.4764,
       "step": 10
     },
     {
       "epoch": 2.2,
+      "grad_norm": 1.537730097770691,
       "learning_rate": 2.5000000000000015e-06,
+      "loss": 0.5115,
       "step": 11
     },
     {
       "epoch": 2.4,
+      "grad_norm": 1.3944271802902222,
       "learning_rate": 1.6543469682057105e-06,
+      "loss": 0.4966,
       "step": 12
     },
     {
       "epoch": 2.6,
+      "grad_norm": 1.2273967266082764,
       "learning_rate": 9.549150281252633e-07,
+      "loss": 0.4532,
       "step": 13
     },
     {
       "epoch": 2.8,
+      "grad_norm": 1.2184977531433105,
       "learning_rate": 4.322727117869951e-07,
+      "loss": 0.4331,
       "step": 14
     },
     {
       "epoch": 3.0,
+      "grad_norm": 1.390999436378479,
       "learning_rate": 1.0926199633097156e-07,
+      "loss": 0.4964,
       "step": 15
     }
   ],