Training in progress, step 2100

Files changed (4) hide show

README.md CHANGED Viewed

@@ -37,7 +37,7 @@ This model was trained with SFT.
 - TRL: 0.27.0
 - Transformers: 4.57.6
 - Pytorch: 2.8.0+cu126
-- Datasets: 4.4.1
 - Tokenizers: 0.22.1
 ## Citations

 - TRL: 0.27.0
 - Transformers: 4.57.6
 - Pytorch: 2.8.0+cu126
+- Datasets: 4.4.2
 - Tokenizers: 0.22.1
 ## Citations

adapter_config.json CHANGED Viewed

@@ -29,13 +29,13 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "k_proj",
-    "down_proj",
-    "o_proj",
-    "q_proj",
     "v_proj",
     "gate_proj",
-    "up_proj"
   ],
   "target_parameters": null,
   "task_type": "CAUSAL_LM",

   "rank_pattern": {},
   "revision": null,
   "target_modules": [
     "v_proj",
+    "k_proj",
     "gate_proj",
+    "o_proj",
+    "up_proj",
+    "down_proj",
+    "q_proj"
   ],
   "target_parameters": null,
   "task_type": "CAUSAL_LM",

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:875e11864c60557b1ce9d0f4a3628b1921ba20dcfcb047f1194317ca21dd647e
 size 228140600

 version https://git-lfs.github.com/spec/v1
+oid sha256:c9e46ae2720088669da0e7f9e660e9df21b3f13cd814ef2c054173a76a40c0a8
 size 228140600

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1429883e942c6b0b337507f32bd2f9e9b227b047e8eeab1d3295f008840498d1
 size 6353

 version https://git-lfs.github.com/spec/v1
+oid sha256:dc0c9c43aae96575e8afc416e967ac5674d13cc1a38c487b69cd4534aafef005
 size 6353