Refresh base adapter to best eval_loss (profile=llama3_2_3b_base, step=1428, eval_loss=0.038845)

Files changed (3) hide show

meta-llama__llama-3.2-3b/adapter_config.json CHANGED Viewed

@@ -34,12 +34,12 @@
   "revision": null,
   "target_modules": [
     "up_proj",
-    "down_proj",
-    "v_proj",
-    "q_proj",
     "gate_proj",
     "o_proj",
-    "k_proj"
   ],
   "target_parameters": null,
   "task_type": "CAUSAL_LM",

   "revision": null,
   "target_modules": [
     "up_proj",
+    "k_proj",
     "gate_proj",
     "o_proj",
+    "v_proj",
+    "q_proj",
+    "down_proj"
   ],
   "target_parameters": null,
   "task_type": "CAUSAL_LM",

meta-llama__llama-3.2-3b/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:18e31466a1cf25c49c0799368ebfb1bce429eeeb15344ee87de6645692bc3729
 size 97307544

 version https://git-lfs.github.com/spec/v1
+oid sha256:289d90c2c922da5b009bca034b751b4297d9edce70b37a2df59f13b6cf4da554
 size 97307544

meta-llama__llama-3.2-3b/best_eval_metrics.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "best_eval_loss": 0.04342564195394516,
-  "best_step": 504,
-  "epoch": 1.7560975609756098
 }

 {
+  "best_eval_loss": 0.038845136761665344,
+  "best_step": 1428,
+  "epoch": 1.0
 }