Refresh base adapter to best eval_loss (profile=llama3_2_1b_base, step=2968, eval_loss=0.041312)

Files changed (3)

meta-llama__llama-3.2-1b/adapter_config.json CHANGED

@@ -33,13 +33,13 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "down_proj",
     "up_proj",
-    "o_proj",
-    "v_proj",
     "q_proj",
     "gate_proj",
-    "k_proj"
   ],
   "target_parameters": null,
   "task_type": "CAUSAL_LM",

   "rank_pattern": {},
   "revision": null,
   "target_modules": [
+    "k_proj",
     "up_proj",
     "q_proj",
+    "down_proj",
+    "v_proj",
     "gate_proj",
+    "o_proj"
   ],
   "target_parameters": null,
   "task_type": "CAUSAL_LM",

meta-llama__llama-3.2-1b/adapter_model.safetensors CHANGED

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8b92e4103207d7ad80b57d220f7cce916c752362f19e02a4a2d8c3e2666b2d9e
 size 45118424

 version https://git-lfs.github.com/spec/v1
+oid sha256:c2408afc781cee231b6f78f8c438fabceca16c1ce626cd072fbe81ed94eaf6c4
 size 45118424

meta-llama__llama-3.2-1b/best_eval_metrics.json CHANGED

@@ -1,5 +1,5 @@
 {
-  "best_eval_loss": 0.041491035372018814,
-  "best_step": 4284,
-  "epoch": 3.0
 }

 {
+  "best_eval_loss": 0.04131177067756653,
+  "best_step": 2968,
+  "epoch": 0.9996631862579993
 }