Refresh base adapter to best eval_loss (profile=llama3_2_1b_base, step=2968, eval_loss=0.038945)

Files changed (3) hide show

meta-llama__llama-3.2-1b/adapter_config.json CHANGED Viewed

@@ -33,12 +33,12 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
     "k_proj",
     "up_proj",
-    "q_proj",
     "down_proj",
     "v_proj",
-    "gate_proj",
     "o_proj"
   ],
   "target_parameters": null,

   "rank_pattern": {},
   "revision": null,
   "target_modules": [
+    "gate_proj",
+    "q_proj",
     "k_proj",
     "up_proj",
     "down_proj",
     "v_proj",
     "o_proj"
   ],
   "target_parameters": null,

meta-llama__llama-3.2-1b/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c2408afc781cee231b6f78f8c438fabceca16c1ce626cd072fbe81ed94eaf6c4
 size 45118424

 version https://git-lfs.github.com/spec/v1
+oid sha256:ab485621ca30f9d7587cdfb66747e7f691d713cf9272e1e6feeb07fa667f9774
 size 45118424

meta-llama__llama-3.2-1b/best_eval_metrics.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "best_eval_loss": 0.04131177067756653,
   "best_step": 2968,
   "epoch": 0.9996631862579993
 }

 {
+  "best_eval_loss": 0.03894522041082382,
   "best_step": 2968,
   "epoch": 0.9996631862579993
 }