brthor committed on
Commit
1c5a48c
·
verified ·
1 Parent(s): 43a84bc

Refresh base adapter to best eval_loss (profile=llama3_2_1b_base, step=1352, eval_loss=0.066586)

Browse files
meta-llama__llama-3.2-1b/adapter_config.json CHANGED
@@ -33,13 +33,13 @@
33
  "rank_pattern": {},
34
  "revision": null,
35
  "target_modules": [
36
- "v_proj",
37
  "q_proj",
38
- "down_proj",
39
  "o_proj",
40
- "gate_proj",
41
- "k_proj",
42
- "up_proj"
 
43
  ],
44
  "target_parameters": null,
45
  "task_type": "CAUSAL_LM",
 
33
  "rank_pattern": {},
34
  "revision": null,
35
  "target_modules": [
36
+ "k_proj",
37
  "q_proj",
 
38
  "o_proj",
39
+ "down_proj",
40
+ "up_proj",
41
+ "v_proj",
42
+ "gate_proj"
43
  ],
44
  "target_parameters": null,
45
  "task_type": "CAUSAL_LM",
meta-llama__llama-3.2-1b/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2d38150ac1b825e49c15bc2977fc97e308da13ba450c9e9bc62fedcc4b9f98eb
3
  size 45118424
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a845f119c2cf06d7dff9e80ad0e92a201bd7ae3ceaf6edf4ed53f48283cfbaf
3
  size 45118424
meta-llama__llama-3.2-1b/best_eval_metrics.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_eval_loss": 0.014388032257556915,
3
- "best_step": 3876,
4
- "epoch": 1.5005807200929153
5
  }
 
1
  {
2
+ "best_eval_loss": 0.06658560037612915,
3
+ "best_step": 1352,
4
+ "epoch": 0.5001849796522383
5
  }