DevHunterAI committed on
Commit
28eacbe
·
verified ·
1 Parent(s): ef36934

CAD LoRA adapter upload

Browse files
adapter_config.json CHANGED
@@ -29,8 +29,8 @@
29
  "rank_pattern": {},
30
  "revision": null,
31
  "target_modules": [
32
- "v_proj",
33
  "up_proj",
 
34
  "q_proj"
35
  ],
36
  "target_parameters": null,
 
29
  "rank_pattern": {},
30
  "revision": null,
31
  "target_modules": [
 
32
  "up_proj",
33
+ "v_proj",
34
  "q_proj"
35
  ],
36
  "target_parameters": null,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ba8d614b094e235cd267370ad57bab6b1526c0561f009a1533486986b9082e45
3
  size 27547336
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dc2cc7257ebd4cd73b1c7374f391dec191015c425a9ceb4f9259c8a8c281de02
3
  size 27547336
checkpoint-4/adapter_config.json CHANGED
@@ -29,8 +29,8 @@
29
  "rank_pattern": {},
30
  "revision": null,
31
  "target_modules": [
32
- "v_proj",
33
  "up_proj",
 
34
  "q_proj"
35
  ],
36
  "target_parameters": null,
 
29
  "rank_pattern": {},
30
  "revision": null,
31
  "target_modules": [
 
32
  "up_proj",
33
+ "v_proj",
34
  "q_proj"
35
  ],
36
  "target_parameters": null,
checkpoint-4/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bf58dbe200afff2dec926b3d5d2456143b945dd6eda66cd49ef02d4923c40084
3
  size 27547336
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0068bbb55640de2e6a5b9788ef78a9c2038a60b87b2fc8904c9796b39f20580b
3
  size 27547336
checkpoint-4/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:597b6281a83fc0faf04a230b279297c1649f7f87e6e6b631a8901222b5e90a4c
3
  size 55191482
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c7ee1202bdb7b019ea0256bc1aee85ac3b1eaea14b844e1abfb9813b37ad6cbb
3
  size 55191482
checkpoint-4/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e9837c2e4d58d01133e4668cffaa8ef6741d1ecca79e127b539e4997cd03de3e
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f0c40c4a81f200aad10927b2fb78e549faf5e14be0b5d66b8ffdc58cd6eaa7bf
3
  size 14244
checkpoint-4/trainer_state.json CHANGED
@@ -26,7 +26,7 @@
26
  "attributes": {}
27
  }
28
  },
29
- "total_flos": 137739258384384.0,
30
  "train_batch_size": 1,
31
  "trial_name": null,
32
  "trial_params": null
 
26
  "attributes": {}
27
  }
28
  },
29
+ "total_flos": 145326456459264.0,
30
  "train_batch_size": 1,
31
  "trial_name": null,
32
  "trial_params": null
checkpoint-6/adapter_config.json CHANGED
@@ -29,8 +29,8 @@
29
  "rank_pattern": {},
30
  "revision": null,
31
  "target_modules": [
32
- "v_proj",
33
  "up_proj",
 
34
  "q_proj"
35
  ],
36
  "target_parameters": null,
 
29
  "rank_pattern": {},
30
  "revision": null,
31
  "target_modules": [
 
32
  "up_proj",
33
+ "v_proj",
34
  "q_proj"
35
  ],
36
  "target_parameters": null,
checkpoint-6/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ba8d614b094e235cd267370ad57bab6b1526c0561f009a1533486986b9082e45
3
  size 27547336
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dc2cc7257ebd4cd73b1c7374f391dec191015c425a9ceb4f9259c8a8c281de02
3
  size 27547336
checkpoint-6/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e5c4e33f62121c6d9da18ed4c0e1e6f6fb48e91ec456d1c0d139ef61860ecf7f
3
  size 55191482
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb00c6a6c62ff7d7a6ec09215d12e3313b68eb6f4cb014a8d3cf884e8e11cdd2
3
  size 55191482
checkpoint-6/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:60a8fb80ac1bf80fef94772d1bdc9568443800de852553425ea39c224fe280a6
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64123b336e44c6cf78b63f66127ecea6f20a681e01f9223d7d4f5ef02fd154ce
3
  size 14244
checkpoint-6/trainer_state.json CHANGED
@@ -10,13 +10,13 @@
10
  "is_world_process_zero": true,
11
  "log_history": [
12
  {
13
- "entropy": 0.8762538245430699,
14
- "epoch": 2.8421052631578947,
15
- "grad_norm": 0.6482176184654236,
16
  "learning_rate": 6.909830056250527e-05,
17
- "loss": 1.3301252365112304,
18
- "mean_token_accuracy": 0.7302898124412254,
19
- "num_tokens": 24767.0,
20
  "step": 5
21
  }
22
  ],
@@ -37,7 +37,7 @@
37
  "attributes": {}
38
  }
39
  },
40
- "total_flos": 206608887576576.0,
41
  "train_batch_size": 1,
42
  "trial_name": null,
43
  "trial_params": null
 
10
  "is_world_process_zero": true,
11
  "log_history": [
12
  {
13
+ "entropy": 0.8723009686384883,
14
+ "epoch": 2.8,
15
+ "grad_norm": 0.6077917814254761,
16
  "learning_rate": 6.909830056250527e-05,
17
+ "loss": 1.339169979095459,
18
+ "mean_token_accuracy": 0.7311233420457158,
19
+ "num_tokens": 25846.0,
20
  "step": 5
21
  }
22
  ],
 
37
  "attributes": {}
38
  }
39
  },
40
+ "total_flos": 217989684688896.0,
41
  "train_batch_size": 1,
42
  "trial_name": null,
43
  "trial_params": null