full-state checkpoint 40-percent (step 300)
Browse files
ckpt-40-percent/adapter_config.json
CHANGED
|
@@ -33,13 +33,13 @@
|
|
| 33 |
"rank_pattern": {},
|
| 34 |
"revision": null,
|
| 35 |
"target_modules": [
|
| 36 |
-
"o_proj",
|
| 37 |
-
"k_proj",
|
| 38 |
"up_proj",
|
| 39 |
-
"
|
| 40 |
-
"
|
| 41 |
"down_proj",
|
| 42 |
-
"
|
|
|
|
|
|
|
| 43 |
],
|
| 44 |
"target_parameters": null,
|
| 45 |
"task_type": "CAUSAL_LM",
|
|
|
|
| 33 |
"rank_pattern": {},
|
| 34 |
"revision": null,
|
| 35 |
"target_modules": [
|
|
|
|
|
|
|
| 36 |
"up_proj",
|
| 37 |
+
"o_proj",
|
| 38 |
+
"gate_proj",
|
| 39 |
"down_proj",
|
| 40 |
+
"v_proj",
|
| 41 |
+
"k_proj",
|
| 42 |
+
"q_proj"
|
| 43 |
],
|
| 44 |
"target_parameters": null,
|
| 45 |
"task_type": "CAUSAL_LM",
|
ckpt-40-percent/adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 528550256
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:76a7b18234880765beb259126bdfa8889d9f4e2b6cf8871967be8cd1ad2c99aa
|
| 3 |
size 528550256
|
ckpt-40-percent/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e50462cc2ab8b5ead9c8a1ac771a1c2f094e66f00d2c7d715b64f9f4ce2667e4
|
| 3 |
+
size 268963653
|
ckpt-40-percent/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:475b3c40e3ef7c758588d268f27c4502722e9539a9db40661ec6d5ffe3f329fe
|
| 3 |
+
size 14645
|
ckpt-40-percent/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1465
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dcace000289ccea7ca399f35dcd83e38ce1d38a0ac83184841539e7bb865286c
|
| 3 |
size 1465
|
ckpt-40-percent/trainer_state.json
CHANGED
|
The diff for this file is too large to render.
See raw diff
|
|
|
ckpt-40-percent/training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 7505
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:08a7756db7d337356b03f79cfc247284ee5c8ed3985ced618c069718c8faeac6
|
| 3 |
size 7505
|