End of training
Browse files- README.md +1 -1
- config.json +27 -27
- model-00001-of-00003.safetensors +1 -1
- model-00002-of-00003.safetensors +1 -1
- model-00003-of-00003.safetensors +1 -1
README.md
CHANGED
|
@@ -15,7 +15,7 @@ should probably proofread and complete it, then remove this comment. -->
|
|
| 15 |
|
| 16 |
This model is a fine-tuned version of [mistralai/Mistral-7B-v0.1](https://huggingface.co/mistralai/Mistral-7B-v0.1) on the None dataset.
|
| 17 |
It achieves the following results on the evaluation set:
|
| 18 |
-
- Loss: 2.
|
| 19 |
|
| 20 |
## Model description
|
| 21 |
|
|
|
|
| 15 |
|
| 16 |
This model is a fine-tuned version of [mistralai/Mistral-7B-v0.1](https://huggingface.co/mistralai/Mistral-7B-v0.1) on the None dataset.
|
| 17 |
It achieves the following results on the evaluation set:
|
| 18 |
+
- Loss: 2.4040
|
| 19 |
|
| 20 |
## Model description
|
| 21 |
|
config.json
CHANGED
|
@@ -23,38 +23,38 @@
|
|
| 23 |
"rope_theta": 10000.0,
|
| 24 |
"sliding_window": 4096,
|
| 25 |
"thresholds": [
|
| 26 |
-
0.017051145434379578,
|
| 27 |
0.023069201037287712,
|
| 28 |
-
0.
|
| 29 |
-
0.
|
| 30 |
-
0.
|
| 31 |
-
0.
|
| 32 |
-
0.
|
| 33 |
-
0.07923770695924759,
|
| 34 |
-
0.08324974030256271,
|
| 35 |
-
0.07923770695924759,
|
| 36 |
-
0.089267797768116,
|
| 37 |
-
0.089267797768116,
|
| 38 |
-
0.0992978885769844,
|
| 39 |
-
0.0992978885769844,
|
| 40 |
0.10531593859195709,
|
| 41 |
-
0.
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 42 |
0.1414242684841156,
|
| 43 |
-
0.
|
| 44 |
-
0.
|
|
|
|
| 45 |
0.19157472252845764,
|
| 46 |
-
0.
|
| 47 |
-
0.
|
| 48 |
-
0.
|
| 49 |
-
0.
|
| 50 |
0.2357071191072464,
|
| 51 |
-
0.
|
| 52 |
-
0.
|
| 53 |
-
0.
|
| 54 |
-
0.
|
| 55 |
-
0.
|
| 56 |
-
0.
|
| 57 |
-
0.
|
|
|
|
|
|
|
| 58 |
],
|
| 59 |
"tie_word_embeddings": false,
|
| 60 |
"torch_dtype": "bfloat16",
|
|
|
|
| 23 |
"rope_theta": 10000.0,
|
| 24 |
"sliding_window": 4096,
|
| 25 |
"thresholds": [
|
|
|
|
| 26 |
0.023069201037287712,
|
| 27 |
+
0.03309928998351097,
|
| 28 |
+
0.04312938079237938,
|
| 29 |
+
0.05516548827290535,
|
| 30 |
+
0.07522567361593246,
|
| 31 |
+
0.09327983111143112,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 32 |
0.10531593859195709,
|
| 33 |
+
0.11935807019472122,
|
| 34 |
+
0.12738214433193207,
|
| 35 |
+
0.12738214433193207,
|
| 36 |
+
0.1313941776752472,
|
| 37 |
+
0.13340020179748535,
|
| 38 |
+
0.13941824436187744,
|
| 39 |
0.1414242684841156,
|
| 40 |
+
0.15546639263629913,
|
| 41 |
+
0.1675025075674057,
|
| 42 |
+
0.18555666506290436,
|
| 43 |
0.19157472252845764,
|
| 44 |
+
0.20762285590171814,
|
| 45 |
+
0.2196589708328247,
|
| 46 |
+
0.22768303751945496,
|
| 47 |
+
0.23771312832832336,
|
| 48 |
0.2357071191072464,
|
| 49 |
+
0.23771312832832336,
|
| 50 |
+
0.24172517657279968,
|
| 51 |
+
0.24172517657279968,
|
| 52 |
+
0.24172517657279968,
|
| 53 |
+
0.24172517657279968,
|
| 54 |
+
0.24172517657279968,
|
| 55 |
+
0.23971915245056152,
|
| 56 |
+
0.2357071191072464,
|
| 57 |
+
0.225677028298378
|
| 58 |
],
|
| 59 |
"tie_word_embeddings": false,
|
| 60 |
"torch_dtype": "bfloat16",
|
model-00001-of-00003.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4943163992
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0614f728766b92b1615c8d517b5974b34637fa328cbb4245781b4045b106c037
|
| 3 |
size 4943163992
|
model-00002-of-00003.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4999821144
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3d4e08eef455b0c321fc81384f5b714615d206f3ed750833bd478342f7420cc5
|
| 3 |
size 4999821144
|
model-00003-of-00003.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4540517840
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d7af3748ac11c9732fca3ad1c359e63953a668eae233501094c8c6744b0f2ca5
|
| 3 |
size 4540517840
|