vxbrandon committed on
Commit
d299143
·
verified ·
1 Parent(s): 1305765

End of training

Browse files
README.md CHANGED
@@ -15,7 +15,7 @@ should probably proofread and complete it, then remove this comment. -->
15
 
16
  This model is a fine-tuned version of [mistralai/Mistral-7B-v0.1](https://huggingface.co/mistralai/Mistral-7B-v0.1) on the None dataset.
17
  It achieves the following results on the evaluation set:
18
- - Loss: 2.5957
19
 
20
  ## Model description
21
 
 
15
 
16
  This model is a fine-tuned version of [mistralai/Mistral-7B-v0.1](https://huggingface.co/mistralai/Mistral-7B-v0.1) on the None dataset.
17
  It achieves the following results on the evaluation set:
18
+ - Loss: 2.4040
19
 
20
  ## Model description
21
 
config.json CHANGED
@@ -23,38 +23,38 @@
23
  "rope_theta": 10000.0,
24
  "sliding_window": 4096,
25
  "thresholds": [
26
- 0.017051145434379578,
27
  0.023069201037287712,
28
- 0.049147434532642365,
29
- 0.051153454929590225,
30
- 0.05917752534151077,
31
- 0.06920761615037918,
32
- 0.0732196494936943,
33
- 0.07923770695924759,
34
- 0.08324974030256271,
35
- 0.07923770695924759,
36
- 0.089267797768116,
37
- 0.089267797768116,
38
- 0.0992978885769844,
39
- 0.0992978885769844,
40
  0.10531593859195709,
41
- 0.12136408686637878,
 
 
 
 
 
42
  0.1414242684841156,
43
- 0.15947842597961426,
44
- 0.1775325983762741,
 
45
  0.19157472252845764,
46
- 0.19759276509284973,
47
- 0.21765294671058655,
48
- 0.21765294671058655,
49
- 0.23169508576393127,
50
  0.2357071191072464,
51
- 0.23169508576393127,
52
- 0.225677028298378,
53
- 0.22968906164169312,
54
- 0.225677028298378,
55
- 0.225677028298378,
56
- 0.2457372099161148,
57
- 0.26980942487716675
 
 
58
  ],
59
  "tie_word_embeddings": false,
60
  "torch_dtype": "bfloat16",
 
23
  "rope_theta": 10000.0,
24
  "sliding_window": 4096,
25
  "thresholds": [
 
26
  0.023069201037287712,
27
+ 0.03309928998351097,
28
+ 0.04312938079237938,
29
+ 0.05516548827290535,
30
+ 0.07522567361593246,
31
+ 0.09327983111143112,
 
 
 
 
 
 
 
32
  0.10531593859195709,
33
+ 0.11935807019472122,
34
+ 0.12738214433193207,
35
+ 0.12738214433193207,
36
+ 0.1313941776752472,
37
+ 0.13340020179748535,
38
+ 0.13941824436187744,
39
  0.1414242684841156,
40
+ 0.15546639263629913,
41
+ 0.1675025075674057,
42
+ 0.18555666506290436,
43
  0.19157472252845764,
44
+ 0.20762285590171814,
45
+ 0.2196589708328247,
46
+ 0.22768303751945496,
47
+ 0.23771312832832336,
48
  0.2357071191072464,
49
+ 0.23771312832832336,
50
+ 0.24172517657279968,
51
+ 0.24172517657279968,
52
+ 0.24172517657279968,
53
+ 0.24172517657279968,
54
+ 0.24172517657279968,
55
+ 0.23971915245056152,
56
+ 0.2357071191072464,
57
+ 0.225677028298378
58
  ],
59
  "tie_word_embeddings": false,
60
  "torch_dtype": "bfloat16",
model-00001-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7e178646fb43467fe1ac68c767dc53a190c62e7ab176499a24203913360d32b3
3
  size 4943163992
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0614f728766b92b1615c8d517b5974b34637fa328cbb4245781b4045b106c037
3
  size 4943163992
model-00002-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c608913252c5ec911a52cc6a18aaad7787986220ee14dadd515f0a130e5be7d6
3
  size 4999821144
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3d4e08eef455b0c321fc81384f5b714615d206f3ed750833bd478342f7420cc5
3
  size 4999821144
model-00003-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0199cb7cf5b42356ce1fa59a4fc571fcf15222f723459f2db7b81ef18a47d5d9
3
  size 4540517840
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d7af3748ac11c9732fca3ad1c359e63953a668eae233501094c8c6744b0f2ca5
3
  size 4540517840