Training update - Run 80 - 2025-12-29 04:20 UTC
Browse files- config.json +8 -8
- model.pt +2 -2
config.json
CHANGED
|
@@ -1,9 +1,9 @@
|
|
| 1 |
-
{
|
| 2 |
-
"vocab_size": 50257,
|
| 3 |
-
"n_layers": 6,
|
| 4 |
-
"n_heads": 6,
|
| 5 |
-
"embed_dim": 384,
|
| 6 |
-
"ff_dim": 1536,
|
| 7 |
-
"max_seq_len": 512,
|
| 8 |
-
"dropout": 0.1
|
| 9 |
}
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"vocab_size": 50257,
|
| 3 |
+
"n_layers": 6,
|
| 4 |
+
"n_heads": 6,
|
| 5 |
+
"embed_dim": 384,
|
| 6 |
+
"ff_dim": 1536,
|
| 7 |
+
"max_seq_len": 512,
|
| 8 |
+
"dropout": 0.1
|
| 9 |
}
|
model.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f612fbdff355b4549198e79cbed2fa425925e7d44c46c528b56e9d549b1515fb
|
| 3 |
+
size 120596251
|