Revised upload of MicroGPT-Deva model with 3-epoch training
Browse files
- config.json +1 -1
- model.pth +3 -0
- pytorch_model.bin +1 -1
config.json
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
{"batch_size": 32, "block_size": 512, "dropout": 0.0, "lr": 0.0003, "n_embd": 512, "n_head": 8, "n_layer": 8, "num_epochs":
|
|
|
|
| 1 |
+
{"batch_size": 32, "block_size": 512, "dropout": 0.0, "lr": 0.0003, "n_embd": 512, "n_head": 8, "n_layer": 8, "num_epochs": 3, "resume_path": "model.pth", "vocab_size": 12000}
|
model.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:311e8552e5d6330f0b9a2573332d50ea6e17b39db8e7c98706dbf8a755c6c0c5
|
| 3 |
+
size 453342893
|
pytorch_model.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 151116577
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d72294d450431fa9bbc5d05181c65a22dc0277f85fdc85ca84fcabba60932f7c
|
| 3 |
size 151116577
|