checkpoint step 1000
Browse files- step_1000/config.json +14 -0
- step_1000/model.pt +3 -0
- step_1000/optimizer.pt +3 -0
- step_1000/scaler.pt +3 -0
- step_1000/scheduler.pt +3 -0
step_1000/config.json
ADDED
|
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"vocab_size": 256,
|
| 3 |
+
"d_model": 384,
|
| 4 |
+
"n_layers": 6,
|
| 5 |
+
"dropout": 0.1,
|
| 6 |
+
"max_len": 512,
|
| 7 |
+
"lr": 0.0003,
|
| 8 |
+
"warmup": 500,
|
| 9 |
+
"batch": 64,
|
| 10 |
+
"block": 512,
|
| 11 |
+
"steps": 2000000,
|
| 12 |
+
"world_size": 2,
|
| 13 |
+
"step": 1000
|
| 14 |
+
}
|
step_1000/model.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:41fd4c149e937ca431e10a8677e442a183ada46d74001c9b0e1281312924f7d0
|
| 3 |
+
size 25761151
|
step_1000/optimizer.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a6edbfa0e0c483f24a78d473d112e9b4e7fd770ff19d35366e8e75e899c1dc13
|
| 3 |
+
size 43838795
|
step_1000/scaler.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:14ae2a2128444abab378aa06c09a61a84665f758fcc19fc46f5789b0bc1b5665
|
| 3 |
+
size 1383
|
step_1000/scheduler.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:153e82b9b21f7a55a02f068fd88a7597fb0bed7095f9120c365377e609abd243
|
| 3 |
+
size 1465
|