Upload folder using huggingface_hub
Browse files- DuplexMamba_train_stage4-110/3407/save/CKPT+2025-01-20+04-03-11+00/CKPT.yaml +5 -0
- DuplexMamba_train_stage4-110/3407/save/CKPT+2025-01-20+04-03-11+00/brain.ckpt +3 -0
- DuplexMamba_train_stage4-110/3407/save/CKPT+2025-01-20+04-03-11+00/counter.ckpt +3 -0
- DuplexMamba_train_stage4-110/3407/save/CKPT+2025-01-20+04-03-11+00/dataloader-TRAIN.ckpt +3 -0
- DuplexMamba_train_stage4-110/3407/save/CKPT+2025-01-20+04-03-11+00/model.ckpt +3 -0
- DuplexMamba_train_stage4-110/3407/save/CKPT+2025-01-20+04-03-11+00/noam_scheduler.ckpt +3 -0
- DuplexMamba_train_stage4-110/3407/save/CKPT+2025-01-20+04-03-11+00/normalizer.ckpt +3 -0
- DuplexMamba_train_stage4-110/3407/save/CKPT+2025-01-20+04-03-11+00/optimizer.ckpt +3 -0
- DuplexMamba_train_stage4-110/3407/save/CKPT+2025-01-20+04-03-11+00/scaler.ckpt +3 -0
DuplexMamba_train_stage4-110/3407/save/CKPT+2025-01-20+04-03-11+00/CKPT.yaml
ADDED
|
@@ -0,0 +1,5 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# yamllint disable
|
| 2 |
+
PPL: 8.114310244586521
|
| 3 |
+
end-of-epoch: true
|
| 4 |
+
epoch: 2
|
| 5 |
+
unixtime: 1737316991.7090805
|
DuplexMamba_train_stage4-110/3407/save/CKPT+2025-01-20+04-03-11+00/brain.ckpt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3a7cabaef44431faa2f43e6287869f5b4acf13e4a03cea296ac5b4970526cc42
|
| 3 |
+
size 48
|
DuplexMamba_train_stage4-110/3407/save/CKPT+2025-01-20+04-03-11+00/counter.ckpt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d4735e3a265e16eee03f59718b9b5d03019c07d8b6c51f90da3a666eec13ab35
|
| 3 |
+
size 1
|
DuplexMamba_train_stage4-110/3407/save/CKPT+2025-01-20+04-03-11+00/dataloader-TRAIN.ckpt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:60eaa995208fb3488a82efb7e4184ba8084903bbca672fe3694870feb9ce3224
|
| 3 |
+
size 5
|
DuplexMamba_train_stage4-110/3407/save/CKPT+2025-01-20+04-03-11+00/model.ckpt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8608ed8ad88aa79e4c9b79a67201e81d6397ac083bdfb44184071b9dab669bcb
|
| 3 |
+
size 11429008102
|
DuplexMamba_train_stage4-110/3407/save/CKPT+2025-01-20+04-03-11+00/noam_scheduler.ckpt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:43811fa611b4b9d3c02455dc01269b512eba10f4d04418b6e4e9414fe33b4417
|
| 3 |
+
size 892
|
DuplexMamba_train_stage4-110/3407/save/CKPT+2025-01-20+04-03-11+00/normalizer.ckpt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2ffbe78d22be940876b62a5cc5cba55a0f3ab19abd12a199ad03988712649d48
|
| 3 |
+
size 2218
|
DuplexMamba_train_stage4-110/3407/save/CKPT+2025-01-20+04-03-11+00/optimizer.ckpt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b04ff31aa0947071601fe85c4c3a535c5ff8224f5d78bfb1c3083a0fece8cf97
|
| 3 |
+
size 700590634
|
DuplexMamba_train_stage4-110/3407/save/CKPT+2025-01-20+04-03-11+00/scaler.ckpt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1e73d379dcd4c29a573374353cd8dbba2dbe07652f7eef40d8a0a9563e509b11
|
| 3 |
+
size 860
|