Upload folder using huggingface_hub
Browse filesThis view is limited to 50 files because it contains too many changes. See raw diff
- base_checkpoints/d34/meta_009000.json +59 -0
- base_checkpoints/d34/meta_010507.json +59 -0
- base_checkpoints/d34/model_009000.pt +3 -0
- base_checkpoints/d34/model_010507.pt +3 -0
- base_checkpoints/d34/optim_009000_rank0.pt +3 -0
- base_checkpoints/d34/optim_009000_rank1.pt +3 -0
- base_checkpoints/d34/optim_009000_rank10.pt +3 -0
- base_checkpoints/d34/optim_009000_rank11.pt +3 -0
- base_checkpoints/d34/optim_009000_rank12.pt +3 -0
- base_checkpoints/d34/optim_009000_rank13.pt +3 -0
- base_checkpoints/d34/optim_009000_rank14.pt +3 -0
- base_checkpoints/d34/optim_009000_rank15.pt +3 -0
- base_checkpoints/d34/optim_009000_rank16.pt +3 -0
- base_checkpoints/d34/optim_009000_rank17.pt +3 -0
- base_checkpoints/d34/optim_009000_rank18.pt +3 -0
- base_checkpoints/d34/optim_009000_rank19.pt +3 -0
- base_checkpoints/d34/optim_009000_rank2.pt +3 -0
- base_checkpoints/d34/optim_009000_rank20.pt +3 -0
- base_checkpoints/d34/optim_009000_rank21.pt +3 -0
- base_checkpoints/d34/optim_009000_rank22.pt +3 -0
- base_checkpoints/d34/optim_009000_rank23.pt +3 -0
- base_checkpoints/d34/optim_009000_rank24.pt +3 -0
- base_checkpoints/d34/optim_009000_rank25.pt +3 -0
- base_checkpoints/d34/optim_009000_rank26.pt +3 -0
- base_checkpoints/d34/optim_009000_rank27.pt +3 -0
- base_checkpoints/d34/optim_009000_rank28.pt +3 -0
- base_checkpoints/d34/optim_009000_rank29.pt +3 -0
- base_checkpoints/d34/optim_009000_rank3.pt +3 -0
- base_checkpoints/d34/optim_009000_rank30.pt +3 -0
- base_checkpoints/d34/optim_009000_rank31.pt +3 -0
- base_checkpoints/d34/optim_009000_rank32.pt +3 -0
- base_checkpoints/d34/optim_009000_rank33.pt +3 -0
- base_checkpoints/d34/optim_009000_rank34.pt +3 -0
- base_checkpoints/d34/optim_009000_rank35.pt +3 -0
- base_checkpoints/d34/optim_009000_rank36.pt +3 -0
- base_checkpoints/d34/optim_009000_rank37.pt +3 -0
- base_checkpoints/d34/optim_009000_rank38.pt +3 -0
- base_checkpoints/d34/optim_009000_rank39.pt +3 -0
- base_checkpoints/d34/optim_009000_rank4.pt +3 -0
- base_checkpoints/d34/optim_009000_rank40.pt +3 -0
- base_checkpoints/d34/optim_009000_rank41.pt +3 -0
- base_checkpoints/d34/optim_009000_rank42.pt +3 -0
- base_checkpoints/d34/optim_009000_rank43.pt +3 -0
- base_checkpoints/d34/optim_009000_rank44.pt +3 -0
- base_checkpoints/d34/optim_009000_rank45.pt +3 -0
- base_checkpoints/d34/optim_009000_rank46.pt +3 -0
- base_checkpoints/d34/optim_009000_rank47.pt +3 -0
- base_checkpoints/d34/optim_009000_rank48.pt +3 -0
- base_checkpoints/d34/optim_009000_rank49.pt +3 -0
- base_checkpoints/d34/optim_009000_rank5.pt +3 -0
base_checkpoints/d34/meta_009000.json
ADDED
|
@@ -0,0 +1,59 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"step": 9000,
|
| 3 |
+
"val_bpb": 0.7525381183282047,
|
| 4 |
+
"model_config": {
|
| 5 |
+
"sequence_len": 2048,
|
| 6 |
+
"vocab_size": 32768,
|
| 7 |
+
"n_layer": 34,
|
| 8 |
+
"n_head": 17,
|
| 9 |
+
"n_kv_head": 17,
|
| 10 |
+
"n_embd": 2176,
|
| 11 |
+
"window_pattern": "L"
|
| 12 |
+
},
|
| 13 |
+
"user_config": {
|
| 14 |
+
"run": "pre1900_d34_full22btok",
|
| 15 |
+
"device_type": "",
|
| 16 |
+
"fp8": true,
|
| 17 |
+
"fp8_recipe": "tensorwise",
|
| 18 |
+
"depth": 34,
|
| 19 |
+
"aspect_ratio": 64,
|
| 20 |
+
"head_dim": 128,
|
| 21 |
+
"max_seq_len": 2048,
|
| 22 |
+
"window_pattern": "L",
|
| 23 |
+
"num_iterations": -1,
|
| 24 |
+
"target_flops": -1.0,
|
| 25 |
+
"target_param_data_ratio": 11.0,
|
| 26 |
+
"device_batch_size": 4,
|
| 27 |
+
"total_batch_size": -1,
|
| 28 |
+
"embedding_lr": 0.3,
|
| 29 |
+
"unembedding_lr": 0.004,
|
| 30 |
+
"weight_decay": 0.2,
|
| 31 |
+
"matrix_lr": 0.02,
|
| 32 |
+
"scalar_lr": 0.5,
|
| 33 |
+
"adam_beta1": 0.8,
|
| 34 |
+
"adam_beta2": 0.95,
|
| 35 |
+
"warmup_ratio": 0.0,
|
| 36 |
+
"warmdown_ratio": 0.5,
|
| 37 |
+
"final_lr_frac": 0.0,
|
| 38 |
+
"resume_from_step": -1,
|
| 39 |
+
"eval_every": 250,
|
| 40 |
+
"eval_tokens": 20971520,
|
| 41 |
+
"core_metric_every": 2000,
|
| 42 |
+
"core_metric_max_per_task": 500,
|
| 43 |
+
"sample_every": 2000,
|
| 44 |
+
"save_every": 3000,
|
| 45 |
+
"model_tag": null
|
| 46 |
+
},
|
| 47 |
+
"device_batch_size": 4,
|
| 48 |
+
"max_seq_len": 2048,
|
| 49 |
+
"dataloader_state_dict": {
|
| 50 |
+
"pq_idx": 172,
|
| 51 |
+
"rg_idx": 64,
|
| 52 |
+
"epoch": 1
|
| 53 |
+
},
|
| 54 |
+
"loop_state": {
|
| 55 |
+
"min_val_bpb": 0.7525381183282047,
|
| 56 |
+
"smooth_train_loss": 2.2710539888406336,
|
| 57 |
+
"total_training_time": 44112.03752231598
|
| 58 |
+
}
|
| 59 |
+
}
|
base_checkpoints/d34/meta_010507.json
ADDED
|
@@ -0,0 +1,59 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"step": 10507,
|
| 3 |
+
"val_bpb": 0.7259969166510065,
|
| 4 |
+
"model_config": {
|
| 5 |
+
"sequence_len": 2048,
|
| 6 |
+
"vocab_size": 32768,
|
| 7 |
+
"n_layer": 34,
|
| 8 |
+
"n_head": 17,
|
| 9 |
+
"n_kv_head": 17,
|
| 10 |
+
"n_embd": 2176,
|
| 11 |
+
"window_pattern": "L"
|
| 12 |
+
},
|
| 13 |
+
"user_config": {
|
| 14 |
+
"run": "pre1900_d34_full22btok",
|
| 15 |
+
"device_type": "",
|
| 16 |
+
"fp8": true,
|
| 17 |
+
"fp8_recipe": "tensorwise",
|
| 18 |
+
"depth": 34,
|
| 19 |
+
"aspect_ratio": 64,
|
| 20 |
+
"head_dim": 128,
|
| 21 |
+
"max_seq_len": 2048,
|
| 22 |
+
"window_pattern": "L",
|
| 23 |
+
"num_iterations": -1,
|
| 24 |
+
"target_flops": -1.0,
|
| 25 |
+
"target_param_data_ratio": 11.0,
|
| 26 |
+
"device_batch_size": 4,
|
| 27 |
+
"total_batch_size": -1,
|
| 28 |
+
"embedding_lr": 0.3,
|
| 29 |
+
"unembedding_lr": 0.004,
|
| 30 |
+
"weight_decay": 0.2,
|
| 31 |
+
"matrix_lr": 0.02,
|
| 32 |
+
"scalar_lr": 0.5,
|
| 33 |
+
"adam_beta1": 0.8,
|
| 34 |
+
"adam_beta2": 0.95,
|
| 35 |
+
"warmup_ratio": 0.0,
|
| 36 |
+
"warmdown_ratio": 0.5,
|
| 37 |
+
"final_lr_frac": 0.0,
|
| 38 |
+
"resume_from_step": -1,
|
| 39 |
+
"eval_every": 250,
|
| 40 |
+
"eval_tokens": 20971520,
|
| 41 |
+
"core_metric_every": 2000,
|
| 42 |
+
"core_metric_max_per_task": 500,
|
| 43 |
+
"sample_every": 2000,
|
| 44 |
+
"save_every": 3000,
|
| 45 |
+
"model_tag": null
|
| 46 |
+
},
|
| 47 |
+
"device_batch_size": 4,
|
| 48 |
+
"max_seq_len": 2048,
|
| 49 |
+
"dataloader_state_dict": {
|
| 50 |
+
"pq_idx": 201,
|
| 51 |
+
"rg_idx": 0,
|
| 52 |
+
"epoch": 1
|
| 53 |
+
},
|
| 54 |
+
"loop_state": {
|
| 55 |
+
"min_val_bpb": 0.7259969166510065,
|
| 56 |
+
"smooth_train_loss": 2.3119625572178344,
|
| 57 |
+
"total_training_time": 51539.05968785286
|
| 58 |
+
}
|
| 59 |
+
}
|
base_checkpoints/d34/model_009000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f75be5f8e15ae143a822e1280f9dc3b845c12bd52d3ea63e5488d2acb4e197ca
|
| 3 |
+
size 10579743323
|
base_checkpoints/d34/model_010507.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0aff5326add2d9ba0a898555cc03dc199565ef2fa26e60fe1d9548abf2e91902
|
| 3 |
+
size 10579743323
|
base_checkpoints/d34/optim_009000_rank0.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cc6d9e3b76cab851231a4782e789aa1a7ae16d1c906ca382a6853693b76575dc
|
| 3 |
+
size 297584053
|
base_checkpoints/d34/optim_009000_rank1.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f3c93b2f4aaa1f6a4eba6673ff2ad352c4c465b457a39d7a9d4d8ad1cd6d1af8
|
| 3 |
+
size 297584053
|
base_checkpoints/d34/optim_009000_rank10.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cf55efca36a7f118e0ece4cec35fdae6b772e31585854b054afabbbb7fb3d2a9
|
| 3 |
+
size 297584109
|
base_checkpoints/d34/optim_009000_rank11.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9d652dadaf93487ccd21ceb64d654f355390fd829c61e99c393fde2b105fb17f
|
| 3 |
+
size 297584109
|
base_checkpoints/d34/optim_009000_rank12.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f7120cd507939c241757b9fbda90519aa4ca931f253c9d5b35c821e174aa3f85
|
| 3 |
+
size 297584109
|
base_checkpoints/d34/optim_009000_rank13.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:087be507faabe130348701e0a9e2773b162fe6ad2dc65a65b9d4fa0998d18c71
|
| 3 |
+
size 297584109
|
base_checkpoints/d34/optim_009000_rank14.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:eb81ea528bad1235033ba301527268de92953d06513271fa24d8694ff2dd4b5d
|
| 3 |
+
size 297584109
|
base_checkpoints/d34/optim_009000_rank15.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0febb82adf830022e3655845691e476ec01874281059600ea5295cda12b8d259
|
| 3 |
+
size 297584109
|
base_checkpoints/d34/optim_009000_rank16.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:02f0a185e003fb8208b0be46e4e5560f1464c4ab27ff556a4632042c1f6a131c
|
| 3 |
+
size 297584109
|
base_checkpoints/d34/optim_009000_rank17.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:281a983b4cea46808dad6759dfea6cd0f50a0c171b69c3e2f31d8e0294450c6d
|
| 3 |
+
size 297584109
|
base_checkpoints/d34/optim_009000_rank18.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ce53a61c2e4e52c9d4b388168886d2c12bed522cd2ec0b565130b0bd4a66c4d3
|
| 3 |
+
size 297584109
|
base_checkpoints/d34/optim_009000_rank19.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6bb64f4eebf8c7afae8b346761cc4fc0292095c6c7ddb9d5cd0c4cbd4856c486
|
| 3 |
+
size 297584109
|
base_checkpoints/d34/optim_009000_rank2.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cec6179a85577002faa2c361b6a4ea257f318dbb50d81fe28825cfc6be1d68f5
|
| 3 |
+
size 297584053
|
base_checkpoints/d34/optim_009000_rank20.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1946a11ccb38a2ca47f25578ff81d3501f5edff654ec6d90a202eb263e4cfd94
|
| 3 |
+
size 297584109
|
base_checkpoints/d34/optim_009000_rank21.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:50b7da78a7a3851f1e3f9638bc50c458294453ce0421b74d7e4c502522340e6e
|
| 3 |
+
size 297584109
|
base_checkpoints/d34/optim_009000_rank22.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4f6441896c54983ae9aef0bb3b013ec35dd6bff3da72a447b602f8169962f21c
|
| 3 |
+
size 297584109
|
base_checkpoints/d34/optim_009000_rank23.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:02ea1733ce8fdcd3712796774e003dbf156a8b58788cfa6f0a71d8fe01cd0b37
|
| 3 |
+
size 297584109
|
base_checkpoints/d34/optim_009000_rank24.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fcd3b84ba483b34251940bda2f6e82cf69c919036a2fc6a60e9321ef2cbbf0b7
|
| 3 |
+
size 297584109
|
base_checkpoints/d34/optim_009000_rank25.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2bffa6b7378f031cd01289874662e0f7efca17ec5e104780af8162525ce63cab
|
| 3 |
+
size 297584109
|
base_checkpoints/d34/optim_009000_rank26.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9541e0e396e9011fcf693f819aafc3c1d8720201ae1ec23ca22a1d2d20618f73
|
| 3 |
+
size 297584109
|
base_checkpoints/d34/optim_009000_rank27.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:acdf2b257ae33406969c8e6624d6fa594f30bd52c4b1fab106b65478ec8af6b7
|
| 3 |
+
size 297584109
|
base_checkpoints/d34/optim_009000_rank28.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fb0081dfbaeabe89319f7a823a9437ccbd6d411b4342d9cdfe65cba9dc3523f7
|
| 3 |
+
size 297584109
|
base_checkpoints/d34/optim_009000_rank29.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6422d559d2f6412fc71b57661534af3ab80e10ff6215521f9175db3c9e0fb1fd
|
| 3 |
+
size 297584109
|
base_checkpoints/d34/optim_009000_rank3.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ee018c9d088dfed96beabbeb02a2bc953cdf189bf631dc89a254451de4e0904f
|
| 3 |
+
size 297584053
|
base_checkpoints/d34/optim_009000_rank30.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:57cf6a8a028e1bcda3ca14010209c894af79ab0ba24a5cddaf23ae357817db3b
|
| 3 |
+
size 297584109
|
base_checkpoints/d34/optim_009000_rank31.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:19c5c14800026abce177bb724942be79067aef37ee09e16bc6dc46c33f3cb47d
|
| 3 |
+
size 297584109
|
base_checkpoints/d34/optim_009000_rank32.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:337708ea9aef0f9e428053464fa810a7920c2d4deda801fa507b1ea7381db7a7
|
| 3 |
+
size 297584109
|
base_checkpoints/d34/optim_009000_rank33.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:934fa2ae29c4935afa93da50ef9ed2156bdcf4beafef98c16b0aa9b7a6ad1f5d
|
| 3 |
+
size 297584109
|
base_checkpoints/d34/optim_009000_rank34.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:11616bd9165ba1dab37385bd76b4995cae68326d2f0a916c974cf3775a061d79
|
| 3 |
+
size 297584109
|
base_checkpoints/d34/optim_009000_rank35.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:39d1af4cb57ca60b5e5e0f96019a0ef7311f35e0a754ea2ad837316e022250d9
|
| 3 |
+
size 297584109
|
base_checkpoints/d34/optim_009000_rank36.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:27b9d401dc36de83a96cf056dad00e9182198ad598479524254cebe1127c413e
|
| 3 |
+
size 297584109
|
base_checkpoints/d34/optim_009000_rank37.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:59d8c6694e37a4d2d156d1358c9ebeb66a517cefc2173c6084664267552acce2
|
| 3 |
+
size 297584109
|
base_checkpoints/d34/optim_009000_rank38.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5b06d87312282475bc6aea29822442809219527d97f3871fd2eddfab3e4d04b1
|
| 3 |
+
size 297584109
|
base_checkpoints/d34/optim_009000_rank39.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:24190d270db4281744cb6aaa9a8698056d2a9b4ed738b2adc0863c68bfec92c5
|
| 3 |
+
size 297584109
|
base_checkpoints/d34/optim_009000_rank4.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:474d364fec81c9797426ea7b33a8fbcab645f1f8832080b6895a1d2b53144f43
|
| 3 |
+
size 297584053
|
base_checkpoints/d34/optim_009000_rank40.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fdb952df4319daaa99c056497912fe007541107ef7dd769d30b0f3dcffc87a23
|
| 3 |
+
size 297584109
|
base_checkpoints/d34/optim_009000_rank41.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ba76324128d6da1915758456cc8b21c4c57f48ce1feceb6ebfaa3e999d5160ed
|
| 3 |
+
size 297584109
|
base_checkpoints/d34/optim_009000_rank42.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bfeb6d4e2949fabf893e6798552b4405d23713cdc44b17c2c2390456ac25c2f9
|
| 3 |
+
size 297584109
|
base_checkpoints/d34/optim_009000_rank43.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cc53abf4c195c24b40ee45ad543e89a8dff48b019ca96e6654c30aa0638257f0
|
| 3 |
+
size 297584109
|
base_checkpoints/d34/optim_009000_rank44.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9a51d546632fcee552c41c7ec468b1677e13357182dbd01ef1d05fffa790d45a
|
| 3 |
+
size 297584109
|
base_checkpoints/d34/optim_009000_rank45.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ef586dfe6f414d9b7c111f8b6dc2b85f97ce86275886cfa64b030d52c3ae7792
|
| 3 |
+
size 297584109
|
base_checkpoints/d34/optim_009000_rank46.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6fd87aba098a700fd5a92c0382d21ba4d5bb02c968b1489e66f013750f4526de
|
| 3 |
+
size 297584109
|
base_checkpoints/d34/optim_009000_rank47.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:46c4522663f5a870b49c1388881f49bf50461862219cd5ed88ffbbe429010f8f
|
| 3 |
+
size 297584109
|
base_checkpoints/d34/optim_009000_rank48.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d77441a11dd38204691c4ff2cc343ab95c02a54b120bd1fa108b255d829a79d5
|
| 3 |
+
size 297584109
|
base_checkpoints/d34/optim_009000_rank49.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7627fc6b4dfd1ed0927b44beab1c433b60c9c4f860a6c456cac401aba1e09661
|
| 3 |
+
size 297584109
|
base_checkpoints/d34/optim_009000_rank5.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:30b6289103760078f31b2d7c833b85cb9de7bc4d35b089675e07f7410ae864f3
|
| 3 |
+
size 297584053
|