guyhadad01 commited on
Commit
3d6902c
·
verified ·
1 Parent(s): 1e2c841

Training in progress, step 12400, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1269,6 +1269,10 @@ You can finetune this model on your own dataset.
1269
  | 0.2138 | 12100 | 0.4082 |
1270
  | 0.2147 | 12150 | 0.3855 |
1271
  | 0.2156 | 12200 | 0.4567 |
 
 
 
 
1272
 
1273
 
1274
  ### Framework Versions
 
1269
  | 0.2138 | 12100 | 0.4082 |
1270
  | 0.2147 | 12150 | 0.3855 |
1271
  | 0.2156 | 12200 | 0.4567 |
1272
+ | 0.2165 | 12250 | 0.4368 |
1273
+ | 0.2173 | 12300 | 0.3686 |
1274
+ | 0.2182 | 12350 | 0.4163 |
1275
+ | 0.2191 | 12400 | 0.3595 |
1276
 
1277
 
1278
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ad55c4b6b6eb0c0378b40f5afe9b809839ef4dcaf65938b6be44df391f5a5ea4
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:574b3805817f84c05fe61afaa266bdb741864872a08c8b02a26021f7f2d4b6a1
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6292ed9a900b0c859bfdd6c9df2c5387f1a04143b05826767cb8bedebe906bb1
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d4ffa53be833c86425bcb85e6adb4b16c9a27186fd568e0bc2763a7d2449b3db
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f520f013fa8b5071407e30d736875f828fde9d624a9e917e055760aba4e8b925
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ef1f923f6a1dc64581eaa57f689d3afe64e52f3a89bbade50c868ec911b07ce
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:400813ac47bbcdbc0fc813340b1eb9c8ae221654524666a11f89e971d58d1c7c
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3af4348a2f962e0a24bd0d54fa3ca7b60bf2d2d90f2e31ee6b869eaaa1d91a60
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:038fcca02e593a472cc6365efd49e0401f5576654e492a85d64164b873c49869
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd23584cb98398038b4f29f6fb0b60db3fae00d268a4c127abde12daed6ca267
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.2155819830008305,
6
  "eval_steps": 500,
7
- "global_step": 12200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -1716,6 +1716,34 @@
1716
  "learning_rate": 4.3581512242052976e-05,
1717
  "loss": 0.4567,
1718
  "step": 12200
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1719
  }
1720
  ],
1721
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.2191161138696966,
6
  "eval_steps": 500,
7
+ "global_step": 12400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
1716
  "learning_rate": 4.3581512242052976e-05,
1717
  "loss": 0.4567,
1718
  "step": 12200
1719
+ },
1720
+ {
1721
+ "epoch": 0.21646551571804704,
1722
+ "grad_norm": 2.0770373344421387,
1723
+ "learning_rate": 4.353242622371444e-05,
1724
+ "loss": 0.4368,
1725
+ "step": 12250
1726
+ },
1727
+ {
1728
+ "epoch": 0.21734904843526356,
1729
+ "grad_norm": 1.4739536046981812,
1730
+ "learning_rate": 4.3483340205375905e-05,
1731
+ "loss": 0.3686,
1732
+ "step": 12300
1733
+ },
1734
+ {
1735
+ "epoch": 0.21823258115248007,
1736
+ "grad_norm": 1.8857239484786987,
1737
+ "learning_rate": 4.343425418703736e-05,
1738
+ "loss": 0.4163,
1739
+ "step": 12350
1740
+ },
1741
+ {
1742
+ "epoch": 0.2191161138696966,
1743
+ "grad_norm": 1.722424030303955,
1744
+ "learning_rate": 4.3385168168698834e-05,
1745
+ "loss": 0.3595,
1746
+ "step": 12400
1747
  }
1748
  ],
1749
  "logging_steps": 50,