guyhadad01 commited on
Commit
82d41c3
·
verified ·
1 Parent(s): 1e4b116

Training in progress, step 49000, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1269,6 +1269,10 @@ You can finetune this model on your own dataset.
1269
  | 0.8606 | 48700 | 0.3028 |
1270
  | 0.8614 | 48750 | 0.2579 |
1271
  | 0.8623 | 48800 | 0.3404 |
 
 
 
 
1272
 
1273
 
1274
  ### Framework Versions
 
1269
  | 0.8606 | 48700 | 0.3028 |
1270
  | 0.8614 | 48750 | 0.2579 |
1271
  | 0.8623 | 48800 | 0.3404 |
1272
+ | 0.8632 | 48850 | 0.3535 |
1273
+ | 0.8641 | 48900 | 0.2224 |
1274
+ | 0.8650 | 48950 | 0.2701 |
1275
+ | 0.8659 | 49000 | 0.2506 |
1276
 
1277
 
1278
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:36dc7c9e83fd465b92a2847be177b9eb428689ac2977e5e232b38d92574447f6
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84efeaad3a28b91cc498c5612f39d5a4c2c9f8daa7acd8511082cc68b8ddc2cb
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:476cfc5664418f0c7219fe39c91775cf7ee5aec7d0f1d77a8008aa21455285b8
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c7a89c0e9e8e599e158b35c8a497af87a6ed6aa2e7dbb6685a96e88a89c0ee09
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7c91689e6fe6ea5ac1e3ed99062e8d26595b040c06b11772caa18d4fe3ffb3e8
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3d739b2e6d744ac93c261a7254a1e982aa4ce3774f886b8c343e7cb40301307
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e7d183fbaa9612fc768da7cf7cefd13466b61ea27398ff0fc8e2f5977752f4ef
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:866c5a8b8535e30581fc80f2ad91749cdaeeee2ad90769cad0b001d56fb4e651
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c86d99e394985101a11e9cbc029a6edaca303ea24f38f1f70ed88d32b2ae0eb0
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f974b2cab5a8a0bdcab6bbe8e6e05d55c8066b6602ba318fa916b4a6a3ca4678
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.862327932003322,
6
  "eval_steps": 500,
7
- "global_step": 48800,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -6840,6 +6840,34 @@
6840
  "learning_rate": 7.667236064479394e-06,
6841
  "loss": 0.3404,
6842
  "step": 48800
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6843
  }
6844
  ],
6845
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.8658620628721881,
6
  "eval_steps": 500,
7
+ "global_step": 49000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
6840
  "learning_rate": 7.667236064479394e-06,
6841
  "loss": 0.3404,
6842
  "step": 48800
6843
+ },
6844
+ {
6845
+ "epoch": 0.8632114647205386,
6846
+ "grad_norm": 1.3516128063201904,
6847
+ "learning_rate": 7.618150046140858e-06,
6848
+ "loss": 0.3535,
6849
+ "step": 48850
6850
+ },
6851
+ {
6852
+ "epoch": 0.8640949974377551,
6853
+ "grad_norm": 1.4083527326583862,
6854
+ "learning_rate": 7.569064027802321e-06,
6855
+ "loss": 0.2224,
6856
+ "step": 48900
6857
+ },
6858
+ {
6859
+ "epoch": 0.8649785301549716,
6860
+ "grad_norm": 1.421423077583313,
6861
+ "learning_rate": 7.5199780094637854e-06,
6862
+ "loss": 0.2701,
6863
+ "step": 48950
6864
+ },
6865
+ {
6866
+ "epoch": 0.8658620628721881,
6867
+ "grad_norm": 2.421118974685669,
6868
+ "learning_rate": 7.4708919911252476e-06,
6869
+ "loss": 0.2506,
6870
+ "step": 49000
6871
  }
6872
  ],
6873
  "logging_steps": 50,