JuanPajero committed on
Commit
f96514a
·
1 Parent(s): 76d7629

Training in progress, step 35500

Browse files
{checkpoint-14200 → checkpoint-35500}/config.json RENAMED
File without changes
{checkpoint-14200 → checkpoint-35500}/optimizer.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ce9c29c1923f02b3a8d6df9a2c832cd743d1ad062f7f17c0682d952b22e23e33
3
  size 721687499
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2852db7cf014b14489b48c2b4434ecfc606da92d93234e33d8ab765f212d43ac
3
  size 721687499
{checkpoint-14200 → checkpoint-35500}/preprocessor_config.json RENAMED
File without changes
{checkpoint-14200 → checkpoint-35500}/pytorch_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:42abb36894ab0c8cab607935ed11d784d3438a7ab977686063829b782e67afcd
3
  size 377674359
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f6a91c0cd3efa0326503b4148695da414af93512af37092a4f75e483f5b7886
3
  size 377674359
{checkpoint-14200 → checkpoint-35500}/rng_state.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8d0e532f7f8aafb8358fc8c962ab3116e2e93c6dbacd1785aa3b1c62966926f7
3
  size 14773
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c57cd849ea7c0f7c68a597c364a643221c2bec00262fd4d7f58e148e5f4e191b
3
  size 14773
{checkpoint-14200 → checkpoint-35500}/scaler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:de7d045249d5724b67b8237e4c292dc20eae96b999609b191a9cc3b3493b6fdc
3
  size 1383
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16be25ec3156a8306d0d1d2d1e342085ac407c8f872a2b9638fdc2d2263d1aa3
3
  size 1383
{checkpoint-14200 → checkpoint-35500}/scheduler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f628a48d936785b81b4fa83f7bcc43980103ec1541eb8b56944a0b68929cb007
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e397eca0724de78a0bcb22ea0120cbc2c4e2e3481857c7f086bf94efbedf9e94
3
  size 1465
{checkpoint-14200 → checkpoint-35500}/trainer_state.json RENAMED
@@ -1,8 +1,8 @@
1
  {
2
- "best_metric": 0.7418085932731628,
3
- "best_model_checkpoint": "JuanPajero/FT-S3/checkpoint-14200",
4
- "epoch": 1.9749652294853965,
5
- "global_step": 14200,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -36,11 +36,56 @@
36
  "eval_steps_per_second": 2.061,
37
  "eval_wer": 0.31068540368553627,
38
  "step": 14200
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
39
  }
40
  ],
41
  "max_steps": 71900,
42
  "num_train_epochs": 10,
43
- "total_flos": 1.698176517880873e+19,
44
  "trial_name": null,
45
  "trial_params": null
46
  }
 
1
  {
2
+ "best_metric": 0.6885841488838196,
3
+ "best_model_checkpoint": "JuanPajero/FT-S3/checkpoint-21300",
4
+ "epoch": 4.937413073713491,
5
+ "global_step": 35500,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
36
  "eval_steps_per_second": 2.061,
37
  "eval_wer": 0.31068540368553627,
38
  "step": 14200
39
+ },
40
+ {
41
+ "epoch": 2.96,
42
+ "learning_rate": 2.3462679647658787e-05,
43
+ "loss": 0.338,
44
+ "step": 21300
45
+ },
46
+ {
47
+ "epoch": 2.96,
48
+ "eval_loss": 0.6885841488838196,
49
+ "eval_runtime": 1207.7134,
50
+ "eval_samples_per_second": 16.501,
51
+ "eval_steps_per_second": 2.063,
52
+ "eval_wer": 0.2933106599088304,
53
+ "step": 21300
54
+ },
55
+ {
56
+ "epoch": 3.95,
57
+ "learning_rate": 2.0172461752433936e-05,
58
+ "loss": 0.3011,
59
+ "step": 28400
60
+ },
61
+ {
62
+ "epoch": 3.95,
63
+ "eval_loss": 0.7342329621315002,
64
+ "eval_runtime": 1203.3539,
65
+ "eval_samples_per_second": 16.56,
66
+ "eval_steps_per_second": 2.07,
67
+ "eval_wer": 0.28296994666476305,
68
+ "step": 28400
69
+ },
70
+ {
71
+ "epoch": 4.94,
72
+ "learning_rate": 1.688270746407047e-05,
73
+ "loss": 0.2763,
74
+ "step": 35500
75
+ },
76
+ {
77
+ "epoch": 4.94,
78
+ "eval_loss": 0.7109239101409912,
79
+ "eval_runtime": 1205.3003,
80
+ "eval_samples_per_second": 16.534,
81
+ "eval_steps_per_second": 2.067,
82
+ "eval_wer": 0.2757370562620463,
83
+ "step": 35500
84
  }
85
  ],
86
  "max_steps": 71900,
87
  "num_train_epochs": 10,
88
+ "total_flos": 4.242114943584952e+19,
89
  "trial_name": null,
90
  "trial_params": null
91
  }
{checkpoint-14200 → checkpoint-35500}/training_args.bin RENAMED
File without changes
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5a9608394bdcbf0f5b6c30c64691a84b8aa61151e60c5849c2c39dc3128b168d
3
  size 377674359
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f6a91c0cd3efa0326503b4148695da414af93512af37092a4f75e483f5b7886
3
  size 377674359
runs/Mar22_03-10-48_48c38934e4d2/events.out.tfevents.1774154952.48c38934e4d2.13068.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:66ec37a4899ba64e5520e6862312ea9adf26cd5878c47eb021d3b2742ecc3ca9
3
- size 6976
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ea1f4ca7c8ae4baa6f5c6635fafb4d811b283af4126a373e662e5eeb816106d
3
+ size 7460