JuanPajero committed on
Commit
5f95b96
·
1 Parent(s): 90f5ea7

Training in progress, step 2000

Browse files
{checkpoint-500 → checkpoint-2000}/config.json RENAMED
File without changes
{checkpoint-500 → checkpoint-2000}/optimizer.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:02f346f697add59272a426dce5e971f3c0d785fcbf7f1d2008a23228575d87e9
3
  size 721687499
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64d22661dcba3d0cb6d911b4bd416db42117c6811d3cf45df55a7e83a9134508
3
  size 721687499
{checkpoint-500 → checkpoint-2000}/preprocessor_config.json RENAMED
File without changes
{checkpoint-500 → checkpoint-2000}/pytorch_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:34a2fa3614bce2d2ba6860a335316bd068455f93b1e0a7d7563bfa18391e4a4d
3
  size 377674359
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a292bb26d6fc95282e7803a4a5b79608fdb1b8c7e82347ddc648c085b668783f
3
  size 377674359
{checkpoint-500 → checkpoint-2000}/rng_state.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2dca4940646957043faa2ac0bde35b4a38d9810301fb798c9a41ff0123da17c4
3
  size 14709
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98686e7580d7add044a34553ef0317cad35ddac85e33e65313c14e5e9b3231ea
3
  size 14709
{checkpoint-500 → checkpoint-2000}/scaler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f5f88bc9b6a2d5d66f9e5683c4038944de51affd26b803ee8d3db49f106fa587
3
  size 1383
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:50786c05f475ef653b53ebc3a6daee74f887308e526f335b68aa5669a6ae4442
3
  size 1383
{checkpoint-500 → checkpoint-2000}/scheduler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c6104403a3f016695b27d773ae378dc0511e7853c40dcd465e4333854ec96039
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d1c7208a78c4eead1aea111474a41ee9bbf256971f80fae940dad9bf17894d12
3
  size 1465
{checkpoint-500 → checkpoint-2000}/trainer_state.json RENAMED
@@ -1,8 +1,8 @@
1
  {
2
- "best_metric": 3.0022623538970947,
3
- "best_model_checkpoint": "JuanPajero/FT-XS2/checkpoint-500",
4
- "epoch": 1.7006802721088436,
5
- "global_step": 500,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -21,11 +21,56 @@
21
  "eval_steps_per_second": 1.726,
22
  "eval_wer": 0.9992262457443516,
23
  "step": 500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
24
  }
25
  ],
26
  "max_steps": 2940,
27
  "num_train_epochs": 10,
28
- "total_flos": 5.99032552253184e+17,
29
  "trial_name": null,
30
  "trial_params": null
31
  }
 
1
  {
2
+ "best_metric": 1.0205419063568115,
3
+ "best_model_checkpoint": "JuanPajero/FT-XS2/checkpoint-1500",
4
+ "epoch": 6.802721088435375,
5
+ "global_step": 2000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
21
  "eval_steps_per_second": 1.726,
22
  "eval_wer": 0.9992262457443516,
23
  "step": 500
24
+ },
25
+ {
26
+ "epoch": 3.4,
27
+ "learning_rate": 2.2029478458049888e-05,
28
+ "loss": 1.3402,
29
+ "step": 1000
30
+ },
31
+ {
32
+ "epoch": 3.4,
33
+ "eval_loss": 1.416143536567688,
34
+ "eval_runtime": 407.671,
35
+ "eval_samples_per_second": 14.019,
36
+ "eval_steps_per_second": 1.754,
37
+ "eval_wer": 0.6038765088207985,
38
+ "step": 1000
39
+ },
40
+ {
41
+ "epoch": 5.1,
42
+ "learning_rate": 1.6360544217687075e-05,
43
+ "loss": 0.7515,
44
+ "step": 1500
45
+ },
46
+ {
47
+ "epoch": 5.1,
48
+ "eval_loss": 1.0205419063568115,
49
+ "eval_runtime": 410.6786,
50
+ "eval_samples_per_second": 13.916,
51
+ "eval_steps_per_second": 1.741,
52
+ "eval_wer": 0.4986459300526153,
53
+ "step": 1500
54
+ },
55
+ {
56
+ "epoch": 6.8,
57
+ "learning_rate": 1.0691609977324262e-05,
58
+ "loss": 0.6136,
59
+ "step": 2000
60
+ },
61
+ {
62
+ "epoch": 6.8,
63
+ "eval_loss": 1.0564398765563965,
64
+ "eval_runtime": 410.9183,
65
+ "eval_samples_per_second": 13.908,
66
+ "eval_steps_per_second": 1.74,
67
+ "eval_wer": 0.4804704425874342,
68
+ "step": 2000
69
  }
70
  ],
71
  "max_steps": 2940,
72
  "num_train_epochs": 10,
73
+ "total_flos": 2.357760234513715e+18,
74
  "trial_name": null,
75
  "trial_params": null
76
  }
{checkpoint-500 → checkpoint-2000}/training_args.bin RENAMED
File without changes
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b21bffe301d799a2b0ec0af49471d25bb9cfa5b8036a4db306ef6161b20f6610
3
  size 377674359
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a292bb26d6fc95282e7803a4a5b79608fdb1b8c7e82347ddc648c085b668783f
3
  size 377674359
runs/Mar29_09-49-04_9cd49a3ed4d1/events.out.tfevents.1774778031.9cd49a3ed4d1.24900.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:23983735746f59a38ca1030003ef1a6b22947645ba39cfc0706ce3fff4d0e462
3
- size 6484
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dab4dc11c82ddefba06bbd00f5a28f8cfa50916188b54c369f7a30257486fc3d
3
+ size 6959