JuanPajero committed on
Commit
76d7629
·
1 Parent(s): ae6f401

Training in progress, step 28400

Browse files
{checkpoint-7100 → checkpoint-28400}/config.json RENAMED
File without changes
{checkpoint-7100 → checkpoint-28400}/optimizer.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b9e3c8e53522ceb0dab7bfa04ca1d8478e8ce00311f5a408b38d943600bb76fb
3
  size 721687499
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4aa56be871c5206478c15a1d4d20ee9d027809061cffaf15d4910642d49724b
3
  size 721687499
{checkpoint-7100 → checkpoint-28400}/preprocessor_config.json RENAMED
File without changes
{checkpoint-7100 → checkpoint-28400}/pytorch_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8f5b2fb64505601bbed74a3260fda2f3e509b40bf0a69fdccb2f63346a20d960
3
  size 377674359
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a9608394bdcbf0f5b6c30c64691a84b8aa61151e60c5849c2c39dc3128b168d
3
  size 377674359
{checkpoint-7100 → checkpoint-28400}/rng_state.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c41a1ebd8b69ee58ba79eb31ba4a5258c2407cc41cc3bd033d7c4381bdef2897
3
  size 14709
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:528f3da69cf01134cb223099a8072801c6bd1c0558813b8f85e2472e450e4b63
3
  size 14709
{checkpoint-7100 → checkpoint-28400}/scaler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c59431fcea85bbf5c8e94303864a3537df25105e3d9b79bbbdc9979354028d92
3
  size 1383
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3b3334ad0870e3c545571c84d2b7e962a8c290fac16c9609e7eb7b5e2257a26
3
  size 1383
{checkpoint-7100 → checkpoint-28400}/scheduler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ad0a011f8cbe47e1fff8ce6ce943f0e0fd519124f63356e578c30d81f0223ece
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca0ccae7fbd380fabad16a8ed1659fdef32b741c4d2c23c48f43d244a5cd57bf
3
  size 1465
{checkpoint-7100 → checkpoint-28400}/trainer_state.json RENAMED
@@ -1,8 +1,8 @@
1
  {
2
- "best_metric": 0.8227799534797668,
3
- "best_model_checkpoint": "JuanPajero/FT-S3/checkpoint-7100",
4
- "epoch": 0.9874826147426982,
5
- "global_step": 7100,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -21,11 +21,56 @@
21
  "eval_steps_per_second": 2.076,
22
  "eval_wer": 0.3727602769761062,
23
  "step": 7100
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
24
  }
25
  ],
26
  "max_steps": 71900,
27
  "num_train_epochs": 10,
28
- "total_flos": 8.479506458433946e+18,
29
  "trial_name": null,
30
  "trial_params": null
31
  }
 
1
  {
2
+ "best_metric": 0.6885841488838196,
3
+ "best_model_checkpoint": "JuanPajero/FT-S3/checkpoint-21300",
4
+ "epoch": 3.9499304589707926,
5
+ "global_step": 28400,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
21
  "eval_steps_per_second": 2.076,
22
  "eval_wer": 0.3727602769761062,
23
  "step": 7100
24
+ },
25
+ {
26
+ "epoch": 1.97,
27
+ "learning_rate": 2.6753361149745017e-05,
28
+ "loss": 0.4098,
29
+ "step": 14200
30
+ },
31
+ {
32
+ "epoch": 1.97,
33
+ "eval_loss": 0.7418085932731628,
34
+ "eval_runtime": 1208.9139,
35
+ "eval_samples_per_second": 16.484,
36
+ "eval_steps_per_second": 2.061,
37
+ "eval_wer": 0.31068540368553627,
38
+ "step": 14200
39
+ },
40
+ {
41
+ "epoch": 2.96,
42
+ "learning_rate": 2.3462679647658787e-05,
43
+ "loss": 0.338,
44
+ "step": 21300
45
+ },
46
+ {
47
+ "epoch": 2.96,
48
+ "eval_loss": 0.6885841488838196,
49
+ "eval_runtime": 1207.7134,
50
+ "eval_samples_per_second": 16.501,
51
+ "eval_steps_per_second": 2.063,
52
+ "eval_wer": 0.2933106599088304,
53
+ "step": 21300
54
+ },
55
+ {
56
+ "epoch": 3.95,
57
+ "learning_rate": 2.0172461752433936e-05,
58
+ "loss": 0.3011,
59
+ "step": 28400
60
+ },
61
+ {
62
+ "epoch": 3.95,
63
+ "eval_loss": 0.7342329621315002,
64
+ "eval_runtime": 1203.3539,
65
+ "eval_samples_per_second": 16.56,
66
+ "eval_steps_per_second": 2.07,
67
+ "eval_wer": 0.28296994666476305,
68
+ "step": 28400
69
  }
70
  ],
71
  "max_steps": 71900,
72
  "num_train_epochs": 10,
73
+ "total_flos": 3.3951659801377997e+19,
74
  "trial_name": null,
75
  "trial_params": null
76
  }
{checkpoint-7100 → checkpoint-28400}/training_args.bin RENAMED
File without changes
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e240587e9e5d2eba0f7bd4cc9e60e8ab8fecd3cf3157b072914c7eb3ea6d0fcf
3
  size 377674359
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a9608394bdcbf0f5b6c30c64691a84b8aa61151e60c5849c2c39dc3128b168d
3
  size 377674359
runs/Mar22_03-10-48_48c38934e4d2/events.out.tfevents.1774154952.48c38934e4d2.13068.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:288880fa3c716a6fffcc1208ecf7a9dc30076c05b3fb5309b8e12574fbd9090f
3
- size 6492
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66ec37a4899ba64e5520e6862312ea9adf26cd5878c47eb021d3b2742ecc3ca9
3
+ size 6976