JuanPajero committed on
Commit
93d1a11
·
1 Parent(s): 493b16c

Training in progress, step 43000

Browse files
{checkpoint-30100 → checkpoint-43000}/config.json RENAMED
File without changes
{checkpoint-30100 → checkpoint-43000}/optimizer.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c956b5ebeccdcc8eb7aabec2de6bf5bcdf7e13cfcdcc404131ef3e4af2f76764
3
  size 721687499
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ab1ea33e31fa79511e2828661e615665e8119d6b08b3344acd7a6298bca92dc
3
  size 721687499
{checkpoint-30100 → checkpoint-43000}/preprocessor_config.json RENAMED
File without changes
{checkpoint-30100 → checkpoint-43000}/pytorch_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:19a5d9e631fa62a90d244323ae9258b128911e1b9a59139980580a00bc2c313d
3
  size 377674359
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0522901a72f42c1cbe4064a0b4cac893454b3e5a98c7b6624bf11995f15f64a6
3
  size 377674359
{checkpoint-30100 → checkpoint-43000}/rng_state.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9311228ae07085e09913d5be0ef13bb46a49229b63f77cbf5a2a742d03fea583
3
  size 14709
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6042a492bab1444a3137e5dd722e1d9a760a16689e6defdb8d7bc2fab1cbb6f9
3
  size 14709
{checkpoint-30100 → checkpoint-43000}/scaler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5dee27a953c9a7d685c66de0c98f7e94774836a29efb4775360b44b9cb5985a5
3
  size 1383
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb1e36e6665723682d58b1ff4037a292ddf664550aa7b0545651d6553b02ba4d
3
  size 1383
{checkpoint-30100 → checkpoint-43000}/scheduler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6e1d2295b0dfcf799bf93fee828447c5377feb43c85055c9e1f533a2b35b5491
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:11b014559d4b378af9357e0d0b25cb5344a6aab44ca7e0910108285f179c75eb
3
  size 1465
{checkpoint-30100 → checkpoint-43000}/trainer_state.json RENAMED
@@ -1,8 +1,8 @@
1
  {
2
- "best_metric": 0.6688737869262695,
3
- "best_model_checkpoint": "JuanPajero/FT-S2/checkpoint-25800",
4
- "epoch": 2.0931849791376913,
5
- "global_step": 30100,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -111,11 +111,56 @@
111
  "eval_steps_per_second": 2.068,
112
  "eval_wer": 0.28621799120937397,
113
  "step": 30100
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
114
  }
115
  ],
116
  "max_steps": 43140,
117
  "num_train_epochs": 3,
118
- "total_flos": 1.7919431464611226e+19,
119
  "trial_name": null,
120
  "trial_params": null
121
  }
 
1
  {
2
+ "best_metric": 0.6614052653312683,
3
+ "best_model_checkpoint": "JuanPajero/FT-S2/checkpoint-34400",
4
+ "epoch": 2.9902642559109873,
5
+ "global_step": 43000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
111
  "eval_steps_per_second": 2.068,
112
  "eval_wer": 0.28621799120937397,
113
  "step": 30100
114
+ },
115
+ {
116
+ "epoch": 2.39,
117
+ "learning_rate": 6.7663421418637e-06,
118
+ "loss": 0.3111,
119
+ "step": 34400
120
+ },
121
+ {
122
+ "epoch": 2.39,
123
+ "eval_loss": 0.6614052653312683,
124
+ "eval_runtime": 1208.4999,
125
+ "eval_samples_per_second": 16.49,
126
+ "eval_steps_per_second": 2.061,
127
+ "eval_wer": 0.2852058454603861,
128
+ "step": 34400
129
+ },
130
+ {
131
+ "epoch": 2.69,
132
+ "learning_rate": 3.4445989800649053e-06,
133
+ "loss": 0.3032,
134
+ "step": 38700
135
+ },
136
+ {
137
+ "epoch": 2.69,
138
+ "eval_loss": 0.6847738027572632,
139
+ "eval_runtime": 1209.9287,
140
+ "eval_samples_per_second": 16.47,
141
+ "eval_steps_per_second": 2.059,
142
+ "eval_wer": 0.2815039924943146,
143
+ "step": 38700
144
+ },
145
+ {
146
+ "epoch": 2.99,
147
+ "learning_rate": 1.236284963684129e-07,
148
+ "loss": 0.2973,
149
+ "step": 43000
150
+ },
151
+ {
152
+ "epoch": 2.99,
153
+ "eval_loss": 0.6681790351867676,
154
+ "eval_runtime": 1206.5281,
155
+ "eval_samples_per_second": 16.517,
156
+ "eval_steps_per_second": 2.065,
157
+ "eval_wer": 0.2794975473949357,
158
+ "step": 43000
159
  }
160
  ],
161
  "max_steps": 43140,
162
  "num_train_epochs": 3,
163
+ "total_flos": 2.5595238773759386e+19,
164
  "trial_name": null,
165
  "trial_params": null
166
  }
{checkpoint-30100 → checkpoint-43000}/training_args.bin RENAMED
File without changes
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4012135ba862caeb93a93145c915ff1ff9a7e904c9feb913c8ff0ca300450ade
3
  size 377674359
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0522901a72f42c1cbe4064a0b4cac893454b3e5a98c7b6624bf11995f15f64a6
3
  size 377674359
runs/Mar14_07-22-31_4c0520d7b0b9/events.out.tfevents.1773478987.4c0520d7b0b9.11056.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6294feffe8604e20cccd25f5dddb4da456a874959bfa15f3fda9a87fa52e27a1
3
- size 9386
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7a71cd818349e825d0fa83661b313419a1ee613e393f1899c4077591abc91586
3
+ size 9870