hypaai commited on
Commit
fcdc53c
·
verified ·
1 Parent(s): 40e0b3a

Training in progress, step 1343

Browse files
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:648bf4d6f8205604f2c379a74384e514d7f2533dd82c411f4ffdee9089dd6805
3
  size 187673752
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:58a235f577ae951c5e41a12ab4c71ecf6f8ff9821412f5343182aec8704e4c6f
3
  size 187673752
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:648bf4d6f8205604f2c379a74384e514d7f2533dd82c411f4ffdee9089dd6805
3
  size 187673752
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a51eecea612921a6892b36f9e2fcc3227e5628e806fc19d387ce2fe411c6e31
3
  size 187673752
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0ebb85871c6b082b1647229471377e7b5105a2a487b4d45f2d3da63c8cc636ad
3
  size 14921099
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:412b801a2500e3aa534b612e94d6dc16d9f6a36cf9ac9739de58b5ec90974d6d
3
  size 14921099
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:89feea09a6f1ed288a67c1a57e2fb79641d0f921fce49294468baca12e30898e
3
  size 14645
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e65f55bd28c553c15e73931a90cf38e36a32b6d9c47c087efaedd446d7a2964
3
  size 14645
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:317914e1b0b7e57d42f0fa6759aa19d9a30f1d604cc5192b2404476b6f3f4a62
3
  size 1383
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:849fbe2f82a426b1b4997bc0878657e98737a4dd461d8a5a40a85e49101baa28
3
  size 1383
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fd751fe8073c015fdc1ec3ce0bf61f0e1eacae42b35b7bf9f0f55f3d6c99fcf2
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3bb987046d6617ffac50447cbd191330d5f9f74750af09bfa65367796337436b
3
  size 1465
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 9.02680565897245,
6
  "eval_steps": 50,
7
- "global_step": 1300,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -280,150 +280,6 @@
280
  "eval_steps_per_second": 10.897,
281
  "eval_wer": 16.452007692755988,
282
  "step": 850
283
- },
284
- {
285
- "epoch": 1.0029784065524945,
286
- "grad_norm": 0.48208168148994446,
287
- "learning_rate": 3.3183856502242154e-05,
288
- "loss": 1.1043916320800782,
289
- "step": 900
290
- },
291
- {
292
- "epoch": 1.0029784065524945,
293
- "eval_loss": 0.3950841724872589,
294
- "eval_runtime": 156.2906,
295
- "eval_samples_per_second": 11.114,
296
- "eval_steps_per_second": 11.114,
297
- "eval_wer": 16.1081648114692,
298
- "step": 900
299
- },
300
- {
301
- "epoch": 2.005956813104989,
302
- "grad_norm": 0.4363427460193634,
303
- "learning_rate": 2.944693572496263e-05,
304
- "loss": 1.002419662475586,
305
- "step": 950
306
- },
307
- {
308
- "epoch": 2.005956813104989,
309
- "eval_loss": 0.3973139822483063,
310
- "eval_runtime": 150.5158,
311
- "eval_samples_per_second": 11.54,
312
- "eval_steps_per_second": 11.54,
313
- "eval_wer": 16.16644326592459,
314
- "step": 950
315
- },
316
- {
317
- "epoch": 3.0089352196574835,
318
- "grad_norm": 0.4448009133338928,
319
- "learning_rate": 2.571001494768311e-05,
320
- "loss": 0.9439057159423828,
321
- "step": 1000
322
- },
323
- {
324
- "epoch": 3.0089352196574835,
325
- "eval_loss": 0.4021342992782593,
326
- "eval_runtime": 151.2965,
327
- "eval_samples_per_second": 11.481,
328
- "eval_steps_per_second": 11.481,
329
- "eval_wer": 16.236377411271054,
330
- "step": 1000
331
- },
332
- {
333
- "epoch": 4.011913626209978,
334
- "grad_norm": 0.32352492213249207,
335
- "learning_rate": 2.197309417040359e-05,
336
- "loss": 0.9013279724121094,
337
- "step": 1050
338
- },
339
- {
340
- "epoch": 4.011913626209978,
341
- "eval_loss": 0.4091801941394806,
342
- "eval_runtime": 149.3668,
343
- "eval_samples_per_second": 11.629,
344
- "eval_steps_per_second": 11.629,
345
- "eval_wer": 16.20141033859782,
346
- "step": 1050
347
- },
348
- {
349
- "epoch": 5.014892032762472,
350
- "grad_norm": 0.29706525802612305,
351
- "learning_rate": 1.8236173393124067e-05,
352
- "loss": 0.8674221801757812,
353
- "step": 1100
354
- },
355
- {
356
- "epoch": 5.014892032762472,
357
- "eval_loss": 0.40518996119499207,
358
- "eval_runtime": 157.4047,
359
- "eval_samples_per_second": 11.035,
360
- "eval_steps_per_second": 11.035,
361
- "eval_wer": 16.271344483944286,
362
- "step": 1100
363
- },
364
- {
365
- "epoch": 6.017870439314967,
366
- "grad_norm": 0.36136195063591003,
367
- "learning_rate": 1.4499252615844544e-05,
368
- "loss": 0.842430648803711,
369
- "step": 1150
370
- },
371
- {
372
- "epoch": 6.017870439314967,
373
- "eval_loss": 0.40126579999923706,
374
- "eval_runtime": 154.0519,
375
- "eval_samples_per_second": 11.275,
376
- "eval_steps_per_second": 11.275,
377
- "eval_wer": 16.259688793053208,
378
- "step": 1150
379
- },
380
- {
381
- "epoch": 7.0208488458674605,
382
- "grad_norm": 0.40088629722595215,
383
- "learning_rate": 1.0762331838565023e-05,
384
- "loss": 0.8319394683837891,
385
- "step": 1200
386
- },
387
- {
388
- "epoch": 7.0208488458674605,
389
- "eval_loss": 0.39827466011047363,
390
- "eval_runtime": 157.3801,
391
- "eval_samples_per_second": 11.037,
392
- "eval_steps_per_second": 11.037,
393
- "eval_wer": 16.24803310216213,
394
- "step": 1200
395
- },
396
- {
397
- "epoch": 8.023827252419956,
398
- "grad_norm": 0.3946095108985901,
399
- "learning_rate": 7.025411061285502e-06,
400
- "loss": 0.834195785522461,
401
- "step": 1250
402
- },
403
- {
404
- "epoch": 8.023827252419956,
405
- "eval_loss": 0.3936406075954437,
406
- "eval_runtime": 154.2809,
407
- "eval_samples_per_second": 11.259,
408
- "eval_steps_per_second": 11.259,
409
- "eval_wer": 16.277172329389824,
410
- "step": 1250
411
- },
412
- {
413
- "epoch": 9.02680565897245,
414
- "grad_norm": 0.3853761553764343,
415
- "learning_rate": 3.2884902840059795e-06,
416
- "loss": 0.8308474731445312,
417
- "step": 1300
418
- },
419
- {
420
- "epoch": 9.02680565897245,
421
- "eval_loss": 0.3941210210323334,
422
- "eval_runtime": 154.465,
423
- "eval_samples_per_second": 11.245,
424
- "eval_steps_per_second": 11.245,
425
- "eval_wer": 16.323795092954136,
426
- "step": 1300
427
  }
428
  ],
429
  "logging_steps": 50,
@@ -443,7 +299,7 @@
443
  "attributes": {}
444
  }
445
  },
446
- "total_flos": 4.863411472785408e+19,
447
  "train_batch_size": 64,
448
  "trial_name": null,
449
  "trial_params": null
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.03723008190618019,
6
  "eval_steps": 50,
7
+ "global_step": 850,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
280
  "eval_steps_per_second": 10.897,
281
  "eval_wer": 16.452007692755988,
282
  "step": 850
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
283
  }
284
  ],
285
  "logging_steps": 50,
 
299
  "attributes": {}
300
  }
301
  },
302
+ "total_flos": 3.157242221887488e+19,
303
  "train_batch_size": 64,
304
  "trial_name": null,
305
  "trial_params": null
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f3ea77af43b1094f8223c24207bfa2d82d65643fa265a38412be3476877d8220
3
  size 5457
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c41c98e6d3ee70c478d1ea32d80592130dbc19c7448399d91812e9d8c8424f7
3
  size 5457
runs/Mar27_10-11-38_63249a1410af/events.out.tfevents.1774606298.63249a1410af.3168.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7aa7a7483266950bffe4d4d79e6e258a1b5009ddd6d1b78c1a2b3a75a6225e0d
3
- size 10047
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2fc22c1b8390b3408e68cd57be17aba48b050440f21a496b6450b47a8a72a8de
3
+ size 10401