yueqis committed on
Commit
25556fa
·
verified ·
1 Parent(s): fcf3936

Upload trainer_state.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. trainer_state.json +73 -3
trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 2.3822651045256147,
6
  "eval_steps": 500,
7
- "global_step": 650,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -463,6 +463,76 @@
463
  "learning_rate": 5.5130235322263634e-06,
464
  "loss": 0.4155,
465
  "step": 650
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
466
  }
467
  ],
468
  "logging_steps": 10,
@@ -482,7 +552,7 @@
482
  "attributes": {}
483
  }
484
  },
485
- "total_flos": 2.163261743877325e+16,
486
  "train_batch_size": 1,
487
  "trial_name": null,
488
  "trial_params": null
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 2.749827705031013,
6
  "eval_steps": 500,
7
+ "global_step": 750,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
463
  "learning_rate": 5.5130235322263634e-06,
464
  "loss": 0.4155,
465
  "step": 650
466
+ },
467
+ {
468
+ "epoch": 2.4190213645761545,
469
+ "grad_norm": 0.40967750549316406,
470
+ "learning_rate": 4.894372840954112e-06,
471
+ "loss": 0.433,
472
+ "step": 660
473
+ },
474
+ {
475
+ "epoch": 2.4557776246266942,
476
+ "grad_norm": 0.3949553370475769,
477
+ "learning_rate": 4.3087556423111186e-06,
478
+ "loss": 0.4262,
479
+ "step": 670
480
+ },
481
+ {
482
+ "epoch": 2.492533884677234,
483
+ "grad_norm": 0.3676910698413849,
484
+ "learning_rate": 3.757134103817053e-06,
485
+ "loss": 0.4306,
486
+ "step": 680
487
+ },
488
+ {
489
+ "epoch": 2.529290144727774,
490
+ "grad_norm": 0.4114847481250763,
491
+ "learning_rate": 3.2404145382112254e-06,
492
+ "loss": 0.4351,
493
+ "step": 690
494
+ },
495
+ {
496
+ "epoch": 2.566046404778314,
497
+ "grad_norm": 0.38977691531181335,
498
+ "learning_rate": 2.759445914383135e-06,
499
+ "loss": 0.4293,
500
+ "step": 700
501
+ },
502
+ {
503
+ "epoch": 2.602802664828854,
504
+ "grad_norm": 0.39468637108802795,
505
+ "learning_rate": 2.315018462518803e-06,
506
+ "loss": 0.422,
507
+ "step": 710
508
+ },
509
+ {
510
+ "epoch": 2.6395589248793936,
511
+ "grad_norm": 0.3883320093154907,
512
+ "learning_rate": 1.9078623757546767e-06,
513
+ "loss": 0.418,
514
+ "step": 720
515
+ },
516
+ {
517
+ "epoch": 2.6763151849299334,
518
+ "grad_norm": 0.4122566878795624,
519
+ "learning_rate": 1.5386466104722053e-06,
520
+ "loss": 0.4268,
521
+ "step": 730
522
+ },
523
+ {
524
+ "epoch": 2.713071444980473,
525
+ "grad_norm": 0.40187907218933105,
526
+ "learning_rate": 1.2079777872042592e-06,
527
+ "loss": 0.4256,
528
+ "step": 740
529
+ },
530
+ {
531
+ "epoch": 2.749827705031013,
532
+ "grad_norm": 0.3951718211174011,
533
+ "learning_rate": 9.163991939592081e-07,
534
+ "loss": 0.4315,
535
+ "step": 750
536
  }
537
  ],
538
  "logging_steps": 10,
 
552
  "attributes": {}
553
  }
554
  },
555
+ "total_flos": 2.496191032773837e+16,
556
  "train_batch_size": 1,
557
  "trial_name": null,
558
  "trial_params": null