avsolatorio commited on
Commit
6457180
·
verified ·
1 Parent(s): 307adce

Training in progress, step 31000, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:200b998b368c5e03deb5a46079d27bd6bfeb127cb7478a1f826abe16e3859b87
3
  size 567860028
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bacf8a7eab59fb1966c2948f6183a87b1e12612562c43e3e00be0845f7dfd3a9
3
  size 567860028
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b2ec8cdc4580a142ebac5e5b13f36ee4b4ac51a3bdadfa8fdc82d2d89d48533a
3
  size 1135783354
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84b2fd565ca572922065d0ca702f1af7af2ba8bef22f6dac651b24a5e385367d
3
  size 1135783354
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1a536d8021983dc8ddd5749b3c7268784df09edd584c2a4cefb49b35a14b723b
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d68ccaff5a373330ed15f4450e2f0f4e7ec0f2a426a61b0b530e080dd32f44ed
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a4172e62d60e6611e586aefafe5c3cb9d66704232378d7f9895f5ee27089afad
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4e103e890947dce8b5cc8f45d5f7726e35dcc2af236d3ec8833bd262720ccd6
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 0.029792238026857376,
3
  "best_model_checkpoint": "doc-topic-model/checkpoint-29000",
4
- "epoch": 3.698680803846628,
5
  "eval_steps": 1000,
6
- "global_step": 30000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -787,6 +787,32 @@
787
  "eval_samples_per_second": 304.981,
788
  "eval_steps_per_second": 19.064,
789
  "step": 30000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
790
  }
791
  ],
792
  "logging_steps": 500,
@@ -794,7 +820,7 @@
794
  "num_input_tokens_seen": 0,
795
  "num_train_epochs": 10,
796
  "save_steps": 1000,
797
- "total_flos": 678379953845124.0,
798
  "train_batch_size": 4,
799
  "trial_name": null,
800
  "trial_params": null
 
1
  {
2
  "best_metric": 0.029792238026857376,
3
  "best_model_checkpoint": "doc-topic-model/checkpoint-29000",
4
+ "epoch": 3.821970163974849,
5
  "eval_steps": 1000,
6
+ "global_step": 31000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
787
  "eval_samples_per_second": 304.981,
788
  "eval_steps_per_second": 19.064,
789
  "step": 30000
790
+ },
791
+ {
792
+ "epoch": 3.7603254839107385,
793
+ "grad_norm": 0.4146226942539215,
794
+ "learning_rate": 1.2479349032178524e-05,
795
+ "loss": 0.0266,
796
+ "step": 30500
797
+ },
798
+ {
799
+ "epoch": 3.821970163974849,
800
+ "grad_norm": 0.2495744824409485,
801
+ "learning_rate": 1.2356059672050302e-05,
802
+ "loss": 0.0265,
803
+ "step": 31000
804
+ },
805
+ {
806
+ "epoch": 3.821970163974849,
807
+ "eval_accuracy": 0.9894934791265445,
808
+ "eval_f1": 0.6934843724160741,
809
+ "eval_loss": 0.029959995299577713,
810
+ "eval_precision": 0.7549734449545413,
811
+ "eval_recall": 0.6412569768330912,
812
+ "eval_runtime": 26.4331,
813
+ "eval_samples_per_second": 306.851,
814
+ "eval_steps_per_second": 19.181,
815
+ "step": 31000
816
  }
817
  ],
818
  "logging_steps": 500,
 
820
  "num_input_tokens_seen": 0,
821
  "num_train_epochs": 10,
822
  "save_steps": 1000,
823
+ "total_flos": 700958189659932.0,
824
  "train_batch_size": 4,
825
  "trial_name": null,
826
  "trial_params": null