baby-dev commited on
Commit
d35df0b
·
verified ·
1 Parent(s): 2e417e4

Training in progress, step 3600, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7564ca0da7a36af4a49e6efe1b662d7b48552179d9139c4a0001f28fb52be0f7
3
  size 48552
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5cbdc2b9825166869a6fac2e63a5a97fa4b37b5b84f026246356242c3f1b4f3c
3
  size 48552
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0df3d50fec9eb8da6ca5775a03ebf1ccb07ed80efaff1d783e7ae0d06f549730
3
  size 107046
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f3ccbbe76b5289cfdf27cae32ff8667d16da79bd900a109b903abe92fb00891a
3
  size 107046
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:96f94a9e66b44ef92a231133a85ce908f6da4522f199e6c8f8ae6ace2cb26f13
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aebc4da58173c003f7aad6d162278501a1be585d313d2d5f53369f2e219408a6
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3e1024000b4f413660ff937a139f75de92e5c98f66c23ae365cd7ddd5af918b5
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0afe5275623b07807c5bf749b62f86b7a1ab63345ab37a5eef17970d4cb1036
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 11.898159980773926,
3
  "best_model_checkpoint": "miner_id_24/checkpoint-3450",
4
- "epoch": 28.69022869022869,
5
  "eval_steps": 150,
6
- "global_step": 3450,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -682,6 +682,35 @@
682
  "eval_samples_per_second": 225.536,
683
  "eval_steps_per_second": 57.49,
684
  "step": 3450
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
685
  }
686
  ],
687
  "logging_steps": 50,
@@ -696,7 +725,7 @@
696
  "early_stopping_threshold": 0.0
697
  },
698
  "attributes": {
699
- "early_stopping_patience_counter": 0
700
  }
701
  },
702
  "TrainerControl": {
@@ -710,7 +739,7 @@
710
  "attributes": {}
711
  }
712
  },
713
- "total_flos": 4491195580416.0,
714
  "train_batch_size": 4,
715
  "trial_name": null,
716
  "trial_params": null
 
1
  {
2
  "best_metric": 11.898159980773926,
3
  "best_model_checkpoint": "miner_id_24/checkpoint-3450",
4
+ "epoch": 29.93762993762994,
5
  "eval_steps": 150,
6
+ "global_step": 3600,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
682
  "eval_samples_per_second": 225.536,
683
  "eval_steps_per_second": 57.49,
684
  "step": 3450
685
+ },
686
+ {
687
+ "epoch": 29.106029106029105,
688
+ "grad_norm": 0.05766765773296356,
689
+ "learning_rate": 4.2084942084942086e-05,
690
+ "loss": 12.0737,
691
+ "step": 3500
692
+ },
693
+ {
694
+ "epoch": 29.52182952182952,
695
+ "grad_norm": 0.046123795211315155,
696
+ "learning_rate": 4.124559341950647e-05,
697
+ "loss": 11.9,
698
+ "step": 3550
699
+ },
700
+ {
701
+ "epoch": 29.93762993762994,
702
+ "grad_norm": 0.09343673288822174,
703
+ "learning_rate": 4.0406244754070844e-05,
704
+ "loss": 11.901,
705
+ "step": 3600
706
+ },
707
+ {
708
+ "epoch": 29.93762993762994,
709
+ "eval_loss": 11.898192405700684,
710
+ "eval_runtime": 0.4526,
711
+ "eval_samples_per_second": 225.366,
712
+ "eval_steps_per_second": 57.446,
713
+ "step": 3600
714
  }
715
  ],
716
  "logging_steps": 50,
 
725
  "early_stopping_threshold": 0.0
726
  },
727
  "attributes": {
728
+ "early_stopping_patience_counter": 1
729
  }
730
  },
731
  "TrainerControl": {
 
739
  "attributes": {}
740
  }
741
  },
742
+ "total_flos": 4686500364288.0,
743
  "train_batch_size": 4,
744
  "trial_name": null,
745
  "trial_params": null