baby-dev committed on
Commit
b580919
·
verified ·
1 Parent(s): b2571c2

Training in progress, epoch 3, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aa61242d59dde07b6e124c28e4f02961504a3d80a62d3744879f8d576710c5a1
3
  size 48552
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d253b566d126f3aba50addeec7b7eb765dcd73cb4b88bcfa0193f7cdfb91c3f5
3
  size 48552
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4bff118783a624c3d4494650098c048335a60deb649201045a57196051f28776
3
  size 107046
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3d7ca924fd1345c00abf75278e6b67d1da97a8585f9d4fe25064f0dcd089c7f
3
  size 107046
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f1f6811de7fd6719f9ba6d6a0209af7f4bc36fd4331e413781421b0ce2308264
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:adef08fda30a046b79221275438406fd995dd5a4dadb0a71a27682a7dcae8f3b
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e3ab4343fd37af80ff3b7a6d2bbb453cb34e903babf826a940b14f4bd54d6552
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:63ac0c876d99cedd1c7e14354171b8bdaaea7163f00b90c59253d9bf8b43e991
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 2.9937106918238996,
5
  "eval_steps": 500,
6
- "global_step": 357,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -80,6 +80,14 @@
80
  "eval_samples_per_second": 246.686,
81
  "eval_steps_per_second": 63.503,
82
  "step": 357
 
 
 
 
 
 
 
 
83
  }
84
  ],
85
  "logging_steps": 50,
@@ -94,12 +102,12 @@
94
  "should_evaluate": false,
95
  "should_log": false,
96
  "should_save": true,
97
- "should_training_stop": false
98
  },
99
  "attributes": {}
100
  }
101
  },
102
- "total_flos": 402378350592.0,
103
  "train_batch_size": 4,
104
  "trial_name": null,
105
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 3.0020964360587,
5
  "eval_steps": 500,
6
+ "global_step": 358,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
80
  "eval_samples_per_second": 246.686,
81
  "eval_steps_per_second": 63.503,
82
  "step": 357
83
+ },
84
+ {
85
+ "epoch": 3.0020964360587,
86
+ "eval_loss": 11.916298866271973,
87
+ "eval_runtime": 0.4304,
88
+ "eval_samples_per_second": 234.654,
89
+ "eval_steps_per_second": 60.406,
90
+ "step": 358
91
  }
92
  ],
93
  "logging_steps": 50,
 
102
  "should_evaluate": false,
103
  "should_log": false,
104
  "should_save": true,
105
+ "should_training_stop": true
106
  },
107
  "attributes": {}
108
  }
109
  },
110
+ "total_flos": 402704130048.0,
111
  "train_batch_size": 4,
112
  "trial_name": null,
113
  "trial_params": null