Reggie commited on
Commit
26d9d17
·
verified ·
1 Parent(s): 114fbbf

Training in progress, step 400, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4e6026de3b84ceba28811a32cfbb9c3b69e390810167aff159af4add247f487c
3
  size 69782384
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f8dea4d325a4635d3c239e793bad657771e2130c83b3dfef9813d57f5058df9
3
  size 69782384
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:37333b1dd04e29ac205c0f9bfcc393e3b6032d9a61718e76260190d1ce080b47
3
  size 139790651
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a691a2dd0083ffd45de8f8ba46f1319a1176b01199ed67ae21c5b8f4c7c5d65a
3
  size 139790651
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f49441abb975ccb348c1229085bf97990332babf644800bec7b3f3a97b104927
3
  size 14645
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77af5db692d8169680b37a82ccaf2369394b341d2c152f145639fd25a259d63f
3
  size 14645
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6f2198c886767e72e8b6e7d6fefea2fe94ace4419909b570aeb4660b8668dee2
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14206d6f39047b8dbff5f90ecc0ad71bc03ad9f0a166b1d0248ef5714395ce2a
3
  size 1465
last-checkpoint/trainer_state.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "best_global_step": 200,
3
- "best_metric": 2.348525047302246,
4
- "best_model_checkpoint": "./outputs/checkpoint-200",
5
- "epoch": 0.21715526601520088,
6
  "eval_steps": 200,
7
- "global_step": 200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -44,6 +44,42 @@
44
  "eval_samples_per_second": 66.25,
45
  "eval_steps_per_second": 2.091,
46
  "step": 200
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
47
  }
48
  ],
49
  "logging_steps": 50,
@@ -72,7 +108,7 @@
72
  "attributes": {}
73
  }
74
  },
75
- "total_flos": 5.591561099791565e+16,
76
  "train_batch_size": 32,
77
  "trial_name": null,
78
  "trial_params": null
 
1
  {
2
+ "best_global_step": 400,
3
+ "best_metric": 2.2951860427856445,
4
+ "best_model_checkpoint": "./outputs/checkpoint-400",
5
+ "epoch": 0.43431053203040176,
6
  "eval_steps": 200,
7
+ "global_step": 400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
44
  "eval_samples_per_second": 66.25,
45
  "eval_steps_per_second": 2.091,
46
  "step": 200
47
+ },
48
+ {
49
+ "epoch": 0.2714440825190011,
50
+ "grad_norm": 0.6019847393035889,
51
+ "learning_rate": 0.00019735665616115814,
52
+ "loss": 2.3382,
53
+ "step": 250
54
+ },
55
+ {
56
+ "epoch": 0.3257328990228013,
57
+ "grad_norm": 0.7136948704719543,
58
+ "learning_rate": 0.00019587182680566505,
59
+ "loss": 2.3352,
60
+ "step": 300
61
+ },
62
+ {
63
+ "epoch": 0.3800217155266015,
64
+ "grad_norm": 0.6682165861129761,
65
+ "learning_rate": 0.00019406569810316855,
66
+ "loss": 2.3282,
67
+ "step": 350
68
+ },
69
+ {
70
+ "epoch": 0.43431053203040176,
71
+ "grad_norm": 0.6841819882392883,
72
+ "learning_rate": 0.00019194432300991294,
73
+ "loss": 2.3176,
74
+ "step": 400
75
+ },
76
+ {
77
+ "epoch": 0.43431053203040176,
78
+ "eval_loss": 2.2951860427856445,
79
+ "eval_runtime": 7.346,
80
+ "eval_samples_per_second": 81.949,
81
+ "eval_steps_per_second": 2.586,
82
+ "step": 400
83
  }
84
  ],
85
  "logging_steps": 50,
 
108
  "attributes": {}
109
  }
110
  },
111
+ "total_flos": 1.1185423411367117e+17,
112
  "train_batch_size": 32,
113
  "trial_name": null,
114
  "trial_params": null