HiAmNear committed on
Commit
cd2fdc4
·
verified ·
1 Parent(s): 8a62d04

Training in progress, epoch 4, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8b7e62e925af24c3c46e451bdff1f8741c5f27e678dd9e4e1d76a94a086d496a
3
  size 1476713628
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00248ee9684c65a32615da2b0cccb3ee6b6ac475e02b1cc704d4a10d03c53364
3
  size 1476713628
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d12eabbc14436e317cdf37d9dba3b756242f5d198e74c991dbb74857301a737f
3
  size 2953659629
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69f8175b7a9c4f54cd8420af1fc659bf71ac2b603ae7671b17572d14702dc17b
3
  size 2953659629
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:45479556d4ba632600b7dd85f430f0b6fcb738ecd5454ea101816125db2d33f0
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b0c230ad29373d00210d983f3964cf3edad2620215c1c6091bf41cb911b3b787
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fb9c5f460012b3238729ee5b4cd8719008838840199b21ad75fcef7c04d58970
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:56a642fd3959d962a047731abaf128bced517e3db0e7e9f18577cfe93e2f6753
3
  size 1064
last-checkpoint/sentencepiece.bpe.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cfc8146abe2a0488e9e2a0c56de7952f7c11ab059eca145a0a727afce0db2865
3
+ size 5069051
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 0.719619326500732,
3
- "best_model_checkpoint": "modelParams/TrainingArguments_output\\checkpoint-149",
4
- "epoch": 2.9949748743718594,
5
  "eval_steps": 500,
6
- "global_step": 149,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -34,6 +34,15 @@
34
  "eval_samples_per_second": 27.684,
35
  "eval_steps_per_second": 3.466,
36
  "step": 149
 
 
 
 
 
 
 
 
 
37
  }
38
  ],
39
  "logging_steps": 500,
@@ -53,7 +62,7 @@
53
  "attributes": {}
54
  }
55
  },
56
- "total_flos": 8867065653362880.0,
57
  "train_batch_size": 8,
58
  "trial_name": null,
59
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.7291361639824304,
3
+ "best_model_checkpoint": "modelParams/TrainingArguments_output\\checkpoint-199",
4
+ "epoch": 4.0,
5
  "eval_steps": 500,
6
+ "global_step": 199,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
34
  "eval_samples_per_second": 27.684,
35
  "eval_steps_per_second": 3.466,
36
  "step": 149
37
+ },
38
+ {
39
+ "epoch": 4.0,
40
+ "eval_accuracy": 0.7291361639824304,
41
+ "eval_loss": 0.6263195872306824,
42
+ "eval_runtime": 45.4245,
43
+ "eval_samples_per_second": 30.072,
44
+ "eval_steps_per_second": 3.764,
45
+ "step": 199
46
  }
47
  ],
48
  "logging_steps": 500,
 
62
  "attributes": {}
63
  }
64
  },
65
+ "total_flos": 1.182275420448384e+16,
66
  "train_batch_size": 8,
67
  "trial_name": null,
68
  "trial_params": null