MuafiraThasni committed on
Commit
667d4a6
·
verified ·
1 Parent(s): deccbc2

Training in progress, step 400, checkpoint

Browse files
checkpoint-400/config.json CHANGED
@@ -49,7 +49,7 @@
49
  "pad_token_id": 1,
50
  "position_embedding_type": "absolute",
51
  "torch_dtype": "float32",
52
- "transformers_version": "4.42.4",
53
  "type_vocab_size": 1,
54
  "use_cache": true,
55
  "vocab_size": 250002
 
49
  "pad_token_id": 1,
50
  "position_embedding_type": "absolute",
51
  "torch_dtype": "float32",
52
+ "transformers_version": "4.42.3",
53
  "type_vocab_size": 1,
54
  "use_cache": true,
55
  "vocab_size": 250002
checkpoint-400/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3f32caa3ade0bc4dd79232fd1456fae9603bb7c02292df8675852e005eff55e9
3
  size 1134332228
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e8dea633ddefd5c6a77825a5ad48949cacf27d7dfd7be23bdb43604b3445369
3
  size 1134332228
checkpoint-400/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e18282059758f7438f8035104343961dae0354a3bf096166da6d8f2c8402bc4a
3
- size 2265924830
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a51c90031d2351c0172e0d11461c02d6a3927f46e41e12851994a1e424524116
3
+ size 2268900866
checkpoint-400/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:662e921e03fcf92563a3b2458b6412a5d7887e0762378509ed7fc9f2b0e4bae7
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f5daab7d556fc02d85dffe50c326709842df42c35ef620127cae6836a494e7c
3
  size 14244
checkpoint-400/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2d2d6ad579de8c53cc7768e169f4897cd81cf9311331caed421754d374415e90
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02ca0267ce9457847149d1dc514b449ab61a93b118b8048db3838e7a156f3daa
3
  size 1064
checkpoint-400/tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:683eb7c7eca2f8d4661f33cb19ad5dcb7c826bbc4256f314d42c7d9d3ac93240
3
- size 17083001
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a56def25aa40facc030ea8b0b87f3688e4b3c39eb8b45d5702b3a1300fe2a20
3
+ size 17082734
checkpoint-400/trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "best_metric": 0.7865890784233485,
3
- "best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_paragraphs_ml512-v1/checkpoint-300",
4
  "epoch": 0.21321961620469082,
5
  "eval_steps": 100,
6
  "global_step": 400,
@@ -10,50 +10,50 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.053304904051172705,
13
- "eval_accuracy": 0.6912373860880154,
14
- "eval_f1": 0.6912373860880154,
15
- "eval_loss": 0.8656882047653198,
16
- "eval_precision": 0.6912373860880154,
17
- "eval_recall": 0.6912373860880154,
18
- "eval_runtime": 41.8245,
19
- "eval_samples_per_second": 38.422,
20
- "eval_steps_per_second": 2.415,
21
  "step": 100
22
  },
23
  {
24
  "epoch": 0.10660980810234541,
25
- "eval_accuracy": 0.7121482827113298,
26
- "eval_f1": 0.7121482827113298,
27
- "eval_loss": 0.856532096862793,
28
- "eval_precision": 0.7121482827113298,
29
- "eval_recall": 0.7121482827113298,
30
- "eval_runtime": 42.6291,
31
- "eval_samples_per_second": 37.697,
32
- "eval_steps_per_second": 2.369,
33
  "step": 200
34
  },
35
  {
36
  "epoch": 0.15991471215351813,
37
- "eval_accuracy": 0.7865890784233484,
38
- "eval_f1": 0.7865890784233485,
39
- "eval_loss": 0.6567804217338562,
40
- "eval_precision": 0.7865890784233484,
41
- "eval_recall": 0.7865890784233484,
42
- "eval_runtime": 41.1268,
43
- "eval_samples_per_second": 39.074,
44
- "eval_steps_per_second": 2.456,
45
  "step": 300
46
  },
47
  {
48
  "epoch": 0.21321961620469082,
49
- "eval_accuracy": 0.7400361324323516,
50
- "eval_f1": 0.7400361324323516,
51
- "eval_loss": 0.575270414352417,
52
- "eval_precision": 0.7400361324323516,
53
- "eval_recall": 0.7400361324323516,
54
- "eval_runtime": 43.0681,
55
- "eval_samples_per_second": 37.313,
56
- "eval_steps_per_second": 2.345,
57
  "step": 400
58
  }
59
  ],
@@ -75,7 +75,7 @@
75
  }
76
  },
77
  "total_flos": 890151164313600.0,
78
- "train_batch_size": 8,
79
  "trial_name": null,
80
  "trial_params": null
81
  }
 
1
  {
2
+ "best_metric": 0.8202860650583409,
3
+ "best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_paragraphs_ml512-v1/checkpoint-200",
4
  "epoch": 0.21321961620469082,
5
  "eval_steps": 100,
6
  "global_step": 400,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.053304904051172705,
13
+ "eval_accuracy": 0.6321578647928374,
14
+ "eval_f1": 0.6321578647928374,
15
+ "eval_loss": 0.9594171643257141,
16
+ "eval_precision": 0.6321578647928374,
17
+ "eval_recall": 0.6321578647928374,
18
+ "eval_runtime": 69.4219,
19
+ "eval_samples_per_second": 23.148,
20
+ "eval_steps_per_second": 0.735,
21
  "step": 100
22
  },
23
  {
24
  "epoch": 0.10660980810234541,
25
+ "eval_accuracy": 0.8202860650583409,
26
+ "eval_f1": 0.8202860650583409,
27
+ "eval_loss": 0.6088714599609375,
28
+ "eval_precision": 0.8202860650583409,
29
+ "eval_recall": 0.8202860650583409,
30
+ "eval_runtime": 69.0048,
31
+ "eval_samples_per_second": 23.288,
32
+ "eval_steps_per_second": 0.739,
33
  "step": 200
34
  },
35
  {
36
  "epoch": 0.15991471215351813,
37
+ "eval_accuracy": 0.7378602014233383,
38
+ "eval_f1": 0.7378602014233383,
39
+ "eval_loss": 0.7009087800979614,
40
+ "eval_precision": 0.7378602014233383,
41
+ "eval_recall": 0.7378602014233383,
42
+ "eval_runtime": 68.7975,
43
+ "eval_samples_per_second": 23.358,
44
+ "eval_steps_per_second": 0.741,
45
  "step": 300
46
  },
47
  {
48
  "epoch": 0.21321961620469082,
49
+ "eval_accuracy": 0.7694710890634513,
50
+ "eval_f1": 0.7694710890634513,
51
+ "eval_loss": 0.5369378328323364,
52
+ "eval_precision": 0.7694710890634513,
53
+ "eval_recall": 0.7694710890634513,
54
+ "eval_runtime": 69.0856,
55
+ "eval_samples_per_second": 23.261,
56
+ "eval_steps_per_second": 0.738,
57
  "step": 400
58
  }
59
  ],
 
75
  }
76
  },
77
  "total_flos": 890151164313600.0,
78
+ "train_batch_size": 16,
79
  "trial_name": null,
80
  "trial_params": null
81
  }
checkpoint-400/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d884d25b9a0a1975c8ad8cdce24ef6b7c329f16153a80771adc673a879e2c8c3
3
  size 5304
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2544ef83614d223e3dbe1cbe496bce99a66932dd46abc19142f548bbc4c106c4
3
  size 5304