HuaminChen committed on
Commit
95fa7fd
·
verified ·
1 Parent(s): 8d2a1a0

Delete checkpoint-396

Browse files
checkpoint-396/config.json DELETED
@@ -1,86 +0,0 @@
1
- {
2
- "architectures": [
3
- "ModernBertForSequenceClassification"
4
- ],
5
- "attention_bias": false,
6
- "attention_dropout": 0.0,
7
- "bos_token_id": 50281,
8
- "classifier_activation": "gelu",
9
- "classifier_bias": false,
10
- "classifier_dropout": 0.0,
11
- "classifier_pooling": "mean",
12
- "cls_token_id": 50281,
13
- "decoder_bias": true,
14
- "deterministic_flash_attn": false,
15
- "embedding_dropout": 0.0,
16
- "eos_token_id": 50282,
17
- "global_attn_every_n_layers": 3,
18
- "global_rope_theta": 160000.0,
19
- "gradient_checkpointing": false,
20
- "hidden_activation": "gelu",
21
- "hidden_size": 768,
22
- "id2label": {
23
- "0": "AGE",
24
- "1": "CREDIT_CARD",
25
- "2": "DATE_TIME",
26
- "3": "DOMAIN_NAME",
27
- "4": "EMAIL_ADDRESS",
28
- "5": "GPE",
29
- "6": "IBAN_CODE",
30
- "7": "IP_ADDRESS",
31
- "8": "NO_PII",
32
- "9": "NRP",
33
- "10": "ORGANIZATION",
34
- "11": "PERSON",
35
- "12": "PHONE_NUMBER",
36
- "13": "STREET_ADDRESS",
37
- "14": "TITLE",
38
- "15": "US_DRIVER_LICENSE",
39
- "16": "US_SSN",
40
- "17": "ZIP_CODE"
41
- },
42
- "initializer_cutoff_factor": 2.0,
43
- "initializer_range": 0.02,
44
- "intermediate_size": 1152,
45
- "label2id": {
46
- "AGE": 0,
47
- "CREDIT_CARD": 1,
48
- "DATE_TIME": 2,
49
- "DOMAIN_NAME": 3,
50
- "EMAIL_ADDRESS": 4,
51
- "GPE": 5,
52
- "IBAN_CODE": 6,
53
- "IP_ADDRESS": 7,
54
- "NO_PII": 8,
55
- "NRP": 9,
56
- "ORGANIZATION": 10,
57
- "PERSON": 11,
58
- "PHONE_NUMBER": 12,
59
- "STREET_ADDRESS": 13,
60
- "TITLE": 14,
61
- "US_DRIVER_LICENSE": 15,
62
- "US_SSN": 16,
63
- "ZIP_CODE": 17
64
- },
65
- "layer_norm_eps": 1e-05,
66
- "local_attention": 128,
67
- "local_rope_theta": 10000.0,
68
- "max_position_embeddings": 8192,
69
- "mlp_bias": false,
70
- "mlp_dropout": 0.0,
71
- "model_type": "modernbert",
72
- "norm_bias": false,
73
- "norm_eps": 1e-05,
74
- "num_attention_heads": 12,
75
- "num_hidden_layers": 22,
76
- "pad_token_id": 50283,
77
- "position_embedding_type": "absolute",
78
- "problem_type": "single_label_classification",
79
- "repad_logits_with_grad": false,
80
- "sep_token_id": 50282,
81
- "sparse_pred_ignore_index": -100,
82
- "sparse_prediction": false,
83
- "torch_dtype": "float32",
84
- "transformers_version": "4.54.1",
85
- "vocab_size": 50368
86
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
checkpoint-396/model.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:c805ffa11eb42a105777473d6c15ece8f1edbd042f695ad860a6b9bd445d4cd7
3
- size 598489008
 
 
 
 
checkpoint-396/optimizer.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:4f825ddc5bf4a0878168aec2b913f72a8adb5ad4951f2e6c9cf76d951532dfd3
3
- size 1197066315
 
 
 
 
checkpoint-396/rng_state.pth DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:9fd9432b50864b1799d071a2391f13a188cc959e985675ab69fd688672db2853
3
- size 14645
 
 
 
 
checkpoint-396/scheduler.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:15481c2efe0ee4c3f739eaea3b176ff3a31af2aab89e2b7f41bf029020f18c56
3
- size 1465
 
 
 
 
checkpoint-396/trainer_state.json DELETED
@@ -1,85 +0,0 @@
1
- {
2
- "best_global_step": 396,
3
- "best_metric": 0.9674286242857673,
4
- "best_model_checkpoint": "pii_classifier_modernbert-base_model/checkpoint-396",
5
- "epoch": 3.0,
6
- "eval_steps": 500,
7
- "global_step": 396,
8
- "is_hyper_param_search": false,
9
- "is_local_process_zero": true,
10
- "is_world_process_zero": true,
11
- "log_history": [
12
- {
13
- "epoch": 0.7575757575757576,
14
- "grad_norm": 15.822543144226074,
15
- "learning_rate": 9.900000000000002e-06,
16
- "loss": 2.387,
17
- "step": 100
18
- },
19
- {
20
- "epoch": 1.0,
21
- "eval_accuracy": 0.8444444444444444,
22
- "eval_f1": 0.8201940521734123,
23
- "eval_loss": 0.7109369039535522,
24
- "eval_runtime": 9.3515,
25
- "eval_samples_per_second": 24.06,
26
- "eval_steps_per_second": 3.101,
27
- "step": 132
28
- },
29
- {
30
- "epoch": 1.5151515151515151,
31
- "grad_norm": 44.086917877197266,
32
- "learning_rate": 1.9900000000000003e-05,
33
- "loss": 0.6038,
34
- "step": 200
35
- },
36
- {
37
- "epoch": 2.0,
38
- "eval_accuracy": 0.9288888888888889,
39
- "eval_f1": 0.9239100517009231,
40
- "eval_loss": 0.30152201652526855,
41
- "eval_runtime": 9.2706,
42
- "eval_samples_per_second": 24.27,
43
- "eval_steps_per_second": 3.128,
44
- "step": 264
45
- },
46
- {
47
- "epoch": 2.2727272727272725,
48
- "grad_norm": 0.5022214651107788,
49
- "learning_rate": 2.9900000000000002e-05,
50
- "loss": 0.1797,
51
- "step": 300
52
- },
53
- {
54
- "epoch": 3.0,
55
- "eval_accuracy": 0.9688888888888889,
56
- "eval_f1": 0.9674286242857673,
57
- "eval_loss": 0.18659120798110962,
58
- "eval_runtime": 9.2646,
59
- "eval_samples_per_second": 24.286,
60
- "eval_steps_per_second": 3.13,
61
- "step": 396
62
- }
63
- ],
64
- "logging_steps": 100,
65
- "max_steps": 660,
66
- "num_input_tokens_seen": 0,
67
- "num_train_epochs": 5,
68
- "save_steps": 500,
69
- "stateful_callbacks": {
70
- "TrainerControl": {
71
- "args": {
72
- "should_epoch_stop": false,
73
- "should_evaluate": false,
74
- "should_log": false,
75
- "should_save": true,
76
- "should_training_stop": false
77
- },
78
- "attributes": {}
79
- }
80
- },
81
- "total_flos": 1073506278297600.0,
82
- "train_batch_size": 8,
83
- "trial_name": null,
84
- "trial_params": null
85
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
checkpoint-396/training_args.bin DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:057a7aa2553eac3d64bcb87db40e93bb3fe3ab14aadcdced12723c7e1524b795
3
- size 5777