Leonardolin committed on
Commit
cd44699
·
1 Parent(s): 69bf980

Upload 11 files

Browse files
Files changed (7) hide show
  1. config.json +99 -117
  2. optimizer.pt +2 -2
  3. pytorch_model.bin +2 -2
  4. rng_state.pth +1 -1
  5. scheduler.pt +1 -1
  6. trainer_state.json +195 -201
  7. training_args.bin +1 -1
config.json CHANGED
@@ -10,126 +10,108 @@
10
  "hidden_dropout_prob": 0.1,
11
  "hidden_size": 768,
12
  "id2label": {
13
- "0": "\u7d42\u8eab",
14
- "1": "\u8eca\u9ad4\u96aa",
15
- "2": "\u9577\u671f\u7167\u8b77\u96aa",
16
- "3": "\u6c7d\u8eca\u96aa",
17
- "4": "\u7279\u5b9a\u50b7\u75c5\u96aa",
18
- "5": "\u526f\u672c\u7406\u8ce0",
19
- "6": "\u5931\u80fd\u96aa/\u5931\u80fd\u6276\u52a9\u96aa",
20
- "7": "\u58fd\u96aa",
21
- "8": "\u4fdd\u8b49\u7d66\u4ed8",
22
- "9": "\u5be6\u652f\u578b\u610f\u5916\u96aa",
23
- "10": "\u5931\u80fd\u589e\u984d",
24
- "11": "\u6b98\u5ee2\u96aa",
25
- "12": "\u5e74\u91d1\u4fdd\u96aa",
26
- "13": "\u91cd\u5927\u75be\u75c5\u96aa",
27
- "14": "\u6295\u4fdd",
28
- "15": "\u7522\u96aa",
29
- "16": "\u6a5f\u8eca\u96aa",
30
- "17": "\u512a\u9ad4\u58fd\u96aa",
31
- "18": "\u52de\u5065\u4fdd",
32
- "19": "\u91cd\u5927\u71d2\u71d9\u50b7",
33
- "20": "\u6295\u8cc7\u7406\u8ca1",
34
- "21": "\u4e3b\u7d04",
35
- "22": "\u65c5\u904a\u4e0d\u4fbf\u96aa",
36
- "23": "\u4e00\u6b21\u7d66\u4ed8\u578b\u764c\u75c7\u96aa",
37
- "24": "\u764c\u75c7\u96aa",
38
- "25": "\u7642\u7a0b\u578b\u764c\u75c7\u96aa",
39
- "26": "\u5b9a\u671f",
40
- "27": "\u65c5\u904a\u5e73\u5b89\u96aa",
41
- "28": "\u8d85\u984d\u8cac\u4efb\u96aa",
42
- "29": "\u65e5\u984d\u578b\u610f\u5916\u96aa",
43
- "30": "\u5eb7\u5065\u4eba\u58fd",
44
- "31": "\u9644\u52a0\u4e58\u5ba2\u96aa",
45
- "32": "\u7406\u8ce0",
46
- "33": "\u7121\u7b49\u5f85\u671f",
47
- "34": "\u91cd\u5927\u50b7\u75c5\u96aa/\u91cd\u5927\u75be\u75c5\u96aa",
48
- "35": "\u6b98\u6276\u96aa",
49
- "36": "\u7b2c\u4e09\u4eba\u8cac\u4efb\u96aa",
50
- "37": "\u5916\u5e63\u5546\u54c1",
51
- "38": "\u8c41\u514d\u4fdd\u8cbb",
52
- "39": "\u5132\u84c4\u96aa",
53
- "40": "\u9580\u8a3a\u624b\u8853",
54
- "41": "\u5931\u80fd\u6276\u52a9\u96aa",
55
- "42": "\u4fdd\u8b49\u7e8c\u4fdd",
56
- "43": "\u99d5\u99db\u4eba\u50b7\u5bb3\u96aa",
57
- "44": "\u8f49\u63db\u4f4f\u9662\u65e5\u984d",
58
- "45": "\u5931\u80fd\u96aa",
59
- "46": "\u5be6\u652f\u578b\u91ab\u7642\u96aa",
60
- "47": "\u65e5\u984d\u578b\u91ab\u7642\u96aa",
61
- "48": "\u91ab\u7642\u96aa",
62
- "49": "\u9ad8CP\u503c",
63
- "50": "\u610f\u5916\u96aa",
64
- "51": "\u5718\u9ad4\u4fdd\u96aa",
65
- "52": "\u89e3\u7d04",
66
- "53": "\u5f37\u5236\u96aa",
67
- "54": "\u9084\u672c\u578b",
68
- "55": "\u9644\u7d04",
69
- "56": "\u91cd\u5927\u50b7\u75c5\u96aa",
70
- "57": "\u7aca\u76dc\u96aa"
71
  },
72
  "initializer_range": 0.02,
73
  "intermediate_size": 3072,
74
  "label2id": {
75
- "\u4e00\u6b21\u7d66\u4ed8\u578b\u764c\u75c7\u96aa": 23,
76
- "\u4e3b\u7d04": 21,
77
- "\u4fdd\u8b49\u7d66\u4ed8": 8,
78
- "\u4fdd\u8b49\u7e8c\u4fdd": 42,
79
- "\u512a\u9ad4\u58fd\u96aa": 17,
80
- "\u5132\u84c4\u96aa": 39,
81
- "\u526f\u672c\u7406\u8ce0": 5,
82
- "\u52de\u5065\u4fdd": 18,
83
- "\u5718\u9ad4\u4fdd\u96aa": 51,
84
- "\u58fd\u96aa": 7,
85
- "\u5916\u5e63\u5546\u54c1": 37,
86
- "\u5931\u80fd\u589e\u984d": 10,
87
- "\u5931\u80fd\u6276\u52a9\u96aa": 41,
88
- "\u5931\u80fd\u96aa": 45,
89
- "\u5931\u80fd\u96aa/\u5931\u80fd\u6276\u52a9\u96aa": 6,
90
- "\u5b9a\u671f": 26,
91
- "\u5be6\u652f\u578b\u610f\u5916\u96aa": 9,
92
- "\u5be6\u652f\u578b\u91ab\u7642\u96aa": 46,
93
- "\u5e74\u91d1\u4fdd\u96aa": 12,
94
- "\u5eb7\u5065\u4eba\u58fd": 30,
95
- "\u5f37\u5236\u96aa": 53,
96
- "\u610f\u5916\u96aa": 50,
97
- "\u6295\u4fdd": 14,
98
- "\u6295\u8cc7\u7406\u8ca1": 20,
99
- "\u65c5\u904a\u4e0d\u4fbf\u96aa": 22,
100
- "\u65c5\u904a\u5e73\u5b89\u96aa": 27,
101
- "\u65e5\u984d\u578b\u610f\u5916\u96aa": 29,
102
- "\u65e5\u984d\u578b\u91ab\u7642\u96aa": 47,
103
- "\u6a5f\u8eca\u96aa": 16,
104
- "\u6b98\u5ee2\u96aa": 11,
105
- "\u6b98\u6276\u96aa": 35,
106
- "\u6c7d\u8eca\u96aa": 3,
107
- "\u7121\u7b49\u5f85\u671f": 33,
108
- "\u7279\u5b9a\u50b7\u75c5\u96aa": 4,
109
- "\u7406\u8ce0": 32,
110
- "\u7522\u96aa": 15,
111
- "\u7642\u7a0b\u578b\u764c\u75c7\u96aa": 25,
112
- "\u764c\u75c7\u96aa": 24,
113
- "\u7aca\u76dc\u96aa": 57,
114
- "\u7b2c\u4e09\u4eba\u8cac\u4efb\u96aa": 36,
115
- "\u7d42\u8eab": 0,
116
- "\u89e3\u7d04": 52,
117
- "\u8c41\u514d\u4fdd\u8cbb": 38,
118
- "\u8d85\u984d\u8cac\u4efb\u96aa": 28,
119
- "\u8eca\u9ad4\u96aa": 1,
120
- "\u8f49\u63db\u4f4f\u9662\u65e5\u984d": 44,
121
- "\u9084\u672c\u578b": 54,
122
- "\u91ab\u7642\u96aa": 48,
123
- "\u91cd\u5927\u50b7\u75c5\u96aa": 56,
124
- "\u91cd\u5927\u50b7\u75c5\u96aa/\u91cd\u5927\u75be\u75c5\u96aa": 34,
125
- "\u91cd\u5927\u71d2\u71d9\u50b7": 19,
126
- "\u91cd\u5927\u75be\u75c5\u96aa": 13,
127
- "\u9577\u671f\u7167\u8b77\u96aa": 2,
128
- "\u9580\u8a3a\u624b\u8853": 40,
129
- "\u9644\u52a0\u4e58\u5ba2\u96aa": 31,
130
- "\u9644\u7d04": 55,
131
- "\u99d5\u99db\u4eba\u50b7\u5bb3\u96aa": 43,
132
- "\u9ad8CP\u503c": 49
133
  },
134
  "layer_norm_eps": 1e-12,
135
  "max_position_embeddings": 512,
@@ -145,7 +127,7 @@
145
  "position_embedding_type": "absolute",
146
  "problem_type": "multi_label_classification",
147
  "torch_dtype": "float32",
148
- "transformers_version": "4.30.2",
149
  "type_vocab_size": 2,
150
  "use_cache": true,
151
  "vocab_size": 21128
 
10
  "hidden_dropout_prob": 0.1,
11
  "hidden_size": 768,
12
  "id2label": {
13
+ "0": "\u91cd\u5927\u75be\u75c5\u96aa",
14
+ "1": "\u7522\u96aa",
15
+ "2": "\u6b98\u5ee2\u96aa",
16
+ "3": "\u7279\u5b9a\u50b7\u75c5\u96aa",
17
+ "4": "\u5132\u84c4\u96aa",
18
+ "5": "\u6b98\u6276\u96aa",
19
+ "6": "\u764c\u75c7\u96aa",
20
+ "7": "\u5718\u9ad4\u4fdd\u96aa",
21
+ "8": "\u99d5\u99db\u4eba\u50b7\u5bb3\u96aa",
22
+ "9": "\u4e00\u6b21\u7d66\u4ed8\u578b\u764c\u75c7\u96aa",
23
+ "10": "\u4e3b\u7d04",
24
+ "11": "\u4fdd\u8b49\u7d66\u4ed8",
25
+ "12": "\u5be6\u652f\u578b",
26
+ "13": "\u6c7d\u8eca\u96aa",
27
+ "14": "\u9084\u672c\u578b",
28
+ "15": "\u9644\u52a0\u4e58\u5ba2\u96aa",
29
+ "16": "\u7aca\u76dc\u96aa",
30
+ "17": "\u7d42\u8eab",
31
+ "18": "\u91ab\u7642\u96aa",
32
+ "19": "\u610f\u5916\u96aa",
33
+ "20": "\u58fd\u96aa",
34
+ "21": "\u9580\u8a3a\u624b\u8853",
35
+ "22": "\u91cd\u5927\u71d2\u71d9\u50b7",
36
+ "23": "\u65c5\u904a\u5e73\u5b89\u96aa",
37
+ "24": "\u5931\u80fd\u96aa",
38
+ "25": "\u7b2c\u4e09\u4eba\u8cac\u4efb\u96aa",
39
+ "26": "\u4fdd\u8b49\u7e8c\u4fdd",
40
+ "27": "\u5f37\u5236\u96aa",
41
+ "28": "\u7642\u7a0b\u578b\u764c\u75c7\u96aa",
42
+ "29": "\u5931\u80fd\u589e\u984d",
43
+ "30": "\u7121\u7b49\u5f85\u671f",
44
+ "31": "\u8c41\u514d\u4fdd\u8cbb",
45
+ "32": "\u5e74\u91d1\u4fdd\u96aa",
46
+ "33": "\u526f\u672c\u7406\u8ce0",
47
+ "34": "\u5b9a\u671f",
48
+ "35": "\u52de\u5065\u4fdd",
49
+ "36": "\u8d85\u984d\u8cac\u4efb\u96aa",
50
+ "37": "\u9644\u7d04",
51
+ "38": "\u5916\u5e63\u5546\u54c1",
52
+ "39": "\u8eca\u9ad4\u96aa",
53
+ "40": "\u91cd\u5927\u50b7\u75c5\u96aa",
54
+ "41": "\u8f49\u63db\u4f4f\u9662\u65e5\u984d",
55
+ "42": "\u9577\u671f\u7167\u8b77\u96aa",
56
+ "43": "\u65c5\u904a\u4e0d\u4fbf\u96aa",
57
+ "44": "\u6295\u8cc7\u7406\u8ca1",
58
+ "45": "\u6a5f\u8eca\u96aa",
59
+ "46": "\u5931\u80fd\u6276\u52a9\u96aa",
60
+ "47": "\u512a\u9ad4\u58fd\u96aa",
61
+ "48": "\u65e5\u984d\u578b"
 
 
 
 
 
 
 
 
 
62
  },
63
  "initializer_range": 0.02,
64
  "intermediate_size": 3072,
65
  "label2id": {
66
+ "\u4e00\u6b21\u7d66\u4ed8\u578b\u764c\u75c7\u96aa": 9,
67
+ "\u4e3b\u7d04": 10,
68
+ "\u4fdd\u8b49\u7d66\u4ed8": 11,
69
+ "\u4fdd\u8b49\u7e8c\u4fdd": 26,
70
+ "\u512a\u9ad4\u58fd\u96aa": 47,
71
+ "\u5132\u84c4\u96aa": 4,
72
+ "\u526f\u672c\u7406\u8ce0": 33,
73
+ "\u52de\u5065\u4fdd": 35,
74
+ "\u5718\u9ad4\u4fdd\u96aa": 7,
75
+ "\u58fd\u96aa": 20,
76
+ "\u5916\u5e63\u5546\u54c1": 38,
77
+ "\u5931\u80fd\u589e\u984d": 29,
78
+ "\u5931\u80fd\u6276\u52a9\u96aa": 46,
79
+ "\u5931\u80fd\u96aa": 24,
80
+ "\u5b9a\u671f": 34,
81
+ "\u5be6\u652f\u578b": 12,
82
+ "\u5e74\u91d1\u4fdd\u96aa": 32,
83
+ "\u5f37\u5236\u96aa": 27,
84
+ "\u610f\u5916\u96aa": 19,
85
+ "\u6295\u8cc7\u7406\u8ca1": 44,
86
+ "\u65c5\u904a\u4e0d\u4fbf\u96aa": 43,
87
+ "\u65c5\u904a\u5e73\u5b89\u96aa": 23,
88
+ "\u65e5\u984d\u578b": 48,
89
+ "\u6a5f\u8eca\u96aa": 45,
90
+ "\u6b98\u5ee2\u96aa": 2,
91
+ "\u6b98\u6276\u96aa": 5,
92
+ "\u6c7d\u8eca\u96aa": 13,
93
+ "\u7121\u7b49\u5f85\u671f": 30,
94
+ "\u7279\u5b9a\u50b7\u75c5\u96aa": 3,
95
+ "\u7522\u96aa": 1,
96
+ "\u7642\u7a0b\u578b\u764c\u75c7\u96aa": 28,
97
+ "\u764c\u75c7\u96aa": 6,
98
+ "\u7aca\u76dc\u96aa": 16,
99
+ "\u7b2c\u4e09\u4eba\u8cac\u4efb\u96aa": 25,
100
+ "\u7d42\u8eab": 17,
101
+ "\u8c41\u514d\u4fdd\u8cbb": 31,
102
+ "\u8d85\u984d\u8cac\u4efb\u96aa": 36,
103
+ "\u8eca\u9ad4\u96aa": 39,
104
+ "\u8f49\u63db\u4f4f\u9662\u65e5\u984d": 41,
105
+ "\u9084\u672c\u578b": 14,
106
+ "\u91ab\u7642\u96aa": 18,
107
+ "\u91cd\u5927\u50b7\u75c5\u96aa": 40,
108
+ "\u91cd\u5927\u71d2\u71d9\u50b7": 22,
109
+ "\u91cd\u5927\u75be\u75c5\u96aa": 0,
110
+ "\u9577\u671f\u7167\u8b77\u96aa": 42,
111
+ "\u9580\u8a3a\u624b\u8853": 21,
112
+ "\u9644\u52a0\u4e58\u5ba2\u96aa": 15,
113
+ "\u9644\u7d04": 37,
114
+ "\u99d5\u99db\u4eba\u50b7\u5bb3\u96aa": 8
 
 
 
 
 
 
 
 
 
115
  },
116
  "layer_norm_eps": 1e-12,
117
  "max_position_embeddings": 512,
 
127
  "position_embedding_type": "absolute",
128
  "problem_type": "multi_label_classification",
129
  "torch_dtype": "float32",
130
+ "transformers_version": "4.31.0",
131
  "type_vocab_size": 2,
132
  "use_cache": true,
133
  "vocab_size": 21128
optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5a76601140035efb6c21063a432df1a3db1623bf4ff1458b627bba8e2c13726e
3
- size 818615877
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9642edc572d7b2e23173b6054c49f58211a2429fd9b09fb3bb2c18b636a77ba
3
+ size 818560581
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a70cba2d4b660e85c8df0ffce5f11fe9ec2f2ccd02d8d59b303bd50d2f33a441
3
- size 409321781
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ed670329e7c3c1d17b57e491064e921b4646ff79c9b2fe900a588c8cc4f92a7
3
+ size 409289713
rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cb270d3ae860f11cf3c460aaa8e4c5def620c1c0810226037f53557bc70107bb
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9af5634aa9361a6940f3d1c32c45e51f9ffdc722fd2baafa8ebd03f20b659a4a
3
  size 14575
scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:80636f86a16567ef0f8d224d7dc105da5b294f11a4aa0269a9c057ac9ebd35ac
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa6c7a04dbc7c613fe79004c534f37c1cebe30a25814c99e56027fb1c86fd918
3
  size 627
trainer_state.json CHANGED
@@ -1,284 +1,278 @@
1
  {
2
- "best_metric": 0.564568262274896,
3
- "best_model_checkpoint": "bert-finetuned-insurence/checkpoint-3852",
4
  "epoch": 20.0,
5
- "global_step": 4280,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
  "epoch": 1.0,
12
- "eval_accuracy": 0.0,
13
- "eval_f1": 0.2651817608741332,
14
- "eval_loss": 0.2465316206216812,
15
- "eval_roc_auc": 0.5780009947992923,
16
- "eval_runtime": 4.1824,
17
- "eval_samples_per_second": 143.457,
18
- "eval_steps_per_second": 2.391,
19
- "step": 214
20
  },
21
  {
22
  "epoch": 2.0,
23
- "eval_accuracy": 0.0033333333333333335,
24
- "eval_f1": 0.4286243974786801,
25
- "eval_loss": 0.2168939709663391,
26
- "eval_roc_auc": 0.6460988356101586,
27
- "eval_runtime": 4.1125,
28
- "eval_samples_per_second": 145.895,
29
- "eval_steps_per_second": 2.432,
30
- "step": 428
31
  },
32
  {
33
- "epoch": 2.34,
34
- "learning_rate": 1.766355140186916e-05,
35
- "loss": 0.2607,
36
  "step": 500
37
  },
38
  {
39
  "epoch": 3.0,
40
- "eval_accuracy": 0.01,
41
- "eval_f1": 0.46524160229926353,
42
- "eval_loss": 0.20735658705234528,
43
- "eval_roc_auc": 0.6640500103615281,
44
- "eval_runtime": 4.1378,
45
- "eval_samples_per_second": 145.003,
46
- "eval_steps_per_second": 2.417,
47
- "step": 642
48
  },
49
  {
50
  "epoch": 4.0,
51
- "eval_accuracy": 0.006666666666666667,
52
- "eval_f1": 0.49712192569335417,
53
- "eval_loss": 0.2018413543701172,
54
- "eval_roc_auc": 0.6807712075579161,
55
- "eval_runtime": 4.1419,
56
- "eval_samples_per_second": 144.86,
57
- "eval_steps_per_second": 2.414,
58
- "step": 856
59
  },
60
  {
61
- "epoch": 4.67,
62
- "learning_rate": 1.5327102803738318e-05,
63
- "loss": 0.1957,
64
- "step": 1000
 
 
 
 
 
65
  },
66
  {
67
- "epoch": 5.0,
68
- "eval_accuracy": 0.013333333333333334,
69
- "eval_f1": 0.531224523071906,
70
- "eval_loss": 0.1989612579345703,
71
- "eval_roc_auc": 0.7047636174438967,
72
- "eval_runtime": 4.1224,
73
- "eval_samples_per_second": 145.547,
74
- "eval_steps_per_second": 2.426,
75
- "step": 1070
76
  },
77
  {
78
  "epoch": 6.0,
79
- "eval_accuracy": 0.028333333333333332,
80
- "eval_f1": 0.552503531627688,
81
- "eval_loss": 0.19641733169555664,
82
- "eval_roc_auc": 0.7204743245073841,
83
- "eval_runtime": 4.1162,
84
- "eval_samples_per_second": 145.765,
85
- "eval_steps_per_second": 2.429,
86
- "step": 1284
87
  },
88
  {
89
  "epoch": 7.0,
90
- "eval_accuracy": 0.021666666666666667,
91
- "eval_f1": 0.5480784313725491,
92
- "eval_loss": 0.19820699095726013,
93
- "eval_roc_auc": 0.7184704069589273,
94
- "eval_runtime": 4.1253,
95
- "eval_samples_per_second": 145.442,
96
- "eval_steps_per_second": 2.424,
97
- "step": 1498
98
  },
99
  {
100
- "epoch": 7.01,
101
- "learning_rate": 1.2990654205607478e-05,
102
- "loss": 0.1749,
103
  "step": 1500
104
  },
105
  {
106
  "epoch": 8.0,
107
- "eval_accuracy": 0.025,
108
- "eval_f1": 0.541625534715367,
109
- "eval_loss": 0.19906778633594513,
110
- "eval_roc_auc": 0.7081857426146021,
111
- "eval_runtime": 4.1299,
112
- "eval_samples_per_second": 145.284,
113
- "eval_steps_per_second": 2.421,
114
- "step": 1712
115
  },
116
  {
117
  "epoch": 9.0,
118
- "eval_accuracy": 0.023333333333333334,
119
- "eval_f1": 0.5581826611033842,
120
- "eval_loss": 0.20057238638401031,
121
- "eval_roc_auc": 0.7257264689844256,
122
- "eval_runtime": 4.123,
123
- "eval_samples_per_second": 145.527,
124
- "eval_steps_per_second": 2.425,
125
- "step": 1926
126
- },
127
- {
128
- "epoch": 9.35,
129
- "learning_rate": 1.0654205607476635e-05,
130
- "loss": 0.1552,
131
- "step": 2000
132
  },
133
  {
134
  "epoch": 10.0,
135
- "eval_accuracy": 0.023333333333333334,
136
- "eval_f1": 0.5491239048811013,
137
- "eval_loss": 0.20264221727848053,
138
- "eval_roc_auc": 0.7193901260078247,
139
- "eval_runtime": 4.1359,
140
- "eval_samples_per_second": 145.073,
141
- "eval_steps_per_second": 2.418,
142
- "step": 2140
143
  },
144
  {
145
- "epoch": 11.0,
146
- "eval_accuracy": 0.023333333333333334,
147
- "eval_f1": 0.5452513966480447,
148
- "eval_loss": 0.20413073897361755,
149
- "eval_roc_auc": 0.7144236705813142,
150
- "eval_runtime": 4.1888,
151
- "eval_samples_per_second": 143.238,
152
- "eval_steps_per_second": 2.387,
153
- "step": 2354
154
  },
155
  {
156
- "epoch": 11.68,
157
- "learning_rate": 8.317757009345795e-06,
158
- "loss": 0.142,
159
- "step": 2500
 
 
 
 
 
160
  },
161
  {
162
  "epoch": 12.0,
163
- "eval_accuracy": 0.03,
164
- "eval_f1": 0.5433158480368782,
165
- "eval_loss": 0.2068767249584198,
166
- "eval_roc_auc": 0.7141540882215025,
167
- "eval_runtime": 4.1429,
168
- "eval_samples_per_second": 144.826,
169
- "eval_steps_per_second": 2.414,
170
- "step": 2568
171
  },
172
  {
173
  "epoch": 13.0,
174
- "eval_accuracy": 0.02666666666666667,
175
- "eval_f1": 0.5504587155963303,
176
- "eval_loss": 0.20743216574192047,
177
- "eval_roc_auc": 0.7182797203748162,
178
- "eval_runtime": 4.1314,
179
- "eval_samples_per_second": 145.228,
180
- "eval_steps_per_second": 2.42,
181
- "step": 2782
182
  },
183
  {
184
- "epoch": 14.0,
185
- "eval_accuracy": 0.02666666666666667,
186
- "eval_f1": 0.5574488041269346,
187
- "eval_loss": 0.20869675278663635,
188
- "eval_roc_auc": 0.7234869573231687,
189
- "eval_runtime": 4.1354,
190
- "eval_samples_per_second": 145.09,
191
- "eval_steps_per_second": 2.418,
192
- "step": 2996
193
  },
194
  {
195
- "epoch": 14.02,
196
- "learning_rate": 5.981308411214953e-06,
197
- "loss": 0.1314,
198
- "step": 3000
 
 
 
 
 
199
  },
200
  {
201
  "epoch": 15.0,
202
- "eval_accuracy": 0.028333333333333332,
203
- "eval_f1": 0.5433563071004968,
204
- "eval_loss": 0.2121913880109787,
205
- "eval_roc_auc": 0.712902953754437,
206
- "eval_runtime": 4.165,
207
- "eval_samples_per_second": 144.058,
208
- "eval_steps_per_second": 2.401,
209
- "step": 3210
210
  },
211
  {
212
- "epoch": 16.0,
213
- "eval_accuracy": 0.03166666666666667,
214
- "eval_f1": 0.5553453169347209,
215
- "eval_loss": 0.21151989698410034,
216
- "eval_roc_auc": 0.7210906101371354,
217
- "eval_runtime": 4.1328,
218
- "eval_samples_per_second": 145.182,
219
- "eval_steps_per_second": 2.42,
220
- "step": 3424
221
  },
222
  {
223
- "epoch": 16.36,
224
- "learning_rate": 3.6448598130841123e-06,
225
- "loss": 0.1242,
226
- "step": 3500
 
 
 
 
 
227
  },
228
  {
229
  "epoch": 17.0,
230
- "eval_accuracy": 0.03166666666666667,
231
- "eval_f1": 0.5528838598145529,
232
- "eval_loss": 0.21267028152942657,
233
- "eval_roc_auc": 0.720453986434248,
234
- "eval_runtime": 4.1485,
235
- "eval_samples_per_second": 144.63,
236
- "eval_steps_per_second": 2.41,
237
- "step": 3638
238
  },
239
  {
240
  "epoch": 18.0,
241
- "eval_accuracy": 0.028333333333333332,
242
- "eval_f1": 0.564568262274896,
243
- "eval_loss": 0.21246589720249176,
244
- "eval_roc_auc": 0.7294850597946638,
245
- "eval_runtime": 4.1681,
246
- "eval_samples_per_second": 143.949,
247
- "eval_steps_per_second": 2.399,
248
- "step": 3852
249
  },
250
  {
251
- "epoch": 18.69,
252
- "learning_rate": 1.308411214953271e-06,
253
- "loss": 0.1194,
254
- "step": 4000
255
  },
256
  {
257
  "epoch": 19.0,
258
- "eval_accuracy": 0.03333333333333333,
259
- "eval_f1": 0.5572077007356393,
260
- "eval_loss": 0.21363653242588043,
261
- "eval_roc_auc": 0.7231682360522511,
262
- "eval_runtime": 4.124,
263
- "eval_samples_per_second": 145.491,
264
- "eval_steps_per_second": 2.425,
265
- "step": 4066
266
  },
267
  {
268
  "epoch": 20.0,
269
- "eval_accuracy": 0.03166666666666667,
270
- "eval_f1": 0.5593989669744873,
271
- "eval_loss": 0.2135751098394394,
272
- "eval_roc_auc": 0.7242125772444862,
273
- "eval_runtime": 4.1303,
274
- "eval_samples_per_second": 145.268,
275
- "eval_steps_per_second": 2.421,
276
- "step": 4280
277
  }
278
  ],
279
- "max_steps": 4280,
280
  "num_train_epochs": 20,
281
- "total_flos": 1.79926828336128e+16,
282
  "trial_name": null,
283
  "trial_params": null
284
  }
 
1
  {
2
+ "best_metric": 0.5812987875768144,
3
+ "best_model_checkpoint": "bert-finetuned-insurence/checkpoint-1504",
4
  "epoch": 20.0,
5
+ "global_step": 3760,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
  "epoch": 1.0,
12
+ "eval_accuracy": 0.016666666666666666,
13
+ "eval_f1": 0.1856089499110094,
14
+ "eval_loss": 0.2537216246128082,
15
+ "eval_roc_auc": 0.5502226265229397,
16
+ "eval_runtime": 4.2613,
17
+ "eval_samples_per_second": 140.801,
18
+ "eval_steps_per_second": 2.347,
19
+ "step": 188
20
  },
21
  {
22
  "epoch": 2.0,
23
+ "eval_accuracy": 0.02666666666666667,
24
+ "eval_f1": 0.4750710900473934,
25
+ "eval_loss": 0.2218438684940338,
26
+ "eval_roc_auc": 0.6751318414846118,
27
+ "eval_runtime": 4.2236,
28
+ "eval_samples_per_second": 142.059,
29
+ "eval_steps_per_second": 2.368,
30
+ "step": 376
31
  },
32
  {
33
+ "epoch": 2.66,
34
+ "learning_rate": 1.7340425531914894e-05,
35
+ "loss": 0.2657,
36
  "step": 500
37
  },
38
  {
39
  "epoch": 3.0,
40
+ "eval_accuracy": 0.041666666666666664,
41
+ "eval_f1": 0.5161290322580645,
42
+ "eval_loss": 0.20993947982788086,
43
+ "eval_roc_auc": 0.6941419674142428,
44
+ "eval_runtime": 4.2298,
45
+ "eval_samples_per_second": 141.852,
46
+ "eval_steps_per_second": 2.364,
47
+ "step": 564
48
  },
49
  {
50
  "epoch": 4.0,
51
+ "eval_accuracy": 0.041666666666666664,
52
+ "eval_f1": 0.537253469685902,
53
+ "eval_loss": 0.20495453476905823,
54
+ "eval_roc_auc": 0.7082594844493445,
55
+ "eval_runtime": 4.2212,
56
+ "eval_samples_per_second": 142.139,
57
+ "eval_steps_per_second": 2.369,
58
+ "step": 752
59
  },
60
  {
61
+ "epoch": 5.0,
62
+ "eval_accuracy": 0.055,
63
+ "eval_f1": 0.5567817728729085,
64
+ "eval_loss": 0.20180459320545197,
65
+ "eval_roc_auc": 0.7213133386735834,
66
+ "eval_runtime": 4.2593,
67
+ "eval_samples_per_second": 140.868,
68
+ "eval_steps_per_second": 2.348,
69
+ "step": 940
70
  },
71
  {
72
+ "epoch": 5.32,
73
+ "learning_rate": 1.4680851063829789e-05,
74
+ "loss": 0.1948,
75
+ "step": 1000
 
 
 
 
 
76
  },
77
  {
78
  "epoch": 6.0,
79
+ "eval_accuracy": 0.04666666666666667,
80
+ "eval_f1": 0.5600428877769836,
81
+ "eval_loss": 0.20023241639137268,
82
+ "eval_roc_auc": 0.7222440876299687,
83
+ "eval_runtime": 4.2842,
84
+ "eval_samples_per_second": 140.05,
85
+ "eval_steps_per_second": 2.334,
86
+ "step": 1128
87
  },
88
  {
89
  "epoch": 7.0,
90
+ "eval_accuracy": 0.05,
91
+ "eval_f1": 0.5645614035087719,
92
+ "eval_loss": 0.2023993879556656,
93
+ "eval_roc_auc": 0.72737489130751,
94
+ "eval_runtime": 4.2454,
95
+ "eval_samples_per_second": 141.329,
96
+ "eval_steps_per_second": 2.355,
97
+ "step": 1316
98
  },
99
  {
100
+ "epoch": 7.98,
101
+ "learning_rate": 1.2021276595744681e-05,
102
+ "loss": 0.1685,
103
  "step": 1500
104
  },
105
  {
106
  "epoch": 8.0,
107
+ "eval_accuracy": 0.05,
108
+ "eval_f1": 0.5812987875768144,
109
+ "eval_loss": 0.20405741035938263,
110
+ "eval_roc_auc": 0.7451393429382976,
111
+ "eval_runtime": 4.2486,
112
+ "eval_samples_per_second": 141.223,
113
+ "eval_steps_per_second": 2.354,
114
+ "step": 1504
115
  },
116
  {
117
  "epoch": 9.0,
118
+ "eval_accuracy": 0.051666666666666666,
119
+ "eval_f1": 0.5782645324347093,
120
+ "eval_loss": 0.2039116472005844,
121
+ "eval_roc_auc": 0.7410205309812413,
122
+ "eval_runtime": 4.2832,
123
+ "eval_samples_per_second": 140.082,
124
+ "eval_steps_per_second": 2.335,
125
+ "step": 1692
 
 
 
 
 
 
126
  },
127
  {
128
  "epoch": 10.0,
129
+ "eval_accuracy": 0.05333333333333334,
130
+ "eval_f1": 0.5611961057023644,
131
+ "eval_loss": 0.20895147323608398,
132
+ "eval_roc_auc": 0.7272260462547598,
133
+ "eval_runtime": 4.2515,
134
+ "eval_samples_per_second": 141.128,
135
+ "eval_steps_per_second": 2.352,
136
+ "step": 1880
137
  },
138
  {
139
+ "epoch": 10.64,
140
+ "learning_rate": 9.361702127659576e-06,
141
+ "loss": 0.1481,
142
+ "step": 2000
 
 
 
 
 
143
  },
144
  {
145
+ "epoch": 11.0,
146
+ "eval_accuracy": 0.05,
147
+ "eval_f1": 0.5766101694915254,
148
+ "eval_loss": 0.20634876191616058,
149
+ "eval_roc_auc": 0.7391470139862534,
150
+ "eval_runtime": 4.2535,
151
+ "eval_samples_per_second": 141.06,
152
+ "eval_steps_per_second": 2.351,
153
+ "step": 2068
154
  },
155
  {
156
  "epoch": 12.0,
157
+ "eval_accuracy": 0.05333333333333334,
158
+ "eval_f1": 0.5601417183348095,
159
+ "eval_loss": 0.2106322944164276,
160
+ "eval_roc_auc": 0.7236795284079115,
161
+ "eval_runtime": 4.2654,
162
+ "eval_samples_per_second": 140.666,
163
+ "eval_steps_per_second": 2.344,
164
+ "step": 2256
165
  },
166
  {
167
  "epoch": 13.0,
168
+ "eval_accuracy": 0.05,
169
+ "eval_f1": 0.5558127114117857,
170
+ "eval_loss": 0.21359555423259735,
171
+ "eval_roc_auc": 0.7208235913661607,
172
+ "eval_runtime": 4.2657,
173
+ "eval_samples_per_second": 140.656,
174
+ "eval_steps_per_second": 2.344,
175
+ "step": 2444
176
  },
177
  {
178
+ "epoch": 13.3,
179
+ "learning_rate": 6.702127659574469e-06,
180
+ "loss": 0.1331,
181
+ "step": 2500
 
 
 
 
 
182
  },
183
  {
184
+ "epoch": 14.0,
185
+ "eval_accuracy": 0.04,
186
+ "eval_f1": 0.5686879068174031,
187
+ "eval_loss": 0.2141793817281723,
188
+ "eval_roc_auc": 0.7333805433804568,
189
+ "eval_runtime": 4.2245,
190
+ "eval_samples_per_second": 142.028,
191
+ "eval_steps_per_second": 2.367,
192
+ "step": 2632
193
  },
194
  {
195
  "epoch": 15.0,
196
+ "eval_accuracy": 0.058333333333333334,
197
+ "eval_f1": 0.5659075224292616,
198
+ "eval_loss": 0.21738983690738678,
199
+ "eval_roc_auc": 0.730793042125031,
200
+ "eval_runtime": 4.2924,
201
+ "eval_samples_per_second": 139.781,
202
+ "eval_steps_per_second": 2.33,
203
+ "step": 2820
204
  },
205
  {
206
+ "epoch": 15.96,
207
+ "learning_rate": 4.042553191489362e-06,
208
+ "loss": 0.1222,
209
+ "step": 3000
 
 
 
 
 
210
  },
211
  {
212
+ "epoch": 16.0,
213
+ "eval_accuracy": 0.04,
214
+ "eval_f1": 0.5679096818337325,
215
+ "eval_loss": 0.21772129833698273,
216
+ "eval_roc_auc": 0.7332271515025567,
217
+ "eval_runtime": 4.2711,
218
+ "eval_samples_per_second": 140.478,
219
+ "eval_steps_per_second": 2.341,
220
+ "step": 3008
221
  },
222
  {
223
  "epoch": 17.0,
224
+ "eval_accuracy": 0.041666666666666664,
225
+ "eval_f1": 0.5633460603956959,
226
+ "eval_loss": 0.21912114322185516,
227
+ "eval_roc_auc": 0.7285610702838653,
228
+ "eval_runtime": 4.246,
229
+ "eval_samples_per_second": 141.309,
230
+ "eval_steps_per_second": 2.355,
231
+ "step": 3196
232
  },
233
  {
234
  "epoch": 18.0,
235
+ "eval_accuracy": 0.045,
236
+ "eval_f1": 0.5691861457089235,
237
+ "eval_loss": 0.21997326612472534,
238
+ "eval_roc_auc": 0.7342966651772544,
239
+ "eval_runtime": 4.2727,
240
+ "eval_samples_per_second": 140.425,
241
+ "eval_steps_per_second": 2.34,
242
+ "step": 3384
243
  },
244
  {
245
+ "epoch": 18.62,
246
+ "learning_rate": 1.3829787234042555e-06,
247
+ "loss": 0.1156,
248
+ "step": 3500
249
  },
250
  {
251
  "epoch": 19.0,
252
+ "eval_accuracy": 0.05,
253
+ "eval_f1": 0.5648404993065187,
254
+ "eval_loss": 0.2216050773859024,
255
+ "eval_roc_auc": 0.7294638689597607,
256
+ "eval_runtime": 4.2818,
257
+ "eval_samples_per_second": 140.127,
258
+ "eval_steps_per_second": 2.335,
259
+ "step": 3572
260
  },
261
  {
262
  "epoch": 20.0,
263
+ "eval_accuracy": 0.04666666666666667,
264
+ "eval_f1": 0.5661549077108851,
265
+ "eval_loss": 0.22130462527275085,
266
+ "eval_roc_auc": 0.7309435085710135,
267
+ "eval_runtime": 4.2738,
268
+ "eval_samples_per_second": 140.39,
269
+ "eval_steps_per_second": 2.34,
270
+ "step": 3760
271
  }
272
  ],
273
+ "max_steps": 3760,
274
  "num_train_epochs": 20,
275
+ "total_flos": 1.579595742022656e+16,
276
  "trial_name": null,
277
  "trial_params": null
278
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:958ccbf5e147c249c07aac2a8acbe9a19c5128f7ab046f00ae2bebff4c73ad57
3
  size 3963
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a70ff22bb0dc7f2725e461f5d604d3e51d14bf1c277ff029b006171115f80e3
3
  size 3963