gianghoang committed on
Commit
e7d8539
·
verified ·
1 Parent(s): ed42a5e

Upload folder using huggingface_hub

Browse files
checkpoint-best/config.json ADDED
@@ -0,0 +1,57 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_cross_attention": false,
3
+ "architectures": [
4
+ "RobertaForSequenceClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "bos_token_id": 0,
8
+ "classifier_dropout": null,
9
+ "dtype": "float32",
10
+ "eos_token_id": 2,
11
+ "hidden_act": "gelu",
12
+ "hidden_dropout_prob": 0.1,
13
+ "hidden_size": 768,
14
+ "id2label": {
15
+ "0": "LABEL_0",
16
+ "1": "LABEL_1",
17
+ "2": "LABEL_2",
18
+ "3": "LABEL_3",
19
+ "4": "LABEL_4",
20
+ "5": "LABEL_5",
21
+ "6": "LABEL_6",
22
+ "7": "LABEL_7",
23
+ "8": "LABEL_8",
24
+ "9": "LABEL_9",
25
+ "10": "LABEL_10",
26
+ "11": "LABEL_11"
27
+ },
28
+ "initializer_range": 0.02,
29
+ "intermediate_size": 3072,
30
+ "is_decoder": false,
31
+ "label2id": {
32
+ "LABEL_0": 0,
33
+ "LABEL_1": 1,
34
+ "LABEL_10": 10,
35
+ "LABEL_11": 11,
36
+ "LABEL_2": 2,
37
+ "LABEL_3": 3,
38
+ "LABEL_4": 4,
39
+ "LABEL_5": 5,
40
+ "LABEL_6": 6,
41
+ "LABEL_7": 7,
42
+ "LABEL_8": 8,
43
+ "LABEL_9": 9
44
+ },
45
+ "layer_norm_eps": 1e-05,
46
+ "max_position_embeddings": 514,
47
+ "model_type": "roberta",
48
+ "num_attention_heads": 12,
49
+ "num_hidden_layers": 12,
50
+ "pad_token_id": 1,
51
+ "problem_type": "single_label_classification",
52
+ "tie_word_embeddings": true,
53
+ "transformers_version": "5.0.0",
54
+ "type_vocab_size": 1,
55
+ "use_cache": true,
56
+ "vocab_size": 50265
57
+ }
checkpoint-best/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a140abc72f23acfeee6403f1947d24d20561863739a3f656b9ff4920a8be9e2e
3
+ size 498643560
checkpoint-best/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7aad3e98c8ecedd550a192588c2746a7ba4aabfc7f50754a21ee67c69f1566cd
3
+ size 997407371
checkpoint-best/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fad9d3d814422fc24594f9e6de16e4af7ee16238cef70fe96e25680c409c7157
3
+ size 1465
checkpoint-best/training_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5421dc4775b16b532e493cc5b1b5fa8ff4c9ffa5872a5ea2e2f4b27eb6c57077
3
+ size 2751
checkpoint-best/training_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:445cddfdf17199d8777e5d8761543e7476a4bfe707817856d05eacc24c64b8fc
3
+ size 2751
checkpoint-best/training_9.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fd12dd4427cd491d86b3c563f6bc60950d124f5d77d03d7ff3c8d6a1fc329486
3
+ size 2751
checkpoint-last/config.json ADDED
@@ -0,0 +1,57 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_cross_attention": false,
3
+ "architectures": [
4
+ "RobertaForSequenceClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "bos_token_id": 0,
8
+ "classifier_dropout": null,
9
+ "dtype": "float32",
10
+ "eos_token_id": 2,
11
+ "hidden_act": "gelu",
12
+ "hidden_dropout_prob": 0.1,
13
+ "hidden_size": 768,
14
+ "id2label": {
15
+ "0": "LABEL_0",
16
+ "1": "LABEL_1",
17
+ "2": "LABEL_2",
18
+ "3": "LABEL_3",
19
+ "4": "LABEL_4",
20
+ "5": "LABEL_5",
21
+ "6": "LABEL_6",
22
+ "7": "LABEL_7",
23
+ "8": "LABEL_8",
24
+ "9": "LABEL_9",
25
+ "10": "LABEL_10",
26
+ "11": "LABEL_11"
27
+ },
28
+ "initializer_range": 0.02,
29
+ "intermediate_size": 3072,
30
+ "is_decoder": false,
31
+ "label2id": {
32
+ "LABEL_0": 0,
33
+ "LABEL_1": 1,
34
+ "LABEL_10": 10,
35
+ "LABEL_11": 11,
36
+ "LABEL_2": 2,
37
+ "LABEL_3": 3,
38
+ "LABEL_4": 4,
39
+ "LABEL_5": 5,
40
+ "LABEL_6": 6,
41
+ "LABEL_7": 7,
42
+ "LABEL_8": 8,
43
+ "LABEL_9": 9
44
+ },
45
+ "layer_norm_eps": 1e-05,
46
+ "max_position_embeddings": 514,
47
+ "model_type": "roberta",
48
+ "num_attention_heads": 12,
49
+ "num_hidden_layers": 12,
50
+ "pad_token_id": 1,
51
+ "problem_type": "single_label_classification",
52
+ "tie_word_embeddings": true,
53
+ "transformers_version": "5.0.0",
54
+ "type_vocab_size": 1,
55
+ "use_cache": true,
56
+ "vocab_size": 50265
57
+ }
checkpoint-last/idx_file.txt ADDED
@@ -0,0 +1 @@
 
 
1
+ 9
checkpoint-last/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a140abc72f23acfeee6403f1947d24d20561863739a3f656b9ff4920a8be9e2e
3
+ size 498643560
checkpoint-last/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7aad3e98c8ecedd550a192588c2746a7ba4aabfc7f50754a21ee67c69f1566cd
3
+ size 997407371
checkpoint-last/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fad9d3d814422fc24594f9e6de16e4af7ee16238cef70fe96e25680c409c7157
3
+ size 1465
checkpoint-last/step_file.txt ADDED
@@ -0,0 +1 @@
 
 
1
+ 3660
config.json ADDED
@@ -0,0 +1,57 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_cross_attention": false,
3
+ "architectures": [
4
+ "RobertaForSequenceClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "bos_token_id": 0,
8
+ "classifier_dropout": null,
9
+ "dtype": "float32",
10
+ "eos_token_id": 2,
11
+ "hidden_act": "gelu",
12
+ "hidden_dropout_prob": 0.1,
13
+ "hidden_size": 768,
14
+ "id2label": {
15
+ "0": "LABEL_0",
16
+ "1": "LABEL_1",
17
+ "2": "LABEL_2",
18
+ "3": "LABEL_3",
19
+ "4": "LABEL_4",
20
+ "5": "LABEL_5",
21
+ "6": "LABEL_6",
22
+ "7": "LABEL_7",
23
+ "8": "LABEL_8",
24
+ "9": "LABEL_9",
25
+ "10": "LABEL_10",
26
+ "11": "LABEL_11"
27
+ },
28
+ "initializer_range": 0.02,
29
+ "intermediate_size": 3072,
30
+ "is_decoder": false,
31
+ "label2id": {
32
+ "LABEL_0": 0,
33
+ "LABEL_1": 1,
34
+ "LABEL_10": 10,
35
+ "LABEL_11": 11,
36
+ "LABEL_2": 2,
37
+ "LABEL_3": 3,
38
+ "LABEL_4": 4,
39
+ "LABEL_5": 5,
40
+ "LABEL_6": 6,
41
+ "LABEL_7": 7,
42
+ "LABEL_8": 8,
43
+ "LABEL_9": 9
44
+ },
45
+ "layer_norm_eps": 1e-05,
46
+ "max_position_embeddings": 514,
47
+ "model_type": "roberta",
48
+ "num_attention_heads": 12,
49
+ "num_hidden_layers": 12,
50
+ "pad_token_id": 1,
51
+ "problem_type": "single_label_classification",
52
+ "tie_word_embeddings": true,
53
+ "transformers_version": "5.0.0",
54
+ "type_vocab_size": 1,
55
+ "use_cache": true,
56
+ "vocab_size": 50265
57
+ }
eval_results.txt ADDED
@@ -0,0 +1,190 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ evaluate 0
2
+ acc = 0.7474801061007957
3
+ acc_and_f1_macro = 0.7048938434748613
4
+ acc_and_f1_weighted = 0.739449319460284
5
+ class_f1 = [np.float64(nan), np.float64(0.7238493723849372), np.float64(0.7958656330749354), np.float64(0.3373493975903614), np.float64(0.6004415011037526), np.float64(0.6722689075630252), np.float64(0.9182389937106918), np.float64(0.8677248677248677), np.float64(0.9201030927835051), np.float64(0.7872340425531915)]
6
+ class_p = [np.float64(nan), np.float64(0.650375939849624), np.float64(0.7857142857142857), np.float64(0.4883720930232558), np.float64(0.6325581395348837), np.float64(0.6042296072507553), np.float64(0.9240506329113924), np.float64(0.8631578947368421), np.float64(0.9224806201550387), np.float64(0.6607142857142857)]
7
+ class_r = [np.float64(0.0), np.float64(0.8160377358490566), np.float64(0.806282722513089), np.float64(0.25766871165644173), np.float64(0.5714285714285714), np.float64(0.7575757575757576), np.float64(0.9125), np.float64(0.8723404255319149), np.float64(0.9177377892030848), np.float64(0.9736842105263158)]
8
+ confusion_matrix = [[ 0 8 0 12 2 20 0 0 0 0]
9
+ [ 0 173 23 0 2 14 0 0 0 0]
10
+ [ 0 31 154 2 2 0 0 0 0 2]
11
+ [ 0 15 8 42 50 46 0 0 0 2]
12
+ [ 0 22 4 14 136 50 0 0 0 12]
13
+ [ 0 15 7 16 23 200 0 0 0 3]
14
+ [ 0 2 0 0 0 0 146 4 8 0]
15
+ [ 0 0 0 0 0 0 2 164 22 0]
16
+ [ 0 0 0 0 0 0 10 22 357 0]
17
+ [ 0 0 0 0 0 1 0 0 0 37]]
18
+ f1_macro = 0.6623075808489268
19
+ f1_weighted = 0.7314185328197723
20
+ evaluate 1
21
+ acc = 0.7618037135278515
22
+ acc_and_f1_macro = 0.7229381973826235
23
+ acc_and_f1_weighted = 0.7575460583049605
24
+ class_f1 = [np.float64(nan), np.float64(0.7421686746987951), np.float64(0.7999999999999999), np.float64(0.4999999999999999), np.float64(0.5740740740740741), np.float64(0.6946308724832215), np.float64(0.925925925925926), np.float64(0.8844221105527638), np.float64(0.936), np.float64(0.7835051546391751)]
25
+ class_p = [np.float64(nan), np.float64(0.7586206896551724), np.float64(0.8042328042328042), np.float64(0.48554913294797686), np.float64(0.6391752577319587), np.float64(0.6234939759036144), np.float64(0.9146341463414634), np.float64(0.8380952380952381), np.float64(0.9722991689750693), np.float64(0.6440677966101694)]
26
+ class_r = [np.float64(0.0), np.float64(0.7264150943396226), np.float64(0.7958115183246073), np.float64(0.5153374233128835), np.float64(0.5210084033613446), np.float64(0.7840909090909091), np.float64(0.9375), np.float64(0.9361702127659575), np.float64(0.9023136246786633), np.float64(1.0)]
27
+ confusion_matrix = [[ 0 5 0 16 5 16 0 0 0 0]
28
+ [ 0 154 22 0 8 26 0 0 0 2]
29
+ [ 0 18 152 8 7 2 0 0 0 4]
30
+ [ 0 4 7 84 38 26 0 0 0 4]
31
+ [ 0 14 4 33 124 55 0 0 0 8]
32
+ [ 0 6 4 32 12 207 0 0 0 3]
33
+ [ 0 2 0 0 0 0 150 6 2 0]
34
+ [ 0 0 0 0 0 0 4 176 8 0]
35
+ [ 0 0 0 0 0 0 10 28 351 0]
36
+ [ 0 0 0 0 0 0 0 0 0 38]]
37
+ f1_macro = 0.6840726812373956
38
+ f1_weighted = 0.7532884030820696
39
+ evaluate 2
40
+ acc = 0.7522546419098143
41
+ acc_and_f1_macro = 0.7302639191012046
42
+ acc_and_f1_weighted = 0.7514893569292973
43
+ class_f1 = [np.float64(0.25806451612903225), np.float64(0.7196261682242991), np.float64(0.7799442896935934), np.float64(0.4675324675324675), np.float64(0.6061705989110707), np.float64(0.6561264822134387), np.float64(0.9308176100628932), np.float64(0.8730964467005077), np.float64(0.9342105263157896), np.float64(0.8571428571428571)]
44
+ class_p = [np.float64(0.4), np.float64(0.7129629629629629), np.float64(0.8333333333333334), np.float64(0.496551724137931), np.float64(0.5335463258785943), np.float64(0.6859504132231405), np.float64(0.9367088607594937), np.float64(0.8349514563106796), np.float64(0.9568733153638814), np.float64(0.782608695652174)]
45
+ class_r = [np.float64(0.19047619047619047), np.float64(0.7264150943396226), np.float64(0.7329842931937173), np.float64(0.44171779141104295), np.float64(0.7016806722689075), np.float64(0.6287878787878788), np.float64(0.925), np.float64(0.9148936170212766), np.float64(0.9125964010282777), np.float64(0.9473684210526315)]
46
+ confusion_matrix = [[ 8 4 0 10 8 12 0 0 0 0]
47
+ [ 4 154 14 2 18 20 0 0 0 0]
48
+ [ 0 31 140 8 8 2 0 0 0 2]
49
+ [ 4 7 6 72 58 12 0 0 0 4]
50
+ [ 0 12 4 25 167 28 0 0 0 2]
51
+ [ 4 6 4 28 54 166 0 0 0 2]
52
+ [ 0 2 0 0 0 0 148 8 2 0]
53
+ [ 0 0 0 0 0 0 2 172 14 0]
54
+ [ 0 0 0 0 0 0 8 26 355 0]
55
+ [ 0 0 0 0 0 2 0 0 0 36]]
56
+ f1_macro = 0.7082731962925949
57
+ f1_weighted = 0.7507240719487804
58
+ evaluate 3
59
+ acc = 0.7480106100795756
60
+ acc_and_f1_macro = 0.7216309782116379
61
+ acc_and_f1_weighted = 0.745009762685597
62
+ class_f1 = [np.float64(0.2), np.float64(0.7132867132867132), np.float64(0.7570621468926554), np.float64(0.43262411347517726), np.float64(0.6058091286307054), np.float64(0.6898839137645107), np.float64(0.9230769230769231), np.float64(0.8471849865951742), np.float64(0.9199491740787803), np.float64(0.8636363636363636)]
63
+ class_p = [np.float64(0.3333333333333333), np.float64(0.7050691244239631), np.float64(0.8220858895705522), np.float64(0.5126050420168067), np.float64(0.5983606557377049), np.float64(0.6135693215339233), np.float64(0.9473684210526315), np.float64(0.8540540540540541), np.float64(0.9095477386934674), np.float64(0.76)]
64
+ class_r = [np.float64(0.14285714285714285), np.float64(0.7216981132075472), np.float64(0.7015706806282722), np.float64(0.37423312883435583), np.float64(0.6134453781512605), np.float64(0.7878787878787878), np.float64(0.9), np.float64(0.8404255319148937), np.float64(0.9305912596401028), np.float64(1.0)]
65
+ confusion_matrix = [[ 6 4 0 10 6 16 0 0 0 0]
66
+ [ 4 153 15 2 12 26 0 0 0 0]
67
+ [ 2 32 134 7 10 2 0 0 0 4]
68
+ [ 4 8 6 61 44 36 0 0 0 4]
69
+ [ 0 12 4 21 146 51 0 0 0 4]
70
+ [ 2 6 4 18 26 208 0 0 0 0]
71
+ [ 0 2 0 0 0 0 144 6 8 0]
72
+ [ 0 0 0 0 0 0 2 158 28 0]
73
+ [ 0 0 0 0 0 0 6 21 362 0]
74
+ [ 0 0 0 0 0 0 0 0 0 38]]
75
+ f1_macro = 0.6952513463437002
76
+ f1_weighted = 0.7420089152916185
77
+ evaluate 4
78
+ acc = 0.7554376657824934
79
+ acc_and_f1_macro = 0.7299251289757365
80
+ acc_and_f1_weighted = 0.7534075021522451
81
+ class_f1 = [np.float64(0.16666666666666666), np.float64(0.7403846153846154), np.float64(0.8021390374331551), np.float64(0.4563758389261745), np.float64(0.5755395683453237), np.float64(0.678095238095238), np.float64(0.925), np.float64(0.8783068783068785), np.float64(0.9300518134715026), np.float64(0.891566265060241)]
82
+ class_p = [np.float64(0.6666666666666666), np.float64(0.7549019607843137), np.float64(0.819672131147541), np.float64(0.5037037037037037), np.float64(0.5031446540880503), np.float64(0.6819923371647509), np.float64(0.925), np.float64(0.8736842105263158), np.float64(0.9373368146214099), np.float64(0.8222222222222222)]
83
+ class_r = [np.float64(0.09523809523809523), np.float64(0.7264150943396226), np.float64(0.7853403141361257), np.float64(0.4171779141104294), np.float64(0.6722689075630253), np.float64(0.6742424242424242), np.float64(0.925), np.float64(0.8829787234042553), np.float64(0.922879177377892), np.float64(0.9736842105263158)]
84
+ confusion_matrix = [[ 4 4 0 12 8 14 0 0 0 0]
85
+ [ 2 154 16 4 20 16 0 0 0 0]
86
+ [ 0 20 150 3 12 4 0 0 0 2]
87
+ [ 0 6 7 68 62 16 0 0 0 4]
88
+ [ 0 12 4 28 160 32 0 0 0 2]
89
+ [ 0 8 6 20 52 178 0 0 0 0]
90
+ [ 0 0 0 0 2 0 148 6 4 0]
91
+ [ 0 0 0 0 0 0 2 166 20 0]
92
+ [ 0 0 0 0 2 0 10 18 359 0]
93
+ [ 0 0 0 0 0 1 0 0 0 37]]
94
+ f1_macro = 0.7044125921689796
95
+ f1_weighted = 0.7513773385219968
96
+ evaluate 5
97
+ acc = 0.7586206896551724
98
+ acc_and_f1_macro = 0.7333208161673415
99
+ acc_and_f1_weighted = 0.7566757125566077
100
+ class_f1 = [np.float64(0.16), np.float64(0.7464114832535885), np.float64(0.7914438502673796), np.float64(0.4814814814814815), np.float64(0.5988483685220729), np.float64(0.6994328922495274), np.float64(0.9240506329113924), np.float64(0.8524590163934426), np.float64(0.9213197969543147), np.float64(0.9047619047619047)]
101
+ class_p = [np.float64(0.5), np.float64(0.7572815533980582), np.float64(0.8087431693989071), np.float64(0.484472049689441), np.float64(0.5512367491166078), np.float64(0.6981132075471698), np.float64(0.9358974358974359), np.float64(0.8764044943820225), np.float64(0.9097744360902256), np.float64(0.8260869565217391)]
102
+ class_r = [np.float64(0.09523809523809523), np.float64(0.7358490566037735), np.float64(0.774869109947644), np.float64(0.4785276073619632), np.float64(0.6554621848739496), np.float64(0.7007575757575758), np.float64(0.9125), np.float64(0.8297872340425532), np.float64(0.9331619537275064), np.float64(1.0)]
103
+ confusion_matrix = [[ 4 4 0 16 4 14 0 0 0 0]
104
+ [ 2 156 18 4 16 16 0 0 0 0]
105
+ [ 0 20 148 5 12 4 0 0 0 2]
106
+ [ 2 6 7 78 52 14 0 0 0 4]
107
+ [ 0 12 4 32 156 32 0 0 0 2]
108
+ [ 0 8 6 26 39 185 0 0 0 0]
109
+ [ 0 0 0 0 2 0 146 6 6 0]
110
+ [ 0 0 0 0 0 0 2 156 30 0]
111
+ [ 0 0 0 0 2 0 8 16 363 0]
112
+ [ 0 0 0 0 0 0 0 0 0 38]]
113
+ f1_macro = 0.7080209426795105
114
+ f1_weighted = 0.7547307354580429
115
+ evaluate 6
116
+ acc = 0.7564986737400531
117
+ acc_and_f1_macro = 0.7311158097126855
118
+ acc_and_f1_weighted = 0.7542026248283529
119
+ class_f1 = [np.float64(0.16666666666666666), np.float64(0.7403846153846154), np.float64(0.7956989247311829), np.float64(0.46302250803858525), np.float64(0.5939849624060151), np.float64(0.6990654205607477), np.float64(0.925), np.float64(0.8478260869565217), np.float64(0.9209183673469388), np.float64(0.9047619047619047)]
120
+ class_p = [np.float64(0.6666666666666666), np.float64(0.7549019607843137), np.float64(0.8176795580110497), np.float64(0.4864864864864865), np.float64(0.5374149659863946), np.float64(0.6900369003690037), np.float64(0.925), np.float64(0.8666666666666667), np.float64(0.9139240506329114), np.float64(0.8260869565217391)]
121
+ class_r = [np.float64(0.09523809523809523), np.float64(0.7264150943396226), np.float64(0.774869109947644), np.float64(0.44171779141104295), np.float64(0.6638655462184874), np.float64(0.7083333333333334), np.float64(0.925), np.float64(0.8297872340425532), np.float64(0.9280205655526992), np.float64(1.0)]
122
+ confusion_matrix = [[ 4 4 0 15 5 14 0 0 0 0]
123
+ [ 2 154 16 4 20 16 0 0 0 0]
124
+ [ 0 22 148 3 12 4 0 0 0 2]
125
+ [ 0 6 7 72 56 18 0 0 0 4]
126
+ [ 0 12 4 30 158 32 0 0 0 2]
127
+ [ 0 6 6 24 41 187 0 0 0 0]
128
+ [ 0 0 0 0 2 0 148 6 4 0]
129
+ [ 0 0 0 0 0 0 2 156 30 0]
130
+ [ 0 0 0 0 0 0 10 18 361 0]
131
+ [ 0 0 0 0 0 0 0 0 0 38]]
132
+ f1_macro = 0.7057329456853179
133
+ f1_weighted = 0.7519065759166527
134
+ evaluate 7
135
+ acc = 0.7580901856763925
136
+ acc_and_f1_macro = 0.732903294943322
137
+ acc_and_f1_weighted = 0.7560980300675524
138
+ class_f1 = [np.float64(0.16), np.float64(0.7499999999999999), np.float64(0.8), np.float64(0.48253968253968255), np.float64(0.5928705440900564), np.float64(0.7018867924528303), np.float64(0.925), np.float64(0.8415300546448087), np.float64(0.9185750636132316), np.float64(0.9047619047619047)]
139
+ class_p = [np.float64(0.5), np.float64(0.7647058823529411), np.float64(0.8268156424581006), np.float64(0.5), np.float64(0.535593220338983), np.float64(0.6992481203007519), np.float64(0.925), np.float64(0.8651685393258427), np.float64(0.9093198992443325), np.float64(0.8260869565217391)]
140
+ class_r = [np.float64(0.09523809523809523), np.float64(0.7358490566037735), np.float64(0.774869109947644), np.float64(0.4662576687116564), np.float64(0.6638655462184874), np.float64(0.7045454545454546), np.float64(0.925), np.float64(0.8191489361702128), np.float64(0.9280205655526992), np.float64(1.0)]
141
+ confusion_matrix = [[ 4 4 0 15 5 14 0 0 0 0]
142
+ [ 2 156 14 4 20 16 0 0 0 0]
143
+ [ 0 22 148 3 12 4 0 0 0 2]
144
+ [ 2 6 7 76 54 14 0 0 0 4]
145
+ [ 0 12 4 30 158 32 0 0 0 2]
146
+ [ 0 4 6 24 44 186 0 0 0 0]
147
+ [ 0 0 0 0 2 0 148 6 4 0]
148
+ [ 0 0 0 0 0 0 2 154 32 0]
149
+ [ 0 0 0 0 0 0 10 18 361 0]
150
+ [ 0 0 0 0 0 0 0 0 0 38]]
151
+ f1_macro = 0.7077164042102514
152
+ f1_weighted = 0.7541058744587121
153
+ evaluate 8
154
+ acc = 0.7618037135278515
155
+ acc_and_f1_macro = 0.7323228184279761
156
+ acc_and_f1_weighted = 0.7590034977915698
157
+ class_f1 = [np.float64(0.08695652173913042), np.float64(0.7523809523809523), np.float64(0.8043478260869565), np.float64(0.4705882352941177), np.float64(0.5981308411214953), np.float64(0.6964618249534452), np.float64(0.925), np.float64(0.8601036269430052), np.float64(0.9296874999999999), np.float64(0.9047619047619047)]
158
+ class_p = [np.float64(0.5), np.float64(0.7596153846153846), np.float64(0.8361581920903954), np.float64(0.5034965034965035), np.float64(0.5387205387205387), np.float64(0.684981684981685), np.float64(0.925), np.float64(0.8383838383838383), np.float64(0.941952506596306), np.float64(0.8260869565217391)]
159
+ class_r = [np.float64(0.047619047619047616), np.float64(0.7452830188679245), np.float64(0.774869109947644), np.float64(0.44171779141104295), np.float64(0.6722689075630253), np.float64(0.7083333333333334), np.float64(0.925), np.float64(0.8829787234042553), np.float64(0.9177377892030848), np.float64(1.0)]
160
+ confusion_matrix = [[ 2 4 0 12 8 16 0 0 0 0]
161
+ [ 2 158 14 4 18 16 0 0 0 0]
162
+ [ 0 22 148 3 12 4 0 0 0 2]
163
+ [ 0 7 6 72 56 18 0 0 0 4]
164
+ [ 0 12 4 28 160 32 0 0 0 2]
165
+ [ 0 5 5 24 43 187 0 0 0 0]
166
+ [ 0 0 0 0 0 0 148 10 2 0]
167
+ [ 0 0 0 0 0 0 2 166 20 0]
168
+ [ 0 0 0 0 0 0 10 22 357 0]
169
+ [ 0 0 0 0 0 0 0 0 0 38]]
170
+ f1_macro = 0.7028419233281007
171
+ f1_weighted = 0.7562032820552881
172
+ evaluate 9
173
+ acc = 0.7644562334217506
174
+ acc_and_f1_macro = 0.7386967474391453
175
+ acc_and_f1_weighted = 0.7625543782840718
176
+ class_f1 = [np.float64(0.16), np.float64(0.7541766109785202), np.float64(0.802168021680217), np.float64(0.48253968253968255), np.float64(0.5951035781544257), np.float64(0.7018867924528303), np.float64(0.925), np.float64(0.8736842105263158), np.float64(0.9300518134715026), np.float64(0.9047619047619047)]
177
+ class_p = [np.float64(0.5), np.float64(0.7632850241545893), np.float64(0.8314606741573034), np.float64(0.5), np.float64(0.5392491467576792), np.float64(0.6992481203007519), np.float64(0.925), np.float64(0.8645833333333334), np.float64(0.9373368146214099), np.float64(0.8260869565217391)]
178
+ class_r = [np.float64(0.09523809523809523), np.float64(0.7452830188679245), np.float64(0.774869109947644), np.float64(0.4662576687116564), np.float64(0.6638655462184874), np.float64(0.7045454545454546), np.float64(0.925), np.float64(0.8829787234042553), np.float64(0.922879177377892), np.float64(1.0)]
179
+ confusion_matrix = [[ 4 4 0 15 5 14 0 0 0 0]
180
+ [ 2 158 14 4 18 16 0 0 0 0]
181
+ [ 0 22 148 3 12 4 0 0 0 2]
182
+ [ 2 6 7 76 54 14 0 0 0 4]
183
+ [ 0 12 4 30 158 32 0 0 0 2]
184
+ [ 0 5 5 24 44 186 0 0 0 0]
185
+ [ 0 0 0 0 2 0 148 6 4 0]
186
+ [ 0 0 0 0 0 0 2 166 20 0]
187
+ [ 0 0 0 0 0 0 10 20 359 0]
188
+ [ 0 0 0 0 0 0 0 0 0 38]]
189
+ f1_macro = 0.7129372614565399
190
+ f1_weighted = 0.760652523146393
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a140abc72f23acfeee6403f1947d24d20561863739a3f656b9ff4920a8be9e2e
3
+ size 498643560
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,17 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "backend": "tokenizers",
4
+ "bos_token": "<s>",
5
+ "cls_token": "<s>",
6
+ "do_lower_case": false,
7
+ "eos_token": "</s>",
8
+ "errors": "replace",
9
+ "is_local": false,
10
+ "mask_token": "<mask>",
11
+ "model_max_length": 512,
12
+ "pad_token": "<pad>",
13
+ "sep_token": "</s>",
14
+ "tokenizer_class": "RobertaTokenizer",
15
+ "trim_offsets": true,
16
+ "unk_token": "<unk>"
17
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:06e90bba594a67858fbed551759bbc8d67acfcba7a9da07f7dbf1cd75c77ce1e
3
+ size 2769