gianghoang committed on
Commit
aae29f0
·
verified ·
1 Parent(s): b43b6df

Upload folder using huggingface_hub

Browse files
checkpoint-best/config.json ADDED
@@ -0,0 +1,59 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_cross_attention": false,
3
+ "architectures": [
4
+ "RobertaForSequenceClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "bos_token_id": 0,
8
+ "classifier_dropout": null,
9
+ "dtype": "float32",
10
+ "eos_token_id": 2,
11
+ "hidden_act": "gelu",
12
+ "hidden_dropout_prob": 0.1,
13
+ "hidden_size": 768,
14
+ "id2label": {
15
+ "0": "LABEL_0",
16
+ "1": "LABEL_1",
17
+ "2": "LABEL_2",
18
+ "3": "LABEL_3",
19
+ "4": "LABEL_4",
20
+ "5": "LABEL_5",
21
+ "6": "LABEL_6",
22
+ "7": "LABEL_7",
23
+ "8": "LABEL_8",
24
+ "9": "LABEL_9",
25
+ "10": "LABEL_10",
26
+ "11": "LABEL_11"
27
+ },
28
+ "initializer_range": 0.02,
29
+ "intermediate_size": 3072,
30
+ "is_decoder": false,
31
+ "label2id": {
32
+ "LABEL_0": 0,
33
+ "LABEL_1": 1,
34
+ "LABEL_10": 10,
35
+ "LABEL_11": 11,
36
+ "LABEL_2": 2,
37
+ "LABEL_3": 3,
38
+ "LABEL_4": 4,
39
+ "LABEL_5": 5,
40
+ "LABEL_6": 6,
41
+ "LABEL_7": 7,
42
+ "LABEL_8": 8,
43
+ "LABEL_9": 9
44
+ },
45
+ "layer_norm_eps": 1e-05,
46
+ "max_position_embeddings": 514,
47
+ "model_type": "roberta",
48
+ "num_attention_heads": 12,
49
+ "num_hidden_layers": 12,
50
+ "output_past": true,
51
+ "pad_token_id": 1,
52
+ "position_embedding_type": "absolute",
53
+ "problem_type": "single_label_classification",
54
+ "tie_word_embeddings": true,
55
+ "transformers_version": "5.0.0",
56
+ "type_vocab_size": 1,
57
+ "use_cache": true,
58
+ "vocab_size": 250002
59
+ }
checkpoint-best/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d4e3e38414b5d2c5a596e0ab5c8a5f5acc78ef632ffc14bfcc0df565a52171b
3
+ size 1112235744
checkpoint-best/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29802fbac574a6343d6590c324e85b19359e6021e7e707365fea8af24e09370a
3
+ size 2224591499
checkpoint-best/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d46ebbe86cc296e0659ad6d70cc71025895e9b0ca50bf4d999e099e27ebec81
3
+ size 1465
checkpoint-best/training_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7b727449fefeba793fb9580f65c60481a8c179df5700a35433e0a1c57958712
3
+ size 2751
checkpoint-best/training_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c6825ff2f41b152453471580a04ec5538eeaf4dd13698bbd4de415e5f8f2d21
3
+ size 2751
checkpoint-best/training_2.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:685e4ad908898fc6dabeb9f80917014c1ceb588a7d791e708b50fda4ab315b81
3
+ size 2751
checkpoint-best/training_3.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee72edb116c9d6d1a49c7124a650269090702b2b5d51afab86b2f86b4a94175f
3
+ size 2751
checkpoint-best/training_6.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9daa462e2ce2191fc68c3f55ca61ae27f52fddaf0bf225dd7541ba6ab39251a1
3
+ size 2751
checkpoint-last/config.json ADDED
@@ -0,0 +1,59 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_cross_attention": false,
3
+ "architectures": [
4
+ "RobertaForSequenceClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "bos_token_id": 0,
8
+ "classifier_dropout": null,
9
+ "dtype": "float32",
10
+ "eos_token_id": 2,
11
+ "hidden_act": "gelu",
12
+ "hidden_dropout_prob": 0.1,
13
+ "hidden_size": 768,
14
+ "id2label": {
15
+ "0": "LABEL_0",
16
+ "1": "LABEL_1",
17
+ "2": "LABEL_2",
18
+ "3": "LABEL_3",
19
+ "4": "LABEL_4",
20
+ "5": "LABEL_5",
21
+ "6": "LABEL_6",
22
+ "7": "LABEL_7",
23
+ "8": "LABEL_8",
24
+ "9": "LABEL_9",
25
+ "10": "LABEL_10",
26
+ "11": "LABEL_11"
27
+ },
28
+ "initializer_range": 0.02,
29
+ "intermediate_size": 3072,
30
+ "is_decoder": false,
31
+ "label2id": {
32
+ "LABEL_0": 0,
33
+ "LABEL_1": 1,
34
+ "LABEL_10": 10,
35
+ "LABEL_11": 11,
36
+ "LABEL_2": 2,
37
+ "LABEL_3": 3,
38
+ "LABEL_4": 4,
39
+ "LABEL_5": 5,
40
+ "LABEL_6": 6,
41
+ "LABEL_7": 7,
42
+ "LABEL_8": 8,
43
+ "LABEL_9": 9
44
+ },
45
+ "layer_norm_eps": 1e-05,
46
+ "max_position_embeddings": 514,
47
+ "model_type": "roberta",
48
+ "num_attention_heads": 12,
49
+ "num_hidden_layers": 12,
50
+ "output_past": true,
51
+ "pad_token_id": 1,
52
+ "position_embedding_type": "absolute",
53
+ "problem_type": "single_label_classification",
54
+ "tie_word_embeddings": true,
55
+ "transformers_version": "5.0.0",
56
+ "type_vocab_size": 1,
57
+ "use_cache": true,
58
+ "vocab_size": 250002
59
+ }
checkpoint-last/idx_file.txt ADDED
@@ -0,0 +1 @@
 
 
1
+ 9
checkpoint-last/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c17da51ee001d45bde6fa33740a0130fb17c72c4c137b2bc371dab3e1e08f4b
3
+ size 1112235744
checkpoint-last/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a581158cea338dac724a1c78fd8a760b94b7d862818b923520ce9665f1d9ccd8
3
+ size 2224591499
checkpoint-last/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fad9d3d814422fc24594f9e6de16e4af7ee16238cef70fe96e25680c409c7157
3
+ size 1465
checkpoint-last/step_file.txt ADDED
@@ -0,0 +1 @@
 
 
1
+ 3660
config.json ADDED
@@ -0,0 +1,59 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_cross_attention": false,
3
+ "architectures": [
4
+ "RobertaForSequenceClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "bos_token_id": 0,
8
+ "classifier_dropout": null,
9
+ "dtype": "float32",
10
+ "eos_token_id": 2,
11
+ "hidden_act": "gelu",
12
+ "hidden_dropout_prob": 0.1,
13
+ "hidden_size": 768,
14
+ "id2label": {
15
+ "0": "LABEL_0",
16
+ "1": "LABEL_1",
17
+ "2": "LABEL_2",
18
+ "3": "LABEL_3",
19
+ "4": "LABEL_4",
20
+ "5": "LABEL_5",
21
+ "6": "LABEL_6",
22
+ "7": "LABEL_7",
23
+ "8": "LABEL_8",
24
+ "9": "LABEL_9",
25
+ "10": "LABEL_10",
26
+ "11": "LABEL_11"
27
+ },
28
+ "initializer_range": 0.02,
29
+ "intermediate_size": 3072,
30
+ "is_decoder": false,
31
+ "label2id": {
32
+ "LABEL_0": 0,
33
+ "LABEL_1": 1,
34
+ "LABEL_10": 10,
35
+ "LABEL_11": 11,
36
+ "LABEL_2": 2,
37
+ "LABEL_3": 3,
38
+ "LABEL_4": 4,
39
+ "LABEL_5": 5,
40
+ "LABEL_6": 6,
41
+ "LABEL_7": 7,
42
+ "LABEL_8": 8,
43
+ "LABEL_9": 9
44
+ },
45
+ "layer_norm_eps": 1e-05,
46
+ "max_position_embeddings": 514,
47
+ "model_type": "roberta",
48
+ "num_attention_heads": 12,
49
+ "num_hidden_layers": 12,
50
+ "output_past": true,
51
+ "pad_token_id": 1,
52
+ "position_embedding_type": "absolute",
53
+ "problem_type": "single_label_classification",
54
+ "tie_word_embeddings": true,
55
+ "transformers_version": "5.0.0",
56
+ "type_vocab_size": 1,
57
+ "use_cache": true,
58
+ "vocab_size": 250002
59
+ }
eval_results.txt ADDED
@@ -0,0 +1,190 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ evaluate 0
2
+ acc = 0.553315649867374
3
+ acc_and_f1_macro = 0.5036680015396735
4
+ acc_and_f1_weighted = 0.5436802384152634
5
+ class_f1 = [np.float64(nan), np.float64(0.3319148936170213), np.float64(0.419047619047619), np.float64(0.12972972972972974), np.float64(0.3037383177570093), np.float64(0.483221476510067), np.float64(0.8322147651006713), np.float64(0.7777777777777779), np.float64(0.8772378516624041), np.float64(0.38532110091743127)]
6
+ class_p = [np.float64(nan), np.float64(0.3023255813953488), np.float64(0.532258064516129), np.float64(0.5454545454545454), np.float64(0.34210526315789475), np.float64(0.37422037422037424), np.float64(0.8985507246376812), np.float64(0.7403846153846154), np.float64(0.8727735368956743), np.float64(0.29577464788732394)]
7
+ class_r = [np.float64(0.0), np.float64(0.36792452830188677), np.float64(0.34554973821989526), np.float64(0.0736196319018405), np.float64(0.27310924369747897), np.float64(0.6818181818181818), np.float64(0.775), np.float64(0.8191489361702128), np.float64(0.8817480719794345), np.float64(0.5526315789473685)]
8
+ confusion_matrix = [[ 0 4 0 4 4 27 0 0 2 1]
9
+ [ 0 78 44 2 40 42 0 0 0 6]
10
+ [ 0 87 66 0 22 13 0 0 0 3]
11
+ [ 0 14 6 12 27 94 0 0 0 10]
12
+ [ 0 45 2 0 65 108 0 0 0 18]
13
+ [ 0 30 6 4 32 180 0 0 0 12]
14
+ [ 0 0 0 0 0 0 124 18 18 0]
15
+ [ 0 0 0 0 0 0 4 154 30 0]
16
+ [ 0 0 0 0 0 0 10 36 343 0]
17
+ [ 0 0 0 0 0 17 0 0 0 21]]
18
+ f1_macro = 0.45402035321197304
19
+ f1_weighted = 0.5340448269631527
20
+ evaluate 1
21
+ acc = 0.6477453580901856
22
+ acc_and_f1_macro = 0.6109098715451384
23
+ acc_and_f1_weighted = 0.6440256663564747
24
+ class_f1 = [np.float64(nan), np.float64(0.5021645021645021), np.float64(0.7002652519893899), np.float64(0.41775456919060056), np.float64(0.41884816753926707), np.float64(0.5066666666666666), np.float64(0.8834355828220859), np.float64(0.8167539267015708), np.float64(0.8932291666666669), np.float64(0.6016260162601627)]
25
+ class_p = [np.float64(nan), np.float64(0.464), np.float64(0.7096774193548387), np.float64(0.36363636363636365), np.float64(0.5555555555555556), np.float64(0.5095785440613027), np.float64(0.8674698795180723), np.float64(0.8041237113402062), np.float64(0.9050131926121372), np.float64(0.43529411764705883)]
26
+ class_r = [np.float64(0.0), np.float64(0.5471698113207547), np.float64(0.6910994764397905), np.float64(0.49079754601226994), np.float64(0.33613445378151263), np.float64(0.5037878787878788), np.float64(0.9), np.float64(0.8297872340425532), np.float64(0.8817480719794345), np.float64(0.9736842105263158)]
27
+ confusion_matrix = [[ 0 6 0 20 3 11 0 0 2 0]
28
+ [ 0 116 42 8 16 26 0 0 0 4]
29
+ [ 0 47 132 2 2 4 0 0 0 4]
30
+ [ 0 13 2 80 31 28 0 0 0 9]
31
+ [ 0 34 4 48 80 58 0 0 0 14]
32
+ [ 0 34 6 62 12 133 0 0 0 17]
33
+ [ 0 0 0 0 0 0 144 8 8 0]
34
+ [ 0 0 0 0 0 0 6 156 26 0]
35
+ [ 0 0 0 0 0 0 16 30 343 0]
36
+ [ 0 0 0 0 0 1 0 0 0 37]]
37
+ f1_macro = 0.5740743850000912
38
+ f1_weighted = 0.6403059746227637
39
+ evaluate 2
40
+ acc = 0.6525198938992043
41
+ acc_and_f1_macro = 0.6231816753120988
42
+ acc_and_f1_weighted = 0.6521421608321463
43
+ class_f1 = [np.float64(nan), np.float64(0.46796657381615603), np.float64(0.6862745098039216), np.float64(0.39316239316239315), np.float64(0.445916114790287), np.float64(0.5543859649122808), np.float64(0.8917197452229298), np.float64(0.835978835978836), np.float64(0.907928388746803), np.float64(0.7551020408163265)]
44
+ class_p = [np.float64(nan), np.float64(0.5714285714285714), np.float64(0.9130434782608695), np.float64(0.3016393442622951), np.float64(0.4697674418604651), np.float64(0.5163398692810458), np.float64(0.9090909090909091), np.float64(0.8315789473684211), np.float64(0.9033078880407125), np.float64(0.6166666666666667)]
45
+ class_r = [np.float64(0.0), np.float64(0.39622641509433965), np.float64(0.5497382198952879), np.float64(0.5644171779141104), np.float64(0.42436974789915966), np.float64(0.5984848484848485), np.float64(0.875), np.float64(0.8404255319148937), np.float64(0.9125964010282777), np.float64(0.9736842105263158)]
46
+ confusion_matrix = [[ 0 0 0 26 6 10 0 0 0 0]
47
+ [ 0 84 8 18 44 52 0 0 0 6]
48
+ [ 0 40 105 27 11 8 0 0 0 0]
49
+ [ 0 4 0 92 32 30 0 0 0 5]
50
+ [ 0 8 0 76 101 47 0 0 0 6]
51
+ [ 0 11 2 66 21 158 0 0 0 6]
52
+ [ 0 0 0 0 0 0 140 10 10 0]
53
+ [ 0 0 0 0 0 0 2 158 28 0]
54
+ [ 0 0 0 0 0 0 12 22 355 0]
55
+ [ 0 0 0 0 0 1 0 0 0 37]]
56
+ f1_macro = 0.5938434567249933
57
+ f1_weighted = 0.6517644277650883
58
+ evaluate 3
59
+ acc = 0.6970822281167108
60
+ acc_and_f1_macro = 0.665524574862322
61
+ acc_and_f1_weighted = 0.6927153195289348
62
+ class_f1 = [np.float64(0.0909090909090909), np.float64(0.6120689655172414), np.float64(0.7507002801120448), np.float64(0.390625), np.float64(0.5487603305785124), np.float64(0.5104602510460251), np.float64(0.8944099378881988), np.float64(0.861878453038674), np.float64(0.9189873417721519), np.float64(0.7608695652173912)]
63
+ class_p = [np.float64(1.0), np.float64(0.5634920634920635), np.float64(0.8072289156626506), np.float64(0.5376344086021505), np.float64(0.45231607629427795), np.float64(0.5700934579439252), np.float64(0.8888888888888888), np.float64(0.896551724137931), np.float64(0.9052369077306733), np.float64(0.6481481481481481)]
64
+ class_r = [np.float64(0.047619047619047616), np.float64(0.6698113207547169), np.float64(0.7015706806282722), np.float64(0.3067484662576687), np.float64(0.6974789915966386), np.float64(0.4621212121212121), np.float64(0.9), np.float64(0.8297872340425532), np.float64(0.9331619537275064), np.float64(0.9210526315789473)]
65
+ confusion_matrix = [[ 2 1 2 10 14 13 0 0 0 0]
66
+ [ 0 142 14 2 38 16 0 0 0 0]
67
+ [ 0 45 134 2 6 4 0 0 0 0]
68
+ [ 0 12 6 50 67 23 0 0 0 5]
69
+ [ 0 18 4 10 166 34 0 0 0 6]
70
+ [ 0 34 6 18 76 122 0 0 0 8]
71
+ [ 0 0 0 0 0 0 144 6 10 0]
72
+ [ 0 0 0 0 0 0 4 156 28 0]
73
+ [ 0 0 0 0 0 0 14 12 363 0]
74
+ [ 0 0 0 1 0 2 0 0 0 35]]
75
+ f1_macro = 0.633966921607933
76
+ f1_weighted = 0.688348410941159
77
+ evaluate 4
78
+ acc = 0.673209549071618
79
+ acc_and_f1_macro = 0.6450619507162738
80
+ acc_and_f1_weighted = 0.6715050760798013
81
+ class_f1 = [np.float64(0.1791044776119403), np.float64(0.5851528384279476), np.float64(0.7611548556430446), np.float64(0.44880174291939), np.float64(0.46361185983827496), np.float64(0.502283105022831), np.float64(0.8819875776397514), np.float64(0.8255813953488371), np.float64(0.8985148514851486), np.float64(0.6229508196721312)]
82
+ class_p = [np.float64(0.24), np.float64(0.5447154471544715), np.float64(0.7631578947368421), np.float64(0.34797297297297297), np.float64(0.6466165413533834), np.float64(0.632183908045977), np.float64(0.8765432098765432), np.float64(0.9102564102564102), np.float64(0.8663484486873508), np.float64(0.4523809523809524)]
83
+ class_r = [np.float64(0.14285714285714285), np.float64(0.6320754716981132), np.float64(0.7591623036649214), np.float64(0.6319018404907976), np.float64(0.36134453781512604), np.float64(0.4166666666666667), np.float64(0.8875), np.float64(0.7553191489361702), np.float64(0.9331619537275064), np.float64(1.0)]
84
+ confusion_matrix = [[ 6 5 0 18 3 10 0 0 0 0]
85
+ [ 4 134 30 10 10 18 0 0 0 6]
86
+ [ 0 36 145 4 2 0 0 0 0 4]
87
+ [ 3 11 7 103 20 14 0 0 0 5]
88
+ [ 8 22 4 80 86 22 0 0 0 16]
89
+ [ 4 38 4 81 12 110 0 0 0 15]
90
+ [ 0 0 0 0 0 0 142 4 14 0]
91
+ [ 0 0 0 0 0 0 4 142 42 0]
92
+ [ 0 0 0 0 0 0 16 10 363 0]
93
+ [ 0 0 0 0 0 0 0 0 0 38]]
94
+ f1_macro = 0.6169143523609297
95
+ f1_weighted = 0.6698006030879845
96
+ evaluate 5
97
+ acc = 0.6923076923076923
98
+ acc_and_f1_macro = 0.6701551641026473
99
+ acc_and_f1_weighted = 0.6913225727110167
100
+ class_f1 = [np.float64(0.2985074626865672), np.float64(0.5936254980079683), np.float64(0.7551622418879056), np.float64(0.45925925925925926), np.float64(0.5292929292929293), np.float64(0.5220729366602688), np.float64(0.8674698795180723), np.float64(0.859504132231405), np.float64(0.9088575096277278), np.float64(0.6862745098039216)]
101
+ class_p = [np.float64(0.4), np.float64(0.5137931034482759), np.float64(0.8648648648648649), np.float64(0.5794392523364486), np.float64(0.5097276264591439), np.float64(0.5291828793774319), np.float64(0.8372093023255814), np.float64(0.8914285714285715), np.float64(0.9076923076923077), np.float64(0.546875)]
102
+ class_r = [np.float64(0.23809523809523808), np.float64(0.7028301886792453), np.float64(0.6701570680628273), np.float64(0.3803680981595092), np.float64(0.5504201680672269), np.float64(0.5151515151515151), np.float64(0.9), np.float64(0.8297872340425532), np.float64(0.910025706940874), np.float64(0.9210526315789473)]
103
+ confusion_matrix = [[ 10 3 0 11 6 12 0 0 0 0]
104
+ [ 0 149 12 4 22 21 0 0 0 4]
105
+ [ 0 51 128 0 6 4 0 0 0 2]
106
+ [ 1 20 2 62 40 33 0 0 0 5]
107
+ [ 4 29 2 14 131 50 0 0 0 8]
108
+ [ 10 38 4 15 51 136 0 0 0 10]
109
+ [ 0 0 0 0 0 0 144 6 10 0]
110
+ [ 0 0 0 0 0 0 6 156 26 0]
111
+ [ 0 0 0 0 0 0 22 13 354 0]
112
+ [ 0 0 0 1 1 1 0 0 0 35]]
113
+ f1_macro = 0.6480026358976024
114
+ f1_weighted = 0.6903374531143411
115
+ evaluate 6
116
+ acc = 0.6997347480106101
117
+ acc_and_f1_macro = 0.6746040583246593
118
+ acc_and_f1_weighted = 0.6982406833442424
119
+ class_f1 = [np.float64(0.2318840579710145), np.float64(0.6133909287257019), np.float64(0.7774798927613941), np.float64(0.48765432098765427), np.float64(0.5436105476673427), np.float64(0.5356371490280778), np.float64(0.8834355828220859), np.float64(0.8369565217391304), np.float64(0.8999999999999999), np.float64(0.6846846846846847)]
120
+ class_p = [np.float64(0.2962962962962963), np.float64(0.5657370517928287), np.float64(0.7967032967032966), np.float64(0.4906832298136646), np.float64(0.5254901960784314), np.float64(0.6231155778894473), np.float64(0.8674698795180723), np.float64(0.8555555555555555), np.float64(0.8976982097186701), np.float64(0.5205479452054794)]
121
+ class_r = [np.float64(0.19047619047619047), np.float64(0.6698113207547169), np.float64(0.7591623036649214), np.float64(0.48466257668711654), np.float64(0.5630252100840336), np.float64(0.4696969696969697), np.float64(0.9), np.float64(0.8191489361702128), np.float64(0.9023136246786633), np.float64(1.0)]
122
+ confusion_matrix = [[ 8 2 0 12 8 12 0 0 0 0]
123
+ [ 2 142 18 6 26 14 0 0 0 4]
124
+ [ 0 32 145 2 8 4 0 0 0 0]
125
+ [ 1 17 7 79 35 19 0 0 0 5]
126
+ [ 8 20 8 28 134 26 0 0 0 14]
127
+ [ 8 38 4 34 44 124 0 0 0 12]
128
+ [ 0 0 0 0 0 0 144 6 10 0]
129
+ [ 0 0 0 0 0 0 4 154 30 0]
130
+ [ 0 0 0 0 0 0 18 20 351 0]
131
+ [ 0 0 0 0 0 0 0 0 0 38]]
132
+ f1_macro = 0.6494733686387086
133
+ f1_weighted = 0.6967466186778747
134
+ evaluate 7
135
+ acc = 0.6949602122015915
136
+ acc_and_f1_macro = 0.6736449120606118
137
+ acc_and_f1_weighted = 0.6941753333487539
138
+ class_f1 = [np.float64(0.2222222222222222), np.float64(0.5967741935483871), np.float64(0.7543859649122806), np.float64(0.4745762711864407), np.float64(0.5376782077393076), np.float64(0.5404339250493096), np.float64(0.8795180722891567), np.float64(0.8421052631578947), np.float64(0.9014084507042253), np.float64(0.7741935483870966)]
139
+ class_p = [np.float64(0.26666666666666666), np.float64(0.5211267605633803), np.float64(0.8543046357615894), np.float64(0.5303030303030303), np.float64(0.5217391304347826), np.float64(0.5637860082304527), np.float64(0.8488372093023255), np.float64(0.8786127167630058), np.float64(0.8979591836734694), np.float64(0.6545454545454545)]
140
+ class_r = [np.float64(0.19047619047619047), np.float64(0.6981132075471698), np.float64(0.675392670157068), np.float64(0.4294478527607362), np.float64(0.5546218487394958), np.float64(0.5189393939393939), np.float64(0.9125), np.float64(0.8085106382978723), np.float64(0.9048843187660668), np.float64(0.9473684210526315)]
141
+ confusion_matrix = [[ 8 4 0 12 6 12 0 0 0 0]
142
+ [ 2 148 14 4 24 18 0 0 0 2]
143
+ [ 2 48 129 0 8 4 0 0 0 0]
144
+ [ 1 24 0 70 35 28 0 0 0 5]
145
+ [ 7 24 4 22 132 43 0 0 0 6]
146
+ [ 10 36 4 23 48 137 0 0 0 6]
147
+ [ 0 0 0 0 0 0 146 4 10 0]
148
+ [ 0 0 0 0 0 0 6 152 30 0]
149
+ [ 0 0 0 0 0 0 20 17 352 0]
150
+ [ 0 0 0 1 0 1 0 0 0 36]]
151
+ f1_macro = 0.652329611919632
152
+ f1_weighted = 0.6933904544959164
153
+ evaluate 8
154
+ acc = 0.6997347480106101
155
+ acc_and_f1_macro = 0.6799997041569643
156
+ acc_and_f1_weighted = 0.6995116358901213
157
+ class_f1 = [np.float64(0.2631578947368421), np.float64(0.6058091286307054), np.float64(0.76878612716763), np.float64(0.4935897435897436), np.float64(0.5210084033613446), np.float64(0.55078125), np.float64(0.8834355828220859), np.float64(0.8510638297872339), np.float64(0.9041450777202072), np.float64(0.7608695652173912)]
158
+ class_p = [np.float64(0.29411764705882354), np.float64(0.5407407407407407), np.float64(0.8580645161290322), np.float64(0.5167785234899329), np.float64(0.5210084033613446), np.float64(0.5685483870967742), np.float64(0.8674698795180723), np.float64(0.851063829787234), np.float64(0.9112271540469974), np.float64(0.6481481481481481)]
159
+ class_r = [np.float64(0.23809523809523808), np.float64(0.6886792452830188), np.float64(0.6963350785340314), np.float64(0.4723926380368098), np.float64(0.5210084033613446), np.float64(0.5340909090909091), np.float64(0.9), np.float64(0.851063829787234), np.float64(0.897172236503856), np.float64(0.9210526315789473)]
160
+ confusion_matrix = [[ 10 2 0 12 6 12 0 0 0 0]
161
+ [ 2 146 14 4 26 18 0 0 0 2]
162
+ [ 0 44 133 2 8 4 0 0 0 0]
163
+ [ 4 22 0 77 30 25 0 0 0 5]
164
+ [ 8 22 4 28 124 46 0 0 0 6]
165
+ [ 10 34 4 25 44 141 0 0 0 6]
166
+ [ 0 0 0 0 0 0 144 6 10 0]
167
+ [ 0 0 0 0 0 0 4 160 24 0]
168
+ [ 0 0 0 0 0 0 18 22 349 0]
169
+ [ 0 0 0 1 0 2 0 0 0 35]]
170
+ f1_macro = 0.6602646603033184
171
+ f1_weighted = 0.6992885237696326
172
+ evaluate 9
173
+ acc = 0.6944297082228117
174
+ acc_and_f1_macro = 0.6740689450220392
175
+ acc_and_f1_weighted = 0.6939169890732269
176
+ class_f1 = [np.float64(0.2222222222222222), np.float64(0.6033057851239669), np.float64(0.76878612716763), np.float64(0.4838709677419355), np.float64(0.5206611570247934), np.float64(0.5401174168297457), np.float64(0.8727272727272727), np.float64(0.837465564738292), np.float64(0.9014084507042253), np.float64(0.7865168539325842)]
177
+ class_p = [np.float64(0.26666666666666666), np.float64(0.5367647058823529), np.float64(0.8580645161290322), np.float64(0.5102040816326531), np.float64(0.5121951219512195), np.float64(0.5587044534412956), np.float64(0.8470588235294118), np.float64(0.8685714285714285), np.float64(0.8979591836734694), np.float64(0.6862745098039216)]
178
+ class_r = [np.float64(0.19047619047619047), np.float64(0.6886792452830188), np.float64(0.6963350785340314), np.float64(0.4601226993865031), np.float64(0.5294117647058824), np.float64(0.5227272727272727), np.float64(0.9), np.float64(0.8085106382978723), np.float64(0.9048843187660668), np.float64(0.9210526315789473)]
179
+ confusion_matrix = [[ 8 2 0 12 6 14 0 0 0 0]
180
+ [ 2 146 14 4 26 18 0 0 0 2]
181
+ [ 0 44 133 2 8 4 0 0 0 0]
182
+ [ 4 22 0 75 32 25 0 0 0 5]
183
+ [ 8 22 4 26 126 46 0 0 0 6]
184
+ [ 8 36 4 27 48 138 0 0 0 3]
185
+ [ 0 0 0 0 0 0 144 6 10 0]
186
+ [ 0 0 0 0 0 0 6 152 30 0]
187
+ [ 0 0 0 0 0 0 20 17 352 0]
188
+ [ 0 0 0 1 0 2 0 0 0 35]]
189
+ f1_macro = 0.6537081818212667
190
+ f1_weighted = 0.6934042699236419
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c17da51ee001d45bde6fa33740a0130fb17c72c4c137b2bc371dab3e1e08f4b
3
+ size 1112235744
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "backend": "tokenizers",
4
+ "bos_token": "<s>",
5
+ "clean_up_tokenization_spaces": true,
6
+ "cls_token": "<s>",
7
+ "do_lower_case": false,
8
+ "eos_token": "</s>",
9
+ "errors": "replace",
10
+ "is_local": false,
11
+ "mask_token": "<mask>",
12
+ "model_max_length": 512,
13
+ "pad_token": "<pad>",
14
+ "sep_token": "</s>",
15
+ "tokenizer_class": "RobertaTokenizer",
16
+ "trim_offsets": true,
17
+ "unk_token": "<unk>"
18
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8326842a5c7bc2e1e489f64889cf28cc938f2cec75e85efaba88b54ffa77d2b0
3
+ size 2769