Upload folder using huggingface_hub
Browse files- checkpoint-best/config.json +57 -0
- checkpoint-best/model.safetensors +3 -0
- checkpoint-best/optimizer.pt +3 -0
- checkpoint-best/scheduler.pt +3 -0
- checkpoint-best/training_0.bin +3 -0
- checkpoint-best/training_1.bin +3 -0
- checkpoint-best/training_9.bin +3 -0
- checkpoint-last/config.json +57 -0
- checkpoint-last/idx_file.txt +1 -0
- checkpoint-last/model.safetensors +3 -0
- checkpoint-last/optimizer.pt +3 -0
- checkpoint-last/scheduler.pt +3 -0
- checkpoint-last/step_file.txt +1 -0
- config.json +57 -0
- eval_results.txt +190 -0
- model.safetensors +3 -0
- tokenizer.json +0 -0
- tokenizer_config.json +17 -0
- training_args.bin +3 -0
checkpoint-best/config.json
ADDED
|
@@ -0,0 +1,57 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"add_cross_attention": false,
|
| 3 |
+
"architectures": [
|
| 4 |
+
"RobertaForSequenceClassification"
|
| 5 |
+
],
|
| 6 |
+
"attention_probs_dropout_prob": 0.1,
|
| 7 |
+
"bos_token_id": 0,
|
| 8 |
+
"classifier_dropout": null,
|
| 9 |
+
"dtype": "float32",
|
| 10 |
+
"eos_token_id": 2,
|
| 11 |
+
"hidden_act": "gelu",
|
| 12 |
+
"hidden_dropout_prob": 0.1,
|
| 13 |
+
"hidden_size": 768,
|
| 14 |
+
"id2label": {
|
| 15 |
+
"0": "LABEL_0",
|
| 16 |
+
"1": "LABEL_1",
|
| 17 |
+
"2": "LABEL_2",
|
| 18 |
+
"3": "LABEL_3",
|
| 19 |
+
"4": "LABEL_4",
|
| 20 |
+
"5": "LABEL_5",
|
| 21 |
+
"6": "LABEL_6",
|
| 22 |
+
"7": "LABEL_7",
|
| 23 |
+
"8": "LABEL_8",
|
| 24 |
+
"9": "LABEL_9",
|
| 25 |
+
"10": "LABEL_10",
|
| 26 |
+
"11": "LABEL_11"
|
| 27 |
+
},
|
| 28 |
+
"initializer_range": 0.02,
|
| 29 |
+
"intermediate_size": 3072,
|
| 30 |
+
"is_decoder": false,
|
| 31 |
+
"label2id": {
|
| 32 |
+
"LABEL_0": 0,
|
| 33 |
+
"LABEL_1": 1,
|
| 34 |
+
"LABEL_10": 10,
|
| 35 |
+
"LABEL_11": 11,
|
| 36 |
+
"LABEL_2": 2,
|
| 37 |
+
"LABEL_3": 3,
|
| 38 |
+
"LABEL_4": 4,
|
| 39 |
+
"LABEL_5": 5,
|
| 40 |
+
"LABEL_6": 6,
|
| 41 |
+
"LABEL_7": 7,
|
| 42 |
+
"LABEL_8": 8,
|
| 43 |
+
"LABEL_9": 9
|
| 44 |
+
},
|
| 45 |
+
"layer_norm_eps": 1e-05,
|
| 46 |
+
"max_position_embeddings": 514,
|
| 47 |
+
"model_type": "roberta",
|
| 48 |
+
"num_attention_heads": 12,
|
| 49 |
+
"num_hidden_layers": 12,
|
| 50 |
+
"pad_token_id": 1,
|
| 51 |
+
"problem_type": "single_label_classification",
|
| 52 |
+
"tie_word_embeddings": true,
|
| 53 |
+
"transformers_version": "5.0.0",
|
| 54 |
+
"type_vocab_size": 1,
|
| 55 |
+
"use_cache": true,
|
| 56 |
+
"vocab_size": 50265
|
| 57 |
+
}
|
checkpoint-best/model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a140abc72f23acfeee6403f1947d24d20561863739a3f656b9ff4920a8be9e2e
|
| 3 |
+
size 498643560
|
checkpoint-best/optimizer.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7aad3e98c8ecedd550a192588c2746a7ba4aabfc7f50754a21ee67c69f1566cd
|
| 3 |
+
size 997407371
|
checkpoint-best/scheduler.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fad9d3d814422fc24594f9e6de16e4af7ee16238cef70fe96e25680c409c7157
|
| 3 |
+
size 1465
|
checkpoint-best/training_0.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5421dc4775b16b532e493cc5b1b5fa8ff4c9ffa5872a5ea2e2f4b27eb6c57077
|
| 3 |
+
size 2751
|
checkpoint-best/training_1.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:445cddfdf17199d8777e5d8761543e7476a4bfe707817856d05eacc24c64b8fc
|
| 3 |
+
size 2751
|
checkpoint-best/training_9.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fd12dd4427cd491d86b3c563f6bc60950d124f5d77d03d7ff3c8d6a1fc329486
|
| 3 |
+
size 2751
|
checkpoint-last/config.json
ADDED
|
@@ -0,0 +1,57 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"add_cross_attention": false,
|
| 3 |
+
"architectures": [
|
| 4 |
+
"RobertaForSequenceClassification"
|
| 5 |
+
],
|
| 6 |
+
"attention_probs_dropout_prob": 0.1,
|
| 7 |
+
"bos_token_id": 0,
|
| 8 |
+
"classifier_dropout": null,
|
| 9 |
+
"dtype": "float32",
|
| 10 |
+
"eos_token_id": 2,
|
| 11 |
+
"hidden_act": "gelu",
|
| 12 |
+
"hidden_dropout_prob": 0.1,
|
| 13 |
+
"hidden_size": 768,
|
| 14 |
+
"id2label": {
|
| 15 |
+
"0": "LABEL_0",
|
| 16 |
+
"1": "LABEL_1",
|
| 17 |
+
"2": "LABEL_2",
|
| 18 |
+
"3": "LABEL_3",
|
| 19 |
+
"4": "LABEL_4",
|
| 20 |
+
"5": "LABEL_5",
|
| 21 |
+
"6": "LABEL_6",
|
| 22 |
+
"7": "LABEL_7",
|
| 23 |
+
"8": "LABEL_8",
|
| 24 |
+
"9": "LABEL_9",
|
| 25 |
+
"10": "LABEL_10",
|
| 26 |
+
"11": "LABEL_11"
|
| 27 |
+
},
|
| 28 |
+
"initializer_range": 0.02,
|
| 29 |
+
"intermediate_size": 3072,
|
| 30 |
+
"is_decoder": false,
|
| 31 |
+
"label2id": {
|
| 32 |
+
"LABEL_0": 0,
|
| 33 |
+
"LABEL_1": 1,
|
| 34 |
+
"LABEL_10": 10,
|
| 35 |
+
"LABEL_11": 11,
|
| 36 |
+
"LABEL_2": 2,
|
| 37 |
+
"LABEL_3": 3,
|
| 38 |
+
"LABEL_4": 4,
|
| 39 |
+
"LABEL_5": 5,
|
| 40 |
+
"LABEL_6": 6,
|
| 41 |
+
"LABEL_7": 7,
|
| 42 |
+
"LABEL_8": 8,
|
| 43 |
+
"LABEL_9": 9
|
| 44 |
+
},
|
| 45 |
+
"layer_norm_eps": 1e-05,
|
| 46 |
+
"max_position_embeddings": 514,
|
| 47 |
+
"model_type": "roberta",
|
| 48 |
+
"num_attention_heads": 12,
|
| 49 |
+
"num_hidden_layers": 12,
|
| 50 |
+
"pad_token_id": 1,
|
| 51 |
+
"problem_type": "single_label_classification",
|
| 52 |
+
"tie_word_embeddings": true,
|
| 53 |
+
"transformers_version": "5.0.0",
|
| 54 |
+
"type_vocab_size": 1,
|
| 55 |
+
"use_cache": true,
|
| 56 |
+
"vocab_size": 50265
|
| 57 |
+
}
|
checkpoint-last/idx_file.txt
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
9
|
checkpoint-last/model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a140abc72f23acfeee6403f1947d24d20561863739a3f656b9ff4920a8be9e2e
|
| 3 |
+
size 498643560
|
checkpoint-last/optimizer.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7aad3e98c8ecedd550a192588c2746a7ba4aabfc7f50754a21ee67c69f1566cd
|
| 3 |
+
size 997407371
|
checkpoint-last/scheduler.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fad9d3d814422fc24594f9e6de16e4af7ee16238cef70fe96e25680c409c7157
|
| 3 |
+
size 1465
|
checkpoint-last/step_file.txt
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
3660
|
config.json
ADDED
|
@@ -0,0 +1,57 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"add_cross_attention": false,
|
| 3 |
+
"architectures": [
|
| 4 |
+
"RobertaForSequenceClassification"
|
| 5 |
+
],
|
| 6 |
+
"attention_probs_dropout_prob": 0.1,
|
| 7 |
+
"bos_token_id": 0,
|
| 8 |
+
"classifier_dropout": null,
|
| 9 |
+
"dtype": "float32",
|
| 10 |
+
"eos_token_id": 2,
|
| 11 |
+
"hidden_act": "gelu",
|
| 12 |
+
"hidden_dropout_prob": 0.1,
|
| 13 |
+
"hidden_size": 768,
|
| 14 |
+
"id2label": {
|
| 15 |
+
"0": "LABEL_0",
|
| 16 |
+
"1": "LABEL_1",
|
| 17 |
+
"2": "LABEL_2",
|
| 18 |
+
"3": "LABEL_3",
|
| 19 |
+
"4": "LABEL_4",
|
| 20 |
+
"5": "LABEL_5",
|
| 21 |
+
"6": "LABEL_6",
|
| 22 |
+
"7": "LABEL_7",
|
| 23 |
+
"8": "LABEL_8",
|
| 24 |
+
"9": "LABEL_9",
|
| 25 |
+
"10": "LABEL_10",
|
| 26 |
+
"11": "LABEL_11"
|
| 27 |
+
},
|
| 28 |
+
"initializer_range": 0.02,
|
| 29 |
+
"intermediate_size": 3072,
|
| 30 |
+
"is_decoder": false,
|
| 31 |
+
"label2id": {
|
| 32 |
+
"LABEL_0": 0,
|
| 33 |
+
"LABEL_1": 1,
|
| 34 |
+
"LABEL_10": 10,
|
| 35 |
+
"LABEL_11": 11,
|
| 36 |
+
"LABEL_2": 2,
|
| 37 |
+
"LABEL_3": 3,
|
| 38 |
+
"LABEL_4": 4,
|
| 39 |
+
"LABEL_5": 5,
|
| 40 |
+
"LABEL_6": 6,
|
| 41 |
+
"LABEL_7": 7,
|
| 42 |
+
"LABEL_8": 8,
|
| 43 |
+
"LABEL_9": 9
|
| 44 |
+
},
|
| 45 |
+
"layer_norm_eps": 1e-05,
|
| 46 |
+
"max_position_embeddings": 514,
|
| 47 |
+
"model_type": "roberta",
|
| 48 |
+
"num_attention_heads": 12,
|
| 49 |
+
"num_hidden_layers": 12,
|
| 50 |
+
"pad_token_id": 1,
|
| 51 |
+
"problem_type": "single_label_classification",
|
| 52 |
+
"tie_word_embeddings": true,
|
| 53 |
+
"transformers_version": "5.0.0",
|
| 54 |
+
"type_vocab_size": 1,
|
| 55 |
+
"use_cache": true,
|
| 56 |
+
"vocab_size": 50265
|
| 57 |
+
}
|
eval_results.txt
ADDED
|
@@ -0,0 +1,190 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
evaluate 0
|
| 2 |
+
acc = 0.7474801061007957
|
| 3 |
+
acc_and_f1_macro = 0.7048938434748613
|
| 4 |
+
acc_and_f1_weighted = 0.739449319460284
|
| 5 |
+
class_f1 = [np.float64(nan), np.float64(0.7238493723849372), np.float64(0.7958656330749354), np.float64(0.3373493975903614), np.float64(0.6004415011037526), np.float64(0.6722689075630252), np.float64(0.9182389937106918), np.float64(0.8677248677248677), np.float64(0.9201030927835051), np.float64(0.7872340425531915)]
|
| 6 |
+
class_p = [np.float64(nan), np.float64(0.650375939849624), np.float64(0.7857142857142857), np.float64(0.4883720930232558), np.float64(0.6325581395348837), np.float64(0.6042296072507553), np.float64(0.9240506329113924), np.float64(0.8631578947368421), np.float64(0.9224806201550387), np.float64(0.6607142857142857)]
|
| 7 |
+
class_r = [np.float64(0.0), np.float64(0.8160377358490566), np.float64(0.806282722513089), np.float64(0.25766871165644173), np.float64(0.5714285714285714), np.float64(0.7575757575757576), np.float64(0.9125), np.float64(0.8723404255319149), np.float64(0.9177377892030848), np.float64(0.9736842105263158)]
|
| 8 |
+
confusion_matrix = [[ 0 8 0 12 2 20 0 0 0 0]
|
| 9 |
+
[ 0 173 23 0 2 14 0 0 0 0]
|
| 10 |
+
[ 0 31 154 2 2 0 0 0 0 2]
|
| 11 |
+
[ 0 15 8 42 50 46 0 0 0 2]
|
| 12 |
+
[ 0 22 4 14 136 50 0 0 0 12]
|
| 13 |
+
[ 0 15 7 16 23 200 0 0 0 3]
|
| 14 |
+
[ 0 2 0 0 0 0 146 4 8 0]
|
| 15 |
+
[ 0 0 0 0 0 0 2 164 22 0]
|
| 16 |
+
[ 0 0 0 0 0 0 10 22 357 0]
|
| 17 |
+
[ 0 0 0 0 0 1 0 0 0 37]]
|
| 18 |
+
f1_macro = 0.6623075808489268
|
| 19 |
+
f1_weighted = 0.7314185328197723
|
| 20 |
+
evaluate 1
|
| 21 |
+
acc = 0.7618037135278515
|
| 22 |
+
acc_and_f1_macro = 0.7229381973826235
|
| 23 |
+
acc_and_f1_weighted = 0.7575460583049605
|
| 24 |
+
class_f1 = [np.float64(nan), np.float64(0.7421686746987951), np.float64(0.7999999999999999), np.float64(0.4999999999999999), np.float64(0.5740740740740741), np.float64(0.6946308724832215), np.float64(0.925925925925926), np.float64(0.8844221105527638), np.float64(0.936), np.float64(0.7835051546391751)]
|
| 25 |
+
class_p = [np.float64(nan), np.float64(0.7586206896551724), np.float64(0.8042328042328042), np.float64(0.48554913294797686), np.float64(0.6391752577319587), np.float64(0.6234939759036144), np.float64(0.9146341463414634), np.float64(0.8380952380952381), np.float64(0.9722991689750693), np.float64(0.6440677966101694)]
|
| 26 |
+
class_r = [np.float64(0.0), np.float64(0.7264150943396226), np.float64(0.7958115183246073), np.float64(0.5153374233128835), np.float64(0.5210084033613446), np.float64(0.7840909090909091), np.float64(0.9375), np.float64(0.9361702127659575), np.float64(0.9023136246786633), np.float64(1.0)]
|
| 27 |
+
confusion_matrix = [[ 0 5 0 16 5 16 0 0 0 0]
|
| 28 |
+
[ 0 154 22 0 8 26 0 0 0 2]
|
| 29 |
+
[ 0 18 152 8 7 2 0 0 0 4]
|
| 30 |
+
[ 0 4 7 84 38 26 0 0 0 4]
|
| 31 |
+
[ 0 14 4 33 124 55 0 0 0 8]
|
| 32 |
+
[ 0 6 4 32 12 207 0 0 0 3]
|
| 33 |
+
[ 0 2 0 0 0 0 150 6 2 0]
|
| 34 |
+
[ 0 0 0 0 0 0 4 176 8 0]
|
| 35 |
+
[ 0 0 0 0 0 0 10 28 351 0]
|
| 36 |
+
[ 0 0 0 0 0 0 0 0 0 38]]
|
| 37 |
+
f1_macro = 0.6840726812373956
|
| 38 |
+
f1_weighted = 0.7532884030820696
|
| 39 |
+
evaluate 2
|
| 40 |
+
acc = 0.7522546419098143
|
| 41 |
+
acc_and_f1_macro = 0.7302639191012046
|
| 42 |
+
acc_and_f1_weighted = 0.7514893569292973
|
| 43 |
+
class_f1 = [np.float64(0.25806451612903225), np.float64(0.7196261682242991), np.float64(0.7799442896935934), np.float64(0.4675324675324675), np.float64(0.6061705989110707), np.float64(0.6561264822134387), np.float64(0.9308176100628932), np.float64(0.8730964467005077), np.float64(0.9342105263157896), np.float64(0.8571428571428571)]
|
| 44 |
+
class_p = [np.float64(0.4), np.float64(0.7129629629629629), np.float64(0.8333333333333334), np.float64(0.496551724137931), np.float64(0.5335463258785943), np.float64(0.6859504132231405), np.float64(0.9367088607594937), np.float64(0.8349514563106796), np.float64(0.9568733153638814), np.float64(0.782608695652174)]
|
| 45 |
+
class_r = [np.float64(0.19047619047619047), np.float64(0.7264150943396226), np.float64(0.7329842931937173), np.float64(0.44171779141104295), np.float64(0.7016806722689075), np.float64(0.6287878787878788), np.float64(0.925), np.float64(0.9148936170212766), np.float64(0.9125964010282777), np.float64(0.9473684210526315)]
|
| 46 |
+
confusion_matrix = [[ 8 4 0 10 8 12 0 0 0 0]
|
| 47 |
+
[ 4 154 14 2 18 20 0 0 0 0]
|
| 48 |
+
[ 0 31 140 8 8 2 0 0 0 2]
|
| 49 |
+
[ 4 7 6 72 58 12 0 0 0 4]
|
| 50 |
+
[ 0 12 4 25 167 28 0 0 0 2]
|
| 51 |
+
[ 4 6 4 28 54 166 0 0 0 2]
|
| 52 |
+
[ 0 2 0 0 0 0 148 8 2 0]
|
| 53 |
+
[ 0 0 0 0 0 0 2 172 14 0]
|
| 54 |
+
[ 0 0 0 0 0 0 8 26 355 0]
|
| 55 |
+
[ 0 0 0 0 0 2 0 0 0 36]]
|
| 56 |
+
f1_macro = 0.7082731962925949
|
| 57 |
+
f1_weighted = 0.7507240719487804
|
| 58 |
+
evaluate 3
|
| 59 |
+
acc = 0.7480106100795756
|
| 60 |
+
acc_and_f1_macro = 0.7216309782116379
|
| 61 |
+
acc_and_f1_weighted = 0.745009762685597
|
| 62 |
+
class_f1 = [np.float64(0.2), np.float64(0.7132867132867132), np.float64(0.7570621468926554), np.float64(0.43262411347517726), np.float64(0.6058091286307054), np.float64(0.6898839137645107), np.float64(0.9230769230769231), np.float64(0.8471849865951742), np.float64(0.9199491740787803), np.float64(0.8636363636363636)]
|
| 63 |
+
class_p = [np.float64(0.3333333333333333), np.float64(0.7050691244239631), np.float64(0.8220858895705522), np.float64(0.5126050420168067), np.float64(0.5983606557377049), np.float64(0.6135693215339233), np.float64(0.9473684210526315), np.float64(0.8540540540540541), np.float64(0.9095477386934674), np.float64(0.76)]
|
| 64 |
+
class_r = [np.float64(0.14285714285714285), np.float64(0.7216981132075472), np.float64(0.7015706806282722), np.float64(0.37423312883435583), np.float64(0.6134453781512605), np.float64(0.7878787878787878), np.float64(0.9), np.float64(0.8404255319148937), np.float64(0.9305912596401028), np.float64(1.0)]
|
| 65 |
+
confusion_matrix = [[ 6 4 0 10 6 16 0 0 0 0]
|
| 66 |
+
[ 4 153 15 2 12 26 0 0 0 0]
|
| 67 |
+
[ 2 32 134 7 10 2 0 0 0 4]
|
| 68 |
+
[ 4 8 6 61 44 36 0 0 0 4]
|
| 69 |
+
[ 0 12 4 21 146 51 0 0 0 4]
|
| 70 |
+
[ 2 6 4 18 26 208 0 0 0 0]
|
| 71 |
+
[ 0 2 0 0 0 0 144 6 8 0]
|
| 72 |
+
[ 0 0 0 0 0 0 2 158 28 0]
|
| 73 |
+
[ 0 0 0 0 0 0 6 21 362 0]
|
| 74 |
+
[ 0 0 0 0 0 0 0 0 0 38]]
|
| 75 |
+
f1_macro = 0.6952513463437002
|
| 76 |
+
f1_weighted = 0.7420089152916185
|
| 77 |
+
evaluate 4
|
| 78 |
+
acc = 0.7554376657824934
|
| 79 |
+
acc_and_f1_macro = 0.7299251289757365
|
| 80 |
+
acc_and_f1_weighted = 0.7534075021522451
|
| 81 |
+
class_f1 = [np.float64(0.16666666666666666), np.float64(0.7403846153846154), np.float64(0.8021390374331551), np.float64(0.4563758389261745), np.float64(0.5755395683453237), np.float64(0.678095238095238), np.float64(0.925), np.float64(0.8783068783068785), np.float64(0.9300518134715026), np.float64(0.891566265060241)]
|
| 82 |
+
class_p = [np.float64(0.6666666666666666), np.float64(0.7549019607843137), np.float64(0.819672131147541), np.float64(0.5037037037037037), np.float64(0.5031446540880503), np.float64(0.6819923371647509), np.float64(0.925), np.float64(0.8736842105263158), np.float64(0.9373368146214099), np.float64(0.8222222222222222)]
|
| 83 |
+
class_r = [np.float64(0.09523809523809523), np.float64(0.7264150943396226), np.float64(0.7853403141361257), np.float64(0.4171779141104294), np.float64(0.6722689075630253), np.float64(0.6742424242424242), np.float64(0.925), np.float64(0.8829787234042553), np.float64(0.922879177377892), np.float64(0.9736842105263158)]
|
| 84 |
+
confusion_matrix = [[ 4 4 0 12 8 14 0 0 0 0]
|
| 85 |
+
[ 2 154 16 4 20 16 0 0 0 0]
|
| 86 |
+
[ 0 20 150 3 12 4 0 0 0 2]
|
| 87 |
+
[ 0 6 7 68 62 16 0 0 0 4]
|
| 88 |
+
[ 0 12 4 28 160 32 0 0 0 2]
|
| 89 |
+
[ 0 8 6 20 52 178 0 0 0 0]
|
| 90 |
+
[ 0 0 0 0 2 0 148 6 4 0]
|
| 91 |
+
[ 0 0 0 0 0 0 2 166 20 0]
|
| 92 |
+
[ 0 0 0 0 2 0 10 18 359 0]
|
| 93 |
+
[ 0 0 0 0 0 1 0 0 0 37]]
|
| 94 |
+
f1_macro = 0.7044125921689796
|
| 95 |
+
f1_weighted = 0.7513773385219968
|
| 96 |
+
evaluate 5
|
| 97 |
+
acc = 0.7586206896551724
|
| 98 |
+
acc_and_f1_macro = 0.7333208161673415
|
| 99 |
+
acc_and_f1_weighted = 0.7566757125566077
|
| 100 |
+
class_f1 = [np.float64(0.16), np.float64(0.7464114832535885), np.float64(0.7914438502673796), np.float64(0.4814814814814815), np.float64(0.5988483685220729), np.float64(0.6994328922495274), np.float64(0.9240506329113924), np.float64(0.8524590163934426), np.float64(0.9213197969543147), np.float64(0.9047619047619047)]
|
| 101 |
+
class_p = [np.float64(0.5), np.float64(0.7572815533980582), np.float64(0.8087431693989071), np.float64(0.484472049689441), np.float64(0.5512367491166078), np.float64(0.6981132075471698), np.float64(0.9358974358974359), np.float64(0.8764044943820225), np.float64(0.9097744360902256), np.float64(0.8260869565217391)]
|
| 102 |
+
class_r = [np.float64(0.09523809523809523), np.float64(0.7358490566037735), np.float64(0.774869109947644), np.float64(0.4785276073619632), np.float64(0.6554621848739496), np.float64(0.7007575757575758), np.float64(0.9125), np.float64(0.8297872340425532), np.float64(0.9331619537275064), np.float64(1.0)]
|
| 103 |
+
confusion_matrix = [[ 4 4 0 16 4 14 0 0 0 0]
|
| 104 |
+
[ 2 156 18 4 16 16 0 0 0 0]
|
| 105 |
+
[ 0 20 148 5 12 4 0 0 0 2]
|
| 106 |
+
[ 2 6 7 78 52 14 0 0 0 4]
|
| 107 |
+
[ 0 12 4 32 156 32 0 0 0 2]
|
| 108 |
+
[ 0 8 6 26 39 185 0 0 0 0]
|
| 109 |
+
[ 0 0 0 0 2 0 146 6 6 0]
|
| 110 |
+
[ 0 0 0 0 0 0 2 156 30 0]
|
| 111 |
+
[ 0 0 0 0 2 0 8 16 363 0]
|
| 112 |
+
[ 0 0 0 0 0 0 0 0 0 38]]
|
| 113 |
+
f1_macro = 0.7080209426795105
|
| 114 |
+
f1_weighted = 0.7547307354580429
|
| 115 |
+
evaluate 6
|
| 116 |
+
acc = 0.7564986737400531
|
| 117 |
+
acc_and_f1_macro = 0.7311158097126855
|
| 118 |
+
acc_and_f1_weighted = 0.7542026248283529
|
| 119 |
+
class_f1 = [np.float64(0.16666666666666666), np.float64(0.7403846153846154), np.float64(0.7956989247311829), np.float64(0.46302250803858525), np.float64(0.5939849624060151), np.float64(0.6990654205607477), np.float64(0.925), np.float64(0.8478260869565217), np.float64(0.9209183673469388), np.float64(0.9047619047619047)]
|
| 120 |
+
class_p = [np.float64(0.6666666666666666), np.float64(0.7549019607843137), np.float64(0.8176795580110497), np.float64(0.4864864864864865), np.float64(0.5374149659863946), np.float64(0.6900369003690037), np.float64(0.925), np.float64(0.8666666666666667), np.float64(0.9139240506329114), np.float64(0.8260869565217391)]
|
| 121 |
+
class_r = [np.float64(0.09523809523809523), np.float64(0.7264150943396226), np.float64(0.774869109947644), np.float64(0.44171779141104295), np.float64(0.6638655462184874), np.float64(0.7083333333333334), np.float64(0.925), np.float64(0.8297872340425532), np.float64(0.9280205655526992), np.float64(1.0)]
|
| 122 |
+
confusion_matrix = [[ 4 4 0 15 5 14 0 0 0 0]
|
| 123 |
+
[ 2 154 16 4 20 16 0 0 0 0]
|
| 124 |
+
[ 0 22 148 3 12 4 0 0 0 2]
|
| 125 |
+
[ 0 6 7 72 56 18 0 0 0 4]
|
| 126 |
+
[ 0 12 4 30 158 32 0 0 0 2]
|
| 127 |
+
[ 0 6 6 24 41 187 0 0 0 0]
|
| 128 |
+
[ 0 0 0 0 2 0 148 6 4 0]
|
| 129 |
+
[ 0 0 0 0 0 0 2 156 30 0]
|
| 130 |
+
[ 0 0 0 0 0 0 10 18 361 0]
|
| 131 |
+
[ 0 0 0 0 0 0 0 0 0 38]]
|
| 132 |
+
f1_macro = 0.7057329456853179
|
| 133 |
+
f1_weighted = 0.7519065759166527
|
| 134 |
+
evaluate 7
|
| 135 |
+
acc = 0.7580901856763925
|
| 136 |
+
acc_and_f1_macro = 0.732903294943322
|
| 137 |
+
acc_and_f1_weighted = 0.7560980300675524
|
| 138 |
+
class_f1 = [np.float64(0.16), np.float64(0.7499999999999999), np.float64(0.8), np.float64(0.48253968253968255), np.float64(0.5928705440900564), np.float64(0.7018867924528303), np.float64(0.925), np.float64(0.8415300546448087), np.float64(0.9185750636132316), np.float64(0.9047619047619047)]
|
| 139 |
+
class_p = [np.float64(0.5), np.float64(0.7647058823529411), np.float64(0.8268156424581006), np.float64(0.5), np.float64(0.535593220338983), np.float64(0.6992481203007519), np.float64(0.925), np.float64(0.8651685393258427), np.float64(0.9093198992443325), np.float64(0.8260869565217391)]
|
| 140 |
+
class_r = [np.float64(0.09523809523809523), np.float64(0.7358490566037735), np.float64(0.774869109947644), np.float64(0.4662576687116564), np.float64(0.6638655462184874), np.float64(0.7045454545454546), np.float64(0.925), np.float64(0.8191489361702128), np.float64(0.9280205655526992), np.float64(1.0)]
|
| 141 |
+
confusion_matrix = [[ 4 4 0 15 5 14 0 0 0 0]
|
| 142 |
+
[ 2 156 14 4 20 16 0 0 0 0]
|
| 143 |
+
[ 0 22 148 3 12 4 0 0 0 2]
|
| 144 |
+
[ 2 6 7 76 54 14 0 0 0 4]
|
| 145 |
+
[ 0 12 4 30 158 32 0 0 0 2]
|
| 146 |
+
[ 0 4 6 24 44 186 0 0 0 0]
|
| 147 |
+
[ 0 0 0 0 2 0 148 6 4 0]
|
| 148 |
+
[ 0 0 0 0 0 0 2 154 32 0]
|
| 149 |
+
[ 0 0 0 0 0 0 10 18 361 0]
|
| 150 |
+
[ 0 0 0 0 0 0 0 0 0 38]]
|
| 151 |
+
f1_macro = 0.7077164042102514
|
| 152 |
+
f1_weighted = 0.7541058744587121
|
| 153 |
+
evaluate 8
|
| 154 |
+
acc = 0.7618037135278515
|
| 155 |
+
acc_and_f1_macro = 0.7323228184279761
|
| 156 |
+
acc_and_f1_weighted = 0.7590034977915698
|
| 157 |
+
class_f1 = [np.float64(0.08695652173913042), np.float64(0.7523809523809523), np.float64(0.8043478260869565), np.float64(0.4705882352941177), np.float64(0.5981308411214953), np.float64(0.6964618249534452), np.float64(0.925), np.float64(0.8601036269430052), np.float64(0.9296874999999999), np.float64(0.9047619047619047)]
|
| 158 |
+
class_p = [np.float64(0.5), np.float64(0.7596153846153846), np.float64(0.8361581920903954), np.float64(0.5034965034965035), np.float64(0.5387205387205387), np.float64(0.684981684981685), np.float64(0.925), np.float64(0.8383838383838383), np.float64(0.941952506596306), np.float64(0.8260869565217391)]
|
| 159 |
+
class_r = [np.float64(0.047619047619047616), np.float64(0.7452830188679245), np.float64(0.774869109947644), np.float64(0.44171779141104295), np.float64(0.6722689075630253), np.float64(0.7083333333333334), np.float64(0.925), np.float64(0.8829787234042553), np.float64(0.9177377892030848), np.float64(1.0)]
|
| 160 |
+
confusion_matrix = [[ 2 4 0 12 8 16 0 0 0 0]
|
| 161 |
+
[ 2 158 14 4 18 16 0 0 0 0]
|
| 162 |
+
[ 0 22 148 3 12 4 0 0 0 2]
|
| 163 |
+
[ 0 7 6 72 56 18 0 0 0 4]
|
| 164 |
+
[ 0 12 4 28 160 32 0 0 0 2]
|
| 165 |
+
[ 0 5 5 24 43 187 0 0 0 0]
|
| 166 |
+
[ 0 0 0 0 0 0 148 10 2 0]
|
| 167 |
+
[ 0 0 0 0 0 0 2 166 20 0]
|
| 168 |
+
[ 0 0 0 0 0 0 10 22 357 0]
|
| 169 |
+
[ 0 0 0 0 0 0 0 0 0 38]]
|
| 170 |
+
f1_macro = 0.7028419233281007
|
| 171 |
+
f1_weighted = 0.7562032820552881
|
| 172 |
+
evaluate 9
|
| 173 |
+
acc = 0.7644562334217506
|
| 174 |
+
acc_and_f1_macro = 0.7386967474391453
|
| 175 |
+
acc_and_f1_weighted = 0.7625543782840718
|
| 176 |
+
class_f1 = [np.float64(0.16), np.float64(0.7541766109785202), np.float64(0.802168021680217), np.float64(0.48253968253968255), np.float64(0.5951035781544257), np.float64(0.7018867924528303), np.float64(0.925), np.float64(0.8736842105263158), np.float64(0.9300518134715026), np.float64(0.9047619047619047)]
|
| 177 |
+
class_p = [np.float64(0.5), np.float64(0.7632850241545893), np.float64(0.8314606741573034), np.float64(0.5), np.float64(0.5392491467576792), np.float64(0.6992481203007519), np.float64(0.925), np.float64(0.8645833333333334), np.float64(0.9373368146214099), np.float64(0.8260869565217391)]
|
| 178 |
+
class_r = [np.float64(0.09523809523809523), np.float64(0.7452830188679245), np.float64(0.774869109947644), np.float64(0.4662576687116564), np.float64(0.6638655462184874), np.float64(0.7045454545454546), np.float64(0.925), np.float64(0.8829787234042553), np.float64(0.922879177377892), np.float64(1.0)]
|
| 179 |
+
confusion_matrix = [[ 4 4 0 15 5 14 0 0 0 0]
|
| 180 |
+
[ 2 158 14 4 18 16 0 0 0 0]
|
| 181 |
+
[ 0 22 148 3 12 4 0 0 0 2]
|
| 182 |
+
[ 2 6 7 76 54 14 0 0 0 4]
|
| 183 |
+
[ 0 12 4 30 158 32 0 0 0 2]
|
| 184 |
+
[ 0 5 5 24 44 186 0 0 0 0]
|
| 185 |
+
[ 0 0 0 0 2 0 148 6 4 0]
|
| 186 |
+
[ 0 0 0 0 0 0 2 166 20 0]
|
| 187 |
+
[ 0 0 0 0 0 0 10 20 359 0]
|
| 188 |
+
[ 0 0 0 0 0 0 0 0 0 38]]
|
| 189 |
+
f1_macro = 0.7129372614565399
|
| 190 |
+
f1_weighted = 0.760652523146393
|
model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a140abc72f23acfeee6403f1947d24d20561863739a3f656b9ff4920a8be9e2e
|
| 3 |
+
size 498643560
|
tokenizer.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
tokenizer_config.json
ADDED
|
@@ -0,0 +1,17 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"add_prefix_space": false,
|
| 3 |
+
"backend": "tokenizers",
|
| 4 |
+
"bos_token": "<s>",
|
| 5 |
+
"cls_token": "<s>",
|
| 6 |
+
"do_lower_case": false,
|
| 7 |
+
"eos_token": "</s>",
|
| 8 |
+
"errors": "replace",
|
| 9 |
+
"is_local": false,
|
| 10 |
+
"mask_token": "<mask>",
|
| 11 |
+
"model_max_length": 512,
|
| 12 |
+
"pad_token": "<pad>",
|
| 13 |
+
"sep_token": "</s>",
|
| 14 |
+
"tokenizer_class": "RobertaTokenizer",
|
| 15 |
+
"trim_offsets": true,
|
| 16 |
+
"unk_token": "<unk>"
|
| 17 |
+
}
|
training_args.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:06e90bba594a67858fbed551759bbc8d67acfcba7a9da07f7dbf1cd75c77ce1e
|
| 3 |
+
size 2769
|