Upload folder using huggingface_hub
Browse files- checkpoint-best/config.json +59 -0
- checkpoint-best/model.safetensors +3 -0
- checkpoint-best/optimizer.pt +3 -0
- checkpoint-best/scheduler.pt +3 -0
- checkpoint-best/training_0.bin +3 -0
- checkpoint-best/training_1.bin +3 -0
- checkpoint-best/training_2.bin +3 -0
- checkpoint-best/training_3.bin +3 -0
- checkpoint-best/training_6.bin +3 -0
- checkpoint-last/config.json +59 -0
- checkpoint-last/idx_file.txt +1 -0
- checkpoint-last/model.safetensors +3 -0
- checkpoint-last/optimizer.pt +3 -0
- checkpoint-last/scheduler.pt +3 -0
- checkpoint-last/step_file.txt +1 -0
- config.json +59 -0
- eval_results.txt +190 -0
- model.safetensors +3 -0
- tokenizer.json +0 -0
- tokenizer_config.json +18 -0
- training_args.bin +3 -0
checkpoint-best/config.json
ADDED
|
@@ -0,0 +1,59 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"add_cross_attention": false,
|
| 3 |
+
"architectures": [
|
| 4 |
+
"RobertaForSequenceClassification"
|
| 5 |
+
],
|
| 6 |
+
"attention_probs_dropout_prob": 0.1,
|
| 7 |
+
"bos_token_id": 0,
|
| 8 |
+
"classifier_dropout": null,
|
| 9 |
+
"dtype": "float32",
|
| 10 |
+
"eos_token_id": 2,
|
| 11 |
+
"hidden_act": "gelu",
|
| 12 |
+
"hidden_dropout_prob": 0.1,
|
| 13 |
+
"hidden_size": 768,
|
| 14 |
+
"id2label": {
|
| 15 |
+
"0": "LABEL_0",
|
| 16 |
+
"1": "LABEL_1",
|
| 17 |
+
"2": "LABEL_2",
|
| 18 |
+
"3": "LABEL_3",
|
| 19 |
+
"4": "LABEL_4",
|
| 20 |
+
"5": "LABEL_5",
|
| 21 |
+
"6": "LABEL_6",
|
| 22 |
+
"7": "LABEL_7",
|
| 23 |
+
"8": "LABEL_8",
|
| 24 |
+
"9": "LABEL_9",
|
| 25 |
+
"10": "LABEL_10",
|
| 26 |
+
"11": "LABEL_11"
|
| 27 |
+
},
|
| 28 |
+
"initializer_range": 0.02,
|
| 29 |
+
"intermediate_size": 3072,
|
| 30 |
+
"is_decoder": false,
|
| 31 |
+
"label2id": {
|
| 32 |
+
"LABEL_0": 0,
|
| 33 |
+
"LABEL_1": 1,
|
| 34 |
+
"LABEL_10": 10,
|
| 35 |
+
"LABEL_11": 11,
|
| 36 |
+
"LABEL_2": 2,
|
| 37 |
+
"LABEL_3": 3,
|
| 38 |
+
"LABEL_4": 4,
|
| 39 |
+
"LABEL_5": 5,
|
| 40 |
+
"LABEL_6": 6,
|
| 41 |
+
"LABEL_7": 7,
|
| 42 |
+
"LABEL_8": 8,
|
| 43 |
+
"LABEL_9": 9
|
| 44 |
+
},
|
| 45 |
+
"layer_norm_eps": 1e-05,
|
| 46 |
+
"max_position_embeddings": 514,
|
| 47 |
+
"model_type": "roberta",
|
| 48 |
+
"num_attention_heads": 12,
|
| 49 |
+
"num_hidden_layers": 12,
|
| 50 |
+
"output_past": true,
|
| 51 |
+
"pad_token_id": 1,
|
| 52 |
+
"position_embedding_type": "absolute",
|
| 53 |
+
"problem_type": "single_label_classification",
|
| 54 |
+
"tie_word_embeddings": true,
|
| 55 |
+
"transformers_version": "5.0.0",
|
| 56 |
+
"type_vocab_size": 1,
|
| 57 |
+
"use_cache": true,
|
| 58 |
+
"vocab_size": 250002
|
| 59 |
+
}
|
checkpoint-best/model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1d4e3e38414b5d2c5a596e0ab5c8a5f5acc78ef632ffc14bfcc0df565a52171b
|
| 3 |
+
size 1112235744
|
checkpoint-best/optimizer.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:29802fbac574a6343d6590c324e85b19359e6021e7e707365fea8af24e09370a
|
| 3 |
+
size 2224591499
|
checkpoint-best/scheduler.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9d46ebbe86cc296e0659ad6d70cc71025895e9b0ca50bf4d999e099e27ebec81
|
| 3 |
+
size 1465
|
checkpoint-best/training_0.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a7b727449fefeba793fb9580f65c60481a8c179df5700a35433e0a1c57958712
|
| 3 |
+
size 2751
|
checkpoint-best/training_1.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8c6825ff2f41b152453471580a04ec5538eeaf4dd13698bbd4de415e5f8f2d21
|
| 3 |
+
size 2751
|
checkpoint-best/training_2.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:685e4ad908898fc6dabeb9f80917014c1ceb588a7d791e708b50fda4ab315b81
|
| 3 |
+
size 2751
|
checkpoint-best/training_3.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ee72edb116c9d6d1a49c7124a650269090702b2b5d51afab86b2f86b4a94175f
|
| 3 |
+
size 2751
|
checkpoint-best/training_6.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9daa462e2ce2191fc68c3f55ca61ae27f52fddaf0bf225dd7541ba6ab39251a1
|
| 3 |
+
size 2751
|
checkpoint-last/config.json
ADDED
|
@@ -0,0 +1,59 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"add_cross_attention": false,
|
| 3 |
+
"architectures": [
|
| 4 |
+
"RobertaForSequenceClassification"
|
| 5 |
+
],
|
| 6 |
+
"attention_probs_dropout_prob": 0.1,
|
| 7 |
+
"bos_token_id": 0,
|
| 8 |
+
"classifier_dropout": null,
|
| 9 |
+
"dtype": "float32",
|
| 10 |
+
"eos_token_id": 2,
|
| 11 |
+
"hidden_act": "gelu",
|
| 12 |
+
"hidden_dropout_prob": 0.1,
|
| 13 |
+
"hidden_size": 768,
|
| 14 |
+
"id2label": {
|
| 15 |
+
"0": "LABEL_0",
|
| 16 |
+
"1": "LABEL_1",
|
| 17 |
+
"2": "LABEL_2",
|
| 18 |
+
"3": "LABEL_3",
|
| 19 |
+
"4": "LABEL_4",
|
| 20 |
+
"5": "LABEL_5",
|
| 21 |
+
"6": "LABEL_6",
|
| 22 |
+
"7": "LABEL_7",
|
| 23 |
+
"8": "LABEL_8",
|
| 24 |
+
"9": "LABEL_9",
|
| 25 |
+
"10": "LABEL_10",
|
| 26 |
+
"11": "LABEL_11"
|
| 27 |
+
},
|
| 28 |
+
"initializer_range": 0.02,
|
| 29 |
+
"intermediate_size": 3072,
|
| 30 |
+
"is_decoder": false,
|
| 31 |
+
"label2id": {
|
| 32 |
+
"LABEL_0": 0,
|
| 33 |
+
"LABEL_1": 1,
|
| 34 |
+
"LABEL_10": 10,
|
| 35 |
+
"LABEL_11": 11,
|
| 36 |
+
"LABEL_2": 2,
|
| 37 |
+
"LABEL_3": 3,
|
| 38 |
+
"LABEL_4": 4,
|
| 39 |
+
"LABEL_5": 5,
|
| 40 |
+
"LABEL_6": 6,
|
| 41 |
+
"LABEL_7": 7,
|
| 42 |
+
"LABEL_8": 8,
|
| 43 |
+
"LABEL_9": 9
|
| 44 |
+
},
|
| 45 |
+
"layer_norm_eps": 1e-05,
|
| 46 |
+
"max_position_embeddings": 514,
|
| 47 |
+
"model_type": "roberta",
|
| 48 |
+
"num_attention_heads": 12,
|
| 49 |
+
"num_hidden_layers": 12,
|
| 50 |
+
"output_past": true,
|
| 51 |
+
"pad_token_id": 1,
|
| 52 |
+
"position_embedding_type": "absolute",
|
| 53 |
+
"problem_type": "single_label_classification",
|
| 54 |
+
"tie_word_embeddings": true,
|
| 55 |
+
"transformers_version": "5.0.0",
|
| 56 |
+
"type_vocab_size": 1,
|
| 57 |
+
"use_cache": true,
|
| 58 |
+
"vocab_size": 250002
|
| 59 |
+
}
|
checkpoint-last/idx_file.txt
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
9
|
checkpoint-last/model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4c17da51ee001d45bde6fa33740a0130fb17c72c4c137b2bc371dab3e1e08f4b
|
| 3 |
+
size 1112235744
|
checkpoint-last/optimizer.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a581158cea338dac724a1c78fd8a760b94b7d862818b923520ce9665f1d9ccd8
|
| 3 |
+
size 2224591499
|
checkpoint-last/scheduler.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fad9d3d814422fc24594f9e6de16e4af7ee16238cef70fe96e25680c409c7157
|
| 3 |
+
size 1465
|
checkpoint-last/step_file.txt
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
3660
|
config.json
ADDED
|
@@ -0,0 +1,59 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"add_cross_attention": false,
|
| 3 |
+
"architectures": [
|
| 4 |
+
"RobertaForSequenceClassification"
|
| 5 |
+
],
|
| 6 |
+
"attention_probs_dropout_prob": 0.1,
|
| 7 |
+
"bos_token_id": 0,
|
| 8 |
+
"classifier_dropout": null,
|
| 9 |
+
"dtype": "float32",
|
| 10 |
+
"eos_token_id": 2,
|
| 11 |
+
"hidden_act": "gelu",
|
| 12 |
+
"hidden_dropout_prob": 0.1,
|
| 13 |
+
"hidden_size": 768,
|
| 14 |
+
"id2label": {
|
| 15 |
+
"0": "LABEL_0",
|
| 16 |
+
"1": "LABEL_1",
|
| 17 |
+
"2": "LABEL_2",
|
| 18 |
+
"3": "LABEL_3",
|
| 19 |
+
"4": "LABEL_4",
|
| 20 |
+
"5": "LABEL_5",
|
| 21 |
+
"6": "LABEL_6",
|
| 22 |
+
"7": "LABEL_7",
|
| 23 |
+
"8": "LABEL_8",
|
| 24 |
+
"9": "LABEL_9",
|
| 25 |
+
"10": "LABEL_10",
|
| 26 |
+
"11": "LABEL_11"
|
| 27 |
+
},
|
| 28 |
+
"initializer_range": 0.02,
|
| 29 |
+
"intermediate_size": 3072,
|
| 30 |
+
"is_decoder": false,
|
| 31 |
+
"label2id": {
|
| 32 |
+
"LABEL_0": 0,
|
| 33 |
+
"LABEL_1": 1,
|
| 34 |
+
"LABEL_10": 10,
|
| 35 |
+
"LABEL_11": 11,
|
| 36 |
+
"LABEL_2": 2,
|
| 37 |
+
"LABEL_3": 3,
|
| 38 |
+
"LABEL_4": 4,
|
| 39 |
+
"LABEL_5": 5,
|
| 40 |
+
"LABEL_6": 6,
|
| 41 |
+
"LABEL_7": 7,
|
| 42 |
+
"LABEL_8": 8,
|
| 43 |
+
"LABEL_9": 9
|
| 44 |
+
},
|
| 45 |
+
"layer_norm_eps": 1e-05,
|
| 46 |
+
"max_position_embeddings": 514,
|
| 47 |
+
"model_type": "roberta",
|
| 48 |
+
"num_attention_heads": 12,
|
| 49 |
+
"num_hidden_layers": 12,
|
| 50 |
+
"output_past": true,
|
| 51 |
+
"pad_token_id": 1,
|
| 52 |
+
"position_embedding_type": "absolute",
|
| 53 |
+
"problem_type": "single_label_classification",
|
| 54 |
+
"tie_word_embeddings": true,
|
| 55 |
+
"transformers_version": "5.0.0",
|
| 56 |
+
"type_vocab_size": 1,
|
| 57 |
+
"use_cache": true,
|
| 58 |
+
"vocab_size": 250002
|
| 59 |
+
}
|
eval_results.txt
ADDED
|
@@ -0,0 +1,190 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
evaluate 0
|
| 2 |
+
acc = 0.553315649867374
|
| 3 |
+
acc_and_f1_macro = 0.5036680015396735
|
| 4 |
+
acc_and_f1_weighted = 0.5436802384152634
|
| 5 |
+
class_f1 = [np.float64(nan), np.float64(0.3319148936170213), np.float64(0.419047619047619), np.float64(0.12972972972972974), np.float64(0.3037383177570093), np.float64(0.483221476510067), np.float64(0.8322147651006713), np.float64(0.7777777777777779), np.float64(0.8772378516624041), np.float64(0.38532110091743127)]
|
| 6 |
+
class_p = [np.float64(nan), np.float64(0.3023255813953488), np.float64(0.532258064516129), np.float64(0.5454545454545454), np.float64(0.34210526315789475), np.float64(0.37422037422037424), np.float64(0.8985507246376812), np.float64(0.7403846153846154), np.float64(0.8727735368956743), np.float64(0.29577464788732394)]
|
| 7 |
+
class_r = [np.float64(0.0), np.float64(0.36792452830188677), np.float64(0.34554973821989526), np.float64(0.0736196319018405), np.float64(0.27310924369747897), np.float64(0.6818181818181818), np.float64(0.775), np.float64(0.8191489361702128), np.float64(0.8817480719794345), np.float64(0.5526315789473685)]
|
| 8 |
+
confusion_matrix = [[ 0 4 0 4 4 27 0 0 2 1]
|
| 9 |
+
[ 0 78 44 2 40 42 0 0 0 6]
|
| 10 |
+
[ 0 87 66 0 22 13 0 0 0 3]
|
| 11 |
+
[ 0 14 6 12 27 94 0 0 0 10]
|
| 12 |
+
[ 0 45 2 0 65 108 0 0 0 18]
|
| 13 |
+
[ 0 30 6 4 32 180 0 0 0 12]
|
| 14 |
+
[ 0 0 0 0 0 0 124 18 18 0]
|
| 15 |
+
[ 0 0 0 0 0 0 4 154 30 0]
|
| 16 |
+
[ 0 0 0 0 0 0 10 36 343 0]
|
| 17 |
+
[ 0 0 0 0 0 17 0 0 0 21]]
|
| 18 |
+
f1_macro = 0.45402035321197304
|
| 19 |
+
f1_weighted = 0.5340448269631527
|
| 20 |
+
evaluate 1
|
| 21 |
+
acc = 0.6477453580901856
|
| 22 |
+
acc_and_f1_macro = 0.6109098715451384
|
| 23 |
+
acc_and_f1_weighted = 0.6440256663564747
|
| 24 |
+
class_f1 = [np.float64(nan), np.float64(0.5021645021645021), np.float64(0.7002652519893899), np.float64(0.41775456919060056), np.float64(0.41884816753926707), np.float64(0.5066666666666666), np.float64(0.8834355828220859), np.float64(0.8167539267015708), np.float64(0.8932291666666669), np.float64(0.6016260162601627)]
|
| 25 |
+
class_p = [np.float64(nan), np.float64(0.464), np.float64(0.7096774193548387), np.float64(0.36363636363636365), np.float64(0.5555555555555556), np.float64(0.5095785440613027), np.float64(0.8674698795180723), np.float64(0.8041237113402062), np.float64(0.9050131926121372), np.float64(0.43529411764705883)]
|
| 26 |
+
class_r = [np.float64(0.0), np.float64(0.5471698113207547), np.float64(0.6910994764397905), np.float64(0.49079754601226994), np.float64(0.33613445378151263), np.float64(0.5037878787878788), np.float64(0.9), np.float64(0.8297872340425532), np.float64(0.8817480719794345), np.float64(0.9736842105263158)]
|
| 27 |
+
confusion_matrix = [[ 0 6 0 20 3 11 0 0 2 0]
|
| 28 |
+
[ 0 116 42 8 16 26 0 0 0 4]
|
| 29 |
+
[ 0 47 132 2 2 4 0 0 0 4]
|
| 30 |
+
[ 0 13 2 80 31 28 0 0 0 9]
|
| 31 |
+
[ 0 34 4 48 80 58 0 0 0 14]
|
| 32 |
+
[ 0 34 6 62 12 133 0 0 0 17]
|
| 33 |
+
[ 0 0 0 0 0 0 144 8 8 0]
|
| 34 |
+
[ 0 0 0 0 0 0 6 156 26 0]
|
| 35 |
+
[ 0 0 0 0 0 0 16 30 343 0]
|
| 36 |
+
[ 0 0 0 0 0 1 0 0 0 37]]
|
| 37 |
+
f1_macro = 0.5740743850000912
|
| 38 |
+
f1_weighted = 0.6403059746227637
|
| 39 |
+
evaluate 2
|
| 40 |
+
acc = 0.6525198938992043
|
| 41 |
+
acc_and_f1_macro = 0.6231816753120988
|
| 42 |
+
acc_and_f1_weighted = 0.6521421608321463
|
| 43 |
+
class_f1 = [np.float64(nan), np.float64(0.46796657381615603), np.float64(0.6862745098039216), np.float64(0.39316239316239315), np.float64(0.445916114790287), np.float64(0.5543859649122808), np.float64(0.8917197452229298), np.float64(0.835978835978836), np.float64(0.907928388746803), np.float64(0.7551020408163265)]
|
| 44 |
+
class_p = [np.float64(nan), np.float64(0.5714285714285714), np.float64(0.9130434782608695), np.float64(0.3016393442622951), np.float64(0.4697674418604651), np.float64(0.5163398692810458), np.float64(0.9090909090909091), np.float64(0.8315789473684211), np.float64(0.9033078880407125), np.float64(0.6166666666666667)]
|
| 45 |
+
class_r = [np.float64(0.0), np.float64(0.39622641509433965), np.float64(0.5497382198952879), np.float64(0.5644171779141104), np.float64(0.42436974789915966), np.float64(0.5984848484848485), np.float64(0.875), np.float64(0.8404255319148937), np.float64(0.9125964010282777), np.float64(0.9736842105263158)]
|
| 46 |
+
confusion_matrix = [[ 0 0 0 26 6 10 0 0 0 0]
|
| 47 |
+
[ 0 84 8 18 44 52 0 0 0 6]
|
| 48 |
+
[ 0 40 105 27 11 8 0 0 0 0]
|
| 49 |
+
[ 0 4 0 92 32 30 0 0 0 5]
|
| 50 |
+
[ 0 8 0 76 101 47 0 0 0 6]
|
| 51 |
+
[ 0 11 2 66 21 158 0 0 0 6]
|
| 52 |
+
[ 0 0 0 0 0 0 140 10 10 0]
|
| 53 |
+
[ 0 0 0 0 0 0 2 158 28 0]
|
| 54 |
+
[ 0 0 0 0 0 0 12 22 355 0]
|
| 55 |
+
[ 0 0 0 0 0 1 0 0 0 37]]
|
| 56 |
+
f1_macro = 0.5938434567249933
|
| 57 |
+
f1_weighted = 0.6517644277650883
|
| 58 |
+
evaluate 3
|
| 59 |
+
acc = 0.6970822281167108
|
| 60 |
+
acc_and_f1_macro = 0.665524574862322
|
| 61 |
+
acc_and_f1_weighted = 0.6927153195289348
|
| 62 |
+
class_f1 = [np.float64(0.0909090909090909), np.float64(0.6120689655172414), np.float64(0.7507002801120448), np.float64(0.390625), np.float64(0.5487603305785124), np.float64(0.5104602510460251), np.float64(0.8944099378881988), np.float64(0.861878453038674), np.float64(0.9189873417721519), np.float64(0.7608695652173912)]
|
| 63 |
+
class_p = [np.float64(1.0), np.float64(0.5634920634920635), np.float64(0.8072289156626506), np.float64(0.5376344086021505), np.float64(0.45231607629427795), np.float64(0.5700934579439252), np.float64(0.8888888888888888), np.float64(0.896551724137931), np.float64(0.9052369077306733), np.float64(0.6481481481481481)]
|
| 64 |
+
class_r = [np.float64(0.047619047619047616), np.float64(0.6698113207547169), np.float64(0.7015706806282722), np.float64(0.3067484662576687), np.float64(0.6974789915966386), np.float64(0.4621212121212121), np.float64(0.9), np.float64(0.8297872340425532), np.float64(0.9331619537275064), np.float64(0.9210526315789473)]
|
| 65 |
+
confusion_matrix = [[ 2 1 2 10 14 13 0 0 0 0]
|
| 66 |
+
[ 0 142 14 2 38 16 0 0 0 0]
|
| 67 |
+
[ 0 45 134 2 6 4 0 0 0 0]
|
| 68 |
+
[ 0 12 6 50 67 23 0 0 0 5]
|
| 69 |
+
[ 0 18 4 10 166 34 0 0 0 6]
|
| 70 |
+
[ 0 34 6 18 76 122 0 0 0 8]
|
| 71 |
+
[ 0 0 0 0 0 0 144 6 10 0]
|
| 72 |
+
[ 0 0 0 0 0 0 4 156 28 0]
|
| 73 |
+
[ 0 0 0 0 0 0 14 12 363 0]
|
| 74 |
+
[ 0 0 0 1 0 2 0 0 0 35]]
|
| 75 |
+
f1_macro = 0.633966921607933
|
| 76 |
+
f1_weighted = 0.688348410941159
|
| 77 |
+
evaluate 4
|
| 78 |
+
acc = 0.673209549071618
|
| 79 |
+
acc_and_f1_macro = 0.6450619507162738
|
| 80 |
+
acc_and_f1_weighted = 0.6715050760798013
|
| 81 |
+
class_f1 = [np.float64(0.1791044776119403), np.float64(0.5851528384279476), np.float64(0.7611548556430446), np.float64(0.44880174291939), np.float64(0.46361185983827496), np.float64(0.502283105022831), np.float64(0.8819875776397514), np.float64(0.8255813953488371), np.float64(0.8985148514851486), np.float64(0.6229508196721312)]
|
| 82 |
+
class_p = [np.float64(0.24), np.float64(0.5447154471544715), np.float64(0.7631578947368421), np.float64(0.34797297297297297), np.float64(0.6466165413533834), np.float64(0.632183908045977), np.float64(0.8765432098765432), np.float64(0.9102564102564102), np.float64(0.8663484486873508), np.float64(0.4523809523809524)]
|
| 83 |
+
class_r = [np.float64(0.14285714285714285), np.float64(0.6320754716981132), np.float64(0.7591623036649214), np.float64(0.6319018404907976), np.float64(0.36134453781512604), np.float64(0.4166666666666667), np.float64(0.8875), np.float64(0.7553191489361702), np.float64(0.9331619537275064), np.float64(1.0)]
|
| 84 |
+
confusion_matrix = [[ 6 5 0 18 3 10 0 0 0 0]
|
| 85 |
+
[ 4 134 30 10 10 18 0 0 0 6]
|
| 86 |
+
[ 0 36 145 4 2 0 0 0 0 4]
|
| 87 |
+
[ 3 11 7 103 20 14 0 0 0 5]
|
| 88 |
+
[ 8 22 4 80 86 22 0 0 0 16]
|
| 89 |
+
[ 4 38 4 81 12 110 0 0 0 15]
|
| 90 |
+
[ 0 0 0 0 0 0 142 4 14 0]
|
| 91 |
+
[ 0 0 0 0 0 0 4 142 42 0]
|
| 92 |
+
[ 0 0 0 0 0 0 16 10 363 0]
|
| 93 |
+
[ 0 0 0 0 0 0 0 0 0 38]]
|
| 94 |
+
f1_macro = 0.6169143523609297
|
| 95 |
+
f1_weighted = 0.6698006030879845
|
| 96 |
+
evaluate 5
|
| 97 |
+
acc = 0.6923076923076923
|
| 98 |
+
acc_and_f1_macro = 0.6701551641026473
|
| 99 |
+
acc_and_f1_weighted = 0.6913225727110167
|
| 100 |
+
class_f1 = [np.float64(0.2985074626865672), np.float64(0.5936254980079683), np.float64(0.7551622418879056), np.float64(0.45925925925925926), np.float64(0.5292929292929293), np.float64(0.5220729366602688), np.float64(0.8674698795180723), np.float64(0.859504132231405), np.float64(0.9088575096277278), np.float64(0.6862745098039216)]
|
| 101 |
+
class_p = [np.float64(0.4), np.float64(0.5137931034482759), np.float64(0.8648648648648649), np.float64(0.5794392523364486), np.float64(0.5097276264591439), np.float64(0.5291828793774319), np.float64(0.8372093023255814), np.float64(0.8914285714285715), np.float64(0.9076923076923077), np.float64(0.546875)]
|
| 102 |
+
class_r = [np.float64(0.23809523809523808), np.float64(0.7028301886792453), np.float64(0.6701570680628273), np.float64(0.3803680981595092), np.float64(0.5504201680672269), np.float64(0.5151515151515151), np.float64(0.9), np.float64(0.8297872340425532), np.float64(0.910025706940874), np.float64(0.9210526315789473)]
|
| 103 |
+
confusion_matrix = [[ 10 3 0 11 6 12 0 0 0 0]
|
| 104 |
+
[ 0 149 12 4 22 21 0 0 0 4]
|
| 105 |
+
[ 0 51 128 0 6 4 0 0 0 2]
|
| 106 |
+
[ 1 20 2 62 40 33 0 0 0 5]
|
| 107 |
+
[ 4 29 2 14 131 50 0 0 0 8]
|
| 108 |
+
[ 10 38 4 15 51 136 0 0 0 10]
|
| 109 |
+
[ 0 0 0 0 0 0 144 6 10 0]
|
| 110 |
+
[ 0 0 0 0 0 0 6 156 26 0]
|
| 111 |
+
[ 0 0 0 0 0 0 22 13 354 0]
|
| 112 |
+
[ 0 0 0 1 1 1 0 0 0 35]]
|
| 113 |
+
f1_macro = 0.6480026358976024
|
| 114 |
+
f1_weighted = 0.6903374531143411
|
| 115 |
+
evaluate 6
|
| 116 |
+
acc = 0.6997347480106101
|
| 117 |
+
acc_and_f1_macro = 0.6746040583246593
|
| 118 |
+
acc_and_f1_weighted = 0.6982406833442424
|
| 119 |
+
class_f1 = [np.float64(0.2318840579710145), np.float64(0.6133909287257019), np.float64(0.7774798927613941), np.float64(0.48765432098765427), np.float64(0.5436105476673427), np.float64(0.5356371490280778), np.float64(0.8834355828220859), np.float64(0.8369565217391304), np.float64(0.8999999999999999), np.float64(0.6846846846846847)]
|
| 120 |
+
class_p = [np.float64(0.2962962962962963), np.float64(0.5657370517928287), np.float64(0.7967032967032966), np.float64(0.4906832298136646), np.float64(0.5254901960784314), np.float64(0.6231155778894473), np.float64(0.8674698795180723), np.float64(0.8555555555555555), np.float64(0.8976982097186701), np.float64(0.5205479452054794)]
|
| 121 |
+
class_r = [np.float64(0.19047619047619047), np.float64(0.6698113207547169), np.float64(0.7591623036649214), np.float64(0.48466257668711654), np.float64(0.5630252100840336), np.float64(0.4696969696969697), np.float64(0.9), np.float64(0.8191489361702128), np.float64(0.9023136246786633), np.float64(1.0)]
|
| 122 |
+
confusion_matrix = [[ 8 2 0 12 8 12 0 0 0 0]
|
| 123 |
+
[ 2 142 18 6 26 14 0 0 0 4]
|
| 124 |
+
[ 0 32 145 2 8 4 0 0 0 0]
|
| 125 |
+
[ 1 17 7 79 35 19 0 0 0 5]
|
| 126 |
+
[ 8 20 8 28 134 26 0 0 0 14]
|
| 127 |
+
[ 8 38 4 34 44 124 0 0 0 12]
|
| 128 |
+
[ 0 0 0 0 0 0 144 6 10 0]
|
| 129 |
+
[ 0 0 0 0 0 0 4 154 30 0]
|
| 130 |
+
[ 0 0 0 0 0 0 18 20 351 0]
|
| 131 |
+
[ 0 0 0 0 0 0 0 0 0 38]]
|
| 132 |
+
f1_macro = 0.6494733686387086
|
| 133 |
+
f1_weighted = 0.6967466186778747
|
| 134 |
+
evaluate 7
|
| 135 |
+
acc = 0.6949602122015915
|
| 136 |
+
acc_and_f1_macro = 0.6736449120606118
|
| 137 |
+
acc_and_f1_weighted = 0.6941753333487539
|
| 138 |
+
class_f1 = [np.float64(0.2222222222222222), np.float64(0.5967741935483871), np.float64(0.7543859649122806), np.float64(0.4745762711864407), np.float64(0.5376782077393076), np.float64(0.5404339250493096), np.float64(0.8795180722891567), np.float64(0.8421052631578947), np.float64(0.9014084507042253), np.float64(0.7741935483870966)]
|
| 139 |
+
class_p = [np.float64(0.26666666666666666), np.float64(0.5211267605633803), np.float64(0.8543046357615894), np.float64(0.5303030303030303), np.float64(0.5217391304347826), np.float64(0.5637860082304527), np.float64(0.8488372093023255), np.float64(0.8786127167630058), np.float64(0.8979591836734694), np.float64(0.6545454545454545)]
|
| 140 |
+
class_r = [np.float64(0.19047619047619047), np.float64(0.6981132075471698), np.float64(0.675392670157068), np.float64(0.4294478527607362), np.float64(0.5546218487394958), np.float64(0.5189393939393939), np.float64(0.9125), np.float64(0.8085106382978723), np.float64(0.9048843187660668), np.float64(0.9473684210526315)]
|
| 141 |
+
confusion_matrix = [[ 8 4 0 12 6 12 0 0 0 0]
|
| 142 |
+
[ 2 148 14 4 24 18 0 0 0 2]
|
| 143 |
+
[ 2 48 129 0 8 4 0 0 0 0]
|
| 144 |
+
[ 1 24 0 70 35 28 0 0 0 5]
|
| 145 |
+
[ 7 24 4 22 132 43 0 0 0 6]
|
| 146 |
+
[ 10 36 4 23 48 137 0 0 0 6]
|
| 147 |
+
[ 0 0 0 0 0 0 146 4 10 0]
|
| 148 |
+
[ 0 0 0 0 0 0 6 152 30 0]
|
| 149 |
+
[ 0 0 0 0 0 0 20 17 352 0]
|
| 150 |
+
[ 0 0 0 1 0 1 0 0 0 36]]
|
| 151 |
+
f1_macro = 0.652329611919632
|
| 152 |
+
f1_weighted = 0.6933904544959164
|
| 153 |
+
evaluate 8
|
| 154 |
+
acc = 0.6997347480106101
|
| 155 |
+
acc_and_f1_macro = 0.6799997041569643
|
| 156 |
+
acc_and_f1_weighted = 0.6995116358901213
|
| 157 |
+
class_f1 = [np.float64(0.2631578947368421), np.float64(0.6058091286307054), np.float64(0.76878612716763), np.float64(0.4935897435897436), np.float64(0.5210084033613446), np.float64(0.55078125), np.float64(0.8834355828220859), np.float64(0.8510638297872339), np.float64(0.9041450777202072), np.float64(0.7608695652173912)]
|
| 158 |
+
class_p = [np.float64(0.29411764705882354), np.float64(0.5407407407407407), np.float64(0.8580645161290322), np.float64(0.5167785234899329), np.float64(0.5210084033613446), np.float64(0.5685483870967742), np.float64(0.8674698795180723), np.float64(0.851063829787234), np.float64(0.9112271540469974), np.float64(0.6481481481481481)]
|
| 159 |
+
class_r = [np.float64(0.23809523809523808), np.float64(0.6886792452830188), np.float64(0.6963350785340314), np.float64(0.4723926380368098), np.float64(0.5210084033613446), np.float64(0.5340909090909091), np.float64(0.9), np.float64(0.851063829787234), np.float64(0.897172236503856), np.float64(0.9210526315789473)]
|
| 160 |
+
confusion_matrix = [[ 10 2 0 12 6 12 0 0 0 0]
|
| 161 |
+
[ 2 146 14 4 26 18 0 0 0 2]
|
| 162 |
+
[ 0 44 133 2 8 4 0 0 0 0]
|
| 163 |
+
[ 4 22 0 77 30 25 0 0 0 5]
|
| 164 |
+
[ 8 22 4 28 124 46 0 0 0 6]
|
| 165 |
+
[ 10 34 4 25 44 141 0 0 0 6]
|
| 166 |
+
[ 0 0 0 0 0 0 144 6 10 0]
|
| 167 |
+
[ 0 0 0 0 0 0 4 160 24 0]
|
| 168 |
+
[ 0 0 0 0 0 0 18 22 349 0]
|
| 169 |
+
[ 0 0 0 1 0 2 0 0 0 35]]
|
| 170 |
+
f1_macro = 0.6602646603033184
|
| 171 |
+
f1_weighted = 0.6992885237696326
|
| 172 |
+
evaluate 9
|
| 173 |
+
acc = 0.6944297082228117
|
| 174 |
+
acc_and_f1_macro = 0.6740689450220392
|
| 175 |
+
acc_and_f1_weighted = 0.6939169890732269
|
| 176 |
+
class_f1 = [np.float64(0.2222222222222222), np.float64(0.6033057851239669), np.float64(0.76878612716763), np.float64(0.4838709677419355), np.float64(0.5206611570247934), np.float64(0.5401174168297457), np.float64(0.8727272727272727), np.float64(0.837465564738292), np.float64(0.9014084507042253), np.float64(0.7865168539325842)]
|
| 177 |
+
class_p = [np.float64(0.26666666666666666), np.float64(0.5367647058823529), np.float64(0.8580645161290322), np.float64(0.5102040816326531), np.float64(0.5121951219512195), np.float64(0.5587044534412956), np.float64(0.8470588235294118), np.float64(0.8685714285714285), np.float64(0.8979591836734694), np.float64(0.6862745098039216)]
|
| 178 |
+
class_r = [np.float64(0.19047619047619047), np.float64(0.6886792452830188), np.float64(0.6963350785340314), np.float64(0.4601226993865031), np.float64(0.5294117647058824), np.float64(0.5227272727272727), np.float64(0.9), np.float64(0.8085106382978723), np.float64(0.9048843187660668), np.float64(0.9210526315789473)]
|
| 179 |
+
confusion_matrix = [[ 8 2 0 12 6 14 0 0 0 0]
|
| 180 |
+
[ 2 146 14 4 26 18 0 0 0 2]
|
| 181 |
+
[ 0 44 133 2 8 4 0 0 0 0]
|
| 182 |
+
[ 4 22 0 75 32 25 0 0 0 5]
|
| 183 |
+
[ 8 22 4 26 126 46 0 0 0 6]
|
| 184 |
+
[ 8 36 4 27 48 138 0 0 0 3]
|
| 185 |
+
[ 0 0 0 0 0 0 144 6 10 0]
|
| 186 |
+
[ 0 0 0 0 0 0 6 152 30 0]
|
| 187 |
+
[ 0 0 0 0 0 0 20 17 352 0]
|
| 188 |
+
[ 0 0 0 1 0 2 0 0 0 35]]
|
| 189 |
+
f1_macro = 0.6537081818212667
|
| 190 |
+
f1_weighted = 0.6934042699236419
|
model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4c17da51ee001d45bde6fa33740a0130fb17c72c4c137b2bc371dab3e1e08f4b
|
| 3 |
+
size 1112235744
|
tokenizer.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
tokenizer_config.json
ADDED
|
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"add_prefix_space": false,
|
| 3 |
+
"backend": "tokenizers",
|
| 4 |
+
"bos_token": "<s>",
|
| 5 |
+
"clean_up_tokenization_spaces": true,
|
| 6 |
+
"cls_token": "<s>",
|
| 7 |
+
"do_lower_case": false,
|
| 8 |
+
"eos_token": "</s>",
|
| 9 |
+
"errors": "replace",
|
| 10 |
+
"is_local": false,
|
| 11 |
+
"mask_token": "<mask>",
|
| 12 |
+
"model_max_length": 512,
|
| 13 |
+
"pad_token": "<pad>",
|
| 14 |
+
"sep_token": "</s>",
|
| 15 |
+
"tokenizer_class": "RobertaTokenizer",
|
| 16 |
+
"trim_offsets": true,
|
| 17 |
+
"unk_token": "<unk>"
|
| 18 |
+
}
|
training_args.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8326842a5c7bc2e1e489f64889cf28cc938f2cec75e85efaba88b54ffa77d2b0
|
| 3 |
+
size 2769
|