Upload folder using huggingface_hub
Browse files- config.json +59 -0
- eval_results.txt +190 -0
- model.safetensors +3 -0
- tokenizer.json +0 -0
- tokenizer_config.json +18 -0
- training_args.bin +3 -0
config.json
ADDED
|
@@ -0,0 +1,59 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"add_cross_attention": false,
|
| 3 |
+
"architectures": [
|
| 4 |
+
"RobertaForSequenceClassification"
|
| 5 |
+
],
|
| 6 |
+
"attention_probs_dropout_prob": 0.1,
|
| 7 |
+
"bos_token_id": 0,
|
| 8 |
+
"classifier_dropout": null,
|
| 9 |
+
"dtype": "float32",
|
| 10 |
+
"eos_token_id": 2,
|
| 11 |
+
"hidden_act": "gelu",
|
| 12 |
+
"hidden_dropout_prob": 0.1,
|
| 13 |
+
"hidden_size": 1024,
|
| 14 |
+
"id2label": {
|
| 15 |
+
"0": "LABEL_0",
|
| 16 |
+
"1": "LABEL_1",
|
| 17 |
+
"2": "LABEL_2",
|
| 18 |
+
"3": "LABEL_3",
|
| 19 |
+
"4": "LABEL_4",
|
| 20 |
+
"5": "LABEL_5",
|
| 21 |
+
"6": "LABEL_6",
|
| 22 |
+
"7": "LABEL_7",
|
| 23 |
+
"8": "LABEL_8",
|
| 24 |
+
"9": "LABEL_9",
|
| 25 |
+
"10": "LABEL_10",
|
| 26 |
+
"11": "LABEL_11"
|
| 27 |
+
},
|
| 28 |
+
"initializer_range": 0.02,
|
| 29 |
+
"intermediate_size": 4096,
|
| 30 |
+
"is_decoder": false,
|
| 31 |
+
"label2id": {
|
| 32 |
+
"LABEL_0": 0,
|
| 33 |
+
"LABEL_1": 1,
|
| 34 |
+
"LABEL_10": 10,
|
| 35 |
+
"LABEL_11": 11,
|
| 36 |
+
"LABEL_2": 2,
|
| 37 |
+
"LABEL_3": 3,
|
| 38 |
+
"LABEL_4": 4,
|
| 39 |
+
"LABEL_5": 5,
|
| 40 |
+
"LABEL_6": 6,
|
| 41 |
+
"LABEL_7": 7,
|
| 42 |
+
"LABEL_8": 8,
|
| 43 |
+
"LABEL_9": 9
|
| 44 |
+
},
|
| 45 |
+
"layer_norm_eps": 1e-05,
|
| 46 |
+
"max_position_embeddings": 514,
|
| 47 |
+
"model_type": "roberta",
|
| 48 |
+
"num_attention_heads": 16,
|
| 49 |
+
"num_hidden_layers": 24,
|
| 50 |
+
"output_past": true,
|
| 51 |
+
"pad_token_id": 1,
|
| 52 |
+
"position_embedding_type": "absolute",
|
| 53 |
+
"problem_type": "single_label_classification",
|
| 54 |
+
"tie_word_embeddings": true,
|
| 55 |
+
"transformers_version": "5.0.0",
|
| 56 |
+
"type_vocab_size": 1,
|
| 57 |
+
"use_cache": true,
|
| 58 |
+
"vocab_size": 250002
|
| 59 |
+
}
|
eval_results.txt
ADDED
|
@@ -0,0 +1,190 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
evaluate 0
|
| 2 |
+
acc = 0.6891246684350133
|
| 3 |
+
acc_and_f1_macro = 0.6334905949921364
|
| 4 |
+
acc_and_f1_weighted = 0.6756927166539615
|
| 5 |
+
class_f1 = [np.float64(nan), np.float64(0.6070038910505835), np.float64(0.7111111111111112), np.float64(0.023668639053254437), np.float64(0.5491651205936919), np.float64(0.5770491803278688), np.float64(0.9192546583850932), np.float64(0.8854166666666667), np.float64(0.9293193717277487), np.float64(0.5765765765765766)]
|
| 6 |
+
class_p = [np.float64(nan), np.float64(0.5165562913907285), np.float64(0.9032258064516129), np.float64(0.3333333333333333), np.float64(0.49169435215946844), np.float64(0.5086705202312138), np.float64(0.9135802469135802), np.float64(0.8673469387755102), np.float64(0.9466666666666667), np.float64(0.4383561643835616)]
|
| 7 |
+
class_r = [np.float64(0.0), np.float64(0.7358490566037735), np.float64(0.5863874345549738), np.float64(0.012269938650306749), np.float64(0.6218487394957983), np.float64(0.6666666666666666), np.float64(0.925), np.float64(0.9042553191489362), np.float64(0.9125964010282777), np.float64(0.8421052631578947)]
|
| 8 |
+
confusion_matrix = [[ 0 10 0 0 2 29 0 0 0 1]
|
| 9 |
+
[ 0 156 8 0 10 30 0 0 0 8]
|
| 10 |
+
[ 0 65 112 0 6 4 0 0 0 4]
|
| 11 |
+
[ 0 19 0 2 83 55 0 0 0 4]
|
| 12 |
+
[ 0 22 2 2 148 49 0 0 0 15]
|
| 13 |
+
[ 0 28 2 2 47 176 0 0 0 9]
|
| 14 |
+
[ 0 0 0 0 0 0 148 6 6 0]
|
| 15 |
+
[ 0 0 0 0 0 0 4 170 14 0]
|
| 16 |
+
[ 0 0 0 0 2 2 10 20 355 0]
|
| 17 |
+
[ 0 2 0 0 3 1 0 0 0 32]]
|
| 18 |
+
f1_macro = 0.5778565215492596
|
| 19 |
+
f1_weighted = 0.6622607648729097
|
| 20 |
+
evaluate 1
|
| 21 |
+
acc = 0.7480106100795756
|
| 22 |
+
acc_and_f1_macro = 0.7075732467155612
|
| 23 |
+
acc_and_f1_weighted = 0.7450751936656139
|
| 24 |
+
class_f1 = [np.float64(nan), np.float64(0.7281105990783409), np.float64(0.7857142857142857), np.float64(0.5168539325842696), np.float64(0.6150234741784038), np.float64(0.6467486818980668), np.float64(0.9113924050632911), np.float64(0.8550368550368551), np.float64(0.9267643142476697), np.float64(0.6857142857142856)]
|
| 25 |
+
class_p = [np.float64(nan), np.float64(0.7117117117117117), np.float64(0.8265895953757225), np.float64(0.47668393782383417), np.float64(0.6968085106382979), np.float64(0.6032786885245902), np.float64(0.9230769230769231), np.float64(0.7945205479452054), np.float64(0.9613259668508287), np.float64(0.5373134328358209)]
|
| 26 |
+
class_r = [np.float64(0.0), np.float64(0.7452830188679245), np.float64(0.7486910994764397), np.float64(0.5644171779141104), np.float64(0.5504201680672269), np.float64(0.696969696969697), np.float64(0.9), np.float64(0.925531914893617), np.float64(0.8946015424164524), np.float64(0.9473684210526315)]
|
| 27 |
+
confusion_matrix = [[ 0 4 0 18 0 20 0 0 0 0]
|
| 28 |
+
[ 0 158 16 4 10 24 0 0 0 0]
|
| 29 |
+
[ 0 33 143 2 7 4 0 0 0 2]
|
| 30 |
+
[ 0 5 8 92 26 28 0 0 0 4]
|
| 31 |
+
[ 0 16 2 35 131 44 0 0 0 10]
|
| 32 |
+
[ 0 6 4 41 14 184 0 0 0 15]
|
| 33 |
+
[ 0 0 0 0 0 0 144 12 4 0]
|
| 34 |
+
[ 0 0 0 0 0 0 4 174 10 0]
|
| 35 |
+
[ 0 0 0 0 0 0 8 33 348 0]
|
| 36 |
+
[ 0 0 0 1 0 1 0 0 0 36]]
|
| 37 |
+
f1_macro = 0.6671358833515468
|
| 38 |
+
f1_weighted = 0.7421397772516521
|
| 39 |
+
evaluate 2
|
| 40 |
+
acc = 0.7305039787798409
|
| 41 |
+
acc_and_f1_macro = 0.7050249560062639
|
| 42 |
+
acc_and_f1_weighted = 0.7287820591439015
|
| 43 |
+
class_f1 = [np.float64(0.13793103448275862), np.float64(0.6650602409638554), np.float64(0.7570332480818416), np.float64(0.49221183800623053), np.float64(0.5862068965517242), np.float64(0.5836575875486382), np.float64(0.9135802469135802), np.float64(0.8756756756756756), np.float64(0.9307692307692307), np.float64(0.8533333333333334)]
|
| 44 |
+
class_p = [np.float64(0.25), np.float64(0.6798029556650246), np.float64(0.74), np.float64(0.5), np.float64(0.5387323943661971), np.float64(0.6), np.float64(0.9024390243902439), np.float64(0.8901098901098901), np.float64(0.928388746803069), np.float64(0.8648648648648649)]
|
| 45 |
+
class_r = [np.float64(0.09523809523809523), np.float64(0.6509433962264151), np.float64(0.774869109947644), np.float64(0.48466257668711654), np.float64(0.6428571428571429), np.float64(0.5681818181818182), np.float64(0.925), np.float64(0.8617021276595744), np.float64(0.9331619537275064), np.float64(0.8421052631578947)]
|
| 46 |
+
confusion_matrix = [[ 4 4 2 12 8 12 0 0 0 0]
|
| 47 |
+
[ 4 138 36 0 22 12 0 0 0 0]
|
| 48 |
+
[ 0 29 148 2 4 8 0 0 0 0]
|
| 49 |
+
[ 2 8 8 79 35 29 0 0 0 2]
|
| 50 |
+
[ 2 12 2 30 153 37 0 0 0 2]
|
| 51 |
+
[ 4 11 4 34 60 150 0 0 0 1]
|
| 52 |
+
[ 0 0 0 0 0 0 148 8 4 0]
|
| 53 |
+
[ 0 0 0 0 0 0 2 162 24 0]
|
| 54 |
+
[ 0 0 0 0 0 0 14 12 363 0]
|
| 55 |
+
[ 0 1 0 1 2 2 0 0 0 32]]
|
| 56 |
+
f1_macro = 0.679545933232687
|
| 57 |
+
f1_weighted = 0.7270601395079621
|
| 58 |
+
evaluate 3
|
| 59 |
+
acc = 0.7336870026525198
|
| 60 |
+
acc_and_f1_macro = 0.7098841287434561
|
| 61 |
+
acc_and_f1_weighted = 0.7313466077268491
|
| 62 |
+
class_f1 = [np.float64(0.2898550724637681), np.float64(0.7109004739336493), np.float64(0.8010610079575596), np.float64(0.416), np.float64(0.5510597302504817), np.float64(0.5884413309982487), np.float64(0.9308176100628932), np.float64(0.8681318681318682), np.float64(0.9318181818181819), np.float64(0.7727272727272727)]
|
| 63 |
+
class_p = [np.float64(0.37037037037037035), np.float64(0.7142857142857143), np.float64(0.8118279569892473), np.float64(0.5977011494252874), np.float64(0.5088967971530249), np.float64(0.5472312703583062), np.float64(0.9367088607594937), np.float64(0.8977272727272727), np.float64(0.9156327543424317), np.float64(0.68)]
|
| 64 |
+
class_r = [np.float64(0.23809523809523808), np.float64(0.7075471698113207), np.float64(0.7905759162303665), np.float64(0.31901840490797545), np.float64(0.6008403361344538), np.float64(0.6363636363636364), np.float64(0.925), np.float64(0.8404255319148937), np.float64(0.9485861182519281), np.float64(0.8947368421052632)]
|
| 65 |
+
confusion_matrix = [[ 10 2 0 2 4 24 0 0 0 0]
|
| 66 |
+
[ 4 150 22 2 14 20 0 0 0 0]
|
| 67 |
+
[ 0 27 151 0 7 4 0 0 0 2]
|
| 68 |
+
[ 5 6 7 52 50 39 0 0 0 4]
|
| 69 |
+
[ 4 14 4 15 143 50 0 0 0 8]
|
| 70 |
+
[ 4 11 2 16 61 168 0 0 0 2]
|
| 71 |
+
[ 0 0 0 0 0 0 148 6 6 0]
|
| 72 |
+
[ 0 0 0 0 0 0 2 158 28 0]
|
| 73 |
+
[ 0 0 0 0 0 0 8 12 369 0]
|
| 74 |
+
[ 0 0 0 0 2 2 0 0 0 34]]
|
| 75 |
+
f1_macro = 0.6860812548343923
|
| 76 |
+
f1_weighted = 0.7290062128011783
|
| 77 |
+
evaluate 4
|
| 78 |
+
acc = 0.736870026525199
|
| 79 |
+
acc_and_f1_macro = 0.7133907423644683
|
| 80 |
+
acc_and_f1_weighted = 0.7340449446819173
|
| 81 |
+
class_f1 = [np.float64(0.30303030303030304), np.float64(0.722466960352423), np.float64(0.7843137254901961), np.float64(0.4126984126984127), np.float64(0.5469387755102041), np.float64(0.6061643835616437), np.float64(0.925925925925926), np.float64(0.8663101604278075), np.float64(0.9355670103092784), np.float64(0.7956989247311828)]
|
| 82 |
+
class_p = [np.float64(0.4166666666666667), np.float64(0.6776859504132231), np.float64(0.8433734939759037), np.float64(0.5842696629213483), np.float64(0.5317460317460317), np.float64(0.553125), np.float64(0.9146341463414634), np.float64(0.8709677419354839), np.float64(0.937984496124031), np.float64(0.6727272727272727)]
|
| 83 |
+
class_r = [np.float64(0.23809523809523808), np.float64(0.7735849056603774), np.float64(0.7329842931937173), np.float64(0.31901840490797545), np.float64(0.5630252100840336), np.float64(0.6704545454545454), np.float64(0.9375), np.float64(0.8617021276595744), np.float64(0.9331619537275064), np.float64(0.9736842105263158)]
|
| 84 |
+
confusion_matrix = [[ 10 2 0 0 6 24 0 0 0 0]
|
| 85 |
+
[ 2 164 12 0 10 24 0 0 0 0]
|
| 86 |
+
[ 0 37 140 0 6 6 0 0 0 2]
|
| 87 |
+
[ 4 11 8 52 51 32 0 0 0 5]
|
| 88 |
+
[ 2 14 4 21 134 57 0 0 0 6]
|
| 89 |
+
[ 6 14 2 16 44 177 0 0 0 5]
|
| 90 |
+
[ 0 0 0 0 0 0 150 8 2 0]
|
| 91 |
+
[ 0 0 0 0 0 0 4 162 22 0]
|
| 92 |
+
[ 0 0 0 0 0 0 10 16 363 0]
|
| 93 |
+
[ 0 0 0 0 1 0 0 0 0 37]]
|
| 94 |
+
f1_macro = 0.6899114582037378
|
| 95 |
+
f1_weighted = 0.7312198628386355
|
| 96 |
+
evaluate 5
|
| 97 |
+
acc = 0.736870026525199
|
| 98 |
+
acc_and_f1_macro = 0.7161707259870482
|
| 99 |
+
acc_and_f1_weighted = 0.7354812627355416
|
| 100 |
+
class_f1 = [np.float64(0.4), np.float64(0.7264150943396227), np.float64(0.7903225806451613), np.float64(0.45692883895131087), np.float64(0.5497076023391811), np.float64(0.5776965265082266), np.float64(0.925925925925926), np.float64(0.870967741935484), np.float64(0.9383033419023136), np.float64(0.7184466019417477)]
|
| 101 |
+
class_p = [np.float64(0.5), np.float64(0.7264150943396226), np.float64(0.8121546961325967), np.float64(0.5865384615384616), np.float64(0.5127272727272727), np.float64(0.558303886925795), np.float64(0.9146341463414634), np.float64(0.8804347826086957), np.float64(0.9383033419023136), np.float64(0.5692307692307692)]
|
| 102 |
+
class_r = [np.float64(0.3333333333333333), np.float64(0.7264150943396226), np.float64(0.7696335078534031), np.float64(0.37423312883435583), np.float64(0.592436974789916), np.float64(0.5984848484848485), np.float64(0.9375), np.float64(0.8617021276595744), np.float64(0.9383033419023136), np.float64(0.9736842105263158)]
|
| 103 |
+
confusion_matrix = [[ 14 0 2 2 5 19 0 0 0 0]
|
| 104 |
+
[ 2 154 18 0 12 26 0 0 0 0]
|
| 105 |
+
[ 0 33 147 0 5 4 0 0 0 2]
|
| 106 |
+
[ 4 7 8 61 53 26 0 0 0 4]
|
| 107 |
+
[ 2 10 4 23 141 50 0 0 0 8]
|
| 108 |
+
[ 6 8 2 18 58 158 0 0 0 14]
|
| 109 |
+
[ 0 0 0 0 0 0 150 8 2 0]
|
| 110 |
+
[ 0 0 0 0 0 0 4 162 22 0]
|
| 111 |
+
[ 0 0 0 0 0 0 10 14 365 0]
|
| 112 |
+
[ 0 0 0 0 1 0 0 0 0 37]]
|
| 113 |
+
f1_macro = 0.6954714254488974
|
| 114 |
+
f1_weighted = 0.7340924989458844
|
| 115 |
+
evaluate 6
|
| 116 |
+
acc = 0.7400530503978779
|
| 117 |
+
acc_and_f1_macro = 0.7194814775633938
|
| 118 |
+
acc_and_f1_weighted = 0.7381404877009761
|
| 119 |
+
class_f1 = [np.float64(0.37681159420289856), np.float64(0.7247706422018348), np.float64(0.8032786885245902), np.float64(0.4274809160305344), np.float64(0.5483234714003945), np.float64(0.6074600355239785), np.float64(0.920245398773006), np.float64(0.870967741935484), np.float64(0.9355670103092784), np.float64(0.7741935483870966)]
|
| 120 |
+
class_p = [np.float64(0.48148148148148145), np.float64(0.7053571428571429), np.float64(0.84), np.float64(0.5656565656565656), np.float64(0.516728624535316), np.float64(0.5719063545150501), np.float64(0.9036144578313253), np.float64(0.8804347826086957), np.float64(0.937984496124031), np.float64(0.6545454545454545)]
|
| 121 |
+
class_r = [np.float64(0.30952380952380953), np.float64(0.7452830188679245), np.float64(0.7696335078534031), np.float64(0.34355828220858897), np.float64(0.5840336134453782), np.float64(0.6477272727272727), np.float64(0.9375), np.float64(0.8617021276595744), np.float64(0.9331619537275064), np.float64(0.9473684210526315)]
|
| 122 |
+
confusion_matrix = [[ 13 2 0 2 5 20 0 0 0 0]
|
| 123 |
+
[ 2 158 14 0 12 26 0 0 0 0]
|
| 124 |
+
[ 0 33 147 0 5 4 0 0 0 2]
|
| 125 |
+
[ 4 8 8 56 54 29 0 0 0 4]
|
| 126 |
+
[ 2 12 4 25 139 48 0 0 0 8]
|
| 127 |
+
[ 6 11 2 16 53 171 0 0 0 5]
|
| 128 |
+
[ 0 0 0 0 0 0 150 8 2 0]
|
| 129 |
+
[ 0 0 0 0 0 0 4 162 22 0]
|
| 130 |
+
[ 0 0 0 0 0 0 12 14 363 0]
|
| 131 |
+
[ 0 0 0 0 1 1 0 0 0 36]]
|
| 132 |
+
f1_macro = 0.6989099047289097
|
| 133 |
+
f1_weighted = 0.7362279250040741
|
| 134 |
+
evaluate 7
|
| 135 |
+
acc = 0.7400530503978779
|
| 136 |
+
acc_and_f1_macro = 0.719712348383416
|
| 137 |
+
acc_and_f1_weighted = 0.7383193385351758
|
| 138 |
+
class_f1 = [np.float64(0.37681159420289856), np.float64(0.7205542725173211), np.float64(0.7989130434782609), np.float64(0.43609022556390975), np.float64(0.5504950495049505), np.float64(0.6014234875444839), np.float64(0.920245398773006), np.float64(0.877005347593583), np.float64(0.937984496124031), np.float64(0.7741935483870966)]
|
| 139 |
+
class_p = [np.float64(0.48148148148148145), np.float64(0.7058823529411765), np.float64(0.8305084745762712), np.float64(0.5631067961165048), np.float64(0.5205992509363296), np.float64(0.5671140939597316), np.float64(0.9036144578313253), np.float64(0.8817204301075269), np.float64(0.9428571428571428), np.float64(0.6545454545454545)]
|
| 140 |
+
class_r = [np.float64(0.30952380952380953), np.float64(0.7358490566037735), np.float64(0.7696335078534031), np.float64(0.3558282208588957), np.float64(0.5840336134453782), np.float64(0.6401515151515151), np.float64(0.9375), np.float64(0.8723404255319149), np.float64(0.9331619537275064), np.float64(0.9473684210526315)]
|
| 141 |
+
confusion_matrix = [[ 13 2 0 2 5 20 0 0 0 0]
|
| 142 |
+
[ 2 156 16 0 12 26 0 0 0 0]
|
| 143 |
+
[ 0 33 147 0 5 4 0 0 0 2]
|
| 144 |
+
[ 4 7 8 58 52 30 0 0 0 4]
|
| 145 |
+
[ 2 12 4 25 139 48 0 0 0 8]
|
| 146 |
+
[ 6 11 2 18 53 169 0 0 0 5]
|
| 147 |
+
[ 0 0 0 0 0 0 150 8 2 0]
|
| 148 |
+
[ 0 0 0 0 0 0 4 164 20 0]
|
| 149 |
+
[ 0 0 0 0 0 0 12 14 363 0]
|
| 150 |
+
[ 0 0 0 0 1 1 0 0 0 36]]
|
| 151 |
+
f1_macro = 0.6993716463689542
|
| 152 |
+
f1_weighted = 0.7365856266724738
|
| 153 |
+
evaluate 8
|
| 154 |
+
acc = 0.7384615384615385
|
| 155 |
+
acc_and_f1_macro = 0.7183460858337962
|
| 156 |
+
acc_and_f1_weighted = 0.7365981877073211
|
| 157 |
+
class_f1 = [np.float64(0.37681159420289856), np.float64(0.7172413793103449), np.float64(0.7989130434782609), np.float64(0.4242424242424243), np.float64(0.5483234714003945), np.float64(0.5989304812834224), np.float64(0.920245398773006), np.float64(0.877005347593583), np.float64(0.937984496124031), np.float64(0.782608695652174)]
|
| 158 |
+
class_p = [np.float64(0.48148148148148145), np.float64(0.6995515695067265), np.float64(0.8305084745762712), np.float64(0.5544554455445545), np.float64(0.516728624535316), np.float64(0.5656565656565656), np.float64(0.9036144578313253), np.float64(0.8817204301075269), np.float64(0.9428571428571428), np.float64(0.6666666666666666)]
|
| 159 |
+
class_r = [np.float64(0.30952380952380953), np.float64(0.7358490566037735), np.float64(0.7696335078534031), np.float64(0.34355828220858897), np.float64(0.5840336134453782), np.float64(0.6363636363636364), np.float64(0.9375), np.float64(0.8723404255319149), np.float64(0.9331619537275064), np.float64(0.9473684210526315)]
|
| 160 |
+
confusion_matrix = [[ 13 2 0 2 5 20 0 0 0 0]
|
| 161 |
+
[ 2 156 16 0 12 26 0 0 0 0]
|
| 162 |
+
[ 0 33 147 0 5 4 0 0 0 2]
|
| 163 |
+
[ 4 7 8 56 54 30 0 0 0 4]
|
| 164 |
+
[ 2 12 4 25 139 48 0 0 0 8]
|
| 165 |
+
[ 6 13 2 18 53 168 0 0 0 4]
|
| 166 |
+
[ 0 0 0 0 0 0 150 8 2 0]
|
| 167 |
+
[ 0 0 0 0 0 0 4 164 20 0]
|
| 168 |
+
[ 0 0 0 0 0 0 12 14 363 0]
|
| 169 |
+
[ 0 0 0 0 1 1 0 0 0 36]]
|
| 170 |
+
f1_macro = 0.6982306332060538
|
| 171 |
+
f1_weighted = 0.7347348369531037
|
| 172 |
+
evaluate 9
|
| 173 |
+
acc = 0.7395225464190981
|
| 174 |
+
acc_and_f1_macro = 0.7192689346869343
|
| 175 |
+
acc_and_f1_weighted = 0.7376388444885733
|
| 176 |
+
class_f1 = [np.float64(0.37681159420289856), np.float64(0.7172413793103449), np.float64(0.7989130434782609), np.float64(0.4242424242424243), np.float64(0.5540275049115914), np.float64(0.6010733452593918), np.float64(0.920245398773006), np.float64(0.877005347593583), np.float64(0.937984496124031), np.float64(0.782608695652174)]
|
| 177 |
+
class_p = [np.float64(0.48148148148148145), np.float64(0.6995515695067265), np.float64(0.8305084745762712), np.float64(0.5544554455445545), np.float64(0.5202952029520295), np.float64(0.5694915254237288), np.float64(0.9036144578313253), np.float64(0.8817204301075269), np.float64(0.9428571428571428), np.float64(0.6666666666666666)]
|
| 178 |
+
class_r = [np.float64(0.30952380952380953), np.float64(0.7358490566037735), np.float64(0.7696335078534031), np.float64(0.34355828220858897), np.float64(0.592436974789916), np.float64(0.6363636363636364), np.float64(0.9375), np.float64(0.8723404255319149), np.float64(0.9331619537275064), np.float64(0.9473684210526315)]
|
| 179 |
+
confusion_matrix = [[ 13 2 0 2 5 20 0 0 0 0]
|
| 180 |
+
[ 2 156 16 0 12 26 0 0 0 0]
|
| 181 |
+
[ 0 33 147 0 5 4 0 0 0 2]
|
| 182 |
+
[ 4 7 8 56 54 30 0 0 0 4]
|
| 183 |
+
[ 2 12 4 25 141 46 0 0 0 8]
|
| 184 |
+
[ 6 13 2 18 53 168 0 0 0 4]
|
| 185 |
+
[ 0 0 0 0 0 0 150 8 2 0]
|
| 186 |
+
[ 0 0 0 0 0 0 4 164 20 0]
|
| 187 |
+
[ 0 0 0 0 0 0 12 14 363 0]
|
| 188 |
+
[ 0 0 0 0 1 1 0 0 0 36]]
|
| 189 |
+
f1_macro = 0.6990153229547705
|
| 190 |
+
f1_weighted = 0.7357551425580484
|
model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dbe9b39d45f0d0572d9b56117df6e5b9cb1975fbeb171e280015236305ade3d2
|
| 3 |
+
size 2239659624
|
tokenizer.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
tokenizer_config.json
ADDED
|
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"add_prefix_space": false,
|
| 3 |
+
"backend": "tokenizers",
|
| 4 |
+
"bos_token": "<s>",
|
| 5 |
+
"clean_up_tokenization_spaces": true,
|
| 6 |
+
"cls_token": "<s>",
|
| 7 |
+
"do_lower_case": false,
|
| 8 |
+
"eos_token": "</s>",
|
| 9 |
+
"errors": "replace",
|
| 10 |
+
"is_local": false,
|
| 11 |
+
"mask_token": "<mask>",
|
| 12 |
+
"model_max_length": 512,
|
| 13 |
+
"pad_token": "<pad>",
|
| 14 |
+
"sep_token": "</s>",
|
| 15 |
+
"tokenizer_class": "RobertaTokenizer",
|
| 16 |
+
"trim_offsets": true,
|
| 17 |
+
"unk_token": "<unk>"
|
| 18 |
+
}
|
training_args.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:82e21a647ced231b2802fd00e6e84be75bf9d0cdc3aa01f55870a2207cd00ff0
|
| 3 |
+
size 2833
|