Training in progress, epoch 1

Files changed (8) hide show

.gitattributes CHANGED Viewed

@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+tokenizer.json filter=lfs diff=lfs merge=lfs -text

best_threshold.json ADDED Viewed

	@@ -0,0 +1 @@


1	+ {"best_threshold": 0.5}

config.json ADDED Viewed

+{
+  "architectures": [
+    "DebertaV2ForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "bos_token_id": 1,
+  "dtype": "float16",
+  "eos_token_id": 2,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "entailment",
+    "1": "neutral",
+    "2": "contradiction"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "contradiction": 2,
+    "entailment": 0,
+    "neutral": 1
+  },
+  "layer_norm_eps": 1e-07,
+  "legacy": true,
+  "max_position_embeddings": 512,
+  "max_relative_positions": -1,
+  "model_type": "deberta-v2",
+  "norm_rel_ebd": "layer_norm",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "pad_token_id": 0,
+  "pooler_dropout": 0,
+  "pooler_hidden_act": "gelu",
+  "pooler_hidden_size": 768,
+  "pos_att_type": [
+    "p2c",
+    "c2p"
+  ],
+  "position_biased_input": false,
+  "position_buckets": 256,
+  "relative_attention": true,
+  "share_att_key": true,
+  "tie_word_embeddings": true,
+  "transformers_version": "5.0.0",
+  "type_vocab_size": 0,
+  "use_cache": false,
+  "vocab_size": 251000
+}

model.safetensors ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:29b8ba7c2ffae85b1a074667b8d12f632c4d023a504c84e94a456cbc767e6dd9
+size 557647822

test_per_outlet_summary.csv ADDED Viewed

+outlet,support,precision_entailment,recall_entailment,f1_entailment,precision_contradiction,recall_contradiction,f1_contradiction,accuracy,macro_f1,weighted_f1
+Bild,180,0.12804878048780488,0.875,0.22340425531914893,0.8125,0.08333333333333333,0.1511627906976744,0.18888888888888888,0.18728352300841167,0.16079498598053768
+FAZ,188,0.25675675675675674,0.7755102040816326,0.38578680203045684,0.725,0.20863309352517986,0.3240223463687151,0.35638297872340424,0.354904574199586,0.3401205289614031
+SZ,180,0.12422360248447205,0.9523809523809523,0.21978021978021978,0.9473684210526315,0.11320754716981132,0.20224719101123595,0.2111111111111111,0.21101370539572786,0.20429271103428404
+Spiegel,180,0.13986013986013987,0.7407407407407407,0.23529411764705882,0.8108108108108109,0.19607843137254902,0.3157894736842105,0.2777777777777778,0.27554179566563464,0.30371517027863776
+Welt,180,0.22875816993464052,0.8536585365853658,0.36082474226804123,0.7777777777777778,0.1510791366906475,0.25301204819277107,0.3111111111111111,0.30691839523040615,0.2775693840654715
+Zeit,180,0.2549019607843137,0.8478260869565217,0.39195979899497485,0.7407407407407407,0.14925373134328357,0.2484472049689441,0.3277777777777778,0.32020350198195946,0.2851226456644853

tokenizer.json ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:a66269b2b7b04009c9e482ef6a99accee231b6822b83e7eb6df36626b61db43a
+size 16014878

tokenizer_config.json ADDED Viewed

+{
+  "add_prefix_space": true,
+  "backend": "tokenizers",
+  "bos_token": "[CLS]",
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": false,
+  "eos_token": "[SEP]",
+  "is_local": false,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "sp_model_kwargs": {},
+  "split_by_punct": false,
+  "tokenizer_class": "DebertaV2Tokenizer",
+  "unk_id": 3,
+  "unk_token": "[UNK]",
+  "vocab_type": "spm"
+}

training_args.bin ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:38747397f40204ef789b870a748edc5308acbfeed87cf84f7d27c55161a4e3ae
+size 5265