taglish-roberta-tactic / comprehensive_results_tactic.json

Upload folder using huggingface_hub

2812b09 verified 2 months ago

3.44 kB

	{
	"val": {
	"loss": 0.2741684317588806,
	"accuracy": 0.9154929577464789,
	"macro_f1": 0.9149011138355096,
	"weighted_f1": 0.9152502181169738,
	"distortion_precision": 0.8918918918918919,
	"distortion_recall": 0.9428571428571428,
	"distortion_f1": 0.9166666666666666,
	"trivialization_precision": 0.8974358974358975,
	"trivialization_recall": 0.9459459459459459,
	"trivialization_f1": 0.9210526315789473,
	"coercion_precision": 0.9428571428571428,
	"coercion_recall": 0.9166666666666666,
	"coercion_f1": 0.9295774647887324,
	"knowledge_precision": 0.9354838709677419,
	"knowledge_recall": 0.8529411764705882,
	"knowledge_f1": 0.8923076923076924,
	"runtime": 12.4031,
	"samples_per_second": 11.449,
	"steps_per_second": 0.726,
	"confusion_matrix": [
	[
	33,
	1,
	0,
	1
	],
	[
	0,
	35,
	1,
	1
	],
	[
	1,
	2,
	33,
	0
	],
	[
	3,
	1,
	1,
	29
	]
	]
	},
	"test_id": {
	"loss": 0.27421480417251587,
	"accuracy": 0.9084507042253521,
	"macro_f1": 0.9085461883825343,
	"weighted_f1": 0.9084405799722616,
	"distortion_precision": 0.9117647058823529,
	"distortion_recall": 0.8611111111111112,
	"distortion_f1": 0.8857142857142857,
	"trivialization_precision": 0.8611111111111112,
	"trivialization_recall": 0.9393939393939394,
	"trivialization_f1": 0.8985507246376812,
	"coercion_precision": 0.9285714285714286,
	"coercion_recall": 0.9285714285714286,
	"coercion_f1": 0.9285714285714286,
	"knowledge_precision": 0.9318181818181818,
	"knowledge_recall": 0.9111111111111111,
	"knowledge_f1": 0.9213483146067416,
	"runtime": 12.2783,
	"samples_per_second": 11.565,
	"steps_per_second": 0.733,
	"confusion_matrix": [
	[
	31,
	3,
	1,
	1
	],
	[
	0,
	31,
	0,
	2
	],
	[
	1,
	1,
	26,
	0
	],
	[
	2,
	1,
	1,
	41
	]
	]
	},
	"test_ood": {
	"loss": 1.1873223781585693,
	"accuracy": 0.6086956521739131,
	"macro_f1": 0.5871759832188721,
	"weighted_f1": 0.6067226831556392,
	"distortion_precision": 0.6787564766839378,
	"distortion_recall": 0.645320197044335,
	"distortion_f1": 0.6616161616161617,
	"trivialization_precision": 0.4918032786885246,
	"trivialization_recall": 0.7692307692307693,
	"trivialization_f1": 0.6,
	"coercion_precision": 0.5625,
	"coercion_recall": 0.5510204081632653,
	"coercion_f1": 0.5567010309278351,
	"knowledge_precision": 0.6486486486486487,
	"knowledge_recall": 0.4485981308411215,
	"knowledge_f1": 0.5303867403314917,
	"runtime": 13.0062,
	"samples_per_second": 33.599,
	"steps_per_second": 2.153,
	"confusion_matrix": [
	[
	131,
	47,
	12,
	13
	],
	[
	10,
	60,
	2,
	6
	],
	[
	9,
	6,
	27,
	7
	],
	[
	43,
	9,
	7,
	48
	]
	]
	},
	"delta_f1": 0.3213702051636622,
	"delta_f1_interpretation": "\u274c Significant overfitting (domain adaptation needed)"
	}