deberta-prism-v2 / training_report.json
Austin-Groundsetter's picture
Upload folder using huggingface_hub
0f3973a verified
{
"config": {
"base_model": "microsoft/deberta-v3-large",
"num_labels": 25,
"max_length": 512,
"learning_rate": 2e-05,
"weight_decay": 0.01,
"warmup_ratio": 0.1,
"num_train_epochs": 15,
"per_device_train_batch_size": 8,
"per_device_eval_batch_size": 16,
"gradient_accumulation_steps": 4,
"fp16": true,
"early_stopping_patience": 4,
"real_example_weight": 3.0,
"synthetic_example_weight": 1.0,
"focal_alpha": 0.25,
"focal_gamma": 2.0,
"class_weight_cap": 15.0
},
"data": {
"total_rows": 12568,
"train": 10054,
"val": 1257,
"test": 1257,
"labels": 25
},
"train_metrics": {
"train_runtime": 8749.3343,
"train_samples_per_second": 17.237,
"train_steps_per_second": 0.538,
"train_loss": 0.01095637260738344,
"epoch": 14.99
},
"test_metrics": {
"eval_loss": 0.0009040662553161383,
"eval_macro_f1": 0.9955046353163275,
"eval_micro_f1": 0.9959484346224677,
"eval_f1_L01_DISEASE_CLAIM": 1.0,
"eval_f1_L02_STRUCTURE_FUNCTION": 0.9945945945945946,
"eval_f1_L03_UNSUBSTANTIATED_EFFICACY": 1.0,
"eval_f1_L04_DRUG_COMPARISON": 1.0,
"eval_f1_L05_DOSING_INSTRUCTIONS": 1.0,
"eval_f1_L06_IMPLIED_HUMAN_USE": 0.9859154929577465,
"eval_f1_L07_PHARMA_GRADE_CLAIM": 0.9948717948717949,
"eval_f1_L08_TESTIMONIAL_VIOLATION": 1.0,
"eval_f1_L09_MISSING_DISCLAIMER": 0.9948717948717949,
"eval_f1_L10_MISLEADING_DISCLAIMER": 0.9577464788732394,
"eval_f1_L11_MISSING_COA": 1.0,
"eval_f1_L12_FDA_FALSE_CLAIM": 1.0,
"eval_f1_L13_MISSING_DISCLOSURES": 1.0,
"eval_f1_L14_FAIR_BALANCE_VIOLATION": 0.987012987012987,
"eval_f1_L19_DECEPTIVE_PRICING": 1.0,
"eval_f1_L21_CONSUMER_LANGUAGE": 0.9863013698630136,
"eval_f1_L22_BODYBUILDING_CONTENT": 1.0,
"eval_f1_L23_META_HEALTH_KEYWORDS": 1.0,
"eval_f1_L24_COVER_CONTRADICTION": 0.9863013698630136,
"eval_f1_L25_MISSING_RESEARCH_ID": 1.0,
"eval_f1_L27_THCA_LEGALITY_CLAIM": 1.0,
"eval_f1_L28_CBD_DISEASE_CLAIM": 1.0,
"eval_f1_L31_COMPLIANT_RESEARCH": 1.0,
"eval_f1_L32_COMPLIANT_DISCLAIMER": 1.0,
"eval_f1_L33_COMPLIANT_MARKETING": 1.0,
"eval_runtime": 20.7913,
"eval_samples_per_second": 60.458,
"eval_steps_per_second": 3.8,
"epoch": 14.99
},
"optimized_thresholds": {
"L01_DISEASE_CLAIM": {
"threshold": 0.35,
"f1": 1.0,
"precision": 1.0,
"recall": 1.0,
"support": 53
},
"L02_STRUCTURE_FUNCTION": {
"threshold": 0.55,
"f1": 1.0,
"precision": 1.0,
"recall": 1.0,
"support": 91
},
"L03_UNSUBSTANTIATED_EFFICACY": {
"threshold": 0.15,
"f1": 0.9892,
"precision": 1.0,
"recall": 0.9787,
"support": 47
},
"L04_DRUG_COMPARISON": {
"threshold": 0.125,
"f1": 1.0,
"precision": 1.0,
"recall": 1.0,
"support": 112
},
"L05_DOSING_INSTRUCTIONS": {
"threshold": 0.05,
"f1": 0.9722,
"precision": 0.9459,
"recall": 1.0,
"support": 35
},
"L06_IMPLIED_HUMAN_USE": {
"threshold": 0.275,
"f1": 0.9744,
"precision": 0.9661,
"recall": 0.9828,
"support": 58
},
"L07_PHARMA_GRADE_CLAIM": {
"threshold": 0.375,
"f1": 1.0,
"precision": 1.0,
"recall": 1.0,
"support": 92
},
"L08_TESTIMONIAL_VIOLATION": {
"threshold": 0.25,
"f1": 1.0,
"precision": 1.0,
"recall": 1.0,
"support": 62
},
"L09_MISSING_DISCLAIMER": {
"threshold": 0.15,
"f1": 1.0,
"precision": 1.0,
"recall": 1.0,
"support": 88
},
"L10_MISLEADING_DISCLAIMER": {
"threshold": 0.5,
"f1": 1.0,
"precision": 1.0,
"recall": 1.0,
"support": 44
},
"L11_MISSING_COA": {
"threshold": 0.65,
"f1": 1.0,
"precision": 1.0,
"recall": 1.0,
"support": 114
},
"L12_FDA_FALSE_CLAIM": {
"threshold": 0.05,
"f1": 1.0,
"precision": 1.0,
"recall": 1.0,
"support": 24
},
"L13_MISSING_DISCLOSURES": {
"threshold": 0.075,
"f1": 1.0,
"precision": 1.0,
"recall": 1.0,
"support": 75
},
"L14_FAIR_BALANCE_VIOLATION": {
"threshold": 0.325,
"f1": 1.0,
"precision": 1.0,
"recall": 1.0,
"support": 30
},
"L19_DECEPTIVE_PRICING": {
"threshold": 0.05,
"f1": 1.0,
"precision": 1.0,
"recall": 1.0,
"support": 18
},
"L21_CONSUMER_LANGUAGE": {
"threshold": 0.075,
"f1": 0.9885,
"precision": 0.9773,
"recall": 1.0,
"support": 43
},
"L22_BODYBUILDING_CONTENT": {
"threshold": 0.075,
"f1": 1.0,
"precision": 1.0,
"recall": 1.0,
"support": 87
},
"L23_META_HEALTH_KEYWORDS": {
"threshold": 0.05,
"f1": 1.0,
"precision": 1.0,
"recall": 1.0,
"support": 24
},
"L24_COVER_CONTRADICTION": {
"threshold": 0.15,
"f1": 1.0,
"precision": 1.0,
"recall": 1.0,
"support": 39
},
"L25_MISSING_RESEARCH_ID": {
"threshold": 0.425,
"f1": 1.0,
"precision": 1.0,
"recall": 1.0,
"support": 27
},
"L27_THCA_LEGALITY_CLAIM": {
"threshold": 0.15,
"f1": 1.0,
"precision": 1.0,
"recall": 1.0,
"support": 28
},
"L28_CBD_DISEASE_CLAIM": {
"threshold": 0.175,
"f1": 1.0,
"precision": 1.0,
"recall": 1.0,
"support": 42
},
"L31_COMPLIANT_RESEARCH": {
"threshold": 0.4,
"f1": 1.0,
"precision": 1.0,
"recall": 1.0,
"support": 69
},
"L32_COMPLIANT_DISCLAIMER": {
"threshold": 0.3,
"f1": 1.0,
"precision": 1.0,
"recall": 1.0,
"support": 22
},
"L33_COMPLIANT_MARKETING": {
"threshold": 0.05,
"f1": 1.0,
"precision": 1.0,
"recall": 1.0,
"support": 20
}
},
"optimized_macro_f1": 0.997,
"training_time_minutes": 145.82
}