Upload folder using huggingface_hub
Browse files- .gitattributes +2 -0
- 20260306_075806/analysis_bundle/cartography/summary.json +7 -0
- 20260306_075806/analysis_bundle/cartography/task1_cartography.csv +3 -0
- 20260306_075806/analysis_bundle/cartography/task1_cartography.png +3 -0
- 20260306_075806/analysis_bundle/metrics/metrics.jsonl +10 -0
- 20260306_075806/analysis_bundle/predictions/final_eval_predictions.csv +0 -0
- 20260306_075806/analysis_bundle/predictions/final_eval_predictions_evalonly.csv +0 -0
- 20260306_075806/analysis_bundle/summaries/final_eval_summary.csv +2 -0
- 20260306_075806/analysis_bundle/summaries/final_eval_summary_evalonly.csv +2 -0
- 20260306_075806/analysis_bundle/summaries/summary.json +54 -0
.gitattributes
CHANGED
|
@@ -56,3 +56,5 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 56 |
20260306_041307/analysis_bundle/cartography/task1_cartography.png filter=lfs diff=lfs merge=lfs -text
|
| 57 |
20260306_061847/analysis_bundle/cartography/task1_cartography.csv filter=lfs diff=lfs merge=lfs -text
|
| 58 |
20260306_061847/analysis_bundle/cartography/task1_cartography.png filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
| 56 |
20260306_041307/analysis_bundle/cartography/task1_cartography.png filter=lfs diff=lfs merge=lfs -text
|
| 57 |
20260306_061847/analysis_bundle/cartography/task1_cartography.csv filter=lfs diff=lfs merge=lfs -text
|
| 58 |
20260306_061847/analysis_bundle/cartography/task1_cartography.png filter=lfs diff=lfs merge=lfs -text
|
| 59 |
+
20260306_075806/analysis_bundle/cartography/task1_cartography.csv filter=lfs diff=lfs merge=lfs -text
|
| 60 |
+
20260306_075806/analysis_bundle/cartography/task1_cartography.png filter=lfs diff=lfs merge=lfs -text
|
20260306_075806/analysis_bundle/cartography/summary.json
ADDED
|
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"epochs": 10,
|
| 3 |
+
"task1_rows": 17206,
|
| 4 |
+
"task1_lowmean_threshold": 0.4644450329244137,
|
| 5 |
+
"task1_suspects": 87,
|
| 6 |
+
"plot_saved": true
|
| 7 |
+
}
|
20260306_075806/analysis_bundle/cartography/task1_cartography.csv
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:258cc6ec383a241a7fbee3f2da446afd18e4e2984781b5a3c4f4e040a75ea81f
|
| 3 |
+
size 62158824
|
20260306_075806/analysis_bundle/cartography/task1_cartography.png
ADDED
|
Git LFS Details
|
20260306_075806/analysis_bundle/metrics/metrics.jsonl
ADDED
|
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{"epoch": 1, "train_loss": 0.2456423486946462, "acc": 0.8306409588327254, "f1": 0.7757073844030365, "precision": 0.6422857142857142, "recall": 0.9790940766550522, "selection_score": 0.7312718613927899, "score": 0.7312718613927899}
|
| 2 |
+
{"epoch": 2, "train_loss": 0.14148816659520327, "acc": 0.8160500260552371, "f1": 0.7622895622895622, "precision": 0.6212952799121844, "recall": 0.9860627177700348, "selection_score": 0.7117365932894854, "score": 0.7117365932894854}
|
| 3 |
+
{"epoch": 3, "train_loss": 0.1116914390949844, "acc": 0.8593017196456487, "f1": 0.8029197080291971, "precision": 0.6909547738693468, "recall": 0.9581881533101045, "selection_score": 0.7747373052478493, "score": 0.7747373052478493}
|
| 4 |
+
{"epoch": 4, "train_loss": 0.09569636324150523, "acc": 0.8686816050026055, "f1": 0.812220566318927, "precision": 0.7096354166666666, "recall": 0.9494773519163763, "selection_score": 0.7908284850773382, "score": 0.7908284850773382}
|
| 5 |
+
{"epoch": 5, "train_loss": 0.08042041696331094, "acc": 0.8947368421052632, "f1": 0.8344262295081967, "precision": 0.7879256965944272, "recall": 0.8867595818815331, "selection_score": 0.779408967436277, "score": 0.779408967436277}
|
| 6 |
+
{"epoch": 6, "train_loss": 0.07593365665871414, "acc": 0.8879624804585722, "f1": 0.833976833976834, "precision": 0.7489597780859917, "recall": 0.9407665505226481, "selection_score": 0.8251962732421306, "score": 0.8251962732421306}
|
| 7 |
+
{"epoch": 7, "train_loss": 0.06676800747066182, "acc": 0.866597186034393, "f1": 0.8083832335329342, "precision": 0.7086614173228346, "recall": 0.9407665505226481, "selection_score": 0.7887743650996214, "score": 0.7887743650996214}
|
| 8 |
+
{"epoch": 8, "train_loss": 0.06473139765218842, "acc": 0.897342365815529, "f1": 0.8435266084193804, "precision": 0.7751824817518248, "recall": 0.9250871080139372, "selection_score": 0.8460137688641017, "score": 0.8460137688641017}
|
| 9 |
+
{"epoch": 9, "train_loss": 0.06107548705638009, "acc": 0.8900468994267848, "f1": 0.8357976653696498, "precision": 0.7552742616033755, "recall": 0.9355400696864111, "selection_score": 0.8300494485406781, "score": 0.8300494485406781}
|
| 10 |
+
{"epoch": 10, "train_loss": 0.061821550736723116, "acc": 0.8884835852006253, "f1": 0.8325508607198748, "precision": 0.7556818181818182, "recall": 0.926829268292683, "selection_score": 0.8290849462216833, "score": 0.8290849462216833}
|
20260306_075806/analysis_bundle/predictions/final_eval_predictions.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
20260306_075806/analysis_bundle/predictions/final_eval_predictions_evalonly.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
20260306_075806/analysis_bundle/summaries/final_eval_summary.csv
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
dataset,rows_evaluated,acc,f1,precision,recall,always_pick_acc,always_decline_acc
|
| 2 |
+
data_for_deberta/dedup_split/risk_test.csv,2879,0.8968391802709275,0.8354570637119113,0.7600806451612904,0.9274292742927429,0.28238971865230983,0.7176102813476901
|
20260306_075806/analysis_bundle/summaries/final_eval_summary_evalonly.csv
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
run_dir,model_path,dataset,rows_raw,rows_evaluated,acc,f1,precision,recall,always_pick_acc,always_decline_acc
|
| 2 |
+
outputs/task1_binary_runs/20260306_075806,outputs/task1_binary_runs/20260306_075806/best_model.pt,data_for_deberta/dedup_split/risk_test.csv,2879,2879,0.8968391802709275,0.8354570637119113,0.7600806451612904,0.9274292742927429,0.28238971865230983,0.7176102813476901
|
20260306_075806/analysis_bundle/summaries/summary.json
ADDED
|
@@ -0,0 +1,54 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"best_epoch": 8,
|
| 3 |
+
"best_score": 0.8460137688641017,
|
| 4 |
+
"best_selection_score": 0.8460137688641017,
|
| 5 |
+
"best_val_metrics_at_selection": {
|
| 6 |
+
"acc": 0.897342365815529,
|
| 7 |
+
"f1": 0.8435266084193804,
|
| 8 |
+
"precision": 0.7751824817518248,
|
| 9 |
+
"recall": 0.9250871080139372
|
| 10 |
+
},
|
| 11 |
+
"model_selection": {
|
| 12 |
+
"metric": "recall-floor-constrained-fbeta",
|
| 13 |
+
"beta": 0.5,
|
| 14 |
+
"recall_floor": 0.9,
|
| 15 |
+
"recall_floor_penalty": 2.0,
|
| 16 |
+
"acc_weight": 0.05
|
| 17 |
+
},
|
| 18 |
+
"data_provenance": {
|
| 19 |
+
"train_csv": {
|
| 20 |
+
"path": "data_for_deberta/Risk-only-pick/task1_risk_training_20260225.csv",
|
| 21 |
+
"sha256_16": "149b65cfd4785835",
|
| 22 |
+
"size_bytes": 61496472
|
| 23 |
+
},
|
| 24 |
+
"val_csv_source": {
|
| 25 |
+
"path": "data_for_deberta/dedup_split/risk_val.csv",
|
| 26 |
+
"sha256_16": "61c445d1558d1b34",
|
| 27 |
+
"size_bytes": 6044780
|
| 28 |
+
},
|
| 29 |
+
"final_eval_csv": {
|
| 30 |
+
"path": "data_for_deberta/dedup_split/risk_test.csv",
|
| 31 |
+
"sha256_16": "7bb9f6e80cd447ae",
|
| 32 |
+
"size_bytes": 9345127
|
| 33 |
+
}
|
| 34 |
+
},
|
| 35 |
+
"train_rows": 17206,
|
| 36 |
+
"val_rows": 1919,
|
| 37 |
+
"final_eval_rows": 2879,
|
| 38 |
+
"val_metrics": {
|
| 39 |
+
"acc": 0.897342365815529,
|
| 40 |
+
"f1": 0.8435266084193804,
|
| 41 |
+
"precision": 0.7751824817518248,
|
| 42 |
+
"recall": 0.9250871080139372
|
| 43 |
+
},
|
| 44 |
+
"final_eval_metrics": {
|
| 45 |
+
"acc": 0.8968391802709275,
|
| 46 |
+
"f1": 0.8354570637119113,
|
| 47 |
+
"precision": 0.7600806451612904,
|
| 48 |
+
"recall": 0.9274292742927429
|
| 49 |
+
},
|
| 50 |
+
"final_eval_baseline": {
|
| 51 |
+
"always_pick_acc": 0.28238971865230983,
|
| 52 |
+
"always_decline_acc": 0.7176102813476901
|
| 53 |
+
}
|
| 54 |
+
}
|