teru00801 commited on
Commit
011463c
·
verified ·
1 Parent(s): 3929110

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -40,3 +40,5 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
40
  20260222_175136/analysis_bundle/predictions/final_eval_predictions_evalonly.csv filter=lfs diff=lfs merge=lfs -text
41
  20260303_171212/analysis_bundle/cartography/task1_cartography.csv filter=lfs diff=lfs merge=lfs -text
42
  20260303_171212/analysis_bundle/cartography/task1_cartography.png filter=lfs diff=lfs merge=lfs -text
 
 
 
40
  20260222_175136/analysis_bundle/predictions/final_eval_predictions_evalonly.csv filter=lfs diff=lfs merge=lfs -text
41
  20260303_171212/analysis_bundle/cartography/task1_cartography.csv filter=lfs diff=lfs merge=lfs -text
42
  20260303_171212/analysis_bundle/cartography/task1_cartography.png filter=lfs diff=lfs merge=lfs -text
43
+ 20260305_115207/analysis_bundle/cartography/task1_cartography.csv filter=lfs diff=lfs merge=lfs -text
44
+ 20260305_115207/analysis_bundle/cartography/task1_cartography.png filter=lfs diff=lfs merge=lfs -text
20260305_115207/analysis_bundle/cartography/summary.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "epochs": 4,
3
+ "task1_rows": 17214,
4
+ "task1_lowmean_threshold": 0.0,
5
+ "task1_suspects": 643,
6
+ "plot_saved": true
7
+ }
20260305_115207/analysis_bundle/cartography/task1_cartography.csv ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb0240821f2b237482623102f47a3c0119de1193dd75778327ab54d50e9d12c7
3
+ size 62147661
20260305_115207/analysis_bundle/cartography/task1_cartography.png ADDED

Git LFS Details

  • SHA256: ca7403037e0b708add4083aa67635f2b893dccc2bc80eabc2bc789ee1e9f43e6
  • Pointer size: 131 Bytes
  • Size of remote file: 326 kB
20260305_115207/analysis_bundle/metrics/metrics.jsonl ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ {"epoch": 1, "train_loss": 0.2580397548707943, "acc": 0.8842544316996872, "f1": 0.8362831858407079, "precision": 0.7490092470277411, "recall": 0.9465776293823038, "selection_score": 0.8258504387065724, "score": 0.8258504387065724}
2
+ {"epoch": 2, "train_loss": 0.13849756630920013, "acc": 0.90563086548488, "f1": 0.8571428571428571, "precision": 0.812874251497006, "recall": 0.9065108514190318, "selection_score": 0.8753029434576742, "score": 0.8753029434576742}
3
+ {"epoch": 3, "train_loss": 0.10975362556436026, "acc": 0.8795620437956204, "f1": 0.8339324227174695, "precision": 0.7323232323232324, "recall": 0.9682804674457429, "selection_score": 0.8138214788821092, "score": 0.8138214788821092}
4
+ {"epoch": 4, "train_loss": 0.08633500159645391, "acc": 0.8847758081334723, "f1": 0.8395061728395061, "precision": 0.7429305912596401, "recall": 0.9649415692821369, "selection_score": 0.8230046217189885, "score": 0.8230046217189885}
20260305_115207/analysis_bundle/predictions/final_eval_predictions.csv ADDED
The diff for this file is too large to render. See raw diff
 
20260305_115207/analysis_bundle/predictions/final_eval_predictions_evalonly.csv ADDED
The diff for this file is too large to render. See raw diff
 
20260305_115207/analysis_bundle/summaries/final_eval_summary.csv ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ dataset,rows_evaluated,acc,f1,precision,recall,always_pick_acc,always_decline_acc
2
+ data_for_deberta/dedup_split/risk_test.csv,2879,0.8982285515804098,0.8418780356179169,0.8024691358024691,0.8853575482406356,0.3060090309135116,0.6939909690864884
20260305_115207/analysis_bundle/summaries/final_eval_summary_evalonly.csv ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ run_dir,model_path,dataset,rows_raw,rows_evaluated,acc,f1,precision,recall,always_pick_acc,always_decline_acc
2
+ outputs/task1_binary_runs/20260305_115207,outputs/task1_binary_runs/20260305_115207/best_model.pt,data_for_deberta/dedup_split/risk_test.csv,2879,2879,0.8982285515804098,0.8418780356179169,0.8024691358024691,0.8853575482406356,0.3060090309135116,0.6939909690864884
20260305_115207/analysis_bundle/summaries/summary.json ADDED
@@ -0,0 +1,54 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 2,
3
+ "best_score": 0.8753029434576742,
4
+ "best_selection_score": 0.8753029434576742,
5
+ "best_val_metrics_at_selection": {
6
+ "acc": 0.90563086548488,
7
+ "f1": 0.8571428571428571,
8
+ "precision": 0.812874251497006,
9
+ "recall": 0.9065108514190318
10
+ },
11
+ "model_selection": {
12
+ "metric": "recall-floor-constrained-fbeta",
13
+ "beta": 0.5,
14
+ "recall_floor": 0.9,
15
+ "recall_floor_penalty": 2.0,
16
+ "acc_weight": 0.05
17
+ },
18
+ "data_provenance": {
19
+ "train_csv": {
20
+ "path": "data_for_deberta/Risk-only-pick/task1_risk_training_20260225.csv",
21
+ "sha256_16": "e8a3504a9b457cce",
22
+ "size_bytes": 61519951
23
+ },
24
+ "val_csv_source": {
25
+ "path": "data_for_deberta/dedup_split/risk_val.csv",
26
+ "sha256_16": "5a878fcd1d1713be",
27
+ "size_bytes": 6146696
28
+ },
29
+ "final_eval_csv": {
30
+ "path": "data_for_deberta/dedup_split/risk_test.csv",
31
+ "sha256_16": "1aa054c802b71ee8",
32
+ "size_bytes": 9140917
33
+ }
34
+ },
35
+ "train_rows": 17214,
36
+ "val_rows": 1918,
37
+ "final_eval_rows": 2879,
38
+ "val_metrics": {
39
+ "acc": 0.90563086548488,
40
+ "f1": 0.8571428571428571,
41
+ "precision": 0.812874251497006,
42
+ "recall": 0.9065108514190318
43
+ },
44
+ "final_eval_metrics": {
45
+ "acc": 0.8982285515804098,
46
+ "f1": 0.8418780356179169,
47
+ "precision": 0.8024691358024691,
48
+ "recall": 0.8853575482406356
49
+ },
50
+ "final_eval_baseline": {
51
+ "always_pick_acc": 0.3060090309135116,
52
+ "always_decline_acc": 0.6939909690864884
53
+ }
54
+ }