teru00801 committed on
Commit
1edbbfe
·
verified ·
1 Parent(s): 682602c

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -48,3 +48,5 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
48
  20260305_143247/analysis_bundle/cartography/task1_cartography.png filter=lfs diff=lfs merge=lfs -text
49
  20260305_160843/analysis_bundle/cartography/task1_cartography.csv filter=lfs diff=lfs merge=lfs -text
50
  20260305_160843/analysis_bundle/cartography/task1_cartography.png filter=lfs diff=lfs merge=lfs -text
 
 
 
48
  20260305_143247/analysis_bundle/cartography/task1_cartography.png filter=lfs diff=lfs merge=lfs -text
49
  20260305_160843/analysis_bundle/cartography/task1_cartography.csv filter=lfs diff=lfs merge=lfs -text
50
  20260305_160843/analysis_bundle/cartography/task1_cartography.png filter=lfs diff=lfs merge=lfs -text
51
+ 20260305_234210/analysis_bundle/cartography/task1_cartography.csv filter=lfs diff=lfs merge=lfs -text
52
+ 20260305_234210/analysis_bundle/cartography/task1_cartography.png filter=lfs diff=lfs merge=lfs -text
20260305_234210/analysis_bundle/cartography/summary.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "epochs": 9,
3
+ "task1_rows": 17206,
4
+ "task1_lowmean_threshold": 0.3295763455331326,
5
+ "task1_suspects": 87,
6
+ "plot_saved": true
7
+ }
20260305_234210/analysis_bundle/cartography/task1_cartography.csv ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3421cfaaf9514f5491d2bd876b14279ceca1789a5a83fe9cd0b5797eb2baa7f0
3
+ size 62157379
20260305_234210/analysis_bundle/cartography/task1_cartography.png ADDED

Git LFS Details

  • SHA256: 9bb8f833100b369e2edf0d187e10da7b439b803d4afd38593953aac1704b77ef
  • Pointer size: 131 Bytes
  • Size of remote file: 256 kB
20260305_234210/analysis_bundle/metrics/metrics.jsonl ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {"epoch": 1, "train_loss": 0.2504281156755236, "acc": 0.8280354351224596, "f1": 0.7730398899587345, "precision": 0.6386363636363637, "recall": 0.9790940766550522, "selection_score": 0.727772069753192, "score": 0.727772069753192}
2
+ {"epoch": 2, "train_loss": 0.13862331558822144, "acc": 0.8400208441896821, "f1": 0.7860627177700349, "precision": 0.6550522648083623, "recall": 0.9825783972125436, "selection_score": 0.7438427545041579, "score": 0.7438427545041579}
3
+ {"epoch": 3, "train_loss": 0.10752340027072284, "acc": 0.8264721208963002, "f1": 0.7708189951823813, "precision": 0.6370875995449374, "recall": 0.975609756097561, "selection_score": 0.72592018306193, "score": 0.72592018306193}
4
+ {"epoch": 4, "train_loss": 0.09520636254152955, "acc": 0.8759770713913496, "f1": 0.8218562874251497, "precision": 0.7204724409448819, "recall": 0.9564459930313589, "selection_score": 0.801667434464101, "score": 0.801667434464101}
5
+ {"epoch": 5, "train_loss": 0.08266666641313458, "acc": 0.883793642522147, "f1": 0.8316981132075472, "precision": 0.7336884154460719, "recall": 0.9599303135888502, "selection_score": 0.8141729129813338, "score": 0.8141729129813338}
6
+ {"epoch": 6, "train_loss": 0.07137370736210098, "acc": 0.8806670140698281, "f1": 0.8279489105935387, "precision": 0.7278731836195509, "recall": 0.9599303135888502, "selection_score": 0.8088862102259788, "score": 0.8088862102259788}
7
+ {"epoch": 7, "train_loss": 0.0684460368748325, "acc": 0.8895257946847316, "f1": 0.8354037267080745, "precision": 0.7535014005602241, "recall": 0.9372822299651568, "selection_score": 0.8287328495010005, "score": 0.8287328495010005}
8
+ {"epoch": 8, "train_loss": 0.0679263743298426, "acc": 0.8712871287128713, "f1": 0.8177121771217712, "precision": 0.7093469910371318, "recall": 0.9651567944250871, "selection_score": 0.7926178988910249, "score": 0.7926178988910249}
9
+ {"epoch": 9, "train_loss": 0.06160068674684679, "acc": 0.8884835852006253, "f1": 0.8348765432098766, "precision": 0.7493074792243767, "recall": 0.9425087108013938, "selection_score": 0.8257644450023767, "score": 0.8257644450023767}
20260305_234210/analysis_bundle/predictions/final_eval_predictions.csv ADDED
The diff for this file is too large to render. See raw diff
 
20260305_234210/analysis_bundle/predictions/final_eval_predictions_evalonly.csv ADDED
The diff for this file is too large to render. See raw diff
 
20260305_234210/analysis_bundle/summaries/final_eval_summary.csv ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ dataset,rows_evaluated,acc,f1,precision,recall,always_pick_acc,always_decline_acc
2
+ data_for_deberta/dedup_split/risk_test.csv,2879,0.8912816950329976,0.831266846361186,0.7399232245681382,0.948339483394834,0.28238971865230983,0.7176102813476901
20260305_234210/analysis_bundle/summaries/final_eval_summary_evalonly.csv ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ run_dir,model_path,dataset,rows_raw,rows_evaluated,acc,f1,precision,recall,always_pick_acc,always_decline_acc
2
+ outputs/task1_binary_runs/20260305_234210,outputs/task1_binary_runs/20260305_234210/best_model.pt,data_for_deberta/dedup_split/risk_test.csv,2879,2879,0.8912816950329976,0.831266846361186,0.7399232245681382,0.948339483394834,0.28238971865230983,0.7176102813476901
20260305_234210/analysis_bundle/summaries/summary.json ADDED
@@ -0,0 +1,54 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 7,
3
+ "best_score": 0.8287328495010005,
4
+ "best_selection_score": 0.8287328495010005,
5
+ "best_val_metrics_at_selection": {
6
+ "acc": 0.8895257946847316,
7
+ "f1": 0.8354037267080745,
8
+ "precision": 0.7535014005602241,
9
+ "recall": 0.9372822299651568
10
+ },
11
+ "model_selection": {
12
+ "metric": "recall-floor-constrained-fbeta",
13
+ "beta": 0.5,
14
+ "recall_floor": 0.9,
15
+ "recall_floor_penalty": 2.0,
16
+ "acc_weight": 0.05
17
+ },
18
+ "data_provenance": {
19
+ "train_csv": {
20
+ "path": "data_for_deberta/Risk-only-pick/task1_risk_training_20260225.csv",
21
+ "sha256_16": "149b65cfd4785835",
22
+ "size_bytes": 61496472
23
+ },
24
+ "val_csv_source": {
25
+ "path": "data_for_deberta/dedup_split/risk_val.csv",
26
+ "sha256_16": "61c445d1558d1b34",
27
+ "size_bytes": 6044780
28
+ },
29
+ "final_eval_csv": {
30
+ "path": "data_for_deberta/dedup_split/risk_test.csv",
31
+ "sha256_16": "7bb9f6e80cd447ae",
32
+ "size_bytes": 9345127
33
+ }
34
+ },
35
+ "train_rows": 17206,
36
+ "val_rows": 1919,
37
+ "final_eval_rows": 2879,
38
+ "val_metrics": {
39
+ "acc": 0.8895257946847316,
40
+ "f1": 0.8354037267080745,
41
+ "precision": 0.7535014005602241,
42
+ "recall": 0.9372822299651568
43
+ },
44
+ "final_eval_metrics": {
45
+ "acc": 0.8912816950329976,
46
+ "f1": 0.831266846361186,
47
+ "precision": 0.7399232245681382,
48
+ "recall": 0.948339483394834
49
+ },
50
+ "final_eval_baseline": {
51
+ "always_pick_acc": 0.28238971865230983,
52
+ "always_decline_acc": 0.7176102813476901
53
+ }
54
+ }