karma689 committed on
Commit
a1548ee
·
verified ·
1 Parent(s): 35d5a7b

Add test confusion matrices (JSON + PNG) for all variants

Browse files
README.md CHANGED
@@ -164,17 +164,20 @@ python inference_uchen_ume.py \
164
  ## Repo layout
165
 
166
  ```
167
- center_crop_all/ ← use with center_crop_whole_page at inference (~99% test)
168
  final_model.pt
169
  model_card.json
170
- results.json
171
- without_preprocess/ ← use with preprocess none / full pages (~81% test)
 
 
172
  final_model.pt
173
  model_card.json
174
  results.json
175
- benchmark_eval_results.json
176
- with_preprocess/ ← legacy (train/val crop, test full page) — do not use
177
- final_model.pt
 
178
  ...
179
  ```
180
 
 
164
  ## Repo layout
165
 
166
  ```
167
+ center_crop_all/ ← center_crop_whole_page at inference (~99% test)
168
  final_model.pt
169
  model_card.json
170
+ results.json ← includes confusion_matrix
171
+ confusion_matrix.json
172
+ confusion_matrix.png
173
+ without_preprocess/ ← full pages (~81% test, ~85% benchmark)
174
  final_model.pt
175
  model_card.json
176
  results.json
177
+ confusion_matrix.json
178
+ confusion_matrix.png
179
+ benchmark_eval_results.json ← benchmark confusion matrix (JSON)
180
+ with_preprocess/ ← legacy preprocessing mismatch (train/val crop, test full page) — do not use
181
  ...
182
  ```
183
 
center_crop_all/confusion_matrix.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "split": "test",
3
+ "labels": [
4
+ "uchen",
5
+ "ume"
6
+ ],
7
+ "matrix": [
8
+ [
9
+ 94,
10
+ 3
11
+ ],
12
+ [
13
+ 3,
14
+ 751
15
+ ]
16
+ ],
17
+ "test_metrics": {
18
+ "loss": 0.032431522018710204,
19
+ "accuracy": 0.9929494712103408,
20
+ "macro_f1": 0.9825466925538024,
21
+ "weighted_f1": 0.9929494712103408,
22
+ "auc_roc": 0.9996991987749186
23
+ },
24
+ "preprocess": {
25
+ "train": "center_crop_whole_page",
26
+ "val": "center_crop_whole_page",
27
+ "test": "center_crop_whole_page",
28
+ "size": 224
29
+ }
30
+ }
center_crop_all/confusion_matrix.png ADDED
center_crop_all/results.json CHANGED
@@ -16,5 +16,15 @@
16
  "test": "center_crop_whole_page",
17
  "size": 224
18
  },
19
- "inference_note": "Use --preprocess center_crop_whole_page at inference (same as train/val/test)."
 
 
 
 
 
 
 
 
 
 
20
  }
 
16
  "test": "center_crop_whole_page",
17
  "size": 224
18
  },
19
+ "inference_note": "Use --preprocess center_crop_whole_page at inference (same as train/val/test).",
20
+ "confusion_matrix": [
21
+ [
22
+ 94,
23
+ 3
24
+ ],
25
+ [
26
+ 3,
27
+ 751
28
+ ]
29
+ ]
30
  }
with_preprocess/confusion_matrix.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "split": "test",
3
+ "labels": [
4
+ "uchen",
5
+ "ume"
6
+ ],
7
+ "matrix": [
8
+ [
9
+ 99,
10
+ 0
11
+ ],
12
+ [
13
+ 381,
14
+ 387
15
+ ]
16
+ ],
17
+ "test_metrics": {
18
+ "loss": 1.5028612467717066,
19
+ "accuracy": 0.5605536332179931,
20
+ "macro_f1": 0.5060493910234842,
21
+ "weighted_f1": 0.6326582036211453,
22
+ "auc_roc": 0.9685921717171717
23
+ }
24
+ }
with_preprocess/confusion_matrix.png ADDED
with_preprocess/results.json CHANGED
@@ -13,5 +13,15 @@
13
  "splits_file": "/root/script-classification-model-train/experiments/uchen_ume_binary/checkpoints/uchen_ume_whole_page/splits.json",
14
  "skip_stage_c": false,
15
  "stage_c_skip_reason": null,
16
- "best_checkpoint": "best_stage_c_last_blocks.pt"
17
- }
 
 
 
 
 
 
 
 
 
 
 
13
  "splits_file": "/root/script-classification-model-train/experiments/uchen_ume_binary/checkpoints/uchen_ume_whole_page/splits.json",
14
  "skip_stage_c": false,
15
  "stage_c_skip_reason": null,
16
+ "best_checkpoint": "best_stage_c_last_blocks.pt",
17
+ "confusion_matrix": [
18
+ [
19
+ 99,
20
+ 0
21
+ ],
22
+ [
23
+ 381,
24
+ 387
25
+ ]
26
+ ]
27
+ }
without_preprocess/confusion_matrix.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "split": "test",
3
+ "labels": [
4
+ "uchen",
5
+ "ume"
6
+ ],
7
+ "matrix": [
8
+ [
9
+ 97,
10
+ 2
11
+ ],
12
+ [
13
+ 165,
14
+ 603
15
+ ]
16
+ ],
17
+ "test_metrics": {
18
+ "loss": 0.48820294297059763,
19
+ "accuracy": 0.8073817762399077,
20
+ "macro_f1": 0.7078823289680483,
21
+ "weighted_f1": 0.8394339697286689,
22
+ "auc_roc": 0.9698679503367003
23
+ }
24
+ }
without_preprocess/confusion_matrix.png ADDED
without_preprocess/results.json CHANGED
@@ -13,5 +13,15 @@
13
  "splits_file": "/root/script-classification-model-train/experiments/uchen_ume_binary/checkpoints/uchen_ume_binary/splits.json",
14
  "skip_stage_c": false,
15
  "stage_c_skip_reason": null,
16
- "best_checkpoint": "best_stage_c_last_blocks.pt"
17
- }
 
 
 
 
 
 
 
 
 
 
 
13
  "splits_file": "/root/script-classification-model-train/experiments/uchen_ume_binary/checkpoints/uchen_ume_binary/splits.json",
14
  "skip_stage_c": false,
15
  "stage_c_skip_reason": null,
16
+ "best_checkpoint": "best_stage_c_last_blocks.pt",
17
+ "confusion_matrix": [
18
+ [
19
+ 97,
20
+ 2
21
+ ],
22
+ [
23
+ 165,
24
+ 603
25
+ ]
26
+ ]
27
+ }