Image Classification
Transformers
Tibetan
tibetan
uchen
ume
script-classification
dinov3
fine-tuned
Eval Results (legacy)
Instructions to use openpecha/uchen-ume-classifier with libraries, inference providers, notebooks, and local apps. Follow these links to get started.
- Libraries
- Transformers
How to use openpecha/uchen-ume-classifier with Transformers:
# Use a pipeline as a high-level helper
from transformers import pipeline

pipe = pipeline("image-classification", model="openpecha/uchen-ume-classifier")
pipe("https://huggingface.co/datasets/huggingface/documentation-images/resolve/main/hub/parrots.png")

# Load model directly
from transformers import AutoModel

model = AutoModel.from_pretrained("openpecha/uchen-ume-classifier", dtype="auto")
- Notebooks
- Google Colab
- Kaggle
Add test confusion matrices (JSON + PNG) for all variants
Browse files
- README.md +9 -6
- center_crop_all/confusion_matrix.json +30 -0
- center_crop_all/confusion_matrix.png +0 -0
- center_crop_all/results.json +11 -1
- with_preprocess/confusion_matrix.json +24 -0
- with_preprocess/confusion_matrix.png +0 -0
- with_preprocess/results.json +12 -2
- without_preprocess/confusion_matrix.json +24 -0
- without_preprocess/confusion_matrix.png +0 -0
- without_preprocess/results.json +12 -2
README.md
CHANGED
|
@@ -164,17 +164,20 @@ python inference_uchen_ume.py \
|
|
| 164 |
## Repo layout
|
| 165 |
|
| 166 |
```
|
| 167 |
-
center_crop_all/ ←
|
| 168 |
final_model.pt
|
| 169 |
model_card.json
|
| 170 |
-
results.json
|
| 171 |
-
|
|
|
|
|
|
|
| 172 |
final_model.pt
|
| 173 |
model_card.json
|
| 174 |
results.json
|
| 175 |
-
|
| 176 |
-
|
| 177 |
-
|
|
|
|
| 178 |
...
|
| 179 |
```
|
| 180 |
|
|
|
|
| 164 |
## Repo layout
|
| 165 |
|
| 166 |
```
|
| 167 |
+
center_crop_all/ ← center_crop_whole_page at inference (~99% test)
|
| 168 |
final_model.pt
|
| 169 |
model_card.json
|
| 170 |
+
results.json ← includes confusion_matrix
|
| 171 |
+
confusion_matrix.json
|
| 172 |
+
confusion_matrix.png
|
| 173 |
+
without_preprocess/ ← full pages (~81% test, ~85% benchmark)
|
| 174 |
final_model.pt
|
| 175 |
model_card.json
|
| 176 |
results.json
|
| 177 |
+
confusion_matrix.json
|
| 178 |
+
confusion_matrix.png
|
| 179 |
+
benchmark_eval_results.json ← benchmark CM in JSON
|
| 180 |
+
with_preprocess/ ← legacy mismatch — do not use
|
| 181 |
...
|
| 182 |
```
|
| 183 |
|
center_crop_all/confusion_matrix.json
ADDED
|
@@ -0,0 +1,30 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"split": "test",
|
| 3 |
+
"labels": [
|
| 4 |
+
"uchen",
|
| 5 |
+
"ume"
|
| 6 |
+
],
|
| 7 |
+
"matrix": [
|
| 8 |
+
[
|
| 9 |
+
94,
|
| 10 |
+
3
|
| 11 |
+
],
|
| 12 |
+
[
|
| 13 |
+
3,
|
| 14 |
+
751
|
| 15 |
+
]
|
| 16 |
+
],
|
| 17 |
+
"test_metrics": {
|
| 18 |
+
"loss": 0.032431522018710204,
|
| 19 |
+
"accuracy": 0.9929494712103408,
|
| 20 |
+
"macro_f1": 0.9825466925538024,
|
| 21 |
+
"weighted_f1": 0.9929494712103408,
|
| 22 |
+
"auc_roc": 0.9996991987749186
|
| 23 |
+
},
|
| 24 |
+
"preprocess": {
|
| 25 |
+
"train": "center_crop_whole_page",
|
| 26 |
+
"val": "center_crop_whole_page",
|
| 27 |
+
"test": "center_crop_whole_page",
|
| 28 |
+
"size": 224
|
| 29 |
+
}
|
| 30 |
+
}
|
center_crop_all/confusion_matrix.png
ADDED
|
center_crop_all/results.json
CHANGED
|
@@ -16,5 +16,15 @@
|
|
| 16 |
"test": "center_crop_whole_page",
|
| 17 |
"size": 224
|
| 18 |
},
|
| 19 |
-
"inference_note": "Use --preprocess center_crop_whole_page at inference (same as train/val/test)."
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 20 |
}
|
|
|
|
| 16 |
"test": "center_crop_whole_page",
|
| 17 |
"size": 224
|
| 18 |
},
|
| 19 |
+
"inference_note": "Use --preprocess center_crop_whole_page at inference (same as train/val/test).",
|
| 20 |
+
"confusion_matrix": [
|
| 21 |
+
[
|
| 22 |
+
94,
|
| 23 |
+
3
|
| 24 |
+
],
|
| 25 |
+
[
|
| 26 |
+
3,
|
| 27 |
+
751
|
| 28 |
+
]
|
| 29 |
+
]
|
| 30 |
}
|
with_preprocess/confusion_matrix.json
ADDED
|
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"split": "test",
|
| 3 |
+
"labels": [
|
| 4 |
+
"uchen",
|
| 5 |
+
"ume"
|
| 6 |
+
],
|
| 7 |
+
"matrix": [
|
| 8 |
+
[
|
| 9 |
+
99,
|
| 10 |
+
0
|
| 11 |
+
],
|
| 12 |
+
[
|
| 13 |
+
381,
|
| 14 |
+
387
|
| 15 |
+
]
|
| 16 |
+
],
|
| 17 |
+
"test_metrics": {
|
| 18 |
+
"loss": 1.5028612467717066,
|
| 19 |
+
"accuracy": 0.5605536332179931,
|
| 20 |
+
"macro_f1": 0.5060493910234842,
|
| 21 |
+
"weighted_f1": 0.6326582036211453,
|
| 22 |
+
"auc_roc": 0.9685921717171717
|
| 23 |
+
}
|
| 24 |
+
}
|
with_preprocess/confusion_matrix.png
ADDED
|
with_preprocess/results.json
CHANGED
|
@@ -13,5 +13,15 @@
|
|
| 13 |
"splits_file": "/root/script-classification-model-train/experiments/uchen_ume_binary/checkpoints/uchen_ume_whole_page/splits.json",
|
| 14 |
"skip_stage_c": false,
|
| 15 |
"stage_c_skip_reason": null,
|
| 16 |
-
"best_checkpoint": "best_stage_c_last_blocks.pt"
|
| 17 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 13 |
"splits_file": "/root/script-classification-model-train/experiments/uchen_ume_binary/checkpoints/uchen_ume_whole_page/splits.json",
|
| 14 |
"skip_stage_c": false,
|
| 15 |
"stage_c_skip_reason": null,
|
| 16 |
+
"best_checkpoint": "best_stage_c_last_blocks.pt",
|
| 17 |
+
"confusion_matrix": [
|
| 18 |
+
[
|
| 19 |
+
99,
|
| 20 |
+
0
|
| 21 |
+
],
|
| 22 |
+
[
|
| 23 |
+
381,
|
| 24 |
+
387
|
| 25 |
+
]
|
| 26 |
+
]
|
| 27 |
+
}
|
without_preprocess/confusion_matrix.json
ADDED
|
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"split": "test",
|
| 3 |
+
"labels": [
|
| 4 |
+
"uchen",
|
| 5 |
+
"ume"
|
| 6 |
+
],
|
| 7 |
+
"matrix": [
|
| 8 |
+
[
|
| 9 |
+
97,
|
| 10 |
+
2
|
| 11 |
+
],
|
| 12 |
+
[
|
| 13 |
+
165,
|
| 14 |
+
603
|
| 15 |
+
]
|
| 16 |
+
],
|
| 17 |
+
"test_metrics": {
|
| 18 |
+
"loss": 0.48820294297059763,
|
| 19 |
+
"accuracy": 0.8073817762399077,
|
| 20 |
+
"macro_f1": 0.7078823289680483,
|
| 21 |
+
"weighted_f1": 0.8394339697286689,
|
| 22 |
+
"auc_roc": 0.9698679503367003
|
| 23 |
+
}
|
| 24 |
+
}
|
without_preprocess/confusion_matrix.png
ADDED
|
without_preprocess/results.json
CHANGED
|
@@ -13,5 +13,15 @@
|
|
| 13 |
"splits_file": "/root/script-classification-model-train/experiments/uchen_ume_binary/checkpoints/uchen_ume_binary/splits.json",
|
| 14 |
"skip_stage_c": false,
|
| 15 |
"stage_c_skip_reason": null,
|
| 16 |
-
"best_checkpoint": "best_stage_c_last_blocks.pt"
|
| 17 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 13 |
"splits_file": "/root/script-classification-model-train/experiments/uchen_ume_binary/checkpoints/uchen_ume_binary/splits.json",
|
| 14 |
"skip_stage_c": false,
|
| 15 |
"stage_c_skip_reason": null,
|
| 16 |
+
"best_checkpoint": "best_stage_c_last_blocks.pt",
|
| 17 |
+
"confusion_matrix": [
|
| 18 |
+
[
|
| 19 |
+
97,
|
| 20 |
+
2
|
| 21 |
+
],
|
| 22 |
+
[
|
| 23 |
+
165,
|
| 24 |
+
603
|
| 25 |
+
]
|
| 26 |
+
]
|
| 27 |
+
}
|