Spaces:
Runtime error
Runtime error
Update app.py
Browse files
app.py
CHANGED
|
@@ -6,7 +6,7 @@ Features:
|
|
| 6 |
- 🖼️ Image Analysis (with Face Detection, Signature Extraction, Annotated Highlights)
|
| 7 |
- π Batch Processing
|
| 8 |
- 💬 Chat with Attachments
|
| 9 |
-
All
|
| 10 |
"""
|
| 11 |
|
| 12 |
import os
|
|
@@ -120,17 +120,9 @@ device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
|
|
| 120 |
print(f"π Using device: {device}")
|
| 121 |
|
| 122 |
# ββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββ
|
| 123 |
-
# ALL MODELS
|
| 124 |
# ββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββ
|
| 125 |
ALL_MODELS = [
|
| 126 |
-
# ββ Qwen3-VL Official ββ
|
| 127 |
-
"Qwen/Qwen3-VL-2B-Instruct",
|
| 128 |
-
"Qwen/Qwen3-VL-4B-Instruct",
|
| 129 |
-
"Qwen/Qwen3-VL-8B-Instruct",
|
| 130 |
-
# ββ Qwen2.5-VL Official ββ
|
| 131 |
-
"Qwen/Qwen2.5-VL-7B-Instruct",
|
| 132 |
-
"Qwen/Qwen2.5-VL-3B-Instruct",
|
| 133 |
-
# ββ Custom Models ββ
|
| 134 |
"Chhagan005/Chhagan_ML-VL-OCR-v1", # Qwen2.5-VL-3B base
|
| 135 |
"Chhagan005/Chhagan-DocVL-Qwen3", # Qwen3-VL-2B LoRA adapter
|
| 136 |
"Chhagan005/CSM-DocExtract-VL", # Qwen3-VL-8B BNB INT4
|
|
@@ -240,9 +232,9 @@ def load_model(model_id: str):
|
|
| 240 |
return processor, model
|
| 241 |
|
| 242 |
# ββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββ
|
| 243 |
-
# Pre-load default model
|
| 244 |
# ββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββ
|
| 245 |
-
DEFAULT_MODEL = "
|
| 246 |
print(f"⏳ Pre-loading default model: {DEFAULT_MODEL}")
|
| 247 |
load_model(DEFAULT_MODEL)
|
| 248 |
print(f"✅ Default model ready!")
|
|
@@ -596,7 +588,8 @@ with gr.Blocks(title="Chhagan's Multi-Model Studio") as demo:
|
|
| 596 |
|
| 597 |
gr.Markdown("# 🧠 Chhagan's Multi-Model Studio", elem_id="app-title")
|
| 598 |
gr.Markdown(
|
| 599 |
-
|
|
|
|
| 600 |
"Document Scanning • Image Analysis (Face + Signature) • Batch Processing • Chat_",
|
| 601 |
elem_id="app-subtitle",
|
| 602 |
)
|
|
@@ -604,7 +597,8 @@ with gr.Blocks(title="Chhagan's Multi-Model Studio") as demo:
|
|
| 604 |
with gr.Row():
|
| 605 |
model_choice = gr.Dropdown(choices=ALL_MODELS, value=DEFAULT_MODEL,
|
| 606 |
label="🤖 Select Model",
|
| 607 |
-
|
|
|
|
| 608 |
scale=3, elem_classes="model-selector")
|
| 609 |
|
| 610 |
with gr.Accordion("⚙️ Advanced Generation Parameters", open=False):
|
|
@@ -712,8 +706,8 @@ with gr.Blocks(title="Chhagan's Multi-Model Studio") as demo:
|
|
| 712 |
clear_btn.click(clear_fn, outputs=[chat_msg, chatbot], queue=False)
|
| 713 |
|
| 714 |
gr.Markdown(
|
| 715 |
-
|
| 716 |
-
"
|
| 717 |
"CSM-DocExtract-VL (BNB-INT4) • CSM-DocExtract-VL-HF • "
|
| 718 |
"CSM-DocExtract-VL-Q4KM-merged-fp16 • Chhagan_ML-VL-OCR-v1 • Chhagan-DocVL-Qwen3\n\n"
|
| 719 |
"_Built with ❤️ using Gradio_"
|
|
|
|
| 6 |
- 🖼️ Image Analysis (with Face Detection, Signature Extraction, Annotated Highlights)
|
| 7 |
- π Batch Processing
|
| 8 |
- 💬 Chat with Attachments
|
| 9 |
+
All 5 Chhagan VL models available across all tabs.
|
| 10 |
"""
|
| 11 |
|
| 12 |
import os
|
|
|
|
| 120 |
print(f"π Using device: {device}")
|
| 121 |
|
| 122 |
# ββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββ
|
| 123 |
+
# ALL MODELS βββ CHANGE 1: Only Chhagan custom models remain
|
| 124 |
# ββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββ
|
| 125 |
ALL_MODELS = [
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 126 |
"Chhagan005/Chhagan_ML-VL-OCR-v1", # Qwen2.5-VL-3B base
|
| 127 |
"Chhagan005/Chhagan-DocVL-Qwen3", # Qwen3-VL-2B LoRA adapter
|
| 128 |
"Chhagan005/CSM-DocExtract-VL", # Qwen3-VL-8B BNB INT4
|
|
|
|
| 232 |
return processor, model
|
| 233 |
|
| 234 |
# ββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββ
|
| 235 |
+
# Pre-load default model βββ CHANGE 2: New default model
|
| 236 |
# ββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββ
|
| 237 |
+
DEFAULT_MODEL = "Chhagan005/CSM-DocExtract-VL-HF"
|
| 238 |
print(f"⏳ Pre-loading default model: {DEFAULT_MODEL}")
|
| 239 |
load_model(DEFAULT_MODEL)
|
| 240 |
print(f"✅ Default model ready!")
|
|
|
|
| 588 |
|
| 589 |
gr.Markdown("# 🧠 Chhagan's Multi-Model Studio", elem_id="app-title")
|
| 590 |
gr.Markdown(
|
| 591 |
+
# βββ CHANGE 3: Updated subtitle (removed Qwen official mention)
|
| 592 |
+
"_Custom CSM/Chhagan VL models — "
|
| 593 |
"Document Scanning • Image Analysis (Face + Signature) • Batch Processing • Chat_",
|
| 594 |
elem_id="app-subtitle",
|
| 595 |
)
|
|
|
|
| 597 |
with gr.Row():
|
| 598 |
model_choice = gr.Dropdown(choices=ALL_MODELS, value=DEFAULT_MODEL,
|
| 599 |
label="🤖 Select Model",
|
| 600 |
+
# βββ CHANGE 4: Updated info text
|
| 601 |
+
info="5 custom CSM/Chhagan models",
|
| 602 |
scale=3, elem_classes="model-selector")
|
| 603 |
|
| 604 |
with gr.Accordion("⚙️ Advanced Generation Parameters", open=False):
|
|
|
|
| 706 |
clear_btn.click(clear_fn, outputs=[chat_msg, chatbot], queue=False)
|
| 707 |
|
| 708 |
gr.Markdown(
|
| 709 |
+
# ─── CHANGE 5: Updated footer (removed Qwen official models, 10→5)
|
| 710 |
+
"---\n**🧠 Chhagan's Multi-Model Studio** • 5 Models\n\n"
|
| 711 |
"CSM-DocExtract-VL (BNB-INT4) • CSM-DocExtract-VL-HF • "
|
| 712 |
"CSM-DocExtract-VL-Q4KM-merged-fp16 • Chhagan_ML-VL-OCR-v1 • Chhagan-DocVL-Qwen3\n\n"
|
| 713 |
"_Built with ❤️ using Gradio_"
|