Chhagan005 committed on
Commit
2677013
·
verified ·
1 Parent(s): 15fd926

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +10 -16
app.py CHANGED
@@ -6,7 +6,7 @@ Features:
6
  - 🖼️ Image Analysis (with Face Detection, Signature Extraction, Annotated Highlights)
7
  - 📚 Batch Processing
8
  - 💬 Chat with Attachments
9
- All 10 Qwen VL models available across all tabs.
10
  """
11
 
12
  import os
@@ -120,17 +120,9 @@ device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
120
  print(f"🚀 Using device: {device}")
121
 
122
  # ──────────────────────────────────────────────────────────────
123
- # ALL MODELS
124
  # ──────────────────────────────────────────────────────────────
125
  ALL_MODELS = [
126
- # ── Qwen3-VL Official ──
127
- "Qwen/Qwen3-VL-2B-Instruct",
128
- "Qwen/Qwen3-VL-4B-Instruct",
129
- "Qwen/Qwen3-VL-8B-Instruct",
130
- # ── Qwen2.5-VL Official ──
131
- "Qwen/Qwen2.5-VL-7B-Instruct",
132
- "Qwen/Qwen2.5-VL-3B-Instruct",
133
- # ── Custom Models ──
134
  "Chhagan005/Chhagan_ML-VL-OCR-v1", # Qwen2.5-VL-3B base
135
  "Chhagan005/Chhagan-DocVL-Qwen3", # Qwen3-VL-2B LoRA adapter
136
  "Chhagan005/CSM-DocExtract-VL", # Qwen3-VL-8B BNB INT4
@@ -240,9 +232,9 @@ def load_model(model_id: str):
240
  return processor, model
241
 
242
  # ──────────────────────────────────────────────────────────────
243
- # Pre-load default model
244
  # ──────────────────────────────────────────────────────────────
245
- DEFAULT_MODEL = "Qwen/Qwen3-VL-8B-Instruct"
246
  print(f"⏳ Pre-loading default model: {DEFAULT_MODEL}")
247
  load_model(DEFAULT_MODEL)
248
  print(f"βœ… Default model ready!")
@@ -596,7 +588,8 @@ with gr.Blocks(title="Chhagan's Multi-Model Studio") as demo:
596
 
597
  gr.Markdown("# 🧠 Chhagan's Multi-Model Studio", elem_id="app-title")
598
  gr.Markdown(
599
- "_Qwen3-VL + Qwen2.5-VL Official + Custom CSM/Chhagan VL models — "
 
600
  "Document Scanning • Image Analysis (Face + Signature) • Batch Processing • Chat_",
601
  elem_id="app-subtitle",
602
  )
@@ -604,7 +597,8 @@ with gr.Blocks(title="Chhagan's Multi-Model Studio") as demo:
604
  with gr.Row():
605
  model_choice = gr.Dropdown(choices=ALL_MODELS, value=DEFAULT_MODEL,
606
  label="🤖 Select Model",
607
- info="3 Qwen3-VL + 2 Qwen2.5-VL official + 5 custom CSM/Chhagan models",
 
608
  scale=3, elem_classes="model-selector")
609
 
610
  with gr.Accordion("⚙️ Advanced Generation Parameters", open=False):
@@ -712,8 +706,8 @@ with gr.Blocks(title="Chhagan's Multi-Model Studio") as demo:
712
  clear_btn.click(clear_fn, outputs=[chat_msg, chatbot], queue=False)
713
 
714
  gr.Markdown(
715
- "---\n**🧠 Chhagan's Multi-Model Studio** • 10 Models\n\n"
716
- "Qwen3-VL (2B/4B/8B) • Qwen2.5-VL (3B/7B) • "
717
  "CSM-DocExtract-VL (BNB-INT4) • CSM-DocExtract-VL-HF • "
718
  "CSM-DocExtract-VL-Q4KM-merged-fp16 • Chhagan_ML-VL-OCR-v1 • Chhagan-DocVL-Qwen3\n\n"
719
  "_Built with ❤️ using Gradio_"
 
6
  - 🖼️ Image Analysis (with Face Detection, Signature Extraction, Annotated Highlights)
7
  - 📚 Batch Processing
8
  - 💬 Chat with Attachments
9
+ All 5 Chhagan VL models available across all tabs.
10
  """
11
 
12
  import os
 
120
  print(f"🚀 Using device: {device}")
121
 
122
  # ──────────────────────────────────────────────────────────────
123
+ # ALL MODELS ←── CHANGE 1: Only Chhagan custom models remain
124
  # ──────────────────────────────────────────────────────────────
125
  ALL_MODELS = [
 
 
 
 
 
 
 
 
126
  "Chhagan005/Chhagan_ML-VL-OCR-v1", # Qwen2.5-VL-3B base
127
  "Chhagan005/Chhagan-DocVL-Qwen3", # Qwen3-VL-2B LoRA adapter
128
  "Chhagan005/CSM-DocExtract-VL", # Qwen3-VL-8B BNB INT4
 
232
  return processor, model
233
 
234
  # ──────────────────────────────────────────────────────────────
235
+ # Pre-load default model ←── CHANGE 2: New default model
236
  # ──────────────────────────────────────────────────────────────
237
+ DEFAULT_MODEL = "Chhagan005/CSM-DocExtract-VL-HF"
238
  print(f"⏳ Pre-loading default model: {DEFAULT_MODEL}")
239
  load_model(DEFAULT_MODEL)
240
  print(f"βœ… Default model ready!")
 
588
 
589
  gr.Markdown("# 🧠 Chhagan's Multi-Model Studio", elem_id="app-title")
590
  gr.Markdown(
591
+ # ←── CHANGE 3: Updated subtitle (removed Qwen official mention)
592
+ "_Custom CSM/Chhagan VL models — "
593
  "Document Scanning • Image Analysis (Face + Signature) • Batch Processing • Chat_",
594
  elem_id="app-subtitle",
595
  )
 
597
  with gr.Row():
598
  model_choice = gr.Dropdown(choices=ALL_MODELS, value=DEFAULT_MODEL,
599
  label="🤖 Select Model",
600
+ # ←── CHANGE 4: Updated info text
601
+ info="5 custom CSM/Chhagan models",
602
  scale=3, elem_classes="model-selector")
603
 
604
  with gr.Accordion("⚙️ Advanced Generation Parameters", open=False):
 
706
  clear_btn.click(clear_fn, outputs=[chat_msg, chatbot], queue=False)
707
 
708
  gr.Markdown(
709
+ # ←── CHANGE 5: Updated footer (removed Qwen official models, 10→5)
710
+ "---\n**🧠 Chhagan's Multi-Model Studio** • 5 Models\n\n"
711
  "CSM-DocExtract-VL (BNB-INT4) • CSM-DocExtract-VL-HF • "
712
  "CSM-DocExtract-VL-Q4KM-merged-fp16 • Chhagan_ML-VL-OCR-v1 • Chhagan-DocVL-Qwen3\n\n"
713
  "_Built with ❤️ using Gradio_"