Spaces:

xavier-fuentes
/

text-classifier

Runtime error

App Files Files Community

xavier-fuentes commited on Feb 17

Commit

3ef75e6

verified ·

1 Parent(s): 6b7e476

Upload folder using huggingface_hub

Browse files

Files changed (3) hide show

README.md +30 -19
app.py +94 -7
requirements.txt +4 -3

README.md CHANGED Viewed

@@ -1,35 +1,46 @@
 ---
 title: Zero-Shot Text Classifier
 emoji: 🏷️
-colorFrom: indigo
-colorTo: blue
 sdk: gradio
-sdk_version: 5.14.0
 app_file: app.py
 pinned: false
 ---
 # Zero-Shot Text Classifier
-This Hugging Face Space performs zero-shot text classification with:
-- Model: `facebook/bart-large-mnli`
-- Task: classify input text against user-defined labels
-- Modes: single-label and multi-label
-- Extras: preset label sets, inference timing, long-text truncation handling
-## How to use
-1. Enter text in **Text to Classify**.
-2. Enter labels in **Candidate Labels** as comma-separated values.
-3. Toggle **Multi-label mode** when needed.
-4. Click **Classify** to see score bars and a summary.
-## Presets included
-- Sentiment: positive, negative, neutral
-- Topic: tech, business, sports, science, politics
-- Intent: question, statement, request, complaint
-- Tone: formal, casual, urgent, friendly
-Built by [Xavier Fuentes](https://huggingface.co/xavier-fuentes) @ [AI Enablement Academy](https://enablement.academy) | [Buy me a coffee ☕](https://ko-fi.com/xavierfuentes)

 ---
 title: Zero-Shot Text Classifier
 emoji: 🏷️
+colorFrom: blue
+colorTo: indigo
 sdk: gradio
+sdk_version: "5.33.0"
 app_file: app.py
 pinned: false
+license: apache-2.0
+short_description: Classify text into any custom categories with Qwen3-0.6B
 ---
 # Zero-Shot Text Classifier
+Classify any text into your own custom categories using **Qwen3-0.6B** with zero-shot instruction prompting.
+## Features
+- **Custom labels**: Define any categories you want
+- **Multi-label mode**: Allow multiple labels to apply simultaneously
+- **Preset label sets**: Quick-start with Sentiment, Topic, Intent, or Tone presets
+- **Fast inference**: ~200ms on GPU via ZeroGPU
+## Why Qwen3 over BART-MNLI?
+- Qwen3-0.6B is smaller (0.6B vs 0.4B) but more capable due to modern architecture
+- Handles multi-label classification natively via instruction prompting
+- Supports structured JSON output for downstream integration
+- Better accuracy on diverse classification tasks (not limited to NLI-style inference)
+## API Usage
+```python
+from gradio_client import Client
+client = Client("xavier-fuentes/text-classifier")
+result = client.predict(
+    text="The product quality is amazing but shipping was slow",
+    candidate_labels="positive, negative, mixed",
+    multi_label=False,
+    api_name="/run_classification"
+)
+```
+Built by [Xavier Fuentes](https://huggingface.co/xavier-fuentes) @ [AI Enablement Academy](https://enablement.academy)

app.py CHANGED Viewed

@@ -1,14 +1,21 @@
 import time
 from typing import List, Tuple
 import gradio as gr
 import spaces
-from transformers import pipeline
-MODEL_ID = "facebook/bart-large-mnli"
 MAX_TEXT_CHARS = 4000
-classifier = pipeline("zero-shot-classification", model=MODEL_ID)
 PRESET_LABELS = {
     "Sentiment": "positive, negative, neutral",
@@ -69,6 +76,52 @@ def apply_preset(preset_name: str) -> str:
     return PRESET_LABELS.get(preset_name, "")
 @spaces.GPU
 def run_classification(text: str, candidate_labels: str, multi_label: bool):
     clean_text, was_truncated = truncate_text(text)
@@ -79,11 +132,43 @@ def run_classification(text: str, candidate_labels: str, multi_label: bool):
     if len(labels) < 2:
         raise gr.Error("Please provide at least 2 labels, separated by commas.")
     start = time.perf_counter()
-    result = classifier(clean_text, candidate_labels=labels, multi_label=multi_label)
     elapsed = time.perf_counter() - start
-    sorted_pairs = sorted(zip(result["labels"], result["scores"]), key=lambda x: x[1], reverse=True)
     sorted_labels = [x[0] for x in sorted_pairs]
     sorted_scores = [x[1] for x in sorted_pairs]
@@ -99,8 +184,9 @@ def run_classification(text: str, candidate_labels: str, multi_label: bool):
     summary = (
         f"Top prediction: {top_label} ({top_score:.2f}%). "
         f"Mode: {'multi-label' if multi_label else 'single-label'}. "
-        f"Inference time: {elapsed:.3f} seconds.{truncation_note}"
     )
     return chart_html, summary
@@ -109,7 +195,8 @@ def run_classification(text: str, candidate_labels: str, multi_label: bool):
 with gr.Blocks(theme=gr.themes.Soft(), title="Zero-Shot Text Classifier") as demo:
     gr.Markdown("# Zero-Shot Text Classifier")
     gr.Markdown(
-        "Classify any text into custom labels using `facebook/bart-large-mnli` with zero-shot inference."
     )
     with gr.Row():

+import json
 import time
 from typing import List, Tuple
 import gradio as gr
 import spaces
+import torch
+from transformers import AutoModelForCausalLM, AutoTokenizer
+MODEL_ID = "Qwen/Qwen3-0.6B"
 MAX_TEXT_CHARS = 4000
+tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)
+model = AutoModelForCausalLM.from_pretrained(
+    MODEL_ID,
+    torch_dtype=torch.float16,
+    device_map="auto",
+)
 PRESET_LABELS = {
     "Sentiment": "positive, negative, neutral",
     return PRESET_LABELS.get(preset_name, "")
+def build_classification_prompt(text: str, labels: List[str], multi_label: bool) -> str:
+    labels_str = ", ".join(f'"{l}"' for l in labels)
+    mode_instruction = (
+        "Multiple labels can apply simultaneously. For each label, assign a confidence score between 0 and 1."
+        if multi_label
+        else "Choose the single best label. Assign confidence scores that sum to 1."
+    )
+    return (
+        f"Classify the following text into these categories: {labels_str}\n\n"
+        f"{mode_instruction}\n\n"
+        f"Text: \"{text}\"\n\n"
+        f"Respond with ONLY a JSON object mapping each label to its confidence score. "
+        f"Example: {{{', '.join(f'\"{l}\": 0.5' for l in labels[:2])}}}\n"
+        f"JSON:"
+    )
+def parse_scores(output: str, labels: List[str]) -> dict:
+    """Extract label scores from model output, with fallback parsing."""
+    # Try to find JSON in the output
+    output = output.strip()
+    # Find the first { and last }
+    start = output.find("{")
+    end = output.rfind("}")
+    if start != -1 and end != -1 and end > start:
+        json_str = output[start : end + 1]
+        try:
+            parsed = json.loads(json_str)
+            scores = {}
+            for label in labels:
+                # Try exact match, then case-insensitive
+                if label in parsed:
+                    scores[label] = float(parsed[label])
+                else:
+                    lower_map = {k.lower(): v for k, v in parsed.items()}
+                    scores[label] = float(lower_map.get(label.lower(), 0.0))
+            return scores
+        except (json.JSONDecodeError, ValueError):
+            pass
+    # Fallback: equal scores
+    return {label: 1.0 / len(labels) for label in labels}
 @spaces.GPU
 def run_classification(text: str, candidate_labels: str, multi_label: bool):
     clean_text, was_truncated = truncate_text(text)
     if len(labels) < 2:
         raise gr.Error("Please provide at least 2 labels, separated by commas.")
+    prompt = build_classification_prompt(clean_text, labels, multi_label)
+    messages = [
+        {"role": "system", "content": "You are a precise text classifier. Respond only with valid JSON."},
+        {"role": "user", "content": prompt},
+    ]
+    input_text = tokenizer.apply_chat_template(
+        messages, tokenize=False, add_generation_prompt=True,
+        enable_thinking=False,
+    )
     start = time.perf_counter()
+    inputs = tokenizer(input_text, return_tensors="pt").to(model.device)
+    with torch.no_grad():
+        outputs = model.generate(
+            **inputs,
+            max_new_tokens=256,
+            temperature=0.1,
+            do_sample=True,
+            top_p=0.9,
+        )
+    generated = tokenizer.decode(outputs[0][inputs["input_ids"].shape[1]:], skip_special_tokens=True)
     elapsed = time.perf_counter() - start
+    scores = parse_scores(generated, labels)
+    # Normalize scores
+    total = sum(scores.values())
+    if total > 0:
+        scores = {k: v / total for k, v in scores.items()}
+    else:
+        scores = {k: 1.0 / len(labels) for k in labels}
+    sorted_pairs = sorted(scores.items(), key=lambda x: x[1], reverse=True)
     sorted_labels = [x[0] for x in sorted_pairs]
     sorted_scores = [x[1] for x in sorted_pairs]
     summary = (
         f"Top prediction: {top_label} ({top_score:.2f}%). "
+        f"Model: Qwen3-0.6B. "
         f"Mode: {'multi-label' if multi_label else 'single-label'}. "
+        f"Inference time: {elapsed:.3f}s.{truncation_note}"
     )
     return chart_html, summary
 with gr.Blocks(theme=gr.themes.Soft(), title="Zero-Shot Text Classifier") as demo:
     gr.Markdown("# Zero-Shot Text Classifier")
     gr.Markdown(
+        "Classify any text into custom labels using **Qwen3-0.6B** with zero-shot instruction prompting. "
+        "No fine-tuning needed: define your own categories and classify instantly."
     )
     with gr.Row():

requirements.txt CHANGED Viewed

@@ -1,4 +1,5 @@
-gradio
-transformers
-torch
 accelerate

+gradio>=4.0
+transformers>=4.45.0
+torch>=2.0
 accelerate
+spaces