Spaces:

Kratos7270
/

NLP-Hub

Sleeping

Manas

Recommit files with PNGs tracked by LFS

6124cbc about 1 month ago

31.6 kB

	"""
	NLP Hub - Flask backend serving HuggingFace transformer pipelines, PEFT/LoRA
	adapters, and scikit-learn (joblib) baselines.
	Models are lazy-loaded on first request to keep startup fast.
	"""

	from flask import Flask, render_template, request, jsonify
	import os
	import threading

	app = Flask(__name__)

	# ---------------------------------------------------------------------------
	# Model registry - each entry describes a HuggingFace pipeline config
	# ---------------------------------------------------------------------------
	# Dialect code -> Hub checkpoint id for the dialect-specific sentiment models.
	BESSTIE_MODELS = {
	    "en-IN": "vyshnav112233/BESSTIE-RoBERTa-en-IN-seed7",
	    "en-UK": "vyshnav112233/BESSTIE-RoBERTa-en-UK-seed7",
	    "en-AU": "vyshnav112233/BESSTIE-RoBERTa-en-AU-seed42",
	}

	# Dialect code -> Hub checkpoint id for the dialect-specific sarcasm RoBERTa models.
	SARCASM_LANG_MODELS = {
	    "en-IN": "vyshnav112233/roberta-sarcasm-en-IN-seed42",
	    "en-UK": "vyshnav112233/roberta-sarcasm-en-UK-seed42",
	    "en-AU": "vyshnav112233/roberta-sarcasm-en-AU-seed7",
	}

	# Dialect code -> Hub id of the LoRA sarcasm adapter for that dialect.
	TINYLLAMA_LORA_SARCASM_MODELS = {
	    "en-IN": "vyshnav112233/task2-3-lora-sarcasm-en-IN-seed-123",
	    "en-AU": "vyshnav112233/task2-3-lora-sarcasm-en-AU-seed-2024",
	    "en-UK": "vyshnav112233/task2-3-lora-sarcasm-en-UK-seed-42",
	}

	# Registry keys whose concrete checkpoint is chosen per request from a
	# dialect map instead of a single fixed model id.
	LANG_AWARE_MODELS = dict(
	    language_roberta=BESSTIE_MODELS,
	    language_roberta_sarcasm=SARCASM_LANG_MODELS,
	    tinyllama_lora_sarcasm=TINYLLAMA_LORA_SARCASM_MODELS,
	)

	# Registry keys shown on the home page, in display order.
	HOME_MODEL_KEYS = (
	    "roberta_sentiment",
	    "language_roberta",
	    "logreg_sarcasm",
	    "language_roberta_sarcasm",
	    "tinyllama_lora_sarcasm",
	)

	# Catalogue of every model the app can run, keyed by the id the API receives.
	#
	# Fields read by the Python code in this file:
	#   name         - label echoed back in inference results
	#   hf_task      - task string; selects the result-formatting branch and is
	#                  passed to transformers.pipeline() for plain HF models
	#   hf_model     - Hub id (or, for sklearn entries, a display path; the real
	#                  file path comes from SKLEARN_ARTIFACTS)
	#   task_group   - which page/API the entry belongs to ("home", "task1", ...)
	#   taskN_task   - sub-task ("sentiment" / "sarcasm") validated by /api/taskN/infer
	#   family       - echoed back in inference results ("" when absent)
	#   trained_on   - echoed back by the Task 2 / Task 3 APIs
	#   lora_adapter - True when hf_model is a PEFT adapter rather than a full model
	# The remaining fields (description, icon, display_badge) are not read here;
	# presumably they are consumed by the templates - verify against templates/.
	#
	# Checkpoint ids that also appear in the dialect maps are derived from those
	# maps so the id shown in the UI cannot drift from the one actually loaded.
	MODEL_REGISTRY = {
	    # ----- Entries listed in HOME_MODEL_KEYS ------------------------------
	    "roberta_sentiment": {
	        "name": "Task 1: RoBERTa",
	        "description": "Classifies text sentiment (positive / negative) using a fine-tuned RoBERTa model.",
	        "hf_task": "sentiment-analysis",
	        "hf_model": "vyshnav112233/roberta-base-sentiment",
	        "display_badge": "Simanta/roberta-base",
	        "icon": "fa-face-smile",
	        "task_group": "task1",
	        "task1_task": "sentiment",
	        "family": "ptlm",
	    },
	    "language_roberta": {
	        "name": "Task 2: RoBERTa-dialect",
	        "description": "Dialect-aware sentiment analysis fine-tuned on the BESSTIE dataset for Indian, British, and Australian English.",
	        "hf_task": "sentiment-analysis",
	        "hf_model": "; ".join(BESSTIE_MODELS.values()),
	        "display_badge": "Ryan/RoBERTa-en-IN-seed7; Ryan/RoBERTa-en-UK-seed7; Ryan/RoBERTa-en-AU-seed42",
	        "icon": "fa-brain",
	        "task_group": "home",
	    },
	    "logreg_sarcasm": {
	        "name": "Task 1: Logistic Regression",
	        "description": "TF-IDF (1-2 grams) + Logistic Regression baseline for sarcasm detection. Best macro-F1 among baselines in our benchmark.",
	        "hf_task": "sarcasm-detection",
	        "hf_model": "sklearn/logreg_sarcasm.joblib",
	        "display_badge": "Simanta/sklearn/logreg_sarcasm.joblib",
	        "icon": "fa-face-grin-squint-tears",
	        "task_group": "home",
	    },
	    "language_roberta_sarcasm": {
	        "name": "Task 2: RoBERTa-dialect",
	        "description": "Dialect-aware sarcasm detection fine-tuned on Indian, British, and Australian English RoBERTa checkpoints.",
	        "hf_task": "sentiment-analysis",
	        "hf_model": "; ".join(SARCASM_LANG_MODELS.values()),
	        "display_badge": "Ryan/RoBERTa-en-IN-seed42; Ryan/RoBERTa-en-UK-seed42; Ryan/RoBERTa-en-AU-seed7",
	        "icon": "fa-brain",
	        "task_group": "home",
	    },
	    "tinyllama_lora_sarcasm": {
	        "name": "Task 3: TinyLlama-1.1B Adapter",
	        "description": "Dialect-aware sarcasm detection using TinyLlama-1.1B with LoRA adapters fine-tuned on Indian, British, and Australian English.",
	        "hf_task": "sentiment-analysis",
	        "hf_model": "; ".join(TINYLLAMA_LORA_SARCASM_MODELS.values()),
	        "display_badge": "Omkar/LORA-en-IN-seed123; Omkar/LORA-en-AU-seed2024; Omkar/LORA-en-UK-seed42",
	        "icon": "fa-microchip",
	        "task_group": "home",
	    },
	    # ----- Task 1: sarcasm models -----------------------------------------
	    "lr_sarcasm": {
	        "name": "Logistic Regression",
	        "description": "TF-IDF + Logistic Regression baseline trained on Simanta's sarcasm labels.",
	        "hf_task": "sarcasm-detection",
	        "hf_model": "sklearn/lr_sarcasm.joblib",
	        "icon": "fa-chart-line",
	        "task_group": "task1",
	        "task1_task": "sarcasm",
	        "family": "classical",
	    },
	    "svm_sarcasm": {
	        "name": "Linear SVM",
	        "description": "TF-IDF + calibrated Linear SVM baseline for sarcasm detection.",
	        "hf_task": "sarcasm-detection",
	        "hf_model": "sklearn/svm_sarcasm.joblib",
	        "icon": "fa-vector-square",
	        "task_group": "task1",
	        "task1_task": "sarcasm",
	        "family": "classical",
	    },
	    "rf_sarcasm": {
	        "name": "Random Forest",
	        "description": "TF-IDF + Random Forest baseline for sarcasm detection.",
	        "hf_task": "sarcasm-detection",
	        "hf_model": "sklearn/rf_sarcasm.joblib",
	        "icon": "fa-tree",
	        "task_group": "task1",
	        "task1_task": "sarcasm",
	        "family": "classical",
	    },
	    "albert_sarcasm": {
	        "name": "ALBERT",
	        "description": "Fine-tuned ALBERT model for sarcasm detection.",
	        "hf_task": "sentiment-analysis",
	        "hf_model": "vyshnav112233/albert-base-v2-sarcasm",
	        "icon": "fa-layer-group",
	        "task_group": "task1",
	        "task1_task": "sarcasm",
	        "family": "ptlm",
	    },
	    "roberta_sarcasm": {
	        "name": "RoBERTa",
	        "description": "Fine-tuned RoBERTa model for sarcasm detection.",
	        "hf_task": "sentiment-analysis",
	        "hf_model": "vyshnav112233/roberta-base-sarcasm",
	        "icon": "fa-brain",
	        "task_group": "task1",
	        "task1_task": "sarcasm",
	        "family": "ptlm",
	    },
	    "distilbert_sarcasm": {
	        "name": "DistilBERT",
	        "description": "Fine-tuned DistilBERT model for sarcasm detection.",
	        "hf_task": "sentiment-analysis",
	        "hf_model": "vyshnav112233/distilbert-base-sarcasm",
	        "icon": "fa-bolt",
	        "task_group": "task1",
	        "task1_task": "sarcasm",
	        "family": "ptlm",
	    },
	    # ----- Task 1: sentiment models ---------------------------------------
	    "lr_sentiment": {
	        "name": "Logistic Regression",
	        "description": "TF-IDF + Logistic Regression baseline trained on Simanta's sentiment labels.",
	        "hf_task": "sentiment-analysis",
	        "hf_model": "sklearn/lr_sentiment.joblib",
	        "icon": "fa-chart-line",
	        "task_group": "task1",
	        "task1_task": "sentiment",
	        "family": "classical",
	    },
	    "svm_sentiment": {
	        "name": "Linear SVM",
	        "description": "TF-IDF + calibrated Linear SVM baseline for sentiment analysis.",
	        "hf_task": "sentiment-analysis",
	        "hf_model": "sklearn/svm_sentiment.joblib",
	        "icon": "fa-vector-square",
	        "task_group": "task1",
	        "task1_task": "sentiment",
	        "family": "classical",
	    },
	    "rf_sentiment": {
	        "name": "Random Forest",
	        "description": "TF-IDF + Random Forest baseline for sentiment analysis.",
	        "hf_task": "sentiment-analysis",
	        "hf_model": "sklearn/rf_sentiment.joblib",
	        "icon": "fa-tree",
	        "task_group": "task1",
	        "task1_task": "sentiment",
	        "family": "classical",
	    },
	    "albert_sentiment": {
	        "name": "ALBERT",
	        "description": "Fine-tuned ALBERT model for sentiment analysis.",
	        "hf_task": "sentiment-analysis",
	        "hf_model": "vyshnav112233/albert-base-v2-sentiment",
	        "icon": "fa-layer-group",
	        "task_group": "task1",
	        "task1_task": "sentiment",
	        "family": "ptlm",
	    },
	    "distilbert_sentiment": {
	        "name": "DistilBERT",
	        "description": "Fine-tuned DistilBERT model for sentiment analysis.",
	        "hf_task": "sentiment-analysis",
	        "hf_model": "vyshnav112233/distilbert-base-sentiment",
	        "icon": "fa-bolt",
	        "task_group": "task1",
	        "task1_task": "sentiment",
	        "family": "ptlm",
	    },
	    # ----- Task 2: per-dialect RoBERTa, sentiment -------------------------
	    "t2_sentiment_au": {
	        "name": "RoBERTa · Trained on en-AU",
	        "description": "RoBERTa-base fine-tuned only on Australian English BESSTIE sentiment data.",
	        "hf_task": "sentiment-analysis",
	        "hf_model": BESSTIE_MODELS["en-AU"],
	        "icon": "fa-brain",
	        "task_group": "task2",
	        "task2_task": "sentiment",
	        "trained_on": "en-AU",
	    },
	    "t2_sentiment_in": {
	        "name": "RoBERTa · Trained on en-IN",
	        "description": "RoBERTa-base fine-tuned only on Indian English BESSTIE sentiment data.",
	        "hf_task": "sentiment-analysis",
	        "hf_model": BESSTIE_MODELS["en-IN"],
	        "icon": "fa-brain",
	        "task_group": "task2",
	        "task2_task": "sentiment",
	        "trained_on": "en-IN",
	    },
	    "t2_sentiment_uk": {
	        "name": "RoBERTa · Trained on en-UK",
	        "description": "RoBERTa-base fine-tuned only on British English BESSTIE sentiment data.",
	        "hf_task": "sentiment-analysis",
	        "hf_model": BESSTIE_MODELS["en-UK"],
	        "icon": "fa-brain",
	        "task_group": "task2",
	        "task2_task": "sentiment",
	        "trained_on": "en-UK",
	    },
	    "t2_sentiment_mixed": {
	        "name": "RoBERTa · Trained on Mixed (all 3)",
	        "description": "RoBERTa-base fine-tuned on en-AU, en-IN, and en-UK BESSTIE sentiment data combined.",
	        "hf_task": "sentiment-analysis",
	        # Not part of any dialect map, so the id stays literal.
	        "hf_model": "vyshnav112233/BESSTIE-RoBERTa-mixed-seed123",
	        "icon": "fa-brain",
	        "task_group": "task2",
	        "task2_task": "sentiment",
	        "trained_on": "mixed",
	    },
	    # ----- Task 2: per-dialect RoBERTa, sarcasm ---------------------------
	    "t2_sarcasm_au": {
	        "name": "RoBERTa · Trained on en-AU",
	        "description": "RoBERTa-base fine-tuned only on Australian English BESSTIE sarcasm data.",
	        "hf_task": "sentiment-analysis",
	        "hf_model": SARCASM_LANG_MODELS["en-AU"],
	        "icon": "fa-brain",
	        "task_group": "task2",
	        "task2_task": "sarcasm",
	        "trained_on": "en-AU",
	    },
	    "t2_sarcasm_in": {
	        "name": "RoBERTa · Trained on en-IN",
	        "description": "RoBERTa-base fine-tuned only on Indian English BESSTIE sarcasm data.",
	        "hf_task": "sentiment-analysis",
	        "hf_model": SARCASM_LANG_MODELS["en-IN"],
	        "icon": "fa-brain",
	        "task_group": "task2",
	        "task2_task": "sarcasm",
	        "trained_on": "en-IN",
	    },
	    "t2_sarcasm_uk": {
	        "name": "RoBERTa · Trained on en-UK",
	        "description": "RoBERTa-base fine-tuned only on British English BESSTIE sarcasm data.",
	        "hf_task": "sentiment-analysis",
	        "hf_model": SARCASM_LANG_MODELS["en-UK"],
	        "icon": "fa-brain",
	        "task_group": "task2",
	        "task2_task": "sarcasm",
	        "trained_on": "en-UK",
	    },
	    # ----- Task 3: per-dialect TinyLlama LoRA adapters, sarcasm -----------
	    "t3_sarcasm_au": {
	        "name": "TinyLlama-LoRA · Trained on en-AU",
	        "description": "TinyLlama-1.1B-Chat with a LoRA adapter fine-tuned only on Australian English sarcasm data (seed 2024).",
	        "hf_task": "sentiment-analysis",
	        "hf_model": TINYLLAMA_LORA_SARCASM_MODELS["en-AU"],
	        "icon": "fa-microchip",
	        "task_group": "task3",
	        "task3_task": "sarcasm",
	        "trained_on": "en-AU",
	        "lora_adapter": True,
	    },
	    "t3_sarcasm_in": {
	        "name": "TinyLlama-LoRA · Trained on en-IN",
	        "description": "TinyLlama-1.1B-Chat with a LoRA adapter fine-tuned only on Indian English sarcasm data (seed 123).",
	        "hf_task": "sentiment-analysis",
	        "hf_model": TINYLLAMA_LORA_SARCASM_MODELS["en-IN"],
	        "icon": "fa-microchip",
	        "task_group": "task3",
	        "task3_task": "sarcasm",
	        "trained_on": "en-IN",
	        "lora_adapter": True,
	    },
	    "t3_sarcasm_uk": {
	        "name": "TinyLlama-LoRA · Trained on en-UK",
	        "description": "TinyLlama-1.1B-Chat with a LoRA adapter fine-tuned only on British English sarcasm data (seed 42).",
	        "hf_task": "sentiment-analysis",
	        "hf_model": TINYLLAMA_LORA_SARCASM_MODELS["en-UK"],
	        "icon": "fa-microchip",
	        "task_group": "task3",
	        "task3_task": "sarcasm",
	        "trained_on": "en-UK",
	        "lora_adapter": True,
	    },
	}

	# Registry key -> joblib file under models/ for every scikit-learn baseline.
	# Each artifact is named after its registry key, so the table is generated
	# from the key list; paths stay relative, exactly as before.
	SKLEARN_ARTIFACTS = {
	    stem: os.path.join("models", stem + ".joblib")
	    for stem in (
	        "logreg_sarcasm",
	        "lr_sarcasm",
	        "svm_sarcasm",
	        "rf_sarcasm",
	        "lr_sentiment",
	        "svm_sentiment",
	        "rf_sentiment",
	    )
	}

	# Static Task 1 evaluation table handed to task1.html as `eval_tables`.
	# Keyed by sub-task; each row is one model with its family and four metrics.
	# NOTE(review): in every row accuracy, precision, recall and macro_f1 carry
	# the same value - confirm these are real per-metric results and not one
	# number copied into all four columns.
	TASK1_EVAL = {
	"sentiment": [
	{"model": "SVM", "family": "Classical", "accuracy": 0.838, "precision": 0.838, "recall": 0.838, "macro_f1": 0.838},
	{"model": "Logistic Regression", "family": "Classical", "accuracy": 0.830, "precision": 0.830, "recall": 0.830, "macro_f1": 0.830},
	{"model": "Random Forest", "family": "Classical", "accuracy": 0.795, "precision": 0.795, "recall": 0.795, "macro_f1": 0.795},
	{"model": "RoBERTa", "family": "PTLM", "accuracy": 0.896, "precision": 0.896, "recall": 0.896, "macro_f1": 0.896},
	{"model": "DistilBERT", "family": "PTLM", "accuracy": 0.868, "precision": 0.868, "recall": 0.868, "macro_f1": 0.868},
	{"model": "ALBERT", "family": "PTLM", "accuracy": 0.865, "precision": 0.865, "recall": 0.865, "macro_f1": 0.865},
	],
	"sarcasm": [
	{"model": "Random Forest", "family": "Classical", "accuracy": 0.502, "precision": 0.502, "recall": 0.502, "macro_f1": 0.502},
	{"model": "SVM", "family": "Classical", "accuracy": 0.585, "precision": 0.585, "recall": 0.585, "macro_f1": 0.585},
	{"model": "Logistic Regression", "family": "Classical", "accuracy": 0.677, "precision": 0.677, "recall": 0.677, "macro_f1": 0.677},
	{"model": "RoBERTa", "family": "PTLM", "accuracy": 0.462, "precision": 0.462, "recall": 0.462, "macro_f1": 0.462},
	{"model": "DistilBERT", "family": "PTLM", "accuracy": 0.611, "precision": 0.611, "recall": 0.611, "macro_f1": 0.611},
	{"model": "ALBERT", "family": "PTLM", "accuracy": 0.462, "precision": 0.462, "recall": 0.462, "macro_f1": 0.462},
	],
	}

	# Static Task 2 evaluation table handed to task2.html as `eval_tables`.
	# Keyed by sub-task; each row is one (trained_on, tested_on) dialect pair with
	# macro F1, its standard deviation, macro precision and macro recall.
	# The sentiment table also has "mixed" training rows; the sarcasm table does not.
	# macro_f1_std is presumably the spread across training seeds - TODO confirm.
	TASK2_EVAL = {
	"sentiment": [
	{"trained_on": "en-AU", "tested_on": "en-AU", "macro_f1": 0.8941, "macro_f1_std": 0.0053, "macro_p": 0.8965, "macro_r": 0.8935},
	{"trained_on": "en-AU", "tested_on": "en-IN", "macro_f1": 0.8196, "macro_f1_std": 0.0203, "macro_p": 0.8250, "macro_r": 0.8228},
	{"trained_on": "en-AU", "tested_on": "en-UK", "macro_f1": 0.9437, "macro_f1_std": 0.0007, "macro_p": 0.9443, "macro_r": 0.9436},
	{"trained_on": "en-IN", "tested_on": "en-AU", "macro_f1": 0.8659, "macro_f1_std": 0.0047, "macro_p": 0.8737, "macro_r": 0.8654},
	{"trained_on": "en-IN", "tested_on": "en-IN", "macro_f1": 0.8409, "macro_f1_std": 0.0056, "macro_p": 0.8444, "macro_r": 0.8417},
	{"trained_on": "en-IN", "tested_on": "en-UK", "macro_f1": 0.9323, "macro_f1_std": 0.0040, "macro_p": 0.9328, "macro_r": 0.9325},
	{"trained_on": "en-UK", "tested_on": "en-AU", "macro_f1": 0.8761, "macro_f1_std": 0.0168, "macro_p": 0.8855, "macro_r": 0.8748},
	{"trained_on": "en-UK", "tested_on": "en-IN", "macro_f1": 0.8463, "macro_f1_std": 0.0008, "macro_p": 0.8467, "macro_r": 0.8463},
	{"trained_on": "en-UK", "tested_on": "en-UK", "macro_f1": 0.9471, "macro_f1_std": 0.0000, "macro_p": 0.9471, "macro_r": 0.9472},
	{"trained_on": "mixed", "tested_on": "en-AU", "macro_f1": 0.8910, "macro_f1_std": 0.0070, "macro_p": 0.8942, "macro_r": 0.8902},
	{"trained_on": "mixed", "tested_on": "en-IN", "macro_f1": 0.8449, "macro_f1_std": 0.0082, "macro_p": 0.8449, "macro_r": 0.8453},
	{"trained_on": "mixed", "tested_on": "en-UK", "macro_f1": 0.9523, "macro_f1_std": 0.0078, "macro_p": 0.9535, "macro_r": 0.9521},
	],
	"sarcasm": [
	{"trained_on": "en-AU", "tested_on": "en-AU", "macro_f1": 0.7570, "macro_f1_std": 0.0078, "macro_p": 0.7542, "macro_r": 0.7892},
	{"trained_on": "en-AU", "tested_on": "en-IN", "macro_f1": 0.4896, "macro_f1_std": 0.0170, "macro_p": 0.5531, "macro_r": 0.6991},
	{"trained_on": "en-AU", "tested_on": "en-UK", "macro_f1": 0.5822, "macro_f1_std": 0.0227, "macro_p": 0.6008, "macro_r": 0.8212},
	{"trained_on": "en-IN", "tested_on": "en-AU", "macro_f1": 0.4628, "macro_f1_std": 0.0617, "macro_p": 0.6261, "macro_r": 0.5228},
	{"trained_on": "en-IN", "tested_on": "en-IN", "macro_f1": 0.6044, "macro_f1_std": 0.0447, "macro_p": 0.6131, "macro_r": 0.6320},
	{"trained_on": "en-IN", "tested_on": "en-UK", "macro_f1": 0.5533, "macro_f1_std": 0.0902, "macro_p": 0.7034, "macro_r": 0.5617},
	{"trained_on": "en-UK", "tested_on": "en-AU", "macro_f1": 0.6058, "macro_f1_std": 0.0484, "macro_p": 0.6722, "macro_r": 0.6062},
	{"trained_on": "en-UK", "tested_on": "en-IN", "macro_f1": 0.5747, "macro_f1_std": 0.0166, "macro_p": 0.5772, "macro_r": 0.7117},
	{"trained_on": "en-UK", "tested_on": "en-UK", "macro_f1": 0.7025, "macro_f1_std": 0.0215, "macro_p": 0.7029, "macro_r": 0.7291},
	],
	}

	# Static Task 3 evaluation table handed to task3.html as `eval_tables`.
	# Only the "sarcasm" sub-task is present; each row is one
	# (trained_on, tested_on) dialect pair with macro F1, its standard deviation,
	# macro precision and macro recall.
	# macro_f1_std is presumably the spread across training seeds - TODO confirm.
	TASK3_EVAL = {
	"sarcasm": [
	{"trained_on": "en-AU", "tested_on": "en-AU", "macro_f1": 0.7603, "macro_f1_std": 0.0291, "macro_p": 0.7588, "macro_r": 0.7902},
	{"trained_on": "en-AU", "tested_on": "en-IN", "macro_f1": 0.5005, "macro_f1_std": 0.0240, "macro_p": 0.5531, "macro_r": 0.6915},
	{"trained_on": "en-AU", "tested_on": "en-UK", "macro_f1": 0.5805, "macro_f1_std": 0.0413, "macro_p": 0.6031, "macro_r": 0.8315},
	{"trained_on": "en-IN", "tested_on": "en-AU", "macro_f1": 0.5394, "macro_f1_std": 0.1054, "macro_p": 0.7578, "macro_r": 0.5669},
	{"trained_on": "en-IN", "tested_on": "en-IN", "macro_f1": 0.5964, "macro_f1_std": 0.0817, "macro_p": 0.7411, "macro_r": 0.6797},
	{"trained_on": "en-IN", "tested_on": "en-UK", "macro_f1": 0.6661, "macro_f1_std": 0.1357, "macro_p": 0.7979, "macro_r": 0.7001},
	{"trained_on": "en-UK", "tested_on": "en-AU", "macro_f1": 0.6003, "macro_f1_std": 0.0171, "macro_p": 0.6388, "macro_r": 0.5951},
	{"trained_on": "en-UK", "tested_on": "en-IN", "macro_f1": 0.6331, "macro_f1_std": 0.0253, "macro_p": 0.6132, "macro_r": 0.7935},
	{"trained_on": "en-UK", "tested_on": "en-UK", "macro_f1": 0.7724, "macro_f1_std": 0.0088, "macro_p": 0.7418, "macro_r": 0.8183},
	],
	}

	# Lazy-loaded pipeline cache
	# Maps the cache key built in get_pipeline() to the loaded model object, so a
	# model that has been loaded once is reused by later requests.
	_pipelines = {}
	# Held by get_pipeline() while it loads a model and writes it into _pipelines.
	_lock = threading.Lock()


	def _load_yes_no_lora(hf_model: str) -> dict:
	    """Load a PEFT causal-LM adapter plus tokenizer as a yes/no scoring bundle.

	    Args:
	        hf_model: Hub id of the PEFT adapter.

	    Returns:
	        A dict ``{"_yes_no_lora": True, "model": ..., "tokenizer": ...}``; the
	        ``_yes_no_lora`` flag is what the inference code checks to recognise
	        this bundle.
	    """
	    # Imported lazily so the heavy libraries are only pulled in when needed.
	    from peft import AutoPeftModelForCausalLM
	    from transformers import AutoTokenizer

	    print(f"[INFO] Loading PEFT causal-LM adapter: {hf_model} ...")
	    model = AutoPeftModelForCausalLM.from_pretrained(hf_model)
	    model.eval()
	    try:
	        tokenizer = AutoTokenizer.from_pretrained(hf_model)
	    except Exception:
	        # Deliberate best-effort: if the adapter id cannot provide a
	        # tokenizer, use the one belonging to the adapter's base model.
	        base_id = model.peft_config["default"].base_model_name_or_path
	        tokenizer = AutoTokenizer.from_pretrained(base_id)
	    if tokenizer.pad_token is None:
	        tokenizer.pad_token = tokenizer.eos_token
	    return {"_yes_no_lora": True, "model": model, "tokenizer": tokenizer}


	def get_pipeline(model_key: str, lang_code: "str | None" = None):
	    """Return the cached model object for ``model_key``, loading it on first use.

	    Args:
	        model_key: A key of MODEL_REGISTRY.
	        lang_code: Dialect code, used only for keys in LANG_AWARE_MODELS. A
	            missing or unknown code falls back to ``"en-UK"``.

	    Returns:
	        One of: a transformers pipeline, a joblib-loaded scikit-learn object
	        (keys in SKLEARN_ARTIFACTS), or the yes/no LoRA bundle dict produced
	        by ``_load_yes_no_lora``.

	    Raises:
	        KeyError: If ``model_key`` is not in MODEL_REGISTRY.
	    """
	    dialect_map = LANG_AWARE_MODELS.get(model_key)
	    if dialect_map is not None:
	        # Resolve the en-UK fallback *before* building the cache key so that
	        # None / unknown dialects share the en-UK entry instead of loading a
	        # second copy of the same checkpoint under a different key.
	        dialect = lang_code if lang_code in dialect_map else "en-UK"
	        cache_key = f"{model_key}:{dialect}"
	    else:
	        dialect = None
	        cache_key = model_key

	    # Fast path: already loaded, no need to take the lock.
	    if cache_key in _pipelines:
	        return _pipelines[cache_key]

	    with _lock:
	        # Re-check: another thread may have finished loading while we waited.
	        if cache_key in _pipelines:
	            return _pipelines[cache_key]

	        cfg = MODEL_REGISTRY[model_key]

	        if dialect_map is not None:
	            hf_model = dialect_map[dialect]
	            if model_key == "tinyllama_lora_sarcasm":
	                pipe = _load_yes_no_lora(hf_model)
	            else:
	                from transformers import pipeline

	                print(f"[INFO] Loading dialect-aware model: {hf_model} ...")
	                pipe = pipeline("sentiment-analysis", model=hf_model)
	        elif cfg.get("lora_adapter"):
	            pipe = _load_yes_no_lora(cfg["hf_model"])
	        elif model_key in SKLEARN_ARTIFACTS:
	            import joblib

	            artifact_path = SKLEARN_ARTIFACTS[model_key]
	            print(f"[INFO] Loading sklearn artifact: {artifact_path} ...")
	            # joblib.load unpickles the file: only safe because the path comes
	            # from the fixed SKLEARN_ARTIFACTS table, never from request data.
	            pipe = joblib.load(artifact_path)
	            if hasattr(pipe, "named_steps"):
	                # Pin the "clf" step (when it exposes n_jobs) to one worker.
	                clf = pipe.named_steps.get("clf")
	                if hasattr(clf, "n_jobs"):
	                    clf.n_jobs = 1
	        else:
	            from transformers import pipeline

	            print(f"[INFO] Loading model: {cfg['hf_model']} ...")
	            pipe = pipeline(cfg["hf_task"], model=cfg["hf_model"])

	        _pipelines[cache_key] = pipe
	        return pipe


	def _score_yes_no_lora(bundle: dict, text: str) -> dict:
	    """Score ``text`` as sarcastic or not with a yes/no LoRA bundle.

	    The model is prompted with a yes/no question and the next-token logits of
	    the first token of "Yes" and of "No" are compared with a two-way softmax.

	    Args:
	        bundle: Dict holding ``"model"`` and ``"tokenizer"``.
	        text: Input text to classify.

	    Returns:
	        ``{"label": "SARCASTIC" | "NOT_SARCASTIC", "score": float}`` where
	        score is the probability of the chosen label, rounded to 4 places.
	    """
	    import torch

	    lora_model = bundle["model"]
	    tokenizer = bundle["tokenizer"]

	    messages = [
	        {"role": "user", "content": f'Is the following text sarcastic? Answer with only "Yes" or "No".\n\nText: "{text}"'}
	    ]
	    prompt = tokenizer.apply_chat_template(messages, tokenize=False, add_generation_prompt=True)
	    inputs = tokenizer(prompt, return_tensors="pt").to(lora_model.device)

	    with torch.no_grad():
	        # Logits for the token that would follow the prompt.
	        logits = lora_model(**inputs).logits[0, -1]

	    yes_id = tokenizer.encode("Yes", add_special_tokens=False)[0]
	    no_id = tokenizer.encode("No", add_special_tokens=False)[0]
	    pair = torch.tensor([logits[yes_id].item(), logits[no_id].item()])
	    probs = torch.softmax(pair, dim=0)
	    prob_yes = float(probs[0])

	    is_sarcastic = prob_yes > 0.5
	    return {
	        "label": "SARCASTIC" if is_sarcastic else "NOT_SARCASTIC",
	        "score": round(prob_yes if is_sarcastic else 1.0 - prob_yes, 4),
	    }


	def _run_inference(model_key: str, text: str, language: str = "UK English"):
	    """Run one model on ``text`` and return a JSON-serialisable result dict.

	    Args:
	        model_key: A key of MODEL_REGISTRY.
	        text: Input text. For question answering it must contain the context
	            and the question separated by ``[SEP]``.
	        language: Dialect selection; only values that are keys of
	            BESSTIE_MODELS are forwarded to ``get_pipeline``, anything else is
	            treated as "no dialect".

	    Returns:
	        A dict whose task-specific fields depend on the model's ``hf_task``,
	        always extended with ``"model"``, ``"language"`` and ``"family"``.

	    Raises:
	        ValueError: For question answering when ``[SEP]`` is missing.
	        KeyError: If ``model_key`` is not in MODEL_REGISTRY.
	    """
	    lang_code = language if language in BESSTIE_MODELS else None
	    pipe = get_pipeline(model_key, lang_code)
	    cfg = MODEL_REGISTRY[model_key]
	    task = cfg["hf_task"]

	    if isinstance(pipe, dict) and pipe.get("_yes_no_lora"):
	        result = _score_yes_no_lora(pipe, text)

	    elif model_key in SKLEARN_ARTIFACTS:
	        pred = int(pipe.predict([text])[0])
	        proba = pipe.predict_proba([text])[0]
	        if task == "sarcasm-detection":
	            label = "SARCASTIC" if pred == 1 else "NOT_SARCASTIC"
	        elif cfg.get("task1_task") == "sentiment":
	            label = "POSITIVE" if pred == 1 else "NEGATIVE"
	        else:
	            label = str(pred)
	        result = {"label": label, "score": round(float(max(proba)), 4)}

	    elif task == "question-answering":
	        parts = text.split("[SEP]")
	        if len(parts) < 2:
	            raise ValueError("For QA, separate context and question with [SEP].")
	        context = parts[0].strip()
	        question = parts[1].strip()
	        raw = pipe(question=question, context=context)
	        result = {"answer": raw["answer"], "score": round(float(raw["score"]), 4)}

	    elif task == "zero-shot-classification":
	        candidate_labels = ["politics", "technology", "sports", "health", "finance", "entertainment", "science"]
	        raw = pipe(text, candidate_labels=candidate_labels)
	        result = {"labels": raw["labels"][:5], "scores": [round(float(s), 4) for s in raw["scores"][:5]]}

	    elif task == "ner":
	        raw = pipe(text)
	        result = {
	            "entities": [
	                # float(): NER scores come back as NumPy scalars, which
	                # jsonify cannot serialise.
	                {"word": ent["word"], "entity": ent["entity"], "score": round(float(ent["score"]), 4)}
	                for ent in raw
	            ]
	        }

	    elif task == "summarization":
	        max_len = min(130, max(30, len(text.split()) // 2))
	        raw = pipe(text, max_length=max_len, min_length=15, do_sample=False)
	        result = {"summary": raw[0]["summary_text"]}

	    elif task == "text-generation":
	        raw = pipe(text, max_new_tokens=120, num_return_sequences=1, do_sample=True, temperature=0.8)
	        result = {"generated": raw[0]["generated_text"]}

	    elif task == "fill-mask":
	        result_raw = pipe(text)
	        result = {
	            "predictions": [
	                {"token": pred["token_str"], "score": round(float(pred["score"]), 4), "sequence": pred["sequence"]}
	                for pred in result_raw[:5]
	            ]
	        }

	    else:
	        if task in ("sentiment-analysis", "text-classification"):
	            # Text-classification pipelines forward extra kwargs to the
	            # tokenizer; truncating clips over-length input to the model's
	            # maximum instead of letting the forward pass raise.
	            raw = pipe(text, truncation=True)
	        else:
	            raw = pipe(text)
	        # Some pipelines wrap the per-input result in an extra list.
	        if isinstance(raw, list) and isinstance(raw[0], list):
	            raw = raw[0]
	        top = raw[0]
	        result = {"label": top["label"], "score": round(float(top["score"]), 4)}

	    result["model"] = cfg["name"]
	    result["language"] = language
	    result["family"] = cfg.get("family", "")
	    return result


	# ---------------------------------------------------------------------------
	# Routes - pages
	# ---------------------------------------------------------------------------
	@app.route("/")
	def home():
	    """Render the landing page with the models listed in HOME_MODEL_KEYS."""
	    showcase = {}
	    for key in HOME_MODEL_KEYS:
	        showcase[key] = MODEL_REGISTRY[key]
	    return render_template("home.html", models=showcase)


	@app.route("/task1")
	def task1():
	    """Render the Task 1 page with its models and the Task 1 evaluation tables."""
	    selected = {}
	    for key, entry in MODEL_REGISTRY.items():
	        if entry.get("task_group") == "task1":
	            selected[key] = entry
	    return render_template("task1.html", models=selected, eval_tables=TASK1_EVAL)


	@app.route("/task2")
	def task2():
	    """Render the Task 2 page with its models and the Task 2 evaluation tables."""
	    selected = {}
	    for key, entry in MODEL_REGISTRY.items():
	        if entry.get("task_group") == "task2":
	            selected[key] = entry
	    return render_template("task2.html", models=selected, eval_tables=TASK2_EVAL)


	@app.route("/task3")
	def task3():
	    """Render the Task 3 page with its models and the Task 3 evaluation tables."""
	    selected = {}
	    for key, entry in MODEL_REGISTRY.items():
	        if entry.get("task_group") == "task3":
	            selected[key] = entry
	    return render_template("task3.html", models=selected, eval_tables=TASK3_EVAL)


	# ---------------------------------------------------------------------------
	# API - model inference
	# ---------------------------------------------------------------------------
	def _read_infer_payload():
	    """Parse and validate the JSON body shared by all inference endpoints.

	    Returns:
	        A ``(payload, text, error)`` tuple. On success ``error`` is None,
	        ``payload`` is the decoded JSON object and ``text`` the stripped input
	        text. On failure ``error`` is a ready-to-return ``(response, 400)``
	        pair and the other two values must not be used.
	    """
	    # silent=True: a malformed body yields None here, so the client gets the
	    # same JSON error shape as every other validation failure.
	    payload = request.get_json(force=True, silent=True)
	    if not isinstance(payload, dict):
	        return None, "", (jsonify({"error": "Request body must be a JSON object."}), 400)

	    raw_text = payload.get("text", "")
	    # A non-string "text" (number, null, list, ...) is treated as missing
	    # instead of crashing on .strip().
	    text = raw_text.strip() if isinstance(raw_text, str) else ""
	    if not text:
	        return payload, "", (jsonify({"error": "Please enter some text."}), 400)
	    return payload, text, None


	def _is_known_model(model_key) -> bool:
	    """Return True when ``model_key`` is a string key of MODEL_REGISTRY."""
	    # The isinstance guard keeps unhashable JSON values (lists, objects) from
	    # raising TypeError in the membership test.
	    return isinstance(model_key, str) and model_key in MODEL_REGISTRY


	def _task_infer(task_no: int, allowed_tasks, task_error: str, with_trained_on: bool):
	    """Shared implementation of the ``/api/task<N>/infer`` endpoints.

	    Args:
	        task_no: Task number N; selects task group ``task<N>`` and the
	            registry field ``task<N>_task``.
	        allowed_tasks: Collection of accepted ``task`` values.
	        task_error: Error message returned when ``task`` is not accepted.
	        with_trained_on: Whether to add the model's ``trained_on`` value to
	            the result.

	    Returns:
	        A Flask response, or a ``(response, status)`` pair for errors.
	    """
	    payload, text, error = _read_infer_payload()
	    if error is not None:
	        return error

	    task = payload.get("task", "")
	    model_key = payload.get("model_key", "")
	    group = f"task{task_no}"

	    if not isinstance(task, str) or task not in allowed_tasks:
	        return jsonify({"error": task_error}), 400
	    if not _is_known_model(model_key):
	        return jsonify({"error": f"Unknown model: {model_key}"}), 400

	    cfg = MODEL_REGISTRY[model_key]
	    if cfg.get("task_group") != group:
	        return jsonify({"error": f"{model_key} is not a Task {task_no} model."}), 400
	    if cfg.get(f"{group}_task") != task:
	        return jsonify({"error": f"{model_key} does not belong to the {task} task."}), 400

	    try:
	        result = _run_inference(model_key, text)
	        if with_trained_on:
	            result["trained_on"] = cfg.get("trained_on", "")
	        return jsonify(result)
	    except Exception as exc:
	        app.logger.exception("Task %s inference failed for model %s", task_no, model_key)
	        # NOTE(review): str(exc) is returned to the client, which can leak
	        # internal details; kept because callers receive this field today.
	        return jsonify({"error": str(exc), "model": cfg["name"]}), 500


	@app.route("/api/infer", methods=["POST"])
	def infer():
	    """Run inference on the selected model and return JSON results.

	    Expects a JSON object with ``text``, ``model`` and optionally ``language``.
	    Responds 400 for invalid input (including a ValueError raised during
	    inference) and 500 for any other inference failure.
	    """
	    payload, text, error = _read_infer_payload()
	    if error is not None:
	        return error

	    model_key = payload.get("model", "")
	    language = payload.get("language", "UK English")
	    if not isinstance(language, str):
	        # Unusable value: fall back to the default used when the field is absent.
	        language = "UK English"

	    if not _is_known_model(model_key):
	        return jsonify({"error": f"Unknown model: {model_key}"}), 400

	    lang_code = language if language in BESSTIE_MODELS else None
	    if model_key in LANG_AWARE_MODELS and not lang_code:
	        return jsonify({"error": "Please select a language dialect for this model."}), 400

	    try:
	        return jsonify(_run_inference(model_key, text, language))
	    except ValueError as exc:
	        return jsonify({"error": str(exc)}), 400
	    except Exception as exc:
	        app.logger.exception("Inference failed for model %s", model_key)
	        # NOTE(review): str(exc) is returned to the client, which can leak
	        # internal details; kept because callers receive this field today.
	        return jsonify({"error": str(exc)}), 500


	@app.route("/api/task1/infer", methods=["POST"])
	def task1_infer():
	    """Run one Task 1 model so the frontend can fan out parallel requests."""
	    return _task_infer(1, {"sentiment", "sarcasm"}, "Task must be sentiment or sarcasm.", False)


	@app.route("/api/task2/infer", methods=["POST"])
	def task2_infer():
	    """Run one Task 2 model so the frontend can fan out parallel requests."""
	    return _task_infer(2, {"sentiment", "sarcasm"}, "Task must be sentiment or sarcasm.", True)


	@app.route("/api/task3/infer", methods=["POST"])
	def task3_infer():
	    """Run one Task 3 model so the frontend can fan out parallel requests."""
	    return _task_infer(3, {"sarcasm"}, "Task must be sarcasm.", True)


	# ---------------------------------------------------------------------------
	if __name__ == "__main__":
	    # Port is taken from the PORT environment variable, defaulting to 7860.
	    port = int(os.environ.get("PORT", 7860))
	    # The server binds to all interfaces, so the Werkzeug debugger (which
	    # allows arbitrary code execution from the browser) must never be on by
	    # default. Opt in explicitly with FLASK_DEBUG=1 for local development.
	    debug = os.environ.get("FLASK_DEBUG", "").strip().lower() in {"1", "true", "yes", "on"}
	    app.run(host="0.0.0.0", debug=debug, port=port)