LilithHu's picture
Update app.py
0e24b29 verified
import gradio as gr
from transformers import AutoTokenizer, AutoModelForSequenceClassification
import torch
# 加载模型和 tokenizer
model_name = "LilithHu/new-manipulation-model"
tokenizer = AutoTokenizer.from_pretrained(model_name)
model = AutoModelForSequenceClassification.from_pretrained(model_name)
# 设置为评估模式
model.eval()
# 设置运行设备
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
model.to(device)
# 标签名
labels = ["Non-manipulative / 非操纵性", "Manipulative / 操纵性"]
# 推理函数
def classify(text):
inputs = tokenizer(text, return_tensors="pt", truncation=True, padding=True).to(device)
with torch.no_grad():
outputs = model(**inputs)
probs = torch.softmax(outputs.logits, dim=1)[0]
threshold = 0.7 # 自定义阈值
if probs[1].item() > threshold:
pred = 1 # 判为操纵性
else:
pred = 0 # 判为非操纵性
confidence = min(probs[pred].item(), 0.95) # 置信度依然可以控制上限
percent = round(confidence * 100, 2)
result = f"Prediction / 预测:\n{labels[pred]}\n"
return result
#谁大选谁
#pred = torch.argmax(probs).item()
#confidence = min(probs[pred].item(), 0.95) # 限制置信度最大为95%
# Gradio 界面
interface = gr.Interface(
fn=classify,
inputs=gr.Textbox(
lines=4,
placeholder="Enter text in English or Chinese... ",
label="📝 Input Text"
),
outputs=gr.Markdown(label="📊 Prediction"),
title="🔍 Manipulative Language Detector",
description="""
🧪 Enter a sentence in English or Chinese to detect if it's manipulative.
📌 **Disclaimer**
This system is for **research and educational purposes only**.
It **does not guarantee accuracy** and **should not be used as legal or clinical evidence**.
🤖 **Model Info**
- Model: `LilithHu/new-manipulation-model`
- Base: `mDeBERTa-v3` multilingual pre-trained model
- Fine-tuned using HuggingFace Transformers on 10,000 labeled Chinese data
⚠️ **About Examples**
The examples provided below are those **cited in the paper**, including implicit moral coercion, polite masking and false positives.
🌐 **Built with Gradio and hosted on HuggingFace Spaces**
"""
)
interface.launch()