Spaces:

enigmaize
/

arxiv-nlp_project-scibert

Sleeping

App Files Files Community

enigmaize committed on Feb 9

Commit

5e2ba76

verified ·

1 Parent(s): 4ccac33

Create app.py

Browse files

Files changed (1) hide show

app.py +54 -0

app.py ADDED Viewed

	@@ -0,0 +1,54 @@

import gradio as gr
import torch
# NOTE(review): `softmax` is not used by the code visible in this file; the
# import is kept as-is in case something outside this view relies on it.
from scipy.special import softmax
from transformers import AutoModelForSequenceClassification, AutoTokenizer

# Hugging Face Hub repository that holds the fine-tuned classifier.
model_name = "enigmaize/arxiv-nlp_project-scibert"

# Loaded once at import time so every request reuses the same objects.
tokenizer = AutoTokenizer.from_pretrained(model_name)
model = AutoModelForSequenceClassification.from_pretrained(model_name)

# Class names, in the order that corresponds to the model's `num_labels` outputs.
labels = ['math.AC', 'cs.CV', 'cs.AI', 'cs.SY', 'math.GR', 'cs.CE', 'cs.PL', 'cs.IT', 'cs.DS', 'cs.NE', 'math.ST']
def classify_text(text):
    """Predict arXiv category probabilities for a paper abstract.

    Args:
        text: Abstract text to classify. ``None`` or a blank string is
            treated as "no input".

    Returns:
        A dict mapping each name in ``labels`` to its softmax probability,
        ordered from the most to the least probable category. The dict is
        empty when ``text`` is ``None`` or blank.
    """
    # Nothing to classify: skip the model instead of scoring an empty
    # abstract (``None`` is not valid tokenizer input).
    if text is None or not text.strip():
        return {}

    # Tokenize the text; anything beyond 512 tokens is truncated.
    inputs = tokenizer(text, return_tensors="pt", truncation=True, padding=True, max_length=512)

    # Inference only, so gradient tracking is switched off.
    with torch.no_grad():
        logits = model(**inputs).logits

    # Select the single batch row explicitly: unlike squeeze(), indexing
    # keeps the class dimension even when it has size 1.
    probabilities = torch.nn.functional.softmax(logits[0], dim=-1).tolist()

    # NOTE(review): assumes `labels` has one entry per model output, in the
    # same order; zip() silently drops any surplus on either side.
    ranked = sorted(zip(labels, probabilities), key=lambda pair: pair[1], reverse=True)

    # Dicts preserve insertion order, so the result stays sorted by
    # descending probability.
    return dict(ranked)
# Description text passed to the interface.
description = "Enter the abstract of a scientific paper, and the model will predict its arXiv category."

# Build the Gradio interface: one abstract text box in, a label with the
# three most probable categories out.
interface = gr.Interface(
    fn=classify_text,  # function called with the submitted abstract
    inputs=gr.Textbox(lines=10, placeholder="Paste abstract here...", label="Paper Abstract"),  # input: text field
    outputs=gr.Label(num_top_classes=3, label="Predicted Categories"),  # output: labels with probabilities
    title="ArXiv Paper Classifier (SciBERT)",
    description=description,
    # Example abstracts provided for convenience.
    examples=[
        ["We propose a novel deep learning approach for image recognition using convolutional neural networks."],
        ["We analyze the computational complexity of algorithms for sorting and searching."],
        ["This paper presents a statistical method for analyzing the spread of infectious diseases in populations."],
    ],
)

# Launch the interface when the script runs; the same call is used both for
# a local run and for the Hugging Face Space this file is deployed to.
interface.launch()