Spaces:

tienti0000
/

arxiv-classifier

Sleeping

App Files Files Community

tienti0000 committed on Apr 8, 2025

Commit

6dc42cc

verified ·

1 Parent(s): 9b0f164

Upload 3 files

Browse files

Files changed (3) hide show

app.py +50 -0
arxiv_model.zip +3 -0
requirements.txt +3 -0

app.py ADDED Viewed

	@@ -0,0 +1,50 @@

+import streamlit as st
+import torch
+from transformers import AutoTokenizer, AutoModelForSequenceClassification
+import numpy as np
+@st.cache_resource
+def load_model():
+    model = AutoModelForSequenceClassification.from_pretrained("arxiv_model")
+    tokenizer = AutoTokenizer.from_pretrained("arxiv_model")
+    return model, tokenizer
+model, tokenizer = load_model()
+id2label = model.config.id2label
+st.title("🔬 ArXiv Article Classifier")
+st.markdown("Введите **название** и (по желанию) **аннотацию** статьи. Сервис предскажет вероятные темы!")
+title_input = st.text_input("Название статьи")
+abstract_input = st.text_area("Аннотация (необязательно)")
+if st.button("Классифицировать") and title_input:
+    text = title_input.strip()
+    if abstract_input.strip():
+        text += " " + abstract_input.strip()
+    inputs = tokenizer(text, return_tensors="pt", truncation=True, padding=True, max_length=512)
+    with torch.no_grad():
+        outputs = model(**inputs)
+        probs = torch.nn.functional.softmax(outputs.logits, dim=1).numpy()[0]
+    sorted_indices = np.argsort(probs)[::-1]
+    # top_labels = [(id2label[str(i)], probs[i]) for i in sorted_indices]
+    top_labels = [(id2label[i], probs[i]) for i in sorted_indices]
+    # Топ-95% по суммарной вероятности
+    cumulative = 0.0
+    top95 = []
+    for label, prob in top_labels:
+        top95.append((label, prob))
+        cumulative += prob
+        if cumulative >= 0.95:
+            break
+    st.markdown(f"### 🎯 Основная тема: `{top_labels[0][0]}` ({top_labels[0][1]*100:.2f}%)")
+    st.markdown("### 📋 Категории (до 95% суммарной вероятности):")
+    for label, prob in top95:
+        st.write(f"- `{label}`: {prob*100:.2f}%")
+else:
+    st.markdown("_Введите название статьи и нажмите кнопку выше_")

arxiv_model.zip ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:06a278334f7ae905b9a6553606501b6a224a798c792c907241c7a05c14c0ffda
+size 247670290

requirements.txt ADDED Viewed

	@@ -0,0 +1,3 @@

+transformers
+torch
+streamlit