Spaces:

VenujaDeSilva
/

stackoverflow-tag-predictor

Sleeping

File size: 6,121 Bytes

9f0e60b
 
 
 
 
f6f5b3d
 
 
9f0e60b
 
 
 
 
 
f6f5b3d
1480198
f6f5b3d
9f0e60b
 
f6f5b3d
9f0e60b
f6f5b3d
9f0e60b
f6f5b3d
1480198
9f0e60b
f6f5b3d
1480198
9f0e60b
f6f5b3d
1480198
 
 
 
 
 
 
 
 
9f0e60b
1480198
f6f5b3d
1480198
9f0e60b
f6f5b3d
 
 
1480198
 
 
 
f6f5b3d
 
9f0e60b
f6f5b3d
1480198
f6f5b3d
9f0e60b
 
f6f5b3d
1480198
 
9f0e60b
f6f5b3d
9f0e60b
1480198
9f0e60b
 
f6f5b3d
 
 
 
 
1480198
f6f5b3d
 
9f0e60b
 
 
f6f5b3d
 
 
9f0e60b
 
 
 
 
 
 
 
 
 
f6f5b3d
 
 
9f0e60b
 
 
f6f5b3d
 
 
9f0e60b
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
f6f5b3d
1480198
f6f5b3d
1480198
 
 
 
 
 
9f0e60b
1480198
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
9f0e60b
f6f5b3d
1480198
f6f5b3d
1480198
 
 
 
 
 
 
 
 
 
 
 
9f0e60b
 
f6f5b3d
1480198
f6f5b3d
1480198
 
 
 
 
 
 
 
 
 
 
f6f5b3d
 
 
1480198
f6f5b3d
 
9f0e60b
1480198
9f0e60b
1480198
9f0e60b
 
f6f5b3d
 
1480198
9f0e60b
 
f6f5b3d
9f0e60b
 
f6f5b3d
 
 
1480198
f6f5b3d
 
 
 
1480198
f6f5b3d

import streamlit as st
import torch
import joblib
from transformers import AutoTokenizer, AutoModelForSequenceClassification

# -----------------------------------------------------------
# 🚀 Streamlit Page Configuration
# -----------------------------------------------------------
st.set_page_config(
    page_title="StackOverflow Tag Predictor",
    page_icon="🎯",
    layout="centered",
)

# -----------------------------------------------------------
# 🌈 Custom CSS for a Rich UI
# -----------------------------------------------------------
st.markdown("""
<style>

body {
    background-color: #F5F7FB;
}

.header {
    text-align: center;
    margin-top: -20px;
    margin-bottom: 10px;
}

.header-title {
    font-size: 48px;
    font-weight: 900;
    background: linear-gradient(90deg, #4A4AFC, #6A6AFF);
    -webkit-background-clip: text;
    -webkit-text-fill-color: transparent;
}

.header-subtitle {
    font-size: 18px;
    color: #555;
    margin-top: -10px;
    margin-bottom: 25px;
}

.card {
    background: white;
    padding: 30px;
    border-radius: 18px;
    box-shadow: 0px 6px 20px rgba(0,0,0,0.08);
    margin-bottom: 20px;
}

.result-tag {
    background: linear-gradient(90deg, #4A4AFC, #6A6AFF);
    padding: 14px 24px;
    border-radius: 14px;
    color: white;
    display: inline-block;
    font-size: 22px;
    font-weight: 700;
    animation: fadeIn 0.4s ease-out;
}

@keyframes fadeIn {
    from {opacity: 0; transform: translateY(10px);}
    to {opacity: 1; transform: translateY(0);}
}

.footer {
    text-align: center;
    margin-top: 40px;
    color: #777;
    font-size: 14px;
}

</style>
""", unsafe_allow_html=True)

# -----------------------------------------------------------
# 📦 Load Model & Tokenizer
# -----------------------------------------------------------
@st.cache_resource
def load_model():
    model = AutoModelForSequenceClassification.from_pretrained(".")
    tokenizer = AutoTokenizer.from_pretrained(".")
    return model, tokenizer

model, tokenizer = load_model()
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
model = model.to(device)

# -----------------------------------------------------------
# 🔤 Load Label Encoder
# -----------------------------------------------------------
label_encoder = joblib.load("label_encoder.joblib")
id2label = {i: label for i, label in enumerate(label_encoder.classes_)}

# -----------------------------------------------------------
# 🔮 Prediction Function
# -----------------------------------------------------------
def predict_tag(text):
    encoding = tokenizer(
        text,
        truncation=True,
        padding=True,
        max_length=128,
        return_tensors="pt"
    )
    encoding = {k: v.to(device) for k, v in encoding.items()}

    with torch.no_grad():
        outputs = model(**encoding)

    pred_id = torch.argmax(outputs.logits, dim=-1).item()
    tag = id2label[pred_id]
    confidence = torch.softmax(outputs.logits, dim=-1).max().item()

    return tag, confidence

# -----------------------------------------------------------
# 🎯 Header
# -----------------------------------------------------------
st.markdown("""
<div class="header">
    <div class="header-title">🎯 StackOverflow Tag Predictor</div>
    <div class="header-subtitle">Powered by DistilBERT • Predict the most likely tag from a question title</div>
</div>
""", unsafe_allow_html=True)

# -----------------------------------------------------------
# 🎛️ Sidebar – About the Model
# -----------------------------------------------------------
st.sidebar.title("ℹ️ About This App")
st.sidebar.write("""
This app uses a fine-tuned **DistilBERT** model trained on the
top 50 StackOverflow tags.

You can:
- Type your own question title  
- Pick from example titles  
- See model confidence  
""")

st.sidebar.write("### 🔧 Model Info")
st.sidebar.write(f"**Labels:** {len(id2label)} classes")
st.sidebar.write("**Framework:** PyTorch + HuggingFace Transformers")

# -----------------------------------------------------------
# 🧪 Example Questions Dropdown
# -----------------------------------------------------------
examples = [
    "How to fix NullPointerException in Java?",
    "What is the best way to center a div in CSS?",
    "How do I connect to a MySQL database in Python?",
    "Why is my React component not rendering?",
    "How to optimize a SQL query that is too slow?",
    "How to declare an array in C++?"
]

example_choice = st.selectbox(
    "✨ Or choose an example question:",
    ["(None)"] + examples
)

# -----------------------------------------------------------
# 📝 Main Input Card
# -----------------------------------------------------------
st.markdown("<div class='card'>", unsafe_allow_html=True)

if example_choice != "(None)":
    user_input = example_choice
else:
    user_input = st.text_area(
        "💬 Enter a StackOverflow question title:",
        height=120,
        placeholder="Example: \"How to fix NullPointerException in Java?\""
    )

predict_btn = st.button("🔍 Predict Tag", use_container_width=True)

# -----------------------------------------------------------
# 📊 Prediction Output
# -----------------------------------------------------------
if predict_btn:
    if user_input.strip() == "":
        st.warning("⚠️ Please enter a question title.")
    else:
        with st.spinner("Analyzing with AI… 🔧✨"):
            tag, confidence = predict_tag(user_input)

        st.success("Prediction ready! 🎉")

        st.markdown(f"<div class='result-tag'>{tag}</div>", unsafe_allow_html=True)

        st.markdown(
            f"### 🔥 Confidence Score: **{confidence*100:.2f}%**"
        )

st.markdown("</div>", unsafe_allow_html=True)

# -----------------------------------------------------------
# 📘 Footer
# -----------------------------------------------------------
st.markdown("""
<div class='footer'>
    Made with ❤️ using DistilBERT + Streamlit + HuggingFace Spaces<br>
    Try different example titles or write your own!
</div>
""", unsafe_allow_html=True)