Spaces:

maxcasado
/

POC2PROD

Sleeping

App Files Community

maxcasado committed on Nov 25, 2025

Commit

883f14c

verified ·

1 Parent(s): c9c177e

Update frontend.py

Browse files

Files changed (1) hide show

frontend.py +86 -30

frontend.py CHANGED Viewed

@@ -1,43 +1,37 @@
-# frontend.py
-import os
-import requests
 import streamlit as st
-API_URL = os.getenv("API_URL", "http://localhost:8000")
 st.set_page_config(page_title="StackOverflow Tagger", layout="wide")
 st.title("🔖 StackOverflow Tag Predictor")
-st.write(
-    "Entrez une question (titre + éventuellement description) "
-    "et récupérez les probabilités des tags StackOverflow."
-)
-question = st.text_area(
-    "Question StackOverflow",
-    height=200,
-    placeholder="Ex: How to fine-tune BERT for multi-label classification?",
-)
-top_k = st.slider("Nombre de tags à afficher (top_k)", 1, 20, 5)
-if st.button("Prédire"):
-    if not question.strip():
-        st.warning("Merci d'entrer une question.")
-    else:
-        try:
             with st.spinner("Prédiction en cours..."):
-                resp = requests.post(
-                    f"{API_URL}/predict",
-                    json={"text": question, "top_k": top_k},
-                    timeout=60,
-                )
-            resp.raise_for_status()
-            data = resp.json()
-            tags = data.get("tags", [])
             if not tags:
-                st.warning("Aucun tag renvoyé par l'API.")
             else:
                 st.subheader("Résultats")
                 for t in tags:
@@ -47,5 +41,67 @@ if st.button("Prédire"):
                 scores = {t["label"]: t["score"] for t in tags}
                 st.bar_chart(scores)
-        except Exception as e:
-            st.error(f"Erreur lors de l'appel à l'API : {e}")

 import streamlit as st
+import pandas as pd
+from io import StringIO
+from model_utils import predict_proba
 st.set_page_config(page_title="StackOverflow Tagger", layout="wide")
 st.title("🔖 StackOverflow Tag Predictor")
+tab_single, tab_csv = st.tabs(["Question unique", "CSV batch"])
+with tab_single:
+    st.write(
+        "Entrez une question (titre + éventuellement description) "
+        "et récupérez les probabilités des tags StackOverflow prédits par le modèle."
+    )
+    question = st.text_area(
+        "Question StackOverflow",
+        height=200,
+        placeholder="Ex: How to fine-tune BERT for multi-label classification?",
+    )
+    top_k = st.slider("Nombre de tags à afficher (top_k)", 1, 20, 5, key="topk_single")
+    if st.button("Prédire", key="predict_single"):
+        if not question.strip():
+            st.warning("Merci d'entrer une question.")
+        else:
             with st.spinner("Prédiction en cours..."):
+                tags = predict_proba(question, top_k=top_k)
             if not tags:
+                st.warning("Pas de tags prédits.")
             else:
                 st.subheader("Résultats")
                 for t in tags:
                 scores = {t["label"]: t["score"] for t in tags}
                 st.bar_chart(scores)
+with tab_csv:
+    st.write(
+        "Uploade un fichier CSV contenant des questions. "
+        "On ajoutera une colonne avec le tag principal prédit pour chaque ligne."
+    )
+    uploaded_file = st.file_uploader("Choisir un fichier CSV", type=["csv"])
+    if uploaded_file is not None:
+        df = pd.read_csv(uploaded_file)
+        st.write("Aperçu du CSV :")
+        st.dataframe(df.head())
+        text_column = st.selectbox(
+            "Colonne contenant la question",
+            options=list(df.columns),
+        )
+        top_k_batch = st.slider(
+            "Nombre de tags à considérer pour le batch (pour choisir le meilleur)",
+            1,
+            20,
+            5,
+            key="topk_batch",
+        )
+        if st.button("Lancer la prédiction sur le CSV"):
+            if df[text_column].isnull().all():
+                st.error("La colonne choisie ne contient pas de texte.")
+            else:
+                preds = []
+                with st.spinner("Prédiction en cours sur le CSV..."):
+                    for text in df[text_column].fillna(""):
+                        if not str(text).strip():
+                            preds.append({"best_tag": None, "best_score": None})
+                            continue
+                        tags = predict_proba(str(text), top_k=top_k_batch)
+                        if len(tags) == 0:
+                            preds.append({"best_tag": None, "best_score": None})
+                        else:
+                            best = tags[0]
+                            preds.append(
+                                {"best_tag": best["label"], "best_score": best["score"]}
+                            )
+                df["predicted_tag"] = [p["best_tag"] for p in preds]
+                df["predicted_score"] = [p["best_score"] for p in preds]
+                st.subheader("Résultats enrichis")
+                st.dataframe(df.head())
+                csv_buffer = StringIO()
+                df.to_csv(csv_buffer, index=False)
+                csv_bytes = csv_buffer.getvalue().encode("utf-8")
+                st.download_button(
+                    label="📥 Télécharger le CSV avec tags prédits",
+                    data=csv_bytes,
+                    file_name="questions_with_tags.csv",
+                    mime="text/csv",
+                )
+    else:
+        st.info("Uploade un fich