Spaces:

sathvikk
/

wikitrial

Sleeping

App Files Files Community

sathvikk committed on Jul 4, 2025

Commit

ca75932

verified ·

1 Parent(s): 3e053bf

Update src/streamlit_app.py

Browse files

Files changed (1) hide show

src/streamlit_app.py +54 -80

src/streamlit_app.py CHANGED Viewed

@@ -1,67 +1,48 @@
 import os
-os.environ["HOME"] = "/tmp"  # Fix for Hugging Face permission issue
 import streamlit as st
 import requests
 import urllib.parse
-from langdetect import detect
 st.set_page_config(page_title="WikiTrail", layout="wide")
-# Custom style
-st.markdown("""
-    <style>
-    body {
-        font-family: 'Segoe UI', sans-serif;
-        background-color: #f8f9fa;
-    }
-    .title {
-        font-size: 48px;
-        text-align: center;
-        color: #2c3e50;
-        font-weight: bold;
-        margin-bottom: 5px;
-    }
-    .subtitle {
-        text-align: center;
-        font-size: 18px;
-        color: #555;
-        margin-top: 0px;
-    }
-    .section {
-        background-color: #ffffff;
-        padding: 20px;
-        border-radius: 16px;
-        box-shadow: 0 4px 12px rgba(0,0,0,0.08);
-        margin-bottom: 25px;
-    }
-    .emoji-title {
-        font-size: 28px;
-        margin-bottom: 10px;
-        color: #2c3e50;
-    }
-    </style>
-""", unsafe_allow_html=True)
-# Title
-st.markdown("<div class='title'>📚 WikiTrail</div>", unsafe_allow_html=True)
-st.markdown("<div class='subtitle'>Explore Wikipedia topics visually and get a summarized journey.</div>", unsafe_allow_html=True)
-# Language Selector
 languages = {
     "English": "en",
     "Hindi (हिन्दी)": "hi",
     "Telugu (తెలుగు)": "te",
     "Tamil (தமிழ்)": "ta"
 }
-lang_name = st.selectbox("🌐 Select Language", list(languages.keys()), index=0)
 lang_code = languages[lang_name]
-# Topic Input
-topic_input = st.text_input("🔍 Enter a topic (in English)", placeholder="e.g., India, Gandhi, Hyderabad")
-# Wikipedia Summary Fetcher
-def fetch_topic_summary(title, lang):
     safe_title = urllib.parse.quote(title.replace(" ", "_"))
     url = f"https://{lang}.wikipedia.org/api/rest_v1/page/summary/{safe_title}"
     res = requests.get(url)
@@ -74,8 +55,8 @@ def fetch_topic_summary(title, lang):
         }
     return None
-# Related Topics
-def fetch_related_topics(title, lang):
     safe_title = urllib.parse.quote(title.replace(" ", "_"))
     url = f"https://{lang}.wikipedia.org/w/api.php?action=query&format=json&origin=*&titles={safe_title}&prop=links&pllimit=5"
     res = requests.get(url)
@@ -86,43 +67,40 @@ def fetch_related_topics(title, lang):
             return [link['title'] for link in pages[0]['links']]
     return []
-# Summary Cleaner
-def summarize_bullets(summaries, limit=3):
-    unique = list(set(summaries))
-    full = ' '.join(unique)
-    sentences = full.replace('।', '.').replace('?', '.').replace('!', '.').split('.')
-    cleaned = [s.strip() for s in sentences if s.strip()]
-    top = cleaned[:limit]
-    return ["• " + s + "." for s in top] if top else ["No summary available."]
 # Main logic
 if topic_input:
     with st.spinner("🔍 Searching Wikipedia..."):
         summaries = []
-        st.markdown("<div class='section'>", unsafe_allow_html=True)
-        st.markdown("<div class='emoji-title'>🔷 Main Topic</div>", unsafe_allow_html=True)
-        main = fetch_topic_summary(topic_input, lang_code)
-        if main and main["summary"]:
             summaries.append(main["summary"])
             st.markdown(f"### {main['title']}")
             st.write(main["summary"])
             st.markdown(f"[Read More →]({main['link']})", unsafe_allow_html=True)
         else:
-            st.warning(f"❌ No matching page found in {lang_name}. Try a different word.")
-            st.markdown("</div>", unsafe_allow_html=True)
-            st.stop()
-        st.markdown("</div>", unsafe_allow_html=True)
-        # Related Topics
-        st.markdown("<div class='section'>", unsafe_allow_html=True)
-        st.markdown("<div class='emoji-title'>🔗 Related Topics</div>", unsafe_allow_html=True)
-        related = fetch_related_topics(topic_input, lang_code)
-        if related:
-            for rel in related:
-                data = fetch_topic_summary(rel, lang_code)
                 if data and data["summary"] not in summaries:
                     summaries.append(data["summary"])
                     with st.expander(data["title"]):
@@ -130,12 +108,8 @@ if topic_input:
                         st.markdown(f"[Read More →]({data['link']})", unsafe_allow_html=True)
         else:
             st.info("No related topics found.")
-        st.markdown("</div>", unsafe_allow_html=True)
-        # Combined Summary
-        st.markdown("<div class='section'>", unsafe_allow_html=True)
-        st.markdown("<div class='emoji-title'>🧠 Combined Summary</div>", unsafe_allow_html=True)
-        bullets = summarize_bullets(summaries)
-        for b in bullets:
-            st.markdown(b)
-        st.markdown("</div>", unsafe_allow_html=True)

 import os
+os.environ["HOME"] = "/tmp"  # Hugging Face fix
 import streamlit as st
 import requests
 import urllib.parse
 st.set_page_config(page_title="WikiTrail", layout="wide")
+st.title("📚 WikiTrail")
+st.markdown("Explore Wikipedia topics visually and get a summarized journey.")
+# Language selector: maps the label shown in the dropdown to the language code used as the Wikipedia subdomain
 languages = {
     "English": "en",
     "Hindi (हिन्दी)": "hi",
     "Telugu (తెలుగు)": "te",
     "Tamil (தமிழ்)": "ta"
 }
+lang_name = st.selectbox("🌐 Select Language", list(languages.keys()))
 lang_code = languages[lang_name]
+# Topic input: typed in English, then resolved to a page title in the selected language via Wikipedia search
+topic_input = st.text_input("🔍 Enter a topic (in English)", placeholder="e.g., India, Gandhi, Telangana")
+# Translate topic using Wikipedia search
+def get_translated_title(query, lang):
+    """Return the title of the top Wikipedia search hit for *query*.
+
+    Queries the MediaWiki ``list=search`` API of the ``lang`` edition
+    (``https://{lang}.wikipedia.org/w/api.php``) and returns the first
+    result's title.
+
+    Args:
+        query: Free-text search string.
+        lang: Wikipedia language subdomain, e.g. ``"en"`` or ``"hi"``.
+
+    Returns:
+        The title of the first search result, or ``None`` when the request
+        fails, the server does not answer with HTTP 200, the body is not
+        valid JSON, or the search has no results.
+    """
+    search_url = f"https://{lang}.wikipedia.org/w/api.php"
+    params = {
+        "action": "query",
+        "list": "search",
+        "srsearch": query,
+        "srlimit": 1,  # only the first hit is used
+        "format": "json",
+        "origin": "*",
+    }
+    try:
+        # Without a timeout a stalled connection would block the app indefinitely.
+        res = requests.get(search_url, params=params, timeout=10)
+    except requests.RequestException:
+        return None
+    if res.status_code != 200:
+        return None
+    try:
+        results = res.json()
+    except ValueError:
+        # Body was not JSON (e.g. an HTML error page).
+        return None
+    search_list = results.get("query", {}).get("search", [])
+    if search_list:
+        return search_list[0]["title"]
+    return None
+# Fetch summary
+def fetch_summary(title, lang):
     safe_title = urllib.parse.quote(title.replace(" ", "_"))
     url = f"https://{lang}.wikipedia.org/api/rest_v1/page/summary/{safe_title}"
     res = requests.get(url)
         }
     return None
+# Fetch related
+def fetch_related(title, lang):
     safe_title = urllib.parse.quote(title.replace(" ", "_"))
     url = f"https://{lang}.wikipedia.org/w/api.php?action=query&format=json&origin=*&titles={safe_title}&prop=links&pllimit=5"
     res = requests.get(url)
             return [link['title'] for link in pages[0]['links']]
     return []
+# Summarizer
+def summarize_bullets(texts, limit=3):
+    """Build up to *limit* bullet lines from the given summary texts.
+
+    Duplicate texts are dropped, the remainder is joined with spaces and
+    split into sentences on ``.``, ``?``, ``!`` and the danda ``।``.
+
+    Args:
+        texts: Iterable of summary strings, in display order.
+        limit: Maximum number of bullets to return.
+
+    Returns:
+        A list of strings of the form ``"• <sentence>."`` for the first
+        *limit* sentences, or ``["No summary available."]`` when no
+        non-empty sentence is found.
+    """
+    # dict.fromkeys removes duplicates but keeps first-seen order; iterating a
+    # set of strings is not stable across runs and would shuffle the bullets.
+    full_text = ' '.join(dict.fromkeys(texts))
+    sentences = full_text.replace('।', '.').replace('?', '.').replace('!', '.').split('.')
+    clean = [s.strip() for s in sentences if s.strip()]
+    return ["• " + s + "." for s in clean[:limit]] if clean else ["No summary available."]
 # Main logic
 if topic_input:
     with st.spinner("🔍 Searching Wikipedia..."):
         summaries = []
+        translated_title = get_translated_title(topic_input, lang_code)
+        if not translated_title:
+            st.error(f"No matching page found in {lang_name} for '{topic_input}'")
+            st.stop()
+        # Main topic
+        st.subheader("🔷 Main Topic")
+        main = fetch_summary(translated_title, lang_code)
+        if main:
             summaries.append(main["summary"])
             st.markdown(f"### {main['title']}")
             st.write(main["summary"])
             st.markdown(f"[Read More →]({main['link']})", unsafe_allow_html=True)
         else:
+            st.warning("Couldn't fetch main topic summary.")
+        # Related
+        st.subheader("🔗 Related Topics")
+        related_titles = fetch_related(translated_title, lang_code)
+        if related_titles:
+            for title in related_titles:
+                data = fetch_summary(title, lang_code)
                 if data and data["summary"] not in summaries:
                     summaries.append(data["summary"])
                     with st.expander(data["title"]):
                         st.markdown(f"[Read More →]({data['link']})", unsafe_allow_html=True)
         else:
             st.info("No related topics found.")
+        # Bullet summary
+        st.subheader("🧠 Combined Summary")
+        for bullet in summarize_bullets(summaries):
+            st.markdown(bullet)