Spaces:

shiue2000
/

sparkAnalysis

Sleeping

App Files Community

shiue2000 committed on Sep 26, 2025

Commit

418284c

verified ·

1 Parent(s): 3c9a501

Update app.py

Browse files

Files changed (1) hide show

app.py +53 -32

app.py CHANGED Viewed

@@ -10,22 +10,18 @@ from datetime import datetime, timedelta
 import gradio as gr
 import logging
 from jinja2 import Template
 # ===== 字型與樣式 =====
 plt.rcParams['font.sans-serif'] = ['Microsoft JhengHei', 'Noto Sans TC', 'SimHei', 'Arial Unicode MS']
 plt.rcParams['axes.unicode_minus'] = False
 plt.style.use("seaborn-v0_8")
 # ===== 日誌 =====
 logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')
 # ===== 參數 =====
 candidates = ["許智傑", "邱議瑩", "賴瑞隆", "林岱樺", "柯志恩"]
 days_back = 7
 max_tweets_per_candidate = 20
 news_file = "news_sample.csv"
 history_file = "history_sentiment.csv"
 # ===== 情緒分析 =====
 try:
     from transformers import pipeline
@@ -41,7 +37,6 @@ except:
             "label": random.choice(["positive", "negative", "neutral"]),
             "score": random.uniform(0.3, 0.9)
         }
 # ===== 模擬貼文抓取 =====
 def fetch_tweets(candidate):
     sample_texts = {
@@ -60,7 +55,6 @@ def fetch_tweets(candidate):
         }
         for i in range(random.randint(5, max_tweets_per_candidate))
     ])
 # ===== 工具: Matplotlib → base64 =====
 def fig_to_base64():
     buf = io.BytesIO()
@@ -70,11 +64,9 @@ def fig_to_base64():
     buf.close()
     plt.close()
     return img_b64
 # ===== 多圖產生器 =====
 def generate_charts(all_df, summary, df_hist):
     results = {}
     # 1. 每日情緒比例
     fig = plt.figure(figsize=(8, 5))
     summary[['Positive Ratio', 'Negative Ratio', 'Neutral Ratio']].plot(
@@ -84,7 +76,6 @@ def generate_charts(all_df, summary, df_hist):
     plt.ylabel("比例")
     plt.xlabel("候選人")
     results["img_b64_today"] = fig_to_base64()
     # 2. 歷史情緒趨勢
     fig = plt.figure(figsize=(10, 5))
     for c in candidates:
@@ -98,7 +89,6 @@ def generate_charts(all_df, summary, df_hist):
     plt.ylabel("比例")
     plt.legend()
     results["img_b64_trend"] = fig_to_base64()
     # 3. 社群情緒趨勢
     sentiment_trend = all_df.groupby([pd.Grouper(key='Date', freq='D'), 'Sentiment']).size().unstack(fill_value=0)
     sentiment_trend = sentiment_trend.div(sentiment_trend.sum(axis=1), axis=0).fillna(0)
@@ -111,7 +101,6 @@ def generate_charts(all_df, summary, df_hist):
     plt.ylabel("比例")
     plt.legend()
     results["img_social_sentiment"] = fig_to_base64()
     # 4. 平台表現
     platforms = ["X", "Facebook", "Instagram", "PTT", "Line"]
     platform_counts = pd.Series({p: random.randint(10, 100) for p in platforms})
@@ -121,7 +110,6 @@ def generate_charts(all_df, summary, df_hist):
     plt.xlabel("平台")
     plt.ylabel("貼文數量")
     results["img_platform_performance"] = fig_to_base64()
     # 5. 候選人聲量趨勢
     candidate_trend = all_df.groupby([pd.Grouper(key='Date', freq='D'), 'Candidate']).size().unstack(fill_value=0)
     fig = plt.figure(figsize=(8, 5))
@@ -133,7 +121,6 @@ def generate_charts(all_df, summary, df_hist):
     plt.ylabel("貼文數量")
     plt.legend()
     results["img_candidate_volume"] = fig_to_base64()
     # 6. 候選人情緒分析
     fig = plt.figure(figsize=(8, 5))
     summary[['Positive Ratio', 'Negative Ratio', 'Neutral Ratio']].plot(
@@ -143,7 +130,6 @@ def generate_charts(all_df, summary, df_hist):
     plt.ylabel("比例")
     plt.xlabel("候選人")
     results["img_candidate_sentiment"] = fig_to_base64()
     # 7. 知識圖譜
     fig, ax = plt.subplots(figsize=(8, 6))
     G = nx.Graph()
@@ -153,28 +139,72 @@ def generate_charts(all_df, summary, df_hist):
         G.add_edge(candidates[i], candidates[i + 1])
     nx.draw(G, nx.spring_layout(G), with_labels=True, node_color='lightgreen', font_size=12, ax=ax)
     results["img_knowledge_graph"] = fig_to_base64()
     return results
 # ===== 主分析函數 =====
 def run_analysis():
     try:
-        template_path = "templates/index.html"
-        if not os.path.exists(template_path):
-            return f"<pre>❌ 模板檔案 {template_path} 未找到</pre>"
         # --- 貼文 & 情緒分析 ---
         all_df = pd.concat([fetch_tweets(c) for c in candidates], ignore_index=True)
         all_df['Sentiment'] = all_df['Content'].apply(lambda x: sentiment(x)['label'])
         all_df['Confidence'] = all_df['Content'].apply(lambda x: sentiment(x)['score'])
         # --- 統計 ---
         summary = all_df.groupby(['Candidate', 'Sentiment']).size().unstack(fill_value=0)
         summary['Total Posts'] = summary.sum(axis=1)
         summary['Positive Ratio'] = summary.get('positive', 0) / summary['Total Posts'].replace(0, 1)
         summary['Negative Ratio'] = summary.get('negative', 0) / summary['Total Posts'].replace(0, 1)
         summary['Neutral Ratio'] = summary.get('neutral', 0) / summary['Total Posts'].replace(0, 1)
         # --- 歷史資料 ---
         today_str = datetime.now().strftime('%Y-%m-%d')
         hist_row = summary[['Positive Ratio', 'Negative Ratio', 'Neutral Ratio']].copy()
@@ -185,10 +215,8 @@ def run_analysis():
             ignore_index=True
         ) if os.path.exists(history_file) else hist_row
         df_hist.to_csv(history_file, index=False)
         # --- 圖表 ---
         charts = generate_charts(all_df, summary, df_hist)
         # --- 新聞 ---
         if os.path.exists(news_file):
             df_news = pd.read_csv(news_file)
@@ -201,10 +229,8 @@ def run_analysis():
                 "爭議": "林岱樺涉助理費爭議。"
             }
             news_table = "<p>無新聞資料</p>"
         # Convert news_summary to list of tuples to support iteration in template
         news_summary = list(news_summary.items())
         # --- 參與表 ---
         engagement_table = f"""
         <table class="min-w-full bg-white border border-gray-200">
@@ -221,9 +247,6 @@ def run_analysis():
         </table>
         """
         # --- HTML 渲染 ---
-        with open(template_path, encoding='utf-8') as f:
-            html_template = f.read()
         template = Template(html_template)
         html_content = template.render(
             report_date=datetime.now().strftime('%Y-%m-%d %H:%M'),
@@ -232,12 +255,10 @@ def run_analysis():
             news_table=news_table if news_table else "<p>未提供新聞資料</p>",
             **charts
         )
         return html_content
     except Exception:
         return f"<pre>❌ 分析失敗:\n{traceback.format_exc()}</pre>"
 # ===== Gradio 前端 =====
 if __name__ == "__main__":
     iface = gr.Interface(

 import gradio as gr
 import logging
 from jinja2 import Template
 # ===== 字型與樣式 =====
 plt.rcParams['font.sans-serif'] = ['Microsoft JhengHei', 'Noto Sans TC', 'SimHei', 'Arial Unicode MS']
 plt.rcParams['axes.unicode_minus'] = False
 plt.style.use("seaborn-v0_8")
 # ===== 日誌 =====
 logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')
 # ===== 參數 =====
 candidates = ["許智傑", "邱議瑩", "賴瑞隆", "林岱樺", "柯志恩"]
 days_back = 7
 max_tweets_per_candidate = 20
 news_file = "news_sample.csv"
 history_file = "history_sentiment.csv"
 # ===== 情緒分析 =====
 try:
     from transformers import pipeline
             "label": random.choice(["positive", "negative", "neutral"]),
             "score": random.uniform(0.3, 0.9)
         }
 # ===== 模擬貼文抓取 =====
 def fetch_tweets(candidate):
     sample_texts = {
         }
         for i in range(random.randint(5, max_tweets_per_candidate))
     ])
 # ===== 工具: Matplotlib → base64 =====
 def fig_to_base64():
     buf = io.BytesIO()
     buf.close()
     plt.close()
     return img_b64
 # ===== 多圖產生器 =====
 def generate_charts(all_df, summary, df_hist):
     results = {}
     # 1. 每日情緒比例
     fig = plt.figure(figsize=(8, 5))
     summary[['Positive Ratio', 'Negative Ratio', 'Neutral Ratio']].plot(
     plt.ylabel("比例")
     plt.xlabel("候選人")
     results["img_b64_today"] = fig_to_base64()
     # 2. 歷史情緒趨勢
     fig = plt.figure(figsize=(10, 5))
     for c in candidates:
     plt.ylabel("比例")
     plt.legend()
     results["img_b64_trend"] = fig_to_base64()
     # 3. 社群情緒趨勢
     sentiment_trend = all_df.groupby([pd.Grouper(key='Date', freq='D'), 'Sentiment']).size().unstack(fill_value=0)
     sentiment_trend = sentiment_trend.div(sentiment_trend.sum(axis=1), axis=0).fillna(0)
     plt.ylabel("比例")
     plt.legend()
     results["img_social_sentiment"] = fig_to_base64()
     # 4. 平台表現
     platforms = ["X", "Facebook", "Instagram", "PTT", "Line"]
     platform_counts = pd.Series({p: random.randint(10, 100) for p in platforms})
     plt.xlabel("平台")
     plt.ylabel("貼文數量")
     results["img_platform_performance"] = fig_to_base64()
     # 5. 候選人聲量趨勢
     candidate_trend = all_df.groupby([pd.Grouper(key='Date', freq='D'), 'Candidate']).size().unstack(fill_value=0)
     fig = plt.figure(figsize=(8, 5))
     plt.ylabel("貼文數量")
     plt.legend()
     results["img_candidate_volume"] = fig_to_base64()
     # 6. 候選人情緒分析
     fig = plt.figure(figsize=(8, 5))
     summary[['Positive Ratio', 'Negative Ratio', 'Neutral Ratio']].plot(
     plt.ylabel("比例")
     plt.xlabel("候選人")
     results["img_candidate_sentiment"] = fig_to_base64()
     # 7. 知識圖譜
     fig, ax = plt.subplots(figsize=(8, 6))
     G = nx.Graph()
         G.add_edge(candidates[i], candidates[i + 1])
     nx.draw(G, nx.spring_layout(G), with_labels=True, node_color='lightgreen', font_size=12, ax=ax)
     results["img_knowledge_graph"] = fig_to_base64()
     return results
 # ===== 主分析函數 =====
 def run_analysis():
     try:
+        # Embed the template as a string to avoid file dependency and ensure syntax is correct
+        html_template = """
+<!DOCTYPE html>
+<html lang="zh-TW">
+<head>
+    <meta charset="UTF-8">
+    <meta name="viewport" content="width=device-width, initial-scale=1.0">
+    <title>2026 高雄市長選舉輿情分析報告</title>
+    <script src="https://cdn.tailwindcss.com"></script>
+</head>
+<body class="bg-gray-100 font-sans leading-normal tracking-normal">
+    <div class="container mx-auto p-4">
+        <h1 class="text-3xl font-bold mb-4">2026 高雄市長選舉輿情分析報告</h1>
+        <p class="mb-4">報告日期: {{ report_date }}</p>
+        <h2 class="text-2xl font-bold mb-2">參與度摘要</h2>
+        {{ engagement_table | safe }}
+        <h2 class="text-2xl font-bold mb-2">新聞摘要</h2>
+        <ul class="list-disc pl-5 mb-4">
+            {% for key, value in news_summary %}
+            <li><strong>{{ key }}</strong>: {{ value }}</li>
+            {% endfor %}
+        </ul>
+        <h2 class="text-2xl font-bold mb-2">新聞詳情</h2>
+        {{ news_table | safe }}
+        <h2 class="text-2xl font-bold mb-2">今日情緒比例</h2>
+        <img src="data:image/png;base64,{{ img_b64_today }}" alt="今日情緒比例" class="mb-4">
+        <h2 class="text-2xl font-bold mb-2">歷史情緒趨勢</h2>
+        <img src="data:image/png;base64,{{ img_b64_trend }}" alt="歷史情緒趨勢" class="mb-4">
+        <h2 class="text-2xl font-bold mb-2">社群情緒趨勢</h2>
+        <img src="data:image/png;base64,{{ img_social_sentiment }}" alt="社群情緒趨勢" class="mb-4">
+        <h2 class="text-2xl font-bold mb-2">平台表現</h2>
+        <img src="data:image/png;base64,{{ img_platform_performance }}" alt="平台表現" class="mb-4">
+        <h2 class="text-2xl font-bold mb-2">候選人聲量趨勢</h2>
+        <img src="data:image/png;base64,{{ img_candidate_volume }}" alt="候選人聲量趨勢" class="mb-4">
+        <h2 class="text-2xl font-bold mb-2">候選人情緒分析</h2>
+        <img src="data:image/png;base64,{{ img_candidate_sentiment }}" alt="候選人情緒分析" class="mb-4">
+        <h2 class="text-2xl font-bold mb-2">知識圖譜</h2>
+        <img src="data:image/png;base64,{{ img_knowledge_graph }}" alt="知識圖譜" class="mb-4">
+    </div>
+</body>
+</html>
+        """
         # --- 貼文 & 情緒分析 ---
         all_df = pd.concat([fetch_tweets(c) for c in candidates], ignore_index=True)
         all_df['Sentiment'] = all_df['Content'].apply(lambda x: sentiment(x)['label'])
         all_df['Confidence'] = all_df['Content'].apply(lambda x: sentiment(x)['score'])
         # --- 統計 ---
         summary = all_df.groupby(['Candidate', 'Sentiment']).size().unstack(fill_value=0)
         summary['Total Posts'] = summary.sum(axis=1)
         summary['Positive Ratio'] = summary.get('positive', 0) / summary['Total Posts'].replace(0, 1)
         summary['Negative Ratio'] = summary.get('negative', 0) / summary['Total Posts'].replace(0, 1)
         summary['Neutral Ratio'] = summary.get('neutral', 0) / summary['Total Posts'].replace(0, 1)
         # --- 歷史資料 ---
         today_str = datetime.now().strftime('%Y-%m-%d')
         hist_row = summary[['Positive Ratio', 'Negative Ratio', 'Neutral Ratio']].copy()
             ignore_index=True
         ) if os.path.exists(history_file) else hist_row
         df_hist.to_csv(history_file, index=False)
         # --- 圖表 ---
         charts = generate_charts(all_df, summary, df_hist)
         # --- 新聞 ---
         if os.path.exists(news_file):
             df_news = pd.read_csv(news_file)
                 "爭議": "林岱樺涉助理費爭議。"
             }
             news_table = "<p>無新聞資料</p>"
         # Convert news_summary to list of tuples to support iteration in template
         news_summary = list(news_summary.items())
         # --- 參與表 ---
         engagement_table = f"""
         <table class="min-w-full bg-white border border-gray-200">
         </table>
         """
         # --- HTML 渲染 ---
         template = Template(html_template)
         html_content = template.render(
             report_date=datetime.now().strftime('%Y-%m-%d %H:%M'),
             news_table=news_table if news_table else "<p>未提供新聞資料</p>",
             **charts
         )
         return html_content
     except Exception:
         return f"<pre>❌ 分析失敗:\n{traceback.format_exc()}</pre>"
 # ===== Gradio 前端 =====
 if __name__ == "__main__":
     iface = gr.Interface(