Spaces:

Dusit-P
/

Thai-Sentiment-GUI

Sleeping

App Files Files Community

Dusit-P committed on Oct 5, 2025

Commit

f1f96f6

verified ·

1 Parent(s): d65ba09

Update app.py

Browse files

Files changed (1) hide show

app.py +188 -414

app.py CHANGED Viewed

@@ -1,56 +1,26 @@
-# app.py — Thai Sentiment (WangchanBERTa Variants) - ปรับปรุง UI และเพิ่ม Shop Analysis
 import os, json, importlib.util, traceback, re, math, tempfile, datetime
 import gradio as gr
 import torch, pandas as pd
 import torch.nn.functional as F
 import plotly.graph_objects as go
-from plotly.subplots import make_subplots
 from huggingface_hub import hf_hub_download
 from safetensors.torch import load_file
 from transformers import AutoTokenizer
 # ================= Settings =================
 # Hub repository and access token; both can be overridden via environment variables.
 REPO_ID = os.environ.get("REPO_ID", "Dusit-P/thai-sentiment")
 HF_TOKEN = os.environ.get("HF_TOKEN")
 # Only the best-performing model variants are offered.
 # Hidden variants that can be re-enabled: "WCB_CNN_BiLSTM", "WCB_4Layer_BiLSTM".
 AVAILABLE_CHOICES = ["WCB", "WCB_BiLSTM"]
 # Default model comes from the environment; an unknown name falls back to the
 # best-performing variant.
 DEFAULT_MODEL = os.environ.get("DEFAULT_MODEL", "WCB")
 if DEFAULT_MODEL not in AVAILABLE_CHOICES:
     DEFAULT_MODEL = "WCB_BiLSTM"
 # Chart palette and plotly template.
 NEG_COLOR, POS_COLOR, NEUTRAL_COLOR = "#F87171", "#34D399", "#94A3B8"
 TEMPLATE = "plotly_white"
 # Module-level cache shared by the loader functions.
 CACHE = dict()
-# ================= Date Presets (แก้ไขให้ทำงานถูกต้อง) =================
# Maps each UI preset label to a look-back window in days (None = no filtering).
DATE_PRESETS = {
    "ทั้งหมด": None,
    "7 วันล่าสุด": 7,
    "15 วันล่าสุด": 15,
    "30 วันล่าสุด": 30,
    "90 วันล่าสุด": 90,
}


def apply_date_preset(df, date_col, preset_key):
    """Keep only the rows whose date falls inside the selected preset window.

    Args:
        df: DataFrame holding a datetime column named ``date_col``.
        date_col: Name of the datetime column to filter on.
        preset_key: One of the ``DATE_PRESETS`` labels.

    Returns:
        ``df`` itself when the preset is unknown or means "everything";
        otherwise the subset of rows dated within the last N days.
    """
    # Unknown keys and the "all" preset both resolve to None: nothing to filter.
    days = DATE_PRESETS.get(preset_key)
    if days is None:
        return df
    dates = df[date_col]
    # Build "now" in the column's own timezone: comparing a tz-aware column with
    # a naive timestamp raises TypeError.
    tz = dates.dt.tz if pd.api.types.is_datetime64_any_dtype(dates) else None
    cutoff = pd.Timestamp.now(tz=tz) - pd.Timedelta(days=days)
    return df[dates >= cutoff]
 # ================= Loader =================
 def _import_models():
     if "models_module" in CACHE:
@@ -101,8 +71,8 @@ def _is_substantive_text(s, min_chars=2):
 def _format_pct(x): return f"{x*100:.2f}%"
 def _to_datetime_safe(s): return pd.to_datetime(s, errors="coerce", infer_datetime_format=True, utc=False)
-LIKELY_TEXT_COLS = ["text","review","message","comment","content","sentence","body","ข้อความ","รีวิว"]
-LIKELY_DATE_COLS = ["date","created_at","time","timestamp","datetime","วันที่","วันเวลา","เวลา"]
 LIKELY_SHOP_COLS = ["shop","store","branch","ร้าน","สาขา","ชื่อร้าน"]
 def detect_columns(df):
@@ -136,19 +106,40 @@ def detect_columns(df):
         if c.lower() in LIKELY_SHOP_COLS:
             shop_candidates.append(c)
             continue
-        # ตรวจว่ามีค่าซ้ำพอสมควร (เหมือนเป็น categorical)
         if df[c].dtype == object:
             unique_ratio = df[c].nunique() / len(df)
-            if 0.01 <= unique_ratio <= 0.5:  # 1-50% ของข้อมูลเป็นค่าซ้ำ
                 shop_candidates.append(c)
     shop_candidates = list(dict.fromkeys(shop_candidates))
     shop_col = shop_candidates[0] if len(shop_candidates) > 0 else None
     return text_col, date_candidates, date_col, shop_candidates, shop_col
 # ================= Charts =================
-def make_summary_chart(df, chart_type="pie"):
-    """สร้างกราฟสรุปแบบเดียว (ไม่ซ้ำซ้อน)"""
     total = len(df)
     neg_count = len(df[df["label"]=="negative"])
     pos_count = len(df[df["label"]=="positive"])
@@ -156,101 +147,39 @@ def make_summary_chart(df, chart_type="pie"):
     neg_avg = pd.to_numeric(df["negative(%)"].str.rstrip("%"), errors="coerce").mean()
     pos_avg = pd.to_numeric(df["positive(%)"].str.rstrip("%"), errors="coerce").mean()
-    info = (f"**📊 สรุปผลการวิเคราะห์**\n\n"
-            f"- 📝 ทั้งหมด: **{total:,}** รีวิว\n"
-            f"- 😞 เชิงลบ: **{neg_count:,}** ({neg_count/total*100:.1f}%)\n"
-            f"- 😊 เชิงบวก: **{pos_count:,}** ({pos_count/total*100:.1f}%)\n"
-            f"- 📈 ค่าเฉลี่ยความมั่นใจ:\n"
-            f"  - เชิงลบ: {neg_avg:.2f}%\n"
-            f"  - เชิงบวก: {pos_avg:.2f}%")
-    if chart_type == "pie":
-        fig = go.Figure(go.Pie(
-            labels=["😞 เชิงลบ","😊 เชิงบวก"],
-            values=[neg_count, pos_count],
-            hole=0.4,
-            marker=dict(colors=[NEG_COLOR, POS_COLOR]),
-            textinfo='label+percent',
-            textfont_size=14
-        ))
-        fig.update_layout(
-            title="สัดส่วนรีวิวเชิงบวก vs เชิงลบ",
-            template=TEMPLATE,
-            height=400
-        )
-    else:  # bar
-        fig = go.Figure()
-        fig.add_bar(
-            x=["เชิงลบ","เชิงบวก"],
-            y=[neg_count, pos_count],
-            marker_color=[NEG_COLOR, POS_COLOR],
-            text=[neg_count, pos_count],
-            textposition='auto'
-        )
-        fig.update_layout(
-            title="จำนวนรีวิวแยกตามความรู้สึก",
-            template=TEMPLATE,
-            yaxis_title="จำนวน (รีวิว)",
-            height=400
-        )
-    return fig, info
-def _resample_counts(df, date_col, freq="auto"):
-    """รวมข้อมูลตามช่วงเวลา - auto-detect frequency"""
-    if freq == "auto":
-        # Auto-detect ตามช่วงเวลาของข้อมูล
-        date_range = (df[date_col].max() - df[date_col].min()).days
-        if date_range <= 30:
-            freq = "D"  # รายวัน
-        elif date_range <= 90:
-            freq = "W"  # รายสัปดาห์
-        else:
-            freq = "M"  # รายเดือน
-    g = df.groupby([pd.Grouper(key=date_col, freq=freq),"label"]).size().unstack(fill_value=0)
-    for c in ["negative","positive"]:
-        if c not in g.columns: g[c]=0
-    return g[["negative","positive"]].sort_index(), freq
def make_time_chart(df, date_col, freq="auto"):
    """Build a line chart of negative and positive review counts over time.

    Args:
        df: DataFrame with a datetime column ``date_col`` and a ``label`` column.
        date_col: Name of the datetime column.
        freq: Frequency forwarded to ``_resample_counts`` (``"auto"`` lets it pick).

    Returns:
        A plotly ``Figure`` with one line per sentiment label.
    """
    ts, actual_freq = _resample_counts(df, date_col, freq)
    fig = go.Figure()
    series = (
        ("negative", "😞 เชิงลบ", NEG_COLOR),
        ("positive", "😊 เชิงบวก", POS_COLOR),
    )
    for column, name, color in series:
        fig.add_scatter(
            x=ts.index,
            y=ts[column],
            mode="lines+markers",
            name=name,
            line=dict(color=color, width=2),
            marker=dict(size=6),
        )
    freq_map = {"D": "รายวัน", "W": "รายสัปดาห์", "M": "รายเดือน"}
    # A caller may pass any frequency the grouper accepts; show the raw alias in
    # the title instead of failing with KeyError when no display name is mapped.
    freq_label = freq_map.get(actual_freq, actual_freq)
    fig.update_layout(
        title=f"📈 แนวโน้มรีวิวตามเวลา ({freq_label})",
        template=TEMPLATE,
        xaxis_title="วันที่",
        yaxis_title="จำนวนรีวิว",
        hovermode='x unified',
        height=450,
    )
    return fig
-def make_shop_analysis(df, shop_col, date_col=None, freq="auto"):
-    """วิเคราะห์แยกตามร้าน/สาขา"""
-    # 1. สรุปภาพรวมแต่ละร้าน
-    shop_summary = []
     for shop in df[shop_col].unique():
         if pd.isna(shop):
             continue
@@ -258,126 +187,84 @@ def make_shop_analysis(df, shop_col, date_col=None, freq="auto"):
         neg = len(shop_df[shop_df["label"]=="negative"])
         pos = len(shop_df[shop_df["label"]=="positive"])
         total = len(shop_df)
-        pos_ratio = pos / total * 100 if total > 0 else 0
-        shop_summary.append({
-            "ร้าน/สาขา": shop,
-            "รีวิวทั้งหมด": total,
-            "😞 เชิงลบ": neg,
-            "😊 เชิงบวก": pos,
-            "% เชิงบวก": f"{pos_ratio:.1f}%"
         })
-    summary_df = pd.DataFrame(shop_summary).sort_values("รีวิวทั้งหมด", ascending=False)
-    # 2. กราฟเปรียบเทียบร้าน
-    fig_compare = go.Figure()
-    shops = summary_df["ร้าน/สาขา"].tolist()
-    negs = summary_df["😞 เชิงลบ"].tolist()
-    poss = summary_df["😊 เชิงบวก"].tolist()
-    fig_compare.add_bar(name="😞 เชิงลบ", x=shops, y=negs, marker_color=NEG_COLOR)
-    fig_compare.add_bar(name="😊 เชิงบวก", x=shops, y=poss, marker_color=POS_COLOR)
-    fig_compare.update_layout(
-        title="🏪 เปรียบเทียบรีวิวแต่ละร้าน/สาขา",
         barmode='stack',
         template=TEMPLATE,
         xaxis_title="ร้าน/สาขา",
         yaxis_title="จำนวนรีวิว",
-        height=450
     )
-    # 3. Stacked bar แสดง Shop ตามช่วงเวลา (ถ้ามี date_col)
-    fig_time_shop = None
-    if date_col and date_col in df.columns:
-        # Auto-detect frequency
-        if freq == "auto":
-            date_range = (df[date_col].max() - df[date_col].min()).days
-            if date_range <= 30:
-                freq = "D"
-            elif date_range <= 90:
-                freq = "W"
-            else:
-                freq = "M"
-        fig_time_shop = go.Figure()
-        # เตรียมข้อมูลแยกตามร้าน
-        for shop in shops:
-            shop_df = df[df[shop_col] == shop]
-            # รวมตามเวลา
-            ts = shop_df.groupby(pd.Grouper(key=date_col, freq=freq)).size()
-            fig_time_shop.add_bar(
-                x=ts.index,
-                y=ts.values,
-                name=shop
-            )
-        freq_map = {"D": "รายวัน", "W": "รายสัปดาห์", "M": "รายเดือน"}
-        fig_time_shop.update_layout(
-            title=f"📊 จำนวนรีวิวแต่ละร้านตามเวลา ({freq_map[freq]})",
-            barmode='stack',
-            template=TEMPLATE,
-            xaxis_title="วันที่",
-            yaxis_title="จำนวนรีวิว",
-            hovermode='x unified',
-            height=450
-        )
-    return summary_df, fig_compare, fig_time_shop
-# ================= Core Predict =================
def _predict_batch(texts, model_name, batch_size=32):
    """Classify texts in mini-batches and return one result row per text.

    Args:
        texts: Sequence of review strings to score.
        model_name: Model identifier handed to ``load_model``.
        batch_size: Number of texts tokenized and scored per forward pass.

    Returns:
        A list of dicts with the keys ``review``, ``negative(%)``,
        ``positive(%)`` and ``label``. Column 0 of the softmax output is read as
        the negative probability and column 1 as the positive one; a tie is
        labelled ``"positive"``.
    """
    model, tok, cfg = load_model(model_name)
    rows = []
    for start in range(0, len(texts), batch_size):
        batch = texts[start:start + batch_size]
        encoded = tok(
            batch,
            padding=True,
            truncation=True,
            max_length=cfg.get("max_length", 128),
            return_tensors="pt",
        )
        # Inference only: no gradient tracking needed.
        with torch.no_grad():
            logits = model(encoded["input_ids"], encoded["attention_mask"])
            batch_probs = F.softmax(logits, dim=1).cpu().numpy()
        for text, prob in zip(batch, batch_probs):
            p_neg = float(prob[0])
            p_pos = float(prob[1])
            rows.append({
                "review": text,
                "negative(%)": _format_pct(p_neg),
                "positive(%)": _format_pct(p_pos),
                "label": "positive" if p_pos >= p_neg else "negative",
            })
    return rows
-# ================= Tab 1: วิเคราะห์หลายรีวิว =================
def predict_many(text_block, model_choice, chart_type):
    """Analyse a multi-line text box where every line is one review.

    Args:
        text_block: Raw textbox content (may be ``None`` or empty).
        model_choice: Model name forwarded to ``_predict_batch``.
        chart_type: Chart style forwarded to ``make_summary_chart``.

    Returns:
        A ``(dataframe, figure, markdown)`` tuple. On empty input or on any
        exception the dataframe and figure are empty and the markdown holds the
        message (including the traceback for exceptions).
    """
    try:
        lines = (text_block or "").splitlines()
        normalized = list(map(_norm_text, lines))
        usable = [text for text in normalized if _is_substantive_text(text)]
        if usable:
            table = pd.DataFrame(_predict_batch(usable, model_choice))
            chart, summary = make_summary_chart(table, chart_type)
            return table, chart, summary
        return pd.DataFrame(), go.Figure(), "❌ ไม่พบข้อความที่สามารถวิเคราะห์ได้\n\nกรุณาป้อนข้อความที่มีความยาวอย่างน้อย 2 ตัวอักษร"
    except Exception:
        # UI boundary: report the failure in the markdown panel instead of raising.
        return pd.DataFrame(), go.Figure(), f"❌ เกิดข้อผิดพลาด:\n\n{traceback.format_exc()}"
 # ================= Tab 2: อัปโหลด CSV =================
 def on_file_change(file_obj):
-    """เมื่ออัปโหลดไฟล์ - ตรวจหา columns อัตโนมัติ"""
     if file_obj is None:
-        return (gr.update(choices=[],value=None),
-                gr.update(choices=[],value=None),
-                gr.update(choices=[],value=None),
                 gr.update(visible=False),
                 "⚠️ กรุณาอัปโหลดไฟล์ CSV")
@@ -385,44 +272,40 @@ def on_file_change(file_obj):
         df = pd.read_csv(file_obj.name)
         text_col, date_candidates, date_col, shop_candidates, shop_col = detect_columns(df)
-        has_date = date_col is not None
         has_shop = shop_col is not None
-        note = f"✅ **ตรวจพบคอลัมน์:**\n"
         note += f"- 📝 ข้อความ: **{text_col}**\n"
-        if has_date:
             note += f"- 📅 วันที่: **{date_col}**\n"
-        else:
-            note += f"- 📅 วันที่: _ไม่พบ_\n"
         if has_shop:
-            note += f"- 🏪 ร้าน/สาขา: **{shop_col}** (พบ {df[shop_col].nunique()} ร้าน)\n"
         else:
             note += f"- 🏪 ร้าน/สาขา: _ไม่พบ_\n"
-        note += f"\n_หากไม่ถูกต้อง สามารถเลือกใหม่ได้จากเมนูด้านบน_"
         return (gr.update(choices=list(df.columns), value=text_col),
                 gr.update(choices=date_candidates if date_candidates else ["ไม่มี"], value=date_col),
                 gr.update(choices=shop_candidates if shop_candidates else ["ไม่มี"], value=shop_col),
-                gr.update(visible=has_date),
                 note)
     except Exception as e:
-        return (gr.update(choices=[],value=None),
-                gr.update(choices=[],value=None),
-                gr.update(choices=[],value=None),
                 gr.update(visible=False),
-                f"❌ ไม่สามารถอ่านไฟล์ได้:\n{str(e)}")
-def predict_csv(file_obj, model_choice, text_col, date_col, shop_col, date_preset, chart_type):
-    """วิเคราะห์รีวิวจากไฟล์ CSV"""
     if file_obj is None:
-        return (pd.DataFrame(), go.Figure(), go.Figure(),
-                gr.update(visible=False), gr.update(visible=False),
-                pd.DataFrame(), gr.update(visible=False),
-                "❌ กรุณาอัปโหลดไฟล์ CSV", None)
     try:
         df_raw = pd.read_csv(file_obj.name)
@@ -433,70 +316,57 @@ def predict_csv(file_obj, model_choice, text_col, date_col, shop_col, date_prese
         if text_col not in cols:
             text_col, _, _, _, _ = detect_columns(df_raw)
-        # ดึงข้อความและทำนาย
         texts = [_norm_text(v) for v in df_raw[text_col].tolist()]
         texts_clean = [t for t in texts if _is_substantive_text(t)]
         skipped = total_rows - len(texts_clean)
         if not texts_clean:
-            return (pd.DataFrame(), go.Figure(), go.Figure(),
-                    gr.update(visible=False), gr.update(visible=False),
-                    pd.DataFrame(), gr.update(visible=False),
-                    "❌ ไม่พบข้อความที่สามารถวิเคราะห์ได้ในไฟล์", None)
         results = _predict_batch(texts_clean, model_choice)
         df_out = pd.DataFrame(results)
-        # กราฟสรุปหลัก
-        fig_main, info = make_summary_chart(df_out, chart_type)
-        # เพิ่มข้อมูลแถวที่ข้าม
         if skipped > 0:
-            info += f"\n\n⚠️ **ข้ามแถวที่ไม่มีข้อความ:** {skipped} แถว (ใช้ {len(texts_clean)}/{total_rows} แถว)"
-        # กราฟตามเวลา
-        fig_time = go.Figure()
-        show_time = False
-        df_time_filtered = None
-        if date_col and date_col in cols and date_col != "ไม่มี":
-            dts = _to_datetime_safe(df_raw[date_col])
-            if dts.notna().any():
-                df_time = df_out.copy()
-                df_time["__dt__"] = dts
-                df_time = df_time.dropna(subset=["__dt__"])
-                # ใช้ date preset - แก้ bug ตรงนี้!
-                df_time_filtered = apply_date_preset(df_time, "__dt__", date_preset)
-                if len(df_time_filtered) > 0:
-                    fig_time = make_time_chart(df_time_filtered, "__dt__")
-                    show_time = True
-                    # แสดงข้อมูลช่วงเวลาที่กรอง
-                    if date_preset != "ทั้งหมด":
-                        info += f"\n\n📅 **ช่วงเวลาที่แสดง:** {date_preset} ({len(df_time_filtered)} รีวิว)"
-        # วิเคราะห์ตาม Shop
-        shop_summary_df = pd.DataFrame()
         fig_shop = go.Figure()
-        fig_shop_time = None
         show_shop = False
         if shop_col and shop_col in cols and shop_col != "ไม่มี":
-            df_with_shop = df_out.copy()
-            df_with_shop[shop_col] = df_raw[shop_col]
-            # ถ้ามี date ใช้ข้อมูลที่ filter แล้ว
-            if df_time_filtered is not None and len(df_time_filtered) > 0:
-                df_with_shop["__dt__"] = df_time_filtered["__dt__"]
-                df_with_shop = df_with_shop.dropna(subset=["__dt__"])
-                shop_summary_df, fig_shop, fig_shop_time = make_shop_analysis(
-                    df_with_shop, shop_col, "__dt__"
-                )
             else:
-                shop_summary_df, fig_shop, _ = make_shop_analysis(df_with_shop, shop_col)
             show_shop = True
@@ -505,18 +375,15 @@ def predict_csv(file_obj, model_choice, text_col, date_col, shop_col, date_prese
         os.close(fd)
         df_out.to_csv(path, index=False, encoding="utf-8-sig")
-        return (df_out, fig_main, fig_time,
-                gr.update(visible=show_time, value=fig_time),
                 gr.update(visible=show_shop, value=fig_shop),
-                shop_summary_df,
-                gr.update(visible=show_shop and fig_shop_time is not None, value=fig_shop_time),
                 info, path)
     except Exception as e:
-        return (pd.DataFrame(), go.Figure(), go.Figure(),
-                gr.update(visible=False), gr.update(visible=False),
-                pd.DataFrame(), gr.update(visible=False),
-                f"❌ เกิดข้อผิดพลาด:\n\n{traceback.format_exc()}", None)
 # ================= Gradio UI =================
 with gr.Blocks(title="Thai Sentiment Analysis", theme=gr.themes.Soft()) as demo:
@@ -532,35 +399,19 @@ with gr.Blocks(title="Thai Sentiment Analysis", theme=gr.themes.Soft()) as demo:
         info="WCB = เร็ว | WCB_BiLSTM = แม่นยำสูงสุด (แนะนำ)"
     )
-    # =================== Tab 1: วิเคราะห์หลายรีวิว ===================
-    with gr.Tab("📝 วิเคราะห์หลายรีวิว"):
-        gr.Markdown("""
-        **วิธีใช้:** ป้อนรีวิวหลายรายการ (แต่ละบรรทัด = 1 รีวิว) แล้วกด "เริ่มวิเคราะห์"
-        **ตัวอย่าง:**
-        ```
-        อาหารอร่อยมาก บริการดีค่ะ
-        ของแพงไป รสชาติก็ธรรมดา
-        บรรยากาศดี แต่รอนาน
-        ```
-        """)
         text_input = gr.Textbox(
-            lines=10,
-            label="📄 ข้อความรีวิว (บรรทัดละ 1 รีวิว)",
-            placeholder="ป้อนรีวิวที่ต้องการวิเคราะห์...\nแต่ละบรรทัด = 1 รีวิว"
         )
-        with gr.Row():
-            chart_type_1 = gr.Radio(
-                choices=["pie", "bar"],
-                value="pie",
-                label="📊 รูปแบบกราฟ",
-                info="Pie = วงกลม, Bar = แท่ง"
-            )
-            predict_btn_1 = gr.Button("🚀 เริ่มวิเคราะห์", variant="primary", size="lg")
-        result_df_1 = gr.Dataframe(label="📋 ผลการวิเคราะห์ทั้งหมด")
         with gr.Row():
             with gr.Column(scale=1):
@@ -570,91 +421,32 @@ with gr.Blocks(title="Thai Sentiment Analysis", theme=gr.themes.Soft()) as demo:
         predict_btn_1.click(
             predict_many,
-            [text_input, model_radio, chart_type_1],
             [result_df_1, result_chart_1, result_info_1]
         )
-    # =================== Tab 2: อัปโหลด CSV ===================
     with gr.Tab("📤 อัปโหลด CSV"):
-        gr.Markdown("""
-        **วิธีใช้:** อัปโหลดไฟล์ CSV ที่มีคอลัมน์รีวิว (และอาจมีวันที่/ร้านด้วย)
-        **คอลัมน์ที่ต้องมี:**
-        - ✅ คอลัมน์ข้อความรีวิว (เช่น "text", "review", "รีวิว")
-        - ⭐ คอลัมน์วันที่ (optional - สำหรับวิเคราะห์แนวโน้ม)
-        - ⭐ คอลัมน์ร้าน/สาขา (optional - สำหรับเปรียบเทียบร้าน)
-        """)
-        with gr.Row():
-            file_input = gr.File(
-                file_types=[".csv"],
-                label="📁 อัปโหลดไฟล์ CSV"
-            )
         detect_note = gr.Markdown("⬆️ อัปโหลดไฟล์เพื่อเริ่มต้น")
         with gr.Row():
-            text_col_dd = gr.Dropdown(
-                label="📝 คอลัมน์ข้อความรีวิว",
-                info="เลือกคอลัมน์ที่มีเนื้อหารีวิว"
-            )
-            date_col_dd = gr.Dropdown(
-                label="📅 คอลัมน์วันที่ (ถ้าไม่มีเว้นว่าง)",
-                info="สำหรับวิเคราะห์แนวโน้มตามเวลา"
-            )
-            shop_col_dd = gr.Dropdown(
-                label="🏪 คอลัมน์ร้าน/สาขา (ถ้าไม่มีเว้นว่าง)",
-                info="สำหรับเปรียบเทียบแต่ละร้าน"
-            )
-        gr.Markdown("### ⚙️ ตั้งค่าการวิเคราะห์")
-        with gr.Row():
-            date_preset = gr.Radio(
-                choices=list(DATE_PRESETS.keys()),
-                value="ทั้งหมด",
-                label="📆 ช่วงเวลาที่ต้องการวิเคราะห์",
-                info="เลือกช่วงเวลาที่ต้องการดูข้อมูล",
-                visible=False
-            )
-            chart_type_2 = gr.Radio(
-                choices=[("วงกลม", "pie"), ("แท่ง", "bar")],
-                value="pie",
-                label="📊 รูปแบบกราฟสรุป"
-            )(DATE_PRESETS.keys()),
-                value="ทั้งหมด",
-                label="📆 ช่วงเวลาที่ต้องการวิเคราะห์",
-                visible=False
-            )
-            freq = gr.Radio(
-                choices=[("รายวัน", "D"), ("รายสัปดาห์", "W"), ("รายเดือน", "M")],
-                value="D",
-                label="📊 ความละเอียดของกราฟ",
-                visible=False
-            )
-        with gr.Row():
-            use_smooth = gr.Checkbox(
-                value=True,
-                label="✨ ปรับกราฟให้เรียบ (Moving Average)",
-                info="ช่วยให้เห็นแนวโน้มชัดเจนขึ้น",
-                visible=False
-            )
-            chart_type_2 = gr.Radio(
-                choices=[("วงกลม", "pie"), ("แท่ง", "bar")],
-                value="pie",
-                label="📊 รูปแบบกราฟสรุป"
-            )
-        shop_analysis_row = gr.Row(visible=False)
-        shop_trend_row = gr.Row(visible=False)
-        predict_btn_2 = gr.Button("🚀 เริ่มวิเคราะห์ CSV", variant="primary", size="lg")
-        gr.Markdown("### 📊 ผลการวิเคราะห์")
         result_df_2 = gr.Dataframe(label="📋 ผลการวิเคราะห์ทั้งหมด")
@@ -664,49 +456,31 @@ with gr.Blocks(title="Thai Sentiment Analysis", theme=gr.themes.Soft()) as demo:
             with gr.Column(scale=1):
                 result_info_2 = gr.Markdown()
-        result_time = gr.Plot(label="📈 กราฟแนวโน้มตามเวลา", visible=False)
-        gr.Markdown("### 🏪 วิเคราะห์แยกตามร้าน/สาขา")
         shop_summary = gr.Dataframe(label="📊 สรุปแต่ละร้าน", visible=False)
-        result_shop = gr.Plot(label="🏪 เปรียบเทียบรีวิวแต่ละร้าน", visible=False)
-        result_shop_trend = gr.Plot(label="📊 รีวิวแต่ละร้านตามช่วงเวลา (Stacked Bar)", visible=False)
-        download_file = gr.File(label="💾 ดาวน์โหลดผลลัพธ์ (CSV)")
-        # Event handlers
         file_input.change(
             on_file_change,
             [file_input],
-            [text_col_dd, date_col_dd, shop_col_dd,
-             date_preset, detect_note]
         )
         predict_btn_2.click(
             predict_csv,
-            [file_input, model_radio, text_col_dd, date_col_dd, shop_col_dd,
-             date_preset, chart_type_2],
-            [result_df_2, result_chart_2, result_time,
-             result_time, result_shop,
-             shop_summary, result_shop_trend,
-             result_info_2, download_file]
         )
     gr.Markdown("""
     ---
     ### 💡 เกี่ยวกับโมเดล
-    **WangchanBERTa Variants** - โมเดล BERT ภาษาไทยที่ได้รับการฝึกสำหรับงานวิเคราะห์ความรู้สึก
-    - **WCB**: รุ่นพื้นฐาน - เร็ว เหมาะกับงานทั่วไป
-    - **WCB_BiLSTM**: เพิ่ม BiLSTM layer - **แม่นยำสูงสุด (แนะนำ)** ⭐
-    <!-- โมเดลอื่นๆ ที่ซ่อนไว้:
-    - **WCB_CNN_BiLSTM**: ใช้ CNN + BiLSTM เพิ่มประสิทธิภาพ
-    - **WCB_4Layer_BiLSTM**: BiLSTM 4 ชั้น (ช้ากว่า)
-    -->
-    📌 **หมายเหตุ:** โมเดลวิเคราะห์เฉพาะ **เชิงบวก/เชิงลบ** เท่านั้น (ไม่มี neutral)
     """)
 if __name__ == "__main__":

+# app.py — Thai Sentiment Analysis (เรียบง่าย + Shop Analysis)
 import os, json, importlib.util, traceback, re, math, tempfile, datetime
 import gradio as gr
 import torch, pandas as pd
 import torch.nn.functional as F
 import plotly.graph_objects as go
 from huggingface_hub import hf_hub_download
 from safetensors.torch import load_file
 from transformers import AutoTokenizer
 # ================= Settings =================
 # Hub repository and access token; both can be overridden via environment variables.
 REPO_ID       = os.getenv("REPO_ID", "Dusit-P/thai-sentiment")
 HF_TOKEN      = os.getenv("HF_TOKEN", None)
 # Only the best-performing model variants are offered.
 AVAILABLE_CHOICES = ["WCB", "WCB_BiLSTM"]
 # DEFAULT_MODEL comes from the environment, so it can name a model that is not
 # offered; fall back to the built-in default in that case.
 DEFAULT_MODEL = os.getenv("DEFAULT_MODEL", "WCB_BiLSTM")
 if DEFAULT_MODEL not in AVAILABLE_CHOICES:
     DEFAULT_MODEL = "WCB_BiLSTM"
 # Chart palette and plotly template.
 NEG_COLOR = "#F87171"
 POS_COLOR = "#34D399"
 TEMPLATE  = "plotly_white"
 # Module-level cache shared by the loader functions.
 CACHE = {}
 # ================= Loader =================
 def _import_models():
     if "models_module" in CACHE:
 def _format_pct(x): return f"{x*100:.2f}%"
 def _to_datetime_safe(s): return pd.to_datetime(s, errors="coerce", infer_datetime_format=True, utc=False)
+LIKELY_TEXT_COLS = ["text","review","message","comment","content","ข้อความ","รีวิว"]
+LIKELY_DATE_COLS = ["date","created_at","time","timestamp","datetime","วันที่","เวลา"]
 LIKELY_SHOP_COLS = ["shop","store","branch","ร้าน","สาขา","ชื่อร้าน"]
 def detect_columns(df):
         if c.lower() in LIKELY_SHOP_COLS:
             shop_candidates.append(c)
             continue
         if df[c].dtype == object:
             unique_ratio = df[c].nunique() / len(df)
+            if 0.01 <= unique_ratio <= 0.5:
                 shop_candidates.append(c)
     shop_candidates = list(dict.fromkeys(shop_candidates))
     shop_col = shop_candidates[0] if len(shop_candidates) > 0 else None
     return text_col, date_candidates, date_col, shop_candidates, shop_col
+# ================= Core Predict =================
def _predict_batch(texts, model_name, batch_size=32):
    """Classify texts in mini-batches and return one result row per text.

    Args:
        texts: Sequence of review strings to score.
        model_name: Model identifier handed to ``load_model``.
        batch_size: Number of texts tokenized and scored per forward pass.

    Returns:
        A list of dicts with the keys ``review``, ``negative(%)``,
        ``positive(%)`` and ``label``. Column 0 of the softmax output is read as
        the negative probability and column 1 as the positive one; a tie is
        labelled ``"positive"``.
    """
    model, tok, cfg = load_model(model_name)
    rows = []
    for start in range(0, len(texts), batch_size):
        batch = texts[start:start + batch_size]
        encoded = tok(
            batch,
            padding=True,
            truncation=True,
            max_length=cfg.get("max_length", 128),
            return_tensors="pt",
        )
        # Inference only: no gradient tracking needed.
        with torch.no_grad():
            logits = model(encoded["input_ids"], encoded["attention_mask"])
            batch_probs = F.softmax(logits, dim=1).cpu().numpy()
        for text, prob in zip(batch, batch_probs):
            p_neg = float(prob[0])
            p_pos = float(prob[1])
            rows.append({
                "review": text,
                "negative(%)": _format_pct(p_neg),
                "positive(%)": _format_pct(p_pos),
                "label": "positive" if p_pos >= p_neg else "negative",
            })
    return rows
 # ================= Charts =================
+def make_summary_chart(df):
+    """สร้างกราฟสรุปแบบ Pie"""
     total = len(df)
     neg_count = len(df[df["label"]=="negative"])
     pos_count = len(df[df["label"]=="positive"])
     neg_avg = pd.to_numeric(df["negative(%)"].str.rstrip("%"), errors="coerce").mean()
     pos_avg = pd.to_numeric(df["positive(%)"].str.rstrip("%"), errors="coerce").mean()
+    # Pie chart
+    fig = go.Figure(go.Pie(
+        labels=["😞 เชิงลบ", "😊 เชิงบวก"],
+        values=[neg_count, pos_count],
+        hole=0.4,
+        marker=dict(colors=[NEG_COLOR, POS_COLOR]),
+        textinfo='label+percent',
+        textfont_size=14
+    ))
     fig.update_layout(
+        title="สัดส่วนรีวิว",
         template=TEMPLATE,
+        height=400
     )
+    # Summary text
+    info = (f"**📊 สรุปผล**\n\n"
+            f"- ทั้งหมด: **{total:,}** รีวิว\n"
+            f"- เชิงลบ: **{neg_count:,}** ({neg_count/total*100:.1f}%)\n"
+            f"- เชิงบวก: **{pos_count:,}** ({pos_count/total*100:.1f}%)")
+    return fig, info
+def make_shop_chart(df, shop_col, date_col=None, days_filter=None):
+    """กราฟแสดงรีวิวแต่ละร้าน - เรียบง่าย"""
+    # กรองตาม���ันที่ถ้าต้องการ
+    if date_col and days_filter:
+        cutoff = pd.Timestamp.now() - pd.Timedelta(days=days_filter)
+        df = df[df[date_col] >= cutoff]
+    # สรุปแต่ละร้าน
+    shop_data = []
     for shop in df[shop_col].unique():
         if pd.isna(shop):
             continue
         neg = len(shop_df[shop_df["label"]=="negative"])
         pos = len(shop_df[shop_df["label"]=="positive"])
         total = len(shop_df)
+        shop_data.append({
+            "shop": str(shop),
+            "negative": neg,
+            "positive": pos,
+            "total": total,
+            "pos_pct": pos/total*100 if total > 0 else 0
         })
+    shop_df = pd.DataFrame(shop_data).sort_values("total", ascending=False)
+    # กราฟแท่ง Stacked
+    fig = go.Figure()
+    fig.add_bar(
+        name="😞 เชิงลบ",
+        x=shop_df["shop"],
+        y=shop_df["negative"],
+        marker_color=NEG_COLOR
+    )
+    fig.add_bar(
+        name="😊 เชิงบวก",
+        x=shop_df["shop"],
+        y=shop_df["positive"],
+        marker_color=POS_COLOR
+    )
+    title = "🏪 รีวิวแต่ละร้าน/สาขา"
+    if days_filter:
+        title += f" ({days_filter} วันล่าสุด)"
+    fig.update_layout(
+        title=title,
         barmode='stack',
         template=TEMPLATE,
         xaxis_title="ร้าน/สาขา",
         yaxis_title="จำนวนรีวิว",
+        height=450,
+        showlegend=True
     )
+    # ตารางสรุป
+    summary_df = pd.DataFrame({
+        "ร้าน/สาขา": shop_df["shop"],
+        "รีวิวทั้งหมด": shop_df["total"],
+        "😞 เชิงลบ": shop_df["negative"],
+        "😊 เชิงบวก": shop_df["positive"],
+        "% เชิงบวก": shop_df["pos_pct"].apply(lambda x: f"{x:.1f}%")
+    })
+    return fig, summary_df
+# ================= Tab 1: วิเคราะห์ข้อความ =================
def predict_many(text_block, model_choice):
    """Analyse a multi-line text box where every line is one review.

    Args:
        text_block: Raw textbox content (may be ``None`` or empty).
        model_choice: Model name forwarded to ``_predict_batch``.

    Returns:
        A ``(dataframe, figure, markdown)`` tuple. On empty input or on any
        exception the dataframe and figure are empty and the markdown holds the
        message (including the traceback for exceptions).
    """
    try:
        lines = (text_block or "").splitlines()
        normalized = list(map(_norm_text, lines))
        usable = [text for text in normalized if _is_substantive_text(text)]
        if usable:
            table = pd.DataFrame(_predict_batch(usable, model_choice))
            chart, summary = make_summary_chart(table)
            return table, chart, summary
        return pd.DataFrame(), go.Figure(), "❌ ไม่พบข้อความที่วิเคราะห์ได้"
    except Exception:
        # UI boundary: report the failure in the markdown panel instead of raising.
        return pd.DataFrame(), go.Figure(), f"❌ เกิดข้อผิดพลาด:\n{traceback.format_exc()}"
 # ================= Tab 2: อัปโหลด CSV =================
 def on_file_change(file_obj):
+    """ตรวจหา columns เมื่ออัปโหลดไฟล์"""
     if file_obj is None:
+        return (gr.update(choices=[], value=None),
+                gr.update(choices=[], value=None),
+                gr.update(choices=[], value=None),
                 gr.update(visible=False),
                 "⚠️ กรุณาอัปโหลดไฟล์ CSV")
         df = pd.read_csv(file_obj.name)
         text_col, date_candidates, date_col, shop_candidates, shop_col = detect_columns(df)
         has_shop = shop_col is not None
+        note = f"✅ **ตรวจพบคอลัมน์**\n"
         note += f"- 📝 ข้อความ: **{text_col}**\n"
+        if date_col:
             note += f"- 📅 วันที่: **{date_col}**\n"
         if has_shop:
+            note += f"- 🏪 ร้าน/สาขา: **{shop_col}** ({df[shop_col].nunique()} ร้าน)\n"
         else:
             note += f"- 🏪 ร้าน/สาขา: _ไม่พบ_\n"
+        note += f"\n_หากไม่ถูกต้อง เลือกใหม่ได้ด้านบน_"
         return (gr.update(choices=list(df.columns), value=text_col),
                 gr.update(choices=date_candidates if date_candidates else ["ไม่มี"], value=date_col),
                 gr.update(choices=shop_candidates if shop_candidates else ["ไม่มี"], value=shop_col),
+                gr.update(visible=has_shop),
                 note)
     except Exception as e:
+        return (gr.update(choices=[], value=None),
+                gr.update(choices=[], value=None),
+                gr.update(choices=[], value=None),
                 gr.update(visible=False),
+                f"❌ ไม่สามารถอ่านไฟล์ได้: {str(e)}")
def predict_csv(file_obj, model_choice, text_col, date_col, shop_col, days_filter):
    """Analyse the sentiment of every review in an uploaded CSV file.

    Args:
        file_obj: Uploaded-file object exposing the CSV path as ``.name``,
            or ``None`` when nothing has been uploaded.
        model_choice: Model identifier, forwarded unchanged to
            ``_predict_batch``.
        text_col: Column holding the review text. When it is not a column of
            the file, the text column reported by ``detect_columns`` is used.
        date_col: Optional date column. Empty or the placeholder "ไม่มี"
            means "none". Only used for the per-shop chart.
        shop_col: Optional shop/branch column (same "none" convention).
            The per-shop chart is produced only when this column exists.
        days_filter: Time-range label chosen in the UI. Recognised labels are
            translated to a number of days and passed to ``make_shop_chart``;
            any other label means "no limit".

    Returns:
        A 6-tuple matching the Gradio outputs, in order: result table,
        summary figure, update for the per-shop plot, update for the per-shop
        summary table, info text, and the path of the CSV written for
        download (``None`` on failure).

    Errors are never raised to the caller: they are reported through the
    info text, with empty tables/figures and the shop widgets hidden.
    """
    # Placeholder offered by the column dropdowns when no candidate exists.
    no_column = "ไม่มี"
    # UI label -> number of days; labels not listed here mean "everything".
    days_by_label = {"7 วันล่าสุด": 7, "15 วันล่าสุด": 15, "30 วันล่าสุด": 30}

    def _failure(message):
        """Return the output tuple for an aborted run."""
        return (pd.DataFrame(), go.Figure(),
                gr.update(visible=False),
                gr.update(visible=False, value=pd.DataFrame()),
                message, None)

    if file_obj is None:
        return _failure("❌ กรุณาอัปโหลดไฟล์")

    try:
        df_raw = pd.read_csv(file_obj.name)
        cols = list(df_raw.columns)
        if text_col not in cols:
            text_col, _, _, _, _ = detect_columns(df_raw)

        # Normalise every row, remembering which row positions are kept so
        # that shop/date values can later be matched to the right prediction.
        texts = [_norm_text(v) for v in df_raw[text_col].tolist()]
        kept_pos = [i for i, t in enumerate(texts) if _is_substantive_text(t)]
        texts_clean = [texts[i] for i in kept_pos]
        skipped = len(texts) - len(texts_clean)
        if not texts_clean:
            return _failure("❌ ไม่พบข้อความที่วิเคราะห์ได้")

        results = _predict_batch(texts_clean, model_choice)
        df_out = pd.DataFrame(results)

        fig_main, info = make_summary_chart(df_out)
        if skipped > 0:
            info += f"\n\n⚠️ ข้ามแถวว่าง: {skipped} แถว"

        def _aligned(series):
            """Select the source rows that were actually predicted.

            Taking the first ``len(df_out)`` raw rows would pair predictions
            with the wrong shop/date whenever a blank row was skipped, so the
            kept positions are used instead.
            NOTE(review): assumes ``_predict_batch`` returns one row per
            input text, in input order - confirm.
            """
            picked = series.iloc[kept_pos[:len(df_out)]]
            picked.index = df_out.index[:len(picked)]
            return picked

        fig_shop = go.Figure()
        shop_summary = pd.DataFrame()
        show_shop = False
        if shop_col and shop_col in cols and shop_col != no_column:
            df_shop = df_out.copy()
            df_shop[shop_col] = _aligned(df_raw[shop_col])
            if date_col and date_col in cols and date_col != no_column:
                df_shop[date_col] = _aligned(_to_datetime_safe(df_raw[date_col]))
                # Rows without a usable date cannot be placed on a time axis.
                df_shop = df_shop.dropna(subset=[date_col])
                days = days_by_label.get(days_filter)
                fig_shop, shop_summary = make_shop_chart(df_shop, shop_col, date_col, days)
                if days:
                    info += f"\n\n📅 แสดงข้อมูล: {days_filter}"
            else:
                fig_shop, shop_summary = make_shop_chart(df_shop, shop_col)
            show_shop = True

        # Persist the predictions so the UI can offer them as a download.
        fd, path = tempfile.mkstemp(suffix=".csv")
        os.close(fd)  # only the path is needed; pandas reopens the file
        df_out.to_csv(path, index=False, encoding="utf-8-sig")

        # The summary table is created hidden, so its visibility has to be
        # switched together with the plot; a bare DataFrame would only set
        # the value and leave the table invisible.
        return (df_out, fig_main,
                gr.update(visible=show_shop, value=fig_shop),
                gr.update(visible=show_shop, value=shop_summary),
                info, path)
    except Exception:
        # UI boundary: show the traceback in the info panel instead of
        # letting the handler crash.
        return _failure(f"❌ เกิดข้อผิดพลาด:\n{traceback.format_exc()}")
 # ================= Gradio UI =================
 # Top-level Gradio layout: a free-text tab, a CSV-upload tab and a footer
 # describing the model choices. The Blocks instance is bound to `demo`.
 with gr.Blocks(title="Thai Sentiment Analysis", theme=gr.themes.Soft()) as demo:
         info="WCB = เร็ว | WCB_BiLSTM = แม่นยำสูงสุด (แนะนำ)"
     )
+    # =================== Tab 1 ===================
+    with gr.Tab("📝 วิเคราะห์ข้อความ"):
+        gr.Markdown("**วิธีใช้:** ป้อนรีวิวหลายรายการ (แต่ละบรรทัด = 1 รีวิว)")
         text_input = gr.Textbox(
+            lines=8,
+            label="📄 ข้อความรีวิว",
+            placeholder="ป้อนรีวิว แต่ละบรรทัด = 1 รีวิว\n\nตัวอย่าง:\nอาหารอร่อยมาก บริการดี\nของแพง รสชาติธรรมดา"
         )
+        predict_btn_1 = gr.Button("🚀 เริ่มวิเคราะห์", variant="primary", size="lg")
+        result_df_1 = gr.Dataframe(label="📋 ผลการวิเคราะห์")
         with gr.Row():
             with gr.Column(scale=1):
         # Clicking the button calls predict_many with the textbox content and
         # the model_radio value; its results fill the table, chart and info
         # components listed as outputs.
         predict_btn_1.click(
             predict_many,
+            [text_input, model_radio],
             [result_df_1, result_chart_1, result_info_1]
         )
+    # =================== Tab 2 ===================
     with gr.Tab("📤 อัปโหลด CSV"):
+        gr.Markdown("**วิธีใช้:** อัปโหลดไฟล์ CSV ที่มีคอลัมน์รีวิว (และอาจมีวันที่/ร้านด้วย)")
+        file_input = gr.File(file_types=[".csv"], label="📁 อัปโหลดไฟล์ CSV")
         detect_note = gr.Markdown("⬆️ อัปโหลดไฟล์เพื่อเริ่มต้น")
         # Column pickers; they are created without choices and are filled by
         # the file_input.change handler wired up below.
         with gr.Row():
+            text_col_dd = gr.Dropdown(label="📝 คอลัมน์ข้อความรีวิว")
+            date_col_dd = gr.Dropdown(label="📅 คอลัมน์วันที่ (ถ้ามี)")
+            shop_col_dd = gr.Dropdown(label="🏪 คอลัมน์ร้าน/สาขา (ถ้ามี)")
         # Time-range selector, created hidden (visible=False). It is one of
         # the outputs of the file_input.change handler below.
+        days_filter = gr.Radio(
+            choices=["ทั้งหมด", "7 วันล่าสุด", "15 วันล่าสุด", "30 วันล่าสุด"],
+            value="ทั้งหมด",
+            label="📆 ช่วงเวลา",
+            info="ใช้กรองข้อมูลเฉพาะกราฟร้าน (ถ้ามีวันที่)",
+            visible=False
+        )
+        predict_btn_2 = gr.Button("🚀 เริ่มวิเคราะห์", variant="primary", size="lg")
         result_df_2 = gr.Dataframe(label="📋 ผลการวิเคราะห์ทั้งหมด")
             with gr.Column(scale=1):
                 result_info_2 = gr.Markdown()
         # Per-shop plot and summary table both start hidden (visible=False).
+        result_shop = gr.Plot(label="🏪 รีวิวแต่ละร้าน/สาขา", visible=False)
         shop_summary = gr.Dataframe(label="📊 สรุปแต่ละร้าน", visible=False)
+        download_file = gr.File(label="💾 ดาวน์โหลดผลลัพธ์")
+        # Events
         # A new upload runs on_file_change, whose five return values update
         # the three column dropdowns, days_filter and detect_note, in order.
         file_input.change(
             on_file_change,
             [file_input],
+            [text_col_dd, date_col_dd, shop_col_dd, days_filter, detect_note]
         )
         # Runs predict_csv; the six outputs are matched positionally to the
         # six values it returns.
         predict_btn_2.click(
             predict_csv,
+            [file_input, model_radio, text_col_dd, date_col_dd, shop_col_dd, days_filter],
+            [result_df_2, result_chart_2, result_shop, shop_summary, result_info_2, download_file]
         )
     # Footer shown below both tabs: short description of the two models.
     gr.Markdown("""
     ---
     ### 💡 เกี่ยวกับโมเดล
+    - **WCB**: เร็ว เหมาะงานทั่วไป
+    - **WCB_BiLSTM**: แม่นยำสูงสุด ⭐ (แนะนำ)
+    📌 วิเคราะห์เฉพาะ **เชิงบวก/เชิงลบ** เท่านั้น
     """)
 if __name__ == "__main__":