Spaces:

Dusit-P
/

Thai-Sentiment-GUI

Sleeping

App Files Files Community

Dusit-P committed on Oct 5, 2025

Commit

4096fb9

verified ·

1 Parent(s): f6f7109

Update app.py

Browse files

Files changed (1) hide show

app.py +568 -126

app.py CHANGED Viewed

@@ -1,14 +1,10 @@
-# app.py — Thai Sentiment (WangchanBERTa Variants)
-# - Focus on POS/NEG only
-# - Batch + CSV tabs
-# - CSV: auto-detect text/date cols, hide date widgets if no date col
-# - DatePicker fallback to Textbox if component missing
 import os, json, importlib.util, traceback, re, math, tempfile, datetime
 import gradio as gr
 import torch, pandas as pd
 import torch.nn.functional as F
 import plotly.graph_objects as go
 from huggingface_hub import hf_hub_download
 from safetensors.torch import load_file
 from transformers import AutoTokenizer
@@ -24,28 +20,42 @@ if DEFAULT_MODEL not in AVAILABLE_CHOICES:
 NEG_COLOR = "#F87171"
 POS_COLOR = "#34D399"
 TEMPLATE  = "plotly_white"
 CACHE = {}
-# ================= Date Component Fallback =================
-try:
-    DateInput = getattr(gr, "Date", None) or getattr(gr, "DatePicker", None)
-except Exception:
-    DateInput = None
-DATE_FALLBACK_TO_TEXT = False
-if DateInput is None:
-    DateInput = gr.Textbox
-    DATE_FALLBACK_TO_TEXT = True
-def _normalize_date_input(v):
-    if v is None: return None
-    if isinstance(v, float) and math.isnan(v): return None
-    if isinstance(v, datetime.date): return pd.Timestamp(v)
-    try:
-        ts = pd.to_datetime(v, errors="coerce")
-        return ts if pd.notna(ts) else None
-    except Exception:
-        return None
 # ================= Loader =================
 def _import_models():
@@ -99,65 +109,226 @@ def _to_datetime_safe(s): return pd.to_datetime(s, errors="coerce", infer_dateti
 LIKELY_TEXT_COLS = ["text","review","message","comment","content","sentence","body","ข้อความ","รีวิว"]
 LIKELY_DATE_COLS = ["date","created_at","time","timestamp","datetime","วันที่","วันเวลา","เวลา"]
-def detect_text_and_date_cols(df):
     cols = list(df.columns)
     low = {c.lower(): c for c in cols}
     text_col = None
     for k in LIKELY_TEXT_COLS:
         if k in low: text_col = low[k]; break
     if text_col is None:
         cand = [c for c in cols if df[c].dtype == object]
         text_col = cand[0] if cand else cols[0]
     date_candidates = []
     for c in cols:
-        if c.lower() in LIKELY_DATE_COLS: date_candidates.append(c); continue
         sample = df[c].head(50)
         if _to_datetime_safe(sample).notna().sum() >= max(3, int(len(sample)*0.2)):
             date_candidates.append(c)
     date_candidates = list(dict.fromkeys(date_candidates))
-    date_col = date_candidates[0] if len(date_candidates)>0 else None
-    return text_col, date_candidates, date_col
 # ================= Charts =================
-def make_basic_charts(df):
     total = len(df)
-    neg_df = df[df["label"]=="negative"]; pos_df = df[df["label"]=="positive"]
-    fig_bar = go.Figure()
-    fig_bar.add_bar(name="negative", x=["negative"], y=[len(neg_df)], marker_color=NEG_COLOR)
-    fig_bar.add_bar(name="positive", x=["positive"], y=[len(pos_df)], marker_color=POS_COLOR)
-    fig_bar.update_layout(barmode="group", title="Label counts", template=TEMPLATE)
-    labels=["negative","positive"]; values=[len(neg_df), len(pos_df)]
-    fig_pie = go.Figure(go.Pie(labels=labels, values=values, hole=0.35,
-                               marker=dict(colors=[NEG_COLOR, POS_COLOR])))
-    fig_pie.update_layout(title="Positive vs Negative", template=TEMPLATE)
     neg_avg = pd.to_numeric(df["negative(%)"].str.rstrip("%"), errors="coerce").mean()
     pos_avg = pd.to_numeric(df["positive(%)"].str.rstrip("%"), errors="coerce").mean()
-    info=(f"**Summary**\n- Total: {total}\n- Negative: {len(neg_df)}\n- Positive: {len(pos_df)}\n"
-          f"- Avg negative: {neg_avg:.2f}%\n- Avg positive: {pos_avg:.2f}%")
-    return fig_bar, fig_pie, info
 def _resample_counts(df, date_col, freq):
     g = df.groupby([pd.Grouper(key=date_col, freq=freq),"label"]).size().unstack(fill_value=0)
     for c in ["negative","positive"]:
         if c not in g.columns: g[c]=0
     return g[["negative","positive"]].sort_index()
-def _rolling_window(freq): return 7 if freq=="D" else (4 if freq=="W" else 3)
-def make_time_chart(df, date_col, freq, use_ma):
-    ts=_resample_counts(df,date_col,freq)
-    if use_ma: ts=ts.rolling(_rolling_window(freq), min_periods=1).mean()
-    fig=go.Figure()
-    fig.add_scatter(x=ts.index,y=ts["negative"],mode="lines",name="negative",line=dict(color=NEG_COLOR))
-    fig.add_scatter(x=ts.index,y=ts["positive"],mode="lines",name="positive",line=dict(color=POS_COLOR))
-    fig.update_layout(title="Reviews over time (POS/NEG)",template=TEMPLATE,
-                      xaxis_title="Date",yaxis_title="Count")
     return fig
 # ================= Core Predict =================
 def _predict_batch(texts, model_name, batch_size=32):
-    model,tok,cfg=load_model(model_name); results=[]
     for i in range(0,len(texts),batch_size):
         chunk=texts[i:i+batch_size]
         enc=tok(chunk,padding=True,truncation=True,
@@ -168,94 +339,365 @@ def _predict_batch(texts, model_name, batch_size=32):
         for txt,p in zip(chunk,probs):
             neg,pos=float(p[0]),float(p[1])
             label="positive" if pos>=neg else "negative"
-            results.append({"review":txt,"negative(%)":_format_pct(neg),
-                            "positive(%)":_format_pct(pos),"label":label})
     return results
-# ================= Batch =================
-def predict_many(text_block, model_choice):
     try:
-        raw=(text_block or "").splitlines()
-        norm=[_norm_text(t) for t in raw]; clean=[t for t in norm if _is_substantive_text(t)]
-        if not clean: return pd.DataFrame(),go.Figure(),go.Figure(),"No valid text"
-        results=_predict_batch(clean,model_choice); df=pd.DataFrame(results)
-        bar,pie,info=make_basic_charts(df)
-        return df,bar,pie,info
-    except: return pd.DataFrame(),go.Figure(),go.Figure(),traceback.format_exc()
-# ================= CSV Inspect =================
 def on_file_change(file_obj):
     if file_obj is None:
-        return gr.update(choices=[],value=None),gr.update(choices=[],value=None),\
-               gr.update(visible=False),gr.update(visible=False),\
-               gr.update(visible=False),gr.update(visible=False),\
-               gr.update(visible=False),"Please upload a CSV"
     try:
-        df=pd.read_csv(file_obj.name)
-        text_col,date_candidates,date_col=detect_text_and_date_cols(df)
-        has_date=date_col is not None
-        note=f"Detected text col: **{text_col}**; "+("date col: **{}**".format(date_col) if has_date else "_no date col_")
-        return gr.update(choices=list(df.columns),value=text_col),\
-               gr.update(choices=date_candidates,value=date_col),\
-               gr.update(visible=has_date),gr.update(visible=has_date),\
-               gr.update(visible=has_date),gr.update(visible=has_date),\
-               gr.update(visible=has_date),note
-    except: return gr.update(choices=[],value=None),gr.update(choices=[],value=None),\
-                   gr.update(visible=False),gr.update(visible=False),\
-                   gr.update(visible=False),gr.update(visible=False),\
-                   gr.update(visible=False),"Error reading CSV"
-# ================= CSV Predict =================
-def predict_csv(file_obj,model_choice,text_col,date_col,date_from,date_to,freq,use_ma):
-    if file_obj is None: return pd.DataFrame(),go.Figure(),go.Figure(),gr.update(visible=False), "No file",None
     try:
-        df_raw=pd.read_csv(file_obj.name); cols=list(df_raw.columns)
-        if text_col not in cols: text_col,_d,_dc=detect_text_and_date_cols(df_raw);
-        texts=[_norm_text(v) for v in df_raw[text_col].tolist()]
-        texts=[t for t in texts if _is_substantive_text(t)]
-        if not texts: return pd.DataFrame(),go.Figure(),go.Figure(),gr.update(visible=False),"No valid texts",None
-        results=_predict_batch(texts,model_choice); out=pd.DataFrame(results)
-        bar,pie,info=make_basic_charts(out)
-        fig_line=go.Figure(); show_time=False
-        if date_col and date_col in cols:
-            dts=_to_datetime_safe(df_raw[date_col])
             if dts.notna().any():
-                df_time=out.copy(); df_time["__dt__"]=dts; df_time=df_time.dropna(subset=["__dt__"])
-                start_ts=_normalize_date_input(date_from); end_ts=_normalize_date_input(date_to)
-                if start_ts is not None: df_time=df_time[df_time["__dt__"]>=start_ts]
-                if end_ts is not None: df_time=df_time[df_time["__dt__"]<=end_ts]
-                if len(df_time)>0: fig_line=make_time_chart(df_time,"__dt__",freq,use_ma); show_time=True
-        fd,path=tempfile.mkstemp(suffix=".csv"); os.close(fd)
-        out.to_csv(path,index=False,encoding="utf-8-sig")
-        return out,bar,pie,gr.update(visible=show_time,value=fig_line),info,path
-    except: return pd.DataFrame(),go.Figure(),go.Figure(),gr.update(visible=False),"Error\n"+traceback.format_exc(),None
 # ================= Gradio UI =================
-with gr.Blocks(title="Thai Sentiment") as demo:
-    gr.Markdown("### Thai Sentiment — WangchanBERTa Variants")
-    model_radio=gr.Radio(choices=AVAILABLE_CHOICES,value=DEFAULT_MODEL,label="เลือกโมเดล")
-    with gr.Tab("Batch"):
-        t2=gr.Textbox(lines=8,label="รีวิว (บรรทัดละ 1)")
-        btn2=gr.Button("Predict",variant="primary")
-        df2=gr.Dataframe(); bar2=gr.Plot(); pie2=gr.Plot(); sum2=gr.Markdown()
-        btn2.click(predict_many,[t2,model_radio],[df2,bar2,pie2,sum2])
-    with gr.Tab("CSV Upload"):
         with gr.Row():
-            file_in=gr.File(file_types=[".csv"]); text_dd=gr.Dropdown(label="Text col")
-            date_dd=gr.Dropdown(label="Date col (opt)")
         with gr.Row():
-            date_from=DateInput(label="เริ่มวันที่"+(" (YYYY-MM-DD)" if DATE_FALLBACK_TO_TEXT else ""),visible=False)
-            date_to=DateInput(label="ถึงวันที่"+(" (YYYY-MM-DD)" if DATE_FALLBACK_TO_TEXT else ""),visible=False)
-            freq=gr.Radio(choices=["D","W","M"],value="D",label="Freq",visible=False)
-            use_ma=gr.Checkbox(value=True,label="MA",visible=False)
-        btn3=gr.Button("Predict CSV",variant="primary")
-        note=gr.Markdown()
-        df3=gr.Dataframe(); bar3=gr.Plot(); pie3=gr.Plot()
-        line=gr.Plot(visible=False); sum3=gr.Markdown(); dl=gr.File()
-        file_in.change(on_file_change,[file_in],[text_dd,date_dd,date_from,date_to,freq,use_ma,line,note])
-        btn3.click(predict_csv,[file_in,model_radio,text_dd,date_dd,date_from,date_to,freq,use_ma],[df3,bar3,pie3,line,sum3,dl])
-if __name__=="__main__": demo.launch()

+# app.py — Thai Sentiment (WangchanBERTa Variants) - ปรับปรุง UI และเพิ่ม Shop Analysis
 import os, json, importlib.util, traceback, re, math, tempfile, datetime
 import gradio as gr
 import torch, pandas as pd
 import torch.nn.functional as F
 import plotly.graph_objects as go
+from plotly.subplots import make_subplots
 from huggingface_hub import hf_hub_download
 from safetensors.torch import load_file
 from transformers import AutoTokenizer
 NEG_COLOR = "#F87171"
 POS_COLOR = "#34D399"
+NEUTRAL_COLOR = "#94A3B8"
 TEMPLATE  = "plotly_white"
 CACHE = {}
+# ================= Date Presets =================
# Maps each preset label shown in the UI to its filter rule:
#   None  -> no filtering
#   int   -> keep rows from the last N days
#   str   -> a named calendar window ("current_month" / "last_month")
DATE_PRESETS = {
    "ทั้งหมด": None,
    "7 วันล่าสุด": 7,
    "30 วันล่าสุด": 30,
    "90 วันล่าสุด": 90,
    "เดือนนี้": "current_month",
    "เดือนที่แล้ว": "last_month",
}


def apply_date_preset(df, date_col, preset_key, now=None):
    """Filter ``df`` to the date window selected by ``preset_key``.

    Args:
        df: DataFrame to filter; it is never modified.
        date_col: Name of the column in ``df`` that is compared against
            timestamps.
        preset_key: One of the keys of ``DATE_PRESETS``. ``None`` or a key
            that is not in the table means "no filtering" instead of raising
            ``KeyError``.
        now: Optional reference time (anything ``pd.Timestamp`` accepts).
            Defaults to ``pd.Timestamp.now()``.

    Returns:
        ``df`` itself when no filter applies, otherwise the matching rows.
    """
    rule = DATE_PRESETS.get(preset_key)
    if rule is None:
        return df

    now = pd.Timestamp.now() if now is None else pd.Timestamp(now)
    dates = df[date_col]

    if isinstance(rule, int):
        return df[dates >= now - pd.Timedelta(days=rule)]

    month_start = now.replace(day=1, hour=0, minute=0, second=0, microsecond=0)
    if rule == "current_month":
        return df[dates >= month_start]
    if rule == "last_month":
        # Step back one day into the previous month, then snap to its first day.
        prev_month_start = (month_start - pd.Timedelta(days=1)).replace(day=1)
        return df[(dates >= prev_month_start) & (dates < month_start)]
    return df
 # ================= Loader =================
 def _import_models():
 LIKELY_TEXT_COLS = ["text","review","message","comment","content","sentence","body","ข้อความ","รีวิว"]
 LIKELY_DATE_COLS = ["date","created_at","time","timestamp","datetime","วันที่","วันเวลา","เวลา"]
+LIKELY_SHOP_COLS = ["shop","store","branch","ร้าน","สาขา","ชื่อร้าน"]
def detect_columns(df):
    """Guess which columns hold the review text, the date and the shop/branch.

    Columns whose (lower-cased) name appears in ``LIKELY_TEXT_COLS`` /
    ``LIKELY_DATE_COLS`` / ``LIKELY_SHOP_COLS`` always win over columns that
    are only picked up by the content heuristics.

    Args:
        df: The uploaded table.

    Returns:
        ``(text_col, date_candidates, date_col, shop_candidates, shop_col)``.
        The ``*_col`` entries are ``None`` when nothing was found, and the
        candidate lists are empty in that case.
    """
    cols = list(df.columns)
    if not cols:
        # Nothing to inspect; avoid indexing into an empty column list.
        return None, [], None, [], None

    # Column labels are not guaranteed to be strings (e.g. integer headers).
    low = {str(c).lower(): c for c in cols}

    # Text column: a known name first, else the first object-dtype column.
    text_col = next((low[k] for k in LIKELY_TEXT_COLS if k in low), None)
    if text_col is None:
        object_cols = [c for c in cols if df[c].dtype == object]
        text_col = object_cols[0] if object_cols else cols[0]

    # Date candidates: name matches are listed before heuristic matches so
    # the default date column is the explicitly named one when it exists.
    named_dates, guessed_dates = [], []
    for c in cols:
        if str(c).lower() in LIKELY_DATE_COLS:
            named_dates.append(c)
            continue
        # Plain numbers parse "successfully" as epoch offsets, which would
        # flag id/rating columns as dates; skip them in the heuristic.
        if pd.api.types.is_numeric_dtype(df[c]):
            continue
        sample = df[c].head(50)
        if _to_datetime_safe(sample).notna().sum() >= max(3, int(len(sample) * 0.2)):
            guessed_dates.append(c)
    date_candidates = list(dict.fromkeys(named_dates + guessed_dates))
    date_col = date_candidates[0] if date_candidates else None

    # Shop candidates: a known name, or an object column whose values repeat
    # enough to look categorical (distinct values are 1-50% of the rows).
    n_rows = len(df)
    named_shops, guessed_shops = [], []
    for c in cols:
        if str(c).lower() in LIKELY_SHOP_COLS:
            named_shops.append(c)
            continue
        # The review text and date columns are never a shop column, and the
        # ratio below is undefined for a table without rows.
        if n_rows == 0 or c == text_col or c in date_candidates:
            continue
        if df[c].dtype == object:
            unique_ratio = df[c].nunique() / n_rows
            if 0.01 <= unique_ratio <= 0.5:
                guessed_shops.append(c)
    shop_candidates = list(dict.fromkeys(named_shops + guessed_shops))
    shop_col = shop_candidates[0] if shop_candidates else None

    return text_col, date_candidates, date_col, shop_candidates, shop_col
 # ================= Charts =================
def make_summary_chart(df, chart_type="pie"):
    """Build the single overview chart and its Markdown summary.

    Args:
        df: Prediction table with a ``label`` column and the string columns
            ``negative(%)`` / ``positive(%)`` (values ending in ``%``).
        chart_type: ``"pie"`` for a donut chart; any other value produces a
            bar chart.

    Returns:
        ``(fig, info)`` where ``fig`` is a plotly figure and ``info`` is the
        Markdown summary text. An empty table yields zero counts and zero
        percentages instead of a division-by-zero error.
    """
    total = len(df)
    if total:
        neg_count = len(df[df["label"] == "negative"])
        pos_count = len(df[df["label"] == "positive"])
        neg_avg = pd.to_numeric(df["negative(%)"].str.rstrip("%"), errors="coerce").mean()
        pos_avg = pd.to_numeric(df["positive(%)"].str.rstrip("%"), errors="coerce").mean()
        neg_share = neg_count / total * 100
        pos_share = pos_count / total * 100
    else:
        # An empty frame may not even have the expected columns.
        neg_count = pos_count = 0
        neg_avg = pos_avg = 0.0
        neg_share = pos_share = 0.0

    info = (f"**📊 สรุปผลการวิเคราะห์**\n\n"
            f"- 📝 ทั้งหมด: **{total:,}** รีวิว\n"
            f"- 😞 เชิงลบ: **{neg_count:,}** ({neg_share:.1f}%)\n"
            f"- 😊 เชิงบวก: **{pos_count:,}** ({pos_share:.1f}%)\n"
            f"- 📈 ค่าเฉลี่ยความมั่นใจ:\n"
            f"  - เชิงลบ: {neg_avg:.2f}%\n"
            f"  - เชิงบวก: {pos_avg:.2f}%")

    if chart_type == "pie":
        fig = go.Figure(go.Pie(
            labels=["😞 เชิงลบ", "😊 เชิงบวก"],
            values=[neg_count, pos_count],
            hole=0.4,
            marker=dict(colors=[NEG_COLOR, POS_COLOR]),
            textinfo='label+percent',
            textfont_size=14,
        ))
        fig.update_layout(
            title="สัดส่วนรีวิวเชิงบวก vs เชิงลบ",
            template=TEMPLATE,
            height=400,
        )
    else:  # bar
        fig = go.Figure()
        fig.add_bar(
            x=["เชิงลบ", "เชิงบวก"],
            y=[neg_count, pos_count],
            marker_color=[NEG_COLOR, POS_COLOR],
            text=[neg_count, pos_count],
            textposition='auto',
        )
        fig.update_layout(
            title="จำนวนรีวิวแยกตามความรู้สึก",
            template=TEMPLATE,
            yaxis_title="จำนวน (รีวิว)",
            height=400,
        )
    return fig, info
 def _resample_counts(df, date_col, freq):
+    """รวมข้อมูลตามช่วงเวลา"""
     g = df.groupby([pd.Grouper(key=date_col, freq=freq),"label"]).size().unstack(fill_value=0)
     for c in ["negative","positive"]:
         if c not in g.columns: g[c]=0
     return g[["negative","positive"]].sort_index()
def make_time_chart(df, date_col, freq, use_smooth):
    """Plot negative/positive review counts over time.

    Args:
        df: Prediction table with a ``label`` column and the column
            ``date_col``.
        date_col: Name of the date column used for bucketing.
        freq: Bucket frequency passed to ``_resample_counts``; ``"D"``,
            ``"W"`` and ``"M"`` have dedicated titles and smoothing windows.
            Any other value uses the fallback window and is shown verbatim in
            the title instead of raising ``KeyError``.
        use_smooth: When true, apply a rolling mean over the buckets.

    Returns:
        A plotly figure with one line per sentiment.
    """
    ts = _resample_counts(df, date_col, freq)
    if use_smooth:
        # Roughly one week of days, one month of weeks, one quarter of months.
        window = {"D": 7, "W": 4}.get(freq, 3)
        ts = ts.rolling(window, min_periods=1).mean()

    fig = go.Figure()
    series = (
        ("negative", "😞 เชิงลบ", NEG_COLOR),
        ("positive", "😊 เชิงบวก", POS_COLOR),
    )
    for column, trace_name, color in series:
        fig.add_scatter(
            x=ts.index, y=ts[column],
            mode="lines+markers",
            name=trace_name,
            line=dict(color=color, width=2),
            marker=dict(size=6),
        )

    freq_map = {"D": "รายวัน", "W": "รายสัปดาห์", "M": "รายเดือน"}
    freq_label = freq_map.get(freq, str(freq))
    smooth_text = " (ปรับให้เรียบแล้ว)" if use_smooth else ""
    fig.update_layout(
        title=f"📈 แนวโน้มรีวิวตามเวลา ({freq_label}){smooth_text}",
        template=TEMPLATE,
        xaxis_title="วันที่",
        yaxis_title="จำนวนรีวิว",
        hovermode='x unified',
        height=450,
    )
    return fig
def make_shop_analysis(df, shop_col, date_col=None, freq="D", max_trend_shops=5):
    """Break the predictions down per shop/branch.

    Args:
        df: Prediction table with a ``label`` column and the column
            ``shop_col`` (plus ``date_col`` when a trend is wanted).
        shop_col: Name of the shop/branch column. Rows whose shop is missing
            are ignored.
        date_col: Optional date column; when given and present in ``df`` a
            per-shop trend figure is produced.
        freq: Bucket frequency for the trend figure.
        max_trend_shops: How many shops (largest by review count first) get a
            line in the trend figure.

    Returns:
        ``(summary_df, fig_compare, fig_trend)``. ``summary_df`` is sorted by
        review count, descending, and is an empty frame with the usual
        columns when no shop has any rows. ``fig_trend`` is ``None`` when no
        usable ``date_col`` was given.
    """
    summary_cols = ["ร้าน/สาขา", "รีวิวทั้งหมด", "😞 เชิงลบ", "😊 เชิงบวก", "% เชิงบวก"]

    # 1. Per-shop totals. groupby drops missing shop values by default and
    #    sort=False keeps shops in order of first appearance.
    rows = []
    for shop, labels in df.groupby(shop_col, sort=False)["label"]:
        total = len(labels)
        neg = int((labels == "negative").sum())
        pos = int((labels == "positive").sum())
        rows.append({
            "ร้าน/สาขา": shop,
            "รีวิวทั้งหมด": total,
            "😞 เชิงลบ": neg,
            "😊 เชิงบวก": pos,
            "% เชิงบวก": f"{pos / total * 100:.1f}%",
        })
    # Passing the columns explicitly keeps sort_values valid for zero rows.
    summary_df = pd.DataFrame(rows, columns=summary_cols).sort_values(
        "รีวิวทั้งหมด", ascending=False
    )

    # 2. Stacked bar chart comparing the shops.
    shops = summary_df["ร้าน/สาขา"].tolist()
    fig_compare = go.Figure()
    fig_compare.add_bar(name="😞 เชิงลบ", x=shops,
                        y=summary_df["😞 เชิงลบ"].tolist(), marker_color=NEG_COLOR)
    fig_compare.add_bar(name="😊 เชิงบวก", x=shops,
                        y=summary_df["😊 เชิงบวก"].tolist(), marker_color=POS_COLOR)
    fig_compare.update_layout(
        title="🏪 เปรียบเทียบรีวิวแต่ละร้าน/สาขา",
        barmode='stack',
        template=TEMPLATE,
        xaxis_title="ร้าน/สาขา",
        yaxis_title="จำนวนรีวิว",
        height=450,
    )

    # 3. Share of positive reviews over time, one line per shop.
    fig_trend = None
    if date_col and date_col in df.columns:
        fig_trend = go.Figure()
        for shop in shops[:max_trend_shops]:
            shop_rows = df[df[shop_col] == shop]
            if len(shop_rows) == 0:
                continue
            scored = shop_rows.assign(
                pos_score=(shop_rows["label"] == "positive").astype(int)
            )
            ts = scored.groupby(pd.Grouper(key=date_col, freq=freq))["pos_score"].mean() * 100
            fig_trend.add_scatter(
                x=ts.index,
                y=ts.values,
                mode='lines+markers',
                name=str(shop),  # shop values may be numbers; trace names are text
                line=dict(width=2),
                marker=dict(size=5),
            )
        freq_map = {"D": "รายวัน", "W": "รายสัปดาห์", "M": "รายเดือน"}
        fig_trend.update_layout(
            title=f"📊 แนวโน้ม % รีวิวเชิงบวกแยกตามร้าน ({freq_map.get(freq, str(freq))})",
            template=TEMPLATE,
            xaxis_title="วันที่",
            yaxis_title="% รีวิวเชิงบวก",
            hovermode='x unified',
            height=450,
        )

    return summary_df, fig_compare, fig_trend
 # ================= Core Predict =================
 def _predict_batch(texts, model_name, batch_size=32):
+    model,tok,cfg=load_model(model_name)
+    results=[]
     for i in range(0,len(texts),batch_size):
         chunk=texts[i:i+batch_size]
         enc=tok(chunk,padding=True,truncation=True,
         for txt,p in zip(chunk,probs):
             neg,pos=float(p[0]),float(p[1])
             label="positive" if pos>=neg else "negative"
+            results.append({
+                "review":txt,
+                "negative(%)":_format_pct(neg),
+                "positive(%)":_format_pct(pos),
+                "label":label
+            })
     return results
+# ================= Tab 1: วิเคราะห์หลายรีวิว =================
def predict_many(text_block, model_choice, chart_type):
    """Classify a block of text, one review per line.

    Each line is normalised with ``_norm_text`` and kept only if
    ``_is_substantive_text`` accepts it. Returns ``(table, figure, markdown)``;
    on empty input or on any exception the table and figure are empty and the
    Markdown carries the message (including the traceback for exceptions).
    """
    try:
        lines = (text_block or "").splitlines()
        normalised = list(map(_norm_text, lines))
        reviews = [line for line in normalised if _is_substantive_text(line)]
        if len(reviews) == 0:
            return pd.DataFrame(), go.Figure(), "❌ ไม่พบข้อความที่สามารถวิเคราะห์ได้\n\nกรุณาป้อนข้อความที่มีความยาวอย่างน้อย 2 ตัวอักษร"
        table = pd.DataFrame(_predict_batch(reviews, model_choice))
        chart, summary = make_summary_chart(table, chart_type)
        return table, chart, summary
    except Exception:
        return pd.DataFrame(), go.Figure(), f"❌ เกิดข้อผิดพลาด:\n\n{traceback.format_exc()}"
+# ================= Tab 2: อัปโหลด CSV =================
 def on_file_change(file_obj):
+    """เมื่ออัปโหลดไฟล์ - ตรวจหา columns อัตโนมัติ"""
     if file_obj is None:
+        return (gr.update(choices=[],value=None),
+                gr.update(choices=[],value=None),
+                gr.update(choices=[],value=None),
+                gr.update(visible=False),
+                gr.update(visible=False),
+                gr.update(visible=False),
+                gr.update(visible=False),
+                "⚠️ กรุณาอัปโหลดไฟล์ CSV")
     try:
+        df = pd.read_csv(file_obj.name)
+        text_col, date_candidates, date_col, shop_candidates, shop_col = detect_columns(df)
+        has_date = date_col is not None
+        has_shop = shop_col is not None
+        note = f"✅ **ตรวจพบคอลัมน์:**\n"
+        note += f"- 📝 ข้อความ: **{text_col}**\n"
+        if has_date:
+            note += f"- 📅 วันที่: **{date_col}**\n"
+        else:
+            note += f"- 📅 วันที่: _ไม่พบ_\n"
+        if has_shop:
+            note += f"- 🏪 ร้าน/สาขา: **{shop_col}** (พบ {df[shop_col].nunique()} ร้าน)\n"
+        else:
+            note += f"- 🏪 ร้าน/สาขา: _ไม่พบ_\n"
+        note += f"\n_หากไม่ถูกต้อง สามารถเลือกใหม่ได้จากเมนูด้านบน_"
+        return (gr.update(choices=list(df.columns), value=text_col),
+                gr.update(choices=date_candidates if date_candidates else ["ไม่มี"], value=date_col),
+                gr.update(choices=shop_candidates if shop_candidates else ["ไม่มี"], value=shop_col),
+                gr.update(visible=has_date),
+                gr.update(visible=has_date),
+                gr.update(visible=has_shop),
+                gr.update(visible=has_shop),
+                note)
+    except Exception as e:
+        return (gr.update(choices=[],value=None),
+                gr.update(choices=[],value=None),
+                gr.update(choices=[],value=None),
+                gr.update(visible=False),
+                gr.update(visible=False),
+                gr.update(visible=False),
+                gr.update(visible=False),
+                f"❌ ไม่สามารถอ่านไฟล์ได้:\n{str(e)}")
def _csv_failure(message):
    """Return the 9 outputs of ``predict_csv`` for a failed/empty run."""
    return (pd.DataFrame(), go.Figure(), go.Figure(),
            gr.update(visible=False), gr.update(visible=False),
            pd.DataFrame(), gr.update(visible=False),
            message, None)


def predict_csv(file_obj, model_choice, text_col, date_col, shop_col,
                date_preset, freq, use_smooth, chart_type):
    """Classify every review in an uploaded CSV and build the result views.

    Args:
        file_obj: Uploaded file (object with ``.name`` or a path string), or
            ``None`` when nothing was uploaded.
        model_choice: Model name forwarded to ``_predict_batch``.
        text_col: Column holding the review text; re-detected when it is not
            a column of the file.
        date_col: Optional date column ("ไม่มี" or empty means none).
        shop_col: Optional shop/branch column ("ไม่มี" or empty means none).
        date_preset: Key of ``DATE_PRESETS`` limiting the time and shop views.
        freq: Bucket frequency for the time-based charts.
        use_smooth: Whether the time chart uses a rolling mean.
        chart_type: ``"pie"`` or ``"bar"`` for the overview chart.

    Returns:
        Nine values: result table, overview figure, time figure, an update
        for the time plot (visibility + figure), an update for the shop
        comparison plot, the per-shop summary table, an update for the shop
        trend plot, the Markdown summary, and the path of the CSV written
        for download (``None`` on failure).
    """
    if file_obj is None:
        return _csv_failure("❌ กรุณาอัปโหลดไฟล์ CSV")
    try:
        df_raw = pd.read_csv(getattr(file_obj, "name", file_obj))
        cols = list(df_raw.columns)

        # Fall back to auto-detection when the chosen text column is unknown.
        if text_col not in cols:
            text_col = detect_columns(df_raw)[0]

        # Normalise every row, remembering WHICH rows survive the filter so
        # that dates and shops can later be matched to the right prediction.
        normalised = [_norm_text(v) for v in df_raw[text_col].tolist()]
        kept_pos = [i for i, t in enumerate(normalised) if _is_substantive_text(t)]
        texts = [normalised[i] for i in kept_pos]
        if not texts:
            return _csv_failure("❌ ไม่พบข้อความที่สามารถวิเคราะห์ได้ในไฟล์")

        results = _predict_batch(texts, model_choice)
        df_out = pd.DataFrame(results)
        # Raw rows that correspond 1:1 (by position) to the rows of df_out.
        kept_raw = df_raw.iloc[kept_pos].reset_index(drop=True)

        # Overview chart
        fig_main, info = make_summary_chart(df_out, chart_type)

        # Parse the date column once; None means "no usable dates".
        dts = None
        if date_col and date_col in cols and date_col != "ไม่มี":
            parsed = _to_datetime_safe(kept_raw[date_col])
            if parsed.notna().any():
                dts = parsed

        # Time chart
        fig_time = go.Figure()
        show_time = False
        if dts is not None:
            df_time = df_out.copy()
            df_time["__dt__"] = dts
            df_time = df_time.dropna(subset=["__dt__"])
            df_time = apply_date_preset(df_time, "__dt__", date_preset)
            if len(df_time) > 0:
                fig_time = make_time_chart(df_time, "__dt__", freq, use_smooth)
                show_time = True

        # Per-shop analysis
        shop_summary_df = pd.DataFrame()
        fig_shop = go.Figure()
        fig_shop_trend = None
        show_shop = False
        if shop_col and shop_col in cols and shop_col != "ไม่มี":
            df_with_shop = df_out.copy()
            df_with_shop[shop_col] = kept_raw[shop_col]
            shop_date_col = None
            if dts is not None:
                df_with_shop["__dt__"] = dts
                df_with_shop = df_with_shop.dropna(subset=["__dt__"])
                df_with_shop = apply_date_preset(df_with_shop, "__dt__", date_preset)
                shop_date_col = "__dt__"
            # Skip the section (instead of failing the whole request) when
            # the date filter or missing shop values leave nothing to show.
            if len(df_with_shop) > 0 and df_with_shop[shop_col].notna().any():
                if shop_date_col is not None:
                    shop_summary_df, fig_shop, fig_shop_trend = make_shop_analysis(
                        df_with_shop, shop_col, shop_date_col, freq
                    )
                else:
                    shop_summary_df, fig_shop, _ = make_shop_analysis(df_with_shop, shop_col)
                show_shop = True

        # Write the predictions to a temp file for the download widget.
        fd, path = tempfile.mkstemp(suffix=".csv")
        os.close(fd)
        df_out.to_csv(path, index=False, encoding="utf-8-sig")

        return (df_out, fig_main, fig_time,
                gr.update(visible=show_time, value=fig_time),
                gr.update(visible=show_shop, value=fig_shop),
                shop_summary_df,
                gr.update(visible=show_shop and fig_shop_trend is not None, value=fig_shop_trend),
                info, path)
    except Exception:
        return _csv_failure(f"❌ เกิดข้อผิดพลาด:\n\n{traceback.format_exc()}")
 # ================= Gradio UI =================
# Builds the two-tab UI: free-text batch analysis and CSV upload analysis.
with gr.Blocks(title="Thai Sentiment Analysis", theme=gr.themes.Soft()) as demo:
    gr.Markdown("""
    # 🇹🇭 Thai Sentiment Analysis
    ### วิเคราะห์ความรู้สึกรีวิวภาษาไทย (เชิงบวก/เชิงลบ)
    """)
    model_radio = gr.Radio(
        choices=AVAILABLE_CHOICES,
        value=DEFAULT_MODEL,
        label="🤖 เลือกโมเดล",
        info="แนะนำ: WCB สำหรับความเร็ว, WCB_4Layer_BiLSTM สำหรับความแม่นยำ"
    )

    # =================== Tab 1: analyse several reviews ===================
    with gr.Tab("📝 วิเคราะห์หลายรีวิว"):
        gr.Markdown("""
        **วิธีใช้:** ป้อนรีวิวหลายรายการ (แต่ละบรรทัด = 1 รีวิว) แล้วกด "เริ่มวิเคราะห์"
        **ตัวอย่าง:**
        ```
        อาหารอร่อยมาก บริการดีค่ะ
        ของแพงไป รสชาติก็ธรรมดา
        บรรยากาศดี แต่รอนาน
        ```
        """)
        text_input = gr.Textbox(
            lines=10,
            label="📄 ข้อความรีวิว (บรรทัดละ 1 รีวิว)",
            placeholder="ป้อนรีวิวที่ต้องการวิเคราะห์...\nแต่ละบรรทัด = 1 รีวิว"
        )
        with gr.Row():
            chart_type_1 = gr.Radio(
                choices=["pie", "bar"],
                value="pie",
                label="📊 รูปแบบกราฟ",
                info="Pie = วงกลม, Bar = แท่ง"
            )
            predict_btn_1 = gr.Button("🚀 เริ่มวิเคราะห์", variant="primary", size="lg")
        result_df_1 = gr.Dataframe(label="📋 ผลการวิเคราะห์ทั้งหมด")
        with gr.Row():
            with gr.Column(scale=1):
                result_chart_1 = gr.Plot(label="📊 กราฟสรุป")
            with gr.Column(scale=1):
                result_info_1 = gr.Markdown()
        predict_btn_1.click(
            predict_many,
            [text_input, model_radio, chart_type_1],
            [result_df_1, result_chart_1, result_info_1]
        )

    # =================== Tab 2: CSV upload ===================
    with gr.Tab("📤 อัปโหลด CSV"):
        gr.Markdown("""
        **วิธีใช้:** อัปโหลดไฟล์ CSV ที่มีคอลัมน์รีวิว (และอาจมีวันที่/ร้านด้วย)
        **คอลัมน์ที่ต้องมี:**
        - ✅ คอลัมน์ข้อความรีวิว (เช่น "text", "review", "รีวิว")
        - ⭐ คอลัมน์วันที่ (optional - สำหรับวิเคราะห์แนวโน้ม)
        - ⭐ คอลัมน์ร้าน/สาขา (optional - สำหรับเปรียบเทียบร้าน)
        """)
        with gr.Row():
            file_input = gr.File(
                file_types=[".csv"],
                label="📁 อัปโหลดไฟล์ CSV"
            )
        detect_note = gr.Markdown("⬆️ อัปโหลดไฟล์เพื่อเริ่มต้น")
        with gr.Row():
            text_col_dd = gr.Dropdown(
                label="📝 คอลัมน์ข้อความรีวิว",
                info="เลือกคอลัมน์ที่มีเนื้อหารีวิว"
            )
            date_col_dd = gr.Dropdown(
                label="📅 คอลัมน์วันที่ (ถ้าไม่มีเว้นว่าง)",
                info="สำหรับวิเคราะห์แนวโน้มตามเวลา"
            )
            shop_col_dd = gr.Dropdown(
                label="🏪 คอลัมน์ร้าน/สาขา (ถ้าไม่มีเว้นว่าง)",
                info="สำหรับเปรียบเทียบแต่ละร้าน"
            )
        gr.Markdown("### ⚙️ ตั้งค่าการวิเคราะห์")
        with gr.Row():
            date_preset = gr.Radio(
                choices=list(DATE_PRESETS.keys()),
                value="ทั้งหมด",
                label="📆 ช่วงเวลาที่ต้องการวิเคราะห์",
                visible=False
            )
            freq = gr.Radio(
                choices=[("รายวัน", "D"), ("รายสัปดาห์", "W"), ("รายเดือน", "M")],
                value="D",
                label="📊 ความละเอียดของกราฟ",
                visible=False
            )
        with gr.Row():
            use_smooth = gr.Checkbox(
                value=True,
                label="✨ ปรับกราฟให้เรียบ (Moving Average)",
                info="ช่วยให้เห็นแนวโน้มชัดเจนขึ้น",
                visible=False
            )
            chart_type_2 = gr.Radio(
                choices=[("วงกลม", "pie"), ("แท่ง", "bar")],
                value="pie",
                label="📊 รูปแบบกราฟสรุป"
            )
        predict_btn_2 = gr.Button("🚀 เริ่มวิเคราะห์ CSV", variant="primary", size="lg")
        gr.Markdown("### 📊 ผลการวิเคราะห์")
        result_df_2 = gr.Dataframe(label="📋 ผลการวิเคราะห์ทั้งหมด")
        with gr.Row():
            with gr.Column(scale=1):
                result_chart_2 = gr.Plot(label="📊 กราฟสรุปภาพรวม")
            with gr.Column(scale=1):
                result_info_2 = gr.Markdown()
        result_time = gr.Plot(label="📈 กราฟแนวโน้มตามเวลา", visible=False)
        # The shop rows are constructed here, inside the results area, so
        # they render with the results rather than above the button.
        # Visibility of this heading row is driven by the file-change event.
        with gr.Row(visible=False) as shop_analysis_row:
            gr.Markdown("### 🏪 วิเคราะห์แยกตามร้าน/สาขา")
        shop_summary = gr.Dataframe(label="📊 สรุปแต่ละร้าน")
        result_shop = gr.Plot(label="🏪 เปรียบเทียบรีวิวแต่ละร้าน", visible=False)
        # This row stays visible: no event updates it, and the plot inside
        # already toggles its own visibility from predict_csv. A hidden row
        # would keep the trend plot hidden forever.
        with gr.Row() as shop_trend_row:
            result_shop_trend = gr.Plot(label="📈 แนวโน้ม % เชิงบวกแยกตามร้าน", visible=False)
        download_file = gr.File(label="💾 ดาวน์โหลดผลลัพธ์ (CSV)")

        # Event handlers
        file_input.change(
            on_file_change,
            [file_input],
            [text_col_dd, date_col_dd, shop_col_dd,
             date_preset, freq, use_smooth,
             shop_analysis_row, detect_note]
        )
        # result_time appears twice because predict_csv returns the time
        # figure and then a visibility+value update for the same plot.
        predict_btn_2.click(
            predict_csv,
            [file_input, model_radio, text_col_dd, date_col_dd, shop_col_dd,
             date_preset, freq, use_smooth, chart_type_2],
            [result_df_2, result_chart_2, result_time,
             result_time, result_shop,
             shop_summary, result_shop_trend,
             result_info_2, download_file]
        )

    gr.Markdown("""
    ---
    ### 💡 เกี่ยวกับโมเดล
    **WangchanBERTa Variants** - โมเดล BERT ภาษาไทยที่ได้รับการฝึกสำหรับงานวิเคราะห์ความรู้สึก
    - **WCB**: เร็ว เหมาะกับงานทั่วไป
    - **WCB_BiLSTM**: เพิ่มความแม่นยำด้วย BiLSTM
    - **WCB_CNN_BiLSTM**: ใช้ CNN + BiLSTM เพิ่มประสิทธิภาพ
    - **WCB_4Layer_BiLSTM**: แม่นยำสูงสุด แต่ช้ากว่า
    📌 **หมายเหตุ:** โมเดลวิเคราะห์เฉพาะ **เชิงบวก/เชิงลบ** เท่านั้น (ไม่มี neutral)
    """)

if __name__ == "__main__":
    demo.launch()