dwmk committed on
Commit
1b8b8df
·
verified ·
1 Parent(s): 5d76435

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +280 -100
app.py CHANGED
@@ -5,169 +5,349 @@ import torch
5
  import torch.nn as nn
6
  import torch.nn.functional as F
7
  from sklearn.feature_extraction.text import TfidfVectorizer
8
- from sklearn.ensemble import RandomForestClassifier
 
 
 
9
  from sklearn.preprocessing import LabelEncoder
10
  import kagglehub
11
- import time
12
- import random
13
 
14
- # --- 1. ARCHITECTURE (Core logic from social_messages_benchmarks_ft_distil.py) ---
 
 
 
15
 
16
  class EpisodicMemory:
17
- """Mimics Hippocampal retention and retrieval"""
18
  def __init__(self, capacity=2000):
19
- self.memory_x, self.memory_y = [], []
 
20
  self.capacity = capacity
21
-
22
  def store(self, x, y):
23
- curr_x, curr_y = x.detach().cpu(), y.detach().cpu()
 
 
24
  for i in range(curr_x.size(0)):
25
  if len(self.memory_x) >= self.capacity:
26
- self.memory_x.pop(0); self.memory_y.pop(0)
27
- self.memory_x.append(curr_x[i]); self.memory_y.append(curr_y[i])
28
-
 
 
29
  def retrieve(self, query_x, k=5):
30
- if not self.memory_x: return None
 
31
  mem_tensor = torch.stack(self.memory_x).to(query_x.device)
32
  distances = torch.cdist(query_x, mem_tensor)
33
  top_k_indices = torch.topk(distances, k, largest=False).indices
34
- return torch.stack([torch.stack([self.memory_y[idx] for idx in s_idx]) for s_idx in top_k_indices]).to(query_x.device)
 
 
 
 
35
 
36
  class H3MOS(nn.Module):
37
- """The H3MOS architecture using Executive Core and Hippocampus"""
38
  def __init__(self, input_dim, hidden_dim, output_dim):
39
  super().__init__()
 
40
  self.executive = nn.Sequential(
41
- nn.Linear(input_dim, hidden_dim),
42
- nn.LayerNorm(hidden_dim),
 
 
 
43
  nn.GELU()
44
  )
 
45
  self.motor = nn.Linear(hidden_dim, output_dim)
46
- self.hippocampus = EpisodicMemory()
47
-
 
48
  def forward(self, x, training_mode=False):
49
  z = self.executive(x)
50
  raw_logits = self.motor(z)
51
- if training_mode: return raw_logits
 
 
 
 
 
52
  past_labels = self.hippocampus.retrieve(x, k=5)
53
- if past_labels is None: return raw_logits
 
 
54
  mem_votes = torch.zeros_like(raw_logits)
55
  for i in range(x.size(0)):
56
  votes = torch.bincount(past_labels[i], minlength=raw_logits.size(1)).float()
57
  mem_votes[i] = votes
58
- return (0.8 * raw_logits) + (0.2 * F.softmax(mem_votes, dim=1) * 5.0)
59
 
60
- # --- 2. DATA LOAD & TRAINING ---
 
 
 
 
 
61
 
62
  device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
63
- print(f"Initializing models on {device}...")
64
 
65
- path = kagglehub.dataset_download('dewanmukto/social-messages-and-emoji-reactions')
66
- df = pd.read_csv(path+"/messages_emojis.csv").dropna(subset=['content'])
 
 
 
 
 
 
67
 
68
- # Sentiment/Intent Mappings from benchmark
69
  sent_map = {'❤️':'Pos', '👍':'Pos', '😂':'Pos', '💯':'Pos', '😢':'Neg', '😭':'Neg', '😮':'Neu'}
70
  intent_map = {'❤️':'Emotion', '👍':'Agreement', '😂':'Emotion', '😮':'Surprise'}
71
 
72
- tfidf = TfidfVectorizer(max_features=500, stop_words='english')
 
73
  X_sparse = tfidf.fit_transform(df['content'])
74
  X_dense = torch.FloatTensor(X_sparse.toarray()).to(device)
75
 
76
- model_zoo = {}
 
 
 
77
  encoders = {}
78
 
79
- for task in ['emoji', 'sentiment', 'intent']:
80
- y_labels = df['emoji'].values if task == 'emoji' else df['emoji'].apply(lambda x: sent_map.get(x, 'Neutral') if task == 'sentiment' else intent_map.get(x, 'Other')).values
 
 
 
 
 
 
 
 
 
81
  le = LabelEncoder()
82
- y_enc = torch.LongTensor(le.fit_transform(y_labels)).to(device)
83
  encoders[task] = le
84
 
85
- h3 = H3MOS(X_dense.shape[1], 64, len(le.classes_)).to(device)
86
- opt = torch.optim.Adam(h3.parameters(), lr=0.01)
87
- for _ in range(20):
88
- opt.zero_grad(); F.cross_entropy(h3(X_dense, True), y_enc).backward(); opt.step()
 
 
89
 
90
- rf = RandomForestClassifier(n_estimators=20).fit(X_sparse, y_labels)
91
- model_zoo[task] = {"DISTIL-H3MOS": h3, "RandomForest": rf}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
92
 
93
- # --- 3. UI LOGIC ---
 
 
 
 
 
94
 
95
- CSS = """
96
- .reaction-btn {
97
- background: #f0f2f5; border: 1px solid #ddd; border-radius: 15px;
98
- padding: 2px 8px; font-size: 14px; cursor: pointer; margin-top: 5px;
99
- }
100
- .bot-header { display: flex; align-items: center; margin-bottom: 5px; }
101
- .bot-avatar { width: 28px; height: 28px; border-radius: 50%; margin-right: 8px; border: 1px solid #eee; }
102
- .bot-name { font-weight: bold; font-size: 0.9em; color: #555; }
103
- """
104
 
105
- def get_avatar_url(name):
106
- return f"https://api.dicebear.com/7.x/adventurer/svg?seed={name}"
107
 
108
- def predict(text):
 
109
  vec_s = tfidf.transform([text])
110
  vec_t = torch.FloatTensor(vec_s.toarray()).to(device)
111
- res = {}
112
- for task in ['emoji', 'sentiment', 'intent']:
113
- with torch.no_grad():
114
- h3_idx = torch.argmax(model_zoo[task]["DISTIL-H3MOS"](vec_t)).item()
115
- h3_p = encoders[task].inverse_transform([h3_idx])[0]
116
- rf_p = model_zoo[task]["RandomForest"].predict(vec_s)[0]
117
- res[task] = {"DISTIL-H3MOS": h3_p, "RandomForest": rf_p}
118
- return res
119
-
120
- def chat_interface(message, history):
121
- if not message:
122
- yield "", history
123
- return
124
 
125
- preds = predict(message)
126
 
127
- # Emoji Reaction Logic
128
- h3_emoji = preds['emoji']['DISTIL-H3MOS']
129
- rf_emoji = preds['emoji']['RandomForest']
130
- details = f"DISTIL-H3MOS: {h3_emoji} | RandomForest: {rf_emoji}"
131
- reaction_html = f"<button class='reaction-btn' title='{details}'>{h3_emoji} 🤖</button>"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
132
 
133
- # 1. Add User Message and CLEAR textbox by yielding (" ", history)
134
- history.append({"role": "user", "content": f"{message}<br>{reaction_html}"})
135
- yield "", history
 
 
 
 
136
 
137
- # 2. Simulate Group Members
138
- bots = ["DISTIL-H3MOS", "RandomForest"]
139
- random.shuffle(bots)
140
 
141
- for bot in bots:
142
- time.sleep(random.uniform(0.6, 1.2))
143
- sent = preds['sentiment'][bot]
144
- intent = preds['intent'][bot]
145
- avatar = get_avatar_url(bot)
146
 
147
- bot_content = f"""
148
- <div class="bot-header">
149
- <img src="{avatar}" class="bot-avatar">
150
- <span class="bot-name">{bot}</span>
151
- </div>
152
- <div style="padding-left: 36px;">
153
- <b>Sentiment:</b> {sent}<br>
154
- <b>Intent:</b> {intent}
 
 
 
 
155
  </div>
156
  """
157
- history.append({"role": "assistant", "content": bot_content})
158
- # Always yield a value for both [textbox, chatbot]
159
- yield "", history
 
 
160
 
161
- with gr.Blocks() as demo:
162
- gr.Markdown("### 📱 Model Group Chat")
163
- chatbot = gr.Chatbot(elem_id="chat-window", avatar_images=(get_avatar_url("User"), None), height=500)
 
 
 
 
 
 
 
 
 
 
164
 
165
  with gr.Row():
166
- txt = gr.Textbox(placeholder="Type a message...", show_label=False, scale=4)
167
- btn = gr.Button("Send", variant="primary")
 
 
 
 
 
168
 
169
- # The fix: Ensure inputs/outputs match the yield count
170
- txt.submit(chat_interface, [txt, chatbot], [txt, chatbot])
171
- btn.click(chat_interface, [txt, chatbot], [txt, chatbot])
172
 
173
- demo.launch(css=CSS)
 
 
5
  import torch.nn as nn
6
  import torch.nn.functional as F
7
  from sklearn.feature_extraction.text import TfidfVectorizer
8
+ from sklearn.ensemble import RandomForestClassifier, GradientBoostingClassifier
9
+ from sklearn.svm import SVC
10
+ from sklearn.naive_bayes import MultinomialNB
11
+ from sklearn.linear_model import LogisticRegression
12
  from sklearn.preprocessing import LabelEncoder
13
  import kagglehub
14
+ import warnings
 
15
 
16
+ # Suppress sklearn warnings for cleaner logs
17
+ warnings.filterwarnings("ignore")
18
+
19
+ # --- 1. ARCHITECTURE: H3MOS (Hippocampal Memory & Executive Core) ---
20
 
21
class EpisodicMemory:
    """Mimics hippocampal retention and retrieval of recent experiences.

    Stores up to ``capacity`` (feature, label) tensor pairs on the CPU and
    retrieves, for each query row, the labels of its k nearest neighbours.
    """

    def __init__(self, capacity=2000):
        self.memory_x = []  # stored feature vectors (CPU tensors)
        self.memory_y = []  # stored labels, aligned index-for-index with memory_x
        self.capacity = capacity

    def store(self, x, y):
        """Append a batch of (x, y) pairs, evicting the oldest when full."""
        # Detach and move to CPU to save GPU VRAM.
        curr_x = x.detach().cpu()
        curr_y = y.detach().cpu()
        for i in range(curr_x.size(0)):
            if len(self.memory_x) >= self.capacity:
                # FIFO eviction of the oldest entry.
                self.memory_x.pop(0)
                self.memory_y.pop(0)
            self.memory_x.append(curr_x[i])
            self.memory_y.append(curr_y[i])

    def retrieve(self, query_x, k=5):
        """Return a (batch, k) tensor of the k nearest stored labels per query
        row, or None when the memory is empty."""
        if not self.memory_x:
            return None
        mem_tensor = torch.stack(self.memory_x).to(query_x.device)
        # Fix: clamp k — torch.topk raises if k exceeds the number of stored
        # items, which happens while the memory is still warming up.
        k = min(k, mem_tensor.size(0))
        distances = torch.cdist(query_x, mem_tensor)
        top_k_indices = torch.topk(distances, k, largest=False).indices
        # Gather the labels of the selected neighbours, one row per query.
        retrieved_y = [torch.stack([self.memory_y[idx] for idx in sample_indices])
                       for sample_indices in top_k_indices]
        return torch.stack(retrieved_y).to(query_x.device)
50
 
51
class H3MOS(nn.Module):
    """H3MOS: a small MLP "executive core" whose logits are blended with
    label votes retrieved from an episodic (hippocampal) memory.

    forward(x, training_mode=False) returns raw logits during training or
    while memory is sparse; otherwise a gated mix of logits and memory votes.
    """

    def __init__(self, input_dim, hidden_dim, output_dim):
        super().__init__()
        # Executive Core: 2-layer MLP with LayerNorm / GELU / Dropout.
        self.executive = nn.Sequential(
            nn.Linear(input_dim, hidden_dim),
            nn.LayerNorm(hidden_dim),
            nn.GELU(),
            nn.Dropout(0.2),
            nn.Linear(hidden_dim, hidden_dim),
            nn.GELU(),
        )
        # Motor Policy (classification head).
        self.motor = nn.Linear(hidden_dim, output_dim)
        # Hippocampus: episodic recall of past (x, y) pairs.
        self.hippocampus = EpisodicMemory(capacity=2000)

    def forward(self, x, training_mode=False):
        z = self.executive(x)
        raw_logits = self.motor(z)

        # Fast path: during training, or while memory is still nearly empty.
        if training_mode or len(self.hippocampus.memory_x) < 10:
            return raw_logits

        # Memory retrieval & integration: the k nearest stored labels vote.
        past_labels = self.hippocampus.retrieve(x, k=5)
        if past_labels is None:
            return raw_logits

        mem_votes = torch.zeros_like(raw_logits)
        for i in range(x.size(0)):
            votes = torch.bincount(past_labels[i], minlength=raw_logits.size(1)).float()
            mem_votes[i] = votes

        mem_probs = F.softmax(mem_votes, dim=1)

        # Fixed gating: 80% neural logits, 20% (scaled) memory distribution.
        return (0.8 * raw_logits) + (0.2 * mem_probs * 5.0)
90
+
91
# --- 2. DATA SETUP & TRAINING PIPELINE ---
# Downloads the dataset, vectorizes the messages, and trains one model zoo
# (1 PyTorch H3MOS + 5 sklearn baselines) per prediction task.

device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
print(f"🚀 Initializing System on {device}...")

# Load Data
try:
    path = kagglehub.dataset_download('dewanmukto/social-messages-and-emoji-reactions')
    df = pd.read_csv(path + "/messages_emojis.csv").dropna(subset=['content'])
except Exception as e:
    print("Error loading data:", e)
    # Fallback dummy data if kaggle fails (for testing).
    # Fix: two rows / two classes — sklearn estimators (e.g. SVC) refuse to
    # fit a single-class target, so a one-row fallback would crash training.
    df = pd.DataFrame({'content': ['great job', 'so sad'], 'emoji': ['👍', '😢']})

# Emoji -> sentiment / intent mappings
sent_map = {'❤️': 'Pos', '👍': 'Pos', '😂': 'Pos', '💯': 'Pos', '😢': 'Neg', '😭': 'Neg', '😮': 'Neu'}
intent_map = {'❤️': 'Emotion', '👍': 'Agreement', '😂': 'Emotion', '😮': 'Surprise'}

# Vectorization
tfidf = TfidfVectorizer(max_features=600, stop_words='english')
X_sparse = tfidf.fit_transform(df['content'])
X_dense = torch.FloatTensor(X_sparse.toarray()).to(device)

# Model Zoo Containers
tasks = ['emoji', 'sentiment', 'intent']
model_names = ['DISTIL', 'RandomForest', 'SVM', 'NaiveBayes', 'LogReg', 'GradBoost']
zoo = {task: {} for task in tasks}
encoders = {}  # task -> fitted LabelEncoder

print("🧠 Training Models... (This may take a moment)")

for task in tasks:
    # Prepare labels for this task.
    if task == 'emoji':
        raw_y = df['emoji'].values
    elif task == 'sentiment':
        # Fix: default to 'Neu' (not 'Neutral') so unmapped emojis share the
        # same neutral class as 😮 instead of creating a duplicate class.
        raw_y = df['emoji'].apply(lambda x: sent_map.get(x, 'Neu')).values
    else:
        raw_y = df['emoji'].apply(lambda x: intent_map.get(x, 'Other')).values

    le = LabelEncoder()
    y_nums = le.fit_transform(raw_y)
    encoders[task] = le

    # 1. Train DISTIL-H3MOS (PyTorch).
    y_tensor = torch.LongTensor(y_nums).to(device)
    output_dim = len(le.classes_)

    model = H3MOS(X_dense.shape[1], 64, output_dim).to(device)
    optimizer = torch.optim.AdamW(model.parameters(), lr=0.01)

    model.train()
    # Short training loop for demo speed.
    for epoch in range(25):
        optimizer.zero_grad()
        out = model(X_dense, training_mode=True)
        loss = F.cross_entropy(out, y_tensor)
        loss.backward()
        optimizer.step()
        # Populate the episodic memory with a random sample every few epochs.
        if epoch % 5 == 0:
            with torch.no_grad():
                idx = torch.randperm(X_dense.size(0))[:50]
                model.hippocampus.store(X_dense[idx], y_tensor[idx])

    model.eval()
    zoo[task]['DISTIL'] = model

    # 2. Train the sklearn baselines on the same encoded labels.
    zoo[task]['RandomForest'] = RandomForestClassifier(n_estimators=50).fit(X_sparse, y_nums)
    zoo[task]['SVM'] = SVC(kernel='linear').fit(X_sparse, y_nums)
    zoo[task]['NaiveBayes'] = MultinomialNB().fit(X_sparse, y_nums)
    zoo[task]['LogReg'] = LogisticRegression(max_iter=500).fit(X_sparse, y_nums)
    zoo[task]['GradBoost'] = GradientBoostingClassifier(n_estimators=30).fit(X_sparse, y_nums)

print("✅ Training Complete.")
 
 
 
 
 
 
 
 
167
 
168
# --- 3. INFERENCE LOGIC ---

def get_predictions(text):
    """Run every model in the zoo on *text*.

    Returns a dict keyed by model name, each value mapping task -> predicted
    label, e.g. results['DISTIL']['sentiment'] == 'Pos'.
    """
    vec_s = tfidf.transform([text])
    vec_t = torch.FloatTensor(vec_s.toarray()).to(device)

    results = {name: {} for name in model_names}

    for task in tasks:
        le = encoders[task]
        for name in model_names:
            if name == 'DISTIL':
                # PyTorch path: argmax over (memory-augmented) logits.
                with torch.no_grad():
                    logits = zoo[task][name](vec_t)
                pred_idx = torch.argmax(logits, dim=1).item()
            else:
                # sklearn path: predict() already returns the encoded class.
                pred_idx = zoo[task][name].predict(vec_s)[0]
            # Decode once for both branches (the decode line was duplicated).
            results[name][task] = le.inverse_transform([pred_idx])[0]

    return results
193
+
194
# --- 4. UI STYLING & INTERFACE ---

def get_avatar_url(seed):
    """Return a DiceBear 'bottts' avatar URL seeded with the given string."""
    base = "https://api.dicebear.com/7.x/bottts/svg"
    return f"{base}?seed={seed}&backgroundColor=transparent"
198
+
199
+ CSS = """
200
+ .chat-window { font-family: 'Segoe UI', sans-serif; }
201
+
202
+ /* User Message Styling */
203
+ .user-reactions {
204
+ margin-top: 8px;
205
+ padding-top: 6px;
206
+ border-top: 1px solid rgba(255,255,255,0.3);
207
+ font-size: 1.2em;
208
+ letter-spacing: 4px;
209
+ text-align: right;
210
+ opacity: 0.9;
211
+ }
212
+
213
+ /* Bot Reply Container */
214
+ .model-scroll-container {
215
+ display: flex;
216
+ gap: 12px;
217
+ overflow-x: auto;
218
+ padding: 10px 4px;
219
+ scrollbar-width: thin;
220
+ }
221
+
222
+ .model-card {
223
+ background: white;
224
+ min-width: 140px;
225
+ border-radius: 12px;
226
+ padding: 12px;
227
+ box-shadow: 0 4px 12px rgba(0,0,0,0.08);
228
+ display: flex;
229
+ flex-direction: column;
230
+ align-items: center;
231
+ border: 1px solid #eee;
232
+ transition: transform 0.2s;
233
+ }
234
+ .model-card:hover { transform: translateY(-3px); }
235
+
236
+ .card-avatar {
237
+ width: 45px;
238
+ height: 45px;
239
+ border-radius: 50%;
240
+ margin-bottom: 8px;
241
+ border: 2px solid #f0f2f5;
242
+ background: #f9f9f9;
243
+ }
244
+
245
+ .card-name {
246
+ font-size: 11px;
247
+ font-weight: 700;
248
+ text-transform: uppercase;
249
+ color: #888;
250
+ margin-bottom: 4px;
251
+ }
252
+
253
+ .card-emoji {
254
+ font-size: 28px;
255
+ margin: 4px 0;
256
+ }
257
+
258
+ .card-badge {
259
+ font-size: 10px;
260
+ padding: 2px 8px;
261
+ border-radius: 10px;
262
+ margin-top: 4px;
263
+ font-weight: 600;
264
+ }
265
+
266
+ .bg-Pos { background-color: #e6fffa; color: #2c7a7b; }
267
+ .bg-Neg { background-color: #fff5f5; color: #c53030; }
268
+ .bg-Neu { background-color: #f7fafc; color: #4a5568; }
269
+
270
+ .intent-row {
271
+ font-size: 10px;
272
+ color: #666;
273
+ margin-top: 6px;
274
+ border-top: 1px dashed #eee;
275
+ padding-top: 4px;
276
+ width: 100%;
277
+ text-align: center;
278
+ }
279
+ """
280
+
281
def chat_logic(message, history):
    """Append one user turn plus a combined model-reply card row to *history*.

    Returns ("", history) so the bound Textbox is cleared after each send.
    """
    if not message:
        return "", history

    # Security fix: escape user-controlled text before interpolating it into
    # raw HTML — the Chatbot is configured with render_markdown=False, so
    # content is rendered as HTML and unescaped input allows HTML injection.
    import html
    safe_message = html.escape(message)

    preds = get_predictions(message)

    # 1. User message HTML with an emoji "reaction bar".
    # Order: DISTIL, RF, SVM, NB, LR, GB
    reaction_string = "".join([preds[m]['emoji'] for m in model_names])

    user_html = f"""
    <div>
      {safe_message}
      <div class="user-reactions" title="Consensus: {reaction_string}">{reaction_string}</div>
    </div>
    """
    history.append({"role": "user", "content": user_html})

    # 2. Single bot reply: one horizontally scrolling card per model.
    cards_html = '<div class="model-scroll-container">'

    for name in model_names:
        p = preds[name]

        # Color coding for sentiment
        sent_cls = "bg-Neu"
        if "Pos" in p['sentiment']:
            sent_cls = "bg-Pos"
        elif "Neg" in p['sentiment']:
            sent_cls = "bg-Neg"

        cards_html += f"""
        <div class="model-card">
          <img src="{get_avatar_url(name)}" class="card-avatar">
          <div class="card-name">{name}</div>
          <div class="card-emoji">{p['emoji']}</div>
          <div class="card-badge {sent_cls}">{p['sentiment']}</div>
          <div class="intent-row">{p['intent']}</div>
        </div>
        """
    cards_html += "</div>"

    history.append({"role": "assistant", "content": cards_html})

    return "", history
324
 
325
# --- 5. LAUNCH APP ---

with gr.Blocks(css=CSS, title="Social Benchmarks AI") as demo:
    gr.Markdown("### 🤖 Multi-Model Social Benchmarks")
    gr.Markdown("Type a message to see how 6 different AI architectures interpret it.")

    chatbot = gr.Chatbot(
        elem_id="chat-window",
        type="messages",  # openai-style {"role": ..., "content": ...} dicts
        avatar_images=(None, "https://api.dicebear.com/7.x/bottts/svg?seed=Admin"),
        height=600,
        render_markdown=False,  # Important: chat content is raw custom HTML
    )

    with gr.Row():
        txt = gr.Textbox(
            placeholder="Type a social message (e.g., 'I cant believe you did that!')",
            scale=4,
            show_label=False,
            container=False,
        )
        btn = gr.Button("Analyze", variant="primary", scale=1)

    # Event bindings: Enter in the textbox and the button run the same
    # handler, which returns (cleared_textbox_value, updated_history).
    txt.submit(chat_logic, [txt, chatbot], [txt, chatbot])
    btn.click(chat_logic, [txt, chatbot], [txt, chatbot])

if __name__ == "__main__":
    demo.launch()