Spaces:

adikwok
/

api-deepseek

Sleeping

App Files Community

adikwok committed on Jun 4

Commit

c34e3ae

verified ·

1 Parent(s): bcd2917

Update app.py

Browse files

Files changed (1) hide show

app.py +43 -10

app.py CHANGED Viewed

@@ -12,8 +12,12 @@ API_KEY = os.getenv("GROQ_API_KEY")
 # In-memory chat history storage
 chat_history: List[Dict[str, str]] = []
 def groq_with_memory(message: str, topic: str = "general") -> tuple:
-    """Groq API call with chat history"""
     if not API_KEY:
         return "❌ No API Key found", ""
@@ -35,14 +39,30 @@ def groq_with_memory(message: str, topic: str = "general") -> tuple:
             "timestamp": datetime.now().strftime("%Y-%m-%d %H:%M")
         })
-        # Prepare messages for API call (last 50 messages for longer context)
-        recent_history = chat_history[-50:]
-        messages = [{"role": msg["role"], "content": msg["content"]} for msg in recent_history]
         payload = {
             "model": "gemma2-9b-it",
             "messages": messages,
-            "max_tokens": 3000,  # Increased for longer responses
             "temperature": 0.7
         }
@@ -266,15 +286,28 @@ with gr.Blocks(
         if not chat_history:
             return "❌ No conversation context yet"
-        recent_history = chat_history[-50:]  # Same as what AI sees
-        context_text = f"🧠 **Current AI Context** ({len(recent_history)} messages)\n\n"
-        for msg in recent_history:
             role_icon = "👤" if msg["role"] == "user" else "🤖"
             context_text += f"{role_icon} **{msg['timestamp']}** [{msg.get('topic', 'general')}]\n"
-            context_text += f"{msg['content'][:100]}{'...' if len(msg['content']) > 100 else ''}\n\n"
-        context_text += f"\n💡 *AI can remember these {len(recent_history)} messages in current conversation*"
         return context_text
     def refresh_topic_choices():

 # In-memory chat history storage
 chat_history: List[Dict[str, str]] = []
+def count_tokens_rough(text: str) -> int:
+    """Rough token estimation (1 token ≈ 4 chars)"""
+    return len(text) // 4
 def groq_with_memory(message: str, topic: str = "general") -> tuple:
+    """Groq API call with smart context management"""
     if not API_KEY:
         return "❌ No API Key found", ""
             "timestamp": datetime.now().strftime("%Y-%m-%d %H:%M")
         })
+        # Smart context management - keep within ~6000 tokens (24k chars)
+        messages = []
+        total_chars = 0
+        max_chars = 24000  # Safe limit for gemma2-9b-it
+        # Add messages from most recent, working backwards
+        for msg in reversed(chat_history):
+            msg_content = f"{msg['content']}"
+            msg_chars = len(msg_content)
+            if total_chars + msg_chars < max_chars:
+                messages.insert(0, {"role": msg["role"], "content": msg["content"]})
+                total_chars += msg_chars
+            else:
+                break
+        # Ensure we have at least the current message
+        if not messages:
+            messages = [{"role": "user", "content": message.strip()}]
         payload = {
             "model": "gemma2-9b-it",
             "messages": messages,
+            "max_tokens": 2000,  # Conservative for safety
             "temperature": 0.7
         }
         if not chat_history:
             return "❌ No conversation context yet"
+        # Show actual context that will be sent to AI
+        messages = []
+        total_chars = 0
+        max_chars = 24000
+        for msg in reversed(chat_history):
+            msg_chars = len(msg['content'])
+            if total_chars + msg_chars < max_chars:
+                messages.insert(0, msg)
+                total_chars += msg_chars
+            else:
+                break
+        context_text = f"🧠 **Current AI Context** ({len(messages)} messages, ~{total_chars:,} chars)\n\n"
+        for msg in messages:
             role_icon = "👤" if msg["role"] == "user" else "🤖"
             context_text += f"{role_icon} **{msg['timestamp']}** [{msg.get('topic', 'general')}]\n"
+            context_text += f"{msg['content'][:150]}{'...' if len(msg['content']) > 150 else ''}\n\n"
+        context_text += f"\n💡 *AI remembers {len(messages)} messages (~{total_chars:,} characters)*"
+        context_text += f"\n🔢 *Context limit: {max_chars:,} characters*"
         return context_text
     def refresh_topic_choices():