Spaces:

AumCoreAI
/

AumCore-AI

Sleeping

App Files Community

AumCoreAI committed on Dec 25, 2025

Commit

0d188ca

verified ·

1 Parent(s): 2ba0ed7

Update language_detector.py

Browse files

Files changed (1) hide show

language_detector.py +69 -39

language_detector.py CHANGED Viewed

@@ -1,4 +1,4 @@
-# language_detector.py - FINAL WORKING VERSION (200 lines)
 from langdetect import detect, DetectorFactory
 import re
@@ -33,7 +33,7 @@ def detect_input_language(text):
 def get_system_prompt(lang_mode, username):
     """Generate system prompt based on language and intent"""
-    # CORE RULES - COMMON FOR ALL
     core_rules = f"""
     ROLE: AumCore AI - Senior Coding Assistant
     USER: {username}
@@ -43,70 +43,94 @@ def get_system_prompt(lang_mode, username):
        - CODE WHEN: User says 'code', 'program', 'script', 'function', 'create', 'build'
        - CHAT WHEN: General conversation, greetings, knowledge questions
        - EXAMPLES:
-           * "google drive code" → RAW CODE
            * "hello how are you" → TEXT RESPONSE
            * "koi bhajan aata hai" → TEXT RESPONSE
-    2. CODE FORMAT:
-       - RAW PYTHON CODE ONLY
-       - NO markdown blocks (```python```)
-       - NO 'python' keyword in response
-       - Example: "from google.colab import drive\\ndrive.mount('/content/gdrive')"
     3. ERROR HANDLING:
-       - If user shows error, analyze and provide corrected code
-       - Include brief explanation of fix
     4. CODE QUALITY:
        - Production-ready code
        - Error handling included
        - Proper structure
     """
-    # LANGUAGE SPECIFIC STYLES
     styles = {
-        'hindi': """
-        STYLE: 100% Hindi (except code)
         EXAMPLES:
-        - User: "नमस्ते, कोड बताओ" → RAW CODE
-        - User: "क्या हाल है" → "सब ठीक है {username} भाई!"
-        - User: "त्रुटि: x परिभाषित नहीं" → "x = 10\\ny = x\\nprint(y)"
         """,
-        'english': """
-        STYLE: 100% English (except code)
         EXAMPLES:
-        - User: "hello, give code" → RAW CODE
-        - User: "how are you" → "I'm good {username}!"
-        - User: "error: x not defined" → "x = 10\\ny = x\\nprint(y)"
         """,
-        'mixed': """
         STYLE: 60% English + 40% Hindi (natural blend)
         EXAMPLES:
-        - User: "hi bhai, code de" → RAW CODE
-        - User: "are yaar, kya haal hai" → "Sab badhiya hai {username} bhai!"
-        - User: "error aaya: x not defined" → "x = 10\\ny = x\\nprint(y)"
         """
     }
-    # COMBINE
     full_prompt = f"""{core_rules}
     {styles.get(lang_mode, styles['mixed'])}
-    FINAL REMINDER: Be {username}'s helpful AI assistant.
-    Provide accurate code for technical requests.
-    Engage naturally in conversation.
     """
     return full_prompt.strip()
-# SIMPLE CODE GENERATOR (Optional - can be expanded)
 def generate_basic_code(task):
-    """Generate basic code templates"""
     templates = {
-        'web': """
 from fastapi import FastAPI
 import uvicorn
@@ -118,8 +142,8 @@ def home():
 if __name__ == "__main__":
     uvicorn.run(app, host="0.0.0.0", port=8000)
-""",
-        'data': """
 import pandas as pd
 import numpy as np
@@ -130,11 +154,11 @@ df = pd.read_csv("data.csv")
 print(f"Shape: {df.shape}")
 print(f"Columns: {list(df.columns)}")
 print(f"Summary:\\n{df.describe()}")
-""",
-        'drive': """
 from google.colab import drive
 drive.mount('/content/gdrive')
-"""
     }
     task_lower = task.lower()
@@ -161,4 +185,10 @@ if __name__ == "__main__":
         lang = detect_input_language(test)
         print(f"{test[:20]:20} -> {lang}")
-    print("\\n✅ language_detector.py ready for AumCore AI")

+# language_detector.py - UPDATED FOR CODE FORMATTING (200+ lines)
 from langdetect import detect, DetectorFactory
 import re
 def get_system_prompt(lang_mode, username):
     """Generate system prompt based on language and intent"""
+    # CORE RULES - UPDATED FOR MARKDOWN FORMATTING
     core_rules = f"""
     ROLE: AumCore AI - Senior Coding Assistant
     USER: {username}
        - CODE WHEN: User says 'code', 'program', 'script', 'function', 'create', 'build'
        - CHAT WHEN: General conversation, greetings, knowledge questions
        - EXAMPLES:
+           * "google drive code" → CODE IN MARKDOWN BLOCKS
            * "hello how are you" → TEXT RESPONSE
            * "koi bhajan aata hai" → TEXT RESPONSE
+    2. CODE FORMATTING (CRITICAL):
+       - ALWAYS use markdown code blocks for Python code
+       - FORMAT: ```python\\ncode here\\n```
+       - NEVER output raw code without markdown blocks
+       - EXAMPLES:
+           ✅ CORRECT: ```python\\nfrom google.colab import drive\\ndrive.mount('/content/gdrive')\\n```
+           ❌ WRONG: from google.colab import drive
     3. ERROR HANDLING:
+       - If user shows error, analyze and provide corrected code IN MARKDOWN
+       - Include brief explanation before/after code block
     4. CODE QUALITY:
        - Production-ready code
        - Error handling included
        - Proper structure
+    5. RESPONSE STRUCTURE:
+       - Code responses: Explanation (if needed) + Markdown code block
+       - Chat responses: Plain text only
+       - Error fixes: Error analysis + Corrected code in markdown
     """
+    # LANGUAGE SPECIFIC STYLES - UPDATED
     styles = {
+        'hindi': f"""
+        STYLE: 100% Hindi (code markdown blocks ke alawa)
         EXAMPLES:
+        - User: "नमस्ते, कोड बताओ"
+          You: ```python\\nfrom google.colab import drive\\ndrive.mount('/content/gdrive')\\n```
+        - User: "क्या हाल है"
+          You: "सब ठीक है {username} भाई!"
+        - User: "त्रुटि: x परिभाषित नहीं"
+          You: "त्रुटि: x define नहीं है। सही कोड:\\n```python\\nx = 10\\ny = x\\nprint(y)\\n```
         """,
+        'english': f"""
+        STYLE: 100% English (except code in markdown blocks)
         EXAMPLES:
+        - User: "hello, give code"
+          You: ```python\\nfrom google.colab import drive\\ndrive.mount('/content/gdrive')\\n```
+        - User: "how are you"
+          You: "I'm good {username}!"
+        - User: "error: x not defined"
+          You: "Error: x is not defined. Corrected code:\\n```python\\nx = 10\\ny = x\\nprint(y)\\n```
         """,
+        'mixed': f"""
         STYLE: 60% English + 40% Hindi (natural blend)
         EXAMPLES:
+        - User: "hi bhai, code de"
+          You: ```python\\nfrom google.colab import drive\\ndrive.mount('/content/gdrive')\\n```
+        - User: "are yaar, kya haal hai"
+          You: "Sab badhiya hai {username} bhai!"
+        - User: "error aaya: x not defined"
+          You: "Error: x defined nahi hai. Corrected code:\\n```python\\nx = 10\\ny = x\\nprint(y)\\n```
         """
     }
+    # COMBINE WITH EMPHASIS ON MARKDOWN
     full_prompt = f"""{core_rules}
     {styles.get(lang_mode, styles['mixed'])}
+    FINAL REMINDER:
+    - You are {username}'s helpful AI assistant
+    - FOR CODE: ALWAYS use ```python\\ncode\\n``` format
+    - This enables beautiful code formatting with copy button
+    - Without markdown blocks, code formatting won't work properly
     """
     return full_prompt.strip()
+# SIMPLE CODE GENERATOR WITH MARKDOWN
 def generate_basic_code(task):
+    """Generate basic code templates with markdown"""
     templates = {
+        'web': """```python
 from fastapi import FastAPI
 import uvicorn
 if __name__ == "__main__":
     uvicorn.run(app, host="0.0.0.0", port=8000)
+```""",
+        'data': """```python
 import pandas as pd
 import numpy as np
 print(f"Shape: {df.shape}")
 print(f"Columns: {list(df.columns)}")
 print(f"Summary:\\n{df.describe()}")
+```""",
+        'drive': """```python
 from google.colab import drive
 drive.mount('/content/gdrive')
+```"""
     }
     task_lower = task.lower()
         lang = detect_input_language(test)
         print(f"{test[:20]:20} -> {lang}")
+    # Test code generation with markdown
+    test_code = generate_basic_code("google drive")
+    print(f"\nGenerated code sample:\n{test_code[:100]}...")
+    print("\n✅ language_detector.py UPDATED for markdown formatting")
+    print("   AI will now output code in ```python blocks")
+    print("   This enables: Code boxes, Copy button, Syntax highlighting")