chat

Paused

ameliakris Claude Sonnet 4.6 committed 27 days ago

Commit

ffcd201

1 Parent(s): e38afe2

Replace model selection with specialized coding models

Updated to 4 specialized models:
- WhiteRabbitNeo 2.5 Qwen 2.5 Coder 7B: Advanced coding assistant with security focus
- Gemma 3 Prompt Coder 270m: Ultra-fast lightweight coding specialist
- DeepSeek V4 Pro: Advanced multimodal reasoning model
- Qwen 3.6 35B A3B Uncensored: Large model with aggressive reasoning

Each model has a custom system prompt optimized for its capabilities.

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>

Files changed (1) hide show

app.py +20 -48

app.py CHANGED Viewed

@@ -15,61 +15,33 @@ llm_model = None
 # Comprehensive model configurations
 MODELS = {
-    "Dolphin 3.0 R1 Mistral 24B": {
-        "filename": "cognitivecomputations_Dolphin3.0-R1-Mistral-24B-Q8_0.gguf",
-        "repo_id": "bartowski/cognitivecomputations_Dolphin3.0-R1-Mistral-24B-GGUF",
-        "system_prompt": "You are Dolphin, an AI assistant that helps humanity, trained to specialize in reasoning and first-principles analysis. When responding, always format your replies using {reasoning}{answer}. Use at least 6 reasoning steps and perform a root cause analysis before answering. However, if the answer is very easy and requires little thought, you may leave the {reasoning} block empty. Your responses should be detailed, structured with rich Markdown formatting, and engaging with emojis. Be extensive in your explanations, just as the greatest scientific minds would be. Always reason through the problem first, unless it's trivial, in which case you may answer directly.",
         "formatter": "CHATML",
-        "description": "Latest Dolphin with enhanced reasoning capabilities"
     },
-    "Dolphin 2.9.2 Qwen2 72B": {
-        "filename": "qwen2-Q3_K_M.gguf",
-        "repo_id": "cognitivecomputations/dolphin-2.9.2-qwen2-72b-gguf",
-        "system_prompt": "You are Dolphin, a helpful AI assistant trained to be helpful, harmless, and honest. You provide detailed, accurate responses with proper reasoning and analysis.",
         "formatter": "CHATML",
-        "description": "Large 72B parameter model for complex tasks"
     },
-    "Llama 3.1 8B Instruct": {
-        "filename": "Llama-3.1-8B-Instruct-Q5_K_M.gguf",
-        "repo_id": "mradermacher/Llama-3.1-8B-Instruct-GGUF",
-        "system_prompt": "You are a helpful, intelligent assistant. Provide accurate, thoughtful responses with clear reasoning.",
         "formatter": "CHATML",
-        "description": "Fast and efficient general purpose model"
     },
-    "Mistral 7B Instruct v0.3": {
-        "filename": "Mistral-7B-Instruct-v0.3-Q5_K_M.gguf",
-        "repo_id": "microsoft/Mistral-7B-Instruct-v0.3-GGUF",
-        "system_prompt": "You are a helpful AI assistant. Provide clear, accurate, and well-reasoned responses.",
         "formatter": "CHATML",
-        "description": "Balanced performance and speed"
-    },
-    "Phi-3 Medium 128K": {
-        "filename": "Phi-3-medium-128k-instruct-Q5_K_M.gguf",
-        "repo_id": "microsoft/Phi-3-medium-128k-instruct-GGUF",
-        "system_prompt": "You are a helpful AI assistant with extensive knowledge. Provide detailed, accurate responses.",
-        "formatter": "CHATML",
-        "description": "Long context window (128K tokens)"
-    },
-    "Gemma 2 9B IT": {
-        "filename": "gemma-2-9b-it-Q5_K_M.gguf",
-        "repo_id": "mradermacher/gemma-2-9b-it-GGUF",
-        "system_prompt": "You are a helpful, harmless, and honest AI assistant. Provide clear, well-reasoned responses.",
-        "formatter": "CHATML",
-        "description": "Google's efficient instruction-tuned model"
-    },
-    "Qwen2.5 7B Instruct": {
-        "filename": "Qwen2.5-7B-Instruct-Q5_K_M.gguf",
-        "repo_id": "mradermacher/Qwen2.5-7B-Instruct-GGUF",
-        "system_prompt": "You are a helpful AI assistant named Qwen, created by Alibaba Cloud. Provide accurate, thoughtful responses.",
-        "formatter": "CHATML",
-        "description": "Strong multilingual capabilities"
-    },
-    "Yi 1.5 34B": {
-        "filename": "dolphin-2.9.1-yi-1.5-34b-Q6_K.gguf",
-        "repo_id": "bartowski/dolphin-2.9.1-yi-1.5-34b-GGUF",
-        "system_prompt": "You are Dolphin, an AI assistant trained for reasoning and analysis. Provide detailed, well-reasoned responses.",
-        "formatter": "CHATML",
-        "description": "Strong reasoning with 34B parameters"
     }
 }

 # Comprehensive model configurations
 MODELS = {
+    "WhiteRabbitNeo 2.5 Qwen 2.5 Coder 7B": {
+        "filename": "WhiteRabbitNeo-2.5-Qwen-2.5-Coder-7B-OBLITERATED-i1-Q5_K_M.gguf",
+        "repo_id": "mradermacher/WhiteRabbitNeo-2.5-Qwen-2.5-Coder-7B-OBLITERATED-i1-GGUF",
+        "system_prompt": "You are WhiteRabbitNeo, an advanced AI coding assistant with deep expertise in software development, security analysis, and problem-solving. You provide detailed, accurate responses with proper code examples and thorough explanations.",
         "formatter": "CHATML",
+        "description": "Advanced coding assistant with security focus"
     },
+    "Gemma 3 Prompt Coder 270m": {
+        "filename": "Gemma-3-Prompt-Coder-270m-it-Uncensored-Q8_0.gguf",
+        "repo_id": "mradermacher/Gemma-3-Prompt-Coder-270m-it-Uncensored-GGUF",
+        "system_prompt": "You are Gemma 3 Prompt Coder, a lightweight but powerful AI assistant specialized in coding and technical tasks. Provide clear, accurate responses with well-formatted code examples.",
         "formatter": "CHATML",
+        "description": "Ultra-fast lightweight coding specialist"
     },
+    "DeepSeek V4 Pro": {
+        "filename": "DeepSeek-V4-Pro-Q5_K_M.gguf",
+        "repo_id": "unsloth/DeepSeek-V4-Pro-GGUF",
+        "system_prompt": "You are DeepSeek V4 Pro, an advanced AI assistant with extensive knowledge across multiple domains. Provide detailed, accurate, and well-reasoned responses with proper analysis and explanations.",
         "formatter": "CHATML",
+        "description": "Advanced multimodal reasoning model"
     },
+    "Qwen 3.6 35B A3B Uncensored": {
+        "filename": "Qwen3.6-35B-A3B-Uncensored-Q5_K_M.gguf",
+        "repo_id": "HauhauCS/Qwen3.6-35B-A3B-Uncensored-HauhauCS-Aggressive-GGUF",
+        "system_prompt": "You are Qwen 3.6, an advanced AI assistant with aggressive reasoning capabilities and extensive knowledge. Provide direct, detailed responses with thorough analysis and strong reasoning.",
         "formatter": "CHATML",
+        "description": "Large model with aggressive reasoning"
     }
 }