Spaces:

sharktide
/

lightning

Running

App Files Community

sharktide committed 22 days ago

Commit

792fbc3

verified ·

1 Parent(s): 5c28005

Update app.py

Browse files

Files changed (1) hide show

app.py +37 -31

app.py CHANGED Viewed

@@ -358,41 +358,47 @@ async def generate_text(
         if kw in prompt_text:
             score += 1
-    chosen_model = "meta-llama/llama-4-scout-17b-16e-instruct"
     provider = "groq"
-    if score > 10:
-        score = 10
-    if uses_tools:
-        if score >= 4:
-            chosen_model = "openai/gpt-oss-120b"
-        else:
-            chosen_model = "openai/gpt-oss-20b"
-        provider = "groq"
-    elif code_present:
-        if code_heavy and score >= 6:
-            chosen_model = "gpt-oss-120b"
-            provider = "cerebras"
-        elif score >= 4:
-            chosen_model = "llama-3.3-70b-versatile"
-            provider = "groq"
-    elif score >= 4:
         chosen_model = "meta-llama/llama-4-scout-17b-16e-instruct"
         provider = "groq"
-    if provider == "groq" and (
-        total_chars > MAX_GROQ_PROMPT_CHARS or total_bytes > MAX_GROQ_PROMPT_BYTES
-    ):
-        raise HTTPException(
-            status_code=413,
-            detail=(
-                f"Prompt exceeds Groq-safe size ({total_chars} chars, {total_bytes} bytes). "
-                f"Max Groq-safe size is {MAX_GROQ_PROMPT_CHARS} chars or {MAX_GROQ_PROMPT_BYTES} bytes."
-            ),
-        )
     await check_chat_rate_limit(request, authorization, x_client_id)

         if kw in prompt_text:
             score += 1
+    chosen_model = "llama-3.1-8b-instant"
     provider = "groq"
+    has_images = contains_images(messages)
+    if has_images:
         chosen_model = "meta-llama/llama-4-scout-17b-16e-instruct"
         provider = "groq"
+    else:
+        if score > 10:
+            score = 10
+        if uses_tools:
+            if score >= 4:
+                chosen_model = "openai/gpt-oss-120b"
+            else:
+                chosen_model = "openai/gpt-oss-20b"
+            provider = "groq"
+        elif code_present:
+            if code_heavy and score >= 6:
+                chosen_model = "gpt-oss-120b"
+                provider = "cerebras"
+            elif score >= 4:
+                chosen_model = "llama-3.3-70b-versatile"
+                provider = "groq"
+        elif score >= 4:
+            chosen_model = "meta-llama/llama-4-scout-17b-16e-instruct"
+            provider = "groq"
+        if provider == "groq" and (
+            total_chars > MAX_GROQ_PROMPT_CHARS or total_bytes > MAX_GROQ_PROMPT_BYTES
+        ):
+            raise HTTPException(
+                status_code=413,
+                detail=(
+                    f"Prompt exceeds Groq-safe size ({total_chars} chars, {total_bytes} bytes). "
+                    f"Max Groq-safe size is {MAX_GROQ_PROMPT_CHARS} chars or {MAX_GROQ_PROMPT_BYTES} bytes."
+                ),
+            )
     await check_chat_rate_limit(request, authorization, x_client_id)