Spaces:
Running
Running
Upload folder using huggingface_hub
Browse files- src/llm.py +5 -1
src/llm.py
CHANGED
|
@@ -8,12 +8,16 @@ WHY one call per query? Multi-step chains add latency and failure points.
|
|
| 8 |
|
| 9 |
import os
|
| 10 |
from groq import Groq
|
|
|
|
| 11 |
from tenacity import retry, stop_after_attempt, wait_exponential
|
| 12 |
from dotenv import load_dotenv
|
| 13 |
|
| 14 |
load_dotenv()
|
| 15 |
|
| 16 |
-
_client = Groq(
|
|
|
|
|
|
|
|
|
|
| 17 |
|
| 18 |
|
| 19 |
def call_llm_raw(messages: list) -> str:
|
|
|
|
| 8 |
|
| 9 |
import os
|
| 10 |
from groq import Groq
|
| 11 |
+
import httpx
|
| 12 |
from tenacity import retry, stop_after_attempt, wait_exponential
|
| 13 |
from dotenv import load_dotenv
|
| 14 |
|
| 15 |
load_dotenv()
|
| 16 |
|
| 17 |
+
_client = Groq(
|
| 18 |
+
api_key=os.getenv("GROQ_API_KEY"),
|
| 19 |
+
http_client=httpx.Client(verify=False, timeout=30.0)
|
| 20 |
+
)
|
| 21 |
|
| 22 |
|
| 23 |
def call_llm_raw(messages: list) -> str:
|