Fixed streaming for ctransformers
Browse files
app_modules/llm_loader.py
CHANGED
|
@@ -202,7 +202,10 @@ class LLMLoader:
|
|
| 202 |
"repetition_penalty": 1.1,
|
| 203 |
}
|
| 204 |
self.llm = CTransformers(
|
| 205 |
-
model=MODEL_PATH,
|
|
|
|
|
|
|
|
|
|
| 206 |
)
|
| 207 |
elif self.llm_model_type == "hftgi":
|
| 208 |
HFTGI_SERVER_URL = os.environ.get("HFTGI_SERVER_URL")
|
|
|
|
| 202 |
"repetition_penalty": 1.1,
|
| 203 |
}
|
| 204 |
self.llm = CTransformers(
|
| 205 |
+
model=MODEL_PATH,
|
| 206 |
+
model_type="llama",
|
| 207 |
+
config=config,
|
| 208 |
+
callbacks=callbacks,
|
| 209 |
)
|
| 210 |
elif self.llm_model_type == "hftgi":
|
| 211 |
HFTGI_SERVER_URL = os.environ.get("HFTGI_SERVER_URL")
|