Spaces:
Running
Running
Upload app.py with huggingface_hub
Browse files
app.py
CHANGED
|
@@ -225,8 +225,8 @@ def load_model(model_key: str):
|
|
| 225 |
_current_model = Llama.from_pretrained(
|
| 226 |
repo_id=config['repo_id'],
|
| 227 |
filename=config['filename'],
|
| 228 |
-
n_ctx=
|
| 229 |
-
n_threads=
|
| 230 |
verbose=False,
|
| 231 |
)
|
| 232 |
_current_model_name = model_key
|
|
@@ -276,7 +276,7 @@ Answer:"""
|
|
| 276 |
|
| 277 |
response = model.create_chat_completion(
|
| 278 |
messages=messages,
|
| 279 |
-
max_tokens=
|
| 280 |
temperature=0,
|
| 281 |
)
|
| 282 |
|
|
|
|
| 225 |
_current_model = Llama.from_pretrained(
|
| 226 |
repo_id=config['repo_id'],
|
| 227 |
filename=config['filename'],
|
| 228 |
+
n_ctx=256,
|
| 229 |
+
n_threads=8,
|
| 230 |
verbose=False,
|
| 231 |
)
|
| 232 |
_current_model_name = model_key
|
|
|
|
| 276 |
|
| 277 |
response = model.create_chat_completion(
|
| 278 |
messages=messages,
|
| 279 |
+
max_tokens=8,
|
| 280 |
temperature=0,
|
| 281 |
)
|
| 282 |
|