Update engine/responder.py
Browse files - engine/responder.py +1 -1
engine/responder.py
CHANGED
|
@@ -155,7 +155,7 @@ def generate_response_hf(prompt, persona, conversation_history, stream_callback=
|
|
| 155 |
generation_kwargs = {
|
| 156 |
"input_ids": inputs["input_ids"],
|
| 157 |
"attention_mask": inputs["attention_mask"], # important for reliability
|
| 158 |
-
"max_new_tokens":
|
| 159 |
"temperature": 0.9,
|
| 160 |
"top_p": 0.9,
|
| 161 |
"do_sample": True,
|
|
|
|
| 155 |
generation_kwargs = {
|
| 156 |
"input_ids": inputs["input_ids"],
|
| 157 |
"attention_mask": inputs["attention_mask"], # important for reliability
|
| 158 |
+
"max_new_tokens": 200,
|
| 159 |
"temperature": 0.9,
|
| 160 |
"top_p": 0.9,
|
| 161 |
"do_sample": True,
|