Spaces: Paused
Update app.py
Browse files
app.py
CHANGED
|
@@ -151,7 +151,8 @@ if st.button("Send") and prompt.strip():
|
|
| 151 |
inputs = tokenizer.apply_chat_template(
|
| 152 |
chat,
|
| 153 |
add_generation_prompt=True,
|
| 154 |
-
return_tensors="pt"
|
|
|
|
| 155 |
)
|
| 156 |
|
| 157 |
streamer = TextIteratorStreamer(
|
|
@@ -161,15 +162,15 @@ if st.button("Send") and prompt.strip():
|
|
| 161 |
)
|
| 162 |
|
| 163 |
gen_kwargs = dict(
|
| 164 |
-
|
| 165 |
max_new_tokens=MAX_NEW_TOKENS,
|
|
|
|
| 166 |
temperature=TEMPERATURE,
|
| 167 |
top_p=TOP_P,
|
| 168 |
-
do_sample=True,
|
| 169 |
-
streamer=streamer,
|
| 170 |
eos_token_id=tokenizer.eos_token_id,
|
| 171 |
pad_token_id=tokenizer.eos_token_id,
|
| 172 |
-
|
|
|
|
| 173 |
|
| 174 |
thread = threading.Thread(target=model.generate, kwargs=gen_kwargs)
|
| 175 |
thread.start()
|
|
|
|
| 151 |
inputs = tokenizer.apply_chat_template(
|
| 152 |
chat,
|
| 153 |
add_generation_prompt=True,
|
| 154 |
+
return_tensors="pt",
|
| 155 |
+
return_dict=True
|
| 156 |
)
|
| 157 |
|
| 158 |
streamer = TextIteratorStreamer(
|
|
|
|
| 162 |
)
|
| 163 |
|
| 164 |
gen_kwargs = dict(
|
| 165 |
+
**inputs,
|
| 166 |
max_new_tokens=MAX_NEW_TOKENS,
|
| 167 |
+
do_sample=True,
|
| 168 |
temperature=TEMPERATURE,
|
| 169 |
top_p=TOP_P,
|
|
|
|
|
|
|
| 170 |
eos_token_id=tokenizer.eos_token_id,
|
| 171 |
pad_token_id=tokenizer.eos_token_id,
|
| 172 |
+
streamer=streamer
|
| 173 |
+
)
|
| 174 |
|
| 175 |
thread = threading.Thread(target=model.generate, kwargs=gen_kwargs)
|
| 176 |
thread.start()
|