Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
|
@@ -66,16 +66,16 @@ def respond_stream(message, history, system_message, max_tokens, temperature, to
|
|
| 66 |
kwargs={**inputs, **{k: v for k, v in gen_kwargs.items() if v is not None}, "streamer": streamer}
|
| 67 |
)
|
| 68 |
|
| 69 |
-
|
|
|
|
| 70 |
token_count = 0
|
| 71 |
start_time = time.time()
|
| 72 |
|
| 73 |
with torch.inference_mode():
|
| 74 |
thread.start()
|
| 75 |
-
for
|
| 76 |
-
|
| 77 |
-
partial_text
|
| 78 |
-
yield partial_text # Tamamını gönder (append efekti)
|
| 79 |
thread.join()
|
| 80 |
|
| 81 |
end_time = time.time()
|
|
|
|
| 66 |
kwargs={**inputs, **{k: v for k, v in gen_kwargs.items() if v is not None}, "streamer": streamer}
|
| 67 |
)
|
| 68 |
|
| 69 |
+
input_len = inputs["input_ids"].shape[1]
|
| 70 |
+
partial_text = ""
|
| 71 |
token_count = 0
|
| 72 |
start_time = time.time()
|
| 73 |
|
| 74 |
with torch.inference_mode():
|
| 75 |
thread.start()
|
| 76 |
+
for new_text in streamer:
|
| 77 |
+
partial_text += new_text
|
| 78 |
+
yield partial_text
|
|
|
|
| 79 |
thread.join()
|
| 80 |
|
| 81 |
end_time = time.time()
|