Spaces:
Runtime error
Runtime error
Update app.py
Browse files
app.py
CHANGED
|
@@ -15,7 +15,7 @@ if not torch.cuda.is_available():
|
|
| 15 |
DESCRIPTION += "\n<p>Running on CPU 🥶 This demo does not work on CPU.</p>"
|
| 16 |
|
| 17 |
MAX_MAX_NEW_TOKENS = 2048
|
| 18 |
-
DEFAULT_MAX_NEW_TOKENS =
|
| 19 |
MAX_INPUT_TOKEN_LENGTH = int(os.getenv("MAX_INPUT_TOKEN_LENGTH", "4096"))
|
| 20 |
|
| 21 |
if torch.cuda.is_available():
|
|
@@ -62,6 +62,7 @@ def generate(
|
|
| 62 |
outputs = []
|
| 63 |
for text in streamer:
|
| 64 |
outputs.append(text)
|
|
|
|
| 65 |
yield "".join(outputs)
|
| 66 |
|
| 67 |
|
|
|
|
| 15 |
DESCRIPTION += "\n<p>Running on CPU 🥶 This demo does not work on CPU.</p>"
|
| 16 |
|
| 17 |
MAX_MAX_NEW_TOKENS = 2048
|
| 18 |
+
DEFAULT_MAX_NEW_TOKENS = 512
|
| 19 |
MAX_INPUT_TOKEN_LENGTH = int(os.getenv("MAX_INPUT_TOKEN_LENGTH", "4096"))
|
| 20 |
|
| 21 |
if torch.cuda.is_available():
|
|
|
|
| 62 |
outputs = []
|
| 63 |
for text in streamer:
|
| 64 |
outputs.append(text)
|
| 65 |
+
outputs = outputs.replace("||assistant|>", "").strip()
|
| 66 |
yield "".join(outputs)
|
| 67 |
|
| 68 |
|