Update app.py: tokenize a hard-coded test prompt instead of the user message
Browse files
app.py
CHANGED
|
@@ -284,7 +284,8 @@ def respond(
|
|
| 284 |
repeat_penalty: float,
|
| 285 |
):
|
| 286 |
llama = Llama("models/madlad400-3b-mt-q8_0.gguf")
|
| 287 |
-
tokens = llama.tokenize(f"{message}".encode('utf-8'))
|
|
|
|
| 288 |
llama.encode(tokens)
|
| 289 |
tokens = [llama.decoder_start_token()]
|
| 290 |
for token in llama.generate(tokens, top_k=40, top_p=0.95, temp=1, repeat_penalty=1.0):
|
|
|
|
| 284 |
repeat_penalty: float,
|
| 285 |
):
|
| 286 |
llama = Llama("models/madlad400-3b-mt-q8_0.gguf")
|
| 287 |
+
#tokens = llama.tokenize(f"{message}".encode('utf-8'))#
|
| 288 |
+
tokens = llama.tokenize(b"What is the capital of France?")
|
| 289 |
llama.encode(tokens)
|
| 290 |
tokens = [llama.decoder_start_token()]
|
| 291 |
for token in llama.generate(tokens, top_k=40, top_p=0.95, temp=1, repeat_penalty=1.0):
|