llamacpp-flan-t5-large-grammar-synthesis

Sleeping

Akjava committed on Mar 20

Commit

5e8e544

verified ·

1 Parent(s): 3ce5ec4

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -88,7 +88,7 @@ def respond(
             model_id = "ggml-model-Q6_K.gguf"
             llama = Llama(f"models/{model_id}",flash_attn=False,
                         n_gpu_layers=0,
-                        n_ctx=max_tokens
                         n_threads=2,
                         n_threads_batch=2)

             model_id = "ggml-model-Q6_K.gguf"
             llama = Llama(f"models/{model_id}",flash_attn=False,
                         n_gpu_layers=0,
+                        n_ctx=max_tokens,
                         n_threads=2,
                         n_threads_batch=2)