Update app.py: set TEMPERATURE to 1.5 and add min_p=0.1 to the model loading call
Browse files
app.py
CHANGED
|
@@ -9,7 +9,7 @@ MODEL_FILE = "llama-3.2-1b-instruct.F16.gguf"
|
|
| 9 |
# Adjust context window and other params as needed
|
| 10 |
CONTEXT_WINDOW = 4096
|
| 11 |
MAX_NEW_TOKENS = 512
|
| 12 |
-
TEMPERATURE =
|
| 13 |
|
| 14 |
# --- Model Loading Function ---
|
| 15 |
def load_llm():
|
|
@@ -28,6 +28,7 @@ def load_llm():
|
|
| 28 |
n_ctx=CONTEXT_WINDOW,
|
| 29 |
n_threads=2,
|
| 30 |
verbose=False # Set to True for debugging
|
|
|
|
| 31 |
)
|
| 32 |
print("Model loaded successfully!")
|
| 33 |
return llm
|
|
|
|
| 9 |
# Adjust context window and other params as needed
|
| 10 |
CONTEXT_WINDOW = 4096
|
| 11 |
MAX_NEW_TOKENS = 512
|
| 12 |
+
TEMPERATURE = 1.5
|
| 13 |
|
| 14 |
# --- Model Loading Function ---
|
| 15 |
def load_llm():
|
|
|
|
| 28 |
n_ctx=CONTEXT_WINDOW,
|
| 29 |
n_threads=2,
|
| 30 |
verbose=False, # Set to True for debugging
|
| 31 |
+
min_p=0.1
|
| 32 |
)
|
| 33 |
print("Model loaded successfully!")
|
| 34 |
return llm
|