WWMachine committed on
Commit
50e06b0
·
verified ·
1 Parent(s): 539f835

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -1
app.py CHANGED
@@ -9,7 +9,7 @@ MODEL_FILE = "llama-3.2-1b-instruct.F16.gguf"
9
  # Adjust context window and other params as needed
10
  CONTEXT_WINDOW = 4096
11
  MAX_NEW_TOKENS = 512
12
- TEMPERATURE = 0.7
13
 
14
  # --- Model Loading Function ---
15
  def load_llm():
@@ -28,6 +28,7 @@ def load_llm():
28
  n_ctx=CONTEXT_WINDOW,
29
  n_threads=2,
30
  verbose=False # Set to True for debugging
 
31
  )
32
  print("Model loaded successfully!")
33
  return llm
 
9
  # Adjust context window and other params as needed
10
  CONTEXT_WINDOW = 4096
11
  MAX_NEW_TOKENS = 512
12
+ TEMPERATURE = 1.5
13
 
14
  # --- Model Loading Function ---
15
  def load_llm():
 
28
  n_ctx=CONTEXT_WINDOW,
29
  n_threads=2,
30
  verbose=False # Set to True for debugging
31
+ min_p=0.1
32
  )
33
  print("Model loaded successfully!")
34
  return llm