YOUSEF2434 committed on
Commit
9a6badd
·
verified ·
1 Parent(s): ca42ad4

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -19,7 +19,7 @@ MAX_MAX_NEW_TOKENS = 2048
19
  DEFAULT_MAX_NEW_TOKENS = 1024
20
  MAX_INPUT_TOKEN_LENGTH = int(os.getenv("MAX_INPUT_TOKEN_LENGTH", "4096"))
21
 
22
- model_id = "google/gemma-1.1-2b-it"
23
 
24
  # Load model with int8 quantization on CUDA (if available)
25
  if torch.cuda.is_available():
 
19
  DEFAULT_MAX_NEW_TOKENS = 1024
20
  MAX_INPUT_TOKEN_LENGTH = int(os.getenv("MAX_INPUT_TOKEN_LENGTH", "4096"))
21
 
22
+ model_id = "TinyLlama/TinyLlama-1.1B-Chat-v1.0"
23
 
24
  # Load model with int8 quantization on CUDA (if available)
25
  if torch.cuda.is_available():