Update app.py
Browse files
app.py
CHANGED
|
@@ -30,7 +30,7 @@ MAX_INPUT_TOKEN_LENGTH = int(os.getenv("MAX_INPUT_TOKEN_LENGTH", "4096"))
|
|
| 30 |
|
| 31 |
# Debugging: GPU check passed, loading model
|
| 32 |
if torch.cuda.is_available():
|
| 33 |
-
model_id = "INSAIT-Institute/BgGPT-Gemma-2-
|
| 34 |
try:
|
| 35 |
print("Loading model...")
|
| 36 |
model = AutoModelForCausalLM.from_pretrained(model_id, torch_dtype=torch.float16, device_map="auto", token=HF_TOKEN)
|
|
|
|
| 30 |
|
| 31 |
# Debugging: GPU check passed, loading model
|
| 32 |
if torch.cuda.is_available():
|
| 33 |
+
model_id = "INSAIT-Institute/BgGPT-Gemma-2-9B-IT-v1.0"
|
| 34 |
try:
|
| 35 |
print("Loading model...")
|
| 36 |
model = AutoModelForCausalLM.from_pretrained(model_id, torch_dtype=torch.float16, device_map="auto", token=HF_TOKEN)
|