try
Browse files- create_app.py +9 -2
create_app.py
CHANGED
|
@@ -32,8 +32,15 @@ def load_models():
|
|
| 32 |
QWEN_TOKENIZER = AutoTokenizer.from_pretrained(model_name, device='auto')
|
| 33 |
QWEN_TOKENIZER.pad_token_id = QWEN_TOKENIZER.eos_token_id
|
| 34 |
print("QWEN TOKENIZER LOADED")
|
| 35 |
-
|
| 36 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 37 |
print("QWEN MODEL LOADED")
|
| 38 |
MODELS_LOADED = True
|
| 39 |
print("LOAD ENDED")
|
|
|
|
| 32 |
QWEN_TOKENIZER = AutoTokenizer.from_pretrained(model_name, device='auto')
|
| 33 |
QWEN_TOKENIZER.pad_token_id = QWEN_TOKENIZER.eos_token_id
|
| 34 |
print("QWEN TOKENIZER LOADED")
|
| 35 |
+
try:
|
| 36 |
+
QWEN_MODEL = AutoModelForCausalLM.from_pretrained(model_name).half()
|
| 37 |
+
QWEN_MODEL = QWEN_MODEL.to(device)
|
| 38 |
+
print("QWEN MODEL LOADED")  # Reached only if loading and the move to `device` both succeeded
|
| 39 |
+
except Exception as e:
|
| 40 |
+
print(f"ERROR LOADING QWEN MODEL: {str(e)}")
|
| 41 |
+
raise # Re-raise to see full traceback
|
| 42 |
+
# QWEN_MODEL = AutoModelForCausalLM.from_pretrained(model_name).half()
|
| 43 |
+
# QWEN_MODEL = QWEN_MODEL.to(device)
|
| 44 |
print("QWEN MODEL LOADED")
|
| 45 |
MODELS_LOADED = True
|
| 46 |
print("LOAD ENDED")
|