from app.config import MODEL_NAME


def load_model():
    """Load the tokenizer and causal-LM model identified by ``MODEL_NAME``.

    Progress messages are printed to stdout before each load step and once
    loading has finished.

    Returns:
        A ``(tokenizer, model)`` tuple. ``eval()`` has been called on the
        model before it is returned.
    """
    # Function-scope import: transformers is only imported when this
    # function is actually called, not when the module is imported.
    from transformers import AutoModelForCausalLM, AutoTokenizer

    tokenizer_options = {
        "trust_remote_code": True,
        "extra_special_tokens": {},
    }
    model_options = {
        "trust_remote_code": True,
        "low_cpu_mem_usage": True,
    }

    print("Loading tokenizer...")
    tok = AutoTokenizer.from_pretrained(MODEL_NAME, **tokenizer_options)

    print("Loading model...")
    lm = AutoModelForCausalLM.from_pretrained(MODEL_NAME, **model_options)
    lm.eval()

    print("Model loaded.")
    return tok, lm