"""Load the EdysorEdutech/gatewaytrainedmodel checkpoint with 4-bit quantization.

bitsandbytes is installed on demand before transformers is imported; the
loaded model is exposed as the module-level name ``model``.
"""

import importlib.util
import subprocess
import sys

# Install bitsandbytes first, but only when it is not already importable, so
# repeated runs do not invoke pip (and hit the network) every time.
if importlib.util.find_spec("bitsandbytes") is None:
    subprocess.check_call(
        [sys.executable, "-m", "pip", "install", "bitsandbytes"]
    )
    # Let the import system see the package that was just installed into
    # the running interpreter's environment.
    importlib.invalidate_caches()

# Then import and use your model. These imports intentionally come after the
# install step above so bitsandbytes is present when transformers is loaded.
import torch  # noqa: E402
from transformers import (  # noqa: E402
    AutoModelForCausalLM,
    AutoTokenizer,
    BitsAndBytesConfig,
)

# Passing ``load_in_4bit=True`` straight to ``from_pretrained`` is the
# deprecated form; the same request is expressed via ``quantization_config``.
model = AutoModelForCausalLM.from_pretrained(
    "EdysorEdutech/gatewaytrainedmodel",
    quantization_config=BitsAndBytesConfig(load_in_4bit=True),
    device_map="auto",
)