Update handler.py
Browse files- handler.py +8 -9
handler.py
CHANGED
|
@@ -39,21 +39,20 @@ alpaca_prompt = (
|
|
| 39 |
)
|
| 40 |
|
| 41 |
def initialize():
    """Load the finetuned unsloth model and tokenizer into module globals.

    Adjust ``model_name`` (module-level) to point at your model repository.
    """
    global model, tokenizer

    # Pull the 4-bit quantized checkpoint and its tokenizer in one call.
    model, tokenizer = FastLanguageModel.from_pretrained(
        model_name=model_name,
        max_seq_length=2048,
        load_in_4bit=True,
    )

    # Put the model into inference mode.
    FastLanguageModel.for_inference(model)
    model.eval()
|
| 58 |
def preprocess(request):
|
| 59 |
"""
|
|
|
|
| 39 |
)
|
| 40 |
|
| 41 |
def initialize():
    """Load the finetuned unsloth model and tokenizer into module globals.

    Reads the optional ``HF_AUTH_TOKEN`` environment variable and forwards
    it to the Hugging Face download so private repositories work.
    Adjust ``model_name`` below to point at your model repository.
    """
    global model, tokenizer
    model_name = "RichardLu/Mistral7b_AE_res"

    # Optional Hugging Face token for private/gated repos; ``get`` already
    # returns None when the variable is unset, so no explicit default needed.
    hf_auth_token = os.environ.get("HF_AUTH_TOKEN")

    # NOTE(review): ``use_auth_token`` is deprecated in recent transformers
    # releases in favor of ``token`` — confirm which kwarg unsloth's
    # FastLanguageModel.from_pretrained forwards before renaming.
    model, tokenizer = FastLanguageModel.from_pretrained(
        model_name=model_name,
        max_seq_length=2048,
        load_in_4bit=True,
        use_auth_token=hf_auth_token,
    )

    # Put the model into inference mode.
    FastLanguageModel.for_inference(model)
|
| 57 |
def preprocess(request):
|
| 58 |
"""
|