Spaces:

eddddyy
/

bot

Paused

eddddyy committed on Aug 6, 2025

Commit

0204d4a

verified ·

1 Parent(s): 27693fd

Update model_loader.py

Files changed (1) hide show

model_loader.py CHANGED Viewed

@@ -1,6 +1,6 @@
 import torch
 from transformers import AutoTokenizer, AutoModelForCausalLM, pipeline
-from config import HF_TOKEN, MODEL_ID  # ✅ Make sure this line is here!
 def load_model():
     try:
@@ -8,13 +8,13 @@ def load_model():
         tokenizer = AutoTokenizer.from_pretrained(
             MODEL_ID,
-            token=HF_TOKEN,
             trust_remote_code=True
         )
         model = AutoModelForCausalLM.from_pretrained(
             MODEL_ID,
-            token=HF_TOKEN,
             trust_remote_code=True,
             device_map="auto" if torch.cuda.is_available() else "cpu",
             torch_dtype=torch.float16 if torch.cuda.is_available() else torch.float32,
@@ -27,7 +27,7 @@ def load_model():
             "text-generation",
             model=model,
             tokenizer=tokenizer,
-            max_new_tokens=2048,     # 🧠 Increased token window
             do_sample=True,
             temperature=0.7,
             top_p=0.9
@@ -36,4 +36,3 @@ def load_model():
     except Exception as e:
         print(f"❌ Failed to load model: {e}")
         raise RuntimeError(f"Model loading failed: {e}")

 import torch
 from transformers import AutoTokenizer, AutoModelForCausalLM, pipeline
+from config import HF_TOKEN, MODEL_ID
 def load_model():
     try:
         tokenizer = AutoTokenizer.from_pretrained(
             MODEL_ID,
+            token=HF_TOKEN if HF_TOKEN else None,
             trust_remote_code=True
         )
         model = AutoModelForCausalLM.from_pretrained(
             MODEL_ID,
+            token=HF_TOKEN if HF_TOKEN else None,
             trust_remote_code=True,
             device_map="auto" if torch.cuda.is_available() else "cpu",
             torch_dtype=torch.float16 if torch.cuda.is_available() else torch.float32,
             "text-generation",
             model=model,
             tokenizer=tokenizer,
+            max_new_tokens=2048,
             do_sample=True,
             temperature=0.7,
             top_p=0.9
     except Exception as e:
         print(f"❌ Failed to load model: {e}")
         raise RuntimeError(f"Model loading failed: {e}")