Update handler.py
Browse files- handler.py +7 -3
handler.py
CHANGED
|
@@ -44,7 +44,7 @@ from llava.constants import (
|
|
| 44 |
IMAGE_TOKEN_INDEX,
|
| 45 |
)
|
| 46 |
from llava.model.builder import load_pretrained_model
|
| 47 |
-
from llava.mm_utils import tokenizer_image_token
|
| 48 |
|
| 49 |
|
| 50 |
# ---------- yardımcılar ----------
|
|
@@ -144,7 +144,7 @@ class EndpointHandler:
|
|
| 144 |
def __init__(self, model_dir: Optional[str] = None):
|
| 145 |
# DEBUG banner
|
| 146 |
print("🚀 Starting up PULSE-7B handler (startup load)...")
|
| 147 |
-
print("📝 Enhanced by
|
| 148 |
print(f"🔧 Python: {sys.version}")
|
| 149 |
print(f"🔧 PyTorch: {torch.__version__}")
|
| 150 |
try:
|
|
@@ -174,7 +174,6 @@ class EndpointHandler:
|
|
| 174 |
self._startup_load_model()
|
| 175 |
print("✅ Model loaded & ready in __init__")
|
| 176 |
except Exception as e:
|
| 177 |
-
# Critical error: if init blew up, the endpoint cannot come up anyway
|
| 178 |
print(f"💥 CRITICAL: model startup load failed: {e}")
|
| 179 |
raise
|
| 180 |
|
|
@@ -194,10 +193,15 @@ class EndpointHandler:
|
|
| 194 |
model_path = _get_env("HF_MODEL_ID", "PULSE-ECG/PULSE-7B")
|
| 195 |
print(f"[DEBUG] loading model from HUB: {model_path} (HF_MODEL_BASE={model_base})")
|
| 196 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 197 |
print("[DEBUG] calling load_pretrained_model ...")
|
| 198 |
self.tokenizer, self.model, self.image_processor, self.context_len = load_pretrained_model(
|
| 199 |
model_path=model_path,
|
| 200 |
model_base=model_base,
|
|
|
|
| 201 |
load_8bit=False,
|
| 202 |
load_4bit=False,
|
| 203 |
device_map="auto",
|
|
|
|
| 44 |
IMAGE_TOKEN_INDEX,
|
| 45 |
)
|
| 46 |
from llava.model.builder import load_pretrained_model
|
| 47 |
+
from llava.mm_utils import tokenizer_image_token, get_model_name_from_path
|
| 48 |
|
| 49 |
|
| 50 |
# ---------- yardımcılar ----------
|
|
|
|
| 144 |
def __init__(self, model_dir: Optional[str] = None):
|
| 145 |
# DEBUG banner
|
| 146 |
print("🚀 Starting up PULSE-7B handler (startup load)...")
|
| 147 |
+
print("📝 Enhanced by Ubden® Team")
|
| 148 |
print(f"🔧 Python: {sys.version}")
|
| 149 |
print(f"🔧 PyTorch: {torch.__version__}")
|
| 150 |
try:
|
|
|
|
| 174 |
self._startup_load_model()
|
| 175 |
print("✅ Model loaded & ready in __init__")
|
| 176 |
except Exception as e:
|
|
|
|
| 177 |
print(f"💥 CRITICAL: model startup load failed: {e}")
|
| 178 |
raise
|
| 179 |
|
|
|
|
| 193 |
model_path = _get_env("HF_MODEL_ID", "PULSE-ECG/PULSE-7B")
|
| 194 |
print(f"[DEBUG] loading model from HUB: {model_path} (HF_MODEL_BASE={model_base})")
|
| 195 |
|
| 196 |
+
# ⬇️ FIX: the LLaVA v1.2.0 signature requires a model_name parameter
|
| 197 |
+
model_name = get_model_name_from_path(model_path)
|
| 198 |
+
print(f"[DEBUG] resolved model_name: {model_name}")
|
| 199 |
+
|
| 200 |
print("[DEBUG] calling load_pretrained_model ...")
|
| 201 |
self.tokenizer, self.model, self.image_processor, self.context_len = load_pretrained_model(
|
| 202 |
model_path=model_path,
|
| 203 |
model_base=model_base,
|
| 204 |
+
model_name=model_name, # <-- required parameter
|
| 205 |
load_8bit=False,
|
| 206 |
load_4bit=False,
|
| 207 |
device_map="auto",
|