Fix MODEL_NAME=None: auto-discover from proxy /models endpoint, fallback to gpt-4o-mini
Browse files- inference.py +21 -0
inference.py
CHANGED
|
@@ -29,6 +29,27 @@ API_KEY = os.environ.get("API_KEY") or os.environ.get("HF_TOKEN")
|
|
| 29 |
API_BASE_URL = os.environ.get("API_BASE_URL")
|
| 30 |
MODEL_NAME = os.environ.get("MODEL_NAME")
|
| 31 |
BENCHMARK = "policy_evolver_env"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 32 |
MAX_STEPS = 5
|
| 33 |
TEMPERATURE = 0.0
|
| 34 |
SUCCESS_THRESHOLD = 0.70
|
|
|
|
| 29 |
API_BASE_URL = os.environ.get("API_BASE_URL")
|
| 30 |
MODEL_NAME = os.environ.get("MODEL_NAME")
|
| 31 |
BENCHMARK = "policy_evolver_env"
|
| 32 |
+
|
| 33 |
+
# ─── Auto-discover model if MODEL_NAME is not set ───
|
| 34 |
+
if not MODEL_NAME and API_BASE_URL and API_KEY:
|
| 35 |
+
try:
|
| 36 |
+
import httpx
|
| 37 |
+
resp = httpx.get(
|
| 38 |
+
f"{API_BASE_URL.rstrip('/')}/models",
|
| 39 |
+
headers={"Authorization": f"Bearer {API_KEY}"},
|
| 40 |
+
timeout=10,
|
| 41 |
+
)
|
| 42 |
+
if resp.status_code == 200:
|
| 43 |
+
models_data = resp.json().get("data", [])
|
| 44 |
+
if models_data:
|
| 45 |
+
MODEL_NAME = models_data[0].get("id", "gpt-4o-mini")
|
| 46 |
+
print(f"[DEBUG] Auto-discovered model: {MODEL_NAME}", flush=True)
|
| 47 |
+
except Exception as e:
|
| 48 |
+
print(f"[DEBUG] Model discovery failed: {e}", flush=True)
|
| 49 |
+
|
| 50 |
+
if not MODEL_NAME:
|
| 51 |
+
MODEL_NAME = "gpt-4o-mini"
|
| 52 |
+
print(f"[DEBUG] Using default MODEL_NAME: {MODEL_NAME}", flush=True)
|
| 53 |
MAX_STEPS = 5
|
| 54 |
TEMPERATURE = 0.0
|
| 55 |
SUCCESS_THRESHOLD = 0.70
|