3v324v23's picture
Add application file
66ad25b
import os
from pathlib import Path
import pytest
import requests
from dotenv import load_dotenv
from pluto.dispatcher import _resolve_nvidia_api_key
# Load environment variables from the ".env" file that sits next to this
# test module, so the lookup does not depend on the current working directory.
load_dotenv(Path(__file__).resolve().parent / ".env")
def test_nvidia_key_resolution_prefers_model_specific(monkeypatch):
    """Check that the model-specific key is chosen over the global key.

    Both ``NVIDIA_API_KEY`` and ``NVIDIA_API_KEY_SUPER`` are set; resolving
    the key for the "super" model id must report the ``_SUPER`` variable
    name together with its value.
    """
    fake_env = {
        "NVIDIA_API_KEY": "global",
        "NVIDIA_API_KEY_SUPER": "super",
    }
    for var_name, var_value in fake_env.items():
        monkeypatch.setenv(var_name, var_value)

    chosen_var, chosen_key = _resolve_nvidia_api_key(
        "nvidia/llama-3.3-nemotron-super-49b-v1"
    )

    assert (chosen_var, chosen_key) == ("NVIDIA_API_KEY_SUPER", "super")
@pytest.mark.live_api
def test_nvidia_rerank_endpoint():
    """Send one minimal rerank request and expect an HTTP 200 response.

    The test is skipped when ``NVIDIA_API_KEY_RERANK`` is unset or empty,
    since the request needs that key for its bearer token.
    """
    token = os.environ.get("NVIDIA_API_KEY_RERANK")
    if not token:
        pytest.skip("NVIDIA_API_KEY_RERANK not configured")

    endpoint = "https://ai.api.nvidia.com/v1/retrieval/nvidia/llama-nemotron-rerank-1b-v2/reranking"
    request_headers = {
        "Authorization": f"Bearer {token}",
        "Content-Type": "application/json",
    }
    # Smallest payload used here: one query and one candidate passage.
    payload = {
        "model": "nvidia/llama-nemotron-rerank-1b-v2",
        "query": {"text": "Hi"},
        "passages": [{"text": "Hello"}],
    }

    reply = requests.post(endpoint, headers=request_headers, json=payload, timeout=20)

    # Include the response body in the failure message to aid debugging.
    assert reply.status_code == 200, reply.text