Commit ·
aef9f0f
1
Parent(s): 2a47292
Pre-build KB indexes at startup, not on first query
Browse files - backend/app.py (+5 -3)
backend/app.py
CHANGED
|
@@ -12,7 +12,7 @@ from pydantic import BaseModel
|
|
| 12 |
|
| 13 |
from config import DOMAIN_CLIENTS, CLIENT_DOMAIN, DISPLAY_NAMES
|
| 14 |
from grader import get_embedder, get_nli_model
|
| 15 |
-
from pipeline import run
|
| 16 |
|
| 17 |
log = logging.getLogger(__name__)
|
| 18 |
logging.basicConfig(level=logging.INFO)
|
|
@@ -26,9 +26,11 @@ async def lifespan(app: FastAPI):
|
|
| 26 |
if not hf_token:
|
| 27 |
raise RuntimeError("HF_TOKEN not set")
|
| 28 |
app.state.hf_client = InferenceClient(token=hf_token)
|
| 29 |
-
get_embedder()
|
| 30 |
get_nli_model()
|
| 31 |
-
|
|
|
|
|
|
|
| 32 |
yield
|
| 33 |
|
| 34 |
|
|
|
|
| 12 |
|
| 13 |
from config import DOMAIN_CLIENTS, CLIENT_DOMAIN, DISPLAY_NAMES
|
| 14 |
from grader import get_embedder, get_nli_model
|
| 15 |
+
from pipeline import run, _build_index
|
| 16 |
|
| 17 |
log = logging.getLogger(__name__)
|
| 18 |
logging.basicConfig(level=logging.INFO)
|
|
|
|
| 26 |
if not hf_token:
|
| 27 |
raise RuntimeError("HF_TOKEN not set")
|
| 28 |
app.state.hf_client = InferenceClient(token=hf_token)
|
| 29 |
+
embedder = get_embedder()
|
| 30 |
get_nli_model()
|
| 31 |
+
for domain in DOMAIN_CLIENTS:
|
| 32 |
+
_build_index(domain, embedder)
|
| 33 |
+
log.info("Models and KB indexes pre-warmed. Ready.")
|
| 34 |
yield
|
| 35 |
|
| 36 |
|