# tei-annotator / scripts/smoke_test_llm.py
# Origin: HuggingFace Space by cmboulanger — "feat: Add webservice for demonstration" (commit c3f33b6)
#!/usr/bin/env python
"""
End-to-end smoke test: tei-annotator pipeline with real LLM endpoints.
Providers tested:
• Google Gemini 2.0 Flash
• KISSKI (OpenAI-compatible API, llama-3.3-70b-instruct)
Reads API keys from .env in the project root.
Usage:
uv run scripts/smoke_test_llm.py
python scripts/smoke_test_llm.py # if venv is already activated
"""
from __future__ import annotations

import json
import os
import sys
import textwrap
import urllib.error
import urllib.request
from collections.abc import Callable
from pathlib import Path

from dotenv import load_dotenv
# Load API keys from the project-root .env before anything reads os.environ.
load_dotenv(Path(__file__).parent.parent / ".env")
# ---------------------------------------------------------------------------
# HTTP helper (stdlib urllib)
# ---------------------------------------------------------------------------
def _post_json(url: str, payload: dict, headers: dict, timeout: float = 60) -> dict:
    """POST *payload* as JSON to *url* and return the decoded JSON response.

    Args:
        url: Target endpoint URL.
        payload: JSON-serializable request body.
        headers: HTTP headers to send (caller supplies Content-Type / auth).
        timeout: Socket timeout in seconds (default 60, as before — now
            overridable for slower endpoints).

    Returns:
        The parsed JSON response body.

    Raises:
        RuntimeError: On any HTTP error status, with the response body
            included so the provider's diagnostic message is visible.
    """
    body = json.dumps(payload).encode("utf-8")
    req = urllib.request.Request(url, data=body, headers=headers, method="POST")
    try:
        with urllib.request.urlopen(req, timeout=timeout) as resp:
            return json.loads(resp.read())
    except urllib.error.HTTPError as exc:
        # Read the error body so callers see the server's explanation,
        # not just a bare status code.
        detail = exc.read().decode(errors="replace")
        raise RuntimeError(f"HTTP {exc.code} from {url}: {detail}") from exc
# ---------------------------------------------------------------------------
# call_fn factories
# ---------------------------------------------------------------------------
def make_gemini_call_fn(api_key: str, model: str = "gemini-2.0-flash") -> Callable[[str], str]:
    """Return a call_fn that sends a prompt to Gemini and returns the text reply.

    Args:
        api_key: Google AI Studio API key.
        model: Gemini model identifier (default "gemini-2.0-flash").

    Returns:
        A ``call_fn(prompt) -> str`` closure; its ``__name__`` is set to
        ``"gemini/<model>"`` so test output can identify the provider.
    """
    url = (
        f"https://generativelanguage.googleapis.com/v1beta/models"
        f"/{model}:generateContent"
    )
    # Send the key via the x-goog-api-key header rather than a URL query
    # parameter so it cannot leak into proxy/server access logs.
    headers = {
        "Content-Type": "application/json",
        "x-goog-api-key": api_key,
    }

    def call_fn(prompt: str) -> str:
        payload = {
            "contents": [{"parts": [{"text": prompt}]}],
            # Low temperature: annotation extraction should be near-deterministic.
            "generationConfig": {"temperature": 0.1},
        }
        result = _post_json(url, payload, headers)
        return result["candidates"][0]["content"]["parts"][0]["text"]

    call_fn.__name__ = f"gemini/{model}"
    return call_fn
def make_kisski_call_fn(
    api_key: str,
    base_url: str = "https://chat-ai.academiccloud.de/v1",
    model: str = "llama-3.3-70b-instruct",
) -> Callable[[str], str]:
    """Return a call_fn that sends a prompt to a KISSKI-hosted OpenAI-compatible model.

    Args:
        api_key: Bearer token for the KISSKI / Academic Cloud API.
        base_url: Root of the OpenAI-compatible API (no trailing slash).
        model: Model name as expected by the /chat/completions endpoint.

    Returns:
        A ``call_fn(prompt) -> str`` closure; its ``__name__`` is set to
        ``"kisski/<model>"`` so test output can identify the provider.
    """
    url = f"{base_url}/chat/completions"
    headers = {
        "Content-Type": "application/json",
        "Authorization": f"Bearer {api_key}",
    }

    def call_fn(prompt: str) -> str:
        payload = {
            "model": model,
            "messages": [{"role": "user", "content": prompt}],
            # Low temperature: annotation extraction should be near-deterministic.
            "temperature": 0.1,
        }
        result = _post_json(url, payload, headers)
        return result["choices"][0]["message"]["content"]

    call_fn.__name__ = f"kisski/{model}"
    return call_fn
# ---------------------------------------------------------------------------
# Test scenario
# ---------------------------------------------------------------------------
# Short factual paragraph containing two person names and four place
# mentions — plenty of surface for both persName and placeName tags.
TEST_TEXT = (
    "Marie Curie was born in Warsaw, Poland, and later conducted her research "
    "in Paris, France. Together with her husband Pierre Curie, she discovered "
    "polonium and radium."
)
# We just check that the pipeline runs and produces *some* annotation.
# Whether the LLM chose the right entities is not asserted here.
EXPECTED_TAGS = ["persName", "placeName"]
def _build_schema():
    """Build the minimal two-element TEI schema (persName / placeName) used by the test."""
    from tei_annotator.models.schema import TEIAttribute, TEIElement, TEISchema

    # Both elements share the same shape: a tag, a description, and a single
    # "ref" attribute pointing at an authority URI.
    element_specs = [
        ("persName", "a person's name"),
        ("placeName", "a geographical place name"),
    ]
    return TEISchema(
        elements=[
            TEIElement(
                tag=tag,
                description=description,
                attributes=[TEIAttribute(name="ref", description="authority URI")],
            )
            for tag, description in element_specs
        ]
    )
def run_smoke_test(provider_name: str, call_fn) -> bool:
    """
    Run the full annotate() pipeline with *call_fn* and print results.

    Checks performed:
      1. annotate() completes without raising.
      2. Stripping all tags from the output XML reproduces TEST_TEXT exactly.
      3. At least one tag from EXPECTED_TAGS appears in the output.

    Returns True on success, False on failure.
    """
    import re

    from tei_annotator.inference.endpoint import EndpointCapability, EndpointConfig
    from tei_annotator.pipeline import annotate

    print(f"\n{'─' * 60}")
    print(f" Provider : {provider_name}")
    print(f" Input : {TEST_TEXT[:80]}…")
    print(f"{'─' * 60}")
    try:
        result = annotate(
            text=TEST_TEXT,
            schema=_build_schema(),
            endpoint=EndpointConfig(
                capability=EndpointCapability.TEXT_GENERATION,
                call_fn=call_fn,
            ),
            gliner_model=None,  # skip GLiNER for speed
        )
    except Exception as exc:
        # NOTE: mojibake in the original ("βœ—", "β€”") repaired to ✗ / —.
        print(f" ✗ FAILED — exception during annotate(): {exc}")
        return False
    # Verify plain text is unmodified: removing every tag must give back
    # the exact input string.
    plain = re.sub(r"<[^>]+>", "", result.xml)
    if plain != TEST_TEXT:
        print(" ✗ FAILED — plain text was modified by the pipeline")
        print(f" Expected : {TEST_TEXT!r}")
        print(f" Got : {plain!r}")
        return False
    # Verify at least one annotation was injected (LLM must have found something)
    has_any_tag = any(f"<{t}>" in result.xml for t in EXPECTED_TAGS)
    if not has_any_tag:
        print(" ✗ FAILED — no annotation tags found in output")
        print(f" Output XML: {result.xml}")
        return False
    # Pretty-print the result
    tags_found = [t for t in EXPECTED_TAGS if f"<{t}>" in result.xml]
    print(" ✓ PASSED")
    print(f" Tags found : {', '.join(tags_found)}")
    if result.fuzzy_spans:
        print(f" Fuzzy spans: {[TEST_TEXT[s.start:s.end] for s in result.fuzzy_spans]}")
    print(" Output XML :")
    for line in textwrap.wrap(result.xml, width=72, subsequent_indent=" "):
        print(f" {line}")
    return True
# ---------------------------------------------------------------------------
# Main
# ---------------------------------------------------------------------------
def main() -> int:
    """Run the smoke test against every configured provider.

    Returns 0 when all providers pass, 1 on a missing API key or any failure.
    """
    gemini_key = os.environ.get("GEMINI_API_KEY", "")
    kisski_key = os.environ.get("KISSKI_API_KEY", "")

    # Fail fast with a targeted message for the first missing credential.
    for env_name, value in (("GEMINI_API_KEY", gemini_key), ("KISSKI_API_KEY", kisski_key)):
        if not value:
            print(f"ERROR: {env_name} not set (check .env)", file=sys.stderr)
            return 1

    providers: list[tuple[str, object]] = [
        ("Gemini 2.0 Flash", make_gemini_call_fn(gemini_key)),
        ("KISSKI / llama-3.3-70b-instruct", make_kisski_call_fn(kisski_key)),
    ]
    results: list[bool] = [run_smoke_test(name, fn) for name, fn in providers]

    print(f"\n{'═' * 60}")
    passed, total = sum(results), len(results)
    print(f" Result: {passed}/{total} providers passed")
    print(f"{'═' * 60}\n")
    return 0 if all(results) else 1
# Exit with main()'s return code so CI can detect smoke-test failures.
if __name__ == "__main__":
    sys.exit(main())