# Project metadata (PEP 621) for the OSS-vs-frontier assistant evaluation app.
[project]
name = "oss-vs-frontier-assistant"
version = "0.1.0"
description = "Evaluation framework comparing an open-source assistant (Qwen) against a frontier assistant (Claude)."
readme = "README.md"
# Only the Python 3.11 series is accepted (any patch release).
requires-python = "==3.11.*"

# Exact pins, resolved by uv on 2026-05-22. Kept in sync with requirements.txt.
# When bumping a version here, update requirements.txt in the same change.
dependencies = [
    # UI
    "gradio==6.14.0",
    "spaces==0.50.2",  # Hugging Face ZeroGPU decorator (@spaces.GPU)

    # Models
    "anthropic==0.104.0",  # frontier assistant + guardrail + judge
    "transformers==5.9.0",  # OSS assistant (Qwen)
    "torch==2.12.0",
    "accelerate==1.13.0",
    "huggingface-hub==1.16.1",

    # Memory / orchestration
    "langchain-core==1.4.0",
    "langchain-anthropic==1.4.3",
    "langchain-huggingface==1.2.2",
    "langchain-community==0.4.1",  # SQLChatMessageHistory + Tavily tool

    # Config
    "pydantic-settings==2.14.1",
    "python-dotenv==1.2.2",

    # Tools
    "tavily-python==0.7.24",

    # Observability
    "langfuse==4.6.1",

    # Eval
    "datasets==4.8.5",
    "numpy==2.4.6",
    "matplotlib==3.10.9",
]

# Development-only dependencies; not part of the runtime dependency list above.
[dependency-groups]
dev = [
    "pytest==9.0.3",
]

[tool.uv]
# Marks this as a non-package project for uv: the project itself is not
# built or installed, only its dependencies are.
package = false

[tool.pytest.ini_options]
# Put the repository root on sys.path so tests can import project modules.
pythonpath = ["."]
# Directory pytest collects from when invoked without explicit paths.
testpaths = ["tests"]