File size: 9,874 Bytes
7553a70
 
 
3f405a6
7553a70
 
 
 
 
3f405a6
7553a70
 
 
 
 
 
3f405a6
 
 
 
 
 
 
 
 
7553a70
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3f405a6
 
 
 
 
 
 
 
 
 
 
7553a70
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3f405a6
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
7553a70
 
 
 
a203f1b
3f405a6
 
a203f1b
 
 
 
 
3f405a6
 
7553a70
 
a203f1b
7553a70
 
 
 
 
 
 
 
 
 
 
 
 
a203f1b
7553a70
 
 
 
a203f1b
 
3f405a6
 
a203f1b
3f405a6
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
a203f1b
7553a70
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
"""FastAPI application factory and configuration."""

import os
import time
import traceback
from contextlib import asynccontextmanager
from pathlib import Path
from typing import Any

from fastapi import FastAPI, HTTPException, Request
from fastapi.exception_handlers import request_validation_exception_handler
from fastapi.exceptions import RequestValidationError
from fastapi.responses import JSONResponse
from loguru import logger
from starlette.types import Receive, Scope, Send

# Bounded in-memory log of the most recent errors, read by the debug endpoint.
_MAX_ERROR_HISTORY = 10
_error_history: list[dict] = []


def _record_error(error_dict: dict) -> None:
    """Append *error_dict* to the history, evicting the oldest entry when full."""
    _error_history.append(error_dict)
    overflow = len(_error_history) - _MAX_ERROR_HISTORY
    if overflow > 0:
        # Only one entry is added per call, so dropping the head is enough.
        del _error_history[0]

from config.logging_config import configure_logging
from config.paths import server_log_path
from config.settings import get_settings
from core.trace import extract_claude_session_id_from_headers, trace_event
from providers.exceptions import ProviderError

from .admin_routes import router as admin_router
from .routes import router
from .runtime import AppRuntime, startup_failure_message
from .validation_log import summarize_request_validation_body


@asynccontextmanager
async def lifespan(app: FastAPI):
    """Application lifespan manager.

    Builds the ``AppRuntime`` for *app* from the current settings, awaits its
    ``startup()`` before yielding control, and awaits its ``shutdown()`` when
    the context exits.
    """
    runtime = AppRuntime.for_app(app, settings=get_settings())
    # Startup stays outside the try block: if it raises, nothing was started
    # and shutdown must not run.
    await runtime.startup()
    try:
        yield
    finally:
        # Run shutdown even when an exception or cancellation is thrown into
        # the generator at the yield point.
        await runtime.shutdown()


class GracefulLifespanApp:
    """ASGI wrapper that reports startup failures without Starlette tracebacks.

    Non-lifespan scopes are forwarded unchanged to the wrapped app. The
    lifespan protocol is handled by this class, which drives the app's
    ``AppRuntime`` startup/shutdown and answers with the matching
    ``lifespan.*`` messages.
    """

    def __init__(self, app: FastAPI):
        self.app = app

    def __getattr__(self, name: str) -> Any:
        """Delegate attribute lookups that miss on the wrapper to the wrapped app."""
        # __getattr__ only runs when normal lookup fails. If ``app`` itself is
        # missing (instance created without __init__, e.g. via __new__ during
        # copy/unpickle), touching ``self.app`` below would re-enter this
        # method forever, so fail fast with the conventional AttributeError.
        if name == "app":
            raise AttributeError(name)
        return getattr(self.app, name)

    async def __call__(self, scope: Scope, receive: Receive, send: Send) -> None:
        """ASGI entry point: handle lifespan here, pass everything else through."""
        if scope["type"] != "lifespan":
            await self.app(scope, receive, send)
            return
        await self._lifespan(receive, send)

    async def _lifespan(self, receive: Receive, send: Send) -> None:
        """Run the lifespan message loop until startup fails or shutdown is handled.

        On a startup exception a ``lifespan.startup.failed`` message built by
        ``startup_failure_message`` is sent and the loop ends. On shutdown the
        runtime is only shut down if startup had completed.
        """
        settings = get_settings()
        runtime = AppRuntime.for_app(self.app, settings=settings)
        startup_complete = False
        while True:
            message = await receive()
            if message["type"] == "lifespan.startup":
                try:
                    await runtime.startup()
                except Exception as exc:
                    await send(
                        {
                            "type": "lifespan.startup.failed",
                            "message": startup_failure_message(settings, exc),
                        }
                    )
                    return
                startup_complete = True
                await send({"type": "lifespan.startup.complete"})
                continue

            if message["type"] == "lifespan.shutdown":
                if startup_complete:
                    try:
                        await runtime.shutdown()
                    except Exception as exc:
                        # Only the exception type is logged and the failure
                        # message sent back is left empty.
                        logger.error("Shutdown failed: exc_type={}", type(exc).__name__)
                        await send({"type": "lifespan.shutdown.failed", "message": ""})
                        return
                await send({"type": "lifespan.shutdown.complete"})
                return
            # Any other message type is ignored and the loop waits for the next one.


def create_app(*, lifespan_enabled: bool = True) -> FastAPI:
    """Create and configure the FastAPI application.

    Configures logging, registers the HTTP correlation middleware, the admin
    and main routers, the exception handlers, and two ``/debug`` endpoints.

    Args:
        lifespan_enabled: When true, the module-level ``lifespan`` context
            manager is passed to ``FastAPI``; when false the app is built
            without a lifespan handler.

    Returns:
        The configured ``FastAPI`` instance.
    """
    settings = get_settings()
    log_path = Path(os.getenv("LOG_FILE", server_log_path()))
    configure_logging(log_path, verbose_third_party=settings.log_raw_api_payloads)

    app_kwargs: dict[str, Any] = {
        "title": "Claude Code Proxy",
        "version": "2.0.0",
    }
    if lifespan_enabled:
        app_kwargs["lifespan"] = lifespan
    app = FastAPI(**app_kwargs)

    def _format_traceback(exc: BaseException) -> str:
        """Render the traceback carried by *exc* itself.

        Unlike ``traceback.format_exc()`` this does not depend on the handler
        being invoked while the exception is still the "currently handled"
        one, so it never degrades to ``"NoneType: None"``.
        """
        return "".join(
            traceback.format_exception(type(exc), exc, exc.__traceback__)
        )

    @app.middleware("http")
    async def trace_http_correlation(request: Request, call_next):
        """Attach HTTP identifiers and optional Claude session id to logs."""
        claude_sid = extract_claude_session_id_from_headers(request.headers)
        with logger.contextualize(
            http_method=request.method,
            http_path=request.url.path,
            claude_session_id=claude_sid,
        ):
            response = await call_next(request)
        return response

    # Register routes
    app.include_router(admin_router)
    app.include_router(router)

    # Exception handlers
    @app.exception_handler(RequestValidationError)
    async def validation_error_handler(request: Request, exc: RequestValidationError):
        """Log request shape for 422 debugging without content values."""
        body: Any
        try:
            body = await request.json()
        except Exception as e:
            # Best effort: an unreadable body is summarized by the error type only.
            body = {"_json_error": type(e).__name__}

        message_summary, tool_names = summarize_request_validation_body(body)

        errors = exc.errors()
        trace_event(
            stage="ingress",
            event="server.request.validation_failed",
            source="api",
            path=request.url.path,
            query=dict(request.query_params),
            error_locs=[list(error.get("loc", ())) for error in errors],
            error_types=[str(error.get("type", "")) for error in errors],
            message_summary=message_summary,
            tool_names=tool_names,
        )
        # The response itself is FastAPI's stock validation-error response.
        return await request_validation_exception_handler(request, exc)

    @app.exception_handler(ProviderError)
    async def provider_error_handler(request: Request, exc: ProviderError):
        """Handle provider-specific errors and return Anthropic format."""
        _record_error({
            "handler": "ProviderError",
            "type": type(exc).__name__,
            "error_type": exc.error_type,
            "status_code": exc.status_code,
            "message": exc.message,
            "traceback": _format_traceback(exc),
            "path": str(request.url),
            "method": request.method,
            "ts": time.time(),
        })
        err_settings = get_settings()
        # The provider message is only written to the log when error
        # tracebacks are enabled in settings.
        if err_settings.log_api_error_tracebacks:
            logger.error(
                "Provider Error: error_type={} status_code={} message={}",
                exc.error_type,
                exc.status_code,
                exc.message,
            )
        else:
            logger.error(
                "Provider Error: error_type={} status_code={}",
                exc.error_type,
                exc.status_code,
            )
        return JSONResponse(
            status_code=exc.status_code,
            content=exc.to_anthropic_format(),
        )

    @app.exception_handler(HTTPException)
    async def http_error_handler(request: Request, exc: HTTPException):
        """Capture HTTPException (e.g. from services.py 500) for debugging.

        The response mirrors the exception's status code and detail, and
        forwards any headers attached to the exception.
        """
        _record_error({
            "handler": "HTTPException",
            "type": "HTTPException",
            "status_code": exc.status_code,
            "detail": str(exc.detail),
            "path": str(request.url),
            "method": request.method,
            "ts": time.time(),
        })
        # NOTE(review): detail is stringified, so a dict/list detail reaches
        # the client as its Python repr — confirm this is intended.
        return JSONResponse(
            status_code=exc.status_code,
            content={"detail": str(exc.detail)},
            # Keep headers such as WWW-Authenticate that the raiser attached.
            headers=getattr(exc, "headers", None),
        )

    @app.exception_handler(Exception)
    async def general_error_handler(request: Request, exc: Exception):
        """Handle general errors and return Anthropic format."""
        settings = get_settings()
        tb_str = _format_traceback(exc)
        _record_error({
            "handler": "GeneralException",
            "type": type(exc).__name__,
            "message": str(exc),
            "traceback": tb_str,
            "path": str(request.url),
            "method": request.method,
            "ts": time.time(),
        })
        if settings.log_api_error_tracebacks:
            logger.error("General Error: {}", exc)
            logger.error(tb_str)
        else:
            logger.error(
                "General Error: path={} method={} exc_type={}",
                request.url.path,
                request.method,
                type(exc).__name__,
            )
        # NOTE(review): the exception type and message are returned to the
        # client verbatim — confirm that exposing internal error text is
        # acceptable for this deployment.
        return JSONResponse(
            status_code=500,
            content={
                "type": "error",
                "error": {
                    "type": "api_error",
                    "message": f"{type(exc).__name__}: {exc}",
                },
            },
        )

    # NOTE(review): the two /debug endpoints below are registered without any
    # authentication in this function, and /debug/last-error returns recorded
    # tracebacks and request URLs — confirm they are protected upstream or
    # disabled in production.
    @app.get("/debug/last-error")
    async def debug_last_error():
        """Return ALL recent errors for remote debugging."""
        if not _error_history:
            return {"status": "no errors recorded"}
        return {"errors": _error_history}

    @app.get("/debug/config")
    async def debug_config():
        """Show runtime config for diagnosing env var issues.

        Secrets are reported only as booleans (set / not set), never as values.
        """
        s = get_settings()
        return {
            "model": s.model,
            "model_opus": s.model_opus,
            "model_sonnet": s.model_sonnet,
            "model_haiku": s.model_haiku,
            "provider_type": s.provider_type,
            "nvidia_nim_api_key_set": bool(s.nvidia_nim_api_key),
            "env_NVIDIA_API_KEY_1": bool(os.environ.get("NVIDIA_API_KEY_1", "")),
            "env_NVIDIA_API_KEY_2": bool(os.environ.get("NVIDIA_API_KEY_2", "")),
            "env_NVIDIA_API_KEY_3": bool(os.environ.get("NVIDIA_API_KEY_3", "")),
            "env_GROQ_KEY_1": bool(os.environ.get("GROQ_KEY_1", "")),
            "env_GROQ_KEY_2": bool(os.environ.get("GROQ_KEY_2", "")),
            "anthropic_auth_token_set": bool(s.anthropic_auth_token),
            "provider_registry_exists": hasattr(app.state, "provider_registry") and app.state.provider_registry is not None,
        }

    return app


def create_asgi_app() -> GracefulLifespanApp:
    """Build the server ASGI app: a lifespan-less FastAPI app inside the graceful wrapper."""
    # The FastAPI lifespan is disabled because the wrapper handles the
    # lifespan protocol itself.
    inner_app = create_app(lifespan_enabled=False)
    return GracefulLifespanApp(inner_app)


# Module-level ASGI application object.
app = create_asgi_app()