Spaces:
Running
Running
File size: 5,816 Bytes
"""Reverse pipeline executor — the 7-step request lifecycle.

Pipeline: plan → account → proxy → serialize → execute → classify → feedback
This executor is opt-in. Existing products-layer code that calls transport
directly continues to work; the executor wraps the same pattern with
structured feedback and classification.
"""
import asyncio
from typing import Any
from app.platform.logging.logger import logger
from app.platform.runtime.clock import now_ms
from app.platform.errors import UpstreamError
from app.control.model.spec import ModelSpec
from app.dataplane.account import AccountDirectory, get_account_directory
from app.dataplane.account.lease import AccountLease
from app.dataplane.proxy import get_proxy_runtime
from .types import ReversePlan, ReverseLeaseSet, ReverseResult, ResultCategory
from .planner import build_plan
from .classifier import classify_result
from .feedback import build_proxy_feedback
# Strong references to in-flight feedback tasks. The event loop only keeps
# weak references to tasks, so a fire-and-forget task that nobody references
# may be garbage-collected before it finishes (and the account lease it is
# supposed to release would then stay reserved).
_PENDING_FEEDBACK_TASKS: set[asyncio.Task] = set()


async def execute(
    spec: ModelSpec,
    request: dict[str, Any],
    *,
    payload_builder: Any | None = None,
) -> ReverseResult:
    """Execute the full reverse pipeline for one request.

    Steps: plan → account → proxy → serialize → execute → classify → feedback.

    Parameters
    ----------
    spec : ModelSpec
        The resolved model specification.
    request : dict
        The raw API request body.
    payload_builder : callable, optional
        ``(plan, token, request) → bytes`` — serializes the request into the
        upstream payload format. If None, the request dict is JSON-encoded.

    Returns
    -------
    ReverseResult
        Classified outcome of the upstream call, with ``latency_ms`` measured
        from the start of this function. If no account lease can be reserved,
        a ``RATE_LIMITED`` result with error ``"No available accounts"`` is
        returned without contacting the upstream.

    Raises
    ------
    BaseException
        Anything raised (including cancellation) while acquiring the proxy or
        running the transport step is re-raised unchanged, after the reserved
        account lease has been released.
    """
    t0 = now_ms()

    # Step 1: Plan
    plan = build_plan(spec, request)

    # Step 2: Acquire account
    directory = await get_account_directory()
    lease = await directory.reserve(plan.pool_candidates, plan.mode_id)
    if lease is None:
        return ReverseResult(
            category=ResultCategory.RATE_LIMITED,
            error="No available accounts",
            latency_ms=int(now_ms() - t0),
        )

    try:
        # Step 3: Acquire proxy
        proxy_runtime = await get_proxy_runtime()
        proxy_lease = await proxy_runtime.acquire()
        leases = ReverseLeaseSet(
            account_idx=lease.idx,
            account_token=lease.token,
            proxy_lease=proxy_lease,
        )

        # Step 4-5: Serialize + Execute
        # Step 6: Classify (done inside _execute_transport)
        result = await _execute_transport(plan, leases, request, payload_builder)
        result.latency_ms = int(now_ms() - t0)
    except BaseException:
        # The feedback task below is the only other place the account lease
        # is released; if we never get there, release it here so the
        # reservation does not leak. BaseException is used deliberately so
        # that task cancellation is covered as well.
        try:
            await directory.release(lease)
        except Exception as release_exc:
            logger.debug(
                "reverse lease release failed (non-fatal): error={}",
                release_exc,
            )
        raise

    # Step 7: Feedback + release (fire-and-forget). Keep a reference until
    # the task completes so it cannot be collected mid-flight.
    feedback_task = asyncio.create_task(
        _apply_feedback_and_release(plan, leases, result, directory, lease),
    )
    _PENDING_FEEDBACK_TASKS.add(feedback_task)
    feedback_task.add_done_callback(_PENDING_FEEDBACK_TASKS.discard)

    return result
async def _execute_transport(
    plan: ReversePlan,
    leases: ReverseLeaseSet,
    request: dict[str, Any],
    payload_builder: Any | None,
) -> ReverseResult:
    """Serialize the request, send it upstream, and classify the outcome.

    The payload comes from ``payload_builder(plan, token, request)`` when a
    builder is supplied, otherwise from ``orjson.dumps(request)``.

    Outcomes:
      * ``post_json`` returns: a result classified from status 200 carrying
        the raw response as ``payload``.
      * ``UpstreamError``: a result classified from the error's status and
        the ``"body"`` entry of its details.
      * Any other ``Exception``: logged and reported as ``TRANSPORT_ERR``.
    """
    token = leases.account_token
    try:
        # Imports stay lazy and inside the try block, so an import failure is
        # reported as a transport error instead of propagating.
        import orjson

        encoded = (
            payload_builder(plan, token, request)
            if payload_builder
            else orjson.dumps(request)
        )

        from app.dataplane.reverse.transport.http import post_json

        response = await post_json(
            plan.endpoint,
            token,
            encoded,
            lease=leases.proxy_lease,
            timeout_s=plan.timeout_s,
            content_type=plan.content_type,
            origin=plan.origin,
            referer=plan.referer,
        )
        return ReverseResult(
            category=classify_result(200),
            status_code=200,
            payload=response,
        )
    except UpstreamError as upstream_exc:
        error_body = upstream_exc.details.get("body", "")
        outcome = classify_result(upstream_exc.status, error_body)
        return ReverseResult(
            category=outcome,
            status_code=upstream_exc.status,
            body=error_body,
            error=str(upstream_exc),
        )
    except Exception as unexpected:
        logger.error(
            "reverse transport execution failed: error_type={} error={}",
            type(unexpected).__name__,
            unexpected,
        )
        return ReverseResult(
            category=ResultCategory.TRANSPORT_ERR,
            error=str(unexpected),
        )
async def _apply_feedback_and_release(
    plan: ReversePlan,
    leases: ReverseLeaseSet,
    result: ReverseResult,
    directory: AccountDirectory,
    account_lease: AccountLease,
) -> None:
    """Release the account lease, then apply account and proxy feedback.

    Every step is best-effort and isolated from the others: a failure in one
    step is logged at debug level and the remaining steps still run. Nothing
    derived from ``Exception`` escapes this coroutine.

    Parameters
    ----------
    plan : ReversePlan
        Supplies ``mode_id`` for the account feedback call.
    leases : ReverseLeaseSet
        Supplies the account token and the (possibly falsy) proxy lease.
    result : ReverseResult
        The classified outcome that feedback is derived from.
    directory : AccountDirectory
        Used to release the lease and to record account feedback.
    account_lease : AccountLease
        The lease to release.
    """

    async def _release_account() -> None:
        # Release inflight counter.
        await directory.release(account_lease)

    async def _account_feedback() -> None:
        # Imported lazily, as in the rest of this module's optional paths.
        from app.control.account.enums import FeedbackKind

        category_to_feedback = {
            ResultCategory.SUCCESS: FeedbackKind.SUCCESS,
            ResultCategory.RATE_LIMITED: FeedbackKind.RATE_LIMITED,
            ResultCategory.AUTH_FAILURE: FeedbackKind.UNAUTHORIZED,
            ResultCategory.FORBIDDEN: FeedbackKind.FORBIDDEN,
            ResultCategory.UPSTREAM_5XX: FeedbackKind.SERVER_ERROR,
            ResultCategory.TRANSPORT_ERR: FeedbackKind.SERVER_ERROR,
            ResultCategory.UNKNOWN: FeedbackKind.SERVER_ERROR,
        }
        fb_kind = category_to_feedback.get(result.category)
        # Categories without a mapping produce no account feedback.
        if fb_kind is not None:
            await directory.feedback(
                leases.account_token,
                fb_kind,
                plan.mode_id,
            )

    async def _proxy_feedback() -> None:
        if leases.proxy_lease:
            proxy_fb = build_proxy_feedback(result)
            proxy_runtime = await get_proxy_runtime()
            await proxy_runtime.feedback(leases.proxy_lease, proxy_fb)

    # Order matters: the lease is released first so that a feedback failure
    # can never keep the account reserved.
    steps = (
        ("release", _release_account),
        ("account_feedback", _account_feedback),
        ("proxy_feedback", _proxy_feedback),
    )
    for step_name, step in steps:
        try:
            await step()
        except Exception as exc:
            logger.debug(
                "reverse feedback update failed (non-fatal): step={} error={}",
                step_name,
                exc,
            )
# Public API of this module: only the pipeline entry point is exported.
__all__ = ["execute"]
|