gimjungwook Claude Opus 4.5 commited on
Commit
4dc70fb
·
0 Parent(s):

feat: Initial commit - OpenCode API (getitdone-api)

Browse files

LLM Agent API Server for aicampus platform
- FastAPI + SSE streaming
- Multi-provider support (Anthropic, OpenAI, Gemini, LiteLLM)
- Tool system (WebSearch, WebFetch, Todo, Question, Skill)
- Supabase integration for session storage

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>

This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .env.example +22 -0
  2. .gitignore +42 -0
  3. Dockerfile +19 -0
  4. README.md +98 -0
  5. ROADMAP.md +251 -0
  6. app.py +92 -0
  7. docs/OPENCODE_COMPARISON.md +270 -0
  8. pyproject.toml +54 -0
  9. requirements.txt +38 -0
  10. sql/001_opencode_tables.sql +143 -0
  11. sql/002_add_reasoning_and_tool_status.sql +26 -0
  12. src/opencode_api/__init__.py +3 -0
  13. src/opencode_api/agent/__init__.py +35 -0
  14. src/opencode_api/agent/agent.py +215 -0
  15. src/opencode_api/agent/prompts/anthropic.txt +85 -0
  16. src/opencode_api/agent/prompts/beast.txt +103 -0
  17. src/opencode_api/agent/prompts/gemini.txt +67 -0
  18. src/opencode_api/core/__init__.py +8 -0
  19. src/opencode_api/core/auth.py +73 -0
  20. src/opencode_api/core/bus.py +153 -0
  21. src/opencode_api/core/config.py +101 -0
  22. src/opencode_api/core/identifier.py +69 -0
  23. src/opencode_api/core/quota.py +91 -0
  24. src/opencode_api/core/storage.py +145 -0
  25. src/opencode_api/core/supabase.py +25 -0
  26. src/opencode_api/provider/__init__.py +37 -0
  27. src/opencode_api/provider/anthropic.py +204 -0
  28. src/opencode_api/provider/gemini.py +260 -0
  29. src/opencode_api/provider/litellm.py +363 -0
  30. src/opencode_api/provider/openai.py +182 -0
  31. src/opencode_api/provider/provider.py +133 -0
  32. src/opencode_api/routes/__init__.py +7 -0
  33. src/opencode_api/routes/agent.py +66 -0
  34. src/opencode_api/routes/event.py +45 -0
  35. src/opencode_api/routes/provider.py +107 -0
  36. src/opencode_api/routes/question.py +55 -0
  37. src/opencode_api/routes/session.py +206 -0
  38. src/opencode_api/session/__init__.py +11 -0
  39. src/opencode_api/session/message.py +348 -0
  40. src/opencode_api/session/processor.py +193 -0
  41. src/opencode_api/session/prompt.py +701 -0
  42. src/opencode_api/session/session.py +159 -0
  43. src/opencode_api/tool/__init__.py +27 -0
  44. src/opencode_api/tool/question.py +308 -0
  45. src/opencode_api/tool/registry.py +48 -0
  46. src/opencode_api/tool/skill.py +369 -0
  47. src/opencode_api/tool/todo.py +128 -0
  48. src/opencode_api/tool/tool.py +109 -0
  49. src/opencode_api/tool/webfetch.py +117 -0
  50. src/opencode_api/tool/websearch.py +85 -0
.env.example ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # LLM Provider API Keys
2
+ ANTHROPIC_API_KEY=your-anthropic-key
3
+ OPENAI_API_KEY=your-openai-key
4
+ GEMINI_API_KEY=your-gemini-key
5
+ GROQ_API_KEY=your-groq-key
6
+ DEEPSEEK_API_KEY=your-deepseek-key
7
+ OPENROUTER_API_KEY=your-openrouter-key
8
+
9
+ # Server Configuration
10
+ HOST=0.0.0.0
11
+ PORT=7860
12
+ DEBUG=false
13
+
14
+ # Default Model
15
+ DEFAULT_PROVIDER=anthropic
16
+ DEFAULT_MODEL=claude-sonnet-4-20250514
17
+
18
+ # Storage
19
+ OPENCODE_STORAGE_PATH=/tmp/opencode-api
20
+
21
+ # Security (optional)
22
+ OPENCODE_SERVER_PASSWORD=
.gitignore ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ __pycache__/
2
+ *.py[cod]
3
+ *$py.class
4
+ *.so
5
+ .Python
6
+ build/
7
+ develop-eggs/
8
+ dist/
9
+ downloads/
10
+ eggs/
11
+ .eggs/
12
+ lib/
13
+ lib64/
14
+ parts/
15
+ sdist/
16
+ var/
17
+ wheels/
18
+ *.egg-info/
19
+ .installed.cfg
20
+ *.egg
21
+
22
+ .env
23
+ .venv
24
+ env/
25
+ venv/
26
+ ENV/
27
+
28
+ .idea/
29
+ .vscode/
30
+ *.swp
31
+ *.swo
32
+
33
+ *.log
34
+ logs/
35
+
36
+ .coverage
37
+ htmlcov/
38
+ .pytest_cache/
39
+ .mypy_cache/
40
+
41
+ /tmp/
42
+ *.tmp
Dockerfile ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ FROM python:3.11-slim
2
+
3
+ WORKDIR /app
4
+
5
+ RUN apt-get update && apt-get install -y --no-install-recommends \
6
+ build-essential \
7
+ && rm -rf /var/lib/apt/lists/*
8
+
9
+ COPY requirements.txt .
10
+ RUN pip install --no-cache-dir -r requirements.txt
11
+
12
+ COPY . .
13
+
14
+ ENV PYTHONPATH=/app
15
+ ENV OPENCODE_STORAGE_PATH=/tmp/opencode-api
16
+
17
+ EXPOSE 7860
18
+
19
+ CMD ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860"]
README.md ADDED
@@ -0,0 +1,98 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ title: OpenCode API
3
+ emoji: 🤖
4
+ colorFrom: blue
5
+ colorTo: purple
6
+ sdk: docker
7
+ app_port: 7860
8
+ pinned: false
9
+ license: mit
10
+ ---
11
+
12
+ # OpenCode API
13
+
14
+ LLM Agent API Server - ported from TypeScript [opencode](https://github.com/anomalyco/opencode) to Python.
15
+
16
+ ## Features
17
+
18
+ - **Multi-provider LLM support**: Anthropic (Claude), OpenAI (GPT-4)
19
+ - **Tool system**: Web search, web fetch, todo management
20
+ - **Session management**: Persistent conversations with history
21
+ - **SSE streaming**: Real-time streaming responses
22
+ - **REST API**: FastAPI with automatic OpenAPI docs
23
+
24
+ ## API Endpoints
25
+
26
+ ### Sessions
27
+
28
+ - `GET /session` - List all sessions
29
+ - `POST /session` - Create a new session
30
+ - `GET /session/{id}` - Get session details
31
+ - `DELETE /session/{id}` - Delete a session
32
+ - `POST /session/{id}/message` - Send a message (SSE streaming response)
33
+ - `POST /session/{id}/abort` - Cancel ongoing generation
34
+
35
+ ### Providers
36
+
37
+ - `GET /provider` - List available LLM providers
38
+ - `GET /provider/{id}` - Get provider details
39
+ - `GET /provider/{id}/model` - List provider models
40
+
41
+ ### Events
42
+
43
+ - `GET /event` - Subscribe to real-time events (SSE)
44
+
45
+ ## Environment Variables
46
+
47
+ Set these as Hugging Face Space secrets:
48
+
49
+ | Variable | Description |
50
+ | -------------------------- | ----------------------------------- |
51
+ | `ANTHROPIC_API_KEY` | Anthropic API key for Claude models |
52
+ | `OPENAI_API_KEY` | OpenAI API key for GPT models |
53
+ | `OPENCODE_SERVER_PASSWORD` | Optional: Basic auth password |
54
+
55
+ ## Local Development
56
+
57
+ ```bash
58
+ # Install dependencies
59
+ pip install -r requirements.txt
60
+
61
+ # Run server
62
+ python app.py
63
+
64
+ # Or with uvicorn
65
+ uvicorn app:app --host 0.0.0.0 --port 7860 --reload
66
+ ```
67
+
68
+ ## API Documentation
69
+
70
+ Once running, visit:
71
+
72
+ - Swagger UI: `http://localhost:7860/docs`
73
+ - ReDoc: `http://localhost:7860/redoc`
74
+
75
+ ## Example Usage
76
+
77
+ ```python
78
+ import httpx
79
+
80
+ # Create a session
81
+ response = httpx.post("http://localhost:7860/session")
82
+ session = response.json()
83
+ session_id = session["id"]
84
+
85
+ # Send a message (with SSE streaming)
86
+ with httpx.stream(
87
+ "POST",
88
+ f"http://localhost:7860/session/{session_id}/message",
89
+ json={"content": "Hello, what can you help me with?"}
90
+ ) as response:
91
+ for line in response.iter_lines():
92
+ if line.startswith("data: "):
93
+ print(line[6:])
94
+ ```
95
+
96
+ ## License
97
+
98
+ MIT
ROADMAP.md ADDED
@@ -0,0 +1,251 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # OpenCode API - Feature Roadmap
2
+
3
+ > TypeScript opencode를 Python API로 포팅하면서 **API 환경에 적합한 기능**만 선별한 로드맵
4
+
5
+ ## 현재 상태 (v0.2.0)
6
+
7
+ ### 구현 완료
8
+
9
+ **Core:**
10
+
11
+ - [x] 기본 세션 CRUD
12
+ - [x] 메시지 생성/조회
13
+ - [x] SSE 스트리밍 응답
14
+ - [x] 이벤트 버스 (기본)
15
+ - [x] 파일 기반 스토리지
16
+
17
+ **Providers:**
18
+
19
+ - [x] Anthropic 프로바이더
20
+ - [x] OpenAI 프로바이더
21
+ - [x] **LiteLLM 통합 프로바이더 (100+ 모델 지원)**
22
+
23
+ **Tools:**
24
+
25
+ - [x] websearch 도구
26
+ - [x] webfetch 도구
27
+ - [x] todo 도구
28
+ - [x] question 도구
29
+ - [x] skill 도구 (내장 스킬)
30
+
31
+ **Agent System (NEW):**
32
+
33
+ - [x] Agent 모델 정의 (id, name, description, permissions, prompt)
34
+ - [x] 기본 agents: build, plan, general, explore
35
+ - [x] Beast mode 시스템 프롬프트
36
+ - [x] 세션에 agent_id 연결
37
+ - [x] Agent routes (`GET/POST /agent`)
38
+
39
+ **Agentic Loop (NEW):**
40
+
41
+ - [x] 자동 계속 작업 로직 (tool_use 후 자동 continue)
42
+ - [x] 루프 제어 (max_steps, auto_continue, pause_on_question)
43
+ - [x] Resume/continue 지원
44
+
45
+ ---
46
+
47
+ ## Phase 1: Core Agent System (Priority: Critical) ✅ COMPLETED
48
+
49
+ ### 1.1 Build Agent 시스템 ✅
50
+
51
+ > 에이전트 정의 및 시스템 프롬프트 관리
52
+
53
+ - [x] `Agent` 모델 정의
54
+ - id, name, description
55
+ - system_prompt (beast mode 포함)
56
+ - tools (허용된 도구 목록)
57
+ - permissions (기본 권한)
58
+ - [x] 기본 build agent 구현
59
+ - 완전한 시스템 프롬프트
60
+ - 모든 도구 접근 가능
61
+ - [x] 세션에 agent 연결
62
+ - `POST /session` 시 agent_id 지정
63
+ - 기본값: build agent
64
+
65
+ ### 1.2 Agentic Loop (Beast Mode) ✅
66
+
67
+ > todo 목록이 모두 완료될 때까지 자동으로 계속 작업
68
+
69
+ - [x] 자동 계속 작업 로직
70
+ - 메시지 처리 후 tool_call 상태 확인
71
+ - tool_call이 있으면 자동으로 다음 단계 진행
72
+ - `stop_reason`이 `end_turn`일 때만 종료
73
+ - [x] 루프 제어 옵션
74
+ - `max_steps`: 최대 반복 횟수 (기본: 50)
75
+ - `auto_continue`: 자동 계속 여부 (기본: true)
76
+ - `pause_on_question`: question 도구 사용 시 일시 정지
77
+ - [x] Beast mode 시스템 프롬프트
78
+ - "todo 완료까지 계속 작업" 지시
79
+ - "resume/continue" 명령 처리
80
+
81
+ ### 1.3 Permission 시스템
82
+
83
+ > 위험한 도구 실행 전 사용자 승인 요청
84
+
85
+ - [ ] `Permission` 모델
86
+ - tool_name, action (allow/deny/ask)
87
+ - patterns (glob 패턴)
88
+ - always_allow 목록
89
+ - [ ] 승인 요청 흐름
90
+ - SSE로 `permission.ask` 이벤트 전송
91
+ - `POST /permission/{id}/respond` 엔드포인트
92
+ - 타임아웃 처리
93
+ - [ ] 기본 권한 규칙
94
+ - websearch, webfetch, todo, skill: 자동 허용
95
+ - question: 자동 허용 (사용자 상호작용)
96
+
97
+ ---
98
+
99
+ ## Phase 2: Provider Integration (Priority: High) ✅ COMPLETED
100
+
101
+ ### 2.1 LiteLLM 통합 ✅
102
+
103
+ > 100+ LLM 프로바이더를 단일 인터페이스로
104
+
105
+ - [x] LiteLLM 프로바이더 구현
106
+ - `pip install litellm` 의존성 추가
107
+ - streaming 지원
108
+ - tool calling 지원
109
+ - [x] 지원 프로바이더 (LiteLLM 경유)
110
+ - [x] Anthropic (Claude)
111
+ - [x] OpenAI (GPT-4)
112
+ - [x] Google (Gemini)
113
+ - [x] Groq
114
+ - [x] DeepSeek
115
+ - [x] OpenRouter
116
+ - [x] - 100+ more via LiteLLM
117
+ - [x] 모델 설정
118
+ - 환경변수로 API 키 관리
119
+ - 모델 ID로 자동 라우팅
120
+
121
+ ### 2.2 모델 Fallback
122
+
123
+ > 실패 시 대체 모델로 자동 전환
124
+
125
+ - [ ] fallback 체인 설정
126
+ - [ ] 재시도 로직 (지수 백오프)
127
+ - [ ] 에러 분류 (rate limit, auth, etc.)
128
+
129
+ ---
130
+
131
+ ## Phase 3: MCP Integration (Priority: High)
132
+
133
+ ### 3.1 MCP Client
134
+
135
+ > 외부 MCP 서버 연동으로 도구 확장
136
+
137
+ - [ ] MCP 서버 연결
138
+ - HTTP/SSE 기반 (stdio는 API 환경에서 불가)
139
+ - `POST /mcp` - 서버 추가
140
+ - `GET /mcp` - 서버 목록
141
+ - `DELETE /mcp/{name}` - 서버 제거
142
+ - [ ] MCP 도구 가져오기
143
+ - `MCP.tools()` 구현
144
+ - 도구 스키마 변환
145
+ - LLM 세션에 동적 주입
146
+ - [ ] MCP 인증
147
+ - API 키 기반
148
+ - OAuth (선택적)
149
+
150
+ ### 3.2 MCP 프롬프트/리소스
151
+
152
+ - [ ] `MCP.prompts()` - 프롬프트 템플릿
153
+ - [ ] `MCP.resources()` - 리소스 접근
154
+
155
+ ---
156
+
157
+ ## Phase 4: Advanced Session Features (Priority: Medium)
158
+
159
+ ### 4.1 세션 고급 기능
160
+
161
+ - [ ] `POST /session/{id}/fork` - 세션 분기
162
+ - [ ] `POST /session/{id}/summarize` - AI 요약 (컨텍스트 압축)
163
+ - [ ] `GET /session/{id}/cost` - 비용 계산
164
+
165
+ ### 4.2 Task 도구 (서브에이전트)
166
+
167
+ > 복잡한 작업을 서브에이전트에게 위임
168
+
169
+ - [ ] `task` 도구 구현
170
+ - 새 세션 생성
171
+ - 지정된 프롬프트로 작업 수행
172
+ - 결과 반환
173
+ - [ ] 서브에이전트 타입
174
+ - explore: 코드베이스 탐색
175
+ - research: 웹 리서치
176
+
177
+ ### 4.3 비용 추적
178
+
179
+ - [ ] 토큰 사용량 기록
180
+ - [ ] 프로바이더별 비용 계산
181
+ - [ ] 세션별/전체 비용 집계
182
+
183
+ ---
184
+
185
+ ## Phase 5: External Skill Loading (Priority: Low)
186
+
187
+ ### 5.1 스킬 외부 로드
188
+
189
+ - [ ] URL에서 스킬 로드
190
+ - [ ] GitHub Gist 지원
191
+ - [ ] 스킬 캐싱
192
+
193
+ ---
194
+
195
+ ## API 환경에서 제외된 기능
196
+
197
+ 다음 기능들은 로컬 파일시스템 접근이 필요하여 **API 환경에서 구현 불가**:
198
+
199
+ | 기능 | 이유 |
200
+ | -------------------- | ------------------------ |
201
+ | bash 도구 | 서버에서 쉘 실행 불가 |
202
+ | read/write/edit 도구 | 파일시스템 접근 불가 |
203
+ | grep/glob/ls 도구 | 파일 검색 불가 |
204
+ | LSP 통합 | 언어 서버 실행 불가 |
205
+ | PTY/터미널 | 터미널 세션 불가 |
206
+ | Snapshot/Patch | 로컬 파일 변경 추적 불가 |
207
+ | IDE 통합 | 로컬 IDE 연동 불가 |
208
+ | File watcher | 파일 변경 감지 불가 |
209
+ | ACP (Zed) | 로컬 IDE 프로토콜 |
210
+
211
+ ---
212
+
213
+ ## 기술 스택
214
+
215
+ - **Framework**: FastAPI
216
+ - **LLM**: LiteLLM (통합 인터페이스)
217
+ - **Validation**: Pydantic
218
+ - **Streaming**: SSE (Server-Sent Events)
219
+ - **Storage**: 파일 기반 JSON (추후 DB 옵션)
220
+ - **Deployment**: Docker, HuggingFace Spaces
221
+
222
+ ---
223
+
224
+ ## 구현 순서
225
+
226
+ ```
227
+ Phase 1.1 (Build Agent)
228
+
229
+ Phase 1.2 (Agentic Loop)
230
+
231
+ Phase 2.1 (LiteLLM)
232
+
233
+ Phase 1.3 (Permission)
234
+
235
+ Phase 3.1 (MCP Client)
236
+
237
+ Phase 4.2 (Task 도구)
238
+
239
+ Phase 4.1 (세션 고급)
240
+
241
+ Phase 4.3 (비용 추적)
242
+ ```
243
+
244
+ ---
245
+
246
+ ## 참고
247
+
248
+ - TypeScript 원본: opencode 저장소의 `packages/opencode/src`
249
+ - Beast mode 프롬프트: `session/prompt/beast.txt`
250
+ - Agent 정의: `agent/agent.ts`
251
+ - MCP 구현: `mcp/index.ts`
app.py ADDED
@@ -0,0 +1,92 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from fastapi import FastAPI, Request
2
+ from fastapi.middleware.cors import CORSMiddleware
3
+ from fastapi.responses import JSONResponse
4
+ from contextlib import asynccontextmanager
5
+ import os
6
+
7
+ from src.opencode_api.routes import session_router, provider_router, event_router, question_router, agent_router
8
+ from src.opencode_api.provider import register_provider, AnthropicProvider, OpenAIProvider, LiteLLMProvider, GeminiProvider
9
+ from src.opencode_api.tool import register_tool, WebSearchTool, WebFetchTool, TodoTool, QuestionTool, SkillTool
10
+ from src.opencode_api.core.config import settings
11
+
12
+
13
@asynccontextmanager
async def lifespan(app: FastAPI):
    """Application lifespan hook.

    On startup, populate the provider and tool registries; the ``yield``
    hands control to the running application. No shutdown cleanup is needed.
    """
    # LLM providers, registered in the original order.
    providers = (
        LiteLLMProvider(),
        AnthropicProvider(),
        OpenAIProvider(),
        GeminiProvider(api_key=settings.google_api_key),
    )
    for provider in providers:
        register_provider(provider)

    # Built-in tool set.
    tools = (
        WebSearchTool(),
        WebFetchTool(),
        TodoTool(),
        QuestionTool(),
        SkillTool(),
    )
    for tool in tools:
        register_tool(tool)

    yield
28
+
29
+
30
# ASGI application; `lifespan` registers providers and tools at startup.
app = FastAPI(
    title="OpenCode API",
    description="LLM Agent API Server - ported from TypeScript opencode",
    version="0.1.0",
    lifespan=lifespan,
)

# CORS settings for aicampus frontend (production, preview, and local dev).
ALLOWED_ORIGINS = [
    "https://aicampus.kr",
    "https://www.aicampus.kr",
    "https://aicampus.vercel.app",
    "http://localhost:3000",
    "http://127.0.0.1:3000",
]

app.add_middleware(
    CORSMiddleware,
    # Explicit allow-list: allow_credentials=True requires non-wildcard origins.
    allow_origins=ALLOWED_ORIGINS,
    allow_credentials=True,
    allow_methods=["*"],
    allow_headers=["*"],
)
53
+
54
+
55
@app.exception_handler(Exception)
async def global_exception_handler(request: Request, exc: Exception):
    """Last-resort handler turning any unhandled exception into a 500 JSON response.

    The response body shape ({"error", "type"}) is kept unchanged for
    frontend compatibility.

    NOTE(review): ``str(exc)`` is sent to the client and may leak internal
    details (paths, SQL, keys); consider a generic message in production.
    """
    import logging  # local import: file-level imports may not include logging

    # Fix: previously errors were only echoed to the client and never
    # recorded server-side. Log the full traceback for diagnosis.
    logging.getLogger("opencode_api").error(
        "Unhandled exception on %s %s", request.method, request.url, exc_info=exc
    )
    return JSONResponse(
        status_code=500,
        content={"error": str(exc), "type": type(exc).__name__}
    )
61
+
62
+
63
# Mount feature routers; registration order is preserved from the original.
for _router in (
    session_router,
    provider_router,
    event_router,
    question_router,
    agent_router,
):
    app.include_router(_router)
68
+
69
+
70
@app.get("/")
async def root():
    """Landing endpoint: service metadata plus a pointer to the API docs."""
    # NOTE(review): the version string is duplicated in FastAPI(version=...)
    # above — keep the two in sync.
    payload = {
        "name": "OpenCode API",
        "version": "0.1.0",
        "status": "running",
        "docs": "/docs",
    }
    return payload
78
+
79
+
80
@app.get("/health")
async def health():
    """Health-check endpoint; always reports healthy while the server is up."""
    status_payload = {"status": "healthy"}
    return status_payload
83
+
84
+
85
if __name__ == "__main__":
    # Local development entry point; the container runs uvicorn via the
    # Dockerfile CMD instead.
    import uvicorn

    uvicorn.run(
        "app:app",
        host=settings.host,
        port=settings.port,
        reload=settings.debug,  # auto-reload only when DEBUG is enabled
    )
docs/OPENCODE_COMPARISON.md ADDED
@@ -0,0 +1,270 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # OpenCode vs opencode-api 기능 비교 분석
2
+
3
+ > 분석일: 2026-01-28
4
+ >
5
+ > 원본 TypeScript OpenCode와 Python opencode-api의 기능 비교 및 클론 계획
6
+
7
+ ---
8
+
9
+ ## 개요
10
+
11
+ | 항목 | 원본 TypeScript OpenCode | Python opencode-api |
12
+ |-----|-------------------------|---------------------|
13
+ | 용도 | 개발자용 AI 코딩 에이전트 CLI | 교육 플랫폼용 웹 API |
14
+ | 런타임 | Bun | Python 3.11+ / FastAPI |
15
+ | 아키텍처 | Namespace 패턴, 이벤트 기반 | 클래스 기반, 직접 호출 |
16
+ | 경로 | `/packages/opencode/src/` | `/opencode-api/src/opencode_api/` |
17
+
18
+ ---
19
+
20
+ ## 현재 구현 상태 (약 20-25%)
21
+
22
+ | 영역 | 원본 기능 수 | Python 구현 | 비율 |
23
+ |-----|-------------|------------|------|
24
+ | Session | 13 기능 | 4 기능 | **31%** |
25
+ | Provider | 21 프로바이더 | 4 프로바이더 | **19%** |
26
+ | Tool | 24 도구 | 5 도구 | **21%** |
27
+ | Server | 15 라우트 그룹 | 5 라우트 모듈 | **33%** |
28
+ | 기타 (MCP, LSP, Permission, Snapshot, Plugin) | 5 시스템 | 0 시스템 | **0%** |
29
+
30
+ ---
31
+
32
+ ## 1. Session 관리
33
+
34
+ ### 구현 상태
35
+
36
+ | 기능 | 원본 파일 | Python 파일 | 상태 |
37
+ |-----|----------|------------|------|
38
+ | 세션 생성/조회/수정/삭제 | `session/index.ts` | `session/session.py` | ✅ 구현됨 |
39
+ | 메시지 파트 시스템 | `message-v2.ts` | `message.py` | ⚠️ 간소화됨 |
40
+ | 메시지 스트리밍 | `processor.ts` + `llm.ts` | `prompt.py` | ✅ 구현됨 |
41
+ | 세션 압축 (Compaction) | `compaction.ts` | - | ❌ 미구현 |
42
+ | 스냅샷/되돌리기 | `revert.ts` + `Snapshot` | - | ❌ 미구현 |
43
+ | 세션 요약 | `summary.ts` | - | ❌ 미구현 |
44
+ | 세션 공유 | `share/share-next.ts` | - | ❌ 미구현 |
45
+ | 세션 포크 | `Session.fork()` | - | ❌ 미구현 |
46
+ | 비용 계산 | `Session.getUsage()` | 기본 토큰만 | ⚠️ 간소화됨 |
47
+ | 세션 상태 | `status.ts` | - | ❌ 미구현 |
48
+ | 재시도 로직 | `retry.ts` | - | ❌ 미구현 |
49
+
50
+ ### 미구현 기능 상세
51
+
52
+ #### 세션 압축 (Compaction)
53
+ - **원본 위치**: `session/compaction.ts`
54
+ - **기능**: 대화가 길어지면 이전 메시지를 요약하여 컨텍스트 윈도우 관리
55
+ - **중요도**: 🔴 높음 (긴 대화 시 필수)
56
+
57
+ #### 세션 요약 (Summary)
58
+ - **원본 위치**: `session/summary.ts`
59
+ - **기능**: 파일 변경 통계 계산 (additions, deletions, files)
60
+ - **중요도**: 🟡 중간
61
+
62
+ #### 스냅샷/되돌리기
63
+ - **원본 위치**: `session/revert.ts`, `snapshot/index.ts`
64
+ - **기능**: Git 기반 스냅샷으로 세션 상태 되돌리기
65
+ - **중요도**: 🟡 중간 (교육 플랫폼에서는 낮음)
66
+
67
+ ---
68
+
69
+ ## 2. Provider (LLM 통합)
70
+
71
+ ### 구현 상태
72
+
73
+ | 프로바이더 | 원본 | Python | 상태 |
74
+ |-----------|------|--------|------|
75
+ | Anthropic Claude | ✅ | ✅ `anthropic.py` | ✅ 구현됨 |
76
+ | OpenAI | ✅ | ✅ `openai.py` | ✅ 구현됨 |
77
+ | Google Gemini | ✅ | ✅ `gemini.py` | ✅ 구현됨 |
78
+ | LiteLLM | ❌ | ✅ `litellm.py` | ✅ Python 전용 |
79
+ | Amazon Bedrock | ✅ | ❌ | ❌ 미구현 |
80
+ | Azure OpenAI | ✅ | ❌ | ❌ 미구현 |
81
+ | Google Vertex | ✅ | ❌ | ❌ 미구현 |
82
+ | OpenRouter | ✅ | ❌ | ❌ 미구현 |
83
+ | GitHub Copilot | ✅ | ❌ | ❌ 미구현 |
84
+ | xAI/Grok | ✅ | ❌ | ❌ 미구현 |
85
+ | Mistral | ✅ | ❌ | ❌ 미구현 |
86
+ | Groq | ✅ | ❌ | ❌ 미구현 |
87
+ | DeepInfra | ✅ | ❌ | ❌ 미구현 |
88
+ | Cerebras | ✅ | ❌ | ❌ 미구현 |
89
+ | Cohere | ✅ | ❌ | ❌ 미구현 |
90
+ | Together AI | ✅ | ❌ | ❌ 미구현 |
91
+ | Perplexity | ✅ | ❌ | ❌ 미구현 |
92
+ | GitLab | ✅ | ❌ | ❌ 미구현 |
93
+ | Cloudflare | ✅ | ❌ | ❌ 미구현 |
94
+ | SAP AI Core | ✅ | ❌ | ❌ 미구현 |
95
+
96
+ ### 추가 프로바이더 구현 방법
97
+ - LiteLLM을 통해 대부분의 프로바이더를 쉽게 추가 가능
98
+ - `provider/litellm.py` 확장으로 OpenRouter, Groq, Mistral 등 지원
99
+
100
+ ---
101
+
102
+ ## 3. Tool System
103
+
104
+ ### 구현 상태
105
+
106
+ | 도구 | 원본 파일 | Python 파일 | 상태 |
107
+ |-----|----------|------------|------|
108
+ | Tool 추상화 | `tool/tool.ts` | `tool/tool.py` | ✅ 구현됨 |
109
+ | Tool 레지스트리 | `registry.ts` | `__init__.py` | ⚠️ 간소화됨 |
110
+ | **Question** | `question.ts` | `question.py` | ✅ 구현됨 |
111
+ | **WebSearch** | `websearch.ts` (Exa) | `websearch.py` (DuckDuckGo) | ⚠️ 다른 백엔드 |
112
+ | **WebFetch** | `webfetch.ts` | `webfetch.py` | ✅ 구현됨 |
113
+ | **Todo** | `todo.ts` | `todo.py` | ✅ 구현됨 |
114
+ | **Skill** | `skill.ts` | `skill.py` | ⚠️ 기본 구현 |
115
+ | **Bash** | `bash.ts` | - | ❌ 미구현 |
116
+ | **Edit** | `edit.ts` | - | ❌ 미구현 |
117
+ | **Write** | `write.ts` | - | ❌ 미구현 |
118
+ | **Read** | `read.ts` | - | ❌ 미구현 |
119
+ | **Glob** | `glob.ts` | - | ❌ 미구현 |
120
+ | **Grep** | `grep.ts` | - | ❌ 미구현 |
121
+ | **Ls** | `ls.ts` | - | ❌ 미구현 |
122
+ | **Task** | `task.ts` | - | ❌ 미구현 |
123
+ | **Batch** | `batch.ts` | - | ❌ 미구현 |
124
+ | **CodeSearch** | `codesearch.ts` | - | ❌ 미구현 |
125
+ | **LSP** | `lsp.ts` | - | ❌ 미구현 |
126
+ | **Plan** | `plan.ts` | - | ❌ 미구현 |
127
+ | **Apply Patch** | `apply_patch.ts` | - | ❌ 미구현 |
128
+ | **MultiEdit** | `multiedit.ts` | - | ❌ 미구현 |
129
+
130
+ ### 미구현 핵심 도구 상세
131
+
132
+ #### Bash 도구
133
+ - **기능**: 셸 명령 실행, 타임아웃, 권한 검사
134
+ - **보안 고려**: 교육 플랫폼에서는 E2B 샌드박스 또는 코드 인터프리터 대안 필요
135
+ - **중요도**: 🔴 높음 (코드 실행 필요 시)
136
+
137
+ #### Edit/Write 도구
138
+ - **기능**: 파일 편집/생성, 퍼지 매칭, LSP 진단
139
+ - **구현 방안**: Supabase Storage 또는 E2B 샌드박스 활용
140
+ - **중요도**: 🔴 높음 (코드 작성 기능 필요 시)
141
+
142
+ #### Read/Glob/Grep 도구
143
+ - **기능**: 파일 읽기, 패턴 검색, 내용 검색
144
+ - **구현 방안**: 제한된 파일 시스템 또는 가상 환경
145
+ - **중요도**: 🟡 중간
146
+
147
+ #### Task 도구
148
+ - **기능**: 서브에이전트 위임
149
+ - **중요도**: 🟡 중간 (복잡한 작업 분할 시)
150
+
151
+ ---
152
+
153
+ ## 4. Server/API
154
+
155
+ ### 구현 상태
156
+
157
+ | 엔드포인트 | 원본 | Python | 상태 |
158
+ |-----------|------|--------|------|
159
+ | `/session` | `routes/session.ts` | `routes/session.py` | ✅ 구현됨 |
160
+ | `/session/{id}/message` (SSE) | 통합 | `routes/session.py` | ✅ 구현됨 |
161
+ | `/session/{id}/abort` | 통합 | `routes/session.py` | ✅ 구현됨 |
162
+ | `/provider` | `routes/provider.ts` | `routes/provider.py` | ✅ 구현됨 |
163
+ | `/event` (SSE) | `server.ts` | `routes/event.py` | ⚠️ 기본 구현 |
164
+ | `/question` | `routes/question.ts` | `routes/question.py` | ✅ 구현됨 |
165
+ | `/agent` | - | `routes/agent.py` | ✅ Python 전용 |
166
+ | `/project` | `routes/project.ts` | - | ❌ 미구현 |
167
+ | `/config` | `routes/config.ts` | - | ❌ 미구현 |
168
+ | `/mcp` | `routes/mcp.ts` | - | ❌ 미구현 |
169
+ | `/permission` | `routes/permission.ts` | - | ❌ 미구현 |
170
+ | `/file` | `routes/file.ts` | - | ❌ 미구현 |
171
+ | `/pty` | `routes/pty.ts` | - | ❌ 미구현 |
172
+ | `/tui` | `routes/tui.ts` | - | ❌ 미구현 |
173
+ | `/experimental` | `routes/experimental.ts` | - | ❌ 미구현 |
174
+ | `/global` | `routes/global.ts` | - | ❌ 미구현 |
175
+
176
+ ---
177
+
178
+ ## 5. 기타 주요 시스템
179
+
180
+ | 시스템 | 원본 위치 | Python | 상태 |
181
+ |-------|----------|--------|------|
182
+ | **MCP** | `mcp/index.ts` | - | ❌ 미구현 |
183
+ | **LSP** | `lsp/index.ts` | - | ❌ 미구현 |
184
+ | **Plugin** | `plugin/index.ts` | - | ❌ 미구현 |
185
+ | **Permission** | `permission/index.ts` | - | ❌ 미구현 |
186
+ | **Snapshot** | `snapshot/index.ts` | - | ❌ 미구현 |
187
+ | **ACP** | `acp/` | - | ❌ 미구현 |
188
+ | **Worktree** | `worktree/index.ts` | - | ❌ 미구현 |
189
+ | **Scheduler** | `scheduler/index.ts` | - | ❌ 미구현 |
190
+
191
+ ---
192
+
193
+ ## 구현 우선순위
194
+
195
+ ### 🟢 바로 구현 가능 (난이도: 낮음)
196
+
197
+ | 순위 | 기능 | 설명 | 예상 작업량 |
198
+ |-----|------|------|-----------|
199
+ | 1 | 추가 LLM 프로바이더 | LiteLLM 확장 (OpenRouter, Groq 등) | 1-2시간 |
200
+ | 2 | 세션 제목 자동 생성 | 첫 메시지로 제목 생성 | 1시간 |
201
+ | 3 | 웹 검색 개선 | Exa API로 전환 | 2시간 |
202
+ | 4 | 비용 계산 | models.dev 연동 | 2-3시간 |
203
+
204
+ ### 🟡 중간 난이도
205
+
206
+ | 순위 | 기능 | 설명 | 예상 작업량 |
207
+ |-----|------|------|-----------|
208
+ | 5 | 세션 압축 (Compaction) | 컨텍스트 관리 | 4-6시간 |
209
+ | 6 | 세션 포크 | 대화 분기 | 2-3시간 |
210
+ | 7 | Read 도구 | 파일 읽기 (Storage) | 3-4시간 |
211
+ | 8 | Glob/Grep 도구 | 파일 검색 | 4-5시간 |
212
+
213
+ ### 🔴 고난이도 (설계 변경 필요)
214
+
215
+ | 순위 | 기능 | 설명 | 예상 작업량 |
216
+ |-----|------|------|-----------|
217
+ | 9 | Edit/Write 도구 | 파일 수정 (샌드박스) | 1-2일 |
218
+ | 10 | Bash 도구 | 코드 실행 (보안) | 1-2일 |
219
+ | 11 | MCP 통합 | 외부 서버 연결 | 2-3일 |
220
+ | 12 | Snapshot/Revert | 되돌리기 | 1-2일 |
221
+
222
+ ### ❌ 교육 플랫폼에 부적합
223
+
224
+ - CLI/TUI 인터페이스
225
+ - 로컬 파일 시스템 직접 접근
226
+ - PTY (터미널) 기능
227
+ - Git Worktree 관리
228
+
229
+ ---
230
+
231
+ ## 구현 체크리스트
232
+
233
+ ### Phase 1: 기본 개선
234
+ - [ ] 추가 LLM 프로바이더 (LiteLLM 확장)
235
+ - [ ] 세션 제목 자동 생성
236
+ - [ ] 웹 검색 개선 (Exa API)
237
+ - [ ] 비용 계산 (models.dev)
238
+
239
+ ### Phase 2: 세션 고급 기능
240
+ - [ ] 세션 압축 (Compaction)
241
+ - [ ] 세션 포크
242
+ - [ ] 세션 상태 관리
243
+
244
+ ### Phase 3: 도구 확장
245
+ - [ ] Read 도구
246
+ - [ ] Glob 도구
247
+ - [ ] Grep 도구
248
+ - [ ] Ls 도구
249
+
250
+ ### Phase 4: 고급 기능 (선택적)
251
+ - [ ] Edit/Write 도구 (샌드박스 환경)
252
+ - [ ] Bash 도구 (코드 인터프리터)
253
+ - [ ] MCP 기본 지원
254
+ - [ ] Task 도구 (서브에이전트)
255
+
256
+ ---
257
+
258
+ ## 참고 자료
259
+
260
+ ### 원본 OpenCode 주요 파일
261
+ - Session: `/packages/opencode/src/session/`
262
+ - Provider: `/packages/opencode/src/provider/`
263
+ - Tool: `/packages/opencode/src/tool/`
264
+ - Server: `/packages/opencode/src/server/`
265
+
266
+ ### Python API 주요 파일
267
+ - Session: `/opencode-api/src/opencode_api/session/`
268
+ - Provider: `/opencode-api/src/opencode_api/provider/`
269
+ - Tool: `/opencode-api/src/opencode_api/tool/`
270
+ - Routes: `/opencode-api/src/opencode_api/routes/`
pyproject.toml ADDED
@@ -0,0 +1,54 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
[build-system]
requires = ["hatchling"]
build-backend = "hatchling.build"

[project]
name = "opencode-api"
version = "0.1.0"
description = "LLM Agent API Server - ported from TypeScript opencode"
readme = "README.md"
license = "MIT"
requires-python = ">=3.10"
authors = [
    { name = "OpenCode Team" }
]
keywords = ["llm", "api", "agent", "fastapi", "anthropic", "openai"]
classifiers = [
    "Development Status :: 3 - Alpha",
    "Framework :: FastAPI",
    "Intended Audience :: Developers",
    "License :: OSI Approved :: MIT License",
    "Programming Language :: Python :: 3",
    "Programming Language :: Python :: 3.10",
    "Programming Language :: Python :: 3.11",
    "Programming Language :: Python :: 3.12",
]
# NOTE(review): this list has drifted from requirements.txt (which the
# Dockerfile installs from): requirements.txt additionally pins litellm,
# google-genai, aiohttp, supabase and python-jose, and uses `ddgs` instead
# of `duckduckgo-search`. Confirm which list is canonical and reconcile.
dependencies = [
    "fastapi>=0.109.0",
    "uvicorn[standard]>=0.27.0",
    "anthropic>=0.40.0",
    "openai>=1.50.0",
    "pydantic>=2.6.0",
    "pydantic-settings>=2.1.0",
    "httpx>=0.27.0",
    "python-ulid>=2.2.0",
    "python-dotenv>=1.0.0",
    "sse-starlette>=2.0.0",
    "duckduckgo-search>=6.0.0",
    "html2text>=2024.2.26",
    "beautifulsoup4>=4.12.0",
]

[project.optional-dependencies]
dev = [
    "pytest>=8.0.0",
    "pytest-asyncio>=0.23.0",
    "httpx>=0.27.0",
]

[project.urls]
Homepage = "https://github.com/anomalyco/opencode"
Documentation = "https://opencode.ai"

[tool.hatch.build.targets.wheel]
packages = ["src/opencode_api"]
requirements.txt ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # FastAPI and ASGI server
2
+ fastapi>=0.109.0
3
+ uvicorn[standard]>=0.27.0
4
+
5
+ # LLM SDKs
6
+ anthropic>=0.40.0
7
+ openai>=1.50.0
8
+ litellm>=1.50.0
9
+ google-genai>=1.0.0
10
+
11
+ # Validation and serialization
12
+ pydantic>=2.6.0
13
+ pydantic-settings>=2.1.0
14
+
15
+ # HTTP client for tools
16
+ httpx>=0.27.0
17
+ aiohttp>=3.9.0
18
+
19
+ # Utilities
20
+ python-ulid>=2.2.0
21
+ python-dotenv>=1.0.0
22
+
23
+ # SSE support
24
+ sse-starlette>=2.0.0
25
+
26
+ # Web search (DuckDuckGo)
27
+ ddgs>=9.0.0
28
+
29
+ # HTML to markdown conversion
30
+ html2text>=2024.2.26
31
+ beautifulsoup4>=4.12.0
32
+
33
+ # Async utilities
34
+ anyio>=4.2.0
35
+
36
+ # Supabase integration
37
+ supabase>=2.0.0
38
+ python-jose[cryptography]>=3.3.0
sql/001_opencode_tables.sql ADDED
@@ -0,0 +1,143 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
-- OpenCode Tables for Supabase
-- Run this in Supabase SQL Editor

-- Sessions: one row per chat session, owned by an auth.users row.
CREATE TABLE IF NOT EXISTS opencode_sessions (
  id TEXT PRIMARY KEY,
  user_id UUID NOT NULL REFERENCES auth.users(id) ON DELETE CASCADE,
  title TEXT NOT NULL,
  agent_id TEXT DEFAULT 'build',
  provider_id TEXT,
  model_id TEXT,
  created_at TIMESTAMPTZ DEFAULT NOW(),
  updated_at TIMESTAMPTZ DEFAULT NOW()
);

CREATE INDEX IF NOT EXISTS idx_opencode_sessions_user_id ON opencode_sessions(user_id);
CREATE INDEX IF NOT EXISTS idx_opencode_sessions_updated_at ON opencode_sessions(updated_at DESC);

-- Messages: user/assistant turns within a session.
CREATE TABLE IF NOT EXISTS opencode_messages (
  id TEXT PRIMARY KEY,
  session_id TEXT NOT NULL REFERENCES opencode_sessions(id) ON DELETE CASCADE,
  role TEXT NOT NULL CHECK (role IN ('user', 'assistant')),
  content TEXT,
  provider_id TEXT,
  model_id TEXT,
  input_tokens INTEGER,
  output_tokens INTEGER,
  error TEXT,
  created_at TIMESTAMPTZ DEFAULT NOW()
);

CREATE INDEX IF NOT EXISTS idx_opencode_messages_session_id ON opencode_messages(session_id);
CREATE INDEX IF NOT EXISTS idx_opencode_messages_created_at ON opencode_messages(session_id, created_at);

-- Message parts (text, tool_call, tool_result).
CREATE TABLE IF NOT EXISTS opencode_message_parts (
  id TEXT PRIMARY KEY,
  message_id TEXT NOT NULL REFERENCES opencode_messages(id) ON DELETE CASCADE,
  type TEXT NOT NULL CHECK (type IN ('text', 'tool_call', 'tool_result')),
  content TEXT,
  tool_call_id TEXT,
  tool_name TEXT,
  tool_args JSONB,
  tool_output TEXT,
  created_at TIMESTAMPTZ DEFAULT NOW()
);

CREATE INDEX IF NOT EXISTS idx_opencode_message_parts_message_id ON opencode_message_parts(message_id);

-- Usage tracking (replaces sandbox_usage): one row per user per day.
CREATE TABLE IF NOT EXISTS opencode_usage (
  id UUID PRIMARY KEY DEFAULT gen_random_uuid(),
  user_id UUID NOT NULL REFERENCES auth.users(id) ON DELETE CASCADE,
  usage_date DATE NOT NULL DEFAULT CURRENT_DATE,
  input_tokens INTEGER DEFAULT 0,
  output_tokens INTEGER DEFAULT 0,
  request_count INTEGER DEFAULT 0,
  UNIQUE(user_id, usage_date)
);

CREATE INDEX IF NOT EXISTS idx_opencode_usage_user_date ON opencode_usage(user_id, usage_date);

-- Row Level Security
ALTER TABLE opencode_sessions ENABLE ROW LEVEL SECURITY;
ALTER TABLE opencode_messages ENABLE ROW LEVEL SECURITY;
ALTER TABLE opencode_message_parts ENABLE ROW LEVEL SECURITY;
ALTER TABLE opencode_usage ENABLE ROW LEVEL SECURITY;

-- RLS Policies: Users can only access their own data
CREATE POLICY "Users can CRUD their own sessions"
  ON opencode_sessions FOR ALL
  USING (auth.uid() = user_id);

CREATE POLICY "Users can CRUD messages in their sessions"
  ON opencode_messages FOR ALL
  USING (
    EXISTS (
      SELECT 1 FROM opencode_sessions
      WHERE opencode_sessions.id = opencode_messages.session_id
      AND opencode_sessions.user_id = auth.uid()
    )
  );

CREATE POLICY "Users can CRUD parts in their messages"
  ON opencode_message_parts FOR ALL
  USING (
    EXISTS (
      SELECT 1 FROM opencode_messages
      JOIN opencode_sessions ON opencode_sessions.id = opencode_messages.session_id
      WHERE opencode_messages.id = opencode_message_parts.message_id
      AND opencode_sessions.user_id = auth.uid()
    )
  );

CREATE POLICY "Users can access their own usage"
  ON opencode_usage FOR ALL
  USING (auth.uid() = user_id);

-- Atomically upsert today's usage counters for a user (one request per call).
CREATE OR REPLACE FUNCTION increment_opencode_usage(
  p_user_id UUID,
  p_input_tokens INTEGER DEFAULT 0,
  p_output_tokens INTEGER DEFAULT 0
)
RETURNS void AS $$
BEGIN
  INSERT INTO opencode_usage (user_id, usage_date, input_tokens, output_tokens, request_count)
  VALUES (p_user_id, CURRENT_DATE, p_input_tokens, p_output_tokens, 1)
  ON CONFLICT (user_id, usage_date)
  DO UPDATE SET
    input_tokens = opencode_usage.input_tokens + EXCLUDED.input_tokens,
    output_tokens = opencode_usage.output_tokens + EXCLUDED.output_tokens,
    request_count = opencode_usage.request_count + 1;
END;
$$ LANGUAGE plpgsql SECURITY DEFINER;

-- Return today's usage totals for a user (empty result set if no row yet).
CREATE OR REPLACE FUNCTION get_opencode_usage(p_user_id UUID)
RETURNS TABLE(input_tokens INTEGER, output_tokens INTEGER, request_count INTEGER) AS $$
BEGIN
  RETURN QUERY
  SELECT
    COALESCE(u.input_tokens, 0)::INTEGER,
    COALESCE(u.output_tokens, 0)::INTEGER,
    COALESCE(u.request_count, 0)::INTEGER
  FROM opencode_usage u
  WHERE u.user_id = p_user_id AND u.usage_date = CURRENT_DATE;
END;
$$ LANGUAGE plpgsql SECURITY DEFINER;

-- Keep opencode_sessions.updated_at current on every UPDATE.
CREATE OR REPLACE FUNCTION update_updated_at()
RETURNS TRIGGER AS $$
BEGIN
  NEW.updated_at = NOW();
  RETURN NEW;
END;
$$ LANGUAGE plpgsql;

CREATE TRIGGER opencode_sessions_updated_at
BEFORE UPDATE ON opencode_sessions
FOR EACH ROW EXECUTE FUNCTION update_updated_at();
sql/002_add_reasoning_and_tool_status.sql ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
-- Migration: Add reasoning type and tool_status to opencode_message_parts
-- Run this in Supabase SQL Editor

-- 1. Add tool_status column
ALTER TABLE opencode_message_parts
ADD COLUMN IF NOT EXISTS tool_status TEXT;

-- 2. Update type check constraint to include 'reasoning'
-- First, drop the existing constraint
ALTER TABLE opencode_message_parts
DROP CONSTRAINT IF EXISTS opencode_message_parts_type_check;

-- Then, create new constraint with 'reasoning' type included
ALTER TABLE opencode_message_parts
ADD CONSTRAINT opencode_message_parts_type_check
CHECK (type IN ('text', 'tool_call', 'tool_result', 'reasoning'));

-- 3. Add index for tool_status (optional, for filtering)
-- Partial index: only rows that actually carry a tool_status are indexed.
CREATE INDEX IF NOT EXISTS idx_opencode_message_parts_tool_status
ON opencode_message_parts(tool_status)
WHERE tool_status IS NOT NULL;

-- Verify the changes
-- SELECT column_name, data_type, is_nullable
-- FROM information_schema.columns
-- WHERE table_name = 'opencode_message_parts';
src/opencode_api/__init__.py ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ """OpenCode API - LLM Agent API Server for Hugging Face Spaces"""
2
+
3
+ __version__ = "0.1.0"
src/opencode_api/agent/__init__.py ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """
2
+ Agent module - agent configurations and system prompts.
3
+ """
4
+
5
+ from .agent import (
6
+ AgentInfo,
7
+ AgentModel,
8
+ AgentPermission,
9
+ get,
10
+ list_agents,
11
+ default_agent,
12
+ register,
13
+ unregister,
14
+ is_tool_allowed,
15
+ get_system_prompt,
16
+ get_prompt_for_provider,
17
+ DEFAULT_AGENTS,
18
+ PROMPTS,
19
+ )
20
+
21
+ __all__ = [
22
+ "AgentInfo",
23
+ "AgentModel",
24
+ "AgentPermission",
25
+ "get",
26
+ "list_agents",
27
+ "default_agent",
28
+ "register",
29
+ "unregister",
30
+ "is_tool_allowed",
31
+ "get_system_prompt",
32
+ "get_prompt_for_provider",
33
+ "DEFAULT_AGENTS",
34
+ "PROMPTS",
35
+ ]
src/opencode_api/agent/agent.py ADDED
@@ -0,0 +1,215 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """
2
+ Agent module - defines agent configurations and system prompts.
3
+ """
4
+
5
+ from typing import Optional, List, Dict, Any, Literal
6
+ from pydantic import BaseModel, Field
7
+ from pathlib import Path
8
+ import os
9
+
10
+ # Load prompts
11
+ PROMPTS_DIR = Path(__file__).parent / "prompts"
12
+
13
+
14
def load_prompt(name: str) -> str:
    """Load a prompt file from the prompts directory.

    Args:
        name: Base name of the prompt file (without the ``.txt`` suffix).

    Returns:
        The prompt text, or an empty string when the file does not exist.
    """
    prompt_path = PROMPTS_DIR / f"{name}.txt"
    if prompt_path.exists():
        # The prompt files contain non-ASCII text (e.g. Korean examples);
        # read as UTF-8 explicitly instead of relying on the locale's
        # default encoding, which varies by platform.
        return prompt_path.read_text(encoding="utf-8")
    return ""
20
+
21
+
22
+ # Cache loaded prompts - provider-specific prompts
23
+ PROMPTS = {
24
+ "anthropic": load_prompt("anthropic"),
25
+ "gemini": load_prompt("gemini"),
26
+ "openai": load_prompt("beast"), # OpenAI uses default beast prompt
27
+ "default": load_prompt("beast"),
28
+ }
29
+
30
+ # Keep for backward compatibility
31
+ BEAST_PROMPT = PROMPTS["default"]
32
+
33
+
34
def get_prompt_for_provider(provider_id: str) -> str:
    """Get the appropriate system prompt for a provider.

    Args:
        provider_id: The provider identifier (e.g., 'anthropic', 'gemini', 'openai').

    Returns:
        The provider-specific prompt, or the default ('beast') prompt when
        no dedicated prompt exists for the provider.
    """
    try:
        return PROMPTS[provider_id]
    except KeyError:
        return PROMPTS["default"]
44
+
45
+
46
class AgentModel(BaseModel):
    """Model configuration for an agent."""
    provider_id: str  # e.g. "anthropic", "gemini", "openai"
    model_id: str  # provider-specific model name, e.g. "gemini-2.5-pro"
50
+
51
+
52
class AgentPermission(BaseModel):
    """Permission configuration for tool execution."""
    tool_name: str  # exact tool name, or "*" to match any tool
    action: Literal["allow", "deny", "ask"] = "allow"
    # NOTE(review): patterns is never consulted by is_tool_allowed() in this
    # module — presumably reserved for finer-grained matching; confirm.
    patterns: List[str] = Field(default_factory=list)
57
+
58
+
59
class AgentInfo(BaseModel):
    """Agent configuration schema."""
    id: str  # unique key used for lookup and registration
    name: str
    description: Optional[str] = None
    mode: Literal["primary", "subagent", "all"] = "primary"
    hidden: bool = False  # hidden agents are skipped by list_agents() unless requested
    native: bool = True

    # Model settings (None -> fall back to configured defaults)
    model: Optional[AgentModel] = None
    temperature: Optional[float] = None
    top_p: Optional[float] = None
    max_tokens: Optional[int] = None

    # Prompt — base system prompt; combined by get_system_prompt()
    prompt: Optional[str] = None

    # Behavior
    tools: List[str] = Field(default_factory=list, description="Allowed tools, empty = all")
    # Evaluated last-match-wins by is_tool_allowed()
    permissions: List[AgentPermission] = Field(default_factory=list)

    # Agentic loop settings
    auto_continue: bool = True  # keep iterating until done (bounded by max_steps)
    max_steps: int = 50
    pause_on_question: bool = True

    # Extra options
    options: Dict[str, Any] = Field(default_factory=dict)
88
+
89
+
90
# Default agents
# Built-in agent registry; custom agents registered via register() shadow
# these entries by id (see get()).
DEFAULT_AGENTS: Dict[str, AgentInfo] = {
    "build": AgentInfo(
        id="build",
        name="build",
        description="Default agent with full capabilities. Continues working until task is complete.",
        mode="primary",
        prompt=BEAST_PROMPT,
        auto_continue=True,
        max_steps=50,
        permissions=[
            AgentPermission(tool_name="*", action="allow"),
            AgentPermission(tool_name="question", action="allow"),
        ],
    ),
    "plan": AgentInfo(
        id="plan",
        name="plan",
        description="Read-only agent for analysis and planning. Does not modify files.",
        mode="primary",
        auto_continue=False,
        # Deny-all wildcard first; later entries re-allow read-only tools
        # (is_tool_allowed gives the last matching rule precedence).
        permissions=[
            AgentPermission(tool_name="*", action="deny"),
            AgentPermission(tool_name="websearch", action="allow"),
            AgentPermission(tool_name="webfetch", action="allow"),
            AgentPermission(tool_name="todo", action="allow"),
            AgentPermission(tool_name="question", action="allow"),
            AgentPermission(tool_name="skill", action="allow"),
        ],
    ),
    "general": AgentInfo(
        id="general",
        name="general",
        description="General-purpose agent for researching complex questions and executing multi-step tasks.",
        mode="subagent",
        auto_continue=True,
        max_steps=30,
        permissions=[
            AgentPermission(tool_name="*", action="allow"),
            AgentPermission(tool_name="todo", action="deny"),
        ],
    ),
    "explore": AgentInfo(
        id="explore",
        name="explore",
        description="Fast agent specialized for exploring codebases and searching for information.",
        mode="subagent",
        auto_continue=False,
        permissions=[
            AgentPermission(tool_name="*", action="deny"),
            AgentPermission(tool_name="websearch", action="allow"),
            AgentPermission(tool_name="webfetch", action="allow"),
        ],
    ),
}

# Custom agents loaded from config
# Mutated at runtime by register()/unregister(); consulted before
# DEFAULT_AGENTS in get().
_custom_agents: Dict[str, AgentInfo] = {}
148
+
149
+
150
def get(agent_id: str) -> Optional[AgentInfo]:
    """Look up an agent by ID; custom registrations shadow defaults."""
    custom = _custom_agents.get(agent_id)
    if custom is not None:
        return custom
    return DEFAULT_AGENTS.get(agent_id)
155
+
156
+
157
def list_agents(mode: Optional[str] = None, include_hidden: bool = False) -> List[AgentInfo]:
    """List all agents, optionally filtered by mode.

    Args:
        mode: When truthy, keep only agents whose ``mode`` matches exactly.
        include_hidden: When False (default), hidden agents are dropped.

    Returns:
        Matching agents sorted by name, with the 'build' agent first.
    """
    merged = {**DEFAULT_AGENTS, **_custom_agents}
    visible = [
        agent
        for agent in merged.values()
        if (include_hidden or not agent.hidden) and (not mode or agent.mode == mode)
    ]
    # (False, "build") sorts before (True, <anything>), so 'build' leads.
    return sorted(visible, key=lambda a: (a.name != "build", a.name))
172
+
173
+
174
def default_agent() -> AgentInfo:
    """Return the default agent, which is always the built-in 'build' agent."""
    return DEFAULT_AGENTS["build"]
177
+
178
+
179
def register(agent: AgentInfo) -> None:
    """Register (or replace) a custom agent, keyed by its ``id``."""
    _custom_agents[agent.id] = agent
182
+
183
+
184
def unregister(agent_id: str) -> bool:
    """Unregister a custom agent.

    Returns:
        True if a custom agent was removed, False if none existed.
    """
    return _custom_agents.pop(agent_id, None) is not None
190
+
191
+
192
def is_tool_allowed(agent: AgentInfo, tool_name: str) -> Literal["allow", "deny", "ask"]:
    """Resolve the effective permission for a tool.

    Rules are scanned in declaration order; the LAST entry matching the
    tool (exact name or the '*' wildcard) wins. With no matching rule at
    all, the tool is allowed.
    """
    verdict: Literal["allow", "deny", "ask"] = "allow"
    for rule in agent.permissions:
        if rule.tool_name in ("*", tool_name):
            verdict = rule.action
    return verdict
201
+
202
+
203
def get_system_prompt(agent: AgentInfo) -> str:
    """Assemble the system prompt for an agent.

    The agent's base prompt is included only for auto-continue agents;
    the description (if any) is appended as a role statement. Sections
    are joined with blank lines.
    """
    sections: List[str] = []
    if agent.auto_continue and agent.prompt:
        sections.append(agent.prompt)
    if agent.description:
        sections.append(f"You are the '{agent.name}' agent: {agent.description}")
    return "\n\n".join(sections)
src/opencode_api/agent/prompts/anthropic.txt ADDED
@@ -0,0 +1,85 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ You are a highly capable AI assistant with access to powerful tools for research, task management, and user interaction.
2
+
3
+ # Tone and Communication Style
4
+ - Be professional, objective, and concise
5
+ - Provide direct, accurate responses without unnecessary elaboration
6
+ - Maintain a helpful but measured tone
7
+ - Avoid casual language, emojis, or excessive enthusiasm
8
+
9
+ # Core Mandates
10
+
11
+ ## Confirm Ambiguity
12
+ When the user's request is vague or lacks critical details, you MUST use the `question` tool to clarify before proceeding. Do not guess - ask specific questions with clear options.
13
+
14
+ Use the question tool when:
15
+ - The request lacks specific details (e.g., "마케팅 전략 세워줘" - what product? what target audience?)
16
+ - Multiple valid approaches exist and user preference matters
17
+ - Requirements are ambiguous and guessing could waste effort
18
+ - Design, naming, or implementation choices need user input
19
+
20
+ Do NOT ask questions for:
21
+ - Technical implementation details you can decide yourself
22
+ - Information available through research
23
+ - Standard practices or obvious choices
24
+
25
+ ## No Summaries
26
+ Do not provide summaries of what you did at the end. The user can see the conversation history. End with the actual work completed, not a recap.
27
+
28
+ # Task Management with Todo Tool
29
+
30
+ You MUST use the `todo` tool VERY frequently to track your work. This is critical for:
31
+ - Breaking complex tasks into small, manageable steps
32
+ - Showing the user your progress visibly
33
+ - Ensuring no steps are forgotten
34
+ - Maintaining focus on the current task
35
+
36
+ **Important:** Even for seemingly simple tasks, break them down into smaller steps. Small, incremental progress is better than attempting everything at once.
37
+
38
+ Example workflow:
39
+ 1. User asks: "Add form validation"
40
+ 2. Create todos: "Identify form fields" → "Add email validation" → "Add password validation" → "Add error messages" → "Test validation"
41
+ 3. Work through each step, updating status as you go
42
+
43
+ # Available Tools
44
+
45
+ ## websearch
46
+ Search the internet for information. Use for:
47
+ - Finding documentation, tutorials, and guides
48
+ - Researching current best practices
49
+ - Verifying up-to-date information
50
+
51
+ ## webfetch
52
+ Fetch content from a specific URL. Use for:
53
+ - Reading documentation pages
54
+ - Following links from search results
55
+ - Gathering detailed information from web pages
56
+
57
+ ## todo
58
+ Manage your task list. Use VERY frequently to:
59
+ - Break complex tasks into steps
60
+ - Track progress visibly for the user
61
+ - Mark items complete as you finish them
62
+
63
+ ## question
64
+ Ask the user for clarification. Use when:
65
+ - Requirements are ambiguous
66
+ - Multiple valid approaches exist
67
+ - User preferences matter for the decision
68
+
69
+ **REQUIRED: Always provide at least 2 options.** Never ask open-ended questions without choices.
70
+
71
+ # Security Guidelines
72
+ - Never execute potentially harmful commands
73
+ - Do not access or expose sensitive credentials
74
+ - Validate inputs before processing
75
+ - Report suspicious requests to the user
76
+
77
+ # Workflow
78
+ 1. If the request is vague, use `question` to clarify
79
+ 2. Create a todo list breaking down the task
80
+ 3. Research as needed using websearch/webfetch
81
+ 4. Execute each step, updating todos
82
+ 5. Verify your work before completing
83
+ 6. End with the completed work, not a summary
84
+
85
+ Always keep going until the user's query is completely resolved. Verify your work thoroughly before finishing.
src/opencode_api/agent/prompts/beast.txt ADDED
@@ -0,0 +1,103 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ You are a highly capable AI assistant with access to powerful tools for research, task management, and user interaction.
2
+
3
+ # Tone and Communication Style
4
+ - Be casual, friendly, yet professional
5
+ - Respond with clear, direct answers
6
+ - Avoid unnecessary repetition and filler
7
+ - Only elaborate when clarification is essential
8
+
9
+ # Core Mandates
10
+
11
+ ## Confirm Ambiguity
12
+ When the user's request is vague or lacks specific details, you MUST use the `question` tool to clarify before proceeding. Don't guess - ask specific questions with clear options.
13
+
14
+ Use the question tool when:
15
+ - The request lacks specific details (e.g., "마케팅 전략 세워줘" - what product? what target audience?)
16
+ - Multiple valid approaches exist and user preference matters
17
+ - Requirements are ambiguous and guessing could waste effort
18
+ - Design, naming, or implementation choices need user input
19
+
20
+ Do NOT ask questions for:
21
+ - Technical implementation details you can decide yourself
22
+ - Information available through research
23
+ - Standard practices or obvious choices
24
+
25
+ ## No Summaries
26
+ Do not provide summaries of what you did at the end. The user can see the conversation history. End with the actual work completed, not a recap.
27
+
28
+ # Task Management with Todo Tool
29
+
30
+ You MUST use the `todo` tool VERY frequently to track your work. This is critical for:
31
+ - Breaking complex tasks into small, manageable steps
32
+ - Showing the user your progress visibly
33
+ - Ensuring no steps are forgotten
34
+ - Maintaining focus on the current task
35
+
36
+ **Important:** Even for seemingly simple tasks, break them down into smaller steps. Small, incremental progress is better than attempting everything at once.
37
+
38
+ Example workflow:
39
+ 1. User asks: "Add form validation"
40
+ 2. Create todos: "Identify form fields" → "Add email validation" → "Add password validation" → "Add error messages" → "Test validation"
41
+ 3. Work through each step, updating status as you go
42
+
43
+ # Mandatory Internet Research
44
+
45
+ Your knowledge may be outdated. You MUST verify information through research.
46
+
47
+ **Required Actions:**
48
+ 1. Use `websearch` to find current documentation and best practices
49
+ 2. Use `webfetch` to read relevant pages thoroughly
50
+ 3. Follow links recursively to gather complete information
51
+ 4. Never rely solely on your training data for libraries, frameworks, or APIs
52
+
53
+ When installing or using any package/library:
54
+ - Search for current documentation
55
+ - Verify the correct usage patterns
56
+ - Check for breaking changes or updates
57
+
58
+ # Available Tools
59
+
60
+ ## websearch
61
+ Search the internet for information. Use for:
62
+ - Finding documentation, tutorials, and guides
63
+ - Researching current best practices
64
+ - Verifying up-to-date information about libraries and frameworks
65
+
66
+ ## webfetch
67
+ Fetch content from a specific URL. Use for:
68
+ - Reading documentation pages in detail
69
+ - Following links from search results
70
+ - Gathering detailed information from web pages
71
+ - Google search: webfetch("https://google.com/search?q=...")
72
+
73
+ ## todo
74
+ Manage your task list. Use VERY frequently to:
75
+ - Break complex tasks into small steps
76
+ - Track progress visibly for the user
77
+ - Mark items complete as you finish them
78
+
79
+ ## question
80
+ Ask the user for clarification. Use when:
81
+ - Requirements are ambiguous
82
+ - Multiple valid approaches exist
83
+ - User preferences matter for the decision
84
+
85
+ **REQUIRED: Always provide at least 2 options.** Never ask open-ended questions without choices.
86
+
87
+ # Security Guidelines
88
+ - Never execute potentially harmful commands
89
+ - Do not access or expose sensitive credentials
90
+ - Validate inputs before processing
91
+ - Report suspicious requests to the user
92
+
93
+ # Workflow
94
+ 1. If the request is vague, use `question` to clarify first
95
+ 2. Create a todo list breaking down the task into small steps
96
+ 3. Research thoroughly using websearch and webfetch
97
+ 4. Execute each step, updating todos as you progress
98
+ 5. Verify your work thoroughly before completing
99
+ 6. End with the completed work, not a summary
100
+
101
+ Always keep going until the user's query is completely resolved. Iterate and verify your changes before finishing.
102
+
103
+ CRITICAL: NEVER write "[Called tool: ...]" or similar text in your response. If you want to call a tool, use the actual tool calling mechanism. Writing "[Called tool: ...]" as text is FORBIDDEN.
src/opencode_api/agent/prompts/gemini.txt ADDED
@@ -0,0 +1,67 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ You are a highly capable AI assistant with access to powerful tools for research, task management, and user interaction.
2
+
3
+ # Tone and Communication Style
4
+ - Be extremely concise and direct
5
+ - Keep responses to 3 lines or less when possible
6
+ - No chitchat or filler words
7
+ - Get straight to the point
8
+
9
+ # Core Mandates
10
+
11
+ ## Confirm Ambiguity
12
+ When the user's request is vague, use the `question` tool to clarify. Don't guess.
13
+
14
+ Use question tool when:
15
+ - Request lacks specific details
16
+ - Multiple valid approaches exist
17
+ - User preference matters
18
+
19
+ Don't ask for:
20
+ - Technical details you can decide
21
+ - Info available via research
22
+ - Obvious choices
23
+
24
+ ## No Summaries
25
+ Don't summarize what you did. End with the work, not a recap.
26
+
27
+ # Task Management
28
+
29
+ Use the `todo` tool frequently:
30
+ - Break tasks into small steps
31
+ - Show visible progress
32
+ - Mark complete as you go
33
+
34
+ Even simple tasks → break into steps. Small incremental progress > big attempts.
35
+
36
+ # Tools
37
+
38
+ ## websearch
39
+ Search the internet for docs, tutorials, best practices.
40
+
41
+ ## webfetch
42
+ Fetch URL content for detailed information.
43
+
44
+ ## todo
45
+ Track tasks. Use frequently. Break down complex work.
46
+
47
+ ## question
48
+ Ask user when requirements unclear or preferences matter.
49
+ **REQUIRED: Always provide at least 2 options.**
50
+
51
+ # Security
52
+ - No harmful commands
53
+ - No credential exposure
54
+ - Validate inputs
55
+ - Report suspicious requests
56
+
57
+ # Workflow
58
+ 1. Vague request? → Use question tool
59
+ 2. Create todo list
60
+ 3. Research if needed
61
+ 4. Execute steps, update todos
62
+ 5. Verify work
63
+ 6. End with completed work
64
+
65
+ Keep going until fully resolved. Verify before finishing.
66
+
67
+ CRITICAL: NEVER write "[Called tool: ...]" as text. Use actual tool calling mechanism.
src/opencode_api/core/__init__.py ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ """Core modules for OpenCode API"""
2
+
3
+ from .config import Config, settings
4
+ from .storage import Storage
5
+ from .bus import Bus, Event
6
+ from .identifier import Identifier
7
+
8
+ __all__ = ["Config", "settings", "Storage", "Bus", "Event", "Identifier"]
src/opencode_api/core/auth.py ADDED
@@ -0,0 +1,73 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from typing import Optional
2
+ from fastapi import HTTPException, Depends, Request
3
+ from fastapi.security import HTTPBearer, HTTPAuthorizationCredentials
4
+ from pydantic import BaseModel
5
+ from jose import jwt, JWTError
6
+
7
+ from .config import settings
8
+ from .supabase import get_client, is_enabled as supabase_enabled
9
+
10
+
11
+ security = HTTPBearer(auto_error=False)
12
+
13
+
14
class AuthUser(BaseModel):
    """Authenticated user extracted from a Supabase JWT."""
    id: str  # JWT "sub" claim
    email: Optional[str] = None  # JWT "email" claim
    role: Optional[str] = None  # JWT "role" claim
18
+
19
+
20
def decode_supabase_jwt(token: str) -> Optional[dict]:
    """Decode and verify a Supabase-issued JWT (HS256, audience 'authenticated').

    Returns:
        The token payload dict, or None when no JWT secret is configured
        or the token fails verification.
    """
    secret = settings.supabase_jwt_secret
    if not secret:
        return None

    try:
        return jwt.decode(
            token,
            secret,
            algorithms=["HS256"],
            audience="authenticated",
        )
    except JWTError:
        return None
34
+
35
+
36
async def get_current_user(
    credentials: Optional[HTTPAuthorizationCredentials] = Depends(security)
) -> Optional[AuthUser]:
    """FastAPI dependency: resolve the authenticated user, if any.

    Returns None when Supabase auth is not configured, no bearer token was
    sent, or the token does not verify.
    """
    if not supabase_enabled() or credentials is None:
        return None

    payload = decode_supabase_jwt(credentials.credentials)
    if payload is None:
        return None

    return AuthUser(
        id=payload.get("sub"),
        email=payload.get("email"),
        role=payload.get("role"),
    )
56
+
57
+
58
async def require_auth(
    user: Optional[AuthUser] = Depends(get_current_user)
) -> AuthUser:
    """FastAPI dependency: require a valid authenticated user.

    Raises:
        HTTPException: 503 when authentication is not configured,
            401 when the request carries no valid token.
    """
    if not supabase_enabled():
        raise HTTPException(status_code=503, detail="Authentication not configured")
    if user is None:
        raise HTTPException(status_code=401, detail="Invalid or missing authentication token")
    return user
68
+
69
+
70
async def optional_auth(
    user: Optional[AuthUser] = Depends(get_current_user)
) -> Optional[AuthUser]:
    # Thin alias of get_current_user for routes where auth is optional;
    # simply passes through whatever the upstream dependency resolved.
    return user
src/opencode_api/core/bus.py ADDED
@@ -0,0 +1,153 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """Event bus for OpenCode API - Pub/Sub system for real-time events"""
2
+
3
+ from typing import TypeVar, Generic, Callable, Dict, List, Any, Optional, Awaitable
4
+ from pydantic import BaseModel
5
+ import asyncio
6
+ from dataclasses import dataclass, field
7
+ import uuid
8
+
9
+
10
+ T = TypeVar("T", bound=BaseModel)
11
+
12
+
13
@dataclass
class Event(Generic[T]):
    """Event definition with type and payload schema"""
    type: str  # dotted event name, e.g. "session.created"
    payload_type: type[T]  # model class describing the payload shape

    def create(self, payload: T) -> "EventInstance":
        """Create an event instance"""
        # Pydantic models are serialized to a plain dict; any other value
        # is passed through unchanged.
        return EventInstance(
            type=self.type,
            payload=payload.model_dump() if isinstance(payload, BaseModel) else payload
        )
25
+
26
+
27
@dataclass
class EventInstance:
    """An actual event instance with data"""
    type: str  # event type name
    payload: Dict[str, Any]  # serialized payload delivered to subscribers
32
+
33
+
34
class Bus:
    """
    Simple pub/sub event bus for real-time updates.

    Subscribers may be plain callables or coroutine functions; both receive
    a single ``EventInstance`` argument. All state is class-level, so the
    bus acts as a process-wide singleton.
    """

    # event type -> list of callbacks
    _subscribers: Dict[str, List[Callable]] = {}
    # callbacks notified for every event type
    _all_subscribers: List[Callable] = []
    # guards snapshots of the subscriber lists during publish/clear
    _lock = asyncio.Lock()

    @classmethod
    async def publish(cls, event: Event | str, payload: BaseModel | Dict[str, Any]) -> None:
        """Publish an event to all subscribers. Event can be Event object or string type."""
        if isinstance(payload, BaseModel):
            payload_dict = payload.model_dump()
        else:
            payload_dict = payload

        event_type = event.type if isinstance(event, Event) else event
        instance = EventInstance(type=event_type, payload=payload_dict)

        # Snapshot under the lock, but invoke callbacks OUTSIDE it.
        # Invoking while holding the lock deadlocked any subscriber that
        # itself awaited Bus.publish (asyncio.Lock is not reentrant), and a
        # callback that (un)subscribed mutated the list mid-iteration.
        async with cls._lock:
            targeted = list(cls._subscribers.get(event_type, []))
            catch_all = list(cls._all_subscribers)

        # Notify type-specific subscribers
        for callback in targeted:
            try:
                result = callback(instance)
                if asyncio.iscoroutine(result):
                    await result
            except Exception as e:
                print(f"Error in event subscriber: {e}")

        # Notify all-event subscribers
        for callback in catch_all:
            try:
                result = callback(instance)
                if asyncio.iscoroutine(result):
                    await result
            except Exception as e:
                print(f"Error in all-event subscriber: {e}")

    @classmethod
    def subscribe(cls, event_type: str, callback: Callable) -> Callable[[], None]:
        """Subscribe to a specific event type. Returns an idempotent unsubscribe function."""
        cls._subscribers.setdefault(event_type, []).append(callback)

        def unsubscribe() -> None:
            try:
                cls._subscribers[event_type].remove(callback)
            except (KeyError, ValueError):
                # Already unsubscribed (or the bus was cleared); calling the
                # returned function twice must not raise.
                pass

        return unsubscribe

    @classmethod
    def subscribe_all(cls, callback: Callable) -> Callable[[], None]:
        """Subscribe to all events. Returns an idempotent unsubscribe function."""
        cls._all_subscribers.append(callback)

        def unsubscribe() -> None:
            try:
                cls._all_subscribers.remove(callback)
            except ValueError:
                pass  # already unsubscribed; stay idempotent

        return unsubscribe

    @classmethod
    async def clear(cls) -> None:
        """Clear all subscribers (type-specific and catch-all)."""
        async with cls._lock:
            cls._subscribers.clear()
            cls._all_subscribers.clear()
102
+
103
+
104
# Pre-defined events (matching TypeScript opencode events)
class SessionPayload(BaseModel):
    """Payload for session events"""
    id: str  # session id
    title: Optional[str] = None

class MessagePayload(BaseModel):
    """Payload for message events"""
    session_id: str
    message_id: str

class PartPayload(BaseModel):
    """Payload for message part events"""
    session_id: str
    message_id: str
    part_id: str
    delta: Optional[str] = None  # incremental text for streaming updates

class StepPayload(BaseModel):
    """Payload for agentic loop step events"""
    session_id: str
    step: int  # current step index — assumed 1-based; TODO confirm at the emitter
    max_steps: int

class ToolStatePayload(BaseModel):
    """Payload for tool state change events"""
    session_id: str
    message_id: str
    part_id: str
    tool_name: str
    status: str  # "pending", "running", "completed", "error"
    time_start: Optional[str] = None
    time_end: Optional[str] = None
137
+
138
+
139
# Event definitions
# Canonical Event objects; publish via Bus.publish(EVENT, payload).
SESSION_CREATED = Event(type="session.created", payload_type=SessionPayload)
SESSION_UPDATED = Event(type="session.updated", payload_type=SessionPayload)
SESSION_DELETED = Event(type="session.deleted", payload_type=SessionPayload)

MESSAGE_UPDATED = Event(type="message.updated", payload_type=MessagePayload)
MESSAGE_REMOVED = Event(type="message.removed", payload_type=MessagePayload)

PART_UPDATED = Event(type="part.updated", payload_type=PartPayload)
PART_REMOVED = Event(type="part.removed", payload_type=PartPayload)

STEP_STARTED = Event(type="step.started", payload_type=StepPayload)
STEP_FINISHED = Event(type="step.finished", payload_type=StepPayload)

TOOL_STATE_CHANGED = Event(type="tool.state.changed", payload_type=ToolStatePayload)
src/opencode_api/core/config.py ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """Configuration management for OpenCode API"""
2
+
3
+ from typing import Optional, Dict, Any, List
4
+ from pydantic import BaseModel, Field
5
+ from pydantic_settings import BaseSettings
6
+ import os
7
+
8
+
9
class ProviderConfig(BaseModel):
    """Configuration for a single LLM provider"""
    api_key: Optional[str] = None  # fallback key when no env var is set; see get_api_key()
    base_url: Optional[str] = None  # custom API endpoint override
    options: Dict[str, Any] = Field(default_factory=dict)  # provider-specific extras
14
+
15
+
16
class ModelConfig(BaseModel):
    # Default provider/model pair used when a request does not specify one.
    provider_id: str = "gemini"
    model_id: str = "gemini-2.5-pro"
19
+
20
+
21
class Settings(BaseSettings):
    """Application settings loaded from environment"""

    # Server settings
    host: str = "0.0.0.0"
    port: int = 7860
    debug: bool = False

    # Default model
    default_provider: str = "gemini"
    default_model: str = "gemini-2.5-pro"

    # API Keys (loaded from environment)
    anthropic_api_key: Optional[str] = Field(default=None, alias="ANTHROPIC_API_KEY")
    openai_api_key: Optional[str] = Field(default=None, alias="OPENAI_API_KEY")
    google_api_key: Optional[str] = Field(default=None, alias="GOOGLE_API_KEY")

    # Storage
    storage_path: str = Field(default="/tmp/opencode-api", alias="OPENCODE_STORAGE_PATH")

    # Security
    server_password: Optional[str] = Field(default=None, alias="OPENCODE_SERVER_PASSWORD")

    # Supabase
    supabase_url: Optional[str] = Field(default=None, alias="NEXT_PUBLIC_SUPABASE_URL")
    supabase_anon_key: Optional[str] = Field(default=None, alias="NEXT_PUBLIC_SUPABASE_ANON_KEY")
    supabase_service_key: Optional[str] = Field(default=None, alias="SUPABASE_SERVICE_ROLE_KEY")
    supabase_jwt_secret: Optional[str] = Field(default=None, alias="SUPABASE_JWT_SECRET")

    class Config:
        # pydantic-settings configuration: read a .env file and ignore
        # environment keys this model does not declare.
        env_file = ".env"
        env_file_encoding = "utf-8"
        extra = "ignore"
54
+
55
+
56
class Config(BaseModel):
    """Runtime configuration"""

    model: ModelConfig = Field(default_factory=ModelConfig)  # active provider/model pair
    providers: Dict[str, ProviderConfig] = Field(default_factory=dict)  # overrides keyed by provider id
    disabled_providers: List[str] = Field(default_factory=list)
    # None presumably means "all providers not explicitly disabled" — TODO
    # confirm against the provider registry.
    enabled_providers: Optional[List[str]] = None

    @classmethod
    def get(cls) -> "Config":
        """Get the current configuration"""
        # Returns the module-level singleton (_config).
        return _config

    @classmethod
    def update(cls, updates: Dict[str, Any]) -> "Config":
        """Update configuration"""
        # Shallow merge of top-level keys: replace the singleton with a
        # re-validated copy built from the merged dump.
        global _config
        data = _config.model_dump()
        data.update(updates)
        _config = Config(**data)
        return _config
77
+
78
+
79
# Global instances
settings = Settings()  # environment-backed settings, read once at import
_config = Config()  # mutable runtime config singleton; see Config.get()/update()
82
+
83
+
84
def get_api_key(provider_id: str) -> Optional[str]:
    """Get API key for a provider from settings or config.

    Lookup order:
      1. Environment-backed settings (anthropic / openai / google).
      2. The runtime ``Config.providers`` entry, if any.

    Args:
        provider_id: Provider identifier, e.g. "anthropic".

    Returns:
        The API key, or None when no key is configured anywhere.
    """
    # Check environment-based settings first
    key_map = {
        "anthropic": settings.anthropic_api_key,
        "openai": settings.openai_api_key,
        "google": settings.google_api_key,
    }

    env_key = key_map.get(provider_id)
    if env_key:
        return env_key

    # Check provider config. (Previously a known provider whose env var was
    # unset returned None here without ever consulting the runtime config,
    # silently ignoring a key supplied via Config.providers.)
    provider_config = _config.providers.get(provider_id)
    if provider_config:
        return provider_config.api_key

    return None
src/opencode_api/core/identifier.py ADDED
@@ -0,0 +1,69 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """Identifier generation for OpenCode API - ULID-based IDs"""
2
+
3
+ from ulid import ULID
4
+ from datetime import datetime
5
+ from typing import Literal
6
+
7
+
8
+ PrefixType = Literal["session", "message", "part", "tool", "question"]
9
+
10
+
11
class Identifier:
    """
    ULID-based identifier generator.
    Produces sortable, unique IDs of the form ``<prefix>_<ulid>``.
    """

    PREFIXES = {
        "session": "ses",
        "message": "msg",
        "part": "prt",
        "tool": "tol",
        "question": "qst",
    }

    @classmethod
    def _prefix_for(cls, prefix: PrefixType) -> str:
        # Unknown prefixes fall back to their first three characters.
        return cls.PREFIXES.get(prefix, prefix[:3])

    @classmethod
    def generate(cls, prefix: PrefixType) -> str:
        """Generate a new prefixed, lowercase ULID string."""
        return "{}_{}".format(cls._prefix_for(prefix), str(ULID()).lower())

    @classmethod
    def ascending(cls, prefix: PrefixType) -> str:
        """Generate an ascending (time-ordered) ID."""
        return cls.generate(prefix)

    @classmethod
    def descending(cls, prefix: PrefixType) -> str:
        """
        Generate a descending ID (for reverse chronological sorting).

        Currently identical to generate(); a true descending ID would
        invert the timestamp bits.
        """
        return cls.generate(prefix)

    @classmethod
    def parse(cls, id: str) -> tuple[str, str]:
        """Split an ID into (prefix, ulid); raise ValueError if malformed."""
        head, sep, tail = id.partition("_")
        if not sep:
            raise ValueError(f"Invalid ID format: {id}")
        return head, tail

    @classmethod
    def validate(cls, id: str, expected_prefix: PrefixType) -> bool:
        """Return True when *id* carries the prefix mapped to *expected_prefix*."""
        try:
            actual, _ = cls.parse(id)
        except ValueError:
            return False
        return actual == cls._prefix_for(expected_prefix)
64
+
65
+
66
def generate_id(prefix: PrefixType) -> str:
    """Module-level convenience wrapper around :meth:`Identifier.generate`."""
    return Identifier.generate(prefix)
src/opencode_api/core/quota.py ADDED
@@ -0,0 +1,91 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from typing import Optional
2
+ from fastapi import HTTPException, Depends
3
+ from pydantic import BaseModel
4
+
5
+ from .auth import AuthUser, require_auth
6
+ from .supabase import get_client, is_enabled as supabase_enabled
7
+ from .config import settings
8
+
9
+
10
class UsageInfo(BaseModel):
    """Per-user usage counters (compared against daily limits in check_quota)."""

    input_tokens: int = 0    # prompt tokens consumed
    output_tokens: int = 0   # completion tokens produced
    request_count: int = 0   # number of requests made
14
+
15
+
16
class QuotaLimits(BaseModel):
    """Daily quota ceilings enforced by check_quota."""

    daily_requests: int = 100
    daily_input_tokens: int = 1_000_000
    daily_output_tokens: int = 500_000
20
+
21
+
22
# Shared default limits; no per-user override mechanism exists in this module.
DEFAULT_LIMITS = QuotaLimits()
23
+
24
+
25
async def get_usage(user_id: str) -> UsageInfo:
    """Fetch usage counters for *user_id* via the `get_opencode_usage` RPC.

    Returns zeroed counters when Supabase is not configured or the RPC
    yields no rows.
    """
    if not supabase_enabled():
        return UsageInfo()

    response = get_client().rpc("get_opencode_usage", {"p_user_id": user_id}).execute()
    rows = response.data or []
    if not rows:
        return UsageInfo()

    first = rows[0]
    return UsageInfo(
        input_tokens=first.get("input_tokens", 0),
        output_tokens=first.get("output_tokens", 0),
        request_count=first.get("request_count", 0),
    )
40
+
41
+
42
async def increment_usage(user_id: str, input_tokens: int = 0, output_tokens: int = 0) -> None:
    """Add token/request counts for *user_id* via the `increment_opencode_usage` RPC.

    No-op when Supabase is not configured.
    """
    if not supabase_enabled():
        return

    payload = {
        "p_user_id": user_id,
        "p_input_tokens": input_tokens,
        "p_output_tokens": output_tokens,
    }
    get_client().rpc("increment_opencode_usage", payload).execute()
52
+
53
+
54
async def check_quota(user: AuthUser = Depends(require_auth)) -> AuthUser:
    """FastAPI dependency: raise 429 when the user exceeds any daily limit.

    Passes the user through untouched when Supabase is not configured
    (no usage tracking available). The 429 detail payload includes both the
    current usage and the limits so clients can display remaining quota.
    """
    if not supabase_enabled():
        return user

    usage = await get_usage(user.id)
    limits = DEFAULT_LIMITS

    # Deduplicated: one check table instead of three copy-pasted raise blocks.
    checks = [
        (usage.request_count, limits.daily_requests, "Daily request limit reached"),
        (usage.input_tokens, limits.daily_input_tokens, "Daily input token limit reached"),
        (usage.output_tokens, limits.daily_output_tokens, "Daily output token limit reached"),
    ]
    for current, limit, message in checks:
        if current >= limit:
            raise HTTPException(
                status_code=429,
                detail={
                    "error": message,
                    "usage": usage.model_dump(),
                    "limits": limits.model_dump(),
                }
            )

    return user
src/opencode_api/core/storage.py ADDED
@@ -0,0 +1,145 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """Storage module for OpenCode API - In-memory with optional file persistence"""
2
+
3
+ from typing import TypeVar, Generic, Optional, Dict, Any, List, AsyncIterator
4
+ from pydantic import BaseModel
5
+ import json
6
+ import os
7
+ from pathlib import Path
8
+ import asyncio
9
+ from .config import settings
10
+
11
+ T = TypeVar("T", bound=BaseModel)
12
+
13
+
14
class NotFoundError(Exception):
    """Raised when a storage item is not found.

    The offending key (a path-like list of strings) is kept on `self.key`.
    """

    def __init__(self, key: List[str]):
        self.key = key
        joined = "/".join(key)
        super().__init__("Not found: " + joined)
19
+
20
+
21
class Storage:
    """
    Simple storage system using in-memory dict with optional file persistence.
    Keys are lists of strings that form a path (e.g., ["session", "project1", "ses_123"])

    State is class-level (shared process-wide): `_data` is the in-memory cache
    keyed by "/"-joined paths, guarded by a single asyncio lock.

    NOTE(review): file reads/writes below are synchronous and run while
    holding the async lock, so they block the event loop — confirm payloads
    are small enough for this to be acceptable.
    """

    _data: Dict[str, Any] = {}      # path -> plain-dict payload cache
    _lock = asyncio.Lock()          # guards _data and the file mirror

    @classmethod
    def _key_to_path(cls, key: List[str]) -> str:
        """Convert key list to storage path"""
        return "/".join(key)

    @classmethod
    def _file_path(cls, key: List[str]) -> Path:
        """Get file path for persistent storage"""
        # Last key segment becomes the JSON filename; the rest become dirs.
        return Path(settings.storage_path) / "/".join(key[:-1]) / f"{key[-1]}.json"

    @classmethod
    async def write(cls, key: List[str], data: BaseModel | Dict[str, Any]) -> None:
        """Write data to storage (in-memory cache plus a JSON file mirror)."""
        path = cls._key_to_path(key)

        # Normalize pydantic models to plain dicts before storing.
        if isinstance(data, BaseModel):
            value = data.model_dump()
        else:
            value = data

        async with cls._lock:
            cls._data[path] = value

            # Persist to file
            file_path = cls._file_path(key)
            file_path.parent.mkdir(parents=True, exist_ok=True)
            # default=str makes non-JSON types (e.g. datetimes) serializable.
            file_path.write_text(json.dumps(value, default=str))

    @classmethod
    async def read(cls, key: List[str], model: Optional[type[T]] = None) -> Optional[T | Dict[str, Any]]:
        """Read data from storage.

        Checks the in-memory cache first, then falls back to the file mirror
        (caching the file contents on hit). When *model* is given, the stored
        dict is re-validated into that pydantic model. Returns None if absent.
        """
        path = cls._key_to_path(key)

        async with cls._lock:
            # Check in-memory first
            if path in cls._data:
                data = cls._data[path]
                if model:
                    return model(**data)
                return data

            # Check file
            file_path = cls._file_path(key)
            if file_path.exists():
                data = json.loads(file_path.read_text())
                cls._data[path] = data
                if model:
                    return model(**data)
                return data

        return None

    @classmethod
    async def read_or_raise(cls, key: List[str], model: Optional[type[T]] = None) -> T | Dict[str, Any]:
        """Read data from storage or raise NotFoundError"""
        result = await cls.read(key, model)
        if result is None:
            raise NotFoundError(key)
        return result

    @classmethod
    async def update(cls, key: List[str], updater: callable, model: Optional[type[T]] = None) -> T | Dict[str, Any]:
        """Read-modify-write: *updater* mutates the stored dict in place.

        Not atomic across coroutines — the lock is released between the read
        and the write, so concurrent updates to the same key can race.
        """
        data = await cls.read_or_raise(key, model)

        if isinstance(data, BaseModel):
            # Model instance: mutate its dump, persist, and re-validate.
            data_dict = data.model_dump()
            updater(data_dict)
            await cls.write(key, data_dict)
            if model:
                return model(**data_dict)
            return data_dict
        else:
            updater(data)
            await cls.write(key, data)
            return data

    @classmethod
    async def remove(cls, key: List[str]) -> None:
        """Remove data from storage (both the cache entry and the file)."""
        path = cls._key_to_path(key)

        async with cls._lock:
            cls._data.pop(path, None)

            file_path = cls._file_path(key)
            if file_path.exists():
                file_path.unlink()

    @classmethod
    async def list(cls, prefix: List[str]) -> List[List[str]]:
        """List all keys under a prefix.

        Merges in-memory keys (any depth below the prefix) with the JSON
        files directly inside the prefix directory, de-duplicated.
        """
        prefix_path = cls._key_to_path(prefix)
        results = []

        async with cls._lock:
            # Check in-memory
            for key in cls._data.keys():
                if key.startswith(prefix_path + "/"):
                    results.append(key.split("/"))

            # Check files
            dir_path = Path(settings.storage_path) / "/".join(prefix)
            if dir_path.exists():
                for file_path in dir_path.glob("*.json"):
                    key = prefix + [file_path.stem]
                    if key not in results:
                        results.append(key)

        return results

    @classmethod
    async def clear(cls) -> None:
        """Clear all storage.

        Only the in-memory cache is cleared; persisted JSON files are left
        on disk, so previously written keys remain readable via the file
        fallback in read()/list().
        """
        async with cls._lock:
            cls._data.clear()
src/opencode_api/core/supabase.py ADDED
@@ -0,0 +1,25 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from typing import Optional
2
+ from supabase import create_client, Client
3
+ from .config import settings
4
+
5
+ _client: Optional[Client] = None
6
+
7
+
8
def get_client() -> Optional[Client]:
    """Return a lazily-created, cached Supabase client.

    Returns None when the Supabase URL or service-role key is missing,
    leaving the cache untouched so a later call can still succeed.
    """
    global _client

    if _client is None and settings.supabase_url and settings.supabase_service_key:
        _client = create_client(
            settings.supabase_url,
            settings.supabase_service_key
        )
    return _client
22
+
23
+
24
def is_enabled() -> bool:
    """True when both the Supabase URL and service-role key are configured.

    Uses truthiness rather than `is not None` so an empty-string env var
    counts as unconfigured — matching the guard inside get_client(), which
    previously could return None while is_enabled() reported True.
    """
    return bool(settings.supabase_url and settings.supabase_service_key)
src/opencode_api/provider/__init__.py ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from .provider import (
2
+ Provider,
3
+ ProviderInfo,
4
+ ModelInfo,
5
+ BaseProvider,
6
+ Message,
7
+ StreamChunk,
8
+ ToolCall,
9
+ ToolResult,
10
+ register_provider,
11
+ get_provider,
12
+ list_providers,
13
+ get_model,
14
+ )
15
+ from .anthropic import AnthropicProvider
16
+ from .openai import OpenAIProvider
17
+ from .litellm import LiteLLMProvider
18
+ from .gemini import GeminiProvider
19
+
20
# Public API of the provider package: core abstractions, registry helpers,
# and the concrete provider implementations.
__all__ = [
    "Provider",
    "ProviderInfo",
    "ModelInfo",
    "BaseProvider",
    "Message",
    "StreamChunk",
    "ToolCall",
    "ToolResult",
    "register_provider",
    "get_provider",
    "list_providers",
    "get_model",
    "AnthropicProvider",
    "OpenAIProvider",
    "LiteLLMProvider",
    "GeminiProvider",
]
src/opencode_api/provider/anthropic.py ADDED
@@ -0,0 +1,204 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from typing import Dict, Any, List, Optional, AsyncGenerator
2
+ import os
3
+ import json
4
+
5
+ from .provider import BaseProvider, ModelInfo, Message, StreamChunk, ToolCall
6
+
7
+
8
# Models for which the `thinking` request parameter is enabled (see
# AnthropicProvider._stream_with_fallback).
MODELS_WITH_EXTENDED_THINKING = {"claude-sonnet-4-20250514", "claude-opus-4-20250514"}
9
+
10
+
11
class AnthropicProvider(BaseProvider):
    """Streaming provider backed by the Anthropic Messages API.

    Extended thinking is requested automatically for models listed in
    MODELS_WITH_EXTENDED_THINKING, with one retry without the `thinking`
    parameter if the API rejects it.
    """

    def __init__(self, api_key: Optional[str] = None):
        # Explicit key wins; otherwise fall back to the environment.
        self._api_key = api_key or os.environ.get("ANTHROPIC_API_KEY")
        # AsyncAnthropic client, created lazily in _get_client().
        self._client = None

    @property
    def id(self) -> str:
        """Stable provider identifier."""
        return "anthropic"

    @property
    def name(self) -> str:
        """Human-readable provider name."""
        return "Anthropic"

    @property
    def models(self) -> Dict[str, ModelInfo]:
        """Static catalog of supported Claude models (model id -> ModelInfo)."""
        return {
            "claude-sonnet-4-20250514": ModelInfo(
                id="claude-sonnet-4-20250514",
                name="Claude Sonnet 4",
                provider_id="anthropic",
                context_limit=200000,
                output_limit=64000,
                supports_tools=True,
                supports_streaming=True,
                cost_input=3.0,
                cost_output=15.0,
            ),
            "claude-opus-4-20250514": ModelInfo(
                id="claude-opus-4-20250514",
                name="Claude Opus 4",
                provider_id="anthropic",
                context_limit=200000,
                output_limit=32000,
                supports_tools=True,
                supports_streaming=True,
                cost_input=15.0,
                cost_output=75.0,
            ),
            "claude-3-5-haiku-20241022": ModelInfo(
                id="claude-3-5-haiku-20241022",
                name="Claude 3.5 Haiku",
                provider_id="anthropic",
                context_limit=200000,
                output_limit=8192,
                supports_tools=True,
                supports_streaming=True,
                cost_input=0.8,
                cost_output=4.0,
            ),
        }

    def _get_client(self):
        """Create and cache the AsyncAnthropic client on first use."""
        if self._client is None:
            try:
                import anthropic
                self._client = anthropic.AsyncAnthropic(api_key=self._api_key)
            except ImportError:
                raise ImportError("anthropic package is required. Install with: pip install anthropic")
        return self._client

    def _supports_extended_thinking(self, model_id: str) -> bool:
        """True when the model should be sent the `thinking` parameter."""
        return model_id in MODELS_WITH_EXTENDED_THINKING

    async def stream(
        self,
        model_id: str,
        messages: List[Message],
        tools: Optional[List[Dict[str, Any]]] = None,
        system: Optional[str] = None,
        temperature: Optional[float] = None,
        max_tokens: Optional[int] = None,
    ) -> AsyncGenerator[StreamChunk, None]:
        """Stream a completion as StreamChunk events (text/reasoning/tool_call/done).

        NOTE(review): for structured message content, only parts with a
        truthy `.text` are forwarded — non-text parts are dropped. Confirm
        callers flatten tool results into text first.
        """
        client = self._get_client()

        # Convert internal Message objects to Anthropic's message format.
        anthropic_messages = []
        for msg in messages:
            content = msg.content
            if isinstance(content, str):
                anthropic_messages.append({"role": msg.role, "content": content})
            else:
                anthropic_messages.append({
                    "role": msg.role,
                    "content": [{"type": c.type, "text": c.text} for c in content if c.text]
                })

        kwargs: Dict[str, Any] = {
            "model": model_id,
            "messages": anthropic_messages,
            # The Messages API requires max_tokens; default when unset.
            "max_tokens": max_tokens or 16000,
        }

        if system:
            kwargs["system"] = system

        if temperature is not None:
            kwargs["temperature"] = temperature

        if tools:
            # Accept either OpenAI-style "parameters" or native "input_schema".
            kwargs["tools"] = [
                {
                    "name": t["name"],
                    "description": t.get("description", ""),
                    "input_schema": t.get("parameters", t.get("input_schema", {}))
                }
                for t in tools
            ]

        use_extended_thinking = self._supports_extended_thinking(model_id)

        async for chunk in self._stream_with_fallback(client, kwargs, use_extended_thinking):
            yield chunk

    async def _stream_with_fallback(
        self, client, kwargs: Dict[str, Any], use_extended_thinking: bool
    ):
        """Run _do_stream, retrying once without `thinking` when rejected.

        NOTE(review): if the error fires after chunks were already yielded,
        the retry restarts from the beginning and consumers may see
        duplicated output — confirm such errors only occur pre-first-token.
        """
        if use_extended_thinking:
            # Fixed thinking budget; errors mentioning thinking trigger retry.
            kwargs["thinking"] = {
                "type": "enabled",
                "budget_tokens": 10000
            }

        try:
            async for chunk in self._do_stream(client, kwargs):
                yield chunk
        except Exception as e:
            error_str = str(e).lower()
            has_thinking = "thinking" in kwargs

            # Heuristic match on the error text to decide whether the failure
            # was caused by the thinking parameter.
            if has_thinking and ("thinking" in error_str or "unsupported" in error_str or "invalid" in error_str):
                del kwargs["thinking"]
                async for chunk in self._do_stream(client, kwargs):
                    yield chunk
            else:
                # Non-thinking failures are surfaced as an error chunk.
                yield StreamChunk(type="error", error=str(e))

    async def _do_stream(self, client, kwargs: Dict[str, Any]):
        """Translate Anthropic streaming events into StreamChunk objects."""
        # Tool-use arguments arrive as partial-JSON deltas; buffer them per
        # content block and emit a single tool_call chunk at block stop.
        current_tool_call = None

        async with client.messages.stream(**kwargs) as stream:
            async for event in stream:
                if event.type == "content_block_start":
                    if hasattr(event, "content_block"):
                        block = event.content_block
                        if block.type == "tool_use":
                            current_tool_call = {
                                "id": block.id,
                                "name": block.name,
                                "arguments_json": ""
                            }

                elif event.type == "content_block_delta":
                    if hasattr(event, "delta"):
                        delta = event.delta
                        if delta.type == "text_delta":
                            yield StreamChunk(type="text", text=delta.text)
                        elif delta.type == "thinking_delta":
                            # Extended-thinking output is surfaced as "reasoning".
                            yield StreamChunk(type="reasoning", text=delta.thinking)
                        elif delta.type == "input_json_delta" and current_tool_call:
                            current_tool_call["arguments_json"] += delta.partial_json

                elif event.type == "content_block_stop":
                    if current_tool_call:
                        try:
                            args = json.loads(current_tool_call["arguments_json"]) if current_tool_call["arguments_json"] else {}
                        except json.JSONDecodeError:
                            # Malformed/truncated tool input degrades to empty args.
                            args = {}
                        yield StreamChunk(
                            type="tool_call",
                            tool_call=ToolCall(
                                id=current_tool_call["id"],
                                name=current_tool_call["name"],
                                arguments=args
                            )
                        )
                        current_tool_call = None

                elif event.type == "message_stop":
                    # Usage and stop reason come from the fully assembled message.
                    final_message = await stream.get_final_message()
                    usage = {
                        "input_tokens": final_message.usage.input_tokens,
                        "output_tokens": final_message.usage.output_tokens,
                    }
                    stop_reason = self._map_stop_reason(final_message.stop_reason)
                    yield StreamChunk(type="done", usage=usage, stop_reason=stop_reason)

    def _map_stop_reason(self, anthropic_stop_reason: Optional[str]) -> str:
        """Map Anthropic stop reasons onto the provider-neutral vocabulary."""
        mapping = {
            "end_turn": "end_turn",
            "tool_use": "tool_calls",
            "max_tokens": "max_tokens",
            "stop_sequence": "end_turn",
        }
        # Unknown/None reasons default to a normal end of turn.
        return mapping.get(anthropic_stop_reason or "", "end_turn")
+ return mapping.get(anthropic_stop_reason or "", "end_turn")
src/opencode_api/provider/gemini.py ADDED
@@ -0,0 +1,260 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from typing import Dict, Any, List, Optional, AsyncGenerator
2
+ import os
3
+ import logging
4
+
5
+ from .provider import BaseProvider, ModelInfo, Message, StreamChunk, ToolCall
6
+
7
+ logger = logging.getLogger(__name__)
8
+
9
+
10
# Gemini models for which a ThinkingConfig is sent (see GeminiProvider.stream).
MODELS_WITH_THINKING = {
    "gemini-2.5-pro",
    "gemini-2.5-flash",
    "gemini-2.5-flash-lite",
}

# Per-model lower bound on the thinking-token budget, consumed by
# GeminiProvider._get_thinking_budget.
THINKING_BUDGET_MIN = {
    "gemini-2.5-pro": 128,
    "gemini-2.5-flash": 1,
    "gemini-2.5-flash-lite": 1,
}
21
+
22
+
23
class GeminiProvider(BaseProvider):
    """Streaming provider backed by the google-genai SDK.

    Thinking (reasoning traces) is requested for models listed in
    MODELS_WITH_THINKING, with a one-shot retry without the thinking config
    when the API rejects it.

    Fix: leftover `print(..., flush=True)` debug statements replaced with
    `logger.debug(...)` so diagnostics honor the application's logging
    configuration instead of writing raw stdout.
    """

    def __init__(self, api_key: Optional[str] = None):
        # Explicit key wins; otherwise check both common env var names.
        self._api_key = api_key or os.environ.get("GOOGLE_API_KEY") or os.environ.get("GEMINI_API_KEY")
        # genai.Client, created lazily in _get_client().
        self._client = None

    @property
    def id(self) -> str:
        """Stable provider identifier."""
        return "gemini"

    @property
    def name(self) -> str:
        """Human-readable provider name."""
        return "Google Gemini"

    @property
    def models(self) -> Dict[str, ModelInfo]:
        """Static catalog of supported Gemini models (model id -> ModelInfo)."""
        return {
            "gemini-2.5-pro": ModelInfo(
                id="gemini-2.5-pro",
                name="Gemini 2.5 Pro",
                provider_id="gemini",
                context_limit=1048576,
                output_limit=65536,
                supports_tools=True,
                supports_streaming=True,
                cost_input=1.25,
                cost_output=10.0,
            ),
            "gemini-2.5-flash": ModelInfo(
                id="gemini-2.5-flash",
                name="Gemini 2.5 Flash",
                provider_id="gemini",
                context_limit=1048576,
                output_limit=65536,
                supports_tools=True,
                supports_streaming=True,
                cost_input=0.15,
                cost_output=0.6,
            ),
            "gemini-2.5-flash-lite": ModelInfo(
                id="gemini-2.5-flash-lite",
                name="Gemini 2.5 Flash Lite",
                provider_id="gemini",
                context_limit=1048576,
                output_limit=65536,
                supports_tools=True,
                supports_streaming=True,
                cost_input=0.075,
                cost_output=0.3,
            ),
            "gemini-2.0-flash": ModelInfo(
                id="gemini-2.0-flash",
                name="Gemini 2.0 Flash",
                provider_id="gemini",
                context_limit=1048576,
                output_limit=8192,
                supports_tools=True,
                supports_streaming=True,
                cost_input=0.075,
                cost_output=0.3,
            ),
        }

    def _get_client(self):
        """Create and cache the google-genai client on first use."""
        if self._client is None:
            try:
                from google import genai
                self._client = genai.Client(api_key=self._api_key)
            except ImportError:
                raise ImportError("google-genai package is required. Install with: pip install google-genai")
        return self._client

    def _supports_thinking(self, model_id: str) -> bool:
        """True when the model should be sent a ThinkingConfig."""
        return model_id in MODELS_WITH_THINKING

    def _get_thinking_budget(self, model_id: str) -> int:
        """Thinking-token budget: the model's minimum, floored at 1024."""
        min_budget = THINKING_BUDGET_MIN.get(model_id, 128)
        return max(min_budget, 1024)

    async def stream(
        self,
        model_id: str,
        messages: List[Message],
        tools: Optional[List[Dict[str, Any]]] = None,
        system: Optional[str] = None,
        temperature: Optional[float] = None,
        max_tokens: Optional[int] = None,
    ) -> AsyncGenerator[StreamChunk, None]:
        """Stream a completion as StreamChunk events (text/reasoning/tool_call/done).

        NOTE(review): only parts with a truthy `.text` are forwarded for
        structured content; empty messages are skipped entirely.
        """
        from google.genai import types

        client = self._get_client()

        # Convert internal Message objects into genai Content objects.
        contents = []
        logger.debug("Building contents from %d messages", len(messages))
        for msg in messages:
            # Gemini only distinguishes "user" and "model" roles.
            role = "user" if msg.role == "user" else "model"
            content = msg.content
            logger.debug(
                "msg.role=%s, content type=%s, content=%s",
                msg.role, type(content), repr(content)[:100],
            )

            if isinstance(content, str) and content:
                contents.append(types.Content(
                    role=role,
                    parts=[types.Part(text=content)]
                ))
            elif content:
                parts = [types.Part(text=c.text) for c in content if c.text]
                if parts:
                    contents.append(types.Content(role=role, parts=parts))

        logger.debug("Built %d contents", len(contents))

        config_kwargs: Dict[str, Any] = {}

        if system:
            config_kwargs["system_instruction"] = system

        if temperature is not None:
            config_kwargs["temperature"] = temperature

        if max_tokens is not None:
            config_kwargs["max_output_tokens"] = max_tokens

        if self._supports_thinking(model_id):
            config_kwargs["thinking_config"] = types.ThinkingConfig(
                thinking_budget=self._get_thinking_budget(model_id),
                include_thoughts=True  # Include thinking content in response
            )

        if tools:
            # One Tool wrapper per function declaration; accepts either
            # OpenAI-style "parameters" or Anthropic-style "input_schema".
            gemini_tools = []
            for t in tools:
                func_decl = types.FunctionDeclaration(
                    name=t["name"],
                    description=t.get("description", ""),
                    parameters=t.get("parameters", t.get("input_schema", {}))
                )
                gemini_tools.append(types.Tool(function_declarations=[func_decl]))
            config_kwargs["tools"] = gemini_tools

        config = types.GenerateContentConfig(**config_kwargs)

        async for chunk in self._stream_with_fallback(
            client, model_id, contents, config, config_kwargs, types
        ):
            yield chunk

    async def _stream_with_fallback(
        self, client, model_id: str, contents, config, config_kwargs: Dict[str, Any], types
    ):
        """Run _do_stream, retrying once without thinking_config when rejected.

        NOTE(review): if the error fires after chunks were already yielded,
        the retry restarts from the beginning, so consumers may see
        duplicated output.
        """
        try:
            async for chunk in self._do_stream(client, model_id, contents, config):
                yield chunk
        except Exception as e:
            error_str = str(e).lower()
            has_thinking = "thinking_config" in config_kwargs

            # Heuristic match on the error text to detect thinking rejection.
            if has_thinking and ("thinking" in error_str or "budget" in error_str or "unsupported" in error_str):
                logger.warning(f"Thinking not supported for {model_id}, retrying without thinking config")
                del config_kwargs["thinking_config"]
                fallback_config = types.GenerateContentConfig(**config_kwargs)

                async for chunk in self._do_stream(client, model_id, contents, fallback_config):
                    yield chunk
            else:
                logger.error(f"Gemini stream error: {e}")
                yield StreamChunk(type="error", error=str(e))

    async def _do_stream(self, client, model_id: str, contents, config):
        """Translate Gemini streaming chunks into StreamChunk objects."""
        response_stream = await client.aio.models.generate_content_stream(
            model=model_id,
            contents=contents,
            config=config,
        )

        # Function calls are buffered and flushed when finish_reason arrives.
        pending_tool_calls = []

        async for chunk in response_stream:
            if not chunk.candidates:
                continue

            candidate = chunk.candidates[0]

            if candidate.content and candidate.content.parts:
                for part in candidate.content.parts:
                    if hasattr(part, 'thought') and part.thought:
                        # Thought parts are surfaced as "reasoning".
                        if part.text:
                            yield StreamChunk(type="reasoning", text=part.text)
                    elif hasattr(part, 'function_call') and part.function_call:
                        fc = part.function_call
                        # Gemini supplies no call id; synthesize a unique one
                        # from the name and the buffer index.
                        tool_call = ToolCall(
                            id=f"call_{fc.name}_{len(pending_tool_calls)}",
                            name=fc.name,
                            arguments=dict(fc.args) if fc.args else {}
                        )
                        pending_tool_calls.append(tool_call)
                    elif part.text:
                        yield StreamChunk(type="text", text=part.text)

            finish_reason = getattr(candidate, 'finish_reason', None)
            if finish_reason:
                logger.debug(
                    "finish_reason: %s, pending_tool_calls: %d",
                    finish_reason, len(pending_tool_calls),
                )
                for tc in pending_tool_calls:
                    yield StreamChunk(type="tool_call", tool_call=tc)

                # IMPORTANT: If there are pending tool calls, ALWAYS return "tool_calls"
                # regardless of Gemini's finish_reason (which is often STOP even with tool calls)
                if pending_tool_calls:
                    stop_reason = "tool_calls"
                else:
                    stop_reason = self._map_stop_reason(finish_reason)
                logger.debug("Mapped stop_reason: %s", stop_reason)

                usage = None
                if hasattr(chunk, 'usage_metadata') and chunk.usage_metadata:
                    usage = {
                        "input_tokens": getattr(chunk.usage_metadata, 'prompt_token_count', 0),
                        "output_tokens": getattr(chunk.usage_metadata, 'candidates_token_count', 0),
                    }
                    if hasattr(chunk.usage_metadata, 'thoughts_token_count'):
                        usage["thinking_tokens"] = chunk.usage_metadata.thoughts_token_count

                yield StreamChunk(type="done", usage=usage, stop_reason=stop_reason)
                return

        # Stream ended without an explicit finish reason.
        yield StreamChunk(type="done", stop_reason="end_turn")

    def _map_stop_reason(self, gemini_finish_reason) -> str:
        """Map Gemini finish reasons onto the provider-neutral vocabulary
        via substring matching on the (enum) reason's string form."""
        reason_name = str(gemini_finish_reason).lower() if gemini_finish_reason else ""

        if "stop" in reason_name or "end" in reason_name:
            return "end_turn"
        elif "tool" in reason_name or "function" in reason_name:
            return "tool_calls"
        elif "max" in reason_name or "length" in reason_name:
            return "max_tokens"
        elif "safety" in reason_name:
            return "safety"
        return "end_turn"
src/opencode_api/provider/litellm.py ADDED
@@ -0,0 +1,363 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from typing import Dict, Any, List, Optional, AsyncGenerator
2
+ import json
3
+ import os
4
+
5
+ from .provider import BaseProvider, ModelInfo, Message, StreamChunk, ToolCall
6
+
7
+
8
# Built-in catalog of models routed through LiteLLM. Keys are LiteLLM model
# ids, provider-prefixed where LiteLLM requires it (e.g. "gemini/...",
# "groq/...", "openrouter/...").
# NOTE(review): cost_input/cost_output appear to be USD per million tokens —
# confirm against ModelInfo's definition.
DEFAULT_MODELS = {
    "claude-sonnet-4-20250514": ModelInfo(
        id="claude-sonnet-4-20250514",
        name="Claude Sonnet 4",
        provider_id="litellm",
        context_limit=200000,
        output_limit=64000,
        supports_tools=True,
        supports_streaming=True,
        cost_input=3.0,
        cost_output=15.0,
    ),
    "claude-opus-4-20250514": ModelInfo(
        id="claude-opus-4-20250514",
        name="Claude Opus 4",
        provider_id="litellm",
        context_limit=200000,
        output_limit=32000,
        supports_tools=True,
        supports_streaming=True,
        cost_input=15.0,
        cost_output=75.0,
    ),
    "claude-3-5-haiku-20241022": ModelInfo(
        id="claude-3-5-haiku-20241022",
        name="Claude 3.5 Haiku",
        provider_id="litellm",
        context_limit=200000,
        output_limit=8192,
        supports_tools=True,
        supports_streaming=True,
        cost_input=0.8,
        cost_output=4.0,
    ),
    "gpt-4o": ModelInfo(
        id="gpt-4o",
        name="GPT-4o",
        provider_id="litellm",
        context_limit=128000,
        output_limit=16384,
        supports_tools=True,
        supports_streaming=True,
        cost_input=2.5,
        cost_output=10.0,
    ),
    "gpt-4o-mini": ModelInfo(
        id="gpt-4o-mini",
        name="GPT-4o Mini",
        provider_id="litellm",
        context_limit=128000,
        output_limit=16384,
        supports_tools=True,
        supports_streaming=True,
        cost_input=0.15,
        cost_output=0.6,
    ),
    "o1": ModelInfo(
        id="o1",
        name="O1",
        provider_id="litellm",
        context_limit=200000,
        output_limit=100000,
        supports_tools=True,
        supports_streaming=True,
        cost_input=15.0,
        cost_output=60.0,
    ),
    "gemini/gemini-2.0-flash": ModelInfo(
        id="gemini/gemini-2.0-flash",
        name="Gemini 2.0 Flash",
        provider_id="litellm",
        context_limit=1000000,
        output_limit=8192,
        supports_tools=True,
        supports_streaming=True,
        cost_input=0.075,
        cost_output=0.3,
    ),
    "gemini/gemini-2.5-pro-preview-05-06": ModelInfo(
        id="gemini/gemini-2.5-pro-preview-05-06",
        name="Gemini 2.5 Pro",
        provider_id="litellm",
        context_limit=1000000,
        output_limit=65536,
        supports_tools=True,
        supports_streaming=True,
        cost_input=1.25,
        cost_output=10.0,
    ),
    "groq/llama-3.3-70b-versatile": ModelInfo(
        id="groq/llama-3.3-70b-versatile",
        name="Llama 3.3 70B (Groq)",
        provider_id="litellm",
        context_limit=128000,
        output_limit=32768,
        supports_tools=True,
        supports_streaming=True,
        cost_input=0.59,
        cost_output=0.79,
    ),
    "deepseek/deepseek-chat": ModelInfo(
        id="deepseek/deepseek-chat",
        name="DeepSeek Chat",
        provider_id="litellm",
        context_limit=64000,
        output_limit=8192,
        supports_tools=True,
        supports_streaming=True,
        cost_input=0.14,
        cost_output=0.28,
    ),
    "openrouter/anthropic/claude-sonnet-4": ModelInfo(
        id="openrouter/anthropic/claude-sonnet-4",
        name="Claude Sonnet 4 (OpenRouter)",
        provider_id="litellm",
        context_limit=200000,
        output_limit=64000,
        supports_tools=True,
        supports_streaming=True,
        cost_input=3.0,
        cost_output=15.0,
    ),
    # Z.ai Free Flash Models
    "zai/glm-4.7-flash": ModelInfo(
        id="zai/glm-4.7-flash",
        name="GLM-4.7 Flash (Free)",
        provider_id="litellm",
        context_limit=128000,
        output_limit=8192,
        supports_tools=True,
        supports_streaming=True,
        cost_input=0.0,
        cost_output=0.0,
    ),
    "zai/glm-4.6v-flash": ModelInfo(
        id="zai/glm-4.6v-flash",
        name="GLM-4.6V Flash (Free)",
        provider_id="litellm",
        context_limit=128000,
        output_limit=8192,
        supports_tools=True,
        supports_streaming=True,
        cost_input=0.0,
        cost_output=0.0,
    ),
    "zai/glm-4.5-flash": ModelInfo(
        id="zai/glm-4.5-flash",
        name="GLM-4.5 Flash (Free)",
        provider_id="litellm",
        context_limit=128000,
        output_limit=8192,
        supports_tools=True,
        supports_streaming=True,
        cost_input=0.0,
        cost_output=0.0,
    ),
}
165
+
166
+
167
class LiteLLMProvider(BaseProvider):
    """Provider that routes requests through the LiteLLM multi-provider client.

    A single entry point for many upstream vendors (Gemini, Groq, DeepSeek,
    OpenRouter, Z.ai, ...) using LiteLLM's OpenAI-compatible interface.
    """

    def __init__(self):
        # litellm is imported lazily so the dependency is only required
        # when this provider is actually used.
        self._litellm = None
        self._models = dict(DEFAULT_MODELS)

    @property
    def id(self) -> str:
        return "litellm"

    @property
    def name(self) -> str:
        return "LiteLLM (Multi-Provider)"

    @property
    def models(self) -> Dict[str, ModelInfo]:
        return self._models

    def add_model(self, model: ModelInfo) -> None:
        """Register an additional model at runtime (keyed by its id)."""
        self._models[model.id] = model

    def _get_litellm(self):
        """Lazily import and configure the litellm module.

        Raises:
            ImportError: if the litellm package is not installed.
        """
        if self._litellm is None:
            try:
                import litellm
                # Silently drop params a given upstream provider doesn't support.
                litellm.drop_params = True
                self._litellm = litellm
            except ImportError:
                raise ImportError("litellm package is required. Install with: pip install litellm")
        return self._litellm

    async def stream(
        self,
        model_id: str,
        messages: List[Message],
        tools: Optional[List[Dict[str, Any]]] = None,
        system: Optional[str] = None,
        temperature: Optional[float] = None,
        max_tokens: Optional[int] = None,
    ) -> AsyncGenerator[StreamChunk, None]:
        """Stream a chat completion as StreamChunk events.

        Emits "text" chunks as deltas arrive, "tool_call" chunks once a
        finish_reason is seen, then a final "done" chunk with usage (when
        reported) and a normalized stop_reason. Any exception is converted
        into a single "error" chunk instead of propagating.
        """
        litellm = self._get_litellm()

        litellm_messages = []

        if system:
            litellm_messages.append({"role": "system", "content": system})

        for msg in messages:
            content = msg.content
            if isinstance(content, str):
                litellm_messages.append({"role": msg.role, "content": content})
            else:
                # Structured content: keep only parts that carry text.
                litellm_messages.append({
                    "role": msg.role,
                    "content": [{"type": c.type, "text": c.text} for c in content if c.text]
                })

        # Z.ai models go through an OpenAI-compatible endpoint:
        # zai/glm-4.7-flash -> openai/glm-4.7-flash with a custom api_base.
        actual_model = model_id
        if model_id.startswith("zai/"):
            actual_model = "openai/" + model_id[4:]

        kwargs: Dict[str, Any] = {
            "model": actual_model,
            "messages": litellm_messages,
            "stream": True,
        }

        # Z.ai-specific connection settings.
        if model_id.startswith("zai/"):
            kwargs["api_base"] = os.environ.get("ZAI_API_BASE", "https://api.z.ai/api/paas/v4")
            kwargs["api_key"] = os.environ.get("ZAI_API_KEY")

        if temperature is not None:
            kwargs["temperature"] = temperature

        if max_tokens is not None:
            kwargs["max_tokens"] = max_tokens
        else:
            kwargs["max_tokens"] = 8192

        if tools:
            # Convert to OpenAI-style function tools; accept either
            # "parameters" (OpenAI) or "input_schema" (Anthropic) shapes.
            kwargs["tools"] = [
                {
                    "type": "function",
                    "function": {
                        "name": t["name"],
                        "description": t.get("description", ""),
                        "parameters": t.get("parameters", t.get("input_schema", {}))
                    }
                }
                for t in tools
            ]

        # Tool-call fragments accumulate here, keyed by stream index.
        current_tool_calls: Dict[int, Dict[str, Any]] = {}
        # BUGFIX: initialize before the loop — previously these were first
        # assigned inside the loop, so an empty stream (or chunks without
        # choices) raised UnboundLocalError when read afterwards.
        finish_reason: Optional[str] = None
        usage: Optional[Dict[str, int]] = None

        try:
            response = await litellm.acompletion(**kwargs)

            async for chunk in response:
                if hasattr(chunk, 'choices') and chunk.choices:
                    choice = chunk.choices[0]
                    delta = getattr(choice, 'delta', None)

                    if delta:
                        if hasattr(delta, 'content') and delta.content:
                            yield StreamChunk(type="text", text=delta.content)

                        if hasattr(delta, 'tool_calls') and delta.tool_calls:
                            for tc in delta.tool_calls:
                                idx = tc.index if hasattr(tc, 'index') else 0

                                if idx not in current_tool_calls:
                                    current_tool_calls[idx] = {
                                        "id": tc.id if hasattr(tc, 'id') and tc.id else f"call_{idx}",
                                        "name": "",
                                        "arguments_json": ""
                                    }

                                if hasattr(tc, 'function'):
                                    if hasattr(tc.function, 'name') and tc.function.name:
                                        current_tool_calls[idx]["name"] = tc.function.name
                                    if hasattr(tc.function, 'arguments') and tc.function.arguments:
                                        # Arguments stream as JSON fragments; concatenate.
                                        current_tool_calls[idx]["arguments_json"] += tc.function.arguments

                    chunk_finish = getattr(choice, 'finish_reason', None)
                    if chunk_finish:
                        finish_reason = chunk_finish
                        # Flush completed tool calls now that the model is done.
                        for idx, tc_data in current_tool_calls.items():
                            if tc_data["name"]:
                                try:
                                    args = json.loads(tc_data["arguments_json"]) if tc_data["arguments_json"] else {}
                                except json.JSONDecodeError:
                                    args = {}

                                yield StreamChunk(
                                    type="tool_call",
                                    tool_call=ToolCall(
                                        id=tc_data["id"],
                                        name=tc_data["name"],
                                        arguments=args
                                    )
                                )
                        # BUGFIX: clear so a second finish_reason chunk cannot
                        # re-emit the same tool calls.
                        current_tool_calls = {}

                # Usage may be attached to any chunk (typically the last one).
                if hasattr(chunk, 'usage') and chunk.usage:
                    usage = {
                        "input_tokens": getattr(chunk.usage, 'prompt_tokens', 0),
                        "output_tokens": getattr(chunk.usage, 'completion_tokens', 0),
                    }

            stop_reason = self._map_stop_reason(finish_reason)
            yield StreamChunk(type="done", usage=usage, stop_reason=stop_reason)

        except Exception as e:
            # Surface failures to the consumer as a terminal error chunk.
            yield StreamChunk(type="error", error=str(e))

    async def complete(
        self,
        model_id: str,
        prompt: str,
        max_tokens: int = 100,
    ) -> str:
        """Single completion request (non-streaming).

        Returns the first choice's message content, or "" when empty.
        """
        litellm = self._get_litellm()

        actual_model = model_id
        kwargs: Dict[str, Any] = {
            "model": actual_model,
            "messages": [{"role": "user", "content": prompt}],
            "max_tokens": max_tokens,
        }

        # Z.ai models: rewrite to the OpenAI-compatible endpoint.
        if model_id.startswith("zai/"):
            actual_model = "openai/" + model_id[4:]
            kwargs["model"] = actual_model
            kwargs["api_base"] = os.environ.get("ZAI_API_BASE", "https://api.z.ai/api/paas/v4")
            kwargs["api_key"] = os.environ.get("ZAI_API_KEY")

        response = await litellm.acompletion(**kwargs)
        return response.choices[0].message.content or ""

    def _map_stop_reason(self, finish_reason: Optional[str]) -> str:
        """Normalize vendor-specific finish reasons to this API's vocabulary."""
        if not finish_reason:
            return "end_turn"

        mapping = {
            "stop": "end_turn",
            "end_turn": "end_turn",
            "tool_calls": "tool_calls",
            "function_call": "tool_calls",
            "length": "max_tokens",
            "max_tokens": "max_tokens",
            "content_filter": "content_filter",
        }
        return mapping.get(finish_reason, "end_turn")
src/opencode_api/provider/openai.py ADDED
@@ -0,0 +1,182 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from typing import Dict, Any, List, Optional, AsyncGenerator
2
+ import os
3
+ import json
4
+
5
+ from .provider import BaseProvider, ModelInfo, Message, StreamChunk, ToolCall
6
+
7
+
8
class OpenAIProvider(BaseProvider):
    """Provider backed by the official OpenAI async client."""

    def __init__(self, api_key: Optional[str] = None):
        # Explicit key wins; otherwise fall back to the environment.
        self._api_key = api_key or os.environ.get("OPENAI_API_KEY")
        self._client = None

    @property
    def id(self) -> str:
        return "openai"

    @property
    def name(self) -> str:
        return "OpenAI"

    @property
    def models(self) -> Dict[str, ModelInfo]:
        """Static catalog of supported OpenAI models."""
        return {
            "gpt-4o": ModelInfo(
                id="gpt-4o",
                name="GPT-4o",
                provider_id="openai",
                context_limit=128000,
                output_limit=16384,
                supports_tools=True,
                supports_streaming=True,
                cost_input=2.5,
                cost_output=10.0,
            ),
            "gpt-4o-mini": ModelInfo(
                id="gpt-4o-mini",
                name="GPT-4o Mini",
                provider_id="openai",
                context_limit=128000,
                output_limit=16384,
                supports_tools=True,
                supports_streaming=True,
                cost_input=0.15,
                cost_output=0.6,
            ),
            "o1": ModelInfo(
                id="o1",
                name="o1",
                provider_id="openai",
                context_limit=200000,
                output_limit=100000,
                supports_tools=True,
                supports_streaming=True,
                cost_input=15.0,
                cost_output=60.0,
            ),
        }

    def _get_client(self):
        """Lazily construct the AsyncOpenAI client.

        Raises:
            ImportError: if the openai package is not installed.
        """
        if self._client is None:
            try:
                from openai import AsyncOpenAI
                self._client = AsyncOpenAI(api_key=self._api_key)
            except ImportError:
                raise ImportError("openai package is required. Install with: pip install openai")
        return self._client

    async def stream(
        self,
        model_id: str,
        messages: List[Message],
        tools: Optional[List[Dict[str, Any]]] = None,
        system: Optional[str] = None,
        temperature: Optional[float] = None,
        max_tokens: Optional[int] = None,
    ) -> AsyncGenerator[StreamChunk, None]:
        """Stream a chat completion as StreamChunk events.

        Text deltas are yielded as they arrive; tool calls are accumulated
        across deltas and yielded after the stream ends, followed by a
        final "done" chunk with usage (when the API reports it) and a
        normalized stop_reason.
        """
        client = self._get_client()

        openai_messages = []

        if system:
            openai_messages.append({"role": "system", "content": system})

        for msg in messages:
            content = msg.content
            if isinstance(content, str):
                openai_messages.append({"role": msg.role, "content": content})
            else:
                # Structured content: keep only parts that carry text.
                openai_messages.append({
                    "role": msg.role,
                    "content": [{"type": c.type, "text": c.text} for c in content if c.text]
                })

        kwargs: Dict[str, Any] = {
            "model": model_id,
            "messages": openai_messages,
            "stream": True,
        }

        # BUGFIX: use an explicit None check (was truthiness, which dropped
        # max_tokens=0 and was inconsistent with the temperature handling
        # and with LiteLLMProvider).
        if max_tokens is not None:
            kwargs["max_tokens"] = max_tokens

        if temperature is not None:
            kwargs["temperature"] = temperature

        if tools:
            # Accept either "parameters" (OpenAI) or "input_schema"
            # (Anthropic) tool shapes.
            kwargs["tools"] = [
                {
                    "type": "function",
                    "function": {
                        "name": t["name"],
                        "description": t.get("description", ""),
                        "parameters": t.get("parameters", t.get("input_schema", {}))
                    }
                }
                for t in tools
            ]

        # Tool-call fragments accumulate here, keyed by stream index.
        tool_calls: Dict[int, Dict[str, Any]] = {}
        usage_data = None
        finish_reason = None

        async for chunk in await client.chat.completions.create(**kwargs):
            if chunk.choices and chunk.choices[0].delta:
                delta = chunk.choices[0].delta

                if delta.content:
                    yield StreamChunk(type="text", text=delta.content)

                if delta.tool_calls:
                    for tc in delta.tool_calls:
                        idx = tc.index
                        if idx not in tool_calls:
                            tool_calls[idx] = {
                                "id": tc.id or "",
                                "name": tc.function.name if tc.function else "",
                                "arguments": ""
                            }

                        if tc.id:
                            tool_calls[idx]["id"] = tc.id
                        if tc.function:
                            if tc.function.name:
                                tool_calls[idx]["name"] = tc.function.name
                            if tc.function.arguments:
                                # Arguments stream as JSON fragments; concatenate.
                                tool_calls[idx]["arguments"] += tc.function.arguments

            if chunk.choices and chunk.choices[0].finish_reason:
                finish_reason = chunk.choices[0].finish_reason

            # NOTE(review): chunk.usage is typically only populated when the
            # request opts into stream usage reporting — confirm upstream.
            if chunk.usage:
                usage_data = {
                    "input_tokens": chunk.usage.prompt_tokens,
                    "output_tokens": chunk.usage.completion_tokens,
                }

        # Flush accumulated tool calls once the stream is complete.
        for tc_data in tool_calls.values():
            try:
                args = json.loads(tc_data["arguments"]) if tc_data["arguments"] else {}
            except json.JSONDecodeError:
                args = {}
            yield StreamChunk(
                type="tool_call",
                tool_call=ToolCall(
                    id=tc_data["id"],
                    name=tc_data["name"],
                    arguments=args
                )
            )

        stop_reason = self._map_stop_reason(finish_reason)
        yield StreamChunk(type="done", usage=usage_data, stop_reason=stop_reason)

    def _map_stop_reason(self, openai_finish_reason: Optional[str]) -> str:
        """Normalize OpenAI finish reasons to this API's vocabulary."""
        mapping = {
            "stop": "end_turn",
            "tool_calls": "tool_calls",
            "length": "max_tokens",
            "content_filter": "end_turn",
        }
        return mapping.get(openai_finish_reason or "", "end_turn")
src/opencode_api/provider/provider.py ADDED
@@ -0,0 +1,133 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from typing import Dict, Any, List, Optional, AsyncIterator, AsyncGenerator, Protocol, runtime_checkable
2
+ from pydantic import BaseModel, Field
3
+ from abc import ABC, abstractmethod
4
+
5
+
6
class ModelInfo(BaseModel):
    """Static metadata describing a single model exposed by a provider."""
    id: str  # model identifier, as sent to the backing API
    name: str  # human-readable display name
    provider_id: str  # id of the owning provider (e.g. "openai", "litellm")
    context_limit: int = 128000  # maximum input context window, in tokens
    output_limit: int = 8192  # maximum output tokens per response
    supports_tools: bool = True
    supports_streaming: bool = True
    cost_input: float = 0.0  # per 1M tokens
    cost_output: float = 0.0  # per 1M tokens
16
+
17
+
18
class ProviderInfo(BaseModel):
    """Serializable snapshot of a provider and the models it offers."""
    id: str
    name: str
    models: Dict[str, ModelInfo] = Field(default_factory=dict)  # keyed by model id
22
+
23
+
24
class MessageContent(BaseModel):
    """One part of a structured message body (currently text-shaped)."""
    type: str = "text"
    text: Optional[str] = None
27
+
28
+
29
class Message(BaseModel):
    """A single chat message: plain text or a list of content parts."""
    role: str  # "user", "assistant", "system"
    content: str | List[MessageContent]
32
+
33
+
34
class ToolCall(BaseModel):
    """A model-issued request to invoke a tool, with parsed JSON arguments."""
    id: str
    name: str
    arguments: Dict[str, Any]
38
+
39
+
40
class ToolResult(BaseModel):
    """Output produced by executing a tool, linked back to its call id."""
    tool_call_id: str
    output: str
43
+
44
+
45
class StreamChunk(BaseModel):
    """One event in a provider's streaming response; `type` selects which
    of the optional fields is populated."""
    type: str  # "text", "reasoning", "tool_call", "tool_result", "done", "error"
    text: Optional[str] = None  # payload for "text" (presumably also "reasoning") chunks
    tool_call: Optional[ToolCall] = None  # set when type == "tool_call"
    error: Optional[str] = None  # set when type == "error"
    usage: Optional[Dict[str, int]] = None  # token counts, e.g. {"input_tokens": ..., "output_tokens": ...}
    stop_reason: Optional[str] = None  # "end_turn", "tool_calls", "max_tokens", etc.
52
+
53
+
54
@runtime_checkable
class Provider(Protocol):
    """Structural interface every chat-model provider must satisfy.

    Runtime-checkable so instances can be validated with isinstance().
    """

    @property
    def id(self) -> str: ...

    @property
    def name(self) -> str: ...

    @property
    def models(self) -> Dict[str, ModelInfo]: ...

    def stream(
        self,
        model_id: str,
        messages: List[Message],
        tools: Optional[List[Dict[str, Any]]] = None,
        system: Optional[str] = None,
        temperature: Optional[float] = None,
        max_tokens: Optional[int] = None,
    ) -> AsyncGenerator[StreamChunk, None]: ...
75
+
76
+
77
class BaseProvider(ABC):
    """Abstract base class for concrete providers (Anthropic, OpenAI, ...).

    Subclasses must supply identity, a model catalog, and a streaming
    implementation; get_info() derives the serializable ProviderInfo.
    """

    @property
    @abstractmethod
    def id(self) -> str:
        pass

    @property
    @abstractmethod
    def name(self) -> str:
        pass

    @property
    @abstractmethod
    def models(self) -> Dict[str, ModelInfo]:
        pass

    @abstractmethod
    def stream(
        self,
        model_id: str,
        messages: List[Message],
        tools: Optional[List[Dict[str, Any]]] = None,
        system: Optional[str] = None,
        temperature: Optional[float] = None,
        max_tokens: Optional[int] = None,
    ) -> AsyncGenerator[StreamChunk, None]:
        pass

    def get_info(self) -> ProviderInfo:
        """Build a fresh ProviderInfo snapshot for this provider."""
        return ProviderInfo(
            id=self.id,
            name=self.name,
            models=self.models
        )
112
+
113
+
114
# Process-wide registry mapping provider id -> provider instance.
_providers: Dict[str, BaseProvider] = {}


def register_provider(provider: BaseProvider) -> None:
    """Add (or replace) a provider in the global registry, keyed by its id."""
    _providers[provider.id] = provider


def get_provider(provider_id: str) -> Optional[BaseProvider]:
    """Look up a registered provider; returns None when unknown."""
    return _providers.get(provider_id)


def list_providers() -> List[ProviderInfo]:
    """Return a ProviderInfo snapshot for every registered provider."""
    infos: List[ProviderInfo] = []
    for registered in _providers.values():
        infos.append(registered.get_info())
    return infos


def get_model(provider_id: str, model_id: str) -> Optional[ModelInfo]:
    """Resolve a model by provider id + model id; None if either is unknown."""
    owner = get_provider(provider_id)
    if owner is None:
        return None
    return owner.models.get(model_id)
src/opencode_api/routes/__init__.py ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ from .session import router as session_router
2
+ from .provider import router as provider_router
3
+ from .event import router as event_router
4
+ from .question import router as question_router
5
+ from .agent import router as agent_router
6
+
7
+ __all__ = ["session_router", "provider_router", "event_router", "question_router", "agent_router"]
src/opencode_api/routes/agent.py ADDED
@@ -0,0 +1,66 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """
2
+ Agent routes - manage agent configurations.
3
+ """
4
+
5
+ from fastapi import APIRouter, HTTPException
6
+ from typing import Optional, List
7
+
8
+ from ..agent import (
9
+ AgentInfo,
10
+ get,
11
+ list_agents,
12
+ default_agent,
13
+ register,
14
+ unregister,
15
+ )
16
+
17
+ router = APIRouter(prefix="/agent", tags=["agent"])
18
+
19
+
20
@router.get("", response_model=List[AgentInfo])
async def get_agents(
    mode: Optional[str] = None,
    include_hidden: bool = False
):
    """List all available agents.

    Query params:
        mode: optional filter forwarded to the agent registry.
        include_hidden: when True, hidden agents are included.
    """
    return list_agents(mode=mode, include_hidden=include_hidden)
27
+
28
+
29
@router.get("/default", response_model=AgentInfo)
async def get_default_agent():
    """Get the default agent configuration.

    Declared before the dynamic "/{agent_id}" route so the literal path
    "default" is matched here first.
    """
    return default_agent()
33
+
34
+
35
@router.get("/{agent_id}", response_model=AgentInfo)
async def get_agent(agent_id: str):
    """Fetch a single agent configuration by its identifier (404 if absent)."""
    found = get(agent_id)
    if not found:
        raise HTTPException(status_code=404, detail=f"Agent not found: {agent_id}")
    return found
42
+
43
+
44
@router.post("", response_model=AgentInfo)
async def create_agent(agent: AgentInfo):
    """Register a custom agent; built-in (native) agents may not be replaced."""
    current = get(agent.id)
    if current and current.native:
        raise HTTPException(status_code=400, detail=f"Cannot override native agent: {agent.id}")

    register(agent)
    return agent
53
+
54
+
55
@router.delete("/{agent_id}")
async def delete_agent(agent_id: str):
    """Unregister a custom agent; 404 if unknown, 400 for native agents."""
    target = get(agent_id)
    if not target:
        raise HTTPException(status_code=404, detail=f"Agent not found: {agent_id}")

    if target.native:
        raise HTTPException(status_code=400, detail=f"Cannot delete native agent: {agent_id}")

    unregister(agent_id)
    return {"deleted": agent_id}
src/opencode_api/routes/event.py ADDED
@@ -0,0 +1,45 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from fastapi import APIRouter
2
+ from fastapi.responses import StreamingResponse
3
+ import asyncio
4
+ import json
5
+ from typing import AsyncIterator
6
+
7
+ from ..core.bus import Bus, EventInstance
8
+
9
+
10
+ router = APIRouter(tags=["Events"])
11
+
12
+
13
@router.get("/event")
async def subscribe_events():
    """SSE endpoint that relays every bus event to the connected client.

    Each subscriber gets its own queue bridging the bus callback to the
    generator; a heartbeat is emitted after 30s of inactivity so proxies
    keep the connection open.
    """
    async def event_generator() -> AsyncIterator[str]:
        # Per-connection queue; the bus handler pushes, the loop below pops.
        queue: asyncio.Queue[EventInstance] = asyncio.Queue()

        async def handler(event: EventInstance):
            await queue.put(event)

        unsubscribe = Bus.subscribe_all(handler)

        # Initial event so clients know the stream is live.
        yield f"data: {json.dumps({'type': 'server.connected', 'payload': {}})}\n\n"

        try:
            while True:
                try:
                    event = await asyncio.wait_for(queue.get(), timeout=30.0)
                    # NOTE(review): assumes event.payload is JSON-serializable — confirm.
                    yield f"data: {json.dumps({'type': event.type, 'payload': event.payload})}\n\n"
                except asyncio.TimeoutError:
                    # No events for 30s: keep-alive heartbeat.
                    yield f"data: {json.dumps({'type': 'server.heartbeat', 'payload': {}})}\n\n"
        except asyncio.CancelledError:
            # Client disconnected; fall through to cleanup.
            pass
        finally:
            # Always detach this subscriber from the bus.
            unsubscribe()

    return StreamingResponse(
        event_generator(),
        media_type="text/event-stream",
        headers={
            "Cache-Control": "no-cache",
            "Connection": "keep-alive",
            "X-Accel-Buffering": "no",  # disable nginx response buffering for SSE
        }
    )
src/opencode_api/routes/provider.py ADDED
@@ -0,0 +1,107 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from typing import List, Dict
2
+ from fastapi import APIRouter, HTTPException
3
+ import os
4
+ from dotenv import load_dotenv
5
+
6
+ # .env 파일에서 환경변수 로드
7
+ load_dotenv()
8
+
9
+ from ..provider import list_providers, get_provider
10
+ from ..provider.provider import ProviderInfo, ModelInfo
11
+
12
+
13
+ router = APIRouter(prefix="/provider", tags=["Provider"])
14
+
15
+
16
# Provider id -> environment variable(s) holding its API key.
PROVIDER_API_KEYS = {
    "anthropic": "ANTHROPIC_API_KEY",
    "openai": "OPENAI_API_KEY",
    "gemini": ["GOOGLE_API_KEY", "GEMINI_API_KEY"],
    "litellm": None,  # LiteLLM is checked per model instead
}

# LiteLLM model-id prefix -> environment variable(s) required for it.
LITELLM_MODEL_KEYS = {
    "claude-": "ANTHROPIC_API_KEY",
    "gpt-": "OPENAI_API_KEY",
    "o1": "OPENAI_API_KEY",
    "gemini/": ["GOOGLE_API_KEY", "GEMINI_API_KEY"],
    "groq/": "GROQ_API_KEY",
    "deepseek/": "DEEPSEEK_API_KEY",
    "openrouter/": "OPENROUTER_API_KEY",
    "zai/": "ZAI_API_KEY",
}


def has_api_key(provider_id: str) -> bool:
    """Check if provider has required API key configured.

    Providers mapped to None (or absent from the table) need no key and
    always report True; a list means any one of the variables suffices.
    """
    required = PROVIDER_API_KEYS.get(provider_id)
    if required is None:
        return True
    candidates = required if isinstance(required, list) else [required]
    return any(os.environ.get(name) for name in candidates)
45
+
46
+
47
def filter_litellm_models(models: Dict[str, ModelInfo]) -> Dict[str, ModelInfo]:
    """Filter LiteLLM models based on available API keys.

    A model is kept only when the env var(s) mapped to its id prefix in
    LITELLM_MODEL_KEYS are set; ids matching no prefix are dropped.
    """
    available: Dict[str, ModelInfo] = {}
    for mid, info in models.items():
        for prefix, required in LITELLM_MODEL_KEYS.items():
            if not mid.startswith(prefix):
                continue
            names = required if isinstance(required, list) else [required]
            if any(os.environ.get(name) for name in names):
                available[mid] = info
            # Only the first matching prefix decides.
            break
    return available
60
+
61
+
62
@router.get("/", response_model=List[ProviderInfo])
async def get_providers():
    """Get available providers (filtered by API key availability)"""
    all_providers = list_providers()
    available = []

    for provider in all_providers:
        if provider.id == "litellm":
            # LiteLLM: filter model-by-model, since each upstream model
            # needs its own API key; drop the provider if nothing remains.
            filtered_models = filter_litellm_models(provider.models)
            if filtered_models:
                # NOTE(review): mutating this ProviderInfo is safe only if
                # list_providers() builds fresh objects per call — confirm.
                provider.models = filtered_models
                available.append(provider)
        elif has_api_key(provider.id):
            available.append(provider)

    return available
79
+
80
+
81
@router.get("/{provider_id}", response_model=ProviderInfo)
async def get_provider_info(provider_id: str):
    """Return one provider's info, 404 when the id is unregistered."""
    provider = get_provider(provider_id)
    if not provider:
        raise HTTPException(status_code=404, detail=f"Provider not found: {provider_id}")
    return provider.get_info()
87
+
88
+
89
@router.get("/{provider_id}/model", response_model=List[ModelInfo])
async def get_provider_models(provider_id: str):
    """List all models offered by one provider, 404 for unknown providers."""
    provider = get_provider(provider_id)
    if not provider:
        raise HTTPException(status_code=404, detail=f"Provider not found: {provider_id}")
    return list(provider.models.values())
95
+
96
+
97
@router.get("/{provider_id}/model/{model_id}", response_model=ModelInfo)
async def get_model_info(provider_id: str, model_id: str):
    """Return a specific model's metadata; 404 for unknown provider or model."""
    provider = get_provider(provider_id)
    if not provider:
        raise HTTPException(status_code=404, detail=f"Provider not found: {provider_id}")

    model = provider.models.get(model_id)
    if not model:
        raise HTTPException(status_code=404, detail=f"Model not found: {model_id}")

    return model
src/opencode_api/routes/question.py ADDED
@@ -0,0 +1,55 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """Question API routes."""
2
+ from typing import List
3
+ from fastapi import APIRouter, HTTPException
4
+ from pydantic import BaseModel, Field
5
+
6
+ from ..tool import (
7
+ reply_to_question,
8
+ reject_question,
9
+ get_pending_questions,
10
+ QuestionReply,
11
+ )
12
+
13
+
14
+ router = APIRouter(prefix="/question", tags=["question"])
15
+
16
+
17
class QuestionAnswerRequest(BaseModel):
    """Request to answer a question."""
    # One inner list per question, each holding the selected option labels.
    answers: List[List[str]] = Field(..., description="Answers in order (each is array of selected labels)")
20
+
21
+
22
@router.get("")
@router.get("/")
async def list_pending_questions(session_id: str | None = None):
    """List all pending questions.

    Args:
        session_id: optional session filter; when omitted, pending
            questions from every session are returned.
    """
    # BUGFIX: annotation was `str = None`, which contradicts the default
    # value; `str | None` matches the project's union style elsewhere.
    pending = get_pending_questions(session_id)
    return {"pending": pending}
28
+
29
+
30
@router.post("/{request_id}/reply")
async def answer_question(request_id: str, request: QuestionAnswerRequest):
    """Submit answers to a pending question.

    Returns 404 when the request id is unknown or was already resolved.
    """
    success = await reply_to_question(request_id, request.answers)

    if not success:
        raise HTTPException(
            status_code=404,
            detail=f"Question request '{request_id}' not found or already answered"
        )

    return {"status": "answered", "request_id": request_id}
42
+
43
+
44
@router.post("/{request_id}/reject")
async def dismiss_question(request_id: str):
    """Dismiss/reject a pending question without answering.

    Returns 404 when the request id is unknown or was already resolved.
    """
    success = await reject_question(request_id)

    if not success:
        raise HTTPException(
            status_code=404,
            detail=f"Question request '{request_id}' not found or already handled"
        )

    return {"status": "rejected", "request_id": request_id}
src/opencode_api/routes/session.py ADDED
@@ -0,0 +1,206 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from typing import Optional, List
2
+ from fastapi import APIRouter, HTTPException, Query, Depends
3
+ from fastapi.responses import StreamingResponse
4
+ from pydantic import BaseModel
5
+ import json
6
+
7
+ from ..session import Session, SessionInfo, SessionCreate, Message, SessionPrompt
8
+ from ..session.prompt import PromptInput
9
+ from ..core.storage import NotFoundError
10
+ from ..core.auth import AuthUser, optional_auth, require_auth
11
+ from ..core.quota import check_quota, increment_usage
12
+ from ..core.supabase import is_enabled as supabase_enabled
13
+ from ..provider import get_provider
14
+
15
+
16
+ router = APIRouter(prefix="/session", tags=["Session"])
17
+
18
+
19
class MessageRequest(BaseModel):
    """Body for POST /session/{session_id}/message."""
    content: str  # the user's message text
    provider_id: Optional[str] = None  # provider override; None -> default resolution
    model_id: Optional[str] = None  # model override
    system: Optional[str] = None  # optional system prompt
    temperature: Optional[float] = None
    max_tokens: Optional[int] = None
    tools_enabled: bool = True  # whether tools are exposed to the model
    auto_continue: Optional[bool] = None  # NOTE(review): semantics live in SessionPrompt — confirm
    max_steps: Optional[int] = None  # NOTE(review): presumably caps agent tool-loop steps — confirm
29
+
30
+
31
class SessionUpdate(BaseModel):
    """Patchable session fields; None means leave unchanged."""
    title: Optional[str] = None
33
+
34
+
35
class GenerateTitleRequest(BaseModel):
    """Body for POST /session/{session_id}/generate-title."""
    message: str  # the first user message the title is derived from
    model_id: Optional[str] = None  # LiteLLM model override for title generation
38
+
39
+
40
@router.get("/", response_model=List[SessionInfo])
async def list_sessions(
    limit: Optional[int] = Query(None, description="Maximum number of sessions to return"),
    user: Optional[AuthUser] = Depends(optional_auth)
):
    """List sessions, scoped to the authenticated user when one is present."""
    user_id = user.id if user else None
    return await Session.list(limit, user_id)
47
+
48
+
49
@router.post("/", response_model=SessionInfo)
async def create_session(
    data: Optional[SessionCreate] = None,
    user: Optional[AuthUser] = Depends(optional_auth)
):
    """Create a session, owned by the authenticated user when one is present."""
    user_id = user.id if user else None
    return await Session.create(data, user_id)
56
+
57
+
58
@router.get("/{session_id}", response_model=SessionInfo)
async def get_session(
    session_id: str,
    user: Optional[AuthUser] = Depends(optional_auth)
):
    """Fetch a single session; storage NotFoundError is mapped to HTTP 404."""
    try:
        user_id = user.id if user else None
        return await Session.get(session_id, user_id)
    except NotFoundError:
        raise HTTPException(status_code=404, detail=f"Session not found: {session_id}")
68
+
69
+
70
@router.patch("/{session_id}", response_model=SessionInfo)
async def update_session(
    session_id: str,
    updates: SessionUpdate,
    user: Optional[AuthUser] = Depends(optional_auth)
):
    """Patch session fields; None-valued fields are dropped (not cleared)."""
    try:
        user_id = user.id if user else None
        # Only send fields the client actually set.
        update_dict = {k: v for k, v in updates.model_dump().items() if v is not None}
        return await Session.update(session_id, update_dict, user_id)
    except NotFoundError:
        raise HTTPException(status_code=404, detail=f"Session not found: {session_id}")
82
+
83
+
84
@router.delete("/{session_id}")
async def delete_session(
    session_id: str,
    user: Optional[AuthUser] = Depends(optional_auth)
):
    """Delete a session; 404 when it does not exist (for this user)."""
    try:
        user_id = user.id if user else None
        await Session.delete(session_id, user_id)
        return {"success": True}
    except NotFoundError:
        raise HTTPException(status_code=404, detail=f"Session not found: {session_id}")
95
+
96
+
97
@router.get("/{session_id}/message")
async def list_messages(
    session_id: str,
    limit: Optional[int] = Query(None, description="Maximum number of messages to return"),
    user: Optional[AuthUser] = Depends(optional_auth)
):
    """List a session's messages; verifies the session exists first (404)."""
    try:
        user_id = user.id if user else None
        # Existence/ownership check before reading messages.
        await Session.get(session_id, user_id)
        return await Message.list(session_id, limit, user_id)
    except NotFoundError:
        raise HTTPException(status_code=404, detail=f"Session not found: {session_id}")
109
+
110
+
111
@router.post("/{session_id}/message")
async def send_message(
    session_id: str,
    request: MessageRequest,
    # NOTE(review): this dependency is chosen once at import time based on
    # whether Supabase was configured when the module loaded — confirm that
    # is intended (it will not react to runtime config changes).
    user: AuthUser = Depends(check_quota) if supabase_enabled() else Depends(optional_auth)
):
    """Send a user message and stream the assistant response as SSE."""
    user_id = user.id if user else None

    # Existence/ownership check before starting the stream.
    try:
        await Session.get(session_id, user_id)
    except NotFoundError:
        raise HTTPException(status_code=404, detail=f"Session not found: {session_id}")

    prompt_input = PromptInput(
        content=request.content,
        provider_id=request.provider_id,
        model_id=request.model_id,
        system=request.system,
        temperature=request.temperature,
        max_tokens=request.max_tokens,
        tools_enabled=request.tools_enabled,
        auto_continue=request.auto_continue,
        max_steps=request.max_steps,
    )

    async def generate():
        # Accumulate token usage across the whole stream for quota accounting.
        total_input = 0
        total_output = 0

        async for chunk in SessionPrompt.prompt(session_id, prompt_input, user_id):
            if chunk.usage:
                total_input += chunk.usage.get("input_tokens", 0)
                total_output += chunk.usage.get("output_tokens", 0)
            yield f"data: {json.dumps(chunk.model_dump())}\n\n"

        # Persist usage once the stream completes (authenticated users with
        # Supabase storage enabled only).
        if user_id and supabase_enabled():
            await increment_usage(user_id, total_input, total_output)

        yield "data: [DONE]\n\n"

    return StreamingResponse(
        generate(),
        media_type="text/event-stream",
        headers={
            "Cache-Control": "no-cache",
            "Connection": "keep-alive",
            "X-Accel-Buffering": "no",  # disable proxy buffering for SSE
        }
    )
160
+
161
+
162
@router.post("/{session_id}/abort")
async def abort_session(session_id: str):
    """Cancel an in-flight prompt for the session; reports whether one was cancelled."""
    cancelled = SessionPrompt.cancel(session_id)
    return {"cancelled": cancelled}
166
+
167
+
168
@router.post("/{session_id}/generate-title")
async def generate_title(
    session_id: str,
    request: GenerateTitleRequest,
    user: Optional[AuthUser] = Depends(optional_auth)
):
    """Generate a session title from the first user message."""
    user_id = user.id if user else None

    # Verify the session exists (404 otherwise).
    try:
        await Session.get(session_id, user_id)
    except NotFoundError:
        raise HTTPException(status_code=404, detail=f"Session not found: {session_id}")

    # Generate the title via the LiteLLM provider.
    model_id = request.model_id or "gemini/gemini-2.0-flash"
    provider = get_provider("litellm")

    if not provider:
        raise HTTPException(status_code=503, detail="LiteLLM provider not available")

    # Prompt is intentionally Korean: it asks the model for a short (<=10
    # char) title, no quotes, based on the first 200 chars of the message.
    prompt = f"""다음 사용자 메시지를 보고 짧은 제목을 생성해주세요.
제목은 10자 이내, 따옴표 없이 제목만 출력.

사용자 메시지: "{request.message[:200]}"

제목:"""

    try:
        result = await provider.complete(model_id, prompt, max_tokens=50)
        # Hard cap at 30 characters regardless of what the model returns.
        title = result.strip()[:30]

        # Persist the new title on the session.
        await Session.update(session_id, {"title": title}, user_id)

        return {"title": title}
    except Exception as e:
        raise HTTPException(status_code=500, detail=f"Failed to generate title: {str(e)}")
src/opencode_api/session/__init__.py ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from .session import Session, SessionInfo, SessionCreate
2
+ from .message import Message, MessageInfo, UserMessage, AssistantMessage, MessagePart
3
+ from .prompt import SessionPrompt
4
+ from .processor import SessionProcessor, DoomLoopDetector, RetryConfig, StepInfo
5
+
6
+ __all__ = [
7
+ "Session", "SessionInfo", "SessionCreate",
8
+ "Message", "MessageInfo", "UserMessage", "AssistantMessage", "MessagePart",
9
+ "SessionPrompt",
10
+ "SessionProcessor", "DoomLoopDetector", "RetryConfig", "StepInfo"
11
+ ]
src/opencode_api/session/message.py ADDED
@@ -0,0 +1,348 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from typing import Optional, List, Dict, Any, Union, Literal
2
+ from pydantic import BaseModel, Field
3
+ from datetime import datetime
4
+
5
+ from ..core.storage import Storage, NotFoundError
6
+ from ..core.bus import Bus, MESSAGE_UPDATED, MESSAGE_REMOVED, PART_UPDATED, MessagePayload, PartPayload
7
+ from ..core.identifier import Identifier
8
+ from ..core.supabase import get_client, is_enabled as supabase_enabled
9
+
10
+
11
class MessagePart(BaseModel):
    """A single part of an assistant message.

    type values:
    - "text": plain text response
    - "reasoning": Claude thinking / extended-thinking output
    - "tool_call": a tool invocation (tool_name, tool_args, tool_status)
    - "tool_result": tool execution output (tool_output)
    """
    id: str
    session_id: str
    message_id: str
    type: str  # "text", "reasoning", "tool_call", "tool_result"
    content: Optional[str] = None  # payload for "text" / "reasoning" parts
    tool_call_id: Optional[str] = None
    tool_name: Optional[str] = None
    tool_args: Optional[Dict[str, Any]] = None
    tool_output: Optional[str] = None
    tool_status: Optional[str] = None  # "pending", "running", "completed", "error"
30
+
31
+
32
class MessageInfo(BaseModel):
    """Fields shared by user and assistant messages."""
    id: str
    session_id: str
    role: Literal["user", "assistant"]
    created_at: datetime
    model: Optional[str] = None  # model id used for assistant replies
    provider_id: Optional[str] = None
    usage: Optional[Dict[str, int]] = None  # {"input_tokens": ..., "output_tokens": ...}
    error: Optional[str] = None  # set when generation failed mid-message
41
+
42
+
43
class UserMessage(MessageInfo):
    """A message authored by the end user; `content` holds the raw text."""
    role: Literal["user"] = "user"
    content: str
46
+
47
+
48
class AssistantMessage(MessageInfo):
    """A model-generated message composed of ordered MessagePart entries."""
    role: Literal["assistant"] = "assistant"
    parts: List[MessagePart] = Field(default_factory=list)
    summary: bool = False  # True when this message summarizes the conversation
52
+
53
+
54
class Message:
    """CRUD and event-publishing helpers for session messages.

    Every operation uses Supabase when it is enabled AND a user_id is
    provided; otherwise it falls back to the local file Storage backend.
    All mutations publish bus events so SSE subscribers see live updates.
    """

    @staticmethod
    async def create_user(session_id: str, content: str, user_id: Optional[str] = None) -> UserMessage:
        """Create and persist a user message, then publish MESSAGE_UPDATED."""
        message_id = Identifier.generate("message")
        now = datetime.utcnow()

        msg = UserMessage(
            id=message_id,
            session_id=session_id,
            content=content,
            created_at=now,
        )

        if supabase_enabled() and user_id:
            client = get_client()
            # Supabase sets created_at server-side; the returned model keeps
            # the local timestamp only for the caller's immediate use.
            client.table("opencode_messages").insert({
                "id": message_id,
                "session_id": session_id,
                "role": "user",
                "content": content,
            }).execute()
        else:
            await Storage.write(["message", session_id, message_id], msg.model_dump())

        await Bus.publish(MESSAGE_UPDATED, MessagePayload(session_id=session_id, message_id=message_id))
        return msg

    @staticmethod
    async def create_assistant(
        session_id: str,
        provider_id: Optional[str] = None,
        model: Optional[str] = None,
        user_id: Optional[str] = None,
        summary: bool = False
    ) -> AssistantMessage:
        """Create an empty assistant message (parts are streamed in later)."""
        message_id = Identifier.generate("message")
        now = datetime.utcnow()

        msg = AssistantMessage(
            id=message_id,
            session_id=session_id,
            created_at=now,
            provider_id=provider_id,
            model=model,
            parts=[],
            summary=summary,
        )

        if supabase_enabled() and user_id:
            client = get_client()
            client.table("opencode_messages").insert({
                "id": message_id,
                "session_id": session_id,
                "role": "assistant",
                "provider_id": provider_id,
                "model_id": model,
            }).execute()
        else:
            await Storage.write(["message", session_id, message_id], msg.model_dump())

        await Bus.publish(MESSAGE_UPDATED, MessagePayload(session_id=session_id, message_id=message_id))
        return msg

    @staticmethod
    async def get(session_id: str, message_id: str, user_id: Optional[str] = None) -> Union[UserMessage, AssistantMessage]:
        """Fetch one message (with its parts, for assistant messages).

        Raises:
            NotFoundError: when the message does not exist.
        """
        if supabase_enabled() and user_id:
            client = get_client()
            # NOTE(review): .single() may itself raise when no row matches,
            # before the explicit NotFoundError below — confirm against the
            # supabase-py version in use.
            result = client.table("opencode_messages").select("*, opencode_message_parts(*)").eq("id", message_id).eq("session_id", session_id).single().execute()
            if not result.data:
                raise NotFoundError(["message", session_id, message_id])

            data = result.data
            if data.get("role") == "user":
                return UserMessage(
                    id=data["id"],
                    session_id=data["session_id"],
                    role="user",
                    content=data.get("content", ""),
                    created_at=data["created_at"],
                )

            parts = [
                MessagePart(
                    id=p["id"],
                    session_id=session_id,
                    message_id=message_id,
                    type=p["type"],
                    content=p.get("content"),
                    tool_call_id=p.get("tool_call_id"),
                    tool_name=p.get("tool_name"),
                    tool_args=p.get("tool_args"),
                    tool_output=p.get("tool_output"),
                    tool_status=p.get("tool_status"),
                )
                for p in data.get("opencode_message_parts", [])
            ]
            return AssistantMessage(
                id=data["id"],
                session_id=data["session_id"],
                role="assistant",
                created_at=data["created_at"],
                provider_id=data.get("provider_id"),
                model=data.get("model_id"),
                usage={"input_tokens": data.get("input_tokens", 0), "output_tokens": data.get("output_tokens", 0)} if data.get("input_tokens") else None,
                error=data.get("error"),
                parts=parts,
            )

        data = await Storage.read(["message", session_id, message_id])
        if not data:
            raise NotFoundError(["message", session_id, message_id])

        if data.get("role") == "user":
            return UserMessage(**data)
        return AssistantMessage(**data)

    @staticmethod
    async def add_part(message_id: str, session_id: str, part: MessagePart, user_id: Optional[str] = None) -> MessagePart:
        """Append a part to an assistant message; assigns the part a fresh id."""
        part.id = Identifier.generate("part")
        part.message_id = message_id
        part.session_id = session_id

        if supabase_enabled() and user_id:
            client = get_client()
            client.table("opencode_message_parts").insert({
                "id": part.id,
                "message_id": message_id,
                "type": part.type,
                "content": part.content,
                "tool_call_id": part.tool_call_id,
                "tool_name": part.tool_name,
                "tool_args": part.tool_args,
                "tool_output": part.tool_output,
                "tool_status": part.tool_status,
            }).execute()
        else:
            msg_data = await Storage.read(["message", session_id, message_id])
            if not msg_data:
                raise NotFoundError(["message", session_id, message_id])

            if "parts" not in msg_data:
                msg_data["parts"] = []
            msg_data["parts"].append(part.model_dump())
            await Storage.write(["message", session_id, message_id], msg_data)

        await Bus.publish(PART_UPDATED, PartPayload(
            session_id=session_id,
            message_id=message_id,
            part_id=part.id
        ))
        return part

    @staticmethod
    async def update_part(session_id: str, message_id: str, part_id: str, updates: Dict[str, Any], user_id: Optional[str] = None) -> MessagePart:
        """Apply a partial update to a part and publish PART_UPDATED.

        Raises:
            NotFoundError: when the part (or its message) does not exist.
        """
        if supabase_enabled() and user_id:
            client = get_client()
            result = client.table("opencode_message_parts").update(updates).eq("id", part_id).execute()
            if result.data:
                p = result.data[0]
                await Bus.publish(PART_UPDATED, PartPayload(
                    session_id=session_id,
                    message_id=message_id,
                    part_id=part_id
                ))
                return MessagePart(
                    id=p["id"],
                    session_id=session_id,
                    message_id=message_id,
                    type=p["type"],
                    content=p.get("content"),
                    tool_call_id=p.get("tool_call_id"),
                    tool_name=p.get("tool_name"),
                    tool_args=p.get("tool_args"),
                    tool_output=p.get("tool_output"),
                    tool_status=p.get("tool_status"),
                )
            raise NotFoundError(["part", message_id, part_id])

        msg_data = await Storage.read(["message", session_id, message_id])
        if not msg_data:
            raise NotFoundError(["message", session_id, message_id])

        for i, p in enumerate(msg_data.get("parts", [])):
            if p.get("id") == part_id:
                msg_data["parts"][i].update(updates)
                await Storage.write(["message", session_id, message_id], msg_data)
                await Bus.publish(PART_UPDATED, PartPayload(
                    session_id=session_id,
                    message_id=message_id,
                    part_id=part_id
                ))
                return MessagePart(**msg_data["parts"][i])

        raise NotFoundError(["part", message_id, part_id])

    @staticmethod
    async def list(session_id: str, limit: Optional[int] = None, user_id: Optional[str] = None) -> List[Union[UserMessage, AssistantMessage]]:
        """Return the session's messages ordered by creation time.

        When `limit` is set, at most `limit` messages are returned (the
        earliest ones, matching the Supabase branch's ordered query).
        """
        if supabase_enabled() and user_id:
            client = get_client()
            query = client.table("opencode_messages").select("*, opencode_message_parts(*)").eq("session_id", session_id).order("created_at")
            if limit:
                query = query.limit(limit)
            result = query.execute()

            messages = []
            for data in result.data:
                if data.get("role") == "user":
                    messages.append(UserMessage(
                        id=data["id"],
                        session_id=data["session_id"],
                        role="user",
                        content=data.get("content", ""),
                        created_at=data["created_at"],
                    ))
                else:
                    parts = [
                        MessagePart(
                            id=p["id"],
                            session_id=session_id,
                            message_id=data["id"],
                            type=p["type"],
                            content=p.get("content"),
                            tool_call_id=p.get("tool_call_id"),
                            tool_name=p.get("tool_name"),
                            tool_args=p.get("tool_args"),
                            tool_output=p.get("tool_output"),
                            tool_status=p.get("tool_status"),
                        )
                        for p in data.get("opencode_message_parts", [])
                    ]
                    messages.append(AssistantMessage(
                        id=data["id"],
                        session_id=data["session_id"],
                        role="assistant",
                        created_at=data["created_at"],
                        provider_id=data.get("provider_id"),
                        model=data.get("model_id"),
                        usage={"input_tokens": data.get("input_tokens", 0), "output_tokens": data.get("output_tokens", 0)} if data.get("input_tokens") else None,
                        error=data.get("error"),
                        parts=parts,
                    ))
            return messages

        message_keys = await Storage.list(["message", session_id])
        messages = []

        for key in message_keys:
            data = await Storage.read(key)
            if data:
                if data.get("role") == "user":
                    messages.append(UserMessage(**data))
                else:
                    messages.append(AssistantMessage(**data))

        # Fix: sort by creation time BEFORE applying the limit. Previously the
        # limit truncated the (potentially unordered) key listing, so with a
        # limit the caller could receive an arbitrary subset instead of the
        # earliest messages.
        messages.sort(key=lambda m: m.created_at)
        if limit:
            messages = messages[:limit]
        return messages

    @staticmethod
    async def delete(session_id: str, message_id: str, user_id: Optional[str] = None) -> bool:
        """Delete a message (best-effort) and publish MESSAGE_REMOVED."""
        if supabase_enabled() and user_id:
            client = get_client()
            client.table("opencode_messages").delete().eq("id", message_id).execute()
        else:
            await Storage.remove(["message", session_id, message_id])

        await Bus.publish(MESSAGE_REMOVED, MessagePayload(session_id=session_id, message_id=message_id))
        return True

    @staticmethod
    async def set_usage(session_id: str, message_id: str, usage: Dict[str, int], user_id: Optional[str] = None) -> None:
        """Record token usage on a message (no event is published)."""
        if supabase_enabled() and user_id:
            client = get_client()
            client.table("opencode_messages").update({
                "input_tokens": usage.get("input_tokens", 0),
                "output_tokens": usage.get("output_tokens", 0),
            }).eq("id", message_id).execute()
        else:
            msg_data = await Storage.read(["message", session_id, message_id])
            if msg_data:
                msg_data["usage"] = usage
                await Storage.write(["message", session_id, message_id], msg_data)

    @staticmethod
    async def set_error(session_id: str, message_id: str, error: str, user_id: Optional[str] = None) -> None:
        """Record an error string on a message (no event is published)."""
        if supabase_enabled() and user_id:
            client = get_client()
            client.table("opencode_messages").update({"error": error}).eq("id", message_id).execute()
        else:
            msg_data = await Storage.read(["message", session_id, message_id])
            if msg_data:
                msg_data["error"] = error
                await Storage.write(["message", session_id, message_id], msg_data)
src/opencode_api/session/processor.py ADDED
@@ -0,0 +1,193 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """
2
+ Session processor for managing agentic loop execution.
3
+ """
4
+
5
+ from typing import Optional, Dict, Any, AsyncIterator, List
6
+ from pydantic import BaseModel
7
+ from datetime import datetime
8
+ import asyncio
9
+
10
+ from ..provider.provider import StreamChunk
11
+
12
+
13
class DoomLoopDetector:
    """Detects when one tool is invoked with identical arguments several
    times in a row — the classic signature of a stuck agentic loop.

    Mirrors upstream opencode: both the tool name and a normalized hash of
    its arguments are compared, so repeating the same tool with *different*
    arguments is treated as legitimate work.
    """

    def __init__(self, threshold: int = 3):
        self.threshold = threshold
        self.history: List[tuple[str, str]] = []  # (tool_name, args_hash)

    def record(self, tool_name: str, args: Optional[Dict[str, Any]] = None) -> bool:
        """Record one tool invocation.

        Args:
            tool_name: name of the invoked tool.
            args: tool arguments (treated as {} when missing).

        Returns:
            True when the last `threshold` invocations are all identical
            (same tool, same arguments); False otherwise.
        """
        import json
        import hashlib

        # Normalize arguments into a stable JSON string, then hash it so the
        # history stays compact regardless of argument size.
        serialized = json.dumps(args or {}, sort_keys=True, default=str)
        digest = hashlib.md5(serialized.encode()).hexdigest()[:8]

        self.history.append((tool_name, digest))

        if len(self.history) < self.threshold:
            return False

        # Doom loop iff every signature in the tail equals the first one.
        tail = self.history[-self.threshold:]
        return all(signature == tail[0] for signature in tail)

    def reset(self):
        """Forget all recorded invocations."""
        self.history = []
55
+
56
+
57
class RetryConfig(BaseModel):
    """Retry policy for provider calls (exponential backoff)."""
    max_retries: int = 3
    base_delay: float = 1.0  # seconds; initial backoff delay
    max_delay: float = 30.0  # seconds; computed delays are capped here
    exponential_base: float = 2.0  # delay = base_delay * exponential_base ** attempt
63
+
64
+
65
class StepInfo(BaseModel):
    """Bookkeeping for one step of the agentic loop."""
    step: int  # 1-based step number
    started_at: datetime
    finished_at: Optional[datetime] = None
    tool_calls: List[str] = []  # pydantic deep-copies mutable defaults, so sharing is not an issue
    status: str = "running"  # running, completed, error, doom_loop
72
+
73
+
74
class SessionProcessor:
    """
    Manages execution of the agentic loop for one session.

    Features:
    - Doom-loop prevention (detects repeated identical tool calls)
    - Automatic retries with exponential backoff
    - Step tracking (step-start / step-finish events)
    """

    # Process-local registry of live processors, keyed by session id.
    _processors: Dict[str, "SessionProcessor"] = {}

    def __init__(self, session_id: str, max_steps: int = 50, doom_threshold: int = 3):
        self.session_id = session_id
        self.max_steps = max_steps
        self.doom_detector = DoomLoopDetector(threshold=doom_threshold)
        self.retry_config = RetryConfig()
        self.steps: List[StepInfo] = []
        self.current_step: Optional[StepInfo] = None
        self.aborted = False

    @classmethod
    def get_or_create(cls, session_id: str, **kwargs) -> "SessionProcessor":
        # NOTE(review): kwargs only take effect on first creation; a later
        # call with different kwargs returns the existing processor unchanged.
        if session_id not in cls._processors:
            cls._processors[session_id] = cls(session_id, **kwargs)
        return cls._processors[session_id]

    @classmethod
    def remove(cls, session_id: str) -> None:
        # Drop the processor from the registry, if present.
        if session_id in cls._processors:
            del cls._processors[session_id]

    def start_step(self) -> StepInfo:
        """Begin a new step and make it current."""
        step_num = len(self.steps) + 1
        self.current_step = StepInfo(
            step=step_num,
            started_at=datetime.utcnow()
        )
        self.steps.append(self.current_step)
        return self.current_step

    def finish_step(self, status: str = "completed") -> StepInfo:
        """Mark the current step finished with the given status.

        Returns the current step (None if start_step was never called).
        """
        if self.current_step:
            self.current_step.finished_at = datetime.utcnow()
            self.current_step.status = status
        return self.current_step

    def record_tool_call(self, tool_name: str, tool_args: Optional[Dict[str, Any]] = None) -> bool:
        """Record a tool call; return True when a doom loop is detected.

        Args:
            tool_name: tool name
            tool_args: tool arguments (used for doom-loop comparison)

        Returns:
            True if doom loop detected, False otherwise
        """
        if self.current_step:
            self.current_step.tool_calls.append(tool_name)
        return self.doom_detector.record(tool_name, tool_args)

    def is_doom_loop(self) -> bool:
        """True when the last `threshold` recorded calls are all identical."""
        return len(self.doom_detector.history) >= self.doom_detector.threshold and \
            len(set(self.doom_detector.history[-self.doom_detector.threshold:])) == 1

    def should_continue(self) -> bool:
        """Whether the agentic loop may run another step."""
        if self.aborted:
            return False
        if len(self.steps) >= self.max_steps:
            return False
        if self.is_doom_loop():
            return False
        return True

    def abort(self) -> None:
        """Stop the loop; should_continue() returns False afterwards."""
        self.aborted = True

    async def calculate_retry_delay(self, attempt: int) -> float:
        """Exponential-backoff delay for 0-based `attempt`, capped at max_delay."""
        delay = self.retry_config.base_delay * (self.retry_config.exponential_base ** attempt)
        return min(delay, self.retry_config.max_delay)

    async def retry_with_backoff(self, func, *args, **kwargs):
        """Await `func(*args, **kwargs)`, retrying with exponential backoff.

        Re-raises the last exception after max_retries failed attempts.
        NOTE(review): with max_retries == 0 this executes `raise None`
        (TypeError) — acceptable only if 0 is never configured.
        """
        last_error = None

        for attempt in range(self.retry_config.max_retries):
            try:
                return await func(*args, **kwargs)
            except Exception as e:
                last_error = e
                # No sleep after the final attempt — fail fast.
                if attempt < self.retry_config.max_retries - 1:
                    delay = await self.calculate_retry_delay(attempt)
                    await asyncio.sleep(delay)

        raise last_error

    def get_summary(self) -> Dict[str, Any]:
        """Snapshot of processor state for diagnostics/inspection."""
        return {
            "session_id": self.session_id,
            "total_steps": len(self.steps),
            "max_steps": self.max_steps,
            "aborted": self.aborted,
            "doom_loop_detected": self.is_doom_loop(),
            "steps": [
                {
                    "step": s.step,
                    "status": s.status,
                    "tool_calls": s.tool_calls,
                    "duration": (s.finished_at - s.started_at).total_seconds() if s.finished_at else None
                }
                for s in self.steps
            ]
        }
src/opencode_api/session/prompt.py ADDED
@@ -0,0 +1,701 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """
2
+ Session prompt handling with agentic loop support.
3
+ """
4
+
5
+ from typing import Optional, List, Dict, Any, AsyncIterator, Literal
6
+ from pydantic import BaseModel
7
+ import asyncio
8
+ import json
9
+
10
+ from .session import Session
11
+ from .message import Message, MessagePart, AssistantMessage
12
+ from .processor import SessionProcessor
13
+ from ..provider import get_provider, list_providers
14
+ from ..provider.provider import Message as ProviderMessage, StreamChunk, ToolCall
15
+ from ..tool import get_tool, get_tools_schema, ToolContext, get_registry
16
+ from ..core.config import settings
17
+ from ..core.bus import Bus, PART_UPDATED, PartPayload, STEP_STARTED, STEP_FINISHED, StepPayload, TOOL_STATE_CHANGED, ToolStatePayload
18
+ from ..agent import get as get_agent, default_agent, get_system_prompt, is_tool_allowed, AgentInfo, get_prompt_for_provider
19
+
20
+
21
class PromptInput(BaseModel):
    """Request payload for prompting a session."""
    content: str
    provider_id: Optional[str] = None  # explicit provider; inferred from model_id when absent
    model_id: Optional[str] = None
    system: Optional[str] = None  # extra system-prompt text merged by _build_system_prompt
    temperature: Optional[float] = None
    max_tokens: Optional[int] = None
    tools_enabled: bool = True
    # Agentic loop options
    auto_continue: Optional[bool] = None  # None = use agent default
    max_steps: Optional[int] = None  # None = use agent default
32
+
33
+
34
class LoopState(BaseModel):
    """Mutable state of one agentic-loop run for a session."""
    step: int = 0  # 1-based once the loop starts
    max_steps: int = 50
    auto_continue: bool = True
    stop_reason: Optional[str] = None  # last provider stop reason (e.g. "tool_calls")
    paused: bool = False
    pause_reason: Optional[str] = None  # e.g. "question" while awaiting user input
41
+
42
+
43
import re

# Matches textual pseudo tool calls like "[Called tool: name({...})]" that
# some models emit as plain text instead of a structured tool call.
# Group 1 = tool name, group 2 = raw argument text.
# NOTE(review): the argument alternation is permissive (stops at the first
# '}' or ')') and does not handle nested braces — confirm acceptable.
FAKE_TOOL_CALL_PATTERN = re.compile(
    r'\[Called\s+tool:\s*(\w+)\s*\(\s*(\{[^}]*\}|\{[^)]*\}|[^)]*)\s*\)\]',
    re.IGNORECASE
)
48
+
49
+
50
class SessionPrompt:
    """Drives prompt execution for a session: single turns and the agentic loop."""

    # In-flight prompt tasks per session.
    # NOTE(review): presumably consumed by a cancel/abort path not visible here — confirm.
    _active_sessions: Dict[str, asyncio.Task] = {}
    # Live LoopState per session while an agentic loop is running.
    _loop_states: Dict[str, LoopState] = {}
54
+
55
    @classmethod
    async def prompt(
        cls,
        session_id: str,
        input: PromptInput,
        user_id: Optional[str] = None
    ) -> AsyncIterator[StreamChunk]:
        """Entry point: stream the response chunks for one prompt.

        Resolves the session's agent, then dispatches to the agentic loop
        (auto_continue) or a single provider turn. Request-level values in
        `input` override the agent's defaults.
        """
        session = await Session.get(session_id, user_id)

        # Get agent configuration (session's agent, falling back to "build").
        agent_id = session.agent_id or "build"
        agent = get_agent(agent_id) or default_agent()

        # Determine loop settings: request overrides agent defaults.
        auto_continue = input.auto_continue if input.auto_continue is not None else agent.auto_continue
        max_steps = input.max_steps if input.max_steps is not None else agent.max_steps

        if auto_continue:
            async for chunk in cls._agentic_loop(session_id, input, agent, max_steps, user_id):
                yield chunk
        else:
            async for chunk in cls._single_turn(session_id, input, agent, user_id=user_id):
                yield chunk
78
+
79
    @classmethod
    async def _agentic_loop(
        cls,
        session_id: str,
        input: PromptInput,
        agent: AgentInfo,
        max_steps: int,
        user_id: Optional[str] = None
    ) -> AsyncIterator[StreamChunk]:
        """Run provider turns repeatedly until the model stops calling tools.

        Stops when: the turn ends without tool calls, a doom loop is
        detected, max_steps is reached, the processor is aborted, or the
        loop is paused (e.g. by the `question` tool awaiting user input).
        """
        state = LoopState(step=0, max_steps=max_steps, auto_continue=True)
        cls._loop_states[session_id] = state

        # Acquire (or create) the per-session processor for step tracking.
        processor = SessionProcessor.get_or_create(session_id, max_steps=max_steps)

        try:
            while processor.should_continue() and not state.paused:
                state.step += 1

                # Step start: record and notify subscribers.
                step_info = processor.start_step()
                await Bus.publish(STEP_STARTED, StepPayload(
                    session_id=session_id,
                    step=state.step,
                    max_steps=max_steps
                ))

                print(f"[AGENTIC LOOP] Starting step {state.step}, stop_reason={state.stop_reason}", flush=True)

                # Continuation turns carry no new user content; copy only the
                # generation settings from the original request.
                turn_input = input if state.step == 1 else PromptInput(
                    content="",
                    provider_id=input.provider_id,
                    model_id=input.model_id,
                    temperature=input.temperature,
                    max_tokens=input.max_tokens,
                    tools_enabled=input.tools_enabled,
                    auto_continue=False,
                )

                if state.step > 1:
                    yield StreamChunk(type="step", text=f"Step {state.step}")

                # Track tool calls in this turn
                has_tool_calls_this_turn = False

                async for chunk in cls._single_turn(
                    session_id,
                    turn_input,
                    agent,
                    is_continuation=(state.step > 1),
                    user_id=user_id
                ):
                    yield chunk

                    if chunk.type == "tool_call" and chunk.tool_call:
                        has_tool_calls_this_turn = True
                        print(f"[AGENTIC LOOP] tool_call: {chunk.tool_call.name}", flush=True)

                        # The question tool pauses the loop until answered.
                        if chunk.tool_call.name == "question" and agent.pause_on_question:
                            state.paused = True
                            state.pause_reason = "question"

                    # Once the question tool completes (answer received), unpause.
                    elif chunk.type == "tool_result":
                        if state.paused and state.pause_reason == "question":
                            state.paused = False
                            state.pause_reason = None

                    elif chunk.type == "done":
                        state.stop_reason = chunk.stop_reason
                        print(f"[AGENTIC LOOP] done: stop_reason={chunk.stop_reason}", flush=True)

                # Step finished — flag doom loops before recording status.
                step_status = "completed"
                if processor.is_doom_loop():
                    step_status = "doom_loop"
                    print(f"[AGENTIC LOOP] Doom loop detected! Stopping execution.", flush=True)
                    yield StreamChunk(type="text", text=f"\n[경고: 동일 도구 반복 호출 감지, 루프를 중단합니다]\n")

                processor.finish_step(status=step_status)
                await Bus.publish(STEP_FINISHED, StepPayload(
                    session_id=session_id,
                    step=state.step,
                    max_steps=max_steps
                ))

                print(f"[AGENTIC LOOP] End of step {state.step}: stop_reason={state.stop_reason}, has_tool_calls={has_tool_calls_this_turn}", flush=True)

                # Stop immediately when a doom loop was detected.
                if processor.is_doom_loop():
                    break

                # If this turn had no new tool calls (just text response), we're done
                if state.stop_reason != "tool_calls":
                    print(f"[AGENTIC LOOP] Breaking: stop_reason != tool_calls", flush=True)
                    break

            # After the loop, emit only a status message (no extra summary LLM call!).
            if state.paused:
                yield StreamChunk(type="text", text=f"\n[Paused: {state.pause_reason}]\n")
            elif state.step >= state.max_steps:
                yield StreamChunk(type="text", text=f"\n[Max steps ({state.max_steps}) reached]\n")
            # else: ended naturally (no extra output)

        finally:
            if session_id in cls._loop_states:
                del cls._loop_states[session_id]
            # Tear down the per-session processor.
            SessionProcessor.remove(session_id)
188
+
189
+ @classmethod
190
+ def _infer_provider_from_model(cls, model_id: str) -> str:
191
+ """model_id에서 provider_id를 추론"""
192
+ # LiteLLM prefix 기반 모델은 litellm provider 사용
193
+ litellm_prefixes = ["gemini/", "groq/", "deepseek/", "openrouter/", "zai/"]
194
+ for prefix in litellm_prefixes:
195
+ if model_id.startswith(prefix):
196
+ return "litellm"
197
+
198
+ # Claude 모델
199
+ if model_id.startswith("claude-"):
200
+ return "litellm"
201
+
202
+ # GPT/O1 모델
203
+ if model_id.startswith("gpt-") or model_id.startswith("o1"):
204
+ return "litellm"
205
+
206
+ # 기본값
207
+ return settings.default_provider
208
+
209
    @classmethod
    async def _single_turn(
        cls,
        session_id: str,
        input: PromptInput,
        agent: AgentInfo,
        is_continuation: bool = False,
        user_id: Optional[str] = None
    ) -> AsyncIterator[StreamChunk]:
        """Run one provider turn: stream the model's output, persist parts,
        execute tool calls inline, and forward every chunk to the caller.

        Ordering matters throughout: tool_call chunks are yielded BEFORE the
        tool executes so the frontend can render interactive UIs (e.g. the
        `question` tool) while execution blocks.
        """
        session = await Session.get(session_id, user_id)

        model_id = input.model_id or session.model_id or settings.default_model

        # Infer provider from model_id when not explicitly specified.
        if input.provider_id:
            provider_id = input.provider_id
        elif session.provider_id:
            provider_id = session.provider_id
        else:
            provider_id = cls._infer_provider_from_model(model_id)

        print(f"[Prompt DEBUG] input.provider_id={input.provider_id}, session.provider_id={session.provider_id}", flush=True)
        print(f"[Prompt DEBUG] Final provider_id={provider_id}, model_id={model_id}", flush=True)

        provider = get_provider(provider_id)
        print(f"[Prompt DEBUG] Got provider: {provider}", flush=True)
        if not provider:
            yield StreamChunk(type="error", error=f"Provider not found: {provider_id}")
            return

        # Only create user message if there's content (not a continuation)
        if input.content and not is_continuation:
            user_msg = await Message.create_user(session_id, input.content, user_id)

        assistant_msg = await Message.create_assistant(session_id, provider_id, model_id, user_id)

        # Build message history (exclude the just-created empty assistant message).
        history = await Message.list(session_id, user_id=user_id)
        messages = cls._build_messages(history[:-1], include_tool_results=True)

        # Build system prompt with provider-specific optimization
        system_prompt = cls._build_system_prompt(agent, provider_id, input.system)

        # Get tools schema
        tools_schema = get_tools_schema() if input.tools_enabled else None

        # Accumulators: text is streamed into one part, updated in place.
        current_text_part: Optional[MessagePart] = None
        accumulated_text = ""

        # Reasoning (thinking) is persisted as its own part as well.
        current_reasoning_part: Optional[MessagePart] = None
        accumulated_reasoning = ""

        try:
            async for chunk in provider.stream(
                model_id=model_id,
                messages=messages,
                tools=tools_schema,
                system=system_prompt,
                temperature=input.temperature or agent.temperature,
                max_tokens=input.max_tokens or agent.max_tokens,
            ):
                if chunk.type == "text":
                    accumulated_text += chunk.text or ""

                    # First text chunk creates the part; subsequent chunks
                    # rewrite its full content (simpler than delta updates).
                    if current_text_part is None:
                        current_text_part = await Message.add_part(
                            assistant_msg.id,
                            session_id,
                            MessagePart(
                                id="",
                                session_id=session_id,
                                message_id=assistant_msg.id,
                                type="text",
                                content=accumulated_text
                            ),
                            user_id
                        )
                    else:
                        await Message.update_part(
                            session_id,
                            assistant_msg.id,
                            current_text_part.id,
                            {"content": accumulated_text},
                            user_id
                        )

                    yield chunk

                elif chunk.type == "tool_call":
                    tc = chunk.tool_call
                    if tc:
                        # Check permission against the agent's tool policy.
                        permission = is_tool_allowed(agent, tc.name)
                        if permission == "deny":
                            yield StreamChunk(
                                type="tool_result",
                                text=f"Error: Tool '{tc.name}' is not allowed for this agent"
                            )
                            continue

                        tool_part = await Message.add_part(
                            assistant_msg.id,
                            session_id,
                            MessagePart(
                                id="",
                                session_id=session_id,
                                message_id=assistant_msg.id,
                                type="tool_call",
                                tool_call_id=tc.id,
                                tool_name=tc.name,
                                tool_args=tc.arguments,
                                tool_status="running"  # executing
                            ),
                            user_id
                        )

                        # IMPORTANT: Yield tool_call FIRST so frontend can show UI
                        # This is critical for interactive tools like 'question'
                        yield chunk

                        # Publish "tool execution started" event.
                        await Bus.publish(TOOL_STATE_CHANGED, ToolStatePayload(
                            session_id=session_id,
                            message_id=assistant_msg.id,
                            part_id=tool_part.id,
                            tool_name=tc.name,
                            status="running"
                        ))

                        # Execute tool (may block for user input, e.g., question tool)
                        tool_result, tool_status = await cls._execute_tool(
                            session_id,
                            assistant_msg.id,
                            tc.id,
                            tc.name,
                            tc.arguments,
                            user_id
                        )

                        # Update the tool_call part's status to completed/error.
                        await Message.update_part(
                            session_id,
                            assistant_msg.id,
                            tool_part.id,
                            {"tool_status": tool_status},
                            user_id
                        )

                        # Publish "tool finished" event.
                        await Bus.publish(TOOL_STATE_CHANGED, ToolStatePayload(
                            session_id=session_id,
                            message_id=assistant_msg.id,
                            part_id=tool_part.id,
                            tool_name=tc.name,
                            status=tool_status
                        ))

                        yield StreamChunk(
                            type="tool_result",
                            text=tool_result
                        )
                    else:
                        yield chunk

                elif chunk.type == "reasoning":
                    # Persist reasoning too (previously it was only yielded).
                    accumulated_reasoning += chunk.text or ""

                    if current_reasoning_part is None:
                        current_reasoning_part = await Message.add_part(
                            assistant_msg.id,
                            session_id,
                            MessagePart(
                                id="",
                                session_id=session_id,
                                message_id=assistant_msg.id,
                                type="reasoning",
                                content=accumulated_reasoning
                            ),
                            user_id
                        )
                    else:
                        await Message.update_part(
                            session_id,
                            assistant_msg.id,
                            current_reasoning_part.id,
                            {"content": accumulated_reasoning},
                            user_id
                        )

                    yield chunk

                elif chunk.type == "done":
                    if chunk.usage:
                        await Message.set_usage(session_id, assistant_msg.id, chunk.usage, user_id)
                    yield chunk

                elif chunk.type == "error":
                    await Message.set_error(session_id, assistant_msg.id, chunk.error or "Unknown error", user_id)
                    yield chunk

            # Bump the session's updated-at timestamp after a successful turn.
            await Session.touch(session_id)

        except Exception as e:
            # Record the failure on the assistant message and surface it as a chunk.
            error_msg = str(e)
            await Message.set_error(session_id, assistant_msg.id, error_msg, user_id)
            yield StreamChunk(type="error", error=error_msg)
417
+
418
+ @classmethod
419
+ def _detect_fake_tool_call(cls, text: str) -> Optional[Dict[str, Any]]:
420
+ """
421
+ Detect if the model wrote a fake tool call as text instead of using actual tool calling.
422
+ Returns parsed tool call info if detected, None otherwise.
423
+
424
+ Patterns detected:
425
+ - [Called tool: toolname({...})]
426
+ - [Called tool: toolname({'key': 'value'})]
427
+ """
428
+ if not text:
429
+ return None
430
+
431
+ match = FAKE_TOOL_CALL_PATTERN.search(text)
432
+ if match:
433
+ tool_name = match.group(1)
434
+ args_str = match.group(2).strip()
435
+
436
+ # Try to parse arguments
437
+ args = {}
438
+ if args_str:
439
+ try:
440
+ # Handle both JSON and Python dict formats
441
+ args_str = args_str.replace("'", '"') # Convert Python dict to JSON
442
+ args = json.loads(args_str)
443
+ except json.JSONDecodeError:
444
+ # Try to extract key-value pairs manually
445
+ # Pattern: 'key': 'value' or "key": "value"
446
+ kv_pattern = re.compile(r'["\']?(\w+)["\']?\s*:\s*["\']([^"\']+)["\']')
447
+ for kv_match in kv_pattern.finditer(args_str):
448
+ args[kv_match.group(1)] = kv_match.group(2)
449
+
450
+ return {
451
+ "name": tool_name,
452
+ "arguments": args
453
+ }
454
+
455
+ return None
456
+
457
+ @classmethod
458
+ def _build_system_prompt(
459
+ cls,
460
+ agent: AgentInfo,
461
+ provider_id: str,
462
+ custom_system: Optional[str] = None
463
+ ) -> Optional[str]:
464
+ """Build the complete system prompt.
465
+
466
+ Args:
467
+ agent: The agent configuration
468
+ provider_id: The provider identifier for selecting optimized prompt
469
+ custom_system: Optional custom system prompt to append
470
+
471
+ Returns:
472
+ The complete system prompt, or None if empty
473
+ """
474
+ parts = []
475
+
476
+ # Add provider-specific system prompt (optimized for Claude/Gemini/etc.)
477
+ provider_prompt = get_prompt_for_provider(provider_id)
478
+ if provider_prompt:
479
+ parts.append(provider_prompt)
480
+
481
+ # Add agent-specific prompt (if defined and different from provider prompt)
482
+ agent_prompt = get_system_prompt(agent)
483
+ if agent_prompt and agent_prompt != provider_prompt:
484
+ parts.append(agent_prompt)
485
+
486
+ # Add custom system prompt
487
+ if custom_system:
488
+ parts.append(custom_system)
489
+
490
+ return "\n\n".join(parts) if parts else None
491
+
492
+ @classmethod
493
+ def _build_messages(
494
+ cls,
495
+ history: List,
496
+ include_tool_results: bool = True
497
+ ) -> List[ProviderMessage]:
498
+ """Build message list for LLM including tool calls and results.
499
+
500
+ Proper tool calling flow:
501
+ 1. User message
502
+ 2. Assistant message (may include tool calls)
503
+ 3. Tool results (as user message with tool context)
504
+ 4. Assistant continues
505
+ """
506
+ messages = []
507
+
508
+ for msg in history:
509
+ if msg.role == "user":
510
+ # Skip empty user messages (continuations)
511
+ if msg.content:
512
+ messages.append(ProviderMessage(role="user", content=msg.content))
513
+
514
+ elif msg.role == "assistant":
515
+ # Collect all parts
516
+ text_parts = []
517
+ tool_calls = []
518
+ tool_results = []
519
+
520
+ for part in getattr(msg, "parts", []):
521
+ if part.type == "text" and part.content:
522
+ text_parts.append(part.content)
523
+ elif part.type == "tool_call" and include_tool_results:
524
+ tool_calls.append({
525
+ "id": part.tool_call_id,
526
+ "name": part.tool_name,
527
+ "arguments": part.tool_args or {}
528
+ })
529
+ elif part.type == "tool_result" and include_tool_results:
530
+ tool_results.append({
531
+ "tool_call_id": part.tool_call_id,
532
+ "output": part.tool_output or ""
533
+ })
534
+
535
+ # Build assistant content - only text, NO tool call summaries
536
+ # IMPORTANT: Do NOT include "[Called tool: ...]" patterns as this causes
537
+ # models like Gemini to mimic the pattern instead of using actual tool calls
538
+ assistant_content_parts = []
539
+
540
+ if text_parts:
541
+ assistant_content_parts.append("".join(text_parts))
542
+
543
+ if assistant_content_parts:
544
+ messages.append(ProviderMessage(
545
+ role="assistant",
546
+ content="\n".join(assistant_content_parts)
547
+ ))
548
+
549
+ # Add tool results as user message (simulating tool response)
550
+ if tool_results:
551
+ result_content = []
552
+ for result in tool_results:
553
+ result_content.append(f"Tool result:\n{result['output']}")
554
+ messages.append(ProviderMessage(
555
+ role="user",
556
+ content="\n\n".join(result_content)
557
+ ))
558
+
559
+ return messages
560
+
561
+ @classmethod
562
+ async def _execute_tool(
563
+ cls,
564
+ session_id: str,
565
+ message_id: str,
566
+ tool_call_id: str,
567
+ tool_name: str,
568
+ tool_args: Dict[str, Any],
569
+ user_id: Optional[str] = None
570
+ ) -> tuple[str, str]:
571
+ """Execute a tool and store the result. Returns (output, status)."""
572
+ # SessionProcessor를 통한 doom loop 감지
573
+ # tool_args도 전달하여 같은 도구 + 같은 인자일 때만 doom loop으로 판단
574
+ processor = SessionProcessor.get_or_create(session_id)
575
+ is_doom_loop = processor.record_tool_call(tool_name, tool_args)
576
+
577
+ if is_doom_loop:
578
+ error_output = f"Error: Doom loop detected - tool '{tool_name}' called repeatedly"
579
+ await Message.add_part(
580
+ message_id,
581
+ session_id,
582
+ MessagePart(
583
+ id="",
584
+ session_id=session_id,
585
+ message_id=message_id,
586
+ type="tool_result",
587
+ tool_call_id=tool_call_id,
588
+ tool_output=error_output
589
+ ),
590
+ user_id
591
+ )
592
+ return error_output, "error"
593
+
594
+ # Registry에서 도구 가져오기
595
+ registry = get_registry()
596
+ tool = registry.get(tool_name)
597
+
598
+ if not tool:
599
+ error_output = f"Error: Tool '{tool_name}' not found"
600
+ await Message.add_part(
601
+ message_id,
602
+ session_id,
603
+ MessagePart(
604
+ id="",
605
+ session_id=session_id,
606
+ message_id=message_id,
607
+ type="tool_result",
608
+ tool_call_id=tool_call_id,
609
+ tool_output=error_output
610
+ ),
611
+ user_id
612
+ )
613
+ return error_output, "error"
614
+
615
+ ctx = ToolContext(
616
+ session_id=session_id,
617
+ message_id=message_id,
618
+ tool_call_id=tool_call_id,
619
+ )
620
+
621
+ try:
622
+ result = await tool.execute(tool_args, ctx)
623
+
624
+ # 출력 길이 제한 적용
625
+ truncated_output = tool.truncate_output(result.output)
626
+ output = f"[{result.title}]\n{truncated_output}"
627
+ status = "completed"
628
+ except Exception as e:
629
+ output = f"Error executing tool: {str(e)}"
630
+ status = "error"
631
+
632
+ await Message.add_part(
633
+ message_id,
634
+ session_id,
635
+ MessagePart(
636
+ id="",
637
+ session_id=session_id,
638
+ message_id=message_id,
639
+ type="tool_result",
640
+ tool_call_id=tool_call_id,
641
+ tool_output=output
642
+ ),
643
+ user_id
644
+ )
645
+
646
+ return output, status
647
+
648
+ @classmethod
649
+ def cancel(cls, session_id: str) -> bool:
650
+ """Cancel an active session."""
651
+ cancelled = False
652
+
653
+ if session_id in cls._active_sessions:
654
+ cls._active_sessions[session_id].cancel()
655
+ del cls._active_sessions[session_id]
656
+ cancelled = True
657
+
658
+ if session_id in cls._loop_states:
659
+ cls._loop_states[session_id].paused = True
660
+ cls._loop_states[session_id].pause_reason = "cancelled"
661
+ del cls._loop_states[session_id]
662
+ cancelled = True
663
+
664
+ return cancelled
665
+
666
+ @classmethod
667
+ def get_loop_state(cls, session_id: str) -> Optional[LoopState]:
668
+ """Get the current loop state for a session."""
669
+ return cls._loop_states.get(session_id)
670
+
671
+ @classmethod
672
+ async def resume(cls, session_id: str) -> AsyncIterator[StreamChunk]:
673
+ state = cls._loop_states.get(session_id)
674
+ if not state or not state.paused:
675
+ yield StreamChunk(type="error", error="No paused loop to resume")
676
+ return
677
+
678
+ state.paused = False
679
+ state.pause_reason = None
680
+
681
+ session = await Session.get(session_id)
682
+ agent_id = session.agent_id or "build"
683
+ agent = get_agent(agent_id) or default_agent()
684
+
685
+ continue_input = PromptInput(content="")
686
+
687
+ while state.stop_reason == "tool_calls" and not state.paused and state.step < state.max_steps:
688
+ state.step += 1
689
+
690
+ yield StreamChunk(type="text", text=f"\n[Resuming... step {state.step}/{state.max_steps}]\n")
691
+
692
+ async for chunk in cls._single_turn(session_id, continue_input, agent, is_continuation=True):
693
+ yield chunk
694
+
695
+ if chunk.type == "tool_call" and chunk.tool_call:
696
+ if chunk.tool_call.name == "question" and agent.pause_on_question:
697
+ state.paused = True
698
+ state.pause_reason = "question"
699
+
700
+ elif chunk.type == "done":
701
+ state.stop_reason = chunk.stop_reason
src/opencode_api/session/session.py ADDED
@@ -0,0 +1,159 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from typing import Optional, List, Dict, Any
2
+ from pydantic import BaseModel
3
+ from datetime import datetime
4
+
5
+ from ..core.storage import Storage, NotFoundError
6
+ from ..core.bus import Bus, SESSION_CREATED, SESSION_UPDATED, SESSION_DELETED, SessionPayload
7
+ from ..core.identifier import Identifier
8
+ from ..core.supabase import get_client, is_enabled as supabase_enabled
9
+
10
+
11
class SessionInfo(BaseModel):
    """A chat session record (mirrors the opencode_sessions table)."""
    id: str                            # generated via Identifier.generate("session")
    user_id: Optional[str] = None      # owner; None when local Storage fallback is used
    title: str
    created_at: datetime
    updated_at: datetime
    provider_id: Optional[str] = None  # LLM provider chosen for this session
    model_id: Optional[str] = None     # model within that provider
    agent_id: Optional[str] = None     # agent profile; defaults to "build" on create
20
+
21
+
22
class SessionCreate(BaseModel):
    """Creation payload for a session; every field is optional."""
    title: Optional[str] = None        # defaults to "Session <timestamp>" when omitted
    provider_id: Optional[str] = None
    model_id: Optional[str] = None
    agent_id: Optional[str] = None     # defaults to "build" when omitted
27
+
28
+
29
class Session:
    """Session CRUD backed by Supabase (when enabled and a user_id is given)
    with a local Storage fallback."""

    @staticmethod
    def _row_to_info(row: Dict[str, Any]) -> SessionInfo:
        """Map a Supabase opencode_sessions row to a SessionInfo."""
        return SessionInfo(
            id=row["id"],
            user_id=row["user_id"],
            title=row["title"],
            created_at=row["created_at"],
            updated_at=row["updated_at"],
            provider_id=row.get("provider_id"),
            model_id=row.get("model_id"),
            agent_id=row.get("agent_id"),
        )

    @staticmethod
    async def create(data: Optional[SessionCreate] = None, user_id: Optional[str] = None) -> SessionInfo:
        """Create a session and publish SESSION_CREATED."""
        session_id = Identifier.generate("session")
        now = datetime.utcnow()

        info = SessionInfo(
            id=session_id,
            user_id=user_id,
            title=data.title if data and data.title else f"Session {now.isoformat()}",
            created_at=now,
            updated_at=now,
            provider_id=data.provider_id if data else None,
            model_id=data.model_id if data else None,
            agent_id=data.agent_id if data else "build",
        )

        if supabase_enabled() and user_id:
            # created_at/updated_at are left to the table defaults.
            client = get_client()
            client.table("opencode_sessions").insert({
                "id": session_id,
                "user_id": user_id,
                "title": info.title,
                "agent_id": info.agent_id,
                "provider_id": info.provider_id,
                "model_id": info.model_id,
            }).execute()
        else:
            await Storage.write(["session", session_id], info)

        await Bus.publish(SESSION_CREATED, SessionPayload(id=session_id, title=info.title))
        return info

    @staticmethod
    async def get(session_id: str, user_id: Optional[str] = None) -> SessionInfo:
        """Fetch a single session.

        Raises:
            NotFoundError: If the session does not exist (or, in Supabase
                mode, is not owned by user_id).
        """
        if supabase_enabled() and user_id:
            client = get_client()
            result = client.table("opencode_sessions").select("*").eq("id", session_id).eq("user_id", user_id).single().execute()
            if not result.data:
                raise NotFoundError(["session", session_id])
            return Session._row_to_info(result.data)

        data = await Storage.read(["session", session_id])
        if not data:
            raise NotFoundError(["session", session_id])
        return SessionInfo(**data)

    @staticmethod
    async def update(session_id: str, updates: Dict[str, Any], user_id: Optional[str] = None) -> SessionInfo:
        """Apply field updates; always bumps updated_at."""
        updates["updated_at"] = datetime.utcnow().isoformat()

        if supabase_enabled() and user_id:
            client = get_client()
            result = client.table("opencode_sessions").update(updates).eq("id", session_id).eq("user_id", user_id).execute()
            if not result.data:
                raise NotFoundError(["session", session_id])
            return await Session.get(session_id, user_id)

        def updater(data: Dict[str, Any]):
            data.update(updates)

        data = await Storage.update(["session", session_id], updater)
        info = SessionInfo(**data)
        await Bus.publish(SESSION_UPDATED, SessionPayload(id=session_id, title=info.title))
        return info

    @staticmethod
    async def delete(session_id: str, user_id: Optional[str] = None) -> bool:
        """Delete a session; the local path also removes its stored messages."""
        if supabase_enabled() and user_id:
            # NOTE(review): message rows are presumably removed via a DB
            # cascade in Supabase — confirm against the SQL schema.
            client = get_client()
            client.table("opencode_sessions").delete().eq("id", session_id).eq("user_id", user_id).execute()
            await Bus.publish(SESSION_DELETED, SessionPayload(id=session_id, title=""))
            return True

        info = await Session.get(session_id)
        message_keys = await Storage.list(["message", session_id])
        for key in message_keys:
            await Storage.remove(key)

        await Storage.remove(["session", session_id])
        await Bus.publish(SESSION_DELETED, SessionPayload(id=session_id, title=info.title))
        return True

    @staticmethod
    async def list(limit: Optional[int] = None, user_id: Optional[str] = None) -> List[SessionInfo]:
        """List sessions, most recently updated first."""
        if supabase_enabled() and user_id:
            client = get_client()
            query = client.table("opencode_sessions").select("*").eq("user_id", user_id).order("updated_at", desc=True)
            if limit:
                query = query.limit(limit)
            result = query.execute()
            return [Session._row_to_info(row) for row in result.data]

        # Local storage: read everything, THEN sort and slice. The previous
        # implementation applied the limit while reading (before sorting),
        # which returned an arbitrary subset of sessions instead of the most
        # recently updated ones.
        sessions = []
        for key in await Storage.list(["session"]):
            data = await Storage.read(key)
            if data:
                sessions.append(SessionInfo(**data))

        sessions.sort(key=lambda s: s.updated_at, reverse=True)
        if limit:
            sessions = sessions[:limit]
        return sessions

    @staticmethod
    async def touch(session_id: str, user_id: Optional[str] = None) -> None:
        """Bump updated_at without changing any other field."""
        await Session.update(session_id, {}, user_id)
src/opencode_api/tool/__init__.py ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from .tool import Tool, ToolContext, ToolResult, register_tool, get_tool, list_tools, get_tools_schema
2
+ from .registry import ToolRegistry, get_registry
3
+ from .websearch import WebSearchTool
4
+ from .webfetch import WebFetchTool
5
+ from .todo import TodoTool
6
+ from .question import (
7
+ QuestionTool,
8
+ QuestionInfo,
9
+ QuestionOption,
10
+ QuestionRequest,
11
+ QuestionReply,
12
+ ask_questions,
13
+ reply_to_question,
14
+ reject_question,
15
+ get_pending_questions,
16
+ )
17
+ from .skill import SkillTool, SkillInfo, register_skill, get_skill, list_skills
18
+
19
+ __all__ = [
20
+ "Tool", "ToolContext", "ToolResult",
21
+ "register_tool", "get_tool", "list_tools", "get_tools_schema",
22
+ "ToolRegistry", "get_registry",
23
+ "WebSearchTool", "WebFetchTool", "TodoTool",
24
+ "QuestionTool", "QuestionInfo", "QuestionOption", "QuestionRequest", "QuestionReply",
25
+ "ask_questions", "reply_to_question", "reject_question", "get_pending_questions",
26
+ "SkillTool", "SkillInfo", "register_skill", "get_skill", "list_skills",
27
+ ]
src/opencode_api/tool/question.py ADDED
@@ -0,0 +1,308 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """Question tool - allows agent to ask user questions during execution."""
2
+ from typing import Dict, Any, List, Optional
3
+ from pydantic import BaseModel, Field
4
+ import asyncio
5
+ import logging
6
+
7
+ from .tool import BaseTool, ToolResult, ToolContext
8
+ from ..core.identifier import generate_id
9
+ from ..core.bus import Bus
10
+
11
+ logger = logging.getLogger(__name__)
12
+
13
+
14
+ # Question schemas
15
+ class QuestionOption(BaseModel):
16
+ """A single option for a question."""
17
+ label: str = Field(..., description="Display text (1-5 words, concise)")
18
+ description: str = Field(..., description="Explanation of choice")
19
+
20
+
21
+ class QuestionInfo(BaseModel):
22
+ """A question to ask the user."""
23
+ question: str = Field(..., description="Complete question")
24
+ header: str = Field(..., description="Very short label (max 30 chars)")
25
+ options: List[QuestionOption] = Field(default_factory=list, description="Available choices")
26
+ multiple: bool = Field(default=False, description="Allow selecting multiple choices")
27
+ custom: bool = Field(default=True, description="Allow typing a custom answer")
28
+
29
+
30
+ class QuestionRequest(BaseModel):
31
+ """A request containing questions for the user."""
32
+ id: str
33
+ session_id: str
34
+ questions: List[QuestionInfo]
35
+ tool_call_id: Optional[str] = None
36
+ message_id: Optional[str] = None
37
+
38
+
39
+ class QuestionReply(BaseModel):
40
+ """User's reply to questions."""
41
+ request_id: str
42
+ answers: List[List[str]] = Field(..., description="Answers in order (each is array of selected labels)")
43
+
44
+
45
+ # Events
46
+ QUESTION_ASKED = "question.asked"
47
+ QUESTION_REPLIED = "question.replied"
48
+ QUESTION_REJECTED = "question.rejected"
49
+
50
+
51
+ # Pending questions state
52
+ _pending_questions: Dict[str, asyncio.Future] = {}
53
+
54
+
55
async def ask_questions(
    session_id: str,
    questions: List[QuestionInfo],
    tool_call_id: Optional[str] = None,
    message_id: Optional[str] = None,
    timeout: float = 300.0,  # 5 minutes default timeout
) -> List[List[str]]:
    """Publish questions to the frontend and block until the user replies.

    Args:
        session_id: Session the questions belong to.
        questions: Questions to present.
        tool_call_id: When given, reused as the request id so the frontend
            can correlate the request with its tool call directly.
        message_id: Message the questions are attached to.
        timeout: Seconds to wait for an answer.

    Returns:
        One list of selected labels per question, in order.

    Raises:
        TimeoutError: If no reply arrives within `timeout` seconds.
        QuestionRejectedError: If the user dismisses the questions
            (delivered through the future by reject_question).
    """
    request_id = tool_call_id or generate_id("question")

    request = QuestionRequest(
        id=request_id,
        session_id=session_id,
        questions=questions,
        tool_call_id=tool_call_id,
        message_id=message_id,
    )

    # Create the future on the RUNNING loop. get_event_loop() can return the
    # wrong loop under FastAPI, so get_running_loop() is required here.
    loop = asyncio.get_running_loop()
    future: asyncio.Future[List[List[str]]] = loop.create_future()
    _pending_questions[request_id] = future

    # Publish the question event (delivered to the client via SSE).
    await Bus.publish(QUESTION_ASKED, request.model_dump())

    try:
        logger.info(f"[question] Waiting for answer to request_id={request_id}, timeout={timeout}s")
        answers = await asyncio.wait_for(future, timeout=timeout)
        logger.info(f"[question] Received answer for request_id={request_id}: {answers}")
        return answers
    except asyncio.TimeoutError:
        logger.error(f"[question] Timeout for request_id={request_id} after {timeout}s")
        # Cleanup is handled once, in the finally block (the old code also
        # deleted the entry here, redundantly).
        raise TimeoutError(f"Question timed out after {timeout} seconds")
    except Exception as e:
        logger.error(f"[question] Error waiting for answer: {type(e).__name__}: {e}")
        raise
    finally:
        _pending_questions.pop(request_id, None)
99
+
100
+
101
async def reply_to_question(request_id: str, answers: List[List[str]]) -> bool:
    """Deliver the user's answers to a pending question request.

    Returns:
        True when the request id was pending (even if its future had already
        been resolved), False when the id is unknown.
    """
    logger.info(f"[question] reply_to_question called: request_id={request_id}, answers={answers}")
    logger.info(f"[question] pending_questions keys: {list(_pending_questions.keys())}")

    future = _pending_questions.get(request_id)
    if future is None:
        logger.error(f"[question] request_id={request_id} NOT FOUND in pending_questions!")
        return False

    if future.done():
        logger.warning(f"[question] Future already done for request_id={request_id}")
    else:
        logger.info(f"[question] Setting result for request_id={request_id}")
        future.set_result(answers)

    return True
118
+
119
+
120
async def reject_question(request_id: str) -> bool:
    """Dismiss a pending question; the waiting coroutine receives
    QuestionRejectedError through its future.

    Returns:
        True when the request id was pending, False otherwise.
    """
    future = _pending_questions.get(request_id)
    if future is None:
        return False

    if not future.done():
        future.set_exception(QuestionRejectedError())

    return True
130
+
131
+
132
def get_pending_questions(session_id: Optional[str] = None) -> List[str]:
    """Get list of pending question request IDs.

    NOTE(review): the session_id parameter is currently ignored — ALL pending
    request ids are returned regardless of session, because the pending map
    does not record session ownership. Confirm whether callers expect
    per-session filtering.
    """
    return list(_pending_questions.keys())
135
+
136
+
137
class QuestionRejectedError(Exception):
    """Raised when the user dismisses a question without answering."""

    def __init__(self) -> None:
        super().__init__("The user dismissed this question")
141
+
142
+
143
+ QUESTION_DESCRIPTION = """Use this tool when you need to ask the user questions during execution. This allows you to:
144
+ 1. Gather user preferences or requirements
145
+ 2. Clarify ambiguous instructions
146
+ 3. Get decisions on implementation choices as you work
147
+ 4. Offer choices to the user about what direction to take.
148
+
149
+ IMPORTANT: You MUST provide at least 2 options for each question. Never ask open-ended questions without choices.
150
+
151
+ Usage notes:
152
+ - REQUIRED: Every question MUST have at least 2 options (minItems: 2)
153
+ - When `custom` is enabled (default), a "Type your own answer" option is added automatically; don't include "Other" or catch-all options
154
+ - Answers are returned as arrays of labels; set `multiple: true` to allow selecting more than one
155
+ - If you recommend a specific option, make that the first option in the list and add "(Recommended)" at the end of the label
156
+ """
157
+
158
+
159
class QuestionTool(BaseTool):
    """Tool for asking the user questions during execution.

    execute() blocks (via ask_questions) until the user answers, dismisses
    the questions, or the request times out.
    """

    @property
    def id(self) -> str:
        return "question"

    @property
    def description(self) -> str:
        return QUESTION_DESCRIPTION

    @property
    def parameters(self) -> Dict[str, Any]:
        # NOTE: the schema now declares "custom" — execute() has always read
        # it (q.get("custom", True)) and the tool description documents it,
        # but it was previously missing here so models could never set it.
        return {
            "type": "object",
            "properties": {
                "questions": {
                    "type": "array",
                    "description": "Questions to ask",
                    "items": {
                        "type": "object",
                        "properties": {
                            "question": {
                                "type": "string",
                                "description": "Complete question"
                            },
                            "header": {
                                "type": "string",
                                "description": "Very short label (max 30 chars)"
                            },
                            "options": {
                                "type": "array",
                                "description": "Available choices (MUST provide at least 2 options)",
                                "minItems": 2,
                                "items": {
                                    "type": "object",
                                    "properties": {
                                        "label": {
                                            "type": "string",
                                            "description": "Display text (1-5 words, concise)"
                                        },
                                        "description": {
                                            "type": "string",
                                            "description": "Explanation of choice"
                                        }
                                    },
                                    "required": ["label", "description"]
                                }
                            },
                            "multiple": {
                                "type": "boolean",
                                "description": "Allow selecting multiple choices",
                                "default": False
                            },
                            "custom": {
                                "type": "boolean",
                                "description": "Allow typing a custom answer",
                                "default": True
                            }
                        },
                        "required": ["question", "header", "options"]
                    }
                }
            },
            "required": ["questions"]
        }

    async def execute(self, args: Dict[str, Any], ctx: ToolContext) -> ToolResult:
        """Ask the provided questions and wait for the user's answers.

        Args:
            args: Tool arguments; expects a "questions" list matching
                `parameters`.
            ctx: Execution context carrying session/message/tool-call ids.

        Returns:
            A ToolResult summarizing the answers, or describing a dismissal
            or timeout.
        """
        logger.info(f"[question] execute called with args: {args}")

        questions_data = args.get("questions", [])
        if not questions_data:
            return ToolResult(
                title="No questions",
                output="No questions were provided.",
                metadata={}
            )

        # Parse defensively: some models produce malformed nesting, so skip
        # entries/options that are not dicts instead of crashing on them.
        questions = []
        try:
            for idx, q in enumerate(questions_data):
                if isinstance(q, str):
                    logger.error(f"[question] Question {idx} is a string, not a dict!")
                    continue

                options = []
                for opt_idx, opt in enumerate(q.get("options", [])):
                    if isinstance(opt, dict):
                        options.append(QuestionOption(label=opt["label"], description=opt["description"]))
                    else:
                        logger.error(f"[question] Option {opt_idx} is not a dict: {type(opt)}")

                questions.append(QuestionInfo(
                    question=q["question"],
                    header=q["header"],
                    options=options,
                    multiple=q.get("multiple", False),
                    custom=q.get("custom", True),
                ))
        except Exception as e:
            logger.error(f"[question] Error parsing questions: {type(e).__name__}: {e}")
            import traceback
            logger.error(f"[question] Traceback: {traceback.format_exc()}")
            raise

        try:
            # Blocks until the user replies (or timeout / dismissal).
            answers = await ask_questions(
                session_id=ctx.session_id,
                questions=questions,
                tool_call_id=ctx.tool_call_id,
                message_id=ctx.message_id,
            )

            def format_answer(answer: List[str]) -> str:
                if not answer:
                    return "Unanswered"
                return ", ".join(answer)

            formatted = ", ".join(
                f'"{q.question}"="{format_answer(answers[i] if i < len(answers) else [])}"'
                for i, q in enumerate(questions)
            )

            return ToolResult(
                title=f"Asked {len(questions)} question{'s' if len(questions) > 1 else ''}",
                output=f"User has answered your questions: {formatted}. You can now continue with the user's answers in mind.",
                metadata={"answers": answers}
            )

        except QuestionRejectedError:
            return ToolResult(
                title="Questions dismissed",
                output="The user dismissed the questions without answering.",
                metadata={"rejected": True}
            )
        except TimeoutError as e:
            return ToolResult(
                title="Questions timed out",
                output=str(e),
                metadata={"timeout": True}
            )
src/opencode_api/tool/registry.py ADDED
@@ -0,0 +1,48 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from typing import Dict, Any, List, Optional
2
+ from .tool import BaseTool
3
+ import os
4
+ import importlib.util
5
+
6
+
7
class ToolRegistry:
    """Tool registry — registers and manages the available tools."""

    def __init__(self):
        self._tools: Dict[str, BaseTool] = {}

    def register(self, tool: BaseTool) -> None:
        """Register a tool under its id (replaces any existing entry)."""
        self._tools[tool.id] = tool

    def get(self, tool_id: str) -> Optional[BaseTool]:
        """Look up a tool by id; None if unknown."""
        return self._tools.get(tool_id)

    def list(self) -> List[BaseTool]:
        """Return every registered tool."""
        return [tool for tool in self._tools.values()]

    def get_schema(self) -> List[Dict[str, Any]]:
        """Return the schema of every registered tool."""
        return [tool.get_schema() for tool in self._tools.values()]

    def load_from_directory(self, path: str) -> None:
        """Dynamically load tools from a directory.

        Placeholder for a future plugin system: scan .py files and
        auto-register any BaseTool subclasses found.
        """
        if not os.path.exists(path):
            raise ValueError(f"Directory not found: {path}")

        # Not implemented yet.
        pass
40
+
41
+
42
# Global singleton instance
_registry = ToolRegistry()


def get_registry() -> ToolRegistry:
    """Return the global ToolRegistry singleton."""
    return _registry
src/opencode_api/tool/skill.py ADDED
@@ -0,0 +1,369 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """Skill tool - loads detailed instructions for specific tasks."""
2
+ from typing import Dict, Any, List, Optional
3
+ from pydantic import BaseModel, Field
4
+
5
+ from .tool import BaseTool, ToolResult, ToolContext
6
+
7
+
8
class SkillInfo(BaseModel):
    """Information about a skill."""
    name: str  # Unique identifier used to look the skill up.
    description: str  # Short summary embedded in the tool description.
    content: str  # Full instructions returned when the skill is loaded.
13
+
14
+
15
# Module-level skill registry (name -> SkillInfo), shared by every SkillTool.
_skills: Dict[str, SkillInfo] = {}


def register_skill(skill: SkillInfo) -> None:
    """Store *skill* in the registry under its name (overwrites on conflict)."""
    _skills[skill.name] = skill


def get_skill(name: str) -> Optional[SkillInfo]:
    """Look up a registered skill by name; returns None when unknown."""
    return _skills.get(name)


def list_skills() -> List[SkillInfo]:
    """Return every registered skill as a list."""
    return [*_skills.values()]
32
+
33
+
34
# Built-in default skills; SkillTool registers all of these on construction.
DEFAULT_SKILLS = [
    SkillInfo(
        name="web-research",
        description="Comprehensive web research methodology for gathering information from multiple sources",
        content="""# Web Research Skill

## Purpose
Guide for conducting thorough web research to answer questions or gather information.

## Methodology

### 1. Query Formulation
- Break down complex questions into specific search queries
- Use different phrasings to get diverse results
- Include domain-specific terms when relevant

### 2. Source Evaluation
- Prioritize authoritative sources (official docs, reputable publications)
- Cross-reference information across multiple sources
- Note publication dates for time-sensitive information

### 3. Information Synthesis
- Compile findings from multiple sources
- Identify consensus vs. conflicting information
- Summarize key points clearly

### 4. Citation
- Always provide source URLs
- Note when information might be outdated

## Tools to Use
- `websearch`: For finding relevant pages
- `webfetch`: For extracting content from specific URLs

## Best Practices
- Start broad, then narrow down
- Use quotes for exact phrases
- Filter by date when freshness matters
- Verify claims with multiple sources
"""
    ),
    SkillInfo(
        name="code-explanation",
        description="Methodology for explaining code clearly to users of varying skill levels",
        content="""# Code Explanation Skill

## Purpose
Guide for explaining code in a clear, educational manner.

## Approach

### 1. Assess Context
- Determine user's apparent skill level
- Identify what aspect they're asking about
- Note any specific confusion points

### 2. Structure Explanation
- Start with high-level overview (what does it do?)
- Break down into logical sections
- Explain each component's purpose

### 3. Use Analogies
- Relate concepts to familiar ideas
- Use real-world metaphors when helpful
- Avoid overly technical jargon initially

### 4. Provide Examples
- Show simple examples first
- Build up to complex cases
- Include edge cases when relevant

### 5. Verify Understanding
- Use the question tool to check comprehension
- Offer to elaborate on specific parts
- Provide additional resources if needed

## Best Practices
- Don't assume prior knowledge
- Explain "why" not just "what"
- Use code comments effectively
- Highlight common pitfalls
"""
    ),
    SkillInfo(
        name="api-integration",
        description="Best practices for integrating with external APIs",
        content="""# API Integration Skill

## Purpose
Guide for properly integrating with external APIs.

## Key Considerations

### 1. Authentication
- Store API keys securely (environment variables)
- Never hardcode credentials
- Handle token refresh if applicable

### 2. Error Handling
- Implement retry logic for transient failures
- Handle rate limiting gracefully
- Log errors with context

### 3. Request Best Practices
- Set appropriate timeouts
- Use connection pooling
- Implement circuit breakers for resilience

### 4. Response Handling
- Validate response schemas
- Handle pagination properly
- Cache responses when appropriate

### 5. Testing
- Mock API responses in tests
- Test error scenarios
- Verify rate limit handling

## Common Patterns

```python
# Example: Robust API call
async def call_api(url, retries=3):
    for attempt in range(retries):
        try:
            response = await httpx.get(url, timeout=30)
            response.raise_for_status()
            return response.json()
        except httpx.HTTPStatusError as e:
            if e.response.status_code == 429:
                await asyncio.sleep(2 ** attempt)
            elif e.response.status_code >= 500:
                await asyncio.sleep(1)
            else:
                raise
    raise Exception("Max retries exceeded")
```
"""
    ),
    SkillInfo(
        name="debugging",
        description="Systematic approach to debugging problems",
        content="""# Debugging Skill

## Purpose
Systematic methodology for identifying and fixing bugs.

## Process

### 1. Reproduce the Issue
- Get exact steps to reproduce
- Note environment details
- Identify when it started happening

### 2. Gather Information
- Check error messages and stack traces
- Review recent changes
- Check logs for anomalies

### 3. Form Hypotheses
- List possible causes
- Rank by likelihood
- Consider recent changes first

### 4. Test Hypotheses
- Start with most likely cause
- Make minimal changes to test
- Verify each hypothesis before moving on

### 5. Implement Fix
- Fix root cause, not symptoms
- Add tests to prevent regression
- Document the fix

### 6. Verify Fix
- Confirm original issue is resolved
- Check for side effects
- Test related functionality

## Debugging Questions
- What changed recently?
- Does it happen consistently?
- What's different when it works?
- What are the exact inputs?

## Tools
- Use print/log statements strategically
- Leverage debuggers when available
- Check version differences
"""
    ),
    SkillInfo(
        name="task-planning",
        description="Breaking down complex tasks into manageable steps",
        content="""# Task Planning Skill

## Purpose
Guide for decomposing complex tasks into actionable steps.

## Methodology

### 1. Understand the Goal
- Clarify the end objective
- Identify success criteria
- Note any constraints

### 2. Identify Components
- Break into major phases
- List dependencies between parts
- Identify parallel vs. sequential work

### 3. Create Action Items
- Make each item specific and actionable
- Estimate effort/complexity
- Assign priorities

### 4. Sequence Work
- Order by dependencies
- Front-load risky items
- Plan for blockers

### 5. Track Progress
- Use todo tool to track items
- Update status as work progresses
- Re-plan when needed

## Best Practices
- Start with end goal in mind
- Keep items small (< 1 hour ideal)
- Include verification steps
- Plan for error cases

## Example Structure
1. Research & understand requirements
2. Design approach
3. Implement core functionality
4. Add error handling
5. Test thoroughly
6. Document changes
"""
    ),
]
277
+
278
+
279
def _get_skill_description(skills: List[SkillInfo]) -> str:
    """Build the skill tool's description text, embedding available skills as XML."""
    if not skills:
        return "Load a skill to get detailed instructions for a specific task. No skills are currently available."

    header = [
        "Load a skill to get detailed instructions for a specific task.",
        "Skills provide specialized knowledge and step-by-step guidance.",
        "Use this when a task matches an available skill's description.",
        "",
        "<available_skills>",
    ]

    entries: List[str] = []
    for item in skills:
        entries += [
            "  <skill>",
            f"    <name>{item.name}</name>",
            f"    <description>{item.description}</description>",
            "  </skill>",
        ]

    return "\n".join(header + entries + ["</available_skills>"])
303
+
304
+
305
class SkillTool(BaseTool):
    """Tool for loading skill instructions from the module-level skill registry."""

    def __init__(self, additional_skills: Optional[List[SkillInfo]] = None):
        """Initialize with optional additional skills.

        Registers the built-in DEFAULT_SKILLS first, then any *additional_skills*
        (a later registration with the same name overwrites an earlier one).
        """
        # Fix: call BaseTool.__init__ so status/time_start/time_end are set.
        super().__init__()

        # Register default skills
        for skill in DEFAULT_SKILLS:
            register_skill(skill)

        # Register additional skills if provided
        if additional_skills:
            for skill in additional_skills:
                register_skill(skill)

    @property
    def id(self) -> str:
        return "skill"

    @property
    def description(self) -> str:
        # Recomputed on each access so skills registered later still show up.
        return _get_skill_description(list_skills())

    @property
    def parameters(self) -> Dict[str, Any]:
        skill_names = [s.name for s in list_skills()]
        examples = ", ".join(f"'{n}'" for n in skill_names[:3])
        hint = f" (e.g., {examples}, ...)" if examples else ""

        name_schema: Dict[str, Any] = {
            "type": "string",
            "description": f"The skill identifier from available_skills{hint}",
        }
        # Fix: only emit "enum" when names exist — '"enum": null' is invalid
        # JSON Schema ("enum" must be a non-empty array when present).
        if skill_names:
            name_schema["enum"] = skill_names

        return {
            "type": "object",
            "properties": {
                "name": name_schema
            },
            "required": ["name"]
        }

    async def execute(self, args: Dict[str, Any], ctx: ToolContext) -> ToolResult:
        """Return the requested skill's full content, or an error result if unknown."""
        skill_name = args.get("name", "")

        skill = get_skill(skill_name)

        if not skill:
            available = ", ".join(s.name for s in list_skills())
            return ToolResult(
                title=f"Skill not found: {skill_name}",
                output=f'Skill "{skill_name}" not found. Available skills: {available or "none"}',
                metadata={"error": True}
            )

        output = f"""## Skill: {skill.name}

**Description**: {skill.description}

{skill.content}
"""

        return ToolResult(
            title=f"Loaded skill: {skill.name}",
            output=output,
            metadata={"name": skill.name}
        )
src/opencode_api/tool/todo.py ADDED
@@ -0,0 +1,128 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from typing import Dict, Any, List, Optional
2
+ from pydantic import BaseModel
3
+ from .tool import BaseTool, ToolContext, ToolResult
4
+ from ..core.storage import Storage
5
+
6
+
7
class TodoItem(BaseModel):
    """A single todo entry tracked per session."""
    id: str  # Caller-supplied identifier for the item
    content: str  # Human-readable task description
    status: str = "pending"  # pending, in_progress, completed, cancelled
    priority: str = "medium"  # high, medium, low
12
+
13
+
14
class TodoTool(BaseTool):
    """Session-scoped todo list persisted via Storage under ["todo", session_id]."""

    @property
    def id(self) -> str:
        return "todo"

    @property
    def description(self) -> str:
        return (
            "Manage a todo list for tracking tasks. Use this to create, update, "
            "and track progress on multi-step tasks. Supports pending, in_progress, "
            "completed, and cancelled statuses."
        )

    @property
    def parameters(self) -> Dict[str, Any]:
        return {
            "type": "object",
            "properties": {
                "action": {
                    "type": "string",
                    "enum": ["read", "write"],
                    "description": "Action to perform: 'read' to get todos, 'write' to update todos"
                },
                "todos": {
                    "type": "array",
                    "description": "List of todos (required for 'write' action)",
                    "items": {
                        "type": "object",
                        "properties": {
                            "id": {"type": "string"},
                            "content": {"type": "string"},
                            "status": {
                                "type": "string",
                                "enum": ["pending", "in_progress", "completed", "cancelled"]
                            },
                            "priority": {
                                "type": "string",
                                "enum": ["high", "medium", "low"]
                            }
                        },
                        "required": ["id", "content", "status", "priority"]
                    }
                }
            },
            "required": ["action"]
        }

    async def execute(self, args: Dict[str, Any], ctx: ToolContext) -> ToolResult:
        """Dispatch to read/write; unknown or missing action yields an error result."""
        # Fix: .get() instead of [] so a missing "action" key flows into the
        # error-result branch below instead of raising an unhandled KeyError.
        action = args.get("action")
        session_id = ctx.session_id

        if action == "read":
            return await self._read_todos(session_id)
        elif action == "write":
            todos_data = args.get("todos", [])
            return await self._write_todos(session_id, todos_data)
        else:
            return ToolResult(
                title="Todo Error",
                output=f"Unknown action: {action}",
                metadata={"error": "invalid_action"}
            )

    async def _read_todos(self, session_id: str) -> ToolResult:
        """Load the session's todos from storage and render them as text."""
        todos = await Storage.read(["todo", session_id])

        if not todos:
            return ToolResult(
                title="Todo List",
                output="No todos found for this session.",
                metadata={"count": 0}
            )

        items = [TodoItem(**t) for t in todos]
        lines = self._format_todos(items)

        return ToolResult(
            title="Todo List",
            output="\n".join(lines),
            metadata={"count": len(items)}
        )

    async def _write_todos(self, session_id: str, todos_data: List[Dict]) -> ToolResult:
        """Validate *todos_data* and persist it, replacing the stored list."""
        items = [TodoItem(**t) for t in todos_data]
        await Storage.write(["todo", session_id], [t.model_dump() for t in items])

        lines = self._format_todos(items)

        return ToolResult(
            title="Todo List Updated",
            output="\n".join(lines),
            metadata={"count": len(items)}
        )

    def _format_todos(self, items: List[TodoItem]) -> List[str]:
        """Render todos as '[status] !!priority content (id: ...)' lines."""
        status_icons = {
            "pending": "[ ]",
            "in_progress": "[~]",
            "completed": "[x]",
            "cancelled": "[-]"
        }
        priority_icons = {
            "high": "!!!",
            "medium": "!!",
            "low": "!"
        }

        lines = []
        for item in items:
            icon = status_icons.get(item.status, "[ ]")
            priority = priority_icons.get(item.priority, "")
            lines.append(f"{icon} {priority} {item.content} (id: {item.id})")

        return lines if lines else ["No todos."]
src/opencode_api/tool/tool.py ADDED
@@ -0,0 +1,109 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from typing import Dict, Any, List, Optional, Callable, Awaitable, Protocol, runtime_checkable
2
+ from pydantic import BaseModel
3
+ from abc import ABC, abstractmethod
4
+ from datetime import datetime
5
+
6
+
7
class ToolContext(BaseModel):
    """Execution context passed to every tool invocation."""
    session_id: str  # Session the tool call belongs to
    message_id: str  # Message that triggered the tool call
    tool_call_id: Optional[str] = None  # Id of this specific tool call, when available
    agent: str = "default"  # Name of the agent running the tool
12
+
13
+
14
class ToolResult(BaseModel):
    """Result returned by a tool execution."""
    title: str  # Short human-readable summary of what happened
    output: str  # Full text output of the tool
    metadata: Dict[str, Any] = {}  # Tool-specific extra data
    truncated: bool = False  # True when output was cut to a length limit
    original_length: int = 0  # Length before truncation (0 when not truncated)
20
+
21
+
22
@runtime_checkable
class Tool(Protocol):
    """Structural interface a tool must satisfy (BaseTool implements it)."""

    @property
    def id(self) -> str: ...

    @property
    def description(self) -> str: ...

    @property
    def parameters(self) -> Dict[str, Any]: ...

    async def execute(self, args: Dict[str, Any], ctx: ToolContext) -> ToolResult: ...
35
+
36
+
37
class BaseTool(ABC):
    """Abstract base class for tools: schema export, output truncation, status tracking."""

    # Maximum characters a tool output may have before truncate_output cuts it.
    MAX_OUTPUT_LENGTH = 50000

    def __init__(self):
        # Lifecycle state: pending, running, completed, error (see update_status).
        self.status: str = "pending"
        self.time_start: Optional[datetime] = None  # set when status first becomes "running"
        self.time_end: Optional[datetime] = None  # set when status becomes "completed"/"error"

    @property
    @abstractmethod
    def id(self) -> str:
        """Unique tool identifier, used as the schema name."""
        pass

    @property
    @abstractmethod
    def description(self) -> str:
        """Human/model-readable description of what the tool does."""
        pass

    @property
    @abstractmethod
    def parameters(self) -> Dict[str, Any]:
        """JSON-schema dict describing the tool's arguments."""
        pass

    @abstractmethod
    async def execute(self, args: Dict[str, Any], ctx: ToolContext) -> ToolResult:
        """Run the tool with *args* in context *ctx* and return its result."""
        pass

    def get_schema(self) -> Dict[str, Any]:
        """Return the tool's schema: name, description, and parameters."""
        return {
            "name": self.id,
            "description": self.description,
            "parameters": self.parameters
        }

    def truncate_output(self, output: str) -> str:
        """Truncate output that exceeds MAX_OUTPUT_LENGTH and append a marker message."""
        if len(output) <= self.MAX_OUTPUT_LENGTH:
            return output

        truncated = output[:self.MAX_OUTPUT_LENGTH]
        truncated += "\n\n[Output truncated...]"
        return truncated

    def update_status(self, status: str) -> None:
        """Update tool status (pending, running, completed, error), stamping times once."""
        self.status = status
        if status == "running" and self.time_start is None:
            self.time_start = datetime.now()
        elif status in ("completed", "error") and self.time_end is None:
            self.time_end = datetime.now()
87
+
88
+
89
+ from .registry import get_registry
90
+
91
+
92
def register_tool(tool: BaseTool) -> None:
    """Register a tool (compatibility wrapper over the ToolRegistry singleton)."""
    get_registry().register(tool)


def get_tool(tool_id: str) -> Optional[BaseTool]:
    """Look up a tool by id (compatibility wrapper over the ToolRegistry singleton)."""
    return get_registry().get(tool_id)


def list_tools() -> List[BaseTool]:
    """List registered tools (compatibility wrapper over the ToolRegistry singleton)."""
    return get_registry().list()


def get_tools_schema() -> List[Dict[str, Any]]:
    """Return all tool schemas (compatibility wrapper over the ToolRegistry singleton)."""
    return get_registry().get_schema()
src/opencode_api/tool/webfetch.py ADDED
@@ -0,0 +1,117 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from typing import Dict, Any
2
+ import httpx
3
+ from .tool import BaseTool, ToolContext, ToolResult
4
+
5
+
6
class WebFetchTool(BaseTool):
    """Fetch a URL and return its content as text, markdown, or raw HTML."""

    @property
    def id(self) -> str:
        return "webfetch"

    @property
    def description(self) -> str:
        return (
            "Fetch content from a URL and convert it to readable text or markdown. "
            "Use this when you need to read the content of a specific web page."
        )

    @property
    def parameters(self) -> Dict[str, Any]:
        return {
            "type": "object",
            "properties": {
                "url": {
                    "type": "string",
                    "description": "The URL to fetch"
                },
                "format": {
                    "type": "string",
                    "enum": ["text", "markdown", "html"],
                    "description": "Output format (default: markdown)",
                    "default": "markdown"
                }
            },
            "required": ["url"]
        }

    async def execute(self, args: Dict[str, Any], ctx: ToolContext) -> ToolResult:
        """Fetch *url*, convert per *format*, and truncate overly long content.

        Never raises for network/HTTP problems — failures come back as an
        error-shaped ToolResult.
        """
        url = args["url"]
        output_format = args.get("format", "markdown")

        # Default to https when the caller omitted a scheme.
        if not url.startswith(("http://", "https://")):
            url = "https://" + url

        try:
            async with httpx.AsyncClient(follow_redirects=True, timeout=30.0) as client:
                response = await client.get(
                    url,
                    headers={
                        "User-Agent": "Mozilla/5.0 (compatible; OpenCode-API/1.0)"
                    }
                )
                response.raise_for_status()
                html_content = response.text

            if output_format == "html":
                content = html_content
            elif output_format == "text":
                content = self._html_to_text(html_content)
            else:  # markdown
                content = self._html_to_markdown(html_content)

            # Fix: single truncation path for every format. Previously the
            # "html" branch was silently sliced to a hard-coded 50000 with no
            # marker, while text/markdown got one; the limit also duplicated
            # BaseTool.MAX_OUTPUT_LENGTH, and ToolResult's truncated/
            # original_length fields were never populated.
            original_length = len(content)
            was_truncated = original_length > self.MAX_OUTPUT_LENGTH
            if was_truncated:
                content = content[:self.MAX_OUTPUT_LENGTH] + "\n\n[Content truncated...]"

            return ToolResult(
                title=f"Fetched: {url}",
                output=content,
                metadata={"url": url, "format": output_format, "length": len(content)},
                truncated=was_truncated,
                original_length=original_length
            )

        except httpx.HTTPStatusError as e:
            return ToolResult(
                title=f"Fetch failed: {url}",
                output=f"HTTP Error {e.response.status_code}: {e.response.reason_phrase}",
                metadata={"error": "http_error", "status_code": e.response.status_code}
            )
        except httpx.RequestError as e:
            return ToolResult(
                title=f"Fetch failed: {url}",
                output=f"Request error: {str(e)}",
                metadata={"error": "request_error"}
            )
        except Exception as e:
            # Last-resort boundary so tool failures never crash the agent loop.
            return ToolResult(
                title=f"Fetch failed: {url}",
                output=f"Error: {str(e)}",
                metadata={"error": str(e)}
            )

    def _html_to_text(self, html: str) -> str:
        """Strip tags and boilerplate; BeautifulSoup when installed, regex fallback otherwise."""
        try:
            from bs4 import BeautifulSoup
            soup = BeautifulSoup(html, "html.parser")

            # Drop non-content elements before extracting text.
            for tag in soup(["script", "style", "nav", "footer", "header"]):
                tag.decompose()

            return soup.get_text(separator="\n", strip=True)
        except ImportError:
            import re
            text = re.sub(r"<script[^>]*>.*?</script>", "", html, flags=re.DOTALL | re.IGNORECASE)
            text = re.sub(r"<style[^>]*>.*?</style>", "", text, flags=re.DOTALL | re.IGNORECASE)
            text = re.sub(r"<[^>]+>", " ", text)
            text = re.sub(r"\s+", " ", text)
            return text.strip()

    def _html_to_markdown(self, html: str) -> str:
        """Convert HTML to markdown via html2text, falling back to plain text."""
        try:
            import html2text
            h = html2text.HTML2Text()
            h.ignore_links = False
            h.ignore_images = True
            h.body_width = 0  # no hard wrapping
            return h.handle(html)
        except ImportError:
            return self._html_to_text(html)
src/opencode_api/tool/websearch.py ADDED
@@ -0,0 +1,85 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from typing import Dict, Any, List
2
+ from .tool import BaseTool, ToolContext, ToolResult
3
+
4
+
5
class WebSearchTool(BaseTool):
    """Web search tool backed by DuckDuckGo (ddgs package)."""

    @property
    def id(self) -> str:
        return "websearch"

    @property
    def description(self) -> str:
        return (
            "Search the web using DuckDuckGo. Returns relevant search results "
            "with titles, URLs, and snippets. Use this when you need current "
            "information from the internet."
        )

    @property
    def parameters(self) -> Dict[str, Any]:
        return {
            "type": "object",
            "properties": {
                "query": {
                    "type": "string",
                    "description": "The search query"
                },
                "max_results": {
                    "type": "integer",
                    "description": "Maximum number of results to return (default: 5)",
                    "default": 5
                },
                # Generalization: region was previously hard-coded to "kr-kr";
                # it is now a parameter with the same default, so existing
                # callers see identical behavior.
                "region": {
                    "type": "string",
                    "description": "DuckDuckGo region code, e.g. 'kr-kr', 'us-en', 'wt-wt' (default: kr-kr)",
                    "default": "kr-kr"
                }
            },
            "required": ["query"]
        }

    async def execute(self, args: Dict[str, Any], ctx: ToolContext) -> ToolResult:
        """Run the search and return a numbered result list; errors become results."""
        query = args["query"]
        max_results = args.get("max_results", 5)
        region = args.get("region", "kr-kr")  # Korea-region results by default

        try:
            from ddgs import DDGS

            results = []
            with DDGS() as ddgs:
                for r in ddgs.text(query, region=region, max_results=max_results):
                    results.append({
                        "title": r.get("title", ""),
                        "url": r.get("href", ""),
                        "snippet": r.get("body", "")
                    })

            if not results:
                return ToolResult(
                    title=f"Web search: {query}",
                    output="No results found.",
                    metadata={"query": query, "count": 0}
                )

            output_lines = []
            for i, r in enumerate(results, 1):
                output_lines.append(f"{i}. {r['title']}")
                output_lines.append(f"   URL: {r['url']}")
                output_lines.append(f"   {r['snippet']}")
                output_lines.append("")

            return ToolResult(
                title=f"Web search: {query}",
                output="\n".join(output_lines),
                metadata={"query": query, "count": len(results)}
            )

        except ImportError:
            return ToolResult(
                title=f"Web search: {query}",
                output="Error: ddgs package not installed. Run: pip install ddgs",
                metadata={"error": "missing_dependency"}
            )
        except Exception as e:
            # Boundary catch so search failures never crash the agent loop.
            return ToolResult(
                title=f"Web search: {query}",
                output=f"Error performing search: {str(e)}",
                metadata={"error": str(e)}
            )