File size: 3,574 Bytes
7f3523e |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 |
import json
import time
from datetime import datetime
from typing import Dict, Any, Optional, List

from fastapi import APIRouter, HTTPException, UploadFile, File, Form
from pydantic import BaseModel

from ...core.document.processor import DocumentProcessor, ProcessedDocument, DocumentConfig
# Router on which this module's document-processing endpoints are registered.
router = APIRouter()
class ProcessingResponse(BaseModel):
    """Response payload returned by the document processing endpoints."""

    # Outcome label; the endpoints in this module set it to "success".
    status: str

    # Result object returned by DocumentProcessor.process_document.
    document: ProcessedDocument

    # Time spent handling the document, in seconds.
    processing_time: float
@router.post("/process", response_model=ProcessingResponse)
async def process_document(
    file: UploadFile = File(...),
    config: Optional[str] = Form(None)
):
    """Process a single uploaded document.

    Args:
        file: The uploaded document; its underlying file object is passed to
            ``DocumentProcessor.process_document``.
        config: Optional JSON-encoded processor configuration sent as a form
            field. When omitted or empty, an empty configuration is used.

    Returns:
        A ``ProcessingResponse`` with status ``"success"``, the processed
        document, and the elapsed time in seconds (configuration parsing and
        processor initialization included).

    Raises:
        HTTPException: 400 if ``config`` is not valid JSON; 500 if processor
            initialization or document processing fails.
    """
    # perf_counter is monotonic, so the measured duration cannot be skewed by
    # wall-clock adjustments the way datetime.now() differences can.
    start_time = time.perf_counter()

    # A malformed config is the caller's mistake: report it as 400 here,
    # before the generic handler below would turn it into a 500.
    proc_config = {}
    if config:
        try:
            proc_config = json.loads(config)
        except json.JSONDecodeError as e:
            raise HTTPException(
                status_code=400,
                detail=f"Invalid configuration: {str(e)}"
            ) from e

    try:
        # Initialize processor
        processor = DocumentProcessor(proc_config)
        await processor.initialize()

        # Process document
        result = await processor.process_document(file.file)

        # Calculate processing time
        processing_time = time.perf_counter() - start_time

        return ProcessingResponse(
            status="success",
            document=result,
            processing_time=processing_time
        )
    except Exception as e:
        raise HTTPException(
            status_code=500,
            detail=f"Document processing failed: {str(e)}"
        ) from e
@router.post("/batch", response_model=Dict[str, ProcessingResponse])
async def batch_process(files: List[UploadFile] = File(...)):
    """Process several uploaded documents with one shared processor.

    Args:
        files: The uploaded documents. They are processed sequentially, in
            the order received.

    Returns:
        A mapping from a per-file key to its ``ProcessingResponse``. The key
        is the upload's filename; an upload without a filename gets
        ``file_<position>``, and a key that is already taken gets a
        `` (2)``, `` (3)``, ... suffix so no result overwrites another.

    Raises:
        HTTPException: 500 if processor initialization or the processing of
            any document fails; the whole batch is reported as failed.
    """
    try:
        # Initialize processor
        processor = DocumentProcessor()
        await processor.initialize()

        # Process documents
        results = {}
        for position, file in enumerate(files, start=1):
            # The response model requires string keys, so fall back to a
            # positional name when the upload carries no filename.
            base_key = file.filename or f"file_{position}"

            # Two uploads may share a filename; disambiguate instead of
            # silently replacing the earlier result.
            key = base_key
            duplicate_index = 2
            while key in results:
                key = f"{base_key} ({duplicate_index})"
                duplicate_index += 1

            # perf_counter is monotonic, unlike datetime.now() differences.
            start_time = time.perf_counter()
            result = await processor.process_document(file.file)
            processing_time = time.perf_counter() - start_time

            results[key] = ProcessingResponse(
                status="success",
                document=result,
                processing_time=processing_time
            )

        return results
    except Exception as e:
        raise HTTPException(
            status_code=500,
            detail=f"Batch processing failed: {str(e)}"
        ) from e
@router.get("/supported-types")
async def get_supported_types():
    """Return the document types listed in the processor's SUPPORTED_TYPES."""
    # Read the attribute from a freshly constructed processor instance.
    supported = DocumentProcessor().SUPPORTED_TYPES
    return {"supported_types": supported}
# GET is kept for existing callers. POST is registered on the same path
# because this endpoint reads its input from the request body, and a body on
# a GET request is not reliably supported by HTTP clients and proxies.
@router.get("/config/validate")
@router.post("/config/validate")
async def validate_config(config: Dict[str, Any]):
    """Validate a document processing configuration.

    Args:
        config: The configuration to check, supplied as a JSON object.

    Returns:
        A dict with ``"valid"`` set to the result of the processor's
        ``validate_config()`` call and ``"config"`` echoing the input.

    Raises:
        HTTPException: 400 if constructing the processor or validating the
            configuration raises.
    """
    try:
        processor = DocumentProcessor(config)
        is_valid = await processor.validate_config()
        return {
            "valid": is_valid,
            "config": config
        }
    except Exception as e:
        raise HTTPException(
            status_code=400,
            detail=f"Invalid configuration: {str(e)}"
        ) from e
@router.get("/health")
async def health_check():
    """Report whether a document processor can be initialized.

    Returns:
        A dict with ``"status"`` set to ``"healthy"`` and ``"timestamp"`` set
        to the current ``datetime.now()`` value.

    Raises:
        HTTPException: 500 if creating or initializing the processor fails.
    """
    try:
        # A successful initialize() is the only health signal checked here.
        await DocumentProcessor().initialize()
    except Exception as e:
        raise HTTPException(
            status_code=500,
            detail=f"Health check failed: {str(e)}"
        )
    else:
        return {"status": "healthy", "timestamp": datetime.now()}