File size: 3,574 Bytes
7f3523e
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
import json
import time
from datetime import datetime
from typing import Dict, Any, Optional, List

from fastapi import APIRouter, HTTPException, UploadFile, File, Form
from pydantic import BaseModel

from ...core.document.processor import DocumentProcessor, ProcessedDocument, DocumentConfig

router = APIRouter()

class ProcessingResponse(BaseModel):
    """Response payload returned for one processed document.

    Used as the response model of the single-document endpoint and as the
    per-file value of the batch endpoint's result mapping.
    """
    # Outcome label; the endpoints in this module set it to "success".
    status: str
    # The value returned by DocumentProcessor.process_document for the upload.
    document: ProcessedDocument
    # Elapsed time spent handling the document, in seconds.
    processing_time: float

@router.post("/process", response_model=ProcessingResponse)
async def process_document(
    file: UploadFile = File(...),
    config: Optional[str] = Form(None)
):
    """Process a single uploaded document.

    Args:
        file: The uploaded document; its underlying file object is passed to
            ``DocumentProcessor.process_document``.
        config: Optional form field holding JSON-encoded processor settings.
            When omitted or empty, an empty configuration is used.

    Returns:
        A ``ProcessingResponse`` with status ``"success"``, the processed
        document and the elapsed time in seconds.

    Raises:
        HTTPException: 400 if ``config`` is not valid JSON; 500 if the
            processor fails to initialize or to process the document.
    """
    # Monotonic clock: elapsed time must not be affected by wall-clock jumps.
    start_time = time.perf_counter()

    # Parse configuration outside the generic handler so that malformed
    # client input is reported as a client error (400) instead of a 500.
    proc_config = {}
    if config:
        try:
            proc_config = json.loads(config)
        except json.JSONDecodeError as e:
            raise HTTPException(
                status_code=400,
                detail=f"Invalid configuration JSON: {str(e)}"
            ) from e

    try:
        # Initialize processor
        processor = DocumentProcessor(proc_config)
        await processor.initialize()

        # Process document
        result = await processor.process_document(file.file)

        # Calculate processing time
        processing_time = time.perf_counter() - start_time

        return ProcessingResponse(
            status="success",
            document=result,
            processing_time=processing_time
        )

    except Exception as e:
        # Chain the original error so the root cause stays in the traceback.
        raise HTTPException(
            status_code=500,
            detail=f"Document processing failed: {str(e)}"
        ) from e

@router.post("/batch", response_model=Dict[str, ProcessingResponse])
async def batch_process(files: List[UploadFile] = File(...)):
    """Process several uploaded documents with one shared processor.

    Args:
        files: The uploaded documents, processed sequentially in the order
            received.

    Returns:
        A mapping from each upload's filename to its ``ProcessingResponse``.
        Uploads without a filename are keyed ``file_<index>``; a repeated
        filename gets a `` (2)``, `` (3)``, ... suffix so that no result is
        overwritten.

    Raises:
        HTTPException: 500 if initialization or any single document fails;
            the whole batch is rejected in that case.
    """
    try:
        # Initialize processor once and reuse it for every file
        processor = DocumentProcessor()
        await processor.initialize()

        # Process documents
        results = {}
        for index, file in enumerate(files):
            # Monotonic clock: immune to wall-clock adjustments.
            start_time = time.perf_counter()
            result = await processor.process_document(file.file)
            processing_time = time.perf_counter() - start_time

            # Build a unique string key: the filename may be missing, and two
            # uploads may share a name, which would silently drop a result.
            base_key = file.filename or f"file_{index}"
            key = base_key
            duplicate_count = 1
            while key in results:
                duplicate_count += 1
                key = f"{base_key} ({duplicate_count})"

            results[key] = ProcessingResponse(
                status="success",
                document=result,
                processing_time=processing_time
            )

        return results

    except Exception as e:
        # Chain the original error so the root cause stays in the traceback.
        raise HTTPException(
            status_code=500,
            detail=f"Batch processing failed: {str(e)}"
        ) from e

@router.get("/supported-types")
async def get_supported_types():
    """Return the document types the processor reports as supported."""
    # A default-constructed processor is created only to read SUPPORTED_TYPES.
    supported = DocumentProcessor().SUPPORTED_TYPES
    payload = {"supported_types": supported}
    return payload

# GET is kept for existing callers; POST is added because this endpoint reads
# a JSON request body, which many HTTP clients and proxies do not send on GET.
@router.post("/config/validate")
@router.get("/config/validate")
async def validate_config(config: Dict[str, Any]):
    """Validate a document processing configuration.

    Args:
        config: The configuration mapping, read from the JSON request body.

    Returns:
        A dict with ``"valid"`` (the result of
        ``DocumentProcessor.validate_config``) and ``"config"`` (the
        configuration echoed back).

    Raises:
        HTTPException: 400 if constructing the processor or validating the
            configuration raises.
    """
    try:
        processor = DocumentProcessor(config)
        is_valid = await processor.validate_config()

        return {
            "valid": is_valid,
            "config": config
        }

    except Exception as e:
        # Chain the original error so the root cause stays in the traceback.
        raise HTTPException(
            status_code=400,
            detail=f"Invalid configuration: {str(e)}"
        ) from e

@router.get("/health")
async def health_check():
    """Report whether a document processor can be initialized.

    Returns a ``"healthy"`` status with the current timestamp when a freshly
    constructed ``DocumentProcessor`` initializes without raising; any
    exception is reported as an HTTP 500.
    """
    try:
        # Healthy here means: a new processor initializes without raising.
        await DocumentProcessor().initialize()
        report = {"status": "healthy", "timestamp": datetime.now()}
        return report
    except Exception as exc:
        failure_detail = f"Health check failed: {exc!s}"
        raise HTTPException(status_code=500, detail=failure_detail)