Agentic-Service-Data-Eyond-Catalog

Sleeping

sofhiaazzhr committed 15 days ago

Commit

0000030

1 Parent(s): cd06c0f

[KM-556] wire document process endpoint to on_tabular_uploaded

Files changed (1) hide show

src/api/v1/document.py CHANGED Viewed

@@ -6,7 +6,7 @@ from src.db.postgres.connection import get_db
 from src.document.document_service import document_service
 from src.middlewares.logging import get_logger, log_execution
 from src.middlewares.rate_limit import limiter
-from src.pipeline.document_pipeline.document_pipeline import document_pipeline
 from pydantic import BaseModel
 from typing import List
@@ -24,7 +24,7 @@ class DocumentResponse(BaseModel):
     created_at: str
-# NOTE: Keep in sync with SUPPORTED_FILE_TYPES in src/pipeline/document_pipeline/document_pipeline.py
 _DOC_TYPES = [
     {"doc_type": "pdf", "max_size": 10, "status": "active", "message": None},
     {"doc_type": "docx", "max_size": 10, "status": "active", "message": None},
@@ -104,5 +104,14 @@ async def process_document(
 ):
     """Process document and ingest to vector index."""
     data = await document_pipeline.process(document_id, user_id, db)
     return {"status": "success", "message": "Document processed successfully", "data": data}

 from src.document.document_service import document_service
 from src.middlewares.logging import get_logger, log_execution
 from src.middlewares.rate_limit import limiter
+from src.pipeline.document_pipeline import document_pipeline
 from pydantic import BaseModel
 from typing import List
     created_at: str
+# NOTE: Keep in sync with SUPPORTED_FILE_TYPES in src/pipeline/document_pipeline.py
 _DOC_TYPES = [
     {"doc_type": "pdf", "max_size": 10, "status": "active", "message": None},
     {"doc_type": "docx", "max_size": 10, "status": "active", "message": None},
 ):
     """Process document and ingest to vector index."""
     data = await document_pipeline.process(document_id, user_id, db)
+    document = await document_service.get_document(db, document_id)
+    if document and document.file_type in ("csv", "xlsx"):
+        from src.pipeline.triggers import on_tabular_uploaded
+        try:
+            await on_tabular_uploaded(document_id, user_id)
+        except Exception as e:
+            logger.error("catalog ingestion failed after process", document_id=document_id, error=str(e))
     return {"status": "success", "message": "Document processed successfully", "data": data}