Spaces:
Sleeping
Sleeping
File size: 1,762 Bytes
3a2c9d3 73c8596 3a2c9d3 | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 | from pydantic import BaseModel, model_validator,field_validator, HttpUrl, Field
from typing import List, Dict, Any, Optional, Union
import json
class QuerySpec(BaseModel):
    """Structured representation of a query.

    ``entities`` and ``constraints`` may be supplied either as already-parsed
    values or as JSON-encoded strings; strings that decode as JSON are
    replaced by the decoded value before field validation runs.
    """

    raw_query: str
    intent: str
    # Typed loosely on purpose: the before-validator below decodes JSON
    # strings when it can and leaves every other value (including strings
    # that are not valid JSON) exactly as received.
    entities: Optional[Any] = None
    constraints: Optional[Any] = None
    answer_type: str
    # default_factory makes the "fresh empty list per instance" intent explicit.
    followups: Optional[List[str]] = Field(default_factory=list)

    @model_validator(mode="before")
    @classmethod
    def parse_nested_json(cls, values):
        """Decode JSON-string ``entities`` / ``constraints`` before validation.

        Args:
            values: The raw input handed to the model. Only dict input is
                inspected; anything else is returned unchanged so that
                pydantic's own validation reports the problem.

        Returns:
            A shallow copy of ``values`` with decodable JSON strings replaced
            by their decoded value, or ``values`` itself when it is not a
            dict.
        """
        # A "before" validator sees the raw input, which is not guaranteed to
        # be a dict; calling .get() on anything else would raise
        # AttributeError instead of a proper validation error.
        if not isinstance(values, dict):
            return values

        # Work on a shallow copy so the caller's dict is not mutated.
        decoded = dict(values)
        for field in ("entities", "constraints"):
            val = decoded.get(field)
            if not isinstance(val, str):
                continue
            try:
                decoded[field] = json.loads(val)
            except json.JSONDecodeError:
                # Best effort: keep the original string when it is not JSON.
                pass
        return decoded
class ClauseHit(BaseModel):
    """One chunk of document text with its location, metadata and scores.

    ``metadata`` may be supplied as a dict or as a JSON-encoded string; see
    ``parse_metadata`` for how strings are handled.
    """

    doc_id: str
    page: int
    chunk_id: str
    text: str
    metadata: Dict[str, Any]
    score: float
    boost: Optional[float] = None
    combined_score: Optional[float] = None

    @field_validator("metadata", mode="before")
    @classmethod
    def parse_metadata(cls, v):
        """Turn a JSON-string ``metadata`` value into its decoded form.

        Args:
            v: The raw ``metadata`` input.

        Returns:
            ``v`` unchanged when it is not a string; ``{}`` when it is a
            blank string or a string that is not valid JSON; otherwise the
            result of ``json.loads(v)``. The returned value is still subject
            to the field's normal ``Dict[str, Any]`` validation.
        """
        if not isinstance(v, str):
            return v
        if not v.strip():
            return {}
        try:
            return json.loads(v)
        except json.JSONDecodeError:
            # Best effort: undecodable metadata is treated as empty.
            return {}
class LogicResult(BaseModel):
    """Answer plus its decision label, confidence, evidence and rationale."""

    answer: str
    # Intended values: "covered" / "not_covered" / "conditional".
    # Not enforced here: any string passes validation.
    decision: str
    confidence: float
    # Clause hits backing the answer.
    evidence: List[ClauseHit]
    rationale: str
class HackRxRunRequest(BaseModel):
    """Request payload: one document URL and the questions to ask about it."""

    # Both fields are required: the Ellipsis default marks "no default".
    documents: HttpUrl = Field(
        default=...,
        description="URL to the document (PDF, DOCX, or email blob)",
    )
    questions: List[str] = Field(
        default=...,
        description="List of questions to query against the document",
    )
|