Spaces:

CaffeinatedCoding
/

nyayasetu

Running

App Files Community

CaffeinatedCoding committed about 1 month ago

Commit

1581024

verified ·

1 Parent(s): 9559db9

Upload folder using huggingface_hub

Browse files

Files changed (2) hide show

src/system_prompt.py +30 -1
src/verify.py +4 -24

src/system_prompt.py CHANGED Viewed

@@ -71,6 +71,16 @@ CRITICAL FORMAT RULES:
 - A response that is 2 punchy sentences beats a response that is 8 bullet points of equal weight
 - Match format to content every single time, not to user's last format request
 DISCLAIMER — always at end, never at start:
 "Note: This is not legal advice. Consult a qualified advocate for your specific situation."
 Never open with disclaimer. It kills the energy."""
@@ -192,7 +202,18 @@ Should reveal opportunity or flag risk.""",
     "reassurance": """Acknowledge difficulty briefly.
 Immediately establish that options exist.
 Give one concrete thing that shows this isn't hopeless.
-Then move forward."""
 }
 STAGE_MAP = {
@@ -332,4 +353,12 @@ Set action_needed to "strategy_synthesis" when user message contains any of:
 "final advice", "wrap up", "conclude", "what have we established", "plan of action"
 This triggers generation of the full structured strategy document using ALL accumulated case state.
 - Output ONLY the JSON. No explanation. No preamble. No markdown fences."""

 - A response that is 2 punchy sentences beats a response that is 8 bullet points of equal weight
 - Match format to content every single time, not to user's last format request
+RESPONSE LENGTH — match to what was actually asked:
+- "just name X" or "just list X" or "only X" → maximum 10 lines, no explanations
+- Simple factual question → 1-3 sentences
+- Advice request → 1-3 paragraphs maximum
+- Strategy request → structured but still concise
+- Document draft → full document length as needed
+- NEVER write 5 paragraphs when 1 paragraph answers the question
+- If you find yourself writing a 4th paragraph on the same point, stop
+- The user's patience is finite. Respect it.
 DISCLAIMER — always at end, never at start:
 "Note: This is not legal advice. Consult a qualified advocate for your specific situation."
 Never open with disclaimer. It kills the energy."""
     "reassurance": """Acknowledge difficulty briefly.
 Immediately establish that options exist.
 Give one concrete thing that shows this isn't hopeless.
+Then move forward.""",
+    "document_draft": """User wants an actual document drafted — legal notice, letter, complaint, FIR, agreement, or similar.
+DO NOT analyse or explain. DRAFT THE ACTUAL DOCUMENT.
+Use proper legal document format:
+- Header with FROM, TO, DATE, SUBJECT
+- Body with numbered paragraphs
+- Formal legal language throughout
+- Cite specific sections inline (u/s 378 IPC)
+- Clear demand or statement of facts
+- Closing with signature block
+This must look like a real document a lawyer would send, not a paragraph about what the document should say."""
 }
 STAGE_MAP = {
 "final advice", "wrap up", "conclude", "what have we established", "plan of action"
 This triggers generation of the full structured strategy document using ALL accumulated case state.
+DOCUMENT DRAFT — trigger rule:
+Set action_needed to "document_draft" when user message contains any of:
+"draft a letter", "write a letter", "send a letter", "prepare a letter",
+"draft a notice", "legal notice", "write a complaint", "draft an FIR",
+"prepare a document", "official letter", "send him a letter",
+"draft from the side of", "write on behalf of"
+format_decision must be "prose" — documents are continuous formatted text not bullets
 - Output ONLY the JSON. No explanation. No preamble. No markdown fences."""

src/verify.py CHANGED Viewed

@@ -22,7 +22,7 @@ import numpy as np
 logger = logging.getLogger(__name__)
 # ── Similarity threshold ──────────────────────────────────
-SIMILARITY_THRESHOLD = 0.55  # cosine similarity — tunable
 def _normalise(text: str) -> str:
@@ -34,35 +34,15 @@ def _normalise(text: str) -> str:
 def _extract_quotes(text: str) -> list:
-    """Extract quoted phrases and key sentences from answer."""
     quotes = []
-    # Extract explicitly quoted phrases
     patterns = [
-        r'"([^"]{15,})"',
-        r'\u201c([^\u201d]{15,})\u201d',
     ]
     for pattern in patterns:
         found = re.findall(pattern, text)
         quotes.extend(found)
-    # If no explicit quotes, extract key sentences for verification
-    if not quotes:
-        sentences = re.split(r'(?<=[.!?])\s+', text)
-        # Take sentences that make specific legal claims
-        for s in sentences:
-            s = s.strip()
-            # Sentences with section numbers, case citations, or specific claims
-            if (len(s) > 40 and
-                any(indicator in s.lower() for indicator in [
-                    "section", "act ", "ipc", "crpc",
-                    "article ", "judgment", "punishable",
-                    "imprisonment", "years rigorous"
-                ])):
-                quotes.append(s)
-                if len(quotes) >= 3:  # cap at 3 sentences
-                    break
     return quotes

 logger = logging.getLogger(__name__)
 # ── Similarity threshold ──────────────────────────────────
+SIMILARITY_THRESHOLD = 0.45  # cosine similarity — tunable
 def _normalise(text: str) -> str:
 def _extract_quotes(text: str) -> list:
+    """Extract only explicitly quoted phrases from answer."""
     quotes = []
     patterns = [
+        r'"([^"]{20,})"',
+        r'\u201c([^\u201d]{20,})\u201d',
     ]
     for pattern in patterns:
         found = re.findall(pattern, text)
         quotes.extend(found)
     return quotes