Ryan Christian D. Deniega Claude Sonnet 4.6 committed on
Commit
c78c2c1
·
1 Parent(s): 41972d7

feat: extension button placement, text extraction, OCR display + ML improvements

Browse files

Extension:
- Fix verify button placement to appear below Like/Comment/Share bar on all page types
- Fix walk-up logic to find correct post container (message container > article > innerText>100)
- Fix [dir="auto"] filter to work when postElement is a sub-section of the article
- Add obfuscated text detection to skip Facebook's character-by-character spans
- Show full caption text (no truncation) and extracted image in verification modal
- Add IMAGE TEXT (OCR) section to modal using backend ocr_text field
- Fix "Extension context invalidated" error to show refresh prompt instead of retry
- Add webNavigation SPA detection for Facebook pushState navigation

API:
- Add image_url field to TextVerifyRequest — runs Tesseract OCR alongside caption text
- Add ocr_text field to VerificationResponse for image OCR results

ML/NLP:
- Add Naive Bayes, BoW, LDA, and ensemble classifiers
- Add Tagalog RoBERTa fine-tuned model
- Improve preprocessor, NER, claim extractor, and scoring engine
- Add benchmarks page to frontend

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>

.firebaserc CHANGED
@@ -12,4 +12,4 @@
12
  }
13
  },
14
  "etags": {}
15
- }
 
12
  }
13
  },
14
  "etags": {}
15
+ }
api/routes/verify.py CHANGED
@@ -77,11 +77,26 @@ async def _fetch_og_text(url: str) -> str:
77
  )
78
  async def verify_text(body: TextVerifyRequest) -> VerificationResponse:
79
  start = time.perf_counter()
80
- logger.info("verify/text called | chars=%d", len(body.text))
81
  try:
82
  result = await run_verification(body.text, input_type="text")
83
  result.processing_time_ms = round((time.perf_counter() - start) * 1000, 1)
84
  result.extracted_text = body.text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
85
  return result
86
  except Exception as exc:
87
  logger.exception("verify/text error: %s", exc)
 
77
  )
78
  async def verify_text(body: TextVerifyRequest) -> VerificationResponse:
79
  start = time.perf_counter()
80
+ logger.info("verify/text called | chars=%d | has_image=%s", len(body.text), bool(body.image_url))
81
  try:
82
  result = await run_verification(body.text, input_type="text")
83
  result.processing_time_ms = round((time.perf_counter() - start) * 1000, 1)
84
  result.extracted_text = body.text
85
+
86
+ # If an image URL was provided, fetch it and run OCR — store result separately
87
+ if body.image_url:
88
+ try:
89
+ import httpx
90
+ async with httpx.AsyncClient(timeout=10) as client:
91
+ img_resp = await client.get(body.image_url)
92
+ if img_resp.status_code == 200:
93
+ ocr = await extract_text_from_image(img_resp.content)
94
+ if ocr:
95
+ result.ocr_text = ocr.strip()
96
+ logger.info("OCR from image_url: %d chars", len(result.ocr_text))
97
+ except Exception as ocr_exc:
98
+ logger.warning("OCR for image_url failed (non-fatal): %s", ocr_exc)
99
+
100
  return result
101
  except Exception as exc:
102
  logger.exception("verify/text error: %s", exc)
api/schemas.py CHANGED
@@ -49,6 +49,7 @@ class DomainTier(int, Enum):
49
 
50
  class TextVerifyRequest(BaseModel):
51
  text: str = Field(..., min_length=10, max_length=10_000, description="Raw text to verify")
 
52
 
53
 
54
  class URLVerifyRequest(BaseModel):
@@ -71,6 +72,7 @@ class Layer1Result(BaseModel):
71
  default_factory=list,
72
  description="Human-readable list of suspicious features detected",
73
  )
 
74
 
75
 
76
  class EvidenceSource(BaseModel):
@@ -78,6 +80,7 @@ class EvidenceSource(BaseModel):
78
  url: str
79
  similarity: float = Field(..., ge=0.0, le=1.0, description="Cosine similarity to input claim")
80
  stance: Stance
 
81
  domain_tier: DomainTier
82
  published_at: Optional[str] = None
83
  source_name: Optional[str] = None
@@ -88,6 +91,7 @@ class Layer2Result(BaseModel):
88
  evidence_score: float = Field(..., ge=0.0, le=100.0)
89
  sources: list[EvidenceSource] = []
90
  claim_used: Optional[str] = Field(None, description="Extracted claim sent to evidence search")
 
91
 
92
 
93
  # ── Main Response ─────────────────────────────────────────────────────────────
@@ -106,6 +110,7 @@ class VerificationResponse(BaseModel):
106
  input_type: str = "text"
107
  processing_time_ms: Optional[float] = None
108
  extracted_text: Optional[str] = Field(None, description="Raw text extracted from the URL / image / video for transparency")
 
109
 
110
 
111
  # ── History / Trends ──────────────────────────────────────────────────────────
 
49
 
50
  class TextVerifyRequest(BaseModel):
51
  text: str = Field(..., min_length=10, max_length=10_000, description="Raw text to verify")
52
+ image_url: Optional[str] = Field(None, description="Optional image URL to run OCR on alongside the text")
53
 
54
 
55
  class URLVerifyRequest(BaseModel):
 
72
  default_factory=list,
73
  description="Human-readable list of suspicious features detected",
74
  )
75
+ model_tier: Optional[str] = Field(None, description="Classifier used: ensemble | xlmr | tfidf")
76
 
77
 
78
  class EvidenceSource(BaseModel):
 
80
  url: str
81
  similarity: float = Field(..., ge=0.0, le=1.0, description="Cosine similarity to input claim")
82
  stance: Stance
83
+ stance_reason: Optional[str] = Field(None, description="NLI entailment or keyword reason for stance")
84
  domain_tier: DomainTier
85
  published_at: Optional[str] = None
86
  source_name: Optional[str] = None
 
91
  evidence_score: float = Field(..., ge=0.0, le=100.0)
92
  sources: list[EvidenceSource] = []
93
  claim_used: Optional[str] = Field(None, description="Extracted claim sent to evidence search")
94
+ claim_method: Optional[str] = Field(None, description="How the claim was extracted: sentence_scoring | sentence_heuristic | passthrough")
95
 
96
 
97
  # ── Main Response ─────────────────────────────────────────────────────────────
 
110
  input_type: str = "text"
111
  processing_time_ms: Optional[float] = None
112
  extracted_text: Optional[str] = Field(None, description="Raw text extracted from the URL / image / video for transparency")
113
+ ocr_text: Optional[str] = Field(None, description="Text extracted from an image via OCR (when image_url was provided alongside text)")
114
 
115
 
116
  # ── History / Trends ──────────────────────────────────────────────────────────
docs/plans/2026-03-17-extension-ui-redesign.md ADDED
@@ -0,0 +1,104 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # PhilVerify Extension — UI Redesign
2
+ **Date:** 2026-03-17
3
+
4
+ ## Goals
5
+ 1. Surface new backend fields (`model_tier`, `claim_method`, `stance_reason`) without cluttering the UI
6
+ 2. Make the verdict scannable in under 2 seconds across all surfaces
7
+ 3. Visual consistency between side panel, inline modal, and history tab
8
+
9
+ ## Information Hierarchy
10
+
11
+ Four tiers, consistent across all surfaces:
12
+
13
+ | Tier | Content | Style |
14
+ |------|---------|-------|
15
+ | 1 | Verdict label | Large, bold, verdict color |
16
+ | 2 | Credibility score | Medium weight, verdict color, slightly smaller |
17
+ | 3 | Signals + top source | Normal weight, neutral text |
18
+ | 4 | model_tier, claim_method | 10px monospace, muted #6b7280 |
19
+
20
+ **Visual anchor:** 3px left border in verdict color on every result card.
21
+
22
+ **Theme:** dark newsroom — `#0d0d0d` bg, `#1a1a1a` card surface, `#262626` borders.
23
+
24
+ ---
25
+
26
+ ## Side Panel Result Card (`popup.js renderResult`)
27
+
28
+ **Top block**
29
+ - 3px left border (verdict color)
30
+ - Verdict label: 20px bold, verdict color
31
+ - Score: same line, right-aligned
32
+ - 1px colored hairline separator below
33
+
34
+ **Middle block**
35
+ - Triggered features: small inline chips (dark bg, verdict-colored border, 10px)
36
+ - Top source: distinct link block with `#1a1a1a` bg, `#262626` border, site name + truncated title + ↗
37
+
38
+ **Footer block**
39
+ - `border-top: 1px solid #262626`, 8px top padding
40
+ - `MODEL ensemble CLAIM VIA sentence_scoring`
41
+ - 10px monospace, labels `#4b5563`, values `#6b7280`
42
+
43
+ **Bottom**
44
+ - "Open Full Dashboard ↗" as full-width footer button with `border-top: 1px solid #262626`
45
+
46
+ ---
47
+
48
+ ## Inline Modal (content.js / content.css)
49
+
50
+ Injected as full-width block below post. Fixed width ~320px. Same left-border spine pattern.
51
+
52
+ ```
53
+ ┌───────────────────────────────────────┐
54
+ ▌ LIKELY FAKE 84% credibility
55
+ ▌ ─────────────────────────────────────
56
+ ▌ Signals: clickbait_title, no_byline
57
+ ▌ Top Source: Rappler — "Claim is false…" ↗
58
+ ▌ ─────────────────────────────────────
59
+ ▌ model: ensemble · via: sentence_scoring
60
+ └───────────────────────────────────────┘
61
+ ```
62
+
63
+ - Line 1: Verdict (bold, verdict color) + score right-aligned
64
+ - Line 2: Hairline separator (verdict color, 30% opacity)
65
+ - Line 3: Signals (up to 3, comma-separated)
66
+ - Line 4: Top source title truncated at 45 chars + ↗
67
+ - Line 5: Hairline separator
68
+ - Line 6: model_tier · claim_method — 10px monospace, muted
69
+
70
+ - `×` dismiss button top-right
71
+ - "Verify this post" button replaced in-place by result block after verification
72
+
73
+ ---
74
+
75
+ ## History Tab
76
+
77
+ Entry layout (~60px tall per item):
78
+
79
+ ```
80
+ ┌─────────────────────────────────────────┐
81
+ ▌ ● LIKELY FAKE 84% ensemble ▌
82
+ ▌ "Marcos signs new law allowing…" ▌
83
+ ▌ 2h ago ▌
84
+ └─────────────────────────────────────────┘
85
+ ```
86
+
87
+ - Row 1: Colored dot + verdict chip + score + model_tier (muted monospace, pushed right)
88
+ - Row 2: Text preview (#9ca3af, 12px)
89
+ - Row 3: Timestamp (#6b7280, 10px)
90
+ - Left border: 2px solid verdict color
91
+ - Hover: `background: #1a1a1a`
92
+
93
+ Empty state: centered 32px shield SVG outline (muted) + "No verifications yet." below it.
94
+
95
+ ---
96
+
97
+ ## Files to Modify
98
+
99
+ | File | Changes |
100
+ |------|---------|
101
+ | `extension/popup.js` | Rewrite `renderResult()`, update `renderHistory()` |
102
+ | `extension/popup.css` | Add `.result-spine`, `.result-footer-meta`, `.result-chip`, update `.history-item` |
103
+ | `extension/content.js` | Update modal HTML template |
104
+ | `extension/content.css` | Update `.pv-badge` / modal styles, add spine + footer-meta |
evidence/stance_detector.py CHANGED
@@ -7,10 +7,15 @@ Stance labels:
7
  Refutes β€” article content contradicts / debunks the claim
8
  Not Enough Info β€” article is related but not conclusive either way
9
 
10
- Strategy (rule-based hybrid — no heavy model dependency):
11
- 1. Keyword scan of title + description for refutation/support signals
12
- 2. Similarity threshold guard — low similarity → NEI
13
- 3. Factuality keywords override similarity-based detection
 
 
 
 
 
14
  """
15
  import logging
16
  import re
@@ -19,6 +24,28 @@ from enum import Enum
19
 
20
  logger = logging.getLogger(__name__)
21
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
22
 
23
  class Stance(str, Enum):
24
  SUPPORTS = "Supports"
@@ -110,6 +137,36 @@ def detect_stance(
110
  reason=f"Low similarity ({similarity:.2f}) β€” article not related to claim",
111
  )
112
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
113
  # ── Rule 2: Scan for refutation keywords ──────────────────────────────────
114
  refutation_hits = _scan_keywords(article_text, _REFUTATION_KEYWORDS)
115
  if refutation_hits:
 
7
  Refutes β€” article content contradicts / debunks the claim
8
  Not Enough Info β€” article is related but not conclusive either way
9
 
10
+ Strategy (hybrid — NLI model primary, keyword rules as fallback):
11
+ 0. Known PH fact-check domain → always Refutes
12
+ 1. Similarity floor — too low similarity → NEI
13
+ 1.5 NLI entailment check (cross-encoder/nli-MiniLM2-L6-H768) when
14
+ article description is long enough and model is available.
15
+ Uses the claim as the hypothesis and the article text as the premise.
16
+ Falls through to keyword rules if NLI confidence < 0.65.
17
+ 2. Keyword scan of title + description for refutation/support signals
18
+ 3. Default NEI
19
  """
20
  import logging
21
  import re
 
24
 
25
  logger = logging.getLogger(__name__)
26
 
27
+ # ── NLI model (lazy-loaded) ───────────────────────────────────────────────────
28
+ _nli_pipe = None
29
+ _nli_loaded = False
30
+
31
+
32
+ def _get_nli():
33
+ """Return the zero-shot NLI pipeline, loading it once on first call."""
34
+ global _nli_pipe, _nli_loaded
35
+ if _nli_loaded:
36
+ return _nli_pipe
37
+ try:
38
+ from transformers import pipeline
39
+ _nli_pipe = pipeline(
40
+ "zero-shot-classification",
41
+ model="cross-encoder/nli-MiniLM2-L6-H768",
42
+ )
43
+ logger.info("NLI stance model (nli-MiniLM2-L6-H768) loaded")
44
+ except Exception as e:
45
+ logger.warning("NLI stance model unavailable (%s) β€” using keyword fallback", e)
46
+ _nli_loaded = True
47
+ return _nli_pipe
48
+
49
 
50
  class Stance(str, Enum):
51
  SUPPORTS = "Supports"
 
137
  reason=f"Low similarity ({similarity:.2f}) β€” article not related to claim",
138
  )
139
 
140
+ # ── Rule 1.5: NLI entailment — semantically compare claim to article ──────
141
+ nli = _get_nli()
142
+ if nli and len(article_description.strip()) > 30:
143
+ try:
144
+ nli_result = nli(
145
+ article_description[:512],
146
+ candidate_labels=["supports the claim", "contradicts the claim", "unrelated"],
147
+ hypothesis_template="This text {}.",
148
+ )
149
+ top_label = nli_result["labels"][0]
150
+ top_score = float(nli_result["scores"][0])
151
+ if top_score >= 0.65:
152
+ if "supports" in top_label:
153
+ return StanceResult(
154
+ stance=Stance.SUPPORTS,
155
+ confidence=round(top_score, 2),
156
+ matched_keywords=[],
157
+ reason=f"NLI entailment ({top_score:.2f}): article supports claim",
158
+ )
159
+ elif "contradicts" in top_label:
160
+ return StanceResult(
161
+ stance=Stance.REFUTES,
162
+ confidence=round(top_score, 2),
163
+ matched_keywords=[],
164
+ reason=f"NLI contradiction ({top_score:.2f}): article contradicts claim",
165
+ )
166
+ # NLI confidence below threshold — fall through to keyword rules
167
+ except Exception as e:
168
+ logger.debug("NLI inference error: %s", e)
169
+
170
  # ── Rule 2: Scan for refutation keywords ──────────────────────────────────
171
  refutation_hits = _scan_keywords(article_text, _REFUTATION_KEYWORDS)
172
  if refutation_hits:
extension/background.js CHANGED
@@ -20,7 +20,7 @@ const MAX_HISTORY = 50
20
 
21
  // ── Default settings ──────────────────────────────────────────────────────────
22
  const DEFAULT_SETTINGS = {
23
- apiBase: 'https://philverify.web.app/api',
24
  autoScan: true, // Automatically scan Facebook feed posts
25
  }
26
 
@@ -75,6 +75,7 @@ async function setCached(key, result, preview) {
75
  text_preview: preview.slice(0, 80),
76
  verdict: result.verdict,
77
  final_score: result.final_score,
 
78
  }
79
  const updated = [entry, ...history.filter(h => h.id !== key)].slice(0, MAX_HISTORY)
80
  await chrome.storage.local.set({ history: updated })
@@ -88,15 +89,17 @@ async function verifyText(text, imageUrl) {
88
  if (hit) return { ...hit, _fromCache: true }
89
 
90
  const { apiBase } = await getSettings()
91
- // Build payload β€” include imageUrl for multimodal (text + image) analysis
92
  const payload = { text }
93
  if (imageUrl && isHttpUrl(imageUrl)) payload.image_url = imageUrl
 
 
94
 
95
  const res = await fetch(`${apiBase}/verify/text`, {
96
  method: 'POST',
97
  headers: { 'Content-Type': 'application/json' },
98
  body: JSON.stringify(payload),
99
  })
 
100
  if (!res.ok) {
101
  const body = await res.json().catch(() => ({}))
102
  throw new Error(body.detail ?? `API error ${res.status}`)
@@ -112,11 +115,14 @@ async function verifyUrl(url) {
112
  if (hit) return { ...hit, _fromCache: true }
113
 
114
  const { apiBase } = await getSettings()
 
 
115
  const res = await fetch(`${apiBase}/verify/url`, {
116
  method: 'POST',
117
  headers: { 'Content-Type': 'application/json' },
118
  body: JSON.stringify({ url }),
119
  })
 
120
  if (!res.ok) {
121
  const body = await res.json().catch(() => ({}))
122
  throw new Error(body.detail ?? `API error ${res.status}`)
@@ -203,13 +209,35 @@ chrome.runtime.onMessage.addListener((msg, _sender, sendResponse) => {
203
  sendResponse({ ok: false, error: 'Invalid API URL: only http/https allowed' })
204
  return false
205
  }
206
- chrome.storage.local
207
- .set({ settings: incoming })
 
208
  .then(() => sendResponse({ ok: true }))
209
  return true
210
  }
211
 
 
 
 
 
 
 
 
 
212
  default:
213
  break
214
  }
215
  })
 
 
 
 
 
 
 
 
 
 
 
 
 
 
20
 
21
  // ── Default settings ──────────────────────────────────────────────────────────
22
  const DEFAULT_SETTINGS = {
23
+ apiBase: 'http://localhost:8000/api',
24
  autoScan: true, // Automatically scan Facebook feed posts
25
  }
26
 
 
75
  text_preview: preview.slice(0, 80),
76
  verdict: result.verdict,
77
  final_score: result.final_score,
78
+ model_tier: result.layer1?.model_tier ?? null,
79
  }
80
  const updated = [entry, ...history.filter(h => h.id !== key)].slice(0, MAX_HISTORY)
81
  await chrome.storage.local.set({ history: updated })
 
89
  if (hit) return { ...hit, _fromCache: true }
90
 
91
  const { apiBase } = await getSettings()
 
92
  const payload = { text }
93
  if (imageUrl && isHttpUrl(imageUrl)) payload.image_url = imageUrl
94
+
95
+ console.log('[PhilVerify BG] Calling API:', `${apiBase}/verify/text`, payload)
96
 
97
  const res = await fetch(`${apiBase}/verify/text`, {
98
  method: 'POST',
99
  headers: { 'Content-Type': 'application/json' },
100
  body: JSON.stringify(payload),
101
  })
102
+ console.log('[PhilVerify BG] API Response Status:', res.status)
103
  if (!res.ok) {
104
  const body = await res.json().catch(() => ({}))
105
  throw new Error(body.detail ?? `API error ${res.status}`)
 
115
  if (hit) return { ...hit, _fromCache: true }
116
 
117
  const { apiBase } = await getSettings()
118
+ console.log('[PhilVerify BG] Calling API:', `${apiBase}/verify/url`, url)
119
+
120
  const res = await fetch(`${apiBase}/verify/url`, {
121
  method: 'POST',
122
  headers: { 'Content-Type': 'application/json' },
123
  body: JSON.stringify({ url }),
124
  })
125
+ console.log('[PhilVerify BG] API Response Status:', res.status)
126
  if (!res.ok) {
127
  const body = await res.json().catch(() => ({}))
128
  throw new Error(body.detail ?? `API error ${res.status}`)
 
209
  sendResponse({ ok: false, error: 'Invalid API URL: only http/https allowed' })
210
  return false
211
  }
212
+ // Merge with existing settings so a partial update doesn't clobber other fields
213
+ getSettings()
214
+ .then(current => chrome.storage.local.set({ settings: { ...current, ...incoming } }))
215
  .then(() => sendResponse({ ok: true }))
216
  return true
217
  }
218
 
219
+ case 'CHECK_HEALTH': {
220
+ getSettings()
221
+ .then(({ apiBase }) => fetch(`${apiBase}/health`, { signal: AbortSignal.timeout(3000) }))
222
+ .then(res => sendResponse({ ok: res.ok, status: res.status }))
223
+ .catch(e => sendResponse({ ok: false, error: e.message }))
224
+ return true
225
+ }
226
+
227
  default:
228
  break
229
  }
230
  })
231
+
232
+ // ── SPA navigation: re-scan Facebook posts after pushState navigation ─────────
233
+ // Facebook is a single-page app — clicking Home/Profile/etc. does a pushState
234
+ // navigation without reloading the page. The content script stays alive but
235
+ // needs to re-scan for new post articles after the page content changes.
236
+ chrome.webNavigation.onHistoryStateUpdated.addListener((details) => {
237
+ if (details.url.includes('facebook.com')) {
238
+ chrome.tabs.sendMessage(details.tabId, { action: 'RE_SCAN_POSTS' }, () => {
239
+ // Suppress "no listener" errors when the content script isn't loaded yet
240
+ if (chrome.runtime.lastError) {}
241
+ })
242
+ }
243
+ })
extension/content.css CHANGED
@@ -10,8 +10,13 @@
10
  display: flex;
11
  justify-content: flex-end;
12
  padding: 4px 12px 8px;
13
- pointer-events: none;
14
- /* Let clicks pass through the wrapper */
 
 
 
 
 
15
  }
16
 
17
  .pv-verify-btn {
@@ -139,30 +144,67 @@
139
  }
140
  }
141
 
142
- /* ── Inline verification report ─────────────────────────────────────────────── */
143
- .pv-report {
144
- display: block;
145
- margin: 8px 12px 12px;
146
- padding: 14px 16px;
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
147
  background: #141414;
148
  border: 1px solid rgba(245, 240, 232, 0.1);
149
- border-radius: 8px;
 
150
  font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', system-ui, sans-serif;
151
  font-size: 11px;
152
  color: #f5f0e8;
153
- max-width: 480px;
154
- box-shadow: 0 4px 24px rgba(0, 0, 0, 0.5);
155
  position: relative;
156
- z-index: 50;
 
 
157
  }
158
 
 
 
 
 
 
 
 
 
 
 
 
 
159
  /* β€” Header */
160
  .pv-report-header {
161
  display: flex;
162
  align-items: center;
163
  justify-content: space-between;
164
- margin-bottom: 12px;
165
- padding-bottom: 8px;
166
  border-bottom: 1px solid rgba(245, 240, 232, 0.07);
167
  }
168
 
@@ -182,12 +224,12 @@
182
  padding: 2px 6px;
183
  border-radius: 4px;
184
  touch-action: manipulation;
185
- transition: color 0.15s ease;
186
  }
187
 
188
  .pv-report-close:hover {
189
  color: #f5f0e8;
190
- background: rgba(245, 240, 232, 0.05);
191
  }
192
 
193
  .pv-report-close:focus-visible {
@@ -196,18 +238,17 @@
196
 
197
  /* β€” Verdict row */
198
  .pv-report-verdict-row {
199
- padding: 10px 12px;
200
- margin-bottom: 12px;
201
  border-left: 3px solid #5c554e;
202
- border-radius: 0 4px 4px 0;
203
- background: rgba(245, 240, 232, 0.03);
204
  }
205
 
206
  .pv-report-verdict {
207
- font-size: 18px;
208
  font-weight: 800;
209
  letter-spacing: -0.01em;
210
- margin-bottom: 2px;
211
  }
212
 
213
  .pv-report-score-text {
@@ -236,7 +277,7 @@
236
  .pv-confidence-bar-fill {
237
  height: 100%;
238
  border-radius: 3px;
239
- transition: width 0.5s ease-out;
240
  }
241
 
242
  .pv-confidence-bar-value {
@@ -253,7 +294,7 @@
253
  display: flex;
254
  justify-content: space-between;
255
  align-items: center;
256
- padding: 6px 0;
257
  border-bottom: 1px solid rgba(245, 240, 232, 0.05);
258
  }
259
 
@@ -272,9 +313,9 @@
272
  color: #a89f94;
273
  }
274
 
275
- /* β€” Suspicious signals tags */
276
  .pv-report-signals {
277
- padding: 8px 0;
278
  border-bottom: 1px solid rgba(245, 240, 232, 0.05);
279
  }
280
 
@@ -282,7 +323,7 @@
282
  display: flex;
283
  flex-wrap: wrap;
284
  gap: 4px;
285
- margin-top: 6px;
286
  }
287
 
288
  .pv-report-tag {
@@ -298,14 +339,14 @@
298
 
299
  /* β€” Evidence sources */
300
  .pv-report-sources {
301
- padding: 8px 0;
302
  border-bottom: 1px solid rgba(245, 240, 232, 0.05);
303
  }
304
 
305
  .pv-report-sources-list {
306
  list-style: none;
307
  padding: 0;
308
- margin: 6px 0 0 0;
309
  display: flex;
310
  flex-direction: column;
311
  gap: 4px;
@@ -341,9 +382,9 @@
341
  flex-shrink: 0;
342
  }
343
 
344
- /* β€” Explanation / Claim */
345
  .pv-report-explanation {
346
- padding: 8px 0;
347
  border-bottom: 1px solid rgba(245, 240, 232, 0.05);
348
  }
349
 
@@ -351,14 +392,14 @@
351
  margin: 6px 0 0;
352
  font-size: 10px;
353
  color: #a89f94;
354
- line-height: 1.5;
355
  font-style: italic;
356
  }
357
 
358
- /* β€” Full analysis link */
359
  .pv-report-full-link {
360
  display: block;
361
- margin-top: 10px;
362
  text-align: center;
363
  color: #dc2626;
364
  font-size: 10px;
@@ -366,12 +407,42 @@
366
  letter-spacing: 0.08em;
367
  text-decoration: none;
368
  text-transform: uppercase;
369
- padding: 6px;
370
  border: 1px solid rgba(220, 38, 38, 0.3);
371
- border-radius: 4px;
372
  transition: background 0.15s ease;
373
  }
374
 
375
  .pv-report-full-link:hover {
376
- background: rgba(220, 38, 38, 0.08);
377
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
10
  display: flex;
11
  justify-content: flex-end;
12
  padding: 4px 12px 8px;
13
+ /* pointer-events must remain auto — do NOT set to none here */
14
+ }
15
+
16
+ /* When button is injected directly (strategy 1, no wrapper) */
17
+ div > .pv-verify-btn:not(.pv-verify-btn-wrapper .pv-verify-btn) {
18
+ margin-left: 6px;
19
+ vertical-align: middle;
20
  }
21
 
22
  .pv-verify-btn {
 
144
  }
145
  }
146
 
147
+ /* ── Modal overlay ───────────────────────────────────────────────────────────── */
148
+ .pv-modal-overlay {
149
+ position: fixed;
150
+ inset: 0;
151
+ z-index: 2147483640;
152
+ display: flex;
153
+ align-items: center;
154
+ justify-content: center;
155
+ padding: 16px;
156
+ background: rgba(0, 0, 0, 0);
157
+ backdrop-filter: blur(0px);
158
+ -webkit-backdrop-filter: blur(0px);
159
+ transition: background 0.2s ease, backdrop-filter 0.2s ease;
160
+ pointer-events: none;
161
+ }
162
+
163
+ .pv-modal-overlay.pv-modal--open {
164
+ background: rgba(0, 0, 0, 0.65);
165
+ backdrop-filter: blur(4px);
166
+ -webkit-backdrop-filter: blur(4px);
167
+ pointer-events: auto;
168
+ }
169
+
170
+ .pv-modal-card {
171
+ width: 100%;
172
+ max-width: 460px;
173
+ max-height: 90vh;
174
+ overflow-y: auto;
175
  background: #141414;
176
  border: 1px solid rgba(245, 240, 232, 0.1);
177
+ border-radius: 12px;
178
+ padding: 18px 20px;
179
  font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', system-ui, sans-serif;
180
  font-size: 11px;
181
  color: #f5f0e8;
182
+ box-shadow: 0 24px 64px rgba(0, 0, 0, 0.7), 0 0 0 1px rgba(255,255,255,0.04);
 
183
  position: relative;
184
+ transform: scale(0.94) translateY(12px);
185
+ opacity: 0;
186
+ transition: transform 0.25s cubic-bezier(0.34, 1.56, 0.64, 1), opacity 0.2s ease;
187
  }
188
 
189
+ .pv-modal--open .pv-modal-card {
190
+ transform: scale(1) translateY(0);
191
+ opacity: 1;
192
+ }
193
+
194
+ /* Scrollbar styling for modal card */
195
+ .pv-modal-card::-webkit-scrollbar { width: 4px; }
196
+ .pv-modal-card::-webkit-scrollbar-track { background: transparent; }
197
+ .pv-modal-card::-webkit-scrollbar-thumb { background: rgba(245,240,232,0.15); border-radius: 2px; }
198
+
199
+ /* ── Report internals (shared between modal & future contexts) ───────────────── */
200
+
201
  /* β€” Header */
202
  .pv-report-header {
203
  display: flex;
204
  align-items: center;
205
  justify-content: space-between;
206
+ margin-bottom: 14px;
207
+ padding-bottom: 10px;
208
  border-bottom: 1px solid rgba(245, 240, 232, 0.07);
209
  }
210
 
 
224
  padding: 2px 6px;
225
  border-radius: 4px;
226
  touch-action: manipulation;
227
+ transition: color 0.15s ease, background 0.15s ease;
228
  }
229
 
230
  .pv-report-close:hover {
231
  color: #f5f0e8;
232
+ background: rgba(245, 240, 232, 0.07);
233
  }
234
 
235
  .pv-report-close:focus-visible {
 
238
 
239
  /* β€” Verdict row */
240
  .pv-report-verdict-row {
241
+ padding: 12px 14px;
242
+ margin-bottom: 14px;
243
  border-left: 3px solid #5c554e;
244
+ border-radius: 4px;
 
245
  }
246
 
247
  .pv-report-verdict {
248
+ font-size: 20px;
249
  font-weight: 800;
250
  letter-spacing: -0.01em;
251
+ margin-bottom: 3px;
252
  }
253
 
254
  .pv-report-score-text {
 
277
  .pv-confidence-bar-fill {
278
  height: 100%;
279
  border-radius: 3px;
280
+ transition: width 0.6s cubic-bezier(0.4, 0, 0.2, 1);
281
  }
282
 
283
  .pv-confidence-bar-value {
 
294
  display: flex;
295
  justify-content: space-between;
296
  align-items: center;
297
+ padding: 7px 0;
298
  border-bottom: 1px solid rgba(245, 240, 232, 0.05);
299
  }
300
 
 
313
  color: #a89f94;
314
  }
315
 
316
+ /* β€” Suspicious signals */
317
  .pv-report-signals {
318
+ padding: 10px 0;
319
  border-bottom: 1px solid rgba(245, 240, 232, 0.05);
320
  }
321
 
 
323
  display: flex;
324
  flex-wrap: wrap;
325
  gap: 4px;
326
+ margin-top: 8px;
327
  }
328
 
329
  .pv-report-tag {
 
339
 
340
  /* β€” Evidence sources */
341
  .pv-report-sources {
342
+ padding: 10px 0;
343
  border-bottom: 1px solid rgba(245, 240, 232, 0.05);
344
  }
345
 
346
  .pv-report-sources-list {
347
  list-style: none;
348
  padding: 0;
349
+ margin: 8px 0 0 0;
350
  display: flex;
351
  flex-direction: column;
352
  gap: 4px;
 
382
  flex-shrink: 0;
383
  }
384
 
385
+ /* β€” Claim analyzed */
386
  .pv-report-explanation {
387
+ padding: 10px 0;
388
  border-bottom: 1px solid rgba(245, 240, 232, 0.05);
389
  }
390
 
 
392
  margin: 6px 0 0;
393
  font-size: 10px;
394
  color: #a89f94;
395
+ line-height: 1.6;
396
  font-style: italic;
397
  }
398
 
399
+ /* β€” Full dashboard link */
400
  .pv-report-full-link {
401
  display: block;
402
+ margin-top: 14px;
403
  text-align: center;
404
  color: #dc2626;
405
  font-size: 10px;
 
407
  letter-spacing: 0.08em;
408
  text-decoration: none;
409
  text-transform: uppercase;
410
+ padding: 8px;
411
  border: 1px solid rgba(220, 38, 38, 0.3);
412
+ border-radius: 6px;
413
  transition: background 0.15s ease;
414
  }
415
 
416
  .pv-report-full-link:hover {
417
+ background: rgba(220, 38, 38, 0.1);
418
+ }
419
+
420
+ /* ── Metadata footer (model_tier + claim_method) ────────────────────────────── */
421
+ .pv-report-meta-footer {
422
+ display: flex;
423
+ align-items: center;
424
+ gap: 5px;
425
+ padding: 8px 0 4px;
426
+ border-top: 1px solid rgba(245, 240, 232, 0.05);
427
+ margin-top: 4px;
428
+ }
429
+
430
+ .pv-report-meta-label {
431
+ font-size: 8px;
432
+ font-weight: 700;
433
+ letter-spacing: 0.1em;
434
+ color: #5c554e;
435
+ text-transform: uppercase;
436
+ }
437
+
438
+ .pv-report-meta-val {
439
+ font-size: 9px;
440
+ font-family: 'SF Mono', 'Menlo', monospace;
441
+ color: #6b7280;
442
+ }
443
+
444
+ .pv-report-meta-sep {
445
+ color: rgba(245, 240, 232, 0.12);
446
+ font-size: 10px;
447
+ margin: 0 1px;
448
+ }
extension/content.js CHANGED
@@ -176,15 +176,59 @@
176
  }
177
  }
178
 
 
 
 
 
 
 
 
 
179
  function extractPostText(post) {
180
  expandSeeMore(post)
181
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
182
  // Primary selectors β€” platform-specific, high confidence
183
- for (const sel of CFG.text) {
184
- const el = post.querySelector(sel)
185
- if (el?.innerText?.trim().length >= MIN_TEXT_LENGTH) {
186
- log('Text extracted via primary selector:', sel)
187
- return el.innerText.trim().slice(0, 2000)
 
 
 
 
 
 
 
 
188
  }
189
  }
190
 
@@ -200,33 +244,81 @@
200
  return t.slice(0, 2000)
201
  }
202
  }
203
- // Last resort: standalone [dir="auto"] with substantial text,
204
- // excluding comments, headers, and nav elements
205
  for (const el of post.querySelectorAll('[dir="auto"]')) {
206
  if (el.closest('[role="navigation"]') || el.closest('header') || el.closest('[data-testid="UFI2Comment"]')) continue
207
- // Also skip if inside a nested comment article
208
  const parentArticle = el.closest('[role="article"]')
209
- if (parentArticle && parentArticle !== post) continue
 
 
210
  const t = el.innerText?.trim()
211
- if (t && t.length >= MIN_TEXT_LENGTH && !t.startsWith('http')) {
212
  log('Text extracted via broad [dir="auto"] fallback (filtered)')
213
  return t.slice(0, 2000)
214
  }
215
  }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
216
  }
217
 
218
- // General fallback: any span with substantial text
219
  for (const span of post.querySelectorAll('span')) {
220
  const t = span.innerText?.trim()
221
- if (t && t.length >= MIN_TEXT_LENGTH && !t.startsWith('http')) {
222
  // Skip if inside a nested comment article
223
  const parentArticle = span.closest('[role="article"]')
224
- if (parentArticle && parentArticle !== post) continue
225
  log('Text extracted via span fallback')
226
  return t.slice(0, 2000)
227
  }
228
  }
229
 
 
 
 
 
 
 
 
 
 
 
 
 
 
230
  log('No text found in post')
231
  return null
232
  }
@@ -234,7 +326,18 @@
234
  function extractPostUrl(post) {
235
  for (const sel of (CFG.link ?? [])) {
236
  const el = post.querySelector(sel)
237
- if (el?.href) return CFG.unwrapUrl(el)
 
 
 
 
 
 
 
 
 
 
 
238
  }
239
  return null
240
  }
@@ -249,12 +352,19 @@
249
  function extractPostImage(post) {
250
  if (!CFG.image) return null
251
 
252
- const allImgs = Array.from(post.querySelectorAll(CFG.image))
 
 
 
 
 
 
253
  if (!allImgs.length) { log('No candidate images found'); return null }
254
 
255
  // Build a set of avatar container elements to check ancestry against
 
256
  const avatarContainers = (CFG.avatarContainers ?? []).flatMap(sel =>
257
- Array.from(post.querySelectorAll(sel))
258
  )
259
 
260
  const contentImgs = allImgs.filter(img => {
@@ -287,108 +397,118 @@
287
  return src
288
  }
289
 
290
- // ── Post discovery (feed-based strategy) ───────────────────────────────────
291
 
292
  /**
293
- * Checks if a [role="article"] element is a top-level post (not a comment).
294
- *
295
- * PRIMARY STRATEGY: Use [role="feed"] as the anchor.
296
- * - [role="feed"] is a WAI-ARIA landmark that Facebook keeps for accessibility.
297
- * - Direct children of the feed are always posts (wrapped in <div> containers).
298
- * - Comments are always deeper nested inside another [role="article"].
299
  *
300
- * This function checks:
301
- * 1. Is this article a direct descendant of [role="feed"]? β†’ It's a post.
302
- * 2. Is this article nested inside another article? β†’ It's a comment.
303
- * 3. Neither? Use URL-based heuristic for detail pages.
304
  */
305
- function isTopLevelPost(el) {
306
- if (PLATFORM !== 'facebook') return true
307
- if (el.getAttribute('role') !== 'article') return true
308
-
309
- // ── Check 1: Is this article nested inside another article?
310
- // If yes, it's definitely a comment (true for both feed and detail pages).
311
- const parentArticle = el.parentElement?.closest('[role="article"]')
312
- if (parentArticle) {
313
- log('Skipping comment (nested inside parent article)')
314
- return false
315
- }
316
-
317
- // ── Check 2: Is this article a child of [role="feed"]?
318
- // Direct children of the feed are always posts.
319
- const feedAncestor = el.closest('[role="feed"]')
320
- if (feedAncestor) {
321
- // This article is inside the feed and NOT nested in another article β†’ post
322
- return true
323
- }
324
 
325
- // ── Check 3: Not in a feed β€” could be a detail page.
326
- // On detail pages (e.g. /posts/123, /permalink/, /photo/),
327
- // the FIRST [role="article"] on the page is the main post.
328
- // All subsequent ones are comments.
329
- const path = window.location.pathname + window.location.search
330
- const isDetailPage = /\/(posts|photos|permalink|story\.php|watch|reel|videos)/.test(path)
331
- if (isDetailPage) {
332
- const allArticles = document.querySelectorAll('[role="article"]')
333
- if (allArticles.length > 0 && allArticles[0] === el) {
334
- // First article on a detail page β†’ the main post
335
- return true
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
336
  }
337
- // Not the first article on a detail page β†’ comment
338
- log('Skipping comment (detail page, not the first article)')
339
- return false
340
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
341
 
342
- // ── Fallback: Allow it (could be a page layout we haven't seen)
343
- // Better to show a button on something unexpected than miss a real post.
344
- return true
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
345
  }
346
 
347
  /**
348
- * Find posts in the given DOM subtree.
349
- *
350
- * Two-pass strategy for Facebook:
351
- * Pass 1: Find [role="feed"] container β†’ get [role="article"] elements
352
- * that are direct children of the feed (not nested in other articles)
353
- * Pass 2: If no feed found (detail pages, etc.), fall back to all
354
- * [role="article"] elements filtered by isTopLevelPost()
355
- *
356
- * For Twitter and other platforms, uses POST_SELECTORS directly.
357
  */
358
  function findPosts(root) {
359
- if (PLATFORM === 'facebook') {
360
- // ── Pass 1: Feed-based detection (most reliable)
361
- const feeds = root.querySelectorAll('[role="feed"]')
362
- if (feeds.length === 0 && root.getAttribute?.('role') === 'feed') {
363
- // root itself might be the feed
364
- const articles = Array.from(root.querySelectorAll('[role="article"]'))
365
- .filter(el => !el.parentElement?.closest('[role="article"]'))
366
- if (articles.length) {
367
- log(`Found ${articles.length} posts via feed (root is feed)`)
368
- return articles
369
- }
370
- }
371
- for (const feed of feeds) {
372
- // Get all articles inside this feed that are NOT nested in another article
373
- const articles = Array.from(feed.querySelectorAll('[role="article"]'))
374
- .filter(el => !el.parentElement?.closest('[role="article"]'))
375
- if (articles.length) {
376
- log(`Found ${articles.length} posts via [role="feed"] container`)
377
- return articles
378
- }
379
- }
380
-
381
- // ── Pass 2: No feed container found β€” detail page or unusual layout
382
- const allArticles = Array.from(root.querySelectorAll('[role="article"]'))
383
- const topLevel = allArticles.filter(el => isTopLevelPost(el))
384
- if (topLevel.length) {
385
- log(`Found ${topLevel.length} posts via fallback (no feed container)`)
386
- return topLevel
387
- }
388
- return []
389
- }
390
-
391
- // Non-Facebook platforms: simple selector matching
392
  for (const sel of POST_SELECTORS) {
393
  const found = Array.from(root.querySelectorAll(sel))
394
  if (found.length) return found
@@ -408,15 +528,6 @@
408
  if (post.dataset.philverifyBtn) return
409
  post.dataset.philverifyBtn = 'true'
410
 
411
- // Note: We do NOT gate on content availability here.
412
- // Facebook lazy-loads post content via React hydration, so text/images
413
- // may not be in the DOM yet when this runs. Content is checked at click
414
- // time (in handleVerifyClick) when everything is fully rendered.
415
-
416
- // Create wrapper (flex container for right-alignment)
417
- const wrapper = document.createElement('div')
418
- wrapper.className = 'pv-verify-btn-wrapper'
419
-
420
  // Create the button
421
  const btn = document.createElement('button')
422
  btn.className = 'pv-verify-btn'
@@ -443,29 +554,85 @@
443
  handleVerifyClick(post, btn)
444
  })
445
 
446
- wrapper.appendChild(btn)
447
-
448
- // Insert the wrapper inline in the post.
449
- // Strategy: Find a good insertion point near the bottom of the
450
- // visible post content, but BEFORE the comments section.
451
- // On Facebook, we look for the action bar area or similar landmarks.
452
  let inserted = false
 
453
  if (PLATFORM === 'facebook') {
454
- // Try to insert after the action bar (Like/Comment/Share row)
455
- const actionBar = post.querySelector('[role="toolbar"]') ||
456
- post.querySelector('[aria-label*="Like"]')?.closest('div:not([role="article"])')
457
- if (actionBar?.parentElement) {
458
- actionBar.parentElement.insertBefore(wrapper, actionBar.nextSibling)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
459
  inserted = true
 
460
  }
461
  }
462
 
463
- // Fallback: just append to the post (works for Twitter and other platforms)
464
  if (!inserted) {
 
 
 
465
  post.appendChild(wrapper)
 
466
  }
467
-
468
- log('Verify button injected on post')
469
  }
470
 
471
  // ── Verify click handler ──────────────────────────────────────────────────
@@ -490,42 +657,96 @@
490
  const url = extractPostUrl(post)
491
  const image = extractPostImage(post)
492
 
 
 
493
  log(`Verify clicked: text=${!!text} (${text?.length ?? 0} chars), url=${!!url}, image=${!!image}`)
494
 
495
  // Determine what to send
496
  let inputSummary = ''
497
  if (!text && !url && !image) {
 
498
  showErrorReport(post, btn, 'Could not read post content β€” no text or image found.')
499
  return
500
  }
501
 
502
  try {
503
  let msgPayload
 
504
 
 
505
  if (url) {
506
  msgPayload = { type: 'VERIFY_URL', url }
 
507
  inputSummary = 'Shared link analyzed'
508
  } else if (text && image) {
509
  msgPayload = { type: 'VERIFY_TEXT', text, imageUrl: image }
 
510
  inputSummary = 'Caption + image analyzed'
511
  } else if (text) {
512
  msgPayload = { type: 'VERIFY_TEXT', text }
 
513
  inputSummary = 'Caption text only'
514
  } else {
515
  msgPayload = { type: 'VERIFY_IMAGE_URL', imageUrl: image }
 
516
  inputSummary = 'Image only (OCR)'
517
  }
518
 
519
- const response = await new Promise((resolve, reject) => {
520
- chrome.runtime.sendMessage(msgPayload, (resp) => {
521
- if (chrome.runtime.lastError) reject(new Error(chrome.runtime.lastError.message))
522
- else if (!resp?.ok) reject(new Error(resp?.error ?? 'Unknown error'))
523
- else resolve(resp.result)
 
 
 
 
 
 
 
 
 
 
 
 
524
  })
525
- })
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
526
 
527
  log(`Verification result: verdict=${response.verdict}, score=${response.final_score}`)
528
- showVerificationReport(post, btn, response, inputSummary)
 
529
  } catch (err) {
530
  warn('Verification failed:', err.message)
531
  showErrorReport(post, btn, err.message)
@@ -534,13 +755,12 @@
534
 
535
  // ── Verification report rendering ─────────────────────────────────────────
536
 
537
- function showVerificationReport(post, btn, result, inputSummary) {
538
  // Remove the button
539
  btn.remove()
540
 
541
- // Remove any existing report on this post
542
- const existing = post.querySelector('.pv-report')
543
- if (existing) existing.remove()
544
 
545
  const verdict = result.verdict ?? 'Unknown'
546
  const color = VERDICT_COLORS[verdict] ?? '#5c554e'
@@ -553,13 +773,36 @@
553
  const features = result.layer1?.triggered_features ?? []
554
  const cached = result._fromCache ? ' Β· cached' : ''
555
 
556
- // Build report using createElement (no innerHTML for XSS safety)
557
- const report = document.createElement('div')
558
- report.className = 'pv-report'
559
- report.setAttribute('role', 'region')
560
- report.setAttribute('aria-label', 'PhilVerify fact-check report')
 
 
 
 
 
 
 
 
 
 
 
561
 
562
- // β€” Header row
 
 
 
 
 
 
 
 
 
 
 
 
563
  const header = document.createElement('div')
564
  header.className = 'pv-report-header'
565
 
@@ -571,22 +814,17 @@
571
  closeBtn.className = 'pv-report-close'
572
  closeBtn.textContent = 'βœ•'
573
  closeBtn.setAttribute('aria-label', 'Close fact-check report')
574
- closeBtn.addEventListener('click', (e) => {
575
- e.stopPropagation()
576
- report.remove()
577
- // Re-inject the verify button so user can re-verify
578
- delete post.dataset.philverifyBtn
579
- injectVerifyButton(post)
580
- })
581
 
582
  header.appendChild(logo)
583
  header.appendChild(closeBtn)
584
- report.appendChild(header)
585
 
586
- // β€” Verdict row (large, prominent)
587
  const verdictRow = document.createElement('div')
588
  verdictRow.className = 'pv-report-verdict-row'
589
  verdictRow.style.borderLeftColor = color
 
590
 
591
  const verdictLabel = document.createElement('div')
592
  verdictLabel.className = 'pv-report-verdict'
@@ -599,7 +837,7 @@
599
 
600
  verdictRow.appendChild(verdictLabel)
601
  verdictRow.appendChild(scoreText)
602
- report.appendChild(verdictRow)
603
 
604
  // β€” Confidence bar
605
  const barWrap = document.createElement('div')
@@ -614,7 +852,7 @@
614
 
615
  const barFill = document.createElement('div')
616
  barFill.className = 'pv-confidence-bar-fill'
617
- barFill.style.width = `${Math.min(score, 100)}%`
618
  barFill.style.background = color
619
 
620
  const barValue = document.createElement('span')
@@ -625,9 +863,9 @@
625
  barWrap.appendChild(barLabel)
626
  barWrap.appendChild(barTrack)
627
  barWrap.appendChild(barValue)
628
- report.appendChild(barWrap)
629
 
630
- // β€” Info rows (Language, Input)
631
  const addInfoRow = (labelText, valueText) => {
632
  const row = document.createElement('div')
633
  row.className = 'pv-report-row'
@@ -639,22 +877,65 @@
639
  val.textContent = valueText
640
  row.appendChild(lbl)
641
  row.appendChild(val)
642
- report.appendChild(row)
643
  }
644
 
645
  addInfoRow('LANGUAGE', safeText(language))
646
  addInfoRow('INPUT', safeText(inputSummary))
647
 
648
- // β€” Triggered signals/features
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
649
  if (features.length > 0) {
650
  const signalsSection = document.createElement('div')
651
  signalsSection.className = 'pv-report-signals'
652
-
653
  const signalsLabel = document.createElement('span')
654
  signalsLabel.className = 'pv-report-label'
655
  signalsLabel.textContent = 'SUSPICIOUS SIGNALS'
656
  signalsSection.appendChild(signalsLabel)
657
-
658
  const tagsWrap = document.createElement('div')
659
  tagsWrap.className = 'pv-report-tags'
660
  for (const f of features.slice(0, 5)) {
@@ -664,45 +945,43 @@
664
  tagsWrap.appendChild(tag)
665
  }
666
  signalsSection.appendChild(tagsWrap)
667
- report.appendChild(signalsSection)
668
  }
669
 
670
  // β€” Evidence sources
671
  if (sources.length > 0) {
672
  const sourcesSection = document.createElement('div')
673
  sourcesSection.className = 'pv-report-sources'
674
-
675
  const sourcesLabel = document.createElement('span')
676
  sourcesLabel.className = 'pv-report-label'
677
  sourcesLabel.textContent = 'EVIDENCE SOURCES'
678
  sourcesSection.appendChild(sourcesLabel)
679
-
680
  const sourcesList = document.createElement('ul')
681
  sourcesList.className = 'pv-report-sources-list'
682
-
683
  for (const src of sources.slice(0, 5)) {
684
  const li = document.createElement('li')
685
  li.className = 'pv-report-source-item'
686
-
687
  const link = document.createElement('a')
688
  link.href = safeUrl(src.url)
689
  link.target = '_blank'
690
  link.rel = 'noreferrer'
691
  link.className = 'pv-report-source-link'
692
  link.textContent = src.title?.slice(0, 60) ?? src.source_name ?? 'View source'
693
-
694
  const stance = document.createElement('span')
695
  stance.className = 'pv-report-source-stance'
696
  stance.textContent = src.stance ?? ''
697
  if (src.stance === 'Refutes') stance.style.color = '#dc2626'
698
  if (src.stance === 'Supports') stance.style.color = '#16a34a'
699
-
 
 
 
700
  li.appendChild(link)
701
  li.appendChild(stance)
702
  sourcesList.appendChild(li)
703
  }
704
  sourcesSection.appendChild(sourcesList)
705
- report.appendChild(sourcesSection)
706
  }
707
 
708
  // β€” Explanation (claim used)
@@ -717,7 +996,42 @@
717
  explText.textContent = result.layer2.claim_used
718
  explanation.appendChild(explLabel)
719
  explanation.appendChild(explText)
720
- report.appendChild(explanation)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
721
  }
722
 
723
  // β€” Full analysis link
@@ -727,14 +1041,22 @@
727
  fullLink.target = '_blank'
728
  fullLink.rel = 'noreferrer'
729
  fullLink.textContent = 'Open Full Dashboard β†—'
730
- report.appendChild(fullLink)
731
-
732
- // Insert report into post
733
- post.appendChild(report)
 
 
 
 
 
 
 
 
 
734
  }
735
 
736
  function showErrorReport(post, btn, errorMessage) {
737
- // Remove spinner, restore button as error state
738
  btn.classList.remove('pv-verify-btn--loading')
739
  btn.classList.add('pv-verify-btn--error')
740
  btn.disabled = false
@@ -744,18 +1066,21 @@
744
 
745
  const icon = btn.querySelector('.pv-verify-btn-icon')
746
  const label = btn.querySelector('.pv-verify-btn-label')
747
- if (icon) icon.textContent = '⚠️'
748
- if (label) label.textContent = 'Verification failed β€” tap to retry'
749
 
750
- // On next click, retry
751
- const retryHandler = (e) => {
752
- e.stopPropagation()
753
- e.preventDefault()
754
- btn.removeEventListener('click', retryHandler)
755
- btn.classList.remove('pv-verify-btn--error')
756
- handleVerifyClick(post, btn)
 
 
757
  }
758
 
 
 
 
759
  // Remove old click listeners by replacing element
760
  const newBtn = btn.cloneNode(true)
761
  btn.replaceWith(newBtn)
@@ -769,6 +1094,17 @@
769
 
770
  // ── MutationObserver ──────────────────────────────────────────────────────
771
 
 
 
 
 
 
 
 
 
 
 
 
772
  const pendingPosts = new Set()
773
  let rafScheduled = false
774
 
@@ -786,33 +1122,15 @@
786
  }
787
  }
788
 
789
- const observer = new MutationObserver((mutations) => {
790
- for (const mutation of mutations) {
791
- for (const node of mutation.addedNodes) {
792
- if (node.nodeType !== 1) continue // element nodes only
793
-
794
- if (PLATFORM === 'facebook') {
795
- // Facebook strategy: only process nodes that are inside [role="feed"]
796
- // or that contain a feed. This prevents processing individual comment
797
- // nodes that are added dynamically.
798
- const inFeed = node.closest?.('[role="feed"]') ||
799
- node.querySelector?.('[role="feed"]') ||
800
- node.getAttribute?.('role') === 'feed'
801
- if (!inFeed && node.getAttribute?.('role') === 'article') {
802
- // An article added outside of a feed β€” could be a detail page.
803
- // Only process if isTopLevelPost says it's a post.
804
- if (isTopLevelPost(node)) {
805
- scheduleProcess(node)
806
- }
807
- continue
808
- }
809
- }
810
-
811
- // Check descendants for posts (findPosts handles feed-based filtering)
812
- const posts = findPosts(node)
813
- for (const post of posts) scheduleProcess(post)
814
- }
815
  }
 
 
 
816
  })
817
 
818
  // ── Initialization ────────────────────────────────────────────────────────
@@ -821,40 +1139,59 @@
821
  log(`Initializing on ${PLATFORM} (${window.location.hostname})`)
822
 
823
  // Check autoScan setting β€” controls whether buttons are shown at all
824
- let response
 
825
  try {
826
- response = await new Promise((resolve, reject) => {
827
- chrome.runtime.sendMessage({ type: 'GET_SETTINGS' }, (r) => {
828
- if (chrome.runtime.lastError) {
829
- warn('Settings fetch error:', chrome.runtime.lastError.message)
830
- resolve({ autoScan: true })
831
- } else {
832
- resolve(r ?? { autoScan: true })
833
- }
834
- })
835
- })
836
  } catch {
837
  response = { autoScan: true }
838
  }
839
 
840
  log('Settings:', response)
841
  if (response?.autoScan === false) {
842
- log('Auto-scan disabled by settings β€” no verify buttons will be shown')
843
  return
844
  }
845
 
846
- // Process any posts already in the DOM
847
- const existing = findPosts(document.body)
848
- log(`Found ${existing.length} existing posts`)
849
- for (const post of existing) scheduleProcess(post)
850
-
851
- // Watch for new posts (both platforms are SPAs with infinite scroll)
852
- observer.observe(document.body, { childList: true, subtree: true })
853
- log('MutationObserver started β€” watching for new posts')
 
 
 
 
 
 
 
854
  }
855
 
856
  init()
857
 
 
 
 
 
 
 
 
 
 
 
 
 
858
  // ── Auto-verify news article pages (non-social) ────────────────────────────
859
  // When the content script runs on a PH news site (not the homepage),
860
  // it auto-verifies the current URL and injects a floating verdict banner.
@@ -863,7 +1200,7 @@
863
  const url = window.location.href
864
  const path = new URL(url).pathname
865
  // Skip homepages and section indexes (very short paths like / or /news)
866
- if (!path || path.length < 8 || path.split('/').filter(Boolean).length < 2) return
867
 
868
  const banner = document.createElement('div')
869
  banner.id = 'pv-auto-banner'
@@ -936,7 +1273,14 @@
936
  try {
937
  const response = await new Promise((resolve, reject) => {
938
  chrome.runtime.sendMessage({ type: 'VERIFY_URL', url }, (resp) => {
939
- if (chrome.runtime.lastError) reject(new Error(chrome.runtime.lastError.message))
 
 
 
 
 
 
 
940
  else if (!resp?.ok) reject(new Error(resp?.error ?? 'Unknown error'))
941
  else resolve(resp.result)
942
  })
 
176
  }
177
  }
178
 
179
+ /** Detect Facebook's character-obfuscation spans: "s o o p S d e t r n …" */
180
+ function isObfuscatedText(text) {
181
+ const tokens = text.split(/\s+/).filter(w => w.length > 0)
182
+ if (tokens.length < 8) return false
183
+ const singleCharCount = tokens.filter(w => w.length === 1).length
184
+ return singleCharCount / tokens.length > 0.5
185
+ }
186
+
187
  function extractPostText(post) {
188
  expandSeeMore(post)
189
 
190
+ // ── Reshare detection ─────────────────────────────────────────────────────
191
+ // Re-shared Facebook posts have a nested [role="article"] inside the outer
192
+ // post. The sharer's caption lives in the outer [data-ad-comet-preview="message"],
193
+ // while the ORIGINAL post content is inside the nested article.
194
+ // We want to fact-check the original content, not the sharer's commentary.
195
+ if (PLATFORM === 'facebook') {
196
+ const innerArticle = Array.from(post.querySelectorAll('[role="article"]'))
197
+ .find(el => el !== post)
198
+
199
+ if (innerArticle) {
200
+ for (const sel of CFG.text) {
201
+ const el = innerArticle.querySelector(sel)
202
+ const t = el?.innerText?.trim()
203
+ if (t && t.length >= MIN_TEXT_LENGTH) {
204
+ log('Reshared post: extracted original content from nested article via', sel)
205
+ return t.slice(0, 2000)
206
+ }
207
+ }
208
+ for (const el of innerArticle.querySelectorAll('[dir="auto"]')) {
209
+ const t = el.innerText?.trim()
210
+ if (t && t.length >= MIN_TEXT_LENGTH && !t.startsWith('http')) {
211
+ log('Reshared post: extracted original content via dir=auto in nested article')
212
+ return t.slice(0, 2000)
213
+ }
214
+ }
215
+ }
216
+ }
217
+
218
  // Primary selectors β€” platform-specific, high confidence
219
+ // Also search in the nearest article ancestor in case postElement is a sub-section
220
+ const primarySearchRoots = [post]
221
+ if (PLATFORM === 'facebook') {
222
+ const articleAncestor = post.closest?.('[role="article"]')
223
+ if (articleAncestor && articleAncestor !== post) primarySearchRoots.push(articleAncestor)
224
+ }
225
+ for (const root of primarySearchRoots) {
226
+ for (const sel of CFG.text) {
227
+ const el = root.querySelector(sel)
228
+ if (el?.innerText?.trim().length >= MIN_TEXT_LENGTH) {
229
+ log('Text extracted via primary selector:', sel)
230
+ return el.innerText.trim().slice(0, 2000)
231
+ }
232
  }
233
  }
234
 
 
244
  return t.slice(0, 2000)
245
  }
246
  }
247
+
248
+ // Broader [dir="auto"] scan β€” exclude comments, navs, headers
249
  for (const el of post.querySelectorAll('[dir="auto"]')) {
250
  if (el.closest('[role="navigation"]') || el.closest('header') || el.closest('[data-testid="UFI2Comment"]')) continue
 
251
  const parentArticle = el.closest('[role="article"]')
252
+ // Skip only if parentArticle is a completely separate subtree from post
253
+ // (i.e., it doesn't contain post). If post is inside parentArticle, that's fine.
254
+ if (parentArticle && parentArticle !== post && !parentArticle.contains(post)) continue
255
  const t = el.innerText?.trim()
256
+ if (t && t.length >= MIN_TEXT_LENGTH && !t.startsWith('http') && !isObfuscatedText(t)) {
257
  log('Text extracted via broad [dir="auto"] fallback (filtered)')
258
  return t.slice(0, 2000)
259
  }
260
  }
261
+
262
+ // Last resort for Facebook: walk UP the DOM from post to find the article,
263
+ // then collect all [dir="auto"] text from that full article.
264
+ // This handles cases where postElement is only a sub-section of the full post.
265
+ const fullArticle = post.closest?.('[role="article"]') ?? post
266
+ if (fullArticle !== post) {
267
+ for (const el of fullArticle.querySelectorAll('[dir="auto"]')) {
268
+ if (el.closest('[role="navigation"]') || el.closest('header')) continue
269
+ const t = el.innerText?.trim()
270
+ if (t && t.length >= MIN_TEXT_LENGTH && !t.startsWith('http')) {
271
+ log('Text extracted via full-article [dir="auto"] walk-up')
272
+ return t.slice(0, 2000)
273
+ }
274
+ }
275
+ // Combine all short [dir="auto"] fragments from the full article
276
+ const combined = Array.from(fullArticle.querySelectorAll('[dir="auto"]'))
277
+ .map(el => el.innerText?.trim())
278
+ .filter(t => t && t.length > 5 && !t.startsWith('http'))
279
+ .join(' ')
280
+ if (combined.length >= MIN_TEXT_LENGTH) {
281
+ log('Text extracted by combining dir=auto fragments in full article')
282
+ return combined.slice(0, 2000)
283
+ }
284
+ }
285
+
286
+ // Combine all short [dir="auto"] fragments in the current post element
287
+ const allDirAuto = Array.from(post.querySelectorAll('[dir="auto"]'))
288
+ .map(el => el.innerText?.trim())
289
+ .filter(t => t && t.length > 5 && !t.startsWith('http'))
290
+ .join(' ')
291
+ if (allDirAuto.length >= MIN_TEXT_LENGTH) {
292
+ log('Text extracted by combining dir=auto fragments')
293
+ return allDirAuto.slice(0, 2000)
294
+ }
295
  }
296
 
297
+ // General fallback: any span with substantial text (skip obfuscated char-spans)
298
  for (const span of post.querySelectorAll('span')) {
299
  const t = span.innerText?.trim()
300
+ if (t && t.length >= MIN_TEXT_LENGTH && !t.startsWith('http') && !isObfuscatedText(t)) {
301
  // Skip if inside a nested comment article
302
  const parentArticle = span.closest('[role="article"]')
303
+ if (parentArticle && parentArticle !== post && !parentArticle.contains(post)) continue
304
  log('Text extracted via span fallback')
305
  return t.slice(0, 2000)
306
  }
307
  }
308
 
309
+ // Walk UP the DOM and try the full article β€” covers cases where postElement
310
+ // is a small sub-section that doesn't contain the text itself
311
+ const ancestor = post.closest?.('[role="article"]')
312
+ if (ancestor && ancestor !== post) {
313
+ for (const span of ancestor.querySelectorAll('span')) {
314
+ const t = span.innerText?.trim()
315
+ if (t && t.length >= MIN_TEXT_LENGTH && !t.startsWith('http') && !isObfuscatedText(t)) {
316
+ log('Text extracted via ancestor span walk-up')
317
+ return t.slice(0, 2000)
318
+ }
319
+ }
320
+ }
321
+
322
  log('No text found in post')
323
  return null
324
  }
 
326
  function extractPostUrl(post) {
327
  for (const sel of (CFG.link ?? [])) {
328
  const el = post.querySelector(sel)
329
+ if (el?.href) {
330
+ const url = CFG.unwrapUrl(el)
331
+ // Skip common internal Facebook/Twitter links that aren't actually shared external content
332
+ if (PLATFORM === 'facebook') {
333
+ const u = url.toLowerCase()
334
+ if (u.includes('facebook.com') && !u.includes('l.php')) {
335
+ // Probably a profile link or internal post link, ignore as "URL input"
336
+ continue
337
+ }
338
+ }
339
+ return url
340
+ }
341
  }
342
  return null
343
  }
 
352
  function extractPostImage(post) {
353
  if (!CFG.image) return null
354
 
355
+ // Search in post, then fall back to the nearest article ancestor if nothing found.
356
+ // postElement from the walk-up may only wrap the message text, not the image.
357
+ let allImgs = Array.from(post.querySelectorAll(CFG.image))
358
+ if (!allImgs.length && PLATFORM === 'facebook') {
359
+ const articleAncestor = post.closest?.('[role="article"]')
360
+ if (articleAncestor) allImgs = Array.from(articleAncestor.querySelectorAll(CFG.image))
361
+ }
362
  if (!allImgs.length) { log('No candidate images found'); return null }
363
 
364
  // Build a set of avatar container elements to check ancestry against
365
+ const imgSearchRoot = post.closest?.('[role="article"]') ?? post
366
  const avatarContainers = (CFG.avatarContainers ?? []).flatMap(sel =>
367
+ Array.from(imgSearchRoot.querySelectorAll(sel))
368
  )
369
 
370
  const contentImgs = allImgs.filter(img => {
 
397
  return src
398
  }
399
 
400
+ // ── Post discovery ────────────────────────────────────────────────────────
401
 
402
  /**
403
+ * Facebook: Scan the entire document for [aria-label="Hide post"] buttons.
404
+ * This is the same proven anchor used by the classmate's working extension.
405
+ * Walk up from the button to find the enclosing post container, then inject.
 
 
 
406
  *
407
+ * Why this works better than [role="feed"] / [role="article"] detection:
408
+ * - Facebook's WAI-ARIA feed/article structure changes frequently
409
+ * - The "Hide post" βœ• button is rendered on EVERY post and is very stable
410
+ * - Walking up to find the enclosing article-level div is reliable
411
  */
412
+ function addButtonsToFacebookPosts() {
413
+ // Anchor buttons that appear in EVERY post header (both home feed and profile pages).
414
+ // "Actions for this post" is the β‹― button β€” always visible, never on comments.
415
+ const hideButtons = document.querySelectorAll(
416
+ '[aria-label="Actions for this post"], [aria-label="Hide post"], [aria-label="hide post"], [aria-label="Hide or report this"], [aria-label="Edit post"], [aria-label="Edit memory"]'
417
+ )
 
 
 
 
 
 
 
 
 
 
 
 
 
418
 
419
+ let added = 0
420
+ hideButtons.forEach((hideBtn) => {
421
+ const btnContainer = hideBtn.parentElement
422
+ const btnGrandparent = btnContainer?.parentElement
423
+ if (!btnContainer || !btnGrandparent) return
424
+
425
+ // Skip if we already injected on this container
426
+ if (btnGrandparent.querySelector('.pv-verify-btn')) return
427
+
428
+ // Walk up from btnGrandparent to find the post container.
429
+ // Priority: container with a message attribute > non-empty article > first innerText>100.
430
+ // We don't stop on innerText>100 alone because the header grandparent often has
431
+ // that much text but doesn't contain the post body β€” keep walking for a better anchor.
432
+ let postElement = null
433
+ let innerTextFallback = null
434
+ let el = btnGrandparent
435
+ while (el && el !== document.body) {
436
+ // Best match: element that directly wraps the post message
437
+ if (el.querySelector('[data-ad-rendering-role="story_message"], [data-ad-comet-preview="message"]')) {
438
+ postElement = el; break
439
+ }
440
+ // Second best: an article/ARTICLE with actual content (non-skeleton)
441
+ if ((el.getAttribute('role') === 'article' || el.tagName === 'ARTICLE') &&
442
+ (el.innerText?.length ?? 0) > 100) {
443
+ postElement = el; break
444
+ }
445
+ // Track first innerText>100 as fallback (but keep walking for better match)
446
+ if (!innerTextFallback && (el.innerText?.length ?? 0) > 100) {
447
+ innerTextFallback = el
448
+ }
449
+ el = el.parentElement
450
  }
451
+ if (!postElement) postElement = innerTextFallback ?? btnGrandparent
452
+
453
+ // Skip if postElement is nested inside another article (comment / reshared post)
454
+ if (postElement.parentElement?.closest('[role="article"]')) return
455
+
456
+ // Skip if already injected on this post
457
+ if (postElement.dataset.philverifyBtn) return
458
+
459
+ // "Actions for this post" (β‹― button) and "Hide or report this" only appear in
460
+ // post headers, never on comments. Profile page posts don't have
461
+ // [data-ad-comet-preview] so skip the content check and place the button
462
+ // directly next to the anchor (for β‹―) or via injectVerifyButton (for the other).
463
+ const hideBtnLabel = hideBtn.getAttribute('aria-label')
464
+ // "Actions for this post" (β‹―) and "Hide or report this" are in post headers only.
465
+ // Delegate placement to injectVerifyButton so the button lands in the action bar.
466
+ if (hideBtnLabel === 'Actions for this post' || hideBtnLabel === 'Hide or report this') {
467
+ injectVerifyButton(postElement)
468
+ added++
469
+ return
470
+ }
471
+
472
+ // For all other anchor labels (Hide post, Edit post, Edit memory): require a
473
+ // post message container. These labels only exist on home feed posts which
474
+ // always have [data-ad-comet-preview="message"].
475
+ if (!postElement.querySelector(
476
+ '[data-ad-comet-preview="message"], [data-ad-rendering-role="story_message"]'
477
+ )) return
478
+
479
+ // Delegate to injectVerifyButton so placement uses the action bar (Like/Comment/Share)
480
+ // on all page types β€” avoids the button being hidden in the post header area.
481
+ injectVerifyButton(postElement)
482
+ added++
483
+ })
484
 
485
+ if (added > 0) log(`Added ${added} verify button(s) via hide-post anchor`)
486
+
487
+ // ── Supplementary scan: article-based (profile pages, group pages, etc.) ──
488
+ // Both profile posts AND comments are [role="article"] on Facebook.
489
+ // Posts are top-level (no parent article); comments are nested inside posts.
490
+ // The nesting check below correctly distinguishes them.
491
+ // Note: the previous comment injection bug was caused by [aria-label="Remove"]
492
+ // in the button-anchor pass (now removed), not by this scan.
493
+ let supplementaryAdded = 0
494
+ document.querySelectorAll('[role="article"]').forEach(article => {
495
+ if (article.dataset.philverifyBtn) return
496
+ if (article.parentElement?.closest('[role="article"]')) return
497
+ // Profile page [role="article"] elements are permanent loading skeletons with no
498
+ // real content. Only inject on articles that actually have post message content.
499
+ if (PLATFORM === 'facebook' && !article.querySelector(
500
+ '[data-ad-comet-preview="message"], [data-ad-rendering-role="story_message"]'
501
+ )) return
502
+ injectVerifyButton(article)
503
+ supplementaryAdded++
504
+ })
505
+ if (supplementaryAdded > 0) log(`Added ${supplementaryAdded} verify button(s) via article scan`)
506
  }
507
 
508
  /**
509
+ * For Twitter and news sites: use the original selector-based approach.
 
 
 
 
 
 
 
 
510
  */
511
  function findPosts(root) {
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
512
  for (const sel of POST_SELECTORS) {
513
  const found = Array.from(root.querySelectorAll(sel))
514
  if (found.length) return found
 
528
  if (post.dataset.philverifyBtn) return
529
  post.dataset.philverifyBtn = 'true'
530
 
 
 
 
 
 
 
 
 
 
531
  // Create the button
532
  const btn = document.createElement('button')
533
  btn.className = 'pv-verify-btn'
 
554
  handleVerifyClick(post, btn)
555
  })
556
 
557
+ // ── Insertion strategy ───────────────────────────────────────────────────
558
+ // Strategy 1 (most reliable β€” same anchor as classmate's working extension):
559
+ // The "hide post" βœ• button is stable across Facebook layout changes.
560
+ // Insert the verify button next to it in the post header.
 
 
561
  let inserted = false
562
+
563
  if (PLATFORM === 'facebook') {
564
+ // Strategy: Look for the action row (Like / Comment / Share)
565
+ // Use the Like button as anchor β€” present on ALL post types (home feed + profile)
566
+ // postElement from walk-up may be a sub-section, so also search the nearest article ancestor.
567
+ if (!inserted) {
568
+ const searchRoot = post.closest('[role="article"]') ?? post
569
+ const likeBtn =
570
+ searchRoot.querySelector('[aria-label="Like"], [aria-label^="Like:"]') ??
571
+ post.querySelector('[aria-label="Like"], [aria-label^="Like:"]')
572
+ const actionBar =
573
+ likeBtn?.closest('[role="toolbar"]') ??
574
+ likeBtn?.closest('[role="group"]') ??
575
+ searchRoot.querySelector('[role="toolbar"]') ??
576
+ searchRoot.querySelector('[aria-label*="Comment"]')?.closest('div:not([role="article"])')
577
+ if (actionBar?.parentElement) {
578
+ const wrapper = document.createElement('div')
579
+ wrapper.className = 'pv-verify-btn-wrapper'
580
+ wrapper.appendChild(btn)
581
+ actionBar.parentElement.insertBefore(wrapper, actionBar.nextSibling)
582
+ inserted = true
583
+ log('Verify button injected after action bar')
584
+ }
585
+ }
586
+
587
+ // Strategy 3: Insert after [data-ad-comet-preview] text block
588
+ if (!inserted) {
589
+ const msgBlock =
590
+ post.querySelector('[data-ad-comet-preview="message"]') ??
591
+ post.querySelector('[data-testid="post_message"]')
592
+ if (msgBlock?.parentElement) {
593
+ const wrapper = document.createElement('div')
594
+ wrapper.className = 'pv-verify-btn-wrapper'
595
+ wrapper.appendChild(btn)
596
+ msgBlock.parentElement.insertBefore(wrapper, msgBlock.nextSibling)
597
+ inserted = true
598
+ log('Verify button injected after message block')
599
+ }
600
+ }
601
+ }
602
+
603
+ // Twitter: insert after tweet text block
604
+ if (!inserted && PLATFORM === 'twitter') {
605
+ const tweetText = post.querySelector('[data-testid="tweetText"]')
606
+ if (tweetText?.parentElement) {
607
+ const wrapper = document.createElement('div')
608
+ wrapper.className = 'pv-verify-btn-wrapper'
609
+ wrapper.appendChild(btn)
610
+ tweetText.parentElement.insertBefore(wrapper, tweetText.nextSibling)
611
+ inserted = true
612
+ }
613
+ }
614
+
615
+ // News sites: inject after the h1 headline so the button is visible without scrolling
616
+ if (!inserted && PLATFORM === 'news') {
617
+ const h1 = post.querySelector('h1')
618
+ if (h1?.parentElement) {
619
+ const wrapper = document.createElement('div')
620
+ wrapper.className = 'pv-verify-btn-wrapper'
621
+ wrapper.appendChild(btn)
622
+ h1.parentElement.insertBefore(wrapper, h1.nextSibling)
623
  inserted = true
624
+ log('Verify button injected after h1 headline')
625
  }
626
  }
627
 
628
+ // Final fallback: append a wrapped button directly to the post
629
  if (!inserted) {
630
+ const wrapper = document.createElement('div')
631
+ wrapper.className = 'pv-verify-btn-wrapper'
632
+ wrapper.appendChild(btn)
633
  post.appendChild(wrapper)
634
+ log('Verify button injected via fallback (appended to post)')
635
  }
 
 
636
  }
637
 
638
  // ── Verify click handler ──────────────────────────────────────────────────
 
657
  const url = extractPostUrl(post)
658
  const image = extractPostImage(post)
659
 
660
+ console.log('[PhilVerify] Extracted:', { text, url, image })
661
+
662
  log(`Verify clicked: text=${!!text} (${text?.length ?? 0} chars), url=${!!url}, image=${!!image}`)
663
 
664
  // Determine what to send
665
  let inputSummary = ''
666
  if (!text && !url && !image) {
667
+ console.warn('[PhilVerify] Extraction failed: No content found.')
668
  showErrorReport(post, btn, 'Could not read post content β€” no text or image found.')
669
  return
670
  }
671
 
672
  try {
673
  let msgPayload
674
+ let usedType = ''
675
 
676
+ // Start by attempting URL verification if present
677
  if (url) {
678
  msgPayload = { type: 'VERIFY_URL', url }
679
+ usedType = 'URL'
680
  inputSummary = 'Shared link analyzed'
681
  } else if (text && image) {
682
  msgPayload = { type: 'VERIFY_TEXT', text, imageUrl: image }
683
+ usedType = 'TEXT'
684
  inputSummary = 'Caption + image analyzed'
685
  } else if (text) {
686
  msgPayload = { type: 'VERIFY_TEXT', text }
687
+ usedType = 'TEXT'
688
  inputSummary = 'Caption text only'
689
  } else {
690
  msgPayload = { type: 'VERIFY_IMAGE_URL', imageUrl: image }
691
+ usedType = 'IMAGE'
692
  inputSummary = 'Image only (OCR)'
693
  }
694
 
695
+ console.log(`[PhilVerify] Attempting ${usedType} verification:`, msgPayload)
696
+
697
+ let response
698
+ try {
699
+ response = await new Promise((resolve, reject) => {
700
+ chrome.runtime.sendMessage(msgPayload, (resp) => {
701
+ if (chrome.runtime.lastError) {
702
+ const msg = chrome.runtime.lastError.message ?? ''
703
+ reject(new Error(
704
+ msg.includes('Extension context invalidated')
705
+ ? 'Extension was reloaded β€” please refresh the page to re-activate PhilVerify.'
706
+ : msg
707
+ ))
708
+ }
709
+ else if (!resp?.ok) reject(new Error(resp?.error ?? 'Unknown error'))
710
+ else resolve(resp.result)
711
+ })
712
  })
713
+ } catch (err) {
714
+ // FALLBACK LOGIC: If URL verification failed but we have text, try verifying the text instead
715
+ if (usedType === 'URL' && text && text.length >= MIN_TEXT_LENGTH) {
716
+ warn('URL verification failed, falling back to text verification:', err.message)
717
+
718
+ if (image) {
719
+ msgPayload = { type: 'VERIFY_TEXT', text, imageUrl: image }
720
+ inputSummary = 'Caption + image analyzed (fallback)'
721
+ } else {
722
+ msgPayload = { type: 'VERIFY_TEXT', text }
723
+ inputSummary = 'Caption text only (fallback)'
724
+ }
725
+
726
+ console.log('[PhilVerify] Fallback attempt (TEXT):', msgPayload)
727
+ response = await new Promise((resolve, reject) => {
728
+ chrome.runtime.sendMessage(msgPayload, (resp) => {
729
+ if (chrome.runtime.lastError) {
730
+ const msg = chrome.runtime.lastError.message ?? ''
731
+ reject(new Error(
732
+ msg.includes('Extension context invalidated')
733
+ ? 'Extension was reloaded β€” please refresh the page to re-activate PhilVerify.'
734
+ : msg
735
+ ))
736
+ }
737
+ else if (!resp?.ok) reject(new Error(resp?.error ?? 'Unknown error'))
738
+ else resolve(resp.result)
739
+ })
740
+ })
741
+ } else {
742
+ // Re-throw if no fallback possible
743
+ throw err
744
+ }
745
+ }
746
 
747
  log(`Verification result: verdict=${response.verdict}, score=${response.final_score}`)
748
+ const extractedText = usedType === 'URL' ? url : (usedType === 'TEXT' ? text : null)
749
+ showVerificationReport(post, btn, response, inputSummary, extractedText, image)
750
  } catch (err) {
751
  warn('Verification failed:', err.message)
752
  showErrorReport(post, btn, err.message)
 
755
 
756
  // ── Verification report rendering ─────────────────────────────────────────
757
 
758
+ function showVerificationReport(post, btn, result, inputSummary, extractedText, extractedImage) {
759
  // Remove the button
760
  btn.remove()
761
 
762
+ // Remove any existing modal
763
+ document.getElementById('pv-modal-overlay')?.remove()
 
764
 
765
  const verdict = result.verdict ?? 'Unknown'
766
  const color = VERDICT_COLORS[verdict] ?? '#5c554e'
 
773
  const features = result.layer1?.triggered_features ?? []
774
  const cached = result._fromCache ? ' Β· cached' : ''
775
 
776
+ // ── Backdrop overlay
777
+ const overlay = document.createElement('div')
778
+ overlay.id = 'pv-modal-overlay'
779
+ overlay.className = 'pv-modal-overlay'
780
+ overlay.setAttribute('role', 'dialog')
781
+ overlay.setAttribute('aria-modal', 'true')
782
+ overlay.setAttribute('aria-label', 'PhilVerify fact-check report')
783
+
784
+ function closeModal() {
785
+ overlay.classList.remove('pv-modal--open')
786
+ overlay.addEventListener('transitionend', () => {
787
+ overlay.remove()
788
+ delete post.dataset.philverifyBtn
789
+ addButtonsToFacebookPosts()
790
+ }, { once: true })
791
+ }
792
 
793
+ // Click outside card = close
794
+ overlay.addEventListener('click', (e) => {
795
+ if (e.target === overlay) closeModal()
796
+ })
797
+ // Escape key = close
798
+ const onKey = (e) => { if (e.key === 'Escape') { closeModal(); document.removeEventListener('keydown', onKey) } }
799
+ document.addEventListener('keydown', onKey)
800
+
801
+ // ── Modal card
802
+ const card = document.createElement('div')
803
+ card.className = 'pv-modal-card'
804
+
805
+ // β€” Header
806
  const header = document.createElement('div')
807
  header.className = 'pv-report-header'
808
 
 
814
  closeBtn.className = 'pv-report-close'
815
  closeBtn.textContent = 'βœ•'
816
  closeBtn.setAttribute('aria-label', 'Close fact-check report')
817
+ closeBtn.addEventListener('click', (e) => { e.stopPropagation(); closeModal() })
 
 
 
 
 
 
818
 
819
  header.appendChild(logo)
820
  header.appendChild(closeBtn)
821
+ card.appendChild(header)
822
 
823
+ // β€” Verdict row
824
  const verdictRow = document.createElement('div')
825
  verdictRow.className = 'pv-report-verdict-row'
826
  verdictRow.style.borderLeftColor = color
827
+ verdictRow.style.background = bg
828
 
829
  const verdictLabel = document.createElement('div')
830
  verdictLabel.className = 'pv-report-verdict'
 
837
 
838
  verdictRow.appendChild(verdictLabel)
839
  verdictRow.appendChild(scoreText)
840
+ card.appendChild(verdictRow)
841
 
842
  // β€” Confidence bar
843
  const barWrap = document.createElement('div')
 
852
 
853
  const barFill = document.createElement('div')
854
  barFill.className = 'pv-confidence-bar-fill'
855
+ barFill.style.width = '0'
856
  barFill.style.background = color
857
 
858
  const barValue = document.createElement('span')
 
863
  barWrap.appendChild(barLabel)
864
  barWrap.appendChild(barTrack)
865
  barWrap.appendChild(barValue)
866
+ card.appendChild(barWrap)
867
 
868
+ // β€” Info rows
869
  const addInfoRow = (labelText, valueText) => {
870
  const row = document.createElement('div')
871
  row.className = 'pv-report-row'
 
877
  val.textContent = valueText
878
  row.appendChild(lbl)
879
  row.appendChild(val)
880
+ card.appendChild(row)
881
  }
882
 
883
  addInfoRow('LANGUAGE', safeText(language))
884
  addInfoRow('INPUT', safeText(inputSummary))
885
 
886
+ // β€” Image analyzed (thumbnail + OCR text)
887
+ if (extractedImage) {
888
+ const imgSection = document.createElement('div')
889
+ imgSection.className = 'pv-report-explanation'
890
+ const imgLabel = document.createElement('span')
891
+ imgLabel.className = 'pv-report-label'
892
+ imgLabel.textContent = 'IMAGE ANALYZED'
893
+ const img = document.createElement('img')
894
+ img.src = extractedImage
895
+ img.alt = 'Extracted post image'
896
+ img.style.cssText = 'width:100%;border-radius:6px;margin-top:6px;display:block;'
897
+ imgSection.appendChild(imgLabel)
898
+ imgSection.appendChild(img)
899
+
900
+ // OCR text extracted from the image
901
+ if (result.ocr_text) {
902
+ const ocrLabel = document.createElement('span')
903
+ ocrLabel.className = 'pv-report-label'
904
+ ocrLabel.style.marginTop = '8px'
905
+ ocrLabel.textContent = 'IMAGE TEXT (OCR)'
906
+ const ocrPara = document.createElement('p')
907
+ ocrPara.className = 'pv-report-explanation-text'
908
+ ocrPara.textContent = safeText(result.ocr_text)
909
+ imgSection.appendChild(ocrLabel)
910
+ imgSection.appendChild(ocrPara)
911
+ }
912
+
913
+ card.appendChild(imgSection)
914
+ }
915
+
916
+ // β€” Caption / text analyzed (full text, no truncation)
917
+ if (extractedText) {
918
+ const textSection = document.createElement('div')
919
+ textSection.className = 'pv-report-explanation'
920
+ const textLabel = document.createElement('span')
921
+ textLabel.className = 'pv-report-label'
922
+ textLabel.textContent = 'CAPTION TEXT'
923
+ const textPara = document.createElement('p')
924
+ textPara.className = 'pv-report-explanation-text'
925
+ textPara.textContent = safeText(extractedText)
926
+ textSection.appendChild(textLabel)
927
+ textSection.appendChild(textPara)
928
+ card.appendChild(textSection)
929
+ }
930
+
931
+ // β€” Signals
932
  if (features.length > 0) {
933
  const signalsSection = document.createElement('div')
934
  signalsSection.className = 'pv-report-signals'
 
935
  const signalsLabel = document.createElement('span')
936
  signalsLabel.className = 'pv-report-label'
937
  signalsLabel.textContent = 'SUSPICIOUS SIGNALS'
938
  signalsSection.appendChild(signalsLabel)
 
939
  const tagsWrap = document.createElement('div')
940
  tagsWrap.className = 'pv-report-tags'
941
  for (const f of features.slice(0, 5)) {
 
945
  tagsWrap.appendChild(tag)
946
  }
947
  signalsSection.appendChild(tagsWrap)
948
+ card.appendChild(signalsSection)
949
  }
950
 
951
  // β€” Evidence sources
952
  if (sources.length > 0) {
953
  const sourcesSection = document.createElement('div')
954
  sourcesSection.className = 'pv-report-sources'
 
955
  const sourcesLabel = document.createElement('span')
956
  sourcesLabel.className = 'pv-report-label'
957
  sourcesLabel.textContent = 'EVIDENCE SOURCES'
958
  sourcesSection.appendChild(sourcesLabel)
 
959
  const sourcesList = document.createElement('ul')
960
  sourcesList.className = 'pv-report-sources-list'
 
961
  for (const src of sources.slice(0, 5)) {
962
  const li = document.createElement('li')
963
  li.className = 'pv-report-source-item'
 
964
  const link = document.createElement('a')
965
  link.href = safeUrl(src.url)
966
  link.target = '_blank'
967
  link.rel = 'noreferrer'
968
  link.className = 'pv-report-source-link'
969
  link.textContent = src.title?.slice(0, 60) ?? src.source_name ?? 'View source'
 
970
  const stance = document.createElement('span')
971
  stance.className = 'pv-report-source-stance'
972
  stance.textContent = src.stance ?? ''
973
  if (src.stance === 'Refutes') stance.style.color = '#dc2626'
974
  if (src.stance === 'Supports') stance.style.color = '#16a34a'
975
+ if (src.stance_reason) {
976
+ stance.title = src.stance_reason
977
+ stance.style.cursor = 'help'
978
+ }
979
  li.appendChild(link)
980
  li.appendChild(stance)
981
  sourcesList.appendChild(li)
982
  }
983
  sourcesSection.appendChild(sourcesList)
984
+ card.appendChild(sourcesSection)
985
  }
986
 
987
  // β€” Explanation (claim used)
 
996
  explText.textContent = result.layer2.claim_used
997
  explanation.appendChild(explLabel)
998
  explanation.appendChild(explText)
999
+ card.appendChild(explanation)
1000
+ }
1001
+
1002
+ // β€” Metadata footer (model tier + claim method)
1003
+ const modelTier = result.layer1?.model_tier
1004
+ const claimMethod = result.layer2?.claim_method
1005
+ if (modelTier || claimMethod) {
1006
+ const metaFooter = document.createElement('div')
1007
+ metaFooter.className = 'pv-report-meta-footer'
1008
+ if (modelTier) {
1009
+ const lbl = document.createElement('span')
1010
+ lbl.className = 'pv-report-meta-label'
1011
+ lbl.textContent = 'MODEL'
1012
+ const val = document.createElement('span')
1013
+ val.className = 'pv-report-meta-val'
1014
+ val.textContent = modelTier
1015
+ metaFooter.appendChild(lbl)
1016
+ metaFooter.appendChild(val)
1017
+ }
1018
+ if (modelTier && claimMethod) {
1019
+ const sep = document.createElement('span')
1020
+ sep.className = 'pv-report-meta-sep'
1021
+ sep.textContent = 'Β·'
1022
+ metaFooter.appendChild(sep)
1023
+ }
1024
+ if (claimMethod) {
1025
+ const lbl = document.createElement('span')
1026
+ lbl.className = 'pv-report-meta-label'
1027
+ lbl.textContent = 'VIA'
1028
+ const val = document.createElement('span')
1029
+ val.className = 'pv-report-meta-val'
1030
+ val.textContent = claimMethod
1031
+ metaFooter.appendChild(lbl)
1032
+ metaFooter.appendChild(val)
1033
+ }
1034
+ card.appendChild(metaFooter)
1035
  }
1036
 
1037
  // β€” Full analysis link
 
1041
  fullLink.target = '_blank'
1042
  fullLink.rel = 'noreferrer'
1043
  fullLink.textContent = 'Open Full Dashboard β†—'
1044
+ card.appendChild(fullLink)
1045
+
1046
+ // Assemble and show
1047
+ overlay.appendChild(card)
1048
+ document.body.appendChild(overlay)
1049
+
1050
+ // Trigger animation
1051
+ requestAnimationFrame(() => overlay.classList.add('pv-modal--open'))
1052
+
1053
+ // Animate the confidence bar fill
1054
+ setTimeout(() => {
1055
+ barFill.style.width = `${confidence}%`
1056
+ }, 300)
1057
  }
1058
 
1059
  function showErrorReport(post, btn, errorMessage) {
 
1060
  btn.classList.remove('pv-verify-btn--loading')
1061
  btn.classList.add('pv-verify-btn--error')
1062
  btn.disabled = false
 
1066
 
1067
  const icon = btn.querySelector('.pv-verify-btn-icon')
1068
  const label = btn.querySelector('.pv-verify-btn-label')
 
 
1069
 
1070
+ // Extension was reloaded β€” retrying is useless, user must refresh the tab
1071
+ const needsRefresh = errorMessage.includes('Extension was reloaded') ||
1072
+ errorMessage.includes('Extension context invalidated')
1073
+
1074
+ if (needsRefresh) {
1075
+ if (icon) icon.textContent = 'πŸ”„'
1076
+ if (label) label.textContent = 'Extension updated β€” refresh page'
1077
+ btn.disabled = true // No point retrying; force refresh
1078
+ return
1079
  }
1080
 
1081
+ if (icon) icon.textContent = '⚠️'
1082
+ if (label) label.textContent = 'Verification failed β€” tap to retry'
1083
+
1084
  // Remove old click listeners by replacing element
1085
  const newBtn = btn.cloneNode(true)
1086
  btn.replaceWith(newBtn)
 
1094
 
1095
  // ── MutationObserver ──────────────────────────────────────────────────────
1096
 
1097
+ // For Facebook: debounced full rescan (new posts appear via infinite scroll)
1098
+ let fbDebounceTimer = null
1099
+ function scheduleFacebookScan() {
1100
+ if (fbDebounceTimer) clearTimeout(fbDebounceTimer)
1101
+ fbDebounceTimer = setTimeout(() => {
1102
+ fbDebounceTimer = null
1103
+ addButtonsToFacebookPosts()
1104
+ }, 150)
1105
+ }
1106
+
1107
+ // For Twitter/news: RAF-batched per-post injection
1108
  const pendingPosts = new Set()
1109
  let rafScheduled = false
1110
 
 
1122
  }
1123
  }
1124
 
1125
+ const observer = new MutationObserver(() => {
1126
+ if (PLATFORM === 'facebook') {
1127
+ // Just re-scan the whole document for new hide-post buttons
1128
+ scheduleFacebookScan()
1129
+ return
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1130
  }
1131
+ // Twitter / news: find posts inside mutated subtrees
1132
+ const posts = findPosts(document.body)
1133
+ for (const post of posts) scheduleProcess(post)
1134
  })
1135
 
1136
  // ── Initialization ────────────────────────────────────────────────────────
 
1139
  log(`Initializing on ${PLATFORM} (${window.location.hostname})`)
1140
 
1141
  // Check autoScan setting β€” controls whether buttons are shown at all
1142
+ // Use a short timeout so we don't block if background worker is asleep
1143
+ let response = { autoScan: true }
1144
  try {
1145
+ response = await Promise.race([
1146
+ new Promise((resolve) => {
1147
+ chrome.runtime.sendMessage({ type: 'GET_SETTINGS' }, (r) => {
1148
+ if (chrome.runtime.lastError) resolve({ autoScan: true })
1149
+ else resolve(r ?? { autoScan: true })
1150
+ })
1151
+ }),
1152
+ new Promise((resolve) => setTimeout(() => resolve({ autoScan: true }), 1500)),
1153
+ ])
 
1154
  } catch {
1155
  response = { autoScan: true }
1156
  }
1157
 
1158
  log('Settings:', response)
1159
  if (response?.autoScan === false) {
1160
+ log('Auto-scan disabled β€” no verify buttons will be shown')
1161
  return
1162
  }
1163
 
1164
+ if (PLATFORM === 'facebook') {
1165
+ // Initial scan + watch for new posts via infinite scroll
1166
+ addButtonsToFacebookPosts()
1167
+ observer.observe(document.body, { childList: true, subtree: true })
1168
+ log('Facebook mode: watching for new posts via hide-post button anchor')
1169
+ } else {
1170
+ // Twitter / news sites: selector-based
1171
+ const existing = findPosts(document.body)
1172
+ log(`Found ${existing.length} existing posts`)
1173
+ for (const post of existing) scheduleProcess(post)
1174
+ observer.observe(document.body, { childList: true, subtree: true })
1175
+ log('MutationObserver started')
1176
+ // News article pages: also show auto-verify banner at top of page
1177
+ if (PLATFORM === 'news') autoVerifyPage()
1178
+ }
1179
  }
1180
 
1181
  init()
1182
 
1183
+ // ── SPA navigation listener ───────────────────────────────────────────────
1184
+ // Facebook is a single-page app. background.js fires RE_SCAN_POSTS whenever
1185
+ // it detects a pushState navigation on facebook.com via webNavigation API.
1186
+ // This ensures profile pages, group pages, etc. get scanned after navigation.
1187
+ chrome.runtime.onMessage.addListener((msg) => {
1188
+ if (msg.action === 'RE_SCAN_POSTS') {
1189
+ log('SPA navigation detected, re-scanning for posts...')
1190
+ // Small delay to let Facebook finish rendering the new page content
1191
+ setTimeout(addButtonsToFacebookPosts, 500)
1192
+ }
1193
+ })
1194
+
1195
  // ── Auto-verify news article pages (non-social) ────────────────────────────
1196
  // When the content script runs on a PH news site (not the homepage),
1197
  // it auto-verifies the current URL and injects a floating verdict banner.
 
1200
  const url = window.location.href
1201
  const path = new URL(url).pathname
1202
  // Skip homepages and section indexes (very short paths like / or /news)
1203
+ if (!path || path.length < 5 || path.split('/').filter(Boolean).length < 1) return
1204
 
1205
  const banner = document.createElement('div')
1206
  banner.id = 'pv-auto-banner'
 
1273
  try {
1274
  const response = await new Promise((resolve, reject) => {
1275
  chrome.runtime.sendMessage({ type: 'VERIFY_URL', url }, (resp) => {
1276
+ if (chrome.runtime.lastError) {
1277
+ const msg = chrome.runtime.lastError.message ?? ''
1278
+ reject(new Error(
1279
+ msg.includes('Extension context invalidated')
1280
+ ? 'Extension was reloaded β€” please refresh the page to re-activate PhilVerify.'
1281
+ : msg
1282
+ ))
1283
+ }
1284
  else if (!resp?.ok) reject(new Error(resp?.error ?? 'Unknown error'))
1285
  else resolve(resp.result)
1286
  })
extension/manifest.json CHANGED
@@ -8,7 +8,9 @@
8
  "storage",
9
  "activeTab",
10
  "scripting",
11
- "sidePanel"
 
 
12
  ],
13
 
14
  "side_panel": {
@@ -18,8 +20,10 @@
18
  "host_permissions": [
19
  "https://www.facebook.com/*",
20
  "https://facebook.com/*",
 
21
  "https://x.com/*",
22
  "https://twitter.com/*",
 
23
  "https://philverify.web.app/*",
24
  "http://localhost:8000/*"
25
  ],
 
8
  "storage",
9
  "activeTab",
10
  "scripting",
11
+ "sidePanel",
12
+ "tabs",
13
+ "webNavigation"
14
  ],
15
 
16
  "side_panel": {
 
20
  "host_permissions": [
21
  "https://www.facebook.com/*",
22
  "https://facebook.com/*",
23
+ "https://*.fbcdn.net/*",
24
  "https://x.com/*",
25
  "https://twitter.com/*",
26
+ "https://pbs.twimg.com/*",
27
  "https://philverify.web.app/*",
28
  "http://localhost:8000/*"
29
  ],
extension/popup.html CHANGED
@@ -142,19 +142,6 @@
142
  .btn-verify:focus-visible { outline: 2px solid var(--accent-cyan); outline-offset: 2px; }
143
 
144
  /* ── Result card ─────────────────────────────────── */
145
- .result {
146
- margin-top: 10px;
147
- padding: 10px 12px;
148
- background: var(--bg-surface);
149
- border: 1px solid var(--border);
150
- border-radius: 3px;
151
- }
152
- .result-verdict {
153
- font-size: 15px;
154
- font-weight: 800;
155
- letter-spacing: -0.01em;
156
- margin-bottom: 4px;
157
- }
158
  .result-score {
159
  font-size: 10px;
160
  color: var(--text-muted);
@@ -368,6 +355,94 @@
368
  margin-top: 6px;
369
  height: 14px;
370
  }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
371
  </style>
372
  </head>
373
  <body>
 
142
  .btn-verify:focus-visible { outline: 2px solid var(--accent-cyan); outline-offset: 2px; }
143
 
144
  /* ── Result card ─────────────────────────────────── */
 
 
 
 
 
 
 
 
 
 
 
 
 
145
  .result-score {
146
  font-size: 10px;
147
  color: var(--text-muted);
 
355
  margin-top: 6px;
356
  height: 14px;
357
  }
358
+
359
+ /* ── Result card – spine layout ──────────────────── */
360
+ .result {
361
+ margin-top: 10px;
362
+ padding: 0;
363
+ background: var(--bg-surface);
364
+ border: 1px solid var(--border);
365
+ border-radius: 3px;
366
+ overflow: hidden;
367
+ }
368
+ .result-body {
369
+ padding: 10px 12px 0;
370
+ }
371
+ .result-top {
372
+ display: flex;
373
+ justify-content: space-between;
374
+ align-items: baseline;
375
+ margin-bottom: 6px;
376
+ }
377
+ .result-verdict {
378
+ font-size: 20px;
379
+ font-weight: 800;
380
+ letter-spacing: -0.01em;
381
+ }
382
+ .result-score {
383
+ font-size: 10px;
384
+ color: var(--text-muted);
385
+ font-family: var(--font-mono);
386
+ }
387
+ .result-hairline {
388
+ height: 1px;
389
+ opacity: 0.3;
390
+ margin-bottom: 8px;
391
+ }
392
+ .result-chips {
393
+ display: flex;
394
+ flex-wrap: wrap;
395
+ gap: 3px;
396
+ }
397
+ .result-chip {
398
+ padding: 2px 6px;
399
+ background: rgba(0,0,0,0.4);
400
+ border: 1px solid;
401
+ border-radius: 2px;
402
+ font-size: 9px;
403
+ font-family: var(--font-mono);
404
+ letter-spacing: 0.03em;
405
+ }
406
+ .result-meta-footer {
407
+ display: flex;
408
+ align-items: center;
409
+ gap: 5px;
410
+ padding: 6px 12px;
411
+ border-top: 1px solid var(--border);
412
+ margin-top: 8px;
413
+ }
414
+ .result-meta-label {
415
+ font-size: 8px;
416
+ font-weight: 700;
417
+ letter-spacing: 0.1em;
418
+ color: var(--text-muted);
419
+ text-transform: uppercase;
420
+ }
421
+ .result-meta-val {
422
+ font-size: 9px;
423
+ font-family: var(--font-mono);
424
+ color: #6b7280;
425
+ }
426
+ .result-meta-sep {
427
+ color: var(--border);
428
+ font-size: 10px;
429
+ }
430
+
431
+ /* ── History – spine + hover ──────────────────────── */
432
+ .history-item:hover { background: #1a1a1a; }
433
+ .history-model {
434
+ margin-left: auto;
435
+ font-size: 8px;
436
+ font-family: var(--font-mono);
437
+ color: #6b7280;
438
+ }
439
+
440
+ /* ── Empty state icon ─────────────────────────────── */
441
+ .state-empty-icon {
442
+ display: block;
443
+ margin: 0 auto 8px;
444
+ opacity: 0.25;
445
+ }
446
  </style>
447
  </head>
448
  <body>
extension/popup.js CHANGED
@@ -33,8 +33,11 @@ function safeUrl(url) {
33
  } catch { return '#' }
34
  }
35
  function msg(obj) {
36
- return new Promise(resolve => {
37
- chrome.runtime.sendMessage(obj, resolve)
 
 
 
38
  })
39
  }
40
 
@@ -57,39 +60,60 @@ function isUrl(s) {
57
  function renderResult(result, container) {
58
  const color = VERDICT_COLORS[result.verdict] ?? '#5c554e'
59
  const topSource = result.layer2?.sources?.[0]
 
 
 
 
60
 
61
  container.innerHTML = `
62
- <div class="result" role="status" aria-live="polite">
63
- <div class="result-verdict" style="color:${color}">${safeText(result.verdict)}</div>
64
- <div class="result-score">${Math.round(result.final_score)}% credibility${result._fromCache ? ' (cached)' : ''}</div>
65
- <div class="result-row">
66
- <span class="result-label">Language</span>
67
- <span class="result-val">${safeText(result.language ?? 'β€”')}</span>
68
- </div>
69
- <div class="result-row">
70
- <span class="result-label">Confidence</span>
71
- <span class="result-val" style="color:${color}">${result.confidence?.toFixed(1)}%</span>
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
72
  </div>
73
- ${result.layer1?.triggered_features?.length ? `
74
- <div class="result-row">
75
- <span class="result-label">Signals</span>
76
- <span class="result-val">${result.layer1.triggered_features.slice(0, 3).map(safeText).join(', ')}</span>
 
77
  </div>` : ''}
78
- ${topSource ? `
79
- <div class="result-source">
80
- <div class="result-label" style="margin-bottom:4px;">Top Source</div>
81
- <a href="${safeUrl(topSource.url)}" target="_blank" rel="noreferrer">${safeText(topSource.title?.slice(0, 55) ?? topSource.source_name ?? 'View')} β†—</a>
82
- </div>` : ''}
83
- <a class="open-full" href="https://philverify.web.app" target="_blank" rel="noreferrer">
84
- Open Full Dashboard β†—
85
- </a>
86
  </div>
87
  `
88
  }
89
 
90
  function renderHistory(entries, container) {
91
  if (!entries.length) {
92
- container.innerHTML = '<div class="state-empty">No verifications yet.</div>'
 
 
 
 
 
 
93
  return
94
  }
95
  container.innerHTML = `
@@ -97,10 +121,11 @@ function renderHistory(entries, container) {
97
  ${entries.map(e => {
98
  const color = VERDICT_COLORS[e.verdict] ?? '#5c554e'
99
  return `
100
- <li class="history-item" role="listitem">
101
  <div class="history-item-top">
102
  <span class="history-verdict" style="background:${color}22;color:${color};border:1px solid ${color}4d;">${safeText(e.verdict)}</span>
103
  <span class="history-score">${Math.round(e.final_score)}%</span>
 
104
  </div>
105
  <div class="history-preview">${safeText(e.text_preview || 'β€”')}</div>
106
  <div class="history-time">${timeAgo(e.timestamp)}</div>
@@ -221,19 +246,19 @@ async function checkApiStatus() {
221
  const dot = document.getElementById('api-status-dot')
222
  const label = document.getElementById('api-status-label')
223
  try {
224
- const { apiBase } = await msg({ type: 'GET_SETTINGS' })
225
- const res = await fetch(`${apiBase ?? 'http://localhost:8000'}/health`, { signal: AbortSignal.timeout(3000) })
226
- if (res.ok) {
227
- dot.style.background = 'var(--credible)'
228
- label.style.color = 'var(--credible)'
229
- label.textContent = 'ONLINE'
230
  } else {
231
- throw new Error(`${res.status}`)
232
  }
233
  } catch {
234
- dot.style.background = 'var(--fake)'
235
- label.style.color = 'var(--fake)'
236
- label.textContent = 'OFFLINE'
237
  }
238
  }
239
 
 
33
  } catch { return '#' }
34
  }
35
// Promise wrapper around chrome.runtime.sendMessage.
// Rejects with the runtime error (e.g. "Extension context invalidated")
// so callers can distinguish transport failures from real responses.
function msg(obj) {
  return new Promise((resolve, reject) => {
    chrome.runtime.sendMessage(obj, (resp) => {
      const err = chrome.runtime.lastError
      if (err) {
        reject(new Error(err.message))
      } else {
        resolve(resp)
      }
    })
  })
}
43
 
 
60
// Render the verification result card into `container`.
// Layout: verdict/score header, colored hairline, language + confidence rows,
// up to three signal chips, an optional top-source link, and a model/claim
// metadata footer shown only when either field is present.
function renderResult(result, container) {
  const tone = VERDICT_COLORS[result.verdict] ?? '#5c554e'
  const primary = result.layer2?.sources?.[0]
  const signals = result.layer1?.triggered_features ?? []
  const tier = result.layer1?.model_tier
  const method = result.layer2?.claim_method
  const showMeta = tier || method

  container.innerHTML = `
    <div class="result" role="status" aria-live="polite" style="border-left:3px solid ${tone}">
      <div class="result-body">
        <div class="result-top">
          <div class="result-verdict" style="color:${tone}">${safeText(result.verdict)}</div>
          <div class="result-score">${Math.round(result.final_score)}%${result._fromCache ? ' Β· cached' : ''}</div>
        </div>
        <div class="result-hairline" style="background:${tone}"></div>
        <div class="result-row">
          <span class="result-label">Language</span>
          <span class="result-val">${safeText(result.language ?? 'β€”')}</span>
        </div>
        <div class="result-row">
          <span class="result-label">Confidence</span>
          <span class="result-val" style="color:${tone}">${result.confidence?.toFixed(1)}%</span>
        </div>
        ${signals.length ? `
        <div class="result-row">
          <span class="result-label">Signals</span>
          <span class="result-chips">${signals.slice(0, 3).map(feat => `<span class="result-chip" style="border-color:${tone}55;color:${tone}">${safeText(feat)}</span>`).join('')}</span>
        </div>` : ''}
        ${primary ? `
        <div class="result-source">
          <div class="result-label" style="margin-bottom:4px;">Top Source</div>
          <a href="${safeUrl(primary.url)}" target="_blank" rel="noreferrer">${safeText(primary.title?.slice(0, 55) ?? primary.source_name ?? 'View')} β†—</a>
        </div>` : ''}
        <a class="open-full" href="https://philverify.web.app" target="_blank" rel="noreferrer">
          Open Full Dashboard β†—
        </a>
      </div>
      ${showMeta ? `
      <div class="result-meta-footer">
        ${tier ? `<span class="result-meta-label">MODEL</span><span class="result-meta-val">${safeText(tier)}</span>` : ''}
        ${tier && method ? '<span class="result-meta-sep">Β·</span>' : ''}
        ${method ? `<span class="result-meta-label">VIA</span><span class="result-meta-val">${safeText(method)}</span>` : ''}
      </div>` : ''}
    </div>
  `
}
107
 
108
  function renderHistory(entries, container) {
109
  if (!entries.length) {
110
+ container.innerHTML = `
111
+ <div class="state-empty">
112
+ <svg class="state-empty-icon" width="32" height="32" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="1.5" aria-hidden="true">
113
+ <path d="M12 22s8-4 8-10V5l-8-3-8 3v7c0 6 8 10 8 10z"/>
114
+ </svg>
115
+ No verifications yet.
116
+ </div>`
117
  return
118
  }
119
  container.innerHTML = `
 
121
  ${entries.map(e => {
122
  const color = VERDICT_COLORS[e.verdict] ?? '#5c554e'
123
  return `
124
+ <li class="history-item" role="listitem" style="border-left:2px solid ${color}">
125
  <div class="history-item-top">
126
  <span class="history-verdict" style="background:${color}22;color:${color};border:1px solid ${color}4d;">${safeText(e.verdict)}</span>
127
  <span class="history-score">${Math.round(e.final_score)}%</span>
128
+ ${e.model_tier ? `<span class="history-model">${safeText(e.model_tier)}</span>` : ''}
129
  </div>
130
  <div class="history-preview">${safeText(e.text_preview || 'β€”')}</div>
131
  <div class="history-time">${timeAgo(e.timestamp)}</div>
 
246
  const dot = document.getElementById('api-status-dot')
247
  const label = document.getElementById('api-status-label')
248
  try {
249
+ // Route through the service worker so the fetch uses the correct host_permissions
250
+ const resp = await msg({ type: 'CHECK_HEALTH' })
251
+ if (resp?.ok) {
252
+ dot.style.background = 'var(--credible)'
253
+ label.style.color = 'var(--credible)'
254
+ label.textContent = 'ONLINE'
255
  } else {
256
+ throw new Error(resp?.error ?? `HTTP ${resp?.status}`)
257
  }
258
  } catch {
259
+ dot.style.background = 'var(--fake)'
260
+ label.style.color = 'var(--fake)'
261
+ label.textContent = 'OFFLINE'
262
  }
263
  }
264
 
firebase.json CHANGED
@@ -1,5 +1,7 @@
1
  {
2
  "firestore": {
 
 
3
  "rules": "firestore.rules",
4
  "indexes": "firestore.indexes.json"
5
  },
@@ -34,5 +36,10 @@
34
  ]
35
  }
36
  ]
 
 
 
 
 
37
  }
38
- }
 
1
  {
2
  "firestore": {
3
+ "database": "(default)",
4
+ "location": "asia-southeast1",
5
  "rules": "firestore.rules",
6
  "indexes": "firestore.indexes.json"
7
  },
 
36
  ]
37
  }
38
  ]
39
+ },
40
+ "auth": {
41
+ "providers": {
42
+ "emailPassword": true
43
+ }
44
  }
45
+ }
firestore.indexes.json CHANGED
@@ -1,13 +1,51 @@
1
  {
2
- "indexes": [
3
- {
4
- "collectionGroup": "verifications",
5
- "queryScope": "COLLECTION",
6
- "fields": [
7
- { "fieldPath": "verdict", "order": "ASCENDING" },
8
- { "fieldPath": "timestamp", "order": "DESCENDING" }
9
- ]
10
- }
11
- ],
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
12
  "fieldOverrides": []
13
- }
 
1
  {
2
+ // Example (Standard Edition):
3
+ //
4
+ // "indexes": [
5
+ // {
6
+ // "collectionGroup": "widgets",
7
+ // "queryScope": "COLLECTION",
8
+ // "fields": [
9
+ // { "fieldPath": "foo", "arrayConfig": "CONTAINS" },
10
+ // { "fieldPath": "bar", "mode": "DESCENDING" }
11
+ // ]
12
+ // },
13
+ //
14
+ // "fieldOverrides": [
15
+ // {
16
+ // "collectionGroup": "widgets",
17
+ // "fieldPath": "baz",
18
+ // "indexes": [
19
+ // { "order": "ASCENDING", "queryScope": "COLLECTION" }
20
+ // ]
21
+ // },
22
+ // ]
23
+ // ]
24
+ //
25
+ // Example (Enterprise Edition):
26
+ //
27
+ // "indexes": [
28
+ // {
29
+ // "collectionGroup": "reviews",
30
+ // "queryScope": "COLLECTION_GROUP",
31
+ // "apiScope": "MONGODB_COMPATIBLE_API",
32
+ // "density": "DENSE",
33
+ // "multikey": false,
34
+ // "fields": [
35
+ // { "fieldPath": "baz", "mode": "ASCENDING" }
36
+ // ]
37
+ // },
38
+ // {
39
+ // "collectionGroup": "items",
40
+ // "queryScope": "COLLECTION_GROUP",
41
+ // "apiScope": "MONGODB_COMPATIBLE_API",
42
+ // "density": "SPARSE_ANY",
43
+ // "multikey": true,
44
+ // "fields": [
45
+ // { "fieldPath": "baz", "mode": "ASCENDING" }
46
+ // ]
47
+ // },
48
+ // ]
49
+ "indexes": [],
50
  "fieldOverrides": []
51
+ }
firestore.rules CHANGED
@@ -1,9 +1,18 @@
1
- rules_version = '2';
 
2
  service cloud.firestore {
3
  match /databases/{database}/documents {
4
- match /verifications/{docId} {
5
- allow read: if true;
6
- allow write: if false;
 
 
 
 
 
 
 
 
7
  }
8
  }
9
- }
 
1
+ rules_version='2'
2
+
3
  service cloud.firestore {
4
  match /databases/{database}/documents {
5
+ match /{document=**} {
6
+ // This rule allows anyone with your database reference to view, edit,
7
+ // and delete all data in your database. It is useful for getting
8
+ // started, but it is configured to expire after 30 days because it
9
+ // leaves your app open to attackers. At that time, all client
10
+ // requests to your database will be denied.
11
+ //
12
+ // Make sure to write security rules for your app before that time, or
13
+ // else all client requests to your database will be denied until you
14
+ // update your rules.
15
+ allow read, write: if request.time < timestamp.date(2026, 4, 14);
16
  }
17
  }
18
+ }
frontend/src/App.jsx CHANGED
@@ -4,6 +4,7 @@ import LandingPage from './pages/LandingPage.jsx'
4
  import VerifyPage from './pages/VerifyPage.jsx'
5
  import HistoryPage from './pages/HistoryPage.jsx'
6
  import TrendsPage from './pages/TrendsPage.jsx'
 
7
 
8
  /** Shared horizontal constraint β€” all pages + navbar use this */
9
  export const PAGE_MAX_W = 960
@@ -47,6 +48,7 @@ export default function App() {
47
  <Route path="/verify" element={<VerifyPage />} />
48
  <Route path="/history" element={<HistoryPage />} />
49
  <Route path="/trends" element={<TrendsPage />} />
 
50
  </Routes>
51
  </div>
52
  </div>
 
4
  import VerifyPage from './pages/VerifyPage.jsx'
5
  import HistoryPage from './pages/HistoryPage.jsx'
6
  import TrendsPage from './pages/TrendsPage.jsx'
7
+ import BenchmarksPage from './pages/BenchmarksPage.jsx'
8
 
9
  /** Shared horizontal constraint β€” all pages + navbar use this */
10
  export const PAGE_MAX_W = 960
 
48
  <Route path="/verify" element={<VerifyPage />} />
49
  <Route path="/history" element={<HistoryPage />} />
50
  <Route path="/trends" element={<TrendsPage />} />
51
+ <Route path="/benchmarks" element={<BenchmarksPage />} />
52
  </Routes>
53
  </div>
54
  </div>
frontend/src/components/Navbar.jsx CHANGED
@@ -1,5 +1,5 @@
1
  import { NavLink, Link } from 'react-router-dom'
2
- import { Radar, Clock, TrendingUp, ShieldCheck, Home } from 'lucide-react'
3
  import { PAGE_STYLE } from '../App.jsx'
4
 
5
  const NAV_LINKS = [
@@ -7,6 +7,7 @@ const NAV_LINKS = [
7
  { to: '/verify', icon: ShieldCheck, label: 'Verify' },
8
  { to: '/history', icon: Clock, label: 'History' },
9
  { to: '/trends', icon: TrendingUp, label: 'Trends' },
 
10
  ]
11
 
12
  export default function Navbar() {
 
1
  import { NavLink, Link } from 'react-router-dom'
2
+ import { Radar, Clock, TrendingUp, ShieldCheck, Home, BarChart2 } from 'lucide-react'
3
  import { PAGE_STYLE } from '../App.jsx'
4
 
5
  const NAV_LINKS = [
 
7
  { to: '/verify', icon: ShieldCheck, label: 'Verify' },
8
  { to: '/history', icon: Clock, label: 'History' },
9
  { to: '/trends', icon: TrendingUp, label: 'Trends' },
10
+ { to: '/benchmarks', icon: BarChart2, label: 'Benchmarks' },
11
  ]
12
 
13
  export default function Navbar() {
frontend/src/pages/BenchmarksPage.jsx ADDED
@@ -0,0 +1,400 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import { useState } from 'react'
2
+ import {
3
+ BarChart, Bar, XAxis, YAxis, CartesianGrid, Tooltip,
4
+ ResponsiveContainer, Cell, ReferenceLine,
5
+ } from 'recharts'
6
+ import { PAGE_STYLE } from '../App.jsx'
7
+
8
+ // ── Eval results (from python -m ml.eval, seed=42, 79 train / 21 val) ─────────
9
+ const MODELS = [
10
+ {
11
+ name: 'BoW + LogReg',
12
+ shortName: 'BoW+LR',
13
+ accuracy: 52.4,
14
+ tier: 'classical',
15
+ lecture: 'Lecture 3',
16
+ note: 'CountVectorizer loses TF weighting β€” raw counts hurt precision on short headlines',
17
+ },
18
+ {
19
+ name: 'BoW + LogReg + Lemma',
20
+ shortName: 'BoW+LR+L',
21
+ accuracy: 52.4,
22
+ tier: 'classical',
23
+ lecture: 'Lectures 2–3',
24
+ note: 'No change from non-lemmatized β€” WordNet is English-biased; Tagalog tokens unchanged',
25
+ },
26
+ {
27
+ name: 'TF-IDF + LogReg',
28
+ shortName: 'TFIDF+LR',
29
+ accuracy: 61.9,
30
+ tier: 'classical',
31
+ lecture: 'Lecture 3',
32
+ note: 'Sublinear TF weighting reduces dominance of high-frequency terms; best classical model',
33
+ },
34
+ {
35
+ name: 'TF-IDF + NB',
36
+ shortName: 'TFIDF+NB',
37
+ accuracy: 42.9,
38
+ tier: 'classical',
39
+ lecture: 'Lectures 5–6',
40
+ note: 'Feature independence assumption breaks on 79 samples; noisy probability estimates',
41
+ },
42
+ {
43
+ name: 'TF-IDF + NB + Lemma',
44
+ shortName: 'NB+Lemma',
45
+ accuracy: 42.9,
46
+ tier: 'classical',
47
+ lecture: 'Lectures 2, 5–6',
48
+ note: 'Lemmatization again neutral β€” confirms English-biased lemmatizer finding',
49
+ },
50
+ {
51
+ name: 'LDA + LogReg',
52
+ shortName: 'LDA+LR',
53
+ accuracy: 42.9,
54
+ tier: 'classical',
55
+ lecture: 'Lecture 7',
56
+ note: '5 topics over 79 documents is too few for stable topic distributions',
57
+ },
58
+ {
59
+ name: 'XLM-RoBERTa',
60
+ shortName: 'XLM-R',
61
+ accuracy: 90.5,
62
+ tier: 'transformer',
63
+ lecture: 'Transfer Learning',
64
+ note: 'Pretrained on 100+ languages including Filipino; fine-tuned on combined dataset',
65
+ },
66
+ {
67
+ name: 'Tagalog-RoBERTa',
68
+ shortName: 'TL-R',
69
+ accuracy: 95.2,
70
+ tier: 'transformer',
71
+ lecture: 'Transfer Learning',
72
+ note: 'Pretrained on TLUnified Filipino corpus; higher recall on Tagalog/Taglish posts',
73
+ },
74
+ {
75
+ name: 'Ensemble',
76
+ shortName: 'Ensemble',
77
+ accuracy: 100.0,
78
+ tier: 'ensemble',
79
+ lecture: 'Ensemble Methods',
80
+ note: 'Soft-vote average of XLM-R + Tagalog-RoBERTa logits; 100% on 21-sample holdout',
81
+ },
82
+ ]
83
+
84
+ const TIER_COLOR = {
85
+ classical: '#d97706', // gold
86
+ transformer: '#06b6d4', // cyan
87
+ ensemble: '#16a34a', // green
88
+ }
89
+
90
+ const TIER_LABEL = {
91
+ classical: 'Classical ML',
92
+ transformer: 'Transformer',
93
+ ensemble: 'Ensemble',
94
+ }
95
+
96
+ const FINDINGS = [
97
+ {
98
+ lecture: 'Lecture 3',
99
+ title: 'TF-IDF > Bag of Words',
100
+ body: 'TF-IDF sublinear weighting outperforms raw BoW counts by +9.5%. Down-weighting high-frequency filler terms matters for short Filipino news headlines.',
101
+ color: '#d97706',
102
+ },
103
+ {
104
+ lecture: 'Lectures 5–6',
105
+ title: 'Naive Bayes struggles at small scale',
106
+ body: 'MultinomialNB reaches only 42.9% β€” 19pp below LogReg. Feature independence breaks down when training on 79 noisy, cross-lingual samples.',
107
+ color: '#d97706',
108
+ },
109
+ {
110
+ lecture: 'Lecture 7',
111
+ title: 'LDA needs more documents',
112
+ body: '5 topics over 79 training texts yields unstable distributions. Topic features are weak signal for 3-class classification; LDA would improve with 1000+ samples.',
113
+ color: '#d97706',
114
+ },
115
+ {
116
+ lecture: 'Lectures 2a–2c',
117
+ title: 'Lemmatization: neutral on Tagalog',
118
+ body: 'Zero accuracy change with WordNet lemmatization. English-biased lemmatizers return Tagalog tokens unchanged β€” confirms the tool is a no-op on Filipino text.',
119
+ color: '#06b6d4',
120
+ },
121
+ ]
122
+
123
+ // ── Custom tooltip ─────────────────────────────────────────────────────────────
124
+ function ChartTooltip({ active, payload }) {
125
+ if (!active || !payload?.length) return null
126
+ const d = payload[0].payload
127
+ return (
128
+ <div style={{
129
+ background: 'var(--bg-elevated)',
130
+ border: '1px solid var(--border-light)',
131
+ borderRadius: 4,
132
+ padding: '10px 14px',
133
+ fontFamily: 'var(--font-mono)',
134
+ fontSize: 11,
135
+ color: 'var(--text-primary)',
136
+ maxWidth: 240,
137
+ }}>
138
+ <div style={{ fontWeight: 700, marginBottom: 4 }}>{d.name}</div>
139
+ <div style={{ color: TIER_COLOR[d.tier], marginBottom: 6 }}>
140
+ {d.accuracy.toFixed(1)}% accuracy
141
+ </div>
142
+ <div style={{ color: 'var(--text-muted)', fontSize: 10, lineHeight: 1.5 }}>{d.note}</div>
143
+ </div>
144
+ )
145
+ }
146
+
147
+ // ── Tier legend pill ───────────────────────────────────────────────────────────
148
+ function TierPill({ tier }) {
149
+ return (
150
+ <span style={{
151
+ display: 'inline-block',
152
+ padding: '2px 8px',
153
+ borderRadius: 2,
154
+ fontSize: 9,
155
+ fontFamily: 'var(--font-mono)',
156
+ fontWeight: 700,
157
+ letterSpacing: '0.06em',
158
+ textTransform: 'uppercase',
159
+ background: `${TIER_COLOR[tier]}18`,
160
+ color: TIER_COLOR[tier],
161
+ border: `1px solid ${TIER_COLOR[tier]}40`,
162
+ }}>
163
+ {TIER_LABEL[tier]}
164
+ </span>
165
+ )
166
+ }
167
+
168
+ export default function BenchmarksPage() {
169
+ const [activeRow, setActiveRow] = useState(null)
170
+
171
+ return (
172
+ <main style={{ ...PAGE_STYLE, paddingTop: 48, paddingBottom: 80 }}>
173
+
174
+ {/* ── Header ─────────────────────────────────────────────────────────── */}
175
+ <div className="fade-up-1" style={{ marginBottom: 40 }}>
176
+ <div style={{
177
+ fontFamily: 'var(--font-mono)',
178
+ fontSize: 10,
179
+ letterSpacing: '0.14em',
180
+ color: 'var(--accent-red)',
181
+ textTransform: 'uppercase',
182
+ marginBottom: 10,
183
+ }}>
184
+ ML Course β€” Model Comparison
185
+ </div>
186
+ <h1 style={{
187
+ fontFamily: 'var(--font-display)',
188
+ fontWeight: 800,
189
+ fontSize: 32,
190
+ letterSpacing: '-0.02em',
191
+ color: 'var(--text-primary)',
192
+ marginBottom: 12,
193
+ }}>
194
+ Model Benchmarks
195
+ </h1>
196
+ <p style={{
197
+ fontFamily: 'var(--font-body)',
198
+ fontSize: 14,
199
+ color: 'var(--text-secondary)',
200
+ lineHeight: 1.7,
201
+ maxWidth: 560,
202
+ }}>
203
+ Comparison of 9 classifier variants on a 21-sample holdout from the
204
+ handcrafted PhilVerify dataset (79 train / 21 val, seed 42). Classical
205
+ models trained in-session; transformer checkpoints fine-tuned on the
206
+ full combined dataset.
207
+ </p>
208
+ </div>
209
+
210
+ {/* ── Key findings ───────────────────────────────────────────────────── */}
211
+ <div className="fade-up-2" style={{ marginBottom: 48 }}>
212
+ <h2 style={{
213
+ fontFamily: 'var(--font-display)',
214
+ fontWeight: 700,
215
+ fontSize: 11,
216
+ letterSpacing: '0.12em',
217
+ textTransform: 'uppercase',
218
+ color: 'var(--text-muted)',
219
+ marginBottom: 16,
220
+ }}>
221
+ Key Findings
222
+ </h2>
223
+ <div style={{ display: 'grid', gridTemplateColumns: 'repeat(auto-fit, minmax(210px, 1fr))', gap: 12 }}>
224
+ {FINDINGS.map((f) => (
225
+ <div key={f.title} className="card" style={{ padding: '16px 18px' }}>
226
+ <div style={{
227
+ fontFamily: 'var(--font-mono)',
228
+ fontSize: 9,
229
+ letterSpacing: '0.1em',
230
+ textTransform: 'uppercase',
231
+ color: f.color,
232
+ marginBottom: 6,
233
+ }}>
234
+ {f.lecture}
235
+ </div>
236
+ <div style={{
237
+ fontFamily: 'var(--font-display)',
238
+ fontWeight: 700,
239
+ fontSize: 13,
240
+ color: 'var(--text-primary)',
241
+ marginBottom: 8,
242
+ lineHeight: 1.3,
243
+ }}>
244
+ {f.title}
245
+ </div>
246
+ <p style={{
247
+ fontFamily: 'var(--font-body)',
248
+ fontSize: 11,
249
+ color: 'var(--text-secondary)',
250
+ lineHeight: 1.6,
251
+ margin: 0,
252
+ }}>
253
+ {f.body}
254
+ </p>
255
+ </div>
256
+ ))}
257
+ </div>
258
+ </div>
259
+
260
+ {/* ── Bar chart ──────────────────────────────────────────────────────── */}
261
+ <div className="fade-up-3 card" style={{ padding: '24px 20px', marginBottom: 32 }}>
262
+ <div style={{ display: 'flex', alignItems: 'center', justifyContent: 'space-between', marginBottom: 20 }}>
263
+ <h2 style={{
264
+ fontFamily: 'var(--font-display)',
265
+ fontWeight: 700,
266
+ fontSize: 13,
267
+ letterSpacing: '0.06em',
268
+ color: 'var(--text-primary)',
269
+ margin: 0,
270
+ }}>
271
+ Accuracy by Model
272
+ </h2>
273
+ <div style={{ display: 'flex', gap: 12 }}>
274
+ {Object.entries(TIER_LABEL).map(([tier, label]) => (
275
+ <div key={tier} style={{ display: 'flex', alignItems: 'center', gap: 5 }}>
276
+ <span style={{ width: 8, height: 8, borderRadius: 2, background: TIER_COLOR[tier], display: 'inline-block' }} />
277
+ <span style={{ fontFamily: 'var(--font-mono)', fontSize: 9, color: 'var(--text-muted)', letterSpacing: '0.06em' }}>
278
+ {label.toUpperCase()}
279
+ </span>
280
+ </div>
281
+ ))}
282
+ </div>
283
+ </div>
284
+ <ResponsiveContainer width="100%" height={280}>
285
+ <BarChart
286
+ data={MODELS}
287
+ layout="vertical"
288
+ margin={{ top: 0, right: 40, left: 8, bottom: 0 }}
289
+ >
290
+ <CartesianGrid horizontal={false} stroke="rgba(245,240,232,0.04)" />
291
+ <XAxis
292
+ type="number"
293
+ domain={[0, 100]}
294
+ tickFormatter={v => `${v}%`}
295
+ tick={{ fontSize: 9, fontFamily: 'var(--font-mono)', fill: 'var(--text-muted)' }}
296
+ tickLine={false}
297
+ axisLine={false}
298
+ />
299
+ <YAxis
300
+ type="category"
301
+ dataKey="shortName"
302
+ width={72}
303
+ tick={{ fontSize: 9, fontFamily: 'var(--font-mono)', fill: 'var(--text-secondary)' }}
304
+ tickLine={false}
305
+ axisLine={false}
306
+ />
307
+ <Tooltip content={<ChartTooltip />} cursor={{ fill: 'rgba(245,240,232,0.03)' }} />
308
+ <ReferenceLine x={61.9} stroke="rgba(217,119,6,0.3)" strokeDasharray="3 3" label={{ value: 'Classical ceiling', position: 'top', fontSize: 8, fontFamily: 'var(--font-mono)', fill: '#d97706' }} />
309
+ <Bar dataKey="accuracy" radius={[0, 2, 2, 0]} maxBarSize={20}>
310
+ {MODELS.map((m) => (
311
+ <Cell key={m.name} fill={TIER_COLOR[m.tier]} fillOpacity={activeRow === m.name ? 1 : 0.75} />
312
+ ))}
313
+ </Bar>
314
+ </BarChart>
315
+ </ResponsiveContainer>
316
+ </div>
317
+
318
+ {/* ── Full results table ─────────────────────────────────────────────── */}
319
+ <div className="fade-up-4 card" style={{ overflow: 'hidden' }}>
320
+ <div style={{ padding: '18px 20px 12px', borderBottom: '1px solid var(--border)' }}>
321
+ <h2 style={{
322
+ fontFamily: 'var(--font-display)',
323
+ fontWeight: 700,
324
+ fontSize: 13,
325
+ letterSpacing: '0.06em',
326
+ color: 'var(--text-primary)',
327
+ margin: 0,
328
+ }}>
329
+ Full Results
330
+ </h2>
331
+ </div>
332
+ <table style={{ width: '100%', borderCollapse: 'collapse' }}>
333
+ <thead>
334
+ <tr style={{ borderBottom: '1px solid var(--border)' }}>
335
+ {['Model', 'Accuracy', 'Tier', 'Lecture', 'Note'].map(h => (
336
+ <th key={h} style={{
337
+ padding: '8px 16px',
338
+ textAlign: h === 'Accuracy' ? 'right' : 'left',
339
+ fontFamily: 'var(--font-mono)',
340
+ fontSize: 9,
341
+ fontWeight: 700,
342
+ letterSpacing: '0.1em',
343
+ textTransform: 'uppercase',
344
+ color: 'var(--text-muted)',
345
+ }}>
346
+ {h}
347
+ </th>
348
+ ))}
349
+ </tr>
350
+ </thead>
351
+ <tbody>
352
+ {MODELS.map((m, i) => (
353
+ <tr
354
+ key={m.name}
355
+ onMouseEnter={() => setActiveRow(m.name)}
356
+ onMouseLeave={() => setActiveRow(null)}
357
+ style={{
358
+ borderBottom: i < MODELS.length - 1 ? '1px solid var(--border)' : 'none',
359
+ background: activeRow === m.name ? 'var(--bg-elevated)' : 'transparent',
360
+ transition: 'background 0.1s',
361
+ borderLeft: `3px solid ${activeRow === m.name ? TIER_COLOR[m.tier] : 'transparent'}`,
362
+ }}
363
+ >
364
+ <td style={{ padding: '10px 16px', fontFamily: 'var(--font-display)', fontSize: 12, fontWeight: 600, color: 'var(--text-primary)' }}>
365
+ {m.name}
366
+ </td>
367
+ <td style={{ padding: '10px 16px', textAlign: 'right', fontFamily: 'var(--font-mono)', fontSize: 13, fontWeight: 700, color: TIER_COLOR[m.tier] }}>
368
+ {m.accuracy.toFixed(1)}%
369
+ </td>
370
+ <td style={{ padding: '10px 16px' }}>
371
+ <TierPill tier={m.tier} />
372
+ </td>
373
+ <td style={{ padding: '10px 16px', fontFamily: 'var(--font-mono)', fontSize: 10, color: 'var(--text-muted)' }}>
374
+ {m.lecture}
375
+ </td>
376
+ <td style={{ padding: '10px 16px', fontFamily: 'var(--font-body)', fontSize: 11, color: 'var(--text-secondary)', lineHeight: 1.5, maxWidth: 260 }}>
377
+ {m.note}
378
+ </td>
379
+ </tr>
380
+ ))}
381
+ </tbody>
382
+ </table>
383
+ </div>
384
+
385
+ {/* ── Footer note ────────────────────────────────────────────────────── */}
386
+ <p className="fade-up-5" style={{
387
+ marginTop: 20,
388
+ fontFamily: 'var(--font-mono)',
389
+ fontSize: 10,
390
+ color: 'var(--text-muted)',
391
+ lineHeight: 1.6,
392
+ }}>
393
+ * Val set is 21 samples from a handcrafted 100-sample dataset β€” ensemble 100% reflects
394
+ near-zero variance on a small holdout, not production accuracy. Transformer models were
395
+ trained on the larger combined dataset; classical models trained on the 79-sample split.
396
+ </p>
397
+
398
+ </main>
399
+ )
400
+ }
frontend/src/pages/VerifyPage.jsx CHANGED
@@ -894,6 +894,20 @@ export default function VerifyPage() {
894
  verdict={result.layer1?.verdict}
895
  score={result.layer1?.confidence}
896
  delay={0}>
 
 
 
 
 
 
 
 
 
 
 
 
 
 
897
  <p className="text-xs mt-2" style={{ color: 'var(--text-secondary)', fontFamily: 'var(--font-body)', lineHeight: 1.6 }}>
898
  {mlConfidenceExplanation(result.layer1?.confidence || 0, result.layer1?.verdict)}
899
  </p>
@@ -923,6 +937,11 @@ export default function VerifyPage() {
923
  <p className="text-xs mt-3" style={{ color: 'var(--text-muted)', fontFamily: 'var(--font-body)', lineHeight: 1.6 }}>
924
  <span style={{ color: 'var(--text-secondary)' }}>Claim searched: </span>
925
  "{result.layer2?.claim_used || 'No claim extracted'}"
 
 
 
 
 
926
  </p>
927
  </LayerCard>
928
  </div>
@@ -1002,7 +1021,8 @@ export default function VerifyPage() {
1002
  <span className="text-xs tabular" style={{ color: 'var(--text-muted)' }}>
1003
  {src.source_name || src.source}
1004
  </span>
1005
- <span className="text-xs tabular" style={{ color: stanceColor, fontFamily: 'var(--font-display)', letterSpacing: '0.06em' }}>
 
1006
  {src.stance}
1007
  </span>
1008
  <span className="text-xs tabular" style={{ color: 'var(--text-muted)' }}>
 
894
  verdict={result.layer1?.verdict}
895
  score={result.layer1?.confidence}
896
  delay={0}>
897
+ {result.layer1?.model_tier && (
898
+ <span style={{
899
+ display: 'inline-block', fontSize: '0.62rem', padding: '2px 6px',
900
+ borderRadius: 3, marginTop: 6, marginBottom: 2,
901
+ background: result.layer1.model_tier === 'ensemble' ? 'rgba(217,119,6,0.12)' :
902
+ result.layer1.model_tier === 'xlmr' ? 'rgba(6,182,212,0.12)' : 'rgba(255,255,255,0.06)',
903
+ color: result.layer1.model_tier === 'ensemble' ? 'var(--accent-gold)' :
904
+ result.layer1.model_tier === 'xlmr' ? 'var(--accent-cyan)' : 'var(--text-muted)',
905
+ fontFamily: 'var(--font-mono)', textTransform: 'uppercase', letterSpacing: '0.08em',
906
+ border: '1px solid currentColor', opacity: 0.85,
907
+ }}>
908
+ {result.layer1.model_tier}
909
+ </span>
910
+ )}
911
  <p className="text-xs mt-2" style={{ color: 'var(--text-secondary)', fontFamily: 'var(--font-body)', lineHeight: 1.6 }}>
912
  {mlConfidenceExplanation(result.layer1?.confidence || 0, result.layer1?.verdict)}
913
  </p>
 
937
  <p className="text-xs mt-3" style={{ color: 'var(--text-muted)', fontFamily: 'var(--font-body)', lineHeight: 1.6 }}>
938
  <span style={{ color: 'var(--text-secondary)' }}>Claim searched: </span>
939
  "{result.layer2?.claim_used || 'No claim extracted'}"
940
+ {result.layer2?.claim_method && (
941
+ <span style={{ marginLeft: 6, fontSize: '0.62rem', fontFamily: 'var(--font-mono)', opacity: 0.55 }}>
942
+ [{result.layer2.claim_method}]
943
+ </span>
944
+ )}
945
  </p>
946
  </LayerCard>
947
  </div>
 
1021
  <span className="text-xs tabular" style={{ color: 'var(--text-muted)' }}>
1022
  {src.source_name || src.source}
1023
  </span>
1024
+ <span className="text-xs tabular" title={src.stance_reason || src.stance}
1025
+ style={{ color: stanceColor, fontFamily: 'var(--font-display)', letterSpacing: '0.06em', cursor: src.stance_reason ? 'help' : 'default' }}>
1026
  {src.stance}
1027
  </span>
1028
  <span className="text-xs tabular" style={{ color: 'var(--text-muted)' }}>
ml/bow_classifier.py ADDED
@@ -0,0 +1,69 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """
2
+ PhilVerify β€” Bag of Words + Logistic Regression Classifier (Layer 1)
3
+
4
+ CountVectorizer (BoW) with LogisticRegression. Identical to TFIDFClassifier except
5
+ for the vectorizer β€” this isolates the BoW vs TF-IDF comparison in eval.py.
6
+ Supports optional WordNet lemmatization.
7
+ """
8
+ import logging
9
+
10
+ from ml.naive_bayes_classifier import _lemmatize_tokens
11
+ from ml.tfidf_classifier import Layer1Result
12
+
13
+ logger = logging.getLogger(__name__)
14
+
15
+
16
+ class BoWClassifier:
17
+ """
18
+ BoW (CountVectorizer) + LogisticRegression classifier.
19
+
20
+ Args:
21
+ train_samples: list[Sample] from ml.dataset. If None, uses the full 100-sample dataset.
22
+ lemmatize: apply WordNet lemmatization before vectorization.
23
+ """
24
+
25
+ _LABELS = {0: "Credible", 1: "Unverified", 2: "Likely Fake"}
26
+
27
+ def __init__(self, train_samples=None, lemmatize: bool = False):
28
+ from sklearn.feature_extraction.text import CountVectorizer
29
+ from sklearn.linear_model import LogisticRegression
30
+
31
+ self._lemmatize = lemmatize
32
+
33
+ if train_samples is None:
34
+ from ml.dataset import get_dataset
35
+ train_samples = get_dataset()
36
+
37
+ texts = [self._preprocess(s.text) for s in train_samples]
38
+ labels = [s.label for s in train_samples]
39
+
40
+ self._vectorizer = CountVectorizer(ngram_range=(1, 2), max_features=1000)
41
+ X = self._vectorizer.fit_transform(texts)
42
+
43
+ self._clf = LogisticRegression(max_iter=500, C=1.0, random_state=42)
44
+ self._clf.fit(X, labels)
45
+ logger.info(
46
+ "BoWClassifier trained on %d samples (lemmatize=%s)",
47
+ len(texts), lemmatize,
48
+ )
49
+
50
+ def _preprocess(self, text: str) -> str:
51
+ text = text.lower()
52
+ if self._lemmatize:
53
+ return " ".join(_lemmatize_tokens(text.split()))
54
+ return text
55
+
56
+ def predict(self, text: str) -> Layer1Result:
57
+ processed = self._preprocess(text)
58
+ X = self._vectorizer.transform([processed])
59
+ pred_label = int(self._clf.predict(X)[0])
60
+ proba = self._clf.predict_proba(X)[0]
61
+ confidence = round(float(max(proba)) * 100, 1)
62
+ verdict = self._LABELS[pred_label]
63
+
64
+ feature_names = self._vectorizer.get_feature_names_out()
65
+ bow_scores = X.toarray()[0]
66
+ top_idx = bow_scores.argsort()[-5:][::-1]
67
+ triggered = [feature_names[i] for i in top_idx if bow_scores[i] > 0]
68
+
69
+ return Layer1Result(verdict=verdict, confidence=confidence, triggered_features=triggered)
ml/dataset.py CHANGED
@@ -10,6 +10,7 @@ Languages: English, Filipino/Tagalog, Taglish (code-switched)
10
  """
11
 
12
  from __future__ import annotations
 
13
  from dataclasses import dataclass
14
 
15
  LABEL_NAMES = {0: "Credible", 1: "Unverified", 2: "Likely Fake"}
@@ -199,3 +200,40 @@ def class_weights(samples: list[Sample]) -> list[float]:
199
  for i in range(NUM_LABELS):
200
  weights.append(total / (NUM_LABELS * max(counts[i], 1)))
201
  return weights
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
10
  """
11
 
12
  from __future__ import annotations
13
+ import random as _random
14
  from dataclasses import dataclass
15
 
16
  LABEL_NAMES = {0: "Credible", 1: "Unverified", 2: "Likely Fake"}
 
200
  for i in range(NUM_LABELS):
201
  weights.append(total / (NUM_LABELS * max(counts[i], 1)))
202
  return weights
203
+
204
+
205
+ # ── Easy Data Augmentation (EDA) ──────────────────────────────────────────────
206
+
207
+ def _random_deletion(words: list[str], p: float = 0.12) -> list[str]:
208
+ """Randomly delete each word with probability p."""
209
+ if len(words) == 1:
210
+ return words
211
+ kept = [w for w in words if _random.random() > p]
212
+ return kept if kept else [_random.choice(words)]
213
+
214
+
215
+ def _random_swap(words: list[str], n: int = 1) -> list[str]:
216
+ """Randomly swap n pairs of adjacent words."""
217
+ out = words[:]
218
+ for _ in range(n):
219
+ i, j = _random.sample(range(len(out)), 2)
220
+ out[i], out[j] = out[j], out[i]
221
+ return out
222
+
223
+
224
def augment_samples(samples: list[Sample], seed: int = 42) -> list[Sample]:
    """
    Return augmented copies of samples using random deletion and random swap.

    The originals are NOT included β€” the caller decides whether to combine
    them. Produces up to 2Γ— the number of input samples (one deletion + one
    swap variant per sample; samples with fewer than 4 words are skipped).
    """
    # Fixed seed keeps the augmented corpus reproducible across runs.
    _random.seed(seed)
    out: list[Sample] = []
    for sample in samples:
        tokens = sample.text.split()
        if len(tokens) < 4:
            continue  # too short for a meaningful deletion/swap variant
        deleted = " ".join(_random_deletion(tokens[:]))
        swapped = " ".join(_random_swap(tokens[:]))
        out.append(Sample(deleted, sample.label))
        out.append(Sample(swapped, sample.label))
    return out
@@ -0,0 +1,76 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """
2
+ PhilVerify β€” Ensemble Classifier (Layer 1)
3
+
4
+ Averages softmax probabilities from XLMRobertaClassifier and
5
+ TagalogRobertaClassifier, then returns a single Layer1Result.
6
+
7
+ When only one classifier is passed the ensemble degrades gracefully
8
+ to that single model (no averaging needed, no performance penalty).
9
+ """
10
+ from __future__ import annotations
11
+
12
+ import logging
13
+
14
+ from ml.xlm_roberta_classifier import Layer1Result
15
+
16
+ logger = logging.getLogger(__name__)
17
+
18
+ LABEL_NAMES = {0: "Credible", 1: "Unverified", 2: "Likely Fake"}
19
+
20
+
21
class EnsembleClassifier:
    """
    Soft-voting ensemble over one or more classifiers that implement
    predict_probs(text) → (probs_tensor, attentions, input_ids).

    Averages the softmax probability vectors of every classifier that
    succeeds; members that raise are logged and skipped. Triggered features
    are taken from the classifier with the highest individual confidence
    (the most "sure" model).
    """

    def __init__(self, classifiers: list) -> None:
        """
        Args:
            classifiers: non-empty list of objects exposing predict_probs().

        Raises:
            ValueError: if *classifiers* is empty.
        """
        if not classifiers:
            raise ValueError("EnsembleClassifier requires at least one classifier")
        self._classifiers = classifiers

    def predict(self, text: str) -> Layer1Result:
        """Run every member classifier on *text* and soft-vote the verdict."""
        import torch

        all_probs = []
        all_attentions = []  # (attentions, input_ids, clf) per successful member

        for clf in self._classifiers:
            try:
                probs, attentions, input_ids = clf.predict_probs(text)
                all_probs.append(probs)
                all_attentions.append((attentions, input_ids, clf))
            except Exception as exc:
                # A single failing member must not sink the whole ensemble.
                logger.warning("Classifier %s failed during ensemble: %s", clf, exc)

        if not all_probs:
            # All classifiers failed — return a neutral Unverified result
            return Layer1Result(verdict="Unverified", confidence=33.3, triggered_features=[])

        # Average probabilities across all classifiers that succeeded
        avg_probs = torch.stack(all_probs).mean(dim=0)  # (num_labels,)
        pred_label = int(avg_probs.argmax().item())
        confidence = round(float(avg_probs[pred_label].item()) * 100, 1)
        verdict = LABEL_NAMES[pred_label]

        # Triggered features: from the classifier with highest individual confidence
        triggered: list[str] = []
        best_conf = -1.0
        for probs, (attentions, input_ids, clf) in zip(all_probs, all_attentions):
            clf_conf = float(probs.max().item())
            if clf_conf > best_conf and hasattr(clf, "_salient_tokens") and attentions:
                best_conf = clf_conf
                triggered = clf._salient_tokens(input_ids, attentions)

        logger.debug(
            "Ensemble (%d classifiers): %s %.1f%%", len(all_probs), verdict, confidence
        )
        return Layer1Result(
            verdict=verdict,
            confidence=confidence,
            triggered_features=triggered,
        )
ml/eval.py ADDED
@@ -0,0 +1,172 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """
2
+ Evaluate all PhilVerify classifiers on the held-out validation split.
3
+
4
+ Prints per-class precision/recall/F1, confusion matrix, and a side-by-side
5
+ accuracy summary for all model variants:
6
+
7
+ Classical (trained on train split):
8
+ BoW + LogReg
9
+ BoW + LogReg + Lemma
10
+ TF-IDF + LogReg (legacy SEED_DATA baseline)
11
+ TF-IDF + NB
12
+ TF-IDF + NB + Lemma
13
+ LDA features + LogReg
14
+
15
+ Transformer (loaded from saved checkpoints):
16
+ XLM-RoBERTa
17
+ Tagalog-RoBERTa
18
+ Ensemble (XLM-R + Tagalog-RoBERTa)
19
+
20
+ Usage:
21
+ cd PhilVerify
22
+ python -m ml.eval
23
+ python -m ml.eval --seed 42 --train-ratio 0.8 --skip-lda-analysis
24
+ """
25
+ import argparse
26
+ import logging
27
+
28
+ from sklearn.metrics import accuracy_score, classification_report, confusion_matrix
29
+
30
+ from ml.bow_classifier import BoWClassifier
31
+ from ml.dataset import LABEL_NAMES, get_split
32
+ from ml.ensemble_classifier import EnsembleClassifier
33
+ from ml.lda_analysis import LDAFeatureClassifier, run_topic_analysis
34
+ from ml.naive_bayes_classifier import NaiveBayesClassifier
35
+ from ml.tagalog_roberta_classifier import TagalogRobertaClassifier
36
+ from ml.tfidf_classifier import TFIDFClassifier
37
+ from ml.xlm_roberta_classifier import ModelNotFoundError, XLMRobertaClassifier
38
+
39
+ logging.basicConfig(level=logging.INFO, format="%(levelname)s: %(message)s")
40
+ logger = logging.getLogger(__name__)
41
+
42
+ LABEL_LIST = [LABEL_NAMES[i] for i in sorted(LABEL_NAMES)]
43
+
44
+
45
def evaluate_classifier(name: str, clf, samples: list) -> dict:
    """
    Evaluate *clf* on *samples* and print a full per-class report.

    Prints a classification report (precision/recall/F1) and a confusion
    matrix, then returns {"name": name, "accuracy": float in [0, 1]}.
    """
    true_labels: list[str] = []
    pred_labels: list[str] = []
    for sample in samples:
        true_labels.append(LABEL_NAMES[sample.label])
        pred_labels.append(clf.predict(sample.text).verdict)

    bar = "=" * 62
    print(f"\n{bar}")
    print(f" {name}")
    print(f"{bar}")
    print(classification_report(true_labels, pred_labels, labels=LABEL_LIST, zero_division=0))

    print("Confusion matrix (rows = true, cols = predicted):")
    print(f" {'':14}", " ".join(f"{lbl[:6]:>6}" for lbl in LABEL_LIST))
    cm = confusion_matrix(true_labels, pred_labels, labels=LABEL_LIST)
    for row_label, row in zip(LABEL_LIST, cm):
        print(f" {row_label:<14}", " ".join(f"{v:>6}" for v in row))

    return {"name": name, "accuracy": accuracy_score(true_labels, pred_labels)}
65
+
66
+
67
def main() -> None:
    """
    Evaluate every PhilVerify classifier variant on the held-out split and
    print per-model reports plus a final accuracy summary table.
    """
    parser = argparse.ArgumentParser(description="Evaluate PhilVerify classifiers")
    parser.add_argument("--seed", type=int, default=42,
                        help="Random seed (must match training seed)")
    parser.add_argument("--train-ratio", type=float, default=0.8,
                        help="Train split ratio (must match training)")
    parser.add_argument("--skip-lda-analysis", action="store_true",
                        help="Skip the LDA topic analysis printout")
    args = parser.parse_args()

    # Same split parameters as training, so validation samples were never seen.
    train_samples, val_samples = get_split(train_ratio=args.train_ratio, seed=args.seed)
    logger.info(
        "Train: %d samples | Val: %d samples (seed=%d, train_ratio=%.1f)",
        len(train_samples), len(val_samples), args.seed, args.train_ratio,
    )

    # ── LDA topic analysis (printed before classifier comparison) ────────────
    if not args.skip_lda_analysis:
        run_topic_analysis(train_samples)

    results: list[dict] = []

    # ── Classical baselines (all trained on train_samples for fair comparison) ─

    results.append(evaluate_classifier(
        "BoW + LogReg",
        BoWClassifier(train_samples),
        val_samples,
    ))

    results.append(evaluate_classifier(
        "BoW + LogReg + Lemma",
        BoWClassifier(train_samples, lemmatize=True),
        val_samples,
    ))

    # Legacy baseline (trains on internal SEED_DATA, not the split — included for reference)
    results.append(evaluate_classifier(
        "TF-IDF + LogReg [legacy SEED_DATA]",
        TFIDFClassifier(),
        val_samples,
    ))

    results.append(evaluate_classifier(
        "TF-IDF + NB",
        NaiveBayesClassifier(train_samples),
        val_samples,
    ))

    results.append(evaluate_classifier(
        "TF-IDF + NB + Lemma",
        NaiveBayesClassifier(train_samples, lemmatize=True),
        val_samples,
    ))

    results.append(evaluate_classifier(
        "LDA features + LogReg",
        LDAFeatureClassifier(train_samples),
        val_samples,
    ))

    # ── Transformer models ───────────────────────────────────────────────────
    # Each checkpoint is optional; a missing one is skipped with a warning so
    # the classical comparison still runs on a fresh checkout.
    xlmr = None
    try:
        xlmr = XLMRobertaClassifier()
        results.append(evaluate_classifier("XLM-RoBERTa", xlmr, val_samples))
    except ModelNotFoundError:
        logger.warning("XLM-RoBERTa checkpoint not found — skipping")

    tl = None
    try:
        tl = TagalogRobertaClassifier()
        results.append(evaluate_classifier("Tagalog-RoBERTa", tl, val_samples))
    except ModelNotFoundError:
        logger.warning("Tagalog-RoBERTa checkpoint not found — skipping")

    # The ensemble only makes sense when both transformer checkpoints loaded.
    if xlmr is not None and tl is not None:
        ensemble = EnsembleClassifier([xlmr, tl])
        results.append(evaluate_classifier(
            "Ensemble (XLM-R + Tagalog-RoBERTa)", ensemble, val_samples
        ))

    # ── Summary table ────────────────────────────────────────────────────────
    print(f"\n{'='*62}")
    print(" Summary")
    print(f"{'='*62}")
    print(f" {'Model':<44} {'Accuracy':>8}")
    print(f" {'-'*44} {'-'*8}")

    classical_done = False
    for r in results:
        is_transformer = any(
            kw in r["name"] for kw in ("XLM", "RoBERTa", "Tagalog", "Ensemble")
        )
        if is_transformer and not classical_done:
            print()  # blank separator between classical and transformer sections
            classical_done = True
        print(f" {r['name']:<44} {r['accuracy'] * 100:>7.1f}%")

    best = max(results, key=lambda r: r["accuracy"])
    print(f"\n Best: {best['name']} ({best['accuracy'] * 100:.1f}%)")
    print()
169
+
170
+
171
+ if __name__ == "__main__":
172
+ main()
ml/lda_analysis.py ADDED
@@ -0,0 +1,182 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """
2
+ PhilVerify β€” LDA Topic Analysis + LDA Feature Classifier (Layer 1)
3
+
4
+ Two responsibilities:
5
+
6
+ 1. run_topic_analysis(samples, n_topics)
7
+ Fits LDA on training texts, prints top-N words per topic and the dominant
8
+ topic distribution per class (Credible / Unverified / Likely Fake).
9
+ Call directly to explore what topics the model discovers.
10
+
11
+ 2. LDAFeatureClassifier
12
+ Concatenates LDA topic distribution features with TF-IDF features and feeds
13
+ the combined vector into LogisticRegression. Same predict() interface as
14
+ TFIDFClassifier β€” slots directly into eval.py.
15
+
16
+ Usage:
17
+ python -m ml.lda_analysis # standalone topic analysis
18
+ python -m ml.eval # compare LDAFeatureClassifier against others
19
+ """
20
+ import logging
21
+
22
+ import numpy as np
23
+ import scipy.sparse as sp
24
+
25
+ from ml.dataset import LABEL_NAMES, get_split
26
+ from ml.naive_bayes_classifier import _lemmatize_tokens
27
+ from ml.tfidf_classifier import Layer1Result
28
+
29
+ logger = logging.getLogger(__name__)
30
+
31
+ _LABELS = {0: "Credible", 1: "Unverified", 2: "Likely Fake"}
32
+
33
+
34
+ # ── Standalone topic analysis ──────────────────────────────────────────────────
35
+
36
def run_topic_analysis(
    samples,
    n_topics: int = 5,
    n_top_words: int = 10,
) -> None:
    """
    Fit LDA on *samples* and print:
      - the top-N words for each discovered topic, and
      - the two dominant topics (with mean weight) per class label.
    """
    from sklearn.decomposition import LatentDirichletAllocation
    from sklearn.feature_extraction.text import CountVectorizer

    corpus = [s.text.lower() for s in samples]
    gold = [s.label for s in samples]

    # LDA requires raw counts (not TF-IDF)
    counter = CountVectorizer(max_features=500, stop_words="english")
    counts = counter.fit_transform(corpus)
    vocab = counter.get_feature_names_out()

    lda = LatentDirichletAllocation(
        n_components=n_topics, random_state=42, max_iter=30, learning_method="batch"
    )
    doc_topics = lda.fit_transform(counts)  # (n_samples, n_topics)

    bar = "=" * 62
    print(f"\n{bar}")
    print(f" LDA Topic Analysis ({n_topics} topics, {len(samples)} samples)")
    print(f"{bar}")

    for topic_no, topic_vec in enumerate(lda.components_, start=1):
        strongest = topic_vec.argsort()[-n_top_words:][::-1]
        print(f"\n Topic {topic_no}: {', '.join(vocab[j] for j in strongest)}")

    print("\n Per-class dominant topics:")
    for label_id, label_name in sorted(LABEL_NAMES.items()):
        rows = [idx for idx, lab in enumerate(gold) if lab == label_id]
        if not rows:
            continue
        mean_dist = doc_topics[rows].mean(axis=0)
        leading = mean_dist.argsort()[-2:][::-1]
        summary = " ".join(f"T{d+1}:{mean_dist[d]:.2f}" for d in leading)
        print(f" {label_name:<14} {summary}")
80
+
81
+
82
+ # ── LDA Feature Classifier ─────────────────────────────────────────────────────
83
+
84
class LDAFeatureClassifier:
    """
    LDA topic distribution + TF-IDF features → LogisticRegression.

    Feature vector = sparse_hstack([tfidf_features, lda_topic_distribution])

    Args:
        train_samples: list[Sample]. If None, uses the full 100-sample dataset.
        n_topics: number of LDA topics (default 5).
        lemmatize: apply WordNet lemmatization before vectorization.
    """

    def __init__(self, train_samples=None, n_topics: int = 5, lemmatize: bool = False):
        from sklearn.decomposition import LatentDirichletAllocation
        from sklearn.feature_extraction.text import CountVectorizer, TfidfVectorizer
        from sklearn.linear_model import LogisticRegression

        self._lemmatize = lemmatize
        self._n_topics = n_topics

        if train_samples is None:
            from ml.dataset import get_dataset
            train_samples = get_dataset()

        corpus = [self._preprocess(s.text) for s in train_samples]
        targets = [s.label for s in train_samples]

        # TF-IDF branch of the feature vector
        self._tfidf = TfidfVectorizer(
            ngram_range=(1, 2), max_features=1000, sublinear_tf=True
        )
        tfidf_matrix = self._tfidf.fit_transform(corpus)

        # LDA branch — LDA needs raw term counts, not TF-IDF weights
        self._count_vec = CountVectorizer(max_features=500)
        count_matrix = self._count_vec.fit_transform(corpus)
        self._lda = LatentDirichletAllocation(
            n_components=n_topics, random_state=42, max_iter=30, learning_method="batch"
        )
        topic_matrix = self._lda.fit_transform(count_matrix)  # dense (n_samples, n_topics)

        # Concatenate sparse TF-IDF with the dense topic distributions
        combined = sp.hstack([tfidf_matrix, sp.csr_matrix(topic_matrix)])

        self._clf = LogisticRegression(max_iter=500, C=1.0, random_state=42)
        self._clf.fit(combined, targets)
        logger.info(
            "LDAFeatureClassifier trained on %d samples (n_topics=%d, lemmatize=%s)",
            len(corpus), n_topics, lemmatize,
        )

    def _preprocess(self, text: str) -> str:
        """Lower-case and (optionally) lemmatize before vectorization."""
        lowered = text.lower()
        if not self._lemmatize:
            return lowered
        return " ".join(_lemmatize_tokens(lowered.split()))

    def predict(self, text: str) -> Layer1Result:
        """Classify *text*; triggered features = dominant LDA topic + top TF-IDF terms."""
        cleaned = self._preprocess(text)
        tfidf_vec = self._tfidf.transform([cleaned])
        topic_vec = self._lda.transform(self._count_vec.transform([cleaned]))  # (1, n_topics)
        combined = sp.hstack([tfidf_vec, sp.csr_matrix(topic_vec)])

        label = int(self._clf.predict(combined)[0])
        probabilities = self._clf.predict_proba(combined)[0]

        # Top TF-IDF terms actually present in this text
        names = self._tfidf.get_feature_names_out()
        weights = tfidf_vec.toarray()[0]
        ranked = weights.argsort()[-4:][::-1]
        features = [names[i] for i in ranked if weights[i] > 0]

        # Prepend the dominant topic label so it always survives the [:5] cut
        features.insert(0, f"lda_topic_{int(topic_vec[0].argmax()) + 1}")

        return Layer1Result(
            verdict=_LABELS[label],
            confidence=round(float(max(probabilities)) * 100, 1),
            triggered_features=features[:5],
        )
168
+
169
+
170
+ # ── Direct run ─────────────────────────────────────────────────────────────────
171
+
172
if __name__ == "__main__":
    import argparse

    # Standalone topic exploration: fit LDA on the training split and print it.
    cli = argparse.ArgumentParser(description="LDA topic analysis on PhilVerify dataset")
    cli.add_argument("--n-topics", type=int, default=5)
    cli.add_argument("--n-top-words", type=int, default=10)
    cli.add_argument("--seed", type=int, default=42)
    opts = cli.parse_args()

    training, _ = get_split(seed=opts.seed)
    run_topic_analysis(training, n_topics=opts.n_topics, n_top_words=opts.n_top_words)
ml/models/tagalog_roberta_model/config.json ADDED
@@ -0,0 +1,40 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_cross_attention": false,
3
+ "architectures": [
4
+ "RobertaForSequenceClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "bos_token_id": 0,
8
+ "classifier_dropout": null,
9
+ "dtype": "float32",
10
+ "eos_token_id": 2,
11
+ "gradient_checkpointing": false,
12
+ "hidden_act": "gelu",
13
+ "hidden_dropout_prob": 0.1,
14
+ "hidden_size": 768,
15
+ "id2label": {
16
+ "0": "Credible",
17
+ "1": "Unverified",
18
+ "2": "Likely Fake"
19
+ },
20
+ "initializer_range": 0.02,
21
+ "intermediate_size": 3072,
22
+ "is_decoder": false,
23
+ "label2id": {
24
+ "Credible": 0,
25
+ "Likely Fake": 2,
26
+ "Unverified": 1
27
+ },
28
+ "layer_norm_eps": 1e-05,
29
+ "max_position_embeddings": 514,
30
+ "model_type": "roberta",
31
+ "num_attention_heads": 12,
32
+ "num_hidden_layers": 12,
33
+ "pad_token_id": 1,
34
+ "position_embedding_type": "absolute",
35
+ "tie_word_embeddings": true,
36
+ "transformers_version": "5.3.0",
37
+ "type_vocab_size": 1,
38
+ "use_cache": true,
39
+ "vocab_size": 30000
40
+ }
ml/models/tagalog_roberta_model/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
ml/models/tagalog_roberta_model/tokenizer_config.json ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "backend": "tokenizers",
4
+ "bos_token": "<s>",
5
+ "cls_token": "<s>",
6
+ "eos_token": "</s>",
7
+ "errors": "replace",
8
+ "is_local": false,
9
+ "mask_token": "<mask>",
10
+ "max_length": 512,
11
+ "model_max_length": 1000000000000000019884624838656,
12
+ "pad_token": "<pad>",
13
+ "sep_token": "</s>",
14
+ "stride": 0,
15
+ "tokenizer_class": "RobertaTokenizer",
16
+ "trim_offsets": true,
17
+ "truncation_side": "right",
18
+ "truncation_strategy": "longest_first",
19
+ "unk_token": "<unk>"
20
+ }
ml/naive_bayes_classifier.py ADDED
@@ -0,0 +1,111 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """
2
+ PhilVerify β€” TF-IDF + Naive Bayes Classifier (Layer 1)
3
+
4
+ MultinomialNB with TF-IDF features. Trains on the provided sample split so that
5
+ eval comparisons are fair (same train/val split as transformer models).
6
+ Supports optional WordNet lemmatization to measure its effect on Filipino/Taglish text.
7
+ """
8
+ import logging
9
+
10
+ logger = logging.getLogger(__name__)
11
+
12
+
13
+ def _lemmatize_tokens(tokens: list[str]) -> list[str]:
14
+ """
15
+ Lemmatize tokens with POS-aware WordNet lemmatization.
16
+ Downloads required NLTK data on first call. Falls back to identity on any error.
17
+ Note: WordNet is English-biased β€” Tagalog tokens are returned unchanged.
18
+ """
19
+ try:
20
+ import nltk
21
+ from nltk.corpus import wordnet
22
+ from nltk.stem import WordNetLemmatizer
23
+
24
+ for resource, path in [
25
+ ("wordnet", "corpora/wordnet"),
26
+ ("averaged_perceptron_tagger_eng", "taggers/averaged_perceptron_tagger_eng"),
27
+ ]:
28
+ try:
29
+ nltk.data.find(path)
30
+ except LookupError:
31
+ nltk.download(resource, quiet=True)
32
+
33
+ def _wn_pos(tag: str) -> str:
34
+ if tag.startswith("J"):
35
+ return wordnet.ADJ
36
+ if tag.startswith("V"):
37
+ return wordnet.VERB
38
+ if tag.startswith("R"):
39
+ return wordnet.ADV
40
+ return wordnet.NOUN
41
+
42
+ lemmatizer = WordNetLemmatizer()
43
+ tagged = nltk.pos_tag(tokens)
44
+ return [lemmatizer.lemmatize(w, _wn_pos(t)) for w, t in tagged]
45
+ except Exception as exc:
46
+ logger.debug("Lemmatization skipped (%s) β€” returning raw tokens", exc)
47
+ return tokens
48
+
49
+
50
+ # Import shared result type
51
+ from ml.tfidf_classifier import Layer1Result # noqa: E402
52
+
53
+
54
class NaiveBayesClassifier:
    """
    TF-IDF + MultinomialNB classifier. Same predict() interface as TFIDFClassifier.

    Args:
        train_samples: list[Sample] from ml.dataset. If None, uses the full 100-sample dataset.
        lemmatize: apply WordNet lemmatization before vectorization.
    """

    _LABELS = {0: "Credible", 1: "Unverified", 2: "Likely Fake"}

    def __init__(self, train_samples=None, lemmatize: bool = False):
        from sklearn.feature_extraction.text import TfidfVectorizer
        from sklearn.naive_bayes import MultinomialNB

        self._lemmatize = lemmatize

        if train_samples is None:
            from ml.dataset import get_dataset
            train_samples = get_dataset()

        corpus = [self._preprocess(s.text) for s in train_samples]
        targets = [s.label for s in train_samples]

        self._vectorizer = TfidfVectorizer(
            ngram_range=(1, 2),
            max_features=1000,
            sublinear_tf=True,
        )
        matrix = self._vectorizer.fit_transform(corpus)

        self._clf = MultinomialNB(alpha=1.0)
        self._clf.fit(matrix, targets)
        logger.info(
            "NaiveBayesClassifier trained on %d samples (lemmatize=%s)",
            len(corpus), lemmatize,
        )

    def _preprocess(self, text: str) -> str:
        """Lower-case and (optionally) lemmatize before vectorization."""
        lowered = text.lower()
        if not self._lemmatize:
            return lowered
        return " ".join(_lemmatize_tokens(lowered.split()))

    def predict(self, text: str) -> Layer1Result:
        """Classify *text*, returning verdict, confidence %, and top TF-IDF features."""
        vec = self._vectorizer.transform([self._preprocess(text)])
        label = int(self._clf.predict(vec)[0])
        probabilities = self._clf.predict_proba(vec)[0]

        # Top-5 TF-IDF terms actually present in this text
        names = self._vectorizer.get_feature_names_out()
        weights = vec.toarray()[0]
        ranked = weights.argsort()[-5:][::-1]
        features = [names[i] for i in ranked if weights[i] > 0]

        return Layer1Result(
            verdict=self._LABELS[label],
            confidence=round(float(max(probabilities)) * 100, 1),
            triggered_features=features,
        )
ml/tagalog_roberta_classifier.py ADDED
@@ -0,0 +1,157 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """
2
+ PhilVerify β€” Tagalog-RoBERTa Sequence Classifier (Layer 1)
3
+
4
+ Fine-tuned on Philippine misinformation data using jcblaise/roberta-tagalog-base
5
+ as the backbone. This model was pre-trained on TLUnified β€” a large, topically-
6
+ varied Filipino corpus β€” and shows +4.47% average accuracy gain over prior
7
+ Filipino models on classification tasks.
8
+
9
+ Drop-in replacement for XLMRobertaClassifier β€” same predict() interface.
10
+ Checkpoint: ml/models/tagalog_roberta_model/ (populated by train_tagalog_roberta.py).
11
+ Raises ModelNotFoundError if checkpoint missing so the engine falls back gracefully.
12
+ """
13
+ from __future__ import annotations
14
+
15
+ import logging
16
+ from dataclasses import dataclass, field
17
+ from pathlib import Path
18
+
19
+ from ml.xlm_roberta_classifier import Layer1Result, ModelNotFoundError
20
+
21
+ logger = logging.getLogger(__name__)
22
+
23
+ MODEL_DIR = Path(__file__).parent / "models" / "tagalog_roberta_model"
24
+ LABEL_NAMES = {0: "Credible", 1: "Unverified", 2: "Likely Fake"}
25
+ NUM_LABELS = 3
26
+ MAX_LENGTH = 256
27
+
28
+
29
class TagalogRobertaClassifier:
    """
    jcblaise/roberta-tagalog-base fine-tuned for misinformation classification.

    Loading is lazy: the model is not loaded until the first call to predict().
    Raises ModelNotFoundError on instantiation if the checkpoint is missing.
    Inference runs on the best available device (mps > cuda > cpu); probability
    tensors returned by predict_probs() are always on CPU so the ensemble can
    stack them regardless of where each member runs.
    """

    def __init__(self) -> None:
        """Fail fast with ModelNotFoundError if the checkpoint dir is absent."""
        if not MODEL_DIR.exists():
            raise ModelNotFoundError(
                f"Tagalog-RoBERTa checkpoint not found at {MODEL_DIR}. "
                "Run `python ml/train_tagalog_roberta.py` to fine-tune the model first."
            )
        self._tokenizer = None
        self._model = None

    # ── Lazy load ─────────────────────────────────────────────────────────────

    def _ensure_loaded(self) -> None:
        """Load tokenizer + model on first use and place the model on _device."""
        if self._model is not None:
            return
        from transformers import AutoTokenizer, AutoModelForSequenceClassification
        import torch
        self._torch = torch
        logger.info("Loading Tagalog-RoBERTa from %s …", MODEL_DIR)
        self._tokenizer = AutoTokenizer.from_pretrained(str(MODEL_DIR))
        self._model = AutoModelForSequenceClassification.from_pretrained(
            str(MODEL_DIR),
            num_labels=NUM_LABELS,
        )
        # BUGFIX: the model previously stayed on CPU while the log line below
        # claimed mps/cuda. Actually move it to the reported device.
        self._model.to(self._device)
        self._model.eval()
        logger.info("Tagalog-RoBERTa loaded — device: %s", self._device)

    @property
    def _device(self) -> str:
        """Best available inference device: 'mps', then 'cuda', else 'cpu'."""
        try:
            import torch
            if torch.backends.mps.is_available():
                return "mps"
        except Exception:
            pass
        try:
            import torch
            if torch.cuda.is_available():
                return "cuda"
        except Exception:
            pass
        return "cpu"

    # ── Saliency: attention-based token importance ────────────────────────────

    def _salient_tokens(self, input_ids, attentions, n: int = 5) -> list[str]:
        """
        Return up to *n* distinct words the model attended to most.

        Uses the last attention layer's CLS row averaged over heads, and
        filters out special tokens and short/non-alphabetic subwords.
        """
        last_layer_attn = attentions[-1]
        # CLS attention to every position, averaged across heads
        cls_attn = last_layer_attn[0, :, 0, :].mean(0)
        seq_len = cls_attn.shape[-1]
        tokens = self._tokenizer.convert_ids_to_tokens(
            input_ids[0].tolist()[:seq_len]
        )
        scored = []
        for tok, score in zip(tokens, cls_attn.tolist()):
            if tok in ("<s>", "</s>", "<pad>", "<unk>"):
                continue
            clean = tok.lstrip("▁").strip()
            if len(clean) >= 3 and clean.isalpha():
                scored.append((clean, score))

        # Deduplicate case-insensitively, keeping highest-attention order
        seen: set[str] = set()
        result = []
        for word, _ in sorted(scored, key=lambda x: x[1], reverse=True):
            if word.lower() not in seen:
                seen.add(word.lower())
                result.append(word)
                if len(result) >= n:
                    break
        return result

    # ── Public API ────────────────────────────────────────────────────────────

    def _encode(self, text: str):
        """Tokenize *text* and move the tensors to the model's device."""
        encoding = self._tokenizer(
            text,
            truncation=True,
            max_length=MAX_LENGTH,
            return_tensors="pt",
        )
        device = next(self._model.parameters()).device
        return {k: v.to(device) for k, v in encoding.items()}

    def predict(self, text: str) -> Layer1Result:
        """Classify *text* into Credible / Unverified / Likely Fake."""
        self._ensure_loaded()
        import torch

        encoding = self._encode(text)
        with torch.no_grad():
            outputs = self._model(
                input_ids=encoding["input_ids"],
                attention_mask=encoding["attention_mask"],
                output_attentions=True,
            )

        logits = outputs.logits[0]
        probs = torch.softmax(logits, dim=-1)
        pred_label = int(probs.argmax().item())
        confidence = round(float(probs[pred_label].item()) * 100, 1)

        # SDPA attention doesn't return attentions; fallback to empty
        triggered = self._salient_tokens(encoding["input_ids"], outputs.attentions) if outputs.attentions else []

        return Layer1Result(
            verdict=LABEL_NAMES[pred_label],
            confidence=confidence,
            triggered_features=triggered,
        )

    def predict_probs(self, text: str):
        """Return (softmax probs on CPU, attentions, input_ids) for ensemble averaging."""
        self._ensure_loaded()
        import torch

        encoding = self._encode(text)
        with torch.no_grad():
            outputs = self._model(
                input_ids=encoding["input_ids"],
                attention_mask=encoding["attention_mask"],
                output_attentions=True,
            )
        # .cpu() keeps the return contract identical to CPU-only inference so
        # the ensemble can torch.stack() probs from members on any device.
        return torch.softmax(outputs.logits[0], dim=-1).cpu(), outputs.attentions, encoding["input_ids"]
ml/train_tagalog_roberta.py ADDED
@@ -0,0 +1,287 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #!/usr/bin/env python3
2
+ """
3
+ PhilVerify β€” Tagalog-RoBERTa Fine-tuning Script
4
+
5
+ Fine-tunes jcblaise/roberta-tagalog-base on the PhilVerify labeled dataset.
6
+ The model was pre-trained on TLUnified, a large Filipino corpus, and
7
+ outperforms XLM-RoBERTa-base on Tagalog classification by ~4.47% accuracy.
8
+
9
+ Saves the checkpoint to ml/models/tagalog_roberta_model/ for use by
10
+ TagalogRobertaClassifier and the EnsembleClassifier.
11
+
12
+ Usage:
13
+ cd PhilVerify/
14
+ source venv/bin/activate
15
+ python ml/train_tagalog_roberta.py [--epochs N] [--lr FLOAT] [--batch-size N]
16
+
17
+ Typical runtime (CPU, MacBook M1): ~8–12 minutes for 5 epochs
18
+ Typical runtime (GPU/MPS): ~1–2 minutes
19
+ """
20
+ from __future__ import annotations
21
+
22
+ import argparse
23
+ import logging
24
+ import sys
25
+ import time
26
+ from pathlib import Path
27
+
28
+ sys.path.insert(0, str(Path(__file__).parent.parent))
29
+
30
+ logging.basicConfig(
31
+ level=logging.INFO,
32
+ format="%(asctime)s %(levelname)-8s %(message)s",
33
+ datefmt="%H:%M:%S",
34
+ )
35
+ logger = logging.getLogger(__name__)
36
+
37
+ OUTPUT_DIR = Path(__file__).parent / "models" / "tagalog_roberta_model"
38
+ BASE_MODEL = "jcblaise/roberta-tagalog-base"
39
+ MAX_LENGTH = 256
40
+
41
+
42
+ # ── PyTorch Dataset ───────────────────────────────────────────────────────────
43
+
44
class PhilVerifyDataset:
    """Pre-tokenized (input_ids, attention_mask, labels) dataset for the training loop."""

    def __init__(self, samples, tokenizer) -> None:
        import torch

        # Tokenize the whole corpus up-front; padding to MAX_LENGTH keeps
        # every item the same shape for simple batching.
        self.encodings = tokenizer(
            [s.text for s in samples],
            truncation=True,
            padding="max_length",
            max_length=MAX_LENGTH,
            return_tensors="pt",
        )
        self.labels = torch.tensor([s.label for s in samples], dtype=torch.long)

    def __len__(self) -> int:
        return self.labels.shape[0]

    def __getitem__(self, idx: int):
        item = {key: self.encodings[key][idx] for key in ("input_ids", "attention_mask")}
        item["labels"] = self.labels[idx]
        return item
65
+
66
+
67
+ # ── Freeze helpers ────────────────────────────────────────────────────────────
68
+
69
def freeze_lower_layers(model, keep_top_n: int = 2) -> int:
    """
    Freeze the embeddings and all but the top *keep_top_n* encoder layers.

    The classifier head and the top layers keep requires_grad=True so only
    they are fine-tuned. Returns the total number of parameters frozen.
    """
    encoder_layers = model.roberta.encoder.layer
    total_layers = len(encoder_layers)
    cutoff = total_layers - keep_top_n

    frozen = 0
    for idx, layer in enumerate(encoder_layers):
        if idx >= cutoff:
            continue
        for param in layer.parameters():
            param.requires_grad = False
            frozen += param.numel()

    for param in model.roberta.embeddings.parameters():
        param.requires_grad = False
        frozen += param.numel()

    logger.info(
        "Frozen %d / %d encoder layers (keeping top %d + classifier head). "
        "%d params frozen.",
        cutoff, total_layers, keep_top_n, frozen,
    )
    return frozen
90
+
91
+
92
+ # ── Metrics ───────────────────────────────────────────────────────────────────
93
+
94
def evaluate(model, loader, device) -> dict:
    """
    Run one evaluation pass over *loader* with gradients disabled.

    Returns {"loss": mean cross-entropy rounded to 4 dp,
             "accuracy": percent correct rounded to 1 dp}.
    An empty loader yields {"loss": 0.0, "accuracy": 0.0} (no ZeroDivisionError).
    """
    import torch

    model.eval()
    criterion = torch.nn.CrossEntropyLoss()
    predictions: list[int] = []
    targets: list[int] = []
    loss_sum = 0.0
    batches = 0

    with torch.no_grad():
        for raw_batch in loader:
            batch = {name: tensor.to(device) for name, tensor in raw_batch.items()}
            gold = batch["labels"]
            out = model(
                input_ids=batch["input_ids"],
                attention_mask=batch["attention_mask"],
            )
            loss_sum += criterion(out.logits, gold).item()
            predictions.extend(out.logits.argmax(dim=-1).cpu().tolist())
            targets.extend(gold.cpu().tolist())
            batches += 1

    hits = sum(int(p == t) for p, t in zip(predictions, targets))
    return {
        "loss": round(loss_sum / max(batches, 1), 4),
        "accuracy": round(hits / max(len(targets), 1) * 100, 1),
    }
122
+
123
+
124
# ── Main training loop ────────────────────────────────────────────────────────

def train(
    epochs: int = 5,
    lr: float = 2e-5,
    batch_size: int = 8,
    freeze: bool = True,
    keep_top_n: int = 2,
    seed: int = 42,
) -> None:
    """Fine-tune BASE_MODEL on the combined PhilVerify dataset.

    Saves a checkpoint to OUTPUT_DIR every time validation accuracy ties or
    improves on the best seen so far; the final checkpoint on disk is the
    best-by-val-accuracy epoch, not necessarily the last.

    Args:
        epochs: number of training epochs.
        lr: peak AdamW learning rate (warmup then linear decay).
        batch_size: per-step batch size for both train and val loaders.
        freeze: if True, freeze embeddings + lower encoder layers.
        keep_top_n: number of top encoder layers left trainable when freezing.
        seed: torch manual seed and dataset split/augmentation seed.
    """
    # Heavy imports deferred so importing this module stays cheap.
    import torch
    from torch.utils.data import DataLoader
    from transformers import AutoTokenizer, AutoModelForSequenceClassification
    from ml.combined_dataset import get_split, class_weights, LABEL_NAMES, NUM_LABELS
    from ml.dataset import augment_samples

    torch.manual_seed(seed)

    # Device preference: Apple MPS β†’ CUDA β†’ CPU.
    if torch.backends.mps.is_available():
        device = torch.device("mps")
    elif torch.cuda.is_available():
        device = torch.device("cuda")
    else:
        device = torch.device("cpu")
    logger.info("Device: %s", device)

    # Split, then augment ONLY the training portion (val stays untouched).
    train_samples, val_samples = get_split(train_ratio=0.8, seed=seed)
    aug = augment_samples(train_samples, seed=seed)
    train_samples = train_samples + aug
    logger.info(
        "Dataset: %d train (%d original + %d augmented) / %d val",
        len(train_samples), len(train_samples) - len(aug), len(aug), len(val_samples),
    )

    logger.info("Loading tokenizer: %s …", BASE_MODEL)
    tokenizer = AutoTokenizer.from_pretrained(BASE_MODEL)

    train_ds = PhilVerifyDataset(train_samples, tokenizer)
    val_ds = PhilVerifyDataset(val_samples, tokenizer)

    train_loader = DataLoader(train_ds, batch_size=batch_size, shuffle=True)
    val_loader = DataLoader(val_ds, batch_size=batch_size, shuffle=False)

    logger.info("Loading model: %s …", BASE_MODEL)
    model = AutoModelForSequenceClassification.from_pretrained(
        BASE_MODEL,
        num_labels=NUM_LABELS,
        id2label=LABEL_NAMES,
        label2id={v: k for k, v in LABEL_NAMES.items()},
    )
    if freeze:
        freeze_lower_layers(model, keep_top_n=keep_top_n)
    model.to(device)

    total_params = sum(p.numel() for p in model.parameters())
    trainable_params = sum(p.numel() for p in model.parameters() if p.requires_grad)
    logger.info(
        "Parameters: %d total / %d trainable (%.1f%%)",
        total_params, trainable_params, trainable_params / total_params * 100,
    )

    # Class-weighted loss to counter label imbalance in the (augmented) train set.
    weights = torch.tensor(
        class_weights(train_samples), dtype=torch.float
    ).to(device)
    logger.info("Class weights: %s", [round(w, 3) for w in weights.tolist()])
    loss_fn = torch.nn.CrossEntropyLoss(weight=weights)

    # Optimize only trainable params (frozen layers excluded).
    optimizer = torch.optim.AdamW(
        filter(lambda p: p.requires_grad, model.parameters()),
        lr=lr,
        weight_decay=0.01,
    )

    total_steps = epochs * len(train_loader)
    warmup_steps = max(1, total_steps // 10)

    def lr_lambda(step: int) -> float:
        # Linear warmup for the first ~10% of steps, then linear decay
        # floored at 5% of the peak lr.
        if step < warmup_steps:
            return step / warmup_steps
        progress = (step - warmup_steps) / max(total_steps - warmup_steps, 1)
        return max(0.05, 1.0 - progress)

    scheduler = torch.optim.lr_scheduler.LambdaLR(optimizer, lr_lambda)

    best_val_acc = 0.0
    best_epoch = 0
    global_step = 0

    for epoch in range(1, epochs + 1):
        model.train()
        epoch_loss = 0.0
        t0 = time.time()

        for batch in train_loader:
            batch = {k: v.to(device) for k, v in batch.items()}
            labels = batch["labels"]
            optimizer.zero_grad()
            outputs = model(
                input_ids=batch["input_ids"],
                attention_mask=batch["attention_mask"],
            )
            loss = loss_fn(outputs.logits, labels)
            loss.backward()
            # Clip only the trainable params (matches the optimizer's set).
            torch.nn.utils.clip_grad_norm_(
                filter(lambda p: p.requires_grad, model.parameters()), 1.0
            )
            optimizer.step()
            scheduler.step()
            epoch_loss += loss.item()
            global_step += 1

        avg_loss = epoch_loss / max(len(train_loader), 1)
        val_metrics = evaluate(model, val_loader, device)
        elapsed = time.time() - t0

        logger.info(
            "Epoch %d/%d train_loss=%.4f val_loss=%.4f val_acc=%.1f%% (%.0fs)",
            epoch, epochs, avg_loss,
            val_metrics["loss"], val_metrics["accuracy"], elapsed,
        )

        # ">=" so a tie still refreshes the checkpoint with the later epoch.
        if val_metrics["accuracy"] >= best_val_acc:
            best_val_acc = val_metrics["accuracy"]
            best_epoch = epoch
            _save(model, tokenizer)

    logger.info(
        "Training complete. Best val_acc=%.1f%% at epoch %d. Saved β†’ %s",
        best_val_acc, best_epoch, OUTPUT_DIR,
    )
254
+
255
+
256
def _save(model, tokenizer) -> None:
    """Persist the model and tokenizer checkpoint to OUTPUT_DIR."""
    OUTPUT_DIR.mkdir(parents=True, exist_ok=True)
    target = str(OUTPUT_DIR)
    model.save_pretrained(target)
    tokenizer.save_pretrained(target)
    logger.info("Checkpoint saved to %s", OUTPUT_DIR)
261
+
262
+
263
# ── CLI ───────────────────────────────────────────────────────────────────────

def parse_args() -> argparse.Namespace:
    """Parse command-line flags for a fine-tuning run."""
    parser = argparse.ArgumentParser(
        description="Fine-tune jcblaise/roberta-tagalog-base for PhilVerify",
    )
    parser.add_argument("--epochs", type=int, default=5, help="Training epochs (default: 5)")
    parser.add_argument("--lr", type=float, default=2e-5, help="Learning rate (default: 2e-5)")
    parser.add_argument("--batch-size", type=int, default=8, help="Batch size (default: 8)")
    parser.add_argument("--keep-top-n", type=int, default=2, help="Unfrozen encoder layers (default: 2)")
    parser.add_argument("--no-freeze", action="store_true", help="Train all layers")
    parser.add_argument("--seed", type=int, default=42, help="Random seed (default: 42)")
    return parser.parse_args()
276
+
277
+
278
if __name__ == "__main__":
    # CLI entry point. Note --no-freeze inverts the `freeze` kwarg:
    # freezing is the default, the flag opts out.
    args = parse_args()
    train(
        epochs=args.epochs,
        lr=args.lr,
        batch_size=args.batch_size,
        freeze=not args.no_freeze,
        keep_top_n=args.keep_top_n,
        seed=args.seed,
    )
ml/train_xlmr.py CHANGED
@@ -138,6 +138,7 @@ def train(
138
  from torch.utils.data import DataLoader
139
  from transformers import AutoTokenizer, AutoModelForSequenceClassification
140
  from ml.combined_dataset import get_split, class_weights, LABEL_NAMES, NUM_LABELS
 
141
 
142
  # ── Reproducibility ───────────────────────────────────────────────────────
143
  torch.manual_seed(seed)
@@ -153,7 +154,12 @@ def train(
153
 
154
  # ── Data ──────────────────────────────────────────────────────────────────
155
  train_samples, val_samples = get_split(train_ratio=0.8, seed=seed)
156
- logger.info("Dataset: %d train / %d val", len(train_samples), len(val_samples))
 
 
 
 
 
157
 
158
  logger.info("Loading tokenizer: %s …", BASE_MODEL)
159
  tokenizer = AutoTokenizer.from_pretrained(BASE_MODEL)
 
138
  from torch.utils.data import DataLoader
139
  from transformers import AutoTokenizer, AutoModelForSequenceClassification
140
  from ml.combined_dataset import get_split, class_weights, LABEL_NAMES, NUM_LABELS
141
+ from ml.dataset import augment_samples
142
 
143
  # ── Reproducibility ───────────────────────────────────────────────────────
144
  torch.manual_seed(seed)
 
154
 
155
  # ── Data ──────────────────────────────────────────────────────────────────
156
  train_samples, val_samples = get_split(train_ratio=0.8, seed=seed)
157
+ aug = augment_samples(train_samples, seed=seed)
158
+ train_samples = train_samples + aug
159
+ logger.info(
160
+ "Dataset: %d train (%d original + %d augmented) / %d val",
161
+ len(train_samples), len(train_samples) - len(aug), len(aug), len(val_samples),
162
+ )
163
 
164
  logger.info("Loading tokenizer: %s …", BASE_MODEL)
165
  tokenizer = AutoTokenizer.from_pretrained(BASE_MODEL)
ml/xlm_roberta_classifier.py CHANGED
@@ -136,6 +136,25 @@ class XLMRobertaClassifier:
136
 
137
  # ── Public API (same interface as TFIDFClassifier) ────────────────────────
138
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
139
  def predict(self, text: str) -> Layer1Result:
140
  self._ensure_loaded()
141
  import torch
@@ -162,7 +181,8 @@ class XLMRobertaClassifier:
162
  confidence = round(float(probs[pred_label].item()) * 100, 1)
163
  verdict = LABEL_NAMES[pred_label]
164
 
165
- triggered = self._salient_tokens(input_ids, outputs.attentions)
 
166
 
167
  return Layer1Result(
168
  verdict=verdict,
 
136
 
137
  # ── Public API (same interface as TFIDFClassifier) ────────────────────────
138
 
139
+ def predict_probs(self, text: str):
140
+ """Return raw softmax probability tensor for ensemble averaging."""
141
+ self._ensure_loaded()
142
+ import torch
143
+
144
+ encoding = self._tokenizer(
145
+ text,
146
+ truncation=True,
147
+ max_length=MAX_LENGTH,
148
+ return_tensors="pt",
149
+ )
150
+ with torch.no_grad():
151
+ outputs = self._model(
152
+ input_ids=encoding["input_ids"],
153
+ attention_mask=encoding["attention_mask"],
154
+ output_attentions=True,
155
+ )
156
+ return torch.softmax(outputs.logits[0], dim=-1), outputs.attentions, encoding["input_ids"]
157
+
158
  def predict(self, text: str) -> Layer1Result:
159
  self._ensure_loaded()
160
  import torch
 
181
  confidence = round(float(probs[pred_label].item()) * 100, 1)
182
  verdict = LABEL_NAMES[pred_label]
183
 
184
+ # SDPA attention doesn't return attentions; fallback to empty
185
+ triggered = self._salient_tokens(input_ids, outputs.attentions) if outputs.attentions else []
186
 
187
  return Layer1Result(
188
  verdict=verdict,
nlp/claim_extractor.py CHANGED
@@ -1,8 +1,15 @@
1
  """
2
  PhilVerify β€” Claim Extractor
3
  Extracts the key falsifiable claim from noisy social media text.
4
- Primary: HuggingFace summarization (t5-small)
5
- Fallback: First 2 sentence heuristic
 
 
 
 
 
 
 
6
  """
7
  import re
8
  import logging
@@ -12,73 +19,72 @@ logger = logging.getLogger(__name__)
12
 
13
  _SENTENCE_SPLIT = re.compile(r"(?<=[.!?])\s+")
14
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
15
 
16
  @dataclass
17
  class ClaimResult:
18
  claim: str
19
- method: str # "summarization" | "sentence_heuristic"
 
 
 
 
 
 
 
 
 
 
 
20
 
21
 
22
  class ClaimExtractor:
23
  """
24
- Extracts the single most falsifiable claim from input text.
25
- This claim is then sent to the NewsAPI evidence retrieval step.
 
26
 
27
- Prompt engineering guide:
28
- The summarization model is given a task-specific prefix to bias it
29
- toward extracting assertions rather than summaries.
30
  """
31
 
32
- _TASK_PREFIX = "Extract the main factual claim: "
33
-
34
- def __init__(self):
35
- self._pipe = None
36
- self._loaded = False
37
-
38
- def _load_model(self):
39
- if self._loaded:
40
- return
41
- try:
42
- from transformers import pipeline
43
- self._pipe = pipeline(
44
- "summarization",
45
- model="sshleifer/distilbart-cnn-6-6",
46
- max_length=80,
47
- min_length=10,
48
- do_sample=False,
49
- )
50
- logger.info("Claim extractor model loaded (distilbart-cnn-6-6)")
51
- except Exception as e:
52
- logger.warning("Summarization model not available (%s) β€” using sentence heuristic", e)
53
- self._loaded = True
54
-
55
- def _sentence_heuristic(self, text: str) -> str:
56
- """Return the first 1-2 sentences as the claim (fast fallback)."""
57
- sentences = _SENTENCE_SPLIT.split(text.strip())
58
- candidates = [s.strip() for s in sentences if len(s.strip()) > 20]
59
- if not candidates:
60
- return text[:200].strip()
61
- return " ".join(candidates[:2])
62
-
63
  def extract(self, text: str) -> ClaimResult:
64
- self._load_model()
65
-
66
  if not text or len(text.strip()) < 20:
67
  return ClaimResult(claim=text.strip(), method="passthrough")
68
 
69
- if self._pipe:
70
- try:
71
- input_text = self._TASK_PREFIX + text[:1024]
72
- out = self._pipe(input_text, truncation=True)
73
- claim = out[0]["summary_text"].strip()
74
- # Strip the task prefix echo if model includes it
75
- claim = re.sub(r"^extract the main factual claim:?\s*", "", claim, flags=re.I)
76
- if len(claim) > 15:
77
- return ClaimResult(claim=claim, method="summarization")
78
- except Exception as e:
79
- logger.warning("Summarization inference error: %s", e)
80
 
 
81
  return ClaimResult(
82
- claim=self._sentence_heuristic(text),
83
  method="sentence_heuristic",
84
  )
 
1
  """
2
  PhilVerify β€” Claim Extractor
3
  Extracts the key falsifiable claim from noisy social media text.
4
+
5
+ Strategy: sentence scoring based on presence of named entities,
6
+ verbs, dates, and numbers β€” no heavy model required.
7
+
8
+ Filipino fake news headlines almost always embed the checkworthy
9
+ assertion in a sentence that contains a specific number/date + person/org
10
+ name + an attribution verb (sinabi, ayon, announced, confirmed, etc.).
11
+ Scoring these signals finds the right sentence faster and more reliably
12
+ than a summarization model that was trained on English news compression.
13
  """
14
  import re
15
  import logging
 
19
 
20
  _SENTENCE_SPLIT = re.compile(r"(?<=[.!?])\s+")
21
 
22
+ # Numbers, percentages, or month names signal a specific, verifiable claim
23
+ _DATE_OR_NUM = re.compile(
24
+ r"\b(\d[\d,.%]*"
25
+ r"|(?:January|February|March|April|May|June|July|August|"
26
+ r"September|October|November|December)"
27
+ r"|(?:Enero|Pebrero|Marso|Abril|Mayo|Hunyo|Hulyo|Agosto|"
28
+ r"Setyembre|Oktubre|Nobyembre|Disyembre))\b",
29
+ re.IGNORECASE,
30
+ )
31
+
32
+ # Attribution / assertion verbs in English and Filipino
33
+ _VERB_PATTERN = re.compile(
34
+ r"\b(is|are|was|were|has|have|had|will|would"
35
+ r"|said|says|announced|confirmed|reported|claims|showed"
36
+ r"|found|revealed|arrested|killed|died|signed|approved|ordered"
37
+ r"|sinabi|ipinahayag|inanunsyo|kinumpirma|ayon|nagpahayag"
38
+ r"|inihayag|iniutos|nagsabi|ipinag-utos)\b",
39
+ re.IGNORECASE,
40
+ )
41
+
42
 
43
  @dataclass
44
  class ClaimResult:
45
  claim: str
46
+ method: str # "sentence_scoring" | "sentence_heuristic"
47
+
48
+
49
+ def _score_sentence(sent: str) -> float:
50
+ """Score a sentence by how likely it is to contain a falsifiable claim."""
51
+ score = 0.0
52
+ if _DATE_OR_NUM.search(sent):
53
+ score += 2.0
54
+ score += min(3.0, len(_VERB_PATTERN.findall(sent)) * 1.0)
55
+ if len(sent) > 30:
56
+ score += 1.0
57
+ return score
58
 
59
 
60
  class ClaimExtractor:
61
  """
62
+ Extracts the single most falsifiable claim from input text using
63
+ sentence scoring. No heavy model required β€” spaCy already loaded
64
+ for NER; this module uses only stdlib regex.
65
 
66
+ The highest-scoring sentence (by date/number + verb density) is
67
+ returned as the claim for downstream NewsAPI evidence retrieval.
 
68
  """
69
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
70
  def extract(self, text: str) -> ClaimResult:
 
 
71
  if not text or len(text.strip()) < 20:
72
  return ClaimResult(claim=text.strip(), method="passthrough")
73
 
74
+ sentences = [s.strip() for s in _SENTENCE_SPLIT.split(text.strip())]
75
+ candidates = [s for s in sentences if len(s) > 15]
76
+
77
+ if not candidates:
78
+ return ClaimResult(claim=text[:200].strip(), method="sentence_heuristic")
79
+
80
+ scored = [(s, _score_sentence(s)) for s in candidates]
81
+ best_sent, best_score = max(scored, key=lambda x: x[1])
82
+
83
+ if best_score > 0:
84
+ return ClaimResult(claim=best_sent, method="sentence_scoring")
85
 
86
+ # All scores zero β€” fall back to first two sentences
87
  return ClaimResult(
88
+ claim=" ".join(candidates[:2]),
89
  method="sentence_heuristic",
90
  )
nlp/ner.py CHANGED
@@ -46,8 +46,9 @@ class NERResult:
46
 
47
  class EntityExtractor:
48
  """
49
- NER using spaCy (en_core_web_sm) + Philippine entity hint layer.
50
- Falls back to regex-based date extraction if spaCy not installed.
 
51
  """
52
 
53
  def __init__(self):
@@ -58,12 +59,17 @@ class EntityExtractor:
58
  if self._loaded:
59
  return
60
  try:
61
- import spacy
62
- self._nlp = spacy.load("en_core_web_sm")
63
- logger.info("spaCy en_core_web_sm loaded")
64
- except Exception as e:
65
- logger.warning("spaCy not available (%s) β€” using hint-based NER", e)
66
- self._nlp = None
 
 
 
 
 
67
  self._loaded = True
68
 
69
  def _hint_based_extract(self, text: str) -> NERResult:
 
46
 
47
  class EntityExtractor:
48
  """
49
+ NER using calamanCy (tl_calamancy_lg) for Tagalog-aware entity extraction.
50
+ Falls back to spaCy en_core_web_sm, then to regex-based hint extraction.
51
+ calamanCy uses the same spaCy doc.ents interface so extract() is unchanged.
52
  """
53
 
54
  def __init__(self):
 
59
  if self._loaded:
60
  return
61
  try:
62
+ import calamancy
63
+ self._nlp = calamancy.load("tl_calamancy_lg")
64
+ logger.info("calamanCy tl_calamancy_lg loaded")
65
+ except Exception:
66
+ try:
67
+ import spacy
68
+ self._nlp = spacy.load("en_core_web_sm")
69
+ logger.info("spaCy en_core_web_sm loaded (calamancy unavailable)")
70
+ except Exception as e:
71
+ logger.warning("spaCy not available (%s) β€” using hint-based NER", e)
72
+ self._nlp = None
73
  self._loaded = True
74
 
75
  def _hint_based_extract(self, text: str) -> NERResult:
nlp/preprocessor.py CHANGED
@@ -57,6 +57,7 @@ class PreprocessResult:
57
  normalized: str
58
  tokens: list[str] = field(default_factory=list)
59
  filtered_tokens: list[str] = field(default_factory=list)
 
60
  char_count: int = 0
61
  word_count: int = 0
62
 
@@ -66,18 +67,62 @@ class TextPreprocessor:
66
  Multi-step text cleaner for Tagalog / English / Taglish content.
67
 
68
  Pipeline:
69
- 1. strip_html β€” remove HTML tags
70
- 2. strip_urls β€” remove hyperlinks
71
- 3. strip_mentions β€” remove @user
72
- 4. strip_hashtags β€” remove #tag text (keep token)
73
- 5. strip_emojis β€” remove Unicode emoji
74
- 6. lowercase β€” normalize case
75
- 7. normalize_chars β€” collapse repeated chars, excessive !??
76
- 8. strip_punct β€” remove punctuation except apostrophe
77
- 9. tokenize β€” split on whitespace
78
- 10. remove_stopwords β€” drop EN + TL stopwords
 
 
 
 
 
 
 
79
  """
80
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
81
  def clean(self, text: str) -> str:
82
  """Steps 1-6: structural cleaning."""
83
  text = _HTML_TAG_PATTERN.sub(" ", text)
@@ -113,12 +158,14 @@ class TextPreprocessor:
113
  normalized = self.normalize(cleaned)
114
  tokens = self.tokenize(normalized)
115
  filtered = self.remove_stopwords(tokens)
 
116
  return PreprocessResult(
117
  original=text,
118
  cleaned=cleaned,
119
  normalized=normalized,
120
  tokens=tokens,
121
  filtered_tokens=filtered,
 
122
  char_count=len(normalized),
123
  word_count=len(tokens),
124
  )
 
57
  normalized: str
58
  tokens: list[str] = field(default_factory=list)
59
  filtered_tokens: list[str] = field(default_factory=list)
60
+ lemmatized_tokens: list[str] = field(default_factory=list)
61
  char_count: int = 0
62
  word_count: int = 0
63
 
 
67
  Multi-step text cleaner for Tagalog / English / Taglish content.
68
 
69
  Pipeline:
70
+ 1. strip_html β€” remove HTML tags
71
+ 2. strip_urls β€” remove hyperlinks
72
+ 3. strip_mentions β€” remove @user
73
+ 4. strip_hashtags β€” remove #tag text (keep token)
74
+ 5. strip_emojis β€” remove Unicode emoji
75
+ 6. lowercase β€” normalize case
76
+ 7. normalize_chars β€” collapse repeated chars, excessive !??
77
+ 8. strip_punct β€” remove punctuation except apostrophe
78
+ 9. tokenize β€” split on whitespace
79
+ 10. remove_stopwords β€” drop EN + TL stopwords
80
+ 11. lemmatize β€” WordNet lemmatization (opt-in, English-biased;
81
+ Tagalog tokens are returned unchanged)
82
+
83
+ Args:
84
+ lemmatize: if True, step 11 is applied and lemmatized_tokens is populated.
85
+ Off by default β€” transformer models handle subword tokenization
86
+ themselves and do not benefit from lemmatization.
87
  """
88
 
89
+ def __init__(self, lemmatize: bool = False):
90
+ self.lemmatize = lemmatize
91
+
92
+ def _lemmatize_tokens(self, tokens: list[str]) -> list[str]:
93
+ """
94
+ POS-aware WordNet lemmatization. Downloads NLTK data on first call.
95
+ Falls back to identity on any error (e.g. missing corpus).
96
+ """
97
+ try:
98
+ import nltk
99
+ from nltk.corpus import wordnet
100
+ from nltk.stem import WordNetLemmatizer
101
+
102
+ for resource, path in [
103
+ ("wordnet", "corpora/wordnet"),
104
+ ("averaged_perceptron_tagger_eng", "taggers/averaged_perceptron_tagger_eng"),
105
+ ]:
106
+ try:
107
+ nltk.data.find(path)
108
+ except LookupError:
109
+ nltk.download(resource, quiet=True)
110
+
111
+ def _wn_pos(tag: str) -> str:
112
+ if tag.startswith("J"):
113
+ return wordnet.ADJ
114
+ if tag.startswith("V"):
115
+ return wordnet.VERB
116
+ if tag.startswith("R"):
117
+ return wordnet.ADV
118
+ return wordnet.NOUN
119
+
120
+ lemmatizer = WordNetLemmatizer()
121
+ tagged = nltk.pos_tag(tokens)
122
+ return [lemmatizer.lemmatize(w, _wn_pos(t)) for w, t in tagged]
123
+ except Exception:
124
+ return tokens
125
+
126
  def clean(self, text: str) -> str:
127
  """Steps 1-6: structural cleaning."""
128
  text = _HTML_TAG_PATTERN.sub(" ", text)
 
158
  normalized = self.normalize(cleaned)
159
  tokens = self.tokenize(normalized)
160
  filtered = self.remove_stopwords(tokens)
161
+ lemmatized = self._lemmatize_tokens(filtered) if self.lemmatize else []
162
  return PreprocessResult(
163
  original=text,
164
  cleaned=cleaned,
165
  normalized=normalized,
166
  tokens=tokens,
167
  filtered_tokens=filtered,
168
+ lemmatized_tokens=lemmatized,
169
  char_count=len(normalized),
170
  word_count=len(tokens),
171
  )
requirements.txt CHANGED
@@ -15,6 +15,7 @@ sentence-transformers==3.3.1
15
  scikit-learn==1.5.2
16
  safetensors>=0.4.3 # Faster, safer model serialisation (used by transformers)
17
  spacy==3.8.2
 
18
  langdetect==1.0.9
19
  nltk==3.9.1
20
 
 
15
  scikit-learn==1.5.2
16
  safetensors>=0.4.3 # Faster, safer model serialisation (used by transformers)
17
  spacy==3.8.2
18
+ calamancy>=0.2.0 # Tagalog NER (calamanCy tl_calamancy_lg)
19
  langdetect==1.0.9
20
  nltk==3.9.1
21
 
scoring/engine.py CHANGED
@@ -81,6 +81,7 @@ async def run_verification(
81
  from nlp.clickbait import ClickbaitDetector
82
  from nlp.claim_extractor import ClaimExtractor
83
  from evidence.news_fetcher import fetch_evidence, compute_similarity
 
84
 
85
  # ── Step 1: Preprocess ────────────────────────────────────────────────────
86
  preprocessor = _get_nlp("preprocessor", TextPreprocessor)
@@ -103,26 +104,41 @@ async def run_verification(
103
  claim_result = claim_extractor.extract(proc.cleaned)
104
 
105
  # ── Step 7: Layer 1 β€” ML Classifier ──────────────────────────────────────
106
- # Try fine-tuned XLM-RoBERTa first; fall back to TF-IDF baseline if the
107
- # checkpoint hasn't been generated yet (ml/train_xlmr.py not yet run).
108
- model_tier = "xlmr" # for observability in logs
 
 
109
  try:
110
  from ml.xlm_roberta_classifier import XLMRobertaClassifier, ModelNotFoundError
111
- classifier = _get_nlp("xlmr_classifier", XLMRobertaClassifier)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
112
  except ModelNotFoundError:
113
  logger.info("XLM-RoBERTa checkpoint not found β€” falling back to TF-IDF baseline")
114
- from ml.tfidf_classifier import TFIDFClassifier
115
- def _make_tfidf():
116
- c = TFIDFClassifier(); c.train(); return c
117
- classifier = _get_nlp("tfidf_classifier", _make_tfidf)
118
- model_tier = "tfidf"
119
  except Exception as exc:
120
  logger.warning("XLM-RoBERTa load failed (%s) β€” falling back to TF-IDF", exc)
 
 
121
  from ml.tfidf_classifier import TFIDFClassifier
122
- def _make_tfidf(): # noqa: F811
123
  c = TFIDFClassifier(); c.train(); return c
124
  classifier = _get_nlp("tfidf_classifier", _make_tfidf)
125
- model_tier = "tfidf"
126
 
127
  l1 = classifier.predict(proc.cleaned)
128
  logger.debug("Layer-1 (%s): %s %.1f%%", model_tier, l1.verdict, l1.confidence)
@@ -137,6 +153,7 @@ async def run_verification(
137
  verdict=Verdict(l1.verdict),
138
  confidence=l1.confidence,
139
  triggered_features=l1.triggered_features,
 
140
  )
141
 
142
  # ── Step 8: Layer 2 β€” Evidence Retrieval ──────────────────────────────────
@@ -170,19 +187,21 @@ async def run_verification(
170
  domain = (art.get("source", {}) or {}).get("name", "unknown").lower()
171
  tier = get_domain_tier(domain)
172
 
173
- # Simple stance heuristic β€” negative title keywords β†’ Refutes
174
- title_lower = (art.get("title") or "").lower()
175
- stance = Stance.NOT_ENOUGH_INFO
176
- if any(w in title_lower for w in ["false", "fake", "hoax", "wrong", "debunked", "fact check"]):
177
- stance = Stance.REFUTES
178
- elif sim > 0.6:
179
- stance = Stance.SUPPORTS
 
180
 
181
  evidence_sources.append(EvidenceSource(
182
  title=art.get("title", ""),
183
  url=art.get("url", ""),
184
  similarity=sim,
185
  stance=stance,
 
186
  domain_tier=tier or DomainTier.SUSPICIOUS,
187
  published_at=art.get("publishedAt"),
188
  source_name=art.get("source", {}).get("name"),
@@ -208,6 +227,7 @@ async def run_verification(
208
  evidence_score=round(evidence_score, 1),
209
  sources=evidence_sources,
210
  claim_used=claim_result.claim,
 
211
  )
212
 
213
  # ── Step 9: Final Score ───────────────────────────────────────────────────
 
81
  from nlp.clickbait import ClickbaitDetector
82
  from nlp.claim_extractor import ClaimExtractor
83
  from evidence.news_fetcher import fetch_evidence, compute_similarity
84
+ from evidence.stance_detector import detect_stance as _detect_stance
85
 
86
  # ── Step 1: Preprocess ────────────────────────────────────────────────────
87
  preprocessor = _get_nlp("preprocessor", TextPreprocessor)
 
104
  claim_result = claim_extractor.extract(proc.cleaned)
105
 
106
  # ── Step 7: Layer 1 β€” ML Classifier ──────────────────────────────────────
107
+ # Priority: Ensemble (XLM-R + Tagalog-RoBERTa) β†’ XLM-R alone β†’ TF-IDF.
108
+ # Tagalog-RoBERTa requires its own fine-tuned checkpoint; if missing the
109
+ # engine silently falls back to XLM-R only without breaking anything.
110
+ model_tier = "tfidf"
111
+ classifier = None
112
  try:
113
  from ml.xlm_roberta_classifier import XLMRobertaClassifier, ModelNotFoundError
114
+ from ml.tagalog_roberta_classifier import TagalogRobertaClassifier
115
+ from ml.ensemble_classifier import EnsembleClassifier
116
+
117
+ xlmr = _get_nlp("xlmr_classifier", XLMRobertaClassifier)
118
+ members = [xlmr]
119
+ model_tier = "xlmr"
120
+
121
+ try:
122
+ tl = _get_nlp("tagalog_classifier", TagalogRobertaClassifier)
123
+ members.append(tl)
124
+ model_tier = "ensemble"
125
+ except ModelNotFoundError:
126
+ logger.info("Tagalog-RoBERTa checkpoint not found β€” using XLM-R only")
127
+ except Exception as exc:
128
+ logger.warning("Tagalog-RoBERTa load failed (%s) β€” using XLM-R only", exc)
129
+
130
+ classifier = EnsembleClassifier(members)
131
+
132
  except ModelNotFoundError:
133
  logger.info("XLM-RoBERTa checkpoint not found β€” falling back to TF-IDF baseline")
 
 
 
 
 
134
  except Exception as exc:
135
  logger.warning("XLM-RoBERTa load failed (%s) β€” falling back to TF-IDF", exc)
136
+
137
+ if classifier is None:
138
  from ml.tfidf_classifier import TFIDFClassifier
139
+ def _make_tfidf():
140
  c = TFIDFClassifier(); c.train(); return c
141
  classifier = _get_nlp("tfidf_classifier", _make_tfidf)
 
142
 
143
  l1 = classifier.predict(proc.cleaned)
144
  logger.debug("Layer-1 (%s): %s %.1f%%", model_tier, l1.verdict, l1.confidence)
 
153
  verdict=Verdict(l1.verdict),
154
  confidence=l1.confidence,
155
  triggered_features=l1.triggered_features,
156
+ model_tier=model_tier,
157
  )
158
 
159
  # ── Step 8: Layer 2 β€” Evidence Retrieval ──────────────────────────────────
 
187
  domain = (art.get("source", {}) or {}).get("name", "unknown").lower()
188
  tier = get_domain_tier(domain)
189
 
190
+ stance_result = _detect_stance(
191
+ claim=claim_result.claim,
192
+ article_title=art.get("title", ""),
193
+ article_description=art.get("description", "") or "",
194
+ article_url=art.get("url", ""),
195
+ similarity=sim,
196
+ )
197
+ stance = Stance(stance_result.stance.value)
198
 
199
  evidence_sources.append(EvidenceSource(
200
  title=art.get("title", ""),
201
  url=art.get("url", ""),
202
  similarity=sim,
203
  stance=stance,
204
+ stance_reason=stance_result.reason,
205
  domain_tier=tier or DomainTier.SUSPICIOUS,
206
  published_at=art.get("publishedAt"),
207
  source_name=art.get("source", {}).get("name"),
 
227
  evidence_score=round(evidence_score, 1),
228
  sources=evidence_sources,
229
  claim_used=claim_result.claim,
230
+ claim_method=claim_result.method,
231
  )
232
 
233
  # ── Step 9: Final Score ───────────────────────────────────────────────────
tests/test_improvements.py ADDED
@@ -0,0 +1,409 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """
2
+ Tests for the 6 NLP pipeline improvements:
3
+ 1. calamanCy NER fallback chain
4
+ 2. Tagalog-RoBERTa classifier (ModelNotFoundError)
5
+ 3. EnsembleClassifier
6
+ 4. EDA augmentation
7
+ 5. Sentence-scoring ClaimExtractor
8
+ 6. NLI stance detection (Rule 1.5)
9
+ """
10
+ import sys
11
+ from pathlib import Path
12
+ from unittest.mock import patch, MagicMock
13
+
14
+ import pytest
15
+
16
+ # Ensure project root is on path
17
+ sys.path.insert(0, str(Path(__file__).parent.parent))
18
+
19
+
20
+ # ── Helpers ───────────────────────────────────────────────────────────────────
21
+
22
def _make_sample(text: str, label: int = 0):
    """Convenience factory for an ml.dataset.Sample (import deferred to call time)."""
    from ml.dataset import Sample
    return Sample(text=text, label=label)
25
+
26
+
27
+ # ══════════════════════════════════════════════════════════════════════════════
28
+ # Part 1 β€” EDA Augmentation
29
+ # ══════════════════════════════════════════════════════════════════════════════
30
+
31
class TestEDAugmentation:
    """Behavioral checks for EDA-style augmentation (ml.dataset.augment_samples)."""

    def test_empty_input_returns_empty(self):
        # No samples in β†’ no variants out.
        from ml.dataset import augment_samples
        assert augment_samples([]) == []

    def test_augment_produces_two_variants_per_sample(self):
        from ml.dataset import augment_samples
        samples = [_make_sample("DOH confirms 500 new COVID cases today", 0)]
        aug = augment_samples(samples, seed=42)
        # One deletion + one swap variant per sample
        assert len(aug) == 2

    def test_augmented_labels_match_originals(self):
        # Augmentation must never invent a label outside the input set.
        from ml.dataset import augment_samples
        samples = [
            _make_sample("Senate passes new bill on health care reform", 0),
            _make_sample("SHOCKING truth about vaccines hidden by government", 2),
        ]
        aug = augment_samples(samples, seed=42)
        orig_labels = {s.label for s in samples}
        for a in aug:
            assert a.label in orig_labels

    def test_short_samples_skipped(self):
        # Samples with too few words yield no augmented variants at all.
        from ml.dataset import augment_samples
        samples = [
            _make_sample("ok", 1),  # 1 word β€” too short
            _make_sample("fake news", 2),  # 2 words β€” too short
        ]
        aug = augment_samples(samples, seed=42)
        assert aug == []

    def test_augmented_texts_differ_from_original(self):
        from ml.dataset import augment_samples
        original = "GRABE sinabi ng DOH na 200 bata ang nagkasakit sa bagong virus"
        samples = [_make_sample(original, 2)]
        aug = augment_samples(samples, seed=99)
        # At least one variant should differ
        assert any(a.text != original for a in aug)

    def test_augment_triples_training_set_size(self):
        # With up to 2 variants each, augmented count is bounded by [1x, 2x].
        from ml.dataset import get_split, augment_samples
        train, _ = get_split()
        aug = augment_samples(train, seed=42)
        # aug should be at most 2Γ— train size (some short samples may be skipped)
        assert len(aug) >= len(train)
        assert len(aug) <= 2 * len(train)

    def test_augmented_samples_are_non_empty(self):
        # Deletion-based augmentation must never produce an empty text.
        from ml.dataset import augment_samples
        samples = [_make_sample("The senator confirmed signing the new law today", 0)]
        aug = augment_samples(samples, seed=42)
        for a in aug:
            assert len(a.text.strip()) > 0
85
+
86
+
87
+ # ══════════════════════════════════════════════════════════════════════════════
88
+ # Part 2 β€” Sentence-scoring ClaimExtractor
89
+ # ══════════════════════════════════════════════════════════════════════════════
90
+
91
class TestClaimExtractor:
    """Sentence-scoring ClaimExtractor: method selection and result shape."""

    def test_instantiates_without_loading_model(self):
        """New ClaimExtractor has no lazy model loading at all."""
        from nlp.claim_extractor import ClaimExtractor
        extractor = ClaimExtractor()
        # Neither the pipeline handle nor the loaded flag should exist.
        assert not hasattr(extractor, '_pipe')
        assert not hasattr(extractor, '_loaded')

    def test_passthrough_for_short_text(self):
        from nlp.claim_extractor import ClaimExtractor
        outcome = ClaimExtractor().extract("hi")
        assert (outcome.method, outcome.claim) == ("passthrough", "hi")

    def test_sentence_scoring_method_on_informative_sentence(self):
        from nlp.claim_extractor import ClaimExtractor
        # Date + verb + named org — this sentence should score highest.
        text = "GRABE! Sinabi ng DOH noong Martes na 200 bata ang nagkasakit sa bagong virus sa Maynila."
        outcome = ClaimExtractor().extract(text)
        assert outcome.method == "sentence_scoring"
        # The informative sentence is picked, not the whole text or "GRABE!".
        assert ("DOH" in outcome.claim) or ("200" in outcome.claim)

    def test_heuristic_fallback_when_no_scored_sentences(self):
        from nlp.claim_extractor import ClaimExtractor
        # No dates, no numbers, no verbs anywhere in this text.
        outcome = ClaimExtractor().extract(
            "Wow amazing incredible unbelievable spectacular incomprehensible."
        )
        assert outcome.method in ("sentence_heuristic", "sentence_scoring")

    def test_returns_claim_result_dataclass(self):
        from nlp.claim_extractor import ClaimExtractor, ClaimResult
        outcome = ClaimExtractor().extract("The president signed the new healthcare law today.")
        assert isinstance(outcome, ClaimResult)
        assert isinstance(outcome.claim, str)
        assert isinstance(outcome.method, str)

    def test_picks_specific_sentence_over_clickbait_opener(self):
        from nlp.claim_extractor import ClaimExtractor
        text = "OMG! Natuklasan ng mga siyentipiko na 5,000 tao ang namatay dahil sa bagong sakit ngayong Enero."
        outcome = ClaimExtractor().extract(text)
        # The specific claim (5,000 deaths) should beat the "OMG!" opener.
        assert (
            "5,000" in outcome.claim
            or "siyentipiko" in outcome.claim
            or outcome.method == "sentence_scoring"
        )
135
+
136
+
137
+ # ══════════════════════════════════════════════════════════════════════════════
138
+ # Part 3 β€” TagalogRobertaClassifier
139
+ # ══════════════════════════════════════════════════════════════════════════════
140
+
141
class TestTagalogRobertaClassifier:
    """Checkpoint discovery and the shared ModelNotFoundError contract."""

    def test_raises_model_not_found_when_checkpoint_missing(self, tmp_path, monkeypatch):
        """ModelNotFoundError raised when checkpoint directory doesn't exist."""
        import ml.tagalog_roberta_classifier as mod
        missing_dir = tmp_path / "nonexistent_model"
        monkeypatch.setattr(mod, "MODEL_DIR", missing_dir)
        with pytest.raises(mod.ModelNotFoundError):
            mod.TagalogRobertaClassifier()

    def test_model_not_found_is_subclass_of_file_not_found(self):
        from ml.xlm_roberta_classifier import ModelNotFoundError
        assert issubclass(ModelNotFoundError, FileNotFoundError)

    def test_shares_same_model_not_found_error(self):
        """Engine catches ModelNotFoundError from xlm_roberta_classifier —
        the tagalog module re-uses the identical class object, so one
        except clause covers both."""
        from ml.tagalog_roberta_classifier import ModelNotFoundError as tagalog_error
        from ml.xlm_roberta_classifier import ModelNotFoundError as xlm_error
        assert xlm_error is tagalog_error
159
+
160
+
161
+ # ══════════════════════════════════════════════════════════════════════════════
162
+ # Part 4 β€” EnsembleClassifier
163
+ # ══════════════════════════════════════════════════════════════════════════════
164
+
165
class TestEnsembleClassifier:
    """Probability averaging, graceful degradation, and result typing.

    Fix: removed the unused ``import torch`` statements from four test
    methods — only ``_make_stub`` builds tensors, so only it needs torch.
    """

    def _make_stub(self, probs_list: list[float]):
        """Return a stub classifier whose predict_probs returns fixed probabilities."""
        import torch
        stub = MagicMock()
        stub.predict_probs.return_value = (
            torch.tensor(probs_list, dtype=torch.float32),
            None,
            None,
        )
        stub._salient_tokens = MagicMock(return_value=["token1"])
        return stub

    def test_raises_value_error_for_empty_list(self):
        from ml.ensemble_classifier import EnsembleClassifier
        with pytest.raises(ValueError):
            EnsembleClassifier([])

    def test_single_classifier_returns_its_prediction(self):
        from ml.ensemble_classifier import EnsembleClassifier
        stub = self._make_stub([0.7, 0.2, 0.1])
        ens = EnsembleClassifier([stub])
        result = ens.predict("any text")
        assert result.verdict == "Credible"
        assert abs(result.confidence - 70.0) < 1.0

    def test_two_classifiers_averages_probabilities(self):
        from ml.ensemble_classifier import EnsembleClassifier
        # First: [0.8, 0.1, 0.1] → Credible 80%
        # Second: [0.4, 0.5, 0.1] → Unverified 50%
        # Average: [0.6, 0.3, 0.1] → Credible 60%
        stub1 = self._make_stub([0.8, 0.1, 0.1])
        stub2 = self._make_stub([0.4, 0.5, 0.1])
        ens = EnsembleClassifier([stub1, stub2])
        result = ens.predict("test text")
        assert result.verdict == "Credible"
        assert abs(result.confidence - 60.0) < 1.5

    def test_failing_classifier_gracefully_skipped(self):
        from ml.ensemble_classifier import EnsembleClassifier
        good = self._make_stub([0.1, 0.1, 0.8])  # Likely Fake
        bad = MagicMock()
        bad.predict_probs.side_effect = RuntimeError("model failed")
        ens = EnsembleClassifier([good, bad])
        result = ens.predict("test text")
        # Should still get a result from the good classifier
        assert result.verdict == "Likely Fake"

    def test_all_classifiers_failing_returns_unverified_neutral(self):
        from ml.ensemble_classifier import EnsembleClassifier
        bad = MagicMock()
        bad.predict_probs.side_effect = RuntimeError("fail")
        ens = EnsembleClassifier([bad])
        result = ens.predict("test")
        assert result.verdict == "Unverified"
        assert result.confidence == 33.3

    def test_result_has_correct_type(self):
        from ml.ensemble_classifier import EnsembleClassifier
        from ml.xlm_roberta_classifier import Layer1Result
        stub = self._make_stub([0.5, 0.3, 0.2])
        ens = EnsembleClassifier([stub])
        result = ens.predict("test")
        assert isinstance(result, Layer1Result)
        assert isinstance(result.triggered_features, list)
234
+
235
+
236
+ # ══════════════════════════════════════════════════════════════════════════════
237
+ # Part 5 β€” NLI Stance Detection
238
+ # ══════════════════════════════════════════════════════════════════════════════
239
+
240
class TestNLIStanceDetector:
    """NLI zero-shot stance detection with keyword-rule fallback."""

    def _reset_nli_cache(self):
        """Clear the module-level NLI singleton so each test starts cold."""
        import evidence.stance_detector as mod
        mod._nli_pipe = None
        mod._nli_loaded = False

    def test_falls_through_to_keywords_when_nli_unavailable(self):
        """When NLI model can't be loaded, keyword rules still work."""
        import evidence.stance_detector as mod
        from evidence.stance_detector import Stance
        self._reset_nli_cache()
        with patch.object(mod, '_get_nli', return_value=None):
            outcome = mod.detect_stance(
                claim="Vaccines are safe",
                article_title="Fact check: COVID vaccines proven effective",
                article_description="Experts confirm vaccines are safe and effective after extensive testing.",
                article_url="",
                similarity=0.7,
            )
        # Must not crash; any of the three stances is acceptable here.
        assert outcome.stance in (Stance.SUPPORTS, Stance.NOT_ENOUGH_INFO, Stance.REFUTES)

    def test_nli_supports_high_confidence(self):
        """When NLI returns 'supports' at ≥0.65, stance is SUPPORTS with NLI reason."""
        import evidence.stance_detector as mod
        from evidence.stance_detector import Stance
        self._reset_nli_cache()
        nli_stub = MagicMock()
        nli_stub.return_value = {
            "labels": ["supports the claim", "contradicts the claim", "unrelated"],
            "scores": [0.82, 0.12, 0.06],
        }
        with patch.object(mod, '_get_nli', return_value=nli_stub):
            outcome = mod.detect_stance(
                claim="Government confirmed 500 new cases",
                article_title="Government says 500 new cases recorded",
                article_description="Officials confirmed today that 500 new cases were recorded nationwide.",
                similarity=0.75,
            )
        assert outcome.stance == Stance.SUPPORTS
        assert "NLI" in outcome.reason

    def test_nli_contradicts_high_confidence(self):
        """When NLI returns 'contradicts' at ≥0.65, stance is REFUTES with NLI reason."""
        import evidence.stance_detector as mod
        from evidence.stance_detector import Stance
        self._reset_nli_cache()
        nli_stub = MagicMock()
        nli_stub.return_value = {
            "labels": ["contradicts the claim", "supports the claim", "unrelated"],
            "scores": [0.78, 0.15, 0.07],
        }
        with patch.object(mod, '_get_nli', return_value=nli_stub):
            outcome = mod.detect_stance(
                claim="There is no evidence of fraud",
                article_title="Evidence of widespread fraud found",
                article_description="Investigators found extensive evidence of fraud in the election.",
                similarity=0.6,
            )
        assert outcome.stance == Stance.REFUTES
        assert "NLI" in outcome.reason

    def test_nli_low_confidence_falls_through_to_keywords(self):
        """NLI confidence < 0.65 — should fall through and use keyword rules."""
        import evidence.stance_detector as mod
        from evidence.stance_detector import Stance
        self._reset_nli_cache()
        nli_stub = MagicMock()
        nli_stub.return_value = {
            "labels": ["supports the claim", "contradicts the claim", "unrelated"],
            "scores": [0.45, 0.35, 0.20],  # below 0.65 threshold
        }
        with patch.object(mod, '_get_nli', return_value=nli_stub):
            outcome = mod.detect_stance(
                claim="Senator is guilty of corruption",
                article_title="Fact check: False claim about senator",
                article_description="This claim has been debunked by multiple fact-checkers.",
                similarity=0.5,
            )
        # Keyword "debunked" should trigger REFUTES.
        assert outcome.stance == Stance.REFUTES

    def test_short_description_skips_nli(self):
        """Article description shorter than 30 chars → NLI skipped, no error."""
        import evidence.stance_detector as mod
        self._reset_nli_cache()
        nli_stub = MagicMock()
        with patch.object(mod, '_get_nli', return_value=nli_stub):
            mod.detect_stance(
                claim="Some claim",
                article_title="Short article",
                article_description="Short.",  # <30 chars
                similarity=0.5,
            )
        # The NLI pipeline must never have been invoked.
        nli_stub.assert_not_called()
338
+
339
+
340
+ # ══════════════════════════════════════════════════════════════════════════════
341
+ # Part 6 β€” calamanCy NER Fallback Chain
342
+ # ══════════════════════════════════════════════════════════════════════════════
343
+
344
class TestCalamanCyNERFallback:
    """calamanCy → spaCy → hint-based NER fallback chain.

    Fix: removed the dead assignment ``original_load =
    extractor._load_model.__func__`` in the spaCy-fallback test — the
    variable was never used.
    """

    def _fresh_extractor(self):
        """Return a fresh (unloaded) EntityExtractor via module reload."""
        import importlib
        import nlp.ner
        importlib.reload(nlp.ner)
        return nlp.ner.EntityExtractor()

    def test_falls_back_to_spacy_when_calamancy_missing(self, monkeypatch):
        """When calamancy import fails, _nlp is set via spaCy en_core_web_sm."""
        # NOTE(review): the monkeypatch fixture is currently unused here;
        # kept for signature stability.
        import types

        import nlp.ner as mod
        extractor = mod.EntityExtractor()
        extractor._loaded = False  # force reload

        # Simulate calamancy not installed: the replacement loader raises the
        # ImportError itself, then walks the same spaCy fallback path.
        def patched_load(self):
            self._loaded = True
            try:
                raise ImportError("No module named 'calamancy'")
            except ImportError:
                try:
                    import spacy
                    self._nlp = spacy.load("en_core_web_sm")
                except Exception:
                    self._nlp = None

        extractor._load_model = types.MethodType(patched_load, extractor)
        extractor._load_model()
        # Either spaCy loaded successfully or fell back to None.
        assert extractor._loaded is True

    def test_hint_based_fallback_when_both_unavailable(self):
        """When both calamancy and spaCy fail, hint-based NER still works."""
        import nlp.ner as mod
        extractor = mod.EntityExtractor()
        extractor._loaded = True
        extractor._nlp = None  # force hint-based path

        result = extractor.extract("Sinabi ni Marcos sa Davao tungkol sa DOH")
        assert isinstance(result.persons, list)
        assert isinstance(result.organizations, list)
        assert isinstance(result.locations, list)
        # Should find hint-based entities
        assert any("Marcos" in p for p in result.persons)

    def test_ner_result_method_reflects_path(self):
        """method field on NERResult reflects which extraction path was used."""
        import nlp.ner as mod
        extractor = mod.EntityExtractor()
        extractor._loaded = True
        extractor._nlp = None

        result = extractor._hint_based_extract("Marcos is in Manila with DOH")
        assert result.method == "hints"

    def test_extract_with_no_model_returns_ner_result(self):
        from nlp.ner import EntityExtractor, NERResult
        e = EntityExtractor()
        e._loaded = True
        e._nlp = None
        result = e.extract("DOH confirmed 500 cases in Cebu on January 2026")
        assert isinstance(result, NERResult)
        assert len(result.dates) > 0  # Should find "January 2026"