FINAL PROFESSIONALIZATION: Synchronized with GitHub sovereign standards.

05a5750 verified 25 days ago

6.09 kB

	import json
	from pathlib import Path
	from typing import Any, Dict, List

	from pydantic import BaseModel

	from core.mcp_protocol import mcp_call


	class AuditResolution(BaseModel):
	verdict: str
	risk_score: float
	reasoning_steps: List[str]
	mcp_trace: str
	warning: str = ""


	class LogicAuditor:
	"""
	Evidence-weighted logic auditor for credential review.

	The auditor treats registry matches as supporting evidence only. It does not
	approve a credential solely because an institution exists in ROR or because a
	file name contains a trusted-looking keyword.
	"""

	def __init__(self, blacklist_path: str = "data/fraud_blacklist.json"):
	self.blacklist_path = Path(blacklist_path)

	@staticmethod
	def _normalize(value: str) -> str:
	return " ".join(value.lower().replace("&", "and").split())

	def _load_blacklist_names(self) -> set[str]:
	names: set[str] = set()
	try:
	with self.blacklist_path.open("r", encoding="utf-8") as f:
	blacklist_data = json.load(f)
	except (OSError, json.JSONDecodeError):
	return names

	for entry in blacklist_data.get("blacklist", []):
	if entry.get("name"):
	names.add(self._normalize(entry["name"]))
	for alias in entry.get("aliases", []):
	names.add(self._normalize(alias))
	return names

	async def audit(self, transcript: Dict[str, Any], profile: Dict[str, Any]) -> AuditResolution:
	print("[LOGIC] [Logic-Auditor] Initializing evidence-weighted review...")
	call = mcp_call("mcp_logic_audit", {"transcript_id": "...", "context_level": "deep"})

	reasoning_steps: List[str] = []
	anomalies: List[tuple[str, float]] = []
	warnings: List[str] = []

	inst_name = self._normalize(profile.get("name", ""))
	blacklist_names = self._load_blacklist_names()
	is_diploma_mill = profile.get("is_diploma_mill", False) or inst_name in blacklist_names
	profile_status = profile.get("status", "unknown")

	reasoning_steps.append("Step 0: Checking known diploma-mill and degree-factory indicators.")
	if is_diploma_mill or profile_status == "fraudulent":
	warning_msg = profile.get("warning") or "DIPLOMA MILL / DEGREE FACTORY DETECTED -- credentials from this institution require hard rejection."
	return AuditResolution(
	verdict="REJECTED — DIPLOMA MILL / DEGREE FACTORY",
	risk_score=100.0,
	reasoning_steps=[
	*reasoning_steps,
	f"Result 0: HARD REJECTION. '{profile.get('name', 'Unknown')}' is flagged by the fraud registry.",
	"No approval is issued because the issuing entity is disqualified.",
	],
	mcp_trace=call.trace_id,
	warning=warning_msg,
	)
	reasoning_steps.append("Result 0: No exact blacklist or alias match found.")

	reasoning_steps.append("Step 1: Mapping graduation window against institutional lifecycle.")
	grad_year = int(transcript.get("graduation_year") or 0)
	est_year = profile.get("established_year")
	if grad_year > 0 and est_year and grad_year < int(est_year):
	anomalies.append(("CRITICAL: Graduation predates the institution founding year.", 55.0))
	reasoning_steps.append("Result 1: Temporal violation found.")
	elif est_year:
	reasoning_steps.append("Result 1: Timeline is internally consistent.")
	else:
	warnings.append("Founding year unavailable; temporal validation is incomplete.")
	reasoning_steps.append("Result 1: Founding year unavailable; timeline needs review.")

	reasoning_steps.append("Step 2: Evaluating registry evidence without granting automatic approval.")
	has_ror_id = bool(profile.get("ror_id"))
	source = profile.get("source", "none")
	match_confidence = float(profile.get("match_confidence") or 0.0)
	if has_ror_id and profile_status == "active":
	reasoning_steps.append("Result 2: Active ROR presence found as supporting institution-existence evidence.")
	elif has_ror_id:
	anomalies.append((f"WARNING: ROR status is '{profile_status}', not active.", 30.0))
	reasoning_steps.append("Result 2: Registry presence found, but status requires review.")
	else:
	anomalies.append(("WARNING: No verified registry identifier was resolved.", 35.0))
	reasoning_steps.append("Result 2: No ROR identifier available.")

	if source in {"ror", "local_index"} and 0 < match_confidence < 0.80:
	anomalies.append(("WARNING: Institution match confidence is below the production threshold.", 25.0))
	reasoning_steps.append("Result 2b: Match confidence is low and should be manually reviewed.")

	reasoning_steps.append("Step 3: Checking credential-authenticity evidence.")
	if not transcript.get("credential_id") and not transcript.get("signature_verified"):
	anomalies.append(("WARNING: No credential ID or cryptographic issuer signature was verified.", 35.0))
	reasoning_steps.append("Result 3: Credential authenticity remains unproven.")
	else:
	reasoning_steps.append("Result 3: Credential-level evidence is present.")

	risk_score = min(100.0, sum(weight for _, weight in anomalies))
	if risk_score >= 85:
	verdict = "REJECTED"
	elif risk_score > 0 or warnings:
	verdict = "NEEDS_REVIEW"
	else:
	verdict = "APPROVED"

	return AuditResolution(
	verdict=verdict,
	risk_score=risk_score,
	reasoning_steps=[reasoning_steps, [item for item, _ in anomalies], *warnings],
	mcp_trace=call.trace_id,
	warning="; ".join(warnings),
	)