kofdai
/

nullai-knowledge-system

+from datetime import datetime
+import re
+import logging
+logger = logging.getLogger(__name__)
+# ドメイン別の危険な主張を検出するためのパターン
+DOMAIN_DANGEROUS_PATTERNS = {
+    "medical": [
+        (r"(必ず|絶対に|確実に).*(治る|完治|治癒)", "absolute_cure_claim", "critical"),
+        (r"(副作用|リスク).*(ない|ありません|存在しない)", "no_side_effects_claim", "critical"),
+        (r"(すべての|全ての|あらゆる)患者に(有効|効果的)", "universal_effectiveness", "high"),
+        (r"(西洋|現代)医学.*(不要|いらない|無意味)", "anti_medicine_claim", "critical"),
+        (r"(自己判断|自分で).*治療", "self_treatment_encouragement", "moderate"),
+        (r"医師.*(相談|受診).*(不要|いらない|必要ない)", "avoid_doctor_claim", "critical"),
+    ],
+    "legal": [
+        (r"(必ず|絶対に|確実に).*(勝訴|勝てる|認められる)", "absolute_outcome_claim", "critical"),
+        (r"弁護士.*(不要|いらない|必要ない)", "avoid_lawyer_claim", "critical"),
+        (r"(すべての|全ての)ケースで", "universal_applicability", "high"),
+        (r"(違法|犯罪).*(ではない|にならない).*絶対", "absolute_legality_claim", "critical"),
+        (r"(時効|期限).*(気にしなくて|無視して)", "ignore_deadlines", "critical"),
+        (r"(判例|法律).*無視", "ignore_precedent", "high"),
+    ],
+    "economics": [
+        (r"(必ず|絶対に|確実に).*(儲かる|利益|リターン)", "guaranteed_profit_claim", "critical"),
+        (r"リスク.*(ない|ゼロ|存在しない)", "no_risk_claim", "critical"),
+        (r"(すべての|全ての)投資家に", "universal_advice", "high"),
+        (r"(買う|売る)べき.*絶対", "absolute_trading_advice", "critical"),
+        (r"市場.*予測.*確実", "certain_market_prediction", "high"),
+        (r"(暴落|暴騰).*(ない|しない).*絶対", "absolute_market_stability", "high"),
+    ]
+}
+# 後方互換性のため
+DANGEROUS_CLAIM_PATTERNS = DOMAIN_DANGEROUS_PATTERNS["medical"]
+# 医学的数値の妥当性範囲
+MEDICAL_VALUE_RANGES = {
+    "血圧": {"systolic": (60, 250), "diastolic": (40, 150)},
+    "体温": {"min": 35.0, "max": 42.0},
+    "心拍数": {"min": 30, "max": 220},
+    "SpO2": {"min": 70, "max": 100},
+    "血糖値": {"min": 20, "max": 600},
+}
+# 法学ドメインの検証パターン
+LEGAL_VALIDATION_PATTERNS = {
+    "disclaimer_required": r"(免責|情報提供|法的助言ではありません)",
+    "statute_citation": r"(第\d+条|条文|法律)",
+    "precedent_citation": r"(判例|最判|最決|高判)",
+}
+# 経済学ドメインの検証パターン
+ECONOMICS_VALIDATION_PATTERNS = {
+    "data_source_required": r"(統計|データ|出典|IMF|日銀|内閣府)",
+    "uncertainty_disclosure": r"(予測|推計|不確実|シナリオ)",
+    "disclaimer_required": r"(投資助言ではありません|自己責任)",
+}
+class BetaLobeAdvanced:
+    """
+    検証院（β-Lobe）の高度な機能。
+    論理的妥当性、医学的文脈の検証、ハルシネーション検出を実装。
+    """
+    def __init__(self, db_interface, medical_ontology):
+        self.db = db_interface
+        self.ontology = medical_ontology
+    # --- 基本的なAnchor事実チェック ---
+    def _is_mentioned(self, fact: str, response: str) -> bool:
+        """事実がレスポンスに言及されているか確認"""
+        fact_keywords = [word for word in fact.split() if len(word) > 1]
+        if not fact_keywords:
+            return False
+        mentioned_count = sum(1 for kw in fact_keywords if kw in response)
+        return (mentioned_count / len(fact_keywords)) > 0.5
+    def _detect_numerical_contradiction(self, fact: str, response: str) -> bool:
+        """数値の矛盾を検出"""
+        fact_numbers = re.findall(r'[-+]?\d*\.\d+|\d+', fact)
+        if not fact_numbers:
+            return False
+        fact_value = float(fact_numbers[0])
+        response_numbers = re.findall(r'[-+]?\d*\.\d+|\d+', response)
+        if not response_numbers:
+            return True
+        # 10%以上の乖離で矛盾とみなす
+        is_far = all(abs(float(res_val) - fact_value) / max(fact_value, 0.001) > 0.1 for res_val in response_numbers)
+        return is_far
+    async def check_anchor_facts(self, response_text: str, db_context: dict) -> dict:
+        """DBの知識タイルと回答の整合性を検証"""
+        contradictions = []
+        for coord, tile in db_context.items():
+            if not tile:
+                continue
+            # タイルから主要な事実を抽出
+            anchor_facts = self._extract_anchor_facts(tile)
+            for fact in anchor_facts:
+                # 事実が言及されているか確認
+                if self._is_mentioned(fact["statement"], response_text):
+                    # 数値の矛盾をチェック
+                    if fact.get("has_numbers") and self._detect_numerical_contradiction(fact["statement"], response_text):
+                        contradictions.append({
+                            "type": "numerical_contradiction",
+                            "fact": fact["statement"],
+                            "source": coord,
+                            "severity": "high"
+                        })
+        return {
+            "contradictions": contradictions,
+            "contradiction_count": len(contradictions),
+            "passed": len(contradictions) == 0
+        }
+    def _extract_anchor_facts(self, tile: dict) -> list:
+        """タイルから検証用の事実を抽出"""
+        facts = []
+        content = tile.get("content", "") or tile.get("data", "")
+        if isinstance(content, str):
+            # 箇条書きや重要な記述を抽出
+            lines = content.split("\n")
+            for line in lines:
+                line = line.strip()
+                if len(line) > 10 and any(marker in line for marker in ["は", "である", "です", "："]):
+                    has_numbers = bool(re.search(r'\d+', line))
+                    facts.append({
+                        "statement": line[:200],  # 最大200文字
+                        "has_numbers": has_numbers
+                    })
+                    if len(facts) >= 5:  # 最大5つの事実
+                        break
+        return facts
+    # --- 危険な主張の検出（ドメイン対応） ---
+    def _detect_dangerous_claims(self, response: str, domain: str = "medical") -> list:
+        """ドメイン別の危険な主張を検出"""
+        issues = []
+        patterns = DOMAIN_DANGEROUS_PATTERNS.get(domain, DOMAIN_DANGEROUS_PATTERNS["medical"])
+        for pattern, claim_type, severity in patterns:
+            match = re.search(pattern, response)
+            if match:
+                issues.append({
+                    "type": "dangerous_claim",
+                    "domain": domain,
+                    "claim_type": claim_type,
+                    "matched_text": match.group(0),
+                    "severity": severity,
+                    "message": f"危険な主張を検出 [{domain}]: {claim_type}"
+                })
+        return issues
+    # --- ドメイン固有の検証 ---
+    def _validate_legal_response(self, response: str) -> list:
+        """法学ドメイン固有の検証"""
+        issues = []
+        # 免責事項の確認
+        if not re.search(LEGAL_VALIDATION_PATTERNS["disclaimer_required"], response):
+            issues.append({
+                "type": "missing_disclaimer",
+                "domain": "legal",
+                "severity": "high",
+                "message": "法的免責事項が欠落しています"
+            })
+        # 条文引用の確認（法律質問の場合）
+        # ここでは警告レベルにとどめる
+        if not re.search(LEGAL_VALIDATION_PATTERNS["statute_citation"], response):
+            issues.append({
+                "type": "missing_citation",
+                "domain": "legal",
+                "severity": "moderate",
+                "message": "条文への参照がありません"
+            })
+        return issues
+    def _validate_economics_response(self, response: str) -> list:
+        """経済学ドメイン固有の検証"""
+        issues = []
+        # データ出典の確認
+        if not re.search(ECONOMICS_VALIDATION_PATTERNS["data_source_required"], response):
+            issues.append({
+                "type": "missing_data_source",
+                "domain": "economics",
+                "severity": "moderate",
+                "message": "データ出典への参照がありません"
+            })
+        # 予測の場合の不確実性開示
+        if "予測" in response or "見通し" in response:
+            if not re.search(ECONOMICS_VALIDATION_PATTERNS["uncertainty_disclosure"], response):
+                issues.append({
+                    "type": "missing_uncertainty_disclosure",
+                    "domain": "economics",
+                    "severity": "high",
+                    "message": "予測の不確実性が明示されていません"
+                })
+        return issues
+    # --- 医学的数値の妥当性検証 ---
+    def _validate_medical_values(self, response: str) -> list:
+        """医学的数値が妥当な範囲内か検証"""
+        issues = []
+        # 血圧の検出と検証
+        bp_pattern = r'(\d{2,3})/(\d{2,3})\s*(?:mmHg)?'
+        bp_matches = re.findall(bp_pattern, response)
+        for systolic, diastolic in bp_matches:
+            s, d = int(systolic), int(diastolic)
+            ranges = MEDICAL_VALUE_RANGES["血圧"]
+            if not (ranges["systolic"][0] <= s <= ranges["systolic"][1]):
+                issues.append({
+                    "type": "invalid_medical_value",
+                    "value_type": "血圧（収縮期）",
+                    "value": s,
+                    "expected_range": ranges["systolic"],
+                    "severity": "high"
+                })
+            if not (ranges["diastolic"][0] <= d <= ranges["diastolic"][1]):
+                issues.append({
+                    "type": "invalid_medical_value",
+                    "value_type": "血圧（拡張期）",
+                    "value": d,
+                    "expected_range": ranges["diastolic"],
+                    "severity": "high"
+                })
+        # 体温の検出と検証
+        temp_pattern = r'(\d{2}(?:\.\d)?)\s*(?:°C|度|℃)'
+        temp_matches = re.findall(temp_pattern, response)
+        for temp in temp_matches:
+            t = float(temp)
+            ranges = MEDICAL_VALUE_RANGES["体温"]
+            if not (ranges["min"] <= t <= ranges["max"]):
+                issues.append({
+                    "type": "invalid_medical_value",
+                    "value_type": "体温",
+                    "value": t,
+                    "expected_range": (ranges["min"], ranges["max"]),
+                    "severity": "high"
+                })
+        return issues
+    # --- 高度な検証機能 ---
+    def _detect_false_dichotomy(self, response: str) -> list:
+        """偽の二者択一を検出"""
+        errors = []
+        dichotomy_pattern = r"(AかBのいずれかしかない|AかBしかない)" # 簡易パターン
+        if re.search(dichotomy_pattern, response.replace(" ","")): # 空白除去
+             errors.append({"type": "false_dichotomy", "statement": response, "severity": "moderate"})
+        return errors
+    async def _check_logical_consistency(self, question, alpha_response) -> dict:
+        """推論の論理的妥当性を検証"""
+        errors = []
+        response_text = alpha_response["main_response"]
+        # 偽の二者択一を検出
+        dichotomy_errors = self._detect_false_dichotomy(response_text)
+        errors.extend(dichotomy_errors)
+        # NOTE: 環状論理、論理的飛躍、根拠なき仮定の検出は高度なNLPが必要なため、
+        # ここではプレースホルダーとして成功を返す。
+        return {"logical_errors": errors, "error_count": len(errors), "passed": len(errors) == 0}
+    async def _verify_treatment_validity(self, response_text, db_context) -> dict:
+        """治療法の妥当性を検証"""
+        issues = []
+        # 簡易的な治療法抽出
+        mentioned_treatments_regex = re.findall(r"(\S+)が良い|(\w+)が有効な治療法|(\w+)を投与", response_text)
+        # 抽出結果はタプルのリストになるため、フラット化する
+        extracted_phrases = [item for tpl in mentioned_treatments_regex for item in tpl if item]
+        # 後処理で助詞などを除去し、治療法名を正確に切り出す
+        processed_treatments = []
+        for phrase in extracted_phrases:
+            if "には" in phrase:
+                processed_treatments.append(phrase.split("には")[-1])
+            elif "は" in phrase:
+                processed_treatments.append(phrase.split("は")[-1])
+            else:
+                processed_treatments.append(phrase)
+        for treatment in processed_treatments:
+            if not treatment: continue
+            treatment_info = await self.db.search_treatment(treatment)
+            if not treatment_info:
+                issues.append({"type": "unknown_treatment", "treatment": treatment, "severity": "moderate", "message": f"「{treatment}」は未知の治療法"})
+            elif not treatment_info.get("is_validated"):
+                issues.append({"type": "unvalidated_treatment", "treatment": treatment, "severity": "critical", "message": f"「{treatment}」は未検証の治療法"})
+        return {"valid": len(issues) == 0, "issues": issues}
+    async def _check_medical_context(self, response_text: str, db_context: dict) -> dict:
+        """医学的コンテキストが適切か確認"""
+        issues = []
+        treatment_check = await self._verify_treatment_validity(response_text, db_context)
+        if not treatment_check["valid"]:
+            issues.extend(treatment_check["issues"])
+        # NOTE: 診断基準、数値、禁忌の検証はプレースホルダー
+        return {"issues": issues, "issue_count": len(issues), "passed": len(issues) == 0}
+    async def validate_response(self, question: str, alpha_response: dict, db_context: dict, web_results=None, session_context=None, domain: str = "medical") -> dict:
+        """回答を多角的に検証する（基本＋高度、ドメイン対応）"""
+        response_text = alpha_response.get("main_response", "")
+        # alpha_responseにドメイン情報があればそちらを優先
+        domain = alpha_response.get("domain", domain)
+        logger.info(f"BetaLobe検証開始: domain={domain}")
+        # 1. 基本的なAnchor事実チェック
+        anchor_check = await self.check_anchor_facts(response_text, db_context)
+        # 2. 高度な論理チェック
+        logic_check = await self._check_logical_consistency(question, alpha_response)
+        # 3. ドメイン別の文脈チェック
+        if domain == "medical":
+            context_check = await self._check_medical_context(response_text, db_context)
+        elif domain == "legal":
+            context_issues = self._validate_legal_response(response_text)
+            context_check = {"issues": context_issues, "issue_count": len(context_issues), "passed": len(context_issues) == 0}
+        elif domain == "economics":
+            context_issues = self._validate_economics_response(response_text)
+            context_check = {"issues": context_issues, "issue_count": len(context_issues), "passed": len(context_issues) == 0}
+        else:
+            context_check = {"issues": [], "issue_count": 0, "passed": True}
+        # 4. ドメイン別の危険な主張の検出
+        dangerous_claims = self._detect_dangerous_claims(response_text, domain)
+        safety_check = {
+            "issues": dangerous_claims,
+            "issue_count": len(dangerous_claims),
+            "passed": len(dangerous_claims) == 0
+        }
+        # 5. ドメイン別の数値妥当性検証
+        if domain == "medical":
+            value_issues = self._validate_medical_values(response_text)
+        else:
+            value_issues = []  # 法学・経済学は数値検証なし（将来拡張可能）
+        value_check = {
+            "issues": value_issues,
+            "issue_count": len(value_issues),
+            "passed": len(value_issues) == 0
+        }
+        # 全ての問題を集約
+        all_issues = (
+            anchor_check["contradictions"] +
+            logic_check["logical_errors"] +
+            context_check["issues"] +
+            safety_check["issues"] +
+            value_check["issues"]
+        )
+        # 重大度を判定
+        severity = "none"
+        if any(i.get("severity") == "critical" for i in all_issues):
+            severity = "critical"
+        elif any(i.get("severity") == "high" for i in all_issues):
+            severity = "high"
+        elif any(i.get("severity") == "moderate" for i in all_issues):
+            severity = "moderate"
+        # ハルシネーションリスクスコアを計算
+        hallucination_risk = self._calculate_hallucination_risk(
+            alpha_response, anchor_check, logic_check, context_check, safety_check
+        )
+        validation_result = {
+            "timestamp": datetime.now().isoformat(),
+            "response_text": response_text[:500],  # 長い回答は切り詰め
+            "checks": {
+                "anchor_facts": anchor_check,
+                "logic": logic_check,
+                "context": context_check,
+                "safety": safety_check,
+                "medical_values": value_check
+            },
+            "all_issues": all_issues,
+            "issue_count": len(all_issues),
+            "has_contradictions": len(all_issues) > 0,
+            "severity": severity,
+            "hallucination_risk": hallucination_risk,
+            "recommendations": self._generate_recommendations(all_issues)
+        }
+        logger.info(f"検証完了: {len(all_issues)}件の問題, 重大度={severity}, ハルシネーションリスク={hallucination_risk['score']:.2f}")
+        return validation_result
+    def _calculate_hallucination_risk(self, alpha_response, anchor_check, logic_check, context_check, safety_check) -> dict:
+        """ハルシネーションリスクスコアを計算"""
+        score = 0.0
+        # Anchor事実との矛盾（最大0.4）
+        if not anchor_check["passed"]:
+            score += 0.4
+        # 論理エラー（最大0.2）
+        if not logic_check["passed"]:
+            score += 0.2
+        # 医学的文脈の問題（最大0.15）
+        if not context_check["passed"]:
+            score += 0.15
+        # 危険な主張（最大0.25）
+        if not safety_check["passed"]:
+            score += 0.25
+        # 信頼度が低い場合のペナルティ
+        confidence = alpha_response.get("confidence", 0.5)
+        if confidence < 0.4:
+            score += 0.1
+        final_score = min(1.0, score)
+        # リスクレベルの分類
+        if final_score < 0.1:
+            level = "very_low"
+        elif final_score < 0.25:
+            level = "low"
+        elif final_score < 0.5:
+            level = "moderate"
+        elif final_score < 0.75:
+            level = "high"
+        else:
+            level = "critical"
+        return {
+            "score": final_score,
+            "level": level,
+            "action_required": final_score >= 0.25
+        }
+    def _generate_recommendations(self, all_issues: list) -> list:
+        """問題に基づいて修正推奨を生成"""
+        recommendations = []
+        for issue in all_issues[:3]:  # 最大3件
+            issue_type = issue.get("type", "unknown")
+            if issue_type == "dangerous_claim":
+                recommendations.append({
+                    "type": "remove_dangerous_claim",
+                    "message": f"危険な主張を削除または修正: {issue.get('claim_type')}",
+                    "priority": "high"
+                })
+            elif issue_type == "numerical_contradiction":
+                recommendations.append({
+                    "type": "verify_numbers",
+                    "message": f"数値を確認: {issue.get('fact', '')[:50]}",
+                    "priority": "medium"
+                })
+            elif issue_type == "invalid_medical_value":
+                recommendations.append({
+                    "type": "correct_value",
+                    "message": f"{issue.get('value_type')}の値が範囲外: {issue.get('value')}",
+                    "priority": "high"
+                })
+        return recommendations