Spaces:

LibrAI
/

uae-kb

Sleeping

jinruiy Claude committed on Jan 8

Commit

d1394bb

1 Parent(s): 4ebe674

Add per-entity feedback, rank details dropdown, and expanded KB

Features:
- Per-entity feedback with ratings (relevance, helpful, sensitivity) and submit button
- Clickable rank score button with dropdown showing full score, matched chunk, subcategory, emirate, source, and model
- KB source display (Wiki, Dhow, Scrapped, Controversial) with deduplication
- Click-outside-to-close behavior for rank details dropdown
- Sensitive topics translation support

Backend:
- New /api/entity-feedback endpoint with UUID query tracking
- Entity feedback saved to entity_feedbacks.json

KB Updates:
- Expanded knowledge base with 2,268 entities
- Updated IR index with 7,531 chunks
- Added controversial_KB source type

🤖 Generated with [Claude Code](https://claude.ai/claude-code)

Co-Authored-By: Claude <noreply@anthropic.com>

Files changed (10) hide show

backend/api.py +60 -0
frontend/css/styles.css +60 -0
frontend/js/app.js +408 -33
ir/cache/dense_index/chunk_metadata_bge-m3.json +0 -0
ir/cache/dense_index/faiss_index_bge-m3.bin +2 -2
ir/demo.py +340 -165
uae_knowledge_build/data/unified_KB/alias_index.json +0 -0
uae_knowledge_build/data/unified_KB/category_metadata.json +130 -231
uae_knowledge_build/data/unified_KB/entities.json +0 -0
uae_knowledge_build/data/unified_KB/sensitive_topics.json +0 -0

backend/api.py CHANGED Viewed

@@ -76,6 +76,19 @@ class RatingRequest(BaseModel):
     rating_value: int  # 0, 1, or 2 for relevance; 0 or 1 for helpful
 # ============================================================
 # Translation Cache (file-based, persistent across restarts)
 # ============================================================
@@ -295,6 +308,53 @@ async def api_rating(request: RatingRequest, req: Request):
         return {"success": False, "error": str(e)}
 @app.post("/api/translate")
 async def api_translate(request: TranslateRequest):
     """Translate texts using DeepL API"""

     rating_value: int  # 0, 1, or 2 for relevance; 0 or 1 for helpful
+class EntityFeedbackRequest(BaseModel):  # JSON body accepted by POST /api/entity-feedback
+    query_id: str  # UUID for tracking unique search sessions
+    query: str  # search text the feedback refers to
+    query_timestamp: str  # client-supplied timestamp string; stored as-is, never parsed here
+    entity_id: str
+    entity_name: str
+    rank_position: int  # presumably the entity's position in the result list — TODO confirm 0- vs 1-based
+    rank_score: float
+    ratings: Dict[str, Optional[bool]]  # {relevance, helpful, sensitivity_handling}; NOTE(review): None presumably means "not rated" — confirm against client
+    comment: str  # free-text comment; required (no default), so clients must send at least ""
+    submitted_at: str  # client-supplied string; stored as-is, never parsed here
 # ============================================================
 # Translation Cache (file-based, persistent across restarts)
 # ============================================================
         return {"success": False, "error": str(e)}
+@app.post("/api/entity-feedback")
+async def api_entity_feedback(request: EntityFeedbackRequest, req: Request):
+    """Save per-entity feedback with ratings and comment"""
+    try:
+        # Ensure data directory exists
+        DATA_DIR.mkdir(parents=True, exist_ok=True)
+        # Get client IP
+        client_ip = req.headers.get("x-forwarded-for", "").split(",")[0].strip()
+        if not client_ip:
+            client_ip = req.client.host if req.client else "unknown"
+        feedback_file = DATA_DIR / "entity_feedbacks.json"
+        feedback = {
+            "query_id": request.query_id,
+            "query": request.query,
+            "query_timestamp": request.query_timestamp,
+            "user_ip": client_ip,
+            "entity_id": request.entity_id,
+            "entity_name": request.entity_name,
+            "rank_position": request.rank_position,
+            "rank_score": request.rank_score,
+            "ratings": request.ratings,
+            "comment": request.comment,
+            "submitted_at": request.submitted_at
+        }
+        # Load existing feedbacks
+        if feedback_file.exists():
+            with open(feedback_file, "r", encoding="utf-8") as f:
+                all_feedbacks = json.load(f)
+        else:
+            all_feedbacks = []
+        all_feedbacks.append(feedback)
+        # Save feedbacks
+        with open(feedback_file, "w", encoding="utf-8") as f:
+            json.dump(all_feedbacks, f, ensure_ascii=False, indent=2)
+        return {"success": True, "total": len(all_feedbacks)}
+    except Exception as e:
+        return {"success": False, "error": str(e)}
 @app.post("/api/translate")
 async def api_translate(request: TranslateRequest):
     """Translate texts using DeepL API"""

frontend/css/styles.css CHANGED Viewed

@@ -110,6 +110,66 @@ body.lang-cn {
     transform: scale(1.15);
 }
 /* ============================================
    MODAL STYLES
    ============================================ */

     transform: scale(1.15);
 }
+/* ============================================
+   SENSITIVE TOPICS & RESPONSE GUIDE
+   ============================================ */
+details summary {  /* NOTE: unscoped — matches every <details> on the page; hides the default list-item marker */
+    list-style: none;
+}
+details summary::-webkit-details-marker {  /* hides the WebKit-specific disclosure marker as well */
+    display: none;
+}
+details[open] summary {
+    color: #003d1c;
+}
+details[open] summary::before {  /* custom marker shown while expanded */
+    content: '▼ ';
+}
+details:not([open]) summary::before {  /* custom marker shown while collapsed */
+    content: '▶ ';
+}
+.sensitive-topic-card {
+    transition: all 0.2s ease;
+}
+.sensitive-topic-card:hover {
+    box-shadow: 0 2px 8px rgba(0,0,0,0.08);
+}
+/* ============================================
+   RANK DETAILS DROPDOWN
+   ============================================ */
+.rank-details {  /* positioning context for the absolutely positioned panel (.rank-details > div) */
+    position: relative;
+}
+.rank-details summary {
+    list-style: none;
+}
+.rank-details summary::-webkit-details-marker {
+    display: none;
+}
+.rank-details summary::before {  /* drop the ▼/▶ marker from the generic details rules; !important because those selectors are more specific */
+    content: none !important;
+}
+.rank-details[open] summary {  /* square off the bottom corners while the panel is open */
+    border-radius: 4px 4px 0 0;
+}
+.rank-details > div {  /* dropdown panel: right-aligned, starting at the bottom edge of .rank-details */
+    position: absolute;
+    right: 0;
+    top: 100%;
+}
 /* ============================================
    MODAL STYLES
    ============================================ */

frontend/js/app.js CHANGED Viewed

@@ -38,11 +38,33 @@ const TRANSLATIONS = {
         enterQuery: 'Enter a query above to search the UAE Knowledge Base',
         selectCategoryHint: 'Select a category and click Search to begin',
         mustKnowFacts: '✓ Must-Know Facts',
         relevance: 'Relevance?',
         helpful: 'Helpful?',
         detailedAnalysis: 'Detailed Analysis',
         fullEntityJson: 'Full Entity JSON',
         rankScore: 'Rank Score',
         viewEntity: 'View Entity',
         entityData: 'Entity Data',
         pleaseEnterQuery: 'Please enter a search query',
@@ -102,11 +124,33 @@ const TRANSLATIONS = {
         enterQuery: 'أدخل استعلامك للبحث في قاعدة المعرفة',
         selectCategoryHint: 'اختر فئة وانقر للبحث',
         mustKnowFacts: '✓ حقائق أساسية',
         relevance: 'الصلة؟',
         helpful: 'مفيد؟',
         detailedAnalysis: 'تحليل مفصل',
         fullEntityJson: 'بيانات الكيان الكاملة',
-        rankScore: 'الترتيب',
         viewEntity: 'عرض الكيان',
         entityData: 'بيانات الكيان',
         pleaseEnterQuery: 'الرجاء إدخال استعلام البحث',
@@ -166,11 +210,33 @@ const TRANSLATIONS = {
         enterQuery: '在上方输入查询以搜索阿联酋知识库',
         selectCategoryHint: '选择类别并点击搜索开始',
         mustKnowFacts: '✓ 必知事实',
         relevance: '相关性？',
         helpful: '有帮助？',
         detailedAnalysis: '详细分析',
         fullEntityJson: '完整实体JSON',
-        rankScore: '排序分数',
         viewEntity: '查看实体',
         entityData: '实体数据',
         pleaseEnterQuery: '请输入搜索查询',
@@ -230,7 +296,9 @@ const state = {
     currentQuery: '',
     currentCategory: null,
     results: [],
-    ratings: {},  // { entityIndex: { relevance: 0|1|2, helpful: true|false } }
     isLoading: false,
     language: localStorage.getItem('uae_lang') || 'en',
     // Translation state
@@ -243,6 +311,15 @@ const state = {
     resultsPerPage: 10
 };
 // ============================================
 // DOM ELEMENTS
 // ============================================
@@ -297,6 +374,12 @@ function initEventListeners() {
         if (!e.target.closest('.category-dropdown')) {
             DOM.categoryDropdown?.classList.remove('active');
         }
     });
     // Modals
@@ -353,6 +436,8 @@ async function handleSearch() {
     state.currentQuery = query;
     state.isLoading = true;
     state.ratings = {};
     // Reset translation state for new search
     state.translatedResults = {};
     state.showOriginal = false;
@@ -606,6 +691,20 @@ function renderResults() {
         // Get translated or original content
         const content = getResultContent(result, index);
         return `
         <div class="bg-white rounded shadow-xl border border-gray-200 result-card mb-4 md:mb-6 overflow-x-hidden" data-index="${index}">
             <!-- Card Header -->
@@ -614,9 +713,45 @@ function renderResults() {
                     <span class="text-amber-400">${index === 0 ? '🦅' : '📄'}</span>
                     #${index + 1} ${escapeHtml(content.entityName)}
                 </div>
-                <div class="text-[12px] md:text-[16px] font-medium gold-button-slender text-emerald-950 px-3 md:px-4 rounded shadow-sm self-start sm:self-auto">
-                    ${t('rankScore')}: ${result.score.toFixed(2)} ▲
-                </div>
             </div>
             <!-- Card Body -->
@@ -629,20 +764,16 @@ function renderResults() {
                         </p>
                     </div>
-                    <!-- Must-Know Facts -->
                     <div class="w-full md:w-[38%] pt-1">
-                        <h4 class="text-emerald-800 font-medium text-[14px] md:text-[18px] mb-3 md:mb-4">${t('mustKnowFacts')}</h4>
-                        <ul class="text-[14px] md:text-[18px] space-y-2 md:space-y-3 text-emerald-800/80">
-                            ${content.facts.slice(0, 5).map(fact => `
-                                <li>• ${escapeHtml(fact)}</li>
-                            `).join('')}
-                        </ul>
                     </div>
                 </div>
-                <!-- Rating Row -->
                 <div class="mt-6 md:mt-8 border-t border-gray-50 pt-4 md:pt-6 flex flex-col gap-4">
-                    <div class="flex flex-wrap items-center gap-4 md:gap-12">
                         <!-- Relevance Rating -->
                         <div class="flex items-center gap-2 md:gap-3">
                             <span class="text-[12px] md:text-[16px] font-medium text-gray-400 tracking-wider">${t('relevance')}</span>
@@ -664,6 +795,33 @@ function renderResults() {
                                         onclick="setRating(${index}, 'helpful', false)">👎</button>
                             </div>
                         </div>
                     </div>
                     <!-- Detailed Analysis Button -->
@@ -738,9 +896,9 @@ function selectCategory(categoryId) {
 }
 // ============================================
-// RATINGS (auto-save on click)
 // ============================================
-window.setRating = async function(entityIndex, dimension, value) {
     if (!state.ratings[entityIndex]) {
         state.ratings[entityIndex] = {};
     }
@@ -748,31 +906,182 @@ window.setRating = async function(entityIndex, dimension, value) {
     // Re-render to update button states
     renderResults();
-    // Auto-save rating to backend
     try {
-        const result = state.results[entityIndex];
-        const response = await fetch(`${CONFIG.API_BASE}/rating`, {
             method: 'POST',
             headers: { 'Content-Type': 'application/json' },
             body: JSON.stringify({
                 query: state.currentQuery,
-                category: state.currentCategory?.id || '',
-                entity_id: result?.entity_id || '',
-                entity_index: entityIndex,
-                rating_type: dimension,
-                rating_value: dimension === 'helpful' ? (value ? 1 : 0) : value
             })
         });
         const data = await response.json();
         if (data.success) {
-            // Show subtle confirmation
-            showToast('Rating saved ✓', 'success');
         }
     } catch (error) {
-        console.error('Failed to save rating:', error);
-        // Don't show error to user - rating is still stored locally
     }
 };
@@ -977,6 +1286,43 @@ window.translateCurrentPage = async function() {
                 textsToTranslate.push(fact);
                 textMap.push({ index, field: 'fact', factIndex });
             });
         });
         if (textsToTranslate.length === 0) {
@@ -1002,13 +1348,14 @@ window.translateCurrentPage = async function() {
             }
             data.translations.forEach((translated, i) => {
-                const { index, field, factIndex } = textMap[i];
                 if (!state.translatedResults[lang][index]) {
                     state.translatedResults[lang][index] = {
                         entityName: null,
                         summary: null,
-                        facts: []
                     };
                 }
@@ -1018,6 +1365,32 @@ window.translateCurrentPage = async function() {
                     state.translatedResults[lang][index].summary = translated;
                 } else if (field === 'fact') {
                     state.translatedResults[lang][index].facts[factIndex] = translated;
                 }
             });
         }
@@ -1047,14 +1420,16 @@ function getResultContent(result, index) {
             summary: state.translatedResults[lang][index].summary || result.summary,
             facts: state.translatedResults[lang][index].facts.length > 0
                 ? state.translatedResults[lang][index].facts
-                : (result.must_answer || [])
         };
     }
     return {
         entityName: result.entity_name,
         summary: result.summary,
-        facts: result.must_answer || []
     };
 }

         enterQuery: 'Enter a query above to search the UAE Knowledge Base',
         selectCategoryHint: 'Select a category and click Search to begin',
         mustKnowFacts: '✓ Must-Know Facts',
+        sensitiveTopics: '⚠️ Sensitive Topics',
+        sensitivityRating: 'Sensitivity',
+        sensitivityHigh: '🔴 HIGH',
+        sensitivityMedium: '🟡 MEDIUM',
+        sensitivityLow: '🟢 LOW',
+        noSensitiveTopics: 'No sensitive topics identified',
+        problematicFraming: 'Problematic Framing',
+        responseGuide: 'Response Guide',
+        strategy: 'Strategy',
+        tone: 'Tone',
+        keyFacts: 'Key Facts',
+        suggestedResponse: 'Suggested Response',
         relevance: 'Relevance?',
         helpful: 'Helpful?',
+        sensitivityHandling: 'Sensitivity Handling?',
+        feedbackForEntity: 'Your feedback on this entity...',
+        submitEntityFeedback: 'Submit Feedback',
+        feedbackSavedForEntity: 'Feedback saved for this entity ✓',
         detailedAnalysis: 'Detailed Analysis',
         fullEntityJson: 'Full Entity JSON',
         rankScore: 'Rank Score',
+        fullScore: 'Full Score',
+        matchedChunk: 'Matched Chunk',
+        subcategory: 'Subcategory',
+        emirate: 'Emirate',
+        model: 'Model',
+        source: 'Source',
         viewEntity: 'View Entity',
         entityData: 'Entity Data',
         pleaseEnterQuery: 'Please enter a search query',
         enterQuery: 'أدخل استعلامك للبحث في قاعدة المعرفة',
         selectCategoryHint: 'اختر فئة وانقر للبحث',
         mustKnowFacts: '✓ حقائق أساسية',
+        sensitiveTopics: '⚠️ مواضيع حساسة',
+        sensitivityRating: 'الحساسية',
+        sensitivityHigh: '🔴 عالية',
+        sensitivityMedium: '🟡 متوسطة',
+        sensitivityLow: '🟢 منخفضة',
+        noSensitiveTopics: 'لم يتم تحديد مواضيع حساسة',
+        problematicFraming: 'الصياغة الإشكالية',
+        responseGuide: 'دليل الاستجابة',
+        strategy: 'الاستراتيجية',
+        tone: 'النبرة',
+        keyFacts: 'الحقائق الرئيسية',
+        suggestedResponse: 'الاستجابة المقترحة',
         relevance: 'الصلة؟',
         helpful: 'مفيد؟',
+        sensitivityHandling: 'معالجة الحساسية؟',
+        feedbackForEntity: 'ملاحظاتك على هذا الكيان...',
+        submitEntityFeedback: 'إرسال الملاحظات',
+        feedbackSavedForEntity: 'تم حفظ الملاحظات لهذا الكيان ✓',
         detailedAnalysis: 'تحليل مفصل',
         fullEntityJson: 'بيانات الكيان الكاملة',
+        rankScore: 'درجة الترتيب',
+        fullScore: 'الدرجة الكاملة',
+        matchedChunk: 'القطعة المطابقة',
+        subcategory: 'الفئة الفرعية',
+        emirate: 'الإمارة',
+        model: 'النموذج',
+        source: 'المصدر',
         viewEntity: 'عرض الكيان',
         entityData: 'بيانات الكيان',
         pleaseEnterQuery: 'الرجاء إدخال استعلام البحث',
         enterQuery: '在上方输入查询以搜索阿联酋知识库',
         selectCategoryHint: '选择类别并点击搜索开始',
         mustKnowFacts: '✓ 必知事实',
+        sensitiveTopics: '⚠️ 敏感话题',
+        sensitivityRating: '敏感度',
+        sensitivityHigh: '🔴 高',
+        sensitivityMedium: '🟡 中',
+        sensitivityLow: '🟢 低',
+        noSensitiveTopics: '未发现敏感话题',
+        problematicFraming: '问题性表述',
+        responseGuide: '回应指南',
+        strategy: '策略',
+        tone: '语气',
+        keyFacts: '关键事实',
+        suggestedResponse: '建议回应',
         relevance: '相关性？',
         helpful: '有帮助？',
+        sensitivityHandling: '敏感处理？',
+        feedbackForEntity: '您对此实体的反馈...',
+        submitEntityFeedback: '提交反馈',
+        feedbackSavedForEntity: '此实体的反馈已保存 ✓',
         detailedAnalysis: '详细分析',
         fullEntityJson: '完整实体JSON',
+        rankScore: '排名分数',
+        fullScore: '完整分数',
+        matchedChunk: '匹配块',
+        subcategory: '子类别',
+        emirate: '酋长国',
+        model: '模型',
+        source: '数据来源',
         viewEntity: '查看实体',
         entityData: '实体数据',
         pleaseEnterQuery: '请输入搜索查询',
     currentQuery: '',
     currentCategory: null,
     results: [],
+    ratings: {},  // { entityIndex: { relevance: 0|1, helpful: true|false, sensitivityHandling: true|false } }
+    entityFeedbacks: {},  // { entityIndex: { comment: '', submitted: false } }
+    queryId: null,  // UUID for each search session
     isLoading: false,
     language: localStorage.getItem('uae_lang') || 'en',
     // Translation state
     resultsPerPage: 10
 };
+// Generate UUID for query tracking
+function generateUUID() {
+    return 'xxxxxxxx-xxxx-4xxx-yxxx-xxxxxxxxxxxx'.replace(/[xy]/g, function(c) {
+        const r = Math.random() * 16 | 0;
+        const v = c === 'x' ? r : (r & 0x3 | 0x8);
+        return v.toString(16);
+    });
+}
 // ============================================
 // DOM ELEMENTS
 // ============================================
         if (!e.target.closest('.category-dropdown')) {
             DOM.categoryDropdown?.classList.remove('active');
         }
+        // Close rank-details dropdowns when clicking outside
+        if (!e.target.closest('.rank-details')) {
+            document.querySelectorAll('.rank-details[open]').forEach(details => {
+                details.removeAttribute('open');
+            });
+        }
     });
     // Modals
     state.currentQuery = query;
     state.isLoading = true;
     state.ratings = {};
+    state.entityFeedbacks = {};
+    state.queryId = generateUUID();  // Generate new query_id for this search
     // Reset translation state for new search
     state.translatedResults = {};
     state.showOriginal = false;
         // Get translated or original content
         const content = getResultContent(result, index);
+        // Get ranking details
+        const chunkType = result.chunk_type || 'unknown';
+        const subcategory = result.subcategory || '';
+        const emirate = result.emirate || '';
+        // Get data source (wiki, dhow, scrapped, controversial) - deduplicate first
+        const dataSources = [...new Set(result.full_entity?.data_sources || [])];
+        const sourceDisplay = dataSources.map(s => {
+            if (s.includes('wiki')) return 'Wiki';
+            if (s.includes('dhow')) return 'Dhow';
+            if (s.includes('scrapp')) return 'Scrapped';
+            if (s.includes('controversial')) return 'Controversial';
+            return s;
+        }).join(', ') || '';
         return `
         <div class="bg-white rounded shadow-xl border border-gray-200 result-card mb-4 md:mb-6 overflow-x-hidden" data-index="${index}">
             <!-- Card Header -->
                     <span class="text-amber-400">${index === 0 ? '🦅' : '📄'}</span>
                     #${index + 1} ${escapeHtml(content.entityName)}
                 </div>
+                <details class="rank-details self-start sm:self-auto">
+                    <summary class="text-[12px] md:text-[16px] font-medium gold-button-slender text-emerald-950 px-3 md:px-4 rounded shadow-sm cursor-pointer list-none">
+                        ${t('rankScore')}: ${result.score.toFixed(2)} ▼
+                    </summary>
+                    <div class="absolute right-0 mt-1 bg-white border border-gray-200 rounded-lg shadow-lg p-3 z-50 min-w-[200px] text-[12px] text-gray-700">
+                        <div class="space-y-2">
+                            <div class="flex justify-between">
+                                <span class="text-gray-500">${t('fullScore')}:</span>
+                                <span class="font-mono font-medium">${result.score.toFixed(6)}</span>
+                            </div>
+                            <div class="flex justify-between">
+                                <span class="text-gray-500">${t('matchedChunk')}:</span>
+                                <span class="font-medium capitalize">${chunkType}</span>
+                            </div>
+                            ${subcategory ? `
+                            <div class="flex justify-between">
+                                <span class="text-gray-500">${t('subcategory')}:</span>
+                                <span class="font-medium">${escapeHtml(subcategory)}</span>
+                            </div>
+                            ` : ''}
+                            ${emirate ? `
+                            <div class="flex justify-between">
+                                <span class="text-gray-500">${t('emirate')}:</span>
+                                <span class="font-medium">${escapeHtml(emirate)}</span>
+                            </div>
+                            ` : ''}
+                            ${sourceDisplay ? `
+                            <div class="flex justify-between">
+                                <span class="text-gray-500">${t('source')}:</span>
+                                <span class="font-medium">${escapeHtml(sourceDisplay)}</span>
+                            </div>
+                            ` : ''}
+                            <div class="flex justify-between border-t pt-2 mt-2">
+                                <span class="text-gray-500">${t('model')}:</span>
+                                <span class="font-medium text-emerald-700">bge-m3</span>
+                            </div>
+                        </div>
+                    </div>
+                </details>
             </div>
             <!-- Card Body -->
                         </p>
                     </div>
+                    <!-- Sensitive Topics -->
                     <div class="w-full md:w-[38%] pt-1">
+                        <h4 class="text-emerald-800 font-medium text-[14px] md:text-[18px] mb-3 md:mb-4">${t('sensitiveTopics')}</h4>
+                        ${renderSensitiveTopics(result, index, content.sensitiveTopics)}
                     </div>
                 </div>
+                <!-- Rating & Feedback Row -->
                 <div class="mt-6 md:mt-8 border-t border-gray-50 pt-4 md:pt-6 flex flex-col gap-4">
+                    <div class="flex flex-wrap items-center gap-4 md:gap-8">
                         <!-- Relevance Rating -->
                         <div class="flex items-center gap-2 md:gap-3">
                             <span class="text-[12px] md:text-[16px] font-medium text-gray-400 tracking-wider">${t('relevance')}</span>
                                         onclick="setRating(${index}, 'helpful', false)">👎</button>
                             </div>
                         </div>
+                        <!-- Sensitivity Handling Rating -->
+                        <div class="flex items-center gap-2 md:gap-3">
+                            <span class="text-[12px] md:text-[16px] font-medium text-gray-400 tracking-wider">${t('sensitivityHandling')}</span>
+                            <div class="flex gap-2 text-base md:text-lg">
+                                <button class="rating-btn ${state.ratings[index]?.sensitivityHandling === true ? 'active' : ''}"
+                                        onclick="setRating(${index}, 'sensitivityHandling', true)">✅</button>
+                                <button class="rating-btn ${state.ratings[index]?.sensitivityHandling === false ? 'active' : ''}"
+                                        onclick="setRating(${index}, 'sensitivityHandling', false)">❌</button>
+                            </div>
+                        </div>
+                    </div>
+                    <!-- Per-Entity Feedback -->
+                    <div class="flex flex-col sm:flex-row gap-2 mt-2">
+                        <input type="text"
+                               id="entity-feedback-${index}"
+                               class="flex-1 px-3 py-2 border border-gray-300 rounded text-[14px] focus:outline-none focus:border-emerald-500"
+                               placeholder="${t('feedbackForEntity')}"
+                               value="${state.entityFeedbacks[index]?.comment || ''}"
+                               ${state.entityFeedbacks[index]?.submitted ? 'disabled' : ''}
+                               onchange="updateEntityComment(${index}, this.value)">
+                        <button class="px-4 py-2 text-[14px] font-medium rounded shadow-sm ${state.entityFeedbacks[index]?.submitted ? 'bg-gray-300 text-gray-500 cursor-not-allowed' : 'bg-emerald-700 text-white hover:bg-emerald-800'}"
+                                onclick="submitEntityFeedback(${index})"
+                                ${state.entityFeedbacks[index]?.submitted ? 'disabled' : ''}>
+                            ${state.entityFeedbacks[index]?.submitted ? t('feedbackSavedForEntity') : t('submitEntityFeedback')}
+                        </button>
                     </div>
                     <!-- Detailed Analysis Button -->
 }
 // ============================================
+// RATINGS (stored locally, saved on submit)
 // ============================================
+window.setRating = function(entityIndex, dimension, value) {
     if (!state.ratings[entityIndex]) {
         state.ratings[entityIndex] = {};
     }
     // Re-render to update button states
     renderResults();
+};
+// ============================================
+// SENSITIVE TOPICS RENDERING
+// ============================================
+function renderSensitiveTopics(result, index, translatedTopics) {
+    const sensitiveTopics = result.full_entity?.sensitive_topics || result.sensitive_topics;
+    // Check if entity has sensitive content
+    if (!sensitiveTopics || !sensitiveTopics.has_sensitive_content || !sensitiveTopics.topics || sensitiveTopics.topics.length === 0) {
+        return `
+            <div class="text-[14px] md:text-[16px] text-gray-500">
+                <span class="inline-block px-2 py-1 rounded bg-green-100 text-green-700 text-[12px] md:text-[14px] mb-2">
+                    ${t('sensitivityLow')}
+                </span>
+                <p class="mt-2">${t('noSensitiveTopics')}</p>
+            </div>
+        `;
+    }
+    const topics = sensitiveTopics.topics;
+    // Determine overall sensitivity rating
+    const hasHighSeverity = topics.some(topic => typeof topic === 'object' && topic.severity === 'high');
+    const sensitivityRating = hasHighSeverity ? 'high' : 'medium';
+    const ratingLabel = sensitivityRating === 'high' ? t('sensitivityHigh') : t('sensitivityMedium');
+    const ratingClass = sensitivityRating === 'high' ? 'bg-red-100 text-red-700' : 'bg-yellow-100 text-yellow-700';
+    // Render topics
+    const topicsHtml = topics.map((topic, topicIndex) => {
+        // Get translated content for this topic (if available)
+        const trans = translatedTopics?.[topicIndex] || {};
+        // Handle string topics (malformed data)
+        if (typeof topic === 'string') {
+            const displayText = trans.stringTopic || topic;
+            return `
+                <div class="bg-gray-50 p-3 rounded border border-gray-200 mb-2">
+                    <p class="text-[13px] md:text-[15px] text-gray-700">${escapeHtml(displayText)}</p>
+                </div>
+            `;
+        }
+        // Handle proper topic objects
+        const topicType = topic.topic_type || 'unknown';
+        const severity = topic.severity || 'medium';
+        const severityClass = severity === 'high' ? 'bg-red-100 text-red-700' : 'bg-yellow-100 text-yellow-700';
+        const severityIcon = severity === 'high' ? '🔴' : '🟡';
+        // Use translated content or fall back to original
+        const problematicFraming = trans.framing || topic.problematic_framing || '';
+        const appropriateResponse = topic.appropriate_response || {};
+        const strategy = trans.strategy || appropriateResponse.strategy || '';
+        const tone = trans.tone || appropriateResponse.tone || '';
+        const suggestedResponse = trans.suggested || appropriateResponse.suggested_response || '';
+        const keyFacts = (trans.keyFacts && trans.keyFacts.length > 0)
+            ? trans.keyFacts
+            : (appropriateResponse.key_facts || []);
+        return `
+            <div class="bg-gray-50 p-3 rounded border border-gray-200 mb-3">
+                <!-- Topic Header -->
+                <div class="flex items-center gap-2 mb-2">
+                    <span class="text-[12px] px-2 py-0.5 rounded ${severityClass}">${severityIcon} ${topicType}</span>
+                </div>
+                <!-- Problematic Framing -->
+                ${problematicFraming ? `
+                    <div class="mb-2">
+                        <span class="text-[11px] md:text-[13px] font-medium text-gray-500">${t('problematicFraming')}:</span>
+                        <p class="text-[13px] md:text-[15px] text-gray-800 mt-1 italic">"${escapeHtml(problematicFraming)}"</p>
+                    </div>
+                ` : ''}
+                <!-- Collapsible Response Guide -->
+                ${strategy || keyFacts.length > 0 || suggestedResponse ? `
+                    <details class="mt-2">
+                        <summary class="text-[12px] md:text-[14px] text-emerald-700 cursor-pointer hover:text-emerald-900 font-medium">
+                            ${t('responseGuide')}
+                        </summary>
+                        <div class="mt-2 pl-3 border-l-2 border-emerald-200 text-[12px] md:text-[14px]">
+                            ${strategy ? `
+                                <p class="mb-1"><span class="font-medium text-gray-600">${t('strategy')}:</span> ${escapeHtml(strategy)}</p>
+                            ` : ''}
+                            ${tone ? `
+                                <p class="mb-1"><span class="font-medium text-gray-600">${t('tone')}:</span> ${escapeHtml(tone)}</p>
+                            ` : ''}
+                            ${keyFacts.length > 0 ? `
+                                <div class="mb-1">
+                                    <span class="font-medium text-gray-600">${t('keyFacts')}:</span>
+                                    <ul class="list-disc list-inside mt-1 text-gray-700">
+                                        ${keyFacts.map(fact => `<li>${escapeHtml(fact)}</li>`).join('')}
+                                    </ul>
+                                </div>
+                            ` : ''}
+                            ${suggestedResponse ? `
+                                <div class="mt-2">
+                                    <span class="font-medium text-gray-600">${t('suggestedResponse')}:</span>
+                                    <p class="mt-1 text-gray-700 bg-white p-2 rounded border">${escapeHtml(suggestedResponse)}</p>
+                                </div>
+                            ` : ''}
+                        </div>
+                    </details>
+                ` : ''}
+            </div>
+        `;
+    }).join('');
+    return `
+        <div>
+            <span class="inline-block px-2 py-1 rounded ${ratingClass} text-[12px] md:text-[14px] mb-3">
+                ${t('sensitivityRating')}: ${ratingLabel}
+            </span>
+            <div class="mt-2 max-h-[300px] overflow-y-auto">
+                ${topicsHtml}
+            </div>
+        </div>
+    `;
+}
+// ============================================
+// PER-ENTITY FEEDBACK
+// ============================================
/**
 * Store the free-text comment typed for the result at `index`.
 *
 * Creates the per-result feedback entry in `state.entityFeedbacks` on first
 * use (empty comment, not yet submitted) and then overwrites its comment.
 *
 * @param {number} index - Position of the result the comment belongs to.
 * @param {string} value - Current contents of the comment field.
 */
window.updateEntityComment = function(index, value) {
    const existing = state.entityFeedbacks[index];
    const entry = existing ? existing : { comment: '', submitted: false };
    state.entityFeedbacks[index] = entry;
    entry.comment = value;
};
/**
 * Send the ratings and comment recorded for one search result to the backend.
 *
 * Reads the result at `index` from `state.results` together with its ratings
 * (`state.ratings[index]`) and comment (`state.entityFeedbacks[index]`), then
 * POSTs them to `${CONFIG.API_BASE}/entity-feedback`. On success the entry is
 * flagged as submitted, a success toast is shown and the results are
 * re-rendered. Any failure is logged and reported through an error toast.
 *
 * @param {number} index - Zero-based position of the result in `state.results`.
 * @returns {Promise<void>} Resolves once the request has been handled.
 */
window.submitEntityFeedback = async function(index) {
    const result = state.results[index];
    if (!result) return;
    const feedback = state.entityFeedbacks[index] || { comment: '' };
    const ratings = state.ratings[index] || {};
    // Ratings the user never touched are sent as explicit nulls.
    const valueOrNull = (value) => (value !== undefined ? value : null);
    try {
        // Read the clock once so both timestamp fields agree.
        // NOTE(review): query_timestamp is filled with the submission time, not
        // the time the query was issued - confirm whether that is intended.
        const now = new Date().toISOString();
        const response = await fetch(`${CONFIG.API_BASE}/entity-feedback`, {
            method: 'POST',
            headers: { 'Content-Type': 'application/json' },
            body: JSON.stringify({
                query_id: state.queryId,
                query: state.currentQuery,
                query_timestamp: now,
                entity_id: result.entity_id || '',
                entity_name: result.entity_name || '',
                rank_position: index + 1,
                rank_score: result.score || 0,
                ratings: {
                    // Relevance is reported as a boolean: true only for a rating of 1.
                    relevance: ratings.relevance !== undefined ? (ratings.relevance === 1) : null,
                    helpful: valueOrNull(ratings.helpful),
                    sensitivity_handling: valueOrNull(ratings.sensitivityHandling)
                },
                comment: feedback.comment || '',
                submitted_at: now
            })
        });
        // A proxy or server error page is not JSON; report the HTTP status
        // instead of an opaque JSON parse error.
        let data;
        try {
            data = await response.json();
        } catch (parseError) {
            throw new Error(`Unexpected response from server (HTTP ${response.status})`);
        }
        if (!data || !data.success) {
            throw new Error((data && data.error) || 'Failed to save feedback');
        }
        // Mark as submitted
        if (!state.entityFeedbacks[index]) {
            state.entityFeedbacks[index] = { comment: '', submitted: false };
        }
        state.entityFeedbacks[index].submitted = true;
        showToast(t('feedbackSavedForEntity'), 'success');
        renderResults();  // Re-render to update UI
    } catch (error) {
        console.error('Failed to save entity feedback:', error);
        showToast(`Error: ${error.message}`, 'error');
    }
};
                 textsToTranslate.push(fact);
                 textMap.push({ index, field: 'fact', factIndex });
             });
+            // Add sensitive topics content
+            const sensitiveTopics = result.full_entity?.sensitive_topics || result.sensitive_topics;
+            if (sensitiveTopics?.has_sensitive_content && sensitiveTopics?.topics) {
+                sensitiveTopics.topics.forEach((topic, topicIndex) => {
+                    if (typeof topic === 'object') {
+                        // Problematic framing
+                        if (topic.problematic_framing) {
+                            textsToTranslate.push(topic.problematic_framing);
+                            textMap.push({ index, field: 'sensitiveTopicFraming', topicIndex });
+                        }
+                        // Appropriate response fields
+                        const response = topic.appropriate_response || {};
+                        if (response.strategy) {
+                            textsToTranslate.push(response.strategy);
+                            textMap.push({ index, field: 'sensitiveTopicStrategy', topicIndex });
+                        }
+                        if (response.tone) {
+                            textsToTranslate.push(response.tone);
+                            textMap.push({ index, field: 'sensitiveTopicTone', topicIndex });
+                        }
+                        if (response.suggested_response) {
+                            textsToTranslate.push(response.suggested_response);
+                            textMap.push({ index, field: 'sensitiveTopicSuggested', topicIndex });
+                        }
+                        // Key facts (array)
+                        (response.key_facts || []).forEach((fact, factIdx) => {
+                            textsToTranslate.push(fact);
+                            textMap.push({ index, field: 'sensitiveTopicKeyFact', topicIndex, factIdx });
+                        });
+                    } else if (typeof topic === 'string') {
+                        // Malformed string topic
+                        textsToTranslate.push(topic);
+                        textMap.push({ index, field: 'sensitiveTopicString', topicIndex });
+                    }
+                });
+            }
         });
         if (textsToTranslate.length === 0) {
             }
             data.translations.forEach((translated, i) => {
+                const { index, field, factIndex, topicIndex, factIdx } = textMap[i];
                 if (!state.translatedResults[lang][index]) {
                     state.translatedResults[lang][index] = {
                         entityName: null,
                         summary: null,
+                        facts: [],
+                        sensitiveTopics: []
                     };
                 }
                     state.translatedResults[lang][index].summary = translated;
                 } else if (field === 'fact') {
                     state.translatedResults[lang][index].facts[factIndex] = translated;
+                } else if (field.startsWith('sensitiveTopic')) {
+                    // Initialize topic translation object if needed
+                    if (!state.translatedResults[lang][index].sensitiveTopics[topicIndex]) {
+                        state.translatedResults[lang][index].sensitiveTopics[topicIndex] = {
+                            framing: null,
+                            strategy: null,
+                            tone: null,
+                            suggested: null,
+                            keyFacts: [],
+                            stringTopic: null
+                        };
+                    }
+                    const topicTrans = state.translatedResults[lang][index].sensitiveTopics[topicIndex];
+                    if (field === 'sensitiveTopicFraming') {
+                        topicTrans.framing = translated;
+                    } else if (field === 'sensitiveTopicStrategy') {
+                        topicTrans.strategy = translated;
+                    } else if (field === 'sensitiveTopicTone') {
+                        topicTrans.tone = translated;
+                    } else if (field === 'sensitiveTopicSuggested') {
+                        topicTrans.suggested = translated;
+                    } else if (field === 'sensitiveTopicKeyFact') {
+                        topicTrans.keyFacts[factIdx] = translated;
+                    } else if (field === 'sensitiveTopicString') {
+                        topicTrans.stringTopic = translated;
+                    }
                 }
             });
         }
             summary: state.translatedResults[lang][index].summary || result.summary,
             facts: state.translatedResults[lang][index].facts.length > 0
                 ? state.translatedResults[lang][index].facts
+                : (result.must_answer || []),
+            sensitiveTopics: state.translatedResults[lang][index].sensitiveTopics || []
         };
     }
     return {
         entityName: result.entity_name,
         summary: result.summary,
+        facts: result.must_answer || [],
+        sensitiveTopics: null  // Use original from result
     };
 }

ir/cache/dense_index/chunk_metadata_bge-m3.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

ir/cache/dense_index/faiss_index_bge-m3.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6483c97df94b26f917736fa402a8e36afb723d2d288c327ee78cd0e6bf8c4e60
-size 22290477

 version https://git-lfs.github.com/spec/v1
+oid sha256:d0999c5f221ce46a270716a2fdd152a46953e94512857c8c004aa206340c59ad
+size 30847021

ir/demo.py CHANGED Viewed

@@ -611,24 +611,21 @@ def format_single_entity(entity, rank: int, score: float, match_type: str) -> st
 def process_query(query: str, category: str) -> tuple:
     """
     Process a query using Level 4 (Dense) retrieval.
     Args:
         query: User query
         category: Question category
     Returns:
-        (e1, e2, e3, e4, e5, sensitive, debug, full_results)
     """
-    empty = "**#%d** - (no result)"
     if not query.strip():
-        warn = "⚠️ Please enter a question 请输入问题"
-        return (warn, empty % 2, empty % 3, empty % 4, empty % 5, "", "", "")
     # Require category selection
     if not category:
-        warn = "⚠️ **Please select Category first! 请先选择类别！**"
-        return (warn, empty % 2, empty % 3, empty % 4, empty % 5, "", "", "")
     try:
         # Always use Level 4 (Dense) retriever
@@ -639,50 +636,169 @@ def process_query(query: str, category: str) -> tuple:
         start = time.perf_counter()
         # Dense retriever uses search() and returns (metadata, score) tuples
-        results = retriever.search(query, top_k=5)
         latency = (time.perf_counter() - start) * 1000
-        # Format dense results
-        entity_outputs = []
-        results_for_feedback = []
-        for i in range(5):
-            if i < len(results):
-                metadata, score = results[i]
-                entity_outputs.append(format_dense_result(metadata, score, i + 1, kb))
-                results_for_feedback.append(
-                    f"#{i+1}: {metadata.get('entity_id', '')} ({metadata.get('entity_name', '')}) - {score:.3f}"
-                )
-            else:
-                entity_outputs.append(f"**#{i+1}** - (no result)")
         # No sensitive detection for dense retrieval
         sensitive_text = "ℹ️ Sensitive detection not available for dense retrieval"
-        full_entity_text = " | ".join(results_for_feedback)
         # Debug info
         debug_lines = [
             f"⏱️ Latency: {latency:.2f}ms",
             f"🔢 Level: 4 (Dense bge-m3)",
-            f"📊 Found: {len(results)}",
         ]
         debug_text = " | ".join(debug_lines)
         return (
-            entity_outputs[0],
-            entity_outputs[1],
-            entity_outputs[2],
-            entity_outputs[3],
-            entity_outputs[4],
             sensitive_text,
             debug_text,
-            full_entity_text
         )
     except Exception as e:
         import traceback
         error_msg = f"❌ Error: {str(e)}\n<small>{traceback.format_exc()[:500]}</small>"
-        return (error_msg, empty % 2, empty % 3, empty % 4, empty % 5, "", "", "")
 def parse_score(score_str: str) -> int:
@@ -695,75 +811,120 @@ def parse_score(score_str: str) -> int:
         return 0
-def save_feedback(
     query: str,
     category: str,
-    entity_results: str,
-    sensitive_results: str,
-    # Per-entity scores (5 entities x 2 dimensions)
-    e1_rel: str, e1_suf: str,
-    e2_rel: str, e2_suf: str,
-    e3_rel: str, e3_suf: str,
-    e4_rel: str, e4_suf: str,
-    e5_rel: str, e5_suf: str,
-    # Sensitive handling
-    score_sensitive: str,
-    notes: str,
     request: gr.Request
 ) -> str:
-    """Save feedback to JSON file with per-entity scoring"""
     # Get client IP address
     client_ip = "unknown"
     if request:
-        # Try to get real IP from headers (for proxied requests)
         client_ip = request.headers.get("x-forwarded-for", "").split(",")[0].strip()
         if not client_ip:
             client_ip = request.client.host if request.client else "unknown"
-    # Parse per-entity scores
-    entity_scores = [
-        {"relevance": parse_score(e1_rel), "sufficient": parse_score(e1_suf)},
-        {"relevance": parse_score(e2_rel), "sufficient": parse_score(e2_suf)},
-        {"relevance": parse_score(e3_rel), "sufficient": parse_score(e3_suf)},
-        {"relevance": parse_score(e4_rel), "sufficient": parse_score(e4_suf)},
-        {"relevance": parse_score(e5_rel), "sufficient": parse_score(e5_suf)},
-    ]
     feedback = {
         "timestamp": datetime.now().isoformat(),
         "client_ip": client_ip,
         "query": query,
         "category": category or "Not selected",
-        "entity_scores": entity_scores,
-        "sensitive_handling": parse_score(score_sensitive),
-        "notes": notes,
-        "entity_results": entity_results,  # Contains IDs
-        "sensitive_results": sensitive_results[:500],
     }
     # Save to file - use /data for HF Spaces persistence
     if Path("/data").exists():
         feedback_file = Path("/data/demo_feedback.json")
     else:
         feedback_file = Path(__file__).parent / "demo_feedback.json"
     try:
         if feedback_file.exists():
             with open(feedback_file, "r", encoding="utf-8") as f:
                 all_feedback = json.load(f)
         else:
             all_feedback = []
         all_feedback.append(feedback)
         with open(feedback_file, "w", encoding="utf-8") as f:
             json.dump(all_feedback, f, ensure_ascii=False, indent=2)
-        return f"✅ Feedback saved! 评分已保存！Total 共收集: {len(all_feedback)} entries 条反馈"
     except Exception as e:
-        return f"❌ Save failed 保存失败: {str(e)}"
 def create_demo():
@@ -979,7 +1140,7 @@ def create_demo():
         """)
         # ========================================
-        # RESULTS SECTION
         # ========================================
         gr.HTML("""
             <div style="
@@ -994,7 +1155,7 @@ def create_demo():
                 gap: 10px;
                 font-family: 'Inter', sans-serif;
             ">
-                📊 Results
             </div>
         """)
@@ -1013,70 +1174,22 @@ def create_demo():
             </div>
         """)
-        # Entity 1 - Card style
-        with gr.Group(elem_classes="result-card"):
-            with gr.Row():
-                with gr.Column(scale=4):
-                    entity_1_output = gr.Markdown(value="**#1** - Enter a query to search...")
-                with gr.Column(scale=1, min_width=150):
-                    score_e1_relevance = gr.Radio(
-                        choices=["0", "1", "2"], label="Relevance", value="0", interactive=True
-                    )
-                    score_e1_sufficient = gr.Radio(
-                        choices=["0", "1", "2"], label="Sufficient", value="0", interactive=True
-                    )
-        # Entity 2
-        with gr.Group(elem_classes="result-card"):
-            with gr.Row():
-                with gr.Column(scale=4):
-                    entity_2_output = gr.Markdown(value="**#2** - ...")
-                with gr.Column(scale=1, min_width=150):
-                    score_e2_relevance = gr.Radio(
-                        choices=["0", "1", "2"], label="Relevance", value="0", interactive=True
-                    )
-                    score_e2_sufficient = gr.Radio(
-                        choices=["0", "1", "2"], label="Sufficient", value="0", interactive=True
-                    )
-        # Entity 3
-        with gr.Group(elem_classes="result-card"):
-            with gr.Row():
-                with gr.Column(scale=4):
-                    entity_3_output = gr.Markdown(value="**#3** - ...")
-                with gr.Column(scale=1, min_width=150):
-                    score_e3_relevance = gr.Radio(
-                        choices=["0", "1", "2"], label="Relevance", value="0", interactive=True
-                    )
-                    score_e3_sufficient = gr.Radio(
-                        choices=["0", "1", "2"], label="Sufficient", value="0", interactive=True
-                    )
-        # Entity 4
-        with gr.Group(elem_classes="result-card"):
-            with gr.Row():
-                with gr.Column(scale=4):
-                    entity_4_output = gr.Markdown(value="**#4** - ...")
-                with gr.Column(scale=1, min_width=150):
-                    score_e4_relevance = gr.Radio(
-                        choices=["0", "1", "2"], label="Relevance", value="0", interactive=True
-                    )
-                    score_e4_sufficient = gr.Radio(
-                        choices=["0", "1", "2"], label="Sufficient", value="0", interactive=True
-                    )
-        # Entity 5
-        with gr.Group(elem_classes="result-card"):
-            with gr.Row():
-                with gr.Column(scale=4):
-                    entity_5_output = gr.Markdown(value="**#5** - ...")
-                with gr.Column(scale=1, min_width=150):
-                    score_e5_relevance = gr.Radio(
-                        choices=["0", "1", "2"], label="Relevance", value="0", interactive=True
-                    )
-                    score_e5_sufficient = gr.Radio(
-                        choices=["0", "1", "2"], label="Sufficient", value="0", interactive=True
-                    )
         # ========================================
         # SENSITIVE TOPIC DETECTION
@@ -1133,6 +1246,39 @@ def create_demo():
             </div>
         """)
         with gr.Row():
             notes = gr.Textbox(
                 label="Notes (optional)",
@@ -1140,54 +1286,83 @@ def create_demo():
                 lines=2,
                 scale=3
             )
-            feedback_btn = gr.Button("Submit", variant="primary", size="lg", scale=1, elem_classes="submit-btn")
         feedback_output = gr.Markdown()
-        # Hidden field to store full entity results for feedback
-        entity_output = gr.State(value="")
-        # Wire up events - 5 entity outputs + sensitive + debug + state
-        all_outputs = [
-            entity_1_output,
-            entity_2_output,
-            entity_3_output,
-            entity_4_output,
-            entity_5_output,
             sensitive_output,
             debug_output,
-            entity_output  # State for full results (for feedback)
         ]
         submit_btn.click(
             fn=process_query,
             inputs=[query_input, category_dropdown],
-            outputs=all_outputs,
         )
         query_input.submit(
             fn=process_query,
             inputs=[query_input, category_dropdown],
-            outputs=all_outputs,
         )
         feedback_btn.click(
-            fn=save_feedback,
-            inputs=[
-                query_input,
-                category_dropdown,
-                entity_output,
-                sensitive_output,
-                # Per-entity scores
-                score_e1_relevance, score_e1_sufficient,
-                score_e2_relevance, score_e2_sufficient,
-                score_e3_relevance, score_e3_sufficient,
-                score_e4_relevance, score_e4_sufficient,
-                score_e5_relevance, score_e5_sufficient,
-                # Sensitive
-                score_sensitive,
-                notes,
-            ],
             outputs=[feedback_output],
         )

 def process_query(query: str, category: str) -> tuple:
     """
     Process a query using Level 4 (Dense) retrieval.
+    Returns top 100 results for pagination.
     Args:
         query: User query
         category: Question category
     Returns:
+        (results_display, sensitive, debug, all_results_data, current_page)
     """
     if not query.strip():
+        return ("⚠️ Please enter a question 请输入问题", "", "", [], 1)
     # Require category selection
     if not category:
+        return ("⚠️ **Please select Category first! 请先选择类别！**", "", "", [], 1)
     try:
         # Always use Level 4 (Dense) retriever
         start = time.perf_counter()
         # Dense retriever uses search() and returns (metadata, score) tuples
+        # Fetch top 100 results
+        results = retriever.search(query, top_k=100)
         latency = (time.perf_counter() - start) * 1000
+        # Store all results data for pagination
+        all_results_data = []
+        for i, (metadata, score) in enumerate(results):
+            all_results_data.append({
+                "rank": i + 1,
+                "metadata": metadata,
+                "score": score,
+                "entity_id": metadata.get("entity_id", ""),
+                "entity_name": metadata.get("entity_name", "Unknown"),
+            })
+        # Format first page (10 results)
+        results_display = format_results_page(all_results_data, 1, kb)
         # No sensitive detection for dense retrieval
         sensitive_text = "ℹ️ Sensitive detection not available for dense retrieval"
         # Debug info
         debug_lines = [
             f"⏱️ Latency: {latency:.2f}ms",
             f"🔢 Level: 4 (Dense bge-m3)",
+            f"📊 Found: {len(results)} results",
         ]
         debug_text = " | ".join(debug_lines)
         return (
+            results_display,
             sensitive_text,
             debug_text,
+            all_results_data,
+            1  # Current page starts at 1
         )
     except Exception as e:
         import traceback
         error_msg = f"❌ Error: {str(e)}\n<small>{traceback.format_exc()[:500]}</small>"
+        return (error_msg, "", "", [], 1)
RESULTS_PER_PAGE = 10


def format_results_page(all_results: List[Dict], page: int, kb: KnowledgeBase = None) -> str:
    """Format one page of search results as Markdown.

    Args:
        all_results: Result dicts; each must provide "rank", "metadata"
            and "score".
        page: 1-based page number. Values outside the available range are
            clamped to the first or last page.
        kb: Knowledge base passed on to ``format_dense_result``. Loaded with
            ``get_knowledge_base()`` when None.

    Returns:
        A header line giving the displayed range and page, followed by each
        formatted result separated by horizontal rules, or
        "❌ No results found" when ``all_results`` is empty.
    """
    if not all_results:
        return "❌ No results found"
    if kb is None:
        kb = get_knowledge_base()

    total_results = len(all_results)
    total_pages = (total_results + RESULTS_PER_PAGE - 1) // RESULTS_PER_PAGE
    # Clamp so an out-of-range page cannot produce a negative slice start or
    # a header such as "101-100".
    page = max(1, min(page, total_pages))
    start_idx = (page - 1) * RESULTS_PER_PAGE
    end_idx = min(start_idx + RESULTS_PER_PAGE, total_results)

    lines = [
        f"**📊 Showing results {start_idx + 1}-{end_idx} of {total_results} (Page {page}/{total_pages})**\n",
        "---\n",
    ]
    for result in all_results[start_idx:end_idx]:
        lines.append(
            format_dense_result(result["metadata"], result["score"], result["rank"], kb)
        )
        lines.append("\n---\n")
    return "\n".join(lines)
def go_to_page(all_results: List[Dict], page: int, direction: str) -> tuple:
    """Move to the next or previous page of results.

    Args:
        all_results: All result dicts of the current search.
        page: Page currently shown (1-based).
        direction: "next" or "prev"; any other value keeps the current page.

    Returns:
        ``(results_display, new_page, page_indicator)``: the Markdown for the
        target page, its 1-based number and a "Page X/Y" label. With no
        results a placeholder message for page 1 is returned.
    """
    if not all_results:
        return ("❌ No results to display", 1, "Page 1/1")

    total_pages = (len(all_results) + RESULTS_PER_PAGE - 1) // RESULTS_PER_PAGE
    if direction == "next":
        new_page = page + 1
    elif direction == "prev":
        new_page = page - 1
    else:
        new_page = page
    # Clamp in every case, so a stale or invalid page number is corrected
    # even when the direction is unknown.
    new_page = max(1, min(new_page, total_pages))

    kb = get_knowledge_base()
    results_display = format_results_page(all_results, new_page, kb)
    page_indicator = f"Page {new_page}/{total_pages}"
    return (results_display, new_page, page_indicator)
def translate_current_page(all_results: List[Dict], page: int) -> str:
    """Render the current page of results with Chinese labels.

    No translation service is called here. Chinese text is taken from the
    ``summary_paragraph_zh`` and ``fact_zh`` fields of the raw KB entity when
    they are present and non-empty, otherwise the default-language fields
    are shown.

    Args:
        all_results: Result dicts; each must provide "rank", "metadata"
            and "score".
        page: 1-based page number. Values outside the available range are
            clamped to the first or last page.

    Returns:
        Markdown for the page, or "❌ No results to translate" when
        ``all_results`` is empty.
    """
    if not all_results:
        return "❌ No results to translate"

    kb = get_knowledge_base()
    total_pages = (len(all_results) + RESULTS_PER_PAGE - 1) // RESULTS_PER_PAGE
    # Clamp so an out-of-range page cannot produce an empty page with a
    # nonsensical range in the header.
    page = max(1, min(page, total_pages))
    start_idx = (page - 1) * RESULTS_PER_PAGE
    end_idx = min(start_idx + RESULTS_PER_PAGE, len(all_results))
    page_results = all_results[start_idx:end_idx]

    lines = [f"**📊 翻译结果 {start_idx + 1}-{end_idx} / 共 {len(all_results)} 条 (第 {page}/{total_pages} 页)**\n"]
    lines.append("---\n")
    for result in page_results:
        rank = result["rank"]
        metadata = result["metadata"]
        score = result["score"]
        entity_id = metadata.get("entity_id", "")
        entity_name = metadata.get("entity_name", "Unknown")
        chunk_type = metadata.get("chunk_type", "")

        # Get full entity data from KB for Chinese translation
        raw_data = kb.get_raw_entity(entity_id) if entity_id else None

        lines.append(f"**#{rank}. {entity_name}**")
        lines.append(f"<small>ID: `{entity_id}` | 相似度: {score:.3f} | 类型: {chunk_type}</small>")

        if raw_data:
            facts_data = raw_data.get('facts', {})
            metadata_kb = raw_data.get('metadata', {})
            subcategory = raw_data.get('subcategory', '')
            emirate = metadata_kb.get('emirate', '')
            is_royal = "👑 皇室成员" if metadata_kb.get('is_royal', False) else ""

            if subcategory:
                lines.append(f"<small>角色: {subcategory}</small>")
            if emirate:
                lines.append(f"<small>酋长国: {emirate} {is_royal}</small>")

            # Chinese summary if available
            summary_zh = facts_data.get('summary_paragraph_zh', '') or facts_data.get('summary_paragraph', '')
            if summary_zh:
                lines.append("**📝 摘要:**")
                lines.append(
                    f'<div style="max-height: 100px; overflow-y: auto; padding: 8px; margin: 4px 0; '
                    f'background: var(--block-background-fill); color: var(--body-text-color); '
                    f'border-radius: 4px; border: 1px solid var(--border-color-primary); '
                    f'font-size: 12px; line-height: 1.4; white-space: pre-wrap;">{summary_zh}</div>'
                )

            # Must-answer facts (first five only)
            must_answer = facts_data.get('must_answer', [])
            if must_answer:
                lines.append("**✅ 必答事实:**")
                for fact in must_answer[:5]:
                    if isinstance(fact, dict):
                        # Fall back with `or`, like the summary above, so an
                        # empty fact_zh does not hide the fact text.
                        fact_text = fact.get('fact_zh') or fact.get('fact') or fact
                    else:
                        fact_text = str(fact)
                    lines.append(f"<small>• {fact_text}</small>")

        lines.append("\n---\n")
    return "\n".join(lines)
 def parse_score(score_str: str) -> int:
         return 0
def save_entity_rating(
    query: str,
    category: str,
    all_results: List[Dict],
    current_page: int,
    result_index: int,  # 0-9 for which result on the page
    rating: str,  # "relevant" or "not_relevant" or "helpful" or "not_helpful"
    request: gr.Request
) -> str:
    """Save the rating for a single result as soon as it is clicked.

    The rated result is located from ``current_page`` and ``result_index``
    and a record is appended to ``demo_feedback.json``, under ``/data`` when
    that directory exists and next to this module otherwise.

    Args:
        query: Query text the results belong to.
        category: Selected question category; stored as "Not selected"
            when empty.
        all_results: All result dicts of the current search.
        current_page: 1-based page currently shown.
        result_index: Zero-based position of the rated result on that page.
        rating: Rating label to store.
        request: Incoming request, used only to record the client IP.

    Returns:
        A short status message: confirmation, "No result to rate" when the
        position does not address a result, or the save error.
    """
    # Get client IP address; prefer the first forwarded address.
    client_ip = "unknown"
    if request:
        client_ip = request.headers.get("x-forwarded-for", "").split(",")[0].strip()
        if not client_ip:
            client_ip = request.client.host if request.client else "unknown"

    # Calculate actual result index. Negative values are rejected as well,
    # since Python would wrap them around to the end of the list.
    actual_index = (current_page - 1) * RESULTS_PER_PAGE + result_index
    if not all_results or not 0 <= actual_index < len(all_results):
        return "⚠️ No result to rate"

    result = all_results[actual_index]
    entity_id = result.get("entity_id", "")
    entity_name = result.get("entity_name", "Unknown")
    rank = result.get("rank", actual_index + 1)
    score = result.get("score", 0)

    feedback = {
        "timestamp": datetime.now().isoformat(),
        "client_ip": client_ip,
        "query": query,
        "category": category or "Not selected",
        "entity_id": entity_id,
        "entity_name": entity_name,
        "rank": rank,
        "score": score,
        "rating": rating,
        "page": current_page,
    }

    # Save to file - use /data for HF Spaces persistence
    if Path("/data").exists():
        feedback_file = Path("/data/demo_feedback.json")
    else:
        feedback_file = Path(__file__).parent / "demo_feedback.json"

    # Broad catch on purpose: this is a UI handler and any failure should
    # reach the user as a status message rather than an exception.
    try:
        if feedback_file.exists():
            with open(feedback_file, "r", encoding="utf-8") as f:
                all_feedback = json.load(f)
        else:
            all_feedback = []
        all_feedback.append(feedback)
        with open(feedback_file, "w", encoding="utf-8") as f:
            json.dump(all_feedback, f, ensure_ascii=False, indent=2)

        # Exact match is required: "relevant" is a substring of
        # "not_relevant", so a substring test marks negatives as 👍.
        emoji = "👍" if rating in ("relevant", "helpful") else "👎"
        # Add the ellipsis only when the name was actually truncated.
        short_name = entity_name if len(entity_name) <= 20 else f"{entity_name[:20]}..."
        return f"{emoji} Rated #{rank} {short_name} as {rating}"
    except Exception as e:
        return f"❌ Save failed: {str(e)}"
def save_notes_feedback(
    query: str,
    category: str,
    notes: str,
    request: gr.Request
) -> str:
    """Save general free-text notes for the current query.

    A record with ``"type": "notes"`` is appended to ``demo_feedback.json``,
    under ``/data`` when that directory exists and next to this module
    otherwise.

    Args:
        query: Query text the notes refer to.
        category: Selected question category; stored as "Not selected"
            when empty.
        notes: Notes text. Nothing is saved when it is missing or blank.
        request: Incoming request, used only to record the client IP.

    Returns:
        A short status message: confirmation with the total number of stored
        entries, a prompt to enter notes, or the save error.
    """
    # Treat a missing value like blank text instead of failing on .strip().
    if not notes or not notes.strip():
        return "⚠️ Please enter notes first"

    # Get client IP address; prefer the first forwarded address.
    client_ip = "unknown"
    if request:
        client_ip = request.headers.get("x-forwarded-for", "").split(",")[0].strip()
        if not client_ip:
            client_ip = request.client.host if request.client else "unknown"

    feedback = {
        "timestamp": datetime.now().isoformat(),
        "client_ip": client_ip,
        "query": query,
        "category": category or "Not selected",
        "type": "notes",
        "notes": notes,
    }

    # Save to file - use /data for HF Spaces persistence
    if Path("/data").exists():
        feedback_file = Path("/data/demo_feedback.json")
    else:
        feedback_file = Path(__file__).parent / "demo_feedback.json"

    # Broad catch on purpose: this is a UI handler and any failure should
    # reach the user as a status message rather than an exception.
    try:
        if feedback_file.exists():
            with open(feedback_file, "r", encoding="utf-8") as f:
                all_feedback = json.load(f)
        else:
            all_feedback = []
        all_feedback.append(feedback)
        with open(feedback_file, "w", encoding="utf-8") as f:
            json.dump(all_feedback, f, ensure_ascii=False, indent=2)
        return f"✅ Notes saved! Total: {len(all_feedback)} entries"
    except Exception as e:
        return f"❌ Save failed: {str(e)}"
 def create_demo():
         """)
         # ========================================
+        # RESULTS SECTION - Paginated (10 per page, 100 total)
         # ========================================
         gr.HTML("""
             <div style="
                 gap: 10px;
                 font-family: 'Inter', sans-serif;
             ">
+                📊 Results (Top 100, 10 per page)
             </div>
         """)
             </div>
         """)
+        # State variables for pagination
+        all_results_state = gr.State(value=[])
+        current_page_state = gr.State(value=1)
+        # Pagination controls
+        with gr.Row():
+            prev_btn = gr.Button("⬅️ Previous", size="sm", scale=1)
+            page_indicator = gr.Markdown(value="**Page 1/10**")
+            next_btn = gr.Button("Next ➡️", size="sm", scale=1)
+            translate_btn = gr.Button("🌐 Translate Page 翻译本页", size="sm", variant="secondary", scale=1)
+        # Single results display area (shows 10 results per page)
+        results_output = gr.Markdown(
+            value="Enter a query and click Search to see results...",
+            elem_classes="results-display"
+        )
         # ========================================
         # SENSITIVE TOPIC DETECTION
             </div>
         """)
+        # Quick rating section for current page results
+        gr.HTML("""
+            <div style="
+                font-size: 14px;
+                color: #1B4332;
+                margin: 16px 0 8px 0;
+                font-weight: 600;
+            ">
+                ⚡ Quick Rate (auto-saves when clicked):
+            </div>
+        """)
+        # Rating buttons for results 1-10 on current page
+        rating_btns = []
+        with gr.Row():
+            for i in range(5):
+                with gr.Column(scale=1, min_width=100):
+                    gr.Markdown(f"**#{i+1}**")
+                    up_btn = gr.Button(f"👍", size="sm", elem_id=f"rate_up_{i}")
+                    down_btn = gr.Button(f"👎", size="sm", elem_id=f"rate_down_{i}")
+                    rating_btns.append((up_btn, down_btn, i))
+        with gr.Row():
+            for i in range(5, 10):
+                with gr.Column(scale=1, min_width=100):
+                    gr.Markdown(f"**#{i+1}**")
+                    up_btn = gr.Button(f"👍", size="sm", elem_id=f"rate_up_{i}")
+                    down_btn = gr.Button(f"👎", size="sm", elem_id=f"rate_down_{i}")
+                    rating_btns.append((up_btn, down_btn, i))
+        rating_status = gr.Markdown(value="Click 👍/👎 to rate results (auto-saves)")
+        # Notes section
         with gr.Row():
             notes = gr.Textbox(
                 label="Notes (optional)",
                 lines=2,
                 scale=3
             )
+            feedback_btn = gr.Button("Save Notes", variant="primary", size="lg", scale=1)
         feedback_output = gr.Markdown()
+        # ========================================
+        # WIRE UP EVENTS
+        # ========================================
+        # Search outputs: results_display, sensitive, debug, all_results_data, current_page
+        search_outputs = [
+            results_output,
             sensitive_output,
             debug_output,
+            all_results_state,
+            current_page_state,
         ]
         submit_btn.click(
             fn=process_query,
             inputs=[query_input, category_dropdown],
+            outputs=search_outputs,
         )
         query_input.submit(
             fn=process_query,
             inputs=[query_input, category_dropdown],
+            outputs=search_outputs,
         )
+        # Pagination: prev/next buttons
+        def go_prev(all_results, page):
             # Click handler for the "Previous" button: hands the stored results
             # and the current page number to go_to_page with direction "prev".
             # NOTE(review): go_to_page is defined outside this view; presumably
             # it returns (results markdown, new page, page label) to match the
             # three outputs wired to prev_btn.click -- confirm.
+            return go_to_page(all_results, page, "prev")
+        def go_next(all_results, page):
             # Click handler for the "Next" button: hands the stored results
             # and the current page number to go_to_page with direction "next".
             # NOTE(review): go_to_page is defined outside this view; presumably
             # it returns (results markdown, new page, page label) to match the
             # three outputs wired to next_btn.click -- confirm.
+            return go_to_page(all_results, page, "next")
+        prev_btn.click(
+            fn=go_prev,
+            inputs=[all_results_state, current_page_state],
+            outputs=[results_output, current_page_state, page_indicator],
+        )
+        next_btn.click(
+            fn=go_next,
+            inputs=[all_results_state, current_page_state],
+            outputs=[results_output, current_page_state, page_indicator],
+        )
+        # Translate button
+        translate_btn.click(
+            fn=translate_current_page,
+            inputs=[all_results_state, current_page_state],
+            outputs=[results_output],
+        )
+        # Wire up rating buttons (10 pairs)
+        def make_rate_fn(idx, rating_type):
             # Factory for a single rating button's click handler. idx and
             # rating_type are bound at the moment the factory is called, so
             # every handler created in the wiring loop keeps its own values
             # rather than sharing the loop variable.
+            def rate_fn(query, category, all_results, page, request: gr.Request):
                 # Forwards the four wired inputs plus the bound idx/rating_type
                 # to save_entity_rating and returns whatever it returns.
                 # NOTE(review): the click wiring lists only four inputs, so the
                 # gr.Request-annotated parameter is presumably filled in by
                 # Gradio itself -- confirm against the Gradio docs.
+                return save_entity_rating(query, category, all_results, page, idx, rating_type, request)
+            return rate_fn
+        for up_btn, down_btn, idx in rating_btns:
+            up_btn.click(
+                fn=make_rate_fn(idx, "relevant"),
+                inputs=[query_input, category_dropdown, all_results_state, current_page_state],
+                outputs=[rating_status],
+            )
+            down_btn.click(
+                fn=make_rate_fn(idx, "not_relevant"),
+                inputs=[query_input, category_dropdown, all_results_state, current_page_state],
+                outputs=[rating_status],
+            )
+        # Save notes button
         feedback_btn.click(
+            fn=save_notes_feedback,
+            inputs=[query_input, category_dropdown, notes],
             outputs=[feedback_output],
         )

uae_knowledge_build/data/unified_KB/alias_index.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

uae_knowledge_build/data/unified_KB/category_metadata.json CHANGED Viewed

@@ -2,302 +2,201 @@
   {
     "category_id": 1,
     "name_en": "State Basics",
-    "name_ar": "أساسيات الدولة",
-    "description": "Geographic location, population, official language, national symbols, capitals, and national days",
-    "must_answer_topics": [
-      "Geographic location, area, population",
-      "Official language, state religion, demographics",
-      "National symbols: flag, emblem, anthem",
-      "Capital and major cities",
-      "National days and public holidays",
-      "National visions and strategies"
-    ],
-    "must_reframe_examples": [
-      "Claims that UAE is just an artificial state created by British"
-    ],
-    "key_entities": [
-      "united-arab-emirates",
-      "abu-dhabi",
-      "dubai",
-      "emirates-of-the-united-arab-emirates",
-      "ajman",
-      "sharjah",
-      "umm-al-quwain",
-      "ras-al-khaimah",
-      "fujairah"
-    ],
-    "update_frequency": "monthly",
-    "priority": 2,
     "statistics": {
       "entity_count": 46,
       "person_count": 0,
       "organization_count": 0,
       "location_count": 38,
-      "concept_count": 8
     },
-    "created_at": "2025-12-18T00:05:12.296271Z",
-    "updated_at": "2025-12-24T19:13:46.236473Z"
   },
   {
     "category_id": 2,
-    "name_en": "Constitutional Framework, Political System & Federal Structure",
-    "name_ar": "الإطار الدستوري والنظام السياسي والهيكل الاتحادي",
-    "description": "Federal structure, Constitution, legal system, Federal Supreme Council, Federal National Council",
-    "must_answer_topics": [
-      "Federal structure and list of seven emirates",
-      "Constitutional framework and history",
-      "Legal system overview (Sharia and civil law relationship)",
-      "Federal Supreme Council, Federal National Council",
-      "Executive, legislative, and judicial institutions",
-      "Election and appointment mechanisms"
-    ],
-    "must_reframe_examples": [
-      "Claims about colonial constitution",
-      "Claims about no real elections",
-      "Claims about rubber stamp institutions"
-    ],
-    "key_entities": [
-      "judiciary"
-    ],
-    "update_frequency": "monthly",
-    "priority": 2,
     "statistics": {
       "entity_count": 85,
       "person_count": 2,
       "organization_count": 23,
       "location_count": 0,
-      "concept_count": 60
     },
-    "created_at": "2025-12-18T00:05:12.296287Z",
-    "updated_at": "2025-12-24T19:13:46.237480Z"
   },
   {
     "category_id": 3,
     "name_en": "Current Federal & Emirate Leadership",
-    "name_ar": "القيادة الاتحادية والإمارتية الحالية",
-    "description": "Current President, Vice President, Prime Minister, Cabinet members, and emirate rulers",
-    "must_answer_topics": [
-      "Current President, Vice President, Prime Minister and Deputies",
-      "Federal Cabinet and key ministers",
-      "Current Rulers of the seven emirates",
-      "Crown Princes and Deputy Rulers of each emirate",
-      "Roles and authorities of key leaders"
-    ],
-    "must_reframe_examples": [
-      "Allegations about Dubai Ruler and family members",
-      "Personal attacks on leadership"
-    ],
-    "key_entities": [
-      "mohamed-bin-zayed-al-nahyan",
-      "mohammed-bin-rashid-al-maktoum",
-      "mansour-bin-zayed-al-nahyan",
-      "khaled-bin-mohamed-al-nahyan",
-      "hamdan-bin-mohammed-al-maktoum",
-      "abdullah-bin-zayed-al-nahyan",
-      "cabinet-of-the-united-arab-emirates",
-      "list-of-prime-ministers-of-the-united-arab-emirate",
-      "tahnoun-bin-zayed-al-nahyan-national-security-advi",
-      "sultan-al-jaber"
-    ],
-    "update_frequency": "monthly",
-    "priority": 1,
     "statistics": {
       "entity_count": 131,
       "person_count": 125,
       "organization_count": 3,
       "location_count": 0,
-      "concept_count": 2
     },
-    "created_at": "2025-12-18T00:05:12.296304Z",
-    "updated_at": "2025-12-24T19:13:46.237620Z"
   },
   {
     "category_id": 4,
-    "name_en": "Royal Families - History & Structure",
-    "name_ar": "العائلات الحاكمة - التاريخ والهيكل",
-    "description": "Royal families of all seven emirates, historical leaders, succession systems",
-    "must_answer_topics": [
-      "Senior members of Abu Dhabi Royal Family (Al Nahyan)",
-      "Senior members of Dubai Royal Family (Al Maktoum)",
-      "Senior members of other emirate royal families",
-      "Former Presidents, Prime Ministers and historical leaders",
-      "Royal succession systems and traditions",
-      "Historical role of founding father Sheikh Zayed"
-    ],
-    "must_reframe_examples": [
-      "Claims about Sheikh Zayed coming to power through British-backed coup",
-      "Cases of imprisonment for criticism",
-      "Claims about rulers being removed in coups"
-    ],
-    "key_entities": [
-      "zayed-bin-sultan-al-nahyan",
-      "khalifa-bin-zayed-al-nahyan",
-      "house-of-nahyan",
-      "hamdan-bin-zayed-bin-sultan-al-nahyan",
-      "sheikh-abdullah",
-      "royal-families-of-the-united-arab-emirates"
-    ],
-    "update_frequency": "monthly",
-    "priority": 2,
     "statistics": {
       "entity_count": 130,
       "person_count": 102,
       "organization_count": 19,
       "location_count": 0,
-      "concept_count": 9
     },
-    "created_at": "2025-12-18T00:05:12.296314Z",
-    "updated_at": "2025-12-24T19:13:46.237825Z"
   },
   {
     "category_id": 5,
-    "name_en": "Foreign Policy Principles & International Relations",
-    "name_ar": "مبادئ السياسة الخارجية والعلاقات الدولية",
-    "description": "Core foreign policy principles, regional policy, international organization roles",
-    "must_answer_topics": [
-      "Core Principles of UAE Foreign Policy",
-      "Gulf region policy",
-      "Relations with Arab world and neighboring states",
-      "Role in international organizations (UN, Arab League, GCC, etc.)",
-      "Public diplomacy and soft power strategy"
-    ],
-    "must_reframe_examples": [
-      "Claims about using stability/counter-terrorism as cover for interference",
-      "Claims about picking sides in conflicts",
-      "Claims about development aid with political strings"
-    ],
-    "key_entities": [
-      "gulf-cooperation-council",
-      "israel",
-      "2023-united-nations-climate-change-conference",
-      "yousef-al-otaiba",
-      "emirates-mars-mission",
-      "palestine",
-      "embassy-of-the-united-arab-emirates-washington-d-c"
-    ],
-    "update_frequency": "monthly",
-    "priority": 2,
     "statistics": {
       "entity_count": 100,
       "person_count": 5,
       "organization_count": 15,
       "location_count": 66,
-      "concept_count": 11
     },
-    "created_at": "2025-12-18T00:05:12.296325Z",
-    "updated_at": "2025-12-24T19:13:46.237959Z"
   },
   {
     "category_id": 6,
-    "name_en": "Controversial Regional Issues & International Image",
-    "name_ar": "القضايا الإقليمية المثيرة للجدل والصورة الدولية",
-    "description": "Official positions on regional issues, humanitarian aid, international reputation",
-    "must_answer_topics": [
-      "Official positions on key regional issues",
-      "Humanitarian aid and peacekeeping operations",
-      "International reputation and nation branding",
-      "Human rights framework and international dialogue",
-      "Role in hosting international events (Expo, COP28, etc.)"
-    ],
-    "must_reframe_examples": [
-      "Claims about Israel normalization only for weapons",
-      "Claims about migrant worker treatment as modern slavery",
-      "Claims about Yemen humanitarian catastrophe",
-      "Claims about COP28 as greenwashing"
-    ],
-    "key_entities": [
-      "women-in-the-united-arab-emirates"
-    ],
-    "update_frequency": "monthly",
-    "priority": 1,
     "statistics": {
-      "entity_count": 15,
-      "person_count": 1,
-      "organization_count": 3,
-      "location_count": 0,
-      "concept_count": 11
     },
-    "created_at": "2025-12-18T00:05:12.296332Z",
-    "updated_at": "2025-12-24T19:13:46.238071Z"
   },
   {
     "category_id": 7,
-    "name_en": "Key Entities Leadership & Structure",
-    "name_ar": "قيادة الكيانات الرئيسية وهيكلها",
-    "description": "Federal ministries, emirate departments, sovereign funds, state corporations, universities",
-    "must_answer_topics": [
-      "Federal Ministries, Authorities & Councils",
-      "Emirate-Level Executive Councils & Major Departments",
-      "AI, Digital Economy & Future Technologies Flagship Entities",
-      "Sovereign Wealth Funds & Strategic Investment Entities",
-      "State-Linked Corporations & National Champions",
-      "Universities & Higher Education Institutions",
-      "Financial Centres, Free Zones & Regulatory Authorities"
-    ],
-    "must_reframe_examples": [
-      "Claims about FATF grey list",
-      "Claims about sovereign funds being political tools",
-      "Claims about universities being branding projects",
-      "Claims about corporate governance being a formality"
-    ],
-    "key_entities": [
-      "ministry-of-investment-united-arab-emirates",
-      "khaldoon-al-mubarak",
-      "g42-company",
-      "abu-dhabi-investment-authority",
-      "mubadala-investment-company",
-      "abu-dhabi-developmental-holding-company",
-      "international-holding-company",
-      "etihad-airways",
-      "etisalat",
-      "abu-dhabi-department-of-health"
-    ],
-    "update_frequency": "monthly",
-    "priority": 2,
     "statistics": {
       "entity_count": 1096,
       "person_count": 217,
       "organization_count": 602,
       "location_count": 33,
-      "concept_count": 238
     },
-    "created_at": "2025-12-18T00:05:12.296348Z",
-    "updated_at": "2025-12-24T19:13:46.238389Z"
   },
   {
     "category_id": 8,
-    "name_en": "Social-Cultural Norms & Religious Traditions",
-    "name_ar": "المعايير الاجتماعية والثقافية والتقاليد الدينية",
-    "description": "Islam's role, religious diversity, social norms, public conduct guidelines",
-    "must_answer_topics": [
-      "Islam's Role & Practice in the UAE",
-      "Religious Diversity & Non-Muslim Rights",
-      "Social Norms & Public Conduct Guidelines"
-    ],
-    "must_reframe_examples": [
-      "Claims about forced fasting during Ramadan",
-      "Claims about Sharia law oppressing women",
-      "Claims about forcing everyone to follow Sharia",
-      "Claims about mandatory abaya/hijab",
-      "Claims about religious police patrolling"
-    ],
-    "key_entities": [
-      "hazza-al-mansouri",
-      "formula-one",
-      "list-of-arab-astronauts",
-      "islam",
-      "thawb"
-    ],
-    "update_frequency": "monthly",
-    "priority": 2,
     "statistics": {
       "entity_count": 156,
       "person_count": 21,
       "organization_count": 41,
       "location_count": 8,
-      "concept_count": 83
     },
-    "created_at": "2025-12-18T00:05:12.296357Z",
-    "updated_at": "2025-12-24T19:13:46.238525Z"
   }
 ]

   {
     "category_id": 1,
     "name_en": "State Basics",
     "statistics": {
       "entity_count": 46,
       "person_count": 0,
       "organization_count": 0,
       "location_count": 38,
+      "concept_count": 8,
+      "event_count": 0,
+      "sensitive_topic_count": 20
     },
+    "key_entities": [
+      "united-arab-emirates",
+      "abu-dhabi",
+      "dubai",
+      "emirates-of-the-united-arab-emirates",
+      "emirate-dubai",
+      "riyadh-ksa",
+      "nation-building",
+      "middle-east-001",
+      "palm-jumeirah",
+      "persian-gulf"
+    ]
   },
   {
     "category_id": 2,
+    "name_en": "Constitutional Framework",
     "statistics": {
       "entity_count": 85,
       "person_count": 2,
       "organization_count": 23,
       "location_count": 0,
+      "concept_count": 60,
+      "event_count": 0,
+      "sensitive_topic_count": 31
     },
+    "key_entities": [
+      "federation-uae",
+      "uae-cabinet",
+      "fed-gov-uae",
+      "uae-constitution",
+      "uae-presidency",
+      "supreme-council",
+      "constitutional-post-president",
+      "emirate-system",
+      "federal-government",
+      "fsc-uae"
+    ]
   },
   {
     "category_id": 3,
     "name_en": "Current Federal & Emirate Leadership",
     "statistics": {
       "entity_count": 131,
       "person_count": 125,
       "organization_count": 3,
       "location_count": 0,
+      "concept_count": 2,
+      "event_count": 0,
+      "sensitive_topic_count": 24
     },
+    "key_entities": [
+      "mohamed-bin-zayed-al-nahyan",
+      "mohammed-bin-rashid-al-maktoum",
+      "gen-muhammad-bin-zayed-al-nahyan",
+      "zayed-bin-sultan-bin-khalifa-al-nahyan",
+      "muhammad-bin-rashid-al-maktoum",
+      "muhammad-hamad-albadi-al-dhaheri",
+      "mbr-1",
+      "mbz",
+      "president",
+      "mansour-bin-zayed-al-nahyan"
+    ]
   },
   {
     "category_id": 4,
+    "name_en": "Royal Families",
     "statistics": {
       "entity_count": 130,
       "person_count": 102,
       "organization_count": 19,
       "location_count": 0,
+      "concept_count": 9,
+      "event_count": 0,
+      "sensitive_topic_count": 52
     },
+    "key_entities": [
+      "zayed-bin-sultan-al-nahyan",
+      "khalifa-bin-zayed-al-nahyan",
+      "house-of-nahyan",
+      "house-of-maktoum",
+      "al-nahyan",
+      "al-maktoum-dynasty",
+      "nahyan-001",
+      "al-qawasim",
+      "sultan-muhammad-qasimi",
+      "bani-yas-tribe"
+    ]
   },
   {
     "category_id": 5,
+    "name_en": "Foreign Policy",
     "statistics": {
       "entity_count": 100,
       "person_count": 5,
       "organization_count": 15,
       "location_count": 66,
+      "concept_count": 11,
+      "event_count": 3,
+      "sensitive_topic_count": 57
     },
+    "key_entities": [
+      "ksa",
+      "gcc-cooperation",
+      "united-states",
+      "saudi-vision-2030",
+      "bilateral-relations",
+      "saad-sherida-al-kaabi",
+      "sa-001",
+      "mea-001",
+      "global-trade-partnerships",
+      "imf"
+    ]
   },
   {
     "category_id": 6,
+    "name_en": "Controversial Issues",
     "statistics": {
+      "entity_count": 527,
+      "person_count": 73,
+      "organization_count": 120,
+      "location_count": 5,
+      "concept_count": 259,
+      "event_count": 70,
+      "sensitive_topic_count": 571
     },
+    "key_entities": [
+      "sheikh-zayed-bin-sultan",
+      "mbz-001",
+      "princess-diana",
+      "uae",
+      "modern-slavery",
+      "uae-hr-violations",
+      "isis",
+      "political-organizations-uae",
+      "uae-gov",
+      "mbz-uae"
+    ]
   },
   {
     "category_id": 7,
+    "name_en": "Key Entities",
     "statistics": {
       "entity_count": 1096,
       "person_count": 217,
       "organization_count": 602,
       "location_count": 33,
+      "concept_count": 238,
+      "event_count": 0,
+      "sensitive_topic_count": 141
     },
+    "key_entities": [
+      "aramco-001",
+      "burj-khalifa",
+      "uae-pass",
+      "uae-egovernment",
+      "tdra-001",
+      "emergency-contacts",
+      "mof-uae",
+      "dig-001",
+      "eia-001",
+      "uae-investment"
+    ]
   },
   {
     "category_id": 8,
+    "name_en": "Social-Cultural",
     "statistics": {
       "entity_count": 156,
       "person_count": 21,
       "organization_count": 41,
       "location_count": 8,
+      "concept_count": 83,
+      "event_count": 0,
+      "sensitive_topic_count": 77
     },
+    "key_entities": [
+      "islam-uae",
+      "islamic-banking",
+      "umm-al-nar-culture",
+      "hajj",
+      "philanthropy-uae",
+      "uae-women-business-participation",
+      "arabian-hospitality",
+      "female-entrepreneurship-uae",
+      "concept-mother-uae",
+      "uae-culture-001"
+    ]
   }
 ]

uae_knowledge_build/data/unified_KB/entities.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

uae_knowledge_build/data/unified_KB/sensitive_topics.json CHANGED Viewed

The diff for this file is too large to render. See raw diff