Spaces:

JJS341
/

Coreference-Bot

Running

App Files Community

JJS341 committed 26 days ago

Commit

d6000e4

verified ·

1 Parent(s): 6b87ab3

Update app.py

Browse files

Files changed (1) hide show

app.py +27 -29

app.py CHANGED Viewed

@@ -1,10 +1,17 @@
 import os
 import sys
-# 1. 強制下載 Spacy 英文模型
 os.system(f"{sys.executable} -m spacy download en_core_web_sm")
-# 2. 解決新舊版本 Hub 相容性的 Mock 補丁
 try:
     import huggingface_hub
     if not hasattr(huggingface_hub, 'HfFolder'):
@@ -22,7 +29,7 @@ import spacy
 from fastcoref import FCoref
 from deep_translator import GoogleTranslator
-# 3. 初始化 Spacy NLP 詞性解析器與指代模型
 print("🚀 [System] 正在初始化 NLP 詞性解析器...")
 nlp = spacy.load("en_core_web_sm")
@@ -34,7 +41,7 @@ except:
     model = FCoref('biu-nlp/f-coref', device='cpu')
     print("✅ [System] 備用路徑加載成功！")
-# 4. 核心運算邏輯
 def coref_learning_pipeline(user_input):
     if not user_input.strip():
         return "等待輸入...", "等待輸入...", "等待輸入..."
@@ -42,56 +49,45 @@ def coref_learning_pipeline(user_input):
     try:
         # A. 判斷語言並進行中翻英橋接
         has_chinese = any('\u4e00' <= char <= '\u9fff' for char in user_input)
         if has_chinese:
             working_text = GoogleTranslator(source='zh-CN', target='en').translate(user_input)
             mode_notice = "中文輸入模式（已啟動 AI 跨語言橋接）"
-            # 💥 關鍵修正：如果原本輸入中文，這裡就輸出對應的「英文化語意空間」
-            translation_text = working_text
-            translation_label = "📖 完整文本翻譯 (中 ➔ 英)"
         else:
             working_text = user_input
             mode_notice = "英文原語模式"
-            # 如果原本輸入英文，這裡維持「英翻中」
-            translation_text = GoogleTranslator(source='en', target='zh-TW').translate(working_text)
-            translation_label = "📖 完整文本翻譯 (英 ➔ 中)"
         # B. 執行 AI 指代消解運算
         preds = model.predict(texts=[working_text])
         clusters = preds[0].get_clusters()
-        # C. 欄位一：生成「英翻中結果」
-        translation_text = GoogleTranslator(source='en', target='zh-TW').translate(working_text)
-        # D. 💥 欄位二：全新重構【AI 智慧單字本】（利用詞性精準抓取名詞，消滅人名）
         vocab_output = ""
         doc = nlp(working_text)
         extracted_words = set()
-        # E. 欄位三：生成「AI 語意共指報告」
-        report_text = f"✨ 系統狀態：{mode_notice}\n"
-        report_text += f"📝 英文運算空間: {working_text}\n"
         for token in doc:
-            # 只抓普通名詞 (NOUN)，排除專有名詞/人名 (PROPN) 與代名詞 (PRON)
             if token.pos_ == "NOUN" and len(token.text) > 2:
-                # 統一轉成單數原型原型，畫面更漂亮（例如把 lambs 變成 lamb）
                 extracted_words.add(token.lemma_.lower())
         if extracted_words:
             for word in sorted(extracted_words):
                 try:
-                    # 翻成繁體中文
                     word_zh = GoogleTranslator(source='en', target='zh-TW').translate(word)
-                    # 輸出格式：【Farmer ➔ 農夫】
                     vocab_output += f"🔸 {word.capitalize()} ➔ {word_zh}\n"
                 except:
                     pass
         else:
             vocab_output = "ℹ️ 未偵測到適合學習的核心英文單字。"
-        # E. 欄位三：生成「AI 語意共指報告」
         report_text = f"✨ 系統狀態：{mode_notice}\n"
         report_text += f"📝 英文運算空間: {working_text}\n"
         report_text += "-----------------------------------------\n"
@@ -109,31 +105,33 @@ def coref_learning_pipeline(user_input):
                 report_text += f" 🔗 鏈結 {i+1} (中): {cluster_str_zh}\n"
                 report_text += f"    └─ (英): {cluster_str_en}\n"
         return translation_text, vocab_output, report_text
     except Exception as e:
         return f"錯誤: {str(e)}", "無法整合單字", f"運行異常: {str(e)}"
-# 5. 精美 UI 介面設計
 with gr.Blocks(theme=gr.themes.Soft(primary_hue="blue", secondary_hue="indigo")) as demo:
-    gr.Markdown("# 🤖 AI 跨語言智慧語意學習終端")
-    gr.Markdown("### 🚀 專案亮點：結合核心指代消解 (Coreference Resolution) 與 NLP 智慧名詞提取技術")
     with gr.Row():
         with gr.Column(scale=1):
             txt_input = gr.Textbox(
                 label="📥 請輸入中文或英文段落 (Input Text)",
-                placeholder="例如：Mary is a farmer. Mary has a little lamb.",
                 lines=5
             )
             btn_submit = gr.Button("🔥 執行多維度 AI 語意解析", variant="primary")
         with gr.Column(scale=1):
-            out_translation = gr.Textbox(label="📖 完整文本翻譯 (Translation)", lines=3)
-            # 這裡就是真正的智慧單字本！
             out_vocab = gr.Textbox(label="📚 AI 智慧單字本 (Vocabulary Booklet)", lines=5)
             out_report = gr.Textbox(label="🎯 AI 語意消解報告 (Coreference Report)", lines=5)
     btn_submit.click(
         fn=coref_learning_pipeline,
         inputs=txt_input,

 import os
 import sys
+import warnings
+import logging
+# 1. 抑制所有討厭的非同步與資源回收警告 (解決 ValueError: Invalid file descriptor: -1)
+warnings.filterwarnings("ignore", category=RuntimeWarning)
+warnings.filterwarnings("ignore", message="Exception ignored in")
+logging.getLogger("asyncio").setLevel(logging.ERROR)
+# 2. 強制下載 Spacy 英文模型
 os.system(f"{sys.executable} -m spacy download en_core_web_sm")
+# 3. 解決新舊版本 Hub 相容性的 Mock 補丁
 try:
     import huggingface_hub
     if not hasattr(huggingface_hub, 'HfFolder'):
 from fastcoref import FCoref
 from deep_translator import GoogleTranslator
+# 4. 初始化 Spacy NLP 詞性解析器與指代模型
 print("🚀 [System] 正在初始化 NLP 詞性解析器...")
 nlp = spacy.load("en_core_web_sm")
     model = FCoref('biu-nlp/f-coref', device='cpu')
     print("✅ [System] 備用路徑加載成功！")
+# 5. 核心運算邏輯
 def coref_learning_pipeline(user_input):
     if not user_input.strip():
         return "等待輸入...", "等待輸入...", "等待輸入..."
     try:
         # A. 判斷語言並進行中翻英橋接
         has_chinese = any('\u4e00' <= char <= '\u9fff' for char in user_input)
         if has_chinese:
             working_text = GoogleTranslator(source='zh-CN', target='en').translate(user_input)
             mode_notice = "中文輸入模式（已啟動 AI 跨語言橋接）"
+            # ✨ 關鍵修正：輸入中文時，完整文本翻譯欄位輸出「英文」
+            translation_text = f"【英文對照】\n{working_text}"
         else:
             working_text = user_input
             mode_notice = "英文原語模式"
+            # ✨ 關鍵修正：輸入英文時，完整文本翻譯欄位輸出「繁體中文」
+            translated_zh = GoogleTranslator(source='en', target='zh-TW').translate(working_text)
+            translation_text = f"【中文翻譯】\n{translated_zh}"
         # B. 執行 AI 指代消解運算
         preds = model.predict(texts=[working_text])
         clusters = preds[0].get_clusters()
+        # C. 建立【AI 智慧單字本】
         vocab_output = ""
         doc = nlp(working_text)
         extracted_words = set()
         for token in doc:
             if token.pos_ == "NOUN" and len(token.text) > 2:
                 extracted_words.add(token.lemma_.lower())
         if extracted_words:
             for word in sorted(extracted_words):
                 try:
                     word_zh = GoogleTranslator(source='en', target='zh-TW').translate(word)
                     vocab_output += f"🔸 {word.capitalize()} ➔ {word_zh}\n"
                 except:
                     pass
         else:
             vocab_output = "ℹ️ 未偵測到適合學習的核心英文單字。"
+        # D. 生成「AI 語意共指報告」
         report_text = f"✨ 系統狀態：{mode_notice}\n"
         report_text += f"📝 英文運算空間: {working_text}\n"
         report_text += "-----------------------------------------\n"
                 report_text += f" 🔗 鏈結 {i+1} (中): {cluster_str_zh}\n"
                 report_text += f"    └─ (英): {cluster_str_en}\n"
+        # 💥 這裡非常重要！必須依序回傳給前端的三個框框
         return translation_text, vocab_output, report_text
     except Exception as e:
         return f"錯誤: {str(e)}", "無法整合單字", f"運行異常: {str(e)}"
+# 6. 精美 UI 介面設計
 with gr.Blocks(theme=gr.themes.Soft(primary_hue="blue", secondary_hue="indigo")) as demo:
+    gr.Markdown("# 🤖 Janice's AI 跨語言智慧語意學習終端")
+    gr.Markdown("### 🚀 專題亮點：結合核心指代消解 (Coreference Resolution) 與 NLP 智慧名詞提取技術")
     with gr.Row():
         with gr.Column(scale=1):
             txt_input = gr.Textbox(
                 label="📥 請輸入中文或英文段落 (Input Text)",
+                placeholder="例如：Mary is a Farmer. Mary had a little lamb.",
                 lines=5
             )
             btn_submit = gr.Button("🔥 執行多維度 AI 語意解析", variant="primary")
         with gr.Column(scale=1):
+            # 前端三個輸出元件定義
+            out_translation = gr.Textbox(label="📖 完整文本翻譯/對照 (Translation/Context)", lines=3)
             out_vocab = gr.Textbox(label="📚 AI 智慧單字本 (Vocabulary Booklet)", lines=5)
             out_report = gr.Textbox(label="🎯 AI 語意消解報告 (Coreference Report)", lines=5)
+    # 點擊按鈕時，將三個輸出結果精準對接到各自的 Textbox 組件
     btn_submit.click(
         fn=coref_learning_pipeline,
         inputs=txt_input,