Spaces:

Maya0808
/

UserStudy2

Sleeping

App Files Community

Mayamaya committed on Jul 31, 2025

Commit

436f21d

1 Parent(s): 19edf05

ミスを発見

Browse files

Files changed (4) hide show

app.py +61 -18
combined_data/lapwing/texts/bounding_boxes.json +32 -0
logs/evaluation_ui_log_2025-07-31_11-17-08_603378.log +10 -0
results/P99/evaluation_results_P99_20250731_111915.json +112 -0

app.py CHANGED Viewed

@@ -1,17 +1,22 @@
 import os
 import sys
 import glob
 import json
 import random
-import re
 from functools import partial
 from datetime import datetime
 from collections import defaultdict, Counter
 import gradio as gr
 from loguru import logger
-# --- Global State (unchanged) ---
 GLOBAL_STATE = {
     "participant_id": None,
     "data_loaded": False,
@@ -28,9 +33,10 @@ GLOBAL_STATE = {
     "current_ranks": {},
     "current_absolute_score": None,
     "current_absolute_score_worst": None,
 }
-# --- Configuration (unchanged) ---
 BASE_RESULTS_DIR = "./results"
 LOG_DIR = "./logs"
 COMBINED_DATA_DIR = "./combined_data"
@@ -52,7 +58,34 @@ CRITERIA_GUIDANCE_EN = [
 IMAGE_LABELS = ['A', 'B', 'C', 'D', 'E']
-# --- Helper Functions (unchanged) ---
 def get_image_path_from_prediction(prediction: dict) -> str:
     if not GLOBAL_STATE["image_mapping"]:
         logger.error("Image mapping is not loaded.")
@@ -71,6 +104,15 @@ def get_image_path_from_prediction(prediction: dict) -> str:
 def load_evaluation_data(participant_id: str):
     mapping_path = os.path.join(COMBINED_DATA_DIR, MAPPING_FILENAME)
     if not os.path.exists(mapping_path):
         return f"<p class='feedback red'>Error: Mapping file not found at {mapping_path}</p>", gr.update(
@@ -182,8 +224,6 @@ def handle_absolute_score_worst_click(score):
 # --- UI Logic ---
-# ▼▼▼ 修正後の display_current_prompt_and_criterion 関数 ▼▼▼
 def display_current_prompt_and_criterion():
     if not GLOBAL_STATE["data_loaded"] or GLOBAL_STATE["current_prompt_index"] >= len(GLOBAL_STATE["all_eval_data"]):
         done_msg = "<p class='feedback green' style='text-align: center; font-size: 1.2em;'>All prompts have been evaluated! Please proceed to the 'Export' tab. <br>すべてのプロンプトの評価が完了しました！「エクスポート」タブに進んでください。</p>"
@@ -212,16 +252,11 @@ def display_current_prompt_and_criterion():
     criterion_name = CRITERIA[criterion_idx]
     progress_text = f"Prompt {GLOBAL_STATE['current_prompt_index'] + 1} / {len(GLOBAL_STATE['all_eval_data'])}  -  **{criterion_name}**"
-    # ▼▼▼ 修正1: プロンプト表示のフォントサイズを3倍に変更 ▼▼▼
     prompt_display_text = f"<p style='font-size: 3em; font-weight: bold;'>テキスト(TEXT): {prompt_text}</p>"
-    # ▼▼▼ 修正2: 統合された指示文を生成（注意文の変更） ▼▼▼
     guidance_part = (
         f"<p style='color: red; font-weight: bold; font-size: 1.1em;'>"
         f"5つの画像を、「{CRITERIA_GUIDANCE_JP[criterion_idx]}」を基準にランキングしてください。<br>"
         f"Please rank the 5 images based on {CRITERIA_GUIDANCE_EN[criterion_idx]}"
         f"</p>"
     )
     rules_part = (
@@ -240,7 +275,6 @@ def display_current_prompt_and_criterion():
         "<p style='font-size: 0.9em; color: #555;'>"
         "設問や英単語の意味についてはAIに質問したり検索したりしても構いません。ただし、画像そのものが示す感情をAIに質問するのはお控えください。<br>"
         "You are welcome to use AI or web search to understand the questions or the meaning of English words. However, please refrain from asking an AI about the emotion shown in the images themselves."
         "</p>"
     )
     combined_instructions = f"{guidance_part}<hr>{rules_part}<hr>{ai_note_part}"
@@ -257,7 +291,18 @@ def display_current_prompt_and_criterion():
     for cond_name in current_image_order:
         prediction = current_data["predictions"][cond_name]
         img_path = get_image_path_from_prediction(prediction)
-        image_updates.append(gr.update(value=img_path if img_path and os.path.exists(img_path) else None))
     saved_ranks_dict = GLOBAL_STATE["evaluation_results"].get(prompt_text, {}).get("ranks", {}).get(criterion_name)
     if saved_ranks_dict:
@@ -307,7 +352,7 @@ def display_current_prompt_and_criterion():
     ]
-# ▼▼▼ 修正後の validate_and_navigate 関数 (変更なし) ▼▼▼
 def validate_and_navigate():
     ranks = GLOBAL_STATE["current_ranks"]
     error_msg = None
@@ -406,7 +451,6 @@ def navigate_previous():
     return display_current_prompt_and_criterion()
-# ▼▼▼ 修正後の export_results 関数 (変更なし) ▼▼▼
 def export_results(participant_id, alignment_reason, naturalness_reason, attractiveness_reason, optional_comment):
     if not alignment_reason.strip() or not naturalness_reason.strip() or not attractiveness_reason.strip():
         error_msg = "<p class='feedback red'>Please fill in the reasoning for all three criteria (Alignment, Naturalness, Attractiveness). / 3つの評価基準（一致度, 自然さ, 魅力度）すべての判断理由を記入してください。</p>"
@@ -480,7 +524,6 @@ def export_results(participant_id, alignment_reason, naturalness_reason, attract
     return gr.update(value=filepath, visible=True), status_message
-# ▼▼▼ 修正後の create_gradio_interface 関数 (変更なし) ▼▼▼
 def create_gradio_interface():
     css = """
     .gradio-container { font-family: 'Arial', sans-serif; }
@@ -564,7 +607,7 @@ def create_gradio_interface():
                         with gr.Column(scale=1):
                             with gr.Group():
                                 gr.Markdown(f"<div class='image-label' style='text-align: center;'>{label}</div>")
-                                img = gr.Image(type="filepath", show_label=False, height=300)
                                 image_components.append(img)
                                 with gr.Row(elem_classes="rank-btn-row"):
                                     rank_list = ["1位", "2位", "3位", "4位", "5位"]
@@ -637,7 +680,7 @@ def create_gradio_interface():
                 download_file = gr.File(label="Download JSON", visible=False)
                 export_status = gr.Markdown()
-        # --- Event Handlers (unchanged) ---
         def check_and_confirm_id(pid):
             pid = pid.strip()
             if re.fullmatch(r"P\d{2}", pid):

+# ==============================================================================
+# evaluation_interface のコードブロック（修正済み）
+# ==============================================================================
 import os
 import sys
 import glob
 import json
 import random
 from functools import partial
 from datetime import datetime
 from collections import defaultdict, Counter
 import gradio as gr
 from loguru import logger
+from PIL import Image  # ★ 修正点1: PILライブラリをインポート
+import re
+# --- Global State ---
 GLOBAL_STATE = {
     "participant_id": None,
     "data_loaded": False,
     "current_ranks": {},
     "current_absolute_score": None,
     "current_absolute_score_worst": None,
+    "hide_bbox_dict": {},  # ★ 修正点2: マスキング情報を格納するキーを追加
 }
+# --- Configuration ---
 BASE_RESULTS_DIR = "./results"
 LOG_DIR = "./logs"
 COMBINED_DATA_DIR = "./combined_data"
 IMAGE_LABELS = ['A', 'B', 'C', 'D', 'E']
+# ★ 修正点3: マスキング用のヘルパー関数を classification_interface からコピー
+# --- Helper Functions ---
+def load_bbox_json(bbox_json_path):
+    """Load the bounding-box JSON file and cache its "Hide" section.
+
+    Opens ``bbox_json_path`` as UTF-8, parses it as JSON, and stores the
+    value found under the "Hide" key (an empty dict when that key is
+    absent) in ``GLOBAL_STATE["hide_bbox_dict"]``.
+
+    Any exception raised inside the ``try`` block is logged and swallowed;
+    in that case the cached dict is reset to empty. Nothing is returned.
+    """
+    try:
+        with open(bbox_json_path, 'r', encoding='utf-8') as f:
+            bbox_data = json.load(f)
+        # evaluation_interface only needs the "Hide" entries (regions to conceal)
+        GLOBAL_STATE["hide_bbox_dict"] = bbox_data.get("Hide", {})
+        logger.info(f"Successfully loaded bounding box data from {bbox_json_path}")
+    except Exception as e:
+        # Best-effort: an empty dict means no regions will be masked.
+        logger.error(f"Failed to load bounding box JSON: {e}")
+        GLOBAL_STATE["hide_bbox_dict"] = {}
+def create_masked_image(image: Image.Image):
+    """Return the image with every cached "Hide" region painted black.
+
+    Reads the boxes from ``GLOBAL_STATE["hide_bbox_dict"]``. When that dict
+    is missing or empty, the input ``image`` object itself is returned
+    unchanged (not a copy). Otherwise a copy is made and, for each box, a
+    black RGB rectangle is pasted over it; the input image is not modified.
+
+    Each box value is read through the keys 'left', 'top', 'right' and
+    'bottom'; the box's own name (the dict key) is ignored.
+    """
+    hide_bbox_dict = GLOBAL_STATE.get("hide_bbox_dict", {})
+    if not hide_bbox_dict:
+        return image
+    masked_img = image.copy()
+    for _, box_coords in hide_bbox_dict.items():
+        box = (box_coords['left'], box_coords['top'], box_coords['right'], box_coords['bottom'])
+        # Rectangle size is (right - left, bottom - top).
+        # NOTE(review): assumes right > left and bottom > top; a negative
+        # width/height would presumably make Image.new raise - confirm.
+        black_rectangle = Image.new('RGB', (box[2] - box[0], box[3] - box[1]), color='black')
+        # Paste with the rectangle's upper-left corner at (left, top).
+        masked_img.paste(black_rectangle, (box[0], box[1]))
+    return masked_img
 def get_image_path_from_prediction(prediction: dict) -> str:
     if not GLOBAL_STATE["image_mapping"]:
         logger.error("Image mapping is not loaded.")
 def load_evaluation_data(participant_id: str):
+    # ★ 修正点4: バウンディングボックス情報を読み込む処理を追加
+    # classification_interfaceのパス構造を参考に、bboxファイルのパスを構築
+    bbox_json_path = os.path.join(COMBINED_DATA_DIR, "lapwing", "texts", "bounding_boxes.json")
+    if os.path.exists(bbox_json_path):
+        load_bbox_json(bbox_json_path)
+    else:
+        logger.warning(f"Bounding box file not found at {bbox_json_path}. Images will not be masked.")
+        GLOBAL_STATE["hide_bbox_dict"] = {}
     mapping_path = os.path.join(COMBINED_DATA_DIR, MAPPING_FILENAME)
     if not os.path.exists(mapping_path):
         return f"<p class='feedback red'>Error: Mapping file not found at {mapping_path}</p>", gr.update(
 # --- UI Logic ---
 def display_current_prompt_and_criterion():
     if not GLOBAL_STATE["data_loaded"] or GLOBAL_STATE["current_prompt_index"] >= len(GLOBAL_STATE["all_eval_data"]):
         done_msg = "<p class='feedback green' style='text-align: center; font-size: 1.2em;'>All prompts have been evaluated! Please proceed to the 'Export' tab. <br>すべてのプロンプトの評価が完了しました！「エクスポート」タブに進んでください。</p>"
     criterion_name = CRITERIA[criterion_idx]
     progress_text = f"Prompt {GLOBAL_STATE['current_prompt_index'] + 1} / {len(GLOBAL_STATE['all_eval_data'])}  -  **{criterion_name}**"
     prompt_display_text = f"<p style='font-size: 3em; font-weight: bold;'>テキスト(TEXT): {prompt_text}</p>"
     guidance_part = (
         f"<p style='color: red; font-weight: bold; font-size: 1.1em;'>"
         f"5つの画像を、「{CRITERIA_GUIDANCE_JP[criterion_idx]}」を基準にランキングしてください。<br>"
         f"Please rank the 5 images based on {CRITERIA_GUIDANCE_EN[criterion_idx]}"
         f"</p>"
     )
     rules_part = (
         "<p style='font-size: 0.9em; color: #555;'>"
         "設問や英単語の意味についてはAIに質問したり検索したりしても構いません。ただし、画像そのものが示す感情をAIに質問するのはお控えください。<br>"
         "You are welcome to use AI or web search to understand the questions or the meaning of English words. However, please refrain from asking an AI about the emotion shown in the images themselves."
         "</p>"
     )
     combined_instructions = f"{guidance_part}<hr>{rules_part}<hr>{ai_note_part}"
     for cond_name in current_image_order:
         prediction = current_data["predictions"][cond_name]
         img_path = get_image_path_from_prediction(prediction)
+        # ★ 修正点5: 画像を読み込み、マスキングを適用する
+        if img_path and os.path.exists(img_path):
+            try:
+                pil_img = Image.open(img_path).convert('RGB')
+                masked_img = create_masked_image(pil_img)
+                image_updates.append(gr.update(value=masked_img))
+            except Exception as e:
+                logger.error(f"Failed to open or mask image {img_path}: {e}")
+                image_updates.append(gr.update(value=None))
+        else:
+            image_updates.append(gr.update(value=None))
     saved_ranks_dict = GLOBAL_STATE["evaluation_results"].get(prompt_text, {}).get("ranks", {}).get(criterion_name)
     if saved_ranks_dict:
     ]
+# --- (以降の関数は変更なし) ---
 def validate_and_navigate():
     ranks = GLOBAL_STATE["current_ranks"]
     error_msg = None
     return display_current_prompt_and_criterion()
 def export_results(participant_id, alignment_reason, naturalness_reason, attractiveness_reason, optional_comment):
     if not alignment_reason.strip() or not naturalness_reason.strip() or not attractiveness_reason.strip():
         error_msg = "<p class='feedback red'>Please fill in the reasoning for all three criteria (Alignment, Naturalness, Attractiveness). / 3つの評価基準（一致度, 自然さ, 魅力度）すべての判断理由を記入してください。</p>"
     return gr.update(value=filepath, visible=True), status_message
 def create_gradio_interface():
     css = """
     .gradio-container { font-family: 'Arial', sans-serif; }
                         with gr.Column(scale=1):
                             with gr.Group():
                                 gr.Markdown(f"<div class='image-label' style='text-align: center;'>{label}</div>")
+                                img = gr.Image(type="pil", show_label=False, height=300)  # typeを"pil"に変更
                                 image_components.append(img)
                                 with gr.Row(elem_classes="rank-btn-row"):
                                     rank_list = ["1位", "2位", "3位", "4位", "5位"]
                 download_file = gr.File(label="Download JSON", visible=False)
                 export_status = gr.Markdown()
+        # --- Event Handlers ---
         def check_and_confirm_id(pid):
             pid = pid.strip()
             if re.fullmatch(r"P\d{2}", pid):

combined_data/lapwing/texts/bounding_boxes.json ADDED Viewed

	@@ -0,0 +1,32 @@

+{
+    "Show": {
+        "Eyebrow": {
+            "left": 120,
+            "top": 200,
+            "right": 392,
+            "bottom": 302
+        },
+        "Eyes": {
+            "left": 130,
+            "top": 270,
+            "right": 382,
+            "bottom": 365
+        }
+    },
+    "Hide": {
+        "Mouth": {
+            "left": 160,
+            "top": 409,
+            "right": 352,
+            "bottom": 482
+        }
+    },
+    "Crop": {
+        "Crop": {
+            "left": 26,
+            "top": 26,
+            "right": 486,
+            "bottom": 486
+        }
+    }
+}

logs/evaluation_ui_log_2025-07-31_11-17-08_603378.log ADDED Viewed

	@@ -0,0 +1,10 @@

+2025-07-31 11:17:27.491 | INFO     | __main__:load_bbox_json:70 - Successfully loaded bounding box data from ./combined_data\lapwing\texts\bounding_boxes.json
+2025-07-31 11:17:27.493 | INFO     | __main__:load_evaluation_data:124 - Successfully loaded image mapping. Image directory: ./combined_data\lapwing\images
+2025-07-31 11:17:27.520 | INFO     | __main__:load_evaluation_data:172 - Loaded and merged data for 2 prompts.
+2025-07-31 11:17:49.041 | INFO     | __main__:validate_and_navigate:429 - Saved rank for P:P99, Prompt:'happy', Criterion:Alignment, Ranks:{'Ours': 1, 'w_o_HitL': 5, 'w_o_Proto_Loss': 1, 'LLM-based': 1, 'w_o_Tuning': 4}
+2025-07-31 11:18:00.202 | INFO     | __main__:validate_and_navigate:429 - Saved rank for P:P99, Prompt:'happy', Criterion:Naturalness, Ranks:{'Ours': 1, 'w_o_Tuning': 5, 'LLM-based': 1, 'w_o_Proto_Loss': 1, 'w_o_HitL': 4}
+2025-07-31 11:18:17.995 | INFO     | __main__:validate_and_navigate:429 - Saved rank for P:P99, Prompt:'happy', Criterion:Attractiveness, Ranks:{'LLM-based': 1, 'Ours': 1, 'w_o_Proto_Loss': 1, 'w_o_Tuning': 5, 'w_o_HitL': 4}
+2025-07-31 11:18:40.255 | INFO     | __main__:validate_and_navigate:429 - Saved rank for P:P99, Prompt:'sad', Criterion:Alignment, Ranks:{'LLM-based': 5, 'w_o_HitL': 4, 'Ours': 2, 'w_o_Proto_Loss': 2, 'w_o_Tuning': 1}
+2025-07-31 11:18:53.544 | INFO     | __main__:validate_and_navigate:429 - Saved rank for P:P99, Prompt:'sad', Criterion:Naturalness, Ranks:{'w_o_HitL': 4, 'LLM-based': 5, 'w_o_Tuning': 3, 'Ours': 1, 'w_o_Proto_Loss': 1}
+2025-07-31 11:19:04.031 | INFO     | __main__:validate_and_navigate:429 - Saved rank for P:P99, Prompt:'sad', Criterion:Attractiveness, Ranks:{'w_o_Tuning': 4, 'LLM-based': 5, 'w_o_HitL': 3, 'Ours': 1, 'w_o_Proto_Loss': 1}
+2025-07-31 11:19:15.845 | INFO     | __main__:export_results:511 - Successfully exported results to: ./results\P99\evaluation_results_P99_20250731_111915.json

results/P99/evaluation_results_P99_20250731_111915.json ADDED Viewed

	@@ -0,0 +1,112 @@

+{
+  "metadata": {
+    "participant_id": "P99",
+    "export_timestamp": "2025-07-31T11:19:15.844354",
+    "total_prompts_evaluated": 2,
+    "evaluation_duration_seconds": 96.511394,
+    "reasoning": {
+      "alignment": "あいう",
+      "naturalness": "あいう",
+      "attractiveness": "あいう"
+    },
+    "optional_comment": "あいう"
+  },
+  "results": [
+    {
+      "prompt": "happy",
+      "prompt_category": "basic_emotion",
+      "image_order_alignment": [
+        "Ours",
+        "w_o_HitL",
+        "w_o_Proto_Loss",
+        "LLM-based",
+        "w_o_Tuning"
+      ],
+      "image_order_naturalness": [
+        "Ours",
+        "w_o_Tuning",
+        "LLM-based",
+        "w_o_Proto_Loss",
+        "w_o_HitL"
+      ],
+      "image_order_attractiveness": [
+        "LLM-based",
+        "Ours",
+        "w_o_Proto_Loss",
+        "w_o_Tuning",
+        "w_o_HitL"
+      ],
+      "alignment_ranks": {
+        "Ours": 1,
+        "w_o_HitL": 5,
+        "w_o_Proto_Loss": 1,
+        "LLM-based": 1,
+        "w_o_Tuning": 4
+      },
+      "naturalness_ranks": {
+        "Ours": 1,
+        "w_o_Tuning": 5,
+        "LLM-based": 1,
+        "w_o_Proto_Loss": 1,
+        "w_o_HitL": 4
+      },
+      "attractiveness_ranks": {
+        "LLM-based": 1,
+        "Ours": 1,
+        "w_o_Proto_Loss": 1,
+        "w_o_Tuning": 5,
+        "w_o_HitL": 4
+      },
+      "alignment_absolute_score": 6,
+      "alignment_absolute_score_worst": 2
+    },
+    {
+      "prompt": "sad",
+      "prompt_category": "basic_emotion",
+      "image_order_alignment": [
+        "LLM-based",
+        "w_o_HitL",
+        "Ours",
+        "w_o_Proto_Loss",
+        "w_o_Tuning"
+      ],
+      "image_order_naturalness": [
+        "w_o_HitL",
+        "LLM-based",
+        "w_o_Tuning",
+        "Ours",
+        "w_o_Proto_Loss"
+      ],
+      "image_order_attractiveness": [
+        "w_o_Tuning",
+        "LLM-based",
+        "w_o_HitL",
+        "Ours",
+        "w_o_Proto_Loss"
+      ],
+      "alignment_ranks": {
+        "LLM-based": 5,
+        "w_o_HitL": 4,
+        "Ours": 2,
+        "w_o_Proto_Loss": 2,
+        "w_o_Tuning": 1
+      },
+      "naturalness_ranks": {
+        "w_o_HitL": 4,
+        "LLM-based": 5,
+        "w_o_Tuning": 3,
+        "Ours": 1,
+        "w_o_Proto_Loss": 1
+      },
+      "attractiveness_ranks": {
+        "w_o_Tuning": 4,
+        "LLM-based": 5,
+        "w_o_HitL": 3,
+        "Ours": 1,
+        "w_o_Proto_Loss": 1
+      },
+      "alignment_absolute_score": 6,
+      "alignment_absolute_score_worst": 1
+    }
+  ]
+}