kaburia committed on
Commit
3857216
·
1 Parent(s): 2431094

initial test

Browse files
Files changed (2) hide show
  1. gradio_app.py +434 -0
  2. requirements.txt +21 -0
gradio_app.py ADDED
@@ -0,0 +1,434 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
import gradio as gr
import pandas as pd
import os
from huggingface_hub import HfApi
from datasets import load_dataset, Dataset
import io
# from dotenv import load_dotenv

# # Load environment variables from a .env file (if present) and read HF token
# load_dotenv()
# HF_TOKEN = os.getenv("HF_TOKEN", "YOUR_HF_WRITE_TOKEN_HERE")

# --- 1. CONFIGURATION ---

# --- DEBUG/TESTING MODE ---
# Set to True to use local CSV files instead of Hugging Face Hub.
# This will read from PREDICTIONS_CSV and read/write to LOCAL_DATASET_PATH.
DEBUG_TESTING = False
LOCAL_DATASET_PATH = "/content/drive/MyDrive/policy-evaluations/sentiment_dataset_eval.csv"
PREDICTIONS_CSV = "model_predictions.csv"  # From batch_inference.py
# --- End Debug Config ---

HF_DATASET_REPO = "kaburia/policy-evaluations"  # Your HF Dataset repo

# SECURITY FIX: the write token was previously hard-coded in this file (split
# across two string constants and concatenated), which leaks the credential to
# anyone who can read the repo. Read it from the environment instead; the
# sentinel default keeps all downstream "not configured" checks working.
# The leaked token must also be revoked on huggingface.co.
HF_TOKEN = os.getenv("HF_TOKEN", "YOUR_HF_WRITE_TOKEN_HERE")

# --- Email Authentication ---
# Maps an authorized email address -> the annotator tag stored with each
# annotation (written to the 'AnnotatorUsername' column).
APPROVED_EMAILS = {
    "email1@gmail.com": "user1",
    "email2@gmail.com": "user2",
    "admin@policy.org": "admin_user",
    "test@test.com": "test_user"  # Added for easier debugging
    # Add more authorized emails and their tags here
}

# --- Define Interaction Choices ---
# 3-class verification label -> allowed 7-class drill-down labels.
DRILL_DOWN_MAP = {
    "coherent": ["+3 Indivisible", "+2 Reinforcing", "+1 Enabling"],
    "neutral": ["0 Consistent"],
    "incoherent": ["-1 Constraining", "-2 Counteracting", "-3 Cancelling"]
}
ALL_DRILL_DOWN_CHOICES = DRILL_DOWN_MAP["coherent"] + DRILL_DOWN_MAP["neutral"] + DRILL_DOWN_MAP["incoherent"]
VERIFY_CHOICES = ["neutral", "coherent", "incoherent"]
# --- 2. DATA LOADING FUNCTIONS ---

def load_data_from_hub(token):
    """
    (LIVE MODE) Loads the dataset from Hugging Face, converts to Pandas,
    and identifies pending rows.

    Args:
        token: HF write token; the sentinel placeholder is rejected.

    Returns:
        (full_df, pending_df, status_message). Both DataFrames are None
        on any error, with the reason in status_message.
    """
    if not token or token == "YOUR_HF_WRITE_TOKEN_HERE":
        return None, None, "Error: Hugging Face Token is not configured."

    try:
        # Load the dataset
        ds = load_dataset(HF_DATASET_REPO, token=token, split="train", cache_dir="./cache")
        full_df = ds.to_pandas()

        # Ensure required columns exist
        if "UserVerifiedClass" not in full_df.columns:
            return None, None, "Error: Dataset is missing 'UserVerifiedClass' column. Please run setup script."

        # Create a unique key. FIX: cast both columns to str for parity with
        # load_data_from_local and to avoid a TypeError if either column is
        # not already string-typed.
        full_df['key'] = full_df['PolicyA'].astype(str) + '||' + full_df['PolicyB'].astype(str)

        # Find rows that have NOT been annotated
        pending_df = full_df[full_df['UserVerifiedClass'].isnull()].reset_index(drop=True)

        status = f"Loaded {len(pending_df)} remaining items to annotate. ({len(full_df) - len(pending_df)} already complete) [LIVE: HF Hub]"
        return full_df, pending_df, status

    except Exception as e:
        return None, None, f"Error loading dataset from Hub: {e}"
def load_data_from_local():
    """
    (DEBUG MODE) Loads the dataset from a local CSV file.
    If it doesn't exist, it initializes it from 'model_predictions.csv'.

    Returns:
        (full_df, pending_df, status_message); the DataFrames are None on error.
    """
    # Columns that hold human annotations; created empty on first run.
    annotation_cols = ("UserVerifiedClass", "DrillDownInteraction", "AnnotatorUsername")
    try:
        if not os.path.exists(LOCAL_DATASET_PATH):
            # First run: seed the local working file from the batch predictions.
            print(f"'{LOCAL_DATASET_PATH}' not found. Initializing from '{PREDICTIONS_CSV}'...")
            if not os.path.exists(PREDICTIONS_CSV):
                return None, None, f"Error: '{PREDICTIONS_CSV}' not found. Please run batch_inference.py first."

            seed_df = pd.read_csv(PREDICTIONS_CSV)
            # The UI relies on 'model_label' to pre-select the radio choice.
            if "model_label" not in seed_df.columns:
                return None, None, f"Error: '{PREDICTIONS_CSV}' is missing 'model_label' column. Please run batch_inference.py"
            for col in annotation_cols:
                seed_df[col] = pd.NA
            seed_df.to_csv(LOCAL_DATASET_PATH, index=False)
            print(f"Initialized '{LOCAL_DATASET_PATH}'.")

        # The file is guaranteed to exist at this point.
        full_df = pd.read_csv(LOCAL_DATASET_PATH)

        # Backfill any annotation column missing from an older file.
        for col in annotation_cols:
            if col not in full_df.columns:
                full_df[col] = pd.NA

        # Unique per-pair key used to locate rows when saving annotations.
        full_df['key'] = full_df['PolicyA'].astype(str) + '||' + full_df['PolicyB'].astype(str)
        pending_df = full_df[full_df['UserVerifiedClass'].isnull()].reset_index(drop=True)

        status = f"Loaded {len(pending_df)} remaining items to annotate. ({len(full_df) - len(pending_df)} complete) [DEBUG: Local CSV]"
        return full_df, pending_df, status

    except Exception as e:
        return None, None, f"Error loading local dataset: {e}"
# --- 3. DATA SAVING FUNCTIONS ---

def save_annotation_to_hub(index, verified_class, drill_down, user_tag, token, full_df, pending_df):
    """
    (LIVE MODE) Updates the DataFrame and pushes the entire dataset back to the Hub.

    Returns a dict of Gradio component -> update, matching the outputs of the
    'Save & Next' click handler.
    """
    # Validate required inputs before touching the dataset.
    if not drill_down:
        return {status_box: "Error: Please select a drill-down interaction."}
    if not user_tag:
        return {status_box: "Error: User tag is missing. Please re-login."}

    try:
        # Locate the annotated row in the full DataFrame via its unique key.
        annotated_key = pending_df.loc[index, 'key']
        row_mask = full_df['key'] == annotated_key

        # Record the verification, drill-down label, and annotator.
        for column, value in (
            ('UserVerifiedClass', verified_class),
            ('DrillDownInteraction', drill_down),
            ('AnnotatorUsername', user_tag),
        ):
            full_df.loc[row_mask, column] = value

        # Push the whole dataset (minus the synthetic 'key' column) back up.
        Dataset.from_pandas(full_df.drop(columns=['key'])).push_to_hub(HF_DATASET_REPO, token=token)

        # Advance the UI to the next pending item and report success.
        updates = load_next_item(pending_df, index + 1)
        updates[status_box] = f"Saved to Hub: {verified_class} | {drill_down} by {user_tag}"
        updates[full_df_state] = full_df  # Persist the updated full_df in session state
        return updates

    except Exception as e:
        return {status_box: f"Error saving to Hub: {e}"}
def save_annotation_to_local(index, verified_class, drill_down, user_tag, full_df, pending_df):
    """
    (DEBUG MODE) Updates the DataFrame and saves it back to the local CSV.

    Returns a dict of Gradio component -> update, matching the outputs of the
    'Save & Next' click handler.
    """
    # Validate required inputs before touching the dataset.
    if not drill_down:
        return {status_box: "Error: Please select a drill-down interaction."}
    if not user_tag:
        return {status_box: "Error: User tag is missing. Please re-login."}

    try:
        # Locate the annotated row in the full DataFrame via its unique key.
        annotated_key = pending_df.loc[index, 'key']
        row_mask = full_df['key'] == annotated_key

        # Record the verification, drill-down label, and annotator.
        for column, value in (
            ('UserVerifiedClass', verified_class),
            ('DrillDownInteraction', drill_down),
            ('AnnotatorUsername', user_tag),
        ):
            full_df.loc[row_mask, column] = value

        # Overwrite the local working CSV (minus the synthetic 'key' column).
        full_df.drop(columns=['key']).to_csv(LOCAL_DATASET_PATH, index=False)

        # Advance the UI to the next pending item and report success.
        updates = load_next_item(pending_df, index + 1)
        updates[status_box] = f"Saved (Local): {verified_class} | {drill_down} by {user_tag}"
        updates[full_df_state] = full_df  # Persist the updated full_df in session state
        return updates

    except Exception as e:
        return {status_box: f"Error saving locally: {e}"}
# --- 4. GRADIO UI ---
# Builds the Blocks app: login gate, side-by-side policy display, 3-class
# verification radio, 7-class drill-down dropdown, and save/next wiring.
# Handlers return dicts keyed by component objects, so they must be defined
# inside this `with` block where the components are in scope.
with gr.Blocks(theme=gr.themes.Soft()) as demo:
    gr.Markdown("# Policy Coherence Annotation Tool")
    gr.Markdown(
        """
        Welcome! This tool is for human-in-the-loop annotation.
        1. Log in with your email address.
        2. The model's prediction for two policies will be shown.
        3. **Step 1:** Verify if the model's 3-class prediction (neutral, coherent, incoherent) is correct, or change it.
        4. **Step 2:** Based on your verified choice, select a 7-class drill-down label. When you choose one of the categories we will ask the level
        For example if it is incoherent, we shall ask to choose from "-1 Constraining", "-2 Counteracting", "-3 Cancelling"
        5. Click 'Save & Next' to submit your annotation and load the next item.

        ---
        ### Drill-Down Definitions
        - **+3 Indivisible**: Inextricably linked to the achievement of another goal.
        - **+2 Reinforcing**: Aids the achievement of another goal.
        - **+1 Enabling**: Creates conditions that further another goal.
        - **0 Consistent**: No significant positive or negative interactions.
        - **-1 Constraining**: Limits options on another goal.
        - **-2 Counteracting**: Clashes with another goal.
        - **-3 Cancelling**: Makes it impossible to reach another goal.
        """
    )

    # --- State variables (per browser session) ---
    full_df_state = gr.State()               # entire dataset incl. completed annotations
    pending_df_state = gr.State()            # only rows still awaiting annotation
    current_index_state = gr.State(value=0)  # position within pending_df
    hf_token_state = gr.State()              # HF token, or "debug_mode" placeholder
    user_tag_state = gr.State()              # annotator tag from APPROVED_EMAILS

    # --- Section 1: Login ---
    with gr.Group() as login_box:
        with gr.Row():
            email_box = gr.Textbox(label="Email", placeholder="Enter your authorized email...")
            login_btn = gr.Button("Login & Load Dataset", variant="primary")
    # NOTE(review): progress_bar placed outside login_box so it stays visible
    # after login_box is hidden on successful login — the original source's
    # indentation was ambiguous here; confirm against the deployed app.
    progress_bar = gr.Markdown(value="Waiting for login...")

    # --- Section 2: Annotation (hidden until loaded) ---
    with gr.Group(visible=False) as annotation_box:
        # Side-by-side layout for the two policy texts being compared.
        with gr.Row():
            policy_a_display = gr.Textbox(label="Policy / Objective A", interactive=False, lines=5, container=True)
            policy_b_display = gr.Textbox(label="Policy / Objective B", interactive=False, lines=5, container=True)

        with gr.Row():
            model_confidence_label = gr.Label(label="Model Confidence")
            user_verified_radio = gr.Radio(
                label="Step 1: Verify/Correct Classification",
                choices=VERIFY_CHOICES,
                info="The model's prediction is selected by default."
            )

        # Choices are populated dynamically from DRILL_DOWN_MAP based on the
        # Step 1 selection (see update_drill_down_choices / load_next_item).
        user_drill_down_dropdown = gr.Dropdown(
            label="Step 2: Drill-Down Interaction",
            choices=[],
            interactive=True
        )

        save_btn = gr.Button("Save & Next", variant="stop")
        status_box = gr.Textbox(label="Status", interactive=False)

    # --- 5. UI Event Handlers ---

    def update_drill_down_choices(verified_class):
        """
        Updates the drill-down dropdown based on the 3-class selection.
        """
        choices = DRILL_DOWN_MAP.get(verified_class, [])
        value = choices[0] if len(choices) == 1 else None  # Auto-select "0 Consistent"
        # Return a component constructor as the update (Gradio 4.x syntax).
        return gr.Dropdown(
            choices=choices,
            value=value,
            interactive=len(choices) > 1  # Disable interaction if only one choice
        )

    def load_next_item(pending_df, index):
        """
        Loads the item at 'index' from the PENDING DataFrame into the UI.

        Returns a dict of component -> update; callers merge extra keys
        (status, state) into it before returning from their event handler.
        """
        if pending_df is None:
            return {status_box: "Data not loaded."}

        total_items = len(pending_df)
        if index >= total_items:
            # All pending items done: announce completion and hide the form.
            return {
                progress_bar: gr.Markdown(f"**Annotation Complete! ({total_items} items total)**"),
                policy_a_display: "All items annotated.",
                policy_b_display: "",
                annotation_box: gr.Group(visible=False)
            }

        row = pending_df.iloc[index]
        # Model's 3-class prediction, pre-selected in the Step 1 radio.
        model_pred = row["model_label"]

        # Build the confidence dict shown in the Label component. Two input
        # formats are supported, detected by which columns the row carries.
        if "model_confidence" in row:
            # New format: "model_label" + single "model_confidence" value.
            confidence = row["model_confidence"]
            conf_dict = {}

            # Split the leftover probability mass evenly over the other two
            # classes so the Label shows a full (approximate) distribution.
            remaining_prob = (1.0 - confidence) / 2.0
            for l in VERIFY_CHOICES:  # ["neutral", "coherent", "incoherent"]
                if l == model_pred:
                    conf_dict[l] = confidence
                else:
                    conf_dict[l] = remaining_prob
        else:
            # Old format: one explicit confidence column per class.
            conf_dict = {
                "neutral": row.get("Confidence_Neutral", 0.0),
                "coherent": row.get("Confidence_Coherent", 0.0),
                "incoherent": row.get("Confidence_Incoherent", 0.0)
            }

        # Pre-fill the drill-down choices from the model's prediction; a
        # single-choice class ("neutral") is auto-selected and locked.
        drill_down_choices = DRILL_DOWN_MAP.get(model_pred, [])
        drill_down_value = drill_down_choices[0] if len(drill_down_choices) == 1 else None
        drill_down_interactive = len(drill_down_choices) > 1

        return {
            progress_bar: gr.Markdown(f"**Annotating Item {index + 1} of {total_items}**"),
            policy_a_display: row["PolicyA"],
            policy_b_display: row["PolicyB"],
            model_confidence_label: conf_dict,
            user_verified_radio: model_pred,
            # Component constructor as the update (Gradio 4.x syntax).
            user_drill_down_dropdown: gr.Dropdown(
                choices=drill_down_choices,
                value=drill_down_value,
                interactive=drill_down_interactive
            ),
            current_index_state: index,
            annotation_box: gr.Group(visible=True)
        }

    # When 'Login' is clicked: authenticate, load data (local or Hub), and
    # show the first pending item.
    def login_and_load(email):
        # --- Authentication Step ---
        if email not in APPROVED_EMAILS:
            return {
                progress_bar: gr.Markdown(f"<font color='red'>Error: Email '{email}' is not authorized.</font>"),
                login_box: gr.Group(visible=True)
            }

        user_tag = APPROVED_EMAILS[email]  # Get the tag (e.g., "user1")

        # --- Branching logic for Debug/Live data source ---
        if DEBUG_TESTING:
            print("--- DEBUG MODE: Loading from local CSV ---")
            full_df, pending_df, status = load_data_from_local()
            token_to_store = "debug_mode"  # Placeholder
        else:
            print("--- LIVE MODE: Loading from Hugging Face Hub ---")
            if HF_TOKEN == "YOUR_HF_WRITE_TOKEN_HERE" or not HF_TOKEN:
                return {
                    progress_bar: gr.Markdown(f"<font color='red'>Error: App is not configured. HF_TOKEN is missing.</font>"),
                    login_box: gr.Group(visible=True)
                }
            full_df, pending_df, status = load_data_from_hub(HF_TOKEN)
            token_to_store = HF_TOKEN

        # --- Common logic: surface any load error and keep the login visible ---
        if full_df is None:
            return {
                progress_bar: gr.Markdown(f"<font color='red'>{status}</font>"),
                login_box: gr.Group(visible=True)
            }

        # --- Load the first item ---
        first_item_updates = load_next_item(pending_df, 0)

        # --- Save all data to state and update UI ---
        first_item_updates[full_df_state] = full_df
        first_item_updates[pending_df_state] = pending_df
        first_item_updates[progress_bar] = f"Login successful as **{user_tag}**. {status}"
        first_item_updates[hf_token_state] = token_to_store  # Save token/debug flag to state
        first_item_updates[user_tag_state] = user_tag
        first_item_updates[login_box] = gr.Group(visible=False)      # Hide login box
        first_item_updates[annotation_box] = gr.Group(visible=True)  # Show annotation box
        return first_item_updates

    login_btn.click(
        fn=login_and_load,
        inputs=[email_box],  # Input is ONLY the email box
        outputs=[
            progress_bar, policy_a_display, policy_b_display,
            model_confidence_label, user_verified_radio, user_drill_down_dropdown,
            current_index_state, annotation_box, login_box,
            full_df_state, pending_df_state, hf_token_state, user_tag_state, status_box
        ]
    )

    # Wrapper dispatching the save to the local-CSV or Hub implementation.
    def save_wrapper(index, verified_class, drill_down, user_tag, token, full_df, pending_df):
        if DEBUG_TESTING:
            return save_annotation_to_local(index, verified_class, drill_down, user_tag, full_df, pending_df)
        else:
            return save_annotation_to_hub(index, verified_class, drill_down, user_tag, token, full_df, pending_df)

    # Dynamic drill-down: changing the Step 1 radio repopulates Step 2.
    user_verified_radio.change(
        fn=update_drill_down_choices,
        inputs=user_verified_radio,
        outputs=user_drill_down_dropdown
    )

    # When 'Save & Next' is clicked
    save_btn.click(
        fn=save_wrapper,
        inputs=[
            current_index_state,
            user_verified_radio,
            user_drill_down_dropdown,
            user_tag_state,   # Pass the user tag from state
            hf_token_state,   # Pass the token from state
            full_df_state,
            pending_df_state
        ],
        outputs=[
            progress_bar, policy_a_display, policy_b_display,
            model_confidence_label, user_verified_radio, user_drill_down_dropdown,
            current_index_state, annotation_box, status_box, full_df_state
        ]
    )
if __name__ == "__main__":
    # Startup banner: warn loudly about debug mode or a missing token before
    # the server comes up.
    if DEBUG_TESTING:
        banner = "=" * 30
        print("\n" + banner)
        print("--- RUNNING IN DEBUG MODE ---")
        print(f"--- Data will be read/written to '{LOCAL_DATASET_PATH}' ---")
        print(banner + "\n")
    elif HF_TOKEN == "YOUR_HF_WRITE_TOKEN_HERE":
        print("\n--- WARNING: HF_TOKEN NOT SET ---")
        print("Please edit 'annotation_app.py' and add your HF_TOKEN to the top.")

    # share=True exposes a public Gradio link for remote annotators.
    demo.launch(debug=True, share=True)
requirements.txt ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ huggingface_hub==0.25.2
2
+ gradio
3
+ transformers>=4.40.0
4
+ # langchain>=0.1.14
5
+ # sentence-transformers>=2.5.1
6
+ # faiss-cpu>=1.7.4
7
+ # torch>=2.1.0
8
+ # langchain-community>=0.0.30
9
+ # gradio-client==1.11.0
10
+ # pydantic==2.10.6
11
+ numpy
12
+ pandas
13
+ requests
14
+ datasets
15
+ # boto3
16
+ # rank-bm25
17
+ # pypdf
18
+ # Pillow
19
+ # pytesseract
20
+ # openai
21
+