liarMP4

Sleeping

App Files Files Community

GlazedDon0t committed 22 days ago

Commit

dc4573e

1 Parent(s): d3b4e50

fina p3

Browse files

Files changed (1) hide show

src/labeling_logic.py +78 -0

src/labeling_logic.py CHANGED Viewed

@@ -1,6 +1,41 @@
 # labeling_logic.py
 LABELING_PROMPT_TEMPLATE = """
 You are an AI Factuality Assessment Agent operating under the "Ali Arsanjani Factuality Factors" framework.
 Your goal is to mass-label video content, quantifying "Veracity Vectors" and "Modality Alignment".
@@ -27,6 +62,7 @@ Your goal is to mass-label video content, quantifying "Veracity Vectors" and "Mo
 - Strings containing commas MUST be quoted.
 - ALL scores must be filled (use 0 if unsure, do not leave blank).
 - **MODALITY SCORING:** You must provide 3 distinct alignment scores: Video-Audio, Video-Caption, and Audio-Caption.
 **TOON SCHEMA:**
 {toon_schema}
@@ -37,6 +73,38 @@ Your goal is to mass-label video content, quantifying "Veracity Vectors" and "Mo
 <thinking>
 """
 SCORE_INSTRUCTIONS_REASONING = """
 **Constraints:**
 1. Provide specific reasoning for EACH score in the `vectors` and `modalities` tables.
@@ -66,6 +134,9 @@ disinfo: analysis[1]{class,intent,threat}:
 final: assessment[1]{score,reasoning}:
 (Int 1-100),"Final synthesis of why this score was given"
 """
 SCHEMA_REASONING = """
@@ -92,9 +163,14 @@ disinfo: analysis[1]{class,intent,threat}:
 final: assessment[1]{score,reasoning}:
 (Int 1-100),"Final synthesis of why this score was given"
 """
 FCOT_MACRO_PROMPT = """
 **Fractal Chain of Thought - Stage 1: Macro-Scale Hypothesis (Wide Aperture)**
 You are analyzing a video for factuality.
@@ -138,6 +214,8 @@ FCOT_SYNTHESIS_PROMPT = """
 **Output Format**:
 Strictly fill out the following TOON schema based on the consensus. Do not include markdown code blocks.
 **TOON SCHEMA**:
 {toon_schema}

 # labeling_logic.py
+import os
+import json
+# Persona presets keyed by variant name. Each entry pairs a short
+# human-readable "description" with the "instruction" sentence for that persona.
+# NOTE(review): presumably the "instruction" text is what fills the
+# {system_persona} placeholder in the prompt templates -- confirm at the caller.
+PROMPT_VARIANTS = dict(
+    standard=dict(
+        description="Standard Persona",
+        instruction="You are a Factuality Agent.",
+    ),
+    skeptic=dict(
+        description="Skeptical Persona",
+        instruction="You are a highly skeptical Factuality Agent. Assume claims might be misleading until verified.",
+    ),
+    lenient=dict(
+        description="Lenient Persona",
+        instruction="You are a lenient Factuality Agent. Assume claims are true unless overtly false.",
+    ),
+)
+# Prompt fragment for runs where no video is supplied: it tells the model to
+# work from the caption and transcript text alone and to estimate or default
+# the visual/audio integrity scores.
+# NOTE(review): where this fragment is attached to a prompt is not visible
+# in this diff -- check the caller.
+TEXT_ONLY_INSTRUCTIONS = """
+**NOTE: No video provided.** Analyze the text only (caption and transcript). Do not make assumptions about visual elements unless described in the text. Visual and Audio integrity scores should be estimated based on textual claims if applicable, or defaulted if completely unknowable.
+"""
+def get_formatted_tag_list() -> str:
+    """Build the tag-guidance sentence from ``data/tags.json``.
+
+    The path is relative to the current working directory. When the file
+    holds a non-empty JSON object, its keys are offered as suggested tags;
+    a non-empty JSON array is accepted as well, with its items as the tags.
+    In every other case (file missing or unreadable, invalid JSON, empty or
+    unexpected content) a generic instruction is returned, so a bad tags
+    file never raises from here.
+
+    NOTE(review): presumably the result is substituted for the
+    ``{tag_list_text}`` placeholder of the prompt templates -- confirm at
+    the caller.
+
+    Returns:
+        ``"Suggested tags: a, b, ..."`` or the generic fallback sentence.
+    """
+    fallback = "Provide relevant comma-separated tags."
+    path = "data/tags.json"
+    try:
+        # Open directly instead of checking os.path.exists() first: the
+        # pre-check is racy and a missing file is reported as OSError anyway.
+        # The encoding is pinned because open()'s default follows the locale.
+        with open(path, "r", encoding="utf-8") as f:
+            tags = json.load(f)
+    except (OSError, ValueError):
+        # Deliberately best-effort: the tags file is optional. ValueError
+        # covers both json.JSONDecodeError and UnicodeDecodeError.
+        return fallback
+    # Only containers of tags are meaningful; a bare JSON string or number
+    # must not be iterated character by character or crash the join.
+    if not tags or not isinstance(tags, (dict, list)):
+        return fallback
+    # Iterating a dict yields its keys, so one join serves both shapes.
+    return "Suggested tags: " + ", ".join(str(tag) for tag in tags)
 LABELING_PROMPT_TEMPLATE = """
+{system_persona}
 You are an AI Factuality Assessment Agent operating under the "Ali Arsanjani Factuality Factors" framework.
 Your goal is to mass-label video content, quantifying "Veracity Vectors" and "Modality Alignment".
 - Strings containing commas MUST be quoted.
 - ALL scores must be filled (use 0 if unsure, do not leave blank).
 - **MODALITY SCORING:** You must provide 3 distinct alignment scores: Video-Audio, Video-Caption, and Audio-Caption.
+- **TAGS:** {tag_list_text}
 **TOON SCHEMA:**
 {toon_schema}
 <thinking>
 """
+# Labeling prompt variant that ends on "**RESPONSE:**" instead of the opening
+# <thinking> tag that closes LABELING_PROMPT_TEMPLATE.
+# Placeholders: {system_persona}, {caption}, {transcript}, {tag_list_text},
+# {toon_schema}, {score_instructions}.
+# The doubled braces in "{{ Headers }}" are literal-brace escapes.
+# NOTE(review): that escaping suggests the template is filled with
+# str.format(); the call site is not visible in this diff -- confirm.
+LABELING_PROMPT_TEMPLATE_NO_COT = """
+{system_persona}
+You are an AI Factuality Assessment Agent operating under the "Ali Arsanjani Factuality Factors" framework.
+Your goal is to mass-label video content, quantifying "Veracity Vectors" and "Modality Alignment".
+**INPUT DATA:**
+- **User Caption:** "{caption}"
+- **Audio Transcript:** "{transcript}"
+- **Visuals:** (Provided in video context)
+**INSTRUCTIONS:**
+1.  **Grounding:** Cross-reference claims in the transcript with your internal knowledge base (and tools if active).
+2.  **Output Format:** Output strictly in **TOON** format (Token-Oriented Object Notation) as defined below.
+**CRITICAL CONSTRAINTS:**
+- Do NOT repeat the input data.
+- **DO NOT use Markdown code blocks.** (Output plain text only).
+- Use strict `Key : Type [ Count ] {{ Headers }} :` format followed by data lines.
+- Strings containing commas MUST be quoted.
+- ALL scores must be filled (use 0 if unsure, do not leave blank).
+- **MODALITY SCORING:** You must provide 3 distinct alignment scores: Video-Audio, Video-Caption, and Audio-Caption.
+- **TAGS:** {tag_list_text}
+**TOON SCHEMA:**
+{toon_schema}
+{score_instructions}
+**RESPONSE:**
+"""
 SCORE_INSTRUCTIONS_REASONING = """
 **Constraints:**
 1. Provide specific reasoning for EACH score in the `vectors` and `modalities` tables.
 final: assessment[1]{score,reasoning}:
 (Int 1-100),"Final synthesis of why this score was given"
+tags: keywords[1]{tags}:
+"Comma-separated list of tags"
 """
 SCHEMA_REASONING = """
 final: assessment[1]{score,reasoning}:
 (Int 1-100),"Final synthesis of why this score was given"
+tags: keywords[1]{tags}:
+"Comma-separated list of tags"
 """
 FCOT_MACRO_PROMPT = """
+{system_persona}
 **Fractal Chain of Thought - Stage 1: Macro-Scale Hypothesis (Wide Aperture)**
 You are analyzing a video for factuality.
 **Output Format**:
 Strictly fill out the following TOON schema based on the consensus. Do not include markdown code blocks.
+**TAGS GUIDANCE**: {tag_list_text}
 **TOON SCHEMA**:
 {toon_schema}