Spaces:

BtB-ExpC
/

Exercises

Sleeping

App Files Community

BtB-ExpC committed on Feb 12, 2025

Commit

42cb0d0

1 Parent(s): b3e1ebb

search_field

Browse files

Files changed (4) hide show

app/ui/prompts_tab.py +0 -2
app/ui/test_set_tab.py +2 -4
config/system_prompt_texts.py +6 -6
main.py +1 -0

app/ui/prompts_tab.py CHANGED Viewed

@@ -1,6 +1,4 @@
 import gradio as gr
-from chains.learning_objectives_generator.runner import run_learning_objectives_generator
-from config.llm_config import llms
 def build_prompts_tab():
     with gr.TabItem("🗒🚧️ See Prompts"):

 import gradio as gr
 def build_prompts_tab():
     with gr.TabItem("🗒🚧️ See Prompts"):

app/ui/test_set_tab.py CHANGED Viewed

@@ -1,6 +1,4 @@
 import gradio as gr
-from chains.learning_objectives_generator.runner import run_learning_objectives_generator
-from config.llm_config import llms
 def build_test_set_tab():
     with gr.TabItem("❔ Test Set"):
@@ -24,7 +22,7 @@ def build_test_set_tab():
             with gr.Column(scale=2):
                 pass # only here to keep the first column in check: force narrower dropdown
-        gr.HTML = gr.Textbox(label="Text Search 🚧", placeholder="Dummy placeholder element, doesn't work")
         with open("test_samples.md", "r", encoding="utf-8") as file:
             markdown_content = file.read()
@@ -33,4 +31,4 @@ def build_test_set_tab():
     # Return references
-    return (subset_choice, )

 import gradio as gr
 def build_test_set_tab():
     with gr.TabItem("❔ Test Set"):
             with gr.Column(scale=2):
                 pass # only here to keep the first column in check: force narrower dropdown
+        search_field = gr.Textbox(label="Text Search 🚧", placeholder="Dummy placeholder element, doesn't work")
         with open("test_samples.md", "r", encoding="utf-8") as file:
             markdown_content = file.read()
     # Return references
+    return (subset_choice, search_field, )

config/system_prompt_texts.py CHANGED Viewed

@@ -179,13 +179,13 @@ Do some reasoning first, and give your diagnosis then.
 template_diagnose_distractor_clearly_wrong_text = """
 <task_definition>
-   You assess multiple-choice exercise distractors (incorrect answer options) to identify any that are completely ineffective due to being too obviously wrong.
 </task_definition>
 <key_concepts>
     <effectiveness_criterion>
         A distractor is considered effective if it sounds plausible to at least some students. It's acceptable if most students would dismiss it, as long as not all of them would.
-        The given exercise is considered effective only if ALL distractors are effective
     </effectiveness_criterion>
     <failure_threshold>
@@ -198,16 +198,16 @@ template_diagnose_distractor_clearly_wrong_text = """
 </key_concepts>
 <analysis_guidance>
-    Your analysis should engage deeply with understanding the student perspective. Really try to vividly imagine this hypothetical Dumb Student, in line with the test's likely target demographic. They are bottom of their class. What would be their likely interpretations, their thought patterns? Really inhabit this perspective as you examine each distractor in the context of the exercise.
-    Explore multiple angles in your reasoning. Consider edge cases, alternative interpretations, and different ways different students might approach the exercise. Document your thought process thoroughly, showing the nuance in your considerations.
 </analysis_guidance>
 <output_requirements>
-    1. Focus solely on diagnosing the issue for the distractors in this exercise (no need to suggest improvements)
     2. Show detailed reasoning throughout your analysis
     3. Maintain nuance and depth in your exploration
-    4. Finally (and only then, in your very last sentence) conclude with a clear, direct final verdict about the
 </output_requirements>
 """

 template_diagnose_distractor_clearly_wrong_text = """
 <task_definition>
+   You assess multiple-choice exercise distractors (incorrect answer options) of a given exercise, to identify any distractors that are completely ineffective due to being too obviously wrong. Your final goal is to state your assessment of whether the exercise as a whole is acceptable or not.
 </task_definition>
 <key_concepts>
     <effectiveness_criterion>
         A distractor is considered effective if it sounds plausible to at least some students. It's acceptable if most students would dismiss it, as long as not all of them would.
+        The given exercise is acceptable only if ALL of its distractors are considered effective.
     </effectiveness_criterion>
     <failure_threshold>
 </key_concepts>
 <analysis_guidance>
+    Your analysis should engage deeply with understanding the student perspective in the context of this particular exercise. Really try to vividly imagine the hypothetical Dumb Student, in line with the test's likely target demographic. They are bottom of their class. What would be their likely interpretations, their thought patterns? Really inhabit this perspective as you carefully examine each distractor one by one.
+    Explore multiple angles in your reasoning. Consider edge cases, alternative interpretations, and different ways different students might approach the exercise. Take the exact phrasing of the exercise seriously. Document your thought process thoroughly, showing the nuance in your considerations.
 </analysis_guidance>
 <output_requirements>
+    1. Focus solely on diagnosing the issue for the given distractors (no need to suggest improvements)
     2. Show detailed reasoning throughout your analysis
     3. Maintain nuance and depth in your exploration
+    4. Finally (and only then, in your very last sentence) conclude with a clear, binary verdict about your diagnosis
 </output_requirements>
 """

main.py CHANGED Viewed

@@ -92,6 +92,7 @@ with gr.Blocks() as interface:
             # Build unfinished tab
             (subset_choice,
              ) = build_test_set_tab()
     # -------------------------------

             # Build unfinished tab
             (subset_choice,
+             search_field,
              ) = build_test_set_tab()
     # -------------------------------