retry
Browse files
- app/ui/prompts_tab.py +2 -3
- app/ui/test_set_tab.py +1 -1
- config/system_prompt_texts.py +1 -1
app/ui/prompts_tab.py
CHANGED
|
@@ -22,8 +22,7 @@ def build_prompts_tab():
|
|
| 22 |
with gr.Column(scale=2):
|
| 23 |
pass # only here to keep the first column in check: force narrower dropdown
|
| 24 |
|
| 25 |
-
|
| 26 |
-
|
| 27 |
|
| 28 |
# Return references
|
| 29 |
-
return (pipeline_choice, )
|
|
|
|
| 22 |
with gr.Column(scale=2):
|
| 23 |
pass # only here to keep the first column in check: force narrower dropdown
|
| 24 |
|
| 25 |
+
search_field = gr.Textbox(label="Text Search 🚧", placeholder="Dummy placeholder element, doesn't work")
|
|
|
|
| 26 |
|
| 27 |
# Return references
|
| 28 |
+
return (pipeline_choice, search_field, )
|
app/ui/test_set_tab.py
CHANGED
|
@@ -27,7 +27,7 @@ def build_test_set_tab():
|
|
| 27 |
with open("test_samples.md", "r", encoding="utf-8") as file:
|
| 28 |
markdown_content = file.read()
|
| 29 |
|
| 30 |
-
|
| 31 |
|
| 32 |
|
| 33 |
# Return references
|
|
|
|
| 27 |
with open("test_samples.md", "r", encoding="utf-8") as file:
|
| 28 |
markdown_content = file.read()
|
| 29 |
|
| 30 |
+
gr.Markdown(markdown_content)
|
| 31 |
|
| 32 |
|
| 33 |
# Return references
|
config/system_prompt_texts.py
CHANGED
|
@@ -185,7 +185,7 @@ template_diagnose_distractor_clearly_wrong_text = """
|
|
| 185 |
<key_concepts>
|
| 186 |
<effectiveness_criterion>
|
| 187 |
A distractor is considered effective if it sounds plausible to at least some students. It's acceptable if most students would dismiss it, as long as not all of them would.
|
| 188 |
-
The given exercise is acceptable only if ALL of its distractors are considered effective.
|
| 189 |
</effectiveness_criterion>
|
| 190 |
|
| 191 |
<failure_threshold>
|
|
|
|
| 185 |
<key_concepts>
|
| 186 |
<effectiveness_criterion>
|
| 187 |
A distractor is considered effective if it sounds plausible to at least some students. It's acceptable if most students would dismiss it, as long as not all of them would.
|
| 188 |
+
The given exercise is acceptable only if ALL of its distractors are considered effective .
|
| 189 |
</effectiveness_criterion>
|
| 190 |
|
| 191 |
<failure_threshold>
|