Spaces:
Running
Running
Refactor evaluation interface: Update label for evaluated pairs checkbox and improve documentation for QA pairs dataframe function.
Browse files
- app.py +1 -1
- web/evaluation_interface.py +7 -5
app.py
CHANGED
|
@@ -1247,7 +1247,7 @@ with gr.Blocks(css="""
|
|
| 1247 |
|
| 1248 |
# QA pairs table section
|
| 1249 |
show_evaluated = gr.Checkbox(
|
| 1250 |
-
label="Show
|
| 1251 |
value=False
|
| 1252 |
)
|
| 1253 |
qa_table = gr.Dataframe(
|
|
|
|
| 1247 |
|
| 1248 |
# QA pairs table section
|
| 1249 |
show_evaluated = gr.Checkbox(
|
| 1250 |
+
label="Show Only Evaluated Pairs",
|
| 1251 |
value=False
|
| 1252 |
)
|
| 1253 |
qa_table = gr.Dataframe(
|
web/evaluation_interface.py
CHANGED
|
@@ -56,23 +56,24 @@ def get_qa_pairs_dataframe(evaluator, show_evaluated=False, force_reload=False):
|
|
| 56 |
|
| 57 |
Args:
|
| 58 |
evaluator: ChatEvaluator instance
|
| 59 |
-
show_evaluated: If True,
|
| 60 |
force_reload: If True, force reload from dataset
|
| 61 |
|
| 62 |
Returns:
|
| 63 |
DataFrame with QA pairs
|
| 64 |
"""
|
| 65 |
try:
|
| 66 |
-
# Get QA pairs
|
| 67 |
qa_pairs = evaluator.get_qa_pairs_for_evaluation(limit=100, force_reload=force_reload)
|
| 68 |
|
| 69 |
# Get annotations
|
| 70 |
annotations = evaluator.get_annotations(force_reload=force_reload)
|
| 71 |
evaluated_ids = {a.get("conversation_id") for a in annotations}
|
| 72 |
|
| 73 |
-
# Filter
|
| 74 |
-
if
|
| 75 |
-
|
|
|
|
| 76 |
|
| 77 |
# Convert to DataFrame
|
| 78 |
if qa_pairs:
|
|
@@ -91,6 +92,7 @@ def get_qa_pairs_dataframe(evaluator, show_evaluated=False, force_reload=False):
|
|
| 91 |
else:
|
| 92 |
import pandas as pd
|
| 93 |
return pd.DataFrame(columns=["Conversation ID", "Question", "Answer", "Evaluated"])
|
|
|
|
| 94 |
except Exception as e:
|
| 95 |
logger.error(f"Error getting QA pairs dataframe: {e}")
|
| 96 |
import pandas as pd
|
|
|
|
| 56 |
|
| 57 |
Args:
|
| 58 |
evaluator: ChatEvaluator instance
|
| 59 |
+
show_evaluated: If True, show only evaluated pairs. If False, show all pairs
|
| 60 |
force_reload: If True, force reload from dataset
|
| 61 |
|
| 62 |
Returns:
|
| 63 |
DataFrame with QA pairs
|
| 64 |
"""
|
| 65 |
try:
|
| 66 |
+
# Get QA pairs
|
| 67 |
qa_pairs = evaluator.get_qa_pairs_for_evaluation(limit=100, force_reload=force_reload)
|
| 68 |
|
| 69 |
# Get annotations
|
| 70 |
annotations = evaluator.get_annotations(force_reload=force_reload)
|
| 71 |
evaluated_ids = {a.get("conversation_id") for a in annotations}
|
| 72 |
|
| 73 |
+
# Filter pairs based on show_evaluated flag
|
| 74 |
+
if show_evaluated:
|
| 75 |
+
# Show only evaluated pairs
|
| 76 |
+
qa_pairs = [qa for qa in qa_pairs if qa["conversation_id"] in evaluated_ids]
|
| 77 |
|
| 78 |
# Convert to DataFrame
|
| 79 |
if qa_pairs:
|
|
|
|
| 92 |
else:
|
| 93 |
import pandas as pd
|
| 94 |
return pd.DataFrame(columns=["Conversation ID", "Question", "Answer", "Evaluated"])
|
| 95 |
+
|
| 96 |
except Exception as e:
|
| 97 |
logger.error(f"Error getting QA pairs dataframe: {e}")
|
| 98 |
import pandas as pd
|