Rulga committed on
Commit
c564619
·
1 Parent(s): 6f3f7b2

Refactor evaluation interface: Update label for evaluated pairs checkbox and improve documentation for QA pairs dataframe function.

Browse files
Files changed (2) hide show
  1. app.py +1 -1
  2. web/evaluation_interface.py +7 -5
app.py CHANGED
@@ -1247,7 +1247,7 @@ with gr.Blocks(css="""
1247
 
1248
  # QA pairs table section
1249
  show_evaluated = gr.Checkbox(
1250
- label="Show Already Evaluated Pairs",
1251
  value=False
1252
  )
1253
  qa_table = gr.Dataframe(
 
1247
 
1248
  # QA pairs table section
1249
  show_evaluated = gr.Checkbox(
1250
+ label="Show Only Evaluated Pairs",
1251
  value=False
1252
  )
1253
  qa_table = gr.Dataframe(
web/evaluation_interface.py CHANGED
@@ -56,23 +56,24 @@ def get_qa_pairs_dataframe(evaluator, show_evaluated=False, force_reload=False):
56
 
57
  Args:
58
  evaluator: ChatEvaluator instance
59
- show_evaluated: If True, include already evaluated pairs
60
  force_reload: If True, force reload from dataset
61
 
62
  Returns:
63
  DataFrame with QA pairs
64
  """
65
  try:
66
- # Get QA pairs with potential force reload
67
  qa_pairs = evaluator.get_qa_pairs_for_evaluation(limit=100, force_reload=force_reload)
68
 
69
  # Get annotations
70
  annotations = evaluator.get_annotations(force_reload=force_reload)
71
  evaluated_ids = {a.get("conversation_id") for a in annotations}
72
 
73
- # Filter out already evaluated pairs if needed
74
- if not show_evaluated:
75
- qa_pairs = [qa for qa in qa_pairs if qa["conversation_id"] not in evaluated_ids]
 
76
 
77
  # Convert to DataFrame
78
  if qa_pairs:
@@ -91,6 +92,7 @@ def get_qa_pairs_dataframe(evaluator, show_evaluated=False, force_reload=False):
91
  else:
92
  import pandas as pd
93
  return pd.DataFrame(columns=["Conversation ID", "Question", "Answer", "Evaluated"])
 
94
  except Exception as e:
95
  logger.error(f"Error getting QA pairs dataframe: {e}")
96
  import pandas as pd
 
56
 
57
  Args:
58
  evaluator: ChatEvaluator instance
59
+ show_evaluated: If True, show only evaluated pairs. If False, show all pairs
60
  force_reload: If True, force reload from dataset
61
 
62
  Returns:
63
  DataFrame with QA pairs
64
  """
65
  try:
66
+ # Get QA pairs
67
  qa_pairs = evaluator.get_qa_pairs_for_evaluation(limit=100, force_reload=force_reload)
68
 
69
  # Get annotations
70
  annotations = evaluator.get_annotations(force_reload=force_reload)
71
  evaluated_ids = {a.get("conversation_id") for a in annotations}
72
 
73
+ # Filter pairs based on show_evaluated flag
74
+ if show_evaluated:
75
+ # Show only evaluated pairs
76
+ qa_pairs = [qa for qa in qa_pairs if qa["conversation_id"] in evaluated_ids]
77
 
78
  # Convert to DataFrame
79
  if qa_pairs:
 
92
  else:
93
  import pandas as pd
94
  return pd.DataFrame(columns=["Conversation ID", "Question", "Answer", "Evaluated"])
95
+
96
  except Exception as e:
97
  logger.error(f"Error getting QA pairs dataframe: {e}")
98
  import pandas as pd