diana3135 committed on
Commit
4010b2c
·
1 Parent(s): 0c0398a

add alignment and inimitability, remove comment

Browse files
Files changed (1) hide show
  1. utils.py +17 -17
utils.py CHANGED
@@ -71,22 +71,22 @@ def modify_with_suggestion(task_description, text, suggestions, api_key = None):
71
 
72
  def get_evaluation_with_gpt(task_description, text, api_key=None):
73
  prompt = (
74
- f"Given the task: {task_description}, the provided answer is: {text}\n"
75
- f"Evaluate the answer using a scale from 0 to 10. Scores should reflect stricter quality thresholds:\n"
76
- f"0-4 indicates below-average quality with significant shortcomings.\n"
77
- f"5-6 represents acceptable quality.\n"
78
- f"7-8 signifies good quality, showing substantial thought.\n"
79
- f"9-10 represents exceptional quality, with insightful, and highly concrete suggestions.\n\n"
80
- f"When evaluating, use the entire scoring range and avoid defaulting to mid-range scores.\n\n"
81
- f"Evaluate based on the criteria:\n\n"
82
- f"Novelty: The uniqueness and innovation of the ideas."
83
- f"Implementability: The practicality of suggested actions.\n"
84
- f"Inimitability: Difficult for competitors to replicate.\n"
85
-
86
- f"Please format the output exactly as follows:\n"
87
- f"Novelty: [Score]\nComment: [Short comment on Novelty]\n"
88
- f"Implementability: [Score]\nComment: [Short comment on Implementability]\n"
89
- f"Inimitability: [Score]\nComment: [Short comment on Inimitability]\n"
90
- f"Overall Score: [Score]\nOverall Comment: [Overall feedback]\n"
91
  )
92
  return generate_text_with_gpt(prompt, api_key)
 
71
 
72
  def get_evaluation_with_gpt(task_description, text, api_key=None):
73
  prompt = (
74
+ f"Given the task: {task_description}, the provided answer is: {text}\n"
75
+ f"Evaluate the answer using a scale from 0 to 10. Scores should reflect how well the ideas fit each specific evaluation criteria:\n"
76
+ f"0-2: Poor fit; the idea demonstrates minimal relevance to the criteria.\n"
77
+ f"3-5: Partial fit; the idea shows some relevance but contains significant shortcomings.\n"
78
+ f"6-8: Good fit; the idea aligns well with the criteria, showing clear relevance and thoughtfulness.\n"
79
+ f"9-10: Excellent fit; the idea fully aligns with the criteria, demonstrating exceptional insight.\n\n"
80
+ f"When evaluating, use the entire scoring range and avoid defaulting to mid-range scores.\n\n"
81
+ f"Evaluate based on the following criteria:\n"
82
+ f"Novelty: The uniqueness and innovation of the ideas.\n"
83
+ f"Implementability: The practicality of suggested actions.\n"
84
+ f"Inimitability: The difficulty for competitors to replicate the ideas.\n"
85
+ f"Alignment: The degree to which the ideas align with Airbnb’s goals and 17 SDGs.\n\n"
86
+ f"Please format the output exactly as follows:\n"
87
+ f"Novelty: [Score]\n"
88
+ f"Implementability: [Score]\n"
89
+ f"Inimitability: [Score]\n"
90
+ f"Alignment: [Score]\n"
91
  )
92
  return generate_text_with_gpt(prompt, api_key)