Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
|
@@ -599,7 +599,7 @@ class OnnxBgeEmbeddings(Embeddings):
|
|
| 599 |
class LLMEvaluator:
|
| 600 |
def __init__(self):
|
| 601 |
# Qwen 2.5 0.5B is fast but needs "Few-Shot" examples to be strict.
|
| 602 |
-
self.repo_id = "onnx-community/Qwen2.5-0.5B-Instruct"
|
| 603 |
self.local_dir = "onnx_qwen_local"
|
| 604 |
|
| 605 |
print(f"🔄 Preparing CPU LLM: {self.repo_id}...")
|
|
@@ -637,8 +637,8 @@ class LLMEvaluator:
|
|
| 637 |
Your job is to check if the Student Answer is FACTUALLY present in the Context.
|
| 638 |
|
| 639 |
GRADING ALGORITHM:
|
| 640 |
-
1. IF the Student Answer mentions things NOT in the Context -> PENALTY (-
|
| 641 |
-
2. IF the Student Answer interprets the text opposite to its meaning -> PENALTY (-100%).
|
| 642 |
3. IF the Student Answer is generic fluff -> SCORE: 0.
|
| 643 |
|
| 644 |
--- EXAMPLE 1 (HALLUCINATION) ---
|
|
|
|
| 599 |
class LLMEvaluator:
|
| 600 |
def __init__(self):
|
| 601 |
# Qwen 2.5 0.5B is fast but needs "Few-Shot" examples to be strict.
|
| 602 |
+
self.repo_id = "onnx-community/Qwen2.5-1.5B-Instruct"
|
| 603 |
self.local_dir = "onnx_qwen_local"
|
| 604 |
|
| 605 |
print(f"🔄 Preparing CPU LLM: {self.repo_id}...")
|
|
|
|
| 637 |
Your job is to check if the Student Answer is FACTUALLY present in the Context.
|
| 638 |
|
| 639 |
GRADING ALGORITHM:
|
| 640 |
+
1. IF the Student Answer mentions things NOT in the Context -> PENALTY (-50% of the marks).
|
| 641 |
+
2. IF the Student Answer interprets the text opposite to its meaning -> PENALTY (-100% of the marks).
|
| 642 |
3. IF the Student Answer is generic fluff -> SCORE: 0.
|
| 643 |
|
| 644 |
--- EXAMPLE 1 (HALLUCINATION) ---
|