Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
|
@@ -168,7 +168,7 @@ def run_evaluation(num_samples, progress=gr.Progress()):
|
|
| 168 |
# 📊 CUAD Model Evaluation Results
|
| 169 |
|
| 170 |
## 🎯 Overall Performance
|
| 171 |
-
- **Model**: AvocadoMuffin/roberta-cuad-qa-
|
| 172 |
- **Dataset**: CUAD (Contract Understanding Atticus Dataset)
|
| 173 |
- **Samples Evaluated**: {len(exact_matches)}
|
| 174 |
- **Evaluation Date**: {datetime.now().strftime("%Y-%m-%d %H:%M:%S")}
|
|
@@ -191,7 +191,7 @@ def run_evaluation(num_samples, progress=gr.Progress()):
|
|
| 191 |
results_file = f"cuad_evaluation_results_{timestamp}.json"
|
| 192 |
|
| 193 |
detailed_results = {
|
| 194 |
-
"model_name": "AvocadoMuffin/roberta-cuad-qa-
|
| 195 |
"dataset": "cuad",
|
| 196 |
"num_samples": len(exact_matches),
|
| 197 |
"exact_match_score": avg_exact_match,
|
|
|
|
| 168 |
# 📊 CUAD Model Evaluation Results
|
| 169 |
|
| 170 |
## 🎯 Overall Performance
|
| 171 |
+
- **Model**: AvocadoMuffin/roberta-cuad-qa-v3
|
| 172 |
- **Dataset**: CUAD (Contract Understanding Atticus Dataset)
|
| 173 |
- **Samples Evaluated**: {len(exact_matches)}
|
| 174 |
- **Evaluation Date**: {datetime.now().strftime("%Y-%m-%d %H:%M:%S")}
|
|
|
|
| 191 |
results_file = f"cuad_evaluation_results_{timestamp}.json"
|
| 192 |
|
| 193 |
detailed_results = {
|
| 194 |
+
"model_name": "AvocadoMuffin/roberta-cuad-qa-v3",
|
| 195 |
"dataset": "cuad",
|
| 196 |
"num_samples": len(exact_matches),
|
| 197 |
"exact_match_score": avg_exact_match,
|