Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
@@ -168,7 +168,7 @@ def run_evaluation(num_samples, progress=gr.Progress()):
|
|
168 |
# 📊 CUAD Model Evaluation Results
|
169 |
|
170 |
## 🎯 Overall Performance
|
171 |
-
- **Model**: AvocadoMuffin/roberta-cuad-qa-
|
172 |
- **Dataset**: CUAD (Contract Understanding Atticus Dataset)
|
173 |
- **Samples Evaluated**: {len(exact_matches)}
|
174 |
- **Evaluation Date**: {datetime.now().strftime("%Y-%m-%d %H:%M:%S")}
|
@@ -191,7 +191,7 @@ def run_evaluation(num_samples, progress=gr.Progress()):
|
|
191 |
results_file = f"cuad_evaluation_results_{timestamp}.json"
|
192 |
|
193 |
detailed_results = {
|
194 |
-
"model_name": "AvocadoMuffin/roberta-cuad-qa-
|
195 |
"dataset": "cuad",
|
196 |
"num_samples": len(exact_matches),
|
197 |
"exact_match_score": avg_exact_match,
|
|
|
168 |
# 📊 CUAD Model Evaluation Results
|
169 |
|
170 |
## 🎯 Overall Performance
|
171 |
+
- **Model**: AvocadoMuffin/roberta-cuad-qa-v3
|
172 |
- **Dataset**: CUAD (Contract Understanding Atticus Dataset)
|
173 |
- **Samples Evaluated**: {len(exact_matches)}
|
174 |
- **Evaluation Date**: {datetime.now().strftime("%Y-%m-%d %H:%M:%S")}
|
|
|
191 |
results_file = f"cuad_evaluation_results_{timestamp}.json"
|
192 |
|
193 |
detailed_results = {
|
194 |
+
"model_name": "AvocadoMuffin/roberta-cuad-qa-v3",
|
195 |
"dataset": "cuad",
|
196 |
"num_samples": len(exact_matches),
|
197 |
"exact_match_score": avg_exact_match,
|