Spaces:
Sleeping
Sleeping
Michela committed on
Commit ·
05202ae
1
Parent(s): ff0861b
Update app.py
Browse files
app.py
CHANGED
|
@@ -2,22 +2,11 @@
|
|
| 2 |
import gradio as gr
|
| 3 |
import pandas as pd
|
| 4 |
from difflib import SequenceMatcher
|
| 5 |
-
import os
|
| 6 |
-
|
| 7 |
-
# Get script's directory
|
| 8 |
-
script_dir = os.path.dirname(os.path.abspath(__file__))
|
| 9 |
-
|
| 10 |
-
### Debugging ###
|
| 11 |
-
# Print the contents of the data directory
|
| 12 |
-
data_path = os.path.join(os.path.dirname(os.path.abspath(__file__)), "data/retrieval_results/sonnini_original_ocr")
|
| 13 |
-
print(f"Checking folder: {data_path}")
|
| 14 |
-
print("Files in directory:", os.listdir(data_path) if os.path.exists(data_path) else "Directory not found!")
|
| 15 |
-
####
|
| 16 |
|
| 17 |
# Import results
|
| 18 |
-
results_clean = pd.read_csv("
|
| 19 |
-
results_prep = pd.read_csv("
|
| 20 |
-
results_orig = pd.read_csv("
|
| 21 |
|
| 22 |
# Drop 'text_prep' from results_orig
|
| 23 |
results_clean.drop(columns=['text_prep'], inplace=True)
|
|
|
|
| 2 |
import gradio as gr
|
| 3 |
import pandas as pd
|
| 4 |
from difflib import SequenceMatcher
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 5 |
|
| 6 |
# Import results
|
| 7 |
+
results_clean = pd.read_csv("data/retrieval_results/sonnini_cleaned/i_onit-sonnini-DHd2025-clean-q_Pferd, Pferde.csv").head(100)
|
| 8 |
+
results_prep = pd.read_csv("data/retrieval_results/sonnini_llm_corrected/i_onit-sonnini-DHd2025-prep-q_Pferd, Pferde.csv").head(100)
|
| 9 |
+
results_orig = pd.read_csv("data/retrieval_results/sonnini_original_ocr/i_onit-test-index-sonnini-q_Pferd-Pferde.csv").head(100)
|
| 10 |
|
| 11 |
# Drop 'text_prep' from results_orig
|
| 12 |
results_clean.drop(columns=['text_prep'], inplace=True)
|