Spaces:
Sleeping
Sleeping
Nicolai Berk
committed on
Commit
·
456bc55
1
Parent(s):
cdedfb1
Fix data loader
Browse files
app.py
CHANGED
|
@@ -8,8 +8,8 @@ from transformers import AutoTokenizer, AutoModelForCausalLM, pipeline
|
|
| 8 |
|
| 9 |
# Load corpus
|
| 10 |
print("Loading dataset...")
|
| 11 |
-
dataset = load_dataset("rag-datasets/rag-mini-wikipedia", "text-corpus"
|
| 12 |
-
corpus = [
|
| 13 |
|
| 14 |
# Embedding model
|
| 15 |
print("Encoding corpus...")
|
|
|
|
| 8 |
|
| 9 |
# Load corpus
|
| 10 |
print("Loading dataset...")
|
| 11 |
+
dataset = load_dataset("rag-datasets/rag-mini-wikipedia", "text-corpus")
|
| 12 |
+
corpus = [item for item in dataset["passages"]]
|
| 13 |
|
| 14 |
# Embedding model
|
| 15 |
print("Encoding corpus...")
|