Spaces:
Running
on
Zero
Running
on
Zero
Nicolai Berk
committed on
Commit
·
456bc55
1
Parent(s):
cdedfb1
Fix data loader
Browse files
app.py
CHANGED
@@ -8,8 +8,8 @@ from transformers import AutoTokenizer, AutoModelForCausalLM, pipeline
|
|
8 |
|
9 |
# Load corpus
|
10 |
print("Loading dataset...")
|
11 |
-
dataset = load_dataset("rag-datasets/rag-mini-wikipedia", "text-corpus"
|
12 |
-
corpus = [
|
13 |
|
14 |
# Embedding model
|
15 |
print("Encoding corpus...")
|
|
|
8 |
|
9 |
# Load corpus
|
10 |
print("Loading dataset...")
|
11 |
+
dataset = load_dataset("rag-datasets/rag-mini-wikipedia", "text-corpus")
|
12 |
+
corpus = [item for item in dataset["passages"]]
|
13 |
|
14 |
# Embedding model
|
15 |
print("Encoding corpus...")
|