Update app.py
Browse files
app.py
CHANGED
|
@@ -17,8 +17,7 @@ def train_model(number):
|
|
| 17 |
number = int(number)
|
| 18 |
try:
|
| 19 |
dataset = load_dataset("allenai/c4", "sk", split="train", streaming=True)
|
| 20 |
-
slovak_texts =
|
| 21 |
-
|
| 22 |
inputs = tokenizer(
|
| 23 |
slovak_texts,
|
| 24 |
return_tensors="pt",
|
|
|
|
| 17 |
number = int(number)
|
| 18 |
try:
|
| 19 |
dataset = load_dataset("allenai/c4", "sk", split="train", streaming=True)
|
| 20 |
+
slovak_texts = [example['text'] for example in dataset.take(number)]
|
|
|
|
| 21 |
inputs = tokenizer(
|
| 22 |
slovak_texts,
|
| 23 |
return_tensors="pt",
|