flamiry committed on
Commit
140e2c5
·
verified ·
1 Parent(s): b9cc8c8

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -2
app.py CHANGED
@@ -17,8 +17,7 @@ def train_model(number):
17
  number = int(number)
18
  try:
19
  dataset = load_dataset("allenai/c4", "sk", split="train", streaming=True)
20
- slovak_texts = list(dataset.take(number))
21
-
22
  inputs = tokenizer(
23
  slovak_texts,
24
  return_tensors="pt",
 
17
  number = int(number)
18
  try:
19
  dataset = load_dataset("allenai/c4", "sk", split="train", streaming=True)
20
+ slovak_texts = [example['text'] for example in dataset.take(number)]
 
21
  inputs = tokenizer(
22
  slovak_texts,
23
  return_tensors="pt",