Spaces:
Paused
Paused
Update train.py
Browse files
train.py
CHANGED
|
@@ -57,7 +57,7 @@ def load_data():
|
|
| 57 |
return dataset
|
| 58 |
|
| 59 |
def encode_decode(text, tok):
|
| 60 |
-
tokenized_texts =
|
| 61 |
texts,
|
| 62 |
padding="max_length",
|
| 63 |
truncation=True,
|
|
@@ -66,7 +66,7 @@ def encode_decode(text, tok):
|
|
| 66 |
).input_ids
|
| 67 |
|
| 68 |
if tokenized_texts.dim() >= 1:
|
| 69 |
-
decoded_texts =
|
| 70 |
else:
|
| 71 |
print('Found invalid entry in examples. Returning dummy..')
|
| 72 |
decoded_texts = ['Nothing to see here.']
|
|
|
|
| 57 |
return dataset
|
| 58 |
|
| 59 |
def encode_decode(text, tok):
|
| 60 |
+
tokenized_texts = tok(
|
| 61 |
texts,
|
| 62 |
padding="max_length",
|
| 63 |
truncation=True,
|
|
|
|
| 66 |
).input_ids
|
| 67 |
|
| 68 |
if tokenized_texts.dim() >= 1:
|
| 69 |
+
decoded_texts = tok.batch_decode(tokenized_texts)
|
| 70 |
else:
|
| 71 |
print('Found invalid entry in examples. Returning dummy..')
|
| 72 |
decoded_texts = ['Nothing to see here.']
|