Spaces:
Paused
Paused
Update app.py
Browse files
app.py
CHANGED
|
@@ -10,7 +10,7 @@ from datasets import load_dataset
|
|
| 10 |
from tokenizers import ByteLevelBPETokenizer
|
| 11 |
import trl
|
| 12 |
|
| 13 |
-
dataset = load_dataset("nroggendorff/openhermes", split="train")
|
| 14 |
|
| 15 |
def get_training_corpus():
|
| 16 |
for i in range(0, len(dataset), 1000):
|
|
|
|
| 10 |
from tokenizers import ByteLevelBPETokenizer
|
| 11 |
import trl
|
| 12 |
|
| 13 |
+
dataset = load_dataset("nroggendorff/openhermes", split="train")#.select(range(int(4e+4)))
|
| 14 |
|
| 15 |
def get_training_corpus():
|
| 16 |
for i in range(0, len(dataset), 1000):
|