Spaces: Paused
Update app.py
Browse files
app.py
CHANGED
|
@@ -9,7 +9,7 @@ import requests as rq
|
|
| 9 |
import gc
|
| 10 |
from tokenizers import ByteLevelBPETokenizer
|
| 11 |
|
| 12 |
-
dataset = load_dataset("nroggendorff/openhermes", split="train")
|
| 13 |
|
| 14 |
def get_training_corpus():
|
| 15 |
for i in range(0, len(dataset), 1000):
|
|
@@ -104,8 +104,7 @@ args = TrainingArguments(
|
|
| 104 |
save_steps=100000,
|
| 105 |
fp16=True,
|
| 106 |
optim="sgd",
|
| 107 |
-
optim_target_modules=["attn", "mlp"]
|
| 108 |
-
max_grad_norm=0.3
|
| 109 |
)
|
| 110 |
|
| 111 |
trainer = trl.SFTTrainer(
|
|
|
|
| 9 |
import gc
|
| 10 |
from tokenizers import ByteLevelBPETokenizer
|
| 11 |
|
| 12 |
+
dataset = load_dataset("nroggendorff/openhermes", split="train")#.select(range(int(5e+4)))
|
| 13 |
|
| 14 |
def get_training_corpus():
|
| 15 |
for i in range(0, len(dataset), 1000):
|
|
|
|
| 104 |
save_steps=100000,
|
| 105 |
fp16=True,
|
| 106 |
optim="sgd",
|
| 107 |
+
optim_target_modules=["attn", "mlp"]
|
|
|
|
| 108 |
)
|
| 109 |
|
| 110 |
trainer = trl.SFTTrainer(
|