Update README.md
Browse files
README.md
CHANGED
|
@@ -6,7 +6,25 @@ metrics:
|
|
| 6 |
- rouge
|
| 7 |
pipeline_tag: summarization
|
| 8 |
---
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 9 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10 |
|
| 11 |
# Training Results
|
| 12 |
|
|
|
|
| 6 |
- rouge
|
| 7 |
pipeline_tag: summarization
|
| 8 |
---
|
| 9 |
+
# Hyperparameters
|
| 10 |
+
learning_rate=2e-5
|
| 11 |
+
per_device_train_batch_size=14
|
| 12 |
+
per_device_eval_batch_size=14
|
| 13 |
+
weight_decay=0.01
|
| 14 |
+
save_total_limit=3
|
| 15 |
+
num_train_epochs=3
|
| 16 |
+
predict_with_generate=True
|
| 17 |
+
fp16=True
|
| 18 |
|
| 19 |
+
# Training Output
|
| 20 |
+
global_step=3003,
|
| 21 |
+
training_loss=2.5178213735600132,
|
| 22 |
+
metrics={'train_runtime': 8703.174,
|
| 23 |
+
'train_samples_per_second': 4.83,
|
| 24 |
+
'train_steps_per_second': 0.345,
|
| 25 |
+
'total_flos': 9.272950245870797e+16,
|
| 26 |
+
'train_loss': 2.5178213735600132,
|
| 27 |
+
'epoch': 3.0}
|
| 28 |
|
| 29 |
# Training Results
|
| 30 |
|