Update README.md
Browse files
README.md
CHANGED
|
@@ -81,6 +81,15 @@ python3 -m fastchat.serve.cli --model-path LLM360/AmberChat
|
|
| 81 |
| Max Seq Length | 2048 |
|
| 82 |
| Vocab Size | 32000 |
|
| 83 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 84 |
|
| 85 |
# Evaluation
|
| 86 |
|
|
|
|
| 81 |
| Max Seq Length | 2048 |
|
| 82 |
| Vocab Size | 32000 |
|
| 83 |
|
| 84 |
+
| Training Hyperparameter | Value |
|
| 85 |
+
| ----------- | ----------- |
|
| 86 |
+
| learning_rate | 2e-5 |
|
| 87 |
+
| num_train_epochs | 3 |
|
| 88 |
+
| per_device_train_batch_size | 2 |
|
| 89 |
+
| gradient_accumulation_steps | 16 |
|
| 90 |
+
| warmup_ratio | 0.04 |
|
| 91 |
+
| model_max_length | 2048 |
|
| 92 |
+
|
| 93 |
|
| 94 |
# Evaluation
|
| 95 |
|