Update README.md
Browse files
README.md
CHANGED
@@ -81,6 +81,15 @@ python3 -m fastchat.serve.cli --model-path LLM360/AmberChat
 | Max Seq Length | 2048 |
 | Vocab Size | 32000 |
 
+| Training Hyperparameter | Value |
+| ----------- | ----------- |
+| learning_rate | 2e-5 |
+| num_train_epochs | 3 |
+| per_device_train_batch_size | 2 |
+| gradient_accumulation_steps | 16 |
+| warmup_ratio | 0.04 |
+| model_max_length | 2048 |
+
 
 # Evaluation
 