Update README.md
Browse files
README.md
CHANGED
@@ -28,7 +28,7 @@ flash_attention: true
|
|
28 |
gradient_accumulation_steps: 4
|
29 |
gradient_checkpointing: true
|
30 |
hf_use_auth_token: true
|
31 |
-
hub_model_id: ibivibiv/
|
32 |
learning_rate: 0.0002
|
33 |
load_in_4bit: true
|
34 |
logging_steps: 1
|
@@ -59,7 +59,7 @@ warmup_steps: 10
|
|
59 |
|
60 |
# math-llama-3-8b-instruct
|
61 |
|
62 |
-
This model is a fine-tuned version of [meta-llama/Meta-Llama-3-8B-Instruct](https://huggingface.co/meta-llama/Meta-Llama-3-8B-Instruct) on the
|
63 |
|
64 |
## Model description
|
65 |
|
|
|
28 |
gradient_accumulation_steps: 4
|
29 |
gradient_checkpointing: true
|
30 |
hf_use_auth_token: true
|
31 |
+
hub_model_id: ibivibiv/llama-3-8b-instruct-alpaca-gpt-4
|
32 |
learning_rate: 0.0002
|
33 |
load_in_4bit: true
|
34 |
logging_steps: 1
|
|
|
59 |
|
60 |
# math-llama-3-8b-instruct
|
61 |
|
62 |
+
This model is a fine-tuned version of [meta-llama/Meta-Llama-3-8B-Instruct](https://huggingface.co/meta-llama/Meta-Llama-3-8B-Instruct) on the alpaca-gpt-4 dataset.
|
63 |
|
64 |
## Model description
|
65 |
|