pretrain model
Browse files
scripts/pretrain-model.yaml
CHANGED
@@ -7,8 +7,8 @@ model_name: "Llama-3.2-1B"
|
|
7 |
# A ``litgpt.Config`` object to define the model architecture. Mutually exclusive with
|
8 |
# ``model_name``. (type: Optional[Config], default: null)
|
9 |
model_config:
|
10 |
-
padded_vocab_size:
|
11 |
-
vocab_size:
|
12 |
block_size: 8192
|
13 |
n_layer: 8
|
14 |
n_head: 32
|
|
|
7 |
# A ``litgpt.Config`` object to define the model architecture. Mutually exclusive with
|
8 |
# ``model_name``. (type: Optional[Config], default: null)
|
9 |
model_config:
|
10 |
+
padded_vocab_size: 32768
|
11 |
+
vocab_size: 32768
|
12 |
block_size: 8192
|
13 |
n_layer: 8
|
14 |
n_head: 32
|