mtasic85 committed on
Commit
652f453
1 Parent(s): f3788fa

pretrain model

Browse files
Files changed (1) hide show
  1. scripts/pretrain-model.yaml +2 -2
scripts/pretrain-model.yaml CHANGED
@@ -7,8 +7,8 @@ model_name: "Llama-3.2-1B"
7
  # A ``litgpt.Config`` object to define the model architecture. Mutually exclusive with
8
  # ``model_name``. (type: Optional[Config], default: null)
9
  model_config:
10
- padded_vocab_size: 38400
11
- vocab_size: 38400
12
  block_size: 8192
13
  n_layer: 8
14
  n_head: 32
 
7
  # A ``litgpt.Config`` object to define the model architecture. Mutually exclusive with
8
  # ``model_name``. (type: Optional[Config], default: null)
9
  model_config:
10
+ padded_vocab_size: 32768
11
+ vocab_size: 32768
12
  block_size: 8192
13
  n_layer: 8
14
  n_head: 32