File size: 336 Bytes
dcf87c3 |
1 2 3 4 5 6 7 8 9 10 11 12 |
# Flat list of dotted `key=value` override strings, one per list item.
# Each item is a plain YAML string; any conversion of the right-hand side
# (e.g. 8, 0.1, True, False) to a typed value is left to whatever reads this file.
# NOTE(review): the layout and the "nanot5" path segment below suggest these are
# Hydra overrides recorded for a nanoT5 training run — confirm against the launcher.
# NOTE(review): entry order is kept exactly as found; do not reorder without
# checking whether the consumer applies overrides sequentially.
- optim.name=adafactor
- optim.lr_scheduler=legacy
# Absolute path under a user's home directory: only resolves on a machine with
# the same filesystem layout. Presumably a local model/config template directory
# rather than a hub model id — verify before reusing elsewhere.
- model.name=/home/jovyan/bert-train/nanot5/templates/base_slavic_120k_sub
# Presumably the number of gradient-accumulation steps — TODO confirm.
- optim.grad_acc=8
- model.overwrite.dropout_rate=0.1
- model.klass=hf_t5
# Step-based intervals/limits: eval every 5000, checkpoint every 10000,
# 120000 total. Both intervals divide the total evenly.
- eval.every_steps=5000
- optim.total_steps=120000
# Presumably tells the model config that bf16 is in use; whether this alone
# enables mixed precision cannot be determined from this file — verify.
- model.add_config.is_bf16=True
- checkpoint.every_steps=10000
- model.compile=False
|