File size: 832 Bytes
1fab95f |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 |
{
"repo_id": "habanoz/haber-gpt-3-40M-8k-c4tr-v1.003",
"trainer_config": {
"seed": 145,
"seq_length": 1024,
"gradient_accumulation_steps": 6,
"batch_size": 40,
"data_dir": "c4tr.003",
"max_iters": 20000,
"warmup_iters": 2000,
"grad_norm_clip": 1.0,
"out_dir": "haber-gpt-3-40M-8k-c4tr-v1.003",
"dtype": "float16",
"compile": true,
"gc": false,
"learning_rate": 0.0018,
"decay_lr": true,
"lr_decay_iters": 20000,
"min_lr": 0.00018,
"weight_decay": 0.1,
"beta1": 0.9,
"beta2": 0.95,
"log_interval": 50,
"eval_interval": 1000,
"eval_iters": 100,
"promised_flops": 65000000000000.0,
"wandb_log": true,
"wandb_project": "Haber-GPT-3-40M",
"wandb_run_name": "haber-gpt-3-40M-8k-c4tr-v1.003",
"wandb_run_id": "1733943696"
}
}