File size: 940 Bytes
18187e5
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
{
    "output_dir": "output/user-baichuan2-13b-v2-3.6",
    "model_name_or_path": "/home/jiakangxiang/.cache/modelscope/hub/baichuan-inc/Baichuan2-13B-Chat",
    "train_file": "./data/train.jsonl",
    "template_name": "baichuan2",
    "num_train_epochs": 1,
    "per_device_train_batch_size": 1,
    "gradient_accumulation_steps": 16,
    "learning_rate": 0.0001,
    "max_seq_length": 3200,
    "logging_steps": 10,
    "save_steps": 100,
    "save_total_limit": 3,
    "lr_scheduler_type": "constant_with_warmup",
    "warmup_steps": 50,
    "lora_rank": 16,
    "lora_alpha": 16,
    "lora_dropout": 0.05,
    "gradient_checkpointing": true,
    "disable_tqdm": false,
    "optim": "paged_adamw_32bit",
    "seed": 42,
    "fp16": true,
    "bf16": false,
    "report_to": "tensorboard",
    "dataloader_num_workers": 0,
    "save_strategy": "steps",
    "weight_decay": 0,
    "max_grad_norm": 0.3,
    "remove_unused_columns": false
}