lingchensanwen committed on
Commit
4f9c29d
·
verified ·
1 Parent(s): f801920

Upload qlora.yml

Browse files
Files changed (1) hide show
  1. qlora.yml +99 -0
qlora.yml ADDED
@@ -0,0 +1,99 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ base_model: meta-llama/Llama-2-7b-chat-hf
2
+ model_type: LlamaForCausalLM
3
+ tokenizer_type: LlamaTokenizer
4
+ # hub_model_id: llama2-generation
5
+
6
+ load_in_8bit: false
7
+ load_in_4bit: true
8
+ strict: false
9
+
10
+ datasets:
11
+ - path: /home/yw23374/axolotl/examples/mistral/data/final_data/upsampled_train.json
12
+ ds_type: json
13
+ type: alpaca
14
+ split: train
15
+
16
+ test_datasets:
17
+ - path: /home/yw23374/axolotl/examples/mistral/data/final_data/val.json
18
+ ds_type: json
19
+ type: alpaca
20
+ split: train
21
+
22
+ load_best_model_at_end: False
23
+ early_stopping_patience:
24
+ dataset_prepared_path:
25
+ val_set_size: 0
26
+ output_dir: ./qlora-out-llama2-balance-3nd
27
+
28
+ adapter: qlora
29
+ lora_model_dir:
30
+
31
+ sequence_len: 4096
32
+ sample_packing: false
33
+ pad_to_sequence_len: false
34
+
35
+ lora_r: 32
36
+ lora_alpha: 16
37
+ lora_dropout: 0.15
38
+ lora_target_linear: true
39
+ lora_fan_in_fan_out:
40
+ lora_target_modules:
41
+ - gate_proj
42
+ - down_proj
43
+ - up_proj
44
+ - q_proj
45
+ - v_proj
46
+ - k_proj
47
+ - o_proj
48
+
49
+ wandb_project: fine-tune-sal
50
+ wandb_entity:
51
+ wandb_watch:
52
+ wandb_run_id:
53
+ wandb_log_model:
54
+
55
+ gradient_accumulation_steps: 2
56
+ micro_batch_size: 1
57
+ num_epochs: 5 # previously 3; 5 for the balanced run
58
+ optimizer: adamw_bnb_8bit
59
+ lr_scheduler: cosine
60
+ learning_rate: 0.0001
61
+
62
+ train_on_inputs: false
63
+ group_by_length: false
64
+ bf16: true
65
+ fp16: false
66
+ tf32: false
67
+
68
+ gradient_checkpointing: true
69
+ early_stopping_patience:
70
+ resume_from_checkpoint:
71
+ local_rank:
72
+ logging_steps: 1
73
+ xformers_attention:
74
+ flash_attention: true
75
+
76
+ wandb_project: fine-tune-sal
77
+ wandb_entity:
78
+ wandb_watch:
79
+ wandb_run_id:
80
+ wandb_log_model:
81
+
82
+ warmup_steps: 10
83
+ eval_steps: 0.05
84
+ eval_table_size:
85
+ eval_table_max_new_tokens: 128
86
+ save_steps:
87
+ debug:
88
+ deepspeed:
89
+ weight_decay: 0.0
90
+ fsdp:
91
+ fsdp_config:
92
+ special_tokens:
93
+ bos_token: "<s>"
94
+ eos_token: "</s>"
95
+ unk_token: "<unk>"
96
+
97
+ # tokens: # these are delimiters
98
+ # - "<|im_start|>"
99
+ # - "<|im_end|>"