torchrun --nproc_per_node=4 /home/tosi-n/ark/gorilla/supervised-fine-tune-qlora.py \
    --model_name_or_path meta-llama/Llama-2-13b-hf \
    --bf16 True \
    --output_dir /home/tosi-n/ark/jack-alm/ \
    --model_max_length 8192 \
    --use_flash_attn True \
    --data_path /home/tosi-n/ark/data/line_item_and_alm_data_v1.json \
    --low_rank_training True \
    --num_train_epochs 3 \
    --per_device_train_batch_size 1 \
    --per_device_eval_batch_size 2 \
    --gradient_accumulation_steps 1 \
    --evaluation_strategy "no" \
    --save_strategy "steps" \
    --save_steps 200 \
    --save_total_limit 2 \
    --learning_rate 2e-5 \
    --weight_decay 0.0 \
    --warmup_steps 20 \
    --lr_scheduler_type "constant_with_warmup" \
    --logging_steps 1 \
    --deepspeed "/home/tosi-n/ark/gorilla/ds_configs/stage2.json" \
    --tf32 True
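Once training finishes, the adapter weights should end up under the `--output_dir` given above. Below is a minimal inference sketch, assuming `supervised-fine-tune-qlora.py` saves a standard PEFT LoRA adapter into that directory (the adapter layout, the example prompt, and the use of `peft`/`transformers` here are assumptions, not something confirmed by the training script itself):

```python
# Hedged sketch: load the base model and attach the LoRA adapter produced by the
# run above. Assumes the --output_dir contains a standard PEFT adapter.
import torch
from transformers import AutoModelForCausalLM, AutoTokenizer
from peft import PeftModel

base_model_id = "meta-llama/Llama-2-13b-hf"
adapter_dir = "/home/tosi-n/ark/jack-alm/"  # --output_dir from the command above

tokenizer = AutoTokenizer.from_pretrained(base_model_id)
base_model = AutoModelForCausalLM.from_pretrained(
    base_model_id,
    torch_dtype=torch.bfloat16,  # matches --bf16 True used during training
    device_map="auto",
)

# Attach the trained LoRA adapter on top of the frozen base weights.
model = PeftModel.from_pretrained(base_model, adapter_dir)
model.eval()

prompt = "### Instruction: ...\n### Response:"  # placeholder prompt; use your own format
inputs = tokenizer(prompt, return_tensors="pt").to(model.device)
with torch.no_grad():
    output = model.generate(**inputs, max_new_tokens=256)
print(tokenizer.decode(output[0], skip_special_tokens=True))
```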