AdGPT / lauguage_model_fine_tuning /launch_supervised_fine_tune_teacher.sh
goodmodeler's picture
ADD: LLM SFT, RLHF and Distillation
c1c9e88
#!/bin/bash
# launch_training.sh - launch the QLoRA fine-tuning run.
#
# Usage: run from the directory that contains qlora_finetune.py; all paths
# below (./results, ./logs, the Python entry point) are relative to the
# current working directory.
#
# The training runs in the foreground. Its combined stdout/stderr is shown on
# the terminal and mirrored to a timestamped log file under ./logs.
#
# Exit status: the exit status of the training process, or 1 if the output
# directories cannot be created.

echo " Preparing QLoRA Fine-tuning Environment..."

# Check the GPU. This is informational only, so a missing or failing
# nvidia-smi is reported but does not stop the run.
echo " GPU Information:"
nvidia-smi --query-gpu=name,memory.total,memory.free --format=csv \
  || echo "warning: nvidia-smi failed; continuing without a GPU summary" >&2

# Set environment variables for the training process.
export CUDA_VISIBLE_DEVICES=0
export TOKENIZERS_PARALLELISM=false
export WANDB_PROJECT="qlora-ad-copy-generation" # Optional

# Create the output directories. ./logs is required by the tee below;
# ./results is presumably written by qlora_finetune.py (verify against it).
mkdir -p ./results ./logs || {
  echo "error: cannot create ./results or ./logs" >&2
  exit 1
}

# Start training (multi-GPU is supported via the commented command below).
echo " Starting QLoRA training..."

# Compute the log path once so it can be reported after the run.
log_file="./logs/training_$(date +%Y%m%d_%H%M%S).log"

# Single-GPU training.
python qlora_finetune.py 2>&1 | tee "$log_file"
# A pipeline's status is that of its last command (tee), which would hide a
# failed training run; read the status of the python stage explicitly.
train_status=${PIPESTATUS[0]}

# Multi-GPU training:
# accelerate launch --multi_gpu --num_processes=2 qlora_finetune.py

if (( train_status != 0 )); then
  echo "error: training exited with status ${train_status}; see ${log_file}" >&2
  exit "$train_status"
fi

echo " Training finished. Log saved to ${log_file}"