#!/bin/bash
#
# Slurm batch script: runs train.py with configs/config.yaml on one node.
# Submit with: sbatch <this-script>
#
# Every #SBATCH directive must start its own line and appear before the
# first executable command; otherwise sbatch does not recognize it.

# Job name
#SBATCH --job-name=gpt2_train
# One node, one task on that node, 32 CPU cores for the task
#SBATCH --nodes=1
#SBATCH --ntasks-per-node=1
#SBATCH --cpus-per-task=32
# Wall-clock limit: 26 hours.
# NOTE(review): the original comment said "24 hours" while the value was
# 26:00:00; the value is kept unchanged -- confirm which one was intended.
#SBATCH --time=26:00:00
# Request 128GB of memory per node
#SBATCH --mem=128GB
# Request the GPU partition/queue
#SBATCH --partition=gpu
# Request one A100 GPU
#SBATCH --gres=gpu:a100:1
# Redirect stdout/stderr to a log file (%j is replaced by the job ID)
#SBATCH --output=gpt2_train.%j.log

# Abort on any failing command, unset variable, or failed pipeline stage.
set -euo pipefail

# Run the training script
python train.py --config configs/config.yaml