#!/bin/bash
#
# Slurm batch script that runs sft_lora_finetuner.py on a single GPU.
#
# Usage: sbatch <this-script>
#   - The logs/ directory must already exist when the job is submitted;
#     Slurm does not create missing directories for --output / --error.
#   - sft_lora_finetuner.py is referenced by a relative path, so it is
#     resolved against the job's working directory.
#
# Exit status: that of sft_lora_finetuner.py, or 1 if the conda environment
# could not be set up, so Slurm records a failed run as FAILED.

# Descriptive job name
#SBATCH --job-name=qwen-lora-finetune
# GPU partition (or a100_normal_q, depending on GPU availability)
#SBATCH --partition=h200_normal_q
# Your ARC account
#SBATCH --account=ece_6514
# stdout / stderr files; %j expands to the job ID
#SBATCH --output=logs/qwen_lora_%j.out
#SBATCH --error=logs/qwen_lora_%j.err
# Wall-time limit: 1 hour (H:MM:SS)
#SBATCH --time=1:00:00
# Request 1 GPU
#SBATCH --gres=gpu:1
#SBATCH --mem=16G
# One task (the single python process started below) with two CPU cores
# available to it for the dataloader
#SBATCH --ntasks=1
#SBATCH --cpus-per-task=2

# Start from a clean module environment, then load the required modules.
module purge
module --ignore_cache load Miniconda3/24.7.1-0
module --ignore_cache load PyTorch/2.1.2-foss-2023a

# Batch shells are non-interactive, so the `conda` shell function has to be
# defined explicitly before `conda activate` can be used.
if ! source /cm/local/apps/Miniconda3/24.7.1-0/etc/profile.d/conda.sh; then
  echo "ERROR: could not source conda.sh" >&2
  exit 1
fi
if ! conda activate cvenv; then
  echo "ERROR: could not activate conda environment 'cvenv'" >&2
  exit 1
fi

# Safety: unset PYTHONPATH to avoid HPC NumPy conflicts
unset PYTHONPATH

# Start the fine-tuning process
echo "🚀 Starting fine-tuning job..."
python sft_lora_finetuner.py
status=$?

# Propagate a training failure instead of unconditionally reporting success.
if (( status != 0 )); then
  echo "ERROR: fine-tuning failed with exit code ${status}." >&2
  exit "${status}"
fi
echo "✅ Fine-tuning completed."