/ repo3-fine-tuning-template / run_training.bat
run_training.bat
1 @echo off 2 chcp 65001 >nul 3 4 REM 设置环境变量抑制TensorFlow AVX警告 5 set TF_CPP_MIN_LOG_LEVEL=2 6 set TF_ENABLE_ONEDNN_OPTS=0 7 8 echo ========================================== 9 echo Qwen3 DPO Fine-tuning 项目 10 echo ========================================== 11 12 REM 检查Python环境 13 python --version >nul 2>&1 14 if errorlevel 1 ( 15 echo 错误: 未找到Python,请先安装Python 16 pause 17 exit /b 1 18 ) 19 20 REM 检查CUDA 21 nvidia-smi >nul 2>&1 22 if errorlevel 1 ( 23 echo 警告: 未检测到NVIDIA GPU,将使用CPU训练(速度会很慢) 24 ) else ( 25 echo 检测到NVIDIA GPU: 26 nvidia-smi --query-gpu=name,memory.total --format=csv,noheader,nounits 27 ) 28 29 REM 创建必要的目录 30 echo 创建项目目录... 31 if not exist "data" mkdir data 32 if not exist "outputs" mkdir outputs 33 if not exist "logs" mkdir logs 34 35 REM 安装依赖 36 echo 安装项目依赖... 37 pip install -r requirements.txt 38 39 REM 检查依赖安装 40 echo 检查依赖安装... 41 python -c "import torch; import transformers; import trl; import datasets; import peft; print(f'PyTorch版本: {torch.__version__}'); print(f'Transformers版本: {transformers.__version__}'); print(f'TRL版本: {trl.__version__}'); print(f'Datasets版本: {datasets.__version__}'); print(f'PEFT版本: {peft.__version__}'); print(f'CUDA可用: {torch.cuda.is_available()}'); print(f'GPU数量: {torch.cuda.device_count()}' if torch.cuda.is_available() else 'GPU数量: 0')" 42 43 REM 创建示例数据 44 echo 准备训练数据... 45 python data_utils.py 46 47 REM 开始训练 48 echo 开始DPO训练... 49 echo 注意: 训练过程可能需要较长时间,请耐心等待... 50 echo 训练日志将保存到 dpo_training.log 51 echo 模型将保存到 outputs/dpo_qwen3_4b/ 52 53 python dpo_train.py 54 55 echo ========================================== 56 echo 训练完成! 57 echo ========================================== 58 echo 训练后的模型保存在: outputs/dpo_qwen3_4b/ 59 echo 训练日志保存在: dpo_training.log 60 echo. 61 echo 要测试模型,请运行: python test_model.py 62 pause