/ repo3-fine-tuning-template / run_training.bat
run_training.bat
 1  @echo off
 2  chcp 65001 >nul
 3  
 4  REM 设置环境变量抑制TensorFlow AVX警告
 5  set TF_CPP_MIN_LOG_LEVEL=2
 6  set TF_ENABLE_ONEDNN_OPTS=0
 7  
 8  echo ==========================================
 9  echo Qwen3 DPO Fine-tuning 项目
10  echo ==========================================
11  
12  REM 检查Python环境
13  python --version >nul 2>&1
14  if errorlevel 1 (
15      echo 错误: 未找到Python,请先安装Python
16      pause
17      exit /b 1
18  )
19  
20  REM 检查CUDA
21  nvidia-smi >nul 2>&1
22  if errorlevel 1 (
23      echo 警告: 未检测到NVIDIA GPU,将使用CPU训练(速度会很慢)
24  ) else (
25      echo 检测到NVIDIA GPU:
26      nvidia-smi --query-gpu=name,memory.total --format=csv,noheader,nounits
27  )
28  
29  REM 创建必要的目录
30  echo 创建项目目录...
31  if not exist "data" mkdir data
32  if not exist "outputs" mkdir outputs
33  if not exist "logs" mkdir logs
34  
35  REM 安装依赖
36  echo 安装项目依赖...
37  pip install -r requirements.txt
38  
39  REM 检查依赖安装
40  echo 检查依赖安装...
41  python -c "import torch; import transformers; import trl; import datasets; import peft; print(f'PyTorch版本: {torch.__version__}'); print(f'Transformers版本: {transformers.__version__}'); print(f'TRL版本: {trl.__version__}'); print(f'Datasets版本: {datasets.__version__}'); print(f'PEFT版本: {peft.__version__}'); print(f'CUDA可用: {torch.cuda.is_available()}'); print(f'GPU数量: {torch.cuda.device_count()}' if torch.cuda.is_available() else 'GPU数量: 0')"
42  
43  REM 创建示例数据
44  echo 准备训练数据...
45  python data_utils.py
46  
47  REM 开始训练
48  echo 开始DPO训练...
49  echo 注意: 训练过程可能需要较长时间,请耐心等待...
50  echo 训练日志将保存到 dpo_training.log
51  echo 模型将保存到 outputs/dpo_qwen3_4b/
52  
53  python dpo_train.py
54  
55  echo ==========================================
56  echo 训练完成!
57  echo ==========================================
58  echo 训练后的模型保存在: outputs/dpo_qwen3_4b/
59  echo 训练日志保存在: dpo_training.log
60  echo.
61  echo 要测试模型,请运行: python test_model.py
62  pause