From dae929ac3f187b48fd3c9b29cf1e0442708a30c9 Mon Sep 17 00:00:00 2001 From: Zitian Gao Date: Thu, 29 May 2025 19:21:15 +0800 Subject: update params --- README.md | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/README.md b/README.md index 5fde44e..d7a9978 100644 --- a/README.md +++ b/README.md @@ -19,7 +19,7 @@ accelerate launch train.py \ --model_path /path/to/Qwen2.5-Math-7B \ --train_data dataset/1shot_rlvr/pi1_r1280.parquet \ --effective_batch 64 \ - --micro_batch_size auto \ + --micro_batch_size 2 \ --temperature 0.5 \ --learning_rate 2e-5 \ --max_steps 50 \ @@ -39,7 +39,7 @@ accelerate launch train.py \ --model_path /path/to/Qwen2.5-Math-7B \ --train_data dataset/numina/numina_00.parquet \ --effective_batch 64 \ - --micro_batch_size auto \ + --micro_batch_size 2 \ --temperature 0.5 \ --learning_rate 2e-5 \ --max_steps 50 \ -- cgit v1.2.3