diff --git a/examples/llm_finetune/qwen/qwen3_moe_30b_lora.yaml b/examples/llm_finetune/qwen/qwen3_moe_30b_lora.yaml index 69eb5497ec..4d701eef03 100644 --- a/examples/llm_finetune/qwen/qwen3_moe_30b_lora.yaml +++ b/examples/llm_finetune/qwen/qwen3_moe_30b_lora.yaml @@ -15,7 +15,7 @@ recipe: TrainFinetuneRecipeForNextTokenPrediction step_scheduler: global_batch_size: 1024 - local_batch_size: 128 + local_batch_size: 64 ckpt_every_steps: 100 val_every_steps: 50 num_epochs: 2