Set gradient_accumulation_steps to 1 (was 16) in the Qwen2 7B full single-device config.
NOTE(review): the hunk header shows `optimizer_in_bwd: True` just above this hunk; presumably the change aligns with that setting -- confirm against the recipe.

diff --git a/recipes/configs/qwen2/7B_full_single_device.yaml b/recipes/configs/qwen2/7B_full_single_device.yaml
index 8b0afb08cc..560dd5fc9f 100644
--- a/recipes/configs/qwen2/7B_full_single_device.yaml
+++ b/recipes/configs/qwen2/7B_full_single_device.yaml
@@ -60,7 +60,7 @@ optimizer_in_bwd: True
 loss:
   _component_: torchtune.modules.loss.CEWithChunkedOutputLoss
 max_steps_per_epoch: null
-gradient_accumulation_steps: 16
+gradient_accumulation_steps: 1
 compile: False
 
 # Training environment