From 439ca307c53b441a2efa52e5c6b94947b9400da8 Mon Sep 17 00:00:00 2001
From: John Lambert
Date: Tue, 26 Nov 2024 13:31:44 -0500
Subject: [PATCH] Update learning rate for #116

---
Reviewer notes (free text in this section is skipped when the patch is applied):
  * Touches only the train_params mapping of machine/jobs/settings.yaml.
  * warmup_steps goes from 4000 to 1000 and max_steps from 20000 to 5000.
  * lr_scheduler_type (cosine) and learning_rate (0.0002) are new keys.
  * Leading whitespace of the hunk lines below was rebuilt from the YAML
    nesting; verify it against the target file before applying.
  * NOTE(review): the context line "save_strategy: no" is an unquoted plain
    scalar. YAML 1.1 loaders resolve a bare no to boolean false; confirm the
    settings loader hands the trainer the value it expects.

 machine/jobs/settings.yaml | 6 ++++--
 1 file changed, 4 insertions(+), 2 deletions(-)

diff --git a/machine/jobs/settings.yaml b/machine/jobs/settings.yaml
index bcbe7c7..00d9517 100644
--- a/machine/jobs/settings.yaml
+++ b/machine/jobs/settings.yaml
@@ -8,15 +8,17 @@ default:
     train_params:
       do_train: true
       optim: adamw_torch
-      warmup_steps: 4000
+      warmup_steps: 1000
       per_device_train_batch_size: 16
       gradient_accumulation_steps: 4
       label_smoothing_factor: 0.2
       group_by_length: true
       gradient_checkpointing: true
+      lr_scheduler_type: cosine
+      learning_rate: 0.0002
       fp16: true
       save_strategy: no
-      max_steps: 20000
+      max_steps: 5000
     generate_params:
       device: 0
       num_beams: 2