From 71d31bb7c5a89a08d21bc7a6801213b798217e4a Mon Sep 17 00:00:00 2001 From: Guangming Sheng Date: Sat, 15 Mar 2025 11:18:24 +0000 Subject: [PATCH] add weight decay option in config --- verl/trainer/config/ppo_megatron_trainer.yaml | 2 ++ verl/trainer/config/ppo_trainer.yaml | 2 ++ 2 files changed, 4 insertions(+) diff --git a/verl/trainer/config/ppo_megatron_trainer.yaml b/verl/trainer/config/ppo_megatron_trainer.yaml index c903934b8bb..18e08298300 100644 --- a/verl/trainer/config/ppo_megatron_trainer.yaml +++ b/verl/trainer/config/ppo_megatron_trainer.yaml @@ -42,6 +42,7 @@ actor_rollout_ref: min_lr_ratio: null # only useful for warmup with cosine warmup_style: constant # select from constant/cosine total_training_steps: -1 # must be override by program + weight_decay: 0.01 megatron: tensor_model_parallel_size: 4 pipeline_model_parallel_size: 1 @@ -106,6 +107,7 @@ critic: min_lr_ratio: null # only useful for warmup with cosine warmup_style: constant # select from constant/cosine total_training_steps: -1 # must be override by program + weight_decay: 0.01 model: path: ~/models/deepseek-llm-7b-chat tokenizer_path: ${actor_rollout_ref.model.path} diff --git a/verl/trainer/config/ppo_trainer.yaml b/verl/trainer/config/ppo_trainer.yaml index eab987d3aad..226b44acb89 100644 --- a/verl/trainer/config/ppo_trainer.yaml +++ b/verl/trainer/config/ppo_trainer.yaml @@ -46,6 +46,7 @@ actor_rollout_ref: min_lr_ratio: null # only useful for warmup with cosine warmup_style: constant # select from constant/cosine total_training_steps: -1 # must be override by program + weight_decay: 0.01 fsdp_config: wrap_policy: # transformer_layer_cls_to_wrap: None @@ -109,6 +110,7 @@ critic: min_lr_ratio: null # only useful for warmup with cosine warmup_style: constant # select from constant/cosine total_training_steps: -1 # must be override by program + weight_decay: 0.01 model: path: ~/models/deepseek-llm-7b-chat tokenizer_path: ${actor_rollout_ref.model.path}