Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 1 addition & 1 deletion dockerfiles/Dockerfile.nemo-rl
Original file line number Diff line number Diff line change
Expand Up @@ -49,7 +49,7 @@ ENV NEMO_RL_VENV_DIR=/opt/ray_venvs
# Stage "hermetic": starts from `base` and adds a NeMo-RL source checkout
# at /opt/NeMo-RL, pinned to a specific commit.
FROM base AS hermetic

# NeMo-RL revision to check out. Override at build time with
#   --build-arg NEMO_RL_COMMIT=<sha>
# When the build arg is unset or empty, the pinned default below is used.
#
# Keep exactly ONE `ENV NEMO_RL_COMMIT=${NEMO_RL_COMMIT:-...}` line here: an ENV
# value overrides an ARG of the same name, so a second such line would expand
# against the value the first one already set and its default would never apply.
ARG NEMO_RL_COMMIT
ENV NEMO_RL_COMMIT=${NEMO_RL_COMMIT:-85eeb8d059b0249cace427dd5dec9573107be224}

# Clone, check out the pinned commit, and fetch submodules in a single layer.
# `git -C <dir>` is used instead of `cd <dir> && ...` so the commands do not
# depend on the shell's working directory.
RUN git clone https://github.com/NVIDIA-NeMo/RL.git /opt/NeMo-RL \
    && git -C /opt/NeMo-RL checkout "${NEMO_RL_COMMIT}" \
    && git -C /opt/NeMo-RL submodule update --init --recursive

Expand Down
1 change: 1 addition & 0 deletions nemo_skills/training/nemo_rl/configs/grpo.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -43,6 +43,7 @@ policy:
model_name: ???
tokenizer:
name: ${policy.model_name} ## specify if you'd like to use a tokenizer different from the model's default
chat_template_kwargs: null # can be used to pass kwargs to the chat template, e.g., enable_thinking=true
train_global_batch_size: 512
train_micro_batch_size: 4
generation_batch_size: 32 # Only used when generating using HF backend
Expand Down
1 change: 1 addition & 0 deletions nemo_skills/training/nemo_rl/configs/sft.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -28,6 +28,7 @@ policy:
tokenizer:
name: ${policy.model_name} ## specify if you'd like to use a tokenizer different from the model's default
chat_template: "infer_from_data" ## Can be: null (passthrough), "default" (tokenizer's default), "infer_from_data" (auto-detect from data), or custom jinja2 template
chat_template_kwargs: null # can be used to pass kwargs to the chat template, e.g., enable_thinking=true
train_global_batch_size: 32
train_micro_batch_size: 1
max_total_sequence_length: 4096
Expand Down