diff --git a/rllm/trainer/verl/ray_runtime_env.py b/rllm/trainer/verl/ray_runtime_env.py index f89058e13..d22e803bd 100644 --- a/rllm/trainer/verl/ray_runtime_env.py +++ b/rllm/trainer/verl/ray_runtime_env.py @@ -7,7 +7,9 @@ "VLLM_LOGGING_LEVEL": "WARN", "VLLM_ALLOW_RUNTIME_LORA_UPDATING": "true", "CUDA_DEVICE_MAX_CONNECTIONS": "1", - "VLLM_USE_V1": "1", + # TODO: re-enable the compile cache once the upstream cache corruption issue is fixed: + # https://github.com/vllm-project/vllm/issues/31199 + "VLLM_DISABLE_COMPILE_CACHE": "1", # To prevent hanging or crash during synchronization of weights between actor and rollout # in disaggregated mode. See: # https://docs.vllm.ai/en/latest/usage/troubleshooting.html?h=nccl_cumem_enable#known-issues