# Patch summary: modifies tests/functional/grpo.sh (one hunk, declared as old lines 38-42 -> new lines 38-42).
# The only changed line is the expression passed to tests/check_metrics.py:
#   before: 'max(data["train/gen_kl_error"]) < 1.05'
#   after:  'max(data["train/gen_kl_error"]) < 0.001'
# i.e. the upper bound asserted on the maximum "train/gen_kl_error" value is tightened from 1.05 to 0.001.
# NOTE(review): the line breaks of this patch appear to have been collapsed into a single line, and the hunk
# header declares 5 lines per side while only 4 are visible here -- presumably a blank context line was lost;
# confirm against the original patch before applying.
# NOTE(review): the text after the second "@@" ("uv run coverage run ... --source=$PROJE") looks like the
# hunk's truncated section heading rather than a context line -- confirm.
diff --git a/tests/functional/grpo.sh b/tests/functional/grpo.sh index d19bf05e61..1504c95c83 100755 --- a/tests/functional/grpo.sh +++ b/tests/functional/grpo.sh @@ -38,5 +38,5 @@ uv run coverage run -a --data-file=$PROJECT_ROOT/tests/.coverage --source=$PROJE uv run tests/json_dump_tb_logs.py $LOG_DIR --output_path $JSON_METRICS uv run tests/check_metrics.py $JSON_METRICS \ - 'max(data["train/gen_kl_error"]) < 1.05' + 'max(data["train/gen_kl_error"]) < 0.001'