From cec80f26448d4a26d01e8ecc414ac915bc416c8c Mon Sep 17 00:00:00 2001 From: Didan Deng <33117903+wtomin@users.noreply.github.com> Date: Thu, 9 Apr 2026 14:50:05 +0800 Subject: [PATCH] flux2.dev cpu offload Signed-off-by: Didan Deng <33117903+wtomin@users.noreply.github.com> --- .../online_serving/test_flux_2_dev_expansion.py | 16 ++++++---------- 1 file changed, 6 insertions(+), 10 deletions(-) diff --git a/tests/e2e/online_serving/test_flux_2_dev_expansion.py b/tests/e2e/online_serving/test_flux_2_dev_expansion.py index eba0fbda225..00480f71b82 100644 --- a/tests/e2e/online_serving/test_flux_2_dev_expansion.py +++ b/tests/e2e/online_serving/test_flux_2_dev_expansion.py @@ -2,13 +2,11 @@ End-to-end diffusion coverage for FLUX.2-dev in online serving mode. Coverage: -- Cache-DiT cache acceleration backend - CPU offload -This test verifies that FLUX.2-dev can be launched with the Cache-DiT backend -and CPU offload enabled, accepts text-to-image requests through the -OpenAI-compatible API, and returns valid generated images with the requested -resolution. +This test verifies that FLUX.2-dev can be launched with CPU offload enabled, +accepts text-to-image requests through the OpenAI-compatible API, and returns +valid generated images with the requested resolution. assert_diffusion_response validates successful generation and the expected image resolution. @@ -32,19 +30,17 @@ def _get_flux_2_dev_feature_cases(model: str): - """Return FLUX.2-dev diffusion feature cases for Cache-DiT + CPU offload.""" + """Return FLUX.2-dev diffusion feature cases for CPU offload.""" return [ pytest.param( OmniServerParams( model=model, server_args=[ - "--cache-backend", - "cache_dit", "--enable-cpu-offload", ], ), - id="cache_dit_cpu_offload", + id="cpu_offload", marks=SINGLE_CARD_FEATURE_MARKS, ), ] @@ -61,7 +57,7 @@ def test_flux_2_dev( omni_server: OmniServer, openai_client: OpenAIClientHandler, ): - """Validate FLUX.2-dev online serving with Cache-DiT and CPU offload.""" + """Validate FLUX.2-dev online serving with CPU offload.""" messages = dummy_messages_from_mix_data(content_text=PROMPT)