diff --git a/python/sglang/multimodal_gen/runtime/pipelines_core/schedule_batch.py b/python/sglang/multimodal_gen/runtime/pipelines_core/schedule_batch.py index 6da1a9b097d1..9118770a5893 100644 --- a/python/sglang/multimodal_gen/runtime/pipelines_core/schedule_batch.py +++ b/python/sglang/multimodal_gen/runtime/pipelines_core/schedule_batch.py @@ -21,10 +21,6 @@ import torch from sglang.multimodal_gen.configs.sample.sampling_params import SamplingParams -from sglang.multimodal_gen.configs.sample.teacache import ( - TeaCacheParams, - WanTeaCacheParams, -) from sglang.multimodal_gen.runtime.server_args import ( ServerArgs, _sanitize_for_logging, @@ -143,9 +139,6 @@ class Req: is_warmup: bool = False - # TeaCache parameters - teacache_params: TeaCacheParams | WanTeaCacheParams | None = None - # STA parameters STA_param: list | None = None is_cfg_negative: bool = False diff --git a/python/sglang/multimodal_gen/test/server/perf_baselines.json b/python/sglang/multimodal_gen/test/server/perf_baselines.json index 757652442f9d..335d121bad03 100644 --- a/python/sglang/multimodal_gen/test/server/perf_baselines.json +++ b/python/sglang/multimodal_gen/test/server/perf_baselines.json @@ -807,69 +807,69 @@ }, "wan2_1_t2v_1.3b_teacache_enabled": { "stages_ms": { + "DenoisingStage": 4598.36, "InputValidationStage": 0.07, - "TextEncodingStage": 2237.78, - "TimestepPreparationStage": 2.1, - "LatentPreparationStage": 0.84, - "DenoisingStage": 13041.23, - "DecodingStage": 1274.63, - "per_frame_generation": null + "DecodingStage": 552.92, + "LatentPreparationStage": 0.26, + "per_frame_generation": null, + "TextEncodingStage": 1114.01, + "TimestepPreparationStage": 2.1 }, "denoise_step_ms": { - "0": 240.71, - "1": 248.13, - "2": 246.48, - "3": 247.87, - "4": 249.38, - "5": 246.76, - "6": 250.42, - "7": 250.81, - "8": 250.98, - "9": 249.9, - "10": 246.72, - "11": 249.79, - "12": 250.46, - "13": 249.19, - "14": 247.55, - "15": 250.12, - "16": 247.57, - "17": 247.21, - "18": 247.32, - "19": 247.42, - "20": 248.21, - "21": 247.19, - "22": 247.72, - "23": 247.45, - "24": 247.9, - "25": 247.87, - "26": 247.18, - "27": 247.65, - "28": 246.91, - "29": 248.26, - "30": 247.82, - "31": 247.73, - "32": 247.38, - "33": 247.84, - "34": 247.46, - "35": 247.52, - "36": 247.94, - "37": 248.76, - "38": 248.01, - "39": 247.45, - "40": 247.84, - "41": 248.33, - "42": 247.41, - "43": 248.16, - "44": 248.18, - "45": 248.44, - "46": 248.65, - "47": 247.73, - "48": 247.48, - "49": 247.54 - }, - "expected_e2e_ms": 18382.19, - "expected_avg_denoise_ms": 260.76, - "expected_median_denoise_ms": 247.84 + "0": 94.24, + "1": 172.68, + "2": 169.48, + "3": 169.08, + "4": 168.38, + "5": 167.27, + "6": 62.95, + "7": 119.56, + "8": 53.34, + "9": 121.85, + "10": 47.64, + "11": 125.75, + "12": 3.24, + "13": 48.21, + "14": 125.17, + "15": 3.71, + "16": 48.15, + "17": 124.61, + "18": 3.3, + "19": 47.25, + "20": 129.33, + "21": 3.11, + "22": 48.03, + "23": 127.46, + "24": 3.37, + "25": 45.6, + "26": 127.17, + "27": 3.35, + "28": 49.83, + "29": 125.42, + "30": 3.19, + "31": 42.76, + "32": 131.19, + "33": 2.93, + "34": 130.04, + "35": 44.77, + "36": 131.45, + "37": 44.06, + "38": 131.02, + "39": 43.48, + "40": 130.42, + "41": 45.24, + "42": 129.46, + "43": 44.6, + "44": 130.33, + "45": 173.84, + "46": 175.58, + "47": 168.16, + "48": 173.85, + "49": 177.56 + }, + "expected_e2e_ms": 6497.84, + "expected_avg_denoise_ms": 91.85, + "expected_median_denoise_ms": 120.7 }, "wan2_1_t2v_1.3b": { "stages_ms": {