Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
25 commits
Select commit Hold shift + click to select a range
f97afaf
Remove Bagel yaml and update examples
princepride Apr 20, 2026
cc4667c
fix some bug
princepride Apr 20, 2026
f79f2c1
fix some bug
princepride Apr 20, 2026
2f652a3
Address review findings: think pipeline, mooncake bindings, XPU overr…
princepride Apr 20, 2026
01ebc5d
fix some bug
princepride Apr 20, 2026
e3aa65e
fix: restore KV transfer fields lost during PipelineConfig→StageConfi…
princepride Apr 21, 2026
2898670
Merge branch 'main' into remove-bagel-yaml
princepride Apr 21, 2026
8a50ca2
Merge branch 'main' into remove-bagel-yaml
princepride Apr 21, 2026
d3ef6af
Add bagel_single_stage pipeline to registry
princepride Apr 21, 2026
5629b7c
change --stage-configs-path to --deploy-config
princepride Apr 22, 2026
3a296dd
Merge branch 'main' into remove-bagel-yaml
lishunyang12 Apr 22, 2026
978de4c
Merge branch 'main' into remove-bagel-yaml
princepride Apr 22, 2026
b350c82
Merge branch 'main' into remove-bagel-yaml
princepride Apr 22, 2026
d4bd9cd
fix some bug
princepride Apr 22, 2026
ed271e1
fix some bug
princepride Apr 22, 2026
463fe2c
change to use from_cli_args
princepride Apr 22, 2026
1a3f831
Merge branch 'main' into remove-bagel-yaml
princepride Apr 22, 2026
349ec52
fix doc bug
princepride Apr 22, 2026
d2664f9
Merge branch 'main' into remove-bagel-yaml
princepride Apr 22, 2026
4c73dcc
Merge branch 'main' into remove-bagel-yaml
princepride Apr 23, 2026
6951940
remove --stage-configs-path
princepride Apr 23, 2026
9b951b3
Merge branch 'main' into remove-bagel-yaml
princepride Apr 23, 2026
ae23e14
Merge branch 'main' into remove-bagel-yaml
lishunyang12 Apr 23, 2026
f757c79
Merge branch 'main' into remove-bagel-yaml
princepride Apr 24, 2026
30258ac
Merge branch 'main' into remove-bagel-yaml
princepride Apr 24, 2026
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
347 changes: 185 additions & 162 deletions docs/user_guide/examples/offline_inference/bagel.md

Large diffs are not rendered by default.

300 changes: 125 additions & 175 deletions docs/user_guide/examples/online_serving/bagel.md

Large diffs are not rendered by default.

345 changes: 184 additions & 161 deletions examples/offline_inference/bagel/README.md

Large diffs are not rendered by default.

29 changes: 17 additions & 12 deletions examples/offline_inference/bagel/end2end.py
Original file line number Diff line number Diff line change
Expand Up @@ -53,7 +53,12 @@ def parse_args():
parser.add_argument("--shm-threshold-bytes", type=int, default=65536)
parser.add_argument("--worker-backend", type=str, default="process", choices=["process", "ray"])
parser.add_argument("--ray-address", type=str, default=None)
parser.add_argument("--stage-configs-path", type=str, default=None)
parser.add_argument(
"--deploy-config",
type=str,
default=None,
help="Path to deploy YAML. If unset, auto-loads vllm_omni/deploy/bagel.yaml based on the HF model_type.",
)
parser.add_argument("--steps", type=int, default=50, help="Number of inference steps.")

parser.add_argument("--cfg-text-scale", type=float, default=4.0, help="Text CFG scale (default: 4.0)")
Expand Down Expand Up @@ -149,14 +154,12 @@ def main():
from vllm_omni.entrypoints.omni import Omni

omni_kwargs = {}
stage_configs_path = args.stage_configs_path
is_single_stage = stage_configs_path and "single_stage" in stage_configs_path
if args.think and stage_configs_path is None:
stage_configs_path = "vllm_omni/model_executor/stage_configs/bagel_think.yaml"
print(f"[Info] Think mode enabled, using stage config: {stage_configs_path}")
if stage_configs_path:
omni_kwargs["stage_configs_path"] = stage_configs_path
is_single_stage = "single_stage" in stage_configs_path
deploy_config = args.deploy_config
if args.think and deploy_config is None:
deploy_config = "vllm_omni/deploy/bagel_think.yaml"
print(f"[Info] Think mode enabled, using deploy config: {deploy_config}")
if deploy_config:
omni_kwargs["deploy_config"] = deploy_config

omni_kwargs.update(
{
Expand All @@ -173,7 +176,7 @@ def main():
if args.quantization:
omni_kwargs["quantization_config"] = args.quantization

omni = Omni(model=model_name, **omni_kwargs)
omni = Omni.from_cli_args(args, model=model_name, **omni_kwargs)

formatted_prompts = []
for p in prompts:
Expand Down Expand Up @@ -218,9 +221,11 @@ def main():
formatted_prompts.append(prompt_dict)

params_list = omni.default_sampling_params_list
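# Bagel exposes one sampling-param set per stage: 1 for single-stage
# (DiT-only) and 2 for two-stage (Thinker + DiT), so the list length is
# used to tell the two pipelines apart. This heuristic needs updating if
# a future pipeline no longer has exactly one sampling-param set per stage.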
is_single_stage = len(params_list) == 1
Comment thread
princepride marked this conversation as resolved.

# For single-stage DiT, think/text params go into the diffusion sampling params extra_args.
# For 2-stage, diffusion params are at index 1.
diffusion_params_idx = 0 if is_single_stage else (1 if len(params_list) > 1 else 0)
diffusion_params = params_list[diffusion_params_idx]

Expand Down
Loading
Loading