Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1,042 changes: 1,042 additions & 0 deletions collector/vllm/collect_mla_module_v2.py

Large diffs are not rendered by default.

File renamed without changes.
576 changes: 576 additions & 0 deletions collector/vllm/collect_moe_v2.py

Large diffs are not rendered by default.

33 changes: 25 additions & 8 deletions collector/vllm/registry.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,11 +4,13 @@
"""
Declarative registry mapping ops to collector modules for vLLM.

No version forks exist yet. When vLLM API changes require a fork,
add a ``versions`` tuple following the trtllm registry pattern.
For versioned entries, ``versions`` is a tuple of :class:`VersionRoute` in
**descending** order. The resolver picks the first route whose min_version
is <= the runtime version. To add support for a new vLLM version:
add a new VersionRoute at the top of the versions tuple.
"""

from collector.registry_types import OpEntry
from collector.registry_types import OpEntry, VersionRoute

REGISTRY: list[OpEntry] = [
OpEntry(
Expand All @@ -31,9 +33,12 @@
),
OpEntry(
op="moe",
module="collector.vllm.collect_moe",
get_func="get_moe_test_cases",
run_func="run_moe_torch",
versions=(
VersionRoute("0.17.0", "collector.vllm.collect_moe_v2"),
VersionRoute("0.0.0", "collector.vllm.collect_moe_v1"),
),
),
OpEntry(
op="mla_context",
Expand All @@ -49,27 +54,39 @@
),
OpEntry(
op="mla_context_module",
module="collector.vllm.collect_mla_module",
get_func="get_mla_context_module_test_cases",
run_func="run_mla_module_worker",
versions=(
VersionRoute("0.17.0", "collector.vllm.collect_mla_module_v2"),
VersionRoute("0.0.0", "collector.vllm.collect_mla_module_v1"),
),
),
OpEntry(
op="mla_generation_module",
module="collector.vllm.collect_mla_module",
get_func="get_mla_generation_module_test_cases",
run_func="run_mla_module_worker",
versions=(
VersionRoute("0.17.0", "collector.vllm.collect_mla_module_v2"),
VersionRoute("0.0.0", "collector.vllm.collect_mla_module_v1"),
),
),
OpEntry(
op="dsa_context_module",
module="collector.vllm.collect_mla_module",
get_func="get_dsa_context_module_test_cases",
run_func="run_mla_module_worker",
versions=(
VersionRoute("0.17.0", "collector.vllm.collect_mla_module_v2"),
VersionRoute("0.0.0", "collector.vllm.collect_mla_module_v1"),
),
),
OpEntry(
op="dsa_generation_module",
module="collector.vllm.collect_mla_module",
get_func="get_dsa_generation_module_test_cases",
run_func="run_mla_module_worker",
versions=(
VersionRoute("0.17.0", "collector.vllm.collect_mla_module_v2"),
VersionRoute("0.0.0", "collector.vllm.collect_mla_module_v1"),
),
),
OpEntry(
op="gdn",
Expand Down
Git LFS file not shown
Git LFS file not shown
Git LFS file not shown
Git LFS file not shown
Git LFS file not shown
Git LFS file not shown
Git LFS file not shown
Loading