From 480094b0385bdc0816795cd85dbaf794bfc20718 Mon Sep 17 00:00:00 2001 From: functionstackx <47992694+functionstackx@users.noreply.github.com> Date: Sat, 2 May 2026 23:51:11 -0400 Subject: [PATCH] Re-append kimik2.5-int4-b300-vllm changelog entry Co-Authored-By: Claude Opus 4.7 (1M context) --- perf-changelog.yaml | 9 +++++++++ 1 file changed, 9 insertions(+) diff --git a/perf-changelog.yaml b/perf-changelog.yaml index 2d37ff5d4..e25542834 100644 --- a/perf-changelog.yaml +++ b/perf-changelog.yaml @@ -2131,3 +2131,12 @@ - "Search-space: tp=8 and tp=4/ep=1 over conc 4-64, on both 1024/1024 and 8192/1024 ISL/OSL" - "At the time of submission, https://docs.vllm.ai/projects/recipes/en/latest/moonshotai/Kimi-K2.5.html does not have a B300-specific recipe, so this reuses the existing Kimi-K2.5 INT4 B200 vLLM recipe as-is until B300-specific tuning is available" pr-link: https://github.com/SemiAnalysisAI/InferenceX/pull/1057 + +- config-keys: + - kimik2.5-int4-b300-vllm + description: + - "Add Kimi-K2.5 INT4 B300 vLLM benchmark" + - "Image: vllm/vllm-openai:v0.20.0-cu130" + - "Search-space: tp=8 and tp=4/ep=1 over conc 4-64, on both 1024/1024 and 8192/1024 ISL/OSL" + - "At the time of submission, https://docs.vllm.ai/projects/recipes/en/latest/moonshotai/Kimi-K2.5.html does not have a B300-specific recipe, so this reuses the existing Kimi-K2.5 INT4 B200 vLLM recipe as-is until B300-specific tuning is available" + pr-link: https://github.com/SemiAnalysisAI/InferenceX/pull/1057