Skip to content
Closed
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Original file line number Diff line number Diff line change
@@ -0,0 +1,76 @@
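{
"version": "kc-mission-v1",
"name": "vllm-2614-rfc-automatic-prefix-caching",
"missionClass": "solution",
"author": "KubeStellar Bot",
"authorGithub": "kubestellar",
"mission": {
"title": "vllm: [RFC] Automatic Prefix Caching",
"description": "RFC for automatic prefix caching in vLLM: an additional level of indirection between the logical and physical blocks allows identical logical blocks to map to the same physical block. The upstream issue has 58 reactions.",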
"type": "troubleshoot",
"status": "completed",
"steps": [
{
"title": "Identify vllm troubleshoot symptoms",
"description": "Check the state of your vllm installation:\n```bash\nvllm --version\npip show vllm\n```\nLook for errors or warnings that may indicate the issue."
},
{
"title": "Review vllm configuration",
"description": "Review the relevant vllm configuration:\nThis RFC discusses our plan for implementing automatic prefix caching in vLLM."
},
{
"title": "Apply the fix for [RFC] Automatic Prefix Caching",
"description": "The goal of this diff is to allow for automatic prefix caching. This is done by adding an additional level of indirection between the logical and physical blocks which allows for identical logical blocks to map to the same physical block.\n\nThis diff replaces the existing manual prefix caching mechanism added in #1669.\n\nBefore:\n```\nLogical block table --> physical block table.\n```\n\nAfter:\n```\nLogical block table --> hash table --> physical block table.\n```\n\nHash expression from the RFC:\n```\nhash(prefix tokens, tokens in this block)\n```"
},
{
"title": "Confirm [RFC] Automatic Prefix Caching is resolved",
"description": "Verify the fix by checking that the original error no longer occurs:\nTest vllm to confirm the issue is resolved.\nConfirm that the issue symptoms are gone."
}
],
"resolution": {
"summary": "The goal of this diff is to allow for automatic prefix caching. This is done by adding an additional level of indirection between the logical and physical blocks which allows for identical logical blocks to map to the same physical block.\n\nThis diff replaces the existing manual prefix caching mechanism added in #1669.\n\nBefore:\n```\nLogical block table --> physical block table.\n```\n\nAfter:\n```\nLogical block table --> hash table --> physical block table.\n```",
"codeSnippets": [
"hash(prefix tokens, tokens in this block)",
"Logical block table --> hash table --> physical block table.",
"Logical block table --> physical block table."
]
}
},
"metadata": {
"tags": [
"vllm",
"community",
"llm-serving",
"troubleshoot"
],
"cncfProjects": [
"vllm"
],
"targetResourceKinds": [],
"difficulty": "advanced",
"issueTypes": [
"troubleshoot"
],
"maturity": "community",
"sourceUrls": {
"issue": "https://github.com/vllm-project/vllm/issues/2614",
"repo": "https://github.com/vllm-project/vllm",
"pr": "https://github.com/vllm-project/vllm/pull/2762"
},
"reactions": 58,
"comments": 17,
"synthesizedBy": "copilot"
},
"prerequisites": {
"tools": [
"vllm"
],
"description": "A working vllm installation or development environment."
},
"security": {
"scannedAt": "2026-03-11T06:43:59.534Z",
"scannerVersion": "cncf-gen-3.0.0",
"sanitized": true,
"findings": []
}
}
Loading