File tree Expand file tree Collapse file tree 4 files changed +14
-14
lines changed
scheduling/framework/plugins/multi/prefix Expand file tree Collapse file tree 4 files changed +14
-14
lines changed Original file line number Diff line number Diff line change @@ -152,7 +152,7 @@ data:
152152 plugins:
153153 - type: queue-scorer
154154 - type: kv-cache-scorer
155- - type: prefix-cache
155+ - type: prefix-cache-scorer
156156 parameters:
157157 hashBlockSize: 64
158158 maxPrefixBlocksToMatch: 256
@@ -168,7 +168,7 @@ data:
168168 weight: 1
169169 - pluginRef: kv-cache-scorer
170170 weight: 1
171- - pluginRef: prefix-cache
171+ - pluginRef: prefix-cache-scorer
172172 weight: 1
173173 - pluginRef: max-score-picker
174174 ---
Original file line number Diff line number Diff line change @@ -657,8 +657,8 @@ plugins:
657657 type: low-queue-filter
658658 parameters:
659659 threshold: 10
660- - name: prefixCache
661- type: prefix-cache
660+ - name: prefixCacheScorer
661+ type: prefix-cache-scorer
662662 parameters:
663663 hashBlockSize: 32
664664- name: maxScorePicker
@@ -669,7 +669,7 @@ schedulingProfiles:
669669- name: default
670670 plugins:
671671 - pluginRef: lowQueueFilter
672- - pluginRef: prefixCache
672+ - pluginRef: prefixCacheScorer
673673 weight: 50
674674 - pluginRef: maxScorePicker
675675`
@@ -683,14 +683,14 @@ kind: EndpointPickerConfig
683683plugins:
684684- name:profileHandler
685685 type: single-profile
686- - name: prefixCache
687- type: prefix-cache
686+ - name: prefixCacheScorer
687+ type: prefix-cache-scorer
688688 parameters:
689689 hashBlockSize: asdf
690690schedulingProfiles:
691691- name: default
692692 plugins:
693- - pluginRef: prefixCache
693+ - pluginRef: prefixCacheScorer
694694 weight: 50
695695`
696696
@@ -703,14 +703,14 @@ kind: EndpointPickerConfig
703703plugins:
704704- name: profileHandler
705705 type: single-profile
706- - name: prefixCache
707- type: prefix-cache
706+ - name: prefixCacheScorer
707+ type: prefix-cache-scorer
708708 parameters:
709709 hashBlockSize: 32
710710schedulingProfiles:
711711- name: default
712712 plugins:
713- - pluginRef: prefixCache
713+ - pluginRef: prefixCacheScorer
714714`
715715
716716// multiple pickers in scheduling profile
Original file line number Diff line number Diff line change @@ -52,7 +52,7 @@ const (
5252 // in vLLM, we will have 250K / 16 = 31.25K blocks.
5353 DefaultLRUCapacityPerServer = 31250
5454
55- PrefixCachePluginType = "prefix-cache"
55+ PrefixCachePluginType = "prefix-cache-scorer"
5656)
5757
5858type Config struct {
Original file line number Diff line number Diff line change @@ -154,7 +154,7 @@ data:
154154 plugins:
155155 - type: queue-scorer
156156 - type: kv-cache-scorer
157- - type: prefix-cache
157+ - type: prefix-cache-scorer
158158 parameters:
159159 hashBlockSize: 64
160160 maxPrefixBlocksToMatch: 256
@@ -170,7 +170,7 @@ data:
170170 weight: 1
171171 - pluginRef: kv-cache-scorer
172172 weight: 1
173- - pluginRef: prefix-cache
173+ - pluginRef: prefix-cache-scorer
174174 weight: 1
175175 - pluginRef: max-score-picker
176176 ---
You can’t perform that action at this time.
0 commit comments