Skip to content

Commit b54a49c

Browse files
committed
renamed prefix-cache to prefix-cache-scorer
Signed-off-by: Nir Rozenbaum <[email protected]>
1 parent f0f6212 commit b54a49c

File tree

4 files changed: 14 additions and 14 deletions.

config/manifests/inferencepool-resources.yaml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -152,7 +152,7 @@ data:
152152
plugins:
153153
- type: queue-scorer
154154
- type: kv-cache-scorer
155-
- type: prefix-cache
155+
- type: prefix-cache-scorer
156156
parameters:
157157
hashBlockSize: 64
158158
maxPrefixBlocksToMatch: 256
@@ -168,7 +168,7 @@ data:
168168
weight: 1
169169
- pluginRef: kv-cache-scorer
170170
weight: 1
171-
- pluginRef: prefix-cache
171+
- pluginRef: prefix-cache-scorer
172172
weight: 1
173173
- pluginRef: max-score-picker
174174
---

pkg/epp/common/config/loader/configloader_test.go

Lines changed: 9 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -657,8 +657,8 @@ plugins:
657657
type: low-queue-filter
658658
parameters:
659659
threshold: 10
660-
- name: prefixCache
661-
type: prefix-cache
660+
- name: prefixCacheScorer
661+
type: prefix-cache-scorer
662662
parameters:
663663
hashBlockSize: 32
664664
- name: maxScorePicker
@@ -669,7 +669,7 @@ schedulingProfiles:
669669
- name: default
670670
plugins:
671671
- pluginRef: lowQueueFilter
672-
- pluginRef: prefixCache
672+
- pluginRef: prefixCacheScorer
673673
weight: 50
674674
- pluginRef: maxScorePicker
675675
`
@@ -683,14 +683,14 @@ kind: EndpointPickerConfig
683683
plugins:
684684
- name:profileHandler
685685
type: single-profile
686-
- name: prefixCache
687-
type: prefix-cache
686+
- name: prefixCacheScorer
687+
type: prefix-cache-scorer
688688
parameters:
689689
hashBlockSize: asdf
690690
schedulingProfiles:
691691
- name: default
692692
plugins:
693-
- pluginRef: prefixCache
693+
- pluginRef: prefixCacheScorer
694694
weight: 50
695695
`
696696

@@ -703,14 +703,14 @@ kind: EndpointPickerConfig
703703
plugins:
704704
- name: profileHandler
705705
type: single-profile
706-
- name: prefixCache
707-
type: prefix-cache
706+
- name: prefixCacheScorer
707+
type: prefix-cache-scorer
708708
parameters:
709709
hashBlockSize: 32
710710
schedulingProfiles:
711711
- name: default
712712
plugins:
713-
- pluginRef: prefixCache
713+
- pluginRef: prefixCacheScorer
714714
`
715715

716716
// multiple pickers in scheduling profile

pkg/epp/scheduling/framework/plugins/multi/prefix/plugin.go

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -52,7 +52,7 @@ const (
5252
// in vLLM, we will have 250K / 16 = 31.25K blocks.
5353
DefaultLRUCapacityPerServer = 31250
5454

55-
PrefixCachePluginType = "prefix-cache"
55+
PrefixCachePluginType = "prefix-cache-scorer"
5656
)
5757

5858
type Config struct {

test/testdata/inferencepool-e2e.yaml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -154,7 +154,7 @@ data:
154154
plugins:
155155
- type: queue-scorer
156156
- type: kv-cache-scorer
157-
- type: prefix-cache
157+
- type: prefix-cache-scorer
158158
parameters:
159159
hashBlockSize: 64
160160
maxPrefixBlocksToMatch: 256
@@ -170,7 +170,7 @@ data:
170170
weight: 1
171171
- pluginRef: kv-cache-scorer
172172
weight: 1
173-
- pluginRef: prefix-cache
173+
- pluginRef: prefix-cache-scorer
174174
weight: 1
175175
- pluginRef: max-score-picker
176176
---

0 commit comments

Comments
 (0)