Skip to content

Commit 5975c6d

Browse files
Fabhiahn and YuhanLiu11 authored
Added option to specify priority class (#557)
Signed-off-by: Fabijan Marič Vild <[email protected]> Co-authored-by: Yuhan Liu <[email protected]>
1 parent 3bb6b73 commit 5975c6d

File tree

5 files changed

+16
-0
lines changed

5 files changed

+16
-0
lines changed

helm/templates/deployment-cache-server.yaml

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -16,6 +16,9 @@ spec:
1616
labels:
1717
{{- include "chart.cacheserverLabels" . | nindent 8 }}
1818
spec:
19+
{{- if .Values.cacheserverSpec.priorityClassName}}
20+
priorityClassName: {{ .Values.cacheserverSpec.priorityClassName | quote }}
21+
{{- end }}
1922
{{- if .Values.cacheserverSpec.nodeSelectorTerms}}
2023
affinity:
2124
nodeAffinity:

helm/templates/deployment-router.yaml

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -18,6 +18,9 @@ spec:
1818
{{- include "chart.routerLabels" . | nindent 8 }}
1919
spec:
2020
serviceAccountName: {{ .Release.Name }}-router-service-account
21+
{{- if .Values.routerSpec.priorityClassName }}
22+
priorityClassName: {{ .Values.routerSpec.priorityClassName | quote }}
23+
{{- end }}
2124
{{- if .Values.routerSpec.nodeSelectorTerms }}
2225
affinity:
2326
nodeAffinity:

helm/templates/deployment-vllm-multi.yaml

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -43,6 +43,9 @@ spec:
4343
helm-release-name: {{ .Release.Name }}
4444
{{- include "chart.engineLabels" . | nindent 8 }}
4545
spec:
46+
{{- if $modelSpec.priorityClassName }}
47+
priorityClassName: {{ $modelSpec.priorityClassName | quote }}
48+
{{- end }}
4649
{{- if hasKey $modelSpec "initContainer" }}
4750
{{- $container := $modelSpec.initContainer }}
4851
initContainers:

helm/values.schema.json

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -88,6 +88,9 @@
8888
"requestGPUType": {
8989
"type": "string"
9090
},
91+
"priorityClassName": {
92+
"type": "string"
93+
},
9194
"pvcStorage": {
9295
"type": "string"
9396
},

helm/values.yaml

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -18,6 +18,7 @@ servingEngineSpec:
1818
# Each entry in the modelSpec array should contain the following fields:
1919
# - annotations: (Optional, map) The annotations to add to the deployment, e.g., {model: "opt125m"}
2020
# - serviceAccountName: (Optional, string) The name of the service account to use for the deployment, e.g., "vllm-service-account"
21+
# - priorityClassName: (Optional, string) The name of the priority class to set on the deployment's pod spec, e.g., "high-priority"
2122
# - podAnnotations: (Optional, map) The annotations to add to the pod, e.g., {model: "opt125m"}
2223
# - name: (string) The name of the model, e.g., "example-model"
2324
# - repository: (string) The repository of the model, e.g., "vllm/vllm-openai"
@@ -267,6 +268,9 @@ routerSpec:
267268
# -- Number of replicas
268269
replicaCount: 1
269270

271+
# -- Priority class name for the router pods; when left empty, priorityClassName is omitted from the pod spec
272+
priorityClassName: ""
273+
270274
# -- Container port
271275
containerPort: 8000
272276

0 commit comments

Comments
 (0)