1818
1919 ```bash
2020 kubectl create secret generic hf-token --from-literal=token=$HF_TOKEN # Your Hugging Face Token with access to the set of Llama models
21- kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.2.0-rc.1/config/manifests/vllm/gpu-deployment.yaml
21+ kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.2.0/config/manifests/vllm/gpu-deployment.yaml
2222 ```
2323
2424--8<-- "site-src/_includes/model-server-cpu.md"
2525
2626 ```bash
27- kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.2.0-rc.1/config/manifests/vllm/cpu-deployment.yaml
27+ kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.2.0/config/manifests/vllm/cpu-deployment.yaml
2828 ```
2929
3030--8<-- "site-src/_includes/model-server-sim.md"
3131
3232 ```bash
33- kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.2.0-rc.1/config/manifests/vllm/sim-deployment.yaml
33+ kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.2.0/config/manifests/vllm/sim-deployment.yaml
3434 ```
3535
3636### Install the Inference Extension CRDs
3737
3838``` bash
39- kubectl apply -f https://github.com/kubernetes-sigs/gateway-api-inference-extension/releases/download/v1.2.0-rc.1/manifests.yaml
39+ kubectl apply -f https://github.com/kubernetes-sigs/gateway-api-inference-extension/releases/download/v1.2.0/manifests.yaml
4040```
4141
4242### Install the Gateway
@@ -111,7 +111,7 @@ kubectl apply -f https://github.com/kubernetes-sigs/gateway-api-inference-extens
111111 Set the chart version and then select a tab to follow the provider-specific instructions.
112112
113113 ``` bash
114- export IGW_CHART_VERSION=v1.2.0-rc.1
114+ export IGW_CHART_VERSION=v1.2.0
115115 ```
116116
117117--8<-- "site-src/_includes/epp.md"
@@ -129,7 +129,7 @@ kubectl apply -f https://github.com/kubernetes-sigs/gateway-api-inference-extens
129129 1. Deploy the Inference Gateway:
130130
131131 ```bash
132- kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.2.0-rc.1/config/manifests/gateway/gke/gateway.yaml
132+ kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.2.0/config/manifests/gateway/gke/gateway.yaml
133133 ```
134134
135135 Confirm that the Gateway was assigned an IP address and reports a `Programmed=True` status:
@@ -142,7 +142,7 @@ kubectl apply -f https://github.com/kubernetes-sigs/gateway-api-inference-extens
142142 1. Deploy the HTTPRoute:
143143
144144 ```bash
145- kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.2.0-rc.1/config/manifests/gateway/gke/httproute.yaml
145+ kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.2.0/config/manifests/gateway/gke/httproute.yaml
146146 ```
147147
148148 1. Confirm that the HTTPRoute status conditions include `Accepted=True` and `ResolvedRefs=True`:
@@ -191,7 +191,7 @@ kubectl apply -f https://github.com/kubernetes-sigs/gateway-api-inference-extens
191191 1. Deploy the Inference Gateway:
192192
193193 ```bash
194- kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.2.0-rc.1/config/manifests/gateway/agentgateway/gateway.yaml
194+ kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.2.0/config/manifests/gateway/agentgateway/gateway.yaml
195195 ```
196196
197197 Confirm that the Gateway was assigned an IP address and reports a `Programmed=True` status:
@@ -202,7 +202,7 @@ kubectl apply -f https://github.com/kubernetes-sigs/gateway-api-inference-extens
202202 1. Deploy the HTTPRoute:
203203
204204 ```bash
205- kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.2.0-rc.1/config/manifests/gateway/agentgateway/httproute.yaml
205+ kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.2.0/config/manifests/gateway/agentgateway/httproute.yaml
206206 ```
207207
208208 1. Confirm that the HTTPRoute status conditions include `Accepted=True` and `ResolvedRefs=True`:
@@ -267,7 +267,7 @@ kubectl apply -f https://github.com/kubernetes-sigs/gateway-api-inference-extens
267267Deploy the sample InferenceObjective which allows you to specify priority of requests.
268268
269269 ``` bash
270- kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.2.0-rc.1/config/manifests/inferenceobjective.yaml
270+ kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.2.0/config/manifests/inferenceobjective.yaml
271271 ```
272272
273273--8<-- "site-src/_includes/test.md"
@@ -283,35 +283,35 @@ Deploy the sample InferenceObjective which allows you to specify priority of req
283283
284284 ``` bash
285285 helm uninstall vllm-llama3-8b-instruct
286- kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.2.0-rc.1/config/manifests/inferenceobjective.yaml --ignore-not-found
287- kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.2.0-rc.1/config/manifests/vllm/cpu-deployment.yaml --ignore-not-found
288- kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.2.0-rc.1/config/manifests/vllm/gpu-deployment.yaml --ignore-not-found
289- kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.2.0-rc.1/config/manifests/vllm/sim-deployment.yaml --ignore-not-found
286+ kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.2.0/config/manifests/inferenceobjective.yaml --ignore-not-found
287+ kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.2.0/config/manifests/vllm/cpu-deployment.yaml --ignore-not-found
288+ kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.2.0/config/manifests/vllm/gpu-deployment.yaml --ignore-not-found
289+ kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.2.0/config/manifests/vllm/sim-deployment.yaml --ignore-not-found
290290 kubectl delete secret hf-token --ignore-not-found
291291 ```
292292
293293 1. Uninstall the Gateway API Inference Extension CRDs:
294294
295295 ``` bash
296- kubectl delete -f https://github.com/kubernetes-sigs/gateway-api-inference-extension/releases/download/v1.2.0-rc.1/manifests.yaml --ignore-not-found
296+ kubectl delete -f https://github.com/kubernetes-sigs/gateway-api-inference-extension/releases/download/v1.2.0/manifests.yaml --ignore-not-found
297297 ```
298298
299299 1. Choose one of the following options to clean up the Inference Gateway.
300300
301301=== "GKE"
302302
303303 ``` bash
304- kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.2.0-rc.1/config/manifests/gateway/gke/gateway.yaml --ignore-not-found
305- kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.2.0-rc.1/config/manifests/gateway/gke/healthcheck.yaml --ignore-not-found
306- kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.2.0-rc.1/config/manifests/gateway/gke/gcp-backend-policy.yaml --ignore-not-found
307- kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.2.0-rc.1/config/manifests/gateway/gke/httproute.yaml --ignore-not-found
304+ kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.2.0/config/manifests/gateway/gke/gateway.yaml --ignore-not-found
305+ kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.2.0/config/manifests/gateway/gke/healthcheck.yaml --ignore-not-found
306+ kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.2.0/config/manifests/gateway/gke/gcp-backend-policy.yaml --ignore-not-found
307+ kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.2.0/config/manifests/gateway/gke/httproute.yaml --ignore-not-found
308308 ```
309309
310310=== "Istio"
311311
312312 ``` bash
313- kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.2.0-rc.1/config/manifests/gateway/istio/gateway.yaml --ignore-not-found
314- kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.2.0-rc.1/config/manifests/gateway/istio/httproute.yaml --ignore-not-found
313+ kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.2.0/config/manifests/gateway/istio/gateway.yaml --ignore-not-found
314+ kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.2.0/config/manifests/gateway/istio/httproute.yaml --ignore-not-found
315315 ```
316316
317317 The following steps assume you would like to clean up ALL Istio resources that were created in this quickstart guide.
@@ -331,8 +331,8 @@ Deploy the sample InferenceObjective which allows you to specify priority of req
331331=== "Kgateway"
332332
333333 ``` bash
334- kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.2.0-rc.1/config/manifests/gateway/agentgateway/gateway.yaml --ignore-not-found
335- kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.2.0-rc.1/config/manifests/gateway/agentgateway/httproute.yaml --ignore-not-found
334+ kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.2.0/config/manifests/gateway/agentgateway/gateway.yaml --ignore-not-found
335+ kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.2.0/config/manifests/gateway/agentgateway/httproute.yaml --ignore-not-found
336336 ```
337337
338338 The following steps assume you would like to clean up ALL Kgateway resources that were created in this quickstart guide.
0 commit comments