1616
1717 ```bash
1818 kubectl create secret generic hf-token --from-literal=token=$HF_TOKEN # Your Hugging Face Token with access to the set of Llama models
19- kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.1/config/manifests/vllm/gpu-deployment.yaml
19+ kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/vllm/gpu-deployment.yaml
2020 ```
2121
2222--8<-- "site-src/_includes/model-server-cpu.md"
2323
2424 ```bash
25- kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.1/config/manifests/vllm/cpu-deployment.yaml
25+ kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/vllm/cpu-deployment.yaml
2626 ```
2727
2828--8<-- "site-src/_includes/model-server-sim.md"
2929
3030 ```bash
31- kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.1/config/manifests/vllm/sim-deployment.yaml
31+ kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/vllm/sim-deployment.yaml
3232 ```
3333
3434### Install the Inference Extension CRDs
3535
3636``` bash
37- kubectl apply -f https://github.com/kubernetes-sigs/gateway-api-inference-extension/releases/download/v1.0.1/v1-manifests.yaml
37+ kubectl apply -f https://github.com/kubernetes-sigs/gateway-api-inference-extension/releases/download/v1.0.2/v1-manifests.yaml
3838```
3939
4040### Deploy the InferencePool and Endpoint Picker Extension
@@ -44,7 +44,7 @@ kubectl apply -f https://github.com/kubernetes-sigs/gateway-api-inference-extens
4444 Set the chart version and then select a tab to follow the provider-specific instructions.
4545
4646 ``` bash
47- export IGW_CHART_VERSION=v1.0.1
47+ export IGW_CHART_VERSION=v1.0.2
4848 ```
4949
5050--8<-- "site-src/_includes/epp.md"
@@ -62,7 +62,7 @@ kubectl apply -f https://github.com/kubernetes-sigs/gateway-api-inference-extens
6262 2. Deploy Inference Gateway:
6363
6464 ```bash
65- kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.1/config/manifests/gateway/gke/gateway.yaml
65+ kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/gateway/gke/gateway.yaml
6666 ```
6767
6868 Confirm that the Gateway was assigned an IP address and reports a `Programmed=True` status:
@@ -75,7 +75,7 @@ kubectl apply -f https://github.com/kubernetes-sigs/gateway-api-inference-extens
7575 3. Deploy the HTTPRoute
7676
7777 ```bash
78- kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.1/config/manifests/gateway/gke/httproute.yaml
78+ kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/gateway/gke/httproute.yaml
7979 ```
8080
8181 4. Confirm that the HTTPRoute status conditions include `Accepted=True` and `ResolvedRefs=True`:
@@ -167,7 +167,7 @@ kubectl apply -f https://github.com/kubernetes-sigs/gateway-api-inference-extens
167167 4. Deploy the Gateway
168168
169169 ```bash
170- kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.1/config/manifests/gateway/kgateway/gateway.yaml
170+ kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/gateway/kgateway/gateway.yaml
171171 ```
172172
173173 Confirm that the Gateway was assigned an IP address and reports a `Programmed=True` status:
@@ -180,7 +180,7 @@ kubectl apply -f https://github.com/kubernetes-sigs/gateway-api-inference-extens
180180 5. Deploy the HTTPRoute
181181
182182 ```bash
183- kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.1/config/manifests/gateway/kgateway/httproute.yaml
183+ kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/gateway/kgateway/httproute.yaml
184184 ```
185185
186186 6. Confirm that the HTTPRoute status conditions include `Accepted=True` and `ResolvedRefs=True`:
@@ -214,7 +214,7 @@ kubectl apply -f https://github.com/kubernetes-sigs/gateway-api-inference-extens
214214 4. Deploy the Gateway
215215
216216 ```bash
217- kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.1/config/manifests/gateway/agentgateway/gateway.yaml
217+ kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/gateway/agentgateway/gateway.yaml
218218 ```
219219
220220 Confirm that the Gateway was assigned an IP address and reports a `Programmed=True` status:
@@ -227,7 +227,7 @@ kubectl apply -f https://github.com/kubernetes-sigs/gateway-api-inference-extens
227227 5. Deploy the HTTPRoute
228228
229229 ```bash
230- kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.1/config/manifests/gateway/agentgateway/httproute.yaml
230+ kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/gateway/agentgateway/httproute.yaml
231231 ```
232232
233233 6. Confirm that the HTTPRoute status conditions include `Accepted=True` and `ResolvedRefs=True`:
@@ -241,7 +241,7 @@ kubectl apply -f https://github.com/kubernetes-sigs/gateway-api-inference-extens
241241Deploy the sample InferenceObjective, which allows you to specify the priority of requests.
242242
243243 ``` bash
244- kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.1/config/manifests/inferenceobjective.yaml
244+ kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/inferenceobjective.yaml
245245 ```
246246
247247--8<-- "site-src/_includes/test.md"
@@ -257,36 +257,36 @@ Deploy the sample InferenceObjective which allows you to specify priority of req
257257
258258 ``` bash
259259 helm uninstall vllm-llama3-8b-instruct
260- kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.1/config/manifests/inferenceobjective.yaml --ignore-not-found
261- kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.1/config/manifests/vllm/cpu-deployment.yaml --ignore-not-found
262- kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.1/config/manifests/vllm/gpu-deployment.yaml --ignore-not-found
263- kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.1/config/manifests/vllm/sim-deployment.yaml --ignore-not-found
260+ kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/inferenceobjective.yaml --ignore-not-found
261+ kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/vllm/cpu-deployment.yaml --ignore-not-found
262+ kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/vllm/gpu-deployment.yaml --ignore-not-found
263+ kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/vllm/sim-deployment.yaml --ignore-not-found
264264 kubectl delete secret hf-token --ignore-not-found
265265 ```
266266
267267 1. Uninstall the Gateway API Inference Extension CRDs
268268
269269 ``` bash
270- kubectl delete -k https://github.com/kubernetes-sigs/gateway-api-inference-extension/releases/download/v1.0.1/manifests.yaml --ignore-not-found
270+ kubectl delete -f https://github.com/kubernetes-sigs/gateway-api-inference-extension/releases/download/v1.0.2/manifests.yaml --ignore-not-found
271271 ```
272272
273273 1. Choose one of the following options to clean up the Inference Gateway.
274274
275275=== "GKE"
276276
277277 ``` bash
278- kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.1/config/manifests/gateway/gke/gateway.yaml --ignore-not-found
279- kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.1/config/manifests/gateway/gke/healthcheck.yaml --ignore-not-found
280- kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.1/config/manifests/gateway/gke/gcp-backend-policy.yaml --ignore-not-found
281- kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.1/config/manifests/gateway/gke/httproute.yaml --ignore-not-found
278+ kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/gateway/gke/gateway.yaml --ignore-not-found
279+ kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/gateway/gke/healthcheck.yaml --ignore-not-found
280+ kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/gateway/gke/gcp-backend-policy.yaml --ignore-not-found
281+ kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/gateway/gke/httproute.yaml --ignore-not-found
282282 ```
283283
284284=== "Istio"
285285
286286 ``` bash
287- kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.1/config/manifests/gateway/istio/gateway.yaml --ignore-not-found
288- kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.1/config/manifests/gateway/istio/destination-rule.yaml --ignore-not-found
289- kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.1/config/manifests/gateway/istio/httproute.yaml --ignore-not-found
287+ kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/gateway/istio/gateway.yaml --ignore-not-found
288+ kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/gateway/istio/destination-rule.yaml --ignore-not-found
289+ kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/gateway/istio/httproute.yaml --ignore-not-found
290290 ```
291291
292292 The following steps assume you would like to clean up ALL Istio resources that were created in this quickstart guide.
@@ -306,8 +306,8 @@ Deploy the sample InferenceObjective which allows you to specify priority of req
306306=== "Kgateway"
307307
308308 ``` bash
309- kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.1/config/manifests/gateway/kgateway/gateway.yaml --ignore-not-found
310- kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.1/config/manifests/gateway/kgateway/httproute.yaml --ignore-not-found
309+ kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/gateway/kgateway/gateway.yaml --ignore-not-found
310+ kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/gateway/kgateway/httproute.yaml --ignore-not-found
311311 ```
312312
313313 The following steps assume you would like to clean up ALL Kgateway resources that were created in this quickstart guide.
@@ -333,8 +333,8 @@ Deploy the sample InferenceObjective which allows you to specify priority of req
333333=== "Agentgateway"
334334
335335 ``` bash
336- kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.1/config/manifests/gateway/agentgateway/gateway.yaml --ignore-not-found
337- kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.1/config/manifests/gateway/agentgateway/httproute.yaml --ignore-not-found
336+ kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/gateway/agentgateway/gateway.yaml --ignore-not-found
337+ kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/gateway/agentgateway/httproute.yaml --ignore-not-found
338338 ```
339339
340340 The following steps assume you would like to clean up ALL Kgateway resources that were created in this quickstart guide.
0 commit comments