1616
1717 ```bash
1818 kubectl create secret generic hf-token --from-literal=token=$HF_TOKEN # Your Hugging Face Token with access to the set of Llama models
19- kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/vllm/gpu-deployment.yaml
19+ kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.1.0/config/manifests/vllm/gpu-deployment.yaml
2020 ```
2121
2222--8<-- "site-src/_includes/model-server-cpu.md"
2323
2424 ```bash
25- kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/vllm/cpu-deployment.yaml
25+ kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.1.0/config/manifests/vllm/cpu-deployment.yaml
2626 ```
2727
2828--8<-- "site-src/_includes/model-server-sim.md"
2929
3030 ```bash
31- kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/vllm/sim-deployment.yaml
31+ kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.1.0/config/manifests/vllm/sim-deployment.yaml
3232 ```
3333
3434### Install the Inference Extension CRDs
3535
3636``` bash
37- kubectl apply -f https://github.com/kubernetes-sigs/gateway-api-inference-extension/releases/download/v1.0.2/manifests.yaml
37+ kubectl apply -f https://github.com/kubernetes-sigs/gateway-api-inference-extension/releases/download/v1.1.0/manifests.yaml
3838```
3939
4040### Install the Gateway
@@ -94,7 +94,7 @@ kubectl apply -f https://github.com/kubernetes-sigs/gateway-api-inference-extens
9494 Set the chart version and then select a tab to follow the provider-specific instructions.
9595
9696 ``` bash
97- export IGW_CHART_VERSION=v1.0.2
97+ export IGW_CHART_VERSION=v1.1.0
9898 ```
9999
100100--8<-- "site-src/_includes/epp.md"
@@ -112,7 +112,7 @@ kubectl apply -f https://github.com/kubernetes-sigs/gateway-api-inference-extens
112112 2. Deploy the Inference Gateway:
113113
114114 ```bash
115- kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/gateway/gke/gateway.yaml
115+ kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.1.0/config/manifests/gateway/gke/gateway.yaml
116116 ```
117117
118118 Confirm that the Gateway was assigned an IP address and reports a `Programmed=True` status:
@@ -125,7 +125,7 @@ kubectl apply -f https://github.com/kubernetes-sigs/gateway-api-inference-extens
125125 3. Deploy the HTTPRoute
126126
127127 ```bash
128- kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/gateway/gke/httproute.yaml
128+ kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.1.0/config/manifests/gateway/gke/httproute.yaml
129129 ```
130130
131131 4. Confirm that the HTTPRoute status conditions include `Accepted=True` and `ResolvedRefs=True`:
@@ -180,7 +180,7 @@ kubectl apply -f https://github.com/kubernetes-sigs/gateway-api-inference-extens
180180 1. Deploy the Inference Gateway
181181
182182 ```bash
183- kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/gateway/agentgateway/gateway.yaml
183+ kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.1.0/config/manifests/gateway/agentgateway/gateway.yaml
184184 ```
185185
186186 Confirm that the Gateway was assigned an IP address and reports a `Programmed=True` status:
@@ -191,7 +191,7 @@ kubectl apply -f https://github.com/kubernetes-sigs/gateway-api-inference-extens
191191 2. Deploy the HTTPRoute
192192
193193 ```bash
194- kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/gateway/agentgateway/httproute.yaml
194+ kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.1.0/config/manifests/gateway/agentgateway/httproute.yaml
195195 ```
196196
197197 3. Confirm that the HTTPRoute status conditions include `Accepted=True` and `ResolvedRefs=True`:
@@ -205,7 +205,7 @@ kubectl apply -f https://github.com/kubernetes-sigs/gateway-api-inference-extens
205205Deploy the sample InferenceObjective which allows you to specify priority of requests.
206206
207207 ``` bash
208- kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/inferenceobjective.yaml
208+ kubectl apply -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.1.0/config/manifests/inferenceobjective.yaml
209209 ```
210210
211211--8<-- "site-src/_includes/test.md"
@@ -221,36 +221,36 @@ Deploy the sample InferenceObjective which allows you to specify priority of req
221221
222222 ``` bash
223223 helm uninstall vllm-llama3-8b-instruct
224- kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/inferenceobjective.yaml --ignore-not-found
225- kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/vllm/cpu-deployment.yaml --ignore-not-found
226- kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/vllm/gpu-deployment.yaml --ignore-not-found
227- kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/vllm/sim-deployment.yaml --ignore-not-found
224+ kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.1.0/config/manifests/inferenceobjective.yaml --ignore-not-found
225+ kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.1.0/config/manifests/vllm/cpu-deployment.yaml --ignore-not-found
226+ kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.1.0/config/manifests/vllm/gpu-deployment.yaml --ignore-not-found
227+ kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.1.0/config/manifests/vllm/sim-deployment.yaml --ignore-not-found
228228 kubectl delete secret hf-token --ignore-not-found
229229 ```
230230
231231 1. Uninstall the Gateway API Inference Extension CRDs
232232
233233 ``` bash
234- kubectl delete -f https://github.com/kubernetes-sigs/gateway-api-inference-extension/releases/download/v1.0.2/manifests.yaml --ignore-not-found
234+ kubectl delete -f https://github.com/kubernetes-sigs/gateway-api-inference-extension/releases/download/v1.1.0/manifests.yaml --ignore-not-found
235235 ```
236236
237237 1. Choose one of the following options to clean up the Inference Gateway.
238238
239239=== "GKE"
240240
241241 ``` bash
242- kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/gateway/gke/gateway.yaml --ignore-not-found
243- kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/gateway/gke/healthcheck.yaml --ignore-not-found
244- kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/gateway/gke/gcp-backend-policy.yaml --ignore-not-found
245- kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/gateway/gke/httproute.yaml --ignore-not-found
242+ kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.1.0/config/manifests/gateway/gke/gateway.yaml --ignore-not-found
243+ kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.1.0/config/manifests/gateway/gke/healthcheck.yaml --ignore-not-found
244+ kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.1.0/config/manifests/gateway/gke/gcp-backend-policy.yaml --ignore-not-found
245+ kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.1.0/config/manifests/gateway/gke/httproute.yaml --ignore-not-found
246246 ```
247247
248248=== "Istio"
249249
250250 ``` bash
251- kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/gateway/istio/gateway.yaml --ignore-not-found
252- kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/gateway/istio/destination-rule.yaml --ignore-not-found
253- kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/gateway/istio/httproute.yaml --ignore-not-found
251+ kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.1.0/config/manifests/gateway/istio/gateway.yaml --ignore-not-found
252+ kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.1.0/config/manifests/gateway/istio/destination-rule.yaml --ignore-not-found
253+ kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.1.0/config/manifests/gateway/istio/httproute.yaml --ignore-not-found
254254 ```
255255
256256 The following steps assume you would like to clean up ALL Istio resources that were created in this quickstart guide.
@@ -270,8 +270,8 @@ Deploy the sample InferenceObjective which allows you to specify priority of req
270270=== "Kgateway"
271271
272272 ``` bash
273- kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/gateway/agentgateway/gateway.yaml --ignore-not-found
274- kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.0.2/config/manifests/gateway/agentgateway/httproute.yaml --ignore-not-found
273+ kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.1.0/config/manifests/gateway/agentgateway/gateway.yaml --ignore-not-found
274+ kubectl delete -f https://raw.githubusercontent.com/kubernetes-sigs/gateway-api-inference-extension/refs/tags/v1.1.0/config/manifests/gateway/agentgateway/httproute.yaml --ignore-not-found
275275 ```
276276
277277 The following steps assume you would like to clean up ALL Kgateway resources that were created in this quickstart guide.
0 commit comments