Created
August 14, 2025 11:12
-
-
Save yankay/dbf1a365bcbe86d7c8768ad121509134 to your computer and use it in GitHub Desktop.
部署 GIE
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
# Reference: https://gateway-api-inference-extension.sigs.k8s.io/guides/
# Run: https://gist.github.com/yankay/3193834858f688f1f062e3356832a77f
# Run `minikube tunnel` and leave it running on the side.

# Install the Gateway API CRDs (experimental channel), then Istio.
cd /tmp
# -O overwrites any earlier download; plain wget would save a re-download as
# experimental-install.yaml.1 and kubectl would then apply the stale copy.
wget -O experimental-install.yaml https://github.com/kubernetes-sigs/gateway-api/releases/download/v1.3.0/experimental-install.yaml
kubectl apply -f experimental-install.yaml
# The 1.27-dev object holds the name of the build to fetch. -f makes curl fail
# on an HTTP error instead of storing the error page in TAG.
TAG=$(curl -fsSL https://storage.googleapis.com/istio-build/dev/1.27-dev)
wget -O "istioctl-${TAG}-linux-amd64.tar.gz" "https://storage.googleapis.com/istio-build/dev/${TAG}/istioctl-${TAG}-linux-amd64.tar.gz"
tar -xvf "istioctl-${TAG}-linux-amd64.tar.gz"
./istioctl install --set tag="${TAG}" --set hub=gcr.io/istio-testing --set values.pilot.env.ENABLE_GATEWAY_API_INFERENCE_EXTENSION=true

# Install GIE
cd /root/oss/gateway-api-inference-extension
git checkout v0.5.1 # Important: https://github.com/istio/istio/issues/57219 is not implemented yet
kubectl apply -f config/manifests/vllm/sim-deployment.yaml
kubectl apply -k config/crd
kubectl apply -f config/manifests/inferencemodel.yaml
kubectl apply -f config/manifests/inferencepool-resources.yaml
kubectl apply -f config/manifests/gateway/istio

# Confirm that the HTTPRoute status conditions include Accepted=True and ResolvedRefs=True:
kubectl get httproute llm-route -o yaml
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment