File tree Expand file tree Collapse file tree 3 files changed +33
-2
lines changed
config/charts/inferencepool Expand file tree Collapse file tree 3 files changed +33
-2
lines changed Original file line number Diff line number Diff line change @@ -16,7 +16,7 @@ To install via the latest published chart in staging (--version v0 indicates la
16
16
``` txt
17
17
$ helm install vllm-llama3-8b-instruct \
18
18
--set inferencePool.modelServers.matchLabels.app=vllm-llama3-8b-instruct \
19
- --set provider.name=[none|gke] \
19
+ --set provider.name=[none|gke|istio] \
20
20
oci://us-central1-docker.pkg.dev/k8s-staging-images/gateway-api-inference-extension/charts/inferencepool --version v0
21
21
```
22
22
@@ -95,7 +95,7 @@ Use `--set inferencePool.modelServerType=triton-tensorrt-llm` to install for Tri
95
95
$ helm install triton-llama3-8b-instruct \
96
96
--set inferencePool.modelServers.matchLabels.app=triton-llama3-8b-instruct \
97
97
--set inferencePool.modelServerType=triton-tensorrt-llm \
98
- --set provider.name=[none|gke] \
98
+ --set provider.name=[none|gke|istio] \
99
99
oci://us-central1-docker.pkg.dev/k8s-staging-images/gateway-api-inference-extension/charts/inferencepool --version v0
100
100
```
101
101
Original file line number Diff line number Diff line change
1
{{- /*
Istio DestinationRule for the host derived from the
"gateway-api-inference-extension.name" template.

Rendered only when provider.name is "istio" AND
istio.destinationRule.enabled is truthy. The document separator lives inside
both guards so that a disabled rule renders nothing at all (no empty YAML
document).
*/ -}}
{{- if eq .Values.provider.name "istio" }}
{{- if .Values.istio.destinationRule.enabled }}
---
apiVersion: networking.istio.io/v1beta1
kind: DestinationRule
metadata:
  name: {{ include "gateway-api-inference-extension.name" . }}
spec:
  {{- /*
  An explicit istio.destinationRule.host wins; an empty value falls back to
  <name>.<release namespace>.svc.cluster.local. The result is quoted so that
  overrides starting with a YAML indicator (e.g. "*.example.com") stay strings.
  */}}
  host: {{ .Values.istio.destinationRule.host | default (printf "%s.%s.svc.cluster.local" (include "gateway-api-inference-extension.name" .) .Release.Namespace) | quote }}
  trafficPolicy:
    tls:
      mode: SIMPLE
      {{- /*
      Upstream certificate verification is disabled unconditionally.
      NOTE(review): presumably because the target serves a self-signed
      certificate; confirm before relying on this in production.
      */}}
      insecureSkipVerify: true
    {{- /* Optional pass-through of user-supplied connection pool settings. */}}
    {{- with .Values.istio.destinationRule.trafficPolicy.connectionPool }}
    connectionPool:
      {{- toYaml . | nindent 6 }}
    {{- end }}
{{- end }}
{{- end }}
Original file line number Diff line number Diff line change @@ -67,6 +67,7 @@ inferencePool:
67
67
# This will soon be deprecated when upstream GW providers support v1, just doing something simple for now.
68
68
targetPortNumber : 8000
69
69
70
+ # Options: ["gke", "istio", "none"]
70
71
provider :
71
72
name : none
72
73
@@ -75,3 +76,14 @@ provider:
75
76
gke :
76
77
# Set to true if the cluster is an Autopilot cluster.
77
78
autopilot : false
79
+
80
# Istio-specific configuration, read by the DestinationRule template when
# provider.name is "istio".
istio:
  destinationRule:
    # Set to false to skip rendering the DestinationRule entirely.
    enabled: true
    # Provide a way to override the default calculated host.
    # Must stay an empty string (not whitespace) for the calculated default,
    # <name>.<release namespace>.svc.cluster.local, to be used.
    host: ""
    # Optional: Enables customization of the traffic policy.
    # Replace the empty mapping with settings such as the example below.
    trafficPolicy: {}
      # connectionPool:
      #   http:
      #     maxRequestsPerConnection: 256000
You can’t perform that action at this time.
0 commit comments