generated from kubernetes/kubernetes-template-project
-
Notifications
You must be signed in to change notification settings - Fork 69
/
Copy pathext_proc.yaml
69 lines (69 loc) · 1.49 KB
/
ext_proc.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
# Deployment running the instance-gateway external-processing (ext-proc)
# server as a single replica in the `default` namespace.
apiVersion: apps/v1
kind: Deployment
metadata:
  name: instance-gateway-ext-proc
  namespace: default
  labels:
    app: instance-gateway-ext-proc
spec:
  replicas: 1
  # The selector must match the pod template labels below.
  selector:
    matchLabels:
      app: instance-gateway-ext-proc
  template:
    metadata:
      labels:
        app: instance-gateway-ext-proc
    spec:
      containers:
        - name: instance-gateway-ext-proc
          image: ghcr.io/tomatillo-and-multiverse/ext-proc:demo
          args:
            # TODO: specify label selector and dynamically update pods
            # Until then the backend pod names and their IP:port endpoints
            # are hard-coded; the two comma-separated lists presumably must
            # stay in the same order (verify against the ext-proc flags).
            - -pods
            - "vllm-78665f78c4-h4kx4,vllm-78665f78c4-hnz84"
            - -podIPs
            - "10.24.11.6:8000,10.24.5.7:8000"
            # Passed as a quoted string so the flag value stays the text
            # "false" instead of being typed as a YAML boolean.
            - -enable-fairness
            - "false"
          ports:
            - containerPort: 9002
        # Sidecar that only runs `sleep 3600`; presumably here for manual
        # in-pod debugging with curl (confirm before relying on it).
        - name: curl
          image: curlimages/curl
          command: ["sleep", "3600"]
---
# ClusterIP Service that exposes TCP port 9002 of the pods labelled
# `app: instance-gateway-ext-proc` inside the cluster.
apiVersion: v1
kind: Service
metadata:
  name: instance-gateway-ext-proc
  namespace: default
spec:
  # Routes to pods carrying this label.
  selector:
    app: instance-gateway-ext-proc
  ports:
    - protocol: TCP
      # Service port and container port are both 9002.
      port: 9002
      targetPort: 9002
  type: ClusterIP
---
# Envoy Gateway extension policy that attaches the ext-proc Service to the
# `llm-route` HTTPRoute as an external processor.
apiVersion: gateway.envoyproxy.io/v1alpha1
kind: EnvoyExtensionPolicy
metadata:
  name: ext-proc-policy
  namespace: default
spec:
  extProc:
    - backendRefs:
        # Empty group selects the core API group, i.e. a plain Service.
        - group: ""
          kind: Service
          name: instance-gateway-ext-proc
          port: 9002
      processingMode:
        request:
          # The request body is buffered before being sent to the processor.
          body: Buffered
        # NOTE(review): a bare `response:` parses as null. If response
        # processing was intended, this probably needs to be `response: {}`;
        # confirm against the Envoy Gateway ExtProc processing-mode docs.
        response:
      messageTimeout: 5s
  # The policy applies to this single HTTPRoute.
  targetRef:
    group: gateway.networking.k8s.io
    kind: HTTPRoute
    name: llm-route