forked from kubernetes-sigs/gateway-api-inference-extension
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathgateway.yaml
50 lines (49 loc) · 1.01 KB
/
gateway.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
---
# Gateway exposing two plain-HTTP listeners: `http` on 8080 and `llm-gw` on
# 8081. The HTTPRoute `llm-route` in this file attaches to the `llm-gw`
# listener via `sectionName`.
# NOTE(review): <GATEWAY-NAME> looks like a placeholder to be substituted
# before applying; the same value is used for the GatewayClass name.
apiVersion: gateway.networking.k8s.io/v1
kind: Gateway
metadata:
  name: <GATEWAY-NAME>
spec:
  gatewayClassName: <GATEWAY-NAME>
  listeners:
    - name: http
      protocol: HTTP
      port: 8080
    - name: llm-gw
      protocol: HTTP
      port: 8081
---
# GatewayClass referenced by the Gateway's `gatewayClassName`; it delegates
# Gateways of this class to the controller named below.
# NOTE(review): <GATEWAY-NAME> looks like a placeholder to be substituted
# before applying; it must match the Gateway's `gatewayClassName`.
apiVersion: gateway.networking.k8s.io/v1
kind: GatewayClass
metadata:
  name: <GATEWAY-NAME>
spec:
  controllerName: gateway.envoyproxy.io/gatewayclass-controller
---
# Placeholder Backend used as the backendRef target of the HTTPRoute
# `llm-route`.
apiVersion: gateway.envoyproxy.io/v1alpha1
kind: Backend
metadata:
  name: backend-dummy
spec:
  endpoints:
    - fqdn:
        # Both these values are arbitrary and unused as the PatchPolicy
        # redirects requests.
        hostname: 'foo.bar.com'
        port: 8080
---
# HTTPRoute bound to the `llm-gw` listener of the Gateway; its single rule
# sends all traffic to the `backend-dummy` Backend.
apiVersion: gateway.networking.k8s.io/v1
kind: HTTPRoute
metadata:
  name: llm-route
spec:
  parentRefs:
    # sectionName restricts attachment to the listener named `llm-gw`.
    - name: <GATEWAY-NAME>
      sectionName: llm-gw
  rules:
    - backendRefs:
        - group: gateway.envoyproxy.io
          kind: Backend
          name: backend-dummy
      # NOTE(review): the 24h limits are presumably there so long-running
      # requests are not cut off by the gateway; confirm the intended bound.
      timeouts:
        request: "24h"
        backendRequest: "24h"