Skip to content

Commit fac33cc

Browse files
committed
rename my-pool to vllm-llama2-7b
1 parent 9927ff4 commit fac33cc

File tree

5 files changed

+20
-20
lines changed

5 files changed

+20
-20
lines changed

config/manifests/inferencepool.yaml

+10 -10
Original file line number | Diff line number | Diff line change
@@ -2,22 +2,22 @@ apiVersion: inference.networking.x-k8s.io/v1alpha2
22
kind: InferencePool
33
metadata:
44
labels:
5-
name: my-pool
5+
name: vllm-llama2-7b
66
spec:
77
targetPortNumber: 8000
88
selector:
9-
app: my-pool
9+
app: vllm-llama2-7b
1010
extensionRef:
11-
name: my-pool-epp
11+
name: vllm-llama2-7b-epp
1212
---
1313
apiVersion: v1
1414
kind: Service
1515
metadata:
16-
name: my-pool-epp
16+
name: vllm-llama2-7b-epp
1717
namespace: default
1818
spec:
1919
selector:
20-
app: my-pool-epp
20+
app: vllm-llama2-7b-epp
2121
ports:
2222
- protocol: TCP
2323
port: 9002
@@ -27,27 +27,27 @@ spec:
2727
apiVersion: apps/v1
2828
kind: Deployment
2929
metadata:
30-
name: my-pool-epp
30+
name: vllm-llama2-7b-epp
3131
namespace: default
3232
labels:
33-
app: my-pool-epp
33+
app: vllm-llama2-7b-epp
3434
spec:
3535
replicas: 1
3636
selector:
3737
matchLabels:
38-
app: my-pool-epp
38+
app: vllm-llama2-7b-epp
3939
template:
4040
metadata:
4141
labels:
42-
app: my-pool-epp
42+
app: vllm-llama2-7b-epp
4343
spec:
4444
containers:
4545
- name: epp
4646
image: us-central1-docker.pkg.dev/k8s-staging-images/gateway-api-inference-extension/epp:main
4747
imagePullPolicy: Always
4848
args:
4949
- -poolName
50-
- "my-pool"
50+
- "vllm-llama2-7b"
5151
- -v
5252
- "4"
5353
- -grpcPort

config/manifests/vllm/cpu-deployment.yaml

+3 -3
Original file line number | Diff line number | Diff line change
@@ -1,16 +1,16 @@
11
apiVersion: apps/v1
22
kind: Deployment
33
metadata:
4-
name: my-pool
4+
name: vllm-llama2-7b
55
spec:
66
replicas: 3
77
selector:
88
matchLabels:
9-
app: my-pool
9+
app: vllm-llama2-7b
1010
template:
1111
metadata:
1212
labels:
13-
app: my-pool
13+
app: vllm-llama2-7b
1414
spec:
1515
containers:
1616
- name: lora

config/manifests/vllm/gpu-deployment.yaml

+3 -3
Original file line number | Diff line number | Diff line change
@@ -1,16 +1,16 @@
11
apiVersion: apps/v1
22
kind: Deployment
33
metadata:
4-
name: my-pool
4+
name: vllm-llama2-7b
55
spec:
66
replicas: 3
77
selector:
88
matchLabels:
9-
app: my-pool
9+
app: vllm-llama2-7b
1010
template:
1111
metadata:
1212
labels:
13-
app: my-pool
13+
app: vllm-llama2-7b
1414
spec:
1515
containers:
1616
- name: lora

test/e2e/epp/e2e_suite_test.go

+2 -2
Original file line number | Diff line number | Diff line change
@@ -57,15 +57,15 @@ const (
5757
// TODO [danehans]: Must be "default" until https://github.com/kubernetes-sigs/gateway-api-inference-extension/issues/227 is fixed
5858
nsName = "default"
5959
// modelServerName is the name of the model server test resources.
60-
modelServerName = "my-pool"
60+
modelServerName = "vllm-llama2-7b"
6161
// modelName is the test model name.
6262
modelName = "tweet-summary"
6363
// envoyName is the name of the envoy proxy test resources.
6464
envoyName = "envoy"
6565
// envoyPort is the listener port number of the test envoy proxy.
6666
envoyPort = "8081"
6767
// inferExtName is the name of the inference extension test resources.
68-
inferExtName = "my-pool-epp"
68+
inferExtName = "vllm-llama2-7b-epp"
6969
// clientManifest is the manifest for the client test resources.
7070
clientManifest = "../../testdata/client.yaml"
7171
// modelServerSecretManifest is the manifest for the model server secret resource.

test/testdata/envoy.yaml

+2 -2
Original file line number | Diff line number | Diff line change
@@ -100,7 +100,7 @@ data:
100100
grpc_service:
101101
envoy_grpc:
102102
cluster_name: ext_proc
103-
authority: my-pool-epp.default:9002
103+
authority: vllm-llama2-7b-epp.default:9002
104104
timeout: 10s
105105
processing_mode:
106106
request_header_mode: SEND
@@ -194,7 +194,7 @@ data:
194194
- endpoint:
195195
address:
196196
socket_address:
197-
address: my-pool-epp.default
197+
address: vllm-llama2-7b-epp.default
198198
port_value: 9002
199199
health_status: HEALTHY
200200
load_balancing_weight: 1

0 commit comments

Comments
 (0)