We read every piece of feedback and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 28f3999 commit 59272c1 · Copy full SHA for 59272c1
pkg/manifests/ext_proc.yaml
@@ -49,7 +49,6 @@ spec:
49
containers:
50
- name: inference-gateway-ext-proc
51
# TODO(https://github.com/kubernetes-sigs/llm-instance-gateway/issues/34) Update the image and args.
52
- image: us-central1-docker.pkg.dev/k8s-staging-images/llm-instance-gateway/epp:main
53
args:
54
- -serverPoolName
55
- "vllm-llama2-7b-pool"
@@ -59,7 +58,8 @@ spec:
59
58
60
ports:
61
- containerPort: 9002
62
-
+ - name: metrics
+ containerPort: 9090
63
- name: curl
64
image: curlimages/curl
65
command: ["sleep", "3600"]
0 commit comments