# Patch: lower the container's nvidia.com/gpu limit and request from 2 to 1
# in examples/poc/manifests/vllm/vllm-lora-deployment.yaml.
# NOTE(review): this patch was recovered from a copy whose line breaks and
# leading whitespace had been collapsed. The indentation of the YAML lines
# below is reconstructed from the usual Deployment layout
# (spec.template.spec.containers[]) -- TODO confirm against the target file
# before running `git apply`.
diff --git a/examples/poc/manifests/vllm/vllm-lora-deployment.yaml b/examples/poc/manifests/vllm/vllm-lora-deployment.yaml
index dcd729b0..fc9c1d6b 100644
--- a/examples/poc/manifests/vllm/vllm-lora-deployment.yaml
+++ b/examples/poc/manifests/vllm/vllm-lora-deployment.yaml
@@ -78,9 +78,9 @@ spec:
             timeoutSeconds: 1
           resources:
             limits:
-              nvidia.com/gpu: 2
+              nvidia.com/gpu: 1
             requests:
-              nvidia.com/gpu: 2
+              nvidia.com/gpu: 1
           volumeMounts:
             - mountPath: /data
               name: data