File tree 3 files changed +6
-6
lines changed
3 files changed +6
-6
lines changed Original file line number Diff line number Diff line change @@ -40,7 +40,7 @@ roleRef:
40
40
kind : ClusterRole
41
41
name : pod-read
42
42
---
43
- apiVersion : inference.networking.x-k8s.io/v1alpha1
43
+ apiVersion : inference.networking.x-k8s.io/v1alpha2
44
44
kind : InferencePool
45
45
metadata :
46
46
labels :
Original file line number Diff line number Diff line change 1
- apiVersion : inference.networking.x-k8s.io/v1alpha1
1
+ apiVersion : inference.networking.x-k8s.io/v1alpha2
2
2
kind : InferenceModel
3
3
metadata :
4
4
name : inferencemodel-sample
Original file line number Diff line number Diff line change 1
- apiVersion : inference.networking.x-k8s.io/v1alpha1
1
+ apiVersion : inference.networking.x-k8s.io/v1alpha2
2
2
kind : InferencePool
3
3
metadata :
4
4
name : vllm-llama2-7b-pool
10
10
extensionRef :
11
11
name : epp
12
12
---
13
- apiVersion : inference.networking.x-k8s.io/v1alpha1
13
+ apiVersion : inference.networking.x-k8s.io/v1alpha2
14
14
kind : InferenceModel
15
15
metadata :
16
16
name : inferencemodel-sample
24
24
- name : sql-lora-1fdg2
25
25
weight : 100
26
26
---
27
- apiVersion : inference.networking.x-k8s.io/v1alpha1
27
+ apiVersion : inference.networking.x-k8s.io/v1alpha2
28
28
kind : InferenceModel
29
29
metadata :
30
30
name : inferencemodel-sheddable
37
37
- name : sql-lora-1fdg3
38
38
weight : 100
39
39
---
40
- apiVersion : inference.networking.x-k8s.io/v1alpha1
40
+ apiVersion : inference.networking.x-k8s.io/v1alpha2
41
41
kind : InferenceModel
42
42
metadata :
43
43
name : inferencemodel-generic
You can’t perform that action at this time.
0 commit comments