File tree 4 files changed +163
-165
lines changed
examples/dynamic-lora-sidecar
4 files changed +163
-165
lines changed Original file line number Diff line number Diff line change @@ -56,22 +56,26 @@ spec:
56
56
valueFrom :
57
57
secretKeyRef :
58
58
name : hf-token # The name of your Kubernetes Secret
59
- key : HF_TOKEN # The specific key within the Secret
59
+ key : token # The specific key within the Secret
60
60
- name : DYNAMIC_LORA_ROLLOUT_CONFIG
61
61
value: "/config/configmap.yaml"
62
62
volumeMounts :
63
63
- mountPath : /dev/shm
64
64
name : dshm
65
65
initContainers :
66
66
- name : configmap-reader-1
67
+ tty : true
68
+ stdin : true
67
69
image : us-docker.pkg.dev/kunjanp-gke-dev-2/lora-sidecar/sidecar:latest
68
70
restartPolicy : Always
71
+ imagePullPolicy : Always
69
72
env :
70
- DYNAMIC_LORA_ROLLOUT_CONFIG: "/config/configmap.yaml"
73
+ - name : DYNAMIC_LORA_ROLLOUT_CONFIG
74
+ value: "/config/configmap.yaml"
71
75
volumeMounts :
72
76
- name : config-volume
73
- mountPath : /config/configmap.yaml
74
- subPath : configmap.yaml
77
+ mountPath : /config
78
+ # subPath: configmap.yaml
75
79
volumes :
76
80
- name : dshm
77
81
emptyDir :
@@ -106,8 +110,21 @@ data:
106
110
configmap.yaml : |
107
111
vLLMLoRAConfig:
108
112
host: localhost
109
- models:
113
+ name: sql-loras-llama
114
+ port: '8000'
115
+ ensureExist:
116
+ models:
110
117
- base-model: meta-llama/Llama-2-7b-hf
111
118
id: sql-lora-v1
112
119
source: yard1/llama-2-7b-sql-lora-test
113
- name: sql-lora
120
+ - base-model: meta-llama/Llama-2-7b-hf
121
+ id: sql-lora-v3
122
+ source: yard1/llama-2-7b-sql-lora-test
123
+ - base-model: meta-llama/Llama-2-7b-hf
124
+ id: sql-lora-v4
125
+ source: yard1/llama-2-7b-sql-lora-test
126
+ ensureNotExist:
127
+ models:
128
+ - base-model: meta-llama/Llama-2-7b-hf
129
+ id: sql-lora-v2
130
+ source: yard1/llama-2-7b-sql-lora-test
Original file line number Diff line number Diff line change 1
1
aiohttp == 3.10.10
2
2
pyyaml == 6.0.2
3
3
requests == 2.32.3
4
- watchdog == 5.0.3
4
+ watchdog == 5.0.3
5
+ watchfiles == 0.24.0
Original file line number Diff line number Diff line change 1
1
vLLMLoRAConfig :
2
2
host : localhost
3
- models :
4
- - base-model : meta-llama/Llama-2-7b-hf
5
- id : sql-lora-v1
6
- source : yard1/llama-2-7b-sql-lora-test
7
- status :
8
- errors :
9
- - ' '
10
- operation : load
11
- timestamp : 2024-10-23 15:43:07 UTC+0000
12
- toRemove : false
13
- - base-model : meta-llama/Llama-2-7b-hf
14
- id : sql-lora-v2
15
- source : yard1/llama-2-7b-sql-lora-test
16
- status :
17
- errors :
18
- - already unloaded
19
- operation : unload
20
- timestamp : 2024-10-23 15:43:07 UTC+0000
21
- toRemove : true
22
3
name : sql-loras-llama
23
- port: '8000'
4
+ port : 8000
5
+ ensureExist :
6
+ models :
7
+ - base-model : meta-llama/Llama-2-7b-hf
8
+ id : sql-lora-v1
9
+ source : yard1/llama-2-7b-sql-lora-test
10
+ ensureNotExist :
11
+ models :
12
+ - base-model : meta-llama/Llama-2-7b-hf
13
+ id : sql-lora-v2
14
+ source : yard1/llama-2-7b-sql-lora-test
You can’t perform that action at this time.
0 commit comments