File tree 1 file changed +6
-0
lines changed
1 file changed +6
-0
lines changed Original file line number Diff line number Diff line change @@ -2051,6 +2051,11 @@ def __post_init__(self):
2051
2051
f"max_cpu_loras ({ self .max_cpu_loras } ) must be >= "
2052
2052
f"max_loras ({ self .max_loras } )" )
2053
2053
2054
+ def verify_with_cache_config (self , cache_config : CacheConfig ):
2055
+ # TODO: Add CPU offload support for LoRA; until then, reject the combination.
2056
+ if cache_config .cpu_offload_gb > 0 :
2057
+ raise ValueError ("CPU offload is not supported with LoRA yet." )
2058
+
2054
2059
def verify_with_model_config (self , model_config : ModelConfig ):
2055
2060
if self .lora_dtype in (None , "auto" ):
2056
2061
self .lora_dtype = model_config .dtype
@@ -3138,6 +3143,7 @@ def __post_init__(self):
3138
3143
self .cache_config .verify_with_parallel_config (self .parallel_config )
3139
3144
3140
3145
if self .lora_config :
3146
+ self .lora_config .verify_with_cache_config (self .cache_config )
3141
3147
self .lora_config .verify_with_model_config (self .model_config )
3142
3148
self .lora_config .verify_with_scheduler_config (
3143
3149
self .scheduler_config )
You can’t perform that action at this time.
0 commit comments