File tree: 1 file changed (+6 -6 lines changed)
Original file line number | Diff line number | Diff line change
15
15
from utils import ArgPool , Bench , CudaGraphBenchParams
16
16
from weight_shapes import WEIGHT_SHAPES
17
17
18
- from vllm .lora .ops .bgmv_expand import bgmv_expand
19
- from vllm .lora .ops .bgmv_expand_slice import bgmv_expand_slice
20
- from vllm .lora .ops .bgmv_shrink import bgmv_shrink
21
- from vllm .lora .ops .sgmv_expand import sgmv_expand
22
- from vllm .lora .ops .sgmv_shrink import sgmv_shrink
23
- from vllm .lora .ops .utils import _LORA_A_PTR_DICT , _LORA_B_PTR_DICT
18
+ from vllm .lora .ops .triton_ops . bgmv_expand import bgmv_expand
19
+ from vllm .lora .ops .triton_ops . bgmv_expand_slice import bgmv_expand_slice
20
+ from vllm .lora .ops .triton_ops . bgmv_shrink import bgmv_shrink
21
+ from vllm .lora .ops .triton_ops . sgmv_expand import sgmv_expand
22
+ from vllm .lora .ops .triton_ops . sgmv_shrink import sgmv_shrink
23
+ from vllm .lora .ops .triton_ops . utils import _LORA_A_PTR_DICT , _LORA_B_PTR_DICT
24
24
from vllm .utils import FlexibleArgumentParser
25
25
26
26
DEFAULT_MODELS = list (WEIGHT_SHAPES .keys ())
You can’t perform that action at this time.
0 commit comments