We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent a79cc68, commit 1b67297 (Copy full SHA for 1b67297)
vllm/model_executor/models/bloom.py
@@ -42,7 +42,7 @@
42
from vllm.model_executor.sampling_metadata import SamplingMetadata
43
from vllm.sequence import IntermediateTensors
44
45
-from .interfaces import SupportsPP, SupportsV0Only
+from .interfaces import SupportsPP, SupportsQuant, SupportsV0Only
46
from .utils import (is_pp_missing_parameter,
47
make_empty_intermediate_tensors_factory, make_layers,
48
maybe_prefix)
@@ -279,7 +279,7 @@ def forward(
279
return hidden_states
280
281
282
-class BloomForCausalLM(nn.Module, SupportsPP, SupportsV0Only):
+class BloomForCausalLM(nn.Module, SupportsPP, SupportsV0Only, SupportsQuant):
283
284
def __init__(self, *, vllm_config: VllmConfig, prefix: str = ""):
285
super().__init__()
0 commit comments