Skip to content

Commit 5d043c1

Browse files
authored
[Quant] Bamba SupportsQuant (vllm-project#14698)
Signed-off-by: Kyle Sayers <[email protected]>
1 parent 36d1ccb commit 5d043c1

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

vllm/model_executor/models/bamba.py

+2 -2
Original file line number | Diff line number | Diff line change
@@ -33,7 +33,7 @@
 from vllm.utils import LayerBlockType
 
 from .interfaces import (HasInnerState, IsHybrid, SupportsLoRA, SupportsPP,
-                         SupportsV0Only)
+                         SupportsQuant, SupportsV0Only)
 from .utils import (is_pp_missing_parameter,
                     make_empty_intermediate_tensors_factory, make_layers,
                     maybe_prefix)
@@ -367,7 +367,7 @@ def forward(
 
 
 class BambaForCausalLM(nn.Module, HasInnerState, SupportsLoRA, SupportsPP,
-                       IsHybrid, SupportsV0Only):
+                       IsHybrid, SupportsV0Only, SupportsQuant):
     packed_modules_mapping = {
         "qkv_proj": [
             "q_proj",

0 commit comments

Comments
 (0)