Skip to content

Commit b18f54f

Browse files
committed
remove bitpacking value
1 parent 769215a commit b18f54f

File tree

1 file changed

+0
-3
lines changed

1 file changed

+0
-3
lines changed

hqq/utils/vllm.py

Lines changed: 0 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -463,8 +463,6 @@ def get_quant_method(
463 463
class HQQGemLiteVLLMLinear(HQQBaseVLLMLinear):
464 464
"""Linear HQQ VLLM with GemLite backend"""
465 465

466 -
gemlite_packing_bitwidth = 32
467 -
468 466
def __init__(
469 467
self,
470 468
quant_config: QuantizationConfig,
@@ -492,7 +490,6 @@ def process_weights_after_loading(self, layer: torch.nn.Module) -> None:
492 490
layer.scale.view(-1, 1),
493 491
layer.zero.view(-1, 1),
494 492
bias=None,
495 -
packing_bitwidth=HQQGemLiteVLLMLinear.gemlite_packing_bitwidth,
496 493
)
497 494

498 495
layer.gemlite_linear = gemlite_linear

0 commit comments

Comments
 (0)