Skip to content

Commit

Permalink
ping
Browse files Browse the repository at this point in the history
  • Loading branch information
alexm-neuralmagic committed Jul 24, 2024
1 parent 430d5ea commit 4cb2a17
Showing 1 changed file with 1 addition and 1 deletion.
2 changes: 1 addition & 1 deletion vllm/model_executor/layers/quantization/awq_marlin.py
Original file line number Diff line number Diff line change
Expand Up @@ -25,7 +25,7 @@ class AWQMarlinConfig(QuantizationConfig):
def __init__(self, weight_bits: int, group_size: int, has_zp: bool,
lm_head_quantized: bool) -> None:
self.weight_bits = weight_bits
- self.pack_factor = 32 // self.weight_bits # packed into int32
+ self.pack_factor = 32 // self.weight_bits # packed into 32bits
self.group_size = group_size
self.has_zp = has_zp
self.lm_head_quantized = lm_head_quantized
Expand Down

0 comments on commit 4cb2a17

Please sign in to comment.