Skip to content

Commit

Permalink
Move cutlass_fp8_supported into __init__
Browse files (browse the repository at this point in the history)
  • Loading branch information
zeyugao committed Jul 28, 2024
1 parent cbd081f commit 1386d1e
Showing 1 changed file with 2 additions and 1 deletion.
3 changes: 2 additions & 1 deletion vllm/model_executor/layers/quantization/fbgemm_fp8.py
Original file line number Diff line number Diff line change
Expand Up @@ -73,6 +73,7 @@ class FBGEMMFp8LinearMethod(LinearMethodBase):

def __init__(self, quant_config: FBGEMMFp8Config):
    """Keep the quantization config and evaluate the CUTLASS FP8 check once.

    Args:
        quant_config: Configuration object stored on the instance as
            ``self.quant_config``.
    """
    self.quant_config = quant_config

    # Call cutlass_fp8_supported() a single time at construction; apply()
    # forwards the stored result instead of calling the helper again on
    # every invocation.
    fp8_supported = cutlass_fp8_supported()
    self.cutlass_fp8_supported = fp8_supported

def create_weights(
self,
Expand Down Expand Up @@ -146,5 +147,5 @@ def apply(self,
input_scale=None,
input_scale_ub=layer.input_scale_ub,
bias=bias,
cutlass_fp8_supported=cutlass_fp8_supported(),
cutlass_fp8_supported=self.cutlass_fp8_supported,
use_per_token_if_dynamic=True)

0 comments on commit 1386d1e

Please sign in to comment.