Skip to content

Commit

Permalink
minor updates
Browse files Browse the repository at this point in the history
Signed-off-by: Sage Moore <[email protected]>
  • Loading branch information
SageMoore committed Dec 9, 2024
1 parent 6915fa2 commit 6d4b8d0
Show file tree
Hide file tree
Showing 2 changed files with 1 addition and 3 deletions.
2 changes: 0 additions & 2 deletions tests/kernels/test_fused_quant_activation.py
Original file line number Diff line number Diff line change
Expand Up @@ -16,9 +16,7 @@

def ref_impl(silu_and_mul: SiluAndMul, x: torch.Tensor,
             scale: torch.Tensor) -> torch.Tensor:
    """Reference implementation: activation, then quantization, as two calls.

    Runs ``silu_and_mul.forward_native`` on ``x`` and hands the result,
    together with ``scale``, to ``ops.scaled_fp8_quant``.

    Args:
        silu_and_mul: Layer object whose ``forward_native`` method is applied.
        x: Input tensor passed to the activation.
        scale: Scale tensor forwarded unchanged to ``ops.scaled_fp8_quant``.

    Returns:
        The first element of the pair returned by ``ops.scaled_fp8_quant``;
        the second element is discarded.
    """
    activated = silu_and_mul.forward_native(x)
    quantized, _ = ops.scaled_fp8_quant(activated, scale)
    return quantized

Expand Down
2 changes: 1 addition & 1 deletion vllm/compilation/pass_manager.py
Original file line number Diff line number Diff line change
Expand Up @@ -45,7 +45,7 @@ def configure(self, pass_config: CompilationConfig.PassConfig):
if pass_config.enable_reshape:
self.passes += [RedundantReshapesPass(pass_config)]

if True:
if pass_config.enable_fusion:
self.passes += [FusionPass.instance(pass_config)]
self.passes += [ActivationQuantFusionPass.instance(pass_config)]

Expand Down

0 comments on commit 6d4b8d0

Please sign in to comment.