Skip to content

Commit

Permalink
remove comment
Browse files (browse the repository at this point in the history)
  • Loading branch information
charlifu committed Jun 13, 2024
1 parent d61cbff commit cde8b15
Showing 1 changed file with 0 additions and 2 deletions.
2 changes: 0 additions & 2 deletions vllm/model_executor/layers/quantization/fp8_rocm.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -24,10 +24,8 @@
class Fp8RocmConfig(QuantizationConfig):

def __init__(self) -> None:
# self.quantized_weights_path = config["quantized_weights"]
self._tuned = {}
gemm_type = os.getenv("FP8_GEMM", "fp8_16")
#print(f"Integral Cross factor = {self.factor}")
if gemm_type == "fp8_8":
self.gemm_method = Fp8RocmLinearMethod.apply_fp8_8
tuned_filename = "/tmp/tuned_fp8_8.csv"
Expand Down

0 comments on commit cde8b15

Please sign in to comment.