Skip to content

Commit

Permalink
format
Browse files: browse the repository at this point in the history
  • Loading branch information
SageMoore committed Dec 6, 2024
1 parent 407a858 commit 134ae2f
Showing 1 changed file with 1 addition and 6 deletions.
7 changes: 1 addition & 6 deletions benchmarks/benchmark_latency.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -5,7 +5,7 @@
import time
from pathlib import Path
from typing import List, Optional
from vllm.config import CompilationConfig

import numpy as np
import torch
from tqdm import tqdm
Expand All @@ -21,11 +21,6 @@ def main(args: argparse.Namespace):

engine_args = EngineArgs.from_cli_args(args)

config = CompilationConfig(
level=3,
custom_ops=["+silu_and_mul"],
)
engine_args.compilation_config = config
# NOTE(woosuk): If the request cannot be processed in a single batch,
# the engine will automatically process the request in multiple batches.
llm = LLM(**dataclasses.asdict(engine_args))
Expand Down

0 comments on commit 134ae2f

Please sign in to comment.