Skip to content

Commit

Permalink
format
Browse files Browse the repository at this point in the history
  • Loading branch information
SageMoore committed Dec 6, 2024
1 parent 1b6f920 commit b9f853b
Showing 1 changed file with 4 additions and 2 deletions.
6 changes: 4 additions & 2 deletions vllm/compilation/backends.py
Original file line number Diff line number Diff line change
Expand Up @@ -253,7 +253,8 @@ def __call__(self, graph: fx.GraphModule, example_inputs) -> Callable:

from torch._dynamo.utils import lazy_format_graph_code
logger.debug("%s", lazy_format_graph_code("before split", self.graph))
- logger.debug("%s", lazy_format_graph_code("after split", self.split_gm))
+ logger.debug("%s", lazy_format_graph_code("after split",
+ self.split_gm))

compilation_counter.num_piecewise_graphs_seen += len(
self.piecewise_graphs)
Expand Down Expand Up @@ -479,7 +480,8 @@ def __call__(self, *args) -> Any:
]
assert new_input_addresses == entry.input_addresses, (
"Input addresses for cudagraphs are different during replay."
- f" Expected {entry.input_addresses}, got {new_input_addresses}")
+ f" Expected {entry.input_addresses}, got {new_input_addresses}"
+ )

entry.cudagraph.replay()
return entry.output

0 comments on commit b9f853b

Please sign in to comment.