Skip to content

Commit

Permalink
Minors
Browse files Browse the repository at this point in the history
  • Loading branch information
s5u13b committed Oct 21, 2024
1 parent 7a69945 commit 2c9842d
Show file tree
Hide file tree
Showing 4 changed files with 5 additions and 5 deletions.
6 changes: 3 additions & 3 deletions llumnix/backends/vllm/llm_engine.py
Original file line number Diff line number Diff line change
Expand Up @@ -362,9 +362,9 @@ def commit_dst_request(self, backend_request: SequenceGroupLlumnix) -> None:
async def send_blocks(self, dst_ray_actor: "ray.actor.ActorHandle", src_blocks: List[int], dst_blocks: List[int]) -> None:
await dst_ray_actor.execute_engine_method.remote("_run_workers",
"migrate_cache",
- dst_blocks=dst_blocks,
- src_blocks=src_blocks,
- src_worker_handle_list=self.worker_handle_list)
+ dst_blocks=dst_blocks,
+ src_blocks=src_blocks,
+ src_worker_handle_list=self.worker_handle_list)

def _run_workers(self, *args, **kwargs):
# pylint: disable=protected-access
Expand Down
1 change: 0 additions & 1 deletion llumnix/backends/vllm/sequence.py
Original file line number Diff line number Diff line change
Expand Up @@ -22,7 +22,6 @@ class SequenceGroupLlumnix(SequenceGroup, LlumnixRequest):
def __init__(self, request_id, server_info, expected_steps: int, *args, **kwargs) -> None:
SequenceGroup.__init__(self, request_id, *args, **kwargs)
LlumnixRequest.__init__(self, request_id, server_info, expected_steps)
- self.try_schedule_times = 0

@property
def prompt_len(self) -> int:
Expand Down
1 change: 1 addition & 0 deletions llumnix/llumlet/request.py
Original file line number Diff line number Diff line change
Expand Up @@ -36,6 +36,7 @@ def __init__(self, request_id: int, server_info: ServerInfo, expected_steps: int
self.last_preemption_time = None
self.stage_timestamps = []
self.stage_num_blocks_list = []
+ self.try_schedule_times = 0
self.waiting_migrating = False
# end-of-migration
self.eom = False
Expand Down
2 changes: 1 addition & 1 deletion tests/e2e_test/test_e2e.py
Original file line number Diff line number Diff line change
Expand Up @@ -59,7 +59,7 @@ def generate_launch_command(result_filename: str = "", launch_ray_cluster: bool
f"--max-model-len {max_model_len} "
f"--dispatch-policy {dispatch_policy} "
f"--trust-remote-code "
- f"--request-migration-policy SR "
+ f"--request-migration-policy LCR "
f"--migration-backend {migration_backend} "
f"--migration-cache-blocks 32 "
f"--tensor-parallel-size 1 "
Expand Down

0 comments on commit 2c9842d

Please sign in to comment.