From 751e6c83f03fb41db9def00628938e5128c26483 Mon Sep 17 00:00:00 2001 From: Xinyi-ECNU <1668529909@qq.com> Date: Tue, 24 Sep 2024 21:11:07 +0800 Subject: [PATCH] fix ci --- llumnix/backends/vllm/scheduler.py | 12 ++++++------ llumnix/llumlet/llumlet.py | 1 + 2 files changed, 7 insertions(+), 6 deletions(-) diff --git a/llumnix/backends/vllm/scheduler.py b/llumnix/backends/vllm/scheduler.py index dcf00d7..430b5e4 100644 --- a/llumnix/backends/vllm/scheduler.py +++ b/llumnix/backends/vllm/scheduler.py @@ -207,16 +207,16 @@ def schedule(self) -> Tuple[List[SequenceGroupMetadata], SchedulerOutputs]: return seq_group_metadata_list, scheduler_outputs def _schedule_running(self, running_queue: deque, *args, **kwargs): - filtered_running_queue = [] - remove_running = [] - for seq_group in list(running_queue): + filtered_running_queue = deque() + remove_running = deque() + for seq_group in running_queue: if seq_group.output_len >= seq_group.expected_steps: - remove_running.append(seq_group) + remove_running.extend([seq_group]) else: - filtered_running_queue.append(seq_group) + filtered_running_queue.extend([seq_group]) remaining_running, running_scheduled = super()._schedule_running(filtered_running_queue, *args, **kwargs) for seq_group in remove_running: - remaining_running.append(seq_group) + remaining_running.extend([seq_group]) return remaining_running, running_scheduled def add_seq_group(self, *args, **kwargs): diff --git a/llumnix/llumlet/llumlet.py b/llumnix/llumlet/llumlet.py index 9a12b83..f04e4eb 100644 --- a/llumnix/llumlet/llumlet.py +++ b/llumnix/llumlet/llumlet.py @@ -120,6 +120,7 @@ def migrate_out(self, dst_instance_name: str, num_requests: int) -> List[str]: migrate_out_request.stage_timestamps.append(time.time()) self.backend_engine.remove_migrating_out_request_last_stage(migrate_out_request) else: + migrate_out_request.reset_migration_args() ray.get(migrate_in_ray_actor.execute_migration_method.remote("free_dst_pre_alloc_cache", migrate_out_request.request_id)) continue_migrate = False t1 = time.time()