Skip to content

Commit

Permalink
Remove TODO
Browse files (browse the repository at this point in the history)
  • Loading branch information
s5u13b committed Oct 10, 2024
1 parent 4a79be7 commit 8e6ef6b
Showing 1 changed file with 0 additions and 1 deletion.
1 change: 0 additions & 1 deletion llumnix/backends/vllm/llm_engine.py
Original file line number Diff line number Diff line change
Expand Up @@ -257,7 +257,6 @@ def _put_request_outputs_to_server(self, request_outputs: List[RequestOutput], s
if server_id not in server_info_dict:
server_info_dict[server_id] = server_info
# TODO(s5u13b): Reduce the across-actor overhead.
# TODO(s5u13b): It is not necessary to use async_put_queue_actor when output_queue_type is RayQueue.
self.async_put_queue_actor.put_nowait_to_servers.remote(server_request_outputs, server_info_dict)

class BackendVLLM(BackendInterface):
Expand Down

0 comments on commit 8e6ef6b

Please sign in to comment.