@@ -153,7 +153,6 @@ def _cpu_yield(self, check_context: bool = True):
         # It is critical for correctness that only one thread is running
         # at a time. These asserts just make sure that this is the only
         # thread running before waking the other one up and going to sleep
-        print(f"CPU yield {self.id} {type(forward_context._forward_context)} {type(self.forward_context)}")
         assert (
             not check_context or
             forward_context._forward_context is self.forward_context)
@@ -172,11 +171,6 @@ def switch_to_comm_sync(self):
         self.update_stream(self.comm_stream)
         self._wait_comm_done()
 
-    def switch_to_compute_sync(self):
-        self._signal_comm_done()
-        self.update_stream(self.compute_stream)
-        self._wait_compute_done()
-
     def maybe_run_recv_hook(self):
         if self.recv_hook is not None:
             self.recv_hook()
@@ -291,7 +285,6 @@ def make_ubatch_contexts(
     comm_stream: torch.cuda.Stream,
     forward_contexts: list[ForwardContext],
     ready_barrier: threading.Barrier,
-    device: Optional[torch.device] = None,
     schedule: Schedule = Schedule.MLP_OVERLAP,
     delayed_start: bool = False,
 ) -> list[UBatchContext]: