
Commit 90c7c8b

Update vllm/v1/worker/gpu_model_runner.py
Co-authored-by: Luka Govedič <ProExpertProg@users.noreply.github.com>
Signed-off-by: Lucas Wilkinson <LucasWilkinson@users.noreply.github.com>
1 parent 3fe5d0e commit 90c7c8b

File tree

1 file changed: +1 -1 lines changed

vllm/v1/worker/gpu_model_runner.py

Lines changed: 1 addition & 1 deletion
@@ -2618,7 +2618,7 @@ def _determine_batch_execution_and_padding(
         ubatch_slices, num_tokens_across_dp = None, None
         if self.vllm_config.parallel_config.data_parallel_size > 1:
             # Disable DP padding when running eager to avoid excessive padding when
-            # running prefills. This lets us set enforce_eager on the prefiller in
+            # running prefills. This lets us set cudagraph_mode="NONE" on the prefiller in
             # a P/D setup and still use CUDA graphs (enabled by this padding) on the
             # decoder.
             allow_dp_padding = (
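
For readers outside the vLLM tree, the updated comment describes a prefill/decode (P/D) disaggregated deployment: the prefill instance turns CUDA graphs off, so the DP-padding branch guarded by allow_dp_padding is skipped and long prefills are not padded up, while the decode instance keeps CUDA graphs and therefore keeps the padding. Below is a minimal sketch of that split, not part of this commit; it assumes cudagraph_mode is accepted through compilation_config and that data_parallel_size is a valid keyword argument to vllm.LLM (both may differ across vLLM versions), and the model name is a placeholder.

# Hypothetical P/D sketch (not from this commit). Assumes vLLM accepts
# cudagraph_mode via compilation_config and data_parallel_size as an
# engine argument; the model name is a placeholder.
from vllm import LLM

# Prefill instance: CUDA graphs disabled, so with this change the
# DP-padding branch is skipped and prefill batches are not padded.
prefiller = LLM(
    model="meta-llama/Llama-3.1-8B-Instruct",  # placeholder
    data_parallel_size=2,
    compilation_config={"cudagraph_mode": "NONE"},
)

# Decode instance (in practice a separate process or server): leave
# cudagraph_mode at its default so CUDA graphs stay enabled and DP
# padding keeps batch shapes graph-capturable across ranks.
decoder = LLM(
    model="meta-llama/Llama-3.1-8B-Instruct",  # placeholder
    data_parallel_size=2,
)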
