diff --git a/vllm/engine/llm_engine.py b/vllm/engine/llm_engine.py index e1f21f90f9083..900206d5a80fb 100644 --- a/vllm/engine/llm_engine.py +++ b/vllm/engine/llm_engine.py @@ -1666,7 +1666,7 @@ def _get_stats(self, finished_reason_requests: List[str] = [] # NOTE: This loop assumes prefill seq_groups are before - # decode seq_groups in scheduled_seq_groups. + # decode seq_groups in scheduled_seq_groups if scheduler_outputs is not None: # For async postprocessor, already finished sequences need to be # not counted. (to avoid double counting)