diff --git a/vllm/sequence.py b/vllm/sequence.py index 69a6e20ef0512..c5e6729b80aa3 100644 --- a/vllm/sequence.py +++ b/vllm/sequence.py @@ -780,7 +780,7 @@ def get_last_token_latency(self) -> float: "seq_group.get_last_token_latency() should not be called " "if the seq_group is in prefill phase.") return self.last_token_latency - + def maybe_set_first_token_time(self, time: float) -> None: """Sets the first token time for Request level timings.""" # Note: in a case where a sequence_group is swapped and