Skip to content

Commit 982f911

Browse files
committed
first_scheduled_time can be None
1 parent 3937c1f commit 982f911

File tree

1 file changed: +12 -10 lines changed

1 file changed: +12 -10 lines changed

vllm/engine/llm_engine.py

Lines changed: 12 additions & 10 deletions
Original file line number | Diff line number | Diff line change
@@ -1875,16 +1875,18 @@ def _get_stats(self,
18751875
# Latency timings
18761876
time_e2e_requests.append(now -
18771877
seq_group.metrics.arrival_time)
1878-
time_queue_requests.append(
1879-
seq_group.metrics.first_scheduled_time -
1880-
seq_group.metrics.arrival_time)
1881-
time_prefill_requests.append(
1882-
seq_group.metrics.first_token_time -
1883-
seq_group.metrics.first_scheduled_time)
1884-
time_decode_requests.append(
1885-
now - seq_group.metrics.first_token_time)
1886-
time_inference_requests.append(
1887-
now - seq_group.metrics.first_scheduled_time)
1878+
if (seq_group.metrics.first_scheduled_time is not None and
1879+
seq_group.metrics.first_token_time is not None):
1880+
time_queue_requests.append(
1881+
seq_group.metrics.first_scheduled_time -
1882+
seq_group.metrics.arrival_time)
1883+
time_prefill_requests.append(
1884+
seq_group.metrics.first_token_time -
1885+
seq_group.metrics.first_scheduled_time)
1886+
time_decode_requests.append(
1887+
now - seq_group.metrics.first_token_time)
1888+
time_inference_requests.append(
1889+
now - seq_group.metrics.first_scheduled_time)
18881890
# Metadata
18891891
num_prompt_tokens_requests.append(
18901892
len(seq_group.prompt_token_ids))

0 commit comments

Comments (0)