@@ -1875,16 +1875,18 @@ def _get_stats(self,
18751875 # Latency timings
18761876 time_e2e_requests .append (now -
18771877 seq_group .metrics .arrival_time )
1878- time_queue_requests .append (
1879- seq_group .metrics .first_scheduled_time -
1880- seq_group .metrics .arrival_time )
1881- time_prefill_requests .append (
1882- seq_group .metrics .first_token_time -
1883- seq_group .metrics .first_scheduled_time )
1884- time_decode_requests .append (
1885- now - seq_group .metrics .first_token_time )
1886- time_inference_requests .append (
1887- now - seq_group .metrics .first_scheduled_time )
1878+ if (seq_group .metrics .first_scheduled_time is not None and
1879+ seq_group .metrics .first_token_time is not None ):
1880+ time_queue_requests .append (
1881+ seq_group .metrics .first_scheduled_time -
1882+ seq_group .metrics .arrival_time )
1883+ time_prefill_requests .append (
1884+ seq_group .metrics .first_token_time -
1885+ seq_group .metrics .first_scheduled_time )
1886+ time_decode_requests .append (
1887+ now - seq_group .metrics .first_token_time )
1888+ time_inference_requests .append (
1889+ now - seq_group .metrics .first_scheduled_time )
18881890 # Metadata
18891891 num_prompt_tokens_requests .append (
18901892 len (seq_group .prompt_token_ids ))
0 commit comments