We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
inf
1 parent 2c19d96, commit a4398fb (Copy full SHA for a4398fb)
vllm/benchmarks/serve.py
@@ -189,9 +189,16 @@ async def get_request(
189
total_requests,
190
request_rate,
191
)
192
+ assert current_request_rate > 0.0, (
193
+ f"Obtained non-positive request rate {current_request_rate}."
194
+ )
195
request_rates.append(current_request_rate)
196
if current_request_rate == float("inf"):
197
delay_ts.append(0)
198
+ elif burstiness == float("inf"):
199
+ # when burstiness tends to infinity, the delay time becomes constant
200
+ # and tends to the inverse of the request rate
201
+ delay_ts.append(1.0 / current_request_rate)
202
else:
203
theta = 1.0 / (current_request_rate * burstiness)
204
0 commit comments