mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-05-19 15:57:01 +08:00
[Feature][Benchmarks] Support inf burstiness (#26941)
Signed-off-by: Sophie du Couédic <sop@zurich.ibm.com>
This commit is contained in:
parent
2c19d96777
commit
a4398fbb5e
@@ -189,9 +189,16 @@ async def get_request(
|
|||||||
total_requests,
|
total_requests,
|
||||||
request_rate,
|
request_rate,
|
||||||
)
|
)
|
||||||
|
assert current_request_rate > 0.0, (
|
||||||
|
f"Obtained non-positive request rate {current_request_rate}."
|
||||||
|
)
|
||||||
request_rates.append(current_request_rate)
|
request_rates.append(current_request_rate)
|
||||||
if current_request_rate == float("inf"):
|
if current_request_rate == float("inf"):
|
||||||
delay_ts.append(0)
|
delay_ts.append(0)
|
||||||
|
elif burstiness == float("inf"):
|
||||||
|
# when burstiness tends to infinity, the delay time becomes constant
|
||||||
|
# and tends to the inverse of the request rate
|
||||||
|
delay_ts.append(1.0 / current_request_rate)
|
||||||
else:
|
else:
|
||||||
theta = 1.0 / (current_request_rate * burstiness)
|
theta = 1.0 / (current_request_rate * burstiness)
|
||||||
|
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user