mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-16 12:35:01 +08:00
Fix raw_request extraction in load_aware_call decorator (#15382)
Signed-off-by: Daniel Salib <danielsalib@meta.com>
This commit is contained in:
parent
6c663dfd5e
commit
5aefd6ac31
@@ -68,13 +68,20 @@ def decrement_server_load(request: Request):
|
|||||||
def load_aware_call(func):
|
def load_aware_call(func):
|
||||||
|
|
||||||
@functools.wraps(func)
|
@functools.wraps(func)
|
||||||
async def wrapper(*args, raw_request: Request, **kwargs):
|
async def wrapper(*args, **kwargs):
|
||||||
|
raw_request = kwargs.get("raw_request",
|
||||||
|
args[1] if len(args) > 1 else None)
|
||||||
|
|
||||||
|
if raw_request is None:
|
||||||
|
raise ValueError(
|
||||||
|
"raw_request required when server load tracking is enabled")
|
||||||
|
|
||||||
if not raw_request.app.state.enable_server_load_tracking:
|
if not raw_request.app.state.enable_server_load_tracking:
|
||||||
return await func(*args, raw_request=raw_request, **kwargs)
|
return await func(*args, **kwargs)
|
||||||
|
|
||||||
raw_request.app.state.server_load_metrics += 1
|
raw_request.app.state.server_load_metrics += 1
|
||||||
try:
|
try:
|
||||||
response = await func(*args, raw_request=raw_request, **kwargs)
|
response = await func(*args, **kwargs)
|
||||||
except Exception:
|
except Exception:
|
||||||
raw_request.app.state.server_load_metrics -= 1
|
raw_request.app.state.server_load_metrics -= 1
|
||||||
raise
|
raise
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user