mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-05-05 11:37:58 +08:00
run format
Signed-off-by: clark <panf2333@gmail.com>
This commit is contained in:
parent
16ed827378
commit
6c8fae82dd
@ -5,7 +5,9 @@ import pandas as pd
|
|||||||
|
|
||||||
if __name__ == "__main__":
|
if __name__ == "__main__":
|
||||||
data = []
|
data = []
|
||||||
for name in ['disagg_prefill_http', 'disagg_prefill_zmq', 'chunked_prefill']:
|
for name in [
|
||||||
|
'disagg_prefill_http', 'disagg_prefill_zmq', 'chunked_prefill'
|
||||||
|
]:
|
||||||
for qps in [2, 4, 6, 8, 10, 12]:
|
for qps in [2, 4, 6, 8, 10, 12]:
|
||||||
with open(f"results/{name}-qps-{qps}.json") as f:
|
with open(f"results/{name}-qps-{qps}.json") as f:
|
||||||
x = json.load(f)
|
x = json.load(f)
|
||||||
@ -18,7 +20,6 @@ if __name__ == "__main__":
|
|||||||
dis_zmq_df = df[df['name'] == 'disagg_prefill_zmq']
|
dis_zmq_df = df[df['name'] == 'disagg_prefill_zmq']
|
||||||
chu_df = df[df['name'] == 'chunked_prefill']
|
chu_df = df[df['name'] == 'chunked_prefill']
|
||||||
|
|
||||||
|
|
||||||
plt.style.use('bmh')
|
plt.style.use('bmh')
|
||||||
plt.rcParams['font.size'] = 20
|
plt.rcParams['font.size'] = 20
|
||||||
|
|
||||||
@ -51,7 +52,6 @@ if __name__ == "__main__":
|
|||||||
fig.savefig(f'results/http_zmq_chunk/{key}.png')
|
fig.savefig(f'results/http_zmq_chunk/{key}.png')
|
||||||
plt.close(fig)
|
plt.close(fig)
|
||||||
|
|
||||||
|
|
||||||
fig1, ax1 = plt.subplots(figsize=(11, 7))
|
fig1, ax1 = plt.subplots(figsize=(11, 7))
|
||||||
plt.plot(dis_http_df['qps'],
|
plt.plot(dis_http_df['qps'],
|
||||||
dis_http_df[key],
|
dis_http_df[key],
|
||||||
|
|||||||
@ -212,22 +212,21 @@ async def run_disagg_connector(args, **uvicorn_kwargs) -> None:
|
|||||||
|
|
||||||
|
|
||||||
if __name__ == "__main__":
|
if __name__ == "__main__":
|
||||||
# NOTE(simon):
|
# NOTE(simon):
|
||||||
# This section should be in sync with vllm/scripts.py for CLI entrypoints.
|
# This section should be in sync with vllm/scripts.py for CLI entrypoints.
|
||||||
parser = FlexibleArgumentParser(
|
parser = FlexibleArgumentParser(description="vLLM disagg zmq server.")
|
||||||
description="vLLM disagg zmq server.")
|
|
||||||
parser.add_argument("--port",
|
parser.add_argument("--port",
|
||||||
type=int,
|
type=int,
|
||||||
default=8000,
|
default=8000,
|
||||||
help="The fastapi server port")
|
help="The fastapi server port")
|
||||||
parser.add_argument("--prefill-addr",
|
parser.add_argument("--prefill-addr",
|
||||||
type=str,
|
type=str,
|
||||||
required=True,
|
required=True,
|
||||||
help="The prefill address IP:PORT")
|
help="The prefill address IP:PORT")
|
||||||
parser.add_argument("--decode-addr",
|
parser.add_argument("--decode-addr",
|
||||||
type=str,
|
type=str,
|
||||||
required=True,
|
required=True,
|
||||||
help="The decode address IP:PORT")
|
help="The decode address IP:PORT")
|
||||||
|
|
||||||
args = parser.parse_args()
|
args = parser.parse_args()
|
||||||
|
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user