diff --git a/benchmarks/disagg_benchmarks/zmq/visualize_benchmark_results_zmq_http.py b/benchmarks/disagg_benchmarks/zmq/visualize_benchmark_results_zmq_http.py index 82a9a6184920e..155a5d5f88986 100644 --- a/benchmarks/disagg_benchmarks/zmq/visualize_benchmark_results_zmq_http.py +++ b/benchmarks/disagg_benchmarks/zmq/visualize_benchmark_results_zmq_http.py @@ -5,7 +5,9 @@ import pandas as pd if __name__ == "__main__": data = [] - for name in ['disagg_prefill_http', 'disagg_prefill_zmq', 'chunked_prefill']: + for name in [ + 'disagg_prefill_http', 'disagg_prefill_zmq', 'chunked_prefill' + ]: for qps in [2, 4, 6, 8, 10, 12]: with open(f"results/{name}-qps-{qps}.json") as f: x = json.load(f) @@ -18,7 +20,6 @@ if __name__ == "__main__": dis_zmq_df = df[df['name'] == 'disagg_prefill_zmq'] chu_df = df[df['name'] == 'chunked_prefill'] - plt.style.use('bmh') plt.rcParams['font.size'] = 20 @@ -51,7 +52,6 @@ if __name__ == "__main__": fig.savefig(f'results/http_zmq_chunk/{key}.png') plt.close(fig) - fig1, ax1 = plt.subplots(figsize=(11, 7)) plt.plot(dis_http_df['qps'], dis_http_df[key], diff --git a/vllm/entrypoints/disagg_connector.py b/vllm/entrypoints/disagg_connector.py index 5dea31f1c67a1..5eaff166cb75a 100644 --- a/vllm/entrypoints/disagg_connector.py +++ b/vllm/entrypoints/disagg_connector.py @@ -212,22 +212,21 @@ async def run_disagg_connector(args, **uvicorn_kwargs) -> None: if __name__ == "__main__": - # NOTE(simon): + # NOTE(simon): # This section should be in sync with vllm/scripts.py for CLI entrypoints. - parser = FlexibleArgumentParser( - description="vLLM disagg zmq server.") + parser = FlexibleArgumentParser(description="vLLM disagg zmq server.") parser.add_argument("--port", - type=int, - default=8000, - help="The fastapi server port") + type=int, + default=8000, + help="The fastapi server port") parser.add_argument("--prefill-addr", - type=str, - required=True, - help="The prefill address IP:PORT") + type=str, + required=True, + help="The prefill address IP:PORT") parser.add_argument("--decode-addr", - type=str, - required=True, - help="The decode address IP:PORT") + type=str, + required=True, + help="The decode address IP:PORT") args = parser.parse_args()