diff --git a/benchmarks/benchmark_serving_structured_output.py b/benchmarks/benchmark_serving_structured_output.py index 7ad0791a98681..e52f16a8b1299 100644 --- a/benchmarks/benchmark_serving_structured_output.py +++ b/benchmarks/benchmark_serving_structured_output.py @@ -11,7 +11,7 @@ On the client side, run: --model \ --dataset json \ --structured-output-ratio 1.0 \ - --structured-output-backend xgrammar \ + --structured-output-backend auto \ --request-rate 10 \ --num-prompts 1000 @@ -997,12 +997,14 @@ if __name__ == "__main__": type=float, default=1.0, help="Ratio of Structured Outputs requests") - parser.add_argument( - "--structured-output-backend", - type=str, - choices=["outlines", "lm-format-enforcer", "xgrammar", "guidance"], - default="xgrammar", - help="Backend to use for structured outputs") + parser.add_argument("--structured-output-backend", + type=str, + choices=[ + "outlines", "lm-format-enforcer", "xgrammar", + "guidance", "auto" + ], + default="auto", + help="Backend to use for structured outputs") args = parser.parse_args() main(args)