update benchmark_serving_structured_output to include auto backend (#16438)

Signed-off-by: Chenyaaang <chenyangli@google.com>
This commit is contained in:
Chenyaaang 2025-04-10 21:25:52 -07:00 committed by GitHub
parent 3e397a9484
commit d544d141ec
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -11,7 +11,7 @@ On the client side, run:
--model <your_model> \ --model <your_model> \
--dataset json \ --dataset json \
--structured-output-ratio 1.0 \ --structured-output-ratio 1.0 \
--structured-output-backend xgrammar \ --structured-output-backend auto \
--request-rate 10 \ --request-rate 10 \
--num-prompts 1000 --num-prompts 1000
@@ -997,12 +997,14 @@ if __name__ == "__main__":
type=float, type=float,
default=1.0, default=1.0,
help="Ratio of Structured Outputs requests") help="Ratio of Structured Outputs requests")
parser.add_argument( parser.add_argument("--structured-output-backend",
"--structured-output-backend", type=str,
type=str, choices=[
choices=["outlines", "lm-format-enforcer", "xgrammar", "guidance"], "outlines", "lm-format-enforcer", "xgrammar",
default="xgrammar", "guidance", "auto"
help="Backend to use for structured outputs") ],
default="auto",
help="Backend to use for structured outputs")
args = parser.parse_args() args = parser.parse_args()
main(args) main(args)