Update `benchmark_serving_structured_output` to include the `auto` backend (#16438)

Signed-off-by: Chenyaaang <chenyangli@google.com>
This commit is contained in:
Chenyaaang 2025-04-10 21:25:52 -07:00 committed by GitHub
parent 3e397a9484
commit d544d141ec
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -11,7 +11,7 @@ On the client side, run:
  --model <your_model> \
  --dataset json \
  --structured-output-ratio 1.0 \
- --structured-output-backend xgrammar \
+ --structured-output-backend auto \
  --request-rate 10 \
  --num-prompts 1000
@@ -997,11 +997,13 @@ if __name__ == "__main__":
  type=float,
  default=1.0,
  help="Ratio of Structured Outputs requests")
- parser.add_argument(
- "--structured-output-backend",
+ parser.add_argument("--structured-output-backend",
  type=str,
- choices=["outlines", "lm-format-enforcer", "xgrammar", "guidance"],
- default="xgrammar",
+ choices=[
+ "outlines", "lm-format-enforcer", "xgrammar",
+ "guidance", "auto"
+ ],
+ default="auto",
  help="Backend to use for structured outputs")
  args = parser.parse_args()