update benchmark_serving_structured_output to include auto backend (#16438)
Signed-off-by: Chenyaaang <chenyangli@google.com>
This commit is contained in:
parent
3e397a9484
commit
d544d141ec
@ -11,7 +11,7 @@ On the client side, run:
|
|||||||
--model <your_model> \
|
--model <your_model> \
|
||||||
--dataset json \
|
--dataset json \
|
||||||
--structured-output-ratio 1.0 \
|
--structured-output-ratio 1.0 \
|
||||||
--structured-output-backend xgrammar \
|
--structured-output-backend auto \
|
||||||
--request-rate 10 \
|
--request-rate 10 \
|
||||||
--num-prompts 1000
|
--num-prompts 1000
|
||||||
|
|
||||||
@ -997,11 +997,13 @@ if __name__ == "__main__":
|
|||||||
type=float,
|
type=float,
|
||||||
default=1.0,
|
default=1.0,
|
||||||
help="Ratio of Structured Outputs requests")
|
help="Ratio of Structured Outputs requests")
|
||||||
parser.add_argument(
|
parser.add_argument("--structured-output-backend",
|
||||||
"--structured-output-backend",
|
|
||||||
type=str,
|
type=str,
|
||||||
choices=["outlines", "lm-format-enforcer", "xgrammar", "guidance"],
|
choices=[
|
||||||
default="xgrammar",
|
"outlines", "lm-format-enforcer", "xgrammar",
|
||||||
|
"guidance", "auto"
|
||||||
|
],
|
||||||
|
default="auto",
|
||||||
help="Backend to use for structured outputs")
|
help="Backend to use for structured outputs")
|
||||||
|
|
||||||
args = parser.parse_args()
|
args = parser.parse_args()
|
||||||
|
Loading…
x
Reference in New Issue
Block a user