vllm/benchmarks/run_structured_output_benchmark.sh

#!/bin/bash

# Define the model to use
MODEL=${1:-"Qwen/Qwen2.5-7B-Instruct"}

# Define the backend to use
BACKEND=${2:-"vllm"}

# Define the dataset to use
DATASET=${3:-"xgrammar_bench"}

# Define the guided decoding backend
GUIDED_BACKEND=${4:-"xgrammar"}

SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
OUTPUT_DIR=${5:-"$SCRIPT_DIR/structured_output_benchmark_results"}

GUIDED_RATIO=${6:-0.5}

# Create output directory if it doesn't exist
mkdir -p "$OUTPUT_DIR"

# Define QPS values to test
QPS_VALUES=(70 60 50 25 20 15 10)

# Common parameters
COMMON_PARAMS="--backend $BACKEND \
               --model $MODEL \
               --dataset $DATASET \
               --structured-output-backend $GUIDED_BACKEND \
               --structured-output-ratio $GUIDED_RATIO \
               --save-results \
               --result-dir $OUTPUT_DIR"

echo "Starting structured output benchmark with model: $MODEL"
echo "Backend: $BACKEND"
echo "Dataset: $DATASET"
echo "Structured output backend: $GUIDED_BACKEND"
echo "Results will be saved to: $OUTPUT_DIR"
echo "----------------------------------------"

# Run benchmarks with different QPS values
for qps in "${QPS_VALUES[@]}"; do
  echo "Running benchmark with QPS: $qps"

  # Get git hash and branch for the filename
  GIT_HASH=$(git rev-parse --short HEAD 2>/dev/null || echo "unknown")
  GIT_BRANCH=$(git rev-parse --abbrev-ref HEAD 2>/dev/null || echo "unknown")

  # Construct filename for this run
  FILENAME="${GUIDED_BACKEND}_${BACKEND}_${qps}qps_$(basename $MODEL)_${DATASET}_${GIT_HASH}.json"

  # Run the benchmark
  python "$SCRIPT_DIR/benchmark_serving_structured_output.py" $COMMON_PARAMS \
    --request-rate $qps \
    --result-filename "$FILENAME" \
    --tokenizer-mode ${TOKENIZER_MODE:-"auto"} \
    --port ${PORT:-8000}

  echo "Completed benchmark with QPS: $qps"
  echo "----------------------------------------"
done

echo "All benchmarks completed!"
echo "Results saved to: $OUTPUT_DIR"
[V1][Core] Support for Structured Outputs (#12388) Signed-off-by: Aaron Pham <contact@aarnphm.xyz> Signed-off-by: Russell Bryant <rbryant@redhat.com> Co-authored-by: Russell Bryant <rbryant@redhat.com> Co-authored-by: Michael Goin <mgoin64@gmail.com> Co-authored-by: Nick Hill <nhill@redhat.com> 2025-03-07 10:19:11 -05:00			`#!/bin/bash`

			`# Define the model to use`
			`MODEL=${1:-"Qwen/Qwen2.5-7B-Instruct"}`

			`# Define the backend to use`
			`BACKEND=${2:-"vllm"}`

			`# Define the dataset to use`
			`DATASET=${3:-"xgrammar_bench"}`

			`# Define the guided decoding backend`
			`GUIDED_BACKEND=${4:-"xgrammar"}`

			`SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"`
			`OUTPUT_DIR=${5:-"$SCRIPT_DIR/structured_output_benchmark_results"}`

			`GUIDED_RATIO=${6:-0.5}`

			`# Create output directory if it doesn't exist`
			`mkdir -p "$OUTPUT_DIR"`

			`# Define QPS values to test`
			`QPS_VALUES=(70 60 50 25 20 15 10)`

			`# Common parameters`
			`COMMON_PARAMS="--backend $BACKEND \`
			`--model $MODEL \`
			`--dataset $DATASET \`
			`--structured-output-backend $GUIDED_BACKEND \`
			`--structured-output-ratio $GUIDED_RATIO \`
			`--save-results \`
			`--result-dir $OUTPUT_DIR"`

			`echo "Starting structured output benchmark with model: $MODEL"`
			`echo "Backend: $BACKEND"`
			`echo "Dataset: $DATASET"`
			`echo "Structured output backend: $GUIDED_BACKEND"`
			`echo "Results will be saved to: $OUTPUT_DIR"`
			`echo "----------------------------------------"`

			`# Run benchmarks with different QPS values`
			`for qps in "${QPS_VALUES[@]}"; do`
			`echo "Running benchmark with QPS: $qps"`

			`# Get git hash and branch for the filename`
			`GIT_HASH=$(git rev-parse --short HEAD 2>/dev/null \|\| echo "unknown")`
			`GIT_BRANCH=$(git rev-parse --abbrev-ref HEAD 2>/dev/null \|\| echo "unknown")`

			`# Construct filename for this run`
			`FILENAME="${GUIDED_BACKEND}_${BACKEND}_${qps}qps_$(basename $MODEL)_${DATASET}_${GIT_HASH}.json"`

			`# Run the benchmark`
			`python "$SCRIPT_DIR/benchmark_serving_structured_output.py" $COMMON_PARAMS \`
			`--request-rate $qps \`
			`--result-filename "$FILENAME" \`
[Misc][Benchmark] Add support for different `tokenizer_mode` (#15040) Signed-off-by: Aaron Pham <contact@aarnphm.xyz> Signed-off-by: Russell Bryant <rbryant@redhat.com> Co-authored-by: Russell Bryant <rbryant@redhat.com> 2025-03-19 10:56:50 -04:00			`--tokenizer-mode ${TOKENIZER_MODE:-"auto"} \`
[V1][Core] Support for Structured Outputs (#12388) Signed-off-by: Aaron Pham <contact@aarnphm.xyz> Signed-off-by: Russell Bryant <rbryant@redhat.com> Co-authored-by: Russell Bryant <rbryant@redhat.com> Co-authored-by: Michael Goin <mgoin64@gmail.com> Co-authored-by: Nick Hill <nhill@redhat.com> 2025-03-07 10:19:11 -05:00			`--port ${PORT:-8000}`

			`echo "Completed benchmark with QPS: $qps"`
			`echo "----------------------------------------"`
			`done`

			`echo "All benchmarks completed!"`
			`echo "Results saved to: $OUTPUT_DIR"`