# run_benchmark.sh (452 B)

  1. TOTAL_SECONDS=120
  2. QPS_RATES=("1" "3" "5" "7" "9")
  3. for QPS in ${QPS_RATES[@]}; do
  4. NUM_PROMPTS=$((TOTAL_SECONDS * QPS))
  5. echo "===== RUNNING NUM_PROMPTS = $NUM_PROMPTS QPS = $QPS ====="
  6. uv run benchmarks/benchmark_serving.py \
  7. --model $MODEL \
  8. --dataset-name sonnet --sonnet-input-len 550 --sonnet-output-len 150 --dataset-path benchmarks/sonnet.txt \
  9. --num-prompts $NUM_PROMPTS --request-rate $QPS --save-result
  10. done