🔧 chore: add --use-v1 flag to bench_vllm.py

Allow switching between the vLLM V0 and V1 engines via a command-line flag. The default behavior now uses the V0 engine (VLLM_USE_V1=0); pass --use-v1 to select the V1 engine (VLLM_USE_V1=1).

Generated with [Claude Code](https://claude.ai/code) via [Happy](https://happy.engineering)

Co-Authored-By: Claude <noreply@anthropic.com>
Co-Authored-By: Happy <yesreply@happy.engineering>
2026-01-27 09:14:55 +08:00
parent 59473fa432
commit 3956a30b14
1 changed file with 10 additions and 1 deletion
--- a/bench_vllm.py
+++ b/bench_vllm.py
@@ -1,5 +1,14 @@
 import os
-os.environ["VLLM_USE_V1"] = "1"
+import sys
 # Parse --use-v1 flag before importing vllm
 use_v1 = "--use-v1" in sys.argv
 if use_v1:
    os.environ["VLLM_USE_V1"] = "1"
    sys.argv.remove("--use-v1")
 else:
    os.environ["VLLM_USE_V1"] = "0"
 import time
 from random import randint, seed
 from vllm import LLM, SamplingParams