From 56e59a4abac3897195530b86fd1d7a98667a04ca Mon Sep 17 00:00:00 2001 From: Guancheng Fu <110874468+gc-fu@users.noreply.github.com> Date: Mon, 18 Nov 2024 20:33:41 +0800 Subject: [PATCH] Update benchmark_vllm_throughput.py --- docker/llm/serving/xpu/docker/benchmark_vllm_throughput.py | 1 + 1 file changed, 1 insertion(+) diff --git a/docker/llm/serving/xpu/docker/benchmark_vllm_throughput.py b/docker/llm/serving/xpu/docker/benchmark_vllm_throughput.py index 5702db8907b..fe035865752 100644 --- a/docker/llm/serving/xpu/docker/benchmark_vllm_throughput.py +++ b/docker/llm/serving/xpu/docker/benchmark_vllm_throughput.py @@ -388,4 +388,5 @@ def main(args: argparse.Namespace): if args.tokenizer != args.model: raise ValueError("Tokenizer must be the same as the model for MII " "backend.") + main(args)