From ed96036690843ccbe3d99fde4d8ddb717c8ddcf9 Mon Sep 17 00:00:00 2001 From: Gregory Shtrasberg Date: Thu, 21 Mar 2024 17:55:28 +0000 Subject: [PATCH] Fix parameter --- benchmarks/benchmark_throughput.py | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/benchmarks/benchmark_throughput.py b/benchmarks/benchmark_throughput.py index 89c7e8dafe0e..5b8d4419245c 100644 --- a/benchmarks/benchmark_throughput.py +++ b/benchmarks/benchmark_throughput.py @@ -9,6 +9,7 @@ from transformers import (AutoModelForCausalLM, AutoTokenizer, PreTrainedTokenizerBase) from tqdm import tqdm +from torch.distributed import launch def sample_requests( @@ -93,7 +94,7 @@ def run_vllm( scales_path=scales_path, device=device, enable_prefix_caching=enable_prefix_caching, - worker_use_torchrun=args.worker_use_torchrun,) + worker_use_torchrun=worker_use_torchrun,) # Add the requests to the engine. for prompt, _, output_len in requests: