diff --git a/vLLM/A100/Throughput_measurement/benchmark_throughput.py b/vLLM/A100/Throughput_measurement/benchmark_throughput.py index b7c364b..0af862d 100644 --- a/vLLM/A100/Throughput_measurement/benchmark_throughput.py +++ b/vLLM/A100/Throughput_measurement/benchmark_throughput.py @@ -33,7 +33,7 @@ def main(args: argparse.Namespace): ray_workers_use_nsight=args.ray_workers_use_nsight, use_v2_block_manager=args.use_v2_block_manager, enable_chunked_prefill=args.enable_chunked_prefill, - download_dir='/lus/grand/projects/datascience/krishnat/model_weights/LLaMA/llama_cache/', + download_dir=args.download_dir, block_size=args.block_size, gpu_memory_utilization=args.gpu_memory_utilization, load_format=args.load_format,