From 689746df88677ff9d6f32eb6f9644f4c15b82d7d Mon Sep 17 00:00:00 2001 From: Brian Ryu Date: Fri, 5 Dec 2025 18:30:10 +0000 Subject: [PATCH] Make cupti the default. Add use_cuda_events as alternative. Deprecate use_cupti --- benchmarks/flashinfer_benchmark.py | 18 +++++++++++++++++- 1 file changed, 17 insertions(+), 1 deletion(-) diff --git a/benchmarks/flashinfer_benchmark.py b/benchmarks/flashinfer_benchmark.py index bd02172eb2..330d734221 100644 --- a/benchmarks/flashinfer_benchmark.py +++ b/benchmarks/flashinfer_benchmark.py @@ -79,7 +79,13 @@ def parse_args(line=sys.argv[1:]): "--use_cupti", action="store_true", default=False, - help="Use CUPTI for timing GPU kernels when available.", + help="[DEPRECATED] Use CUPTI for timing GPU kernels. This is now the default behavior.", + ) + parser.add_argument( + "--use_cuda_events", + action="store_true", + default=False, + help="Use CUDA events for timing GPU kernels instead of CUPTI.", ) parser.add_argument( "--refcheck", @@ -155,6 +161,16 @@ def parse_args(line=sys.argv[1:]): if args.generate_repro_command: args.repro_command = "python3 flashinfer_benchmark.py " + " ".join(line) + + # Deprecation warning for use_cupti + if args.use_cupti: + print( + "[WARNING] --use_cupti is deprecated and will be removed in a future release. CUPTI is now enabled by default." + ) + # use_cupti is deprecated and will be removed in a future release. CUPTI is now enabled by default. + # If --use_cuda_events is passed, disable use_cupti + args.use_cupti = not args.use_cuda_events + return args