From 36573815647ac2c89f2612990796fc0c566db214 Mon Sep 17 00:00:00 2001 From: Keren Zhou Date: Mon, 15 Apr 2024 16:27:58 -0400 Subject: [PATCH] [PROTON] Support kernels launched with `cudaLaunchKernelExC` and `cuLaunchKernelEx` on sm>=90 (#3668) e.g., cublas/cutlass gemm kernels like `sm90_xmma_gemm_f16f16_f16f32_f32_tn_n_tilesize128x128x64_warpgroupsize1x1x1_execute_segment_k_off_kernel__5x_cublas` --- third_party/proton/csrc/lib/Profiler/CuptiProfiler.cpp | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/third_party/proton/csrc/lib/Profiler/CuptiProfiler.cpp b/third_party/proton/csrc/lib/Profiler/CuptiProfiler.cpp index bf1a2b2a4236..61c73395d673 100644 --- a/third_party/proton/csrc/lib/Profiler/CuptiProfiler.cpp +++ b/third_party/proton/csrc/lib/Profiler/CuptiProfiler.cpp @@ -177,6 +177,8 @@ std::pair matchKernelCbId(CUpti_CallbackId cbId) { case CUPTI_RUNTIME_TRACE_CBID_cudaLaunchKernel_v7000: case CUPTI_RUNTIME_TRACE_CBID_cudaLaunch_ptsz_v7000: case CUPTI_RUNTIME_TRACE_CBID_cudaLaunchKernel_ptsz_v7000: + case CUPTI_RUNTIME_TRACE_CBID_cudaLaunchKernelExC_v11060: + case CUPTI_RUNTIME_TRACE_CBID_cudaLaunchKernelExC_ptsz_v11060: case CUPTI_RUNTIME_TRACE_CBID_cudaLaunchCooperativeKernel_v9000: case CUPTI_RUNTIME_TRACE_CBID_cudaLaunchCooperativeKernel_ptsz_v9000: case CUPTI_RUNTIME_TRACE_CBID_cudaLaunchCooperativeKernelMultiDevice_v9000: { @@ -188,6 +190,8 @@ std::pair matchKernelCbId(CUpti_CallbackId cbId) { case CUPTI_DRIVER_TRACE_CBID_cuLaunchGridAsync: case CUPTI_DRIVER_TRACE_CBID_cuLaunchKernel: case CUPTI_DRIVER_TRACE_CBID_cuLaunchKernel_ptsz: + case CUPTI_DRIVER_TRACE_CBID_cuLaunchKernelEx: + case CUPTI_DRIVER_TRACE_CBID_cuLaunchKernelEx_ptsz: case CUPTI_DRIVER_TRACE_CBID_cuLaunchCooperativeKernel: case CUPTI_DRIVER_TRACE_CBID_cuLaunchCooperativeKernel_ptsz: case CUPTI_DRIVER_TRACE_CBID_cuLaunchCooperativeKernelMultiDevice: {