From 357859fbf14549589c633b5c4e783a3d538e1da5 Mon Sep 17 00:00:00 2001 From: Evgeny Mankov Date: Wed, 16 Oct 2024 23:30:04 +0100 Subject: [PATCH] [HIPIFY][perl][fix] Fix warning reporting for unsupported APIs + [Reason] Only BLAS API were taken into account, even though we already have RAND, SPARSE, and DNN with `ROC` support + As a result, erroneous warnings were emitted by `hipify-perl` for APIs which are actually supported by `-roc` hipification + Updated the regenerated `hipify-perl` script --- bin/hipify-perl | 3100 ++++++++++++++++++++++++++--------------- src/CUDA2HIP_Perl.cpp | 4 +- 2 files changed, 2000 insertions(+), 1104 deletions(-) diff --git a/bin/hipify-perl b/bin/hipify-perl index d1c8f4d5..489c722b 100755 --- a/bin/hipify-perl +++ b/bin/hipify-perl @@ -9110,157 +9110,6 @@ sub warnUnsupportedFunctions { "libraryPropertyType_t", "libraryPropertyType", "gesvdjInfo", - "cusparseZhybsv_solve", - "cusparseZhybsv_analysis", - "cusparseZhyb2dense", - "cusparseZhyb2csc", - "cusparseZgtsv_nopivot", - "cusparseZgtsvStridedBatch", - "cusparseZgtsv", - "cusparseZgebsr2gebsr_bufferSizeExt", - "cusparseZgebsr2gebsc_bufferSizeExt", - "cusparseZdense2hyb", - "cusparseZcsrsv_solve", - "cusparseZcsrsv_analysis", - "cusparseZcsrsm_solve", - "cusparseZcsrsm_analysis", - "cusparseZcsrmv_mp", - "cusparseZcsrilu0", - "cusparseZcsric0", - "cusparseZcsr2gebsr_bufferSizeExt", - "cusparseZcsc2hyb", - "cusparseZbsrsm2_bufferSizeExt", - "cusparseZbsrilu02_bufferSizeExt", - "cusparseZbsric02_bufferSizeExt", - "cusparseXgebsr2csr", - "cusparseSpVecDescr", - "cusparseSpSV_updateMatrix", - "cusparseSpSVUpdate_t", - "cusparseSpSM_updateMatrix", - "cusparseSpSMUpdate_t", - "cusparseSpMatSetNumBatches", - "cusparseSpMatGetNumBatches", - "cusparseSpMatDescr", - "cusparseSpMMOp_destroyPlan", - "cusparseSpMMOp_createPlan", - "cusparseSpMMOpPlan_t", - "cusparseSpMMOpPlan", - "cusparseSpMMOpAlg_t", - "cusparseSpMMOp", - "cusparseSpGEMM_getNumProducts", - "cusparseSpGEMM_estimateMemory", - "cusparseSolveAnalysisInfo_t", - "cusparseSolveAnalysisInfo", - "cusparseSideMode_t", - "cusparseShybsv_solve", - "cusparseShybsv_analysis", - "cusparseShyb2dense", - "cusparseShyb2csc", - "cusparseSgtsv_nopivot", - "cusparseSgtsvStridedBatch", - "cusparseSgtsv", - "cusparseSgebsr2gebsr_bufferSizeExt", - "cusparseSgebsr2gebsc_bufferSizeExt", - "cusparseSdense2hyb", - "cusparseScsrsv_solve", - "cusparseScsrsv_analysis", - "cusparseScsrsm_solve", - "cusparseScsrsm_analysis", - "cusparseScsrmv_mp", - "cusparseScsrilu0", - "cusparseScsric0", - "cusparseScsr2gebsr_bufferSizeExt", - "cusparseScsc2hyb", - "cusparseSbsrsm2_bufferSizeExt", - "cusparseSbsrilu02_bufferSizeExt", - "cusparseSbsric02_bufferSizeExt", - "cusparseMatDescr", - "cusparseLoggerSetMask", - "cusparseLoggerSetLevel", - "cusparseLoggerSetFile", - "cusparseLoggerSetCallback", - "cusparseLoggerOpenFile", - "cusparseLoggerForceDisable", - "cusparseLoggerCallback_t", - "cusparseHybMat", - "cusparseHpruneDense2csr_bufferSizeExt", - "cusparseHpruneDense2csrNnzByPercentage", - "cusparseHpruneDense2csrNnz", - "cusparseHpruneDense2csrByPercentage_bufferSizeExt", - "cusparseHpruneDense2csrByPercentage", - "cusparseHpruneDense2csr", - "cusparseHpruneCsr2csr_bufferSizeExt", - "cusparseHpruneCsr2csrNnzByPercentage", - "cusparseHpruneCsr2csrNnz", - "cusparseHpruneCsr2csrByPercentage_bufferSizeExt", - "cusparseHpruneCsr2csrByPercentage", - "cusparseHpruneCsr2csr", - "cusparseGetLevelInfo", - "cusparseDnVecDescr", - "cusparseDnMatDescr", - "cusparseDhybsv_solve", - "cusparseDhybsv_analysis", - "cusparseDhyb2dense", - "cusparseDhyb2csc", - "cusparseDgtsv_nopivot", - "cusparseDgtsvStridedBatch", - "cusparseDgtsv", - "cusparseDgebsr2gebsr_bufferSizeExt", - "cusparseDgebsr2gebsc_bufferSizeExt", - "cusparseDestroySolveAnalysisInfo", - "cusparseDdense2hyb", - "cusparseDcsrsv_solve", - "cusparseDcsrsv_analysis", - "cusparseDcsrsm_solve", - "cusparseDcsrsm_analysis", - "cusparseDcsrmv_mp", - "cusparseDcsrilu0", - "cusparseDcsric0", - "cusparseDcsr2gebsr_bufferSizeExt", - "cusparseDcsc2hyb", - "cusparseDbsrsm2_bufferSizeExt", - "cusparseDbsrilu02_bufferSizeExt", - "cusparseDbsric02_bufferSizeExt", - "cusparseCsrsv_solveEx", - "cusparseCsrsv_analysisEx", - "cusparseCsrmvEx_bufferSize", - "cusparseCsrmvEx", - "cusparseCsrilu0Ex", - "cusparseCsr2cscEx", - "cusparseCreateSolveAnalysisInfo", - "cusparseCreateSlicedEll", - "cusparseCreateConstSlicedEll", - "cusparseCreateConstBsr", - "cusparseCreateBsr", - "cusparseContext", - "cusparseConstrainedGeMM_bufferSize", - "cusparseConstrainedGeMM", - "cusparseColorInfo", - "cusparseColorAlg_t", - "cusparseChybsv_solve", - "cusparseChybsv_analysis", - "cusparseChyb2dense", - "cusparseChyb2csc", - "cusparseCgtsv_nopivot", - "cusparseCgtsvStridedBatch", - "cusparseCgtsv", - "cusparseCgebsr2gebsr_bufferSizeExt", - "cusparseCgebsr2gebsc_bufferSizeExt", - "cusparseCdense2hyb", - "cusparseCcsrsv_solve", - "cusparseCcsrsv_analysis", - "cusparseCcsrsm_solve", - "cusparseCcsrsm_analysis", - "cusparseCcsrmv_mp", - "cusparseCcsrilu0", - "cusparseCcsric0", - "cusparseCcsr2gebsr_bufferSizeExt", - "cusparseCcsc2hyb", - "cusparseCbsrsm2_bufferSizeExt", - "cusparseCbsrilu02_bufferSizeExt", - "cusparseCbsric02_bufferSizeExt", - "cusparseBsrSetStridedBatch", - "cusparseAlgMode_t", "cusolverStorevMode_t", "cusolverSpZcsrzfdHost", "cusolverSpZcsrqrsvBatched", @@ -9598,25 +9447,6 @@ sub warnUnsupportedFunctions { "cusolverDnCEgels_bufferSize", "cusolverDnCEgels", "cusolverDirectMode_t", - "curand_mtgp32_specific", - "curand_mtgp32_single_specific", - "curand_mtgp32_single", - "curand_Philox4x32_10", - "curandMethod_t", - "curandMethod", - "curandHistogramM2_t", - "curandHistogramM2_st", - "curandHistogramM2V_t", - "curandHistogramM2V_st", - "curandHistogramM2K_t", - "curandHistogramM2K_st", - "curandGetProperty", - "curandDistribution_t", - "curandDistribution_st", - "curandDistributionShift_t", - "curandDistributionShift_st", - "curandDistributionM2Shift_t", - "curandDistributionM2Shift_st", "cufftXtWorkAreaPolicy_t", "cufftXtWorkAreaPolicy", "cufftXtSubFormat_t", @@ -9654,268 +9484,6 @@ sub warnUnsupportedFunctions { "cufftCompatibility", "cufftBox3d_t", "cufftBox3d", - "cudnnWgradMode_t", - "cudnnTransformTensorEx", - "cudnnTransformTensor", - "cudnnTransformFilter", - "cudnnTensorTransformStruct", - "cudnnTensorTransformDescriptor_t", - "cudnnTensorStruct", - "cudnnSpatialTransformerStruct", - "cudnnSpatialTransformerDescriptor_t", - "cudnnSpatialTfSamplerForward", - "cudnnSpatialTfSamplerBackward", - "cudnnSpatialTfGridGeneratorForward", - "cudnnSpatialTfGridGeneratorBackward", - "cudnnSignalMode_t", - "cudnnSeverity_t", - "cudnnSetTensorTransformDescriptor", - "cudnnSetTensorNdDescriptorEx", - "cudnnSetSpatialTransformerNdDescriptor", - "cudnnSetSeqDataDescriptor", - "cudnnSetRNNProjectionLayers", - "cudnnSetRNNPaddingMode", - "cudnnSetRNNMatrixMathType", - "cudnnSetRNNDescriptor_v8", - "cudnnSetRNNDataDescriptor", - "cudnnSetRNNBiasMode", - "cudnnSetRNNAlgorithmDescriptor", - "cudnnSetFusedOpsVariantParamPackAttribute", - "cudnnSetFusedOpsConstParamPackAttribute", - "cudnnSetConvolutionReorderType", - "cudnnSetCallback", - "cudnnSetCTCLossDescriptor_v9", - "cudnnSetCTCLossDescriptor_v8", - "cudnnSetCTCLossDescriptorEx", - "cudnnSetCTCLossDescriptor", - "cudnnSetAttnDescriptor", - "cudnnSetAlgorithmPerformance", - "cudnnSetAlgorithmDescriptor", - "cudnnSetActivationDescriptorSwishBeta", - "cudnnSeqDataStruct", - "cudnnSeqDataDescriptor_t", - "cudnnSeqDataAxis_t", - "cudnnSaveAlgorithm", - "cudnnSamplerType_t", - "cudnnRuntimeTag_t", - "cudnnRngDistribution_t", - "cudnnRestoreDropoutDescriptor", - "cudnnRestoreAlgorithm", - "cudnnResampleMode_t", - "cudnnReorderType_t", - "cudnnReorderFilterAndBias", - "cudnnReduceTensorStruct", - "cudnnRNNStruct", - "cudnnRNNSetClip_v9", - "cudnnRNNSetClip_v8", - "cudnnRNNSetClip", - "cudnnRNNPaddingMode_t", - "cudnnRNNGetClip_v9", - "cudnnRNNGetClip_v8", - "cudnnRNNGetClip", - "cudnnRNNForwardTrainingEx", - "cudnnRNNForwardInferenceEx", - "cudnnRNNForward", - "cudnnRNNDataStruct", - "cudnnRNNDataLayout_t", - "cudnnRNNDataDescriptor_t", - "cudnnRNNClipMode_t", - "cudnnRNNBackwardWeights_v8", - "cudnnRNNBackwardWeightsEx", - "cudnnRNNBackwardData_v8", - "cudnnRNNBackwardDataEx", - "cudnnQueryRuntimeError", - "cudnnPoolingStruct", - "cudnnPointwiseMode_t", - "cudnnPersistentRNNPlan", - "cudnnPaddingMode_t", - "cudnnOpsVersionCheck", - "cudnnOpsTrainVersionCheck", - "cudnnOpsInferVersionCheck", - "cudnnOpTensorStruct", - "cudnnNormalizationForwardTraining", - "cudnnNormalizationForwardInference", - "cudnnNormalizationBackward", - "cudnnNormOps_t", - "cudnnNormMode_t", - "cudnnNormAlgo_t", - "cudnnMultiHeadAttnWeightKind_t", - "cudnnMultiHeadAttnForward", - "cudnnMultiHeadAttnBackwardWeights", - "cudnnMultiHeadAttnBackwardData", - "cudnnMakeFusedOpsPlan", - "cudnnLossNormalizationMode_t", - "cudnnLRNStruct", - "cudnnInitTransformDest", - "cudnnIm2Col", - "cudnnGraphVersionCheck", - "cudnnGetTensorTransformDescriptor", - "cudnnGetTensorSizeInBytes", - "cudnnGetSeqDataDescriptor", - "cudnnGetReductionIndicesSize", - "cudnnGetRNNWeightSpaceSize", - "cudnnGetRNNWeightParams", - "cudnnGetRNNTempSpaceSizes", - "cudnnGetRNNProjectionLayers", - "cudnnGetRNNPaddingMode", - "cudnnGetRNNMatrixMathType", - "cudnnGetRNNForwardTrainingAlgorithmMaxCount", - "cudnnGetRNNForwardInferenceAlgorithmMaxCount", - "cudnnGetRNNDescriptor_v8", - "cudnnGetRNNDescriptor_v6", - "cudnnGetRNNDataDescriptor", - "cudnnGetRNNBiasMode", - "cudnnGetRNNBackwardWeightsAlgorithmMaxCount", - "cudnnGetRNNBackwardDataAlgorithmMaxCount", - "cudnnGetProperty", - "cudnnGetPoolingNdForwardOutputDim", - "cudnnGetPoolingNdDescriptor", - "cudnnGetNormalizationTrainingReserveSpaceSize", - "cudnnGetNormalizationForwardTrainingWorkspaceSize", - "cudnnGetNormalizationBackwardWorkspaceSize", - "cudnnGetMultiHeadAttnWeights", - "cudnnGetMultiHeadAttnBuffers", - "cudnnGetMaxDeviceVersion", - "cudnnGetLastErrorString", - "cudnnGetFusedOpsVariantParamPackAttribute", - "cudnnGetFusedOpsConstParamPackAttribute", - "cudnnGetFoldedConvBackwardDataDescriptors", - "cudnnGetFilterSizeInBytes", - "cudnnGetDropoutDescriptor", - "cudnnGetCudartVersion", - "cudnnGetConvolutionReorderType", - "cudnnGetConvolutionNdForwardOutputDim", - "cudnnGetConvolutionNdDescriptor", - "cudnnGetConvolutionMathType", - "cudnnGetConvolutionGroupCount", - "cudnnGetConvolutionForwardAlgorithm_v7", - "cudnnGetConvolutionForwardAlgorithmMaxCount", - "cudnnGetConvolutionBackwardFilterAlgorithm_v7", - "cudnnGetConvolutionBackwardFilterAlgorithmMaxCount", - "cudnnGetConvolutionBackwardDataAlgorithm_v7", - "cudnnGetConvolutionBackwardDataAlgorithmMaxCount", - "cudnnGetCallback", - "cudnnGetCTCLossWorkspaceSize_v8", - "cudnnGetCTCLossWorkspaceSize", - "cudnnGetCTCLossDescriptor_v9", - "cudnnGetCTCLossDescriptor_v8", - "cudnnGetCTCLossDescriptorEx", - "cudnnGetCTCLossDescriptor", - "cudnnGetBatchNormalizationTrainingExReserveSpaceSize", - "cudnnGetBatchNormalizationForwardTrainingExWorkspaceSize", - "cudnnGetBatchNormalizationBackwardExWorkspaceSize", - "cudnnGetAttnDescriptor", - "cudnnGetAlgorithmSpaceSize", - "cudnnGetAlgorithmPerformance", - "cudnnGetAlgorithmDescriptor", - "cudnnGetActivationDescriptorSwishBeta", - "cudnnGenStatsMode_t", - "cudnnFusedOps_t", - "cudnnFusedOpsVariantParamStruct", - "cudnnFusedOpsVariantParamPack_t", - "cudnnFusedOpsVariantParamLabel_t", - "cudnnFusedOpsPointerPlaceHolder_t", - "cudnnFusedOpsPlan_t", - "cudnnFusedOpsPlanStruct", - "cudnnFusedOpsExecute", - "cudnnFusedOpsConstParamStruct", - "cudnnFusedOpsConstParamPack_t", - "cudnnFusedOpsConstParamLabel_t", - "cudnnFraction_t", - "cudnnFractionStruct", - "cudnnForwardMode_t", - "cudnnFoldingDirection_t", - "cudnnFindRNNForwardTrainingAlgorithmEx", - "cudnnFindRNNForwardInferenceAlgorithmEx", - "cudnnFindRNNBackwardWeightsAlgorithmEx", - "cudnnFindRNNBackwardDataAlgorithmEx", - "cudnnFilterStruct", - "cudnnErrQueryMode_t", - "cudnnDropoutStruct", - "cudnnDropoutGetReserveSpaceSize", - "cudnnDropoutForward", - "cudnnDropoutBackward", - "cudnnDivisiveNormalizationForward", - "cudnnDivisiveNormalizationBackward", - "cudnnDivNormMode_t", - "cudnnDeterminism_t", - "cudnnDestroyTensorTransformDescriptor", - "cudnnDestroySpatialTransformerDescriptor", - "cudnnDestroySeqDataDescriptor", - "cudnnDestroyRNNDataDescriptor", - "cudnnDestroyFusedOpsVariantParamPack", - "cudnnDestroyFusedOpsPlan", - "cudnnDestroyFusedOpsConstParamPack", - "cudnnDestroyCTCLossDescriptor", - "cudnnDestroyAttnDescriptor", - "cudnnDestroyAlgorithmPerformance", - "cudnnDestroyAlgorithmDescriptor", - "cudnnDeriveNormTensorDescriptor", - "cudnnDebug_t", - "cudnnDebugStruct", - "cudnnCreateTensorTransformDescriptor", - "cudnnCreateSpatialTransformerDescriptor", - "cudnnCreateSeqDataDescriptor", - "cudnnCreateRNNDataDescriptor", - "cudnnCreateFusedOpsVariantParamPack", - "cudnnCreateFusedOpsPlan", - "cudnnCreateFusedOpsConstParamPack", - "cudnnCreateCTCLossDescriptor", - "cudnnCreateAttnDescriptor", - "cudnnCreateAlgorithmPerformance", - "cudnnCreateAlgorithmDescriptor", - "cudnnCopyAlgorithmDescriptor", - "cudnnConvolutionStruct", - "cudnnConvolutionBiasActivationForward", - "cudnnContext", - "cudnnCnnTrainVersionCheck", - "cudnnCnnInferVersionCheck", - "cudnnCallback_t", - "cudnnCTCLoss_v8", - "cudnnCTCLossStruct", - "cudnnCTCLossDescriptor_t", - "cudnnCTCLossAlgo_t", - "cudnnCTCLoss", - "cudnnCTCGradMode_t", - "cudnnBuildRNNDynamic", - "cudnnBnFinalizeStatsMode_t", - "cudnnBatchNormalizationForwardTrainingEx", - "cudnnBatchNormalizationBackwardEx", - "cudnnBatchNormOps_t", - "cudnnBackendUpdateCudaGraph", - "cudnnBackendTensorReordering_t", - "cudnnBackendSetAttribute", - "cudnnBackendPopulateCudaGraph", - "cudnnBackendNumericalNote_t", - "cudnnBackendNormMode_t", - "cudnnBackendNormFwdPhase_t", - "cudnnBackendLayoutType_t", - "cudnnBackendKnobType_t", - "cudnnBackendInitialize", - "cudnnBackendHeurMode_t", - "cudnnBackendGetAttribute", - "cudnnBackendFinalize", - "cudnnBackendExecute", - "cudnnBackendDestroyDescriptor", - "cudnnBackendDescriptor_t", - "cudnnBackendDescriptorType_t", - "cudnnBackendCreateDescriptor", - "cudnnBackendBehaviorNote_t", - "cudnnBackendAttributeType_t", - "cudnnBackendAttributeName_t", - "cudnnAttnStruct", - "cudnnAttnQueryMap_t", - "cudnnAttnDescriptor_t", - "cudnnAlgorithm_t", - "cudnnAlgorithmUnionStruct", - "cudnnAlgorithmStruct", - "cudnnAlgorithmPerformance_t", - "cudnnAlgorithmPerformanceStruct", - "cudnnAlgorithmDescriptor_t", - "cudnnAdvVersionCheck", - "cudnnAdvTrainVersionCheck", - "cudnnAdvInferVersionCheck", - "cudnnActivationStruct", "cudaWGLGetDevice", "cudaVDPAUSetVDPAUDevice", "cudaVDPAUGetDevice", @@ -10630,8 +10198,6 @@ sub warnUnsupportedFunctions { "cuArrayGetSparseProperties", "cuArrayGetPlane", "cuArrayGetMemoryRequirements", - "csrsv2Info", - "csrsm2Info", "csrqrInfo_t", "csrqrInfoHost_t", "csrqrInfoHost", @@ -10660,7 +10226,6 @@ sub warnUnsupportedFunctions { "__nv_bfloat16_raw", "__nv_bfloat162_raw", "__nv_bfloat162", - "__curand_umul", "__NV_SATFINITE", "__NV_NOSAT", "__NV_E5M2", @@ -11287,28 +10852,6 @@ sub warnUnsupportedFunctions { "CU_AD_FORMAT_BC1_UNORM_SRGB", "CU_AD_FORMAT_BC1_UNORM", "CU_AD_FORMAT_AYUV", - "CUSPARSE_SPSV_UPDATE_GENERAL", - "CUSPARSE_SPSV_UPDATE_DIAGONAL", - "CUSPARSE_SPSM_UPDATE_GENERAL", - "CUSPARSE_SPSM_UPDATE_DIAGONAL", - "CUSPARSE_SPMV_SELL_ALG1", - "CUSPARSE_SPMM_OP_ALG_DEFAULT", - "CUSPARSE_SPMM_BSR_ALG1", - "CUSPARSE_SPMMA_PREPROCESS", - "CUSPARSE_SPMMA_ALG4", - "CUSPARSE_SPMMA_ALG3", - "CUSPARSE_SPMMA_ALG2", - "CUSPARSE_SPMMA_ALG1", - "CUSPARSE_SIDE_RIGHT", - "CUSPARSE_SIDE_LEFT", - "CUSPARSE_FORMAT_SLICED_ELLPACK", - "CUSPARSE_FORMAT_BSR", - "CUSPARSE_COLOR_ALG1", - "CUSPARSE_COLOR_ALG0", - "CUSPARSE_ALG_NAIVE", - "CUSPARSE_ALG_MERGE_PATH", - "CUSPARSE_ALG1", - "CUSPARSE_ALG0", "CUSOLVER_STATUS_IRS_PARAMS_NOT_INITIALIZED", "CUSOLVER_STATUS_IRS_PARAMS_INVALID_REFINE", "CUSOLVER_STATUS_IRS_PARAMS_INVALID_PREC", @@ -11352,20 +10895,6 @@ sub warnUnsupportedFunctions { "CUSOLVER_C_16BF", "CUSOLVER_ALG_2", "CUSOLVERDN_POTRF", - "CURAND_REJECTION", - "CURAND_POISSON", - "CURAND_M2", - "CURAND_M1", - "CURAND_KNUTH", - "CURAND_ITR", - "CURAND_HITR", - "CURAND_FAST_REJECTION", - "CURAND_DISCRETE_GAUSS", - "CURAND_DEVICE_API", - "CURAND_DEFINITION", - "CURAND_CHOOSE_BEST", - "CURAND_BINARY_SEARCH", - "CURAND_3RD", "CUGLmap_flags_enum", "CUGLmap_flags", "CUFFT_XT_FORMAT_OUTPUT", @@ -11388,637 +10917,6 @@ sub warnUnsupportedFunctions { "CUFFT_COPY_DEVICE_TO_DEVICE", "CUFFT_COMPATIBILITY_FFTW_PADDING", "CUFFT_COMPATIBILITY_DEFAULT", - "CUDNN_ZERO_PAD", - "CUDNN_WGRAD_MODE_SET", - "CUDNN_WGRAD_MODE_ADD", - "CUDNN_TYPE_VOID_PTR", - "CUDNN_TYPE_TENSOR_REORDERING_MODE", - "CUDNN_TYPE_SIGNAL_MODE", - "CUDNN_TYPE_RNG_DISTRIBUTION", - "CUDNN_TYPE_RESAMPLE_MODE", - "CUDNN_TYPE_REDUCTION_OPERATOR_TYPE", - "CUDNN_TYPE_POINTWISE_MODE", - "CUDNN_TYPE_PADDING_MODE", - "CUDNN_TYPE_NUMERICAL_NOTE", - "CUDNN_TYPE_NORM_MODE", - "CUDNN_TYPE_NORM_FWD_PHASE", - "CUDNN_TYPE_NAN_PROPOGATION", - "CUDNN_TYPE_LAYOUT_TYPE", - "CUDNN_TYPE_KNOB_TYPE", - "CUDNN_TYPE_INT64", - "CUDNN_TYPE_INT32", - "CUDNN_TYPE_HEUR_MODE", - "CUDNN_TYPE_HANDLE", - "CUDNN_TYPE_GENSTATS_MODE", - "CUDNN_TYPE_FRACTION", - "CUDNN_TYPE_FLOAT", - "CUDNN_TYPE_DOUBLE", - "CUDNN_TYPE_DATA_TYPE", - "CUDNN_TYPE_CONVOLUTION_MODE", - "CUDNN_TYPE_CHAR", - "CUDNN_TYPE_BOOLEAN", - "CUDNN_TYPE_BN_FINALIZE_STATS_MODE", - "CUDNN_TYPE_BEHAVIOR_NOTE", - "CUDNN_TYPE_BACKEND_DESCRIPTOR", - "CUDNN_TYPE_ATTRIB_NAME", - "CUDNN_TRANSFORM_UNFOLD", - "CUDNN_TRANSFORM_FOLD", - "CUDNN_TENSOR_REORDERING_NONE", - "CUDNN_TENSOR_REORDERING_INT8x32", - "CUDNN_TENSOR_REORDERING_F16x16", - "CUDNN_TENSOR_OP_MATH_ALLOW_CONVERSION", - "CUDNN_STATUS_VERSION_MISMATCH", - "CUDNN_STATUS_SUBLIBRARY_VERSION_MISMATCH", - "CUDNN_STATUS_SUBLIBRARY_LOADING_FAILED", - "CUDNN_STATUS_SPECIFIC_ERROR", - "CUDNN_STATUS_SERIALIZATION_VERSION_MISMATCH", - "CUDNN_STATUS_RUNTIME_IN_PROGRESS", - "CUDNN_STATUS_RUNTIME_FP_OVERFLOW", - "CUDNN_STATUS_NOT_SUPPORTED_SUBLIBRARY_UNAVAILABLE", - "CUDNN_STATUS_NOT_SUPPORTED_SHARED_MEMORY_INSUFFICIENT", - "CUDNN_STATUS_NOT_SUPPORTED_SHAPE", - "CUDNN_STATUS_NOT_SUPPORTED_RUNTIME_PREREQUISITE_MISSING", - "CUDNN_STATUS_NOT_SUPPORTED_PADDING", - "CUDNN_STATUS_NOT_SUPPORTED_LAYOUT", - "CUDNN_STATUS_NOT_SUPPORTED_INCOMPATIBLE_CUDA_DRIVER", - "CUDNN_STATUS_NOT_SUPPORTED_INCOMPATIBLE_CUDART", - "CUDNN_STATUS_NOT_SUPPORTED_GRAPH_PATTERN", - "CUDNN_STATUS_NOT_SUPPORTED_DATA_TYPE", - "CUDNN_STATUS_NOT_SUPPORTED_CUDA_GRAPH_NATIVE_API", - "CUDNN_STATUS_NOT_SUPPORTED_BAD_LAUNCH_PARAM", - "CUDNN_STATUS_NOT_SUPPORTED_ARCH_MISMATCH", - "CUDNN_STATUS_INTERNAL_ERROR_UNEXPECTED_VALUE", - "CUDNN_STATUS_INTERNAL_ERROR_TEXTURE_CREATION_FAILED", - "CUDNN_STATUS_INTERNAL_ERROR_HOST_ALLOCATION_FAILED", - "CUDNN_STATUS_INTERNAL_ERROR_DEVICE_ALLOCATION_FAILED", - "CUDNN_STATUS_INTERNAL_ERROR_COMPILATION_FAILED", - "CUDNN_STATUS_INTERNAL_ERROR_BAD_LAUNCH_PARAM", - "CUDNN_STATUS_FULL_ERROR_CODE", - "CUDNN_STATUS_EXECUTION_FAILED_CURAND", - "CUDNN_STATUS_EXECUTION_FAILED_CUDA_DRIVER", - "CUDNN_STATUS_EXECUTION_FAILED_CUDART", - "CUDNN_STATUS_EXECUTION_FAILED_CUBLAS", - "CUDNN_STATUS_DEPRECATED", - "CUDNN_STATUS_CATEGORY", - "CUDNN_STATUS_BAD_PARAM_STREAM_MISMATCH", - "CUDNN_STATUS_BAD_PARAM_SIZE_INSUFFICIENT", - "CUDNN_STATUS_BAD_PARAM_SHAPE_MISMATCH", - "CUDNN_STATUS_BAD_PARAM_OUT_OF_BOUND", - "CUDNN_STATUS_BAD_PARAM_NULL_POINTER", - "CUDNN_STATUS_BAD_PARAM_NOT_FINALIZED", - "CUDNN_STATUS_BAD_PARAM_MISALIGNED_POINTER", - "CUDNN_STATUS_BAD_PARAM_DUPLICATED_ENTRIES", - "CUDNN_STATUS_BAD_PARAM_CUDA_GRAPH_MISMATCH", - "CUDNN_STATUS_BAD_PARAM_ATTRIBUTE_TYPE", - "CUDNN_SIGNAL_WAIT", - "CUDNN_SIGNAL_SET", - "CUDNN_SEV_WARNING_EN", - "CUDNN_SEV_WARNING", - "CUDNN_SEV_INFO_EN", - "CUDNN_SEV_INFO", - "CUDNN_SEV_FATAL", - "CUDNN_SEV_ERROR_EN", - "CUDNN_SEV_ERROR", - "CUDNN_SEQDATA_VECT_DIM", - "CUDNN_SEQDATA_TIME_DIM", - "CUDNN_SEQDATA_DIM_COUNT", - "CUDNN_SEQDATA_BEAM_DIM", - "CUDNN_SEQDATA_BATCH_DIM", - "CUDNN_SCALAR_SIZE_T_WORKSPACE_SIZE_IN_BYTES", - "CUDNN_SCALAR_INT64_T_BN_ACCUMULATION_COUNT", - "CUDNN_SCALAR_DOUBLE_BN_EXP_AVG_FACTOR", - "CUDNN_SCALAR_DOUBLE_BN_EPSILON", - "CUDNN_SAMPLER_BILINEAR", - "CUDNN_RNN_PADDED_IO_ENABLED", - "CUDNN_RNN_PADDED_IO_DISABLED", - "CUDNN_RNN_DATA_LAYOUT_SEQ_MAJOR_UNPACKED", - "CUDNN_RNN_DATA_LAYOUT_SEQ_MAJOR_PACKED", - "CUDNN_RNN_DATA_LAYOUT_BATCH_MAJOR_UNPACKED", - "CUDNN_RNN_CLIP_NONE", - "CUDNN_RNN_CLIP_MINMAX", - "CUDNN_RNN_ALGO_COUNT", - "CUDNN_RNG_DISTRIBUTION_UNIFORM", - "CUDNN_RNG_DISTRIBUTION_NORMAL", - "CUDNN_RNG_DISTRIBUTION_BERNOULLI", - "CUDNN_RMS_NORM", - "CUDNN_RESAMPLE_NEAREST", - "CUDNN_RESAMPLE_MAXPOOL", - "CUDNN_RESAMPLE_BILINEAR", - "CUDNN_RESAMPLE_AVGPOOL_INCLUDE_PADDING", - "CUDNN_RESAMPLE_AVGPOOL_EXCLUDE_PADDING", - "CUDNN_RESAMPLE_AVGPOOL", - "CUDNN_PTR_ZDATA", - "CUDNN_PTR_YSUM", - "CUDNN_PTR_YSQSUM", - "CUDNN_PTR_YDATA", - "CUDNN_PTR_XDATA", - "CUDNN_PTR_WORKSPACE", - "CUDNN_PTR_WDATA", - "CUDNN_PTR_NULL", - "CUDNN_PTR_ELEM_ALIGNED", - "CUDNN_PTR_DZDATA", - "CUDNN_PTR_DYDATA", - "CUDNN_PTR_DXDATA", - "CUDNN_PTR_DWDATA", - "CUDNN_PTR_BN_Z_EQSCALE", - "CUDNN_PTR_BN_Z_EQBIAS", - "CUDNN_PTR_BN_SCALE", - "CUDNN_PTR_BN_SAVED_MEAN", - "CUDNN_PTR_BN_SAVED_INVSTD", - "CUDNN_PTR_BN_RUNNING_VAR", - "CUDNN_PTR_BN_RUNNING_MEAN", - "CUDNN_PTR_BN_EQSCALE", - "CUDNN_PTR_BN_EQBIAS", - "CUDNN_PTR_BN_DSCALE", - "CUDNN_PTR_BN_DBIAS", - "CUDNN_PTR_BN_BIAS", - "CUDNN_PTR_ACTIVATION_BITMASK", - "CUDNN_PTR_16B_ALIGNED", - "CUDNN_POINTWISE_TANH_FWD", - "CUDNN_POINTWISE_TANH_BWD", - "CUDNN_POINTWISE_TAN", - "CUDNN_POINTWISE_SWISH_FWD", - "CUDNN_POINTWISE_SWISH_BWD", - "CUDNN_POINTWISE_SUB", - "CUDNN_POINTWISE_SQRT", - "CUDNN_POINTWISE_SOFTPLUS_FWD", - "CUDNN_POINTWISE_SOFTPLUS_BWD", - "CUDNN_POINTWISE_SIN", - "CUDNN_POINTWISE_SIGMOID_FWD", - "CUDNN_POINTWISE_SIGMOID_BWD", - "CUDNN_POINTWISE_RSQRT", - "CUDNN_POINTWISE_RELU_FWD", - "CUDNN_POINTWISE_RELU_BWD", - "CUDNN_POINTWISE_RECIPROCAL", - "CUDNN_POINTWISE_POW", - "CUDNN_POINTWISE_NEG", - "CUDNN_POINTWISE_MUL", - "CUDNN_POINTWISE_MOD", - "CUDNN_POINTWISE_MIN", - "CUDNN_POINTWISE_MAX", - "CUDNN_POINTWISE_LOGICAL_OR", - "CUDNN_POINTWISE_LOGICAL_NOT", - "CUDNN_POINTWISE_LOGICAL_AND", - "CUDNN_POINTWISE_LOG", - "CUDNN_POINTWISE_IDENTITY", - "CUDNN_POINTWISE_GEN_INDEX", - "CUDNN_POINTWISE_GELU_FWD", - "CUDNN_POINTWISE_GELU_BWD", - "CUDNN_POINTWISE_GELU_APPROX_TANH_FWD", - "CUDNN_POINTWISE_GELU_APPROX_TANH_BWD", - "CUDNN_POINTWISE_FLOOR", - "CUDNN_POINTWISE_EXP", - "CUDNN_POINTWISE_ERF", - "CUDNN_POINTWISE_ELU_FWD", - "CUDNN_POINTWISE_ELU_BWD", - "CUDNN_POINTWISE_DIV", - "CUDNN_POINTWISE_COS", - "CUDNN_POINTWISE_CMP_NEQ", - "CUDNN_POINTWISE_CMP_LT", - "CUDNN_POINTWISE_CMP_LE", - "CUDNN_POINTWISE_CMP_GT", - "CUDNN_POINTWISE_CMP_GE", - "CUDNN_POINTWISE_CMP_EQ", - "CUDNN_POINTWISE_CEIL", - "CUDNN_POINTWISE_BINARY_SELECT", - "CUDNN_POINTWISE_ATAN2", - "CUDNN_POINTWISE_ADD_SQUARE", - "CUDNN_POINTWISE_ADD", - "CUDNN_POINTWISE_ABS", - "CUDNN_PARAM_ZDESC", - "CUDNN_PARAM_ZDATA_PLACEHOLDER", - "CUDNN_PARAM_YSUM_PLACEHOLDER", - "CUDNN_PARAM_YSTATS_DESC", - "CUDNN_PARAM_YSQSUM_PLACEHOLDER", - "CUDNN_PARAM_YDESC", - "CUDNN_PARAM_YDATA_PLACEHOLDER", - "CUDNN_PARAM_XDESC", - "CUDNN_PARAM_XDATA_PLACEHOLDER", - "CUDNN_PARAM_WDESC", - "CUDNN_PARAM_WDATA_PLACEHOLDER", - "CUDNN_PARAM_DZDESC", - "CUDNN_PARAM_DZDATA_PLACEHOLDER", - "CUDNN_PARAM_DYDESC", - "CUDNN_PARAM_DYDATA_PLACEHOLDER", - "CUDNN_PARAM_DXDESC", - "CUDNN_PARAM_DXDATA_PLACEHOLDER", - "CUDNN_PARAM_DWDESC", - "CUDNN_PARAM_DWDATA_PLACEHOLDER", - "CUDNN_PARAM_CONV_DESC", - "CUDNN_PARAM_BN_Z_EQSCALE_PLACEHOLDER", - "CUDNN_PARAM_BN_Z_EQSCALEBIAS_DESC", - "CUDNN_PARAM_BN_Z_EQBIAS_PLACEHOLDER", - "CUDNN_PARAM_BN_SCALE_PLACEHOLDER", - "CUDNN_PARAM_BN_SCALEBIAS_MEANVAR_DESC", - "CUDNN_PARAM_BN_SAVED_MEAN_PLACEHOLDER", - "CUDNN_PARAM_BN_SAVED_INVSTD_PLACEHOLDER", - "CUDNN_PARAM_BN_RUNNING_VAR_PLACEHOLDER", - "CUDNN_PARAM_BN_RUNNING_MEAN_PLACEHOLDER", - "CUDNN_PARAM_BN_MODE", - "CUDNN_PARAM_BN_EQSCALE_PLACEHOLDER", - "CUDNN_PARAM_BN_EQSCALEBIAS_DESC", - "CUDNN_PARAM_BN_EQBIAS_PLACEHOLDER", - "CUDNN_PARAM_BN_DSCALE_PLACEHOLDER", - "CUDNN_PARAM_BN_DBIAS_PLACEHOLDER", - "CUDNN_PARAM_BN_BIAS_PLACEHOLDER", - "CUDNN_PARAM_ACTIVATION_DESC", - "CUDNN_PARAM_ACTIVATION_BITMASK_PLACEHOLDER", - "CUDNN_PARAM_ACTIVATION_BITMASK_DESC", - "CUDNN_OP_TENSOR_NOT", - "CUDNN_NUMERICAL_NOTE_WINOGRAD_TILE_6x6", - "CUDNN_NUMERICAL_NOTE_WINOGRAD_TILE_4x4", - "CUDNN_NUMERICAL_NOTE_WINOGRAD_TILE_13x13", - "CUDNN_NUMERICAL_NOTE_WINOGRAD", - "CUDNN_NUMERICAL_NOTE_TYPE_COUNT", - "CUDNN_NUMERICAL_NOTE_TENSOR_CORE", - "CUDNN_NUMERICAL_NOTE_STRICT_NAN_PROP", - "CUDNN_NUMERICAL_NOTE_REDUCED_PRECISION_REDUCTION", - "CUDNN_NUMERICAL_NOTE_NONDETERMINISTIC", - "CUDNN_NUMERICAL_NOTE_FFT", - "CUDNN_NUMERICAL_NOTE_DOWN_CONVERT_INPUTS", - "CUDNN_NO_REORDER", - "CUDNN_NORM_PER_CHANNEL", - "CUDNN_NORM_PER_ACTIVATION", - "CUDNN_NORM_OPS_NORM_ADD_ACTIVATION", - "CUDNN_NORM_OPS_NORM_ACTIVATION", - "CUDNN_NORM_OPS_NORM", - "CUDNN_NORM_FWD_TRAINING", - "CUDNN_NORM_FWD_INFERENCE", - "CUDNN_NORM_ALGO_STANDARD", - "CUDNN_NORM_ALGO_PERSIST", - "CUDNN_NON_DETERMINISTIC", - "CUDNN_NEG_INF_PAD", - "CUDNN_MH_ATTN_V_WEIGHTS", - "CUDNN_MH_ATTN_V_BIASES", - "CUDNN_MH_ATTN_Q_WEIGHTS", - "CUDNN_MH_ATTN_Q_BIASES", - "CUDNN_MH_ATTN_O_WEIGHTS", - "CUDNN_MH_ATTN_O_BIASES", - "CUDNN_MH_ATTN_K_WEIGHTS", - "CUDNN_MH_ATTN_K_BIASES", - "CUDNN_LRN_MIN_N", - "CUDNN_LRN_MIN_K", - "CUDNN_LRN_MIN_BETA", - "CUDNN_LRN_MAX_N", - "CUDNN_LOSS_NORMALIZATION_SOFTMAX", - "CUDNN_LOSS_NORMALIZATION_NONE", - "CUDNN_LAYOUT_TYPE_PREFERRED_PAD8CK", - "CUDNN_LAYOUT_TYPE_PREFERRED_PAD4CK", - "CUDNN_LAYOUT_TYPE_PREFERRED_NHWC", - "CUDNN_LAYOUT_TYPE_PREFERRED_NCHW", - "CUDNN_LAYOUT_TYPE_COUNT", - "CUDNN_LAYER_NORM", - "CUDNN_KNOB_TYPE_WORKSPACE", - "CUDNN_KNOB_TYPE_WINO_TILE", - "CUDNN_KNOB_TYPE_USE_TEX", - "CUDNN_KNOB_TYPE_TILE_SIZE", - "CUDNN_KNOB_TYPE_TILE_ROWS", - "CUDNN_KNOB_TYPE_TILE_COLS", - "CUDNN_KNOB_TYPE_TILE_CGA_N", - "CUDNN_KNOB_TYPE_TILE_CGA_M", - "CUDNN_KNOB_TYPE_TILE_CGA", - "CUDNN_KNOB_TYPE_TILEK", - "CUDNN_KNOB_TYPE_SWIZZLE", - "CUDNN_KNOB_TYPE_STAGES", - "CUDNN_KNOB_TYPE_SPLIT_RS", - "CUDNN_KNOB_TYPE_SPLIT_K_SLC", - "CUDNN_KNOB_TYPE_SPLIT_K_BUF", - "CUDNN_KNOB_TYPE_SPLIT_K", - "CUDNN_KNOB_TYPE_SPLIT_H", - "CUDNN_KNOB_TYPE_SPLIT_COLS", - "CUDNN_KNOB_TYPE_SPECFILT", - "CUDNN_KNOB_TYPE_SLICED", - "CUDNN_KNOB_TYPE_SINGLEBUFFER", - "CUDNN_KNOB_TYPE_REDUCTION_MODE", - "CUDNN_KNOB_TYPE_OCCUPANCY", - "CUDNN_KNOB_TYPE_NUM_C_PER_BLOCK", - "CUDNN_KNOB_TYPE_MULTIPLY", - "CUDNN_KNOB_TYPE_LOAD_SIZE", - "CUDNN_KNOB_TYPE_LDGC", - "CUDNN_KNOB_TYPE_LDGB", - "CUDNN_KNOB_TYPE_LDGA", - "CUDNN_KNOB_TYPE_KERNEL_CFG", - "CUDNN_KNOB_TYPE_KBLOCK", - "CUDNN_KNOB_TYPE_IDX_MODE", - "CUDNN_KNOB_TYPE_EDGE", - "CUDNN_KNOB_TYPE_CTA_SPLIT_K_MODE", - "CUDNN_KNOB_TYPE_COUNTS", - "CUDNN_KNOB_TYPE_CHUNK_K", - "CUDNN_KNOB_TYPE_BLOCK_SIZE", - "CUDNN_KNOB_TYPE_ARRAY_SIZE_PER_THREAD", - "CUDNN_INSTANCE_NORM", - "CUDNN_HEUR_MODE_INSTANT", - "CUDNN_HEUR_MODE_FALLBACK", - "CUDNN_HEUR_MODE_B", - "CUDNN_HEUR_MODE_A", - "CUDNN_HEUR_MODES_COUNT", - "CUDNN_GROUP_NORM", - "CUDNN_GENSTATS_SUM_SQSUM", - "CUDNN_FWD_MODE_TRAINING", - "CUDNN_FWD_MODE_INFERENCE", - "CUDNN_FUSED_SCALE_BIAS_ADD_ACTIVATION_GEN_BITMASK", - "CUDNN_FUSED_SCALE_BIAS_ACTIVATION_WGRAD", - "CUDNN_FUSED_SCALE_BIAS_ACTIVATION_CONV_BNSTATS", - "CUDNN_FUSED_DACTIVATION_FORK_DBATCHNORM", - "CUDNN_FUSED_CONV_SCALE_BIAS_ADD_ACTIVATION", - "CUDNN_FUSED_BN_FINALIZE_STATISTICS_TRAINING", - "CUDNN_FUSED_BN_FINALIZE_STATISTICS_INFERENCE", - "CUDNN_FMA_MATH", - "CUDNN_ERRQUERY_RAWCODE", - "CUDNN_ERRQUERY_NONBLOCKING", - "CUDNN_ERRQUERY_BLOCKING", - "CUDNN_EDGE_VAL_PAD", - "CUDNN_DIVNORM_PRECOMPUTED_MEANS", - "CUDNN_DIM_MAX", - "CUDNN_DETERMINISTIC", - "CUDNN_DEFAULT_REORDER", - "CUDNN_DATA_UINT8x4", - "CUDNN_DATA_UINT8", - "CUDNN_DATA_INT8x32", - "CUDNN_DATA_INT64", - "CUDNN_DATA_FP8_E5M2", - "CUDNN_DATA_FP8_E4M3", - "CUDNN_DATA_FAST_FLOAT_FOR_FP8", - "CUDNN_DATA_BOOLEAN", - "CUDNN_DATA_BFLOAT16", - "CUDNN_CTC_ZERO_OOB_GRADIENTS", - "CUDNN_CTC_SKIP_OOB_GRADIENTS", - "CUDNN_CTC_LOSS_ALGO_NON_DETERMINISTIC", - "CUDNN_CTC_LOSS_ALGO_DETERMINISTIC", - "CUDNN_BN_FINALIZE_STATISTICS_TRAINING", - "CUDNN_BN_FINALIZE_STATISTICS_INFERENCE", - "CUDNN_BEHAVIOR_NOTE_TYPE_COUNT", - "CUDNN_BEHAVIOR_NOTE_SUPPORTS_CUDA_GRAPH_NATIVE_API", - "CUDNN_BEHAVIOR_NOTE_RUNTIME_COMPILATION", - "CUDNN_BEHAVIOR_NOTE_REQUIRES_FILTER_INT8x32_REORDER", - "CUDNN_BEHAVIOR_NOTE_REQUIRES_BIAS_INT8x32_REORDER", - "CUDNN_BATCH_NORM", - "CUDNN_BATCHNORM_OPS_BN_ADD_ACTIVATION", - "CUDNN_BATCHNORM_OPS_BN_ACTIVATION", - "CUDNN_BATCHNORM_OPS_BN", - "CUDNN_BACKEND_VARIANT_PACK_DESCRIPTOR", - "CUDNN_BACKEND_TENSOR_DESCRIPTOR", - "CUDNN_BACKEND_RNG_DESCRIPTOR", - "CUDNN_BACKEND_RESAMPLE_DESCRIPTOR", - "CUDNN_BACKEND_REDUCTION_DESCRIPTOR", - "CUDNN_BACKEND_POINTWISE_DESCRIPTOR", - "CUDNN_BACKEND_OPERATION_SIGNAL_DESCRIPTOR", - "CUDNN_BACKEND_OPERATION_RNG_DESCRIPTOR", - "CUDNN_BACKEND_OPERATION_RESHAPE_DESCRIPTOR", - "CUDNN_BACKEND_OPERATION_RESAMPLE_FWD_DESCRIPTOR", - "CUDNN_BACKEND_OPERATION_RESAMPLE_BWD_DESCRIPTOR", - "CUDNN_BACKEND_OPERATION_REDUCTION_DESCRIPTOR", - "CUDNN_BACKEND_OPERATION_POINTWISE_DESCRIPTOR", - "CUDNN_BACKEND_OPERATION_PAGED_CACHE_LOAD_DESCRIPTOR", - "CUDNN_BACKEND_OPERATION_NORM_FORWARD_DESCRIPTOR", - "CUDNN_BACKEND_OPERATION_NORM_BACKWARD_DESCRIPTOR", - "CUDNN_BACKEND_OPERATION_MATMUL_DESCRIPTOR", - "CUDNN_BACKEND_OPERATION_GEN_STATS_DESCRIPTOR", - "CUDNN_BACKEND_OPERATION_CONVOLUTION_FORWARD_DESCRIPTOR", - "CUDNN_BACKEND_OPERATION_CONVOLUTION_BACKWARD_FILTER_DESCRIPTOR", - "CUDNN_BACKEND_OPERATION_CONVOLUTION_BACKWARD_DATA_DESCRIPTOR", - "CUDNN_BACKEND_OPERATION_CONCAT_DESCRIPTOR", - "CUDNN_BACKEND_OPERATION_BN_FINALIZE_STATISTICS_DESCRIPTOR", - "CUDNN_BACKEND_OPERATION_BN_BWD_WEIGHTS_DESCRIPTOR", - "CUDNN_BACKEND_OPERATIONGRAPH_DESCRIPTOR", - "CUDNN_BACKEND_MATMUL_DESCRIPTOR", - "CUDNN_BACKEND_LAYOUT_INFO_DESCRIPTOR", - "CUDNN_BACKEND_KNOB_INFO_DESCRIPTOR", - "CUDNN_BACKEND_KNOB_CHOICE_DESCRIPTOR", - "CUDNN_BACKEND_KERNEL_CACHE_DESCRIPTOR", - "CUDNN_BACKEND_INTERMEDIATE_INFO_DESCRIPTOR", - "CUDNN_BACKEND_EXECUTION_PLAN_DESCRIPTOR", - "CUDNN_BACKEND_ENGINE_DESCRIPTOR", - "CUDNN_BACKEND_ENGINEHEUR_DESCRIPTOR", - "CUDNN_BACKEND_ENGINECFG_DESCRIPTOR", - "CUDNN_BACKEND_CONVOLUTION_DESCRIPTOR", - "CUDNN_ATTR_VARIANT_PACK_WORKSPACE", - "CUDNN_ATTR_VARIANT_PACK_UNIQUE_IDS", - "CUDNN_ATTR_VARIANT_PACK_INTERMEDIATES", - "CUDNN_ATTR_VARIANT_PACK_DATA_POINTERS", - "CUDNN_ATTR_TENSOR_VECTOR_COUNT", - "CUDNN_ATTR_TENSOR_VECTORIZED_DIMENSION", - "CUDNN_ATTR_TENSOR_UNIQUE_ID", - "CUDNN_ATTR_TENSOR_STRIDES", - "CUDNN_ATTR_TENSOR_REORDERING_MODE", - "CUDNN_ATTR_TENSOR_RAGGED_OFFSET_DESC", - "CUDNN_ATTR_TENSOR_IS_VIRTUAL", - "CUDNN_ATTR_TENSOR_IS_BY_VALUE", - "CUDNN_ATTR_TENSOR_DIMENSIONS", - "CUDNN_ATTR_TENSOR_DATA_TYPE", - "CUDNN_ATTR_TENSOR_BYTE_ALIGNMENT", - "CUDNN_ATTR_RNG_UNIFORM_DIST_MINIMUM", - "CUDNN_ATTR_RNG_UNIFORM_DIST_MAXIMUM", - "CUDNN_ATTR_RNG_NORMAL_DIST_STANDARD_DEVIATION", - "CUDNN_ATTR_RNG_NORMAL_DIST_MEAN", - "CUDNN_ATTR_RNG_DISTRIBUTION", - "CUDNN_ATTR_RNG_BERNOULLI_DIST_PROBABILITY", - "CUDNN_ATTR_RESAMPLE_WINDOW_DIMS", - "CUDNN_ATTR_RESAMPLE_STRIDES", - "CUDNN_ATTR_RESAMPLE_SPATIAL_DIMS", - "CUDNN_ATTR_RESAMPLE_PRE_PADDINGS", - "CUDNN_ATTR_RESAMPLE_POST_PADDINGS", - "CUDNN_ATTR_RESAMPLE_PADDING_MODE", - "CUDNN_ATTR_RESAMPLE_NAN_PROPAGATION", - "CUDNN_ATTR_RESAMPLE_MODE", - "CUDNN_ATTR_RESAMPLE_COMP_TYPE", - "CUDNN_ATTR_REDUCTION_OPERATOR", - "CUDNN_ATTR_REDUCTION_COMP_TYPE", - "CUDNN_ATTR_POINTWISE_SWISH_BETA", - "CUDNN_ATTR_POINTWISE_SOFTPLUS_BETA", - "CUDNN_ATTR_POINTWISE_RELU_UPPER_CLIP", - "CUDNN_ATTR_POINTWISE_RELU_LOWER_CLIP_SLOPE", - "CUDNN_ATTR_POINTWISE_RELU_LOWER_CLIP", - "CUDNN_ATTR_POINTWISE_NAN_PROPAGATION", - "CUDNN_ATTR_POINTWISE_MODE", - "CUDNN_ATTR_POINTWISE_MATH_PREC", - "CUDNN_ATTR_POINTWISE_ELU_ALPHA", - "CUDNN_ATTR_POINTWISE_AXIS", - "CUDNN_ATTR_OPERATION_SIGNAL_YDESC", - "CUDNN_ATTR_OPERATION_SIGNAL_XDESC", - "CUDNN_ATTR_OPERATION_SIGNAL_VALUE", - "CUDNN_ATTR_OPERATION_SIGNAL_MODE", - "CUDNN_ATTR_OPERATION_SIGNAL_FLAGDESC", - "CUDNN_ATTR_OPERATION_RNG_YDESC", - "CUDNN_ATTR_OPERATION_RNG_SEED", - "CUDNN_ATTR_OPERATION_RNG_OFFSET_DESC", - "CUDNN_ATTR_OPERATION_RNG_DESC", - "CUDNN_ATTR_OPERATION_RESHAPE_YDESC", - "CUDNN_ATTR_OPERATION_RESHAPE_XDESC", - "CUDNN_ATTR_OPERATION_RESAMPLE_FWD_YDESC", - "CUDNN_ATTR_OPERATION_RESAMPLE_FWD_XDESC", - "CUDNN_ATTR_OPERATION_RESAMPLE_FWD_IDXDESC", - "CUDNN_ATTR_OPERATION_RESAMPLE_FWD_DESC", - "CUDNN_ATTR_OPERATION_RESAMPLE_FWD_BETA", - "CUDNN_ATTR_OPERATION_RESAMPLE_FWD_ALPHA", - "CUDNN_ATTR_OPERATION_RESAMPLE_BWD_YDESC", - "CUDNN_ATTR_OPERATION_RESAMPLE_BWD_XDESC", - "CUDNN_ATTR_OPERATION_RESAMPLE_BWD_IDXDESC", - "CUDNN_ATTR_OPERATION_RESAMPLE_BWD_DYDESC", - "CUDNN_ATTR_OPERATION_RESAMPLE_BWD_DXDESC", - "CUDNN_ATTR_OPERATION_RESAMPLE_BWD_DESC", - "CUDNN_ATTR_OPERATION_RESAMPLE_BWD_BETA", - "CUDNN_ATTR_OPERATION_RESAMPLE_BWD_ALPHA", - "CUDNN_ATTR_OPERATION_REDUCTION_YDESC", - "CUDNN_ATTR_OPERATION_REDUCTION_XDESC", - "CUDNN_ATTR_OPERATION_REDUCTION_DESC", - "CUDNN_ATTR_OPERATION_POINTWISE_YDESC", - "CUDNN_ATTR_OPERATION_POINTWISE_XDESC", - "CUDNN_ATTR_OPERATION_POINTWISE_TDESC", - "CUDNN_ATTR_OPERATION_POINTWISE_PW_DESCRIPTOR", - "CUDNN_ATTR_OPERATION_POINTWISE_DYDESC", - "CUDNN_ATTR_OPERATION_POINTWISE_DXDESC", - "CUDNN_ATTR_OPERATION_POINTWISE_BDESC", - "CUDNN_ATTR_OPERATION_POINTWISE_ALPHA2", - "CUDNN_ATTR_OPERATION_POINTWISE_ALPHA1", - "CUDNN_ATTR_OPERATION_PAGED_CACHE_LOAD_YDESC", - "CUDNN_ATTR_OPERATION_PAGED_CACHE_LOAD_SEQUENCE_DESC", - "CUDNN_ATTR_OPERATION_PAGED_CACHE_LOAD_PAGE_TABLE_DESC", - "CUDNN_ATTR_OPERATION_PAGED_CACHE_LOAD_CONTAINER_DESC", - "CUDNN_ATTR_OPERATION_NORM_FWD_YDESC", - "CUDNN_ATTR_OPERATION_NORM_FWD_XDESC", - "CUDNN_ATTR_OPERATION_NORM_FWD_SCALE_DESC", - "CUDNN_ATTR_OPERATION_NORM_FWD_PHASE", - "CUDNN_ATTR_OPERATION_NORM_FWD_PEER_STAT_DESCS", - "CUDNN_ATTR_OPERATION_NORM_FWD_OUTPUT_RUNNING_VAR_DESC", - "CUDNN_ATTR_OPERATION_NORM_FWD_OUTPUT_RUNNING_MEAN_DESC", - "CUDNN_ATTR_OPERATION_NORM_FWD_MODE", - "CUDNN_ATTR_OPERATION_NORM_FWD_MEAN_DESC", - "CUDNN_ATTR_OPERATION_NORM_FWD_INV_VARIANCE_DESC", - "CUDNN_ATTR_OPERATION_NORM_FWD_INPUT_RUNNING_VAR_DESC", - "CUDNN_ATTR_OPERATION_NORM_FWD_INPUT_RUNNING_MEAN_DESC", - "CUDNN_ATTR_OPERATION_NORM_FWD_EXP_AVG_FACTOR_DESC", - "CUDNN_ATTR_OPERATION_NORM_FWD_EPSILON_DESC", - "CUDNN_ATTR_OPERATION_NORM_FWD_BIAS_DESC", - "CUDNN_ATTR_OPERATION_NORM_BWD_XDESC", - "CUDNN_ATTR_OPERATION_NORM_BWD_SCALE_DESC", - "CUDNN_ATTR_OPERATION_NORM_BWD_PEER_STAT_DESCS", - "CUDNN_ATTR_OPERATION_NORM_BWD_MODE", - "CUDNN_ATTR_OPERATION_NORM_BWD_MEAN_DESC", - "CUDNN_ATTR_OPERATION_NORM_BWD_INV_VARIANCE_DESC", - "CUDNN_ATTR_OPERATION_NORM_BWD_EPSILON_DESC", - "CUDNN_ATTR_OPERATION_NORM_BWD_DYDESC", - "CUDNN_ATTR_OPERATION_NORM_BWD_DXDESC", - "CUDNN_ATTR_OPERATION_NORM_BWD_DSCALE_DESC", - "CUDNN_ATTR_OPERATION_NORM_BWD_DBIAS_DESC", - "CUDNN_ATTR_OPERATION_MATMUL_IRREGULARLY_STRIDED_BATCH_COUNT", - "CUDNN_ATTR_OPERATION_MATMUL_GEMM_N_OVERRIDE_DESC", - "CUDNN_ATTR_OPERATION_MATMUL_GEMM_M_OVERRIDE_DESC", - "CUDNN_ATTR_OPERATION_MATMUL_GEMM_K_OVERRIDE_DESC", - "CUDNN_ATTR_OPERATION_MATMUL_DESC", - "CUDNN_ATTR_OPERATION_MATMUL_CDESC", - "CUDNN_ATTR_OPERATION_MATMUL_BDESC", - "CUDNN_ATTR_OPERATION_MATMUL_ADESC", - "CUDNN_ATTR_OPERATION_GENSTATS_XDESC", - "CUDNN_ATTR_OPERATION_GENSTATS_SUMDESC", - "CUDNN_ATTR_OPERATION_GENSTATS_SQSUMDESC", - "CUDNN_ATTR_OPERATION_GENSTATS_MODE", - "CUDNN_ATTR_OPERATION_GENSTATS_MATH_PREC", - "CUDNN_ATTR_OPERATION_CONVOLUTION_FORWARD_Y", - "CUDNN_ATTR_OPERATION_CONVOLUTION_FORWARD_X", - "CUDNN_ATTR_OPERATION_CONVOLUTION_FORWARD_W", - "CUDNN_ATTR_OPERATION_CONVOLUTION_FORWARD_CONV_DESC", - "CUDNN_ATTR_OPERATION_CONVOLUTION_FORWARD_BETA", - "CUDNN_ATTR_OPERATION_CONVOLUTION_FORWARD_ALPHA", - "CUDNN_ATTR_OPERATION_CONVOLUTION_BWD_FILTER_X", - "CUDNN_ATTR_OPERATION_CONVOLUTION_BWD_FILTER_DY", - "CUDNN_ATTR_OPERATION_CONVOLUTION_BWD_FILTER_DW", - "CUDNN_ATTR_OPERATION_CONVOLUTION_BWD_FILTER_CONV_DESC", - "CUDNN_ATTR_OPERATION_CONVOLUTION_BWD_FILTER_BETA", - "CUDNN_ATTR_OPERATION_CONVOLUTION_BWD_FILTER_ALPHA", - "CUDNN_ATTR_OPERATION_CONVOLUTION_BWD_DATA_W", - "CUDNN_ATTR_OPERATION_CONVOLUTION_BWD_DATA_DY", - "CUDNN_ATTR_OPERATION_CONVOLUTION_BWD_DATA_DX", - "CUDNN_ATTR_OPERATION_CONVOLUTION_BWD_DATA_CONV_DESC", - "CUDNN_ATTR_OPERATION_CONVOLUTION_BWD_DATA_BETA", - "CUDNN_ATTR_OPERATION_CONVOLUTION_BWD_DATA_ALPHA", - "CUDNN_ATTR_OPERATION_CONCAT_OUTPUT_DESC", - "CUDNN_ATTR_OPERATION_CONCAT_INPUT_DESCS", - "CUDNN_ATTR_OPERATION_CONCAT_INPLACE_INDEX", - "CUDNN_ATTR_OPERATION_CONCAT_AXIS", - "CUDNN_ATTR_OPERATION_BN_FINALIZE_Y_SUM_DESC", - "CUDNN_ATTR_OPERATION_BN_FINALIZE_Y_SQ_SUM_DESC", - "CUDNN_ATTR_OPERATION_BN_FINALIZE_UPDATED_RUNNING_VAR_DESC", - "CUDNN_ATTR_OPERATION_BN_FINALIZE_UPDATED_RUNNING_MEAN_DESC", - "CUDNN_ATTR_OPERATION_BN_FINALIZE_STATS_MODE", - "CUDNN_ATTR_OPERATION_BN_FINALIZE_SCALE_DESC", - "CUDNN_ATTR_OPERATION_BN_FINALIZE_SAVED_MEAN_DESC", - "CUDNN_ATTR_OPERATION_BN_FINALIZE_SAVED_INV_STD_DESC", - "CUDNN_ATTR_OPERATION_BN_FINALIZE_PREV_RUNNING_VAR_DESC", - "CUDNN_ATTR_OPERATION_BN_FINALIZE_PREV_RUNNING_MEAN_DESC", - "CUDNN_ATTR_OPERATION_BN_FINALIZE_MATH_PREC", - "CUDNN_ATTR_OPERATION_BN_FINALIZE_EXP_AVERATE_FACTOR_DESC", - "CUDNN_ATTR_OPERATION_BN_FINALIZE_EQ_SCALE_DESC", - "CUDNN_ATTR_OPERATION_BN_FINALIZE_EQ_BIAS_DESC", - "CUDNN_ATTR_OPERATION_BN_FINALIZE_EPSILON_DESC", - "CUDNN_ATTR_OPERATION_BN_FINALIZE_BIAS_DESC", - "CUDNN_ATTR_OPERATION_BN_FINALIZE_ACCUM_COUNT_DESC", - "CUDNN_ATTR_OPERATION_BN_BWD_WEIGHTS_X_DESC", - "CUDNN_ATTR_OPERATION_BN_BWD_WEIGHTS_MEAN_DESC", - "CUDNN_ATTR_OPERATION_BN_BWD_WEIGHTS_MATH_PREC", - "CUDNN_ATTR_OPERATION_BN_BWD_WEIGHTS_INVSTD_DESC", - "CUDNN_ATTR_OPERATION_BN_BWD_WEIGHTS_EQ_X_SCALE_DESC", - "CUDNN_ATTR_OPERATION_BN_BWD_WEIGHTS_EQ_DY_SCALE_DESC", - "CUDNN_ATTR_OPERATION_BN_BWD_WEIGHTS_EQ_BIAS", - "CUDNN_ATTR_OPERATION_BN_BWD_WEIGHTS_DY_DESC", - "CUDNN_ATTR_OPERATION_BN_BWD_WEIGHTS_DBN_SCALE_DESC", - "CUDNN_ATTR_OPERATION_BN_BWD_WEIGHTS_DBN_BIAS_DESC", - "CUDNN_ATTR_OPERATION_BN_BWD_WEIGHTS_BN_SCALE_DESC", - "CUDNN_ATTR_OPERATIONGRAPH_OPS", - "CUDNN_ATTR_OPERATIONGRAPH_IS_DYNAMIC_SHAPE_ENABLED", - "CUDNN_ATTR_OPERATIONGRAPH_HANDLE", - "CUDNN_ATTR_OPERATIONGRAPH_ENGINE_GLOBAL_COUNT", - "CUDNN_ATTR_MATMUL_PADDING_VALUE", - "CUDNN_ATTR_MATMUL_COMP_TYPE", - "CUDNN_ATTR_LAYOUT_INFO_TYPES", - "CUDNN_ATTR_LAYOUT_INFO_TENSOR_UID", - "CUDNN_ATTR_KNOB_INFO_TYPE", - "CUDNN_ATTR_KNOB_INFO_STRIDE", - "CUDNN_ATTR_KNOB_INFO_MINIMUM_VALUE", - "CUDNN_ATTR_KNOB_INFO_MAXIMUM_VALUE", - "CUDNN_ATTR_KNOB_CHOICE_KNOB_VALUE", - "CUDNN_ATTR_KNOB_CHOICE_KNOB_TYPE", - "CUDNN_ATTR_KERNEL_CACHE_OPERATION_GRAPH", - "CUDNN_ATTR_KERNEL_CACHE_IS_ENGINECFG_KERNEL_CACHED", - "CUDNN_ATTR_INTERMEDIATE_INFO_UNIQUE_ID", - "CUDNN_ATTR_INTERMEDIATE_INFO_SIZE", - "CUDNN_ATTR_INTERMEDIATE_INFO_DEPENDENT_DATA_UIDS", - "CUDNN_ATTR_INTERMEDIATE_INFO_DEPENDENT_ATTRIBUTES", - "CUDNN_ATTR_EXECUTION_PLAN_WORKSPACE_SIZE", - "CUDNN_ATTR_EXECUTION_PLAN_RUN_ONLY_INTERMEDIATE_UIDS", - "CUDNN_ATTR_EXECUTION_PLAN_KERNEL_CACHE", - "CUDNN_ATTR_EXECUTION_PLAN_JSON_REPRESENTATION", - "CUDNN_ATTR_EXECUTION_PLAN_HANDLE", - "CUDNN_ATTR_EXECUTION_PLAN_ENGINE_CONFIG", - "CUDNN_ATTR_EXECUTION_PLAN_COMPUTED_INTERMEDIATE_UIDS", - "CUDNN_ATTR_ENGINE_SM_COUNT_TARGET", - "CUDNN_ATTR_ENGINE_OPERATION_GRAPH", - "CUDNN_ATTR_ENGINE_NUMERICAL_NOTE", - "CUDNN_ATTR_ENGINE_LAYOUT_INFO", - "CUDNN_ATTR_ENGINE_KNOB_INFO", - "CUDNN_ATTR_ENGINE_GLOBAL_INDEX", - "CUDNN_ATTR_ENGINE_BEHAVIOR_NOTE", - "CUDNN_ATTR_ENGINEHEUR_SM_COUNT_TARGET", - "CUDNN_ATTR_ENGINEHEUR_RESULTS", - "CUDNN_ATTR_ENGINEHEUR_OPERATION_GRAPH", - "CUDNN_ATTR_ENGINEHEUR_MODE", - "CUDNN_ATTR_ENGINECFG_WORKSPACE_SIZE", - "CUDNN_ATTR_ENGINECFG_SHARED_MEMORY_USED", - "CUDNN_ATTR_ENGINECFG_KNOB_CHOICES", - "CUDNN_ATTR_ENGINECFG_INTERMEDIATE_INFO", - "CUDNN_ATTR_ENGINECFG_ENGINE", - "CUDNN_ATTR_CONVOLUTION_SPATIAL_DIMS", - "CUDNN_ATTR_CONVOLUTION_PRE_PADDINGS", - "CUDNN_ATTR_CONVOLUTION_POST_PADDINGS", - "CUDNN_ATTR_CONVOLUTION_FILTER_STRIDES", - "CUDNN_ATTR_CONVOLUTION_DILATIONS", - "CUDNN_ATTR_CONVOLUTION_CONV_MODE", - "CUDNN_ATTR_CONVOLUTION_COMP_TYPE", - "CUDNN_ATTN_WKIND_COUNT", - "CUDNN_ATTN_QUERYMAP_ONE_TO_ONE", - "CUDNN_ATTN_QUERYMAP_ALL_TO_ONE", - "CUDNN_ATTN_ENABLE_PROJ_BIASES", - "CUDNN_ATTN_DISABLE_PROJ_BIASES", "CUDA_POINTER_ATTRIBUTE_P2P_TOKENS_v1", "CUDA_POINTER_ATTRIBUTE_P2P_TOKENS_st", "CUDA_POINTER_ATTRIBUTE_P2P_TOKENS", @@ -12177,6 +11075,438 @@ sub warnHipOnlyUnsupportedFunctions { my $line_num = shift; my $k = 0; foreach $func ( + "cusparseZhybsv_solve", + "cusparseZhybsv_analysis", + "cusparseZhyb2dense", + "cusparseZhyb2csc", + "cusparseZgtsv_nopivot", + "cusparseZgtsvStridedBatch", + "cusparseZgtsv", + "cusparseZgebsr2gebsr_bufferSizeExt", + "cusparseZgebsr2gebsc_bufferSizeExt", + "cusparseZdense2hyb", + "cusparseZcsrsv_solve", + "cusparseZcsrsv_analysis", + "cusparseZcsrsm_solve", + "cusparseZcsrsm_analysis", + "cusparseZcsrmv_mp", + "cusparseZcsrilu0", + "cusparseZcsric0", + "cusparseZcsr2gebsr_bufferSizeExt", + "cusparseZcsc2hyb", + "cusparseZbsrsm2_bufferSizeExt", + "cusparseZbsrilu02_bufferSizeExt", + "cusparseZbsric02_bufferSizeExt", + "cusparseXgebsr2csr", + "cusparseSpVecDescr", + "cusparseSpSV_updateMatrix", + "cusparseSpSVUpdate_t", + "cusparseSpSM_updateMatrix", + "cusparseSpSMUpdate_t", + "cusparseSpMatSetNumBatches", + "cusparseSpMatGetNumBatches", + "cusparseSpMatDescr", + "cusparseSpMMOp_destroyPlan", + "cusparseSpMMOp_createPlan", + "cusparseSpMMOpPlan_t", + "cusparseSpMMOpPlan", + "cusparseSpMMOpAlg_t", + "cusparseSpMMOp", + "cusparseSpGEMM_getNumProducts", + "cusparseSpGEMM_estimateMemory", + "cusparseSolveAnalysisInfo_t", + "cusparseSolveAnalysisInfo", + "cusparseSideMode_t", + "cusparseShybsv_solve", + "cusparseShybsv_analysis", + "cusparseShyb2dense", + "cusparseShyb2csc", + "cusparseSgtsv_nopivot", + "cusparseSgtsvStridedBatch", + "cusparseSgtsv", + "cusparseSgebsr2gebsr_bufferSizeExt", + "cusparseSgebsr2gebsc_bufferSizeExt", + "cusparseSdense2hyb", + "cusparseScsrsv_solve", + "cusparseScsrsv_analysis", + "cusparseScsrsm_solve", + "cusparseScsrsm_analysis", + "cusparseScsrmv_mp", + "cusparseScsrilu0", + "cusparseScsric0", + "cusparseScsr2gebsr_bufferSizeExt", + "cusparseScsc2hyb", + "cusparseSbsrsm2_bufferSizeExt", + "cusparseSbsrilu02_bufferSizeExt", + "cusparseSbsric02_bufferSizeExt", + "cusparseMatDescr", + "cusparseLoggerSetMask", + "cusparseLoggerSetLevel", + "cusparseLoggerSetFile", + "cusparseLoggerSetCallback", + "cusparseLoggerOpenFile", + "cusparseLoggerForceDisable", + "cusparseLoggerCallback_t", + "cusparseHybMat", + "cusparseHpruneDense2csr_bufferSizeExt", + "cusparseHpruneDense2csrNnzByPercentage", + "cusparseHpruneDense2csrNnz", + "cusparseHpruneDense2csrByPercentage_bufferSizeExt", + "cusparseHpruneDense2csrByPercentage", + "cusparseHpruneDense2csr", + "cusparseHpruneCsr2csr_bufferSizeExt", + "cusparseHpruneCsr2csrNnzByPercentage", + "cusparseHpruneCsr2csrNnz", + "cusparseHpruneCsr2csrByPercentage_bufferSizeExt", + "cusparseHpruneCsr2csrByPercentage", + "cusparseHpruneCsr2csr", + "cusparseGetLevelInfo", + "cusparseDnVecDescr", + "cusparseDnMatDescr", + "cusparseDhybsv_solve", + "cusparseDhybsv_analysis", + "cusparseDhyb2dense", + "cusparseDhyb2csc", + "cusparseDgtsv_nopivot", + "cusparseDgtsvStridedBatch", + "cusparseDgtsv", + "cusparseDgebsr2gebsr_bufferSizeExt", + "cusparseDgebsr2gebsc_bufferSizeExt", + "cusparseDestroySolveAnalysisInfo", + "cusparseDdense2hyb", + "cusparseDcsrsv_solve", + "cusparseDcsrsv_analysis", + "cusparseDcsrsm_solve", + "cusparseDcsrsm_analysis", + "cusparseDcsrmv_mp", + "cusparseDcsrilu0", + "cusparseDcsric0", + "cusparseDcsr2gebsr_bufferSizeExt", + "cusparseDcsc2hyb", + "cusparseDbsrsm2_bufferSizeExt", + "cusparseDbsrilu02_bufferSizeExt", + "cusparseDbsric02_bufferSizeExt", + "cusparseCsrsv_solveEx", + "cusparseCsrsv_analysisEx", + "cusparseCsrmvEx_bufferSize", + "cusparseCsrmvEx", + "cusparseCsrilu0Ex", + "cusparseCsr2cscEx", + "cusparseCreateSolveAnalysisInfo", + "cusparseCreateSlicedEll", + "cusparseCreateConstSlicedEll", + "cusparseCreateConstBsr", + "cusparseCreateBsr", + "cusparseContext", + "cusparseConstrainedGeMM_bufferSize", + "cusparseConstrainedGeMM", + "cusparseColorInfo", + "cusparseColorAlg_t", + "cusparseChybsv_solve", + "cusparseChybsv_analysis", + "cusparseChyb2dense", + "cusparseChyb2csc", + "cusparseCgtsv_nopivot", + "cusparseCgtsvStridedBatch", + "cusparseCgtsv", + "cusparseCgebsr2gebsr_bufferSizeExt", + "cusparseCgebsr2gebsc_bufferSizeExt", + "cusparseCdense2hyb", + "cusparseCcsrsv_solve", + "cusparseCcsrsv_analysis", + "cusparseCcsrsm_solve", + "cusparseCcsrsm_analysis", + "cusparseCcsrmv_mp", + "cusparseCcsrilu0", + "cusparseCcsric0", + "cusparseCcsr2gebsr_bufferSizeExt", + "cusparseCcsc2hyb", + "cusparseCbsrsm2_bufferSizeExt", + "cusparseCbsrilu02_bufferSizeExt", + "cusparseCbsric02_bufferSizeExt", + "cusparseBsrSetStridedBatch", + "cusparseAlgMode_t", + "curand_mtgp32_specific", + "curand_mtgp32_single_specific", + "curand_mtgp32_single", + "curand_Philox4x32_10", + "curandMethod_t", + "curandMethod", + "curandHistogramM2_t", + "curandHistogramM2_st", + "curandHistogramM2V_t", + "curandHistogramM2V_st", + "curandHistogramM2K_t", + "curandHistogramM2K_st", + "curandGetProperty", + "curandDistribution_t", + "curandDistribution_st", + "curandDistributionShift_t", + "curandDistributionShift_st", + "curandDistributionM2Shift_t", + "curandDistributionM2Shift_st", + "cudnnWgradMode_t", + "cudnnTransformTensorEx", + "cudnnTransformTensor", + "cudnnTransformFilter", + "cudnnTensorTransformStruct", + "cudnnTensorTransformDescriptor_t", + "cudnnTensorStruct", + "cudnnSpatialTransformerStruct", + "cudnnSpatialTransformerDescriptor_t", + "cudnnSpatialTfSamplerForward", + "cudnnSpatialTfSamplerBackward", + "cudnnSpatialTfGridGeneratorForward", + "cudnnSpatialTfGridGeneratorBackward", + "cudnnSignalMode_t", + "cudnnSeverity_t", + "cudnnSetTensorTransformDescriptor", + "cudnnSetTensorNdDescriptorEx", + "cudnnSetSpatialTransformerNdDescriptor", + "cudnnSetSeqDataDescriptor", + "cudnnSetRNNProjectionLayers", + "cudnnSetRNNPaddingMode", + "cudnnSetRNNMatrixMathType", + "cudnnSetRNNDescriptor_v8", + "cudnnSetRNNDataDescriptor", + "cudnnSetRNNBiasMode", + "cudnnSetRNNAlgorithmDescriptor", + "cudnnSetFusedOpsVariantParamPackAttribute", + "cudnnSetFusedOpsConstParamPackAttribute", + "cudnnSetConvolutionReorderType", + "cudnnSetCallback", + "cudnnSetCTCLossDescriptor_v9", + "cudnnSetCTCLossDescriptor_v8", + "cudnnSetCTCLossDescriptorEx", + "cudnnSetCTCLossDescriptor", + "cudnnSetAttnDescriptor", + "cudnnSetAlgorithmPerformance", + "cudnnSetAlgorithmDescriptor", + "cudnnSetActivationDescriptorSwishBeta", + "cudnnSeqDataStruct", + "cudnnSeqDataDescriptor_t", + "cudnnSeqDataAxis_t", + "cudnnSaveAlgorithm", + "cudnnSamplerType_t", + "cudnnRuntimeTag_t", + "cudnnRngDistribution_t", + "cudnnRestoreDropoutDescriptor", + "cudnnRestoreAlgorithm", + "cudnnResampleMode_t", + "cudnnReorderType_t", + "cudnnReorderFilterAndBias", + "cudnnReduceTensorStruct", + "cudnnRNNStruct", + "cudnnRNNSetClip_v9", + "cudnnRNNSetClip_v8", + "cudnnRNNSetClip", + "cudnnRNNPaddingMode_t", + "cudnnRNNGetClip_v9", + "cudnnRNNGetClip_v8", + "cudnnRNNGetClip", + "cudnnRNNForwardTrainingEx", + "cudnnRNNForwardInferenceEx", + "cudnnRNNForward", + "cudnnRNNDataStruct", + "cudnnRNNDataLayout_t", + "cudnnRNNDataDescriptor_t", + "cudnnRNNClipMode_t", + "cudnnRNNBackwardWeights_v8", + "cudnnRNNBackwardWeightsEx", + "cudnnRNNBackwardData_v8", + "cudnnRNNBackwardDataEx", + "cudnnQueryRuntimeError", + "cudnnPoolingStruct", + "cudnnPointwiseMode_t", + "cudnnPersistentRNNPlan", + "cudnnPaddingMode_t", + "cudnnOpsVersionCheck", + "cudnnOpsTrainVersionCheck", + "cudnnOpsInferVersionCheck", + "cudnnOpTensorStruct", + "cudnnNormalizationForwardTraining", + "cudnnNormalizationForwardInference", + "cudnnNormalizationBackward", + "cudnnNormOps_t", + "cudnnNormMode_t", + "cudnnNormAlgo_t", + "cudnnMultiHeadAttnWeightKind_t", + "cudnnMultiHeadAttnForward", + "cudnnMultiHeadAttnBackwardWeights", + "cudnnMultiHeadAttnBackwardData", + "cudnnMakeFusedOpsPlan", + "cudnnLossNormalizationMode_t", + "cudnnLRNStruct", + "cudnnInitTransformDest", + "cudnnIm2Col", + "cudnnGraphVersionCheck", + "cudnnGetTensorTransformDescriptor", + "cudnnGetTensorSizeInBytes", + "cudnnGetSeqDataDescriptor", + "cudnnGetReductionIndicesSize", + "cudnnGetRNNWeightSpaceSize", + "cudnnGetRNNWeightParams", + "cudnnGetRNNTempSpaceSizes", + "cudnnGetRNNProjectionLayers", + "cudnnGetRNNPaddingMode", + "cudnnGetRNNMatrixMathType", + "cudnnGetRNNForwardTrainingAlgorithmMaxCount", + "cudnnGetRNNForwardInferenceAlgorithmMaxCount", + "cudnnGetRNNDescriptor_v8", + "cudnnGetRNNDescriptor_v6", + "cudnnGetRNNDataDescriptor", + "cudnnGetRNNBiasMode", + "cudnnGetRNNBackwardWeightsAlgorithmMaxCount", + "cudnnGetRNNBackwardDataAlgorithmMaxCount", + "cudnnGetProperty", + "cudnnGetPoolingNdForwardOutputDim", + "cudnnGetPoolingNdDescriptor", + "cudnnGetNormalizationTrainingReserveSpaceSize", + "cudnnGetNormalizationForwardTrainingWorkspaceSize", + "cudnnGetNormalizationBackwardWorkspaceSize", + "cudnnGetMultiHeadAttnWeights", + "cudnnGetMultiHeadAttnBuffers", + "cudnnGetMaxDeviceVersion", + "cudnnGetLastErrorString", + "cudnnGetFusedOpsVariantParamPackAttribute", + "cudnnGetFusedOpsConstParamPackAttribute", + "cudnnGetFoldedConvBackwardDataDescriptors", + "cudnnGetFilterSizeInBytes", + "cudnnGetDropoutDescriptor", + "cudnnGetCudartVersion", + "cudnnGetConvolutionReorderType", + "cudnnGetConvolutionNdForwardOutputDim", + "cudnnGetConvolutionNdDescriptor", + "cudnnGetConvolutionMathType", + "cudnnGetConvolutionGroupCount", + "cudnnGetConvolutionForwardAlgorithm_v7", + "cudnnGetConvolutionForwardAlgorithmMaxCount", + "cudnnGetConvolutionBackwardFilterAlgorithm_v7", + "cudnnGetConvolutionBackwardFilterAlgorithmMaxCount", + "cudnnGetConvolutionBackwardDataAlgorithm_v7", + "cudnnGetConvolutionBackwardDataAlgorithmMaxCount", + "cudnnGetCallback", + "cudnnGetCTCLossWorkspaceSize_v8", + "cudnnGetCTCLossWorkspaceSize", + "cudnnGetCTCLossDescriptor_v9", + "cudnnGetCTCLossDescriptor_v8", + "cudnnGetCTCLossDescriptorEx", + "cudnnGetCTCLossDescriptor", + "cudnnGetBatchNormalizationTrainingExReserveSpaceSize", + "cudnnGetBatchNormalizationForwardTrainingExWorkspaceSize", + "cudnnGetBatchNormalizationBackwardExWorkspaceSize", + "cudnnGetAttnDescriptor", + "cudnnGetAlgorithmSpaceSize", + "cudnnGetAlgorithmPerformance", + "cudnnGetAlgorithmDescriptor", + "cudnnGetActivationDescriptorSwishBeta", + "cudnnGenStatsMode_t", + "cudnnFusedOps_t", + "cudnnFusedOpsVariantParamStruct", + "cudnnFusedOpsVariantParamPack_t", + "cudnnFusedOpsVariantParamLabel_t", + "cudnnFusedOpsPointerPlaceHolder_t", + "cudnnFusedOpsPlan_t", + "cudnnFusedOpsPlanStruct", + "cudnnFusedOpsExecute", + "cudnnFusedOpsConstParamStruct", + "cudnnFusedOpsConstParamPack_t", + "cudnnFusedOpsConstParamLabel_t", + "cudnnFraction_t", + "cudnnFractionStruct", + "cudnnForwardMode_t", + "cudnnFoldingDirection_t", + "cudnnFindRNNForwardTrainingAlgorithmEx", + "cudnnFindRNNForwardInferenceAlgorithmEx", + "cudnnFindRNNBackwardWeightsAlgorithmEx", + "cudnnFindRNNBackwardDataAlgorithmEx", + "cudnnFilterStruct", + "cudnnErrQueryMode_t", + "cudnnDropoutStruct", + "cudnnDropoutGetReserveSpaceSize", + "cudnnDropoutForward", + "cudnnDropoutBackward", + "cudnnDivisiveNormalizationForward", + "cudnnDivisiveNormalizationBackward", + "cudnnDivNormMode_t", + "cudnnDeterminism_t", + "cudnnDestroyTensorTransformDescriptor", + "cudnnDestroySpatialTransformerDescriptor", + "cudnnDestroySeqDataDescriptor", + "cudnnDestroyRNNDataDescriptor", + "cudnnDestroyFusedOpsVariantParamPack", + "cudnnDestroyFusedOpsPlan", + "cudnnDestroyFusedOpsConstParamPack", + "cudnnDestroyCTCLossDescriptor", + "cudnnDestroyAttnDescriptor", + "cudnnDestroyAlgorithmPerformance", + "cudnnDestroyAlgorithmDescriptor", + "cudnnDeriveNormTensorDescriptor", + "cudnnDebug_t", + "cudnnDebugStruct", + "cudnnCreateTensorTransformDescriptor", + "cudnnCreateSpatialTransformerDescriptor", + "cudnnCreateSeqDataDescriptor", + "cudnnCreateRNNDataDescriptor", + "cudnnCreateFusedOpsVariantParamPack", + "cudnnCreateFusedOpsPlan", + "cudnnCreateFusedOpsConstParamPack", + "cudnnCreateCTCLossDescriptor", + "cudnnCreateAttnDescriptor", + "cudnnCreateAlgorithmPerformance", + "cudnnCreateAlgorithmDescriptor", + "cudnnCopyAlgorithmDescriptor", + "cudnnConvolutionStruct", + "cudnnConvolutionBiasActivationForward", + "cudnnContext", + "cudnnCnnTrainVersionCheck", + "cudnnCnnInferVersionCheck", + "cudnnCallback_t", + "cudnnCTCLoss_v8", + "cudnnCTCLossStruct", + "cudnnCTCLossDescriptor_t", + "cudnnCTCLossAlgo_t", + "cudnnCTCLoss", + "cudnnCTCGradMode_t", + "cudnnBuildRNNDynamic", + "cudnnBnFinalizeStatsMode_t", + "cudnnBatchNormalizationForwardTrainingEx", + "cudnnBatchNormalizationBackwardEx", + "cudnnBatchNormOps_t", + "cudnnBackendUpdateCudaGraph", + "cudnnBackendTensorReordering_t", + "cudnnBackendSetAttribute", + "cudnnBackendPopulateCudaGraph", + "cudnnBackendNumericalNote_t", + "cudnnBackendNormMode_t", + "cudnnBackendNormFwdPhase_t", + "cudnnBackendLayoutType_t", + "cudnnBackendKnobType_t", + "cudnnBackendInitialize", + "cudnnBackendHeurMode_t", + "cudnnBackendGetAttribute", + "cudnnBackendFinalize", + "cudnnBackendExecute", + "cudnnBackendDestroyDescriptor", + "cudnnBackendDescriptor_t", + "cudnnBackendDescriptorType_t", + "cudnnBackendCreateDescriptor", + "cudnnBackendBehaviorNote_t", + "cudnnBackendAttributeType_t", + "cudnnBackendAttributeName_t", + "cudnnAttnStruct", + "cudnnAttnQueryMap_t", + "cudnnAttnDescriptor_t", + "cudnnAlgorithm_t", + "cudnnAlgorithmUnionStruct", + "cudnnAlgorithmStruct", + "cudnnAlgorithmPerformance_t", + "cudnnAlgorithmPerformanceStruct", + "cudnnAlgorithmDescriptor_t", + "cudnnAdvVersionCheck", + "cudnnAdvTrainVersionCheck", + "cudnnAdvInferVersionCheck", + "cudnnActivationStruct", "cublasZtrttp", "cublasZtrsm_v2_64", "cublasZtrsm_64", @@ -12396,6 +11726,676 @@ sub warnHipOnlyUnsupportedFunctions { "cublasAsumEx_64", "cublasAsumEx", "cublasAlloc", + "csrsv2Info", + "csrsm2Info", + "__curand_umul", + "CUSPARSE_SPSV_UPDATE_GENERAL", + "CUSPARSE_SPSV_UPDATE_DIAGONAL", + "CUSPARSE_SPSM_UPDATE_GENERAL", + "CUSPARSE_SPSM_UPDATE_DIAGONAL", + "CUSPARSE_SPMV_SELL_ALG1", + "CUSPARSE_SPMM_OP_ALG_DEFAULT", + "CUSPARSE_SPMM_BSR_ALG1", + "CUSPARSE_SPMMA_PREPROCESS", + "CUSPARSE_SPMMA_ALG4", + "CUSPARSE_SPMMA_ALG3", + "CUSPARSE_SPMMA_ALG2", + "CUSPARSE_SPMMA_ALG1", + "CUSPARSE_SIDE_RIGHT", + "CUSPARSE_SIDE_LEFT", + "CUSPARSE_FORMAT_SLICED_ELLPACK", + "CUSPARSE_FORMAT_BSR", + "CUSPARSE_COLOR_ALG1", + "CUSPARSE_COLOR_ALG0", + "CUSPARSE_ALG_NAIVE", + "CUSPARSE_ALG_MERGE_PATH", + "CUSPARSE_ALG1", + "CUSPARSE_ALG0", + "CURAND_REJECTION", + "CURAND_POISSON", + "CURAND_M2", + "CURAND_M1", + "CURAND_KNUTH", + "CURAND_ITR", + "CURAND_HITR", + "CURAND_FAST_REJECTION", + "CURAND_DISCRETE_GAUSS", + "CURAND_DEVICE_API", + "CURAND_DEFINITION", + "CURAND_CHOOSE_BEST", + "CURAND_BINARY_SEARCH", + "CURAND_3RD", + "CUDNN_ZERO_PAD", + "CUDNN_WGRAD_MODE_SET", + "CUDNN_WGRAD_MODE_ADD", + "CUDNN_TYPE_VOID_PTR", + "CUDNN_TYPE_TENSOR_REORDERING_MODE", + "CUDNN_TYPE_SIGNAL_MODE", + "CUDNN_TYPE_RNG_DISTRIBUTION", + "CUDNN_TYPE_RESAMPLE_MODE", + "CUDNN_TYPE_REDUCTION_OPERATOR_TYPE", + "CUDNN_TYPE_POINTWISE_MODE", + "CUDNN_TYPE_PADDING_MODE", + "CUDNN_TYPE_NUMERICAL_NOTE", + "CUDNN_TYPE_NORM_MODE", + "CUDNN_TYPE_NORM_FWD_PHASE", + "CUDNN_TYPE_NAN_PROPOGATION", + "CUDNN_TYPE_LAYOUT_TYPE", + "CUDNN_TYPE_KNOB_TYPE", + "CUDNN_TYPE_INT64", + "CUDNN_TYPE_INT32", + "CUDNN_TYPE_HEUR_MODE", + "CUDNN_TYPE_HANDLE", + "CUDNN_TYPE_GENSTATS_MODE", + "CUDNN_TYPE_FRACTION", + "CUDNN_TYPE_FLOAT", + "CUDNN_TYPE_DOUBLE", + "CUDNN_TYPE_DATA_TYPE", + "CUDNN_TYPE_CONVOLUTION_MODE", + "CUDNN_TYPE_CHAR", + "CUDNN_TYPE_BOOLEAN", + "CUDNN_TYPE_BN_FINALIZE_STATS_MODE", + "CUDNN_TYPE_BEHAVIOR_NOTE", + "CUDNN_TYPE_BACKEND_DESCRIPTOR", + "CUDNN_TYPE_ATTRIB_NAME", + "CUDNN_TRANSFORM_UNFOLD", + "CUDNN_TRANSFORM_FOLD", + "CUDNN_TENSOR_REORDERING_NONE", + "CUDNN_TENSOR_REORDERING_INT8x32", + "CUDNN_TENSOR_REORDERING_F16x16", + "CUDNN_TENSOR_OP_MATH_ALLOW_CONVERSION", + "CUDNN_STATUS_VERSION_MISMATCH", + "CUDNN_STATUS_SUBLIBRARY_VERSION_MISMATCH", + "CUDNN_STATUS_SUBLIBRARY_LOADING_FAILED", + "CUDNN_STATUS_SPECIFIC_ERROR", + "CUDNN_STATUS_SERIALIZATION_VERSION_MISMATCH", + "CUDNN_STATUS_RUNTIME_IN_PROGRESS", + "CUDNN_STATUS_RUNTIME_FP_OVERFLOW", + "CUDNN_STATUS_NOT_SUPPORTED_SUBLIBRARY_UNAVAILABLE", + "CUDNN_STATUS_NOT_SUPPORTED_SHARED_MEMORY_INSUFFICIENT", + "CUDNN_STATUS_NOT_SUPPORTED_SHAPE", + "CUDNN_STATUS_NOT_SUPPORTED_RUNTIME_PREREQUISITE_MISSING", + "CUDNN_STATUS_NOT_SUPPORTED_PADDING", + "CUDNN_STATUS_NOT_SUPPORTED_LAYOUT", + "CUDNN_STATUS_NOT_SUPPORTED_INCOMPATIBLE_CUDA_DRIVER", + "CUDNN_STATUS_NOT_SUPPORTED_INCOMPATIBLE_CUDART", + "CUDNN_STATUS_NOT_SUPPORTED_GRAPH_PATTERN", + "CUDNN_STATUS_NOT_SUPPORTED_DATA_TYPE", + "CUDNN_STATUS_NOT_SUPPORTED_CUDA_GRAPH_NATIVE_API", + "CUDNN_STATUS_NOT_SUPPORTED_BAD_LAUNCH_PARAM", + "CUDNN_STATUS_NOT_SUPPORTED_ARCH_MISMATCH", + "CUDNN_STATUS_INTERNAL_ERROR_UNEXPECTED_VALUE", + "CUDNN_STATUS_INTERNAL_ERROR_TEXTURE_CREATION_FAILED", + "CUDNN_STATUS_INTERNAL_ERROR_HOST_ALLOCATION_FAILED", + "CUDNN_STATUS_INTERNAL_ERROR_DEVICE_ALLOCATION_FAILED", + "CUDNN_STATUS_INTERNAL_ERROR_COMPILATION_FAILED", + "CUDNN_STATUS_INTERNAL_ERROR_BAD_LAUNCH_PARAM", + "CUDNN_STATUS_FULL_ERROR_CODE", + "CUDNN_STATUS_EXECUTION_FAILED_CURAND", + "CUDNN_STATUS_EXECUTION_FAILED_CUDA_DRIVER", + "CUDNN_STATUS_EXECUTION_FAILED_CUDART", + "CUDNN_STATUS_EXECUTION_FAILED_CUBLAS", + "CUDNN_STATUS_DEPRECATED", + "CUDNN_STATUS_CATEGORY", + "CUDNN_STATUS_BAD_PARAM_STREAM_MISMATCH", + "CUDNN_STATUS_BAD_PARAM_SIZE_INSUFFICIENT", + "CUDNN_STATUS_BAD_PARAM_SHAPE_MISMATCH", + "CUDNN_STATUS_BAD_PARAM_OUT_OF_BOUND", + "CUDNN_STATUS_BAD_PARAM_NULL_POINTER", + "CUDNN_STATUS_BAD_PARAM_NOT_FINALIZED", + "CUDNN_STATUS_BAD_PARAM_MISALIGNED_POINTER", + "CUDNN_STATUS_BAD_PARAM_DUPLICATED_ENTRIES", + "CUDNN_STATUS_BAD_PARAM_CUDA_GRAPH_MISMATCH", + "CUDNN_STATUS_BAD_PARAM_ATTRIBUTE_TYPE", + "CUDNN_SIGNAL_WAIT", + "CUDNN_SIGNAL_SET", + "CUDNN_SEV_WARNING_EN", + "CUDNN_SEV_WARNING", + "CUDNN_SEV_INFO_EN", + "CUDNN_SEV_INFO", + "CUDNN_SEV_FATAL", + "CUDNN_SEV_ERROR_EN", + "CUDNN_SEV_ERROR", + "CUDNN_SEQDATA_VECT_DIM", + "CUDNN_SEQDATA_TIME_DIM", + "CUDNN_SEQDATA_DIM_COUNT", + "CUDNN_SEQDATA_BEAM_DIM", + "CUDNN_SEQDATA_BATCH_DIM", + "CUDNN_SCALAR_SIZE_T_WORKSPACE_SIZE_IN_BYTES", + "CUDNN_SCALAR_INT64_T_BN_ACCUMULATION_COUNT", + "CUDNN_SCALAR_DOUBLE_BN_EXP_AVG_FACTOR", + "CUDNN_SCALAR_DOUBLE_BN_EPSILON", + "CUDNN_SAMPLER_BILINEAR", + "CUDNN_RNN_PADDED_IO_ENABLED", + "CUDNN_RNN_PADDED_IO_DISABLED", + "CUDNN_RNN_DATA_LAYOUT_SEQ_MAJOR_UNPACKED", + "CUDNN_RNN_DATA_LAYOUT_SEQ_MAJOR_PACKED", + "CUDNN_RNN_DATA_LAYOUT_BATCH_MAJOR_UNPACKED", + "CUDNN_RNN_CLIP_NONE", + "CUDNN_RNN_CLIP_MINMAX", + "CUDNN_RNN_ALGO_COUNT", + "CUDNN_RNG_DISTRIBUTION_UNIFORM", + "CUDNN_RNG_DISTRIBUTION_NORMAL", + "CUDNN_RNG_DISTRIBUTION_BERNOULLI", + "CUDNN_RMS_NORM", + "CUDNN_RESAMPLE_NEAREST", + "CUDNN_RESAMPLE_MAXPOOL", + "CUDNN_RESAMPLE_BILINEAR", + "CUDNN_RESAMPLE_AVGPOOL_INCLUDE_PADDING", + "CUDNN_RESAMPLE_AVGPOOL_EXCLUDE_PADDING", + "CUDNN_RESAMPLE_AVGPOOL", + "CUDNN_PTR_ZDATA", + "CUDNN_PTR_YSUM", + "CUDNN_PTR_YSQSUM", + "CUDNN_PTR_YDATA", + "CUDNN_PTR_XDATA", + "CUDNN_PTR_WORKSPACE", + "CUDNN_PTR_WDATA", + "CUDNN_PTR_NULL", + "CUDNN_PTR_ELEM_ALIGNED", + "CUDNN_PTR_DZDATA", + "CUDNN_PTR_DYDATA", + "CUDNN_PTR_DXDATA", + "CUDNN_PTR_DWDATA", + "CUDNN_PTR_BN_Z_EQSCALE", + "CUDNN_PTR_BN_Z_EQBIAS", + "CUDNN_PTR_BN_SCALE", + "CUDNN_PTR_BN_SAVED_MEAN", + "CUDNN_PTR_BN_SAVED_INVSTD", + "CUDNN_PTR_BN_RUNNING_VAR", + "CUDNN_PTR_BN_RUNNING_MEAN", + "CUDNN_PTR_BN_EQSCALE", + "CUDNN_PTR_BN_EQBIAS", + "CUDNN_PTR_BN_DSCALE", + "CUDNN_PTR_BN_DBIAS", + "CUDNN_PTR_BN_BIAS", + "CUDNN_PTR_ACTIVATION_BITMASK", + "CUDNN_PTR_16B_ALIGNED", + "CUDNN_POINTWISE_TANH_FWD", + "CUDNN_POINTWISE_TANH_BWD", + "CUDNN_POINTWISE_TAN", + "CUDNN_POINTWISE_SWISH_FWD", + "CUDNN_POINTWISE_SWISH_BWD", + "CUDNN_POINTWISE_SUB", + "CUDNN_POINTWISE_SQRT", + "CUDNN_POINTWISE_SOFTPLUS_FWD", + "CUDNN_POINTWISE_SOFTPLUS_BWD", + "CUDNN_POINTWISE_SIN", + "CUDNN_POINTWISE_SIGMOID_FWD", + "CUDNN_POINTWISE_SIGMOID_BWD", + "CUDNN_POINTWISE_RSQRT", + "CUDNN_POINTWISE_RELU_FWD", + "CUDNN_POINTWISE_RELU_BWD", + "CUDNN_POINTWISE_RECIPROCAL", + "CUDNN_POINTWISE_POW", + "CUDNN_POINTWISE_NEG", + "CUDNN_POINTWISE_MUL", + "CUDNN_POINTWISE_MOD", + "CUDNN_POINTWISE_MIN", + "CUDNN_POINTWISE_MAX", + "CUDNN_POINTWISE_LOGICAL_OR", + "CUDNN_POINTWISE_LOGICAL_NOT", + "CUDNN_POINTWISE_LOGICAL_AND", + "CUDNN_POINTWISE_LOG", + "CUDNN_POINTWISE_IDENTITY", + "CUDNN_POINTWISE_GEN_INDEX", + "CUDNN_POINTWISE_GELU_FWD", + "CUDNN_POINTWISE_GELU_BWD", + "CUDNN_POINTWISE_GELU_APPROX_TANH_FWD", + "CUDNN_POINTWISE_GELU_APPROX_TANH_BWD", + "CUDNN_POINTWISE_FLOOR", + "CUDNN_POINTWISE_EXP", + "CUDNN_POINTWISE_ERF", + "CUDNN_POINTWISE_ELU_FWD", + "CUDNN_POINTWISE_ELU_BWD", + "CUDNN_POINTWISE_DIV", + "CUDNN_POINTWISE_COS", + "CUDNN_POINTWISE_CMP_NEQ", + "CUDNN_POINTWISE_CMP_LT", + "CUDNN_POINTWISE_CMP_LE", + "CUDNN_POINTWISE_CMP_GT", + "CUDNN_POINTWISE_CMP_GE", + "CUDNN_POINTWISE_CMP_EQ", + "CUDNN_POINTWISE_CEIL", + "CUDNN_POINTWISE_BINARY_SELECT", + "CUDNN_POINTWISE_ATAN2", + "CUDNN_POINTWISE_ADD_SQUARE", + "CUDNN_POINTWISE_ADD", + "CUDNN_POINTWISE_ABS", + "CUDNN_PARAM_ZDESC", + "CUDNN_PARAM_ZDATA_PLACEHOLDER", + "CUDNN_PARAM_YSUM_PLACEHOLDER", + "CUDNN_PARAM_YSTATS_DESC", + "CUDNN_PARAM_YSQSUM_PLACEHOLDER", + "CUDNN_PARAM_YDESC", + "CUDNN_PARAM_YDATA_PLACEHOLDER", + "CUDNN_PARAM_XDESC", + "CUDNN_PARAM_XDATA_PLACEHOLDER", + "CUDNN_PARAM_WDESC", + "CUDNN_PARAM_WDATA_PLACEHOLDER", + "CUDNN_PARAM_DZDESC", + "CUDNN_PARAM_DZDATA_PLACEHOLDER", + "CUDNN_PARAM_DYDESC", + "CUDNN_PARAM_DYDATA_PLACEHOLDER", + "CUDNN_PARAM_DXDESC", + "CUDNN_PARAM_DXDATA_PLACEHOLDER", + "CUDNN_PARAM_DWDESC", + "CUDNN_PARAM_DWDATA_PLACEHOLDER", + "CUDNN_PARAM_CONV_DESC", + "CUDNN_PARAM_BN_Z_EQSCALE_PLACEHOLDER", + "CUDNN_PARAM_BN_Z_EQSCALEBIAS_DESC", + "CUDNN_PARAM_BN_Z_EQBIAS_PLACEHOLDER", + "CUDNN_PARAM_BN_SCALE_PLACEHOLDER", + "CUDNN_PARAM_BN_SCALEBIAS_MEANVAR_DESC", + "CUDNN_PARAM_BN_SAVED_MEAN_PLACEHOLDER", + "CUDNN_PARAM_BN_SAVED_INVSTD_PLACEHOLDER", + "CUDNN_PARAM_BN_RUNNING_VAR_PLACEHOLDER", + "CUDNN_PARAM_BN_RUNNING_MEAN_PLACEHOLDER", + "CUDNN_PARAM_BN_MODE", + "CUDNN_PARAM_BN_EQSCALE_PLACEHOLDER", + "CUDNN_PARAM_BN_EQSCALEBIAS_DESC", + "CUDNN_PARAM_BN_EQBIAS_PLACEHOLDER", + "CUDNN_PARAM_BN_DSCALE_PLACEHOLDER", + "CUDNN_PARAM_BN_DBIAS_PLACEHOLDER", + "CUDNN_PARAM_BN_BIAS_PLACEHOLDER", + "CUDNN_PARAM_ACTIVATION_DESC", + "CUDNN_PARAM_ACTIVATION_BITMASK_PLACEHOLDER", + "CUDNN_PARAM_ACTIVATION_BITMASK_DESC", + "CUDNN_OP_TENSOR_NOT", + "CUDNN_NUMERICAL_NOTE_WINOGRAD_TILE_6x6", + "CUDNN_NUMERICAL_NOTE_WINOGRAD_TILE_4x4", + "CUDNN_NUMERICAL_NOTE_WINOGRAD_TILE_13x13", + "CUDNN_NUMERICAL_NOTE_WINOGRAD", + "CUDNN_NUMERICAL_NOTE_TYPE_COUNT", + "CUDNN_NUMERICAL_NOTE_TENSOR_CORE", + "CUDNN_NUMERICAL_NOTE_STRICT_NAN_PROP", + "CUDNN_NUMERICAL_NOTE_REDUCED_PRECISION_REDUCTION", + "CUDNN_NUMERICAL_NOTE_NONDETERMINISTIC", + "CUDNN_NUMERICAL_NOTE_FFT", + "CUDNN_NUMERICAL_NOTE_DOWN_CONVERT_INPUTS", + "CUDNN_NO_REORDER", + "CUDNN_NORM_PER_CHANNEL", + "CUDNN_NORM_PER_ACTIVATION", + "CUDNN_NORM_OPS_NORM_ADD_ACTIVATION", + "CUDNN_NORM_OPS_NORM_ACTIVATION", + "CUDNN_NORM_OPS_NORM", + "CUDNN_NORM_FWD_TRAINING", + "CUDNN_NORM_FWD_INFERENCE", + "CUDNN_NORM_ALGO_STANDARD", + "CUDNN_NORM_ALGO_PERSIST", + "CUDNN_NON_DETERMINISTIC", + "CUDNN_NEG_INF_PAD", + "CUDNN_MH_ATTN_V_WEIGHTS", + "CUDNN_MH_ATTN_V_BIASES", + "CUDNN_MH_ATTN_Q_WEIGHTS", + "CUDNN_MH_ATTN_Q_BIASES", + "CUDNN_MH_ATTN_O_WEIGHTS", + "CUDNN_MH_ATTN_O_BIASES", + "CUDNN_MH_ATTN_K_WEIGHTS", + "CUDNN_MH_ATTN_K_BIASES", + "CUDNN_LRN_MIN_N", + "CUDNN_LRN_MIN_K", + "CUDNN_LRN_MIN_BETA", + "CUDNN_LRN_MAX_N", + "CUDNN_LOSS_NORMALIZATION_SOFTMAX", + "CUDNN_LOSS_NORMALIZATION_NONE", + "CUDNN_LAYOUT_TYPE_PREFERRED_PAD8CK", + "CUDNN_LAYOUT_TYPE_PREFERRED_PAD4CK", + "CUDNN_LAYOUT_TYPE_PREFERRED_NHWC", + "CUDNN_LAYOUT_TYPE_PREFERRED_NCHW", + "CUDNN_LAYOUT_TYPE_COUNT", + "CUDNN_LAYER_NORM", + "CUDNN_KNOB_TYPE_WORKSPACE", + "CUDNN_KNOB_TYPE_WINO_TILE", + "CUDNN_KNOB_TYPE_USE_TEX", + "CUDNN_KNOB_TYPE_TILE_SIZE", + "CUDNN_KNOB_TYPE_TILE_ROWS", + "CUDNN_KNOB_TYPE_TILE_COLS", + "CUDNN_KNOB_TYPE_TILE_CGA_N", + "CUDNN_KNOB_TYPE_TILE_CGA_M", + "CUDNN_KNOB_TYPE_TILE_CGA", + "CUDNN_KNOB_TYPE_TILEK", + "CUDNN_KNOB_TYPE_SWIZZLE", + "CUDNN_KNOB_TYPE_STAGES", + "CUDNN_KNOB_TYPE_SPLIT_RS", + "CUDNN_KNOB_TYPE_SPLIT_K_SLC", + "CUDNN_KNOB_TYPE_SPLIT_K_BUF", + "CUDNN_KNOB_TYPE_SPLIT_K", + "CUDNN_KNOB_TYPE_SPLIT_H", + "CUDNN_KNOB_TYPE_SPLIT_COLS", + "CUDNN_KNOB_TYPE_SPECFILT", + "CUDNN_KNOB_TYPE_SLICED", + "CUDNN_KNOB_TYPE_SINGLEBUFFER", + "CUDNN_KNOB_TYPE_REDUCTION_MODE", + "CUDNN_KNOB_TYPE_OCCUPANCY", + "CUDNN_KNOB_TYPE_NUM_C_PER_BLOCK", + "CUDNN_KNOB_TYPE_MULTIPLY", + "CUDNN_KNOB_TYPE_LOAD_SIZE", + "CUDNN_KNOB_TYPE_LDGC", + "CUDNN_KNOB_TYPE_LDGB", + "CUDNN_KNOB_TYPE_LDGA", + "CUDNN_KNOB_TYPE_KERNEL_CFG", + "CUDNN_KNOB_TYPE_KBLOCK", + "CUDNN_KNOB_TYPE_IDX_MODE", + "CUDNN_KNOB_TYPE_EDGE", + "CUDNN_KNOB_TYPE_CTA_SPLIT_K_MODE", + "CUDNN_KNOB_TYPE_COUNTS", + "CUDNN_KNOB_TYPE_CHUNK_K", + "CUDNN_KNOB_TYPE_BLOCK_SIZE", + "CUDNN_KNOB_TYPE_ARRAY_SIZE_PER_THREAD", + "CUDNN_INSTANCE_NORM", + "CUDNN_HEUR_MODE_INSTANT", + "CUDNN_HEUR_MODE_FALLBACK", + "CUDNN_HEUR_MODE_B", + "CUDNN_HEUR_MODE_A", + "CUDNN_HEUR_MODES_COUNT", + "CUDNN_GROUP_NORM", + "CUDNN_GENSTATS_SUM_SQSUM", + "CUDNN_FWD_MODE_TRAINING", + "CUDNN_FWD_MODE_INFERENCE", + "CUDNN_FUSED_SCALE_BIAS_ADD_ACTIVATION_GEN_BITMASK", + "CUDNN_FUSED_SCALE_BIAS_ACTIVATION_WGRAD", + "CUDNN_FUSED_SCALE_BIAS_ACTIVATION_CONV_BNSTATS", + "CUDNN_FUSED_DACTIVATION_FORK_DBATCHNORM", + "CUDNN_FUSED_CONV_SCALE_BIAS_ADD_ACTIVATION", + "CUDNN_FUSED_BN_FINALIZE_STATISTICS_TRAINING", + "CUDNN_FUSED_BN_FINALIZE_STATISTICS_INFERENCE", + "CUDNN_FMA_MATH", + "CUDNN_ERRQUERY_RAWCODE", + "CUDNN_ERRQUERY_NONBLOCKING", + "CUDNN_ERRQUERY_BLOCKING", + "CUDNN_EDGE_VAL_PAD", + "CUDNN_DIVNORM_PRECOMPUTED_MEANS", + "CUDNN_DIM_MAX", + "CUDNN_DETERMINISTIC", + "CUDNN_DEFAULT_REORDER", + "CUDNN_DATA_UINT8x4", + "CUDNN_DATA_UINT8", + "CUDNN_DATA_INT8x32", + "CUDNN_DATA_INT64", + "CUDNN_DATA_FP8_E5M2", + "CUDNN_DATA_FP8_E4M3", + "CUDNN_DATA_FAST_FLOAT_FOR_FP8", + "CUDNN_DATA_BOOLEAN", + "CUDNN_DATA_BFLOAT16", + "CUDNN_CTC_ZERO_OOB_GRADIENTS", + "CUDNN_CTC_SKIP_OOB_GRADIENTS", + "CUDNN_CTC_LOSS_ALGO_NON_DETERMINISTIC", + "CUDNN_CTC_LOSS_ALGO_DETERMINISTIC", + "CUDNN_BN_FINALIZE_STATISTICS_TRAINING", + "CUDNN_BN_FINALIZE_STATISTICS_INFERENCE", + "CUDNN_BEHAVIOR_NOTE_TYPE_COUNT", + "CUDNN_BEHAVIOR_NOTE_SUPPORTS_CUDA_GRAPH_NATIVE_API", + "CUDNN_BEHAVIOR_NOTE_RUNTIME_COMPILATION", + "CUDNN_BEHAVIOR_NOTE_REQUIRES_FILTER_INT8x32_REORDER", + "CUDNN_BEHAVIOR_NOTE_REQUIRES_BIAS_INT8x32_REORDER", + "CUDNN_BATCH_NORM", + "CUDNN_BATCHNORM_OPS_BN_ADD_ACTIVATION", + "CUDNN_BATCHNORM_OPS_BN_ACTIVATION", + "CUDNN_BATCHNORM_OPS_BN", + "CUDNN_BACKEND_VARIANT_PACK_DESCRIPTOR", + "CUDNN_BACKEND_TENSOR_DESCRIPTOR", + "CUDNN_BACKEND_RNG_DESCRIPTOR", + "CUDNN_BACKEND_RESAMPLE_DESCRIPTOR", + "CUDNN_BACKEND_REDUCTION_DESCRIPTOR", + "CUDNN_BACKEND_POINTWISE_DESCRIPTOR", + "CUDNN_BACKEND_OPERATION_SIGNAL_DESCRIPTOR", + "CUDNN_BACKEND_OPERATION_RNG_DESCRIPTOR", + "CUDNN_BACKEND_OPERATION_RESHAPE_DESCRIPTOR", + "CUDNN_BACKEND_OPERATION_RESAMPLE_FWD_DESCRIPTOR", + "CUDNN_BACKEND_OPERATION_RESAMPLE_BWD_DESCRIPTOR", + "CUDNN_BACKEND_OPERATION_REDUCTION_DESCRIPTOR", + "CUDNN_BACKEND_OPERATION_POINTWISE_DESCRIPTOR", + "CUDNN_BACKEND_OPERATION_PAGED_CACHE_LOAD_DESCRIPTOR", + "CUDNN_BACKEND_OPERATION_NORM_FORWARD_DESCRIPTOR", + "CUDNN_BACKEND_OPERATION_NORM_BACKWARD_DESCRIPTOR", + "CUDNN_BACKEND_OPERATION_MATMUL_DESCRIPTOR", + "CUDNN_BACKEND_OPERATION_GEN_STATS_DESCRIPTOR", + "CUDNN_BACKEND_OPERATION_CONVOLUTION_FORWARD_DESCRIPTOR", + "CUDNN_BACKEND_OPERATION_CONVOLUTION_BACKWARD_FILTER_DESCRIPTOR", + "CUDNN_BACKEND_OPERATION_CONVOLUTION_BACKWARD_DATA_DESCRIPTOR", + "CUDNN_BACKEND_OPERATION_CONCAT_DESCRIPTOR", + "CUDNN_BACKEND_OPERATION_BN_FINALIZE_STATISTICS_DESCRIPTOR", + "CUDNN_BACKEND_OPERATION_BN_BWD_WEIGHTS_DESCRIPTOR", + "CUDNN_BACKEND_OPERATIONGRAPH_DESCRIPTOR", + "CUDNN_BACKEND_MATMUL_DESCRIPTOR", + "CUDNN_BACKEND_LAYOUT_INFO_DESCRIPTOR", + "CUDNN_BACKEND_KNOB_INFO_DESCRIPTOR", + "CUDNN_BACKEND_KNOB_CHOICE_DESCRIPTOR", + "CUDNN_BACKEND_KERNEL_CACHE_DESCRIPTOR", + "CUDNN_BACKEND_INTERMEDIATE_INFO_DESCRIPTOR", + "CUDNN_BACKEND_EXECUTION_PLAN_DESCRIPTOR", + "CUDNN_BACKEND_ENGINE_DESCRIPTOR", + "CUDNN_BACKEND_ENGINEHEUR_DESCRIPTOR", + "CUDNN_BACKEND_ENGINECFG_DESCRIPTOR", + "CUDNN_BACKEND_CONVOLUTION_DESCRIPTOR", + "CUDNN_ATTR_VARIANT_PACK_WORKSPACE", + "CUDNN_ATTR_VARIANT_PACK_UNIQUE_IDS", + "CUDNN_ATTR_VARIANT_PACK_INTERMEDIATES", + "CUDNN_ATTR_VARIANT_PACK_DATA_POINTERS", + "CUDNN_ATTR_TENSOR_VECTOR_COUNT", + "CUDNN_ATTR_TENSOR_VECTORIZED_DIMENSION", + "CUDNN_ATTR_TENSOR_UNIQUE_ID", + "CUDNN_ATTR_TENSOR_STRIDES", + "CUDNN_ATTR_TENSOR_REORDERING_MODE", + "CUDNN_ATTR_TENSOR_RAGGED_OFFSET_DESC", + "CUDNN_ATTR_TENSOR_IS_VIRTUAL", + "CUDNN_ATTR_TENSOR_IS_BY_VALUE", + "CUDNN_ATTR_TENSOR_DIMENSIONS", + "CUDNN_ATTR_TENSOR_DATA_TYPE", + "CUDNN_ATTR_TENSOR_BYTE_ALIGNMENT", + "CUDNN_ATTR_RNG_UNIFORM_DIST_MINIMUM", + "CUDNN_ATTR_RNG_UNIFORM_DIST_MAXIMUM", + "CUDNN_ATTR_RNG_NORMAL_DIST_STANDARD_DEVIATION", + "CUDNN_ATTR_RNG_NORMAL_DIST_MEAN", + "CUDNN_ATTR_RNG_DISTRIBUTION", + "CUDNN_ATTR_RNG_BERNOULLI_DIST_PROBABILITY", + "CUDNN_ATTR_RESAMPLE_WINDOW_DIMS", + "CUDNN_ATTR_RESAMPLE_STRIDES", + "CUDNN_ATTR_RESAMPLE_SPATIAL_DIMS", + "CUDNN_ATTR_RESAMPLE_PRE_PADDINGS", + "CUDNN_ATTR_RESAMPLE_POST_PADDINGS", + "CUDNN_ATTR_RESAMPLE_PADDING_MODE", + "CUDNN_ATTR_RESAMPLE_NAN_PROPAGATION", + "CUDNN_ATTR_RESAMPLE_MODE", + "CUDNN_ATTR_RESAMPLE_COMP_TYPE", + "CUDNN_ATTR_REDUCTION_OPERATOR", + "CUDNN_ATTR_REDUCTION_COMP_TYPE", + "CUDNN_ATTR_POINTWISE_SWISH_BETA", + "CUDNN_ATTR_POINTWISE_SOFTPLUS_BETA", + "CUDNN_ATTR_POINTWISE_RELU_UPPER_CLIP", + "CUDNN_ATTR_POINTWISE_RELU_LOWER_CLIP_SLOPE", + "CUDNN_ATTR_POINTWISE_RELU_LOWER_CLIP", + "CUDNN_ATTR_POINTWISE_NAN_PROPAGATION", + "CUDNN_ATTR_POINTWISE_MODE", + "CUDNN_ATTR_POINTWISE_MATH_PREC", + "CUDNN_ATTR_POINTWISE_ELU_ALPHA", + "CUDNN_ATTR_POINTWISE_AXIS", + "CUDNN_ATTR_OPERATION_SIGNAL_YDESC", + "CUDNN_ATTR_OPERATION_SIGNAL_XDESC", + "CUDNN_ATTR_OPERATION_SIGNAL_VALUE", + "CUDNN_ATTR_OPERATION_SIGNAL_MODE", + "CUDNN_ATTR_OPERATION_SIGNAL_FLAGDESC", + "CUDNN_ATTR_OPERATION_RNG_YDESC", + "CUDNN_ATTR_OPERATION_RNG_SEED", + "CUDNN_ATTR_OPERATION_RNG_OFFSET_DESC", + "CUDNN_ATTR_OPERATION_RNG_DESC", + "CUDNN_ATTR_OPERATION_RESHAPE_YDESC", + "CUDNN_ATTR_OPERATION_RESHAPE_XDESC", + "CUDNN_ATTR_OPERATION_RESAMPLE_FWD_YDESC", + "CUDNN_ATTR_OPERATION_RESAMPLE_FWD_XDESC", + "CUDNN_ATTR_OPERATION_RESAMPLE_FWD_IDXDESC", + "CUDNN_ATTR_OPERATION_RESAMPLE_FWD_DESC", + "CUDNN_ATTR_OPERATION_RESAMPLE_FWD_BETA", + "CUDNN_ATTR_OPERATION_RESAMPLE_FWD_ALPHA", + "CUDNN_ATTR_OPERATION_RESAMPLE_BWD_YDESC", + "CUDNN_ATTR_OPERATION_RESAMPLE_BWD_XDESC", + "CUDNN_ATTR_OPERATION_RESAMPLE_BWD_IDXDESC", + "CUDNN_ATTR_OPERATION_RESAMPLE_BWD_DYDESC", + "CUDNN_ATTR_OPERATION_RESAMPLE_BWD_DXDESC", + "CUDNN_ATTR_OPERATION_RESAMPLE_BWD_DESC", + "CUDNN_ATTR_OPERATION_RESAMPLE_BWD_BETA", + "CUDNN_ATTR_OPERATION_RESAMPLE_BWD_ALPHA", + "CUDNN_ATTR_OPERATION_REDUCTION_YDESC", + "CUDNN_ATTR_OPERATION_REDUCTION_XDESC", + "CUDNN_ATTR_OPERATION_REDUCTION_DESC", + "CUDNN_ATTR_OPERATION_POINTWISE_YDESC", + "CUDNN_ATTR_OPERATION_POINTWISE_XDESC", + "CUDNN_ATTR_OPERATION_POINTWISE_TDESC", + "CUDNN_ATTR_OPERATION_POINTWISE_PW_DESCRIPTOR", + "CUDNN_ATTR_OPERATION_POINTWISE_DYDESC", + "CUDNN_ATTR_OPERATION_POINTWISE_DXDESC", + "CUDNN_ATTR_OPERATION_POINTWISE_BDESC", + "CUDNN_ATTR_OPERATION_POINTWISE_ALPHA2", + "CUDNN_ATTR_OPERATION_POINTWISE_ALPHA1", + "CUDNN_ATTR_OPERATION_PAGED_CACHE_LOAD_YDESC", + "CUDNN_ATTR_OPERATION_PAGED_CACHE_LOAD_SEQUENCE_DESC", + "CUDNN_ATTR_OPERATION_PAGED_CACHE_LOAD_PAGE_TABLE_DESC", + "CUDNN_ATTR_OPERATION_PAGED_CACHE_LOAD_CONTAINER_DESC", + "CUDNN_ATTR_OPERATION_NORM_FWD_YDESC", + "CUDNN_ATTR_OPERATION_NORM_FWD_XDESC", + "CUDNN_ATTR_OPERATION_NORM_FWD_SCALE_DESC", + "CUDNN_ATTR_OPERATION_NORM_FWD_PHASE", + "CUDNN_ATTR_OPERATION_NORM_FWD_PEER_STAT_DESCS", + "CUDNN_ATTR_OPERATION_NORM_FWD_OUTPUT_RUNNING_VAR_DESC", + "CUDNN_ATTR_OPERATION_NORM_FWD_OUTPUT_RUNNING_MEAN_DESC", + "CUDNN_ATTR_OPERATION_NORM_FWD_MODE", + "CUDNN_ATTR_OPERATION_NORM_FWD_MEAN_DESC", + "CUDNN_ATTR_OPERATION_NORM_FWD_INV_VARIANCE_DESC", + "CUDNN_ATTR_OPERATION_NORM_FWD_INPUT_RUNNING_VAR_DESC", + "CUDNN_ATTR_OPERATION_NORM_FWD_INPUT_RUNNING_MEAN_DESC", + "CUDNN_ATTR_OPERATION_NORM_FWD_EXP_AVG_FACTOR_DESC", + "CUDNN_ATTR_OPERATION_NORM_FWD_EPSILON_DESC", + "CUDNN_ATTR_OPERATION_NORM_FWD_BIAS_DESC", + "CUDNN_ATTR_OPERATION_NORM_BWD_XDESC", + "CUDNN_ATTR_OPERATION_NORM_BWD_SCALE_DESC", + "CUDNN_ATTR_OPERATION_NORM_BWD_PEER_STAT_DESCS", + "CUDNN_ATTR_OPERATION_NORM_BWD_MODE", + "CUDNN_ATTR_OPERATION_NORM_BWD_MEAN_DESC", + "CUDNN_ATTR_OPERATION_NORM_BWD_INV_VARIANCE_DESC", + "CUDNN_ATTR_OPERATION_NORM_BWD_EPSILON_DESC", + "CUDNN_ATTR_OPERATION_NORM_BWD_DYDESC", + "CUDNN_ATTR_OPERATION_NORM_BWD_DXDESC", + "CUDNN_ATTR_OPERATION_NORM_BWD_DSCALE_DESC", + "CUDNN_ATTR_OPERATION_NORM_BWD_DBIAS_DESC", + "CUDNN_ATTR_OPERATION_MATMUL_IRREGULARLY_STRIDED_BATCH_COUNT", + "CUDNN_ATTR_OPERATION_MATMUL_GEMM_N_OVERRIDE_DESC", + "CUDNN_ATTR_OPERATION_MATMUL_GEMM_M_OVERRIDE_DESC", + "CUDNN_ATTR_OPERATION_MATMUL_GEMM_K_OVERRIDE_DESC", + "CUDNN_ATTR_OPERATION_MATMUL_DESC", + "CUDNN_ATTR_OPERATION_MATMUL_CDESC", + "CUDNN_ATTR_OPERATION_MATMUL_BDESC", + "CUDNN_ATTR_OPERATION_MATMUL_ADESC", + "CUDNN_ATTR_OPERATION_GENSTATS_XDESC", + "CUDNN_ATTR_OPERATION_GENSTATS_SUMDESC", + "CUDNN_ATTR_OPERATION_GENSTATS_SQSUMDESC", + "CUDNN_ATTR_OPERATION_GENSTATS_MODE", + "CUDNN_ATTR_OPERATION_GENSTATS_MATH_PREC", + "CUDNN_ATTR_OPERATION_CONVOLUTION_FORWARD_Y", + "CUDNN_ATTR_OPERATION_CONVOLUTION_FORWARD_X", + "CUDNN_ATTR_OPERATION_CONVOLUTION_FORWARD_W", + "CUDNN_ATTR_OPERATION_CONVOLUTION_FORWARD_CONV_DESC", + "CUDNN_ATTR_OPERATION_CONVOLUTION_FORWARD_BETA", + "CUDNN_ATTR_OPERATION_CONVOLUTION_FORWARD_ALPHA", + "CUDNN_ATTR_OPERATION_CONVOLUTION_BWD_FILTER_X", + "CUDNN_ATTR_OPERATION_CONVOLUTION_BWD_FILTER_DY", + "CUDNN_ATTR_OPERATION_CONVOLUTION_BWD_FILTER_DW", + "CUDNN_ATTR_OPERATION_CONVOLUTION_BWD_FILTER_CONV_DESC", + "CUDNN_ATTR_OPERATION_CONVOLUTION_BWD_FILTER_BETA", + "CUDNN_ATTR_OPERATION_CONVOLUTION_BWD_FILTER_ALPHA", + "CUDNN_ATTR_OPERATION_CONVOLUTION_BWD_DATA_W", + "CUDNN_ATTR_OPERATION_CONVOLUTION_BWD_DATA_DY", + "CUDNN_ATTR_OPERATION_CONVOLUTION_BWD_DATA_DX", + "CUDNN_ATTR_OPERATION_CONVOLUTION_BWD_DATA_CONV_DESC", + "CUDNN_ATTR_OPERATION_CONVOLUTION_BWD_DATA_BETA", + "CUDNN_ATTR_OPERATION_CONVOLUTION_BWD_DATA_ALPHA", + "CUDNN_ATTR_OPERATION_CONCAT_OUTPUT_DESC", + "CUDNN_ATTR_OPERATION_CONCAT_INPUT_DESCS", + "CUDNN_ATTR_OPERATION_CONCAT_INPLACE_INDEX", + "CUDNN_ATTR_OPERATION_CONCAT_AXIS", + "CUDNN_ATTR_OPERATION_BN_FINALIZE_Y_SUM_DESC", + "CUDNN_ATTR_OPERATION_BN_FINALIZE_Y_SQ_SUM_DESC", + "CUDNN_ATTR_OPERATION_BN_FINALIZE_UPDATED_RUNNING_VAR_DESC", + "CUDNN_ATTR_OPERATION_BN_FINALIZE_UPDATED_RUNNING_MEAN_DESC", + "CUDNN_ATTR_OPERATION_BN_FINALIZE_STATS_MODE", + "CUDNN_ATTR_OPERATION_BN_FINALIZE_SCALE_DESC", + "CUDNN_ATTR_OPERATION_BN_FINALIZE_SAVED_MEAN_DESC", + "CUDNN_ATTR_OPERATION_BN_FINALIZE_SAVED_INV_STD_DESC", + "CUDNN_ATTR_OPERATION_BN_FINALIZE_PREV_RUNNING_VAR_DESC", + "CUDNN_ATTR_OPERATION_BN_FINALIZE_PREV_RUNNING_MEAN_DESC", + "CUDNN_ATTR_OPERATION_BN_FINALIZE_MATH_PREC", + "CUDNN_ATTR_OPERATION_BN_FINALIZE_EXP_AVERATE_FACTOR_DESC", + "CUDNN_ATTR_OPERATION_BN_FINALIZE_EQ_SCALE_DESC", + "CUDNN_ATTR_OPERATION_BN_FINALIZE_EQ_BIAS_DESC", + "CUDNN_ATTR_OPERATION_BN_FINALIZE_EPSILON_DESC", + "CUDNN_ATTR_OPERATION_BN_FINALIZE_BIAS_DESC", + "CUDNN_ATTR_OPERATION_BN_FINALIZE_ACCUM_COUNT_DESC", + "CUDNN_ATTR_OPERATION_BN_BWD_WEIGHTS_X_DESC", + "CUDNN_ATTR_OPERATION_BN_BWD_WEIGHTS_MEAN_DESC", + "CUDNN_ATTR_OPERATION_BN_BWD_WEIGHTS_MATH_PREC", + "CUDNN_ATTR_OPERATION_BN_BWD_WEIGHTS_INVSTD_DESC", + "CUDNN_ATTR_OPERATION_BN_BWD_WEIGHTS_EQ_X_SCALE_DESC", + "CUDNN_ATTR_OPERATION_BN_BWD_WEIGHTS_EQ_DY_SCALE_DESC", + "CUDNN_ATTR_OPERATION_BN_BWD_WEIGHTS_EQ_BIAS", + "CUDNN_ATTR_OPERATION_BN_BWD_WEIGHTS_DY_DESC", + "CUDNN_ATTR_OPERATION_BN_BWD_WEIGHTS_DBN_SCALE_DESC", + "CUDNN_ATTR_OPERATION_BN_BWD_WEIGHTS_DBN_BIAS_DESC", + "CUDNN_ATTR_OPERATION_BN_BWD_WEIGHTS_BN_SCALE_DESC", + "CUDNN_ATTR_OPERATIONGRAPH_OPS", + "CUDNN_ATTR_OPERATIONGRAPH_IS_DYNAMIC_SHAPE_ENABLED", + "CUDNN_ATTR_OPERATIONGRAPH_HANDLE", + "CUDNN_ATTR_OPERATIONGRAPH_ENGINE_GLOBAL_COUNT", + "CUDNN_ATTR_MATMUL_PADDING_VALUE", + "CUDNN_ATTR_MATMUL_COMP_TYPE", + "CUDNN_ATTR_LAYOUT_INFO_TYPES", + "CUDNN_ATTR_LAYOUT_INFO_TENSOR_UID", + "CUDNN_ATTR_KNOB_INFO_TYPE", + "CUDNN_ATTR_KNOB_INFO_STRIDE", + "CUDNN_ATTR_KNOB_INFO_MINIMUM_VALUE", + "CUDNN_ATTR_KNOB_INFO_MAXIMUM_VALUE", + "CUDNN_ATTR_KNOB_CHOICE_KNOB_VALUE", + "CUDNN_ATTR_KNOB_CHOICE_KNOB_TYPE", + "CUDNN_ATTR_KERNEL_CACHE_OPERATION_GRAPH", + "CUDNN_ATTR_KERNEL_CACHE_IS_ENGINECFG_KERNEL_CACHED", + "CUDNN_ATTR_INTERMEDIATE_INFO_UNIQUE_ID", + "CUDNN_ATTR_INTERMEDIATE_INFO_SIZE", + "CUDNN_ATTR_INTERMEDIATE_INFO_DEPENDENT_DATA_UIDS", + "CUDNN_ATTR_INTERMEDIATE_INFO_DEPENDENT_ATTRIBUTES", + "CUDNN_ATTR_EXECUTION_PLAN_WORKSPACE_SIZE", + "CUDNN_ATTR_EXECUTION_PLAN_RUN_ONLY_INTERMEDIATE_UIDS", + "CUDNN_ATTR_EXECUTION_PLAN_KERNEL_CACHE", + "CUDNN_ATTR_EXECUTION_PLAN_JSON_REPRESENTATION", + "CUDNN_ATTR_EXECUTION_PLAN_HANDLE", + "CUDNN_ATTR_EXECUTION_PLAN_ENGINE_CONFIG", + "CUDNN_ATTR_EXECUTION_PLAN_COMPUTED_INTERMEDIATE_UIDS", + "CUDNN_ATTR_ENGINE_SM_COUNT_TARGET", + "CUDNN_ATTR_ENGINE_OPERATION_GRAPH", + "CUDNN_ATTR_ENGINE_NUMERICAL_NOTE", + "CUDNN_ATTR_ENGINE_LAYOUT_INFO", + "CUDNN_ATTR_ENGINE_KNOB_INFO", + "CUDNN_ATTR_ENGINE_GLOBAL_INDEX", + "CUDNN_ATTR_ENGINE_BEHAVIOR_NOTE", + "CUDNN_ATTR_ENGINEHEUR_SM_COUNT_TARGET", + "CUDNN_ATTR_ENGINEHEUR_RESULTS", + "CUDNN_ATTR_ENGINEHEUR_OPERATION_GRAPH", + "CUDNN_ATTR_ENGINEHEUR_MODE", + "CUDNN_ATTR_ENGINECFG_WORKSPACE_SIZE", + "CUDNN_ATTR_ENGINECFG_SHARED_MEMORY_USED", + "CUDNN_ATTR_ENGINECFG_KNOB_CHOICES", + "CUDNN_ATTR_ENGINECFG_INTERMEDIATE_INFO", + "CUDNN_ATTR_ENGINECFG_ENGINE", + "CUDNN_ATTR_CONVOLUTION_SPATIAL_DIMS", + "CUDNN_ATTR_CONVOLUTION_PRE_PADDINGS", + "CUDNN_ATTR_CONVOLUTION_POST_PADDINGS", + "CUDNN_ATTR_CONVOLUTION_FILTER_STRIDES", + "CUDNN_ATTR_CONVOLUTION_DILATIONS", + "CUDNN_ATTR_CONVOLUTION_CONV_MODE", + "CUDNN_ATTR_CONVOLUTION_COMP_TYPE", + "CUDNN_ATTN_WKIND_COUNT", + "CUDNN_ATTN_QUERYMAP_ONE_TO_ONE", + "CUDNN_ATTN_QUERYMAP_ALL_TO_ONE", + "CUDNN_ATTN_ENABLE_PROJ_BIASES", + "CUDNN_ATTN_DISABLE_PROJ_BIASES", "CUDA_R_8F_E5M2", "CUDA_R_8F_E4M3", "CUDA_R_64U", @@ -12695,6 +12695,513 @@ sub warnRocOnlyUnsupportedFunctions { my $line_num = shift; my $k = 0; foreach $func ( + "cusparseZhybsv_solve", + "cusparseZhybsv_analysis", + "cusparseZhyb2dense", + "cusparseZhyb2csr", + "cusparseZhyb2csc", + "cusparseZgtsv_nopivot", + "cusparseZgtsvStridedBatch", + "cusparseZgtsv", + "cusparseZgemmi", + "cusparseZgebsr2gebsr_bufferSizeExt", + "cusparseZgebsr2gebsc_bufferSizeExt", + "cusparseZdense2hyb", + "cusparseZcsru2csr_bufferSizeExt", + "cusparseZcsru2csr", + "cusparseZcsrsv_solve", + "cusparseZcsrsv_analysis", + "cusparseZcsrsm_solve", + "cusparseZcsrsm_analysis", + "cusparseZcsrmv_mp", + "cusparseZcsrilu0", + "cusparseZcsric0", + "cusparseZcsrgemm", + "cusparseZcsrgeam2_bufferSizeExt", + "cusparseZcsr2gebsr_bufferSizeExt", + "cusparseZcsr2csru", + "cusparseZcsr2csc", + "cusparseZcsc2hyb", + "cusparseZbsrsm2_bufferSizeExt", + "cusparseZbsrilu02_bufferSizeExt", + "cusparseZbsric02_bufferSizeExt", + "cusparseXgebsr2csr", + "cusparseXcsrgemmNnz", + "cusparseSpSV_updateMatrix", + "cusparseSpSV_solve", + "cusparseSpSV_destroyDescr", + "cusparseSpSV_createDescr", + "cusparseSpSV_analysis", + "cusparseSpSVUpdate_t", + "cusparseSpSVDescr_t", + "cusparseSpSVDescr", + "cusparseSpSM_updateMatrix", + "cusparseSpSM_destroyDescr", + "cusparseSpSM_createDescr", + "cusparseSpSM_bufferSize", + "cusparseSpSMUpdate_t", + "cusparseSpSMDescr_t", + "cusparseSpSMDescr", + "cusparseSpMatSetNumBatches", + "cusparseSpMatGetNumBatches", + "cusparseSpMV_preprocess", + "cusparseSpMMOp_destroyPlan", + "cusparseSpMMOp_createPlan", + "cusparseSpMMOpPlan_t", + "cusparseSpMMOpPlan", + "cusparseSpMMOpAlg_t", + "cusparseSpMMOp", + "cusparseSpGEMMreuse_workEstimation", + "cusparseSpGEMMreuse_nnz", + "cusparseSpGEMMreuse_copy", + "cusparseSpGEMMreuse_compute", + "cusparseSpGEMM_workEstimation", + "cusparseSpGEMM_getNumProducts", + "cusparseSpGEMM_estimateMemory", + "cusparseSpGEMM_destroyDescr", + "cusparseSpGEMM_createDescr", + "cusparseSpGEMM_copy", + "cusparseSpGEMM_compute", + "cusparseSpGEMMDescr_t", + "cusparseSpGEMMDescr", + "cusparseSolveAnalysisInfo_t", + "cusparseSolveAnalysisInfo", + "cusparseSideMode_t", + "cusparseShybsv_solve", + "cusparseShybsv_analysis", + "cusparseShyb2dense", + "cusparseShyb2csr", + "cusparseShyb2csc", + "cusparseSgtsv_nopivot", + "cusparseSgtsvStridedBatch", + "cusparseSgtsv", + "cusparseSgemmi", + "cusparseSgebsr2gebsr_bufferSizeExt", + "cusparseSgebsr2gebsc_bufferSizeExt", + "cusparseSdense2hyb", + "cusparseScsru2csr_bufferSizeExt", + "cusparseScsru2csr", + "cusparseScsrsv_solve", + "cusparseScsrsv_analysis", + "cusparseScsrsm_solve", + "cusparseScsrsm_analysis", + "cusparseScsrmv_mp", + "cusparseScsrilu0", + "cusparseScsric0", + "cusparseScsrgemm", + "cusparseScsrgeam2_bufferSizeExt", + "cusparseScsr2gebsr_bufferSizeExt", + "cusparseScsr2csru", + "cusparseScsr2csc", + "cusparseScsc2hyb", + "cusparseSbsrsm2_bufferSizeExt", + "cusparseSbsrilu02_bufferSizeExt", + "cusparseSbsric02_bufferSizeExt", + "cusparseLoggerSetMask", + "cusparseLoggerSetLevel", + "cusparseLoggerSetFile", + "cusparseLoggerSetCallback", + "cusparseLoggerOpenFile", + "cusparseLoggerForceDisable", + "cusparseLoggerCallback_t", + "cusparseHpruneDense2csr_bufferSizeExt", + "cusparseHpruneDense2csrNnzByPercentage", + "cusparseHpruneDense2csrNnz", + "cusparseHpruneDense2csrByPercentage_bufferSizeExt", + "cusparseHpruneDense2csrByPercentage", + "cusparseHpruneDense2csr", + "cusparseHpruneCsr2csr_bufferSizeExt", + "cusparseHpruneCsr2csrNnzByPercentage", + "cusparseHpruneCsr2csrNnz", + "cusparseHpruneCsr2csrByPercentage_bufferSizeExt", + "cusparseHpruneCsr2csrByPercentage", + "cusparseHpruneCsr2csr", + "cusparseGetLevelInfo", + "cusparseDhybsv_solve", + "cusparseDhybsv_analysis", + "cusparseDhyb2dense", + "cusparseDhyb2csr", + "cusparseDhyb2csc", + "cusparseDgtsv_nopivot", + "cusparseDgtsvStridedBatch", + "cusparseDgtsv", + "cusparseDgemmi", + "cusparseDgebsr2gebsr_bufferSizeExt", + "cusparseDgebsr2gebsc_bufferSizeExt", + "cusparseDestroySolveAnalysisInfo", + "cusparseDestroyCsru2csrInfo", + "cusparseDenseToSparse_convert", + "cusparseDdense2hyb", + "cusparseDcsru2csr_bufferSizeExt", + "cusparseDcsru2csr", + "cusparseDcsrsv_solve", + "cusparseDcsrsv_analysis", + "cusparseDcsrsm_solve", + "cusparseDcsrsm_analysis", + "cusparseDcsrmv_mp", + "cusparseDcsrilu0", + "cusparseDcsric0", + "cusparseDcsrgemm", + "cusparseDcsrgeam2_bufferSizeExt", + "cusparseDcsr2gebsr_bufferSizeExt", + "cusparseDcsr2csru", + "cusparseDcsr2csc", + "cusparseDcsc2hyb", + "cusparseDbsrsm2_bufferSizeExt", + "cusparseDbsrilu02_bufferSizeExt", + "cusparseDbsric02_bufferSizeExt", + "cusparseCsrsv_solveEx", + "cusparseCsrsv_analysisEx", + "cusparseCsrmvEx_bufferSize", + "cusparseCsrmvEx", + "cusparseCsrilu0Ex", + "cusparseCsr2cscEx2", + "cusparseCsr2cscEx", + "cusparseCsr2CscAlg_t", + "cusparseCreateSolveAnalysisInfo", + "cusparseCreateSlicedEll", + "cusparseCreateCsru2csrInfo", + "cusparseCreateConstSlicedEll", + "cusparseCreateConstBsr", + "cusparseCreateBsr", + "cusparseConstrainedGeMM_bufferSize", + "cusparseConstrainedGeMM", + "cusparseColorAlg_t", + "cusparseChybsv_solve", + "cusparseChybsv_analysis", + "cusparseChyb2dense", + "cusparseChyb2csr", + "cusparseChyb2csc", + "cusparseCgtsv_nopivot", + "cusparseCgtsvStridedBatch", + "cusparseCgtsv", + "cusparseCgemmi", + "cusparseCgebsr2gebsr_bufferSizeExt", + "cusparseCgebsr2gebsc_bufferSizeExt", + "cusparseCdense2hyb", + "cusparseCcsru2csr_bufferSizeExt", + "cusparseCcsru2csr", + "cusparseCcsrsv_solve", + "cusparseCcsrsv_analysis", + "cusparseCcsrsm_solve", + "cusparseCcsrsm_analysis", + "cusparseCcsrmv_mp", + "cusparseCcsrilu0", + "cusparseCcsric0", + "cusparseCcsrgemm", + "cusparseCcsrgeam2_bufferSizeExt", + "cusparseCcsr2gebsr_bufferSizeExt", + "cusparseCcsr2csru", + "cusparseCcsr2csc", + "cusparseCcsc2hyb", + "cusparseCbsrsm2_bufferSizeExt", + "cusparseCbsrilu02_bufferSizeExt", + "cusparseCbsric02_bufferSizeExt", + "cusparseBsrSetStridedBatch", + "cusparseAlgMode_t", + "curand_mtgp32_specific", + "curand_mtgp32_single_specific", + "curand_mtgp32_single", + "curand_Philox4x32_10", + "curandState_t", + "curandStateXORWOW_t", + "curandStateXORWOW", + "curandState", + "curandMethod_t", + "curandMethod", + "curandHistogramM2_t", + "curandHistogramM2_st", + "curandHistogramM2V_t", + "curandHistogramM2V_st", + "curandHistogramM2K_t", + "curandHistogramM2K_st", + "curandGetProperty", + "curandDistribution_t", + "curandDistribution_st", + "curandDistributionShift_t", + "curandDistributionShift_st", + "curandDistributionM2Shift_t", + "curandDistributionM2Shift_st", + "curandDirectionVectors64_t", + "curandDirectionVectors32_t", + "cudnnWgradMode_t", + "cudnnTransformTensorEx", + "cudnnTransformFilter", + "cudnnTensorTransformStruct", + "cudnnTensorTransformDescriptor_t", + "cudnnTensorStruct", + "cudnnSpatialTransformerStruct", + "cudnnSpatialTransformerDescriptor_t", + "cudnnSpatialTfSamplerForward", + "cudnnSpatialTfSamplerBackward", + "cudnnSpatialTfGridGeneratorForward", + "cudnnSpatialTfGridGeneratorBackward", + "cudnnSignalMode_t", + "cudnnSeverity_t", + "cudnnSetTensorTransformDescriptor", + "cudnnSetTensorNdDescriptorEx", + "cudnnSetTensorNdDescriptor", + "cudnnSetTensor4dDescriptor", + "cudnnSetSpatialTransformerNdDescriptor", + "cudnnSetSeqDataDescriptor", + "cudnnSetRNNProjectionLayers", + "cudnnSetRNNPaddingMode", + "cudnnSetRNNMatrixMathType", + "cudnnSetRNNDescriptor_v8", + "cudnnSetRNNDescriptor_v5", + "cudnnSetRNNDescriptor", + "cudnnSetRNNDataDescriptor", + "cudnnSetRNNBiasMode", + "cudnnSetRNNAlgorithmDescriptor", + "cudnnSetPersistentRNNPlan", + "cudnnSetOpTensorDescriptor", + "cudnnSetFusedOpsVariantParamPackAttribute", + "cudnnSetFusedOpsConstParamPackAttribute", + "cudnnSetFilterNdDescriptor", + "cudnnSetFilter4dDescriptor", + "cudnnSetConvolutionReorderType", + "cudnnSetConvolutionNdDescriptor", + "cudnnSetConvolutionMathType", + "cudnnSetConvolution2dDescriptor", + "cudnnSetCallback", + "cudnnSetCTCLossDescriptor_v9", + "cudnnSetCTCLossDescriptor_v8", + "cudnnSetCTCLossDescriptorEx", + "cudnnSetAttnDescriptor", + "cudnnSetAlgorithmPerformance", + "cudnnSetAlgorithmDescriptor", + "cudnnSetActivationDescriptorSwishBeta", + "cudnnSetActivationDescriptor", + "cudnnSeqDataStruct", + "cudnnSeqDataDescriptor_t", + "cudnnSeqDataAxis_t", + "cudnnSaveAlgorithm", + "cudnnSamplerType_t", + "cudnnRuntimeTag_t", + "cudnnRestoreAlgorithm", + "cudnnResampleMode_t", + "cudnnReorderType_t", + "cudnnReorderFilterAndBias", + "cudnnReduceTensorStruct", + "cudnnRNNStruct", + "cudnnRNNSetClip_v9", + "cudnnRNNSetClip_v8", + "cudnnRNNSetClip", + "cudnnRNNGetClip_v9", + "cudnnRNNGetClip_v8", + "cudnnRNNGetClip", + "cudnnRNNForwardTrainingEx", + "cudnnRNNForwardInferenceEx", + "cudnnRNNForward", + "cudnnRNNDataStruct", + "cudnnRNNDataLayout_t", + "cudnnRNNDataDescriptor_t", + "cudnnRNNClipMode_t", + "cudnnRNNBackwardWeights_v8", + "cudnnRNNBackwardWeightsEx", + "cudnnRNNBackwardData_v8", + "cudnnRNNBackwardDataEx", + "cudnnQueryRuntimeError", + "cudnnPoolingStruct", + "cudnnPoolingForward", + "cudnnPoolingBackward", + "cudnnPersistentRNNPlan_t", + "cudnnPersistentRNNPlan", + "cudnnOpsVersionCheck", + "cudnnOpsTrainVersionCheck", + "cudnnOpsInferVersionCheck", + "cudnnOpTensorStruct", + "cudnnOpTensorDescriptor_t", + "cudnnOpTensor", + "cudnnNormalizationForwardTraining", + "cudnnNormalizationForwardInference", + "cudnnNormalizationBackward", + "cudnnNormOps_t", + "cudnnNormMode_t", + "cudnnNormAlgo_t", + "cudnnMultiHeadAttnWeightKind_t", + "cudnnMultiHeadAttnForward", + "cudnnMultiHeadAttnBackwardWeights", + "cudnnMultiHeadAttnBackwardData", + "cudnnMathType_t", + "cudnnMakeFusedOpsPlan", + "cudnnLossNormalizationMode_t", + "cudnnLRNStruct", + "cudnnLRNCrossChannelForward", + "cudnnLRNCrossChannelBackward", + "cudnnInitTransformDest", + "cudnnIm2Col", + "cudnnGraphVersionCheck", + "cudnnGetVersion", + "cudnnGetTensorTransformDescriptor", + "cudnnGetTensorSizeInBytes", + "cudnnGetTensorNdDescriptor", + "cudnnGetSeqDataDescriptor", + "cudnnGetRNNWeightSpaceSize", + "cudnnGetRNNWeightParams", + "cudnnGetRNNTempSpaceSizes", + "cudnnGetRNNProjectionLayers", + "cudnnGetRNNPaddingMode", + "cudnnGetRNNMatrixMathType", + "cudnnGetRNNLinLayerMatrixParams", + "cudnnGetRNNLinLayerBiasParams", + "cudnnGetRNNForwardTrainingAlgorithmMaxCount", + "cudnnGetRNNForwardInferenceAlgorithmMaxCount", + "cudnnGetRNNDescriptor_v8", + "cudnnGetRNNDataDescriptor", + "cudnnGetRNNBiasMode", + "cudnnGetRNNBackwardWeightsAlgorithmMaxCount", + "cudnnGetRNNBackwardDataAlgorithmMaxCount", + "cudnnGetProperty", + "cudnnGetOpTensorDescriptor", + "cudnnGetNormalizationTrainingReserveSpaceSize", + "cudnnGetNormalizationForwardTrainingWorkspaceSize", + "cudnnGetNormalizationBackwardWorkspaceSize", + "cudnnGetMultiHeadAttnWeights", + "cudnnGetMultiHeadAttnBuffers", + "cudnnGetMaxDeviceVersion", + "cudnnGetLastErrorString", + "cudnnGetFusedOpsVariantParamPackAttribute", + "cudnnGetFusedOpsConstParamPackAttribute", + "cudnnGetFoldedConvBackwardDataDescriptors", + "cudnnGetFilterSizeInBytes", + "cudnnGetFilterNdDescriptor", + "cudnnGetFilter4dDescriptor", + "cudnnGetCudartVersion", + "cudnnGetConvolutionReorderType", + "cudnnGetConvolutionNdForwardOutputDim", + "cudnnGetConvolutionNdDescriptor", + "cudnnGetConvolutionMathType", + "cudnnGetConvolutionGroupCount", + "cudnnGetConvolutionForwardAlgorithm_v7", + "cudnnGetConvolutionForwardAlgorithmMaxCount", + "cudnnGetConvolutionForwardAlgorithm", + "cudnnGetConvolutionBackwardFilterWorkspaceSize", + "cudnnGetConvolutionBackwardFilterAlgorithm_v7", + "cudnnGetConvolutionBackwardFilterAlgorithmMaxCount", + "cudnnGetConvolutionBackwardFilterAlgorithm", + "cudnnGetConvolutionBackwardDataAlgorithm_v7", + "cudnnGetConvolutionBackwardDataAlgorithmMaxCount", + "cudnnGetConvolutionBackwardDataAlgorithm", + "cudnnGetConvolution2dDescriptor", + "cudnnGetCallback", + "cudnnGetCTCLossWorkspaceSize_v8", + "cudnnGetCTCLossDescriptor_v9", + "cudnnGetCTCLossDescriptor_v8", + "cudnnGetCTCLossDescriptorEx", + "cudnnGetBatchNormalizationTrainingExReserveSpaceSize", + "cudnnGetBatchNormalizationForwardTrainingExWorkspaceSize", + "cudnnGetBatchNormalizationBackwardExWorkspaceSize", + "cudnnGetAttnDescriptor", + "cudnnGetAlgorithmSpaceSize", + "cudnnGetAlgorithmPerformance", + "cudnnGetAlgorithmDescriptor", + "cudnnGetActivationDescriptorSwishBeta", + "cudnnGetActivationDescriptor", + "cudnnGenStatsMode_t", + "cudnnFusedOps_t", + "cudnnFusedOpsVariantParamStruct", + "cudnnFusedOpsVariantParamPack_t", + "cudnnFusedOpsVariantParamLabel_t", + "cudnnFusedOpsPointerPlaceHolder_t", + "cudnnFusedOpsPlan_t", + "cudnnFusedOpsPlanStruct", + "cudnnFusedOpsExecute", + "cudnnFusedOpsConstParamStruct", + "cudnnFusedOpsConstParamPack_t", + "cudnnFusedOpsConstParamLabel_t", + "cudnnFraction_t", + "cudnnFractionStruct", + "cudnnFoldingDirection_t", + "cudnnFindRNNForwardTrainingAlgorithmEx", + "cudnnFindRNNForwardInferenceAlgorithmEx", + "cudnnFindRNNBackwardWeightsAlgorithmEx", + "cudnnFindRNNBackwardDataAlgorithmEx", + "cudnnFindConvolutionForwardAlgorithm", + "cudnnFindConvolutionBackwardFilterAlgorithmEx", + "cudnnFindConvolutionBackwardFilterAlgorithm", + "cudnnFindConvolutionBackwardDataAlgorithmEx", + "cudnnFindConvolutionBackwardDataAlgorithm", + "cudnnFilterStruct", + "cudnnErrQueryMode_t", + "cudnnDropoutStruct", + "cudnnDivisiveNormalizationForward", + "cudnnDivisiveNormalizationBackward", + "cudnnDivNormMode_t", + "cudnnDeterminism_t", + "cudnnDestroyTensorTransformDescriptor", + "cudnnDestroySpatialTransformerDescriptor", + "cudnnDestroySeqDataDescriptor", + "cudnnDestroyRNNDataDescriptor", + "cudnnDestroyPersistentRNNPlan", + "cudnnDestroyOpTensorDescriptor", + "cudnnDestroyFusedOpsVariantParamPack", + "cudnnDestroyFusedOpsPlan", + "cudnnDestroyFusedOpsConstParamPack", + "cudnnDestroyFilterDescriptor", + "cudnnDestroyAttnDescriptor", + "cudnnDestroyAlgorithmPerformance", + "cudnnDestroyAlgorithmDescriptor", + "cudnnDeriveNormTensorDescriptor", + "cudnnDebug_t", + "cudnnDebugStruct", + "cudnnCreateTensorTransformDescriptor", + "cudnnCreateSpatialTransformerDescriptor", + "cudnnCreateSeqDataDescriptor", + "cudnnCreateRNNDataDescriptor", + "cudnnCreatePersistentRNNPlan", + "cudnnCreateOpTensorDescriptor", + "cudnnCreateFusedOpsVariantParamPack", + "cudnnCreateFusedOpsPlan", + "cudnnCreateFusedOpsConstParamPack", + "cudnnCreateFilterDescriptor", + "cudnnCreateAttnDescriptor", + "cudnnCreateAlgorithmPerformance", + "cudnnCreateAlgorithmDescriptor", + "cudnnCopyAlgorithmDescriptor", + "cudnnConvolutionStruct", + "cudnnConvolutionFwdPreference_t", + "cudnnConvolutionBwdFilterPreference_t", + "cudnnConvolutionBwdFilterAlgo_t", + "cudnnConvolutionBwdFilterAlgoPerf_t", + "cudnnConvolutionBwdFilterAlgoPerfStruct", + "cudnnConvolutionBwdDataPreference_t", + "cudnnConvolutionBackwardFilter", + "cudnnCnnTrainVersionCheck", + "cudnnCnnInferVersionCheck", + "cudnnCallback_t", + "cudnnCTCLoss_v8", + "cudnnCTCLossStruct", + "cudnnCTCGradMode_t", + "cudnnBuildRNNDynamic", + "cudnnBnFinalizeStatsMode_t", + "cudnnBatchNormalizationForwardTrainingEx", + "cudnnBatchNormalizationBackwardEx", + "cudnnBatchNormOps_t", + "cudnnBackendUpdateCudaGraph", + "cudnnBackendTensorReordering_t", + "cudnnBackendPopulateCudaGraph", + "cudnnBackendNumericalNote_t", + "cudnnBackendNormMode_t", + "cudnnBackendNormFwdPhase_t", + "cudnnBackendLayoutType_t", + "cudnnBackendKnobType_t", + "cudnnBackendInitialize", + "cudnnBackendBehaviorNote_t", + "cudnnAttnStruct", + "cudnnAttnQueryMap_t", + "cudnnAttnDescriptor_t", + "cudnnAlgorithm_t", + "cudnnAlgorithmUnionStruct", + "cudnnAlgorithmStruct", + "cudnnAlgorithmPerformance_t", + "cudnnAlgorithmPerformanceStruct", + "cudnnAlgorithmDescriptor_t", + "cudnnAdvVersionCheck", + "cudnnAdvTrainVersionCheck", + "cudnnAdvInferVersionCheck", + "cudnnAddTensor", + "cudnnActivationStruct", "cublasZtrttp", "cublasZtrmm_v2_64", "cublasZtrmm_64", @@ -12930,6 +13437,395 @@ sub warnRocOnlyUnsupportedFunctions { "cublasAsumEx_64", "cublasAsumEx", "cublasAlloc", + "csru2csrInfo_t", + "csru2csrInfo", + "__curand_umul", + "CUSPARSE_STATUS_MATRIX_TYPE_NOT_SUPPORTED", + "CUSPARSE_STATUS_MAPPING_ERROR", + "CUSPARSE_STATUS_INSUFFICIENT_RESOURCES", + "CUSPARSE_STATUS_EXECUTION_FAILED", + "CUSPARSE_SPSV_UPDATE_GENERAL", + "CUSPARSE_SPSV_UPDATE_DIAGONAL", + "CUSPARSE_SPSM_UPDATE_GENERAL", + "CUSPARSE_SPSM_UPDATE_DIAGONAL", + "CUSPARSE_SPMM_OP_ALG_DEFAULT", + "CUSPARSE_SPMM_COO_ALG4", + "CUSPARSE_SPMM_BSR_ALG1", + "CUSPARSE_SPMMA_PREPROCESS", + "CUSPARSE_SPMMA_ALG4", + "CUSPARSE_SPMMA_ALG3", + "CUSPARSE_SPMMA_ALG2", + "CUSPARSE_SPMMA_ALG1", + "CUSPARSE_SPGEMM_CSR_ALG_NONDETERMINITIC", + "CUSPARSE_SPGEMM_CSR_ALG_DETERMINITIC", + "CUSPARSE_SPGEMM_ALG3", + "CUSPARSE_SPGEMM_ALG2", + "CUSPARSE_SPGEMM_ALG1", + "CUSPARSE_SIDE_RIGHT", + "CUSPARSE_SIDE_LEFT", + "CUSPARSE_MV_ALG_DEFAULT", + "CUSPARSE_MM_ALG_DEFAULT", + "CUSPARSE_CSRMV_ALG2", + "CUSPARSE_CSRMV_ALG1", + "CUSPARSE_CSRMM_ALG1", + "CUSPARSE_CSR2CSC_ALG_DEFAULT", + "CUSPARSE_CSR2CSC_ALG2", + "CUSPARSE_CSR2CSC_ALG1", + "CUSPARSE_COOMV_ALG", + "CUSPARSE_COOMM_ALG3", + "CUSPARSE_COOMM_ALG2", + "CUSPARSE_COOMM_ALG1", + "CUSPARSE_COLOR_ALG1", + "CUSPARSE_COLOR_ALG0", + "CUSPARSE_ALG_NAIVE", + "CUSPARSE_ALG_MERGE_PATH", + "CUSPARSE_ALG1", + "CUSPARSE_ALG0", + "CURAND_STATUS_PREEXISTING_FAILURE", + "CURAND_STATUS_INITIALIZATION_FAILED", + "CURAND_STATUS_ARCH_MISMATCH", + "CURAND_RNG_TEST", + "CURAND_REJECTION", + "CURAND_POISSON", + "CURAND_M2", + "CURAND_M1", + "CURAND_KNUTH", + "CURAND_ITR", + "CURAND_HITR", + "CURAND_FAST_REJECTION", + "CURAND_DISCRETE_GAUSS", + "CURAND_DEVICE_API", + "CURAND_DEFINITION", + "CURAND_CHOOSE_BEST", + "CURAND_BINARY_SEARCH", + "CURAND_3RD", + "CUDNN_WGRAD_MODE_SET", + "CUDNN_WGRAD_MODE_ADD", + "CUDNN_TRANSFORM_UNFOLD", + "CUDNN_TRANSFORM_FOLD", + "CUDNN_TENSOR_REORDERING_NONE", + "CUDNN_TENSOR_REORDERING_INT8x32", + "CUDNN_TENSOR_REORDERING_F16x16", + "CUDNN_TENSOR_OP_MATH_ALLOW_CONVERSION", + "CUDNN_TENSOR_OP_MATH", + "CUDNN_TENSOR_NCHW_VECT_C", + "CUDNN_STATUS_SUBLIBRARY_VERSION_MISMATCH", + "CUDNN_STATUS_SUBLIBRARY_LOADING_FAILED", + "CUDNN_STATUS_SPECIFIC_ERROR", + "CUDNN_STATUS_SERIALIZATION_VERSION_MISMATCH", + "CUDNN_STATUS_RUNTIME_PREREQUISITE_MISSING", + "CUDNN_STATUS_RUNTIME_IN_PROGRESS", + "CUDNN_STATUS_RUNTIME_FP_OVERFLOW", + "CUDNN_STATUS_NOT_SUPPORTED_SUBLIBRARY_UNAVAILABLE", + "CUDNN_STATUS_NOT_SUPPORTED_SHARED_MEMORY_INSUFFICIENT", + "CUDNN_STATUS_NOT_SUPPORTED_SHAPE", + "CUDNN_STATUS_NOT_SUPPORTED_RUNTIME_PREREQUISITE_MISSING", + "CUDNN_STATUS_NOT_SUPPORTED_PADDING", + "CUDNN_STATUS_NOT_SUPPORTED_LAYOUT", + "CUDNN_STATUS_NOT_SUPPORTED_INCOMPATIBLE_CUDA_DRIVER", + "CUDNN_STATUS_NOT_SUPPORTED_INCOMPATIBLE_CUDART", + "CUDNN_STATUS_NOT_SUPPORTED_GRAPH_PATTERN", + "CUDNN_STATUS_NOT_SUPPORTED_DATA_TYPE", + "CUDNN_STATUS_NOT_SUPPORTED_CUDA_GRAPH_NATIVE_API", + "CUDNN_STATUS_NOT_SUPPORTED_BAD_LAUNCH_PARAM", + "CUDNN_STATUS_NOT_SUPPORTED_ARCH_MISMATCH", + "CUDNN_STATUS_MAPPING_ERROR", + "CUDNN_STATUS_LICENSE_ERROR", + "CUDNN_STATUS_INTERNAL_ERROR_UNEXPECTED_VALUE", + "CUDNN_STATUS_INTERNAL_ERROR_TEXTURE_CREATION_FAILED", + "CUDNN_STATUS_INTERNAL_ERROR_HOST_ALLOCATION_FAILED", + "CUDNN_STATUS_INTERNAL_ERROR_DEVICE_ALLOCATION_FAILED", + "CUDNN_STATUS_INTERNAL_ERROR_COMPILATION_FAILED", + "CUDNN_STATUS_INTERNAL_ERROR_BAD_LAUNCH_PARAM", + "CUDNN_STATUS_FULL_ERROR_CODE", + "CUDNN_STATUS_EXECUTION_FAILED_CURAND", + "CUDNN_STATUS_EXECUTION_FAILED_CUDA_DRIVER", + "CUDNN_STATUS_EXECUTION_FAILED_CUDART", + "CUDNN_STATUS_EXECUTION_FAILED_CUBLAS", + "CUDNN_STATUS_EXECUTION_FAILED", + "CUDNN_STATUS_DEPRECATED", + "CUDNN_STATUS_CATEGORY", + "CUDNN_STATUS_BAD_PARAM_STREAM_MISMATCH", + "CUDNN_STATUS_BAD_PARAM_SIZE_INSUFFICIENT", + "CUDNN_STATUS_BAD_PARAM_SHAPE_MISMATCH", + "CUDNN_STATUS_BAD_PARAM_OUT_OF_BOUND", + "CUDNN_STATUS_BAD_PARAM_NULL_POINTER", + "CUDNN_STATUS_BAD_PARAM_NOT_FINALIZED", + "CUDNN_STATUS_BAD_PARAM_MISALIGNED_POINTER", + "CUDNN_STATUS_BAD_PARAM_DUPLICATED_ENTRIES", + "CUDNN_STATUS_BAD_PARAM_CUDA_GRAPH_MISMATCH", + "CUDNN_STATUS_BAD_PARAM_ATTRIBUTE_TYPE", + "CUDNN_STATUS_ARCH_MISMATCH", + "CUDNN_SIGNAL_WAIT", + "CUDNN_SIGNAL_SET", + "CUDNN_SEV_WARNING_EN", + "CUDNN_SEV_WARNING", + "CUDNN_SEV_INFO_EN", + "CUDNN_SEV_INFO", + "CUDNN_SEV_FATAL", + "CUDNN_SEV_ERROR_EN", + "CUDNN_SEV_ERROR", + "CUDNN_SEQDATA_VECT_DIM", + "CUDNN_SEQDATA_TIME_DIM", + "CUDNN_SEQDATA_DIM_COUNT", + "CUDNN_SEQDATA_BEAM_DIM", + "CUDNN_SEQDATA_BATCH_DIM", + "CUDNN_SCALAR_SIZE_T_WORKSPACE_SIZE_IN_BYTES", + "CUDNN_SCALAR_INT64_T_BN_ACCUMULATION_COUNT", + "CUDNN_SCALAR_DOUBLE_BN_EXP_AVG_FACTOR", + "CUDNN_SCALAR_DOUBLE_BN_EPSILON", + "CUDNN_SAMPLER_BILINEAR", + "CUDNN_RNN_DATA_LAYOUT_SEQ_MAJOR_UNPACKED", + "CUDNN_RNN_DATA_LAYOUT_SEQ_MAJOR_PACKED", + "CUDNN_RNN_DATA_LAYOUT_BATCH_MAJOR_UNPACKED", + "CUDNN_RNN_CLIP_NONE", + "CUDNN_RNN_CLIP_MINMAX", + "CUDNN_RNN_ALGO_PERSIST_STATIC_SMALL_H", + "CUDNN_RNN_ALGO_PERSIST_STATIC", + "CUDNN_RNN_ALGO_PERSIST_DYNAMIC", + "CUDNN_RNN_ALGO_COUNT", + "CUDNN_RMS_NORM", + "CUDNN_RESAMPLE_NEAREST", + "CUDNN_RESAMPLE_MAXPOOL", + "CUDNN_RESAMPLE_BILINEAR", + "CUDNN_RESAMPLE_AVGPOOL_INCLUDE_PADDING", + "CUDNN_RESAMPLE_AVGPOOL_EXCLUDE_PADDING", + "CUDNN_RESAMPLE_AVGPOOL", + "CUDNN_REDUCE_TENSOR_MUL_NO_ZEROS", + "CUDNN_PTR_ZDATA", + "CUDNN_PTR_YSUM", + "CUDNN_PTR_YSQSUM", + "CUDNN_PTR_YDATA", + "CUDNN_PTR_XDATA", + "CUDNN_PTR_WORKSPACE", + "CUDNN_PTR_WDATA", + "CUDNN_PTR_NULL", + "CUDNN_PTR_ELEM_ALIGNED", + "CUDNN_PTR_DZDATA", + "CUDNN_PTR_DYDATA", + "CUDNN_PTR_DXDATA", + "CUDNN_PTR_DWDATA", + "CUDNN_PTR_BN_Z_EQSCALE", + "CUDNN_PTR_BN_Z_EQBIAS", + "CUDNN_PTR_BN_SCALE", + "CUDNN_PTR_BN_SAVED_MEAN", + "CUDNN_PTR_BN_SAVED_INVSTD", + "CUDNN_PTR_BN_RUNNING_VAR", + "CUDNN_PTR_BN_RUNNING_MEAN", + "CUDNN_PTR_BN_EQSCALE", + "CUDNN_PTR_BN_EQBIAS", + "CUDNN_PTR_BN_DSCALE", + "CUDNN_PTR_BN_DBIAS", + "CUDNN_PTR_BN_BIAS", + "CUDNN_PTR_ACTIVATION_BITMASK", + "CUDNN_PTR_16B_ALIGNED", + "CUDNN_POOLING_MAX_DETERMINISTIC", + "CUDNN_POINTWISE_ATAN2", + "CUDNN_PARAM_ZDESC", + "CUDNN_PARAM_ZDATA_PLACEHOLDER", + "CUDNN_PARAM_YSUM_PLACEHOLDER", + "CUDNN_PARAM_YSTATS_DESC", + "CUDNN_PARAM_YSQSUM_PLACEHOLDER", + "CUDNN_PARAM_YDESC", + "CUDNN_PARAM_YDATA_PLACEHOLDER", + "CUDNN_PARAM_XDESC", + "CUDNN_PARAM_XDATA_PLACEHOLDER", + "CUDNN_PARAM_WDESC", + "CUDNN_PARAM_WDATA_PLACEHOLDER", + "CUDNN_PARAM_DZDESC", + "CUDNN_PARAM_DZDATA_PLACEHOLDER", + "CUDNN_PARAM_DYDESC", + "CUDNN_PARAM_DYDATA_PLACEHOLDER", + "CUDNN_PARAM_DXDESC", + "CUDNN_PARAM_DXDATA_PLACEHOLDER", + "CUDNN_PARAM_DWDESC", + "CUDNN_PARAM_DWDATA_PLACEHOLDER", + "CUDNN_PARAM_CONV_DESC", + "CUDNN_PARAM_BN_Z_EQSCALE_PLACEHOLDER", + "CUDNN_PARAM_BN_Z_EQSCALEBIAS_DESC", + "CUDNN_PARAM_BN_Z_EQBIAS_PLACEHOLDER", + "CUDNN_PARAM_BN_SCALE_PLACEHOLDER", + "CUDNN_PARAM_BN_SCALEBIAS_MEANVAR_DESC", + "CUDNN_PARAM_BN_SAVED_MEAN_PLACEHOLDER", + "CUDNN_PARAM_BN_SAVED_INVSTD_PLACEHOLDER", + "CUDNN_PARAM_BN_RUNNING_VAR_PLACEHOLDER", + "CUDNN_PARAM_BN_RUNNING_MEAN_PLACEHOLDER", + "CUDNN_PARAM_BN_MODE", + "CUDNN_PARAM_BN_EQSCALE_PLACEHOLDER", + "CUDNN_PARAM_BN_EQSCALEBIAS_DESC", + "CUDNN_PARAM_BN_EQBIAS_PLACEHOLDER", + "CUDNN_PARAM_BN_DSCALE_PLACEHOLDER", + "CUDNN_PARAM_BN_DBIAS_PLACEHOLDER", + "CUDNN_PARAM_BN_BIAS_PLACEHOLDER", + "CUDNN_PARAM_ACTIVATION_DESC", + "CUDNN_PARAM_ACTIVATION_BITMASK_PLACEHOLDER", + "CUDNN_PARAM_ACTIVATION_BITMASK_DESC", + "CUDNN_OP_TENSOR_SQRT", + "CUDNN_OP_TENSOR_NOT", + "CUDNN_NUMERICAL_NOTE_WINOGRAD_TILE_6x6", + "CUDNN_NUMERICAL_NOTE_WINOGRAD_TILE_4x4", + "CUDNN_NUMERICAL_NOTE_WINOGRAD_TILE_13x13", + "CUDNN_NUMERICAL_NOTE_WINOGRAD", + "CUDNN_NUMERICAL_NOTE_TYPE_COUNT", + "CUDNN_NUMERICAL_NOTE_TENSOR_CORE", + "CUDNN_NUMERICAL_NOTE_STRICT_NAN_PROP", + "CUDNN_NUMERICAL_NOTE_REDUCED_PRECISION_REDUCTION", + "CUDNN_NUMERICAL_NOTE_NONDETERMINISTIC", + "CUDNN_NUMERICAL_NOTE_FFT", + "CUDNN_NUMERICAL_NOTE_DOWN_CONVERT_INPUTS", + "CUDNN_NO_REORDER", + "CUDNN_NORM_PER_CHANNEL", + "CUDNN_NORM_PER_ACTIVATION", + "CUDNN_NORM_OPS_NORM_ADD_ACTIVATION", + "CUDNN_NORM_OPS_NORM_ACTIVATION", + "CUDNN_NORM_OPS_NORM", + "CUDNN_NORM_FWD_TRAINING", + "CUDNN_NORM_FWD_INFERENCE", + "CUDNN_NORM_ALGO_STANDARD", + "CUDNN_NORM_ALGO_PERSIST", + "CUDNN_NON_DETERMINISTIC", + "CUDNN_MH_ATTN_V_WEIGHTS", + "CUDNN_MH_ATTN_V_BIASES", + "CUDNN_MH_ATTN_Q_WEIGHTS", + "CUDNN_MH_ATTN_Q_BIASES", + "CUDNN_MH_ATTN_O_WEIGHTS", + "CUDNN_MH_ATTN_O_BIASES", + "CUDNN_MH_ATTN_K_WEIGHTS", + "CUDNN_MH_ATTN_K_BIASES", + "CUDNN_LRN_MIN_N", + "CUDNN_LRN_MIN_K", + "CUDNN_LRN_MIN_BETA", + "CUDNN_LRN_MAX_N", + "CUDNN_LOSS_NORMALIZATION_SOFTMAX", + "CUDNN_LOSS_NORMALIZATION_NONE", + "CUDNN_LAYOUT_TYPE_PREFERRED_PAD8CK", + "CUDNN_LAYOUT_TYPE_PREFERRED_PAD4CK", + "CUDNN_LAYOUT_TYPE_PREFERRED_NHWC", + "CUDNN_LAYOUT_TYPE_PREFERRED_NCHW", + "CUDNN_LAYOUT_TYPE_COUNT", + "CUDNN_LAYER_NORM", + "CUDNN_KNOB_TYPE_WORKSPACE", + "CUDNN_KNOB_TYPE_WINO_TILE", + "CUDNN_KNOB_TYPE_USE_TEX", + "CUDNN_KNOB_TYPE_TILE_SIZE", + "CUDNN_KNOB_TYPE_TILE_ROWS", + "CUDNN_KNOB_TYPE_TILE_COLS", + "CUDNN_KNOB_TYPE_TILE_CGA_N", + "CUDNN_KNOB_TYPE_TILE_CGA_M", + "CUDNN_KNOB_TYPE_TILE_CGA", + "CUDNN_KNOB_TYPE_TILEK", + "CUDNN_KNOB_TYPE_SWIZZLE", + "CUDNN_KNOB_TYPE_STAGES", + "CUDNN_KNOB_TYPE_SPLIT_RS", + "CUDNN_KNOB_TYPE_SPLIT_K_SLC", + "CUDNN_KNOB_TYPE_SPLIT_K_BUF", + "CUDNN_KNOB_TYPE_SPLIT_K", + "CUDNN_KNOB_TYPE_SPLIT_H", + "CUDNN_KNOB_TYPE_SPLIT_COLS", + "CUDNN_KNOB_TYPE_SPECFILT", + "CUDNN_KNOB_TYPE_SLICED", + "CUDNN_KNOB_TYPE_SINGLEBUFFER", + "CUDNN_KNOB_TYPE_REDUCTION_MODE", + "CUDNN_KNOB_TYPE_OCCUPANCY", + "CUDNN_KNOB_TYPE_NUM_C_PER_BLOCK", + "CUDNN_KNOB_TYPE_MULTIPLY", + "CUDNN_KNOB_TYPE_LOAD_SIZE", + "CUDNN_KNOB_TYPE_LDGC", + "CUDNN_KNOB_TYPE_LDGB", + "CUDNN_KNOB_TYPE_LDGA", + "CUDNN_KNOB_TYPE_KERNEL_CFG", + "CUDNN_KNOB_TYPE_KBLOCK", + "CUDNN_KNOB_TYPE_IDX_MODE", + "CUDNN_KNOB_TYPE_EDGE", + "CUDNN_KNOB_TYPE_CTA_SPLIT_K_MODE", + "CUDNN_KNOB_TYPE_COUNTS", + "CUDNN_KNOB_TYPE_CHUNK_K", + "CUDNN_KNOB_TYPE_BLOCK_SIZE", + "CUDNN_KNOB_TYPE_ARRAY_SIZE_PER_THREAD", + "CUDNN_INSTANCE_NORM", + "CUDNN_GROUP_NORM", + "CUDNN_GENSTATS_SUM_SQSUM", + "CUDNN_FUSED_SCALE_BIAS_ADD_ACTIVATION_GEN_BITMASK", + "CUDNN_FUSED_SCALE_BIAS_ACTIVATION_WGRAD", + "CUDNN_FUSED_SCALE_BIAS_ACTIVATION_CONV_BNSTATS", + "CUDNN_FUSED_DACTIVATION_FORK_DBATCHNORM", + "CUDNN_FUSED_CONV_SCALE_BIAS_ADD_ACTIVATION", + "CUDNN_FUSED_BN_FINALIZE_STATISTICS_TRAINING", + "CUDNN_FUSED_BN_FINALIZE_STATISTICS_INFERENCE", + "CUDNN_FMA_MATH", + "CUDNN_ERRQUERY_RAWCODE", + "CUDNN_ERRQUERY_NONBLOCKING", + "CUDNN_ERRQUERY_BLOCKING", + "CUDNN_DIVNORM_PRECOMPUTED_MEANS", + "CUDNN_DIM_MAX", + "CUDNN_DETERMINISTIC", + "CUDNN_DEFAULT_REORDER", + "CUDNN_DEFAULT_MATH", + "CUDNN_DATA_UINT8x4", + "CUDNN_DATA_UINT8", + "CUDNN_DATA_INT8x32", + "CUDNN_DATA_FAST_FLOAT_FOR_FP8", + "CUDNN_DATA_BOOLEAN", + "CUDNN_CTC_ZERO_OOB_GRADIENTS", + "CUDNN_CTC_SKIP_OOB_GRADIENTS", + "CUDNN_CTC_LOSS_ALGO_NON_DETERMINISTIC", + "CUDNN_CONVOLUTION_FWD_SPECIFY_WORKSPACE_LIMIT", + "CUDNN_CONVOLUTION_FWD_PREFER_FASTEST", + "CUDNN_CONVOLUTION_FWD_NO_WORKSPACE", + "CUDNN_CONVOLUTION_FWD_ALGO_WINOGRAD_NONFUSED", + "CUDNN_CONVOLUTION_FWD_ALGO_IMPLICIT_PRECOMP_GEMM", + "CUDNN_CONVOLUTION_FWD_ALGO_FFT_TILING", + "CUDNN_CONVOLUTION_FWD_ALGO_COUNT", + "CUDNN_CONVOLUTION_BWD_FILTER_SPECIFY_WORKSPACE_LIMIT", + "CUDNN_CONVOLUTION_BWD_FILTER_PREFER_FASTEST", + "CUDNN_CONVOLUTION_BWD_FILTER_NO_WORKSPACE", + "CUDNN_CONVOLUTION_BWD_FILTER_ALGO_WINOGRAD_NONFUSED", + "CUDNN_CONVOLUTION_BWD_FILTER_ALGO_WINOGRAD", + "CUDNN_CONVOLUTION_BWD_FILTER_ALGO_FFT_TILING", + "CUDNN_CONVOLUTION_BWD_FILTER_ALGO_FFT", + "CUDNN_CONVOLUTION_BWD_FILTER_ALGO_COUNT", + "CUDNN_CONVOLUTION_BWD_FILTER_ALGO_3", + "CUDNN_CONVOLUTION_BWD_FILTER_ALGO_1", + "CUDNN_CONVOLUTION_BWD_FILTER_ALGO_0", + "CUDNN_CONVOLUTION_BWD_DATA_SPECIFY_WORKSPACE_LIMIT", + "CUDNN_CONVOLUTION_BWD_DATA_PREFER_FASTEST", + "CUDNN_CONVOLUTION_BWD_DATA_NO_WORKSPACE", + "CUDNN_CONVOLUTION_BWD_DATA_ALGO_WINOGRAD_NONFUSED", + "CUDNN_CONVOLUTION_BWD_DATA_ALGO_FFT_TILING", + "CUDNN_BN_MIN_EPSILON", + "CUDNN_BN_FINALIZE_STATISTICS_TRAINING", + "CUDNN_BN_FINALIZE_STATISTICS_INFERENCE", + "CUDNN_BEHAVIOR_NOTE_TYPE_COUNT", + "CUDNN_BEHAVIOR_NOTE_SUPPORTS_CUDA_GRAPH_NATIVE_API", + "CUDNN_BEHAVIOR_NOTE_RUNTIME_COMPILATION", + "CUDNN_BEHAVIOR_NOTE_REQUIRES_FILTER_INT8x32_REORDER", + "CUDNN_BEHAVIOR_NOTE_REQUIRES_BIAS_INT8x32_REORDER", + "CUDNN_BATCH_NORM", + "CUDNN_BATCHNORM_SPATIAL_PERSISTENT", + "CUDNN_BATCHNORM_OPS_BN_ADD_ACTIVATION", + "CUDNN_BATCHNORM_OPS_BN_ACTIVATION", + "CUDNN_BATCHNORM_OPS_BN", + "CUDNN_BACKEND_OPERATION_RESHAPE_DESCRIPTOR", + "CUDNN_BACKEND_OPERATION_PAGED_CACHE_LOAD_DESCRIPTOR", + "CUDNN_BACKEND_OPERATION_BN_FINALIZE_STATISTICS_DESCRIPTOR", + "CUDNN_BACKEND_OPERATION_BN_BWD_WEIGHTS_DESCRIPTOR", + "CUDNN_BACKEND_KERNEL_CACHE_DESCRIPTOR", + "CUDNN_ATTR_OPERATION_PAGED_CACHE_LOAD_YDESC", + "CUDNN_ATTR_OPERATION_PAGED_CACHE_LOAD_SEQUENCE_DESC", + "CUDNN_ATTR_OPERATION_PAGED_CACHE_LOAD_PAGE_TABLE_DESC", + "CUDNN_ATTR_OPERATION_PAGED_CACHE_LOAD_CONTAINER_DESC", + "CUDNN_ATTR_OPERATIONGRAPH_IS_DYNAMIC_SHAPE_ENABLED", + "CUDNN_ATTR_KERNEL_CACHE_OPERATION_GRAPH", + "CUDNN_ATTR_KERNEL_CACHE_IS_ENGINECFG_KERNEL_CACHED", + "CUDNN_ATTR_EXECUTION_PLAN_KERNEL_CACHE", + "CUDNN_ATTR_ENGINECFG_WORKSPACE_SIZE", + "CUDNN_ATTR_ENGINECFG_SHARED_MEMORY_USED", + "CUDNN_ATTN_WKIND_COUNT", + "CUDNN_ATTN_QUERYMAP_ONE_TO_ONE", + "CUDNN_ATTN_QUERYMAP_ALL_TO_ONE", + "CUDNN_ATTN_ENABLE_PROJ_BIASES", + "CUDNN_ATTN_DISABLE_PROJ_BIASES", + "CUDNN_ACTIVATION_SWISH", "CUDA_R_8F_E5M2", "CUDA_R_8F_E4M3", "CUDA_R_64U", diff --git a/src/CUDA2HIP_Perl.cpp b/src/CUDA2HIP_Perl.cpp index ef402091..2bc73b2f 100644 --- a/src/CUDA2HIP_Perl.cpp +++ b/src/CUDA2HIP_Perl.cpp @@ -597,7 +597,7 @@ namespace perl { for (auto ma = CUDA_RENAMES_MAP().rbegin(); ma != CUDA_RENAMES_MAP().rend(); ++ma) { TranslateToRoc = false; if (Statistics::isUnsupported(ma->second)) { - if (ma->second.apiType == API_BLAS) { + if (ma->second.apiType == API_BLAS || ma->second.apiType == API_SPARSE || ma->second.apiType == API_RAND || ma->second.apiType == API_DNN) { sHipUnsupported << (countHipOnlyUnsupported ? ",\n" : "") << tab_2 << "\"" << ma->first.str() << "\""; countHipOnlyUnsupported++; } else { @@ -607,7 +607,7 @@ namespace perl { } TranslateToRoc = true; if (Statistics::isUnsupported(ma->second)) { - if (ma->second.apiType == API_BLAS) { + if (ma->second.apiType == API_BLAS || ma->second.apiType == API_SPARSE || ma->second.apiType == API_RAND || ma->second.apiType == API_DNN) { sRocUnsupported << (countRocOnlyUnsupported ? ",\n" : "") << tab_2 << "\"" << ma->first.str() << "\""; countRocOnlyUnsupported++; }