diff --git a/bin/hipify-perl b/bin/hipify-perl index ab714494..6191c4e1 100755 --- a/bin/hipify-perl +++ b/bin/hipify-perl @@ -12534,13 +12534,51 @@ sub warnHipOnlyUnsupportedFunctions { "CUBLASLT_MATMUL_TILE_8x192", "CUBLASLT_MATMUL_TILE_8x16", "CUBLASLT_MATMUL_TILE_8x128", + "CUBLASLT_MATMUL_TILE_80x64", + "CUBLASLT_MATMUL_TILE_80x576", + "CUBLASLT_MATMUL_TILE_80x512", + "CUBLASLT_MATMUL_TILE_80x448", + "CUBLASLT_MATMUL_TILE_80x384", + "CUBLASLT_MATMUL_TILE_80x320", + "CUBLASLT_MATMUL_TILE_80x256", + "CUBLASLT_MATMUL_TILE_80x192", + "CUBLASLT_MATMUL_TILE_80x128", + "CUBLASLT_MATMUL_TILE_72x640", + "CUBLASLT_MATMUL_TILE_72x64", + "CUBLASLT_MATMUL_TILE_72x576", + "CUBLASLT_MATMUL_TILE_72x512", + "CUBLASLT_MATMUL_TILE_72x448", + "CUBLASLT_MATMUL_TILE_72x384", + "CUBLASLT_MATMUL_TILE_72x320", + "CUBLASLT_MATMUL_TILE_72x256", + "CUBLASLT_MATMUL_TILE_72x192", + "CUBLASLT_MATMUL_TILE_72x128", "CUBLASLT_MATMUL_TILE_64x96", "CUBLASLT_MATMUL_TILE_64x8", + "CUBLASLT_MATMUL_TILE_64x768", + "CUBLASLT_MATMUL_TILE_64x704", + "CUBLASLT_MATMUL_TILE_64x640", "CUBLASLT_MATMUL_TILE_64x64", + "CUBLASLT_MATMUL_TILE_64x576", "CUBLASLT_MATMUL_TILE_64x512", + "CUBLASLT_MATMUL_TILE_64x448", + "CUBLASLT_MATMUL_TILE_64x384", + "CUBLASLT_MATMUL_TILE_64x320", "CUBLASLT_MATMUL_TILE_64x32", "CUBLASLT_MATMUL_TILE_64x256", + "CUBLASLT_MATMUL_TILE_64x192", "CUBLASLT_MATMUL_TILE_64x128", + "CUBLASLT_MATMUL_TILE_56x768", + "CUBLASLT_MATMUL_TILE_56x704", + "CUBLASLT_MATMUL_TILE_56x640", + "CUBLASLT_MATMUL_TILE_56x576", + "CUBLASLT_MATMUL_TILE_56x512", + "CUBLASLT_MATMUL_TILE_56x448", + "CUBLASLT_MATMUL_TILE_56x384", + "CUBLASLT_MATMUL_TILE_56x320", + "CUBLASLT_MATMUL_TILE_56x256", + "CUBLASLT_MATMUL_TILE_56x192", + "CUBLASLT_MATMUL_TILE_56x128", "CUBLASLT_MATMUL_TILE_512x64", "CUBLASLT_MATMUL_TILE_48x768", "CUBLASLT_MATMUL_TILE_48x704", @@ -14052,13 +14090,51 @@ sub warnRocOnlyUnsupportedFunctions { "CUBLASLT_MATMUL_TILE_8x192", "CUBLASLT_MATMUL_TILE_8x16", "CUBLASLT_MATMUL_TILE_8x128", + "CUBLASLT_MATMUL_TILE_80x64", + "CUBLASLT_MATMUL_TILE_80x576", + "CUBLASLT_MATMUL_TILE_80x512", + "CUBLASLT_MATMUL_TILE_80x448", + "CUBLASLT_MATMUL_TILE_80x384", + "CUBLASLT_MATMUL_TILE_80x320", + "CUBLASLT_MATMUL_TILE_80x256", + "CUBLASLT_MATMUL_TILE_80x192", + "CUBLASLT_MATMUL_TILE_80x128", + "CUBLASLT_MATMUL_TILE_72x640", + "CUBLASLT_MATMUL_TILE_72x64", + "CUBLASLT_MATMUL_TILE_72x576", + "CUBLASLT_MATMUL_TILE_72x512", + "CUBLASLT_MATMUL_TILE_72x448", + "CUBLASLT_MATMUL_TILE_72x384", + "CUBLASLT_MATMUL_TILE_72x320", + "CUBLASLT_MATMUL_TILE_72x256", + "CUBLASLT_MATMUL_TILE_72x192", + "CUBLASLT_MATMUL_TILE_72x128", "CUBLASLT_MATMUL_TILE_64x96", "CUBLASLT_MATMUL_TILE_64x8", + "CUBLASLT_MATMUL_TILE_64x768", + "CUBLASLT_MATMUL_TILE_64x704", + "CUBLASLT_MATMUL_TILE_64x640", "CUBLASLT_MATMUL_TILE_64x64", + "CUBLASLT_MATMUL_TILE_64x576", "CUBLASLT_MATMUL_TILE_64x512", + "CUBLASLT_MATMUL_TILE_64x448", + "CUBLASLT_MATMUL_TILE_64x384", + "CUBLASLT_MATMUL_TILE_64x320", "CUBLASLT_MATMUL_TILE_64x32", "CUBLASLT_MATMUL_TILE_64x256", + "CUBLASLT_MATMUL_TILE_64x192", "CUBLASLT_MATMUL_TILE_64x128", + "CUBLASLT_MATMUL_TILE_56x768", + "CUBLASLT_MATMUL_TILE_56x704", + "CUBLASLT_MATMUL_TILE_56x640", + "CUBLASLT_MATMUL_TILE_56x576", + "CUBLASLT_MATMUL_TILE_56x512", + "CUBLASLT_MATMUL_TILE_56x448", + "CUBLASLT_MATMUL_TILE_56x384", + "CUBLASLT_MATMUL_TILE_56x320", + "CUBLASLT_MATMUL_TILE_56x256", + "CUBLASLT_MATMUL_TILE_56x192", + "CUBLASLT_MATMUL_TILE_56x128", "CUBLASLT_MATMUL_TILE_512x64", "CUBLASLT_MATMUL_TILE_48x768", "CUBLASLT_MATMUL_TILE_48x704", diff --git a/docs/tables/CUBLAS_API_supported_by_HIP.md b/docs/tables/CUBLAS_API_supported_by_HIP.md index ee8ad63c..1e33e012 100644 --- a/docs/tables/CUBLAS_API_supported_by_HIP.md +++ b/docs/tables/CUBLAS_API_supported_by_HIP.md @@ -401,13 +401,51 @@ |`CUBLASLT_MATMUL_TILE_48x704`|12.6| | | | | | | | | | |`CUBLASLT_MATMUL_TILE_48x768`|12.6| | | | | | | | | | |`CUBLASLT_MATMUL_TILE_512x64`|10.1| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_56x128`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_56x192`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_56x256`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_56x320`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_56x384`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_56x448`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_56x512`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_56x576`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_56x640`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_56x704`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_56x768`|12.6| | | | | | | | | | |`CUBLASLT_MATMUL_TILE_64x128`|10.1| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_64x192`|12.6| | | | | | | | | | |`CUBLASLT_MATMUL_TILE_64x256`|10.1| | | | | | | | | | |`CUBLASLT_MATMUL_TILE_64x32`|10.1| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_64x320`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_64x384`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_64x448`|12.6| | | | | | | | | | |`CUBLASLT_MATMUL_TILE_64x512`|10.1| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_64x576`|12.6| | | | | | | | | | |`CUBLASLT_MATMUL_TILE_64x64`|10.1| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_64x640`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_64x704`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_64x768`|12.6| | | | | | | | | | |`CUBLASLT_MATMUL_TILE_64x8`|10.1| | | | | | | | | | |`CUBLASLT_MATMUL_TILE_64x96`|11.3| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_72x128`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_72x192`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_72x256`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_72x320`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_72x384`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_72x448`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_72x512`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_72x576`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_72x64`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_72x640`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_80x128`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_80x192`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_80x256`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_80x320`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_80x384`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_80x448`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_80x512`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_80x576`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_80x64`|12.6| | | | | | | | | | |`CUBLASLT_MATMUL_TILE_8x128`|12.6| | | | | | | | | | |`CUBLASLT_MATMUL_TILE_8x16`|10.1| | | | | | | | | | |`CUBLASLT_MATMUL_TILE_8x192`|12.6| | | | | | | | | | diff --git a/docs/tables/CUBLAS_API_supported_by_HIP_and_ROC.md b/docs/tables/CUBLAS_API_supported_by_HIP_and_ROC.md index a95fbf83..853e7afa 100644 --- a/docs/tables/CUBLAS_API_supported_by_HIP_and_ROC.md +++ b/docs/tables/CUBLAS_API_supported_by_HIP_and_ROC.md @@ -401,13 +401,51 @@ |`CUBLASLT_MATMUL_TILE_48x704`|12.6| | | | | | | | | | | | | | | | |`CUBLASLT_MATMUL_TILE_48x768`|12.6| | | | | | | | | | | | | | | | |`CUBLASLT_MATMUL_TILE_512x64`|10.1| | | | | | | | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_56x128`|12.6| | | | | | | | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_56x192`|12.6| | | | | | | | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_56x256`|12.6| | | | | | | | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_56x320`|12.6| | | | | | | | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_56x384`|12.6| | | | | | | | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_56x448`|12.6| | | | | | | | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_56x512`|12.6| | | | | | | | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_56x576`|12.6| | | | | | | | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_56x640`|12.6| | | | | | | | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_56x704`|12.6| | | | | | | | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_56x768`|12.6| | | | | | | | | | | | | | | | |`CUBLASLT_MATMUL_TILE_64x128`|10.1| | | | | | | | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_64x192`|12.6| | | | | | | | | | | | | | | | |`CUBLASLT_MATMUL_TILE_64x256`|10.1| | | | | | | | | | | | | | | | |`CUBLASLT_MATMUL_TILE_64x32`|10.1| | | | | | | | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_64x320`|12.6| | | | | | | | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_64x384`|12.6| | | | | | | | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_64x448`|12.6| | | | | | | | | | | | | | | | |`CUBLASLT_MATMUL_TILE_64x512`|10.1| | | | | | | | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_64x576`|12.6| | | | | | | | | | | | | | | | |`CUBLASLT_MATMUL_TILE_64x64`|10.1| | | | | | | | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_64x640`|12.6| | | | | | | | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_64x704`|12.6| | | | | | | | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_64x768`|12.6| | | | | | | | | | | | | | | | |`CUBLASLT_MATMUL_TILE_64x8`|10.1| | | | | | | | | | | | | | | | |`CUBLASLT_MATMUL_TILE_64x96`|11.3| | | | | | | | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_72x128`|12.6| | | | | | | | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_72x192`|12.6| | | | | | | | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_72x256`|12.6| | | | | | | | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_72x320`|12.6| | | | | | | | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_72x384`|12.6| | | | | | | | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_72x448`|12.6| | | | | | | | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_72x512`|12.6| | | | | | | | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_72x576`|12.6| | | | | | | | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_72x64`|12.6| | | | | | | | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_72x640`|12.6| | | | | | | | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_80x128`|12.6| | | | | | | | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_80x192`|12.6| | | | | | | | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_80x256`|12.6| | | | | | | | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_80x320`|12.6| | | | | | | | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_80x384`|12.6| | | | | | | | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_80x448`|12.6| | | | | | | | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_80x512`|12.6| | | | | | | | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_80x576`|12.6| | | | | | | | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_80x64`|12.6| | | | | | | | | | | | | | | | |`CUBLASLT_MATMUL_TILE_8x128`|12.6| | | | | | | | | | | | | | | | |`CUBLASLT_MATMUL_TILE_8x16`|10.1| | | | | | | | | | | | | | | | |`CUBLASLT_MATMUL_TILE_8x192`|12.6| | | | | | | | | | | | | | | | diff --git a/docs/tables/CUBLAS_API_supported_by_ROC.md b/docs/tables/CUBLAS_API_supported_by_ROC.md index a85c584a..d3e5d316 100644 --- a/docs/tables/CUBLAS_API_supported_by_ROC.md +++ b/docs/tables/CUBLAS_API_supported_by_ROC.md @@ -401,13 +401,51 @@ |`CUBLASLT_MATMUL_TILE_48x704`|12.6| | | | | | | | | | |`CUBLASLT_MATMUL_TILE_48x768`|12.6| | | | | | | | | | |`CUBLASLT_MATMUL_TILE_512x64`|10.1| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_56x128`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_56x192`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_56x256`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_56x320`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_56x384`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_56x448`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_56x512`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_56x576`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_56x640`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_56x704`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_56x768`|12.6| | | | | | | | | | |`CUBLASLT_MATMUL_TILE_64x128`|10.1| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_64x192`|12.6| | | | | | | | | | |`CUBLASLT_MATMUL_TILE_64x256`|10.1| | | | | | | | | | |`CUBLASLT_MATMUL_TILE_64x32`|10.1| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_64x320`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_64x384`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_64x448`|12.6| | | | | | | | | | |`CUBLASLT_MATMUL_TILE_64x512`|10.1| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_64x576`|12.6| | | | | | | | | | |`CUBLASLT_MATMUL_TILE_64x64`|10.1| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_64x640`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_64x704`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_64x768`|12.6| | | | | | | | | | |`CUBLASLT_MATMUL_TILE_64x8`|10.1| | | | | | | | | | |`CUBLASLT_MATMUL_TILE_64x96`|11.3| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_72x128`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_72x192`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_72x256`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_72x320`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_72x384`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_72x448`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_72x512`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_72x576`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_72x64`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_72x640`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_80x128`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_80x192`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_80x256`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_80x320`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_80x384`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_80x448`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_80x512`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_80x576`|12.6| | | | | | | | | | +|`CUBLASLT_MATMUL_TILE_80x64`|12.6| | | | | | | | | | |`CUBLASLT_MATMUL_TILE_8x128`|12.6| | | | | | | | | | |`CUBLASLT_MATMUL_TILE_8x16`|10.1| | | | | | | | | | |`CUBLASLT_MATMUL_TILE_8x192`|12.6| | | | | | | | | | diff --git a/src/CUDA2HIP_BLAS_API_types.cpp b/src/CUDA2HIP_BLAS_API_types.cpp index 23c90533..330a3223 100644 --- a/src/CUDA2HIP_BLAS_API_types.cpp +++ b/src/CUDA2HIP_BLAS_API_types.cpp @@ -308,6 +308,44 @@ const std::map CUDA_BLAS_TYPE_NAME_MAP { {"CUBLASLT_MATMUL_TILE_48x640", {"HIPBLASLT_MATMUL_TILE_48x640", "", CONV_NUMERIC_LITERAL, API_BLAS, SEC::BLAS_LT_DATA_TYPES, UNSUPPORTED}}, {"CUBLASLT_MATMUL_TILE_48x704", {"HIPBLASLT_MATMUL_TILE_48x704", "", CONV_NUMERIC_LITERAL, API_BLAS, SEC::BLAS_LT_DATA_TYPES, UNSUPPORTED}}, {"CUBLASLT_MATMUL_TILE_48x768", {"HIPBLASLT_MATMUL_TILE_48x768", "", CONV_NUMERIC_LITERAL, API_BLAS, SEC::BLAS_LT_DATA_TYPES, UNSUPPORTED}}, + {"CUBLASLT_MATMUL_TILE_56x128", {"HIPBLASLT_MATMUL_TILE_56x128", "", CONV_NUMERIC_LITERAL, API_BLAS, SEC::BLAS_LT_DATA_TYPES, UNSUPPORTED}}, + {"CUBLASLT_MATMUL_TILE_56x192", {"HIPBLASLT_MATMUL_TILE_56x192", "", CONV_NUMERIC_LITERAL, API_BLAS, SEC::BLAS_LT_DATA_TYPES, UNSUPPORTED}}, + {"CUBLASLT_MATMUL_TILE_56x256", {"HIPBLASLT_MATMUL_TILE_56x256", "", CONV_NUMERIC_LITERAL, API_BLAS, SEC::BLAS_LT_DATA_TYPES, UNSUPPORTED}}, + {"CUBLASLT_MATMUL_TILE_56x320", {"HIPBLASLT_MATMUL_TILE_56x320", "", CONV_NUMERIC_LITERAL, API_BLAS, SEC::BLAS_LT_DATA_TYPES, UNSUPPORTED}}, + {"CUBLASLT_MATMUL_TILE_56x384", {"HIPBLASLT_MATMUL_TILE_56x384", "", CONV_NUMERIC_LITERAL, API_BLAS, SEC::BLAS_LT_DATA_TYPES, UNSUPPORTED}}, + {"CUBLASLT_MATMUL_TILE_56x448", {"HIPBLASLT_MATMUL_TILE_56x448", "", CONV_NUMERIC_LITERAL, API_BLAS, SEC::BLAS_LT_DATA_TYPES, UNSUPPORTED}}, + {"CUBLASLT_MATMUL_TILE_56x512", {"HIPBLASLT_MATMUL_TILE_56x512", "", CONV_NUMERIC_LITERAL, API_BLAS, SEC::BLAS_LT_DATA_TYPES, UNSUPPORTED}}, + {"CUBLASLT_MATMUL_TILE_56x576", {"HIPBLASLT_MATMUL_TILE_56x576", "", CONV_NUMERIC_LITERAL, API_BLAS, SEC::BLAS_LT_DATA_TYPES, UNSUPPORTED}}, + {"CUBLASLT_MATMUL_TILE_56x640", {"HIPBLASLT_MATMUL_TILE_56x640", "", CONV_NUMERIC_LITERAL, API_BLAS, SEC::BLAS_LT_DATA_TYPES, UNSUPPORTED}}, + {"CUBLASLT_MATMUL_TILE_56x704", {"HIPBLASLT_MATMUL_TILE_56x704", "", CONV_NUMERIC_LITERAL, API_BLAS, SEC::BLAS_LT_DATA_TYPES, UNSUPPORTED}}, + {"CUBLASLT_MATMUL_TILE_56x768", {"HIPBLASLT_MATMUL_TILE_56x768", "", CONV_NUMERIC_LITERAL, API_BLAS, SEC::BLAS_LT_DATA_TYPES, UNSUPPORTED}}, + {"CUBLASLT_MATMUL_TILE_64x192", {"HIPBLASLT_MATMUL_TILE_64x192", "", CONV_NUMERIC_LITERAL, API_BLAS, SEC::BLAS_LT_DATA_TYPES, UNSUPPORTED}}, + {"CUBLASLT_MATMUL_TILE_64x320", {"HIPBLASLT_MATMUL_TILE_64x320", "", CONV_NUMERIC_LITERAL, API_BLAS, SEC::BLAS_LT_DATA_TYPES, UNSUPPORTED}}, + {"CUBLASLT_MATMUL_TILE_64x384", {"HIPBLASLT_MATMUL_TILE_64x384", "", CONV_NUMERIC_LITERAL, API_BLAS, SEC::BLAS_LT_DATA_TYPES, UNSUPPORTED}}, + {"CUBLASLT_MATMUL_TILE_64x448", {"HIPBLASLT_MATMUL_TILE_64x448", "", CONV_NUMERIC_LITERAL, API_BLAS, SEC::BLAS_LT_DATA_TYPES, UNSUPPORTED}}, + {"CUBLASLT_MATMUL_TILE_64x576", {"HIPBLASLT_MATMUL_TILE_64x576", "", CONV_NUMERIC_LITERAL, API_BLAS, SEC::BLAS_LT_DATA_TYPES, UNSUPPORTED}}, + {"CUBLASLT_MATMUL_TILE_64x640", {"HIPBLASLT_MATMUL_TILE_64x640", "", CONV_NUMERIC_LITERAL, API_BLAS, SEC::BLAS_LT_DATA_TYPES, UNSUPPORTED}}, + {"CUBLASLT_MATMUL_TILE_64x704", {"HIPBLASLT_MATMUL_TILE_64x704", "", CONV_NUMERIC_LITERAL, API_BLAS, SEC::BLAS_LT_DATA_TYPES, UNSUPPORTED}}, + {"CUBLASLT_MATMUL_TILE_64x768", {"HIPBLASLT_MATMUL_TILE_64x768", "", CONV_NUMERIC_LITERAL, API_BLAS, SEC::BLAS_LT_DATA_TYPES, UNSUPPORTED}}, + {"CUBLASLT_MATMUL_TILE_72x64", {"HIPBLASLT_MATMUL_TILE_72x64", "", CONV_NUMERIC_LITERAL, API_BLAS, SEC::BLAS_LT_DATA_TYPES, UNSUPPORTED}}, + {"CUBLASLT_MATMUL_TILE_72x128", {"HIPBLASLT_MATMUL_TILE_72x128", "", CONV_NUMERIC_LITERAL, API_BLAS, SEC::BLAS_LT_DATA_TYPES, UNSUPPORTED}}, + {"CUBLASLT_MATMUL_TILE_72x192", {"HIPBLASLT_MATMUL_TILE_72x192", "", CONV_NUMERIC_LITERAL, API_BLAS, SEC::BLAS_LT_DATA_TYPES, UNSUPPORTED}}, + {"CUBLASLT_MATMUL_TILE_72x256", {"HIPBLASLT_MATMUL_TILE_72x256", "", CONV_NUMERIC_LITERAL, API_BLAS, SEC::BLAS_LT_DATA_TYPES, UNSUPPORTED}}, + {"CUBLASLT_MATMUL_TILE_72x320", {"HIPBLASLT_MATMUL_TILE_72x320", "", CONV_NUMERIC_LITERAL, API_BLAS, SEC::BLAS_LT_DATA_TYPES, UNSUPPORTED}}, + {"CUBLASLT_MATMUL_TILE_72x384", {"HIPBLASLT_MATMUL_TILE_72x384", "", CONV_NUMERIC_LITERAL, API_BLAS, SEC::BLAS_LT_DATA_TYPES, UNSUPPORTED}}, + {"CUBLASLT_MATMUL_TILE_72x448", {"HIPBLASLT_MATMUL_TILE_72x448", "", CONV_NUMERIC_LITERAL, API_BLAS, SEC::BLAS_LT_DATA_TYPES, UNSUPPORTED}}, + {"CUBLASLT_MATMUL_TILE_72x512", {"HIPBLASLT_MATMUL_TILE_72x512", "", CONV_NUMERIC_LITERAL, API_BLAS, SEC::BLAS_LT_DATA_TYPES, UNSUPPORTED}}, + {"CUBLASLT_MATMUL_TILE_72x576", {"HIPBLASLT_MATMUL_TILE_72x576", "", CONV_NUMERIC_LITERAL, API_BLAS, SEC::BLAS_LT_DATA_TYPES, UNSUPPORTED}}, + {"CUBLASLT_MATMUL_TILE_72x640", {"HIPBLASLT_MATMUL_TILE_72x640", "", CONV_NUMERIC_LITERAL, API_BLAS, SEC::BLAS_LT_DATA_TYPES, UNSUPPORTED}}, + {"CUBLASLT_MATMUL_TILE_80x64", {"HIPBLASLT_MATMUL_TILE_80x64", "", CONV_NUMERIC_LITERAL, API_BLAS, SEC::BLAS_LT_DATA_TYPES, UNSUPPORTED}}, + {"CUBLASLT_MATMUL_TILE_80x128", {"HIPBLASLT_MATMUL_TILE_80x128", "", CONV_NUMERIC_LITERAL, API_BLAS, SEC::BLAS_LT_DATA_TYPES, UNSUPPORTED}}, + {"CUBLASLT_MATMUL_TILE_80x192", {"HIPBLASLT_MATMUL_TILE_80x192", "", CONV_NUMERIC_LITERAL, API_BLAS, SEC::BLAS_LT_DATA_TYPES, UNSUPPORTED}}, + {"CUBLASLT_MATMUL_TILE_80x256", {"HIPBLASLT_MATMUL_TILE_80x256", "", CONV_NUMERIC_LITERAL, API_BLAS, SEC::BLAS_LT_DATA_TYPES, UNSUPPORTED}}, + {"CUBLASLT_MATMUL_TILE_80x320", {"HIPBLASLT_MATMUL_TILE_80x320", "", CONV_NUMERIC_LITERAL, API_BLAS, SEC::BLAS_LT_DATA_TYPES, UNSUPPORTED}}, + {"CUBLASLT_MATMUL_TILE_80x384", {"HIPBLASLT_MATMUL_TILE_80x384", "", CONV_NUMERIC_LITERAL, API_BLAS, SEC::BLAS_LT_DATA_TYPES, UNSUPPORTED}}, + {"CUBLASLT_MATMUL_TILE_80x448", {"HIPBLASLT_MATMUL_TILE_80x448", "", CONV_NUMERIC_LITERAL, API_BLAS, SEC::BLAS_LT_DATA_TYPES, UNSUPPORTED}}, + {"CUBLASLT_MATMUL_TILE_80x512", {"HIPBLASLT_MATMUL_TILE_80x512", "", CONV_NUMERIC_LITERAL, API_BLAS, SEC::BLAS_LT_DATA_TYPES, UNSUPPORTED}}, + {"CUBLASLT_MATMUL_TILE_80x576", {"HIPBLASLT_MATMUL_TILE_80x576", "", CONV_NUMERIC_LITERAL, API_BLAS, SEC::BLAS_LT_DATA_TYPES, UNSUPPORTED}}, {"CUBLASLT_MATMUL_TILE_END", {"HIPBLASLT_MATMUL_TILE_END", "", CONV_NUMERIC_LITERAL, API_BLAS, SEC::BLAS_LT_DATA_TYPES, UNSUPPORTED}}, {"cublasLtMatmulStages_t", {"hipblasLtMatmulStages_t", "", CONV_TYPE, API_BLAS, SEC::BLAS_LT_DATA_TYPES, UNSUPPORTED}}, {"CUBLASLT_MATMUL_STAGES_UNDEFINED", {"HIPBLASLT_MATMUL_STAGES_UNDEFINED", "", CONV_NUMERIC_LITERAL, API_BLAS, SEC::BLAS_LT_DATA_TYPES, UNSUPPORTED}}, @@ -1033,6 +1071,44 @@ const std::map CUDA_BLAS_TYPE_NAME_VER_MAP { {"CUBLASLT_MATMUL_TILE_48x640", {CUDA_126, CUDA_0, CUDA_0 }}, // A: CUDA_VERSION 12062, CUBLAS_VERSION 120603, CUBLAS_VER_MAJOR 12 CUBLAS_VER_MINOR 6 CUBLAS_VER_PATCH 3 {"CUBLASLT_MATMUL_TILE_48x704", {CUDA_126, CUDA_0, CUDA_0 }}, // A: CUDA_VERSION 12062, CUBLAS_VERSION 120603, CUBLAS_VER_MAJOR 12 CUBLAS_VER_MINOR 6 CUBLAS_VER_PATCH 3 {"CUBLASLT_MATMUL_TILE_48x768", {CUDA_126, CUDA_0, CUDA_0 }}, // A: CUDA_VERSION 12062, CUBLAS_VERSION 120603, CUBLAS_VER_MAJOR 12 CUBLAS_VER_MINOR 6 CUBLAS_VER_PATCH 3 + {"CUBLASLT_MATMUL_TILE_56x128", {CUDA_126, CUDA_0, CUDA_0 }}, // A: CUDA_VERSION 12062, CUBLAS_VERSION 120603, CUBLAS_VER_MAJOR 12 CUBLAS_VER_MINOR 6 CUBLAS_VER_PATCH 3 + {"CUBLASLT_MATMUL_TILE_56x192", {CUDA_126, CUDA_0, CUDA_0 }}, // A: CUDA_VERSION 12062, CUBLAS_VERSION 120603, CUBLAS_VER_MAJOR 12 CUBLAS_VER_MINOR 6 CUBLAS_VER_PATCH 3 + {"CUBLASLT_MATMUL_TILE_56x256", {CUDA_126, CUDA_0, CUDA_0 }}, // A: CUDA_VERSION 12062, CUBLAS_VERSION 120603, CUBLAS_VER_MAJOR 12 CUBLAS_VER_MINOR 6 CUBLAS_VER_PATCH 3 + {"CUBLASLT_MATMUL_TILE_56x320", {CUDA_126, CUDA_0, CUDA_0 }}, // A: CUDA_VERSION 12062, CUBLAS_VERSION 120603, CUBLAS_VER_MAJOR 12 CUBLAS_VER_MINOR 6 CUBLAS_VER_PATCH 3 + {"CUBLASLT_MATMUL_TILE_56x384", {CUDA_126, CUDA_0, CUDA_0 }}, // A: CUDA_VERSION 12062, CUBLAS_VERSION 120603, CUBLAS_VER_MAJOR 12 CUBLAS_VER_MINOR 6 CUBLAS_VER_PATCH 3 + {"CUBLASLT_MATMUL_TILE_56x448", {CUDA_126, CUDA_0, CUDA_0 }}, // A: CUDA_VERSION 12062, CUBLAS_VERSION 120603, CUBLAS_VER_MAJOR 12 CUBLAS_VER_MINOR 6 CUBLAS_VER_PATCH 3 + {"CUBLASLT_MATMUL_TILE_56x512", {CUDA_126, CUDA_0, CUDA_0 }}, // A: CUDA_VERSION 12062, CUBLAS_VERSION 120603, CUBLAS_VER_MAJOR 12 CUBLAS_VER_MINOR 6 CUBLAS_VER_PATCH 3 + {"CUBLASLT_MATMUL_TILE_56x576", {CUDA_126, CUDA_0, CUDA_0 }}, // A: CUDA_VERSION 12062, CUBLAS_VERSION 120603, CUBLAS_VER_MAJOR 12 CUBLAS_VER_MINOR 6 CUBLAS_VER_PATCH 3 + {"CUBLASLT_MATMUL_TILE_56x640", {CUDA_126, CUDA_0, CUDA_0 }}, // A: CUDA_VERSION 12062, CUBLAS_VERSION 120603, CUBLAS_VER_MAJOR 12 CUBLAS_VER_MINOR 6 CUBLAS_VER_PATCH 3 + {"CUBLASLT_MATMUL_TILE_56x704", {CUDA_126, CUDA_0, CUDA_0 }}, // A: CUDA_VERSION 12062, CUBLAS_VERSION 120603, CUBLAS_VER_MAJOR 12 CUBLAS_VER_MINOR 6 CUBLAS_VER_PATCH 3 + {"CUBLASLT_MATMUL_TILE_56x768", {CUDA_126, CUDA_0, CUDA_0 }}, // A: CUDA_VERSION 12062, CUBLAS_VERSION 120603, CUBLAS_VER_MAJOR 12 CUBLAS_VER_MINOR 6 CUBLAS_VER_PATCH 3 + {"CUBLASLT_MATMUL_TILE_64x192", {CUDA_126, CUDA_0, CUDA_0 }}, // A: CUDA_VERSION 12062, CUBLAS_VERSION 120603, CUBLAS_VER_MAJOR 12 CUBLAS_VER_MINOR 6 CUBLAS_VER_PATCH 3 + {"CUBLASLT_MATMUL_TILE_64x320", {CUDA_126, CUDA_0, CUDA_0 }}, // A: CUDA_VERSION 12062, CUBLAS_VERSION 120603, CUBLAS_VER_MAJOR 12 CUBLAS_VER_MINOR 6 CUBLAS_VER_PATCH 3 + {"CUBLASLT_MATMUL_TILE_64x384", {CUDA_126, CUDA_0, CUDA_0 }}, // A: CUDA_VERSION 12062, CUBLAS_VERSION 120603, CUBLAS_VER_MAJOR 12 CUBLAS_VER_MINOR 6 CUBLAS_VER_PATCH 3 + {"CUBLASLT_MATMUL_TILE_64x448", {CUDA_126, CUDA_0, CUDA_0 }}, // A: CUDA_VERSION 12062, CUBLAS_VERSION 120603, CUBLAS_VER_MAJOR 12 CUBLAS_VER_MINOR 6 CUBLAS_VER_PATCH 3 + {"CUBLASLT_MATMUL_TILE_64x576", {CUDA_126, CUDA_0, CUDA_0 }}, // A: CUDA_VERSION 12062, CUBLAS_VERSION 120603, CUBLAS_VER_MAJOR 12 CUBLAS_VER_MINOR 6 CUBLAS_VER_PATCH 3 + {"CUBLASLT_MATMUL_TILE_64x640", {CUDA_126, CUDA_0, CUDA_0 }}, // A: CUDA_VERSION 12062, CUBLAS_VERSION 120603, CUBLAS_VER_MAJOR 12 CUBLAS_VER_MINOR 6 CUBLAS_VER_PATCH 3 + {"CUBLASLT_MATMUL_TILE_64x704", {CUDA_126, CUDA_0, CUDA_0 }}, // A: CUDA_VERSION 12062, CUBLAS_VERSION 120603, CUBLAS_VER_MAJOR 12 CUBLAS_VER_MINOR 6 CUBLAS_VER_PATCH 3 + {"CUBLASLT_MATMUL_TILE_64x768", {CUDA_126, CUDA_0, CUDA_0 }}, // A: CUDA_VERSION 12062, CUBLAS_VERSION 120603, CUBLAS_VER_MAJOR 12 CUBLAS_VER_MINOR 6 CUBLAS_VER_PATCH 3 + {"CUBLASLT_MATMUL_TILE_72x64", {CUDA_126, CUDA_0, CUDA_0 }}, // A: CUDA_VERSION 12062, CUBLAS_VERSION 120603, CUBLAS_VER_MAJOR 12 CUBLAS_VER_MINOR 6 CUBLAS_VER_PATCH 3 + {"CUBLASLT_MATMUL_TILE_72x128", {CUDA_126, CUDA_0, CUDA_0 }}, // A: CUDA_VERSION 12062, CUBLAS_VERSION 120603, CUBLAS_VER_MAJOR 12 CUBLAS_VER_MINOR 6 CUBLAS_VER_PATCH 3 + {"CUBLASLT_MATMUL_TILE_72x192", {CUDA_126, CUDA_0, CUDA_0 }}, // A: CUDA_VERSION 12062, CUBLAS_VERSION 120603, CUBLAS_VER_MAJOR 12 CUBLAS_VER_MINOR 6 CUBLAS_VER_PATCH 3 + {"CUBLASLT_MATMUL_TILE_72x256", {CUDA_126, CUDA_0, CUDA_0 }}, // A: CUDA_VERSION 12062, CUBLAS_VERSION 120603, CUBLAS_VER_MAJOR 12 CUBLAS_VER_MINOR 6 CUBLAS_VER_PATCH 3 + {"CUBLASLT_MATMUL_TILE_72x320", {CUDA_126, CUDA_0, CUDA_0 }}, // A: CUDA_VERSION 12062, CUBLAS_VERSION 120603, CUBLAS_VER_MAJOR 12 CUBLAS_VER_MINOR 6 CUBLAS_VER_PATCH 3 + {"CUBLASLT_MATMUL_TILE_72x384", {CUDA_126, CUDA_0, CUDA_0 }}, // A: CUDA_VERSION 12062, CUBLAS_VERSION 120603, CUBLAS_VER_MAJOR 12 CUBLAS_VER_MINOR 6 CUBLAS_VER_PATCH 3 + {"CUBLASLT_MATMUL_TILE_72x448", {CUDA_126, CUDA_0, CUDA_0 }}, // A: CUDA_VERSION 12062, CUBLAS_VERSION 120603, CUBLAS_VER_MAJOR 12 CUBLAS_VER_MINOR 6 CUBLAS_VER_PATCH 3 + {"CUBLASLT_MATMUL_TILE_72x512", {CUDA_126, CUDA_0, CUDA_0 }}, // A: CUDA_VERSION 12062, CUBLAS_VERSION 120603, CUBLAS_VER_MAJOR 12 CUBLAS_VER_MINOR 6 CUBLAS_VER_PATCH 3 + {"CUBLASLT_MATMUL_TILE_72x576", {CUDA_126, CUDA_0, CUDA_0 }}, // A: CUDA_VERSION 12062, CUBLAS_VERSION 120603, CUBLAS_VER_MAJOR 12 CUBLAS_VER_MINOR 6 CUBLAS_VER_PATCH 3 + {"CUBLASLT_MATMUL_TILE_72x640", {CUDA_126, CUDA_0, CUDA_0 }}, // A: CUDA_VERSION 12062, CUBLAS_VERSION 120603, CUBLAS_VER_MAJOR 12 CUBLAS_VER_MINOR 6 CUBLAS_VER_PATCH 3 + {"CUBLASLT_MATMUL_TILE_80x64", {CUDA_126, CUDA_0, CUDA_0 }}, // A: CUDA_VERSION 12062, CUBLAS_VERSION 120603, CUBLAS_VER_MAJOR 12 CUBLAS_VER_MINOR 6 CUBLAS_VER_PATCH 3 + {"CUBLASLT_MATMUL_TILE_80x128", {CUDA_126, CUDA_0, CUDA_0 }}, // A: CUDA_VERSION 12062, CUBLAS_VERSION 120603, CUBLAS_VER_MAJOR 12 CUBLAS_VER_MINOR 6 CUBLAS_VER_PATCH 3 + {"CUBLASLT_MATMUL_TILE_80x192", {CUDA_126, CUDA_0, CUDA_0 }}, // A: CUDA_VERSION 12062, CUBLAS_VERSION 120603, CUBLAS_VER_MAJOR 12 CUBLAS_VER_MINOR 6 CUBLAS_VER_PATCH 3 + {"CUBLASLT_MATMUL_TILE_80x256", {CUDA_126, CUDA_0, CUDA_0 }}, // A: CUDA_VERSION 12062, CUBLAS_VERSION 120603, CUBLAS_VER_MAJOR 12 CUBLAS_VER_MINOR 6 CUBLAS_VER_PATCH 3 + {"CUBLASLT_MATMUL_TILE_80x320", {CUDA_126, CUDA_0, CUDA_0 }}, // A: CUDA_VERSION 12062, CUBLAS_VERSION 120603, CUBLAS_VER_MAJOR 12 CUBLAS_VER_MINOR 6 CUBLAS_VER_PATCH 3 + {"CUBLASLT_MATMUL_TILE_80x384", {CUDA_126, CUDA_0, CUDA_0 }}, // A: CUDA_VERSION 12062, CUBLAS_VERSION 120603, CUBLAS_VER_MAJOR 12 CUBLAS_VER_MINOR 6 CUBLAS_VER_PATCH 3 + {"CUBLASLT_MATMUL_TILE_80x448", {CUDA_126, CUDA_0, CUDA_0 }}, // A: CUDA_VERSION 12062, CUBLAS_VERSION 120603, CUBLAS_VER_MAJOR 12 CUBLAS_VER_MINOR 6 CUBLAS_VER_PATCH 3 + {"CUBLASLT_MATMUL_TILE_80x512", {CUDA_126, CUDA_0, CUDA_0 }}, // A: CUDA_VERSION 12062, CUBLAS_VERSION 120603, CUBLAS_VER_MAJOR 12 CUBLAS_VER_MINOR 6 CUBLAS_VER_PATCH 3 + {"CUBLASLT_MATMUL_TILE_80x576", {CUDA_126, CUDA_0, CUDA_0 }}, // A: CUDA_VERSION 12062, CUBLAS_VERSION 120603, CUBLAS_VER_MAJOR 12 CUBLAS_VER_MINOR 6 CUBLAS_VER_PATCH 3 }; const std::map HIP_BLAS_TYPE_NAME_VER_MAP {