diff --git a/CMakeLists.txt b/CMakeLists.txt index 30cfe7be..02df74d2 100644 --- a/CMakeLists.txt +++ b/CMakeLists.txt @@ -139,7 +139,7 @@ if (NOT HIPIFY_CLANG_TESTS_ONLY) if(MSVC) target_link_libraries(hipify-clang PRIVATE version) - target_compile_options(hipify-clang PRIVATE ${STD} /Od /GR- /EHs- /EHc-) + target_compile_options(hipify-clang PRIVATE ${STD} /Od /GR- /EHs- /EHc- /MP) if((LLVM_PACKAGE_VERSION VERSION_EQUAL "18.0.0" OR LLVM_PACKAGE_VERSION VERSION_GREATER "18.0.0") AND MSVC_VERSION VERSION_GREATER "1919") target_compile_options(hipify-clang PRIVATE /Zc:preprocessor) endif() diff --git a/bin/hipconvertinplace-perl.sh b/bin/hipconvertinplace-perl.sh index 5a4dff3d..0d4202fa 100755 --- a/bin/hipconvertinplace-perl.sh +++ b/bin/hipconvertinplace-perl.sh @@ -12,7 +12,7 @@ # (this is useful for testing improvements to the hipify-perl toolset). SCRIPT_DIR="$(dirname "$(realpath "$0")")" -PRIV_SCRIPT_DIR="$SCRIPT_DIR/../../libexec/hipify" +PRIV_SCRIPT_DIR="$SCRIPT_DIR/../libexec/hipify" SEARCH_DIR=$1 shift $SCRIPT_DIR/hipify-perl -inplace -print-stats "$@" `$PRIV_SCRIPT_DIR/findcode.sh $SEARCH_DIR` diff --git a/bin/hipconvertinplace.sh b/bin/hipconvertinplace.sh index 8a4cebb4..8250667a 100755 --- a/bin/hipconvertinplace.sh +++ b/bin/hipconvertinplace.sh @@ -7,7 +7,7 @@ # preserves the existing directory structure. 
SCRIPT_DIR="$(dirname "$(realpath "$0")")" -PRIV_SCRIPT_DIR="$SCRIPT_DIR/../../libexec/hipify" +PRIV_SCRIPT_DIR="$SCRIPT_DIR/../libexec/hipify" SEARCH_DIR=$1 hipify_args='' diff --git a/bin/hipexamine-perl.sh b/bin/hipexamine-perl.sh index 1ce1591d..ac628196 100755 --- a/bin/hipexamine-perl.sh +++ b/bin/hipexamine-perl.sh @@ -7,7 +7,7 @@ SCRIPT_DIR="$(dirname "$(realpath "$0")")" -PRIV_SCRIPT_DIR="$SCRIPT_DIR/../../libexec/hipify" +PRIV_SCRIPT_DIR="$SCRIPT_DIR/../libexec/hipify" SEARCH_DIR=$1 shift $SCRIPT_DIR/hipify-perl -no-output -print-stats "$@" `$PRIV_SCRIPT_DIR/findcode.sh $SEARCH_DIR` diff --git a/bin/hipexamine.sh b/bin/hipexamine.sh index 028f922a..c6059e24 100755 --- a/bin/hipexamine.sh +++ b/bin/hipexamine.sh @@ -5,7 +5,7 @@ # Generate CUDA->HIP conversion statistics for all the code files in the specified directory. SCRIPT_DIR="$(dirname "$(realpath "$0")")" -PRIV_SCRIPT_DIR="$SCRIPT_DIR/../../libexec/hipify" +PRIV_SCRIPT_DIR="$SCRIPT_DIR/../libexec/hipify" SEARCH_DIR=$1 hipify_args='' diff --git a/bin/hipify-perl b/bin/hipify-perl index 6397256d..d596c73c 100755 --- a/bin/hipify-perl +++ b/bin/hipify-perl @@ -1076,6 +1076,8 @@ my %removed_funcs = ( ); my %experimental_funcs = ( + "cusparseCscGet" => "6.1.0", + "cusparseConstCscGet" => "6.1.0", "cusolverSpSetStream" => "6.1.0", "cusolverSpScsrlsvcholHost" => "6.1.0", "cusolverSpScsrlsvchol" => "6.1.0", @@ -1084,6 +1086,41 @@ my %experimental_funcs = ( "cusolverSpDcsrlsvcholHost" => "6.1.0", "cusolverSpDcsrlsvchol" => "6.1.0", "cusolverSpCreate" => "6.1.0", + "cudaMemcpyNodeParams" => "6.1.0", + "cudaMemFreeNodeParams" => "6.1.0", + "cudaGraphNodeSetParams" => "6.1.0", + "cudaGraphNodeParams" => "6.1.0", + "cudaGraphInstantiateWithParams" => "6.1.0", + "cudaGraphInstantiateSuccess" => "6.1.0", + "cudaGraphInstantiateResult" => "6.1.0", + "cudaGraphInstantiateParams_st" => "6.1.0", + "cudaGraphInstantiateParams" => "6.1.0", + "cudaGraphInstantiateNodeOperationNotSupported" => "6.1.0", + 
"cudaGraphInstantiateMultipleDevicesNotSupported" => "6.1.0", + "cudaGraphInstantiateInvalidStructure" => "6.1.0", + "cudaGraphInstantiateError" => "6.1.0", + "cudaGraphExternalSemaphoresWaitNodeSetParams" => "6.1.0", + "cudaGraphExternalSemaphoresWaitNodeGetParams" => "6.1.0", + "cudaGraphExternalSemaphoresSignalNodeSetParams" => "6.1.0", + "cudaGraphExternalSemaphoresSignalNodeGetParams" => "6.1.0", + "cudaGraphExecNodeSetParams" => "6.1.0", + "cudaGraphExecGetFlags" => "6.1.0", + "cudaGraphExecExternalSemaphoresWaitNodeSetParams" => "6.1.0", + "cudaGraphExecExternalSemaphoresSignalNodeSetParams" => "6.1.0", + "cudaGraphAddNode" => "6.1.0", + "cudaGraphAddExternalSemaphoresWaitNode" => "6.1.0", + "cudaGraphAddExternalSemaphoresSignalNode" => "6.1.0", + "cudaGetDriverEntryPoint" => "6.1.0", + "cudaGPUDirectRDMAWritesOrderingOwner" => "6.1.0", + "cudaGPUDirectRDMAWritesOrderingNone" => "6.1.0", + "cudaGPUDirectRDMAWritesOrderingAllDevices" => "6.1.0", + "cudaGPUDirectRDMAWritesOrdering" => "6.1.0", + "cudaFlushGPUDirectRDMAWritesOptions" => "6.1.0", + "cudaFlushGPUDirectRDMAWritesOptionMemOps" => "6.1.0", + "cudaFlushGPUDirectRDMAWritesOptionHost" => "6.1.0", + "cudaEventWaitNodeParams" => "6.1.0", + "cudaEventRecordNodeParams" => "6.1.0", + "cudaChildGraphNodeParams" => "6.1.0", "cublasZswap_64" => "6.1.0", "cublasZscal_64" => "6.1.0", "cublasZrot_64" => "6.1.0", @@ -1135,7 +1172,62 @@ my %experimental_funcs = ( "cublasCdotc_64" => "6.1.0", "cublasCcopy_64" => "6.1.0", "cublasCaxpy_64" => "6.1.0", + "cuGraphNodeSetParams" => "6.1.0", + "cuGraphMemcpyNodeSetParams" => "6.1.0", + "cuGraphMemcpyNodeGetParams" => "6.1.0", + "cuGraphInstantiateWithParams" => "6.1.0", + "cuGraphExternalSemaphoresWaitNodeSetParams" => "6.1.0", + "cuGraphExternalSemaphoresWaitNodeGetParams" => "6.1.0", + "cuGraphExternalSemaphoresSignalNodeSetParams" => "6.1.0", + "cuGraphExternalSemaphoresSignalNodeGetParams" => "6.1.0", + "cuGraphExecNodeSetParams" => "6.1.0", + 
"cuGraphExecMemsetNodeSetParams" => "6.1.0", + "cuGraphExecMemcpyNodeSetParams" => "6.1.0", + "cuGraphExecGetFlags" => "6.1.0", + "cuGraphExecExternalSemaphoresWaitNodeSetParams" => "6.1.0", + "cuGraphExecExternalSemaphoresSignalNodeSetParams" => "6.1.0", + "cuGraphAddNode" => "6.1.0", + "cuGraphAddMemsetNode" => "6.1.0", + "cuGraphAddMemFreeNode" => "6.1.0", + "cuGraphAddExternalSemaphoresWaitNode" => "6.1.0", + "cuGraphAddExternalSemaphoresSignalNode" => "6.1.0", + "cuGetProcAddress" => "6.1.0", + "CUgraphNodeParams_st" => "6.1.0", + "CUgraphNodeParams" => "6.1.0", + "CUgraphInstantiateResult_enum" => "6.1.0", + "CUgraphInstantiateResult" => "6.1.0", + "CUflushGPUDirectRDMAWritesOptions_enum" => "6.1.0", + "CUflushGPUDirectRDMAWritesOptions" => "6.1.0", + "CUdriverProcAddressQueryResult_enum" => "6.1.0", + "CUdriverProcAddressQueryResult" => "6.1.0", + "CU_GPU_DIRECT_RDMA_WRITES_ORDERING_OWNER" => "6.1.0", + "CU_GPU_DIRECT_RDMA_WRITES_ORDERING_NONE" => "6.1.0", + "CU_GPU_DIRECT_RDMA_WRITES_ORDERING_ALL_DEVICES" => "6.1.0", + "CU_GET_PROC_ADDRESS_VERSION_NOT_SUFFICIENT" => "6.1.0", + "CU_GET_PROC_ADDRESS_SYMBOL_NOT_FOUND" => "6.1.0", + "CU_GET_PROC_ADDRESS_SUCCESS" => "6.1.0", + "CU_FLUSH_GPU_DIRECT_RDMA_WRITES_OPTION_MEMOPS" => "6.1.0", + "CU_FLUSH_GPU_DIRECT_RDMA_WRITES_OPTION_HOST" => "6.1.0", "CUSOLVER_STATUS_MATRIX_TYPE_NOT_SUPPORTED" => "6.1.0", + "CUGPUDirectRDMAWritesOrdering_enum" => "6.1.0", + "CUGPUDirectRDMAWritesOrdering" => "6.1.0", + "CUDA_MEM_FREE_NODE_PARAMS_st" => "6.1.0", + "CUDA_MEM_FREE_NODE_PARAMS" => "6.1.0", + "CUDA_MEMCPY_NODE_PARAMS_st" => "6.1.0", + "CUDA_MEMCPY_NODE_PARAMS" => "6.1.0", + "CUDA_GRAPH_INSTANTIATE_SUCCESS" => "6.1.0", + "CUDA_GRAPH_INSTANTIATE_PARAMS_st" => "6.1.0", + "CUDA_GRAPH_INSTANTIATE_PARAMS" => "6.1.0", + "CUDA_GRAPH_INSTANTIATE_NODE_OPERATION_NOT_SUPPORTED" => "6.1.0", + "CUDA_GRAPH_INSTANTIATE_MULTIPLE_CTXS_NOT_SUPPORTED" => "6.1.0", + "CUDA_GRAPH_INSTANTIATE_INVALID_STRUCTURE" => "6.1.0", + 
"CUDA_GRAPH_INSTANTIATE_ERROR" => "6.1.0", + "CUDA_EVENT_WAIT_NODE_PARAMS_st" => "6.1.0", + "CUDA_EVENT_WAIT_NODE_PARAMS" => "6.1.0", + "CUDA_EVENT_RECORD_NODE_PARAMS_st" => "6.1.0", + "CUDA_EVENT_RECORD_NODE_PARAMS" => "6.1.0", + "CUDA_CHILD_GRAPH_NODE_PARAMS_st" => "6.1.0", + "CUDA_CHILD_GRAPH_NODE_PARAMS" => "6.1.0", "CUBLAS_TF32_TENSOR_OP_MATH" => "6.1.0", "CUBLAS_TENSOR_OP_MATH" => "6.1.0", "CUBLAS_PEDANTIC_MATH" => "6.1.0", @@ -1278,6 +1370,40 @@ sub subst { } sub experimentalSubstitutions { + subst("cuGraphAddExternalSemaphoresSignalNode", "hipGraphAddExternalSemaphoresSignalNode", "graph"); + subst("cuGraphAddExternalSemaphoresWaitNode", "hipGraphAddExternalSemaphoresWaitNode", "graph"); + subst("cuGraphAddMemFreeNode", "hipDrvGraphAddMemFreeNode", "graph"); + subst("cuGraphAddMemsetNode", "hipDrvGraphAddMemsetNode", "graph"); + subst("cuGraphAddNode", "hipGraphAddNode", "graph"); + subst("cuGraphExecExternalSemaphoresSignalNodeSetParams", "hipGraphExecExternalSemaphoresSignalNodeSetParams", "graph"); + subst("cuGraphExecExternalSemaphoresWaitNodeSetParams", "hipGraphExecExternalSemaphoresWaitNodeSetParams", "graph"); + subst("cuGraphExecGetFlags", "hipGraphExecGetFlags", "graph"); + subst("cuGraphExecMemcpyNodeSetParams", "hipDrvGraphExecMemcpyNodeSetParams", "graph"); + subst("cuGraphExecMemsetNodeSetParams", "hipDrvGraphExecMemsetNodeSetParams", "graph"); + subst("cuGraphExecNodeSetParams", "hipGraphExecNodeSetParams", "graph"); + subst("cuGraphExternalSemaphoresSignalNodeGetParams", "hipGraphExternalSemaphoresSignalNodeGetParams", "graph"); + subst("cuGraphExternalSemaphoresSignalNodeSetParams", "hipGraphExternalSemaphoresSignalNodeSetParams", "graph"); + subst("cuGraphExternalSemaphoresWaitNodeGetParams", "hipGraphExternalSemaphoresWaitNodeGetParams", "graph"); + subst("cuGraphExternalSemaphoresWaitNodeSetParams", "hipGraphExternalSemaphoresWaitNodeSetParams", "graph"); + subst("cuGraphInstantiateWithParams", "hipGraphInstantiateWithParams", "graph"); 
+ subst("cuGraphMemcpyNodeGetParams", "hipDrvGraphMemcpyNodeGetParams", "graph"); + subst("cuGraphMemcpyNodeSetParams", "hipDrvGraphMemcpyNodeSetParams", "graph"); + subst("cuGraphNodeSetParams", "hipGraphNodeSetParams", "graph"); + subst("cudaGraphAddExternalSemaphoresSignalNode", "hipGraphAddExternalSemaphoresSignalNode", "graph"); + subst("cudaGraphAddExternalSemaphoresWaitNode", "hipGraphAddExternalSemaphoresWaitNode", "graph"); + subst("cudaGraphAddNode", "hipGraphAddNode", "graph"); + subst("cudaGraphExecExternalSemaphoresSignalNodeSetParams", "hipGraphExecExternalSemaphoresSignalNodeSetParams", "graph"); + subst("cudaGraphExecExternalSemaphoresWaitNodeSetParams", "hipGraphExecExternalSemaphoresWaitNodeSetParams", "graph"); + subst("cudaGraphExecGetFlags", "hipGraphExecGetFlags", "graph"); + subst("cudaGraphExecNodeSetParams", "hipGraphExecNodeSetParams", "graph"); + subst("cudaGraphExternalSemaphoresSignalNodeGetParams", "hipGraphExternalSemaphoresSignalNodeGetParams", "graph"); + subst("cudaGraphExternalSemaphoresSignalNodeSetParams", "hipGraphExternalSemaphoresSignalNodeSetParams", "graph"); + subst("cudaGraphExternalSemaphoresWaitNodeGetParams", "hipGraphExternalSemaphoresWaitNodeGetParams", "graph"); + subst("cudaGraphExternalSemaphoresWaitNodeSetParams", "hipGraphExternalSemaphoresWaitNodeSetParams", "graph"); + subst("cudaGraphInstantiateWithParams", "hipGraphInstantiateWithParams", "graph"); + subst("cudaGraphNodeSetParams", "hipGraphNodeSetParams", "graph"); + subst("cuGetProcAddress", "hipGetProcAddress", "driver_entry_point"); + subst("cudaGetDriverEntryPoint", "hipGetProcAddress", "driver_entry_point"); subst("cublasAxpyEx_64", "hipblasAxpyEx_64", "library"); subst("cublasCaxpy_64", "hipblasCaxpy_v2_64", "library"); subst("cublasCcopy_64", "hipblasCcopy_v2_64", "library"); @@ -1341,14 +1467,72 @@ sub experimentalSubstitutions { subst("cusolverSpScsrlsvchol", "hipsolverSpScsrlsvchol", "library"); subst("cusolverSpScsrlsvcholHost", 
"hipsolverSpScsrlsvcholHost", "library"); subst("cusolverSpSetStream", "hipsolverSpSetStream", "library"); + subst("cusparseConstCscGet", "hipsparseConstCscGet", "library"); + subst("cusparseCscGet", "hipsparseCscGet", "library"); + subst("CUDA_CHILD_GRAPH_NODE_PARAMS", "hipChildGraphNodeParams", "type"); + subst("CUDA_CHILD_GRAPH_NODE_PARAMS_st", "hipChildGraphNodeParams", "type"); + subst("CUDA_EVENT_RECORD_NODE_PARAMS", "hipEventRecordNodeParams", "type"); + subst("CUDA_EVENT_RECORD_NODE_PARAMS_st", "hipEventRecordNodeParams", "type"); + subst("CUDA_EVENT_WAIT_NODE_PARAMS", "hipEventWaitNodeParams", "type"); + subst("CUDA_EVENT_WAIT_NODE_PARAMS_st", "hipEventWaitNodeParams", "type"); + subst("CUDA_GRAPH_INSTANTIATE_PARAMS", "hipGraphInstantiateParams", "type"); + subst("CUDA_GRAPH_INSTANTIATE_PARAMS_st", "hipGraphInstantiateParams", "type"); + subst("CUDA_MEMCPY_NODE_PARAMS", "hipMemcpyNodeParams", "type"); + subst("CUDA_MEMCPY_NODE_PARAMS_st", "hipMemcpyNodeParams", "type"); + subst("CUDA_MEM_FREE_NODE_PARAMS", "hipMemFreeNodeParams", "type"); + subst("CUDA_MEM_FREE_NODE_PARAMS_st", "hipMemFreeNodeParams", "type"); + subst("CUGPUDirectRDMAWritesOrdering", "hipGPUDirectRDMAWritesOrdering", "type"); + subst("CUGPUDirectRDMAWritesOrdering_enum", "hipGPUDirectRDMAWritesOrdering", "type"); + subst("CUdriverProcAddressQueryResult", "hipDriverProcAddressQueryResult", "type"); + subst("CUdriverProcAddressQueryResult_enum", "hipDriverProcAddressQueryResult", "type"); + subst("CUflushGPUDirectRDMAWritesOptions", "hipFlushGPUDirectRDMAWritesOptions", "type"); + subst("CUflushGPUDirectRDMAWritesOptions_enum", "hipFlushGPUDirectRDMAWritesOptions", "type"); + subst("CUgraphInstantiateResult", "hipGraphInstantiateResult", "type"); + subst("CUgraphInstantiateResult_enum", "hipGraphInstantiateResult", "type"); + subst("CUgraphNodeParams", "hipGraphNodeParams", "type"); + subst("CUgraphNodeParams_st", "hipGraphNodeParams", "type"); subst("cublasMath_t", "hipblasMath_t", "type"); 
+ subst("cudaChildGraphNodeParams", "hipChildGraphNodeParams", "type"); + subst("cudaEventRecordNodeParams", "hipEventRecordNodeParams", "type"); + subst("cudaEventWaitNodeParams", "hipEventWaitNodeParams", "type"); + subst("cudaFlushGPUDirectRDMAWritesOptions", "hipFlushGPUDirectRDMAWritesOptions", "type"); + subst("cudaGPUDirectRDMAWritesOrdering", "hipGPUDirectRDMAWritesOrdering", "type"); + subst("cudaGraphInstantiateParams", "hipGraphInstantiateParams", "type"); + subst("cudaGraphInstantiateParams_st", "hipGraphInstantiateParams", "type"); + subst("cudaGraphInstantiateResult", "hipGraphInstantiateResult", "type"); + subst("cudaGraphNodeParams", "hipGraphNodeParams", "type"); + subst("cudaMemFreeNodeParams", "hipMemFreeNodeParams", "type"); + subst("cudaMemcpyNodeParams", "hipMemcpyNodeParams", "type"); subst("cusolverSpHandle_t", "hipsolverSpHandle_t", "type"); subst("CUBLAS_DEFAULT_MATH", "HIPBLAS_DEFAULT_MATH", "numeric_literal"); subst("CUBLAS_MATH_DISALLOW_REDUCED_PRECISION_REDUCTION", "HIPBLAS_MATH_DISALLOW_REDUCED_PRECISION_REDUCTION", "numeric_literal"); subst("CUBLAS_PEDANTIC_MATH", "HIPBLAS_PEDANTIC_MATH", "numeric_literal"); subst("CUBLAS_TENSOR_OP_MATH", "HIPBLAS_TENSOR_OP_MATH", "numeric_literal"); subst("CUBLAS_TF32_TENSOR_OP_MATH", "HIPBLAS_TF32_TENSOR_OP_MATH", "numeric_literal"); + subst("CUDA_GRAPH_INSTANTIATE_ERROR", "hipGraphInstantiateError", "numeric_literal"); + subst("CUDA_GRAPH_INSTANTIATE_INVALID_STRUCTURE", "hipGraphInstantiateInvalidStructure", "numeric_literal"); + subst("CUDA_GRAPH_INSTANTIATE_MULTIPLE_CTXS_NOT_SUPPORTED", "hipGraphInstantiateMultipleDevicesNotSupported", "numeric_literal"); + subst("CUDA_GRAPH_INSTANTIATE_NODE_OPERATION_NOT_SUPPORTED", "hipGraphInstantiateNodeOperationNotSupported", "numeric_literal"); + subst("CUDA_GRAPH_INSTANTIATE_SUCCESS", "hipGraphInstantiateSuccess", "numeric_literal"); subst("CUSOLVER_STATUS_MATRIX_TYPE_NOT_SUPPORTED", "HIPSOLVER_STATUS_MATRIX_TYPE_NOT_SUPPORTED", "numeric_literal"); + 
subst("CU_FLUSH_GPU_DIRECT_RDMA_WRITES_OPTION_HOST", "hipFlushGPUDirectRDMAWritesOptionHost", "numeric_literal"); + subst("CU_FLUSH_GPU_DIRECT_RDMA_WRITES_OPTION_MEMOPS", "hipFlushGPUDirectRDMAWritesOptionMemOps", "numeric_literal"); + subst("CU_GET_PROC_ADDRESS_SUCCESS", "HIP_GET_PROC_ADDRESS_SUCCESS", "numeric_literal"); + subst("CU_GET_PROC_ADDRESS_SYMBOL_NOT_FOUND", "HIP_GET_PROC_ADDRESS_SYMBOL_NOT_FOUND", "numeric_literal"); + subst("CU_GET_PROC_ADDRESS_VERSION_NOT_SUFFICIENT", "HIP_GET_PROC_ADDRESS_VERSION_NOT_SUFFICIENT", "numeric_literal"); + subst("CU_GPU_DIRECT_RDMA_WRITES_ORDERING_ALL_DEVICES", "hipGPUDirectRDMAWritesOrderingAllDevices", "numeric_literal"); + subst("CU_GPU_DIRECT_RDMA_WRITES_ORDERING_NONE", "hipGPUDirectRDMAWritesOrderingNone", "numeric_literal"); + subst("CU_GPU_DIRECT_RDMA_WRITES_ORDERING_OWNER", "hipGPUDirectRDMAWritesOrderingOwner", "numeric_literal"); + subst("cudaFlushGPUDirectRDMAWritesOptionHost", "hipFlushGPUDirectRDMAWritesOptionHost", "numeric_literal"); + subst("cudaFlushGPUDirectRDMAWritesOptionMemOps", "hipFlushGPUDirectRDMAWritesOptionMemOps", "numeric_literal"); + subst("cudaGPUDirectRDMAWritesOrderingAllDevices", "hipGPUDirectRDMAWritesOrderingAllDevices", "numeric_literal"); + subst("cudaGPUDirectRDMAWritesOrderingNone", "hipGPUDirectRDMAWritesOrderingNone", "numeric_literal"); + subst("cudaGPUDirectRDMAWritesOrderingOwner", "hipGPUDirectRDMAWritesOrderingOwner", "numeric_literal"); + subst("cudaGraphInstantiateError", "hipGraphInstantiateError", "numeric_literal"); + subst("cudaGraphInstantiateInvalidStructure", "hipGraphInstantiateInvalidStructure", "numeric_literal"); + subst("cudaGraphInstantiateMultipleDevicesNotSupported", "hipGraphInstantiateMultipleDevicesNotSupported", "numeric_literal"); + subst("cudaGraphInstantiateNodeOperationNotSupported", "hipGraphInstantiateNodeOperationNotSupported", "numeric_literal"); + subst("cudaGraphInstantiateSuccess", "hipGraphInstantiateSuccess", "numeric_literal"); } sub 
rocSubstitutions { @@ -2053,6 +2237,7 @@ sub rocSubstitutions { subst("cusparseCreateMatDescr", "rocsparse_create_mat_descr", "library"); subst("cusparseCreatePruneInfo", "rocsparse_create_mat_info", "library"); subst("cusparseCreateSpVec", "rocsparse_create_spvec_descr", "library"); + subst("cusparseCscGet", "rocsparse_csc_get", "library"); subst("cusparseCscSetPointers", "rocsparse_csc_set_pointers", "library"); subst("cusparseCsctr", "rocsparse_csctr", "library"); subst("cusparseCsr2cscEx2_bufferSize", "rocsparse_csr2csc_buffer_size", "library"); @@ -2272,8 +2457,11 @@ sub rocSubstitutions { subst("cusparseShybmv", "rocsparse_shybmv", "library"); subst("cusparseSnnz", "rocsparse_snnz", "library"); subst("cusparseSnnz_compress", "rocsparse_snnz_compress", "library"); + subst("cusparseSpMM", "rocsparse_spmm", "library"); subst("cusparseSpMM_bufferSize", "rocsparse_spmm", "library"); + subst("cusparseSpMM_preprocess", "rocsparse_spmm", "library"); subst("cusparseSpMV", "rocsparse_spmv", "library"); + subst("cusparseSpMV_bufferSize", "rocsparse_spmv", "library"); subst("cusparseSpMatGetAttribute", "rocsparse_spmat_get_attribute", "library"); subst("cusparseSpMatGetFormat", "rocsparse_spmat_get_format", "library"); subst("cusparseSpMatGetIndexBase", "rocsparse_spmat_get_index_base", "library"); @@ -2285,6 +2473,9 @@ sub rocSubstitutions { subst("cusparseSpMatSetValues", "rocsparse_spmat_set_values", "library"); subst("cusparseSpSM_analysis", "rocsparse_spsm", "library"); subst("cusparseSpSM_solve", "rocsparse_spsm", "library"); + subst("cusparseSpSV_bufferSize", "rocsparse_spsv", "library"); + subst("cusparseSpVV", "rocsparse_spvv", "library"); + subst("cusparseSpVV_bufferSize", "rocsparse_spvv", "library"); subst("cusparseSpVecGet", "rocsparse_spvec_get", "library"); subst("cusparseSpVecGetIndexBase", "rocsparse_spvec_get_index_base", "library"); subst("cusparseSpVecGetValues", "rocsparse_spvec_get_values", "library"); @@ -3106,15 +3297,10 @@ sub simpleSubstitutions 
{ subst("cuGraphAddEmptyNode", "hipGraphAddEmptyNode", "graph"); subst("cuGraphAddEventRecordNode", "hipGraphAddEventRecordNode", "graph"); subst("cuGraphAddEventWaitNode", "hipGraphAddEventWaitNode", "graph"); - subst("cuGraphAddExternalSemaphoresSignalNode", "hipGraphAddExternalSemaphoresSignalNode", "graph"); - subst("cuGraphAddExternalSemaphoresWaitNode", "hipGraphAddExternalSemaphoresWaitNode", "graph"); subst("cuGraphAddHostNode", "hipGraphAddHostNode", "graph"); subst("cuGraphAddKernelNode", "hipGraphAddKernelNode", "graph"); subst("cuGraphAddMemAllocNode", "hipGraphAddMemAllocNode", "graph"); - subst("cuGraphAddMemFreeNode", "hipGraphAddMemFreeNode", "graph"); subst("cuGraphAddMemcpyNode", "hipDrvGraphAddMemcpyNode", "graph"); - subst("cuGraphAddMemsetNode", "hipGraphAddMemsetNode", "graph"); - subst("cuGraphAddNode", "hipGraphAddNode", "graph"); subst("cuGraphBatchMemOpNodeGetParams", "hipGraphBatchMemOpNodeGetParams", "graph"); subst("cuGraphBatchMemOpNodeSetParams", "hipGraphBatchMemOpNodeSetParams", "graph"); subst("cuGraphChildGraphNodeGetGraph", "hipGraphChildGraphNodeGetGraph", "graph"); @@ -3132,17 +3318,9 @@ sub simpleSubstitutions { subst("cuGraphExecDestroy", "hipGraphExecDestroy", "graph"); subst("cuGraphExecEventRecordNodeSetEvent", "hipGraphExecEventRecordNodeSetEvent", "graph"); subst("cuGraphExecEventWaitNodeSetEvent", "hipGraphExecEventWaitNodeSetEvent", "graph"); - subst("cuGraphExecExternalSemaphoresSignalNodeSetParams", "hipGraphExecExternalSemaphoresSignalNodeSetParams", "graph"); - subst("cuGraphExecExternalSemaphoresWaitNodeSetParams", "hipGraphExecExternalSemaphoresWaitNodeSetParams", "graph"); - subst("cuGraphExecGetFlags", "hipGraphExecGetFlags", "graph"); subst("cuGraphExecHostNodeSetParams", "hipGraphExecHostNodeSetParams", "graph"); subst("cuGraphExecKernelNodeSetParams", "hipGraphExecKernelNodeSetParams", "graph"); - subst("cuGraphExecNodeSetParams", "hipGraphExecNodeSetParams", "graph"); subst("cuGraphExecUpdate", 
"hipGraphExecUpdate", "graph"); - subst("cuGraphExternalSemaphoresSignalNodeGetParams", "hipGraphExternalSemaphoresSignalNodeGetParams", "graph"); - subst("cuGraphExternalSemaphoresSignalNodeSetParams", "hipGraphExternalSemaphoresSignalNodeSetParams", "graph"); - subst("cuGraphExternalSemaphoresWaitNodeGetParams", "hipGraphExternalSemaphoresWaitNodeGetParams", "graph"); - subst("cuGraphExternalSemaphoresWaitNodeSetParams", "hipGraphExternalSemaphoresWaitNodeSetParams", "graph"); subst("cuGraphGetEdges", "hipGraphGetEdges", "graph"); subst("cuGraphGetNodes", "hipGraphGetNodes", "graph"); subst("cuGraphGetRootNodes", "hipGraphGetRootNodes", "graph"); @@ -3150,7 +3328,6 @@ sub simpleSubstitutions { subst("cuGraphHostNodeSetParams", "hipGraphHostNodeSetParams", "graph"); subst("cuGraphInstantiate", "hipGraphInstantiate", "graph"); subst("cuGraphInstantiateWithFlags", "hipGraphInstantiateWithFlags", "graph"); - subst("cuGraphInstantiateWithParams", "hipGraphInstantiateWithParams", "graph"); subst("cuGraphInstantiate_v2", "hipGraphInstantiate", "graph"); subst("cuGraphKernelNodeCopyAttributes", "hipGraphKernelNodeCopyAttributes", "graph"); subst("cuGraphKernelNodeGetAttribute", "hipGraphKernelNodeGetAttribute", "graph"); @@ -3160,8 +3337,6 @@ sub simpleSubstitutions { subst("cuGraphLaunch", "hipGraphLaunch", "graph"); subst("cuGraphMemAllocNodeGetParams", "hipGraphMemAllocNodeGetParams", "graph"); subst("cuGraphMemFreeNodeGetParams", "hipGraphMemFreeNodeGetParams", "graph"); - subst("cuGraphMemcpyNodeGetParams", "hipGraphMemcpyNodeGetParams", "graph"); - subst("cuGraphMemcpyNodeSetParams", "hipGraphMemcpyNodeSetParams", "graph"); subst("cuGraphMemsetNodeGetParams", "hipGraphMemsetNodeGetParams", "graph"); subst("cuGraphMemsetNodeSetParams", "hipGraphMemsetNodeSetParams", "graph"); subst("cuGraphNodeFindInClone", "hipGraphNodeFindInClone", "graph"); @@ -3170,7 +3345,6 @@ sub simpleSubstitutions { subst("cuGraphNodeGetEnabled", "hipGraphNodeGetEnabled", "graph"); 
subst("cuGraphNodeGetType", "hipGraphNodeGetType", "graph"); subst("cuGraphNodeSetEnabled", "hipGraphNodeSetEnabled", "graph"); - subst("cuGraphNodeSetParams", "hipGraphNodeSetParams", "graph"); subst("cuGraphReleaseUserObject", "hipGraphReleaseUserObject", "graph"); subst("cuGraphRemoveDependencies", "hipGraphRemoveDependencies", "graph"); subst("cuGraphRetainUserObject", "hipGraphRetainUserObject", "graph"); @@ -3186,8 +3360,6 @@ sub simpleSubstitutions { subst("cudaGraphAddEmptyNode", "hipGraphAddEmptyNode", "graph"); subst("cudaGraphAddEventRecordNode", "hipGraphAddEventRecordNode", "graph"); subst("cudaGraphAddEventWaitNode", "hipGraphAddEventWaitNode", "graph"); - subst("cudaGraphAddExternalSemaphoresSignalNode", "hipGraphAddExternalSemaphoresSignalNode", "graph"); - subst("cudaGraphAddExternalSemaphoresWaitNode", "hipGraphAddExternalSemaphoresWaitNode", "graph"); subst("cudaGraphAddHostNode", "hipGraphAddHostNode", "graph"); subst("cudaGraphAddKernelNode", "hipGraphAddKernelNode", "graph"); subst("cudaGraphAddMemAllocNode", "hipGraphAddMemAllocNode", "graph"); @@ -3211,8 +3383,6 @@ sub simpleSubstitutions { subst("cudaGraphExecDestroy", "hipGraphExecDestroy", "graph"); subst("cudaGraphExecEventRecordNodeSetEvent", "hipGraphExecEventRecordNodeSetEvent", "graph"); subst("cudaGraphExecEventWaitNodeSetEvent", "hipGraphExecEventWaitNodeSetEvent", "graph"); - subst("cudaGraphExecExternalSemaphoresSignalNodeSetParams", "hipGraphExecExternalSemaphoresSignalNodeSetParams", "graph"); - subst("cudaGraphExecExternalSemaphoresWaitNodeSetParams", "hipGraphExecExternalSemaphoresWaitNodeSetParams", "graph"); subst("cudaGraphExecHostNodeSetParams", "hipGraphExecHostNodeSetParams", "graph"); subst("cudaGraphExecKernelNodeSetParams", "hipGraphExecKernelNodeSetParams", "graph"); subst("cudaGraphExecMemcpyNodeSetParams", "hipGraphExecMemcpyNodeSetParams", "graph"); @@ -3221,10 +3391,6 @@ sub simpleSubstitutions { subst("cudaGraphExecMemcpyNodeSetParamsToSymbol", 
"hipGraphExecMemcpyNodeSetParamsToSymbol", "graph"); subst("cudaGraphExecMemsetNodeSetParams", "hipGraphExecMemsetNodeSetParams", "graph"); subst("cudaGraphExecUpdate", "hipGraphExecUpdate", "graph"); - subst("cudaGraphExternalSemaphoresSignalNodeGetParams", "hipGraphExternalSemaphoresSignalNodeGetParams", "graph"); - subst("cudaGraphExternalSemaphoresSignalNodeSetParams", "hipGraphExternalSemaphoresSignalNodeSetParams", "graph"); - subst("cudaGraphExternalSemaphoresWaitNodeGetParams", "hipGraphExternalSemaphoresWaitNodeGetParams", "graph"); - subst("cudaGraphExternalSemaphoresWaitNodeSetParams", "hipGraphExternalSemaphoresWaitNodeSetParams", "graph"); subst("cudaGraphGetEdges", "hipGraphGetEdges", "graph"); subst("cudaGraphGetNodes", "hipGraphGetNodes", "graph"); subst("cudaGraphGetRootNodes", "hipGraphGetRootNodes", "graph"); @@ -7737,7 +7903,6 @@ sub warnUnsupportedFunctions { "cusparseCsrmvEx", "cusparseCsrilu0Ex", "cusparseCsr2cscEx", - "cusparseCscGet", "cusparseCreateSolveAnalysisInfo", "cusparseCreateSlicedEll", "cusparseCreateConstSlicedEll", @@ -7746,7 +7911,6 @@ sub warnUnsupportedFunctions { "cusparseContext", "cusparseConstrainedGeMM_bufferSize", "cusparseConstrainedGeMM", - "cusparseConstCscGet", "cusparseColorInfo", "cusparseColorAlg_t", "cusparseChybsv_solve", @@ -8482,7 +8646,6 @@ sub warnUnsupportedFunctions { "cudaMemsetParamsV2", "cudaMemoryTypeUnregistered", "cudaMemcpyToArrayAsync", - "cudaMemcpyNodeParams", "cudaMemcpyFromArrayAsync", "cudaMemcpyArrayToArray", "cudaMemcpy3DPeerParms", @@ -8497,7 +8660,6 @@ sub warnUnsupportedFunctions { "cudaMemLocationTypeHostNumaCurrent", "cudaMemLocationTypeHostNuma", "cudaMemLocationTypeHost", - "cudaMemFreeNodeParams", "cudaMemFabricHandle_t", "cudaMemFabricHandle_st", "cudaMemAllocNodeParamsV2", @@ -8564,28 +8726,15 @@ sub warnUnsupportedFunctions { "cudaGraphicsCubeFaceNegativeX", "cudaGraphicsCubeFace", "cudaGraphRemoveDependencies_v2", - "cudaGraphNodeSetParams", - "cudaGraphNodeParams", 
"cudaGraphNodeGetDependentNodes_v2", "cudaGraphNodeGetDependencies_v2", "cudaGraphKernelNodePortProgrammatic", "cudaGraphKernelNodePortLaunchCompletion", "cudaGraphKernelNodePortDefault", - "cudaGraphInstantiateWithParams", - "cudaGraphInstantiateSuccess", - "cudaGraphInstantiateResult", - "cudaGraphInstantiateParams_st", - "cudaGraphInstantiateParams", - "cudaGraphInstantiateNodeOperationNotSupported", - "cudaGraphInstantiateMultipleDevicesNotSupported", - "cudaGraphInstantiateInvalidStructure", - "cudaGraphInstantiateError", "cudaGraphGetEdges_v2", "cudaGraphExecUpdateResultInfo_st", "cudaGraphExecUpdateResultInfo", "cudaGraphExecUpdateErrorAttributesChanged", - "cudaGraphExecNodeSetParams", - "cudaGraphExecGetFlags", "cudaGraphEdgeData_st", "cudaGraphEdgeData", "cudaGraphDependencyType_enum", @@ -8601,7 +8750,6 @@ sub warnUnsupportedFunctions { "cudaGraphCondTypeIf", "cudaGraphCondAssignDefault", "cudaGraphAddNode_v2", - "cudaGraphAddNode", "cudaGraphAddDependencies_v2", "cudaGetTextureObjectTextureDesc_v2", "cudaGetSurfaceReference", @@ -8611,11 +8759,6 @@ sub warnUnsupportedFunctions { "cudaGetKernel", "cudaGetFuncBySymbol", "cudaGetDriverEntryPointFlags", - "cudaGetDriverEntryPoint", - "cudaGPUDirectRDMAWritesOrderingOwner", - "cudaGPUDirectRDMAWritesOrderingNone", - "cudaGPUDirectRDMAWritesOrderingAllDevices", - "cudaGPUDirectRDMAWritesOrdering", "cudaGLUnregisterBufferObject", "cudaGLUnmapBufferObjectAsync", "cudaGLUnmapBufferObject", @@ -8642,9 +8785,6 @@ sub warnUnsupportedFunctions { "cudaFlushGPUDirectRDMAWritesTargetCurrentDevice", "cudaFlushGPUDirectRDMAWritesTarget", "cudaFlushGPUDirectRDMAWritesScope", - "cudaFlushGPUDirectRDMAWritesOptions", - "cudaFlushGPUDirectRDMAWritesOptionMemOps", - "cudaFlushGPUDirectRDMAWritesOptionHost", "cudaExternalSemaphoreWaitSkipNvSciBufMemSync", "cudaExternalSemaphoreSignalSkipNvSciBufMemSync", "cudaExternalSemaphoreHandleTypeTimelineSemaphoreWin32", @@ -8656,11 +8796,9 @@ sub warnUnsupportedFunctions { 
"cudaExternalMemoryMipmappedArrayDesc", "cudaExternalMemoryHandleTypeNvSciBuf", "cudaExternalMemoryGetMappedMipmappedArray", - "cudaEventWaitNodeParams", "cudaEventWaitExternal", "cudaEventWaitDefault", "cudaEventRecordWithFlags", - "cudaEventRecordNodeParams", "cudaEventRecordExternal", "cudaEventRecordDefault", "cudaEventCreateFromEGLSync", @@ -8932,7 +9070,6 @@ sub warnUnsupportedFunctions { "cudaClusterSchedulingPolicyLoadBalancing", "cudaClusterSchedulingPolicyDefault", "cudaClusterSchedulingPolicy", - "cudaChildGraphNodeParams", "cudaChannelFormatKindUnsignedNormalized8X4", "cudaChannelFormatKindUnsignedNormalized8X2", "cudaChannelFormatKindUnsignedNormalized8X1", @@ -9078,12 +9215,9 @@ sub warnUnsupportedFunctions { "cuGraphNodeGetDependentNodes_v2", "cuGraphNodeGetDependencies_v2", "cuGraphGetEdges_v2", - "cuGraphExecMemsetNodeSetParams", - "cuGraphExecMemcpyNodeSetParams", "cuGraphConditionalHandleCreate", "cuGraphAddNode_v2", "cuGraphAddDependencies_v2", - "cuGetProcAddress", "cuGLUnregisterBufferObject", "cuGLUnmapBufferObjectAsync", "cuGLUnmapBufferObject", @@ -9300,10 +9434,6 @@ sub warnUnsupportedFunctions { "CUipcMem_flags", "CUgraphicsMapResourceFlags_enum", "CUgraphicsMapResourceFlags", - "CUgraphNodeParams_st", - "CUgraphNodeParams", - "CUgraphInstantiateResult_enum", - "CUgraphInstantiateResult", "CUgraphExecUpdateResultInfo_v1", "CUgraphExecUpdateResultInfo_st", "CUgraphExecUpdateResultInfo", @@ -9318,8 +9448,6 @@ sub warnUnsupportedFunctions { "CUflushGPUDirectRDMAWritesTarget", "CUflushGPUDirectRDMAWritesScope_enum", "CUflushGPUDirectRDMAWritesScope", - "CUflushGPUDirectRDMAWritesOptions_enum", - "CUflushGPUDirectRDMAWritesOptions", "CUexternalSemaphore_st", "CUexternalMemory_st", "CUextSemaphore_st", @@ -9350,8 +9478,6 @@ sub warnUnsupportedFunctions { "CUeglColorFormat", "CUdriverProcAddress_flags_enum", "CUdriverProcAddress_flags", - "CUdriverProcAddressQueryResult_enum", - "CUdriverProcAddressQueryResult", "CUdevprop_v1", "CUdevprop_st", 
"CUdevprop", @@ -9553,15 +9679,9 @@ sub warnUnsupportedFunctions { "CU_GRAPHICS_MAP_RESOURCE_FLAGS_WRITE_DISCARD", "CU_GRAPHICS_MAP_RESOURCE_FLAGS_READ_ONLY", "CU_GRAPHICS_MAP_RESOURCE_FLAGS_NONE", - "CU_GPU_DIRECT_RDMA_WRITES_ORDERING_OWNER", - "CU_GPU_DIRECT_RDMA_WRITES_ORDERING_NONE", - "CU_GPU_DIRECT_RDMA_WRITES_ORDERING_ALL_DEVICES", "CU_GL_MAP_RESOURCE_FLAGS_WRITE_DISCARD", "CU_GL_MAP_RESOURCE_FLAGS_READ_ONLY", "CU_GL_MAP_RESOURCE_FLAGS_NONE", - "CU_GET_PROC_ADDRESS_VERSION_NOT_SUFFICIENT", - "CU_GET_PROC_ADDRESS_SYMBOL_NOT_FOUND", - "CU_GET_PROC_ADDRESS_SUCCESS", "CU_GET_PROC_ADDRESS_PER_THREAD_DEFAULT_STREAM", "CU_GET_PROC_ADDRESS_LEGACY_STREAM", "CU_GET_PROC_ADDRESS_DEFAULT", @@ -9574,8 +9694,6 @@ sub warnUnsupportedFunctions { "CU_FLUSH_GPU_DIRECT_RDMA_WRITES_TO_OWNER", "CU_FLUSH_GPU_DIRECT_RDMA_WRITES_TO_ALL_DEVICES", "CU_FLUSH_GPU_DIRECT_RDMA_WRITES_TARGET_CURRENT_CTX", - "CU_FLUSH_GPU_DIRECT_RDMA_WRITES_OPTION_MEMOPS", - "CU_FLUSH_GPU_DIRECT_RDMA_WRITES_OPTION_HOST", "CU_EXTERNAL_SEMAPHORE_HANDLE_TYPE_TIMELINE_SEMAPHORE_WIN32", "CU_EXTERNAL_SEMAPHORE_HANDLE_TYPE_TIMELINE_SEMAPHORE_FD", "CU_EXTERNAL_SEMAPHORE_HANDLE_TYPE_NVSCISYNC", @@ -9872,8 +9990,6 @@ sub warnUnsupportedFunctions { "CURAND_CHOOSE_BEST", "CURAND_BINARY_SEARCH", "CURAND_3RD", - "CUGPUDirectRDMAWritesOrdering_enum", - "CUGPUDirectRDMAWritesOrdering", "CUGLmap_flags_enum", "CUGLmap_flags", "CUFFT_XT_FORMAT_OUTPUT", @@ -10477,14 +10593,10 @@ sub warnUnsupportedFunctions { "CUDA_POINTER_ATTRIBUTE_ACCESS_FLAGS", "CUDA_NVSCISYNC_ATTR_WAIT", "CUDA_NVSCISYNC_ATTR_SIGNAL", - "CUDA_MEM_FREE_NODE_PARAMS_st", - "CUDA_MEM_FREE_NODE_PARAMS", "CUDA_MEM_ALLOC_NODE_PARAMS_v2_st", "CUDA_MEM_ALLOC_NODE_PARAMS_v2", "CUDA_MEMSET_NODE_PARAMS_v2_st", "CUDA_MEMSET_NODE_PARAMS_v2", - "CUDA_MEMCPY_NODE_PARAMS_st", - "CUDA_MEMCPY_NODE_PARAMS", "CUDA_MEMCPY3D_PEER_v1", "CUDA_MEMCPY3D_PEER_st", "CUDA_MEMCPY3D_PEER", @@ -10494,22 +10606,11 @@ sub warnUnsupportedFunctions { "CUDA_KERNEL_NODE_PARAMS_v2", 
"CUDA_HOST_NODE_PARAMS_v2_st", "CUDA_HOST_NODE_PARAMS_v2", - "CUDA_GRAPH_INSTANTIATE_SUCCESS", - "CUDA_GRAPH_INSTANTIATE_PARAMS_st", - "CUDA_GRAPH_INSTANTIATE_PARAMS", - "CUDA_GRAPH_INSTANTIATE_NODE_OPERATION_NOT_SUPPORTED", - "CUDA_GRAPH_INSTANTIATE_MULTIPLE_CTXS_NOT_SUPPORTED", - "CUDA_GRAPH_INSTANTIATE_INVALID_STRUCTURE", - "CUDA_GRAPH_INSTANTIATE_ERROR", "CUDA_EXTERNAL_SEMAPHORE_WAIT_SKIP_NVSCIBUF_MEMSYNC", "CUDA_EXTERNAL_SEMAPHORE_SIGNAL_SKIP_NVSCIBUF_MEMSYNC", "CUDA_EXTERNAL_MEMORY_MIPMAPPED_ARRAY_DESC_v1", "CUDA_EXTERNAL_MEMORY_MIPMAPPED_ARRAY_DESC_st", "CUDA_EXTERNAL_MEMORY_MIPMAPPED_ARRAY_DESC", - "CUDA_EVENT_WAIT_NODE_PARAMS_st", - "CUDA_EVENT_WAIT_NODE_PARAMS", - "CUDA_EVENT_RECORD_NODE_PARAMS_st", - "CUDA_EVENT_RECORD_NODE_PARAMS", "CUDA_ERROR_UNSUPPORTED_PTX_VERSION", "CUDA_ERROR_UNSUPPORTED_EXEC_AFFINITY", "CUDA_ERROR_UNSUPPORTED_DEVSIDE_SYNC", @@ -10544,8 +10645,6 @@ sub warnUnsupportedFunctions { "CUDA_ERROR_CDP_NOT_SUPPORTED", "CUDA_EGL_MAX_PLANES", "CUDA_CONDITIONAL_NODE_PARAMS", - "CUDA_CHILD_GRAPH_NODE_PARAMS_st", - "CUDA_CHILD_GRAPH_NODE_PARAMS", "CUDA_CB", "CUDA_BATCH_MEM_OP_NODE_PARAMS_v2_st", "CUDA_BATCH_MEM_OP_NODE_PARAMS_v2", diff --git a/docs/hipify-clang.md b/docs/hipify-clang.md index 6c592b77..09e6ae86 100644 --- a/docs/hipify-clang.md +++ b/docs/hipify-clang.md @@ -426,7 +426,7 @@ CMake 3.16.8, GNU C/C++ 9.2, Python 2.7. Recommended build system requirements: -CMake 3.28.1, GNU C/C++ 13.2, Python 3.11.6. +CMake 3.28.3, GNU C/C++ 13.2, Python 3.12.2. 
Here is an example of building `hipify-clang` with testing support on `Ubuntu 23.10.01`: @@ -470,7 +470,7 @@ cmake -- - Binary path : /usr/llvm/17.0.6/dist/bin -- Linker detection: GNU ld -- ---- The below configuring for hipify-clang testing only ---- --- Found Python: /usr/bin/python3.11 (found version "3.11.6") found components: Interpreter +-- Found Python: /usr/bin/python3.12 (found version "3.12.2") found components: Interpreter -- Found lit: /usr/local/bin/lit -- Found FileCheck: /GIT/LLVM/trunk/dist/FileCheck -- Initial CUDA to configure: @@ -506,7 +506,7 @@ LLVM 17.0.6 - will be used for testing x86_64 - Platform architecture Linux 6.5.0-15-generic - Platform OS 64 - hipify-clang binary bitness -64 - python 3.11.6 binary bitness +64 - python 3.12.2 binary bitness =============================================================== -- Testing: 102 tests, 12 threads -- Testing Time: 6.70s @@ -532,8 +532,8 @@ Total Discovered Tests: 102 | 14.0.0 - 14.0.6 | 7.0 - 11.7.1 | 8.0.5 - 8.4.1 | 2017.15.9.57*, 2019.16.11.17, 2022.17.2.6 | 3.24.0 | 3.10.6 | | 15.0.0 - 15.0.7 | 7.0 - 11.8.0 | 8.0.5 - 8.8.1 | 2019.16.11.25, 2022.17.5.2 | 3.26.0 | 3.11.2 | | 16.0.0 - 16.0.6 | 7.0 - 12.2.2 | 8.0.5 - 8.9.5 | 2019.16.11.29, 2022.17.7.1 | 3.27.3 | 3.11.4 | -| 17.0.1** 17.0.6 | 7.0 - 12.3.2 | 8.0.5 - 8.9.7 | 2019.16.11.32, 2022.17.8.3 | 3.28.1 | 3.12.1 | -| 19.0.0git | 7.0 - 12.3.2 | 8.0.5 - 8.9.7 | 2019.16.11.32, 2022.17.8.3 | 3.28.1 | 3.12.1 | +| 17.0.1** 17.0.6 | 7.0 - 12.3.2 | 8.0.5 - 8.9.7 | 2019.16.11.34, 2022.17.9.0 | 3.28.3 | 3.12.2 | +| 19.0.0git | 7.0 - 12.3.2 | 8.0.5 - 8.9.7 | 2019.16.11.34, 2022.17.9.0 | 3.28.3 | 3.12.2 | `*` LLVM 14.x.x is the latest major release supporting Visual Studio 2017. To build LLVM 14.x.x correctly by Visual Studio 2017, `-DLLVM_FORCE_USE_OLD_TOOLCHAIN=ON` should be added to a corresponding CMake command line. 
@@ -586,7 +586,7 @@ cmake -- - LLVM Include path : D:/LLVM/17.0.6/dist/include -- - Binary path : D:/LLVM/17.0.6/dist/bin -- ---- The below configuring for hipify-clang testing only ---- --- Found Python: C:/Users/TT/AppData/Local/Programs/Python/Python312/python.exe (found version "3.12.0") found components: Interpreter +-- Found Python: C:/Users/TT/AppData/Local/Programs/Python/Python312/python.exe (found version "3.12.2") found components: Interpreter -- Found lit: C:/Users/TT/AppData/Local/Programs/Python/Python312/Scripts/lit.exe -- Found FileCheck: D:/LLVM/17.0.6/dist/bin/FileCheck.exe -- Initial CUDA to configure: diff --git a/docs/sphinx/requirements.in b/docs/sphinx/requirements.in index 170ba424..6c61f389 100644 --- a/docs/sphinx/requirements.in +++ b/docs/sphinx/requirements.in @@ -1 +1 @@ -rocm-docs-core==0.34.0 +rocm-docs-core==0.34.2 diff --git a/docs/sphinx/requirements.txt b/docs/sphinx/requirements.txt index e5fec3f8..f0047768 100644 --- a/docs/sphinx/requirements.txt +++ b/docs/sphinx/requirements.txt @@ -26,7 +26,7 @@ charset-normalizer==3.1.0 # via requests click==8.1.3 # via sphinx-external-toc -cryptography==42.0.0 +cryptography==42.0.2 # via pyjwt deprecated==1.2.13 # via pygithub @@ -100,7 +100,7 @@ requests==2.31.0 # via # pygithub # sphinx -rocm-docs-core==0.34.0 +rocm-docs-core==0.34.2 # via -r requirements.in smmap==5.0.0 # via gitdb diff --git a/docs/supported_apis.md b/docs/supported_apis.md index 2817b5f8..038cb811 100644 --- a/docs/supported_apis.md +++ b/docs/supported_apis.md @@ -1,16 +1,18 @@ # Supported CUDA APIs -- [Runtime API](tables/CUDA_Runtime_API_functions_supported_by_HIP.md) -- [Driver API](tables/CUDA_Driver_API_functions_supported_by_HIP.md) -- [cuComplex API](tables/cuComplex_API_supported_by_HIP.md) -- [Device API](tables/CUDA_Device_API_supported_by_HIP.md) -- [RTC API](tables/CUDA_RTC_API_supported_by_HIP.md) -- [cuBLAS](tables/CUBLAS_API_supported_by_HIP.md) -- [cuRAND](tables/CURAND_API_supported_by_HIP.md) -- 
[cuDNN](tables/CUDNN_API_supported_by_HIP.md) -- [cuFFT](tables/CUFFT_API_supported_by_HIP.md) -- [cuSPARSE](tables/CUSPARSE_API_supported_by_HIP.md) -- [cuSOLVER](tables/CUSOLVER_API_supported_by_HIP.md) -- [CUB](tables/CUB_API_supported_by_HIP.md) +| **CUDA** | **HIP** | **ROC** | **HIP & ROC** | +|:----------------|:---------------------------------------------------------------------|:---------------|:----------------------------| +| Runtime API | [HIP API](tables/CUDA_Runtime_API_functions_supported_by_HIP.md) | | | +| Driver API | [HIP API](tables/CUDA_Driver_API_functions_supported_by_HIP.md) | | | +| Complex API | [HIP API](tables/cuComplex_API_supported_by_HIP.md) | | | +| Device API | [HIP Device API](tables/CUDA_Device_API_supported_by_HIP.md) | | | +| RTC API | [HIP RTC API](tables/CUDA_RTC_API_supported_by_HIP.md) | | | +| BLAS API | [HIP BLAS API](tables/CUBLAS_API_supported_by_HIP.md) | [ROC BLAS API](tables/CUBLAS_API_supported_by_ROC.md) | [HIP + ROC BLAS API](tables/CUBLAS_API_supported_by_HIP_and_ROC.md) | +| SPARSE API | [HIP SPARSE API](tables/CUSPARSE_API_supported_by_HIP.md) | [ROC SPARSE API](tables/CUSPARSE_API_supported_by_ROC.md) | [HIP + ROC SPARSE API](tables/CUSPARSE_API_supported_by_HIP_and_ROC.md) | +| SOLVER API | [HIP SOLVER API](tables/CUSOLVER_API_supported_by_HIP.md) | | | +| RAND API | [HIP RAND API](tables/CURAND_API_supported_by_HIP.md) | | | +| FFT API | [HIP FFT API](tables/CUFFT_API_supported_by_HIP.md) | | | +| DNN API | [HIP DNN API](tables/CUDNN_API_supported_by_HIP.md) | | | +| CUB API | [HIP CUB API](tables/CUB_API_supported_by_HIP.md) | | | To generate the above documentation with the actual information about all supported CUDA APIs in Markdown format, run `hipify-clang --md` with or without specifying the output directory (`-o`). 
diff --git a/docs/tables/CUDA_Driver_API_functions_supported_by_HIP.md b/docs/tables/CUDA_Driver_API_functions_supported_by_HIP.md index 0ee31983..708f7862 100644 --- a/docs/tables/CUDA_Driver_API_functions_supported_by_HIP.md +++ b/docs/tables/CUDA_Driver_API_functions_supported_by_HIP.md @@ -34,8 +34,8 @@ |`CUDA_BATCH_MEM_OP_NODE_PARAMS_v2`|12.2| | | | | | | | | | |`CUDA_BATCH_MEM_OP_NODE_PARAMS_v2_st`|12.2| | | | | | | | | | |`CUDA_CB`| | | | | | | | | | | -|`CUDA_CHILD_GRAPH_NODE_PARAMS`|12.2| | | | | | | | | | -|`CUDA_CHILD_GRAPH_NODE_PARAMS_st`|12.2| | | | | | | | | | +|`CUDA_CHILD_GRAPH_NODE_PARAMS`|12.2| | | |`hipChildGraphNodeParams`|6.1.0| | | |6.1.0| +|`CUDA_CHILD_GRAPH_NODE_PARAMS_st`|12.2| | | |`hipChildGraphNodeParams`|6.1.0| | | |6.1.0| |`CUDA_CONDITIONAL_NODE_PARAMS`|12.3| | | | | | | | | | |`CUDA_COOPERATIVE_LAUNCH_MULTI_DEVICE_NO_POST_LAUNCH_SYNC`|9.0| | | |`hipCooperativeLaunchMultiDeviceNoPostSync`|3.2.0| | | | | |`CUDA_COOPERATIVE_LAUNCH_MULTI_DEVICE_NO_PRE_LAUNCH_SYNC`|9.0| | | |`hipCooperativeLaunchMultiDeviceNoPreSync`|3.2.0| | | | | @@ -132,10 +132,10 @@ |`CUDA_ERROR_UNSUPPORTED_EXEC_AFFINITY`|11.4| | | | | | | | | | |`CUDA_ERROR_UNSUPPORTED_LIMIT`| | | | |`hipErrorUnsupportedLimit`|1.6.0| | | | | |`CUDA_ERROR_UNSUPPORTED_PTX_VERSION`|11.1| | | | | | | | | | -|`CUDA_EVENT_RECORD_NODE_PARAMS`|12.2| | | | | | | | | | -|`CUDA_EVENT_RECORD_NODE_PARAMS_st`|12.2| | | | | | | | | | -|`CUDA_EVENT_WAIT_NODE_PARAMS`|12.2| | | | | | | | | | -|`CUDA_EVENT_WAIT_NODE_PARAMS_st`|12.2| | | | | | | | | | +|`CUDA_EVENT_RECORD_NODE_PARAMS`|12.2| | | |`hipEventRecordNodeParams`|6.1.0| | | |6.1.0| +|`CUDA_EVENT_RECORD_NODE_PARAMS_st`|12.2| | | |`hipEventRecordNodeParams`|6.1.0| | | |6.1.0| +|`CUDA_EVENT_WAIT_NODE_PARAMS`|12.2| | | |`hipEventWaitNodeParams`|6.1.0| | | |6.1.0| +|`CUDA_EVENT_WAIT_NODE_PARAMS_st`|12.2| | | |`hipEventWaitNodeParams`|6.1.0| | | |6.1.0| |`CUDA_EXTERNAL_MEMORY_BUFFER_DESC`|10.0| | | |`hipExternalMemoryBufferDesc`|4.3.0| | | | | 
|`CUDA_EXTERNAL_MEMORY_BUFFER_DESC_st`|10.0| | | |`hipExternalMemoryBufferDesc_st`|4.3.0| | | | | |`CUDA_EXTERNAL_MEMORY_BUFFER_DESC_v1`|11.3| | | |`hipExternalMemoryBufferDesc`|4.3.0| | | | | @@ -167,17 +167,17 @@ |`CUDA_EXT_SEM_WAIT_NODE_PARAMS_v1`|11.3| | | |`hipExternalSemaphoreWaitNodeParams`|6.0.0| | | | | |`CUDA_EXT_SEM_WAIT_NODE_PARAMS_v2`|12.2| | | |`hipExternalSemaphoreWaitNodeParams`|6.0.0| | | | | |`CUDA_EXT_SEM_WAIT_NODE_PARAMS_v2_st`|12.2| | | |`hipExternalSemaphoreWaitNodeParams`|6.0.0| | | | | -|`CUDA_GRAPH_INSTANTIATE_ERROR`|12.0| | | | | | | | | | +|`CUDA_GRAPH_INSTANTIATE_ERROR`|12.0| | | |`hipGraphInstantiateError`|6.1.0| | | |6.1.0| |`CUDA_GRAPH_INSTANTIATE_FLAG_AUTO_FREE_ON_LAUNCH`|11.4| | | |`hipGraphInstantiateFlagAutoFreeOnLaunch`|5.2.0| | | | | |`CUDA_GRAPH_INSTANTIATE_FLAG_DEVICE_LAUNCH`|12.0| | | |`hipGraphInstantiateFlagDeviceLaunch`|5.6.0| | | | | |`CUDA_GRAPH_INSTANTIATE_FLAG_UPLOAD`|12.0| | | |`hipGraphInstantiateFlagUpload`|5.6.0| | | | | |`CUDA_GRAPH_INSTANTIATE_FLAG_USE_NODE_PRIORITY`|11.7| | | |`hipGraphInstantiateFlagUseNodePriority`|5.6.0| | | | | -|`CUDA_GRAPH_INSTANTIATE_INVALID_STRUCTURE`|12.0| | | | | | | | | | -|`CUDA_GRAPH_INSTANTIATE_MULTIPLE_CTXS_NOT_SUPPORTED`|12.0| | | | | | | | | | -|`CUDA_GRAPH_INSTANTIATE_NODE_OPERATION_NOT_SUPPORTED`|12.0| | | | | | | | | | -|`CUDA_GRAPH_INSTANTIATE_PARAMS`|12.0| | | | | | | | | | -|`CUDA_GRAPH_INSTANTIATE_PARAMS_st`|12.0| | | | | | | | | | -|`CUDA_GRAPH_INSTANTIATE_SUCCESS`|12.0| | | | | | | | | | +|`CUDA_GRAPH_INSTANTIATE_INVALID_STRUCTURE`|12.0| | | |`hipGraphInstantiateInvalidStructure`|6.1.0| | | |6.1.0| +|`CUDA_GRAPH_INSTANTIATE_MULTIPLE_CTXS_NOT_SUPPORTED`|12.0| | | |`hipGraphInstantiateMultipleDevicesNotSupported`|6.1.0| | | |6.1.0| +|`CUDA_GRAPH_INSTANTIATE_NODE_OPERATION_NOT_SUPPORTED`|12.0| | | |`hipGraphInstantiateNodeOperationNotSupported`|6.1.0| | | |6.1.0| +|`CUDA_GRAPH_INSTANTIATE_PARAMS`|12.0| | | |`hipGraphInstantiateParams`|6.1.0| | | |6.1.0| 
+|`CUDA_GRAPH_INSTANTIATE_PARAMS_st`|12.0| | | |`hipGraphInstantiateParams`|6.1.0| | | |6.1.0| +|`CUDA_GRAPH_INSTANTIATE_SUCCESS`|12.0| | | |`hipGraphInstantiateSuccess`|6.1.0| | | |6.1.0| |`CUDA_HOST_NODE_PARAMS`|10.0| | | |`hipHostNodeParams`|4.3.0| | | | | |`CUDA_HOST_NODE_PARAMS_st`|10.0| | | |`hipHostNodeParams`|4.3.0| | | | | |`CUDA_HOST_NODE_PARAMS_v1`|11.3| | | |`hipHostNodeParams`|4.3.0| | | | | @@ -206,8 +206,8 @@ |`CUDA_MEMCPY3D_v1`| | | | |`HIP_MEMCPY3D`|3.2.0| | | | | |`CUDA_MEMCPY3D_v1_st`| | | | |`HIP_MEMCPY3D`|3.2.0| | | | | |`CUDA_MEMCPY3D_v2`|11.3| | | |`HIP_MEMCPY3D`|3.2.0| | | | | -|`CUDA_MEMCPY_NODE_PARAMS`|12.2| | | | | | | | | | -|`CUDA_MEMCPY_NODE_PARAMS_st`|12.2| | | | | | | | | | +|`CUDA_MEMCPY_NODE_PARAMS`|12.2| | | |`hipMemcpyNodeParams`|6.1.0| | | |6.1.0| +|`CUDA_MEMCPY_NODE_PARAMS_st`|12.2| | | |`hipMemcpyNodeParams`|6.1.0| | | |6.1.0| |`CUDA_MEMSET_NODE_PARAMS`|10.0| | | |`hipMemsetParams`|4.3.0| | | | | |`CUDA_MEMSET_NODE_PARAMS_st`|10.0| | | |`hipMemsetParams`|4.3.0| | | | | |`CUDA_MEMSET_NODE_PARAMS_v1`|11.3| | | |`hipMemsetParams`|4.3.0| | | | | @@ -219,8 +219,8 @@ |`CUDA_MEM_ALLOC_NODE_PARAMS_v1_st`|12.2| | | |`hipMemAllocNodeParams`|5.5.0| | | | | |`CUDA_MEM_ALLOC_NODE_PARAMS_v2`|12.2| | | | | | | | | | |`CUDA_MEM_ALLOC_NODE_PARAMS_v2_st`|12.2| | | | | | | | | | -|`CUDA_MEM_FREE_NODE_PARAMS`|12.2| | | | | | | | | | -|`CUDA_MEM_FREE_NODE_PARAMS_st`|12.2| | | | | | | | | | +|`CUDA_MEM_FREE_NODE_PARAMS`|12.2| | | |`hipMemFreeNodeParams`|6.1.0| | | |6.1.0| +|`CUDA_MEM_FREE_NODE_PARAMS_st`|12.2| | | |`hipMemFreeNodeParams`|6.1.0| | | |6.1.0| |`CUDA_NVSCISYNC_ATTR_SIGNAL`|10.2| | | | | | | | | | |`CUDA_NVSCISYNC_ATTR_WAIT`|10.2| | | | | | | | | | |`CUDA_POINTER_ATTRIBUTE_ACCESS_FLAGS`|11.1| | | | | | | | | | @@ -242,8 +242,8 @@ |`CUGLDeviceList_enum`| | | | |`hipGLDeviceList`|4.4.0| | | | | |`CUGLmap_flags`| | | | | | | | | | | |`CUGLmap_flags_enum`| | | | | | | | | | | -|`CUGPUDirectRDMAWritesOrdering`|11.3| | | | | | | | | | 
-|`CUGPUDirectRDMAWritesOrdering_enum`|11.3| | | | | | | | | | +|`CUGPUDirectRDMAWritesOrdering`|11.3| | | |`hipGPUDirectRDMAWritesOrdering`|6.1.0| | | |6.1.0| +|`CUGPUDirectRDMAWritesOrdering_enum`|11.3| | | |`hipGPUDirectRDMAWritesOrdering`|6.1.0| | | |6.1.0| |`CU_ACCESS_PROPERTY_NORMAL`|11.0| | | |`hipAccessPropertyNormal`|5.2.0| | | | | |`CU_ACCESS_PROPERTY_PERSISTING`|11.0| | | |`hipAccessPropertyPersisting`|5.2.0| | | | | |`CU_ACCESS_PROPERTY_STREAMING`|11.0| | | |`hipAccessPropertyStreaming`|5.2.0| | | | | @@ -600,8 +600,8 @@ |`CU_EXTERNAL_SEMAPHORE_HANDLE_TYPE_OPAQUE_WIN32_KMT`|10.0| | | |`hipExternalSemaphoreHandleTypeOpaqueWin32Kmt`|4.4.0| | | | | |`CU_EXTERNAL_SEMAPHORE_HANDLE_TYPE_TIMELINE_SEMAPHORE_FD`|11.2| | | | | | | | | | |`CU_EXTERNAL_SEMAPHORE_HANDLE_TYPE_TIMELINE_SEMAPHORE_WIN32`|11.2| | | | | | | | | | -|`CU_FLUSH_GPU_DIRECT_RDMA_WRITES_OPTION_HOST`|11.3| | | | | | | | | | -|`CU_FLUSH_GPU_DIRECT_RDMA_WRITES_OPTION_MEMOPS`|11.3| | | | | | | | | | +|`CU_FLUSH_GPU_DIRECT_RDMA_WRITES_OPTION_HOST`|11.3| | | |`hipFlushGPUDirectRDMAWritesOptionHost`|6.1.0| | | |6.1.0| +|`CU_FLUSH_GPU_DIRECT_RDMA_WRITES_OPTION_MEMOPS`|11.3| | | |`hipFlushGPUDirectRDMAWritesOptionMemOps`|6.1.0| | | |6.1.0| |`CU_FLUSH_GPU_DIRECT_RDMA_WRITES_TARGET_CURRENT_CTX`|11.3| | | | | | | | | | |`CU_FLUSH_GPU_DIRECT_RDMA_WRITES_TO_ALL_DEVICES`|11.3| | | | | | | | | | |`CU_FLUSH_GPU_DIRECT_RDMA_WRITES_TO_OWNER`|11.3| | | | | | | | | | @@ -629,18 +629,18 @@ |`CU_GET_PROC_ADDRESS_DEFAULT`|11.3| | | | | | | | | | |`CU_GET_PROC_ADDRESS_LEGACY_STREAM`|11.3| | | | | | | | | | |`CU_GET_PROC_ADDRESS_PER_THREAD_DEFAULT_STREAM`|11.3| | | | | | | | | | -|`CU_GET_PROC_ADDRESS_SUCCESS`|12.0| | | | | | | | | | -|`CU_GET_PROC_ADDRESS_SYMBOL_NOT_FOUND`|12.0| | | | | | | | | | -|`CU_GET_PROC_ADDRESS_VERSION_NOT_SUFFICIENT`|12.0| | | | | | | | | | +|`CU_GET_PROC_ADDRESS_SUCCESS`|12.0| | | |`HIP_GET_PROC_ADDRESS_SUCCESS`|6.1.0| | | |6.1.0| +|`CU_GET_PROC_ADDRESS_SYMBOL_NOT_FOUND`|12.0| | | 
|`HIP_GET_PROC_ADDRESS_SYMBOL_NOT_FOUND`|6.1.0| | | |6.1.0| +|`CU_GET_PROC_ADDRESS_VERSION_NOT_SUFFICIENT`|12.0| | | |`HIP_GET_PROC_ADDRESS_VERSION_NOT_SUFFICIENT`|6.1.0| | | |6.1.0| |`CU_GL_DEVICE_LIST_ALL`| | | | |`hipGLDeviceListAll`|4.4.0| | | | | |`CU_GL_DEVICE_LIST_CURRENT_FRAME`| | | | |`hipGLDeviceListCurrentFrame`|4.4.0| | | | | |`CU_GL_DEVICE_LIST_NEXT_FRAME`| | | | |`hipGLDeviceListNextFrame`|4.4.0| | | | | |`CU_GL_MAP_RESOURCE_FLAGS_NONE`| | | | | | | | | | | |`CU_GL_MAP_RESOURCE_FLAGS_READ_ONLY`| | | | | | | | | | | |`CU_GL_MAP_RESOURCE_FLAGS_WRITE_DISCARD`| | | | | | | | | | | -|`CU_GPU_DIRECT_RDMA_WRITES_ORDERING_ALL_DEVICES`|11.3| | | | | | | | | | -|`CU_GPU_DIRECT_RDMA_WRITES_ORDERING_NONE`|11.3| | | | | | | | | | -|`CU_GPU_DIRECT_RDMA_WRITES_ORDERING_OWNER`|11.3| | | | | | | | | | +|`CU_GPU_DIRECT_RDMA_WRITES_ORDERING_ALL_DEVICES`|11.3| | | |`hipGPUDirectRDMAWritesOrderingAllDevices`|6.1.0| | | |6.1.0| +|`CU_GPU_DIRECT_RDMA_WRITES_ORDERING_NONE`|11.3| | | |`hipGPUDirectRDMAWritesOrderingNone`|6.1.0| | | |6.1.0| +|`CU_GPU_DIRECT_RDMA_WRITES_ORDERING_OWNER`|11.3| | | |`hipGPUDirectRDMAWritesOrderingOwner`|6.1.0| | | |6.1.0| |`CU_GRAPHICS_MAP_RESOURCE_FLAGS_NONE`| | | | | | | | | | | |`CU_GRAPHICS_MAP_RESOURCE_FLAGS_READ_ONLY`| | | | | | | | | | | |`CU_GRAPHICS_MAP_RESOURCE_FLAGS_WRITE_DISCARD`| | | | | | | | | | | @@ -1083,8 +1083,8 @@ |`CUdevprop`| | | | | | | | | | | |`CUdevprop_st`| | | | | | | | | | | |`CUdevprop_v1`|11.3| | | | | | | | | | -|`CUdriverProcAddressQueryResult`|12.0| | | | | | | | | | -|`CUdriverProcAddressQueryResult_enum`|12.0| | | | | | | | | | +|`CUdriverProcAddressQueryResult`|12.0| | | |`hipDriverProcAddressQueryResult`|6.1.0| | | |6.1.0| +|`CUdriverProcAddressQueryResult_enum`|12.0| | | |`hipDriverProcAddressQueryResult`|6.1.0| | | |6.1.0| |`CUdriverProcAddress_flags`|11.3| | | | | | | | | | |`CUdriverProcAddress_flags_enum`|11.3| | | | | | | | | | |`CUeglColorFormat`|9.0| | | | | | | | | | @@ -1123,8 +1123,8 @@ 
|`CUexternalSemaphoreHandleType_enum`|10.0| | | |`hipExternalSemaphoreHandleType_enum`|4.4.0| | | | | |`CUfilter_mode`| | | | |`HIPfilter_mode`|3.5.0| | | | | |`CUfilter_mode_enum`| | | | |`HIPfilter_mode_enum`|3.5.0| | | | | -|`CUflushGPUDirectRDMAWritesOptions`|11.3| | | | | | | | | | -|`CUflushGPUDirectRDMAWritesOptions_enum`|11.3| | | | | | | | | | +|`CUflushGPUDirectRDMAWritesOptions`|11.3| | | |`hipFlushGPUDirectRDMAWritesOptions`|6.1.0| | | |6.1.0| +|`CUflushGPUDirectRDMAWritesOptions_enum`|11.3| | | |`hipFlushGPUDirectRDMAWritesOptions`|6.1.0| | | |6.1.0| |`CUflushGPUDirectRDMAWritesScope`|11.3| | | | | | | | | | |`CUflushGPUDirectRDMAWritesScope_enum`|11.3| | | | | | | | | | |`CUflushGPUDirectRDMAWritesTarget`|11.3| | | | | | | | | | @@ -1152,15 +1152,15 @@ |`CUgraphExecUpdateResultInfo_v1`|12.0| | | | | | | | | | |`CUgraphExecUpdateResult_enum`|10.2| | | |`hipGraphExecUpdateResult`|4.3.0| | | | | |`CUgraphExec_st`|10.0| | | |`hipGraphExec`|4.3.0| | | | | -|`CUgraphInstantiateResult`|12.0| | | | | | | | | | -|`CUgraphInstantiateResult_enum`|12.0| | | | | | | | | | +|`CUgraphInstantiateResult`|12.0| | | |`hipGraphInstantiateResult`|6.1.0| | | |6.1.0| +|`CUgraphInstantiateResult_enum`|12.0| | | |`hipGraphInstantiateResult`|6.1.0| | | |6.1.0| |`CUgraphInstantiate_flags`|11.4| | | |`hipGraphInstantiateFlags`|5.2.0| | | | | |`CUgraphInstantiate_flags_enum`|11.4| | | |`hipGraphInstantiateFlags`|5.2.0| | | | | |`CUgraphMem_attribute`|11.4| | | |`hipGraphMemAttributeType`|5.3.0| | | | | |`CUgraphMem_attribute_enum`|11.4| | | |`hipGraphMemAttributeType`|5.3.0| | | | | |`CUgraphNode`|10.0| | | |`hipGraphNode_t`|4.3.0| | | | | -|`CUgraphNodeParams`|12.2| | | | | | | | | | -|`CUgraphNodeParams_st`|12.2| | | | | | | | | | +|`CUgraphNodeParams`|12.2| | | |`hipGraphNodeParams`|6.1.0| | | |6.1.0| +|`CUgraphNodeParams_st`|12.2| | | |`hipGraphNodeParams`|6.1.0| | | |6.1.0| |`CUgraphNodeType`|10.0| | | |`hipGraphNodeType`|4.3.0| | | | | |`CUgraphNodeType_enum`|10.0| | | 
|`hipGraphNodeType`|4.3.0| | | | | |`CUgraphNode_st`|10.0| | | |`hipGraphNode`|4.3.0| | | | | @@ -1805,15 +1805,15 @@ |`cuGraphAddEmptyNode`|10.0| | | |`hipGraphAddEmptyNode`|4.5.0| | | | | |`cuGraphAddEventRecordNode`|11.1| | | |`hipGraphAddEventRecordNode`|5.0.0| | | | | |`cuGraphAddEventWaitNode`|11.1| | | |`hipGraphAddEventWaitNode`|5.0.0| | | | | -|`cuGraphAddExternalSemaphoresSignalNode`|11.2| | | |`hipGraphAddExternalSemaphoresSignalNode`|6.0.0| | | | | -|`cuGraphAddExternalSemaphoresWaitNode`|11.2| | | |`hipGraphAddExternalSemaphoresWaitNode`|6.0.0| | | | | +|`cuGraphAddExternalSemaphoresSignalNode`|11.2| | | |`hipGraphAddExternalSemaphoresSignalNode`|6.1.0| | | |6.1.0| +|`cuGraphAddExternalSemaphoresWaitNode`|11.2| | | |`hipGraphAddExternalSemaphoresWaitNode`|6.1.0| | | |6.1.0| |`cuGraphAddHostNode`|10.0| | | |`hipGraphAddHostNode`|5.0.0| | | | | |`cuGraphAddKernelNode`|10.0| | | |`hipGraphAddKernelNode`|4.3.0| | | | | |`cuGraphAddMemAllocNode`|11.4| | | |`hipGraphAddMemAllocNode`|5.5.0| | | | | -|`cuGraphAddMemFreeNode`|11.4| | | |`hipGraphAddMemFreeNode`|5.5.0| | | | | +|`cuGraphAddMemFreeNode`|11.4| | | |`hipDrvGraphAddMemFreeNode`|6.1.0| | | |6.1.0| |`cuGraphAddMemcpyNode`|10.0| | | |`hipDrvGraphAddMemcpyNode`|6.0.0| | | | | -|`cuGraphAddMemsetNode`|10.0| | | |`hipGraphAddMemsetNode`|4.3.0| | | | | -|`cuGraphAddNode`|12.2| | | |`hipGraphAddNode`| | | | | | +|`cuGraphAddMemsetNode`|10.0| | | |`hipDrvGraphAddMemsetNode`|6.1.0| | | |6.1.0| +|`cuGraphAddNode`|12.2| | | |`hipGraphAddNode`|6.1.0| | | |6.1.0| |`cuGraphAddNode_v2`|12.3| | | | | | | | | | |`cuGraphBatchMemOpNodeGetParams`|11.7| | | |`hipGraphBatchMemOpNodeGetParams`| | | | | | |`cuGraphBatchMemOpNodeSetParams`|11.7| | | |`hipGraphBatchMemOpNodeSetParams`| | | | | | @@ -1833,19 +1833,19 @@ |`cuGraphExecDestroy`|10.0| | | |`hipGraphExecDestroy`|4.3.0| | | | | |`cuGraphExecEventRecordNodeSetEvent`|11.1| | | |`hipGraphExecEventRecordNodeSetEvent`|5.0.0| | | | | 
|`cuGraphExecEventWaitNodeSetEvent`|11.1| | | |`hipGraphExecEventWaitNodeSetEvent`|5.0.0| | | | | -|`cuGraphExecExternalSemaphoresSignalNodeSetParams`|11.2| | | |`hipGraphExecExternalSemaphoresSignalNodeSetParams`|6.0.0| | | | | -|`cuGraphExecExternalSemaphoresWaitNodeSetParams`|11.2| | | |`hipGraphExecExternalSemaphoresWaitNodeSetParams`|6.0.0| | | | | -|`cuGraphExecGetFlags`|12.0| | | |`hipGraphExecGetFlags`| | | | | | +|`cuGraphExecExternalSemaphoresSignalNodeSetParams`|11.2| | | |`hipGraphExecExternalSemaphoresSignalNodeSetParams`|6.1.0| | | |6.1.0| +|`cuGraphExecExternalSemaphoresWaitNodeSetParams`|11.2| | | |`hipGraphExecExternalSemaphoresWaitNodeSetParams`|6.1.0| | | |6.1.0| +|`cuGraphExecGetFlags`|12.0| | | |`hipGraphExecGetFlags`|6.1.0| | | |6.1.0| |`cuGraphExecHostNodeSetParams`|10.2| | | |`hipGraphExecHostNodeSetParams`|5.0.0| | | | | |`cuGraphExecKernelNodeSetParams`|10.1| | | |`hipGraphExecKernelNodeSetParams`|4.5.0| | | | | -|`cuGraphExecMemcpyNodeSetParams`|10.2| | | | | | | | | | -|`cuGraphExecMemsetNodeSetParams`|10.2| | | | | | | | | | -|`cuGraphExecNodeSetParams`|12.2| | | |`hipGraphExecNodeSetParams`| | | | | | +|`cuGraphExecMemcpyNodeSetParams`|10.2| | | |`hipDrvGraphExecMemcpyNodeSetParams`|6.1.0| | | |6.1.0| +|`cuGraphExecMemsetNodeSetParams`|10.2| | | |`hipDrvGraphExecMemsetNodeSetParams`|6.1.0| | | |6.1.0| +|`cuGraphExecNodeSetParams`|12.2| | | |`hipGraphExecNodeSetParams`|6.1.0| | | |6.1.0| |`cuGraphExecUpdate`|10.2| | | |`hipGraphExecUpdate`|5.0.0| | | | | -|`cuGraphExternalSemaphoresSignalNodeGetParams`|11.2| | | |`hipGraphExternalSemaphoresSignalNodeGetParams`|6.0.0| | | | | -|`cuGraphExternalSemaphoresSignalNodeSetParams`|11.2| | | |`hipGraphExternalSemaphoresSignalNodeSetParams`|6.0.0| | | | | -|`cuGraphExternalSemaphoresWaitNodeGetParams`|11.2| | | |`hipGraphExternalSemaphoresWaitNodeGetParams`|6.0.0| | | | | -|`cuGraphExternalSemaphoresWaitNodeSetParams`|11.2| | | |`hipGraphExternalSemaphoresWaitNodeSetParams`|6.0.0| | | | | 
+|`cuGraphExternalSemaphoresSignalNodeGetParams`|11.2| | | |`hipGraphExternalSemaphoresSignalNodeGetParams`|6.1.0| | | |6.1.0| +|`cuGraphExternalSemaphoresSignalNodeSetParams`|11.2| | | |`hipGraphExternalSemaphoresSignalNodeSetParams`|6.1.0| | | |6.1.0| +|`cuGraphExternalSemaphoresWaitNodeGetParams`|11.2| | | |`hipGraphExternalSemaphoresWaitNodeGetParams`|6.1.0| | | |6.1.0| +|`cuGraphExternalSemaphoresWaitNodeSetParams`|11.2| | | |`hipGraphExternalSemaphoresWaitNodeSetParams`|6.1.0| | | |6.1.0| |`cuGraphGetEdges`|10.0| | | |`hipGraphGetEdges`|5.0.0| | | | | |`cuGraphGetEdges_v2`|12.3| | | | | | | | | | |`cuGraphGetNodes`|10.0| | | |`hipGraphGetNodes`|4.5.0| | | | | @@ -1854,7 +1854,7 @@ |`cuGraphHostNodeSetParams`|10.0| | | |`hipGraphHostNodeSetParams`|5.0.0| | | | | |`cuGraphInstantiate`|10.0| | | |`hipGraphInstantiate`|4.3.0| | | | | |`cuGraphInstantiateWithFlags`|11.4| | | |`hipGraphInstantiateWithFlags`|5.0.0| | | | | -|`cuGraphInstantiateWithParams`|12.0| | | |`hipGraphInstantiateWithParams`| | | | | | +|`cuGraphInstantiateWithParams`|12.0| | | |`hipGraphInstantiateWithParams`|6.1.0| | | |6.1.0| |`cuGraphInstantiate_v2`|11.0| | | |`hipGraphInstantiate`|4.3.0| | | | | |`cuGraphKernelNodeCopyAttributes`|11.0| | | |`hipGraphKernelNodeCopyAttributes`|5.5.0| | | | | |`cuGraphKernelNodeGetAttribute`|11.0| | | |`hipGraphKernelNodeGetAttribute`|5.2.0| | | | | @@ -1864,8 +1864,8 @@ |`cuGraphLaunch`|10.0| | | |`hipGraphLaunch`|4.3.0| | | | | |`cuGraphMemAllocNodeGetParams`|11.4| | | |`hipGraphMemAllocNodeGetParams`|5.5.0| | | | | |`cuGraphMemFreeNodeGetParams`|11.4| | | |`hipGraphMemFreeNodeGetParams`|5.5.0| | | | | -|`cuGraphMemcpyNodeGetParams`|10.0| | | |`hipGraphMemcpyNodeGetParams`|4.5.0| | | | | -|`cuGraphMemcpyNodeSetParams`|10.0| | | |`hipGraphMemcpyNodeSetParams`|4.5.0| | | | | +|`cuGraphMemcpyNodeGetParams`|10.0| | | |`hipDrvGraphMemcpyNodeGetParams`|6.1.0| | | |6.1.0| +|`cuGraphMemcpyNodeSetParams`|10.0| | | |`hipDrvGraphMemcpyNodeSetParams`|6.1.0| | | 
|6.1.0| |`cuGraphMemsetNodeGetParams`|10.0| | | |`hipGraphMemsetNodeGetParams`|4.5.0| | | | | |`cuGraphMemsetNodeSetParams`|10.0| | | |`hipGraphMemsetNodeSetParams`|4.5.0| | | | | |`cuGraphNodeFindInClone`|10.0| | | |`hipGraphNodeFindInClone`|5.0.0| | | | | @@ -1876,7 +1876,7 @@ |`cuGraphNodeGetEnabled`|11.6| | | |`hipGraphNodeGetEnabled`|5.5.0| | | | | |`cuGraphNodeGetType`|10.0| | | |`hipGraphNodeGetType`|5.0.0| | | | | |`cuGraphNodeSetEnabled`|11.6| | | |`hipGraphNodeSetEnabled`|5.5.0| | | | | -|`cuGraphNodeSetParams`|12.2| | | |`hipGraphNodeSetParams`| | | | | | +|`cuGraphNodeSetParams`|12.2| | | |`hipGraphNodeSetParams`|6.1.0| | | |6.1.0| |`cuGraphReleaseUserObject`|11.3| | | |`hipGraphReleaseUserObject`|5.3.0| | | | | |`cuGraphRemoveDependencies`|10.0| | | |`hipGraphRemoveDependencies`|5.0.0| | | | | |`cuGraphRemoveDependencies_v2`|12.3| | | | | | | | | | @@ -1994,7 +1994,7 @@ |**CUDA**|**A**|**D**|**C**|**R**|**HIP**|**A**|**D**|**C**|**R**|**E**| |:--|:-:|:-:|:-:|:-:|:--|:-:|:-:|:-:|:-:|:-:| -|`cuGetProcAddress`|11.3| | | | | | | | | | +|`cuGetProcAddress`|11.3| | | |`hipGetProcAddress`|6.1.0| | | |6.1.0| ## **34. 
Coredump Attributes Control API** diff --git a/docs/tables/CUDA_Runtime_API_functions_supported_by_HIP.md b/docs/tables/CUDA_Runtime_API_functions_supported_by_HIP.md index ea51b0b2..711617db 100644 --- a/docs/tables/CUDA_Runtime_API_functions_supported_by_HIP.md +++ b/docs/tables/CUDA_Runtime_API_functions_supported_by_HIP.md @@ -421,8 +421,8 @@ |`cudaGraphAddEmptyNode`|10.0| | | |`hipGraphAddEmptyNode`|4.5.0| | | | | |`cudaGraphAddEventRecordNode`|11.1| | | |`hipGraphAddEventRecordNode`|5.0.0| | | | | |`cudaGraphAddEventWaitNode`|11.1| | | |`hipGraphAddEventWaitNode`|5.0.0| | | | | -|`cudaGraphAddExternalSemaphoresSignalNode`|11.2| | | |`hipGraphAddExternalSemaphoresSignalNode`|6.0.0| | | | | -|`cudaGraphAddExternalSemaphoresWaitNode`|11.2| | | |`hipGraphAddExternalSemaphoresWaitNode`|6.0.0| | | | | +|`cudaGraphAddExternalSemaphoresSignalNode`|11.2| | | |`hipGraphAddExternalSemaphoresSignalNode`|6.1.0| | | |6.1.0| +|`cudaGraphAddExternalSemaphoresWaitNode`|11.2| | | |`hipGraphAddExternalSemaphoresWaitNode`|6.1.0| | | |6.1.0| |`cudaGraphAddHostNode`|10.0| | | |`hipGraphAddHostNode`|5.0.0| | | | | |`cudaGraphAddKernelNode`|10.0| | | |`hipGraphAddKernelNode`|4.3.0| | | | | |`cudaGraphAddMemAllocNode`|11.4| | | |`hipGraphAddMemAllocNode`|5.5.0| | | | | @@ -432,7 +432,7 @@ |`cudaGraphAddMemcpyNodeFromSymbol`|11.1| | | |`hipGraphAddMemcpyNodeFromSymbol`|5.0.0| | | | | |`cudaGraphAddMemcpyNodeToSymbol`|11.1| | | |`hipGraphAddMemcpyNodeToSymbol`|5.0.0| | | | | |`cudaGraphAddMemsetNode`|10.0| | | |`hipGraphAddMemsetNode`|4.3.0| | | | | -|`cudaGraphAddNode`|12.2| | | | | | | | | | +|`cudaGraphAddNode`|12.2| | | |`hipGraphAddNode`|6.1.0| | | |6.1.0| |`cudaGraphAddNode_v2`|12.3| | | | | | | | | | |`cudaGraphChildGraphNodeGetGraph`|10.0| | | |`hipGraphChildGraphNodeGetGraph`|5.0.0| | | | | |`cudaGraphClone`|10.0| | | |`hipGraphClone`|5.0.0| | | | | @@ -449,9 +449,9 @@ |`cudaGraphExecDestroy`|10.0| | | |`hipGraphExecDestroy`|4.3.0| | | | | 
|`cudaGraphExecEventRecordNodeSetEvent`|11.1| | | |`hipGraphExecEventRecordNodeSetEvent`|5.0.0| | | | | |`cudaGraphExecEventWaitNodeSetEvent`|11.1| | | |`hipGraphExecEventWaitNodeSetEvent`|5.0.0| | | | | -|`cudaGraphExecExternalSemaphoresSignalNodeSetParams`|11.2| | | |`hipGraphExecExternalSemaphoresSignalNodeSetParams`|6.0.0| | | | | -|`cudaGraphExecExternalSemaphoresWaitNodeSetParams`|11.2| | | |`hipGraphExecExternalSemaphoresWaitNodeSetParams`|6.0.0| | | | | -|`cudaGraphExecGetFlags`|12.0| | | | | | | | | | +|`cudaGraphExecExternalSemaphoresSignalNodeSetParams`|11.2| | | |`hipGraphExecExternalSemaphoresSignalNodeSetParams`|6.1.0| | | |6.1.0| +|`cudaGraphExecExternalSemaphoresWaitNodeSetParams`|11.2| | | |`hipGraphExecExternalSemaphoresWaitNodeSetParams`|6.1.0| | | |6.1.0| +|`cudaGraphExecGetFlags`|12.0| | | |`hipGraphExecGetFlags`|6.1.0| | | |6.1.0| |`cudaGraphExecHostNodeSetParams`|11.0| | | |`hipGraphExecHostNodeSetParams`|5.0.0| | | | | |`cudaGraphExecKernelNodeSetParams`|11.0| | | |`hipGraphExecKernelNodeSetParams`|4.5.0| | | | | |`cudaGraphExecMemcpyNodeSetParams`|11.0| | | |`hipGraphExecMemcpyNodeSetParams`|5.0.0| | | | | @@ -459,12 +459,12 @@ |`cudaGraphExecMemcpyNodeSetParamsFromSymbol`|11.1| | | |`hipGraphExecMemcpyNodeSetParamsFromSymbol`|5.0.0| | | | | |`cudaGraphExecMemcpyNodeSetParamsToSymbol`|11.1| | | |`hipGraphExecMemcpyNodeSetParamsToSymbol`|5.0.0| | | | | |`cudaGraphExecMemsetNodeSetParams`|11.0| | | |`hipGraphExecMemsetNodeSetParams`|5.0.0| | | | | -|`cudaGraphExecNodeSetParams`|12.2| | | | | | | | | | +|`cudaGraphExecNodeSetParams`|12.2| | | |`hipGraphExecNodeSetParams`|6.1.0| | | |6.1.0| |`cudaGraphExecUpdate`|11.0| | | |`hipGraphExecUpdate`|5.0.0| | | | | -|`cudaGraphExternalSemaphoresSignalNodeGetParams`|11.2| | | |`hipGraphExternalSemaphoresSignalNodeGetParams`|6.0.0| | | | | -|`cudaGraphExternalSemaphoresSignalNodeSetParams`|11.2| | | |`hipGraphExternalSemaphoresSignalNodeSetParams`|6.0.0| | | | | 
-|`cudaGraphExternalSemaphoresWaitNodeGetParams`|11.2| | | |`hipGraphExternalSemaphoresWaitNodeGetParams`|6.0.0| | | | | -|`cudaGraphExternalSemaphoresWaitNodeSetParams`|11.2| | | |`hipGraphExternalSemaphoresWaitNodeSetParams`|6.0.0| | | | | +|`cudaGraphExternalSemaphoresSignalNodeGetParams`|11.2| | | |`hipGraphExternalSemaphoresSignalNodeGetParams`|6.1.0| | | |6.1.0| +|`cudaGraphExternalSemaphoresSignalNodeSetParams`|11.2| | | |`hipGraphExternalSemaphoresSignalNodeSetParams`|6.1.0| | | |6.1.0| +|`cudaGraphExternalSemaphoresWaitNodeGetParams`|11.2| | | |`hipGraphExternalSemaphoresWaitNodeGetParams`|6.1.0| | | |6.1.0| +|`cudaGraphExternalSemaphoresWaitNodeSetParams`|11.2| | | |`hipGraphExternalSemaphoresWaitNodeSetParams`|6.1.0| | | |6.1.0| |`cudaGraphGetEdges`|10.0| | | |`hipGraphGetEdges`|5.0.0| | | | | |`cudaGraphGetEdges_v2`|12.3| | | | | | | | | | |`cudaGraphGetNodes`|10.0| | | |`hipGraphGetNodes`|4.5.0| | | | | @@ -473,7 +473,7 @@ |`cudaGraphHostNodeSetParams`|10.0| | | |`hipGraphHostNodeSetParams`|5.0.0| | | | | |`cudaGraphInstantiate`|10.0| | | |`hipGraphInstantiate`|4.3.0| | | | | |`cudaGraphInstantiateWithFlags`|11.4| | | |`hipGraphInstantiateWithFlags`|5.0.0| | | | | -|`cudaGraphInstantiateWithParams`|12.0| | | | | | | | | | +|`cudaGraphInstantiateWithParams`|12.0| | | |`hipGraphInstantiateWithParams`|6.1.0| | | |6.1.0| |`cudaGraphKernelNodeCopyAttributes`|11.0| | | |`hipGraphKernelNodeCopyAttributes`|5.5.0| | | | | |`cudaGraphKernelNodeGetAttribute`|11.0| | | |`hipGraphKernelNodeGetAttribute`|5.2.0| | | | | |`cudaGraphKernelNodeGetParams`|11.0| | | |`hipGraphKernelNodeGetParams`|4.5.0| | | | | @@ -497,7 +497,7 @@ |`cudaGraphNodeGetEnabled`|11.6| | | |`hipGraphNodeGetEnabled`|5.5.0| | | | | |`cudaGraphNodeGetType`|11.0| | | |`hipGraphNodeGetType`|5.0.0| | | | | |`cudaGraphNodeSetEnabled`|11.6| | | |`hipGraphNodeSetEnabled`|5.5.0| | | | | -|`cudaGraphNodeSetParams`|12.2| | | | | | | | | | +|`cudaGraphNodeSetParams`|12.2| | | |`hipGraphNodeSetParams`|6.1.0| 
| | |6.1.0| |`cudaGraphReleaseUserObject`|11.3| | | |`hipGraphReleaseUserObject`|5.3.0| | | | | |`cudaGraphRemoveDependencies`|11.0| | | |`hipGraphRemoveDependencies`|5.0.0| | | | | |`cudaGraphRemoveDependencies_v2`|12.3| | | | | | | | | | @@ -511,7 +511,7 @@ |**CUDA**|**A**|**D**|**C**|**R**|**HIP**|**A**|**D**|**C**|**R**|**E**| |:--|:-:|:-:|:-:|:-:|:--|:-:|:-:|:-:|:-:|:-:| -|`cudaGetDriverEntryPoint`|11.3| | | | | | | | | | +|`cudaGetDriverEntryPoint`|11.3| | | |`hipGetProcAddress`|6.1.0| | | |6.1.0| ## **30. C++ API Routines** @@ -612,7 +612,7 @@ |`cudaChannelFormatKindUnsignedNormalized8X1`|11.5| | | | | | | | | | |`cudaChannelFormatKindUnsignedNormalized8X2`|11.5| | | | | | | | | | |`cudaChannelFormatKindUnsignedNormalized8X4`|11.5| | | | | | | | | | -|`cudaChildGraphNodeParams`|12.2| | | | | | | | | | +|`cudaChildGraphNodeParams`|12.2| | | |`hipChildGraphNodeParams`|6.1.0| | | |6.1.0| |`cudaClusterSchedulingPolicy`|11.8| | | | | | | | | | |`cudaClusterSchedulingPolicyDefault`|11.8| | | | | | | | | | |`cudaClusterSchedulingPolicyLoadBalancing`|11.8| | | | | | | | | | @@ -1029,10 +1029,10 @@ |`cudaEventInterprocess`| | | | |`hipEventInterprocess`|1.6.0| | | | | |`cudaEventRecordDefault`|11.1| | | | | | | | | | |`cudaEventRecordExternal`|11.1| | | | | | | | | | -|`cudaEventRecordNodeParams`|12.2| | | | | | | | | | +|`cudaEventRecordNodeParams`|12.2| | | |`hipEventRecordNodeParams`|6.1.0| | | |6.1.0| |`cudaEventWaitDefault`|11.1| | | | | | | | | | |`cudaEventWaitExternal`| | | | | | | | | | | -|`cudaEventWaitNodeParams`|12.2| | | | | | | | | | +|`cudaEventWaitNodeParams`|12.2| | | |`hipEventWaitNodeParams`|6.1.0| | | |6.1.0| |`cudaEvent_t`| | | | |`hipEvent_t`|1.6.0| | | | | |`cudaExtent`| | | | |`hipExtent`|1.7.0| | | | | |`cudaExternalMemoryBufferDesc`|10.0| | | |`hipExternalMemoryBufferDesc`|4.3.0| | | | | @@ -1074,9 +1074,9 @@ |`cudaExternalSemaphore_t`|10.0| | | |`hipExternalSemaphore_t`|4.4.0| | | | | |`cudaFilterModeLinear`| | | | 
|`hipFilterModeLinear`|1.7.0| | | | | |`cudaFilterModePoint`| | | | |`hipFilterModePoint`|1.6.0| | | | | -|`cudaFlushGPUDirectRDMAWritesOptionHost`|11.3| | | | | | | | | | -|`cudaFlushGPUDirectRDMAWritesOptionMemOps`|11.3| | | | | | | | | | -|`cudaFlushGPUDirectRDMAWritesOptions`|11.3| | | | | | | | | | +|`cudaFlushGPUDirectRDMAWritesOptionHost`|11.3| | | |`hipFlushGPUDirectRDMAWritesOptionHost`|6.1.0| | | |6.1.0| +|`cudaFlushGPUDirectRDMAWritesOptionMemOps`|11.3| | | |`hipFlushGPUDirectRDMAWritesOptionMemOps`|6.1.0| | | |6.1.0| +|`cudaFlushGPUDirectRDMAWritesOptions`|11.3| | | |`hipFlushGPUDirectRDMAWritesOptions`|6.1.0| | | |6.1.0| |`cudaFlushGPUDirectRDMAWritesScope`|11.3| | | | | | | | | | |`cudaFlushGPUDirectRDMAWritesTarget`|11.3| | | | | | | | | | |`cudaFlushGPUDirectRDMAWritesTargetCurrentDevice`|11.3| | | | | | | | | | @@ -1109,10 +1109,10 @@ |`cudaGLMapFlagsNone`| | | | | | | | | | | |`cudaGLMapFlagsReadOnly`| | | | | | | | | | | |`cudaGLMapFlagsWriteDiscard`| | | | | | | | | | | -|`cudaGPUDirectRDMAWritesOrdering`|11.3| | | | | | | | | | -|`cudaGPUDirectRDMAWritesOrderingAllDevices`|11.3| | | | | | | | | | -|`cudaGPUDirectRDMAWritesOrderingNone`|11.3| | | | | | | | | | -|`cudaGPUDirectRDMAWritesOrderingOwner`|11.3| | | | | | | | | | +|`cudaGPUDirectRDMAWritesOrdering`|11.3| | | |`hipGPUDirectRDMAWritesOrdering`|6.1.0| | | |6.1.0| +|`cudaGPUDirectRDMAWritesOrderingAllDevices`|11.3| | | |`hipGPUDirectRDMAWritesOrderingAllDevices`|6.1.0| | | |6.1.0| +|`cudaGPUDirectRDMAWritesOrderingNone`|11.3| | | |`hipGPUDirectRDMAWritesOrderingNone`|6.1.0| | | |6.1.0| +|`cudaGPUDirectRDMAWritesOrderingOwner`|11.3| | | |`hipGPUDirectRDMAWritesOrderingOwner`|6.1.0| | | |6.1.0| |`cudaGetDriverEntryPointFlags`|11.3| | | | | | | | | | |`cudaGraphCondAssignDefault`|12.3| | | | | | | | | | |`cudaGraphCondTypeIf`|12.3| | | | | | | | | | @@ -1151,19 +1151,19 @@ |`cudaGraphExecUpdateResultInfo_st`|12.0| | | | | | | | | | |`cudaGraphExecUpdateSuccess`|10.2| | | 
|`hipGraphExecUpdateSuccess`|4.3.0| | | | | |`cudaGraphExec_t`|10.0| | | |`hipGraphExec_t`|4.3.0| | | | | -|`cudaGraphInstantiateError`|12.0| | | | | | | | | | +|`cudaGraphInstantiateError`|12.0| | | |`hipGraphInstantiateError`|6.1.0| | | |6.1.0| |`cudaGraphInstantiateFlagAutoFreeOnLaunch`|11.4| | | |`hipGraphInstantiateFlagAutoFreeOnLaunch`|5.2.0| | | | | |`cudaGraphInstantiateFlagDeviceLaunch`|12.0| | | |`hipGraphInstantiateFlagDeviceLaunch`|5.6.0| | | | | |`cudaGraphInstantiateFlagUpload`|12.0| | | |`hipGraphInstantiateFlagUpload`|5.6.0| | | | | |`cudaGraphInstantiateFlagUseNodePriority`|11.7| | | |`hipGraphInstantiateFlagUseNodePriority`|5.6.0| | | | | |`cudaGraphInstantiateFlags`|11.4| | | |`hipGraphInstantiateFlags`|5.2.0| | | | | -|`cudaGraphInstantiateInvalidStructure`|12.0| | | | | | | | | | -|`cudaGraphInstantiateMultipleDevicesNotSupported`|12.0| | | | | | | | | | -|`cudaGraphInstantiateNodeOperationNotSupported`|12.0| | | | | | | | | | -|`cudaGraphInstantiateParams`|12.0| | | | | | | | | | -|`cudaGraphInstantiateParams_st`|12.0| | | | | | | | | | -|`cudaGraphInstantiateResult`|12.0| | | | | | | | | | -|`cudaGraphInstantiateSuccess`|12.0| | | | | | | | | | +|`cudaGraphInstantiateInvalidStructure`|12.0| | | |`hipGraphInstantiateInvalidStructure`|6.1.0| | | |6.1.0| +|`cudaGraphInstantiateMultipleDevicesNotSupported`|12.0| | | |`hipGraphInstantiateMultipleDevicesNotSupported`|6.1.0| | | |6.1.0| +|`cudaGraphInstantiateNodeOperationNotSupported`|12.0| | | |`hipGraphInstantiateNodeOperationNotSupported`|6.1.0| | | |6.1.0| +|`cudaGraphInstantiateParams`|12.0| | | |`hipGraphInstantiateParams`|6.1.0| | | |6.1.0| +|`cudaGraphInstantiateParams_st`|12.0| | | |`hipGraphInstantiateParams`|6.1.0| | | |6.1.0| +|`cudaGraphInstantiateResult`|12.0| | | |`hipGraphInstantiateResult`|6.1.0| | | |6.1.0| +|`cudaGraphInstantiateSuccess`|12.0| | | |`hipGraphInstantiateSuccess`|6.1.0| | | |6.1.0| |`cudaGraphKernelNodePortDefault`|12.3| | | | | | | | | | 
|`cudaGraphKernelNodePortLaunchCompletion`|12.3| | | | | | | | | | |`cudaGraphKernelNodePortProgrammatic`|12.3| | | | | | | | | | @@ -1172,7 +1172,7 @@ |`cudaGraphMemAttrUsedMemCurrent`|11.4| | | |`hipGraphMemAttrUsedMemCurrent`|5.3.0| | | | | |`cudaGraphMemAttrUsedMemHigh`|11.4| | | |`hipGraphMemAttrUsedMemHigh`|5.3.0| | | | | |`cudaGraphMemAttributeType`|11.4| | | |`hipGraphMemAttributeType`|5.3.0| | | | | -|`cudaGraphNodeParams`|12.2| | | | | | | | | | +|`cudaGraphNodeParams`|12.2| | | |`hipGraphNodeParams`|6.1.0| | | |6.1.0| |`cudaGraphNodeType`|10.0| | | |`hipGraphNodeType`|4.3.0| | | | | |`cudaGraphNodeTypeConditional`|12.3| | | |`hipGraphNodeTypeConditional`| | | | | | |`cudaGraphNodeTypeCount`|10.0| | | |`hipGraphNodeTypeCount`|4.3.0| | | | | @@ -1297,7 +1297,7 @@ |`cudaMemAttachSingle`| | | | |`hipMemAttachSingle`|3.7.0| | | | | |`cudaMemFabricHandle_st`|12.3| | | | | | | | | | |`cudaMemFabricHandle_t`|12.3| | | | | | | | | | -|`cudaMemFreeNodeParams`|12.2| | | | | | | | | | +|`cudaMemFreeNodeParams`|12.2| | | |`hipMemFreeNodeParams`|6.1.0| | | |6.1.0| |`cudaMemHandleTypeNone`|11.2| | | |`hipMemHandleTypeNone`|5.2.0| | | | | |`cudaMemHandleTypePosixFileDescriptor`|11.2| | | |`hipMemHandleTypePosixFileDescriptor`|5.2.0| | | | | |`cudaMemHandleTypeWin32`|11.2| | | |`hipMemHandleTypeWin32`|5.2.0| | | | | @@ -1338,7 +1338,7 @@ |`cudaMemcpyHostToDevice`| | | | |`hipMemcpyHostToDevice`|1.5.0| | | | | |`cudaMemcpyHostToHost`| | | | |`hipMemcpyHostToHost`|1.5.0| | | | | |`cudaMemcpyKind`| | | | |`hipMemcpyKind`|1.5.0| | | | | -|`cudaMemcpyNodeParams`|12.2| | | | | | | | | | +|`cudaMemcpyNodeParams`|12.2| | | |`hipMemcpyNodeParams`|6.1.0| | | |6.1.0| |`cudaMemoryAdvise`|8.0| | | |`hipMemoryAdvise`|3.7.0| | | | | |`cudaMemoryType`| | | | |`hipMemoryType`|1.6.0| | | | | |`cudaMemoryTypeDevice`| | | | |`hipMemoryTypeDevice`|1.6.0| | | | | diff --git a/docs/tables/CUSPARSE_API_supported_by_HIP.md b/docs/tables/CUSPARSE_API_supported_by_HIP.md index 9a3cd43c..09a76186 
100644 --- a/docs/tables/CUSPARSE_API_supported_by_HIP.md +++ b/docs/tables/CUSPARSE_API_supported_by_HIP.md @@ -221,33 +221,33 @@ |**CUDA**|**A**|**D**|**C**|**R**|**HIP**|**A**|**D**|**C**|**R**|**E**| |:--|:-:|:-:|:-:|:-:|:--|:-:|:-:|:-:|:-:|:-:| |`cusparseCopyMatDescr`|8.0| | |12.0|`hipsparseCopyMatDescr`|1.9.2| | | | | -|`cusparseCreateBsric02Info`| |12.2| | |`hipsparseCreateBsric02Info`|3.8.0| | | | | -|`cusparseCreateBsrilu02Info`| |12.2| | |`hipsparseCreateBsrilu02Info`|3.9.0| | | | | -|`cusparseCreateBsrsm2Info`| |12.2| | |`hipsparseCreateBsrsm2Info`|4.5.0| | | | | -|`cusparseCreateBsrsv2Info`| |12.2| | |`hipsparseCreateBsrsv2Info`|3.6.0| | | | | -|`cusparseCreateColorInfo`| |12.2| | |`hipsparseCreateColorInfo`|4.5.0| | | | | +|`cusparseCreateBsric02Info`| |12.2| | |`hipsparseCreateBsric02Info`|3.8.0|6.1.0| | | | +|`cusparseCreateBsrilu02Info`| |12.2| | |`hipsparseCreateBsrilu02Info`|3.9.0|6.1.0| | | | +|`cusparseCreateBsrsm2Info`| |12.2| | |`hipsparseCreateBsrsm2Info`|4.5.0|6.1.0| | | | +|`cusparseCreateBsrsv2Info`| |12.2| | |`hipsparseCreateBsrsv2Info`|3.6.0|6.1.0| | | | +|`cusparseCreateColorInfo`| |12.2| | |`hipsparseCreateColorInfo`|4.5.0|6.1.0| | | | |`cusparseCreateCsrgemm2Info`| |11.0| |12.0|`hipsparseCreateCsrgemm2Info`|2.8.0| | | | | -|`cusparseCreateCsric02Info`| |12.2| | |`hipsparseCreateCsric02Info`|3.1.0| | | | | -|`cusparseCreateCsrilu02Info`| |12.2| | |`hipsparseCreateCsrilu02Info`|1.9.2| | | | | +|`cusparseCreateCsric02Info`| |12.2| | |`hipsparseCreateCsric02Info`|3.1.0|6.1.0| | | | +|`cusparseCreateCsrilu02Info`| |12.2| | |`hipsparseCreateCsrilu02Info`|1.9.2|6.1.0| | | | |`cusparseCreateCsrsm2Info`|9.2|11.3| |12.0|`hipsparseCreateCsrsm2Info`|3.1.0| | | | | |`cusparseCreateCsrsv2Info`| |11.3| |12.0|`hipsparseCreateCsrsv2Info`|1.9.2| | | | | |`cusparseCreateHybMat`| |10.2| |11.0|`hipsparseCreateHybMat`|1.9.2| | | | | |`cusparseCreateMatDescr`| | | | |`hipsparseCreateMatDescr`|1.9.2| | | | | -|`cusparseCreatePruneInfo`|9.0|12.2| | 
|`hipsparseCreatePruneInfo`|3.9.0| | | | | +|`cusparseCreatePruneInfo`|9.0|12.2| | |`hipsparseCreatePruneInfo`|3.9.0|6.1.0| | | | |`cusparseCreateSolveAnalysisInfo`| |10.2| |11.0| | | | | | | -|`cusparseDestroyBsric02Info`| |12.2| | |`hipsparseDestroyBsric02Info`|3.8.0| | | | | -|`cusparseDestroyBsrilu02Info`| |12.2| | |`hipsparseDestroyBsrilu02Info`|3.9.0| | | | | -|`cusparseDestroyBsrsm2Info`| |12.2| | |`hipsparseDestroyBsrsm2Info`|4.5.0| | | | | -|`cusparseDestroyBsrsv2Info`| |12.2| | |`hipsparseDestroyBsrsv2Info`|3.6.0| | | | | -|`cusparseDestroyColorInfo`| |12.2| | |`hipsparseDestroyColorInfo`|4.5.0| | | | | +|`cusparseDestroyBsric02Info`| |12.2| | |`hipsparseDestroyBsric02Info`|3.8.0|6.1.0| | | | +|`cusparseDestroyBsrilu02Info`| |12.2| | |`hipsparseDestroyBsrilu02Info`|3.9.0|6.1.0| | | | +|`cusparseDestroyBsrsm2Info`| |12.2| | |`hipsparseDestroyBsrsm2Info`|4.5.0|6.1.0| | | | +|`cusparseDestroyBsrsv2Info`| |12.2| | |`hipsparseDestroyBsrsv2Info`|3.6.0|6.1.0| | | | +|`cusparseDestroyColorInfo`| |12.2| | |`hipsparseDestroyColorInfo`|4.5.0|6.1.0| | | | |`cusparseDestroyCsrgemm2Info`| |11.0| |12.0|`hipsparseDestroyCsrgemm2Info`|2.8.0| | | | | -|`cusparseDestroyCsric02Info`| |12.2| | |`hipsparseDestroyCsric02Info`|3.1.0| | | | | -|`cusparseDestroyCsrilu02Info`| |12.2| | |`hipsparseDestroyCsrilu02Info`|1.9.2| | | | | +|`cusparseDestroyCsric02Info`| |12.2| | |`hipsparseDestroyCsric02Info`|3.1.0|6.1.0| | | | +|`cusparseDestroyCsrilu02Info`| |12.2| | |`hipsparseDestroyCsrilu02Info`|1.9.2|6.1.0| | | | |`cusparseDestroyCsrsm2Info`|9.2|11.3| |12.0|`hipsparseDestroyCsrsm2Info`|3.1.0| | | | | |`cusparseDestroyCsrsv2Info`| |11.3| |12.0|`hipsparseDestroyCsrsv2Info`|1.9.2| | | | | |`cusparseDestroyHybMat`| |10.2| |11.0|`hipsparseDestroyHybMat`|1.9.2| | | | | |`cusparseDestroyMatDescr`| | | | |`hipsparseDestroyMatDescr`|1.9.2| | | | | -|`cusparseDestroyPruneInfo`|9.0|12.2| | |`hipsparseDestroyPruneInfo`|3.9.0| | | | | +|`cusparseDestroyPruneInfo`|9.0|12.2| | 
|`hipsparseDestroyPruneInfo`|3.9.0|6.1.0| | | | |`cusparseDestroySolveAnalysisInfo`| |10.2| |11.0| | | | | | | |`cusparseGetLevelInfo`| | | |11.0| | | | | | | |`cusparseGetMatDiagType`| | | | |`hipsparseGetMatDiagType`|1.9.2| | | | | @@ -293,11 +293,11 @@ |**CUDA**|**A**|**D**|**C**|**R**|**HIP**|**A**|**D**|**C**|**R**|**E**| |:--|:-:|:-:|:-:|:-:|:--|:-:|:-:|:-:|:-:|:-:| |`cusparseCbsrmv`| | | | |`hipsparseCbsrmv`|3.5.0| | | | | -|`cusparseCbsrsv2_analysis`| |12.2| | |`hipsparseCbsrsv2_analysis`|3.6.0| | | | | -|`cusparseCbsrsv2_bufferSize`| |12.2| | |`hipsparseCbsrsv2_bufferSize`|3.6.0| | | | | +|`cusparseCbsrsv2_analysis`| |12.2| | |`hipsparseCbsrsv2_analysis`|3.6.0|6.1.0| | | | +|`cusparseCbsrsv2_bufferSize`| |12.2| | |`hipsparseCbsrsv2_bufferSize`|3.6.0|6.1.0| | | | |`cusparseCbsrsv2_bufferSizeExt`| |12.2| | |`hipsparseCbsrsv2_bufferSizeExt`|3.6.0| | | | | -|`cusparseCbsrsv2_solve`| |12.2| | |`hipsparseCbsrsv2_solve`|3.6.0| | | | | -|`cusparseCbsrxmv`| |12.2| | |`hipsparseCbsrxmv`|4.5.0| | | | | +|`cusparseCbsrsv2_solve`| |12.2| | |`hipsparseCbsrsv2_solve`|3.6.0|6.1.0| | | | +|`cusparseCbsrxmv`| |12.2| | |`hipsparseCbsrxmv`|4.5.0|6.1.0| | | | |`cusparseCcsrmv`| |10.2| |11.0|`hipsparseCcsrmv`|3.1.0| | | | | |`cusparseCcsrmv_mp`|8.0|10.2| |11.0| | | | | | | |`cusparseCcsrsv2_analysis`| |11.3| |12.0|`hipsparseCcsrsv2_analysis`|3.1.0| | | | | @@ -316,11 +316,11 @@ |`cusparseCsrsv_analysisEx`|8.0|10.2| |11.0| | | | | | | |`cusparseCsrsv_solveEx`|8.0|10.2| |11.0| | | | | | | |`cusparseDbsrmv`| | | | |`hipsparseDbsrmv`|3.5.0| | | | | -|`cusparseDbsrsv2_analysis`| |12.2| | |`hipsparseDbsrsv2_analysis`|3.6.0| | | | | -|`cusparseDbsrsv2_bufferSize`| |12.2| | |`hipsparseDbsrsv2_bufferSize`|3.6.0| | | | | +|`cusparseDbsrsv2_analysis`| |12.2| | |`hipsparseDbsrsv2_analysis`|3.6.0|6.1.0| | | | +|`cusparseDbsrsv2_bufferSize`| |12.2| | |`hipsparseDbsrsv2_bufferSize`|3.6.0|6.1.0| | | | |`cusparseDbsrsv2_bufferSizeExt`| |12.2| | |`hipsparseDbsrsv2_bufferSizeExt`|3.6.0| | | | | 
-|`cusparseDbsrsv2_solve`| |12.2| | |`hipsparseDbsrsv2_solve`|3.6.0| | | | | -|`cusparseDbsrxmv`| |12.2| | |`hipsparseDbsrxmv`|4.5.0| | | | | +|`cusparseDbsrsv2_solve`| |12.2| | |`hipsparseDbsrsv2_solve`|3.6.0|6.1.0| | | | +|`cusparseDbsrxmv`| |12.2| | |`hipsparseDbsrxmv`|4.5.0|6.1.0| | | | |`cusparseDcsrmv`| |10.2| |11.0|`hipsparseDcsrmv`|1.9.2| | | | | |`cusparseDcsrmv_mp`|8.0|10.2| |11.0| | | | | | | |`cusparseDcsrsv2_analysis`| |11.3| |12.0|`hipsparseDcsrsv2_analysis`|1.9.2| | | | | @@ -335,11 +335,11 @@ |`cusparseDhybsv_analysis`| |10.2| |11.0| | | | | | | |`cusparseDhybsv_solve`| |10.2| |11.0| | | | | | | |`cusparseSbsrmv`| | | | |`hipsparseSbsrmv`|3.5.0| | | | | -|`cusparseSbsrsv2_analysis`| |12.2| | |`hipsparseSbsrsv2_analysis`|3.6.0| | | | | -|`cusparseSbsrsv2_bufferSize`| |12.2| | |`hipsparseSbsrsv2_bufferSize`|3.6.0| | | | | +|`cusparseSbsrsv2_analysis`| |12.2| | |`hipsparseSbsrsv2_analysis`|3.6.0|6.1.0| | | | +|`cusparseSbsrsv2_bufferSize`| |12.2| | |`hipsparseSbsrsv2_bufferSize`|3.6.0|6.1.0| | | | |`cusparseSbsrsv2_bufferSizeExt`| |12.2| | |`hipsparseSbsrsv2_bufferSizeExt`|3.6.0| | | | | -|`cusparseSbsrsv2_solve`| |12.2| | |`hipsparseSbsrsv2_solve`|3.6.0| | | | | -|`cusparseSbsrxmv`| |12.2| | |`hipsparseSbsrxmv`|4.5.0| | | | | +|`cusparseSbsrsv2_solve`| |12.2| | |`hipsparseSbsrsv2_solve`|3.6.0|6.1.0| | | | +|`cusparseSbsrxmv`| |12.2| | |`hipsparseSbsrxmv`|4.5.0|6.1.0| | | | |`cusparseScsrmv`| |10.2| |11.0|`hipsparseScsrmv`|1.9.2| | | | | |`cusparseScsrmv_mp`|8.0|10.2| |11.0| | | | | | | |`cusparseScsrsv2_analysis`| |11.3| |12.0|`hipsparseScsrsv2_analysis`|1.9.2| | | | | @@ -353,14 +353,14 @@ |`cusparseShybmv`| |10.2| |11.0|`hipsparseShybmv`|1.9.2| | | | | |`cusparseShybsv_analysis`| |10.2| |11.0| | | | | | | |`cusparseShybsv_solve`| |10.2| |11.0| | | | | | | -|`cusparseXbsrsv2_zeroPivot`| |12.2| | |`hipsparseXbsrsv2_zeroPivot`|3.6.0| | | | | +|`cusparseXbsrsv2_zeroPivot`| |12.2| | |`hipsparseXbsrsv2_zeroPivot`|3.6.0|6.1.0| | | | 
|`cusparseXcsrsv2_zeroPivot`| |11.3| |12.0|`hipsparseXcsrsv2_zeroPivot`|1.9.2| | | | | |`cusparseZbsrmv`| | | | |`hipsparseZbsrmv`|3.5.0| | | | | -|`cusparseZbsrsv2_analysis`| |12.2| | |`hipsparseZbsrsv2_analysis`|3.6.0| | | | | -|`cusparseZbsrsv2_bufferSize`| |12.2| | |`hipsparseZbsrsv2_bufferSize`|3.6.0| | | | | +|`cusparseZbsrsv2_analysis`| |12.2| | |`hipsparseZbsrsv2_analysis`|3.6.0|6.1.0| | | | +|`cusparseZbsrsv2_bufferSize`| |12.2| | |`hipsparseZbsrsv2_bufferSize`|3.6.0|6.1.0| | | | |`cusparseZbsrsv2_bufferSizeExt`| |12.2| | |`hipsparseZbsrsv2_bufferSizeExt`|3.6.0| | | | | -|`cusparseZbsrsv2_solve`| |12.2| | |`hipsparseZbsrsv2_solve`|3.6.0| | | | | -|`cusparseZbsrxmv`| |12.2| | |`hipsparseZbsrxmv`|4.5.0| | | | | +|`cusparseZbsrsv2_solve`| |12.2| | |`hipsparseZbsrsv2_solve`|3.6.0|6.1.0| | | | +|`cusparseZbsrxmv`| |12.2| | |`hipsparseZbsrxmv`|4.5.0|6.1.0| | | | |`cusparseZcsrmv`| |10.2| |11.0|`hipsparseZcsrmv`|3.1.0| | | | | |`cusparseZcsrmv_mp`|8.0|10.2| |11.0| | | | | | | |`cusparseZcsrsv2_analysis`| |11.3| |12.0|`hipsparseZcsrsv2_analysis`|3.1.0| | | | | @@ -380,10 +380,10 @@ |**CUDA**|**A**|**D**|**C**|**R**|**HIP**|**A**|**D**|**C**|**R**|**E**| |:--|:-:|:-:|:-:|:-:|:--|:-:|:-:|:-:|:-:|:-:| |`cusparseCbsrmm`| | | | |`hipsparseCbsrmm`|3.7.0| | | | | -|`cusparseCbsrsm2_analysis`| |12.2| | |`hipsparseCbsrsm2_analysis`|4.5.0| | | | | -|`cusparseCbsrsm2_bufferSize`| |12.2| | |`hipsparseCbsrsm2_bufferSize`|4.5.0| | | | | +|`cusparseCbsrsm2_analysis`| |12.2| | |`hipsparseCbsrsm2_analysis`|4.5.0|6.1.0| | | | +|`cusparseCbsrsm2_bufferSize`| |12.2| | |`hipsparseCbsrsm2_bufferSize`|4.5.0|6.1.0| | | | |`cusparseCbsrsm2_bufferSizeExt`| |12.2| | | | | | | | | -|`cusparseCbsrsm2_solve`| |12.2| | |`hipsparseCbsrsm2_solve`|4.5.0| | | | | +|`cusparseCbsrsm2_solve`| |12.2| | |`hipsparseCbsrsm2_solve`|4.5.0|6.1.0| | | | |`cusparseCcsrmm`| |10.2| |11.0|`hipsparseCcsrmm`|3.1.0| | | | | |`cusparseCcsrmm2`| |10.2| |11.0|`hipsparseCcsrmm2`|3.1.0| | | | | 
|`cusparseCcsrsm2_analysis`|9.2|11.3| |12.0|`hipsparseCcsrsm2_analysis`|3.1.0| | | | | @@ -393,10 +393,10 @@ |`cusparseCcsrsm_solve`| |10.2| |11.0| | | | | | | |`cusparseCgemmi`|8.0|11.0| |12.0|`hipsparseCgemmi`|3.7.0| | | | | |`cusparseDbsrmm`| | | | |`hipsparseDbsrmm`|3.7.0| | | | | -|`cusparseDbsrsm2_analysis`| |12.2| | |`hipsparseDbsrsm2_analysis`|4.5.0| | | | | -|`cusparseDbsrsm2_bufferSize`| |12.2| | |`hipsparseDbsrsm2_bufferSize`|4.5.0| | | | | +|`cusparseDbsrsm2_analysis`| |12.2| | |`hipsparseDbsrsm2_analysis`|4.5.0|6.1.0| | | | +|`cusparseDbsrsm2_bufferSize`| |12.2| | |`hipsparseDbsrsm2_bufferSize`|4.5.0|6.1.0| | | | |`cusparseDbsrsm2_bufferSizeExt`| |12.2| | | | | | | | | -|`cusparseDbsrsm2_solve`| |12.2| | |`hipsparseDbsrsm2_solve`|4.5.0| | | | | +|`cusparseDbsrsm2_solve`| |12.2| | |`hipsparseDbsrsm2_solve`|4.5.0|6.1.0| | | | |`cusparseDcsrmm`| |10.2| |11.0|`hipsparseDcsrmm`|1.9.2| | | | | |`cusparseDcsrmm2`| |10.2| |11.0|`hipsparseDcsrmm2`|1.9.2| | | | | |`cusparseDcsrsm2_analysis`|9.2|11.3| |12.0|`hipsparseDcsrsm2_analysis`|3.1.0| | | | | @@ -406,10 +406,10 @@ |`cusparseDcsrsm_solve`| |10.2| |11.0| | | | | | | |`cusparseDgemmi`|8.0|11.0| |12.0|`hipsparseDgemmi`|3.7.0| | | | | |`cusparseSbsrmm`| | | | |`hipsparseSbsrmm`|3.7.0| | | | | -|`cusparseSbsrsm2_analysis`| |12.2| | |`hipsparseSbsrsm2_analysis`|4.5.0| | | | | -|`cusparseSbsrsm2_bufferSize`| |12.2| | |`hipsparseSbsrsm2_bufferSize`|4.5.0| | | | | +|`cusparseSbsrsm2_analysis`| |12.2| | |`hipsparseSbsrsm2_analysis`|4.5.0|6.1.0| | | | +|`cusparseSbsrsm2_bufferSize`| |12.2| | |`hipsparseSbsrsm2_bufferSize`|4.5.0|6.1.0| | | | |`cusparseSbsrsm2_bufferSizeExt`| |12.2| | | | | | | | | -|`cusparseSbsrsm2_solve`| |12.2| | |`hipsparseSbsrsm2_solve`|4.5.0| | | | | +|`cusparseSbsrsm2_solve`| |12.2| | |`hipsparseSbsrsm2_solve`|4.5.0|6.1.0| | | | |`cusparseScsrmm`| |10.2| |11.0|`hipsparseScsrmm`|1.9.2| | | | | |`cusparseScsrmm2`| |10.2| |11.0|`hipsparseScsrmm2`|1.9.2| | | | | |`cusparseScsrsm2_analysis`|9.2|11.3| 
|12.0|`hipsparseScsrsm2_analysis`|3.1.0| | | | | @@ -418,13 +418,13 @@ |`cusparseScsrsm_analysis`| |10.2| |11.0| | | | | | | |`cusparseScsrsm_solve`| |10.2| |11.0| | | | | | | |`cusparseSgemmi`|8.0|11.0| |12.0|`hipsparseSgemmi`|3.7.0| | | | | -|`cusparseXbsrsm2_zeroPivot`| |12.2| | |`hipsparseXbsrsm2_zeroPivot`|4.5.0| | | | | +|`cusparseXbsrsm2_zeroPivot`| |12.2| | |`hipsparseXbsrsm2_zeroPivot`|4.5.0|6.1.0| | | | |`cusparseXcsrsm2_zeroPivot`|9.2|11.3| |12.0|`hipsparseXcsrsm2_zeroPivot`|3.1.0| | | | | |`cusparseZbsrmm`| | | | |`hipsparseZbsrmm`|3.7.0| | | | | -|`cusparseZbsrsm2_analysis`| |12.2| | |`hipsparseZbsrsm2_analysis`|4.5.0| | | | | -|`cusparseZbsrsm2_bufferSize`| |12.2| | |`hipsparseZbsrsm2_bufferSize`|4.5.0| | | | | +|`cusparseZbsrsm2_analysis`| |12.2| | |`hipsparseZbsrsm2_analysis`|4.5.0|6.1.0| | | | +|`cusparseZbsrsm2_bufferSize`| |12.2| | |`hipsparseZbsrsm2_bufferSize`|4.5.0|6.1.0| | | | |`cusparseZbsrsm2_bufferSizeExt`| |12.2| | | | | | | | | -|`cusparseZbsrsm2_solve`| |12.2| | |`hipsparseZbsrsm2_solve`|4.5.0| | | | | +|`cusparseZbsrsm2_solve`| |12.2| | |`hipsparseZbsrsm2_solve`|4.5.0|6.1.0| | | | |`cusparseZcsrmm`| |10.2| |11.0|`hipsparseZcsrmm`|3.1.0| | | | | |`cusparseZcsrmm2`| |10.2| |11.0|`hipsparseZcsrmm2`|3.1.0| | | | | |`cusparseZcsrsm2_analysis`|9.2|11.3| |12.0|`hipsparseZcsrsm2_analysis`|3.1.0| | | | | @@ -471,26 +471,26 @@ |**CUDA**|**A**|**D**|**C**|**R**|**HIP**|**A**|**D**|**C**|**R**|**E**| |:--|:-:|:-:|:-:|:-:|:--|:-:|:-:|:-:|:-:|:-:| -|`cusparseCbsric02`| |12.2| | |`hipsparseCbsric02`|3.8.0| | | | | -|`cusparseCbsric02_analysis`| |12.2| | |`hipsparseCbsric02_analysis`|3.8.0| | | | | -|`cusparseCbsric02_bufferSize`| |12.2| | |`hipsparseCbsric02_bufferSize`|3.8.0| | | | | +|`cusparseCbsric02`| |12.2| | |`hipsparseCbsric02`|3.8.0|6.1.0| | | | +|`cusparseCbsric02_analysis`| |12.2| | |`hipsparseCbsric02_analysis`|3.8.0|6.1.0| | | | +|`cusparseCbsric02_bufferSize`| |12.2| | |`hipsparseCbsric02_bufferSize`|3.8.0|6.1.0| | | | 
|`cusparseCbsric02_bufferSizeExt`| |12.2| | | | | | | | | -|`cusparseCbsrilu02`| |12.2| | |`hipsparseCbsrilu02`|3.9.0| | | | | -|`cusparseCbsrilu02_analysis`| |12.2| | |`hipsparseCbsrilu02_analysis`|3.9.0| | | | | -|`cusparseCbsrilu02_bufferSize`| |12.2| | |`hipsparseCbsrilu02_bufferSize`|3.9.0| | | | | +|`cusparseCbsrilu02`| |12.2| | |`hipsparseCbsrilu02`|3.9.0|6.1.0| | | | +|`cusparseCbsrilu02_analysis`| |12.2| | |`hipsparseCbsrilu02_analysis`|3.9.0|6.1.0| | | | +|`cusparseCbsrilu02_bufferSize`| |12.2| | |`hipsparseCbsrilu02_bufferSize`|3.9.0|6.1.0| | | | |`cusparseCbsrilu02_bufferSizeExt`| |12.2| | | | | | | | | -|`cusparseCbsrilu02_numericBoost`| |12.2| | |`hipsparseCbsrilu02_numericBoost`|3.9.0| | | | | +|`cusparseCbsrilu02_numericBoost`| |12.2| | |`hipsparseCbsrilu02_numericBoost`|3.9.0|6.1.0| | | | |`cusparseCcsric0`| |10.2| |11.0| | | | | | | -|`cusparseCcsric02`| |12.2| | |`hipsparseCcsric02`|3.1.0| | | | | -|`cusparseCcsric02_analysis`| |12.2| | |`hipsparseCcsric02_analysis`|3.1.0| | | | | -|`cusparseCcsric02_bufferSize`| |12.2| | |`hipsparseCcsric02_bufferSize`|3.1.0| | | | | +|`cusparseCcsric02`| |12.2| | |`hipsparseCcsric02`|3.1.0|6.1.0| | | | +|`cusparseCcsric02_analysis`| |12.2| | |`hipsparseCcsric02_analysis`|3.1.0|6.1.0| | | | +|`cusparseCcsric02_bufferSize`| |12.2| | |`hipsparseCcsric02_bufferSize`|3.1.0|6.1.0| | | | |`cusparseCcsric02_bufferSizeExt`| |12.2| | |`hipsparseCcsric02_bufferSizeExt`|3.1.0| | | | | |`cusparseCcsrilu0`| |10.2| |11.0| | | | | | | -|`cusparseCcsrilu02`| |12.2| | |`hipsparseCcsrilu02`|3.1.0| | | | | -|`cusparseCcsrilu02_analysis`| |12.2| | |`hipsparseCcsrilu02_analysis`|3.1.0| | | | | -|`cusparseCcsrilu02_bufferSize`| |12.2| | |`hipsparseCcsrilu02_bufferSize`|3.1.0| | | | | +|`cusparseCcsrilu02`| |12.2| | |`hipsparseCcsrilu02`|3.1.0|6.1.0| | | | +|`cusparseCcsrilu02_analysis`| |12.2| | |`hipsparseCcsrilu02_analysis`|3.1.0|6.1.0| | | | +|`cusparseCcsrilu02_bufferSize`| |12.2| | |`hipsparseCcsrilu02_bufferSize`|3.1.0|6.1.0| | 
| | |`cusparseCcsrilu02_bufferSizeExt`| |12.2| | |`hipsparseCcsrilu02_bufferSizeExt`|3.1.0| | | | | -|`cusparseCcsrilu02_numericBoost`| |12.2| | |`hipsparseCcsrilu02_numericBoost`|3.10.0| | | | | +|`cusparseCcsrilu02_numericBoost`| |12.2| | |`hipsparseCcsrilu02_numericBoost`|3.10.0|6.1.0| | | | |`cusparseCgpsvInterleavedBatch`|9.2| | | |`hipsparseCgpsvInterleavedBatch`|5.1.0| | | | | |`cusparseCgpsvInterleavedBatch_bufferSizeExt`|9.2| | | |`hipsparseCgpsvInterleavedBatch_bufferSizeExt`|5.1.0| | | | | |`cusparseCgtsv`| |10.2| |11.0| | | | | | | @@ -505,26 +505,26 @@ |`cusparseCgtsvStridedBatch`| |10.2| |11.0| | | | | | | |`cusparseCgtsv_nopivot`| |10.2| |11.0| | | | | | | |`cusparseCsrilu0Ex`|8.0|10.2| |11.0| | | | | | | -|`cusparseDbsric02`| |12.2| | |`hipsparseDbsric02`|3.8.0| | | | | -|`cusparseDbsric02_analysis`| |12.2| | |`hipsparseDbsric02_analysis`|3.8.0| | | | | -|`cusparseDbsric02_bufferSize`| |12.2| | |`hipsparseDbsric02_bufferSize`|3.8.0| | | | | +|`cusparseDbsric02`| |12.2| | |`hipsparseDbsric02`|3.8.0|6.1.0| | | | +|`cusparseDbsric02_analysis`| |12.2| | |`hipsparseDbsric02_analysis`|3.8.0|6.1.0| | | | +|`cusparseDbsric02_bufferSize`| |12.2| | |`hipsparseDbsric02_bufferSize`|3.8.0|6.1.0| | | | |`cusparseDbsric02_bufferSizeExt`| |12.2| | | | | | | | | -|`cusparseDbsrilu02`| |12.2| | |`hipsparseDbsrilu02`|3.9.0| | | | | -|`cusparseDbsrilu02_analysis`| |12.2| | |`hipsparseDbsrilu02_analysis`|3.9.0| | | | | -|`cusparseDbsrilu02_bufferSize`| |12.2| | |`hipsparseDbsrilu02_bufferSize`|3.9.0| | | | | +|`cusparseDbsrilu02`| |12.2| | |`hipsparseDbsrilu02`|3.9.0|6.1.0| | | | +|`cusparseDbsrilu02_analysis`| |12.2| | |`hipsparseDbsrilu02_analysis`|3.9.0|6.1.0| | | | +|`cusparseDbsrilu02_bufferSize`| |12.2| | |`hipsparseDbsrilu02_bufferSize`|3.9.0|6.1.0| | | | |`cusparseDbsrilu02_bufferSizeExt`| |12.2| | | | | | | | | -|`cusparseDbsrilu02_numericBoost`| |12.2| | |`hipsparseDbsrilu02_numericBoost`|3.9.0| | | | | +|`cusparseDbsrilu02_numericBoost`| |12.2| | 
|`hipsparseDbsrilu02_numericBoost`|3.9.0|6.1.0| | | | |`cusparseDcsric0`| |10.2| |11.0| | | | | | | -|`cusparseDcsric02`| |12.2| | |`hipsparseDcsric02`|3.1.0| | | | | -|`cusparseDcsric02_analysis`| |12.2| | |`hipsparseDcsric02_analysis`|3.1.0| | | | | -|`cusparseDcsric02_bufferSize`| |12.2| | |`hipsparseDcsric02_bufferSize`|3.1.0| | | | | +|`cusparseDcsric02`| |12.2| | |`hipsparseDcsric02`|3.1.0|6.1.0| | | | +|`cusparseDcsric02_analysis`| |12.2| | |`hipsparseDcsric02_analysis`|3.1.0|6.1.0| | | | +|`cusparseDcsric02_bufferSize`| |12.2| | |`hipsparseDcsric02_bufferSize`|3.1.0|6.1.0| | | | |`cusparseDcsric02_bufferSizeExt`| |12.2| | |`hipsparseDcsric02_bufferSizeExt`|3.1.0| | | | | |`cusparseDcsrilu0`| |10.2| |11.0| | | | | | | -|`cusparseDcsrilu02`| |12.2| | |`hipsparseDcsrilu02`|1.9.2| | | | | -|`cusparseDcsrilu02_analysis`| |12.2| | |`hipsparseDcsrilu02_analysis`|1.9.2| | | | | -|`cusparseDcsrilu02_bufferSize`| |12.2| | |`hipsparseDcsrilu02_bufferSize`|1.9.2| | | | | +|`cusparseDcsrilu02`| |12.2| | |`hipsparseDcsrilu02`|1.9.2|6.1.0| | | | +|`cusparseDcsrilu02_analysis`| |12.2| | |`hipsparseDcsrilu02_analysis`|1.9.2|6.1.0| | | | +|`cusparseDcsrilu02_bufferSize`| |12.2| | |`hipsparseDcsrilu02_bufferSize`|1.9.2|6.1.0| | | | |`cusparseDcsrilu02_bufferSizeExt`| |12.2| | |`hipsparseDcsrilu02_bufferSizeExt`|1.9.2| | | | | -|`cusparseDcsrilu02_numericBoost`| |12.2| | |`hipsparseDcsrilu02_numericBoost`|3.10.0| | | | | +|`cusparseDcsrilu02_numericBoost`| |12.2| | |`hipsparseDcsrilu02_numericBoost`|3.10.0|6.1.0| | | | |`cusparseDgpsvInterleavedBatch`|9.2| | | |`hipsparseDgpsvInterleavedBatch`|5.1.0| | | | | |`cusparseDgpsvInterleavedBatch_bufferSizeExt`|9.2| | | |`hipsparseDgpsvInterleavedBatch_bufferSizeExt`|5.1.0| | | | | |`cusparseDgtsv`| |10.2| |11.0| | | | | | | @@ -538,26 +538,26 @@ |`cusparseDgtsvInterleavedBatch_bufferSizeExt`|9.2| | | |`hipsparseDgtsvInterleavedBatch_bufferSizeExt`|5.1.0| | | | | |`cusparseDgtsvStridedBatch`| |10.2| |11.0| | | | | | | 
|`cusparseDgtsv_nopivot`| |10.2| |11.0| | | | | | | -|`cusparseSbsric02`| |12.2| | |`hipsparseSbsric02`|3.8.0| | | | | -|`cusparseSbsric02_analysis`| |12.2| | |`hipsparseSbsric02_analysis`|3.8.0| | | | | -|`cusparseSbsric02_bufferSize`| |12.2| | |`hipsparseSbsric02_bufferSize`|3.8.0| | | | | +|`cusparseSbsric02`| |12.2| | |`hipsparseSbsric02`|3.8.0|6.1.0| | | | +|`cusparseSbsric02_analysis`| |12.2| | |`hipsparseSbsric02_analysis`|3.8.0|6.1.0| | | | +|`cusparseSbsric02_bufferSize`| |12.2| | |`hipsparseSbsric02_bufferSize`|3.8.0|6.1.0| | | | |`cusparseSbsric02_bufferSizeExt`| |12.2| | | | | | | | | -|`cusparseSbsrilu02`| |12.2| | |`hipsparseSbsrilu02`|3.9.0| | | | | -|`cusparseSbsrilu02_analysis`| |12.2| | |`hipsparseSbsrilu02_analysis`|3.9.0| | | | | -|`cusparseSbsrilu02_bufferSize`| |12.2| | |`hipsparseSbsrilu02_bufferSize`|3.9.0| | | | | +|`cusparseSbsrilu02`| |12.2| | |`hipsparseSbsrilu02`|3.9.0|6.1.0| | | | +|`cusparseSbsrilu02_analysis`| |12.2| | |`hipsparseSbsrilu02_analysis`|3.9.0|6.1.0| | | | +|`cusparseSbsrilu02_bufferSize`| |12.2| | |`hipsparseSbsrilu02_bufferSize`|3.9.0|6.1.0| | | | |`cusparseSbsrilu02_bufferSizeExt`| |12.2| | | | | | | | | -|`cusparseSbsrilu02_numericBoost`| |12.2| | |`hipsparseSbsrilu02_numericBoost`|3.9.0| | | | | +|`cusparseSbsrilu02_numericBoost`| |12.2| | |`hipsparseSbsrilu02_numericBoost`|3.9.0|6.1.0| | | | |`cusparseScsric0`| |10.2| |11.0| | | | | | | -|`cusparseScsric02`| |12.2| | |`hipsparseScsric02`|3.1.0| | | | | -|`cusparseScsric02_analysis`| |12.2| | |`hipsparseScsric02_analysis`|3.1.0| | | | | -|`cusparseScsric02_bufferSize`| |12.2| | |`hipsparseScsric02_bufferSize`|3.1.0| | | | | +|`cusparseScsric02`| |12.2| | |`hipsparseScsric02`|3.1.0|6.1.0| | | | +|`cusparseScsric02_analysis`| |12.2| | |`hipsparseScsric02_analysis`|3.1.0|6.1.0| | | | +|`cusparseScsric02_bufferSize`| |12.2| | |`hipsparseScsric02_bufferSize`|3.1.0|6.1.0| | | | |`cusparseScsric02_bufferSizeExt`| |12.2| | |`hipsparseScsric02_bufferSizeExt`|3.1.0| | | | | 
|`cusparseScsrilu0`| |10.2| |11.0| | | | | | | -|`cusparseScsrilu02`| |12.2| | |`hipsparseScsrilu02`|1.9.2| | | | | -|`cusparseScsrilu02_analysis`| |12.2| | |`hipsparseScsrilu02_analysis`|1.9.2| | | | | -|`cusparseScsrilu02_bufferSize`| |12.2| | |`hipsparseScsrilu02_bufferSize`|1.9.2| | | | | +|`cusparseScsrilu02`| |12.2| | |`hipsparseScsrilu02`|1.9.2|6.1.0| | | | +|`cusparseScsrilu02_analysis`| |12.2| | |`hipsparseScsrilu02_analysis`|1.9.2|6.1.0| | | | +|`cusparseScsrilu02_bufferSize`| |12.2| | |`hipsparseScsrilu02_bufferSize`|1.9.2|6.1.0| | | | |`cusparseScsrilu02_bufferSizeExt`| |12.2| | |`hipsparseScsrilu02_bufferSizeExt`|1.9.2| | | | | -|`cusparseScsrilu02_numericBoost`| |12.2| | |`hipsparseScsrilu02_numericBoost`|3.10.0| | | | | +|`cusparseScsrilu02_numericBoost`| |12.2| | |`hipsparseScsrilu02_numericBoost`|3.10.0|6.1.0| | | | |`cusparseSgpsvInterleavedBatch`|9.2| | | |`hipsparseSgpsvInterleavedBatch`|5.1.0| | | | | |`cusparseSgpsvInterleavedBatch_bufferSizeExt`|9.2| | | |`hipsparseSgpsvInterleavedBatch_bufferSizeExt`|5.1.0| | | | | |`cusparseSgtsv`| |10.2| |11.0| | | | | | | @@ -571,30 +571,30 @@ |`cusparseSgtsvInterleavedBatch_bufferSizeExt`|9.2| | | |`hipsparseSgtsvInterleavedBatch_bufferSizeExt`|5.1.0| | | | | |`cusparseSgtsvStridedBatch`| |10.2| |11.0| | | | | | | |`cusparseSgtsv_nopivot`| |10.2| |11.0| | | | | | | -|`cusparseXbsric02_zeroPivot`| |12.2| | |`hipsparseXbsric02_zeroPivot`|3.8.0| | | | | -|`cusparseXbsrilu02_zeroPivot`| |12.2| | |`hipsparseXbsrilu02_zeroPivot`|3.9.0| | | | | -|`cusparseXcsric02_zeroPivot`| |12.2| | |`hipsparseXcsric02_zeroPivot`|3.1.0| | | | | -|`cusparseXcsrilu02_zeroPivot`| |12.2| | |`hipsparseXcsrilu02_zeroPivot`|1.9.2| | | | | -|`cusparseZbsric02`| |12.2| | |`hipsparseZbsric02`|3.8.0| | | | | -|`cusparseZbsric02_analysis`| |12.2| | |`hipsparseZbsric02_analysis`|3.8.0| | | | | -|`cusparseZbsric02_bufferSize`| |12.2| | |`hipsparseZbsric02_bufferSize`|3.8.0| | | | | +|`cusparseXbsric02_zeroPivot`| |12.2| | 
|`hipsparseXbsric02_zeroPivot`|3.8.0|6.1.0| | | | +|`cusparseXbsrilu02_zeroPivot`| |12.2| | |`hipsparseXbsrilu02_zeroPivot`|3.9.0|6.1.0| | | | +|`cusparseXcsric02_zeroPivot`| |12.2| | |`hipsparseXcsric02_zeroPivot`|3.1.0|6.1.0| | | | +|`cusparseXcsrilu02_zeroPivot`| |12.2| | |`hipsparseXcsrilu02_zeroPivot`|1.9.2|6.1.0| | | | +|`cusparseZbsric02`| |12.2| | |`hipsparseZbsric02`|3.8.0|6.1.0| | | | +|`cusparseZbsric02_analysis`| |12.2| | |`hipsparseZbsric02_analysis`|3.8.0|6.1.0| | | | +|`cusparseZbsric02_bufferSize`| |12.2| | |`hipsparseZbsric02_bufferSize`|3.8.0|6.1.0| | | | |`cusparseZbsric02_bufferSizeExt`| |12.2| | | | | | | | | -|`cusparseZbsrilu02`| |12.2| | |`hipsparseZbsrilu02`|3.9.0| | | | | -|`cusparseZbsrilu02_analysis`| |12.2| | |`hipsparseZbsrilu02_analysis`|3.9.0| | | | | -|`cusparseZbsrilu02_bufferSize`| |12.2| | |`hipsparseZbsrilu02_bufferSize`|3.9.0| | | | | +|`cusparseZbsrilu02`| |12.2| | |`hipsparseZbsrilu02`|3.9.0|6.1.0| | | | +|`cusparseZbsrilu02_analysis`| |12.2| | |`hipsparseZbsrilu02_analysis`|3.9.0|6.1.0| | | | +|`cusparseZbsrilu02_bufferSize`| |12.2| | |`hipsparseZbsrilu02_bufferSize`|3.9.0|6.1.0| | | | |`cusparseZbsrilu02_bufferSizeExt`| |12.2| | | | | | | | | -|`cusparseZbsrilu02_numericBoost`| |12.2| | |`hipsparseZbsrilu02_numericBoost`|3.9.0| | | | | +|`cusparseZbsrilu02_numericBoost`| |12.2| | |`hipsparseZbsrilu02_numericBoost`|3.9.0|6.1.0| | | | |`cusparseZcsric0`| |10.2| |11.0| | | | | | | -|`cusparseZcsric02`| |12.2| | |`hipsparseZcsric02`|3.1.0| | | | | -|`cusparseZcsric02_analysis`| |12.2| | |`hipsparseZcsric02_analysis`|3.1.0| | | | | -|`cusparseZcsric02_bufferSize`| |12.2| | |`hipsparseZcsric02_bufferSize`|3.1.0| | | | | +|`cusparseZcsric02`| |12.2| | |`hipsparseZcsric02`|3.1.0|6.1.0| | | | +|`cusparseZcsric02_analysis`| |12.2| | |`hipsparseZcsric02_analysis`|3.1.0|6.1.0| | | | +|`cusparseZcsric02_bufferSize`| |12.2| | |`hipsparseZcsric02_bufferSize`|3.1.0|6.1.0| | | | |`cusparseZcsric02_bufferSizeExt`| |12.2| | 
|`hipsparseZcsric02_bufferSizeExt`|3.1.0| | | | | |`cusparseZcsrilu0`| |10.2| |11.0| | | | | | | -|`cusparseZcsrilu02`| |12.2| | |`hipsparseZcsrilu02`|3.1.0| | | | | -|`cusparseZcsrilu02_analysis`| |12.2| | |`hipsparseZcsrilu02_analysis`|3.1.0| | | | | -|`cusparseZcsrilu02_bufferSize`| |12.2| | |`hipsparseZcsrilu02_bufferSize`|3.1.0| | | | | +|`cusparseZcsrilu02`| |12.2| | |`hipsparseZcsrilu02`|3.1.0|6.1.0| | | | +|`cusparseZcsrilu02_analysis`| |12.2| | |`hipsparseZcsrilu02_analysis`|3.1.0|6.1.0| | | | +|`cusparseZcsrilu02_bufferSize`| |12.2| | |`hipsparseZcsrilu02_bufferSize`|3.1.0|6.1.0| | | | |`cusparseZcsrilu02_bufferSizeExt`| |12.2| | |`hipsparseZcsrilu02_bufferSizeExt`|3.1.0| | | | | -|`cusparseZcsrilu02_numericBoost`| |12.2| | |`hipsparseZcsrilu02_numericBoost`|3.10.0| | | | | +|`cusparseZcsrilu02_numericBoost`| |12.2| | |`hipsparseZcsrilu02_numericBoost`|3.10.0|6.1.0| | | | |`cusparseZgpsvInterleavedBatch`|9.2| | | |`hipsparseZgpsvInterleavedBatch`|5.1.0| | | | | |`cusparseZgpsvInterleavedBatch_bufferSizeExt`|9.2| | | |`hipsparseZgpsvInterleavedBatch_bufferSizeExt`|5.1.0| | | | | |`cusparseZgtsv`| |10.2| |11.0| | | | | | | @@ -613,10 +613,10 @@ |**CUDA**|**A**|**D**|**C**|**R**|**HIP**|**A**|**D**|**C**|**R**|**E**| |:--|:-:|:-:|:-:|:-:|:--|:-:|:-:|:-:|:-:|:-:| -|`cusparseCcsrcolor`| |12.2| | |`hipsparseCcsrcolor`|4.5.0| | | | | -|`cusparseDcsrcolor`| |12.2| | |`hipsparseDcsrcolor`|4.5.0| | | | | -|`cusparseScsrcolor`| |12.2| | |`hipsparseScsrcolor`|4.5.0| | | | | -|`cusparseZcsrcolor`| |12.2| | |`hipsparseZcsrcolor`|4.5.0| | | | | +|`cusparseCcsrcolor`| |12.2| | |`hipsparseCcsrcolor`|4.5.0|6.1.0| | | | +|`cusparseDcsrcolor`| |12.2| | |`hipsparseDcsrcolor`|4.5.0|6.1.0| | | | +|`cusparseScsrcolor`| |12.2| | |`hipsparseScsrcolor`|4.5.0|6.1.0| | | | +|`cusparseZcsrcolor`| |12.2| | |`hipsparseZcsrcolor`|4.5.0|6.1.0| | | | ## **14. 
CUSPARSE Format Conversion Reference** @@ -628,14 +628,14 @@ |`cusparseCcsr2bsr`| | | | |`hipsparseCcsr2bsr`|3.5.0| | | | | |`cusparseCcsr2csc`| |10.2| |11.0|`hipsparseCcsr2csc`|3.1.0| | | | | |`cusparseCcsr2csr_compress`|8.0|12.2| | |`hipsparseCcsr2csr_compress`|3.5.0| | | | | -|`cusparseCcsr2csru`| |12.2| | |`hipsparseCcsr2csru`|4.2.0| | | | | +|`cusparseCcsr2csru`| |12.2| | |`hipsparseCcsr2csru`|4.2.0|6.1.0| | | | |`cusparseCcsr2dense`| |11.1| |12.0|`hipsparseCcsr2dense`|3.5.0| | | | | |`cusparseCcsr2gebsr`| | | | |`hipsparseCcsr2gebsr`|4.1.0| | | | | |`cusparseCcsr2gebsr_bufferSize`| | | | |`hipsparseCcsr2gebsr_bufferSize`|4.1.0| | | | | |`cusparseCcsr2gebsr_bufferSizeExt`| | | | | | | | | | | |`cusparseCcsr2hyb`| |10.2| |11.0|`hipsparseCcsr2hyb`|3.1.0| | | | | -|`cusparseCcsru2csr`| |12.2| | |`hipsparseCcsru2csr`|4.2.0| | | | | -|`cusparseCcsru2csr_bufferSizeExt`| |12.2| | |`hipsparseCcsru2csr_bufferSizeExt`|4.2.0| | | | | +|`cusparseCcsru2csr`| |12.2| | |`hipsparseCcsru2csr`|4.2.0|6.1.0| | | | +|`cusparseCcsru2csr_bufferSizeExt`| |12.2| | |`hipsparseCcsru2csr_bufferSizeExt`|4.2.0|6.1.0| | | | |`cusparseCdense2csc`| |11.1| |12.0|`hipsparseCdense2csc`|3.5.0| | | | | |`cusparseCdense2csr`| |11.1| |12.0|`hipsparseCdense2csr`|3.5.0| | | | | |`cusparseCdense2hyb`| |10.2| |11.0| | | | | | | @@ -650,9 +650,9 @@ |`cusparseChyb2csr`| |10.2| |11.0|`hipsparseChyb2csr`|3.1.0| | | | | |`cusparseChyb2dense`| |10.2| |11.0| | | | | | | |`cusparseCnnz`| | | | |`hipsparseCnnz`|3.2.0| | | | | -|`cusparseCnnz_compress`|8.0|12.2| | |`hipsparseCnnz_compress`|3.5.0| | | | | +|`cusparseCnnz_compress`|8.0|12.2| | |`hipsparseCnnz_compress`|3.5.0|6.1.0| | | | |`cusparseCreateCsru2csrInfo`| |12.2| | |`hipsparseCreateCsru2csrInfo`|4.2.0| | | | | -|`cusparseCreateIdentityPermutation`| |12.2| | |`hipsparseCreateIdentityPermutation`|1.9.2| | | | | +|`cusparseCreateIdentityPermutation`| |12.2| | |`hipsparseCreateIdentityPermutation`|1.9.2|6.1.0| | | | |`cusparseCsr2cscEx`|8.0|10.2| |11.0| | | 
| | | | |`cusparseCsr2cscEx2`|10.1| | | |`hipsparseCsr2cscEx2`|5.4.0| | | | | |`cusparseCsr2cscEx2_bufferSize`|10.1| | | |`hipsparseCsr2cscEx2_bufferSize`|5.4.0| | | | | @@ -662,14 +662,14 @@ |`cusparseDcsr2bsr`| | | | |`hipsparseDcsr2bsr`|3.5.0| | | | | |`cusparseDcsr2csc`| |10.2| |11.0|`hipsparseDcsr2csc`|1.9.2| | | | | |`cusparseDcsr2csr_compress`|8.0|12.2| | |`hipsparseDcsr2csr_compress`|3.5.0| | | | | -|`cusparseDcsr2csru`| |12.2| | |`hipsparseDcsr2csru`|4.2.0| | | | | +|`cusparseDcsr2csru`| |12.2| | |`hipsparseDcsr2csru`|4.2.0|6.1.0| | | | |`cusparseDcsr2dense`| |11.1| |12.0|`hipsparseDcsr2dense`|3.5.0| | | | | |`cusparseDcsr2gebsr`| | | | |`hipsparseDcsr2gebsr`|4.1.0| | | | | |`cusparseDcsr2gebsr_bufferSize`| | | | |`hipsparseDcsr2gebsr_bufferSize`|4.1.0| | | | | |`cusparseDcsr2gebsr_bufferSizeExt`| | | | | | | | | | | |`cusparseDcsr2hyb`| |10.2| |11.0|`hipsparseDcsr2hyb`|1.9.2| | | | | -|`cusparseDcsru2csr`| |12.2| | |`hipsparseDcsru2csr`|4.2.0| | | | | -|`cusparseDcsru2csr_bufferSizeExt`| |12.2| | |`hipsparseDcsru2csr_bufferSizeExt`|4.2.0| | | | | +|`cusparseDcsru2csr`| |12.2| | |`hipsparseDcsru2csr`|4.2.0|6.1.0| | | | +|`cusparseDcsru2csr_bufferSizeExt`| |12.2| | |`hipsparseDcsru2csr_bufferSizeExt`|4.2.0|6.1.0| | | | |`cusparseDdense2csc`| |11.1| |12.0|`hipsparseDdense2csc`|3.5.0| | | | | |`cusparseDdense2csr`| |11.1| |12.0|`hipsparseDdense2csr`|3.5.0| | | | | |`cusparseDdense2hyb`| |10.2| |11.0| | | | | | | @@ -685,18 +685,18 @@ |`cusparseDhyb2csr`| |10.2| |11.0|`hipsparseDhyb2csr`|3.1.0| | | | | |`cusparseDhyb2dense`| |10.2| |11.0| | | | | | | |`cusparseDnnz`| | | | |`hipsparseDnnz`|3.2.0| | | | | -|`cusparseDnnz_compress`|8.0|12.2| | |`hipsparseDnnz_compress`|3.5.0| | | | | -|`cusparseDpruneCsr2csr`|9.0|12.2| | |`hipsparseDpruneCsr2csr`|3.9.0| | | | | -|`cusparseDpruneCsr2csrByPercentage`|9.0|12.2| | |`hipsparseDpruneCsr2csrByPercentage`|3.9.0| | | | | -|`cusparseDpruneCsr2csrByPercentage_bufferSizeExt`|9.0|12.2| | 
|`hipsparseDpruneCsr2csrByPercentage_bufferSizeExt`|3.9.0| | | | | -|`cusparseDpruneCsr2csrNnz`|9.0|12.2| | |`hipsparseDpruneCsr2csrNnz`|3.9.0| | | | | -|`cusparseDpruneCsr2csrNnzByPercentage`|9.0|12.2| | |`hipsparseDpruneCsr2csrNnzByPercentage`|3.9.0| | | | | -|`cusparseDpruneCsr2csr_bufferSizeExt`|9.0|12.2| | |`hipsparseDpruneCsr2csr_bufferSizeExt`|3.9.0| | | | | -|`cusparseDpruneDense2csr`|9.0|12.2| | |`hipsparseDpruneDense2csr`|3.9.0| | | | | -|`cusparseDpruneDense2csrByPercentage`|9.0|12.2| | |`hipsparseDpruneDense2csrByPercentage`|3.9.0| | | | | -|`cusparseDpruneDense2csrByPercentage_bufferSizeExt`|9.0|12.2| | |`hipsparseDpruneDense2csrByPercentage_bufferSizeExt`|3.9.0| | | | | -|`cusparseDpruneDense2csrNnz`|9.0|12.2| | |`hipsparseDpruneDense2csrNnz`|3.9.0| | | | | -|`cusparseDpruneDense2csrNnzByPercentage`|9.0|12.2| | |`hipsparseDpruneDense2csrNnzByPercentage`|3.9.0| | | | | +|`cusparseDnnz_compress`|8.0|12.2| | |`hipsparseDnnz_compress`|3.5.0|6.1.0| | | | +|`cusparseDpruneCsr2csr`|9.0|12.2| | |`hipsparseDpruneCsr2csr`|3.9.0|6.1.0| | | | +|`cusparseDpruneCsr2csrByPercentage`|9.0|12.2| | |`hipsparseDpruneCsr2csrByPercentage`|3.9.0|6.1.0| | | | +|`cusparseDpruneCsr2csrByPercentage_bufferSizeExt`|9.0|12.2| | |`hipsparseDpruneCsr2csrByPercentage_bufferSizeExt`|3.9.0|6.1.0| | | | +|`cusparseDpruneCsr2csrNnz`|9.0|12.2| | |`hipsparseDpruneCsr2csrNnz`|3.9.0|6.1.0| | | | +|`cusparseDpruneCsr2csrNnzByPercentage`|9.0|12.2| | |`hipsparseDpruneCsr2csrNnzByPercentage`|3.9.0|6.1.0| | | | +|`cusparseDpruneCsr2csr_bufferSizeExt`|9.0|12.2| | |`hipsparseDpruneCsr2csr_bufferSizeExt`|3.9.0|6.1.0| | | | +|`cusparseDpruneDense2csr`|9.0|12.2| | |`hipsparseDpruneDense2csr`|3.9.0|6.1.0| | | | +|`cusparseDpruneDense2csrByPercentage`|9.0|12.2| | |`hipsparseDpruneDense2csrByPercentage`|3.9.0|6.1.0| | | | +|`cusparseDpruneDense2csrByPercentage_bufferSizeExt`|9.0|12.2| | |`hipsparseDpruneDense2csrByPercentage_bufferSizeExt`|3.9.0|6.1.0| | | | +|`cusparseDpruneDense2csrNnz`|9.0|12.2| | 
|`hipsparseDpruneDense2csrNnz`|3.9.0|6.1.0| | | | +|`cusparseDpruneDense2csrNnzByPercentage`|9.0|12.2| | |`hipsparseDpruneDense2csrNnzByPercentage`|3.9.0|6.1.0| | | | |`cusparseDpruneDense2csr_bufferSizeExt`|9.0|12.2| | |`hipsparseDpruneDense2csr_bufferSizeExt`|3.9.0| | | | | |`cusparseHpruneCsr2csr`|9.0|12.2| | | | | | | | | |`cusparseHpruneCsr2csrByPercentage`|9.0|12.2| | | | | | | | | @@ -716,14 +716,14 @@ |`cusparseScsr2bsr`| | | | |`hipsparseScsr2bsr`|3.5.0| | | | | |`cusparseScsr2csc`| |10.2| |11.0|`hipsparseScsr2csc`|1.9.2| | | | | |`cusparseScsr2csr_compress`|8.0|12.2| | |`hipsparseScsr2csr_compress`|3.5.0| | | | | -|`cusparseScsr2csru`| |12.2| | |`hipsparseScsr2csru`|4.2.0| | | | | +|`cusparseScsr2csru`| |12.2| | |`hipsparseScsr2csru`|4.2.0|6.1.0| | | | |`cusparseScsr2dense`| |11.1| |12.0|`hipsparseScsr2dense`|3.5.0| | | | | |`cusparseScsr2gebsr`| | | | |`hipsparseScsr2gebsr`|4.1.0| | | | | |`cusparseScsr2gebsr_bufferSize`| | | | |`hipsparseScsr2gebsr_bufferSize`|4.1.0| | | | | |`cusparseScsr2gebsr_bufferSizeExt`| | | | | | | | | | | |`cusparseScsr2hyb`| |10.2| |11.0|`hipsparseScsr2hyb`|1.9.2| | | | | -|`cusparseScsru2csr`| |12.2| | |`hipsparseScsru2csr`|4.2.0| | | | | -|`cusparseScsru2csr_bufferSizeExt`| |12.2| | |`hipsparseScsru2csr_bufferSizeExt`|4.2.0| | | | | +|`cusparseScsru2csr`| |12.2| | |`hipsparseScsru2csr`|4.2.0|6.1.0| | | | +|`cusparseScsru2csr_bufferSizeExt`| |12.2| | |`hipsparseScsru2csr_bufferSizeExt`|4.2.0|6.1.0| | | | |`cusparseSdense2csc`| |11.1| |12.0|`hipsparseSdense2csc`|3.5.0| | | | | |`cusparseSdense2csr`| |11.1| |12.0|`hipsparseSdense2csr`|3.5.0| | | | | |`cusparseSdense2hyb`| |10.2| |11.0| | | | | | | @@ -738,18 +738,18 @@ |`cusparseShyb2csr`| |10.2| |11.0|`hipsparseShyb2csr`|3.1.0| | | | | |`cusparseShyb2dense`| |10.2| |11.0| | | | | | | |`cusparseSnnz`| | | | |`hipsparseSnnz`|3.2.0| | | | | -|`cusparseSnnz_compress`|8.0|12.2| | |`hipsparseSnnz_compress`|3.5.0| | | | | -|`cusparseSpruneCsr2csr`|9.0|12.2| | 
|`hipsparseSpruneCsr2csr`|3.9.0| | | | | -|`cusparseSpruneCsr2csrByPercentage`|9.0|12.2| | |`hipsparseSpruneCsr2csrByPercentage`|3.9.0| | | | | -|`cusparseSpruneCsr2csrByPercentage_bufferSizeExt`|9.0|12.2| | |`hipsparseSpruneCsr2csrByPercentage_bufferSizeExt`|3.9.0| | | | | -|`cusparseSpruneCsr2csrNnz`|9.0|12.2| | |`hipsparseSpruneCsr2csrNnz`|3.9.0| | | | | -|`cusparseSpruneCsr2csrNnzByPercentage`|9.0|12.2| | |`hipsparseSpruneCsr2csrNnzByPercentage`|3.9.0| | | | | -|`cusparseSpruneCsr2csr_bufferSizeExt`|9.0|12.2| | |`hipsparseSpruneCsr2csr_bufferSizeExt`|3.9.0| | | | | -|`cusparseSpruneDense2csr`|9.0|12.2| | |`hipsparseSpruneDense2csr`|3.9.0| | | | | -|`cusparseSpruneDense2csrByPercentage`|9.0|12.2| | |`hipsparseSpruneDense2csrByPercentage`|3.9.0| | | | | -|`cusparseSpruneDense2csrByPercentage_bufferSizeExt`|9.0|12.2| | |`hipsparseSpruneDense2csrByPercentage_bufferSizeExt`|3.9.0| | | | | -|`cusparseSpruneDense2csrNnz`|9.0|12.2| | |`hipsparseSpruneDense2csrNnz`|3.9.0| | | | | -|`cusparseSpruneDense2csrNnzByPercentage`|9.0|12.2| | |`hipsparseSpruneDense2csrNnzByPercentage`|3.9.0| | | | | +|`cusparseSnnz_compress`|8.0|12.2| | |`hipsparseSnnz_compress`|3.5.0|6.1.0| | | | +|`cusparseSpruneCsr2csr`|9.0|12.2| | |`hipsparseSpruneCsr2csr`|3.9.0|6.1.0| | | | +|`cusparseSpruneCsr2csrByPercentage`|9.0|12.2| | |`hipsparseSpruneCsr2csrByPercentage`|3.9.0|6.1.0| | | | +|`cusparseSpruneCsr2csrByPercentage_bufferSizeExt`|9.0|12.2| | |`hipsparseSpruneCsr2csrByPercentage_bufferSizeExt`|3.9.0|6.1.0| | | | +|`cusparseSpruneCsr2csrNnz`|9.0|12.2| | |`hipsparseSpruneCsr2csrNnz`|3.9.0|6.1.0| | | | +|`cusparseSpruneCsr2csrNnzByPercentage`|9.0|12.2| | |`hipsparseSpruneCsr2csrNnzByPercentage`|3.9.0|6.1.0| | | | +|`cusparseSpruneCsr2csr_bufferSizeExt`|9.0|12.2| | |`hipsparseSpruneCsr2csr_bufferSizeExt`|3.9.0|6.1.0| | | | +|`cusparseSpruneDense2csr`|9.0|12.2| | |`hipsparseSpruneDense2csr`|3.9.0|6.1.0| | | | +|`cusparseSpruneDense2csrByPercentage`|9.0|12.2| | 
|`hipsparseSpruneDense2csrByPercentage`|3.9.0|6.1.0| | | | +|`cusparseSpruneDense2csrByPercentage_bufferSizeExt`|9.0|12.2| | |`hipsparseSpruneDense2csrByPercentage_bufferSizeExt`|3.9.0|6.1.0| | | | +|`cusparseSpruneDense2csrNnz`|9.0|12.2| | |`hipsparseSpruneDense2csrNnz`|3.9.0|6.1.0| | | | +|`cusparseSpruneDense2csrNnzByPercentage`|9.0|12.2| | |`hipsparseSpruneDense2csrNnzByPercentage`|3.9.0|6.1.0| | | | |`cusparseSpruneDense2csr_bufferSizeExt`|9.0|12.2| | |`hipsparseSpruneDense2csr_bufferSizeExt`|3.9.0| | | | | |`cusparseXcoo2csr`| | | | |`hipsparseXcoo2csr`|1.9.2| | | | | |`cusparseXcoosortByColumn`| | | | |`hipsparseXcoosortByColumn`|1.9.2| | | | | @@ -770,14 +770,14 @@ |`cusparseZcsr2bsr`| | | | |`hipsparseZcsr2bsr`|3.5.0| | | | | |`cusparseZcsr2csc`| |10.2| |11.0|`hipsparseZcsr2csc`|3.1.0| | | | | |`cusparseZcsr2csr_compress`|8.0|12.2| | |`hipsparseZcsr2csr_compress`|3.5.0| | | | | -|`cusparseZcsr2csru`| |12.2| | |`hipsparseZcsr2csru`|4.2.0| | | | | +|`cusparseZcsr2csru`| |12.2| | |`hipsparseZcsr2csru`|4.2.0|6.1.0| | | | |`cusparseZcsr2dense`| |11.1| |12.0|`hipsparseZcsr2dense`|3.5.0| | | | | |`cusparseZcsr2gebsr`| | | | |`hipsparseZcsr2gebsr`|4.1.0| | | | | |`cusparseZcsr2gebsr_bufferSize`| | | | |`hipsparseZcsr2gebsr_bufferSize`|4.1.0| | | | | |`cusparseZcsr2gebsr_bufferSizeExt`| | | | | | | | | | | |`cusparseZcsr2hyb`| |10.2| |11.0|`hipsparseZcsr2hyb`|3.1.0| | | | | -|`cusparseZcsru2csr`| |12.2| | |`hipsparseZcsru2csr`|4.2.0| | | | | -|`cusparseZcsru2csr_bufferSizeExt`| |12.2| | |`hipsparseZcsru2csr_bufferSizeExt`|4.2.0| | | | | +|`cusparseZcsru2csr`| |12.2| | |`hipsparseZcsru2csr`|4.2.0|6.1.0| | | | +|`cusparseZcsru2csr_bufferSizeExt`| |12.2| | |`hipsparseZcsru2csr_bufferSizeExt`|4.2.0|6.1.0| | | | |`cusparseZdense2csc`| |11.1| |12.0|`hipsparseZdense2csc`|3.5.0| | | | | |`cusparseZdense2csr`| |11.1| |12.0|`hipsparseZdense2csr`|3.5.0| | | | | |`cusparseZdense2hyb`| |10.2| |11.0| | | | | | | @@ -792,7 +792,7 @@ |`cusparseZhyb2csr`| |10.2| 
|11.0|`hipsparseZhyb2csr`|3.1.0| | | | | |`cusparseZhyb2dense`| |10.2| |11.0| | | | | | | |`cusparseZnnz`| | | | |`hipsparseZnnz`|3.2.0| | | | | -|`cusparseZnnz_compress`|8.0|12.2| | |`hipsparseZnnz_compress`|3.5.0| | | | | +|`cusparseZnnz_compress`|8.0|12.2| | |`hipsparseZnnz_compress`|3.5.0|6.1.0| | | | ## **15. CUSPARSE Generic API Reference** @@ -803,7 +803,7 @@ |`cusparseBsrSetStridedBatch`|12.1| | | | | | | | | | |`cusparseConstBlockedEllGet`|12.0| | | |`hipsparseConstBlockedEllGet`|6.0.0| | | | | |`cusparseConstCooGet`|12.0| | | |`hipsparseConstCooGet`|6.0.0| | | | | -|`cusparseConstCscGet`|12.0| | | | | | | | | | +|`cusparseConstCscGet`|12.0| | | |`hipsparseConstCscGet`|6.1.0| | | |6.1.0| |`cusparseConstCsrGet`|12.0| | | |`hipsparseConstCsrGet`|6.0.0| | | | | |`cusparseConstDnMatGet`|12.0| | | |`hipsparseConstDnMatGet`|6.0.0| | | | | |`cusparseConstDnMatGetValues`|12.0| | | |`hipsparseConstDnMatGetValues`|6.0.0| | | | | @@ -837,7 +837,7 @@ |`cusparseCreateDnVec`|10.2| | | |`hipsparseCreateDnVec`|4.1.0| | | | | |`cusparseCreateSlicedEll`|12.1| | | | | | | | | | |`cusparseCreateSpVec`|10.2| | | |`hipsparseCreateSpVec`|4.1.0| | | | | -|`cusparseCscGet`|11.7| | | | | | | | | | +|`cusparseCscGet`|11.7| | | |`hipsparseCscGet`|6.1.0| | | |6.1.0| |`cusparseCscSetPointers`|11.1| | | |`hipsparseCscSetPointers`|4.2.0| | | | | |`cusparseCsrGet`|10.2| | | |`hipsparseCsrGet`|4.1.0| | | | | |`cusparseCsrSetPointers`|11.0| | | |`hipsparseCsrSetPointers`|4.1.0| | | | | @@ -858,7 +858,7 @@ |`cusparseDnVecGetValues`|10.2| | | |`hipsparseDnVecGetValues`|4.1.0| | | | | |`cusparseDnVecSetValues`|10.2| | | |`hipsparseDnVecSetValues`|4.1.0| | | | | |`cusparseGather`|11.0| |12.0| |`hipsparseGather`|4.1.0| |6.0.0| | | -|`cusparseRot`|11.0|12.2| | |`hipsparseRot`|4.1.0| | | | | +|`cusparseRot`|11.0|12.2| | |`hipsparseRot`|4.1.0|6.1.0| | | | |`cusparseSDDMM`|11.2| |12.0| |`hipsparseSDDMM`|4.3.0| |6.0.0| | | |`cusparseSDDMM_bufferSize`|11.2| |12.0| |`hipsparseSDDMM_bufferSize`|4.3.0| 
|6.0.0| | | |`cusparseSDDMM_preprocess`|11.2| |12.0| |`hipsparseSDDMM_preprocess`|4.3.0| |6.0.0| | | @@ -880,8 +880,8 @@ |`cusparseSpMMOp_destroyPlan`|11.5| | | | | | | | | | |`cusparseSpMM_bufferSize`|10.1| |12.0| |`hipsparseSpMM_bufferSize`|4.2.0| |6.0.0| | | |`cusparseSpMM_preprocess`|11.2| |12.0| |`hipsparseSpMM_preprocess`|4.5.0| |6.0.0| | | -|`cusparseSpMV`|10.2| |12.0| |`hipsparseSpMV`|4.1.0| |6.0.0| | | -|`cusparseSpMV_bufferSize`|10.2| |12.0| |`hipsparseSpMV_bufferSize`|4.1.0| |6.0.0| | | +|`cusparseSpMV`|10.1| |12.0| |`hipsparseSpMV`|4.1.0| |6.0.0| | | +|`cusparseSpMV_bufferSize`|10.1| |12.0| |`hipsparseSpMV_bufferSize`|4.1.0| |6.0.0| | | |`cusparseSpMatGetAttribute`|11.3| |12.0| |`hipsparseSpMatGetAttribute`|4.5.0| |6.0.0| | | |`cusparseSpMatGetFormat`|10.1| |12.0| |`hipsparseSpMatGetFormat`|4.1.0| |6.0.0| | | |`cusparseSpMatGetIndexBase`|10.1| |12.0| |`hipsparseSpMatGetIndexBase`|4.1.0| |6.0.0| | | @@ -904,8 +904,8 @@ |`cusparseSpSV_destroyDescr`|11.3| | | |`hipsparseSpSV_destroyDescr`|4.5.0| | | | | |`cusparseSpSV_solve`|11.3| |12.0| |`hipsparseSpSV_solve`|4.5.0| |6.0.0| | | |`cusparseSpSV_updateMatrix`|12.1| | | | | | | | | | -|`cusparseSpVV`|10.2| |12.0| |`hipsparseSpVV`|4.1.0| |6.0.0| | | -|`cusparseSpVV_bufferSize`|10.2| |12.0| |`hipsparseSpVV_bufferSize`|4.1.0| |6.0.0| | | +|`cusparseSpVV`|10.1| |12.0| |`hipsparseSpVV`|4.1.0| |6.0.0| | | +|`cusparseSpVV_bufferSize`|10.1| |12.0| |`hipsparseSpVV_bufferSize`|4.1.0| |6.0.0| | | |`cusparseSpVecGet`|10.2| | | |`hipsparseSpVecGet`|4.1.0| | | | | |`cusparseSpVecGetIndexBase`|10.2| |12.0| |`hipsparseSpVecGetIndexBase`|4.1.0| |6.0.0| | | |`cusparseSpVecGetValues`|10.2| | | |`hipsparseSpVecGetValues`|4.1.0| | | | | diff --git a/docs/tables/CUSPARSE_API_supported_by_HIP_and_ROC.md b/docs/tables/CUSPARSE_API_supported_by_HIP_and_ROC.md index 45890e96..b80891da 100644 --- a/docs/tables/CUSPARSE_API_supported_by_HIP_and_ROC.md +++ b/docs/tables/CUSPARSE_API_supported_by_HIP_and_ROC.md @@ -221,33 +221,33 @@ 
|**CUDA**|**A**|**D**|**C**|**R**|**HIP**|**A**|**D**|**C**|**R**|**E**|**ROC**|**A**|**D**|**C**|**R**|**E**| |:--|:-:|:-:|:-:|:-:|:--|:-:|:-:|:-:|:-:|:-:|:--|:-:|:-:|:-:|:-:|:-:| |`cusparseCopyMatDescr`|8.0| | |12.0|`hipsparseCopyMatDescr`|1.9.2| | | | |`rocsparse_copy_mat_descr`|1.9.0| | | | | -|`cusparseCreateBsric02Info`| |12.2| | |`hipsparseCreateBsric02Info`|3.8.0| | | | |`rocsparse_create_mat_info`|1.9.0| | | | | -|`cusparseCreateBsrilu02Info`| |12.2| | |`hipsparseCreateBsrilu02Info`|3.9.0| | | | |`rocsparse_create_mat_info`|1.9.0| | | | | -|`cusparseCreateBsrsm2Info`| |12.2| | |`hipsparseCreateBsrsm2Info`|4.5.0| | | | |`rocsparse_create_mat_info`|1.9.0| | | | | -|`cusparseCreateBsrsv2Info`| |12.2| | |`hipsparseCreateBsrsv2Info`|3.6.0| | | | |`rocsparse_create_mat_info`|1.9.0| | | | | -|`cusparseCreateColorInfo`| |12.2| | |`hipsparseCreateColorInfo`|4.5.0| | | | |`rocsparse_create_color_info`|4.5.0| | | | | +|`cusparseCreateBsric02Info`| |12.2| | |`hipsparseCreateBsric02Info`|3.8.0|6.1.0| | | |`rocsparse_create_mat_info`|1.9.0| | | | | +|`cusparseCreateBsrilu02Info`| |12.2| | |`hipsparseCreateBsrilu02Info`|3.9.0|6.1.0| | | |`rocsparse_create_mat_info`|1.9.0| | | | | +|`cusparseCreateBsrsm2Info`| |12.2| | |`hipsparseCreateBsrsm2Info`|4.5.0|6.1.0| | | |`rocsparse_create_mat_info`|1.9.0| | | | | +|`cusparseCreateBsrsv2Info`| |12.2| | |`hipsparseCreateBsrsv2Info`|3.6.0|6.1.0| | | |`rocsparse_create_mat_info`|1.9.0| | | | | +|`cusparseCreateColorInfo`| |12.2| | |`hipsparseCreateColorInfo`|4.5.0|6.1.0| | | |`rocsparse_create_color_info`|4.5.0| | | | | |`cusparseCreateCsrgemm2Info`| |11.0| |12.0|`hipsparseCreateCsrgemm2Info`|2.8.0| | | | |`rocsparse_create_mat_info`|1.9.0| | | | | -|`cusparseCreateCsric02Info`| |12.2| | |`hipsparseCreateCsric02Info`|3.1.0| | | | |`rocsparse_create_mat_info`|1.9.0| | | | | -|`cusparseCreateCsrilu02Info`| |12.2| | |`hipsparseCreateCsrilu02Info`|1.9.2| | | | |`rocsparse_create_mat_info`|1.9.0| | | | | +|`cusparseCreateCsric02Info`| 
|12.2| | |`hipsparseCreateCsric02Info`|3.1.0|6.1.0| | | |`rocsparse_create_mat_info`|1.9.0| | | | | +|`cusparseCreateCsrilu02Info`| |12.2| | |`hipsparseCreateCsrilu02Info`|1.9.2|6.1.0| | | |`rocsparse_create_mat_info`|1.9.0| | | | | |`cusparseCreateCsrsm2Info`|9.2|11.3| |12.0|`hipsparseCreateCsrsm2Info`|3.1.0| | | | |`rocsparse_create_mat_info`|1.9.0| | | | | |`cusparseCreateCsrsv2Info`| |11.3| |12.0|`hipsparseCreateCsrsv2Info`|1.9.2| | | | |`rocsparse_create_mat_info`|1.9.0| | | | | |`cusparseCreateHybMat`| |10.2| |11.0|`hipsparseCreateHybMat`|1.9.2| | | | |`rocsparse_create_hyb_mat`|1.9.0| | | | | |`cusparseCreateMatDescr`| | | | |`hipsparseCreateMatDescr`|1.9.2| | | | |`rocsparse_create_mat_descr`|1.9.0| | | | | -|`cusparseCreatePruneInfo`|9.0|12.2| | |`hipsparseCreatePruneInfo`|3.9.0| | | | |`rocsparse_create_mat_info`|1.9.0| | | | | +|`cusparseCreatePruneInfo`|9.0|12.2| | |`hipsparseCreatePruneInfo`|3.9.0|6.1.0| | | |`rocsparse_create_mat_info`|1.9.0| | | | | |`cusparseCreateSolveAnalysisInfo`| |10.2| |11.0| | | | | | | | | | | | | -|`cusparseDestroyBsric02Info`| |12.2| | |`hipsparseDestroyBsric02Info`|3.8.0| | | | |`rocsparse_destroy_mat_info`|1.9.0| | | | | -|`cusparseDestroyBsrilu02Info`| |12.2| | |`hipsparseDestroyBsrilu02Info`|3.9.0| | | | |`rocsparse_destroy_mat_info`|1.9.0| | | | | -|`cusparseDestroyBsrsm2Info`| |12.2| | |`hipsparseDestroyBsrsm2Info`|4.5.0| | | | |`rocsparse_destroy_mat_info`|1.9.0| | | | | -|`cusparseDestroyBsrsv2Info`| |12.2| | |`hipsparseDestroyBsrsv2Info`|3.6.0| | | | |`rocsparse_destroy_mat_info`|1.9.0| | | | | -|`cusparseDestroyColorInfo`| |12.2| | |`hipsparseDestroyColorInfo`|4.5.0| | | | |`rocsparse_destroy_color_info`|4.5.0| | | | | +|`cusparseDestroyBsric02Info`| |12.2| | |`hipsparseDestroyBsric02Info`|3.8.0|6.1.0| | | |`rocsparse_destroy_mat_info`|1.9.0| | | | | +|`cusparseDestroyBsrilu02Info`| |12.2| | |`hipsparseDestroyBsrilu02Info`|3.9.0|6.1.0| | | |`rocsparse_destroy_mat_info`|1.9.0| | | | | +|`cusparseDestroyBsrsm2Info`| 
|12.2| | |`hipsparseDestroyBsrsm2Info`|4.5.0|6.1.0| | | |`rocsparse_destroy_mat_info`|1.9.0| | | | | +|`cusparseDestroyBsrsv2Info`| |12.2| | |`hipsparseDestroyBsrsv2Info`|3.6.0|6.1.0| | | |`rocsparse_destroy_mat_info`|1.9.0| | | | | +|`cusparseDestroyColorInfo`| |12.2| | |`hipsparseDestroyColorInfo`|4.5.0|6.1.0| | | |`rocsparse_destroy_color_info`|4.5.0| | | | | |`cusparseDestroyCsrgemm2Info`| |11.0| |12.0|`hipsparseDestroyCsrgemm2Info`|2.8.0| | | | |`rocsparse_destroy_mat_info`|1.9.0| | | | | -|`cusparseDestroyCsric02Info`| |12.2| | |`hipsparseDestroyCsric02Info`|3.1.0| | | | |`rocsparse_destroy_mat_info`|1.9.0| | | | | -|`cusparseDestroyCsrilu02Info`| |12.2| | |`hipsparseDestroyCsrilu02Info`|1.9.2| | | | |`rocsparse_destroy_mat_info`|1.9.0| | | | | +|`cusparseDestroyCsric02Info`| |12.2| | |`hipsparseDestroyCsric02Info`|3.1.0|6.1.0| | | |`rocsparse_destroy_mat_info`|1.9.0| | | | | +|`cusparseDestroyCsrilu02Info`| |12.2| | |`hipsparseDestroyCsrilu02Info`|1.9.2|6.1.0| | | |`rocsparse_destroy_mat_info`|1.9.0| | | | | |`cusparseDestroyCsrsm2Info`|9.2|11.3| |12.0|`hipsparseDestroyCsrsm2Info`|3.1.0| | | | |`rocsparse_destroy_mat_info`|1.9.0| | | | | |`cusparseDestroyCsrsv2Info`| |11.3| |12.0|`hipsparseDestroyCsrsv2Info`|1.9.2| | | | |`rocsparse_destroy_mat_info`|1.9.0| | | | | |`cusparseDestroyHybMat`| |10.2| |11.0|`hipsparseDestroyHybMat`|1.9.2| | | | |`rocsparse_destroy_hyb_mat`|1.9.0| | | | | |`cusparseDestroyMatDescr`| | | | |`hipsparseDestroyMatDescr`|1.9.2| | | | |`rocsparse_destroy_mat_descr`|1.9.0| | | | | -|`cusparseDestroyPruneInfo`|9.0|12.2| | |`hipsparseDestroyPruneInfo`|3.9.0| | | | |`rocsparse_destroy_mat_info`|1.9.0| | | | | +|`cusparseDestroyPruneInfo`|9.0|12.2| | |`hipsparseDestroyPruneInfo`|3.9.0|6.1.0| | | |`rocsparse_destroy_mat_info`|1.9.0| | | | | |`cusparseDestroySolveAnalysisInfo`| |10.2| |11.0| | | | | | | | | | | | | |`cusparseGetLevelInfo`| | | |11.0| | | | | | | | | | | | | |`cusparseGetMatDiagType`| | | | |`hipsparseGetMatDiagType`|1.9.2| | 
| | |`rocsparse_get_mat_diag_type`|1.9.0| | | | | @@ -293,11 +293,11 @@ |**CUDA**|**A**|**D**|**C**|**R**|**HIP**|**A**|**D**|**C**|**R**|**E**|**ROC**|**A**|**D**|**C**|**R**|**E**| |:--|:-:|:-:|:-:|:-:|:--|:-:|:-:|:-:|:-:|:-:|:--|:-:|:-:|:-:|:-:|:-:| |`cusparseCbsrmv`| | | | |`hipsparseCbsrmv`|3.5.0| | | | |`rocsparse_cbsrmv`|3.5.0|5.4.0| | | | -|`cusparseCbsrsv2_analysis`| |12.2| | |`hipsparseCbsrsv2_analysis`|3.6.0| | | | |`rocsparse_cbsrsv_analysis`|3.6.0| | | | | -|`cusparseCbsrsv2_bufferSize`| |12.2| | |`hipsparseCbsrsv2_bufferSize`|3.6.0| | | | |`rocsparse_cbsrsv_buffer_size`|3.6.0| | | | | +|`cusparseCbsrsv2_analysis`| |12.2| | |`hipsparseCbsrsv2_analysis`|3.6.0|6.1.0| | | |`rocsparse_cbsrsv_analysis`|3.6.0| | | | | +|`cusparseCbsrsv2_bufferSize`| |12.2| | |`hipsparseCbsrsv2_bufferSize`|3.6.0|6.1.0| | | |`rocsparse_cbsrsv_buffer_size`|3.6.0| | | | | |`cusparseCbsrsv2_bufferSizeExt`| |12.2| | |`hipsparseCbsrsv2_bufferSizeExt`|3.6.0| | | | |`rocsparse_cbsrsv_buffer_size`|3.6.0| | | | | -|`cusparseCbsrsv2_solve`| |12.2| | |`hipsparseCbsrsv2_solve`|3.6.0| | | | |`rocsparse_cbsrsv_solve`|3.6.0| | | | | -|`cusparseCbsrxmv`| |12.2| | |`hipsparseCbsrxmv`|4.5.0| | | | |`rocsparse_cbsrxmv`|4.5.0| | | | | +|`cusparseCbsrsv2_solve`| |12.2| | |`hipsparseCbsrsv2_solve`|3.6.0|6.1.0| | | |`rocsparse_cbsrsv_solve`|3.6.0| | | | | +|`cusparseCbsrxmv`| |12.2| | |`hipsparseCbsrxmv`|4.5.0|6.1.0| | | |`rocsparse_cbsrxmv`|4.5.0| | | | | |`cusparseCcsrmv`| |10.2| |11.0|`hipsparseCcsrmv`|3.1.0| | | | |`rocsparse_ccsrmv`|1.9.0| | | | | |`cusparseCcsrmv_mp`|8.0|10.2| |11.0| | | | | | | | | | | | | |`cusparseCcsrsv2_analysis`| |11.3| |12.0|`hipsparseCcsrsv2_analysis`|3.1.0| | | | |`rocsparse_ccsrsv_analysis`|2.10.0| | | | | @@ -316,11 +316,11 @@ |`cusparseCsrsv_analysisEx`|8.0|10.2| |11.0| | | | | | | | | | | | | |`cusparseCsrsv_solveEx`|8.0|10.2| |11.0| | | | | | | | | | | | | |`cusparseDbsrmv`| | | | |`hipsparseDbsrmv`|3.5.0| | | | |`rocsparse_dbsrmv`|3.5.0|5.4.0| | | | 
-|`cusparseDbsrsv2_analysis`| |12.2| | |`hipsparseDbsrsv2_analysis`|3.6.0| | | | |`rocsparse_dbsrsv_analysis`|3.6.0| | | | | -|`cusparseDbsrsv2_bufferSize`| |12.2| | |`hipsparseDbsrsv2_bufferSize`|3.6.0| | | | |`rocsparse_dbsrsv_buffer_size`|3.6.0| | | | | +|`cusparseDbsrsv2_analysis`| |12.2| | |`hipsparseDbsrsv2_analysis`|3.6.0|6.1.0| | | |`rocsparse_dbsrsv_analysis`|3.6.0| | | | | +|`cusparseDbsrsv2_bufferSize`| |12.2| | |`hipsparseDbsrsv2_bufferSize`|3.6.0|6.1.0| | | |`rocsparse_dbsrsv_buffer_size`|3.6.0| | | | | |`cusparseDbsrsv2_bufferSizeExt`| |12.2| | |`hipsparseDbsrsv2_bufferSizeExt`|3.6.0| | | | |`rocsparse_dbsrsv_buffer_size`|3.6.0| | | | | -|`cusparseDbsrsv2_solve`| |12.2| | |`hipsparseDbsrsv2_solve`|3.6.0| | | | |`rocsparse_dbsrsv_solve`|3.6.0| | | | | -|`cusparseDbsrxmv`| |12.2| | |`hipsparseDbsrxmv`|4.5.0| | | | |`rocsparse_dbsrxmv`|4.5.0| | | | | +|`cusparseDbsrsv2_solve`| |12.2| | |`hipsparseDbsrsv2_solve`|3.6.0|6.1.0| | | |`rocsparse_dbsrsv_solve`|3.6.0| | | | | +|`cusparseDbsrxmv`| |12.2| | |`hipsparseDbsrxmv`|4.5.0|6.1.0| | | |`rocsparse_dbsrxmv`|4.5.0| | | | | |`cusparseDcsrmv`| |10.2| |11.0|`hipsparseDcsrmv`|1.9.2| | | | |`rocsparse_dcsrmv`|1.9.0| | | | | |`cusparseDcsrmv_mp`|8.0|10.2| |11.0| | | | | | | | | | | | | |`cusparseDcsrsv2_analysis`| |11.3| |12.0|`hipsparseDcsrsv2_analysis`|1.9.2| | | | |`rocsparse_dcsrsv_analysis`|1.9.0| | | | | @@ -335,11 +335,11 @@ |`cusparseDhybsv_analysis`| |10.2| |11.0| | | | | | | | | | | | | |`cusparseDhybsv_solve`| |10.2| |11.0| | | | | | | | | | | | | |`cusparseSbsrmv`| | | | |`hipsparseSbsrmv`|3.5.0| | | | |`rocsparse_sbsrmv`|3.5.0|5.4.0| | | | -|`cusparseSbsrsv2_analysis`| |12.2| | |`hipsparseSbsrsv2_analysis`|3.6.0| | | | |`rocsparse_sbsrsv_analysis`|3.6.0| | | | | -|`cusparseSbsrsv2_bufferSize`| |12.2| | |`hipsparseSbsrsv2_bufferSize`|3.6.0| | | | |`rocsparse_sbsrsv_buffer_size`|3.6.0| | | | | +|`cusparseSbsrsv2_analysis`| |12.2| | |`hipsparseSbsrsv2_analysis`|3.6.0|6.1.0| | | 
|`rocsparse_sbsrsv_analysis`|3.6.0| | | | | +|`cusparseSbsrsv2_bufferSize`| |12.2| | |`hipsparseSbsrsv2_bufferSize`|3.6.0|6.1.0| | | |`rocsparse_sbsrsv_buffer_size`|3.6.0| | | | | |`cusparseSbsrsv2_bufferSizeExt`| |12.2| | |`hipsparseSbsrsv2_bufferSizeExt`|3.6.0| | | | |`rocsparse_sbsrsv_buffer_size`|3.6.0| | | | | -|`cusparseSbsrsv2_solve`| |12.2| | |`hipsparseSbsrsv2_solve`|3.6.0| | | | |`rocsparse_sbsrsv_solve`|3.6.0| | | | | -|`cusparseSbsrxmv`| |12.2| | |`hipsparseSbsrxmv`|4.5.0| | | | |`rocsparse_sbsrxmv`|4.5.0| | | | | +|`cusparseSbsrsv2_solve`| |12.2| | |`hipsparseSbsrsv2_solve`|3.6.0|6.1.0| | | |`rocsparse_sbsrsv_solve`|3.6.0| | | | | +|`cusparseSbsrxmv`| |12.2| | |`hipsparseSbsrxmv`|4.5.0|6.1.0| | | |`rocsparse_sbsrxmv`|4.5.0| | | | | |`cusparseScsrmv`| |10.2| |11.0|`hipsparseScsrmv`|1.9.2| | | | |`rocsparse_scsrmv`|1.9.0| | | | | |`cusparseScsrmv_mp`|8.0|10.2| |11.0| | | | | | | | | | | | | |`cusparseScsrsv2_analysis`| |11.3| |12.0|`hipsparseScsrsv2_analysis`|1.9.2| | | | |`rocsparse_scsrsv_analysis`|1.9.0| | | | | @@ -353,14 +353,14 @@ |`cusparseShybmv`| |10.2| |11.0|`hipsparseShybmv`|1.9.2| | | | |`rocsparse_shybmv`|1.9.0| | | | | |`cusparseShybsv_analysis`| |10.2| |11.0| | | | | | | | | | | | | |`cusparseShybsv_solve`| |10.2| |11.0| | | | | | | | | | | | | -|`cusparseXbsrsv2_zeroPivot`| |12.2| | |`hipsparseXbsrsv2_zeroPivot`|3.6.0| | | | |`rocsparse_bsrsv_zero_pivot`|3.6.0| | | | | +|`cusparseXbsrsv2_zeroPivot`| |12.2| | |`hipsparseXbsrsv2_zeroPivot`|3.6.0|6.1.0| | | |`rocsparse_bsrsv_zero_pivot`|3.6.0| | | | | |`cusparseXcsrsv2_zeroPivot`| |11.3| |12.0|`hipsparseXcsrsv2_zeroPivot`|1.9.2| | | | |`rocsparse_csrsv_zero_pivot`|1.9.0| | | | | |`cusparseZbsrmv`| | | | |`hipsparseZbsrmv`|3.5.0| | | | |`rocsparse_zbsrmv`|3.5.0|5.4.0| | | | -|`cusparseZbsrsv2_analysis`| |12.2| | |`hipsparseZbsrsv2_analysis`|3.6.0| | | | |`rocsparse_zbsrsv_analysis`|3.6.0| | | | | -|`cusparseZbsrsv2_bufferSize`| |12.2| | |`hipsparseZbsrsv2_bufferSize`|3.6.0| | | | 
|`rocsparse_zbsrsv_buffer_size`|3.6.0| | | | | +|`cusparseZbsrsv2_analysis`| |12.2| | |`hipsparseZbsrsv2_analysis`|3.6.0|6.1.0| | | |`rocsparse_zbsrsv_analysis`|3.6.0| | | | | +|`cusparseZbsrsv2_bufferSize`| |12.2| | |`hipsparseZbsrsv2_bufferSize`|3.6.0|6.1.0| | | |`rocsparse_zbsrsv_buffer_size`|3.6.0| | | | | |`cusparseZbsrsv2_bufferSizeExt`| |12.2| | |`hipsparseZbsrsv2_bufferSizeExt`|3.6.0| | | | |`rocsparse_zbsrsv_buffer_size`|3.6.0| | | | | -|`cusparseZbsrsv2_solve`| |12.2| | |`hipsparseZbsrsv2_solve`|3.6.0| | | | |`rocsparse_zbsrsv_solve`|3.6.0| | | | | -|`cusparseZbsrxmv`| |12.2| | |`hipsparseZbsrxmv`|4.5.0| | | | |`rocsparse_zbsrxmv`|4.5.0| | | | | +|`cusparseZbsrsv2_solve`| |12.2| | |`hipsparseZbsrsv2_solve`|3.6.0|6.1.0| | | |`rocsparse_zbsrsv_solve`|3.6.0| | | | | +|`cusparseZbsrxmv`| |12.2| | |`hipsparseZbsrxmv`|4.5.0|6.1.0| | | |`rocsparse_zbsrxmv`|4.5.0| | | | | |`cusparseZcsrmv`| |10.2| |11.0|`hipsparseZcsrmv`|3.1.0| | | | |`rocsparse_zcsrmv`|1.9.0| | | | | |`cusparseZcsrmv_mp`|8.0|10.2| |11.0| | | | | | | | | | | | | |`cusparseZcsrsv2_analysis`| |11.3| |12.0|`hipsparseZcsrsv2_analysis`|3.1.0| | | | |`rocsparse_zcsrsv_analysis`|2.10.0| | | | | @@ -380,10 +380,10 @@ |**CUDA**|**A**|**D**|**C**|**R**|**HIP**|**A**|**D**|**C**|**R**|**E**|**ROC**|**A**|**D**|**C**|**R**|**E**| |:--|:-:|:-:|:-:|:-:|:--|:-:|:-:|:-:|:-:|:-:|:--|:-:|:-:|:-:|:-:|:-:| |`cusparseCbsrmm`| | | | |`hipsparseCbsrmm`|3.7.0| | | | |`rocsparse_cbsrmm`|3.7.0| | | | | -|`cusparseCbsrsm2_analysis`| |12.2| | |`hipsparseCbsrsm2_analysis`|4.5.0| | | | |`rocsparse_cbsrsm_analysis`|3.6.0| | | | | -|`cusparseCbsrsm2_bufferSize`| |12.2| | |`hipsparseCbsrsm2_bufferSize`|4.5.0| | | | |`rocsparse_cbsrsm_buffer_size`|4.5.0| | | | | +|`cusparseCbsrsm2_analysis`| |12.2| | |`hipsparseCbsrsm2_analysis`|4.5.0|6.1.0| | | |`rocsparse_cbsrsm_analysis`|3.6.0| | | | | +|`cusparseCbsrsm2_bufferSize`| |12.2| | |`hipsparseCbsrsm2_bufferSize`|4.5.0|6.1.0| | | |`rocsparse_cbsrsm_buffer_size`|4.5.0| | | | | 
|`cusparseCbsrsm2_bufferSizeExt`| |12.2| | | | | | | | | | | | | | | -|`cusparseCbsrsm2_solve`| |12.2| | |`hipsparseCbsrsm2_solve`|4.5.0| | | | |`rocsparse_cbsrsm_solve`|4.5.0| | | | | +|`cusparseCbsrsm2_solve`| |12.2| | |`hipsparseCbsrsm2_solve`|4.5.0|6.1.0| | | |`rocsparse_cbsrsm_solve`|4.5.0| | | | | |`cusparseCcsrmm`| |10.2| |11.0|`hipsparseCcsrmm`|3.1.0| | | | |`rocsparse_ccsrmm`|1.9.0| | | | | |`cusparseCcsrmm2`| |10.2| |11.0|`hipsparseCcsrmm2`|3.1.0| | | | |`rocsparse_ccsrmm`|1.9.0| | | | | |`cusparseCcsrsm2_analysis`|9.2|11.3| |12.0|`hipsparseCcsrsm2_analysis`|3.1.0| | | | |`rocsparse_ccsrsm_analysis`|3.1.0| | | | | @@ -393,10 +393,10 @@ |`cusparseCcsrsm_solve`| |10.2| |11.0| | | | | | | | | | | | | |`cusparseCgemmi`|8.0|11.0| |12.0|`hipsparseCgemmi`|3.7.0| | | | | | | | | | | |`cusparseDbsrmm`| | | | |`hipsparseDbsrmm`|3.7.0| | | | |`rocsparse_dbsrmm`|3.7.0| | | | | -|`cusparseDbsrsm2_analysis`| |12.2| | |`hipsparseDbsrsm2_analysis`|4.5.0| | | | |`rocsparse_dbsrsm_analysis`|3.6.0| | | | | -|`cusparseDbsrsm2_bufferSize`| |12.2| | |`hipsparseDbsrsm2_bufferSize`|4.5.0| | | | |`rocsparse_dbsrsm_buffer_size`|4.5.0| | | | | +|`cusparseDbsrsm2_analysis`| |12.2| | |`hipsparseDbsrsm2_analysis`|4.5.0|6.1.0| | | |`rocsparse_dbsrsm_analysis`|3.6.0| | | | | +|`cusparseDbsrsm2_bufferSize`| |12.2| | |`hipsparseDbsrsm2_bufferSize`|4.5.0|6.1.0| | | |`rocsparse_dbsrsm_buffer_size`|4.5.0| | | | | |`cusparseDbsrsm2_bufferSizeExt`| |12.2| | | | | | | | | | | | | | | -|`cusparseDbsrsm2_solve`| |12.2| | |`hipsparseDbsrsm2_solve`|4.5.0| | | | |`rocsparse_dbsrsm_solve`|4.5.0| | | | | +|`cusparseDbsrsm2_solve`| |12.2| | |`hipsparseDbsrsm2_solve`|4.5.0|6.1.0| | | |`rocsparse_dbsrsm_solve`|4.5.0| | | | | |`cusparseDcsrmm`| |10.2| |11.0|`hipsparseDcsrmm`|1.9.2| | | | |`rocsparse_dcsrmm`|1.9.0| | | | | |`cusparseDcsrmm2`| |10.2| |11.0|`hipsparseDcsrmm2`|1.9.2| | | | |`rocsparse_dcsrmm`|1.9.0| | | | | |`cusparseDcsrsm2_analysis`|9.2|11.3| |12.0|`hipsparseDcsrsm2_analysis`|3.1.0| | | | 
|`rocsparse_dcsrsm_analysis`|3.1.0| | | | | @@ -406,10 +406,10 @@ |`cusparseDcsrsm_solve`| |10.2| |11.0| | | | | | | | | | | | | |`cusparseDgemmi`|8.0|11.0| |12.0|`hipsparseDgemmi`|3.7.0| | | | | | | | | | | |`cusparseSbsrmm`| | | | |`hipsparseSbsrmm`|3.7.0| | | | |`rocsparse_sbsrmm`|3.7.0| | | | | -|`cusparseSbsrsm2_analysis`| |12.2| | |`hipsparseSbsrsm2_analysis`|4.5.0| | | | |`rocsparse_sbsrsm_analysis`|3.6.0| | | | | -|`cusparseSbsrsm2_bufferSize`| |12.2| | |`hipsparseSbsrsm2_bufferSize`|4.5.0| | | | |`rocsparse_sbsrsm_buffer_size`|4.5.0| | | | | +|`cusparseSbsrsm2_analysis`| |12.2| | |`hipsparseSbsrsm2_analysis`|4.5.0|6.1.0| | | |`rocsparse_sbsrsm_analysis`|3.6.0| | | | | +|`cusparseSbsrsm2_bufferSize`| |12.2| | |`hipsparseSbsrsm2_bufferSize`|4.5.0|6.1.0| | | |`rocsparse_sbsrsm_buffer_size`|4.5.0| | | | | |`cusparseSbsrsm2_bufferSizeExt`| |12.2| | | | | | | | | | | | | | | -|`cusparseSbsrsm2_solve`| |12.2| | |`hipsparseSbsrsm2_solve`|4.5.0| | | | |`rocsparse_sbsrsm_solve`|4.5.0| | | | | +|`cusparseSbsrsm2_solve`| |12.2| | |`hipsparseSbsrsm2_solve`|4.5.0|6.1.0| | | |`rocsparse_sbsrsm_solve`|4.5.0| | | | | |`cusparseScsrmm`| |10.2| |11.0|`hipsparseScsrmm`|1.9.2| | | | |`rocsparse_scsrmm`|1.9.0| | | | | |`cusparseScsrmm2`| |10.2| |11.0|`hipsparseScsrmm2`|1.9.2| | | | |`rocsparse_scsrmm`|1.9.0| | | | | |`cusparseScsrsm2_analysis`|9.2|11.3| |12.0|`hipsparseScsrsm2_analysis`|3.1.0| | | | |`rocsparse_scsrsm_analysis`|3.1.0| | | | | @@ -418,13 +418,13 @@ |`cusparseScsrsm_analysis`| |10.2| |11.0| | | | | | | | | | | | | |`cusparseScsrsm_solve`| |10.2| |11.0| | | | | | | | | | | | | |`cusparseSgemmi`|8.0|11.0| |12.0|`hipsparseSgemmi`|3.7.0| | | | | | | | | | | -|`cusparseXbsrsm2_zeroPivot`| |12.2| | |`hipsparseXbsrsm2_zeroPivot`|4.5.0| | | | |`rocsparse_bsrsm_zero_pivot`|4.5.0| | | | | +|`cusparseXbsrsm2_zeroPivot`| |12.2| | |`hipsparseXbsrsm2_zeroPivot`|4.5.0|6.1.0| | | |`rocsparse_bsrsm_zero_pivot`|4.5.0| | | | | |`cusparseXcsrsm2_zeroPivot`|9.2|11.3| 
|12.0|`hipsparseXcsrsm2_zeroPivot`|3.1.0| | | | |`rocsparse_csrsm_zero_pivot`|3.1.0| | | | | |`cusparseZbsrmm`| | | | |`hipsparseZbsrmm`|3.7.0| | | | |`rocsparse_zbsrmm`|3.7.0| | | | | -|`cusparseZbsrsm2_analysis`| |12.2| | |`hipsparseZbsrsm2_analysis`|4.5.0| | | | |`rocsparse_zbsrsm_analysis`|3.6.0| | | | | -|`cusparseZbsrsm2_bufferSize`| |12.2| | |`hipsparseZbsrsm2_bufferSize`|4.5.0| | | | |`rocsparse_zbsrsm_buffer_size`|4.5.0| | | | | +|`cusparseZbsrsm2_analysis`| |12.2| | |`hipsparseZbsrsm2_analysis`|4.5.0|6.1.0| | | |`rocsparse_zbsrsm_analysis`|3.6.0| | | | | +|`cusparseZbsrsm2_bufferSize`| |12.2| | |`hipsparseZbsrsm2_bufferSize`|4.5.0|6.1.0| | | |`rocsparse_zbsrsm_buffer_size`|4.5.0| | | | | |`cusparseZbsrsm2_bufferSizeExt`| |12.2| | | | | | | | | | | | | | | -|`cusparseZbsrsm2_solve`| |12.2| | |`hipsparseZbsrsm2_solve`|4.5.0| | | | |`rocsparse_zbsrsm_solve`|4.5.0| | | | | +|`cusparseZbsrsm2_solve`| |12.2| | |`hipsparseZbsrsm2_solve`|4.5.0|6.1.0| | | |`rocsparse_zbsrsm_solve`|4.5.0| | | | | |`cusparseZcsrmm`| |10.2| |11.0|`hipsparseZcsrmm`|3.1.0| | | | |`rocsparse_zcsrmm`|1.9.0| | | | | |`cusparseZcsrmm2`| |10.2| |11.0|`hipsparseZcsrmm2`|3.1.0| | | | |`rocsparse_zcsrmm`|1.9.0| | | | | |`cusparseZcsrsm2_analysis`|9.2|11.3| |12.0|`hipsparseZcsrsm2_analysis`|3.1.0| | | | |`rocsparse_zcsrsm_analysis`|3.1.0| | | | | @@ -471,26 +471,26 @@ |**CUDA**|**A**|**D**|**C**|**R**|**HIP**|**A**|**D**|**C**|**R**|**E**|**ROC**|**A**|**D**|**C**|**R**|**E**| |:--|:-:|:-:|:-:|:-:|:--|:-:|:-:|:-:|:-:|:-:|:--|:-:|:-:|:-:|:-:|:-:| -|`cusparseCbsric02`| |12.2| | |`hipsparseCbsric02`|3.8.0| | | | |`rocsparse_cbsric0`|3.8.0| | | | | -|`cusparseCbsric02_analysis`| |12.2| | |`hipsparseCbsric02_analysis`|3.8.0| | | | |`rocsparse_cbsric0_analysis`|3.6.0| | | | | -|`cusparseCbsric02_bufferSize`| |12.2| | |`hipsparseCbsric02_bufferSize`|3.8.0| | | | |`rocsparse_cbsric0_buffer_size`|3.8.0| | | | | +|`cusparseCbsric02`| |12.2| | |`hipsparseCbsric02`|3.8.0|6.1.0| | | 
|`rocsparse_cbsric0`|3.8.0| | | | | +|`cusparseCbsric02_analysis`| |12.2| | |`hipsparseCbsric02_analysis`|3.8.0|6.1.0| | | |`rocsparse_cbsric0_analysis`|3.6.0| | | | | +|`cusparseCbsric02_bufferSize`| |12.2| | |`hipsparseCbsric02_bufferSize`|3.8.0|6.1.0| | | |`rocsparse_cbsric0_buffer_size`|3.8.0| | | | | |`cusparseCbsric02_bufferSizeExt`| |12.2| | | | | | | | | | | | | | | -|`cusparseCbsrilu02`| |12.2| | |`hipsparseCbsrilu02`|3.9.0| | | | |`rocsparse_cbsrilu0`|3.9.0| | | | | -|`cusparseCbsrilu02_analysis`| |12.2| | |`hipsparseCbsrilu02_analysis`|3.9.0| | | | |`rocsparse_cbsrilu0_analysis`|3.6.0| | | | | -|`cusparseCbsrilu02_bufferSize`| |12.2| | |`hipsparseCbsrilu02_bufferSize`|3.9.0| | | | |`rocsparse_cbsrilu0_buffer_size`|3.8.0| | | | | +|`cusparseCbsrilu02`| |12.2| | |`hipsparseCbsrilu02`|3.9.0|6.1.0| | | |`rocsparse_cbsrilu0`|3.9.0| | | | | +|`cusparseCbsrilu02_analysis`| |12.2| | |`hipsparseCbsrilu02_analysis`|3.9.0|6.1.0| | | |`rocsparse_cbsrilu0_analysis`|3.6.0| | | | | +|`cusparseCbsrilu02_bufferSize`| |12.2| | |`hipsparseCbsrilu02_bufferSize`|3.9.0|6.1.0| | | |`rocsparse_cbsrilu0_buffer_size`|3.8.0| | | | | |`cusparseCbsrilu02_bufferSizeExt`| |12.2| | | | | | | | | | | | | | | -|`cusparseCbsrilu02_numericBoost`| |12.2| | |`hipsparseCbsrilu02_numericBoost`|3.9.0| | | | |`rocsparse_dcbsrilu0_numeric_boost`|4.5.0| | | | | +|`cusparseCbsrilu02_numericBoost`| |12.2| | |`hipsparseCbsrilu02_numericBoost`|3.9.0|6.1.0| | | |`rocsparse_dcbsrilu0_numeric_boost`|4.5.0| | | | | |`cusparseCcsric0`| |10.2| |11.0| | | | | | | | | | | | | -|`cusparseCcsric02`| |12.2| | |`hipsparseCcsric02`|3.1.0| | | | |`rocsparse_ccsric0`|3.1.0| | | | | -|`cusparseCcsric02_analysis`| |12.2| | |`hipsparseCcsric02_analysis`|3.1.0| | | | |`rocsparse_ccsric0_analysis`|3.1.0| | | | | -|`cusparseCcsric02_bufferSize`| |12.2| | |`hipsparseCcsric02_bufferSize`|3.1.0| | | | |`rocsparse_ccsric0_buffer_size`|3.1.0| | | | | +|`cusparseCcsric02`| |12.2| | |`hipsparseCcsric02`|3.1.0|6.1.0| | | 
|`rocsparse_ccsric0`|3.1.0| | | | | +|`cusparseCcsric02_analysis`| |12.2| | |`hipsparseCcsric02_analysis`|3.1.0|6.1.0| | | |`rocsparse_ccsric0_analysis`|3.1.0| | | | | +|`cusparseCcsric02_bufferSize`| |12.2| | |`hipsparseCcsric02_bufferSize`|3.1.0|6.1.0| | | |`rocsparse_ccsric0_buffer_size`|3.1.0| | | | | |`cusparseCcsric02_bufferSizeExt`| |12.2| | |`hipsparseCcsric02_bufferSizeExt`|3.1.0| | | | |`rocsparse_ccsric0_buffer_size`|3.1.0| | | | | |`cusparseCcsrilu0`| |10.2| |11.0| | | | | | | | | | | | | -|`cusparseCcsrilu02`| |12.2| | |`hipsparseCcsrilu02`|3.1.0| | | | |`rocsparse_ccsrilu0`|2.10.0| | | | | -|`cusparseCcsrilu02_analysis`| |12.2| | |`hipsparseCcsrilu02_analysis`|3.1.0| | | | |`rocsparse_ccsrilu0_analysis`|2.10.0| | | | | -|`cusparseCcsrilu02_bufferSize`| |12.2| | |`hipsparseCcsrilu02_bufferSize`|3.1.0| | | | |`rocsparse_ccsrilu0_buffer_size`|2.10.0| | | | | +|`cusparseCcsrilu02`| |12.2| | |`hipsparseCcsrilu02`|3.1.0|6.1.0| | | |`rocsparse_ccsrilu0`|2.10.0| | | | | +|`cusparseCcsrilu02_analysis`| |12.2| | |`hipsparseCcsrilu02_analysis`|3.1.0|6.1.0| | | |`rocsparse_ccsrilu0_analysis`|2.10.0| | | | | +|`cusparseCcsrilu02_bufferSize`| |12.2| | |`hipsparseCcsrilu02_bufferSize`|3.1.0|6.1.0| | | |`rocsparse_ccsrilu0_buffer_size`|2.10.0| | | | | |`cusparseCcsrilu02_bufferSizeExt`| |12.2| | |`hipsparseCcsrilu02_bufferSizeExt`|3.1.0| | | | |`rocsparse_ccsrilu0_buffer_size`|2.10.0| | | | | -|`cusparseCcsrilu02_numericBoost`| |12.2| | |`hipsparseCcsrilu02_numericBoost`|3.10.0| | | | |`rocsparse_dccsrilu0_numeric_boost`|4.5.0| | | | | +|`cusparseCcsrilu02_numericBoost`| |12.2| | |`hipsparseCcsrilu02_numericBoost`|3.10.0|6.1.0| | | |`rocsparse_dccsrilu0_numeric_boost`|4.5.0| | | | | |`cusparseCgpsvInterleavedBatch`|9.2| | | |`hipsparseCgpsvInterleavedBatch`|5.1.0| | | | |`rocsparse_cgpsv_interleaved_batch`|5.1.0| | | | | |`cusparseCgpsvInterleavedBatch_bufferSizeExt`|9.2| | | |`hipsparseCgpsvInterleavedBatch_bufferSizeExt`|5.1.0| | | | 
|`rocsparse_cgpsv_interleaved_batch_buffer_size`|5.1.0| | | | | |`cusparseCgtsv`| |10.2| |11.0| | | | | | | | | | | | | @@ -505,26 +505,26 @@ |`cusparseCgtsvStridedBatch`| |10.2| |11.0| | | | | | | | | | | | | |`cusparseCgtsv_nopivot`| |10.2| |11.0| | | | | | | | | | | | | |`cusparseCsrilu0Ex`|8.0|10.2| |11.0| | | | | | | | | | | | | -|`cusparseDbsric02`| |12.2| | |`hipsparseDbsric02`|3.8.0| | | | |`rocsparse_dbsric0`|3.8.0| | | | | -|`cusparseDbsric02_analysis`| |12.2| | |`hipsparseDbsric02_analysis`|3.8.0| | | | |`rocsparse_dbsric0_analysis`|3.6.0| | | | | -|`cusparseDbsric02_bufferSize`| |12.2| | |`hipsparseDbsric02_bufferSize`|3.8.0| | | | |`rocsparse_dbsric0_buffer_size`|3.8.0| | | | | +|`cusparseDbsric02`| |12.2| | |`hipsparseDbsric02`|3.8.0|6.1.0| | | |`rocsparse_dbsric0`|3.8.0| | | | | +|`cusparseDbsric02_analysis`| |12.2| | |`hipsparseDbsric02_analysis`|3.8.0|6.1.0| | | |`rocsparse_dbsric0_analysis`|3.6.0| | | | | +|`cusparseDbsric02_bufferSize`| |12.2| | |`hipsparseDbsric02_bufferSize`|3.8.0|6.1.0| | | |`rocsparse_dbsric0_buffer_size`|3.8.0| | | | | |`cusparseDbsric02_bufferSizeExt`| |12.2| | | | | | | | | | | | | | | -|`cusparseDbsrilu02`| |12.2| | |`hipsparseDbsrilu02`|3.9.0| | | | |`rocsparse_dbsrilu0`|3.9.0| | | | | -|`cusparseDbsrilu02_analysis`| |12.2| | |`hipsparseDbsrilu02_analysis`|3.9.0| | | | |`rocsparse_dbsrilu0_analysis`|3.6.0| | | | | -|`cusparseDbsrilu02_bufferSize`| |12.2| | |`hipsparseDbsrilu02_bufferSize`|3.9.0| | | | |`rocsparse_dbsrilu0_buffer_size`|3.8.0| | | | | +|`cusparseDbsrilu02`| |12.2| | |`hipsparseDbsrilu02`|3.9.0|6.1.0| | | |`rocsparse_dbsrilu0`|3.9.0| | | | | +|`cusparseDbsrilu02_analysis`| |12.2| | |`hipsparseDbsrilu02_analysis`|3.9.0|6.1.0| | | |`rocsparse_dbsrilu0_analysis`|3.6.0| | | | | +|`cusparseDbsrilu02_bufferSize`| |12.2| | |`hipsparseDbsrilu02_bufferSize`|3.9.0|6.1.0| | | |`rocsparse_dbsrilu0_buffer_size`|3.8.0| | | | | |`cusparseDbsrilu02_bufferSizeExt`| |12.2| | | | | | | | | | | | | | | 
-|`cusparseDbsrilu02_numericBoost`| |12.2| | |`hipsparseDbsrilu02_numericBoost`|3.9.0| | | | |`rocsparse_dbsrilu0_numeric_boost`|3.9.0| | | | | +|`cusparseDbsrilu02_numericBoost`| |12.2| | |`hipsparseDbsrilu02_numericBoost`|3.9.0|6.1.0| | | |`rocsparse_dbsrilu0_numeric_boost`|3.9.0| | | | | |`cusparseDcsric0`| |10.2| |11.0| | | | | | | | | | | | | -|`cusparseDcsric02`| |12.2| | |`hipsparseDcsric02`|3.1.0| | | | |`rocsparse_dcsric0`|3.1.0| | | | | -|`cusparseDcsric02_analysis`| |12.2| | |`hipsparseDcsric02_analysis`|3.1.0| | | | |`rocsparse_dcsric0_analysis`|3.1.0| | | | | -|`cusparseDcsric02_bufferSize`| |12.2| | |`hipsparseDcsric02_bufferSize`|3.1.0| | | | |`rocsparse_dcsric0_buffer_size`|3.1.0| | | | | +|`cusparseDcsric02`| |12.2| | |`hipsparseDcsric02`|3.1.0|6.1.0| | | |`rocsparse_dcsric0`|3.1.0| | | | | +|`cusparseDcsric02_analysis`| |12.2| | |`hipsparseDcsric02_analysis`|3.1.0|6.1.0| | | |`rocsparse_dcsric0_analysis`|3.1.0| | | | | +|`cusparseDcsric02_bufferSize`| |12.2| | |`hipsparseDcsric02_bufferSize`|3.1.0|6.1.0| | | |`rocsparse_dcsric0_buffer_size`|3.1.0| | | | | |`cusparseDcsric02_bufferSizeExt`| |12.2| | |`hipsparseDcsric02_bufferSizeExt`|3.1.0| | | | |`rocsparse_dcsric0_buffer_size`|3.1.0| | | | | |`cusparseDcsrilu0`| |10.2| |11.0| | | | | | | | | | | | | -|`cusparseDcsrilu02`| |12.2| | |`hipsparseDcsrilu02`|1.9.2| | | | |`rocsparse_dcsrilu0`|1.9.0| | | | | -|`cusparseDcsrilu02_analysis`| |12.2| | |`hipsparseDcsrilu02_analysis`|1.9.2| | | | |`rocsparse_dcsrilu0_analysis`|1.9.0| | | | | -|`cusparseDcsrilu02_bufferSize`| |12.2| | |`hipsparseDcsrilu02_bufferSize`|1.9.2| | | | |`rocsparse_dcsrilu0_buffer_size`|1.9.0| | | | | +|`cusparseDcsrilu02`| |12.2| | |`hipsparseDcsrilu02`|1.9.2|6.1.0| | | |`rocsparse_dcsrilu0`|1.9.0| | | | | +|`cusparseDcsrilu02_analysis`| |12.2| | |`hipsparseDcsrilu02_analysis`|1.9.2|6.1.0| | | |`rocsparse_dcsrilu0_analysis`|1.9.0| | | | | +|`cusparseDcsrilu02_bufferSize`| |12.2| | |`hipsparseDcsrilu02_bufferSize`|1.9.2|6.1.0| | | 
|`rocsparse_dcsrilu0_buffer_size`|1.9.0| | | | | |`cusparseDcsrilu02_bufferSizeExt`| |12.2| | |`hipsparseDcsrilu02_bufferSizeExt`|1.9.2| | | | |`rocsparse_dcsrilu0_buffer_size`|1.9.0| | | | | -|`cusparseDcsrilu02_numericBoost`| |12.2| | |`hipsparseDcsrilu02_numericBoost`|3.10.0| | | | |`rocsparse_dcsrilu0_numeric_boost`|3.9.0| | | | | +|`cusparseDcsrilu02_numericBoost`| |12.2| | |`hipsparseDcsrilu02_numericBoost`|3.10.0|6.1.0| | | |`rocsparse_dcsrilu0_numeric_boost`|3.9.0| | | | | |`cusparseDgpsvInterleavedBatch`|9.2| | | |`hipsparseDgpsvInterleavedBatch`|5.1.0| | | | |`rocsparse_dgpsv_interleaved_batch`|5.1.0| | | | | |`cusparseDgpsvInterleavedBatch_bufferSizeExt`|9.2| | | |`hipsparseDgpsvInterleavedBatch_bufferSizeExt`|5.1.0| | | | |`rocsparse_dgpsv_interleaved_batch_buffer_size`|5.1.0| | | | | |`cusparseDgtsv`| |10.2| |11.0| | | | | | | | | | | | | @@ -538,26 +538,26 @@ |`cusparseDgtsvInterleavedBatch_bufferSizeExt`|9.2| | | |`hipsparseDgtsvInterleavedBatch_bufferSizeExt`|5.1.0| | | | |`rocsparse_dgtsv_interleaved_batch_buffer_size`|5.1.0| | | | | |`cusparseDgtsvStridedBatch`| |10.2| |11.0| | | | | | | | | | | | | |`cusparseDgtsv_nopivot`| |10.2| |11.0| | | | | | | | | | | | | -|`cusparseSbsric02`| |12.2| | |`hipsparseSbsric02`|3.8.0| | | | |`rocsparse_sbsric0`|3.8.0| | | | | -|`cusparseSbsric02_analysis`| |12.2| | |`hipsparseSbsric02_analysis`|3.8.0| | | | |`rocsparse_sbsric0_analysis`|3.6.0| | | | | -|`cusparseSbsric02_bufferSize`| |12.2| | |`hipsparseSbsric02_bufferSize`|3.8.0| | | | |`rocsparse_sbsric0_buffer_size`|3.8.0| | | | | +|`cusparseSbsric02`| |12.2| | |`hipsparseSbsric02`|3.8.0|6.1.0| | | |`rocsparse_sbsric0`|3.8.0| | | | | +|`cusparseSbsric02_analysis`| |12.2| | |`hipsparseSbsric02_analysis`|3.8.0|6.1.0| | | |`rocsparse_sbsric0_analysis`|3.6.0| | | | | +|`cusparseSbsric02_bufferSize`| |12.2| | |`hipsparseSbsric02_bufferSize`|3.8.0|6.1.0| | | |`rocsparse_sbsric0_buffer_size`|3.8.0| | | | | |`cusparseSbsric02_bufferSizeExt`| |12.2| | | | | | | | | | 
| | | | | -|`cusparseSbsrilu02`| |12.2| | |`hipsparseSbsrilu02`|3.9.0| | | | |`rocsparse_sbsrilu0`|3.9.0| | | | | -|`cusparseSbsrilu02_analysis`| |12.2| | |`hipsparseSbsrilu02_analysis`|3.9.0| | | | |`rocsparse_sbsrilu0_analysis`|3.6.0| | | | | -|`cusparseSbsrilu02_bufferSize`| |12.2| | |`hipsparseSbsrilu02_bufferSize`|3.9.0| | | | |`rocsparse_sbsrilu0_buffer_size`|3.8.0| | | | | +|`cusparseSbsrilu02`| |12.2| | |`hipsparseSbsrilu02`|3.9.0|6.1.0| | | |`rocsparse_sbsrilu0`|3.9.0| | | | | +|`cusparseSbsrilu02_analysis`| |12.2| | |`hipsparseSbsrilu02_analysis`|3.9.0|6.1.0| | | |`rocsparse_sbsrilu0_analysis`|3.6.0| | | | | +|`cusparseSbsrilu02_bufferSize`| |12.2| | |`hipsparseSbsrilu02_bufferSize`|3.9.0|6.1.0| | | |`rocsparse_sbsrilu0_buffer_size`|3.8.0| | | | | |`cusparseSbsrilu02_bufferSizeExt`| |12.2| | | | | | | | | | | | | | | -|`cusparseSbsrilu02_numericBoost`| |12.2| | |`hipsparseSbsrilu02_numericBoost`|3.9.0| | | | |`rocsparse_dsbsrilu0_numeric_boost`|4.5.0| | | | | +|`cusparseSbsrilu02_numericBoost`| |12.2| | |`hipsparseSbsrilu02_numericBoost`|3.9.0|6.1.0| | | |`rocsparse_dsbsrilu0_numeric_boost`|4.5.0| | | | | |`cusparseScsric0`| |10.2| |11.0| | | | | | | | | | | | | -|`cusparseScsric02`| |12.2| | |`hipsparseScsric02`|3.1.0| | | | |`rocsparse_scsric0`|3.1.0| | | | | -|`cusparseScsric02_analysis`| |12.2| | |`hipsparseScsric02_analysis`|3.1.0| | | | |`rocsparse_scsric0_analysis`|3.1.0| | | | | -|`cusparseScsric02_bufferSize`| |12.2| | |`hipsparseScsric02_bufferSize`|3.1.0| | | | |`rocsparse_scsric0_buffer_size`|3.1.0| | | | | +|`cusparseScsric02`| |12.2| | |`hipsparseScsric02`|3.1.0|6.1.0| | | |`rocsparse_scsric0`|3.1.0| | | | | +|`cusparseScsric02_analysis`| |12.2| | |`hipsparseScsric02_analysis`|3.1.0|6.1.0| | | |`rocsparse_scsric0_analysis`|3.1.0| | | | | +|`cusparseScsric02_bufferSize`| |12.2| | |`hipsparseScsric02_bufferSize`|3.1.0|6.1.0| | | |`rocsparse_scsric0_buffer_size`|3.1.0| | | | | |`cusparseScsric02_bufferSizeExt`| |12.2| | 
|`hipsparseScsric02_bufferSizeExt`|3.1.0| | | | |`rocsparse_scsric0_buffer_size`|3.1.0| | | | | |`cusparseScsrilu0`| |10.2| |11.0| | | | | | | | | | | | | -|`cusparseScsrilu02`| |12.2| | |`hipsparseScsrilu02`|1.9.2| | | | |`rocsparse_scsrilu0`|1.9.0| | | | | -|`cusparseScsrilu02_analysis`| |12.2| | |`hipsparseScsrilu02_analysis`|1.9.2| | | | |`rocsparse_scsrilu0_analysis`|1.9.0| | | | | -|`cusparseScsrilu02_bufferSize`| |12.2| | |`hipsparseScsrilu02_bufferSize`|1.9.2| | | | |`rocsparse_scsrilu0_buffer_size`|1.9.0| | | | | +|`cusparseScsrilu02`| |12.2| | |`hipsparseScsrilu02`|1.9.2|6.1.0| | | |`rocsparse_scsrilu0`|1.9.0| | | | | +|`cusparseScsrilu02_analysis`| |12.2| | |`hipsparseScsrilu02_analysis`|1.9.2|6.1.0| | | |`rocsparse_scsrilu0_analysis`|1.9.0| | | | | +|`cusparseScsrilu02_bufferSize`| |12.2| | |`hipsparseScsrilu02_bufferSize`|1.9.2|6.1.0| | | |`rocsparse_scsrilu0_buffer_size`|1.9.0| | | | | |`cusparseScsrilu02_bufferSizeExt`| |12.2| | |`hipsparseScsrilu02_bufferSizeExt`|1.9.2| | | | |`rocsparse_scsrilu0_buffer_size`|1.9.0| | | | | -|`cusparseScsrilu02_numericBoost`| |12.2| | |`hipsparseScsrilu02_numericBoost`|3.10.0| | | | |`rocsparse_dscsrilu0_numeric_boost`|4.5.0| | | | | +|`cusparseScsrilu02_numericBoost`| |12.2| | |`hipsparseScsrilu02_numericBoost`|3.10.0|6.1.0| | | |`rocsparse_dscsrilu0_numeric_boost`|4.5.0| | | | | |`cusparseSgpsvInterleavedBatch`|9.2| | | |`hipsparseSgpsvInterleavedBatch`|5.1.0| | | | |`rocsparse_sgpsv_interleaved_batch`|5.1.0| | | | | |`cusparseSgpsvInterleavedBatch_bufferSizeExt`|9.2| | | |`hipsparseSgpsvInterleavedBatch_bufferSizeExt`|5.1.0| | | | |`rocsparse_sgpsv_interleaved_batch_buffer_size`|5.1.0| | | | | |`cusparseSgtsv`| |10.2| |11.0| | | | | | | | | | | | | @@ -571,30 +571,30 @@ |`cusparseSgtsvInterleavedBatch_bufferSizeExt`|9.2| | | |`hipsparseSgtsvInterleavedBatch_bufferSizeExt`|5.1.0| | | | |`rocsparse_sgtsv_interleaved_batch_buffer_size`|5.1.0| | | | | |`cusparseSgtsvStridedBatch`| |10.2| |11.0| | | | | | | | | | | | 
| |`cusparseSgtsv_nopivot`| |10.2| |11.0| | | | | | | | | | | | | -|`cusparseXbsric02_zeroPivot`| |12.2| | |`hipsparseXbsric02_zeroPivot`|3.8.0| | | | |`rocsparse_bsric0_zero_pivot`|3.8.0| | | | | -|`cusparseXbsrilu02_zeroPivot`| |12.2| | |`hipsparseXbsrilu02_zeroPivot`|3.9.0| | | | |`rocsparse_bsrilu0_zero_pivot`|3.9.0| | | | | -|`cusparseXcsric02_zeroPivot`| |12.2| | |`hipsparseXcsric02_zeroPivot`|3.1.0| | | | |`rocsparse_csric0_zero_pivot`|3.1.0| | | | | -|`cusparseXcsrilu02_zeroPivot`| |12.2| | |`hipsparseXcsrilu02_zeroPivot`|1.9.2| | | | |`rocsparse_csrilu0_zero_pivot`|1.9.0| | | | | -|`cusparseZbsric02`| |12.2| | |`hipsparseZbsric02`|3.8.0| | | | |`rocsparse_zbsric0`|3.8.0| | | | | -|`cusparseZbsric02_analysis`| |12.2| | |`hipsparseZbsric02_analysis`|3.8.0| | | | |`rocsparse_zbsric0_analysis`|3.6.0| | | | | -|`cusparseZbsric02_bufferSize`| |12.2| | |`hipsparseZbsric02_bufferSize`|3.8.0| | | | |`rocsparse_zbsric0_buffer_size`|3.8.0| | | | | +|`cusparseXbsric02_zeroPivot`| |12.2| | |`hipsparseXbsric02_zeroPivot`|3.8.0|6.1.0| | | |`rocsparse_bsric0_zero_pivot`|3.8.0| | | | | +|`cusparseXbsrilu02_zeroPivot`| |12.2| | |`hipsparseXbsrilu02_zeroPivot`|3.9.0|6.1.0| | | |`rocsparse_bsrilu0_zero_pivot`|3.9.0| | | | | +|`cusparseXcsric02_zeroPivot`| |12.2| | |`hipsparseXcsric02_zeroPivot`|3.1.0|6.1.0| | | |`rocsparse_csric0_zero_pivot`|3.1.0| | | | | +|`cusparseXcsrilu02_zeroPivot`| |12.2| | |`hipsparseXcsrilu02_zeroPivot`|1.9.2|6.1.0| | | |`rocsparse_csrilu0_zero_pivot`|1.9.0| | | | | +|`cusparseZbsric02`| |12.2| | |`hipsparseZbsric02`|3.8.0|6.1.0| | | |`rocsparse_zbsric0`|3.8.0| | | | | +|`cusparseZbsric02_analysis`| |12.2| | |`hipsparseZbsric02_analysis`|3.8.0|6.1.0| | | |`rocsparse_zbsric0_analysis`|3.6.0| | | | | +|`cusparseZbsric02_bufferSize`| |12.2| | |`hipsparseZbsric02_bufferSize`|3.8.0|6.1.0| | | |`rocsparse_zbsric0_buffer_size`|3.8.0| | | | | |`cusparseZbsric02_bufferSizeExt`| |12.2| | | | | | | | | | | | | | | -|`cusparseZbsrilu02`| |12.2| | 
|`hipsparseZbsrilu02`|3.9.0| | | | |`rocsparse_zbsrilu0`|3.9.0| | | | | -|`cusparseZbsrilu02_analysis`| |12.2| | |`hipsparseZbsrilu02_analysis`|3.9.0| | | | |`rocsparse_zbsrilu0_analysis`|3.6.0| | | | | -|`cusparseZbsrilu02_bufferSize`| |12.2| | |`hipsparseZbsrilu02_bufferSize`|3.9.0| | | | |`rocsparse_zbsrilu0_buffer_size`|3.8.0| | | | | +|`cusparseZbsrilu02`| |12.2| | |`hipsparseZbsrilu02`|3.9.0|6.1.0| | | |`rocsparse_zbsrilu0`|3.9.0| | | | | +|`cusparseZbsrilu02_analysis`| |12.2| | |`hipsparseZbsrilu02_analysis`|3.9.0|6.1.0| | | |`rocsparse_zbsrilu0_analysis`|3.6.0| | | | | +|`cusparseZbsrilu02_bufferSize`| |12.2| | |`hipsparseZbsrilu02_bufferSize`|3.9.0|6.1.0| | | |`rocsparse_zbsrilu0_buffer_size`|3.8.0| | | | | |`cusparseZbsrilu02_bufferSizeExt`| |12.2| | | | | | | | | | | | | | | -|`cusparseZbsrilu02_numericBoost`| |12.2| | |`hipsparseZbsrilu02_numericBoost`|3.9.0| | | | |`rocsparse_zbsrilu0_numeric_boost`|3.9.0| | | | | +|`cusparseZbsrilu02_numericBoost`| |12.2| | |`hipsparseZbsrilu02_numericBoost`|3.9.0|6.1.0| | | |`rocsparse_zbsrilu0_numeric_boost`|3.9.0| | | | | |`cusparseZcsric0`| |10.2| |11.0| | | | | | | | | | | | | -|`cusparseZcsric02`| |12.2| | |`hipsparseZcsric02`|3.1.0| | | | |`rocsparse_zcsric0`|3.1.0| | | | | -|`cusparseZcsric02_analysis`| |12.2| | |`hipsparseZcsric02_analysis`|3.1.0| | | | |`rocsparse_zcsric0_analysis`|3.1.0| | | | | -|`cusparseZcsric02_bufferSize`| |12.2| | |`hipsparseZcsric02_bufferSize`|3.1.0| | | | |`rocsparse_zcsric0_buffer_size`|3.1.0| | | | | +|`cusparseZcsric02`| |12.2| | |`hipsparseZcsric02`|3.1.0|6.1.0| | | |`rocsparse_zcsric0`|3.1.0| | | | | +|`cusparseZcsric02_analysis`| |12.2| | |`hipsparseZcsric02_analysis`|3.1.0|6.1.0| | | |`rocsparse_zcsric0_analysis`|3.1.0| | | | | +|`cusparseZcsric02_bufferSize`| |12.2| | |`hipsparseZcsric02_bufferSize`|3.1.0|6.1.0| | | |`rocsparse_zcsric0_buffer_size`|3.1.0| | | | | |`cusparseZcsric02_bufferSizeExt`| |12.2| | |`hipsparseZcsric02_bufferSizeExt`|3.1.0| | | | 
|`rocsparse_zcsric0_buffer_size`|3.1.0| | | | | |`cusparseZcsrilu0`| |10.2| |11.0| | | | | | | | | | | | | -|`cusparseZcsrilu02`| |12.2| | |`hipsparseZcsrilu02`|3.1.0| | | | |`rocsparse_zcsrilu0`|2.10.0| | | | | -|`cusparseZcsrilu02_analysis`| |12.2| | |`hipsparseZcsrilu02_analysis`|3.1.0| | | | |`rocsparse_zcsrilu0_analysis`|2.10.0| | | | | -|`cusparseZcsrilu02_bufferSize`| |12.2| | |`hipsparseZcsrilu02_bufferSize`|3.1.0| | | | |`rocsparse_zcsrilu0_buffer_size`|2.10.0| | | | | +|`cusparseZcsrilu02`| |12.2| | |`hipsparseZcsrilu02`|3.1.0|6.1.0| | | |`rocsparse_zcsrilu0`|2.10.0| | | | | +|`cusparseZcsrilu02_analysis`| |12.2| | |`hipsparseZcsrilu02_analysis`|3.1.0|6.1.0| | | |`rocsparse_zcsrilu0_analysis`|2.10.0| | | | | +|`cusparseZcsrilu02_bufferSize`| |12.2| | |`hipsparseZcsrilu02_bufferSize`|3.1.0|6.1.0| | | |`rocsparse_zcsrilu0_buffer_size`|2.10.0| | | | | |`cusparseZcsrilu02_bufferSizeExt`| |12.2| | |`hipsparseZcsrilu02_bufferSizeExt`|3.1.0| | | | |`rocsparse_zcsrilu0_buffer_size`|2.10.0| | | | | -|`cusparseZcsrilu02_numericBoost`| |12.2| | |`hipsparseZcsrilu02_numericBoost`|3.10.0| | | | |`rocsparse_zcsrilu0_numeric_boost`|3.9.0| | | | | +|`cusparseZcsrilu02_numericBoost`| |12.2| | |`hipsparseZcsrilu02_numericBoost`|3.10.0|6.1.0| | | |`rocsparse_zcsrilu0_numeric_boost`|3.9.0| | | | | |`cusparseZgpsvInterleavedBatch`|9.2| | | |`hipsparseZgpsvInterleavedBatch`|5.1.0| | | | |`rocsparse_zgpsv_interleaved_batch`|5.1.0| | | | | |`cusparseZgpsvInterleavedBatch_bufferSizeExt`|9.2| | | |`hipsparseZgpsvInterleavedBatch_bufferSizeExt`|5.1.0| | | | |`rocsparse_zgpsv_interleaved_batch_buffer_size`|5.1.0| | | | | |`cusparseZgtsv`| |10.2| |11.0| | | | | | | | | | | | | @@ -613,10 +613,10 @@ |**CUDA**|**A**|**D**|**C**|**R**|**HIP**|**A**|**D**|**C**|**R**|**E**|**ROC**|**A**|**D**|**C**|**R**|**E**| |:--|:-:|:-:|:-:|:-:|:--|:-:|:-:|:-:|:-:|:-:|:--|:-:|:-:|:-:|:-:|:-:| -|`cusparseCcsrcolor`| |12.2| | |`hipsparseCcsrcolor`|4.5.0| | | | |`rocsparse_ccsrcolor`|4.5.0| | | | | 
-|`cusparseDcsrcolor`| |12.2| | |`hipsparseDcsrcolor`|4.5.0| | | | |`rocsparse_dcsrcolor`|4.5.0| | | | | -|`cusparseScsrcolor`| |12.2| | |`hipsparseScsrcolor`|4.5.0| | | | |`rocsparse_scsrcolor`|4.5.0| | | | | -|`cusparseZcsrcolor`| |12.2| | |`hipsparseZcsrcolor`|4.5.0| | | | |`rocsparse_zcsrcolor`|4.5.0| | | | | +|`cusparseCcsrcolor`| |12.2| | |`hipsparseCcsrcolor`|4.5.0|6.1.0| | | |`rocsparse_ccsrcolor`|4.5.0| | | | | +|`cusparseDcsrcolor`| |12.2| | |`hipsparseDcsrcolor`|4.5.0|6.1.0| | | |`rocsparse_dcsrcolor`|4.5.0| | | | | +|`cusparseScsrcolor`| |12.2| | |`hipsparseScsrcolor`|4.5.0|6.1.0| | | |`rocsparse_scsrcolor`|4.5.0| | | | | +|`cusparseZcsrcolor`| |12.2| | |`hipsparseZcsrcolor`|4.5.0|6.1.0| | | |`rocsparse_zcsrcolor`|4.5.0| | | | | ## **14. CUSPARSE Format Conversion Reference** @@ -628,14 +628,14 @@ |`cusparseCcsr2bsr`| | | | |`hipsparseCcsr2bsr`|3.5.0| | | | |`rocsparse_ccsr2bsr`|3.5.0| | | | | |`cusparseCcsr2csc`| |10.2| |11.0|`hipsparseCcsr2csc`|3.1.0| | | | | | | | | | | |`cusparseCcsr2csr_compress`|8.0|12.2| | |`hipsparseCcsr2csr_compress`|3.5.0| | | | |`rocsparse_ccsr2csr_compress`|3.5.0| | | | | -|`cusparseCcsr2csru`| |12.2| | |`hipsparseCcsr2csru`|4.2.0| | | | | | | | | | | +|`cusparseCcsr2csru`| |12.2| | |`hipsparseCcsr2csru`|4.2.0|6.1.0| | | | | | | | | | |`cusparseCcsr2dense`| |11.1| |12.0|`hipsparseCcsr2dense`|3.5.0| | | | |`rocsparse_ccsr2dense`|3.5.0| | | | | |`cusparseCcsr2gebsr`| | | | |`hipsparseCcsr2gebsr`|4.1.0| | | | |`rocsparse_ccsr2gebsr`|4.1.0| | | | | |`cusparseCcsr2gebsr_bufferSize`| | | | |`hipsparseCcsr2gebsr_bufferSize`|4.1.0| | | | |`rocsparse_ccsr2gebsr_buffer_size`|4.1.0| | | | | |`cusparseCcsr2gebsr_bufferSizeExt`| | | | | | | | | | | | | | | | | |`cusparseCcsr2hyb`| |10.2| |11.0|`hipsparseCcsr2hyb`|3.1.0| | | | |`rocsparse_ccsr2hyb`|2.10.0| | | | | -|`cusparseCcsru2csr`| |12.2| | |`hipsparseCcsru2csr`|4.2.0| | | | | | | | | | | -|`cusparseCcsru2csr_bufferSizeExt`| |12.2| | |`hipsparseCcsru2csr_bufferSizeExt`|4.2.0| | | | | 
| | | | | | +|`cusparseCcsru2csr`| |12.2| | |`hipsparseCcsru2csr`|4.2.0|6.1.0| | | | | | | | | | +|`cusparseCcsru2csr_bufferSizeExt`| |12.2| | |`hipsparseCcsru2csr_bufferSizeExt`|4.2.0|6.1.0| | | | | | | | | | |`cusparseCdense2csc`| |11.1| |12.0|`hipsparseCdense2csc`|3.5.0| | | | |`rocsparse_cdense2csc`|3.2.0| | | | | |`cusparseCdense2csr`| |11.1| |12.0|`hipsparseCdense2csr`|3.5.0| | | | |`rocsparse_cdense2csr`|3.2.0| | | | | |`cusparseCdense2hyb`| |10.2| |11.0| | | | | | | | | | | | | @@ -650,9 +650,9 @@ |`cusparseChyb2csr`| |10.2| |11.0|`hipsparseChyb2csr`|3.1.0| | | | | | | | | | | |`cusparseChyb2dense`| |10.2| |11.0| | | | | | | | | | | | | |`cusparseCnnz`| | | | |`hipsparseCnnz`|3.2.0| | | | |`rocsparse_cnnz`|3.2.0| | | | | -|`cusparseCnnz_compress`|8.0|12.2| | |`hipsparseCnnz_compress`|3.5.0| | | | |`rocsparse_cnnz_compress`|3.5.0| | | | | +|`cusparseCnnz_compress`|8.0|12.2| | |`hipsparseCnnz_compress`|3.5.0|6.1.0| | | |`rocsparse_cnnz_compress`|3.5.0| | | | | |`cusparseCreateCsru2csrInfo`| |12.2| | |`hipsparseCreateCsru2csrInfo`|4.2.0| | | | | | | | | | | -|`cusparseCreateIdentityPermutation`| |12.2| | |`hipsparseCreateIdentityPermutation`|1.9.2| | | | |`rocsparse_create_identity_permutation`|1.9.0| | | | | +|`cusparseCreateIdentityPermutation`| |12.2| | |`hipsparseCreateIdentityPermutation`|1.9.2|6.1.0| | | |`rocsparse_create_identity_permutation`|1.9.0| | | | | |`cusparseCsr2cscEx`|8.0|10.2| |11.0| | | | | | | | | | | | | |`cusparseCsr2cscEx2`|10.1| | | |`hipsparseCsr2cscEx2`|5.4.0| | | | | | | | | | | |`cusparseCsr2cscEx2_bufferSize`|10.1| | | |`hipsparseCsr2cscEx2_bufferSize`|5.4.0| | | | |`rocsparse_csr2csc_buffer_size`|1.9.0| | | | | @@ -662,14 +662,14 @@ |`cusparseDcsr2bsr`| | | | |`hipsparseDcsr2bsr`|3.5.0| | | | |`rocsparse_dcsr2bsr`|3.5.0| | | | | |`cusparseDcsr2csc`| |10.2| |11.0|`hipsparseDcsr2csc`|1.9.2| | | | | | | | | | | |`cusparseDcsr2csr_compress`|8.0|12.2| | |`hipsparseDcsr2csr_compress`|3.5.0| | | | |`rocsparse_dcsr2csr_compress`|3.5.0| | 
| | | -|`cusparseDcsr2csru`| |12.2| | |`hipsparseDcsr2csru`|4.2.0| | | | | | | | | | | +|`cusparseDcsr2csru`| |12.2| | |`hipsparseDcsr2csru`|4.2.0|6.1.0| | | | | | | | | | |`cusparseDcsr2dense`| |11.1| |12.0|`hipsparseDcsr2dense`|3.5.0| | | | |`rocsparse_dcsr2dense`|3.5.0| | | | | |`cusparseDcsr2gebsr`| | | | |`hipsparseDcsr2gebsr`|4.1.0| | | | |`rocsparse_dcsr2gebsr`|4.1.0| | | | | |`cusparseDcsr2gebsr_bufferSize`| | | | |`hipsparseDcsr2gebsr_bufferSize`|4.1.0| | | | |`rocsparse_dcsr2gebsr_buffer_size`|4.1.0| | | | | |`cusparseDcsr2gebsr_bufferSizeExt`| | | | | | | | | | | | | | | | | |`cusparseDcsr2hyb`| |10.2| |11.0|`hipsparseDcsr2hyb`|1.9.2| | | | |`rocsparse_dcsr2hyb`|1.9.0| | | | | -|`cusparseDcsru2csr`| |12.2| | |`hipsparseDcsru2csr`|4.2.0| | | | | | | | | | | -|`cusparseDcsru2csr_bufferSizeExt`| |12.2| | |`hipsparseDcsru2csr_bufferSizeExt`|4.2.0| | | | | | | | | | | +|`cusparseDcsru2csr`| |12.2| | |`hipsparseDcsru2csr`|4.2.0|6.1.0| | | | | | | | | | +|`cusparseDcsru2csr_bufferSizeExt`| |12.2| | |`hipsparseDcsru2csr_bufferSizeExt`|4.2.0|6.1.0| | | | | | | | | | |`cusparseDdense2csc`| |11.1| |12.0|`hipsparseDdense2csc`|3.5.0| | | | |`rocsparse_ddense2csc`|3.2.0| | | | | |`cusparseDdense2csr`| |11.1| |12.0|`hipsparseDdense2csr`|3.5.0| | | | |`rocsparse_ddense2csr`|3.2.0| | | | | |`cusparseDdense2hyb`| |10.2| |11.0| | | | | | | | | | | | | @@ -685,18 +685,18 @@ |`cusparseDhyb2csr`| |10.2| |11.0|`hipsparseDhyb2csr`|3.1.0| | | | | | | | | | | |`cusparseDhyb2dense`| |10.2| |11.0| | | | | | | | | | | | | |`cusparseDnnz`| | | | |`hipsparseDnnz`|3.2.0| | | | |`rocsparse_dnnz`|3.2.0| | | | | -|`cusparseDnnz_compress`|8.0|12.2| | |`hipsparseDnnz_compress`|3.5.0| | | | |`rocsparse_dnnz_compress`|3.5.0| | | | | -|`cusparseDpruneCsr2csr`|9.0|12.2| | |`hipsparseDpruneCsr2csr`|3.9.0| | | | |`rocsparse_dprune_csr2csr`|3.9.0| | | | | -|`cusparseDpruneCsr2csrByPercentage`|9.0|12.2| | |`hipsparseDpruneCsr2csrByPercentage`|3.9.0| | | | 
|`rocsparse_dprune_csr2csr_by_percentage`|3.9.0| | | | | -|`cusparseDpruneCsr2csrByPercentage_bufferSizeExt`|9.0|12.2| | |`hipsparseDpruneCsr2csrByPercentage_bufferSizeExt`|3.9.0| | | | |`rocsparse_dprune_csr2csr_by_percentage_buffer_size`|3.9.0| | | | | -|`cusparseDpruneCsr2csrNnz`|9.0|12.2| | |`hipsparseDpruneCsr2csrNnz`|3.9.0| | | | |`rocsparse_dprune_csr2csr_nnz`|3.9.0| | | | | -|`cusparseDpruneCsr2csrNnzByPercentage`|9.0|12.2| | |`hipsparseDpruneCsr2csrNnzByPercentage`|3.9.0| | | | |`rocsparse_dprune_csr2csr_nnz_by_percentage`|3.9.0| | | | | -|`cusparseDpruneCsr2csr_bufferSizeExt`|9.0|12.2| | |`hipsparseDpruneCsr2csr_bufferSizeExt`|3.9.0| | | | |`rocsparse_dprune_csr2csr_buffer_size`|3.9.0| | | | | -|`cusparseDpruneDense2csr`|9.0|12.2| | |`hipsparseDpruneDense2csr`|3.9.0| | | | |`rocsparse_dprune_dense2csr`|3.9.0| | | | | -|`cusparseDpruneDense2csrByPercentage`|9.0|12.2| | |`hipsparseDpruneDense2csrByPercentage`|3.9.0| | | | |`rocsparse_dprune_dense2csr_by_percentage`|3.9.0| | | | | -|`cusparseDpruneDense2csrByPercentage_bufferSizeExt`|9.0|12.2| | |`hipsparseDpruneDense2csrByPercentage_bufferSizeExt`|3.9.0| | | | |`rocsparse_dprune_dense2csr_by_percentage_buffer_size`|3.9.0| | | | | -|`cusparseDpruneDense2csrNnz`|9.0|12.2| | |`hipsparseDpruneDense2csrNnz`|3.9.0| | | | |`rocsparse_dprune_dense2csr_nnz`|3.9.0| | | | | -|`cusparseDpruneDense2csrNnzByPercentage`|9.0|12.2| | |`hipsparseDpruneDense2csrNnzByPercentage`|3.9.0| | | | |`rocsparse_dprune_dense2csr_nnz_by_percentage`|3.9.0| | | | | +|`cusparseDnnz_compress`|8.0|12.2| | |`hipsparseDnnz_compress`|3.5.0|6.1.0| | | |`rocsparse_dnnz_compress`|3.5.0| | | | | +|`cusparseDpruneCsr2csr`|9.0|12.2| | |`hipsparseDpruneCsr2csr`|3.9.0|6.1.0| | | |`rocsparse_dprune_csr2csr`|3.9.0| | | | | +|`cusparseDpruneCsr2csrByPercentage`|9.0|12.2| | |`hipsparseDpruneCsr2csrByPercentage`|3.9.0|6.1.0| | | |`rocsparse_dprune_csr2csr_by_percentage`|3.9.0| | | | | +|`cusparseDpruneCsr2csrByPercentage_bufferSizeExt`|9.0|12.2| | 
|`hipsparseDpruneCsr2csrByPercentage_bufferSizeExt`|3.9.0|6.1.0| | | |`rocsparse_dprune_csr2csr_by_percentage_buffer_size`|3.9.0| | | | | +|`cusparseDpruneCsr2csrNnz`|9.0|12.2| | |`hipsparseDpruneCsr2csrNnz`|3.9.0|6.1.0| | | |`rocsparse_dprune_csr2csr_nnz`|3.9.0| | | | | +|`cusparseDpruneCsr2csrNnzByPercentage`|9.0|12.2| | |`hipsparseDpruneCsr2csrNnzByPercentage`|3.9.0|6.1.0| | | |`rocsparse_dprune_csr2csr_nnz_by_percentage`|3.9.0| | | | | +|`cusparseDpruneCsr2csr_bufferSizeExt`|9.0|12.2| | |`hipsparseDpruneCsr2csr_bufferSizeExt`|3.9.0|6.1.0| | | |`rocsparse_dprune_csr2csr_buffer_size`|3.9.0| | | | | +|`cusparseDpruneDense2csr`|9.0|12.2| | |`hipsparseDpruneDense2csr`|3.9.0|6.1.0| | | |`rocsparse_dprune_dense2csr`|3.9.0| | | | | +|`cusparseDpruneDense2csrByPercentage`|9.0|12.2| | |`hipsparseDpruneDense2csrByPercentage`|3.9.0|6.1.0| | | |`rocsparse_dprune_dense2csr_by_percentage`|3.9.0| | | | | +|`cusparseDpruneDense2csrByPercentage_bufferSizeExt`|9.0|12.2| | |`hipsparseDpruneDense2csrByPercentage_bufferSizeExt`|3.9.0|6.1.0| | | |`rocsparse_dprune_dense2csr_by_percentage_buffer_size`|3.9.0| | | | | +|`cusparseDpruneDense2csrNnz`|9.0|12.2| | |`hipsparseDpruneDense2csrNnz`|3.9.0|6.1.0| | | |`rocsparse_dprune_dense2csr_nnz`|3.9.0| | | | | +|`cusparseDpruneDense2csrNnzByPercentage`|9.0|12.2| | |`hipsparseDpruneDense2csrNnzByPercentage`|3.9.0|6.1.0| | | |`rocsparse_dprune_dense2csr_nnz_by_percentage`|3.9.0| | | | | |`cusparseDpruneDense2csr_bufferSizeExt`|9.0|12.2| | |`hipsparseDpruneDense2csr_bufferSizeExt`|3.9.0| | | | |`rocsparse_dprune_dense2csr_buffer_size`|3.9.0| | | | | |`cusparseHpruneCsr2csr`|9.0|12.2| | | | | | | | | | | | | | | |`cusparseHpruneCsr2csrByPercentage`|9.0|12.2| | | | | | | | | | | | | | | @@ -716,14 +716,14 @@ |`cusparseScsr2bsr`| | | | |`hipsparseScsr2bsr`|3.5.0| | | | |`rocsparse_scsr2bsr`|3.5.0| | | | | |`cusparseScsr2csc`| |10.2| |11.0|`hipsparseScsr2csc`|1.9.2| | | | | | | | | | | |`cusparseScsr2csr_compress`|8.0|12.2| | 
|`hipsparseScsr2csr_compress`|3.5.0| | | | |`rocsparse_scsr2csr_compress`|3.5.0| | | | | -|`cusparseScsr2csru`| |12.2| | |`hipsparseScsr2csru`|4.2.0| | | | | | | | | | | +|`cusparseScsr2csru`| |12.2| | |`hipsparseScsr2csru`|4.2.0|6.1.0| | | | | | | | | | |`cusparseScsr2dense`| |11.1| |12.0|`hipsparseScsr2dense`|3.5.0| | | | |`rocsparse_scsr2dense`|3.5.0| | | | | |`cusparseScsr2gebsr`| | | | |`hipsparseScsr2gebsr`|4.1.0| | | | |`rocsparse_scsr2gebsr`|4.1.0| | | | | |`cusparseScsr2gebsr_bufferSize`| | | | |`hipsparseScsr2gebsr_bufferSize`|4.1.0| | | | |`rocsparse_scsr2gebsr_buffer_size`|4.1.0| | | | | |`cusparseScsr2gebsr_bufferSizeExt`| | | | | | | | | | | | | | | | | |`cusparseScsr2hyb`| |10.2| |11.0|`hipsparseScsr2hyb`|1.9.2| | | | |`rocsparse_scsr2hyb`|1.9.0| | | | | -|`cusparseScsru2csr`| |12.2| | |`hipsparseScsru2csr`|4.2.0| | | | | | | | | | | -|`cusparseScsru2csr_bufferSizeExt`| |12.2| | |`hipsparseScsru2csr_bufferSizeExt`|4.2.0| | | | | | | | | | | +|`cusparseScsru2csr`| |12.2| | |`hipsparseScsru2csr`|4.2.0|6.1.0| | | | | | | | | | +|`cusparseScsru2csr_bufferSizeExt`| |12.2| | |`hipsparseScsru2csr_bufferSizeExt`|4.2.0|6.1.0| | | | | | | | | | |`cusparseSdense2csc`| |11.1| |12.0|`hipsparseSdense2csc`|3.5.0| | | | |`rocsparse_sdense2csc`|3.2.0| | | | | |`cusparseSdense2csr`| |11.1| |12.0|`hipsparseSdense2csr`|3.5.0| | | | |`rocsparse_sdense2csr`|3.2.0| | | | | |`cusparseSdense2hyb`| |10.2| |11.0| | | | | | | | | | | | | @@ -738,18 +738,18 @@ |`cusparseShyb2csr`| |10.2| |11.0|`hipsparseShyb2csr`|3.1.0| | | | | | | | | | | |`cusparseShyb2dense`| |10.2| |11.0| | | | | | | | | | | | | |`cusparseSnnz`| | | | |`hipsparseSnnz`|3.2.0| | | | |`rocsparse_snnz`|3.2.0| | | | | -|`cusparseSnnz_compress`|8.0|12.2| | |`hipsparseSnnz_compress`|3.5.0| | | | |`rocsparse_snnz_compress`|3.5.0| | | | | -|`cusparseSpruneCsr2csr`|9.0|12.2| | |`hipsparseSpruneCsr2csr`|3.9.0| | | | |`rocsparse_sprune_csr2csr`|3.9.0| | | | | -|`cusparseSpruneCsr2csrByPercentage`|9.0|12.2| | 
|`hipsparseSpruneCsr2csrByPercentage`|3.9.0| | | | |`rocsparse_sprune_csr2csr_by_percentage`|3.9.0| | | | | -|`cusparseSpruneCsr2csrByPercentage_bufferSizeExt`|9.0|12.2| | |`hipsparseSpruneCsr2csrByPercentage_bufferSizeExt`|3.9.0| | | | |`rocsparse_sprune_csr2csr_by_percentage_buffer_size`|3.9.0| | | | | -|`cusparseSpruneCsr2csrNnz`|9.0|12.2| | |`hipsparseSpruneCsr2csrNnz`|3.9.0| | | | |`rocsparse_sprune_csr2csr_nnz`|3.9.0| | | | | -|`cusparseSpruneCsr2csrNnzByPercentage`|9.0|12.2| | |`hipsparseSpruneCsr2csrNnzByPercentage`|3.9.0| | | | |`rocsparse_sprune_csr2csr_nnz_by_percentage`|3.9.0| | | | | -|`cusparseSpruneCsr2csr_bufferSizeExt`|9.0|12.2| | |`hipsparseSpruneCsr2csr_bufferSizeExt`|3.9.0| | | | |`rocsparse_sprune_csr2csr_buffer_size`|3.9.0| | | | | -|`cusparseSpruneDense2csr`|9.0|12.2| | |`hipsparseSpruneDense2csr`|3.9.0| | | | |`rocsparse_sprune_dense2csr`|3.9.0| | | | | -|`cusparseSpruneDense2csrByPercentage`|9.0|12.2| | |`hipsparseSpruneDense2csrByPercentage`|3.9.0| | | | |`rocsparse_sprune_dense2csr_by_percentage`|3.9.0| | | | | -|`cusparseSpruneDense2csrByPercentage_bufferSizeExt`|9.0|12.2| | |`hipsparseSpruneDense2csrByPercentage_bufferSizeExt`|3.9.0| | | | |`rocsparse_sprune_dense2csr_by_percentage_buffer_size`|3.9.0| | | | | -|`cusparseSpruneDense2csrNnz`|9.0|12.2| | |`hipsparseSpruneDense2csrNnz`|3.9.0| | | | |`rocsparse_sprune_dense2csr_nnz`|3.9.0| | | | | -|`cusparseSpruneDense2csrNnzByPercentage`|9.0|12.2| | |`hipsparseSpruneDense2csrNnzByPercentage`|3.9.0| | | | |`rocsparse_sprune_dense2csr_nnz_by_percentage`|3.9.0| | | | | +|`cusparseSnnz_compress`|8.0|12.2| | |`hipsparseSnnz_compress`|3.5.0|6.1.0| | | |`rocsparse_snnz_compress`|3.5.0| | | | | +|`cusparseSpruneCsr2csr`|9.0|12.2| | |`hipsparseSpruneCsr2csr`|3.9.0|6.1.0| | | |`rocsparse_sprune_csr2csr`|3.9.0| | | | | +|`cusparseSpruneCsr2csrByPercentage`|9.0|12.2| | |`hipsparseSpruneCsr2csrByPercentage`|3.9.0|6.1.0| | | |`rocsparse_sprune_csr2csr_by_percentage`|3.9.0| | | | | 
+|`cusparseSpruneCsr2csrByPercentage_bufferSizeExt`|9.0|12.2| | |`hipsparseSpruneCsr2csrByPercentage_bufferSizeExt`|3.9.0|6.1.0| | | |`rocsparse_sprune_csr2csr_by_percentage_buffer_size`|3.9.0| | | | | +|`cusparseSpruneCsr2csrNnz`|9.0|12.2| | |`hipsparseSpruneCsr2csrNnz`|3.9.0|6.1.0| | | |`rocsparse_sprune_csr2csr_nnz`|3.9.0| | | | | +|`cusparseSpruneCsr2csrNnzByPercentage`|9.0|12.2| | |`hipsparseSpruneCsr2csrNnzByPercentage`|3.9.0|6.1.0| | | |`rocsparse_sprune_csr2csr_nnz_by_percentage`|3.9.0| | | | | +|`cusparseSpruneCsr2csr_bufferSizeExt`|9.0|12.2| | |`hipsparseSpruneCsr2csr_bufferSizeExt`|3.9.0|6.1.0| | | |`rocsparse_sprune_csr2csr_buffer_size`|3.9.0| | | | | +|`cusparseSpruneDense2csr`|9.0|12.2| | |`hipsparseSpruneDense2csr`|3.9.0|6.1.0| | | |`rocsparse_sprune_dense2csr`|3.9.0| | | | | +|`cusparseSpruneDense2csrByPercentage`|9.0|12.2| | |`hipsparseSpruneDense2csrByPercentage`|3.9.0|6.1.0| | | |`rocsparse_sprune_dense2csr_by_percentage`|3.9.0| | | | | +|`cusparseSpruneDense2csrByPercentage_bufferSizeExt`|9.0|12.2| | |`hipsparseSpruneDense2csrByPercentage_bufferSizeExt`|3.9.0|6.1.0| | | |`rocsparse_sprune_dense2csr_by_percentage_buffer_size`|3.9.0| | | | | +|`cusparseSpruneDense2csrNnz`|9.0|12.2| | |`hipsparseSpruneDense2csrNnz`|3.9.0|6.1.0| | | |`rocsparse_sprune_dense2csr_nnz`|3.9.0| | | | | +|`cusparseSpruneDense2csrNnzByPercentage`|9.0|12.2| | |`hipsparseSpruneDense2csrNnzByPercentage`|3.9.0|6.1.0| | | |`rocsparse_sprune_dense2csr_nnz_by_percentage`|3.9.0| | | | | |`cusparseSpruneDense2csr_bufferSizeExt`|9.0|12.2| | |`hipsparseSpruneDense2csr_bufferSizeExt`|3.9.0| | | | |`rocsparse_sprune_dense2csr_buffer_size`|3.9.0| | | | | |`cusparseXcoo2csr`| | | | |`hipsparseXcoo2csr`|1.9.2| | | | |`rocsparse_coo2csr`|1.9.0| | | | | |`cusparseXcoosortByColumn`| | | | |`hipsparseXcoosortByColumn`|1.9.2| | | | |`rocsparse_coosort_by_column`|1.9.0| | | | | @@ -770,14 +770,14 @@ |`cusparseZcsr2bsr`| | | | |`hipsparseZcsr2bsr`|3.5.0| | | | |`rocsparse_zcsr2bsr`|3.5.0| | | | 
| |`cusparseZcsr2csc`| |10.2| |11.0|`hipsparseZcsr2csc`|3.1.0| | | | | | | | | | | |`cusparseZcsr2csr_compress`|8.0|12.2| | |`hipsparseZcsr2csr_compress`|3.5.0| | | | |`rocsparse_zcsr2csr_compress`|3.5.0| | | | | -|`cusparseZcsr2csru`| |12.2| | |`hipsparseZcsr2csru`|4.2.0| | | | | | | | | | | +|`cusparseZcsr2csru`| |12.2| | |`hipsparseZcsr2csru`|4.2.0|6.1.0| | | | | | | | | | |`cusparseZcsr2dense`| |11.1| |12.0|`hipsparseZcsr2dense`|3.5.0| | | | |`rocsparse_zcsr2dense`|3.5.0| | | | | |`cusparseZcsr2gebsr`| | | | |`hipsparseZcsr2gebsr`|4.1.0| | | | |`rocsparse_zcsr2gebsr`|4.1.0| | | | | |`cusparseZcsr2gebsr_bufferSize`| | | | |`hipsparseZcsr2gebsr_bufferSize`|4.1.0| | | | |`rocsparse_zcsr2gebsr_buffer_size`|4.1.0| | | | | |`cusparseZcsr2gebsr_bufferSizeExt`| | | | | | | | | | | | | | | | | |`cusparseZcsr2hyb`| |10.2| |11.0|`hipsparseZcsr2hyb`|3.1.0| | | | |`rocsparse_zcsr2hyb`|2.10.0| | | | | -|`cusparseZcsru2csr`| |12.2| | |`hipsparseZcsru2csr`|4.2.0| | | | | | | | | | | -|`cusparseZcsru2csr_bufferSizeExt`| |12.2| | |`hipsparseZcsru2csr_bufferSizeExt`|4.2.0| | | | | | | | | | | +|`cusparseZcsru2csr`| |12.2| | |`hipsparseZcsru2csr`|4.2.0|6.1.0| | | | | | | | | | +|`cusparseZcsru2csr_bufferSizeExt`| |12.2| | |`hipsparseZcsru2csr_bufferSizeExt`|4.2.0|6.1.0| | | | | | | | | | |`cusparseZdense2csc`| |11.1| |12.0|`hipsparseZdense2csc`|3.5.0| | | | |`rocsparse_zdense2csc`|3.2.0| | | | | |`cusparseZdense2csr`| |11.1| |12.0|`hipsparseZdense2csr`|3.5.0| | | | |`rocsparse_zdense2csr`|3.2.0| | | | | |`cusparseZdense2hyb`| |10.2| |11.0| | | | | | | | | | | | | @@ -792,18 +792,18 @@ |`cusparseZhyb2csr`| |10.2| |11.0|`hipsparseZhyb2csr`|3.1.0| | | | | | | | | | | |`cusparseZhyb2dense`| |10.2| |11.0| | | | | | | | | | | | | |`cusparseZnnz`| | | | |`hipsparseZnnz`|3.2.0| | | | |`rocsparse_znnz`|3.2.0| | | | | -|`cusparseZnnz_compress`|8.0|12.2| | |`hipsparseZnnz_compress`|3.5.0| | | | |`rocsparse_znnz_compress`|3.5.0| | | | | +|`cusparseZnnz_compress`|8.0|12.2| | 
|`hipsparseZnnz_compress`|3.5.0|6.1.0| | | |`rocsparse_znnz_compress`|3.5.0| | | | | ## **15. CUSPARSE Generic API Reference** |**CUDA**|**A**|**D**|**C**|**R**|**HIP**|**A**|**D**|**C**|**R**|**E**|**ROC**|**A**|**D**|**C**|**R**|**E**| |:--|:-:|:-:|:-:|:-:|:--|:-:|:-:|:-:|:-:|:-:|:--|:-:|:-:|:-:|:-:|:-:| -|`cusparseAxpby`|11.0| |12.0| |`hipsparseAxpby`|4.1.0| |6.0.0| | |`rocsparse_axpby`|4.1.0| | | | | +|`cusparseAxpby`|11.0| |12.0| |`hipsparseAxpby`|4.1.0| |6.0.0| | |`rocsparse_axpby`|4.1.0| |6.0.0| | | |`cusparseBlockedEllGet`|11.2| | | |`hipsparseBlockedEllGet`|4.5.0| | | | |`rocsparse_bell_get`|4.1.0| | | | | |`cusparseBsrSetStridedBatch`|12.1| | | | | | | | | | | | | | | | |`cusparseConstBlockedEllGet`|12.0| | | |`hipsparseConstBlockedEllGet`|6.0.0| | | | |`rocsparse_const_bell_get`|6.0.0| | | | | |`cusparseConstCooGet`|12.0| | | |`hipsparseConstCooGet`|6.0.0| | | | |`rocsparse_const_coo_get`|6.0.0| | | | | -|`cusparseConstCscGet`|12.0| | | | | | | | | |`rocsparse_const_csc_get`|6.0.0| | | | | +|`cusparseConstCscGet`|12.0| | | |`hipsparseConstCscGet`|6.1.0| | | |6.1.0|`rocsparse_const_csc_get`|6.0.0| | | | | |`cusparseConstCsrGet`|12.0| | | |`hipsparseConstCsrGet`|6.0.0| | | | |`rocsparse_const_csr_get`|6.0.0| | | | | |`cusparseConstDnMatGet`|12.0| | | |`hipsparseConstDnMatGet`|6.0.0| | | | |`rocsparse_const_dnmat_get`|6.0.0| | | | | |`cusparseConstDnMatGetValues`|12.0| | | |`hipsparseConstDnMatGetValues`|6.0.0| | | | |`rocsparse_const_dnmat_get_values`|6.0.0| | | | | @@ -837,7 +837,7 @@ |`cusparseCreateDnVec`|10.2| | | |`hipsparseCreateDnVec`|4.1.0| | | | |`rocsparse_create_dnvec_descr`|4.1.0| | | | | |`cusparseCreateSlicedEll`|12.1| | | | | | | | | | | | | | | | |`cusparseCreateSpVec`|10.2| | | |`hipsparseCreateSpVec`|4.1.0| | | | |`rocsparse_create_spvec_descr`|4.1.0| | | | | -|`cusparseCscGet`|11.7| | | | | | | | | | | | | | | | +|`cusparseCscGet`|11.7| | | |`hipsparseCscGet`|6.1.0| | | |6.1.0|`rocsparse_csc_get`|6.1.0| | | |6.1.0| 
|`cusparseCscSetPointers`|11.1| | | |`hipsparseCscSetPointers`|4.2.0| | | | |`rocsparse_csc_set_pointers`|4.1.0| | | | | |`cusparseCsrGet`|10.2| | | |`hipsparseCsrGet`|4.1.0| | | | |`rocsparse_csr_get`|4.1.0| | | | | |`cusparseCsrSetPointers`|11.0| | | |`hipsparseCsrSetPointers`|4.1.0| | | | |`rocsparse_csr_set_pointers`|4.1.0| | | | | @@ -857,12 +857,12 @@ |`cusparseDnVecGet`|10.2| | | |`hipsparseDnVecGet`|4.1.0| | | | |`rocsparse_dnvec_get`|4.1.0| | | | | |`cusparseDnVecGetValues`|10.2| | | |`hipsparseDnVecGetValues`|4.1.0| | | | |`rocsparse_dnvec_get_values`|4.1.0| | | | | |`cusparseDnVecSetValues`|10.2| | | |`hipsparseDnVecSetValues`|4.1.0| | | | |`rocsparse_dnvec_set_values`|4.1.0| | | | | -|`cusparseGather`|11.0| |12.0| |`hipsparseGather`|4.1.0| |6.0.0| | |`rocsparse_gather`|4.1.0| | | | | -|`cusparseRot`|11.0|12.2| | |`hipsparseRot`|4.1.0| | | | |`rocsparse_rot`|4.1.0| | | | | -|`cusparseSDDMM`|11.2| |12.0| |`hipsparseSDDMM`|4.3.0| |6.0.0| | |`rocsparse_sddmm`|4.3.0| | | | | -|`cusparseSDDMM_bufferSize`|11.2| |12.0| |`hipsparseSDDMM_bufferSize`|4.3.0| |6.0.0| | |`rocsparse_sddmm_buffer_size`|4.3.0| | | | | -|`cusparseSDDMM_preprocess`|11.2| |12.0| |`hipsparseSDDMM_preprocess`|4.3.0| |6.0.0| | |`rocsparse_sddmm_preprocess`|4.3.0| | | | | -|`cusparseScatter`|11.0| |12.0| |`hipsparseScatter`|4.1.0| |6.0.0| | |`rocsparse_scatter`|4.1.0| | | | | +|`cusparseGather`|11.0| |12.0| |`hipsparseGather`|4.1.0| |6.0.0| | |`rocsparse_gather`|4.1.0| |6.0.0| | | +|`cusparseRot`|11.0|12.2| | |`hipsparseRot`|4.1.0|6.1.0| | | |`rocsparse_rot`|4.1.0| | | | | +|`cusparseSDDMM`|11.2| |12.0| |`hipsparseSDDMM`|4.3.0| |6.0.0| | |`rocsparse_sddmm`|4.3.0| |6.0.0| | | +|`cusparseSDDMM_bufferSize`|11.2| |12.0| |`hipsparseSDDMM_bufferSize`|4.3.0| |6.0.0| | |`rocsparse_sddmm_buffer_size`|4.3.0| |6.0.0| | | +|`cusparseSDDMM_preprocess`|11.2| |12.0| |`hipsparseSDDMM_preprocess`|4.3.0| |6.0.0| | |`rocsparse_sddmm_preprocess`|4.3.0| |6.0.0| | | +|`cusparseScatter`|11.0| |12.0| 
|`hipsparseScatter`|4.1.0| |6.0.0| | |`rocsparse_scatter`|4.1.0| |6.0.0| | | |`cusparseSpGEMM_compute`|11.0| |12.0| |`hipsparseSpGEMM_compute`|4.1.0| |6.0.0| | | | | | | | | |`cusparseSpGEMM_copy`|11.0| |12.0| |`hipsparseSpGEMM_copy`|4.1.0| |6.0.0| | | | | | | | | |`cusparseSpGEMM_createDescr`|11.0| | | |`hipsparseSpGEMM_createDescr`|4.1.0| | | | | | | | | | | @@ -874,14 +874,14 @@ |`cusparseSpGEMMreuse_copy`|11.3| |12.0| |`hipsparseSpGEMMreuse_copy`|5.1.0| |6.0.0| | | | | | | | | |`cusparseSpGEMMreuse_nnz`|11.3| |12.0| |`hipsparseSpGEMMreuse_nnz`|5.1.0| |6.0.0| | | | | | | | | |`cusparseSpGEMMreuse_workEstimation`|11.3| |12.0| |`hipsparseSpGEMMreuse_workEstimation`|5.1.0| |6.0.0| | | | | | | | | -|`cusparseSpMM`|10.1| |12.0| |`hipsparseSpMM`|4.2.0| |6.0.0| | | | | | | | | +|`cusparseSpMM`|10.1| |12.0| |`hipsparseSpMM`|4.2.0| |6.0.0| | |`rocsparse_spmm`|4.2.0| |6.0.0| | | |`cusparseSpMMOp`|11.5| | | | | | | | | | | | | | | | |`cusparseSpMMOp_createPlan`|11.5| | | | | | | | | | | | | | | | |`cusparseSpMMOp_destroyPlan`|11.5| | | | | | | | | | | | | | | | |`cusparseSpMM_bufferSize`|10.1| |12.0| |`hipsparseSpMM_bufferSize`|4.2.0| |6.0.0| | |`rocsparse_spmm`|4.2.0| |6.0.0| | | -|`cusparseSpMM_preprocess`|11.2| |12.0| |`hipsparseSpMM_preprocess`|4.5.0| |6.0.0| | | | | | | | | -|`cusparseSpMV`|10.2| |12.0| |`hipsparseSpMV`|4.1.0| |6.0.0| | |`rocsparse_spmv`|4.1.0| | | | | -|`cusparseSpMV_bufferSize`|10.2| |12.0| |`hipsparseSpMV_bufferSize`|4.1.0| |6.0.0| | | | | | | | | +|`cusparseSpMM_preprocess`|11.2| |12.0| |`hipsparseSpMM_preprocess`|4.5.0| |6.0.0| | |`rocsparse_spmm`|4.2.0| |6.0.0| | | +|`cusparseSpMV`|10.1| |12.0| |`hipsparseSpMV`|4.1.0| |6.0.0| | |`rocsparse_spmv`|4.1.0| |6.0.0| | | +|`cusparseSpMV_bufferSize`|10.1| |12.0| |`hipsparseSpMV_bufferSize`|4.1.0| |6.0.0| | |`rocsparse_spmv`|4.1.0| |6.0.0| | | |`cusparseSpMatGetAttribute`|11.3| |12.0| |`hipsparseSpMatGetAttribute`|4.5.0| |6.0.0| | |`rocsparse_spmat_get_attribute`|4.5.0| |6.0.0| | | 
|`cusparseSpMatGetFormat`|10.1| |12.0| |`hipsparseSpMatGetFormat`|4.1.0| |6.0.0| | |`rocsparse_spmat_get_format`|4.1.0| |6.0.0| | | |`cusparseSpMatGetIndexBase`|10.1| |12.0| |`hipsparseSpMatGetIndexBase`|4.1.0| |6.0.0| | |`rocsparse_spmat_get_index_base`|4.1.0| |6.0.0| | | @@ -899,13 +899,13 @@ |`cusparseSpSM_destroyDescr`|11.3| | | |`hipsparseSpSM_destroyDescr`|4.5.0| | | | | | | | | | | |`cusparseSpSM_solve`|11.3| |12.0| |`hipsparseSpSM_solve`|4.5.0| |6.0.0| | |`rocsparse_spsm`|4.5.0| |6.0.0| | | |`cusparseSpSV_analysis`|11.3| |12.0| |`hipsparseSpSV_analysis`|4.5.0| |6.0.0| | | | | | | | | -|`cusparseSpSV_bufferSize`|11.3| |12.0| |`hipsparseSpSV_bufferSize`|4.5.0| |6.0.0| | | | | | | | | +|`cusparseSpSV_bufferSize`|11.3| |12.0| |`hipsparseSpSV_bufferSize`|4.5.0| |6.0.0| | |`rocsparse_spsv`|4.5.0| |6.0.0| | | |`cusparseSpSV_createDescr`|11.3| | | |`hipsparseSpSV_createDescr`|4.5.0| | | | | | | | | | | |`cusparseSpSV_destroyDescr`|11.3| | | |`hipsparseSpSV_destroyDescr`|4.5.0| | | | | | | | | | | |`cusparseSpSV_solve`|11.3| |12.0| |`hipsparseSpSV_solve`|4.5.0| |6.0.0| | | | | | | | | |`cusparseSpSV_updateMatrix`|12.1| | | | | | | | | | | | | | | | -|`cusparseSpVV`|10.2| |12.0| |`hipsparseSpVV`|4.1.0| |6.0.0| | | | | | | | | -|`cusparseSpVV_bufferSize`|10.2| |12.0| |`hipsparseSpVV_bufferSize`|4.1.0| |6.0.0| | | | | | | | | +|`cusparseSpVV`|10.1| |12.0| |`hipsparseSpVV`|4.1.0| |6.0.0| | |`rocsparse_spvv`|4.1.0| |6.0.0| | | +|`cusparseSpVV_bufferSize`|10.1| |12.0| |`hipsparseSpVV_bufferSize`|4.1.0| |6.0.0| | |`rocsparse_spvv`|4.1.0| |6.0.0| | | |`cusparseSpVecGet`|10.2| | | |`hipsparseSpVecGet`|4.1.0| | | | |`rocsparse_spvec_get`|4.1.0| | | | | |`cusparseSpVecGetIndexBase`|10.2| |12.0| |`hipsparseSpVecGetIndexBase`|4.1.0| |6.0.0| | |`rocsparse_spvec_get_index_base`|4.1.0| |6.0.0| | | |`cusparseSpVecGetValues`|10.2| | | |`hipsparseSpVecGetValues`|4.1.0| | | | |`rocsparse_spvec_get_values`|4.1.0| | | | | diff --git a/docs/tables/CUSPARSE_API_supported_by_ROC.md 
b/docs/tables/CUSPARSE_API_supported_by_ROC.md index 26b4bbdd..4b273ca8 100644 --- a/docs/tables/CUSPARSE_API_supported_by_ROC.md +++ b/docs/tables/CUSPARSE_API_supported_by_ROC.md @@ -798,7 +798,7 @@ |**CUDA**|**A**|**D**|**C**|**R**|**ROC**|**A**|**D**|**C**|**R**|**E**| |:--|:-:|:-:|:-:|:-:|:--|:-:|:-:|:-:|:-:|:-:| -|`cusparseAxpby`|11.0| |12.0| |`rocsparse_axpby`|4.1.0| | | | | +|`cusparseAxpby`|11.0| |12.0| |`rocsparse_axpby`|4.1.0| |6.0.0| | | |`cusparseBlockedEllGet`|11.2| | | |`rocsparse_bell_get`|4.1.0| | | | | |`cusparseBsrSetStridedBatch`|12.1| | | | | | | | | | |`cusparseConstBlockedEllGet`|12.0| | | |`rocsparse_const_bell_get`|6.0.0| | | | | @@ -837,7 +837,7 @@ |`cusparseCreateDnVec`|10.2| | | |`rocsparse_create_dnvec_descr`|4.1.0| | | | | |`cusparseCreateSlicedEll`|12.1| | | | | | | | | | |`cusparseCreateSpVec`|10.2| | | |`rocsparse_create_spvec_descr`|4.1.0| | | | | -|`cusparseCscGet`|11.7| | | | | | | | | | +|`cusparseCscGet`|11.7| | | |`rocsparse_csc_get`|6.1.0| | | |6.1.0| |`cusparseCscSetPointers`|11.1| | | |`rocsparse_csc_set_pointers`|4.1.0| | | | | |`cusparseCsrGet`|10.2| | | |`rocsparse_csr_get`|4.1.0| | | | | |`cusparseCsrSetPointers`|11.0| | | |`rocsparse_csr_set_pointers`|4.1.0| | | | | @@ -857,12 +857,12 @@ |`cusparseDnVecGet`|10.2| | | |`rocsparse_dnvec_get`|4.1.0| | | | | |`cusparseDnVecGetValues`|10.2| | | |`rocsparse_dnvec_get_values`|4.1.0| | | | | |`cusparseDnVecSetValues`|10.2| | | |`rocsparse_dnvec_set_values`|4.1.0| | | | | -|`cusparseGather`|11.0| |12.0| |`rocsparse_gather`|4.1.0| | | | | +|`cusparseGather`|11.0| |12.0| |`rocsparse_gather`|4.1.0| |6.0.0| | | |`cusparseRot`|11.0|12.2| | |`rocsparse_rot`|4.1.0| | | | | -|`cusparseSDDMM`|11.2| |12.0| |`rocsparse_sddmm`|4.3.0| | | | | -|`cusparseSDDMM_bufferSize`|11.2| |12.0| |`rocsparse_sddmm_buffer_size`|4.3.0| | | | | -|`cusparseSDDMM_preprocess`|11.2| |12.0| |`rocsparse_sddmm_preprocess`|4.3.0| | | | | -|`cusparseScatter`|11.0| |12.0| |`rocsparse_scatter`|4.1.0| | | | | 
+|`cusparseSDDMM`|11.2| |12.0| |`rocsparse_sddmm`|4.3.0| |6.0.0| | | +|`cusparseSDDMM_bufferSize`|11.2| |12.0| |`rocsparse_sddmm_buffer_size`|4.3.0| |6.0.0| | | +|`cusparseSDDMM_preprocess`|11.2| |12.0| |`rocsparse_sddmm_preprocess`|4.3.0| |6.0.0| | | +|`cusparseScatter`|11.0| |12.0| |`rocsparse_scatter`|4.1.0| |6.0.0| | | |`cusparseSpGEMM_compute`|11.0| |12.0| | | | | | | | |`cusparseSpGEMM_copy`|11.0| |12.0| | | | | | | | |`cusparseSpGEMM_createDescr`|11.0| | | | | | | | | | @@ -874,14 +874,14 @@ |`cusparseSpGEMMreuse_copy`|11.3| |12.0| | | | | | | | |`cusparseSpGEMMreuse_nnz`|11.3| |12.0| | | | | | | | |`cusparseSpGEMMreuse_workEstimation`|11.3| |12.0| | | | | | | | -|`cusparseSpMM`|10.1| |12.0| | | | | | | | +|`cusparseSpMM`|10.1| |12.0| |`rocsparse_spmm`|4.2.0| |6.0.0| | | |`cusparseSpMMOp`|11.5| | | | | | | | | | |`cusparseSpMMOp_createPlan`|11.5| | | | | | | | | | |`cusparseSpMMOp_destroyPlan`|11.5| | | | | | | | | | |`cusparseSpMM_bufferSize`|10.1| |12.0| |`rocsparse_spmm`|4.2.0| |6.0.0| | | -|`cusparseSpMM_preprocess`|11.2| |12.0| | | | | | | | -|`cusparseSpMV`|10.2| |12.0| |`rocsparse_spmv`|4.1.0| | | | | -|`cusparseSpMV_bufferSize`|10.2| |12.0| | | | | | | | +|`cusparseSpMM_preprocess`|11.2| |12.0| |`rocsparse_spmm`|4.2.0| |6.0.0| | | +|`cusparseSpMV`|10.1| |12.0| |`rocsparse_spmv`|4.1.0| |6.0.0| | | +|`cusparseSpMV_bufferSize`|10.1| |12.0| |`rocsparse_spmv`|4.1.0| |6.0.0| | | |`cusparseSpMatGetAttribute`|11.3| |12.0| |`rocsparse_spmat_get_attribute`|4.5.0| |6.0.0| | | |`cusparseSpMatGetFormat`|10.1| |12.0| |`rocsparse_spmat_get_format`|4.1.0| |6.0.0| | | |`cusparseSpMatGetIndexBase`|10.1| |12.0| |`rocsparse_spmat_get_index_base`|4.1.0| |6.0.0| | | @@ -899,13 +899,13 @@ |`cusparseSpSM_destroyDescr`|11.3| | | | | | | | | | |`cusparseSpSM_solve`|11.3| |12.0| |`rocsparse_spsm`|4.5.0| |6.0.0| | | |`cusparseSpSV_analysis`|11.3| |12.0| | | | | | | | -|`cusparseSpSV_bufferSize`|11.3| |12.0| | | | | | | | +|`cusparseSpSV_bufferSize`|11.3| |12.0| 
|`rocsparse_spsv`|4.5.0| |6.0.0| | | |`cusparseSpSV_createDescr`|11.3| | | | | | | | | | |`cusparseSpSV_destroyDescr`|11.3| | | | | | | | | | |`cusparseSpSV_solve`|11.3| |12.0| | | | | | | | |`cusparseSpSV_updateMatrix`|12.1| | | | | | | | | | -|`cusparseSpVV`|10.2| |12.0| | | | | | | | -|`cusparseSpVV_bufferSize`|10.2| |12.0| | | | | | | | +|`cusparseSpVV`|10.1| |12.0| |`rocsparse_spvv`|4.1.0| |6.0.0| | | +|`cusparseSpVV_bufferSize`|10.1| |12.0| |`rocsparse_spvv`|4.1.0| |6.0.0| | | |`cusparseSpVecGet`|10.2| | | |`rocsparse_spvec_get`|4.1.0| | | | | |`cusparseSpVecGetIndexBase`|10.2| |12.0| |`rocsparse_spvec_get_index_base`|4.1.0| |6.0.0| | | |`cusparseSpVecGetValues`|10.2| | | |`rocsparse_spvec_get_values`|4.1.0| | | | | diff --git a/src/ArgParse.cpp b/src/ArgParse.cpp index 847604ca..78e06894 100644 --- a/src/ArgParse.cpp +++ b/src/ArgParse.cpp @@ -247,6 +247,7 @@ const std::vector hipifyOptions { std::string(Versions.ArgStr), std::string(NoUndocumented.ArgStr), std::string(NoWarningsUndocumented.ArgStr), + std::string(HipifyAMAP.ArgStr), }; const std::vector hipifyOptionsWithTwoArgs { diff --git a/src/CUDA2HIP_Driver_API_functions.cpp b/src/CUDA2HIP_Driver_API_functions.cpp index 70181fe2..da31fbda 100644 --- a/src/CUDA2HIP_Driver_API_functions.cpp +++ b/src/CUDA2HIP_Driver_API_functions.cpp @@ -641,10 +641,7 @@ const std::map CUDA_DRIVER_FUNCTION_MAP { // RUNTIME: cudaError_t CUDARTAPI cudaGraphAddMemcpyNode(cudaGraphNode_t *pGraphNode, cudaGraph_t graph, const cudaGraphNode_t *pDependencies, size_t numDependencies, const struct cudaMemcpy3DParms *pCopyParams); {"cuGraphAddMemcpyNode", {"hipDrvGraphAddMemcpyNode", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH}}, // no analogue - // NOTE: Not equal to cudaGraphAddMemsetNode due to different signatures: - // DRIVER: CUresult CUDAAPI cuGraphAddMemsetNode(CUgraphNode *phGraphNode, CUgraph hGraph, const CUgraphNode *dependencies, size_t numDependencies, const CUDA_MEMSET_NODE_PARAMS *memsetParams, CUcontext ctx); - // 
RUNTIME: cudaError_t CUDARTAPI cudaGraphAddMemcpyNode(cudaGraphNode_t *pGraphNode, cudaGraph_t graph, const cudaGraphNode_t *pDependencies, size_t numDependencies, const struct cudaMemcpy3DParms *pCopyParams); - {"cuGraphAddMemsetNode", {"hipGraphAddMemsetNode", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH}}, + {"cuGraphAddMemsetNode", {"hipDrvGraphAddMemsetNode", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH, HIP_EXPERIMENTAL}}, // cudaGraphChildGraphNodeGetGraph {"cuGraphChildGraphNodeGetGraph", {"hipGraphChildGraphNodeGetGraph", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH}}, // cudaGraphClone @@ -688,10 +685,10 @@ const std::map CUDA_DRIVER_FUNCTION_MAP { {"cuGraphKernelNodeSetParams", {"hipGraphKernelNodeSetParams", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH}}, // cudaGraphLaunch {"cuGraphLaunch", {"hipGraphLaunch", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH}}, - // cudaGraphMemcpyNodeGetParams - {"cuGraphMemcpyNodeGetParams", {"hipGraphMemcpyNodeGetParams", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH}}, - // cudaGraphMemcpyNodeSetParams - {"cuGraphMemcpyNodeSetParams", {"hipGraphMemcpyNodeSetParams", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH}}, + // cudaGraphMemcpyNodeGetParams (?) + {"cuGraphMemcpyNodeGetParams", {"hipDrvGraphMemcpyNodeGetParams", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH, HIP_EXPERIMENTAL}}, + // cudaGraphMemcpyNodeSetParams (?) 
+ {"cuGraphMemcpyNodeSetParams", {"hipDrvGraphMemcpyNodeSetParams", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH, HIP_EXPERIMENTAL}}, // cudaGraphMemsetNodeGetParams {"cuGraphMemsetNodeGetParams", {"hipGraphMemsetNodeGetParams", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH}}, // cudaGraphMemsetNodeSetParams @@ -717,18 +714,12 @@ const std::map CUDA_DRIVER_FUNCTION_MAP { // cudaGraphRemoveDependencies_v2 {"cuGraphRemoveDependencies_v2", {"hipGraphRemoveDependencies_v2", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH, HIP_UNSUPPORTED}}, // no analogue - // NOTE: Not equal to cudaGraphExecMemcpyNodeSetParams due to different signatures: - // DRIVER: CUresult CUDAAPI cuGraphExecMemcpyNodeSetParams(CUgraphExec hGraphExec, CUgraphNode hNode, const CUDA_MEMCPY3D *copyParams, CUcontext ctx); - // RUNTIME: cudaError_t CUDARTAPI cudaGraphExecMemcpyNodeSetParams(cudaGraphExec_t hGraphExec, cudaGraphNode_t node, const struct cudaMemcpy3DParms *pNodeParams); - {"cuGraphExecMemcpyNodeSetParams", {"hipGraphExecMemcpyNodeSetParams", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH, HIP_UNSUPPORTED}}, + {"cuGraphExecMemcpyNodeSetParams", {"hipDrvGraphExecMemcpyNodeSetParams", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH, HIP_EXPERIMENTAL}}, // no analogue - // NOTE: Not equal to cudaGraphExecMemcpyNodeSetParams due to different signatures: - // DRIVER: CUresult CUDAAPI cuGraphExecMemsetNodeSetParams(CUgraphExec hGraphExec, CUgraphNode hNode, const CUDA_MEMSET_NODE_PARAMS *memsetParams, CUcontext ctx); - // RUNTIME: cudaError_t CUDARTAPI cudaGraphExecMemsetNodeSetParams(cudaGraphExec_t hGraphExec, cudaGraphNode_t node, const struct cudaMemsetParams *pNodeParams); - {"cuGraphExecMemsetNodeSetParams", {"hipGraphExecMemsetNodeSetParams", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH, HIP_UNSUPPORTED}}, + {"cuGraphExecMemsetNodeSetParams", {"hipDrvGraphExecMemsetNodeSetParams", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH, HIP_EXPERIMENTAL}}, // cudaGraphExecHostNodeSetParams {"cuGraphExecHostNodeSetParams", 
{"hipGraphExecHostNodeSetParams", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH}}, - // TODO: take into account the new signature since 12.0 + // TODO: take into account the new signature since 12.0 // cudaGraphExecUpdate {"cuGraphExecUpdate", {"hipGraphExecUpdate", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH}}, // cudaGraphAddEventRecordNode @@ -752,21 +743,21 @@ const std::map CUDA_DRIVER_FUNCTION_MAP { // cudaGraphUpload {"cuGraphUpload", {"hipGraphUpload", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH}}, // cudaGraphAddExternalSemaphoresSignalNode - {"cuGraphAddExternalSemaphoresSignalNode", {"hipGraphAddExternalSemaphoresSignalNode", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH}}, + {"cuGraphAddExternalSemaphoresSignalNode", {"hipGraphAddExternalSemaphoresSignalNode", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH, HIP_EXPERIMENTAL}}, // cudaGraphExternalSemaphoresSignalNodeGetParams - {"cuGraphExternalSemaphoresSignalNodeGetParams", {"hipGraphExternalSemaphoresSignalNodeGetParams", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH}}, + {"cuGraphExternalSemaphoresSignalNodeGetParams", {"hipGraphExternalSemaphoresSignalNodeGetParams", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH, HIP_EXPERIMENTAL}}, // cudaGraphExternalSemaphoresSignalNodeSetParams - {"cuGraphExternalSemaphoresSignalNodeSetParams", {"hipGraphExternalSemaphoresSignalNodeSetParams", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH}}, + {"cuGraphExternalSemaphoresSignalNodeSetParams", {"hipGraphExternalSemaphoresSignalNodeSetParams", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH, HIP_EXPERIMENTAL}}, // cudaGraphAddExternalSemaphoresWaitNode - {"cuGraphAddExternalSemaphoresWaitNode", {"hipGraphAddExternalSemaphoresWaitNode", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH}}, + {"cuGraphAddExternalSemaphoresWaitNode", {"hipGraphAddExternalSemaphoresWaitNode", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH, HIP_EXPERIMENTAL}}, // cudaGraphExternalSemaphoresWaitNodeGetParams - {"cuGraphExternalSemaphoresWaitNodeGetParams", {"hipGraphExternalSemaphoresWaitNodeGetParams", "", 
CONV_GRAPH, API_DRIVER, SEC::GRAPH}}, + {"cuGraphExternalSemaphoresWaitNodeGetParams", {"hipGraphExternalSemaphoresWaitNodeGetParams", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH, HIP_EXPERIMENTAL}}, // cudaGraphExternalSemaphoresWaitNodeSetParams - {"cuGraphExternalSemaphoresWaitNodeSetParams", {"hipGraphExternalSemaphoresWaitNodeSetParams", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH}}, + {"cuGraphExternalSemaphoresWaitNodeSetParams", {"hipGraphExternalSemaphoresWaitNodeSetParams", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH, HIP_EXPERIMENTAL}}, // cudaGraphExecExternalSemaphoresSignalNodeSetParams - {"cuGraphExecExternalSemaphoresSignalNodeSetParams", {"hipGraphExecExternalSemaphoresSignalNodeSetParams", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH}}, + {"cuGraphExecExternalSemaphoresSignalNodeSetParams", {"hipGraphExecExternalSemaphoresSignalNodeSetParams", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH, HIP_EXPERIMENTAL}}, // cudaGraphExecExternalSemaphoresWaitNodeSetParams - {"cuGraphExecExternalSemaphoresWaitNodeSetParams", {"hipGraphExecExternalSemaphoresWaitNodeSetParams", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH}}, + {"cuGraphExecExternalSemaphoresWaitNodeSetParams", {"hipGraphExecExternalSemaphoresWaitNodeSetParams", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH, HIP_EXPERIMENTAL}}, // cudaUserObjectCreate {"cuUserObjectCreate", {"hipUserObjectCreate", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH}}, // cudaUserObjectRetain @@ -781,8 +772,8 @@ const std::map CUDA_DRIVER_FUNCTION_MAP { {"cuGraphAddMemAllocNode", {"hipGraphAddMemAllocNode", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH}}, // cudaGraphMemAllocNodeGetParams {"cuGraphMemAllocNodeGetParams", {"hipGraphMemAllocNodeGetParams", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH}}, - // cudaGraphAddMemFreeNode - {"cuGraphAddMemFreeNode", {"hipGraphAddMemFreeNode", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH}}, + // no analogue + {"cuGraphAddMemFreeNode", {"hipDrvGraphAddMemFreeNode", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH, HIP_EXPERIMENTAL}}, // 
cudaGraphMemFreeNodeGetParams {"cuGraphMemFreeNodeGetParams", {"hipGraphMemFreeNodeGetParams", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH}}, // cudaDeviceGraphMemTrim @@ -802,17 +793,17 @@ const std::map CUDA_DRIVER_FUNCTION_MAP { // {"cuGraphExecBatchMemOpNodeSetParams", {"hipGraphExecBatchMemOpNodeSetParams", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH}}, // cudaGraphInstantiateWithParams - {"cuGraphInstantiateWithParams", {"hipGraphInstantiateWithParams", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH}}, + {"cuGraphInstantiateWithParams", {"hipGraphInstantiateWithParams", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH, HIP_EXPERIMENTAL}}, // cudaGraphExecGetFlags - {"cuGraphExecGetFlags", {"hipGraphExecGetFlags", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH}}, + {"cuGraphExecGetFlags", {"hipGraphExecGetFlags", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH, HIP_EXPERIMENTAL}}, // cudaGraphAddNode - {"cuGraphAddNode", {"hipGraphAddNode", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH}}, + {"cuGraphAddNode", {"hipGraphAddNode", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH, HIP_EXPERIMENTAL}}, // cudaGraphAddNode_v2 {"cuGraphAddNode_v2", {"hipGraphAddNode_v2", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH, HIP_UNSUPPORTED}}, // cudaGraphNodeSetParams - {"cuGraphNodeSetParams", {"hipGraphNodeSetParams", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH}}, + {"cuGraphNodeSetParams", {"hipGraphNodeSetParams", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH, HIP_EXPERIMENTAL}}, // cudaGraphExecNodeSetParams - {"cuGraphExecNodeSetParams", {"hipGraphExecNodeSetParams", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH}}, + {"cuGraphExecNodeSetParams", {"hipGraphExecNodeSetParams", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH, HIP_EXPERIMENTAL}}, // cudaGraphConditionalHandleCreate {"cuGraphConditionalHandleCreate", {"hipGraphConditionalHandleCreate", "", CONV_GRAPH, API_DRIVER, SEC::GRAPH, HIP_UNSUPPORTED}}, @@ -939,7 +930,7 @@ const std::map CUDA_DRIVER_FUNCTION_MAP { // 33. 
Driver Entry Point Access // cudaGetDriverEntryPoint - {"cuGetProcAddress", {"hipGetProcAddress", "", CONV_DRIVER_ENTRY_POINT, API_DRIVER, SEC::DRIVER_ENTRY_POINT, HIP_UNSUPPORTED}}, + {"cuGetProcAddress", {"hipGetProcAddress", "", CONV_DRIVER_ENTRY_POINT, API_DRIVER, SEC::DRIVER_ENTRY_POINT, HIP_EXPERIMENTAL}}, // 34. Coredump Attributes Control API // @@ -1583,6 +1574,13 @@ const std::map HIP_DRIVER_FUNCTION_VER_MAP { {"hipArrayGetDescriptor", {HIP_5060, HIP_0, HIP_0 }}, {"hipArray3DGetDescriptor", {HIP_5060, HIP_0, HIP_0 }}, {"hipDrvGraphAddMemcpyNode", {HIP_6000, HIP_0, HIP_0, }}, + {"hipGetProcAddress", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, + {"hipDrvGraphMemcpyNodeGetParams", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, + {"hipDrvGraphMemcpyNodeSetParams", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, + {"hipDrvGraphAddMemsetNode", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, + {"hipDrvGraphAddMemFreeNode", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, + {"hipDrvGraphExecMemcpyNodeSetParams", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, + {"hipDrvGraphExecMemsetNodeSetParams", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, }; const std::map CUDA_DRIVER_API_SECTION_MAP { diff --git a/src/CUDA2HIP_Driver_API_types.cpp b/src/CUDA2HIP_Driver_API_types.cpp index b12c79e8..88f8b9d8 100644 --- a/src/CUDA2HIP_Driver_API_types.cpp +++ b/src/CUDA2HIP_Driver_API_types.cpp @@ -110,9 +110,9 @@ const std::map CUDA_DRIVER_TYPE_NAME_MAP { {"CUDA_MEMCPY3D_PEER", {"hip_Memcpy3D_Peer", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, {"CUDA_MEMCPY3D_PEER_v1", {"hip_Memcpy3D_Peer", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, - {"CUDA_MEMCPY_NODE_PARAMS_st", {"hiMemcpyNodeParams", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, + {"CUDA_MEMCPY_NODE_PARAMS_st", {"hipMemcpyNodeParams", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // cudaMemcpyNodeParams - {"CUDA_MEMCPY_NODE_PARAMS", {"hiMemcpyNodeParams", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, 
HIP_UNSUPPORTED}}, + {"CUDA_MEMCPY_NODE_PARAMS", {"hipMemcpyNodeParams", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, {"CUDA_MEMSET_NODE_PARAMS_st", {"hipMemsetParams", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES}}, // cudaMemsetParams @@ -328,24 +328,24 @@ const std::map CUDA_DRIVER_TYPE_NAME_MAP { {"CUDA_MEM_ALLOC_NODE_PARAMS_v2", {"hipMemAllocNodeParams_v2", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, // cudaMemFreeNodeParams - {"CUDA_MEM_FREE_NODE_PARAMS_st", {"hipMemFreeNodeParams", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, - {"CUDA_MEM_FREE_NODE_PARAMS", {"hipMemFreeNodeParams", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, + {"CUDA_MEM_FREE_NODE_PARAMS_st", {"hipMemFreeNodeParams", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, + {"CUDA_MEM_FREE_NODE_PARAMS", {"hipMemFreeNodeParams", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // cudaChildGraphNodeParams - {"CUDA_CHILD_GRAPH_NODE_PARAMS_st", {"hipChildGraphNodeParams", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, - {"CUDA_CHILD_GRAPH_NODE_PARAMS", {"hipChildGraphNodeParams", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, + {"CUDA_CHILD_GRAPH_NODE_PARAMS_st", {"hipChildGraphNodeParams", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, + {"CUDA_CHILD_GRAPH_NODE_PARAMS", {"hipChildGraphNodeParams", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // cudaEventRecordNodeParams - {"CUDA_EVENT_RECORD_NODE_PARAMS_st", {"hipEventRecordNodeParams", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, - {"CUDA_EVENT_RECORD_NODE_PARAMS", {"hipEventRecordNodeParams", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, + {"CUDA_EVENT_RECORD_NODE_PARAMS_st", {"hipEventRecordNodeParams", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, + {"CUDA_EVENT_RECORD_NODE_PARAMS", {"hipEventRecordNodeParams", "", CONV_TYPE, 
API_DRIVER, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // cudaEventWaitNodeParams - {"CUDA_EVENT_WAIT_NODE_PARAMS_st", {"hipEventWaitNodeParams", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, - {"CUDA_EVENT_WAIT_NODE_PARAMS", {"hipEventWaitNodeParams", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, + {"CUDA_EVENT_WAIT_NODE_PARAMS_st", {"hipEventWaitNodeParams", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, + {"CUDA_EVENT_WAIT_NODE_PARAMS", {"hipEventWaitNodeParams", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // cudaGraphNodeParams - {"CUgraphNodeParams_st", {"hipGraphNodeParams", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, - {"CUgraphNodeParams", {"hipGraphNodeParams", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, + {"CUgraphNodeParams_st", {"hipGraphNodeParams", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, + {"CUgraphNodeParams", {"hipGraphNodeParams", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // cudaArrayMemoryRequirements {"CUDA_ARRAY_MEMORY_REQUIREMENTS_st", {"hipArrayMemoryRequirements", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, @@ -385,9 +385,9 @@ const std::map CUDA_DRIVER_TYPE_NAME_MAP { {"CUkernel", {"hipKernel", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, // cudaGraphInstantiateParams_st - {"CUDA_GRAPH_INSTANTIATE_PARAMS_st", {"HIP_GRAPH_INSTANTIATE_PARAMS", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, + {"CUDA_GRAPH_INSTANTIATE_PARAMS_st", {"hipGraphInstantiateParams", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // cudaGraphInstantiateParams - {"CUDA_GRAPH_INSTANTIATE_PARAMS", {"HIP_GRAPH_INSTANTIATE_PARAMS", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, + {"CUDA_GRAPH_INSTANTIATE_PARAMS", {"hipGraphInstantiateParams", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // cudaLaunchMemSyncDomainMap_st 
{"CUlaunchMemSyncDomainMap_st", {"hipLaunchMemSyncDomainMap", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, @@ -2196,24 +2196,24 @@ const std::map CUDA_DRIVER_TYPE_NAME_MAP { {"CU_GET_PROC_ADDRESS_PER_THREAD_DEFAULT_STREAM", {"hipEnablePerThreadDefaultStream", "", CONV_NUMERIC_LITERAL, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, // 1 << 1 // cudaFlushGPUDirectRDMAWritesOptions - {"CUflushGPUDirectRDMAWritesOptions", {"hipFlushGPUDirectRDMAWritesOptions", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, - {"CUflushGPUDirectRDMAWritesOptions_enum", {"hipFlushGPUDirectRDMAWritesOptions", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, + {"CUflushGPUDirectRDMAWritesOptions", {"hipFlushGPUDirectRDMAWritesOptions", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, + {"CUflushGPUDirectRDMAWritesOptions_enum", {"hipFlushGPUDirectRDMAWritesOptions", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // CUflushGPUDirectRDMAWritesOptions enum values // cudaFlushGPUDirectRDMAWritesOptionHost - {"CU_FLUSH_GPU_DIRECT_RDMA_WRITES_OPTION_HOST", {"hipFlushGPUDirectRDMAWritesOptionHost", "", CONV_NUMERIC_LITERAL, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, // 1<<0 + {"CU_FLUSH_GPU_DIRECT_RDMA_WRITES_OPTION_HOST", {"hipFlushGPUDirectRDMAWritesOptionHost", "", CONV_NUMERIC_LITERAL, API_DRIVER, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // 1<<0 // cudaFlushGPUDirectRDMAWritesOptionMemOps - {"CU_FLUSH_GPU_DIRECT_RDMA_WRITES_OPTION_MEMOPS", {"hipFlushGPUDirectRDMAWritesOptionMemOps", "", CONV_NUMERIC_LITERAL, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, // 1<<1 + {"CU_FLUSH_GPU_DIRECT_RDMA_WRITES_OPTION_MEMOPS", {"hipFlushGPUDirectRDMAWritesOptionMemOps", "", CONV_NUMERIC_LITERAL, API_DRIVER, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // 1<<1 // cudaGPUDirectRDMAWritesOrdering - {"CUGPUDirectRDMAWritesOrdering", {"hipGPUDirectRDMAWritesOrdering", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, - 
{"CUGPUDirectRDMAWritesOrdering_enum", {"hipGPUDirectRDMAWritesOrdering", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, + {"CUGPUDirectRDMAWritesOrdering", {"hipGPUDirectRDMAWritesOrdering", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, + {"CUGPUDirectRDMAWritesOrdering_enum", {"hipGPUDirectRDMAWritesOrdering", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // CUGPUDirectRDMAWritesOrdering enum values // cudaGPUDirectRDMAWritesOrderingNone - {"CU_GPU_DIRECT_RDMA_WRITES_ORDERING_NONE", {"hipGPUDirectRDMAWritesOrderingNone", "", CONV_NUMERIC_LITERAL, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, // 0 + {"CU_GPU_DIRECT_RDMA_WRITES_ORDERING_NONE", {"hipGPUDirectRDMAWritesOrderingNone", "", CONV_NUMERIC_LITERAL, API_DRIVER, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // 0 // cudaGPUDirectRDMAWritesOrderingOwner - {"CU_GPU_DIRECT_RDMA_WRITES_ORDERING_OWNER", {"hipGPUDirectRDMAWritesOrderingOwner", "", CONV_NUMERIC_LITERAL, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, // 100 + {"CU_GPU_DIRECT_RDMA_WRITES_ORDERING_OWNER", {"hipGPUDirectRDMAWritesOrderingOwner", "", CONV_NUMERIC_LITERAL, API_DRIVER, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // 100 // cudaGPUDirectRDMAWritesOrderingAllDevices - {"CU_GPU_DIRECT_RDMA_WRITES_ORDERING_ALL_DEVICES", {"hipGPUDirectRDMAWritesOrderingAllDevices", "", CONV_NUMERIC_LITERAL, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, // 200 + {"CU_GPU_DIRECT_RDMA_WRITES_ORDERING_ALL_DEVICES", {"hipGPUDirectRDMAWritesOrderingAllDevices", "", CONV_NUMERIC_LITERAL, API_DRIVER, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // 200 // cudaFlushGPUDirectRDMAWritesScope {"CUflushGPUDirectRDMAWritesScope", {"hipFlushGPUDirectRDMAWritesScope", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, @@ -2418,19 +2418,19 @@ const std::map CUDA_DRIVER_TYPE_NAME_MAP { {"CU_LAUNCH_ATTRIBUTE_MAX", {"hipLaunchAttributeMax", "", CONV_NUMERIC_LITERAL, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, // 
cudaGraphInstantiateResult - {"CUgraphInstantiateResult", {"hipGraphInstantiateResult", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, - {"CUgraphInstantiateResult_enum", {"hipGraphInstantiateResult", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, + {"CUgraphInstantiateResult", {"hipGraphInstantiateResult", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, + {"CUgraphInstantiateResult_enum", {"hipGraphInstantiateResult", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // CUgraphInstantiateResult enum values // cudaGraphInstantiateSuccess - {"CUDA_GRAPH_INSTANTIATE_SUCCESS", {"hipGraphInstantiateSuccess", "", CONV_NUMERIC_LITERAL, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, + {"CUDA_GRAPH_INSTANTIATE_SUCCESS", {"hipGraphInstantiateSuccess", "", CONV_NUMERIC_LITERAL, API_DRIVER, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // cudaGraphInstantiateError - {"CUDA_GRAPH_INSTANTIATE_ERROR", {"hipGraphInstantiateError", "", CONV_NUMERIC_LITERAL, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, + {"CUDA_GRAPH_INSTANTIATE_ERROR", {"hipGraphInstantiateError", "", CONV_NUMERIC_LITERAL, API_DRIVER, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // cudaGraphInstantiateInvalidStructure - {"CUDA_GRAPH_INSTANTIATE_INVALID_STRUCTURE", {"hipGraphInstantiateInvalidStructure", "", CONV_NUMERIC_LITERAL, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, + {"CUDA_GRAPH_INSTANTIATE_INVALID_STRUCTURE", {"hipGraphInstantiateInvalidStructure", "", CONV_NUMERIC_LITERAL, API_DRIVER, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // cudaGraphInstantiateNodeOperationNotSupported - {"CUDA_GRAPH_INSTANTIATE_NODE_OPERATION_NOT_SUPPORTED", {"hipGraphInstantiateNodeOperationNotSupported", "", CONV_NUMERIC_LITERAL, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, + {"CUDA_GRAPH_INSTANTIATE_NODE_OPERATION_NOT_SUPPORTED", {"hipGraphInstantiateNodeOperationNotSupported", "", CONV_NUMERIC_LITERAL, API_DRIVER, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // 
cudaGraphInstantiateMultipleDevicesNotSupported - {"CUDA_GRAPH_INSTANTIATE_MULTIPLE_CTXS_NOT_SUPPORTED", {"hipGraphInstantiateMultipleDevicesNotSupported", "", CONV_NUMERIC_LITERAL, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, + {"CUDA_GRAPH_INSTANTIATE_MULTIPLE_CTXS_NOT_SUPPORTED", {"hipGraphInstantiateMultipleDevicesNotSupported", "", CONV_NUMERIC_LITERAL, API_DRIVER, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // cudaLaunchMemSyncDomain {"CUlaunchMemSyncDomain", {"hipLaunchMemSyncDomain", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, @@ -2442,15 +2442,15 @@ const std::map CUDA_DRIVER_TYPE_NAME_MAP { {"CU_LAUNCH_MEM_SYNC_DOMAIN_REMOTE", {"hipLaunchMemSyncDomainRemote", "", CONV_NUMERIC_LITERAL, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, // - {"CUdriverProcAddressQueryResult", {"hipDriverProcAddressQueryResult", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, - {"CUdriverProcAddressQueryResult_enum", {"hipDriverProcAddressQueryResult", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, + {"CUdriverProcAddressQueryResult", {"hipDriverProcAddressQueryResult", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, + {"CUdriverProcAddressQueryResult_enum", {"hipDriverProcAddressQueryResult", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // CUdriverProcAddressQueryResult enum values // - {"CU_GET_PROC_ADDRESS_SUCCESS", {"HIP_GET_PROC_ADDRESS_SUCCESS", "", CONV_NUMERIC_LITERAL, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, + {"CU_GET_PROC_ADDRESS_SUCCESS", {"HIP_GET_PROC_ADDRESS_SUCCESS", "", CONV_NUMERIC_LITERAL, API_DRIVER, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // - {"CU_GET_PROC_ADDRESS_SYMBOL_NOT_FOUND", {"HIP_GET_PROC_ADDRESS_SYMBOL_NOT_FOUND", "", CONV_NUMERIC_LITERAL, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, + {"CU_GET_PROC_ADDRESS_SYMBOL_NOT_FOUND", {"HIP_GET_PROC_ADDRESS_SYMBOL_NOT_FOUND", "", CONV_NUMERIC_LITERAL, API_DRIVER, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // - 
{"CU_GET_PROC_ADDRESS_VERSION_NOT_SUFFICIENT", {"HIP_GET_PROC_ADDRESS_VERSION_NOT_SUFFICIENT", "", CONV_NUMERIC_LITERAL, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, + {"CU_GET_PROC_ADDRESS_VERSION_NOT_SUFFICIENT", {"HIP_GET_PROC_ADDRESS_VERSION_NOT_SUFFICIENT", "", CONV_NUMERIC_LITERAL, API_DRIVER, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // {"CUlibraryOption", {"hipLibraryOption", "", CONV_TYPE, API_DRIVER, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, @@ -4057,4 +4057,8 @@ const std::map HIP_DRIVER_TYPE_NAME_VER_MAP { {"hipDeviceAttributeHostRegisterSupported", {HIP_6000, HIP_0, HIP_0, }}, {"hipExternalSemaphoreSignalNodeParams", {HIP_6000, HIP_0, HIP_0, }}, {"hipExternalSemaphoreWaitNodeParams", {HIP_6000, HIP_0, HIP_0, }}, + {"hipDriverProcAddressQueryResult", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, + {"HIP_GET_PROC_ADDRESS_SUCCESS", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, + {"HIP_GET_PROC_ADDRESS_SYMBOL_NOT_FOUND", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, + {"HIP_GET_PROC_ADDRESS_VERSION_NOT_SUFFICIENT", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, }; diff --git a/src/CUDA2HIP_Runtime_API_functions.cpp b/src/CUDA2HIP_Runtime_API_functions.cpp index fad7b61c..f5e8fb40 100644 --- a/src/CUDA2HIP_Runtime_API_functions.cpp +++ b/src/CUDA2HIP_Runtime_API_functions.cpp @@ -727,19 +727,13 @@ const std::map CUDA_RUNTIME_FUNCTION_MAP { // cuGraphExecKernelNodeSetParams {"cudaGraphExecKernelNodeSetParams", {"hipGraphExecKernelNodeSetParams", "", CONV_GRAPH, API_RUNTIME, SEC::GRAPH}}, // no analogue - // NOTE: Not equal to cuGraphExecMemcpyNodeSetParams due to different signatures: - // DRIVER: CUresult CUDAAPI cuGraphExecMemcpyNodeSetParams(CUgraphExec hGraphExec, CUgraphNode hNode, const CUDA_MEMCPY3D *copyParams, CUcontext ctx); - // RUNTIME: cudaError_t CUDARTAPI cudaGraphExecMemcpyNodeSetParams(cudaGraphExec_t hGraphExec, cudaGraphNode_t node, const struct cudaMemcpy3DParms *pNodeParams); {"cudaGraphExecMemcpyNodeSetParams", {"hipGraphExecMemcpyNodeSetParams", "", CONV_GRAPH, 
API_RUNTIME, SEC::GRAPH}}, // no analogue - // NOTE: Not equal to cuGraphExecMemsetNodeSetParams due to different signatures: - // DRIVER: CUresult CUDAAPI cuGraphExecMemsetNodeSetParams(CUgraphExec hGraphExec, CUgraphNode hNode, const CUDA_MEMSET_NODE_PARAMS *memsetParams, CUcontext ctx); - // RUNTIME: cudaError_t CUDARTAPI cudaGraphExecMemsetNodeSetParams(cudaGraphExec_t hGraphExec, cudaGraphNode_t node, const struct cudaMemsetParams *pNodeParams); {"cudaGraphExecMemsetNodeSetParams", {"hipGraphExecMemsetNodeSetParams", "", CONV_GRAPH, API_RUNTIME, SEC::GRAPH}}, // cuGraphExecHostNodeSetParams {"cudaGraphExecHostNodeSetParams", {"hipGraphExecHostNodeSetParams", "", CONV_GRAPH, API_RUNTIME, SEC::GRAPH}}, // cuGraphExecUpdate - // NOTE: CUDA signature changed since 12.0 + // NOTE: CUDA signature has changed since 12.0 {"cudaGraphExecUpdate", {"hipGraphExecUpdate", "", CONV_GRAPH, API_RUNTIME, SEC::GRAPH}}, // cuGraphKernelNodeGetParams {"cudaGraphKernelNodeGetParams", {"hipGraphKernelNodeGetParams", "", CONV_GRAPH, API_RUNTIME, SEC::GRAPH}}, @@ -812,21 +806,21 @@ const std::map CUDA_RUNTIME_FUNCTION_MAP { // cuGraphUpload {"cudaGraphUpload", {"hipGraphUpload", "", CONV_GRAPH, API_RUNTIME, SEC::GRAPH}}, // cuGraphAddExternalSemaphoresSignalNode - {"cudaGraphAddExternalSemaphoresSignalNode", {"hipGraphAddExternalSemaphoresSignalNode", "", CONV_GRAPH, API_RUNTIME, SEC::GRAPH}}, + {"cudaGraphAddExternalSemaphoresSignalNode", {"hipGraphAddExternalSemaphoresSignalNode", "", CONV_GRAPH, API_RUNTIME, SEC::GRAPH, HIP_EXPERIMENTAL}}, // cuGraphExternalSemaphoresSignalNodeGetParams - {"cudaGraphExternalSemaphoresSignalNodeGetParams", {"hipGraphExternalSemaphoresSignalNodeGetParams", "", CONV_GRAPH, API_RUNTIME, SEC::GRAPH}}, + {"cudaGraphExternalSemaphoresSignalNodeGetParams", {"hipGraphExternalSemaphoresSignalNodeGetParams", "", CONV_GRAPH, API_RUNTIME, SEC::GRAPH, HIP_EXPERIMENTAL}}, // cuGraphExternalSemaphoresSignalNodeSetParams - 
{"cudaGraphExternalSemaphoresSignalNodeSetParams", {"hipGraphExternalSemaphoresSignalNodeSetParams", "", CONV_GRAPH, API_RUNTIME, SEC::GRAPH}}, + {"cudaGraphExternalSemaphoresSignalNodeSetParams", {"hipGraphExternalSemaphoresSignalNodeSetParams", "", CONV_GRAPH, API_RUNTIME, SEC::GRAPH, HIP_EXPERIMENTAL}}, // cuGraphAddExternalSemaphoresWaitNode - {"cudaGraphAddExternalSemaphoresWaitNode", {"hipGraphAddExternalSemaphoresWaitNode", "", CONV_GRAPH, API_RUNTIME, SEC::GRAPH}}, + {"cudaGraphAddExternalSemaphoresWaitNode", {"hipGraphAddExternalSemaphoresWaitNode", "", CONV_GRAPH, API_RUNTIME, SEC::GRAPH, HIP_EXPERIMENTAL}}, // cuGraphExternalSemaphoresWaitNodeGetParams - {"cudaGraphExternalSemaphoresWaitNodeGetParams", {"hipGraphExternalSemaphoresWaitNodeGetParams", "", CONV_GRAPH, API_RUNTIME, SEC::GRAPH}}, + {"cudaGraphExternalSemaphoresWaitNodeGetParams", {"hipGraphExternalSemaphoresWaitNodeGetParams", "", CONV_GRAPH, API_RUNTIME, SEC::GRAPH, HIP_EXPERIMENTAL}}, // cuGraphExternalSemaphoresWaitNodeSetParams - {"cudaGraphExternalSemaphoresWaitNodeSetParams", {"hipGraphExternalSemaphoresWaitNodeSetParams", "", CONV_GRAPH, API_RUNTIME, SEC::GRAPH}}, + {"cudaGraphExternalSemaphoresWaitNodeSetParams", {"hipGraphExternalSemaphoresWaitNodeSetParams", "", CONV_GRAPH, API_RUNTIME, SEC::GRAPH, HIP_EXPERIMENTAL}}, // cuGraphExecExternalSemaphoresSignalNodeSetParams - {"cudaGraphExecExternalSemaphoresSignalNodeSetParams", {"hipGraphExecExternalSemaphoresSignalNodeSetParams", "", CONV_GRAPH, API_RUNTIME, SEC::GRAPH}}, + {"cudaGraphExecExternalSemaphoresSignalNodeSetParams", {"hipGraphExecExternalSemaphoresSignalNodeSetParams", "", CONV_GRAPH, API_RUNTIME, SEC::GRAPH, HIP_EXPERIMENTAL}}, // cuGraphExecExternalSemaphoresWaitNodeSetParams - {"cudaGraphExecExternalSemaphoresWaitNodeSetParams", {"hipGraphExecExternalSemaphoresWaitNodeSetParams", "", CONV_GRAPH, API_RUNTIME, SEC::GRAPH}}, + {"cudaGraphExecExternalSemaphoresWaitNodeSetParams", 
{"hipGraphExecExternalSemaphoresWaitNodeSetParams", "", CONV_GRAPH, API_RUNTIME, SEC::GRAPH, HIP_EXPERIMENTAL}}, // cuUserObjectCreate {"cudaUserObjectCreate", {"hipUserObjectCreate", "", CONV_GRAPH, API_RUNTIME, SEC::GRAPH}}, // cuUserObjectRetain @@ -841,7 +835,7 @@ const std::map CUDA_RUNTIME_FUNCTION_MAP { {"cudaGraphAddMemAllocNode", {"hipGraphAddMemAllocNode", "", CONV_GRAPH, API_RUNTIME, SEC::GRAPH}}, // cuGraphMemAllocNodeGetParams {"cudaGraphMemAllocNodeGetParams", {"hipGraphMemAllocNodeGetParams", "", CONV_GRAPH, API_RUNTIME, SEC::GRAPH}}, - // cuGraphAddMemFreeNode + // no analogue {"cudaGraphAddMemFreeNode", {"hipGraphAddMemFreeNode", "", CONV_GRAPH, API_RUNTIME, SEC::GRAPH}}, // cuGraphMemFreeNodeGetParams {"cudaGraphMemFreeNodeGetParams", {"hipGraphMemFreeNodeGetParams", "", CONV_GRAPH, API_RUNTIME, SEC::GRAPH}}, @@ -857,23 +851,23 @@ const std::map CUDA_RUNTIME_FUNCTION_MAP { // cuGraphNodeSetEnabled {"cudaGraphNodeSetEnabled", {"hipGraphNodeSetEnabled", "", CONV_GRAPH, API_RUNTIME, SEC::GRAPH}}, // cuGraphInstantiateWithParams - {"cudaGraphInstantiateWithParams", {"hipGraphInstantiateWithParams", "", CONV_GRAPH, API_RUNTIME, SEC::GRAPH, HIP_UNSUPPORTED}}, + {"cudaGraphInstantiateWithParams", {"hipGraphInstantiateWithParams", "", CONV_GRAPH, API_RUNTIME, SEC::GRAPH, HIP_EXPERIMENTAL}}, // cuGraphExecGetFlags - {"cudaGraphExecGetFlags", {"hipGraphExecGetFlags", "", CONV_GRAPH, API_RUNTIME, SEC::GRAPH, HIP_UNSUPPORTED}}, + {"cudaGraphExecGetFlags", {"hipGraphExecGetFlags", "", CONV_GRAPH, API_RUNTIME, SEC::GRAPH, HIP_EXPERIMENTAL}}, // cuGraphAddNode - {"cudaGraphAddNode", {"hipGraphAddNode", "", CONV_GRAPH, API_RUNTIME, SEC::GRAPH, HIP_UNSUPPORTED}}, + {"cudaGraphAddNode", {"hipGraphAddNode", "", CONV_GRAPH, API_RUNTIME, SEC::GRAPH, HIP_EXPERIMENTAL}}, // cuGraphAddNode_v2 {"cudaGraphAddNode_v2", {"hipGraphAddNode_v2", "", CONV_GRAPH, API_RUNTIME, SEC::GRAPH, HIP_UNSUPPORTED}}, // cuGraphNodeSetParams - {"cudaGraphNodeSetParams", 
{"hipGraphNodeSetParams", "", CONV_GRAPH, API_RUNTIME, SEC::GRAPH, HIP_UNSUPPORTED}}, + {"cudaGraphNodeSetParams", {"hipGraphNodeSetParams", "", CONV_GRAPH, API_RUNTIME, SEC::GRAPH, HIP_EXPERIMENTAL}}, // cuGraphExecNodeSetParams - {"cudaGraphExecNodeSetParams", {"hipGraphExecNodeSetParams", "", CONV_GRAPH, API_RUNTIME, SEC::GRAPH, HIP_UNSUPPORTED}}, + {"cudaGraphExecNodeSetParams", {"hipGraphExecNodeSetParams", "", CONV_GRAPH, API_RUNTIME, SEC::GRAPH, HIP_EXPERIMENTAL}}, // cuGraphConditionalHandleCreate {"cudaGraphConditionalHandleCreate", {"hipGraphConditionalHandleCreate", "", CONV_GRAPH, API_RUNTIME, SEC::GRAPH, HIP_UNSUPPORTED}}, // 29. Driver Entry Point Access // cuGetProcAddress - {"cudaGetDriverEntryPoint", {"hipGetProcAddress", "", CONV_DRIVER_ENTRY_POINT, API_RUNTIME, SEC::DRIVER_ENTRY_POINT, HIP_UNSUPPORTED}}, + {"cudaGetDriverEntryPoint", {"hipGetProcAddress", "", CONV_DRIVER_ENTRY_POINT, API_RUNTIME, SEC::DRIVER_ENTRY_POINT, HIP_EXPERIMENTAL}}, // 30. C++ API Routines {"cudaGetKernel", {"hipGetKernel", "", CONV_CPP, API_RUNTIME, SEC::CPP, HIP_UNSUPPORTED}}, @@ -1406,14 +1400,19 @@ const std::map HIP_RUNTIME_FUNCTION_VER_MAP { {"hipOccupancyMaxPotentialBlockSizeVariableSMem", {HIP_5050, HIP_0, HIP_0 }}, {"hipOccupancyMaxPotentialBlockSizeVariableSMemWithFlags", {HIP_5050, HIP_0, HIP_0 }}, {"hipArrayGetInfo", {HIP_5060, HIP_0, HIP_0 }}, - {"hipGraphAddExternalSemaphoresWaitNode", {HIP_6000, HIP_0, HIP_0, }}, - {"hipGraphAddExternalSemaphoresSignalNode", {HIP_6000, HIP_0, HIP_0, }}, - {"hipGraphExternalSemaphoresSignalNodeSetParams", {HIP_6000, HIP_0, HIP_0, }}, - {"hipGraphExternalSemaphoresSignalNodeGetParams", {HIP_6000, HIP_0, HIP_0, }}, - {"hipGraphExternalSemaphoresWaitNodeGetParams", {HIP_6000, HIP_0, HIP_0, }}, - {"hipGraphExternalSemaphoresWaitNodeSetParams", {HIP_6000, HIP_0, HIP_0, }}, - {"hipGraphExecExternalSemaphoresSignalNodeSetParams", {HIP_6000, HIP_0, HIP_0, }}, - {"hipGraphExecExternalSemaphoresWaitNodeSetParams", {HIP_6000, HIP_0, 
HIP_0, }}, + {"hipGraphAddExternalSemaphoresWaitNode", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, + {"hipGraphAddExternalSemaphoresSignalNode", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, + {"hipGraphExternalSemaphoresSignalNodeSetParams", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, + {"hipGraphExternalSemaphoresSignalNodeGetParams", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, + {"hipGraphExternalSemaphoresWaitNodeGetParams", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, + {"hipGraphExternalSemaphoresWaitNodeSetParams", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, + {"hipGraphExecExternalSemaphoresSignalNodeSetParams", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, + {"hipGraphExecExternalSemaphoresWaitNodeSetParams", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, + {"hipGraphInstantiateWithParams", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, + {"hipGraphAddNode", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, + {"hipGraphExecGetFlags", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, + {"hipGraphNodeSetParams", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, + {"hipGraphExecNodeSetParams", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, }; const std::map CUDA_RUNTIME_API_SECTION_MAP { diff --git a/src/CUDA2HIP_Runtime_API_types.cpp b/src/CUDA2HIP_Runtime_API_types.cpp index f39c1278..7db4cae4 100644 --- a/src/CUDA2HIP_Runtime_API_types.cpp +++ b/src/CUDA2HIP_Runtime_API_types.cpp @@ -230,19 +230,19 @@ const std::map CUDA_RUNTIME_TYPE_NAME_MAP { {"cudaMemAllocNodeParamsV2", {"hipMemAllocNodeParams_v2", "", CONV_TYPE, API_RUNTIME, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, // CUDA_MEM_FREE_NODE_PARAMS_st - {"cudaMemFreeNodeParams", {"hipMemFreeNodeParams", "", CONV_TYPE, API_RUNTIME, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, + {"cudaMemFreeNodeParams", {"hipMemFreeNodeParams", "", CONV_TYPE, API_RUNTIME, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // CUDA_CHILD_GRAPH_NODE_PARAMS_st - {"cudaChildGraphNodeParams", {"hipChildGraphNodeParams", "", CONV_TYPE, API_RUNTIME, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, + {"cudaChildGraphNodeParams", {"hipChildGraphNodeParams", "", 
CONV_TYPE, API_RUNTIME, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // CUDA_EVENT_RECORD_NODE_PARAMS_st - {"cudaEventRecordNodeParams", {"hipEventRecordNodeParams", "", CONV_TYPE, API_RUNTIME, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, + {"cudaEventRecordNodeParams", {"hipEventRecordNodeParams", "", CONV_TYPE, API_RUNTIME, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // CUDA_EVENT_WAIT_NODE_PARAMS_st - {"cudaEventWaitNodeParams", {"hipEventWaitNodeParams", "", CONV_TYPE, API_RUNTIME, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, + {"cudaEventWaitNodeParams", {"hipEventWaitNodeParams", "", CONV_TYPE, API_RUNTIME, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // CUgraphNodeParams_st - {"cudaGraphNodeParams", {"hipGraphNodeParams", "", CONV_TYPE, API_RUNTIME, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, + {"cudaGraphNodeParams", {"hipGraphNodeParams", "", CONV_TYPE, API_RUNTIME, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // CUDA_ARRAY_MEMORY_REQUIREMENTS_st {"cudaArrayMemoryRequirements", {"hipArrayMemoryRequirements", "", CONV_TYPE, API_RUNTIME, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, @@ -258,7 +258,7 @@ const std::map CUDA_RUNTIME_TYPE_NAME_MAP { {"cudaKernel_t", {"hipKernel", "", CONV_TYPE, API_RUNTIME, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, // CUDA_MEMCPY_NODE_PARAMS - {"cudaMemcpyNodeParams", {"hiMemcpyNodeParams", "", CONV_TYPE, API_RUNTIME, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, + {"cudaMemcpyNodeParams", {"hipMemcpyNodeParams", "", CONV_TYPE, API_RUNTIME, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // CUDA_CONDITIONAL_NODE_PARAMS {"cudaConditionalNodeParams", {"hipConditionalNodeParams", "", CONV_TYPE, API_RUNTIME, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, @@ -290,9 +290,9 @@ const std::map CUDA_RUNTIME_TYPE_NAME_MAP { {"cudaLaunchConfig_t", {"hipLaunchConfig", "", CONV_TYPE, API_RUNTIME, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, // CUDA_GRAPH_INSTANTIATE_PARAMS_st - {"cudaGraphInstantiateParams_st", {"hipGraphInstantiateParams", "", CONV_TYPE, API_RUNTIME, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, + {"cudaGraphInstantiateParams_st", 
{"hipGraphInstantiateParams", "", CONV_TYPE, API_RUNTIME, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // CUDA_GRAPH_INSTANTIATE_PARAMS - {"cudaGraphInstantiateParams", {"hipGraphInstantiateParams", "", CONV_TYPE, API_RUNTIME, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, + {"cudaGraphInstantiateParams", {"hipGraphInstantiateParams", "", CONV_TYPE, API_RUNTIME, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // CUgraphExecUpdateResultInfo_st {"cudaGraphExecUpdateResultInfo_st", {"hipGraphExecUpdateResultInfo", "", CONV_TYPE, API_RUNTIME, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, @@ -1734,22 +1734,22 @@ const std::map CUDA_RUNTIME_TYPE_NAME_MAP { {"cudaGraphUserObjectMove", {"hipGraphUserObjectMove", "", CONV_NUMERIC_LITERAL, API_RUNTIME, SEC::DATA_TYPES}}, // 0x1 // CUflushGPUDirectRDMAWritesOptions - {"cudaFlushGPUDirectRDMAWritesOptions", {"hipFlushGPUDirectRDMAWritesOptions", "", CONV_TYPE, API_RUNTIME, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, + {"cudaFlushGPUDirectRDMAWritesOptions", {"hipFlushGPUDirectRDMAWritesOptions", "", CONV_TYPE, API_RUNTIME, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // cudaFlushGPUDirectRDMAWritesOptions enum values // CU_FLUSH_GPU_DIRECT_RDMA_WRITES_OPTION_HOST - {"cudaFlushGPUDirectRDMAWritesOptionHost", {"hipFlushGPUDirectRDMAWritesOptionHost", "", CONV_NUMERIC_LITERAL, API_RUNTIME, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, // 1<<0 + {"cudaFlushGPUDirectRDMAWritesOptionHost", {"hipFlushGPUDirectRDMAWritesOptionHost", "", CONV_NUMERIC_LITERAL, API_RUNTIME, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // 1<<0 // CU_FLUSH_GPU_DIRECT_RDMA_WRITES_OPTION_MEMOPS - {"cudaFlushGPUDirectRDMAWritesOptionMemOps", {"hipFlushGPUDirectRDMAWritesOptionMemOps", "", CONV_NUMERIC_LITERAL, API_RUNTIME, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, // 1<<1 + {"cudaFlushGPUDirectRDMAWritesOptionMemOps", {"hipFlushGPUDirectRDMAWritesOptionMemOps", "", CONV_NUMERIC_LITERAL, API_RUNTIME, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // 1<<1 // CUGPUDirectRDMAWritesOrdering - {"cudaGPUDirectRDMAWritesOrdering", 
{"hipGPUDirectRDMAWritesOrdering", "", CONV_TYPE, API_RUNTIME, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, + {"cudaGPUDirectRDMAWritesOrdering", {"hipGPUDirectRDMAWritesOrdering", "", CONV_TYPE, API_RUNTIME, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // cudaGPUDirectRDMAWritesOrdering enum values // CU_GPU_DIRECT_RDMA_WRITES_ORDERING_NONE - {"cudaGPUDirectRDMAWritesOrderingNone", {"hipGPUDirectRDMAWritesOrderingNone", "", CONV_NUMERIC_LITERAL, API_RUNTIME, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, // 0 + {"cudaGPUDirectRDMAWritesOrderingNone", {"hipGPUDirectRDMAWritesOrderingNone", "", CONV_NUMERIC_LITERAL, API_RUNTIME, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // 0 // CU_GPU_DIRECT_RDMA_WRITES_ORDERING_OWNER - {"cudaGPUDirectRDMAWritesOrderingOwner", {"hipGPUDirectRDMAWritesOrderingOwner", "", CONV_NUMERIC_LITERAL, API_RUNTIME, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, // 100 + {"cudaGPUDirectRDMAWritesOrderingOwner", {"hipGPUDirectRDMAWritesOrderingOwner", "", CONV_NUMERIC_LITERAL, API_RUNTIME, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // 100 // CU_GPU_DIRECT_RDMA_WRITES_ORDERING_ALL_DEVICES - {"cudaGPUDirectRDMAWritesOrderingAllDevices", {"hipGPUDirectRDMAWritesOrderingAllDevices", "", CONV_NUMERIC_LITERAL, API_RUNTIME, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, // 200 + {"cudaGPUDirectRDMAWritesOrderingAllDevices", {"hipGPUDirectRDMAWritesOrderingAllDevices", "", CONV_NUMERIC_LITERAL, API_RUNTIME, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // 200 // CUflushGPUDirectRDMAWritesScope {"cudaFlushGPUDirectRDMAWritesScope", {"hipFlushGPUDirectRDMAWritesScope", "", CONV_TYPE, API_RUNTIME, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, @@ -1864,18 +1864,18 @@ const std::map CUDA_RUNTIME_TYPE_NAME_MAP { {"cudaLaunchAttributeLaunchCompletionEvent", {"hipLaunchAttributeLaunchCompletionEvent", "", CONV_NUMERIC_LITERAL, API_RUNTIME, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, // CUgraphInstantiateResult - {"cudaGraphInstantiateResult", {"hipGraphInstantiateResult", "", CONV_TYPE, API_RUNTIME, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, + 
{"cudaGraphInstantiateResult", {"hipGraphInstantiateResult", "", CONV_TYPE, API_RUNTIME, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // cudaGraphInstantiateResult enum values // CUDA_GRAPH_INSTANTIATE_SUCCESS - {"cudaGraphInstantiateSuccess", {"hipGraphInstantiateSuccess", "", CONV_NUMERIC_LITERAL, API_RUNTIME, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, + {"cudaGraphInstantiateSuccess", {"hipGraphInstantiateSuccess", "", CONV_NUMERIC_LITERAL, API_RUNTIME, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // CUDA_GRAPH_INSTANTIATE_ERROR - {"cudaGraphInstantiateError", {"hipGraphInstantiateError", "", CONV_NUMERIC_LITERAL, API_RUNTIME, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, + {"cudaGraphInstantiateError", {"hipGraphInstantiateError", "", CONV_NUMERIC_LITERAL, API_RUNTIME, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // CUDA_GRAPH_INSTANTIATE_INVALID_STRUCTURE - {"cudaGraphInstantiateInvalidStructure", {"hipGraphInstantiateInvalidStructure", "", CONV_NUMERIC_LITERAL, API_RUNTIME, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, + {"cudaGraphInstantiateInvalidStructure", {"hipGraphInstantiateInvalidStructure", "", CONV_NUMERIC_LITERAL, API_RUNTIME, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // CUDA_GRAPH_INSTANTIATE_NODE_OPERATION_NOT_SUPPORTED - {"cudaGraphInstantiateNodeOperationNotSupported", {"hipGraphInstantiateNodeOperationNotSupported", "", CONV_NUMERIC_LITERAL, API_RUNTIME, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, + {"cudaGraphInstantiateNodeOperationNotSupported", {"hipGraphInstantiateNodeOperationNotSupported", "", CONV_NUMERIC_LITERAL, API_RUNTIME, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // CUDA_GRAPH_INSTANTIATE_MULTIPLE_CTXS_NOT_SUPPORTED - {"cudaGraphInstantiateMultipleDevicesNotSupported", {"hipGraphInstantiateMultipleDevicesNotSupported", "", CONV_NUMERIC_LITERAL, API_RUNTIME, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, + {"cudaGraphInstantiateMultipleDevicesNotSupported", {"hipGraphInstantiateMultipleDevicesNotSupported", "", CONV_NUMERIC_LITERAL, API_RUNTIME, SEC::DATA_TYPES, HIP_EXPERIMENTAL}}, // no analogues 
{"cudaDriverEntryPointQueryResult", {"hipDriverEntryPointQueryResult", "", CONV_TYPE, API_RUNTIME, SEC::DATA_TYPES, HIP_UNSUPPORTED}}, @@ -2908,4 +2908,24 @@ const std::map HIP_RUNTIME_TYPE_NAME_VER_MAP { {"hipGraphInstantiateFlagDeviceLaunch", {HIP_5060, HIP_0, HIP_0 }}, {"hipGraphInstantiateFlagUseNodePriority", {HIP_5060, HIP_0, HIP_0 }}, {"hipHostRegisterReadOnly", {HIP_5060, HIP_0, HIP_0 }}, + {"hipFlushGPUDirectRDMAWritesOptions", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, + {"hipFlushGPUDirectRDMAWritesOptionHost", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, + {"hipFlushGPUDirectRDMAWritesOptionMemOps", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, + {"hipGPUDirectRDMAWritesOrdering", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, + {"hipGPUDirectRDMAWritesOrderingNone", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, + {"hipGPUDirectRDMAWritesOrderingOwner", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, + {"hipGPUDirectRDMAWritesOrderingAllDevices", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, + {"hipGraphInstantiateResult", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, + {"hipGraphInstantiateSuccess", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, + {"hipGraphInstantiateError", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, + {"hipGraphInstantiateInvalidStructure", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, + {"hipGraphInstantiateNodeOperationNotSupported", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, + {"hipGraphInstantiateMultipleDevicesNotSupported", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, + {"hipGraphInstantiateParams", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, + {"hipMemcpyNodeParams", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, + {"hipChildGraphNodeParams", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, + {"hipEventWaitNodeParams", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, + {"hipEventRecordNodeParams", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, + {"hipMemFreeNodeParams", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, + {"hipGraphNodeParams", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, }; diff --git a/src/CUDA2HIP_SPARSE_API_functions.cpp 
b/src/CUDA2HIP_SPARSE_API_functions.cpp index ef401e16..7fa7c2c9 100644 --- a/src/CUDA2HIP_SPARSE_API_functions.cpp +++ b/src/CUDA2HIP_SPARSE_API_functions.cpp @@ -64,24 +64,24 @@ const std::map CUDA_SPARSE_FUNCTION_MAP { {"cusparseDestroyCsrsv2Info", {"hipsparseDestroyCsrsv2Info", "rocsparse_destroy_mat_info", CONV_LIB_FUNC, API_SPARSE, 7, CUDA_DEPRECATED | CUDA_REMOVED}}, {"cusparseCreateCsrsm2Info", {"hipsparseCreateCsrsm2Info", "rocsparse_create_mat_info", CONV_LIB_FUNC, API_SPARSE, 7, CUDA_DEPRECATED | CUDA_REMOVED}}, {"cusparseDestroyCsrsm2Info", {"hipsparseDestroyCsrsm2Info", "rocsparse_destroy_mat_info", CONV_LIB_FUNC, API_SPARSE, 7, CUDA_DEPRECATED | CUDA_REMOVED}}, - {"cusparseCreateCsric02Info", {"hipsparseCreateCsric02Info", "rocsparse_create_mat_info", CONV_LIB_FUNC, API_SPARSE, 7, CUDA_DEPRECATED}}, - {"cusparseDestroyCsric02Info", {"hipsparseDestroyCsric02Info", "rocsparse_destroy_mat_info", CONV_LIB_FUNC, API_SPARSE, 7, CUDA_DEPRECATED}}, - {"cusparseCreateCsrilu02Info", {"hipsparseCreateCsrilu02Info", "rocsparse_create_mat_info", CONV_LIB_FUNC, API_SPARSE, 7, CUDA_DEPRECATED}}, - {"cusparseDestroyCsrilu02Info", {"hipsparseDestroyCsrilu02Info", "rocsparse_destroy_mat_info", CONV_LIB_FUNC, API_SPARSE, 7, CUDA_DEPRECATED}}, - {"cusparseCreateBsrsv2Info", {"hipsparseCreateBsrsv2Info", "rocsparse_create_mat_info", CONV_LIB_FUNC, API_SPARSE, 7, CUDA_DEPRECATED}}, - {"cusparseDestroyBsrsv2Info", {"hipsparseDestroyBsrsv2Info", "rocsparse_destroy_mat_info", CONV_LIB_FUNC, API_SPARSE, 7, CUDA_DEPRECATED}}, - {"cusparseCreateBsrsm2Info", {"hipsparseCreateBsrsm2Info", "rocsparse_create_mat_info", CONV_LIB_FUNC, API_SPARSE, 7, CUDA_DEPRECATED}}, - {"cusparseDestroyBsrsm2Info", {"hipsparseDestroyBsrsm2Info", "rocsparse_destroy_mat_info", CONV_LIB_FUNC, API_SPARSE, 7, CUDA_DEPRECATED}}, - {"cusparseCreateBsric02Info", {"hipsparseCreateBsric02Info", "rocsparse_create_mat_info", CONV_LIB_FUNC, API_SPARSE, 7, CUDA_DEPRECATED}}, - {"cusparseDestroyBsric02Info", 
{"hipsparseDestroyBsric02Info", "rocsparse_destroy_mat_info", CONV_LIB_FUNC, API_SPARSE, 7, CUDA_DEPRECATED}}, - {"cusparseCreateBsrilu02Info", {"hipsparseCreateBsrilu02Info", "rocsparse_create_mat_info", CONV_LIB_FUNC, API_SPARSE, 7, CUDA_DEPRECATED}}, - {"cusparseDestroyBsrilu02Info", {"hipsparseDestroyBsrilu02Info", "rocsparse_destroy_mat_info", CONV_LIB_FUNC, API_SPARSE, 7, CUDA_DEPRECATED}}, + {"cusparseCreateCsric02Info", {"hipsparseCreateCsric02Info", "rocsparse_create_mat_info", CONV_LIB_FUNC, API_SPARSE, 7, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseDestroyCsric02Info", {"hipsparseDestroyCsric02Info", "rocsparse_destroy_mat_info", CONV_LIB_FUNC, API_SPARSE, 7, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseCreateCsrilu02Info", {"hipsparseCreateCsrilu02Info", "rocsparse_create_mat_info", CONV_LIB_FUNC, API_SPARSE, 7, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseDestroyCsrilu02Info", {"hipsparseDestroyCsrilu02Info", "rocsparse_destroy_mat_info", CONV_LIB_FUNC, API_SPARSE, 7, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseCreateBsrsv2Info", {"hipsparseCreateBsrsv2Info", "rocsparse_create_mat_info", CONV_LIB_FUNC, API_SPARSE, 7, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseDestroyBsrsv2Info", {"hipsparseDestroyBsrsv2Info", "rocsparse_destroy_mat_info", CONV_LIB_FUNC, API_SPARSE, 7, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseCreateBsrsm2Info", {"hipsparseCreateBsrsm2Info", "rocsparse_create_mat_info", CONV_LIB_FUNC, API_SPARSE, 7, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseDestroyBsrsm2Info", {"hipsparseDestroyBsrsm2Info", "rocsparse_destroy_mat_info", CONV_LIB_FUNC, API_SPARSE, 7, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseCreateBsric02Info", {"hipsparseCreateBsric02Info", "rocsparse_create_mat_info", CONV_LIB_FUNC, API_SPARSE, 7, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseDestroyBsric02Info", {"hipsparseDestroyBsric02Info", "rocsparse_destroy_mat_info", CONV_LIB_FUNC, API_SPARSE, 7, CUDA_DEPRECATED | HIP_DEPRECATED}}, + 
{"cusparseCreateBsrilu02Info", {"hipsparseCreateBsrilu02Info", "rocsparse_create_mat_info", CONV_LIB_FUNC, API_SPARSE, 7, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseDestroyBsrilu02Info", {"hipsparseDestroyBsrilu02Info", "rocsparse_destroy_mat_info", CONV_LIB_FUNC, API_SPARSE, 7, CUDA_DEPRECATED | HIP_DEPRECATED}}, {"cusparseCreateCsrgemm2Info", {"hipsparseCreateCsrgemm2Info", "rocsparse_create_mat_info", CONV_LIB_FUNC, API_SPARSE, 7, CUDA_DEPRECATED | CUDA_REMOVED}}, {"cusparseDestroyCsrgemm2Info", {"hipsparseDestroyCsrgemm2Info", "rocsparse_destroy_mat_info", CONV_LIB_FUNC, API_SPARSE, 7, CUDA_DEPRECATED | CUDA_REMOVED}}, - {"cusparseCreatePruneInfo", {"hipsparseCreatePruneInfo", "rocsparse_create_mat_info", CONV_LIB_FUNC, API_SPARSE, 7, CUDA_DEPRECATED}}, - {"cusparseDestroyPruneInfo", {"hipsparseDestroyPruneInfo", "rocsparse_destroy_mat_info", CONV_LIB_FUNC, API_SPARSE, 7, CUDA_DEPRECATED}}, - {"cusparseCreateColorInfo", {"hipsparseCreateColorInfo", "rocsparse_create_color_info", CONV_LIB_FUNC, API_SPARSE, 7, CUDA_DEPRECATED}}, - {"cusparseDestroyColorInfo", {"hipsparseDestroyColorInfo", "rocsparse_destroy_color_info", CONV_LIB_FUNC, API_SPARSE, 7, CUDA_DEPRECATED}}, + {"cusparseCreatePruneInfo", {"hipsparseCreatePruneInfo", "rocsparse_create_mat_info", CONV_LIB_FUNC, API_SPARSE, 7, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseDestroyPruneInfo", {"hipsparseDestroyPruneInfo", "rocsparse_destroy_mat_info", CONV_LIB_FUNC, API_SPARSE, 7, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseCreateColorInfo", {"hipsparseCreateColorInfo", "rocsparse_create_color_info", CONV_LIB_FUNC, API_SPARSE, 7, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseDestroyColorInfo", {"hipsparseDestroyColorInfo", "rocsparse_destroy_color_info", CONV_LIB_FUNC, API_SPARSE, 7, CUDA_DEPRECATED | HIP_DEPRECATED}}, // 8. 
cuSPARSE Level 1 Function Reference {"cusparseSaxpyi", {"hipsparseSaxpyi", "rocsparse_saxpyi", CONV_LIB_FUNC, API_SPARSE, 8, CUDA_DEPRECATED | CUDA_REMOVED}}, @@ -123,10 +123,10 @@ const std::map CUDA_SPARSE_FUNCTION_MAP { {"cusparseCbsrmv", {"hipsparseCbsrmv", "rocsparse_cbsrmv", CONV_LIB_FUNC, API_SPARSE, 9, ROC_DEPRECATED}}, {"cusparseZbsrmv", {"hipsparseZbsrmv", "rocsparse_zbsrmv", CONV_LIB_FUNC, API_SPARSE, 9, ROC_DEPRECATED}}, - {"cusparseSbsrxmv", {"hipsparseSbsrxmv", "rocsparse_sbsrxmv", CONV_LIB_FUNC, API_SPARSE, 9, CUDA_DEPRECATED}}, - {"cusparseDbsrxmv", {"hipsparseDbsrxmv", "rocsparse_dbsrxmv", CONV_LIB_FUNC, API_SPARSE, 9, CUDA_DEPRECATED}}, - {"cusparseCbsrxmv", {"hipsparseCbsrxmv", "rocsparse_cbsrxmv", CONV_LIB_FUNC, API_SPARSE, 9, CUDA_DEPRECATED}}, - {"cusparseZbsrxmv", {"hipsparseZbsrxmv", "rocsparse_zbsrxmv", CONV_LIB_FUNC, API_SPARSE, 9, CUDA_DEPRECATED}}, + {"cusparseSbsrxmv", {"hipsparseSbsrxmv", "rocsparse_sbsrxmv", CONV_LIB_FUNC, API_SPARSE, 9, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseDbsrxmv", {"hipsparseDbsrxmv", "rocsparse_dbsrxmv", CONV_LIB_FUNC, API_SPARSE, 9, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseCbsrxmv", {"hipsparseCbsrxmv", "rocsparse_cbsrxmv", CONV_LIB_FUNC, API_SPARSE, 9, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseZbsrxmv", {"hipsparseZbsrxmv", "rocsparse_zbsrxmv", CONV_LIB_FUNC, API_SPARSE, 9, CUDA_DEPRECATED | HIP_DEPRECATED}}, {"cusparseScsrmv", {"hipsparseScsrmv", "rocsparse_scsrmv", CONV_LIB_FUNC, API_SPARSE, 9, CUDA_DEPRECATED | CUDA_REMOVED}}, {"cusparseDcsrmv", {"hipsparseDcsrmv", "rocsparse_dcsrmv", CONV_LIB_FUNC, API_SPARSE, 9, CUDA_DEPRECATED | CUDA_REMOVED}}, @@ -151,30 +151,30 @@ const std::map CUDA_SPARSE_FUNCTION_MAP { {"cusparseCgemvi_bufferSize", {"hipsparseCgemvi_bufferSize", "rocsparse_cgemvi_buffer_size", CONV_LIB_FUNC, API_SPARSE, 9}}, {"cusparseZgemvi_bufferSize", {"hipsparseZgemvi_bufferSize", "rocsparse_zgemvi_buffer_size", CONV_LIB_FUNC, API_SPARSE, 9}}, - 
{"cusparseSbsrsv2_bufferSize", {"hipsparseSbsrsv2_bufferSize", "rocsparse_sbsrsv_buffer_size", CONV_LIB_FUNC, API_SPARSE, 9, CUDA_DEPRECATED}}, + {"cusparseSbsrsv2_bufferSize", {"hipsparseSbsrsv2_bufferSize", "rocsparse_sbsrsv_buffer_size", CONV_LIB_FUNC, API_SPARSE, 9, CUDA_DEPRECATED | HIP_DEPRECATED}}, {"cusparseSbsrsv2_bufferSizeExt", {"hipsparseSbsrsv2_bufferSizeExt", "rocsparse_sbsrsv_buffer_size", CONV_LIB_FUNC, API_SPARSE, 9, CUDA_DEPRECATED}}, - {"cusparseDbsrsv2_bufferSize", {"hipsparseDbsrsv2_bufferSize", "rocsparse_dbsrsv_buffer_size", CONV_LIB_FUNC, API_SPARSE, 9, CUDA_DEPRECATED}}, + {"cusparseDbsrsv2_bufferSize", {"hipsparseDbsrsv2_bufferSize", "rocsparse_dbsrsv_buffer_size", CONV_LIB_FUNC, API_SPARSE, 9, CUDA_DEPRECATED | HIP_DEPRECATED}}, {"cusparseDbsrsv2_bufferSizeExt", {"hipsparseDbsrsv2_bufferSizeExt", "rocsparse_dbsrsv_buffer_size", CONV_LIB_FUNC, API_SPARSE, 9, CUDA_DEPRECATED}}, - {"cusparseCbsrsv2_bufferSize", {"hipsparseCbsrsv2_bufferSize", "rocsparse_cbsrsv_buffer_size", CONV_LIB_FUNC, API_SPARSE, 9, CUDA_DEPRECATED}}, + {"cusparseCbsrsv2_bufferSize", {"hipsparseCbsrsv2_bufferSize", "rocsparse_cbsrsv_buffer_size", CONV_LIB_FUNC, API_SPARSE, 9, CUDA_DEPRECATED | HIP_DEPRECATED}}, {"cusparseCbsrsv2_bufferSizeExt", {"hipsparseCbsrsv2_bufferSizeExt", "rocsparse_cbsrsv_buffer_size", CONV_LIB_FUNC, API_SPARSE, 9, CUDA_DEPRECATED}}, - {"cusparseZbsrsv2_bufferSize", {"hipsparseZbsrsv2_bufferSize", "rocsparse_zbsrsv_buffer_size", CONV_LIB_FUNC, API_SPARSE, 9, CUDA_DEPRECATED}}, + {"cusparseZbsrsv2_bufferSize", {"hipsparseZbsrsv2_bufferSize", "rocsparse_zbsrsv_buffer_size", CONV_LIB_FUNC, API_SPARSE, 9, CUDA_DEPRECATED | HIP_DEPRECATED}}, {"cusparseZbsrsv2_bufferSizeExt", {"hipsparseZbsrsv2_bufferSizeExt", "rocsparse_zbsrsv_buffer_size", CONV_LIB_FUNC, API_SPARSE, 9, CUDA_DEPRECATED}}, - {"cusparseSbsrsv2_analysis", {"hipsparseSbsrsv2_analysis", "rocsparse_sbsrsv_analysis", CONV_LIB_FUNC, API_SPARSE, 9, CUDA_DEPRECATED}}, - 
{"cusparseDbsrsv2_analysis", {"hipsparseDbsrsv2_analysis", "rocsparse_dbsrsv_analysis", CONV_LIB_FUNC, API_SPARSE, 9, CUDA_DEPRECATED}}, - {"cusparseCbsrsv2_analysis", {"hipsparseCbsrsv2_analysis", "rocsparse_cbsrsv_analysis", CONV_LIB_FUNC, API_SPARSE, 9, CUDA_DEPRECATED}}, - {"cusparseZbsrsv2_analysis", {"hipsparseZbsrsv2_analysis", "rocsparse_zbsrsv_analysis", CONV_LIB_FUNC, API_SPARSE, 9, CUDA_DEPRECATED}}, + {"cusparseSbsrsv2_analysis", {"hipsparseSbsrsv2_analysis", "rocsparse_sbsrsv_analysis", CONV_LIB_FUNC, API_SPARSE, 9, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseDbsrsv2_analysis", {"hipsparseDbsrsv2_analysis", "rocsparse_dbsrsv_analysis", CONV_LIB_FUNC, API_SPARSE, 9, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseCbsrsv2_analysis", {"hipsparseCbsrsv2_analysis", "rocsparse_cbsrsv_analysis", CONV_LIB_FUNC, API_SPARSE, 9, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseZbsrsv2_analysis", {"hipsparseZbsrsv2_analysis", "rocsparse_zbsrsv_analysis", CONV_LIB_FUNC, API_SPARSE, 9, CUDA_DEPRECATED | HIP_DEPRECATED}}, {"cusparseScsrsv_solve", {"hipsparseScsrsv_solve", "", CONV_LIB_FUNC, API_SPARSE, 9, UNSUPPORTED | CUDA_DEPRECATED | CUDA_REMOVED}}, {"cusparseDcsrsv_solve", {"hipsparseDcsrsv_solve", "", CONV_LIB_FUNC, API_SPARSE, 9, UNSUPPORTED | CUDA_DEPRECATED | CUDA_REMOVED}}, {"cusparseCcsrsv_solve", {"hipsparseCcsrsv_solve", "", CONV_LIB_FUNC, API_SPARSE, 9, UNSUPPORTED | CUDA_DEPRECATED | CUDA_REMOVED}}, {"cusparseZcsrsv_solve", {"hipsparseZcsrsv_solve", "", CONV_LIB_FUNC, API_SPARSE, 9, UNSUPPORTED | CUDA_DEPRECATED | CUDA_REMOVED}}, - {"cusparseSbsrsv2_solve", {"hipsparseSbsrsv2_solve", "rocsparse_sbsrsv_solve", CONV_LIB_FUNC, API_SPARSE, 9, CUDA_DEPRECATED}}, - {"cusparseDbsrsv2_solve", {"hipsparseDbsrsv2_solve", "rocsparse_dbsrsv_solve", CONV_LIB_FUNC, API_SPARSE, 9, CUDA_DEPRECATED}}, - {"cusparseCbsrsv2_solve", {"hipsparseCbsrsv2_solve", "rocsparse_cbsrsv_solve", CONV_LIB_FUNC, API_SPARSE, 9, CUDA_DEPRECATED}}, - {"cusparseZbsrsv2_solve", 
{"hipsparseZbsrsv2_solve", "rocsparse_zbsrsv_solve", CONV_LIB_FUNC, API_SPARSE, 9, CUDA_DEPRECATED}}, - {"cusparseXbsrsv2_zeroPivot", {"hipsparseXbsrsv2_zeroPivot", "rocsparse_bsrsv_zero_pivot", CONV_LIB_FUNC, API_SPARSE, 9, CUDA_DEPRECATED}}, + {"cusparseSbsrsv2_solve", {"hipsparseSbsrsv2_solve", "rocsparse_sbsrsv_solve", CONV_LIB_FUNC, API_SPARSE, 9, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseDbsrsv2_solve", {"hipsparseDbsrsv2_solve", "rocsparse_dbsrsv_solve", CONV_LIB_FUNC, API_SPARSE, 9, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseCbsrsv2_solve", {"hipsparseCbsrsv2_solve", "rocsparse_cbsrsv_solve", CONV_LIB_FUNC, API_SPARSE, 9, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseZbsrsv2_solve", {"hipsparseZbsrsv2_solve", "rocsparse_zbsrsv_solve", CONV_LIB_FUNC, API_SPARSE, 9, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseXbsrsv2_zeroPivot", {"hipsparseXbsrsv2_zeroPivot", "rocsparse_bsrsv_zero_pivot", CONV_LIB_FUNC, API_SPARSE, 9, CUDA_DEPRECATED | HIP_DEPRECATED}}, {"cusparseScsrsv_analysis", {"hipsparseScsrsv_analysis", "", CONV_LIB_FUNC, API_SPARSE, 9, UNSUPPORTED | CUDA_DEPRECATED | CUDA_REMOVED}}, {"cusparseDcsrsv_analysis", {"hipsparseDcsrsv_analysis", "", CONV_LIB_FUNC, API_SPARSE, 9, UNSUPPORTED | CUDA_DEPRECATED | CUDA_REMOVED}}, @@ -262,25 +262,25 @@ const std::map CUDA_SPARSE_FUNCTION_MAP { {"cusparseCbsrmm", {"hipsparseCbsrmm", "rocsparse_cbsrmm", CONV_LIB_FUNC, API_SPARSE, 10}}, {"cusparseZbsrmm", {"hipsparseZbsrmm", "rocsparse_zbsrmm", CONV_LIB_FUNC, API_SPARSE, 10}}, - {"cusparseSbsrsm2_bufferSize", {"hipsparseSbsrsm2_bufferSize", "rocsparse_sbsrsm_buffer_size", CONV_LIB_FUNC, API_SPARSE, 10, CUDA_DEPRECATED}}, + {"cusparseSbsrsm2_bufferSize", {"hipsparseSbsrsm2_bufferSize", "rocsparse_sbsrsm_buffer_size", CONV_LIB_FUNC, API_SPARSE, 10, CUDA_DEPRECATED | HIP_DEPRECATED}}, {"cusparseSbsrsm2_bufferSizeExt", {"hipsparseSbsrsm2_bufferSizeExt", "", CONV_LIB_FUNC, API_SPARSE, 10, UNSUPPORTED | CUDA_DEPRECATED}}, - {"cusparseDbsrsm2_bufferSize", 
{"hipsparseDbsrsm2_bufferSize", "rocsparse_dbsrsm_buffer_size", CONV_LIB_FUNC, API_SPARSE, 10, CUDA_DEPRECATED}}, + {"cusparseDbsrsm2_bufferSize", {"hipsparseDbsrsm2_bufferSize", "rocsparse_dbsrsm_buffer_size", CONV_LIB_FUNC, API_SPARSE, 10, CUDA_DEPRECATED | HIP_DEPRECATED}}, {"cusparseDbsrsm2_bufferSizeExt", {"hipsparseDbsrsm2_bufferSizeExt", "", CONV_LIB_FUNC, API_SPARSE, 10, UNSUPPORTED | CUDA_DEPRECATED}}, - {"cusparseCbsrsm2_bufferSize", {"hipsparseCbsrsm2_bufferSize", "rocsparse_cbsrsm_buffer_size", CONV_LIB_FUNC, API_SPARSE, 10, CUDA_DEPRECATED}}, + {"cusparseCbsrsm2_bufferSize", {"hipsparseCbsrsm2_bufferSize", "rocsparse_cbsrsm_buffer_size", CONV_LIB_FUNC, API_SPARSE, 10, CUDA_DEPRECATED | HIP_DEPRECATED}}, {"cusparseCbsrsm2_bufferSizeExt", {"hipsparseCbsrsm2_bufferSizeExt", "", CONV_LIB_FUNC, API_SPARSE, 10, UNSUPPORTED | CUDA_DEPRECATED}}, - {"cusparseZbsrsm2_bufferSize", {"hipsparseZbsrsm2_bufferSize", "rocsparse_zbsrsm_buffer_size", CONV_LIB_FUNC, API_SPARSE, 10, CUDA_DEPRECATED}}, + {"cusparseZbsrsm2_bufferSize", {"hipsparseZbsrsm2_bufferSize", "rocsparse_zbsrsm_buffer_size", CONV_LIB_FUNC, API_SPARSE, 10, CUDA_DEPRECATED | HIP_DEPRECATED}}, {"cusparseZbsrsm2_bufferSizeExt", {"hipsparseZbsrsm2_bufferSizeExt", "", CONV_LIB_FUNC, API_SPARSE, 10, UNSUPPORTED | CUDA_DEPRECATED}}, - {"cusparseSbsrsm2_analysis", {"hipsparseSbsrsm2_analysis", "rocsparse_sbsrsm_analysis", CONV_LIB_FUNC, API_SPARSE, 10, CUDA_DEPRECATED}}, - {"cusparseDbsrsm2_analysis", {"hipsparseDbsrsm2_analysis", "rocsparse_dbsrsm_analysis", CONV_LIB_FUNC, API_SPARSE, 10, CUDA_DEPRECATED}}, - {"cusparseCbsrsm2_analysis", {"hipsparseCbsrsm2_analysis", "rocsparse_cbsrsm_analysis", CONV_LIB_FUNC, API_SPARSE, 10, CUDA_DEPRECATED}}, - {"cusparseZbsrsm2_analysis", {"hipsparseZbsrsm2_analysis", "rocsparse_zbsrsm_analysis", CONV_LIB_FUNC, API_SPARSE, 10, CUDA_DEPRECATED}}, + {"cusparseSbsrsm2_analysis", {"hipsparseSbsrsm2_analysis", "rocsparse_sbsrsm_analysis", CONV_LIB_FUNC, API_SPARSE, 10, 
CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseDbsrsm2_analysis", {"hipsparseDbsrsm2_analysis", "rocsparse_dbsrsm_analysis", CONV_LIB_FUNC, API_SPARSE, 10, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseCbsrsm2_analysis", {"hipsparseCbsrsm2_analysis", "rocsparse_cbsrsm_analysis", CONV_LIB_FUNC, API_SPARSE, 10, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseZbsrsm2_analysis", {"hipsparseZbsrsm2_analysis", "rocsparse_zbsrsm_analysis", CONV_LIB_FUNC, API_SPARSE, 10, CUDA_DEPRECATED | HIP_DEPRECATED}}, - {"cusparseSbsrsm2_solve", {"hipsparseSbsrsm2_solve", "rocsparse_sbsrsm_solve", CONV_LIB_FUNC, API_SPARSE, 10, CUDA_DEPRECATED}}, - {"cusparseDbsrsm2_solve", {"hipsparseDbsrsm2_solve", "rocsparse_dbsrsm_solve", CONV_LIB_FUNC, API_SPARSE, 10, CUDA_DEPRECATED}}, - {"cusparseCbsrsm2_solve", {"hipsparseCbsrsm2_solve", "rocsparse_cbsrsm_solve", CONV_LIB_FUNC, API_SPARSE, 10, CUDA_DEPRECATED}}, - {"cusparseZbsrsm2_solve", {"hipsparseZbsrsm2_solve", "rocsparse_zbsrsm_solve", CONV_LIB_FUNC, API_SPARSE, 10, CUDA_DEPRECATED}}, - {"cusparseXbsrsm2_zeroPivot", {"hipsparseXbsrsm2_zeroPivot", "rocsparse_bsrsm_zero_pivot", CONV_LIB_FUNC, API_SPARSE, 10, CUDA_DEPRECATED}}, + {"cusparseSbsrsm2_solve", {"hipsparseSbsrsm2_solve", "rocsparse_sbsrsm_solve", CONV_LIB_FUNC, API_SPARSE, 10, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseDbsrsm2_solve", {"hipsparseDbsrsm2_solve", "rocsparse_dbsrsm_solve", CONV_LIB_FUNC, API_SPARSE, 10, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseCbsrsm2_solve", {"hipsparseCbsrsm2_solve", "rocsparse_cbsrsm_solve", CONV_LIB_FUNC, API_SPARSE, 10, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseZbsrsm2_solve", {"hipsparseZbsrsm2_solve", "rocsparse_zbsrsm_solve", CONV_LIB_FUNC, API_SPARSE, 10, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseXbsrsm2_zeroPivot", {"hipsparseXbsrsm2_zeroPivot", "rocsparse_bsrsm_zero_pivot", CONV_LIB_FUNC, API_SPARSE, 10, CUDA_DEPRECATED | HIP_DEPRECATED}}, // NOTE: rocsparse_(s|d|c|z)gemmi have additional argument: 
rocsparse_mat_descr // TODO: Add rocsparse_create_mat_descr() call before rocsparse_(s|d|c|z)gemmi call and rocsparse_destroy_mat_descr() after @@ -333,46 +333,46 @@ const std::map CUDA_SPARSE_FUNCTION_MAP { {"cusparseCcsric0", {"hipsparseCcsric0", "", CONV_LIB_FUNC, API_SPARSE, 12, UNSUPPORTED | CUDA_DEPRECATED | CUDA_REMOVED}}, {"cusparseZcsric0", {"hipsparseZcsric0", "", CONV_LIB_FUNC, API_SPARSE, 12, UNSUPPORTED | CUDA_DEPRECATED | CUDA_REMOVED}}, - {"cusparseScsric02_bufferSize", {"hipsparseScsric02_bufferSize", "rocsparse_scsric0_buffer_size", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, + {"cusparseScsric02_bufferSize", {"hipsparseScsric02_bufferSize", "rocsparse_scsric0_buffer_size", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, {"cusparseScsric02_bufferSizeExt", {"hipsparseScsric02_bufferSizeExt", "rocsparse_scsric0_buffer_size", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, - {"cusparseDcsric02_bufferSize", {"hipsparseDcsric02_bufferSize", "rocsparse_dcsric0_buffer_size", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, + {"cusparseDcsric02_bufferSize", {"hipsparseDcsric02_bufferSize", "rocsparse_dcsric0_buffer_size", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, {"cusparseDcsric02_bufferSizeExt", {"hipsparseDcsric02_bufferSizeExt", "rocsparse_dcsric0_buffer_size", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, - {"cusparseCcsric02_bufferSize", {"hipsparseCcsric02_bufferSize", "rocsparse_ccsric0_buffer_size", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, + {"cusparseCcsric02_bufferSize", {"hipsparseCcsric02_bufferSize", "rocsparse_ccsric0_buffer_size", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, {"cusparseCcsric02_bufferSizeExt", {"hipsparseCcsric02_bufferSizeExt", "rocsparse_ccsric0_buffer_size", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, - {"cusparseZcsric02_bufferSize", {"hipsparseZcsric02_bufferSize", "rocsparse_zcsric0_buffer_size", CONV_LIB_FUNC, API_SPARSE, 12, 
CUDA_DEPRECATED}}, + {"cusparseZcsric02_bufferSize", {"hipsparseZcsric02_bufferSize", "rocsparse_zcsric0_buffer_size", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, {"cusparseZcsric02_bufferSizeExt", {"hipsparseZcsric02_bufferSizeExt", "rocsparse_zcsric0_buffer_size", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, - {"cusparseScsric02_analysis", {"hipsparseScsric02_analysis", "rocsparse_scsric0_analysis", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, - {"cusparseDcsric02_analysis", {"hipsparseDcsric02_analysis", "rocsparse_dcsric0_analysis", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, - {"cusparseCcsric02_analysis", {"hipsparseCcsric02_analysis", "rocsparse_ccsric0_analysis", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, - {"cusparseZcsric02_analysis", {"hipsparseZcsric02_analysis", "rocsparse_zcsric0_analysis", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, + {"cusparseScsric02_analysis", {"hipsparseScsric02_analysis", "rocsparse_scsric0_analysis", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseDcsric02_analysis", {"hipsparseDcsric02_analysis", "rocsparse_dcsric0_analysis", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseCcsric02_analysis", {"hipsparseCcsric02_analysis", "rocsparse_ccsric0_analysis", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseZcsric02_analysis", {"hipsparseZcsric02_analysis", "rocsparse_zcsric0_analysis", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, - {"cusparseScsric02", {"hipsparseScsric02", "rocsparse_scsric0", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, - {"cusparseDcsric02", {"hipsparseDcsric02", "rocsparse_dcsric0", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, - {"cusparseCcsric02", {"hipsparseCcsric02", "rocsparse_ccsric0", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, - {"cusparseZcsric02", {"hipsparseZcsric02", "rocsparse_zcsric0", CONV_LIB_FUNC, API_SPARSE, 12, 
CUDA_DEPRECATED}}, + {"cusparseScsric02", {"hipsparseScsric02", "rocsparse_scsric0", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseDcsric02", {"hipsparseDcsric02", "rocsparse_dcsric0", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseCcsric02", {"hipsparseCcsric02", "rocsparse_ccsric0", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseZcsric02", {"hipsparseZcsric02", "rocsparse_zcsric0", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, - {"cusparseXcsric02_zeroPivot", {"hipsparseXcsric02_zeroPivot", "rocsparse_csric0_zero_pivot", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, - {"cusparseSbsric02_bufferSize", {"hipsparseSbsric02_bufferSize", "rocsparse_sbsric0_buffer_size", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, + {"cusparseXcsric02_zeroPivot", {"hipsparseXcsric02_zeroPivot", "rocsparse_csric0_zero_pivot", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseSbsric02_bufferSize", {"hipsparseSbsric02_bufferSize", "rocsparse_sbsric0_buffer_size", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, {"cusparseSbsric02_bufferSizeExt", {"hipsparseSbsric02_bufferSizeExt", "", CONV_LIB_FUNC, API_SPARSE, 12, UNSUPPORTED | CUDA_DEPRECATED}}, - {"cusparseDbsric02_bufferSize", {"hipsparseDbsric02_bufferSize", "rocsparse_dbsric0_buffer_size", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, + {"cusparseDbsric02_bufferSize", {"hipsparseDbsric02_bufferSize", "rocsparse_dbsric0_buffer_size", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, {"cusparseDbsric02_bufferSizeExt", {"hipsparseDbsric02_bufferSizeExt", "", CONV_LIB_FUNC, API_SPARSE, 12, UNSUPPORTED | CUDA_DEPRECATED}}, - {"cusparseCbsric02_bufferSize", {"hipsparseCbsric02_bufferSize", "rocsparse_cbsric0_buffer_size", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, + {"cusparseCbsric02_bufferSize", {"hipsparseCbsric02_bufferSize", 
"rocsparse_cbsric0_buffer_size", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, {"cusparseCbsric02_bufferSizeExt", {"hipsparseCbsric02_bufferSizeExt", "", CONV_LIB_FUNC, API_SPARSE, 12, UNSUPPORTED | CUDA_DEPRECATED}}, - {"cusparseZbsric02_bufferSize", {"hipsparseZbsric02_bufferSize", "rocsparse_zbsric0_buffer_size", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, + {"cusparseZbsric02_bufferSize", {"hipsparseZbsric02_bufferSize", "rocsparse_zbsric0_buffer_size", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, {"cusparseZbsric02_bufferSizeExt", {"hipsparseZbsric02_bufferSizeExt", "", CONV_LIB_FUNC, API_SPARSE, 12, UNSUPPORTED | CUDA_DEPRECATED}}, - {"cusparseSbsric02_analysis", {"hipsparseSbsric02_analysis", "rocsparse_sbsric0_analysis", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, - {"cusparseDbsric02_analysis", {"hipsparseDbsric02_analysis", "rocsparse_dbsric0_analysis", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, - {"cusparseCbsric02_analysis", {"hipsparseCbsric02_analysis", "rocsparse_cbsric0_analysis", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, - {"cusparseZbsric02_analysis", {"hipsparseZbsric02_analysis", "rocsparse_zbsric0_analysis", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, + {"cusparseSbsric02_analysis", {"hipsparseSbsric02_analysis", "rocsparse_sbsric0_analysis", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseDbsric02_analysis", {"hipsparseDbsric02_analysis", "rocsparse_dbsric0_analysis", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseCbsric02_analysis", {"hipsparseCbsric02_analysis", "rocsparse_cbsric0_analysis", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseZbsric02_analysis", {"hipsparseZbsric02_analysis", "rocsparse_zbsric0_analysis", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, - {"cusparseSbsric02", {"hipsparseSbsric02", "rocsparse_sbsric0", CONV_LIB_FUNC, API_SPARSE, 
12, CUDA_DEPRECATED}}, - {"cusparseDbsric02", {"hipsparseDbsric02", "rocsparse_dbsric0", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, - {"cusparseCbsric02", {"hipsparseCbsric02", "rocsparse_cbsric0", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, - {"cusparseZbsric02", {"hipsparseZbsric02", "rocsparse_zbsric0", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, + {"cusparseSbsric02", {"hipsparseSbsric02", "rocsparse_sbsric0", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseDbsric02", {"hipsparseDbsric02", "rocsparse_dbsric0", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseCbsric02", {"hipsparseCbsric02", "rocsparse_cbsric0", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseZbsric02", {"hipsparseZbsric02", "rocsparse_zbsric0", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, // TODO: rocsparse_get_stream and hipStreamSynchronize need to be added correspondingly before and after rocsparse_bsric0_zero_pivot call, because cusparseXbsric02_zeroPivot is blocking, and rocsparse_bsric0_zero_pivot is not - {"cusparseXbsric02_zeroPivot", {"hipsparseXbsric02_zeroPivot", "rocsparse_bsric0_zero_pivot", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, + {"cusparseXbsric02_zeroPivot", {"hipsparseXbsric02_zeroPivot", "rocsparse_bsric0_zero_pivot", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, // 12.2. 
Incomplete LU Factorization: level 0 // NOTE: rocsparse_(s|d|c|z)csrilu0 have different signatures, thus they are also unsupported yet @@ -382,55 +382,55 @@ const std::map CUDA_SPARSE_FUNCTION_MAP { {"cusparseZcsrilu0", {"hipsparseZcsrilu0", "", CONV_LIB_FUNC, API_SPARSE, 12, UNSUPPORTED | CUDA_DEPRECATED | CUDA_REMOVED}}, {"cusparseCsrilu0Ex", {"hipsparseCsrilu0Ex", "", CONV_LIB_FUNC, API_SPARSE, 12, UNSUPPORTED | CUDA_DEPRECATED | CUDA_REMOVED}}, - {"cusparseScsrilu02_numericBoost", {"hipsparseScsrilu02_numericBoost", "rocsparse_dscsrilu0_numeric_boost", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, - {"cusparseDcsrilu02_numericBoost", {"hipsparseDcsrilu02_numericBoost", "rocsparse_dcsrilu0_numeric_boost", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, - {"cusparseCcsrilu02_numericBoost", {"hipsparseCcsrilu02_numericBoost", "rocsparse_dccsrilu0_numeric_boost", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, - {"cusparseZcsrilu02_numericBoost", {"hipsparseZcsrilu02_numericBoost", "rocsparse_zcsrilu0_numeric_boost", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, + {"cusparseScsrilu02_numericBoost", {"hipsparseScsrilu02_numericBoost", "rocsparse_dscsrilu0_numeric_boost", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseDcsrilu02_numericBoost", {"hipsparseDcsrilu02_numericBoost", "rocsparse_dcsrilu0_numeric_boost", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseCcsrilu02_numericBoost", {"hipsparseCcsrilu02_numericBoost", "rocsparse_dccsrilu0_numeric_boost", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseZcsrilu02_numericBoost", {"hipsparseZcsrilu02_numericBoost", "rocsparse_zcsrilu0_numeric_boost", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, - {"cusparseScsrilu02_bufferSize", {"hipsparseScsrilu02_bufferSize", "rocsparse_scsrilu0_buffer_size", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, + {"cusparseScsrilu02_bufferSize", 
{"hipsparseScsrilu02_bufferSize", "rocsparse_scsrilu0_buffer_size", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, {"cusparseScsrilu02_bufferSizeExt", {"hipsparseScsrilu02_bufferSizeExt", "rocsparse_scsrilu0_buffer_size", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, - {"cusparseDcsrilu02_bufferSize", {"hipsparseDcsrilu02_bufferSize", "rocsparse_dcsrilu0_buffer_size", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, + {"cusparseDcsrilu02_bufferSize", {"hipsparseDcsrilu02_bufferSize", "rocsparse_dcsrilu0_buffer_size", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, {"cusparseDcsrilu02_bufferSizeExt", {"hipsparseDcsrilu02_bufferSizeExt", "rocsparse_dcsrilu0_buffer_size", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, - {"cusparseCcsrilu02_bufferSize", {"hipsparseCcsrilu02_bufferSize", "rocsparse_ccsrilu0_buffer_size", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, + {"cusparseCcsrilu02_bufferSize", {"hipsparseCcsrilu02_bufferSize", "rocsparse_ccsrilu0_buffer_size", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, {"cusparseCcsrilu02_bufferSizeExt", {"hipsparseCcsrilu02_bufferSizeExt", "rocsparse_ccsrilu0_buffer_size", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, - {"cusparseZcsrilu02_bufferSize", {"hipsparseZcsrilu02_bufferSize", "rocsparse_zcsrilu0_buffer_size", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, + {"cusparseZcsrilu02_bufferSize", {"hipsparseZcsrilu02_bufferSize", "rocsparse_zcsrilu0_buffer_size", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, {"cusparseZcsrilu02_bufferSizeExt", {"hipsparseZcsrilu02_bufferSizeExt", "rocsparse_zcsrilu0_buffer_size", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, - {"cusparseScsrilu02_analysis", {"hipsparseScsrilu02_analysis", "rocsparse_scsrilu0_analysis", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, - {"cusparseDcsrilu02_analysis", {"hipsparseDcsrilu02_analysis", "rocsparse_dcsrilu0_analysis", CONV_LIB_FUNC, 
API_SPARSE, 12, CUDA_DEPRECATED}}, - {"cusparseCcsrilu02_analysis", {"hipsparseCcsrilu02_analysis", "rocsparse_ccsrilu0_analysis", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, - {"cusparseZcsrilu02_analysis", {"hipsparseZcsrilu02_analysis", "rocsparse_zcsrilu0_analysis", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, + {"cusparseScsrilu02_analysis", {"hipsparseScsrilu02_analysis", "rocsparse_scsrilu0_analysis", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseDcsrilu02_analysis", {"hipsparseDcsrilu02_analysis", "rocsparse_dcsrilu0_analysis", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseCcsrilu02_analysis", {"hipsparseCcsrilu02_analysis", "rocsparse_ccsrilu0_analysis", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseZcsrilu02_analysis", {"hipsparseZcsrilu02_analysis", "rocsparse_zcsrilu0_analysis", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, - {"cusparseScsrilu02", {"hipsparseScsrilu02", "rocsparse_scsrilu0", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, - {"cusparseDcsrilu02", {"hipsparseDcsrilu02", "rocsparse_dcsrilu0", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, - {"cusparseCcsrilu02", {"hipsparseCcsrilu02", "rocsparse_ccsrilu0", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, - {"cusparseZcsrilu02", {"hipsparseZcsrilu02", "rocsparse_zcsrilu0", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, - {"cusparseXcsrilu02_zeroPivot", {"hipsparseXcsrilu02_zeroPivot", "rocsparse_csrilu0_zero_pivot", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, + {"cusparseScsrilu02", {"hipsparseScsrilu02", "rocsparse_scsrilu0", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseDcsrilu02", {"hipsparseDcsrilu02", "rocsparse_dcsrilu0", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseCcsrilu02", {"hipsparseCcsrilu02", "rocsparse_ccsrilu0", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | 
HIP_DEPRECATED}}, + {"cusparseZcsrilu02", {"hipsparseZcsrilu02", "rocsparse_zcsrilu0", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseXcsrilu02_zeroPivot", {"hipsparseXcsrilu02_zeroPivot", "rocsparse_csrilu0_zero_pivot", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, - {"cusparseSbsrilu02_numericBoost", {"hipsparseSbsrilu02_numericBoost", "rocsparse_dsbsrilu0_numeric_boost", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, - {"cusparseDbsrilu02_numericBoost", {"hipsparseDbsrilu02_numericBoost", "rocsparse_dbsrilu0_numeric_boost", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, - {"cusparseCbsrilu02_numericBoost", {"hipsparseCbsrilu02_numericBoost", "rocsparse_dcbsrilu0_numeric_boost", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, - {"cusparseZbsrilu02_numericBoost", {"hipsparseZbsrilu02_numericBoost", "rocsparse_zbsrilu0_numeric_boost", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, + {"cusparseSbsrilu02_numericBoost", {"hipsparseSbsrilu02_numericBoost", "rocsparse_dsbsrilu0_numeric_boost", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseDbsrilu02_numericBoost", {"hipsparseDbsrilu02_numericBoost", "rocsparse_dbsrilu0_numeric_boost", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseCbsrilu02_numericBoost", {"hipsparseCbsrilu02_numericBoost", "rocsparse_dcbsrilu0_numeric_boost", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseZbsrilu02_numericBoost", {"hipsparseZbsrilu02_numericBoost", "rocsparse_zbsrilu0_numeric_boost", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, - {"cusparseSbsrilu02_bufferSize", {"hipsparseSbsrilu02_bufferSize", "rocsparse_sbsrilu0_buffer_size", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, + {"cusparseSbsrilu02_bufferSize", {"hipsparseSbsrilu02_bufferSize", "rocsparse_sbsrilu0_buffer_size", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, 
{"cusparseSbsrilu02_bufferSizeExt", {"hipsparseSbsrilu02_bufferSizeExt", "", CONV_LIB_FUNC, API_SPARSE, 12, UNSUPPORTED | CUDA_DEPRECATED}}, - {"cusparseDbsrilu02_bufferSize", {"hipsparseDbsrilu02_bufferSize", "rocsparse_dbsrilu0_buffer_size", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, + {"cusparseDbsrilu02_bufferSize", {"hipsparseDbsrilu02_bufferSize", "rocsparse_dbsrilu0_buffer_size", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, {"cusparseDbsrilu02_bufferSizeExt", {"hipsparseDbsrilu02_bufferSizeExt", "", CONV_LIB_FUNC, API_SPARSE, 12, UNSUPPORTED | CUDA_DEPRECATED}}, - {"cusparseCbsrilu02_bufferSize", {"hipsparseCbsrilu02_bufferSize", "rocsparse_cbsrilu0_buffer_size", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, + {"cusparseCbsrilu02_bufferSize", {"hipsparseCbsrilu02_bufferSize", "rocsparse_cbsrilu0_buffer_size", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, {"cusparseCbsrilu02_bufferSizeExt", {"hipsparseCbsrilu02_bufferSizeExt", "", CONV_LIB_FUNC, API_SPARSE, 12, UNSUPPORTED | CUDA_DEPRECATED}}, - {"cusparseZbsrilu02_bufferSize", {"hipsparseZbsrilu02_bufferSize", "rocsparse_zbsrilu0_buffer_size", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, + {"cusparseZbsrilu02_bufferSize", {"hipsparseZbsrilu02_bufferSize", "rocsparse_zbsrilu0_buffer_size", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, {"cusparseZbsrilu02_bufferSizeExt", {"hipsparseZbsrilu02_bufferSizeExt", "", CONV_LIB_FUNC, API_SPARSE, 12, UNSUPPORTED | CUDA_DEPRECATED}}, - {"cusparseSbsrilu02_analysis", {"hipsparseSbsrilu02_analysis", "rocsparse_sbsrilu0_analysis", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, - {"cusparseDbsrilu02_analysis", {"hipsparseDbsrilu02_analysis", "rocsparse_dbsrilu0_analysis", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, - {"cusparseCbsrilu02_analysis", {"hipsparseCbsrilu02_analysis", "rocsparse_cbsrilu0_analysis", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, - 
{"cusparseZbsrilu02_analysis", {"hipsparseZbsrilu02_analysis", "rocsparse_zbsrilu0_analysis", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, + {"cusparseSbsrilu02_analysis", {"hipsparseSbsrilu02_analysis", "rocsparse_sbsrilu0_analysis", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseDbsrilu02_analysis", {"hipsparseDbsrilu02_analysis", "rocsparse_dbsrilu0_analysis", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseCbsrilu02_analysis", {"hipsparseCbsrilu02_analysis", "rocsparse_cbsrilu0_analysis", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseZbsrilu02_analysis", {"hipsparseZbsrilu02_analysis", "rocsparse_zbsrilu0_analysis", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, - {"cusparseSbsrilu02", {"hipsparseSbsrilu02", "rocsparse_sbsrilu0", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, - {"cusparseDbsrilu02", {"hipsparseDbsrilu02", "rocsparse_dbsrilu0", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, - {"cusparseCbsrilu02", {"hipsparseCbsrilu02", "rocsparse_cbsrilu0", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, - {"cusparseZbsrilu02", {"hipsparseZbsrilu02", "rocsparse_zbsrilu0", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, - {"cusparseXbsrilu02_zeroPivot", {"hipsparseXbsrilu02_zeroPivot", "rocsparse_bsrilu0_zero_pivot", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED}}, + {"cusparseSbsrilu02", {"hipsparseSbsrilu02", "rocsparse_sbsrilu0", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseDbsrilu02", {"hipsparseDbsrilu02", "rocsparse_dbsrilu0", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseCbsrilu02", {"hipsparseCbsrilu02", "rocsparse_cbsrilu0", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseZbsrilu02", {"hipsparseZbsrilu02", "rocsparse_zbsrilu0", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseXbsrilu02_zeroPivot", 
{"hipsparseXbsrilu02_zeroPivot", "rocsparse_bsrilu0_zero_pivot", CONV_LIB_FUNC, API_SPARSE, 12, CUDA_DEPRECATED | HIP_DEPRECATED}}, // 12.3. Tridiagonal Solve // NOTE: rocsparse_(s|d|c|z)gtsv have an additional parameter void* temp_buffer @@ -503,10 +503,10 @@ const std::map CUDA_SPARSE_FUNCTION_MAP { {"cusparseZgpsvInterleavedBatch", {"hipsparseZgpsvInterleavedBatch", "rocsparse_zgpsv_interleaved_batch", CONV_LIB_FUNC, API_SPARSE, 12}}, // 13. cuSPARSE Matrix Reorderings Reference - {"cusparseScsrcolor", {"hipsparseScsrcolor", "rocsparse_scsrcolor", CONV_LIB_FUNC, API_SPARSE, 13, CUDA_DEPRECATED}}, - {"cusparseDcsrcolor", {"hipsparseDcsrcolor", "rocsparse_dcsrcolor", CONV_LIB_FUNC, API_SPARSE, 13, CUDA_DEPRECATED}}, - {"cusparseCcsrcolor", {"hipsparseCcsrcolor", "rocsparse_ccsrcolor", CONV_LIB_FUNC, API_SPARSE, 13, CUDA_DEPRECATED}}, - {"cusparseZcsrcolor", {"hipsparseZcsrcolor", "rocsparse_zcsrcolor", CONV_LIB_FUNC, API_SPARSE, 13, CUDA_DEPRECATED}}, + {"cusparseScsrcolor", {"hipsparseScsrcolor", "rocsparse_scsrcolor", CONV_LIB_FUNC, API_SPARSE, 13, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseDcsrcolor", {"hipsparseDcsrcolor", "rocsparse_dcsrcolor", CONV_LIB_FUNC, API_SPARSE, 13, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseCcsrcolor", {"hipsparseCcsrcolor", "rocsparse_ccsrcolor", CONV_LIB_FUNC, API_SPARSE, 13, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseZcsrcolor", {"hipsparseZcsrcolor", "rocsparse_zcsrcolor", CONV_LIB_FUNC, API_SPARSE, 13, CUDA_DEPRECATED | HIP_DEPRECATED}}, // 14. 
cuSPARSE Format Conversion Reference {"cusparseSbsr2csr", {"hipsparseSbsr2csr", "rocsparse_sbsr2csr", CONV_LIB_FUNC, API_SPARSE, 14}}, @@ -647,7 +647,7 @@ const std::map CUDA_SPARSE_FUNCTION_MAP { {"cusparseCnnz", {"hipsparseCnnz", "rocsparse_cnnz", CONV_LIB_FUNC, API_SPARSE, 14}}, {"cusparseZnnz", {"hipsparseZnnz", "rocsparse_znnz", CONV_LIB_FUNC, API_SPARSE, 14}}, - {"cusparseCreateIdentityPermutation", {"hipsparseCreateIdentityPermutation", "rocsparse_create_identity_permutation", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED}}, + {"cusparseCreateIdentityPermutation", {"hipsparseCreateIdentityPermutation", "rocsparse_create_identity_permutation", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED | HIP_DEPRECATED}}, {"cusparseXcoosort_bufferSizeExt", {"hipsparseXcoosort_bufferSizeExt", "rocsparse_coosort_buffer_size", CONV_LIB_FUNC, API_SPARSE, 14}}, {"cusparseXcoosortByRow", {"hipsparseXcoosortByRow", "rocsparse_coosort_by_row", CONV_LIB_FUNC, API_SPARSE, 14}}, @@ -662,73 +662,73 @@ const std::map CUDA_SPARSE_FUNCTION_MAP { {"cusparseCreateCsru2csrInfo", {"hipsparseCreateCsru2csrInfo", "", CONV_LIB_FUNC, API_SPARSE, 14, ROC_UNSUPPORTED | CUDA_DEPRECATED}}, {"cusparseDestroyCsru2csrInfo", {"hipsparseDestroyCsru2csrInfo", "", CONV_LIB_FUNC, API_SPARSE, 14, ROC_UNSUPPORTED | CUDA_DEPRECATED}}, - {"cusparseScsru2csr", {"hipsparseScsru2csr", "", CONV_LIB_FUNC, API_SPARSE, 14, ROC_UNSUPPORTED | CUDA_DEPRECATED}}, - {"cusparseDcsru2csr", {"hipsparseDcsru2csr", "", CONV_LIB_FUNC, API_SPARSE, 14, ROC_UNSUPPORTED | CUDA_DEPRECATED}}, - {"cusparseCcsru2csr", {"hipsparseCcsru2csr", "", CONV_LIB_FUNC, API_SPARSE, 14, ROC_UNSUPPORTED | CUDA_DEPRECATED}}, - {"cusparseZcsru2csr", {"hipsparseZcsru2csr", "", CONV_LIB_FUNC, API_SPARSE, 14, ROC_UNSUPPORTED | CUDA_DEPRECATED}}, + {"cusparseScsru2csr", {"hipsparseScsru2csr", "", CONV_LIB_FUNC, API_SPARSE, 14, ROC_UNSUPPORTED | CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseDcsru2csr", {"hipsparseDcsru2csr", "", CONV_LIB_FUNC, 
API_SPARSE, 14, ROC_UNSUPPORTED | CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseCcsru2csr", {"hipsparseCcsru2csr", "", CONV_LIB_FUNC, API_SPARSE, 14, ROC_UNSUPPORTED | CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseZcsru2csr", {"hipsparseZcsru2csr", "", CONV_LIB_FUNC, API_SPARSE, 14, ROC_UNSUPPORTED | CUDA_DEPRECATED | HIP_DEPRECATED}}, - {"cusparseScsru2csr_bufferSizeExt", {"hipsparseScsru2csr_bufferSizeExt", "", CONV_LIB_FUNC, API_SPARSE, 14, ROC_UNSUPPORTED | CUDA_DEPRECATED}}, - {"cusparseDcsru2csr_bufferSizeExt", {"hipsparseDcsru2csr_bufferSizeExt", "", CONV_LIB_FUNC, API_SPARSE, 14, ROC_UNSUPPORTED | CUDA_DEPRECATED}}, - {"cusparseCcsru2csr_bufferSizeExt", {"hipsparseCcsru2csr_bufferSizeExt", "", CONV_LIB_FUNC, API_SPARSE, 14, ROC_UNSUPPORTED | CUDA_DEPRECATED}}, - {"cusparseZcsru2csr_bufferSizeExt", {"hipsparseZcsru2csr_bufferSizeExt", "", CONV_LIB_FUNC, API_SPARSE, 14, ROC_UNSUPPORTED | CUDA_DEPRECATED}}, + {"cusparseScsru2csr_bufferSizeExt", {"hipsparseScsru2csr_bufferSizeExt", "", CONV_LIB_FUNC, API_SPARSE, 14, ROC_UNSUPPORTED | CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseDcsru2csr_bufferSizeExt", {"hipsparseDcsru2csr_bufferSizeExt", "", CONV_LIB_FUNC, API_SPARSE, 14, ROC_UNSUPPORTED | CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseCcsru2csr_bufferSizeExt", {"hipsparseCcsru2csr_bufferSizeExt", "", CONV_LIB_FUNC, API_SPARSE, 14, ROC_UNSUPPORTED | CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseZcsru2csr_bufferSizeExt", {"hipsparseZcsru2csr_bufferSizeExt", "", CONV_LIB_FUNC, API_SPARSE, 14, ROC_UNSUPPORTED | CUDA_DEPRECATED | HIP_DEPRECATED}}, - {"cusparseScsr2csru", {"hipsparseScsr2csru", "", CONV_LIB_FUNC, API_SPARSE, 14, ROC_UNSUPPORTED | CUDA_DEPRECATED}}, - {"cusparseDcsr2csru", {"hipsparseDcsr2csru", "", CONV_LIB_FUNC, API_SPARSE, 14, ROC_UNSUPPORTED | CUDA_DEPRECATED}}, - {"cusparseCcsr2csru", {"hipsparseCcsr2csru", "", CONV_LIB_FUNC, API_SPARSE, 14, ROC_UNSUPPORTED | CUDA_DEPRECATED}}, - {"cusparseZcsr2csru", {"hipsparseZcsr2csru", "", 
CONV_LIB_FUNC, API_SPARSE, 14, ROC_UNSUPPORTED | CUDA_DEPRECATED}}, + {"cusparseScsr2csru", {"hipsparseScsr2csru", "", CONV_LIB_FUNC, API_SPARSE, 14, ROC_UNSUPPORTED | CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseDcsr2csru", {"hipsparseDcsr2csru", "", CONV_LIB_FUNC, API_SPARSE, 14, ROC_UNSUPPORTED | CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseCcsr2csru", {"hipsparseCcsr2csru", "", CONV_LIB_FUNC, API_SPARSE, 14, ROC_UNSUPPORTED | CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseZcsr2csru", {"hipsparseZcsr2csru", "", CONV_LIB_FUNC, API_SPARSE, 14, ROC_UNSUPPORTED | CUDA_DEPRECATED | HIP_DEPRECATED}}, {"cusparseHpruneDense2csr", {"hipsparseHpruneDense2csr", "", CONV_LIB_FUNC, API_SPARSE, 14, UNSUPPORTED | CUDA_DEPRECATED}}, - {"cusparseSpruneDense2csr", {"hipsparseSpruneDense2csr", "rocsparse_sprune_dense2csr", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED}}, - {"cusparseDpruneDense2csr", {"hipsparseDpruneDense2csr", "rocsparse_dprune_dense2csr", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED}}, + {"cusparseSpruneDense2csr", {"hipsparseSpruneDense2csr", "rocsparse_sprune_dense2csr", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseDpruneDense2csr", {"hipsparseDpruneDense2csr", "rocsparse_dprune_dense2csr", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED | HIP_DEPRECATED}}, {"cusparseHpruneDense2csr_bufferSizeExt", {"hipsparseHpruneDense2csr_bufferSizeExt", "", CONV_LIB_FUNC, API_SPARSE, 14, UNSUPPORTED | CUDA_DEPRECATED}}, {"cusparseSpruneDense2csr_bufferSizeExt", {"hipsparseSpruneDense2csr_bufferSizeExt", "rocsparse_sprune_dense2csr_buffer_size", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED}}, {"cusparseDpruneDense2csr_bufferSizeExt", {"hipsparseDpruneDense2csr_bufferSizeExt", "rocsparse_dprune_dense2csr_buffer_size", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED}}, {"cusparseHpruneDense2csrNnz", {"hipsparseHpruneDense2csrNnz", "", CONV_LIB_FUNC, API_SPARSE, 14, UNSUPPORTED | CUDA_DEPRECATED}}, - {"cusparseSpruneDense2csrNnz", 
{"hipsparseSpruneDense2csrNnz", "rocsparse_sprune_dense2csr_nnz", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED}}, - {"cusparseDpruneDense2csrNnz", {"hipsparseDpruneDense2csrNnz", "rocsparse_dprune_dense2csr_nnz", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED}}, + {"cusparseSpruneDense2csrNnz", {"hipsparseSpruneDense2csrNnz", "rocsparse_sprune_dense2csr_nnz", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseDpruneDense2csrNnz", {"hipsparseDpruneDense2csrNnz", "rocsparse_dprune_dense2csr_nnz", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED | HIP_DEPRECATED}}, {"cusparseHpruneCsr2csr", {"hipsparseHpruneCsr2csr", "", CONV_LIB_FUNC, API_SPARSE, 14, UNSUPPORTED | CUDA_DEPRECATED}}, - {"cusparseSpruneCsr2csr", {"hipsparseSpruneCsr2csr", "rocsparse_sprune_csr2csr", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED}}, - {"cusparseDpruneCsr2csr", {"hipsparseDpruneCsr2csr", "rocsparse_dprune_csr2csr", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED}}, + {"cusparseSpruneCsr2csr", {"hipsparseSpruneCsr2csr", "rocsparse_sprune_csr2csr", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseDpruneCsr2csr", {"hipsparseDpruneCsr2csr", "rocsparse_dprune_csr2csr", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED | HIP_DEPRECATED}}, {"cusparseHpruneCsr2csr_bufferSizeExt", {"hipsparseHpruneCsr2csr_bufferSizeExt", "", CONV_LIB_FUNC, API_SPARSE, 14, UNSUPPORTED | CUDA_DEPRECATED}}, - {"cusparseSpruneCsr2csr_bufferSizeExt", {"hipsparseSpruneCsr2csr_bufferSizeExt", "rocsparse_sprune_csr2csr_buffer_size", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED}}, - {"cusparseDpruneCsr2csr_bufferSizeExt", {"hipsparseDpruneCsr2csr_bufferSizeExt", "rocsparse_dprune_csr2csr_buffer_size", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED}}, + {"cusparseSpruneCsr2csr_bufferSizeExt", {"hipsparseSpruneCsr2csr_bufferSizeExt", "rocsparse_sprune_csr2csr_buffer_size", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED | HIP_DEPRECATED}}, + 
{"cusparseDpruneCsr2csr_bufferSizeExt", {"hipsparseDpruneCsr2csr_bufferSizeExt", "rocsparse_dprune_csr2csr_buffer_size", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED | HIP_DEPRECATED}}, {"cusparseHpruneCsr2csrNnz", {"hipsparseHpruneCsr2csrNnz", "", CONV_LIB_FUNC, API_SPARSE, 14, UNSUPPORTED | CUDA_DEPRECATED}}, - {"cusparseSpruneCsr2csrNnz", {"hipsparseSpruneCsr2csrNnz", "rocsparse_sprune_csr2csr_nnz", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED}}, - {"cusparseDpruneCsr2csrNnz", {"hipsparseDpruneCsr2csrNnz", "rocsparse_dprune_csr2csr_nnz", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED}}, + {"cusparseSpruneCsr2csrNnz", {"hipsparseSpruneCsr2csrNnz", "rocsparse_sprune_csr2csr_nnz", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseDpruneCsr2csrNnz", {"hipsparseDpruneCsr2csrNnz", "rocsparse_dprune_csr2csr_nnz", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED | HIP_DEPRECATED}}, {"cusparseHpruneDense2csrByPercentage", {"hipsparseHpruneDense2csrByPercentage", "", CONV_LIB_FUNC, API_SPARSE, 14, UNSUPPORTED | CUDA_DEPRECATED}}, - {"cusparseSpruneDense2csrByPercentage", {"hipsparseSpruneDense2csrByPercentage", "rocsparse_sprune_dense2csr_by_percentage", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED}}, - {"cusparseDpruneDense2csrByPercentage", {"hipsparseDpruneDense2csrByPercentage", "rocsparse_dprune_dense2csr_by_percentage", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED}}, + {"cusparseSpruneDense2csrByPercentage", {"hipsparseSpruneDense2csrByPercentage", "rocsparse_sprune_dense2csr_by_percentage", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseDpruneDense2csrByPercentage", {"hipsparseDpruneDense2csrByPercentage", "rocsparse_dprune_dense2csr_by_percentage", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED | HIP_DEPRECATED}}, {"cusparseHpruneDense2csrByPercentage_bufferSizeExt", {"hipsparseHpruneDense2csrByPercentage_bufferSizeExt", "", CONV_LIB_FUNC, API_SPARSE, 14, UNSUPPORTED | CUDA_DEPRECATED}}, - 
{"cusparseSpruneDense2csrByPercentage_bufferSizeExt", {"hipsparseSpruneDense2csrByPercentage_bufferSizeExt", "rocsparse_sprune_dense2csr_by_percentage_buffer_size", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED}}, - {"cusparseDpruneDense2csrByPercentage_bufferSizeExt", {"hipsparseDpruneDense2csrByPercentage_bufferSizeExt", "rocsparse_dprune_dense2csr_by_percentage_buffer_size", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED}}, + {"cusparseSpruneDense2csrByPercentage_bufferSizeExt", {"hipsparseSpruneDense2csrByPercentage_bufferSizeExt", "rocsparse_sprune_dense2csr_by_percentage_buffer_size", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseDpruneDense2csrByPercentage_bufferSizeExt", {"hipsparseDpruneDense2csrByPercentage_bufferSizeExt", "rocsparse_dprune_dense2csr_by_percentage_buffer_size", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED | HIP_DEPRECATED}}, {"cusparseHpruneDense2csrNnzByPercentage", {"hipsparseHpruneDense2csrNnzByPercentage", "", CONV_LIB_FUNC, API_SPARSE, 14, UNSUPPORTED | CUDA_DEPRECATED}}, - {"cusparseSpruneDense2csrNnzByPercentage", {"hipsparseSpruneDense2csrNnzByPercentage", "rocsparse_sprune_dense2csr_nnz_by_percentage", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED}}, - {"cusparseDpruneDense2csrNnzByPercentage", {"hipsparseDpruneDense2csrNnzByPercentage", "rocsparse_dprune_dense2csr_nnz_by_percentage", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED}}, + {"cusparseSpruneDense2csrNnzByPercentage", {"hipsparseSpruneDense2csrNnzByPercentage", "rocsparse_sprune_dense2csr_nnz_by_percentage", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseDpruneDense2csrNnzByPercentage", {"hipsparseDpruneDense2csrNnzByPercentage", "rocsparse_dprune_dense2csr_nnz_by_percentage", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED | HIP_DEPRECATED}}, {"cusparseHpruneCsr2csrByPercentage", {"hipsparseHpruneCsr2csrByPercentage", "", CONV_LIB_FUNC, API_SPARSE, 14, UNSUPPORTED | CUDA_DEPRECATED}}, - 
{"cusparseSpruneCsr2csrByPercentage", {"hipsparseSpruneCsr2csrByPercentage", "rocsparse_sprune_csr2csr_by_percentage", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED}}, - {"cusparseDpruneCsr2csrByPercentage", {"hipsparseDpruneCsr2csrByPercentage", "rocsparse_dprune_csr2csr_by_percentage", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED}}, + {"cusparseSpruneCsr2csrByPercentage", {"hipsparseSpruneCsr2csrByPercentage", "rocsparse_sprune_csr2csr_by_percentage", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseDpruneCsr2csrByPercentage", {"hipsparseDpruneCsr2csrByPercentage", "rocsparse_dprune_csr2csr_by_percentage", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED | HIP_DEPRECATED}}, {"cusparseHpruneCsr2csrByPercentage_bufferSizeExt", {"hipsparseHpruneCsr2csrByPercentage_bufferSizeExt", "", CONV_LIB_FUNC, API_SPARSE, 14, UNSUPPORTED | CUDA_DEPRECATED}}, - {"cusparseSpruneCsr2csrByPercentage_bufferSizeExt", {"hipsparseSpruneCsr2csrByPercentage_bufferSizeExt", "rocsparse_sprune_csr2csr_by_percentage_buffer_size", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED}}, - {"cusparseDpruneCsr2csrByPercentage_bufferSizeExt", {"hipsparseDpruneCsr2csrByPercentage_bufferSizeExt", "rocsparse_dprune_csr2csr_by_percentage_buffer_size", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED}}, + {"cusparseSpruneCsr2csrByPercentage_bufferSizeExt", {"hipsparseSpruneCsr2csrByPercentage_bufferSizeExt", "rocsparse_sprune_csr2csr_by_percentage_buffer_size", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseDpruneCsr2csrByPercentage_bufferSizeExt", {"hipsparseDpruneCsr2csrByPercentage_bufferSizeExt", "rocsparse_dprune_csr2csr_by_percentage_buffer_size", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED | HIP_DEPRECATED}}, {"cusparseHpruneCsr2csrNnzByPercentage", {"hipsparseHpruneCsr2csrNnzByPercentage", "", CONV_LIB_FUNC, API_SPARSE, 14, UNSUPPORTED | CUDA_DEPRECATED}}, - {"cusparseSpruneCsr2csrNnzByPercentage", 
{"hipsparseSpruneCsr2csrNnzByPercentage", "rocsparse_sprune_csr2csr_nnz_by_percentage", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED}}, - {"cusparseDpruneCsr2csrNnzByPercentage", {"hipsparseDpruneCsr2csrNnzByPercentage", "rocsparse_dprune_csr2csr_nnz_by_percentage", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED}}, + {"cusparseSpruneCsr2csrNnzByPercentage", {"hipsparseSpruneCsr2csrNnzByPercentage", "rocsparse_sprune_csr2csr_nnz_by_percentage", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseDpruneCsr2csrNnzByPercentage", {"hipsparseDpruneCsr2csrNnzByPercentage", "rocsparse_dprune_csr2csr_nnz_by_percentage", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED | HIP_DEPRECATED}}, - {"cusparseSnnz_compress", {"hipsparseSnnz_compress", "rocsparse_snnz_compress", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED}}, - {"cusparseDnnz_compress", {"hipsparseDnnz_compress", "rocsparse_dnnz_compress", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED}}, - {"cusparseCnnz_compress", {"hipsparseCnnz_compress", "rocsparse_cnnz_compress", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED}}, - {"cusparseZnnz_compress", {"hipsparseZnnz_compress", "rocsparse_znnz_compress", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED}}, + {"cusparseSnnz_compress", {"hipsparseSnnz_compress", "rocsparse_snnz_compress", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseDnnz_compress", {"hipsparseDnnz_compress", "rocsparse_dnnz_compress", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseCnnz_compress", {"hipsparseCnnz_compress", "rocsparse_cnnz_compress", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED | HIP_DEPRECATED}}, + {"cusparseZnnz_compress", {"hipsparseZnnz_compress", "rocsparse_znnz_compress", CONV_LIB_FUNC, API_SPARSE, 14, CUDA_DEPRECATED | HIP_DEPRECATED}}, // 15. 
cuSPARSE Generic API Reference // Generic Sparse API helper functions @@ -749,8 +749,8 @@ const std::map CUDA_SPARSE_FUNCTION_MAP { {"cusparseConstCsrGet", {"hipsparseConstCsrGet", "rocsparse_const_csr_get", CONV_LIB_FUNC, API_SPARSE, 15}}, {"cusparseCsrSetPointers", {"hipsparseCsrSetPointers", "rocsparse_csr_set_pointers", CONV_LIB_FUNC, API_SPARSE, 15}}, {"cusparseCscSetPointers", {"hipsparseCscSetPointers", "rocsparse_csc_set_pointers", CONV_LIB_FUNC, API_SPARSE, 15}}, - {"cusparseCscGet", {"hipsparseCscGet", "", CONV_LIB_FUNC, API_SPARSE, 15, UNSUPPORTED}}, - {"cusparseConstCscGet", {"hipsparseConstCscGet", "rocsparse_const_csc_get", CONV_LIB_FUNC, API_SPARSE, 15, HIP_UNSUPPORTED}}, + {"cusparseCscGet", {"hipsparseCscGet", "rocsparse_csc_get", CONV_LIB_FUNC, API_SPARSE, 15, HIP_EXPERIMENTAL}}, + {"cusparseConstCscGet", {"hipsparseConstCscGet", "rocsparse_const_csc_get", CONV_LIB_FUNC, API_SPARSE, 15, HIP_EXPERIMENTAL}}, {"cusparseCooSetPointers", {"hipsparseCooSetPointers", "rocsparse_coo_set_pointers", CONV_LIB_FUNC, API_SPARSE, 15}}, {"cusparseCsrSetStridedBatch", {"hipsparseCsrSetStridedBatch", "rocsparse_csr_set_strided_batch", CONV_LIB_FUNC, API_SPARSE, 15}}, {"cusparseSpMatGetFormat", {"hipsparseSpMatGetFormat", "rocsparse_spmat_get_format", CONV_LIB_FUNC, API_SPARSE, 15}}, @@ -819,17 +819,15 @@ const std::map CUDA_SPARSE_FUNCTION_MAP { // Sparse Triangular Vector Solve {"cusparseSpSV_createDescr", {"hipsparseSpSV_createDescr", "", CONV_LIB_FUNC, API_SPARSE, 15, ROC_UNSUPPORTED}}, {"cusparseSpSV_destroyDescr", {"hipsparseSpSV_destroyDescr", "", CONV_LIB_FUNC, API_SPARSE, 15, ROC_UNSUPPORTED}}, - {"cusparseSpSV_bufferSize", {"hipsparseSpSV_bufferSize", "", CONV_LIB_FUNC, API_SPARSE, 15, ROC_UNSUPPORTED}}, + {"cusparseSpSV_bufferSize", {"hipsparseSpSV_bufferSize", "rocsparse_spsv", CONV_LIB_FUNC, API_SPARSE, 15}}, {"cusparseSpSV_analysis", {"hipsparseSpSV_analysis", "", CONV_LIB_FUNC, API_SPARSE, 15, ROC_UNSUPPORTED}}, {"cusparseSpSV_solve", 
{"hipsparseSpSV_solve", "", CONV_LIB_FUNC, API_SPARSE, 15, ROC_UNSUPPORTED}}, {"cusparseSpSV_updateMatrix", {"hipsparseSpSV_updateMatrix", "", CONV_LIB_FUNC, API_SPARSE, 15, UNSUPPORTED}}, // Sparse Matrix * Matrix Multiplication - // TODO: hipification cusparseSpMM into rocsparse_spmm needs additional variable declared and allocated - {"cusparseSpMM", {"hipsparseSpMM", "", CONV_LIB_FUNC, API_SPARSE, 15, ROC_UNSUPPORTED}}, + {"cusparseSpMM", {"hipsparseSpMM", "rocsparse_spmm", CONV_LIB_FUNC, API_SPARSE, 15}}, {"cusparseSpMM_bufferSize", {"hipsparseSpMM_bufferSize", "rocsparse_spmm", CONV_LIB_FUNC, API_SPARSE, 15}}, - // TODO: hipification cusparseSpMM_preprocess into rocsparse_spmm needs additional variable declared and allocated - {"cusparseSpMM_preprocess", {"hipsparseSpMM_preprocess", "", CONV_LIB_FUNC, API_SPARSE, 15, ROC_UNSUPPORTED}}, + {"cusparseSpMM_preprocess", {"hipsparseSpMM_preprocess", "rocsparse_spmm", CONV_LIB_FUNC, API_SPARSE, 15}}, {"cusparseSpMMOp", {"hipsparseSpMMOp", "", CONV_LIB_FUNC, API_SPARSE, 15, UNSUPPORTED}}, {"cusparseSpMMOp_createPlan", {"hipsparseSpMMOp_createPlan", "", CONV_LIB_FUNC, API_SPARSE, 15, UNSUPPORTED}}, {"cusparseSpMMOp_destroyPlan", {"hipsparseSpMMOp_destroyPlan", "", CONV_LIB_FUNC, API_SPARSE, 15, UNSUPPORTED}}, @@ -853,18 +851,17 @@ const std::map CUDA_SPARSE_FUNCTION_MAP { {"cusparseConstrainedGeMM_bufferSize", {"hipsparseConstrainedGeMM_bufferSize", "", CONV_LIB_FUNC, API_SPARSE, 15, UNSUPPORTED | CUDA_DEPRECATED | CUDA_REMOVED}}, // Sparse Vector * Vector Operations - // NOTE: rocsparse_spvv has one additional argument: size_t* buffer_size, thus cusparseSpVV is still ROC_UNSUPPORTED - {"cusparseSpVV", {"hipsparseSpVV", "", CONV_LIB_FUNC, API_SPARSE, 15, ROC_UNSUPPORTED}}, - {"cusparseSpVV_bufferSize", {"hipsparseSpVV_bufferSize", "", CONV_LIB_FUNC, API_SPARSE, 15, ROC_UNSUPPORTED}}, + {"cusparseSpVV", {"hipsparseSpVV", "rocsparse_spvv", CONV_LIB_FUNC, API_SPARSE, 15}}, + {"cusparseSpVV_bufferSize", 
{"hipsparseSpVV_bufferSize", "rocsparse_spvv", CONV_LIB_FUNC, API_SPARSE, 15}}, {"cusparseAxpby", {"hipsparseAxpby", "rocsparse_axpby", CONV_LIB_FUNC, API_SPARSE, 15}}, {"cusparseGather", {"hipsparseGather", "rocsparse_gather", CONV_LIB_FUNC, API_SPARSE, 15}}, {"cusparseScatter", {"hipsparseScatter", "rocsparse_scatter", CONV_LIB_FUNC, API_SPARSE, 15}}, - {"cusparseRot", {"hipsparseRot", "rocsparse_rot", CONV_LIB_FUNC, API_SPARSE, 15, CUDA_DEPRECATED}}, + {"cusparseRot", {"hipsparseRot", "rocsparse_rot", CONV_LIB_FUNC, API_SPARSE, 15, CUDA_DEPRECATED | HIP_DEPRECATED}}, // Sparse Matrix * Vector Multiplication {"cusparseSpMV", {"hipsparseSpMV", "rocsparse_spmv", CONV_LIB_FUNC, API_SPARSE, 15}}, - {"cusparseSpMV_bufferSize", {"hipsparseSpMV_bufferSize", "", CONV_LIB_FUNC, API_SPARSE, 15, ROC_UNSUPPORTED}}, + {"cusparseSpMV_bufferSize", {"hipsparseSpMV_bufferSize", "rocsparse_spmv", CONV_LIB_FUNC, API_SPARSE, 15}}, {"cusparseSparseToDense", {"hipsparseSparseToDense", "rocsparse_sparse_to_dense", CONV_LIB_FUNC, API_SPARSE, 15}}, {"cusparseSparseToDense_bufferSize", {"hipsparseSparseToDense_bufferSize", "rocsparse_sparse_to_dense", CONV_LIB_FUNC, API_SPARSE, 15}}, @@ -1164,12 +1161,12 @@ const std::map CUDA_SPARSE_FUNCTION_VER_MAP { {"cusparseDnVecGet", {CUDA_102, CUDA_0, CUDA_0 }}, {"cusparseDnVecGetValues", {CUDA_102, CUDA_0, CUDA_0 }}, {"cusparseDnVecSetValues", {CUDA_102, CUDA_0, CUDA_0 }}, - {"cusparseSpMM", {CUDA_101, CUDA_0, CUDA_0 }}, - {"cusparseSpMM_bufferSize", {CUDA_101, CUDA_0, CUDA_0 }}, - {"cusparseSpVV", {CUDA_102, CUDA_0, CUDA_0 }}, - {"cusparseSpVV_bufferSize", {CUDA_102, CUDA_0, CUDA_0 }}, - {"cusparseSpMV", {CUDA_102, CUDA_0, CUDA_0 }}, - {"cusparseSpMV_bufferSize", {CUDA_102, CUDA_0, CUDA_0 }}, + {"cusparseSpMM", {CUDA_101, CUDA_0, CUDA_0 }}, // A: CUDA_VERSION 10010 C: CUSPARSE_VERSION 12000 + {"cusparseSpMM_bufferSize", {CUDA_101, CUDA_0, CUDA_0 }}, // A: CUDA_VERSION 10010 C: CUSPARSE_VERSION 12000 + {"cusparseSpVV", {CUDA_101, CUDA_0, CUDA_0 
}}, // A: CUSPARSE_VERSION 10200 C: CUSPARSE_VERSION 12000 + {"cusparseSpVV_bufferSize", {CUDA_101, CUDA_0, CUDA_0 }}, // A: CUSPARSE_VERSION 10200 C: CUSPARSE_VERSION 12000 + {"cusparseSpMV", {CUDA_101, CUDA_0, CUDA_0 }}, // A: CUSPARSE_VERSION 10200 C: CUSPARSE_VERSION 12000 + {"cusparseSpMV_bufferSize", {CUDA_101, CUDA_0, CUDA_0 }}, // A: CUSPARSE_VERSION 10200 C: CUSPARSE_VERSION 12000 {"cusparseSaxpyi", {CUDA_0, CUDA_110, CUDA_120}}, {"cusparseDaxpyi", {CUDA_0, CUDA_110, CUDA_120}}, {"cusparseCaxpyi", {CUDA_0, CUDA_110, CUDA_120}}, @@ -1485,20 +1482,20 @@ const std::map HIP_SPARSE_FUNCTION_VER_MAP { {"hipsparseDestroyCsrsv2Info", {HIP_1092, HIP_0, HIP_0 }}, {"hipsparseCreateCsrsm2Info", {HIP_3010, HIP_0, HIP_0 }}, {"hipsparseDestroyCsrsm2Info", {HIP_3010, HIP_0, HIP_0 }}, - {"hipsparseCreateCsric02Info", {HIP_3010, HIP_0, HIP_0 }}, - {"hipsparseDestroyCsric02Info", {HIP_3010, HIP_0, HIP_0 }}, - {"hipsparseCreateCsrilu02Info", {HIP_1092, HIP_0, HIP_0 }}, - {"hipsparseDestroyCsrilu02Info", {HIP_1092, HIP_0, HIP_0 }}, - {"hipsparseCreateBsrsv2Info", {HIP_3060, HIP_0, HIP_0 }}, - {"hipsparseDestroyBsrsv2Info", {HIP_3060, HIP_0, HIP_0 }}, - {"hipsparseCreateBsric02Info", {HIP_3080, HIP_0, HIP_0 }}, - {"hipsparseDestroyBsric02Info", {HIP_3080, HIP_0, HIP_0 }}, - {"hipsparseCreateBsrilu02Info", {HIP_3090, HIP_0, HIP_0 }}, - {"hipsparseDestroyBsrilu02Info", {HIP_3090, HIP_0, HIP_0 }}, + {"hipsparseCreateCsric02Info", {HIP_3010, HIP_6010, HIP_0 }}, + {"hipsparseDestroyCsric02Info", {HIP_3010, HIP_6010, HIP_0 }}, + {"hipsparseCreateCsrilu02Info", {HIP_1092, HIP_6010, HIP_0 }}, + {"hipsparseDestroyCsrilu02Info", {HIP_1092, HIP_6010, HIP_0 }}, + {"hipsparseCreateBsrsv2Info", {HIP_3060, HIP_6010, HIP_0 }}, + {"hipsparseDestroyBsrsv2Info", {HIP_3060, HIP_6010, HIP_0 }}, + {"hipsparseCreateBsric02Info", {HIP_3080, HIP_6010, HIP_0 }}, + {"hipsparseDestroyBsric02Info", {HIP_3080, HIP_6010, HIP_0 }}, + {"hipsparseCreateBsrilu02Info", {HIP_3090, HIP_6010, HIP_0 }}, + 
{"hipsparseDestroyBsrilu02Info", {HIP_3090, HIP_6010, HIP_0 }}, {"hipsparseCreateCsrgemm2Info", {HIP_2080, HIP_0, HIP_0 }}, {"hipsparseDestroyCsrgemm2Info", {HIP_2080, HIP_0, HIP_0 }}, - {"hipsparseCreatePruneInfo", {HIP_3090, HIP_0, HIP_0 }}, - {"hipsparseDestroyPruneInfo", {HIP_3090, HIP_0, HIP_0 }}, + {"hipsparseCreatePruneInfo", {HIP_3090, HIP_6010, HIP_0 }}, + {"hipsparseDestroyPruneInfo", {HIP_3090, HIP_6010, HIP_0 }}, {"hipsparseSaxpyi", {HIP_1092, HIP_0, HIP_0 }}, {"hipsparseDaxpyi", {HIP_1092, HIP_0, HIP_0 }}, {"hipsparseCaxpyi", {HIP_3010, HIP_0, HIP_0 }}, @@ -1531,23 +1528,23 @@ const std::map HIP_SPARSE_FUNCTION_VER_MAP { {"hipsparseDcsrmv", {HIP_1092, HIP_0, HIP_0 }}, {"hipsparseCcsrmv", {HIP_3010, HIP_0, HIP_0 }}, {"hipsparseZcsrmv", {HIP_3010, HIP_0, HIP_0 }}, - {"hipsparseSbsrsv2_bufferSize", {HIP_3060, HIP_0, HIP_0 }}, + {"hipsparseSbsrsv2_bufferSize", {HIP_3060, HIP_6010, HIP_0 }}, {"hipsparseSbsrsv2_bufferSizeExt", {HIP_3060, HIP_0, HIP_0 }}, - {"hipsparseDbsrsv2_bufferSize", {HIP_3060, HIP_0, HIP_0 }}, + {"hipsparseDbsrsv2_bufferSize", {HIP_3060, HIP_6010, HIP_0 }}, {"hipsparseDbsrsv2_bufferSizeExt", {HIP_3060, HIP_0, HIP_0 }}, - {"hipsparseCbsrsv2_bufferSize", {HIP_3060, HIP_0, HIP_0 }}, + {"hipsparseCbsrsv2_bufferSize", {HIP_3060, HIP_6010, HIP_0 }}, {"hipsparseCbsrsv2_bufferSizeExt", {HIP_3060, HIP_0, HIP_0 }}, - {"hipsparseZbsrsv2_bufferSize", {HIP_3060, HIP_0, HIP_0 }}, + {"hipsparseZbsrsv2_bufferSize", {HIP_3060, HIP_6010, HIP_0 }}, {"hipsparseZbsrsv2_bufferSizeExt", {HIP_3060, HIP_0, HIP_0 }}, - {"hipsparseSbsrsv2_analysis", {HIP_3060, HIP_0, HIP_0 }}, - {"hipsparseDbsrsv2_analysis", {HIP_3060, HIP_0, HIP_0 }}, - {"hipsparseCbsrsv2_analysis", {HIP_3060, HIP_0, HIP_0 }}, - {"hipsparseZbsrsv2_analysis", {HIP_3060, HIP_0, HIP_0 }}, - {"hipsparseSbsrsv2_solve", {HIP_3060, HIP_0, HIP_0 }}, - {"hipsparseDbsrsv2_solve", {HIP_3060, HIP_0, HIP_0 }}, - {"hipsparseCbsrsv2_solve", {HIP_3060, HIP_0, HIP_0 }}, - {"hipsparseZbsrsv2_solve", {HIP_3060, 
HIP_0, HIP_0 }}, - {"hipsparseXbsrsv2_zeroPivot", {HIP_3060, HIP_0, HIP_0 }}, + {"hipsparseSbsrsv2_analysis", {HIP_3060, HIP_6010, HIP_0 }}, + {"hipsparseDbsrsv2_analysis", {HIP_3060, HIP_6010, HIP_0 }}, + {"hipsparseCbsrsv2_analysis", {HIP_3060, HIP_6010, HIP_0 }}, + {"hipsparseZbsrsv2_analysis", {HIP_3060, HIP_6010, HIP_0 }}, + {"hipsparseSbsrsv2_solve", {HIP_3060, HIP_6010, HIP_0 }}, + {"hipsparseDbsrsv2_solve", {HIP_3060, HIP_6010, HIP_0 }}, + {"hipsparseCbsrsv2_solve", {HIP_3060, HIP_6010, HIP_0 }}, + {"hipsparseZbsrsv2_solve", {HIP_3060, HIP_6010, HIP_0 }}, + {"hipsparseXbsrsv2_zeroPivot", {HIP_3060, HIP_6010, HIP_0 }}, {"hipsparseScsrsv2_bufferSize", {HIP_1092, HIP_0, HIP_0 }}, {"hipsparseScsrsv2_bufferSizeExt", {HIP_1092, HIP_0, HIP_0 }}, {"hipsparseDcsrsv2_bufferSize", {HIP_1092, HIP_0, HIP_0 }}, @@ -1626,74 +1623,74 @@ const std::map HIP_SPARSE_FUNCTION_VER_MAP { {"hipsparseDcsrgemm2_bufferSizeExt", {HIP_2080, HIP_0, HIP_0 }}, {"hipsparseCcsrgemm2_bufferSizeExt", {HIP_3010, HIP_0, HIP_0 }}, {"hipsparseZcsrgemm2_bufferSizeExt", {HIP_3010, HIP_0, HIP_0 }}, - {"hipsparseScsric02_bufferSize", {HIP_3010, HIP_0, HIP_0 }}, + {"hipsparseScsric02_bufferSize", {HIP_3010, HIP_6010, HIP_0 }}, {"hipsparseScsric02_bufferSizeExt", {HIP_3010, HIP_0, HIP_0 }}, - {"hipsparseDcsric02_bufferSize", {HIP_3010, HIP_0, HIP_0 }}, + {"hipsparseDcsric02_bufferSize", {HIP_3010, HIP_6010, HIP_0 }}, {"hipsparseDcsric02_bufferSizeExt", {HIP_3010, HIP_0, HIP_0 }}, - {"hipsparseCcsric02_bufferSize", {HIP_3010, HIP_0, HIP_0 }}, + {"hipsparseCcsric02_bufferSize", {HIP_3010, HIP_6010, HIP_0 }}, {"hipsparseCcsric02_bufferSizeExt", {HIP_3010, HIP_0, HIP_0 }}, - {"hipsparseZcsric02_bufferSize", {HIP_3010, HIP_0, HIP_0 }}, + {"hipsparseZcsric02_bufferSize", {HIP_3010, HIP_6010, HIP_0 }}, {"hipsparseZcsric02_bufferSizeExt", {HIP_3010, HIP_0, HIP_0 }}, - {"hipsparseScsric02_analysis", {HIP_3010, HIP_0, HIP_0 }}, - {"hipsparseDcsric02_analysis", {HIP_3010, HIP_0, HIP_0 }}, - 
{"hipsparseCcsric02_analysis", {HIP_3010, HIP_0, HIP_0 }}, - {"hipsparseZcsric02_analysis", {HIP_3010, HIP_0, HIP_0 }}, - {"hipsparseScsric02", {HIP_3010, HIP_0, HIP_0 }}, - {"hipsparseDcsric02", {HIP_3010, HIP_0, HIP_0 }}, - {"hipsparseCcsric02", {HIP_3010, HIP_0, HIP_0 }}, - {"hipsparseZcsric02", {HIP_3010, HIP_0, HIP_0 }}, - {"hipsparseXcsric02_zeroPivot", {HIP_3010, HIP_0, HIP_0 }}, - {"hipsparseSbsric02_bufferSize", {HIP_3080, HIP_0, HIP_0 }}, - {"hipsparseDbsric02_bufferSize", {HIP_3080, HIP_0, HIP_0 }}, - {"hipsparseCbsric02_bufferSize", {HIP_3080, HIP_0, HIP_0 }}, - {"hipsparseZbsric02_bufferSize", {HIP_3080, HIP_0, HIP_0 }}, - {"hipsparseSbsric02_analysis", {HIP_3080, HIP_0, HIP_0 }}, - {"hipsparseDbsric02_analysis", {HIP_3080, HIP_0, HIP_0 }}, - {"hipsparseCbsric02_analysis", {HIP_3080, HIP_0, HIP_0 }}, - {"hipsparseZbsric02_analysis", {HIP_3080, HIP_0, HIP_0 }}, - {"hipsparseSbsric02", {HIP_3080, HIP_0, HIP_0 }}, - {"hipsparseDbsric02", {HIP_3080, HIP_0, HIP_0 }}, - {"hipsparseCbsric02", {HIP_3080, HIP_0, HIP_0 }}, - {"hipsparseZbsric02", {HIP_3080, HIP_0, HIP_0 }}, - {"hipsparseXbsric02_zeroPivot", {HIP_3080, HIP_0, HIP_0 }}, - {"hipsparseScsrilu02_numericBoost", {HIP_3100, HIP_0, HIP_0 }}, - {"hipsparseDcsrilu02_numericBoost", {HIP_3100, HIP_0, HIP_0 }}, - {"hipsparseCcsrilu02_numericBoost", {HIP_3100, HIP_0, HIP_0 }}, - {"hipsparseZcsrilu02_numericBoost", {HIP_3100, HIP_0, HIP_0 }}, - {"hipsparseXcsrilu02_zeroPivot", {HIP_1092, HIP_0, HIP_0 }}, - {"hipsparseScsrilu02_bufferSize", {HIP_1092, HIP_0, HIP_0 }}, + {"hipsparseScsric02_analysis", {HIP_3010, HIP_6010, HIP_0 }}, + {"hipsparseDcsric02_analysis", {HIP_3010, HIP_6010, HIP_0 }}, + {"hipsparseCcsric02_analysis", {HIP_3010, HIP_6010, HIP_0 }}, + {"hipsparseZcsric02_analysis", {HIP_3010, HIP_6010, HIP_0 }}, + {"hipsparseScsric02", {HIP_3010, HIP_6010, HIP_0 }}, + {"hipsparseDcsric02", {HIP_3010, HIP_6010, HIP_0 }}, + {"hipsparseCcsric02", {HIP_3010, HIP_6010, HIP_0 }}, + {"hipsparseZcsric02", 
{HIP_3010, HIP_6010, HIP_0 }}, + {"hipsparseXcsric02_zeroPivot", {HIP_3010, HIP_6010, HIP_0 }}, + {"hipsparseSbsric02_bufferSize", {HIP_3080, HIP_6010, HIP_0 }}, + {"hipsparseDbsric02_bufferSize", {HIP_3080, HIP_6010, HIP_0 }}, + {"hipsparseCbsric02_bufferSize", {HIP_3080, HIP_6010, HIP_0 }}, + {"hipsparseZbsric02_bufferSize", {HIP_3080, HIP_6010, HIP_0 }}, + {"hipsparseSbsric02_analysis", {HIP_3080, HIP_6010, HIP_0 }}, + {"hipsparseDbsric02_analysis", {HIP_3080, HIP_6010, HIP_0 }}, + {"hipsparseCbsric02_analysis", {HIP_3080, HIP_6010, HIP_0 }}, + {"hipsparseZbsric02_analysis", {HIP_3080, HIP_6010, HIP_0 }}, + {"hipsparseSbsric02", {HIP_3080, HIP_6010, HIP_0 }}, + {"hipsparseDbsric02", {HIP_3080, HIP_6010, HIP_0 }}, + {"hipsparseCbsric02", {HIP_3080, HIP_6010, HIP_0 }}, + {"hipsparseZbsric02", {HIP_3080, HIP_6010, HIP_0 }}, + {"hipsparseXbsric02_zeroPivot", {HIP_3080, HIP_6010, HIP_0 }}, + {"hipsparseScsrilu02_numericBoost", {HIP_3100, HIP_6010, HIP_0 }}, + {"hipsparseDcsrilu02_numericBoost", {HIP_3100, HIP_6010, HIP_0 }}, + {"hipsparseCcsrilu02_numericBoost", {HIP_3100, HIP_6010, HIP_0 }}, + {"hipsparseZcsrilu02_numericBoost", {HIP_3100, HIP_6010, HIP_0 }}, + {"hipsparseXcsrilu02_zeroPivot", {HIP_1092, HIP_6010, HIP_0 }}, + {"hipsparseScsrilu02_bufferSize", {HIP_1092, HIP_6010, HIP_0 }}, {"hipsparseScsrilu02_bufferSizeExt", {HIP_1092, HIP_0, HIP_0 }}, - {"hipsparseDcsrilu02_bufferSize", {HIP_1092, HIP_0, HIP_0 }}, + {"hipsparseDcsrilu02_bufferSize", {HIP_1092, HIP_6010, HIP_0 }}, {"hipsparseDcsrilu02_bufferSizeExt", {HIP_1092, HIP_0, HIP_0 }}, - {"hipsparseCcsrilu02_bufferSize", {HIP_3010, HIP_0, HIP_0 }}, + {"hipsparseCcsrilu02_bufferSize", {HIP_3010, HIP_6010, HIP_0 }}, {"hipsparseCcsrilu02_bufferSizeExt", {HIP_3010, HIP_0, HIP_0 }}, - {"hipsparseZcsrilu02_bufferSize", {HIP_3010, HIP_0, HIP_0 }}, + {"hipsparseZcsrilu02_bufferSize", {HIP_3010, HIP_6010, HIP_0 }}, {"hipsparseZcsrilu02_bufferSizeExt", {HIP_3010, HIP_0, HIP_0 }}, - {"hipsparseScsrilu02_analysis", 
{HIP_1092, HIP_0, HIP_0 }}, - {"hipsparseDcsrilu02_analysis", {HIP_1092, HIP_0, HIP_0 }}, - {"hipsparseCcsrilu02_analysis", {HIP_3010, HIP_0, HIP_0 }}, - {"hipsparseZcsrilu02_analysis", {HIP_3010, HIP_0, HIP_0 }}, - {"hipsparseScsrilu02", {HIP_1092, HIP_0, HIP_0 }}, - {"hipsparseDcsrilu02", {HIP_1092, HIP_0, HIP_0 }}, - {"hipsparseCcsrilu02", {HIP_3010, HIP_0, HIP_0 }}, - {"hipsparseZcsrilu02", {HIP_3010, HIP_0, HIP_0 }}, - {"hipsparseSbsrilu02_numericBoost", {HIP_3090, HIP_0, HIP_0 }}, - {"hipsparseDbsrilu02_numericBoost", {HIP_3090, HIP_0, HIP_0 }}, - {"hipsparseCbsrilu02_numericBoost", {HIP_3090, HIP_0, HIP_0 }}, - {"hipsparseZbsrilu02_numericBoost", {HIP_3090, HIP_0, HIP_0 }}, - {"hipsparseSbsrilu02_bufferSize", {HIP_3090, HIP_0, HIP_0 }}, - {"hipsparseDbsrilu02_bufferSize", {HIP_3090, HIP_0, HIP_0 }}, - {"hipsparseCbsrilu02_bufferSize", {HIP_3090, HIP_0, HIP_0 }}, - {"hipsparseZbsrilu02_bufferSize", {HIP_3090, HIP_0, HIP_0 }}, - {"hipsparseSbsrilu02_analysis", {HIP_3090, HIP_0, HIP_0 }}, - {"hipsparseDbsrilu02_analysis", {HIP_3090, HIP_0, HIP_0 }}, - {"hipsparseCbsrilu02_analysis", {HIP_3090, HIP_0, HIP_0 }}, - {"hipsparseZbsrilu02_analysis", {HIP_3090, HIP_0, HIP_0 }}, - {"hipsparseSbsrilu02", {HIP_3090, HIP_0, HIP_0 }}, - {"hipsparseDbsrilu02", {HIP_3090, HIP_0, HIP_0 }}, - {"hipsparseCbsrilu02", {HIP_3090, HIP_0, HIP_0 }}, - {"hipsparseZbsrilu02", {HIP_3090, HIP_0, HIP_0 }}, - {"hipsparseXbsrilu02_zeroPivot", {HIP_3090, HIP_0, HIP_0 }}, + {"hipsparseScsrilu02_analysis", {HIP_1092, HIP_6010, HIP_0 }}, + {"hipsparseDcsrilu02_analysis", {HIP_1092, HIP_6010, HIP_0 }}, + {"hipsparseCcsrilu02_analysis", {HIP_3010, HIP_6010, HIP_0 }}, + {"hipsparseZcsrilu02_analysis", {HIP_3010, HIP_6010, HIP_0 }}, + {"hipsparseScsrilu02", {HIP_1092, HIP_6010, HIP_0 }}, + {"hipsparseDcsrilu02", {HIP_1092, HIP_6010, HIP_0 }}, + {"hipsparseCcsrilu02", {HIP_3010, HIP_6010, HIP_0 }}, + {"hipsparseZcsrilu02", {HIP_3010, HIP_6010, HIP_0 }}, + {"hipsparseSbsrilu02_numericBoost", 
{HIP_3090, HIP_6010, HIP_0 }}, + {"hipsparseDbsrilu02_numericBoost", {HIP_3090, HIP_6010, HIP_0 }}, + {"hipsparseCbsrilu02_numericBoost", {HIP_3090, HIP_6010, HIP_0 }}, + {"hipsparseZbsrilu02_numericBoost", {HIP_3090, HIP_6010, HIP_0 }}, + {"hipsparseSbsrilu02_bufferSize", {HIP_3090, HIP_6010, HIP_0 }}, + {"hipsparseDbsrilu02_bufferSize", {HIP_3090, HIP_6010, HIP_0 }}, + {"hipsparseCbsrilu02_bufferSize", {HIP_3090, HIP_6010, HIP_0 }}, + {"hipsparseZbsrilu02_bufferSize", {HIP_3090, HIP_6010, HIP_0 }}, + {"hipsparseSbsrilu02_analysis", {HIP_3090, HIP_6010, HIP_0 }}, + {"hipsparseDbsrilu02_analysis", {HIP_3090, HIP_6010, HIP_0 }}, + {"hipsparseCbsrilu02_analysis", {HIP_3090, HIP_6010, HIP_0 }}, + {"hipsparseZbsrilu02_analysis", {HIP_3090, HIP_6010, HIP_0 }}, + {"hipsparseSbsrilu02", {HIP_3090, HIP_6010, HIP_0 }}, + {"hipsparseDbsrilu02", {HIP_3090, HIP_6010, HIP_0 }}, + {"hipsparseCbsrilu02", {HIP_3090, HIP_6010, HIP_0 }}, + {"hipsparseZbsrilu02", {HIP_3090, HIP_6010, HIP_0 }}, + {"hipsparseXbsrilu02_zeroPivot", {HIP_3090, HIP_6010, HIP_0 }}, {"hipsparseSbsr2csr", {HIP_3050, HIP_0, HIP_0 }}, {"hipsparseDbsr2csr", {HIP_3050, HIP_0, HIP_0 }}, {"hipsparseCbsr2csr", {HIP_3050, HIP_0, HIP_0 }}, @@ -1741,7 +1738,7 @@ const std::map HIP_SPARSE_FUNCTION_VER_MAP { {"hipsparseDnnz", {HIP_3020, HIP_0, HIP_0 }}, {"hipsparseCnnz", {HIP_3020, HIP_0, HIP_0 }}, {"hipsparseZnnz", {HIP_3020, HIP_0, HIP_0 }}, - {"hipsparseCreateIdentityPermutation", {HIP_1092, HIP_0, HIP_0 }}, + {"hipsparseCreateIdentityPermutation", {HIP_1092, HIP_6010, HIP_0 }}, {"hipsparseXcoosort_bufferSizeExt", {HIP_1092, HIP_0, HIP_0 }}, {"hipsparseXcoosortByRow", {HIP_1092, HIP_0, HIP_0 }}, {"hipsparseXcoosortByColumn", {HIP_1092, HIP_0, HIP_0 }}, @@ -1749,34 +1746,34 @@ const std::map HIP_SPARSE_FUNCTION_VER_MAP { {"hipsparseXcsrsort", {HIP_1092, HIP_0, HIP_0 }}, {"hipsparseXcscsort_bufferSizeExt", {HIP_2100, HIP_0, HIP_0 }}, {"hipsparseXcscsort", {HIP_2100, HIP_0, HIP_0 }}, - {"hipsparseSpruneDense2csr", 
{HIP_3090, HIP_0, HIP_0 }}, - {"hipsparseDpruneDense2csr", {HIP_3090, HIP_0, HIP_0 }}, + {"hipsparseSpruneDense2csr", {HIP_3090, HIP_6010, HIP_0 }}, + {"hipsparseDpruneDense2csr", {HIP_3090, HIP_6010, HIP_0 }}, {"hipsparseSpruneDense2csr_bufferSizeExt", {HIP_3090, HIP_0, HIP_0 }}, {"hipsparseDpruneDense2csr_bufferSizeExt", {HIP_3090, HIP_0, HIP_0 }}, - {"hipsparseSpruneDense2csrNnz", {HIP_3090, HIP_0, HIP_0 }}, - {"hipsparseDpruneDense2csrNnz", {HIP_3090, HIP_0, HIP_0 }}, - {"hipsparseSpruneCsr2csr", {HIP_3090, HIP_0, HIP_0 }}, - {"hipsparseDpruneCsr2csr", {HIP_3090, HIP_0, HIP_0 }}, - {"hipsparseSpruneCsr2csr_bufferSizeExt", {HIP_3090, HIP_0, HIP_0 }}, - {"hipsparseDpruneCsr2csr_bufferSizeExt", {HIP_3090, HIP_0, HIP_0 }}, - {"hipsparseSpruneCsr2csrNnz", {HIP_3090, HIP_0, HIP_0 }}, - {"hipsparseDpruneCsr2csrNnz", {HIP_3090, HIP_0, HIP_0 }}, - {"hipsparseSpruneDense2csrByPercentage", {HIP_3090, HIP_0, HIP_0 }}, - {"hipsparseDpruneDense2csrByPercentage", {HIP_3090, HIP_0, HIP_0 }}, - {"hipsparseSpruneDense2csrByPercentage_bufferSizeExt", {HIP_3090, HIP_0, HIP_0 }}, - {"hipsparseDpruneDense2csrByPercentage_bufferSizeExt", {HIP_3090, HIP_0, HIP_0 }}, - {"hipsparseSpruneDense2csrNnzByPercentage", {HIP_3090, HIP_0, HIP_0 }}, - {"hipsparseDpruneDense2csrNnzByPercentage", {HIP_3090, HIP_0, HIP_0 }}, - {"hipsparseSpruneCsr2csrByPercentage", {HIP_3090, HIP_0, HIP_0 }}, - {"hipsparseDpruneCsr2csrByPercentage", {HIP_3090, HIP_0, HIP_0 }}, - {"hipsparseSpruneCsr2csrByPercentage_bufferSizeExt", {HIP_3090, HIP_0, HIP_0 }}, - {"hipsparseDpruneCsr2csrByPercentage_bufferSizeExt", {HIP_3090, HIP_0, HIP_0 }}, - {"hipsparseSpruneCsr2csrNnzByPercentage", {HIP_3090, HIP_0, HIP_0 }}, - {"hipsparseDpruneCsr2csrNnzByPercentage", {HIP_3090, HIP_0, HIP_0 }}, - {"hipsparseSnnz_compress", {HIP_3050, HIP_0, HIP_0 }}, - {"hipsparseDnnz_compress", {HIP_3050, HIP_0, HIP_0 }}, - {"hipsparseCnnz_compress", {HIP_3050, HIP_0, HIP_0 }}, - {"hipsparseZnnz_compress", {HIP_3050, HIP_0, HIP_0 }}, + 
{"hipsparseSpruneDense2csrNnz", {HIP_3090, HIP_6010, HIP_0 }}, + {"hipsparseDpruneDense2csrNnz", {HIP_3090, HIP_6010, HIP_0 }}, + {"hipsparseSpruneCsr2csr", {HIP_3090, HIP_6010, HIP_0 }}, + {"hipsparseDpruneCsr2csr", {HIP_3090, HIP_6010, HIP_0 }}, + {"hipsparseSpruneCsr2csr_bufferSizeExt", {HIP_3090, HIP_6010, HIP_0 }}, + {"hipsparseDpruneCsr2csr_bufferSizeExt", {HIP_3090, HIP_6010, HIP_0 }}, + {"hipsparseSpruneCsr2csrNnz", {HIP_3090, HIP_6010, HIP_0 }}, + {"hipsparseDpruneCsr2csrNnz", {HIP_3090, HIP_6010, HIP_0 }}, + {"hipsparseSpruneDense2csrByPercentage", {HIP_3090, HIP_6010, HIP_0 }}, + {"hipsparseDpruneDense2csrByPercentage", {HIP_3090, HIP_6010, HIP_0 }}, + {"hipsparseSpruneDense2csrByPercentage_bufferSizeExt", {HIP_3090, HIP_6010, HIP_0 }}, + {"hipsparseDpruneDense2csrByPercentage_bufferSizeExt", {HIP_3090, HIP_6010, HIP_0 }}, + {"hipsparseSpruneDense2csrNnzByPercentage", {HIP_3090, HIP_6010, HIP_0 }}, + {"hipsparseDpruneDense2csrNnzByPercentage", {HIP_3090, HIP_6010, HIP_0 }}, + {"hipsparseSpruneCsr2csrByPercentage", {HIP_3090, HIP_6010, HIP_0 }}, + {"hipsparseDpruneCsr2csrByPercentage", {HIP_3090, HIP_6010, HIP_0 }}, + {"hipsparseSpruneCsr2csrByPercentage_bufferSizeExt", {HIP_3090, HIP_6010, HIP_0 }}, + {"hipsparseDpruneCsr2csrByPercentage_bufferSizeExt", {HIP_3090, HIP_6010, HIP_0 }}, + {"hipsparseSpruneCsr2csrNnzByPercentage", {HIP_3090, HIP_6010, HIP_0 }}, + {"hipsparseDpruneCsr2csrNnzByPercentage", {HIP_3090, HIP_6010, HIP_0 }}, + {"hipsparseSnnz_compress", {HIP_3050, HIP_6010, HIP_0 }}, + {"hipsparseDnnz_compress", {HIP_3050, HIP_6010, HIP_0 }}, + {"hipsparseCnnz_compress", {HIP_3050, HIP_6010, HIP_0 }}, + {"hipsparseZnnz_compress", {HIP_3050, HIP_6010, HIP_0 }}, {"hipsparseSgebsr2gebsc_bufferSize", {HIP_4010, HIP_0, HIP_0 }}, {"hipsparseDgebsr2gebsc_bufferSize", {HIP_4010, HIP_0, HIP_0 }}, {"hipsparseCgebsr2gebsc_bufferSize", {HIP_4010, HIP_0, HIP_0 }}, @@ -1841,23 +1838,23 @@ const std::map HIP_SPARSE_FUNCTION_VER_MAP { {"hipsparseAxpby", {HIP_4010, 
HIP_0, HIP_0 }}, {"hipsparseGather", {HIP_4010, HIP_0, HIP_0 }}, {"hipsparseScatter", {HIP_4010, HIP_0, HIP_0 }}, - {"hipsparseRot", {HIP_4010, HIP_0, HIP_0 }}, + {"hipsparseRot", {HIP_4010, HIP_6010, HIP_0 }}, {"hipsparseSpMV", {HIP_4010, HIP_0, HIP_0 }}, {"hipsparseSpMV_bufferSize", {HIP_4010, HIP_0, HIP_0 }}, {"hipsparseCreateCsru2csrInfo", {HIP_4020, HIP_0, HIP_0 }}, {"hipsparseDestroyCsru2csrInfo", {HIP_4020, HIP_0, HIP_0 }}, - {"hipsparseScsru2csr_bufferSizeExt", {HIP_4020, HIP_0, HIP_0 }}, - {"hipsparseDcsru2csr_bufferSizeExt", {HIP_4020, HIP_0, HIP_0 }}, - {"hipsparseCcsru2csr_bufferSizeExt", {HIP_4020, HIP_0, HIP_0 }}, - {"hipsparseZcsru2csr_bufferSizeExt", {HIP_4020, HIP_0, HIP_0 }}, - {"hipsparseScsru2csr", {HIP_4020, HIP_0, HIP_0 }}, - {"hipsparseDcsru2csr", {HIP_4020, HIP_0, HIP_0 }}, - {"hipsparseCcsru2csr", {HIP_4020, HIP_0, HIP_0 }}, - {"hipsparseZcsru2csr", {HIP_4020, HIP_0, HIP_0 }}, - {"hipsparseScsr2csru", {HIP_4020, HIP_0, HIP_0 }}, - {"hipsparseDcsr2csru", {HIP_4020, HIP_0, HIP_0 }}, - {"hipsparseCcsr2csru", {HIP_4020, HIP_0, HIP_0 }}, - {"hipsparseZcsr2csru", {HIP_4020, HIP_0, HIP_0 }}, + {"hipsparseScsru2csr_bufferSizeExt", {HIP_4020, HIP_6010, HIP_0 }}, + {"hipsparseDcsru2csr_bufferSizeExt", {HIP_4020, HIP_6010, HIP_0 }}, + {"hipsparseCcsru2csr_bufferSizeExt", {HIP_4020, HIP_6010, HIP_0 }}, + {"hipsparseZcsru2csr_bufferSizeExt", {HIP_4020, HIP_6010, HIP_0 }}, + {"hipsparseScsru2csr", {HIP_4020, HIP_6010, HIP_0 }}, + {"hipsparseDcsru2csr", {HIP_4020, HIP_6010, HIP_0 }}, + {"hipsparseCcsru2csr", {HIP_4020, HIP_6010, HIP_0 }}, + {"hipsparseZcsru2csr", {HIP_4020, HIP_6010, HIP_0 }}, + {"hipsparseScsr2csru", {HIP_4020, HIP_6010, HIP_0 }}, + {"hipsparseDcsr2csru", {HIP_4020, HIP_6010, HIP_0 }}, + {"hipsparseCcsr2csru", {HIP_4020, HIP_6010, HIP_0 }}, + {"hipsparseZcsr2csru", {HIP_4020, HIP_6010, HIP_0 }}, {"hipsparseCreateCsc", {HIP_4020, HIP_0, HIP_0 }}, {"hipsparseCscSetPointers", {HIP_4020, HIP_0, HIP_0 }}, {"hipsparseCooSetPointers", 
{HIP_4020, HIP_0, HIP_0 }}, @@ -1900,31 +1897,31 @@ const std::map HIP_SPARSE_FUNCTION_VER_MAP { {"hipsparseSDDMM", {HIP_4030, HIP_0, HIP_0 }}, {"hipsparseSDDMM_bufferSize", {HIP_4030, HIP_0, HIP_0 }}, {"hipsparseSDDMM_preprocess", {HIP_4030, HIP_0, HIP_0 }}, - {"hipsparseCreateBsrsm2Info", {HIP_4050, HIP_0, HIP_0 }}, - {"hipsparseDestroyBsrsm2Info", {HIP_4050, HIP_0, HIP_0 }}, - {"hipsparseCreateColorInfo", {HIP_4050, HIP_0, HIP_0 }}, - {"hipsparseDestroyColorInfo", {HIP_4050, HIP_0, HIP_0 }}, - {"hipsparseSbsrxmv", {HIP_4050, HIP_0, HIP_0 }}, - {"hipsparseDbsrxmv", {HIP_4050, HIP_0, HIP_0 }}, - {"hipsparseCbsrxmv", {HIP_4050, HIP_0, HIP_0 }}, - {"hipsparseZbsrxmv", {HIP_4050, HIP_0, HIP_0 }}, - {"hipsparseXbsrsm2_zeroPivot", {HIP_4050, HIP_0, HIP_0 }}, - {"hipsparseSbsrsm2_bufferSize", {HIP_4050, HIP_0, HIP_0 }}, - {"hipsparseDbsrsm2_bufferSize", {HIP_4050, HIP_0, HIP_0 }}, - {"hipsparseCbsrsm2_bufferSize", {HIP_4050, HIP_0, HIP_0 }}, - {"hipsparseZbsrsm2_bufferSize", {HIP_4050, HIP_0, HIP_0 }}, - {"hipsparseSbsrsm2_analysis", {HIP_4050, HIP_0, HIP_0 }}, - {"hipsparseDbsrsm2_analysis", {HIP_4050, HIP_0, HIP_0 }}, - {"hipsparseCbsrsm2_analysis", {HIP_4050, HIP_0, HIP_0 }}, - {"hipsparseZbsrsm2_analysis", {HIP_4050, HIP_0, HIP_0 }}, - {"hipsparseSbsrsm2_solve", {HIP_4050, HIP_0, HIP_0 }}, - {"hipsparseDbsrsm2_solve", {HIP_4050, HIP_0, HIP_0 }}, - {"hipsparseCbsrsm2_solve", {HIP_4050, HIP_0, HIP_0 }}, - {"hipsparseZbsrsm2_solve", {HIP_4050, HIP_0, HIP_0 }}, - {"hipsparseScsrcolor", {HIP_4050, HIP_0, HIP_0 }}, - {"hipsparseDcsrcolor", {HIP_4050, HIP_0, HIP_0 }}, - {"hipsparseCcsrcolor", {HIP_4050, HIP_0, HIP_0 }}, - {"hipsparseZcsrcolor", {HIP_4050, HIP_0, HIP_0 }}, + {"hipsparseCreateBsrsm2Info", {HIP_4050, HIP_6010, HIP_0 }}, + {"hipsparseDestroyBsrsm2Info", {HIP_4050, HIP_6010, HIP_0 }}, + {"hipsparseCreateColorInfo", {HIP_4050, HIP_6010, HIP_0 }}, + {"hipsparseDestroyColorInfo", {HIP_4050, HIP_6010, HIP_0 }}, + {"hipsparseSbsrxmv", {HIP_4050, HIP_6010, HIP_0 }}, 
+ {"hipsparseDbsrxmv", {HIP_4050, HIP_6010, HIP_0 }}, + {"hipsparseCbsrxmv", {HIP_4050, HIP_6010, HIP_0 }}, + {"hipsparseZbsrxmv", {HIP_4050, HIP_6010, HIP_0 }}, + {"hipsparseXbsrsm2_zeroPivot", {HIP_4050, HIP_6010, HIP_0 }}, + {"hipsparseSbsrsm2_bufferSize", {HIP_4050, HIP_6010, HIP_0 }}, + {"hipsparseDbsrsm2_bufferSize", {HIP_4050, HIP_6010, HIP_0 }}, + {"hipsparseCbsrsm2_bufferSize", {HIP_4050, HIP_6010, HIP_0 }}, + {"hipsparseZbsrsm2_bufferSize", {HIP_4050, HIP_6010, HIP_0 }}, + {"hipsparseSbsrsm2_analysis", {HIP_4050, HIP_6010, HIP_0 }}, + {"hipsparseDbsrsm2_analysis", {HIP_4050, HIP_6010, HIP_0 }}, + {"hipsparseCbsrsm2_analysis", {HIP_4050, HIP_6010, HIP_0 }}, + {"hipsparseZbsrsm2_analysis", {HIP_4050, HIP_6010, HIP_0 }}, + {"hipsparseSbsrsm2_solve", {HIP_4050, HIP_6010, HIP_0 }}, + {"hipsparseDbsrsm2_solve", {HIP_4050, HIP_6010, HIP_0 }}, + {"hipsparseCbsrsm2_solve", {HIP_4050, HIP_6010, HIP_0 }}, + {"hipsparseZbsrsm2_solve", {HIP_4050, HIP_6010, HIP_0 }}, + {"hipsparseScsrcolor", {HIP_4050, HIP_6010, HIP_0 }}, + {"hipsparseDcsrcolor", {HIP_4050, HIP_6010, HIP_0 }}, + {"hipsparseCcsrcolor", {HIP_4050, HIP_6010, HIP_0 }}, + {"hipsparseZcsrcolor", {HIP_4050, HIP_6010, HIP_0 }}, {"hipsparseCreateBlockedEll", {HIP_4050, HIP_0, HIP_0 }}, {"hipsparseBlockedEllGet", {HIP_4050, HIP_0, HIP_0 }}, {"hipsparseSpMatGetAttribute", {HIP_4050, HIP_0, HIP_0 }}, @@ -1996,6 +1993,8 @@ const std::map HIP_SPARSE_FUNCTION_VER_MAP { {"hipsparseCreateConstDnMat", {HIP_6000, HIP_0, HIP_0, }}, {"hipsparseConstDnMatGet", {HIP_6000, HIP_0, HIP_0, }}, {"hipsparseConstDnMatGetValues", {HIP_6000, HIP_0, HIP_0, }}, + {"hipsparseCscGet", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, + {"hipsparseConstCscGet", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, {"rocsparse_create_handle", {HIP_1090, HIP_0, HIP_0 }}, {"rocsparse_destroy_handle", {HIP_1090, HIP_0, HIP_0 }}, @@ -2431,6 +2430,9 @@ const std::map HIP_SPARSE_FUNCTION_VER_MAP { {"rocsparse_dense_to_sparse", {HIP_4010, HIP_0, HIP_0 }}, 
{"rocsparse_spmm", {HIP_4020, HIP_0, HIP_0 }}, {"rocsparse_spsm", {HIP_4050, HIP_0, HIP_0 }}, + {"rocsparse_spvv", {HIP_4010, HIP_0, HIP_0 }}, + {"rocsparse_spsv", {HIP_4050, HIP_0, HIP_0 }}, + {"rocsparse_csc_get", {HIP_6010, HIP_0, HIP_0, HIP_LATEST}}, }; const std::map CUDA_SPARSE_FUNCTION_CHANGED_VER_MAP { @@ -2537,6 +2539,15 @@ const std::map HIP_SPARSE_FUNCTION_CHANG {"rocsparse_dense_to_sparse", {HIP_6000}}, {"rocsparse_spmm", {HIP_6000}}, {"rocsparse_spsm", {HIP_6000}}, + {"rocsparse_spvv", {HIP_6000}}, + {"rocsparse_spmv", {HIP_6000}}, + {"rocsparse_scatter", {HIP_6000}}, + {"rocsparse_gather", {HIP_6000}}, + {"rocsparse_axpby", {HIP_6000}}, + {"rocsparse_sddmm", {HIP_6000}}, + {"rocsparse_sddmm_buffer_size", {HIP_6000}}, + {"rocsparse_sddmm_preprocess", {HIP_6000}}, + {"rocsparse_spsv", {HIP_6000}}, }; const std::map CUDA_SPARSE_API_SECTION_MAP { diff --git a/src/CUDA2HIP_Scripting.h b/src/CUDA2HIP_Scripting.h index 039d1ef9..a2e4a7ff 100644 --- a/src/CUDA2HIP_Scripting.h +++ b/src/CUDA2HIP_Scripting.h @@ -22,6 +22,10 @@ THE SOFTWARE. 
#pragma once +#include +#include +#include + namespace hipify { enum CastTypes { diff --git a/src/HipifyAction.cpp b/src/HipifyAction.cpp index a24c728d..3080b5e8 100644 --- a/src/HipifyAction.cpp +++ b/src/HipifyAction.cpp @@ -213,6 +213,13 @@ const std::string sCusparseSpSM_analysis = "cusparseSpSM_analysis"; const std::string sCusparseSpSM_solve = "cusparseSpSM_solve"; const std::string sCusparseXcsrgeam2Nnz = "cusparseXcsrgeam2Nnz"; const std::string sCudaMallocHost = "cudaMallocHost"; +const std::string sCusparseSpMM = "cusparseSpMM"; +const std::string sCusparseSpVV = "cusparseSpVV"; +const std::string sCusparseSpVV_bufferSize = "cusparseSpVV_bufferSize"; +const std::string sCusparseSpMV = "cusparseSpMV"; +const std::string sCusparseSpMV_bufferSize = "cusparseSpMV_bufferSize"; +const std::string sCusparseSpMM_preprocess = "cusparseSpMM_preprocess"; +const std::string sCusparseSpSV_bufferSize = "cusparseSpSV_bufferSize"; // CUDA_OVERLOADED const std::string sCudaEventCreate = "cudaEventCreate"; @@ -2048,6 +2055,85 @@ std::map> FuncArgCasts { } } }, + {sCusparseSpMM, + { + { + { + {10, {e_add_const_argument, cw_None, "rocsparse_spmm_stage_compute, nullptr"}}, + }, + true, + false + } + } + }, + {sCusparseSpVV_bufferSize, + { + { + { + {7, {e_add_const_argument, cw_None, "nullptr"}}, + }, + true, + false + } + } + }, + {sCusparseSpVV, + { + { + { + {6, {e_add_const_argument, cw_None, "nullptr"}} + }, + true, + false + } + } + }, + {sCusparseSpMV_bufferSize, + { + { + { + {9, {e_add_const_argument, cw_None, "rocsparse_spmv_stage_buffer_size"}}, + {11, {e_add_const_argument, cw_None, "nullptr"}}, + }, + true, + false + } + } + }, + {sCusparseSpMV, + { + { + { + {9, {e_add_const_argument, cw_None, "rocsparse_spmv_stage_compute"}} + }, + true, + false + } + } + }, + {sCusparseSpMM_preprocess, + { + { + { + {10, {e_add_const_argument, cw_None, "rocsparse_spmm_stage_preprocess, nullptr"}}, + }, + true, + false + } + } + }, + {sCusparseSpSV_bufferSize, + { + { + { + 
{8, {e_replace_argument_with_const, cw_None, "rocsparse_spsv_stage_buffer_size"}}, + {10, {e_add_const_argument, cw_None, "nullptr"}}, + }, + true, + false + } + } + }, }; void HipifyAction::RewriteString(StringRef s, clang::SourceLocation start) { @@ -2906,11 +2992,18 @@ std::unique_ptr HipifyAction::CreateASTConsumer(clang::Compi sCusparseSparseToDense_bufferSize, sCusparseDenseToSparse_bufferSize, sCusparseDenseToSparse_analysis, + sCusparseSpMM, sCusparseSpMM_bufferSize, sCusparseSpSM_analysis, sCusparseSpSM_solve, sCusparseXcsrgeam2Nnz, - sCudaMallocHost + sCudaMallocHost, + sCusparseSpVV, + sCusparseSpVV_bufferSize, + sCusparseSpMV, + sCusparseSpMV_bufferSize, + sCusparseSpMM_preprocess, + sCusparseSpSV_bufferSize ) ) ) diff --git a/tests/unit_tests/synthetic/driver_enums.cu b/tests/unit_tests/synthetic/driver_enums.cu index 7da052bb..65c0212b 100644 --- a/tests/unit_tests/synthetic/driver_enums.cu +++ b/tests/unit_tests/synthetic/driver_enums.cu @@ -1070,6 +1070,26 @@ int main() { cudaGraphDebugDotFlags GRAPH_DEBUG_DOT_FLAGS_EXT_SEMAS_WAIT_NODE_PARAMS = cudaGraphDebugDotFlagsExtSemasWaitNodeParams; cudaGraphDebugDotFlags GRAPH_DEBUG_DOT_FLAGS_KERNEL_NODE_ATTRIBUTES = cudaGraphDebugDotFlagsKernelNodeAttributes; cudaGraphDebugDotFlags GRAPH_DEBUG_DOT_FLAGS_HANDLES = cudaGraphDebugDotFlagsHandles; + + // CHECK: hipFlushGPUDirectRDMAWritesOptions flushGPUDirectRDMAWritesOptions; + // CHECK-NEXT: hipFlushGPUDirectRDMAWritesOptions flushGPUDirectRDMAWritesOptions_enum; + // CHECK-NEXT: hipFlushGPUDirectRDMAWritesOptions FLUSH_GPU_DIRECT_RDMA_WRITES_OPTION_HOST = hipFlushGPUDirectRDMAWritesOptionHost; + // CHECK-NEXT: hipFlushGPUDirectRDMAWritesOptions FLUSH_GPU_DIRECT_RDMA_WRITES_OPTION_MEMOPS = hipFlushGPUDirectRDMAWritesOptionMemOps; + CUflushGPUDirectRDMAWritesOptions flushGPUDirectRDMAWritesOptions; + CUflushGPUDirectRDMAWritesOptions_enum flushGPUDirectRDMAWritesOptions_enum; + CUflushGPUDirectRDMAWritesOptions FLUSH_GPU_DIRECT_RDMA_WRITES_OPTION_HOST = 
CU_FLUSH_GPU_DIRECT_RDMA_WRITES_OPTION_HOST; + CUflushGPUDirectRDMAWritesOptions FLUSH_GPU_DIRECT_RDMA_WRITES_OPTION_MEMOPS = CU_FLUSH_GPU_DIRECT_RDMA_WRITES_OPTION_MEMOPS; + + // CHECK: hipGPUDirectRDMAWritesOrdering GPUDirectRDMAWritesOrdering; + // CHECK-NEXT: hipGPUDirectRDMAWritesOrdering GPUDirectRDMAWritesOrdering_enum; + // CHECK-NEXT: hipGPUDirectRDMAWritesOrdering GPU_DIRECT_RDMA_WRITES_ORDERING_NONE = hipGPUDirectRDMAWritesOrderingNone; + // CHECK-NEXT: hipGPUDirectRDMAWritesOrdering GPU_DIRECT_RDMA_WRITES_ORDERING_OWNER = hipGPUDirectRDMAWritesOrderingOwner; + // CHECK-NEXT: hipGPUDirectRDMAWritesOrdering GPU_DIRECT_RDMA_WRITES_ORDERING_ALL_DEVICES = hipGPUDirectRDMAWritesOrderingAllDevices; + CUGPUDirectRDMAWritesOrdering GPUDirectRDMAWritesOrdering; + CUGPUDirectRDMAWritesOrdering_enum GPUDirectRDMAWritesOrdering_enum; + CUGPUDirectRDMAWritesOrdering GPU_DIRECT_RDMA_WRITES_ORDERING_NONE = CU_GPU_DIRECT_RDMA_WRITES_ORDERING_NONE; + CUGPUDirectRDMAWritesOrdering GPU_DIRECT_RDMA_WRITES_ORDERING_OWNER = CU_GPU_DIRECT_RDMA_WRITES_ORDERING_OWNER; + CUGPUDirectRDMAWritesOrdering GPU_DIRECT_RDMA_WRITES_ORDERING_ALL_DEVICES = CU_GPU_DIRECT_RDMA_WRITES_ORDERING_ALL_DEVICES; #endif #if CUDA_VERSION >= 11040 @@ -1112,6 +1132,32 @@ int main() { // CHECK-NEXT: hipGraphInstantiateFlags GRAPH_INSTANTIATE_FLAG_DEVICE_LAUNCH = hipGraphInstantiateFlagDeviceLaunch; CUgraphInstantiate_flags GRAPH_INSTANTIATE_FLAG_UPLOAD = CUDA_GRAPH_INSTANTIATE_FLAG_UPLOAD; CUgraphInstantiate_flags GRAPH_INSTANTIATE_FLAG_DEVICE_LAUNCH = CUDA_GRAPH_INSTANTIATE_FLAG_DEVICE_LAUNCH; + + // CHECK: hipGraphInstantiateResult graphInstantiateResult; + // CHECK-NEXT: hipGraphInstantiateResult graphInstantiateResult_enum; + // CHECK-NEXT: hipGraphInstantiateResult GRAPH_INSTANTIATE_SUCCESS = hipGraphInstantiateSuccess; + // CHECK-NEXT: hipGraphInstantiateResult GRAPH_INSTANTIATE_ERROR = hipGraphInstantiateError; + // CHECK-NEXT: hipGraphInstantiateResult GRAPH_INSTANTIATE_INVALID_STRUCTURE = 
hipGraphInstantiateInvalidStructure; + // CHECK-NEXT: hipGraphInstantiateResult GRAPH_INSTANTIATE_NODE_OPERATION_NOT_SUPPORTED = hipGraphInstantiateNodeOperationNotSupported; + // CHECK-NEXT: hipGraphInstantiateResult GRAPH_INSTANTIATE_MULTIPLE_CTXS_NOT_SUPPORTED = hipGraphInstantiateMultipleDevicesNotSupported; + CUgraphInstantiateResult graphInstantiateResult; + CUgraphInstantiateResult_enum graphInstantiateResult_enum; + CUgraphInstantiateResult GRAPH_INSTANTIATE_SUCCESS = CUDA_GRAPH_INSTANTIATE_SUCCESS; + CUgraphInstantiateResult GRAPH_INSTANTIATE_ERROR = CUDA_GRAPH_INSTANTIATE_ERROR; + CUgraphInstantiateResult GRAPH_INSTANTIATE_INVALID_STRUCTURE = CUDA_GRAPH_INSTANTIATE_INVALID_STRUCTURE; + CUgraphInstantiateResult GRAPH_INSTANTIATE_NODE_OPERATION_NOT_SUPPORTED = CUDA_GRAPH_INSTANTIATE_NODE_OPERATION_NOT_SUPPORTED; + CUgraphInstantiateResult GRAPH_INSTANTIATE_MULTIPLE_CTXS_NOT_SUPPORTED = CUDA_GRAPH_INSTANTIATE_MULTIPLE_CTXS_NOT_SUPPORTED; + + // CHECK: hipDriverProcAddressQueryResult driverProcAddressQueryResult; + // CHECK-NEXT:hipDriverProcAddressQueryResult driverProcAddressQueryResult_enum; + // CHECK-NEXT:hipDriverProcAddressQueryResult GET_PROC_ADDRESS_SUCCESS = HIP_GET_PROC_ADDRESS_SUCCESS; + // CHECK-NEXT:hipDriverProcAddressQueryResult GET_PROC_ADDRESS_SYMBOL_NOT_FOUND = HIP_GET_PROC_ADDRESS_SYMBOL_NOT_FOUND; + // CHECK-NEXT:hipDriverProcAddressQueryResult GET_PROC_ADDRESS_VERSION_NOT_SUFFICIENT = HIP_GET_PROC_ADDRESS_VERSION_NOT_SUFFICIENT; + CUdriverProcAddressQueryResult driverProcAddressQueryResult; + CUdriverProcAddressQueryResult_enum driverProcAddressQueryResult_enum; + CUdriverProcAddressQueryResult GET_PROC_ADDRESS_SUCCESS = CU_GET_PROC_ADDRESS_SUCCESS; + CUdriverProcAddressQueryResult GET_PROC_ADDRESS_SYMBOL_NOT_FOUND = CU_GET_PROC_ADDRESS_SYMBOL_NOT_FOUND; + CUdriverProcAddressQueryResult GET_PROC_ADDRESS_VERSION_NOT_SUFFICIENT = CU_GET_PROC_ADDRESS_VERSION_NOT_SUFFICIENT; #endif return 0; diff --git 
a/tests/unit_tests/synthetic/driver_functions.cu b/tests/unit_tests/synthetic/driver_functions.cu index 9b6b1d6f..58e8789f 100644 --- a/tests/unit_tests/synthetic/driver_functions.cu +++ b/tests/unit_tests/synthetic/driver_functions.cu @@ -1193,13 +1193,13 @@ int main() { result = cuGraphLaunch(graphExec, stream); // CUDA: CUresult CUDAAPI cuGraphMemcpyNodeGetParams(CUgraphNode hNode, CUDA_MEMCPY3D *nodeParams); - // HIP: hipError_t hipGraphMemcpyNodeGetParams(hipGraphNode_t node, hipMemcpy3DParms* pNodeParams); - // CHECK: result = hipGraphMemcpyNodeGetParams(graphNode, &MEMCPY3D); + // HIP: hipError_t hipDrvGraphMemcpyNodeGetParams(hipGraphNode_t node, hipMemcpy3DParms* pNodeParams); + // CHECK: result = hipDrvGraphMemcpyNodeGetParams(graphNode, &MEMCPY3D); result = cuGraphMemcpyNodeGetParams(graphNode, &MEMCPY3D); // CUDA: CUresult CUDAAPI cuGraphMemcpyNodeSetParams(CUgraphNode hNode, const CUDA_MEMCPY3D *nodeParams); - // HIP: hipError_t hipGraphMemcpyNodeSetParams(hipGraphNode_t node, const hipMemcpy3DParms* pNodeParams); - // CHECK: result = hipGraphMemcpyNodeSetParams(graphNode, &MEMCPY3D); + // HIP: hipError_t hipDrvGraphMemcpyNodeSetParams(hipGraphNode_t node, const hipMemcpy3DParms* pNodeParams); + // CHECK: result = hipDrvGraphMemcpyNodeSetParams(graphNode, &MEMCPY3D); result = cuGraphMemcpyNodeSetParams(graphNode, &MEMCPY3D); // CUDA: CUresult CUDAAPI cuGraphMemsetNodeGetParams(CUgraphNode hNode, CUDA_MEMSET_NODE_PARAMS *nodeParams); @@ -1746,8 +1746,8 @@ int main() { result = cuGraphMemAllocNodeGetParams(graphNode, &MEM_ALLOC_NODE_PARAMS); // CUDA: CUresult CUDAAPI cuGraphAddMemFreeNode(CUgraphNode *phGraphNode, CUgraph hGraph, const CUgraphNode *dependencies, size_t numDependencies, CUdeviceptr dptr); - // HIP: hipError_t hipGraphAddMemFreeNode(hipGraphNode_t* pGraphNode, hipGraph_t graph, const hipGraphNode_t* pDependencies, size_t numDependencies, void* dev_ptr); - // CHECK: result = hipGraphAddMemFreeNode(&graphNode, graph, &graphNode2, bytes, 
deviceptr); + // HIP: hipError_t hipDrvGraphAddMemFreeNode(hipGraphNode_t* pGraphNode, hipGraph_t graph, const hipGraphNode_t* pDependencies, size_t numDependencies, void* dev_ptr); + // CHECK: result = hipDrvGraphAddMemFreeNode(&graphNode, graph, &graphNode2, bytes, deviceptr); result = cuGraphAddMemFreeNode(&graphNode, graph, &graphNode2, bytes, deviceptr); // CUDA: CUresult CUDAAPI cuGraphMemFreeNodeGetParams(CUgraphNode hNode, CUdeviceptr *dptr_out); diff --git a/tests/unit_tests/synthetic/driver_structs.cu b/tests/unit_tests/synthetic/driver_structs.cu index e3f181ae..a56e7b98 100644 --- a/tests/unit_tests/synthetic/driver_structs.cu +++ b/tests/unit_tests/synthetic/driver_structs.cu @@ -308,6 +308,13 @@ int main() { CUDA_MEM_ALLOC_NODE_PARAMS_st MEM_ALLOC_NODE_PARAMS_st; #endif +#if CUDA_VERSION >= 12000 + // CHECK: hipGraphInstantiateParams GRAPH_INSTANTIATE_PARAMS_st; + // CHECK-NEXT: hipGraphInstantiateParams GRAPH_INSTANTIATE_PARAMS; + CUDA_GRAPH_INSTANTIATE_PARAMS_st GRAPH_INSTANTIATE_PARAMS_st; + CUDA_GRAPH_INSTANTIATE_PARAMS GRAPH_INSTANTIATE_PARAMS; +#endif + #if CUDA_VERSION >= 12020 // CHECK: hipMemAllocNodeParams MEM_ALLOC_NODE_PARAMS_v1_st; // CHECK-NEXT: hipMemAllocNodeParams MEM_ALLOC_NODE_PARAMS_v1; @@ -323,6 +330,36 @@ int main() { // CHECK-NEXT: hipExternalSemaphoreWaitNodeParams EXT_SEM_WAIT_NODE_PARAMS_v2; CUDA_EXT_SEM_WAIT_NODE_PARAMS_v2_st EXT_SEM_WAIT_NODE_PARAMS_v2_st; CUDA_EXT_SEM_WAIT_NODE_PARAMS_v2 EXT_SEM_WAIT_NODE_PARAMS_v2; + + // CHECK: hipMemcpyNodeParams MEMCPY_NODE_PARAMS_st; + // CHECK-NEXT: hipMemcpyNodeParams MEMCPY_NODE_PARAMS; + CUDA_MEMCPY_NODE_PARAMS_st MEMCPY_NODE_PARAMS_st; + CUDA_MEMCPY_NODE_PARAMS MEMCPY_NODE_PARAMS; + + // CHECK: hipChildGraphNodeParams CHILD_GRAPH_NODE_PARAMS_st; + // CHECK-NEXT: hipChildGraphNodeParams CHILD_GRAPH_NODE_PARAMS; + CUDA_CHILD_GRAPH_NODE_PARAMS_st CHILD_GRAPH_NODE_PARAMS_st; + CUDA_CHILD_GRAPH_NODE_PARAMS CHILD_GRAPH_NODE_PARAMS; + + // CHECK: hipMemFreeNodeParams 
MEM_FREE_NODE_PARAMS_st; + // CHECK-NEXT: hipMemFreeNodeParams MEM_FREE_NODE_PARAMS; + CUDA_MEM_FREE_NODE_PARAMS_st MEM_FREE_NODE_PARAMS_st; + CUDA_MEM_FREE_NODE_PARAMS MEM_FREE_NODE_PARAMS; + + // CHECK: hipEventRecordNodeParams EVENT_RECORD_NODE_PARAMS_st; + // CHECK-NEXT: hipEventRecordNodeParams EVENT_RECORD_NODE_PARAMS; + CUDA_EVENT_RECORD_NODE_PARAMS_st EVENT_RECORD_NODE_PARAMS_st; + CUDA_EVENT_RECORD_NODE_PARAMS EVENT_RECORD_NODE_PARAMS; + + // CHECK: hipEventWaitNodeParams EVENT_WAIT_NODE_PARAMS_st; + // CHECK-NEXT: hipEventWaitNodeParams EVENT_WAIT_NODE_PARAMS; + CUDA_EVENT_WAIT_NODE_PARAMS_st EVENT_WAIT_NODE_PARAMS_st; + CUDA_EVENT_WAIT_NODE_PARAMS EVENT_WAIT_NODE_PARAMS; + + // CHECK: hipGraphNodeParams graphNodeParams_st; + // CHECK-NEXT: hipGraphNodeParams graphNodeParams; + CUgraphNodeParams_st graphNodeParams_st; + CUgraphNodeParams graphNodeParams; #endif return 0; diff --git a/tests/unit_tests/synthetic/libraries/cusparse2hipsparse.cu b/tests/unit_tests/synthetic/libraries/cusparse2hipsparse.cu index fefca166..845051c6 100644 --- a/tests/unit_tests/synthetic/libraries/cusparse2hipsparse.cu +++ b/tests/unit_tests/synthetic/libraries/cusparse2hipsparse.cu @@ -145,7 +145,9 @@ int main() { int csrSortedRowPtr = 0; int csrSortedColInd = 0; int cscRowIndA = 0; + int cscRowIndB = 0; int cscColPtrA = 0; + int cscColPtrB = 0; int csrRowPtrA = 0; int csrRowPtrB = 0; int csrRowPtrD = 0; @@ -202,6 +204,7 @@ int main() { const void** const cooRowInd_const = const_cast<const void**>(&cooRowInd); int icooRowInd = 0; void *cscRowInd = nullptr; + const void** const cscRowInd_const = const_cast<const void**>(&cscRowInd); void *csrColInd = nullptr; const void** const csrColInd_const = const_cast<const void**>(&csrColInd); void *cooColInd = nullptr; @@ -213,11 +216,13 @@ int main() { void *csrValues = nullptr; const void** const csrValues_const = const_cast<const void**>(&csrValues); void *cscValues = nullptr; + const void** const cscValues_const = const_cast<const void**>(&cscValues); void *ellValue = nullptr; const void** const 
ellValue_const = const_cast<const void**>(&ellValue); void *csrRowOffsets = nullptr; const void** const csrRowOffsets_const = const_cast<const void**>(&csrRowOffsets); void *cscColOffsets = nullptr; + const void** const cscColOffsets_const = const_cast<const void**>(&cscColOffsets); void *cooRows = nullptr; int icooRows = 0; void *cooColumns = nullptr; @@ -322,6 +327,7 @@ int main() { bsric02Info_t bsric02_info; bsrsm2Info_t bsrsm2_info; bsrsv2Info_t bsrsv2_info; + csru2csrInfo_t csru2_info; // CHECK: hipDoubleComplex dcomplex, dcomplexA, dcomplexAlpha, dcomplexB, dcomplexBeta, dcomplexC, dcomplexF, dcomplexX, dcomplexY, dComplexbsrSortedValA, dComplexbsrSortedValC, dComplexcsrSortedValA, dComplexcsrSortedValB, dComplexcsrSortedValC, dComplexcsrSortedValD, dcomplextol, dComplexbsrSortedVal, dComplexbscVal, dComplexcscSortedVal, dcomplexds, dcomplexdl, dcomplexd, dcomplexdu, dcomplexdw, dcomplexx, dcomplex_boost_val, dcomplex_resultDevHostPtr; cuDoubleComplex dcomplex, dcomplexA, dcomplexAlpha, dcomplexB, dcomplexBeta, dcomplexC, dcomplexF, dcomplexX, dcomplexY, dComplexbsrSortedValA, dComplexbsrSortedValC, dComplexcsrSortedValA, dComplexcsrSortedValB, dComplexcsrSortedValC, dComplexcsrSortedValD, dcomplextol, dComplexbsrSortedVal, dComplexbscVal, dComplexcscSortedVal, dcomplexds, dcomplexdl, dcomplexd, dcomplexdu, dcomplexdw, dcomplexx, dcomplex_boost_val, dcomplex_resultDevHostPtr; @@ -1317,6 +1323,76 @@ int main() { // CHECK: status_t = hipsparseDestroyBsrilu02Info(bsrilu02_info); status_t = cusparseDestroyBsrilu02Info(bsrilu02_info); + // CUDA: CUSPARSE_DEPRECATED cusparseStatus_t CUSPARSEAPI cusparseCreateCsru2csrInfo(csru2csrInfo_t* info); + // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseCreateCsru2csrInfo(csru2csrInfo_t* info); + // CHECK: status_t = hipsparseCreateCsru2csrInfo(&csru2_info); + status_t = cusparseCreateCsru2csrInfo(&csru2_info); + + // CUDA: CUSPARSE_DEPRECATED cusparseStatus_t CUSPARSEAPI cusparseDestroyCsru2csrInfo(csru2csrInfo_t info); + // HIP: HIPSPARSE_EXPORT 
hipsparseStatus_t hipsparseDestroyCsru2csrInfo(csru2csrInfo_t info); + // CHECK: status_t = hipsparseDestroyCsru2csrInfo(csru2_info); + status_t = cusparseDestroyCsru2csrInfo(csru2_info); + + // CUDA: CUSPARSE_DEPRECATED cusparseStatus_t CUSPARSEAPI cusparseZcsru2csr(cusparseHandle_t handle, int m, int n, int nnz, const cusparseMatDescr_t descrA, cuDoubleComplex* csrVal, const int* csrRowPtr, int* csrColInd, csru2csrInfo_t info, void* pBuffer); + // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseZcsru2csr(hipsparseHandle_t handle, int m, int n, int nnz, const hipsparseMatDescr_t descrA, hipDoubleComplex* csrVal, const int* csrRowPtr, int* csrColInd, csru2csrInfo_t info, void* pBuffer); + // CHECK: status_t = hipsparseZcsru2csr(handle_t, m, n, innz, matDescr_A, &dComplexbsrSortedVal, &bsrSortedRowPtr, &bsrSortedColInd, csru2_info, pBuffer); + status_t = cusparseZcsru2csr(handle_t, m, n, innz, matDescr_A, &dComplexbsrSortedVal, &bsrSortedRowPtr, &bsrSortedColInd, csru2_info, pBuffer); + + // CUDA: CUSPARSE_DEPRECATED cusparseStatus_t CUSPARSEAPI cusparseCcsru2csr(cusparseHandle_t handle, int m, int n, int nnz, const cusparseMatDescr_t descrA, cuComplex* csrVal, const int* csrRowPtr, int* csrColInd, csru2csrInfo_t info, void* pBuffer); + // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseCcsru2csr(hipsparseHandle_t handle, int m, int n, int nnz, const hipsparseMatDescr_t descrA, hipComplex* csrVal, const int* csrRowPtr, int* csrColInd, csru2csrInfo_t info, void* pBuffer); + // CHECK: status_t = hipsparseCcsru2csr(handle_t, m, n, innz, matDescr_A, &complexbsrSortedVal, &bsrSortedRowPtr, &bsrSortedColInd, csru2_info, pBuffer); + status_t = cusparseCcsru2csr(handle_t, m, n, innz, matDescr_A, &complexbsrSortedVal, &bsrSortedRowPtr, &bsrSortedColInd, csru2_info, pBuffer); + + // CUDA: CUSPARSE_DEPRECATED cusparseStatus_t CUSPARSEAPI cusparseDcsru2csr(cusparseHandle_t handle, int m, int n, int nnz, const cusparseMatDescr_t descrA, double* csrVal, const int* csrRowPtr, 
int* csrColInd, csru2csrInfo_t info, void* pBuffer); + // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseDcsru2csr(hipsparseHandle_t handle, int m, int n, int nnz, const hipsparseMatDescr_t descrA, double* csrVal, const int* csrRowPtr, int* csrColInd, csru2csrInfo_t info, void* pBuffer); + // CHECK: status_t = hipsparseDcsru2csr(handle_t, m, n, innz, matDescr_A, &dbsrSortedVal, &bsrSortedRowPtr, &bsrSortedColInd, csru2_info, pBuffer); + status_t = cusparseDcsru2csr(handle_t, m, n, innz, matDescr_A, &dbsrSortedVal, &bsrSortedRowPtr, &bsrSortedColInd, csru2_info, pBuffer); + + // CUDA: CUSPARSE_DEPRECATED cusparseStatus_t CUSPARSEAPI cusparseScsru2csr(cusparseHandle_t handle, int m, int n, int nnz, const cusparseMatDescr_t descrA, float* csrVal, const int* csrRowPtr, int* csrColInd, csru2csrInfo_t info, void* pBuffer); + // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseScsru2csr(hipsparseHandle_t handle, int m, int n, int nnz, const hipsparseMatDescr_t descrA, float* csrVal, const int* csrRowPtr, int* csrColInd, csru2csrInfo_t info, void* pBuffer); + // CHECK: status_t = hipsparseScsru2csr(handle_t, m, n, innz, matDescr_A, &fbsrSortedVal, &bsrSortedRowPtr, &bsrSortedColInd, csru2_info, pBuffer); + status_t = cusparseScsru2csr(handle_t, m, n, innz, matDescr_A, &fbsrSortedVal, &bsrSortedRowPtr, &bsrSortedColInd, csru2_info, pBuffer); + + // CUDA: CUSPARSE_DEPRECATED cusparseStatus_t CUSPARSEAPI cusparseZcsru2csr_bufferSizeExt(cusparseHandle_t handle, int m, int n, int nnz, cuDoubleComplex* csrVal, const int* csrRowPtr, int* csrColInd, csru2csrInfo_t info, size_t* pBufferSizeInBytes); + // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseZcsru2csr_bufferSizeExt(hipsparseHandle_t handle, int m, int n, int nnz, hipDoubleComplex* csrVal, const int* csrRowPtr, int* csrColInd, csru2csrInfo_t info, size_t* pBufferSizeInBytes); + // CHECK: status_t = hipsparseZcsru2csr_bufferSizeExt(handle_t, m, n, innz, &dComplexbsrSortedVal, &bsrSortedRowPtr, &bsrSortedColInd, 
csru2_info, &bufferSize); + status_t = cusparseZcsru2csr_bufferSizeExt(handle_t, m, n, innz, &dComplexbsrSortedVal, &bsrSortedRowPtr, &bsrSortedColInd, csru2_info, &bufferSize); + + // CUDA: CUSPARSE_DEPRECATED cusparseStatus_t CUSPARSEAPI cusparseCcsru2csr_bufferSizeExt(cusparseHandle_t handle, int m, int n, int nnz, cuComplex* csrVal, const int* csrRowPtr, int* csrColInd, csru2csrInfo_t info, size_t* pBufferSizeInBytes); + // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseCcsru2csr_bufferSizeExt(hipsparseHandle_t handle, int m, int n, int nnz, hipComplex* csrVal, const int* csrRowPtr, int* csrColInd, csru2csrInfo_t info, size_t* pBufferSizeInBytes); + // CHECK: status_t = hipsparseCcsru2csr_bufferSizeExt(handle_t, m, n, innz, &complexbsrSortedVal, &bsrSortedRowPtr, &bsrSortedColInd, csru2_info, &bufferSize); + status_t = cusparseCcsru2csr_bufferSizeExt(handle_t, m, n, innz, &complexbsrSortedVal, &bsrSortedRowPtr, &bsrSortedColInd, csru2_info, &bufferSize); + + // CUDA: CUSPARSE_DEPRECATED cusparseStatus_t CUSPARSEAPI cusparseDcsru2csr_bufferSizeExt(cusparseHandle_t handle, int m, int n, int nnz, double* csrVal, const int* csrRowPtr, int* csrColInd, csru2csrInfo_t info, size_t* pBufferSizeInBytes); + // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseDcsru2csr_bufferSizeExt(hipsparseHandle_t handle, int m, int n, int nnz, double* csrVal, const int* csrRowPtr, int* csrColInd, csru2csrInfo_t info, size_t* pBufferSizeInBytes); + // CHECK: status_t = hipsparseDcsru2csr_bufferSizeExt(handle_t, m, n, innz, &dbsrSortedVal, &bsrSortedRowPtr, &bsrSortedColInd, csru2_info, &bufferSize); + status_t = cusparseDcsru2csr_bufferSizeExt(handle_t, m, n, innz, &dbsrSortedVal, &bsrSortedRowPtr, &bsrSortedColInd, csru2_info, &bufferSize); + + // CUDA: CUSPARSE_DEPRECATED cusparseStatus_t CUSPARSEAPI cusparseScsru2csr_bufferSizeExt(cusparseHandle_t handle, int m, int n, int nnz, float* csrVal, const int* csrRowPtr, int* csrColInd, csru2csrInfo_t info, size_t* pBufferSizeInBytes); + 
// HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseScsru2csr_bufferSizeExt(hipsparseHandle_t handle, int m, int n, int nnz, float* csrVal, const int* csrRowPtr, int* csrColInd, csru2csrInfo_t info, size_t* pBufferSizeInBytes); + // CHECK: status_t = hipsparseScsru2csr_bufferSizeExt(handle_t, m, n, innz, &fbsrSortedVal, &bsrSortedRowPtr, &bsrSortedColInd, csru2_info, &bufferSize); + status_t = cusparseScsru2csr_bufferSizeExt(handle_t, m, n, innz, &fbsrSortedVal, &bsrSortedRowPtr, &bsrSortedColInd, csru2_info, &bufferSize); + + // CUDA: CUSPARSE_DEPRECATED cusparseStatus_t CUSPARSEAPI cusparseZcsr2csru(cusparseHandle_t handle, int m, int n, int nnz, const cusparseMatDescr_t descrA, cuDoubleComplex* csrVal, const int* csrRowPtr, int* csrColInd, csru2csrInfo_t info, void* pBuffer); + // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseZcsr2csru(hipsparseHandle_t handle, int m, int n, int nnz, const hipsparseMatDescr_t descrA, hipDoubleComplex* csrVal, const int* csrRowPtr, int* csrColInd, csru2csrInfo_t info, void* pBuffer); + // CHECK: status_t = hipsparseZcsr2csru(handle_t, m, n, innz, matDescr_A, &dComplexbsrSortedVal, &bsrSortedRowPtr, &bsrSortedColInd, csru2_info, pBuffer); + status_t = cusparseZcsr2csru(handle_t, m, n, innz, matDescr_A, &dComplexbsrSortedVal, &bsrSortedRowPtr, &bsrSortedColInd, csru2_info, pBuffer); + + // CUDA: CUSPARSE_DEPRECATED cusparseStatus_t CUSPARSEAPI cusparseCcsr2csru(cusparseHandle_t handle, int m, int n, int nnz, const cusparseMatDescr_t descrA, cuComplex* csrVal, const int* csrRowPtr, int* csrColInd, csru2csrInfo_t info, void* pBuffer); + // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseCcsr2csru(hipsparseHandle_t handle, int m, int n, int nnz, const hipsparseMatDescr_t descrA, hipComplex* csrVal, const int* csrRowPtr, int* csrColInd, csru2csrInfo_t info, void* pBuffer); + // CHECK: status_t = hipsparseCcsr2csru(handle_t, m, n, innz, matDescr_A, &complexbsrSortedVal, &bsrSortedRowPtr, &bsrSortedColInd, csru2_info, pBuffer); + 
status_t = cusparseCcsr2csru(handle_t, m, n, innz, matDescr_A, &complexbsrSortedVal, &bsrSortedRowPtr, &bsrSortedColInd, csru2_info, pBuffer); + + // CUDA: CUSPARSE_DEPRECATED cusparseStatus_t CUSPARSEAPI cusparseDcsr2csru(cusparseHandle_t handle, int m, int n, int nnz, const cusparseMatDescr_t descrA, double* csrVal, const int* csrRowPtr, int* csrColInd, csru2csrInfo_t info, void* pBuffer); + // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseDcsr2csru(hipsparseHandle_t handle, int m, int n, int nnz, const hipsparseMatDescr_t descrA, double* csrVal, const int* csrRowPtr, int* csrColInd, csru2csrInfo_t info, void* pBuffer); + // CHECK: status_t = hipsparseDcsr2csru(handle_t, m, n, innz, matDescr_A, &dbsrSortedVal, &bsrSortedRowPtr, &bsrSortedColInd, csru2_info, pBuffer); + status_t = cusparseDcsr2csru(handle_t, m, n, innz, matDescr_A, &dbsrSortedVal, &bsrSortedRowPtr, &bsrSortedColInd, csru2_info, pBuffer); + + // CUDA: CUSPARSE_DEPRECATED cusparseStatus_t CUSPARSEAPI cusparseScsr2csru(cusparseHandle_t handle, int m, int n, int nnz, const cusparseMatDescr_t descrA, float* csrVal, const int* csrRowPtr, int* csrColInd, csru2csrInfo_t info, void* pBuffer); + // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseScsr2csru(hipsparseHandle_t handle, int m, int n, int nnz, const hipsparseMatDescr_t descrA, float* csrVal, const int* csrRowPtr, int* csrColInd, csru2csrInfo_t info, void* pBuffer); + // CHECK: status_t = hipsparseScsr2csru(handle_t, m, n, innz, matDescr_A, &fbsrSortedVal, &bsrSortedRowPtr, &bsrSortedColInd, csru2_info, pBuffer); + status_t = cusparseScsr2csru(handle_t, m, n, innz, matDescr_A, &fbsrSortedVal, &bsrSortedRowPtr, &bsrSortedColInd, csru2_info, pBuffer); + #if CUDA_VERSION >= 7050 // CUDA: cusparseStatus_t CUSPARSEAPI cusparseZgemvi(cusparseHandle_t handle, cusparseOperation_t transA, int m, int n, const cuDoubleComplex* alpha, const cuDoubleComplex* A, int lda, int nnz, const cuDoubleComplex* xVal, const int* xInd, const cuDoubleComplex* beta, 
cuDoubleComplex* y, cusparseIndexBase_t idxBase, void* pBuffer); // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseZgemvi(hipsparseHandle_t handle, hipsparseOperation_t transA, int m, int n, const hipDoubleComplex* alpha, const hipDoubleComplex* A, int lda, int nnz, const hipDoubleComplex* x, const int* xInd, const hipDoubleComplex* beta, hipDoubleComplex* y, hipsparseIndexBase_t idxBase, void* pBuffer); @@ -1416,6 +1492,26 @@ int main() { // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseCopyMatDescr(hipsparseMatDescr_t dest, const hipsparseMatDescr_t src); // CHECK: status_t = hipsparseCopyMatDescr(matDescr_t, matDescr_t_2); status_t = cusparseCopyMatDescr(matDescr_t, matDescr_t_2); + + // CUDA: CUSPARSE_DEPRECATED(cusparseSpMM) cusparseStatus_t CUSPARSEAPI cusparseZgemmi(cusparseHandle_t handle, int m, int n, int k, int nnz, const cuDoubleComplex* alpha, const cuDoubleComplex* A, int lda, const cuDoubleComplex* cscValB, const int* cscColPtrB, const int* cscRowIndB, const cuDoubleComplex* beta, cuDoubleComplex* C, int ldc); + // HIP: DEPRECATED_CUDA_11000("The routine will be removed in CUDA 12") HIPSPARSE_EXPORT hipsparseStatus_t hipsparseZgemmi(hipsparseHandle_t handle, int m, int n, int k, int nnz, const hipDoubleComplex* alpha, const hipDoubleComplex* A, int lda, const hipDoubleComplex* cscValB, const int* cscColPtrB, const int* cscRowIndB, const hipDoubleComplex* beta, hipDoubleComplex* C, int ldc); + // CHECK: status_t = hipsparseZgemmi(handle_t, m, n, k, innz, &dcomplexAlpha, &dcomplexA, lda, &dcomplexB, &cscColPtrB, &cscRowIndB, &dcomplexBeta, &dcomplexC, ldc); + status_t = cusparseZgemmi(handle_t, m, n, k, innz, &dcomplexAlpha, &dcomplexA, lda, &dcomplexB, &cscColPtrB, &cscRowIndB, &dcomplexBeta, &dcomplexC, ldc); + + // CUDA: CUSPARSE_DEPRECATED(cusparseSpMM) cusparseStatus_t CUSPARSEAPI cusparseCgemmi(cusparseHandle_t handle, int m, int n, int k, int nnz, const cuComplex* alpha, const cuComplex* A, int lda, const cuComplex* cscValB, const int* 
cscColPtrB, const int* cscRowIndB, const cuComplex* beta, cuComplex* C, int ldc); + // HIP: DEPRECATED_CUDA_11000("The routine will be removed in CUDA 12") HIPSPARSE_EXPORT hipsparseStatus_t hipsparseCgemmi(hipsparseHandle_t handle, int m, int n, int k, int nnz, const hipComplex* alpha, const hipComplex* A, int lda, const hipComplex* cscValB, const int* cscColPtrB, const int* cscRowIndB, const hipComplex* beta, hipComplex* C, int ldc); + // CHECK: status_t = hipsparseCgemmi(handle_t, m, n, k, innz, &complexAlpha, &complexA, lda, &complexB, &cscColPtrB, &cscRowIndB, &complexBeta, &complexC, ldc); + status_t = cusparseCgemmi(handle_t, m, n, k, innz, &complexAlpha, &complexA, lda, &complexB, &cscColPtrB, &cscRowIndB, &complexBeta, &complexC, ldc); + + // CUDA: CUSPARSE_DEPRECATED(cusparseSpMM) cusparseStatus_t CUSPARSEAPI cusparseDgemmi(cusparseHandle_t handle, int m, int n, int k, int nnz, const double* alpha, const double* A, int lda, const double* cscValB, const int* cscColPtrB, const int* cscRowIndB, const double* beta, double* C, int ldc); + // HIP: DEPRECATED_CUDA_11000("The routine will be removed in CUDA 12") HIPSPARSE_EXPORT hipsparseStatus_t hipsparseDgemmi(hipsparseHandle_t handle, int m, int n, int k, int nnz, const double* alpha, const double* A, int lda, const double* cscValB, const int* cscColPtrB, const int* cscRowIndB, const double* beta, double* C, int ldc); + // CHECK: status_t = hipsparseDgemmi(handle_t, m, n, k, innz, &dAlpha, &dA, lda, &dB, &cscColPtrB, &cscRowIndB, &dBeta, &dC, ldc); + status_t = cusparseDgemmi(handle_t, m, n, k, innz, &dAlpha, &dA, lda, &dB, &cscColPtrB, &cscRowIndB, &dBeta, &dC, ldc); + + // CUDA: CUSPARSE_DEPRECATED(cusparseSpMM) cusparseStatus_t CUSPARSEAPI cusparseSgemmi(cusparseHandle_t handle, int m, int n, int k, int nnz, const float* alpha, const float* A, int lda, const float* cscValB, const int* cscColPtrB, const int* cscRowIndB, const float* beta, float* C, int ldc); + // HIP: DEPRECATED_CUDA_11000("The routine will 
be removed in CUDA 12") HIPSPARSE_EXPORT hipsparseStatus_t hipsparseSgemmi(hipsparseHandle_t handle, int m, int n, int k, int nnz, const float* alpha, const float* A, int lda, const float* cscValB, const int* cscColPtrB, const int* cscRowIndB, const float* beta, float* C, int ldc); + // CHECK: status_t = hipsparseSgemmi(handle_t, m, n, k, innz, &fAlpha, &fA, lda, &fB, &cscColPtrB, &cscRowIndB, &fBeta, &fC, ldc); + status_t = cusparseSgemmi(handle_t, m, n, k, innz, &fAlpha, &fA, lda, &fB, &cscColPtrB, &cscRowIndB, &fBeta, &fC, ldc); #endif #if CUDA_VERSION >= 9000 @@ -1858,6 +1954,26 @@ int main() { // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseXcsrgeam2Nnz(hipsparseHandle_t handle, int m, int n, const hipsparseMatDescr_t descrA, int nnzA, const int* csrSortedRowPtrA, const int* csrSortedColIndA, const hipsparseMatDescr_t descrB, int nnzB, const int* csrSortedRowPtrB, const int* csrSortedColIndB, const hipsparseMatDescr_t descrC, int* csrSortedRowPtrC, int* nnzTotalDevHostPtr, void* workspace); // CHECK: status_t = hipsparseXcsrgeam2Nnz(handle_t, m, n, matDescr_A, nnza, &csrRowPtrA, &csrColIndA, matDescr_B, nnzb, &csrRowPtrB, &csrColIndB, matDescr_C, &csrRowPtrC, &nnzTotalDevHostPtr, workspace); status_t = cusparseXcsrgeam2Nnz(handle_t, m, n, matDescr_A, nnza, &csrRowPtrA, &csrColIndA, matDescr_B, nnzb, &csrRowPtrB, &csrColIndB, matDescr_C, &csrRowPtrC, &nnzTotalDevHostPtr, workspace); + + // CUDA: cusparseStatus_t CUSPARSEAPI cusparseZcsrgeam2_bufferSizeExt(cusparseHandle_t handle, int m, int n, const cuDoubleComplex* alpha, const cusparseMatDescr_t descrA, int nnzA, const cuDoubleComplex* csrSortedValA, const int* csrSortedRowPtrA, const int* csrSortedColIndA, const cuDoubleComplex* beta, const cusparseMatDescr_t descrB, int nnzB, const cuDoubleComplex* csrSortedValB, const int* csrSortedRowPtrB, const int* csrSortedColIndB, const cusparseMatDescr_t descrC, const cuDoubleComplex* csrSortedValC, const int* csrSortedRowPtrC, const int* csrSortedColIndC, 
size_t* pBufferSizeInBytes); + // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseZcsrgeam2_bufferSizeExt(hipsparseHandle_t handle, int m, int n, const hipDoubleComplex* alpha, const hipsparseMatDescr_t descrA, int nnzA, const hipDoubleComplex* csrSortedValA, const int* csrSortedRowPtrA, const int* csrSortedColIndA, const hipDoubleComplex* beta, const hipsparseMatDescr_t descrB, int nnzB, const hipDoubleComplex* csrSortedValB, const int* csrSortedRowPtrB, const int* csrSortedColIndB, const hipsparseMatDescr_t descrC, const hipDoubleComplex* csrSortedValC, const int* csrSortedRowPtrC, const int* csrSortedColIndC, size_t* pBufferSizeInBytes); + // CHECK: status_t = hipsparseZcsrgeam2_bufferSizeExt(handle_t, m, n, &dcomplexA, matDescr_A, nnza, &dComplexcsrSortedValA, &csrRowPtrA, &csrColIndA, &dcomplexB, matDescr_B, nnzb, &dComplexcsrSortedValB, &csrRowPtrB, &csrColIndB, matDescr_C, &dComplexcsrSortedValC, &csrRowPtrC, &csrColIndC, &bufferSize); + status_t = cusparseZcsrgeam2_bufferSizeExt(handle_t, m, n, &dcomplexA, matDescr_A, nnza, &dComplexcsrSortedValA, &csrRowPtrA, &csrColIndA, &dcomplexB, matDescr_B, nnzb, &dComplexcsrSortedValB, &csrRowPtrB, &csrColIndB, matDescr_C, &dComplexcsrSortedValC, &csrRowPtrC, &csrColIndC, &bufferSize); + + // CUDA: cusparseStatus_t CUSPARSEAPI cusparseCcsrgeam2_bufferSizeExt(cusparseHandle_t handle, int m, int n, const cuComplex* alpha, const cusparseMatDescr_t descrA, int nnzA, const cuComplex* csrSortedValA, const int* csrSortedRowPtrA, const int* csrSortedColIndA, const cuComplex* beta, const cusparseMatDescr_t descrB, int nnzB, const cuComplex* csrSortedValB, const int* csrSortedRowPtrB, const int* csrSortedColIndB, const cusparseMatDescr_t descrC, const cuComplex* csrSortedValC, const int* csrSortedRowPtrC, const int* csrSortedColIndC, size_t* pBufferSizeInBytes); + // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseCcsrgeam2_bufferSizeExt(hipsparseHandle_t handle, int m, int n, const hipComplex* alpha, const 
hipsparseMatDescr_t descrA, int nnzA, const hipComplex* csrSortedValA, const int* csrSortedRowPtrA, const int* csrSortedColIndA, const hipComplex* beta, const hipsparseMatDescr_t descrB, int nnzB, const hipComplex* csrSortedValB, const int* csrSortedRowPtrB, const int* csrSortedColIndB, const hipsparseMatDescr_t descrC, const hipComplex* csrSortedValC, const int* csrSortedRowPtrC, const int* csrSortedColIndC, size_t* pBufferSizeInBytes); + // CHECK: status_t = hipsparseCcsrgeam2_bufferSizeExt(handle_t, m, n, &complexA, matDescr_A, nnza, &complexcsrSortedValA, &csrRowPtrA, &csrColIndA, &complexB, matDescr_B, nnzb, &complexcsrSortedValB, &csrRowPtrB, &csrColIndB, matDescr_C, &complexcsrSortedValC, &csrRowPtrC, &csrColIndC, &bufferSize); + status_t = cusparseCcsrgeam2_bufferSizeExt(handle_t, m, n, &complexA, matDescr_A, nnza, &complexcsrSortedValA, &csrRowPtrA, &csrColIndA, &complexB, matDescr_B, nnzb, &complexcsrSortedValB, &csrRowPtrB, &csrColIndB, matDescr_C, &complexcsrSortedValC, &csrRowPtrC, &csrColIndC, &bufferSize); + + // CUDA: cusparseStatus_t CUSPARSEAPI cusparseDcsrgeam2_bufferSizeExt(cusparseHandle_t handle, int m, int n, const double* alpha, const cusparseMatDescr_t descrA, int nnzA, const double* csrSortedValA, const int* csrSortedRowPtrA, const int* csrSortedColIndA, const double* beta, const cusparseMatDescr_t descrB, int nnzB, const double* csrSortedValB, const int* csrSortedRowPtrB, const int* csrSortedColIndB, const cusparseMatDescr_t descrC, const double* csrSortedValC, const int* csrSortedRowPtrC, const int* csrSortedColIndC, size_t* pBufferSizeInBytes); + // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseDcsrgeam2_bufferSizeExt(hipsparseHandle_t handle, int m, int n, const double* alpha, const hipsparseMatDescr_t descrA, int nnzA, const double* csrSortedValA, const int* csrSortedRowPtrA, const int* csrSortedColIndA, const double* beta, const hipsparseMatDescr_t descrB, int nnzB, const double* csrSortedValB, const int* csrSortedRowPtrB, const 
int* csrSortedColIndB, const hipsparseMatDescr_t descrC, const double* csrSortedValC, const int* csrSortedRowPtrC, const int* csrSortedColIndC, size_t* pBufferSizeInBytes); + // CHECK: status_t = hipsparseDcsrgeam2_bufferSizeExt(handle_t, m, n, &dA, matDescr_A, nnza, &dcsrSortedValA, &csrRowPtrA, &csrColIndA, &dB, matDescr_B, nnzb, &dcsrSortedValB, &csrRowPtrB, &csrColIndB, matDescr_C, &dcsrSortedValC, &csrRowPtrC, &csrColIndC, &bufferSize); + status_t = cusparseDcsrgeam2_bufferSizeExt(handle_t, m, n, &dA, matDescr_A, nnza, &dcsrSortedValA, &csrRowPtrA, &csrColIndA, &dB, matDescr_B, nnzb, &dcsrSortedValB, &csrRowPtrB, &csrColIndB, matDescr_C, &dcsrSortedValC, &csrRowPtrC, &csrColIndC, &bufferSize); + + // CUDA: cusparseStatus_t CUSPARSEAPI cusparseScsrgeam2_bufferSizeExt(cusparseHandle_t handle, int m, int n, const float* alpha, const cusparseMatDescr_t descrA, int nnzA, const float* csrSortedValA, const int* csrSortedRowPtrA, const int* csrSortedColIndA, const float* beta, const cusparseMatDescr_t descrB, int nnzB, const float* csrSortedValB, const int* csrSortedRowPtrB, const int* csrSortedColIndB, const cusparseMatDescr_t descrC, const float* csrSortedValC, const int* csrSortedRowPtrC, const int* csrSortedColIndC, size_t* pBufferSizeInBytes); + // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseScsrgeam2_bufferSizeExt(hipsparseHandle_t handle, int m, int n, const float* alpha, const hipsparseMatDescr_t descrA, int nnzA, const float* csrSortedValA, const int* csrSortedRowPtrA, const int* csrSortedColIndA, const float* beta, const hipsparseMatDescr_t descrB, int nnzB, const float* csrSortedValB, const int* csrSortedRowPtrB, const int* csrSortedColIndB, const hipsparseMatDescr_t descrC, const float* csrSortedValC, const int* csrSortedRowPtrC, const int* csrSortedColIndC, size_t* pBufferSizeInBytes); + // CHECK: status_t = hipsparseScsrgeam2_bufferSizeExt(handle_t, m, n, &fA, matDescr_A, nnza, &csrSortedValA, &csrRowPtrA, &csrColIndA, &fB, matDescr_B, nnzb, 
&csrSortedValB, &csrRowPtrB, &csrColIndB, matDescr_C, &csrSortedValC, &csrRowPtrC, &csrColIndC, &bufferSize); + status_t = cusparseScsrgeam2_bufferSizeExt(handle_t, m, n, &fA, matDescr_A, nnza, &csrSortedValA, &csrRowPtrA, &csrColIndA, &fB, matDescr_B, nnzb, &csrSortedValB, &csrRowPtrB, &csrColIndB, matDescr_C, &csrSortedValC, &csrRowPtrC, &csrColIndC, &bufferSize); #endif #if CUDA_VERSION >= 10010 @@ -1866,6 +1982,11 @@ int main() { cusparseCsr2CscAlg_t Csr2CscAlg_t; cusparseCsr2CscAlg_t CSR2CSC_ALG1 = CUSPARSE_CSR2CSC_ALG1; + // CUDA: cusparseStatus_t CUSPARSEAPI cusparseCsr2cscEx2(cusparseHandle_t handle, int m, int n, int nnz, const void* csrVal, const int* csrRowPtr, const int* csrColInd, void* cscVal, int* cscColPtr, int* cscRowInd, cudaDataType valType, cusparseAction_t copyValues, cusparseIndexBase_t idxBase, cusparseCsr2CscAlg_t alg, void* buffer); + // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseCsr2cscEx2(hipsparseHandle_t handle, int m, int n, int nnz, const void* csrVal, const int* csrRowPtr, const int* csrColInd, void* cscVal, int* cscColPtr, int* cscRowInd, hipDataType valType, hipsparseAction_t copyValues, hipsparseIndexBase_t idxBase, hipsparseCsr2CscAlg_t alg, void* buffer); + // CHECK: status_t = hipsparseCsr2cscEx2(handle_t, m, n, innz, pcsrVal, &csrRowPtrA, &csrColIndA, pcscVal, &cscColPtrA, &cscRowIndA, dataType, action_t, indexBase_t, Csr2CscAlg_t, pBuffer); + status_t = cusparseCsr2cscEx2(handle_t, m, n, innz, pcsrVal, &csrRowPtrA, &csrColIndA, pcscVal, &cscColPtrA, &cscRowIndA, dataType, action_t, indexBase_t, Csr2CscAlg_t, pBuffer); + // CUDA: cusparseStatus_t CUSPARSEAPI cusparseCsr2cscEx2_bufferSize(cusparseHandle_t handle, int m, int n, int nnz, const void* csrVal, const int* csrRowPtr, const int* csrColInd, void* cscVal, int* cscColPtr, int* cscRowInd, cudaDataType valType, cusparseAction_t copyValues, cusparseIndexBase_t idxBase, cusparseCsr2CscAlg_t alg, size_t* bufferSize); // HIP: HIPSPARSE_EXPORT hipsparseStatus_t 
hipsparseCsr2cscEx2_bufferSize(hipsparseHandle_t handle, int m, int n, int nnz, const void* csrVal, const int* csrRowPtr, const int* csrColInd, void* cscVal, int* cscColPtr, int* cscRowInd, hipDataType valType, hipsparseAction_t copyValues, hipsparseIndexBase_t idxBase, hipsparseCsr2CscAlg_t alg, size_t* bufferSize); // CHECK: status_t = hipsparseCsr2cscEx2_bufferSize(handle_t, m, n, innz, pcsrVal, &csrRowPtrA, &csrColIndA, pcscVal, &cscColPtrA, &cscRowIndA, dataType, action_t, indexBase_t, Csr2CscAlg_t, &bufferSize); @@ -1979,7 +2100,6 @@ int main() { // CHECK: status_t = hipsparseSpMM_bufferSize(handle_t, opA, opB, alpha, spmatA, dnmatB, beta, dnmatC, dataType, spMMAlg_t, &bufferSize); status_t = cusparseSpMM_bufferSize(handle_t, opA, opB, alpha, spmatA, dnmatB, beta, dnmatC, dataType, spMMAlg_t, &bufferSize); - // TODO: Mark as C-Changed in 12.0.0 // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSpMM(cusparseHandle_t handle, cusparseOperation_t transA, cusparseOperation_t transB, const void* alpha, const cusparseSpMatDescr_t matA, const cusparseDnMatDescr_t matB, const void* beta, cusparseDnMatDescr_t matC, cudaDataType computeType, cusparseSpMMAlg_t alg, void* externalBuffer); // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseSpMM(hipsparseHandle_t handle, hipsparseOperation_t opA, hipsparseOperation_t opB, const void* alpha, const hipsparseSpMatDescr_t matA, const hipsparseDnMatDescr_t matB, const void* beta, const hipsparseDnMatDescr_t matC, hipDataType computeType, hipsparseSpMMAlg_t alg, void* externalBuffer); // CHECK: status_t = hipsparseSpMM(handle_t, opA, opB, alpha, spmatA, dnmatB, beta, dnmatC, dataType, spMMAlg_t, tempBuffer); @@ -2026,7 +2146,7 @@ int main() { status_t = cusparseDestroyCsrgemm2Info(csrgemm2_info); #endif -#if (CUDA_VERSION >= 10020 && CUDA_VERSION < 11000 && !defined(_WIN32)) || CUDA_VERSION >= 11000 +#if (CUDA_VERSION >= 10010 && CUSPARSE_VERSION >= 10200 && CUDA_VERSION < 11000 && !defined(_WIN32)) || CUDA_VERSION >= 11000 // 
CHECK: hipsparseSpVecDescr_t spVecDescr_t; cusparseSpVecDescr_t spVecDescr_t; @@ -2062,25 +2182,21 @@ int main() { // CHECK: status_t = hipsparseDestroyDnVec(dnVecDescr_t); status_t = cusparseDestroyDnVec(dnVecDescr_t); - // TODO: Mark as C-Changed in 12.0.0 // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSpVV_bufferSize(cusparseHandle_t handle, cusparseOperation_t opX, const cusparseSpVecDescr_t vecX, const cusparseDnVecDescr_t vecY, const void* result, cudaDataType computeType, size_t* bufferSize); // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseSpVV_bufferSize(hipsparseHandle_t handle, hipsparseOperation_t opX, hipsparseSpVecDescr_t vecX, hipsparseDnVecDescr_t vecY, void* result, hipDataType computeType, size_t* bufferSize); // CHECK: status_t = hipsparseSpVV_bufferSize(handle_t, opX, spVecDescr_t, vecY, result, dataType, &bufferSize); status_t = cusparseSpVV_bufferSize(handle_t, opX, spVecDescr_t, vecY, result, dataType, &bufferSize); - // TODO: Mark as C-Changed in 12.0.0 // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSpVV(cusparseHandle_t handle, cusparseOperation_t opX, const cusparseSpVecDescr_t vecX, const cusparseDnVecDescr_t vecY, void* result, cudaDataType computeType, void* externalBuffer); // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseSpVV(hipsparseHandle_t handle, hipsparseOperation_t opX, hipsparseSpVecDescr_t vecX, hipsparseDnVecDescr_t vecY, void* result, hipDataType computeType, void* externalBuffer); // CHECK: status_t = hipsparseSpVV(handle_t, opX, spVecDescr_t, vecY, result, dataType, tempBuffer); status_t = cusparseSpVV(handle_t, opX, spVecDescr_t, vecY, result, dataType, tempBuffer); - // TODO: Mark as C-Changed in 12.0.0 // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSpMV_bufferSize(cusparseHandle_t handle, cusparseOperation_t opA, const void* alpha, const cusparseSpMatDescr_t matA, const cusparseDnVecDescr_t vecX, const void* beta, const cusparseDnVecDescr_t vecY, cudaDataType computeType, cusparseSpMVAlg_t alg, size_t* bufferSize); 
// HIP: hipsparseStatus_t hipsparseSpMV_bufferSize(hipsparseHandle_t handle, hipsparseOperation_t opA, const void* alpha, const hipsparseSpMatDescr_t matA, const hipsparseDnVecDescr_t vecX, const void* beta, const hipsparseDnVecDescr_t vecY, hipDataType computeType, hipsparseSpMVAlg_t alg, size_t* bufferSize); // CHECK: status_t = hipsparseSpMV_bufferSize(handle_t, opA, alpha, spmatA, vecX, beta, vecY, dataType, spMVAlg_t, &bufferSize); status_t = cusparseSpMV_bufferSize(handle_t, opA, alpha, spmatA, vecX, beta, vecY, dataType, spMVAlg_t, &bufferSize); - // TODO: Mark as C-Changed in 12.0.0 // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSpMV(cusparseHandle_t handle, cusparseOperation_t opA, const void* alpha, const cusparseSpMatDescr_t matA, const cusparseDnVecDescr_t vecX, const void* beta, const cusparseDnVecDescr_t vecY, cudaDataType computeType, cusparseSpMVAlg_t alg, void* externalBuffer); // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseSpMV(hipsparseHandle_t handle, hipsparseOperation_t opA, const void* alpha, const hipsparseSpMatDescr_t matA, const hipsparseDnVecDescr_t vecX, const void* beta, const hipsparseDnVecDescr_t vecY, hipDataType computeType, hipsparseSpMVAlg_t alg, void* externalBuffer); // CHECK: status_t = hipsparseSpMV(handle_t, opA, alpha, spmatA, vecX, beta, vecY, dataType, spMVAlg_t, tempBuffer); @@ -2481,25 +2597,32 @@ int main() { // CHECK: status_t = hipsparseCsrSetPointers(spMatDescr_t, csrRowOffsets, csrColInd, csrValues); status_t = cusparseCsrSetPointers(spMatDescr_t, csrRowOffsets, csrColInd, csrValues); + // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSpGEMM_createDescr(cusparseSpGEMMDescr_t* descr); + // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseSpGEMM_createDescr(hipsparseSpGEMMDescr_t* descr); + // CHECK: status_t = hipsparseSpGEMM_createDescr(&spGEMMDescr); + status_t = cusparseSpGEMM_createDescr(&spGEMMDescr); + + // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSpGEMM_destroyDescr(cusparseSpGEMMDescr_t descr); + // HIP: 
HIPSPARSE_EXPORT hipsparseStatus_t hipsparseSpGEMM_destroyDescr(hipsparseSpGEMMDescr_t descr); + // CHECK: status_t = hipsparseSpGEMM_destroyDescr(spGEMMDescr); + status_t = cusparseSpGEMM_destroyDescr(spGEMMDescr); + #if CUDA_VERSION < 12000 // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSpMatGetSize(cusparseSpMatDescr_t spMatDescr, int64_t* rows, int64_t* cols, int64_t* nnz); // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseSpMatGetSize(hipsparseSpMatDescr_t spMatDescr, int64_t* rows, int64_t* cols, int64_t* nnz); // CHECK: status_t = hipsparseSpMatGetSize(spMatDescr_t, &rows, &cols, &nnz); status_t = cusparseSpMatGetSize(spMatDescr_t, &rows, &cols, &nnz); - // TODO: Mark as C-Changed in 12.0.0 // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSpGEMM_workEstimation(cusparseHandle_t handle, cusparseOperation_t opA, cusparseOperation_t opB, const void* alpha, cusparseSpMatDescr_t matA, cusparseSpMatDescr_t matB, const void* beta, cusparseSpMatDescr_t matC, cudaDataType computeType, cusparseSpGEMMAlg_t alg, cusparseSpGEMMDescr_t spgemmDescr, size_t* bufferSize1, void* externalBuffer1); // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseSpGEMM_workEstimation(hipsparseHandle_t handle, hipsparseOperation_t opA, hipsparseOperation_t opB, const void* alpha, hipsparseSpMatDescr_t matA, hipsparseSpMatDescr_t matB, const void* beta, hipsparseSpMatDescr_t matC, hipDataType computeType, hipsparseSpGEMMAlg_t alg, hipsparseSpGEMMDescr_t spgemmDescr, size_t* bufferSize1, void* externalBuffer1); // CHECK: status_t = hipsparseSpGEMM_workEstimation(handle_t, opA, opB, alpha, spmatA, spmatB, beta, spmatC, dataType, spGEMMAlg_t, spGEMMDescr, &bufferSize, tempBuffer); status_t = cusparseSpGEMM_workEstimation(handle_t, opA, opB, alpha, spmatA, spmatB, beta, spmatC, dataType, spGEMMAlg_t, spGEMMDescr, &bufferSize, tempBuffer); - // TODO: Mark as C-Changed in 12.0.0 // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSpGEMM_compute(cusparseHandle_t handle, cusparseOperation_t opA, 
cusparseOperation_t opB, const void* alpha, cusparseSpMatDescr_t matA, cusparseSpMatDescr_t matB, const void* beta, cusparseSpMatDescr_t matC, cudaDataType computeType, cusparseSpGEMMAlg_t alg, cusparseSpGEMMDescr_t spgemmDescr, size_t* bufferSize2, void* externalBuffer2); // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseSpGEMM_compute(hipsparseHandle_t handle, hipsparseOperation_t opA, hipsparseOperation_t opB, const void* alpha, hipsparseSpMatDescr_t matA, hipsparseSpMatDescr_t matB, const void* beta, hipsparseSpMatDescr_t matC, hipDataType computeType, hipsparseSpGEMMAlg_t alg, hipsparseSpGEMMDescr_t spgemmDescr, size_t* bufferSize2, void* externalBuffer2); // CHECK: status_t = hipsparseSpGEMM_compute(handle_t, opA, opB, alpha, spmatA, spmatB, beta, spmatC, dataType, spGEMMAlg_t, spGEMMDescr, &bufferSize, tempBuffer); status_t = cusparseSpGEMM_compute(handle_t, opA, opB, alpha, spmatA, spmatB, beta, spmatC, dataType, spGEMMAlg_t, spGEMMDescr, &bufferSize, tempBuffer); - // TODO: Mark as C-Changed in 12.0.0 // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSpGEMM_copy(cusparseHandle_t handle, cusparseOperation_t opA, cusparseOperation_t opB, const void* alpha, cusparseSpMatDescr_t matA, cusparseSpMatDescr_t matB, const void* beta, cusparseSpMatDescr_t matC, cudaDataType computeType, cusparseSpGEMMAlg_t alg, cusparseSpGEMMDescr_t spgemmDescr); // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseSpGEMM_copy(hipsparseHandle_t handle, hipsparseOperation_t opA, hipsparseOperation_t opB, const void* alpha, hipsparseSpMatDescr_t matA, hipsparseSpMatDescr_t matB, const void* beta, hipsparseSpMatDescr_t matC, hipDataType computeType, hipsparseSpGEMMAlg_t alg, hipsparseSpGEMMDescr_t spgemmDescr); // CHECK: status_t = hipsparseSpGEMM_copy(handle_t, opA, opB, alpha, spmatA, spmatB, beta, spmatC, dataType, spGEMMAlg_t, spGEMMDescr); @@ -2539,19 +2662,16 @@ int main() { status_t = cusparseRot(handle_t, c_coeff, s_coeff, spVecDescr_t, vecY); #if CUDA_VERSION < 12000 - // TODO: 
Mark as C-Changed in 12.0.0 // CUDA: cusparseStatus_t CUSPARSEAPI cusparseScatter(cusparseHandle_t handle, cusparseSpVecDescr_t vecX, cusparseDnVecDescr_t vecY); // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseScatter(hipsparseHandle_t handle, hipsparseSpVecDescr_t vecX, hipsparseDnVecDescr_t vecY); // CHECK: status_t = hipsparseScatter(handle_t, spVecDescr_t, vecY); status_t = cusparseScatter(handle_t, spVecDescr_t, vecY); - // TODO: Mark as C-Changed in 12.0.0 // CUDA: cusparseStatus_t CUSPARSEAPI cusparseGather(cusparseHandle_t handle, cusparseDnVecDescr_t vecY, cusparseSpVecDescr_t vecX); // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseGather(hipsparseHandle_t handle, hipsparseDnVecDescr_t vecY, hipsparseSpVecDescr_t vecX); // CHECK: status_t = hipsparseGather(handle_t, vecY, spVecDescr_t); status_t = cusparseGather(handle_t, vecY, spVecDescr_t); - // TODO: Mark as C-Changed in 12.0.0 // CUDA: CUSPARSE_DEPRECATED(cusparseAxpby) cusparseStatus_t CUSPARSEAPI cusparseSaxpyi(cusparseHandle_t handle, int nnz, const float* alpha, const float* xVal, const int* xInd, float* y, cusparseIndexBase_t idxBase); // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseAxpby(hipsparseHandle_t handle, const void* alpha, hipsparseSpVecDescr_t vecX, const void* beta, hipsparseDnVecDescr_t vecY); // CHECK: status_t = hipsparseAxpby(handle_t, alpha, spVecDescr_t, beta, vecY); @@ -2606,7 +2726,6 @@ int main() { // CHECK: status_t = hipsparseDenseToSparse_analysis(handle_t, dnmatA, spmatB, denseToSparseAlg_t, tempBuffer); status_t = cusparseDenseToSparse_analysis(handle_t, dnmatA, spmatB, denseToSparseAlg_t, tempBuffer); - // TODO: Mark as C-Changed in 12.0.0 // CUDA: cusparseStatus_t CUSPARSEAPI cusparseDenseToSparse_convert(cusparseHandle_t handle, cusparseDnMatDescr_t matA, cusparseSpMatDescr_t matB, cusparseDenseToSparseAlg_t alg, void* buffer); // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseDenseToSparse_convert(hipsparseHandle_t handle, hipsparseDnMatDescr_t matA, 
hipsparseSpMatDescr_t matB, hipsparseDenseToSparseAlg_t alg, void* externalBuffer); // CHECK: status_t = hipsparseDenseToSparse_convert(handle_t, dnmatA, spmatB, denseToSparseAlg_t, tempBuffer); @@ -2650,25 +2769,21 @@ int main() { status_t = cusparseBlockedEllGet(spMatDescr_t, &rows, &cols, &ellBlockSize, &ellCols, &ellColInd, &ellValue, &ellIdxType, &indexBase_t, &dataType); #if CUDA_VERSION < 12000 - // TODO: Mark as C-Changed in 12.0.0 // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSpMM_preprocess(cusparseHandle_t handle, cusparseOperation_t opA, cusparseOperation_t opB, const void* alpha, cusparseSpMatDescr_t matA, cusparseDnMatDescr_t matB, const void* beta, cusparseDnMatDescr_t matC, cudaDataType computeType, cusparseSpMMAlg_t alg, void* externalBuffer); // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseSpMM_preprocess(hipsparseHandle_t handle, hipsparseOperation_t opA, hipsparseOperation_t opB, const void* alpha, const hipsparseSpMatDescr_t matA, const hipsparseDnMatDescr_t matB, const void* beta, const hipsparseDnMatDescr_t matC, hipDataType computeType, hipsparseSpMMAlg_t alg, void* externalBuffer); // CHECK: status_t = hipsparseSpMM_preprocess(handle_t, opA, opB, alpha, spmatA, dnmatB, beta, dnmatC, dataType, spMMAlg_t, tempBuffer); status_t = cusparseSpMM_preprocess(handle_t, opA, opB, alpha, spmatA, dnmatB, beta, dnmatC, dataType, spMMAlg_t, tempBuffer); - // TODO: Mark as C-Changed in 12.0.0 // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSDDMM_bufferSize(cusparseHandle_t handle, cusparseOperation_t opA, cusparseOperation_t opB, const void* alpha, cusparseDnMatDescr_t matA, cusparseDnMatDescr_t matB, const void* beta, cusparseSpMatDescr_t matC, cudaDataType computeType, cusparseSDDMMAlg_t alg, size_t* bufferSize); // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseSDDMM_bufferSize(hipsparseHandle_t handle, hipsparseOperation_t opA, hipsparseOperation_t opB, const void* alpha, const hipsparseDnMatDescr_t A, const hipsparseDnMatDescr_t B, const void* 
beta, hipsparseSpMatDescr_t C, hipDataType computeType, hipsparseSDDMMAlg_t alg, size_t* bufferSize); // CHECK: status_t = hipsparseSDDMM_bufferSize(handle_t, opA, opB, alpha, dnmatA, dnmatB, beta, spmatC, dataType, sDDMMAlg_t, &bufferSize); status_t = cusparseSDDMM_bufferSize(handle_t, opA, opB, alpha, dnmatA, dnmatB, beta, spmatC, dataType, sDDMMAlg_t, &bufferSize); - // TODO: Mark as C-Changed in 12.0.0 // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSDDMM_preprocess(cusparseHandle_t handle, cusparseOperation_t opA, cusparseOperation_t opB, const void* alpha, cusparseDnMatDescr_t matA, cusparseDnMatDescr_t matB, const void* beta, cusparseSpMatDescr_t matC, cudaDataType computeType, cusparseSDDMMAlg_t alg, void* externalBuffer); // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseSDDMM_preprocess(hipsparseHandle_t handle, hipsparseOperation_t opA, hipsparseOperation_t opB, const void* alpha, const hipsparseDnMatDescr_t A, const hipsparseDnMatDescr_t B, const void* beta, hipsparseSpMatDescr_t C, hipDataType computeType, hipsparseSDDMMAlg_t alg, void* tempBuffer); // CHECK: status_t = hipsparseSDDMM_preprocess(handle_t, opA, opB, alpha, dnmatA, dnmatB, beta, spmatC, dataType, sDDMMAlg_t, tempBuffer); status_t = cusparseSDDMM_preprocess(handle_t, opA, opB, alpha, dnmatA, dnmatB, beta, spmatC, dataType, sDDMMAlg_t, tempBuffer); - // TODO: Mark as C-Changed in 12.0.0 // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSDDMM(cusparseHandle_t handle, cusparseOperation_t opA, cusparseOperation_t opB, const void* alpha, cusparseDnMatDescr_t matA, cusparseDnMatDescr_t matB, const void* beta, cusparseSpMatDescr_t matC, cudaDataType computeType, cusparseSDDMMAlg_t alg, void* externalBuffer); // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseSDDMM(hipsparseHandle_t handle, hipsparseOperation_t opA, hipsparseOperation_t opB, const void* alpha, const hipsparseDnMatDescr_t A, const hipsparseDnMatDescr_t B, const void* beta, hipsparseSpMatDescr_t C, hipDataType computeType, 
hipsparseSDDMMAlg_t alg, void* tempBuffer); // CHECK: status_t = hipsparseSDDMM(handle_t, opA, opB, alpha, dnmatA, dnmatB, beta, spmatC, dataType, sDDMMAlg_t, tempBuffer); @@ -2692,25 +2807,32 @@ int main() { // CHECK: hipsparseSpSVDescr_t spSVDescr; cusparseSpSVDescr_t spSVDescr; + // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSpSV_createDescr(cusparseSpSVDescr_t* descr); + // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseSpSV_createDescr(hipsparseSpSVDescr_t* descr); + // CHECK: status_t = hipsparseSpSV_createDescr(&spSVDescr); + status_t = cusparseSpSV_createDescr(&spSVDescr); + + // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSpSV_destroyDescr(cusparseSpSVDescr_t descr); + // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseSpSV_destroyDescr(hipsparseSpSVDescr_t descr); + // CHECK: status_t = hipsparseSpSV_destroyDescr(spSVDescr); + status_t = cusparseSpSV_destroyDescr(spSVDescr); + #if CUDA_VERSION < 12000 // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSpMatGetAttribute(cusparseSpMatDescr_t spMatDescr, cusparseSpMatAttribute_t attribute, void* data, size_t dataSize); // HIP: hipsparseStatus_t hipsparseSpMatGetAttribute(hipsparseSpMatDescr_t spMatDescr, hipsparseSpMatAttribute_t attribute, void* data, size_t dataSize); // CHECK: status_t = hipsparseSpMatGetAttribute(spMatDescr_t, spMatAttribute_t, &data, dataSize); status_t = cusparseSpMatGetAttribute(spMatDescr_t, spMatAttribute_t, &data, dataSize); - // TODO: Mark as C-Changed in 12.0.0 // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSpSV_bufferSize(cusparseHandle_t handle, cusparseOperation_t opA, const void* alpha, cusparseSpMatDescr_t matA, cusparseDnVecDescr_t vecX, cusparseDnVecDescr_t vecY, cudaDataType computeType, cusparseSpSVAlg_t alg, cusparseSpSVDescr_t spsvDescr, size_t* bufferSize); // HIP: hipsparseStatus_t hipsparseSpSV_bufferSize(hipsparseHandle_t handle, hipsparseOperation_t opA, const void* alpha, const hipsparseSpMatDescr_t matA, const hipsparseDnVecDescr_t x, const hipsparseDnVecDescr_t y, 
hipDataType computeType, hipsparseSpSVAlg_t alg, hipsparseSpSVDescr_t spsvDescr, size_t* bufferSize); // CHECK: status_t = hipsparseSpSV_bufferSize(handle_t, opA, alpha, spmatA, vecX, vecY, dataType, spSVAlg_t, spSVDescr, &bufferSize); status_t = cusparseSpSV_bufferSize(handle_t, opA, alpha, spmatA, vecX, vecY, dataType, spSVAlg_t, spSVDescr, &bufferSize); - // TODO: Mark as C-Changed in 12.0.0 // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSpSV_analysis(cusparseHandle_t handle, cusparseOperation_t opA, const void* alpha, cusparseSpMatDescr_t matA, cusparseDnVecDescr_t vecX, cusparseDnVecDescr_t vecY, cudaDataType computeType, cusparseSpSVAlg_t alg, cusparseSpSVDescr_t spsvDescr, void* externalBuffer); // HIP: hipsparseStatus_t hipsparseSpSV_analysis(hipsparseHandle_t handle, hipsparseOperation_t opA, const void* alpha, const hipsparseSpMatDescr_t matA, const hipsparseDnVecDescr_t x, const hipsparseDnVecDescr_t y, hipDataType computeType, hipsparseSpSVAlg_t alg, hipsparseSpSVDescr_t spsvDescr, void* externalBuffer); // CHECK: status_t = hipsparseSpSV_analysis(handle_t, opA, alpha, spmatA, vecX, vecY, dataType, spSVAlg_t, spSVDescr, tempBuffer); status_t = cusparseSpSV_analysis(handle_t, opA, alpha, spmatA, vecX, vecY, dataType, spSVAlg_t, spSVDescr, tempBuffer); - // TODO: Mark as C-Changed in 12.0.0 // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSpSV_solve(cusparseHandle_t handle, cusparseOperation_t opA, const void* alpha, cusparseSpMatDescr_t matA, cusparseDnVecDescr_t vecX, cusparseDnVecDescr_t vecY, cudaDataType computeType, cusparseSpSVAlg_t alg, cusparseSpSVDescr_t spsvDescr); // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseSpSV_solve(hipsparseHandle_t handle, hipsparseOperation_t opA, const void* alpha, const hipsparseSpMatDescr_t matA, const hipsparseDnVecDescr_t x, const hipsparseDnVecDescr_t y, hipDataType computeType, hipsparseSpSVAlg_t alg, hipsparseSpSVDescr_t spsvDescr); // CHECK: status_t = hipsparseSpSV_solve(handle_t, opA, alpha, spmatA, vecX, 
vecY, dataType, spSVAlg_t, spSVDescr); @@ -2737,32 +2859,64 @@ int main() { cusparseSpGEMMAlg_t SPGEMM_CSR_ALG_DETERMINITIC = CUSPARSE_SPGEMM_CSR_ALG_DETERMINITIC; cusparseSpGEMMAlg_t SPGEMM_CSR_ALG_NONDETERMINITIC = CUSPARSE_SPGEMM_CSR_ALG_NONDETERMINITIC; + // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSpSM_createDescr(cusparseSpSMDescr_t* descr); + // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseSpSM_createDescr(hipsparseSpSMDescr_t* descr); + // CHECK: status_t = hipsparseSpSM_createDescr(&spSMDescr); + status_t = cusparseSpSM_createDescr(&spSMDescr); + + // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSpSM_destroyDescr(cusparseSpSMDescr_t descr); + // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseSpSM_destroyDescr(hipsparseSpSMDescr_t descr); + // CHECK: status_t = hipsparseSpSM_destroyDescr(spSMDescr); + status_t = cusparseSpSM_destroyDescr(spSMDescr); + +#if CUDA_VERSION < 11000 + // CUDA: CUSPARSE_DEPRECATED_HINT(cusparseXcsrgemm2) cusparseStatus_t CUSPARSEAPI cusparseZcsrgemm(cusparseHandle_t handle, cusparseOperation_t transA, cusparseOperation_t transB, int m, int n, int k, const cusparseMatDescr_t descrA, int nnzA, const cuDoubleComplex* csrSortedValA, const int* csrSortedRowPtrA, const int* csrSortedColIndA, const cusparseMatDescr_t descrB, int nnzB, const cuDoubleComplex* csrSortedValB, const int* csrSortedRowPtrB, const int* csrSortedColIndB, const cusparseMatDescr_t descrC, cuDoubleComplex* csrSortedValC, const int* csrSortedRowPtrC, int* csrSortedColIndC); + // HIP: DEPRECATED_CUDA_10000("The routine will be removed in CUDA 11") HIPSPARSE_EXPORT hipsparseStatus_t hipsparseZcsrgemm(hipsparseHandle_t handle, hipsparseOperation_t transA, hipsparseOperation_t transB, int m, int n, int k, const hipsparseMatDescr_t descrA, int nnzA, const hipDoubleComplex* csrValA, const int* csrRowPtrA, const int* csrColIndA, const hipsparseMatDescr_t descrB, int nnzB, const hipDoubleComplex* csrValB, const int* csrRowPtrB, const int* csrColIndB, const 
hipsparseMatDescr_t descrC, hipDoubleComplex* csrValC, const int* csrRowPtrC, int* csrColIndC); + // CHECK: status_t = hipsparseZcsrgemm(handle_t, opA, opB, m, n, k, matDescr_A, nnza, &dcomplexA, &csrRowPtrA, &csrColIndA, matDescr_B, nnzb, &dComplexcsrSortedValB, &csrRowPtrB, &csrColIndB, matDescr_C, &dComplexcsrSortedValC, &csrRowPtrC, &csrColIndD); + status_t = cusparseZcsrgemm(handle_t, opA, opB, m, n, k, matDescr_A, nnza, &dcomplexA, &csrRowPtrA, &csrColIndA, matDescr_B, nnzb, &dComplexcsrSortedValB, &csrRowPtrB, &csrColIndB, matDescr_C, &dComplexcsrSortedValC, &csrRowPtrC, &csrColIndD); + + // CUDA: CUSPARSE_DEPRECATED_HINT(cusparseXcsrgemm2) cusparseStatus_t CUSPARSEAPI cusparseCcsrgemm(cusparseHandle_t handle, cusparseOperation_t transA, cusparseOperation_t transB, int m, int n, int k, const cusparseMatDescr_t descrA, int nnzA, const cuComplex* csrSortedValA, const int* csrSortedRowPtrA, const int* csrSortedColIndA, const cusparseMatDescr_t descrB, int nnzB, const cuComplex* csrSortedValB, const int* csrSortedRowPtrB, const int* csrSortedColIndB, const cusparseMatDescr_t descrC, cuComplex* csrSortedValC, const int* csrSortedRowPtrC, int* csrSortedColIndC); + // HIP: DEPRECATED_CUDA_10000("The routine will be removed in CUDA 11") HIPSPARSE_EXPORT hipsparseStatus_t hipsparseCcsrgemm(hipsparseHandle_t handle, hipsparseOperation_t transA, hipsparseOperation_t transB, int m, int n, int k, const hipsparseMatDescr_t descrA, int nnzA, const hipComplex* csrValA, const int* csrRowPtrA, const int* csrColIndA, const hipsparseMatDescr_t descrB, int nnzB, const hipComplex* csrValB, const int* csrRowPtrB, const int* csrColIndB, const hipsparseMatDescr_t descrC, hipComplex* csrValC, const int* csrRowPtrC, int* csrColIndC); + // CHECK: status_t = hipsparseCcsrgemm(handle_t, opA, opB, m, n, k, matDescr_A, nnza, &complexA, &csrRowPtrA, &csrColIndA, matDescr_B, nnzb, &complexcsrSortedValB, &csrRowPtrB, &csrColIndB, matDescr_C, &complexcsrSortedValC, &csrRowPtrC, &csrColIndD); + 
status_t = cusparseCcsrgemm(handle_t, opA, opB, m, n, k, matDescr_A, nnza, &complexA, &csrRowPtrA, &csrColIndA, matDescr_B, nnzb, &complexcsrSortedValB, &csrRowPtrB, &csrColIndB, matDescr_C, &complexcsrSortedValC, &csrRowPtrC, &csrColIndD); + + // CUDA: CUSPARSE_DEPRECATED_HINT(cusparseXcsrgemm2) cusparseStatus_t CUSPARSEAPI cusparseDcsrgemm(cusparseHandle_t handle, cusparseOperation_t transA, cusparseOperation_t transB, int m, int n, int k, const cusparseMatDescr_t descrA, int nnzA, const double* csrSortedValA, const int* csrSortedRowPtrA, const int* csrSortedColIndA, const cusparseMatDescr_t descrB, int nnzB, const double* csrSortedValB, const int* csrSortedRowPtrB, const int* csrSortedColIndB, const cusparseMatDescr_t descrC, double* csrSortedValC, const int* csrSortedRowPtrC, int* csrSortedColIndC); + // HIP: DEPRECATED_CUDA_10000("The routine will be removed in CUDA 11") HIPSPARSE_EXPORT hipsparseStatus_t hipsparseDcsrgemm(hipsparseHandle_t handle, hipsparseOperation_t transA, hipsparseOperation_t transB, int m, int n, int k, const hipsparseMatDescr_t descrA, int nnzA, const double* csrValA, const int* csrRowPtrA, const int* csrColIndA, const hipsparseMatDescr_t descrB, int nnzB, const double* csrValB, const int* csrRowPtrB, const int* csrColIndB, const hipsparseMatDescr_t descrC, double* csrValC, const int* csrRowPtrC, int* csrColIndC); + // CHECK: status_t = hipsparseDcsrgemm(handle_t, opA, opB, m, n, k, matDescr_A, nnza, &dA, &csrRowPtrA, &csrColIndA, matDescr_B, nnzb, &dB, &csrRowPtrB, &csrColIndB, matDescr_C, &dC, &csrRowPtrC, &csrColIndD); + status_t = cusparseDcsrgemm(handle_t, opA, opB, m, n, k, matDescr_A, nnza, &dA, &csrRowPtrA, &csrColIndA, matDescr_B, nnzb, &dB, &csrRowPtrB, &csrColIndB, matDescr_C, &dC, &csrRowPtrC, &csrColIndD); + + // CUDA: CUSPARSE_DEPRECATED_HINT(cusparseXcsrgemm2) cusparseStatus_t CUSPARSEAPI cusparseScsrgemm(cusparseHandle_t handle, cusparseOperation_t transA, cusparseOperation_t transB, int m, int n, int k, const 
cusparseMatDescr_t descrA, const int nnzA, const float* csrSortedValA, const int* csrSortedRowPtrA, const int* csrSortedColIndA, const cusparseMatDescr_t descrB, const int nnzB, const float* csrSortedValB, const int* csrSortedRowPtrB, const int* csrSortedColIndB, const cusparseMatDescr_t descrC, float* csrSortedValC, const int* csrSortedRowPtrC, int* csrSortedColIndC); + // HIP: DEPRECATED_CUDA_10000("The routine will be removed in CUDA 11") HIPSPARSE_EXPORT hipsparseStatus_t hipsparseScsrgemm(hipsparseHandle_t handle, hipsparseOperation_t transA, hipsparseOperation_t transB, int m, int n, int k, const hipsparseMatDescr_t descrA, int nnzA, const float* csrValA, const int* csrRowPtrA, const int* csrColIndA, const hipsparseMatDescr_t descrB, int nnzB, const float* csrValB, const int* csrRowPtrB, const int* csrColIndB, const hipsparseMatDescr_t descrC, float* csrValC, const int* csrRowPtrC, int* csrColIndC); + // CHECK: status_t = hipsparseScsrgemm(handle_t, opA, opB, m, n, k, matDescr_A, nnza, &fA, &csrRowPtrA, &csrColIndA, matDescr_B, nnzb, &fB, &csrRowPtrB, &csrColIndB, matDescr_C, &fC, &csrRowPtrC, &csrColIndD); + status_t = cusparseScsrgemm(handle_t, opA, opB, m, n, k, matDescr_A, nnza, &fA, &csrRowPtrA, &csrColIndA, matDescr_B, nnzb, &fB, &csrRowPtrB, &csrColIndB, matDescr_C, &fC, &csrRowPtrC, &csrColIndD); + + // CUDA: CUSPARSE_DEPRECATED_HINT(cusparseXcsrgemm2) cusparseStatus_t CUSPARSEAPI cusparseXcsrgemmNnz(cusparseHandle_t handle, cusparseOperation_t transA, cusparseOperation_t transB, int m, int n, int k, const cusparseMatDescr_t descrA, const int nnzA, const int* csrSortedRowPtrA, const int* csrSortedColIndA, const cusparseMatDescr_t descrB, const int nnzB, const int* csrSortedRowPtrB, const int* csrSortedColIndB, const cusparseMatDescr_t descrC, int* csrSortedRowPtrC, int* nnzTotalDevHostPtr); + // HIP: DEPRECATED_CUDA_10000("The routine will be removed in CUDA 11") HIPSPARSE_EXPORT hipsparseStatus_t hipsparseXcsrgemmNnz(hipsparseHandle_t handle, 
hipsparseOperation_t transA, hipsparseOperation_t transB, int m, int n, int k, const hipsparseMatDescr_t descrA, int nnzA, const int* csrRowPtrA, const int* csrColIndA, const hipsparseMatDescr_t descrB, int nnzB, const int* csrRowPtrB, const int* csrColIndB, const hipsparseMatDescr_t descrC, int* csrRowPtrC, int* nnzTotalDevHostPtr); + // CHECK: status_t = hipsparseXcsrgemmNnz(handle_t, opA, opB, m, n, k, matDescr_A, nnza, &csrRowPtrA, &csrColIndA, matDescr_B, nnzb, &csrRowPtrB, &csrColIndB, matDescr_C, &csrRowPtrC, &nnzTotalDevHostPtr); + status_t = cusparseXcsrgemmNnz(handle_t, opA, opB, m, n, k, matDescr_A, nnza, &csrRowPtrA, &csrColIndA, matDescr_B, nnzb, &csrRowPtrB, &csrColIndB, matDescr_C, &csrRowPtrC, &nnzTotalDevHostPtr); +#endif + #if CUDA_VERSION < 12000 - // TODO: Mark as C-Changed in 12.0.0 // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSpGEMMreuse_workEstimation(cusparseHandle_t handle, cusparseOperation_t opA, cusparseOperation_t opB, cusparseSpMatDescr_t matA, cusparseSpMatDescr_t matB, cusparseSpMatDescr_t matC, cusparseSpGEMMAlg_t alg, cusparseSpGEMMDescr_t spgemmDescr, size_t* bufferSize1, void* externalBuffer1); // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseSpGEMMreuse_workEstimation(hipsparseHandle_t handle, hipsparseOperation_t opA, hipsparseOperation_t opB, hipsparseSpMatDescr_t matA, hipsparseSpMatDescr_t matB, hipsparseSpMatDescr_t matC, hipsparseSpGEMMAlg_t alg, hipsparseSpGEMMDescr_t spgemmDescr, size_t* bufferSize1, void* externalBuffer1); // CHECK: status_t = hipsparseSpGEMMreuse_workEstimation(handle_t, opA, opB, spmatA, spmatB, spmatC, spGEMMAlg_t, spGEMMDescr, &bufferSize, tempBuffer); status_t = cusparseSpGEMMreuse_workEstimation(handle_t, opA, opB, spmatA, spmatB, spmatC, spGEMMAlg_t, spGEMMDescr, &bufferSize, tempBuffer); - // TODO: Mark as C-Changed in 12.0.0 // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSpGEMMreuse_nnz(cusparseHandle_t handle, cusparseOperation_t opA, cusparseOperation_t opB,
cusparseSpMatDescr_t matA, cusparseSpMatDescr_t matB, cusparseSpMatDescr_t matC, cusparseSpGEMMAlg_t alg, cusparseSpGEMMDescr_t spgemmDescr, size_t* bufferSize2, void* externalBuffer2, size_t* bufferSize3, void* externalBuffer3, size_t* bufferSize4, void* externalBuffer4); // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseSpGEMMreuse_nnz(hipsparseHandle_t handle, hipsparseOperation_t opA, hipsparseOperation_t opB, hipsparseSpMatDescr_t matA, hipsparseSpMatDescr_t matB, hipsparseSpMatDescr_t matC, hipsparseSpGEMMAlg_t alg, hipsparseSpGEMMDescr_t spgemmDescr, size_t* bufferSize2, void* externalBuffer2, size_t* bufferSize3, void* externalBuffer3, size_t* bufferSize4, void* externalBuffer4); // CHECK: status_t = hipsparseSpGEMMreuse_nnz(handle_t, opA, opB, spmatA, spmatB, spmatC, spGEMMAlg_t, spGEMMDescr, &bufferSize2, tempBuffer2, &bufferSize3, tempBuffer3, &bufferSize4, tempBuffer4); status_t = cusparseSpGEMMreuse_nnz(handle_t, opA, opB, spmatA, spmatB, spmatC, spGEMMAlg_t, spGEMMDescr, &bufferSize2, tempBuffer2, &bufferSize3, tempBuffer3, &bufferSize4, tempBuffer4); - // TODO: Mark as C-Changed in 12.0.0 // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSpGEMMreuse_compute(cusparseHandle_t handle, cusparseOperation_t opA, cusparseOperation_t opB, const void* alpha, cusparseSpMatDescr_t matA, cusparseSpMatDescr_t matB, const void* beta, cusparseSpMatDescr_t matC, cudaDataType computeType, cusparseSpGEMMAlg_t alg, cusparseSpGEMMDescr_t spgemmDescr); // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseSpGEMMreuse_compute(hipsparseHandle_t handle, hipsparseOperation_t opA, hipsparseOperation_t opB, const void* alpha, hipsparseSpMatDescr_t matA, hipsparseSpMatDescr_t matB, const void* beta, hipsparseSpMatDescr_t matC, hipDataType computeType, hipsparseSpGEMMAlg_t alg, hipsparseSpGEMMDescr_t spgemmDescr); // CHECK: status_t = hipsparseSpGEMMreuse_compute(handle_t, opA, opB, alpha, spmatA, spmatB, beta, spmatC, dataType, spGEMMAlg_t, spGEMMDescr); status_t = 
cusparseSpGEMMreuse_compute(handle_t, opA, opB, alpha, spmatA, spmatB, beta, spmatC, dataType, spGEMMAlg_t, spGEMMDescr); - // TODO: Mark as C-Changed in 12.0.0 // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSpGEMMreuse_copy(cusparseHandle_t handle, cusparseOperation_t opA, cusparseOperation_t opB, cusparseSpMatDescr_t matA, cusparseSpMatDescr_t matB, cusparseSpMatDescr_t matC, cusparseSpGEMMAlg_t alg, cusparseSpGEMMDescr_t spgemmDescr, size_t* bufferSize5, void* externalBuffer5); // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseSpGEMMreuse_copy(hipsparseHandle_t handle, hipsparseOperation_t opA, hipsparseOperation_t opB, hipsparseSpMatDescr_t matA, hipsparseSpMatDescr_t matB, hipsparseSpMatDescr_t matC, hipsparseSpGEMMAlg_t alg, hipsparseSpGEMMDescr_t spgemmDescr, size_t* bufferSize5, void* externalBuffer5); // CHECK: status_t = hipsparseSpGEMMreuse_copy(handle_t, opA, opB, spmatA, spmatB, spmatC, spGEMMAlg_t, spGEMMDescr, &bufferSize5, tempBuffer5); status_t = cusparseSpGEMMreuse_copy(handle_t, opA, opB, spmatA, spmatB, spmatC, spGEMMAlg_t, spGEMMDescr, &bufferSize5, tempBuffer5); - // TODO: Mark as C-Changed in 12.0.0 // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSpSM_bufferSize(cusparseHandle_t handle, cusparseOperation_t opA, cusparseOperation_t opB, const void* alpha, cusparseSpMatDescr_t matA, cusparseDnMatDescr_t matB, cusparseDnMatDescr_t matC, cudaDataType computeType, cusparseSpSMAlg_t alg, cusparseSpSMDescr_t spsmDescr, size_t* bufferSize); // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseSpSM_bufferSize(hipsparseHandle_t handle, hipsparseOperation_t opA, hipsparseOperation_t opB, const void* alpha, const hipsparseSpMatDescr_t matA, const hipsparseDnMatDescr_t matB, const hipsparseDnMatDescr_t matC, hipDataType computeType, hipsparseSpSMAlg_t alg, hipsparseSpSMDescr_t spsmDescr, size_t* bufferSize); // CHECK: status_t = hipsparseSpSM_bufferSize(handle_t, opA, opB, alpha, spmatA, dnmatB, dnmatC, dataType, spSMAlg_t, spSMDescr, &bufferSize); @@ 
-2775,6 +2929,13 @@ int main() { #endif #endif +#if CUDA_VERSION >= 11070 + // CUDA: cusparseStatus_t CUSPARSEAPI cusparseCscGet(cusparseSpMatDescr_t spMatDescr, int64_t* rows, int64_t* cols, int64_t* nnz, void** cscColOffsets, void** cscRowInd, void** cscValues, cusparseIndexType_t* cscColOffsetsType, cusparseIndexType_t* cscRowIndType, cusparseIndexBase_t* idxBase, cudaDataType* valueType); + // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseCscGet(const hipsparseSpMatDescr_t spMatDescr, int64_t* rows, int64_t* cols, int64_t* nnz, void** cscColOffsets, void** cscRowInd, void** cscValues, hipsparseIndexType_t* cscColOffsetsType, hipsparseIndexType_t* cscRowIndType, hipsparseIndexBase_t* idxBase, hipDataType* valueType); + // CHECK: status_t = hipsparseCscGet(spmatA, &rows, &cols, &nnz, &cscColOffsets, &cscRowInd, &cscValues, &cscColOffsetsType, &cscRowIndType, &indexBase_t, &dataType); + status_t = cusparseCscGet(spmatA, &rows, &cols, &nnz, &cscColOffsets, &cscRowInd, &cscValues, &cscColOffsetsType, &cscRowIndType, &indexBase_t, &dataType); +#endif + #if CUDA_VERSION < 12000 // CUDA: CUSPARSE_DEPRECATED(cusparseSparseToDense) cusparseStatus_t CUSPARSEAPI cusparseZcsc2dense(cusparseHandle_t handle, int m, int n, const cusparseMatDescr_t descrA, const cuDoubleComplex* cscSortedValA, const int* cscSortedRowIndA, const int* cscSortedColPtrA, cuDoubleComplex* A, int lda); // HIP: DEPRECATED_CUDA_11000("The routine will be removed in CUDA 12") HIPSPARSE_EXPORT hipsparseStatus_t hipsparseZcsc2dense(hipsparseHandle_t handle, int m, int n, const hipsparseMatDescr_t descr, const hipDoubleComplex* csc_val, const int* csc_row_ind, const int* csc_col_ptr, hipDoubleComplex* A, int ld); @@ -3353,6 +3514,11 @@ int main() { // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseConstDnVecGetValues(hipsparseConstDnVecDescr_t dnVecDescr, const void** values); // CHECK: status_t = hipsparseConstDnVecGetValues(constDnVecDescr, values_const); status_t = 
cusparseConstDnVecGetValues(constDnVecDescr, values_const); + + // CUDA: cusparseStatus_t CUSPARSEAPI cusparseConstCscGet(cusparseConstSpMatDescr_t spMatDescr, int64_t* rows, int64_t* cols, int64_t* nnz, const void** cscColOffsets, const void** cscRowInd, const void** cscValues, cusparseIndexType_t* cscColOffsetsType, cusparseIndexType_t* cscRowIndType, cusparseIndexBase_t* idxBase, cudaDataType* valueType); + // HIP: HIPSPARSE_EXPORT hipsparseStatus_t hipsparseConstCscGet(hipsparseConstSpMatDescr_t spMatDescr, int64_t* rows, int64_t* cols, int64_t* nnz, const void** cscColOffsets, const void** cscRowInd, const void** cscValues, hipsparseIndexType_t* cscColOffsetsType, hipsparseIndexType_t* cscRowIndType, hipsparseIndexBase_t* idxBase, hipDataType* valueType); + // CHECK: status_t = hipsparseConstCscGet(constSpMatDescr, &rows, &cols, &nnz, cscColOffsets_const, cscRowInd_const, cscValues_const, &cscColOffsetsType, &cscRowIndType, &indexBase_t, &dataType); + status_t = cusparseConstCscGet(constSpMatDescr, &rows, &cols, &nnz, cscColOffsets_const, cscRowInd_const, cscValues_const, &cscColOffsetsType, &cscRowIndType, &indexBase_t, &dataType); #endif return 0; diff --git a/tests/unit_tests/synthetic/libraries/cusparse2rocsparse.cu b/tests/unit_tests/synthetic/libraries/cusparse2rocsparse.cu index 7b33ef39..32942db3 100644 --- a/tests/unit_tests/synthetic/libraries/cusparse2rocsparse.cu +++ b/tests/unit_tests/synthetic/libraries/cusparse2rocsparse.cu @@ -1656,11 +1656,11 @@ int main() { status_t = cusparseDestroyPruneInfo(prune_info); #endif -#if (CUDA_VERSION >= 10010 && CUDA_VERSION < 11000 && !defined(_WIN32)) || CUDA_VERSION >= 11000 +#if (CUDA_VERSION >= 10010 && CUSPARSE_VERSION >= 10200 && CUDA_VERSION < 11000 && !defined(_WIN32)) || CUDA_VERSION >= 11000 // CHECK: _rocsparse_spmat_descr *spMatDescr = nullptr; - // CHECK-NEXT: rocsparse_spmat_descr spMatDescr_t, matC; + // CHECK-NEXT: rocsparse_spmat_descr spMatDescr_t, matC, spmatA, spmatB, spmatC; 
cusparseSpMatDescr *spMatDescr = nullptr; - cusparseSpMatDescr_t spMatDescr_t, matC; + cusparseSpMatDescr_t spMatDescr_t, matC, spmatA, spmatB, spmatC; // CHECK: _rocsparse_dnmat_descr *dnMatDescr = nullptr; // CHECK-NEXT: rocsparse_dnmat_descr dnMatDescr_t, matA, matB; @@ -1731,35 +1731,6 @@ int main() { // ROC: ROCSPARSE_EXPORT rocsparse_status rocsparse_dnmat_get(const rocsparse_dnmat_descr descr, int64_t* rows, int64_t* cols, int64_t* ld, void** values, rocsparse_datatype* data_type, rocsparse_order* order); // CHECK: status_t = rocsparse_dnmat_get(dnMatDescr_t, &rows, &cols, &ld, &values, &dataType, &order_t); status_t = cusparseDnMatGet(dnMatDescr_t, &rows, &cols, &ld, &values, &dataType, &order_t); - -#if CUDA_VERSION < 12000 - // CUDA: cusparseStatus_t CUSPARSEAPI cusparseDnMatGetStridedBatch(cusparseConstDnMatDescr_t dnMatDescr, int* batchCount, int64_t* batchStride); - // ROC: ROCSPARSE_EXPORT rocsparse_status rocsparse_dnmat_get_strided_batch(rocsparse_dnmat_descr descr, int* batch_count, int64_t* batch_stride); - // CHECK: status_t = rocsparse_dnmat_get_strided_batch(dnMatDescr_t, &batchCount, &batchStride); - status_t = cusparseDnMatGetStridedBatch(dnMatDescr_t, &batchCount, &batchStride); -#endif -#endif - -#if CUDA_VERSION < 12000 - // CUDA: cusparseStatus_t CUSPARSEAPI cusparseDestroySpMat(cusparseSpMatDescr_t spMatDescr); - // ROC: ROCSPARSE_EXPORT rocsparse_status rocsparse_destroy_spmat_descr(rocsparse_spmat_descr descr); - // CHECK: status_t = rocsparse_destroy_spmat_descr(spMatDescr_t); - status_t = cusparseDestroySpMat(spMatDescr_t); - - // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSpMatGetFormat(cusparseConstSpMatDescr_t spMatDescr, cusparseFormat_t* format); - // ROC: ROCSPARSE_EXPORT rocsparse_status rocsparse_spmat_get_format(const rocsparse_spmat_descr descr, rocsparse_format* format); - // CHECK: status_t = rocsparse_spmat_get_format(spMatDescr_t, &format_t); - status_t = cusparseSpMatGetFormat(spMatDescr_t, &format_t); - - // CUDA: 
cusparseStatus_t CUSPARSEAPI cusparseSpMatGetIndexBase(cusparseConstSpMatDescr_t spMatDescr, cusparseIndexBase_t* idxBase); - // ROC: ROCSPARSE_EXPORT rocsparse_status rocsparse_spmat_get_index_base(const rocsparse_spmat_descr descr, rocsparse_index_base* idx_base); - // CHECK: status_t = rocsparse_spmat_get_index_base(spMatDescr_t, &indexBase_t); - status_t = cusparseSpMatGetIndexBase(spMatDescr_t, &indexBase_t); - - // CUDA: cusparseStatus_t CUSPARSEAPI cusparseDestroyDnMat(cusparseConstDnMatDescr_t dnMatDescr); - // ROC: ROCSPARSE_EXPORT rocsparse_status rocsparse_destroy_dnmat_descr(rocsparse_dnmat_descr descr); - // CHECK: status_t = rocsparse_destroy_dnmat_descr(dnMatDescr_t); - status_t = cusparseDestroyDnMat(dnMatDescr_t); #endif #endif @@ -1768,7 +1739,7 @@ int main() { cusparseStatus_t STATUS_NOT_SUPPORTED = CUSPARSE_STATUS_NOT_SUPPORTED; #endif -#if (CUDA_VERSION >= 10020 && CUDA_VERSION < 11000 && !defined(_WIN32)) || CUDA_VERSION >= 11000 +#if (CUDA_VERSION >= 10020 && CUSPARSE_VERSION >= 10200 && CUDA_VERSION < 11000 && !defined(_WIN32)) || CUDA_VERSION >= 11000 // CHECK: _rocsparse_spvec_descr *spVecDescr = nullptr; // CHECK-NEXT: rocsparse_spvec_descr spVecDescr_t; cusparseSpVecDescr *spVecDescr = nullptr; @@ -1852,11 +1823,6 @@ int main() { // CHECK: status_t = rocsparse_dnmat_set_values(dnMatDescr_t, values); status_t = cusparseDnMatSetValues(dnMatDescr_t, values); - // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSpMV(cusparseHandle_t handle, cusparseOperation_t opA, const void* alpha, cusparseConstSpMatDescr_t matA, cusparseConstDnVecDescr_t vecX, const void* beta, cusparseDnVecDescr_t vecY, cudaDataType computeType, cusparseSpMVAlg_t alg, void* externalBuffer); - // ROC: ROCSPARSE_EXPORT rocsparse_status rocsparse_spmv(rocsparse_handle handle, rocsparse_operation trans, const void* alpha, const rocsparse_spmat_descr mat, const rocsparse_dnvec_descr x, const void* beta, const rocsparse_dnvec_descr y, rocsparse_datatype compute_type, 
rocsparse_spmv_alg alg, size_t* buffer_size, void* temp_buffer); - // CHECK: status_t = rocsparse_spmv(handle_t, opA, alpha, spMatDescr_t, vecX, beta, vecY, dataType, spMVAlg_t, tempBuffer); - status_t = cusparseSpMV(handle_t, opA, alpha, spMatDescr_t, vecX, beta, vecY, dataType, spMVAlg_t, tempBuffer); - #if CUDA_VERSION < 12000 // CHECK: rocsparse_format FORMAT_COO_AOS = rocsparse_format_coo_aos; cusparseFormat_t FORMAT_COO_AOS = CUSPARSE_FORMAT_COO_AOS; @@ -1876,25 +1842,10 @@ int main() { // CHECK: status_t = rocsparse_spmat_set_strided_batch(spMatDescr_t, batchCount); status_t = cusparseSpMatSetStridedBatch(spMatDescr_t, batchCount); - // CUDA: cusparseStatus_t CUSPARSEAPI cusparseDestroySpVec(cusparseSpVecDescr_t spVecDescr); - // ROC: ROCSPARSE_EXPORT rocsparse_status rocsparse_destroy_spvec_descr(rocsparse_spvec_descr descr); - // CHECK: status_t = rocsparse_destroy_spvec_descr(spVecDescr_t); - status_t = cusparseDestroySpVec(spVecDescr_t); - // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSpVecGetIndexBase(cusparseConstSpVecDescr_t spVecDescr, cusparseIndexBase_t* idxBase); // ROC: ROCSPARSE_EXPORT rocsparse_status rocsparse_spvec_get_index_base(const rocsparse_spvec_descr descr, rocsparse_index_base* idx_base); // CHECK: status_t = rocsparse_spvec_get_index_base(spVecDescr_t, &indexBase_t); status_t = cusparseSpVecGetIndexBase(spVecDescr_t, &indexBase_t); - - // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSpMatGetStridedBatch(cusparseConstSpMatDescr_t spMatDescr, int* batchCount); - // ROC: ROCSPARSE_EXPORT rocsparse_status rocsparse_spmat_get_strided_batch(rocsparse_spmat_descr descr, int* batch_count); - // CHECK: status_t = rocsparse_spmat_get_strided_batch(spMatDescr_t, &batchCount); - status_t = cusparseSpMatGetStridedBatch(spMatDescr_t, &batchCount); - - // CUDA: cusparseStatus_t CUSPARSEAPI cusparseDestroyDnVec(cusparseConstDnVecDescr_t dnVecDescr); - // ROC: ROCSPARSE_EXPORT rocsparse_status rocsparse_destroy_dnvec_descr(rocsparse_dnvec_descr descr); 
- // CHECK: status_t = rocsparse_destroy_dnvec_descr(dnVecDescr_t); - status_t = cusparseDestroyDnVec(dnVecDescr_t); #endif #endif @@ -2061,13 +2012,6 @@ int main() { // ROC: ROCSPARSE_EXPORT rocsparse_status rocsparse_csr_set_pointers(rocsparse_spmat_descr descr, void* csr_row_ptr, void* csr_col_ind, void* csr_val); // CHECK: status_t = rocsparse_csr_set_pointers(spMatDescr_t, csrRowOffsets, csrColInd, csrValues); status_t = cusparseCsrSetPointers(spMatDescr_t, csrRowOffsets, csrColInd, csrValues); - -#if CUDA_VERSION < 12000 - // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSpMatGetSize(cusparseConstSpMatDescr_t spMatDescr, int64_t* rows, int64_t* cols, int64_t* nnz); - // ROC: ROCSPARSE_EXPORT rocsparse_status rocsparse_spmat_get_size(rocsparse_spmat_descr descr, int64_t* rows, int64_t* cols, int64_t* nnz); - // CHECK: status_t = rocsparse_spmat_get_size(spMatDescr_t, &rows, &cols, &nnz); - status_t = cusparseSpMatGetSize(spMatDescr_t, &rows, &cols, &nnz); -#endif #endif #if CUDA_VERSION >= 11000 && CUSPARSE_VERSION >= 11100 @@ -2098,21 +2042,6 @@ int main() { // ROC: ROCSPARSE_EXPORT rocsparse_status rocsparse_rot(rocsparse_handle handle, const void* c, const void* s, rocsparse_spvec_descr x, rocsparse_dnvec_descr y); // CHECK: status_t = rocsparse_rot(handle_t, c_coeff, s_coeff, spVecDescr_t, vecY); status_t = cusparseRot(handle_t, c_coeff, s_coeff, spVecDescr_t, vecY); - - // CUDA: cusparseStatus_t CUSPARSEAPI cusparseScatter(cusparseHandle_t handle, cusparseConstSpVecDescr_t vecX, cusparseDnVecDescr_t vecY); - // ROC: ROCSPARSE_EXPORT rocsparse_status rocsparse_scatter(rocsparse_handle handle, const rocsparse_spvec_descr x, rocsparse_dnvec_descr y); - // CHECK: status_t = rocsparse_scatter(handle_t, spVecDescr_t, vecY); - status_t = cusparseScatter(handle_t, spVecDescr_t, vecY); - - // CUDA: cusparseStatus_t CUSPARSEAPI cusparseGather(cusparseHandle_t handle, cusparseConstDnVecDescr_t vecY, cusparseSpVecDescr_t vecX); - // ROC: ROCSPARSE_EXPORT 
rocsparse_status rocsparse_gather(rocsparse_handle handle, const rocsparse_dnvec_descr y, rocsparse_spvec_descr x); - // CHECK: status_t = rocsparse_gather(handle_t, vecY, spVecDescr_t); - status_t = cusparseGather(handle_t, vecY, spVecDescr_t); - - // CUDA: cusparseStatus_t CUSPARSEAPI cusparseAxpby(cusparseHandle_t handle, const void* alpha, cusparseConstSpVecDescr_t vecX, const void* beta, cusparseDnVecDescr_t vecY); - // ROC: ROCSPARSE_EXPORT rocsparse_status rocsparse_axpby(rocsparse_handle handle, const void* alpha, const rocsparse_spvec_descr x, const void* beta, rocsparse_dnvec_descr y); - // CHECK: status_t = rocsparse_axpby(handle_t, alpha, spVecDescr_t, beta, vecY); - status_t = cusparseAxpby(handle_t, alpha, spVecDescr_t, beta, vecY); #endif #if CUDA_VERSION >= 11010 && CUSPARSE_VERSION >= 11300 @@ -2176,21 +2105,6 @@ int main() { // ROC: ROCSPARSE_EXPORT rocsparse_status rocsparse_bell_get(const rocsparse_spmat_descr descr, int64_t* rows, int64_t* cols, rocsparse_direction* ell_block_dir, int64_t* ell_block_dim, int64_t* ell_cols, void** ell_col_ind, void** ell_val, rocsparse_indextype* idx_type, rocsparse_index_base* idx_base, rocsparse_datatype* data_type); // CHECK: status_t = rocsparse_bell_get(spMatDescr_t, &rows, &cols, &ellBlockSize, &ellCols, &ellColInd, &ellValue, &ellIdxType, &indexBase_t, &dataType); status_t = cusparseBlockedEllGet(spMatDescr_t, &rows, &cols, &ellBlockSize, &ellCols, &ellColInd, &ellValue, &ellIdxType, &indexBase_t, &dataType); - - // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSDDMM_preprocess(cusparseHandle_t handle, cusparseOperation_t opA, cusparseOperation_t opB, const void* alpha, cusparseConstDnMatDescr_t matA, cusparseConstDnMatDescr_t matB, const void* beta, cusparseSpMatDescr_t matC, cudaDataType computeType, cusparseSDDMMAlg_t alg, void* externalBuffer); - // ROC: ROCSPARSE_EXPORT rocsparse_status rocsparse_sddmm_preprocess(rocsparse_handle handle, rocsparse_operation opA, rocsparse_operation opB, const void* 
alpha, const rocsparse_dnmat_descr A, const rocsparse_dnmat_descr B, const void* beta, rocsparse_spmat_descr C, rocsparse_datatype compute_type, rocsparse_sddmm_alg alg, void* temp_buffer); - // CHECK: status_t = rocsparse_sddmm_preprocess(handle_t, opA, opB, alpha, matA, matB, beta, matC, dataType, sDDMMAlg_t, tempBuffer); - status_t = cusparseSDDMM_preprocess(handle_t, opA, opB, alpha, matA, matB, beta, matC, dataType, sDDMMAlg_t, tempBuffer); - - // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSDDMM_bufferSize(cusparseHandle_t handle, cusparseOperation_t opA, cusparseOperation_t opB, const void* alpha, cusparseConstDnMatDescr_t matA, cusparseConstDnMatDescr_t matB, const void* beta, cusparseSpMatDescr_t matC, cudaDataType computeType, cusparseSDDMMAlg_t alg, size_t* bufferSize); - // ROC: ROCSPARSE_EXPORT rocsparse_status rocsparse_sddmm_buffer_size(rocsparse_handle handle, rocsparse_operation opA, rocsparse_operation opB, const void* alpha, const rocsparse_dnmat_descr A, const rocsparse_dnmat_descr B, const void* beta, rocsparse_spmat_descr C, rocsparse_datatype compute_type, rocsparse_sddmm_alg alg, size_t* buffer_size); - // CHECK: status_t = rocsparse_sddmm_buffer_size(handle_t, opA, opB, alpha, matA, matB, beta, matC, dataType, sDDMMAlg_t, &bufferSize); - status_t = cusparseSDDMM_bufferSize(handle_t, opA, opB, alpha, matA, matB, beta, matC, dataType, sDDMMAlg_t, &bufferSize); - - // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSDDMM(cusparseHandle_t handle, cusparseOperation_t opA, cusparseOperation_t opB, const void* alpha, cusparseConstDnMatDescr_t matA, cusparseConstDnMatDescr_t matB, const void* beta, cusparseSpMatDescr_t matC, cudaDataType computeType, cusparseSDDMMAlg_t alg, void* externalBuffer); - // ROC: ROCSPARSE_EXPORT rocsparse_status rocsparse_sddmm(rocsparse_handle handle, rocsparse_operation opA, rocsparse_operation opB, const void* alpha, const rocsparse_dnmat_descr A, const rocsparse_dnmat_descr B, const void* beta, rocsparse_spmat_descr C, 
rocsparse_datatype compute_type, rocsparse_sddmm_alg alg, void* temp_buffer); - // CHECK: status_t = rocsparse_sddmm(handle_t, opA, opB, alpha, matA, matB, beta, matC, dataType, sDDMMAlg_t, tempBuffer); - status_t = cusparseSDDMM(handle_t, opA, opB, alpha, matA, matB, beta, matC, dataType, sDDMMAlg_t, tempBuffer); #endif #if CUDA_VERSION >= 11030 @@ -2210,13 +2124,6 @@ int main() { // ROC: ROCSPARSE_EXPORT rocsparse_status rocsparse_spmat_set_attribute(rocsparse_spmat_descr descr, rocsparse_spmat_attribute attribute, const void* data, size_t data_size); // CHECK: status_t = rocsparse_spmat_set_attribute(spMatDescr_t, spMatAttribute_t, &data, dataSize); status_t = cusparseSpMatSetAttribute(spMatDescr_t, spMatAttribute_t, &data, dataSize); - -#if CUDA_VERSION < 12000 - // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSpMatGetAttribute(cusparseConstSpMatDescr_t spMatDescr, cusparseSpMatAttribute_t attribute, void* data, size_t dataSize); - // ROC: ROCSPARSE_EXPORT rocsparse_status rocsparse_spmat_get_attribute(rocsparse_spmat_descr descr, rocsparse_spmat_attribute attribute, void* data, size_t data_size); - // CHECK: status_t = rocsparse_spmat_get_attribute(spMatDescr_t, spMatAttribute_t, &data, dataSize); - status_t = cusparseSpMatGetAttribute(spMatDescr_t, spMatAttribute_t, &data, dataSize); -#endif #endif #if CUDA_VERSION >= 11030 && CUSPARSE_VERSION >= 11600 @@ -2226,6 +2133,13 @@ int main() { cusparseSpSMAlg_t SPSM_ALG_DEFAULT = CUSPARSE_SPSM_ALG_DEFAULT; #endif +#if CUDA_VERSION >= 11070 + // CUDA: cusparseStatus_t CUSPARSEAPI cusparseCscGet(cusparseSpMatDescr_t spMatDescr, int64_t* rows, int64_t* cols, int64_t* nnz, void** cscColOffsets, void** cscRowInd, void** cscValues, cusparseIndexType_t* cscColOffsetsType, cusparseIndexType_t* cscRowIndType, cusparseIndexBase_t* idxBase, cudaDataType* valueType); + // ROC: ROCSPARSE_EXPORT rocsparse_status rocsparse_csc_get(const rocsparse_spmat_descr descr, int64_t* rows, int64_t* cols, int64_t* nnz, void** csc_col_ptr, 
void** csc_row_ind, void** csc_val, rocsparse_indextype* col_ptr_type, rocsparse_indextype* row_ind_type, rocsparse_index_base* idx_base, rocsparse_datatype* data_type); + // CHECK: status_t = rocsparse_csc_get(spmatA, &rows, &cols, &nnz, &cscColOffsets, &cscRowInd, &cscValues, &cscColOffsetsType, &cscRowIndType, &indexBase_t, &dataType); + status_t = cusparseCscGet(spmatA, &rows, &cols, &nnz, &cscColOffsets, &cscRowInd, &cscValues, &cscColOffsetsType, &cscRowIndType, &indexBase_t, &dataType); +#endif + #if CUDA_VERSION < 12000 // CHECK: rocsparse_mat_info csrgemm2_info; csrgemm2Info_t csrgemm2_info; @@ -2634,6 +2548,21 @@ int main() { // ROC: ROCSPARSE_EXPORT rocsparse_status rocsparse_dnmat_get_strided_batch(rocsparse_const_dnmat_descr descr, int* batch_count, int64_t* batch_stride); // CHECK: status_t = rocsparse_dnmat_get_strided_batch(constDnMatDescr, &batchCount, &batchStride); status_t = cusparseDnMatGetStridedBatch(constDnMatDescr, &batchCount, &batchStride); + + // CUDA: cusparseStatus_t CUSPARSEAPI cusparseScatter(cusparseHandle_t handle, cusparseConstSpVecDescr_t vecX, cusparseDnVecDescr_t vecY); + // ROC: ROCSPARSE_EXPORT rocsparse_status rocsparse_scatter(rocsparse_handle handle, rocsparse_const_spvec_descr x, rocsparse_dnvec_descr y); + // CHECK: status_t = rocsparse_scatter(handle_t, constSpVecDescr, vecY); + status_t = cusparseScatter(handle_t, constSpVecDescr, vecY); + + // CUDA: cusparseStatus_t CUSPARSEAPI cusparseGather(cusparseHandle_t handle, cusparseConstDnVecDescr_t vecY, cusparseSpVecDescr_t vecX); + // ROC: ROCSPARSE_EXPORT rocsparse_status rocsparse_gather(rocsparse_handle handle, rocsparse_const_dnvec_descr y, rocsparse_spvec_descr x); + // CHECK: status_t = rocsparse_gather(handle_t, constDnVecDescr, spVecDescr_t); + status_t = cusparseGather(handle_t, constDnVecDescr, spVecDescr_t); + + // CUDA: cusparseStatus_t CUSPARSEAPI cusparseAxpby(cusparseHandle_t handle, const void* alpha, cusparseConstSpVecDescr_t vecX, const void* beta, 
cusparseDnVecDescr_t vecY); + // ROC: ROCSPARSE_EXPORT rocsparse_status rocsparse_axpby(rocsparse_handle handle, const void* alpha, rocsparse_const_spvec_descr x, const void* beta, rocsparse_dnvec_descr y); + // CHECK: status_t = rocsparse_axpby(handle_t, alpha, constSpVecDescr, beta, vecY); + status_t = cusparseAxpby(handle_t, alpha, constSpVecDescr, beta, vecY); #endif #if CUDA_VERSION >= 12010 && CUSPARSE_VERSION >= 12100 diff --git a/tests/unit_tests/synthetic/libraries/cusparse2rocsparse_10010_12000.cu b/tests/unit_tests/synthetic/libraries/cusparse2rocsparse_10010_12000.cu index e91120b5..361095ca 100644 --- a/tests/unit_tests/synthetic/libraries/cusparse2rocsparse_10010_12000.cu +++ b/tests/unit_tests/synthetic/libraries/cusparse2rocsparse_10010_12000.cu @@ -47,6 +47,8 @@ int main() { void *pcscVal = nullptr; void *alpha = nullptr; void *beta = nullptr; + void *tempBuffer = nullptr; + void* result = nullptr; // CHECK: rocsparse_operation opA, opB, opX; cusparseOperation_t opA, opB, opX; @@ -57,7 +59,7 @@ int main() { cudaDataType dataType; #endif -#if CUDA_VERSION >= 10010 +#if CUDA_VERSION >= 10010 && CUSPARSE_VERSION >= 10200 // TODO: cusparseCsr2CscAlg_t has no analogue in rocSPARSE. 
The deletion of declaration and usage is needed to be implemented cusparseCsr2CscAlg_t Csr2CscAlg_t; @@ -71,12 +73,15 @@ int main() { // CHECK: rocsparse_spmm_alg spMMAlg_t; cusparseSpMMAlg_t spMMAlg_t; -#if CUDA_VERSION < 12000 - // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSpMM_bufferSize(cusparseHandle_t handle, cusparseOperation_t opA, cusparseOperation_t opB, const void* alpha, const cusparseSpMatDescr_t matA, const cusparseDnMatDescr_t matB, const void* beta, cusparseDnMatDescr_t matC, cudaDataType computeType, cusparseSpMMAlg_t alg, size_t* bufferSize); - // ROC: ROCSPARSE_EXPORT rocsparse_status rocsparse_spmm(rocsparse_handle handle, rocsparse_operation trans_A, rocsparse_operation trans_B, const void* alpha, const rocsparse_spmat_descr mat_A, const rocsparse_dnmat_descr mat_B, const void* beta, const rocsparse_dnmat_descr mat_C, rocsparse_datatype compute_type, rocsparse_spmm_alg alg, rocsparse_spmm_stage stage, size_t* buffer_size, void* temp_buffer); - // CHECK: status_t = rocsparse_spmm(handle_t, opA, opB, alpha, spmatA, dnmatB, beta, dnmatC, dataType, spMMAlg_t, rocsparse_spmm_stage_compute, &bufferSize, nullptr); - status_t = cusparseSpMM_bufferSize(handle_t, opA, opB, alpha, spmatA, dnmatB, beta, dnmatC, dataType, spMMAlg_t, &bufferSize); -#endif + // CHECK: _rocsparse_spvec_descr *spVecDescr = nullptr; + // CHECK-NEXT: rocsparse_spvec_descr spVecDescr_t; + cusparseSpVecDescr *spVecDescr = nullptr; + cusparseSpVecDescr_t spVecDescr_t; + + // CHECK: _rocsparse_dnvec_descr *dnVecDescr = nullptr; + // CHECK-NEXT: rocsparse_dnvec_descr dnVecDescr_t, vecX, vecY; + cusparseDnVecDescr *dnVecDescr = nullptr; + cusparseDnVecDescr_t dnVecDescr_t, vecX, vecY; #endif #endif diff --git a/tests/unit_tests/synthetic/libraries/cusparse2rocsparse_12000.cu b/tests/unit_tests/synthetic/libraries/cusparse2rocsparse_12000.cu index 33cff8d8..1bac5840 100644 --- a/tests/unit_tests/synthetic/libraries/cusparse2rocsparse_12000.cu +++ 
b/tests/unit_tests/synthetic/libraries/cusparse2rocsparse_12000.cu @@ -71,6 +71,7 @@ int main() { void *tempBuffer = nullptr; void *alpha = nullptr; void *beta = nullptr; + void* result = nullptr; // TODO: should be rocsparse_double_complex // TODO: add to TypeOverloads cuDoubleComplex -> rocsparse_double_complex under a new option --sparse @@ -88,7 +89,7 @@ int main() { cudaDataType dataType; #endif -#if (CUDA_VERSION >= 10010 && CUDA_VERSION < 11000 && !defined(_WIN32)) || CUDA_VERSION >= 11000 +#if (CUDA_VERSION >= 10010 && CUSPARSE_VERSION >= 10200 && CUDA_VERSION < 11000 && !defined(_WIN32)) || CUDA_VERSION >= 11000 // CHECK: rocsparse_spmat_descr spMatDescr_t, spmatA, spmatB, spmatC; cusparseSpMatDescr_t spMatDescr_t, spmatA, spmatB, spmatC; @@ -97,6 +98,14 @@ int main() { // CHECK: rocsparse_spmm_alg spMMAlg_t; cusparseSpMMAlg_t spMMAlg_t; + + // CHECK: _rocsparse_dnvec_descr *dnVecDescr = nullptr; + // CHECK-NEXT: rocsparse_dnvec_descr dnVecDescr_t, vecX, vecY; + cusparseDnVecDescr *dnVecDescr = nullptr; + cusparseDnVecDescr_t dnVecDescr_t, vecX, vecY; + + // CHECK: rocsparse_spmv_alg spMVAlg_t; + cusparseSpMVAlg_t spMVAlg_t; #endif #if CUDA_VERSION >= 11010 && CUSPARSE_VERSION >= 11300 @@ -107,6 +116,13 @@ int main() { cusparseDenseToSparseAlg_t denseToSparseAlg_t; #endif +#if CUDA_VERSION >= 11020 && CUSPARSE_VERSION >= 11400 + // CHECK: rocsparse_sddmm_alg sDDMMAlg_t; + // CHECK-NEXT: rocsparse_sddmm_alg SDDMM_ALG_DEFAULT = rocsparse_sddmm_alg_default; + cusparseSDDMMAlg_t sDDMMAlg_t; + cusparseSDDMMAlg_t SDDMM_ALG_DEFAULT = CUSPARSE_SDDMM_ALG_DEFAULT; +#endif + #if CUDA_VERSION >= 11030 && CUSPARSE_VERSION >= 11600 // CHECK: rocsparse_spsm_alg spSMAlg_t; // CHECK-NEXT: rocsparse_spsm_alg SPSM_ALG_DEFAULT = rocsparse_spsm_alg_default; @@ -118,6 +134,14 @@ int main() { #endif #if CUDA_VERSION >= 12000 + // CHECK: rocsparse_spsv_alg spSVAlg_t; + // CHECK-NEXT: rocsparse_spsv_alg SPSV_ALG_DEFAULT = rocsparse_spsv_alg_default; + cusparseSpSVAlg_t spSVAlg_t; 
+ cusparseSpSVAlg_t SPSV_ALG_DEFAULT = CUSPARSE_SPSV_ALG_DEFAULT; + + // TODO: remove declaration of cusparseSpSVDescr_t, as it is not mirrored and not used in rocSPARSE + cusparseSpSVDescr_t spSVDescr; + // CHECK: rocsparse_const_spmat_descr constSpMatDescr = nullptr; // CHECK-NEXT: rocsparse_const_spmat_descr constSpMatDescrB = nullptr; cusparseConstSpMatDescr_t constSpMatDescr = nullptr; @@ -128,6 +152,12 @@ int main() { cusparseConstDnMatDescr_t constDnMatDescr = nullptr; cusparseConstDnMatDescr_t constDnMatDescrB = nullptr; + // CHECK: rocsparse_const_spvec_descr constSpVecDescr = nullptr; + cusparseConstSpVecDescr_t constSpVecDescr = nullptr; + + // CHECK: rocsparse_const_dnvec_descr constDnVecDescr = nullptr; + cusparseConstDnVecDescr_t constDnVecDescr = nullptr; + // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSparseToDense(cusparseHandle_t handle, cusparseConstSpMatDescr_t matA, cusparseDnMatDescr_t matB, cusparseSparseToDenseAlg_t alg, void* externalBuffer); // ROC: ROCSPARSE_EXPORT rocsparse_status rocsparse_sparse_to_dense(rocsparse_handle handle, rocsparse_const_spmat_descr mat_A, rocsparse_dnmat_descr mat_B, rocsparse_sparse_to_dense_alg alg, size_t* buffer_size, void* temp_buffer); // CHECK: status_t = rocsparse_sparse_to_dense(handle_t, constSpMatDescr, dnmatB, sparseToDenseAlg_t, nullptr, tempBuffer); @@ -162,6 +192,56 @@ int main() { // ROC: ROCSPARSE_EXPORT rocsparse_status rocsparse_spsm(rocsparse_handle handle, rocsparse_operation trans_A, rocsparse_operation trans_B, const void* alpha, rocsparse_const_spmat_descr matA, rocsparse_const_dnmat_descr matB, const rocsparse_dnmat_descr matC, rocsparse_datatype compute_type, rocsparse_spsm_alg alg, rocsparse_spsm_stage stage, size_t* buffer_size, void* temp_buffer); // CHECK: status_t = rocsparse_spsm(handle_t, opA, opB, alpha, constSpMatDescr, constDnMatDescrB, dnmatC, dataType, spSMAlg_t, rocsparse_spsm_stage_compute, nullptr, nullptr); status_t = cusparseSpSM_solve(handle_t, opA, opB, alpha, 
constSpMatDescr, constDnMatDescrB, dnmatC, dataType, spSMAlg_t, spSMDescr); + + // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSpMM(cusparseHandle_t handle, cusparseOperation_t opA, cusparseOperation_t opB, const void* alpha, cusparseConstSpMatDescr_t matA, cusparseConstDnMatDescr_t matB, const void* beta, cusparseDnMatDescr_t matC, cudaDataType computeType, cusparseSpMMAlg_t alg, void* externalBuffer); + // ROC: ROCSPARSE_EXPORT rocsparse_status rocsparse_spmm(rocsparse_handle handle, rocsparse_operation trans_A, rocsparse_operation trans_B, const void* alpha, rocsparse_const_spmat_descr mat_A, rocsparse_const_dnmat_descr mat_B, const void* beta, const rocsparse_dnmat_descr mat_C, rocsparse_datatype compute_type, rocsparse_spmm_alg alg, rocsparse_spmm_stage stage, size_t* buffer_size, void* temp_buffer); + // CHECK: status_t = rocsparse_spmm(handle_t, opA, opB, alpha, constSpMatDescr, constDnMatDescr, beta, dnmatC, dataType, spMMAlg_t, rocsparse_spmm_stage_compute, nullptr, tempBuffer); + status_t = cusparseSpMM(handle_t, opA, opB, alpha, constSpMatDescr, constDnMatDescr, beta, dnmatC, dataType, spMMAlg_t, tempBuffer); + + // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSpVV(cusparseHandle_t handle, cusparseOperation_t opX, cusparseConstSpVecDescr_t vecX, cusparseConstDnVecDescr_t vecY, void* result, cudaDataType computeType, void* externalBuffer); + // ROC: ROCSPARSE_EXPORT rocsparse_status rocsparse_spvv(rocsparse_handle handle, rocsparse_operation trans, rocsparse_const_spvec_descr x, rocsparse_const_dnvec_descr y, void* result, rocsparse_datatype compute_type, size_t* buffer_size, void* temp_buffer); + // CHECK: status_t = rocsparse_spvv(handle_t, opX, constSpVecDescr, constDnVecDescr, result, dataType, nullptr, tempBuffer); + status_t = cusparseSpVV(handle_t, opX, constSpVecDescr, constDnVecDescr, result, dataType, tempBuffer); + + // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSpVV_bufferSize(cusparseHandle_t handle, cusparseOperation_t opX, 
cusparseConstSpVecDescr_t vecX, cusparseConstDnVecDescr_t vecY, const void* result, cudaDataType computeType, size_t* bufferSize); + // ROC: ROCSPARSE_EXPORT rocsparse_status rocsparse_spvv(rocsparse_handle handle, rocsparse_operation trans, rocsparse_const_spvec_descr x, rocsparse_const_dnvec_descr y, void* result, rocsparse_datatype compute_type, size_t* buffer_size, void* temp_buffer); + // CHECK: status_t = rocsparse_spvv(handle_t, opX, constSpVecDescr, constDnVecDescr, result, dataType, &bufferSize, nullptr); + status_t = cusparseSpVV_bufferSize(handle_t, opX, constSpVecDescr, constDnVecDescr, result, dataType, &bufferSize); + + // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSpMV(cusparseHandle_t handle, cusparseOperation_t opA, const void* alpha, cusparseConstSpMatDescr_t matA, cusparseConstDnVecDescr_t vecX, const void* beta, cusparseDnVecDescr_t vecY, cudaDataType computeType, cusparseSpMVAlg_t alg, void* externalBuffer); + // ROC: ROCSPARSE_EXPORT rocsparse_status rocsparse_spmv(rocsparse_handle handle, rocsparse_operation trans, const void* alpha, rocsparse_const_spmat_descr mat, rocsparse_const_dnvec_descr x, const void* beta, const rocsparse_dnvec_descr y, rocsparse_datatype compute_type, rocsparse_spmv_alg alg, rocsparse_spmv_stage stage, size_t* buffer_size, void* temp_buffer); + // CHECK: status_t = rocsparse_spmv(handle_t, opA, alpha, constSpMatDescr, constDnVecDescr, beta, vecY, dataType, spMVAlg_t, rocsparse_spmv_stage_compute, tempBuffer); + status_t = cusparseSpMV(handle_t, opA, alpha, constSpMatDescr, constDnVecDescr, beta, vecY, dataType, spMVAlg_t, tempBuffer); + + // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSpMV_bufferSize(cusparseHandle_t handle, cusparseOperation_t opA, const void* alpha, cusparseConstSpMatDescr_t matA, cusparseConstDnVecDescr_t vecX, const void* beta, cusparseDnVecDescr_t vecY, cudaDataType computeType, cusparseSpMVAlg_t alg, size_t* bufferSize); + // ROC: ROCSPARSE_EXPORT rocsparse_status rocsparse_spmv(rocsparse_handle 
handle, rocsparse_operation trans, const void* alpha, rocsparse_const_spmat_descr mat, rocsparse_const_dnvec_descr x, const void* beta, const rocsparse_dnvec_descr y, rocsparse_datatype compute_type, rocsparse_spmv_alg alg, rocsparse_spmv_stage stage, size_t* buffer_size, void* temp_buffer); + // CHECK: status_t = rocsparse_spmv(handle_t, opA, alpha, constSpMatDescr, constDnVecDescr, beta, vecY, dataType, spMVAlg_t, rocsparse_spmv_stage_buffer_size, &bufferSize, nullptr); + status_t = cusparseSpMV_bufferSize(handle_t, opA, alpha, constSpMatDescr, constDnVecDescr, beta, vecY, dataType, spMVAlg_t, &bufferSize); + + // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSpMM_preprocess(cusparseHandle_t handle, cusparseOperation_t opA, cusparseOperation_t opB, const void* alpha, cusparseConstSpMatDescr_t matA, cusparseConstDnMatDescr_t matB, const void* beta, cusparseDnMatDescr_t matC, cudaDataType computeType, cusparseSpMMAlg_t alg, void* externalBuffer); + // ROC: ROCSPARSE_EXPORT rocsparse_status rocsparse_spmm(rocsparse_handle handle, rocsparse_operation trans_A, rocsparse_operation trans_B, const void* alpha, const rocsparse_spmat_descr mat_A, const rocsparse_dnmat_descr mat_B, const void* beta, const rocsparse_dnmat_descr mat_C, rocsparse_datatype compute_type, rocsparse_spmm_alg alg, rocsparse_spmm_stage stage, size_t* buffer_size, void* temp_buffer); + // CHECK: status_t = rocsparse_spmm(handle_t, opA, opB, alpha, constSpMatDescr, constDnMatDescr, beta, dnmatC, dataType, spMMAlg_t, rocsparse_spmm_stage_preprocess, nullptr, tempBuffer); + status_t = cusparseSpMM_preprocess(handle_t, opA, opB, alpha, constSpMatDescr, constDnMatDescr, beta, dnmatC, dataType, spMMAlg_t, tempBuffer); + + // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSDDMM_bufferSize(cusparseHandle_t handle, cusparseOperation_t opA, cusparseOperation_t opB, const void* alpha, cusparseConstDnMatDescr_t matA, cusparseConstDnMatDescr_t matB, const void* beta, cusparseSpMatDescr_t matC, cudaDataType computeType, 
cusparseSDDMMAlg_t alg, size_t* bufferSize); + // ROC: ROCSPARSE_EXPORT rocsparse_status rocsparse_sddmm_buffer_size(rocsparse_handle handle, rocsparse_operation opA, rocsparse_operation opB, const void* alpha, const rocsparse_dnmat_descr A, const rocsparse_dnmat_descr B, const void* beta, rocsparse_spmat_descr C, rocsparse_datatype compute_type, rocsparse_sddmm_alg alg, size_t* buffer_size); + // CHECK: status_t = rocsparse_sddmm_buffer_size(handle_t, opA, opB, alpha, constDnMatDescr, constDnMatDescrB, beta, spmatC, dataType, sDDMMAlg_t, &bufferSize); + status_t = cusparseSDDMM_bufferSize(handle_t, opA, opB, alpha, constDnMatDescr, constDnMatDescrB, beta, spmatC, dataType, sDDMMAlg_t, &bufferSize); + + // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSDDMM_preprocess(cusparseHandle_t handle, cusparseOperation_t opA, cusparseOperation_t opB, const void* alpha, cusparseConstDnMatDescr_t matA, cusparseConstDnMatDescr_t matB, const void* beta, cusparseSpMatDescr_t matC, cudaDataType computeType, cusparseSDDMMAlg_t alg, void* externalBuffer); + // ROC: ROCSPARSE_EXPORT rocsparse_status rocsparse_sddmm_preprocess(rocsparse_handle handle, rocsparse_operation opA, rocsparse_operation opB, const void* alpha, rocsparse_const_dnmat_descr A, rocsparse_const_dnmat_descr B, const void* beta, rocsparse_spmat_descr C, rocsparse_datatype compute_type, rocsparse_sddmm_alg alg, void* temp_buffer); + // CHECK: status_t = rocsparse_sddmm_preprocess(handle_t, opA, opB, alpha, constDnMatDescr, constDnMatDescrB, beta, spmatC, dataType, sDDMMAlg_t, tempBuffer); + status_t = cusparseSDDMM_preprocess(handle_t, opA, opB, alpha, constDnMatDescr, constDnMatDescrB, beta, spmatC, dataType, sDDMMAlg_t, tempBuffer); + + // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSDDMM(cusparseHandle_t handle, cusparseOperation_t opA, cusparseOperation_t opB, const void* alpha, cusparseConstDnMatDescr_t matA, cusparseConstDnMatDescr_t matB, const void* beta, cusparseSpMatDescr_t matC, cudaDataType computeType, 
cusparseSDDMMAlg_t alg, void* externalBuffer); + // ROC: ROCSPARSE_EXPORT rocsparse_status rocsparse_sddmm(rocsparse_handle handle, rocsparse_operation opA, rocsparse_operation opB, const void* alpha, rocsparse_const_dnmat_descr A, rocsparse_const_dnmat_descr B, const void* beta, rocsparse_spmat_descr C, rocsparse_datatype compute_type, rocsparse_sddmm_alg alg, void* temp_buffer); + // CHECK: status_t = rocsparse_sddmm(handle_t, opA, opB, alpha, constDnMatDescr, constDnMatDescrB, beta, spmatC, dataType, sDDMMAlg_t, tempBuffer); + status_t = cusparseSDDMM(handle_t, opA, opB, alpha, constDnMatDescr, constDnMatDescrB, beta, spmatC, dataType, sDDMMAlg_t, tempBuffer); + + // CUDA: cusparseStatus_t CUSPARSEAPI cusparseSpSV_bufferSize(cusparseHandle_t handle, cusparseOperation_t opA, const void* alpha, cusparseConstSpMatDescr_t matA, cusparseConstDnVecDescr_t vecX, cusparseDnVecDescr_t vecY, cudaDataType computeType, cusparseSpSVAlg_t alg, cusparseSpSVDescr_t spsvDescr, size_t* bufferSize); + // ROC: ROCSPARSE_EXPORT rocsparse_status rocsparse_spsv(rocsparse_handle handle, rocsparse_operation trans, const void* alpha, rocsparse_const_spmat_descr mat, rocsparse_const_dnvec_descr x, const rocsparse_dnvec_descr y, rocsparse_datatype compute_type, rocsparse_spsv_alg alg, rocsparse_spsv_stage stage, size_t* buffer_size, void* temp_buffer); + // CHECK: status_t = rocsparse_spsv(handle_t, opA, alpha, constSpMatDescr, constDnVecDescr, vecY, dataType, spSVAlg_t, rocsparse_spsv_stage_buffer_size, &bufferSize, nullptr); + status_t = cusparseSpSV_bufferSize(handle_t, opA, alpha, constSpMatDescr, constDnVecDescr, vecY, dataType, spSVAlg_t, spSVDescr, &bufferSize); #endif return 0; diff --git a/tests/unit_tests/synthetic/runtime_enums.cu b/tests/unit_tests/synthetic/runtime_enums.cu index f143a8f9..7560a872 100644 --- a/tests/unit_tests/synthetic/runtime_enums.cu +++ b/tests/unit_tests/synthetic/runtime_enums.cu @@ -815,7 +815,6 @@ int main() { cudaUserObjectRetainFlags 
UserObjectRetainFlags; cudaUserObjectRetainFlags GraphUserObjectMove = cudaGraphUserObjectMove; - // CHECK: hipGraphDebugDotFlags graphDebugDot_flags; // CHECK-NEXT: hipGraphDebugDotFlags graphDebugDot_flags_enum; // CHECK-NEXT: hipGraphDebugDotFlags GRAPH_DEBUG_DOT_FLAGS_VERBOSE = hipGraphDebugDotFlagsVerbose; @@ -842,6 +841,22 @@ int main() { CUgraphDebugDot_flags GRAPH_DEBUG_DOT_FLAGS_EXT_SEMAS_WAIT_NODE_PARAMS = CU_GRAPH_DEBUG_DOT_FLAGS_EXT_SEMAS_WAIT_NODE_PARAMS; CUgraphDebugDot_flags GRAPH_DEBUG_DOT_FLAGS_KERNEL_NODE_ATTRIBUTES = CU_GRAPH_DEBUG_DOT_FLAGS_KERNEL_NODE_ATTRIBUTES; CUgraphDebugDot_flags GRAPH_DEBUG_DOT_FLAGS_HANDLES = CU_GRAPH_DEBUG_DOT_FLAGS_HANDLES; + + // CHECK: hipFlushGPUDirectRDMAWritesOptions flushGPUDirectRDMAWritesOptions; + // CHECK-NEXT: hipFlushGPUDirectRDMAWritesOptions FLUSH_GPU_DIRECT_RDMA_WRITES_OPTION_HOST = hipFlushGPUDirectRDMAWritesOptionHost; + // CHECK-NEXT: hipFlushGPUDirectRDMAWritesOptions FLUSH_GPU_DIRECT_RDMA_WRITES_OPTION_MEMOPS = hipFlushGPUDirectRDMAWritesOptionMemOps; + cudaFlushGPUDirectRDMAWritesOptions flushGPUDirectRDMAWritesOptions; + cudaFlushGPUDirectRDMAWritesOptions FLUSH_GPU_DIRECT_RDMA_WRITES_OPTION_HOST = cudaFlushGPUDirectRDMAWritesOptionHost; + cudaFlushGPUDirectRDMAWritesOptions FLUSH_GPU_DIRECT_RDMA_WRITES_OPTION_MEMOPS = cudaFlushGPUDirectRDMAWritesOptionMemOps; + + // CHECK: hipGPUDirectRDMAWritesOrdering GPUDirectRDMAWritesOrdering; + // CHECK-NEXT: hipGPUDirectRDMAWritesOrdering GPU_DIRECT_RDMA_WRITES_ORDERING_NONE = hipGPUDirectRDMAWritesOrderingNone; + // CHECK-NEXT: hipGPUDirectRDMAWritesOrdering GPU_DIRECT_RDMA_WRITES_ORDERING_OWNER = hipGPUDirectRDMAWritesOrderingOwner; + // CHECK-NEXT: hipGPUDirectRDMAWritesOrdering GPU_DIRECT_RDMA_WRITES_ORDERING_ALL_DEVICES = hipGPUDirectRDMAWritesOrderingAllDevices; + cudaGPUDirectRDMAWritesOrdering GPUDirectRDMAWritesOrdering; + cudaGPUDirectRDMAWritesOrdering GPU_DIRECT_RDMA_WRITES_ORDERING_NONE = cudaGPUDirectRDMAWritesOrderingNone; + 
cudaGPUDirectRDMAWritesOrdering GPU_DIRECT_RDMA_WRITES_ORDERING_OWNER = cudaGPUDirectRDMAWritesOrderingOwner; + cudaGPUDirectRDMAWritesOrdering GPU_DIRECT_RDMA_WRITES_ORDERING_ALL_DEVICES = cudaGPUDirectRDMAWritesOrderingAllDevices; #endif #if CUDA_VERSION >= 11040 @@ -881,6 +896,19 @@ int main() { // CHECK-NEXT: hipGraphInstantiateFlags GraphInstantiateFlagDeviceLaunch = hipGraphInstantiateFlagDeviceLaunch; cudaGraphInstantiateFlags GraphInstantiateFlagUpload = cudaGraphInstantiateFlagUpload; cudaGraphInstantiateFlags GraphInstantiateFlagDeviceLaunch = cudaGraphInstantiateFlagDeviceLaunch; + + // CHECK: hipGraphInstantiateResult graphInstantiateResult; + // CHECK-NEXT: hipGraphInstantiateResult GRAPH_INSTANTIATE_SUCCESS = hipGraphInstantiateSuccess; + // CHECK-NEXT: hipGraphInstantiateResult GRAPH_INSTANTIATE_ERROR = hipGraphInstantiateError; + // CHECK-NEXT: hipGraphInstantiateResult GRAPH_INSTANTIATE_INVALID_STRUCTURE = hipGraphInstantiateInvalidStructure; + // CHECK-NEXT: hipGraphInstantiateResult GRAPH_INSTANTIATE_NODE_OPERATION_NOT_SUPPORTED = hipGraphInstantiateNodeOperationNotSupported; + // CHECK-NEXT: hipGraphInstantiateResult GRAPH_INSTANTIATE_MULTIPLE_CTXS_NOT_SUPPORTED = hipGraphInstantiateMultipleDevicesNotSupported; + cudaGraphInstantiateResult graphInstantiateResult; + cudaGraphInstantiateResult GRAPH_INSTANTIATE_SUCCESS = cudaGraphInstantiateSuccess; + cudaGraphInstantiateResult GRAPH_INSTANTIATE_ERROR = cudaGraphInstantiateError; + cudaGraphInstantiateResult GRAPH_INSTANTIATE_INVALID_STRUCTURE = cudaGraphInstantiateInvalidStructure; + cudaGraphInstantiateResult GRAPH_INSTANTIATE_NODE_OPERATION_NOT_SUPPORTED = cudaGraphInstantiateNodeOperationNotSupported; + cudaGraphInstantiateResult GRAPH_INSTANTIATE_MULTIPLE_CTXS_NOT_SUPPORTED = cudaGraphInstantiateMultipleDevicesNotSupported; #endif return 0; diff --git a/tests/unit_tests/synthetic/runtime_structs.cu b/tests/unit_tests/synthetic/runtime_structs.cu index 34ef740c..88bd6148 100644 --- 
a/tests/unit_tests/synthetic/runtime_structs.cu +++ b/tests/unit_tests/synthetic/runtime_structs.cu @@ -189,12 +189,34 @@ int main() { surfaceReference surfaceRef; #endif +#if CUDA_VERSION >= 12000 + // CHECK: hipGraphInstantiateParams GRAPH_INSTANTIATE_PARAMS_st; + // CHECK-NEXT: hipGraphInstantiateParams GRAPH_INSTANTIATE_PARAMS; + cudaGraphInstantiateParams_st GRAPH_INSTANTIATE_PARAMS_st; + cudaGraphInstantiateParams GRAPH_INSTANTIATE_PARAMS; +#endif + #if CUDA_VERSION >= 12020 // CHECK: hipExternalSemaphoreSignalNodeParams ExternalSemaphoreSignalNodeParams_v2; cudaExternalSemaphoreSignalNodeParamsV2 ExternalSemaphoreSignalNodeParams_v2; // CHECK: hipExternalSemaphoreWaitNodeParams ExternalSemaphoreWaitNodeParams_v2; cudaExternalSemaphoreWaitNodeParamsV2 ExternalSemaphoreWaitNodeParams_v2; + + // CHECK: hipMemFreeNodeParams MemFreeNodeParams; + cudaMemFreeNodeParams MemFreeNodeParams; + + // CHECK: hipChildGraphNodeParams ChildGraphNodeParams; + cudaChildGraphNodeParams ChildGraphNodeParams; + + // CHECK: hipEventRecordNodeParams EventRecordNodeParams; + cudaEventRecordNodeParams EventRecordNodeParams; + + // CHECK: hipEventWaitNodeParams EventWaitNodeParams; + cudaEventWaitNodeParams EventWaitNodeParams; + + // CHECK: hipGraphNodeParams *GraphNodeParams = nullptr; + cudaGraphNodeParams *GraphNodeParams = nullptr; #endif return 0;