Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
5 changes: 5 additions & 0 deletions projects/rocsparse/CHANGELOG.md
Original file line number Diff line number Diff line change
Expand Up @@ -3,6 +3,11 @@
Documentation for rocSPARSE is available at
[https://rocm.docs.amd.com/projects/rocSPARSE/en/latest/](https://rocm.docs.amd.com/projects/rocSPARSE/en/latest/).

## rocSPARSE 4.5.1 for ROCm 7.13.0

### Resolved issues
* Fixed an issue in `rocsparse_[s|d|c|z]csric0` where `rocsparse_status_invalid_value` was returned when the maximum number of non-zeros in any row was between 513 and 1024.

## rocSPARSE 4.5.0 for ROCm 7.12.0

### Added
Expand Down
2 changes: 1 addition & 1 deletion projects/rocsparse/CMakeLists.txt
Original file line number Diff line number Diff line change
Expand Up @@ -193,7 +193,7 @@ endif()
message(STATUS "GPU_TARGETS: ${GPU_TARGETS}")

# Setup version
set(VERSION_STRING "4.5.0")
set(VERSION_STRING "4.5.1")
set(SOVERSION_STRING "1.0")
set(MIN_ROCPRIM_VERSION "4.0.0" CACHE STRING "Minimum version of rocPRIM.")
set(MIN_ROCBLAS_VERSION "4.1.0" CACHE STRING "Minimum version of rocBLAS.")
Expand Down
1 change: 1 addition & 0 deletions projects/rocsparse/clients/tests/test_csric0.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -44,6 +44,7 @@ Definitions:
- &M_N_range_extra
- { M: 10, N: 10 }
- { M: 235, N: 235 }
- { M: 600, N: 600 }
- { M: 1200, N: 1200 }

Tests:
Expand Down
2 changes: 1 addition & 1 deletion projects/rocsparse/library/src/level3/csrsm_device.h
Original file line number Diff line number Diff line change
Expand Up @@ -28,7 +28,7 @@

namespace rocsparse
{
template <uint32_t BLOCKSIZE, uint32_t WF_SIZE, bool SLEEP, typename I, typename J, typename T>
template <uint32_t BLOCKSIZE, bool SLEEP, typename I, typename J, typename T>
ROCSPARSE_DEVICE_ILF void csrsm_device(rocsparse_operation transB,
J m,
J nrhs,
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -36,7 +36,7 @@
#include "csrsm_device.h"
namespace rocsparse
{
template <uint32_t BLOCKSIZE, uint32_t WFSIZE, bool SLEEP, typename I, typename J, typename T>
template <uint32_t BLOCKSIZE, bool SLEEP, typename I, typename J, typename T>
ROCSPARSE_KERNEL(BLOCKSIZE)
void csrsm(rocsparse_operation transB,
J m,
Expand All @@ -57,21 +57,21 @@ namespace rocsparse
{
ROCSPARSE_DEVICE_HOST_SCALAR_GET(alpha);

rocsparse::csrsm_device<BLOCKSIZE, WFSIZE, SLEEP>(transB,
m,
nrhs,
alpha,
csr_row_ptr,
csr_col_ind,
csr_val,
B,
ldb,
done_array,
map,
zero_pivot,
idx_base,
fill_mode,
diag_type);
rocsparse::csrsm_device<BLOCKSIZE, SLEEP>(transB,
m,
nrhs,
alpha,
csr_row_ptr,
csr_col_ind,
csr_val,
B,
ldb,
done_array,
map,
zero_pivot,
idx_base,
fill_mode,
diag_type);
}

template <typename I, typename J, typename T>
Expand Down Expand Up @@ -211,11 +211,10 @@ namespace rocsparse

if(blockdim == 64)
{

if(gcn_arch_name == rocpsarse_arch_names::gfx908 && asicRev < 2)
{
RETURN_IF_HIPLAUNCHKERNELGGL_ERROR(
(rocsparse::csrsm<64, 64, true>),
(rocsparse::csrsm<64, true>),
csrsm_blocks,
csrsm_threads,
0,
Expand All @@ -240,7 +239,7 @@ namespace rocsparse
else
{
RETURN_IF_HIPLAUNCHKERNELGGL_ERROR(
(rocsparse::csrsm<64, 64, false>),
(rocsparse::csrsm<64, false>),
csrsm_blocks,
csrsm_threads,
0,
Expand Down Expand Up @@ -268,7 +267,7 @@ namespace rocsparse
if(gcn_arch_name == rocpsarse_arch_names::gfx908 && asicRev < 2)
{
RETURN_IF_HIPLAUNCHKERNELGGL_ERROR(
(rocsparse::csrsm<128, 64, true>),
(rocsparse::csrsm<128, true>),
csrsm_blocks,
csrsm_threads,
0,
Expand All @@ -293,7 +292,7 @@ namespace rocsparse
else
{
RETURN_IF_HIPLAUNCHKERNELGGL_ERROR(
(rocsparse::csrsm<128, 64, false>),
(rocsparse::csrsm<128, false>),
csrsm_blocks,
csrsm_threads,
0,
Expand Down Expand Up @@ -321,7 +320,7 @@ namespace rocsparse
if(gcn_arch_name == rocpsarse_arch_names::gfx908 && asicRev < 2)
{
RETURN_IF_HIPLAUNCHKERNELGGL_ERROR(
(rocsparse::csrsm<256, 64, true>),
(rocsparse::csrsm<256, true>),
csrsm_blocks,
csrsm_threads,
0,
Expand All @@ -346,7 +345,7 @@ namespace rocsparse
else
{
RETURN_IF_HIPLAUNCHKERNELGGL_ERROR(
(rocsparse::csrsm<256, 64, false>),
(rocsparse::csrsm<256, false>),
csrsm_blocks,
csrsm_threads,
0,
Expand Down Expand Up @@ -374,7 +373,7 @@ namespace rocsparse
if(gcn_arch_name == rocpsarse_arch_names::gfx908 && asicRev < 2)
{
RETURN_IF_HIPLAUNCHKERNELGGL_ERROR(
(rocsparse::csrsm<512, 64, true>),
(rocsparse::csrsm<512, true>),
csrsm_blocks,
csrsm_threads,
0,
Expand All @@ -399,7 +398,7 @@ namespace rocsparse
else
{
RETURN_IF_HIPLAUNCHKERNELGGL_ERROR(
(rocsparse::csrsm<512, 64, false>),
(rocsparse::csrsm<512, false>),
csrsm_blocks,
csrsm_threads,
0,
Expand Down Expand Up @@ -427,7 +426,7 @@ namespace rocsparse
if(gcn_arch_name == rocpsarse_arch_names::gfx908 && asicRev < 2)
{
RETURN_IF_HIPLAUNCHKERNELGGL_ERROR(
(rocsparse::csrsm<1024, 64, true>),
(rocsparse::csrsm<1024, true>),
csrsm_blocks,
csrsm_threads,
0,
Expand All @@ -452,7 +451,7 @@ namespace rocsparse
else
{
RETURN_IF_HIPLAUNCHKERNELGGL_ERROR(
(rocsparse::csrsm<1024, 64, false>),
(rocsparse::csrsm<1024, false>),
csrsm_blocks,
csrsm_threads,
0,
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -41,7 +41,7 @@ rocsparse_status rocsparse::csric0_kernel_launch(rocsparse_handle handle,

rocsparse::csric0_kernel_launch_t launch{};

if(sleep || (trm_info->get_max_nnz() > 1024))
if(sleep || (trm_info->get_max_nnz() > 512))
{
launch = rocsparse::find_csric0_kernel_binsearch_launch(handle, csric0_info, A);
}
Expand Down
Loading