Skip to content

Commit 0e0d7fb

Browse files
committed
Fix CUDA compilation bug
1 parent 9a5a741 commit 0e0d7fb

File tree

1 file changed

+6
-6
lines changed

1 file changed

+6
-6
lines changed

source/module_hsolver/kernels/cuda/math_kernel_op.cu

Lines changed: 6 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -12,7 +12,7 @@
1212
namespace hsolver
1313
{
1414
const int warp_size = 32;
15-
//const unsigned int full_mask = 0xffffffff;
15+
// const unsigned int full_mask = 0xffffffff;
1616
const int thread_per_block = 256;
1717
}
1818

@@ -65,11 +65,11 @@ void destoryBLAShandle(){
6565
}
6666
}
6767

68-
template <typename FPTYPE>
69-
__forceinline__ __device__ void warp_reduce(FPTYPE& val) {
70-
for (int offset = 16; offset > 0; offset >>= 1)
71-
val += __shfl_down_sync(full_mask, val, offset);
72-
}
68+
// template <typename FPTYPE>
69+
// __forceinline__ __device__ void warp_reduce(FPTYPE& val) {
70+
// for (int offset = 16; offset > 0; offset >>= 1)
71+
// val += __shfl_down_sync(full_mask, val, offset);
72+
// }
7373

7474
template <typename Real>
7575
__global__ void line_minimize_with_block(

0 commit comments

Comments
 (0)