File tree Expand file tree Collapse file tree 1 file changed +6
-6
lines changed
source/module_hsolver/kernels/cuda Expand file tree Collapse file tree 1 file changed +6
-6
lines changed Original file line number Diff line number Diff line change
12 12   namespace hsolver
13 13   {
14 14   const int warp_size = 32 ;
15    - // const unsigned int full_mask = 0xffffffff;
   15 + // const unsigned int full_mask = 0xffffffff;
16 16   const int thread_per_block = 256 ;
17 17   }
18 18
@@ -65,11 +65,11 @@ void destoryBLAShandle(){
65 65    }
66 66   }
67 67
68- template <typename FPTYPE>
69- __forceinline__ __device__ void warp_reduce (FPTYPE& val) {
70- for (int offset = 16 ; offset > 0 ; offset >>= 1 )
71- val += __shfl_down_sync (full_mask, val, offset);
72- }
68+ // template <typename FPTYPE>
69+ // __forceinline__ __device__ void warp_reduce(FPTYPE& val) {
70+ // for (int offset = 16; offset > 0; offset >>= 1)
71+ // val += __shfl_down_sync(full_mask, val, offset);
72+ // }
73 73
74 74   template <typename Real>
75 75   __global__ void line_minimize_with_block (
You can’t perform that action at this time.
0 commit comments