Skip to content

Commit

Permalink
Fix CUDA compilation bug
Browse files Browse the repository at this point in the history
  • Loading branch information
Critsium-xy committed Nov 8, 2024
1 parent 9a5a741 commit 0e0d7fb
Showing 1 changed file with 6 additions and 6 deletions.
12 changes: 6 additions & 6 deletions source/module_hsolver/kernels/cuda/math_kernel_op.cu
Original file line number Diff line number Diff line change
Expand Up @@ -12,7 +12,7 @@
namespace hsolver
{
// Compile-time launch/reduction parameters shared by the kernels in this file.

// Number of lanes assumed per warp.
constexpr int warp_size = 32;

// Number of threads per block.
// NOTE(review): presumably the block size used for kernel launches - confirm against the launch sites.
constexpr int thread_per_block = 256;

// The warp participation mask is currently disabled and kept only for reference:
// constexpr unsigned int full_mask = 0xffffffff;
} // namespace hsolver

Expand Down Expand Up @@ -65,11 +65,11 @@ void destoryBLAShandle(){
}
}

// Warp-level sum reduction using shuffle-down.
//
// Each step adds to `val` the value held by the lane `offset` positions higher,
// with the offset going 16, 8, 4, 2, 1. After the loop, lane 0 of the warp holds
// the sum of the `val` inputs of all 32 lanes; the contents of the other lanes
// are partial sums and should not be relied upon.
//
// Preconditions:
//   - All 32 lanes of the warp must reach this call, since the shuffle is issued
//     with a full participation mask.
//   - FPTYPE must be a type for which __shfl_down_sync has an overload.
//     NOTE(review): presumably only float/double are used here - confirm against callers.
//
// @param val  In: this lane's contribution. Out: running sum (the total on lane 0).
template <typename FPTYPE>
__forceinline__ __device__ void warp_reduce(FPTYPE& val) {
    // The mask is defined locally so this helper does not depend on a
    // file-level `full_mask` constant, which is commented out in this file.
    const unsigned int all_lanes = 0xffffffffu;
    for (int offset = 16; offset > 0; offset >>= 1) {
        val += __shfl_down_sync(all_lanes, val, offset);
    }
}
// template <typename FPTYPE>
// __forceinline__ __device__ void warp_reduce(FPTYPE& val) {
// for (int offset = 16; offset > 0; offset >>= 1)
// val += __shfl_down_sync(full_mask, val, offset);
// }

template <typename Real>
__global__ void line_minimize_with_block(
Expand Down

0 comments on commit 0e0d7fb

Please sign in to comment.