[Metax] modify warpSize to WARP_SIZE (#5442)

This commit is contained in:
xiaozude
2025-12-09 17:44:02 +08:00
committed by GitHub
parent e397c4fba6
commit df67379bc3
4 changed files with 406 additions and 228 deletions
@@ -18,7 +18,7 @@
// Thin device-side wrapper around the __shfl_down_sync warp intrinsic.
//
// Parameters:
//   mask  - participant mask, forwarded unchanged to the intrinsic.
//   val   - this thread's value to exchange; also fixes the return type T.
//   delta - lane offset; it is converted to unsigned before the call, so a
//           negative value would wrap to a large offset. Callers are expected
//           to pass a non-negative delta.
//   width - segment width forwarded to the intrinsic. Defaults to WARP_SIZE,
//           which must be defined elsewhere in the project (not visible in
//           this chunk). NOTE(review): presumably a platform-specific warp
//           width replacing the built-in warpSize; confirm at its definition.
//
// Returns whatever __shfl_down_sync returns for these arguments.
template <typename T>
__forceinline__ __device__ T
CudaShuffleDownSync(unsigned mask, T val, int delta, int width = WARP_SIZE) {
  return __shfl_down_sync(mask, val, static_cast<unsigned>(delta), width);
}