mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2026-04-23 00:17:25 +08:00
[Metax] modify wrapSize to WARP_SIZE (#5442)
This commit is contained in:
@@ -18,7 +18,7 @@
|
||||
|
||||
template <typename T>
|
||||
__forceinline__ __device__ T
|
||||
CudaShuffleDownSync(unsigned mask, T val, int delta, int width = warpSize) {
|
||||
CudaShuffleDownSync(unsigned mask, T val, int delta, int width = WARP_SIZE) {
|
||||
return __shfl_down_sync(mask, val, static_cast<unsigned>(delta), width);
|
||||
}
|
||||
|
||||
|
||||
Reference in New Issue
Block a user