cuda : uint -> uint32_t
This commit is contained in:
parent
f725ca90fb
commit
5408d55506
2 changed files with 9 additions and 9 deletions
|
@ -307,9 +307,9 @@ static __device__ __forceinline__ half2 warp_reduce_max(half2 x) {
|
|||
}
|
||||
|
||||
#if CUDART_VERSION < 12000
|
||||
static __device__ __forceinline__ uint __hgt2_mask(const half2 a, const half2 b) {
|
||||
const uint mask_low = 0x0000FFFF * ( __low2half(a) > __low2half(b));
|
||||
const uint mask_high = 0xFFFF0000 * (__high2half(a) > __high2half(b));
|
||||
static __device__ __forceinline__ uint32_t __hgt2_mask(const half2 a, const half2 b) {
|
||||
const uint32_t mask_low = 0x0000FFFF * ( __low2half(a) > __low2half(b));
|
||||
const uint32_t mask_high = 0xFFFF0000 * (__high2half(a) > __high2half(b));
|
||||
return mask_low | mask_high;
|
||||
}
|
||||
#endif // CUDART_VERSION < 12000
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue