================ @@ -162,6 +162,62 @@ __gpu_shuffle_idx_u64(uint64_t __lane_mask, uint32_t __idx, uint64_t __x, ((uint64_t)__gpu_shuffle_idx_u32(__lane_mask, __idx, __lo, __width)); } +// Returns a bitmask marking all lanes that have the same value of __x. +_DEFAULT_FN_ATTRS static __inline__ uint64_t ---------------- jhuber6 wrote:
The typedef would depend on the `__AMDGCN_WAVESIZE` macro, which is being deprecated. But it would work across both NVPTX and AMDGPU, I suppose.

https://github.com/llvm/llvm-project/pull/127504
_______________________________________________
cfe-commits mailing list
cfe-commits@lists.llvm.org
https://lists.llvm.org/cgi-bin/mailman/listinfo/cfe-commits