aboutsummaryrefslogtreecommitdiff
path: root/libomptarget/deviceRTLs
diff options
context:
space:
mode:
author: Alexey Bataev <a.bataev@hotmail.com>, 2018-12-10 16:50:36 +0000
committer: Alexey Bataev <a.bataev@hotmail.com>, 2018-12-10 16:50:36 +0000
commit: e90d5a507452b782029b2cacce364785c3af9fdd (patch)
tree: 5caf928910a681784a6df21c7cb074ad6460684d /libomptarget/deviceRTLs
parent: a23f780b1ae886c793d74375c10dab887a30d9eb (diff)
[OPENMP][NVPTX]Revert __kmpc_shuffle_int64 to its original form.
Summary:
Use the original shuffle implementation for __kmpc_shuffle_int64, since the default implementation does the same thing.

Reviewers: gtbercea

Subscribers: guansong, caomhin, openmp-commits

Differential Revision: https://reviews.llvm.org/D55514

git-svn-id: https://llvm.org/svn/llvm-project/openmp/trunk@348772 91177308-0d34-0410-b5e6-96231b3b80d8
Diffstat (limited to 'libomptarget/deviceRTLs')
-rw-r--r-- libomptarget/deviceRTLs/nvptx/src/reduction.cu | 5
1 files changed, 0 insertions, 5 deletions
diff --git a/libomptarget/deviceRTLs/nvptx/src/reduction.cu b/libomptarget/deviceRTLs/nvptx/src/reduction.cu
index 2546302..c0d22df 100644
--- a/libomptarget/deviceRTLs/nvptx/src/reduction.cu
+++ b/libomptarget/deviceRTLs/nvptx/src/reduction.cu
@@ -76,17 +76,12 @@ EXTERN int32_t __kmpc_shuffle_int32(int32_t val, int16_t delta, int16_t size) {
}
EXTERN int64_t __kmpc_shuffle_int64(int64_t val, int16_t delta, int16_t size) {
-#if defined(CUDART_VERSION) && CUDART_VERSION >= 9000
- return __SHFL_DOWN_SYNC(0xFFFFFFFFFFFFFFFFLL, (long long)val, (unsigned)delta,
- (int)size);
-#else
int lo, hi;
asm volatile("mov.b64 {%0,%1}, %2;" : "=r"(lo), "=r"(hi) : "l"(val));
hi = __SHFL_DOWN_SYNC(0xFFFFFFFF, hi, delta, size);
lo = __SHFL_DOWN_SYNC(0xFFFFFFFF, lo, delta, size);
asm volatile("mov.b64 %0, {%1,%2};" : "=l"(val) : "r"(lo), "r"(hi));
return val;
-#endif
}
static INLINE void gpu_regular_warp_reduce(void *reduce_data,