Skip to content

Commit

Permalink
[ROCm] fixes ambiguous calls to shfl* where there is no explicit type (
Browse files Browse the repository at this point in the history
…#411)

conversion from c10::Half to __half
  • Loading branch information
ashwinma authored Jan 23, 2024
1 parent 140d3ad commit 32caa1c
Showing 1 changed file with 10 additions and 0 deletions.
10 changes: 10 additions & 0 deletions csrc/cuda/utils.cuh
Original file line number Diff line number Diff line change
Expand Up @@ -18,6 +18,16 @@ __device__ __inline__ at::Half __shfl_down_sync(const unsigned mask,
return __shfl_down_sync(mask, var.operator __half(), delta);
}

// at::Half overload of the mask-less __shfl_up.
//
// Converts `var` to the native __half type through at::Half's explicit
// `operator __half()` and forwards it, together with `delta`, to whichever
// __shfl_up overload is selected for a __half argument. The value produced by
// that call is returned as at::Half.
//
// NOTE(review): presumably added so that shuffle calls on at::Half values are
// not ambiguous on ROCm — confirm against the callers.
// NOTE(review): unlike the *_sync wrappers in this header, no participant mask
// is passed here — confirm this is intended for non-ROCm builds.
__device__ __inline__ at::Half __shfl_up(const at::Half var,
                                         const unsigned int delta) {
  // Spell out the conversion operator so the native half type is used.
  const __half native_value = var.operator __half();
  return __shfl_up(native_value, delta);
}

// at::Half overload of the mask-less __shfl_down.
//
// Converts `var` to the native __half type through at::Half's explicit
// `operator __half()` and forwards it, together with `delta`, to whichever
// __shfl_down overload is selected for a __half argument. The value produced
// by that call is returned as at::Half.
//
// NOTE(review): presumably added so that shuffle calls on at::Half values are
// not ambiguous on ROCm — confirm against the callers.
// NOTE(review): unlike the *_sync wrappers in this header, no participant mask
// is passed here — confirm this is intended for non-ROCm builds.
__device__ __inline__ at::Half __shfl_down(const at::Half var,
                                           const unsigned int delta) {
  // Spell out the conversion operator so the native half type is used.
  const __half native_value = var.operator __half();
  return __shfl_down(native_value, delta);
}

#ifdef USE_ROCM
__device__ __inline__ at::Half __ldg(const at::Half* ptr) {
return __ldg(reinterpret_cast<const __half*>(ptr));
Expand Down

0 comments on commit 32caa1c

Please sign in to comment.