Skip to content

Commit

Permalink
SWDEV-432785 - Remove the mapping of __shfl* to __shfl*_sync functions on CUDA
Browse files Browse the repository at this point in the history

Change-Id: I93d2ce360b834b3da01731cabc22841f7d0a092d
  • Loading branch information
Vladana Stojiljkovic authored and rakesroy committed Oct 8, 2024
1 parent ddc41f2 commit ed5b3fb
Showing 1 changed file with 0 additions and 7 deletions.
7 changes: 0 additions & 7 deletions hipnv/include/hip/nvidia_detail/nvidia_hip_runtime_api.h
Original file line number Diff line number Diff line change
Expand Up @@ -760,13 +760,6 @@ typedef enum cudaGraphInstantiateFlags hipGraphInstantiateFlags;
#define hipGraphInstantiateFlagDeviceLaunch cudaGraphInstantiateFlagDeviceLaunch
#define hipGraphInstantiateFlagUseNodePriority cudaGraphInstantiateFlagUseNodePriority

#if CUDA_VERSION >= CUDA_9000
#define __shfl(...) __shfl_sync(0xffffffff, __VA_ARGS__)
#define __shfl_up(...) __shfl_up_sync(0xffffffff, __VA_ARGS__)
#define __shfl_down(...) __shfl_down_sync(0xffffffff, __VA_ARGS__)
#define __shfl_xor(...) __shfl_xor_sync(0xffffffff, __VA_ARGS__)
#endif // CUDA_VERSION >= CUDA_9000

inline static hipError_t hipCUDAErrorTohipError(cudaError_t cuError) {
switch (cuError) {
case cudaSuccess:
Expand Down

0 comments on commit ed5b3fb

Please sign in to comment.