Skip to content

Commit 817f87b

Browse files
add __shfl_sync to HIP
1 parent e3b7c57 commit 817f87b

File tree

1 file changed

+1
-0
lines changed
  • ggml/src/ggml-cuda/vendors

1 file changed

+1
-0
lines changed

ggml/src/ggml-cuda/vendors/hip.h

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -25,6 +25,7 @@
2525
// Lets code that spells the CUDA-style name CU_MEM_LOCATION_TYPE_DEVICE
// compile against HIP's hipMemLocationTypeDevice.
#define CU_MEM_LOCATION_TYPE_DEVICE hipMemLocationTypeDevice
2626
// Lets code that spells the CUDA-style name CU_MEM_ACCESS_FLAGS_PROT_READWRITE
// compile against HIP's hipMemAccessFlagsProtReadWrite.
#define CU_MEM_ACCESS_FLAGS_PROT_READWRITE hipMemAccessFlagsProtReadWrite
2727
// Evaluates `fn` exactly once and, if the result is not hipSuccess, aborts via
// GGML_ABORT with the text returned by hipGetErrorString().
// The body is wrapped in do { } while (0) so that `CU_CHECK(x);` is a single
// statement and stays valid inside an unbraced if/else. The local uses a
// macro-private name so that it cannot shadow a caller variable that appears
// inside `fn` (e.g. CU_CHECK(err)).
#define CU_CHECK(fn)                                                              \
    do {                                                                          \
        hipError_t cu_check_err_ = (fn);                                          \
        if (cu_check_err_ != hipSuccess) {                                        \
            GGML_ABORT("HipVMM Failure: %s\n", hipGetErrorString(cu_check_err_)); \
        }                                                                         \
    } while (0)
28+
// CUDA-style __shfl_sync expressed through __shfl. `mask` is discarded because
// the __shfl call this expands to takes no mask argument. The remaining
// arguments (source lane and, optionally, width) are forwarded unchanged, so
// `width` may be omitted and __shfl's own default then applies.
#define __shfl_sync(mask, var, ...) __shfl(var, __VA_ARGS__)
2829
// CUDA-style __shfl_xor_sync expressed through __shfl_xor. `mask` is discarded
// because the __shfl_xor call this expands to takes no mask argument. The
// remaining arguments (lane mask and, optionally, width) are forwarded
// unchanged, so `width` may be omitted and __shfl_xor's own default then applies.
#define __shfl_xor_sync(mask, var, ...) __shfl_xor(var, __VA_ARGS__)
2930
// Maps cublasComputeType_t onto hipblasDatatype_t. That type is deprecated, but
// its replacement hipblasComputeType_t is not available in 5.6
// (presumably the ROCm/hipBLAS 5.6 release — TODO confirm).
#define cublasComputeType_t hipblasDatatype_t
3031
// Alias so that calls spelled cublasCreate resolve to hipblasCreate.
#define cublasCreate hipblasCreate

0 commit comments

Comments
 (0)