@@ -109,9 +109,6 @@ static inline __device__ void atomicAdd( double *address, double val) { AtomicA
109109#elif !defined(__CUDA_ARCH__) && (CUDA_VERSION < 8000)
110110static inline __device__ void atomicAdd ( double *address, double val) {}
111111#endif
112- #ifdef CUDA_HALF_TENSOR
113- static inline __device__ void atomicAdd ( half *address, half val) {}
114- #endif
115112
116113#define OP(X, Y) Y * X
117114ATOMIC_ (Mul)
@@ -123,9 +120,6 @@ static inline __device__ void atomicMul(int32_t *address, int32_t val) { AtomicM
123120static inline __device__ void atomicMul (int64_t *address, int64_t val) { AtomicMulIntegerImpl<int64_t , sizeof (int64_t )>()(address, val); }
124121static inline __device__ void atomicMul ( float *address, float val) { AtomicMulDecimalImpl< float , sizeof ( float )>()(address, val); }
125122static inline __device__ void atomicMul ( double *address, double val) { AtomicMulDecimalImpl< double , sizeof ( double )>()(address, val); }
126- #ifdef CUDA_HALF_TENSOR
127- static inline __device__ void atomicMul ( half *address, half val) {}
128- #endif
129123
130124#define OP(X, Y) Y / X
131125ATOMIC_ (Div)
@@ -137,9 +131,6 @@ static inline __device__ void atomicDiv(int32_t *address, int32_t val) { AtomicD
137131static inline __device__ void atomicDiv (int64_t *address, int64_t val) { AtomicDivIntegerImpl<int64_t , sizeof (int64_t )>()(address, val); }
138132static inline __device__ void atomicDiv ( float *address, float val) { AtomicDivDecimalImpl< float , sizeof ( float )>()(address, val); }
139133static inline __device__ void atomicDiv ( double *address, double val) { AtomicDivDecimalImpl< double , sizeof ( double )>()(address, val); }
140- #ifdef CUDA_HALF_TENSOR
141- static inline __device__ void atomicDiv ( half *address, half val) {}
142- #endif
143134
144135#define OP(X, Y) max(Y, X)
145136ATOMIC_ (Max)
@@ -150,9 +141,6 @@ static inline __device__ void atomicMax(int16_t *address, int16_t val) { AtomicM
150141static inline __device__ void atomicMax (int64_t *address, int64_t val) { AtomicMaxIntegerImpl<int64_t , sizeof (int64_t )>()(address, val); }
151142static inline __device__ void atomicMax ( float *address, float val) { AtomicMaxDecimalImpl< float , sizeof ( float )>()(address, val); }
152143static inline __device__ void atomicMax ( double *address, double val) { AtomicMaxDecimalImpl< double , sizeof ( double )>()(address, val); }
153- #ifdef CUDA_HALF_TENSOR
154- static inline __device__ void atomicMax ( half *address, half val) {}
155- #endif
156144
157145#define OP(X, Y) min(Y, X)
158146ATOMIC_ (Min)
@@ -163,6 +151,3 @@ static inline __device__ void atomicMin(int16_t *address, int16_t val) { AtomicM
163151static inline __device__ void atomicMin (int64_t *address, int64_t val) { AtomicMinIntegerImpl<int64_t , sizeof (int64_t )>()(address, val); }
164152static inline __device__ void atomicMin ( float *address, float val) { AtomicMinDecimalImpl< float , sizeof ( float )>()(address, val); }
165153static inline __device__ void atomicMin ( double *address, double val) { AtomicMinDecimalImpl< double , sizeof ( double )>()(address, val); }
166- #ifdef CUDA_HALF_TENSOR
167- static inline __device__ void atomicMin ( half *address, half val) {}
168- #endif
0 commit comments