diff --git a/libnd4j/include/templatemath.h b/libnd4j/include/templatemath.h index 68b59f2d4..908323369 100644 --- a/libnd4j/include/templatemath.h +++ b/libnd4j/include/templatemath.h @@ -1057,7 +1057,7 @@ inline __device__ uint64_t nd4j_atomicAdd(uint64_t* address, uint64_t template <> inline __device__ float16 nd4j_atomicAdd(float16* address, float16 val) { -#if __CUDA_ARCH__ >= 700 +#if __CUDA_ARCH__ >= 700 && defined(CUDA_10) atomicAdd(reinterpret_cast<__half*>(address), val.data); #else auto address_as_ull = (int*) address;