From 3f93e656ea6be6f9a8816fa696ba7c435343fc2e Mon Sep 17 00:00:00 2001 From: Hieu Hoang Date: Tue, 15 Aug 2023 12:55:24 -0700 Subject: [PATCH] don't include nppdefs.h. Problematic on some machines (#1004) Co-authored-by: Hieu Hoang --- src/tensors/gpu/tensor_operators.cu | 6 ++---- 1 file changed, 2 insertions(+), 4 deletions(-) diff --git a/src/tensors/gpu/tensor_operators.cu b/src/tensors/gpu/tensor_operators.cu index 5f8c4c122..6dbded2a4 100644 --- a/src/tensors/gpu/tensor_operators.cu +++ b/src/tensors/gpu/tensor_operators.cu @@ -1,7 +1,5 @@ -# if defined(_MSC_VER) +# if !defined(NPP_MAX_32U) #define NPP_MAX_32U ( 4294967295U ) /**< Maximum 32-bit unsigned integer */ -#else -#include <nppdefs.h> #endif #include "common/types.h" @@ -3548,7 +3546,7 @@ __global__ void HammmingAndSort(const uint32_t *weightHash, if (outIdx != NPP_MAX_32U) { uint32_t prevOutIdx; // Not supported in Maxwells or older -// Not supported in Maxwells or older +// Not supported in Maxwells or older #if __CUDA_ARCH__ >= 600 prevOutIdx = atomicAdd_block(&outIdx, (uint32_t) -1); #else