Commit b1fec976 authored by sxtyzhangzk, committed by Zhekai Zhang
Browse files

[major] fix build on windows

parent 3969b561
...@@ -60,7 +60,7 @@ static void store(T *addr, T val) { ...@@ -60,7 +60,7 @@ static void store(T *addr, T val) {
} }
if constexpr (sizeof(T) == 4) { if constexpr (sizeof(T) == 4) {
__stcg(reinterpret_cast<uint *>(addr), *reinterpret_cast<uint *>(&val)); __stcg(reinterpret_cast<unsigned int *>(addr), *reinterpret_cast<unsigned int *>(&val));
return; return;
} }
if constexpr (sizeof(T) == 8) { if constexpr (sizeof(T) == 8) {
......
...@@ -7,7 +7,12 @@ ...@@ -7,7 +7,12 @@
#include "dispatch_utils.h" #include "dispatch_utils.h"
#pragma nv_diag_suppress 177 #pragma nv_diag_suppress 177
#ifdef _MSC_VER
#define ALWAYSINLINE [[msvc::forceinline]]
#else
#define ALWAYSINLINE __attribute__((always_inline)) #define ALWAYSINLINE __attribute__((always_inline))
#endif
// #define ENABLE_NAN_CHECK 1 // #define ENABLE_NAN_CHECK 1
#if ENABLE_NAN_CHECK #if ENABLE_NAN_CHECK
...@@ -196,12 +201,12 @@ public: ...@@ -196,12 +201,12 @@ public:
: :
"=f"(psum.data[0]), "=f"(psum.data[1]), "=f"(psum.data[2]), "=f"(psum.data[3]) "=f"(psum.data[0]), "=f"(psum.data[1]), "=f"(psum.data[2]), "=f"(psum.data[3])
: :
"r"(*reinterpret_cast<uint *>(&a.data[0])), "r"(*reinterpret_cast<unsigned int *>(&a.data[0])),
"r"(*reinterpret_cast<uint *>(&a.data[1])), "r"(*reinterpret_cast<unsigned int *>(&a.data[1])),
"r"(*reinterpret_cast<uint *>(&a.data[2])), "r"(*reinterpret_cast<unsigned int *>(&a.data[2])),
"r"(*reinterpret_cast<uint *>(&a.data[3])), "r"(*reinterpret_cast<unsigned int *>(&a.data[3])),
"r"(*reinterpret_cast<uint *>(&b.data[0])), "r"(*reinterpret_cast<unsigned int *>(&b.data[0])),
"r"(*reinterpret_cast<uint *>(&b.data[1])), "r"(*reinterpret_cast<unsigned int *>(&b.data[1])),
// "r"(0), "r"(0), "r"(0), "r"(0) // "r"(0), "r"(0), "r"(0), "r"(0)
"f"(psum.data[0]), "f"(psum.data[1]), "f"(psum.data[2]), "f"(psum.data[3]) "f"(psum.data[0]), "f"(psum.data[1]), "f"(psum.data[2]), "f"(psum.data[3])
...@@ -215,12 +220,12 @@ public: ...@@ -215,12 +220,12 @@ public:
: :
"=f"(psum.data[4]), "=f"(psum.data[5]), "=f"(psum.data[6]), "=f"(psum.data[7]) "=f"(psum.data[4]), "=f"(psum.data[5]), "=f"(psum.data[6]), "=f"(psum.data[7])
: :
"r"(*reinterpret_cast<uint *>(&a.data[0])), "r"(*reinterpret_cast<unsigned int *>(&a.data[0])),
"r"(*reinterpret_cast<uint *>(&a.data[1])), "r"(*reinterpret_cast<unsigned int *>(&a.data[1])),
"r"(*reinterpret_cast<uint *>(&a.data[2])), "r"(*reinterpret_cast<unsigned int *>(&a.data[2])),
"r"(*reinterpret_cast<uint *>(&a.data[3])), "r"(*reinterpret_cast<unsigned int *>(&a.data[3])),
"r"(*reinterpret_cast<uint *>(&b.data[2])), "r"(*reinterpret_cast<unsigned int *>(&b.data[2])),
"r"(*reinterpret_cast<uint *>(&b.data[3])), "r"(*reinterpret_cast<unsigned int *>(&b.data[3])),
// "r"(0), "r"(0), "r"(0), "r"(0) // "r"(0), "r"(0), "r"(0), "r"(0)
"f"(psum.data[4]), "f"(psum.data[5]), "f"(psum.data[6]), "f"(psum.data[7]) "f"(psum.data[4]), "f"(psum.data[5]), "f"(psum.data[6]), "f"(psum.data[7])
); );
...@@ -236,12 +241,12 @@ public: ...@@ -236,12 +241,12 @@ public:
: :
"=f"(psum.data[0]), "=f"(psum.data[1]), "=f"(psum.data[2]), "=f"(psum.data[3]) "=f"(psum.data[0]), "=f"(psum.data[1]), "=f"(psum.data[2]), "=f"(psum.data[3])
: :
"r"(*reinterpret_cast<uint *>(&a.data[0])), "r"(*reinterpret_cast<unsigned int *>(&a.data[0])),
"r"(*reinterpret_cast<uint *>(&a.data[1])), "r"(*reinterpret_cast<unsigned int *>(&a.data[1])),
"r"(*reinterpret_cast<uint *>(&a.data[2])), "r"(*reinterpret_cast<unsigned int *>(&a.data[2])),
"r"(*reinterpret_cast<uint *>(&a.data[3])), "r"(*reinterpret_cast<unsigned int *>(&a.data[3])),
"r"(*reinterpret_cast<uint *>(&b.data[0])), "r"(*reinterpret_cast<unsigned int *>(&b.data[0])),
"r"(*reinterpret_cast<uint *>(&b.data[1])), "r"(*reinterpret_cast<unsigned int *>(&b.data[1])),
// "r"(0), "r"(0), "r"(0), "r"(0) // "r"(0), "r"(0), "r"(0), "r"(0)
"f"(psum.data[0]), "f"(psum.data[1]), "f"(psum.data[2]), "f"(psum.data[3]) "f"(psum.data[0]), "f"(psum.data[1]), "f"(psum.data[2]), "f"(psum.data[3])
...@@ -255,12 +260,12 @@ public: ...@@ -255,12 +260,12 @@ public:
: :
"=f"(psum.data[4]), "=f"(psum.data[5]), "=f"(psum.data[6]), "=f"(psum.data[7]) "=f"(psum.data[4]), "=f"(psum.data[5]), "=f"(psum.data[6]), "=f"(psum.data[7])
: :
"r"(*reinterpret_cast<uint *>(&a.data[0])), "r"(*reinterpret_cast<unsigned int *>(&a.data[0])),
"r"(*reinterpret_cast<uint *>(&a.data[1])), "r"(*reinterpret_cast<unsigned int *>(&a.data[1])),
"r"(*reinterpret_cast<uint *>(&a.data[2])), "r"(*reinterpret_cast<unsigned int *>(&a.data[2])),
"r"(*reinterpret_cast<uint *>(&a.data[3])), "r"(*reinterpret_cast<unsigned int *>(&a.data[3])),
"r"(*reinterpret_cast<uint *>(&b.data[2])), "r"(*reinterpret_cast<unsigned int *>(&b.data[2])),
"r"(*reinterpret_cast<uint *>(&b.data[3])), "r"(*reinterpret_cast<unsigned int *>(&b.data[3])),
// "r"(0), "r"(0), "r"(0), "r"(0) // "r"(0), "r"(0), "r"(0), "r"(0)
"f"(psum.data[4]), "f"(psum.data[5]), "f"(psum.data[6]), "f"(psum.data[7]) "f"(psum.data[4]), "f"(psum.data[5]), "f"(psum.data[6]), "f"(psum.data[7])
); );
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment