From 1e876bb96cf746108e883db249e47939f5d9b47e Mon Sep 17 00:00:00 2001 From: Wesley Maxey Date: Wed, 18 Nov 2020 17:20:12 -0800 Subject: [PATCH] Add store intrinsics for older MSVC --- libcxx/include/__config | 2 +- libcxx/include/support/win32/atomic_msvc.h | 61 +++++++++++++++------- 2 files changed, 42 insertions(+), 21 deletions(-) diff --git a/libcxx/include/__config b/libcxx/include/__config index c96fe80ed8..575ea2429a 100644 --- a/libcxx/include/__config +++ b/libcxx/include/__config @@ -860,7 +860,7 @@ typedef __char32_t char32_t; // MSVC exposed __iso_volatile intrinsics beginning on 1924 for x86 #if _MSC_VER < 1924 - #define _LIBCUDACXX_HAS_NO_ISO_INTRIN + #define _LIBCUDACXX_MSVC_HAS_NO_ISO_INTRIN #endif #define _LIBCUDACXX_UNDERLYING_TYPE(...) __underlying_type(__VA_ARGS__) diff --git a/libcxx/include/support/win32/atomic_msvc.h b/libcxx/include/support/win32/atomic_msvc.h index 73a12d1f40..7b44a98b94 100644 --- a/libcxx/include/support/win32/atomic_msvc.h +++ b/libcxx/include/support/win32/atomic_msvc.h @@ -46,7 +46,7 @@ namespace detail { template = 0> void __atomic_load_relaxed(const volatile _Type *__ptr, _Type *__ret) { -#ifdef _LIBCUDACXX_HAS_NO_ISO_INTRIN +#ifdef _LIBCUDACXX_MSVC_HAS_NO_ISO_INTRIN __int8 __tmp = *(const volatile __int8 *)__ptr; #else __int8 __tmp = __iso_volatile_load8((const volatile __int8 *)__ptr); @@ -55,8 +55,8 @@ void __atomic_load_relaxed(const volatile _Type *__ptr, _Type *__ret) { } template = 0> void __atomic_load_relaxed(const volatile _Type *__ptr, _Type *__ret) { -#ifdef _LIBCUDACXX_HAS_NO_ISO_INTRIN - __int16 __tmp = *(const volatile __int8 *)__ptr; +#ifdef _LIBCUDACXX_MSVC_HAS_NO_ISO_INTRIN + __int16 __tmp = *(const volatile __int16 *)__ptr; #else __int16 __tmp = __iso_volatile_load16((const volatile __int16 *)__ptr); #endif @@ -64,8 +64,8 @@ void __atomic_load_relaxed(const volatile _Type *__ptr, _Type *__ret) { } template = 0> void __atomic_load_relaxed(const volatile _Type *__ptr, _Type *__ret) { -#ifdef _LIBCUDACXX_HAS_NO_ISO_INTRIN - __int32 __tmp = *(const volatile __int8 *)__ptr; +#ifdef _LIBCUDACXX_MSVC_HAS_NO_ISO_INTRIN + __int32 __tmp = *(const volatile __int32 *)__ptr; #else __int32 __tmp = __iso_volatile_load32((const volatile __int32 *)__ptr); #endif @@ -73,8 +73,8 @@ void __atomic_load_relaxed(const volatile _Type *__ptr, _Type *__ret) { } template = 0> void __atomic_load_relaxed(const volatile _Type *__ptr, _Type *__ret) { -#ifdef _LIBCUDACXX_HAS_NO_ISO_INTRIN - __int64 __tmp = *(const volatile __int8 *)__ptr; +#ifdef _LIBCUDACXX_MSVC_HAS_NO_ISO_INTRIN + __int64 __tmp = *(const volatile __int64 *)__ptr; #else __int64 __tmp = __iso_volatile_load64((const volatile __int64 *)__ptr); #endif @@ -92,27 +92,48 @@ void __atomic_load(const volatile _Type *__ptr, _Type *__ret, int __memorder) { } } - template = 0> -void __atomic_store_relaxed(const volatile _Type *__ptr, _Type *__val) { - __int8 __tmp = reinterpret_cast<__int8&>(*__val); - __iso_volatile_store8((volatile __int8 *)__ptr, __tmp); +void __atomic_store_relaxed(volatile _Type *__ptr, _Type *__val) { + auto __t = reinterpret_cast<__int8 *>(__val); + auto __d = reinterpret_cast(__ptr); +#ifdef _LIBCUDACXX_MSVC_HAS_NO_ISO_INTRIN + (void)_InterlockedExchange8(__d, *__t); +#else + __iso_volatile_store8(__d, __t); +#endif } template = 0> -void __atomic_store_relaxed(const volatile _Type *__ptr, _Type *__val) { - __int16 __tmp = reinterpret_cast<__int16&>(*__val); - __iso_volatile_store16((volatile __int16 *)__ptr, __tmp); +void __atomic_store_relaxed(volatile _Type *__ptr, _Type *__val) { + auto __t = reinterpret_cast<__int16 *>(__val); + auto __d = reinterpret_cast(__ptr); +#ifdef _LIBCUDACXX_MSVC_HAS_NO_ISO_INTRIN + (void)_InterlockedExchange16(__d, *__t); +#else + __iso_volatile_store16(__d, __t); +#endif } template = 0> -void __atomic_store_relaxed(const volatile _Type *__ptr, _Type *__val) { - __int32 __tmp = reinterpret_cast<__int32&>(*__val); - __iso_volatile_store32((volatile __int32 *)__ptr, __tmp); +void __atomic_store_relaxed(volatile _Type *__ptr, _Type *__val) { + auto __t = reinterpret_cast<__int32 *>(__val); + auto __d = reinterpret_cast(__ptr); +#ifdef _LIBCUDACXX_MSVC_HAS_NO_ISO_INTRIN + // int cannot be converted to long?... + (void)_InterlockedExchange(reinterpret_cast(__d), *__t); +#else + __iso_volatile_store32(__d, __t); +#endif } template = 0> -void __atomic_store_relaxed(const volatile _Type *__ptr, _Type *__val) { - __int64 __tmp = reinterpret_cast<__int64&>(*__val); - __iso_volatile_store64((volatile __int64 *)__ptr, __tmp); +void __atomic_store_relaxed(volatile _Type *__ptr, _Type *__val) { + auto __t = reinterpret_cast<__int64 *>(__val); + auto __d = reinterpret_cast(__ptr); +#ifdef _LIBCUDACXX_MSVC_HAS_NO_ISO_INTRIN + (void)_InterlockedExchange64(__d, *__t); +#else + __iso_volatile_store64(__d, __t); +#endif } + template void __atomic_store(volatile _Type *__ptr, _Type *__val, int __memorder) { switch (__memorder) {