//
// Copyright (c) 2017 The Khronos Group Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//    http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
//
#ifndef _HOST_ATOMICS_H_
#define _HOST_ATOMICS_H_

#include "harness/testHarness.h"

#ifdef WIN32
#include "Windows.h"
#endif

// flag for test verification (a good test should discover non-atomic functions and fail)
//#define NON_ATOMIC_FUNCTIONS

enum TExplicitMemoryOrderType
{
    MEMORY_ORDER_EMPTY,
    MEMORY_ORDER_RELAXED,
    MEMORY_ORDER_ACQUIRE,
    MEMORY_ORDER_RELEASE,
    MEMORY_ORDER_ACQ_REL,
    MEMORY_ORDER_SEQ_CST
};

// host atomic types (applicable for atomic functions supported on host OS)
#ifdef WIN32
#define HOST_ATOMIC_INT unsigned long
#define HOST_ATOMIC_UINT unsigned long
#define HOST_ATOMIC_LONG unsigned long long
#define HOST_ATOMIC_ULONG unsigned long long
#define HOST_ATOMIC_FLOAT float
#define HOST_ATOMIC_DOUBLE double
#else
#define HOST_ATOMIC_INT cl_int
#define HOST_ATOMIC_UINT cl_uint
#define HOST_ATOMIC_LONG cl_long
#define HOST_ATOMIC_ULONG cl_ulong
#define HOST_ATOMIC_FLOAT cl_float
#define HOST_ATOMIC_DOUBLE cl_double
#endif

#define HOST_ATOMIC_INTPTR_T32 HOST_ATOMIC_INT
#define HOST_ATOMIC_UINTPTR_T32 HOST_ATOMIC_INT
#define HOST_ATOMIC_SIZE_T32 HOST_ATOMIC_UINT
#define HOST_ATOMIC_PTRDIFF_T32 HOST_ATOMIC_INT

#define HOST_ATOMIC_INTPTR_T64 HOST_ATOMIC_LONG
#define HOST_ATOMIC_UINTPTR_T64 HOST_ATOMIC_LONG
#define HOST_ATOMIC_SIZE_T64 HOST_ATOMIC_ULONG
#define HOST_ATOMIC_PTRDIFF_T64 HOST_ATOMIC_LONG

#define HOST_ATOMIC_FLAG HOST_ATOMIC_INT

// host regular types corresponding to atomic types
#define HOST_INT cl_int
#define HOST_UINT cl_uint
#define HOST_LONG cl_long
#define HOST_ULONG cl_ulong
#define HOST_FLOAT cl_float
#define HOST_DOUBLE cl_double

#define HOST_INTPTR_T32 cl_int
#define HOST_UINTPTR_T32 cl_uint
#define HOST_SIZE_T32 cl_uint
#define HOST_PTRDIFF_T32 cl_int

#define HOST_INTPTR_T64 cl_long
#define HOST_UINTPTR_T64 cl_ulong
#define HOST_SIZE_T64 cl_ulong
#define HOST_PTRDIFF_T64 cl_long

#define HOST_FLAG cl_uint

// host atomic functions
void host_atomic_thread_fence(TExplicitMemoryOrderType order);

template <typename AtomicType, typename CorrespondingType>
CorrespondingType host_atomic_fetch_add(volatile AtomicType *a,
                                        CorrespondingType c,
                                        TExplicitMemoryOrderType order)
{
#if defined(_MSC_VER) || (defined(__INTEL_COMPILER) && defined(WIN32))
    return InterlockedExchangeAdd(a, c);
#elif defined(__GNUC__)
    return __sync_fetch_and_add(a, c);
#else
    log_info("Host function not implemented: atomic_fetch_add\n");
    return 0;
#endif
}

template <typename AtomicType, typename CorrespondingType>
CorrespondingType host_atomic_fetch_sub(volatile AtomicType *a,
                                        CorrespondingType c,
                                        TExplicitMemoryOrderType order)
{
#if defined(_MSC_VER) || (defined(__INTEL_COMPILER) && defined(WIN32))
    return InterlockedExchangeSubtract(a, c);
#elif defined(__GNUC__)
    return __sync_fetch_and_sub(a, c);
#else
    log_info("Host function not implemented: atomic_fetch_sub\n");
    return 0;
#endif
}

template <typename AtomicType, typename CorrespondingType>
CorrespondingType host_atomic_exchange(volatile AtomicType *a,
                                       CorrespondingType c,
                                       TExplicitMemoryOrderType order)
{
#if defined(_MSC_VER) || (defined(__INTEL_COMPILER) && defined(WIN32))
    return InterlockedExchange(a, c);
#elif defined(__GNUC__)
    return __sync_lock_test_and_set(a, c);
#else
    log_info("Host function not implemented: atomic_exchange\n");
    return 0;
#endif
}
template <>
HOST_FLOAT host_atomic_exchange(volatile HOST_ATOMIC_FLOAT *a, HOST_FLOAT c,
                                TExplicitMemoryOrderType order);
template <>
HOST_DOUBLE host_atomic_exchange(volatile HOST_ATOMIC_DOUBLE *a, HOST_DOUBLE c,
                                 TExplicitMemoryOrderType order);

template <typename AtomicType, typename CorrespondingType>
bool host_atomic_compare_exchange(volatile AtomicType *a,
                                  CorrespondingType *expected,
                                  CorrespondingType desired,
                                  TExplicitMemoryOrderType order_success,
                                  TExplicitMemoryOrderType order_failure)
{
    CorrespondingType tmp;
#if defined(_MSC_VER) || (defined(__INTEL_COMPILER) && defined(WIN32))
    tmp = InterlockedCompareExchange(a, desired, *expected);
#elif defined(__GNUC__)
    tmp = __sync_val_compare_and_swap(a, *expected, desired);
#else
    log_info("Host function not implemented: atomic_compare_exchange\n");
    tmp = 0;
#endif
    if (tmp == *expected) return true;
    *expected = tmp;
    return false;
}

template <typename AtomicType, typename CorrespondingType>
CorrespondingType host_atomic_load(volatile AtomicType *a,
                                   TExplicitMemoryOrderType order)
{
#if defined(_MSC_VER) || (defined(__INTEL_COMPILER) && defined(WIN32))
    return InterlockedExchangeAdd(a, 0);
#elif defined(__GNUC__)
    return __sync_add_and_fetch(a, 0);
#else
    log_info("Host function not implemented: atomic_load\n");
    return 0;
#endif
}
template <>
HOST_FLOAT host_atomic_load(volatile HOST_ATOMIC_FLOAT *a,
                            TExplicitMemoryOrderType order);
template <>
HOST_DOUBLE host_atomic_load(volatile HOST_ATOMIC_DOUBLE *a,
                             TExplicitMemoryOrderType order);
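
// Illustration (not part of the original header): host_atomic_compare_exchange
// behaves like C11 atomic_compare_exchange_strong - it returns false on
// failure and refreshes *expected with the value actually observed. The
// fetch_or/and/xor/min/max helpers below all rely on this in a CAS retry
// loop. A minimal sketch of that pattern for a hypothetical fetch_mul,
// guarded by an assumed HOST_ATOMICS_USAGE_EXAMPLE macro so it is not
// normally compiled:
#ifdef HOST_ATOMICS_USAGE_EXAMPLE
template <typename AtomicType, typename CorrespondingType>
CorrespondingType host_atomic_fetch_mul_sketch(volatile AtomicType *a,
                                               CorrespondingType c,
                                               TExplicitMemoryOrderType order)
{
    // CorrespondingType appears only in the return type of host_atomic_load,
    // so it cannot be deduced and must be passed explicitly.
    CorrespondingType expected =
        host_atomic_load<AtomicType, CorrespondingType>(a, order);
    CorrespondingType desired;
    // Recompute and retry until no other thread modified *a in between;
    // on failure, compare_exchange has already updated 'expected'.
    do
        desired = expected * c;
    while (!host_atomic_compare_exchange(a, &expected, desired, order, order));
    return expected; // the previous value, as with the other fetch_* helpers
}
#endif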

template <typename AtomicType, typename CorrespondingType>
void host_atomic_store(volatile AtomicType *a, CorrespondingType c,
                       TExplicitMemoryOrderType order)
{
    host_atomic_exchange(a, c, order);
}

template <typename AtomicType, typename CorrespondingType>
void host_atomic_init(volatile AtomicType *a, CorrespondingType c)
{
    host_atomic_exchange(a, c, MEMORY_ORDER_RELAXED);
}

template <typename AtomicType, typename CorrespondingType>
CorrespondingType host_atomic_fetch_or(volatile AtomicType *a,
                                       CorrespondingType c,
                                       TExplicitMemoryOrderType order)
{
    CorrespondingType expected =
        host_atomic_load<AtomicType, CorrespondingType>(a, order);
    CorrespondingType desired;
    do
        desired = expected | c;
    while (!host_atomic_compare_exchange(a, &expected, desired, order, order));
    return expected;
}

template <typename AtomicType, typename CorrespondingType>
CorrespondingType host_atomic_fetch_and(volatile AtomicType *a,
                                        CorrespondingType c,
                                        TExplicitMemoryOrderType order)
{
    CorrespondingType expected =
        host_atomic_load<AtomicType, CorrespondingType>(a, order);
    CorrespondingType desired;
    do
        desired = expected & c;
    while (!host_atomic_compare_exchange(a, &expected, desired, order, order));
    return expected;
}

template <typename AtomicType, typename CorrespondingType>
CorrespondingType host_atomic_fetch_xor(volatile AtomicType *a,
                                        CorrespondingType c,
                                        TExplicitMemoryOrderType order)
{
    CorrespondingType expected =
        host_atomic_load<AtomicType, CorrespondingType>(a, order);
    CorrespondingType desired;
    do
        desired = expected ^ c;
    while (!host_atomic_compare_exchange(a, &expected, desired, order, order));
    return expected;
}

template <typename AtomicType, typename CorrespondingType>
CorrespondingType host_atomic_fetch_min(volatile AtomicType *a,
                                        CorrespondingType c,
                                        TExplicitMemoryOrderType order)
{
    CorrespondingType expected =
        host_atomic_load<AtomicType, CorrespondingType>(a, order);
    CorrespondingType desired;
    do
        desired = expected < c ? expected : c;
    while (!host_atomic_compare_exchange(a, &expected, desired, order, order));
    return expected;
}

template <typename AtomicType, typename CorrespondingType>
CorrespondingType host_atomic_fetch_max(volatile AtomicType *a,
                                        CorrespondingType c,
                                        TExplicitMemoryOrderType order)
{
    CorrespondingType expected =
        host_atomic_load<AtomicType, CorrespondingType>(a, order);
    CorrespondingType desired;
    do
        desired = expected > c ? expected : c;
    while (!host_atomic_compare_exchange(a, &expected, desired, order, order));
    return expected;
}
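
// Illustration (not part of the original header): a minimal sketch of how a
// host-side reference computation can use these helpers to mirror a kernel
// that accumulates with atomic_fetch_add_explicit. The function name and the
// HOST_ATOMICS_USAGE_EXAMPLE guard are hypothetical:
#ifdef HOST_ATOMICS_USAGE_EXAMPLE
inline HOST_UINT host_reference_sum(volatile HOST_ATOMIC_UINT *counter,
                                    const HOST_UINT *values, size_t n)
{
    // Non-atomic initialization, then atomic accumulation and read-back.
    host_atomic_init(counter, (HOST_UINT)0);
    for (size_t i = 0; i < n; i++)
        host_atomic_fetch_add(counter, values[i], MEMORY_ORDER_SEQ_CST);
    return host_atomic_load<HOST_ATOMIC_UINT, HOST_UINT>(counter,
                                                         MEMORY_ORDER_SEQ_CST);
}
#endif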

bool host_atomic_flag_test_and_set(volatile HOST_ATOMIC_FLAG *a,
                                   TExplicitMemoryOrderType order);
void host_atomic_flag_clear(volatile HOST_ATOMIC_FLAG *a,
                            TExplicitMemoryOrderType order);

#endif //_HOST_ATOMICS_H_