//
// Copyright (c) 2017 The Khronos Group Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
//
#ifndef _HOST_ATOMICS_H_
#define _HOST_ATOMICS_H_
#include "harness/testHarness.h"
#ifdef WIN32
#include "Windows.h"
#endif
// Flag for test verification (a good test should detect the non-atomic functions and fail)
//#define NON_ATOMIC_FUNCTIONS
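
// Memory orders mirroring the OpenCL/C11 memory_order values.
// MEMORY_ORDER_EMPTY presumably stands for "no explicit order argument",
// i.e. the implicitly seq_cst form of each built-in.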
enum TExplicitMemoryOrderType
{
    MEMORY_ORDER_EMPTY,
    MEMORY_ORDER_RELAXED,
    MEMORY_ORDER_ACQUIRE,
    MEMORY_ORDER_RELEASE,
    MEMORY_ORDER_ACQ_REL,
    MEMORY_ORDER_SEQ_CST
};
// Host atomic types (chosen to match the atomic functions available on the host OS)
#ifdef WIN32
#define HOST_ATOMIC_INT unsigned long
#define HOST_ATOMIC_UINT unsigned long
#define HOST_ATOMIC_LONG unsigned long long
#define HOST_ATOMIC_ULONG unsigned long long
#define HOST_ATOMIC_FLOAT float
#define HOST_ATOMIC_DOUBLE double
#else
#define HOST_ATOMIC_INT cl_int
#define HOST_ATOMIC_UINT cl_uint
#define HOST_ATOMIC_LONG cl_long
#define HOST_ATOMIC_ULONG cl_ulong
#define HOST_ATOMIC_FLOAT cl_float
#define HOST_ATOMIC_DOUBLE cl_double
#endif
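
// Note: the WIN32 mappings use (unsigned) long / long long, presumably to
// line up with the operand types of the Interlocked* intrinsics used below
// (LONG/ULONG and their 64-bit variants).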
#define HOST_ATOMIC_INTPTR_T32 HOST_ATOMIC_INT
#define HOST_ATOMIC_UINTPTR_T32 HOST_ATOMIC_INT
#define HOST_ATOMIC_SIZE_T32 HOST_ATOMIC_UINT
#define HOST_ATOMIC_PTRDIFF_T32 HOST_ATOMIC_INT
#define HOST_ATOMIC_INTPTR_T64 HOST_ATOMIC_LONG
#define HOST_ATOMIC_UINTPTR_T64 HOST_ATOMIC_LONG
#define HOST_ATOMIC_SIZE_T64 HOST_ATOMIC_ULONG
#define HOST_ATOMIC_PTRDIFF_T64 HOST_ATOMIC_LONG
#define HOST_ATOMIC_FLAG HOST_ATOMIC_INT
// Host regular types corresponding to the atomic types
#define HOST_INT cl_int
#define HOST_UINT cl_uint
#define HOST_LONG cl_long
#define HOST_ULONG cl_ulong
#define HOST_FLOAT cl_float
#define HOST_DOUBLE cl_double
#define HOST_INTPTR_T32 cl_int
#define HOST_UINTPTR_T32 cl_uint
#define HOST_SIZE_T32 cl_uint
#define HOST_PTRDIFF_T32 cl_int
#define HOST_INTPTR_T64 cl_long
#define HOST_UINTPTR_T64 cl_ulong
#define HOST_SIZE_T64 cl_ulong
#define HOST_PTRDIFF_T64 cl_long
#define HOST_FLAG cl_uint
// Host atomic functions
void host_atomic_thread_fence(TExplicitMemoryOrderType order);
template <typename AtomicType, typename CorrespondingType>
CorrespondingType host_atomic_fetch_add(volatile AtomicType *a, CorrespondingType c,
                                        TExplicitMemoryOrderType order)
{
#if defined(_MSC_VER) || (defined(__INTEL_COMPILER) && defined(WIN32))
    return InterlockedExchangeAdd(a, c);
#elif defined(__GNUC__)
    return __sync_fetch_and_add(a, c);
#else
    log_info("Host function not implemented: atomic_fetch_add\n");
    return 0;
#endif
}
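
// Illustrative usage (a sketch, not part of the harness; all names local):
//   HOST_ATOMIC_UINT counter;
//   host_atomic_init(&counter, 0u);
//   HOST_UINT prev = host_atomic_fetch_add(&counter, 1u, MEMORY_ORDER_SEQ_CST);
//   // 'prev' holds the counter value from before the increment.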
template <typename AtomicType, typename CorrespondingType>
CorrespondingType host_atomic_fetch_sub(volatile AtomicType *a, CorrespondingType c,
                                        TExplicitMemoryOrderType order)
{
#if defined(_MSC_VER) || (defined(__INTEL_COMPILER) && defined(WIN32))
    return InterlockedExchangeSubtract(a, c);
#elif defined(__GNUC__)
    return __sync_fetch_and_sub(a, c);
#else
    log_info("Host function not implemented: atomic_fetch_sub\n");
    return 0;
#endif
}
template <typename AtomicType, typename CorrespondingType>
CorrespondingType host_atomic_exchange(volatile AtomicType *a, CorrespondingType c,
                                       TExplicitMemoryOrderType order)
{
#if defined(_MSC_VER) || (defined(__INTEL_COMPILER) && defined(WIN32))
    return InterlockedExchange(a, c);
#elif defined(__GNUC__)
    return __sync_lock_test_and_set(a, c);
#else
    log_info("Host function not implemented: atomic_exchange\n");
    return 0;
#endif
}
template <>
HOST_FLOAT host_atomic_exchange(volatile HOST_ATOMIC_FLOAT *a, HOST_FLOAT c,
                                TExplicitMemoryOrderType order);
template <>
HOST_DOUBLE host_atomic_exchange(volatile HOST_ATOMIC_DOUBLE *a, HOST_DOUBLE c,
                                 TExplicitMemoryOrderType order);
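
// Strong compare-and-swap with C11-style semantics: returns true and stores
// 'desired' if '*a' equals '*expected'; otherwise returns false and writes
// the observed value back into '*expected'. The CAS loops further below rely
// on that write-back to refresh their snapshot on every failed attempt.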
template <typename AtomicType, typename CorrespondingType>
bool host_atomic_compare_exchange(volatile AtomicType *a, CorrespondingType *expected,
                                  CorrespondingType desired,
                                  TExplicitMemoryOrderType order_success,
                                  TExplicitMemoryOrderType order_failure)
{
    CorrespondingType tmp;
#if defined(_MSC_VER) || (defined(__INTEL_COMPILER) && defined(WIN32))
    tmp = InterlockedCompareExchange(a, desired, *expected);
#elif defined(__GNUC__)
    tmp = __sync_val_compare_and_swap(a, *expected, desired);
#else
    log_info("Host function not implemented: atomic_compare_exchange\n");
    tmp = 0;
#endif
    if (tmp == *expected)
        return true;
    *expected = tmp;
    return false;
}
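
// Atomic load emulated as a fetch-add of zero: it returns the current value
// without modifying it. float/double need the specializations declared below.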
template <typename AtomicType, typename CorrespondingType>
CorrespondingType host_atomic_load(volatile AtomicType *a,
                                   TExplicitMemoryOrderType order)
{
#if defined(_MSC_VER) || (defined(__INTEL_COMPILER) && defined(WIN32))
    return InterlockedExchangeAdd(a, 0);
#elif defined(__GNUC__)
    return __sync_add_and_fetch(a, 0);
#else
    log_info("Host function not implemented: atomic_load\n");
    return 0;
#endif
}
template <>
HOST_FLOAT host_atomic_load(volatile HOST_ATOMIC_FLOAT *a,
                            TExplicitMemoryOrderType order);
template <>
HOST_DOUBLE host_atomic_load(volatile HOST_ATOMIC_DOUBLE *a,
                             TExplicitMemoryOrderType order);
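
// Store (and init below) are emulated with an exchange whose result is
// discarded; no dedicated store primitive is used.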
template <typename AtomicType, typename CorrespondingType>
void host_atomic_store(volatile AtomicType *a, CorrespondingType c,
                       TExplicitMemoryOrderType order)
{
    host_atomic_exchange(a, c, order);
}
template <typename AtomicType, typename CorrespondingType>
void host_atomic_init(volatile AtomicType *a, CorrespondingType c)
{
    host_atomic_exchange(a, c, MEMORY_ORDER_RELAXED);
}
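
// The read-modify-write helpers below (or/and/xor/min/max) share a classic
// CAS-loop pattern: snapshot the value, compute the desired result, and retry
// until compare_exchange installs it. 'expected' is refreshed automatically
// on each failed attempt and finally holds the value from before the update.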
template <typename AtomicType, typename CorrespondingType>
CorrespondingType host_atomic_fetch_or(volatile AtomicType *a, CorrespondingType c,
                                       TExplicitMemoryOrderType order)
{
    CorrespondingType expected = host_atomic_load<AtomicType, CorrespondingType>(a, order);
    CorrespondingType desired;
    do
        desired = expected | c;
    while (!host_atomic_compare_exchange(a, &expected, desired, order, order));
    return expected;
}
template <typename AtomicType, typename CorrespondingType>
CorrespondingType host_atomic_fetch_and(volatile AtomicType *a, CorrespondingType c,
                                        TExplicitMemoryOrderType order)
{
    CorrespondingType expected = host_atomic_load<AtomicType, CorrespondingType>(a, order);
    CorrespondingType desired;
    do
        desired = expected & c;
    while (!host_atomic_compare_exchange(a, &expected, desired, order, order));
    return expected;
}
template <typename AtomicType, typename CorrespondingType>
CorrespondingType host_atomic_fetch_xor(volatile AtomicType *a, CorrespondingType c,
                                        TExplicitMemoryOrderType order)
{
    CorrespondingType expected = host_atomic_load<AtomicType, CorrespondingType>(a, order);
    CorrespondingType desired;
    do
        desired = expected ^ c;
    while (!host_atomic_compare_exchange(a, &expected, desired, order, order));
    return expected;
}
template <typename AtomicType, typename CorrespondingType>
CorrespondingType host_atomic_fetch_min(volatile AtomicType *a, CorrespondingType c,
                                        TExplicitMemoryOrderType order)
{
    CorrespondingType expected = host_atomic_load<AtomicType, CorrespondingType>(a, order);
    CorrespondingType desired;
    do
        desired = expected < c ? expected : c;
    while (!host_atomic_compare_exchange(a, &expected, desired, order, order));
    return expected;
}
template <typename AtomicType, typename CorrespondingType>
CorrespondingType host_atomic_fetch_max(volatile AtomicType *a, CorrespondingType c,
                                        TExplicitMemoryOrderType order)
{
    CorrespondingType expected = host_atomic_load<AtomicType, CorrespondingType>(a, order);
    CorrespondingType desired;
    do
        desired = expected > c ? expected : c;
    while (!host_atomic_compare_exchange(a, &expected, desired, order, order));
    return expected;
}
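
// Host analogues of the OpenCL atomic_flag operations, built on an integer
// HOST_ATOMIC_FLAG. test_and_set is assumed to return the previous state,
// matching the OpenCL built-in.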
bool host_atomic_flag_test_and_set(volatile HOST_ATOMIC_FLAG *a, TExplicitMemoryOrderType order);
void host_atomic_flag_clear(volatile HOST_ATOMIC_FLAG *a, TExplicitMemoryOrderType order);
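
// Illustrative spin lock built on the flag operations (a sketch under the
// assumption above; not part of the harness):
//   HOST_ATOMIC_FLAG lock;
//   host_atomic_flag_clear(&lock, MEMORY_ORDER_RELAXED); // start unlocked
//   while (host_atomic_flag_test_and_set(&lock, MEMORY_ORDER_ACQUIRE))
//       ; // spin while the flag was already set
//   /* ...critical section... */
//   host_atomic_flag_clear(&lock, MEMORY_ORDER_RELEASE);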
#endif // _HOST_ATOMICS_H_