181 lines
10 KiB
C++
181 lines
10 KiB
C++
/*
|
|
Copyright 2005-2016 Intel Corporation. All Rights Reserved.
|
|
|
|
This file is part of Threading Building Blocks. Threading Building Blocks is free software;
|
|
you can redistribute it and/or modify it under the terms of the GNU General Public License
|
|
version 2 as published by the Free Software Foundation. Threading Building Blocks is
|
|
distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the
|
|
implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
|
|
See the GNU General Public License for more details. You should have received a copy of
|
|
the GNU General Public License along with Threading Building Blocks; if not, write to the
|
|
Free Software Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
|
|
|
|
As a special exception, you may use this file as part of a free software library without
|
|
restriction. Specifically, if other files instantiate templates or use macros or inline
|
|
functions from this file, or you compile this file and link it with other files to produce
|
|
an executable, this file does not by itself cause the resulting executable to be covered
|
|
by the GNU General Public License. This exception does not however invalidate any other
|
|
reasons why the executable file might be covered by the GNU General Public License.
|
|
*/
|
|
|
|
#if !defined(__TBB_machine_H) || defined(__TBB_machine_linux_ia64_H)
|
|
#error Do not #include this internal file directly; use public TBB headers instead.
|
|
#endif
|
|
|
|
#define __TBB_machine_linux_ia64_H
|
|
|
|
#include <stdint.h>
|
|
#include <ia64intrin.h>
|
|
|
|
#define __TBB_WORDSIZE 8
|
|
#define __TBB_ENDIANNESS __TBB_ENDIAN_LITTLE
|
|
|
|
#if __INTEL_COMPILER
|
|
#define __TBB_compiler_fence()
|
|
#define __TBB_control_consistency_helper() __TBB_compiler_fence()
|
|
#define __TBB_acquire_consistency_helper()
|
|
#define __TBB_release_consistency_helper()
|
|
#define __TBB_full_memory_fence() __mf()
|
|
#else
|
|
#define __TBB_compiler_fence() __asm__ __volatile__("": : :"memory")
|
|
#define __TBB_control_consistency_helper() __TBB_compiler_fence()
|
|
// Even though GCC imbues volatile loads with acquire semantics, it sometimes moves
|
|
// loads over the acquire fence. The following helpers stop such incorrect code motion.
|
|
#define __TBB_acquire_consistency_helper() __TBB_compiler_fence()
|
|
#define __TBB_release_consistency_helper() __TBB_compiler_fence()
|
|
#define __TBB_full_memory_fence() __asm__ __volatile__("mf": : :"memory")
|
|
#endif /* !__INTEL_COMPILER */
|
|
|
|
// Most of the functions will be in a .s file
|
|
// TODO: revise dynamic_link, memory pools and etc. if the library dependency is removed.
|
|
|
|
extern "C" {
|
|
int8_t __TBB_machine_fetchadd1__TBB_full_fence (volatile void *ptr, int8_t addend);
|
|
int8_t __TBB_machine_fetchadd1acquire(volatile void *ptr, int8_t addend);
|
|
int8_t __TBB_machine_fetchadd1release(volatile void *ptr, int8_t addend);
|
|
|
|
int16_t __TBB_machine_fetchadd2__TBB_full_fence (volatile void *ptr, int16_t addend);
|
|
int16_t __TBB_machine_fetchadd2acquire(volatile void *ptr, int16_t addend);
|
|
int16_t __TBB_machine_fetchadd2release(volatile void *ptr, int16_t addend);
|
|
|
|
int32_t __TBB_machine_fetchadd4__TBB_full_fence (volatile void *ptr, int32_t value);
|
|
int32_t __TBB_machine_fetchadd4acquire(volatile void *ptr, int32_t addend);
|
|
int32_t __TBB_machine_fetchadd4release(volatile void *ptr, int32_t addend);
|
|
|
|
int64_t __TBB_machine_fetchadd8__TBB_full_fence (volatile void *ptr, int64_t value);
|
|
int64_t __TBB_machine_fetchadd8acquire(volatile void *ptr, int64_t addend);
|
|
int64_t __TBB_machine_fetchadd8release(volatile void *ptr, int64_t addend);
|
|
|
|
int8_t __TBB_machine_fetchstore1__TBB_full_fence (volatile void *ptr, int8_t value);
|
|
int8_t __TBB_machine_fetchstore1acquire(volatile void *ptr, int8_t value);
|
|
int8_t __TBB_machine_fetchstore1release(volatile void *ptr, int8_t value);
|
|
|
|
int16_t __TBB_machine_fetchstore2__TBB_full_fence (volatile void *ptr, int16_t value);
|
|
int16_t __TBB_machine_fetchstore2acquire(volatile void *ptr, int16_t value);
|
|
int16_t __TBB_machine_fetchstore2release(volatile void *ptr, int16_t value);
|
|
|
|
int32_t __TBB_machine_fetchstore4__TBB_full_fence (volatile void *ptr, int32_t value);
|
|
int32_t __TBB_machine_fetchstore4acquire(volatile void *ptr, int32_t value);
|
|
int32_t __TBB_machine_fetchstore4release(volatile void *ptr, int32_t value);
|
|
|
|
int64_t __TBB_machine_fetchstore8__TBB_full_fence (volatile void *ptr, int64_t value);
|
|
int64_t __TBB_machine_fetchstore8acquire(volatile void *ptr, int64_t value);
|
|
int64_t __TBB_machine_fetchstore8release(volatile void *ptr, int64_t value);
|
|
|
|
int8_t __TBB_machine_cmpswp1__TBB_full_fence (volatile void *ptr, int8_t value, int8_t comparand);
|
|
int8_t __TBB_machine_cmpswp1acquire(volatile void *ptr, int8_t value, int8_t comparand);
|
|
int8_t __TBB_machine_cmpswp1release(volatile void *ptr, int8_t value, int8_t comparand);
|
|
|
|
int16_t __TBB_machine_cmpswp2__TBB_full_fence (volatile void *ptr, int16_t value, int16_t comparand);
|
|
int16_t __TBB_machine_cmpswp2acquire(volatile void *ptr, int16_t value, int16_t comparand);
|
|
int16_t __TBB_machine_cmpswp2release(volatile void *ptr, int16_t value, int16_t comparand);
|
|
|
|
int32_t __TBB_machine_cmpswp4__TBB_full_fence (volatile void *ptr, int32_t value, int32_t comparand);
|
|
int32_t __TBB_machine_cmpswp4acquire(volatile void *ptr, int32_t value, int32_t comparand);
|
|
int32_t __TBB_machine_cmpswp4release(volatile void *ptr, int32_t value, int32_t comparand);
|
|
|
|
int64_t __TBB_machine_cmpswp8__TBB_full_fence (volatile void *ptr, int64_t value, int64_t comparand);
|
|
int64_t __TBB_machine_cmpswp8acquire(volatile void *ptr, int64_t value, int64_t comparand);
|
|
int64_t __TBB_machine_cmpswp8release(volatile void *ptr, int64_t value, int64_t comparand);
|
|
|
|
int64_t __TBB_machine_lg(uint64_t value);
|
|
void __TBB_machine_pause(int32_t delay);
|
|
bool __TBB_machine_trylockbyte( volatile unsigned char &ptr );
|
|
int64_t __TBB_machine_lockbyte( volatile unsigned char &ptr );
|
|
|
|
//! Retrieves the current RSE backing store pointer. IA64 specific.
|
|
void* __TBB_get_bsp();
|
|
|
|
int32_t __TBB_machine_load1_relaxed(const void *ptr);
|
|
int32_t __TBB_machine_load2_relaxed(const void *ptr);
|
|
int32_t __TBB_machine_load4_relaxed(const void *ptr);
|
|
int64_t __TBB_machine_load8_relaxed(const void *ptr);
|
|
|
|
void __TBB_machine_store1_relaxed(void *ptr, int32_t value);
|
|
void __TBB_machine_store2_relaxed(void *ptr, int32_t value);
|
|
void __TBB_machine_store4_relaxed(void *ptr, int32_t value);
|
|
void __TBB_machine_store8_relaxed(void *ptr, int64_t value);
|
|
} // extern "C"
|
|
|
|
// Mapping old entry points to the names corresponding to the new full_fence identifier.
|
|
#define __TBB_machine_fetchadd1full_fence __TBB_machine_fetchadd1__TBB_full_fence
|
|
#define __TBB_machine_fetchadd2full_fence __TBB_machine_fetchadd2__TBB_full_fence
|
|
#define __TBB_machine_fetchadd4full_fence __TBB_machine_fetchadd4__TBB_full_fence
|
|
#define __TBB_machine_fetchadd8full_fence __TBB_machine_fetchadd8__TBB_full_fence
|
|
#define __TBB_machine_fetchstore1full_fence __TBB_machine_fetchstore1__TBB_full_fence
|
|
#define __TBB_machine_fetchstore2full_fence __TBB_machine_fetchstore2__TBB_full_fence
|
|
#define __TBB_machine_fetchstore4full_fence __TBB_machine_fetchstore4__TBB_full_fence
|
|
#define __TBB_machine_fetchstore8full_fence __TBB_machine_fetchstore8__TBB_full_fence
|
|
#define __TBB_machine_cmpswp1full_fence __TBB_machine_cmpswp1__TBB_full_fence
|
|
#define __TBB_machine_cmpswp2full_fence __TBB_machine_cmpswp2__TBB_full_fence
|
|
#define __TBB_machine_cmpswp4full_fence __TBB_machine_cmpswp4__TBB_full_fence
|
|
#define __TBB_machine_cmpswp8full_fence __TBB_machine_cmpswp8__TBB_full_fence
|
|
|
|
// Mapping relaxed operations to the entry points implementing them.
|
|
/** On IA64 RMW operations implicitly have acquire semantics. Thus one cannot
|
|
actually have completely relaxed RMW operation here. **/
|
|
#define __TBB_machine_fetchadd1relaxed __TBB_machine_fetchadd1acquire
|
|
#define __TBB_machine_fetchadd2relaxed __TBB_machine_fetchadd2acquire
|
|
#define __TBB_machine_fetchadd4relaxed __TBB_machine_fetchadd4acquire
|
|
#define __TBB_machine_fetchadd8relaxed __TBB_machine_fetchadd8acquire
|
|
#define __TBB_machine_fetchstore1relaxed __TBB_machine_fetchstore1acquire
|
|
#define __TBB_machine_fetchstore2relaxed __TBB_machine_fetchstore2acquire
|
|
#define __TBB_machine_fetchstore4relaxed __TBB_machine_fetchstore4acquire
|
|
#define __TBB_machine_fetchstore8relaxed __TBB_machine_fetchstore8acquire
|
|
#define __TBB_machine_cmpswp1relaxed __TBB_machine_cmpswp1acquire
|
|
#define __TBB_machine_cmpswp2relaxed __TBB_machine_cmpswp2acquire
|
|
#define __TBB_machine_cmpswp4relaxed __TBB_machine_cmpswp4acquire
|
|
#define __TBB_machine_cmpswp8relaxed __TBB_machine_cmpswp8acquire
|
|
|
|
#define __TBB_MACHINE_DEFINE_ATOMICS(S,V) \
|
|
template <typename T> \
|
|
struct machine_load_store_relaxed<T,S> { \
|
|
static inline T load ( const T& location ) { \
|
|
return (T)__TBB_machine_load##S##_relaxed(&location); \
|
|
} \
|
|
static inline void store ( T& location, T value ) { \
|
|
__TBB_machine_store##S##_relaxed(&location, (V)value); \
|
|
} \
|
|
}
|
|
|
|
namespace tbb {
|
|
namespace internal {
|
|
__TBB_MACHINE_DEFINE_ATOMICS(1,int8_t);
|
|
__TBB_MACHINE_DEFINE_ATOMICS(2,int16_t);
|
|
__TBB_MACHINE_DEFINE_ATOMICS(4,int32_t);
|
|
__TBB_MACHINE_DEFINE_ATOMICS(8,int64_t);
|
|
}} // namespaces internal, tbb
|
|
|
|
#undef __TBB_MACHINE_DEFINE_ATOMICS
|
|
|
|
#define __TBB_USE_FENCED_ATOMICS 1
|
|
#define __TBB_USE_GENERIC_HALF_FENCED_LOAD_STORE 1
|
|
#define __TBB_USE_GENERIC_SEQUENTIAL_CONSISTENCY_LOAD_STORE 1
|
|
|
|
// Definition of Lock functions
|
|
#define __TBB_TryLockByte(P) __TBB_machine_trylockbyte(P)
|
|
#define __TBB_LockByte(P) __TBB_machine_lockbyte(P)
|
|
|
|
// Definition of other utility functions
|
|
#define __TBB_Pause(V) __TBB_machine_pause(V)
|
|
#define __TBB_Log2(V) __TBB_machine_lg(V)
|