Static arch and uatomic headers
[urcu.git] / include / urcu / arch / x86.h
CommitLineData
ec4e58a3
MD
1#ifndef _URCU_ARCH_X86_H
2#define _URCU_ARCH_X86_H
121a5d44 3
6d0ce021 4/*
af02d47e 5 * arch_x86.h: trivial definitions for the x86 architecture.
6d0ce021 6 *
af02d47e 7 * Copyright (c) 2009 Paul E. McKenney, IBM Corporation.
6982d6d7 8 * Copyright (c) 2009 Mathieu Desnoyers <mathieu.desnoyers@efficios.com>
6d0ce021 9 *
af02d47e
MD
10 * This library is free software; you can redistribute it and/or
11 * modify it under the terms of the GNU Lesser General Public
12 * License as published by the Free Software Foundation; either
13 * version 2.1 of the License, or (at your option) any later version.
05dd4b94 14 *
af02d47e 15 * This library is distributed in the hope that it will be useful,
6d0ce021 16 * but WITHOUT ANY WARRANTY; without even the implied warranty of
af02d47e
MD
17 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
18 * Lesser General Public License for more details.
6d0ce021 19 *
af02d47e
MD
20 * You should have received a copy of the GNU Lesser General Public
21 * License along with this library; if not, write to the Free Software
22 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
6d0ce021
PM
23 */
24
ec4e58a3 25#include <urcu/compiler.h>
c96a3726 26#include <urcu/config.h>
999991c6 27#include <urcu/syscall-compat.h>
3fa18286 28#include <stdint.h>
121a5d44 29
36bc70a8
MD
30#ifdef __cplusplus
31extern "C" {
67ecffc0 32#endif
36bc70a8 33
06f22bdb 34#define CAA_CACHE_LINE_SIZE 128
b4e52e3e 35
0b1e236d
MJ
36/*
37 * For now, using lock; addl compatibility mode even for i686, because the
38 * Pentium III is seen as a i686, but lacks mfence instruction. Only using
39 * fence for x86_64.
40 *
41 * k1om (__MIC__) is the name for the Intel MIC family (Xeon Phi). It is an
42 * x86_64 variant but lacks fence instructions.
43 */
44#if (defined(URCU_ARCH_AMD64) && !defined(URCU_ARCH_K1OM))
45
46/* For backwards compat */
47#define CONFIG_RCU_HAVE_FENCE 1
48
e51500ed 49#define cmm_mb() __asm__ __volatile__ ("mfence":::"memory")
4e029f65
PB
50
51/*
52 * Define cmm_rmb/cmm_wmb to "strict" barriers that may be needed when
53 * using SSE or working with I/O areas. cmm_smp_rmb/cmm_smp_wmb are
54 * only compiler barriers, which is enough for general use.
55 */
e51500ed
MD
56#define cmm_rmb() __asm__ __volatile__ ("lfence":::"memory")
57#define cmm_wmb() __asm__ __volatile__ ("sfence"::: "memory")
4e029f65
PB
58#define cmm_smp_rmb() cmm_barrier()
59#define cmm_smp_wmb() cmm_barrier()
0b1e236d 60
6d0ce021 61#else
0b1e236d 62
6d0ce021 63/*
4e029f65
PB
64 * We leave smp_rmb/smp_wmb as full barriers for processors that do not have
65 * fence instructions.
66 *
67 * An empty cmm_smp_rmb() may not be enough on old PentiumPro multiprocessor
68 * systems, due to an erratum. The Linux kernel says that "Even distro
69 * kernels should think twice before enabling this", but for now let's
70 * be conservative and leave the full barrier on 32-bit processors. Also,
71 * IDT WinChip supports weak store ordering, and the kernel may enable it
72 * under our feet; cmm_smp_wmb() ceases to be a nop for these processors.
6d0ce021 73 */
b33e85a8 74#if (CAA_BITS_PER_LONG == 32)
e51500ed 75#define cmm_mb() __asm__ __volatile__ ("lock; addl $0,0(%%esp)":::"memory")
b33e85a8
MD
76#define cmm_rmb() __asm__ __volatile__ ("lock; addl $0,0(%%esp)":::"memory")
77#define cmm_wmb() __asm__ __volatile__ ("lock; addl $0,0(%%esp)":::"memory")
78#else
79#define cmm_mb() __asm__ __volatile__ ("lock; addl $0,0(%%rsp)":::"memory")
80#define cmm_rmb() __asm__ __volatile__ ("lock; addl $0,0(%%rsp)":::"memory")
81#define cmm_wmb() __asm__ __volatile__ ("lock; addl $0,0(%%rsp)":::"memory")
82#endif
6d0ce021
PM
83#endif
84
2c81778b 85#define caa_cpu_relax() __asm__ __volatile__ ("rep; nop" : : : "memory")
6d0ce021 86
f8c43f45
MD
87#define HAS_CAA_GET_CYCLES
88
af02d47e
MD
89#define rdtscll(val) \
90 do { \
91 unsigned int __a, __d; \
e51500ed 92 __asm__ __volatile__ ("rdtsc" : "=a" (__a), "=d" (__d)); \
af02d47e
MD
93 (val) = ((unsigned long long)__a) \
94 | (((unsigned long long)__d) << 32); \
95 } while(0)
6d0ce021 96
3fa18286 97typedef uint64_t caa_cycles_t;
6d0ce021 98
3fa18286 99static inline caa_cycles_t caa_get_cycles(void)
6d0ce021 100{
3fa18286 101 caa_cycles_t ret = 0;
6d0ce021
PM
102
103 rdtscll(ret);
104 return ret;
105}
121a5d44 106
999991c6 107/*
84f4ccb4
MD
108 * On Linux, define the membarrier system call number if not yet available in
109 * the system headers.
999991c6 110 */
84f4ccb4 111#if (defined(__linux__) && !defined(__NR_membarrier))
999991c6 112#if (CAA_BITS_PER_LONG == 32)
999991c6 113#define __NR_membarrier 375
999991c6 114#else
999991c6
MD
115#define __NR_membarrier 324
116#endif
117#endif
118
67ecffc0 119#ifdef __cplusplus
36bc70a8
MD
120}
121#endif
122
1b9119f8 123#include <urcu/arch/generic.h>
e4d1eb09 124
ec4e58a3 125#endif /* _URCU_ARCH_X86_H */
This page took 0.047794 seconds and 4 git commands to generate.