Ralf Baechle | 0004a9d | 2006-10-31 03:45:07 +0000 | [diff] [blame] | 1 | /* |
| 2 | * This file is subject to the terms and conditions of the GNU General Public |
| 3 | * License. See the file "COPYING" in the main directory of this archive |
| 4 | * for more details. |
| 5 | * |
| 6 | * Copyright (C) 2006 by Ralf Baechle (ralf@linux-mips.org) |
| 7 | */ |
| 8 | #ifndef __ASM_BARRIER_H |
| 9 | #define __ASM_BARRIER_H |
| 10 | |
David Howells | b81947c | 2012-03-28 18:30:02 +0100 | [diff] [blame] | 11 | #include <asm/addrspace.h> |
| 12 | |
Ralf Baechle | 0004a9d | 2006-10-31 03:45:07 +0000 | [diff] [blame] | 13 | /* |
| 14 | * read_barrier_depends - Flush all pending reads that subsequent reads |
| 15 | * depend on. |
| 16 | * |
| 17 | * No data-dependent reads from memory-like regions are ever reordered |
| 18 | * over this barrier. All reads preceding this primitive are guaranteed |
| 19 | * to access memory (but not necessarily other CPUs' caches) before any |
| 20 | * reads following this primitive that depend on the data returned by |
Maciej W. Rozycki | edf7b93 | 2013-11-01 23:47:05 +0000 | [diff] [blame] | 21 | * any of the preceding reads. This primitive is much lighter weight than |
Ralf Baechle | 0004a9d | 2006-10-31 03:45:07 +0000 | [diff] [blame] | 22 | * rmb() on most CPUs, and is never heavier weight than |
| 23 | * rmb(). |
| 24 | * |
| 25 | * These ordering constraints are respected by both the local CPU |
| 26 | * and the compiler. |
| 27 | * |
| 28 | * Ordering is not guaranteed by anything other than these primitives, |
| 29 | * not even by data dependencies. See the documentation for |
| 30 | * memory_barrier() for examples and URLs to more information. |
| 31 | * |
| 32 | * For example, the following code would force ordering (the initial |
| 33 | * value of "a" is zero, "b" is one, and "p" is "&a"): |
| 34 | * |
| 35 | * <programlisting> |
| 36 | * CPU 0 CPU 1 |
| 37 | * |
| 38 | * b = 2; |
| 39 | * memory_barrier(); |
| 40 | * p = &b; q = p; |
| 41 | * read_barrier_depends(); |
| 42 | * d = *q; |
| 43 | * </programlisting> |
| 44 | * |
| 45 | * because the read of "*q" depends on the read of "p" and these |
Maciej W. Rozycki | edf7b93 | 2013-11-01 23:47:05 +0000 | [diff] [blame] | 46 | * two reads are separated by a read_barrier_depends(). However, |
Ralf Baechle | 0004a9d | 2006-10-31 03:45:07 +0000 | [diff] [blame] | 47 | * the following code, with the same initial values for "a" and "b": |
| 48 | * |
| 49 | * <programlisting> |
| 50 | * CPU 0 CPU 1 |
| 51 | * |
| 52 | * a = 2; |
| 53 | * memory_barrier(); |
| 54 | * b = 3; y = b; |
| 55 | * read_barrier_depends(); |
| 56 | * x = a; |
| 57 | * </programlisting> |
| 58 | * |
| 59 | * does not enforce ordering, since there is no data dependency between |
Maciej W. Rozycki | edf7b93 | 2013-11-01 23:47:05 +0000 | [diff] [blame] | 60 | * the read of "a" and the read of "b". Therefore, on some CPUs, such |
Ralf Baechle | 0004a9d | 2006-10-31 03:45:07 +0000 | [diff] [blame] | 61 | * as Alpha, "y" could be set to 3 and "x" to 0. Use rmb() |
| 62 | * in cases like this where there are no data dependencies. |
| 63 | */ |
| 64 | |
/*
 * In this header both data-dependency barriers expand to an empty
 * statement: no instruction is emitted and no "memory" clobber is given.
 */
#define read_barrier_depends()		do { } while (0)
#define smp_read_barrier_depends()	do { } while (0)
| 67 | |
/*
 * __sync() - issue a "sync" instruction if the CPU is configured to have one.
 *
 * Without CONFIG_CPU_HAS_SYNC the macro is an empty statement (and therefore
 * carries no "memory" clobber either).  With it, the macro is an inline-asm
 * statement with a "memory" clobber that emits a single "sync" inside a
 * .set push/.set pop pair; ".set mips2" is presumably there so that the
 * assembler accepts "sync" regardless of the ISA level the file is built for.
 */
#ifndef CONFIG_CPU_HAS_SYNC
#define __sync()	do { } while(0)
#else
#define __sync()					\
	__asm__ __volatile__(				\
		".set push\n\t"				\
		".set noreorder\n\t"			\
		".set mips2\n\t"			\
		"sync\n\t"				\
		".set pop"				\
		: /* no output */			\
		: /* no input */			\
		: "memory")
#endif /* CONFIG_CPU_HAS_SYNC */
| 82 | |
/*
 * __fast_iob() - perform one word load from address CKSEG1 with register $0
 * as the destination, followed by a nop.
 *
 * CKSEG1 is not defined here; it is expected to come from <asm/addrspace.h>.
 * The asm statement carries a "memory" clobber.
 */
#define __fast_iob()					\
	__asm__ __volatile__(				\
		".set push\n\t"				\
		".set noreorder\n\t"			\
		"lw $0,%0\n\t"				\
		"nop\n\t"				\
		".set pop"				\
		: /* no output */			\
		: "m" (*(int *)CKSEG1)			\
		: "memory")
/*
 * fast_wmb()/fast_rmb()/fast_mb()/fast_iob() - per-platform barrier building
 * blocks used by the generic wmb()/rmb()/mb()/iob() definitions.
 *
 *  - Default: all three memory barriers are __sync(); fast_iob() is
 *    __sync() followed by __fast_iob().
 *  - CONFIG_SGI_IP28 (non-Octeon only): fast_iob() is instead a
 *    load / sync / load sequence on CKSEG1ADDR(0x1fa00004).
 *  - CONFIG_CPU_CAVIUM_OCTEON: writes are ordered with two back-to-back
 *    "syncw" instructions (__syncw()), fast_rmb() is only barrier(),
 *    fast_mb() is __sync() and fast_iob() is an empty statement.
 */
#ifndef CONFIG_CPU_CAVIUM_OCTEON

# define fast_wmb()	__sync()
# define fast_rmb()	__sync()
# define fast_mb()	__sync()

# ifndef CONFIG_SGI_IP28
#  define fast_iob()					\
	do {						\
		__sync();				\
		__fast_iob();				\
	} while (0)
# else /* CONFIG_SGI_IP28 */
#  define fast_iob()					\
	__asm__ __volatile__(				\
		".set push\n\t"				\
		".set noreorder\n\t"			\
		"lw $0,%0\n\t"				\
		"sync\n\t"				\
		"lw $0,%0\n\t"				\
		".set pop"				\
		: /* no output */			\
		: "m" (*(int *)CKSEG1ADDR(0x1fa00004))	\
		: "memory")
# endif /* CONFIG_SGI_IP28 */

#else /* CONFIG_CPU_CAVIUM_OCTEON */

# define OCTEON_SYNCW_STR	".set push\n.set arch=octeon\nsyncw\nsyncw\n.set pop\n"
# define __syncw()	__asm__ __volatile__(OCTEON_SYNCW_STR : : : "memory")

# define fast_wmb()	__syncw()
# define fast_rmb()	barrier()
# define fast_mb()	__sync()
# define fast_iob()	do { } while (0)

#endif /* CONFIG_CPU_CAVIUM_OCTEON */
Ralf Baechle | 0004a9d | 2006-10-31 03:45:07 +0000 | [diff] [blame] | 125 | |
/*
 * Mandatory barriers.
 *
 * mb() and iob() go through wbflush() (from <asm/wbflush.h>) when
 * CONFIG_CPU_HAS_WB is set, and through fast_mb()/fast_iob() otherwise.
 * wmb() and rmb() are the fast_ variants in either configuration.
 */
#ifdef CONFIG_CPU_HAS_WB

#include <asm/wbflush.h>

#define mb()		wbflush()
#define iob()		wbflush()

#else /* !CONFIG_CPU_HAS_WB */

#define mb()		fast_mb()
#define iob()		fast_iob()

#endif /* !CONFIG_CPU_HAS_WB */

#define wmb()		fast_wmb()
#define rmb()		fast_rmb()
| 143 | |
/*
 * SMP barriers.
 *
 * Unless both CONFIG_WEAK_ORDERING and CONFIG_SMP are set, all three are
 * plain barrier().  Otherwise Octeon uses __sync() / barrier() / __syncw()
 * for smp_mb() / smp_rmb() / smp_wmb(), and every other CPU issues a bare
 * "sync" with a "memory" clobber for each of them.
 */
#if !defined(CONFIG_WEAK_ORDERING) || !defined(CONFIG_SMP)
# define smp_mb()	barrier()
# define smp_rmb()	barrier()
# define smp_wmb()	barrier()
#elif defined(CONFIG_CPU_CAVIUM_OCTEON)
# define smp_mb()	__sync()
# define smp_rmb()	barrier()
# define smp_wmb()	__syncw()
#else
# define smp_mb()	__asm__ __volatile__("sync" : : :"memory")
# define smp_rmb()	__asm__ __volatile__("sync" : : :"memory")
# define smp_wmb()	__asm__ __volatile__("sync" : : :"memory")
#endif
David Daney | f252ffd | 2010-01-08 17:17:43 -0800 | [diff] [blame] | 159 | |
/*
 * __WEAK_LLSC_MB - assembler text for the barrier used next to LL/SC code.
 *
 * It contains a "sync" only when both CONFIG_WEAK_REORDERING_BEYOND_LLSC
 * and CONFIG_SMP are set; otherwise it is just whitespace and a newline.
 */
#if !defined(CONFIG_WEAK_REORDERING_BEYOND_LLSC) || !defined(CONFIG_SMP)
#define __WEAK_LLSC_MB	" \n"
#else
#define __WEAK_LLSC_MB	" sync \n"
#endif
Ralf Baechle | 0004a9d | 2006-10-31 03:45:07 +0000 | [diff] [blame] | 165 | |
/*
 * set_mb(var, value) - assign @value to @var, then execute smp_mb().
 */
#define set_mb(var, value)		\
do {					\
	var = value;			\
	smp_mb();			\
} while (0)
| 168 | |
/*
 * smp_llsc_mb() - run the __WEAK_LLSC_MB assembler text as an inline-asm
 * statement with a "memory" clobber.
 */
#define smp_llsc_mb()						\
	__asm__ __volatile__(__WEAK_LLSC_MB : : :"memory")
Ralf Baechle | 17099b1 | 2007-07-14 13:24:05 +0100 | [diff] [blame] | 170 | |
/*
 * smp_mb__before_llsc() / nudge_writes()
 *
 * Default: smp_mb__before_llsc() is smp_llsc_mb() and nudge_writes() is mb().
 * Octeon:  smp_mb__before_llsc() is smp_wmb() and nudge_writes() issues a
 *          single "syncw" with a "memory" clobber.
 */
#ifndef CONFIG_CPU_CAVIUM_OCTEON
#define smp_mb__before_llsc()	smp_llsc_mb()
#define nudge_writes()		mb()
#else /* CONFIG_CPU_CAVIUM_OCTEON */
#define smp_mb__before_llsc()	smp_wmb()
/* Cause previous writes to become visible on all CPUs as soon as possible */
#define nudge_writes()					\
	__asm__ __volatile__(".set push\n\t"		\
			     ".set arch=octeon\n\t"	\
			     "syncw\n\t"		\
			     ".set pop" : : : "memory")
#endif /* CONFIG_CPU_CAVIUM_OCTEON */
David Daney | f252ffd | 2010-01-08 17:17:43 -0800 | [diff] [blame] | 182 | |
/*
 * smp_store_release(p, v) - execute smp_mb(), then store @v to *@p.
 * @p: pointer to the location to write.
 * @v: value to store.
 *
 * The pointed-to type is first passed to compiletime_assert_atomic_type(),
 * and the store itself goes through ACCESS_ONCE(); both helpers are defined
 * outside this header.
 *
 * @p is parenthesized before being dereferenced so that any pointer-valued
 * expression (e.g. "cond ? &a : &b" or "base + i") is dereferenced as a
 * whole.  @p appears twice in the expansion, so avoid arguments with side
 * effects unless the helpers are known not to evaluate them.
 */
#define smp_store_release(p, v)						\
do {									\
	compiletime_assert_atomic_type(*(p));				\
	smp_mb();							\
	ACCESS_ONCE(*(p)) = (v);					\
} while (0)
| 189 | |
/*
 * smp_load_acquire(p) - load *@p, execute smp_mb(), then yield the loaded
 * value.
 * @p: pointer to the location to read.
 *
 * The load goes through ACCESS_ONCE() and the pointed-to type is passed to
 * compiletime_assert_atomic_type(); both helpers are defined outside this
 * header.  The result has the type of *@p.
 *
 * @p is parenthesized before being dereferenced so that any pointer-valued
 * expression (e.g. "cond ? &a : &b") is dereferenced as a whole.
 * __typeof__ is the spelling of typeof that GCC also accepts in strict ISO
 * modes.  @p appears several times in the expansion, so avoid arguments
 * with side effects unless the helpers are known not to evaluate them.
 */
#define smp_load_acquire(p)						\
({									\
	__typeof__(*(p)) ___p1 = ACCESS_ONCE(*(p));			\
	compiletime_assert_atomic_type(*(p));				\
	smp_mb();							\
	___p1;								\
})
| 197 | |
/*
 * Barriers placed around atomic operations: the "before" variant forwards
 * to smp_mb__before_llsc(), the "after" variant to smp_llsc_mb().
 */
#define smp_mb__before_atomic()		smp_mb__before_llsc()
#define smp_mb__after_atomic()		smp_llsc_mb()
| 200 | |
Ralf Baechle | 0004a9d | 2006-10-31 03:45:07 +0000 | [diff] [blame] | 201 | #endif /* __ASM_BARRIER_H */ |