| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1 | #ifndef __LINUX_SEQLOCK_H | 
|  | 2 | #define __LINUX_SEQLOCK_H | 
/*
 * Reader/writer consistent mechanism without starving writers. This type of
 * lock is for data where the reader wants a consistent set of information
 * and is willing to retry if the information changes.  Readers never
 * block but they may have to retry if a writer is in
 * progress. Writers do not wait for readers.
 *
 * This is not as cache friendly as brlock. Also, this will not work
 * for data that contains pointers, because any writer could
 * invalidate a pointer that a reader was following.
 *
 * Expected reader usage:
 *	do {
 *		seq = read_seqbegin(&foo);
 *		...
 *	} while (read_seqretry(&foo, seq));
 *
 *
 * On non-SMP the spin locks disappear but the writer still needs
 * to increment the sequence variables because an interrupt routine could
 * change the state of the data.
 *
 * Based on x86_64 vsyscall gettimeofday
 * by Keith Owens and Andrea Arcangeli
 */
|  | 28 |  | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 29 | #include <linux/spinlock.h> | 
|  | 30 | #include <linux/preempt.h> | 
| David Howells | 56a2105 | 2011-06-11 12:29:58 +0100 | [diff] [blame] | 31 | #include <asm/processor.h> | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 32 |  | 
|  | 33 | typedef struct { | 
|  | 34 | unsigned sequence; | 
|  | 35 | spinlock_t lock; | 
|  | 36 | } seqlock_t; | 
|  | 37 |  | 
/*
 * Static initializer for an unlocked seqlock_t: sequence count of zero and
 * an unlocked spinlock.
 *
 * These macros triggered gcc-3.x compile-time problems.  We think these are
 * OK now.  Be cautious.
 */
#define __SEQLOCK_UNLOCKED(lockname)				\
	{							\
		.sequence = 0,					\
		.lock = __SPIN_LOCK_UNLOCKED(lockname),		\
	}
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 44 |  | 
/*
 * Run-time initializer for a seqlock_t: initializes the spinlock and resets
 * the sequence count to zero.  Note that @x is evaluated twice.
 */
#define seqlock_init(x)					\
	do {						\
		spin_lock_init(&(x)->lock);		\
		(x)->sequence = 0;			\
	} while (0)
| Ingo Molnar | e4d9191 | 2006-07-03 00:24:34 -0700 | [diff] [blame] | 50 |  | 
/* Define a seqlock_t variable named @x, statically initialized as unlocked. */
#define DEFINE_SEQLOCK(x)	seqlock_t x = __SEQLOCK_UNLOCKED(x)
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 53 |  | 
|  | 54 | /* Lock out other writers and update the count. | 
|  | 55 | * Acts like a normal spin_lock/unlock. | 
|  | 56 | * Don't need preempt_disable() because that is in the spin_lock already. | 
|  | 57 | */ | 
|  | 58 | static inline void write_seqlock(seqlock_t *sl) | 
|  | 59 | { | 
|  | 60 | spin_lock(&sl->lock); | 
|  | 61 | ++sl->sequence; | 
| Daniel Walker | 20f0939 | 2007-04-26 09:46:05 -0700 | [diff] [blame] | 62 | smp_wmb(); | 
|  | 63 | } | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 64 |  | 
| Daniel Walker | 20f0939 | 2007-04-26 09:46:05 -0700 | [diff] [blame] | 65 | static inline void write_sequnlock(seqlock_t *sl) | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 66 | { | 
|  | 67 | smp_wmb(); | 
|  | 68 | sl->sequence++; | 
|  | 69 | spin_unlock(&sl->lock); | 
|  | 70 | } | 
|  | 71 |  | 
|  | 72 | static inline int write_tryseqlock(seqlock_t *sl) | 
|  | 73 | { | 
|  | 74 | int ret = spin_trylock(&sl->lock); | 
|  | 75 |  | 
|  | 76 | if (ret) { | 
|  | 77 | ++sl->sequence; | 
| Daniel Walker | 20f0939 | 2007-04-26 09:46:05 -0700 | [diff] [blame] | 78 | smp_wmb(); | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 79 | } | 
|  | 80 | return ret; | 
|  | 81 | } | 
|  | 82 |  | 
|  | 83 | /* Start of read calculation -- fetch last complete writer token */ | 
| mao, bibo | cde227a | 2006-04-11 12:54:54 +0200 | [diff] [blame] | 84 | static __always_inline unsigned read_seqbegin(const seqlock_t *sl) | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 85 | { | 
| Ingo Molnar | 88a411c | 2008-04-03 09:06:13 +0200 | [diff] [blame] | 86 | unsigned ret; | 
|  | 87 |  | 
|  | 88 | repeat: | 
| Milton Miller | 5db1256 | 2011-05-12 04:13:54 -0500 | [diff] [blame] | 89 | ret = ACCESS_ONCE(sl->sequence); | 
| Ingo Molnar | 88a411c | 2008-04-03 09:06:13 +0200 | [diff] [blame] | 90 | if (unlikely(ret & 1)) { | 
|  | 91 | cpu_relax(); | 
|  | 92 | goto repeat; | 
|  | 93 | } | 
| Milton Miller | 5db1256 | 2011-05-12 04:13:54 -0500 | [diff] [blame] | 94 | smp_rmb(); | 
| Ingo Molnar | 88a411c | 2008-04-03 09:06:13 +0200 | [diff] [blame] | 95 |  | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 96 | return ret; | 
|  | 97 | } | 
|  | 98 |  | 
| Ingo Molnar | 88a411c | 2008-04-03 09:06:13 +0200 | [diff] [blame] | 99 | /* | 
|  | 100 | * Test if reader processed invalid data. | 
|  | 101 | * | 
|  | 102 | * If sequence value changed then writer changed data while in section. | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 103 | */ | 
| Ingo Molnar | 88a411c | 2008-04-03 09:06:13 +0200 | [diff] [blame] | 104 | static __always_inline int read_seqretry(const seqlock_t *sl, unsigned start) | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 105 | { | 
|  | 106 | smp_rmb(); | 
| Ingo Molnar | 88a411c | 2008-04-03 09:06:13 +0200 | [diff] [blame] | 107 |  | 
| Nick Piggin | 3c22cd5 | 2011-01-07 17:49:51 +1100 | [diff] [blame] | 108 | return unlikely(sl->sequence != start); | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 109 | } | 
|  | 110 |  | 
|  | 111 |  | 
/*
 * Version using sequence counter only.
 * This can be used when code has its own mutex protecting the
 * updating starting before the write_seqcount_begin() and ending
 * after the write_seqcount_end().
 */
|  | 118 |  | 
/* Bare sequence counter, with no lock of its own. */
typedef struct seqcount {
	unsigned int sequence;	/* bumped by the write_seqcount_*() helpers */
} seqcount_t;
|  | 122 |  | 
/* Static initializer for a seqcount_t with a sequence count of zero. */
#define SEQCNT_ZERO { 0 }

/* Run-time initializer: reset the seqcount_t pointed to by @x to zero. */
#define seqcount_init(x)				\
	do {						\
		*(x) = (seqcount_t) SEQCNT_ZERO;	\
	} while (0)
|  | 125 |  | 
| Nick Piggin | 3c22cd5 | 2011-01-07 17:49:51 +1100 | [diff] [blame] | 126 | /** | 
|  | 127 | * __read_seqcount_begin - begin a seq-read critical section (without barrier) | 
|  | 128 | * @s: pointer to seqcount_t | 
|  | 129 | * Returns: count to be passed to read_seqcount_retry | 
|  | 130 | * | 
|  | 131 | * __read_seqcount_begin is like read_seqcount_begin, but has no smp_rmb() | 
|  | 132 | * barrier. Callers should ensure that smp_rmb() or equivalent ordering is | 
|  | 133 | * provided before actually loading any of the variables that are to be | 
|  | 134 | * protected in this critical section. | 
|  | 135 | * | 
|  | 136 | * Use carefully, only in critical code, and comment how the barrier is | 
|  | 137 | * provided. | 
|  | 138 | */ | 
|  | 139 | static inline unsigned __read_seqcount_begin(const seqcount_t *s) | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 140 | { | 
| Ingo Molnar | 88a411c | 2008-04-03 09:06:13 +0200 | [diff] [blame] | 141 | unsigned ret; | 
|  | 142 |  | 
|  | 143 | repeat: | 
| Linus Torvalds | 2f62427 | 2012-05-04 14:46:02 -0700 | [diff] [blame] | 144 | ret = ACCESS_ONCE(s->sequence); | 
| Ingo Molnar | 88a411c | 2008-04-03 09:06:13 +0200 | [diff] [blame] | 145 | if (unlikely(ret & 1)) { | 
|  | 146 | cpu_relax(); | 
|  | 147 | goto repeat; | 
|  | 148 | } | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 149 | return ret; | 
|  | 150 | } | 
|  | 151 |  | 
| Nick Piggin | 3c22cd5 | 2011-01-07 17:49:51 +1100 | [diff] [blame] | 152 | /** | 
|  | 153 | * read_seqcount_begin - begin a seq-read critical section | 
|  | 154 | * @s: pointer to seqcount_t | 
|  | 155 | * Returns: count to be passed to read_seqcount_retry | 
|  | 156 | * | 
|  | 157 | * read_seqcount_begin opens a read critical section of the given seqcount. | 
|  | 158 | * Validity of the critical section is tested by checking read_seqcount_retry | 
|  | 159 | * function. | 
|  | 160 | */ | 
|  | 161 | static inline unsigned read_seqcount_begin(const seqcount_t *s) | 
|  | 162 | { | 
|  | 163 | unsigned ret = __read_seqcount_begin(s); | 
|  | 164 | smp_rmb(); | 
|  | 165 | return ret; | 
|  | 166 | } | 
|  | 167 |  | 
|  | 168 | /** | 
| Linus Torvalds | 4f988f1 | 2012-05-04 15:13:54 -0700 | [diff] [blame] | 169 | * raw_seqcount_begin - begin a seq-read critical section | 
|  | 170 | * @s: pointer to seqcount_t | 
|  | 171 | * Returns: count to be passed to read_seqcount_retry | 
|  | 172 | * | 
|  | 173 | * raw_seqcount_begin opens a read critical section of the given seqcount. | 
|  | 174 | * Validity of the critical section is tested by checking read_seqcount_retry | 
|  | 175 | * function. | 
|  | 176 | * | 
|  | 177 | * Unlike read_seqcount_begin(), this function will not wait for the count | 
|  | 178 | * to stabilize. If a writer is active when we begin, we will fail the | 
|  | 179 | * read_seqcount_retry() instead of stabilizing at the beginning of the | 
|  | 180 | * critical section. | 
|  | 181 | */ | 
|  | 182 | static inline unsigned raw_seqcount_begin(const seqcount_t *s) | 
|  | 183 | { | 
|  | 184 | unsigned ret = ACCESS_ONCE(s->sequence); | 
|  | 185 | smp_rmb(); | 
|  | 186 | return ret & ~1; | 
|  | 187 | } | 
|  | 188 |  | 
|  | 189 | /** | 
| Nick Piggin | 3c22cd5 | 2011-01-07 17:49:51 +1100 | [diff] [blame] | 190 | * __read_seqcount_retry - end a seq-read critical section (without barrier) | 
|  | 191 | * @s: pointer to seqcount_t | 
|  | 192 | * @start: count, from read_seqcount_begin | 
|  | 193 | * Returns: 1 if retry is required, else 0 | 
|  | 194 | * | 
|  | 195 | * __read_seqcount_retry is like read_seqcount_retry, but has no smp_rmb() | 
|  | 196 | * barrier. Callers should ensure that smp_rmb() or equivalent ordering is | 
|  | 197 | * provided before actually loading any of the variables that are to be | 
|  | 198 | * protected in this critical section. | 
|  | 199 | * | 
|  | 200 | * Use carefully, only in critical code, and comment how the barrier is | 
|  | 201 | * provided. | 
|  | 202 | */ | 
|  | 203 | static inline int __read_seqcount_retry(const seqcount_t *s, unsigned start) | 
|  | 204 | { | 
|  | 205 | return unlikely(s->sequence != start); | 
|  | 206 | } | 
|  | 207 |  | 
|  | 208 | /** | 
|  | 209 | * read_seqcount_retry - end a seq-read critical section | 
|  | 210 | * @s: pointer to seqcount_t | 
|  | 211 | * @start: count, from read_seqcount_begin | 
|  | 212 | * Returns: 1 if retry is required, else 0 | 
|  | 213 | * | 
|  | 214 | * read_seqcount_retry closes a read critical section of the given seqcount. | 
|  | 215 | * If the critical section was invalid, it must be ignored (and typically | 
|  | 216 | * retried). | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 217 | */ | 
| Ingo Molnar | 88a411c | 2008-04-03 09:06:13 +0200 | [diff] [blame] | 218 | static inline int read_seqcount_retry(const seqcount_t *s, unsigned start) | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 219 | { | 
|  | 220 | smp_rmb(); | 
| Ingo Molnar | 88a411c | 2008-04-03 09:06:13 +0200 | [diff] [blame] | 221 |  | 
| Nick Piggin | 3c22cd5 | 2011-01-07 17:49:51 +1100 | [diff] [blame] | 222 | return __read_seqcount_retry(s, start); | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 223 | } | 
|  | 224 |  | 
|  | 225 |  | 
|  | 226 | /* | 
|  | 227 | * Sequence counter only version assumes that callers are using their | 
|  | 228 | * own mutexing. | 
|  | 229 | */ | 
|  | 230 | static inline void write_seqcount_begin(seqcount_t *s) | 
|  | 231 | { | 
|  | 232 | s->sequence++; | 
|  | 233 | smp_wmb(); | 
|  | 234 | } | 
|  | 235 |  | 
|  | 236 | static inline void write_seqcount_end(seqcount_t *s) | 
|  | 237 | { | 
|  | 238 | smp_wmb(); | 
|  | 239 | s->sequence++; | 
|  | 240 | } | 
|  | 241 |  | 
| Nick Piggin | 3c22cd5 | 2011-01-07 17:49:51 +1100 | [diff] [blame] | 242 | /** | 
|  | 243 | * write_seqcount_barrier - invalidate in-progress read-side seq operations | 
|  | 244 | * @s: pointer to seqcount_t | 
|  | 245 | * | 
|  | 246 | * After write_seqcount_barrier, no read-side seq operations will complete | 
|  | 247 | * successfully and see data older than this. | 
|  | 248 | */ | 
|  | 249 | static inline void write_seqcount_barrier(seqcount_t *s) | 
|  | 250 | { | 
|  | 251 | smp_wmb(); | 
|  | 252 | s->sequence+=2; | 
|  | 253 | } | 
|  | 254 |  | 
/*
 * Possible sw/hw IRQ protected versions of the interfaces.
 *
 * Each writer-entry variant first disables the named context (local
 * interrupts with or without saving state, or bottom halves) and then
 * calls write_seqlock().
 */
#define write_seqlock_irqsave(lock, flags)				\
	do {								\
		local_irq_save(flags);					\
		write_seqlock(lock);					\
	} while (0)
#define write_seqlock_irq(lock)						\
	do {								\
		local_irq_disable();					\
		write_seqlock(lock);					\
	} while (0)
#define write_seqlock_bh(lock)						\
	do {								\
		local_bh_disable();					\
		write_seqlock(lock);					\
	} while (0)
|  | 264 |  | 
/*
 * Writer-exit variants: call write_sequnlock() first, then re-enable the
 * context (local interrupts or bottom halves).
 */
#define write_sequnlock_irqrestore(lock, flags)				\
	do {								\
		write_sequnlock(lock);					\
		local_irq_restore(flags);				\
	} while (0)
#define write_sequnlock_irq(lock)					\
	do {								\
		write_sequnlock(lock);					\
		local_irq_enable();					\
	} while (0)
#define write_sequnlock_bh(lock)					\
	do {								\
		write_sequnlock(lock);					\
		local_bh_enable();					\
	} while (0)
|  | 271 |  | 
/*
 * Reader entry with local interrupts disabled: saves the interrupt state in
 * @flags, then evaluates to the value returned by read_seqbegin(@lock).
 */
#define read_seqbegin_irqsave(lock, flags)				\
	({								\
		local_irq_save(flags);					\
		read_seqbegin(lock);					\
	})
|  | 274 |  | 
/*
 * Reader exit paired with read_seqbegin_irqsave(): calls
 * read_seqretry(@lock, @iv), restores the interrupt state from @flags, and
 * evaluates to the read_seqretry() result (non-zero means retry).
 *
 * The temporary uses a reserved-style name so that it cannot shadow a
 * caller variable (for instance one called "ret") appearing in the macro
 * arguments, which would otherwise be read uninitialized.
 */
#define read_seqretry_irqrestore(lock, iv, flags)			\
	({								\
		int __ret = read_seqretry(lock, iv);			\
		local_irq_restore(flags);				\
		__ret;							\
	})
|  | 281 |  | 
|  | 282 | #endif /* __LINUX_SEQLOCK_H */ |