linux_dsm_epyc7002/tools/memory-model/linux-kernel.def

// SPDX-License-Identifier: GPL-2.0+
//
// An earlier version of this file appears in the companion webpage for
// "Frightening small children and disconcerting grown-ups: Concurrency
// in the Linux kernel" by Alglave, Maranget, McKenney, Parri, and Stern,
// which is to appear in ASPLOS 2018.

// ONCE
// Single marked accesses: READ_ONCE expands to the __load primitive and
// WRITE_ONCE to the __store primitive, both tagged with the "once"
// annotation.  X is passed through unchanged (no dereference is added).
READ_ONCE(X) __load{once}(X)
WRITE_ONCE(X,V) { __store{once}(X,V); }

// Release Acquire and friends
// smp_store_release and smp_load_acquire add the dereference themselves
// (*X) and tag the access "release" / "acquire".
// rcu_assign_pointer is also a "release" store, but passes X through
// without adding a dereference.
// lockless_dereference and rcu_dereference are loads tagged "lderef" and
// "deref" respectively, again with X passed through unchanged.
smp_store_release(X,V) { __store{release}(*X,V); }
smp_load_acquire(X) __load{acquire}(*X)
rcu_assign_pointer(X,V) { __store{release}(X,V); }
lockless_dereference(X) __load{lderef}(X)
rcu_dereference(X) __load{deref}(X)

// Fences
// Each argument-less barrier expands to the __fence primitive carrying a
// tag that identifies the barrier kind: mb, rmb, wmb, rb_dep,
// before_atomic, after_atomic and after_spinlock.
// NOTE(review): the meaning of each tag is presumably given by the
// accompanying .bell/.cat model files, not by this file -- confirm there.
smp_mb() { __fence{mb} ; }
smp_rmb() { __fence{rmb} ; }
smp_wmb() { __fence{wmb} ; }
smp_read_barrier_depends() { __fence{rb_dep}; }
smp_mb__before_atomic() { __fence{before_atomic} ; }
smp_mb__after_atomic() { __fence{after_atomic} ; }
smp_mb__after_spinlock() { __fence{after_spinlock} ; }

// Exchange
// xchg* expands to __xchg and cmpxchg* to __cmpxchg, with arguments passed
// through in the same order.  The annotation follows the name suffix:
//   (no suffix) -> mb, _relaxed -> once, _release -> release,
//   _acquire -> acquire.
xchg(X,V)  __xchg{mb}(X,V)
xchg_relaxed(X,V) __xchg{once}(X,V)
xchg_release(X,V) __xchg{release}(X,V)
xchg_acquire(X,V) __xchg{acquire}(X,V)
cmpxchg(X,V,W) __cmpxchg{mb}(X,V,W)
cmpxchg_relaxed(X,V,W) __cmpxchg{once}(X,V,W)
cmpxchg_acquire(X,V,W) __cmpxchg{acquire}(X,V,W)
cmpxchg_release(X,V,W) __cmpxchg{release}(X,V,W)

// Spinlocks
// spin_lock and spin_unlock expand to the brace-wrapped __lock / __unlock
// forms; spin_trylock expands to a bare __trylock(X) with no braces.
// NOTE(review): the bare form is presumably the one that yields a value
// usable in an expression -- confirm against the herd7 documentation.
spin_lock(X) { __lock(X) ; }
spin_unlock(X) { __unlock(X) ; }
spin_trylock(X) __trylock(X)

// RCU
// All RCU primitives are expressed as tagged fences: rcu-lock and
// rcu-unlock for the read-side markers, sync-rcu for the grace-period
// wait.  synchronize_rcu_expedited uses the same sync-rcu tag as
// synchronize_rcu, so the two expand identically.
rcu_read_lock() { __fence{rcu-lock}; }
rcu_read_unlock() { __fence{rcu-unlock};}
synchronize_rcu() { __fence{sync-rcu}; }
synchronize_rcu_expedited() { __fence{sync-rcu}; }

// Atomic
// Plain atomic reads and writes are defined in terms of the macros above
// rather than the primitives directly.  atomic_read/atomic_set add the
// dereference (*X) before handing off to READ_ONCE/WRITE_ONCE, which do
// not add one; the _acquire/_release variants pass X through because
// smp_load_acquire/smp_store_release already dereference it.
atomic_read(X) READ_ONCE(*X)
atomic_set(X,V) { WRITE_ONCE(*X,V) ; }
atomic_read_acquire(X) smp_load_acquire(X)
atomic_set_release(X,V) { smp_store_release(X,V); }

// Brace-wrapped arithmetic updates.  The (V,X) argument order is
// rearranged to __atomic_op(X,<operator>,V); inc/dec hard-code the
// operand 1.  No ordering annotation is attached to __atomic_op.
atomic_add(V,X) { __atomic_op(X,+,V) ; }
atomic_sub(V,X) { __atomic_op(X,-,V) ; }
atomic_inc(X)   { __atomic_op(X,+,1) ; }
atomic_dec(X)   { __atomic_op(X,-,1) ; }

// Addition with a result.  *_return variants expand to __atomic_op_return
// and fetch_* variants to __atomic_fetch_op, both as (X,+,V).  Annotation
// by suffix: (none) -> mb, _relaxed -> once, _acquire -> acquire,
// _release -> release.
// NOTE(review): presumably __atomic_op_return yields the updated value and
// __atomic_fetch_op the prior value, as the names suggest -- confirm
// against the herd7 documentation.
atomic_add_return(V,X) __atomic_op_return{mb}(X,+,V)
atomic_add_return_relaxed(V,X) __atomic_op_return{once}(X,+,V)
atomic_add_return_acquire(V,X) __atomic_op_return{acquire}(X,+,V)
atomic_add_return_release(V,X) __atomic_op_return{release}(X,+,V)
atomic_fetch_add(V,X) __atomic_fetch_op{mb}(X,+,V)
atomic_fetch_add_relaxed(V,X) __atomic_fetch_op{once}(X,+,V)
atomic_fetch_add_acquire(V,X) __atomic_fetch_op{acquire}(X,+,V)
atomic_fetch_add_release(V,X) __atomic_fetch_op{release}(X,+,V)

// Increment with a result: the same expansions as the add_return /
// fetch_add family, with the operand fixed to 1, i.e. (X,+,1).
atomic_inc_return(X) __atomic_op_return{mb}(X,+,1)
atomic_inc_return_relaxed(X) __atomic_op_return{once}(X,+,1)
atomic_inc_return_acquire(X) __atomic_op_return{acquire}(X,+,1)
atomic_inc_return_release(X) __atomic_op_return{release}(X,+,1)
atomic_fetch_inc(X) __atomic_fetch_op{mb}(X,+,1)
atomic_fetch_inc_relaxed(X) __atomic_fetch_op{once}(X,+,1)
atomic_fetch_inc_acquire(X) __atomic_fetch_op{acquire}(X,+,1)
atomic_fetch_inc_release(X) __atomic_fetch_op{release}(X,+,1)

// Subtraction with a result: (V,X) is rearranged to (X,-,V), with the
// same suffix-to-annotation mapping as the addition family
// (none -> mb, _relaxed -> once, _acquire -> acquire, _release -> release).
atomic_sub_return(V,X) __atomic_op_return{mb}(X,-,V)
atomic_sub_return_relaxed(V,X) __atomic_op_return{once}(X,-,V)
atomic_sub_return_acquire(V,X) __atomic_op_return{acquire}(X,-,V)
atomic_sub_return_release(V,X) __atomic_op_return{release}(X,-,V)
atomic_fetch_sub(V,X) __atomic_fetch_op{mb}(X,-,V)
atomic_fetch_sub_relaxed(V,X) __atomic_fetch_op{once}(X,-,V)
atomic_fetch_sub_acquire(V,X) __atomic_fetch_op{acquire}(X,-,V)
atomic_fetch_sub_release(V,X) __atomic_fetch_op{release}(X,-,V)

// Decrement with a result: the same expansions as the sub_return /
// fetch_sub family, with the operand fixed to 1, i.e. (X,-,1).
atomic_dec_return(X) __atomic_op_return{mb}(X,-,1)
atomic_dec_return_relaxed(X) __atomic_op_return{once}(X,-,1)
atomic_dec_return_acquire(X) __atomic_op_return{acquire}(X,-,1)
atomic_dec_return_release(X) __atomic_op_return{release}(X,-,1)
atomic_fetch_dec(X) __atomic_fetch_op{mb}(X,-,1)
atomic_fetch_dec_relaxed(X) __atomic_fetch_op{once}(X,-,1)
atomic_fetch_dec_acquire(X) __atomic_fetch_op{acquire}(X,-,1)
atomic_fetch_dec_release(X) __atomic_fetch_op{release}(X,-,1)

// atomic_xchg* / atomic_cmpxchg* expand to exactly the same __xchg and
// __cmpxchg forms (same argument order, same annotations) as the
// xchg* / cmpxchg* definitions in the Exchange section.
atomic_xchg(X,V) __xchg{mb}(X,V)
atomic_xchg_relaxed(X,V) __xchg{once}(X,V)
atomic_xchg_release(X,V) __xchg{release}(X,V)
atomic_xchg_acquire(X,V) __xchg{acquire}(X,V)
atomic_cmpxchg(X,V,W) __cmpxchg{mb}(X,V,W)
atomic_cmpxchg_relaxed(X,V,W) __cmpxchg{once}(X,V,W)
atomic_cmpxchg_acquire(X,V,W) __cmpxchg{acquire}(X,V,W)
atomic_cmpxchg_release(X,V,W) __cmpxchg{release}(X,V,W)

// Test-the-result helpers: each performs an mb-annotated
// __atomic_op_return and compares its result against zero
// ("== 0" for the *_and_test forms, "< 0" for atomic_add_negative).
atomic_sub_and_test(V,X) __atomic_op_return{mb}(X,-,V) == 0
atomic_dec_and_test(X)  __atomic_op_return{mb}(X,-,1) == 0
atomic_inc_and_test(X)  __atomic_op_return{mb}(X,+,1) == 0
atomic_add_negative(V,X) __atomic_op_return{mb}(X,+,V) < 0
Automate memory-barriers.txt; provide Linux-kernel memory model There is some reason to believe that Documentation/memory-barriers.txt could use some help, and a major purpose of this patch is to provide that help in the form of a design-time tool that can produce all valid executions of a small fragment of concurrent Linux-kernel code, which is called a "litmus test". This tool's functionality is roughly similar to a full state-space search. Please note that this is a design-time tool, not useful for regression testing. However, we hope that the underlying Linux-kernel memory model will be incorporated into other tools capable of analyzing large bodies of code for regression-testing purposes. The main tool is herd7, together with the linux-kernel.bell, linux-kernel.cat, linux-kernel.cfg, linux-kernel.def, and lock.cat files added by this patch. The herd7 executable takes the other files as input, and all of these files collectively define the Linux-kernel memory model. A brief description of each of these other files is provided in the README file. Although this tool does have its limitations, which are documented in the README file, it does improve on the version reported on in the LWN series (https://lwn.net/Articles/718628/ and https://lwn.net/Articles/720550/) by supporting locking and arithmetic, including a much wider variety of read-modify-write atomic operations. Please note that herd7 is not part of this submission, but is freely available from http://diy.inria.fr/sources/index.html (and via "git" at https://github.com/herd/herdtools7). A second tool is klitmus7, which converts litmus tests to loadable kernel modules for direct testing. As with herd7, the klitmus7 code is freely available from http://diy.inria.fr/sources/index.html (and via "git" at https://github.com/herd/herdtools7). 
Of course, litmus tests are not always the best way to fully understand a memory model, so this patch also includes Documentation/explanation.txt, which describes the memory model in detail. In addition, Documentation/recipes.txt provides example known-good and known-bad use cases for those who prefer working by example. This patch also includes a few sample litmus tests, and a great many more litmus tests are available at https://github.com/paulmckrcu/litmus. This patch was the result of a most excellent collaboration founded by Jade Alglave and also including Alan Stern, Andrea Parri, and Luc Maranget. For more details on the history of this collaboration, please refer to the Linux-kernel memory model presentations at 2016 LinuxCon EU, 2016 Kernel Summit, 2016 Linux Plumbers Conference, 2017 linux.conf.au, or 2017 Linux Plumbers Conference microconference. However, one aspect of the history does bear repeating due to weak copyright tracking earlier in this project, which extends back to early 2015. This weakness came to light in late 2017 after an LKMM presentation by Paul in which an audience member noted the similarity of some LKMM code to code in early published papers. This prompted a copyright review. From Alan Stern: To say that the model was mine is not entirely accurate. Pieces of it (especially the Scpv and Atomic axioms) were taken directly from Jade's models. And of course the Happens-before and Propagation relations and axioms were heavily based on Jade and Luc's work, even though they weren't identical to the earlier versions. Only the RCU portion was completely original. . . . One can make a much better case that I wrote the bulk of lock.cat. However, it was inspired by Luc's earlier version (and still shares some elements in common), and of course it benefited from feedback and testing from all members of our group. The model prior to Alan's was Luc Maranget's. From Luc: I totally agree on Alan Stern's account of the linux kernel model genesis. 
I thank him for his acknowledgments of my participation to previous model drafts. I'd like to complete Alan Stern's statement: any bell cat code I have written has its roots in discussions with Jade Alglave and Paul McKenney. Moreover I have borrowed cat and bell code written by Jade Alglave freely. This copyright review therefore resulted in late adds to the copyright statements of several files. Discussion of v1 has raised several issues, which we do not believe should block acceptance given that this level of change will be ongoing, just as it has been with memory-barriers.txt: o Under what conditions should ordering provided by pure locking be seen by CPUs not holding the relevant lock(s)? In particular, should the message-passing pattern be forbidden? o Should examples involving C11 release sequences be forbidden? Note that this C11 is still a moving target for this issue: http://www.open-std.org/jtc1/sc22/wg21/docs/papers/2017/p0735r0.html o Some details of the handling of internal dependencies for atomic read-modify-write atomic operations are still subject to debate. o Changes recently accepted into mainline greatly reduce the need to handle DEC Alpha as a special case. These changes add an smp_read_barrier_depends() to READ_ONCE(), thus causing Alpha to respect ordering of dependent reads. If these changes stick, the memory model can be simplified accordingly. o Will changes be required to accommodate RISC-V? Differences from v1: (http://lkml.kernel.org/r/20171113184031.GA26302@linux.vnet.ibm.com) o Add SPDX notations to .bell and .cat files, replacing textual license statements. o Add reference to upcoming ASPLOS paper to .bell and .cat files. o Updated identifier names in .bell and .cat files to match those used in the ASPLOS paper. o Updates to READMEs and other documentation based on review feedback. o Added a memory-ordering cheatsheet. o Update sigs to new Co-Developed-by and add acks and reviewed-bys. 
o Simplify rules detecting nested RCU read-side critical sections. o Update copyright statements as noted above. Co-Developed-by: Alan Stern <stern@rowland.harvard.edu> Co-Developed-by: Andrea Parri <parri.andrea@gmail.com> Co-Developed-by: Jade Alglave <j.alglave@ucl.ac.uk> Co-Developed-by: Luc Maranget <luc.maranget@inria.fr> Co-Developed-by: "Paul E. McKenney" <paulmck@linux.vnet.ibm.com> Signed-off-by: Alan Stern <stern@rowland.harvard.edu> Signed-off-by: Andrea Parri <parri.andrea@gmail.com> Signed-off-by: Jade Alglave <j.alglave@ucl.ac.uk> Signed-off-by: Luc Maranget <luc.maranget@inria.fr> Signed-off-by: "Paul E. McKenney" <paulmck@linux.vnet.ibm.com> Reviewed-by: Boqun Feng <boqun.feng@gmail.com> Acked-by: Will Deacon <will.deacon@arm.com> Acked-by: Peter Zijlstra <peterz@infradead.org> Acked-by: Nicholas Piggin <npiggin@gmail.com> Acked-by: David Howells <dhowells@redhat.com> Acked-by: "Reshetova, Elena" <elena.reshetova@intel.com> Acked-by: Michal Hocko <mhocko@suse.com> Acked-by: Akira Yokosawa <akiyks@gmail.com> Cc: <linux-arch@vger.kernel.org> 2018-01-19 10:58:55 +07:00			`// SPDX-License-Identifier: GPL-2.0+`
			`//`
			`// An earlier version of this file appears in the companion webpage for`
			`// "Frightening small children and disconcerting grown-ups: Concurrency`
			`// in the Linux kernel" by Alglave, Maranget, McKenney, Parri, and Stern,`
			`// which is to appear in ASPLOS 2018.`

			`// ONCE`
			`READ_ONCE(X) __load{once}(X)`
			`WRITE_ONCE(X,V) { __store{once}(X,V); }`

			`// Release Acquire and friends`
			`smp_store_release(X,V) { __store{release}(*X,V); }`
			`smp_load_acquire(X) __load{acquire}(*X)`
			`rcu_assign_pointer(X,V) { __store{release}(X,V); }`
			`lockless_dereference(X) __load{lderef}(X)`
			`rcu_dereference(X) __load{deref}(X)`

			`// Fences`
			`smp_mb() { __fence{mb} ; }`
			`smp_rmb() { __fence{rmb} ; }`
			`smp_wmb() { __fence{wmb} ; }`
			`smp_read_barrier_depends() { __fence{rb_dep}; }`
			`smp_mb__before_atomic() { __fence{before_atomic} ; }`
			`smp_mb__after_atomic() { __fence{after_atomic} ; }`
			`smp_mb__after_spinlock() { __fence{after_spinlock} ; }`

			`// Exchange`
			`xchg(X,V) __xchg{mb}(X,V)`
			`xchg_relaxed(X,V) __xchg{once}(X,V)`
			`xchg_release(X,V) __xchg{release}(X,V)`
			`xchg_acquire(X,V) __xchg{acquire}(X,V)`
			`cmpxchg(X,V,W) __cmpxchg{mb}(X,V,W)`
			`cmpxchg_relaxed(X,V,W) __cmpxchg{once}(X,V,W)`
			`cmpxchg_acquire(X,V,W) __cmpxchg{acquire}(X,V,W)`
			`cmpxchg_release(X,V,W) __cmpxchg{release}(X,V,W)`

			`// Spinlocks`
			`spin_lock(X) { __lock(X) ; }`
			`spin_unlock(X) { __unlock(X) ; }`
			`spin_trylock(X) __trylock(X)`

			`// RCU`
			`rcu_read_lock() { __fence{rcu-lock}; }`
			`rcu_read_unlock() { __fence{rcu-unlock};}`
			`synchronize_rcu() { __fence{sync-rcu}; }`
			`synchronize_rcu_expedited() { __fence{sync-rcu}; }`

			`// Atomic`
			`atomic_read(X) READ_ONCE(*X)`
			`atomic_set(X,V) { WRITE_ONCE(*X,V) ; }`
			`atomic_read_acquire(X) smp_load_acquire(X)`
			`atomic_set_release(X,V) { smp_store_release(X,V); }`

			`atomic_add(V,X) { __atomic_op(X,+,V) ; }`
			`atomic_sub(V,X) { __atomic_op(X,-,V) ; }`
			`atomic_inc(X) { __atomic_op(X,+,1) ; }`
			`atomic_dec(X) { __atomic_op(X,-,1) ; }`

			`atomic_add_return(V,X) __atomic_op_return{mb}(X,+,V)`
			`atomic_add_return_relaxed(V,X) __atomic_op_return{once}(X,+,V)`
			`atomic_add_return_acquire(V,X) __atomic_op_return{acquire}(X,+,V)`
			`atomic_add_return_release(V,X) __atomic_op_return{release}(X,+,V)`
			`atomic_fetch_add(V,X) __atomic_fetch_op{mb}(X,+,V)`
			`atomic_fetch_add_relaxed(V,X) __atomic_fetch_op{once}(X,+,V)`
			`atomic_fetch_add_acquire(V,X) __atomic_fetch_op{acquire}(X,+,V)`
			`atomic_fetch_add_release(V,X) __atomic_fetch_op{release}(X,+,V)`

			`atomic_inc_return(X) __atomic_op_return{mb}(X,+,1)`
			`atomic_inc_return_relaxed(X) __atomic_op_return{once}(X,+,1)`
			`atomic_inc_return_acquire(X) __atomic_op_return{acquire}(X,+,1)`
			`atomic_inc_return_release(X) __atomic_op_return{release}(X,+,1)`
			`atomic_fetch_inc(X) __atomic_fetch_op{mb}(X,+,1)`
			`atomic_fetch_inc_relaxed(X) __atomic_fetch_op{once}(X,+,1)`
			`atomic_fetch_inc_acquire(X) __atomic_fetch_op{acquire}(X,+,1)`
			`atomic_fetch_inc_release(X) __atomic_fetch_op{release}(X,+,1)`

			`atomic_sub_return(V,X) __atomic_op_return{mb}(X,-,V)`
			`atomic_sub_return_relaxed(V,X) __atomic_op_return{once}(X,-,V)`
			`atomic_sub_return_acquire(V,X) __atomic_op_return{acquire}(X,-,V)`
			`atomic_sub_return_release(V,X) __atomic_op_return{release}(X,-,V)`
			`atomic_fetch_sub(V,X) __atomic_fetch_op{mb}(X,-,V)`
			`atomic_fetch_sub_relaxed(V,X) __atomic_fetch_op{once}(X,-,V)`
			`atomic_fetch_sub_acquire(V,X) __atomic_fetch_op{acquire}(X,-,V)`
			`atomic_fetch_sub_release(V,X) __atomic_fetch_op{release}(X,-,V)`

			`atomic_dec_return(X) __atomic_op_return{mb}(X,-,1)`
			`atomic_dec_return_relaxed(X) __atomic_op_return{once}(X,-,1)`
			`atomic_dec_return_acquire(X) __atomic_op_return{acquire}(X,-,1)`
			`atomic_dec_return_release(X) __atomic_op_return{release}(X,-,1)`
			`atomic_fetch_dec(X) __atomic_fetch_op{mb}(X,-,1)`
			`atomic_fetch_dec_relaxed(X) __atomic_fetch_op{once}(X,-,1)`
			`atomic_fetch_dec_acquire(X) __atomic_fetch_op{acquire}(X,-,1)`
			`atomic_fetch_dec_release(X) __atomic_fetch_op{release}(X,-,1)`

			`atomic_xchg(X,V) __xchg{mb}(X,V)`
			`atomic_xchg_relaxed(X,V) __xchg{once}(X,V)`
			`atomic_xchg_release(X,V) __xchg{release}(X,V)`
			`atomic_xchg_acquire(X,V) __xchg{acquire}(X,V)`
			`atomic_cmpxchg(X,V,W) __cmpxchg{mb}(X,V,W)`
			`atomic_cmpxchg_relaxed(X,V,W) __cmpxchg{once}(X,V,W)`
			`atomic_cmpxchg_acquire(X,V,W) __cmpxchg{acquire}(X,V,W)`
			`atomic_cmpxchg_release(X,V,W) __cmpxchg{release}(X,V,W)`

			`atomic_sub_and_test(V,X) __atomic_op_return{mb}(X,-,V) == 0`
			`atomic_dec_and_test(X) __atomic_op_return{mb}(X,-,1) == 0`
			`atomic_inc_and_test(X) __atomic_op_return{mb}(X,+,1) == 0`
			`atomic_add_negative(V,X) __atomic_op_return{mb}(X,+,V) < 0`