// SPDX-License-Identifier: GPL-2.0+
(*
 * Copyright (C) 2015 Jade Alglave <[email protected]>,
 * Copyright (C) 2016 Luc Maranget <[email protected]> for Inria
 * Copyright (C) 2017 Alan Stern <[email protected]>,
 *                    Andrea Parri <[email protected]>
 *
 * An earlier version of this file appeared in the companion webpage for
 * "Frightening small children and disconcerting grown-ups: Concurrency
 * in the Linux kernel" by Alglave, Maranget, McKenney, Parri, and Stern,
 * which appeared in ASPLOS 2018.
 *)

"Linux-kernel memory consistency model"

(*
 * File "lock.cat" handles locks and is experimental.
 * It can be replaced by include "cos.cat" for tests that do not use locks.
 *
 * NOTE(review): several names used further down (for example UL, LKR, LKW,
 * rcu-rscs and srcu-rscs) are not defined in this file; presumably they
 * come from this include or from the herd7 built-ins.  Confirm before
 * swapping the include.
 *)

include "lock.cat"

(*******************)
(* Basic relations *)
(*******************)

(* Release Acquire *)
(*
 * acq-po: program-order edges from an Acquire event to a po-later
 * memory access (M).
 * po-rel: program-order edges from a memory access (M) to a po-later
 * Release event.
 * po-unlock-lock-po: po into a UL event, then a single po or rf step from
 * that UL event to an LKR event, then po onward.  UL and LKR are not
 * defined in this file; presumably they are the unlock and lock-read
 * events provided by "lock.cat" -- TODO confirm.
 *)
let acq-po = [Acquire] ; po ; [M]
let po-rel = [M] ; po ; [Release]
let po-unlock-lock-po = po ; [UL] ; (po|rf) ; [LKR] ; po

(* Fences *)
(*
 * R4rmb is the set of reads with the Noreturn reads removed.
 * rmb relates two R4rmb reads that have an Rmb fence between them in
 * program order; wmb relates two writes that have a Wmb fence between
 * them.  Because both ends of rmb are restricted to R4rmb, Noreturn
 * reads are never ordered by rmb.
 *)
let R4rmb = R \ Noreturn	(* Reads for which rmb works *)
let rmb = [R4rmb] ; fencerel(Rmb) ; [R4rmb]
let wmb = [W] ; fencerel(Wmb) ; [W]
(*
 * mb is the union of the orderings listed below, each relating two
 * memory accesses (M):
 *  - accesses separated by an Mb fence;
 *  - an access po-before an Mb-tagged read, or po-after an Mb-tagged write;
 *  - accesses separated by a Before-atomic fence that sits before an RMW
 *    event, or by an After-atomic fence that sits after an RMW event;
 *  - accesses separated by an After-spinlock fence that follows an LKW event;
 *  - a po-unlock-lock-po step into an After-unlock-lock event, then po;
 *  - accesses separated by an After-srcu-read-unlock fence that follows an
 *    Srcu-unlock event.
 *)
let mb = ([M] ; fencerel(Mb) ; [M]) |
	(*
	 * full-barrier RMWs (successful cmpxchg(), xchg(), etc.) act as
	 * though they were enclosed by smp_mb().
	 * The effect of these virtual smp_mb() is formalized by adding
	 * Mb tags to the read and write of the operation, and providing
	 * the same ordering as though there were additional po edges
	 * between the Mb tag and the read resp. write.
	 *)
	([M] ; po ; [Mb & R]) |
	([Mb & W] ; po ; [M]) |
	([M] ; fencerel(Before-atomic) ; [RMW] ; po? ; [M]) |
	([M] ; po? ; [RMW] ; fencerel(After-atomic) ; [M]) |
	([M] ; po? ; [LKW] ; fencerel(After-spinlock) ; [M]) |
(*
 * Note: The po-unlock-lock-po relation only passes the lock to the direct
 * successor, perhaps giving the impression that the ordering of the
 * smp_mb__after_unlock_lock() fence only affects a single lock handover.
 * However, in a longer sequence of lock handovers, the implicit
 * A-cumulative release fences of lock-release ensure that any stores that
 * propagate to one of the involved CPUs before it hands over the lock to
 * the next CPU will also propagate to the final CPU handing over the lock
 * to the CPU that executes the fence.  Therefore, all those stores are
 * also affected by the fence.
 *)
	([M] ; po-unlock-lock-po ;
		[After-unlock-lock] ; po ; [M]) |
	([M] ; po? ; [Srcu-unlock] ; fencerel(After-srcu-read-unlock) ; [M])
(*
 * gp: po into a Sync-rcu or Sync-srcu event, optionally followed by po.
 * strong-fence: the union of mb and gp.  This binding is the one seen by
 * the definitions that follow, up to the point further down in this file
 * where strong-fence is rebound to also include rcu-fence.
 *)
let gp = po ; [Sync-rcu | Sync-srcu] ; po?
let strong-fence = mb | gp

(*
 * nonrw-fence: strong-fence together with po-rel and acq-po.
 * fence: nonrw-fence together with wmb and rmb.
 * barrier: pairs of events that have one of the listed fence,
 * acquire/release or RCU/SRCU lock/unlock events between them in program
 * order, plus po into a Release event and po out of an Acquire event.
 * In this file barrier is only used by the mixed-accesses check.
 *)
let nonrw-fence = strong-fence | po-rel | acq-po
let fence = nonrw-fence | wmb | rmb
let barrier = fencerel(Barrier | Rmb | Wmb | Mb | Sync-rcu | Sync-srcu |
		Before-atomic | After-atomic | Acquire | Release |
		Rcu-lock | Rcu-unlock | Srcu-lock | Srcu-unlock) |
	(po ; [Release]) | ([Acquire] ; po)

(**********************************)
(* Fundamental coherence ordering *)
(**********************************)

(* Sequential Consistency Per Variable *)
(*
 * com is the union of the communication relations rf, co and fr.
 * The coherence check requires that the union of po-loc and com
 * contains no cycle.
 *)
let com = rf | co | fr
acyclic po-loc | com as coherence

(* Atomic Read-Modify-Write *)
(*
 * The atomic check requires that no rmw pair is also connected by an
 * external fr edge followed by an external co edge, i.e. by fre ; coe.
 *)
empty rmw & (fre ; coe) as atomic

(**********************************)
(* Instruction execution ordering *)
(**********************************)

(* Preserved Program Order *)
(*
 * dep: an address or data dependency.
 * rwdep: an address, data or control dependency that ends at a write.
 * overwrite: co or fr.
 * to-w: rwdep, or overwrite restricted to a single thread (& int), or an
 * address dependency to a Plain event followed by wmb.
 * to-r: an address dependency ending at a read, or a dependency to a
 * Marked event followed by an internal reads-from edge (rfi).
 * ppo: the union of to-r, to-w, and the single-thread parts of fence and
 * of po-unlock-lock-po.
 *)
let dep = addr | data
let rwdep = (dep | ctrl) ; [W]
let overwrite = co | fr
let to-w = rwdep | (overwrite & int) | (addr ; [Plain] ; wmb)
let to-r = (addr ; [R]) | (dep ; [Marked] ; rfi)
let ppo = to-r | to-w | (fence & int) | (po-unlock-lock-po & int)

(* Propagation: Ordering from release operations and strong fences. *)
(*
 * A-cumul(r): the relation r, optionally preceded by an rfe edge that
 * ends at a Marked event.
 * rmw-sequence: zero or more repetitions of rf followed by rmw.
 * cumul-fence: starting at a Marked event, one of
 * A-cumul(strong-fence | po-rel), wmb or po-unlock-lock-po, reaching a
 * Marked event, followed by an rmw-sequence.
 * prop: starting at a Marked event, an optional external overwrite edge,
 * zero or more cumul-fence steps reaching a Marked event, and an optional
 * rfe edge ending at a Marked event.
 *)
let A-cumul(r) = (rfe ; [Marked])? ; r
let rmw-sequence = (rf ; rmw)*
let cumul-fence = [Marked] ; (A-cumul(strong-fence | po-rel) | wmb |
	po-unlock-lock-po) ; [Marked] ; rmw-sequence
let prop = [Marked] ; (overwrite & ext)? ; cumul-fence* ;
	[Marked] ; rfe? ; [Marked]

(*
 * Happens Before: Ordering from the passage of time.
 * No fences needed here for prop because relation confined to one process.
 *
 * hb relates Marked events connected by ppo, by rfe, or by the
 * non-identity part of prop restricted to a single thread (& int).
 * The happens-before check requires hb to contain no cycle.
 *)
let hb = [Marked] ; (ppo | rfe | ((prop \ id) & int)) ; [Marked]
acyclic hb as happens-before

(****************************************)
(* Write and fence propagation ordering *)
(****************************************)

(* Propagation: Each non-rf link needs a strong fence. *)
(*
 * pb: a prop step, then a strong-fence step, then zero or more hb steps,
 * ending at a Marked event.  The strong-fence used here is the binding
 * made earlier in this file (mb | gp); the rebinding that adds rcu-fence
 * only appears after this definition.
 * The propagation check requires pb to contain no cycle.
 *)
let pb = prop ; strong-fence ; hb* ; [Marked]
acyclic pb as propagation

(*******)
(* RCU *)
(*******)

(*
 * Effects of read-side critical sections proceed from the rcu_read_unlock()
 * or srcu_read_unlock() backwards on the one hand, and from the
 * rcu_read_lock() or srcu_read_lock() forwards on the other hand.
 *
 * In the definition of rcu-fence below, the po term at the left-hand side
 * of each disjunct and the po? term at the right-hand end have been factored
 * out.  They have been moved into the definitions of rcu-link and rb.
 * This was necessary in order to apply the "& loc" tests correctly.
 *
 * rcu-gp and srcu-gp are the identity relations on Sync-rcu and Sync-srcu
 * events respectively.  rcu-rscsi and srcu-rscsi are the inverses of
 * rcu-rscs and srcu-rscs, which are not defined in this file (presumably
 * supplied by the include or by herd7 -- TODO confirm).
 *)
let rcu-gp = [Sync-rcu]		(* Compare with gp *)
let srcu-gp = [Sync-srcu]
let rcu-rscsi = rcu-rscs^-1
let srcu-rscsi = srcu-rscs^-1

(*
 * The synchronize_rcu() strong fence is special in that it can order not
 * one but two non-rf relations, but only in conjunction with an RCU
 * read-side critical section.
 *
 * rcu-link: an optional po step, zero or more hb steps, zero or more pb
 * steps, one prop step, and finally a po step.
 *)
let rcu-link = po? ; hb* ; pb* ; prop ; po

(*
 * Any sequence containing at least as many grace periods as RCU read-side
 * critical sections (joined by rcu-link) induces order like a generalized
 * inter-CPU strong fence.
 * Likewise for SRCU grace periods and read-side critical sections, provided
 * the synchronize_srcu() and srcu_read_[un]lock() calls refer to the same
 * struct srcu_struct location.
 *
 * rcu-order is defined recursively as the union of:
 *  - a single grace period (rcu-gp or srcu-gp);
 *  - a grace period and an inverted critical section (rcu-rscsi or
 *    srcu-rscsi), in either order, joined by rcu-link;
 *  - the same pairing with an rcu-order, flanked by rcu-link on both
 *    sides, nested in between;
 *  - two rcu-order sequences joined by rcu-link.
 * Every disjunct that pairs srcu-gp with srcu-rscsi is intersected with
 * loc, so its two end events must be related by loc.
 *)
let rec rcu-order = rcu-gp | srcu-gp |
	(rcu-gp ; rcu-link ; rcu-rscsi) |
	((srcu-gp ; rcu-link ; srcu-rscsi) & loc) |
	(rcu-rscsi ; rcu-link ; rcu-gp) |
	((srcu-rscsi ; rcu-link ; srcu-gp) & loc) |
	(rcu-gp ; rcu-link ; rcu-order ; rcu-link ; rcu-rscsi) |
	((srcu-gp ; rcu-link ; rcu-order ; rcu-link ; srcu-rscsi) & loc) |
	(rcu-rscsi ; rcu-link ; rcu-order ; rcu-link ; rcu-gp) |
	((srcu-rscsi ; rcu-link ; rcu-order ; rcu-link ; srcu-gp) & loc) |
	(rcu-order ; rcu-link ; rcu-order)
(*
 * rcu-fence: po, then rcu-order, then an optional po step.
 * The next two lines rebind fence and strong-fence so that they also
 * include rcu-fence.  Only definitions written after this point use the
 * extended bindings; definitions earlier in the file were built from the
 * previous ones.
 *)
let rcu-fence = po ; rcu-order ; po?
let fence = fence | rcu-fence
let strong-fence = strong-fence | rcu-fence

(* rb orders instructions just as pb does *)
(*
 * rb: a prop step, then rcu-fence, then zero or more hb steps, then zero
 * or more pb steps, ending at a Marked event.
 * The rcu check requires rb to be irreflexive.
 *)
let rb = prop ; rcu-fence ; hb* ; pb* ; [Marked]

irreflexive rb as rcu

(*
 * The happens-before, propagation, and rcu constraints are all
 * expressions of temporal ordering.  They could be replaced by
 * a single constraint on an "executes-before" relation, xb:
 *
 * let xb = hb | pb | rb
 * acyclic xb as executes-before
 *)

(*********************************)
(* Plain accesses and data races *)
(*********************************)

(* Warn about plain writes and marked accesses in the same region *)
(*
 * mixed-accesses relates a Plain write and a Marked access, in either
 * program order, that are connected by po-loc but not by barrier.
 * The flag statement raises the mixed-accesses flag whenever this
 * relation is non-empty.
 *)
let mixed-accesses = ([Plain & W] ; (po-loc \ barrier) ; [Marked]) |
	([Marked] ; (po-loc \ barrier) ; [Plain & W])
flag ~empty mixed-accesses as mixed-accesses

(* Executes-before and visibility *)
(*
 * xbstar: the reflexive-transitive closure of hb | pb | rb.
 * vis: zero or more cumul-fence steps, an optional rfe edge ending at a
 * Marked event, and then either a strong-fence step to a Marked event
 * followed by xbstar, or the single-thread part of xbstar (& int).
 * The strong-fence used here is the rebound one that includes rcu-fence.
 *)
let xbstar = (hb | pb | rb)*
let vis = cumul-fence* ; rfe? ; [Marked] ;
	((strong-fence ; [Marked] ; xbstar) | (xbstar & int))

(* Boundaries for lifetimes of plain accesses *)
(*
 * Each relation below links an access to a Marked event on one side.
 * w-pre-bounded: from a Marked event, optionally followed by addr or fence.
 * r-pre-bounded: from a Marked event, optionally followed by addr,
 * nonrw-fence, or an Rmb fence step that starts at an R4rmb read and ends
 * at any event outside Noreturn.
 * w-post-bounded: an optional fence step into a Marked event, followed by
 * an rmw-sequence.
 * r-post-bounded: an optional nonrw-fence step, or an Rmb fence step from
 * an event outside Noreturn to an R4rmb read, ending at a Marked event.
 *)
let w-pre-bounded = [Marked] ; (addr | fence)?
let r-pre-bounded = [Marked] ; (addr | nonrw-fence |
	([R4rmb] ; fencerel(Rmb) ; [~Noreturn]))?
let w-post-bounded = fence? ; [Marked] ; rmw-sequence
let r-post-bounded = (nonrw-fence | ([~Noreturn] ; fencerel(Rmb) ; [R4rmb]))? ;
	[Marked]

(* Visibility and executes-before for plain accesses *)
(*
 * ww-vis and wr-vis share one shape: a fence step, or a strong-fence
 * followed by xbstar and a pre-bound, or a w-post-bounded step followed
 * by vis and a pre-bound.  They differ only in the pre-bound used:
 * w-pre-bounded for ww-vis and r-pre-bounded for wr-vis.
 * rw-xbstar: a fence step, or r-post-bounded followed by xbstar and
 * w-pre-bounded.
 *)
let ww-vis = fence | (strong-fence ; xbstar ; w-pre-bounded) |
	(w-post-bounded ; vis ; w-pre-bounded)
let wr-vis = fence | (strong-fence ; xbstar ; r-pre-bounded) |
	(w-post-bounded ; vis ; r-pre-bounded)
let rw-xbstar = fence | (r-post-bounded ; xbstar ; w-pre-bounded)

(* Potential races *)
(*
 * pre-race: pairs of events related by ext in which at least one event
 * is Plain.  The first event is either Plain (paired with any memory
 * access), or a memory access outside IW paired with a Plain event.
 *)
let pre-race = ext & ((Plain * M) | ((M \ IW) * Plain))

(* Coherence requirements for plain accesses *)
(*
 * Each relation selects pre-race pairs joined by a communication edge
 * whose reverse direction is already ordered:
 * wr-incoh: an rf edge whose inverse is in rw-xbstar.
 * rw-incoh: an fr edge whose inverse is in wr-vis.
 * ww-incoh: a co edge whose inverse is in ww-vis.
 * The plain-coherence check requires all three to be empty.
 *)
let wr-incoh = pre-race & rf & rw-xbstar^-1
let rw-incoh = pre-race & fr & wr-vis^-1
let ww-incoh = pre-race & co & ww-vis^-1
empty (wr-incoh | rw-incoh | ww-incoh) as plain-coherence

(* Actual races *)
(*
 * ww-nonrace: pairs in ww-vis that additionally are either Marked-to-W
 * pairs or in rw-xbstar, and either W-to-Marked pairs or in wr-vis.
 * ww-race: pre-race co edges that are not in ww-nonrace.
 * wr-race: pre-race pairs joined by an optional co step followed by rf,
 * excluding those in wr-vis and those whose inverse is in rw-xbstar.
 * rw-race: pre-race fr edges that are not in rw-xbstar.
 * The flag statement raises the data-race flag whenever any of the three
 * race relations is non-empty.
 *)
let ww-nonrace = ww-vis & ((Marked * W) | rw-xbstar) & ((W * Marked) | wr-vis)
let ww-race = (pre-race & co) \ ww-nonrace
let wr-race = (pre-race & (co? ; rf)) \ wr-vis \ rw-xbstar^-1
let rw-race = (pre-race & fr) \ rw-xbstar

flag ~empty (ww-race | wr-race | rw-race) as data-race