// SPDX-License-Identifier: GPL-2.0+
(*
 * Copyright (C) 2015 Jade Alglave <[email protected]>,
 * Copyright (C) 2016 Luc Maranget <[email protected]> for Inria
 * Copyright (C) 2017 Alan Stern <[email protected]>,
 *                    Andrea Parri <[email protected]>
 *
 * An earlier version of this file appeared in the companion webpage for
 * "Frightening small children and disconcerting grown-ups: Concurrency
 * in the Linux kernel" by Alglave, Maranget, McKenney, Parri, and Stern,
 * which appeared in ASPLOS 2018.
 *)

"Linux-kernel memory consistency model"

(*
 * File "lock.cat" handles locks and is experimental.
 * It can be replaced by include "cos.cat" for tests that do not use locks.
 *)

include "lock.cat"

(*******************)
(* Basic relations *)
(*******************)

(* Release Acquire *)
let acq-po = [Acquire] ; po ; [M]
let po-rel = [M] ; po ; [Release]
(*
 * po into a UL event, then po or rf to an LKR event, then po onward.
 * NOTE(review): UL and LKR are not defined in this file; presumably they
 * come from lock.cat -- confirm.
 *)
let po-unlock-lock-po = po ; [UL] ; (po|rf) ; [LKR] ; po

(* Fences *)
let R4rmb = R \ Noreturn	(* Reads for which rmb works *)
let rmb = [R4rmb] ; fencerel(Rmb) ; [R4rmb]
let wmb = [W] ; fencerel(Wmb) ; [W]
let mb = ([M] ; fencerel(Mb) ; [M]) |
	(*
	 * full-barrier RMWs (successful cmpxchg(), xchg(), etc.) act as
	 * though they were enclosed by smp_mb().
	 * The effect of these virtual smp_mb() is formalized by adding
	 * Mb tags to the read and write of the operation, and providing
	 * the same ordering as though there were additional po edges
	 * between the Mb tag and the read resp. write.
	 *)
	([M] ; po ; [Mb & R]) |
	([Mb & W] ; po ; [M]) |
	([M] ; fencerel(Before-atomic) ; [RMW] ; po? ; [M]) |
	([M] ; po? ; [RMW] ; fencerel(After-atomic) ; [M]) |
	([M] ; po? ; [LKW] ; fencerel(After-spinlock) ; [M]) |
(*
 * Note: The po-unlock-lock-po relation only passes the lock to the direct
 * successor, perhaps giving the impression that the ordering of the
 * smp_mb__after_unlock_lock() fence only affects a single lock handover.
 * However, in a longer sequence of lock handovers, the implicit
 * A-cumulative release fences of lock-release ensure that any stores that
 * propagate to one of the involved CPUs before it hands over the lock to
 * the next CPU will also propagate to the final CPU handing over the lock
 * to the CPU that executes the fence.  Therefore, all those stores are
 * also affected by the fence.
 *)
	([M] ; po-unlock-lock-po ;
		[After-unlock-lock] ; po ; [M]) |
	([M] ; po? ; [Srcu-unlock] ; fencerel(After-srcu-read-unlock) ; [M])
(* Grace period: po into a Sync-rcu or Sync-srcu event, optionally followed by po *)
let gp = po ; [Sync-rcu | Sync-srcu] ; po?
let strong-fence = mb | gp

let nonrw-fence = strong-fence | po-rel | acq-po
let fence = nonrw-fence | wmb | rmb
(*
 * barrier: fencerel() over every fence/tag set listed below, plus po into
 * a Release event and po out of an Acquire event.
 *)
let barrier = fencerel(Barrier | Rmb | Wmb | Mb | Sync-rcu | Sync-srcu |
		Before-atomic | After-atomic | Acquire | Release |
		Rcu-lock | Rcu-unlock | Srcu-lock | Srcu-unlock) |
	(po ; [Release]) | ([Acquire] ; po)

(**********************************)
(* Fundamental coherence ordering *)
(**********************************)

(* Sequential Consistency Per Variable *)
let com = rf | co | fr
acyclic po-loc | com as coherence

(* Atomic Read-Modify-Write *)
empty rmw & (fre ; coe) as atomic

(**********************************)
(* Instruction execution ordering *)
(**********************************)

(* Preserved Program Order *)
let dep = addr | data
(* Any address, data, or control dependency that ends at a write *)
let rwdep = (dep | ctrl) ; [W]
let overwrite = co | fr
let to-w = rwdep | (overwrite & int) | (addr ; [Plain] ; wmb)
let to-r = (addr ; [R]) | (dep ; [Marked] ; rfi)
let ppo = to-r | to-w | (fence & int) | (po-unlock-lock-po & int)

(* Propagation: Ordering from release operations and strong fences. *)
(* A-cumul(r): r, optionally preceded by an rfe step into a Marked event *)
let A-cumul(r) = (rfe ; [Marked])? ; r
(* Zero or more rf-then-rmw steps *)
let rmw-sequence = (rf ; rmw)*
let cumul-fence = [Marked] ; (A-cumul(strong-fence | po-rel) | wmb |
	po-unlock-lock-po) ; [Marked] ; rmw-sequence
let prop = [Marked] ; (overwrite & ext)? ; cumul-fence* ;
	[Marked] ; rfe? ; [Marked]

(*
 * Happens Before: Ordering from the passage of time.
 * No fences needed here for prop because relation confined to one process.
 *)
let hb = [Marked] ; (ppo | rfe | ((prop \ id) & int)) ; [Marked]
acyclic hb as happens-before

(****************************************)
(* Write and fence propagation ordering *)
(****************************************)

(* Propagation: Each non-rf link needs a strong fence. *)
let pb = prop ; strong-fence ; hb* ; [Marked]
acyclic pb as propagation

(*******)
(* RCU *)
(*******)

(*
 * Effects of read-side critical sections proceed from the rcu_read_unlock()
 * or srcu_read_unlock() backwards on the one hand, and from the
 * rcu_read_lock() or srcu_read_lock() forwards on the other hand.
 *
 * In the definition of rcu-fence below, the po term at the left-hand side
 * of each disjunct and the po? term at the right-hand end have been factored
 * out.  They have been moved into the definitions of rcu-link and rb.
 * This was necessary in order to apply the "& loc" tests correctly.
 *)
let rcu-gp = [Sync-rcu]		(* Compare with gp *)
let srcu-gp = [Sync-srcu]
(* Inverses of rcu-rscs and srcu-rscs, which are not defined in this file *)
let rcu-rscsi = rcu-rscs^-1
let srcu-rscsi = srcu-rscs^-1

(*
 * The synchronize_rcu() strong fence is special in that it can order not
 * one but two non-rf relations, but only in conjunction with an RCU
 * read-side critical section.
 *)
let rcu-link = po? ; hb* ; pb* ; prop ; po

(*
 * Any sequence containing at least as many grace periods as RCU read-side
 * critical sections (joined by rcu-link) induces order like a generalized
 * inter-CPU strong fence.
 * Likewise for SRCU grace periods and read-side critical sections, provided
 * the synchronize_srcu() and srcu_read_[un]lock() calls refer to the same
 * struct srcu_struct location.
 *)
let rec rcu-order = rcu-gp | srcu-gp |
	(rcu-gp ; rcu-link ; rcu-rscsi) |
	((srcu-gp ; rcu-link ; srcu-rscsi) & loc) |
	(rcu-rscsi ; rcu-link ; rcu-gp) |
	((srcu-rscsi ; rcu-link ; srcu-gp) & loc) |
	(rcu-gp ; rcu-link ; rcu-order ; rcu-link ; rcu-rscsi) |
	((srcu-gp ; rcu-link ; rcu-order ; rcu-link ; srcu-rscsi) & loc) |
	(rcu-rscsi ; rcu-link ; rcu-order ; rcu-link ; rcu-gp) |
	((srcu-rscsi ; rcu-link ; rcu-order ; rcu-link ; srcu-gp) & loc) |
	(rcu-order ; rcu-link ; rcu-order)
let rcu-fence = po ; rcu-order ; po?
(* Re-bind fence and strong-fence so that later definitions also include rcu-fence *)
let fence = fence | rcu-fence
let strong-fence = strong-fence | rcu-fence

(* rb orders instructions just as pb does *)
let rb = prop ; rcu-fence ; hb* ; pb* ; [Marked]

irreflexive rb as rcu

(*
 * The happens-before, propagation, and rcu constraints are all
 * expressions of temporal ordering.  They could be replaced by
 * a single constraint on an "executes-before" relation, xb:
 *
 * let xb = hb | pb | rb
 * acyclic xb as executes-before
 *)

(*********************************)
(* Plain accesses and data races *)
(*********************************)

(* Warn about plain writes and marked accesses in the same region *)
let mixed-accesses = ([Plain & W] ; (po-loc \ barrier) ; [Marked]) |
	([Marked] ; (po-loc \ barrier) ; [Plain & W])
flag ~empty mixed-accesses as mixed-accesses

(* Executes-before and visibility *)
let xbstar = (hb | pb | rb)*
let vis = cumul-fence* ; rfe? ; [Marked] ;
	((strong-fence ; [Marked] ; xbstar) | (xbstar & int))

(* Boundaries for lifetimes of plain accesses *)
let w-pre-bounded = [Marked] ; (addr | fence)?
let r-pre-bounded = [Marked] ; (addr | nonrw-fence |
	([R4rmb] ; fencerel(Rmb) ; [~Noreturn]))?
let w-post-bounded = fence? ; [Marked] ; rmw-sequence
let r-post-bounded = (nonrw-fence | ([~Noreturn] ; fencerel(Rmb) ; [R4rmb]))? ;
	[Marked]

(* Visibility and executes-before for plain accesses *)
let ww-vis = fence | (strong-fence ; xbstar ; w-pre-bounded) |
	(w-post-bounded ; vis ; w-pre-bounded)
let wr-vis = fence | (strong-fence ; xbstar ; r-pre-bounded) |
	(w-post-bounded ; vis ; r-pre-bounded)
let rw-xbstar = fence | (r-post-bounded ; xbstar ; w-pre-bounded)

(* Potential races *)
let pre-race = ext & ((Plain * M) | ((M \ IW) * Plain))

(* Coherence requirements for plain accesses *)
let wr-incoh = pre-race & rf & rw-xbstar^-1
let rw-incoh = pre-race & fr & wr-vis^-1
let ww-incoh = pre-race & co & ww-vis^-1
empty (wr-incoh | rw-incoh | ww-incoh) as plain-coherence

(* Actual races *)
let ww-nonrace = ww-vis & ((Marked * W) | rw-xbstar) & ((W * Marked) | wr-vis)
let ww-race = (pre-race & co) \ ww-nonrace
let wr-race = (pre-race & (co? ; rf)) \ wr-vis \ rw-xbstar^-1
let rw-race = (pre-race & fr) \ rw-xbstar

flag ~empty (ww-race | wr-race | rw-race) as data-race