tools/memory-model: Provide extra ordering for unlock+lock pair on the same CPU

author Boqun Feng <boqun.feng@gmail.com>

Mon, 25 Oct 2021 14:54:14 +0000 (22:54 +0800)

committer Paul E. McKenney <paulmck@kernel.org>

Wed, 1 Dec 2021 01:47:08 +0000 (17:47 -0800)
author Boqun Feng <boqun.feng@gmail.com>
Mon, 25 Oct 2021 14:54:14 +0000 (22:54 +0800)
committer Paul E. McKenney <paulmck@kernel.org>
Wed, 1 Dec 2021 01:47:08 +0000 (17:47 -0800)
diff --git a/tools/memory-model/Documentation/explanation.txt b/tools/memory-model/Documentation/explanation.txt

index 5d72f3112e5657bbbacc0849545cd17b09eede32..394ee57d58f2fbcc6ebb1b5d70b7cac242d6ae2e 100644 (file)
--- a/tools/memory-model/Documentation/explanation.txt
+++ b/tools/memory-model/Documentation/explanation.txt
@@ -1813,15 +1813,16 @@ spin_trylock() -- we can call these things lock-releases and
  lock-acquires -- have two properties beyond those of ordinary releases
  and acquires.
  
-First, when a lock-acquire reads from a lock-release, the LKMM
-requires that every instruction po-before the lock-release must
-execute before any instruction po-after the lock-acquire.  This would
-naturally hold if the release and acquire operations were on different
-CPUs, but the LKMM says it holds even when they are on the same CPU.
-For example:
+First, when a lock-acquire reads from or is po-after a lock-release,
+the LKMM requires that every instruction po-before the lock-release
+must execute before any instruction po-after the lock-acquire.  This
+would naturally hold if the release and acquire operations were on
+different CPUs and accessed the same lock variable, but the LKMM says
+it also holds when they are on the same CPU, even if they access
+different lock variables.  For example:
  
         int x, y;
-       spinlock_t s;
+       spinlock_t s, t;
  
         P0()
         {
@@ -1830,9 +1831,9 @@ For example:
                 spin_lock(&s);
                 r1 = READ_ONCE(x);
                 spin_unlock(&s);
-               spin_lock(&s);
+               spin_lock(&t);
                 r2 = READ_ONCE(y);
-               spin_unlock(&s);
+               spin_unlock(&t);
         }
  
         P1()
@@ -1842,10 +1843,10 @@ For example:
                 WRITE_ONCE(x, 1);
         }
  
-Here the second spin_lock() reads from the first spin_unlock(), and
-therefore the load of x must execute before the load of y.  Thus we
-cannot have r1 = 1 and r2 = 0 at the end (this is an instance of the
-MP pattern).
+Here the second spin_lock() is po-after the first spin_unlock(), and
+therefore the load of x must execute before the load of y, even though
+the two locking operations use different locks.  Thus we cannot have
+r1 = 1 and r2 = 0 at the end (this is an instance of the MP pattern).
  
  This requirement does not apply to ordinary release and acquire
  fences, only to lock-related operations.  For instance, suppose P0()
@@ -1872,13 +1873,13 @@ instructions in the following order:
  
  and thus it could load y before x, obtaining r2 = 0 and r1 = 1.
  
-Second, when a lock-acquire reads from a lock-release, and some other
-stores W and W' occur po-before the lock-release and po-after the
-lock-acquire respectively, the LKMM requires that W must propagate to
-each CPU before W' does.  For example, consider:
+Second, when a lock-acquire reads from or is po-after a lock-release,
+and some other stores W and W' occur po-before the lock-release and
+po-after the lock-acquire respectively, the LKMM requires that W must
+propagate to each CPU before W' does.  For example, consider:
  
         int x, y;
-       spinlock_t x;
+       spinlock_t s;
  
         P0()
         {
@@ -1908,7 +1909,12 @@ each CPU before W' does.  For example, consider:
  
  If r1 = 1 at the end then the spin_lock() in P1 must have read from
  the spin_unlock() in P0.  Hence the store to x must propagate to P2
-before the store to y does, so we cannot have r2 = 1 and r3 = 0.
+before the store to y does, so we cannot have r2 = 1 and r3 = 0.  But
+if P1 had used a lock variable different from s, the writes could have
+propagated in either order.  (On the other hand, if the code in P0 and
+P1 had all executed on a single CPU, as in the example before this
+one, then the writes would have propagated in order even if the two
+critical sections used different lock variables.)
  
  These two special requirements for lock-release and lock-acquire do
  not arise from the operational model.  Nevertheless, kernel developers
diff --git a/tools/memory-model/linux-kernel.cat b/tools/memory-model/linux-kernel.cat

index 2a9b4fe4a84ebdc56e553056991d60f68e8df48f..d70315fddef6e000e57a25e2cb0a297326abc398 100644 (file)
--- a/tools/memory-model/linux-kernel.cat
+++ b/tools/memory-model/linux-kernel.cat
@@ -27,7 +27,7 @@ include "lock.cat"
  (* Release Acquire *)
  let acq-po = [Acquire] ; po ; [M]
  let po-rel = [M] ; po ; [Release]
-let po-unlock-rf-lock-po = po ; [UL] ; rf ; [LKR] ; po
+let po-unlock-lock-po = po ; [UL] ; (po|rf) ; [LKR] ; po
  
  (* Fences *)
  let R4rmb = R \ Noreturn       (* Reads for which rmb works *)
@@ -70,12 +70,12 @@ let rwdep = (dep | ctrl) ; [W]
  let overwrite = co | fr
  let to-w = rwdep | (overwrite & int) | (addr ; [Plain] ; wmb)
  let to-r = addr | (dep ; [Marked] ; rfi)
-let ppo = to-r | to-w | fence | (po-unlock-rf-lock-po & int)
+let ppo = to-r | to-w | fence | (po-unlock-lock-po & int)
  
  (* Propagation: Ordering from release operations and strong fences. *)
  let A-cumul(r) = (rfe ; [Marked])? ; r
  let cumul-fence = [Marked] ; (A-cumul(strong-fence | po-rel) | wmb |
-       po-unlock-rf-lock-po) ; [Marked]
+       po-unlock-lock-po) ; [Marked]
  let prop = [Marked] ; (overwrite & ext)? ; cumul-fence* ;
         [Marked] ; rfe? ; [Marked]
author	Boqun Feng <boqun.feng@gmail.com>
	Mon, 25 Oct 2021 14:54:14 +0000 (22:54 +0800)
committer	Paul E. McKenney <paulmck@kernel.org>
	Wed, 1 Dec 2021 01:47:08 +0000 (17:47 -0800)
tools/memory-model/Documentation/explanation.txt		patch | blob | history
tools/memory-model/linux-kernel.cat		patch | blob | history