xen/rwlock: Add missing memory barrier in the unlock path of rwlock

author Julien Grall <jgrall@amazon.com>

Thu, 20 Feb 2020 20:54:40 +0000 (20:54 +0000)

committer Jan Beulich <jbeulich@suse.com>

Tue, 14 Apr 2020 12:37:11 +0000 (14:37 +0200)
author Julien Grall <jgrall@amazon.com>
Thu, 20 Feb 2020 20:54:40 +0000 (20:54 +0000)
committer Jan Beulich <jbeulich@suse.com>
Tue, 14 Apr 2020 12:37:11 +0000 (14:37 +0200)
diff --git a/xen/include/xen/rwlock.h b/xen/include/xen/rwlock.h

index 4d1b48c722e584ea78dc910132ed32de298750a0..427664037a4e9c05d58a8e6c50f6e05ebc2f27bf 100644 (file)
--- a/xen/include/xen/rwlock.h
+++ b/xen/include/xen/rwlock.h
@@ -60,6 +60,10 @@ static inline int _read_trylock(rwlock_t *lock)
      if ( likely(_can_read_lock(cnts)) )
      {
          cnts = (u32)atomic_add_return(_QR_BIAS, &lock->cnts);
+        /*
+         * atomic_add_return() is a full barrier so no need for an
+         * arch_lock_acquire_barrier().
+         */
          if ( likely(_can_read_lock(cnts)) )
              return 1;
          atomic_sub(_QR_BIAS, &lock->cnts);
@@ -78,11 +82,19 @@ static inline void _read_lock(rwlock_t *lock)
  
      preempt_disable();
      cnts = atomic_add_return(_QR_BIAS, &lock->cnts);
+    /*
+     * atomic_add_return() is a full barrier so no need for an
+     * arch_lock_acquire_barrier().
+     */
      if ( likely(_can_read_lock(cnts)) )
          return;
  
      /* The slowpath will decrement the reader count, if necessary. */
      queue_read_lock_slowpath(lock);
+    /*
+     * queue_read_lock_slowpath() uses a spinlock and is therefore a
+     * full barrier, so no arch_lock_acquire_barrier() is needed.
+     */
  }
  
  static inline void _read_lock_irq(rwlock_t *lock)
@@ -106,6 +118,7 @@ static inline unsigned long _read_lock_irqsave(rwlock_t *lock)
   */
  static inline void _read_unlock(rwlock_t *lock)
  {
+    arch_lock_release_barrier();
      /*
       * Atomically decrement the reader count
       */
@@ -141,12 +154,21 @@ static inline unsigned int _write_lock_val(void)
   */
  static inline void _write_lock(rwlock_t *lock)
  {
-    /* Optimize for the unfair lock case where the fair flag is 0. */
      preempt_disable();
+    /*
+     * Optimize for the unfair lock case where the fair flag is 0.
+     *
+     * atomic_cmpxchg() is a full barrier so no need for an
+     * arch_lock_acquire_barrier().
+     */
      if ( atomic_cmpxchg(&lock->cnts, 0, _write_lock_val()) == 0 )
          return;
  
      queue_write_lock_slowpath(lock);
+    /*
+     * queue_write_lock_slowpath() uses a spinlock and is therefore a
+     * full barrier, so no arch_lock_acquire_barrier() is needed.
+     */
  }
  
  static inline void _write_lock_irq(rwlock_t *lock)
@@ -183,12 +205,17 @@ static inline int _write_trylock(rwlock_t *lock)
          return 0;
      }
  
+    /*
+     * atomic_cmpxchg() is a full barrier so no need for an
+     * arch_lock_acquire_barrier().
+     */
      return 1;
  }
  
  static inline void _write_unlock(rwlock_t *lock)
  {
      ASSERT(_is_write_locked_by_me(atomic_read(&lock->cnts)));
+    arch_lock_release_barrier();
      atomic_and(~(_QW_CPUMASK | _QW_WMASK), &lock->cnts);
      preempt_enable();
  }
author	Julien Grall <jgrall@amazon.com>
	Thu, 20 Feb 2020 20:54:40 +0000 (20:54 +0000)
committer	Jan Beulich <jbeulich@suse.com>
	Tue, 14 Apr 2020 12:37:11 +0000 (14:37 +0200)