locking/pvqspinlock: Collect slowpath lock statistics
diff --git a/kernel/locking/qspinlock_paravirt.h b/kernel/locking/qspinlock_paravirt.h
index f0450ff..aaeeefb 100644
--- a/kernel/locking/qspinlock_paravirt.h
+++ b/kernel/locking/qspinlock_paravirt.h
@@ -40,6 +40,11 @@ struct pv_node {
        u8                      state;
 };
 
+/*
+ * Include queued spinlock statistics code
+ */
+#include "qspinlock_stat.h"
+
 /*
  * Lock and MCS node addresses hash table for fast lookup
  *
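
Note: qspinlock_stat.h itself is not part of this diff, but the calls added
below assume a small interface: an enum of event counters plus two inline
hooks. A minimal sketch of that interface, inferred from the call sites in
this patch rather than quoted from the header:

/* Sketch only: event counters referenced by the new qstat_*() calls. */
enum qlock_stats {
        qstat_pv_hash_hops,
        qstat_pv_kick_unlock,
        qstat_pv_spurious_wakeup,
        qstat_pv_wait_again,
        qstat_pv_wait_head,
        qstat_pv_wait_node,
        qstat_num,      /* total number of counters */
};

#ifndef CONFIG_QUEUED_LOCK_STAT
/* With statistics disabled, the hooks compile away to nothing. */
static inline void qstat_inc(enum qlock_stats stat, bool cond) { }
static inline void qstat_hop(int hopcnt) { }
#endif
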
@@ -100,10 +105,13 @@ static struct qspinlock **pv_hash(struct qspinlock *lock, struct pv_node *node)
 {
        unsigned long offset, hash = hash_ptr(lock, pv_lock_hash_bits);
        struct pv_hash_entry *he;
+       int hopcnt = 0;
 
        for_each_hash_entry(he, offset, hash) {
+               hopcnt++;
                if (!cmpxchg(&he->lock, NULL, lock)) {
                        WRITE_ONCE(he->node, node);
+                       qstat_hop(hopcnt);
                        return &he->lock;
                }
        }
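
Note: the hop count feeds a "hash hops" statistic: every hash bucket probed
in pv_hash() counts as one hop, so the accumulated total divided by the
number of hashings gives the average search depth of the lock hash table.
Assuming the per-CPU counter layout sketched above, the recording side of
the header could look roughly like this (a sketch, not the actual header):

#ifdef CONFIG_QUEUED_LOCK_STAT
static DEFINE_PER_CPU(unsigned long, qstats[qstat_num]);

static inline void qstat_hop(int hopcnt)
{
        /* Accumulate total hops; the reader side can average this per hashing. */
        this_cpu_add(qstats[qstat_pv_hash_hops], hopcnt);
}
#endif
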
@@ -164,9 +172,11 @@ static void pv_init_node(struct mcs_spinlock *node)
 static void pv_wait_node(struct mcs_spinlock *node)
 {
        struct pv_node *pn = (struct pv_node *)node;
+       int waitcnt = 0;
        int loop;
 
-       for (;;) {
+       /* waitcnt processing will be compiled out if !QUEUED_LOCK_STAT */
+       for (;; waitcnt++) {
                for (loop = SPIN_THRESHOLD; loop; loop--) {
                        if (READ_ONCE(node->locked))
                                return;
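
Note: the "for (;; waitcnt++)" form only makes sense because qstat_inc() is a
trivial inline. When CONFIG_QUEUED_LOCK_STAT is enabled it bumps a per-CPU
counter only if its condition is true; when disabled it is the empty stub
sketched earlier, waitcnt becomes a dead variable, and the compiler drops it,
which is what the comment above promises. The enabled case could plausibly
look like this (same caveat: a sketch, not the real header):

static inline void qstat_inc(enum qlock_stats stat, bool cond)
{
        /* Count the event only when the condition holds. */
        if (cond)
                this_cpu_inc(qstats[stat]);
}

With such a helper, qstat_inc(qstat_pv_wait_again, waitcnt) further down
counts only the second and later sleeps on the same MCS node, i.e. re-waits
after a previous wakeup turned out to be spurious.
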
@@ -184,12 +194,16 @@ static void pv_wait_node(struct mcs_spinlock *node)
                 */
                smp_store_mb(pn->state, vcpu_halted);
 
-               if (!READ_ONCE(node->locked))
+               if (!READ_ONCE(node->locked)) {
+                       qstat_inc(qstat_pv_wait_node, true);
+                       qstat_inc(qstat_pv_wait_again, waitcnt);
                        pv_wait(&pn->state, vcpu_halted);
+               }
 
                /*
-                * If pv_kick_node() changed us to vcpu_hashed, retain that value
-                * so that pv_wait_head() knows to not also try to hash this lock.
+                * If pv_kick_node() changed us to vcpu_hashed, retain that
+                * value so that pv_wait_head() knows to not also try to hash
+                * this lock.
                 */
                cmpxchg(&pn->state, vcpu_halted, vcpu_running);
 
@@ -200,6 +214,7 @@ static void pv_wait_node(struct mcs_spinlock *node)
                 * So it is better to spin for a while in the hope that the
                 * MCS lock will be released soon.
                 */
+               qstat_inc(qstat_pv_spurious_wakeup, !READ_ONCE(node->locked));
        }
 
        /*
@@ -250,6 +265,7 @@ static void pv_wait_head(struct qspinlock *lock, struct mcs_spinlock *node)
        struct pv_node *pn = (struct pv_node *)node;
        struct __qspinlock *l = (void *)lock;
        struct qspinlock **lp = NULL;
+       int waitcnt = 0;
        int loop;
 
        /*
@@ -259,7 +275,7 @@ static void pv_wait_head(struct qspinlock *lock, struct mcs_spinlock *node)
        if (READ_ONCE(pn->state) == vcpu_hashed)
                lp = (struct qspinlock **)1;
 
-       for (;;) {
+       for (;; waitcnt++) {
                for (loop = SPIN_THRESHOLD; loop; loop--) {
                        if (!READ_ONCE(l->locked))
                                return;
@@ -290,14 +306,19 @@ static void pv_wait_head(struct qspinlock *lock, struct mcs_spinlock *node)
                                return;
                        }
                }
+               qstat_inc(qstat_pv_wait_head, true);
+               qstat_inc(qstat_pv_wait_again, waitcnt);
                pv_wait(&l->locked, _Q_SLOW_VAL);
 
+               if (!READ_ONCE(l->locked))
+                       return;
                /*
                 * The unlocker should have freed the lock before kicking the
                 * CPU. So if the lock is still not free, it is a spurious
                 * wakeup and so the vCPU should wait again after spinning for
                 * a while.
                 */
+               qstat_inc(qstat_pv_spurious_wakeup, true);
        }
 
        /*
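
Note: both the early return and the spurious-wakeup counter follow from the
pv_wait()/pv_kick() contract: pv_wait(ptr, val) may halt the vCPU only while
*ptr == val, but it is allowed to return at any time with no guarantee that a
matching pv_kick() happened, so callers must re-check the condition they were
waiting for. Purely as an illustration of that contract (hypothetical
example_* names, not any real hypervisor backend):

static void example_pv_wait(u8 *ptr, u8 val)
{
        if (READ_ONCE(*ptr) != val)
                return; /* condition already changed: do not block */
        /* a real backend would halt the vCPU here until it is kicked */
}

static void example_pv_kick(int cpu)
{
        /* a real backend would wake the vCPU currently halted in pv_wait() */
}

Any return from pv_wait() that finds the lock still held is therefore counted
as a spurious wakeup before the vCPU goes back to spinning.
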
@@ -308,23 +329,14 @@ static void pv_wait_head(struct qspinlock *lock, struct mcs_spinlock *node)
 }
 
 /*
- * PV version of the unlock function to be used in stead of
- * queued_spin_unlock().
+ * PV versions of the unlock fastpath and slowpath functions to be used
+ * instead of queued_spin_unlock().
  */
-__visible void __pv_queued_spin_unlock(struct qspinlock *lock)
+__visible void
+__pv_queued_spin_unlock_slowpath(struct qspinlock *lock, u8 locked)
 {
        struct __qspinlock *l = (void *)lock;
        struct pv_node *node;
-       u8 locked;
-
-       /*
-        * We must not unlock if SLOW, because in that case we must first
-        * unhash. Otherwise it would be possible to have multiple @lock
-        * entries, which would be BAD.
-        */
-       locked = cmpxchg(&l->locked, _Q_LOCKED_VAL, 0);
-       if (likely(locked == _Q_LOCKED_VAL))
-               return;
 
        if (unlikely(locked != _Q_SLOW_VAL)) {
                WARN(!debug_locks_silent,
@@ -361,14 +373,35 @@ __visible void __pv_queued_spin_unlock(struct qspinlock *lock)
         * vCPU is harmless other than the additional latency in completing
         * the unlock.
         */
+       qstat_inc(qstat_pv_kick_unlock, true);
        pv_kick(node->cpu);
 }
+
 /*
  * Include the architecture specific callee-save thunk of the
  * __pv_queued_spin_unlock(). This thunk is put together with
- * __pv_queued_spin_unlock() near the top of the file to make sure
- * that the callee-save thunk and the real unlock function are close
- * to each other sharing consecutive instruction cachelines.
+ * __pv_queued_spin_unlock() to keep the callee-save thunk and the real unlock
+ * function close to each other, sharing consecutive instruction cachelines.
+ * Alternatively, an architecture-specific version of __pv_queued_spin_unlock()
+ * can be defined.
  */
 #include <asm/qspinlock_paravirt.h>
 
+#ifndef __pv_queued_spin_unlock
+__visible void __pv_queued_spin_unlock(struct qspinlock *lock)
+{
+       struct __qspinlock *l = (void *)lock;
+       u8 locked;
+
+       /*
+        * We must not unlock if SLOW, because in that case we must first
+        * unhash. Otherwise it would be possible to have multiple @lock
+        * entries, which would be BAD.
+        */
+       locked = cmpxchg(&l->locked, _Q_LOCKED_VAL, 0);
+       if (likely(locked == _Q_LOCKED_VAL))
+               return;
+
+       __pv_queued_spin_unlock_slowpath(lock, locked);
+}
+#endif /* __pv_queued_spin_unlock */
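
Note: the #ifndef guard above is what lets an architecture replace the unlock
fastpath entirely: if asm/qspinlock_paravirt.h defines __pv_queued_spin_unlock
(typically as an optimized, hand-written stub), the generic C fallback is
compiled out. A hypothetical arch header fragment, shown only to illustrate
the override mechanism:

/* hypothetical <asm/qspinlock_paravirt.h> fragment -- illustration only */
#define __pv_queued_spin_unlock __pv_queued_spin_unlock

/* arch-provided unlock fastpath, often written in assembly */
__visible void __pv_queued_spin_unlock(struct qspinlock *lock);

Whatever the arch body looks like, it must follow the same protocol as the
generic fallback: cmpxchg the locked byte from _Q_LOCKED_VAL to 0 and, if the
old value was anything else (i.e. _Q_SLOW_VAL), hand it to
__pv_queued_spin_unlock_slowpath() so the hash entry is removed before the
lock is finally released.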