Commit fd8fae50 authored by Nicholas Piggin's avatar Nicholas Piggin Committed by Michael Ellerman

powerpc/qspinlock: propagate owner preemptedness rather than CPU number

Rather than propagating the CPU number of the preempted lock owner,
just propagate whether the owner was preempted. Waiters must read the
lock value when yielding to it to prevent races anyway, so might as
well always load the owner CPU from the lock.

To further simplify the code, also don't propagate the -1 (or
sleepy=false in the new scheme) down the queue. Instead, have the
waiters clear it themselves when finding the lock owner is not
preempted.
Signed-off-by: default avatarNicholas Piggin <npiggin@gmail.com>
Tested-by: default avatarShrikanth Hegde <sshegde@linux.vnet.ibm.com>
Reviewed-by: default avatar"Nysal Jan K.A" <nysal@linux.ibm.com>
Signed-off-by: default avatarMichael Ellerman <mpe@ellerman.id.au>
Link: https://msgid.link/20231016124305.139923-4-npiggin@gmail.com
parent f6568647
...@@ -16,7 +16,8 @@ struct qnode { ...@@ -16,7 +16,8 @@ struct qnode {
struct qnode *next; struct qnode *next;
struct qspinlock *lock; struct qspinlock *lock;
int cpu; int cpu;
int yield_cpu; u8 sleepy; /* 1 if the previous vCPU was preempted or
* if the previous node was sleepy */
u8 locked; /* 1 if lock acquired */ u8 locked; /* 1 if lock acquired */
}; };
...@@ -349,7 +350,7 @@ static __always_inline bool yield_head_to_locked_owner(struct qspinlock *lock, u ...@@ -349,7 +350,7 @@ static __always_inline bool yield_head_to_locked_owner(struct qspinlock *lock, u
return __yield_to_locked_owner(lock, val, paravirt, mustq); return __yield_to_locked_owner(lock, val, paravirt, mustq);
} }
static __always_inline void propagate_yield_cpu(struct qnode *node, u32 val, int *set_yield_cpu, bool paravirt) static __always_inline void propagate_sleepy(struct qnode *node, u32 val, bool *set_sleepy, bool paravirt)
{ {
struct qnode *next; struct qnode *next;
int owner; int owner;
...@@ -358,21 +359,17 @@ static __always_inline void propagate_yield_cpu(struct qnode *node, u32 val, int ...@@ -358,21 +359,17 @@ static __always_inline void propagate_yield_cpu(struct qnode *node, u32 val, int
return; return;
if (!pv_yield_propagate_owner) if (!pv_yield_propagate_owner)
return; return;
if (*set_sleepy)
owner = get_owner_cpu(val);
if (*set_yield_cpu == owner)
return; return;
next = READ_ONCE(node->next); next = READ_ONCE(node->next);
if (!next) if (!next)
return; return;
owner = get_owner_cpu(val);
if (vcpu_is_preempted(owner)) { if (vcpu_is_preempted(owner)) {
next->yield_cpu = owner; next->sleepy = 1;
*set_yield_cpu = owner; *set_sleepy = true;
} else if (*set_yield_cpu != -1) {
next->yield_cpu = owner;
*set_yield_cpu = owner;
} }
} }
...@@ -380,7 +377,6 @@ static __always_inline void propagate_yield_cpu(struct qnode *node, u32 val, int ...@@ -380,7 +377,6 @@ static __always_inline void propagate_yield_cpu(struct qnode *node, u32 val, int
static __always_inline bool yield_to_prev(struct qspinlock *lock, struct qnode *node, int prev_cpu, bool paravirt) static __always_inline bool yield_to_prev(struct qspinlock *lock, struct qnode *node, int prev_cpu, bool paravirt)
{ {
u32 yield_count; u32 yield_count;
int yield_cpu;
bool preempted = false; bool preempted = false;
if (!paravirt) if (!paravirt)
...@@ -389,36 +385,32 @@ static __always_inline bool yield_to_prev(struct qspinlock *lock, struct qnode * ...@@ -389,36 +385,32 @@ static __always_inline bool yield_to_prev(struct qspinlock *lock, struct qnode *
if (!pv_yield_propagate_owner) if (!pv_yield_propagate_owner)
goto yield_prev; goto yield_prev;
yield_cpu = READ_ONCE(node->yield_cpu); if (!READ_ONCE(node->sleepy)) {
if (yield_cpu == -1) { /* Propagate back sleepy==false */
/* Propagate back the -1 CPU */ if (node->next && node->next->sleepy)
if (node->next && node->next->yield_cpu != -1) node->next->sleepy = 0;
node->next->yield_cpu = yield_cpu;
goto yield_prev; goto yield_prev;
} } else {
u32 val = READ_ONCE(lock->val);
yield_count = yield_count_of(yield_cpu);
if ((yield_count & 1) == 0) if (val & _Q_LOCKED_VAL) {
goto yield_prev; /* owner vcpu is running */ if (node->next && !node->next->sleepy) {
/*
if (get_owner_cpu(READ_ONCE(lock->val)) != yield_cpu) * Propagate sleepy to next waiter. Only if
goto yield_prev; /* re-sample lock owner */ * owner is preempted, which allows the queue
* to become "non-sleepy" if vCPU preemption
spin_end(); * ceases to occur, even if the lock remains
* highly contended.
preempted = true; */
seen_sleepy_node(); if (vcpu_is_preempted(get_owner_cpu(val)))
node->next->sleepy = 1;
smp_rmb(); }
if (yield_cpu == node->yield_cpu) { preempted = yield_to_locked_owner(lock, val, paravirt);
if (node->next && node->next->yield_cpu != yield_cpu) if (preempted)
node->next->yield_cpu = yield_cpu; return preempted;
yield_to_preempted(yield_cpu, yield_count); }
spin_begin();
return preempted;
} }
spin_begin();
yield_prev: yield_prev:
if (!pv_yield_prev) if (!pv_yield_prev)
...@@ -541,7 +533,7 @@ static __always_inline void queued_spin_lock_mcs_queue(struct qspinlock *lock, b ...@@ -541,7 +533,7 @@ static __always_inline void queued_spin_lock_mcs_queue(struct qspinlock *lock, b
bool sleepy = false; bool sleepy = false;
bool mustq = false; bool mustq = false;
int idx; int idx;
int set_yield_cpu = -1; bool set_sleepy = false;
int iters = 0; int iters = 0;
BUILD_BUG_ON(CONFIG_NR_CPUS >= (1U << _Q_TAIL_CPU_BITS)); BUILD_BUG_ON(CONFIG_NR_CPUS >= (1U << _Q_TAIL_CPU_BITS));
...@@ -565,7 +557,7 @@ static __always_inline void queued_spin_lock_mcs_queue(struct qspinlock *lock, b ...@@ -565,7 +557,7 @@ static __always_inline void queued_spin_lock_mcs_queue(struct qspinlock *lock, b
node->next = NULL; node->next = NULL;
node->lock = lock; node->lock = lock;
node->cpu = smp_processor_id(); node->cpu = smp_processor_id();
node->yield_cpu = -1; node->sleepy = 0;
node->locked = 0; node->locked = 0;
tail = encode_tail_cpu(node->cpu); tail = encode_tail_cpu(node->cpu);
...@@ -599,9 +591,9 @@ static __always_inline void queued_spin_lock_mcs_queue(struct qspinlock *lock, b ...@@ -599,9 +591,9 @@ static __always_inline void queued_spin_lock_mcs_queue(struct qspinlock *lock, b
spec_barrier(); spec_barrier();
spin_end(); spin_end();
/* Clear out stale propagated yield_cpu */ /* Clear out stale propagated sleepy */
if (paravirt && pv_yield_propagate_owner && node->yield_cpu != -1) if (paravirt && pv_yield_propagate_owner && node->sleepy)
node->yield_cpu = -1; node->sleepy = 0;
smp_rmb(); /* acquire barrier for the mcs lock */ smp_rmb(); /* acquire barrier for the mcs lock */
...@@ -644,7 +636,7 @@ static __always_inline void queued_spin_lock_mcs_queue(struct qspinlock *lock, b ...@@ -644,7 +636,7 @@ static __always_inline void queued_spin_lock_mcs_queue(struct qspinlock *lock, b
} }
} }
propagate_yield_cpu(node, val, &set_yield_cpu, paravirt); propagate_sleepy(node, val, &set_sleepy, paravirt);
preempted = yield_head_to_locked_owner(lock, val, paravirt); preempted = yield_head_to_locked_owner(lock, val, paravirt);
if (!maybe_stealers) if (!maybe_stealers)
continue; continue;
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment