Commit b58da0d0 authored by Rusty Russell's avatar Rusty Russell Committed by Linus Torvalds

[PATCH] Futex lock division

From: "Hu, Boris" <boris.hu@intel.com>

Andrew reminded me of this.

Simple change to split the futex lock into a per-hashchain lock.
Don't bother cacheline aligning: Jamie points out that increasing
FUTEX_HASHBITS would have more payoff.

Ulrich Drepper reports 6% improvement in on a 4way futex-thrashing
benchmark.
parent 176c1451
...@@ -79,9 +79,16 @@ struct futex_q { ...@@ -79,9 +79,16 @@ struct futex_q {
struct file *filp; struct file *filp;
}; };
/*
* Split the global futex_lock into every hash list lock.
*/
struct futex_hash_bucket {
spinlock_t lock;
struct list_head chain;
};
/* The key for the hash is the address + index + offset within page */ /* The key for the hash is the address + index + offset within page */
static struct list_head futex_queues[1<<FUTEX_HASHBITS]; static struct futex_hash_bucket futex_queues[1<<FUTEX_HASHBITS];
static spinlock_t futex_lock = SPIN_LOCK_UNLOCKED;
/* Futex-fs vfsmount entry: */ /* Futex-fs vfsmount entry: */
static struct vfsmount *futex_mnt; static struct vfsmount *futex_mnt;
...@@ -89,7 +96,7 @@ static struct vfsmount *futex_mnt; ...@@ -89,7 +96,7 @@ static struct vfsmount *futex_mnt;
/* /*
* We hash on the keys returned from get_futex_key (see below). * We hash on the keys returned from get_futex_key (see below).
*/ */
static inline struct list_head *hash_futex(union futex_key *key) static inline struct futex_hash_bucket *hash_futex(union futex_key *key)
{ {
return &futex_queues[hash_long(key->both.word return &futex_queues[hash_long(key->both.word
+ (unsigned long) key->both.ptr + (unsigned long) key->both.ptr
...@@ -214,6 +221,7 @@ static int get_futex_key(unsigned long uaddr, union futex_key *key) ...@@ -214,6 +221,7 @@ static int get_futex_key(unsigned long uaddr, union futex_key *key)
static int futex_wake(unsigned long uaddr, int num) static int futex_wake(unsigned long uaddr, int num)
{ {
struct list_head *i, *next, *head; struct list_head *i, *next, *head;
struct futex_hash_bucket *bh;
union futex_key key; union futex_key key;
int ret; int ret;
...@@ -223,9 +231,10 @@ static int futex_wake(unsigned long uaddr, int num) ...@@ -223,9 +231,10 @@ static int futex_wake(unsigned long uaddr, int num)
if (unlikely(ret != 0)) if (unlikely(ret != 0))
goto out; goto out;
head = hash_futex(&key); bh = hash_futex(&key);
spin_lock(&bh->lock);
head = &bh->chain;
spin_lock(&futex_lock);
list_for_each_safe(i, next, head) { list_for_each_safe(i, next, head) {
struct futex_q *this = list_entry(i, struct futex_q, list); struct futex_q *this = list_entry(i, struct futex_q, list);
...@@ -239,7 +248,7 @@ static int futex_wake(unsigned long uaddr, int num) ...@@ -239,7 +248,7 @@ static int futex_wake(unsigned long uaddr, int num)
break; break;
} }
} }
spin_unlock(&futex_lock); spin_unlock(&bh->lock);
out: out:
up_read(&current->mm->mmap_sem); up_read(&current->mm->mmap_sem);
...@@ -254,6 +263,7 @@ static int futex_requeue(unsigned long uaddr1, unsigned long uaddr2, ...@@ -254,6 +263,7 @@ static int futex_requeue(unsigned long uaddr1, unsigned long uaddr2,
int nr_wake, int nr_requeue) int nr_wake, int nr_requeue)
{ {
struct list_head *i, *next, *head1, *head2; struct list_head *i, *next, *head1, *head2;
struct futex_hash_bucket *bh1, *bh2;
union futex_key key1, key2; union futex_key key1, key2;
int ret; int ret;
...@@ -266,10 +276,19 @@ static int futex_requeue(unsigned long uaddr1, unsigned long uaddr2, ...@@ -266,10 +276,19 @@ static int futex_requeue(unsigned long uaddr1, unsigned long uaddr2,
if (unlikely(ret != 0)) if (unlikely(ret != 0))
goto out; goto out;
head1 = hash_futex(&key1); bh1 = hash_futex(&key1);
head2 = hash_futex(&key2); bh2 = hash_futex(&key2);
if (bh1 < bh2) {
spin_lock(&bh1->lock);
spin_lock(&bh2->lock);
} else {
spin_lock(&bh2->lock);
if (bh1 > bh2)
spin_lock(&bh1->lock);
}
head1 = &bh1->chain;
head2 = &bh2->chain;
spin_lock(&futex_lock);
list_for_each_safe(i, next, head1) { list_for_each_safe(i, next, head1) {
struct futex_q *this = list_entry(i, struct futex_q, list); struct futex_q *this = list_entry(i, struct futex_q, list);
...@@ -291,8 +310,14 @@ static int futex_requeue(unsigned long uaddr1, unsigned long uaddr2, ...@@ -291,8 +310,14 @@ static int futex_requeue(unsigned long uaddr1, unsigned long uaddr2,
} }
} }
} }
spin_unlock(&futex_lock); if (bh1 < bh2) {
spin_unlock(&bh2->lock);
spin_unlock(&bh1->lock);
} else {
if (bh1 > bh2)
spin_unlock(&bh1->lock);
spin_unlock(&bh2->lock);
}
out: out:
up_read(&current->mm->mmap_sem); up_read(&current->mm->mmap_sem);
return ret; return ret;
...@@ -301,28 +326,30 @@ static int futex_requeue(unsigned long uaddr1, unsigned long uaddr2, ...@@ -301,28 +326,30 @@ static int futex_requeue(unsigned long uaddr1, unsigned long uaddr2,
static inline void queue_me(struct futex_q *q, union futex_key *key, static inline void queue_me(struct futex_q *q, union futex_key *key,
int fd, struct file *filp) int fd, struct file *filp)
{ {
struct list_head *head = hash_futex(key); struct futex_hash_bucket *bh = hash_futex(key);
struct list_head *head = &bh->chain;
q->key = *key; q->key = *key;
q->fd = fd; q->fd = fd;
q->filp = filp; q->filp = filp;
spin_lock(&futex_lock); spin_lock(&bh->lock);
list_add_tail(&q->list, head); list_add_tail(&q->list, head);
spin_unlock(&futex_lock); spin_unlock(&bh->lock);
} }
/* Return 1 if we were still queued (ie. 0 means we were woken) */ /* Return 1 if we were still queued (ie. 0 means we were woken) */
static inline int unqueue_me(struct futex_q *q) static inline int unqueue_me(struct futex_q *q)
{ {
struct futex_hash_bucket *bh = hash_futex(&q->key);
int ret = 0; int ret = 0;
spin_lock(&futex_lock); spin_lock(&bh->lock);
if (!list_empty(&q->list)) { if (!list_empty(&q->list)) {
list_del(&q->list); list_del(&q->list);
ret = 1; ret = 1;
} }
spin_unlock(&futex_lock); spin_unlock(&bh->lock);
return ret; return ret;
} }
...@@ -332,6 +359,7 @@ static int futex_wait(unsigned long uaddr, int val, unsigned long time) ...@@ -332,6 +359,7 @@ static int futex_wait(unsigned long uaddr, int val, unsigned long time)
int ret, curval; int ret, curval;
union futex_key key; union futex_key key;
struct futex_q q; struct futex_q q;
struct futex_hash_bucket *bh = NULL;
try_again: try_again:
init_waitqueue_head(&q.waiters); init_waitqueue_head(&q.waiters);
...@@ -373,19 +401,20 @@ static int futex_wait(unsigned long uaddr, int val, unsigned long time) ...@@ -373,19 +401,20 @@ static int futex_wait(unsigned long uaddr, int val, unsigned long time)
* the waiter from the list. * the waiter from the list.
*/ */
add_wait_queue(&q.waiters, &wait); add_wait_queue(&q.waiters, &wait);
spin_lock(&futex_lock); bh = hash_futex(&key);
spin_lock(&bh->lock);
set_current_state(TASK_INTERRUPTIBLE); set_current_state(TASK_INTERRUPTIBLE);
if (unlikely(list_empty(&q.list))) { if (unlikely(list_empty(&q.list))) {
/* /*
* We were woken already. * We were woken already.
*/ */
spin_unlock(&futex_lock); spin_unlock(&bh->lock);
set_current_state(TASK_RUNNING); set_current_state(TASK_RUNNING);
return 0; return 0;
} }
spin_unlock(&futex_lock); spin_unlock(&bh->lock);
time = schedule_timeout(time); time = schedule_timeout(time);
set_current_state(TASK_RUNNING); set_current_state(TASK_RUNNING);
...@@ -435,13 +464,14 @@ static unsigned int futex_poll(struct file *filp, ...@@ -435,13 +464,14 @@ static unsigned int futex_poll(struct file *filp,
struct poll_table_struct *wait) struct poll_table_struct *wait)
{ {
struct futex_q *q = filp->private_data; struct futex_q *q = filp->private_data;
struct futex_hash_bucket *bh = hash_futex(&q->key);
int ret = 0; int ret = 0;
poll_wait(filp, &q->waiters, wait); poll_wait(filp, &q->waiters, wait);
spin_lock(&futex_lock); spin_lock(&bh->lock);
if (list_empty(&q->list)) if (list_empty(&q->list))
ret = POLLIN | POLLRDNORM; ret = POLLIN | POLLRDNORM;
spin_unlock(&futex_lock); spin_unlock(&bh->lock);
return ret; return ret;
} }
...@@ -587,8 +617,10 @@ static int __init init(void) ...@@ -587,8 +617,10 @@ static int __init init(void)
register_filesystem(&futex_fs_type); register_filesystem(&futex_fs_type);
futex_mnt = kern_mount(&futex_fs_type); futex_mnt = kern_mount(&futex_fs_type);
for (i = 0; i < ARRAY_SIZE(futex_queues); i++) for (i = 0; i < ARRAY_SIZE(futex_queues); i++) {
INIT_LIST_HEAD(&futex_queues[i]); INIT_LIST_HEAD(&futex_queues[i].chain);
futex_queues[i].lock = SPIN_LOCK_UNLOCKED;
}
return 0; return 0;
} }
__initcall(init); __initcall(init);
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment