]> git.hungrycats.org Git - linux/commitdiff
[PATCH] Futex lock division
authorRusty Russell <rusty@rustcorp.com.au>
Wed, 24 Sep 2003 13:41:18 +0000 (06:41 -0700)
committerLinus Torvalds <torvalds@home.osdl.org>
Wed, 24 Sep 2003 13:41:18 +0000 (06:41 -0700)
From: "Hu, Boris" <boris.hu@intel.com>

Andrew reminded me of this.

Simple change to split the futex lock into a per-hashchain lock.
Don't bother cacheline aligning: Jamie points out that increasing
FUTEX_HASHBITS would have more payoff.

Ulrich Drepper reports 6% improvement in on a 4way futex-thrashing
benchmark.

kernel/futex.c

index 6691f6475869f89dd38955ad56563a48db6d2cd7..1a354ba725225838740742ed71f92b623771c166 100644 (file)
@@ -79,9 +79,16 @@ struct futex_q {
        struct file *filp;
 };
 
+/*
+ * Split the global futex_lock into every hash list lock.
+ */
+struct futex_hash_bucket {
+       spinlock_t              lock;
+       struct list_head       chain;
+};
+
 /* The key for the hash is the address + index + offset within page */
-static struct list_head futex_queues[1<<FUTEX_HASHBITS];
-static spinlock_t futex_lock = SPIN_LOCK_UNLOCKED;
+static struct futex_hash_bucket futex_queues[1<<FUTEX_HASHBITS];
 
 /* Futex-fs vfsmount entry: */
 static struct vfsmount *futex_mnt;
@@ -89,7 +96,7 @@ static struct vfsmount *futex_mnt;
 /*
  * We hash on the keys returned from get_futex_key (see below).
  */
-static inline struct list_head *hash_futex(union futex_key *key)
+static inline struct futex_hash_bucket *hash_futex(union futex_key *key)
 {
        return &futex_queues[hash_long(key->both.word
                                       + (unsigned long) key->both.ptr
@@ -214,6 +221,7 @@ static int get_futex_key(unsigned long uaddr, union futex_key *key)
 static int futex_wake(unsigned long uaddr, int num)
 {
        struct list_head *i, *next, *head;
+       struct futex_hash_bucket *bh;
        union futex_key key;
        int ret;
 
@@ -223,9 +231,10 @@ static int futex_wake(unsigned long uaddr, int num)
        if (unlikely(ret != 0))
                goto out;
 
-       head = hash_futex(&key);
+       bh = hash_futex(&key);
+       spin_lock(&bh->lock);
+       head = &bh->chain;
 
-       spin_lock(&futex_lock);
        list_for_each_safe(i, next, head) {
                struct futex_q *this = list_entry(i, struct futex_q, list);
 
@@ -239,7 +248,7 @@ static int futex_wake(unsigned long uaddr, int num)
                                break;
                }
        }
-       spin_unlock(&futex_lock);
+       spin_unlock(&bh->lock);
 
 out:
        up_read(&current->mm->mmap_sem);
@@ -254,6 +263,7 @@ static int futex_requeue(unsigned long uaddr1, unsigned long uaddr2,
                                int nr_wake, int nr_requeue)
 {
        struct list_head *i, *next, *head1, *head2;
+       struct futex_hash_bucket *bh1, *bh2;
        union futex_key key1, key2;
        int ret;
 
@@ -266,10 +276,19 @@ static int futex_requeue(unsigned long uaddr1, unsigned long uaddr2,
        if (unlikely(ret != 0))
                goto out;
 
-       head1 = hash_futex(&key1);
-       head2 = hash_futex(&key2);
+       bh1 = hash_futex(&key1);
+       bh2 = hash_futex(&key2);
+       if (bh1 < bh2) {
+               spin_lock(&bh1->lock);
+               spin_lock(&bh2->lock);
+       } else {
+               spin_lock(&bh2->lock);
+               if (bh1 > bh2)
+                       spin_lock(&bh1->lock);
+       }
+       head1 = &bh1->chain;
+       head2 = &bh2->chain;
 
-       spin_lock(&futex_lock);
        list_for_each_safe(i, next, head1) {
                struct futex_q *this = list_entry(i, struct futex_q, list);
 
@@ -291,8 +310,14 @@ static int futex_requeue(unsigned long uaddr1, unsigned long uaddr2,
                        }
                }
        }
-       spin_unlock(&futex_lock);
-
+       if (bh1 < bh2) {
+               spin_unlock(&bh2->lock);
+               spin_unlock(&bh1->lock);
+       } else {
+               if (bh1 > bh2)
+                       spin_unlock(&bh1->lock);
+               spin_unlock(&bh2->lock);
+       }
 out:
        up_read(&current->mm->mmap_sem);
        return ret;
@@ -301,28 +326,30 @@ out:
 static inline void queue_me(struct futex_q *q, union futex_key *key,
                            int fd, struct file *filp)
 {
-       struct list_head *head = hash_futex(key);
+       struct futex_hash_bucket *bh = hash_futex(key);
+       struct list_head *head = &bh->chain;
 
        q->key = *key;
        q->fd = fd;
        q->filp = filp;
 
-       spin_lock(&futex_lock);
+       spin_lock(&bh->lock);
        list_add_tail(&q->list, head);
-       spin_unlock(&futex_lock);
+       spin_unlock(&bh->lock);
 }
 
 /* Return 1 if we were still queued (ie. 0 means we were woken) */
 static inline int unqueue_me(struct futex_q *q)
 {
+       struct futex_hash_bucket *bh = hash_futex(&q->key);
        int ret = 0;
 
-       spin_lock(&futex_lock);
+       spin_lock(&bh->lock);
        if (!list_empty(&q->list)) {
                list_del(&q->list);
                ret = 1;
        }
-       spin_unlock(&futex_lock);
+       spin_unlock(&bh->lock);
        return ret;
 }
 
@@ -332,6 +359,7 @@ static int futex_wait(unsigned long uaddr, int val, unsigned long time)
        int ret, curval;
        union futex_key key;
        struct futex_q q;
+       struct futex_hash_bucket *bh = NULL;
 
  try_again:
        init_waitqueue_head(&q.waiters);
@@ -373,19 +401,20 @@ static int futex_wait(unsigned long uaddr, int val, unsigned long time)
         * the waiter from the list.
         */
        add_wait_queue(&q.waiters, &wait);
-       spin_lock(&futex_lock);
+       bh = hash_futex(&key);
+       spin_lock(&bh->lock);
        set_current_state(TASK_INTERRUPTIBLE);
 
        if (unlikely(list_empty(&q.list))) {
                /*
                 * We were woken already.
                 */
-               spin_unlock(&futex_lock);
+               spin_unlock(&bh->lock);
                set_current_state(TASK_RUNNING);
                return 0;
        }
 
-       spin_unlock(&futex_lock);
+       spin_unlock(&bh->lock);
        time = schedule_timeout(time);
        set_current_state(TASK_RUNNING);
 
@@ -435,13 +464,14 @@ static unsigned int futex_poll(struct file *filp,
                               struct poll_table_struct *wait)
 {
        struct futex_q *q = filp->private_data;
+       struct futex_hash_bucket *bh = hash_futex(&q->key);
        int ret = 0;
 
        poll_wait(filp, &q->waiters, wait);
-       spin_lock(&futex_lock);
+       spin_lock(&bh->lock);
        if (list_empty(&q->list))
                ret = POLLIN | POLLRDNORM;
-       spin_unlock(&futex_lock);
+       spin_unlock(&bh->lock);
 
        return ret;
 }
@@ -587,8 +617,10 @@ static int __init init(void)
        register_filesystem(&futex_fs_type);
        futex_mnt = kern_mount(&futex_fs_type);
 
-       for (i = 0; i < ARRAY_SIZE(futex_queues); i++)
-               INIT_LIST_HEAD(&futex_queues[i]);
+       for (i = 0; i < ARRAY_SIZE(futex_queues); i++) {
+               INIT_LIST_HEAD(&futex_queues[i].chain);
+               futex_queues[i].lock = SPIN_LOCK_UNLOCKED;
+       }
        return 0;
 }
 __initcall(init);