[前][次][番号順一覧][スレッド一覧]

ruby-changes:46485

From: normal <ko1@a...>
Date: Mon, 8 May 2017 09:19:00 +0900 (JST)
Subject: [ruby-changes:46485] normal:r58604 (trunk): reduce rb_mutex_t size from 160 to 80 bytes on 64-bit

normal	2017-05-08 09:18:53 +0900 (Mon, 08 May 2017)

  New Revision: 58604

  https://svn.ruby-lang.org/cgi-bin/viewvc.cgi?view=revision&revision=58604

  Log:
    reduce rb_mutex_t size from 160 to 80 bytes on 64-bit
    
    Instead of relying on a native condition variable and mutex for
    every Ruby Mutex object, use a doubly linked-list to implement a
    waiter queue in the Mutex.  The immediate benefit of this is
    reducing the size of every Mutex object, as some projects have
    many objects requiring synchronization.
    
    In the future, this technique of using a linked list and an
    on-stack list node (struct mutex_waiter) should allow us to easily
    transition to an M:N threading model, as we can avoid the native
    thread dependency when implementing Mutex.
    
    We already do something similar for autoload in variable.c,
    and this was inspired by the Linux kernel wait queue (as
    ccan/list is inspired by the Linux kernel linked-list).
    
    Finally, there are big performance improvements for Mutex
    benchmarks, especially in contended cases:
    
    measure target: real
    
    name            |trunk  |built
    ----------------|------:|------:
    loop_whileloop2 |  0.149|  0.148
    vm2_mutex*      |  0.893|  0.651
    vm_thread_mutex1|  0.809|  0.624
    vm_thread_mutex2|  2.608|  0.628
    vm_thread_mutex3| 28.227|  0.881
    
    Speedup ratio: compare with the result of `trunk' (greater is better)
    
    name            |built
    ----------------|------:
    loop_whileloop2 |  1.002
    vm2_mutex*      |  1.372
    vm_thread_mutex1|  1.297
    vm_thread_mutex2|  4.149
    vm_thread_mutex3| 32.044
    
    Tested on AMD FX-8320 8-core at 3.5GHz
    
    * thread_sync.c (struct mutex_waiter): new on-stack struct
      (struct rb_mutex_struct): remove native lock/cond, use ccan/list
      (rb_mutex_num_waiting): new function for debug_deadlock_check
      (mutex_free): remove native_*_destroy
      (mutex_alloc): initialize waitq, remove native_*_initialize
      (rb_mutex_trylock): remove native_mutex_{lock,unlock}
      (lock_func): remove
      (lock_interrupt): remove
      (rb_mutex_lock): rewrite waiting path to use native_sleep + ccan/list
      (rb_mutex_unlock_th): rewrite to wake up from native_sleep
      using rb_threadptr_interrupt
      (rb_mutex_abandon_all): empty waitq
    * thread.c (debug_deadlock_check): update for new struct
      (rb_check_deadlock): ditto
      [ruby-core:80913] [Feature #13517]

  Modified files:
    trunk/thread.c
    trunk/thread_sync.c
Index: thread_sync.c
===================================================================
--- thread_sync.c	(revision 58603)
+++ thread_sync.c	(revision 58604)
@@ -1,16 +1,21 @@ https://github.com/ruby/ruby/blob/trunk/thread_sync.c#L1
 /* included by thread.c */
+#include "ccan/list/list.h"
 
 static VALUE rb_cMutex, rb_cQueue, rb_cSizedQueue, rb_cConditionVariable;
 static VALUE rb_eClosedQueueError;
 
 /* Mutex */
 
+/* mutex_waiter is always on-stack */
+struct mutex_waiter {
+    rb_thread_t *th;
+    struct list_node node;
+};
+
 typedef struct rb_mutex_struct {
-    rb_nativethread_lock_t lock;
-    rb_nativethread_cond_t cond;
     struct rb_thread_struct volatile *th;
     struct rb_mutex_struct *next_mutex;
-    int cond_waiting;
+    struct list_head waitq; /* protected by GVL */
     int allow_trap;
 } rb_mutex_t;
 
@@ -51,6 +56,19 @@ static const char* rb_mutex_unlock_th(rb https://github.com/ruby/ruby/blob/trunk/thread_sync.c#L56
 
 #define mutex_mark NULL
 
+static size_t
+rb_mutex_num_waiting(rb_mutex_t *mutex)
+{
+    struct mutex_waiter *w;
+    size_t n = 0;
+
+    list_for_each(&mutex->waitq, w, node) {
+	n++;
+    }
+
+    return n;
+}
+
 static void
 mutex_free(void *ptr)
 {
@@ -60,8 +78,6 @@ mutex_free(void *ptr) https://github.com/ruby/ruby/blob/trunk/thread_sync.c#L78
 	const char *err = rb_mutex_unlock_th(mutex, mutex->th);
 	if (err) rb_bug("%s", err);
     }
-    native_mutex_destroy(&mutex->lock);
-    native_cond_destroy(&mutex->cond);
     ruby_xfree(ptr);
 }
 
@@ -95,8 +111,7 @@ mutex_alloc(VALUE klass) https://github.com/ruby/ruby/blob/trunk/thread_sync.c#L111
     rb_mutex_t *mutex;
 
     obj = TypedData_Make_Struct(klass, rb_mutex_t, &mutex_data_type, mutex);
-    native_mutex_initialize(&mutex->lock);
-    native_cond_initialize(&mutex->cond, RB_CONDATTR_CLOCK_MONOTONIC);
+    list_head_init(&mutex->waitq);
     return obj;
 }
 
@@ -158,7 +173,6 @@ rb_mutex_trylock(VALUE self) https://github.com/ruby/ruby/blob/trunk/thread_sync.c#L173
     VALUE locked = Qfalse;
     GetMutexPtr(self, mutex);
 
-    native_mutex_lock(&mutex->lock);
     if (mutex->th == 0) {
 	rb_thread_t *th = GET_THREAD();
 	mutex->th = th;
@@ -166,61 +180,10 @@ rb_mutex_trylock(VALUE self) https://github.com/ruby/ruby/blob/trunk/thread_sync.c#L180
 
 	mutex_locked(th, self);
     }
-    native_mutex_unlock(&mutex->lock);
 
     return locked;
 }
 
-static int
-lock_func(rb_thread_t *th, rb_mutex_t *mutex, int timeout_ms)
-{
-    int interrupted = 0;
-    int err = 0;
-
-    mutex->cond_waiting++;
-    for (;;) {
-	if (!mutex->th) {
-	    mutex->th = th;
-	    break;
-	}
-	if (RUBY_VM_INTERRUPTED(th)) {
-	    interrupted = 1;
-	    break;
-	}
-	if (err == ETIMEDOUT) {
-	    interrupted = 2;
-	    break;
-	}
-
-	if (timeout_ms) {
-	    struct timespec timeout_rel;
-	    struct timespec timeout;
-
-	    timeout_rel.tv_sec = 0;
-	    timeout_rel.tv_nsec = timeout_ms * 1000 * 1000;
-	    timeout = native_cond_timeout(&mutex->cond, timeout_rel);
-	    err = native_cond_timedwait(&mutex->cond, &mutex->lock, &timeout);
-	}
-	else {
-	    native_cond_wait(&mutex->cond, &mutex->lock);
-	    err = 0;
-	}
-    }
-    mutex->cond_waiting--;
-
-    return interrupted;
-}
-
-static void
-lock_interrupt(void *ptr)
-{
-    rb_mutex_t *mutex = (rb_mutex_t *)ptr;
-    native_mutex_lock(&mutex->lock);
-    if (mutex->cond_waiting > 0)
-	native_cond_broadcast(&mutex->cond);
-    native_mutex_unlock(&mutex->lock);
-}
-
 /*
  * At maximum, only one thread can use cond_timedwait and watch deadlock
  * periodically. Multiple polling thread (i.e. concurrent deadlock check)
@@ -248,45 +211,45 @@ rb_mutex_lock(VALUE self) https://github.com/ruby/ruby/blob/trunk/thread_sync.c#L211
     }
 
     if (rb_mutex_trylock(self) == Qfalse) {
+	struct mutex_waiter w;
+
 	if (mutex->th == th) {
 	    rb_raise(rb_eThreadError, "deadlock; recursive locking");
 	}
 
+	w.th = th;
+
 	while (mutex->th != th) {
-	    int interrupted;
 	    enum rb_thread_status prev_status = th->status;
-	    volatile int timeout_ms = 0;
-	    struct rb_unblock_callback oldubf;
+	    struct timeval *timeout = 0;
+	    struct timeval tv = { 0, 100000 }; /* 100ms */
 
-	    set_unblock_function(th, lock_interrupt, mutex, &oldubf, FALSE);
 	    th->status = THREAD_STOPPED_FOREVER;
 	    th->locking_mutex = self;
-
-	    native_mutex_lock(&mutex->lock);
 	    th->vm->sleeper++;
 	    /*
-	     * Carefully! while some contended threads are in lock_func(),
+	     * Carefully! while some contended threads are in native_sleep(),
 	     * vm->sleeper is unstable value. we have to avoid both deadlock
 	     * and busy loop.
 	     */
 	    if ((vm_living_thread_num(th->vm) == th->vm->sleeper) &&
 		!patrol_thread) {
-		timeout_ms = 100;
+		timeout = &tv;
 		patrol_thread = th;
 	    }
 
-	    GVL_UNLOCK_BEGIN();
-	    interrupted = lock_func(th, mutex, (int)timeout_ms);
-	    native_mutex_unlock(&mutex->lock);
-	    GVL_UNLOCK_END();
+	    list_add_tail(&mutex->waitq, &w.node);
+	    native_sleep(th, timeout); /* release GVL */
+	    list_del(&w.node);
+	    if (!mutex->th) {
+		mutex->th = th;
+	    }
 
 	    if (patrol_thread == th)
 		patrol_thread = NULL;
 
-	    reset_unblock_function(th, &oldubf);
-
 	    th->locking_mutex = Qfalse;
-	    if (mutex->th && interrupted == 2) {
+	    if (mutex->th && timeout && !RUBY_VM_INTERRUPTED(th)) {
 		rb_check_deadlock(th->vm);
 	    }
 	    if (th->status == THREAD_STOPPED_FOREVER) {
@@ -296,9 +259,7 @@ rb_mutex_lock(VALUE self) https://github.com/ruby/ruby/blob/trunk/thread_sync.c#L259
 
 	    if (mutex->th == th) mutex_locked(th, self);
 
-	    if (interrupted) {
-		RUBY_VM_CHECK_INTS_BLOCKING(th);
-	    }
+	    RUBY_VM_CHECK_INTS_BLOCKING(th);
 	}
     }
     return self;
@@ -330,24 +291,32 @@ rb_mutex_unlock_th(rb_mutex_t *mutex, rb https://github.com/ruby/ruby/blob/trunk/thread_sync.c#L291
 {
     const char *err = NULL;
 
-    native_mutex_lock(&mutex->lock);
-
     if (mutex->th == 0) {
 	err = "Attempt to unlock a mutex which is not locked";
     }
     else if (mutex->th != th) {
 	err = "Attempt to unlock a mutex which is locked by another thread";
-    }
-    else {
-	mutex->th = 0;
-	if (mutex->cond_waiting > 0)
-	    native_cond_signal(&mutex->cond);
-    }
-
-    native_mutex_unlock(&mutex->lock);
-
-    if (!err) {
+    } else {
+	struct mutex_waiter *cur = 0, *next = 0;
 	rb_mutex_t *volatile *th_mutex = &th->keeping_mutexes;
+
+	mutex->th = 0;
+	list_for_each_safe(&mutex->waitq, cur, next, node) {
+	    list_del_init(&cur->node);
+	    switch (cur->th->status) {
+	    case THREAD_RUNNABLE: /* from someone else calling Thread#run */
+	    case THREAD_STOPPED_FOREVER: /* likely (rb_mutex_lock) */
+		rb_threadptr_interrupt(cur->th);
+		goto found;
+	    case THREAD_STOPPED: /* probably impossible */
+		rb_bug("unexpected THREAD_STOPPED");
+	    case THREAD_KILLED:
+                /* not sure about this, possible in exit GC? */
+		rb_bug("unexpected THREAD_KILLED");
+		continue;
+	    }
+	}
+found:
 	while (*th_mutex != mutex) {
 	    th_mutex = &(*th_mutex)->next_mutex;
 	}
@@ -411,6 +380,7 @@ rb_mutex_abandon_all(rb_mutex_t *mutexes https://github.com/ruby/ruby/blob/trunk/thread_sync.c#L380
 	mutexes = mutex->next_mutex;
 	mutex->th = 0;
 	mutex->next_mutex = 0;
+	list_head_init(&mutex->waitq);
     }
 }
 #endif
Index: thread.c
===================================================================
--- thread.c	(revision 58603)
+++ thread.c	(revision 58604)
@@ -4940,15 +4940,9 @@ debug_deadlock_check(rb_vm_t *vm, VALUE https://github.com/ruby/ruby/blob/trunk/thread.c#L4940
 		    th->self, th, thread_id_str(th), th->interrupt_flag);
 	if (th->locking_mutex) {
 	    rb_mutex_t *mutex;
-	    struct rb_thread_struct volatile *mth;
-	    int waiting;
 	    GetMutexPtr(th->locking_mutex, mutex);
-
-	    native_mutex_lock(&mutex->lock);
-	    mth = mutex->th;
-	    waiting = mutex->cond_waiting;
-	    native_mutex_unlock(&mutex->lock);
-	    rb_str_catf(msg, " mutex:%p cond:%d", mth, waiting);
+	    rb_str_catf(msg, " mutex:%p cond:%"PRIuSIZE,
+			mutex->th, rb_mutex_num_waiting(mutex));
 	}
 	{
 	    rb_thread_list_t *list = th->join_list;
@@ -4981,11 +4975,9 @@ rb_check_deadlock(rb_vm_t *vm) https://github.com/ruby/ruby/blob/trunk/thread.c#L4975
 	    rb_mutex_t *mutex;
 	    GetMutexPtr(th->locking_mutex, mutex);
 
-	    native_mutex_lock(&mutex->lock);
-	    if (mutex->th == th || (!mutex->th && mutex->cond_waiting)) {
+	    if (mutex->th == th || (!mutex->th && !list_empty(&mutex->waitq))) {
 		found = 1;
 	    }
-	    native_mutex_unlock(&mutex->lock);
 	}
 	if (found)
 	    break;

--
ML: ruby-changes@q...
Info: http://www.atdot.net/~ko1/quickml/

[前][次][番号順一覧][スレッド一覧]