From c2e6e1ef49d8e8745c9e4b6be2601b210a34506f Mon Sep 17 00:00:00 2001 From: "David M. Lee" <dlee@digium.com> Date: Mon, 9 Sep 2013 20:13:40 +0000 Subject: [PATCH] Fix DEBUG_THREADS when lock is acquired in __constructor__ This patch fixes some long-standing bugs in debug threads that were exacerbated with recent Optional API work in Asterisk 12. With debug threads enabled, on some systems, there's a lock ordering problem between our mutex and glibc's mutex protecting its module list (Ubuntu Lucid, glibc 2.11.1 in this instance). In one thread, the module list will be locked before acquiring our mutex. In another thread, our mutex will be locked before locking the module list (which happens in the depths of calling backtrace()). This patch fixes this issue by moving backtrace() calls outside of critical sections that have the mutex acquired. The bigger change was to reentrancy tracking for ast_cond_{timed,}wait, which wrongly assumed that waiting on the mutex was equivalent to a single unlock (it actually suspends all recursive locks on the mutex). (closes issue ASTERISK-22455) Review: https://reviewboard.asterisk.org/r/2824/ ........ Merged revisions 398648 from http://svn.asterisk.org/svn/asterisk/branches/1.8 ........ Merged revisions 398649 from http://svn.asterisk.org/svn/asterisk/branches/11 ........ Merged revisions 398651 from http://svn.asterisk.org/svn/asterisk/branches/12 git-svn-id: https://origsvn.digium.com/svn/asterisk/trunk@398652 65c4cc65-6c06-0410-ace0-fbb531ad65f3 --- include/asterisk/lock.h | 4 + main/lock.c | 203 +++++++++++++++++++++------------------- main/utils.c | 97 ++++++++++++++++--- 3 files changed, 194 insertions(+), 110 deletions(-) diff --git a/include/asterisk/lock.h b/include/asterisk/lock.h index aee084f322..d76a8d1852 100644 --- a/include/asterisk/lock.h +++ b/include/asterisk/lock.h @@ -282,12 +282,16 @@ void ast_remove_lock_info(void *lock_addr, struct ast_bt *bt); #else void ast_remove_lock_info(void *lock_addr); #endif /* HAVE_BKTR */ +void ast_suspend_lock_info(void *lock_addr); +void ast_restore_lock_info(void *lock_addr); #else #ifdef HAVE_BKTR #define ast_remove_lock_info(ignore,me) #else #define ast_remove_lock_info(ignore) #endif /* HAVE_BKTR */ +#define ast_suspend_lock_info(ignore); +#define ast_restore_lock_info(ignore); #endif /* !defined(LOW_MEMORY) */ /*! diff --git a/main/lock.c b/main/lock.c index 3036e5bc4b..d66e01b273 100644 --- a/main/lock.c +++ b/main/lock.c @@ -208,12 +208,20 @@ int __ast_pthread_mutex_lock(const char *filename, int lineno, const char *func, if (t->tracking) { #ifdef HAVE_BKTR + struct ast_bt tmp; + + /* The implementation of backtrace() may have its own locks. + * Capture the backtrace outside of the reentrancy lock to + * avoid deadlocks. See ASTERISK-22455. */ + ast_bt_get_addresses(&tmp); + ast_reentrancy_lock(lt); if (lt->reentrancy != AST_MAX_REENTRANCY) { - ast_bt_get_addresses(<->backtrace[lt->reentrancy]); + lt->backtrace[lt->reentrancy] = tmp; bt = <->backtrace[lt->reentrancy]; } ast_reentrancy_unlock(lt); + ast_store_lock_info(AST_MUTEX, filename, lineno, func, mutex_name, t, bt); #else ast_store_lock_info(AST_MUTEX, filename, lineno, func, mutex_name, t); @@ -340,12 +348,20 @@ int __ast_pthread_mutex_trylock(const char *filename, int lineno, const char *fu if (t->tracking) { #ifdef HAVE_BKTR + struct ast_bt tmp; + + /* The implementation of backtrace() may have its own locks. + * Capture the backtrace outside of the reentrancy lock to + * avoid deadlocks. See ASTERISK-22455. */ + ast_bt_get_addresses(&tmp); + ast_reentrancy_lock(lt); if (lt->reentrancy != AST_MAX_REENTRANCY) { - ast_bt_get_addresses(<->backtrace[lt->reentrancy]); + lt->backtrace[lt->reentrancy] = tmp; bt = <->backtrace[lt->reentrancy]; } ast_reentrancy_unlock(lt); + ast_store_lock_info(AST_MUTEX, filename, lineno, func, mutex_name, t, bt); #else ast_store_lock_info(AST_MUTEX, filename, lineno, func, mutex_name, t); @@ -497,10 +513,8 @@ int __ast_cond_wait(const char *filename, int lineno, const char *func, #ifdef DEBUG_THREADS struct ast_lock_track *lt; + struct ast_lock_track lt_orig; int canlog = strcmp(filename, "logger.c") & t->tracking; -#ifdef HAVE_BKTR - struct ast_bt *bt = NULL; -#endif #if defined(AST_MUTEX_INIT_W_CONSTRUCTORS) && defined(CAN_COMPARE_MUTEX_TO_INIT_VALUE) if ((t->mutex) == ((pthread_mutex_t) PTHREAD_MUTEX_INITIALIZER)) { @@ -531,33 +545,20 @@ int __ast_cond_wait(const char *filename, int lineno, const char *func, __dump_backtrace(<->backtrace[ROFFSET], canlog); #endif DO_THREAD_CRASH; + } else if (lt->reentrancy <= 0) { + __ast_mutex_logger("%s line %d (%s): attempted to wait on an unlocked mutex '%s'\n", + filename, lineno, func, mutex_name); + DO_THREAD_CRASH; } - if (--lt->reentrancy < 0) { - __ast_mutex_logger("%s line %d (%s): mutex '%s' freed more times than we've locked!\n", - filename, lineno, func, mutex_name); - lt->reentrancy = 0; - } - - if (lt->reentrancy < AST_MAX_REENTRANCY) { - lt->file[lt->reentrancy] = NULL; - lt->lineno[lt->reentrancy] = 0; - lt->func[lt->reentrancy] = NULL; - lt->thread[lt->reentrancy] = 0; - } - -#ifdef HAVE_BKTR - if (lt->reentrancy) { - bt = <->backtrace[lt->reentrancy - 1]; - } -#endif + /* Waiting on a condition completely suspends a recursive mutex, + * even if it's been recursively locked multiple times. Make a + * copy of the lock tracking, and reset reentrancy to zero */ + lt_orig = *lt; + lt->reentrancy = 0; ast_reentrancy_unlock(lt); -#ifdef HAVE_BKTR - ast_remove_lock_info(t, bt); -#else - ast_remove_lock_info(t); -#endif + ast_suspend_lock_info(t); } #endif /* DEBUG_THREADS */ @@ -569,28 +570,16 @@ int __ast_cond_wait(const char *filename, int lineno, const char *func, filename, lineno, func, strerror(res)); DO_THREAD_CRASH; } else if (t->tracking) { + pthread_mutex_t reentr_mutex_orig; ast_reentrancy_lock(lt); - if (lt->reentrancy < AST_MAX_REENTRANCY) { - lt->file[lt->reentrancy] = filename; - lt->lineno[lt->reentrancy] = lineno; - lt->func[lt->reentrancy] = func; - lt->thread[lt->reentrancy] = pthread_self(); -#ifdef HAVE_BKTR - ast_bt_get_addresses(<->backtrace[lt->reentrancy]); - bt = <->backtrace[lt->reentrancy]; -#endif - lt->reentrancy++; - } else { - __ast_mutex_logger("%s line %d (%s): '%s' really deep reentrancy!\n", - filename, lineno, func, mutex_name); - } + /* Restore lock tracking to what it was prior to the wait */ + reentr_mutex_orig = lt->reentr_mutex; + *lt = lt_orig; + /* un-trash the mutex we just copied over */ + lt->reentr_mutex = reentr_mutex_orig; ast_reentrancy_unlock(lt); -#ifdef HAVE_BKTR - ast_store_lock_info(AST_MUTEX, filename, lineno, func, mutex_name, t, bt); -#else - ast_store_lock_info(AST_MUTEX, filename, lineno, func, mutex_name, t); -#endif + ast_restore_lock_info(t); } #endif /* DEBUG_THREADS */ @@ -605,10 +594,8 @@ int __ast_cond_timedwait(const char *filename, int lineno, const char *func, #ifdef DEBUG_THREADS struct ast_lock_track *lt; + struct ast_lock_track lt_orig; int canlog = strcmp(filename, "logger.c") & t->tracking; -#ifdef HAVE_BKTR - struct ast_bt *bt = NULL; -#endif #if defined(AST_MUTEX_INIT_W_CONSTRUCTORS) && defined(CAN_COMPARE_MUTEX_TO_INIT_VALUE) if ((t->mutex) == ((pthread_mutex_t) PTHREAD_MUTEX_INITIALIZER)) { @@ -639,32 +626,20 @@ int __ast_cond_timedwait(const char *filename, int lineno, const char *func, __dump_backtrace(<->backtrace[ROFFSET], canlog); #endif DO_THREAD_CRASH; - } - - if (--lt->reentrancy < 0) { - __ast_mutex_logger("%s line %d (%s): mutex '%s' freed more times than we've locked!\n", + } else if (lt->reentrancy <= 0) { + __ast_mutex_logger("%s line %d (%s): attempted to wait on an unlocked mutex '%s'\n", filename, lineno, func, mutex_name); - lt->reentrancy = 0; + DO_THREAD_CRASH; } - if (lt->reentrancy < AST_MAX_REENTRANCY) { - lt->file[lt->reentrancy] = NULL; - lt->lineno[lt->reentrancy] = 0; - lt->func[lt->reentrancy] = NULL; - lt->thread[lt->reentrancy] = 0; - } -#ifdef HAVE_BKTR - if (lt->reentrancy) { - bt = <->backtrace[lt->reentrancy - 1]; - } -#endif + /* Waiting on a condition completely suspends a recursive mutex, + * even if it's been recursively locked multiple times. Make a + * copy of the lock tracking, and reset reentrancy to zero */ + lt_orig = *lt; + lt->reentrancy = 0; ast_reentrancy_unlock(lt); -#ifdef HAVE_BKTR - ast_remove_lock_info(t, bt); -#else - ast_remove_lock_info(t); -#endif + ast_suspend_lock_info(t); } #endif /* DEBUG_THREADS */ @@ -676,28 +651,16 @@ int __ast_cond_timedwait(const char *filename, int lineno, const char *func, filename, lineno, func, strerror(res)); DO_THREAD_CRASH; } else if (t->tracking) { + pthread_mutex_t reentr_mutex_orig; ast_reentrancy_lock(lt); - if (lt->reentrancy < AST_MAX_REENTRANCY) { - lt->file[lt->reentrancy] = filename; - lt->lineno[lt->reentrancy] = lineno; - lt->func[lt->reentrancy] = func; - lt->thread[lt->reentrancy] = pthread_self(); -#ifdef HAVE_BKTR - ast_bt_get_addresses(<->backtrace[lt->reentrancy]); - bt = <->backtrace[lt->reentrancy]; -#endif - lt->reentrancy++; - } else { - __ast_mutex_logger("%s line %d (%s): '%s' really deep reentrancy!\n", - filename, lineno, func, mutex_name); - } + /* Restore lock tracking to what it was prior to the wait */ + reentr_mutex_orig = lt->reentr_mutex; + *lt = lt_orig; + /* un-trash the mutex we just copied over */ + lt->reentr_mutex = reentr_mutex_orig; ast_reentrancy_unlock(lt); -#ifdef HAVE_BKTR - ast_store_lock_info(AST_MUTEX, filename, lineno, func, mutex_name, t, bt); -#else - ast_store_lock_info(AST_MUTEX, filename, lineno, func, mutex_name, t); -#endif + ast_suspend_lock_info(t); } #endif /* DEBUG_THREADS */ @@ -899,12 +862,20 @@ int __ast_rwlock_rdlock(const char *filename, int line, const char *func, ast_rw if (t->tracking) { #ifdef HAVE_BKTR + struct ast_bt tmp; + + /* The implementation of backtrace() may have its own locks. + * Capture the backtrace outside of the reentrancy lock to + * avoid deadlocks. See ASTERISK-22455. */ + ast_bt_get_addresses(&tmp); + ast_reentrancy_lock(lt); if (lt->reentrancy != AST_MAX_REENTRANCY) { - ast_bt_get_addresses(<->backtrace[lt->reentrancy]); + lt->backtrace[lt->reentrancy] = tmp; bt = <->backtrace[lt->reentrancy]; } ast_reentrancy_unlock(lt); + ast_store_lock_info(AST_RDLOCK, filename, line, func, name, t, bt); #else ast_store_lock_info(AST_RDLOCK, filename, line, func, name, t); @@ -1018,12 +989,20 @@ int __ast_rwlock_wrlock(const char *filename, int line, const char *func, ast_rw if (t->tracking) { #ifdef HAVE_BKTR + struct ast_bt tmp; + + /* The implementation of backtrace() may have its own locks. + * Capture the backtrace outside of the reentrancy lock to + * avoid deadlocks. See ASTERISK-22455. */ + ast_bt_get_addresses(&tmp); + ast_reentrancy_lock(lt); if (lt->reentrancy != AST_MAX_REENTRANCY) { - ast_bt_get_addresses(<->backtrace[lt->reentrancy]); + lt->backtrace[lt->reentrancy] = tmp; bt = <->backtrace[lt->reentrancy]; } ast_reentrancy_unlock(lt); + ast_store_lock_info(AST_WRLOCK, filename, line, func, name, t, bt); #else ast_store_lock_info(AST_WRLOCK, filename, line, func, name, t); @@ -1141,12 +1120,20 @@ int __ast_rwlock_timedrdlock(const char *filename, int line, const char *func, a if (t->tracking) { #ifdef HAVE_BKTR + struct ast_bt tmp; + + /* The implementation of backtrace() may have its own locks. + * Capture the backtrace outside of the reentrancy lock to + * avoid deadlocks. See ASTERISK-22455. */ + ast_bt_get_addresses(&tmp); + ast_reentrancy_lock(lt); if (lt->reentrancy != AST_MAX_REENTRANCY) { - ast_bt_get_addresses(<->backtrace[lt->reentrancy]); + lt->backtrace[lt->reentrancy] = tmp; bt = <->backtrace[lt->reentrancy]; } ast_reentrancy_unlock(lt); + ast_store_lock_info(AST_WRLOCK, filename, line, func, name, t, bt); #else ast_store_lock_info(AST_WRLOCK, filename, line, func, name, t); @@ -1244,12 +1231,20 @@ int __ast_rwlock_timedwrlock(const char *filename, int line, const char *func, a if (t->tracking) { #ifdef HAVE_BKTR + struct ast_bt tmp; + + /* The implementation of backtrace() may have its own locks. + * Capture the backtrace outside of the reentrancy lock to + * avoid deadlocks. See ASTERISK-22455. */ + ast_bt_get_addresses(&tmp); + ast_reentrancy_lock(lt); if (lt->reentrancy != AST_MAX_REENTRANCY) { - ast_bt_get_addresses(<->backtrace[lt->reentrancy]); + lt->backtrace[lt->reentrancy] = tmp; bt = <->backtrace[lt->reentrancy]; } ast_reentrancy_unlock(lt); + ast_store_lock_info(AST_WRLOCK, filename, line, func, name, t, bt); #else ast_store_lock_info(AST_WRLOCK, filename, line, func, name, t); @@ -1350,12 +1345,20 @@ int __ast_rwlock_tryrdlock(const char *filename, int line, const char *func, ast if (t->tracking) { #ifdef HAVE_BKTR + struct ast_bt tmp; + + /* The implementation of backtrace() may have its own locks. + * Capture the backtrace outside of the reentrancy lock to + * avoid deadlocks. See ASTERISK-22455. */ + ast_bt_get_addresses(&tmp); + ast_reentrancy_lock(lt); if (lt->reentrancy != AST_MAX_REENTRANCY) { - ast_bt_get_addresses(<->backtrace[lt->reentrancy]); + lt->backtrace[lt->reentrancy] = tmp; bt = <->backtrace[lt->reentrancy]; } ast_reentrancy_unlock(lt); + ast_store_lock_info(AST_RDLOCK, filename, line, func, name, t, bt); #else ast_store_lock_info(AST_RDLOCK, filename, line, func, name, t); @@ -1420,12 +1423,20 @@ int __ast_rwlock_trywrlock(const char *filename, int line, const char *func, ast if (t->tracking) { #ifdef HAVE_BKTR + struct ast_bt tmp; + + /* The implementation of backtrace() may have its own locks. + * Capture the backtrace outside of the reentrancy lock to + * avoid deadlocks. See ASTERISK-22455. */ + ast_bt_get_addresses(&tmp); + ast_reentrancy_lock(lt); if (lt->reentrancy != AST_MAX_REENTRANCY) { - ast_bt_get_addresses(<->backtrace[lt->reentrancy]); + lt->backtrace[lt->reentrancy] = tmp; bt = <->backtrace[lt->reentrancy]; } ast_reentrancy_unlock(lt); + ast_store_lock_info(AST_WRLOCK, filename, line, func, name, t, bt); #else ast_store_lock_info(AST_WRLOCK, filename, line, func, name, t); diff --git a/main/utils.c b/main/utils.c index 300d057d92..e2c5e2c3f6 100644 --- a/main/utils.c +++ b/main/utils.c @@ -597,6 +597,8 @@ struct thr_lock_info { enum ast_lock_type type; /*! This thread is waiting on this lock */ int pending:2; + /*! A condition has suspended this lock */ + int suspended:1; #ifdef HAVE_BKTR struct ast_bt *backtrace; #endif @@ -783,6 +785,60 @@ int ast_find_lock_info(void *lock_addr, char *filename, size_t filename_size, in return 0; } +void ast_suspend_lock_info(void *lock_addr) +{ + struct thr_lock_info *lock_info; + int i = 0; + + if (!(lock_info = ast_threadstorage_get(&thread_lock_info, sizeof(*lock_info)))) { + return; + } + + pthread_mutex_lock(&lock_info->lock); + + for (i = lock_info->num_locks - 1; i >= 0; i--) { + if (lock_info->locks[i].lock_addr == lock_addr) + break; + } + + if (i == -1) { + /* Lock not found :( */ + pthread_mutex_unlock(&lock_info->lock); + return; + } + + lock_info->locks[i].suspended = 1; + + pthread_mutex_unlock(&lock_info->lock); +} + +void ast_restore_lock_info(void *lock_addr) +{ + struct thr_lock_info *lock_info; + int i = 0; + + if (!(lock_info = ast_threadstorage_get(&thread_lock_info, sizeof(*lock_info)))) + return; + + pthread_mutex_lock(&lock_info->lock); + + for (i = lock_info->num_locks - 1; i >= 0; i--) { + if (lock_info->locks[i].lock_addr == lock_addr) + break; + } + + if (i == -1) { + /* Lock not found :( */ + pthread_mutex_unlock(&lock_info->lock); + return; + } + + lock_info->locks[i].suspended = 0; + + pthread_mutex_unlock(&lock_info->lock); +} + + #ifdef HAVE_BKTR void ast_remove_lock_info(void *lock_addr, struct ast_bt *bt) #else @@ -876,7 +932,7 @@ static void append_lock_information(struct ast_str **str, struct thr_lock_info * ast_mutex_t *lock; struct ast_lock_track *lt; - ast_str_append(str, 0, "=== ---> %sLock #%d (%s): %s %d %s %s %p (%d)\n", + ast_str_append(str, 0, "=== ---> %sLock #%d (%s): %s %d %s %s %p (%d%s)\n", lock_info->locks[i].pending > 0 ? "Waiting for " : lock_info->locks[i].pending < 0 ? "Tried and failed to get " : "", i, lock_info->locks[i].file, @@ -884,7 +940,8 @@ static void append_lock_information(struct ast_str **str, struct thr_lock_info * lock_info->locks[i].line_num, lock_info->locks[i].func, lock_info->locks[i].lock_name, lock_info->locks[i].lock_addr, - lock_info->locks[i].times_locked); + lock_info->locks[i].times_locked, + lock_info->locks[i].suspended ? " - suspended" : ""); #ifdef HAVE_BKTR append_backtrace_information(str, lock_info->locks[i].backtrace); #endif @@ -982,20 +1039,32 @@ struct ast_str *ast_dump_locks(void) pthread_mutex_lock(&lock_infos_lock.mutex); AST_LIST_TRAVERSE(&lock_infos, lock_info, entry) { int i; - if (lock_info->num_locks) { - ast_str_append(&str, 0, "=== Thread ID: 0x%lx (%s)\n", (long) lock_info->thread_id, - lock_info->thread_name); - pthread_mutex_lock(&lock_info->lock); - for (i = 0; str && i < lock_info->num_locks; i++) { - append_lock_information(&str, lock_info, i); + int header_printed = 0; + pthread_mutex_lock(&lock_info->lock); + for (i = 0; str && i < lock_info->num_locks; i++) { + /* Don't show suspended locks */ + if (lock_info->locks[i].suspended) { + continue; } - pthread_mutex_unlock(&lock_info->lock); - if (!str) - break; + + if (!header_printed) { + ast_str_append(&str, 0, "=== Thread ID: 0x%lx (%s)\n", (long) lock_info->thread_id, + lock_info->thread_name); + header_printed = 1; + } + + append_lock_information(&str, lock_info, i); + } + pthread_mutex_unlock(&lock_info->lock); + if (!str) { + break; + } + if (header_printed) { ast_str_append(&str, 0, "=== -------------------------------------------------------------------\n" - "===\n"); - if (!str) - break; + "===\n"); + } + if (!str) { + break; } } pthread_mutex_unlock(&lock_infos_lock.mutex); -- GitLab