| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | /*
 | 
					
						
							|  |  |  |  * Asterisk -- An open source telephony toolkit. | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * Copyright (C) 1999 - 2010, Digium, Inc. | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * Mark Spencer <markster@digium.com> | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * See http://www.asterisk.org for more information about
 | 
					
						
							|  |  |  |  * the Asterisk project. Please do not directly contact | 
					
						
							|  |  |  |  * any of the maintainers of this project for assistance; | 
					
						
							|  |  |  |  * the project provides a web site, mailing lists and IRC | 
					
						
							|  |  |  |  * channels for your use. | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * This program is free software, distributed under the terms of | 
					
						
							|  |  |  |  * the GNU General Public License Version 2. See the LICENSE file | 
					
						
							|  |  |  |  * at the top of the source tree. | 
					
						
							|  |  |  |  */ | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | /*! \file
 | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * \brief General Asterisk locking. | 
					
						
							|  |  |  |  */ | 
					
						
							| 
									
										
										
										
											2012-06-15 16:20:16 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  | /*** MODULEINFO
 | 
					
						
							|  |  |  | 	<support_level>core</support_level> | 
					
						
							|  |  |  |  ***/ | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  | #include "asterisk.h"
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2016-10-26 22:40:49 -04:00
										 |  |  | #ifdef HAVE_MTX_PROFILE
 | 
					
						
							|  |  |  | /* profile mutex */ | 
					
						
							|  |  |  | static int mtx_prof = -1; | 
					
						
							|  |  |  | static void __attribute__((constructor)) __mtx_init(void) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  | 	mtx_prof = ast_add_profile("mtx_lock_" __FILE__, 0); | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | #endif
 | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2013-08-23 18:07:40 +00:00
										 |  |  | #include "asterisk/utils.h"
 | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #include "asterisk/lock.h"
 | 
					
						
							| 
									
										
										
										
											2022-07-27 19:54:43 +00:00
										 |  |  | #include "asterisk/manager.h"
 | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  | /* Allow direct use of pthread_mutex_* / pthread_cond_* */ | 
					
						
							|  |  |  | #undef pthread_mutex_init
 | 
					
						
							|  |  |  | #undef pthread_mutex_destroy
 | 
					
						
							|  |  |  | #undef pthread_mutex_lock
 | 
					
						
							|  |  |  | #undef pthread_mutex_trylock
 | 
					
						
							| 
									
										
										
										
											2010-06-09 23:56:08 +00:00
										 |  |  | #undef pthread_mutex_t
 | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #undef pthread_mutex_unlock
 | 
					
						
							|  |  |  | #undef pthread_cond_init
 | 
					
						
							|  |  |  | #undef pthread_cond_signal
 | 
					
						
							|  |  |  | #undef pthread_cond_broadcast
 | 
					
						
							|  |  |  | #undef pthread_cond_destroy
 | 
					
						
							|  |  |  | #undef pthread_cond_wait
 | 
					
						
							|  |  |  | #undef pthread_cond_timedwait
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-09-13 09:18:04 -06:00
										 |  |  | #if defined(DEBUG_THREADS) || defined(DETECT_DEADLOCKS)
 | 
					
						
							| 
									
										
										
										
											2018-09-28 14:31:37 -04:00
										 |  |  | #define log_mutex_error(canlog, ...) \
 | 
					
						
							|  |  |  | 	do { \ | 
					
						
							|  |  |  | 		if (canlog) { \ | 
					
						
							|  |  |  | 			ast_log(LOG_ERROR, __VA_ARGS__); \ | 
					
						
							|  |  |  | 		} else { \ | 
					
						
							|  |  |  | 			fprintf(stderr, __VA_ARGS__); \ | 
					
						
							|  |  |  | 		} \ | 
					
						
							|  |  |  | 	} while (0) | 
					
						
							|  |  |  | #endif
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2013-08-23 18:07:40 +00:00
										 |  |  | #if defined(DEBUG_THREADS) && defined(HAVE_BKTR)
 | 
					
						
							|  |  |  | static void __dump_backtrace(struct ast_bt *bt, int canlog) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  | 	char **strings; | 
					
						
							|  |  |  | 	ssize_t i; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	strings = backtrace_symbols(bt->addresses, bt->num_frames); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	for (i = 0; i < bt->num_frames; i++) { | 
					
						
							| 
									
										
										
										
											2018-09-28 14:31:37 -04:00
										 |  |  | 		log_mutex_error(canlog, "%s\n", strings[i]); | 
					
						
							| 
									
										
										
										
											2013-08-23 18:07:40 +00:00
										 |  |  | 	} | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	ast_std_free(strings); | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | #endif	/* defined(DEBUG_THREADS) && defined(HAVE_BKTR) */
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | #ifdef DEBUG_THREADS
 | 
					
						
							|  |  |  | AST_MUTEX_DEFINE_STATIC(reentrancy_lock); | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-09-27 20:32:21 -04:00
										 |  |  | static inline struct ast_lock_track *ast_get_reentrancy(struct ast_lock_track **plt, | 
					
						
							|  |  |  | 	struct ast_lock_track_flags *flags, int no_setup) | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | { | 
					
						
							|  |  |  | 	pthread_mutexattr_t reentr_attr; | 
					
						
							|  |  |  | 	struct ast_lock_track *lt; | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-09-27 20:32:21 -04:00
										 |  |  | 	if (!flags->tracking || flags->setup) { | 
					
						
							|  |  |  | 		return *plt; | 
					
						
							|  |  |  | 	} | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 	pthread_mutex_lock(&reentrancy_lock.mutex); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	if (*plt) { | 
					
						
							|  |  |  | 		pthread_mutex_unlock(&reentrancy_lock.mutex); | 
					
						
							|  |  |  | 		return *plt; | 
					
						
							|  |  |  | 	} | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-09-27 20:32:21 -04:00
										 |  |  | 	if (no_setup) { | 
					
						
							|  |  |  | 		pthread_mutex_unlock(&reentrancy_lock.mutex); | 
					
						
							|  |  |  | 		return NULL; | 
					
						
							|  |  |  | 	} | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 	lt = *plt = ast_std_calloc(1, sizeof(*lt)); | 
					
						
							|  |  |  | 	if (!lt) { | 
					
						
							|  |  |  | 		fprintf(stderr, "%s: Failed to allocate lock tracking\n", __func__); | 
					
						
							|  |  |  | #if defined(DO_CRASH) || defined(THREAD_CRASH)
 | 
					
						
							|  |  |  | 		abort(); | 
					
						
							|  |  |  | #else
 | 
					
						
							|  |  |  | 		pthread_mutex_unlock(&reentrancy_lock.mutex); | 
					
						
							|  |  |  | 		return NULL; | 
					
						
							|  |  |  | #endif
 | 
					
						
							|  |  |  | 	} | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	pthread_mutexattr_init(&reentr_attr); | 
					
						
							|  |  |  | 	pthread_mutexattr_settype(&reentr_attr, AST_MUTEX_KIND); | 
					
						
							|  |  |  | 	pthread_mutex_init(<->reentr_mutex, &reentr_attr); | 
					
						
							|  |  |  | 	pthread_mutexattr_destroy(&reentr_attr); | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-09-27 20:32:21 -04:00
										 |  |  | 	flags->setup = 1; | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 	pthread_mutex_unlock(&reentrancy_lock.mutex); | 
					
						
							|  |  |  | 	return lt; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | static inline void delete_reentrancy_cs(struct ast_lock_track **plt) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  | 	struct ast_lock_track *lt; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	if (*plt) { | 
					
						
							|  |  |  | 		lt = *plt; | 
					
						
							|  |  |  | 		*plt = NULL; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 		pthread_mutex_destroy(<->reentr_mutex); | 
					
						
							|  |  |  | 		ast_std_free(lt); | 
					
						
							|  |  |  | 	} | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #endif /* DEBUG_THREADS */
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | int __ast_pthread_mutex_init(int tracking, const char *filename, int lineno, const char *func, | 
					
						
							|  |  |  | 						const char *mutex_name, ast_mutex_t *t) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  | 	int res; | 
					
						
							|  |  |  | 	pthread_mutexattr_t  attr; | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-09-13 09:18:04 -06:00
										 |  |  | #if defined(DEBUG_THREADS) && defined(AST_MUTEX_INIT_W_CONSTRUCTORS) && \
 | 
					
						
							|  |  |  | 	defined(CAN_COMPARE_MUTEX_TO_INIT_VALUE) | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 	if ((t->mutex) != ((pthread_mutex_t) PTHREAD_MUTEX_INITIALIZER)) { | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 		int canlog = tracking && strcmp(filename, "logger.c"); | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-09-28 14:31:37 -04:00
										 |  |  | 		log_mutex_error(canlog, "%s line %d (%s): NOTICE: mutex '%s' is already initialized.\n", | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 				   filename, lineno, func, mutex_name); | 
					
						
							|  |  |  | 		DO_THREAD_CRASH; | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 		return EBUSY; | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 	} | 
					
						
							|  |  |  | #endif /* AST_MUTEX_INIT_W_CONSTRUCTORS */
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-09-13 09:18:04 -06:00
										 |  |  | #if defined(DEBUG_THREADS) || defined(DETECT_DEADLOCKS)
 | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 	t->track = NULL; | 
					
						
							| 
									
										
										
										
											2018-09-27 20:32:21 -04:00
										 |  |  | 	t->flags.tracking = tracking; | 
					
						
							|  |  |  | 	t->flags.setup = 0; | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #endif /* DEBUG_THREADS */
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	pthread_mutexattr_init(&attr); | 
					
						
							|  |  |  | 	pthread_mutexattr_settype(&attr, AST_MUTEX_KIND); | 
					
						
							|  |  |  | 	res = pthread_mutex_init(&t->mutex, &attr); | 
					
						
							|  |  |  | 	pthread_mutexattr_destroy(&attr); | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 	return res; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | int __ast_pthread_mutex_destroy(const char *filename, int lineno, const char *func, | 
					
						
							|  |  |  | 						const char *mutex_name, ast_mutex_t *t) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  | 	int res; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #ifdef DEBUG_THREADS
 | 
					
						
							| 
									
										
										
										
											2018-09-27 20:32:21 -04:00
										 |  |  | 	struct ast_lock_track *lt = ast_get_reentrancy(&t->track, &t->flags, 1); | 
					
						
							|  |  |  | 	int canlog = t->flags.tracking && strcmp(filename, "logger.c"); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  | #if defined(AST_MUTEX_INIT_W_CONSTRUCTORS) && defined(CAN_COMPARE_MUTEX_TO_INIT_VALUE)
 | 
					
						
							|  |  |  | 	if ((t->mutex) == ((pthread_mutex_t) PTHREAD_MUTEX_INITIALIZER)) { | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 		/* Don't try to uninitialize an uninitialized mutex
 | 
					
						
							|  |  |  | 		 * This may have no effect on linux | 
					
						
							|  |  |  | 		 * but it always generates a core on *BSD when | 
					
						
							|  |  |  | 		 * linked with libpthread. | 
					
						
							|  |  |  | 		 * This is not an error condition if the mutex is created on the fly. | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 		 */ | 
					
						
							| 
									
										
										
										
											2018-09-28 14:31:37 -04:00
										 |  |  | 		log_mutex_error(canlog, "%s line %d (%s): NOTICE: mutex '%s' is uninitialized.\n", | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 				   filename, lineno, func, mutex_name); | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 		DO_THREAD_CRASH; | 
					
						
							|  |  |  | 		res = EINVAL; | 
					
						
							|  |  |  | 		goto lt_cleanup; | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 	} | 
					
						
							|  |  |  | #endif
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	res = pthread_mutex_trylock(&t->mutex); | 
					
						
							|  |  |  | 	switch (res) { | 
					
						
							|  |  |  | 	case 0: | 
					
						
							|  |  |  | 		pthread_mutex_unlock(&t->mutex); | 
					
						
							|  |  |  | 		break; | 
					
						
							|  |  |  | 	case EINVAL: | 
					
						
							| 
									
										
										
										
											2018-09-28 14:31:37 -04:00
										 |  |  | 		log_mutex_error(canlog, "%s line %d (%s): Error: attempt to destroy invalid mutex '%s'.\n", | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 				  filename, lineno, func, mutex_name); | 
					
						
							|  |  |  | 		break; | 
					
						
							|  |  |  | 	case EBUSY: | 
					
						
							| 
									
										
										
										
											2018-09-28 14:31:37 -04:00
										 |  |  | 		log_mutex_error(canlog, "%s line %d (%s): Error: attempt to destroy locked mutex '%s'.\n", | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 				   filename, lineno, func, mutex_name); | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 		if (lt) { | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 			ast_reentrancy_lock(lt); | 
					
						
							| 
									
										
										
										
											2018-09-28 14:31:37 -04:00
										 |  |  | 			log_mutex_error(canlog, "%s line %d (%s): Error: '%s' was locked here.\n", | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 				    lt->file[ROFFSET], lt->lineno[ROFFSET], lt->func[ROFFSET], mutex_name); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #ifdef HAVE_BKTR
 | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 			__dump_backtrace(<->backtrace[ROFFSET], canlog); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #endif
 | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 			ast_reentrancy_unlock(lt); | 
					
						
							|  |  |  | 		} | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 		break; | 
					
						
							|  |  |  | 	} | 
					
						
							|  |  |  | #endif /* DEBUG_THREADS */
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	res = pthread_mutex_destroy(&t->mutex); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #ifdef DEBUG_THREADS
 | 
					
						
							|  |  |  | 	if (res) { | 
					
						
							| 
									
										
										
										
											2018-09-28 14:31:37 -04:00
										 |  |  | 		log_mutex_error(canlog, "%s line %d (%s): Error destroying mutex %s: %s\n", | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 				   filename, lineno, func, mutex_name, strerror(res)); | 
					
						
							|  |  |  | 	} | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | #if defined(AST_MUTEX_INIT_W_CONSTRUCTORS) && defined(CAN_COMPARE_MUTEX_TO_INIT_VALUE)
 | 
					
						
							|  |  |  | lt_cleanup: | 
					
						
							|  |  |  | #endif
 | 
					
						
							|  |  |  | 	if (lt) { | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 		ast_reentrancy_lock(lt); | 
					
						
							|  |  |  | 		lt->file[0] = filename; | 
					
						
							|  |  |  | 		lt->lineno[0] = lineno; | 
					
						
							|  |  |  | 		lt->func[0] = func; | 
					
						
							|  |  |  | 		lt->reentrancy = 0; | 
					
						
							| 
									
										
											  
											
												chan_sip:  Address runaway when realtime peers subscribe to mailboxes
Users upgrading from asterisk 13.5 to a later version and who use
realtime with peers that have mailboxes were experiencing runaway
situations that manifested as a continuous stream of taskprocessor
congestion errors, memory leaks and an unresponsive chan_sip.
A related issue was that setting rtcachefriends=no NEVER worked in
asterisk 13 (since the move to stasis).  In 13.5 and earlier, when a
peer tried to register, all of the stasis threads would block and
chan_sip would again become unresponsive.  After 13.5, the runaway
would happen.
There were a number of causes...
* mwi_event_cb was (indirectly) calling build_peer even though calls to
  mwi_event_cb are often caused by build_peer.
* In an effort to prevent chan_sip from being unloaded while messages
  were still in flight, destroy_mailboxes was calling
  stasis_unsubscribe_and_join but in some cases waited forever for the
  final message.
* add_peer_mailboxes wasn't properly marking the existing mailboxes
  on a peer as "keep" so build_peer would always delete them all.
* add_peer_mwi_subs was unsubscribing existing mailbox subscriptions
  then just creating them again.
All of this was causing a flood of subscribes and unsubscribes on
multiple threads all for the same peer and mailbox.
Fixes...
* add_peer_mailboxes now marks mailboxes correctly and build_peer only
  deletes the ones that really are no longer needed by the peer.
* add_peer_mwi_subs now only adds subscriptions marked as "new" instead
  of unsubscribing and resubscribing everything.  It also adds the peer
  object's address to the mailbox instead of its name to the subscription
  userdata so mwi_event_cb doesn't have to call build_peer.
With these changes, with rtcachefriends=yes (the most common setting),
there are no leaks, locks, loops or crashes at shutdown.
rtcachefriends=no still causes leaks but at least it doesn't lock, loop
or crash.  Since making rtcachefriends=no work wasnt in scope for this
issue, further work will have to be deferred to a separate patch.
Side fixes...
 * The ast_lock_track structure had a member named "thread" which gdb
   doesn't like since it conflicts with it's "thread" command.  That
   member was renamed to "thread_id".
ASTERISK-25468 #close
Change-Id: I07519ef7f092629e1e844f855abd279d6475cdd0
											
										 
											2016-09-20 08:42:15 -06:00
										 |  |  | 		lt->thread_id[0] = 0; | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #ifdef HAVE_BKTR
 | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 		memset(<->backtrace[0], 0, sizeof(lt->backtrace[0])); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #endif
 | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 		ast_reentrancy_unlock(lt); | 
					
						
							|  |  |  | 		delete_reentrancy_cs(&t->track); | 
					
						
							|  |  |  | 	} | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #endif /* DEBUG_THREADS */
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	return res; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | int __ast_pthread_mutex_lock(const char *filename, int lineno, const char *func, | 
					
						
							| 
									
										
										
										
											2012-03-22 19:51:16 +00:00
										 |  |  | 				const char* mutex_name, ast_mutex_t *t) | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | { | 
					
						
							|  |  |  | 	int res; | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-09-13 09:18:04 -06:00
										 |  |  | #if defined(DETECT_DEADLOCKS) || defined(DEBUG_THREADS)
 | 
					
						
							|  |  |  | 	int canlog = t->flags.tracking && strcmp(filename, "logger.c"); | 
					
						
							|  |  |  | #endif
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #ifdef DEBUG_THREADS
 | 
					
						
							| 
									
										
										
										
											2018-09-27 20:32:21 -04:00
										 |  |  | 	struct ast_lock_track *lt = ast_get_reentrancy(&t->track, &t->flags, 0); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 	struct ast_bt *bt = NULL; | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 	if (lt) { | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #ifdef HAVE_BKTR
 | 
					
						
							| 
									
										
										
										
											2013-09-09 20:13:40 +00:00
										 |  |  | 		struct ast_bt tmp; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 		/* The implementation of backtrace() may have its own locks.
 | 
					
						
							|  |  |  | 		 * Capture the backtrace outside of the reentrancy lock to | 
					
						
							|  |  |  | 		 * avoid deadlocks. See ASTERISK-22455. */ | 
					
						
							|  |  |  | 		ast_bt_get_addresses(&tmp); | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 		ast_reentrancy_lock(lt); | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 		if (lt->reentrancy < AST_MAX_REENTRANCY) { | 
					
						
							| 
									
										
										
										
											2013-09-09 20:13:40 +00:00
										 |  |  | 			lt->backtrace[lt->reentrancy] = tmp; | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 			bt = <->backtrace[lt->reentrancy]; | 
					
						
							|  |  |  | 		} | 
					
						
							|  |  |  | 		ast_reentrancy_unlock(lt); | 
					
						
							|  |  |  | #endif
 | 
					
						
							| 
									
										
										
										
											2017-10-23 01:55:18 -04:00
										 |  |  | 		ast_store_lock_info(AST_MUTEX, filename, lineno, func, mutex_name, t, bt); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 	} | 
					
						
							|  |  |  | #endif /* DEBUG_THREADS */
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-09-13 09:18:04 -06:00
										 |  |  | #if defined(DETECT_DEADLOCKS)
 | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 	{ | 
					
						
							|  |  |  | 		time_t seconds = time(NULL); | 
					
						
							|  |  |  | 		time_t wait_time, reported_wait = 0; | 
					
						
							|  |  |  | 		do { | 
					
						
							|  |  |  | #ifdef	HAVE_MTX_PROFILE
 | 
					
						
							|  |  |  | 			ast_mark(mtx_prof, 1); | 
					
						
							|  |  |  | #endif
 | 
					
						
							|  |  |  | 			res = pthread_mutex_trylock(&t->mutex); | 
					
						
							|  |  |  | #ifdef	HAVE_MTX_PROFILE
 | 
					
						
							|  |  |  | 			ast_mark(mtx_prof, 0); | 
					
						
							|  |  |  | #endif
 | 
					
						
							|  |  |  | 			if (res == EBUSY) { | 
					
						
							|  |  |  | 				wait_time = time(NULL) - seconds; | 
					
						
							|  |  |  | 				if (wait_time > reported_wait && (wait_time % 5) == 0) { | 
					
						
							| 
									
										
										
										
											2018-09-28 14:31:37 -04:00
										 |  |  | 					log_mutex_error(canlog, "%s line %d (%s): Deadlock? waited %d sec for mutex '%s'?\n", | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 							   filename, lineno, func, (int) wait_time, mutex_name); | 
					
						
							| 
									
										
										
										
											2023-09-13 09:18:04 -06:00
										 |  |  | #ifdef DEBUG_THREADS
 | 
					
						
							| 
									
										
										
										
											2016-04-21 15:26:47 +02:00
										 |  |  | 					if (lt) { | 
					
						
							|  |  |  | 						ast_reentrancy_lock(lt); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #ifdef HAVE_BKTR
 | 
					
						
							| 
									
										
										
										
											2016-04-21 15:26:47 +02:00
										 |  |  | 						__dump_backtrace(<->backtrace[lt->reentrancy], canlog); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #endif
 | 
					
						
							| 
									
										
										
										
											2018-09-28 14:31:37 -04:00
										 |  |  | 						log_mutex_error(canlog, "%s line %d (%s): '%s' was locked here.\n", | 
					
						
							| 
									
										
										
										
											2016-04-21 15:26:47 +02:00
										 |  |  | 								   lt->file[ROFFSET], lt->lineno[ROFFSET], | 
					
						
							|  |  |  | 								   lt->func[ROFFSET], mutex_name); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #ifdef HAVE_BKTR
 | 
					
						
							| 
									
										
										
										
											2016-04-21 15:26:47 +02:00
										 |  |  | 						__dump_backtrace(<->backtrace[ROFFSET], canlog); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #endif
 | 
					
						
							| 
									
										
										
										
											2016-04-21 15:26:47 +02:00
										 |  |  | 						ast_reentrancy_unlock(lt); | 
					
						
							|  |  |  | 					} | 
					
						
							| 
									
										
										
										
											2023-09-13 09:18:04 -06:00
										 |  |  | #endif
 | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 					reported_wait = wait_time; | 
					
						
							| 
									
										
										
										
											2022-07-27 19:54:43 +00:00
										 |  |  | 					if ((int) wait_time < 10) { /* Only emit an event when a deadlock starts, not every 5 seconds */ | 
					
						
							|  |  |  | 						/*** DOCUMENTATION
 | 
					
						
							|  |  |  | 							<managerEvent language="en_US" name="DeadlockStart"> | 
					
						
							|  |  |  | 								<managerEventInstance class="EVENT_FLAG_SYSTEM"> | 
					
						
							| 
									
										
										
										
											2025-01-23 16:35:58 -05:00
										 |  |  | 									<since> | 
					
						
							|  |  |  | 										<version>16.29.0</version> | 
					
						
							|  |  |  | 										<version>18.15.0</version> | 
					
						
							|  |  |  | 										<version>19.7.0</version> | 
					
						
							|  |  |  | 									</since> | 
					
						
							| 
									
										
										
										
											2022-07-27 19:54:43 +00:00
										 |  |  | 									<synopsis>Raised when a probable deadlock has started. | 
					
						
							|  |  |  | 									Delivery of this event is attempted but not guaranteed, | 
					
						
							|  |  |  |                                                                         and could fail for example if the manager itself is deadlocked. | 
					
						
							|  |  |  |                                                                         </synopsis> | 
					
						
							|  |  |  | 										<syntax> | 
					
						
							|  |  |  | 											<parameter name="Mutex"> | 
					
						
							|  |  |  | 												<para>The mutex involved in the deadlock.</para> | 
					
						
							|  |  |  | 											</parameter> | 
					
						
							|  |  |  | 										</syntax> | 
					
						
							|  |  |  | 								</managerEventInstance> | 
					
						
							|  |  |  | 							</managerEvent> | 
					
						
							|  |  |  | 						***/ | 
					
						
							|  |  |  | 						manager_event(EVENT_FLAG_SYSTEM, "DeadlockStart", | 
					
						
							|  |  |  | 							"Mutex: %s\r\n", | 
					
						
							|  |  |  | 							mutex_name); | 
					
						
							|  |  |  | 					} | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 				} | 
					
						
							|  |  |  | 				usleep(200); | 
					
						
							|  |  |  | 			} | 
					
						
							|  |  |  | 		} while (res == EBUSY); | 
					
						
							|  |  |  | 	} | 
					
						
							|  |  |  | #else /* !DETECT_DEADLOCKS || !DEBUG_THREADS */
 | 
					
						
							|  |  |  | #ifdef	HAVE_MTX_PROFILE
 | 
					
						
							|  |  |  | 	ast_mark(mtx_prof, 1); | 
					
						
							|  |  |  | 	res = pthread_mutex_trylock(&t->mutex); | 
					
						
							|  |  |  | 	ast_mark(mtx_prof, 0); | 
					
						
							|  |  |  | 	if (res) | 
					
						
							|  |  |  | #endif
 | 
					
						
							|  |  |  | 	res = pthread_mutex_lock(&t->mutex); | 
					
						
							|  |  |  | #endif /* !DETECT_DEADLOCKS || !DEBUG_THREADS */
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #ifdef DEBUG_THREADS
 | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 	if (lt && !res) { | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 		ast_reentrancy_lock(lt); | 
					
						
							|  |  |  | 		if (lt->reentrancy < AST_MAX_REENTRANCY) { | 
					
						
							|  |  |  | 			lt->file[lt->reentrancy] = filename; | 
					
						
							|  |  |  | 			lt->lineno[lt->reentrancy] = lineno; | 
					
						
							|  |  |  | 			lt->func[lt->reentrancy] = func; | 
					
						
							| 
									
										
											  
											
												chan_sip:  Address runaway when realtime peers subscribe to mailboxes
Users upgrading from asterisk 13.5 to a later version and who use
realtime with peers that have mailboxes were experiencing runaway
situations that manifested as a continuous stream of taskprocessor
congestion errors, memory leaks and an unresponsive chan_sip.
A related issue was that setting rtcachefriends=no NEVER worked in
asterisk 13 (since the move to stasis).  In 13.5 and earlier, when a
peer tried to register, all of the stasis threads would block and
chan_sip would again become unresponsive.  After 13.5, the runaway
would happen.
There were a number of causes...
* mwi_event_cb was (indirectly) calling build_peer even though calls to
  mwi_event_cb are often caused by build_peer.
* In an effort to prevent chan_sip from being unloaded while messages
  were still in flight, destroy_mailboxes was calling
  stasis_unsubscribe_and_join but in some cases waited forever for the
  final message.
* add_peer_mailboxes wasn't properly marking the existing mailboxes
  on a peer as "keep" so build_peer would always delete them all.
* add_peer_mwi_subs was unsubscribing existing mailbox subscriptions
  then just creating them again.
All of this was causing a flood of subscribes and unsubscribes on
multiple threads all for the same peer and mailbox.
Fixes...
* add_peer_mailboxes now marks mailboxes correctly and build_peer only
  deletes the ones that really are no longer needed by the peer.
* add_peer_mwi_subs now only adds subscriptions marked as "new" instead
  of unsubscribing and resubscribing everything.  It also adds the peer
  object's address to the mailbox instead of its name to the subscription
  userdata so mwi_event_cb doesn't have to call build_peer.
With these changes, with rtcachefriends=yes (the most common setting),
there are no leaks, locks, loops or crashes at shutdown.
rtcachefriends=no still causes leaks but at least it doesn't lock, loop
or crash.  Since making rtcachefriends=no work wasnt in scope for this
issue, further work will have to be deferred to a separate patch.
Side fixes...
 * The ast_lock_track structure had a member named "thread" which gdb
   doesn't like since it conflicts with it's "thread" command.  That
   member was renamed to "thread_id".
ASTERISK-25468 #close
Change-Id: I07519ef7f092629e1e844f855abd279d6475cdd0
											
										 
											2016-09-20 08:42:15 -06:00
										 |  |  | 			lt->thread_id[lt->reentrancy] = pthread_self(); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 			lt->reentrancy++; | 
					
						
							|  |  |  | 		} else { | 
					
						
							| 
									
										
										
										
											2018-09-28 14:31:37 -04:00
										 |  |  | 			log_mutex_error(canlog, "%s line %d (%s): '%s' really deep reentrancy!\n", | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 							   filename, lineno, func, mutex_name); | 
					
						
							|  |  |  | 		} | 
					
						
							|  |  |  | 		ast_reentrancy_unlock(lt); | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 		ast_mark_lock_acquired(t); | 
					
						
							|  |  |  | 	} else if (lt) { | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #ifdef HAVE_BKTR
 | 
					
						
							|  |  |  | 		if (lt->reentrancy) { | 
					
						
							|  |  |  | 			ast_reentrancy_lock(lt); | 
					
						
							|  |  |  | 			bt = <->backtrace[lt->reentrancy-1]; | 
					
						
							|  |  |  | 			ast_reentrancy_unlock(lt); | 
					
						
							|  |  |  | 		} else { | 
					
						
							|  |  |  | 			bt = NULL; | 
					
						
							|  |  |  | 		} | 
					
						
							|  |  |  | #endif
 | 
					
						
							| 
									
										
										
										
											2017-10-23 01:55:18 -04:00
										 |  |  | 		ast_remove_lock_info(t, bt); | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 	} | 
					
						
							|  |  |  | 	if (res) { | 
					
						
							| 
									
										
										
										
											2018-09-28 14:31:37 -04:00
										 |  |  | 		log_mutex_error(canlog, "%s line %d (%s): Error obtaining mutex: %s\n", | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 				   filename, lineno, func, strerror(res)); | 
					
						
							|  |  |  | 		DO_THREAD_CRASH; | 
					
						
							|  |  |  | 	} | 
					
						
							|  |  |  | #endif /* DEBUG_THREADS */
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	return res; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | int __ast_pthread_mutex_trylock(const char *filename, int lineno, const char *func, | 
					
						
							| 
									
										
										
										
											2012-03-22 19:51:16 +00:00
										 |  |  | 				const char* mutex_name, ast_mutex_t *t) | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | { | 
					
						
							|  |  |  | 	int res; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #ifdef DEBUG_THREADS
 | 
					
						
							| 
									
										
										
										
											2018-09-27 20:32:21 -04:00
										 |  |  | 	struct ast_lock_track *lt = ast_get_reentrancy(&t->track, &t->flags, 0); | 
					
						
							|  |  |  | 	int canlog = t->flags.tracking && strcmp(filename, "logger.c"); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 	struct ast_bt *bt = NULL; | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 	if (lt) { | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #ifdef HAVE_BKTR
 | 
					
						
							| 
									
										
										
										
											2013-09-09 20:13:40 +00:00
										 |  |  | 		struct ast_bt tmp; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 		/* The implementation of backtrace() may have its own locks.
 | 
					
						
							|  |  |  | 		 * Capture the backtrace outside of the reentrancy lock to | 
					
						
							|  |  |  | 		 * avoid deadlocks. See ASTERISK-22455. */ | 
					
						
							|  |  |  | 		ast_bt_get_addresses(&tmp); | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 		ast_reentrancy_lock(lt); | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 		if (lt->reentrancy < AST_MAX_REENTRANCY) { | 
					
						
							| 
									
										
										
										
											2013-09-09 20:13:40 +00:00
										 |  |  | 			lt->backtrace[lt->reentrancy] = tmp; | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 			bt = <->backtrace[lt->reentrancy]; | 
					
						
							|  |  |  | 		} | 
					
						
							|  |  |  | 		ast_reentrancy_unlock(lt); | 
					
						
							|  |  |  | #endif
 | 
					
						
							| 
									
										
										
										
											2017-10-23 01:55:18 -04:00
										 |  |  | 		ast_store_lock_info(AST_MUTEX, filename, lineno, func, mutex_name, t, bt); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 	} | 
					
						
							|  |  |  | #endif /* DEBUG_THREADS */
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	res = pthread_mutex_trylock(&t->mutex); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #ifdef DEBUG_THREADS
 | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 	if (lt && !res) { | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 		ast_reentrancy_lock(lt); | 
					
						
							|  |  |  | 		if (lt->reentrancy < AST_MAX_REENTRANCY) { | 
					
						
							|  |  |  | 			lt->file[lt->reentrancy] = filename; | 
					
						
							|  |  |  | 			lt->lineno[lt->reentrancy] = lineno; | 
					
						
							|  |  |  | 			lt->func[lt->reentrancy] = func; | 
					
						
							| 
									
										
											  
											
												chan_sip:  Address runaway when realtime peers subscribe to mailboxes
Users upgrading from asterisk 13.5 to a later version and who use
realtime with peers that have mailboxes were experiencing runaway
situations that manifested as a continuous stream of taskprocessor
congestion errors, memory leaks and an unresponsive chan_sip.
A related issue was that setting rtcachefriends=no NEVER worked in
asterisk 13 (since the move to stasis).  In 13.5 and earlier, when a
peer tried to register, all of the stasis threads would block and
chan_sip would again become unresponsive.  After 13.5, the runaway
would happen.
There were a number of causes...
* mwi_event_cb was (indirectly) calling build_peer even though calls to
  mwi_event_cb are often caused by build_peer.
* In an effort to prevent chan_sip from being unloaded while messages
  were still in flight, destroy_mailboxes was calling
  stasis_unsubscribe_and_join but in some cases waited forever for the
  final message.
* add_peer_mailboxes wasn't properly marking the existing mailboxes
  on a peer as "keep" so build_peer would always delete them all.
* add_peer_mwi_subs was unsubscribing existing mailbox subscriptions
  then just creating them again.
All of this was causing a flood of subscribes and unsubscribes on
multiple threads all for the same peer and mailbox.
Fixes...
* add_peer_mailboxes now marks mailboxes correctly and build_peer only
  deletes the ones that really are no longer needed by the peer.
* add_peer_mwi_subs now only adds subscriptions marked as "new" instead
  of unsubscribing and resubscribing everything.  It also adds the peer
  object's address to the mailbox instead of its name to the subscription
  userdata so mwi_event_cb doesn't have to call build_peer.
With these changes, with rtcachefriends=yes (the most common setting),
there are no leaks, locks, loops or crashes at shutdown.
rtcachefriends=no still causes leaks but at least it doesn't lock, loop
or crash.  Since making rtcachefriends=no work wasnt in scope for this
issue, further work will have to be deferred to a separate patch.
Side fixes...
 * The ast_lock_track structure had a member named "thread" which gdb
   doesn't like since it conflicts with it's "thread" command.  That
   member was renamed to "thread_id".
ASTERISK-25468 #close
Change-Id: I07519ef7f092629e1e844f855abd279d6475cdd0
											
										 
											2016-09-20 08:42:15 -06:00
										 |  |  | 			lt->thread_id[lt->reentrancy] = pthread_self(); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 			lt->reentrancy++; | 
					
						
							|  |  |  | 		} else { | 
					
						
							| 
									
										
										
										
											2018-09-28 14:31:37 -04:00
										 |  |  | 			log_mutex_error(canlog, "%s line %d (%s): '%s' really deep reentrancy!\n", | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 					   filename, lineno, func, mutex_name); | 
					
						
							|  |  |  | 		} | 
					
						
							|  |  |  | 		ast_reentrancy_unlock(lt); | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 		ast_mark_lock_acquired(t); | 
					
						
							|  |  |  | 	} else if (lt) { | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 		ast_mark_lock_failed(t); | 
					
						
							|  |  |  | 	} | 
					
						
							|  |  |  | #endif /* DEBUG_THREADS */
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	return res; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | int __ast_pthread_mutex_unlock(const char *filename, int lineno, const char *func, | 
					
						
							|  |  |  | 					     const char *mutex_name, ast_mutex_t *t) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  | 	int res; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #ifdef DEBUG_THREADS
 | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 	struct ast_lock_track *lt = NULL; | 
					
						
							| 
									
										
										
										
											2018-09-27 20:32:21 -04:00
										 |  |  | 	int canlog = t->flags.tracking && strcmp(filename, "logger.c"); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 	struct ast_bt *bt = NULL; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #if defined(AST_MUTEX_INIT_W_CONSTRUCTORS) && defined(CAN_COMPARE_MUTEX_TO_INIT_VALUE)
 | 
					
						
							|  |  |  | 	if ((t->mutex) == ((pthread_mutex_t) PTHREAD_MUTEX_INITIALIZER)) { | 
					
						
							| 
									
										
										
										
											2018-09-28 14:31:37 -04:00
										 |  |  | 		log_mutex_error(canlog, "%s line %d (%s): Error: mutex '%s' is uninitialized.\n", | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 				   filename, lineno, func, mutex_name); | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 		DO_THREAD_CRASH; | 
					
						
							|  |  |  | 		return EINVAL; | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 	} | 
					
						
							|  |  |  | #endif /* AST_MUTEX_INIT_W_CONSTRUCTORS */
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-09-27 20:32:21 -04:00
										 |  |  | 	lt = ast_get_reentrancy(&t->track, &t->flags, 0); | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 	if (lt) { | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 		ast_reentrancy_lock(lt); | 
					
						
							| 
									
										
											  
											
												chan_sip:  Address runaway when realtime peers subscribe to mailboxes
Users upgrading from asterisk 13.5 to a later version and who use
realtime with peers that have mailboxes were experiencing runaway
situations that manifested as a continuous stream of taskprocessor
congestion errors, memory leaks and an unresponsive chan_sip.
A related issue was that setting rtcachefriends=no NEVER worked in
asterisk 13 (since the move to stasis).  In 13.5 and earlier, when a
peer tried to register, all of the stasis threads would block and
chan_sip would again become unresponsive.  After 13.5, the runaway
would happen.
There were a number of causes...
* mwi_event_cb was (indirectly) calling build_peer even though calls to
  mwi_event_cb are often caused by build_peer.
* In an effort to prevent chan_sip from being unloaded while messages
  were still in flight, destroy_mailboxes was calling
  stasis_unsubscribe_and_join but in some cases waited forever for the
  final message.
* add_peer_mailboxes wasn't properly marking the existing mailboxes
  on a peer as "keep" so build_peer would always delete them all.
* add_peer_mwi_subs was unsubscribing existing mailbox subscriptions
  then just creating them again.
All of this was causing a flood of subscribes and unsubscribes on
multiple threads all for the same peer and mailbox.
Fixes...
* add_peer_mailboxes now marks mailboxes correctly and build_peer only
  deletes the ones that really are no longer needed by the peer.
* add_peer_mwi_subs now only adds subscriptions marked as "new" instead
  of unsubscribing and resubscribing everything.  It also adds the peer
  object's address to the mailbox instead of its name to the subscription
  userdata so mwi_event_cb doesn't have to call build_peer.
With these changes, with rtcachefriends=yes (the most common setting),
there are no leaks, locks, loops or crashes at shutdown.
rtcachefriends=no still causes leaks but at least it doesn't lock, loop
or crash.  Since making rtcachefriends=no work wasnt in scope for this
issue, further work will have to be deferred to a separate patch.
Side fixes...
 * The ast_lock_track structure had a member named "thread" which gdb
   doesn't like since it conflicts with it's "thread" command.  That
   member was renamed to "thread_id".
ASTERISK-25468 #close
Change-Id: I07519ef7f092629e1e844f855abd279d6475cdd0
											
										 
											2016-09-20 08:42:15 -06:00
										 |  |  | 		if (lt->reentrancy && (lt->thread_id[ROFFSET] != pthread_self())) { | 
					
						
							| 
									
										
										
										
											2018-09-28 14:31:37 -04:00
										 |  |  | 			log_mutex_error(canlog, "%s line %d (%s): attempted unlock mutex '%s' without owning it!\n", | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 					   filename, lineno, func, mutex_name); | 
					
						
							| 
									
										
										
										
											2018-09-28 14:31:37 -04:00
										 |  |  | 			log_mutex_error(canlog, "%s line %d (%s): '%s' was locked here.\n", | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 					   lt->file[ROFFSET], lt->lineno[ROFFSET], lt->func[ROFFSET], mutex_name); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #ifdef HAVE_BKTR
 | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 			__dump_backtrace(<->backtrace[ROFFSET], canlog); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #endif
 | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 			DO_THREAD_CRASH; | 
					
						
							|  |  |  | 		} | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 		if (--lt->reentrancy < 0) { | 
					
						
							| 
									
										
										
										
											2018-09-28 14:31:37 -04:00
										 |  |  | 			log_mutex_error(canlog, "%s line %d (%s): mutex '%s' freed more times than we've locked!\n", | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 					   filename, lineno, func, mutex_name); | 
					
						
							|  |  |  | 			lt->reentrancy = 0; | 
					
						
							|  |  |  | 		} | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 		if (lt->reentrancy < AST_MAX_REENTRANCY) { | 
					
						
							|  |  |  | 			lt->file[lt->reentrancy] = NULL; | 
					
						
							|  |  |  | 			lt->lineno[lt->reentrancy] = 0; | 
					
						
							|  |  |  | 			lt->func[lt->reentrancy] = NULL; | 
					
						
							| 
									
										
											  
											
												chan_sip:  Address runaway when realtime peers subscribe to mailboxes
Users upgrading from asterisk 13.5 to a later version and who use
realtime with peers that have mailboxes were experiencing runaway
situations that manifested as a continuous stream of taskprocessor
congestion errors, memory leaks and an unresponsive chan_sip.
A related issue was that setting rtcachefriends=no NEVER worked in
asterisk 13 (since the move to stasis).  In 13.5 and earlier, when a
peer tried to register, all of the stasis threads would block and
chan_sip would again become unresponsive.  After 13.5, the runaway
would happen.
There were a number of causes...
* mwi_event_cb was (indirectly) calling build_peer even though calls to
  mwi_event_cb are often caused by build_peer.
* In an effort to prevent chan_sip from being unloaded while messages
  were still in flight, destroy_mailboxes was calling
  stasis_unsubscribe_and_join but in some cases waited forever for the
  final message.
* add_peer_mailboxes wasn't properly marking the existing mailboxes
  on a peer as "keep" so build_peer would always delete them all.
* add_peer_mwi_subs was unsubscribing existing mailbox subscriptions
  then just creating them again.
All of this was causing a flood of subscribes and unsubscribes on
multiple threads all for the same peer and mailbox.
Fixes...
* add_peer_mailboxes now marks mailboxes correctly and build_peer only
  deletes the ones that really are no longer needed by the peer.
* add_peer_mwi_subs now only adds subscriptions marked as "new" instead
  of unsubscribing and resubscribing everything.  It also adds the peer
  object's address to the mailbox instead of its name to the subscription
  userdata so mwi_event_cb doesn't have to call build_peer.
With these changes, with rtcachefriends=yes (the most common setting),
there are no leaks, locks, loops or crashes at shutdown.
rtcachefriends=no still causes leaks but at least it doesn't lock, loop
or crash.  Since making rtcachefriends=no work wasnt in scope for this
issue, further work will have to be deferred to a separate patch.
Side fixes...
 * The ast_lock_track structure had a member named "thread" which gdb
   doesn't like since it conflicts with it's "thread" command.  That
   member was renamed to "thread_id".
ASTERISK-25468 #close
Change-Id: I07519ef7f092629e1e844f855abd279d6475cdd0
											
										 
											2016-09-20 08:42:15 -06:00
										 |  |  | 			lt->thread_id[lt->reentrancy] = 0; | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 		} | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  | #ifdef HAVE_BKTR
 | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 		if (lt->reentrancy) { | 
					
						
							|  |  |  | 			bt = <->backtrace[lt->reentrancy - 1]; | 
					
						
							|  |  |  | 		} | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #endif
 | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 		ast_reentrancy_unlock(lt); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  | 		ast_remove_lock_info(t, bt); | 
					
						
							|  |  |  | 	} | 
					
						
							|  |  |  | #endif /* DEBUG_THREADS */
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	res = pthread_mutex_unlock(&t->mutex); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #ifdef DEBUG_THREADS
 | 
					
						
							|  |  |  | 	if (res) { | 
					
						
							| 
									
										
										
										
											2018-09-28 14:31:37 -04:00
										 |  |  | 		log_mutex_error(canlog, "%s line %d (%s): Error releasing mutex: %s\n", | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 				   filename, lineno, func, strerror(res)); | 
					
						
							|  |  |  | 		DO_THREAD_CRASH; | 
					
						
							|  |  |  | 	} | 
					
						
							|  |  |  | #endif /* DEBUG_THREADS */
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	return res; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | int __ast_cond_init(const char *filename, int lineno, const char *func, | 
					
						
							|  |  |  | 				  const char *cond_name, ast_cond_t *cond, pthread_condattr_t *cond_attr) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  | 	return pthread_cond_init(cond, cond_attr); | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | int __ast_cond_signal(const char *filename, int lineno, const char *func, | 
					
						
							|  |  |  | 				    const char *cond_name, ast_cond_t *cond) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  | 	return pthread_cond_signal(cond); | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | int __ast_cond_broadcast(const char *filename, int lineno, const char *func, | 
					
						
							|  |  |  | 				       const char *cond_name, ast_cond_t *cond) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  | 	return pthread_cond_broadcast(cond); | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | int __ast_cond_destroy(const char *filename, int lineno, const char *func, | 
					
						
							|  |  |  | 				     const char *cond_name, ast_cond_t *cond) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  | 	return pthread_cond_destroy(cond); | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | #ifdef DEBUG_THREADS
 | 
					
						
							|  |  |  | static void restore_lock_tracking(struct ast_lock_track *lt, struct ast_lock_track *lt_saved) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  | 	ast_reentrancy_lock(lt); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	/*
 | 
					
						
							|  |  |  | 	 * The following code must match the struct ast_lock_track | 
					
						
							|  |  |  | 	 * definition with the explicit exception of the reentr_mutex | 
					
						
							|  |  |  | 	 * member. | 
					
						
							|  |  |  | 	 */ | 
					
						
							|  |  |  | 	memcpy(lt->file, lt_saved->file, sizeof(lt->file)); | 
					
						
							|  |  |  | 	memcpy(lt->lineno, lt_saved->lineno, sizeof(lt->lineno)); | 
					
						
							|  |  |  | 	lt->reentrancy = lt_saved->reentrancy; | 
					
						
							|  |  |  | 	memcpy(lt->func, lt_saved->func, sizeof(lt->func)); | 
					
						
							| 
									
										
											  
											
												chan_sip:  Address runaway when realtime peers subscribe to mailboxes
Users upgrading from asterisk 13.5 to a later version and who use
realtime with peers that have mailboxes were experiencing runaway
situations that manifested as a continuous stream of taskprocessor
congestion errors, memory leaks and an unresponsive chan_sip.
A related issue was that setting rtcachefriends=no NEVER worked in
asterisk 13 (since the move to stasis).  In 13.5 and earlier, when a
peer tried to register, all of the stasis threads would block and
chan_sip would again become unresponsive.  After 13.5, the runaway
would happen.
There were a number of causes...
* mwi_event_cb was (indirectly) calling build_peer even though calls to
  mwi_event_cb are often caused by build_peer.
* In an effort to prevent chan_sip from being unloaded while messages
  were still in flight, destroy_mailboxes was calling
  stasis_unsubscribe_and_join but in some cases waited forever for the
  final message.
* add_peer_mailboxes wasn't properly marking the existing mailboxes
  on a peer as "keep" so build_peer would always delete them all.
* add_peer_mwi_subs was unsubscribing existing mailbox subscriptions
  then just creating them again.
All of this was causing a flood of subscribes and unsubscribes on
multiple threads all for the same peer and mailbox.
Fixes...
* add_peer_mailboxes now marks mailboxes correctly and build_peer only
  deletes the ones that really are no longer needed by the peer.
* add_peer_mwi_subs now only adds subscriptions marked as "new" instead
  of unsubscribing and resubscribing everything.  It also adds the peer
  object's address to the mailbox instead of its name to the subscription
  userdata so mwi_event_cb doesn't have to call build_peer.
With these changes, with rtcachefriends=yes (the most common setting),
there are no leaks, locks, loops or crashes at shutdown.
rtcachefriends=no still causes leaks but at least it doesn't lock, loop
or crash.  Since making rtcachefriends=no work wasnt in scope for this
issue, further work will have to be deferred to a separate patch.
Side fixes...
 * The ast_lock_track structure had a member named "thread" which gdb
   doesn't like since it conflicts with it's "thread" command.  That
   member was renamed to "thread_id".
ASTERISK-25468 #close
Change-Id: I07519ef7f092629e1e844f855abd279d6475cdd0
											
										 
											2016-09-20 08:42:15 -06:00
										 |  |  | 	memcpy(lt->thread_id, lt_saved->thread_id, sizeof(lt->thread_id)); | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | #ifdef HAVE_BKTR
 | 
					
						
							|  |  |  | 	memcpy(lt->backtrace, lt_saved->backtrace, sizeof(lt->backtrace)); | 
					
						
							|  |  |  | #endif
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	ast_reentrancy_unlock(lt); | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | #endif /* DEBUG_THREADS */
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | int __ast_cond_wait(const char *filename, int lineno, const char *func, | 
					
						
							|  |  |  | 				  const char *cond_name, const char *mutex_name, | 
					
						
							|  |  |  | 				  ast_cond_t *cond, ast_mutex_t *t) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  | 	int res; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #ifdef DEBUG_THREADS
 | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 	struct ast_lock_track *lt = NULL; | 
					
						
							| 
									
										
										
										
											2013-09-09 20:13:40 +00:00
										 |  |  | 	struct ast_lock_track lt_orig; | 
					
						
							| 
									
										
										
										
											2018-09-27 20:32:21 -04:00
										 |  |  | 	int canlog = t->flags.tracking && strcmp(filename, "logger.c"); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  | #if defined(AST_MUTEX_INIT_W_CONSTRUCTORS) && defined(CAN_COMPARE_MUTEX_TO_INIT_VALUE)
 | 
					
						
							|  |  |  | 	if ((t->mutex) == ((pthread_mutex_t) PTHREAD_MUTEX_INITIALIZER)) { | 
					
						
							| 
									
										
										
										
											2018-09-28 14:31:37 -04:00
										 |  |  | 		log_mutex_error(canlog, "%s line %d (%s): Error: mutex '%s' is uninitialized.\n", | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 				   filename, lineno, func, mutex_name); | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 		DO_THREAD_CRASH; | 
					
						
							|  |  |  | 		return EINVAL; | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 	} | 
					
						
							|  |  |  | #endif /* AST_MUTEX_INIT_W_CONSTRUCTORS */
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-09-27 20:32:21 -04:00
										 |  |  | 	lt = ast_get_reentrancy(&t->track, &t->flags, 0); | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 	if (lt) { | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 		ast_reentrancy_lock(lt); | 
					
						
							| 
									
										
											  
											
												chan_sip:  Address runaway when realtime peers subscribe to mailboxes
Users upgrading from asterisk 13.5 to a later version and who use
realtime with peers that have mailboxes were experiencing runaway
situations that manifested as a continuous stream of taskprocessor
congestion errors, memory leaks and an unresponsive chan_sip.
A related issue was that setting rtcachefriends=no NEVER worked in
asterisk 13 (since the move to stasis).  In 13.5 and earlier, when a
peer tried to register, all of the stasis threads would block and
chan_sip would again become unresponsive.  After 13.5, the runaway
would happen.
There were a number of causes...
* mwi_event_cb was (indirectly) calling build_peer even though calls to
  mwi_event_cb are often caused by build_peer.
* In an effort to prevent chan_sip from being unloaded while messages
  were still in flight, destroy_mailboxes was calling
  stasis_unsubscribe_and_join but in some cases waited forever for the
  final message.
* add_peer_mailboxes wasn't properly marking the existing mailboxes
  on a peer as "keep" so build_peer would always delete them all.
* add_peer_mwi_subs was unsubscribing existing mailbox subscriptions
  then just creating them again.
All of this was causing a flood of subscribes and unsubscribes on
multiple threads all for the same peer and mailbox.
Fixes...
* add_peer_mailboxes now marks mailboxes correctly and build_peer only
  deletes the ones that really are no longer needed by the peer.
* add_peer_mwi_subs now only adds subscriptions marked as "new" instead
  of unsubscribing and resubscribing everything.  It also adds the peer
  object's address to the mailbox instead of its name to the subscription
  userdata so mwi_event_cb doesn't have to call build_peer.
With these changes, with rtcachefriends=yes (the most common setting),
there are no leaks, locks, loops or crashes at shutdown.
rtcachefriends=no still causes leaks but at least it doesn't lock, loop
or crash.  Since making rtcachefriends=no work wasnt in scope for this
issue, further work will have to be deferred to a separate patch.
Side fixes...
 * The ast_lock_track structure had a member named "thread" which gdb
   doesn't like since it conflicts with it's "thread" command.  That
   member was renamed to "thread_id".
ASTERISK-25468 #close
Change-Id: I07519ef7f092629e1e844f855abd279d6475cdd0
											
										 
											2016-09-20 08:42:15 -06:00
										 |  |  | 		if (lt->reentrancy && (lt->thread_id[ROFFSET] != pthread_self())) { | 
					
						
							| 
									
										
										
										
											2018-09-28 14:31:37 -04:00
										 |  |  | 			log_mutex_error(canlog, "%s line %d (%s): attempted wait using mutex '%s' without owning it!\n", | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 					   filename, lineno, func, mutex_name); | 
					
						
							| 
									
										
										
										
											2018-09-28 14:31:37 -04:00
										 |  |  | 			log_mutex_error(canlog, "%s line %d (%s): '%s' was locked here.\n", | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 					   lt->file[ROFFSET], lt->lineno[ROFFSET], lt->func[ROFFSET], mutex_name); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #ifdef HAVE_BKTR
 | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 			__dump_backtrace(<->backtrace[ROFFSET], canlog); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #endif
 | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 			DO_THREAD_CRASH; | 
					
						
							| 
									
										
										
										
											2013-09-09 20:13:40 +00:00
										 |  |  | 		} else if (lt->reentrancy <= 0) { | 
					
						
							| 
									
										
										
										
											2018-09-28 14:31:37 -04:00
										 |  |  | 			log_mutex_error(canlog, "%s line %d (%s): attempted wait using an unlocked mutex '%s'\n", | 
					
						
							| 
									
										
										
										
											2013-09-09 20:13:40 +00:00
										 |  |  | 					   filename, lineno, func, mutex_name); | 
					
						
							|  |  |  | 			DO_THREAD_CRASH; | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 		} | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2013-09-09 20:13:40 +00:00
										 |  |  | 		/* Waiting on a condition completely suspends a recursive mutex,
 | 
					
						
							|  |  |  | 		 * even if it's been recursively locked multiple times. Make a | 
					
						
							|  |  |  | 		 * copy of the lock tracking, and reset reentrancy to zero */ | 
					
						
							|  |  |  | 		lt_orig = *lt; | 
					
						
							|  |  |  | 		lt->reentrancy = 0; | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 		ast_reentrancy_unlock(lt); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2013-09-09 20:13:40 +00:00
										 |  |  | 		ast_suspend_lock_info(t); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 	} | 
					
						
							|  |  |  | #endif /* DEBUG_THREADS */
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	res = pthread_cond_wait(cond, &t->mutex); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #ifdef DEBUG_THREADS
 | 
					
						
							|  |  |  | 	if (res) { | 
					
						
							| 
									
										
										
										
											2018-09-28 14:31:37 -04:00
										 |  |  | 		log_mutex_error(canlog, "%s line %d (%s): Error waiting on condition mutex '%s'\n", | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 				   filename, lineno, func, strerror(res)); | 
					
						
							|  |  |  | 		DO_THREAD_CRASH; | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 	} else if (lt) { | 
					
						
							|  |  |  | 		restore_lock_tracking(lt, <_orig); | 
					
						
							| 
									
										
										
										
											2013-09-09 20:13:40 +00:00
										 |  |  | 		ast_restore_lock_info(t); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 	} | 
					
						
							|  |  |  | #endif /* DEBUG_THREADS */
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	return res; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | int __ast_cond_timedwait(const char *filename, int lineno, const char *func, | 
					
						
							|  |  |  | 				       const char *cond_name, const char *mutex_name, ast_cond_t *cond, | 
					
						
							|  |  |  | 				       ast_mutex_t *t, const struct timespec *abstime) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  | 	int res; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #ifdef DEBUG_THREADS
 | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 	struct ast_lock_track *lt = NULL; | 
					
						
							| 
									
										
										
										
											2013-09-09 20:13:40 +00:00
										 |  |  | 	struct ast_lock_track lt_orig; | 
					
						
							| 
									
										
										
										
											2018-09-27 20:32:21 -04:00
										 |  |  | 	int canlog = t->flags.tracking && strcmp(filename, "logger.c"); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  | #if defined(AST_MUTEX_INIT_W_CONSTRUCTORS) && defined(CAN_COMPARE_MUTEX_TO_INIT_VALUE)
 | 
					
						
							|  |  |  | 	if ((t->mutex) == ((pthread_mutex_t) PTHREAD_MUTEX_INITIALIZER)) { | 
					
						
							| 
									
										
										
										
											2018-09-28 14:31:37 -04:00
										 |  |  | 		log_mutex_error(canlog, "%s line %d (%s): Error: mutex '%s' is uninitialized.\n", | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 				   filename, lineno, func, mutex_name); | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 		DO_THREAD_CRASH; | 
					
						
							|  |  |  | 		return EINVAL; | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 	} | 
					
						
							|  |  |  | #endif /* AST_MUTEX_INIT_W_CONSTRUCTORS */
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-09-27 20:32:21 -04:00
										 |  |  | 	lt = ast_get_reentrancy(&t->track, &t->flags, 0); | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 	if (lt) { | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 		ast_reentrancy_lock(lt); | 
					
						
							| 
									
										
											  
											
												chan_sip:  Address runaway when realtime peers subscribe to mailboxes
Users upgrading from asterisk 13.5 to a later version and who use
realtime with peers that have mailboxes were experiencing runaway
situations that manifested as a continuous stream of taskprocessor
congestion errors, memory leaks and an unresponsive chan_sip.
A related issue was that setting rtcachefriends=no NEVER worked in
asterisk 13 (since the move to stasis).  In 13.5 and earlier, when a
peer tried to register, all of the stasis threads would block and
chan_sip would again become unresponsive.  After 13.5, the runaway
would happen.
There were a number of causes...
* mwi_event_cb was (indirectly) calling build_peer even though calls to
  mwi_event_cb are often caused by build_peer.
* In an effort to prevent chan_sip from being unloaded while messages
  were still in flight, destroy_mailboxes was calling
  stasis_unsubscribe_and_join but in some cases waited forever for the
  final message.
* add_peer_mailboxes wasn't properly marking the existing mailboxes
  on a peer as "keep" so build_peer would always delete them all.
* add_peer_mwi_subs was unsubscribing existing mailbox subscriptions
  then just creating them again.
All of this was causing a flood of subscribes and unsubscribes on
multiple threads all for the same peer and mailbox.
Fixes...
* add_peer_mailboxes now marks mailboxes correctly and build_peer only
  deletes the ones that really are no longer needed by the peer.
* add_peer_mwi_subs now only adds subscriptions marked as "new" instead
  of unsubscribing and resubscribing everything.  It also adds the peer
  object's address to the mailbox instead of its name to the subscription
  userdata so mwi_event_cb doesn't have to call build_peer.
With these changes, with rtcachefriends=yes (the most common setting),
there are no leaks, locks, loops or crashes at shutdown.
rtcachefriends=no still causes leaks but at least it doesn't lock, loop
or crash.  Since making rtcachefriends=no work wasnt in scope for this
issue, further work will have to be deferred to a separate patch.
Side fixes...
 * The ast_lock_track structure had a member named "thread" which gdb
   doesn't like since it conflicts with it's "thread" command.  That
   member was renamed to "thread_id".
ASTERISK-25468 #close
Change-Id: I07519ef7f092629e1e844f855abd279d6475cdd0
											
										 
											2016-09-20 08:42:15 -06:00
										 |  |  | 		if (lt->reentrancy && (lt->thread_id[ROFFSET] != pthread_self())) { | 
					
						
							| 
									
										
										
										
											2018-09-28 14:31:37 -04:00
										 |  |  | 			log_mutex_error(canlog, "%s line %d (%s): attempted wait using mutex '%s' without owning it!\n", | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 					   filename, lineno, func, mutex_name); | 
					
						
							| 
									
										
										
										
											2018-09-28 14:31:37 -04:00
										 |  |  | 			log_mutex_error(canlog, "%s line %d (%s): '%s' was locked here.\n", | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 					   lt->file[ROFFSET], lt->lineno[ROFFSET], lt->func[ROFFSET], mutex_name); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #ifdef HAVE_BKTR
 | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 			__dump_backtrace(<->backtrace[ROFFSET], canlog); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #endif
 | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 			DO_THREAD_CRASH; | 
					
						
							| 
									
										
										
										
											2013-09-09 20:13:40 +00:00
										 |  |  | 		} else if (lt->reentrancy <= 0) { | 
					
						
							| 
									
										
										
										
											2018-09-28 14:31:37 -04:00
										 |  |  | 			log_mutex_error(canlog, "%s line %d (%s): attempted wait using an unlocked mutex '%s'\n", | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 					   filename, lineno, func, mutex_name); | 
					
						
							| 
									
										
										
										
											2013-09-09 20:13:40 +00:00
										 |  |  | 			DO_THREAD_CRASH; | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 		} | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2013-09-09 20:13:40 +00:00
										 |  |  | 		/* Waiting on a condition completely suspends a recursive mutex,
 | 
					
						
							|  |  |  | 		 * even if it's been recursively locked multiple times. Make a | 
					
						
							|  |  |  | 		 * copy of the lock tracking, and reset reentrancy to zero */ | 
					
						
							|  |  |  | 		lt_orig = *lt; | 
					
						
							|  |  |  | 		lt->reentrancy = 0; | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 		ast_reentrancy_unlock(lt); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2013-09-09 20:13:40 +00:00
										 |  |  | 		ast_suspend_lock_info(t); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 	} | 
					
						
							|  |  |  | #endif /* DEBUG_THREADS */
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	res = pthread_cond_timedwait(cond, &t->mutex, abstime); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #ifdef DEBUG_THREADS
 | 
					
						
							|  |  |  | 	if (res && (res != ETIMEDOUT)) { | 
					
						
							| 
									
										
										
										
											2018-09-28 14:31:37 -04:00
										 |  |  | 		log_mutex_error(canlog, "%s line %d (%s): Error waiting on condition mutex '%s'\n", | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 				   filename, lineno, func, strerror(res)); | 
					
						
							|  |  |  | 		DO_THREAD_CRASH; | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 	} else if (lt) { | 
					
						
							|  |  |  | 		restore_lock_tracking(lt, <_orig); | 
					
						
							|  |  |  | 		ast_restore_lock_info(t); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 	} | 
					
						
							|  |  |  | #endif /* DEBUG_THREADS */
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	return res; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-09-13 09:18:04 -06:00
										 |  |  | int __ast_rwlock_init(int tracking, const char *filename, int lineno, \ | 
					
						
							|  |  |  | 	const char *func, const char *rwlock_name, ast_rwlock_t *t) | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | { | 
					
						
							|  |  |  | 	int res; | 
					
						
							|  |  |  | 	pthread_rwlockattr_t attr; | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-09-13 09:18:04 -06:00
										 |  |  | #if defined(DEBUG_THREADS) && defined(AST_MUTEX_INIT_W_CONSTRUCTORS) && \
 | 
					
						
							|  |  |  | 	defined(CAN_COMPARE_MUTEX_TO_INIT_VALUE) | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 	if (t->lock != ((pthread_rwlock_t) __AST_RWLOCK_INIT_VALUE)) { | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 		int canlog = tracking && strcmp(filename, "logger.c"); | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-09-28 14:31:37 -04:00
										 |  |  | 		log_mutex_error(canlog, "%s line %d (%s): Warning: rwlock '%s' is already initialized.\n", | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 				filename, lineno, func, rwlock_name); | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 		DO_THREAD_CRASH; | 
					
						
							|  |  |  | 		return EBUSY; | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 	} | 
					
						
							|  |  |  | #endif /* AST_MUTEX_INIT_W_CONSTRUCTORS */
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-09-13 09:18:04 -06:00
										 |  |  | #if defined(DEBUG_THREADS) || defined(DETECT_DEADLOCKS)
 | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 	t->track = NULL; | 
					
						
							| 
									
										
										
										
											2018-09-27 20:32:21 -04:00
										 |  |  | 	t->flags.tracking = tracking; | 
					
						
							|  |  |  | 	t->flags.setup = 0; | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #endif /* DEBUG_THREADS */
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	pthread_rwlockattr_init(&attr); | 
					
						
							|  |  |  | #ifdef HAVE_PTHREAD_RWLOCK_PREFER_WRITER_NP
 | 
					
						
							|  |  |  | 	pthread_rwlockattr_setkind_np(&attr, PTHREAD_RWLOCK_PREFER_WRITER_NP); | 
					
						
							|  |  |  | #endif
 | 
					
						
							|  |  |  | 	res = pthread_rwlock_init(&t->lock, &attr); | 
					
						
							|  |  |  | 	pthread_rwlockattr_destroy(&attr); | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 	return res; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | int __ast_rwlock_destroy(const char *filename, int lineno, const char *func, const char *rwlock_name, ast_rwlock_t *t) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  | 	int res; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #ifdef DEBUG_THREADS
 | 
					
						
							| 
									
										
										
										
											2018-09-27 20:32:21 -04:00
										 |  |  | 	struct ast_lock_track *lt = ast_get_reentrancy(&t->track, &t->flags, 1); | 
					
						
							|  |  |  | 	int canlog = t->flags.tracking && strcmp(filename, "logger.c"); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  | #if defined(AST_MUTEX_INIT_W_CONSTRUCTORS) && defined(CAN_COMPARE_MUTEX_TO_INIT_VALUE)
 | 
					
						
							|  |  |  | 	if (t->lock == ((pthread_rwlock_t) __AST_RWLOCK_INIT_VALUE)) { | 
					
						
							| 
									
										
										
										
											2018-09-28 14:31:37 -04:00
										 |  |  | 		log_mutex_error(canlog, "%s line %d (%s): Warning: rwlock '%s' is uninitialized.\n", | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 				   filename, lineno, func, rwlock_name); | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 		DO_THREAD_CRASH; | 
					
						
							|  |  |  | 		res = EINVAL; | 
					
						
							|  |  |  | 		goto lt_cleanup; | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 	} | 
					
						
							|  |  |  | #endif /* AST_MUTEX_INIT_W_CONSTRUCTORS */
 | 
					
						
							|  |  |  | #endif /* DEBUG_THREADS */
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	res = pthread_rwlock_destroy(&t->lock); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #ifdef DEBUG_THREADS
 | 
					
						
							|  |  |  | 	if (res) { | 
					
						
							| 
									
										
										
										
											2018-09-28 14:31:37 -04:00
										 |  |  | 		log_mutex_error(canlog, "%s line %d (%s): Error destroying rwlock %s: %s\n", | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 				filename, lineno, func, rwlock_name, strerror(res)); | 
					
						
							|  |  |  | 	} | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | #if defined(AST_MUTEX_INIT_W_CONSTRUCTORS) && defined(CAN_COMPARE_MUTEX_TO_INIT_VALUE)
 | 
					
						
							|  |  |  | lt_cleanup: | 
					
						
							|  |  |  | #endif /* AST_MUTEX_INIT_W_CONSTRUCTORS */
 | 
					
						
							|  |  |  | 	if (lt) { | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 		ast_reentrancy_lock(lt); | 
					
						
							|  |  |  | 		lt->file[0] = filename; | 
					
						
							|  |  |  | 		lt->lineno[0] = lineno; | 
					
						
							|  |  |  | 		lt->func[0] = func; | 
					
						
							|  |  |  | 		lt->reentrancy = 0; | 
					
						
							| 
									
										
											  
											
												chan_sip:  Address runaway when realtime peers subscribe to mailboxes
Users upgrading from asterisk 13.5 to a later version and who use
realtime with peers that have mailboxes were experiencing runaway
situations that manifested as a continuous stream of taskprocessor
congestion errors, memory leaks and an unresponsive chan_sip.
A related issue was that setting rtcachefriends=no NEVER worked in
asterisk 13 (since the move to stasis).  In 13.5 and earlier, when a
peer tried to register, all of the stasis threads would block and
chan_sip would again become unresponsive.  After 13.5, the runaway
would happen.
There were a number of causes...
* mwi_event_cb was (indirectly) calling build_peer even though calls to
  mwi_event_cb are often caused by build_peer.
* In an effort to prevent chan_sip from being unloaded while messages
  were still in flight, destroy_mailboxes was calling
  stasis_unsubscribe_and_join but in some cases waited forever for the
  final message.
* add_peer_mailboxes wasn't properly marking the existing mailboxes
  on a peer as "keep" so build_peer would always delete them all.
* add_peer_mwi_subs was unsubscribing existing mailbox subscriptions
  then just creating them again.
All of this was causing a flood of subscribes and unsubscribes on
multiple threads all for the same peer and mailbox.
Fixes...
* add_peer_mailboxes now marks mailboxes correctly and build_peer only
  deletes the ones that really are no longer needed by the peer.
* add_peer_mwi_subs now only adds subscriptions marked as "new" instead
  of unsubscribing and resubscribing everything.  It also adds the peer
  object's address to the mailbox instead of its name to the subscription
  userdata so mwi_event_cb doesn't have to call build_peer.
With these changes, with rtcachefriends=yes (the most common setting),
there are no leaks, locks, loops or crashes at shutdown.
rtcachefriends=no still causes leaks but at least it doesn't lock, loop
or crash.  Since making rtcachefriends=no work wasnt in scope for this
issue, further work will have to be deferred to a separate patch.
Side fixes...
 * The ast_lock_track structure had a member named "thread" which gdb
   doesn't like since it conflicts with it's "thread" command.  That
   member was renamed to "thread_id".
ASTERISK-25468 #close
Change-Id: I07519ef7f092629e1e844f855abd279d6475cdd0
											
										 
											2016-09-20 08:42:15 -06:00
										 |  |  | 		lt->thread_id[0] = 0; | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #ifdef HAVE_BKTR
 | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 		memset(<->backtrace[0], 0, sizeof(lt->backtrace[0])); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #endif
 | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 		ast_reentrancy_unlock(lt); | 
					
						
							|  |  |  | 		delete_reentrancy_cs(&t->track); | 
					
						
							|  |  |  | 	} | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #endif /* DEBUG_THREADS */
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	return res; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | int __ast_rwlock_unlock(const char *filename, int line, const char *func, ast_rwlock_t *t, const char *name) | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | { | 
					
						
							|  |  |  | 	int res; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #ifdef DEBUG_THREADS
 | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 	struct ast_lock_track *lt = NULL; | 
					
						
							| 
									
										
										
										
											2018-09-27 20:32:21 -04:00
										 |  |  | 	int canlog = t->flags.tracking && strcmp(filename, "logger.c"); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 	struct ast_bt *bt = NULL; | 
					
						
							|  |  |  | 	int lock_found = 0; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #if defined(AST_MUTEX_INIT_W_CONSTRUCTORS) && defined(CAN_COMPARE_MUTEX_TO_INIT_VALUE)
 | 
					
						
							|  |  |  | 	if ((t->lock) == ((pthread_rwlock_t) __AST_RWLOCK_INIT_VALUE)) { | 
					
						
							| 
									
										
										
										
											2018-09-28 14:31:37 -04:00
										 |  |  | 		log_mutex_error(canlog, "%s line %d (%s): Warning: rwlock '%s' is uninitialized.\n", | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 				   filename, line, func, name); | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 		DO_THREAD_CRASH; | 
					
						
							|  |  |  | 		return EINVAL; | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 	} | 
					
						
							|  |  |  | #endif /* AST_MUTEX_INIT_W_CONSTRUCTORS */
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-09-27 20:32:21 -04:00
										 |  |  | 	lt = ast_get_reentrancy(&t->track, &t->flags, 0); | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 	if (lt) { | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 		ast_reentrancy_lock(lt); | 
					
						
							|  |  |  | 		if (lt->reentrancy) { | 
					
						
							|  |  |  | 			int i; | 
					
						
							|  |  |  | 			pthread_t self = pthread_self(); | 
					
						
							|  |  |  | 			for (i = lt->reentrancy - 1; i >= 0; --i) { | 
					
						
							| 
									
										
											  
											
												chan_sip:  Address runaway when realtime peers subscribe to mailboxes
Users upgrading from asterisk 13.5 to a later version and who use
realtime with peers that have mailboxes were experiencing runaway
situations that manifested as a continuous stream of taskprocessor
congestion errors, memory leaks and an unresponsive chan_sip.
A related issue was that setting rtcachefriends=no NEVER worked in
asterisk 13 (since the move to stasis).  In 13.5 and earlier, when a
peer tried to register, all of the stasis threads would block and
chan_sip would again become unresponsive.  After 13.5, the runaway
would happen.
There were a number of causes...
* mwi_event_cb was (indirectly) calling build_peer even though calls to
  mwi_event_cb are often caused by build_peer.
* In an effort to prevent chan_sip from being unloaded while messages
  were still in flight, destroy_mailboxes was calling
  stasis_unsubscribe_and_join but in some cases waited forever for the
  final message.
* add_peer_mailboxes wasn't properly marking the existing mailboxes
  on a peer as "keep" so build_peer would always delete them all.
* add_peer_mwi_subs was unsubscribing existing mailbox subscriptions
  then just creating them again.
All of this was causing a flood of subscribes and unsubscribes on
multiple threads all for the same peer and mailbox.
Fixes...
* add_peer_mailboxes now marks mailboxes correctly and build_peer only
  deletes the ones that really are no longer needed by the peer.
* add_peer_mwi_subs now only adds subscriptions marked as "new" instead
  of unsubscribing and resubscribing everything.  It also adds the peer
  object's address to the mailbox instead of its name to the subscription
  userdata so mwi_event_cb doesn't have to call build_peer.
With these changes, with rtcachefriends=yes (the most common setting),
there are no leaks, locks, loops or crashes at shutdown.
rtcachefriends=no still causes leaks but at least it doesn't lock, loop
or crash.  Since making rtcachefriends=no work wasnt in scope for this
issue, further work will have to be deferred to a separate patch.
Side fixes...
 * The ast_lock_track structure had a member named "thread" which gdb
   doesn't like since it conflicts with it's "thread" command.  That
   member was renamed to "thread_id".
ASTERISK-25468 #close
Change-Id: I07519ef7f092629e1e844f855abd279d6475cdd0
											
										 
											2016-09-20 08:42:15 -06:00
										 |  |  | 				if (lt->thread_id[i] == self) { | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 					lock_found = 1; | 
					
						
							|  |  |  | 					if (i != lt->reentrancy - 1) { | 
					
						
							|  |  |  | 						lt->file[i] = lt->file[lt->reentrancy - 1]; | 
					
						
							|  |  |  | 						lt->lineno[i] = lt->lineno[lt->reentrancy - 1]; | 
					
						
							|  |  |  | 						lt->func[i] = lt->func[lt->reentrancy - 1]; | 
					
						
							| 
									
										
											  
											
												chan_sip:  Address runaway when realtime peers subscribe to mailboxes
Users upgrading from asterisk 13.5 to a later version and who use
realtime with peers that have mailboxes were experiencing runaway
situations that manifested as a continuous stream of taskprocessor
congestion errors, memory leaks and an unresponsive chan_sip.
A related issue was that setting rtcachefriends=no NEVER worked in
asterisk 13 (since the move to stasis).  In 13.5 and earlier, when a
peer tried to register, all of the stasis threads would block and
chan_sip would again become unresponsive.  After 13.5, the runaway
would happen.
There were a number of causes...
* mwi_event_cb was (indirectly) calling build_peer even though calls to
  mwi_event_cb are often caused by build_peer.
* In an effort to prevent chan_sip from being unloaded while messages
  were still in flight, destroy_mailboxes was calling
  stasis_unsubscribe_and_join but in some cases waited forever for the
  final message.
* add_peer_mailboxes wasn't properly marking the existing mailboxes
  on a peer as "keep" so build_peer would always delete them all.
* add_peer_mwi_subs was unsubscribing existing mailbox subscriptions
  then just creating them again.
All of this was causing a flood of subscribes and unsubscribes on
multiple threads all for the same peer and mailbox.
Fixes...
* add_peer_mailboxes now marks mailboxes correctly and build_peer only
  deletes the ones that really are no longer needed by the peer.
* add_peer_mwi_subs now only adds subscriptions marked as "new" instead
  of unsubscribing and resubscribing everything.  It also adds the peer
  object's address to the mailbox instead of its name to the subscription
  userdata so mwi_event_cb doesn't have to call build_peer.
With these changes, with rtcachefriends=yes (the most common setting),
there are no leaks, locks, loops or crashes at shutdown.
rtcachefriends=no still causes leaks but at least it doesn't lock, loop
or crash.  Since making rtcachefriends=no work wasnt in scope for this
issue, further work will have to be deferred to a separate patch.
Side fixes...
 * The ast_lock_track structure had a member named "thread" which gdb
   doesn't like since it conflicts with it's "thread" command.  That
   member was renamed to "thread_id".
ASTERISK-25468 #close
Change-Id: I07519ef7f092629e1e844f855abd279d6475cdd0
											
										 
											2016-09-20 08:42:15 -06:00
										 |  |  | 						lt->thread_id[i] = lt->thread_id[lt->reentrancy - 1]; | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 					} | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #ifdef HAVE_BKTR
 | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 					bt = <->backtrace[i]; | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #endif
 | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 					lt->file[lt->reentrancy - 1] = NULL; | 
					
						
							|  |  |  | 					lt->lineno[lt->reentrancy - 1] = 0; | 
					
						
							|  |  |  | 					lt->func[lt->reentrancy - 1] = NULL; | 
					
						
							| 
									
										
											  
											
												chan_sip:  Address runaway when realtime peers subscribe to mailboxes
Users upgrading from asterisk 13.5 to a later version and who use
realtime with peers that have mailboxes were experiencing runaway
situations that manifested as a continuous stream of taskprocessor
congestion errors, memory leaks and an unresponsive chan_sip.
A related issue was that setting rtcachefriends=no NEVER worked in
asterisk 13 (since the move to stasis).  In 13.5 and earlier, when a
peer tried to register, all of the stasis threads would block and
chan_sip would again become unresponsive.  After 13.5, the runaway
would happen.
There were a number of causes...
* mwi_event_cb was (indirectly) calling build_peer even though calls to
  mwi_event_cb are often caused by build_peer.
* In an effort to prevent chan_sip from being unloaded while messages
  were still in flight, destroy_mailboxes was calling
  stasis_unsubscribe_and_join but in some cases waited forever for the
  final message.
* add_peer_mailboxes wasn't properly marking the existing mailboxes
  on a peer as "keep" so build_peer would always delete them all.
* add_peer_mwi_subs was unsubscribing existing mailbox subscriptions
  then just creating them again.
All of this was causing a flood of subscribes and unsubscribes on
multiple threads all for the same peer and mailbox.
Fixes...
* add_peer_mailboxes now marks mailboxes correctly and build_peer only
  deletes the ones that really are no longer needed by the peer.
* add_peer_mwi_subs now only adds subscriptions marked as "new" instead
  of unsubscribing and resubscribing everything.  It also adds the peer
  object's address to the mailbox instead of its name to the subscription
  userdata so mwi_event_cb doesn't have to call build_peer.
With these changes, with rtcachefriends=yes (the most common setting),
there are no leaks, locks, loops or crashes at shutdown.
rtcachefriends=no still causes leaks but at least it doesn't lock, loop
or crash.  Since making rtcachefriends=no work wasnt in scope for this
issue, further work will have to be deferred to a separate patch.
Side fixes...
 * The ast_lock_track structure had a member named "thread" which gdb
   doesn't like since it conflicts with it's "thread" command.  That
   member was renamed to "thread_id".
ASTERISK-25468 #close
Change-Id: I07519ef7f092629e1e844f855abd279d6475cdd0
											
										 
											2016-09-20 08:42:15 -06:00
										 |  |  | 					lt->thread_id[lt->reentrancy - 1] = AST_PTHREADT_NULL; | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 					break; | 
					
						
							|  |  |  | 				} | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 			} | 
					
						
							|  |  |  | 		} | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 		if (lock_found && --lt->reentrancy < 0) { | 
					
						
							| 
									
										
										
										
											2018-09-28 14:31:37 -04:00
										 |  |  | 			log_mutex_error(canlog, "%s line %d (%s): rwlock '%s' freed more times than we've locked!\n", | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 					filename, line, func, name); | 
					
						
							|  |  |  | 			lt->reentrancy = 0; | 
					
						
							|  |  |  | 		} | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 		ast_reentrancy_unlock(lt); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  | 		ast_remove_lock_info(t, bt); | 
					
						
							|  |  |  | 	} | 
					
						
							|  |  |  | #endif /* DEBUG_THREADS */
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	res = pthread_rwlock_unlock(&t->lock); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #ifdef DEBUG_THREADS
 | 
					
						
							|  |  |  | 	if (res) { | 
					
						
							| 
									
										
										
										
											2018-09-28 14:31:37 -04:00
										 |  |  | 		log_mutex_error(canlog, "%s line %d (%s): Error releasing rwlock: %s\n", | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 				filename, line, func, strerror(res)); | 
					
						
							|  |  |  | 		DO_THREAD_CRASH; | 
					
						
							|  |  |  | 	} | 
					
						
							|  |  |  | #endif /* DEBUG_THREADS */
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	return res; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-09-13 09:18:04 -06:00
										 |  |  | int __ast_rwlock_rdlock(const char *filename, int line, const char *func, | 
					
						
							|  |  |  | 	ast_rwlock_t *t, const char *name) | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | { | 
					
						
							|  |  |  | 	int res; | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-09-13 09:18:04 -06:00
										 |  |  | #if defined(DEBUG_THREADS) || defined(DETECT_DEADLOCKS)
 | 
					
						
							|  |  |  | 	int canlog = t->flags.tracking && strcmp(filename, "logger.c"); | 
					
						
							|  |  |  | #endif
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #ifdef DEBUG_THREADS
 | 
					
						
							| 
									
										
										
										
											2018-09-27 20:32:21 -04:00
										 |  |  | 	struct ast_lock_track *lt = ast_get_reentrancy(&t->track, &t->flags, 0); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 	struct ast_bt *bt = NULL; | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 	if (lt) { | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #ifdef HAVE_BKTR
 | 
					
						
							| 
									
										
										
										
											2013-09-09 20:13:40 +00:00
										 |  |  | 		struct ast_bt tmp; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 		/* The implementation of backtrace() may have its own locks.
 | 
					
						
							|  |  |  | 		 * Capture the backtrace outside of the reentrancy lock to | 
					
						
							|  |  |  | 		 * avoid deadlocks. See ASTERISK-22455. */ | 
					
						
							|  |  |  | 		ast_bt_get_addresses(&tmp); | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 		ast_reentrancy_lock(lt); | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 		if (lt->reentrancy < AST_MAX_REENTRANCY) { | 
					
						
							| 
									
										
										
										
											2013-09-09 20:13:40 +00:00
										 |  |  | 			lt->backtrace[lt->reentrancy] = tmp; | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 			bt = <->backtrace[lt->reentrancy]; | 
					
						
							|  |  |  | 		} | 
					
						
							|  |  |  | 		ast_reentrancy_unlock(lt); | 
					
						
							|  |  |  | #endif
 | 
					
						
							| 
									
										
										
										
											2017-10-23 01:55:18 -04:00
										 |  |  | 		ast_store_lock_info(AST_RDLOCK, filename, line, func, name, t, bt); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 	} | 
					
						
							|  |  |  | #endif /* DEBUG_THREADS */
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-09-13 09:18:04 -06:00
										 |  |  | #if defined(DETECT_DEADLOCKS)
 | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 	{ | 
					
						
							|  |  |  | 		time_t seconds = time(NULL); | 
					
						
							|  |  |  | 		time_t wait_time, reported_wait = 0; | 
					
						
							|  |  |  | 		do { | 
					
						
							|  |  |  | 			res = pthread_rwlock_tryrdlock(&t->lock); | 
					
						
							|  |  |  | 			if (res == EBUSY) { | 
					
						
							|  |  |  | 				wait_time = time(NULL) - seconds; | 
					
						
							|  |  |  | 				if (wait_time > reported_wait && (wait_time % 5) == 0) { | 
					
						
							| 
									
										
										
										
											2018-09-28 14:31:37 -04:00
										 |  |  | 					log_mutex_error(canlog, "%s line %d (%s): Deadlock? waited %d sec for readlock '%s'?\n", | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 						filename, line, func, (int)wait_time, name); | 
					
						
							| 
									
										
										
										
											2023-09-13 09:18:04 -06:00
										 |  |  | #ifdef DEBUG_THREADS
 | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 					if (lt) { | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 						ast_reentrancy_lock(lt); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #ifdef HAVE_BKTR
 | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 						__dump_backtrace(<->backtrace[lt->reentrancy], canlog); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #endif
 | 
					
						
							| 
									
										
										
										
											2018-09-28 14:31:37 -04:00
										 |  |  | 						log_mutex_error(canlog, "%s line %d (%s): '%s' was locked  here.\n", | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 								lt->file[lt->reentrancy-1], lt->lineno[lt->reentrancy-1], | 
					
						
							|  |  |  | 								lt->func[lt->reentrancy-1], name); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #ifdef HAVE_BKTR
 | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 						__dump_backtrace(<->backtrace[lt->reentrancy-1], canlog); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #endif
 | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 						ast_reentrancy_unlock(lt); | 
					
						
							|  |  |  | 					} | 
					
						
							| 
									
										
										
										
											2023-09-13 09:18:04 -06:00
										 |  |  | #endif
 | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 					reported_wait = wait_time; | 
					
						
							|  |  |  | 				} | 
					
						
							|  |  |  | 				usleep(200); | 
					
						
							|  |  |  | 			} | 
					
						
							|  |  |  | 		} while (res == EBUSY); | 
					
						
							|  |  |  | 	} | 
					
						
							| 
									
										
										
										
											2023-09-13 09:18:04 -06:00
										 |  |  | #else /* !DETECT_DEADLOCKS */
 | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 	res = pthread_rwlock_rdlock(&t->lock); | 
					
						
							| 
									
										
										
										
											2023-09-13 09:18:04 -06:00
										 |  |  | #endif /* !DETECT_DEADLOCKS */
 | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  | #ifdef DEBUG_THREADS
 | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 	if (!res && lt) { | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 		ast_reentrancy_lock(lt); | 
					
						
							|  |  |  | 		if (lt->reentrancy < AST_MAX_REENTRANCY) { | 
					
						
							|  |  |  | 			lt->file[lt->reentrancy] = filename; | 
					
						
							|  |  |  | 			lt->lineno[lt->reentrancy] = line; | 
					
						
							|  |  |  | 			lt->func[lt->reentrancy] = func; | 
					
						
							| 
									
										
											  
											
												chan_sip:  Address runaway when realtime peers subscribe to mailboxes
Users upgrading from asterisk 13.5 to a later version and who use
realtime with peers that have mailboxes were experiencing runaway
situations that manifested as a continuous stream of taskprocessor
congestion errors, memory leaks and an unresponsive chan_sip.
A related issue was that setting rtcachefriends=no NEVER worked in
asterisk 13 (since the move to stasis).  In 13.5 and earlier, when a
peer tried to register, all of the stasis threads would block and
chan_sip would again become unresponsive.  After 13.5, the runaway
would happen.
There were a number of causes...
* mwi_event_cb was (indirectly) calling build_peer even though calls to
  mwi_event_cb are often caused by build_peer.
* In an effort to prevent chan_sip from being unloaded while messages
  were still in flight, destroy_mailboxes was calling
  stasis_unsubscribe_and_join but in some cases waited forever for the
  final message.
* add_peer_mailboxes wasn't properly marking the existing mailboxes
  on a peer as "keep" so build_peer would always delete them all.
* add_peer_mwi_subs was unsubscribing existing mailbox subscriptions
  then just creating them again.
All of this was causing a flood of subscribes and unsubscribes on
multiple threads all for the same peer and mailbox.
Fixes...
* add_peer_mailboxes now marks mailboxes correctly and build_peer only
  deletes the ones that really are no longer needed by the peer.
* add_peer_mwi_subs now only adds subscriptions marked as "new" instead
  of unsubscribing and resubscribing everything.  It also adds the peer
  object's address to the mailbox instead of its name to the subscription
  userdata so mwi_event_cb doesn't have to call build_peer.
With these changes, with rtcachefriends=yes (the most common setting),
there are no leaks, locks, loops or crashes at shutdown.
rtcachefriends=no still causes leaks but at least it doesn't lock, loop
or crash.  Since making rtcachefriends=no work wasnt in scope for this
issue, further work will have to be deferred to a separate patch.
Side fixes...
 * The ast_lock_track structure had a member named "thread" which gdb
   doesn't like since it conflicts with it's "thread" command.  That
   member was renamed to "thread_id".
ASTERISK-25468 #close
Change-Id: I07519ef7f092629e1e844f855abd279d6475cdd0
											
										 
											2016-09-20 08:42:15 -06:00
										 |  |  | 			lt->thread_id[lt->reentrancy] = pthread_self(); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 			lt->reentrancy++; | 
					
						
							|  |  |  | 		} | 
					
						
							|  |  |  | 		ast_reentrancy_unlock(lt); | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 		ast_mark_lock_acquired(t); | 
					
						
							|  |  |  | 	} else if (lt) { | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #ifdef HAVE_BKTR
 | 
					
						
							|  |  |  | 		if (lt->reentrancy) { | 
					
						
							|  |  |  | 			ast_reentrancy_lock(lt); | 
					
						
							|  |  |  | 			bt = <->backtrace[lt->reentrancy-1]; | 
					
						
							|  |  |  | 			ast_reentrancy_unlock(lt); | 
					
						
							|  |  |  | 		} else { | 
					
						
							|  |  |  | 			bt = NULL; | 
					
						
							|  |  |  | 		} | 
					
						
							|  |  |  | #endif
 | 
					
						
							| 
									
										
										
										
											2017-10-23 01:55:18 -04:00
										 |  |  | 		ast_remove_lock_info(t, bt); | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 	} | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	if (res) { | 
					
						
							| 
									
										
										
										
											2018-09-28 14:31:37 -04:00
										 |  |  | 		log_mutex_error(canlog, "%s line %d (%s): Error obtaining read lock: %s\n", | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 				filename, line, func, strerror(res)); | 
					
						
							|  |  |  | 		DO_THREAD_CRASH; | 
					
						
							|  |  |  | 	} | 
					
						
							|  |  |  | #endif /* DEBUG_THREADS */
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	return res; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-09-13 09:18:04 -06:00
										 |  |  | int __ast_rwlock_wrlock(const char *filename, int line, const char *func, \ | 
					
						
							|  |  |  | 	ast_rwlock_t *t, const char *name) | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | { | 
					
						
							|  |  |  | 	int res; | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-09-13 09:18:04 -06:00
										 |  |  | #if defined(DEBUG_THREADS) || defined(DETECT_DEADLOCKS)
 | 
					
						
							|  |  |  | 	int canlog = t->flags.tracking && strcmp(filename, "logger.c"); | 
					
						
							|  |  |  | #endif
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #ifdef DEBUG_THREADS
 | 
					
						
							| 
									
										
										
										
											2018-09-27 20:32:21 -04:00
										 |  |  | 	struct ast_lock_track *lt = ast_get_reentrancy(&t->track, &t->flags, 0); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 	struct ast_bt *bt = NULL; | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 	if (lt) { | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #ifdef HAVE_BKTR
 | 
					
						
							| 
									
										
										
										
											2013-09-09 20:13:40 +00:00
										 |  |  | 		struct ast_bt tmp; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 		/* The implementation of backtrace() may have its own locks.
 | 
					
						
							|  |  |  | 		 * Capture the backtrace outside of the reentrancy lock to | 
					
						
							|  |  |  | 		 * avoid deadlocks. See ASTERISK-22455. */ | 
					
						
							|  |  |  | 		ast_bt_get_addresses(&tmp); | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 		ast_reentrancy_lock(lt); | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 		if (lt->reentrancy < AST_MAX_REENTRANCY) { | 
					
						
							| 
									
										
										
										
											2013-09-09 20:13:40 +00:00
										 |  |  | 			lt->backtrace[lt->reentrancy] = tmp; | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 			bt = <->backtrace[lt->reentrancy]; | 
					
						
							|  |  |  | 		} | 
					
						
							|  |  |  | 		ast_reentrancy_unlock(lt); | 
					
						
							|  |  |  | #endif
 | 
					
						
							| 
									
										
										
										
											2017-10-23 01:55:18 -04:00
										 |  |  | 		ast_store_lock_info(AST_WRLOCK, filename, line, func, name, t, bt); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 	} | 
					
						
							|  |  |  | #endif /* DEBUG_THREADS */
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-09-13 09:18:04 -06:00
										 |  |  | #ifdef DETECT_DEADLOCKS
 | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 	{ | 
					
						
							|  |  |  | 		time_t seconds = time(NULL); | 
					
						
							|  |  |  | 		time_t wait_time, reported_wait = 0; | 
					
						
							|  |  |  | 		do { | 
					
						
							|  |  |  | 			res = pthread_rwlock_trywrlock(&t->lock); | 
					
						
							|  |  |  | 			if (res == EBUSY) { | 
					
						
							|  |  |  | 				wait_time = time(NULL) - seconds; | 
					
						
							|  |  |  | 				if (wait_time > reported_wait && (wait_time % 5) == 0) { | 
					
						
							| 
									
										
										
										
											2018-09-28 14:31:37 -04:00
										 |  |  | 					log_mutex_error(canlog, "%s line %d (%s): Deadlock? waited %d sec for writelock '%s'?\n", | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 						filename, line, func, (int)wait_time, name); | 
					
						
							| 
									
										
										
										
											2023-09-13 09:18:04 -06:00
										 |  |  | #ifdef DEBUG_THREADS
 | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 					if (lt) { | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 						ast_reentrancy_lock(lt); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #ifdef HAVE_BKTR
 | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 						__dump_backtrace(<->backtrace[lt->reentrancy], canlog); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #endif
 | 
					
						
							| 
									
										
										
										
											2018-09-28 14:31:37 -04:00
										 |  |  | 						log_mutex_error(canlog, "%s line %d (%s): '%s' was locked  here.\n", | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 								lt->file[lt->reentrancy-1], lt->lineno[lt->reentrancy-1], | 
					
						
							|  |  |  | 								lt->func[lt->reentrancy-1], name); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #ifdef HAVE_BKTR
 | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 						__dump_backtrace(<->backtrace[lt->reentrancy-1], canlog); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #endif
 | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 						ast_reentrancy_unlock(lt); | 
					
						
							|  |  |  | 					} | 
					
						
							| 
									
										
										
										
											2023-09-13 09:18:04 -06:00
										 |  |  | #endif
 | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 					reported_wait = wait_time; | 
					
						
							|  |  |  | 				} | 
					
						
							|  |  |  | 				usleep(200); | 
					
						
							|  |  |  | 			} | 
					
						
							|  |  |  | 		} while (res == EBUSY); | 
					
						
							|  |  |  | 	} | 
					
						
							| 
									
										
										
										
											2023-09-13 09:18:04 -06:00
										 |  |  | #else /* !DETECT_DEADLOCKS */
 | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 	res = pthread_rwlock_wrlock(&t->lock); | 
					
						
							| 
									
										
										
										
											2023-09-13 09:18:04 -06:00
										 |  |  | #endif /* !DETECT_DEADLOCKS */
 | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  | #ifdef DEBUG_THREADS
 | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 	if (!res && lt) { | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 		ast_reentrancy_lock(lt); | 
					
						
							|  |  |  | 		if (lt->reentrancy < AST_MAX_REENTRANCY) { | 
					
						
							|  |  |  | 			lt->file[lt->reentrancy] = filename; | 
					
						
							|  |  |  | 			lt->lineno[lt->reentrancy] = line; | 
					
						
							|  |  |  | 			lt->func[lt->reentrancy] = func; | 
					
						
							| 
									
										
											  
											
												chan_sip:  Address runaway when realtime peers subscribe to mailboxes
Users upgrading from asterisk 13.5 to a later version and who use
realtime with peers that have mailboxes were experiencing runaway
situations that manifested as a continuous stream of taskprocessor
congestion errors, memory leaks and an unresponsive chan_sip.
A related issue was that setting rtcachefriends=no NEVER worked in
asterisk 13 (since the move to stasis).  In 13.5 and earlier, when a
peer tried to register, all of the stasis threads would block and
chan_sip would again become unresponsive.  After 13.5, the runaway
would happen.
There were a number of causes...
* mwi_event_cb was (indirectly) calling build_peer even though calls to
  mwi_event_cb are often caused by build_peer.
* In an effort to prevent chan_sip from being unloaded while messages
  were still in flight, destroy_mailboxes was calling
  stasis_unsubscribe_and_join but in some cases waited forever for the
  final message.
* add_peer_mailboxes wasn't properly marking the existing mailboxes
  on a peer as "keep" so build_peer would always delete them all.
* add_peer_mwi_subs was unsubscribing existing mailbox subscriptions
  then just creating them again.
All of this was causing a flood of subscribes and unsubscribes on
multiple threads all for the same peer and mailbox.
Fixes...
* add_peer_mailboxes now marks mailboxes correctly and build_peer only
  deletes the ones that really are no longer needed by the peer.
* add_peer_mwi_subs now only adds subscriptions marked as "new" instead
  of unsubscribing and resubscribing everything.  It also adds the peer
  object's address to the mailbox instead of its name to the subscription
  userdata so mwi_event_cb doesn't have to call build_peer.
With these changes, with rtcachefriends=yes (the most common setting),
there are no leaks, locks, loops or crashes at shutdown.
rtcachefriends=no still causes leaks but at least it doesn't lock, loop
or crash.  Since making rtcachefriends=no work wasnt in scope for this
issue, further work will have to be deferred to a separate patch.
Side fixes...
 * The ast_lock_track structure had a member named "thread" which gdb
   doesn't like since it conflicts with it's "thread" command.  That
   member was renamed to "thread_id".
ASTERISK-25468 #close
Change-Id: I07519ef7f092629e1e844f855abd279d6475cdd0
											
										 
											2016-09-20 08:42:15 -06:00
										 |  |  | 			lt->thread_id[lt->reentrancy] = pthread_self(); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 			lt->reentrancy++; | 
					
						
							|  |  |  | 		} | 
					
						
							|  |  |  | 		ast_reentrancy_unlock(lt); | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 		ast_mark_lock_acquired(t); | 
					
						
							|  |  |  | 	} else if (lt) { | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #ifdef HAVE_BKTR
 | 
					
						
							|  |  |  | 		if (lt->reentrancy) { | 
					
						
							|  |  |  | 			ast_reentrancy_lock(lt); | 
					
						
							|  |  |  | 			bt = <->backtrace[lt->reentrancy-1]; | 
					
						
							|  |  |  | 			ast_reentrancy_unlock(lt); | 
					
						
							|  |  |  | 		} else { | 
					
						
							|  |  |  | 			bt = NULL; | 
					
						
							|  |  |  | 		} | 
					
						
							|  |  |  | #endif
 | 
					
						
							| 
									
										
										
										
											2017-10-23 01:55:18 -04:00
										 |  |  | 		ast_remove_lock_info(t, bt); | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 	} | 
					
						
							|  |  |  | 	if (res) { | 
					
						
							| 
									
										
										
										
											2018-09-28 14:31:37 -04:00
										 |  |  | 		log_mutex_error(canlog, "%s line %d (%s): Error obtaining write lock: %s\n", | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 				filename, line, func, strerror(res)); | 
					
						
							|  |  |  | 		DO_THREAD_CRASH; | 
					
						
							|  |  |  | 	} | 
					
						
							|  |  |  | #endif /* DEBUG_THREADS */
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	return res; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | int __ast_rwlock_timedrdlock(const char *filename, int line, const char *func, ast_rwlock_t *t, const char *name, | 
					
						
							|  |  |  | 	const struct timespec *abs_timeout) | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | { | 
					
						
							|  |  |  | 	int res; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #ifdef DEBUG_THREADS
 | 
					
						
							| 
									
										
										
										
											2018-09-27 20:32:21 -04:00
										 |  |  | 	struct ast_lock_track *lt = ast_get_reentrancy(&t->track, &t->flags, 0); | 
					
						
							|  |  |  | 	int canlog = t->flags.tracking && strcmp(filename, "logger.c"); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 	struct ast_bt *bt = NULL; | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 	if (lt) { | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #ifdef HAVE_BKTR
 | 
					
						
							| 
									
										
										
										
											2013-09-09 20:13:40 +00:00
										 |  |  | 		struct ast_bt tmp; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 		/* The implementation of backtrace() may have its own locks.
 | 
					
						
							|  |  |  | 		 * Capture the backtrace outside of the reentrancy lock to | 
					
						
							|  |  |  | 		 * avoid deadlocks. See ASTERISK-22455. */ | 
					
						
							|  |  |  | 		ast_bt_get_addresses(&tmp); | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 		ast_reentrancy_lock(lt); | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 		if (lt->reentrancy < AST_MAX_REENTRANCY) { | 
					
						
							| 
									
										
										
										
											2013-09-09 20:13:40 +00:00
										 |  |  | 			lt->backtrace[lt->reentrancy] = tmp; | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 			bt = <->backtrace[lt->reentrancy]; | 
					
						
							|  |  |  | 		} | 
					
						
							|  |  |  | 		ast_reentrancy_unlock(lt); | 
					
						
							|  |  |  | #endif
 | 
					
						
							| 
									
										
										
										
											2017-10-23 01:55:18 -04:00
										 |  |  | 		ast_store_lock_info(AST_WRLOCK, filename, line, func, name, t, bt); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 	} | 
					
						
							|  |  |  | #endif /* DEBUG_THREADS */
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #ifdef HAVE_PTHREAD_RWLOCK_TIMEDWRLOCK
 | 
					
						
							|  |  |  | 	res = pthread_rwlock_timedrdlock(&t->lock, abs_timeout); | 
					
						
							|  |  |  | #else
 | 
					
						
							|  |  |  | 	do { | 
					
						
							| 
									
										
										
										
											2012-08-27 16:56:56 +00:00
										 |  |  | 		struct timeval _now; | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 		for (;;) { | 
					
						
							|  |  |  | 			if (!(res = pthread_rwlock_tryrdlock(&t->lock))) { | 
					
						
							|  |  |  | 				break; | 
					
						
							|  |  |  | 			} | 
					
						
							| 
									
										
										
										
											2012-08-27 16:56:56 +00:00
										 |  |  | 			_now = ast_tvnow(); | 
					
						
							|  |  |  | 			if (_now.tv_sec > abs_timeout->tv_sec || (_now.tv_sec == abs_timeout->tv_sec && _now.tv_usec * 1000 > abs_timeout->tv_nsec)) { | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 				break; | 
					
						
							|  |  |  | 			} | 
					
						
							|  |  |  | 			usleep(1); | 
					
						
							|  |  |  | 		} | 
					
						
							|  |  |  | 	} while (0); | 
					
						
							|  |  |  | #endif
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #ifdef DEBUG_THREADS
 | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 	if (!res && lt) { | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 		ast_reentrancy_lock(lt); | 
					
						
							|  |  |  | 		if (lt->reentrancy < AST_MAX_REENTRANCY) { | 
					
						
							|  |  |  | 			lt->file[lt->reentrancy] = filename; | 
					
						
							|  |  |  | 			lt->lineno[lt->reentrancy] = line; | 
					
						
							|  |  |  | 			lt->func[lt->reentrancy] = func; | 
					
						
							| 
									
										
											  
											
												chan_sip:  Address runaway when realtime peers subscribe to mailboxes
Users upgrading from asterisk 13.5 to a later version and who use
realtime with peers that have mailboxes were experiencing runaway
situations that manifested as a continuous stream of taskprocessor
congestion errors, memory leaks and an unresponsive chan_sip.
A related issue was that setting rtcachefriends=no NEVER worked in
asterisk 13 (since the move to stasis).  In 13.5 and earlier, when a
peer tried to register, all of the stasis threads would block and
chan_sip would again become unresponsive.  After 13.5, the runaway
would happen.
There were a number of causes...
* mwi_event_cb was (indirectly) calling build_peer even though calls to
  mwi_event_cb are often caused by build_peer.
* In an effort to prevent chan_sip from being unloaded while messages
  were still in flight, destroy_mailboxes was calling
  stasis_unsubscribe_and_join but in some cases waited forever for the
  final message.
* add_peer_mailboxes wasn't properly marking the existing mailboxes
  on a peer as "keep" so build_peer would always delete them all.
* add_peer_mwi_subs was unsubscribing existing mailbox subscriptions
  then just creating them again.
All of this was causing a flood of subscribes and unsubscribes on
multiple threads all for the same peer and mailbox.
Fixes...
* add_peer_mailboxes now marks mailboxes correctly and build_peer only
  deletes the ones that really are no longer needed by the peer.
* add_peer_mwi_subs now only adds subscriptions marked as "new" instead
  of unsubscribing and resubscribing everything.  It also adds the peer
  object's address to the mailbox instead of its name to the subscription
  userdata so mwi_event_cb doesn't have to call build_peer.
With these changes, with rtcachefriends=yes (the most common setting),
there are no leaks, locks, loops or crashes at shutdown.
rtcachefriends=no still causes leaks but at least it doesn't lock, loop
or crash.  Since making rtcachefriends=no work wasnt in scope for this
issue, further work will have to be deferred to a separate patch.
Side fixes...
 * The ast_lock_track structure had a member named "thread" which gdb
   doesn't like since it conflicts with it's "thread" command.  That
   member was renamed to "thread_id".
ASTERISK-25468 #close
Change-Id: I07519ef7f092629e1e844f855abd279d6475cdd0
											
										 
											2016-09-20 08:42:15 -06:00
										 |  |  | 			lt->thread_id[lt->reentrancy] = pthread_self(); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 			lt->reentrancy++; | 
					
						
							|  |  |  | 		} | 
					
						
							|  |  |  | 		ast_reentrancy_unlock(lt); | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 		ast_mark_lock_acquired(t); | 
					
						
							|  |  |  | 	} else if (lt) { | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #ifdef HAVE_BKTR
 | 
					
						
							|  |  |  | 		if (lt->reentrancy) { | 
					
						
							|  |  |  | 			ast_reentrancy_lock(lt); | 
					
						
							|  |  |  | 			bt = <->backtrace[lt->reentrancy-1]; | 
					
						
							|  |  |  | 			ast_reentrancy_unlock(lt); | 
					
						
							|  |  |  | 		} else { | 
					
						
							|  |  |  | 			bt = NULL; | 
					
						
							|  |  |  | 		} | 
					
						
							|  |  |  | #endif
 | 
					
						
							| 
									
										
										
										
											2017-10-23 01:55:18 -04:00
										 |  |  | 		ast_remove_lock_info(t, bt); | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 	} | 
					
						
							|  |  |  | 	if (res) { | 
					
						
							| 
									
										
										
										
											2018-09-28 14:31:37 -04:00
										 |  |  | 		log_mutex_error(canlog, "%s line %d (%s): Error obtaining read lock: %s\n", | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 				filename, line, func, strerror(res)); | 
					
						
							|  |  |  | 		DO_THREAD_CRASH; | 
					
						
							|  |  |  | 	} | 
					
						
							|  |  |  | #endif /* DEBUG_THREADS */
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	return res; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | int __ast_rwlock_timedwrlock(const char *filename, int line, const char *func, ast_rwlock_t *t, const char *name, | 
					
						
							|  |  |  | 	const struct timespec *abs_timeout) | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | { | 
					
						
							|  |  |  | 	int res; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #ifdef DEBUG_THREADS
 | 
					
						
							| 
									
										
										
										
											2018-09-27 20:32:21 -04:00
										 |  |  | 	struct ast_lock_track *lt = ast_get_reentrancy(&t->track, &t->flags, 0); | 
					
						
							|  |  |  | 	int canlog = t->flags.tracking && strcmp(filename, "logger.c"); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 	struct ast_bt *bt = NULL; | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 	if (lt) { | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #ifdef HAVE_BKTR
 | 
					
						
							| 
									
										
										
										
											2013-09-09 20:13:40 +00:00
										 |  |  | 		struct ast_bt tmp; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 		/* The implementation of backtrace() may have its own locks.
 | 
					
						
							|  |  |  | 		 * Capture the backtrace outside of the reentrancy lock to | 
					
						
							|  |  |  | 		 * avoid deadlocks. See ASTERISK-22455. */ | 
					
						
							|  |  |  | 		ast_bt_get_addresses(&tmp); | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 		ast_reentrancy_lock(lt); | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 		if (lt->reentrancy < AST_MAX_REENTRANCY) { | 
					
						
							| 
									
										
										
										
											2013-09-09 20:13:40 +00:00
										 |  |  | 			lt->backtrace[lt->reentrancy] = tmp; | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 			bt = <->backtrace[lt->reentrancy]; | 
					
						
							|  |  |  | 		} | 
					
						
							|  |  |  | 		ast_reentrancy_unlock(lt); | 
					
						
							|  |  |  | #endif
 | 
					
						
							| 
									
										
										
										
											2017-10-23 01:55:18 -04:00
										 |  |  | 		ast_store_lock_info(AST_WRLOCK, filename, line, func, name, t, bt); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 	} | 
					
						
							|  |  |  | #endif /* DEBUG_THREADS */
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #ifdef HAVE_PTHREAD_RWLOCK_TIMEDWRLOCK
 | 
					
						
							|  |  |  | 	res = pthread_rwlock_timedwrlock(&t->lock, abs_timeout); | 
					
						
							|  |  |  | #else
 | 
					
						
							|  |  |  | 	do { | 
					
						
							| 
									
										
										
										
											2012-08-27 16:56:56 +00:00
										 |  |  | 		struct timeval _now; | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 		for (;;) { | 
					
						
							|  |  |  | 			if (!(res = pthread_rwlock_trywrlock(&t->lock))) { | 
					
						
							|  |  |  | 				break; | 
					
						
							|  |  |  | 			} | 
					
						
							| 
									
										
										
										
											2012-08-27 16:56:56 +00:00
										 |  |  | 			_now = ast_tvnow(); | 
					
						
							|  |  |  | 			if (_now.tv_sec > abs_timeout->tv_sec || (_now.tv_sec == abs_timeout->tv_sec && _now.tv_usec * 1000 > abs_timeout->tv_nsec)) { | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 				break; | 
					
						
							|  |  |  | 			} | 
					
						
							|  |  |  | 			usleep(1); | 
					
						
							|  |  |  | 		} | 
					
						
							|  |  |  | 	} while (0); | 
					
						
							|  |  |  | #endif
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #ifdef DEBUG_THREADS
 | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 	if (!res && lt) { | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 		ast_reentrancy_lock(lt); | 
					
						
							|  |  |  | 		if (lt->reentrancy < AST_MAX_REENTRANCY) { | 
					
						
							|  |  |  | 			lt->file[lt->reentrancy] = filename; | 
					
						
							|  |  |  | 			lt->lineno[lt->reentrancy] = line; | 
					
						
							|  |  |  | 			lt->func[lt->reentrancy] = func; | 
					
						
							| 
									
										
											  
											
												chan_sip:  Address runaway when realtime peers subscribe to mailboxes
Users upgrading from asterisk 13.5 to a later version and who use
realtime with peers that have mailboxes were experiencing runaway
situations that manifested as a continuous stream of taskprocessor
congestion errors, memory leaks and an unresponsive chan_sip.
A related issue was that setting rtcachefriends=no NEVER worked in
asterisk 13 (since the move to stasis).  In 13.5 and earlier, when a
peer tried to register, all of the stasis threads would block and
chan_sip would again become unresponsive.  After 13.5, the runaway
would happen.
There were a number of causes...
* mwi_event_cb was (indirectly) calling build_peer even though calls to
  mwi_event_cb are often caused by build_peer.
* In an effort to prevent chan_sip from being unloaded while messages
  were still in flight, destroy_mailboxes was calling
  stasis_unsubscribe_and_join but in some cases waited forever for the
  final message.
* add_peer_mailboxes wasn't properly marking the existing mailboxes
  on a peer as "keep" so build_peer would always delete them all.
* add_peer_mwi_subs was unsubscribing existing mailbox subscriptions
  then just creating them again.
All of this was causing a flood of subscribes and unsubscribes on
multiple threads all for the same peer and mailbox.
Fixes...
* add_peer_mailboxes now marks mailboxes correctly and build_peer only
  deletes the ones that really are no longer needed by the peer.
* add_peer_mwi_subs now only adds subscriptions marked as "new" instead
  of unsubscribing and resubscribing everything.  It also adds the peer
  object's address to the mailbox instead of its name to the subscription
  userdata so mwi_event_cb doesn't have to call build_peer.
With these changes, with rtcachefriends=yes (the most common setting),
there are no leaks, locks, loops or crashes at shutdown.
rtcachefriends=no still causes leaks but at least it doesn't lock, loop
or crash.  Since making rtcachefriends=no work wasnt in scope for this
issue, further work will have to be deferred to a separate patch.
Side fixes...
 * The ast_lock_track structure had a member named "thread" which gdb
   doesn't like since it conflicts with it's "thread" command.  That
   member was renamed to "thread_id".
ASTERISK-25468 #close
Change-Id: I07519ef7f092629e1e844f855abd279d6475cdd0
											
										 
											2016-09-20 08:42:15 -06:00
										 |  |  | 			lt->thread_id[lt->reentrancy] = pthread_self(); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 			lt->reentrancy++; | 
					
						
							|  |  |  | 		} | 
					
						
							|  |  |  | 		ast_reentrancy_unlock(lt); | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 		ast_mark_lock_acquired(t); | 
					
						
							|  |  |  | 	} else if (lt) { | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #ifdef HAVE_BKTR
 | 
					
						
							|  |  |  | 		if (lt->reentrancy) { | 
					
						
							|  |  |  | 			ast_reentrancy_lock(lt); | 
					
						
							|  |  |  | 			bt = <->backtrace[lt->reentrancy-1]; | 
					
						
							|  |  |  | 			ast_reentrancy_unlock(lt); | 
					
						
							|  |  |  | 		} else { | 
					
						
							|  |  |  | 			bt = NULL; | 
					
						
							|  |  |  | 		} | 
					
						
							|  |  |  | #endif
 | 
					
						
							| 
									
										
										
										
											2017-10-23 01:55:18 -04:00
										 |  |  | 		ast_remove_lock_info(t, bt); | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 	} | 
					
						
							|  |  |  | 	if (res) { | 
					
						
							| 
									
										
										
										
											2018-09-28 14:31:37 -04:00
										 |  |  | 		log_mutex_error(canlog, "%s line %d (%s): Error obtaining read lock: %s\n", | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 				filename, line, func, strerror(res)); | 
					
						
							|  |  |  | 		DO_THREAD_CRASH; | 
					
						
							|  |  |  | 	} | 
					
						
							|  |  |  | #endif /* DEBUG_THREADS */
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	return res; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | int __ast_rwlock_tryrdlock(const char *filename, int line, const char *func, ast_rwlock_t *t, const char *name) | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | { | 
					
						
							|  |  |  | 	int res; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #ifdef DEBUG_THREADS
 | 
					
						
							| 
									
										
										
										
											2018-09-27 20:32:21 -04:00
										 |  |  | 	struct ast_lock_track *lt = ast_get_reentrancy(&t->track, &t->flags, 0); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 	struct ast_bt *bt = NULL; | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 	if (lt) { | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #ifdef HAVE_BKTR
 | 
					
						
							| 
									
										
										
										
											2013-09-09 20:13:40 +00:00
										 |  |  | 		struct ast_bt tmp; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 		/* The implementation of backtrace() may have its own locks.
 | 
					
						
							|  |  |  | 		 * Capture the backtrace outside of the reentrancy lock to | 
					
						
							|  |  |  | 		 * avoid deadlocks. See ASTERISK-22455. */ | 
					
						
							|  |  |  | 		ast_bt_get_addresses(&tmp); | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 		ast_reentrancy_lock(lt); | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 		if (lt->reentrancy < AST_MAX_REENTRANCY) { | 
					
						
							| 
									
										
										
										
											2013-09-09 20:13:40 +00:00
										 |  |  | 			lt->backtrace[lt->reentrancy] = tmp; | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 			bt = <->backtrace[lt->reentrancy]; | 
					
						
							|  |  |  | 		} | 
					
						
							|  |  |  | 		ast_reentrancy_unlock(lt); | 
					
						
							|  |  |  | #endif
 | 
					
						
							| 
									
										
										
										
											2017-10-23 01:55:18 -04:00
										 |  |  | 		ast_store_lock_info(AST_RDLOCK, filename, line, func, name, t, bt); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 	} | 
					
						
							|  |  |  | #endif /* DEBUG_THREADS */
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	res = pthread_rwlock_tryrdlock(&t->lock); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #ifdef DEBUG_THREADS
 | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 	if (!res && lt) { | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 		ast_reentrancy_lock(lt); | 
					
						
							|  |  |  | 		if (lt->reentrancy < AST_MAX_REENTRANCY) { | 
					
						
							|  |  |  | 			lt->file[lt->reentrancy] = filename; | 
					
						
							|  |  |  | 			lt->lineno[lt->reentrancy] = line; | 
					
						
							|  |  |  | 			lt->func[lt->reentrancy] = func; | 
					
						
							| 
									
										
											  
											
												chan_sip:  Address runaway when realtime peers subscribe to mailboxes
Users upgrading from asterisk 13.5 to a later version and who use
realtime with peers that have mailboxes were experiencing runaway
situations that manifested as a continuous stream of taskprocessor
congestion errors, memory leaks and an unresponsive chan_sip.
A related issue was that setting rtcachefriends=no NEVER worked in
asterisk 13 (since the move to stasis).  In 13.5 and earlier, when a
peer tried to register, all of the stasis threads would block and
chan_sip would again become unresponsive.  After 13.5, the runaway
would happen.
There were a number of causes...
* mwi_event_cb was (indirectly) calling build_peer even though calls to
  mwi_event_cb are often caused by build_peer.
* In an effort to prevent chan_sip from being unloaded while messages
  were still in flight, destroy_mailboxes was calling
  stasis_unsubscribe_and_join but in some cases waited forever for the
  final message.
* add_peer_mailboxes wasn't properly marking the existing mailboxes
  on a peer as "keep" so build_peer would always delete them all.
* add_peer_mwi_subs was unsubscribing existing mailbox subscriptions
  then just creating them again.
All of this was causing a flood of subscribes and unsubscribes on
multiple threads all for the same peer and mailbox.
Fixes...
* add_peer_mailboxes now marks mailboxes correctly and build_peer only
  deletes the ones that really are no longer needed by the peer.
* add_peer_mwi_subs now only adds subscriptions marked as "new" instead
  of unsubscribing and resubscribing everything.  It also adds the peer
  object's address to the mailbox instead of its name to the subscription
  userdata so mwi_event_cb doesn't have to call build_peer.
With these changes, with rtcachefriends=yes (the most common setting),
there are no leaks, locks, loops or crashes at shutdown.
rtcachefriends=no still causes leaks but at least it doesn't lock, loop
or crash.  Since making rtcachefriends=no work wasnt in scope for this
issue, further work will have to be deferred to a separate patch.
Side fixes...
 * The ast_lock_track structure had a member named "thread" which gdb
   doesn't like since it conflicts with it's "thread" command.  That
   member was renamed to "thread_id".
ASTERISK-25468 #close
Change-Id: I07519ef7f092629e1e844f855abd279d6475cdd0
											
										 
											2016-09-20 08:42:15 -06:00
										 |  |  | 			lt->thread_id[lt->reentrancy] = pthread_self(); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 			lt->reentrancy++; | 
					
						
							|  |  |  | 		} | 
					
						
							|  |  |  | 		ast_reentrancy_unlock(lt); | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 		ast_mark_lock_acquired(t); | 
					
						
							|  |  |  | 	} else if (lt) { | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 		ast_mark_lock_failed(t); | 
					
						
							|  |  |  | 	} | 
					
						
							|  |  |  | #endif /* DEBUG_THREADS */
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	return res; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | int __ast_rwlock_trywrlock(const char *filename, int line, const char *func, ast_rwlock_t *t, const char *name) | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | { | 
					
						
							|  |  |  | 	int res; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #ifdef DEBUG_THREADS
 | 
					
						
							| 
									
										
										
										
											2018-09-27 20:32:21 -04:00
										 |  |  | 	struct ast_lock_track *lt = ast_get_reentrancy(&t->track, &t->flags, 0); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 	struct ast_bt *bt = NULL; | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 	if (lt) { | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | #ifdef HAVE_BKTR
 | 
					
						
							| 
									
										
										
										
											2013-09-09 20:13:40 +00:00
										 |  |  | 		struct ast_bt tmp; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 		/* The implementation of backtrace() may have its own locks.
 | 
					
						
							|  |  |  | 		 * Capture the backtrace outside of the reentrancy lock to | 
					
						
							|  |  |  | 		 * avoid deadlocks. See ASTERISK-22455. */ | 
					
						
							|  |  |  | 		ast_bt_get_addresses(&tmp); | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 		ast_reentrancy_lock(lt); | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 		if (lt->reentrancy < AST_MAX_REENTRANCY) { | 
					
						
							| 
									
										
										
										
											2013-09-09 20:13:40 +00:00
										 |  |  | 			lt->backtrace[lt->reentrancy] = tmp; | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 			bt = <->backtrace[lt->reentrancy]; | 
					
						
							|  |  |  | 		} | 
					
						
							|  |  |  | 		ast_reentrancy_unlock(lt); | 
					
						
							|  |  |  | #endif
 | 
					
						
							| 
									
										
										
										
											2017-10-23 01:55:18 -04:00
										 |  |  | 		ast_store_lock_info(AST_WRLOCK, filename, line, func, name, t, bt); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 	} | 
					
						
							|  |  |  | #endif /* DEBUG_THREADS */
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	res = pthread_rwlock_trywrlock(&t->lock); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #ifdef DEBUG_THREADS
 | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 	if (!res && lt) { | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 		ast_reentrancy_lock(lt); | 
					
						
							|  |  |  | 		if (lt->reentrancy < AST_MAX_REENTRANCY) { | 
					
						
							|  |  |  | 			lt->file[lt->reentrancy] = filename; | 
					
						
							|  |  |  | 			lt->lineno[lt->reentrancy] = line; | 
					
						
							|  |  |  | 			lt->func[lt->reentrancy] = func; | 
					
						
							| 
									
										
											  
											
												chan_sip:  Address runaway when realtime peers subscribe to mailboxes
Users upgrading from asterisk 13.5 to a later version and who use
realtime with peers that have mailboxes were experiencing runaway
situations that manifested as a continuous stream of taskprocessor
congestion errors, memory leaks and an unresponsive chan_sip.
A related issue was that setting rtcachefriends=no NEVER worked in
asterisk 13 (since the move to stasis).  In 13.5 and earlier, when a
peer tried to register, all of the stasis threads would block and
chan_sip would again become unresponsive.  After 13.5, the runaway
would happen.
There were a number of causes...
* mwi_event_cb was (indirectly) calling build_peer even though calls to
  mwi_event_cb are often caused by build_peer.
* In an effort to prevent chan_sip from being unloaded while messages
  were still in flight, destroy_mailboxes was calling
  stasis_unsubscribe_and_join but in some cases waited forever for the
  final message.
* add_peer_mailboxes wasn't properly marking the existing mailboxes
  on a peer as "keep" so build_peer would always delete them all.
* add_peer_mwi_subs was unsubscribing existing mailbox subscriptions
  then just creating them again.
All of this was causing a flood of subscribes and unsubscribes on
multiple threads all for the same peer and mailbox.
Fixes...
* add_peer_mailboxes now marks mailboxes correctly and build_peer only
  deletes the ones that really are no longer needed by the peer.
* add_peer_mwi_subs now only adds subscriptions marked as "new" instead
  of unsubscribing and resubscribing everything.  It also adds the peer
  object's address to the mailbox instead of its name to the subscription
  userdata so mwi_event_cb doesn't have to call build_peer.
With these changes, with rtcachefriends=yes (the most common setting),
there are no leaks, locks, loops or crashes at shutdown.
rtcachefriends=no still causes leaks but at least it doesn't lock, loop
or crash.  Since making rtcachefriends=no work wasnt in scope for this
issue, further work will have to be deferred to a separate patch.
Side fixes...
 * The ast_lock_track structure had a member named "thread" which gdb
   doesn't like since it conflicts with it's "thread" command.  That
   member was renamed to "thread_id".
ASTERISK-25468 #close
Change-Id: I07519ef7f092629e1e844f855abd279d6475cdd0
											
										 
											2016-09-20 08:42:15 -06:00
										 |  |  | 			lt->thread_id[lt->reentrancy] = pthread_self(); | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 			lt->reentrancy++; | 
					
						
							|  |  |  | 		} | 
					
						
							|  |  |  | 		ast_reentrancy_unlock(lt); | 
					
						
							| 
									
										
										
										
											2011-01-31 06:50:49 +00:00
										 |  |  | 		ast_mark_lock_acquired(t); | 
					
						
							| 
									
										
										
										
											2014-12-12 23:49:36 +00:00
										 |  |  | 	} else if (lt) { | 
					
						
							| 
									
										
										
										
											2010-04-22 19:08:01 +00:00
										 |  |  | 		ast_mark_lock_failed(t); | 
					
						
							|  |  |  | 	} | 
					
						
							|  |  |  | #endif /* DEBUG_THREADS */
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	return res; | 
					
						
							|  |  |  | } |