| 
									
										
										
										
											2007-12-18 23:06:05 +00:00
										 |  |  | /*
 | 
					
						
							|  |  |  |  * Asterisk -- An open source telephony toolkit. | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * Copyright (C) 2007, Digium, Inc. | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * Tilghman Lesher <tlesher AT digium DOT com> | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * See http://www.asterisk.org for more information about
 | 
					
						
							|  |  |  |  * the Asterisk project. Please do not directly contact | 
					
						
							|  |  |  |  * any of the maintainers of this project for assistance; | 
					
						
							|  |  |  |  * the project provides a web site, mailing lists and IRC | 
					
						
							|  |  |  |  * channels for your use. | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * This program is free software, distributed under the terms of | 
					
						
							|  |  |  |  * the GNU General Public License Version 2. See the LICENSE file | 
					
						
							|  |  |  |  * at the top of the source tree. | 
					
						
							|  |  |  |  */ | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2011-07-14 20:28:54 +00:00
										 |  |  | /*** MODULEINFO
 | 
					
						
							|  |  |  | 	<support_level>core</support_level> | 
					
						
							|  |  |  |  ***/ | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2007-12-18 23:06:05 +00:00
										 |  |  | #include <sys/types.h>
 | 
					
						
							|  |  |  | #include <sys/stat.h>
 | 
					
						
							|  |  |  | #include <sys/time.h>
 | 
					
						
							|  |  |  | #include <sys/resource.h>
 | 
					
						
							|  |  |  | #include <utime.h>
 | 
					
						
							|  |  |  | #include <fcntl.h>
 | 
					
						
							|  |  |  | #include <unistd.h>
 | 
					
						
							|  |  |  | #include <stdlib.h>
 | 
					
						
							| 
									
										
										
										
											2008-05-18 21:15:58 +00:00
										 |  |  | #include <string.h>
 | 
					
						
							| 
									
										
										
										
											2010-01-15 21:42:36 +00:00
										 |  |  | #include <stdio.h>
 | 
					
						
							| 
									
										
										
										
											2007-12-18 23:06:05 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  | /*!\brief
 | 
					
						
							|  |  |  |  * At one time, canaries were carried along with coal miners down | 
					
						
							|  |  |  |  * into a mine.  Their purpose was to alert the miners when they | 
					
						
							|  |  |  |  * had drilled into a pocket of methane gas or another noxious | 
					
						
							| 
									
										
										
										
											2009-02-24 17:51:36 +00:00
										 |  |  |  * substance.  The canary, being the most sensitive animal, would | 
					
						
							| 
									
										
										
										
											2007-12-18 23:06:05 +00:00
										 |  |  |  * immediately fall over.  Seeing this, the miners could take | 
					
						
							|  |  |  |  * action to escape the mine, seeing an imminent danger. | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * This process serves a similar purpose, though with the realtime | 
					
						
							|  |  |  |  * priority being the reason.  When a thread starts running away | 
					
						
							|  |  |  |  * with the processor, it is typically difficult to tell what | 
					
						
							|  |  |  |  * thread caused the problem, as the machine acts as if it is | 
					
						
							|  |  |  |  * locked up (in fact, what has happened is that Asterisk runs at | 
					
						
							|  |  |  |  * a higher priority than even the login shell, so the runaway | 
					
						
							|  |  |  |  * thread hogs all available CPU time). | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * If that happens, this canary process will cease to get any | 
					
						
							|  |  |  |  * process time, which we can monitor with a realtime thread in | 
					
						
							|  |  |  |  * Asterisk.  Should that happen, that monitoring thread may take | 
					
						
							|  |  |  |  * immediate action to slow down Asterisk to regular priority, | 
					
						
							|  |  |  |  * thus allowing an administrator to login to the system and | 
					
						
							|  |  |  |  * restart Asterisk or perhaps take another course of action | 
					
						
							|  |  |  |  * (such as retrieving a backtrace to let the developers know | 
					
						
							|  |  |  |  * what precisely went wrong). | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * Note that according to POSIX.1, all threads inside a single | 
					
						
							|  |  |  |  * process must share the same priority, so when the monitoring | 
					
						
							|  |  |  |  * thread deprioritizes itself, it deprioritizes all threads at | 
					
						
							|  |  |  |  * the same time.  This is also why this canary must exist as a | 
					
						
							|  |  |  |  * completely separate process and not simply as a thread within | 
					
						
							|  |  |  |  * Asterisk itself. | 
					
						
							| 
									
										
										
										
											2009-02-24 17:51:36 +00:00
										 |  |  |  * | 
					
						
							|  |  |  |  * Quote: | 
					
						
							|  |  |  |  * "The nice value set with setpriority() shall be applied to the | 
					
						
							|  |  |  |  * process. If the process is multi-threaded, the nice value shall | 
					
						
							|  |  |  |  * affect all system scope threads in the process." | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * Source: | 
					
						
							|  |  |  |  * http://www.opengroup.org/onlinepubs/000095399/functions/setpriority.html
 | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * In answer to the question, what aren't system scope threads, the | 
					
						
							|  |  |  |  * answer is, in Asterisk, nothing.  Process scope threads are the | 
					
						
							|  |  |  |  * alternative, but they aren't supported in Linux. | 
					
						
							| 
									
										
										
										
											2007-12-18 23:06:05 +00:00
										 |  |  |  */ | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2008-10-30 16:49:02 +00:00
										 |  |  | static const char explanation[] = | 
					
						
							| 
									
										
										
										
											2008-05-18 21:15:58 +00:00
										 |  |  | "This file is created when Asterisk is run with a realtime priority (-p).  It\n" | 
					
						
							|  |  |  | "must continue to exist, and the astcanary process must be allowed to continue\n" | 
					
						
							|  |  |  | "running, or else the Asterisk process will, within a short period of time,\n" | 
					
						
							|  |  |  | "slow itself down to regular priority.\n\n" | 
					
						
							|  |  |  | "The technical explanation for this file is to provide an assurance to Asterisk\n" | 
					
						
							|  |  |  | "that there are no threads that have gone into runaway mode, thus hogging the\n" | 
					
						
							|  |  |  | "CPU, and making the Asterisk machine seem to be unresponsive.  When that\n" | 
					
						
							|  |  |  | "happens, the astcanary process will be unable to update the timestamp on this\n" | 
					
						
							|  |  |  | "file, and Asterisk will notice within 120 seconds and react.  Slowing the\n" | 
					
						
							|  |  |  | "Asterisk process down to regular priority will permit an administrator to\n" | 
					
						
							|  |  |  | "intervene, thus avoiding a need to reboot the entire machine.\n"; | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2007-12-18 23:06:05 +00:00
										 |  |  | int main(int argc, char *argv[]) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  | 	int fd; | 
					
						
							| 
									
										
										
										
											2010-01-15 21:40:14 +00:00
										 |  |  | 	pid_t parent; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	if (argc < 3) { | 
					
						
							|  |  |  | 		fprintf(stderr, "Usage: %s <monitor-filename> <ppid>\n", argv[0]); | 
					
						
							|  |  |  | 		exit(1); | 
					
						
							|  |  |  | 	} | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2007-12-18 23:06:05 +00:00
										 |  |  | 	/* Run at normal priority */ | 
					
						
							|  |  |  | 	setpriority(PRIO_PROCESS, 0, 0); | 
					
						
							| 
									
										
										
										
											2010-01-15 21:40:14 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  | 	/*!\note
 | 
					
						
							|  |  |  | 	 * See http://www.opengroup.org/onlinepubs/009695399/basedefs/xbd_chap03.html#tag_03_265
 | 
					
						
							|  |  |  | 	 * for a justification of this approach.  The PPID after the creator dies in Linux and | 
					
						
							|  |  |  | 	 * most other Unix-like systems will be 1, but this is not strictly the case.  The POSIX | 
					
						
							|  |  |  | 	 * specification allows it to be an implementation-defined system process.  However, it | 
					
						
							|  |  |  | 	 * most certainly will not be the original parent PID, which makes the following code | 
					
						
							|  |  |  | 	 * POSIX-compliant. | 
					
						
							|  |  |  | 	 */ | 
					
						
							|  |  |  | 	for (parent = atoi(argv[2]); parent == getppid() ;) { | 
					
						
							| 
									
										
										
										
											2007-12-18 23:06:05 +00:00
										 |  |  | 		/* Update the modification times (checked from Asterisk) */ | 
					
						
							|  |  |  | 		if (utime(argv[1], NULL)) { | 
					
						
							|  |  |  | 			/* Recreate the file if it doesn't exist */ | 
					
						
							| 
									
										
										
										
											2008-05-18 21:15:58 +00:00
										 |  |  | 			if ((fd = open(argv[1], O_RDWR | O_TRUNC | O_CREAT, 0777)) > -1) { | 
					
						
							| 
									
										
										
										
											2008-11-02 18:52:13 +00:00
										 |  |  | 				if (write(fd, explanation, strlen(explanation)) < 0) { | 
					
						
							|  |  |  | 					exit(1); | 
					
						
							|  |  |  | 				} | 
					
						
							| 
									
										
										
										
											2007-12-18 23:06:05 +00:00
										 |  |  | 				close(fd); | 
					
						
							| 
									
										
										
										
											2008-05-18 21:15:58 +00:00
										 |  |  | 			} else { | 
					
						
							| 
									
										
										
										
											2007-12-18 23:06:05 +00:00
										 |  |  | 				exit(1); | 
					
						
							| 
									
										
										
										
											2008-05-18 21:15:58 +00:00
										 |  |  | 			} | 
					
						
							| 
									
										
										
										
											2007-12-18 23:06:05 +00:00
										 |  |  | 			continue; | 
					
						
							|  |  |  | 		} | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 		/* Run occasionally */ | 
					
						
							|  |  |  | 		sleep(5); | 
					
						
							|  |  |  | 	} | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-01-15 21:40:14 +00:00
										 |  |  | 	/* Exit when the parent dies */ | 
					
						
							| 
									
										
										
										
											2007-12-18 23:06:05 +00:00
										 |  |  | 	return 0; | 
					
						
							|  |  |  | } |