Home | History | Annotate | Line # | Download | only in sysmon
sysmon_wdog.c revision 1.21
      1 /*	$NetBSD: sysmon_wdog.c,v 1.21 2007/09/02 00:44:07 xtraeme Exp $	*/
      2 
      3 /*-
      4  * Copyright (c) 2000 Zembu Labs, Inc.
      5  * All rights reserved.
      6  *
      7  * Author: Jason R. Thorpe <thorpej (at) zembu.com>
      8  *
      9  * Redistribution and use in source and binary forms, with or without
     10  * modification, are permitted provided that the following conditions
     11  * are met:
     12  * 1. Redistributions of source code must retain the above copyright
     13  *    notice, this list of conditions and the following disclaimer.
     14  * 2. Redistributions in binary form must reproduce the above copyright
     15  *    notice, this list of conditions and the following disclaimer in the
     16  *    documentation and/or other materials provided with the distribution.
     17  * 3. All advertising materials mentioning features or use of this software
     18  *    must display the following acknowledgement:
     19  *	This product includes software developed by Zembu Labs, Inc.
     20  * 4. Neither the name of Zembu Labs nor the names of its employees may
     21  *    be used to endorse or promote products derived from this software
     22  *    without specific prior written permission.
     23  *
     24  * THIS SOFTWARE IS PROVIDED BY ZEMBU LABS, INC. ``AS IS'' AND ANY EXPRESS
     25  * OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WAR-
     26  * RANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DIS-
     27  * CLAIMED.  IN NO EVENT SHALL ZEMBU LABS BE LIABLE FOR ANY DIRECT, INDIRECT,
     28  * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
     29  * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
     30  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
     31  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
     32  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
     33  * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
     34  */
     35 
     36 /*
     37  * Watchdog timer framework for sysmon.  Hardware (and software)
     38  * watchdog timers can register themselves here to provide a
     39  * watchdog function, which provides an abstract interface to the
     40  * user.
     41  */
     42 
     43 #include <sys/cdefs.h>
     44 __KERNEL_RCSID(0, "$NetBSD: sysmon_wdog.c,v 1.21 2007/09/02 00:44:07 xtraeme Exp $");
     45 
     46 #include <sys/param.h>
     47 #include <sys/conf.h>
     48 #include <sys/errno.h>
     49 #include <sys/fcntl.h>
     50 #include <sys/mutex.h>
     51 #include <sys/callout.h>
     52 #include <sys/kernel.h>
     53 #include <sys/systm.h>
     54 #include <sys/proc.h>
     55 
     56 #include <dev/sysmon/sysmonvar.h>
     57 
/* List of registered watchdogs; walked and modified under sysmon_wdog_list_mtx. */
static LIST_HEAD(, sysmon_wdog) sysmon_wdog_list =
    LIST_HEAD_INITIALIZER(&sysmon_wdog_list);
/* Number of watchdogs currently on sysmon_wdog_list. */
static int sysmon_wdog_count;
/*
 * sysmon_wdog_list_mtx: held around list/count updates and lookups.
 * sysmon_wdog_mtx: spin mutex taken by the close, ioctl and kernel-tickle
 * paths around accesses to sysmon_armed_wdog.
 */
static kmutex_t sysmon_wdog_list_mtx, sysmon_wdog_mtx;
/* The watchdog that is currently armed, or NULL when none is. */
static struct sysmon_wdog *sysmon_armed_wdog;
/* Callout that drives sysmon_wdog_ktickle() in KTICKLE mode. */
static callout_t sysmon_wdog_callout;
/* Cookie returned by shutdownhook_establish(); NULL until established. */
static void *sysmon_wdog_sdhook;

/* Forward declarations for routines defined later in this file. */
struct sysmon_wdog *sysmon_wdog_find(const char *);
void	sysmon_wdog_release(struct sysmon_wdog *);
int	sysmon_wdog_setmode(struct sysmon_wdog *, int, u_int);
void	sysmon_wdog_ktickle(void *);
void	sysmon_wdog_shutdown(void *);
     71 
     72 void
     73 sysmon_wdog_init(void)
     74 {
     75 	mutex_init(&sysmon_wdog_list_mtx, MUTEX_DEFAULT, IPL_NONE);
     76 	mutex_init(&sysmon_wdog_mtx, MUTEX_SPIN, IPL_SOFTCLOCK);
     77 }
     78 
     79 /*
     80  * sysmonopen_wdog:
     81  *
     82  *	Open the system monitor device.
     83  */
     84 int
     85 sysmonopen_wdog(dev_t dev, int flag, int mode, struct lwp *l)
     86 {
     87 
     88 	mutex_enter(&sysmon_wdog_list_mtx);
     89 	if (sysmon_wdog_sdhook == NULL) {
     90 		sysmon_wdog_sdhook =
     91 		    shutdownhook_establish(sysmon_wdog_shutdown, NULL);
     92 		if (sysmon_wdog_sdhook == NULL)
     93 			printf("WARNING: unable to register watchdog "
     94 			    "shutdown hook\n");
     95 		callout_init(&sysmon_wdog_callout, 0);
     96 	}
     97 	mutex_exit(&sysmon_wdog_list_mtx);
     98 
     99 	return 0;
    100 }
    101 
    102 /*
    103  * sysmonclose_wdog:
    104  *
    105  *	Close the system monitor device.
    106  */
    107 int
    108 sysmonclose_wdog(dev_t dev, int flag, int mode, struct lwp *l)
    109 {
    110 	struct sysmon_wdog *smw;
    111 	int error = 0;
    112 
    113 	/*
    114 	 * If this is the last close, and there is a watchdog
    115 	 * running in UTICKLE mode, we need to disable it,
    116 	 * otherwise the system will reset in short order.
    117 	 *
    118 	 * XXX Maybe we should just go into KTICKLE mode?
    119 	 */
    120 	mutex_enter(&sysmon_wdog_mtx);
    121 	if ((smw = sysmon_armed_wdog) != NULL) {
    122 		if ((smw->smw_mode & WDOG_MODE_MASK) == WDOG_MODE_UTICKLE) {
    123 			error = sysmon_wdog_setmode(smw,
    124 			    WDOG_MODE_DISARMED, smw->smw_period);
    125 			if (error) {
    126 				printf("WARNING: UNABLE TO DISARM "
    127 				    "WATCHDOG %s ON CLOSE!\n",
    128 				    smw->smw_name);
    129 				/*
    130 				 * ...we will probably reboot soon.
    131 				 */
    132 			}
    133 		}
    134 	}
    135 	mutex_exit(&sysmon_wdog_mtx);
    136 
    137 	return error;
    138 }
    139 
    140 /*
    141  * sysmonioctl_wdog:
    142  *
    143  *	Perform a watchdog control request.
    144  */
    145 int
    146 sysmonioctl_wdog(dev_t dev, u_long cmd, void *data, int flag, struct lwp *l)
    147 {
    148 	struct sysmon_wdog *smw;
    149 	int error = 0;
    150 
    151 	switch (cmd) {
    152 	case WDOGIOC_GMODE:
    153 	    {
    154 		struct wdog_mode *wm = (void *) data;
    155 
    156 		wm->wm_name[sizeof(wm->wm_name) - 1] = '\0';
    157 		smw = sysmon_wdog_find(wm->wm_name);
    158 		if (smw == NULL) {
    159 			error = ESRCH;
    160 			break;
    161 		}
    162 
    163 		wm->wm_mode = smw->smw_mode;
    164 		wm->wm_period = smw->smw_period;
    165 		sysmon_wdog_release(smw);
    166 		break;
    167 	    }
    168 
    169 	case WDOGIOC_SMODE:
    170 	    {
    171 		struct wdog_mode *wm = (void *) data;
    172 
    173 		if ((flag & FWRITE) == 0) {
    174 			error = EPERM;
    175 			break;
    176 		}
    177 
    178 		wm->wm_name[sizeof(wm->wm_name) - 1] = '\0';
    179 		smw = sysmon_wdog_find(wm->wm_name);
    180 		if (smw == NULL) {
    181 			error = ESRCH;
    182 			break;
    183 		}
    184 
    185 		if (wm->wm_mode & ~(WDOG_MODE_MASK|WDOG_FEATURE_MASK))
    186 			error = EINVAL;
    187 		else {
    188 			mutex_enter(&sysmon_wdog_mtx);
    189 			error = sysmon_wdog_setmode(smw, wm->wm_mode,
    190 			    wm->wm_period);
    191 			mutex_exit(&sysmon_wdog_mtx);
    192 		}
    193 
    194 		sysmon_wdog_release(smw);
    195 		break;
    196 	    }
    197 
    198 	case WDOGIOC_WHICH:
    199 	    {
    200 		struct wdog_mode *wm = (void *) data;
    201 
    202 		mutex_enter(&sysmon_wdog_mtx);
    203 		if ((smw = sysmon_armed_wdog) != NULL) {
    204 			strcpy(wm->wm_name, smw->smw_name);
    205 			wm->wm_mode = smw->smw_mode;
    206 			wm->wm_period = smw->smw_period;
    207 		} else
    208 			error = ESRCH;
    209 		mutex_exit(&sysmon_wdog_mtx);
    210 		break;
    211 	    }
    212 
    213 	case WDOGIOC_TICKLE:
    214 		if ((flag & FWRITE) == 0) {
    215 			error = EPERM;
    216 			break;
    217 		}
    218 
    219 		mutex_enter(&sysmon_wdog_mtx);
    220 		if ((smw = sysmon_armed_wdog) != NULL) {
    221 			error = (*smw->smw_tickle)(smw);
    222 			if (error == 0)
    223 				smw->smw_tickler = l->l_proc->p_pid;
    224 		} else
    225 			error = ESRCH;
    226 		mutex_exit(&sysmon_wdog_mtx);
    227 		break;
    228 
    229 	case WDOGIOC_GTICKLER:
    230 		if ((smw = sysmon_armed_wdog) != NULL)
    231 			*(pid_t *)data = smw->smw_tickler;
    232 		else
    233 			error = ESRCH;
    234 		break;
    235 
    236 	case WDOGIOC_GWDOGS:
    237 	    {
    238 		struct wdog_conf *wc = (void *) data;
    239 		char *cp;
    240 		int i;
    241 
    242 		mutex_enter(&sysmon_wdog_list_mtx);
    243 		if (wc->wc_names == NULL)
    244 			wc->wc_count = sysmon_wdog_count;
    245 		else {
    246 			for (i = 0, cp = wc->wc_names,
    247 			       smw = LIST_FIRST(&sysmon_wdog_list);
    248 			     i < sysmon_wdog_count && smw != NULL && error == 0;
    249 			     i++, cp += WDOG_NAMESIZE,
    250 			       smw = LIST_NEXT(smw, smw_list))
    251 				error = copyout(smw->smw_name, cp,
    252 				    strlen(smw->smw_name) + 1);
    253 			wc->wc_count = i;
    254 		}
    255 		mutex_exit(&sysmon_wdog_list_mtx);
    256 		break;
    257 	    }
    258 
    259 	default:
    260 		error = ENOTTY;
    261 	}
    262 
    263 	return error;
    264 }
    265 
    266 /*
    267  * sysmon_wdog_register:
    268  *
    269  *	Register a watchdog device.
    270  */
    271 int
    272 sysmon_wdog_register(struct sysmon_wdog *smw)
    273 {
    274 	struct sysmon_wdog *lsmw;
    275 	int error = 0;
    276 
    277 	mutex_enter(&sysmon_wdog_list_mtx);
    278 
    279 	for (lsmw = LIST_FIRST(&sysmon_wdog_list); lsmw != NULL;
    280 	     lsmw = LIST_NEXT(lsmw, smw_list)) {
    281 		if (strcmp(lsmw->smw_name, smw->smw_name) == 0) {
    282 			error = EEXIST;
    283 			goto out;
    284 		}
    285 	}
    286 
    287 	smw->smw_mode = WDOG_MODE_DISARMED;
    288 	smw->smw_tickler = (pid_t) -1;
    289 	smw->smw_refcnt = 0;
    290 	sysmon_wdog_count++;
    291 	LIST_INSERT_HEAD(&sysmon_wdog_list, smw, smw_list);
    292 
    293  out:
    294 	mutex_exit(&sysmon_wdog_list_mtx);
    295 	return error;
    296 }
    297 
    298 /*
    299  * sysmon_wdog_unregister:
    300  *
    301  *	Unregister a watchdog device.
    302  */
    303 void
    304 sysmon_wdog_unregister(struct sysmon_wdog *smw)
    305 {
    306 
    307 	mutex_enter(&sysmon_wdog_list_mtx);
    308 	sysmon_wdog_count--;
    309 	LIST_REMOVE(smw, smw_list);
    310 	mutex_exit(&sysmon_wdog_list_mtx);
    311 }
    312 
    313 /*
    314  * sysmon_wdog_find:
    315  *
    316  *	Find a watchdog device.  We increase the reference
    317  *	count on a match.
    318  */
    319 struct sysmon_wdog *
    320 sysmon_wdog_find(const char *name)
    321 {
    322 	struct sysmon_wdog *smw;
    323 
    324 	mutex_enter(&sysmon_wdog_list_mtx);
    325 
    326 	for (smw = LIST_FIRST(&sysmon_wdog_list); smw != NULL;
    327 	     smw = LIST_NEXT(smw, smw_list)) {
    328 		if (strcmp(smw->smw_name, name) == 0)
    329 			break;
    330 	}
    331 
    332 	if (smw != NULL)
    333 		smw->smw_refcnt++;
    334 
    335 	mutex_exit(&sysmon_wdog_list_mtx);
    336 	return smw;
    337 }
    338 
    339 /*
    340  * sysmon_wdog_release:
    341  *
    342  *	Release a watchdog device.
    343  */
    344 void
    345 sysmon_wdog_release(struct sysmon_wdog *smw)
    346 {
    347 
    348 	mutex_enter(&sysmon_wdog_list_mtx);
    349 	KASSERT(smw->smw_refcnt != 0);
    350 	smw->smw_refcnt--;
    351 	mutex_exit(&sysmon_wdog_list_mtx);
    352 }
    353 
    354 /*
    355  * sysmon_wdog_setmode:
    356  *
    357  *	Set the mode of a watchdog device.
    358  */
    359 int
    360 sysmon_wdog_setmode(struct sysmon_wdog *smw, int mode, u_int period)
    361 {
    362 	u_int operiod = smw->smw_period;
    363 	int omode = smw->smw_mode;
    364 	int error = 0;
    365 
    366 	smw->smw_period = period;
    367 	smw->smw_mode = mode;
    368 
    369 	switch (mode & WDOG_MODE_MASK) {
    370 	case WDOG_MODE_DISARMED:
    371 		if (smw != sysmon_armed_wdog) {
    372 			error = EINVAL;
    373 			goto out;
    374 		}
    375 		break;
    376 
    377 	case WDOG_MODE_KTICKLE:
    378 	case WDOG_MODE_UTICKLE:
    379 	case WDOG_MODE_ETICKLE:
    380 		if (sysmon_armed_wdog != NULL) {
    381 			error = EBUSY;
    382 			goto out;
    383 		}
    384 		break;
    385 
    386 	default:
    387 		error = EINVAL;
    388 		goto out;
    389 	}
    390 
    391 	error = (*smw->smw_setmode)(smw);
    392 
    393  out:
    394 	if (error) {
    395 		smw->smw_period = operiod;
    396 		smw->smw_mode = omode;
    397 	} else {
    398 		if ((mode & WDOG_MODE_MASK) == WDOG_MODE_DISARMED) {
    399 			sysmon_armed_wdog = NULL;
    400 			smw->smw_tickler = (pid_t) -1;
    401 			smw->smw_refcnt--;
    402 			if ((omode & WDOG_MODE_MASK) == WDOG_MODE_KTICKLE)
    403 				callout_stop(&sysmon_wdog_callout);
    404 		} else {
    405 			sysmon_armed_wdog = smw;
    406 			smw->smw_refcnt++;
    407 			if ((mode & WDOG_MODE_MASK) == WDOG_MODE_KTICKLE) {
    408 				callout_reset(&sysmon_wdog_callout,
    409 				    WDOG_PERIOD_TO_TICKS(smw->smw_period) / 2,
    410 				    sysmon_wdog_ktickle, NULL);
    411 			}
    412 		}
    413 	}
    414 	return error;
    415 }
    416 
    417 /*
    418  * sysmon_wdog_ktickle:
    419  *
    420  *	Kernel watchdog tickle routine.
    421  */
    422 void
    423 sysmon_wdog_ktickle(void *arg)
    424 {
    425 	struct sysmon_wdog *smw;
    426 
    427 	mutex_enter(&sysmon_wdog_mtx);
    428 	if ((smw = sysmon_armed_wdog) != NULL) {
    429 		if ((*smw->smw_tickle)(smw) != 0) {
    430 			printf("WARNING: KERNEL TICKLE OF WATCHDOG %s "
    431 			    "FAILED!\n", smw->smw_name);
    432 			/*
    433 			 * ...we will probably reboot soon.
    434 			 */
    435 		}
    436 		callout_reset(&sysmon_wdog_callout,
    437 		    WDOG_PERIOD_TO_TICKS(smw->smw_period) / 2,
    438 		    sysmon_wdog_ktickle, NULL);
    439 	}
    440 	mutex_exit(&sysmon_wdog_mtx);
    441 }
    442 
    443 /*
    444  * sysmon_wdog_shutdown:
    445  *
    446  *	Perform shutdown-time operations.
    447  */
    448 void
    449 sysmon_wdog_shutdown(void *arg)
    450 {
    451 	struct sysmon_wdog *smw;
    452 
    453 	/*
    454 	 * XXX Locking here?  I don't think it's necessary.
    455 	 */
    456 
    457 	if ((smw = sysmon_armed_wdog) != NULL) {
    458 		if (sysmon_wdog_setmode(smw, WDOG_MODE_DISARMED,
    459 		    smw->smw_period))
    460 			printf("WARNING: FAILED TO SHUTDOWN WATCHDOG %s!\n",
    461 			    smw->smw_name);
    462 	}
    463 }
    464