Home | History | Annotate | Line # | Download | only in kern
subr_iostat.c revision 1.17
      1  1.17        ad /*	$NetBSD: subr_iostat.c,v 1.17 2009/04/04 07:30:10 ad Exp $	*/
      2   1.1     blymn /*	NetBSD: subr_disk.c,v 1.69 2005/05/29 22:24:15 christos Exp	*/
      3   1.1     blymn 
      4   1.1     blymn /*-
      5  1.17        ad  * Copyright (c) 1996, 1997, 1999, 2000, 2009 The NetBSD Foundation, Inc.
      6   1.1     blymn  * All rights reserved.
      7   1.1     blymn  *
      8   1.1     blymn  * This code is derived from software contributed to The NetBSD Foundation
      9   1.1     blymn  * by Jason R. Thorpe of the Numerical Aerospace Simulation Facility,
     10   1.1     blymn  * NASA Ames Research Center.
     11   1.1     blymn  *
     12   1.1     blymn  * Redistribution and use in source and binary forms, with or without
     13   1.1     blymn  * modification, are permitted provided that the following conditions
     14   1.1     blymn  * are met:
     15   1.1     blymn  * 1. Redistributions of source code must retain the above copyright
     16   1.1     blymn  *    notice, this list of conditions and the following disclaimer.
     17   1.1     blymn  * 2. Redistributions in binary form must reproduce the above copyright
     18   1.1     blymn  *    notice, this list of conditions and the following disclaimer in the
     19   1.1     blymn  *    documentation and/or other materials provided with the distribution.
     20   1.1     blymn  *
     21   1.1     blymn  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     22   1.1     blymn  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     23   1.1     blymn  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     24   1.1     blymn  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     25   1.1     blymn  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     26   1.1     blymn  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     27   1.1     blymn  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     28   1.1     blymn  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     29   1.1     blymn  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     30   1.1     blymn  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     31   1.1     blymn  * POSSIBILITY OF SUCH DAMAGE.
     32   1.1     blymn  */
     33   1.1     blymn 
     34   1.1     blymn /*
     35   1.1     blymn  * Copyright (c) 1982, 1986, 1988, 1993
     36   1.1     blymn  *	The Regents of the University of California.  All rights reserved.
     37   1.1     blymn  * (c) UNIX System Laboratories, Inc.
     38   1.1     blymn  * All or some portions of this file are derived from material licensed
     39   1.1     blymn  * to the University of California by American Telephone and Telegraph
     40   1.1     blymn  * Co. or Unix System Laboratories, Inc. and are reproduced herein with
     41   1.1     blymn  * the permission of UNIX System Laboratories, Inc.
     42   1.1     blymn  *
     43   1.1     blymn  * Redistribution and use in source and binary forms, with or without
     44   1.1     blymn  * modification, are permitted provided that the following conditions
     45   1.1     blymn  * are met:
     46   1.1     blymn  * 1. Redistributions of source code must retain the above copyright
     47   1.1     blymn  *    notice, this list of conditions and the following disclaimer.
     48   1.1     blymn  * 2. Redistributions in binary form must reproduce the above copyright
     49   1.1     blymn  *    notice, this list of conditions and the following disclaimer in the
     50   1.1     blymn  *    documentation and/or other materials provided with the distribution.
     51   1.1     blymn  * 3. Neither the name of the University nor the names of its contributors
     52   1.1     blymn  *    may be used to endorse or promote products derived from this software
     53   1.1     blymn  *    without specific prior written permission.
     54   1.1     blymn  *
     55   1.1     blymn  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
     56   1.1     blymn  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     57   1.1     blymn  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     58   1.1     blymn  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
     59   1.1     blymn  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     60   1.1     blymn  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     61   1.1     blymn  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     62   1.1     blymn  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     63   1.1     blymn  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     64   1.1     blymn  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     65   1.1     blymn  * SUCH DAMAGE.
     66   1.1     blymn  *
     67   1.1     blymn  *	@(#)ufs_disksubr.c	8.5 (Berkeley) 1/21/94
     68   1.1     blymn  */
     69   1.1     blymn 
     70   1.1     blymn #include <sys/cdefs.h>
     71  1.17        ad __KERNEL_RCSID(0, "$NetBSD: subr_iostat.c,v 1.17 2009/04/04 07:30:10 ad Exp $");
     72   1.1     blymn 
     73   1.1     blymn #include <sys/param.h>
     74   1.1     blymn #include <sys/kernel.h>
     75  1.16      yamt #include <sys/kmem.h>
     76   1.6      yamt #include <sys/iostat.h>
     77   1.1     blymn #include <sys/sysctl.h>
     78  1.13        ad #include <sys/rwlock.h>
     79   1.1     blymn 
     80   1.1     blymn /*
     81   1.1     blymn  * Function prototypes for sysctl nodes
     82   1.1     blymn  */
     83   1.1     blymn static int	sysctl_hw_disknames(SYSCTLFN_PROTO);
     84   1.1     blymn static int	sysctl_hw_iostatnames(SYSCTLFN_PROTO);
     85   1.1     blymn static int	sysctl_hw_iostats(SYSCTLFN_PROTO);
     86   1.1     blymn 
     87   1.1     blymn static int
     88   1.1     blymn iostati_getnames(int disk_only, char *oldp, size_t *oldlenp, const void *newp,
     89   1.1     blymn 		u_int namelen);
     90   1.1     blymn 
     91   1.1     blymn /*
     92   1.1     blymn  * Global list of every iostat record currently registered, together
     93   1.1     blymn  * with a count of its entries.  Records are appended by iostat_alloc()
     93   1.1     blymn  * and unlinked by iostat_free(), so the list may grow or shrink over
     93   1.1     blymn  * time.  Both the list and the count are modified only while
     93   1.1     blymn  * iostatlist_lock is held as a writer.
     94   1.1     blymn  */
     95   1.3      yamt struct iostatlist_head iostatlist = TAILQ_HEAD_INITIALIZER(iostatlist);
     96   1.3      yamt int iostat_count;		/* number of entries linked on iostatlist */
     97  1.13        ad krwlock_t iostatlist_lock;
     98  1.12        ad 
     99  1.12        ad /*
    100  1.12        ad  * Initialise the iostat subsystem.
    101  1.12        ad  */
    102  1.12        ad void
    103  1.12        ad iostat_init(void)
    104  1.12        ad {
    105  1.12        ad 
    106  1.13        ad 	rw_init(&iostatlist_lock);
    107  1.12        ad }
    108   1.1     blymn 
    109   1.1     blymn /*
    110   1.1     blymn  * Searches the iostatlist for the iostat corresponding to the
    111   1.1     blymn  * name provided.
    112   1.1     blymn  */
    113   1.1     blymn struct io_stats *
    114   1.8      yamt iostat_find(const char *name)
    115   1.1     blymn {
    116   1.1     blymn 	struct io_stats *iostatp;
    117   1.1     blymn 
    118   1.8      yamt 	KASSERT(name != NULL);
    119   1.1     blymn 
    120  1.13        ad 	rw_enter(&iostatlist_lock, RW_READER);
    121   1.8      yamt 	TAILQ_FOREACH(iostatp, &iostatlist, io_link) {
    122   1.2     blymn 		if (strcmp(iostatp->io_name, name) == 0) {
    123   1.8      yamt 			break;
    124   1.1     blymn 		}
    125   1.8      yamt 	}
    126  1.13        ad 	rw_exit(&iostatlist_lock);
    127   1.1     blymn 
    128   1.8      yamt 	return iostatp;
    129   1.1     blymn }
    130   1.1     blymn 
    131   1.1     blymn /*
    132   1.1     blymn  * Allocate and initialise memory for the i/o statistics.
    133   1.1     blymn  */
    134   1.3      yamt struct io_stats *
    135  1.11  christos iostat_alloc(int32_t type, void *parent, const char *name)
    136   1.1     blymn {
    137   1.1     blymn 	struct io_stats *stats;
    138   1.1     blymn 
    139  1.16      yamt 	stats = kmem_zalloc(sizeof(*stats), KM_SLEEP);
    140   1.1     blymn 	if (stats == NULL)
    141   1.4      yamt 		panic("iostat_alloc: cannot allocate memory for stats buffer");
    142   1.1     blymn 
    143   1.2     blymn 	stats->io_type = type;
    144  1.11  christos 	stats->io_parent = parent;
    145  1.11  christos 	(void)strlcpy(stats->io_name, name, sizeof(stats->io_name));
    146   1.1     blymn 
    147   1.1     blymn 	/*
    148   1.1     blymn 	 * Set the attached timestamp.
    149   1.1     blymn 	 */
    150  1.10    kardel 	getmicrouptime(&stats->io_attachtime);
    151   1.1     blymn 
    152   1.1     blymn 	/*
    153   1.1     blymn 	 * Link into the drivelist.
    154   1.1     blymn 	 */
    155  1.13        ad 	rw_enter(&iostatlist_lock, RW_WRITER);
    156   1.2     blymn 	TAILQ_INSERT_TAIL(&iostatlist, stats, io_link);
    157   1.1     blymn 	iostat_count++;
    158  1.13        ad 	rw_exit(&iostatlist_lock);
    159   1.1     blymn 
    160   1.1     blymn 	return stats;
    161   1.1     blymn }
    162   1.1     blymn 
    163   1.1     blymn /*
    164   1.1     blymn  * Remove i/o from stats collection.
    165   1.1     blymn  */
    166   1.1     blymn void
    167   1.1     blymn iostat_free(struct io_stats *stats)
    168   1.1     blymn {
    169   1.1     blymn 
    170   1.3      yamt 	/*
    171   1.3      yamt 	 * Remove from the iostat list.
    172   1.3      yamt 	 */
    173   1.1     blymn 	if (iostat_count == 0)
    174   1.1     blymn 		panic("iostat_free: iostat_count == 0");
    175  1.13        ad 	rw_enter(&iostatlist_lock, RW_WRITER);
    176   1.2     blymn 	TAILQ_REMOVE(&iostatlist, stats, io_link);
    177   1.1     blymn 	iostat_count--;
    178  1.13        ad 	rw_exit(&iostatlist_lock);
    179  1.16      yamt 	kmem_free(stats, sizeof(*stats));
    180   1.1     blymn }
    181   1.1     blymn 
    182   1.1     blymn /*
    183   1.1     blymn  * Increment a iostat busy counter.  If the counter is going from
    184   1.1     blymn  * 0 to 1, set the timestamp.
    185   1.1     blymn  */
    186   1.1     blymn void
    187   1.1     blymn iostat_busy(struct io_stats *stats)
    188   1.1     blymn {
    189   1.1     blymn 
    190  1.10    kardel 	if (stats->io_busy++ == 0)
    191  1.10    kardel 		getmicrouptime(&stats->io_timestamp);
    192   1.1     blymn }
    193   1.1     blymn 
    194   1.1     blymn /*
    195   1.1     blymn  * Decrement a iostat busy counter, increment the byte count, total busy
    196   1.1     blymn  * time, and reset the timestamp.
    197   1.1     blymn  */
    198   1.1     blymn void
    199   1.1     blymn iostat_unbusy(struct io_stats *stats, long bcount, int read)
    200   1.1     blymn {
    201   1.1     blymn 	struct timeval dv_time, diff_time;
    202   1.1     blymn 
    203   1.2     blymn 	if (stats->io_busy-- == 0) {
    204   1.2     blymn 		printf("%s: busy < 0\n", stats->io_name);
    205   1.1     blymn 		panic("iostat_unbusy");
    206   1.1     blymn 	}
    207   1.1     blymn 
    208  1.10    kardel 	getmicrouptime(&dv_time);
    209   1.1     blymn 
    210   1.2     blymn 	timersub(&dv_time, &stats->io_timestamp, &diff_time);
    211   1.2     blymn 	timeradd(&stats->io_time, &diff_time, &stats->io_time);
    212   1.1     blymn 
    213   1.2     blymn 	stats->io_timestamp = dv_time;
    214   1.1     blymn 	if (bcount > 0) {
    215   1.1     blymn 		if (read) {
    216   1.2     blymn 			stats->io_rbytes += bcount;
    217   1.2     blymn 			stats->io_rxfer++;
    218   1.1     blymn 		} else {
    219   1.2     blymn 			stats->io_wbytes += bcount;
    220   1.2     blymn 			stats->io_wxfer++;
    221   1.1     blymn 		}
    222   1.1     blymn 	}
    223   1.1     blymn }
    224   1.1     blymn 
    225   1.1     blymn /*
    226  1.17        ad  * Return non-zero if a device has an I/O request in flight.
    227  1.17        ad  */
    228  1.17        ad bool
    229  1.17        ad iostat_isbusy(struct io_stats *stats)
    230  1.17        ad {
    231  1.17        ad 
    232  1.17        ad 	return stats->io_busy != 0;
    233  1.17        ad }
    234  1.17        ad 
    235  1.17        ad /*
    236   1.1     blymn  * Increment the seek counter.  This does look almost redundant but it
    237   1.1     blymn  * abstracts the stats gathering.
    238   1.1     blymn  */
    239   1.1     blymn void
    240   1.1     blymn iostat_seek(struct io_stats *stats)
    241   1.1     blymn {
    242   1.3      yamt 
    243   1.2     blymn 	stats->io_seek++;
    244   1.1     blymn }
    245   1.1     blymn 
    246   1.1     blymn static int
    247   1.1     blymn sysctl_hw_disknames(SYSCTLFN_ARGS)
    248   1.1     blymn {
    249   1.3      yamt 
    250   1.1     blymn 	return iostati_getnames(1, oldp, oldlenp, newp, namelen);
    251   1.1     blymn }
    252   1.1     blymn 
    253   1.1     blymn static int
    254   1.1     blymn sysctl_hw_iostatnames(SYSCTLFN_ARGS)
    255   1.1     blymn {
    256   1.3      yamt 
    257   1.1     blymn 	return iostati_getnames(0, oldp, oldlenp, newp, namelen);
    258   1.1     blymn }
    259   1.1     blymn 
    260   1.1     blymn static int
    261   1.1     blymn iostati_getnames(int disk_only, char *oldp, size_t *oldlenp, const void *newp,
    262   1.1     blymn 		 u_int namelen)
    263   1.1     blymn {
    264   1.1     blymn 	char bf[IOSTATNAMELEN + 1];
    265   1.1     blymn 	char *where = oldp;
    266   1.1     blymn 	struct io_stats *stats;
    267   1.1     blymn 	size_t needed, left, slen;
    268   1.1     blymn 	int error, first;
    269   1.1     blymn 
    270   1.1     blymn 	if (newp != NULL)
    271   1.1     blymn 		return (EPERM);
    272   1.1     blymn 	if (namelen != 0)
    273   1.1     blymn 		return (EINVAL);
    274   1.1     blymn 
    275   1.1     blymn 	first = 1;
    276   1.1     blymn 	error = 0;
    277   1.1     blymn 	needed = 0;
    278   1.1     blymn 	left = *oldlenp;
    279   1.1     blymn 
    280  1.13        ad 	rw_enter(&iostatlist_lock, RW_READER);
    281   1.1     blymn 	for (stats = TAILQ_FIRST(&iostatlist); stats != NULL;
    282   1.2     blymn 	    stats = TAILQ_NEXT(stats, io_link)) {
    283   1.2     blymn 		if ((disk_only == 1) && (stats->io_type != IOSTAT_DISK))
    284   1.1     blymn 			continue;
    285   1.1     blymn 
    286   1.1     blymn 		if (where == NULL)
    287   1.2     blymn 			needed += strlen(stats->io_name) + 1;
    288   1.1     blymn 		else {
    289   1.1     blymn 			memset(bf, 0, sizeof(bf));
    290   1.1     blymn 			if (first) {
    291   1.2     blymn 				strncpy(bf, stats->io_name, sizeof(bf));
    292   1.1     blymn 				first = 0;
    293   1.1     blymn 			} else {
    294   1.1     blymn 				bf[0] = ' ';
    295   1.2     blymn 				strncpy(bf + 1, stats->io_name,
    296   1.1     blymn 				    sizeof(bf) - 1);
    297   1.1     blymn 			}
    298   1.1     blymn 			bf[IOSTATNAMELEN] = '\0';
    299   1.1     blymn 			slen = strlen(bf);
    300   1.1     blymn 			if (left < slen + 1)
    301   1.1     blymn 				break;
    302   1.1     blymn 			/* +1 to copy out the trailing NUL byte */
    303   1.1     blymn 			error = copyout(bf, where, slen + 1);
    304   1.1     blymn 			if (error)
    305   1.1     blymn 				break;
    306   1.1     blymn 			where += slen;
    307   1.1     blymn 			needed += slen;
    308   1.1     blymn 			left -= slen;
    309   1.1     blymn 		}
    310   1.1     blymn 	}
    311  1.13        ad 	rw_exit(&iostatlist_lock);
    312   1.1     blymn 	*oldlenp = needed;
    313   1.1     blymn 	return (error);
    314   1.1     blymn }
    315   1.1     blymn 
    316   1.1     blymn static int
    317   1.1     blymn sysctl_hw_iostats(SYSCTLFN_ARGS)
    318   1.1     blymn {
    319   1.1     blymn 	struct io_sysctl sdrive;
    320   1.1     blymn 	struct io_stats *stats;
    321   1.1     blymn 	char *where = oldp;
    322   1.1     blymn 	size_t tocopy, left;
    323   1.1     blymn 	int error;
    324   1.1     blymn 
    325   1.1     blymn 	if (newp != NULL)
    326   1.1     blymn 		return (EPERM);
    327   1.1     blymn 
    328   1.1     blymn 	/*
    329   1.1     blymn 	 * The original hw.diskstats call was broken and did not require
    330   1.1     blymn 	 * the userland to pass in it's size of struct disk_sysctl.  This
    331  1.15        ad 	 * was fixed after NetBSD 1.6 was released.
    332   1.1     blymn 	 */
    333   1.1     blymn 	if (namelen == 0)
    334   1.1     blymn 		tocopy = offsetof(struct io_sysctl, busy);
    335   1.1     blymn 	else
    336   1.1     blymn 		tocopy = name[0];
    337   1.1     blymn 
    338   1.1     blymn 	if (where == NULL) {
    339   1.1     blymn 		*oldlenp = iostat_count * tocopy;
    340   1.1     blymn 		return (0);
    341   1.1     blymn 	}
    342   1.1     blymn 
    343   1.1     blymn 	error = 0;
    344   1.1     blymn 	left = *oldlenp;
    345   1.1     blymn 	memset(&sdrive, 0, sizeof(sdrive));
    346   1.1     blymn 	*oldlenp = 0;
    347   1.1     blymn 
    348  1.13        ad 	rw_enter(&iostatlist_lock, RW_READER);
    349   1.2     blymn 	TAILQ_FOREACH(stats, &iostatlist, io_link) {
    350   1.1     blymn 		if (left < tocopy)
    351   1.1     blymn 			break;
    352   1.2     blymn 		strncpy(sdrive.name, stats->io_name, sizeof(sdrive.name));
    353   1.2     blymn 		sdrive.xfer = stats->io_rxfer + stats->io_wxfer;
    354   1.2     blymn 		sdrive.rxfer = stats->io_rxfer;
    355   1.2     blymn 		sdrive.wxfer = stats->io_wxfer;
    356   1.2     blymn 		sdrive.seek = stats->io_seek;
    357   1.2     blymn 		sdrive.bytes = stats->io_rbytes + stats->io_wbytes;
    358   1.2     blymn 		sdrive.rbytes = stats->io_rbytes;
    359   1.2     blymn 		sdrive.wbytes = stats->io_wbytes;
    360   1.2     blymn 		sdrive.attachtime_sec = stats->io_attachtime.tv_sec;
    361   1.2     blymn 		sdrive.attachtime_usec = stats->io_attachtime.tv_usec;
    362   1.2     blymn 		sdrive.timestamp_sec = stats->io_timestamp.tv_sec;
    363   1.2     blymn 		sdrive.timestamp_usec = stats->io_timestamp.tv_usec;
    364   1.2     blymn 		sdrive.time_sec = stats->io_time.tv_sec;
    365   1.2     blymn 		sdrive.time_usec = stats->io_time.tv_usec;
    366   1.2     blymn 		sdrive.busy = stats->io_busy;
    367   1.1     blymn 
    368   1.1     blymn 		error = copyout(&sdrive, where, min(tocopy, sizeof(sdrive)));
    369   1.1     blymn 		if (error)
    370   1.1     blymn 			break;
    371   1.1     blymn 		where += tocopy;
    372   1.1     blymn 		*oldlenp += tocopy;
    373   1.1     blymn 		left -= tocopy;
    374   1.1     blymn 	}
    375  1.13        ad 	rw_exit(&iostatlist_lock);
    376   1.1     blymn 	return (error);
    377   1.1     blymn }
    378   1.1     blymn 
    379   1.1     blymn SYSCTL_SETUP(sysctl_io_stats_setup, "sysctl i/o stats setup")
    380   1.1     blymn {
    381   1.3      yamt 
    382   1.1     blymn 	sysctl_createv(clog, 0, NULL, NULL,
    383   1.1     blymn 		       CTLFLAG_PERMANENT,
    384   1.1     blymn 		       CTLTYPE_STRING, "disknames",
    385   1.1     blymn 		       SYSCTL_DESCR("List of disk drives present"),
    386   1.1     blymn 		       sysctl_hw_disknames, 0, NULL, 0,
    387   1.1     blymn 		       CTL_HW, HW_DISKNAMES, CTL_EOL);
    388   1.1     blymn 	sysctl_createv(clog, 0, NULL, NULL,
    389   1.1     blymn 		       CTLFLAG_PERMANENT,
    390   1.1     blymn 		       CTLTYPE_STRING, "iostatnames",
    391   1.1     blymn 		       SYSCTL_DESCR("I/O stats are being collected for these"
    392   1.1     blymn 				    " devices"),
    393   1.1     blymn 		       sysctl_hw_iostatnames, 0, NULL, 0,
    394   1.1     blymn 		       CTL_HW, HW_IOSTATNAMES, CTL_EOL);
    395   1.1     blymn 	sysctl_createv(clog, 0, NULL, NULL,
    396   1.1     blymn 		       CTLFLAG_PERMANENT,
    397   1.7      yamt 		       CTLTYPE_STRUCT, "iostats",
    398   1.1     blymn 		       SYSCTL_DESCR("Statistics on device I/O operations"),
    399   1.1     blymn 		       sysctl_hw_iostats, 0, NULL, 0,
    400   1.1     blymn 		       CTL_HW, HW_IOSTATS, CTL_EOL);
    401   1.1     blymn }
    402