Home | History | Annotate | Line # | Download | only in tprof
tprof.c revision 1.18
      1  1.18       ryo /*	$NetBSD: tprof.c,v 1.18 2022/12/01 00:27:59 ryo Exp $	*/
      2   1.1      yamt 
      3   1.1      yamt /*-
      4   1.8      yamt  * Copyright (c)2008,2009,2010 YAMAMOTO Takashi,
      5   1.1      yamt  * All rights reserved.
      6   1.1      yamt  *
      7   1.1      yamt  * Redistribution and use in source and binary forms, with or without
      8   1.1      yamt  * modification, are permitted provided that the following conditions
      9   1.1      yamt  * are met:
     10   1.1      yamt  * 1. Redistributions of source code must retain the above copyright
     11   1.1      yamt  *    notice, this list of conditions and the following disclaimer.
     12   1.1      yamt  * 2. Redistributions in binary form must reproduce the above copyright
     13   1.1      yamt  *    notice, this list of conditions and the following disclaimer in the
     14   1.1      yamt  *    documentation and/or other materials provided with the distribution.
     15   1.1      yamt  *
     16   1.1      yamt  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
     17   1.1      yamt  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     18   1.1      yamt  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     19   1.1      yamt  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
     20   1.1      yamt  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     21   1.1      yamt  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     22   1.1      yamt  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     23   1.1      yamt  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     24   1.1      yamt  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     25   1.1      yamt  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     26   1.1      yamt  * SUCH DAMAGE.
     27   1.1      yamt  */
     28   1.1      yamt 
     29   1.1      yamt #include <sys/cdefs.h>
     30  1.18       ryo __KERNEL_RCSID(0, "$NetBSD: tprof.c,v 1.18 2022/12/01 00:27:59 ryo Exp $");
     31   1.1      yamt 
     32   1.1      yamt #include <sys/param.h>
     33   1.1      yamt #include <sys/systm.h>
     34   1.1      yamt #include <sys/kernel.h>
     35   1.1      yamt 
     36  1.15  riastrad #include <sys/callout.h>
     37  1.15  riastrad #include <sys/conf.h>
     38   1.1      yamt #include <sys/cpu.h>
     39   1.1      yamt #include <sys/kmem.h>
     40   1.4      yamt #include <sys/module.h>
     41  1.15  riastrad #include <sys/percpu.h>
     42   1.8      yamt #include <sys/proc.h>
     43  1.15  riastrad #include <sys/queue.h>
     44   1.1      yamt #include <sys/workqueue.h>
     45   1.1      yamt 
     46   1.1      yamt #include <dev/tprof/tprof.h>
     47   1.1      yamt #include <dev/tprof/tprof_ioctl.h>
     48   1.1      yamt 
     49  1.13  christos #include "ioconf.h"
     50  1.13  christos 
     51   1.4      yamt /*
     52   1.4      yamt  * locking order:
     53   1.4      yamt  *	tprof_reader_lock -> tprof_lock
     54   1.4      yamt  *	tprof_startstop_lock -> tprof_lock
     55   1.4      yamt  */
     56   1.4      yamt 
     57   1.4      yamt /*
     58   1.4      yamt  * protected by:
     59   1.4      yamt  *	L: tprof_lock
     60   1.4      yamt  *	R: tprof_reader_lock
     61   1.4      yamt  *	S: tprof_startstop_lock
     62   1.8      yamt  *	s: writer should hold tprof_startstop_lock and tprof_lock
     63   1.8      yamt  *	   reader should hold tprof_startstop_lock or tprof_lock
     64   1.4      yamt  */
     65   1.4      yamt 
     66   1.1      yamt typedef struct tprof_buf {
     67   1.1      yamt 	u_int b_used;
     68   1.1      yamt 	u_int b_size;
     69   1.1      yamt 	u_int b_overflow;
     70   1.1      yamt 	u_int b_unused;
     71   1.1      yamt 	STAILQ_ENTRY(tprof_buf) b_list;
     72   1.1      yamt 	tprof_sample_t b_data[];
     73   1.1      yamt } tprof_buf_t;
     74   1.1      yamt #define	TPROF_BUF_BYTESIZE(sz) \
     75   1.1      yamt 	(sizeof(tprof_buf_t) + (sz) * sizeof(tprof_sample_t))
     76   1.1      yamt #define	TPROF_MAX_SAMPLES_PER_BUF	10000
     77   1.1      yamt 
     78   1.1      yamt #define	TPROF_MAX_BUF			100
     79   1.1      yamt 
     80   1.1      yamt typedef struct {
     81   1.1      yamt 	tprof_buf_t *c_buf;
     82  1.10      yamt 	uint32_t c_cpuid;
     83   1.1      yamt 	struct work c_work;
     84   1.1      yamt 	callout_t c_callout;
     85   1.1      yamt } __aligned(CACHE_LINE_SIZE) tprof_cpu_t;
     86   1.1      yamt 
     87   1.4      yamt typedef struct tprof_backend {
     88   1.4      yamt 	const char *tb_name;
     89   1.4      yamt 	const tprof_backend_ops_t *tb_ops;
     90   1.4      yamt 	LIST_ENTRY(tprof_backend) tb_list;
     91   1.4      yamt 	int tb_usecount;	/* S: */
     92   1.4      yamt } tprof_backend_t;
     93   1.3      yamt 
     94   1.1      yamt static kmutex_t tprof_lock;
     95   1.8      yamt static bool tprof_running;		/* s: */
     96   1.4      yamt static u_int tprof_nworker;		/* L: # of running worker LWPs */
     97   1.1      yamt static lwp_t *tprof_owner;
     98   1.4      yamt static STAILQ_HEAD(, tprof_buf) tprof_list; /* L: global buffer list */
     99   1.4      yamt static u_int tprof_nbuf_on_list;	/* L: # of buffers on tprof_list */
    100   1.1      yamt static struct workqueue *tprof_wq;
    101  1.15  riastrad static struct percpu *tprof_cpus __read_mostly;	/* tprof_cpu_t * */
    102   1.1      yamt static u_int tprof_samples_per_buf;
    103   1.1      yamt 
    104   1.4      yamt static tprof_backend_t *tprof_backend;	/* S: */
    105   1.4      yamt static LIST_HEAD(, tprof_backend) tprof_backends =
    106   1.4      yamt     LIST_HEAD_INITIALIZER(tprof_backend); /* S: */
    107   1.4      yamt 
    108   1.1      yamt static kmutex_t tprof_reader_lock;
    109   1.4      yamt static kcondvar_t tprof_reader_cv;	/* L: */
    110   1.4      yamt static off_t tprof_reader_offset;	/* R: */
    111   1.1      yamt 
    112   1.1      yamt static kmutex_t tprof_startstop_lock;
    113   1.4      yamt static kcondvar_t tprof_cv;		/* L: */
    114   1.1      yamt 
    115   1.4      yamt static struct tprof_stat tprof_stat;	/* L: */
    116   1.1      yamt 
    117   1.1      yamt static tprof_cpu_t *
    118  1.18       ryo tprof_cpu_direct(struct cpu_info *ci)
    119  1.18       ryo {
    120  1.18       ryo 	tprof_cpu_t **cp;
    121  1.18       ryo 
    122  1.18       ryo 	cp = percpu_getptr_remote(tprof_cpus, ci);
    123  1.18       ryo 	return *cp;
    124  1.18       ryo }
    125  1.18       ryo 
    126  1.18       ryo static tprof_cpu_t *
    127   1.1      yamt tprof_cpu(struct cpu_info *ci)
    128   1.1      yamt {
    129  1.18       ryo 	tprof_cpu_t *c;
    130   1.1      yamt 
    131  1.15  riastrad 	/*
    132  1.15  riastrad 	 * As long as xcalls are blocked -- e.g., by kpreempt_disable
    133  1.15  riastrad 	 * -- the percpu object will not be swapped and destroyed.  We
    134  1.15  riastrad 	 * can't write to it, because the data may have already been
    135  1.15  riastrad 	 * moved to a new buffer, but we can safely read from it.
    136  1.15  riastrad 	 */
    137  1.15  riastrad 	kpreempt_disable();
    138  1.18       ryo 	c = tprof_cpu_direct(ci);
    139  1.15  riastrad 	kpreempt_enable();
    140  1.15  riastrad 
    141  1.15  riastrad 	return c;
    142   1.1      yamt }
    143   1.1      yamt 
    144   1.1      yamt static tprof_cpu_t *
    145   1.1      yamt tprof_curcpu(void)
    146   1.1      yamt {
    147   1.1      yamt 
    148   1.1      yamt 	return tprof_cpu(curcpu());
    149   1.1      yamt }
    150   1.1      yamt 
    151   1.1      yamt static tprof_buf_t *
    152   1.1      yamt tprof_buf_alloc(void)
    153   1.1      yamt {
    154   1.1      yamt 	tprof_buf_t *new;
    155   1.1      yamt 	u_int size = tprof_samples_per_buf;
    156  1.15  riastrad 
    157   1.1      yamt 	new = kmem_alloc(TPROF_BUF_BYTESIZE(size), KM_SLEEP);
    158   1.1      yamt 	new->b_used = 0;
    159   1.1      yamt 	new->b_size = size;
    160   1.1      yamt 	new->b_overflow = 0;
    161   1.1      yamt 	return new;
    162   1.1      yamt }
    163   1.1      yamt 
    164   1.1      yamt static void
    165   1.1      yamt tprof_buf_free(tprof_buf_t *buf)
    166   1.1      yamt {
    167   1.1      yamt 
    168   1.1      yamt 	kmem_free(buf, TPROF_BUF_BYTESIZE(buf->b_size));
    169   1.1      yamt }
    170   1.1      yamt 
    171   1.1      yamt static tprof_buf_t *
    172   1.1      yamt tprof_buf_switch(tprof_cpu_t *c, tprof_buf_t *new)
    173   1.1      yamt {
    174   1.1      yamt 	tprof_buf_t *old;
    175   1.1      yamt 
    176   1.1      yamt 	old = c->c_buf;
    177   1.1      yamt 	c->c_buf = new;
    178   1.1      yamt 	return old;
    179   1.1      yamt }
    180   1.1      yamt 
    181   1.1      yamt static tprof_buf_t *
    182   1.1      yamt tprof_buf_refresh(void)
    183   1.1      yamt {
    184   1.1      yamt 	tprof_cpu_t * const c = tprof_curcpu();
    185   1.1      yamt 	tprof_buf_t *new;
    186   1.1      yamt 
    187   1.1      yamt 	new = tprof_buf_alloc();
    188   1.1      yamt 	return tprof_buf_switch(c, new);
    189   1.1      yamt }
    190   1.1      yamt 
    191   1.1      yamt static void
    192   1.1      yamt tprof_worker(struct work *wk, void *dummy)
    193   1.1      yamt {
    194   1.1      yamt 	tprof_cpu_t * const c = tprof_curcpu();
    195   1.1      yamt 	tprof_buf_t *buf;
    196   1.1      yamt 	bool shouldstop;
    197   1.1      yamt 
    198   1.1      yamt 	KASSERT(wk == &c->c_work);
    199   1.1      yamt 	KASSERT(dummy == NULL);
    200   1.1      yamt 
    201   1.1      yamt 	/*
    202   1.1      yamt 	 * get a per cpu buffer.
    203   1.1      yamt 	 */
    204   1.1      yamt 	buf = tprof_buf_refresh();
    205   1.1      yamt 
    206   1.1      yamt 	/*
    207   1.1      yamt 	 * and put it on the global list for read(2).
    208   1.1      yamt 	 */
    209   1.1      yamt 	mutex_enter(&tprof_lock);
    210   1.1      yamt 	shouldstop = !tprof_running;
    211   1.1      yamt 	if (shouldstop) {
    212   1.1      yamt 		KASSERT(tprof_nworker > 0);
    213   1.1      yamt 		tprof_nworker--;
    214   1.1      yamt 		cv_broadcast(&tprof_cv);
    215   1.1      yamt 		cv_broadcast(&tprof_reader_cv);
    216   1.1      yamt 	}
    217   1.1      yamt 	if (buf->b_used == 0) {
    218   1.1      yamt 		tprof_stat.ts_emptybuf++;
    219   1.1      yamt 	} else if (tprof_nbuf_on_list < TPROF_MAX_BUF) {
    220   1.1      yamt 		tprof_stat.ts_sample += buf->b_used;
    221   1.1      yamt 		tprof_stat.ts_overflow += buf->b_overflow;
    222   1.1      yamt 		tprof_stat.ts_buf++;
    223   1.1      yamt 		STAILQ_INSERT_TAIL(&tprof_list, buf, b_list);
    224   1.1      yamt 		tprof_nbuf_on_list++;
    225   1.1      yamt 		buf = NULL;
    226   1.1      yamt 		cv_broadcast(&tprof_reader_cv);
    227   1.1      yamt 	} else {
    228   1.1      yamt 		tprof_stat.ts_dropbuf_sample += buf->b_used;
    229   1.1      yamt 		tprof_stat.ts_dropbuf++;
    230   1.1      yamt 	}
    231   1.1      yamt 	mutex_exit(&tprof_lock);
    232   1.1      yamt 	if (buf) {
    233   1.1      yamt 		tprof_buf_free(buf);
    234   1.1      yamt 	}
    235   1.1      yamt 	if (!shouldstop) {
    236   1.1      yamt 		callout_schedule(&c->c_callout, hz);
    237   1.1      yamt 	}
    238   1.1      yamt }
    239   1.1      yamt 
    240   1.1      yamt static void
    241   1.1      yamt tprof_kick(void *vp)
    242   1.1      yamt {
    243   1.1      yamt 	struct cpu_info * const ci = vp;
    244   1.1      yamt 	tprof_cpu_t * const c = tprof_cpu(ci);
    245   1.1      yamt 
    246   1.1      yamt 	workqueue_enqueue(tprof_wq, &c->c_work, ci);
    247   1.1      yamt }
    248   1.1      yamt 
    249   1.1      yamt static void
    250   1.1      yamt tprof_stop1(void)
    251   1.1      yamt {
    252   1.1      yamt 	CPU_INFO_ITERATOR cii;
    253   1.1      yamt 	struct cpu_info *ci;
    254   1.1      yamt 
    255   1.1      yamt 	KASSERT(mutex_owned(&tprof_startstop_lock));
    256   1.6      yamt 	KASSERT(tprof_nworker == 0);
    257   1.1      yamt 
    258   1.1      yamt 	for (CPU_INFO_FOREACH(cii, ci)) {
    259   1.1      yamt 		tprof_cpu_t * const c = tprof_cpu(ci);
    260   1.1      yamt 		tprof_buf_t *old;
    261   1.1      yamt 
    262   1.1      yamt 		old = tprof_buf_switch(c, NULL);
    263   1.1      yamt 		if (old != NULL) {
    264   1.1      yamt 			tprof_buf_free(old);
    265   1.1      yamt 		}
    266   1.1      yamt 		callout_destroy(&c->c_callout);
    267   1.1      yamt 	}
    268   1.1      yamt 	workqueue_destroy(tprof_wq);
    269   1.1      yamt }
    270   1.1      yamt 
    271  1.14      maxv static void
    272  1.14      maxv tprof_getinfo(struct tprof_info *info)
    273  1.14      maxv {
    274  1.14      maxv 	tprof_backend_t *tb;
    275  1.14      maxv 
    276  1.14      maxv 	KASSERT(mutex_owned(&tprof_startstop_lock));
    277  1.14      maxv 
    278  1.14      maxv 	memset(info, 0, sizeof(*info));
    279  1.14      maxv 	info->ti_version = TPROF_VERSION;
    280  1.14      maxv 	if ((tb = tprof_backend) != NULL) {
    281  1.14      maxv 		info->ti_ident = tb->tb_ops->tbo_ident();
    282  1.14      maxv 	}
    283  1.14      maxv }
    284  1.14      maxv 
    285   1.1      yamt static int
    286  1.14      maxv tprof_start(const tprof_param_t *param)
    287   1.1      yamt {
    288   1.1      yamt 	CPU_INFO_ITERATOR cii;
    289   1.1      yamt 	struct cpu_info *ci;
    290   1.1      yamt 	int error;
    291   1.1      yamt 	uint64_t freq;
    292   1.4      yamt 	tprof_backend_t *tb;
    293   1.1      yamt 
    294   1.1      yamt 	KASSERT(mutex_owned(&tprof_startstop_lock));
    295   1.1      yamt 	if (tprof_running) {
    296   1.1      yamt 		error = EBUSY;
    297   1.1      yamt 		goto done;
    298   1.1      yamt 	}
    299   1.1      yamt 
    300   1.4      yamt 	tb = tprof_backend;
    301   1.4      yamt 	if (tb == NULL) {
    302   1.4      yamt 		error = ENOENT;
    303   1.4      yamt 		goto done;
    304   1.4      yamt 	}
    305   1.4      yamt 	if (tb->tb_usecount > 0) {
    306   1.4      yamt 		error = EBUSY;
    307   1.4      yamt 		goto done;
    308   1.4      yamt 	}
    309   1.4      yamt 
    310   1.4      yamt 	tb->tb_usecount++;
    311   1.4      yamt 	freq = tb->tb_ops->tbo_estimate_freq();
    312   1.1      yamt 	tprof_samples_per_buf = MIN(freq * 2, TPROF_MAX_SAMPLES_PER_BUF);
    313   1.1      yamt 
    314   1.1      yamt 	error = workqueue_create(&tprof_wq, "tprofmv", tprof_worker, NULL,
    315   1.2      yamt 	    PRI_NONE, IPL_SOFTCLOCK, WQ_MPSAFE | WQ_PERCPU);
    316   1.1      yamt 	if (error != 0) {
    317   1.1      yamt 		goto done;
    318   1.1      yamt 	}
    319   1.1      yamt 
    320   1.1      yamt 	for (CPU_INFO_FOREACH(cii, ci)) {
    321   1.1      yamt 		tprof_cpu_t * const c = tprof_cpu(ci);
    322   1.1      yamt 		tprof_buf_t *new;
    323   1.1      yamt 		tprof_buf_t *old;
    324   1.1      yamt 
    325   1.1      yamt 		new = tprof_buf_alloc();
    326   1.1      yamt 		old = tprof_buf_switch(c, new);
    327   1.1      yamt 		if (old != NULL) {
    328   1.1      yamt 			tprof_buf_free(old);
    329   1.1      yamt 		}
    330   1.1      yamt 		callout_init(&c->c_callout, CALLOUT_MPSAFE);
    331   1.1      yamt 		callout_setfunc(&c->c_callout, tprof_kick, ci);
    332   1.1      yamt 	}
    333   1.1      yamt 
    334  1.14      maxv 	error = tb->tb_ops->tbo_start(param);
    335   1.1      yamt 	if (error != 0) {
    336   1.9      yamt 		KASSERT(tb->tb_usecount > 0);
    337   1.9      yamt 		tb->tb_usecount--;
    338   1.1      yamt 		tprof_stop1();
    339   1.1      yamt 		goto done;
    340   1.1      yamt 	}
    341   1.1      yamt 
    342   1.1      yamt 	mutex_enter(&tprof_lock);
    343   1.1      yamt 	tprof_running = true;
    344   1.1      yamt 	mutex_exit(&tprof_lock);
    345   1.1      yamt 	for (CPU_INFO_FOREACH(cii, ci)) {
    346   1.1      yamt 		tprof_cpu_t * const c = tprof_cpu(ci);
    347   1.1      yamt 
    348   1.1      yamt 		mutex_enter(&tprof_lock);
    349   1.1      yamt 		tprof_nworker++;
    350   1.1      yamt 		mutex_exit(&tprof_lock);
    351   1.1      yamt 		workqueue_enqueue(tprof_wq, &c->c_work, ci);
    352   1.1      yamt 	}
    353   1.1      yamt done:
    354   1.1      yamt 	return error;
    355   1.1      yamt }
    356   1.1      yamt 
    357   1.1      yamt static void
    358   1.1      yamt tprof_stop(void)
    359   1.1      yamt {
    360   1.4      yamt 	tprof_backend_t *tb;
    361   1.1      yamt 
    362   1.1      yamt 	KASSERT(mutex_owned(&tprof_startstop_lock));
    363   1.1      yamt 	if (!tprof_running) {
    364   1.1      yamt 		goto done;
    365   1.1      yamt 	}
    366   1.1      yamt 
    367   1.4      yamt 	tb = tprof_backend;
    368   1.4      yamt 	KASSERT(tb->tb_usecount > 0);
    369   1.4      yamt 	tb->tb_ops->tbo_stop(NULL);
    370   1.4      yamt 	tb->tb_usecount--;
    371   1.1      yamt 
    372   1.1      yamt 	mutex_enter(&tprof_lock);
    373   1.1      yamt 	tprof_running = false;
    374   1.1      yamt 	cv_broadcast(&tprof_reader_cv);
    375   1.8      yamt 	while (tprof_nworker > 0) {
    376   1.8      yamt 		cv_wait(&tprof_cv, &tprof_lock);
    377   1.8      yamt 	}
    378   1.1      yamt 	mutex_exit(&tprof_lock);
    379   1.1      yamt 
    380   1.1      yamt 	tprof_stop1();
    381   1.1      yamt done:
    382   1.1      yamt 	;
    383   1.1      yamt }
    384   1.1      yamt 
    385   1.4      yamt /*
    386   1.4      yamt  * tprof_clear: drain unread samples.
    387   1.4      yamt  */
    388   1.4      yamt 
    389   1.1      yamt static void
    390   1.1      yamt tprof_clear(void)
    391   1.1      yamt {
    392   1.1      yamt 	tprof_buf_t *buf;
    393   1.1      yamt 
    394   1.1      yamt 	mutex_enter(&tprof_reader_lock);
    395   1.1      yamt 	mutex_enter(&tprof_lock);
    396   1.1      yamt 	while ((buf = STAILQ_FIRST(&tprof_list)) != NULL) {
    397   1.1      yamt 		if (buf != NULL) {
    398   1.1      yamt 			STAILQ_REMOVE_HEAD(&tprof_list, b_list);
    399   1.1      yamt 			KASSERT(tprof_nbuf_on_list > 0);
    400   1.1      yamt 			tprof_nbuf_on_list--;
    401   1.1      yamt 			mutex_exit(&tprof_lock);
    402   1.1      yamt 			tprof_buf_free(buf);
    403   1.1      yamt 			mutex_enter(&tprof_lock);
    404   1.1      yamt 		}
    405   1.1      yamt 	}
    406   1.1      yamt 	KASSERT(tprof_nbuf_on_list == 0);
    407   1.1      yamt 	mutex_exit(&tprof_lock);
    408   1.1      yamt 	tprof_reader_offset = 0;
    409   1.1      yamt 	mutex_exit(&tprof_reader_lock);
    410   1.1      yamt 
    411   1.1      yamt 	memset(&tprof_stat, 0, sizeof(tprof_stat));
    412   1.1      yamt }
    413   1.1      yamt 
    414   1.4      yamt static tprof_backend_t *
    415   1.4      yamt tprof_backend_lookup(const char *name)
    416   1.4      yamt {
    417   1.4      yamt 	tprof_backend_t *tb;
    418   1.4      yamt 
    419   1.4      yamt 	KASSERT(mutex_owned(&tprof_startstop_lock));
    420   1.4      yamt 
    421   1.4      yamt 	LIST_FOREACH(tb, &tprof_backends, tb_list) {
    422   1.4      yamt 		if (!strcmp(tb->tb_name, name)) {
    423   1.4      yamt 			return tb;
    424   1.4      yamt 		}
    425   1.4      yamt 	}
    426   1.4      yamt 	return NULL;
    427   1.4      yamt }
    428   1.4      yamt 
    429   1.1      yamt /* -------------------- backend interfaces */
    430   1.1      yamt 
    431   1.1      yamt /*
    432   1.1      yamt  * tprof_sample: record a sample on the per-cpu buffer.
    433   1.1      yamt  *
    434   1.1      yamt  * be careful; can be called in NMI context.
    435  1.10      yamt  * we are bluntly assuming the followings are safe.
    436  1.10      yamt  *	curcpu()
    437  1.10      yamt  *	curlwp->l_lid
    438  1.10      yamt  *	curlwp->l_proc->p_pid
    439   1.1      yamt  */
    440   1.1      yamt 
    441   1.1      yamt void
    442  1.14      maxv tprof_sample(void *unused, const tprof_frame_info_t *tfi)
    443   1.1      yamt {
    444  1.18       ryo 	tprof_cpu_t * const c = tprof_cpu_direct(curcpu());
    445   1.1      yamt 	tprof_buf_t * const buf = c->c_buf;
    446   1.8      yamt 	tprof_sample_t *sp;
    447   1.5      yamt 	const uintptr_t pc = tfi->tfi_pc;
    448  1.10      yamt 	const lwp_t * const l = curlwp;
    449   1.1      yamt 	u_int idx;
    450   1.1      yamt 
    451   1.1      yamt 	idx = buf->b_used;
    452   1.1      yamt 	if (__predict_false(idx >= buf->b_size)) {
    453   1.1      yamt 		buf->b_overflow++;
    454   1.1      yamt 		return;
    455   1.1      yamt 	}
    456   1.8      yamt 	sp = &buf->b_data[idx];
    457  1.10      yamt 	sp->s_pid = l->l_proc->p_pid;
    458  1.10      yamt 	sp->s_lwpid = l->l_lid;
    459  1.10      yamt 	sp->s_cpuid = c->c_cpuid;
    460   1.8      yamt 	sp->s_flags = (tfi->tfi_inkernel) ? TPROF_SAMPLE_INKERNEL : 0;
    461   1.8      yamt 	sp->s_pc = pc;
    462   1.1      yamt 	buf->b_used = idx + 1;
    463   1.1      yamt }
    464   1.1      yamt 
    465   1.4      yamt /*
    466  1.16     skrll  * tprof_backend_register:
    467   1.4      yamt  */
    468   1.4      yamt 
    469   1.4      yamt int
    470   1.4      yamt tprof_backend_register(const char *name, const tprof_backend_ops_t *ops,
    471   1.4      yamt     int vers)
    472   1.4      yamt {
    473   1.4      yamt 	tprof_backend_t *tb;
    474   1.4      yamt 
    475   1.4      yamt 	if (vers != TPROF_BACKEND_VERSION) {
    476   1.4      yamt 		return EINVAL;
    477   1.4      yamt 	}
    478   1.4      yamt 
    479   1.4      yamt 	mutex_enter(&tprof_startstop_lock);
    480   1.4      yamt 	tb = tprof_backend_lookup(name);
    481   1.4      yamt 	if (tb != NULL) {
    482   1.4      yamt 		mutex_exit(&tprof_startstop_lock);
    483   1.4      yamt 		return EEXIST;
    484   1.4      yamt 	}
    485   1.4      yamt #if 1 /* XXX for now */
    486   1.4      yamt 	if (!LIST_EMPTY(&tprof_backends)) {
    487   1.4      yamt 		mutex_exit(&tprof_startstop_lock);
    488   1.4      yamt 		return ENOTSUP;
    489   1.4      yamt 	}
    490   1.4      yamt #endif
    491   1.4      yamt 	tb = kmem_alloc(sizeof(*tb), KM_SLEEP);
    492   1.4      yamt 	tb->tb_name = name;
    493   1.4      yamt 	tb->tb_ops = ops;
    494   1.4      yamt 	tb->tb_usecount = 0;
    495   1.4      yamt 	LIST_INSERT_HEAD(&tprof_backends, tb, tb_list);
    496   1.4      yamt #if 1 /* XXX for now */
    497   1.4      yamt 	if (tprof_backend == NULL) {
    498   1.4      yamt 		tprof_backend = tb;
    499   1.4      yamt 	}
    500   1.4      yamt #endif
    501   1.4      yamt 	mutex_exit(&tprof_startstop_lock);
    502   1.4      yamt 
    503   1.4      yamt 	return 0;
    504   1.4      yamt }
    505   1.4      yamt 
    506   1.4      yamt /*
    507  1.16     skrll  * tprof_backend_unregister:
    508   1.4      yamt  */
    509   1.4      yamt 
    510   1.4      yamt int
    511   1.4      yamt tprof_backend_unregister(const char *name)
    512   1.4      yamt {
    513   1.4      yamt 	tprof_backend_t *tb;
    514   1.4      yamt 
    515   1.4      yamt 	mutex_enter(&tprof_startstop_lock);
    516   1.4      yamt 	tb = tprof_backend_lookup(name);
    517   1.4      yamt #if defined(DIAGNOSTIC)
    518   1.4      yamt 	if (tb == NULL) {
    519   1.4      yamt 		mutex_exit(&tprof_startstop_lock);
    520   1.4      yamt 		panic("%s: not found '%s'", __func__, name);
    521   1.4      yamt 	}
    522   1.4      yamt #endif /* defined(DIAGNOSTIC) */
    523   1.4      yamt 	if (tb->tb_usecount > 0) {
    524   1.4      yamt 		mutex_exit(&tprof_startstop_lock);
    525   1.4      yamt 		return EBUSY;
    526   1.4      yamt 	}
    527   1.4      yamt #if 1 /* XXX for now */
    528   1.4      yamt 	if (tprof_backend == tb) {
    529   1.4      yamt 		tprof_backend = NULL;
    530   1.4      yamt 	}
    531   1.4      yamt #endif
    532   1.4      yamt 	LIST_REMOVE(tb, tb_list);
    533   1.4      yamt 	mutex_exit(&tprof_startstop_lock);
    534   1.4      yamt 
    535   1.4      yamt 	kmem_free(tb, sizeof(*tb));
    536   1.4      yamt 
    537   1.4      yamt 	return 0;
    538   1.4      yamt }
    539   1.4      yamt 
    540   1.1      yamt /* -------------------- cdevsw interfaces */
    541   1.1      yamt 
    542   1.1      yamt static int
    543   1.1      yamt tprof_open(dev_t dev, int flags, int type, struct lwp *l)
    544   1.1      yamt {
    545   1.1      yamt 
    546   1.1      yamt 	if (minor(dev) != 0) {
    547   1.1      yamt 		return EXDEV;
    548   1.1      yamt 	}
    549   1.1      yamt 	mutex_enter(&tprof_lock);
    550   1.1      yamt 	if (tprof_owner != NULL) {
    551   1.1      yamt 		mutex_exit(&tprof_lock);
    552   1.1      yamt 		return  EBUSY;
    553   1.1      yamt 	}
    554   1.1      yamt 	tprof_owner = curlwp;
    555   1.1      yamt 	mutex_exit(&tprof_lock);
    556   1.1      yamt 
    557   1.1      yamt 	return 0;
    558   1.1      yamt }
    559   1.1      yamt 
    560   1.1      yamt static int
    561   1.1      yamt tprof_close(dev_t dev, int flags, int type, struct lwp *l)
    562   1.1      yamt {
    563   1.1      yamt 
    564   1.1      yamt 	KASSERT(minor(dev) == 0);
    565   1.1      yamt 
    566   1.1      yamt 	mutex_enter(&tprof_startstop_lock);
    567   1.1      yamt 	mutex_enter(&tprof_lock);
    568   1.1      yamt 	tprof_owner = NULL;
    569   1.1      yamt 	mutex_exit(&tprof_lock);
    570   1.1      yamt 	tprof_stop();
    571   1.1      yamt 	tprof_clear();
    572   1.1      yamt 	mutex_exit(&tprof_startstop_lock);
    573   1.1      yamt 
    574   1.1      yamt 	return 0;
    575   1.1      yamt }
    576   1.1      yamt 
    577   1.1      yamt static int
    578   1.1      yamt tprof_read(dev_t dev, struct uio *uio, int flags)
    579   1.1      yamt {
    580   1.1      yamt 	tprof_buf_t *buf;
    581   1.1      yamt 	size_t bytes;
    582   1.1      yamt 	size_t resid;
    583   1.1      yamt 	size_t done;
    584   1.1      yamt 	int error = 0;
    585   1.1      yamt 
    586   1.1      yamt 	KASSERT(minor(dev) == 0);
    587   1.1      yamt 	mutex_enter(&tprof_reader_lock);
    588   1.1      yamt 	while (uio->uio_resid > 0 && error == 0) {
    589   1.1      yamt 		/*
    590   1.1      yamt 		 * take the first buffer from the list.
    591   1.1      yamt 		 */
    592   1.1      yamt 		mutex_enter(&tprof_lock);
    593   1.1      yamt 		buf = STAILQ_FIRST(&tprof_list);
    594   1.1      yamt 		if (buf == NULL) {
    595   1.1      yamt 			if (tprof_nworker == 0) {
    596   1.1      yamt 				mutex_exit(&tprof_lock);
    597   1.1      yamt 				error = 0;
    598   1.1      yamt 				break;
    599   1.1      yamt 			}
    600   1.1      yamt 			mutex_exit(&tprof_reader_lock);
    601   1.1      yamt 			error = cv_wait_sig(&tprof_reader_cv, &tprof_lock);
    602   1.1      yamt 			mutex_exit(&tprof_lock);
    603   1.1      yamt 			mutex_enter(&tprof_reader_lock);
    604   1.1      yamt 			continue;
    605   1.1      yamt 		}
    606   1.1      yamt 		STAILQ_REMOVE_HEAD(&tprof_list, b_list);
    607   1.1      yamt 		KASSERT(tprof_nbuf_on_list > 0);
    608   1.1      yamt 		tprof_nbuf_on_list--;
    609   1.1      yamt 		mutex_exit(&tprof_lock);
    610   1.1      yamt 
    611   1.1      yamt 		/*
    612   1.1      yamt 		 * copy it out.
    613   1.1      yamt 		 */
    614   1.1      yamt 		bytes = MIN(buf->b_used * sizeof(tprof_sample_t) -
    615   1.1      yamt 		    tprof_reader_offset, uio->uio_resid);
    616   1.1      yamt 		resid = uio->uio_resid;
    617   1.1      yamt 		error = uiomove((char *)buf->b_data + tprof_reader_offset,
    618   1.1      yamt 		    bytes, uio);
    619   1.1      yamt 		done = resid - uio->uio_resid;
    620   1.1      yamt 		tprof_reader_offset += done;
    621   1.1      yamt 
    622   1.1      yamt 		/*
    623   1.1      yamt 		 * if we didn't consume the whole buffer,
    624   1.1      yamt 		 * put it back to the list.
    625   1.1      yamt 		 */
    626   1.1      yamt 		if (tprof_reader_offset <
    627   1.1      yamt 		    buf->b_used * sizeof(tprof_sample_t)) {
    628   1.1      yamt 			mutex_enter(&tprof_lock);
    629   1.1      yamt 			STAILQ_INSERT_HEAD(&tprof_list, buf, b_list);
    630   1.1      yamt 			tprof_nbuf_on_list++;
    631   1.1      yamt 			cv_broadcast(&tprof_reader_cv);
    632   1.1      yamt 			mutex_exit(&tprof_lock);
    633   1.1      yamt 		} else {
    634   1.1      yamt 			tprof_buf_free(buf);
    635   1.1      yamt 			tprof_reader_offset = 0;
    636   1.1      yamt 		}
    637   1.1      yamt 	}
    638   1.1      yamt 	mutex_exit(&tprof_reader_lock);
    639   1.1      yamt 
    640   1.1      yamt 	return error;
    641   1.1      yamt }
    642   1.1      yamt 
    643   1.1      yamt static int
    644   1.1      yamt tprof_ioctl(dev_t dev, u_long cmd, void *data, int flags, struct lwp *l)
    645   1.1      yamt {
    646  1.14      maxv 	const tprof_param_t *param;
    647   1.1      yamt 	int error = 0;
    648   1.1      yamt 
    649   1.1      yamt 	KASSERT(minor(dev) == 0);
    650   1.1      yamt 
    651   1.1      yamt 	switch (cmd) {
    652  1.14      maxv 	case TPROF_IOC_GETINFO:
    653  1.14      maxv 		mutex_enter(&tprof_startstop_lock);
    654  1.14      maxv 		tprof_getinfo(data);
    655  1.14      maxv 		mutex_exit(&tprof_startstop_lock);
    656   1.1      yamt 		break;
    657   1.1      yamt 	case TPROF_IOC_START:
    658   1.1      yamt 		param = data;
    659   1.1      yamt 		mutex_enter(&tprof_startstop_lock);
    660   1.1      yamt 		error = tprof_start(param);
    661   1.1      yamt 		mutex_exit(&tprof_startstop_lock);
    662   1.1      yamt 		break;
    663   1.1      yamt 	case TPROF_IOC_STOP:
    664   1.1      yamt 		mutex_enter(&tprof_startstop_lock);
    665   1.1      yamt 		tprof_stop();
    666   1.1      yamt 		mutex_exit(&tprof_startstop_lock);
    667   1.1      yamt 		break;
    668   1.1      yamt 	case TPROF_IOC_GETSTAT:
    669   1.1      yamt 		mutex_enter(&tprof_lock);
    670   1.1      yamt 		memcpy(data, &tprof_stat, sizeof(tprof_stat));
    671   1.1      yamt 		mutex_exit(&tprof_lock);
    672   1.1      yamt 		break;
    673   1.1      yamt 	default:
    674   1.1      yamt 		error = EINVAL;
    675   1.1      yamt 		break;
    676   1.1      yamt 	}
    677   1.1      yamt 
    678   1.1      yamt 	return error;
    679   1.1      yamt }
    680   1.1      yamt 
    681   1.1      yamt const struct cdevsw tprof_cdevsw = {
    682   1.1      yamt 	.d_open = tprof_open,
    683   1.1      yamt 	.d_close = tprof_close,
    684   1.1      yamt 	.d_read = tprof_read,
    685   1.1      yamt 	.d_write = nowrite,
    686   1.1      yamt 	.d_ioctl = tprof_ioctl,
    687   1.1      yamt 	.d_stop = nostop,
    688   1.1      yamt 	.d_tty = notty,
    689   1.1      yamt 	.d_poll = nopoll,
    690   1.1      yamt 	.d_mmap = nommap,
    691   1.1      yamt 	.d_kqfilter = nokqfilter,
    692  1.12  dholland 	.d_discard = nodiscard,
    693  1.11  dholland 	.d_flag = D_OTHER | D_MPSAFE
    694   1.1      yamt };
    695   1.1      yamt 
/*
 * tprofattach: pseudo-device attach hook.  Intentionally empty; all
 * setup happens in tprof_modcmd().
 */
void
tprofattach(int nunits)
{

	/* nothing */
}

/* Driver-class module "tprof"; no required modules are listed. */
MODULE(MODULE_CLASS_DRIVER, tprof, NULL);
    704   1.4      yamt 
    705   1.4      yamt static void
    706  1.15  riastrad tprof_cpu_init(void *vcp, void *vcookie, struct cpu_info *ci)
    707  1.15  riastrad {
    708  1.15  riastrad 	tprof_cpu_t **cp = vcp, *c;
    709  1.15  riastrad 
    710  1.15  riastrad 	c = kmem_zalloc(sizeof(*c), KM_SLEEP);
    711  1.15  riastrad 	c->c_buf = NULL;
    712  1.15  riastrad 	c->c_cpuid = cpu_index(ci);
    713  1.15  riastrad 	*cp = c;
    714  1.15  riastrad }
    715  1.15  riastrad 
    716  1.15  riastrad static void
    717  1.15  riastrad tprof_cpu_fini(void *vcp, void *vcookie, struct cpu_info *ci)
    718  1.15  riastrad {
    719  1.15  riastrad 	tprof_cpu_t **cp = vcp, *c;
    720  1.15  riastrad 
    721  1.15  riastrad 	c = *cp;
    722  1.15  riastrad 	KASSERT(c->c_cpuid == cpu_index(ci));
    723  1.15  riastrad 	KASSERT(c->c_buf == NULL);
    724  1.15  riastrad 	kmem_free(c, sizeof(*c));
    725  1.15  riastrad 	*cp = NULL;
    726  1.15  riastrad }
    727  1.15  riastrad 
    728  1.15  riastrad static void
    729   1.4      yamt tprof_driver_init(void)
    730   1.4      yamt {
    731   1.4      yamt 
    732   1.1      yamt 	mutex_init(&tprof_lock, MUTEX_DEFAULT, IPL_NONE);
    733   1.1      yamt 	mutex_init(&tprof_reader_lock, MUTEX_DEFAULT, IPL_NONE);
    734   1.1      yamt 	mutex_init(&tprof_startstop_lock, MUTEX_DEFAULT, IPL_NONE);
    735   1.1      yamt 	cv_init(&tprof_cv, "tprof");
    736   1.7  pgoyette 	cv_init(&tprof_reader_cv, "tprof_rd");
    737   1.1      yamt 	STAILQ_INIT(&tprof_list);
    738  1.15  riastrad 	tprof_cpus = percpu_create(sizeof(tprof_cpu_t *),
    739  1.15  riastrad 	    tprof_cpu_init, tprof_cpu_fini, NULL);
    740   1.1      yamt }
    741   1.4      yamt 
    742   1.4      yamt static void
    743   1.4      yamt tprof_driver_fini(void)
    744   1.4      yamt {
    745   1.4      yamt 
    746  1.15  riastrad 	percpu_free(tprof_cpus, sizeof(tprof_cpu_t *));
    747   1.4      yamt 	mutex_destroy(&tprof_lock);
    748   1.4      yamt 	mutex_destroy(&tprof_reader_lock);
    749   1.4      yamt 	mutex_destroy(&tprof_startstop_lock);
    750   1.4      yamt 	cv_destroy(&tprof_cv);
    751   1.4      yamt 	cv_destroy(&tprof_reader_cv);
    752   1.4      yamt }
    753   1.4      yamt 
    754   1.4      yamt static int
    755   1.4      yamt tprof_modcmd(modcmd_t cmd, void *arg)
    756   1.4      yamt {
    757   1.4      yamt 
    758   1.4      yamt 	switch (cmd) {
    759   1.4      yamt 	case MODULE_CMD_INIT:
    760   1.4      yamt 		tprof_driver_init();
    761   1.4      yamt #if defined(_MODULE)
    762   1.4      yamt 		{
    763   1.4      yamt 			devmajor_t bmajor = NODEVMAJOR;
    764   1.4      yamt 			devmajor_t cmajor = NODEVMAJOR;
    765   1.4      yamt 			int error;
    766   1.4      yamt 
    767   1.4      yamt 			error = devsw_attach("tprof", NULL, &bmajor,
    768   1.4      yamt 			    &tprof_cdevsw, &cmajor);
    769   1.4      yamt 			if (error) {
    770   1.4      yamt 				tprof_driver_fini();
    771   1.4      yamt 				return error;
    772   1.4      yamt 			}
    773   1.4      yamt 		}
    774   1.4      yamt #endif /* defined(_MODULE) */
    775   1.4      yamt 		return 0;
    776   1.4      yamt 
    777   1.4      yamt 	case MODULE_CMD_FINI:
    778   1.4      yamt #if defined(_MODULE)
    779  1.17  riastrad 		devsw_detach(NULL, &tprof_cdevsw);
    780   1.4      yamt #endif /* defined(_MODULE) */
    781   1.4      yamt 		tprof_driver_fini();
    782   1.4      yamt 		return 0;
    783   1.4      yamt 
    784   1.4      yamt 	default:
    785   1.4      yamt 		return ENOTTY;
    786   1.4      yamt 	}
    787   1.4      yamt }
    788