Home | History | Annotate | Line # | Download | only in kern
kern_ksyms.c revision 1.28
      1 /*
      2  * Copyright (c) 2001, 2003 Anders Magnusson (ragge (at) ludd.luth.se).
      3  * All rights reserved.
      4  *
      5  * Redistribution and use in source and binary forms, with or without
      6  * modification, are permitted provided that the following conditions
      7  * are met:
      8  * 1. Redistributions of source code must retain the above copyright
      9  *    notice, this list of conditions and the following disclaimer.
     10  * 2. Redistributions in binary form must reproduce the above copyright
     11  *    notice, this list of conditions and the following disclaimer in the
     12  *    documentation and/or other materials provided with the distribution.
     13  * 3. The name of the author may not be used to endorse or promote products
     14  *    derived from this software without specific prior written permission
     15  *
     16  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
     17  * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
     18  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
     19  * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
     20  * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
     21  * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
     22  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
     23  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
     24  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
     25  * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
     26  */
     27 
     28 /*
     29  * Code to deal with in-kernel symbol table management + /dev/ksyms.
     30  *
     31  * For each loaded module the symbol table info is kept track of by a
     32  * struct, placed in a circular list. The first entry is the kernel
     33  * symbol table.
     34  */
     35 
     36 /*
     37  * TODO:
     38  *	Change the ugly way of adding new symbols (comes with linker)
     39  *	Add kernel locking stuff.
     40  *	(Ev) add support for poll.
     41  *	(Ev) fix support for mmap.
     42  *
     43  *	Export ksyms internal logic for use in post-mortem debuggers?
     44  *	  Need to move struct symtab to ksyms.h for that.
     45  */
     46 
     47 #include <sys/cdefs.h>
     48 __KERNEL_RCSID(0, "$NetBSD: kern_ksyms.c,v 1.28 2006/10/12 01:32:15 christos Exp $");
     49 
     50 #ifdef _KERNEL
     51 #include "opt_ddb.h"
     52 #include "opt_ddbparam.h"	/* for SYMTAB_SPACE */
     53 #endif
     54 
     55 #include <sys/param.h>
     56 #include <sys/errno.h>
     57 #include <sys/queue.h>
     58 #include <sys/exec.h>
     59 #include <sys/systm.h>
     60 #include <sys/conf.h>
     61 #include <sys/device.h>
     62 #include <sys/malloc.h>
     63 #include <sys/proc.h>
     64 
     65 #include <machine/elf_machdep.h> /* XXX */
     66 #define ELFSIZE ARCH_ELFSIZE
     67 
     68 #include <sys/exec_elf.h>
     69 #include <sys/ksyms.h>
     70 
     71 #include <lib/libkern/libkern.h>
     72 
     73 #ifdef DDB
     74 #include <ddb/db_output.h>
     75 #endif
     76 
     77 #include "ksyms.h"
     78 
     79 static int ksymsinited = 0;
     80 
     81 #if NKSYMS
     82 static void ksyms_hdr_init(caddr_t hdraddr);
     83 static void ksyms_sizes_calc(void);
     84 static int ksyms_isopen;
     85 static int ksyms_maxlen;
     86 #endif
     87 
     88 #ifdef KSYMS_DEBUG
     89 #define	FOLLOW_CALLS		1
     90 #define	FOLLOW_MORE_CALLS	2
     91 #define	FOLLOW_DEVKSYMS		4
     92 static int ksyms_debug;
     93 #endif
     94 
     95 #ifdef SYMTAB_SPACE
     96 #define		SYMTAB_FILLER	"|This is the symbol table!"
     97 
     98 char		db_symtab[SYMTAB_SPACE] = SYMTAB_FILLER;
     99 int		db_symtabsize = SYMTAB_SPACE;
    100 #endif
    101 
    102 /*
    103  * Store the different symbol tables in a double-linked list.
    104  */
    105 struct symtab {
    106 	CIRCLEQ_ENTRY(symtab) sd_queue;
    107 	const char *sd_name;	/* Name of this table */
    108 	Elf_Sym *sd_symstart;	/* Address of symbol table */
    109 	caddr_t sd_strstart;	/* Adderss of corresponding string table */
    110 	int sd_usroffset;	/* Real address for userspace */
    111 	int sd_symsize;		/* Size in bytes of symbol table */
    112 	int sd_strsize;		/* Size of string table */
    113 	int *sd_symnmoff;	/* Used when calculating the name offset */
    114 };
    115 
    116 static CIRCLEQ_HEAD(, symtab) symtab_queue =
    117     CIRCLEQ_HEAD_INITIALIZER(symtab_queue);
    118 
    119 static struct symtab kernel_symtab;
    120 
    121 #define	USE_PTREE
    122 #ifdef USE_PTREE
    123 /*
    124  * Patricia-tree-based lookup structure for the in-kernel global symbols.
    125  * Based on a design by Mikael Sundstrom, msm (at) sm.luth.se.
    126  */
    127 struct ptree {
    128 	int16_t bitno;
    129 	int16_t lr[2];
    130 } *symb;
    131 static int16_t baseidx;
    132 static int treex = 1;
    133 
    134 #define	P_BIT(key, bit) ((key[bit >> 3] >> (bit & 7)) & 1)
    135 #define	STRING(idx) kernel_symtab.sd_symstart[idx].st_name + \
    136 			kernel_symtab.sd_strstart
    137 
    138 /*
    139  * Walk down the tree until a terminal node is found.
    140  */
    141 static int
    142 symbol_traverse(const char *key)
    143 {
    144 	int16_t nb, rbit = baseidx;
    145 
    146 	while (rbit > 0) {
    147 		nb = symb[rbit].bitno;
    148 		rbit = symb[rbit].lr[P_BIT(key, nb)];
    149 	}
    150 	return -rbit;
    151 }
    152 
    153 static int
    154 ptree_add(char *key, int val)
    155 {
    156 	int idx;
    157 	int nix, cix, bit, rbit, sb, lastrbit, svbit = 0, ix;
    158 	char *m, *k;
    159 
    160 	if (baseidx == 0) {
    161 		baseidx = -val;
    162 		return 0; /* First element */
    163 	}
    164 
    165 	/* Get string to match against */
    166 	idx = symbol_traverse(key);
    167 
    168 	/* Find first mismatching bit */
    169 	m = STRING(idx);
    170 	k = key;
    171 	if (strcmp(m, k) == 0)
    172 		return 1;
    173 
    174 	for (cix = 0; *m && *k && *m == *k; m++, k++, cix += 8)
    175 		;
    176 	ix = ffs((int)*m ^ (int)*k) - 1;
    177 	cix += ix;
    178 
    179 	/* Create new node */
    180 	nix = treex++;
    181 	bit = P_BIT(key, cix);
    182 	symb[nix].bitno = cix;
    183 	symb[nix].lr[bit] = -val;
    184 
    185 	/* Find where to insert node */
    186 	rbit = baseidx;
    187 	lastrbit = 0;
    188 	for (;;) {
    189 		if (rbit < 0)
    190 			break;
    191 		sb = symb[rbit].bitno;
    192 		if (sb > cix)
    193 			break;
    194 		if (sb == cix)
    195 			printf("symb[rbit].bitno == cix!!!\n");
    196 		lastrbit = rbit;
    197 		svbit = P_BIT(key, sb);
    198 		rbit = symb[rbit].lr[svbit];
    199 	}
    200 
    201 	/* Do the actual insertion */
    202 	if (lastrbit == 0) {
    203 		/* first element */
    204 		symb[nix].lr[!bit] = baseidx;
    205 		baseidx = nix;
    206 	} else {
    207 		symb[nix].lr[!bit] = rbit;
    208 		symb[lastrbit].lr[svbit] = nix;
    209 	}
    210 	return 0;
    211 }
    212 
    213 static int
    214 ptree_find(const char *key)
    215 {
    216 	int idx;
    217 
    218 	if (baseidx == 0)
    219 		return 0;
    220 	idx = symbol_traverse(key);
    221 
    222 	if (strcmp(key, STRING(idx)) == 0)
    223 		return idx;
    224 	return 0;
    225 }
    226 
    227 static void
    228 ptree_gen(char *off, struct symtab *tab)
    229 {
    230 	Elf_Sym *sym;
    231 	int i, nsym;
    232 
    233 	if (off != NULL)
    234 		symb = (struct ptree *)ALIGN(off);
    235 	else
    236 		symb = malloc((tab->sd_symsize/sizeof(Elf_Sym)) *
    237 		    sizeof(struct ptree), M_DEVBUF, M_WAITOK);
    238 	symb--; /* sym index won't be 0 */
    239 
    240 	sym = tab->sd_symstart;
    241 	if ((nsym = tab->sd_symsize/sizeof(Elf_Sym)) > INT16_MAX) {
    242 		printf("Too many symbols for tree, skipping %d symbols\n",
    243 		    nsym-INT16_MAX);
    244 		nsym = INT16_MAX;
    245 	}
    246 	for (i = 1; i < nsym; i++) {
    247 		if (ELF_ST_BIND(sym[i].st_info) != STB_GLOBAL)
    248 			continue;
    249 		ptree_add(tab->sd_strstart+sym[i].st_name, i);
    250 	}
    251 }
    252 #endif /* USE_PTREE */
    253 
    254 /*
    255  * Finds a certain symbol name in a certain symbol table.
    256  */
    257 static Elf_Sym *
    258 findsym(const char *name, struct symtab *table)
    259 {
    260 	Elf_Sym *start = table->sd_symstart;
    261 	int i, sz = table->sd_symsize/sizeof(Elf_Sym);
    262 	char *np;
    263 	caddr_t realstart = table->sd_strstart - table->sd_usroffset;
    264 
    265 #ifdef USE_PTREE
    266 	if (table == &kernel_symtab && (i = ptree_find(name)) != 0)
    267 		return &start[i];
    268 #endif
    269 
    270 	for (i = 0; i < sz; i++) {
    271 		np = realstart + start[i].st_name;
    272 		if (name[0] == np[0] && name[1] == np[1] &&
    273 		    strcmp(name, np) == 0)
    274 			return &start[i];
    275 	}
    276 	return NULL;
    277 }
    278 
    279 /*
    280  * The "attach" is in reality done in ksyms_init().
    281  */
    282 void ksymsattach(int);
    283 void
    284 ksymsattach(int arg __unused)
    285 {
    286 
    287 #ifdef USE_PTREE
    288 	if (baseidx == 0)
    289 		ptree_gen(0, &kernel_symtab);
    290 #endif
    291 
    292 }
    293 
    294 /*
    295  * Add a symbol table named name.
    296  * This is intended for use when the kernel loader enters the table.
    297  */
    298 static void
    299 addsymtab(const char *name, Elf_Ehdr *ehdr, struct symtab *tab)
    300 {
    301 	caddr_t start = (caddr_t)ehdr;
    302 	caddr_t send;
    303 	Elf_Shdr *shdr;
    304 	Elf_Sym *sym, *nsym;
    305 	int i, j, n, g;
    306 	char *str;
    307 
    308 	/* Find the symbol table and the corresponding string table. */
    309 	shdr = (Elf_Shdr *)(start + ehdr->e_shoff);
    310 	for (i = 1; i < ehdr->e_shnum; i++) {
    311 		if (shdr[i].sh_type != SHT_SYMTAB)
    312 			continue;
    313 		if (shdr[i].sh_offset == 0)
    314 			continue;
    315 		tab->sd_symstart = (Elf_Sym *)(start + shdr[i].sh_offset);
    316 		tab->sd_symsize = shdr[i].sh_size;
    317 		j = shdr[i].sh_link;
    318 		if (shdr[j].sh_offset == 0)
    319 			continue; /* Can this happen? */
    320 		tab->sd_strstart = start + shdr[j].sh_offset;
    321 		tab->sd_strsize = shdr[j].sh_size;
    322 		break;
    323 	}
    324 	tab->sd_name = name;
    325 	send = tab->sd_strstart + tab->sd_strsize;
    326 
    327 #ifdef KSYMS_DEBUG
    328 	printf("start %p sym %p symsz %d str %p strsz %d send %p\n",
    329 	    start, tab->sd_symstart, tab->sd_symsize,
    330 	    tab->sd_strstart, tab->sd_strsize, send);
    331 #endif
    332 
    333 	/*
    334 	 * Pack symbol table by removing all file name references
    335 	 * and overwrite the elf header.
    336 	 */
    337 	sym = tab->sd_symstart;
    338 	nsym = (Elf_Sym *)start;
    339 	str = tab->sd_strstart;
    340 	for (g = i = n = 0; i < tab->sd_symsize/sizeof(Elf_Sym); i++) {
    341 		if (i == 0) {
    342 			nsym[n++] = sym[i];
    343 			continue;
    344 		}
    345 		/*
    346 		 * Remove useless symbols.
    347 		 * Should actually remove all typeless symbols.
    348 		 */
    349 		if (sym[i].st_name == 0)
    350 			continue; /* Skip nameless entries */
    351 		if (ELF_ST_TYPE(sym[i].st_info) == STT_FILE)
    352 			continue; /* Skip filenames */
    353 		if (ELF_ST_TYPE(sym[i].st_info) == STT_NOTYPE &&
    354 		    sym[i].st_value == 0 &&
    355 		    strcmp(str + sym[i].st_name, "*ABS*") == 0)
    356 			continue; /* XXX */
    357 		if (ELF_ST_TYPE(sym[i].st_info) == STT_NOTYPE &&
    358 		    strcmp(str + sym[i].st_name, "gcc2_compiled.") == 0)
    359 			continue; /* XXX */
    360 
    361 #ifndef DDB
    362 		/* Only need global symbols */
    363 		if (ELF_ST_BIND(sym[i].st_info) != STB_GLOBAL)
    364 			continue;
    365 #endif
    366 
    367 		/* Save symbol. Set it as an absolute offset */
    368 		nsym[n] = sym[i];
    369 		nsym[n].st_shndx = SHN_ABS;
    370 		if (ELF_ST_BIND(nsym[n].st_info) == STB_GLOBAL)
    371 			g++;
    372 #if NKSYMS
    373 		j = strlen(nsym[n].st_name + tab->sd_strstart) + 1;
    374 		if (j > ksyms_maxlen)
    375 			ksyms_maxlen = j;
    376 #endif
    377 		n++;
    378 
    379 	}
    380 	tab->sd_symstart = nsym;
    381 	tab->sd_symsize = n * sizeof(Elf_Sym);
    382 
    383 #ifdef notyet
    384 	/*
    385 	 * Remove left-over strings.
    386 	 */
    387 	sym = tab->sd_symstart;
    388 	str = (caddr_t)tab->sd_symstart + tab->sd_symsize;
    389 	str[0] = 0;
    390 	n = 1;
    391 	for (i = 1; i < tab->sd_symsize/sizeof(Elf_Sym); i++) {
    392 		strcpy(str + n, tab->sd_strstart + sym[i].st_name);
    393 		sym[i].st_name = n;
    394 		n += strlen(str+n) + 1;
    395 	}
    396 	tab->sd_strstart = str;
    397 	tab->sd_strsize = n;
    398 
    399 #ifdef KSYMS_DEBUG
    400 	printf("str %p strsz %d send %p\n", str, n, send);
    401 #endif
    402 #endif
    403 
    404 	CIRCLEQ_INSERT_HEAD(&symtab_queue, tab, sd_queue);
    405 
    406 #ifdef notyet
    407 #ifdef USE_PTREE
    408 	/* Try to use the freed space, if possible */
    409 	if (send - str - n > g * sizeof(struct ptree))
    410 		ptree_gen(str + n, tab);
    411 #endif
    412 #endif
    413 }
    414 
    415 /*
    416  * Setup the kernel symbol table stuff.
    417  */
    418 void
    419 ksyms_init(int symsize, void *start, void *end __unused)
    420 {
    421 	Elf_Ehdr *ehdr;
    422 
    423 #ifdef SYMTAB_SPACE
    424 	if (symsize <= 0 &&
    425 	    strncmp(db_symtab, SYMTAB_FILLER, sizeof(SYMTAB_FILLER))) {
    426 		symsize = db_symtabsize;
    427 		start = db_symtab;
    428 		end = db_symtab + db_symtabsize;
    429 	}
    430 #endif
    431 	if (symsize <= 0) {
    432 		printf("[ Kernel symbol table missing! ]\n");
    433 		return;
    434 	}
    435 
    436 	/* Sanity check */
    437 	if (ALIGNED_POINTER(start, long) == 0) {
    438 		printf("[ Kernel symbol table has bad start address %p ]\n",
    439 		    start);
    440 		return;
    441 	}
    442 
    443 	ehdr = (Elf_Ehdr *)start;
    444 
    445 	/* check if this is a valid ELF header */
    446 	/* No reason to verify arch type, the kernel is actually running! */
    447 	if (memcmp(ehdr->e_ident, ELFMAG, SELFMAG) ||
    448 	    ehdr->e_ident[EI_CLASS] != ELFCLASS ||
    449 	    ehdr->e_version > 1) {
    450 #ifdef notyet /* DDB */
    451 		if (ddb_init(symsize, start, end))
    452 			return; /* old-style symbol table */
    453 #endif
    454 		printf("[ Kernel symbol table invalid! ]\n");
    455 		return; /* nothing to do */
    456 	}
    457 
    458 #if NKSYMS
    459 	/* Loaded header will be scratched in addsymtab */
    460 	ksyms_hdr_init(start);
    461 #endif
    462 
    463 	addsymtab("netbsd", ehdr, &kernel_symtab);
    464 
    465 #if NKSYMS
    466 	ksyms_sizes_calc();
    467 #endif
    468 
    469 	ksymsinited = 1;
    470 
    471 #ifdef DEBUG
    472 	printf("Loaded initial symtab at %p, strtab at %p, # entries %ld\n",
    473 	    kernel_symtab.sd_symstart, kernel_symtab.sd_strstart,
    474 	    (long)kernel_symtab.sd_symsize/sizeof(Elf_Sym));
    475 #endif
    476 }
    477 
    478 /*
    479  * Get the value associated with a symbol.
    480  * "mod" is the module name, or null if any module.
    481  * "sym" is the symbol name.
    482  * "val" is a pointer to the corresponding value, if call succeeded.
    483  * Returns 0 if success or ENOENT if no such entry.
    484  */
    485 int
    486 ksyms_getval(const char *mod, const char *sym, unsigned long *val, int type)
    487 {
    488 	struct symtab *st;
    489 	Elf_Sym *es;
    490 
    491 	if (ksymsinited == 0)
    492 		return ENOENT;
    493 
    494 #ifdef KSYMS_DEBUG
    495 	if (ksyms_debug & FOLLOW_CALLS)
    496 		printf("ksyms_getval: mod %s sym %s valp %p\n", mod, sym, val);
    497 #endif
    498 
    499 	CIRCLEQ_FOREACH(st, &symtab_queue, sd_queue) {
    500 		if (mod && strcmp(st->sd_name, mod))
    501 			continue;
    502 		if ((es = findsym(sym, st)) == NULL)
    503 			continue;
    504 
    505 		/* Skip if bad binding */
    506 		if (type == KSYMS_EXTERN &&
    507 		    ELF_ST_BIND(es->st_info) != STB_GLOBAL)
    508 			continue;
    509 
    510 		if (val)
    511 			*val = es->st_value;
    512 		return 0;
    513 	}
    514 	return ENOENT;
    515 }
    516 
    517 /*
    518  * Get "mod" and "symbol" associated with an address.
    519  * Returns 0 if success or ENOENT if no such entry.
    520  */
    521 int
    522 ksyms_getname(const char **mod, const char **sym, vaddr_t v, int f)
    523 {
    524 	struct symtab *st;
    525 	Elf_Sym *les, *es = NULL;
    526 	vaddr_t laddr = 0;
    527 	const char *lmod = NULL;
    528 	char *stable = NULL;
    529 	int type, i, sz;
    530 
    531 	if (ksymsinited == 0)
    532 		return ENOENT;
    533 
    534 	CIRCLEQ_FOREACH(st, &symtab_queue, sd_queue) {
    535 		sz = st->sd_symsize/sizeof(Elf_Sym);
    536 		for (i = 0; i < sz; i++) {
    537 			les = st->sd_symstart + i;
    538 			type = ELF_ST_TYPE(les->st_info);
    539 
    540 			if ((f & KSYMS_PROC) && (type != STT_FUNC))
    541 				continue;
    542 
    543 			if (type == STT_NOTYPE)
    544 				continue;
    545 
    546 			if (((f & KSYMS_ANY) == 0) &&
    547 			    (type != STT_FUNC) && (type != STT_OBJECT))
    548 				continue;
    549 
    550 			if ((les->st_value <= v) && (les->st_value > laddr)) {
    551 				laddr = les->st_value;
    552 				es = les;
    553 				lmod = st->sd_name;
    554 				stable = st->sd_strstart - st->sd_usroffset;
    555 			}
    556 		}
    557 	}
    558 	if (es == NULL)
    559 		return ENOENT;
    560 	if ((f & KSYMS_EXACT) && (v != es->st_value))
    561 		return ENOENT;
    562 	if (mod)
    563 		*mod = lmod;
    564 	if (sym)
    565 		*sym = stable + es->st_name;
    566 	return 0;
    567 }
    568 
    569 #if NKSYMS
    570 static int symsz, strsz;
    571 
    572 /*
    573  * In case we exposing the symbol table to the userland using the pseudo-
    574  * device /dev/ksyms, it is easier to provide all the tables as one.
    575  * However, it means we have to change all the st_name fields for the
    576  * symbols so they match the ELF image that the userland will read
    577  * through the device.
    578  *
    579  * The actual (correct) value of st_name is preserved through a global
    580  * offset stored in the symbol table structure.
    581  */
    582 
    583 static void
    584 ksyms_sizes_calc(void)
    585 {
    586         struct symtab *st;
    587 	int i;
    588 
    589         symsz = strsz = 0;
    590         CIRCLEQ_FOREACH(st, &symtab_queue, sd_queue) {
    591 		if (st != &kernel_symtab) {
    592 			for (i = 0; i < st->sd_symsize/sizeof(Elf_Sym); i++)
    593 				st->sd_symstart[i].st_name =
    594 				    strsz + st->sd_symnmoff[i];
    595 			st->sd_usroffset = strsz;
    596 		}
    597                 symsz += st->sd_symsize;
    598                 strsz += st->sd_strsize;
    599         }
    600 }
    601 #endif /* NKSYMS */
    602 
    603 /*
    604  * Temporary work structure for dynamic loaded symbol tables.
    605  * Will go away when in-kernel linker is in place.
    606  */
    607 
    608 struct syminfo {
    609 	size_t cursyms;
    610 	size_t curnamep;
    611 	size_t maxsyms;
    612 	size_t maxnamep;
    613 	Elf_Sym *syms;
    614 	int *symnmoff;
    615 	char *symnames;
    616 };
    617 
    618 
    619 /*
    620  * Add a symbol to the temporary save area for symbols.
    621  * This routine will go away when the in-kernel linker is in place.
    622  */
    623 static void
    624 addsym(struct syminfo *info, const Elf_Sym *sym, const char *name,
    625        const char *mod)
    626 {
    627 	int len, mlen;
    628 
    629 #ifdef KSYMS_DEBUG
    630 	if (ksyms_debug & FOLLOW_MORE_CALLS)
    631 		printf("addsym: name %s val %lx\n", name, (long)sym->st_value);
    632 #endif
    633 	len = strlen(name) + 1;
    634 	if (mod)
    635 		mlen = 1 + strlen(mod);
    636 	else
    637 		mlen = 0;
    638 	if (info->cursyms == info->maxsyms ||
    639 	    (len + mlen + info->curnamep) > info->maxnamep) {
    640 		printf("addsym: too many symbols, skipping '%s'\n", name);
    641 		return;
    642 	}
    643 	strlcpy(&info->symnames[info->curnamep], name,
    644 	    info->maxnamep - info->curnamep);
    645 	if (mlen) {
    646 		info->symnames[info->curnamep + len - 1] = '.';
    647 		strlcpy(&info->symnames[info->curnamep + len], mod,
    648 		    info->maxnamep - (info->curnamep + len));
    649 		len += mlen;
    650 	}
    651 	info->syms[info->cursyms] = *sym;
    652 	info->syms[info->cursyms].st_name = info->curnamep;
    653 	info->symnmoff[info->cursyms] = info->curnamep;
    654 	info->curnamep += len;
    655 #if NKSYMS
    656 	if (len > ksyms_maxlen)
    657 		ksyms_maxlen = len;
    658 #endif
    659 	info->cursyms++;
    660 }
    661 /*
    662  * Adds a symbol table.
    663  * "name" is the module name, "start" and "size" is where the symbol table
    664  * is located, and "type" is in which binary format the symbol table is.
    665  * New memory for keeping the symbol table is allocated in this function.
    666  * Returns 0 if success and EEXIST if the module name is in use.
    667  */
    668 static int
    669 specialsym(const char *symname)
    670 {
    671 	return	!strcmp(symname, "_bss_start") ||
    672 		!strcmp(symname, "__bss_start") ||
    673 		!strcmp(symname, "_bss_end__") ||
    674 		!strcmp(symname, "__bss_end__") ||
    675 		!strcmp(symname, "_edata") ||
    676 		!strcmp(symname, "_end") ||
    677 		!strcmp(symname, "__end") ||
    678 		!strcmp(symname, "__end__") ||
    679 		!strncmp(symname, "__start_link_set_", 17) ||
    680 		!strncmp(symname, "__stop_link_set_", 16);
    681 }
    682 
    683 int
    684 ksyms_addsymtab(const char *mod, void *symstart, vsize_t symsize,
    685     char *strstart, vsize_t strsize __unused)
    686 {
    687 	Elf_Sym *sym = symstart;
    688 	struct symtab *st;
    689 	unsigned long rval;
    690 	int i;
    691 	char *name;
    692 	struct syminfo info;
    693 
    694 #ifdef KSYMS_DEBUG
    695 	if (ksyms_debug & FOLLOW_CALLS)
    696 		printf("ksyms_addsymtab: mod %s symsize %lx strsize %lx\n",
    697 		    mod, symsize, strsize);
    698 #endif
    699 
    700 #if NKSYMS
    701 	/*
    702 	 * Do not try to add a symbol table while someone is reading
    703 	 * from /dev/ksyms.
    704 	 */
    705 	while (ksyms_isopen != 0)
    706 		tsleep(&ksyms_isopen, PWAIT, "ksyms", 0);
    707 #endif
    708 
    709 	/* Check if this symtab already loaded */
    710 	CIRCLEQ_FOREACH(st, &symtab_queue, sd_queue) {
    711 		if (strcmp(mod, st->sd_name) == 0)
    712 			return EEXIST;
    713 	}
    714 
    715 	/*
    716 	 * XXX - Only add a symbol if it do not exist already.
    717 	 * This is because of a flaw in the current LKM implementation,
    718 	 * these loops will be removed once the in-kernel linker is in place.
    719 	 */
    720 	memset(&info, 0, sizeof(info));
    721 	for (i = 0; i < symsize/sizeof(Elf_Sym); i++) {
    722 		char * const symname = strstart + sym[i].st_name;
    723 		if (sym[i].st_name == 0)
    724 			continue; /* Just ignore */
    725 
    726 		/* check validity of the symbol */
    727 		/* XXX - save local symbols if DDB */
    728 		if (ELF_ST_BIND(sym[i].st_info) != STB_GLOBAL)
    729 			continue;
    730 
    731 		/* Check if the symbol exists */
    732 		if (ksyms_getval(NULL, symname, &rval, KSYMS_EXTERN) == 0) {
    733 			/* Check (and complain) about differing values */
    734 			if (sym[i].st_value != rval) {
    735 				if (specialsym(symname)) {
    736 					info.maxsyms++;
    737 					info.maxnamep += strlen(symname) + 1 +
    738 					    strlen(mod) + 1;
    739 				} else {
    740 					printf("%s: symbol '%s' redeclared with"
    741 					    " different value (%lx != %lx)\n",
    742 					    mod, symname,
    743 					    rval, (long)sym[i].st_value);
    744 				}
    745 			}
    746 		} else {
    747 			/*
    748 			 * Count this symbol
    749 			 */
    750 			info.maxsyms++;
    751 			info.maxnamep += strlen(symname) + 1;
    752 		}
    753 	}
    754 
    755 	/*
    756 	 * Now that we know the sizes, malloc the structures.
    757 	 */
    758 	info.syms = malloc(sizeof(Elf_Sym)*info.maxsyms, M_DEVBUF, M_WAITOK);
    759 	info.symnames = malloc(info.maxnamep, M_DEVBUF, M_WAITOK);
    760 	info.symnmoff = malloc(sizeof(int)*info.maxsyms, M_DEVBUF, M_WAITOK);
    761 
    762 	/*
    763 	 * Now that we have the symbols, actually fill in the structures.
    764 	 */
    765 	for (i = 0; i < symsize/sizeof(Elf_Sym); i++) {
    766 		char * const symname = strstart + sym[i].st_name;
    767 		if (sym[i].st_name == 0)
    768 			continue; /* Just ignore */
    769 
    770 		/* check validity of the symbol */
    771 		/* XXX - save local symbols if DDB */
    772 		if (ELF_ST_BIND(sym[i].st_info) != STB_GLOBAL)
    773 			continue;
    774 
    775 		/* Check if the symbol exists */
    776 		if (ksyms_getval(NULL, symname, &rval, KSYMS_EXTERN) == 0) {
    777 			if ((sym[i].st_value != rval) && specialsym(symname)) {
    778 				addsym(&info, &sym[i], symname, mod);
    779 			}
    780 		} else
    781 			/* Ok, save this symbol */
    782 			addsym(&info, &sym[i], symname, NULL);
    783 	}
    784 
    785 	st = malloc(sizeof(struct symtab), M_DEVBUF, M_WAITOK);
    786 	i = strlen(mod) + 1;
    787 	name = malloc(i, M_DEVBUF, M_WAITOK);
    788 	strlcpy(name, mod, i);
    789 	st->sd_name = name;
    790 	st->sd_symnmoff = info.symnmoff;
    791 	st->sd_symstart = info.syms;
    792 	st->sd_symsize = sizeof(Elf_Sym)*info.maxsyms;
    793 	st->sd_strstart = info.symnames;
    794 	st->sd_strsize = info.maxnamep;
    795 
    796 	/* Make them absolute references */
    797 	sym = st->sd_symstart;
    798 	for (i = 0; i < st->sd_symsize/sizeof(Elf_Sym); i++)
    799 		sym[i].st_shndx = SHN_ABS;
    800 
    801 	CIRCLEQ_INSERT_TAIL(&symtab_queue, st, sd_queue);
    802 #if NKSYMS
    803 	ksyms_sizes_calc();
    804 #endif
    805 	return 0;
    806 }
    807 
    808 /*
    809  * Remove a symbol table specified by name.
    810  * Returns 0 if success, EBUSY if device open and ENOENT if no such name.
    811  */
    812 int
    813 ksyms_delsymtab(const char *mod)
    814 {
    815 	struct symtab *st;
    816 	int found = 0;
    817 
    818 #if NKSYMS
    819 	/*
    820 	 * Do not try to delete a symbol table while someone is reading
    821 	 * from /dev/ksyms.
    822 	 */
    823 	while (ksyms_isopen != 0)
    824 		tsleep(&ksyms_isopen, PWAIT, "ksyms", 0);
    825 #endif
    826 
    827 	CIRCLEQ_FOREACH(st, &symtab_queue, sd_queue) {
    828 		if (strcmp(mod, st->sd_name) == 0) {
    829 			found = 1;
    830 			break;
    831 		}
    832 	}
    833 	if (found == 0)
    834 		return ENOENT;
    835 	CIRCLEQ_REMOVE(&symtab_queue, st, sd_queue);
    836 	free(st->sd_symstart, M_DEVBUF);
    837 	free(st->sd_strstart, M_DEVBUF);
    838 	free(st->sd_symnmoff, M_DEVBUF);
    839 	/* XXXUNCONST LINTED - const castaway */
    840 	free(__UNCONST(st->sd_name), M_DEVBUF);
    841 	free(st, M_DEVBUF);
    842 #if NKSYMS
    843 	ksyms_sizes_calc();
    844 #endif
    845 	return 0;
    846 }
    847 
    848 int
    849 ksyms_rensymtab(const char *old, const char *new)
    850 {
    851 	struct symtab *st, *oldst = NULL;
    852 	char *newstr;
    853 
    854 	CIRCLEQ_FOREACH(st, &symtab_queue, sd_queue) {
    855 		if (strcmp(old, st->sd_name) == 0)
    856 			oldst = st;
    857 		if (strcmp(new, st->sd_name) == 0)
    858 			return (EEXIST);
    859 	}
    860 	if (oldst == NULL)
    861 		return (ENOENT);
    862 
    863 	newstr = malloc(strlen(new)+1, M_DEVBUF, M_WAITOK);
    864 	if (!newstr)
    865 		return (ENOMEM);
    866 	strcpy(newstr, new);
    867 	/*XXXUNCONST*/
    868 	free(__UNCONST(oldst->sd_name), M_DEVBUF);
    869 	oldst->sd_name = newstr;
    870 
    871 	return (0);
    872 }
    873 
    874 #ifdef DDB
    875 /*
    876  * Keep sifting stuff here, to avoid export of ksyms internals.
    877  */
    878 int
    879 ksyms_sift(char *mod, char *sym, int mode)
    880 {
    881 	struct symtab *st;
    882 	char *sb;
    883 	int i, sz;
    884 
    885 	if (ksymsinited == 0)
    886 		return ENOENT;
    887 
    888 	CIRCLEQ_FOREACH(st, &symtab_queue, sd_queue) {
    889 		if (mod && strcmp(mod, st->sd_name))
    890 			continue;
    891 		sb = st->sd_strstart;
    892 
    893 		sz = st->sd_symsize/sizeof(Elf_Sym);
    894 		for (i = 0; i < sz; i++) {
    895 			Elf_Sym *les = st->sd_symstart + i;
    896 			char c;
    897 
    898 			if (strstr(sb + les->st_name - st->sd_usroffset, sym)
    899 			    == NULL)
    900 				continue;
    901 
    902 			if (mode == 'F') {
    903 				switch (ELF_ST_TYPE(les->st_info)) {
    904 				case STT_OBJECT:
    905 					c = '+';
    906 					break;
    907 				case STT_FUNC:
    908 					c = '*';
    909 					break;
    910 				case STT_SECTION:
    911 					c = '&';
    912 					break;
    913 				case STT_FILE:
    914 					c = '/';
    915 					break;
    916 				default:
    917 					c = ' ';
    918 					break;
    919 				}
    920 				db_printf("%s%c ", sb + les->st_name -
    921 				    st->sd_usroffset, c);
    922 			} else
    923 				db_printf("%s ", sb + les->st_name -
    924 				    st->sd_usroffset);
    925 		}
    926 	}
    927 	return ENOENT;
    928 }
    929 #endif /* DDB */
    930 
    931 #if NKSYMS
    932 /*
    933  * Static allocated ELF header.
    934  * Basic info is filled in at attach, sizes at open.
    935  */
    936 #define	SYMTAB		1
    937 #define	STRTAB		2
    938 #define	SHSTRTAB	3
    939 #define NSECHDR		4
    940 
    941 #define	NPRGHDR		2
    942 #define	SHSTRSIZ	28
    943 
    944 static struct ksyms_hdr {
    945 	Elf_Ehdr	kh_ehdr;
    946 	Elf_Phdr	kh_phdr[NPRGHDR];
    947 	Elf_Shdr	kh_shdr[NSECHDR];
    948 	char 		kh_strtab[SHSTRSIZ];
    949 } ksyms_hdr;
    950 
    951 
    952 static void
    953 ksyms_hdr_init(caddr_t hdraddr)
    954 {
    955 
    956 	/* Copy the loaded elf exec header */
    957 	memcpy(&ksyms_hdr.kh_ehdr, hdraddr, sizeof(Elf_Ehdr));
    958 
    959 	/* Set correct program/section header sizes, offsets and numbers */
    960 	ksyms_hdr.kh_ehdr.e_phoff = offsetof(struct ksyms_hdr, kh_phdr[0]);
    961 	ksyms_hdr.kh_ehdr.e_phentsize = sizeof(Elf_Phdr);
    962 	ksyms_hdr.kh_ehdr.e_phnum = NPRGHDR;
    963 	ksyms_hdr.kh_ehdr.e_shoff = offsetof(struct ksyms_hdr, kh_shdr[0]);
    964 	ksyms_hdr.kh_ehdr.e_shentsize = sizeof(Elf_Shdr);
    965 	ksyms_hdr.kh_ehdr.e_shnum = NSECHDR;
    966 	ksyms_hdr.kh_ehdr.e_shstrndx = NSECHDR - 1; /* Last section */
    967 
    968 	/*
    969 	 * Keep program headers zeroed (unused).
    970 	 * The section headers are hand-crafted.
    971 	 * First section is section zero.
    972 	 */
    973 
    974 	/* Second section header; ".symtab" */
    975 	ksyms_hdr.kh_shdr[SYMTAB].sh_name = 1; /* Section 3 offset */
    976 	ksyms_hdr.kh_shdr[SYMTAB].sh_type = SHT_SYMTAB;
    977 	ksyms_hdr.kh_shdr[SYMTAB].sh_offset = sizeof(struct ksyms_hdr);
    978 /*	ksyms_hdr.kh_shdr[SYMTAB].sh_size = filled in at open */
    979 	ksyms_hdr.kh_shdr[SYMTAB].sh_link = 2; /* Corresponding strtab */
    980 	ksyms_hdr.kh_shdr[SYMTAB].sh_info = 0; /* XXX */
    981 	ksyms_hdr.kh_shdr[SYMTAB].sh_addralign = sizeof(long);
    982 	ksyms_hdr.kh_shdr[SYMTAB].sh_entsize = sizeof(Elf_Sym);
    983 
    984 	/* Third section header; ".strtab" */
    985 	ksyms_hdr.kh_shdr[STRTAB].sh_name = 9; /* Section 3 offset */
    986 	ksyms_hdr.kh_shdr[STRTAB].sh_type = SHT_STRTAB;
    987 /*	ksyms_hdr.kh_shdr[STRTAB].sh_offset = filled in at open */
    988 /*	ksyms_hdr.kh_shdr[STRTAB].sh_size = filled in at open */
    989 /*	ksyms_hdr.kh_shdr[STRTAB].sh_link = kept zero */
    990 	ksyms_hdr.kh_shdr[STRTAB].sh_info = 0;
    991 	ksyms_hdr.kh_shdr[STRTAB].sh_addralign = sizeof(char);
    992 	ksyms_hdr.kh_shdr[STRTAB].sh_entsize = 0;
    993 
    994 	/* Fourth section, ".shstrtab" */
    995 	ksyms_hdr.kh_shdr[SHSTRTAB].sh_name = 17; /* This section name offset */
    996 	ksyms_hdr.kh_shdr[SHSTRTAB].sh_type = SHT_STRTAB;
    997 	ksyms_hdr.kh_shdr[SHSTRTAB].sh_offset =
    998 	    offsetof(struct ksyms_hdr, kh_strtab);
    999 	ksyms_hdr.kh_shdr[SHSTRTAB].sh_size = SHSTRSIZ;
   1000 	ksyms_hdr.kh_shdr[SHSTRTAB].sh_addralign = sizeof(char);
   1001 
   1002 	/* Set section names */
   1003 	strlcpy(&ksyms_hdr.kh_strtab[1], ".symtab",
   1004 	    sizeof(ksyms_hdr.kh_strtab) - 1);
   1005 	strlcpy(&ksyms_hdr.kh_strtab[9], ".strtab",
   1006 	    sizeof(ksyms_hdr.kh_strtab) - 9);
   1007 	strlcpy(&ksyms_hdr.kh_strtab[17], ".shstrtab",
   1008 	    sizeof(ksyms_hdr.kh_strtab) - 17);
   1009 };
   1010 
   1011 static int
   1012 ksymsopen(dev_t dev, int oflags __unused, int devtype __unused,
   1013     struct lwp *l __unused)
   1014 {
   1015 
   1016 	if (minor(dev))
   1017 		return ENXIO;
   1018 	if (ksymsinited == 0)
   1019 		return ENXIO;
   1020 
   1021 	ksyms_hdr.kh_shdr[SYMTAB].sh_size = symsz;
   1022 	ksyms_hdr.kh_shdr[STRTAB].sh_offset = symsz +
   1023 	    ksyms_hdr.kh_shdr[SYMTAB].sh_offset;
   1024 	ksyms_hdr.kh_shdr[STRTAB].sh_size = strsz;
   1025 	ksyms_isopen = 1;
   1026 
   1027 #ifdef KSYMS_DEBUG
   1028 	if (ksyms_debug & FOLLOW_DEVKSYMS)
   1029 		printf("ksymsopen: symsz 0x%x strsz 0x%x\n", symsz, strsz);
   1030 #endif
   1031 
   1032 	return 0;
   1033 }
   1034 
   1035 static int
   1036 ksymsclose(dev_t dev __unused, int oflags __unused, int devtype __unused,
   1037     struct lwp *l __unused)
   1038 {
   1039 
   1040 #ifdef KSYMS_DEBUG
   1041 	if (ksyms_debug & FOLLOW_DEVKSYMS)
   1042 		printf("ksymsclose\n");
   1043 #endif
   1044 
   1045 	ksyms_isopen = 0;
   1046 	wakeup(&ksyms_isopen);
   1047 	return 0;
   1048 }
   1049 
   1050 #define	HDRSIZ	sizeof(struct ksyms_hdr)
   1051 
   1052 static int
   1053 ksymsread(dev_t dev __unused, struct uio *uio, int ioflag __unused)
   1054 {
   1055 	struct symtab *st;
   1056 	size_t filepos, inpos, off;
   1057 
   1058 #ifdef KSYMS_DEBUG
   1059 	if (ksyms_debug & FOLLOW_DEVKSYMS)
   1060 		printf("ksymsread: offset 0x%llx resid 0x%zx\n",
   1061 		    (long long)uio->uio_offset, uio->uio_resid);
   1062 #endif
   1063 
   1064 	off = uio->uio_offset;
   1065 	if (off >= (strsz + symsz + HDRSIZ))
   1066 		return 0; /* End of symtab */
   1067 	/*
   1068 	 * First: Copy out the ELF header.
   1069 	 */
   1070 	if (off < HDRSIZ)
   1071 		uiomove((char *)&ksyms_hdr + off, HDRSIZ - off, uio);
   1072 
   1073 	/*
   1074 	 * Copy out the symbol table.
   1075 	 */
   1076 	filepos = HDRSIZ;
   1077 	CIRCLEQ_FOREACH(st, &symtab_queue, sd_queue) {
   1078 		if (uio->uio_resid == 0)
   1079 			return 0;
   1080 		if (uio->uio_offset <= st->sd_symsize + filepos) {
   1081 			inpos = uio->uio_offset - filepos;
   1082 			uiomove((char *)st->sd_symstart + inpos,
   1083 			   st->sd_symsize - inpos, uio);
   1084 		}
   1085 		filepos += st->sd_symsize;
   1086 	}
   1087 
   1088 	if (filepos != HDRSIZ + symsz)
   1089 		panic("ksymsread: unsunc");
   1090 
   1091 	/*
   1092 	 * Copy out the string table
   1093 	 */
   1094 	CIRCLEQ_FOREACH(st, &symtab_queue, sd_queue) {
   1095 		if (uio->uio_resid == 0)
   1096 			return 0;
   1097 		if (uio->uio_offset <= st->sd_strsize + filepos) {
   1098 			inpos = uio->uio_offset - filepos;
   1099 			uiomove((char *)st->sd_strstart + inpos,
   1100 			   st->sd_strsize - inpos, uio);
   1101 		}
   1102 		filepos += st->sd_strsize;
   1103 	}
   1104 	return 0;
   1105 }
   1106 
   1107 static int
   1108 ksymswrite(dev_t dev __unused, struct uio *uio __unused, int ioflag __unused)
   1109 {
   1110 	return EROFS;
   1111 }
   1112 
   1113 static int
   1114 ksymsioctl(dev_t dev __unused, u_long cmd, caddr_t data, int fflag __unused,
   1115     struct lwp *l __unused)
   1116 {
   1117 	struct ksyms_gsymbol *kg = (struct ksyms_gsymbol *)data;
   1118 	struct symtab *st;
   1119 	Elf_Sym *sym = NULL;
   1120 	unsigned long val;
   1121 	int error = 0;
   1122 	char *str = NULL;
   1123 
   1124 	if (cmd == KIOCGVALUE || cmd == KIOCGSYMBOL)
   1125 		str = malloc(ksyms_maxlen, M_DEVBUF, M_WAITOK);
   1126 
   1127 	switch (cmd) {
   1128 	case KIOCGVALUE:
   1129 		/*
   1130 		 * Use the in-kernel symbol lookup code for fast
   1131 		 * retreival of a value.
   1132 		 */
   1133 		if ((error = copyinstr(kg->kg_name, str, ksyms_maxlen, NULL)))
   1134 			break;
   1135 		if ((error = ksyms_getval(NULL, str, &val, KSYMS_EXTERN)))
   1136 			break;
   1137 		error = copyout(&val, kg->kg_value, sizeof(long));
   1138 		break;
   1139 
   1140 	case KIOCGSYMBOL:
   1141 		/*
   1142 		 * Use the in-kernel symbol lookup code for fast
   1143 		 * retreival of a symbol.
   1144 		 */
   1145 		if ((error = copyinstr(kg->kg_name, str, ksyms_maxlen, NULL)))
   1146 			break;
   1147 		CIRCLEQ_FOREACH(st, &symtab_queue, sd_queue) {
   1148 			if ((sym = findsym(str, st)) == NULL) /* from userland */
   1149 				continue;
   1150 
   1151 			/* Skip if bad binding */
   1152 			if (ELF_ST_BIND(sym->st_info) != STB_GLOBAL) {
   1153 				sym = NULL;
   1154 				continue;
   1155 			}
   1156 			break;
   1157 		}
   1158 		/*
   1159 		 * XXX which value of sym->st_name should be returned?  The real
   1160 		 * one, or the one that matches what reading /dev/ksyms get?
   1161 		 *
   1162 		 * Currently, we're returning the /dev/ksyms one.
   1163 		 */
   1164 		if (sym != NULL)
   1165 			error = copyout(sym, kg->kg_sym, sizeof(Elf_Sym));
   1166 		else
   1167 			error = ENOENT;
   1168 		break;
   1169 
   1170 	case KIOCGSIZE:
   1171 		/*
   1172 		 * Get total size of symbol table.
   1173 		 */
   1174 		*(int *)data = strsz + symsz + HDRSIZ;
   1175 		break;
   1176 
   1177 	default:
   1178 		error = ENOTTY;
   1179 		break;
   1180 	}
   1181 
   1182 	if (cmd == KIOCGVALUE || cmd == KIOCGSYMBOL)
   1183 		free(str, M_DEVBUF);
   1184 
   1185 	return error;
   1186 }
   1187 
   1188 const struct cdevsw ksyms_cdevsw = {
   1189 	ksymsopen, ksymsclose, ksymsread, ksymswrite, ksymsioctl,
   1190 	    nullstop, notty, nopoll, nommap, nullkqfilter, DV_DULL
   1191 };
   1192 #endif /* NKSYMS */
   1193