Home | History | Annotate | Line # | Download | only in ld.elf_so
symbol.c revision 1.41
      1  1.41      matt /*	$NetBSD: symbol.c,v 1.41 2007/02/22 18:57:48 matt Exp $	 */
      2   1.1       cgd 
      3   1.1       cgd /*
      4   1.1       cgd  * Copyright 1996 John D. Polstra.
      5   1.1       cgd  * Copyright 1996 Matt Thomas <matt (at) 3am-software.com>
      6  1.25   mycroft  * Copyright 2002 Charles M. Hannum <root (at) ihack.net>
      7   1.1       cgd  * All rights reserved.
      8   1.1       cgd  *
      9   1.1       cgd  * Redistribution and use in source and binary forms, with or without
     10   1.1       cgd  * modification, are permitted provided that the following conditions
     11   1.1       cgd  * are met:
     12   1.1       cgd  * 1. Redistributions of source code must retain the above copyright
     13   1.1       cgd  *    notice, this list of conditions and the following disclaimer.
     14   1.1       cgd  * 2. Redistributions in binary form must reproduce the above copyright
     15   1.1       cgd  *    notice, this list of conditions and the following disclaimer in the
     16   1.1       cgd  *    documentation and/or other materials provided with the distribution.
     17   1.1       cgd  * 3. All advertising materials mentioning features or use of this software
     18   1.1       cgd  *    must display the following acknowledgement:
     19   1.1       cgd  *      This product includes software developed by John Polstra.
     20   1.1       cgd  * 4. The name of the author may not be used to endorse or promote products
     21   1.1       cgd  *    derived from this software without specific prior written permission.
     22   1.1       cgd  *
     23   1.1       cgd  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
     24   1.1       cgd  * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
     25   1.1       cgd  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
     26   1.1       cgd  * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
     27   1.1       cgd  * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
     28   1.1       cgd  * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
     29   1.1       cgd  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
     30   1.1       cgd  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
     31   1.1       cgd  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
     32   1.1       cgd  * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
     33   1.1       cgd  */
     34   1.1       cgd 
     35   1.1       cgd /*
     36   1.1       cgd  * Dynamic linker for ELF.
     37   1.1       cgd  *
     38   1.1       cgd  * John Polstra <jdp (at) polstra.com>.
     39   1.1       cgd  */
     40   1.1       cgd 
     41  1.37     skrll #include <sys/cdefs.h>
     42  1.37     skrll #ifndef lint
     43  1.41      matt __RCSID("$NetBSD: symbol.c,v 1.41 2007/02/22 18:57:48 matt Exp $");
     44  1.37     skrll #endif /* not lint */
     45  1.37     skrll 
     46   1.1       cgd #include <err.h>
     47   1.1       cgd #include <errno.h>
     48   1.1       cgd #include <fcntl.h>
     49   1.1       cgd #include <stdarg.h>
     50   1.1       cgd #include <stdio.h>
     51   1.1       cgd #include <stdlib.h>
     52   1.1       cgd #include <string.h>
     53   1.1       cgd #include <unistd.h>
     54   1.1       cgd #include <sys/types.h>
     55   1.1       cgd #include <sys/mman.h>
     56   1.1       cgd #include <dirent.h>
     57   1.1       cgd 
     58   1.1       cgd #include "debug.h"
     59   1.1       cgd #include "rtld.h"
     60   1.1       cgd 
     61  1.39       chs typedef void (*fptr_t)(void);
     62  1.39       chs 
     63  1.33     skrll static bool
     64  1.33     skrll _rtld_is_exported(const Elf_Sym *def)
     65  1.33     skrll {
     66  1.39       chs 	static fptr_t _rtld_exports[] = {
     67  1.39       chs 		(fptr_t)dlopen,
     68  1.39       chs 		(fptr_t)dlclose,
     69  1.39       chs 		(fptr_t)dlsym,
     70  1.39       chs 		(fptr_t)dlerror,
     71  1.39       chs 		(fptr_t)dladdr,
     72  1.39       chs 		NULL
     73  1.33     skrll 	};
     74  1.33     skrll 	int i;
     75  1.39       chs 	fptr_t value;
     76  1.33     skrll 
     77  1.39       chs 	value = (fptr_t)(_rtld_objself.relocbase + def->st_value);
     78  1.39       chs 	for (i = 0; _rtld_exports[i] != NULL; i++) {
     79  1.33     skrll 		if (value == _rtld_exports[i])
     80  1.33     skrll 			return true;
     81  1.33     skrll 	}
     82  1.33     skrll 	return false;
     83  1.33     skrll }
     84  1.33     skrll 
/*
 * Hash function for symbol table lookup.  Don't even think about changing
 * the values it produces.  They are specified by the System V ABI.
 *
 * The ABI hash is a 32-bit quantity whose top four bits are always folded
 * back into bits 4-7.  Where unsigned long is wider than 32 bits, adding
 * a character can carry out of bit 31; clearing only bits 28-31 would let
 * that carry survive and yield a value no 32-bit implementation produces.
 * The accumulator is therefore masked to its low 28 bits after every
 * step, which gives the same result for every width of unsigned long.
 *
 * NAME must be a NUL-terminated string.  Returns the hash, always less
 * than 0x10000000.
 */
unsigned long
_rtld_elf_hash(const char *name)
{
	const unsigned char *p = (const unsigned char *) name;
	unsigned long   h = 0;
	unsigned long   g;
	unsigned long   c;

	while ((c = *p++) != '\0') {
		h = (h << 4) + c;
		g = h & 0xf0000000UL;
		if (g != 0)
			h ^= g >> 24;
		/* Drop the folded top nibble and any carry beyond bit 31. */
		h &= 0x0fffffffUL;
	}
	return (h);
}
    107   1.1       cgd 
    108   1.5   mycroft const Elf_Sym *
    109  1.23   mycroft _rtld_symlook_list(const char *name, unsigned long hash, const Objlist *objlist,
    110  1.31     skrll     const Obj_Entry **defobj_out, bool in_plt)
    111   1.5   mycroft {
    112   1.5   mycroft 	const Elf_Sym *symp;
    113   1.5   mycroft 	const Elf_Sym *def;
    114  1.27   mycroft 	const Obj_Entry *defobj;
    115   1.5   mycroft 	const Objlist_Entry *elm;
    116   1.5   mycroft 
    117   1.5   mycroft 	def = NULL;
    118  1.27   mycroft 	defobj = NULL;
    119  1.12     lukem 	SIMPLEQ_FOREACH(elm, objlist, link) {
    120  1.23   mycroft 		rdbg(("search object %p (%s)", elm->obj, elm->obj->path));
    121  1.21   mycroft 		if ((symp = _rtld_symlook_obj(name, hash, elm->obj, in_plt))
    122   1.5   mycroft 		    != NULL) {
    123   1.5   mycroft 			if ((def == NULL) ||
    124   1.6   thorpej 			    (ELF_ST_BIND(symp->st_info) != STB_WEAK)) {
    125   1.5   mycroft 				def = symp;
    126  1.27   mycroft 				defobj = elm->obj;
    127   1.6   thorpej 				if (ELF_ST_BIND(def->st_info) != STB_WEAK)
    128   1.5   mycroft 					break;
    129   1.5   mycroft 			}
    130   1.5   mycroft 		}
    131   1.5   mycroft 	}
    132  1.27   mycroft 	if (def != NULL)
    133  1.27   mycroft 		*defobj_out = defobj;
    134   1.5   mycroft 	return def;
    135   1.5   mycroft }
    136   1.5   mycroft 
    137   1.1       cgd /*
    138   1.1       cgd  * Search the symbol table of a single shared object for a symbol of
    139   1.1       cgd  * the given name.  Returns a pointer to the symbol, or NULL if no
    140   1.1       cgd  * definition was found.
    141   1.1       cgd  *
    142   1.1       cgd  * The symbol's hash value is passed in for efficiency reasons; that
    143   1.1       cgd  * eliminates many recomputations of the hash value.
    144   1.1       cgd  */
    145   1.1       cgd const Elf_Sym *
    146  1.31     skrll _rtld_symlook_obj(const char *name, unsigned long hash,
    147  1.31     skrll     const Obj_Entry *obj, bool in_plt)
    148   1.1       cgd {
    149  1.20   mycroft 	unsigned long symnum;
    150   1.1       cgd 
    151  1.20   mycroft 	for (symnum = obj->buckets[hash % obj->nbuckets];
    152  1.20   mycroft 	     symnum != ELF_SYM_UNDEFINED;
    153  1.20   mycroft 	     symnum = obj->chains[symnum]) {
    154   1.3  christos 		const Elf_Sym  *symp;
    155   1.3  christos 		const char     *strp;
    156   1.3  christos 
    157   1.3  christos 		assert(symnum < obj->nchains);
    158   1.3  christos 		symp = obj->symtab + symnum;
    159   1.3  christos 		strp = obj->strtab + symp->st_name;
    160  1.38    martin 		rdbg(("check \"%s\" vs \"%s\" in %p", name, strp, obj));
    161  1.20   mycroft 		if (name[1] == strp[1] && !strcmp(name, strp)) {
    162  1.20   mycroft 			if (symp->st_shndx != SHN_UNDEF)
    163   1.3  christos 				return symp;
    164  1.21   mycroft #ifndef __mips__
    165  1.22   mycroft 			/*
    166  1.22   mycroft 			 * XXX DANGER WILL ROBINSON!
    167  1.22   mycroft 			 * If we have a function pointer in the executable's
    168  1.22   mycroft 			 * data section, it points to the executable's PLT
    169  1.22   mycroft 			 * slot, and there is NO relocation emitted.  To make
    170  1.22   mycroft 			 * the function pointer comparable to function pointers
    171  1.22   mycroft 			 * in shared libraries, we must resolve data references
    172  1.22   mycroft 			 * in the libraries to point to PLT slots in the
    173  1.22   mycroft 			 * executable, if they exist.
    174  1.22   mycroft 			 */
    175  1.21   mycroft 			else if (!in_plt && symp->st_value != 0 &&
    176  1.21   mycroft 			     ELF_ST_TYPE(symp->st_info) == STT_FUNC)
    177  1.21   mycroft 				return symp;
    178  1.21   mycroft #endif
    179  1.19   mycroft 			else
    180  1.19   mycroft 				return NULL;
    181   1.3  christos 		}
    182   1.1       cgd 	}
    183   1.1       cgd 
    184   1.3  christos 	return NULL;
    185   1.1       cgd }
    186   1.1       cgd 
    187   1.1       cgd /*
    188   1.1       cgd  * Given a symbol number in a referencing object, find the corresponding
    189   1.1       cgd  * definition of the symbol.  Returns a pointer to the symbol, or NULL if
    190   1.1       cgd  * no definition was found.  Returns a pointer to the Obj_Entry of the
    191   1.1       cgd  * defining object via the reference parameter DEFOBJ_OUT.
    192   1.1       cgd  */
    193   1.1       cgd const Elf_Sym *
    194  1.31     skrll _rtld_find_symdef(unsigned long symnum, const Obj_Entry *refobj,
    195  1.31     skrll     const Obj_Entry **defobj_out, bool in_plt)
    196   1.1       cgd {
    197  1.27   mycroft 	const Elf_Sym  *ref;
    198   1.5   mycroft 	const Elf_Sym  *def;
    199  1.27   mycroft 	const Obj_Entry *defobj;
    200  1.27   mycroft 	const char     *name;
    201   1.3  christos 	unsigned long   hash;
    202   1.3  christos 
    203  1.41      matt #ifdef COMBRELOC
    204  1.41      matt 	/*
    205  1.41      matt 	 * COMBRELOC combines multiple reloc sections and sorts them to make
    206  1.41      matt 	 * dynamic symbol lookup caching possible.
    207  1.41      matt 	 *
    208  1.41      matt 	 * So if the lookup we are doing is the same as the previous lookup
    209  1.41      matt 	 * return the cached results.
    210  1.41      matt 	 */
    211  1.41      matt 	static unsigned long last_symnum;
    212  1.41      matt 	static const Elf_Sym *last_def;
    213  1.41      matt 	static const Obj_Entry *last_refobj;
    214  1.41      matt 	static const Obj_Entry *last_defobj;
    215  1.41      matt 	static bool last_in_plt;
    216  1.41      matt 
    217  1.41      matt 	if (symnum == last_symnum && refobj == last_refobj
    218  1.41      matt 	    && in_plt == last_in_plt) {
    219  1.41      matt 		*defobj_out = last_defobj;
    220  1.41      matt 		return last_def;
    221  1.41      matt 	}
    222  1.41      matt #endif
    223  1.41      matt 
    224  1.27   mycroft 	ref = refobj->symtab + symnum;
    225  1.27   mycroft 	name = refobj->strtab + ref->st_name;
    226  1.27   mycroft 
    227  1.27   mycroft 	/*
    228  1.40     skrll 	 * We don't have to do a full scale lookup if the symbol is local.
    229  1.40     skrll 	 * We know it will bind to the instance in this load module; to
    230  1.40     skrll 	 * which we already have a pointer (ie ref).
    231  1.33     skrll 	 */
    232  1.40     skrll 	if (ELF_ST_BIND(ref->st_info) != STB_LOCAL) {
    233  1.40     skrll 		if (ELF_ST_TYPE(ref->st_info) == STT_SECTION) {
    234  1.40     skrll 			_rtld_error("%s: Bogus symbol table entry %lu",
    235  1.40     skrll 			    refobj->path, symnum);
    236  1.40     skrll         	}
    237  1.40     skrll 
    238  1.40     skrll 		hash = _rtld_elf_hash(name);
    239  1.40     skrll 		defobj = NULL;
    240  1.40     skrll 		def = _rtld_symlook_default(name, hash, refobj, &defobj, in_plt);
    241  1.40     skrll 	} else {
    242  1.40     skrll 		rdbg(("STB_LOCAL symbol %s in %s", name, refobj->path));
    243  1.40     skrll 		def = ref;
    244  1.40     skrll 		defobj = refobj;
    245  1.33     skrll 	}
    246  1.40     skrll 
    247  1.33     skrll 	/*
    248  1.27   mycroft 	 * If we found no definition and the reference is weak, treat the
    249  1.27   mycroft 	 * symbol as having the value zero.
    250  1.27   mycroft 	 */
    251  1.27   mycroft 	if (def == NULL && ELF_ST_BIND(ref->st_info) == STB_WEAK) {
    252  1.27   mycroft 		rdbg(("  returning _rtld_sym_zero@_rtld_objmain"));
    253  1.27   mycroft 		def = &_rtld_sym_zero;
    254  1.27   mycroft 		defobj = _rtld_objmain;
    255  1.27   mycroft 	}
    256  1.33     skrll 
    257  1.41      matt 	if (def != NULL) {
    258  1.27   mycroft 		*defobj_out = defobj;
    259  1.41      matt #ifdef COMBRELOC
    260  1.41      matt 		/*
    261  1.41      matt 		 * Cache the lookup arguments and results.
    262  1.41      matt 		 */
    263  1.41      matt 		last_symnum = symnum;
    264  1.41      matt 		last_refobj = refobj;
    265  1.41      matt 		last_def = def;
    266  1.41      matt 		last_defobj = defobj;
    267  1.41      matt 		last_in_plt = in_plt;
    268  1.41      matt #endif
    269  1.41      matt 	} else {
    270  1.27   mycroft 		rdbg(("lookup failed"));
    271  1.27   mycroft 		_rtld_error("%s: Undefined %ssymbol \"%s\" (symnum = %ld)",
    272  1.27   mycroft 		    refobj->path, in_plt ? "PLT " : "", name, symnum);
    273  1.27   mycroft 	}
    274  1.26   mycroft 	return def;
    275  1.28  christos }
    276  1.28  christos 
    277  1.28  christos /*
    278  1.28  christos  * Given a symbol name in a referencing object, find the corresponding
    279  1.28  christos  * definition of the symbol.  Returns a pointer to the symbol, or NULL if
    280  1.28  christos  * no definition was found.  Returns a pointer to the Obj_Entry of the
    281  1.28  christos  * defining object via the reference parameter DEFOBJ_OUT.
    282  1.28  christos  */
    283  1.28  christos const Elf_Sym *
    284  1.28  christos _rtld_symlook_default(const char *name, unsigned long hash,
    285  1.28  christos     const Obj_Entry *refobj, const Obj_Entry **defobj_out, bool in_plt)
    286  1.28  christos {
    287  1.29     skrll 	const Elf_Sym *def;
    288  1.29     skrll 	const Elf_Sym *symp;
    289  1.29     skrll 	const Obj_Entry *obj;
    290  1.29     skrll 	const Obj_Entry *defobj;
    291  1.29     skrll 	const Objlist_Entry *elm;
    292  1.29     skrll 	def = NULL;
    293  1.29     skrll 	defobj = NULL;
    294  1.29     skrll 
    295  1.29     skrll 	/* Look first in the referencing object if linked symbolically. */
    296  1.29     skrll 	if (refobj->symbolic) {
    297  1.40     skrll 		rdbg(("search referencing object"));
    298  1.29     skrll 		symp = _rtld_symlook_obj(name, hash, refobj, in_plt);
    299  1.29     skrll 		if (symp != NULL) {
    300  1.29     skrll 			def = symp;
    301  1.29     skrll 			defobj = refobj;
    302  1.29     skrll 		}
    303  1.29     skrll 	}
    304  1.29     skrll 
    305  1.29     skrll 	/* Search all objects loaded at program start up. */
    306  1.29     skrll 	if (def == NULL || ELF_ST_BIND(def->st_info) == STB_WEAK) {
    307  1.40     skrll 		rdbg(("search _rtld_list_main"));
    308  1.40     skrll 		symp = _rtld_symlook_list(name, hash, &_rtld_list_main, &obj,
    309  1.40     skrll 		    in_plt);
    310  1.29     skrll 		if (symp != NULL &&
    311  1.40     skrll 		    (def == NULL || ELF_ST_BIND(symp->st_info) != STB_WEAK)) {
    312  1.29     skrll 			def = symp;
    313  1.29     skrll 			defobj = obj;
    314  1.29     skrll 		}
    315  1.29     skrll 	}
    316  1.29     skrll 
    317  1.40     skrll 	/* Search all RTLD_GLOBAL objects. */
    318  1.40     skrll 	if (def == NULL || ELF_ST_BIND(def->st_info) == STB_WEAK) {
    319  1.40     skrll 		rdbg(("search _rtld_list_global"));
    320  1.40     skrll 		symp = _rtld_symlook_list(name, hash, &_rtld_list_global,
    321  1.40     skrll 		    &obj, in_plt);
    322  1.29     skrll 		if (symp != NULL &&
    323  1.29     skrll 		    (def == NULL || ELF_ST_BIND(symp->st_info) != STB_WEAK)) {
    324  1.29     skrll 			def = symp;
    325  1.29     skrll 			defobj = obj;
    326  1.29     skrll 		}
    327  1.29     skrll 	}
    328  1.40     skrll 
    329  1.40     skrll 	/* Search all dlopened DAGs containing the referencing object. */
    330  1.40     skrll 	SIMPLEQ_FOREACH(elm, &refobj->dldags, link) {
    331  1.29     skrll 		if (def != NULL && ELF_ST_BIND(def->st_info) != STB_WEAK)
    332  1.29     skrll 			break;
    333  1.40     skrll 		rdbg(("search DAG with root %p (%s)", elm->obj,
    334  1.40     skrll 		    elm->obj->path));
    335  1.40     skrll 		symp = _rtld_symlook_list(name, hash, &elm->obj->dagmembers,
    336  1.40     skrll 		    &obj, in_plt);
    337  1.29     skrll 		if (symp != NULL &&
    338  1.29     skrll 		    (def == NULL || ELF_ST_BIND(symp->st_info) != STB_WEAK)) {
    339  1.29     skrll 			def = symp;
    340  1.29     skrll 			defobj = obj;
    341  1.29     skrll 		}
    342  1.28  christos 	}
    343  1.28  christos 
    344  1.29     skrll 	/*
    345  1.29     skrll 	 * Search the dynamic linker itself, and possibly resolve the
    346  1.29     skrll 	 * symbol from there.  This is how the application links to
    347  1.29     skrll 	 * dynamic linker services such as dlopen.  Only the values listed
    348  1.40     skrll 	 * in the "_rtld_exports" array can be resolved from the dynamic
    349  1.40     skrll 	 * linker.
    350  1.29     skrll 	 */
    351  1.29     skrll 	if (def == NULL || ELF_ST_BIND(def->st_info) == STB_WEAK) {
    352  1.40     skrll 		rdbg(("Search the dynamic linker itself."));
    353  1.30     skrll 		symp = _rtld_symlook_obj(name, hash, &_rtld_objself, in_plt);
    354  1.40     skrll 		if (symp != NULL && _rtld_is_exported(symp)) {
    355  1.29     skrll 			def = symp;
    356  1.30     skrll 			defobj = &_rtld_objself;
    357  1.29     skrll 		}
    358  1.28  christos 	}
    359  1.28  christos 
    360  1.29     skrll 	if (def != NULL)
    361  1.29     skrll 		*defobj_out = defobj;
    362  1.29     skrll 	return def;
    363   1.1       cgd }
    364