Home | History | Annotate | Line # | Download | only in ld.elf_so
symbol.c revision 1.37
      1  1.37     skrll /*	$NetBSD: symbol.c,v 1.37 2004/10/22 05:39:57 skrll Exp $	 */
      2   1.1       cgd 
      3   1.1       cgd /*
      4   1.1       cgd  * Copyright 1996 John D. Polstra.
      5   1.1       cgd  * Copyright 1996 Matt Thomas <matt (at) 3am-software.com>
      6  1.25   mycroft  * Copyright 2002 Charles M. Hannum <root (at) ihack.net>
      7   1.1       cgd  * All rights reserved.
      8   1.1       cgd  *
      9   1.1       cgd  * Redistribution and use in source and binary forms, with or without
     10   1.1       cgd  * modification, are permitted provided that the following conditions
     11   1.1       cgd  * are met:
     12   1.1       cgd  * 1. Redistributions of source code must retain the above copyright
     13   1.1       cgd  *    notice, this list of conditions and the following disclaimer.
     14   1.1       cgd  * 2. Redistributions in binary form must reproduce the above copyright
     15   1.1       cgd  *    notice, this list of conditions and the following disclaimer in the
     16   1.1       cgd  *    documentation and/or other materials provided with the distribution.
     17   1.1       cgd  * 3. All advertising materials mentioning features or use of this software
     18   1.1       cgd  *    must display the following acknowledgement:
     19   1.1       cgd  *      This product includes software developed by John Polstra.
     20   1.1       cgd  * 4. The name of the author may not be used to endorse or promote products
     21   1.1       cgd  *    derived from this software without specific prior written permission.
     22   1.1       cgd  *
     23   1.1       cgd  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
     24   1.1       cgd  * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
     25   1.1       cgd  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
     26   1.1       cgd  * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
     27   1.1       cgd  * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
     28   1.1       cgd  * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
     29   1.1       cgd  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
     30   1.1       cgd  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
     31   1.1       cgd  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
     32   1.1       cgd  * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
     33   1.1       cgd  */
     34   1.1       cgd 
     35   1.1       cgd /*
     36   1.1       cgd  * Dynamic linker for ELF.
     37   1.1       cgd  *
     38   1.1       cgd  * John Polstra <jdp (at) polstra.com>.
     39   1.1       cgd  */
     40   1.1       cgd 
     41  1.37     skrll #include <sys/cdefs.h>
     42  1.37     skrll #ifndef lint
     43  1.37     skrll __RCSID("$NetBSD: symbol.c,v 1.37 2004/10/22 05:39:57 skrll Exp $");
     44  1.37     skrll #endif /* not lint */
     45  1.37     skrll 
     46   1.1       cgd #include <err.h>
     47   1.1       cgd #include <errno.h>
     48   1.1       cgd #include <fcntl.h>
     49   1.1       cgd #include <stdarg.h>
     50   1.1       cgd #include <stdio.h>
     51   1.1       cgd #include <stdlib.h>
     52   1.1       cgd #include <string.h>
     53   1.1       cgd #include <unistd.h>
     54   1.1       cgd #include <sys/types.h>
     55   1.1       cgd #include <sys/mman.h>
     56   1.1       cgd #include <dirent.h>
     57   1.1       cgd 
     58   1.1       cgd #include "debug.h"
     59   1.1       cgd #include "rtld.h"
     60   1.1       cgd 
     61  1.33     skrll static bool
     62  1.33     skrll _rtld_is_exported(const Elf_Sym *def)
     63  1.33     skrll {
     64  1.33     skrll 	static Elf_Addr _rtld_exports[] = {
     65  1.33     skrll 		(Elf_Addr)dlopen,
     66  1.33     skrll 		(Elf_Addr)dlclose,
     67  1.33     skrll 		(Elf_Addr)dlsym,
     68  1.33     skrll 		(Elf_Addr)dlerror,
     69  1.33     skrll 		(Elf_Addr)dladdr,
     70  1.36   thorpej 
     71  1.36   thorpej #if 0
     72  1.36   thorpej 	/*
     73  1.36   thorpej 	 * Don't need to list these since they are aliases of the
     74  1.36   thorpej 	 * above symbols, and thus have the same value.
     75  1.36   thorpej 	 */
     76  1.36   thorpej 		(Elf_Addr)__dlopen,
     77  1.36   thorpej 		(Elf_Addr)__dlclose,
     78  1.36   thorpej 		(Elf_Addr)__dlsym,
     79  1.36   thorpej 		(Elf_Addr)__dlerror,
     80  1.36   thorpej 		(Elf_Addr)__dladdr,
     81  1.36   thorpej #endif
     82  1.36   thorpej 
     83  1.34      fvdl 		0
     84  1.33     skrll 	};
     85  1.33     skrll 	int i;
     86  1.33     skrll 
     87  1.33     skrll 	Elf_Addr value;
     88  1.33     skrll 	value = (Elf_Addr)(_rtld_objself.relocbase + def->st_value);
     89  1.33     skrll 
     90  1.34      fvdl 	for (i = 0; _rtld_exports[i] != 0; i++) {
     91  1.33     skrll 		if (value == _rtld_exports[i])
     92  1.33     skrll 			return true;
     93  1.33     skrll 	}
     94  1.33     skrll 	return false;
     95  1.33     skrll }
     96  1.33     skrll 
/*
 * Hash function for symbol table lookup.  Don't even think about changing
 * the values it produces.  It is specified by the System V ABI.
 *
 * The ABI hash is a 32-bit quantity.  Where unsigned long is wider than
 * 32 bits, the "h += c" step can carry out of bit 31 (for example when
 * h << 4 is 0xfffffff0 and c >= 0x10), and the 0xf0000000 fold below
 * never clears such a carry.  The low 32 bits always evolve exactly as
 * they would in a 32-bit computation, so truncating the final value
 * yields the same hash on every platform.
 *
 * name:	NUL-terminated symbol name; bytes are hashed as unsigned char.
 * Returns the hash, which always fits in 32 bits.
 */
unsigned long
_rtld_elf_hash(const char *name)
{
	const unsigned char *p = (const unsigned char *) name;
	unsigned long   h = 0;
	unsigned long   g;
	unsigned long   c;

	for (; __predict_true((c = *p) != '\0'); p++) {
		h <<= 4;
		h += c;
		/* Fold bits 28..31 back into bits 4..7 and clear them. */
		if ((g = h & 0xf0000000) != 0) {
			h ^= g;
			h ^= g >> 24;
		}
	}

	/* Discard anything that overflowed past bit 31 (LP64 only). */
	return (h & 0xffffffffUL);
}
    119   1.1       cgd 
    120   1.5   mycroft const Elf_Sym *
    121  1.23   mycroft _rtld_symlook_list(const char *name, unsigned long hash, const Objlist *objlist,
    122  1.31     skrll     const Obj_Entry **defobj_out, bool in_plt)
    123   1.5   mycroft {
    124   1.5   mycroft 	const Elf_Sym *symp;
    125   1.5   mycroft 	const Elf_Sym *def;
    126  1.27   mycroft 	const Obj_Entry *defobj;
    127   1.5   mycroft 	const Objlist_Entry *elm;
    128   1.5   mycroft 
    129   1.5   mycroft 	def = NULL;
    130  1.27   mycroft 	defobj = NULL;
    131  1.12     lukem 	SIMPLEQ_FOREACH(elm, objlist, link) {
    132  1.23   mycroft 		rdbg(("search object %p (%s)", elm->obj, elm->obj->path));
    133  1.21   mycroft 		if ((symp = _rtld_symlook_obj(name, hash, elm->obj, in_plt))
    134   1.5   mycroft 		    != NULL) {
    135   1.5   mycroft 			if ((def == NULL) ||
    136   1.6   thorpej 			    (ELF_ST_BIND(symp->st_info) != STB_WEAK)) {
    137   1.5   mycroft 				def = symp;
    138  1.27   mycroft 				defobj = elm->obj;
    139   1.6   thorpej 				if (ELF_ST_BIND(def->st_info) != STB_WEAK)
    140   1.5   mycroft 					break;
    141   1.5   mycroft 			}
    142   1.5   mycroft 		}
    143   1.5   mycroft 	}
    144  1.27   mycroft 	if (def != NULL)
    145  1.27   mycroft 		*defobj_out = defobj;
    146   1.5   mycroft 	return def;
    147   1.5   mycroft }
    148   1.5   mycroft 
    149   1.1       cgd /*
    150   1.1       cgd  * Search the symbol table of a single shared object for a symbol of
    151   1.1       cgd  * the given name.  Returns a pointer to the symbol, or NULL if no
    152   1.1       cgd  * definition was found.
    153   1.1       cgd  *
    154   1.1       cgd  * The symbol's hash value is passed in for efficiency reasons; that
    155   1.1       cgd  * eliminates many recomputations of the hash value.
    156   1.1       cgd  */
    157   1.1       cgd const Elf_Sym *
    158  1.31     skrll _rtld_symlook_obj(const char *name, unsigned long hash,
    159  1.31     skrll     const Obj_Entry *obj, bool in_plt)
    160   1.1       cgd {
    161  1.20   mycroft 	unsigned long symnum;
    162   1.1       cgd 
    163  1.20   mycroft 	for (symnum = obj->buckets[hash % obj->nbuckets];
    164  1.20   mycroft 	     symnum != ELF_SYM_UNDEFINED;
    165  1.20   mycroft 	     symnum = obj->chains[symnum]) {
    166   1.3  christos 		const Elf_Sym  *symp;
    167   1.3  christos 		const char     *strp;
    168   1.3  christos 
    169   1.3  christos 		assert(symnum < obj->nchains);
    170   1.3  christos 		symp = obj->symtab + symnum;
    171   1.3  christos 		strp = obj->strtab + symp->st_name;
    172  1.23   mycroft 		rdbg(("check %s vs %s in %p", name, strp, obj));
    173  1.20   mycroft 		if (name[1] == strp[1] && !strcmp(name, strp)) {
    174  1.20   mycroft 			if (symp->st_shndx != SHN_UNDEF)
    175   1.3  christos 				return symp;
    176  1.21   mycroft #ifndef __mips__
    177  1.22   mycroft 			/*
    178  1.22   mycroft 			 * XXX DANGER WILL ROBINSON!
    179  1.22   mycroft 			 * If we have a function pointer in the executable's
    180  1.22   mycroft 			 * data section, it points to the executable's PLT
    181  1.22   mycroft 			 * slot, and there is NO relocation emitted.  To make
    182  1.22   mycroft 			 * the function pointer comparable to function pointers
    183  1.22   mycroft 			 * in shared libraries, we must resolve data references
    184  1.22   mycroft 			 * in the libraries to point to PLT slots in the
    185  1.22   mycroft 			 * executable, if they exist.
    186  1.22   mycroft 			 */
    187  1.21   mycroft 			else if (!in_plt && symp->st_value != 0 &&
    188  1.21   mycroft 			     ELF_ST_TYPE(symp->st_info) == STT_FUNC)
    189  1.21   mycroft 				return symp;
    190  1.21   mycroft #endif
    191  1.19   mycroft 			else
    192  1.19   mycroft 				return NULL;
    193   1.3  christos 		}
    194   1.1       cgd 	}
    195   1.1       cgd 
    196   1.3  christos 	return NULL;
    197   1.1       cgd }
    198   1.1       cgd 
    199   1.1       cgd /*
    200   1.1       cgd  * Given a symbol number in a referencing object, find the corresponding
    201   1.1       cgd  * definition of the symbol.  Returns a pointer to the symbol, or NULL if
    202   1.1       cgd  * no definition was found.  Returns a pointer to the Obj_Entry of the
    203   1.1       cgd  * defining object via the reference parameter DEFOBJ_OUT.
    204   1.1       cgd  */
    205   1.1       cgd const Elf_Sym *
    206  1.31     skrll _rtld_find_symdef(unsigned long symnum, const Obj_Entry *refobj,
    207  1.31     skrll     const Obj_Entry **defobj_out, bool in_plt)
    208   1.1       cgd {
    209  1.27   mycroft 	const Elf_Sym  *ref;
    210   1.5   mycroft 	const Elf_Sym  *def;
    211   1.5   mycroft 	const Elf_Sym  *symp;
    212   1.3  christos 	const Obj_Entry *obj;
    213  1.27   mycroft 	const Obj_Entry *defobj;
    214   1.5   mycroft 	const Objlist_Entry *elm;
    215  1.27   mycroft 	const char     *name;
    216   1.3  christos 	unsigned long   hash;
    217   1.3  christos 
    218  1.27   mycroft 	ref = refobj->symtab + symnum;
    219  1.27   mycroft 	name = refobj->strtab + ref->st_name;
    220  1.27   mycroft 
    221   1.3  christos 	hash = _rtld_elf_hash(name);
    222   1.5   mycroft 	def = NULL;
    223  1.27   mycroft 	defobj = NULL;
    224   1.5   mycroft 
    225  1.32     skrll 	/* Look first in the referencing object if linked symbolically */
    226  1.32     skrll 	if (refobj->symbolic) {
    227  1.21   mycroft 		symp = _rtld_symlook_obj(name, hash, refobj, in_plt);
    228   1.5   mycroft 		if (symp != NULL) {
    229   1.5   mycroft 			def = symp;
    230  1.27   mycroft 			defobj = refobj;
    231   1.5   mycroft 		}
    232   1.5   mycroft 	}
    233   1.5   mycroft 
    234   1.5   mycroft 	/* Search all objects loaded at program start up. */
    235   1.6   thorpej 	if (def == NULL || ELF_ST_BIND(def->st_info) == STB_WEAK) {
    236  1.23   mycroft 		rdbg(("search _rtld_list_main"));
    237  1.21   mycroft 		symp = _rtld_symlook_list(name, hash, &_rtld_list_main, &obj, in_plt);
    238   1.5   mycroft 		if (symp != NULL &&
    239   1.6   thorpej 		    (def == NULL || ELF_ST_BIND(symp->st_info) != STB_WEAK)) {
    240   1.5   mycroft 			def = symp;
    241  1.27   mycroft 			defobj = obj;
    242   1.5   mycroft 		}
    243   1.5   mycroft 	}
    244   1.5   mycroft 
    245  1.35    mrauch 	/* Search all RTLD_GLOBAL objects. */
    246  1.35    mrauch 	if (def == NULL || ELF_ST_BIND(def->st_info) == STB_WEAK) {
    247  1.35    mrauch 		rdbg(("search _rtld_list_global"));
    248  1.35    mrauch 		symp = _rtld_symlook_list(name, hash, &_rtld_list_global, &obj, in_plt);
    249   1.5   mycroft 		if (symp != NULL &&
    250   1.6   thorpej 		    (def == NULL || ELF_ST_BIND(symp->st_info) != STB_WEAK)) {
    251   1.5   mycroft 			def = symp;
    252  1.27   mycroft 			defobj = obj;
    253   1.3  christos 		}
    254   1.3  christos 	}
    255   1.5   mycroft 
    256  1.35    mrauch 	/* Search all dlopened DAGs containing the referencing object. */
    257  1.35    mrauch 	SIMPLEQ_FOREACH(elm, &refobj->dldags, link) {
    258  1.35    mrauch 		if (def != NULL && ELF_ST_BIND(def->st_info) != STB_WEAK)
    259  1.35    mrauch 			break;
    260  1.35    mrauch 		rdbg(("search DAG with root %p (%s)", elm->obj, elm->obj->path));
    261  1.35    mrauch 		symp = _rtld_symlook_list(name, hash, &elm->obj->dagmembers, &obj, in_plt);
    262   1.5   mycroft 		if (symp != NULL &&
    263   1.6   thorpej 		    (def == NULL || ELF_ST_BIND(symp->st_info) != STB_WEAK)) {
    264   1.5   mycroft 			def = symp;
    265  1.27   mycroft 			defobj = obj;
    266   1.3  christos 		}
    267   1.3  christos 	}
    268   1.5   mycroft 
    269  1.27   mycroft 	/*
    270  1.33     skrll 	 * Search the dynamic linker itself, and possibly resolve the
    271  1.33     skrll 	 * symbol from there.  This is how the application links to
    272  1.33     skrll 	 * dynamic linker services such as dlopen.  Only the values listed
    273  1.33     skrll 	 * in the "_rtld_exports" array can be resolved from the dynamic linker.
    274  1.33     skrll 	 */
    275  1.33     skrll 	if (def == NULL || ELF_ST_BIND(def->st_info) == STB_WEAK) {
    276  1.33     skrll 		symp = _rtld_symlook_obj(name, hash, &_rtld_objself, in_plt);
    277  1.33     skrll 		if (symp != NULL && _rtld_is_exported(symp)) {
    278  1.33     skrll 			def = symp;
    279  1.33     skrll 			defobj = &_rtld_objself;
    280  1.33     skrll 		}
    281  1.33     skrll 	}
    282  1.33     skrll 
    283  1.33     skrll 	/*
    284  1.27   mycroft 	 * If we found no definition and the reference is weak, treat the
    285  1.27   mycroft 	 * symbol as having the value zero.
    286  1.27   mycroft 	 */
    287  1.27   mycroft 	if (def == NULL && ELF_ST_BIND(ref->st_info) == STB_WEAK) {
    288  1.27   mycroft 		rdbg(("  returning _rtld_sym_zero@_rtld_objmain"));
    289  1.27   mycroft 		def = &_rtld_sym_zero;
    290  1.27   mycroft 		defobj = _rtld_objmain;
    291  1.27   mycroft 	}
    292  1.33     skrll 
    293  1.27   mycroft 	if (def != NULL)
    294  1.27   mycroft 		*defobj_out = defobj;
    295  1.27   mycroft 	else {
    296  1.27   mycroft 		rdbg(("lookup failed"));
    297  1.27   mycroft 		_rtld_error("%s: Undefined %ssymbol \"%s\" (symnum = %ld)",
    298  1.27   mycroft 		    refobj->path, in_plt ? "PLT " : "", name, symnum);
    299  1.27   mycroft 	}
    300  1.26   mycroft 	return def;
    301  1.28  christos }
    302  1.28  christos 
    303  1.28  christos /*
    304  1.28  christos  * Given a symbol name in a referencing object, find the corresponding
    305  1.28  christos  * definition of the symbol.  Returns a pointer to the symbol, or NULL if
    306  1.28  christos  * no definition was found.  Returns a pointer to the Obj_Entry of the
    307  1.28  christos  * defining object via the reference parameter DEFOBJ_OUT.
    308  1.28  christos  */
    309  1.28  christos const Elf_Sym *
    310  1.28  christos _rtld_symlook_default(const char *name, unsigned long hash,
    311  1.28  christos     const Obj_Entry *refobj, const Obj_Entry **defobj_out, bool in_plt)
    312  1.28  christos {
    313  1.29     skrll 	const Elf_Sym *def;
    314  1.29     skrll 	const Elf_Sym *symp;
    315  1.29     skrll 	const Obj_Entry *obj;
    316  1.29     skrll 	const Obj_Entry *defobj;
    317  1.29     skrll 	const Objlist_Entry *elm;
    318  1.29     skrll 	def = NULL;
    319  1.29     skrll 	defobj = NULL;
    320  1.29     skrll 
    321  1.29     skrll 	/* Look first in the referencing object if linked symbolically. */
    322  1.29     skrll 	if (refobj->symbolic) {
    323  1.29     skrll 		symp = _rtld_symlook_obj(name, hash, refobj, in_plt);
    324  1.29     skrll 		if (symp != NULL) {
    325  1.29     skrll 			def = symp;
    326  1.29     skrll 			defobj = refobj;
    327  1.29     skrll 		}
    328  1.29     skrll 	}
    329  1.29     skrll 
    330  1.29     skrll 	/* Search all objects loaded at program start up. */
    331  1.29     skrll 	if (def == NULL || ELF_ST_BIND(def->st_info) == STB_WEAK) {
    332  1.29     skrll 		symp = _rtld_symlook_list(name, hash, &_rtld_list_main, &obj, in_plt);
    333  1.29     skrll 		if (symp != NULL &&
    334  1.29     skrll 		  (def == NULL || ELF_ST_BIND(symp->st_info) != STB_WEAK)) {
    335  1.29     skrll 			def = symp;
    336  1.29     skrll 			defobj = obj;
    337  1.29     skrll 		}
    338  1.29     skrll 	}
    339  1.29     skrll 
    340  1.29     skrll 	/* Search all dlopened DAGs containing the referencing object. */
    341  1.29     skrll 	SIMPLEQ_FOREACH(elm, &refobj->dldags, link) {
    342  1.29     skrll 		if (def != NULL && ELF_ST_BIND(def->st_info) != STB_WEAK)
    343  1.29     skrll 			break;
    344  1.29     skrll 		symp = _rtld_symlook_list(name, hash, &elm->obj->dagmembers, &obj,
    345  1.29     skrll 		    in_plt);
    346  1.29     skrll 		if (symp != NULL &&
    347  1.29     skrll 		    (def == NULL || ELF_ST_BIND(symp->st_info) != STB_WEAK)) {
    348  1.29     skrll 			def = symp;
    349  1.29     skrll 			defobj = obj;
    350  1.29     skrll 		}
    351  1.29     skrll 	}
    352  1.29     skrll 
    353  1.29     skrll 	/* Search all DAGs whose roots are RTLD_GLOBAL objects. */
    354  1.29     skrll 	SIMPLEQ_FOREACH(elm, &_rtld_list_global, link) {
    355  1.29     skrll 		if (def != NULL && ELF_ST_BIND(def->st_info) != STB_WEAK)
    356  1.29     skrll 			break;
    357  1.29     skrll 		symp = _rtld_symlook_list(name, hash, &elm->obj->dagmembers, &obj,
    358  1.29     skrll 		    in_plt);
    359  1.29     skrll 		if (symp != NULL &&
    360  1.29     skrll 		    (def == NULL || ELF_ST_BIND(symp->st_info) != STB_WEAK)) {
    361  1.29     skrll 			def = symp;
    362  1.29     skrll 			defobj = obj;
    363  1.29     skrll 		}
    364  1.28  christos 	}
    365  1.28  christos 
    366  1.28  christos #ifdef notyet
    367  1.29     skrll 	/*
    368  1.29     skrll 	 * Search the dynamic linker itself, and possibly resolve the
    369  1.29     skrll 	 * symbol from there.  This is how the application links to
    370  1.29     skrll 	 * dynamic linker services such as dlopen.  Only the values listed
    371  1.29     skrll 	 * in the "exports" array can be resolved from the dynamic linker.
    372  1.29     skrll 	 */
    373  1.29     skrll 	if (def == NULL || ELF_ST_BIND(def->st_info) == STB_WEAK) {
    374  1.30     skrll 		symp = _rtld_symlook_obj(name, hash, &_rtld_objself, in_plt);
    375  1.29     skrll 		if (symp != NULL && is_exported(symp)) {
    376  1.29     skrll 			def = symp;
    377  1.30     skrll 			defobj = &_rtld_objself;
    378  1.29     skrll 		}
    379  1.28  christos 	}
    380  1.28  christos #endif
    381  1.28  christos 
    382  1.29     skrll 	if (def != NULL)
    383  1.29     skrll 		*defobj_out = defobj;
    384  1.29     skrll 	return def;
    385   1.1       cgd }
    386