Home | History | Annotate | Line # | Download | only in ld.elf_so
symbol.c revision 1.42.4.1
      1  1.42.4.1      matt /*	$NetBSD: symbol.c,v 1.42.4.1 2008/01/09 01:37:13 matt Exp $	 */
      2       1.1       cgd 
      3       1.1       cgd /*
      4       1.1       cgd  * Copyright 1996 John D. Polstra.
      5       1.1       cgd  * Copyright 1996 Matt Thomas <matt (at) 3am-software.com>
      6      1.25   mycroft  * Copyright 2002 Charles M. Hannum <root (at) ihack.net>
      7       1.1       cgd  * All rights reserved.
      8       1.1       cgd  *
      9       1.1       cgd  * Redistribution and use in source and binary forms, with or without
     10       1.1       cgd  * modification, are permitted provided that the following conditions
     11       1.1       cgd  * are met:
     12       1.1       cgd  * 1. Redistributions of source code must retain the above copyright
     13       1.1       cgd  *    notice, this list of conditions and the following disclaimer.
     14       1.1       cgd  * 2. Redistributions in binary form must reproduce the above copyright
     15       1.1       cgd  *    notice, this list of conditions and the following disclaimer in the
     16       1.1       cgd  *    documentation and/or other materials provided with the distribution.
     17       1.1       cgd  * 3. All advertising materials mentioning features or use of this software
     18       1.1       cgd  *    must display the following acknowledgement:
     19       1.1       cgd  *      This product includes software developed by John Polstra.
     20       1.1       cgd  * 4. The name of the author may not be used to endorse or promote products
     21       1.1       cgd  *    derived from this software without specific prior written permission.
     22       1.1       cgd  *
     23       1.1       cgd  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
     24       1.1       cgd  * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
     25       1.1       cgd  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
     26       1.1       cgd  * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
     27       1.1       cgd  * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
     28       1.1       cgd  * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
     29       1.1       cgd  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
     30       1.1       cgd  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
     31       1.1       cgd  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
     32       1.1       cgd  * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
     33       1.1       cgd  */
     34       1.1       cgd 
     35       1.1       cgd /*
     36       1.1       cgd  * Dynamic linker for ELF.
     37       1.1       cgd  *
     38       1.1       cgd  * John Polstra <jdp (at) polstra.com>.
     39       1.1       cgd  */
     40       1.1       cgd 
     41      1.37     skrll #include <sys/cdefs.h>
     42      1.37     skrll #ifndef lint
     43  1.42.4.1      matt __RCSID("$NetBSD: symbol.c,v 1.42.4.1 2008/01/09 01:37:13 matt Exp $");
     44      1.37     skrll #endif /* not lint */
     45      1.37     skrll 
     46       1.1       cgd #include <err.h>
     47       1.1       cgd #include <errno.h>
     48       1.1       cgd #include <fcntl.h>
     49       1.1       cgd #include <stdarg.h>
     50       1.1       cgd #include <stdio.h>
     51       1.1       cgd #include <stdlib.h>
     52       1.1       cgd #include <string.h>
     53       1.1       cgd #include <unistd.h>
     54       1.1       cgd #include <sys/types.h>
     55       1.1       cgd #include <sys/mman.h>
     56       1.1       cgd #include <dirent.h>
     57       1.1       cgd 
     58       1.1       cgd #include "debug.h"
     59       1.1       cgd #include "rtld.h"
     60       1.1       cgd 
     61      1.39       chs typedef void (*fptr_t)(void);
     62      1.39       chs 
     63      1.33     skrll static bool
     64      1.33     skrll _rtld_is_exported(const Elf_Sym *def)
     65      1.33     skrll {
     66      1.39       chs 	static fptr_t _rtld_exports[] = {
     67      1.39       chs 		(fptr_t)dlopen,
     68      1.39       chs 		(fptr_t)dlclose,
     69      1.39       chs 		(fptr_t)dlsym,
     70      1.39       chs 		(fptr_t)dlerror,
     71      1.39       chs 		(fptr_t)dladdr,
     72      1.39       chs 		NULL
     73      1.33     skrll 	};
     74      1.33     skrll 	int i;
     75      1.39       chs 	fptr_t value;
     76      1.33     skrll 
     77      1.39       chs 	value = (fptr_t)(_rtld_objself.relocbase + def->st_value);
     78      1.39       chs 	for (i = 0; _rtld_exports[i] != NULL; i++) {
     79      1.33     skrll 		if (value == _rtld_exports[i])
     80      1.33     skrll 			return true;
     81      1.33     skrll 	}
     82      1.33     skrll 	return false;
     83      1.33     skrll }
     84      1.33     skrll 
/*
 * Symbol-name hash used for ELF hash table lookup.  The algorithm is
 * fixed by the System V ABI, so it must not be altered.
 *
 * NAME is a NUL-terminated string whose bytes are treated as unsigned.
 * Returns the hash value; the empty string hashes to 0.
 */
unsigned long
_rtld_elf_hash(const char *name)
{
	const unsigned char *cursor = (const unsigned char *)name;
	unsigned long hash = 0;

	while (__predict_true(*cursor != '\0')) {
		unsigned long top;

		hash = (hash << 4) + *cursor++;

		/* Fold bits 28-31 back into the low byte and clear them. */
		top = hash & 0xf0000000;
		if (top != 0)
			hash ^= top ^ (top >> 24);
	}
	return hash;
}
    107       1.1       cgd 
    108       1.5   mycroft const Elf_Sym *
    109      1.23   mycroft _rtld_symlook_list(const char *name, unsigned long hash, const Objlist *objlist,
    110      1.31     skrll     const Obj_Entry **defobj_out, bool in_plt)
    111       1.5   mycroft {
    112       1.5   mycroft 	const Elf_Sym *symp;
    113       1.5   mycroft 	const Elf_Sym *def;
    114      1.27   mycroft 	const Obj_Entry *defobj;
    115       1.5   mycroft 	const Objlist_Entry *elm;
    116       1.5   mycroft 
    117       1.5   mycroft 	def = NULL;
    118      1.27   mycroft 	defobj = NULL;
    119      1.12     lukem 	SIMPLEQ_FOREACH(elm, objlist, link) {
    120  1.42.4.1      matt 		rdbg(("search object %p (%s) for %s", elm->obj, elm->obj->path,
    121  1.42.4.1      matt 		    name));
    122      1.21   mycroft 		if ((symp = _rtld_symlook_obj(name, hash, elm->obj, in_plt))
    123       1.5   mycroft 		    != NULL) {
    124       1.5   mycroft 			if ((def == NULL) ||
    125       1.6   thorpej 			    (ELF_ST_BIND(symp->st_info) != STB_WEAK)) {
    126       1.5   mycroft 				def = symp;
    127      1.27   mycroft 				defobj = elm->obj;
    128       1.6   thorpej 				if (ELF_ST_BIND(def->st_info) != STB_WEAK)
    129       1.5   mycroft 					break;
    130       1.5   mycroft 			}
    131       1.5   mycroft 		}
    132       1.5   mycroft 	}
    133      1.27   mycroft 	if (def != NULL)
    134      1.27   mycroft 		*defobj_out = defobj;
    135       1.5   mycroft 	return def;
    136       1.5   mycroft }
    137       1.5   mycroft 
    138       1.1       cgd /*
    139       1.1       cgd  * Search the symbol table of a single shared object for a symbol of
    140       1.1       cgd  * the given name.  Returns a pointer to the symbol, or NULL if no
    141       1.1       cgd  * definition was found.
    142       1.1       cgd  *
    143       1.1       cgd  * The symbol's hash value is passed in for efficiency reasons; that
    144       1.1       cgd  * eliminates many recomputations of the hash value.
    145       1.1       cgd  */
    146       1.1       cgd const Elf_Sym *
    147      1.31     skrll _rtld_symlook_obj(const char *name, unsigned long hash,
    148      1.31     skrll     const Obj_Entry *obj, bool in_plt)
    149       1.1       cgd {
    150      1.20   mycroft 	unsigned long symnum;
    151       1.1       cgd 
    152      1.20   mycroft 	for (symnum = obj->buckets[hash % obj->nbuckets];
    153      1.20   mycroft 	     symnum != ELF_SYM_UNDEFINED;
    154      1.20   mycroft 	     symnum = obj->chains[symnum]) {
    155       1.3  christos 		const Elf_Sym  *symp;
    156       1.3  christos 		const char     *strp;
    157       1.3  christos 
    158       1.3  christos 		assert(symnum < obj->nchains);
    159       1.3  christos 		symp = obj->symtab + symnum;
    160       1.3  christos 		strp = obj->strtab + symp->st_name;
    161      1.38    martin 		rdbg(("check \"%s\" vs \"%s\" in %p", name, strp, obj));
    162      1.20   mycroft 		if (name[1] == strp[1] && !strcmp(name, strp)) {
    163      1.20   mycroft 			if (symp->st_shndx != SHN_UNDEF)
    164       1.3  christos 				return symp;
    165      1.21   mycroft #ifndef __mips__
    166      1.22   mycroft 			/*
    167      1.22   mycroft 			 * XXX DANGER WILL ROBINSON!
    168      1.22   mycroft 			 * If we have a function pointer in the executable's
    169      1.22   mycroft 			 * data section, it points to the executable's PLT
    170      1.22   mycroft 			 * slot, and there is NO relocation emitted.  To make
    171      1.22   mycroft 			 * the function pointer comparable to function pointers
    172      1.22   mycroft 			 * in shared libraries, we must resolve data references
    173      1.22   mycroft 			 * in the libraries to point to PLT slots in the
    174      1.22   mycroft 			 * executable, if they exist.
    175      1.22   mycroft 			 */
    176      1.21   mycroft 			else if (!in_plt && symp->st_value != 0 &&
    177      1.21   mycroft 			     ELF_ST_TYPE(symp->st_info) == STT_FUNC)
    178      1.21   mycroft 				return symp;
    179      1.21   mycroft #endif
    180      1.19   mycroft 			else
    181      1.19   mycroft 				return NULL;
    182       1.3  christos 		}
    183       1.1       cgd 	}
    184       1.1       cgd 
    185       1.3  christos 	return NULL;
    186       1.1       cgd }
    187       1.1       cgd 
    188       1.1       cgd /*
    189       1.1       cgd  * Given a symbol number in a referencing object, find the corresponding
    190       1.1       cgd  * definition of the symbol.  Returns a pointer to the symbol, or NULL if
    191       1.1       cgd  * no definition was found.  Returns a pointer to the Obj_Entry of the
    192       1.1       cgd  * defining object via the reference parameter DEFOBJ_OUT.
    193       1.1       cgd  */
    194       1.1       cgd const Elf_Sym *
    195      1.31     skrll _rtld_find_symdef(unsigned long symnum, const Obj_Entry *refobj,
    196      1.31     skrll     const Obj_Entry **defobj_out, bool in_plt)
    197       1.1       cgd {
    198      1.27   mycroft 	const Elf_Sym  *ref;
    199       1.5   mycroft 	const Elf_Sym  *def;
    200      1.27   mycroft 	const Obj_Entry *defobj;
    201      1.27   mycroft 	const char     *name;
    202       1.3  christos 	unsigned long   hash;
    203       1.3  christos 
    204      1.41      matt #ifdef COMBRELOC
    205      1.41      matt 	/*
    206      1.41      matt 	 * COMBRELOC combines multiple reloc sections and sorts them to make
    207      1.41      matt 	 * dynamic symbol lookup caching possible.
    208      1.41      matt 	 *
    209      1.41      matt 	 * So if the lookup we are doing is the same as the previous lookup
    210      1.41      matt 	 * return the cached results.
    211      1.41      matt 	 */
    212      1.41      matt 	static unsigned long last_symnum;
    213      1.41      matt 	static const Elf_Sym *last_def;
    214      1.41      matt 	static const Obj_Entry *last_refobj;
    215      1.41      matt 	static const Obj_Entry *last_defobj;
    216      1.41      matt 
    217      1.41      matt 	if (symnum == last_symnum && refobj == last_refobj
    218      1.42      matt 	    && in_plt == false) {
    219      1.41      matt 		*defobj_out = last_defobj;
    220      1.41      matt 		return last_def;
    221      1.41      matt 	}
    222      1.41      matt #endif
    223      1.41      matt 
    224      1.27   mycroft 	ref = refobj->symtab + symnum;
    225      1.27   mycroft 	name = refobj->strtab + ref->st_name;
    226      1.27   mycroft 
    227      1.27   mycroft 	/*
    228      1.40     skrll 	 * We don't have to do a full scale lookup if the symbol is local.
    229      1.40     skrll 	 * We know it will bind to the instance in this load module; to
    230      1.40     skrll 	 * which we already have a pointer (ie ref).
    231      1.33     skrll 	 */
    232      1.40     skrll 	if (ELF_ST_BIND(ref->st_info) != STB_LOCAL) {
    233      1.40     skrll 		if (ELF_ST_TYPE(ref->st_info) == STT_SECTION) {
    234      1.40     skrll 			_rtld_error("%s: Bogus symbol table entry %lu",
    235      1.40     skrll 			    refobj->path, symnum);
    236      1.40     skrll         	}
    237      1.40     skrll 
    238      1.40     skrll 		hash = _rtld_elf_hash(name);
    239      1.40     skrll 		defobj = NULL;
    240      1.40     skrll 		def = _rtld_symlook_default(name, hash, refobj, &defobj, in_plt);
    241      1.40     skrll 	} else {
    242      1.40     skrll 		rdbg(("STB_LOCAL symbol %s in %s", name, refobj->path));
    243      1.40     skrll 		def = ref;
    244      1.40     skrll 		defobj = refobj;
    245      1.33     skrll 	}
    246      1.40     skrll 
    247      1.33     skrll 	/*
    248      1.27   mycroft 	 * If we found no definition and the reference is weak, treat the
    249      1.27   mycroft 	 * symbol as having the value zero.
    250      1.27   mycroft 	 */
    251      1.27   mycroft 	if (def == NULL && ELF_ST_BIND(ref->st_info) == STB_WEAK) {
    252      1.27   mycroft 		rdbg(("  returning _rtld_sym_zero@_rtld_objmain"));
    253      1.27   mycroft 		def = &_rtld_sym_zero;
    254      1.27   mycroft 		defobj = _rtld_objmain;
    255      1.27   mycroft 	}
    256      1.33     skrll 
    257      1.41      matt 	if (def != NULL) {
    258      1.27   mycroft 		*defobj_out = defobj;
    259      1.41      matt #ifdef COMBRELOC
    260      1.42      matt 		if (in_plt == false) {
    261      1.42      matt 			/*
    262      1.42      matt 			 * Cache the lookup arguments and results if this was
    263      1.42      matt 			 * non-PLT lookup.
    264      1.42      matt 			 */
    265      1.42      matt 			last_symnum = symnum;
    266      1.42      matt 			last_refobj = refobj;
    267      1.42      matt 			last_def = def;
    268      1.42      matt 			last_defobj = defobj;
    269      1.42      matt 		}
    270      1.41      matt #endif
    271      1.41      matt 	} else {
    272      1.27   mycroft 		rdbg(("lookup failed"));
    273      1.27   mycroft 		_rtld_error("%s: Undefined %ssymbol \"%s\" (symnum = %ld)",
    274      1.27   mycroft 		    refobj->path, in_plt ? "PLT " : "", name, symnum);
    275      1.27   mycroft 	}
    276      1.26   mycroft 	return def;
    277      1.28  christos }
    278      1.28  christos 
    279      1.28  christos /*
    280      1.28  christos  * Given a symbol name in a referencing object, find the corresponding
    281      1.28  christos  * definition of the symbol.  Returns a pointer to the symbol, or NULL if
    282      1.28  christos  * no definition was found.  Returns a pointer to the Obj_Entry of the
    283      1.28  christos  * defining object via the reference parameter DEFOBJ_OUT.
    284      1.28  christos  */
    285      1.28  christos const Elf_Sym *
    286      1.28  christos _rtld_symlook_default(const char *name, unsigned long hash,
    287      1.28  christos     const Obj_Entry *refobj, const Obj_Entry **defobj_out, bool in_plt)
    288      1.28  christos {
    289      1.29     skrll 	const Elf_Sym *def;
    290      1.29     skrll 	const Elf_Sym *symp;
    291      1.29     skrll 	const Obj_Entry *obj;
    292      1.29     skrll 	const Obj_Entry *defobj;
    293      1.29     skrll 	const Objlist_Entry *elm;
    294      1.29     skrll 	def = NULL;
    295      1.29     skrll 	defobj = NULL;
    296      1.29     skrll 
    297      1.29     skrll 	/* Look first in the referencing object if linked symbolically. */
    298      1.29     skrll 	if (refobj->symbolic) {
    299  1.42.4.1      matt 		rdbg(("search referencing object for %s", name));
    300      1.29     skrll 		symp = _rtld_symlook_obj(name, hash, refobj, in_plt);
    301      1.29     skrll 		if (symp != NULL) {
    302      1.29     skrll 			def = symp;
    303      1.29     skrll 			defobj = refobj;
    304      1.29     skrll 		}
    305      1.29     skrll 	}
    306      1.29     skrll 
    307      1.29     skrll 	/* Search all objects loaded at program start up. */
    308      1.29     skrll 	if (def == NULL || ELF_ST_BIND(def->st_info) == STB_WEAK) {
    309  1.42.4.1      matt 		rdbg(("search _rtld_list_main for %s", name));
    310      1.40     skrll 		symp = _rtld_symlook_list(name, hash, &_rtld_list_main, &obj,
    311      1.40     skrll 		    in_plt);
    312      1.29     skrll 		if (symp != NULL &&
    313      1.40     skrll 		    (def == NULL || ELF_ST_BIND(symp->st_info) != STB_WEAK)) {
    314      1.29     skrll 			def = symp;
    315      1.29     skrll 			defobj = obj;
    316      1.29     skrll 		}
    317      1.29     skrll 	}
    318      1.29     skrll 
    319      1.40     skrll 	/* Search all RTLD_GLOBAL objects. */
    320      1.40     skrll 	if (def == NULL || ELF_ST_BIND(def->st_info) == STB_WEAK) {
    321  1.42.4.1      matt 		rdbg(("search _rtld_list_global for %s", name));
    322      1.40     skrll 		symp = _rtld_symlook_list(name, hash, &_rtld_list_global,
    323      1.40     skrll 		    &obj, in_plt);
    324      1.29     skrll 		if (symp != NULL &&
    325      1.29     skrll 		    (def == NULL || ELF_ST_BIND(symp->st_info) != STB_WEAK)) {
    326      1.29     skrll 			def = symp;
    327      1.29     skrll 			defobj = obj;
    328      1.29     skrll 		}
    329      1.29     skrll 	}
    330      1.40     skrll 
    331      1.40     skrll 	/* Search all dlopened DAGs containing the referencing object. */
    332      1.40     skrll 	SIMPLEQ_FOREACH(elm, &refobj->dldags, link) {
    333      1.29     skrll 		if (def != NULL && ELF_ST_BIND(def->st_info) != STB_WEAK)
    334      1.29     skrll 			break;
    335  1.42.4.1      matt 		rdbg(("search DAG with root %p (%s) for %s", elm->obj,
    336  1.42.4.1      matt 		    elm->obj->path, name));
    337      1.40     skrll 		symp = _rtld_symlook_list(name, hash, &elm->obj->dagmembers,
    338      1.40     skrll 		    &obj, in_plt);
    339      1.29     skrll 		if (symp != NULL &&
    340      1.29     skrll 		    (def == NULL || ELF_ST_BIND(symp->st_info) != STB_WEAK)) {
    341      1.29     skrll 			def = symp;
    342      1.29     skrll 			defobj = obj;
    343      1.29     skrll 		}
    344      1.28  christos 	}
    345      1.28  christos 
    346      1.29     skrll 	/*
    347      1.29     skrll 	 * Search the dynamic linker itself, and possibly resolve the
    348      1.29     skrll 	 * symbol from there.  This is how the application links to
    349      1.29     skrll 	 * dynamic linker services such as dlopen.  Only the values listed
    350      1.40     skrll 	 * in the "_rtld_exports" array can be resolved from the dynamic
    351      1.40     skrll 	 * linker.
    352      1.29     skrll 	 */
    353      1.29     skrll 	if (def == NULL || ELF_ST_BIND(def->st_info) == STB_WEAK) {
    354      1.40     skrll 		rdbg(("Search the dynamic linker itself."));
    355      1.30     skrll 		symp = _rtld_symlook_obj(name, hash, &_rtld_objself, in_plt);
    356      1.40     skrll 		if (symp != NULL && _rtld_is_exported(symp)) {
    357      1.29     skrll 			def = symp;
    358      1.30     skrll 			defobj = &_rtld_objself;
    359      1.29     skrll 		}
    360      1.28  christos 	}
    361      1.28  christos 
    362      1.29     skrll 	if (def != NULL)
    363      1.29     skrll 		*defobj_out = defobj;
    364      1.29     skrll 	return def;
    365       1.1       cgd }
    366