Home | History | Annotate | Line # | Download | only in ld.elf_so
map_object.c revision 1.62
      1 /*	$NetBSD: map_object.c,v 1.62 2022/03/30 08:26:45 hannken Exp $	 */
      2 
      3 /*
      4  * Copyright 1996 John D. Polstra.
      5  * Copyright 1996 Matt Thomas <matt (at) 3am-software.com>
      6  * Copyright 2002 Charles M. Hannum <root (at) ihack.net>
      7  * All rights reserved.
      8  *
      9  * Redistribution and use in source and binary forms, with or without
     10  * modification, are permitted provided that the following conditions
     11  * are met:
     12  * 1. Redistributions of source code must retain the above copyright
     13  *    notice, this list of conditions and the following disclaimer.
     14  * 2. Redistributions in binary form must reproduce the above copyright
     15  *    notice, this list of conditions and the following disclaimer in the
     16  *    documentation and/or other materials provided with the distribution.
     17  * 3. All advertising materials mentioning features or use of this software
     18  *    must display the following acknowledgement:
     19  *      This product includes software developed by John Polstra.
     20  * 4. The name of the author may not be used to endorse or promote products
     21  *    derived from this software without specific prior written permission.
     22  *
     23  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
     24  * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
     25  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
     26  * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
     27  * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
     28  * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
     29  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
     30  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
     31  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
     32  * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
     33  */
     34 
     35 #include <sys/cdefs.h>
     36 #ifndef lint
     37 __RCSID("$NetBSD: map_object.c,v 1.62 2022/03/30 08:26:45 hannken Exp $");
     38 #endif /* not lint */
     39 
     40 #include <errno.h>
     41 #include <stddef.h>
     42 #include <stdlib.h>
     43 #include <string.h>
     44 #include <unistd.h>
     45 #include <sys/stat.h>
     46 #include <sys/types.h>
     47 #include <sys/mman.h>
     48 
     49 #include "debug.h"
     50 #include "rtld.h"
     51 
     52 static int protflags(int);	/* Elf flags -> mmap protection */
     53 
     54 #define EA_UNDEF		(~(Elf_Addr)0)
     55 
     56 /*
     57  * Map a shared object into memory.  The argument is a file descriptor,
     58  * which must be open on the object and positioned at its beginning.
     59  *
     60  * The return value is a pointer to a newly-allocated Obj_Entry structure
     61  * for the shared object.  Returns NULL on failure.
     62  */
     63 Obj_Entry *
     64 _rtld_map_object(const char *path, int fd, const struct stat *sb)
     65 {
     66 	Obj_Entry	*obj;
     67 	Elf_Ehdr	*ehdr;
     68 	Elf_Phdr	*phdr;
     69 #if defined(__HAVE_TLS_VARIANT_I) || defined(__HAVE_TLS_VARIANT_II)
     70 	Elf_Phdr	*phtls;
     71 #endif
     72 	size_t		 phsize;
     73 	Elf_Phdr	*phlimit;
     74 	Elf_Phdr	*segs[2];
     75 	int		 nsegs;
     76 	caddr_t		 mapbase = MAP_FAILED;
     77 	size_t		 mapsize = 0;
     78 	int		 mapflags;
     79 	Elf_Off		 base_offset;
     80 	Elf_Addr	 base_alignment;
     81 	Elf_Addr	 base_vaddr;
     82 	Elf_Addr	 base_vlimit;
     83 	Elf_Addr	 text_vlimit;
     84 	int		 text_flags;
     85 	void		*base_addr;
     86 	Elf_Off		 data_offset;
     87 	Elf_Addr	 data_vaddr;
     88 	Elf_Addr	 data_vlimit;
     89 	int		 data_flags;
     90 	caddr_t		 data_addr;
     91 #if defined(__HAVE_TLS_VARIANT_I) || defined(__HAVE_TLS_VARIANT_II)
     92 	Elf_Addr	 tls_vaddr = 0; /* Noise GCC */
     93 #endif
     94 	Elf_Addr	 phdr_vaddr;
     95 	size_t		 phdr_memsz;
     96 	caddr_t		 gap_addr;
     97 	size_t		 gap_size;
     98 	int i;
     99 #ifdef RTLD_LOADER
    100 	Elf_Addr	 clear_vaddr;
    101 	caddr_t		 clear_addr;
    102 	size_t		 nclear;
    103 #endif
    104 #ifdef GNU_RELRO
    105 	Elf_Addr 	 relro_page;
    106 	size_t		 relro_size;
    107 #endif
    108 
    109 	if (sb != NULL && sb->st_size < (off_t)sizeof (Elf_Ehdr)) {
    110 		_rtld_error("%s: not ELF file (too short)", path);
    111 		return NULL;
    112 	}
    113 
    114 	obj = _rtld_obj_new();
    115 	obj->path = xstrdup(path);
    116 	obj->pathlen = strlen(path);
    117 	if (sb != NULL) {
    118 		obj->dev = sb->st_dev;
    119 		obj->ino = sb->st_ino;
    120 	}
    121 
    122 	ehdr = mmap(NULL, _rtld_pagesz, PROT_READ, MAP_FILE | MAP_SHARED, fd,
    123 	    (off_t)0);
    124 	obj->ehdr = ehdr;
    125 	if (ehdr == MAP_FAILED) {
    126 		_rtld_error("%s: read error: %s", path, xstrerror(errno));
    127 		goto bad;
    128 	}
    129 	/* Make sure the file is valid */
    130 	if (memcmp(ELFMAG, ehdr->e_ident, SELFMAG) != 0) {
    131 		_rtld_error("%s: not ELF file (magic number bad)", path);
    132 		goto bad;
    133 	}
    134 	if (ehdr->e_ident[EI_CLASS] != ELFCLASS) {
    135 		_rtld_error("%s: invalid ELF class %x; expected %x", path,
    136 		    ehdr->e_ident[EI_CLASS], ELFCLASS);
    137 		goto bad;
    138 	}
    139 	/* Elf_e_ident includes class */
    140 	if (ehdr->e_ident[EI_VERSION] != EV_CURRENT ||
    141 	    ehdr->e_version != EV_CURRENT ||
    142 	    ehdr->e_ident[EI_DATA] != ELFDEFNNAME(MACHDEP_ENDIANNESS)) {
    143 		_rtld_error("%s: unsupported file version", path);
    144 		goto bad;
    145 	}
    146 	if (ehdr->e_type != ET_EXEC && ehdr->e_type != ET_DYN) {
    147 		_rtld_error("%s: unsupported file type", path);
    148 		goto bad;
    149 	}
    150 	switch (ehdr->e_machine) {
    151 		ELFDEFNNAME(MACHDEP_ID_CASES)
    152 	default:
    153 		_rtld_error("%s: unsupported machine", path);
    154 		goto bad;
    155 	}
    156 
    157 	/*
    158          * We rely on the program header being in the first page.  This is
    159          * not strictly required by the ABI specification, but it seems to
    160          * always true in practice.  And, it simplifies things considerably.
    161          */
    162 	assert(ehdr->e_phentsize == sizeof(Elf_Phdr));
    163 	assert(ehdr->e_phoff + ehdr->e_phnum * sizeof(Elf_Phdr) <=
    164 	    _rtld_pagesz);
    165 
    166 	/*
    167          * Scan the program header entries, and save key information.
    168          *
    169          * We rely on there being exactly two load segments, text and data,
    170          * in that order.
    171          */
    172 	phdr = (Elf_Phdr *) ((caddr_t)ehdr + ehdr->e_phoff);
    173 #if defined(__HAVE_TLS_VARIANT_I) || defined(__HAVE_TLS_VARIANT_II)
    174 	phtls = NULL;
    175 #endif
    176 	phsize = ehdr->e_phnum * sizeof(phdr[0]);
    177 	obj->phdr = NULL;
    178 #ifdef GNU_RELRO
    179 	relro_page = 0;
    180 	relro_size = 0;
    181 #endif
    182 	phdr_vaddr = EA_UNDEF;
    183 	phdr_memsz = 0;
    184 	phlimit = phdr + ehdr->e_phnum;
    185 	nsegs = 0;
    186 	while (phdr < phlimit) {
    187 		switch (phdr->p_type) {
    188 		case PT_INTERP:
    189 			obj->interp = (void *)(uintptr_t)phdr->p_vaddr;
    190  			dbg(("%s: PT_INTERP %p", obj->path, obj->interp));
    191 			break;
    192 
    193 		case PT_LOAD:
    194 			if (nsegs < 2)
    195 				segs[nsegs] = phdr;
    196 			++nsegs;
    197 
    198 			dbg(("%s: %s %p phsize %" PRImemsz, obj->path, "PT_LOAD",
    199 			    (void *)(uintptr_t)phdr->p_vaddr, phdr->p_memsz));
    200 			break;
    201 
    202 		case PT_PHDR:
    203 			phdr_vaddr = phdr->p_vaddr;
    204 			phdr_memsz = phdr->p_memsz;
    205 			dbg(("%s: %s %p phsize %" PRImemsz, obj->path, "PT_PHDR",
    206 			    (void *)(uintptr_t)phdr->p_vaddr, phdr->p_memsz));
    207 			break;
    208 
    209 #ifdef GNU_RELRO
    210 		case PT_GNU_RELRO:
    211 			relro_page = phdr->p_vaddr;
    212 			relro_size = phdr->p_memsz;
    213 			break;
    214 #endif
    215 
    216 		case PT_DYNAMIC:
    217 			obj->dynamic = (void *)(uintptr_t)phdr->p_vaddr;
    218 			dbg(("%s: %s %p phsize %" PRImemsz, obj->path, "PT_DYNAMIC",
    219 			    (void *)(uintptr_t)phdr->p_vaddr, phdr->p_memsz));
    220 			break;
    221 
    222 #if defined(__HAVE_TLS_VARIANT_I) || defined(__HAVE_TLS_VARIANT_II)
    223 		case PT_TLS:
    224 			phtls = phdr;
    225 			dbg(("%s: %s %p phsize %" PRImemsz, obj->path, "PT_TLS",
    226 			    (void *)(uintptr_t)phdr->p_vaddr, phdr->p_memsz));
    227 			break;
    228 #endif
    229 #ifdef __ARM_EABI__
    230 		case PT_ARM_EXIDX:
    231 			obj->exidx_start = (void *)(uintptr_t)phdr->p_vaddr;
    232 			obj->exidx_sz = phdr->p_memsz;
    233 			break;
    234 #endif
    235 		}
    236 
    237 		++phdr;
    238 	}
    239 	phdr = (Elf_Phdr *) ((caddr_t)ehdr + ehdr->e_phoff);
    240 	obj->entry = (void *)(uintptr_t)ehdr->e_entry;
    241 	if (!obj->dynamic) {
    242 		_rtld_error("%s: not dynamically linked", path);
    243 		goto bad;
    244 	}
    245 	if (nsegs != 2) {
    246 		_rtld_error("%s: wrong number of segments (%d != 2)", path,
    247 		    nsegs);
    248 		goto bad;
    249 	}
    250 
    251 	/*
    252 	 * Map the entire address space of the object as a file
    253 	 * region to stake out our contiguous region and establish a
    254 	 * base for relocation.  We use a file mapping so that
    255 	 * the kernel will give us whatever alignment is appropriate
    256 	 * for the platform we're running on.
    257 	 *
    258 	 * We map it using the text protection, map the data segment
    259 	 * into the right place, then map an anon segment for the bss
    260 	 * and unmap the gaps left by padding to alignment.
    261 	 */
    262 
    263 	base_alignment = segs[0]->p_align;
    264 	base_offset = round_down(segs[0]->p_offset);
    265 	base_vaddr = round_down(segs[0]->p_vaddr);
    266 	base_vlimit = round_up(segs[1]->p_vaddr + segs[1]->p_memsz);
    267 	text_vlimit = round_up(segs[0]->p_vaddr + segs[0]->p_memsz);
    268 	text_flags = protflags(segs[0]->p_flags);
    269 	data_offset = round_down(segs[1]->p_offset);
    270 	data_vaddr = round_down(segs[1]->p_vaddr);
    271 	data_vlimit = round_up(segs[1]->p_vaddr + segs[1]->p_filesz);
    272 	data_flags = protflags(segs[1]->p_flags);
    273 #ifdef RTLD_LOADER
    274 	clear_vaddr = segs[1]->p_vaddr + segs[1]->p_filesz;
    275 #endif
    276 
    277 	obj->textsize = text_vlimit - base_vaddr;
    278 	obj->vaddrbase = base_vaddr;
    279 	obj->isdynamic = ehdr->e_type == ET_DYN;
    280 
    281 #if defined(__HAVE_TLS_VARIANT_I) || defined(__HAVE_TLS_VARIANT_II)
    282 	if (phtls != NULL) {
    283 		++_rtld_tls_dtv_generation;
    284 		obj->tlsindex = ++_rtld_tls_max_index;
    285 		obj->tlssize = phtls->p_memsz;
    286 		obj->tlsalign = phtls->p_align;
    287 		obj->tlsinitsize = phtls->p_filesz;
    288 		tls_vaddr = phtls->p_vaddr;
    289 	}
    290 #endif
    291 
    292 	obj->phdr_loaded = false;
    293 	for (i = 0; i < nsegs; i++) {
    294 		if (phdr_vaddr != EA_UNDEF &&
    295 		    segs[i]->p_vaddr <= phdr_vaddr &&
    296 		    segs[i]->p_memsz >= phdr_memsz) {
    297 			obj->phdr_loaded = true;
    298 			break;
    299 		}
    300 		if (segs[i]->p_offset <= ehdr->e_phoff &&
    301 		    segs[i]->p_memsz >= phsize) {
    302 			phdr_vaddr = segs[i]->p_vaddr + ehdr->e_phoff;
    303 			phdr_memsz = phsize;
    304 			obj->phdr_loaded = true;
    305 			break;
    306 		}
    307 	}
    308 	if (obj->phdr_loaded) {
    309 		obj->phdr = (void *)(uintptr_t)phdr_vaddr;
    310 		obj->phsize = phdr_memsz;
    311 	} else {
    312 		Elf_Phdr *buf;
    313 		buf = xmalloc(phsize);
    314 		if (buf == NULL) {
    315 			_rtld_error("%s: cannot allocate program header", path);
    316 			goto bad;
    317 		}
    318 		memcpy(buf, phdr, phsize);
    319 		obj->phdr = buf;
    320 		obj->phsize = phsize;
    321 	}
    322 	dbg(("%s: phdr %p phsize %zu (%s)", obj->path, obj->phdr, obj->phsize,
    323 	     obj->phdr_loaded ? "loaded" : "allocated"));
    324 
    325 	/* Unmap header if it overlaps the first load section. */
    326 	if (base_offset < _rtld_pagesz) {
    327 		munmap(ehdr, _rtld_pagesz);
    328 		obj->ehdr = MAP_FAILED;
    329 	}
    330 
    331 	/*
    332 	 * Calculate log2 of the base section alignment.
    333 	 */
    334 	mapflags = 0;
    335 	if (base_alignment > _rtld_pagesz) {
    336 		unsigned int log2 = 0;
    337 		for (; base_alignment > 1; base_alignment >>= 1)
    338 			log2++;
    339 		mapflags = MAP_ALIGNED(log2);
    340 	}
    341 
    342 	base_addr = NULL;
    343 #ifdef RTLD_LOADER
    344 	if (!obj->isdynamic) {
    345 		mapflags |= MAP_TRYFIXED;
    346 		base_addr = (void *)(uintptr_t)base_vaddr;
    347 	}
    348 #endif
    349 	mapsize = base_vlimit - base_vaddr;
    350 	mapbase = mmap(base_addr, mapsize, text_flags,
    351 	    mapflags | MAP_FILE | MAP_PRIVATE, fd, base_offset);
    352 	if (mapbase == MAP_FAILED) {
    353 		_rtld_error("mmap of entire address space failed: %s",
    354 		    xstrerror(errno));
    355 		goto bad;
    356 	}
    357 #ifdef RTLD_LOADER
    358 	if (!obj->isdynamic && mapbase != base_addr) {
    359 		_rtld_error("mmap of executable at correct address failed");
    360 		goto bad;
    361 	}
    362 #endif
    363 
    364 	/* Overlay the data segment onto the proper region. */
    365 	data_addr = mapbase + (data_vaddr - base_vaddr);
    366 	if (mmap(data_addr, data_vlimit - data_vaddr, data_flags,
    367 	    MAP_FILE | MAP_PRIVATE | MAP_FIXED, fd, data_offset) ==
    368 	    MAP_FAILED) {
    369 		_rtld_error("mmap of data failed: %s", xstrerror(errno));
    370 		goto bad;
    371 	}
    372 
    373 	/* Overlay the bss segment onto the proper region. */
    374 	if (base_vlimit > data_vlimit) {
    375 		if (mmap(mapbase + data_vlimit - base_vaddr,
    376 		    base_vlimit - data_vlimit, data_flags,
    377 		    MAP_ANON | MAP_PRIVATE | MAP_FIXED, -1, 0) == MAP_FAILED) {
    378 			_rtld_error("mmap of bss failed: %s", xstrerror(errno));
    379 			goto bad;
    380 		}
    381 	}
    382 
    383 	/* Unmap the gap between the text and data. */
    384 	gap_addr = mapbase + round_up(text_vlimit - base_vaddr);
    385 	gap_size = data_addr - gap_addr;
    386 	if (gap_size != 0 && mprotect(gap_addr, gap_size, PROT_NONE) == -1) {
    387 		_rtld_error("mprotect of text -> data gap failed: %s",
    388 		    xstrerror(errno));
    389 		goto bad;
    390 	}
    391 
    392 #ifdef RTLD_LOADER
    393 	/* Clear any BSS in the last page of the data segment. */
    394 	clear_addr = mapbase + (clear_vaddr - base_vaddr);
    395 	if ((nclear = data_vlimit - clear_vaddr) > 0)
    396 		memset(clear_addr, 0, nclear);
    397 
    398 	/* Non-file portion of BSS mapped above. */
    399 #endif
    400 
    401 #if defined(__HAVE_TLS_VARIANT_I) || defined(__HAVE_TLS_VARIANT_II)
    402 	if (phtls != NULL)
    403 		obj->tlsinit = mapbase + tls_vaddr;
    404 #endif
    405 
    406 	obj->mapbase = mapbase;
    407 	obj->mapsize = mapsize;
    408 	obj->relocbase = mapbase - base_vaddr;
    409 
    410 #ifdef GNU_RELRO
    411 	/* rounding happens later. */
    412 	obj->relro_page = obj->relocbase + relro_page;
    413 	obj->relro_size = relro_size;
    414 #endif
    415 
    416 	if (obj->dynamic)
    417 		obj->dynamic = (void *)(obj->relocbase + (Elf_Addr)(uintptr_t)obj->dynamic);
    418 	if (obj->entry)
    419 		obj->entry = (void *)(obj->relocbase + (Elf_Addr)(uintptr_t)obj->entry);
    420 	if (obj->interp)
    421 		obj->interp = (void *)(obj->relocbase + (Elf_Addr)(uintptr_t)obj->interp);
    422 	if (obj->phdr_loaded)
    423 		obj->phdr =  (void *)(obj->relocbase + (Elf_Addr)(uintptr_t)obj->phdr);
    424 #ifdef __ARM_EABI__
    425 	if (obj->exidx_start)
    426 		obj->exidx_start = (void *)(obj->relocbase + (Elf_Addr)(uintptr_t)obj->exidx_start);
    427 #endif
    428 
    429 	return obj;
    430 
    431 bad:
    432 	if (obj->ehdr != MAP_FAILED)
    433 		munmap(obj->ehdr, _rtld_pagesz);
    434 	if (mapbase != MAP_FAILED)
    435 		munmap(mapbase, mapsize);
    436 	_rtld_obj_free(obj);
    437 	return NULL;
    438 }
    439 
    440 void
    441 _rtld_obj_free(Obj_Entry *obj)
    442 {
    443 	Objlist_Entry *elm;
    444 	Name_Entry *entry;
    445 
    446 #if defined(__HAVE_TLS_VARIANT_I) || defined(__HAVE_TLS_VARIANT_II)
    447 	if (obj->tls_done)
    448 		_rtld_tls_offset_free(obj);
    449 #endif
    450 	xfree(obj->path);
    451 	while (obj->needed != NULL) {
    452 		Needed_Entry *needed = obj->needed;
    453 		obj->needed = needed->next;
    454 		xfree(needed);
    455 	}
    456 	while ((entry = SIMPLEQ_FIRST(&obj->names)) != NULL) {
    457 		SIMPLEQ_REMOVE_HEAD(&obj->names, link);
    458 		xfree(entry);
    459 	}
    460 	while ((elm = SIMPLEQ_FIRST(&obj->dldags)) != NULL) {
    461 		SIMPLEQ_REMOVE_HEAD(&obj->dldags, link);
    462 		xfree(elm);
    463 	}
    464 	while ((elm = SIMPLEQ_FIRST(&obj->dagmembers)) != NULL) {
    465 		SIMPLEQ_REMOVE_HEAD(&obj->dagmembers, link);
    466 		xfree(elm);
    467 	}
    468 	if (!obj->phdr_loaded)
    469 		xfree((void *)(uintptr_t)obj->phdr);
    470 	xfree(obj);
    471 }
    472 
    473 Obj_Entry *
    474 _rtld_obj_new(void)
    475 {
    476 	Obj_Entry *obj;
    477 
    478 	obj = CNEW(Obj_Entry);
    479 	SIMPLEQ_INIT(&obj->names);
    480 	SIMPLEQ_INIT(&obj->dldags);
    481 	SIMPLEQ_INIT(&obj->dagmembers);
    482 	return obj;
    483 }
    484 
    485 /*
    486  * Given a set of ELF protection flags, return the corresponding protection
    487  * flags for MMAP.
    488  */
    489 static int
    490 protflags(int elfflags)
    491 {
    492 	int prot = 0;
    493 
    494 	if (elfflags & PF_R)
    495 		prot |= PROT_READ;
    496 #ifdef RTLD_LOADER
    497 	if (elfflags & PF_W)
    498 		prot |= PROT_WRITE;
    499 #endif
    500 	if (elfflags & PF_X)
    501 		prot |= PROT_EXEC;
    502 	return prot;
    503 }
    504