map_object.c revision 1.62 1 /* $NetBSD: map_object.c,v 1.62 2022/03/30 08:26:45 hannken Exp $ */
2
3 /*
4 * Copyright 1996 John D. Polstra.
5 * Copyright 1996 Matt Thomas <matt (at) 3am-software.com>
6 * Copyright 2002 Charles M. Hannum <root (at) ihack.net>
7 * All rights reserved.
8 *
9 * Redistribution and use in source and binary forms, with or without
10 * modification, are permitted provided that the following conditions
11 * are met:
12 * 1. Redistributions of source code must retain the above copyright
13 * notice, this list of conditions and the following disclaimer.
14 * 2. Redistributions in binary form must reproduce the above copyright
15 * notice, this list of conditions and the following disclaimer in the
16 * documentation and/or other materials provided with the distribution.
17 * 3. All advertising materials mentioning features or use of this software
18 * must display the following acknowledgement:
19 * This product includes software developed by John Polstra.
20 * 4. The name of the author may not be used to endorse or promote products
21 * derived from this software without specific prior written permission.
22 *
23 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
24 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
25 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
26 * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
27 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
28 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
29 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
30 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
31 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
32 * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
33 */
34
35 #include <sys/cdefs.h>
36 #ifndef lint
37 __RCSID("$NetBSD: map_object.c,v 1.62 2022/03/30 08:26:45 hannken Exp $");
38 #endif /* not lint */
39
40 #include <errno.h>
41 #include <stddef.h>
42 #include <stdlib.h>
43 #include <string.h>
44 #include <unistd.h>
45 #include <sys/stat.h>
46 #include <sys/types.h>
47 #include <sys/mman.h>
48
49 #include "debug.h"
50 #include "rtld.h"
51
52 static int protflags(int); /* Elf flags -> mmap protection */
53
54 #define EA_UNDEF (~(Elf_Addr)0)
55
56 /*
57 * Map a shared object into memory. The argument is a file descriptor,
58 * which must be open on the object and positioned at its beginning.
59 *
60 * The return value is a pointer to a newly-allocated Obj_Entry structure
61 * for the shared object. Returns NULL on failure.
62 */
63 Obj_Entry *
64 _rtld_map_object(const char *path, int fd, const struct stat *sb)
65 {
66 Obj_Entry *obj;
67 Elf_Ehdr *ehdr;
68 Elf_Phdr *phdr;
69 #if defined(__HAVE_TLS_VARIANT_I) || defined(__HAVE_TLS_VARIANT_II)
70 Elf_Phdr *phtls;
71 #endif
72 size_t phsize;
73 Elf_Phdr *phlimit;
74 Elf_Phdr *segs[2];
75 int nsegs;
76 caddr_t mapbase = MAP_FAILED;
77 size_t mapsize = 0;
78 int mapflags;
79 Elf_Off base_offset;
80 Elf_Addr base_alignment;
81 Elf_Addr base_vaddr;
82 Elf_Addr base_vlimit;
83 Elf_Addr text_vlimit;
84 int text_flags;
85 void *base_addr;
86 Elf_Off data_offset;
87 Elf_Addr data_vaddr;
88 Elf_Addr data_vlimit;
89 int data_flags;
90 caddr_t data_addr;
91 #if defined(__HAVE_TLS_VARIANT_I) || defined(__HAVE_TLS_VARIANT_II)
92 Elf_Addr tls_vaddr = 0; /* Noise GCC */
93 #endif
94 Elf_Addr phdr_vaddr;
95 size_t phdr_memsz;
96 caddr_t gap_addr;
97 size_t gap_size;
98 int i;
99 #ifdef RTLD_LOADER
100 Elf_Addr clear_vaddr;
101 caddr_t clear_addr;
102 size_t nclear;
103 #endif
104 #ifdef GNU_RELRO
105 Elf_Addr relro_page;
106 size_t relro_size;
107 #endif
108
109 if (sb != NULL && sb->st_size < (off_t)sizeof (Elf_Ehdr)) {
110 _rtld_error("%s: not ELF file (too short)", path);
111 return NULL;
112 }
113
114 obj = _rtld_obj_new();
115 obj->path = xstrdup(path);
116 obj->pathlen = strlen(path);
117 if (sb != NULL) {
118 obj->dev = sb->st_dev;
119 obj->ino = sb->st_ino;
120 }
121
122 ehdr = mmap(NULL, _rtld_pagesz, PROT_READ, MAP_FILE | MAP_SHARED, fd,
123 (off_t)0);
124 obj->ehdr = ehdr;
125 if (ehdr == MAP_FAILED) {
126 _rtld_error("%s: read error: %s", path, xstrerror(errno));
127 goto bad;
128 }
129 /* Make sure the file is valid */
130 if (memcmp(ELFMAG, ehdr->e_ident, SELFMAG) != 0) {
131 _rtld_error("%s: not ELF file (magic number bad)", path);
132 goto bad;
133 }
134 if (ehdr->e_ident[EI_CLASS] != ELFCLASS) {
135 _rtld_error("%s: invalid ELF class %x; expected %x", path,
136 ehdr->e_ident[EI_CLASS], ELFCLASS);
137 goto bad;
138 }
139 /* Elf_e_ident includes class */
140 if (ehdr->e_ident[EI_VERSION] != EV_CURRENT ||
141 ehdr->e_version != EV_CURRENT ||
142 ehdr->e_ident[EI_DATA] != ELFDEFNNAME(MACHDEP_ENDIANNESS)) {
143 _rtld_error("%s: unsupported file version", path);
144 goto bad;
145 }
146 if (ehdr->e_type != ET_EXEC && ehdr->e_type != ET_DYN) {
147 _rtld_error("%s: unsupported file type", path);
148 goto bad;
149 }
150 switch (ehdr->e_machine) {
151 ELFDEFNNAME(MACHDEP_ID_CASES)
152 default:
153 _rtld_error("%s: unsupported machine", path);
154 goto bad;
155 }
156
157 /*
158 * We rely on the program header being in the first page. This is
159 * not strictly required by the ABI specification, but it seems to
160 * always true in practice. And, it simplifies things considerably.
161 */
162 assert(ehdr->e_phentsize == sizeof(Elf_Phdr));
163 assert(ehdr->e_phoff + ehdr->e_phnum * sizeof(Elf_Phdr) <=
164 _rtld_pagesz);
165
166 /*
167 * Scan the program header entries, and save key information.
168 *
169 * We rely on there being exactly two load segments, text and data,
170 * in that order.
171 */
172 phdr = (Elf_Phdr *) ((caddr_t)ehdr + ehdr->e_phoff);
173 #if defined(__HAVE_TLS_VARIANT_I) || defined(__HAVE_TLS_VARIANT_II)
174 phtls = NULL;
175 #endif
176 phsize = ehdr->e_phnum * sizeof(phdr[0]);
177 obj->phdr = NULL;
178 #ifdef GNU_RELRO
179 relro_page = 0;
180 relro_size = 0;
181 #endif
182 phdr_vaddr = EA_UNDEF;
183 phdr_memsz = 0;
184 phlimit = phdr + ehdr->e_phnum;
185 nsegs = 0;
186 while (phdr < phlimit) {
187 switch (phdr->p_type) {
188 case PT_INTERP:
189 obj->interp = (void *)(uintptr_t)phdr->p_vaddr;
190 dbg(("%s: PT_INTERP %p", obj->path, obj->interp));
191 break;
192
193 case PT_LOAD:
194 if (nsegs < 2)
195 segs[nsegs] = phdr;
196 ++nsegs;
197
198 dbg(("%s: %s %p phsize %" PRImemsz, obj->path, "PT_LOAD",
199 (void *)(uintptr_t)phdr->p_vaddr, phdr->p_memsz));
200 break;
201
202 case PT_PHDR:
203 phdr_vaddr = phdr->p_vaddr;
204 phdr_memsz = phdr->p_memsz;
205 dbg(("%s: %s %p phsize %" PRImemsz, obj->path, "PT_PHDR",
206 (void *)(uintptr_t)phdr->p_vaddr, phdr->p_memsz));
207 break;
208
209 #ifdef GNU_RELRO
210 case PT_GNU_RELRO:
211 relro_page = phdr->p_vaddr;
212 relro_size = phdr->p_memsz;
213 break;
214 #endif
215
216 case PT_DYNAMIC:
217 obj->dynamic = (void *)(uintptr_t)phdr->p_vaddr;
218 dbg(("%s: %s %p phsize %" PRImemsz, obj->path, "PT_DYNAMIC",
219 (void *)(uintptr_t)phdr->p_vaddr, phdr->p_memsz));
220 break;
221
222 #if defined(__HAVE_TLS_VARIANT_I) || defined(__HAVE_TLS_VARIANT_II)
223 case PT_TLS:
224 phtls = phdr;
225 dbg(("%s: %s %p phsize %" PRImemsz, obj->path, "PT_TLS",
226 (void *)(uintptr_t)phdr->p_vaddr, phdr->p_memsz));
227 break;
228 #endif
229 #ifdef __ARM_EABI__
230 case PT_ARM_EXIDX:
231 obj->exidx_start = (void *)(uintptr_t)phdr->p_vaddr;
232 obj->exidx_sz = phdr->p_memsz;
233 break;
234 #endif
235 }
236
237 ++phdr;
238 }
239 phdr = (Elf_Phdr *) ((caddr_t)ehdr + ehdr->e_phoff);
240 obj->entry = (void *)(uintptr_t)ehdr->e_entry;
241 if (!obj->dynamic) {
242 _rtld_error("%s: not dynamically linked", path);
243 goto bad;
244 }
245 if (nsegs != 2) {
246 _rtld_error("%s: wrong number of segments (%d != 2)", path,
247 nsegs);
248 goto bad;
249 }
250
251 /*
252 * Map the entire address space of the object as a file
253 * region to stake out our contiguous region and establish a
254 * base for relocation. We use a file mapping so that
255 * the kernel will give us whatever alignment is appropriate
256 * for the platform we're running on.
257 *
258 * We map it using the text protection, map the data segment
259 * into the right place, then map an anon segment for the bss
260 * and unmap the gaps left by padding to alignment.
261 */
262
263 base_alignment = segs[0]->p_align;
264 base_offset = round_down(segs[0]->p_offset);
265 base_vaddr = round_down(segs[0]->p_vaddr);
266 base_vlimit = round_up(segs[1]->p_vaddr + segs[1]->p_memsz);
267 text_vlimit = round_up(segs[0]->p_vaddr + segs[0]->p_memsz);
268 text_flags = protflags(segs[0]->p_flags);
269 data_offset = round_down(segs[1]->p_offset);
270 data_vaddr = round_down(segs[1]->p_vaddr);
271 data_vlimit = round_up(segs[1]->p_vaddr + segs[1]->p_filesz);
272 data_flags = protflags(segs[1]->p_flags);
273 #ifdef RTLD_LOADER
274 clear_vaddr = segs[1]->p_vaddr + segs[1]->p_filesz;
275 #endif
276
277 obj->textsize = text_vlimit - base_vaddr;
278 obj->vaddrbase = base_vaddr;
279 obj->isdynamic = ehdr->e_type == ET_DYN;
280
281 #if defined(__HAVE_TLS_VARIANT_I) || defined(__HAVE_TLS_VARIANT_II)
282 if (phtls != NULL) {
283 ++_rtld_tls_dtv_generation;
284 obj->tlsindex = ++_rtld_tls_max_index;
285 obj->tlssize = phtls->p_memsz;
286 obj->tlsalign = phtls->p_align;
287 obj->tlsinitsize = phtls->p_filesz;
288 tls_vaddr = phtls->p_vaddr;
289 }
290 #endif
291
292 obj->phdr_loaded = false;
293 for (i = 0; i < nsegs; i++) {
294 if (phdr_vaddr != EA_UNDEF &&
295 segs[i]->p_vaddr <= phdr_vaddr &&
296 segs[i]->p_memsz >= phdr_memsz) {
297 obj->phdr_loaded = true;
298 break;
299 }
300 if (segs[i]->p_offset <= ehdr->e_phoff &&
301 segs[i]->p_memsz >= phsize) {
302 phdr_vaddr = segs[i]->p_vaddr + ehdr->e_phoff;
303 phdr_memsz = phsize;
304 obj->phdr_loaded = true;
305 break;
306 }
307 }
308 if (obj->phdr_loaded) {
309 obj->phdr = (void *)(uintptr_t)phdr_vaddr;
310 obj->phsize = phdr_memsz;
311 } else {
312 Elf_Phdr *buf;
313 buf = xmalloc(phsize);
314 if (buf == NULL) {
315 _rtld_error("%s: cannot allocate program header", path);
316 goto bad;
317 }
318 memcpy(buf, phdr, phsize);
319 obj->phdr = buf;
320 obj->phsize = phsize;
321 }
322 dbg(("%s: phdr %p phsize %zu (%s)", obj->path, obj->phdr, obj->phsize,
323 obj->phdr_loaded ? "loaded" : "allocated"));
324
325 /* Unmap header if it overlaps the first load section. */
326 if (base_offset < _rtld_pagesz) {
327 munmap(ehdr, _rtld_pagesz);
328 obj->ehdr = MAP_FAILED;
329 }
330
331 /*
332 * Calculate log2 of the base section alignment.
333 */
334 mapflags = 0;
335 if (base_alignment > _rtld_pagesz) {
336 unsigned int log2 = 0;
337 for (; base_alignment > 1; base_alignment >>= 1)
338 log2++;
339 mapflags = MAP_ALIGNED(log2);
340 }
341
342 base_addr = NULL;
343 #ifdef RTLD_LOADER
344 if (!obj->isdynamic) {
345 mapflags |= MAP_TRYFIXED;
346 base_addr = (void *)(uintptr_t)base_vaddr;
347 }
348 #endif
349 mapsize = base_vlimit - base_vaddr;
350 mapbase = mmap(base_addr, mapsize, text_flags,
351 mapflags | MAP_FILE | MAP_PRIVATE, fd, base_offset);
352 if (mapbase == MAP_FAILED) {
353 _rtld_error("mmap of entire address space failed: %s",
354 xstrerror(errno));
355 goto bad;
356 }
357 #ifdef RTLD_LOADER
358 if (!obj->isdynamic && mapbase != base_addr) {
359 _rtld_error("mmap of executable at correct address failed");
360 goto bad;
361 }
362 #endif
363
364 /* Overlay the data segment onto the proper region. */
365 data_addr = mapbase + (data_vaddr - base_vaddr);
366 if (mmap(data_addr, data_vlimit - data_vaddr, data_flags,
367 MAP_FILE | MAP_PRIVATE | MAP_FIXED, fd, data_offset) ==
368 MAP_FAILED) {
369 _rtld_error("mmap of data failed: %s", xstrerror(errno));
370 goto bad;
371 }
372
373 /* Overlay the bss segment onto the proper region. */
374 if (base_vlimit > data_vlimit) {
375 if (mmap(mapbase + data_vlimit - base_vaddr,
376 base_vlimit - data_vlimit, data_flags,
377 MAP_ANON | MAP_PRIVATE | MAP_FIXED, -1, 0) == MAP_FAILED) {
378 _rtld_error("mmap of bss failed: %s", xstrerror(errno));
379 goto bad;
380 }
381 }
382
383 /* Unmap the gap between the text and data. */
384 gap_addr = mapbase + round_up(text_vlimit - base_vaddr);
385 gap_size = data_addr - gap_addr;
386 if (gap_size != 0 && mprotect(gap_addr, gap_size, PROT_NONE) == -1) {
387 _rtld_error("mprotect of text -> data gap failed: %s",
388 xstrerror(errno));
389 goto bad;
390 }
391
392 #ifdef RTLD_LOADER
393 /* Clear any BSS in the last page of the data segment. */
394 clear_addr = mapbase + (clear_vaddr - base_vaddr);
395 if ((nclear = data_vlimit - clear_vaddr) > 0)
396 memset(clear_addr, 0, nclear);
397
398 /* Non-file portion of BSS mapped above. */
399 #endif
400
401 #if defined(__HAVE_TLS_VARIANT_I) || defined(__HAVE_TLS_VARIANT_II)
402 if (phtls != NULL)
403 obj->tlsinit = mapbase + tls_vaddr;
404 #endif
405
406 obj->mapbase = mapbase;
407 obj->mapsize = mapsize;
408 obj->relocbase = mapbase - base_vaddr;
409
410 #ifdef GNU_RELRO
411 /* rounding happens later. */
412 obj->relro_page = obj->relocbase + relro_page;
413 obj->relro_size = relro_size;
414 #endif
415
416 if (obj->dynamic)
417 obj->dynamic = (void *)(obj->relocbase + (Elf_Addr)(uintptr_t)obj->dynamic);
418 if (obj->entry)
419 obj->entry = (void *)(obj->relocbase + (Elf_Addr)(uintptr_t)obj->entry);
420 if (obj->interp)
421 obj->interp = (void *)(obj->relocbase + (Elf_Addr)(uintptr_t)obj->interp);
422 if (obj->phdr_loaded)
423 obj->phdr = (void *)(obj->relocbase + (Elf_Addr)(uintptr_t)obj->phdr);
424 #ifdef __ARM_EABI__
425 if (obj->exidx_start)
426 obj->exidx_start = (void *)(obj->relocbase + (Elf_Addr)(uintptr_t)obj->exidx_start);
427 #endif
428
429 return obj;
430
431 bad:
432 if (obj->ehdr != MAP_FAILED)
433 munmap(obj->ehdr, _rtld_pagesz);
434 if (mapbase != MAP_FAILED)
435 munmap(mapbase, mapsize);
436 _rtld_obj_free(obj);
437 return NULL;
438 }
439
440 void
441 _rtld_obj_free(Obj_Entry *obj)
442 {
443 Objlist_Entry *elm;
444 Name_Entry *entry;
445
446 #if defined(__HAVE_TLS_VARIANT_I) || defined(__HAVE_TLS_VARIANT_II)
447 if (obj->tls_done)
448 _rtld_tls_offset_free(obj);
449 #endif
450 xfree(obj->path);
451 while (obj->needed != NULL) {
452 Needed_Entry *needed = obj->needed;
453 obj->needed = needed->next;
454 xfree(needed);
455 }
456 while ((entry = SIMPLEQ_FIRST(&obj->names)) != NULL) {
457 SIMPLEQ_REMOVE_HEAD(&obj->names, link);
458 xfree(entry);
459 }
460 while ((elm = SIMPLEQ_FIRST(&obj->dldags)) != NULL) {
461 SIMPLEQ_REMOVE_HEAD(&obj->dldags, link);
462 xfree(elm);
463 }
464 while ((elm = SIMPLEQ_FIRST(&obj->dagmembers)) != NULL) {
465 SIMPLEQ_REMOVE_HEAD(&obj->dagmembers, link);
466 xfree(elm);
467 }
468 if (!obj->phdr_loaded)
469 xfree((void *)(uintptr_t)obj->phdr);
470 xfree(obj);
471 }
472
473 Obj_Entry *
474 _rtld_obj_new(void)
475 {
476 Obj_Entry *obj;
477
478 obj = CNEW(Obj_Entry);
479 SIMPLEQ_INIT(&obj->names);
480 SIMPLEQ_INIT(&obj->dldags);
481 SIMPLEQ_INIT(&obj->dagmembers);
482 return obj;
483 }
484
485 /*
486 * Given a set of ELF protection flags, return the corresponding protection
487 * flags for MMAP.
488 */
489 static int
490 protflags(int elfflags)
491 {
492 int prot = 0;
493
494 if (elfflags & PF_R)
495 prot |= PROT_READ;
496 #ifdef RTLD_LOADER
497 if (elfflags & PF_W)
498 prot |= PROT_WRITE;
499 #endif
500 if (elfflags & PF_X)
501 prot |= PROT_EXEC;
502 return prot;
503 }
504