alpha_reloc.c revision 1.20 1 /* $NetBSD: alpha_reloc.c,v 1.20 2002/09/21 17:51:44 mycroft Exp $ */
2
3 /*
4 * Copyright (c) 2001 Wasabi Systems, Inc.
5 * All rights reserved.
6 *
7 * Written by Jason R. Thorpe for Wasabi Systems, Inc.
8 *
9 * Redistribution and use in source and binary forms, with or without
10 * modification, are permitted provided that the following conditions
11 * are met:
12 * 1. Redistributions of source code must retain the above copyright
13 * notice, this list of conditions and the following disclaimer.
14 * 2. Redistributions in binary form must reproduce the above copyright
15 * notice, this list of conditions and the following disclaimer in the
16 * documentation and/or other materials provided with the distribution.
17 * 3. All advertising materials mentioning features or use of this software
18 * must display the following acknowledgement:
19 * This product includes software developed for the NetBSD Project by
20 * Wasabi Systems, Inc.
21 * 4. The name of Wasabi Systems, Inc. may not be used to endorse
22 * or promote products derived from this software without specific prior
23 * written permission.
24 *
25 * THIS SOFTWARE IS PROVIDED BY WASABI SYSTEMS, INC. ``AS IS'' AND
26 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
27 * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
28 * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL WASABI SYSTEMS, INC
29 * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
30 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
31 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
32 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
33 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
34 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
35 * POSSIBILITY OF SUCH DAMAGE.
36 */
37
38 /*
39 * Copyright 1996, 1997, 1998, 1999 John D. Polstra.
40 * All rights reserved.
41 *
42 * Redistribution and use in source and binary forms, with or without
43 * modification, are permitted provided that the following conditions
44 * are met:
45 * 1. Redistributions of source code must retain the above copyright
46 * notice, this list of conditions and the following disclaimer.
47 * 2. Redistributions in binary form must reproduce the above copyright
48 * notice, this list of conditions and the following disclaimer in the
49 * documentation and/or other materials provided with the distribution.
50 *
51 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
52 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
53 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
54 * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
55 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
56 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
57 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
58 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
59 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
60 * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
61 */
62
63 #include <sys/types.h>
64 #include <sys/stat.h>
65 #include <string.h>
66
67 #include "rtld.h"
68 #include "debug.h"
69
70 #ifdef RTLD_DEBUG_ALPHA
71 #define adbg(x) xprintf x
72 #else
73 #define adbg(x) /* nothing */
74 #endif
75
76 void _rtld_bind_start(void);
77 void _rtld_bind_start_old(void);
78 void _rtld_relocate_nonplt_self(Elf_Dyn *, Elf_Addr);
79
80 void
81 _rtld_setup_pltgot(const Obj_Entry *obj)
82 {
83 uint32_t word0;
84
85 /*
86 * The PLTGOT on the Alpha looks like this:
87 *
88 * PLT HEADER
89 * .
90 * . 32 bytes
91 * .
92 * PLT ENTRY #0
93 * .
94 * . 12 bytes
95 * .
96 * PLT ENTRY #1
97 * .
98 * . 12 bytes
99 * .
100 * etc.
101 *
102 * The old-format entries look like (displacements filled in
103 * by the linker):
104 *
105 * ldah $28, 0($31) # 0x279f0000
106 * lda $28, 0($28) # 0x239c0000
107 * br $31, plt0 # 0xc3e00000
108 *
109 * The new-format entries look like:
110 *
111 * br $28, plt0 # 0xc3800000
112 * # 0x00000000
113 * # 0x00000000
114 *
115 * What we do is fetch the first PLT entry and check to
116 * see the first word of it matches the first word of the
117 * old format. If so, we use a binding routine that can
118 * handle the old format, otherwise we use a binding routine
119 * that handles the new format.
120 *
121 * Note that this is done on a per-object basis, we can mix
122 * and match shared objects build with both the old and new
123 * linker.
124 */
125 word0 = *(uint32_t *)(((char *) obj->pltgot) + 32);
126 if ((word0 & 0xffff0000) == 0x279f0000) {
127 /* Old PLT entry format. */
128 adbg(("ALPHA: object %p has old PLT format\n", obj));
129 obj->pltgot[2] = (Elf_Addr) &_rtld_bind_start_old;
130 obj->pltgot[3] = (Elf_Addr) obj;
131 } else {
132 /* New PLT entry format. */
133 adbg(("ALPHA: object %p has new PLT format\n", obj));
134 obj->pltgot[2] = (Elf_Addr) &_rtld_bind_start;
135 obj->pltgot[3] = (Elf_Addr) obj;
136 }
137
138 __asm __volatile("imb");
139 }
140
141 /*
142 * It is possible for the compiler to emit relocations for unaligned data.
143 * We handle this situation with these inlines.
144 */
145 #define RELOC_ALIGNED_P(x) \
146 (((uintptr_t)(x) & (sizeof(void *) - 1)) == 0)
147
148 static __inline Elf_Addr
149 load_ptr(void *where)
150 {
151 Elf_Addr res;
152
153 memcpy(&res, where, sizeof(res));
154
155 return (res);
156 }
157
158 static __inline void
159 store_ptr(void *where, Elf_Addr val)
160 {
161
162 memcpy(where, &val, sizeof(val));
163 }
164
165 void
166 _rtld_relocate_nonplt_self(dynp, relocbase)
167 Elf_Dyn *dynp;
168 Elf_Addr relocbase;
169 {
170 const Elf_Rela *rela = 0, *relalim;
171 Elf_Addr relasz = 0;
172 Elf_Addr *where;
173
174 for (; dynp->d_tag != DT_NULL; dynp++) {
175 switch (dynp->d_tag) {
176 case DT_RELA:
177 rela = (const Elf_Rela *)(relocbase + dynp->d_un.d_ptr);
178 break;
179 case DT_RELASZ:
180 relasz = dynp->d_un.d_val;
181 break;
182 }
183 }
184 relalim = (const Elf_Rela *)((caddr_t)rela + relasz);
185 for (; rela < relalim; rela++) {
186 where = (Elf_Addr *)(relocbase + rela->r_offset);
187 /* XXX For some reason I see a few GLOB_DAT relocs here. */
188 *where += (Elf_Addr)relocbase;
189 }
190 }
191
192 int
193 _rtld_relocate_nonplt_objects(obj, self)
194 const Obj_Entry *obj;
195 bool self;
196 {
197 const Elf_Rela *rela;
198 #define COMBRELOC
199 #ifdef COMBRELOC
200 unsigned long lastsym = -1;
201 #endif
202 Elf_Addr target;
203
204 if (self)
205 return 0;
206
207 for (rela = obj->rela; rela < obj->relalim; rela++) {
208 Elf_Addr *where;
209 const Elf_Sym *def;
210 const Obj_Entry *defobj;
211 Elf_Addr tmp;
212 unsigned long symnum;
213
214 where = (Elf_Addr *)(obj->relocbase + rela->r_offset);
215 symnum = ELF_R_SYM(rela->r_info);
216
217 switch (ELF_R_TYPE(rela->r_info)) {
218 case R_TYPE(NONE):
219 break;
220
221 case R_TYPE(REFQUAD):
222 case R_TYPE(GLOB_DAT):
223 #ifdef COMBRELOC
224 if (symnum != lastsym) {
225 #endif
226 def = _rtld_find_symdef(symnum, obj, &defobj,
227 false);
228 if (def == NULL)
229 return -1;
230 target = (Elf_Addr)(defobj->relocbase +
231 def->st_value);
232 #ifdef COMBRELOC
233 lastsym = symnum;
234 }
235 #endif
236
237 tmp = target + rela->r_addend;
238 if (__predict_true(RELOC_ALIGNED_P(where))) {
239 if (*where != tmp)
240 *where = tmp;
241 } else {
242 if (load_ptr(where) != tmp)
243 store_ptr(where, tmp);
244 }
245 rdbg(("REFQUAD/GLOB_DAT %s in %s --> %p in %s",
246 obj->strtab + obj->symtab[symnum].st_name,
247 obj->path, (void *)tmp, defobj->path));
248 break;
249
250 case R_TYPE(RELATIVE):
251 if (__predict_true(RELOC_ALIGNED_P(where)))
252 *where += (Elf_Addr)obj->relocbase;
253 else
254 store_ptr(where,
255 load_ptr(where) + (Elf_Addr)obj->relocbase);
256 rdbg(("RELATIVE in %s --> %p", obj->path,
257 (void *)*where));
258 break;
259
260 case R_TYPE(COPY):
261 /*
262 * These are deferred until all other relocations have
263 * been done. All we do here is make sure that the
264 * COPY relocation is not in a shared library. They
265 * are allowed only in executable files.
266 */
267 if (obj->isdynamic) {
268 _rtld_error(
269 "%s: Unexpected R_COPY relocation in shared library",
270 obj->path);
271 return -1;
272 }
273 rdbg(("COPY (avoid in main)"));
274 break;
275
276 default:
277 rdbg(("sym = %lu, type = %lu, offset = %p, "
278 "addend = %p, contents = %p, symbol = %s",
279 symnum, (u_long)ELF_R_TYPE(rela->r_info),
280 (void *)rela->r_offset, (void *)rela->r_addend,
281 (void *)load_ptr(where),
282 obj->strtab + obj->symtab[symnum].st_name));
283 _rtld_error("%s: Unsupported relocation type %ld "
284 "in non-PLT relocations\n",
285 obj->path, (u_long) ELF_R_TYPE(rela->r_info));
286 return -1;
287 }
288 }
289 return 0;
290 }
291
292 int
293 _rtld_relocate_plt_lazy(obj)
294 const Obj_Entry *obj;
295 {
296 const Elf_Rela *rela;
297
298 if (!obj->isdynamic)
299 return 0;
300
301 for (rela = obj->pltrela; rela < obj->pltrelalim; rela++) {
302 Elf_Addr *where = (Elf_Addr *)(obj->relocbase + rela->r_offset);
303
304 assert(ELF_R_TYPE(rela->r_info) == R_TYPE(JMP_SLOT));
305
306 /* Just relocate the GOT slots pointing into the PLT */
307 *where += (Elf_Addr)obj->relocbase;
308 rdbg(("fixup !main in %s --> %p", obj->path, (void *)*where));
309 }
310
311 return 0;
312 }
313
314 int
315 _rtld_relocate_plt_object(obj, rela, addrp)
316 const Obj_Entry *obj;
317 const Elf_Rela *rela;
318 caddr_t *addrp;
319 {
320 Elf_Addr *where = (Elf_Addr *)(obj->relocbase + rela->r_offset);
321 Elf_Addr new_value;
322 const Elf_Sym *def;
323 const Obj_Entry *defobj;
324 Elf_Addr stubaddr;
325
326 assert(ELF_R_TYPE(rela->r_info) == R_TYPE(JMP_SLOT));
327
328 def = _rtld_find_symdef(ELF_R_SYM(rela->r_info), obj, &defobj, true);
329 if (def == NULL)
330 return -1;
331
332 new_value = (Elf_Addr)(defobj->relocbase + def->st_value);
333 rdbg(("bind now/fixup in %s --> old=%p new=%p",
334 defobj->strtab + def->st_name, (void *)*where, (void *)new_value));
335
336 if ((stubaddr = *where) != new_value) {
337 int64_t delta, idisp;
338 uint32_t insn[3], *stubptr;
339 int insncnt;
340 Elf_Addr pc;
341
342 /* Point this GOT entry at the target. */
343 *where = new_value;
344
345 /*
346 * Alpha shared objects may have multiple GOTs, each
347 * of which may point to this entry in the PLT. But,
348 * we only have a reference to the first GOT entry which
349 * points to this PLT entry. In order to avoid having to
350 * re-bind this call every time a non-first GOT entry is
351 * used, we will attempt to patch up the PLT entry to
352 * reference the target, rather than the binder.
353 *
354 * When the PLT stub gets control, PV contains the address
355 * of the PLT entry. Each PLT entry has room for 3 insns.
356 * If the displacement of the target from PV fits in a signed
357 * 32-bit integer, we can simply add it to PV. Otherwise,
358 * we must load the GOT entry itself into PV.
359 *
360 * Note if the shared object uses the old PLT format, then
361 * we cannot patch up the PLT safely, and so we skip it
362 * in that case[*].
363 *
364 * [*] Actually, if we're not doing lazy-binding, then
365 * we *can* (and do) patch up this PLT entry; the PLTGOT
366 * thunk won't yet point to any binder entry point, and
367 * so this test will fail as it would for the new PLT
368 * entry format.
369 */
370 if (obj->pltgot[2] == (Elf_Addr) &_rtld_bind_start_old) {
371 rdbg((" old PLT format"));
372 goto out;
373 }
374
375 delta = new_value - stubaddr;
376 rdbg((" stubaddr=%p, where-stubaddr=%ld, delta=%ld",
377 (void *)stubaddr, (long)where - (long)stubaddr,
378 (long)delta));
379 insncnt = 0;
380 if ((int32_t)delta == delta) {
381 /*
382 * We can adjust PV with an LDA, LDAH sequence.
383 *
384 * First, build an LDA insn to adjust the low 16
385 * bits.
386 */
387 insn[insncnt++] = 0x08 << 26 | 27 << 21 | 27 << 16 |
388 (delta & 0xffff);
389 rdbg((" LDA $27,%d($27)", (int16_t)delta));
390 /*
391 * Adjust the delta to account for the effects of
392 * the LDA, including sign-extension.
393 */
394 delta -= (int16_t)delta;
395 if (delta != 0) {
396 /*
397 * Build an LDAH instruction to adjust the
398 * high 16 bits.
399 */
400 insn[insncnt++] = 0x09 << 26 | 27 << 21 |
401 27 << 16 | ((delta >> 16) & 0xffff);
402 rdbg((" LDAH $27,%d($27)",
403 (int16_t)(delta >> 16)));
404 }
405 } else {
406 int64_t dhigh;
407
408 /* We must load the GOT entry. */
409 delta = (Elf_Addr)where - stubaddr;
410
411 /*
412 * If the GOT entry is too far away from the PLT
413 * entry, then we can't patch up the PLT entry.
414 * This PLT entry will have to be bound for each
415 * GOT entry except for the first one. This program
416 * will still run, albeit very slowly. It is very
417 * unlikely that this case will ever happen in
418 * practice.
419 */
420 if ((int32_t)delta != delta) {
421 rdbg((" PLT stub too far from GOT to relocate"));
422 goto out;
423 }
424 dhigh = delta - (int16_t)delta;
425 if (dhigh != 0) {
426 /*
427 * Build an LDAH instruction to adjust the
428 * high 16 bits.
429 */
430 insn[insncnt++] = 0x09 << 26 | 27 << 21 |
431 27 << 16 | ((dhigh >> 16) & 0xffff);
432 rdbg((" LDAH $27,%d($27)",
433 (int16_t)(dhigh >> 16)));
434 }
435 /* Build an LDQ to load the GOT entry. */
436 insn[insncnt++] = 0x29 << 26 | 27 << 21 |
437 27 << 16 | (delta & 0xffff);
438 rdbg((" LDQ $27,%d($27)",
439 (int16_t)delta));
440 }
441
442 /*
443 * Now, build a JMP or BR insn to jump to the target. If
444 * the displacement fits in a sign-extended 21-bit field,
445 * we can use the more efficient BR insn. Otherwise, we
446 * have to jump indirect through PV.
447 */
448 pc = stubaddr + (4 * (insncnt + 1));
449 idisp = (int64_t)(new_value - pc) >> 2;
450 if (-0x100000 <= idisp && idisp < 0x100000) {
451 insn[insncnt++] = 0x30 << 26 | 31 << 21 |
452 (idisp & 0x1fffff);
453 rdbg((" BR $31,%p", (void *)new_value));
454 } else {
455 insn[insncnt++] = 0x1a << 26 | 31 << 21 |
456 27 << 16 | (idisp & 0x3fff);
457 rdbg((" JMP $31,($27),%d",
458 (int)(idisp & 0x3fff)));
459 }
460
461 /*
462 * Fill in the tail of the PLT entry first, for reentrancy.
463 * Until we have overwritten the first insn (an unconditional
464 * branch), the remaining insns have no effect.
465 */
466 stubptr = (uint32_t *)stubaddr;
467 while (insncnt > 1) {
468 insncnt--;
469 stubptr[insncnt] = insn[insncnt];
470 }
471 /*
472 * Commit the tail of the insn sequence to memory
473 * before overwriting the first insn.
474 */
475 __asm __volatile("wmb" ::: "memory");
476 stubptr[0] = insn[0];
477 /*
478 * I-stream will be sync'd when we either return from
479 * the binder (lazy bind case) or when the PLTGOT thunk
480 * is patched up (bind-now case).
481 */
482 }
483
484 out:
485 *addrp = (caddr_t)new_value;
486 return 0;
487 }
488