linux_exec_elf32.c revision 1.12 1 /* $NetBSD: linux_exec_elf32.c,v 1.12 1995/10/07 06:27:00 mycroft Exp $ */
2
3 /*
4 * Copyright (c) 1995 Frank van der Linden
5 * Copyright (c) 1994 Christos Zoulas
6 * All rights reserved.
7 *
8 * Redistribution and use in source and binary forms, with or without
9 * modification, are permitted provided that the following conditions
10 * are met:
11 * 1. Redistributions of source code must retain the above copyright
12 * notice, this list of conditions and the following disclaimer.
13 * 2. Redistributions in binary form must reproduce the above copyright
14 * notice, this list of conditions and the following disclaimer in the
15 * documentation and/or other materials provided with the distribution.
16 * 3. The name of the author may not be used to endorse or promote products
17 * derived from this software without specific prior written permission
18 *
19 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
20 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
21 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
22 * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
23 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
24 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
25 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
26 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
27 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
28 * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
29 *
30 * based on exec_aout.c, sunos_exec.c and svr4_exec.c
31 */
32
33 #include <sys/param.h>
34 #include <sys/systm.h>
35 #include <sys/kernel.h>
36 #include <sys/proc.h>
37 #include <sys/malloc.h>
38 #include <sys/namei.h>
39 #include <sys/vnode.h>
40 #include <sys/exec_elf.h>
41
42 #include <sys/mman.h>
43 #include <vm/vm.h>
44 #include <vm/vm_param.h>
45 #include <vm/vm_map.h>
46
47 #include <machine/cpu.h>
48 #include <machine/reg.h>
49 #include <machine/exec.h>
50 #include <machine/linux_machdep.h>
51
52 #include <compat/linux/linux_types.h>
53 #include <compat/linux/linux_syscall.h>
54 #include <compat/linux/linux_signal.h>
55 #include <compat/linux/linux_syscallargs.h>
56 #include <compat/linux/linux_util.h>
57 #include <compat/linux/linux_exec.h>
58
59 static void *linux_aout_copyargs __P((struct exec_package *,
60 struct ps_strings *, void *, void *));
61
62 #define LINUX_AOUT_AUX_ARGSIZ 2
63 #define LINUX_ELF_AUX_ARGSIZ (sizeof(AuxInfo) * 8 / sizeof(char *))
64
65
66 const char linux_emul_path[] = "/emul/linux";
67 extern int linux_error[];
68 extern char linux_sigcode[], linux_esigcode[];
69 extern struct sysent linux_sysent[];
70 extern char *linux_syscallnames[];
71
72 struct emul emul_linux_aout = {
73 "linux",
74 linux_error,
75 linux_sendsig,
76 LINUX_SYS_syscall,
77 LINUX_SYS_MAXSYSCALL,
78 linux_sysent,
79 linux_syscallnames,
80 LINUX_AOUT_AUX_ARGSIZ,
81 linux_aout_copyargs,
82 setregs,
83 linux_sigcode,
84 linux_esigcode,
85 };
86
87 struct emul emul_linux_elf = {
88 "linux",
89 linux_error,
90 linux_sendsig,
91 LINUX_SYS_syscall,
92 LINUX_SYS_MAXSYSCALL,
93 linux_sysent,
94 linux_syscallnames,
95 LINUX_ELF_AUX_ARGSIZ,
96 elf_copyargs,
97 setregs,
98 linux_sigcode,
99 linux_esigcode,
100 };
101
102
103 static void *
104 linux_aout_copyargs(pack, arginfo, stack, argp)
105 struct exec_package *pack;
106 struct ps_strings *arginfo;
107 void *stack;
108 void *argp;
109 {
110 char **cpp = stack;
111 char **stk = stack;
112 char *dp, *sp;
113 size_t len;
114 void *nullp = NULL;
115 int argc = arginfo->ps_nargvstr;
116 int envc = arginfo->ps_nenvstr;
117
118 if (copyout(&argc, cpp++, sizeof(argc)))
119 return NULL;
120
121 /* leave room for envp and argv */
122 cpp += 2;
123 if (copyout(&cpp, &stk[1], sizeof (cpp)))
124 return NULL;
125
126 dp = (char *) (cpp + argc + envc + 2);
127 sp = argp;
128
129 /* XXX don't copy them out, remap them! */
130 arginfo->ps_argvstr = cpp; /* remember location of argv for later */
131
132 for (; --argc >= 0; sp += len, dp += len)
133 if (copyout(&dp, cpp++, sizeof(dp)) ||
134 copyoutstr(sp, dp, ARG_MAX, &len))
135 return NULL;
136
137 if (copyout(&nullp, cpp++, sizeof(nullp)))
138 return NULL;
139
140 if (copyout(&cpp, &stk[2], sizeof (cpp)))
141 return NULL;
142
143 arginfo->ps_envstr = cpp; /* remember location of envp for later */
144
145 for (; --envc >= 0; sp += len, dp += len)
146 if (copyout(&dp, cpp++, sizeof(dp)) ||
147 copyoutstr(sp, dp, ARG_MAX, &len))
148 return NULL;
149
150 if (copyout(&nullp, cpp++, sizeof(nullp)))
151 return NULL;
152
153 return cpp;
154 }
155
156 int
157 exec_linux_aout_makecmds(p, epp)
158 struct proc *p;
159 struct exec_package *epp;
160 {
161 struct exec *linux_ep = epp->ep_hdr;
162 int machtype, magic;
163 int error = ENOEXEC;
164
165 magic = LINUX_N_MAGIC(linux_ep);
166 machtype = LINUX_N_MACHTYPE(linux_ep);
167
168
169 if (machtype != LINUX_MID_MACHINE)
170 return (ENOEXEC);
171
172 switch (magic) {
173 case QMAGIC:
174 error = exec_linux_aout_prep_qmagic(p, epp);
175 break;
176 case ZMAGIC:
177 error = exec_linux_aout_prep_zmagic(p, epp);
178 break;
179 case NMAGIC:
180 error = exec_linux_aout_prep_nmagic(p, epp);
181 break;
182 case OMAGIC:
183 error = exec_linux_aout_prep_omagic(p, epp);
184 break;
185 }
186 if (error == 0)
187 epp->ep_emul = &emul_linux_aout;
188 return error;
189 }
190
191 /*
192 * Since text starts at 0x400 in Linux ZMAGIC executables, and 0x400
193 * is very likely not page aligned on most architectures, it is treated
194 * as an NMAGIC here. XXX
195 */
196
197 int
198 exec_linux_aout_prep_zmagic(p, epp)
199 struct proc *p;
200 struct exec_package *epp;
201 {
202 struct exec *execp = epp->ep_hdr;
203
204 epp->ep_taddr = LINUX_N_TXTADDR(*execp, ZMAGIC);
205 epp->ep_tsize = execp->a_text;
206 epp->ep_daddr = LINUX_N_DATADDR(*execp, ZMAGIC);
207 epp->ep_dsize = execp->a_data + execp->a_bss;
208 epp->ep_entry = execp->a_entry;
209
210 /* set up command for text segment */
211 NEW_VMCMD(&epp->ep_vmcmds, vmcmd_map_readvn, execp->a_text,
212 epp->ep_taddr, epp->ep_vp, LINUX_N_TXTOFF(*execp, ZMAGIC),
213 VM_PROT_READ|VM_PROT_EXECUTE);
214
215 /* set up command for data segment */
216 NEW_VMCMD(&epp->ep_vmcmds, vmcmd_map_readvn, execp->a_data,
217 epp->ep_daddr, epp->ep_vp, LINUX_N_DATOFF(*execp, ZMAGIC),
218 VM_PROT_READ|VM_PROT_WRITE|VM_PROT_EXECUTE);
219
220 /* set up command for bss segment */
221 NEW_VMCMD(&epp->ep_vmcmds, vmcmd_map_zero, execp->a_bss,
222 epp->ep_daddr + execp->a_data, NULLVP, 0,
223 VM_PROT_READ|VM_PROT_WRITE|VM_PROT_EXECUTE);
224
225 return exec_aout_setup_stack(p, epp);
226 }
227
228 /*
229 * exec_aout_prep_nmagic(): Prepare Linux NMAGIC package.
230 * Not different from the normal stuff.
231 */
232
233 int
234 exec_linux_aout_prep_nmagic(p, epp)
235 struct proc *p;
236 struct exec_package *epp;
237 {
238 struct exec *execp = epp->ep_hdr;
239 long bsize, baddr;
240
241 epp->ep_taddr = LINUX_N_TXTADDR(*execp, NMAGIC);
242 epp->ep_tsize = execp->a_text;
243 epp->ep_daddr = LINUX_N_DATADDR(*execp, NMAGIC);
244 epp->ep_dsize = execp->a_data + execp->a_bss;
245 epp->ep_entry = execp->a_entry;
246
247 /* set up command for text segment */
248 NEW_VMCMD(&epp->ep_vmcmds, vmcmd_map_readvn, execp->a_text,
249 epp->ep_taddr, epp->ep_vp, LINUX_N_TXTOFF(*execp, NMAGIC),
250 VM_PROT_READ|VM_PROT_EXECUTE);
251
252 /* set up command for data segment */
253 NEW_VMCMD(&epp->ep_vmcmds, vmcmd_map_readvn, execp->a_data,
254 epp->ep_daddr, epp->ep_vp, LINUX_N_DATOFF(*execp, NMAGIC),
255 VM_PROT_READ|VM_PROT_WRITE|VM_PROT_EXECUTE);
256
257 /* set up command for bss segment */
258 baddr = roundup(epp->ep_daddr + execp->a_data, NBPG);
259 bsize = epp->ep_daddr + epp->ep_dsize - baddr;
260 if (bsize > 0)
261 NEW_VMCMD(&epp->ep_vmcmds, vmcmd_map_zero, bsize, baddr,
262 NULLVP, 0, VM_PROT_READ|VM_PROT_WRITE|VM_PROT_EXECUTE);
263
264 return exec_aout_setup_stack(p, epp);
265 }
266
267 /*
268 * exec_aout_prep_omagic(): Prepare Linux OMAGIC package.
269 * Business as usual.
270 */
271
272 int
273 exec_linux_aout_prep_omagic(p, epp)
274 struct proc *p;
275 struct exec_package *epp;
276 {
277 struct exec *execp = epp->ep_hdr;
278 long dsize, bsize, baddr;
279
280 epp->ep_taddr = LINUX_N_TXTADDR(*execp, OMAGIC);
281 epp->ep_tsize = execp->a_text;
282 epp->ep_daddr = LINUX_N_DATADDR(*execp, OMAGIC);
283 epp->ep_dsize = execp->a_data + execp->a_bss;
284 epp->ep_entry = execp->a_entry;
285
286 /* set up command for text and data segments */
287 NEW_VMCMD(&epp->ep_vmcmds, vmcmd_map_readvn,
288 execp->a_text + execp->a_data, epp->ep_taddr, epp->ep_vp,
289 LINUX_N_TXTOFF(*execp, OMAGIC), VM_PROT_READ|VM_PROT_WRITE|VM_PROT_EXECUTE);
290
291 /* set up command for bss segment */
292 baddr = roundup(epp->ep_daddr + execp->a_data, NBPG);
293 bsize = epp->ep_daddr + epp->ep_dsize - baddr;
294 if (bsize > 0)
295 NEW_VMCMD(&epp->ep_vmcmds, vmcmd_map_zero, bsize, baddr,
296 NULLVP, 0, VM_PROT_READ|VM_PROT_WRITE|VM_PROT_EXECUTE);
297
298 /*
299 * Make sure (# of pages) mapped above equals (vm_tsize + vm_dsize);
300 * obreak(2) relies on this fact. Both `vm_tsize' and `vm_dsize' are
301 * computed (in execve(2)) by rounding *up* `ep_tsize' and `ep_dsize'
302 * respectively to page boundaries.
303 * Compensate `ep_dsize' for the amount of data covered by the last
304 * text page.
305 */
306 dsize = epp->ep_dsize + execp->a_text - roundup(execp->a_text, NBPG);
307 epp->ep_dsize = (dsize > 0) ? dsize : 0;
308 return exec_aout_setup_stack(p, epp);
309 }
310
311 int
312 exec_linux_aout_prep_qmagic(p, epp)
313 struct proc *p;
314 struct exec_package *epp;
315 {
316 struct exec *execp = epp->ep_hdr;
317
318 epp->ep_taddr = LINUX_N_TXTADDR(*execp, QMAGIC);
319 epp->ep_tsize = execp->a_text;
320 epp->ep_daddr = LINUX_N_DATADDR(*execp, QMAGIC);
321 epp->ep_dsize = execp->a_data + execp->a_bss;
322 epp->ep_entry = execp->a_entry;
323
324 /*
325 * check if vnode is in open for writing, because we want to
326 * demand-page out of it. if it is, don't do it, for various
327 * reasons
328 */
329 if ((execp->a_text != 0 || execp->a_data != 0) &&
330 epp->ep_vp->v_writecount != 0) {
331 #ifdef DIAGNOSTIC
332 if (epp->ep_vp->v_flag & VTEXT)
333 panic("exec: a VTEXT vnode has writecount != 0\n");
334 #endif
335 return ETXTBSY;
336 }
337 epp->ep_vp->v_flag |= VTEXT;
338
339 /* set up command for text segment */
340 NEW_VMCMD(&epp->ep_vmcmds, vmcmd_map_pagedvn, execp->a_text,
341 epp->ep_taddr, epp->ep_vp, LINUX_N_TXTOFF(*execp, QMAGIC),
342 VM_PROT_READ|VM_PROT_EXECUTE);
343
344 /* set up command for data segment */
345 NEW_VMCMD(&epp->ep_vmcmds, vmcmd_map_pagedvn, execp->a_data,
346 epp->ep_daddr, epp->ep_vp, LINUX_N_DATOFF(*execp, QMAGIC),
347 VM_PROT_READ|VM_PROT_WRITE|VM_PROT_EXECUTE);
348
349 /* set up command for bss segment */
350 NEW_VMCMD(&epp->ep_vmcmds, vmcmd_map_zero, execp->a_bss,
351 epp->ep_daddr + execp->a_data, NULLVP, 0,
352 VM_PROT_READ|VM_PROT_WRITE|VM_PROT_EXECUTE);
353
354 return exec_aout_setup_stack(p, epp);
355 }
356
357 int
358 linux_elf_probe(p, epp, itp, pos)
359 struct proc *p;
360 struct exec_package *epp;
361 char *itp;
362 u_long *pos;
363 {
364 char *bp;
365 int error;
366 size_t len;
367
368 if (itp[0]) {
369 if ((error = emul_find(p, NULL, linux_emul_path, itp, &bp, 0)))
370 return error;
371 if ((error = copystr(bp, itp, MAXPATHLEN, &len)))
372 return error;
373 free(bp, M_TEMP);
374 }
375 epp->ep_emul = &emul_linux_elf;
376 *pos = ELF32_NO_ADDR;
377 return 0;
378 }
379
380 /*
381 * The Linux system call to load shared libraries, a.out version. The
382 * a.out shared libs are just files that are mapped onto a fixed
383 * address in the process' address space. The address is given in
384 * a_entry. Read in the header, set up some VM commands and run them.
385 *
386 * Yes, both text and data are mapped at once, so we're left with
387 * writeable text for the shared libs. The Linux crt0 seemed to break
388 * sometimes when data was mapped seperately. It munmapped a uselib()
389 * of ld.so by hand, which failed with shared text and data for ld.so
390 * Yuck.
391 *
392 * Because of the problem with ZMAGIC executables (text starts
393 * at 0x400 in the file, but needs to be mapped at 0), ZMAGIC
394 * shared libs are not handled very efficiently :-(
395 */
396
397 int
398 linux_sys_uselib(p, v, retval)
399 struct proc *p;
400 void *v;
401 register_t *retval;
402 {
403 struct linux_sys_uselib_args /* {
404 syscallarg(char *) path;
405 } */ *uap = v;
406 caddr_t sg;
407 long bsize, dsize, tsize, taddr, baddr, daddr;
408 struct nameidata ni;
409 struct vnode *vp;
410 struct exec hdr;
411 struct exec_vmcmd_set vcset;
412 int rem, i, magic, error;
413
414 sg = stackgap_init(p->p_emul);
415 LINUX_CHECK_ALT_EXIST(p, &sg, SCARG(uap, path));
416
417 NDINIT(&ni, LOOKUP, FOLLOW, UIO_USERSPACE, SCARG(uap, path), p);
418
419 if ((error = namei(&ni)))
420 return error;
421
422 vp = ni.ni_vp;
423
424 if ((error = vn_rdwr(UIO_READ, vp, (caddr_t) &hdr, LINUX_AOUT_HDR_SIZE,
425 0, UIO_SYSSPACE, IO_NODELOCKED, p->p_ucred,
426 &rem, p))) {
427 vrele(vp);
428 return error;
429 }
430
431 if (rem != 0) {
432 vrele(vp);
433 return ENOEXEC;
434 }
435
436 if (LINUX_N_MACHTYPE(&hdr) != LINUX_MID_MACHINE)
437 return ENOEXEC;
438
439 magic = LINUX_N_MAGIC(&hdr);
440 taddr = hdr.a_entry & (~(NBPG - 1));
441 tsize = hdr.a_text;
442 daddr = taddr + tsize;
443 dsize = hdr.a_data + hdr.a_bss;
444
445 if ((hdr.a_text != 0 || hdr.a_data != 0) && vp->v_writecount != 0) {
446 vrele(vp);
447 return ETXTBSY;
448 }
449 vp->v_flag |= VTEXT;
450
451 vcset.evs_cnt = 0;
452 vcset.evs_used = 0;
453
454 NEW_VMCMD(&vcset,
455 magic == ZMAGIC ? vmcmd_map_readvn : vmcmd_map_pagedvn,
456 hdr.a_text + hdr.a_data, taddr,
457 vp, LINUX_N_TXTOFF(hdr, magic),
458 VM_PROT_READ|VM_PROT_EXECUTE|VM_PROT_WRITE);
459
460 baddr = roundup(daddr + hdr.a_data, NBPG);
461 bsize = daddr + dsize - baddr;
462 if (bsize > 0) {
463 NEW_VMCMD(&vcset, vmcmd_map_zero, bsize, baddr,
464 NULLVP, 0, VM_PROT_READ|VM_PROT_WRITE|VM_PROT_EXECUTE);
465 }
466
467 for (i = 0; i < vcset.evs_used && !error; i++) {
468 struct exec_vmcmd *vcp;
469
470 vcp = &vcset.evs_cmds[i];
471 error = (*vcp->ev_proc)(p, vcp);
472 }
473
474 kill_vmcmds(&vcset);
475
476 vrele(vp);
477
478 return error;
479 }
480
481 /*
482 * Execve(2). Just check the alternate emulation path, and pass it on
483 * to the NetBSD execve().
484 */
485 int
486 linux_sys_execve(p, v, retval)
487 struct proc *p;
488 void *v;
489 register_t *retval;
490 {
491 struct linux_sys_execve_args /* {
492 syscallarg(char *) path;
493 syscallarg(char **) argv;
494 syscallarg(char **) envp;
495 } */ *uap = v;
496 caddr_t sg;
497
498 sg = stackgap_init(p->p_emul);
499 LINUX_CHECK_ALT_EXIST(p, &sg, SCARG(uap, path));
500
501 return sys_execve(p, uap, retval);
502 }
503