linux_exec_aout.c revision 1.9 1 /* $NetBSD: linux_exec_aout.c,v 1.9 1995/06/24 20:20:09 christos Exp $ */
2
3 /*
4 * Copyright (c) 1995 Frank van der Linden
5 * Copyright (c) 1994 Christos Zoulas
6 * All rights reserved.
7 *
8 * Redistribution and use in source and binary forms, with or without
9 * modification, are permitted provided that the following conditions
10 * are met:
11 * 1. Redistributions of source code must retain the above copyright
12 * notice, this list of conditions and the following disclaimer.
13 * 2. Redistributions in binary form must reproduce the above copyright
14 * notice, this list of conditions and the following disclaimer in the
15 * documentation and/or other materials provided with the distribution.
16 * 3. The name of the author may not be used to endorse or promote products
17 * derived from this software without specific prior written permission
18 *
19 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
20 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
21 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
22 * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
23 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
24 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
25 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
26 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
27 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
28 * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
29 *
30 * based on exec_aout.c, sunos_exec.c and svr4_exec.c
31 */
32
33 #include <sys/param.h>
34 #include <sys/systm.h>
35 #include <sys/kernel.h>
36 #include <sys/proc.h>
37 #include <sys/malloc.h>
38 #include <sys/namei.h>
39 #include <sys/vnode.h>
40 #include <sys/exec_elf.h>
41
42 #include <sys/mman.h>
43 #include <vm/vm.h>
44 #include <vm/vm_param.h>
45 #include <vm/vm_map.h>
46
47 #include <machine/cpu.h>
48 #include <machine/reg.h>
49 #include <machine/exec.h>
50 #include <machine/linux_machdep.h>
51
52 #include <compat/linux/linux_types.h>
53 #include <compat/linux/linux_syscall.h>
54 #include <compat/linux/linux_syscallargs.h>
55 #include <compat/linux/linux_util.h>
56 #include <compat/linux/linux_exec.h>
57
58 static void *linux_aout_copyargs __P((struct exec_package *,
59 struct ps_strings *, void *, void *));
60
61 #define LINUX_AOUT_AUX_ARGSIZ 2
62 #define LINUX_ELF_AUX_ARGSIZ (sizeof(AuxInfo) * 8 / sizeof(char *))
63
64
65 const char linux_emul_path[] = "/emul/linux";
66 extern int linux_error[];
67 extern struct sysent linux_sysent[];
68 extern char *linux_syscallnames[];
69
70 struct emul emul_linux_aout = {
71 "linux",
72 linux_error,
73 linux_sendsig,
74 LINUX_SYS_syscall,
75 LINUX_SYS_MAXSYSCALL,
76 linux_sysent,
77 linux_syscallnames,
78 LINUX_AOUT_AUX_ARGSIZ,
79 linux_aout_copyargs,
80 setregs,
81 linux_sigcode,
82 linux_esigcode,
83 };
84
85 struct emul emul_linux_elf = {
86 "linux",
87 linux_error,
88 linux_sendsig,
89 LINUX_SYS_syscall,
90 LINUX_SYS_MAXSYSCALL,
91 linux_sysent,
92 linux_syscallnames,
93 LINUX_ELF_AUX_ARGSIZ,
94 elf_copyargs,
95 setregs,
96 linux_sigcode,
97 linux_esigcode,
98 };
99
100
101 static void *
102 linux_aout_copyargs(pack, arginfo, stack, argp)
103 struct exec_package *pack;
104 struct ps_strings *arginfo;
105 void *stack;
106 void *argp;
107 {
108 char **cpp = stack;
109 char **stk = stack;
110 char *dp, *sp;
111 size_t len;
112 void *nullp = NULL;
113 int argc = arginfo->ps_nargvstr;
114 int envc = arginfo->ps_nenvstr;
115
116 if (copyout(&argc, cpp++, sizeof(argc)))
117 return NULL;
118
119 /* leave room for envp and argv */
120 cpp += 2;
121 if (copyout(&cpp, &stk[1], sizeof (cpp)))
122 return NULL;
123
124 dp = (char *) (cpp + argc + envc + 2);
125 sp = argp;
126
127 /* XXX don't copy them out, remap them! */
128 arginfo->ps_argvstr = cpp; /* remember location of argv for later */
129
130 for (; --argc >= 0; sp += len, dp += len)
131 if (copyout(&dp, cpp++, sizeof(dp)) ||
132 copyoutstr(sp, dp, ARG_MAX, &len))
133 return NULL;
134
135 if (copyout(&nullp, cpp++, sizeof(nullp)))
136 return NULL;
137
138 if (copyout(&cpp, &stk[2], sizeof (cpp)))
139 return NULL;
140
141 arginfo->ps_envstr = cpp; /* remember location of envp for later */
142
143 for (; --envc >= 0; sp += len, dp += len)
144 if (copyout(&dp, cpp++, sizeof(dp)) ||
145 copyoutstr(sp, dp, ARG_MAX, &len))
146 return NULL;
147
148 if (copyout(&nullp, cpp++, sizeof(nullp)))
149 return NULL;
150
151 return cpp;
152 }
153
154 int
155 exec_linux_aout_makecmds(p, epp)
156 struct proc *p;
157 struct exec_package *epp;
158 {
159 struct exec *linux_ep = epp->ep_hdr;
160 int machtype, magic;
161 int error = ENOEXEC;
162
163 magic = LINUX_N_MAGIC(linux_ep);
164 machtype = LINUX_N_MACHTYPE(linux_ep);
165
166
167 if (machtype != LINUX_MID_MACHINE)
168 return (ENOEXEC);
169
170 switch (magic) {
171 case QMAGIC:
172 error = exec_linux_aout_prep_qmagic(p, epp);
173 break;
174 case ZMAGIC:
175 error = exec_linux_aout_prep_zmagic(p, epp);
176 break;
177 case NMAGIC:
178 error = exec_linux_aout_prep_nmagic(p, epp);
179 break;
180 case OMAGIC:
181 error = exec_linux_aout_prep_omagic(p, epp);
182 break;
183 }
184 if (error == 0)
185 epp->ep_emul = &emul_linux_aout;
186 return error;
187 }
188
189 /*
190 * Since text starts at 0x400 in Linux ZMAGIC executables, and 0x400
191 * is very likely not page aligned on most architectures, it is treated
192 * as an NMAGIC here. XXX
193 */
194
195 int
196 exec_linux_aout_prep_zmagic(p, epp)
197 struct proc *p;
198 struct exec_package *epp;
199 {
200 struct exec *execp = epp->ep_hdr;
201
202 epp->ep_taddr = LINUX_N_TXTADDR(*execp, ZMAGIC);
203 epp->ep_tsize = execp->a_text;
204 epp->ep_daddr = LINUX_N_DATADDR(*execp, ZMAGIC);
205 epp->ep_dsize = execp->a_data + execp->a_bss;
206 epp->ep_entry = execp->a_entry;
207
208 /* set up command for text segment */
209 NEW_VMCMD(&epp->ep_vmcmds, vmcmd_map_readvn, execp->a_text,
210 epp->ep_taddr, epp->ep_vp, LINUX_N_TXTOFF(*execp, ZMAGIC),
211 VM_PROT_READ|VM_PROT_EXECUTE);
212
213 /* set up command for data segment */
214 NEW_VMCMD(&epp->ep_vmcmds, vmcmd_map_readvn, execp->a_data,
215 epp->ep_daddr, epp->ep_vp, LINUX_N_DATOFF(*execp, ZMAGIC),
216 VM_PROT_READ|VM_PROT_WRITE|VM_PROT_EXECUTE);
217
218 /* set up command for bss segment */
219 NEW_VMCMD(&epp->ep_vmcmds, vmcmd_map_zero, execp->a_bss,
220 epp->ep_daddr + execp->a_data, NULLVP, 0,
221 VM_PROT_READ|VM_PROT_WRITE|VM_PROT_EXECUTE);
222
223 return exec_aout_setup_stack(p, epp);
224 }
225
226 /*
227 * exec_aout_prep_nmagic(): Prepare Linux NMAGIC package.
228 * Not different from the normal stuff.
229 */
230
231 int
232 exec_linux_aout_prep_nmagic(p, epp)
233 struct proc *p;
234 struct exec_package *epp;
235 {
236 struct exec *execp = epp->ep_hdr;
237 long bsize, baddr;
238
239 epp->ep_taddr = LINUX_N_TXTADDR(*execp, NMAGIC);
240 epp->ep_tsize = execp->a_text;
241 epp->ep_daddr = LINUX_N_DATADDR(*execp, NMAGIC);
242 epp->ep_dsize = execp->a_data + execp->a_bss;
243 epp->ep_entry = execp->a_entry;
244
245 /* set up command for text segment */
246 NEW_VMCMD(&epp->ep_vmcmds, vmcmd_map_readvn, execp->a_text,
247 epp->ep_taddr, epp->ep_vp, LINUX_N_TXTOFF(*execp, NMAGIC),
248 VM_PROT_READ|VM_PROT_EXECUTE);
249
250 /* set up command for data segment */
251 NEW_VMCMD(&epp->ep_vmcmds, vmcmd_map_readvn, execp->a_data,
252 epp->ep_daddr, epp->ep_vp, LINUX_N_DATOFF(*execp, NMAGIC),
253 VM_PROT_READ|VM_PROT_WRITE|VM_PROT_EXECUTE);
254
255 /* set up command for bss segment */
256 baddr = roundup(epp->ep_daddr + execp->a_data, NBPG);
257 bsize = epp->ep_daddr + epp->ep_dsize - baddr;
258 if (bsize > 0)
259 NEW_VMCMD(&epp->ep_vmcmds, vmcmd_map_zero, bsize, baddr,
260 NULLVP, 0, VM_PROT_READ|VM_PROT_WRITE|VM_PROT_EXECUTE);
261
262 return exec_aout_setup_stack(p, epp);
263 }
264
265 /*
266 * exec_aout_prep_omagic(): Prepare Linux OMAGIC package.
267 * Business as usual.
268 */
269
270 int
271 exec_linux_aout_prep_omagic(p, epp)
272 struct proc *p;
273 struct exec_package *epp;
274 {
275 struct exec *execp = epp->ep_hdr;
276 long dsize, bsize, baddr;
277
278 epp->ep_taddr = LINUX_N_TXTADDR(*execp, OMAGIC);
279 epp->ep_tsize = execp->a_text;
280 epp->ep_daddr = LINUX_N_DATADDR(*execp, OMAGIC);
281 epp->ep_dsize = execp->a_data + execp->a_bss;
282 epp->ep_entry = execp->a_entry;
283
284 /* set up command for text and data segments */
285 NEW_VMCMD(&epp->ep_vmcmds, vmcmd_map_readvn,
286 execp->a_text + execp->a_data, epp->ep_taddr, epp->ep_vp,
287 LINUX_N_TXTOFF(*execp, OMAGIC), VM_PROT_READ|VM_PROT_WRITE|VM_PROT_EXECUTE);
288
289 /* set up command for bss segment */
290 baddr = roundup(epp->ep_daddr + execp->a_data, NBPG);
291 bsize = epp->ep_daddr + epp->ep_dsize - baddr;
292 if (bsize > 0)
293 NEW_VMCMD(&epp->ep_vmcmds, vmcmd_map_zero, bsize, baddr,
294 NULLVP, 0, VM_PROT_READ|VM_PROT_WRITE|VM_PROT_EXECUTE);
295
296 /*
297 * Make sure (# of pages) mapped above equals (vm_tsize + vm_dsize);
298 * obreak(2) relies on this fact. Both `vm_tsize' and `vm_dsize' are
299 * computed (in execve(2)) by rounding *up* `ep_tsize' and `ep_dsize'
300 * respectively to page boundaries.
301 * Compensate `ep_dsize' for the amount of data covered by the last
302 * text page.
303 */
304 dsize = epp->ep_dsize + execp->a_text - roundup(execp->a_text, NBPG);
305 epp->ep_dsize = (dsize > 0) ? dsize : 0;
306 return exec_aout_setup_stack(p, epp);
307 }
308
309 int
310 exec_linux_aout_prep_qmagic(p, epp)
311 struct proc *p;
312 struct exec_package *epp;
313 {
314 struct exec *execp = epp->ep_hdr;
315
316 epp->ep_taddr = LINUX_N_TXTADDR(*execp, QMAGIC);
317 epp->ep_tsize = execp->a_text;
318 epp->ep_daddr = LINUX_N_DATADDR(*execp, QMAGIC);
319 epp->ep_dsize = execp->a_data + execp->a_bss;
320 epp->ep_entry = execp->a_entry;
321
322 /*
323 * check if vnode is in open for writing, because we want to
324 * demand-page out of it. if it is, don't do it, for various
325 * reasons
326 */
327 if ((execp->a_text != 0 || execp->a_data != 0) &&
328 epp->ep_vp->v_writecount != 0) {
329 #ifdef DIAGNOSTIC
330 if (epp->ep_vp->v_flag & VTEXT)
331 panic("exec: a VTEXT vnode has writecount != 0\n");
332 #endif
333 return ETXTBSY;
334 }
335 epp->ep_vp->v_flag |= VTEXT;
336
337 /* set up command for text segment */
338 NEW_VMCMD(&epp->ep_vmcmds, vmcmd_map_pagedvn, execp->a_text,
339 epp->ep_taddr, epp->ep_vp, LINUX_N_TXTOFF(*execp, QMAGIC),
340 VM_PROT_READ|VM_PROT_EXECUTE);
341
342 /* set up command for data segment */
343 NEW_VMCMD(&epp->ep_vmcmds, vmcmd_map_pagedvn, execp->a_data,
344 epp->ep_daddr, epp->ep_vp, LINUX_N_DATOFF(*execp, QMAGIC),
345 VM_PROT_READ|VM_PROT_WRITE|VM_PROT_EXECUTE);
346
347 /* set up command for bss segment */
348 NEW_VMCMD(&epp->ep_vmcmds, vmcmd_map_zero, execp->a_bss,
349 epp->ep_daddr + execp->a_data, NULLVP, 0,
350 VM_PROT_READ|VM_PROT_WRITE|VM_PROT_EXECUTE);
351
352 return exec_aout_setup_stack(p, epp);
353 }
354
355 int
356 linux_elf_probe(p, epp, itp, pos)
357 struct proc *p;
358 struct exec_package *epp;
359 char *itp;
360 u_long *pos;
361 {
362 char *bp;
363 int error;
364 size_t len;
365
366 if (itp[0]) {
367 if ((error = emul_find(p, NULL, linux_emul_path, itp, &bp, 0)))
368 return error;
369 if ((error = copystr(bp, itp, MAXPATHLEN, &len)))
370 return error;
371 free(bp, M_TEMP);
372 }
373 epp->ep_emul = &emul_linux_elf;
374 *pos = ELF32_NO_ADDR;
375 return 0;
376 }
377
378 /*
379 * The Linux system call to load shared libraries, a.out version. The
380 * a.out shared libs are just files that are mapped onto a fixed
381 * address in the process' address space. The address is given in
382 * a_entry. Read in the header, set up some VM commands and run them.
383 *
384 * Yes, both text and data are mapped at once, so we're left with
385 * writeable text for the shared libs. The Linux crt0 seemed to break
386 * sometimes when data was mapped seperately. It munmapped a uselib()
387 * of ld.so by hand, which failed with shared text and data for ld.so
388 * Yuck.
389 *
390 * Because of the problem with ZMAGIC executables (text starts
391 * at 0x400 in the file, but needs to be mapped at 0), ZMAGIC
392 * shared libs are not handled very efficiently :-(
393 */
394
395 int
396 linux_uselib(p, uap, retval)
397 struct proc *p;
398 struct linux_uselib_args /* {
399 syscallarg(char *) path;
400 } */ *uap;
401 register_t *retval;
402 {
403 caddr_t sg;
404 long bsize, dsize, tsize, taddr, baddr, daddr;
405 struct nameidata ni;
406 struct vnode *vp;
407 struct exec hdr;
408 struct exec_vmcmd_set vcset;
409 int rem, i, magic, error;
410
411 sg = stackgap_init(p->p_emul);
412 LINUX_CHECK_ALT_EXIST(p, &sg, SCARG(uap, path));
413
414 NDINIT(&ni, LOOKUP, FOLLOW, UIO_USERSPACE, SCARG(uap, path), p);
415
416 if ((error = namei(&ni)))
417 return error;
418
419 vp = ni.ni_vp;
420
421 if ((error = vn_rdwr(UIO_READ, vp, (caddr_t) &hdr, LINUX_AOUT_HDR_SIZE,
422 0, UIO_SYSSPACE, IO_NODELOCKED, p->p_ucred,
423 &rem, p))) {
424 vrele(vp);
425 return error;
426 }
427
428 if (rem != 0) {
429 vrele(vp);
430 return ENOEXEC;
431 }
432
433 if (LINUX_N_MACHTYPE(&hdr) != LINUX_MID_MACHINE)
434 return ENOEXEC;
435
436 magic = LINUX_N_MAGIC(&hdr);
437 taddr = hdr.a_entry & (~(NBPG - 1));
438 tsize = hdr.a_text;
439 daddr = taddr + tsize;
440 dsize = hdr.a_data + hdr.a_bss;
441
442 if ((hdr.a_text != 0 || hdr.a_data != 0) && vp->v_writecount != 0) {
443 vrele(vp);
444 return ETXTBSY;
445 }
446 vp->v_flag |= VTEXT;
447
448 vcset.evs_cnt = 0;
449 vcset.evs_used = 0;
450
451 NEW_VMCMD(&vcset,
452 magic == ZMAGIC ? vmcmd_map_readvn : vmcmd_map_pagedvn,
453 hdr.a_text + hdr.a_data, taddr,
454 vp, LINUX_N_TXTOFF(hdr, magic),
455 VM_PROT_READ|VM_PROT_EXECUTE|VM_PROT_WRITE);
456
457 baddr = roundup(daddr + hdr.a_data, NBPG);
458 bsize = daddr + dsize - baddr;
459 if (bsize > 0) {
460 NEW_VMCMD(&vcset, vmcmd_map_zero, bsize, baddr,
461 NULLVP, 0, VM_PROT_READ|VM_PROT_WRITE|VM_PROT_EXECUTE);
462 }
463
464 for (i = 0; i < vcset.evs_used && !error; i++) {
465 struct exec_vmcmd *vcp;
466
467 vcp = &vcset.evs_cmds[i];
468 error = (*vcp->ev_proc)(p, vcp);
469 }
470
471 kill_vmcmds(&vcset);
472
473 vrele(vp);
474
475 return error;
476 }
477
478 /*
479 * Execve(2). Just check the alternate emulation path, and pass it on
480 * to the NetBSD execve().
481 */
482 int
483 linux_execve(p, uap, retval)
484 struct proc *p;
485 struct linux_execve_args /* {
486 syscallarg(char *) path;
487 syscallarg(char **) argv;
488 syscallarg(char **) envp;
489 } */ *uap;
490 register_t *retval;
491 {
492 caddr_t sg;
493
494 sg = stackgap_init(p->p_emul);
495 LINUX_CHECK_ALT_EXIST(p, &sg, SCARG(uap, path));
496
497 return execve(p, uap, retval);
498 }
499