init_main.c revision 1.357 1 1.357 ad /* $NetBSD: init_main.c,v 1.357 2008/05/28 13:35:32 ad Exp $ */
2 1.347 ad
3 1.347 ad /*-
4 1.347 ad * Copyright (c) 2008 The NetBSD Foundation, Inc.
5 1.347 ad * All rights reserved.
6 1.347 ad *
7 1.347 ad * Redistribution and use in source and binary forms, with or without
8 1.347 ad * modification, are permitted provided that the following conditions
9 1.347 ad * are met:
10 1.347 ad * 1. Redistributions of source code must retain the above copyright
11 1.347 ad * notice, this list of conditions and the following disclaimer.
12 1.347 ad * 2. Redistributions in binary form must reproduce the above copyright
13 1.347 ad * notice, this list of conditions and the following disclaimer in the
14 1.347 ad * documentation and/or other materials provided with the distribution.
15 1.347 ad *
16 1.347 ad * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
17 1.347 ad * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
18 1.347 ad * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
19 1.347 ad * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
20 1.347 ad * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
21 1.347 ad * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
22 1.347 ad * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
23 1.347 ad * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
24 1.347 ad * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
25 1.347 ad * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
26 1.347 ad * POSSIBILITY OF SUCH DAMAGE.
27 1.347 ad */
28 1.61 mycroft
29 1.61 mycroft /*
30 1.61 mycroft * Copyright (c) 1982, 1986, 1989, 1991, 1992, 1993
31 1.61 mycroft * The Regents of the University of California. All rights reserved.
32 1.61 mycroft * (c) UNIX System Laboratories, Inc.
33 1.61 mycroft * All or some portions of this file are derived from material licensed
34 1.61 mycroft * to the University of California by American Telephone and Telegraph
35 1.61 mycroft * Co. or Unix System Laboratories, Inc. and are reproduced herein with
36 1.61 mycroft * the permission of UNIX System Laboratories, Inc.
37 1.61 mycroft *
38 1.61 mycroft * Redistribution and use in source and binary forms, with or without
39 1.61 mycroft * modification, are permitted provided that the following conditions
40 1.61 mycroft * are met:
41 1.61 mycroft * 1. Redistributions of source code must retain the above copyright
42 1.61 mycroft * notice, this list of conditions and the following disclaimer.
43 1.61 mycroft * 2. Redistributions in binary form must reproduce the above copyright
44 1.61 mycroft * notice, this list of conditions and the following disclaimer in the
45 1.61 mycroft * documentation and/or other materials provided with the distribution.
46 1.224 agc * 3. Neither the name of the University nor the names of its contributors
47 1.224 agc * may be used to endorse or promote products derived from this software
48 1.224 agc * without specific prior written permission.
49 1.224 agc *
50 1.224 agc * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
51 1.224 agc * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
52 1.224 agc * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
53 1.224 agc * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
54 1.224 agc * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
55 1.224 agc * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
56 1.224 agc * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
57 1.224 agc * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
58 1.224 agc * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
59 1.224 agc * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
60 1.224 agc * SUCH DAMAGE.
61 1.224 agc *
62 1.224 agc * @(#)init_main.c 8.16 (Berkeley) 5/14/95
63 1.224 agc */
64 1.224 agc
65 1.224 agc /*
66 1.224 agc * Copyright (c) 1995 Christopher G. Demetriou. All rights reserved.
67 1.224 agc *
68 1.224 agc * Redistribution and use in source and binary forms, with or without
69 1.224 agc * modification, are permitted provided that the following conditions
70 1.224 agc * are met:
71 1.224 agc * 1. Redistributions of source code must retain the above copyright
72 1.224 agc * notice, this list of conditions and the following disclaimer.
73 1.224 agc * 2. Redistributions in binary form must reproduce the above copyright
74 1.224 agc * notice, this list of conditions and the following disclaimer in the
75 1.224 agc * documentation and/or other materials provided with the distribution.
76 1.61 mycroft * 3. All advertising materials mentioning features or use of this software
77 1.61 mycroft * must display the following acknowledgement:
78 1.61 mycroft * This product includes software developed by the University of
79 1.61 mycroft * California, Berkeley and its contributors.
80 1.61 mycroft * 4. Neither the name of the University nor the names of its contributors
81 1.61 mycroft * may be used to endorse or promote products derived from this software
82 1.61 mycroft * without specific prior written permission.
83 1.61 mycroft *
84 1.61 mycroft * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
85 1.61 mycroft * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
86 1.61 mycroft * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
87 1.61 mycroft * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
88 1.61 mycroft * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
89 1.61 mycroft * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
90 1.61 mycroft * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
91 1.61 mycroft * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
92 1.61 mycroft * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
93 1.61 mycroft * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
94 1.61 mycroft * SUCH DAMAGE.
95 1.61 mycroft *
96 1.118 fvdl * @(#)init_main.c 8.16 (Berkeley) 5/14/95
97 1.61 mycroft */
98 1.196 lukem
99 1.196 lukem #include <sys/cdefs.h>
100 1.357 ad __KERNEL_RCSID(0, "$NetBSD: init_main.c,v 1.357 2008/05/28 13:35:32 ad Exp $");
101 1.115 mrg
102 1.223 jonathan #include "opt_ipsec.h"
103 1.267 kardel #include "opt_ntp.h"
104 1.198 jdolecek #include "opt_pipe.h"
105 1.267 kardel #include "opt_posix.h"
106 1.172 soren #include "opt_syscall_debug.h"
107 1.267 kardel #include "opt_sysv.h"
108 1.292 ad #include "opt_fileassoc.h"
109 1.292 ad #include "opt_ktrace.h"
110 1.281 elad #include "opt_pax.h"
111 1.61 mycroft
112 1.106 explorer #include "rnd.h"
113 1.305 xtraeme #include "sysmon_envsys.h"
114 1.305 xtraeme #include "sysmon_power.h"
115 1.313 xtraeme #include "sysmon_taskq.h"
116 1.313 xtraeme #include "sysmon_wdog.h"
117 1.276 dogcow #include "veriexec.h"
118 1.106 explorer
119 1.61 mycroft #include <sys/param.h>
120 1.164 enami #include <sys/acct.h>
121 1.61 mycroft #include <sys/filedesc.h>
122 1.131 thorpej #include <sys/file.h>
123 1.61 mycroft #include <sys/errno.h>
124 1.162 thorpej #include <sys/callout.h>
125 1.302 yamt #include <sys/cpu.h>
126 1.61 mycroft #include <sys/kernel.h>
127 1.269 yamt #include <sys/kmem.h>
128 1.61 mycroft #include <sys/mount.h>
129 1.61 mycroft #include <sys/proc.h>
130 1.136 thorpej #include <sys/kthread.h>
131 1.61 mycroft #include <sys/resourcevar.h>
132 1.61 mycroft #include <sys/signalvar.h>
133 1.61 mycroft #include <sys/systm.h>
134 1.61 mycroft #include <sys/vnode.h>
135 1.288 hannken #include <sys/fstrans.h>
136 1.87 thorpej #include <sys/tty.h>
137 1.61 mycroft #include <sys/conf.h>
138 1.95 thorpej #include <sys/disklabel.h>
139 1.61 mycroft #include <sys/buf.h>
140 1.61 mycroft #include <sys/device.h>
141 1.186 jdolecek #include <sys/exec.h>
142 1.128 thorpej #include <sys/socketvar.h>
143 1.61 mycroft #include <sys/protosw.h>
144 1.338 yamt #include <sys/percpu.h>
145 1.342 rmind #include <sys/pset.h>
146 1.338 yamt #include <sys/sysctl.h>
147 1.61 mycroft #include <sys/reboot.h>
148 1.61 mycroft #include <sys/user.h>
149 1.176 thorpej #include <sys/sysctl.h>
150 1.209 jdolecek #include <sys/event.h>
151 1.227 jonathan #include <sys/mbuf.h>
152 1.302 yamt #include <sys/sched.h>
153 1.292 ad #include <sys/sleepq.h>
154 1.284 ad #include <sys/iostat.h>
155 1.304 yamt #include <sys/vmem.h>
156 1.307 ad #include <sys/uuid.h>
157 1.307 ad #include <sys/extent.h>
158 1.309 ad #include <sys/disk.h>
159 1.314 rmind #include <sys/mqueue.h>
160 1.325 ad #include <sys/msgbuf.h>
161 1.340 ad #include <sys/module.h>
162 1.343 ad #include <sys/event.h>
163 1.357 ad #include <sys/lockf.h>
164 1.233 junyoung #ifdef FAST_IPSEC
165 1.223 jonathan #include <netipsec/ipsec.h>
166 1.223 jonathan #endif
167 1.82 christos #ifdef SYSVSHM
168 1.82 christos #include <sys/shm.h>
169 1.82 christos #endif
170 1.233 junyoung #ifdef SYSVSEM
171 1.82 christos #include <sys/sem.h>
172 1.82 christos #endif
173 1.82 christos #ifdef SYSVMSG
174 1.82 christos #include <sys/msg.h>
175 1.82 christos #endif
176 1.217 christos #ifdef P1003_1B_SEMAPHORE
177 1.217 christos #include <sys/ksem.h>
178 1.217 christos #endif
179 1.82 christos #include <sys/domain.h>
180 1.94 mouse #include <sys/namei.h>
181 1.106 explorer #if NRND > 0
182 1.103 explorer #include <sys/rnd.h>
183 1.106 explorer #endif
184 1.192 jdolecek #include <sys/pipe.h>
185 1.210 thorpej #ifdef LKM
186 1.210 thorpej #include <sys/lkm.h>
187 1.210 thorpej #endif
188 1.273 elad #if NVERIEXEC > 0
189 1.245 blymn #include <sys/verified_exec.h>
190 1.273 elad #endif /* NVERIEXEC > 0 */
191 1.292 ad #ifdef KTRACE
192 1.292 ad #include <sys/ktrace.h>
193 1.292 ad #endif
194 1.266 elad #include <sys/kauth.h>
195 1.252 skrll #include <net80211/ieee80211_netbsd.h>
196 1.61 mycroft
197 1.77 christos #include <sys/syscall.h>
198 1.68 cgd #include <sys/syscallargs.h>
199 1.68 cgd
200 1.334 elad #if defined(PAX_MPROTECT) || defined(PAX_SEGVGUARD) || defined(PAX_ASLR)
201 1.281 elad #include <sys/pax.h>
202 1.334 elad #endif /* PAX_MPROTECT || PAX_SEGVGUARD || PAX_ASLR */
203 1.334 elad
204 1.61 mycroft #include <ufs/ufs/quota.h>
205 1.61 mycroft
206 1.159 fvdl #include <miscfs/genfs/genfs.h>
207 1.159 fvdl #include <miscfs/syncfs/syncfs.h>
208 1.159 fvdl
209 1.323 ad #include <sys/cpu.h>
210 1.61 mycroft
211 1.114 mrg #include <uvm/uvm.h>
212 1.114 mrg
213 1.310 xtraeme #if NSYSMON_TASKQ > 0
214 1.310 xtraeme #include <dev/sysmon/sysmon_taskq.h>
215 1.310 xtraeme #endif
216 1.310 xtraeme
217 1.202 lukem #include <dev/cons.h>
218 1.310 xtraeme
219 1.313 xtraeme #if NSYSMON_ENVSYS > 0 || NSYSMON_POWER > 0 || NSYSMON_WDOG > 0
220 1.305 xtraeme #include <dev/sysmon/sysmonvar.h>
221 1.305 xtraeme #endif
222 1.202 lukem
223 1.81 christos #include <net/if.h>
224 1.81 christos #include <net/raw_cb.h>
225 1.61 mycroft
226 1.277 elad #include <secmodel/secmodel.h>
227 1.277 elad
/*
 * Objects defined elsewhere in the kernel that the startup code refers to.
 */
extern struct cwdinfo cwdi0;
extern struct lwp lwp0;
extern struct proc proc0;
extern time_t rootfstime;

/*
 * When curlwp is not provided as a macro, it is an ordinary pointer that
 * initially refers to lwp0.
 */
#ifndef curlwp
struct lwp *curlwp = &lwp0;
#endif

/* Process 1; main() obtains it from fork1(). */
struct proc *initproc;

struct vnode *rootvp;
struct vnode *swapdev_vp;

int boothowto;
int cold = 1;			/* still working on startup */

/* time at system startup - will only follow settime deltas */
struct timeval boottime;

/* semaphore for start_init(): main() sets it once init may exec */
int start_init_exec;

static void start_init(void *);
static void check_console(struct lwp *l);
void main(void);
void ssp_init(void);
249 1.76 cgd
250 1.280 christos #if defined(__SSP__) || defined(__SSP_ALL__)
/*
 * Stack-protector guard words.  They are all zero until ssp_init()
 * overwrites them.
 */
long __stack_chk_guard[8] = { 0 };

void __stack_chk_fail(void);

/*
 * Failure handler for the stack protector: panic the kernel.
 */
void
__stack_chk_fail(void)
{

	panic("stack overflow detected; terminated");
}
259 1.349 ad
260 1.349 ad void
261 1.349 ad ssp_init(void)
262 1.349 ad {
263 1.349 ad int s;
264 1.349 ad
265 1.349 ad #ifdef DIAGNOSTIC
266 1.349 ad printf("Initializing SSP:");
267 1.349 ad #endif
268 1.349 ad /*
269 1.349 ad * We initialize ssp here carefully:
270 1.349 ad * 1. after we got some entropy
271 1.349 ad * 2. without calling a function
272 1.349 ad */
273 1.349 ad size_t i;
274 1.349 ad long guard[__arraycount(__stack_chk_guard)];
275 1.349 ad
276 1.349 ad arc4randbytes(guard, sizeof(guard));
277 1.349 ad s = splhigh();
278 1.349 ad for (i = 0; i < __arraycount(guard); i++)
279 1.349 ad __stack_chk_guard[i] = guard[i];
280 1.349 ad splx(s);
281 1.349 ad #ifdef DIAGNOSTIC
282 1.349 ad for (i = 0; i < __arraycount(guard); i++)
283 1.349 ad printf("%lx ", guard[i]);
284 1.349 ad printf("\n");
285 1.349 ad #endif
286 1.349 ad }
287 1.349 ad #else
/*
 * Variant used when neither __SSP__ nor __SSP_ALL__ is defined: there is
 * no guard to seed, so this does nothing.
 */
void
ssp_init(void)
{
	/* Intentionally empty. */
}
293 1.280 christos #endif
294 1.280 christos
/*
 * Do-nothing security model start routine.  secmodel_start is declared
 * as a weak alias for it, so main()'s call to secmodel_start() lands here
 * unless another definition of secmodel_start is linked in (presumably by
 * a real security model -- confirm against the secmodel sources).
 */
void __secmodel_none(void);
__weak_alias(secmodel_start,__secmodel_none);

void
__secmodel_none(void)
{
	/* No security model to start. */
}
302 1.287 elad
303 1.61 mycroft /*
304 1.61 mycroft * System startup; initialize the world, create process 0, mount root
305 1.61 mycroft * filesystem, and fork to create init and pagedaemon. Most of the
306 1.61 mycroft * hard work is done in the lower-level initialization routines including
307 1.61 mycroft * cpu_startup(), which does the machine-dependent initialization, and
 * configure(), which configures the system hardware.
 *
 * Rough order of events: console, kernel lock, UVM and kmem; kauth and
 * the security model; process 0; scheduler queues and the boot CPU;
 * file systems and descriptors; configure(); IPC and networking; fork of
 * process 1 (init); root file system mount; pagedaemon, syncer and
 * aiodone workers; finally init is told it may exec.
 *
 * Takes no arguments and does not return: its last action is to call
 * uvm_scheduler(), which is an infinite loop.
308 1.61 mycroft */
309 1.81 christos void
310 1.176 thorpej main(void)
311 1.61 mycroft {
312 1.267 kardel struct timeval time; /* snapshot taken after root mount; becomes boottime */
313 1.216 thorpej struct lwp *l;
314 1.144 thorpej struct proc *p;
315 1.204 thorpej int s, error;
316 1.175 jdolecek #ifdef NVNODE_IMPLICIT
317 1.175 jdolecek int usevnodes;
318 1.175 jdolecek #endif
319 1.312 ad CPU_INFO_ITERATOR cii;
320 1.312 ad struct cpu_info *ci;
321 1.61 mycroft
/*
 * Work with lwp0.  Its l_cpu is assigned here only when LWP0_CPU_INFO
 * is not defined.
 */
322 1.216 thorpej l = &lwp0;
323 1.327 matt #ifndef LWP0_CPU_INFO
324 1.216 thorpej l->l_cpu = curcpu();
325 1.327 matt #endif
326 1.233 junyoung
327 1.317 ad /*
328 1.61 mycroft * Attempt to find console and initialize
329 1.61 mycroft * in case of early panic or other messages.
330 1.61 mycroft */
331 1.61 mycroft consinit();
332 1.61 mycroft
333 1.321 ad kernel_lock_init();
334 1.179 thorpej
335 1.114 mrg uvm_init();
336 1.127 thorpej
337 1.269 yamt kmem_init();
338 1.269 yamt
339 1.338 yamt percpu_init();
340 1.338 yamt
341 1.347 ad /* Initialize lock caches. */
342 1.347 ad mutex_obj_init();
343 1.347 ad
344 1.307 ad /* Initialize the extent manager. */
345 1.307 ad extent_init();
346 1.307 ad
347 1.145 thorpej /* Do machine-dependent initialization. */
348 1.145 thorpej cpu_startup();
349 1.162 thorpej
350 1.307 ad /* Initialize callouts, part 1. */
351 1.166 enami callout_startup();
352 1.145 thorpej
353 1.291 elad /*
354 1.291 elad * Initialize the kernel authorization subsystem and start the
355 1.291 elad * default security model, if any. We need to do this early
356 1.291 elad * enough so that subsystems relying on any of the aforementioned
357 1.291 elad * can work properly. Since the security model may dictate the
358 1.291 elad * credential inheritance policy, it is needed at least before
359 1.291 elad * any process is created, specifically proc0.
360 1.291 elad */
361 1.289 elad kauth_init();
362 1.290 elad secmodel_start();
363 1.290 elad
364 1.228 pk /* Initialize the buffer cache */
365 1.228 pk bufinit();
366 1.228 pk
367 1.128 thorpej /* Initialize sockets. */
368 1.128 thorpej soinit();
369 1.127 thorpej
370 1.156 thorpej /*
371 1.212 thorpej * The following things must be done before autoconfiguration.
372 1.156 thorpej */
373 1.212 thorpej evcnt_init(); /* initialize event counters */
374 1.106 explorer #if NRND > 0
375 1.156 thorpej rnd_init(); /* initialize RNG */
376 1.106 explorer #endif
377 1.176 thorpej
378 1.236 simonb /* Initialize process and pgrp structures. */
379 1.63 mycroft procinit();
380 1.279 thorpej lwpinit();
381 1.210 thorpej
382 1.251 junyoung /* Initialize signal-related data structures. */
383 1.251 junyoung signal_init();
384 1.61 mycroft
385 1.333 ad /* Initialize resource management. */
386 1.333 ad resource_init();
387 1.333 ad
388 1.251 junyoung /* Create process 0 (the swapper). */
389 1.251 junyoung proc0_init();
390 1.61 mycroft
391 1.307 ad /* Initialize the UID hash table. */
392 1.307 ad uid_init();
393 1.307 ad
394 1.307 ad /* Charge root for one process. */
395 1.61 mycroft (void)chgproccnt(0, 1);
396 1.61 mycroft
397 1.330 ad /* Initialize timekeeping. */
398 1.330 ad time_init();
399 1.330 ad
400 1.292 ad /* Initialize the run queues, turnstiles and sleep queues. */
401 1.312 ad mutex_init(&cpu_lock, MUTEX_DEFAULT, IPL_NONE);
402 1.302 yamt sched_rqinit();
403 1.292 ad turnstile_init();
404 1.292 ad sleeptab_init(&sleeptab);
405 1.292 ad
406 1.339 rmind /* Initialize processor-sets */
407 1.339 rmind psets_init();
408 1.339 rmind
409 1.302 yamt /* MI initialization of the boot cpu */
410 1.302 yamt error = mi_cpu_attach(curcpu());
/*
 * NOTE(review): the result is checked only by KASSERT; presumably that
 * check is compiled out of non-DIAGNOSTIC kernels -- confirm.
 */
411 1.302 yamt KASSERT(error == 0);
412 1.302 yamt
413 1.350 ad /* Initialize timekeeping, part 2. */
414 1.350 ad time_init2();
415 1.350 ad
416 1.338 yamt /*
417 1.338 yamt * Initialize mbuf's. Do this now because we might attempt to
418 1.338 yamt * allocate mbufs or mbuf clusters during autoconfiguration.
419 1.338 yamt */
420 1.338 yamt mbinit();
421 1.338 yamt
422 1.292 ad /* Initialize the sysctl subsystem. */
423 1.292 ad sysctl_init();
424 1.61 mycroft
425 1.284 ad /* Initialize I/O statistics. */
426 1.284 ad iostat_init();
427 1.284 ad
428 1.325 ad /* Initialize the log device. */
429 1.325 ad loginit();
430 1.325 ad
431 1.355 ad /* Start module system. */
432 1.355 ad module_init();
433 1.355 ad
434 1.61 mycroft /* Initialize the file systems. */
435 1.194 matt #ifdef NVNODE_IMPLICIT
436 1.194 matt /*
437 1.194 matt * If maximum number of vnodes in namei vnode cache is not explicitly
438 1.194 matt * defined in kernel config, adjust the number such as we use roughly
439 1.232 tls * 1.0% of memory for vnode cache (but not less than NVNODE vnodes).
 * The computed value only ever raises desiredvnodes, never lowers it.
440 1.194 matt */
441 1.346 yamt usevnodes =
442 1.346 yamt calc_cache_size(kernel_map, 1, VNODE_VA_MAXPCT) / sizeof(vnode_t);
443 1.205 sommerfe if (usevnodes > desiredvnodes)
444 1.194 matt desiredvnodes = usevnodes;
445 1.194 matt #endif
446 1.61 mycroft vfsinit();
447 1.357 ad lf_init();
448 1.61 mycroft
449 1.288 hannken /* Initialize fstrans. */
450 1.288 hannken fstrans_init();
451 1.267 kardel
452 1.319 ad /* Initialize the file descriptor system. */
453 1.343 ad fd_sys_init();
454 1.319 ad
455 1.344 ad /* Initialize kqueue. */
456 1.343 ad kqueue_init();
457 1.307 ad
458 1.303 rmind /* Initialize asynchronous I/O. */
459 1.303 rmind aio_sysinit();
460 1.303 rmind
461 1.314 rmind /* Initialize message queues. */
462 1.314 rmind mqueue_sysinit();
463 1.314 rmind
464 1.313 xtraeme /* Initialize the system monitor subsystems. */
465 1.310 xtraeme #if NSYSMON_TASKQ > 0
466 1.310 xtraeme sysmon_task_queue_preinit();
467 1.310 xtraeme #endif
468 1.310 xtraeme
469 1.305 xtraeme #if NSYSMON_ENVSYS > 0
470 1.305 xtraeme sysmon_envsys_init();
471 1.305 xtraeme #endif
472 1.310 xtraeme
473 1.305 xtraeme #if NSYSMON_POWER > 0
474 1.305 xtraeme sysmon_power_init();
475 1.305 xtraeme #endif
476 1.313 xtraeme
477 1.313 xtraeme #if NSYSMON_WDOG > 0
478 1.313 xtraeme sysmon_wdog_init();
479 1.313 xtraeme #endif
480 1.313 xtraeme
481 1.268 kardel inittimecounter();
482 1.267 kardel ntp_init();
483 1.267 kardel
484 1.307 ad /* Initialize the device switch tables. */
485 1.307 ad devsw_init();
486 1.307 ad
487 1.326 ad /* Initialize tty subsystem. */
488 1.326 ad tty_init();
489 1.326 ad ttyldisc_init();
490 1.326 ad
491 1.336 ad /* Initialize the buffer cache, part 2. */
492 1.336 ad bufinit2();
493 1.336 ad
494 1.309 ad /* Initialize the disk wedge subsystem. */
495 1.309 ad dkwedge_init();
496 1.309 ad
497 1.156 thorpej /* Configure the system hardware. This will enable interrupts. */
498 1.156 thorpej configure();
499 1.61 mycroft
500 1.185 chs ubc_init(); /* must be after autoconfig */
501 1.185 chs
502 1.61 mycroft #ifdef SYSVSHM
503 1.61 mycroft /* Initialize System V style shared memory. */
504 1.61 mycroft shminit();
505 1.61 mycroft #endif
506 1.61 mycroft
507 1.61 mycroft #ifdef SYSVSEM
508 1.61 mycroft /* Initialize System V style semaphores. */
509 1.61 mycroft seminit();
510 1.61 mycroft #endif
511 1.61 mycroft
512 1.61 mycroft #ifdef SYSVMSG
513 1.61 mycroft /* Initialize System V style message queues. */
514 1.61 mycroft msginit();
515 1.61 mycroft #endif
516 1.61 mycroft
517 1.217 christos #ifdef P1003_1B_SEMAPHORE
518 1.217 christos /* Initialize posix semaphores */
519 1.217 christos ksem_init();
520 1.217 christos #endif
521 1.245 blymn
522 1.273 elad #if NVERIEXEC > 0
523 1.283 elad /*
524 1.283 elad * Initialise the Veriexec subsystem.
525 1.283 elad */
526 1.283 elad veriexec_init();
527 1.273 elad #endif /* NVERIEXEC > 0 */
528 1.251 junyoung
529 1.334 elad #if defined(PAX_MPROTECT) || defined(PAX_SEGVGUARD) || defined(PAX_ASLR)
530 1.281 elad pax_init();
531 1.334 elad #endif /* PAX_MPROTECT || PAX_SEGVGUARD || PAX_ASLR */
532 1.281 elad
533 1.223 jonathan #ifdef FAST_IPSEC
534 1.223 jonathan /* Attach network crypto subsystem */
535 1.223 jonathan ipsec_attach();
536 1.223 jonathan #endif
537 1.61 mycroft
538 1.61 mycroft /*
539 1.61 mycroft * Initialize protocols. Block reception of incoming packets
540 1.61 mycroft * until everything is ready.
541 1.61 mycroft */
542 1.190 thorpej s = splnet();
543 1.61 mycroft ifinit();
544 1.61 mycroft domaininit();
545 1.200 itojun if_attachdomain();
546 1.61 mycroft splx(s);
547 1.61 mycroft
548 1.61 mycroft #ifdef GPROF
549 1.61 mycroft /* Initialize kernel profiling. */
550 1.61 mycroft kmstartup();
551 1.61 mycroft #endif
552 1.164 enami
553 1.351 sborrill /* Initialize system accounting. */
554 1.164 enami acct_init();
555 1.61 mycroft
556 1.301 ad #ifndef PIPE_SOCKETPAIR
557 1.300 ad /* Initialize pipes. */
558 1.300 ad pipe_init();
559 1.301 ad #endif
560 1.300 ad
561 1.292 ad #ifdef KTRACE
562 1.292 ad /* Initialize ktrace. */
563 1.292 ad ktrinit();
564 1.292 ad #endif
565 1.292 ad
566 1.307 ad /* Initialize the UUID system calls. */
567 1.307 ad uuid_init();
568 1.307 ad
569 1.163 thorpej /*
570 1.163 thorpej * Create process 1 (init(8)). We do this now, as Unix has
571 1.163 thorpej * historically had init be process 1, and changing this would
572 1.163 thorpej * probably upset a lot of people.
573 1.163 thorpej *
574 1.163 thorpej * Note that process 1 won't immediately exec init(8), but will
575 1.163 thorpej * wait for us to inform it that the root file system has been
576 1.163 thorpej * mounted.
 *
 * The new process starts in start_init() and is recorded in initproc.
577 1.163 thorpej */
578 1.216 thorpej if (fork1(l, 0, SIGCHLD, NULL, 0, start_init, NULL, NULL, &initproc))
579 1.163 thorpej panic("fork init");
580 1.163 thorpej
581 1.163 thorpej /*
582 1.340 ad * Load any remaining builtin modules, and hand back temporary
583 1.340 ad * storage to the VM system.
584 1.340 ad */
585 1.340 ad module_init_class(MODULE_CLASS_ANY);
586 1.340 ad module_jettison();
587 1.340 ad
588 1.340 ad /*
589 1.208 thorpej * Finalize configuration now that all real devices have been
590 1.208 thorpej * found. This needs to be done before the root device is
591 1.208 thorpej * selected, since finalization may create the root device.
592 1.208 thorpej */
593 1.208 thorpej config_finalize();
594 1.163 thorpej
595 1.163 thorpej /*
596 1.163 thorpej * Now that autoconfiguration has completed, we can determine
597 1.163 thorpej * the root and dump devices.
598 1.163 thorpej */
599 1.98 gwr cpu_rootconf();
600 1.101 thorpej cpu_dumpconf();
601 1.61 mycroft
602 1.61 mycroft /* Mount the root file system. */
/*
 * Keep trying until vfs_mountroot() succeeds.  After each failure the
 * error is printed, RB_ASKNAME is set in boothowto and setroot() is
 * called again before the next attempt.
 */
603 1.95 thorpej do {
604 1.95 thorpej domountroothook();
605 1.95 thorpej if ((error = vfs_mountroot())) {
606 1.97 thorpej printf("cannot mount root, error = %d\n", error);
607 1.95 thorpej boothowto |= RB_ASKNAME;
608 1.95 thorpej setroot(root_device,
609 1.152 thorpej (rootdev != NODEV) ? DISKPART(rootdev) : 0);
610 1.95 thorpej }
611 1.95 thorpej } while (error != 0);
612 1.95 thorpej mountroothook_destroy();
613 1.95 thorpej
614 1.239 pk /*
615 1.239 pk * Initialise the time-of-day clock, passing the time recorded
616 1.239 pk * in the root filesystem (if any) for use by systems that
617 1.239 pk * don't have a non-volatile time-of-day device.
618 1.239 pk */
619 1.239 pk inittodr(rootfstime);
620 1.239 pk
/* Mark the first entry of mountlist as the root file system. */
621 1.206 matt CIRCLEQ_FIRST(&mountlist)->mnt_flag |= MNT_ROOTFS;
622 1.206 matt CIRCLEQ_FIRST(&mountlist)->mnt_op->vfs_refcount++;
623 1.61 mycroft
624 1.111 thorpej /*
625 1.111 thorpej * Get the vnode for '/'. Set cwdi0.cwdi_cdir to
626 1.111 thorpej * reference it.
627 1.111 thorpej */
628 1.243 mycroft error = VFS_ROOT(CIRCLEQ_FIRST(&mountlist), &rootvnode);
629 1.243 mycroft if (error)
630 1.243 mycroft panic("cannot find root vnode, error=%d", error);
631 1.148 thorpej cwdi0.cwdi_cdir = rootvnode;
632 1.148 thorpej VREF(cwdi0.cwdi_cdir);
633 1.118 fvdl VOP_UNLOCK(rootvnode, 0);
634 1.148 thorpej cwdi0.cwdi_rdir = NULL;
635 1.163 thorpej
636 1.163 thorpej /*
637 1.163 thorpej * Now that root is mounted, we can fixup initproc's CWD
638 1.163 thorpej * info. All other processes are kthreads, which merely
639 1.163 thorpej * share proc0's CWD info.
640 1.163 thorpej */
641 1.163 thorpej initproc->p_cwdi->cwdi_cdir = rootvnode;
642 1.163 thorpej VREF(initproc->p_cwdi->cwdi_cdir);
643 1.163 thorpej initproc->p_cwdi->cwdi_rdir = NULL;
644 1.61 mycroft
645 1.61 mycroft /*
646 1.61 mycroft * Now can look at time, having had a chance to verify the time
647 1.292 ad * from the file system. Reset every LWP's l_rtime as it may have been
648 1.61 mycroft * munched in mi_switch() after the time got set.
 *
 * Every process on allproc also gets the same p_start.  Note that
 * the inner loop reuses `l' as its iterator, so `l' no longer
 * refers to lwp0 once the loops finish.
649 1.61 mycroft */
650 1.267 kardel getmicrotime(&time);
651 1.267 kardel boottime = time;
652 1.352 ad mutex_enter(proc_lock);
653 1.225 jdolecek LIST_FOREACH(p, &allproc, p_list) {
654 1.295 pavel KASSERT((p->p_flag & PK_MARKER) == 0);
655 1.353 ad mutex_enter(p->p_lock);
656 1.267 kardel p->p_stats->p_start = time;
657 1.225 jdolecek LIST_FOREACH(l, &p->p_lwps, l_sibling) {
658 1.292 ad lwp_lock(l);
659 1.332 yamt memset(&l->l_rtime, 0, sizeof(l->l_rtime));
660 1.292 ad lwp_unlock(l);
661 1.225 jdolecek }
662 1.353 ad mutex_exit(p->p_lock);
663 1.163 thorpej }
664 1.352 ad mutex_exit(proc_lock);
665 1.332 yamt binuptime(&curlwp->l_stime);
666 1.61 mycroft
/* Record time_second in every CPU's scheduler state. */
667 1.312 ad for (CPU_INFO_FOREACH(cii, ci)) {
668 1.312 ad ci->ci_schedstate.spc_lastmod = time_second;
669 1.312 ad }
670 1.312 ad
671 1.163 thorpej /* Create the pageout daemon kernel thread. */
672 1.163 thorpej uvm_swap_init();
673 1.336 ad if (kthread_create(PRI_PGDAEMON, KTHREAD_MPSAFE, NULL, uvm_pageout,
674 1.307 ad NULL, NULL, "pgdaemon"))
675 1.135 thorpej panic("fork pagedaemon");
676 1.61 mycroft
677 1.163 thorpej /* Create the filesystem syncer kernel thread. */
678 1.336 ad if (kthread_create(PRI_IOFLUSH, KTHREAD_MPSAFE, NULL, sched_sync,
679 1.336 ad NULL, NULL, "ioflush"))
680 1.159 fvdl panic("fork syncer");
681 1.185 chs
682 1.185 chs /* Create the "aiodoned" workqueue, which runs uvm_aiodone_worker. */
683 1.286 yamt if (workqueue_create(&uvm.aiodone_queue, "aiodoned",
684 1.336 ad uvm_aiodone_worker, NULL, PRI_VM, IPL_NONE, WQ_MPSAFE))
685 1.185 chs panic("fork aiodoned");
686 1.137 thorpej
687 1.304 yamt vmem_rehash_start();
688 1.304 yamt
689 1.186 jdolecek /* Initialize exec structures */
690 1.186 jdolecek exec_init(1);
691 1.192 jdolecek
692 1.163 thorpej /*
693 1.163 thorpej * Okay, now we can let init(8) exec! It's off to userland!
 *
 * start_init() waits on lbolt, holding proc_lock, until
 * start_init_exec becomes nonzero; set the flag and wake it.
694 1.163 thorpej */
695 1.356 ad mutex_enter(proc_lock);
696 1.163 thorpej start_init_exec = 1;
697 1.356 ad cv_broadcast(&lbolt);
698 1.356 ad mutex_exit(proc_lock);
699 1.163 thorpej
700 1.61 mycroft /* The scheduler is an infinite loop. */
701 1.114 mrg uvm_scheduler();
702 1.61 mycroft /* NOTREACHED */
703 1.61 mycroft }
704 1.61 mycroft
705 1.93 mouse static void
706 1.260 christos check_console(struct lwp *l)
707 1.93 mouse {
708 1.93 mouse struct nameidata nd;
709 1.93 mouse int error;
710 1.93 mouse
711 1.331 pooka NDINIT(&nd, LOOKUP, FOLLOW, UIO_SYSSPACE, "/dev/console");
712 1.93 mouse error = namei(&nd);
713 1.96 cgd if (error == 0)
714 1.96 cgd vrele(nd.ni_vp);
715 1.96 cgd else if (error == ENOENT)
716 1.96 cgd printf("warning: no /dev/console\n");
717 1.93 mouse else
718 1.96 cgd printf("warning: lookup /dev/console: error %d\n", error);
719 1.93 mouse }
720 1.93 mouse
/*
 * Candidate pathnames for the "init" program, in the order in which
 * they are attempted.  The table ends with a NULL entry.
 */
static const char * const initpaths[] = {
	"/sbin/init",		/* first choice */
	"/sbin/oinit",		/* second choice */
	"/sbin/init.bak",	/* last choice */
	NULL			/* end of list */
};
730 1.61 mycroft
731 1.61 mycroft /*
732 1.61 mycroft * Start the initial user process; try exec'ing each pathname in "initpaths".
733 1.61 mycroft * The program is invoked with one argument containing the boot flags.
734 1.61 mycroft */
735 1.61 mycroft static void
736 1.176 thorpej start_init(void *arg)
737 1.61 mycroft {
738 1.216 thorpej struct lwp *l = arg;
739 1.216 thorpej struct proc *p = l->l_proc;
740 1.130 eeh vaddr_t addr;
741 1.78 mycroft struct sys_execve_args /* {
742 1.108 mycroft syscallarg(const char *) path;
743 1.92 cgd syscallarg(char * const *) argp;
744 1.92 cgd syscallarg(char * const *) envp;
745 1.68 cgd } */ args;
746 1.68 cgd int options, i, error;
747 1.68 cgd register_t retval[2];
748 1.66 mycroft char flags[4], *flagsp;
749 1.202 lukem const char *path, *slash;
750 1.176 thorpej char *ucp, **uap, *arg0, *arg1 = NULL;
751 1.202 lukem char ipath[129];
752 1.202 lukem int ipx, len;
753 1.61 mycroft
754 1.76 cgd /*
755 1.76 cgd * Now in process 1.
756 1.76 cgd */
757 1.146 gwr strncpy(p->p_comm, "init", MAXCOMLEN);
758 1.163 thorpej
759 1.163 thorpej /*
760 1.163 thorpej * Wait for main() to tell us that it's safe to exec.
761 1.163 thorpej */
762 1.356 ad mutex_enter(proc_lock);
763 1.163 thorpej while (start_init_exec == 0)
764 1.356 ad cv_wait(&lbolt, proc_lock);
765 1.356 ad mutex_exit(proc_lock);
766 1.93 mouse
767 1.93 mouse /*
768 1.93 mouse * This is not the right way to do this. We really should
769 1.93 mouse * hand-craft a descriptor onto /dev/console to hand to init,
770 1.93 mouse * but that's a _lot_ more work, and the benefit from this easy
771 1.93 mouse * hack makes up for the "good is the enemy of the best" effect.
772 1.93 mouse */
773 1.260 christos check_console(l);
774 1.61 mycroft
775 1.61 mycroft /*
776 1.61 mycroft * Need just enough stack to hold the faked-up "execve()" arguments.
777 1.61 mycroft */
778 1.211 chs addr = (vaddr_t)STACK_ALLOC(USRSTACK, PAGE_SIZE);
779 1.205 sommerfe if (uvm_map(&p->p_vmspace->vm_map, &addr, PAGE_SIZE,
780 1.181 thorpej NULL, UVM_UNKNOWN_OFFSET, 0,
781 1.114 mrg UVM_MAPFLAG(UVM_PROT_ALL, UVM_PROT_ALL, UVM_INH_COPY,
782 1.114 mrg UVM_ADV_NORMAL,
783 1.189 chs UVM_FLAG_FIXED|UVM_FLAG_OVERLAY|UVM_FLAG_COPYONW)) != 0)
784 1.114 mrg panic("init: couldn't allocate argument space");
785 1.297 christos p->p_vmspace->vm_maxsaddr = (void *)STACK_MAX(addr, PAGE_SIZE);
786 1.61 mycroft
787 1.202 lukem ipx = 0;
788 1.202 lukem while (1) {
789 1.202 lukem if (boothowto & RB_ASKNAME) {
790 1.202 lukem printf("init path");
791 1.202 lukem if (initpaths[ipx])
792 1.202 lukem printf(" (default %s)", initpaths[ipx]);
793 1.202 lukem printf(": ");
794 1.202 lukem len = cngetsn(ipath, sizeof(ipath)-1);
795 1.202 lukem if (len == 0) {
796 1.202 lukem if (initpaths[ipx])
797 1.202 lukem path = initpaths[ipx++];
798 1.202 lukem else
799 1.202 lukem continue;
800 1.202 lukem } else {
801 1.202 lukem ipath[len] = '\0';
802 1.202 lukem path = ipath;
803 1.202 lukem }
804 1.202 lukem } else {
805 1.202 lukem if ((path = initpaths[ipx++]) == NULL)
806 1.202 lukem break;
807 1.202 lukem }
808 1.202 lukem
809 1.211 chs ucp = (char *)USRSTACK;
810 1.64 mycroft
811 1.61 mycroft /*
812 1.64 mycroft * Construct the boot flag argument.
813 1.61 mycroft */
814 1.66 mycroft flagsp = flags;
815 1.66 mycroft *flagsp++ = '-';
816 1.61 mycroft options = 0;
817 1.66 mycroft
818 1.61 mycroft if (boothowto & RB_SINGLE) {
819 1.64 mycroft *flagsp++ = 's';
820 1.61 mycroft options = 1;
821 1.61 mycroft }
822 1.61 mycroft #ifdef notyet
823 1.61 mycroft if (boothowto & RB_FASTBOOT) {
824 1.64 mycroft *flagsp++ = 'f';
825 1.61 mycroft options = 1;
826 1.61 mycroft }
827 1.61 mycroft #endif
828 1.64 mycroft
829 1.64 mycroft /*
830 1.64 mycroft * Move out the flags (arg 1), if necessary.
831 1.64 mycroft */
832 1.64 mycroft if (options != 0) {
833 1.64 mycroft *flagsp++ = '\0';
834 1.64 mycroft i = flagsp - flags;
835 1.64 mycroft #ifdef DEBUG
836 1.90 christos printf("init: copying out flags `%s' %d\n", flags, i);
837 1.64 mycroft #endif
838 1.211 chs arg1 = STACK_ALLOC(ucp, i);
839 1.211 chs ucp = STACK_MAX(arg1, i);
840 1.297 christos (void)copyout((void *)flags, arg1, i);
841 1.64 mycroft }
842 1.61 mycroft
843 1.61 mycroft /*
844 1.61 mycroft * Move out the file name (also arg 0).
845 1.61 mycroft */
846 1.64 mycroft i = strlen(path) + 1;
847 1.64 mycroft #ifdef DEBUG
848 1.90 christos printf("init: copying out path `%s' %d\n", path, i);
849 1.202 lukem #else
850 1.203 lukem if (boothowto & RB_ASKNAME || path != initpaths[0])
851 1.202 lukem printf("init: trying %s\n", path);
852 1.64 mycroft #endif
853 1.211 chs arg0 = STACK_ALLOC(ucp, i);
854 1.211 chs ucp = STACK_MAX(arg0, i);
855 1.247 christos (void)copyout(path, arg0, i);
856 1.61 mycroft
857 1.61 mycroft /*
858 1.61 mycroft * Move out the arg pointers.
859 1.61 mycroft */
860 1.297 christos ucp = (void *)STACK_ALIGN(ucp, ALIGNBYTES);
861 1.211 chs uap = (char **)STACK_ALLOC(ucp, sizeof(char *) * 3);
862 1.211 chs SCARG(&args, path) = arg0;
863 1.211 chs SCARG(&args, argp) = uap;
864 1.211 chs SCARG(&args, envp) = NULL;
865 1.142 mycroft slash = strrchr(path, '/');
866 1.142 mycroft if (slash)
867 1.297 christos (void)suword((void *)uap++,
868 1.142 mycroft (long)arg0 + (slash + 1 - path));
869 1.142 mycroft else
870 1.297 christos (void)suword((void *)uap++, (long)arg0);
871 1.211 chs if (options != 0)
872 1.297 christos (void)suword((void *)uap++, (long)arg1);
873 1.297 christos (void)suword((void *)uap++, 0); /* terminator */
874 1.61 mycroft
875 1.61 mycroft /*
876 1.61 mycroft * Now try to exec the program. If can't for any reason
877 1.61 mycroft * other than it doesn't exist, complain.
878 1.61 mycroft */
879 1.260 christos error = sys_execve(l, &args, retval);
880 1.179 thorpej if (error == 0 || error == EJUSTRETURN) {
881 1.292 ad KERNEL_UNLOCK_LAST(l);
882 1.61 mycroft return;
883 1.179 thorpej }
884 1.202 lukem printf("exec %s: error %d\n", path, error);
885 1.61 mycroft }
886 1.90 christos printf("init: not found\n");
887 1.61 mycroft panic("no init");
888 1.61 mycroft }
889 1.345 yamt
890 1.345 yamt /*
891 1.345 yamt * calculate cache size from physmem and vm_map size.
892 1.345 yamt */
893 1.345 yamt vaddr_t
894 1.346 yamt calc_cache_size(struct vm_map *map, int pct, int va_pct)
895 1.345 yamt {
896 1.345 yamt paddr_t t;
897 1.345 yamt
898 1.345 yamt /* XXX should consider competing cache if any */
899 1.345 yamt /* XXX should consider submaps */
900 1.346 yamt t = (uintmax_t)physmem * pct / 100 * PAGE_SIZE;
901 1.346 yamt if (map != NULL) {
902 1.346 yamt vsize_t vsize;
903 1.346 yamt
904 1.346 yamt vsize = vm_map_max(map) - vm_map_min(map);
905 1.346 yamt vsize = (uintmax_t)vsize * va_pct / 100;
906 1.346 yamt if (t > vsize) {
907 1.346 yamt t = vsize;
908 1.346 yamt }
909 1.345 yamt }
910 1.345 yamt return t;
911 1.345 yamt }
912