kern_sysctl.c revision 1.233 1 1.233 tls /* $NetBSD: kern_sysctl.c,v 1.233 2011/11/19 22:51:25 tls Exp $ */
2 1.153 atatat
3 1.153 atatat /*-
4 1.213 ad * Copyright (c) 2003, 2007, 2008 The NetBSD Foundation, Inc.
5 1.153 atatat * All rights reserved.
6 1.153 atatat *
7 1.153 atatat * This code is derived from software contributed to The NetBSD Foundation
8 1.153 atatat * by Andrew Brown.
9 1.153 atatat *
10 1.153 atatat * Redistribution and use in source and binary forms, with or without
11 1.153 atatat * modification, are permitted provided that the following conditions
12 1.153 atatat * are met:
13 1.153 atatat * 1. Redistributions of source code must retain the above copyright
14 1.153 atatat * notice, this list of conditions and the following disclaimer.
15 1.153 atatat * 2. Redistributions in binary form must reproduce the above copyright
16 1.153 atatat * notice, this list of conditions and the following disclaimer in the
17 1.153 atatat * documentation and/or other materials provided with the distribution.
18 1.153 atatat *
19 1.153 atatat * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
20 1.153 atatat * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
21 1.153 atatat * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
22 1.153 atatat * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
23 1.153 atatat * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
24 1.153 atatat * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
25 1.153 atatat * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
26 1.153 atatat * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
27 1.153 atatat * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
28 1.153 atatat * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
29 1.153 atatat * POSSIBILITY OF SUCH DAMAGE.
30 1.153 atatat */
31 1.2 cgd
32 1.1 cgd /*-
33 1.1 cgd * Copyright (c) 1982, 1986, 1989, 1993
34 1.1 cgd * The Regents of the University of California. All rights reserved.
35 1.1 cgd *
36 1.1 cgd * This code is derived from software contributed to Berkeley by
37 1.1 cgd * Mike Karels at Berkeley Software Design, Inc.
38 1.1 cgd *
39 1.1 cgd * Redistribution and use in source and binary forms, with or without
40 1.1 cgd * modification, are permitted provided that the following conditions
41 1.1 cgd * are met:
42 1.1 cgd * 1. Redistributions of source code must retain the above copyright
43 1.1 cgd * notice, this list of conditions and the following disclaimer.
44 1.1 cgd * 2. Redistributions in binary form must reproduce the above copyright
45 1.1 cgd * notice, this list of conditions and the following disclaimer in the
46 1.1 cgd * documentation and/or other materials provided with the distribution.
47 1.140 agc * 3. Neither the name of the University nor the names of its contributors
48 1.1 cgd * may be used to endorse or promote products derived from this software
49 1.1 cgd * without specific prior written permission.
50 1.1 cgd *
51 1.1 cgd * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
52 1.1 cgd * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
53 1.1 cgd * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
54 1.1 cgd * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
55 1.1 cgd * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
56 1.1 cgd * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
57 1.1 cgd * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
58 1.1 cgd * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
59 1.1 cgd * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
60 1.1 cgd * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
61 1.1 cgd * SUCH DAMAGE.
62 1.1 cgd *
63 1.34 fvdl * @(#)kern_sysctl.c 8.9 (Berkeley) 5/20/95
64 1.1 cgd */
65 1.1 cgd
66 1.1 cgd /*
67 1.1 cgd * sysctl system call.
68 1.1 cgd */
69 1.97 lukem
70 1.97 lukem #include <sys/cdefs.h>
71 1.233 tls __KERNEL_RCSID(0, "$NetBSD: kern_sysctl.c,v 1.233 2011/11/19 22:51:25 tls Exp $");
72 1.30 thorpej
73 1.52 bouyer #include "opt_defcorename.h"
74 1.153 atatat #include "ksyms.h"
75 1.1 cgd
76 1.1 cgd #include <sys/param.h>
77 1.164 atatat #define __COMPAT_SYSCTL
78 1.153 atatat #include <sys/sysctl.h>
79 1.1 cgd #include <sys/systm.h>
80 1.62 simonb #include <sys/buf.h>
81 1.153 atatat #include <sys/ksyms.h>
82 1.1 cgd #include <sys/malloc.h>
83 1.62 simonb #include <sys/mount.h>
84 1.62 simonb #include <sys/syscallargs.h>
85 1.196 elad #include <sys/kauth.h>
86 1.203 manu #include <sys/ktrace.h>
87 1.233 tls #include <sys/cprng.h>
88 1.153 atatat
89 1.197 christos #define MAXDESCLEN 1024
90 1.153 atatat MALLOC_DEFINE(M_SYSCTLNODE, "sysctlnode", "sysctl node structures");
91 1.153 atatat MALLOC_DEFINE(M_SYSCTLDATA, "sysctldata", "misc sysctl data");
92 1.153 atatat
93 1.183 atatat static int sysctl_mmap(SYSCTLFN_PROTO);
94 1.153 atatat static int sysctl_alloc(struct sysctlnode *, int);
95 1.153 atatat static int sysctl_realloc(struct sysctlnode *);
96 1.38 jonathan
97 1.162 atatat static int sysctl_cvt_in(struct lwp *, int *, const void *, size_t,
98 1.162 atatat struct sysctlnode *);
99 1.162 atatat static int sysctl_cvt_out(struct lwp *, int, const struct sysctlnode *,
100 1.162 atatat void *, size_t, size_t *);
101 1.162 atatat
102 1.183 atatat static int sysctl_log_add(struct sysctllog **, const struct sysctlnode *);
103 1.163 atatat static int sysctl_log_realloc(struct sysctllog *);
104 1.163 atatat
105 1.221 pooka typedef void (*sysctl_setup_func)(struct sysctllog **);
106 1.221 pooka
/*
 * Log object passed to sysctl_log_add() and sysctl_log_realloc().
 *
 * NOTE(review): the code that fills these fields is not visible in this
 * part of the file; presumably log_root is the tree the log belongs to,
 * log_num is the storage for the recorded mib numbers, and
 * log_size/log_left track its capacity and free space -- confirm
 * against sysctl_log_add().
 */
struct sysctllog {
	const struct sysctlnode	*log_root;
	int			*log_num;
	int			 log_size;
	int			 log_left;
};
112 1.163 atatat
113 1.153 atatat /*
114 1.153 atatat * the "root" of the new sysctl tree
115 1.153 atatat */
116 1.178 heas struct sysctlnode sysctl_root = {
117 1.161 atatat .sysctl_flags = SYSCTL_VERSION|
118 1.161 atatat CTLFLAG_ROOT|CTLFLAG_READWRITE|
119 1.153 atatat CTLTYPE_NODE,
120 1.153 atatat .sysctl_num = 0,
121 1.167 atatat /*
122 1.167 atatat * XXX once all ports are on gcc3, we can get rid of this
123 1.167 atatat * ugliness and simply make it into
124 1.167 atatat *
125 1.167 atatat * .sysctl_size = sizeof(struct sysctlnode),
126 1.167 atatat */
127 1.173 atatat sysc_init_field(_sysctl_size, sizeof(struct sysctlnode)),
128 1.153 atatat .sysctl_name = "(root)",
129 1.153 atatat };
130 1.69 simonb
131 1.153 atatat /*
132 1.153 atatat * link set of functions that add nodes at boot time (see also
133 1.153 atatat * sysctl_buildtree())
134 1.153 atatat */
135 1.153 atatat __link_set_decl(sysctl_funcs, sysctl_setup_func);
136 1.74 simonb
137 1.153 atatat /*
138 1.213 ad * The `sysctl_treelock' is intended to serialize access to the sysctl
139 1.213 ad * tree. XXX This has serious problems; allocating memory and
140 1.213 ad * copying data out with the lock held is insane.
141 1.153 atatat */
142 1.208 ad krwlock_t sysctl_treelock;
143 1.90 jdolecek
144 1.228 pooka kmutex_t sysctl_file_marker_lock;
145 1.228 pooka
146 1.153 atatat /*
147 1.153 atatat * Attributes stored in the kernel.
148 1.153 atatat */
149 1.153 atatat char hostname[MAXHOSTNAMELEN];
150 1.153 atatat int hostnamelen;
151 1.31 mrg
152 1.153 atatat char domainname[MAXHOSTNAMELEN];
153 1.153 atatat int domainnamelen;
154 1.109 itojun
155 1.153 atatat long hostid;
156 1.62 simonb
157 1.153 atatat #ifndef DEFCORENAME
158 1.153 atatat #define DEFCORENAME "%n.core"
159 1.80 bjh21 #endif
160 1.153 atatat char defcorename[MAXPATHLEN] = DEFCORENAME;
161 1.62 simonb
162 1.233 tls cprng_strong_t *sysctl_prng;
163 1.233 tls
164 1.75 thorpej /*
165 1.153 atatat * ********************************************************************
166 1.153 atatat * Section 0: Some simple glue
167 1.153 atatat * ********************************************************************
168 1.153 atatat * By wrapping copyin(), copyout(), and copyinstr() like this, we can
169 1.153 atatat * stop caring about who's calling us and simplify some code a bunch.
170 1.153 atatat * ********************************************************************
171 1.75 thorpej */
172 1.230 pooka int
173 1.203 manu sysctl_copyin(struct lwp *l, const void *uaddr, void *kaddr, size_t len)
174 1.153 atatat {
175 1.203 manu int error;
176 1.203 manu
177 1.203 manu if (l != NULL) {
178 1.203 manu error = copyin(uaddr, kaddr, len);
179 1.210 ad ktrmibio(-1, UIO_WRITE, uaddr, len, error);
180 1.203 manu } else {
181 1.203 manu error = kcopy(uaddr, kaddr, len);
182 1.203 manu }
183 1.153 atatat
184 1.203 manu return error;
185 1.153 atatat }
186 1.153 atatat
187 1.230 pooka int
188 1.203 manu sysctl_copyout(struct lwp *l, const void *kaddr, void *uaddr, size_t len)
189 1.153 atatat {
190 1.203 manu int error;
191 1.153 atatat
192 1.203 manu if (l != NULL) {
193 1.203 manu error = copyout(kaddr, uaddr, len);
194 1.210 ad ktrmibio(-1, UIO_READ, uaddr, len, error);
195 1.203 manu } else {
196 1.203 manu error = kcopy(kaddr, uaddr, len);
197 1.203 manu }
198 1.203 manu
199 1.203 manu return error;
200 1.153 atatat }
201 1.153 atatat
202 1.230 pooka int
203 1.203 manu sysctl_copyinstr(struct lwp *l, const void *uaddr, void *kaddr,
204 1.153 atatat size_t len, size_t *done)
205 1.153 atatat {
206 1.203 manu int error;
207 1.203 manu
208 1.203 manu if (l != NULL) {
209 1.203 manu error = copyinstr(uaddr, kaddr, len, done);
210 1.210 ad ktrmibio(-1, UIO_WRITE, uaddr, len, error);
211 1.203 manu } else {
212 1.203 manu error = copystr(uaddr, kaddr, len, done);
213 1.203 manu }
214 1.75 thorpej
215 1.203 manu return error;
216 1.153 atatat }
217 1.153 atatat
218 1.153 atatat /*
219 1.153 atatat * ********************************************************************
220 1.153 atatat * Initialize sysctl subsystem.
221 1.153 atatat * ********************************************************************
222 1.153 atatat */
223 1.75 thorpej void
224 1.75 thorpej sysctl_init(void)
225 1.75 thorpej {
226 1.174 matt sysctl_setup_func * const *sysctl_setup, f;
227 1.153 atatat
228 1.208 ad rw_init(&sysctl_treelock);
229 1.153 atatat
230 1.153 atatat /*
231 1.153 atatat * dynamic mib numbers start here
232 1.153 atatat */
233 1.153 atatat sysctl_root.sysctl_num = CREATE_BASE;
234 1.153 atatat
235 1.153 atatat __link_set_foreach(sysctl_setup, sysctl_funcs) {
236 1.153 atatat /*
237 1.153 atatat * XXX - why do i have to coerce the pointers like this?
238 1.153 atatat */
239 1.153 atatat f = (void*)*sysctl_setup;
240 1.161 atatat (*f)(NULL);
241 1.153 atatat }
242 1.227 elad
243 1.227 elad mutex_init(&sysctl_file_marker_lock, MUTEX_DEFAULT, IPL_NONE);
244 1.226 pooka }
245 1.226 pooka
246 1.226 pooka /*
247 1.226 pooka * Setting this means no more permanent nodes can be added,
248 1.226 pooka * trees that claim to be readonly at the root now are, and if
249 1.226 pooka * the main tree is readonly, *everything* is.
250 1.226 pooka *
251 1.233 tls * Also starts up the PRNG used for the "random" sysctl: it's
252 1.233 tls * better to start it later than sooner.
253 1.233 tls *
254 1.226 pooka * Call this at the end of kernel init.
255 1.226 pooka */
256 1.226 pooka void
257 1.226 pooka sysctl_finalize(void)
258 1.226 pooka {
259 1.233 tls sysctl_prng = cprng_strong_create("sysctl", IPL_NONE,
260 1.233 tls CPRNG_INIT_ANY|CPRNG_REKEY_ANY);
261 1.161 atatat sysctl_root.sysctl_flags |= CTLFLAG_PERMANENT;
262 1.75 thorpej }
263 1.75 thorpej
264 1.153 atatat /*
265 1.153 atatat * ********************************************************************
266 1.153 atatat * The main native sysctl system call itself.
267 1.153 atatat * ********************************************************************
268 1.153 atatat */
269 1.1 cgd int
270 1.211 dsl sys___sysctl(struct lwp *l, const struct sys___sysctl_args *uap, register_t *retval)
271 1.11 thorpej {
272 1.211 dsl /* {
273 1.189 drochner syscallarg(const int *) name;
274 1.5 cgd syscallarg(u_int) namelen;
275 1.5 cgd syscallarg(void *) old;
276 1.5 cgd syscallarg(size_t *) oldlenp;
277 1.189 drochner syscallarg(const void *) new;
278 1.5 cgd syscallarg(size_t) newlen;
279 1.211 dsl } */
280 1.153 atatat int error, nerror, name[CTL_MAXNAME];
281 1.153 atatat size_t oldlen, savelen, *oldlenp;
282 1.153 atatat
283 1.153 atatat /*
284 1.153 atatat * get oldlen
285 1.153 atatat */
286 1.153 atatat oldlen = 0;
287 1.153 atatat oldlenp = SCARG(uap, oldlenp);
288 1.153 atatat if (oldlenp != NULL) {
289 1.153 atatat error = copyin(oldlenp, &oldlen, sizeof(oldlen));
290 1.153 atatat if (error)
291 1.153 atatat return (error);
292 1.153 atatat }
293 1.153 atatat savelen = oldlen;
294 1.1 cgd
295 1.1 cgd /*
296 1.153 atatat * top-level sysctl names may or may not be non-terminal, but
297 1.153 atatat * we don't care
298 1.1 cgd */
299 1.153 atatat if (SCARG(uap, namelen) > CTL_MAXNAME || SCARG(uap, namelen) < 1)
300 1.1 cgd return (EINVAL);
301 1.13 christos error = copyin(SCARG(uap, name), &name,
302 1.153 atatat SCARG(uap, namelen) * sizeof(int));
303 1.13 christos if (error)
304 1.1 cgd return (error);
305 1.1 cgd
306 1.210 ad ktrmib(name, SCARG(uap, namelen));
307 1.210 ad
308 1.213 ad sysctl_lock(SCARG(uap, new) != NULL);
309 1.52 bouyer
310 1.153 atatat /*
311 1.153 atatat * do sysctl work (NULL means main built-in default tree)
312 1.153 atatat */
313 1.153 atatat error = sysctl_dispatch(&name[0], SCARG(uap, namelen),
314 1.153 atatat SCARG(uap, old), &oldlen,
315 1.153 atatat SCARG(uap, new), SCARG(uap, newlen),
316 1.153 atatat &name[0], l, NULL);
317 1.153 atatat
318 1.153 atatat /*
319 1.153 atatat * release the sysctl lock
320 1.153 atatat */
321 1.213 ad sysctl_unlock();
322 1.104 christos
323 1.153 atatat /*
324 1.153 atatat * set caller's oldlen to new value even in the face of an
325 1.153 atatat * error (if this gets an error and they didn't have one, they
326 1.153 atatat * get this one)
327 1.153 atatat */
328 1.153 atatat if (oldlenp) {
329 1.153 atatat nerror = copyout(&oldlen, oldlenp, sizeof(oldlen));
330 1.153 atatat if (error == 0)
331 1.153 atatat error = nerror;
332 1.1 cgd }
333 1.1 cgd
334 1.75 thorpej /*
335 1.153 atatat * if the only problem is that we weren't given enough space,
336 1.153 atatat * that's an ENOMEM error
337 1.75 thorpej */
338 1.153 atatat if (error == 0 && SCARG(uap, old) != NULL && savelen < oldlen)
339 1.153 atatat error = ENOMEM;
340 1.179 perry
341 1.153 atatat return (error);
342 1.153 atatat }
343 1.153 atatat
344 1.153 atatat /*
345 1.153 atatat * ********************************************************************
346 1.153 atatat * Section 1: How the tree is used
347 1.153 atatat * ********************************************************************
348 1.153 atatat * Implementations of sysctl for emulations should typically need only
349 1.153 atatat * these three functions in this order: lock the tree, dispatch
350 1.153 atatat * request into it, unlock the tree.
351 1.153 atatat * ********************************************************************
352 1.153 atatat */
353 1.213 ad void
354 1.213 ad sysctl_lock(bool write)
355 1.153 atatat {
356 1.75 thorpej
357 1.213 ad if (write) {
358 1.213 ad rw_enter(&sysctl_treelock, RW_WRITER);
359 1.213 ad curlwp->l_pflag |= LP_SYSCTLWRITE;
360 1.213 ad } else {
361 1.213 ad rw_enter(&sysctl_treelock, RW_READER);
362 1.213 ad curlwp->l_pflag &= ~LP_SYSCTLWRITE;
363 1.213 ad }
364 1.213 ad }
365 1.153 atatat
366 1.213 ad void
367 1.213 ad sysctl_relock(void)
368 1.213 ad {
369 1.204 chs
370 1.213 ad if ((curlwp->l_pflag & LP_SYSCTLWRITE) != 0) {
371 1.213 ad rw_enter(&sysctl_treelock, RW_WRITER);
372 1.213 ad } else {
373 1.213 ad rw_enter(&sysctl_treelock, RW_READER);
374 1.1 cgd }
375 1.1 cgd }
376 1.1 cgd
377 1.1 cgd /*
378 1.153 atatat * ********************************************************************
379 1.153 atatat * the main sysctl dispatch routine. scans the given tree and picks a
380 1.153 atatat * function to call based on what it finds.
381 1.153 atatat * ********************************************************************
382 1.1 cgd */
383 1.153 atatat int
384 1.183 atatat sysctl_dispatch(SYSCTLFN_ARGS)
385 1.153 atatat {
386 1.153 atatat int error;
387 1.153 atatat sysctlfn fn;
388 1.153 atatat int ni;
389 1.75 thorpej
390 1.213 ad KASSERT(rw_lock_held(&sysctl_treelock));
391 1.213 ad
392 1.161 atatat if (rnode && SYSCTL_VERS(rnode->sysctl_flags) != SYSCTL_VERSION) {
393 1.161 atatat printf("sysctl_dispatch: rnode %p wrong version\n", rnode);
394 1.203 manu error = EINVAL;
395 1.203 manu goto out;
396 1.161 atatat }
397 1.161 atatat
398 1.153 atatat fn = NULL;
399 1.153 atatat error = sysctl_locate(l, name, namelen, &rnode, &ni);
400 1.75 thorpej
401 1.188 yamt if (rnode->sysctl_func != NULL) {
402 1.188 yamt /*
403 1.188 yamt * the node we ended up at has a function, so call it. it can
404 1.188 yamt * hand off to query or create if it wants to.
405 1.188 yamt */
406 1.153 atatat fn = rnode->sysctl_func;
407 1.188 yamt } else if (error == 0) {
408 1.188 yamt /*
409 1.188 yamt * we found the node they were looking for, so do a lookup.
410 1.188 yamt */
411 1.153 atatat fn = (sysctlfn)sysctl_lookup; /* XXX may write to rnode */
412 1.188 yamt } else if (error == ENOENT && (ni + 1) == namelen && name[ni] < 0) {
413 1.188 yamt /*
414 1.188 yamt * prospective parent node found, but the terminal node was
415 1.188 yamt * not. generic operations associate with the parent.
416 1.188 yamt */
417 1.153 atatat switch (name[ni]) {
418 1.153 atatat case CTL_QUERY:
419 1.153 atatat fn = sysctl_query;
420 1.153 atatat break;
421 1.153 atatat case CTL_CREATE:
422 1.153 atatat #if NKSYMS > 0
423 1.153 atatat case CTL_CREATESYM:
424 1.153 atatat #endif /* NKSYMS > 0 */
425 1.213 ad if (newp == NULL) {
426 1.213 ad error = EINVAL;
427 1.213 ad break;
428 1.213 ad }
429 1.213 ad KASSERT(rw_write_held(&sysctl_treelock));
430 1.153 atatat fn = (sysctlfn)sysctl_create; /* we own the rnode */
431 1.153 atatat break;
432 1.153 atatat case CTL_DESTROY:
433 1.213 ad if (newp == NULL) {
434 1.213 ad error = EINVAL;
435 1.213 ad break;
436 1.213 ad }
437 1.213 ad KASSERT(rw_write_held(&sysctl_treelock));
438 1.153 atatat fn = (sysctlfn)sysctl_destroy; /* we own the rnode */
439 1.153 atatat break;
440 1.153 atatat case CTL_MMAP:
441 1.153 atatat fn = (sysctlfn)sysctl_mmap; /* we own the rnode */
442 1.153 atatat break;
443 1.165 atatat case CTL_DESCRIBE:
444 1.165 atatat fn = sysctl_describe;
445 1.165 atatat break;
446 1.153 atatat default:
447 1.153 atatat error = EOPNOTSUPP;
448 1.153 atatat break;
449 1.153 atatat }
450 1.153 atatat }
451 1.75 thorpej
452 1.153 atatat /*
453 1.153 atatat * after all of that, maybe we found someone who knows how to
454 1.153 atatat * get us what we want?
455 1.153 atatat */
456 1.153 atatat if (fn != NULL)
457 1.153 atatat error = (*fn)(name + ni, namelen - ni, oldp, oldlenp,
458 1.153 atatat newp, newlen, name, l, rnode);
459 1.153 atatat else if (error == 0)
460 1.153 atatat error = EOPNOTSUPP;
461 1.84 sommerfe
462 1.203 manu out:
463 1.153 atatat return (error);
464 1.153 atatat }
465 1.83 sommerfe
466 1.153 atatat /*
467 1.153 atatat * ********************************************************************
468 1.213 ad * Releases the tree lock.
469 1.153 atatat * ********************************************************************
470 1.153 atatat */
471 1.153 atatat void
472 1.213 ad sysctl_unlock(void)
473 1.83 sommerfe {
474 1.84 sommerfe
475 1.213 ad rw_exit(&sysctl_treelock);
476 1.84 sommerfe }
477 1.84 sommerfe
478 1.153 atatat /*
479 1.153 atatat * ********************************************************************
480 1.153 atatat * Section 2: The main tree interfaces
481 1.153 atatat * ********************************************************************
482 1.153 atatat * This is how sysctl_dispatch() does its work, and you can too, by
483 1.153 atatat * calling these routines from helpers (though typically only
484 1.153 atatat * sysctl_lookup() will be used). The tree MUST BE LOCKED when these
485 1.153 atatat * are called.
486 1.153 atatat * ********************************************************************
487 1.153 atatat */
488 1.83 sommerfe
489 1.1 cgd /*
490 1.153 atatat * sysctl_locate -- Finds the node matching the given mib under the
491 1.153 atatat * given tree (via rv). If no tree is given, we fall back to the
492 1.153 atatat * native tree. The current process (via l) is used for access
493 1.156 atatat * control on the tree (some nodes may be traversable only by root) and
494 1.153 atatat * on return, nip will show how many numbers in the mib were consumed.
495 1.1 cgd */
496 1.13 christos int
497 1.153 atatat sysctl_locate(struct lwp *l, const int *name, u_int namelen,
498 1.183 atatat const struct sysctlnode **rnode, int *nip)
499 1.1 cgd {
500 1.183 atatat const struct sysctlnode *node, *pnode;
501 1.153 atatat int tn, si, ni, error, alias;
502 1.153 atatat
503 1.213 ad KASSERT(rw_lock_held(&sysctl_treelock));
504 1.213 ad
505 1.153 atatat /*
506 1.153 atatat * basic checks and setup
507 1.153 atatat */
508 1.158 atatat if (*rnode == NULL)
509 1.158 atatat *rnode = &sysctl_root;
510 1.153 atatat if (nip)
511 1.153 atatat *nip = 0;
512 1.153 atatat if (namelen == 0)
513 1.153 atatat return (0);
514 1.1 cgd
515 1.153 atatat /*
516 1.153 atatat * search starts from "root"
517 1.153 atatat */
518 1.158 atatat pnode = *rnode;
519 1.161 atatat if (SYSCTL_VERS(pnode->sysctl_flags) != SYSCTL_VERSION) {
520 1.161 atatat printf("sysctl_locate: pnode %p wrong version\n", pnode);
521 1.161 atatat return (EINVAL);
522 1.161 atatat }
523 1.153 atatat node = pnode->sysctl_child;
524 1.153 atatat error = 0;
525 1.1 cgd
526 1.153 atatat /*
527 1.153 atatat * scan for node to which new node should be attached
528 1.153 atatat */
529 1.153 atatat for (ni = 0; ni < namelen; ni++) {
530 1.153 atatat /*
531 1.153 atatat * walked off bottom of tree
532 1.153 atatat */
533 1.153 atatat if (node == NULL) {
534 1.153 atatat if (SYSCTL_TYPE(pnode->sysctl_flags) == CTLTYPE_NODE)
535 1.153 atatat error = ENOENT;
536 1.153 atatat else
537 1.153 atatat error = ENOTDIR;
538 1.153 atatat break;
539 1.153 atatat }
540 1.153 atatat /*
541 1.153 atatat * can anyone traverse this node or only root?
542 1.153 atatat */
543 1.161 atatat if (l != NULL && (pnode->sysctl_flags & CTLFLAG_PRIVATE) &&
544 1.202 elad (error = kauth_authorize_system(l->l_cred,
545 1.202 elad KAUTH_SYSTEM_SYSCTL, KAUTH_REQ_SYSTEM_SYSCTL_PRVT,
546 1.202 elad NULL, NULL, NULL)) != 0)
547 1.153 atatat return (error);
548 1.153 atatat /*
549 1.153 atatat * find a child node with the right number
550 1.153 atatat */
551 1.153 atatat tn = name[ni];
552 1.153 atatat alias = 0;
553 1.159 atatat
554 1.159 atatat si = 0;
555 1.159 atatat /*
556 1.159 atatat * Note: ANYNUMBER only matches positive integers.
557 1.159 atatat * Since ANYNUMBER is only permitted on single-node
558 1.159 atatat * sub-trees (eg proc), check before the loop and skip
559 1.159 atatat * it if we can.
560 1.159 atatat */
561 1.161 atatat if ((node[si].sysctl_flags & CTLFLAG_ANYNUMBER) && (tn >= 0))
562 1.159 atatat goto foundit;
563 1.159 atatat for (; si < pnode->sysctl_clen; si++) {
564 1.159 atatat if (node[si].sysctl_num == tn) {
565 1.161 atatat if (node[si].sysctl_flags & CTLFLAG_ALIAS) {
566 1.153 atatat if (alias++ == 4)
567 1.159 atatat break;
568 1.153 atatat else {
569 1.153 atatat tn = node[si].sysctl_alias;
570 1.153 atatat si = -1;
571 1.153 atatat }
572 1.188 yamt } else
573 1.159 atatat goto foundit;
574 1.99 lukem }
575 1.29 sommerfe }
576 1.153 atatat /*
577 1.153 atatat * if we ran off the end, it obviously doesn't exist
578 1.153 atatat */
579 1.159 atatat error = ENOENT;
580 1.159 atatat break;
581 1.159 atatat
582 1.153 atatat /*
583 1.153 atatat * so far so good, move on down the line
584 1.153 atatat */
585 1.159 atatat foundit:
586 1.153 atatat pnode = &node[si];
587 1.153 atatat if (SYSCTL_TYPE(pnode->sysctl_flags) == CTLTYPE_NODE)
588 1.153 atatat node = node[si].sysctl_child;
589 1.153 atatat else
590 1.153 atatat node = NULL;
591 1.153 atatat }
592 1.153 atatat
593 1.158 atatat *rnode = pnode;
594 1.153 atatat if (nip)
595 1.153 atatat *nip = ni;
596 1.153 atatat
597 1.153 atatat return (error);
598 1.153 atatat }
599 1.153 atatat
600 1.153 atatat /*
601 1.165 atatat * sysctl_query -- The auto-discovery engine. Copies out the structs
602 1.165 atatat * describing nodes under the given node and handles overlay trees.
603 1.153 atatat */
604 1.153 atatat int
605 1.153 atatat sysctl_query(SYSCTLFN_ARGS)
606 1.153 atatat {
607 1.162 atatat int error, ni, elim, v;
608 1.153 atatat size_t out, left, t;
609 1.183 atatat const struct sysctlnode *enode, *onode;
610 1.183 atatat struct sysctlnode qnode;
611 1.121 jdolecek
612 1.213 ad KASSERT(rw_lock_held(&sysctl_treelock));
613 1.213 ad
614 1.161 atatat if (SYSCTL_VERS(rnode->sysctl_flags) != SYSCTL_VERSION) {
615 1.161 atatat printf("sysctl_query: rnode %p wrong version\n", rnode);
616 1.161 atatat return (EINVAL);
617 1.161 atatat }
618 1.161 atatat
619 1.153 atatat if (SYSCTL_TYPE(rnode->sysctl_flags) != CTLTYPE_NODE)
620 1.153 atatat return (ENOTDIR);
621 1.153 atatat if (namelen != 1 || name[0] != CTL_QUERY)
622 1.153 atatat return (EINVAL);
623 1.121 jdolecek
624 1.153 atatat error = 0;
625 1.153 atatat out = 0;
626 1.153 atatat left = *oldlenp;
627 1.153 atatat elim = 0;
628 1.153 atatat enode = NULL;
629 1.121 jdolecek
630 1.153 atatat /*
631 1.162 atatat * translate the given request to a current node
632 1.162 atatat */
633 1.162 atatat error = sysctl_cvt_in(l, &v, newp, newlen, &qnode);
634 1.162 atatat if (error)
635 1.162 atatat return (error);
636 1.162 atatat
637 1.162 atatat /*
638 1.162 atatat * if the request specifies a version, check it
639 1.162 atatat */
640 1.162 atatat if (qnode.sysctl_ver != 0) {
641 1.183 atatat enode = rnode;
642 1.162 atatat if (qnode.sysctl_ver != enode->sysctl_ver &&
643 1.162 atatat qnode.sysctl_ver != sysctl_rootof(enode)->sysctl_ver)
644 1.162 atatat return (EINVAL);
645 1.162 atatat }
646 1.162 atatat
647 1.162 atatat /*
648 1.153 atatat * process has overlay tree
649 1.153 atatat */
650 1.153 atatat if (l && l->l_proc->p_emul->e_sysctlovly) {
651 1.161 atatat enode = l->l_proc->p_emul->e_sysctlovly;
652 1.153 atatat elim = (name - oname);
653 1.153 atatat error = sysctl_locate(l, oname, elim, &enode, NULL);
654 1.153 atatat if (error == 0) {
655 1.153 atatat /* ah, found parent in overlay */
656 1.153 atatat elim = enode->sysctl_clen;
657 1.153 atatat enode = enode->sysctl_child;
658 1.188 yamt } else {
659 1.153 atatat error = 0;
660 1.153 atatat elim = 0;
661 1.153 atatat enode = NULL;
662 1.121 jdolecek }
663 1.153 atatat }
664 1.121 jdolecek
665 1.153 atatat for (ni = 0; ni < rnode->sysctl_clen; ni++) {
666 1.153 atatat onode = &rnode->sysctl_child[ni];
667 1.153 atatat if (enode && enode->sysctl_num == onode->sysctl_num) {
668 1.161 atatat if (SYSCTL_TYPE(enode->sysctl_flags) != CTLTYPE_NODE)
669 1.153 atatat onode = enode;
670 1.153 atatat if (--elim > 0)
671 1.153 atatat enode++;
672 1.153 atatat else
673 1.153 atatat enode = NULL;
674 1.153 atatat }
675 1.162 atatat error = sysctl_cvt_out(l, v, onode, oldp, left, &t);
676 1.153 atatat if (error)
677 1.1 cgd return (error);
678 1.162 atatat if (oldp != NULL)
679 1.162 atatat oldp = (char*)oldp + t;
680 1.162 atatat out += t;
681 1.162 atatat left -= MIN(left, t);
682 1.153 atatat }
683 1.153 atatat
684 1.153 atatat /*
685 1.153 atatat * overlay trees *MUST* be entirely consumed
686 1.153 atatat */
687 1.153 atatat KASSERT(enode == NULL);
688 1.153 atatat
689 1.153 atatat *oldlenp = out;
690 1.153 atatat
691 1.153 atatat return (error);
692 1.153 atatat }
693 1.153 atatat
694 1.153 atatat /*
695 1.153 atatat * sysctl_create -- Adds a node (the description of which is taken
696 1.153 atatat * from newp) to the tree, returning a copy of it in the space pointed
697 1.153 atatat * to by oldp. In the event that the requested slot is already taken
698 1.153 atatat * (either by name or by number), the offending node is returned
699 1.153 atatat * instead. Yes, this is complex, but we want to make sure everything
700 1.153 atatat * is proper.
701 1.153 atatat */
702 1.200 christos #ifdef SYSCTL_DEBUG_CREATE
703 1.200 christos int _sysctl_create(SYSCTLFN_ARGS);
704 1.200 christos int
705 1.200 christos _sysctl_create(SYSCTLFN_ARGS)
706 1.200 christos #else
707 1.153 atatat int
708 1.183 atatat sysctl_create(SYSCTLFN_ARGS)
709 1.200 christos #endif
710 1.153 atatat {
711 1.153 atatat struct sysctlnode nnode, *node, *pnode;
712 1.225 dyoung int error, ni, at, nm, type, nsz, sz, flags, anum, v;
713 1.153 atatat void *own;
714 1.153 atatat
715 1.213 ad KASSERT(rw_write_held(&sysctl_treelock));
716 1.213 ad
717 1.153 atatat error = 0;
718 1.153 atatat own = NULL;
719 1.153 atatat anum = -1;
720 1.153 atatat
721 1.161 atatat if (SYSCTL_VERS(rnode->sysctl_flags) != SYSCTL_VERSION) {
722 1.161 atatat printf("sysctl_create: rnode %p wrong version\n", rnode);
723 1.161 atatat return (EINVAL);
724 1.161 atatat }
725 1.161 atatat
726 1.153 atatat if (namelen != 1 || (name[namelen - 1] != CTL_CREATE
727 1.153 atatat #if NKSYMS > 0
728 1.153 atatat && name[namelen - 1] != CTL_CREATESYM
729 1.153 atatat #endif /* NKSYMS > 0 */
730 1.153 atatat ))
731 1.153 atatat return (EINVAL);
732 1.153 atatat
733 1.153 atatat /*
734 1.153 atatat * processes can only add nodes at securelevel 0, must be
735 1.153 atatat * root, and can't add nodes to a parent that's not writeable
736 1.153 atatat */
737 1.153 atatat if (l != NULL) {
738 1.156 atatat #ifndef SYSCTL_DISALLOW_CREATE
739 1.202 elad error = kauth_authorize_system(l->l_cred, KAUTH_SYSTEM_SYSCTL,
740 1.202 elad KAUTH_REQ_SYSTEM_SYSCTL_ADD, NULL, NULL, NULL);
741 1.153 atatat if (error)
742 1.153 atatat return (error);
743 1.161 atatat if (!(rnode->sysctl_flags & CTLFLAG_READWRITE))
744 1.153 atatat #endif /* SYSCTL_DISALLOW_CREATE */
745 1.1 cgd return (EPERM);
746 1.153 atatat }
747 1.153 atatat
748 1.153 atatat /*
749 1.153 atatat * nothing can add a node if:
750 1.220 pgoyette * we've finished initial set up of this tree and
751 1.220 pgoyette * (the tree itself is not writeable or
752 1.220 pgoyette * the entire sysctl system is not writeable)
753 1.153 atatat */
754 1.220 pgoyette if ((sysctl_rootof(rnode)->sysctl_flags & CTLFLAG_PERMANENT) &&
755 1.161 atatat (!(sysctl_rootof(rnode)->sysctl_flags & CTLFLAG_READWRITE) ||
756 1.161 atatat !(sysctl_root.sysctl_flags & CTLFLAG_READWRITE)))
757 1.153 atatat return (EPERM);
758 1.120 jdolecek
759 1.153 atatat /*
760 1.153 atatat * it must be a "node", not a "int" or something
761 1.153 atatat */
762 1.153 atatat if (SYSCTL_TYPE(rnode->sysctl_flags) != CTLTYPE_NODE)
763 1.153 atatat return (ENOTDIR);
764 1.169 atatat if (rnode->sysctl_flags & CTLFLAG_ALIAS) {
765 1.169 atatat printf("sysctl_create: attempt to add node to aliased "
766 1.169 atatat "node %p\n", rnode);
767 1.169 atatat return (EINVAL);
768 1.169 atatat }
769 1.183 atatat pnode = __UNCONST(rnode); /* we are adding children to this node */
770 1.120 jdolecek
771 1.162 atatat if (newp == NULL)
772 1.153 atatat return (EINVAL);
773 1.162 atatat error = sysctl_cvt_in(l, &v, newp, newlen, &nnode);
774 1.153 atatat if (error)
775 1.120 jdolecek return (error);
776 1.120 jdolecek
777 1.153 atatat /*
778 1.153 atatat * nodes passed in don't *have* parents
779 1.153 atatat */
780 1.153 atatat if (nnode.sysctl_parent != NULL)
781 1.153 atatat return (EINVAL);
782 1.145 dsl
783 1.153 atatat /*
784 1.153 atatat * if we are indeed adding it, it should be a "good" name and
785 1.153 atatat * number
786 1.153 atatat */
787 1.153 atatat nm = nnode.sysctl_num;
788 1.153 atatat #if NKSYMS > 0
789 1.153 atatat if (nm == CTL_CREATESYM)
790 1.153 atatat nm = CTL_CREATE;
791 1.153 atatat #endif /* NKSYMS > 0 */
792 1.153 atatat if (nm < 0 && nm != CTL_CREATE)
793 1.153 atatat return (EINVAL);
794 1.1 cgd
795 1.153 atatat /*
796 1.153 atatat * the name can't start with a digit
797 1.153 atatat */
798 1.225 dyoung if (nnode.sysctl_name[0] >= '0' &&
799 1.225 dyoung nnode.sysctl_name[0] <= '9')
800 1.153 atatat return (EINVAL);
801 1.1 cgd
802 1.153 atatat /*
803 1.153 atatat * the name must be only alphanumerics or - or _, longer than
804 1.153 atatat * 0 bytes and less than SYSCTL_NAMELEN
805 1.153 atatat */
806 1.225 dyoung nsz = 0;
807 1.225 dyoung while (nsz < SYSCTL_NAMELEN && nnode.sysctl_name[nsz] != '\0') {
808 1.225 dyoung if ((nnode.sysctl_name[nsz] >= '0' &&
809 1.225 dyoung nnode.sysctl_name[nsz] <= '9') ||
810 1.225 dyoung (nnode.sysctl_name[nsz] >= 'A' &&
811 1.225 dyoung nnode.sysctl_name[nsz] <= 'Z') ||
812 1.225 dyoung (nnode.sysctl_name[nsz] >= 'a' &&
813 1.225 dyoung nnode.sysctl_name[nsz] <= 'z') ||
814 1.225 dyoung nnode.sysctl_name[nsz] == '-' ||
815 1.225 dyoung nnode.sysctl_name[nsz] == '_')
816 1.225 dyoung nsz++;
817 1.153 atatat else
818 1.153 atatat return (EINVAL);
819 1.98 simonb }
820 1.225 dyoung if (nsz == 0 || nsz == SYSCTL_NAMELEN)
821 1.153 atatat return (EINVAL);
822 1.1 cgd
823 1.153 atatat /*
824 1.153 atatat * various checks revolve around size vs type, etc
825 1.153 atatat */
826 1.153 atatat type = SYSCTL_TYPE(nnode.sysctl_flags);
827 1.153 atatat flags = SYSCTL_FLAGS(nnode.sysctl_flags);
828 1.153 atatat sz = nnode.sysctl_size;
829 1.131 thorpej
830 1.153 atatat /*
831 1.153 atatat * find out if there's a collision, and if so, let the caller
832 1.153 atatat * know what they collided with
833 1.153 atatat */
834 1.153 atatat node = pnode->sysctl_child;
835 1.193 dsl at = 0;
836 1.193 dsl if (node) {
837 1.193 dsl if ((flags | node->sysctl_flags) & CTLFLAG_ANYNUMBER)
838 1.193 dsl /* No siblings for a CTLFLAG_ANYNUMBER node */
839 1.193 dsl return EINVAL;
840 1.193 dsl for (ni = 0; ni < pnode->sysctl_clen; ni++) {
841 1.193 dsl if (nm == node[ni].sysctl_num ||
842 1.193 dsl strcmp(nnode.sysctl_name, node[ni].sysctl_name) == 0) {
843 1.193 dsl /*
844 1.193 dsl * ignore error here, since we
845 1.193 dsl * are already fixed on EEXIST
846 1.193 dsl */
847 1.193 dsl (void)sysctl_cvt_out(l, v, &node[ni], oldp,
848 1.193 dsl *oldlenp, oldlenp);
849 1.193 dsl return (EEXIST);
850 1.193 dsl }
851 1.193 dsl if (nm > node[ni].sysctl_num)
852 1.193 dsl at++;
853 1.82 eeh }
854 1.1 cgd }
855 1.1 cgd
856 1.153 atatat /*
857 1.153 atatat * use sysctl_ver to add to the tree iff it hasn't changed
858 1.153 atatat */
859 1.153 atatat if (nnode.sysctl_ver != 0) {
860 1.153 atatat /*
861 1.153 atatat * a specified value must match either the parent
862 1.153 atatat * node's version or the root node's version
863 1.153 atatat */
864 1.153 atatat if (nnode.sysctl_ver != sysctl_rootof(rnode)->sysctl_ver &&
865 1.153 atatat nnode.sysctl_ver != rnode->sysctl_ver) {
866 1.153 atatat return (EINVAL);
867 1.153 atatat }
868 1.1 cgd }
869 1.1 cgd
870 1.153 atatat /*
871 1.153 atatat * only the kernel can assign functions to entries
872 1.153 atatat */
873 1.153 atatat if (l != NULL && nnode.sysctl_func != NULL)
874 1.153 atatat return (EPERM);
875 1.52 bouyer
876 1.153 atatat /*
877 1.153 atatat * only the kernel can create permanent entries, and only then
878 1.153 atatat * before the kernel is finished setting itself up
879 1.153 atatat */
880 1.153 atatat if (l != NULL && (flags & ~SYSCTL_USERFLAGS))
881 1.153 atatat return (EPERM);
882 1.161 atatat if ((flags & CTLFLAG_PERMANENT) &
883 1.161 atatat (sysctl_root.sysctl_flags & CTLFLAG_PERMANENT))
884 1.153 atatat return (EPERM);
885 1.179 perry if ((flags & (CTLFLAG_OWNDATA | CTLFLAG_IMMEDIATE)) ==
886 1.161 atatat (CTLFLAG_OWNDATA | CTLFLAG_IMMEDIATE))
887 1.153 atatat return (EINVAL);
888 1.161 atatat if ((flags & CTLFLAG_IMMEDIATE) &&
889 1.215 matt type != CTLTYPE_INT && type != CTLTYPE_QUAD && type != CTLTYPE_BOOL)
890 1.129 enami return (EINVAL);
891 1.52 bouyer
892 1.153 atatat /*
893 1.153 atatat * check size, or set it if unset and we can figure it out.
894 1.153 atatat * kernel created nodes are allowed to have a function instead
895 1.153 atatat * of a size (or a data pointer).
896 1.153 atatat */
897 1.153 atatat switch (type) {
898 1.153 atatat case CTLTYPE_NODE:
899 1.153 atatat /*
900 1.153 atatat * only *i* can assert the size of a node
901 1.153 atatat */
902 1.161 atatat if (flags & CTLFLAG_ALIAS) {
903 1.153 atatat anum = nnode.sysctl_alias;
904 1.153 atatat if (anum < 0)
905 1.153 atatat return (EINVAL);
906 1.153 atatat nnode.sysctl_alias = 0;
907 1.52 bouyer }
908 1.153 atatat if (sz != 0 || nnode.sysctl_data != NULL)
909 1.153 atatat return (EINVAL);
910 1.153 atatat if (nnode.sysctl_csize != 0 ||
911 1.153 atatat nnode.sysctl_clen != 0 ||
912 1.153 atatat nnode.sysctl_child != 0)
913 1.129 enami return (EINVAL);
914 1.161 atatat if (flags & CTLFLAG_OWNDATA)
915 1.129 enami return (EINVAL);
916 1.153 atatat sz = sizeof(struct sysctlnode);
917 1.153 atatat break;
918 1.153 atatat case CTLTYPE_INT:
919 1.153 atatat /*
920 1.153 atatat * since an int is an int, if the size is not given or
921 1.153 atatat * is wrong, we can "int-uit" it.
922 1.153 atatat */
923 1.153 atatat if (sz != 0 && sz != sizeof(int))
924 1.129 enami return (EINVAL);
925 1.153 atatat sz = sizeof(int);
926 1.153 atatat break;
927 1.153 atatat case CTLTYPE_STRING:
928 1.52 bouyer /*
929 1.153 atatat * strings are a little more tricky
930 1.52 bouyer */
931 1.153 atatat if (sz == 0) {
932 1.153 atatat if (l == NULL) {
933 1.153 atatat if (nnode.sysctl_func == NULL) {
934 1.153 atatat if (nnode.sysctl_data == NULL)
935 1.153 atatat return (EINVAL);
936 1.153 atatat else
937 1.153 atatat sz = strlen(nnode.sysctl_data) +
938 1.153 atatat 1;
939 1.52 bouyer }
940 1.188 yamt } else if (nnode.sysctl_data == NULL &&
941 1.161 atatat flags & CTLFLAG_OWNDATA) {
942 1.153 atatat return (EINVAL);
943 1.188 yamt } else {
944 1.181 scw char *vp, *e;
945 1.153 atatat size_t s;
946 1.153 atatat
947 1.153 atatat /*
948 1.156 atatat * we want a rough idea of what the
949 1.156 atatat * size is now
950 1.153 atatat */
951 1.181 scw vp = malloc(PAGE_SIZE, M_SYSCTLDATA,
952 1.181 scw M_WAITOK|M_CANFAIL);
953 1.181 scw if (vp == NULL)
954 1.181 scw return (ENOMEM);
955 1.156 atatat e = nnode.sysctl_data;
956 1.156 atatat do {
957 1.181 scw error = copyinstr(e, vp, PAGE_SIZE, &s);
958 1.156 atatat if (error) {
959 1.181 scw if (error != ENAMETOOLONG) {
960 1.181 scw free(vp, M_SYSCTLDATA);
961 1.156 atatat return (error);
962 1.181 scw }
963 1.156 atatat e += PAGE_SIZE;
964 1.156 atatat if ((e - 32 * PAGE_SIZE) >
965 1.181 scw (char*)nnode.sysctl_data) {
966 1.181 scw free(vp, M_SYSCTLDATA);
967 1.156 atatat return (ERANGE);
968 1.181 scw }
969 1.156 atatat }
970 1.156 atatat } while (error != 0);
971 1.156 atatat sz = s + (e - (char*)nnode.sysctl_data);
972 1.181 scw free(vp, M_SYSCTLDATA);
973 1.96 bouyer }
974 1.52 bouyer }
975 1.153 atatat break;
976 1.153 atatat case CTLTYPE_QUAD:
977 1.153 atatat if (sz != 0 && sz != sizeof(u_quad_t))
978 1.129 enami return (EINVAL);
979 1.153 atatat sz = sizeof(u_quad_t);
980 1.153 atatat break;
981 1.215 matt case CTLTYPE_BOOL:
982 1.215 matt /*
983 1.215 matt * since a bool is a bool, if the size is not given or
984 1.215 matt * is wrong, we can "intuit" it.
985 1.215 matt */
986 1.215 matt if (sz != 0 && sz != sizeof(bool))
987 1.215 matt return (EINVAL);
988 1.215 matt sz = sizeof(bool);
989 1.215 matt break;
990 1.153 atatat case CTLTYPE_STRUCT:
991 1.153 atatat if (sz == 0) {
992 1.153 atatat if (l != NULL || nnode.sysctl_func == NULL)
993 1.153 atatat return (EINVAL);
994 1.161 atatat if (flags & CTLFLAG_OWNDATA)
995 1.153 atatat return (EINVAL);
996 1.153 atatat }
997 1.153 atatat break;
998 1.115 manu default:
999 1.115 manu return (EINVAL);
1000 1.52 bouyer }
1001 1.52 bouyer
1002 1.153 atatat /*
1003 1.153 atatat * at this point, if sz is zero, we *must* have a
1004 1.153 atatat * function to go with it and we can't own it.
1005 1.153 atatat */
1006 1.104 christos
1007 1.153 atatat /*
1008 1.153 atatat * l ptr own
1009 1.153 atatat * 0 0 0 -> EINVAL (if no func)
1010 1.153 atatat * 0 0 1 -> own
1011 1.153 atatat * 0 1 0 -> kptr
1012 1.153 atatat * 0 1 1 -> kptr
1013 1.153 atatat * 1 0 0 -> EINVAL
1014 1.153 atatat * 1 0 1 -> own
1015 1.156 atatat * 1 1 0 -> kptr, no own (fault on lookup)
1016 1.153 atatat * 1 1 1 -> uptr, own
1017 1.153 atatat */
1018 1.153 atatat if (type != CTLTYPE_NODE) {
1019 1.153 atatat if (sz != 0) {
1020 1.161 atatat if (flags & CTLFLAG_OWNDATA) {
1021 1.153 atatat own = malloc(sz, M_SYSCTLDATA,
1022 1.153 atatat M_WAITOK|M_CANFAIL);
1023 1.194 dsl if (own == NULL)
1024 1.194 dsl return ENOMEM;
1025 1.153 atatat if (nnode.sysctl_data == NULL)
1026 1.153 atatat memset(own, 0, sz);
1027 1.153 atatat else {
1028 1.153 atatat error = sysctl_copyin(l,
1029 1.153 atatat nnode.sysctl_data, own, sz);
1030 1.153 atatat if (error != 0) {
1031 1.187 yamt free(own, M_SYSCTLDATA);
1032 1.153 atatat return (error);
1033 1.153 atatat }
1034 1.153 atatat }
1035 1.188 yamt } else if ((nnode.sysctl_data != NULL) &&
1036 1.161 atatat !(flags & CTLFLAG_IMMEDIATE)) {
1037 1.153 atatat #if NKSYMS > 0
1038 1.153 atatat if (name[namelen - 1] == CTL_CREATESYM) {
1039 1.153 atatat char symname[128]; /* XXX enough? */
1040 1.153 atatat u_long symaddr;
1041 1.153 atatat size_t symlen;
1042 1.153 atatat
1043 1.153 atatat error = sysctl_copyinstr(l,
1044 1.153 atatat nnode.sysctl_data, symname,
1045 1.153 atatat sizeof(symname), &symlen);
1046 1.153 atatat if (error)
1047 1.153 atatat return (error);
1048 1.177 elric error = ksyms_getval(NULL, symname,
1049 1.177 elric &symaddr, KSYMS_EXTERN);
1050 1.153 atatat if (error)
1051 1.153 atatat return (error); /* EINVAL? */
1052 1.153 atatat nnode.sysctl_data = (void*)symaddr;
1053 1.153 atatat }
1054 1.153 atatat #endif /* NKSYMS > 0 */
1055 1.156 atatat /*
1056 1.156 atatat * Ideally, we'd like to verify here
1057 1.156 atatat * that this address is acceptable,
1058 1.156 atatat * but...
1059 1.156 atatat *
1060 1.156 atatat * - it might be valid now, only to
1061 1.156 atatat * become invalid later
1062 1.156 atatat *
1063 1.156 atatat * - it might be invalid only for the
1064 1.156 atatat * moment and valid later
1065 1.156 atatat *
1066 1.156 atatat * - or something else.
1067 1.156 atatat *
1068 1.156 atatat * Since we can't get a good answer,
1069 1.156 atatat * we'll just accept the address as
1070 1.156 atatat * given, and fault on individual
1071 1.156 atatat * lookups.
1072 1.156 atatat */
1073 1.153 atatat }
1074 1.188 yamt } else if (nnode.sysctl_func == NULL)
1075 1.153 atatat return (EINVAL);
1076 1.153 atatat }
1077 1.104 christos
1078 1.153 atatat /*
1079 1.153 atatat * a process can't assign a function to a node, and the kernel
1080 1.153 atatat * can't create a node that has no function or data.
1081 1.153 atatat * (XXX somewhat redundant check)
1082 1.153 atatat */
1083 1.153 atatat if (l != NULL || nnode.sysctl_func == NULL) {
1084 1.153 atatat if (type != CTLTYPE_NODE &&
1085 1.153 atatat nnode.sysctl_data == NULL &&
1086 1.161 atatat !(flags & CTLFLAG_IMMEDIATE) &&
1087 1.153 atatat own == NULL)
1088 1.153 atatat return (EINVAL);
1089 1.153 atatat }
1090 1.104 christos
1091 1.153 atatat #ifdef SYSCTL_DISALLOW_KWRITE
1092 1.153 atatat /*
1093 1.153 atatat * a process can't create a writable node unless it refers to
1094 1.153 atatat * new data.
1095 1.153 atatat */
1096 1.153 atatat if (l != NULL && own == NULL && type != CTLTYPE_NODE &&
1097 1.161 atatat (flags & CTLFLAG_READWRITE) != CTLFLAG_READONLY &&
1098 1.161 atatat !(flags & CTLFLAG_IMMEDIATE))
1099 1.153 atatat return (EPERM);
1100 1.153 atatat #endif /* SYSCTL_DISALLOW_KWRITE */
1101 1.104 christos
1102 1.153 atatat /*
1103 1.153 atatat * make sure there's somewhere to put the new stuff.
1104 1.153 atatat */
1105 1.153 atatat if (pnode->sysctl_child == NULL) {
1106 1.161 atatat if (flags & CTLFLAG_ANYNUMBER)
1107 1.153 atatat error = sysctl_alloc(pnode, 1);
1108 1.153 atatat else
1109 1.153 atatat error = sysctl_alloc(pnode, 0);
1110 1.194 dsl if (error) {
1111 1.194 dsl if (own != NULL)
1112 1.194 dsl free(own, M_SYSCTLDATA);
1113 1.153 atatat return (error);
1114 1.194 dsl }
1115 1.153 atatat }
1116 1.153 atatat node = pnode->sysctl_child;
1117 1.105 jdolecek
1118 1.153 atatat /*
1119 1.153 atatat * no collisions, so pick a good dynamic number if we need to.
1120 1.153 atatat */
1121 1.153 atatat if (nm == CTL_CREATE) {
1122 1.153 atatat nm = ++sysctl_root.sysctl_num;
1123 1.153 atatat for (ni = 0; ni < pnode->sysctl_clen; ni++) {
1124 1.153 atatat if (nm == node[ni].sysctl_num) {
1125 1.153 atatat nm++;
1126 1.153 atatat ni = -1;
1127 1.188 yamt } else if (nm > node[ni].sysctl_num)
1128 1.153 atatat at = ni + 1;
1129 1.153 atatat }
1130 1.104 christos }
1131 1.104 christos
1132 1.153 atatat /*
1133 1.153 atatat * oops...ran out of space
1134 1.153 atatat */
1135 1.153 atatat if (pnode->sysctl_clen == pnode->sysctl_csize) {
1136 1.153 atatat error = sysctl_realloc(pnode);
1137 1.194 dsl if (error) {
1138 1.194 dsl if (own != NULL)
1139 1.194 dsl free(own, M_SYSCTLDATA);
1140 1.153 atatat return (error);
1141 1.194 dsl }
1142 1.153 atatat node = pnode->sysctl_child;
1143 1.55 is }
1144 1.55 is
1145 1.153 atatat /*
1146 1.153 atatat * insert new node data
1147 1.153 atatat */
1148 1.153 atatat if (at < pnode->sysctl_clen) {
1149 1.153 atatat int t;
1150 1.179 perry
1151 1.153 atatat /*
1152 1.153 atatat * move the nodes that should come after the new one
1153 1.153 atatat */
1154 1.153 atatat memmove(&node[at + 1], &node[at],
1155 1.153 atatat (pnode->sysctl_clen - at) * sizeof(struct sysctlnode));
1156 1.153 atatat memset(&node[at], 0, sizeof(struct sysctlnode));
1157 1.153 atatat node[at].sysctl_parent = pnode;
1158 1.153 atatat /*
1159 1.153 atatat * and...reparent any children of any moved nodes
1160 1.153 atatat */
1161 1.153 atatat for (ni = at; ni <= pnode->sysctl_clen; ni++)
1162 1.223 dyoung if (node[ni].sysctl_child != NULL)
1163 1.223 dyoung for (t = 0; t < node[ni].sysctl_csize; t++)
1164 1.153 atatat node[ni].sysctl_child[t].sysctl_parent =
1165 1.153 atatat &node[ni];
1166 1.153 atatat }
1167 1.153 atatat node = &node[at];
1168 1.153 atatat pnode->sysctl_clen++;
1169 1.153 atatat
1170 1.153 atatat strlcpy(node->sysctl_name, nnode.sysctl_name,
1171 1.153 atatat sizeof(node->sysctl_name));
1172 1.153 atatat node->sysctl_num = nm;
1173 1.153 atatat node->sysctl_size = sz;
1174 1.161 atatat node->sysctl_flags = SYSCTL_VERSION|type|flags; /* XXX other trees */
1175 1.153 atatat node->sysctl_csize = 0;
1176 1.153 atatat node->sysctl_clen = 0;
1177 1.153 atatat if (own) {
1178 1.153 atatat node->sysctl_data = own;
1179 1.161 atatat node->sysctl_flags |= CTLFLAG_OWNDATA;
1180 1.188 yamt } else if (flags & CTLFLAG_ALIAS) {
1181 1.153 atatat node->sysctl_alias = anum;
1182 1.188 yamt } else if (flags & CTLFLAG_IMMEDIATE) {
1183 1.153 atatat switch (type) {
1184 1.215 matt case CTLTYPE_BOOL:
1185 1.215 matt node->sysctl_idata = nnode.sysctl_bdata;
1186 1.215 matt break;
1187 1.153 atatat case CTLTYPE_INT:
1188 1.153 atatat node->sysctl_idata = nnode.sysctl_idata;
1189 1.153 atatat break;
1190 1.153 atatat case CTLTYPE_QUAD:
1191 1.153 atatat node->sysctl_qdata = nnode.sysctl_qdata;
1192 1.153 atatat break;
1193 1.153 atatat }
1194 1.188 yamt } else {
1195 1.153 atatat node->sysctl_data = nnode.sysctl_data;
1196 1.161 atatat node->sysctl_flags &= ~CTLFLAG_OWNDATA;
1197 1.153 atatat }
1198 1.153 atatat node->sysctl_func = nnode.sysctl_func;
1199 1.153 atatat node->sysctl_child = NULL;
1200 1.153 atatat /* node->sysctl_parent should already be done */
1201 1.55 is
1202 1.153 atatat /*
1203 1.153 atatat * update "version" on path to "root"
1204 1.153 atatat */
1205 1.153 atatat for (; rnode->sysctl_parent != NULL; rnode = rnode->sysctl_parent)
1206 1.153 atatat ;
1207 1.153 atatat pnode = node;
1208 1.153 atatat for (nm = rnode->sysctl_ver + 1; pnode != NULL;
1209 1.153 atatat pnode = pnode->sysctl_parent)
1210 1.153 atatat pnode->sysctl_ver = nm;
1211 1.153 atatat
1212 1.194 dsl /* If this fails, the node is already added - the user won't know! */
1213 1.162 atatat error = sysctl_cvt_out(l, v, node, oldp, *oldlenp, oldlenp);
1214 1.55 is
1215 1.1 cgd return (error);
1216 1.1 cgd }
1217 1.1 cgd
1218 1.1 cgd /*
1219 1.153 atatat * ********************************************************************
1220 1.153 atatat * A wrapper around sysctl_create() that prints the thing we're trying
1221 1.153 atatat * to add.
1222 1.153 atatat * ********************************************************************
1223 1.1 cgd */
1224 1.153 atatat #ifdef SYSCTL_DEBUG_CREATE
1225 1.13 christos int
1226 1.200 christos sysctl_create(SYSCTLFN_ARGS)
1227 1.1 cgd {
1228 1.153 atatat const struct sysctlnode *node;
1229 1.153 atatat int k, rc, ni, nl = namelen + (name - oname);
1230 1.153 atatat
1231 1.153 atatat node = newp;
1232 1.153 atatat
1233 1.153 atatat printf("namelen %d (", nl);
1234 1.153 atatat for (ni = 0; ni < nl - 1; ni++)
1235 1.153 atatat printf(" %d", oname[ni]);
1236 1.153 atatat printf(" %d )\t[%s]\tflags %08x (%08x %d %zu)\n",
1237 1.153 atatat k = node->sysctl_num,
1238 1.153 atatat node->sysctl_name,
1239 1.153 atatat node->sysctl_flags,
1240 1.153 atatat SYSCTL_FLAGS(node->sysctl_flags),
1241 1.153 atatat SYSCTL_TYPE(node->sysctl_flags),
1242 1.153 atatat node->sysctl_size);
1243 1.1 cgd
1244 1.153 atatat node = rnode;
1245 1.200 christos rc = _sysctl_create(SYSCTLFN_CALL(rnode));
1246 1.55 is
1247 1.153 atatat printf("sysctl_create(");
1248 1.153 atatat for (ni = 0; ni < nl - 1; ni++)
1249 1.153 atatat printf(" %d", oname[ni]);
1250 1.153 atatat printf(" %d ) returned %d\n", k, rc);
1251 1.55 is
1252 1.153 atatat return (rc);
1253 1.1 cgd }
1254 1.153 atatat #endif /* SYSCTL_DEBUG_CREATE */
1255 1.1 cgd
1256 1.1 cgd /*
1257 1.153 atatat * sysctl_destroy -- Removes a node (as described by newp) from the
1258 1.153 atatat * given tree, returning (if successful) a copy of the dead node in
1259 1.153 atatat * oldp. Since we're removing stuff, there's not much to check.
1260 1.52 bouyer */
1261 1.52 bouyer int
1262 1.183 atatat sysctl_destroy(SYSCTLFN_ARGS)
1263 1.52 bouyer {
1264 1.153 atatat struct sysctlnode *node, *pnode, onode, nnode;
1265 1.162 atatat int ni, error, v;
1266 1.52 bouyer
1267 1.213 ad KASSERT(rw_write_held(&sysctl_treelock));
1268 1.213 ad
1269 1.161 atatat if (SYSCTL_VERS(rnode->sysctl_flags) != SYSCTL_VERSION) {
1270 1.161 atatat printf("sysctl_destroy: rnode %p wrong version\n", rnode);
1271 1.161 atatat return (EINVAL);
1272 1.161 atatat }
1273 1.161 atatat
1274 1.153 atatat error = 0;
1275 1.55 is
1276 1.153 atatat if (namelen != 1 || name[namelen - 1] != CTL_DESTROY)
1277 1.153 atatat return (EINVAL);
1278 1.52 bouyer
1279 1.153 atatat /*
1280 1.153 atatat * processes can only destroy nodes at securelevel 0, must be
1281 1.153 atatat * root, and can't remove nodes from a parent that's not
1282 1.153 atatat * writeable
1283 1.153 atatat */
1284 1.153 atatat if (l != NULL) {
1285 1.156 atatat #ifndef SYSCTL_DISALLOW_CREATE
1286 1.202 elad error = kauth_authorize_system(l->l_cred, KAUTH_SYSTEM_SYSCTL,
1287 1.202 elad KAUTH_REQ_SYSTEM_SYSCTL_DELETE, NULL, NULL, NULL);
1288 1.153 atatat if (error)
1289 1.153 atatat return (error);
1290 1.161 atatat if (!(rnode->sysctl_flags & CTLFLAG_READWRITE))
1291 1.156 atatat #endif /* SYSCTL_DISALLOW_CREATE */
1292 1.153 atatat return (EPERM);
1293 1.153 atatat }
1294 1.52 bouyer
1295 1.153 atatat /*
1296 1.153 atatat * nothing can remove a node if:
1297 1.153 atatat * the node is permanent (checked later) or
1298 1.153 atatat * the tree itself is not writeable or
1299 1.153 atatat * the entire sysctl system is not writeable
1300 1.170 atatat *
1301 1.170 atatat * note that we ignore whether setup is complete or not,
1302 1.170 atatat * because these rules always apply.
1303 1.153 atatat */
1304 1.161 atatat if (!(sysctl_rootof(rnode)->sysctl_flags & CTLFLAG_READWRITE) ||
1305 1.161 atatat !(sysctl_root.sysctl_flags & CTLFLAG_READWRITE))
1306 1.52 bouyer return (EPERM);
1307 1.55 is
1308 1.161 atatat if (newp == NULL)
1309 1.153 atatat return (EINVAL);
1310 1.162 atatat error = sysctl_cvt_in(l, &v, newp, newlen, &nnode);
1311 1.153 atatat if (error)
1312 1.153 atatat return (error);
1313 1.153 atatat memset(&onode, 0, sizeof(struct sysctlnode));
1314 1.55 is
1315 1.153 atatat node = rnode->sysctl_child;
1316 1.153 atatat for (ni = 0; ni < rnode->sysctl_clen; ni++) {
1317 1.153 atatat if (nnode.sysctl_num == node[ni].sysctl_num) {
1318 1.153 atatat /*
1319 1.153 atatat * if name specified, must match
1320 1.153 atatat */
1321 1.153 atatat if (nnode.sysctl_name[0] != '\0' &&
1322 1.153 atatat strcmp(nnode.sysctl_name, node[ni].sysctl_name))
1323 1.153 atatat continue;
1324 1.153 atatat /*
1325 1.153 atatat * if version specified, must match
1326 1.153 atatat */
1327 1.153 atatat if (nnode.sysctl_ver != 0 &&
1328 1.153 atatat nnode.sysctl_ver != node[ni].sysctl_ver)
1329 1.153 atatat continue;
1330 1.153 atatat /*
1331 1.153 atatat * this must be the one
1332 1.153 atatat */
1333 1.153 atatat break;
1334 1.153 atatat }
1335 1.153 atatat }
1336 1.153 atatat if (ni == rnode->sysctl_clen)
1337 1.153 atatat return (ENOENT);
1338 1.153 atatat node = &node[ni];
1339 1.153 atatat pnode = node->sysctl_parent;
1340 1.52 bouyer
1341 1.153 atatat /*
1342 1.153 atatat * if the kernel says permanent, it is, so there. nyah.
1343 1.153 atatat */
1344 1.161 atatat if (SYSCTL_FLAGS(node->sysctl_flags) & CTLFLAG_PERMANENT)
1345 1.153 atatat return (EPERM);
1346 1.1 cgd
1347 1.153 atatat /*
1348 1.153 atatat * can't delete non-empty nodes
1349 1.153 atatat */
1350 1.153 atatat if (SYSCTL_TYPE(node->sysctl_flags) == CTLTYPE_NODE &&
1351 1.153 atatat node->sysctl_clen != 0)
1352 1.153 atatat return (ENOTEMPTY);
1353 1.55 is
1354 1.153 atatat /*
1355 1.153 atatat * if the node "owns" data, release it now
1356 1.153 atatat */
1357 1.161 atatat if (node->sysctl_flags & CTLFLAG_OWNDATA) {
1358 1.153 atatat if (node->sysctl_data != NULL)
1359 1.187 yamt free(node->sysctl_data, M_SYSCTLDATA);
1360 1.153 atatat node->sysctl_data = NULL;
1361 1.153 atatat }
1362 1.166 atatat if (node->sysctl_flags & CTLFLAG_OWNDESC) {
1363 1.166 atatat if (node->sysctl_desc != NULL)
1364 1.180 christos /*XXXUNCONST*/
1365 1.187 yamt free(__UNCONST(node->sysctl_desc), M_SYSCTLDATA);
1366 1.166 atatat node->sysctl_desc = NULL;
1367 1.166 atatat }
1368 1.55 is
1369 1.153 atatat /*
1370 1.153 atatat * if the node to be removed is not the last one on the list,
1371 1.153 atatat * move the remaining nodes up, and reparent any grandchildren
1372 1.153 atatat */
1373 1.153 atatat onode = *node;
1374 1.153 atatat if (ni < pnode->sysctl_clen - 1) {
1375 1.153 atatat int t;
1376 1.153 atatat
1377 1.153 atatat memmove(&pnode->sysctl_child[ni], &pnode->sysctl_child[ni + 1],
1378 1.153 atatat (pnode->sysctl_clen - ni - 1) *
1379 1.153 atatat sizeof(struct sysctlnode));
1380 1.153 atatat for (; ni < pnode->sysctl_clen - 1; ni++)
1381 1.153 atatat if (SYSCTL_TYPE(pnode->sysctl_child[ni].sysctl_flags) ==
1382 1.153 atatat CTLTYPE_NODE)
1383 1.161 atatat for (t = 0;
1384 1.161 atatat t < pnode->sysctl_child[ni].sysctl_clen;
1385 1.153 atatat t++)
1386 1.153 atatat pnode->sysctl_child[ni].sysctl_child[t].
1387 1.153 atatat sysctl_parent =
1388 1.153 atatat &pnode->sysctl_child[ni];
1389 1.153 atatat ni = pnode->sysctl_clen - 1;
1390 1.153 atatat node = &pnode->sysctl_child[ni];
1391 1.1 cgd }
1392 1.1 cgd
1393 1.153 atatat /*
1394 1.153 atatat * reset the space we just vacated
1395 1.153 atatat */
1396 1.153 atatat memset(node, 0, sizeof(struct sysctlnode));
1397 1.153 atatat node->sysctl_parent = pnode;
1398 1.153 atatat pnode->sysctl_clen--;
1399 1.1 cgd
1400 1.153 atatat /*
1401 1.153 atatat * if this parent just lost its last child, nuke the creche
1402 1.153 atatat */
1403 1.153 atatat if (pnode->sysctl_clen == 0) {
1404 1.187 yamt free(pnode->sysctl_child, M_SYSCTLNODE);
1405 1.153 atatat pnode->sysctl_csize = 0;
1406 1.153 atatat pnode->sysctl_child = NULL;
1407 1.153 atatat }
1408 1.55 is
1409 1.153 atatat /*
1410 1.153 atatat * update "version" on path to "root"
1411 1.153 atatat */
1412 1.153 atatat for (; rnode->sysctl_parent != NULL; rnode = rnode->sysctl_parent)
1413 1.153 atatat ;
1414 1.153 atatat for (ni = rnode->sysctl_ver + 1; pnode != NULL;
1415 1.153 atatat pnode = pnode->sysctl_parent)
1416 1.153 atatat pnode->sysctl_ver = ni;
1417 1.153 atatat
1418 1.162 atatat error = sysctl_cvt_out(l, v, &onode, oldp, *oldlenp, oldlenp);
1419 1.55 is
1420 1.1 cgd return (error);
1421 1.1 cgd }
1422 1.1 cgd
1423 1.1 cgd /*
1424 1.153 atatat * sysctl_lookup -- Handles copyin/copyout of new and old values.
1425 1.153 atatat * Partial reads are globally allowed. Only root can write to things
1426 1.153 atatat * unless the node says otherwise.
1427 1.1 cgd */
1428 1.13 christos int
1429 1.183 atatat sysctl_lookup(SYSCTLFN_ARGS)
1430 1.1 cgd {
1431 1.153 atatat int error, rw;
1432 1.153 atatat size_t sz, len;
1433 1.153 atatat void *d;
1434 1.153 atatat
1435 1.213 ad KASSERT(rw_lock_held(&sysctl_treelock));
1436 1.213 ad
1437 1.161 atatat if (SYSCTL_VERS(rnode->sysctl_flags) != SYSCTL_VERSION) {
1438 1.161 atatat printf("sysctl_lookup: rnode %p wrong version\n", rnode);
1439 1.161 atatat return (EINVAL);
1440 1.161 atatat }
1441 1.161 atatat
1442 1.153 atatat error = 0;
1443 1.153 atatat
1444 1.153 atatat /*
1445 1.153 atatat * you can't "look up" a node. you can "query" it, but you
1446 1.153 atatat * can't "look it up".
1447 1.153 atatat */
1448 1.153 atatat if (SYSCTL_TYPE(rnode->sysctl_flags) == CTLTYPE_NODE || namelen != 0)
1449 1.153 atatat return (EINVAL);
1450 1.1 cgd
1451 1.153 atatat /*
1452 1.153 atatat * some nodes are private, so only root can look into them.
1453 1.153 atatat */
1454 1.161 atatat if (l != NULL && (rnode->sysctl_flags & CTLFLAG_PRIVATE) &&
1455 1.202 elad (error = kauth_authorize_system(l->l_cred, KAUTH_SYSTEM_SYSCTL,
1456 1.202 elad KAUTH_REQ_SYSTEM_SYSCTL_PRVT, NULL, NULL, NULL)) != 0)
1457 1.153 atatat return (error);
1458 1.55 is
1459 1.153 atatat /*
1460 1.153 atatat * if a node wants to be writable according to different rules
1461 1.153 atatat * other than "only root can write to stuff unless a flag is
1462 1.153 atatat * set", then it needs its own function which should have been
1463 1.153 atatat * called and not us.
1464 1.153 atatat */
1465 1.153 atatat if (l != NULL && newp != NULL &&
1466 1.161 atatat !(rnode->sysctl_flags & CTLFLAG_ANYWRITE) &&
1467 1.222 elad (error = kauth_authorize_system(l->l_cred,
1468 1.222 elad KAUTH_SYSTEM_SYSCTL, KAUTH_REQ_SYSTEM_SYSCTL_MODIFY, NULL, NULL,
1469 1.222 elad NULL)) != 0)
1470 1.153 atatat return (error);
1471 1.1 cgd
1472 1.153 atatat /*
1473 1.153 atatat * is this node supposedly writable?
1474 1.153 atatat */
1475 1.199 elad rw = (rnode->sysctl_flags & CTLFLAG_READWRITE) ? 1 : 0;
1476 1.1 cgd
1477 1.153 atatat /*
1478 1.153 atatat * it appears not to be writable at this time, so if someone
1479 1.153 atatat * tried to write to it, we must tell them to go away
1480 1.153 atatat */
1481 1.153 atatat if (!rw && newp != NULL)
1482 1.1 cgd return (EPERM);
1483 1.55 is
1484 1.153 atatat /*
1485 1.153 atatat * step one, copy out the stuff we have presently
1486 1.153 atatat */
1487 1.161 atatat if (rnode->sysctl_flags & CTLFLAG_IMMEDIATE) {
1488 1.183 atatat /*
1489 1.183 atatat * note that we discard const here because we are
1490 1.183 atatat * modifying the contents of the node (which is okay
1491 1.183 atatat * because it's ours)
1492 1.183 atatat */
1493 1.153 atatat switch (SYSCTL_TYPE(rnode->sysctl_flags)) {
1494 1.215 matt case CTLTYPE_BOOL:
1495 1.215 matt d = __UNCONST(&rnode->sysctl_bdata);
1496 1.215 matt break;
1497 1.153 atatat case CTLTYPE_INT:
1498 1.183 atatat d = __UNCONST(&rnode->sysctl_idata);
1499 1.153 atatat break;
1500 1.153 atatat case CTLTYPE_QUAD:
1501 1.183 atatat d = __UNCONST(&rnode->sysctl_qdata);
1502 1.153 atatat break;
1503 1.153 atatat default:
1504 1.153 atatat return (EINVAL);
1505 1.153 atatat }
1506 1.188 yamt } else
1507 1.153 atatat d = rnode->sysctl_data;
1508 1.153 atatat if (SYSCTL_TYPE(rnode->sysctl_flags) == CTLTYPE_STRING)
1509 1.157 atatat sz = strlen(d) + 1; /* XXX@@@ possible fault here */
1510 1.153 atatat else
1511 1.153 atatat sz = rnode->sysctl_size;
1512 1.153 atatat if (oldp != NULL)
1513 1.153 atatat error = sysctl_copyout(l, d, oldp, MIN(sz, *oldlenp));
1514 1.153 atatat if (error)
1515 1.153 atatat return (error);
1516 1.153 atatat *oldlenp = sz;
1517 1.153 atatat
1518 1.153 atatat /*
1519 1.153 atatat * are we done?
1520 1.153 atatat */
1521 1.153 atatat if (newp == NULL || newlen == 0)
1522 1.153 atatat return (0);
1523 1.153 atatat
1524 1.153 atatat /*
1525 1.153 atatat * hmm...not done. must now "copy in" new value. re-adjust
1526 1.153 atatat * sz to maximum value (strings are "weird").
1527 1.153 atatat */
1528 1.153 atatat sz = rnode->sysctl_size;
1529 1.153 atatat switch (SYSCTL_TYPE(rnode->sysctl_flags)) {
1530 1.215 matt case CTLTYPE_BOOL: {
1531 1.229 mrg bool tmp;
1532 1.215 matt /*
1533 1.215 matt * these data must be *exactly* the same size coming
1534 1.215 matt * in. bool may only be true or false.
1535 1.215 matt */
1536 1.215 matt if (newlen != sz)
1537 1.215 matt return (EINVAL);
1538 1.215 matt error = sysctl_copyin(l, newp, &tmp, sz);
1539 1.229 mrg if (tmp != true && tmp != false)
1540 1.229 mrg return EINVAL;
1541 1.215 matt if (error)
1542 1.215 matt break;
1543 1.215 matt *(bool *)d = tmp;
1544 1.215 matt break;
1545 1.215 matt }
1546 1.153 atatat case CTLTYPE_INT:
1547 1.153 atatat case CTLTYPE_QUAD:
1548 1.153 atatat case CTLTYPE_STRUCT:
1549 1.153 atatat /*
1550 1.153 atatat * these data must be *exactly* the same size coming
1551 1.153 atatat * in.
1552 1.153 atatat */
1553 1.153 atatat if (newlen != sz)
1554 1.153 atatat return (EINVAL);
1555 1.153 atatat error = sysctl_copyin(l, newp, d, sz);
1556 1.153 atatat break;
1557 1.153 atatat case CTLTYPE_STRING: {
1558 1.153 atatat /*
1559 1.153 atatat * strings, on the other hand, can be shorter, and we
1560 1.153 atatat * let userland be sloppy about the trailing nul.
1561 1.153 atatat */
1562 1.153 atatat char *newbuf;
1563 1.85 simonb
1564 1.153 atatat /*
1565 1.153 atatat * too much new string?
1566 1.153 atatat */
1567 1.153 atatat if (newlen > sz)
1568 1.153 atatat return (EINVAL);
1569 1.85 simonb
1570 1.153 atatat /*
1571 1.153 atatat * temporary copy of new inbound string
1572 1.153 atatat */
1573 1.153 atatat len = MIN(sz, newlen);
1574 1.153 atatat newbuf = malloc(len, M_SYSCTLDATA, M_WAITOK|M_CANFAIL);
1575 1.153 atatat if (newbuf == NULL)
1576 1.153 atatat return (ENOMEM);
1577 1.153 atatat error = sysctl_copyin(l, newp, newbuf, len);
1578 1.153 atatat if (error) {
1579 1.187 yamt free(newbuf, M_SYSCTLDATA);
1580 1.153 atatat return (error);
1581 1.153 atatat }
1582 1.85 simonb
1583 1.153 atatat /*
1584 1.232 apb * did they NUL terminate it, or do we have space
1585 1.153 atatat * left to do it ourselves?
1586 1.153 atatat */
1587 1.153 atatat if (newbuf[len - 1] != '\0' && len == sz) {
1588 1.187 yamt free(newbuf, M_SYSCTLDATA);
1589 1.153 atatat return (EINVAL);
1590 1.153 atatat }
1591 1.85 simonb
1592 1.153 atatat /*
1593 1.153 atatat * looks good, so pop it into place and zero the rest.
1594 1.153 atatat */
1595 1.153 atatat if (len > 0)
1596 1.190 yamt memcpy(d, newbuf, len);
1597 1.153 atatat if (sz != len)
1598 1.190 yamt memset((char*)d + len, 0, sz - len);
1599 1.187 yamt free(newbuf, M_SYSCTLDATA);
1600 1.153 atatat break;
1601 1.153 atatat }
1602 1.153 atatat default:
1603 1.153 atatat return (EINVAL);
1604 1.153 atatat }
1605 1.55 is
1606 1.1 cgd return (error);
1607 1.1 cgd }
1608 1.1 cgd
1609 1.1 cgd /*
1610 1.153 atatat * sysctl_mmap -- Dispatches sysctl mmap requests to those nodes that
1611 1.153 atatat * purport to handle it. This interface isn't fully fleshed out yet,
1612 1.153 atatat * unfortunately.
1613 1.1 cgd */
1614 1.69 simonb static int
1615 1.183 atatat sysctl_mmap(SYSCTLFN_ARGS)
1616 1.1 cgd {
1617 1.183 atatat const struct sysctlnode *node;
1618 1.183 atatat struct sysctlnode nnode;
1619 1.111 thorpej int error;
1620 1.1 cgd
1621 1.161 atatat if (SYSCTL_VERS(rnode->sysctl_flags) != SYSCTL_VERSION) {
1622 1.161 atatat printf("sysctl_mmap: rnode %p wrong version\n", rnode);
1623 1.161 atatat return (EINVAL);
1624 1.161 atatat }
1625 1.161 atatat
1626 1.153 atatat /*
1627 1.153 atatat * let's just pretend that didn't happen, m'kay?
1628 1.153 atatat */
1629 1.153 atatat if (l == NULL)
1630 1.153 atatat return (EPERM);
1631 1.153 atatat
1632 1.153 atatat /*
1633 1.153 atatat * is this a sysctlnode description of an mmap request?
1634 1.153 atatat */
1635 1.153 atatat if (newp == NULL || newlen != sizeof(struct sysctlnode))
1636 1.153 atatat return (EINVAL);
1637 1.161 atatat error = sysctl_copyin(l, newp, &nnode, sizeof(nnode));
1638 1.153 atatat if (error)
1639 1.153 atatat return (error);
1640 1.1 cgd
1641 1.1 cgd /*
1642 1.153 atatat * does the node they asked for exist?
1643 1.1 cgd */
1644 1.153 atatat if (namelen != 1)
1645 1.153 atatat return (EOPNOTSUPP);
1646 1.153 atatat node = rnode;
1647 1.153 atatat error = sysctl_locate(l, &nnode.sysctl_num, 1, &node, NULL);
1648 1.13 christos if (error)
1649 1.1 cgd return (error);
1650 1.1 cgd
1651 1.1 cgd /*
1652 1.153 atatat * does this node that we have found purport to handle mmap?
1653 1.153 atatat */
1654 1.153 atatat if (node->sysctl_func == NULL ||
1655 1.161 atatat !(node->sysctl_flags & CTLFLAG_MMAP))
1656 1.153 atatat return (EOPNOTSUPP);
1657 1.153 atatat
1658 1.153 atatat /*
1659 1.153 atatat * well...okay, they asked for it.
1660 1.1 cgd */
1661 1.153 atatat return ((*node->sysctl_func)(SYSCTLFN_CALL(node)));
1662 1.1 cgd }
1663 1.1 cgd
1664 1.165 atatat int
1665 1.165 atatat sysctl_describe(SYSCTLFN_ARGS)
1666 1.165 atatat {
1667 1.166 atatat struct sysctldesc *d;
1668 1.197 christos void *bf;
1669 1.166 atatat size_t sz, left, tot;
1670 1.166 atatat int i, error, v = -1;
1671 1.166 atatat struct sysctlnode *node;
1672 1.166 atatat struct sysctlnode dnode;
1673 1.165 atatat
1674 1.165 atatat if (SYSCTL_VERS(rnode->sysctl_flags) != SYSCTL_VERSION) {
1675 1.165 atatat printf("sysctl_query: rnode %p wrong version\n", rnode);
1676 1.165 atatat return (EINVAL);
1677 1.165 atatat }
1678 1.165 atatat
1679 1.165 atatat if (SYSCTL_TYPE(rnode->sysctl_flags) != CTLTYPE_NODE)
1680 1.165 atatat return (ENOTDIR);
1681 1.165 atatat if (namelen != 1 || name[0] != CTL_DESCRIBE)
1682 1.165 atatat return (EINVAL);
1683 1.165 atatat
1684 1.165 atatat /*
1685 1.166 atatat * get ready...
1686 1.166 atatat */
1687 1.166 atatat error = 0;
1688 1.197 christos d = bf = malloc(MAXDESCLEN, M_TEMP, M_WAITOK|M_CANFAIL);
1689 1.197 christos if (bf == NULL)
1690 1.197 christos return ENOMEM;
1691 1.166 atatat tot = 0;
1692 1.166 atatat node = rnode->sysctl_child;
1693 1.166 atatat left = *oldlenp;
1694 1.166 atatat
1695 1.166 atatat /*
1696 1.166 atatat * no request -> all descriptions at this level
1697 1.166 atatat * request with desc unset -> just this node
1698 1.166 atatat * request with desc set -> set descr for this node
1699 1.165 atatat */
1700 1.166 atatat if (newp != NULL) {
1701 1.166 atatat error = sysctl_cvt_in(l, &v, newp, newlen, &dnode);
1702 1.166 atatat if (error)
1703 1.197 christos goto out;
1704 1.166 atatat if (dnode.sysctl_desc != NULL) {
1705 1.166 atatat /*
1706 1.166 atatat * processes cannot set descriptions above
1707 1.166 atatat * securelevel 0. and must be root. blah
1708 1.166 atatat * blah blah. a couple more checks are made
1709 1.166 atatat * once we find the node we want.
1710 1.166 atatat */
1711 1.166 atatat if (l != NULL) {
1712 1.166 atatat #ifndef SYSCTL_DISALLOW_CREATE
1713 1.202 elad error = kauth_authorize_system(l->l_cred,
1714 1.202 elad KAUTH_SYSTEM_SYSCTL,
1715 1.202 elad KAUTH_REQ_SYSTEM_SYSCTL_DESC, NULL,
1716 1.202 elad NULL, NULL);
1717 1.166 atatat if (error)
1718 1.197 christos goto out;
1719 1.166 atatat #else /* SYSCTL_DISALLOW_CREATE */
1720 1.197 christos error = EPERM;
1721 1.197 christos goto out;
1722 1.166 atatat #endif /* SYSCTL_DISALLOW_CREATE */
1723 1.166 atatat }
1724 1.166 atatat
1725 1.166 atatat /*
1726 1.166 atatat * find node and try to set the description on it
1727 1.166 atatat */
1728 1.166 atatat for (i = 0; i < rnode->sysctl_clen; i++)
1729 1.166 atatat if (node[i].sysctl_num == dnode.sysctl_num)
1730 1.166 atatat break;
1731 1.197 christos if (i == rnode->sysctl_clen) {
1732 1.197 christos error = ENOENT;
1733 1.197 christos goto out;
1734 1.197 christos }
1735 1.166 atatat node = &node[i];
1736 1.166 atatat
1737 1.166 atatat /*
1738 1.166 atatat * did the caller specify a node version?
1739 1.166 atatat */
1740 1.166 atatat if (dnode.sysctl_ver != 0 &&
1741 1.197 christos dnode.sysctl_ver != node->sysctl_ver) {
1742 1.197 christos error = EINVAL;
1743 1.197 christos goto out;
1744 1.197 christos }
1745 1.166 atatat
1746 1.166 atatat /*
1747 1.166 atatat * okay...some rules:
1748 1.170 atatat * (1) if setup is done and the tree is
1749 1.170 atatat * read-only or the whole system is
1750 1.170 atatat * read-only
1751 1.170 atatat * (2) no one can set a description on a
1752 1.166 atatat * permanent node (it must be set when
1753 1.166 atatat * using createv)
1754 1.170 atatat * (3) processes cannot *change* a description
1755 1.170 atatat * (4) processes *can*, however, set a
1756 1.166 atatat * description on a read-only node so that
1757 1.166 atatat * one can be created and then described
1758 1.166 atatat * in two steps
1759 1.166 atatat * anything else come to mind?
1760 1.166 atatat */
1761 1.170 atatat if ((sysctl_root.sysctl_flags & CTLFLAG_PERMANENT) &&
1762 1.170 atatat (!(sysctl_rootof(node)->sysctl_flags &
1763 1.170 atatat CTLFLAG_READWRITE) ||
1764 1.197 christos !(sysctl_root.sysctl_flags & CTLFLAG_READWRITE))) {
1765 1.197 christos error = EPERM;
1766 1.197 christos goto out;
1767 1.197 christos }
1768 1.197 christos if (node->sysctl_flags & CTLFLAG_PERMANENT) {
1769 1.197 christos error = EPERM;
1770 1.197 christos goto out;
1771 1.197 christos }
1772 1.197 christos if (l != NULL && node->sysctl_desc != NULL) {
1773 1.197 christos error = EPERM;
1774 1.197 christos goto out;
1775 1.197 christos }
1776 1.166 atatat
1777 1.166 atatat /*
1778 1.166 atatat * right, let's go ahead. the first step is
1779 1.166 atatat * making the description into something the
1780 1.166 atatat * node can "own", if need be.
1781 1.166 atatat */
1782 1.166 atatat if (l != NULL ||
1783 1.166 atatat dnode.sysctl_flags & CTLFLAG_OWNDESC) {
1784 1.197 christos char *nd, *k;
1785 1.166 atatat
1786 1.197 christos k = malloc(MAXDESCLEN, M_TEMP,
1787 1.197 christos M_WAITOK|M_CANFAIL);
1788 1.197 christos if (k == NULL) {
1789 1.197 christos error = ENOMEM;
1790 1.197 christos goto out;
1791 1.197 christos }
1792 1.166 atatat error = sysctl_copyinstr(l, dnode.sysctl_desc,
1793 1.197 christos k, MAXDESCLEN, &sz);
1794 1.197 christos if (error) {
1795 1.197 christos free(k, M_TEMP);
1796 1.197 christos goto out;
1797 1.197 christos }
1798 1.166 atatat nd = malloc(sz, M_SYSCTLDATA,
1799 1.166 atatat M_WAITOK|M_CANFAIL);
1800 1.197 christos if (nd == NULL) {
1801 1.197 christos free(k, M_TEMP);
1802 1.197 christos error = ENOMEM;
1803 1.197 christos goto out;
1804 1.197 christos }
1805 1.166 atatat memcpy(nd, k, sz);
1806 1.166 atatat dnode.sysctl_flags |= CTLFLAG_OWNDESC;
1807 1.166 atatat dnode.sysctl_desc = nd;
1808 1.197 christos free(k, M_TEMP);
1809 1.166 atatat }
1810 1.166 atatat
1811 1.166 atatat /*
1812 1.166 atatat * now "release" the old description and
1813 1.166 atatat * attach the new one. ta-da.
1814 1.166 atatat */
1815 1.166 atatat if ((node->sysctl_flags & CTLFLAG_OWNDESC) &&
1816 1.166 atatat node->sysctl_desc != NULL)
1817 1.180 christos /*XXXUNCONST*/
1818 1.180 christos free(__UNCONST(node->sysctl_desc), M_SYSCTLDATA);
1819 1.166 atatat node->sysctl_desc = dnode.sysctl_desc;
1820 1.166 atatat node->sysctl_flags |=
1821 1.166 atatat (dnode.sysctl_flags & CTLFLAG_OWNDESC);
1822 1.166 atatat
1823 1.166 atatat /*
1824 1.166 atatat * now we "fall out" and into the loop which
1825 1.166 atatat * will copy the new description back out for
1826 1.166 atatat * those interested parties
1827 1.166 atatat */
1828 1.166 atatat }
1829 1.166 atatat }
1830 1.166 atatat
1831 1.166 atatat /*
1832 1.166 atatat * scan for one description or just retrieve all descriptions
1833 1.166 atatat */
1834 1.166 atatat for (i = 0; i < rnode->sysctl_clen; i++) {
1835 1.166 atatat /*
1836 1.166 atatat * did they ask for the description of only one node?
1837 1.166 atatat */
1838 1.166 atatat if (v != -1 && node[i].sysctl_num != dnode.sysctl_num)
1839 1.166 atatat continue;
1840 1.166 atatat
1841 1.166 atatat /*
1842 1.166 atatat * don't describe "private" nodes to non-suser users
1843 1.166 atatat */
1844 1.166 atatat if ((node[i].sysctl_flags & CTLFLAG_PRIVATE) && (l != NULL) &&
1845 1.202 elad !(kauth_authorize_system(l->l_cred, KAUTH_SYSTEM_SYSCTL,
1846 1.202 elad KAUTH_REQ_SYSTEM_SYSCTL_PRVT, NULL, NULL, NULL)))
1847 1.166 atatat continue;
1848 1.166 atatat
1849 1.166 atatat /*
1850 1.166 atatat * is this description "valid"?
1851 1.166 atatat */
1852 1.197 christos memset(bf, 0, MAXDESCLEN);
1853 1.179 perry if (node[i].sysctl_desc == NULL)
1854 1.166 atatat sz = 1;
1855 1.166 atatat else if (copystr(node[i].sysctl_desc, &d->descr_str[0],
1856 1.197 christos MAXDESCLEN - sizeof(*d), &sz) != 0) {
1857 1.166 atatat /*
1858 1.166 atatat * erase possible partial description
1859 1.166 atatat */
1860 1.197 christos memset(bf, 0, MAXDESCLEN);
1861 1.166 atatat sz = 1;
1862 1.166 atatat }
1863 1.166 atatat
1864 1.166 atatat /*
1865 1.166 atatat * we've got it, stuff it into the caller's buffer
1866 1.166 atatat */
1867 1.166 atatat d->descr_num = node[i].sysctl_num;
1868 1.166 atatat d->descr_ver = node[i].sysctl_ver;
1869 1.166 atatat d->descr_len = sz; /* includes trailing nul */
1870 1.209 christos sz = (char *)NEXT_DESCR(d) - (char *)d;
1871 1.166 atatat if (oldp != NULL && left >= sz) {
1872 1.166 atatat error = sysctl_copyout(l, d, oldp, sz);
1873 1.166 atatat if (error)
1874 1.197 christos goto out;
1875 1.166 atatat left -= sz;
1876 1.180 christos oldp = (void *)__sysc_desc_adv(oldp, d->descr_len);
1877 1.166 atatat }
1878 1.166 atatat tot += sz;
1879 1.165 atatat
1880 1.166 atatat /*
1881 1.166 atatat * if we get this far with v not "unset", they asked
1882 1.166 atatat * for a specific node and we found it
1883 1.166 atatat */
1884 1.166 atatat if (v != -1)
1885 1.166 atatat break;
1886 1.166 atatat }
1887 1.166 atatat
1888 1.166 atatat /*
1889 1.166 atatat * did we find it after all?
1890 1.166 atatat */
1891 1.166 atatat if (v != -1 && tot == 0)
1892 1.166 atatat error = ENOENT;
1893 1.166 atatat else
1894 1.166 atatat *oldlenp = tot;
1895 1.165 atatat
1896 1.197 christos out:
1897 1.197 christos free(bf, M_TEMP);
1898 1.166 atatat return (error);
1899 1.165 atatat }
1900 1.165 atatat
1901 1.145 dsl /*
1902 1.153 atatat * ********************************************************************
1903 1.153 atatat * Section 3: Create and destroy from inside the kernel
1904 1.153 atatat * ********************************************************************
1905 1.153 atatat * sysctl_createv() and sysctl_destroyv() are simpler-to-use
1906 1.153 atatat * interfaces for the kernel to fling new entries into the mib and rip
1907 1.153 atatat * them out later. In the case of sysctl_createv(), the returned copy
1908 1.153 atatat * of the node (see sysctl_create()) will be translated back into a
1909 1.153 atatat * pointer to the actual node.
1910 1.153 atatat *
1911 1.153 atatat * Note that sysctl_createv() will return 0 if the create request
1912 1.153 atatat * matches an existing node (ala mkdir -p), and that sysctl_destroyv()
1913 1.153 atatat * will return 0 if the node to be destroyed already does not exist
1914 1.153 atatat * (aka rm -f) or if it is a parent of other nodes.
1915 1.153 atatat *
1916 1.153 atatat * This allows two (or more) different subsystems to assert sub-tree
1917 1.153 atatat * existence before populating their own nodes, and to remove their
1918 1.153 atatat * own nodes without orphaning the others when they are done.
1919 1.153 atatat * ********************************************************************
1920 1.145 dsl */
1921 1.153 atatat int
1922 1.161 atatat sysctl_createv(struct sysctllog **log, int cflags,
1923 1.183 atatat const struct sysctlnode **rnode, const struct sysctlnode **cnode,
1924 1.161 atatat int flags, int type, const char *namep, const char *descr,
1925 1.153 atatat sysctlfn func, u_quad_t qv, void *newp, size_t newlen,
1926 1.153 atatat ...)
1927 1.153 atatat {
1928 1.153 atatat va_list ap;
1929 1.153 atatat int error, ni, namelen, name[CTL_MAXNAME];
1930 1.183 atatat const struct sysctlnode *root, *pnode;
1931 1.183 atatat struct sysctlnode nnode, onode, *dnode;
1932 1.153 atatat size_t sz;
1933 1.145 dsl
1934 1.161 atatat /*
1935 1.161 atatat * where are we putting this?
1936 1.161 atatat */
1937 1.161 atatat if (rnode != NULL && *rnode == NULL) {
1938 1.161 atatat printf("sysctl_createv: rnode NULL\n");
1939 1.161 atatat return (EINVAL);
1940 1.161 atatat }
1941 1.169 atatat root = rnode ? *rnode : NULL;
1942 1.169 atatat if (cnode != NULL)
1943 1.169 atatat *cnode = NULL;
1944 1.169 atatat if (cflags != 0)
1945 1.169 atatat return (EINVAL);
1946 1.161 atatat
1947 1.153 atatat /*
1948 1.153 atatat * what is it?
1949 1.153 atatat */
1950 1.161 atatat flags = SYSCTL_VERSION|SYSCTL_TYPE(type)|SYSCTL_FLAGS(flags);
1951 1.163 atatat if (log != NULL)
1952 1.163 atatat flags &= ~CTLFLAG_PERMANENT;
1953 1.145 dsl
1954 1.145 dsl /*
1955 1.153 atatat * where do we put it?
1956 1.145 dsl */
1957 1.153 atatat va_start(ap, newlen);
1958 1.153 atatat namelen = 0;
1959 1.153 atatat ni = -1;
1960 1.153 atatat do {
1961 1.153 atatat if (++ni == CTL_MAXNAME)
1962 1.153 atatat return (ENAMETOOLONG);
1963 1.153 atatat name[ni] = va_arg(ap, int);
1964 1.153 atatat /*
1965 1.153 atatat * sorry, this is not supported from here
1966 1.153 atatat */
1967 1.153 atatat if (name[ni] == CTL_CREATESYM)
1968 1.153 atatat return (EINVAL);
1969 1.153 atatat } while (name[ni] != CTL_EOL && name[ni] != CTL_CREATE);
1970 1.153 atatat namelen = ni + (name[ni] == CTL_CREATE ? 1 : 0);
1971 1.153 atatat va_end(ap);
1972 1.69 simonb
1973 1.69 simonb /*
1974 1.153 atatat * what's it called
1975 1.69 simonb */
1976 1.184 peter if (strlcpy(nnode.sysctl_name, namep, sizeof(nnode.sysctl_name)) >=
1977 1.153 atatat sizeof(nnode.sysctl_name))
1978 1.153 atatat return (ENAMETOOLONG);
1979 1.69 simonb
1980 1.153 atatat /*
1981 1.153 atatat * cons up the description of the new node
1982 1.153 atatat */
1983 1.153 atatat nnode.sysctl_num = name[namelen - 1];
1984 1.153 atatat name[namelen - 1] = CTL_CREATE;
1985 1.153 atatat nnode.sysctl_size = newlen;
1986 1.153 atatat nnode.sysctl_flags = flags;
1987 1.153 atatat if (type == CTLTYPE_NODE) {
1988 1.153 atatat nnode.sysctl_csize = 0;
1989 1.153 atatat nnode.sysctl_clen = 0;
1990 1.153 atatat nnode.sysctl_child = NULL;
1991 1.161 atatat if (flags & CTLFLAG_ALIAS)
1992 1.153 atatat nnode.sysctl_alias = qv;
1993 1.188 yamt } else if (flags & CTLFLAG_IMMEDIATE) {
1994 1.153 atatat switch (type) {
1995 1.215 matt case CTLTYPE_BOOL:
1996 1.215 matt nnode.sysctl_bdata = qv;
1997 1.215 matt break;
1998 1.153 atatat case CTLTYPE_INT:
1999 1.153 atatat nnode.sysctl_idata = qv;
2000 1.153 atatat break;
2001 1.153 atatat case CTLTYPE_QUAD:
2002 1.153 atatat nnode.sysctl_qdata = qv;
2003 1.153 atatat break;
2004 1.153 atatat default:
2005 1.153 atatat return (EINVAL);
2006 1.153 atatat }
2007 1.188 yamt } else {
2008 1.153 atatat nnode.sysctl_data = newp;
2009 1.69 simonb }
2010 1.153 atatat nnode.sysctl_func = func;
2011 1.153 atatat nnode.sysctl_parent = NULL;
2012 1.153 atatat nnode.sysctl_ver = 0;
2013 1.69 simonb
2014 1.153 atatat /*
2015 1.153 atatat * initialize lock state -- we need locks if the main tree has
2016 1.153 atatat * been marked as complete, but since we could be called from
2017 1.153 atatat * either there, or from a device driver (say, at device
2018 1.219 ad * insertion), or from a module (at module load time, say), we
2019 1.153 atatat * don't really want to "wait"...
2020 1.153 atatat */
2021 1.213 ad sysctl_lock(true);
2022 1.179 perry
2023 1.153 atatat /*
2024 1.153 atatat * locate the prospective parent of the new node, and if we
2025 1.153 atatat * find it, add the new node.
2026 1.153 atatat */
2027 1.153 atatat sz = sizeof(onode);
2028 1.169 atatat pnode = root;
2029 1.153 atatat error = sysctl_locate(NULL, &name[0], namelen - 1, &pnode, &ni);
2030 1.161 atatat if (error) {
2031 1.175 atatat printf("sysctl_createv: sysctl_locate(%s) returned %d\n",
2032 1.175 atatat nnode.sysctl_name, error);
2033 1.213 ad sysctl_unlock();
2034 1.161 atatat return (error);
2035 1.161 atatat }
2036 1.161 atatat error = sysctl_create(&name[ni], namelen - ni, &onode, &sz,
2037 1.161 atatat &nnode, sizeof(nnode), &name[0], NULL,
2038 1.161 atatat pnode);
2039 1.72 simonb
2040 1.72 simonb /*
2041 1.153 atatat * unfortunately the node we wanted to create is already
2042 1.153 atatat * there. if the node that's already there is a reasonable
2043 1.153 atatat * facsimile of the node we wanted to create, just pretend
2044 1.153 atatat * (for the caller's benefit) that we managed to create the
2045 1.153 atatat * node they wanted.
2046 1.72 simonb */
2047 1.153 atatat if (error == EEXIST) {
2048 1.153 atatat /* name is the same as requested... */
2049 1.153 atatat if (strcmp(nnode.sysctl_name, onode.sysctl_name) == 0 &&
2050 1.153 atatat /* they want the same function... */
2051 1.153 atatat nnode.sysctl_func == onode.sysctl_func &&
2052 1.153 atatat /* number is the same as requested, or... */
2053 1.153 atatat (nnode.sysctl_num == onode.sysctl_num ||
2054 1.153 atatat /* they didn't pick a number... */
2055 1.153 atatat nnode.sysctl_num == CTL_CREATE)) {
2056 1.153 atatat /*
2057 1.153 atatat * collision here from trying to create
2058 1.153 atatat * something that already existed; let's give
2059 1.153 atatat * our customers a hand and tell them they got
2060 1.153 atatat * what they wanted.
2061 1.153 atatat */
2062 1.153 atatat #ifdef SYSCTL_DEBUG_CREATE
2063 1.153 atatat printf("cleared\n");
2064 1.153 atatat #endif /* SYSCTL_DEBUG_CREATE */
2065 1.153 atatat error = 0;
2066 1.153 atatat }
2067 1.72 simonb }
2068 1.72 simonb
2069 1.163 atatat if (error == 0 &&
2070 1.166 atatat (cnode != NULL || log != NULL || descr != NULL)) {
2071 1.153 atatat /*
2072 1.153 atatat * sysctl_create() gave us back a copy of the node,
2073 1.153 atatat * but we need to know where it actually is...
2074 1.153 atatat */
2075 1.169 atatat pnode = root;
2076 1.160 atatat error = sysctl_locate(NULL, &name[0], namelen - 1, &pnode, &ni);
2077 1.160 atatat
2078 1.160 atatat /*
2079 1.160 atatat * manual scan of last layer so that aliased nodes
2080 1.160 atatat * aren't followed.
2081 1.160 atatat */
2082 1.160 atatat if (error == 0) {
2083 1.160 atatat for (ni = 0; ni < pnode->sysctl_clen; ni++)
2084 1.160 atatat if (pnode->sysctl_child[ni].sysctl_num ==
2085 1.160 atatat onode.sysctl_num)
2086 1.160 atatat break;
2087 1.160 atatat if (ni < pnode->sysctl_clen)
2088 1.160 atatat pnode = &pnode->sysctl_child[ni];
2089 1.160 atatat else
2090 1.160 atatat error = ENOENT;
2091 1.160 atatat }
2092 1.160 atatat
2093 1.153 atatat /*
2094 1.153 atatat * not expecting an error here, but...
2095 1.153 atatat */
2096 1.161 atatat if (error == 0) {
2097 1.163 atatat if (log != NULL)
2098 1.163 atatat sysctl_log_add(log, pnode);
2099 1.161 atatat if (cnode != NULL)
2100 1.161 atatat *cnode = pnode;
2101 1.166 atatat if (descr != NULL) {
2102 1.171 atatat /*
2103 1.171 atatat * allow first caller to *set* a
2104 1.171 atatat * description actually to set it
2105 1.183 atatat *
2106 1.183 atatat * discard const here so we can attach
2107 1.183 atatat * the description
2108 1.171 atatat */
2109 1.183 atatat dnode = __UNCONST(pnode);
2110 1.171 atatat if (pnode->sysctl_desc != NULL)
2111 1.171 atatat /* skip it...we've got one */;
2112 1.171 atatat else if (flags & CTLFLAG_OWNDESC) {
2113 1.166 atatat size_t l = strlen(descr) + 1;
2114 1.166 atatat char *d = malloc(l, M_SYSCTLDATA,
2115 1.166 atatat M_WAITOK|M_CANFAIL);
2116 1.166 atatat if (d != NULL) {
2117 1.166 atatat memcpy(d, descr, l);
2118 1.183 atatat dnode->sysctl_desc = d;
2119 1.183 atatat dnode->sysctl_flags |=
2120 1.171 atatat CTLFLAG_OWNDESC;
2121 1.166 atatat }
2122 1.188 yamt } else
2123 1.183 atatat dnode->sysctl_desc = descr;
2124 1.166 atatat }
2125 1.188 yamt } else {
2126 1.161 atatat printf("sysctl_create succeeded but node not found?!\n");
2127 1.161 atatat /*
2128 1.161 atatat * confusing, but the create said it
2129 1.161 atatat * succeeded, so...
2130 1.161 atatat */
2131 1.161 atatat error = 0;
2132 1.161 atatat }
2133 1.72 simonb }
2134 1.72 simonb
2135 1.88 enami /*
2136 1.161 atatat * now it should be safe to release the lock state. note that
2137 1.161 atatat * the pointer to the newly created node being passed back may
2138 1.161 atatat * not be "good" for very long.
2139 1.88 enami */
2140 1.213 ad sysctl_unlock();
2141 1.88 enami
2142 1.153 atatat if (error != 0) {
2143 1.153 atatat printf("sysctl_createv: sysctl_create(%s) returned %d\n",
2144 1.153 atatat nnode.sysctl_name, error);
2145 1.153 atatat #if 0
2146 1.153 atatat if (error != ENOENT)
2147 1.153 atatat sysctl_dump(&onode);
2148 1.153 atatat #endif
2149 1.72 simonb }
2150 1.153 atatat
2151 1.72 simonb return (error);
2152 1.72 simonb }
2153 1.69 simonb
2154 1.153 atatat int
2155 1.153 atatat sysctl_destroyv(struct sysctlnode *rnode, ...)
2156 1.1 cgd {
2157 1.153 atatat va_list ap;
2158 1.153 atatat int error, name[CTL_MAXNAME], namelen, ni;
2159 1.183 atatat const struct sysctlnode *pnode, *node;
2160 1.183 atatat struct sysctlnode dnode, *onode;
2161 1.158 atatat size_t sz;
2162 1.153 atatat
2163 1.153 atatat va_start(ap, rnode);
2164 1.153 atatat namelen = 0;
2165 1.153 atatat ni = 0;
2166 1.153 atatat do {
2167 1.153 atatat if (ni == CTL_MAXNAME)
2168 1.153 atatat return (ENAMETOOLONG);
2169 1.153 atatat name[ni] = va_arg(ap, int);
2170 1.153 atatat } while (name[ni++] != CTL_EOL);
2171 1.153 atatat namelen = ni - 1;
2172 1.153 atatat va_end(ap);
2173 1.62 simonb
2174 1.153 atatat /*
2175 1.153 atatat * i can't imagine why we'd be destroying a node when the tree
2176 1.153 atatat * wasn't complete, but who knows?
2177 1.153 atatat */
2178 1.213 ad sysctl_lock(true);
2179 1.1 cgd
2180 1.153 atatat /*
2181 1.153 atatat * where is it?
2182 1.153 atatat */
2183 1.153 atatat node = rnode;
2184 1.160 atatat error = sysctl_locate(NULL, &name[0], namelen - 1, &node, &ni);
2185 1.153 atatat if (error) {
2186 1.153 atatat /* they want it gone and it's not there, so... */
2187 1.213 ad sysctl_unlock();
2188 1.153 atatat return (error == ENOENT ? 0 : error);
2189 1.62 simonb }
2190 1.41 thorpej
2191 1.153 atatat /*
2192 1.160 atatat * set up the deletion
2193 1.158 atatat */
2194 1.160 atatat pnode = node;
2195 1.160 atatat node = &dnode;
2196 1.160 atatat memset(&dnode, 0, sizeof(dnode));
2197 1.176 cube dnode.sysctl_flags = SYSCTL_VERSION;
2198 1.160 atatat dnode.sysctl_num = name[namelen - 1];
2199 1.158 atatat
2200 1.158 atatat /*
2201 1.153 atatat * we found it, now let's nuke it
2202 1.153 atatat */
2203 1.153 atatat name[namelen - 1] = CTL_DESTROY;
2204 1.158 atatat sz = 0;
2205 1.158 atatat error = sysctl_destroy(&name[namelen - 1], 1, NULL, &sz,
2206 1.153 atatat node, sizeof(*node), &name[0], NULL,
2207 1.153 atatat pnode);
2208 1.166 atatat if (error == ENOTEMPTY) {
2209 1.1 cgd /*
2210 1.153 atatat * think of trying to delete "foo" when "foo.bar"
2211 1.153 atatat * (which someone else put there) is still in
2212 1.153 atatat * existence
2213 1.1 cgd */
2214 1.153 atatat error = 0;
2215 1.1 cgd
2216 1.166 atatat /*
2217 1.166 atatat * dunno who put the description there, but if this
2218 1.166 atatat * node can ever be removed, we need to make sure the
2219 1.166 atatat * string doesn't go out of context. that means we
2220 1.166 atatat * need to find the node that's still there (don't use
2221 1.166 atatat * sysctl_locate() because that follows aliasing).
2222 1.166 atatat */
2223 1.166 atatat node = pnode->sysctl_child;
2224 1.166 atatat for (ni = 0; ni < pnode->sysctl_clen; ni++)
2225 1.166 atatat if (node[ni].sysctl_num == dnode.sysctl_num)
2226 1.166 atatat break;
2227 1.166 atatat node = (ni < pnode->sysctl_clen) ? &node[ni] : NULL;
2228 1.166 atatat
2229 1.166 atatat /*
2230 1.166 atatat * if we found it, and this node has a description,
2231 1.166 atatat * and this node can be released, and it doesn't
2232 1.166 atatat * already own its own description...sigh. :)
2233 1.166 atatat */
2234 1.166 atatat if (node != NULL && node->sysctl_desc != NULL &&
2235 1.166 atatat !(node->sysctl_flags & CTLFLAG_PERMANENT) &&
2236 1.166 atatat !(node->sysctl_flags & CTLFLAG_OWNDESC)) {
2237 1.166 atatat char *d;
2238 1.166 atatat
2239 1.166 atatat sz = strlen(node->sysctl_desc) + 1;
2240 1.166 atatat d = malloc(sz, M_SYSCTLDATA, M_WAITOK|M_CANFAIL);
2241 1.166 atatat if (d != NULL) {
2242 1.183 atatat /*
2243 1.183 atatat * discard const so that we can
2244 1.183 atatat * re-attach the description
2245 1.183 atatat */
2246 1.166 atatat memcpy(d, node->sysctl_desc, sz);
2247 1.183 atatat onode = __UNCONST(node);
2248 1.183 atatat onode->sysctl_desc = d;
2249 1.183 atatat onode->sysctl_flags |= CTLFLAG_OWNDESC;
2250 1.188 yamt } else {
2251 1.166 atatat /*
2252 1.166 atatat * XXX drop the description? be
2253 1.166 atatat * afraid? don't care?
2254 1.166 atatat */
2255 1.166 atatat }
2256 1.166 atatat }
2257 1.166 atatat }
2258 1.166 atatat
2259 1.213 ad sysctl_unlock();
2260 1.1 cgd
2261 1.153 atatat return (error);
2262 1.153 atatat }
2263 1.1 cgd
2264 1.123 thorpej /*
2265 1.153 atatat * ********************************************************************
2266 1.153 atatat * Deletes an entire n-ary tree. Not recommended unless you know why
2267 1.153 atatat * you're doing it. Personally, I don't know why you'd even think
2268 1.153 atatat * about it.
2269 1.153 atatat * ********************************************************************
2270 1.123 thorpej */
2271 1.153 atatat void
2272 1.153 atatat sysctl_free(struct sysctlnode *rnode)
2273 1.123 thorpej {
2274 1.153 atatat struct sysctlnode *node, *pnode;
2275 1.123 thorpej
2276 1.214 ad rw_enter(&sysctl_treelock, RW_WRITER);
2277 1.213 ad
2278 1.192 chris if (rnode == NULL)
2279 1.192 chris rnode = &sysctl_root;
2280 1.192 chris
2281 1.161 atatat if (SYSCTL_VERS(rnode->sysctl_flags) != SYSCTL_VERSION) {
2282 1.161 atatat printf("sysctl_free: rnode %p wrong version\n", rnode);
2283 1.214 ad rw_exit(&sysctl_treelock);
2284 1.161 atatat return;
2285 1.161 atatat }
2286 1.161 atatat
2287 1.153 atatat pnode = rnode;
2288 1.153 atatat
2289 1.153 atatat node = pnode->sysctl_child;
2290 1.153 atatat do {
2291 1.153 atatat while (node != NULL && pnode->sysctl_csize > 0) {
2292 1.153 atatat while (node <
2293 1.153 atatat &pnode->sysctl_child[pnode->sysctl_clen] &&
2294 1.153 atatat (SYSCTL_TYPE(node->sysctl_flags) !=
2295 1.153 atatat CTLTYPE_NODE ||
2296 1.153 atatat node->sysctl_csize == 0)) {
2297 1.153 atatat if (SYSCTL_FLAGS(node->sysctl_flags) &
2298 1.161 atatat CTLFLAG_OWNDATA) {
2299 1.153 atatat if (node->sysctl_data != NULL) {
2300 1.187 yamt free(node->sysctl_data,
2301 1.153 atatat M_SYSCTLDATA);
2302 1.153 atatat node->sysctl_data = NULL;
2303 1.153 atatat }
2304 1.153 atatat }
2305 1.166 atatat if (SYSCTL_FLAGS(node->sysctl_flags) &
2306 1.166 atatat CTLFLAG_OWNDESC) {
2307 1.166 atatat if (node->sysctl_desc != NULL) {
2308 1.180 christos /*XXXUNCONST*/
2309 1.187 yamt free(__UNCONST(node->sysctl_desc),
2310 1.166 atatat M_SYSCTLDATA);
2311 1.166 atatat node->sysctl_desc = NULL;
2312 1.166 atatat }
2313 1.166 atatat }
2314 1.153 atatat node++;
2315 1.153 atatat }
2316 1.153 atatat if (node < &pnode->sysctl_child[pnode->sysctl_clen]) {
2317 1.153 atatat pnode = node;
2318 1.153 atatat node = node->sysctl_child;
2319 1.188 yamt } else
2320 1.153 atatat break;
2321 1.153 atatat }
2322 1.153 atatat if (pnode->sysctl_child != NULL)
2323 1.187 yamt free(pnode->sysctl_child, M_SYSCTLNODE);
2324 1.153 atatat pnode->sysctl_clen = 0;
2325 1.153 atatat pnode->sysctl_csize = 0;
2326 1.153 atatat pnode->sysctl_child = NULL;
2327 1.153 atatat node = pnode;
2328 1.153 atatat pnode = node->sysctl_parent;
2329 1.158 atatat } while (pnode != NULL && node != rnode);
2330 1.214 ad
2331 1.214 ad rw_exit(&sysctl_treelock);
2332 1.123 thorpej }
2333 1.123 thorpej
2334 1.224 dyoung void
2335 1.224 dyoung sysctl_log_print(const struct sysctllog *slog)
2336 1.224 dyoung {
2337 1.224 dyoung int i, len;
2338 1.224 dyoung
2339 1.224 dyoung printf("root %p left %d size %d content", (const void *)slog->log_root,
2340 1.224 dyoung slog->log_left, slog->log_size);
2341 1.224 dyoung
2342 1.224 dyoung for (len = 0, i = slog->log_left; i < slog->log_size; i++) {
2343 1.224 dyoung switch (len) {
2344 1.224 dyoung case 0:
2345 1.224 dyoung len = -1;
2346 1.224 dyoung printf(" version %d", slog->log_num[i]);
2347 1.224 dyoung break;
2348 1.224 dyoung case -1:
2349 1.224 dyoung len = -2;
2350 1.224 dyoung printf(" type %d", slog->log_num[i]);
2351 1.224 dyoung break;
2352 1.224 dyoung case -2:
2353 1.224 dyoung len = slog->log_num[i];
2354 1.224 dyoung printf(" len %d:", slog->log_num[i]);
2355 1.224 dyoung if (len <= 0)
2356 1.224 dyoung len = -1;
2357 1.224 dyoung break;
2358 1.224 dyoung default:
2359 1.224 dyoung len--;
2360 1.224 dyoung printf(" %d", slog->log_num[i]);
2361 1.224 dyoung break;
2362 1.224 dyoung }
2363 1.224 dyoung }
2364 1.224 dyoung printf(" end\n");
2365 1.224 dyoung }
2366 1.224 dyoung
2367 1.163 atatat int
2368 1.183 atatat sysctl_log_add(struct sysctllog **logp, const struct sysctlnode *node)
2369 1.163 atatat {
2370 1.224 dyoung const int size0 = 16;
2371 1.163 atatat int name[CTL_MAXNAME], namelen, i;
2372 1.183 atatat const struct sysctlnode *pnode;
2373 1.163 atatat struct sysctllog *log;
2374 1.163 atatat
2375 1.163 atatat if (node->sysctl_flags & CTLFLAG_PERMANENT)
2376 1.163 atatat return (0);
2377 1.163 atatat
2378 1.163 atatat if (logp == NULL)
2379 1.163 atatat return (0);
2380 1.163 atatat
2381 1.163 atatat if (*logp == NULL) {
2382 1.187 yamt log = malloc(sizeof(struct sysctllog),
2383 1.163 atatat M_SYSCTLDATA, M_WAITOK|M_CANFAIL);
2384 1.163 atatat if (log == NULL) {
2385 1.163 atatat /* XXX print error message? */
2386 1.163 atatat return (-1);
2387 1.163 atatat }
2388 1.224 dyoung log->log_num = malloc(size0 * sizeof(int),
2389 1.163 atatat M_SYSCTLDATA, M_WAITOK|M_CANFAIL);
2390 1.163 atatat if (log->log_num == NULL) {
2391 1.163 atatat /* XXX print error message? */
2392 1.163 atatat free(log, M_SYSCTLDATA);
2393 1.163 atatat return (-1);
2394 1.163 atatat }
2395 1.224 dyoung memset(log->log_num, 0, size0 * sizeof(int));
2396 1.163 atatat log->log_root = NULL;
2397 1.224 dyoung log->log_size = size0;
2398 1.224 dyoung log->log_left = size0;
2399 1.163 atatat *logp = log;
2400 1.188 yamt } else
2401 1.163 atatat log = *logp;
2402 1.163 atatat
2403 1.163 atatat /*
2404 1.163 atatat * check that the root is proper. it's okay to record the
2405 1.163 atatat * address of the root of a tree. it's the only thing that's
2406 1.163 atatat * guaranteed not to shift around as nodes come and go.
2407 1.163 atatat */
2408 1.163 atatat if (log->log_root == NULL)
2409 1.163 atatat log->log_root = sysctl_rootof(node);
2410 1.163 atatat else if (log->log_root != sysctl_rootof(node)) {
2411 1.163 atatat printf("sysctl: log %p root mismatch (%p)\n",
2412 1.163 atatat log->log_root, sysctl_rootof(node));
2413 1.163 atatat return (-1);
2414 1.163 atatat }
2415 1.163 atatat
2416 1.163 atatat /*
2417 1.163 atatat * we will copy out name in reverse order
2418 1.163 atatat */
2419 1.163 atatat for (pnode = node, namelen = 0;
2420 1.163 atatat pnode != NULL && !(pnode->sysctl_flags & CTLFLAG_ROOT);
2421 1.163 atatat pnode = pnode->sysctl_parent)
2422 1.163 atatat name[namelen++] = pnode->sysctl_num;
2423 1.163 atatat
2424 1.163 atatat /*
2425 1.163 atatat * do we have space?
2426 1.163 atatat */
2427 1.163 atatat if (log->log_left < (namelen + 3))
2428 1.163 atatat sysctl_log_realloc(log);
2429 1.163 atatat if (log->log_left < (namelen + 3))
2430 1.163 atatat return (-1);
2431 1.163 atatat
2432 1.163 atatat /*
2433 1.163 atatat * stuff name in, then namelen, then node type, and finally,
2434 1.163 atatat * the version for non-node nodes.
2435 1.163 atatat */
2436 1.163 atatat for (i = 0; i < namelen; i++)
2437 1.163 atatat log->log_num[--log->log_left] = name[i];
2438 1.163 atatat log->log_num[--log->log_left] = namelen;
2439 1.163 atatat log->log_num[--log->log_left] = SYSCTL_TYPE(node->sysctl_flags);
2440 1.163 atatat if (log->log_num[log->log_left] != CTLTYPE_NODE)
2441 1.163 atatat log->log_num[--log->log_left] = node->sysctl_ver;
2442 1.163 atatat else
2443 1.163 atatat log->log_num[--log->log_left] = 0;
2444 1.163 atatat
2445 1.163 atatat return (0);
2446 1.163 atatat }
2447 1.163 atatat
2448 1.163 atatat void
2449 1.163 atatat sysctl_teardown(struct sysctllog **logp)
2450 1.163 atatat {
2451 1.183 atatat const struct sysctlnode *rnode;
2452 1.183 atatat struct sysctlnode node;
2453 1.163 atatat struct sysctllog *log;
2454 1.163 atatat uint namelen;
2455 1.163 atatat int *name, t, v, error, ni;
2456 1.163 atatat size_t sz;
2457 1.163 atatat
2458 1.163 atatat if (logp == NULL || *logp == NULL)
2459 1.163 atatat return;
2460 1.163 atatat log = *logp;
2461 1.163 atatat
2462 1.213 ad rw_enter(&sysctl_treelock, RW_WRITER);
2463 1.163 atatat memset(&node, 0, sizeof(node));
2464 1.163 atatat
2465 1.163 atatat while (log->log_left < log->log_size) {
2466 1.163 atatat KASSERT((log->log_left + 3 < log->log_size) &&
2467 1.163 atatat (log->log_left + log->log_num[log->log_left + 2] <=
2468 1.163 atatat log->log_size));
2469 1.163 atatat v = log->log_num[log->log_left++];
2470 1.163 atatat t = log->log_num[log->log_left++];
2471 1.163 atatat namelen = log->log_num[log->log_left++];
2472 1.163 atatat name = &log->log_num[log->log_left];
2473 1.163 atatat
2474 1.163 atatat node.sysctl_num = name[namelen - 1];
2475 1.168 atatat node.sysctl_flags = SYSCTL_VERSION|t;
2476 1.163 atatat node.sysctl_ver = v;
2477 1.163 atatat
2478 1.163 atatat rnode = log->log_root;
2479 1.163 atatat error = sysctl_locate(NULL, &name[0], namelen, &rnode, &ni);
2480 1.163 atatat if (error == 0) {
2481 1.163 atatat name[namelen - 1] = CTL_DESTROY;
2482 1.163 atatat rnode = rnode->sysctl_parent;
2483 1.163 atatat sz = 0;
2484 1.163 atatat (void)sysctl_destroy(&name[namelen - 1], 1, NULL,
2485 1.163 atatat &sz, &node, sizeof(node),
2486 1.163 atatat &name[0], NULL, rnode);
2487 1.163 atatat }
2488 1.163 atatat
2489 1.163 atatat log->log_left += namelen;
2490 1.163 atatat }
2491 1.163 atatat
2492 1.163 atatat KASSERT(log->log_size == log->log_left);
2493 1.163 atatat free(log->log_num, M_SYSCTLDATA);
2494 1.163 atatat free(log, M_SYSCTLDATA);
2495 1.163 atatat *logp = NULL;
2496 1.163 atatat
2497 1.213 ad rw_exit(&sysctl_treelock);
2498 1.163 atatat }
2499 1.163 atatat
2500 1.1 cgd /*
2501 1.153 atatat * ********************************************************************
2502 1.153 atatat * old_sysctl -- A routine to bridge old-style internal calls to the
2503 1.153 atatat * new infrastructure.
2504 1.153 atatat * ********************************************************************
2505 1.1 cgd */
2506 1.153 atatat int
2507 1.153 atatat old_sysctl(int *name, u_int namelen, void *oldp, size_t *oldlenp,
2508 1.153 atatat void *newp, size_t newlen, struct lwp *l)
2509 1.1 cgd {
2510 1.153 atatat int error;
2511 1.186 yamt size_t oldlen = 0;
2512 1.186 yamt size_t savelen;
2513 1.186 yamt
2514 1.186 yamt if (oldlenp) {
2515 1.186 yamt oldlen = *oldlenp;
2516 1.186 yamt }
2517 1.186 yamt savelen = oldlen;
2518 1.179 perry
2519 1.213 ad sysctl_lock(newp != NULL);
2520 1.186 yamt error = sysctl_dispatch(name, namelen, oldp, &oldlen,
2521 1.153 atatat newp, newlen, name, l, NULL);
2522 1.213 ad sysctl_unlock();
2523 1.186 yamt if (error == 0 && oldp != NULL && savelen < oldlen)
2524 1.153 atatat error = ENOMEM;
2525 1.186 yamt if (oldlenp) {
2526 1.186 yamt *oldlenp = oldlen;
2527 1.186 yamt }
2528 1.186 yamt
2529 1.153 atatat return (error);
2530 1.62 simonb }
2531 1.62 simonb
2532 1.62 simonb /*
2533 1.153 atatat * ********************************************************************
2534 1.153 atatat * Section 4: Generic helper routines
2535 1.153 atatat * ********************************************************************
2536 1.153 atatat * "helper" routines that can do more finely grained access control,
2537 1.153 atatat * construct structures from disparate information, create the
2538 1.153 atatat * appearance of more nodes and sub-trees, etc. for example, if
2539 1.153 atatat * CTL_PROC wanted a helper function, it could respond to a CTL_QUERY
2540 1.153 atatat * with a dynamically created list of nodes that represented the
2541 1.153 atatat * currently running processes at that instant.
2542 1.153 atatat * ********************************************************************
2543 1.153 atatat */
2544 1.123 thorpej
2545 1.123 thorpej /*
2546 1.153 atatat * first, a few generic helpers that provide:
2547 1.153 atatat *
2548 1.153 atatat * sysctl_needfunc() a readonly interface that emits a warning
2549 1.153 atatat * sysctl_notavail() returns EOPNOTSUPP (generic error)
2550 1.153 atatat * sysctl_null() an empty return buffer with no error
2551 1.123 thorpej */
2552 1.62 simonb int
2553 1.153 atatat sysctl_needfunc(SYSCTLFN_ARGS)
2554 1.62 simonb {
2555 1.153 atatat int error;
2556 1.153 atatat
2557 1.153 atatat printf("!!SYSCTL_NEEDFUNC!!\n");
2558 1.62 simonb
2559 1.153 atatat if (newp != NULL || namelen != 0)
2560 1.153 atatat return (EOPNOTSUPP);
2561 1.62 simonb
2562 1.153 atatat error = 0;
2563 1.153 atatat if (oldp != NULL)
2564 1.153 atatat error = sysctl_copyout(l, rnode->sysctl_data, oldp,
2565 1.153 atatat MIN(rnode->sysctl_size, *oldlenp));
2566 1.153 atatat *oldlenp = rnode->sysctl_size;
2567 1.62 simonb
2568 1.153 atatat return (error);
2569 1.153 atatat }
2570 1.62 simonb
2571 1.153 atatat int
2572 1.153 atatat sysctl_notavail(SYSCTLFN_ARGS)
2573 1.153 atatat {
2574 1.62 simonb
2575 1.155 atatat if (namelen == 1 && name[0] == CTL_QUERY)
2576 1.182 atatat return (sysctl_query(SYSCTLFN_CALL(rnode)));
2577 1.155 atatat
2578 1.153 atatat return (EOPNOTSUPP);
2579 1.153 atatat }
2580 1.62 simonb
2581 1.153 atatat int
2582 1.153 atatat sysctl_null(SYSCTLFN_ARGS)
2583 1.153 atatat {
2584 1.62 simonb
2585 1.153 atatat *oldlenp = 0;
2586 1.123 thorpej
2587 1.153 atatat return (0);
2588 1.153 atatat }
2589 1.67 simonb
/*
 * Translate the bits of "word" through a table of { from, to } pairs.
 * The table ends at the first pair whose "from" mask is zero.  For
 * every pair whose "from" mask shares a bit with "word", the "to"
 * mask is OR'ed into the result.
 */
u_int
sysctl_map_flags(const u_int *map, u_int word)
{
	const u_int *pair = map;
	u_int out = 0;

	while (pair[0] != 0) {
		if (word & pair[0])
			out |= pair[1];
		pair += 2;
	}

	return out;
}
2601 1.230 pooka
2602 1.153 atatat /*
2603 1.153 atatat * ********************************************************************
2604 1.153 atatat * Section 5: The machinery that makes it all go
2605 1.153 atatat * ********************************************************************
2606 1.153 atatat * Memory "manglement" routines. Not much to this, eh?
2607 1.153 atatat * ********************************************************************
2608 1.153 atatat */
2609 1.153 atatat static int
2610 1.153 atatat sysctl_alloc(struct sysctlnode *p, int x)
2611 1.153 atatat {
2612 1.153 atatat int i;
2613 1.153 atatat struct sysctlnode *n;
2614 1.62 simonb
2615 1.153 atatat assert(p->sysctl_child == NULL);
2616 1.62 simonb
2617 1.153 atatat if (x == 1)
2618 1.187 yamt n = malloc(sizeof(struct sysctlnode),
2619 1.153 atatat M_SYSCTLNODE, M_WAITOK|M_CANFAIL);
2620 1.62 simonb else
2621 1.187 yamt n = malloc(SYSCTL_DEFSIZE * sizeof(struct sysctlnode),
2622 1.153 atatat M_SYSCTLNODE, M_WAITOK|M_CANFAIL);
2623 1.153 atatat if (n == NULL)
2624 1.153 atatat return (ENOMEM);
2625 1.153 atatat
2626 1.153 atatat if (x == 1) {
2627 1.153 atatat memset(n, 0, sizeof(struct sysctlnode));
2628 1.153 atatat p->sysctl_csize = 1;
2629 1.188 yamt } else {
2630 1.153 atatat memset(n, 0, SYSCTL_DEFSIZE * sizeof(struct sysctlnode));
2631 1.153 atatat p->sysctl_csize = SYSCTL_DEFSIZE;
2632 1.62 simonb }
2633 1.153 atatat p->sysctl_clen = 0;
2634 1.62 simonb
2635 1.153 atatat for (i = 0; i < p->sysctl_csize; i++)
2636 1.153 atatat n[i].sysctl_parent = p;
2637 1.62 simonb
2638 1.153 atatat p->sysctl_child = n;
2639 1.153 atatat return (0);
2640 1.1 cgd }
2641 1.78 jdolecek
2642 1.78 jdolecek static int
2643 1.153 atatat sysctl_realloc(struct sysctlnode *p)
2644 1.78 jdolecek {
2645 1.224 dyoung int i, j, olen;
2646 1.153 atatat struct sysctlnode *n;
2647 1.78 jdolecek
2648 1.153 atatat assert(p->sysctl_csize == p->sysctl_clen);
2649 1.78 jdolecek
2650 1.153 atatat /*
2651 1.153 atatat * how many do we have...how many should we make?
2652 1.153 atatat */
2653 1.224 dyoung olen = p->sysctl_clen;
2654 1.224 dyoung n = malloc(2 * olen * sizeof(struct sysctlnode), M_SYSCTLNODE,
2655 1.153 atatat M_WAITOK|M_CANFAIL);
2656 1.153 atatat if (n == NULL)
2657 1.153 atatat return (ENOMEM);
2658 1.78 jdolecek
2659 1.153 atatat /*
2660 1.153 atatat * move old children over...initialize new children
2661 1.153 atatat */
2662 1.224 dyoung memcpy(n, p->sysctl_child, olen * sizeof(struct sysctlnode));
2663 1.224 dyoung memset(&n[olen], 0, olen * sizeof(struct sysctlnode));
2664 1.224 dyoung p->sysctl_csize = 2 * olen;
2665 1.78 jdolecek
2666 1.153 atatat /*
2667 1.153 atatat * reattach moved (and new) children to parent; if a moved
2668 1.153 atatat * child node has children, reattach the parent pointers of
2669 1.153 atatat * grandchildren
2670 1.153 atatat */
2671 1.153 atatat for (i = 0; i < p->sysctl_csize; i++) {
2672 1.153 atatat n[i].sysctl_parent = p;
2673 1.153 atatat if (n[i].sysctl_child != NULL) {
2674 1.153 atatat for (j = 0; j < n[i].sysctl_csize; j++)
2675 1.153 atatat n[i].sysctl_child[j].sysctl_parent = &n[i];
2676 1.153 atatat }
2677 1.78 jdolecek }
2678 1.78 jdolecek
2679 1.153 atatat /*
2680 1.153 atatat * get out with the old and in with the new
2681 1.153 atatat */
2682 1.187 yamt free(p->sysctl_child, M_SYSCTLNODE);
2683 1.153 atatat p->sysctl_child = n;
2684 1.100 simonb
2685 1.153 atatat return (0);
2686 1.100 simonb }
2687 1.162 atatat
2688 1.163 atatat static int
2689 1.163 atatat sysctl_log_realloc(struct sysctllog *log)
2690 1.163 atatat {
2691 1.163 atatat int *n, s, d;
2692 1.163 atatat
2693 1.163 atatat s = log->log_size * 2;
2694 1.163 atatat d = log->log_size;
2695 1.163 atatat
2696 1.163 atatat n = malloc(s * sizeof(int), M_SYSCTLDATA, M_WAITOK|M_CANFAIL);
2697 1.163 atatat if (n == NULL)
2698 1.163 atatat return (-1);
2699 1.163 atatat
2700 1.163 atatat memset(n, 0, s * sizeof(int));
2701 1.163 atatat memcpy(&n[d], log->log_num, d * sizeof(int));
2702 1.163 atatat free(log->log_num, M_SYSCTLDATA);
2703 1.163 atatat log->log_num = n;
2704 1.163 atatat if (d)
2705 1.163 atatat log->log_left += d;
2706 1.163 atatat else
2707 1.163 atatat log->log_left = s;
2708 1.163 atatat log->log_size = s;
2709 1.163 atatat
2710 1.163 atatat return (0);
2711 1.163 atatat }
2712 1.163 atatat
2713 1.162 atatat /*
2714 1.162 atatat * ********************************************************************
2715 1.162 atatat * Section 6: Conversion between API versions wrt the sysctlnode
2716 1.162 atatat * ********************************************************************
2717 1.162 atatat */
2718 1.162 atatat static int
2719 1.162 atatat sysctl_cvt_in(struct lwp *l, int *vp, const void *i, size_t sz,
2720 1.162 atatat struct sysctlnode *node)
2721 1.162 atatat {
2722 1.162 atatat int error, flags;
2723 1.162 atatat
2724 1.172 atatat if (i == NULL || sz < sizeof(flags))
2725 1.162 atatat return (EINVAL);
2726 1.162 atatat
2727 1.162 atatat error = sysctl_copyin(l, i, &flags, sizeof(flags));
2728 1.162 atatat if (error)
2729 1.162 atatat return (error);
2730 1.162 atatat
2731 1.164 atatat #if (SYSCTL_VERSION != SYSCTL_VERS_1)
2732 1.164 atatat #error sysctl_cvt_in: no support for SYSCTL_VERSION
2733 1.164 atatat #endif /* (SYSCTL_VERSION != SYSCTL_VERS_1) */
2734 1.164 atatat
2735 1.162 atatat if (sz == sizeof(*node) &&
2736 1.162 atatat SYSCTL_VERS(flags) == SYSCTL_VERSION) {
2737 1.162 atatat error = sysctl_copyin(l, i, node, sizeof(*node));
2738 1.162 atatat if (error)
2739 1.162 atatat return (error);
2740 1.162 atatat *vp = SYSCTL_VERSION;
2741 1.162 atatat return (0);
2742 1.162 atatat }
2743 1.162 atatat
2744 1.162 atatat return (EINVAL);
2745 1.162 atatat }
2746 1.162 atatat
2747 1.162 atatat static int
2748 1.162 atatat sysctl_cvt_out(struct lwp *l, int v, const struct sysctlnode *i,
2749 1.162 atatat void *ovp, size_t left, size_t *szp)
2750 1.162 atatat {
2751 1.162 atatat size_t sz = sizeof(*i);
2752 1.162 atatat const void *src = i;
2753 1.162 atatat int error;
2754 1.162 atatat
2755 1.162 atatat switch (v) {
2756 1.164 atatat case SYSCTL_VERS_0:
2757 1.172 atatat return (EINVAL);
2758 1.164 atatat
2759 1.164 atatat #if (SYSCTL_VERSION != SYSCTL_VERS_1)
2760 1.164 atatat #error sysctl_cvt_out: no support for SYSCTL_VERSION
2761 1.164 atatat #endif /* (SYSCTL_VERSION != SYSCTL_VERS_1) */
2762 1.164 atatat
2763 1.162 atatat case SYSCTL_VERSION:
2764 1.162 atatat /* nothing more to do here */
2765 1.162 atatat break;
2766 1.162 atatat }
2767 1.162 atatat
2768 1.162 atatat if (ovp != NULL && left >= sz) {
2769 1.162 atatat error = sysctl_copyout(l, src, ovp, sz);
2770 1.162 atatat if (error)
2771 1.162 atatat return (error);
2772 1.162 atatat }
2773 1.162 atatat
2774 1.162 atatat if (szp != NULL)
2775 1.162 atatat *szp = sz;
2776 1.162 atatat
2777 1.162 atatat return (0);
2778 1.162 atatat }
2779