procfs_subr.c revision 1.36 1 1.36 jdolecek /* $NetBSD: procfs_subr.c,v 1.36 2001/01/18 20:28:21 jdolecek Exp $ */
2 1.13 cgd
3 1.1 pk /*
4 1.20 thorpej * Copyright (c) 1994 Christopher G. Demetriou. All rights reserved.
5 1.5 cgd * Copyright (c) 1993 Jan-Simon Pendry
6 1.11 mycroft * Copyright (c) 1993
7 1.11 mycroft * The Regents of the University of California. All rights reserved.
8 1.2 pk *
9 1.5 cgd * This code is derived from software contributed to Berkeley by
10 1.5 cgd * Jan-Simon Pendry.
11 1.5 cgd *
12 1.2 pk * Redistribution and use in source and binary forms, with or without
13 1.2 pk * modification, are permitted provided that the following conditions
14 1.2 pk * are met:
15 1.2 pk * 1. Redistributions of source code must retain the above copyright
16 1.2 pk * notice, this list of conditions and the following disclaimer.
17 1.2 pk * 2. Redistributions in binary form must reproduce the above copyright
18 1.2 pk * notice, this list of conditions and the following disclaimer in the
19 1.2 pk * documentation and/or other materials provided with the distribution.
20 1.2 pk * 3. All advertising materials mentioning features or use of this software
21 1.2 pk * must display the following acknowledgement:
22 1.5 cgd * This product includes software developed by the University of
23 1.5 cgd * California, Berkeley and its contributors.
24 1.5 cgd * 4. Neither the name of the University nor the names of its contributors
25 1.5 cgd * may be used to endorse or promote products derived from this software
26 1.5 cgd * without specific prior written permission.
27 1.5 cgd *
28 1.5 cgd * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
29 1.5 cgd * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
30 1.5 cgd * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
31 1.5 cgd * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
32 1.5 cgd * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
33 1.5 cgd * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
34 1.5 cgd * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
35 1.5 cgd * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
36 1.5 cgd * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
37 1.5 cgd * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
38 1.5 cgd * SUCH DAMAGE.
39 1.2 pk *
40 1.23 fvdl * @(#)procfs_subr.c 8.6 (Berkeley) 5/14/95
41 1.1 pk */
42 1.5 cgd
43 1.4 mycroft #include <sys/param.h>
44 1.4 mycroft #include <sys/systm.h>
45 1.4 mycroft #include <sys/time.h>
46 1.4 mycroft #include <sys/kernel.h>
47 1.4 mycroft #include <sys/proc.h>
48 1.4 mycroft #include <sys/vnode.h>
49 1.11 mycroft #include <sys/malloc.h>
50 1.18 mycroft #include <sys/stat.h>
51 1.18 mycroft
52 1.5 cgd #include <miscfs/procfs/procfs.h>
53 1.1 pk
54 1.29 fvdl void procfs_hashins __P((struct pfsnode *));
55 1.29 fvdl void procfs_hashrem __P((struct pfsnode *));
56 1.29 fvdl struct vnode *procfs_hashget __P((pid_t, pfstype, struct mount *));
57 1.29 fvdl
58 1.29 fvdl LIST_HEAD(pfs_hashhead, pfsnode) *pfs_hashtbl;
59 1.30 fvdl u_long pfs_ihash; /* size of hash table - 1 */
60 1.30 fvdl #define PFSPIDHASH(pid) (&pfs_hashtbl[(pid) & pfs_ihash])
61 1.29 fvdl
62 1.29 fvdl struct lock pfs_hashlock;
63 1.29 fvdl struct simplelock pfs_hash_slock;
64 1.1 pk
65 1.20 thorpej #define ISSET(t, f) ((t) & (f))
66 1.20 thorpej
67 1.1 pk /*
68 1.5 cgd * allocate a pfsnode/vnode pair. the vnode is
69 1.27 wrstuden * referenced, and locked.
70 1.5 cgd *
71 1.5 cgd * the pid, pfs_type, and mount point uniquely
72 1.5 cgd * identify a pfsnode. the mount point is needed
73 1.5 cgd * because someone might mount this filesystem
74 1.5 cgd * twice.
75 1.5 cgd *
76 1.5 cgd * all pfsnodes are maintained on a singly-linked
77 1.5 cgd * list. new nodes are only allocated when they cannot
78 1.5 cgd * be found on this list. entries on the list are
79 1.5 cgd * removed when the vfs reclaim entry is called.
80 1.5 cgd *
81 1.5 cgd * a single lock is kept for the entire list. this is
82 1.5 cgd * needed because the getnewvnode() function can block
83 1.5 cgd * waiting for a vnode to become free, in which case there
84 1.5 cgd * may be more than one process trying to get the same
85 1.5 cgd * vnode. this lock is only taken if we are going to
86 1.5 cgd * call getnewvnode, since the kernel itself is single-threaded.
87 1.5 cgd *
88 1.5 cgd * if an entry is found on the list, then call vget() to
89 1.5 cgd * take a reference. this is done because there may be
90 1.5 cgd * zero references to it and so it needs to removed from
91 1.5 cgd * the vnode free list.
92 1.1 pk */
93 1.11 mycroft int
94 1.5 cgd procfs_allocvp(mp, vpp, pid, pfs_type)
95 1.5 cgd struct mount *mp;
96 1.5 cgd struct vnode **vpp;
97 1.5 cgd long pid;
98 1.5 cgd pfstype pfs_type;
99 1.1 pk {
100 1.12 mycroft struct pfsnode *pfs;
101 1.12 mycroft struct vnode *vp;
102 1.5 cgd int error;
103 1.5 cgd
104 1.29 fvdl do {
105 1.29 fvdl if ((*vpp = procfs_hashget(pid, pfs_type, mp)) != NULL)
106 1.5 cgd return (0);
107 1.29 fvdl } while (lockmgr(&pfs_hashlock, LK_EXCLUSIVE|LK_SLEEPFAIL, 0));
108 1.1 pk
109 1.29 fvdl if ((error = getnewvnode(VT_PROCFS, mp, procfs_vnodeop_p, vpp)) != 0) {
110 1.29 fvdl *vpp = NULL;
111 1.33 chs lockmgr(&pfs_hashlock, LK_RELEASE, NULL);
112 1.29 fvdl return (error);
113 1.5 cgd }
114 1.11 mycroft vp = *vpp;
115 1.5 cgd
116 1.11 mycroft MALLOC(pfs, void *, sizeof(struct pfsnode), M_TEMP, M_WAITOK);
117 1.11 mycroft vp->v_data = pfs;
118 1.5 cgd
119 1.5 cgd pfs->pfs_pid = (pid_t) pid;
120 1.5 cgd pfs->pfs_type = pfs_type;
121 1.11 mycroft pfs->pfs_vnode = vp;
122 1.5 cgd pfs->pfs_flags = 0;
123 1.5 cgd pfs->pfs_fileno = PROCFS_FILENO(pid, pfs_type);
124 1.5 cgd
125 1.5 cgd switch (pfs_type) {
126 1.11 mycroft case Proot: /* /proc = dr-xr-xr-x */
127 1.17 mycroft pfs->pfs_mode = S_IRUSR|S_IXUSR|S_IRGRP|S_IXGRP|S_IROTH|S_IXOTH;
128 1.11 mycroft vp->v_type = VDIR;
129 1.11 mycroft vp->v_flag = VROOT;
130 1.11 mycroft break;
131 1.11 mycroft
132 1.22 mycroft case Pcurproc: /* /proc/curproc = lr-xr-xr-x */
133 1.28 thorpej case Pself: /* /proc/self = lr-xr-xr-x */
134 1.22 mycroft pfs->pfs_mode = S_IRUSR|S_IXUSR|S_IRGRP|S_IXGRP|S_IROTH|S_IXOTH;
135 1.11 mycroft vp->v_type = VLNK;
136 1.5 cgd break;
137 1.5 cgd
138 1.17 mycroft case Pproc: /* /proc/N = dr-xr-xr-x */
139 1.17 mycroft pfs->pfs_mode = S_IRUSR|S_IXUSR|S_IRGRP|S_IXGRP|S_IROTH|S_IXOTH;
140 1.6 ws vp->v_type = VDIR;
141 1.5 cgd break;
142 1.5 cgd
143 1.17 mycroft case Pfile: /* /proc/N/file = -rw------- */
144 1.17 mycroft case Pmem: /* /proc/N/mem = -rw------- */
145 1.17 mycroft case Pregs: /* /proc/N/regs = -rw------- */
146 1.17 mycroft case Pfpregs: /* /proc/N/fpregs = -rw------- */
147 1.17 mycroft pfs->pfs_mode = S_IRUSR|S_IWUSR;
148 1.9 cgd vp->v_type = VREG;
149 1.9 cgd break;
150 1.9 cgd
151 1.17 mycroft case Pctl: /* /proc/N/ctl = --w------ */
152 1.17 mycroft case Pnote: /* /proc/N/note = --w------ */
153 1.17 mycroft case Pnotepg: /* /proc/N/notepg = --w------ */
154 1.17 mycroft pfs->pfs_mode = S_IWUSR;
155 1.6 ws vp->v_type = VREG;
156 1.5 cgd break;
157 1.5 cgd
158 1.25 msaitoh case Pmap: /* /proc/N/map = -r--r--r-- */
159 1.17 mycroft case Pstatus: /* /proc/N/status = -r--r--r-- */
160 1.26 christos case Pcmdline: /* /proc/N/cmdline = -r--r--r-- */
161 1.35 fvdl case Pmeminfo: /* /proc/meminfo = -r--r--r-- */
162 1.35 fvdl case Pcpuinfo: /* /proc/cpuinfo = -r--r--r-- */
163 1.17 mycroft pfs->pfs_mode = S_IRUSR|S_IRGRP|S_IROTH;
164 1.6 ws vp->v_type = VREG;
165 1.5 cgd break;
166 1.5 cgd
167 1.5 cgd default:
168 1.11 mycroft panic("procfs_allocvp");
169 1.5 cgd }
170 1.27 wrstuden
171 1.29 fvdl procfs_hashins(pfs);
172 1.34 chs uvm_vnp_setsize(vp, 0);
173 1.33 chs lockmgr(&pfs_hashlock, LK_RELEASE, NULL);
174 1.1 pk
175 1.5 cgd return (error);
176 1.1 pk }
177 1.1 pk
178 1.11 mycroft int
179 1.5 cgd procfs_freevp(vp)
180 1.5 cgd struct vnode *vp;
181 1.1 pk {
182 1.5 cgd struct pfsnode *pfs = VTOPFS(vp);
183 1.5 cgd
184 1.29 fvdl procfs_hashrem(pfs);
185 1.1 pk
186 1.11 mycroft FREE(vp->v_data, M_TEMP);
187 1.11 mycroft vp->v_data = 0;
188 1.5 cgd return (0);
189 1.1 pk }
190 1.1 pk
191 1.11 mycroft int
192 1.15 christos procfs_rw(v)
193 1.15 christos void *v;
194 1.1 pk {
195 1.15 christos struct vop_read_args *ap = v;
196 1.11 mycroft struct vnode *vp = ap->a_vp;
197 1.11 mycroft struct uio *uio = ap->a_uio;
198 1.5 cgd struct proc *curp = uio->uio_procp;
199 1.5 cgd struct pfsnode *pfs = VTOPFS(vp);
200 1.5 cgd struct proc *p;
201 1.5 cgd
202 1.5 cgd p = PFIND(pfs->pfs_pid);
203 1.5 cgd if (p == 0)
204 1.1 pk return (EINVAL);
205 1.19 mycroft
206 1.19 mycroft switch (pfs->pfs_type) {
207 1.19 mycroft case Pregs:
208 1.19 mycroft case Pfpregs:
209 1.19 mycroft case Pmem:
210 1.19 mycroft /*
211 1.19 mycroft * Do not allow init to be modified while in secure mode; it
212 1.19 mycroft * could be duped into changing the security level.
213 1.19 mycroft */
214 1.19 mycroft if (uio->uio_rw == UIO_WRITE &&
215 1.19 mycroft p == initproc && securelevel > -1)
216 1.19 mycroft return (EPERM);
217 1.19 mycroft break;
218 1.19 mycroft
219 1.19 mycroft default:
220 1.19 mycroft break;
221 1.19 mycroft }
222 1.1 pk
223 1.5 cgd switch (pfs->pfs_type) {
224 1.5 cgd case Pnote:
225 1.5 cgd case Pnotepg:
226 1.11 mycroft return (procfs_donote(curp, p, pfs, uio));
227 1.5 cgd
228 1.5 cgd case Pregs:
229 1.11 mycroft return (procfs_doregs(curp, p, pfs, uio));
230 1.9 cgd
231 1.9 cgd case Pfpregs:
232 1.11 mycroft return (procfs_dofpregs(curp, p, pfs, uio));
233 1.5 cgd
234 1.5 cgd case Pctl:
235 1.11 mycroft return (procfs_doctl(curp, p, pfs, uio));
236 1.5 cgd
237 1.5 cgd case Pstatus:
238 1.11 mycroft return (procfs_dostatus(curp, p, pfs, uio));
239 1.25 msaitoh
240 1.25 msaitoh case Pmap:
241 1.25 msaitoh return (procfs_domap(curp, p, pfs, uio));
242 1.1 pk
243 1.5 cgd case Pmem:
244 1.11 mycroft return (procfs_domem(curp, p, pfs, uio));
245 1.26 christos
246 1.26 christos case Pcmdline:
247 1.26 christos return (procfs_docmdline(curp, p, pfs, uio));
248 1.35 fvdl
249 1.35 fvdl case Pmeminfo:
250 1.35 fvdl return (procfs_domeminfo(curp, p, pfs, uio));
251 1.35 fvdl case Pcpuinfo:
252 1.35 fvdl return (procfs_docpuinfo(curp, p, pfs, uio));
253 1.1 pk
254 1.5 cgd default:
255 1.5 cgd return (EOPNOTSUPP);
256 1.5 cgd }
257 1.1 pk }
258 1.1 pk
259 1.5 cgd /*
260 1.5 cgd * Get a string from userland into (buf). Strip a trailing
261 1.5 cgd * nl character (to allow easy access from the shell).
262 1.11 mycroft * The buffer should be *buflenp + 1 chars long. vfs_getuserstr
263 1.5 cgd * will automatically add a nul char at the end.
264 1.5 cgd *
265 1.5 cgd * Returns 0 on success or the following errors
266 1.5 cgd *
267 1.5 cgd * EINVAL: file offset is non-zero.
268 1.5 cgd * EMSGSIZE: message is longer than kernel buffer
269 1.5 cgd * EFAULT: user i/o buffer is not addressable
270 1.5 cgd */
271 1.11 mycroft int
272 1.11 mycroft vfs_getuserstr(uio, buf, buflenp)
273 1.5 cgd struct uio *uio;
274 1.5 cgd char *buf;
275 1.5 cgd int *buflenp;
276 1.1 pk {
277 1.5 cgd int xlen;
278 1.5 cgd int error;
279 1.5 cgd
280 1.11 mycroft if (uio->uio_offset != 0)
281 1.11 mycroft return (EINVAL);
282 1.11 mycroft
283 1.5 cgd xlen = *buflenp;
284 1.1 pk
285 1.5 cgd /* must be able to read the whole string in one go */
286 1.5 cgd if (xlen < uio->uio_resid)
287 1.5 cgd return (EMSGSIZE);
288 1.5 cgd xlen = uio->uio_resid;
289 1.5 cgd
290 1.14 christos if ((error = uiomove(buf, xlen, uio)) != 0)
291 1.5 cgd return (error);
292 1.5 cgd
293 1.11 mycroft /* allow multiple writes without seeks */
294 1.11 mycroft uio->uio_offset = 0;
295 1.11 mycroft
296 1.5 cgd /* cleanup string and remove trailing newline */
297 1.5 cgd buf[xlen] = '\0';
298 1.5 cgd xlen = strlen(buf);
299 1.5 cgd if (xlen > 0 && buf[xlen-1] == '\n')
300 1.5 cgd buf[--xlen] = '\0';
301 1.5 cgd *buflenp = xlen;
302 1.1 pk
303 1.5 cgd return (0);
304 1.1 pk }
305 1.1 pk
306 1.36 jdolecek const vfs_namemap_t *
307 1.11 mycroft vfs_findname(nm, buf, buflen)
308 1.36 jdolecek const vfs_namemap_t *nm;
309 1.36 jdolecek const char *buf;
310 1.5 cgd int buflen;
311 1.1 pk {
312 1.11 mycroft
313 1.5 cgd for (; nm->nm_name; nm++)
314 1.24 perry if (memcmp(buf, nm->nm_name, buflen+1) == 0)
315 1.5 cgd return (nm);
316 1.5 cgd
317 1.5 cgd return (0);
318 1.29 fvdl }
319 1.29 fvdl
320 1.29 fvdl /*
321 1.29 fvdl * Initialize pfsnode hash table.
322 1.29 fvdl */
323 1.29 fvdl void
324 1.29 fvdl procfs_hashinit()
325 1.29 fvdl {
326 1.29 fvdl lockinit(&pfs_hashlock, PINOD, "pfs_hashlock", 0, 0);
327 1.32 ad pfs_hashtbl = hashinit(desiredvnodes / 4, HASH_LIST, M_UFSMNT,
328 1.32 ad M_WAITOK, &pfs_ihash);
329 1.29 fvdl simple_lock_init(&pfs_hash_slock);
330 1.31 jdolecek }
331 1.31 jdolecek
332 1.31 jdolecek /*
333 1.31 jdolecek * Free pfsnode hash table.
334 1.31 jdolecek */
335 1.31 jdolecek void
336 1.31 jdolecek procfs_hashdone()
337 1.31 jdolecek {
338 1.31 jdolecek hashdone(pfs_hashtbl, M_UFSMNT);
339 1.29 fvdl }
340 1.29 fvdl
341 1.29 fvdl struct vnode *
342 1.29 fvdl procfs_hashget(pid, type, mp)
343 1.29 fvdl pid_t pid;
344 1.29 fvdl pfstype type;
345 1.29 fvdl struct mount *mp;
346 1.29 fvdl {
347 1.29 fvdl struct pfsnode *pp;
348 1.29 fvdl struct vnode *vp;
349 1.29 fvdl
350 1.29 fvdl loop:
351 1.29 fvdl simple_lock(&pfs_hash_slock);
352 1.29 fvdl for (pp = PFSPIDHASH(pid)->lh_first; pp; pp = pp->pfs_hash.le_next) {
353 1.29 fvdl vp = PFSTOV(pp);
354 1.29 fvdl if (pid == pp->pfs_pid && pp->pfs_type == type &&
355 1.29 fvdl vp->v_mount == mp) {
356 1.29 fvdl simple_lock(&vp->v_interlock);
357 1.29 fvdl simple_unlock(&pfs_hash_slock);
358 1.29 fvdl if (vget(vp, LK_EXCLUSIVE | LK_INTERLOCK))
359 1.29 fvdl goto loop;
360 1.29 fvdl return (vp);
361 1.29 fvdl }
362 1.29 fvdl }
363 1.29 fvdl simple_unlock(&pfs_hash_slock);
364 1.29 fvdl return (NULL);
365 1.29 fvdl }
366 1.29 fvdl
367 1.29 fvdl /*
368 1.29 fvdl * Insert the pfsnode into the hash table and lock it.
369 1.29 fvdl */
370 1.29 fvdl void
371 1.29 fvdl procfs_hashins(pp)
372 1.29 fvdl struct pfsnode *pp;
373 1.29 fvdl {
374 1.29 fvdl struct pfs_hashhead *ppp;
375 1.29 fvdl
376 1.29 fvdl /* lock the pfsnode, then put it on the appropriate hash list */
377 1.29 fvdl lockmgr(&pp->pfs_vnode->v_lock, LK_EXCLUSIVE, (struct simplelock *)0);
378 1.29 fvdl
379 1.29 fvdl simple_lock(&pfs_hash_slock);
380 1.29 fvdl ppp = PFSPIDHASH(pp->pfs_pid);
381 1.29 fvdl LIST_INSERT_HEAD(ppp, pp, pfs_hash);
382 1.29 fvdl simple_unlock(&pfs_hash_slock);
383 1.29 fvdl }
384 1.29 fvdl
385 1.29 fvdl /*
386 1.29 fvdl * Remove the pfsnode from the hash table.
387 1.29 fvdl */
388 1.29 fvdl void
389 1.29 fvdl procfs_hashrem(pp)
390 1.29 fvdl struct pfsnode *pp;
391 1.29 fvdl {
392 1.29 fvdl simple_lock(&pfs_hash_slock);
393 1.29 fvdl LIST_REMOVE(pp, pfs_hash);
394 1.29 fvdl simple_unlock(&pfs_hash_slock);
395 1.29 fvdl }
396 1.29 fvdl
397 1.29 fvdl void
398 1.29 fvdl procfs_revoke_vnodes(p, arg)
399 1.29 fvdl struct proc *p;
400 1.29 fvdl void *arg;
401 1.29 fvdl {
402 1.29 fvdl struct pfsnode *pfs, *pnext;
403 1.29 fvdl struct vnode *vp;
404 1.29 fvdl struct mount *mp = (struct mount *)arg;
405 1.29 fvdl
406 1.29 fvdl if (!(p->p_flag & P_SUGID))
407 1.29 fvdl return;
408 1.29 fvdl
409 1.29 fvdl for (pfs = PFSPIDHASH(p->p_pid)->lh_first; pfs; pfs = pnext) {
410 1.29 fvdl vp = PFSTOV(pfs);
411 1.29 fvdl pnext = pfs->pfs_hash.le_next;
412 1.29 fvdl if (vp->v_usecount > 0 && pfs->pfs_pid == p->p_pid &&
413 1.29 fvdl vp->v_mount == mp)
414 1.29 fvdl VOP_REVOKE(vp, REVOKEALL);
415 1.29 fvdl }
416 1.1 pk }
417