procfs_subr.c revision 1.32 1 1.32 ad /* $NetBSD: procfs_subr.c,v 1.32 2000/11/08 14:28:14 ad Exp $ */
2 1.13 cgd
3 1.1 pk /*
4 1.20 thorpej * Copyright (c) 1994 Christopher G. Demetriou. All rights reserved.
5 1.5 cgd * Copyright (c) 1993 Jan-Simon Pendry
6 1.11 mycroft * Copyright (c) 1993
7 1.11 mycroft * The Regents of the University of California. All rights reserved.
8 1.2 pk *
9 1.5 cgd * This code is derived from software contributed to Berkeley by
10 1.5 cgd * Jan-Simon Pendry.
11 1.5 cgd *
12 1.2 pk * Redistribution and use in source and binary forms, with or without
13 1.2 pk * modification, are permitted provided that the following conditions
14 1.2 pk * are met:
15 1.2 pk * 1. Redistributions of source code must retain the above copyright
16 1.2 pk * notice, this list of conditions and the following disclaimer.
17 1.2 pk * 2. Redistributions in binary form must reproduce the above copyright
18 1.2 pk * notice, this list of conditions and the following disclaimer in the
19 1.2 pk * documentation and/or other materials provided with the distribution.
20 1.2 pk * 3. All advertising materials mentioning features or use of this software
21 1.2 pk * must display the following acknowledgement:
22 1.5 cgd * This product includes software developed by the University of
23 1.5 cgd * California, Berkeley and its contributors.
24 1.5 cgd * 4. Neither the name of the University nor the names of its contributors
25 1.5 cgd * may be used to endorse or promote products derived from this software
26 1.5 cgd * without specific prior written permission.
27 1.5 cgd *
28 1.5 cgd * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
29 1.5 cgd * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
30 1.5 cgd * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
31 1.5 cgd * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
32 1.5 cgd * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
33 1.5 cgd * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
34 1.5 cgd * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
35 1.5 cgd * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
36 1.5 cgd * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
37 1.5 cgd * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
38 1.5 cgd * SUCH DAMAGE.
39 1.2 pk *
40 1.23 fvdl * @(#)procfs_subr.c 8.6 (Berkeley) 5/14/95
41 1.1 pk */
42 1.5 cgd
43 1.4 mycroft #include <sys/param.h>
44 1.4 mycroft #include <sys/systm.h>
45 1.4 mycroft #include <sys/time.h>
46 1.4 mycroft #include <sys/kernel.h>
47 1.4 mycroft #include <sys/proc.h>
48 1.4 mycroft #include <sys/vnode.h>
49 1.11 mycroft #include <sys/malloc.h>
50 1.18 mycroft #include <sys/stat.h>
51 1.18 mycroft
52 1.5 cgd #include <miscfs/procfs/procfs.h>
53 1.1 pk
54 1.29 fvdl void procfs_hashins __P((struct pfsnode *));
55 1.29 fvdl void procfs_hashrem __P((struct pfsnode *));
56 1.29 fvdl struct vnode *procfs_hashget __P((pid_t, pfstype, struct mount *));
57 1.29 fvdl
58 1.29 fvdl LIST_HEAD(pfs_hashhead, pfsnode) *pfs_hashtbl;
59 1.30 fvdl u_long pfs_ihash; /* size of hash table - 1 */
60 1.30 fvdl #define PFSPIDHASH(pid) (&pfs_hashtbl[(pid) & pfs_ihash])
61 1.29 fvdl
62 1.29 fvdl struct lock pfs_hashlock;
63 1.29 fvdl struct simplelock pfs_hash_slock;
64 1.1 pk
65 1.20 thorpej #define ISSET(t, f) ((t) & (f))
66 1.20 thorpej
67 1.1 pk /*
68 1.5 cgd * allocate a pfsnode/vnode pair. the vnode is
69 1.27 wrstuden * referenced, and locked.
70 1.5 cgd *
71 1.5 cgd * the pid, pfs_type, and mount point uniquely
72 1.5 cgd * identify a pfsnode. the mount point is needed
73 1.5 cgd * because someone might mount this filesystem
74 1.5 cgd * twice.
75 1.5 cgd *
76 1.5 cgd * all pfsnodes are maintained on a singly-linked
77 1.5 cgd * list. new nodes are only allocated when they cannot
78 1.5 cgd * be found on this list. entries on the list are
79 1.5 cgd * removed when the vfs reclaim entry is called.
80 1.5 cgd *
81 1.5 cgd * a single lock is kept for the entire list. this is
82 1.5 cgd * needed because the getnewvnode() function can block
83 1.5 cgd * waiting for a vnode to become free, in which case there
84 1.5 cgd * may be more than one process trying to get the same
85 1.5 cgd * vnode. this lock is only taken if we are going to
86 1.5 cgd * call getnewvnode, since the kernel itself is single-threaded.
87 1.5 cgd *
88 1.5 cgd * if an entry is found on the list, then call vget() to
89 1.5 cgd * take a reference. this is done because there may be
90 1.5 cgd * zero references to it and so it needs to removed from
91 1.5 cgd * the vnode free list.
92 1.1 pk */
93 1.11 mycroft int
94 1.5 cgd procfs_allocvp(mp, vpp, pid, pfs_type)
95 1.5 cgd struct mount *mp;
96 1.5 cgd struct vnode **vpp;
97 1.5 cgd long pid;
98 1.5 cgd pfstype pfs_type;
99 1.1 pk {
100 1.12 mycroft struct pfsnode *pfs;
101 1.12 mycroft struct vnode *vp;
102 1.5 cgd int error;
103 1.5 cgd
104 1.29 fvdl do {
105 1.29 fvdl if ((*vpp = procfs_hashget(pid, pfs_type, mp)) != NULL)
106 1.5 cgd return (0);
107 1.29 fvdl } while (lockmgr(&pfs_hashlock, LK_EXCLUSIVE|LK_SLEEPFAIL, 0));
108 1.1 pk
109 1.29 fvdl if ((error = getnewvnode(VT_PROCFS, mp, procfs_vnodeop_p, vpp)) != 0) {
110 1.29 fvdl *vpp = NULL;
111 1.29 fvdl lockmgr(&pfs_hashlock, LK_RELEASE, 0);
112 1.29 fvdl return (error);
113 1.5 cgd }
114 1.11 mycroft vp = *vpp;
115 1.5 cgd
116 1.11 mycroft MALLOC(pfs, void *, sizeof(struct pfsnode), M_TEMP, M_WAITOK);
117 1.11 mycroft vp->v_data = pfs;
118 1.5 cgd
119 1.5 cgd pfs->pfs_pid = (pid_t) pid;
120 1.5 cgd pfs->pfs_type = pfs_type;
121 1.11 mycroft pfs->pfs_vnode = vp;
122 1.5 cgd pfs->pfs_flags = 0;
123 1.5 cgd pfs->pfs_fileno = PROCFS_FILENO(pid, pfs_type);
124 1.5 cgd
125 1.5 cgd switch (pfs_type) {
126 1.11 mycroft case Proot: /* /proc = dr-xr-xr-x */
127 1.17 mycroft pfs->pfs_mode = S_IRUSR|S_IXUSR|S_IRGRP|S_IXGRP|S_IROTH|S_IXOTH;
128 1.11 mycroft vp->v_type = VDIR;
129 1.11 mycroft vp->v_flag = VROOT;
130 1.11 mycroft break;
131 1.11 mycroft
132 1.22 mycroft case Pcurproc: /* /proc/curproc = lr-xr-xr-x */
133 1.28 thorpej case Pself: /* /proc/self = lr-xr-xr-x */
134 1.22 mycroft pfs->pfs_mode = S_IRUSR|S_IXUSR|S_IRGRP|S_IXGRP|S_IROTH|S_IXOTH;
135 1.11 mycroft vp->v_type = VLNK;
136 1.5 cgd break;
137 1.5 cgd
138 1.17 mycroft case Pproc: /* /proc/N = dr-xr-xr-x */
139 1.17 mycroft pfs->pfs_mode = S_IRUSR|S_IXUSR|S_IRGRP|S_IXGRP|S_IROTH|S_IXOTH;
140 1.6 ws vp->v_type = VDIR;
141 1.5 cgd break;
142 1.5 cgd
143 1.17 mycroft case Pfile: /* /proc/N/file = -rw------- */
144 1.17 mycroft case Pmem: /* /proc/N/mem = -rw------- */
145 1.17 mycroft case Pregs: /* /proc/N/regs = -rw------- */
146 1.17 mycroft case Pfpregs: /* /proc/N/fpregs = -rw------- */
147 1.17 mycroft pfs->pfs_mode = S_IRUSR|S_IWUSR;
148 1.9 cgd vp->v_type = VREG;
149 1.9 cgd break;
150 1.9 cgd
151 1.17 mycroft case Pctl: /* /proc/N/ctl = --w------ */
152 1.17 mycroft case Pnote: /* /proc/N/note = --w------ */
153 1.17 mycroft case Pnotepg: /* /proc/N/notepg = --w------ */
154 1.17 mycroft pfs->pfs_mode = S_IWUSR;
155 1.6 ws vp->v_type = VREG;
156 1.5 cgd break;
157 1.5 cgd
158 1.25 msaitoh case Pmap: /* /proc/N/map = -r--r--r-- */
159 1.17 mycroft case Pstatus: /* /proc/N/status = -r--r--r-- */
160 1.26 christos case Pcmdline: /* /proc/N/cmdline = -r--r--r-- */
161 1.17 mycroft pfs->pfs_mode = S_IRUSR|S_IRGRP|S_IROTH;
162 1.6 ws vp->v_type = VREG;
163 1.5 cgd break;
164 1.5 cgd
165 1.5 cgd default:
166 1.11 mycroft panic("procfs_allocvp");
167 1.5 cgd }
168 1.27 wrstuden
169 1.29 fvdl procfs_hashins(pfs);
170 1.29 fvdl lockmgr(&pfs_hashlock, LK_RELEASE, 0);
171 1.1 pk
172 1.5 cgd return (error);
173 1.1 pk }
174 1.1 pk
175 1.11 mycroft int
176 1.5 cgd procfs_freevp(vp)
177 1.5 cgd struct vnode *vp;
178 1.1 pk {
179 1.5 cgd struct pfsnode *pfs = VTOPFS(vp);
180 1.5 cgd
181 1.29 fvdl procfs_hashrem(pfs);
182 1.1 pk
183 1.11 mycroft FREE(vp->v_data, M_TEMP);
184 1.11 mycroft vp->v_data = 0;
185 1.5 cgd return (0);
186 1.1 pk }
187 1.1 pk
188 1.11 mycroft int
189 1.15 christos procfs_rw(v)
190 1.15 christos void *v;
191 1.1 pk {
192 1.15 christos struct vop_read_args *ap = v;
193 1.11 mycroft struct vnode *vp = ap->a_vp;
194 1.11 mycroft struct uio *uio = ap->a_uio;
195 1.5 cgd struct proc *curp = uio->uio_procp;
196 1.5 cgd struct pfsnode *pfs = VTOPFS(vp);
197 1.5 cgd struct proc *p;
198 1.5 cgd
199 1.5 cgd p = PFIND(pfs->pfs_pid);
200 1.5 cgd if (p == 0)
201 1.1 pk return (EINVAL);
202 1.19 mycroft
203 1.19 mycroft switch (pfs->pfs_type) {
204 1.19 mycroft case Pregs:
205 1.19 mycroft case Pfpregs:
206 1.19 mycroft case Pmem:
207 1.19 mycroft /*
208 1.19 mycroft * Do not allow init to be modified while in secure mode; it
209 1.19 mycroft * could be duped into changing the security level.
210 1.19 mycroft */
211 1.19 mycroft if (uio->uio_rw == UIO_WRITE &&
212 1.19 mycroft p == initproc && securelevel > -1)
213 1.19 mycroft return (EPERM);
214 1.19 mycroft break;
215 1.19 mycroft
216 1.19 mycroft default:
217 1.19 mycroft break;
218 1.19 mycroft }
219 1.1 pk
220 1.5 cgd switch (pfs->pfs_type) {
221 1.5 cgd case Pnote:
222 1.5 cgd case Pnotepg:
223 1.11 mycroft return (procfs_donote(curp, p, pfs, uio));
224 1.5 cgd
225 1.5 cgd case Pregs:
226 1.11 mycroft return (procfs_doregs(curp, p, pfs, uio));
227 1.9 cgd
228 1.9 cgd case Pfpregs:
229 1.11 mycroft return (procfs_dofpregs(curp, p, pfs, uio));
230 1.5 cgd
231 1.5 cgd case Pctl:
232 1.11 mycroft return (procfs_doctl(curp, p, pfs, uio));
233 1.5 cgd
234 1.5 cgd case Pstatus:
235 1.11 mycroft return (procfs_dostatus(curp, p, pfs, uio));
236 1.25 msaitoh
237 1.25 msaitoh case Pmap:
238 1.25 msaitoh return (procfs_domap(curp, p, pfs, uio));
239 1.1 pk
240 1.5 cgd case Pmem:
241 1.11 mycroft return (procfs_domem(curp, p, pfs, uio));
242 1.26 christos
243 1.26 christos case Pcmdline:
244 1.26 christos return (procfs_docmdline(curp, p, pfs, uio));
245 1.1 pk
246 1.5 cgd default:
247 1.5 cgd return (EOPNOTSUPP);
248 1.5 cgd }
249 1.1 pk }
250 1.1 pk
251 1.5 cgd /*
252 1.5 cgd * Get a string from userland into (buf). Strip a trailing
253 1.5 cgd * nl character (to allow easy access from the shell).
254 1.11 mycroft * The buffer should be *buflenp + 1 chars long. vfs_getuserstr
255 1.5 cgd * will automatically add a nul char at the end.
256 1.5 cgd *
257 1.5 cgd * Returns 0 on success or the following errors
258 1.5 cgd *
259 1.5 cgd * EINVAL: file offset is non-zero.
260 1.5 cgd * EMSGSIZE: message is longer than kernel buffer
261 1.5 cgd * EFAULT: user i/o buffer is not addressable
262 1.5 cgd */
263 1.11 mycroft int
264 1.11 mycroft vfs_getuserstr(uio, buf, buflenp)
265 1.5 cgd struct uio *uio;
266 1.5 cgd char *buf;
267 1.5 cgd int *buflenp;
268 1.1 pk {
269 1.5 cgd int xlen;
270 1.5 cgd int error;
271 1.5 cgd
272 1.11 mycroft if (uio->uio_offset != 0)
273 1.11 mycroft return (EINVAL);
274 1.11 mycroft
275 1.5 cgd xlen = *buflenp;
276 1.1 pk
277 1.5 cgd /* must be able to read the whole string in one go */
278 1.5 cgd if (xlen < uio->uio_resid)
279 1.5 cgd return (EMSGSIZE);
280 1.5 cgd xlen = uio->uio_resid;
281 1.5 cgd
282 1.14 christos if ((error = uiomove(buf, xlen, uio)) != 0)
283 1.5 cgd return (error);
284 1.5 cgd
285 1.11 mycroft /* allow multiple writes without seeks */
286 1.11 mycroft uio->uio_offset = 0;
287 1.11 mycroft
288 1.5 cgd /* cleanup string and remove trailing newline */
289 1.5 cgd buf[xlen] = '\0';
290 1.5 cgd xlen = strlen(buf);
291 1.5 cgd if (xlen > 0 && buf[xlen-1] == '\n')
292 1.5 cgd buf[--xlen] = '\0';
293 1.5 cgd *buflenp = xlen;
294 1.1 pk
295 1.5 cgd return (0);
296 1.1 pk }
297 1.1 pk
298 1.11 mycroft vfs_namemap_t *
299 1.11 mycroft vfs_findname(nm, buf, buflen)
300 1.11 mycroft vfs_namemap_t *nm;
301 1.5 cgd char *buf;
302 1.5 cgd int buflen;
303 1.1 pk {
304 1.11 mycroft
305 1.5 cgd for (; nm->nm_name; nm++)
306 1.24 perry if (memcmp(buf, nm->nm_name, buflen+1) == 0)
307 1.5 cgd return (nm);
308 1.5 cgd
309 1.5 cgd return (0);
310 1.29 fvdl }
311 1.29 fvdl
312 1.29 fvdl /*
313 1.29 fvdl * Initialize pfsnode hash table.
314 1.29 fvdl */
315 1.29 fvdl void
316 1.29 fvdl procfs_hashinit()
317 1.29 fvdl {
318 1.29 fvdl lockinit(&pfs_hashlock, PINOD, "pfs_hashlock", 0, 0);
319 1.32 ad pfs_hashtbl = hashinit(desiredvnodes / 4, HASH_LIST, M_UFSMNT,
320 1.32 ad M_WAITOK, &pfs_ihash);
321 1.29 fvdl simple_lock_init(&pfs_hash_slock);
322 1.31 jdolecek }
323 1.31 jdolecek
324 1.31 jdolecek /*
325 1.31 jdolecek * Free pfsnode hash table.
326 1.31 jdolecek */
327 1.31 jdolecek void
328 1.31 jdolecek procfs_hashdone()
329 1.31 jdolecek {
330 1.31 jdolecek hashdone(pfs_hashtbl, M_UFSMNT);
331 1.29 fvdl }
332 1.29 fvdl
333 1.29 fvdl struct vnode *
334 1.29 fvdl procfs_hashget(pid, type, mp)
335 1.29 fvdl pid_t pid;
336 1.29 fvdl pfstype type;
337 1.29 fvdl struct mount *mp;
338 1.29 fvdl {
339 1.29 fvdl struct pfsnode *pp;
340 1.29 fvdl struct vnode *vp;
341 1.29 fvdl
342 1.29 fvdl loop:
343 1.29 fvdl simple_lock(&pfs_hash_slock);
344 1.29 fvdl for (pp = PFSPIDHASH(pid)->lh_first; pp; pp = pp->pfs_hash.le_next) {
345 1.29 fvdl vp = PFSTOV(pp);
346 1.29 fvdl if (pid == pp->pfs_pid && pp->pfs_type == type &&
347 1.29 fvdl vp->v_mount == mp) {
348 1.29 fvdl simple_lock(&vp->v_interlock);
349 1.29 fvdl simple_unlock(&pfs_hash_slock);
350 1.29 fvdl if (vget(vp, LK_EXCLUSIVE | LK_INTERLOCK))
351 1.29 fvdl goto loop;
352 1.29 fvdl return (vp);
353 1.29 fvdl }
354 1.29 fvdl }
355 1.29 fvdl simple_unlock(&pfs_hash_slock);
356 1.29 fvdl return (NULL);
357 1.29 fvdl }
358 1.29 fvdl
359 1.29 fvdl /*
360 1.29 fvdl * Insert the pfsnode into the hash table and lock it.
361 1.29 fvdl */
362 1.29 fvdl void
363 1.29 fvdl procfs_hashins(pp)
364 1.29 fvdl struct pfsnode *pp;
365 1.29 fvdl {
366 1.29 fvdl struct pfs_hashhead *ppp;
367 1.29 fvdl
368 1.29 fvdl /* lock the pfsnode, then put it on the appropriate hash list */
369 1.29 fvdl lockmgr(&pp->pfs_vnode->v_lock, LK_EXCLUSIVE, (struct simplelock *)0);
370 1.29 fvdl
371 1.29 fvdl simple_lock(&pfs_hash_slock);
372 1.29 fvdl ppp = PFSPIDHASH(pp->pfs_pid);
373 1.29 fvdl LIST_INSERT_HEAD(ppp, pp, pfs_hash);
374 1.29 fvdl simple_unlock(&pfs_hash_slock);
375 1.29 fvdl }
376 1.29 fvdl
377 1.29 fvdl /*
378 1.29 fvdl * Remove the pfsnode from the hash table.
379 1.29 fvdl */
380 1.29 fvdl void
381 1.29 fvdl procfs_hashrem(pp)
382 1.29 fvdl struct pfsnode *pp;
383 1.29 fvdl {
384 1.29 fvdl simple_lock(&pfs_hash_slock);
385 1.29 fvdl LIST_REMOVE(pp, pfs_hash);
386 1.29 fvdl simple_unlock(&pfs_hash_slock);
387 1.29 fvdl }
388 1.29 fvdl
389 1.29 fvdl void
390 1.29 fvdl procfs_revoke_vnodes(p, arg)
391 1.29 fvdl struct proc *p;
392 1.29 fvdl void *arg;
393 1.29 fvdl {
394 1.29 fvdl struct pfsnode *pfs, *pnext;
395 1.29 fvdl struct vnode *vp;
396 1.29 fvdl struct mount *mp = (struct mount *)arg;
397 1.29 fvdl
398 1.29 fvdl if (!(p->p_flag & P_SUGID))
399 1.29 fvdl return;
400 1.29 fvdl
401 1.29 fvdl for (pfs = PFSPIDHASH(p->p_pid)->lh_first; pfs; pfs = pnext) {
402 1.29 fvdl vp = PFSTOV(pfs);
403 1.29 fvdl pnext = pfs->pfs_hash.le_next;
404 1.29 fvdl if (vp->v_usecount > 0 && pfs->pfs_pid == p->p_pid &&
405 1.29 fvdl vp->v_mount == mp)
406 1.29 fvdl VOP_REVOKE(vp, REVOKEALL);
407 1.29 fvdl }
408 1.1 pk }
409