procfs_subr.c revision 1.34 1 1.34 chs /* $NetBSD: procfs_subr.c,v 1.34 2000/11/27 08:39:46 chs Exp $ */
2 1.13 cgd
3 1.1 pk /*
4 1.20 thorpej * Copyright (c) 1994 Christopher G. Demetriou. All rights reserved.
5 1.5 cgd * Copyright (c) 1993 Jan-Simon Pendry
6 1.11 mycroft * Copyright (c) 1993
7 1.11 mycroft * The Regents of the University of California. All rights reserved.
8 1.2 pk *
9 1.5 cgd * This code is derived from software contributed to Berkeley by
10 1.5 cgd * Jan-Simon Pendry.
11 1.5 cgd *
12 1.2 pk * Redistribution and use in source and binary forms, with or without
13 1.2 pk * modification, are permitted provided that the following conditions
14 1.2 pk * are met:
15 1.2 pk * 1. Redistributions of source code must retain the above copyright
16 1.2 pk * notice, this list of conditions and the following disclaimer.
17 1.2 pk * 2. Redistributions in binary form must reproduce the above copyright
18 1.2 pk * notice, this list of conditions and the following disclaimer in the
19 1.2 pk * documentation and/or other materials provided with the distribution.
20 1.2 pk * 3. All advertising materials mentioning features or use of this software
21 1.2 pk * must display the following acknowledgement:
22 1.5 cgd * This product includes software developed by the University of
23 1.5 cgd * California, Berkeley and its contributors.
24 1.5 cgd * 4. Neither the name of the University nor the names of its contributors
25 1.5 cgd * may be used to endorse or promote products derived from this software
26 1.5 cgd * without specific prior written permission.
27 1.5 cgd *
28 1.5 cgd * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
29 1.5 cgd * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
30 1.5 cgd * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
31 1.5 cgd * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
32 1.5 cgd * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
33 1.5 cgd * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
34 1.5 cgd * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
35 1.5 cgd * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
36 1.5 cgd * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
37 1.5 cgd * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
38 1.5 cgd * SUCH DAMAGE.
39 1.2 pk *
40 1.23 fvdl * @(#)procfs_subr.c 8.6 (Berkeley) 5/14/95
41 1.1 pk */
42 1.5 cgd
43 1.4 mycroft #include <sys/param.h>
44 1.4 mycroft #include <sys/systm.h>
45 1.4 mycroft #include <sys/time.h>
46 1.4 mycroft #include <sys/kernel.h>
47 1.4 mycroft #include <sys/proc.h>
48 1.4 mycroft #include <sys/vnode.h>
49 1.11 mycroft #include <sys/malloc.h>
50 1.18 mycroft #include <sys/stat.h>
51 1.18 mycroft
52 1.5 cgd #include <miscfs/procfs/procfs.h>
53 1.1 pk
54 1.29 fvdl void procfs_hashins __P((struct pfsnode *));
55 1.29 fvdl void procfs_hashrem __P((struct pfsnode *));
56 1.29 fvdl struct vnode *procfs_hashget __P((pid_t, pfstype, struct mount *));
57 1.29 fvdl
58 1.29 fvdl LIST_HEAD(pfs_hashhead, pfsnode) *pfs_hashtbl;
59 1.30 fvdl u_long pfs_ihash; /* size of hash table - 1 */
60 1.30 fvdl #define PFSPIDHASH(pid) (&pfs_hashtbl[(pid) & pfs_ihash])
61 1.29 fvdl
62 1.29 fvdl struct lock pfs_hashlock;
63 1.29 fvdl struct simplelock pfs_hash_slock;
64 1.1 pk
65 1.20 thorpej #define ISSET(t, f) ((t) & (f))
66 1.20 thorpej
67 1.1 pk /*
68 1.5 cgd * allocate a pfsnode/vnode pair. the vnode is
69 1.27 wrstuden * referenced, and locked.
70 1.5 cgd *
71 1.5 cgd * the pid, pfs_type, and mount point uniquely
72 1.5 cgd * identify a pfsnode. the mount point is needed
73 1.5 cgd * because someone might mount this filesystem
74 1.5 cgd * twice.
75 1.5 cgd *
76 1.5 cgd * all pfsnodes are maintained on a singly-linked
77 1.5 cgd * list. new nodes are only allocated when they cannot
78 1.5 cgd * be found on this list. entries on the list are
79 1.5 cgd * removed when the vfs reclaim entry is called.
80 1.5 cgd *
81 1.5 cgd * a single lock is kept for the entire list. this is
82 1.5 cgd * needed because the getnewvnode() function can block
83 1.5 cgd * waiting for a vnode to become free, in which case there
84 1.5 cgd * may be more than one process trying to get the same
85 1.5 cgd * vnode. this lock is only taken if we are going to
86 1.5 cgd * call getnewvnode, since the kernel itself is single-threaded.
87 1.5 cgd *
88 1.5 cgd * if an entry is found on the list, then call vget() to
89 1.5 cgd * take a reference. this is done because there may be
90 1.5 cgd * zero references to it and so it needs to removed from
91 1.5 cgd * the vnode free list.
92 1.1 pk */
93 1.11 mycroft int
94 1.5 cgd procfs_allocvp(mp, vpp, pid, pfs_type)
95 1.5 cgd struct mount *mp;
96 1.5 cgd struct vnode **vpp;
97 1.5 cgd long pid;
98 1.5 cgd pfstype pfs_type;
99 1.1 pk {
100 1.12 mycroft struct pfsnode *pfs;
101 1.12 mycroft struct vnode *vp;
102 1.5 cgd int error;
103 1.5 cgd
104 1.29 fvdl do {
105 1.29 fvdl if ((*vpp = procfs_hashget(pid, pfs_type, mp)) != NULL)
106 1.5 cgd return (0);
107 1.29 fvdl } while (lockmgr(&pfs_hashlock, LK_EXCLUSIVE|LK_SLEEPFAIL, 0));
108 1.1 pk
109 1.29 fvdl if ((error = getnewvnode(VT_PROCFS, mp, procfs_vnodeop_p, vpp)) != 0) {
110 1.29 fvdl *vpp = NULL;
111 1.33 chs lockmgr(&pfs_hashlock, LK_RELEASE, NULL);
112 1.29 fvdl return (error);
113 1.5 cgd }
114 1.11 mycroft vp = *vpp;
115 1.5 cgd
116 1.11 mycroft MALLOC(pfs, void *, sizeof(struct pfsnode), M_TEMP, M_WAITOK);
117 1.11 mycroft vp->v_data = pfs;
118 1.5 cgd
119 1.5 cgd pfs->pfs_pid = (pid_t) pid;
120 1.5 cgd pfs->pfs_type = pfs_type;
121 1.11 mycroft pfs->pfs_vnode = vp;
122 1.5 cgd pfs->pfs_flags = 0;
123 1.5 cgd pfs->pfs_fileno = PROCFS_FILENO(pid, pfs_type);
124 1.5 cgd
125 1.5 cgd switch (pfs_type) {
126 1.11 mycroft case Proot: /* /proc = dr-xr-xr-x */
127 1.17 mycroft pfs->pfs_mode = S_IRUSR|S_IXUSR|S_IRGRP|S_IXGRP|S_IROTH|S_IXOTH;
128 1.11 mycroft vp->v_type = VDIR;
129 1.11 mycroft vp->v_flag = VROOT;
130 1.11 mycroft break;
131 1.11 mycroft
132 1.22 mycroft case Pcurproc: /* /proc/curproc = lr-xr-xr-x */
133 1.28 thorpej case Pself: /* /proc/self = lr-xr-xr-x */
134 1.22 mycroft pfs->pfs_mode = S_IRUSR|S_IXUSR|S_IRGRP|S_IXGRP|S_IROTH|S_IXOTH;
135 1.11 mycroft vp->v_type = VLNK;
136 1.5 cgd break;
137 1.5 cgd
138 1.17 mycroft case Pproc: /* /proc/N = dr-xr-xr-x */
139 1.17 mycroft pfs->pfs_mode = S_IRUSR|S_IXUSR|S_IRGRP|S_IXGRP|S_IROTH|S_IXOTH;
140 1.6 ws vp->v_type = VDIR;
141 1.5 cgd break;
142 1.5 cgd
143 1.17 mycroft case Pfile: /* /proc/N/file = -rw------- */
144 1.17 mycroft case Pmem: /* /proc/N/mem = -rw------- */
145 1.17 mycroft case Pregs: /* /proc/N/regs = -rw------- */
146 1.17 mycroft case Pfpregs: /* /proc/N/fpregs = -rw------- */
147 1.17 mycroft pfs->pfs_mode = S_IRUSR|S_IWUSR;
148 1.9 cgd vp->v_type = VREG;
149 1.9 cgd break;
150 1.9 cgd
151 1.17 mycroft case Pctl: /* /proc/N/ctl = --w------ */
152 1.17 mycroft case Pnote: /* /proc/N/note = --w------ */
153 1.17 mycroft case Pnotepg: /* /proc/N/notepg = --w------ */
154 1.17 mycroft pfs->pfs_mode = S_IWUSR;
155 1.6 ws vp->v_type = VREG;
156 1.5 cgd break;
157 1.5 cgd
158 1.25 msaitoh case Pmap: /* /proc/N/map = -r--r--r-- */
159 1.17 mycroft case Pstatus: /* /proc/N/status = -r--r--r-- */
160 1.26 christos case Pcmdline: /* /proc/N/cmdline = -r--r--r-- */
161 1.17 mycroft pfs->pfs_mode = S_IRUSR|S_IRGRP|S_IROTH;
162 1.6 ws vp->v_type = VREG;
163 1.5 cgd break;
164 1.5 cgd
165 1.5 cgd default:
166 1.11 mycroft panic("procfs_allocvp");
167 1.5 cgd }
168 1.27 wrstuden
169 1.29 fvdl procfs_hashins(pfs);
170 1.34 chs uvm_vnp_setsize(vp, 0);
171 1.33 chs lockmgr(&pfs_hashlock, LK_RELEASE, NULL);
172 1.1 pk
173 1.5 cgd return (error);
174 1.1 pk }
175 1.1 pk
176 1.11 mycroft int
177 1.5 cgd procfs_freevp(vp)
178 1.5 cgd struct vnode *vp;
179 1.1 pk {
180 1.5 cgd struct pfsnode *pfs = VTOPFS(vp);
181 1.5 cgd
182 1.29 fvdl procfs_hashrem(pfs);
183 1.1 pk
184 1.11 mycroft FREE(vp->v_data, M_TEMP);
185 1.11 mycroft vp->v_data = 0;
186 1.5 cgd return (0);
187 1.1 pk }
188 1.1 pk
189 1.11 mycroft int
190 1.15 christos procfs_rw(v)
191 1.15 christos void *v;
192 1.1 pk {
193 1.15 christos struct vop_read_args *ap = v;
194 1.11 mycroft struct vnode *vp = ap->a_vp;
195 1.11 mycroft struct uio *uio = ap->a_uio;
196 1.5 cgd struct proc *curp = uio->uio_procp;
197 1.5 cgd struct pfsnode *pfs = VTOPFS(vp);
198 1.5 cgd struct proc *p;
199 1.5 cgd
200 1.5 cgd p = PFIND(pfs->pfs_pid);
201 1.5 cgd if (p == 0)
202 1.1 pk return (EINVAL);
203 1.19 mycroft
204 1.19 mycroft switch (pfs->pfs_type) {
205 1.19 mycroft case Pregs:
206 1.19 mycroft case Pfpregs:
207 1.19 mycroft case Pmem:
208 1.19 mycroft /*
209 1.19 mycroft * Do not allow init to be modified while in secure mode; it
210 1.19 mycroft * could be duped into changing the security level.
211 1.19 mycroft */
212 1.19 mycroft if (uio->uio_rw == UIO_WRITE &&
213 1.19 mycroft p == initproc && securelevel > -1)
214 1.19 mycroft return (EPERM);
215 1.19 mycroft break;
216 1.19 mycroft
217 1.19 mycroft default:
218 1.19 mycroft break;
219 1.19 mycroft }
220 1.1 pk
221 1.5 cgd switch (pfs->pfs_type) {
222 1.5 cgd case Pnote:
223 1.5 cgd case Pnotepg:
224 1.11 mycroft return (procfs_donote(curp, p, pfs, uio));
225 1.5 cgd
226 1.5 cgd case Pregs:
227 1.11 mycroft return (procfs_doregs(curp, p, pfs, uio));
228 1.9 cgd
229 1.9 cgd case Pfpregs:
230 1.11 mycroft return (procfs_dofpregs(curp, p, pfs, uio));
231 1.5 cgd
232 1.5 cgd case Pctl:
233 1.11 mycroft return (procfs_doctl(curp, p, pfs, uio));
234 1.5 cgd
235 1.5 cgd case Pstatus:
236 1.11 mycroft return (procfs_dostatus(curp, p, pfs, uio));
237 1.25 msaitoh
238 1.25 msaitoh case Pmap:
239 1.25 msaitoh return (procfs_domap(curp, p, pfs, uio));
240 1.1 pk
241 1.5 cgd case Pmem:
242 1.11 mycroft return (procfs_domem(curp, p, pfs, uio));
243 1.26 christos
244 1.26 christos case Pcmdline:
245 1.26 christos return (procfs_docmdline(curp, p, pfs, uio));
246 1.1 pk
247 1.5 cgd default:
248 1.5 cgd return (EOPNOTSUPP);
249 1.5 cgd }
250 1.1 pk }
251 1.1 pk
252 1.5 cgd /*
253 1.5 cgd * Get a string from userland into (buf). Strip a trailing
254 1.5 cgd * nl character (to allow easy access from the shell).
255 1.11 mycroft * The buffer should be *buflenp + 1 chars long. vfs_getuserstr
256 1.5 cgd * will automatically add a nul char at the end.
257 1.5 cgd *
258 1.5 cgd * Returns 0 on success or the following errors
259 1.5 cgd *
260 1.5 cgd * EINVAL: file offset is non-zero.
261 1.5 cgd * EMSGSIZE: message is longer than kernel buffer
262 1.5 cgd * EFAULT: user i/o buffer is not addressable
263 1.5 cgd */
264 1.11 mycroft int
265 1.11 mycroft vfs_getuserstr(uio, buf, buflenp)
266 1.5 cgd struct uio *uio;
267 1.5 cgd char *buf;
268 1.5 cgd int *buflenp;
269 1.1 pk {
270 1.5 cgd int xlen;
271 1.5 cgd int error;
272 1.5 cgd
273 1.11 mycroft if (uio->uio_offset != 0)
274 1.11 mycroft return (EINVAL);
275 1.11 mycroft
276 1.5 cgd xlen = *buflenp;
277 1.1 pk
278 1.5 cgd /* must be able to read the whole string in one go */
279 1.5 cgd if (xlen < uio->uio_resid)
280 1.5 cgd return (EMSGSIZE);
281 1.5 cgd xlen = uio->uio_resid;
282 1.5 cgd
283 1.14 christos if ((error = uiomove(buf, xlen, uio)) != 0)
284 1.5 cgd return (error);
285 1.5 cgd
286 1.11 mycroft /* allow multiple writes without seeks */
287 1.11 mycroft uio->uio_offset = 0;
288 1.11 mycroft
289 1.5 cgd /* cleanup string and remove trailing newline */
290 1.5 cgd buf[xlen] = '\0';
291 1.5 cgd xlen = strlen(buf);
292 1.5 cgd if (xlen > 0 && buf[xlen-1] == '\n')
293 1.5 cgd buf[--xlen] = '\0';
294 1.5 cgd *buflenp = xlen;
295 1.1 pk
296 1.5 cgd return (0);
297 1.1 pk }
298 1.1 pk
299 1.11 mycroft vfs_namemap_t *
300 1.11 mycroft vfs_findname(nm, buf, buflen)
301 1.11 mycroft vfs_namemap_t *nm;
302 1.5 cgd char *buf;
303 1.5 cgd int buflen;
304 1.1 pk {
305 1.11 mycroft
306 1.5 cgd for (; nm->nm_name; nm++)
307 1.24 perry if (memcmp(buf, nm->nm_name, buflen+1) == 0)
308 1.5 cgd return (nm);
309 1.5 cgd
310 1.5 cgd return (0);
311 1.29 fvdl }
312 1.29 fvdl
313 1.29 fvdl /*
314 1.29 fvdl * Initialize pfsnode hash table.
315 1.29 fvdl */
316 1.29 fvdl void
317 1.29 fvdl procfs_hashinit()
318 1.29 fvdl {
319 1.29 fvdl lockinit(&pfs_hashlock, PINOD, "pfs_hashlock", 0, 0);
320 1.32 ad pfs_hashtbl = hashinit(desiredvnodes / 4, HASH_LIST, M_UFSMNT,
321 1.32 ad M_WAITOK, &pfs_ihash);
322 1.29 fvdl simple_lock_init(&pfs_hash_slock);
323 1.31 jdolecek }
324 1.31 jdolecek
325 1.31 jdolecek /*
326 1.31 jdolecek * Free pfsnode hash table.
327 1.31 jdolecek */
328 1.31 jdolecek void
329 1.31 jdolecek procfs_hashdone()
330 1.31 jdolecek {
331 1.31 jdolecek hashdone(pfs_hashtbl, M_UFSMNT);
332 1.29 fvdl }
333 1.29 fvdl
334 1.29 fvdl struct vnode *
335 1.29 fvdl procfs_hashget(pid, type, mp)
336 1.29 fvdl pid_t pid;
337 1.29 fvdl pfstype type;
338 1.29 fvdl struct mount *mp;
339 1.29 fvdl {
340 1.29 fvdl struct pfsnode *pp;
341 1.29 fvdl struct vnode *vp;
342 1.29 fvdl
343 1.29 fvdl loop:
344 1.29 fvdl simple_lock(&pfs_hash_slock);
345 1.29 fvdl for (pp = PFSPIDHASH(pid)->lh_first; pp; pp = pp->pfs_hash.le_next) {
346 1.29 fvdl vp = PFSTOV(pp);
347 1.29 fvdl if (pid == pp->pfs_pid && pp->pfs_type == type &&
348 1.29 fvdl vp->v_mount == mp) {
349 1.29 fvdl simple_lock(&vp->v_interlock);
350 1.29 fvdl simple_unlock(&pfs_hash_slock);
351 1.29 fvdl if (vget(vp, LK_EXCLUSIVE | LK_INTERLOCK))
352 1.29 fvdl goto loop;
353 1.29 fvdl return (vp);
354 1.29 fvdl }
355 1.29 fvdl }
356 1.29 fvdl simple_unlock(&pfs_hash_slock);
357 1.29 fvdl return (NULL);
358 1.29 fvdl }
359 1.29 fvdl
360 1.29 fvdl /*
361 1.29 fvdl * Insert the pfsnode into the hash table and lock it.
362 1.29 fvdl */
363 1.29 fvdl void
364 1.29 fvdl procfs_hashins(pp)
365 1.29 fvdl struct pfsnode *pp;
366 1.29 fvdl {
367 1.29 fvdl struct pfs_hashhead *ppp;
368 1.29 fvdl
369 1.29 fvdl /* lock the pfsnode, then put it on the appropriate hash list */
370 1.29 fvdl lockmgr(&pp->pfs_vnode->v_lock, LK_EXCLUSIVE, (struct simplelock *)0);
371 1.29 fvdl
372 1.29 fvdl simple_lock(&pfs_hash_slock);
373 1.29 fvdl ppp = PFSPIDHASH(pp->pfs_pid);
374 1.29 fvdl LIST_INSERT_HEAD(ppp, pp, pfs_hash);
375 1.29 fvdl simple_unlock(&pfs_hash_slock);
376 1.29 fvdl }
377 1.29 fvdl
378 1.29 fvdl /*
379 1.29 fvdl * Remove the pfsnode from the hash table.
380 1.29 fvdl */
381 1.29 fvdl void
382 1.29 fvdl procfs_hashrem(pp)
383 1.29 fvdl struct pfsnode *pp;
384 1.29 fvdl {
385 1.29 fvdl simple_lock(&pfs_hash_slock);
386 1.29 fvdl LIST_REMOVE(pp, pfs_hash);
387 1.29 fvdl simple_unlock(&pfs_hash_slock);
388 1.29 fvdl }
389 1.29 fvdl
390 1.29 fvdl void
391 1.29 fvdl procfs_revoke_vnodes(p, arg)
392 1.29 fvdl struct proc *p;
393 1.29 fvdl void *arg;
394 1.29 fvdl {
395 1.29 fvdl struct pfsnode *pfs, *pnext;
396 1.29 fvdl struct vnode *vp;
397 1.29 fvdl struct mount *mp = (struct mount *)arg;
398 1.29 fvdl
399 1.29 fvdl if (!(p->p_flag & P_SUGID))
400 1.29 fvdl return;
401 1.29 fvdl
402 1.29 fvdl for (pfs = PFSPIDHASH(p->p_pid)->lh_first; pfs; pfs = pnext) {
403 1.29 fvdl vp = PFSTOV(pfs);
404 1.29 fvdl pnext = pfs->pfs_hash.le_next;
405 1.29 fvdl if (vp->v_usecount > 0 && pfs->pfs_pid == p->p_pid &&
406 1.29 fvdl vp->v_mount == mp)
407 1.29 fvdl VOP_REVOKE(vp, REVOKEALL);
408 1.29 fvdl }
409 1.1 pk }
410