nfs_syscalls.c revision 1.47 1 1.47 chs /* $NetBSD: nfs_syscalls.c,v 1.47 2000/11/24 23:30:03 chs Exp $ */
2 1.11 cgd
3 1.1 cgd /*
4 1.10 mycroft * Copyright (c) 1989, 1993
5 1.10 mycroft * The Regents of the University of California. All rights reserved.
6 1.1 cgd *
7 1.1 cgd * This code is derived from software contributed to Berkeley by
8 1.1 cgd * Rick Macklem at The University of Guelph.
9 1.1 cgd *
10 1.1 cgd * Redistribution and use in source and binary forms, with or without
11 1.1 cgd * modification, are permitted provided that the following conditions
12 1.1 cgd * are met:
13 1.1 cgd * 1. Redistributions of source code must retain the above copyright
14 1.1 cgd * notice, this list of conditions and the following disclaimer.
15 1.1 cgd * 2. Redistributions in binary form must reproduce the above copyright
16 1.1 cgd * notice, this list of conditions and the following disclaimer in the
17 1.1 cgd * documentation and/or other materials provided with the distribution.
18 1.1 cgd * 3. All advertising materials mentioning features or use of this software
19 1.1 cgd * must display the following acknowledgement:
20 1.1 cgd * This product includes software developed by the University of
21 1.1 cgd * California, Berkeley and its contributors.
22 1.1 cgd * 4. Neither the name of the University nor the names of its contributors
23 1.1 cgd * may be used to endorse or promote products derived from this software
24 1.1 cgd * without specific prior written permission.
25 1.1 cgd *
26 1.1 cgd * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
27 1.1 cgd * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
28 1.1 cgd * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
29 1.1 cgd * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
30 1.1 cgd * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
31 1.1 cgd * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
32 1.1 cgd * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
33 1.1 cgd * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
34 1.1 cgd * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
35 1.1 cgd * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
36 1.1 cgd * SUCH DAMAGE.
37 1.1 cgd *
38 1.19 fvdl * @(#)nfs_syscalls.c 8.5 (Berkeley) 3/30/95
39 1.1 cgd */
40 1.28 thorpej
41 1.28 thorpej #include "fs_nfs.h"
42 1.43 bjh21 #include "opt_nfs.h"
43 1.30 thorpej #include "opt_nfsserver.h"
44 1.31 jonathan #include "opt_iso.h"
45 1.41 fvdl #include "opt_inet.h"
46 1.39 tsarna #include "opt_compat_netbsd.h"
47 1.1 cgd
48 1.7 mycroft #include <sys/param.h>
49 1.7 mycroft #include <sys/systm.h>
50 1.7 mycroft #include <sys/kernel.h>
51 1.7 mycroft #include <sys/file.h>
52 1.7 mycroft #include <sys/stat.h>
53 1.7 mycroft #include <sys/vnode.h>
54 1.7 mycroft #include <sys/mount.h>
55 1.7 mycroft #include <sys/proc.h>
56 1.10 mycroft #include <sys/uio.h>
57 1.7 mycroft #include <sys/malloc.h>
58 1.7 mycroft #include <sys/buf.h>
59 1.7 mycroft #include <sys/mbuf.h>
60 1.7 mycroft #include <sys/socket.h>
61 1.7 mycroft #include <sys/socketvar.h>
62 1.39 tsarna #include <sys/signalvar.h>
63 1.7 mycroft #include <sys/domain.h>
64 1.7 mycroft #include <sys/protosw.h>
65 1.10 mycroft #include <sys/namei.h>
66 1.10 mycroft #include <sys/syslog.h>
67 1.18 christos #include <sys/filedesc.h>
68 1.39 tsarna #include <sys/kthread.h>
69 1.1 cgd
70 1.13 cgd #include <sys/syscallargs.h>
71 1.13 cgd
72 1.7 mycroft #include <netinet/in.h>
73 1.7 mycroft #include <netinet/tcp.h>
74 1.10 mycroft #ifdef ISO
75 1.10 mycroft #include <netiso/iso.h>
76 1.10 mycroft #endif
77 1.19 fvdl #include <nfs/xdr_subs.h>
78 1.10 mycroft #include <nfs/rpcv2.h>
79 1.19 fvdl #include <nfs/nfsproto.h>
80 1.7 mycroft #include <nfs/nfs.h>
81 1.19 fvdl #include <nfs/nfsm_subs.h>
82 1.7 mycroft #include <nfs/nfsrvcache.h>
83 1.10 mycroft #include <nfs/nfsmount.h>
84 1.10 mycroft #include <nfs/nfsnode.h>
85 1.10 mycroft #include <nfs/nqnfs.h>
86 1.10 mycroft #include <nfs/nfsrtt.h>
87 1.18 christos #include <nfs/nfs_var.h>
88 1.1 cgd
89 1.1 cgd /* Global defs. */
/*
 * Server procedure table, indexed by nd_procnum in nfssvc_nfsd().
 */
90 1.19 fvdl extern int32_t (*nfsrv3_procs[NFS_NPROCS]) __P((struct nfsrv_descript *,
91 1.19 fvdl struct nfssvc_sock *,
92 1.19 fvdl struct proc *, struct mbuf **));
93 1.1 cgd extern int nfs_numasync;
94 1.10 mycroft extern time_t nqnfsstarttime;
95 1.10 mycroft extern int nqsrv_writeslack;
96 1.10 mycroft extern int nfsrtton;
97 1.19 fvdl extern struct nfsstats nfsstats;
98 1.19 fvdl extern int nfsrvw_procrastinate;
/*
 * Socket entries with file scope.  nfssvc_addsock() picks nfs_udpsock for
 * IPPROTO_UDP sockets, nfs_udp6sock when the socket's domain is AF_INET6,
 * and nfs_cltpsock for ISOPROTO_CLTP; nfsrv_init() allocates nfs_udpsock.
 */
99 1.47 chs struct nfssvc_sock *nfs_udpsock;
100 1.47 chs #ifdef ISO
101 1.47 chs struct nfssvc_sock *nfs_cltpsock;
102 1.47 chs #endif
103 1.41 fvdl #ifdef INET6
104 1.41 fvdl struct nfssvc_sock *nfs_udp6sock;
105 1.41 fvdl #endif
/* Bound that sys_nfssvc() compares against a socket's ns_numuids. */
106 1.10 mycroft int nuidhash_max = NFS_MAXUIDHASH;
/* Incremented around the tsleep() in nfssvc_nfsd(): nfsds currently idle. */
107 1.18 christos int nfsd_waiting = 0;
108 1.18 christos #ifdef NFSSERVER
/*
 * nfs_numnfsd counts the struct nfsd allocated by nfssvc_nfsd(); when it
 * drops to zero nfsrv_init(TRUE) is called.  notstarted and modify_flag
 * hold the NQNFS start-up state consulted in nfssvc_nfsd().
 * NOTE(review): nfsdrt is not referenced in the visible part of this file;
 * presumably it is the buffer filled by nfsd_rt() - confirm.
 */
109 1.10 mycroft static int nfs_numnfsd = 0;
110 1.10 mycroft static int notstarted = 1;
111 1.10 mycroft static int modify_flag = 0;
112 1.10 mycroft static struct nfsdrt nfsdrt;
113 1.18 christos #endif
114 1.1 cgd
/* Boolean arguments, e.g. for nfsrv_updatecache() and nfsrv_init(). */
115 1.1 cgd #define TRUE 1
116 1.1 cgd #define FALSE 0
117 1.1 cgd
118 1.24 thorpej #ifdef NFS
119 1.39 tsarna static struct proc *nfs_asyncdaemon[NFS_MAXASYNCDAEMON];
120 1.40 tsarna int nfs_niothreads = -1; /* == "0, and has never been set" */
121 1.23 thorpej #endif
122 1.19 fvdl
123 1.18 christos #ifdef NFSSERVER
/* Called from nfssvc_nfsd() when nfsrtton is set. */
124 1.19 fvdl static void nfsd_rt __P((int, struct nfsrv_descript *, int));
125 1.18 christos #endif
126 1.19 fvdl
127 1.1 cgd /*
128 1.1 cgd * NFS server system calls
129 1.1 cgd */
130 1.1 cgd
131 1.1 cgd
132 1.1 cgd /*
133 1.19 fvdl * Nfs server pseudo system call for the nfsd's
134 1.10 mycroft * Based on the flag value it either:
135 1.10 mycroft * - adds a socket to the selection list
136 1.10 mycroft * - remains in the kernel as an nfsd
137 1.10 mycroft * - remains in the kernel as an nfsiod
 *
 * A fourth flag, NFSSVC_MNTD, hands an NFS mount to nqnfs_clientd().
 *
 * p:      calling process; must pass the suser() check.
 * v:      struct sys_nfssvc_args carrying flag and argp.
 * retval: not written by this function.
 *
 * Returns 0 or an errno value.  EINTR and ERESTART coming back from the
 * selected service routine are reported as 0.  A branch whose kernel
 * option (NFS, NFSSERVER, COMPAT_14) is not configured yields ENOSYS.
138 1.1 cgd */
139 1.18 christos int
140 1.16 mycroft sys_nfssvc(p, v, retval)
141 1.1 cgd struct proc *p;
142 1.15 thorpej void *v;
143 1.15 thorpej register_t *retval;
144 1.15 thorpej {
145 1.38 augustss struct sys_nfssvc_args /* {
146 1.13 cgd syscallarg(int) flag;
147 1.13 cgd syscallarg(caddr_t) argp;
148 1.15 thorpej } */ *uap = v;
149 1.23 thorpej int error;
150 1.24 thorpej #ifdef NFS
151 1.10 mycroft struct nameidata nd;
152 1.18 christos struct nfsmount *nmp;
153 1.19 fvdl struct nfsd_cargs ncd;
154 1.19 fvdl #endif
155 1.18 christos #ifdef NFSSERVER
156 1.1 cgd struct file *fp;
157 1.10 mycroft struct mbuf *nam;
158 1.10 mycroft struct nfsd_args nfsdarg;
159 1.10 mycroft struct nfsd_srvargs nfsd_srvargs, *nsd = &nfsd_srvargs;
160 1.10 mycroft struct nfsd *nfsd;
161 1.10 mycroft struct nfssvc_sock *slp;
162 1.18 christos struct nfsuid *nuidp;
163 1.18 christos #endif
164 1.1 cgd
165 1.1 cgd /*
166 1.1 cgd * Must be super user
167 1.1 cgd */
168 1.19 fvdl error = suser(p->p_ucred, &p->p_acflag);
169 1.19 fvdl if(error)
170 1.1 cgd return (error);
/*
 * Sleep while nfsrv_init() holds SLP_INIT; it issues the wakeup when it
 * finds SLP_WANTINIT set.
 */
171 1.12 mycroft while (nfssvc_sockhead_flag & SLP_INIT) {
172 1.19 fvdl nfssvc_sockhead_flag |= SLP_WANTINIT;
173 1.10 mycroft (void) tsleep((caddr_t)&nfssvc_sockhead, PSOCK, "nfsd init", 0);
174 1.10 mycroft }
175 1.13 cgd if (SCARG(uap, flag) & NFSSVC_BIOD) {
/* NFSSVC_BIOD: become an nfsiod (only with both NFS and COMPAT_14). */
176 1.39 tsarna #if defined(NFS) && defined(COMPAT_14)
177 1.19 fvdl error = nfssvc_iod(p);
178 1.19 fvdl #else
179 1.10 mycroft error = ENOSYS;
180 1.19 fvdl #endif
181 1.13 cgd } else if (SCARG(uap, flag) & NFSSVC_MNTD) {
182 1.24 thorpej #ifndef NFS
183 1.10 mycroft error = ENOSYS;
184 1.19 fvdl #else
/* NFSSVC_MNTD: argp is a struct nfsd_cargs whose ncd_dirp names a mount. */
185 1.18 christos error = copyin(SCARG(uap, argp), (caddr_t)&ncd, sizeof (ncd));
186 1.18 christos if (error)
187 1.10 mycroft return (error);
188 1.10 mycroft NDINIT(&nd, LOOKUP, FOLLOW | LOCKLEAF, UIO_USERSPACE,
189 1.10 mycroft ncd.ncd_dirp, p);
190 1.19 fvdl error = namei(&nd);
191 1.19 fvdl if (error)
192 1.10 mycroft return (error);
/* The name must resolve to the root vnode of its mount. */
193 1.10 mycroft if ((nd.ni_vp->v_flag & VROOT) == 0)
194 1.10 mycroft error = EINVAL;
/*
 * NOTE(review): nothing here checks that v_mount is an NFS mount before
 * VFSTONFS() is applied to it - confirm that this cannot be reached with
 * the root of another file system type.
 */
195 1.10 mycroft nmp = VFSTONFS(nd.ni_vp->v_mount);
196 1.10 mycroft vput(nd.ni_vp);
197 1.10 mycroft if (error)
198 1.10 mycroft return (error);
/* NFSMNT_MNTD already set and no NFSSVC_GOTAUTH: nothing more to do. */
199 1.27 fvdl if ((nmp->nm_iflag & NFSMNT_MNTD) &&
200 1.19 fvdl (SCARG(uap, flag) & NFSSVC_GOTAUTH) == 0)
201 1.10 mycroft return (0);
202 1.27 fvdl nmp->nm_iflag |= NFSMNT_MNTD;
203 1.13 cgd error = nqnfs_clientd(nmp, p->p_ucred, &ncd, SCARG(uap, flag),
204 1.19 fvdl SCARG(uap, argp), p);
205 1.24 thorpej #endif /* NFS */
206 1.13 cgd } else if (SCARG(uap, flag) & NFSSVC_ADDSOCK) {
207 1.10 mycroft #ifndef NFSSERVER
208 1.10 mycroft error = ENOSYS;
209 1.19 fvdl #else
/* NFSSVC_ADDSOCK: argp is a struct nfsd_args describing the socket. */
210 1.18 christos error = copyin(SCARG(uap, argp), (caddr_t)&nfsdarg,
211 1.19 fvdl sizeof(nfsdarg));
212 1.18 christos if (error)
213 1.10 mycroft return (error);
214 1.35 thorpej /* getsock() will use the descriptor for us */
215 1.19 fvdl error = getsock(p->p_fd, nfsdarg.sock, &fp);
216 1.19 fvdl if (error)
217 1.10 mycroft return (error);
218 1.10 mycroft /*
219 1.10 mycroft * Get the client address for connected sockets.
220 1.10 mycroft */
221 1.10 mycroft if (nfsdarg.name == NULL || nfsdarg.namelen == 0)
222 1.10 mycroft nam = (struct mbuf *)0;
223 1.18 christos else {
224 1.18 christos error = sockargs(&nam, nfsdarg.name, nfsdarg.namelen,
225 1.19 fvdl MT_SONAME);
226 1.35 thorpej if (error) {
227 1.35 thorpej FILE_UNUSE(fp, NULL);
228 1.18 christos return (error);
229 1.35 thorpej }
230 1.18 christos }
/* nfssvc_addsock() stores nam in the socket entry or frees it on error. */
231 1.10 mycroft error = nfssvc_addsock(fp, nam);
232 1.35 thorpej FILE_UNUSE(fp, NULL);
233 1.10 mycroft #endif /* !NFSSERVER */
234 1.10 mycroft } else {
235 1.10 mycroft #ifndef NFSSERVER
236 1.10 mycroft error = ENOSYS;
237 1.19 fvdl #else
/* Otherwise: run as an nfsd, after handling any authentication reply. */
238 1.18 christos error = copyin(SCARG(uap, argp), (caddr_t)nsd, sizeof (*nsd));
239 1.18 christos if (error)
240 1.10 mycroft return (error);
/*
 * NOTE(review): nsd->nsd_nfsd was just copied in from user space and is
 * dereferenced below as a kernel pointer; only the suser() check above
 * guards this.
 */
241 1.13 cgd if ((SCARG(uap, flag) & NFSSVC_AUTHIN) &&
242 1.19 fvdl ((nfsd = nsd->nsd_nfsd)) != NULL &&
243 1.19 fvdl (nfsd->nfsd_slp->ns_flag & SLP_VALID)) {
244 1.19 fvdl slp = nfsd->nfsd_slp;
245 1.10 mycroft
246 1.10 mycroft /*
247 1.10 mycroft * First check to see if another nfsd has already
248 1.10 mycroft * added this credential.
249 1.10 mycroft */
250 1.19 fvdl for (nuidp = NUIDHASH(slp,nsd->nsd_cr.cr_uid)->lh_first;
251 1.12 mycroft nuidp != 0; nuidp = nuidp->nu_hash.le_next) {
252 1.19 fvdl if (nuidp->nu_cr.cr_uid == nsd->nsd_cr.cr_uid &&
253 1.19 fvdl (!nfsd->nfsd_nd->nd_nam2 ||
254 1.19 fvdl netaddr_match(NU_NETFAM(nuidp),
255 1.19 fvdl &nuidp->nu_haddr, nfsd->nfsd_nd->nd_nam2)))
256 1.10 mycroft break;
257 1.10 mycroft }
258 1.19 fvdl if (nuidp) {
259 1.19 fvdl nfsrv_setcred(&nuidp->nu_cr,&nfsd->nfsd_nd->nd_cr);
260 1.19 fvdl nfsd->nfsd_nd->nd_flag |= ND_KERBFULL;
261 1.19 fvdl } else {
262 1.10 mycroft /*
263 1.10 mycroft * Nope, so we will.
264 1.10 mycroft */
/*
 * Allocate a fresh entry while the socket is below nuidhash_max;
 * otherwise the head of the LRU list is recycled further down.
 */
265 1.10 mycroft if (slp->ns_numuids < nuidhash_max) {
266 1.10 mycroft slp->ns_numuids++;
267 1.10 mycroft nuidp = (struct nfsuid *)
268 1.10 mycroft malloc(sizeof (struct nfsuid), M_NFSUID,
269 1.10 mycroft M_WAITOK);
270 1.10 mycroft } else
271 1.10 mycroft nuidp = (struct nfsuid *)0;
/* Re-check the socket (presumably because malloc(M_WAITOK) may sleep). */
272 1.10 mycroft if ((slp->ns_flag & SLP_VALID) == 0) {
273 1.10 mycroft if (nuidp)
274 1.10 mycroft free((caddr_t)nuidp, M_NFSUID);
275 1.10 mycroft } else {
276 1.10 mycroft if (nuidp == (struct nfsuid *)0) {
277 1.12 mycroft nuidp = slp->ns_uidlruhead.tqh_first;
278 1.12 mycroft LIST_REMOVE(nuidp, nu_hash);
279 1.12 mycroft TAILQ_REMOVE(&slp->ns_uidlruhead, nuidp,
280 1.12 mycroft nu_lru);
281 1.19 fvdl if (nuidp->nu_flag & NU_NAM)
282 1.19 fvdl m_freem(nuidp->nu_nam);
283 1.10 mycroft }
284 1.19 fvdl nuidp->nu_flag = 0;
285 1.10 mycroft nuidp->nu_cr = nsd->nsd_cr;
/* Clamp the group count taken from the user-supplied credential. */
286 1.10 mycroft if (nuidp->nu_cr.cr_ngroups > NGROUPS)
287 1.19 fvdl nuidp->nu_cr.cr_ngroups = NGROUPS;
288 1.10 mycroft nuidp->nu_cr.cr_ref = 1;
289 1.19 fvdl nuidp->nu_timestamp = nsd->nsd_timestamp;
290 1.19 fvdl nuidp->nu_expire = time.tv_sec + nsd->nsd_ttl;
291 1.19 fvdl /*
292 1.19 fvdl * and save the session key in nu_key.
293 1.19 fvdl */
294 1.32 perry memcpy(nuidp->nu_key, nsd->nsd_key,
295 1.32 perry sizeof(nsd->nsd_key));
296 1.19 fvdl if (nfsd->nfsd_nd->nd_nam2) {
297 1.19 fvdl struct sockaddr_in *saddr;
298 1.19 fvdl
299 1.19 fvdl saddr = mtod(nfsd->nfsd_nd->nd_nam2,
300 1.19 fvdl struct sockaddr_in *);
/* AF_INET peers are stored inline; other families keep an mbuf copy. */
301 1.19 fvdl switch (saddr->sin_family) {
302 1.19 fvdl case AF_INET:
303 1.19 fvdl nuidp->nu_flag |= NU_INETADDR;
304 1.19 fvdl nuidp->nu_inetaddr =
305 1.19 fvdl saddr->sin_addr.s_addr;
306 1.19 fvdl break;
307 1.19 fvdl case AF_ISO:
308 1.19 fvdl default:
309 1.19 fvdl nuidp->nu_flag |= NU_NAM;
310 1.19 fvdl nuidp->nu_nam = m_copym(
311 1.19 fvdl nfsd->nfsd_nd->nd_nam2, 0,
312 1.19 fvdl M_COPYALL, M_WAIT);
313 1.19 fvdl break;
314 1.19 fvdl };
315 1.19 fvdl }
316 1.12 mycroft TAILQ_INSERT_TAIL(&slp->ns_uidlruhead, nuidp,
317 1.19 fvdl nu_lru);
/*
 * NOTE(review): the lookup loop above hashes on nsd_cr.cr_uid while this
 * insert hashes on nsd_uid - confirm that the two always select the same
 * bucket.
 */
318 1.12 mycroft LIST_INSERT_HEAD(NUIDHASH(slp, nsd->nsd_uid),
319 1.19 fvdl nuidp, nu_hash);
320 1.19 fvdl nfsrv_setcred(&nuidp->nu_cr,
321 1.19 fvdl &nfsd->nfsd_nd->nd_cr);
322 1.19 fvdl nfsd->nfsd_nd->nd_flag |= ND_KERBFULL;
323 1.10 mycroft }
324 1.10 mycroft }
325 1.10 mycroft }
/*
 * Authentication failed in user space: set NFSD_AUTHFAIL, which
 * nfssvc_nfsd() tests when building the reply for the pending request.
 */
326 1.13 cgd if ((SCARG(uap, flag) & NFSSVC_AUTHINFAIL) &&
327 1.13 cgd (nfsd = nsd->nsd_nfsd))
328 1.19 fvdl nfsd->nfsd_flag |= NFSD_AUTHFAIL;
329 1.13 cgd error = nfssvc_nfsd(nsd, SCARG(uap, argp), p);
330 1.10 mycroft #endif /* !NFSSERVER */
331 1.10 mycroft }
/* An interrupted daemon is reported to the caller as a normal return. */
332 1.10 mycroft if (error == EINTR || error == ERESTART)
333 1.10 mycroft error = 0;
334 1.10 mycroft return (error);
335 1.10 mycroft }
336 1.10 mycroft
337 1.10 mycroft #ifdef NFSSERVER
338 1.10 mycroft /*
339 1.10 mycroft * Adds a socket to the list for servicing by nfsds.
340 1.10 mycroft */
341 1.18 christos int
342 1.10 mycroft nfssvc_addsock(fp, mynam)
343 1.10 mycroft struct file *fp;
344 1.10 mycroft struct mbuf *mynam;
345 1.10 mycroft {
346 1.38 augustss struct mbuf *m;
347 1.38 augustss int siz;
348 1.38 augustss struct nfssvc_sock *slp;
349 1.38 augustss struct socket *so;
350 1.10 mycroft struct nfssvc_sock *tslp;
351 1.10 mycroft int error, s;
352 1.10 mycroft
353 1.1 cgd so = (struct socket *)fp->f_data;
354 1.10 mycroft tslp = (struct nfssvc_sock *)0;
355 1.10 mycroft /*
356 1.10 mycroft * Add it to the list, as required.
357 1.10 mycroft */
358 1.10 mycroft if (so->so_proto->pr_protocol == IPPROTO_UDP) {
359 1.41 fvdl #ifdef INET6
360 1.41 fvdl if (so->so_proto->pr_domain->dom_family == AF_INET6)
361 1.41 fvdl tslp = nfs_udp6sock;
362 1.41 fvdl else
363 1.41 fvdl #endif
364 1.10 mycroft tslp = nfs_udpsock;
365 1.10 mycroft if (tslp->ns_flag & SLP_VALID) {
366 1.10 mycroft m_freem(mynam);
367 1.10 mycroft return (EPERM);
368 1.10 mycroft }
369 1.10 mycroft #ifdef ISO
370 1.10 mycroft } else if (so->so_proto->pr_protocol == ISOPROTO_CLTP) {
371 1.10 mycroft tslp = nfs_cltpsock;
372 1.10 mycroft if (tslp->ns_flag & SLP_VALID) {
373 1.10 mycroft m_freem(mynam);
374 1.10 mycroft return (EPERM);
375 1.10 mycroft }
376 1.10 mycroft #endif /* ISO */
377 1.10 mycroft }
378 1.10 mycroft if (so->so_type == SOCK_STREAM)
379 1.19 fvdl siz = NFS_MAXPACKET + sizeof (u_long);
380 1.10 mycroft else
381 1.1 cgd siz = NFS_MAXPACKET;
382 1.19 fvdl error = soreserve(so, siz, siz);
383 1.19 fvdl if (error) {
384 1.10 mycroft m_freem(mynam);
385 1.10 mycroft return (error);
386 1.10 mycroft }
387 1.1 cgd
388 1.1 cgd /*
389 1.1 cgd * Set protocol specific options { for now TCP only } and
390 1.1 cgd * reserve some space. For datagram sockets, this can get called
391 1.1 cgd * repeatedly for the same socket, but that isn't harmful.
392 1.1 cgd */
393 1.10 mycroft if (so->so_type == SOCK_STREAM) {
394 1.1 cgd MGET(m, M_WAIT, MT_SOOPTS);
395 1.19 fvdl *mtod(m, int32_t *) = 1;
396 1.19 fvdl m->m_len = sizeof(int32_t);
397 1.1 cgd sosetopt(so, SOL_SOCKET, SO_KEEPALIVE, m);
398 1.1 cgd }
399 1.41 fvdl if ((so->so_proto->pr_domain->dom_family == AF_INET
400 1.41 fvdl #ifdef INET6
401 1.41 fvdl || so->so_proto->pr_domain->dom_family == AF_INET6
402 1.41 fvdl #endif
403 1.41 fvdl ) &&
404 1.10 mycroft so->so_proto->pr_protocol == IPPROTO_TCP) {
405 1.1 cgd MGET(m, M_WAIT, MT_SOOPTS);
406 1.19 fvdl *mtod(m, int32_t *) = 1;
407 1.19 fvdl m->m_len = sizeof(int32_t);
408 1.1 cgd sosetopt(so, IPPROTO_TCP, TCP_NODELAY, m);
409 1.1 cgd }
410 1.1 cgd so->so_rcv.sb_flags &= ~SB_NOINTR;
411 1.1 cgd so->so_rcv.sb_timeo = 0;
412 1.1 cgd so->so_snd.sb_flags &= ~SB_NOINTR;
413 1.1 cgd so->so_snd.sb_timeo = 0;
414 1.10 mycroft if (tslp)
415 1.10 mycroft slp = tslp;
416 1.10 mycroft else {
417 1.10 mycroft slp = (struct nfssvc_sock *)
418 1.10 mycroft malloc(sizeof (struct nfssvc_sock), M_NFSSVC, M_WAITOK);
419 1.32 perry memset((caddr_t)slp, 0, sizeof (struct nfssvc_sock));
420 1.12 mycroft TAILQ_INIT(&slp->ns_uidlruhead);
421 1.12 mycroft TAILQ_INSERT_TAIL(&nfssvc_sockhead, slp, ns_chain);
422 1.10 mycroft }
423 1.10 mycroft slp->ns_so = so;
424 1.10 mycroft slp->ns_nam = mynam;
425 1.10 mycroft fp->f_count++;
426 1.10 mycroft slp->ns_fp = fp;
427 1.14 mycroft s = splsoftnet();
428 1.10 mycroft so->so_upcallarg = (caddr_t)slp;
429 1.10 mycroft so->so_upcall = nfsrv_rcv;
430 1.29 matt so->so_rcv.sb_flags |= SB_UPCALL;
431 1.10 mycroft slp->ns_flag = (SLP_VALID | SLP_NEEDQ);
432 1.10 mycroft nfsrv_wakenfsd(slp);
433 1.10 mycroft splx(s);
434 1.10 mycroft return (0);
435 1.10 mycroft }
436 1.1 cgd
437 1.10 mycroft /*
438 1.10 mycroft * Called by nfssvc() for nfsds. Just loops around servicing rpc requests
439 1.10 mycroft * until it is killed by a signal.
440 1.10 mycroft */
441 1.18 christos int
442 1.10 mycroft nfssvc_nfsd(nsd, argp, p)
443 1.10 mycroft struct nfsd_srvargs *nsd;
444 1.10 mycroft caddr_t argp;
445 1.10 mycroft struct proc *p;
446 1.10 mycroft {
447 1.38 augustss struct mbuf *m;
448 1.38 augustss int siz;
449 1.38 augustss struct nfssvc_sock *slp;
450 1.38 augustss struct socket *so;
451 1.38 augustss int *solockp;
452 1.19 fvdl struct nfsd *nfsd = nsd->nsd_nfsd;
453 1.19 fvdl struct nfsrv_descript *nd = NULL;
454 1.19 fvdl struct mbuf *mreq;
455 1.19 fvdl int error = 0, cacherep, s, sotype, writes_todo;
456 1.19 fvdl u_quad_t cur_usec;
457 1.19 fvdl
458 1.19 fvdl #ifndef nolint
459 1.19 fvdl cacherep = RC_DOIT;
460 1.19 fvdl writes_todo = 0;
461 1.19 fvdl #endif
462 1.14 mycroft s = splsoftnet();
463 1.19 fvdl if (nfsd == (struct nfsd *)0) {
464 1.19 fvdl nsd->nsd_nfsd = nfsd = (struct nfsd *)
465 1.10 mycroft malloc(sizeof (struct nfsd), M_NFSD, M_WAITOK);
466 1.32 perry memset((caddr_t)nfsd, 0, sizeof (struct nfsd));
467 1.19 fvdl nfsd->nfsd_procp = p;
468 1.19 fvdl TAILQ_INSERT_TAIL(&nfsd_head, nfsd, nfsd_chain);
469 1.10 mycroft nfs_numnfsd++;
470 1.10 mycroft }
471 1.33 mycroft p->p_holdcnt++;
472 1.1 cgd /*
473 1.10 mycroft * Loop getting rpc requests until SIGKILL.
474 1.1 cgd */
475 1.1 cgd for (;;) {
476 1.19 fvdl if ((nfsd->nfsd_flag & NFSD_REQINPROG) == 0) {
477 1.19 fvdl while (nfsd->nfsd_slp == (struct nfssvc_sock *)0 &&
478 1.12 mycroft (nfsd_head_flag & NFSD_CHECKSLP) == 0) {
479 1.19 fvdl nfsd->nfsd_flag |= NFSD_WAITING;
480 1.10 mycroft nfsd_waiting++;
481 1.19 fvdl error = tsleep((caddr_t)nfsd, PSOCK | PCATCH,
482 1.19 fvdl "nfsd", 0);
483 1.10 mycroft nfsd_waiting--;
484 1.10 mycroft if (error)
485 1.10 mycroft goto done;
486 1.10 mycroft }
487 1.19 fvdl if (nfsd->nfsd_slp == (struct nfssvc_sock *)0 &&
488 1.12 mycroft (nfsd_head_flag & NFSD_CHECKSLP) != 0) {
489 1.12 mycroft for (slp = nfssvc_sockhead.tqh_first; slp != 0;
490 1.12 mycroft slp = slp->ns_chain.tqe_next) {
491 1.10 mycroft if ((slp->ns_flag & (SLP_VALID | SLP_DOREC))
492 1.10 mycroft == (SLP_VALID | SLP_DOREC)) {
493 1.10 mycroft slp->ns_flag &= ~SLP_DOREC;
494 1.10 mycroft slp->ns_sref++;
495 1.19 fvdl nfsd->nfsd_slp = slp;
496 1.10 mycroft break;
497 1.10 mycroft }
498 1.10 mycroft }
499 1.12 mycroft if (slp == 0)
500 1.12 mycroft nfsd_head_flag &= ~NFSD_CHECKSLP;
501 1.10 mycroft }
502 1.19 fvdl if ((slp = nfsd->nfsd_slp) == (struct nfssvc_sock *)0)
503 1.10 mycroft continue;
504 1.10 mycroft if (slp->ns_flag & SLP_VALID) {
505 1.10 mycroft if (slp->ns_flag & SLP_DISCONN)
506 1.10 mycroft nfsrv_zapsock(slp);
507 1.10 mycroft else if (slp->ns_flag & SLP_NEEDQ) {
508 1.10 mycroft slp->ns_flag &= ~SLP_NEEDQ;
509 1.10 mycroft (void) nfs_sndlock(&slp->ns_solock,
510 1.10 mycroft (struct nfsreq *)0);
511 1.10 mycroft nfsrv_rcv(slp->ns_so, (caddr_t)slp,
512 1.10 mycroft M_WAIT);
513 1.10 mycroft nfs_sndunlock(&slp->ns_solock);
514 1.10 mycroft }
515 1.19 fvdl error = nfsrv_dorec(slp, nfsd, &nd);
516 1.19 fvdl cur_usec = (u_quad_t)time.tv_sec * 1000000 +
517 1.19 fvdl (u_quad_t)time.tv_usec;
518 1.19 fvdl if (error && slp->ns_tq.lh_first &&
519 1.19 fvdl slp->ns_tq.lh_first->nd_time <= cur_usec) {
520 1.19 fvdl error = 0;
521 1.19 fvdl cacherep = RC_DOIT;
522 1.19 fvdl writes_todo = 1;
523 1.19 fvdl } else
524 1.19 fvdl writes_todo = 0;
525 1.19 fvdl nfsd->nfsd_flag |= NFSD_REQINPROG;
526 1.1 cgd }
527 1.10 mycroft } else {
528 1.10 mycroft error = 0;
529 1.19 fvdl slp = nfsd->nfsd_slp;
530 1.10 mycroft }
531 1.10 mycroft if (error || (slp->ns_flag & SLP_VALID) == 0) {
532 1.19 fvdl if (nd) {
533 1.19 fvdl free((caddr_t)nd, M_NFSRVDESC);
534 1.19 fvdl nd = NULL;
535 1.19 fvdl }
536 1.19 fvdl nfsd->nfsd_slp = (struct nfssvc_sock *)0;
537 1.19 fvdl nfsd->nfsd_flag &= ~NFSD_REQINPROG;
538 1.10 mycroft nfsrv_slpderef(slp);
539 1.1 cgd continue;
540 1.1 cgd }
541 1.10 mycroft splx(s);
542 1.10 mycroft so = slp->ns_so;
543 1.10 mycroft sotype = so->so_type;
544 1.10 mycroft if (so->so_proto->pr_flags & PR_CONNREQUIRED)
545 1.10 mycroft solockp = &slp->ns_solock;
546 1.10 mycroft else
547 1.10 mycroft solockp = (int *)0;
548 1.19 fvdl if (nd) {
549 1.19 fvdl nd->nd_starttime = time;
550 1.19 fvdl if (nd->nd_nam2)
551 1.19 fvdl nd->nd_nam = nd->nd_nam2;
552 1.19 fvdl else
553 1.19 fvdl nd->nd_nam = slp->ns_nam;
554 1.19 fvdl
555 1.19 fvdl /*
556 1.19 fvdl * Check to see if authorization is needed.
557 1.19 fvdl */
558 1.19 fvdl if (nfsd->nfsd_flag & NFSD_NEEDAUTH) {
559 1.19 fvdl nfsd->nfsd_flag &= ~NFSD_NEEDAUTH;
560 1.19 fvdl nsd->nsd_haddr = mtod(nd->nd_nam,
561 1.19 fvdl struct sockaddr_in *)->sin_addr.s_addr;
562 1.19 fvdl nsd->nsd_authlen = nfsd->nfsd_authlen;
563 1.19 fvdl nsd->nsd_verflen = nfsd->nfsd_verflen;
564 1.19 fvdl if (!copyout(nfsd->nfsd_authstr,nsd->nsd_authstr,
565 1.19 fvdl nfsd->nfsd_authlen) &&
566 1.19 fvdl !copyout(nfsd->nfsd_verfstr, nsd->nsd_verfstr,
567 1.19 fvdl nfsd->nfsd_verflen) &&
568 1.33 mycroft !copyout((caddr_t)nsd, argp, sizeof (*nsd))) {
569 1.33 mycroft p->p_holdcnt--;
570 1.19 fvdl return (ENEEDAUTH);
571 1.33 mycroft }
572 1.19 fvdl cacherep = RC_DROPIT;
573 1.19 fvdl } else
574 1.19 fvdl cacherep = nfsrv_getcache(nd, slp, &mreq);
575 1.19 fvdl
576 1.19 fvdl /*
577 1.19 fvdl * Check for just starting up for NQNFS and send
578 1.19 fvdl * fake "try again later" replies to the NQNFS clients.
579 1.19 fvdl */
580 1.19 fvdl if (notstarted && nqnfsstarttime <= time.tv_sec) {
581 1.10 mycroft if (modify_flag) {
582 1.10 mycroft nqnfsstarttime = time.tv_sec + nqsrv_writeslack;
583 1.10 mycroft modify_flag = 0;
584 1.10 mycroft } else
585 1.10 mycroft notstarted = 0;
586 1.19 fvdl }
587 1.19 fvdl if (notstarted) {
588 1.19 fvdl if ((nd->nd_flag & ND_NQNFS) == 0)
589 1.10 mycroft cacherep = RC_DROPIT;
590 1.10 mycroft else if (nd->nd_procnum != NFSPROC_WRITE) {
591 1.10 mycroft nd->nd_procnum = NFSPROC_NOOP;
592 1.10 mycroft nd->nd_repstat = NQNFS_TRYLATER;
593 1.10 mycroft cacherep = RC_DOIT;
594 1.10 mycroft } else
595 1.10 mycroft modify_flag = 1;
596 1.19 fvdl } else if (nfsd->nfsd_flag & NFSD_AUTHFAIL) {
597 1.19 fvdl nfsd->nfsd_flag &= ~NFSD_AUTHFAIL;
598 1.10 mycroft nd->nd_procnum = NFSPROC_NOOP;
599 1.19 fvdl nd->nd_repstat = (NFSERR_AUTHERR | AUTH_TOOWEAK);
600 1.1 cgd cacherep = RC_DOIT;
601 1.19 fvdl }
602 1.10 mycroft }
603 1.10 mycroft
604 1.19 fvdl /*
605 1.19 fvdl * Loop to get all the write rpc relies that have been
606 1.19 fvdl * gathered together.
607 1.19 fvdl */
608 1.19 fvdl do {
609 1.34 sommerfe #ifdef DIAGNOSTIC
610 1.34 sommerfe int lockcount;
611 1.34 sommerfe #endif
612 1.19 fvdl switch (cacherep) {
613 1.19 fvdl case RC_DOIT:
614 1.34 sommerfe #ifdef DIAGNOSTIC
615 1.34 sommerfe /*
616 1.34 sommerfe * NFS server procs should neither release
617 1.34 sommerfe * locks already held, nor leave things
618 1.34 sommerfe * locked. Catch this sooner, rather than
619 1.34 sommerfe * later (when we try to relock something we
620 1.34 sommerfe * already have locked). Careful inspection
621 1.34 sommerfe * of the failing routine usually turns up the
622 1.34 sommerfe * lock leak.. once we know what it is..
623 1.34 sommerfe */
624 1.34 sommerfe lockcount = p->p_locks;
625 1.34 sommerfe #endif
626 1.44 fvdl if (writes_todo || (!(nd->nd_flag & ND_NFSV3) &&
627 1.44 fvdl nd->nd_procnum == NFSPROC_WRITE &&
628 1.44 fvdl nfsrvw_procrastinate > 0 && !notstarted))
629 1.19 fvdl error = nfsrv_writegather(&nd, slp,
630 1.19 fvdl nfsd->nfsd_procp, &mreq);
631 1.19 fvdl else
632 1.19 fvdl error = (*(nfsrv3_procs[nd->nd_procnum]))(nd,
633 1.19 fvdl slp, nfsd->nfsd_procp, &mreq);
634 1.34 sommerfe #ifdef DIAGNOSTIC
635 1.34 sommerfe if (p->p_locks != lockcount) {
636 1.34 sommerfe /*
637 1.34 sommerfe * If you see this panic, audit
638 1.34 sommerfe * nfsrv3_procs[nd->nd_procnum] for vnode
639 1.34 sommerfe * locking errors (usually, it's due to
640 1.34 sommerfe * forgetting to vput() something).
641 1.34 sommerfe */
642 1.46 matt #ifdef DEBUG
643 1.46 matt extern void printlockedvnodes(void);
644 1.46 matt printlockedvnodes();
645 1.46 matt #endif
646 1.46 matt printf("nfsd: locking botch in op %d"
647 1.46 matt " (before %d, after %d)\n",
648 1.46 matt nd ? nd->nd_procnum : -1,
649 1.46 matt lockcount, p->p_locks);
650 1.34 sommerfe }
651 1.34 sommerfe #endif
652 1.19 fvdl if (mreq == NULL)
653 1.19 fvdl break;
654 1.10 mycroft if (error) {
655 1.10 mycroft if (nd->nd_procnum != NQNFSPROC_VACATED)
656 1.10 mycroft nfsstats.srv_errs++;
657 1.19 fvdl nfsrv_updatecache(nd, FALSE, mreq);
658 1.19 fvdl if (nd->nd_nam2)
659 1.19 fvdl m_freem(nd->nd_nam2);
660 1.1 cgd break;
661 1.1 cgd }
662 1.10 mycroft nfsstats.srvrpccnt[nd->nd_procnum]++;
663 1.19 fvdl nfsrv_updatecache(nd, TRUE, mreq);
664 1.10 mycroft nd->nd_mrep = (struct mbuf *)0;
665 1.19 fvdl case RC_REPLY:
666 1.1 cgd m = mreq;
667 1.1 cgd siz = 0;
668 1.1 cgd while (m) {
669 1.1 cgd siz += m->m_len;
670 1.1 cgd m = m->m_next;
671 1.1 cgd }
672 1.1 cgd if (siz <= 0 || siz > NFS_MAXPACKET) {
673 1.21 christos printf("mbuf siz=%d\n",siz);
674 1.1 cgd panic("Bad nfs svc reply");
675 1.1 cgd }
676 1.10 mycroft m = mreq;
677 1.10 mycroft m->m_pkthdr.len = siz;
678 1.10 mycroft m->m_pkthdr.rcvif = (struct ifnet *)0;
679 1.1 cgd /*
680 1.10 mycroft * For stream protocols, prepend a Sun RPC
681 1.1 cgd * Record Mark.
682 1.1 cgd */
683 1.10 mycroft if (sotype == SOCK_STREAM) {
684 1.10 mycroft M_PREPEND(m, NFSX_UNSIGNED, M_WAIT);
685 1.17 cgd *mtod(m, u_int32_t *) = htonl(0x80000000 | siz);
686 1.10 mycroft }
687 1.10 mycroft if (solockp)
688 1.10 mycroft (void) nfs_sndlock(solockp, (struct nfsreq *)0);
689 1.10 mycroft if (slp->ns_flag & SLP_VALID)
690 1.19 fvdl error = nfs_send(so, nd->nd_nam2, m, NULL);
691 1.10 mycroft else {
692 1.10 mycroft error = EPIPE;
693 1.10 mycroft m_freem(m);
694 1.10 mycroft }
695 1.10 mycroft if (nfsrtton)
696 1.19 fvdl nfsd_rt(sotype, nd, cacherep);
697 1.19 fvdl if (nd->nd_nam2)
698 1.19 fvdl MFREE(nd->nd_nam2, m);
699 1.10 mycroft if (nd->nd_mrep)
700 1.10 mycroft m_freem(nd->nd_mrep);
701 1.10 mycroft if (error == EPIPE)
702 1.10 mycroft nfsrv_zapsock(slp);
703 1.10 mycroft if (solockp)
704 1.10 mycroft nfs_sndunlock(solockp);
705 1.10 mycroft if (error == EINTR || error == ERESTART) {
706 1.19 fvdl free((caddr_t)nd, M_NFSRVDESC);
707 1.10 mycroft nfsrv_slpderef(slp);
708 1.14 mycroft s = splsoftnet();
709 1.10 mycroft goto done;
710 1.1 cgd }
711 1.1 cgd break;
712 1.19 fvdl case RC_DROPIT:
713 1.10 mycroft if (nfsrtton)
714 1.19 fvdl nfsd_rt(sotype, nd, cacherep);
715 1.10 mycroft m_freem(nd->nd_mrep);
716 1.19 fvdl m_freem(nd->nd_nam2);
717 1.1 cgd break;
718 1.19 fvdl };
719 1.19 fvdl if (nd) {
720 1.19 fvdl FREE((caddr_t)nd, M_NFSRVDESC);
721 1.19 fvdl nd = NULL;
722 1.19 fvdl }
723 1.19 fvdl
724 1.19 fvdl /*
725 1.19 fvdl * Check to see if there are outstanding writes that
726 1.19 fvdl * need to be serviced.
727 1.19 fvdl */
728 1.19 fvdl cur_usec = (u_quad_t)time.tv_sec * 1000000 +
729 1.19 fvdl (u_quad_t)time.tv_usec;
730 1.19 fvdl s = splsoftclock();
731 1.19 fvdl if (slp->ns_tq.lh_first &&
732 1.19 fvdl slp->ns_tq.lh_first->nd_time <= cur_usec) {
733 1.19 fvdl cacherep = RC_DOIT;
734 1.19 fvdl writes_todo = 1;
735 1.19 fvdl } else
736 1.19 fvdl writes_todo = 0;
737 1.19 fvdl splx(s);
738 1.19 fvdl } while (writes_todo);
739 1.14 mycroft s = splsoftnet();
740 1.19 fvdl if (nfsrv_dorec(slp, nfsd, &nd)) {
741 1.19 fvdl nfsd->nfsd_flag &= ~NFSD_REQINPROG;
742 1.19 fvdl nfsd->nfsd_slp = NULL;
743 1.10 mycroft nfsrv_slpderef(slp);
744 1.10 mycroft }
745 1.1 cgd }
746 1.10 mycroft done:
747 1.33 mycroft p->p_holdcnt--;
748 1.19 fvdl TAILQ_REMOVE(&nfsd_head, nfsd, nfsd_chain);
749 1.10 mycroft splx(s);
750 1.19 fvdl free((caddr_t)nfsd, M_NFSD);
751 1.10 mycroft nsd->nsd_nfsd = (struct nfsd *)0;
752 1.10 mycroft if (--nfs_numnfsd == 0)
753 1.10 mycroft nfsrv_init(TRUE); /* Reinitialize everything */
754 1.1 cgd return (error);
755 1.1 cgd }
756 1.1 cgd
757 1.10 mycroft /*
758 1.10 mycroft * Shut down a socket associated with an nfssvc_sock structure.
759 1.10 mycroft * Should be called with the send lock set, if required.
760 1.10 mycroft * The trick here is to increment the sref at the start, so that the nfsds
761 1.10 mycroft * will stop using it and clear ns_flag at the end so that it will not be
762 1.10 mycroft * reassigned during cleanup.
763 1.10 mycroft */
764 1.18 christos void
765 1.10 mycroft nfsrv_zapsock(slp)
766 1.38 augustss struct nfssvc_sock *slp;
767 1.10 mycroft {
768 1.38 augustss struct nfsuid *nuidp, *nnuidp;
769 1.38 augustss struct nfsrv_descript *nwp, *nnwp;
770 1.10 mycroft struct socket *so;
771 1.10 mycroft struct file *fp;
772 1.10 mycroft struct mbuf *m;
773 1.19 fvdl int s;
774 1.10 mycroft
775 1.10 mycroft slp->ns_flag &= ~SLP_ALLFLAGS;
776 1.19 fvdl fp = slp->ns_fp;
777 1.19 fvdl if (fp) {
778 1.35 thorpej FILE_USE(fp);
779 1.10 mycroft slp->ns_fp = (struct file *)0;
780 1.10 mycroft so = slp->ns_so;
781 1.10 mycroft so->so_upcall = NULL;
782 1.29 matt so->so_upcallarg = NULL;
783 1.29 matt so->so_rcv.sb_flags &= ~SB_UPCALL;
784 1.10 mycroft soshutdown(so, 2);
785 1.10 mycroft closef(fp, (struct proc *)0);
786 1.10 mycroft if (slp->ns_nam)
787 1.10 mycroft MFREE(slp->ns_nam, m);
788 1.10 mycroft m_freem(slp->ns_raw);
789 1.10 mycroft m_freem(slp->ns_rec);
790 1.12 mycroft for (nuidp = slp->ns_uidlruhead.tqh_first; nuidp != 0;
791 1.12 mycroft nuidp = nnuidp) {
792 1.12 mycroft nnuidp = nuidp->nu_lru.tqe_next;
793 1.12 mycroft LIST_REMOVE(nuidp, nu_hash);
794 1.12 mycroft TAILQ_REMOVE(&slp->ns_uidlruhead, nuidp, nu_lru);
795 1.19 fvdl if (nuidp->nu_flag & NU_NAM)
796 1.19 fvdl m_freem(nuidp->nu_nam);
797 1.12 mycroft free((caddr_t)nuidp, M_NFSUID);
798 1.12 mycroft }
799 1.19 fvdl s = splsoftclock();
800 1.19 fvdl for (nwp = slp->ns_tq.lh_first; nwp; nwp = nnwp) {
801 1.19 fvdl nnwp = nwp->nd_tq.le_next;
802 1.19 fvdl LIST_REMOVE(nwp, nd_tq);
803 1.19 fvdl free((caddr_t)nwp, M_NFSRVDESC);
804 1.19 fvdl }
805 1.19 fvdl LIST_INIT(&slp->ns_tq);
806 1.19 fvdl splx(s);
807 1.10 mycroft }
808 1.10 mycroft }
809 1.10 mycroft
810 1.10 mycroft /*
811 1.10 mycroft * Derefence a server socket structure. If it has no more references and
812 1.10 mycroft * is no longer valid, you can throw it away.
813 1.10 mycroft */
814 1.10 mycroft void
815 1.10 mycroft nfsrv_slpderef(slp)
816 1.38 augustss struct nfssvc_sock *slp;
817 1.10 mycroft {
818 1.10 mycroft if (--(slp->ns_sref) == 0 && (slp->ns_flag & SLP_VALID) == 0) {
819 1.12 mycroft TAILQ_REMOVE(&nfssvc_sockhead, slp, ns_chain);
820 1.10 mycroft free((caddr_t)slp, M_NFSSVC);
821 1.10 mycroft }
822 1.10 mycroft }
823 1.10 mycroft
824 1.10 mycroft /*
825 1.10 mycroft * Initialize the data structures for the server.
826 1.10 mycroft * Handshake with any new nfsds starting up to avoid any chance of
827 1.10 mycroft * corruption.
828 1.10 mycroft */
829 1.10 mycroft void
830 1.10 mycroft nfsrv_init(terminating)
831 1.10 mycroft int terminating;
832 1.10 mycroft {
833 1.38 augustss struct nfssvc_sock *slp, *nslp;
834 1.10 mycroft
835 1.12 mycroft if (nfssvc_sockhead_flag & SLP_INIT)
836 1.10 mycroft panic("nfsd init");
837 1.12 mycroft nfssvc_sockhead_flag |= SLP_INIT;
838 1.10 mycroft if (terminating) {
839 1.12 mycroft for (slp = nfssvc_sockhead.tqh_first; slp != 0; slp = nslp) {
840 1.12 mycroft nslp = slp->ns_chain.tqe_next;
841 1.10 mycroft if (slp->ns_flag & SLP_VALID)
842 1.10 mycroft nfsrv_zapsock(slp);
843 1.12 mycroft TAILQ_REMOVE(&nfssvc_sockhead, slp, ns_chain);
844 1.12 mycroft free((caddr_t)slp, M_NFSSVC);
845 1.10 mycroft }
846 1.10 mycroft nfsrv_cleancache(); /* And clear out server cache */
847 1.26 fvdl } else
848 1.26 fvdl nfs_pub.np_valid = 0;
849 1.12 mycroft
850 1.12 mycroft TAILQ_INIT(&nfssvc_sockhead);
851 1.12 mycroft nfssvc_sockhead_flag &= ~SLP_INIT;
852 1.12 mycroft if (nfssvc_sockhead_flag & SLP_WANTINIT) {
853 1.12 mycroft nfssvc_sockhead_flag &= ~SLP_WANTINIT;
854 1.12 mycroft wakeup((caddr_t)&nfssvc_sockhead);
855 1.12 mycroft }
856 1.12 mycroft
857 1.12 mycroft TAILQ_INIT(&nfsd_head);
858 1.12 mycroft nfsd_head_flag &= ~NFSD_CHECKSLP;
859 1.12 mycroft
860 1.10 mycroft nfs_udpsock = (struct nfssvc_sock *)
861 1.10 mycroft malloc(sizeof (struct nfssvc_sock), M_NFSSVC, M_WAITOK);
862 1.32 perry memset((caddr_t)nfs_udpsock, 0, sizeof (struct nfssvc_sock));
863 1.12 mycroft TAILQ_INIT(&nfs_udpsock->ns_uidlruhead);
864 1.12 mycroft TAILQ_INSERT_HEAD(&nfssvc_sockhead, nfs_udpsock, ns_chain);
865 1.41 fvdl
866 1.41 fvdl #ifdef INET6
867 1.41 fvdl nfs_udp6sock = (struct nfssvc_sock *)
868 1.41 fvdl malloc(sizeof (struct nfssvc_sock), M_NFSSVC, M_WAITOK);
869 1.41 fvdl memset((caddr_t)nfs_udp6sock, 0, sizeof (struct nfssvc_sock));
870 1.41 fvdl TAILQ_INIT(&nfs_udp6sock->ns_uidlruhead);
871 1.41 fvdl TAILQ_INSERT_TAIL(&nfssvc_sockhead, nfs_udp6sock, ns_chain);
872 1.41 fvdl #endif
873 1.12 mycroft
874 1.47 chs #ifdef ISO
875 1.10 mycroft nfs_cltpsock = (struct nfssvc_sock *)
876 1.10 mycroft malloc(sizeof (struct nfssvc_sock), M_NFSSVC, M_WAITOK);
877 1.32 perry memset((caddr_t)nfs_cltpsock, 0, sizeof (struct nfssvc_sock));
878 1.12 mycroft TAILQ_INIT(&nfs_cltpsock->ns_uidlruhead);
879 1.12 mycroft TAILQ_INSERT_TAIL(&nfssvc_sockhead, nfs_cltpsock, ns_chain);
880 1.47 chs #endif
881 1.10 mycroft }
882 1.10 mycroft
883 1.10 mycroft /*
884 1.10 mycroft * Add entries to the server monitor log.
885 1.10 mycroft */
886 1.10 mycroft static void
887 1.19 fvdl nfsd_rt(sotype, nd, cacherep)
888 1.10 mycroft int sotype;
889 1.38 augustss struct nfsrv_descript *nd;
890 1.10 mycroft int cacherep;
891 1.10 mycroft {
892 1.38 augustss struct drt *rt;
893 1.10 mycroft
894 1.10 mycroft rt = &nfsdrt.drt[nfsdrt.pos];
895 1.10 mycroft if (cacherep == RC_DOIT)
896 1.10 mycroft rt->flag = 0;
897 1.10 mycroft else if (cacherep == RC_REPLY)
898 1.10 mycroft rt->flag = DRT_CACHEREPLY;
899 1.10 mycroft else
900 1.10 mycroft rt->flag = DRT_CACHEDROP;
901 1.10 mycroft if (sotype == SOCK_STREAM)
902 1.10 mycroft rt->flag |= DRT_TCP;
903 1.19 fvdl if (nd->nd_flag & ND_NQNFS)
904 1.10 mycroft rt->flag |= DRT_NQNFS;
905 1.19 fvdl else if (nd->nd_flag & ND_NFSV3)
906 1.19 fvdl rt->flag |= DRT_NFSV3;
907 1.10 mycroft rt->proc = nd->nd_procnum;
908 1.19 fvdl if (mtod(nd->nd_nam, struct sockaddr *)->sa_family == AF_INET)
909 1.19 fvdl rt->ipadr = mtod(nd->nd_nam, struct sockaddr_in *)->sin_addr.s_addr;
910 1.10 mycroft else
911 1.19 fvdl rt->ipadr = INADDR_ANY;
912 1.19 fvdl rt->resptime = ((time.tv_sec - nd->nd_starttime.tv_sec) * 1000000) +
913 1.19 fvdl (time.tv_usec - nd->nd_starttime.tv_usec);
914 1.10 mycroft rt->tstamp = time;
915 1.10 mycroft nfsdrt.pos = (nfsdrt.pos + 1) % NFSRTTLOGSIZ;
916 1.10 mycroft }
917 1.3 glass #endif /* NFSSERVER */
918 1.3 glass
919 1.24 thorpej #ifdef NFS
920 1.22 thorpej
921 1.22 thorpej int nfs_defect = 0;
922 1.1 cgd /*
923 1.39 tsarna * Asynchronous I/O threads for client nfs.
924 1.10 mycroft * They do read-ahead and write-behind operations on the block I/O cache.
925 1.10 mycroft * Never returns unless it fails or gets killed.
926 1.1 cgd */
927 1.39 tsarna
928 1.18 christos int
929 1.10 mycroft nfssvc_iod(p)
930 1.1 cgd struct proc *p;
931 1.1 cgd {
932 1.38 augustss struct buf *bp;
933 1.38 augustss int i, myiod;
934 1.22 thorpej struct nfsmount *nmp;
935 1.22 thorpej int error = 0;
936 1.1 cgd
937 1.1 cgd /*
938 1.1 cgd * Assign my position or return error if too many already running
939 1.1 cgd */
940 1.1 cgd myiod = -1;
941 1.1 cgd for (i = 0; i < NFS_MAXASYNCDAEMON; i++)
942 1.39 tsarna if (nfs_asyncdaemon[i] == NULL) {
943 1.1 cgd myiod = i;
944 1.1 cgd break;
945 1.1 cgd }
946 1.1 cgd if (myiod == -1)
947 1.1 cgd return (EBUSY);
948 1.39 tsarna nfs_asyncdaemon[myiod] = p;
949 1.1 cgd nfs_numasync++;
950 1.33 mycroft p->p_holdcnt++;
951 1.1 cgd /*
952 1.42 nathanw * Just loop around doing our stuff until SIGKILL
953 1.1 cgd */
954 1.1 cgd for (;;) {
955 1.22 thorpej while (((nmp = nfs_iodmount[myiod]) == NULL
956 1.22 thorpej || nmp->nm_bufq.tqh_first == NULL)
957 1.22 thorpej && error == 0) {
958 1.22 thorpej if (nmp)
959 1.22 thorpej nmp->nm_bufqiods--;
960 1.19 fvdl nfs_iodwant[myiod] = p;
961 1.22 thorpej nfs_iodmount[myiod] = NULL;
962 1.19 fvdl error = tsleep((caddr_t)&nfs_iodwant[myiod],
963 1.19 fvdl PWAIT | PCATCH, "nfsidl", 0);
964 1.19 fvdl }
965 1.45 chs while (nmp != NULL && (bp = nmp->nm_bufq.tqh_first) != NULL) {
966 1.19 fvdl /* Take one off the front of the list */
967 1.22 thorpej TAILQ_REMOVE(&nmp->nm_bufq, bp, b_freelist);
968 1.22 thorpej nmp->nm_bufqlen--;
969 1.22 thorpej if (nmp->nm_bufqwant && nmp->nm_bufqlen < 2 * nfs_numasync) {
970 1.22 thorpej nmp->nm_bufqwant = FALSE;
971 1.22 thorpej wakeup(&nmp->nm_bufq);
972 1.22 thorpej }
973 1.19 fvdl if (bp->b_flags & B_READ)
974 1.19 fvdl (void) nfs_doio(bp, bp->b_rcred, (struct proc *)0);
975 1.22 thorpej else
976 1.19 fvdl (void) nfs_doio(bp, bp->b_wcred, (struct proc *)0);
977 1.22 thorpej /*
978 1.22 thorpej * If there are more than one iod on this mount, then defect
979 1.22 thorpej * so that the iods can be shared out fairly between the mounts
980 1.22 thorpej */
981 1.22 thorpej if (nfs_defect && nmp->nm_bufqiods > 1) {
982 1.22 thorpej nfs_iodmount[myiod] = NULL;
983 1.22 thorpej nmp->nm_bufqiods--;
984 1.22 thorpej break;
985 1.22 thorpej }
986 1.19 fvdl }
987 1.45 chs if (error) {
988 1.45 chs break;
989 1.45 chs }
990 1.1 cgd }
991 1.33 mycroft p->p_holdcnt--;
992 1.45 chs if (nmp)
993 1.45 chs nmp->nm_bufqiods--;
994 1.45 chs nfs_iodwant[myiod] = NULL;
995 1.45 chs nfs_iodmount[myiod] = NULL;
996 1.39 tsarna nfs_asyncdaemon[myiod] = NULL;
997 1.33 mycroft nfs_numasync--;
998 1.39 tsarna
999 1.33 mycroft return (error);
1000 1.1 cgd }
1001 1.3 glass
1002 1.39 tsarna void
1003 1.39 tsarna start_nfsio(arg)
1004 1.39 tsarna void *arg;
1005 1.39 tsarna {
1006 1.39 tsarna nfssvc_iod(curproc);
1007 1.39 tsarna
1008 1.39 tsarna kthread_exit(0);
1009 1.39 tsarna }
1010 1.39 tsarna
1011 1.39 tsarna void
1012 1.39 tsarna nfs_getset_niothreads(set)
1013 1.39 tsarna int set;
1014 1.39 tsarna {
1015 1.39 tsarna int i, have, start;
1016 1.39 tsarna
1017 1.39 tsarna for (have = 0, i = 0; i < NFS_MAXASYNCDAEMON; i++)
1018 1.39 tsarna if (nfs_asyncdaemon[i] != NULL)
1019 1.39 tsarna have++;
1020 1.39 tsarna
1021 1.39 tsarna if (set) {
1022 1.39 tsarna /* clamp to sane range */
1023 1.39 tsarna nfs_niothreads = max(0, min(nfs_niothreads, NFS_MAXASYNCDAEMON));
1024 1.39 tsarna
1025 1.39 tsarna start = nfs_niothreads - have;
1026 1.39 tsarna
1027 1.39 tsarna while (start > 0) {
1028 1.39 tsarna kthread_create1(start_nfsio, NULL, NULL, "nfsio");
1029 1.39 tsarna start--;
1030 1.39 tsarna }
1031 1.39 tsarna
1032 1.39 tsarna for (i = 0; (start < 0) && (i < NFS_MAXASYNCDAEMON); i++)
1033 1.39 tsarna if (nfs_asyncdaemon[i] != NULL) {
1034 1.39 tsarna psignal(nfs_asyncdaemon[i], SIGKILL);
1035 1.39 tsarna start++;
1036 1.39 tsarna }
1037 1.39 tsarna } else {
1038 1.40 tsarna if (nfs_niothreads >= 0)
1039 1.40 tsarna nfs_niothreads = have;
1040 1.39 tsarna }
1041 1.39 tsarna }
1042 1.19 fvdl
1043 1.10 mycroft /*
1044 1.10 mycroft * Get an authorization string for the uid by having the mount_nfs sitting
1045 1.10 mycroft * on this mount point porpous out of the kernel and do it.
1046 1.10 mycroft */
1047 1.18 christos int
1048 1.19 fvdl nfs_getauth(nmp, rep, cred, auth_str, auth_len, verf_str, verf_len, key)
1049 1.38 augustss struct nfsmount *nmp;
1050 1.10 mycroft struct nfsreq *rep;
1051 1.10 mycroft struct ucred *cred;
1052 1.10 mycroft char **auth_str;
1053 1.10 mycroft int *auth_len;
1054 1.19 fvdl char *verf_str;
1055 1.19 fvdl int *verf_len;
1056 1.19 fvdl NFSKERBKEY_T key; /* return session key */
1057 1.10 mycroft {
1058 1.10 mycroft int error = 0;
1059 1.10 mycroft
1060 1.27 fvdl while ((nmp->nm_iflag & NFSMNT_WAITAUTH) == 0) {
1061 1.27 fvdl nmp->nm_iflag |= NFSMNT_WANTAUTH;
1062 1.10 mycroft (void) tsleep((caddr_t)&nmp->nm_authtype, PSOCK,
1063 1.10 mycroft "nfsauth1", 2 * hz);
1064 1.18 christos error = nfs_sigintr(nmp, rep, rep->r_procp);
1065 1.18 christos if (error) {
1066 1.27 fvdl nmp->nm_iflag &= ~NFSMNT_WANTAUTH;
1067 1.10 mycroft return (error);
1068 1.10 mycroft }
1069 1.10 mycroft }
1070 1.27 fvdl nmp->nm_iflag &= ~(NFSMNT_WAITAUTH | NFSMNT_WANTAUTH);
1071 1.10 mycroft nmp->nm_authstr = *auth_str = (char *)malloc(RPCAUTH_MAXSIZ, M_TEMP, M_WAITOK);
1072 1.19 fvdl nmp->nm_authlen = RPCAUTH_MAXSIZ;
1073 1.19 fvdl nmp->nm_verfstr = verf_str;
1074 1.19 fvdl nmp->nm_verflen = *verf_len;
1075 1.10 mycroft nmp->nm_authuid = cred->cr_uid;
1076 1.10 mycroft wakeup((caddr_t)&nmp->nm_authstr);
1077 1.3 glass
1078 1.10 mycroft /*
1079 1.10 mycroft * And wait for mount_nfs to do its stuff.
1080 1.10 mycroft */
1081 1.27 fvdl while ((nmp->nm_iflag & NFSMNT_HASAUTH) == 0 && error == 0) {
1082 1.10 mycroft (void) tsleep((caddr_t)&nmp->nm_authlen, PSOCK,
1083 1.10 mycroft "nfsauth2", 2 * hz);
1084 1.10 mycroft error = nfs_sigintr(nmp, rep, rep->r_procp);
1085 1.10 mycroft }
1086 1.27 fvdl if (nmp->nm_iflag & NFSMNT_AUTHERR) {
1087 1.27 fvdl nmp->nm_iflag &= ~NFSMNT_AUTHERR;
1088 1.10 mycroft error = EAUTH;
1089 1.10 mycroft }
1090 1.10 mycroft if (error)
1091 1.10 mycroft free((caddr_t)*auth_str, M_TEMP);
1092 1.10 mycroft else {
1093 1.10 mycroft *auth_len = nmp->nm_authlen;
1094 1.19 fvdl *verf_len = nmp->nm_verflen;
1095 1.32 perry memcpy((caddr_t)key, (caddr_t)nmp->nm_key, sizeof (key));
1096 1.10 mycroft }
1097 1.27 fvdl nmp->nm_iflag &= ~NFSMNT_HASAUTH;
1098 1.27 fvdl nmp->nm_iflag |= NFSMNT_WAITAUTH;
1099 1.27 fvdl if (nmp->nm_iflag & NFSMNT_WANTAUTH) {
1100 1.27 fvdl nmp->nm_iflag &= ~NFSMNT_WANTAUTH;
1101 1.10 mycroft wakeup((caddr_t)&nmp->nm_authtype);
1102 1.10 mycroft }
1103 1.19 fvdl return (error);
1104 1.19 fvdl }
1105 1.19 fvdl
1106 1.19 fvdl /*
1107 1.19 fvdl * Get a nickname authenticator and verifier.
1108 1.19 fvdl */
1109 1.19 fvdl int
1110 1.19 fvdl nfs_getnickauth(nmp, cred, auth_str, auth_len, verf_str, verf_len)
1111 1.19 fvdl struct nfsmount *nmp;
1112 1.19 fvdl struct ucred *cred;
1113 1.19 fvdl char **auth_str;
1114 1.19 fvdl int *auth_len;
1115 1.19 fvdl char *verf_str;
1116 1.19 fvdl int verf_len;
1117 1.19 fvdl {
1118 1.38 augustss struct nfsuid *nuidp;
1119 1.38 augustss u_int32_t *nickp, *verfp;
1120 1.19 fvdl struct timeval ktvin, ktvout;
1121 1.19 fvdl
1122 1.19 fvdl #ifdef DIAGNOSTIC
1123 1.19 fvdl if (verf_len < (4 * NFSX_UNSIGNED))
1124 1.19 fvdl panic("nfs_getnickauth verf too small");
1125 1.19 fvdl #endif
1126 1.19 fvdl for (nuidp = NMUIDHASH(nmp, cred->cr_uid)->lh_first;
1127 1.19 fvdl nuidp != 0; nuidp = nuidp->nu_hash.le_next) {
1128 1.19 fvdl if (nuidp->nu_cr.cr_uid == cred->cr_uid)
1129 1.19 fvdl break;
1130 1.19 fvdl }
1131 1.19 fvdl if (!nuidp || nuidp->nu_expire < time.tv_sec)
1132 1.19 fvdl return (EACCES);
1133 1.19 fvdl
1134 1.19 fvdl /*
1135 1.19 fvdl * Move to the end of the lru list (end of lru == most recently used).
1136 1.19 fvdl */
1137 1.19 fvdl TAILQ_REMOVE(&nmp->nm_uidlruhead, nuidp, nu_lru);
1138 1.19 fvdl TAILQ_INSERT_TAIL(&nmp->nm_uidlruhead, nuidp, nu_lru);
1139 1.19 fvdl
1140 1.19 fvdl nickp = (u_int32_t *)malloc(2 * NFSX_UNSIGNED, M_TEMP, M_WAITOK);
1141 1.19 fvdl *nickp++ = txdr_unsigned(RPCAKN_NICKNAME);
1142 1.19 fvdl *nickp = txdr_unsigned(nuidp->nu_nickname);
1143 1.19 fvdl *auth_str = (char *)nickp;
1144 1.19 fvdl *auth_len = 2 * NFSX_UNSIGNED;
1145 1.19 fvdl
1146 1.19 fvdl /*
1147 1.19 fvdl * Now we must encrypt the verifier and package it up.
1148 1.19 fvdl */
1149 1.19 fvdl verfp = (u_int32_t *)verf_str;
1150 1.19 fvdl *verfp++ = txdr_unsigned(RPCAKN_NICKNAME);
1151 1.19 fvdl if (time.tv_sec > nuidp->nu_timestamp.tv_sec ||
1152 1.19 fvdl (time.tv_sec == nuidp->nu_timestamp.tv_sec &&
1153 1.19 fvdl time.tv_usec > nuidp->nu_timestamp.tv_usec))
1154 1.19 fvdl nuidp->nu_timestamp = time;
1155 1.19 fvdl else
1156 1.19 fvdl nuidp->nu_timestamp.tv_usec++;
1157 1.19 fvdl ktvin.tv_sec = txdr_unsigned(nuidp->nu_timestamp.tv_sec);
1158 1.19 fvdl ktvin.tv_usec = txdr_unsigned(nuidp->nu_timestamp.tv_usec);
1159 1.19 fvdl
1160 1.19 fvdl /*
1161 1.19 fvdl * Now encrypt the timestamp verifier in ecb mode using the session
1162 1.19 fvdl * key.
1163 1.19 fvdl */
1164 1.19 fvdl #ifdef NFSKERB
1165 1.19 fvdl XXX
1166 1.19 fvdl #endif
1167 1.19 fvdl
1168 1.19 fvdl *verfp++ = ktvout.tv_sec;
1169 1.19 fvdl *verfp++ = ktvout.tv_usec;
1170 1.19 fvdl *verfp = 0;
1171 1.19 fvdl return (0);
1172 1.19 fvdl }
1173 1.19 fvdl
1174 1.19 fvdl /*
1175 1.19 fvdl * Save the current nickname in a hash list entry on the mount point.
1176 1.19 fvdl */
1177 1.19 fvdl int
1178 1.19 fvdl nfs_savenickauth(nmp, cred, len, key, mdp, dposp, mrep)
1179 1.38 augustss struct nfsmount *nmp;
1180 1.19 fvdl struct ucred *cred;
1181 1.19 fvdl int len;
1182 1.19 fvdl NFSKERBKEY_T key;
1183 1.19 fvdl struct mbuf **mdp;
1184 1.19 fvdl char **dposp;
1185 1.19 fvdl struct mbuf *mrep;
1186 1.19 fvdl {
1187 1.38 augustss struct nfsuid *nuidp;
1188 1.38 augustss u_int32_t *tl;
1189 1.38 augustss int32_t t1;
1190 1.19 fvdl struct mbuf *md = *mdp;
1191 1.19 fvdl struct timeval ktvin, ktvout;
1192 1.19 fvdl u_int32_t nick;
1193 1.19 fvdl char *dpos = *dposp, *cp2;
1194 1.19 fvdl int deltasec, error = 0;
1195 1.19 fvdl
1196 1.19 fvdl if (len == (3 * NFSX_UNSIGNED)) {
1197 1.19 fvdl nfsm_dissect(tl, u_int32_t *, 3 * NFSX_UNSIGNED);
1198 1.19 fvdl ktvin.tv_sec = *tl++;
1199 1.19 fvdl ktvin.tv_usec = *tl++;
1200 1.19 fvdl nick = fxdr_unsigned(u_int32_t, *tl);
1201 1.19 fvdl
1202 1.19 fvdl /*
1203 1.19 fvdl * Decrypt the timestamp in ecb mode.
1204 1.19 fvdl */
1205 1.19 fvdl #ifdef NFSKERB
1206 1.19 fvdl XXX
1207 1.19 fvdl #endif
1208 1.19 fvdl ktvout.tv_sec = fxdr_unsigned(long, ktvout.tv_sec);
1209 1.19 fvdl ktvout.tv_usec = fxdr_unsigned(long, ktvout.tv_usec);
1210 1.19 fvdl deltasec = time.tv_sec - ktvout.tv_sec;
1211 1.19 fvdl if (deltasec < 0)
1212 1.19 fvdl deltasec = -deltasec;
1213 1.19 fvdl /*
1214 1.19 fvdl * If ok, add it to the hash list for the mount point.
1215 1.19 fvdl */
1216 1.19 fvdl if (deltasec <= NFS_KERBCLOCKSKEW) {
1217 1.19 fvdl if (nmp->nm_numuids < nuidhash_max) {
1218 1.19 fvdl nmp->nm_numuids++;
1219 1.19 fvdl nuidp = (struct nfsuid *)
1220 1.19 fvdl malloc(sizeof (struct nfsuid), M_NFSUID,
1221 1.19 fvdl M_WAITOK);
1222 1.19 fvdl } else {
1223 1.19 fvdl nuidp = nmp->nm_uidlruhead.tqh_first;
1224 1.19 fvdl LIST_REMOVE(nuidp, nu_hash);
1225 1.19 fvdl TAILQ_REMOVE(&nmp->nm_uidlruhead, nuidp,
1226 1.19 fvdl nu_lru);
1227 1.19 fvdl }
1228 1.19 fvdl nuidp->nu_flag = 0;
1229 1.19 fvdl nuidp->nu_cr.cr_uid = cred->cr_uid;
1230 1.19 fvdl nuidp->nu_expire = time.tv_sec + NFS_KERBTTL;
1231 1.19 fvdl nuidp->nu_timestamp = ktvout;
1232 1.19 fvdl nuidp->nu_nickname = nick;
1233 1.32 perry memcpy(nuidp->nu_key, key, sizeof (key));
1234 1.19 fvdl TAILQ_INSERT_TAIL(&nmp->nm_uidlruhead, nuidp,
1235 1.19 fvdl nu_lru);
1236 1.19 fvdl LIST_INSERT_HEAD(NMUIDHASH(nmp, cred->cr_uid),
1237 1.19 fvdl nuidp, nu_hash);
1238 1.19 fvdl }
1239 1.19 fvdl } else
1240 1.19 fvdl nfsm_adv(nfsm_rndup(len));
1241 1.19 fvdl nfsmout:
1242 1.19 fvdl *mdp = md;
1243 1.19 fvdl *dposp = dpos;
1244 1.10 mycroft return (error);
1245 1.10 mycroft }
1246 1.24 thorpej #endif /* NFS */
1247