nfs_subs.c revision 1.220 1 1.220 uebayasi /* $NetBSD: nfs_subs.c,v 1.220 2010/11/06 11:00:29 uebayasi Exp $ */
2 1.14 cgd
3 1.1 cgd /*
4 1.12 mycroft * Copyright (c) 1989, 1993
5 1.12 mycroft * The Regents of the University of California. All rights reserved.
6 1.1 cgd *
7 1.1 cgd * This code is derived from software contributed to Berkeley by
8 1.1 cgd * Rick Macklem at The University of Guelph.
9 1.1 cgd *
10 1.1 cgd * Redistribution and use in source and binary forms, with or without
11 1.1 cgd * modification, are permitted provided that the following conditions
12 1.1 cgd * are met:
13 1.1 cgd * 1. Redistributions of source code must retain the above copyright
14 1.1 cgd * notice, this list of conditions and the following disclaimer.
15 1.1 cgd * 2. Redistributions in binary form must reproduce the above copyright
16 1.1 cgd * notice, this list of conditions and the following disclaimer in the
17 1.1 cgd * documentation and/or other materials provided with the distribution.
18 1.127 agc * 3. Neither the name of the University nor the names of its contributors
19 1.1 cgd * may be used to endorse or promote products derived from this software
20 1.1 cgd * without specific prior written permission.
21 1.1 cgd *
22 1.1 cgd * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
23 1.1 cgd * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
24 1.1 cgd * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
25 1.1 cgd * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
26 1.1 cgd * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
27 1.1 cgd * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
28 1.1 cgd * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
29 1.1 cgd * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
30 1.1 cgd * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
31 1.1 cgd * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
32 1.1 cgd * SUCH DAMAGE.
33 1.1 cgd *
34 1.25 fvdl * @(#)nfs_subs.c 8.8 (Berkeley) 5/22/95
35 1.1 cgd */
36 1.1 cgd
37 1.83 fvdl /*
38 1.83 fvdl * Copyright 2000 Wasabi Systems, Inc.
39 1.83 fvdl * All rights reserved.
40 1.83 fvdl *
41 1.83 fvdl * Written by Frank van der Linden for Wasabi Systems, Inc.
42 1.83 fvdl *
43 1.83 fvdl * Redistribution and use in source and binary forms, with or without
44 1.83 fvdl * modification, are permitted provided that the following conditions
45 1.83 fvdl * are met:
46 1.83 fvdl * 1. Redistributions of source code must retain the above copyright
47 1.83 fvdl * notice, this list of conditions and the following disclaimer.
48 1.83 fvdl * 2. Redistributions in binary form must reproduce the above copyright
49 1.83 fvdl * notice, this list of conditions and the following disclaimer in the
50 1.83 fvdl * documentation and/or other materials provided with the distribution.
51 1.83 fvdl * 3. All advertising materials mentioning features or use of this software
52 1.83 fvdl * must display the following acknowledgement:
53 1.83 fvdl * This product includes software developed for the NetBSD Project by
54 1.83 fvdl * Wasabi Systems, Inc.
55 1.83 fvdl * 4. The name of Wasabi Systems, Inc. may not be used to endorse
56 1.83 fvdl * or promote products derived from this software without specific prior
57 1.83 fvdl * written permission.
58 1.83 fvdl *
59 1.83 fvdl * THIS SOFTWARE IS PROVIDED BY WASABI SYSTEMS, INC. ``AS IS'' AND
60 1.83 fvdl * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
61 1.83 fvdl * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
62 1.83 fvdl * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL WASABI SYSTEMS, INC
63 1.83 fvdl * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
64 1.83 fvdl * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
65 1.83 fvdl * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
66 1.83 fvdl * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
67 1.83 fvdl * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
68 1.83 fvdl * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
69 1.83 fvdl * POSSIBILITY OF SUCH DAMAGE.
70 1.83 fvdl */
71 1.99 lukem
72 1.99 lukem #include <sys/cdefs.h>
73 1.220 uebayasi __KERNEL_RCSID(0, "$NetBSD: nfs_subs.c,v 1.220 2010/11/06 11:00:29 uebayasi Exp $");
74 1.83 fvdl
75 1.210 ad #ifdef _KERNEL_OPT
76 1.82 bjh21 #include "opt_nfs.h"
77 1.210 ad #endif
78 1.25 fvdl
79 1.1 cgd /*
80 1.1 cgd * These functions support the macros and help fiddle mbuf chains for
81 1.1 cgd * the nfs op functions. They do things like create the rpc header and
82 1.1 cgd * copy data between mbuf chains and uio lists.
83 1.1 cgd */
84 1.9 mycroft #include <sys/param.h>
85 1.9 mycroft #include <sys/proc.h>
86 1.9 mycroft #include <sys/systm.h>
87 1.9 mycroft #include <sys/kernel.h>
88 1.196 yamt #include <sys/kmem.h>
89 1.9 mycroft #include <sys/mount.h>
90 1.9 mycroft #include <sys/vnode.h>
91 1.9 mycroft #include <sys/namei.h>
92 1.9 mycroft #include <sys/mbuf.h>
93 1.12 mycroft #include <sys/socket.h>
94 1.12 mycroft #include <sys/stat.h>
95 1.98 fvdl #include <sys/filedesc.h>
96 1.30 fvdl #include <sys/time.h>
97 1.43 fvdl #include <sys/dirent.h>
98 1.155 thorpej #include <sys/once.h>
99 1.162 elad #include <sys/kauth.h>
100 1.207 pooka #include <sys/atomic.h>
101 1.1 cgd
102 1.220 uebayasi #include <uvm/uvm.h>
103 1.51 mrg
104 1.9 mycroft #include <nfs/rpcv2.h>
105 1.25 fvdl #include <nfs/nfsproto.h>
106 1.9 mycroft #include <nfs/nfsnode.h>
107 1.9 mycroft #include <nfs/nfs.h>
108 1.9 mycroft #include <nfs/xdr_subs.h>
109 1.9 mycroft #include <nfs/nfsm_subs.h>
110 1.12 mycroft #include <nfs/nfsmount.h>
111 1.12 mycroft #include <nfs/nfsrtt.h>
112 1.24 christos #include <nfs/nfs_var.h>
113 1.12 mycroft
114 1.12 mycroft #include <miscfs/specfs/specdev.h>
115 1.24 christos
116 1.12 mycroft #include <netinet/in.h>
117 1.1 cgd
118 1.207 pooka static u_int32_t nfs_xid;
119 1.207 pooka
120 1.218 christos int nuidhash_max = NFS_MAXUIDHASH;
121 1.1 cgd /*
122 1.1 cgd * Data items converted to xdr at startup, since they are constant
123 1.1 cgd * This is kinda hokey, but may save a little time doing byte swaps
124 1.1 cgd */
125 1.22 cgd u_int32_t nfs_xdrneg1;
126 1.22 cgd u_int32_t rpc_call, rpc_vers, rpc_reply, rpc_msgdenied, rpc_autherr,
127 1.25 fvdl rpc_mismatch, rpc_auth_unix, rpc_msgaccepted,
128 1.12 mycroft rpc_auth_kerb;
129 1.179 yamt u_int32_t nfs_prog, nfs_true, nfs_false;
130 1.12 mycroft
131 1.1 cgd /* And other global data */
132 1.90 jdolecek const nfstype nfsv2_type[9] =
133 1.90 jdolecek { NFNON, NFREG, NFDIR, NFBLK, NFCHR, NFLNK, NFNON, NFCHR, NFNON };
134 1.90 jdolecek const nfstype nfsv3_type[9] =
135 1.90 jdolecek { NFNON, NFREG, NFDIR, NFBLK, NFCHR, NFLNK, NFSOCK, NFFIFO, NFNON };
136 1.90 jdolecek const enum vtype nv2tov_type[8] =
137 1.90 jdolecek { VNON, VREG, VDIR, VBLK, VCHR, VLNK, VNON, VNON };
138 1.90 jdolecek const enum vtype nv3tov_type[8] =
139 1.90 jdolecek { VNON, VREG, VDIR, VBLK, VCHR, VLNK, VSOCK, VFIFO };
140 1.25 fvdl int nfs_ticks;
141 1.108 christos
142 1.35 thorpej /* NFS client/server stats. */
143 1.35 thorpej struct nfsstats nfsstats;
144 1.35 thorpej
145 1.25 fvdl /*
146 1.25 fvdl * Mapping of old NFS Version 2 RPC numbers to generic numbers.
147 1.25 fvdl */
148 1.90 jdolecek const int nfsv3_procid[NFS_NPROCS] = {
149 1.25 fvdl NFSPROC_NULL,
150 1.25 fvdl NFSPROC_GETATTR,
151 1.25 fvdl NFSPROC_SETATTR,
152 1.25 fvdl NFSPROC_NOOP,
153 1.25 fvdl NFSPROC_LOOKUP,
154 1.25 fvdl NFSPROC_READLINK,
155 1.25 fvdl NFSPROC_READ,
156 1.25 fvdl NFSPROC_NOOP,
157 1.25 fvdl NFSPROC_WRITE,
158 1.25 fvdl NFSPROC_CREATE,
159 1.25 fvdl NFSPROC_REMOVE,
160 1.25 fvdl NFSPROC_RENAME,
161 1.25 fvdl NFSPROC_LINK,
162 1.25 fvdl NFSPROC_SYMLINK,
163 1.25 fvdl NFSPROC_MKDIR,
164 1.25 fvdl NFSPROC_RMDIR,
165 1.25 fvdl NFSPROC_READDIR,
166 1.25 fvdl NFSPROC_FSSTAT,
167 1.25 fvdl NFSPROC_NOOP,
168 1.25 fvdl NFSPROC_NOOP,
169 1.25 fvdl NFSPROC_NOOP,
170 1.25 fvdl NFSPROC_NOOP,
171 1.25 fvdl NFSPROC_NOOP
172 1.25 fvdl };
173 1.25 fvdl
174 1.25 fvdl /*
175 1.25 fvdl * and the reverse mapping from generic to Version 2 procedure numbers
176 1.25 fvdl */
177 1.90 jdolecek const int nfsv2_procid[NFS_NPROCS] = {
178 1.25 fvdl NFSV2PROC_NULL,
179 1.25 fvdl NFSV2PROC_GETATTR,
180 1.25 fvdl NFSV2PROC_SETATTR,
181 1.25 fvdl NFSV2PROC_LOOKUP,
182 1.25 fvdl NFSV2PROC_NOOP,
183 1.25 fvdl NFSV2PROC_READLINK,
184 1.25 fvdl NFSV2PROC_READ,
185 1.25 fvdl NFSV2PROC_WRITE,
186 1.25 fvdl NFSV2PROC_CREATE,
187 1.25 fvdl NFSV2PROC_MKDIR,
188 1.25 fvdl NFSV2PROC_SYMLINK,
189 1.25 fvdl NFSV2PROC_CREATE,
190 1.25 fvdl NFSV2PROC_REMOVE,
191 1.25 fvdl NFSV2PROC_RMDIR,
192 1.25 fvdl NFSV2PROC_RENAME,
193 1.25 fvdl NFSV2PROC_LINK,
194 1.25 fvdl NFSV2PROC_READDIR,
195 1.25 fvdl NFSV2PROC_NOOP,
196 1.25 fvdl NFSV2PROC_STATFS,
197 1.25 fvdl NFSV2PROC_NOOP,
198 1.25 fvdl NFSV2PROC_NOOP,
199 1.25 fvdl NFSV2PROC_NOOP,
200 1.25 fvdl NFSV2PROC_NOOP,
201 1.25 fvdl };
202 1.25 fvdl
203 1.25 fvdl /*
204 1.25 fvdl * Maps errno values to nfs error numbers.
205 1.25 fvdl * Use NFSERR_IO as the catch all for ones not specifically defined in
206 1.25 fvdl * RFC 1094.
207 1.25 fvdl */
208 1.90 jdolecek static const u_char nfsrv_v2errmap[ELAST] = {
209 1.25 fvdl NFSERR_PERM, NFSERR_NOENT, NFSERR_IO, NFSERR_IO, NFSERR_IO,
210 1.25 fvdl NFSERR_NXIO, NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO,
211 1.25 fvdl NFSERR_IO, NFSERR_IO, NFSERR_ACCES, NFSERR_IO, NFSERR_IO,
212 1.25 fvdl NFSERR_IO, NFSERR_EXIST, NFSERR_IO, NFSERR_NODEV, NFSERR_NOTDIR,
213 1.25 fvdl NFSERR_ISDIR, NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO,
214 1.25 fvdl NFSERR_IO, NFSERR_FBIG, NFSERR_NOSPC, NFSERR_IO, NFSERR_ROFS,
215 1.25 fvdl NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO,
216 1.25 fvdl NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO,
217 1.25 fvdl NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO,
218 1.25 fvdl NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO,
219 1.25 fvdl NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO,
220 1.25 fvdl NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO,
221 1.25 fvdl NFSERR_IO, NFSERR_IO, NFSERR_NAMETOL, NFSERR_IO, NFSERR_IO,
222 1.25 fvdl NFSERR_NOTEMPTY, NFSERR_IO, NFSERR_IO, NFSERR_DQUOT, NFSERR_STALE,
223 1.25 fvdl NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO,
224 1.25 fvdl NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO,
225 1.52 mikel NFSERR_IO, NFSERR_IO,
226 1.25 fvdl };
227 1.25 fvdl
228 1.25 fvdl /*
229 1.25 fvdl * Maps errno values to nfs error numbers.
230 1.25 fvdl * Although it is not obvious whether or not NFS clients really care if
231 1.25 fvdl * a returned error value is in the specified list for the procedure, the
232 1.25 fvdl * safest thing to do is filter them appropriately. For Version 2, the
233 1.25 fvdl * X/Open XNFS document is the only specification that defines error values
234 1.25 fvdl * for each RPC (The RFC simply lists all possible error values for all RPCs),
235 1.25 fvdl * so I have decided to not do this for Version 2.
236 1.25 fvdl * The first entry is the default error return and the rest are the valid
237 1.25 fvdl * errors for that RPC in increasing numeric order.
238 1.25 fvdl */
239 1.90 jdolecek static const short nfsv3err_null[] = {
240 1.25 fvdl 0,
241 1.25 fvdl 0,
242 1.25 fvdl };
243 1.25 fvdl
244 1.90 jdolecek static const short nfsv3err_getattr[] = {
245 1.25 fvdl NFSERR_IO,
246 1.25 fvdl NFSERR_IO,
247 1.25 fvdl NFSERR_STALE,
248 1.25 fvdl NFSERR_BADHANDLE,
249 1.25 fvdl NFSERR_SERVERFAULT,
250 1.25 fvdl 0,
251 1.25 fvdl };
252 1.25 fvdl
253 1.90 jdolecek static const short nfsv3err_setattr[] = {
254 1.25 fvdl NFSERR_IO,
255 1.25 fvdl NFSERR_PERM,
256 1.25 fvdl NFSERR_IO,
257 1.25 fvdl NFSERR_ACCES,
258 1.25 fvdl NFSERR_INVAL,
259 1.25 fvdl NFSERR_NOSPC,
260 1.25 fvdl NFSERR_ROFS,
261 1.25 fvdl NFSERR_DQUOT,
262 1.25 fvdl NFSERR_STALE,
263 1.25 fvdl NFSERR_BADHANDLE,
264 1.25 fvdl NFSERR_NOT_SYNC,
265 1.25 fvdl NFSERR_SERVERFAULT,
266 1.25 fvdl 0,
267 1.25 fvdl };
268 1.25 fvdl
269 1.90 jdolecek static const short nfsv3err_lookup[] = {
270 1.25 fvdl NFSERR_IO,
271 1.25 fvdl NFSERR_NOENT,
272 1.25 fvdl NFSERR_IO,
273 1.25 fvdl NFSERR_ACCES,
274 1.25 fvdl NFSERR_NOTDIR,
275 1.25 fvdl NFSERR_NAMETOL,
276 1.25 fvdl NFSERR_STALE,
277 1.25 fvdl NFSERR_BADHANDLE,
278 1.25 fvdl NFSERR_SERVERFAULT,
279 1.25 fvdl 0,
280 1.25 fvdl };
281 1.25 fvdl
282 1.90 jdolecek static const short nfsv3err_access[] = {
283 1.25 fvdl NFSERR_IO,
284 1.25 fvdl NFSERR_IO,
285 1.25 fvdl NFSERR_STALE,
286 1.25 fvdl NFSERR_BADHANDLE,
287 1.25 fvdl NFSERR_SERVERFAULT,
288 1.25 fvdl 0,
289 1.25 fvdl };
290 1.25 fvdl
291 1.90 jdolecek static const short nfsv3err_readlink[] = {
292 1.25 fvdl NFSERR_IO,
293 1.25 fvdl NFSERR_IO,
294 1.25 fvdl NFSERR_ACCES,
295 1.25 fvdl NFSERR_INVAL,
296 1.25 fvdl NFSERR_STALE,
297 1.25 fvdl NFSERR_BADHANDLE,
298 1.25 fvdl NFSERR_NOTSUPP,
299 1.25 fvdl NFSERR_SERVERFAULT,
300 1.25 fvdl 0,
301 1.25 fvdl };
302 1.25 fvdl
303 1.90 jdolecek static const short nfsv3err_read[] = {
304 1.25 fvdl NFSERR_IO,
305 1.25 fvdl NFSERR_IO,
306 1.25 fvdl NFSERR_NXIO,
307 1.25 fvdl NFSERR_ACCES,
308 1.25 fvdl NFSERR_INVAL,
309 1.25 fvdl NFSERR_STALE,
310 1.25 fvdl NFSERR_BADHANDLE,
311 1.25 fvdl NFSERR_SERVERFAULT,
312 1.67 fvdl NFSERR_JUKEBOX,
313 1.25 fvdl 0,
314 1.25 fvdl };
315 1.25 fvdl
316 1.90 jdolecek static const short nfsv3err_write[] = {
317 1.25 fvdl NFSERR_IO,
318 1.25 fvdl NFSERR_IO,
319 1.25 fvdl NFSERR_ACCES,
320 1.25 fvdl NFSERR_INVAL,
321 1.25 fvdl NFSERR_FBIG,
322 1.25 fvdl NFSERR_NOSPC,
323 1.25 fvdl NFSERR_ROFS,
324 1.25 fvdl NFSERR_DQUOT,
325 1.25 fvdl NFSERR_STALE,
326 1.25 fvdl NFSERR_BADHANDLE,
327 1.25 fvdl NFSERR_SERVERFAULT,
328 1.68 fvdl NFSERR_JUKEBOX,
329 1.25 fvdl 0,
330 1.25 fvdl };
331 1.25 fvdl
332 1.90 jdolecek static const short nfsv3err_create[] = {
333 1.25 fvdl NFSERR_IO,
334 1.25 fvdl NFSERR_IO,
335 1.25 fvdl NFSERR_ACCES,
336 1.25 fvdl NFSERR_EXIST,
337 1.25 fvdl NFSERR_NOTDIR,
338 1.25 fvdl NFSERR_NOSPC,
339 1.25 fvdl NFSERR_ROFS,
340 1.25 fvdl NFSERR_NAMETOL,
341 1.25 fvdl NFSERR_DQUOT,
342 1.25 fvdl NFSERR_STALE,
343 1.25 fvdl NFSERR_BADHANDLE,
344 1.25 fvdl NFSERR_NOTSUPP,
345 1.25 fvdl NFSERR_SERVERFAULT,
346 1.25 fvdl 0,
347 1.25 fvdl };
348 1.25 fvdl
349 1.90 jdolecek static const short nfsv3err_mkdir[] = {
350 1.25 fvdl NFSERR_IO,
351 1.25 fvdl NFSERR_IO,
352 1.25 fvdl NFSERR_ACCES,
353 1.25 fvdl NFSERR_EXIST,
354 1.25 fvdl NFSERR_NOTDIR,
355 1.25 fvdl NFSERR_NOSPC,
356 1.25 fvdl NFSERR_ROFS,
357 1.25 fvdl NFSERR_NAMETOL,
358 1.25 fvdl NFSERR_DQUOT,
359 1.25 fvdl NFSERR_STALE,
360 1.25 fvdl NFSERR_BADHANDLE,
361 1.25 fvdl NFSERR_NOTSUPP,
362 1.25 fvdl NFSERR_SERVERFAULT,
363 1.25 fvdl 0,
364 1.25 fvdl };
365 1.25 fvdl
366 1.90 jdolecek static const short nfsv3err_symlink[] = {
367 1.25 fvdl NFSERR_IO,
368 1.25 fvdl NFSERR_IO,
369 1.25 fvdl NFSERR_ACCES,
370 1.25 fvdl NFSERR_EXIST,
371 1.25 fvdl NFSERR_NOTDIR,
372 1.25 fvdl NFSERR_NOSPC,
373 1.25 fvdl NFSERR_ROFS,
374 1.25 fvdl NFSERR_NAMETOL,
375 1.25 fvdl NFSERR_DQUOT,
376 1.25 fvdl NFSERR_STALE,
377 1.25 fvdl NFSERR_BADHANDLE,
378 1.25 fvdl NFSERR_NOTSUPP,
379 1.25 fvdl NFSERR_SERVERFAULT,
380 1.25 fvdl 0,
381 1.25 fvdl };
382 1.25 fvdl
383 1.90 jdolecek static const short nfsv3err_mknod[] = {
384 1.25 fvdl NFSERR_IO,
385 1.25 fvdl NFSERR_IO,
386 1.25 fvdl NFSERR_ACCES,
387 1.25 fvdl NFSERR_EXIST,
388 1.25 fvdl NFSERR_NOTDIR,
389 1.25 fvdl NFSERR_NOSPC,
390 1.25 fvdl NFSERR_ROFS,
391 1.25 fvdl NFSERR_NAMETOL,
392 1.25 fvdl NFSERR_DQUOT,
393 1.25 fvdl NFSERR_STALE,
394 1.25 fvdl NFSERR_BADHANDLE,
395 1.25 fvdl NFSERR_NOTSUPP,
396 1.25 fvdl NFSERR_SERVERFAULT,
397 1.25 fvdl NFSERR_BADTYPE,
398 1.25 fvdl 0,
399 1.25 fvdl };
400 1.25 fvdl
401 1.90 jdolecek static const short nfsv3err_remove[] = {
402 1.25 fvdl NFSERR_IO,
403 1.25 fvdl NFSERR_NOENT,
404 1.25 fvdl NFSERR_IO,
405 1.25 fvdl NFSERR_ACCES,
406 1.25 fvdl NFSERR_NOTDIR,
407 1.25 fvdl NFSERR_ROFS,
408 1.25 fvdl NFSERR_NAMETOL,
409 1.25 fvdl NFSERR_STALE,
410 1.25 fvdl NFSERR_BADHANDLE,
411 1.25 fvdl NFSERR_SERVERFAULT,
412 1.25 fvdl 0,
413 1.25 fvdl };
414 1.25 fvdl
415 1.90 jdolecek static const short nfsv3err_rmdir[] = {
416 1.25 fvdl NFSERR_IO,
417 1.25 fvdl NFSERR_NOENT,
418 1.25 fvdl NFSERR_IO,
419 1.25 fvdl NFSERR_ACCES,
420 1.25 fvdl NFSERR_EXIST,
421 1.25 fvdl NFSERR_NOTDIR,
422 1.25 fvdl NFSERR_INVAL,
423 1.25 fvdl NFSERR_ROFS,
424 1.25 fvdl NFSERR_NAMETOL,
425 1.25 fvdl NFSERR_NOTEMPTY,
426 1.25 fvdl NFSERR_STALE,
427 1.25 fvdl NFSERR_BADHANDLE,
428 1.25 fvdl NFSERR_NOTSUPP,
429 1.25 fvdl NFSERR_SERVERFAULT,
430 1.25 fvdl 0,
431 1.25 fvdl };
432 1.25 fvdl
433 1.90 jdolecek static const short nfsv3err_rename[] = {
434 1.25 fvdl NFSERR_IO,
435 1.25 fvdl NFSERR_NOENT,
436 1.25 fvdl NFSERR_IO,
437 1.25 fvdl NFSERR_ACCES,
438 1.25 fvdl NFSERR_EXIST,
439 1.25 fvdl NFSERR_XDEV,
440 1.25 fvdl NFSERR_NOTDIR,
441 1.25 fvdl NFSERR_ISDIR,
442 1.25 fvdl NFSERR_INVAL,
443 1.25 fvdl NFSERR_NOSPC,
444 1.25 fvdl NFSERR_ROFS,
445 1.25 fvdl NFSERR_MLINK,
446 1.25 fvdl NFSERR_NAMETOL,
447 1.25 fvdl NFSERR_NOTEMPTY,
448 1.25 fvdl NFSERR_DQUOT,
449 1.25 fvdl NFSERR_STALE,
450 1.25 fvdl NFSERR_BADHANDLE,
451 1.25 fvdl NFSERR_NOTSUPP,
452 1.25 fvdl NFSERR_SERVERFAULT,
453 1.25 fvdl 0,
454 1.25 fvdl };
455 1.25 fvdl
456 1.90 jdolecek static const short nfsv3err_link[] = {
457 1.25 fvdl NFSERR_IO,
458 1.25 fvdl NFSERR_IO,
459 1.25 fvdl NFSERR_ACCES,
460 1.25 fvdl NFSERR_EXIST,
461 1.25 fvdl NFSERR_XDEV,
462 1.25 fvdl NFSERR_NOTDIR,
463 1.25 fvdl NFSERR_INVAL,
464 1.25 fvdl NFSERR_NOSPC,
465 1.25 fvdl NFSERR_ROFS,
466 1.25 fvdl NFSERR_MLINK,
467 1.25 fvdl NFSERR_NAMETOL,
468 1.25 fvdl NFSERR_DQUOT,
469 1.25 fvdl NFSERR_STALE,
470 1.25 fvdl NFSERR_BADHANDLE,
471 1.25 fvdl NFSERR_NOTSUPP,
472 1.25 fvdl NFSERR_SERVERFAULT,
473 1.25 fvdl 0,
474 1.25 fvdl };
475 1.25 fvdl
476 1.90 jdolecek static const short nfsv3err_readdir[] = {
477 1.25 fvdl NFSERR_IO,
478 1.25 fvdl NFSERR_IO,
479 1.25 fvdl NFSERR_ACCES,
480 1.25 fvdl NFSERR_NOTDIR,
481 1.25 fvdl NFSERR_STALE,
482 1.25 fvdl NFSERR_BADHANDLE,
483 1.25 fvdl NFSERR_BAD_COOKIE,
484 1.25 fvdl NFSERR_TOOSMALL,
485 1.25 fvdl NFSERR_SERVERFAULT,
486 1.25 fvdl 0,
487 1.25 fvdl };
488 1.25 fvdl
489 1.90 jdolecek static const short nfsv3err_readdirplus[] = {
490 1.25 fvdl NFSERR_IO,
491 1.25 fvdl NFSERR_IO,
492 1.25 fvdl NFSERR_ACCES,
493 1.25 fvdl NFSERR_NOTDIR,
494 1.25 fvdl NFSERR_STALE,
495 1.25 fvdl NFSERR_BADHANDLE,
496 1.25 fvdl NFSERR_BAD_COOKIE,
497 1.25 fvdl NFSERR_NOTSUPP,
498 1.25 fvdl NFSERR_TOOSMALL,
499 1.25 fvdl NFSERR_SERVERFAULT,
500 1.25 fvdl 0,
501 1.25 fvdl };
502 1.25 fvdl
503 1.90 jdolecek static const short nfsv3err_fsstat[] = {
504 1.25 fvdl NFSERR_IO,
505 1.25 fvdl NFSERR_IO,
506 1.25 fvdl NFSERR_STALE,
507 1.25 fvdl NFSERR_BADHANDLE,
508 1.25 fvdl NFSERR_SERVERFAULT,
509 1.25 fvdl 0,
510 1.25 fvdl };
511 1.25 fvdl
512 1.90 jdolecek static const short nfsv3err_fsinfo[] = {
513 1.25 fvdl NFSERR_STALE,
514 1.25 fvdl NFSERR_STALE,
515 1.25 fvdl NFSERR_BADHANDLE,
516 1.25 fvdl NFSERR_SERVERFAULT,
517 1.25 fvdl 0,
518 1.25 fvdl };
519 1.25 fvdl
520 1.90 jdolecek static const short nfsv3err_pathconf[] = {
521 1.25 fvdl NFSERR_STALE,
522 1.25 fvdl NFSERR_STALE,
523 1.25 fvdl NFSERR_BADHANDLE,
524 1.25 fvdl NFSERR_SERVERFAULT,
525 1.25 fvdl 0,
526 1.25 fvdl };
527 1.25 fvdl
528 1.90 jdolecek static const short nfsv3err_commit[] = {
529 1.25 fvdl NFSERR_IO,
530 1.25 fvdl NFSERR_IO,
531 1.25 fvdl NFSERR_STALE,
532 1.25 fvdl NFSERR_BADHANDLE,
533 1.25 fvdl NFSERR_SERVERFAULT,
534 1.25 fvdl 0,
535 1.25 fvdl };
536 1.25 fvdl
537 1.90 jdolecek static const short * const nfsrv_v3errmap[] = {
538 1.25 fvdl nfsv3err_null,
539 1.25 fvdl nfsv3err_getattr,
540 1.25 fvdl nfsv3err_setattr,
541 1.25 fvdl nfsv3err_lookup,
542 1.25 fvdl nfsv3err_access,
543 1.25 fvdl nfsv3err_readlink,
544 1.25 fvdl nfsv3err_read,
545 1.25 fvdl nfsv3err_write,
546 1.25 fvdl nfsv3err_create,
547 1.25 fvdl nfsv3err_mkdir,
548 1.25 fvdl nfsv3err_symlink,
549 1.25 fvdl nfsv3err_mknod,
550 1.25 fvdl nfsv3err_remove,
551 1.25 fvdl nfsv3err_rmdir,
552 1.25 fvdl nfsv3err_rename,
553 1.25 fvdl nfsv3err_link,
554 1.25 fvdl nfsv3err_readdir,
555 1.25 fvdl nfsv3err_readdirplus,
556 1.25 fvdl nfsv3err_fsstat,
557 1.25 fvdl nfsv3err_fsinfo,
558 1.25 fvdl nfsv3err_pathconf,
559 1.25 fvdl nfsv3err_commit,
560 1.25 fvdl };
561 1.25 fvdl
562 1.12 mycroft extern struct nfsrtt nfsrtt;
563 1.1 cgd
564 1.46 fvdl u_long nfsdirhashmask;
565 1.18 mycroft
566 1.213 dsl int nfs_webnamei(struct nameidata *, struct vnode *, struct proc *);
567 1.43 fvdl
568 1.1 cgd /*
569 1.1 cgd * Create the header for an rpc request packet
570 1.1 cgd * The hsiz is the size of the rest of the nfs request header.
571 1.1 cgd * (just used to decide if a cluster is a good idea)
572 1.1 cgd */
573 1.12 mycroft struct mbuf *
574 1.183 christos nfsm_reqh(struct nfsnode *np, u_long procid, int hsiz, char **bposp)
575 1.12 mycroft {
576 1.75 augustss struct mbuf *mb;
577 1.183 christos char *bpos;
578 1.12 mycroft
579 1.109 matt mb = m_get(M_WAIT, MT_DATA);
580 1.109 matt MCLAIM(mb, &nfs_mowner);
581 1.12 mycroft if (hsiz >= MINCLSIZE)
582 1.109 matt m_clget(mb, M_WAIT);
583 1.12 mycroft mb->m_len = 0;
584 1.183 christos bpos = mtod(mb, void *);
585 1.148 perry
586 1.12 mycroft /* Finally, return values */
587 1.12 mycroft *bposp = bpos;
588 1.12 mycroft return (mb);
589 1.12 mycroft }
590 1.12 mycroft
591 1.12 mycroft /*
592 1.12 mycroft * Build the RPC header and fill in the authorization info.
593 1.12 mycroft * The authorization string argument is only used when the credentials
594 1.12 mycroft * come from outside of the kernel.
595 1.12 mycroft * Returns the head of the mbuf list.
596 1.12 mycroft */
597 1.12 mycroft struct mbuf *
598 1.216 cegger nfsm_rpchead(kauth_cred_t cr, int nmflag, int procid,
599 1.216 cegger int auth_type, int auth_len, char *auth_str, int verf_len,
600 1.216 cegger char *verf_str, struct mbuf *mrest, int mrest_len,
601 1.216 cegger struct mbuf **mbp, uint32_t *xidp)
602 1.1 cgd {
603 1.75 augustss struct mbuf *mb;
604 1.75 augustss u_int32_t *tl;
605 1.183 christos char *bpos;
606 1.75 augustss int i;
607 1.109 matt struct mbuf *mreq;
608 1.12 mycroft int siz, grpsiz, authsiz;
609 1.1 cgd
610 1.12 mycroft authsiz = nfsm_rndup(auth_len);
611 1.109 matt mb = m_gethdr(M_WAIT, MT_DATA);
612 1.109 matt MCLAIM(mb, &nfs_mowner);
613 1.25 fvdl if ((authsiz + 10 * NFSX_UNSIGNED) >= MINCLSIZE) {
614 1.109 matt m_clget(mb, M_WAIT);
615 1.25 fvdl } else if ((authsiz + 10 * NFSX_UNSIGNED) < MHLEN) {
616 1.25 fvdl MH_ALIGN(mb, authsiz + 10 * NFSX_UNSIGNED);
617 1.12 mycroft } else {
618 1.25 fvdl MH_ALIGN(mb, 8 * NFSX_UNSIGNED);
619 1.1 cgd }
620 1.12 mycroft mb->m_len = 0;
621 1.12 mycroft mreq = mb;
622 1.183 christos bpos = mtod(mb, void *);
623 1.12 mycroft
624 1.12 mycroft /*
625 1.12 mycroft * First the RPC header.
626 1.12 mycroft */
627 1.25 fvdl nfsm_build(tl, u_int32_t *, 8 * NFSX_UNSIGNED);
628 1.30 fvdl
629 1.126 yamt *tl++ = *xidp = nfs_getxid();
630 1.1 cgd *tl++ = rpc_call;
631 1.1 cgd *tl++ = rpc_vers;
632 1.179 yamt *tl++ = txdr_unsigned(NFS_PROG);
633 1.179 yamt if (nmflag & NFSMNT_NFSV3)
634 1.179 yamt *tl++ = txdr_unsigned(NFS_VER3);
635 1.179 yamt else
636 1.179 yamt *tl++ = txdr_unsigned(NFS_VER2);
637 1.25 fvdl if (nmflag & NFSMNT_NFSV3)
638 1.25 fvdl *tl++ = txdr_unsigned(procid);
639 1.25 fvdl else
640 1.25 fvdl *tl++ = txdr_unsigned(nfsv2_procid[procid]);
641 1.12 mycroft
642 1.12 mycroft /*
643 1.12 mycroft * And then the authorization cred.
644 1.12 mycroft */
645 1.12 mycroft *tl++ = txdr_unsigned(auth_type);
646 1.12 mycroft *tl = txdr_unsigned(authsiz);
647 1.12 mycroft switch (auth_type) {
648 1.12 mycroft case RPCAUTH_UNIX:
649 1.22 cgd nfsm_build(tl, u_int32_t *, auth_len);
650 1.12 mycroft *tl++ = 0; /* stamp ?? */
651 1.12 mycroft *tl++ = 0; /* NULL hostname */
652 1.162 elad *tl++ = txdr_unsigned(kauth_cred_geteuid(cr));
653 1.162 elad *tl++ = txdr_unsigned(kauth_cred_getegid(cr));
654 1.12 mycroft grpsiz = (auth_len >> 2) - 5;
655 1.12 mycroft *tl++ = txdr_unsigned(grpsiz);
656 1.20 mycroft for (i = 0; i < grpsiz; i++)
657 1.162 elad *tl++ = txdr_unsigned(kauth_cred_group(cr, i)); /* XXX elad review */
658 1.12 mycroft break;
659 1.25 fvdl case RPCAUTH_KERB4:
660 1.12 mycroft siz = auth_len;
661 1.12 mycroft while (siz > 0) {
662 1.12 mycroft if (M_TRAILINGSPACE(mb) == 0) {
663 1.109 matt struct mbuf *mb2;
664 1.109 matt mb2 = m_get(M_WAIT, MT_DATA);
665 1.109 matt MCLAIM(mb2, &nfs_mowner);
666 1.12 mycroft if (siz >= MINCLSIZE)
667 1.109 matt m_clget(mb2, M_WAIT);
668 1.12 mycroft mb->m_next = mb2;
669 1.12 mycroft mb = mb2;
670 1.12 mycroft mb->m_len = 0;
671 1.183 christos bpos = mtod(mb, void *);
672 1.12 mycroft }
673 1.12 mycroft i = min(siz, M_TRAILINGSPACE(mb));
674 1.63 perry memcpy(bpos, auth_str, i);
675 1.12 mycroft mb->m_len += i;
676 1.12 mycroft auth_str += i;
677 1.12 mycroft bpos += i;
678 1.12 mycroft siz -= i;
679 1.12 mycroft }
680 1.12 mycroft if ((siz = (nfsm_rndup(auth_len) - auth_len)) > 0) {
681 1.12 mycroft for (i = 0; i < siz; i++)
682 1.12 mycroft *bpos++ = '\0';
683 1.12 mycroft mb->m_len += siz;
684 1.12 mycroft }
685 1.12 mycroft break;
686 1.12 mycroft };
687 1.25 fvdl
688 1.25 fvdl /*
689 1.25 fvdl * And the verifier...
690 1.25 fvdl */
691 1.25 fvdl nfsm_build(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
692 1.25 fvdl if (verf_str) {
693 1.25 fvdl *tl++ = txdr_unsigned(RPCAUTH_KERB4);
694 1.25 fvdl *tl = txdr_unsigned(verf_len);
695 1.25 fvdl siz = verf_len;
696 1.25 fvdl while (siz > 0) {
697 1.25 fvdl if (M_TRAILINGSPACE(mb) == 0) {
698 1.109 matt struct mbuf *mb2;
699 1.109 matt mb2 = m_get(M_WAIT, MT_DATA);
700 1.109 matt MCLAIM(mb2, &nfs_mowner);
701 1.25 fvdl if (siz >= MINCLSIZE)
702 1.109 matt m_clget(mb2, M_WAIT);
703 1.25 fvdl mb->m_next = mb2;
704 1.25 fvdl mb = mb2;
705 1.25 fvdl mb->m_len = 0;
706 1.183 christos bpos = mtod(mb, void *);
707 1.25 fvdl }
708 1.25 fvdl i = min(siz, M_TRAILINGSPACE(mb));
709 1.63 perry memcpy(bpos, verf_str, i);
710 1.25 fvdl mb->m_len += i;
711 1.25 fvdl verf_str += i;
712 1.25 fvdl bpos += i;
713 1.25 fvdl siz -= i;
714 1.25 fvdl }
715 1.25 fvdl if ((siz = (nfsm_rndup(verf_len) - verf_len)) > 0) {
716 1.25 fvdl for (i = 0; i < siz; i++)
717 1.25 fvdl *bpos++ = '\0';
718 1.25 fvdl mb->m_len += siz;
719 1.25 fvdl }
720 1.25 fvdl } else {
721 1.25 fvdl *tl++ = txdr_unsigned(RPCAUTH_NULL);
722 1.25 fvdl *tl = 0;
723 1.25 fvdl }
724 1.12 mycroft mb->m_next = mrest;
725 1.25 fvdl mreq->m_pkthdr.len = authsiz + 10 * NFSX_UNSIGNED + mrest_len;
726 1.12 mycroft mreq->m_pkthdr.rcvif = (struct ifnet *)0;
727 1.12 mycroft *mbp = mb;
728 1.1 cgd return (mreq);
729 1.1 cgd }
730 1.1 cgd
731 1.1 cgd /*
732 1.1 cgd * copies mbuf chain to the uio scatter/gather list
733 1.1 cgd */
734 1.24 christos int
735 1.214 dsl nfsm_mbuftouio(struct mbuf **mrep, struct uio *uiop, int siz, char **dpos)
736 1.1 cgd {
737 1.75 augustss char *mbufcp, *uiocp;
738 1.75 augustss int xfer, left, len;
739 1.75 augustss struct mbuf *mp;
740 1.1 cgd long uiosiz, rem;
741 1.1 cgd int error = 0;
742 1.1 cgd
743 1.1 cgd mp = *mrep;
744 1.1 cgd mbufcp = *dpos;
745 1.183 christos len = mtod(mp, char *) + mp->m_len - mbufcp;
746 1.1 cgd rem = nfsm_rndup(siz)-siz;
747 1.1 cgd while (siz > 0) {
748 1.1 cgd if (uiop->uio_iovcnt <= 0 || uiop->uio_iov == NULL)
749 1.1 cgd return (EFBIG);
750 1.1 cgd left = uiop->uio_iov->iov_len;
751 1.1 cgd uiocp = uiop->uio_iov->iov_base;
752 1.1 cgd if (left > siz)
753 1.1 cgd left = siz;
754 1.1 cgd uiosiz = left;
755 1.1 cgd while (left > 0) {
756 1.1 cgd while (len == 0) {
757 1.1 cgd mp = mp->m_next;
758 1.1 cgd if (mp == NULL)
759 1.1 cgd return (EBADRPC);
760 1.183 christos mbufcp = mtod(mp, void *);
761 1.1 cgd len = mp->m_len;
762 1.1 cgd }
763 1.1 cgd xfer = (left > len) ? len : left;
764 1.158 yamt error = copyout_vmspace(uiop->uio_vmspace, mbufcp,
765 1.158 yamt uiocp, xfer);
766 1.158 yamt if (error) {
767 1.158 yamt return error;
768 1.158 yamt }
769 1.1 cgd left -= xfer;
770 1.1 cgd len -= xfer;
771 1.1 cgd mbufcp += xfer;
772 1.1 cgd uiocp += xfer;
773 1.1 cgd uiop->uio_offset += xfer;
774 1.1 cgd uiop->uio_resid -= xfer;
775 1.1 cgd }
776 1.1 cgd if (uiop->uio_iov->iov_len <= siz) {
777 1.1 cgd uiop->uio_iovcnt--;
778 1.1 cgd uiop->uio_iov++;
779 1.1 cgd } else {
780 1.95 lukem uiop->uio_iov->iov_base =
781 1.183 christos (char *)uiop->uio_iov->iov_base + uiosiz;
782 1.1 cgd uiop->uio_iov->iov_len -= uiosiz;
783 1.1 cgd }
784 1.1 cgd siz -= uiosiz;
785 1.1 cgd }
786 1.1 cgd *dpos = mbufcp;
787 1.1 cgd *mrep = mp;
788 1.1 cgd if (rem > 0) {
789 1.1 cgd if (len < rem)
790 1.1 cgd error = nfs_adv(mrep, dpos, rem, len);
791 1.1 cgd else
792 1.1 cgd *dpos += rem;
793 1.1 cgd }
794 1.1 cgd return (error);
795 1.1 cgd }
796 1.1 cgd
797 1.1 cgd /*
798 1.29 fvdl * copies a uio scatter/gather list to an mbuf chain.
799 1.29 fvdl * NOTE: can ony handle iovcnt == 1
800 1.1 cgd */
801 1.24 christos int
802 1.214 dsl nfsm_uiotombuf(struct uio *uiop, struct mbuf **mq, int siz, char **bpos)
803 1.1 cgd {
804 1.75 augustss char *uiocp;
805 1.75 augustss struct mbuf *mp, *mp2;
806 1.75 augustss int xfer, left, mlen;
807 1.1 cgd int uiosiz, clflg, rem;
808 1.1 cgd char *cp;
809 1.158 yamt int error;
810 1.1 cgd
811 1.29 fvdl #ifdef DIAGNOSTIC
812 1.29 fvdl if (uiop->uio_iovcnt != 1)
813 1.29 fvdl panic("nfsm_uiotombuf: iovcnt != 1");
814 1.29 fvdl #endif
815 1.29 fvdl
816 1.1 cgd if (siz > MLEN) /* or should it >= MCLBYTES ?? */
817 1.1 cgd clflg = 1;
818 1.1 cgd else
819 1.1 cgd clflg = 0;
820 1.1 cgd rem = nfsm_rndup(siz)-siz;
821 1.12 mycroft mp = mp2 = *mq;
822 1.1 cgd while (siz > 0) {
823 1.1 cgd left = uiop->uio_iov->iov_len;
824 1.1 cgd uiocp = uiop->uio_iov->iov_base;
825 1.1 cgd if (left > siz)
826 1.1 cgd left = siz;
827 1.1 cgd uiosiz = left;
828 1.1 cgd while (left > 0) {
829 1.12 mycroft mlen = M_TRAILINGSPACE(mp);
830 1.12 mycroft if (mlen == 0) {
831 1.109 matt mp = m_get(M_WAIT, MT_DATA);
832 1.109 matt MCLAIM(mp, &nfs_mowner);
833 1.12 mycroft if (clflg)
834 1.109 matt m_clget(mp, M_WAIT);
835 1.12 mycroft mp->m_len = 0;
836 1.12 mycroft mp2->m_next = mp;
837 1.12 mycroft mp2 = mp;
838 1.12 mycroft mlen = M_TRAILINGSPACE(mp);
839 1.12 mycroft }
840 1.12 mycroft xfer = (left > mlen) ? mlen : left;
841 1.183 christos cp = mtod(mp, char *) + mp->m_len;
842 1.158 yamt error = copyin_vmspace(uiop->uio_vmspace, uiocp, cp,
843 1.158 yamt xfer);
844 1.158 yamt if (error) {
845 1.158 yamt /* XXX */
846 1.158 yamt }
847 1.12 mycroft mp->m_len += xfer;
848 1.1 cgd left -= xfer;
849 1.1 cgd uiocp += xfer;
850 1.1 cgd uiop->uio_offset += xfer;
851 1.1 cgd uiop->uio_resid -= xfer;
852 1.1 cgd }
853 1.183 christos uiop->uio_iov->iov_base = (char *)uiop->uio_iov->iov_base +
854 1.95 lukem uiosiz;
855 1.29 fvdl uiop->uio_iov->iov_len -= uiosiz;
856 1.1 cgd siz -= uiosiz;
857 1.1 cgd }
858 1.1 cgd if (rem > 0) {
859 1.12 mycroft if (rem > M_TRAILINGSPACE(mp)) {
860 1.109 matt mp = m_get(M_WAIT, MT_DATA);
861 1.109 matt MCLAIM(mp, &nfs_mowner);
862 1.1 cgd mp->m_len = 0;
863 1.1 cgd mp2->m_next = mp;
864 1.1 cgd }
865 1.183 christos cp = mtod(mp, char *) + mp->m_len;
866 1.1 cgd for (left = 0; left < rem; left++)
867 1.1 cgd *cp++ = '\0';
868 1.1 cgd mp->m_len += rem;
869 1.1 cgd *bpos = cp;
870 1.1 cgd } else
871 1.183 christos *bpos = mtod(mp, char *) + mp->m_len;
872 1.1 cgd *mq = mp;
873 1.1 cgd return (0);
874 1.1 cgd }
875 1.1 cgd
876 1.1 cgd /*
877 1.39 fvdl * Get at least "siz" bytes of correctly aligned data.
878 1.39 fvdl * When called the mbuf pointers are not necessarily correct,
879 1.39 fvdl * dsosp points to what ought to be in m_data and left contains
880 1.148 perry * what ought to be in m_len.
881 1.12 mycroft * This is used by the macros nfsm_dissect and nfsm_dissecton for tough
882 1.1 cgd * cases. (The macros use the vars. dpos and dpos2)
883 1.1 cgd */
884 1.24 christos int
885 1.214 dsl nfsm_disct(struct mbuf **mdp, char **dposp, int siz, int left, char **cp2)
886 1.1 cgd {
887 1.75 augustss struct mbuf *m1, *m2;
888 1.39 fvdl struct mbuf *havebuf = NULL;
889 1.183 christos char *src = *dposp;
890 1.183 christos char *dst;
891 1.39 fvdl int len;
892 1.39 fvdl
893 1.39 fvdl #ifdef DEBUG
894 1.39 fvdl if (left < 0)
895 1.148 perry panic("nfsm_disct: left < 0");
896 1.39 fvdl #endif
897 1.39 fvdl m1 = *mdp;
898 1.39 fvdl /*
899 1.39 fvdl * Skip through the mbuf chain looking for an mbuf with
900 1.39 fvdl * some data. If the first mbuf found has enough data
901 1.39 fvdl * and it is correctly aligned return it.
902 1.39 fvdl */
903 1.1 cgd while (left == 0) {
904 1.39 fvdl havebuf = m1;
905 1.39 fvdl *mdp = m1 = m1->m_next;
906 1.39 fvdl if (m1 == NULL)
907 1.1 cgd return (EBADRPC);
908 1.183 christos src = mtod(m1, void *);
909 1.39 fvdl left = m1->m_len;
910 1.39 fvdl /*
911 1.39 fvdl * If we start a new mbuf and it is big enough
912 1.39 fvdl * and correctly aligned just return it, don't
913 1.39 fvdl * do any pull up.
914 1.39 fvdl */
915 1.39 fvdl if (left >= siz && nfsm_aligned(src)) {
916 1.39 fvdl *cp2 = src;
917 1.39 fvdl *dposp = src + siz;
918 1.39 fvdl return (0);
919 1.39 fvdl }
920 1.1 cgd }
921 1.201 yamt if ((m1->m_flags & M_EXT) != 0) {
922 1.201 yamt if (havebuf && M_TRAILINGSPACE(havebuf) >= siz &&
923 1.201 yamt nfsm_aligned(mtod(havebuf, char *) + havebuf->m_len)) {
924 1.201 yamt /*
925 1.201 yamt * If the first mbuf with data has external data
926 1.201 yamt * and there is a previous mbuf with some trailing
927 1.201 yamt * space, use it to move the data into.
928 1.39 fvdl */
929 1.39 fvdl m2 = m1;
930 1.39 fvdl *mdp = m1 = havebuf;
931 1.201 yamt *cp2 = mtod(m1, char *) + m1->m_len;
932 1.201 yamt } else if (havebuf) {
933 1.39 fvdl /*
934 1.39 fvdl * If the first mbuf has a external data
935 1.39 fvdl * and there is no previous empty mbuf
936 1.39 fvdl * allocate a new mbuf and move the external
937 1.148 perry * data to the new mbuf. Also make the first
938 1.39 fvdl * mbuf look empty.
939 1.39 fvdl */
940 1.201 yamt m2 = m1;
941 1.201 yamt *mdp = m1 = m_get(M_WAIT, MT_DATA);
942 1.201 yamt MCLAIM(m1, m2->m_owner);
943 1.201 yamt if ((m2->m_flags & M_PKTHDR) != 0) {
944 1.201 yamt /* XXX MOVE */
945 1.201 yamt M_COPY_PKTHDR(m1, m2);
946 1.201 yamt m_tag_delete_chain(m2, NULL);
947 1.201 yamt m2->m_flags &= ~M_PKTHDR;
948 1.201 yamt }
949 1.201 yamt if (havebuf) {
950 1.201 yamt havebuf->m_next = m1;
951 1.201 yamt }
952 1.201 yamt m1->m_next = m2;
953 1.201 yamt MRESETDATA(m1);
954 1.201 yamt m1->m_len = 0;
955 1.39 fvdl m2->m_data = src;
956 1.39 fvdl m2->m_len = left;
957 1.201 yamt *cp2 = mtod(m1, char *);
958 1.201 yamt } else {
959 1.201 yamt struct mbuf **nextp = &m1->m_next;
960 1.201 yamt
961 1.201 yamt m1->m_len -= left;
962 1.201 yamt do {
963 1.201 yamt m2 = m_get(M_WAIT, MT_DATA);
964 1.201 yamt MCLAIM(m2, m1->m_owner);
965 1.201 yamt if (left >= MINCLSIZE) {
966 1.201 yamt MCLGET(m2, M_WAIT);
967 1.201 yamt }
968 1.201 yamt m2->m_next = *nextp;
969 1.201 yamt *nextp = m2;
970 1.201 yamt nextp = &m2->m_next;
971 1.201 yamt len = (m2->m_flags & M_EXT) != 0 ?
972 1.201 yamt MCLBYTES : MLEN;
973 1.201 yamt if (len > left) {
974 1.201 yamt len = left;
975 1.201 yamt }
976 1.201 yamt memcpy(mtod(m2, char *), src, len);
977 1.201 yamt m2->m_len = len;
978 1.201 yamt src += len;
979 1.201 yamt left -= len;
980 1.201 yamt } while (left > 0);
981 1.201 yamt *mdp = m1 = m1->m_next;
982 1.201 yamt m2 = m1->m_next;
983 1.201 yamt *cp2 = mtod(m1, char *);
984 1.1 cgd }
985 1.39 fvdl } else {
986 1.39 fvdl /*
987 1.39 fvdl * If the first mbuf has no external data
988 1.39 fvdl * move the data to the front of the mbuf.
989 1.39 fvdl */
990 1.201 yamt MRESETDATA(m1);
991 1.201 yamt dst = mtod(m1, char *);
992 1.201 yamt if (dst != src) {
993 1.63 perry memmove(dst, src, left);
994 1.201 yamt }
995 1.39 fvdl m1->m_len = left;
996 1.39 fvdl m2 = m1->m_next;
997 1.201 yamt *cp2 = m1->m_data;
998 1.1 cgd }
999 1.201 yamt *dposp = *cp2 + siz;
1000 1.39 fvdl /*
1001 1.39 fvdl * Loop through mbufs pulling data up into first mbuf until
1002 1.39 fvdl * the first mbuf is full or there is no more data to
1003 1.39 fvdl * pullup.
1004 1.39 fvdl */
1005 1.201 yamt dst = mtod(m1, char *) + m1->m_len;
1006 1.129 itojun while ((len = M_TRAILINGSPACE(m1)) != 0 && m2) {
1007 1.201 yamt if ((len = min(len, m2->m_len)) != 0) {
1008 1.201 yamt memcpy(dst, mtod(m2, char *), len);
1009 1.201 yamt }
1010 1.39 fvdl m1->m_len += len;
1011 1.39 fvdl dst += len;
1012 1.39 fvdl m2->m_data += len;
1013 1.39 fvdl m2->m_len -= len;
1014 1.39 fvdl m2 = m2->m_next;
1015 1.39 fvdl }
1016 1.39 fvdl if (m1->m_len < siz)
1017 1.39 fvdl return (EBADRPC);
1018 1.1 cgd return (0);
1019 1.1 cgd }
1020 1.1 cgd
1021 1.1 cgd /*
1022 1.1 cgd * Advance the position in the mbuf chain.
1023 1.1 cgd */
1024 1.24 christos int
1025 1.214 dsl nfs_adv(struct mbuf **mdp, char **dposp, int offs, int left)
1026 1.1 cgd {
1027 1.75 augustss struct mbuf *m;
1028 1.75 augustss int s;
1029 1.1 cgd
1030 1.1 cgd m = *mdp;
1031 1.1 cgd s = left;
1032 1.1 cgd while (s < offs) {
1033 1.1 cgd offs -= s;
1034 1.1 cgd m = m->m_next;
1035 1.1 cgd if (m == NULL)
1036 1.1 cgd return (EBADRPC);
1037 1.1 cgd s = m->m_len;
1038 1.1 cgd }
1039 1.1 cgd *mdp = m;
1040 1.183 christos *dposp = mtod(m, char *) + offs;
1041 1.1 cgd return (0);
1042 1.1 cgd }
1043 1.1 cgd
1044 1.1 cgd /*
1045 1.1 cgd * Copy a string into mbufs for the hard cases...
1046 1.1 cgd */
1047 1.24 christos int
1048 1.214 dsl nfsm_strtmbuf(struct mbuf **mb, char **bpos, const char *cp, long siz)
1049 1.1 cgd {
1050 1.75 augustss struct mbuf *m1 = NULL, *m2;
1051 1.1 cgd long left, xfer, len, tlen;
1052 1.22 cgd u_int32_t *tl;
1053 1.1 cgd int putsize;
1054 1.1 cgd
1055 1.1 cgd putsize = 1;
1056 1.1 cgd m2 = *mb;
1057 1.12 mycroft left = M_TRAILINGSPACE(m2);
1058 1.1 cgd if (left > 0) {
1059 1.22 cgd tl = ((u_int32_t *)(*bpos));
1060 1.1 cgd *tl++ = txdr_unsigned(siz);
1061 1.1 cgd putsize = 0;
1062 1.1 cgd left -= NFSX_UNSIGNED;
1063 1.1 cgd m2->m_len += NFSX_UNSIGNED;
1064 1.1 cgd if (left > 0) {
1065 1.183 christos memcpy((void *) tl, cp, left);
1066 1.1 cgd siz -= left;
1067 1.1 cgd cp += left;
1068 1.1 cgd m2->m_len += left;
1069 1.1 cgd left = 0;
1070 1.1 cgd }
1071 1.1 cgd }
1072 1.12 mycroft /* Loop around adding mbufs */
1073 1.1 cgd while (siz > 0) {
1074 1.109 matt m1 = m_get(M_WAIT, MT_DATA);
1075 1.109 matt MCLAIM(m1, &nfs_mowner);
1076 1.1 cgd if (siz > MLEN)
1077 1.109 matt m_clget(m1, M_WAIT);
1078 1.1 cgd m1->m_len = NFSMSIZ(m1);
1079 1.1 cgd m2->m_next = m1;
1080 1.1 cgd m2 = m1;
1081 1.22 cgd tl = mtod(m1, u_int32_t *);
1082 1.1 cgd tlen = 0;
1083 1.1 cgd if (putsize) {
1084 1.1 cgd *tl++ = txdr_unsigned(siz);
1085 1.1 cgd m1->m_len -= NFSX_UNSIGNED;
1086 1.1 cgd tlen = NFSX_UNSIGNED;
1087 1.1 cgd putsize = 0;
1088 1.1 cgd }
1089 1.1 cgd if (siz < m1->m_len) {
1090 1.1 cgd len = nfsm_rndup(siz);
1091 1.1 cgd xfer = siz;
1092 1.1 cgd if (xfer < len)
1093 1.1 cgd *(tl+(xfer>>2)) = 0;
1094 1.1 cgd } else {
1095 1.1 cgd xfer = len = m1->m_len;
1096 1.1 cgd }
1097 1.183 christos memcpy((void *) tl, cp, xfer);
1098 1.1 cgd m1->m_len = len+tlen;
1099 1.1 cgd siz -= xfer;
1100 1.1 cgd cp += xfer;
1101 1.1 cgd }
1102 1.1 cgd *mb = m1;
1103 1.183 christos *bpos = mtod(m1, char *) + m1->m_len;
1104 1.1 cgd return (0);
1105 1.1 cgd }
1106 1.1 cgd
1107 1.49 fvdl /*
1108 1.49 fvdl * Directory caching routines. They work as follows:
1109 1.49 fvdl * - a cache is maintained per VDIR nfsnode.
1110 1.49 fvdl * - for each offset cookie that is exported to userspace, and can
1111 1.49 fvdl * thus be thrown back at us as an offset to VOP_READDIR, store
1112 1.49 fvdl * information in the cache.
1113 1.49 fvdl * - cached are:
1114 1.49 fvdl * - cookie itself
1115 1.49 fvdl * - blocknumber (essentially just a search key in the buffer cache)
1116 1.49 fvdl * - entry number in block.
1117 1.49 fvdl * - offset cookie of block in which this entry is stored
1118 1.49 fvdl * - 32 bit cookie if NFSMNT_XLATECOOKIE is used.
1119 1.49 fvdl * - entries are looked up in a hash table
1120 1.49 fvdl * - also maintained is an LRU list of entries, used to determine
1121 1.49 fvdl * which ones to delete if the cache grows too large.
1122 1.49 fvdl * - if 32 <-> 64 translation mode is requested for a filesystem,
1123 1.49 fvdl * the cache also functions as a translation table
1124 1.49 fvdl * - in the translation case, invalidating the cache does not mean
1125 1.49 fvdl * flushing it, but just marking entries as invalid, except for
1126 1.49 fvdl * the <64bit cookie, 32bitcookie> pair which is still valid, to
1127 1.49 fvdl * still be able to use the cache as a translation table.
1128 1.49 fvdl * - 32 bit cookies are uniquely created by combining the hash table
1129 1.49 fvdl * entry value, and one generation count per hash table entry,
1130 1.49 fvdl * incremented each time an entry is appended to the chain.
1131 1.49 fvdl * - the cache is invalidated each time a direcory is modified
1132 1.49 fvdl * - sanity checks are also done; if an entry in a block turns
1133 1.49 fvdl * out not to have a matching cookie, the cache is invalidated
1134 1.49 fvdl * and a new block starting from the wanted offset is fetched from
1135 1.49 fvdl * the server.
1136 1.49 fvdl * - directory entries as read from the server are extended to contain
1137 1.49 fvdl * the 64bit and, optionally, the 32bit cookies, for sanity checking
1138 1.49 fvdl * the cache and exporting them to userspace through the cookie
1139 1.49 fvdl * argument to VOP_READDIR.
1140 1.49 fvdl */
1141 1.49 fvdl
1142 1.46 fvdl u_long
1143 1.214 dsl nfs_dirhash(off_t off)
1144 1.46 fvdl {
1145 1.46 fvdl int i;
1146 1.46 fvdl char *cp = (char *)&off;
1147 1.46 fvdl u_long sum = 0L;
1148 1.46 fvdl
1149 1.46 fvdl for (i = 0 ; i < sizeof (off); i++)
1150 1.46 fvdl sum += *cp++;
1151 1.46 fvdl
1152 1.46 fvdl return sum;
1153 1.46 fvdl }
1154 1.46 fvdl
1155 1.135 yamt #define _NFSDC_MTX(np) (&NFSTOV(np)->v_interlock)
1156 1.195 ad #define NFSDC_LOCK(np) mutex_enter(_NFSDC_MTX(np))
1157 1.195 ad #define NFSDC_UNLOCK(np) mutex_exit(_NFSDC_MTX(np))
1158 1.195 ad #define NFSDC_ASSERT_LOCKED(np) KASSERT(mutex_owned(_NFSDC_MTX(np)))
1159 1.135 yamt
1160 1.49 fvdl void
1161 1.214 dsl nfs_initdircache(struct vnode *vp)
1162 1.49 fvdl {
1163 1.49 fvdl struct nfsnode *np = VTONFS(vp);
1164 1.135 yamt struct nfsdirhashhead *dircache;
1165 1.120 yamt
1166 1.202 ad dircache = hashinit(NFS_DIRHASHSIZ, HASH_LIST, true,
1167 1.202 ad &nfsdirhashmask);
1168 1.49 fvdl
1169 1.135 yamt NFSDC_LOCK(np);
1170 1.135 yamt if (np->n_dircache == NULL) {
1171 1.135 yamt np->n_dircachesize = 0;
1172 1.135 yamt np->n_dircache = dircache;
1173 1.135 yamt dircache = NULL;
1174 1.135 yamt TAILQ_INIT(&np->n_dirchain);
1175 1.135 yamt }
1176 1.135 yamt NFSDC_UNLOCK(np);
1177 1.135 yamt if (dircache)
1178 1.202 ad hashdone(dircache, HASH_LIST, nfsdirhashmask);
1179 1.120 yamt }
1180 1.120 yamt
1181 1.120 yamt void
1182 1.214 dsl nfs_initdirxlatecookie(struct vnode *vp)
1183 1.120 yamt {
1184 1.120 yamt struct nfsnode *np = VTONFS(vp);
1185 1.135 yamt unsigned *dirgens;
1186 1.120 yamt
1187 1.120 yamt KASSERT(VFSTONFS(vp->v_mount)->nm_flag & NFSMNT_XLATECOOKIE);
1188 1.120 yamt
1189 1.196 yamt dirgens = kmem_zalloc(NFS_DIRHASHSIZ * sizeof(unsigned), KM_SLEEP);
1190 1.135 yamt NFSDC_LOCK(np);
1191 1.135 yamt if (np->n_dirgens == NULL) {
1192 1.135 yamt np->n_dirgens = dirgens;
1193 1.135 yamt dirgens = NULL;
1194 1.135 yamt }
1195 1.135 yamt NFSDC_UNLOCK(np);
1196 1.135 yamt if (dirgens)
1197 1.196 yamt kmem_free(dirgens, NFS_DIRHASHSIZ * sizeof(unsigned));
1198 1.135 yamt }
1199 1.135 yamt
1200 1.135 yamt static const struct nfsdircache dzero;
1201 1.135 yamt
1202 1.213 dsl static void nfs_unlinkdircache(struct nfsnode *np, struct nfsdircache *);
1203 1.213 dsl static void nfs_putdircache_unlocked(struct nfsnode *,
1204 1.213 dsl struct nfsdircache *);
1205 1.135 yamt
1206 1.135 yamt static void
1207 1.214 dsl nfs_unlinkdircache(struct nfsnode *np, struct nfsdircache *ndp)
1208 1.135 yamt {
1209 1.135 yamt
1210 1.135 yamt NFSDC_ASSERT_LOCKED(np);
1211 1.135 yamt KASSERT(ndp != &dzero);
1212 1.135 yamt
1213 1.135 yamt if (LIST_NEXT(ndp, dc_hash) == (void *)-1)
1214 1.135 yamt return;
1215 1.135 yamt
1216 1.135 yamt TAILQ_REMOVE(&np->n_dirchain, ndp, dc_chain);
1217 1.135 yamt LIST_REMOVE(ndp, dc_hash);
1218 1.135 yamt LIST_NEXT(ndp, dc_hash) = (void *)-1; /* mark as unlinked */
1219 1.135 yamt
1220 1.135 yamt nfs_putdircache_unlocked(np, ndp);
1221 1.135 yamt }
1222 1.135 yamt
1223 1.135 yamt void
1224 1.214 dsl nfs_putdircache(struct nfsnode *np, struct nfsdircache *ndp)
1225 1.135 yamt {
1226 1.135 yamt int ref;
1227 1.135 yamt
1228 1.135 yamt if (ndp == &dzero)
1229 1.135 yamt return;
1230 1.135 yamt
1231 1.135 yamt KASSERT(ndp->dc_refcnt > 0);
1232 1.135 yamt NFSDC_LOCK(np);
1233 1.135 yamt ref = --ndp->dc_refcnt;
1234 1.135 yamt NFSDC_UNLOCK(np);
1235 1.135 yamt
1236 1.135 yamt if (ref == 0)
1237 1.196 yamt kmem_free(ndp, sizeof(*ndp));
1238 1.49 fvdl }
1239 1.49 fvdl
1240 1.135 yamt static void
1241 1.177 yamt nfs_putdircache_unlocked(struct nfsnode *np, struct nfsdircache *ndp)
1242 1.135 yamt {
1243 1.135 yamt int ref;
1244 1.135 yamt
1245 1.135 yamt NFSDC_ASSERT_LOCKED(np);
1246 1.135 yamt
1247 1.135 yamt if (ndp == &dzero)
1248 1.135 yamt return;
1249 1.135 yamt
1250 1.135 yamt KASSERT(ndp->dc_refcnt > 0);
1251 1.135 yamt ref = --ndp->dc_refcnt;
1252 1.135 yamt if (ref == 0)
1253 1.196 yamt kmem_free(ndp, sizeof(*ndp));
1254 1.135 yamt }
1255 1.46 fvdl
1256 1.46 fvdl struct nfsdircache *
1257 1.214 dsl nfs_searchdircache(struct vnode *vp, off_t off, int do32, int *hashent)
1258 1.49 fvdl {
1259 1.49 fvdl struct nfsdirhashhead *ndhp;
1260 1.49 fvdl struct nfsdircache *ndp = NULL;
1261 1.49 fvdl struct nfsnode *np = VTONFS(vp);
1262 1.49 fvdl unsigned ent;
1263 1.49 fvdl
1264 1.49 fvdl /*
1265 1.49 fvdl * Zero is always a valid cookie.
1266 1.49 fvdl */
1267 1.49 fvdl if (off == 0)
1268 1.149 christos /* XXXUNCONST */
1269 1.149 christos return (struct nfsdircache *)__UNCONST(&dzero);
1270 1.49 fvdl
1271 1.134 yamt if (!np->n_dircache)
1272 1.134 yamt return NULL;
1273 1.134 yamt
1274 1.49 fvdl /*
1275 1.49 fvdl * We use a 32bit cookie as search key, directly reconstruct
1276 1.49 fvdl * the hashentry. Else use the hashfunction.
1277 1.49 fvdl */
1278 1.49 fvdl if (do32) {
1279 1.49 fvdl ent = (u_int32_t)off >> 24;
1280 1.49 fvdl if (ent >= NFS_DIRHASHSIZ)
1281 1.49 fvdl return NULL;
1282 1.49 fvdl ndhp = &np->n_dircache[ent];
1283 1.49 fvdl } else {
1284 1.49 fvdl ndhp = NFSDIRHASH(np, off);
1285 1.49 fvdl }
1286 1.49 fvdl
1287 1.49 fvdl if (hashent)
1288 1.49 fvdl *hashent = (int)(ndhp - np->n_dircache);
1289 1.135 yamt
1290 1.135 yamt NFSDC_LOCK(np);
1291 1.49 fvdl if (do32) {
1292 1.113 yamt LIST_FOREACH(ndp, ndhp, dc_hash) {
1293 1.49 fvdl if (ndp->dc_cookie32 == (u_int32_t)off) {
1294 1.49 fvdl /*
1295 1.49 fvdl * An invalidated entry will become the
1296 1.49 fvdl * start of a new block fetched from
1297 1.49 fvdl * the server.
1298 1.49 fvdl */
1299 1.135 yamt if (ndp->dc_flags & NFSDC_INVALID) {
1300 1.49 fvdl ndp->dc_blkcookie = ndp->dc_cookie;
1301 1.49 fvdl ndp->dc_entry = 0;
1302 1.135 yamt ndp->dc_flags &= ~NFSDC_INVALID;
1303 1.49 fvdl }
1304 1.49 fvdl break;
1305 1.49 fvdl }
1306 1.49 fvdl }
1307 1.49 fvdl } else {
1308 1.113 yamt LIST_FOREACH(ndp, ndhp, dc_hash) {
1309 1.49 fvdl if (ndp->dc_cookie == off)
1310 1.49 fvdl break;
1311 1.113 yamt }
1312 1.49 fvdl }
1313 1.135 yamt if (ndp != NULL)
1314 1.135 yamt ndp->dc_refcnt++;
1315 1.135 yamt NFSDC_UNLOCK(np);
1316 1.49 fvdl return ndp;
1317 1.49 fvdl }
1318 1.49 fvdl
1319 1.49 fvdl
1320 1.49 fvdl struct nfsdircache *
1321 1.171 christos nfs_enterdircache(struct vnode *vp, off_t off, off_t blkoff, int en,
1322 1.177 yamt daddr_t blkno)
1323 1.46 fvdl {
1324 1.46 fvdl struct nfsnode *np = VTONFS(vp);
1325 1.46 fvdl struct nfsdirhashhead *ndhp;
1326 1.135 yamt struct nfsdircache *ndp = NULL;
1327 1.135 yamt struct nfsdircache *newndp = NULL;
1328 1.49 fvdl struct nfsmount *nmp = VFSTONFS(vp->v_mount);
1329 1.161 christos int hashent = 0, gen, overwrite; /* XXX: GCC */
1330 1.46 fvdl
1331 1.135 yamt /*
1332 1.135 yamt * XXX refuse entries for offset 0. amd(8) erroneously sets
1333 1.135 yamt * cookie 0 for the '.' entry, making this necessary. This
1334 1.135 yamt * isn't so bad, as 0 is a special case anyway.
1335 1.135 yamt */
1336 1.135 yamt if (off == 0)
1337 1.149 christos /* XXXUNCONST */
1338 1.149 christos return (struct nfsdircache *)__UNCONST(&dzero);
1339 1.135 yamt
1340 1.49 fvdl if (!np->n_dircache)
1341 1.49 fvdl /*
1342 1.49 fvdl * XXX would like to do this in nfs_nget but vtype
1343 1.49 fvdl * isn't known at that time.
1344 1.49 fvdl */
1345 1.49 fvdl nfs_initdircache(vp);
1346 1.50 fvdl
1347 1.120 yamt if ((nmp->nm_flag & NFSMNT_XLATECOOKIE) && !np->n_dirgens)
1348 1.120 yamt nfs_initdirxlatecookie(vp);
1349 1.120 yamt
1350 1.135 yamt retry:
1351 1.49 fvdl ndp = nfs_searchdircache(vp, off, 0, &hashent);
1352 1.49 fvdl
1353 1.135 yamt NFSDC_LOCK(np);
1354 1.135 yamt if (ndp && (ndp->dc_flags & NFSDC_INVALID) == 0) {
1355 1.49 fvdl /*
1356 1.49 fvdl * Overwriting an old entry. Check if it's the same.
1357 1.49 fvdl * If so, just return. If not, remove the old entry.
1358 1.49 fvdl */
1359 1.49 fvdl if (ndp->dc_blkcookie == blkoff && ndp->dc_entry == en)
1360 1.135 yamt goto done;
1361 1.135 yamt nfs_unlinkdircache(np, ndp);
1362 1.135 yamt nfs_putdircache_unlocked(np, ndp);
1363 1.135 yamt ndp = NULL;
1364 1.46 fvdl }
1365 1.46 fvdl
1366 1.49 fvdl ndhp = &np->n_dircache[hashent];
1367 1.46 fvdl
1368 1.49 fvdl if (!ndp) {
1369 1.135 yamt if (newndp == NULL) {
1370 1.135 yamt NFSDC_UNLOCK(np);
1371 1.196 yamt newndp = kmem_alloc(sizeof(*newndp), KM_SLEEP);
1372 1.135 yamt newndp->dc_refcnt = 1;
1373 1.135 yamt LIST_NEXT(newndp, dc_hash) = (void *)-1;
1374 1.135 yamt goto retry;
1375 1.135 yamt }
1376 1.135 yamt ndp = newndp;
1377 1.135 yamt newndp = NULL;
1378 1.49 fvdl overwrite = 0;
1379 1.49 fvdl if (nmp->nm_flag & NFSMNT_XLATECOOKIE) {
1380 1.49 fvdl /*
1381 1.49 fvdl * We're allocating a new entry, so bump the
1382 1.49 fvdl * generation number.
1383 1.49 fvdl */
1384 1.160 christos KASSERT(np->n_dirgens);
1385 1.49 fvdl gen = ++np->n_dirgens[hashent];
1386 1.49 fvdl if (gen == 0) {
1387 1.49 fvdl np->n_dirgens[hashent]++;
1388 1.49 fvdl gen++;
1389 1.49 fvdl }
1390 1.49 fvdl ndp->dc_cookie32 = (hashent << 24) | (gen & 0xffffff);
1391 1.49 fvdl }
1392 1.49 fvdl } else
1393 1.49 fvdl overwrite = 1;
1394 1.46 fvdl
1395 1.49 fvdl ndp->dc_cookie = off;
1396 1.49 fvdl ndp->dc_blkcookie = blkoff;
1397 1.46 fvdl ndp->dc_entry = en;
1398 1.137 yamt ndp->dc_flags = 0;
1399 1.46 fvdl
1400 1.49 fvdl if (overwrite)
1401 1.135 yamt goto done;
1402 1.49 fvdl
1403 1.46 fvdl /*
1404 1.46 fvdl * If the maximum directory cookie cache size has been reached
1405 1.46 fvdl * for this node, take one off the front. The idea is that
1406 1.46 fvdl * directories are typically read front-to-back once, so that
1407 1.46 fvdl * the oldest entries can be thrown away without much performance
1408 1.46 fvdl * loss.
1409 1.46 fvdl */
1410 1.46 fvdl if (np->n_dircachesize == NFS_MAXDIRCACHE) {
1411 1.135 yamt nfs_unlinkdircache(np, TAILQ_FIRST(&np->n_dirchain));
1412 1.46 fvdl } else
1413 1.46 fvdl np->n_dircachesize++;
1414 1.148 perry
1415 1.135 yamt KASSERT(ndp->dc_refcnt == 1);
1416 1.46 fvdl LIST_INSERT_HEAD(ndhp, ndp, dc_hash);
1417 1.46 fvdl TAILQ_INSERT_TAIL(&np->n_dirchain, ndp, dc_chain);
1418 1.135 yamt ndp->dc_refcnt++;
1419 1.135 yamt done:
1420 1.135 yamt KASSERT(ndp->dc_refcnt > 0);
1421 1.135 yamt NFSDC_UNLOCK(np);
1422 1.135 yamt if (newndp)
1423 1.135 yamt nfs_putdircache(np, newndp);
1424 1.46 fvdl return ndp;
1425 1.46 fvdl }
1426 1.46 fvdl
1427 1.46 fvdl void
1428 1.214 dsl nfs_invaldircache(struct vnode *vp, int flags)
1429 1.46 fvdl {
1430 1.46 fvdl struct nfsnode *np = VTONFS(vp);
1431 1.46 fvdl struct nfsdircache *ndp = NULL;
1432 1.49 fvdl struct nfsmount *nmp = VFSTONFS(vp->v_mount);
1433 1.181 thorpej const bool forcefree = flags & NFS_INVALDIRCACHE_FORCE;
1434 1.46 fvdl
1435 1.46 fvdl #ifdef DIAGNOSTIC
1436 1.46 fvdl if (vp->v_type != VDIR)
1437 1.46 fvdl panic("nfs: invaldircache: not dir");
1438 1.46 fvdl #endif
1439 1.46 fvdl
1440 1.145 yamt if ((flags & NFS_INVALDIRCACHE_KEEPEOF) == 0)
1441 1.145 yamt np->n_flag &= ~NEOFVALID;
1442 1.144 yamt
1443 1.46 fvdl if (!np->n_dircache)
1444 1.46 fvdl return;
1445 1.46 fvdl
1446 1.135 yamt NFSDC_LOCK(np);
1447 1.49 fvdl if (!(nmp->nm_flag & NFSMNT_XLATECOOKIE) || forcefree) {
1448 1.135 yamt while ((ndp = TAILQ_FIRST(&np->n_dirchain)) != NULL) {
1449 1.135 yamt KASSERT(!forcefree || ndp->dc_refcnt == 1);
1450 1.135 yamt nfs_unlinkdircache(np, ndp);
1451 1.49 fvdl }
1452 1.49 fvdl np->n_dircachesize = 0;
1453 1.49 fvdl if (forcefree && np->n_dirgens) {
1454 1.196 yamt kmem_free(np->n_dirgens,
1455 1.196 yamt NFS_DIRHASHSIZ * sizeof(unsigned));
1456 1.120 yamt np->n_dirgens = NULL;
1457 1.49 fvdl }
1458 1.49 fvdl } else {
1459 1.135 yamt TAILQ_FOREACH(ndp, &np->n_dirchain, dc_chain)
1460 1.135 yamt ndp->dc_flags |= NFSDC_INVALID;
1461 1.46 fvdl }
1462 1.46 fvdl
1463 1.135 yamt NFSDC_UNLOCK(np);
1464 1.46 fvdl }
1465 1.46 fvdl
1466 1.1 cgd /*
1467 1.35 thorpej * Called once before VFS init to initialize shared and
1468 1.35 thorpej * server-specific data structures.
1469 1.1 cgd */
1470 1.157 yamt static int
1471 1.155 thorpej nfs_init0(void)
1472 1.1 cgd {
1473 1.189 ad
1474 1.12 mycroft nfsrtt.pos = 0;
1475 1.1 cgd rpc_vers = txdr_unsigned(RPC_VER2);
1476 1.1 cgd rpc_call = txdr_unsigned(RPC_CALL);
1477 1.1 cgd rpc_reply = txdr_unsigned(RPC_REPLY);
1478 1.1 cgd rpc_msgdenied = txdr_unsigned(RPC_MSGDENIED);
1479 1.1 cgd rpc_msgaccepted = txdr_unsigned(RPC_MSGACCEPTED);
1480 1.1 cgd rpc_mismatch = txdr_unsigned(RPC_MISMATCH);
1481 1.12 mycroft rpc_autherr = txdr_unsigned(RPC_AUTHERR);
1482 1.1 cgd rpc_auth_unix = txdr_unsigned(RPCAUTH_UNIX);
1483 1.25 fvdl rpc_auth_kerb = txdr_unsigned(RPCAUTH_KERB4);
1484 1.1 cgd nfs_prog = txdr_unsigned(NFS_PROG);
1485 1.182 thorpej nfs_true = txdr_unsigned(true);
1486 1.182 thorpej nfs_false = txdr_unsigned(false);
1487 1.12 mycroft nfs_xdrneg1 = txdr_unsigned(-1);
1488 1.25 fvdl nfs_ticks = (hz * NFS_TICKINTVL + 500) / 1000;
1489 1.25 fvdl if (nfs_ticks < 1)
1490 1.25 fvdl nfs_ticks = 1;
1491 1.207 pooka nfs_xid = arc4random();
1492 1.164 yamt nfsdreq_init();
1493 1.164 yamt
1494 1.1 cgd /*
1495 1.1 cgd * Initialize reply list and start timer
1496 1.1 cgd */
1497 1.16 mycroft TAILQ_INIT(&nfs_reqq);
1498 1.191 yamt nfs_timer_init();
1499 1.109 matt MOWNER_ATTACH(&nfs_mowner);
1500 1.106 jdolecek
1501 1.157 yamt return 0;
1502 1.1 cgd }
1503 1.1 cgd
1504 1.210 ad /*
1505 1.210 ad * This is disgusting, but it must support both modular and monolothic
1506 1.210 ad * configurations. For monolithic builds NFSSERVER may not imply NFS.
1507 1.210 ad *
1508 1.210 ad * Yuck.
1509 1.210 ad */
1510 1.155 thorpej void
1511 1.155 thorpej nfs_init(void)
1512 1.155 thorpej {
1513 1.155 thorpej static ONCE_DECL(nfs_init_once);
1514 1.155 thorpej
1515 1.155 thorpej RUN_ONCE(&nfs_init_once, nfs_init0);
1516 1.155 thorpej }
1517 1.155 thorpej
1518 1.210 ad void
1519 1.210 ad nfs_fini(void)
1520 1.210 ad {
1521 1.210 ad
1522 1.210 ad nfsdreq_fini();
1523 1.210 ad nfs_timer_fini();
1524 1.210 ad MOWNER_DETACH(&nfs_mowner);
1525 1.210 ad }
1526 1.210 ad
1527 1.1 cgd /*
1528 1.118 yamt * A fiddled version of m_adj() that ensures null fill to a 32-bit
1529 1.1 cgd * boundary and only trims off the back end
1530 1.122 yamt *
1531 1.122 yamt * 1. trim off 'len' bytes as m_adj(mp, -len).
1532 1.122 yamt * 2. add zero-padding 'nul' bytes at the end of the mbuf chain.
1533 1.1 cgd */
1534 1.12 mycroft void
1535 1.214 dsl nfs_zeropad(struct mbuf *mp, int len, int nul)
1536 1.1 cgd {
1537 1.75 augustss struct mbuf *m;
1538 1.130 yamt int count;
1539 1.1 cgd
1540 1.1 cgd /*
1541 1.1 cgd * Trim from tail. Scan the mbuf chain,
1542 1.1 cgd * calculating its length and finding the last mbuf.
1543 1.1 cgd * If the adjustment only affects this mbuf, then just
1544 1.1 cgd * adjust and return. Otherwise, rescan and truncate
1545 1.1 cgd * after the remaining size.
1546 1.1 cgd */
1547 1.1 cgd count = 0;
1548 1.1 cgd m = mp;
1549 1.1 cgd for (;;) {
1550 1.1 cgd count += m->m_len;
1551 1.122 yamt if (m->m_next == NULL)
1552 1.1 cgd break;
1553 1.1 cgd m = m->m_next;
1554 1.1 cgd }
1555 1.122 yamt
1556 1.122 yamt KDASSERT(count >= len);
1557 1.122 yamt
1558 1.122 yamt if (m->m_len >= len) {
1559 1.1 cgd m->m_len -= len;
1560 1.122 yamt } else {
1561 1.122 yamt count -= len;
1562 1.122 yamt /*
1563 1.122 yamt * Correct length for chain is "count".
1564 1.122 yamt * Find the mbuf with last data, adjust its length,
1565 1.122 yamt * and toss data from remaining mbufs on chain.
1566 1.122 yamt */
1567 1.122 yamt for (m = mp; m; m = m->m_next) {
1568 1.122 yamt if (m->m_len >= count) {
1569 1.122 yamt m->m_len = count;
1570 1.122 yamt break;
1571 1.118 yamt }
1572 1.122 yamt count -= m->m_len;
1573 1.1 cgd }
1574 1.159 christos KASSERT(m && m->m_next);
1575 1.122 yamt m_freem(m->m_next);
1576 1.122 yamt m->m_next = NULL;
1577 1.1 cgd }
1578 1.122 yamt
1579 1.130 yamt KDASSERT(m->m_next == NULL);
1580 1.130 yamt
1581 1.122 yamt /*
1582 1.122 yamt * zero-padding.
1583 1.122 yamt */
1584 1.122 yamt if (nul > 0) {
1585 1.130 yamt char *cp;
1586 1.130 yamt int i;
1587 1.130 yamt
1588 1.122 yamt if (M_ROMAP(m) || M_TRAILINGSPACE(m) < nul) {
1589 1.122 yamt struct mbuf *n;
1590 1.122 yamt
1591 1.122 yamt KDASSERT(MLEN >= nul);
1592 1.122 yamt n = m_get(M_WAIT, MT_DATA);
1593 1.122 yamt MCLAIM(n, &nfs_mowner);
1594 1.122 yamt n->m_len = nul;
1595 1.130 yamt n->m_next = NULL;
1596 1.122 yamt m->m_next = n;
1597 1.183 christos cp = mtod(n, void *);
1598 1.122 yamt } else {
1599 1.183 christos cp = mtod(m, char *) + m->m_len;
1600 1.122 yamt m->m_len += nul;
1601 1.1 cgd }
1602 1.122 yamt for (i = 0; i < nul; i++)
1603 1.122 yamt *cp++ = '\0';
1604 1.1 cgd }
1605 1.122 yamt return;
1606 1.1 cgd }
1607 1.1 cgd
1608 1.1 cgd /*
1609 1.25 fvdl * Make these functions instead of macros, so that the kernel text size
1610 1.25 fvdl * doesn't get too big...
1611 1.25 fvdl */
1612 1.25 fvdl void
1613 1.214 dsl nfsm_srvwcc(struct nfsrv_descript *nfsd, int before_ret, struct vattr *before_vap, int after_ret, struct vattr *after_vap, struct mbuf **mbp, char **bposp)
1614 1.25 fvdl {
1615 1.109 matt struct mbuf *mb = *mbp;
1616 1.75 augustss char *bpos = *bposp;
1617 1.75 augustss u_int32_t *tl;
1618 1.25 fvdl
1619 1.25 fvdl if (before_ret) {
1620 1.25 fvdl nfsm_build(tl, u_int32_t *, NFSX_UNSIGNED);
1621 1.25 fvdl *tl = nfs_false;
1622 1.25 fvdl } else {
1623 1.25 fvdl nfsm_build(tl, u_int32_t *, 7 * NFSX_UNSIGNED);
1624 1.25 fvdl *tl++ = nfs_true;
1625 1.66 fair txdr_hyper(before_vap->va_size, tl);
1626 1.25 fvdl tl += 2;
1627 1.25 fvdl txdr_nfsv3time(&(before_vap->va_mtime), tl);
1628 1.25 fvdl tl += 2;
1629 1.25 fvdl txdr_nfsv3time(&(before_vap->va_ctime), tl);
1630 1.25 fvdl }
1631 1.25 fvdl *bposp = bpos;
1632 1.25 fvdl *mbp = mb;
1633 1.25 fvdl nfsm_srvpostopattr(nfsd, after_ret, after_vap, mbp, bposp);
1634 1.25 fvdl }
1635 1.25 fvdl
1636 1.25 fvdl void
1637 1.214 dsl nfsm_srvpostopattr(struct nfsrv_descript *nfsd, int after_ret, struct vattr *after_vap, struct mbuf **mbp, char **bposp)
1638 1.25 fvdl {
1639 1.109 matt struct mbuf *mb = *mbp;
1640 1.75 augustss char *bpos = *bposp;
1641 1.75 augustss u_int32_t *tl;
1642 1.75 augustss struct nfs_fattr *fp;
1643 1.25 fvdl
1644 1.25 fvdl if (after_ret) {
1645 1.25 fvdl nfsm_build(tl, u_int32_t *, NFSX_UNSIGNED);
1646 1.25 fvdl *tl = nfs_false;
1647 1.25 fvdl } else {
1648 1.25 fvdl nfsm_build(tl, u_int32_t *, NFSX_UNSIGNED + NFSX_V3FATTR);
1649 1.25 fvdl *tl++ = nfs_true;
1650 1.25 fvdl fp = (struct nfs_fattr *)tl;
1651 1.25 fvdl nfsm_srvfattr(nfsd, after_vap, fp);
1652 1.25 fvdl }
1653 1.25 fvdl *mbp = mb;
1654 1.25 fvdl *bposp = bpos;
1655 1.25 fvdl }
1656 1.25 fvdl
1657 1.25 fvdl void
1658 1.214 dsl nfsm_srvfattr(struct nfsrv_descript *nfsd, struct vattr *vap, struct nfs_fattr *fp)
1659 1.25 fvdl {
1660 1.25 fvdl
1661 1.25 fvdl fp->fa_nlink = txdr_unsigned(vap->va_nlink);
1662 1.25 fvdl fp->fa_uid = txdr_unsigned(vap->va_uid);
1663 1.25 fvdl fp->fa_gid = txdr_unsigned(vap->va_gid);
1664 1.25 fvdl if (nfsd->nd_flag & ND_NFSV3) {
1665 1.25 fvdl fp->fa_type = vtonfsv3_type(vap->va_type);
1666 1.25 fvdl fp->fa_mode = vtonfsv3_mode(vap->va_mode);
1667 1.66 fair txdr_hyper(vap->va_size, &fp->fa3_size);
1668 1.66 fair txdr_hyper(vap->va_bytes, &fp->fa3_used);
1669 1.25 fvdl fp->fa3_rdev.specdata1 = txdr_unsigned(major(vap->va_rdev));
1670 1.25 fvdl fp->fa3_rdev.specdata2 = txdr_unsigned(minor(vap->va_rdev));
1671 1.25 fvdl fp->fa3_fsid.nfsuquad[0] = 0;
1672 1.25 fvdl fp->fa3_fsid.nfsuquad[1] = txdr_unsigned(vap->va_fsid);
1673 1.151 yamt txdr_hyper(vap->va_fileid, &fp->fa3_fileid);
1674 1.25 fvdl txdr_nfsv3time(&vap->va_atime, &fp->fa3_atime);
1675 1.25 fvdl txdr_nfsv3time(&vap->va_mtime, &fp->fa3_mtime);
1676 1.25 fvdl txdr_nfsv3time(&vap->va_ctime, &fp->fa3_ctime);
1677 1.25 fvdl } else {
1678 1.25 fvdl fp->fa_type = vtonfsv2_type(vap->va_type);
1679 1.25 fvdl fp->fa_mode = vtonfsv2_mode(vap->va_type, vap->va_mode);
1680 1.25 fvdl fp->fa2_size = txdr_unsigned(vap->va_size);
1681 1.25 fvdl fp->fa2_blocksize = txdr_unsigned(vap->va_blocksize);
1682 1.25 fvdl if (vap->va_type == VFIFO)
1683 1.25 fvdl fp->fa2_rdev = 0xffffffff;
1684 1.25 fvdl else
1685 1.25 fvdl fp->fa2_rdev = txdr_unsigned(vap->va_rdev);
1686 1.25 fvdl fp->fa2_blocks = txdr_unsigned(vap->va_bytes / NFS_FABLKSIZE);
1687 1.25 fvdl fp->fa2_fsid = txdr_unsigned(vap->va_fsid);
1688 1.25 fvdl fp->fa2_fileid = txdr_unsigned(vap->va_fileid);
1689 1.25 fvdl txdr_nfsv2time(&vap->va_atime, &fp->fa2_atime);
1690 1.25 fvdl txdr_nfsv2time(&vap->va_mtime, &fp->fa2_mtime);
1691 1.25 fvdl txdr_nfsv2time(&vap->va_ctime, &fp->fa2_ctime);
1692 1.25 fvdl }
1693 1.25 fvdl }
1694 1.25 fvdl
1695 1.1 cgd /*
1696 1.182 thorpej * This function compares two net addresses by family and returns true
1697 1.12 mycroft * if they are the same host.
1698 1.182 thorpej * If there is any doubt, return false.
1699 1.12 mycroft * The AF_INET family is handled as a special case so that address mbufs
1700 1.12 mycroft * don't need to be saved to store "struct in_addr", which is only 4 bytes.
1701 1.1 cgd */
1702 1.24 christos int
1703 1.214 dsl netaddr_match(int family, union nethostaddr *haddr, struct mbuf *nam)
1704 1.1 cgd {
1705 1.75 augustss struct sockaddr_in *inetaddr;
1706 1.1 cgd
1707 1.12 mycroft switch (family) {
1708 1.12 mycroft case AF_INET:
1709 1.12 mycroft inetaddr = mtod(nam, struct sockaddr_in *);
1710 1.12 mycroft if (inetaddr->sin_family == AF_INET &&
1711 1.12 mycroft inetaddr->sin_addr.s_addr == haddr->had_inetaddr)
1712 1.12 mycroft return (1);
1713 1.12 mycroft break;
1714 1.76 fvdl case AF_INET6:
1715 1.76 fvdl {
1716 1.76 fvdl struct sockaddr_in6 *sin6_1, *sin6_2;
1717 1.76 fvdl
1718 1.76 fvdl sin6_1 = mtod(nam, struct sockaddr_in6 *);
1719 1.76 fvdl sin6_2 = mtod(haddr->had_nam, struct sockaddr_in6 *);
1720 1.76 fvdl if (sin6_1->sin6_family == AF_INET6 &&
1721 1.76 fvdl IN6_ARE_ADDR_EQUAL(&sin6_1->sin6_addr, &sin6_2->sin6_addr))
1722 1.76 fvdl return 1;
1723 1.76 fvdl }
1724 1.12 mycroft default:
1725 1.12 mycroft break;
1726 1.12 mycroft };
1727 1.12 mycroft return (0);
1728 1.25 fvdl }
1729 1.25 fvdl
1730 1.25 fvdl /*
1731 1.25 fvdl * The write verifier has changed (probably due to a server reboot), so all
1732 1.114 yamt * PG_NEEDCOMMIT pages will have to be written again. Since they are marked
1733 1.117 yamt * as dirty or are being written out just now, all this takes is clearing
1734 1.117 yamt * the PG_NEEDCOMMIT flag. Once done the new write verifier can be set for
1735 1.117 yamt * the mount point.
1736 1.25 fvdl */
1737 1.25 fvdl void
1738 1.214 dsl nfs_clearcommit(struct mount *mp)
1739 1.25 fvdl {
1740 1.89 chs struct vnode *vp;
1741 1.83 fvdl struct nfsnode *np;
1742 1.89 chs struct vm_page *pg;
1743 1.116 yamt struct nfsmount *nmp = VFSTONFS(mp);
1744 1.116 yamt
1745 1.180 yamt rw_enter(&nmp->nm_writeverflock, RW_WRITER);
1746 1.195 ad mutex_enter(&mntvnode_lock);
1747 1.176 reinoud TAILQ_FOREACH(vp, &mp->mnt_vnodelist, v_mntvnodes) {
1748 1.89 chs KASSERT(vp->v_mount == mp);
1749 1.146 yamt if (vp->v_type != VREG)
1750 1.85 enami continue;
1751 1.217 yamt mutex_enter(&vp->v_interlock);
1752 1.217 yamt if (vp->v_iflag & (VI_XLOCK | VI_CLEAN)) {
1753 1.217 yamt mutex_exit(&vp->v_interlock);
1754 1.217 yamt continue;
1755 1.217 yamt }
1756 1.83 fvdl np = VTONFS(vp);
1757 1.83 fvdl np->n_pushlo = np->n_pushhi = np->n_pushedlo =
1758 1.83 fvdl np->n_pushedhi = 0;
1759 1.83 fvdl np->n_commitflags &=
1760 1.83 fvdl ~(NFS_COMMIT_PUSH_VALID | NFS_COMMIT_PUSHED_VALID);
1761 1.204 ad TAILQ_FOREACH(pg, &vp->v_uobj.memq, listq.queue) {
1762 1.89 chs pg->flags &= ~PG_NEEDCOMMIT;
1763 1.25 fvdl }
1764 1.217 yamt mutex_exit(&vp->v_interlock);
1765 1.25 fvdl }
1766 1.195 ad mutex_exit(&mntvnode_lock);
1767 1.186 yamt mutex_enter(&nmp->nm_lock);
1768 1.116 yamt nmp->nm_iflag &= ~NFSMNT_STALEWRITEVERF;
1769 1.186 yamt mutex_exit(&nmp->nm_lock);
1770 1.180 yamt rw_exit(&nmp->nm_writeverflock);
1771 1.83 fvdl }
1772 1.83 fvdl
1773 1.83 fvdl void
1774 1.214 dsl nfs_merge_commit_ranges(struct vnode *vp)
1775 1.83 fvdl {
1776 1.83 fvdl struct nfsnode *np = VTONFS(vp);
1777 1.112 yamt
1778 1.112 yamt KASSERT(np->n_commitflags & NFS_COMMIT_PUSH_VALID);
1779 1.83 fvdl
1780 1.83 fvdl if (!(np->n_commitflags & NFS_COMMIT_PUSHED_VALID)) {
1781 1.83 fvdl np->n_pushedlo = np->n_pushlo;
1782 1.83 fvdl np->n_pushedhi = np->n_pushhi;
1783 1.83 fvdl np->n_commitflags |= NFS_COMMIT_PUSHED_VALID;
1784 1.83 fvdl } else {
1785 1.83 fvdl if (np->n_pushlo < np->n_pushedlo)
1786 1.83 fvdl np->n_pushedlo = np->n_pushlo;
1787 1.83 fvdl if (np->n_pushhi > np->n_pushedhi)
1788 1.83 fvdl np->n_pushedhi = np->n_pushhi;
1789 1.83 fvdl }
1790 1.83 fvdl
1791 1.83 fvdl np->n_pushlo = np->n_pushhi = 0;
1792 1.83 fvdl np->n_commitflags &= ~NFS_COMMIT_PUSH_VALID;
1793 1.83 fvdl
1794 1.111 yamt #ifdef NFS_DEBUG_COMMIT
1795 1.83 fvdl printf("merge: committed: %u - %u\n", (unsigned)np->n_pushedlo,
1796 1.83 fvdl (unsigned)np->n_pushedhi);
1797 1.83 fvdl #endif
1798 1.83 fvdl }
1799 1.83 fvdl
1800 1.83 fvdl int
1801 1.215 dsl nfs_in_committed_range(struct vnode *vp, off_t off, off_t len)
1802 1.83 fvdl {
1803 1.83 fvdl struct nfsnode *np = VTONFS(vp);
1804 1.83 fvdl off_t lo, hi;
1805 1.83 fvdl
1806 1.83 fvdl if (!(np->n_commitflags & NFS_COMMIT_PUSHED_VALID))
1807 1.83 fvdl return 0;
1808 1.89 chs lo = off;
1809 1.89 chs hi = lo + len;
1810 1.83 fvdl
1811 1.83 fvdl return (lo >= np->n_pushedlo && hi <= np->n_pushedhi);
1812 1.83 fvdl }
1813 1.83 fvdl
1814 1.83 fvdl int
1815 1.215 dsl nfs_in_tobecommitted_range(struct vnode *vp, off_t off, off_t len)
1816 1.83 fvdl {
1817 1.83 fvdl struct nfsnode *np = VTONFS(vp);
1818 1.83 fvdl off_t lo, hi;
1819 1.83 fvdl
1820 1.83 fvdl if (!(np->n_commitflags & NFS_COMMIT_PUSH_VALID))
1821 1.83 fvdl return 0;
1822 1.89 chs lo = off;
1823 1.89 chs hi = lo + len;
1824 1.83 fvdl
1825 1.83 fvdl return (lo >= np->n_pushlo && hi <= np->n_pushhi);
1826 1.83 fvdl }
1827 1.83 fvdl
1828 1.83 fvdl void
1829 1.215 dsl nfs_add_committed_range(struct vnode *vp, off_t off, off_t len)
1830 1.83 fvdl {
1831 1.83 fvdl struct nfsnode *np = VTONFS(vp);
1832 1.83 fvdl off_t lo, hi;
1833 1.83 fvdl
1834 1.89 chs lo = off;
1835 1.89 chs hi = lo + len;
1836 1.83 fvdl
1837 1.83 fvdl if (!(np->n_commitflags & NFS_COMMIT_PUSHED_VALID)) {
1838 1.83 fvdl np->n_pushedlo = lo;
1839 1.83 fvdl np->n_pushedhi = hi;
1840 1.83 fvdl np->n_commitflags |= NFS_COMMIT_PUSHED_VALID;
1841 1.83 fvdl } else {
1842 1.83 fvdl if (hi > np->n_pushedhi)
1843 1.83 fvdl np->n_pushedhi = hi;
1844 1.83 fvdl if (lo < np->n_pushedlo)
1845 1.83 fvdl np->n_pushedlo = lo;
1846 1.83 fvdl }
1847 1.111 yamt #ifdef NFS_DEBUG_COMMIT
1848 1.83 fvdl printf("add: committed: %u - %u\n", (unsigned)np->n_pushedlo,
1849 1.83 fvdl (unsigned)np->n_pushedhi);
1850 1.83 fvdl #endif
1851 1.83 fvdl }
1852 1.83 fvdl
1853 1.83 fvdl void
1854 1.215 dsl nfs_del_committed_range(struct vnode *vp, off_t off, off_t len)
1855 1.83 fvdl {
1856 1.83 fvdl struct nfsnode *np = VTONFS(vp);
1857 1.83 fvdl off_t lo, hi;
1858 1.83 fvdl
1859 1.83 fvdl if (!(np->n_commitflags & NFS_COMMIT_PUSHED_VALID))
1860 1.83 fvdl return;
1861 1.83 fvdl
1862 1.89 chs lo = off;
1863 1.89 chs hi = lo + len;
1864 1.83 fvdl
1865 1.83 fvdl if (lo > np->n_pushedhi || hi < np->n_pushedlo)
1866 1.83 fvdl return;
1867 1.83 fvdl if (lo <= np->n_pushedlo)
1868 1.83 fvdl np->n_pushedlo = hi;
1869 1.83 fvdl else if (hi >= np->n_pushedhi)
1870 1.83 fvdl np->n_pushedhi = lo;
1871 1.83 fvdl else {
1872 1.83 fvdl /*
1873 1.83 fvdl * XXX There's only one range. If the deleted range
1874 1.83 fvdl * is in the middle, pick the largest of the
1875 1.83 fvdl * contiguous ranges that it leaves.
1876 1.83 fvdl */
1877 1.83 fvdl if ((np->n_pushedlo - lo) > (hi - np->n_pushedhi))
1878 1.83 fvdl np->n_pushedhi = lo;
1879 1.83 fvdl else
1880 1.83 fvdl np->n_pushedlo = hi;
1881 1.83 fvdl }
1882 1.111 yamt #ifdef NFS_DEBUG_COMMIT
1883 1.83 fvdl printf("del: committed: %u - %u\n", (unsigned)np->n_pushedlo,
1884 1.83 fvdl (unsigned)np->n_pushedhi);
1885 1.83 fvdl #endif
1886 1.83 fvdl }
1887 1.83 fvdl
1888 1.83 fvdl void
1889 1.215 dsl nfs_add_tobecommitted_range(struct vnode *vp, off_t off, off_t len)
1890 1.83 fvdl {
1891 1.83 fvdl struct nfsnode *np = VTONFS(vp);
1892 1.83 fvdl off_t lo, hi;
1893 1.83 fvdl
1894 1.89 chs lo = off;
1895 1.89 chs hi = lo + len;
1896 1.83 fvdl
1897 1.83 fvdl if (!(np->n_commitflags & NFS_COMMIT_PUSH_VALID)) {
1898 1.83 fvdl np->n_pushlo = lo;
1899 1.83 fvdl np->n_pushhi = hi;
1900 1.83 fvdl np->n_commitflags |= NFS_COMMIT_PUSH_VALID;
1901 1.83 fvdl } else {
1902 1.83 fvdl if (lo < np->n_pushlo)
1903 1.83 fvdl np->n_pushlo = lo;
1904 1.83 fvdl if (hi > np->n_pushhi)
1905 1.83 fvdl np->n_pushhi = hi;
1906 1.83 fvdl }
1907 1.111 yamt #ifdef NFS_DEBUG_COMMIT
1908 1.83 fvdl printf("add: tobecommitted: %u - %u\n", (unsigned)np->n_pushlo,
1909 1.83 fvdl (unsigned)np->n_pushhi);
1910 1.83 fvdl #endif
1911 1.83 fvdl }
1912 1.83 fvdl
1913 1.83 fvdl void
1914 1.215 dsl nfs_del_tobecommitted_range(struct vnode *vp, off_t off, off_t len)
1915 1.83 fvdl {
1916 1.83 fvdl struct nfsnode *np = VTONFS(vp);
1917 1.83 fvdl off_t lo, hi;
1918 1.83 fvdl
1919 1.83 fvdl if (!(np->n_commitflags & NFS_COMMIT_PUSH_VALID))
1920 1.83 fvdl return;
1921 1.83 fvdl
1922 1.89 chs lo = off;
1923 1.89 chs hi = lo + len;
1924 1.83 fvdl
1925 1.83 fvdl if (lo > np->n_pushhi || hi < np->n_pushlo)
1926 1.83 fvdl return;
1927 1.83 fvdl
1928 1.83 fvdl if (lo <= np->n_pushlo)
1929 1.83 fvdl np->n_pushlo = hi;
1930 1.83 fvdl else if (hi >= np->n_pushhi)
1931 1.83 fvdl np->n_pushhi = lo;
1932 1.83 fvdl else {
1933 1.83 fvdl /*
1934 1.83 fvdl * XXX There's only one range. If the deleted range
1935 1.83 fvdl * is in the middle, pick the largest of the
1936 1.83 fvdl * contiguous ranges that it leaves.
1937 1.83 fvdl */
1938 1.83 fvdl if ((np->n_pushlo - lo) > (hi - np->n_pushhi))
1939 1.83 fvdl np->n_pushhi = lo;
1940 1.83 fvdl else
1941 1.83 fvdl np->n_pushlo = hi;
1942 1.83 fvdl }
1943 1.111 yamt #ifdef NFS_DEBUG_COMMIT
1944 1.83 fvdl printf("del: tobecommitted: %u - %u\n", (unsigned)np->n_pushlo,
1945 1.83 fvdl (unsigned)np->n_pushhi);
1946 1.83 fvdl #endif
1947 1.25 fvdl }
1948 1.25 fvdl
1949 1.25 fvdl /*
1950 1.25 fvdl * Map errnos to NFS error numbers. For Version 3 also filter out error
1951 1.25 fvdl * numbers not specified for the associated procedure.
1952 1.25 fvdl */
1953 1.25 fvdl int
1954 1.214 dsl nfsrv_errmap(struct nfsrv_descript *nd, int err)
1955 1.25 fvdl {
1956 1.90 jdolecek const short *defaulterrp, *errp;
1957 1.25 fvdl
1958 1.25 fvdl if (nd->nd_flag & ND_NFSV3) {
1959 1.25 fvdl if (nd->nd_procnum <= NFSPROC_COMMIT) {
1960 1.25 fvdl errp = defaulterrp = nfsrv_v3errmap[nd->nd_procnum];
1961 1.25 fvdl while (*++errp) {
1962 1.25 fvdl if (*errp == err)
1963 1.25 fvdl return (err);
1964 1.25 fvdl else if (*errp > err)
1965 1.25 fvdl break;
1966 1.25 fvdl }
1967 1.25 fvdl return ((int)*defaulterrp);
1968 1.25 fvdl } else
1969 1.25 fvdl return (err & 0xffff);
1970 1.25 fvdl }
1971 1.25 fvdl if (err <= ELAST)
1972 1.25 fvdl return ((int)nfsrv_v2errmap[err - 1]);
1973 1.25 fvdl return (NFSERR_IO);
1974 1.25 fvdl }
1975 1.25 fvdl
1976 1.126 yamt u_int32_t
1977 1.216 cegger nfs_getxid(void)
1978 1.126 yamt {
1979 1.126 yamt u_int32_t newxid;
1980 1.126 yamt
1981 1.207 pooka /* get next xid. skip 0 */
1982 1.207 pooka do {
1983 1.207 pooka newxid = atomic_inc_32_nv(&nfs_xid);
1984 1.207 pooka } while (__predict_false(newxid == 0));
1985 1.126 yamt
1986 1.126 yamt return txdr_unsigned(newxid);
1987 1.126 yamt }
1988 1.126 yamt
1989 1.126 yamt /*
1990 1.126 yamt * assign a new xid for existing request.
1991 1.126 yamt * used for NFSERR_JUKEBOX handling.
1992 1.126 yamt */
1993 1.126 yamt void
1994 1.126 yamt nfs_renewxid(struct nfsreq *req)
1995 1.126 yamt {
1996 1.126 yamt u_int32_t xid;
1997 1.126 yamt int off;
1998 1.126 yamt
1999 1.126 yamt xid = nfs_getxid();
2000 1.126 yamt if (req->r_nmp->nm_sotype == SOCK_STREAM)
2001 1.126 yamt off = sizeof(u_int32_t); /* RPC record mark */
2002 1.126 yamt else
2003 1.126 yamt off = 0;
2004 1.126 yamt
2005 1.126 yamt m_copyback(req->r_mreq, off, sizeof(xid), (void *)&xid);
2006 1.126 yamt req->r_xid = xid;
2007 1.1 cgd }
2008