nfs_subs.c revision 1.236 1 1.236 ad /* $NetBSD: nfs_subs.c,v 1.236 2019/12/15 21:11:34 ad Exp $ */
2 1.14 cgd
3 1.1 cgd /*
4 1.12 mycroft * Copyright (c) 1989, 1993
5 1.12 mycroft * The Regents of the University of California. All rights reserved.
6 1.1 cgd *
7 1.1 cgd * This code is derived from software contributed to Berkeley by
8 1.1 cgd * Rick Macklem at The University of Guelph.
9 1.1 cgd *
10 1.1 cgd * Redistribution and use in source and binary forms, with or without
11 1.1 cgd * modification, are permitted provided that the following conditions
12 1.1 cgd * are met:
13 1.1 cgd * 1. Redistributions of source code must retain the above copyright
14 1.1 cgd * notice, this list of conditions and the following disclaimer.
15 1.1 cgd * 2. Redistributions in binary form must reproduce the above copyright
16 1.1 cgd * notice, this list of conditions and the following disclaimer in the
17 1.1 cgd * documentation and/or other materials provided with the distribution.
18 1.127 agc * 3. Neither the name of the University nor the names of its contributors
19 1.1 cgd * may be used to endorse or promote products derived from this software
20 1.1 cgd * without specific prior written permission.
21 1.1 cgd *
22 1.1 cgd * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
23 1.1 cgd * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
24 1.1 cgd * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
25 1.1 cgd * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
26 1.1 cgd * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
27 1.1 cgd * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
28 1.1 cgd * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
29 1.1 cgd * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
30 1.1 cgd * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
31 1.1 cgd * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
32 1.1 cgd * SUCH DAMAGE.
33 1.1 cgd *
34 1.25 fvdl * @(#)nfs_subs.c 8.8 (Berkeley) 5/22/95
35 1.1 cgd */
36 1.1 cgd
37 1.83 fvdl /*
38 1.83 fvdl * Copyright 2000 Wasabi Systems, Inc.
39 1.83 fvdl * All rights reserved.
40 1.83 fvdl *
41 1.83 fvdl * Written by Frank van der Linden for Wasabi Systems, Inc.
42 1.83 fvdl *
43 1.83 fvdl * Redistribution and use in source and binary forms, with or without
44 1.83 fvdl * modification, are permitted provided that the following conditions
45 1.83 fvdl * are met:
46 1.83 fvdl * 1. Redistributions of source code must retain the above copyright
47 1.83 fvdl * notice, this list of conditions and the following disclaimer.
48 1.83 fvdl * 2. Redistributions in binary form must reproduce the above copyright
49 1.83 fvdl * notice, this list of conditions and the following disclaimer in the
50 1.83 fvdl * documentation and/or other materials provided with the distribution.
51 1.83 fvdl * 3. All advertising materials mentioning features or use of this software
52 1.83 fvdl * must display the following acknowledgement:
53 1.83 fvdl * This product includes software developed for the NetBSD Project by
54 1.83 fvdl * Wasabi Systems, Inc.
55 1.83 fvdl * 4. The name of Wasabi Systems, Inc. may not be used to endorse
56 1.83 fvdl * or promote products derived from this software without specific prior
57 1.83 fvdl * written permission.
58 1.83 fvdl *
59 1.83 fvdl * THIS SOFTWARE IS PROVIDED BY WASABI SYSTEMS, INC. ``AS IS'' AND
60 1.83 fvdl * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
61 1.83 fvdl * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
62 1.83 fvdl * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL WASABI SYSTEMS, INC
63 1.83 fvdl * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
64 1.83 fvdl * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
65 1.83 fvdl * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
66 1.83 fvdl * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
67 1.83 fvdl * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
68 1.83 fvdl * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
69 1.83 fvdl * POSSIBILITY OF SUCH DAMAGE.
70 1.83 fvdl */
71 1.99 lukem
72 1.99 lukem #include <sys/cdefs.h>
73 1.236 ad __KERNEL_RCSID(0, "$NetBSD: nfs_subs.c,v 1.236 2019/12/15 21:11:34 ad Exp $");
74 1.83 fvdl
75 1.210 ad #ifdef _KERNEL_OPT
76 1.82 bjh21 #include "opt_nfs.h"
77 1.210 ad #endif
78 1.25 fvdl
79 1.1 cgd /*
80 1.1 cgd * These functions support the macros and help fiddle mbuf chains for
81 1.1 cgd * the nfs op functions. They do things like create the rpc header and
82 1.1 cgd * copy data between mbuf chains and uio lists.
83 1.1 cgd */
84 1.9 mycroft #include <sys/param.h>
85 1.9 mycroft #include <sys/proc.h>
86 1.9 mycroft #include <sys/systm.h>
87 1.9 mycroft #include <sys/kernel.h>
88 1.196 yamt #include <sys/kmem.h>
89 1.9 mycroft #include <sys/mount.h>
90 1.9 mycroft #include <sys/vnode.h>
91 1.9 mycroft #include <sys/namei.h>
92 1.9 mycroft #include <sys/mbuf.h>
93 1.12 mycroft #include <sys/socket.h>
94 1.12 mycroft #include <sys/stat.h>
95 1.98 fvdl #include <sys/filedesc.h>
96 1.30 fvdl #include <sys/time.h>
97 1.43 fvdl #include <sys/dirent.h>
98 1.155 thorpej #include <sys/once.h>
99 1.162 elad #include <sys/kauth.h>
100 1.207 pooka #include <sys/atomic.h>
101 1.222 tls #include <sys/cprng.h>
102 1.1 cgd
103 1.220 uebayasi #include <uvm/uvm.h>
104 1.236 ad #include <uvm/uvm_page_array.h>
105 1.51 mrg
106 1.9 mycroft #include <nfs/rpcv2.h>
107 1.25 fvdl #include <nfs/nfsproto.h>
108 1.9 mycroft #include <nfs/nfsnode.h>
109 1.9 mycroft #include <nfs/nfs.h>
110 1.9 mycroft #include <nfs/xdr_subs.h>
111 1.9 mycroft #include <nfs/nfsm_subs.h>
112 1.12 mycroft #include <nfs/nfsmount.h>
113 1.12 mycroft #include <nfs/nfsrtt.h>
114 1.24 christos #include <nfs/nfs_var.h>
115 1.12 mycroft
116 1.12 mycroft #include <miscfs/specfs/specdev.h>
117 1.24 christos
118 1.12 mycroft #include <netinet/in.h>
119 1.1 cgd
120 1.207 pooka static u_int32_t nfs_xid;
121 1.207 pooka
122 1.218 christos int nuidhash_max = NFS_MAXUIDHASH;
123 1.1 cgd /*
124 1.1 cgd * Data items converted to xdr at startup, since they are constant
125 1.1 cgd * This is kinda hokey, but may save a little time doing byte swaps
126 1.1 cgd */
127 1.22 cgd u_int32_t nfs_xdrneg1;
128 1.22 cgd u_int32_t rpc_call, rpc_vers, rpc_reply, rpc_msgdenied, rpc_autherr,
129 1.25 fvdl rpc_mismatch, rpc_auth_unix, rpc_msgaccepted,
130 1.12 mycroft rpc_auth_kerb;
131 1.179 yamt u_int32_t nfs_prog, nfs_true, nfs_false;
132 1.12 mycroft
133 1.1 cgd /* And other global data */
134 1.90 jdolecek const nfstype nfsv2_type[9] =
135 1.90 jdolecek { NFNON, NFREG, NFDIR, NFBLK, NFCHR, NFLNK, NFNON, NFCHR, NFNON };
136 1.90 jdolecek const nfstype nfsv3_type[9] =
137 1.90 jdolecek { NFNON, NFREG, NFDIR, NFBLK, NFCHR, NFLNK, NFSOCK, NFFIFO, NFNON };
138 1.90 jdolecek const enum vtype nv2tov_type[8] =
139 1.90 jdolecek { VNON, VREG, VDIR, VBLK, VCHR, VLNK, VNON, VNON };
140 1.90 jdolecek const enum vtype nv3tov_type[8] =
141 1.90 jdolecek { VNON, VREG, VDIR, VBLK, VCHR, VLNK, VSOCK, VFIFO };
142 1.25 fvdl int nfs_ticks;
143 1.108 christos
144 1.35 thorpej /* NFS client/server stats. */
145 1.35 thorpej struct nfsstats nfsstats;
146 1.35 thorpej
147 1.25 fvdl /*
148 1.25 fvdl * Mapping of old NFS Version 2 RPC numbers to generic numbers.
149 1.25 fvdl */
150 1.90 jdolecek const int nfsv3_procid[NFS_NPROCS] = {
151 1.25 fvdl NFSPROC_NULL,
152 1.25 fvdl NFSPROC_GETATTR,
153 1.25 fvdl NFSPROC_SETATTR,
154 1.25 fvdl NFSPROC_NOOP,
155 1.25 fvdl NFSPROC_LOOKUP,
156 1.25 fvdl NFSPROC_READLINK,
157 1.25 fvdl NFSPROC_READ,
158 1.25 fvdl NFSPROC_NOOP,
159 1.25 fvdl NFSPROC_WRITE,
160 1.25 fvdl NFSPROC_CREATE,
161 1.25 fvdl NFSPROC_REMOVE,
162 1.25 fvdl NFSPROC_RENAME,
163 1.25 fvdl NFSPROC_LINK,
164 1.25 fvdl NFSPROC_SYMLINK,
165 1.25 fvdl NFSPROC_MKDIR,
166 1.25 fvdl NFSPROC_RMDIR,
167 1.25 fvdl NFSPROC_READDIR,
168 1.25 fvdl NFSPROC_FSSTAT,
169 1.25 fvdl NFSPROC_NOOP,
170 1.25 fvdl NFSPROC_NOOP,
171 1.25 fvdl NFSPROC_NOOP,
172 1.25 fvdl NFSPROC_NOOP,
173 1.25 fvdl NFSPROC_NOOP
174 1.25 fvdl };
175 1.25 fvdl
176 1.25 fvdl /*
177 1.25 fvdl * and the reverse mapping from generic to Version 2 procedure numbers
178 1.25 fvdl */
179 1.90 jdolecek const int nfsv2_procid[NFS_NPROCS] = {
180 1.25 fvdl NFSV2PROC_NULL,
181 1.25 fvdl NFSV2PROC_GETATTR,
182 1.25 fvdl NFSV2PROC_SETATTR,
183 1.25 fvdl NFSV2PROC_LOOKUP,
184 1.25 fvdl NFSV2PROC_NOOP,
185 1.25 fvdl NFSV2PROC_READLINK,
186 1.25 fvdl NFSV2PROC_READ,
187 1.25 fvdl NFSV2PROC_WRITE,
188 1.25 fvdl NFSV2PROC_CREATE,
189 1.25 fvdl NFSV2PROC_MKDIR,
190 1.25 fvdl NFSV2PROC_SYMLINK,
191 1.25 fvdl NFSV2PROC_CREATE,
192 1.25 fvdl NFSV2PROC_REMOVE,
193 1.25 fvdl NFSV2PROC_RMDIR,
194 1.25 fvdl NFSV2PROC_RENAME,
195 1.25 fvdl NFSV2PROC_LINK,
196 1.25 fvdl NFSV2PROC_READDIR,
197 1.25 fvdl NFSV2PROC_NOOP,
198 1.25 fvdl NFSV2PROC_STATFS,
199 1.25 fvdl NFSV2PROC_NOOP,
200 1.25 fvdl NFSV2PROC_NOOP,
201 1.25 fvdl NFSV2PROC_NOOP,
202 1.25 fvdl NFSV2PROC_NOOP,
203 1.25 fvdl };
204 1.25 fvdl
205 1.25 fvdl /*
206 1.25 fvdl * Maps errno values to nfs error numbers.
207 1.25 fvdl * Use NFSERR_IO as the catch all for ones not specifically defined in
208 1.25 fvdl * RFC 1094.
209 1.25 fvdl */
210 1.90 jdolecek static const u_char nfsrv_v2errmap[ELAST] = {
211 1.25 fvdl NFSERR_PERM, NFSERR_NOENT, NFSERR_IO, NFSERR_IO, NFSERR_IO,
212 1.25 fvdl NFSERR_NXIO, NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO,
213 1.25 fvdl NFSERR_IO, NFSERR_IO, NFSERR_ACCES, NFSERR_IO, NFSERR_IO,
214 1.25 fvdl NFSERR_IO, NFSERR_EXIST, NFSERR_IO, NFSERR_NODEV, NFSERR_NOTDIR,
215 1.25 fvdl NFSERR_ISDIR, NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO,
216 1.25 fvdl NFSERR_IO, NFSERR_FBIG, NFSERR_NOSPC, NFSERR_IO, NFSERR_ROFS,
217 1.25 fvdl NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO,
218 1.25 fvdl NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO,
219 1.25 fvdl NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO,
220 1.25 fvdl NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO,
221 1.25 fvdl NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO,
222 1.25 fvdl NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO,
223 1.25 fvdl NFSERR_IO, NFSERR_IO, NFSERR_NAMETOL, NFSERR_IO, NFSERR_IO,
224 1.25 fvdl NFSERR_NOTEMPTY, NFSERR_IO, NFSERR_IO, NFSERR_DQUOT, NFSERR_STALE,
225 1.25 fvdl NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO,
226 1.25 fvdl NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO,
227 1.52 mikel NFSERR_IO, NFSERR_IO,
228 1.25 fvdl };
229 1.25 fvdl
230 1.25 fvdl /*
231 1.25 fvdl * Maps errno values to nfs error numbers.
232 1.25 fvdl * Although it is not obvious whether or not NFS clients really care if
233 1.25 fvdl * a returned error value is in the specified list for the procedure, the
234 1.25 fvdl * safest thing to do is filter them appropriately. For Version 2, the
235 1.25 fvdl * X/Open XNFS document is the only specification that defines error values
236 1.25 fvdl * for each RPC (The RFC simply lists all possible error values for all RPCs),
237 1.25 fvdl * so I have decided to not do this for Version 2.
238 1.25 fvdl * The first entry is the default error return and the rest are the valid
239 1.25 fvdl * errors for that RPC in increasing numeric order.
240 1.25 fvdl */
241 1.90 jdolecek static const short nfsv3err_null[] = {
242 1.25 fvdl 0,
243 1.25 fvdl 0,
244 1.25 fvdl };
245 1.25 fvdl
246 1.90 jdolecek static const short nfsv3err_getattr[] = {
247 1.25 fvdl NFSERR_IO,
248 1.25 fvdl NFSERR_IO,
249 1.25 fvdl NFSERR_STALE,
250 1.25 fvdl NFSERR_BADHANDLE,
251 1.25 fvdl NFSERR_SERVERFAULT,
252 1.25 fvdl 0,
253 1.25 fvdl };
254 1.25 fvdl
255 1.90 jdolecek static const short nfsv3err_setattr[] = {
256 1.25 fvdl NFSERR_IO,
257 1.25 fvdl NFSERR_PERM,
258 1.25 fvdl NFSERR_IO,
259 1.25 fvdl NFSERR_ACCES,
260 1.25 fvdl NFSERR_INVAL,
261 1.25 fvdl NFSERR_NOSPC,
262 1.25 fvdl NFSERR_ROFS,
263 1.25 fvdl NFSERR_DQUOT,
264 1.25 fvdl NFSERR_STALE,
265 1.25 fvdl NFSERR_BADHANDLE,
266 1.25 fvdl NFSERR_NOT_SYNC,
267 1.25 fvdl NFSERR_SERVERFAULT,
268 1.25 fvdl 0,
269 1.25 fvdl };
270 1.25 fvdl
271 1.90 jdolecek static const short nfsv3err_lookup[] = {
272 1.25 fvdl NFSERR_IO,
273 1.25 fvdl NFSERR_NOENT,
274 1.25 fvdl NFSERR_IO,
275 1.25 fvdl NFSERR_ACCES,
276 1.25 fvdl NFSERR_NOTDIR,
277 1.25 fvdl NFSERR_NAMETOL,
278 1.25 fvdl NFSERR_STALE,
279 1.25 fvdl NFSERR_BADHANDLE,
280 1.25 fvdl NFSERR_SERVERFAULT,
281 1.25 fvdl 0,
282 1.25 fvdl };
283 1.25 fvdl
284 1.90 jdolecek static const short nfsv3err_access[] = {
285 1.25 fvdl NFSERR_IO,
286 1.25 fvdl NFSERR_IO,
287 1.25 fvdl NFSERR_STALE,
288 1.25 fvdl NFSERR_BADHANDLE,
289 1.25 fvdl NFSERR_SERVERFAULT,
290 1.25 fvdl 0,
291 1.25 fvdl };
292 1.25 fvdl
293 1.90 jdolecek static const short nfsv3err_readlink[] = {
294 1.25 fvdl NFSERR_IO,
295 1.25 fvdl NFSERR_IO,
296 1.25 fvdl NFSERR_ACCES,
297 1.25 fvdl NFSERR_INVAL,
298 1.25 fvdl NFSERR_STALE,
299 1.25 fvdl NFSERR_BADHANDLE,
300 1.25 fvdl NFSERR_NOTSUPP,
301 1.25 fvdl NFSERR_SERVERFAULT,
302 1.25 fvdl 0,
303 1.25 fvdl };
304 1.25 fvdl
305 1.90 jdolecek static const short nfsv3err_read[] = {
306 1.25 fvdl NFSERR_IO,
307 1.25 fvdl NFSERR_IO,
308 1.25 fvdl NFSERR_NXIO,
309 1.25 fvdl NFSERR_ACCES,
310 1.25 fvdl NFSERR_INVAL,
311 1.25 fvdl NFSERR_STALE,
312 1.25 fvdl NFSERR_BADHANDLE,
313 1.25 fvdl NFSERR_SERVERFAULT,
314 1.67 fvdl NFSERR_JUKEBOX,
315 1.25 fvdl 0,
316 1.25 fvdl };
317 1.25 fvdl
318 1.90 jdolecek static const short nfsv3err_write[] = {
319 1.25 fvdl NFSERR_IO,
320 1.25 fvdl NFSERR_IO,
321 1.25 fvdl NFSERR_ACCES,
322 1.25 fvdl NFSERR_INVAL,
323 1.25 fvdl NFSERR_FBIG,
324 1.25 fvdl NFSERR_NOSPC,
325 1.25 fvdl NFSERR_ROFS,
326 1.25 fvdl NFSERR_DQUOT,
327 1.25 fvdl NFSERR_STALE,
328 1.25 fvdl NFSERR_BADHANDLE,
329 1.25 fvdl NFSERR_SERVERFAULT,
330 1.68 fvdl NFSERR_JUKEBOX,
331 1.25 fvdl 0,
332 1.25 fvdl };
333 1.25 fvdl
334 1.90 jdolecek static const short nfsv3err_create[] = {
335 1.25 fvdl NFSERR_IO,
336 1.25 fvdl NFSERR_IO,
337 1.25 fvdl NFSERR_ACCES,
338 1.25 fvdl NFSERR_EXIST,
339 1.25 fvdl NFSERR_NOTDIR,
340 1.25 fvdl NFSERR_NOSPC,
341 1.25 fvdl NFSERR_ROFS,
342 1.25 fvdl NFSERR_NAMETOL,
343 1.25 fvdl NFSERR_DQUOT,
344 1.25 fvdl NFSERR_STALE,
345 1.25 fvdl NFSERR_BADHANDLE,
346 1.25 fvdl NFSERR_NOTSUPP,
347 1.25 fvdl NFSERR_SERVERFAULT,
348 1.25 fvdl 0,
349 1.25 fvdl };
350 1.25 fvdl
351 1.90 jdolecek static const short nfsv3err_mkdir[] = {
352 1.25 fvdl NFSERR_IO,
353 1.25 fvdl NFSERR_IO,
354 1.25 fvdl NFSERR_ACCES,
355 1.25 fvdl NFSERR_EXIST,
356 1.25 fvdl NFSERR_NOTDIR,
357 1.25 fvdl NFSERR_NOSPC,
358 1.25 fvdl NFSERR_ROFS,
359 1.25 fvdl NFSERR_NAMETOL,
360 1.25 fvdl NFSERR_DQUOT,
361 1.25 fvdl NFSERR_STALE,
362 1.25 fvdl NFSERR_BADHANDLE,
363 1.25 fvdl NFSERR_NOTSUPP,
364 1.25 fvdl NFSERR_SERVERFAULT,
365 1.25 fvdl 0,
366 1.25 fvdl };
367 1.25 fvdl
368 1.90 jdolecek static const short nfsv3err_symlink[] = {
369 1.25 fvdl NFSERR_IO,
370 1.25 fvdl NFSERR_IO,
371 1.25 fvdl NFSERR_ACCES,
372 1.25 fvdl NFSERR_EXIST,
373 1.25 fvdl NFSERR_NOTDIR,
374 1.25 fvdl NFSERR_NOSPC,
375 1.25 fvdl NFSERR_ROFS,
376 1.25 fvdl NFSERR_NAMETOL,
377 1.25 fvdl NFSERR_DQUOT,
378 1.25 fvdl NFSERR_STALE,
379 1.25 fvdl NFSERR_BADHANDLE,
380 1.25 fvdl NFSERR_NOTSUPP,
381 1.25 fvdl NFSERR_SERVERFAULT,
382 1.25 fvdl 0,
383 1.25 fvdl };
384 1.25 fvdl
385 1.90 jdolecek static const short nfsv3err_mknod[] = {
386 1.25 fvdl NFSERR_IO,
387 1.25 fvdl NFSERR_IO,
388 1.25 fvdl NFSERR_ACCES,
389 1.25 fvdl NFSERR_EXIST,
390 1.25 fvdl NFSERR_NOTDIR,
391 1.25 fvdl NFSERR_NOSPC,
392 1.25 fvdl NFSERR_ROFS,
393 1.25 fvdl NFSERR_NAMETOL,
394 1.25 fvdl NFSERR_DQUOT,
395 1.25 fvdl NFSERR_STALE,
396 1.25 fvdl NFSERR_BADHANDLE,
397 1.25 fvdl NFSERR_NOTSUPP,
398 1.25 fvdl NFSERR_SERVERFAULT,
399 1.25 fvdl NFSERR_BADTYPE,
400 1.25 fvdl 0,
401 1.25 fvdl };
402 1.25 fvdl
403 1.90 jdolecek static const short nfsv3err_remove[] = {
404 1.25 fvdl NFSERR_IO,
405 1.25 fvdl NFSERR_NOENT,
406 1.25 fvdl NFSERR_IO,
407 1.25 fvdl NFSERR_ACCES,
408 1.25 fvdl NFSERR_NOTDIR,
409 1.25 fvdl NFSERR_ROFS,
410 1.25 fvdl NFSERR_NAMETOL,
411 1.25 fvdl NFSERR_STALE,
412 1.25 fvdl NFSERR_BADHANDLE,
413 1.25 fvdl NFSERR_SERVERFAULT,
414 1.25 fvdl 0,
415 1.25 fvdl };
416 1.25 fvdl
417 1.90 jdolecek static const short nfsv3err_rmdir[] = {
418 1.25 fvdl NFSERR_IO,
419 1.25 fvdl NFSERR_NOENT,
420 1.25 fvdl NFSERR_IO,
421 1.25 fvdl NFSERR_ACCES,
422 1.25 fvdl NFSERR_EXIST,
423 1.25 fvdl NFSERR_NOTDIR,
424 1.25 fvdl NFSERR_INVAL,
425 1.25 fvdl NFSERR_ROFS,
426 1.25 fvdl NFSERR_NAMETOL,
427 1.25 fvdl NFSERR_NOTEMPTY,
428 1.25 fvdl NFSERR_STALE,
429 1.25 fvdl NFSERR_BADHANDLE,
430 1.25 fvdl NFSERR_NOTSUPP,
431 1.25 fvdl NFSERR_SERVERFAULT,
432 1.25 fvdl 0,
433 1.25 fvdl };
434 1.25 fvdl
435 1.90 jdolecek static const short nfsv3err_rename[] = {
436 1.25 fvdl NFSERR_IO,
437 1.25 fvdl NFSERR_NOENT,
438 1.25 fvdl NFSERR_IO,
439 1.25 fvdl NFSERR_ACCES,
440 1.25 fvdl NFSERR_EXIST,
441 1.25 fvdl NFSERR_XDEV,
442 1.25 fvdl NFSERR_NOTDIR,
443 1.25 fvdl NFSERR_ISDIR,
444 1.25 fvdl NFSERR_INVAL,
445 1.25 fvdl NFSERR_NOSPC,
446 1.25 fvdl NFSERR_ROFS,
447 1.25 fvdl NFSERR_MLINK,
448 1.25 fvdl NFSERR_NAMETOL,
449 1.25 fvdl NFSERR_NOTEMPTY,
450 1.25 fvdl NFSERR_DQUOT,
451 1.25 fvdl NFSERR_STALE,
452 1.25 fvdl NFSERR_BADHANDLE,
453 1.25 fvdl NFSERR_NOTSUPP,
454 1.25 fvdl NFSERR_SERVERFAULT,
455 1.25 fvdl 0,
456 1.25 fvdl };
457 1.25 fvdl
458 1.90 jdolecek static const short nfsv3err_link[] = {
459 1.25 fvdl NFSERR_IO,
460 1.25 fvdl NFSERR_IO,
461 1.25 fvdl NFSERR_ACCES,
462 1.25 fvdl NFSERR_EXIST,
463 1.25 fvdl NFSERR_XDEV,
464 1.25 fvdl NFSERR_NOTDIR,
465 1.25 fvdl NFSERR_INVAL,
466 1.25 fvdl NFSERR_NOSPC,
467 1.25 fvdl NFSERR_ROFS,
468 1.25 fvdl NFSERR_MLINK,
469 1.25 fvdl NFSERR_NAMETOL,
470 1.25 fvdl NFSERR_DQUOT,
471 1.25 fvdl NFSERR_STALE,
472 1.25 fvdl NFSERR_BADHANDLE,
473 1.25 fvdl NFSERR_NOTSUPP,
474 1.25 fvdl NFSERR_SERVERFAULT,
475 1.25 fvdl 0,
476 1.25 fvdl };
477 1.25 fvdl
478 1.90 jdolecek static const short nfsv3err_readdir[] = {
479 1.25 fvdl NFSERR_IO,
480 1.25 fvdl NFSERR_IO,
481 1.25 fvdl NFSERR_ACCES,
482 1.25 fvdl NFSERR_NOTDIR,
483 1.25 fvdl NFSERR_STALE,
484 1.25 fvdl NFSERR_BADHANDLE,
485 1.25 fvdl NFSERR_BAD_COOKIE,
486 1.25 fvdl NFSERR_TOOSMALL,
487 1.25 fvdl NFSERR_SERVERFAULT,
488 1.25 fvdl 0,
489 1.25 fvdl };
490 1.25 fvdl
491 1.90 jdolecek static const short nfsv3err_readdirplus[] = {
492 1.25 fvdl NFSERR_IO,
493 1.25 fvdl NFSERR_IO,
494 1.25 fvdl NFSERR_ACCES,
495 1.25 fvdl NFSERR_NOTDIR,
496 1.25 fvdl NFSERR_STALE,
497 1.25 fvdl NFSERR_BADHANDLE,
498 1.25 fvdl NFSERR_BAD_COOKIE,
499 1.25 fvdl NFSERR_NOTSUPP,
500 1.25 fvdl NFSERR_TOOSMALL,
501 1.25 fvdl NFSERR_SERVERFAULT,
502 1.25 fvdl 0,
503 1.25 fvdl };
504 1.25 fvdl
505 1.90 jdolecek static const short nfsv3err_fsstat[] = {
506 1.25 fvdl NFSERR_IO,
507 1.25 fvdl NFSERR_IO,
508 1.25 fvdl NFSERR_STALE,
509 1.25 fvdl NFSERR_BADHANDLE,
510 1.25 fvdl NFSERR_SERVERFAULT,
511 1.25 fvdl 0,
512 1.25 fvdl };
513 1.25 fvdl
514 1.90 jdolecek static const short nfsv3err_fsinfo[] = {
515 1.25 fvdl NFSERR_STALE,
516 1.25 fvdl NFSERR_STALE,
517 1.25 fvdl NFSERR_BADHANDLE,
518 1.25 fvdl NFSERR_SERVERFAULT,
519 1.25 fvdl 0,
520 1.25 fvdl };
521 1.25 fvdl
522 1.90 jdolecek static const short nfsv3err_pathconf[] = {
523 1.25 fvdl NFSERR_STALE,
524 1.25 fvdl NFSERR_STALE,
525 1.25 fvdl NFSERR_BADHANDLE,
526 1.25 fvdl NFSERR_SERVERFAULT,
527 1.25 fvdl 0,
528 1.25 fvdl };
529 1.25 fvdl
530 1.90 jdolecek static const short nfsv3err_commit[] = {
531 1.25 fvdl NFSERR_IO,
532 1.25 fvdl NFSERR_IO,
533 1.25 fvdl NFSERR_STALE,
534 1.25 fvdl NFSERR_BADHANDLE,
535 1.25 fvdl NFSERR_SERVERFAULT,
536 1.25 fvdl 0,
537 1.25 fvdl };
538 1.25 fvdl
539 1.90 jdolecek static const short * const nfsrv_v3errmap[] = {
540 1.25 fvdl nfsv3err_null,
541 1.25 fvdl nfsv3err_getattr,
542 1.25 fvdl nfsv3err_setattr,
543 1.25 fvdl nfsv3err_lookup,
544 1.25 fvdl nfsv3err_access,
545 1.25 fvdl nfsv3err_readlink,
546 1.25 fvdl nfsv3err_read,
547 1.25 fvdl nfsv3err_write,
548 1.25 fvdl nfsv3err_create,
549 1.25 fvdl nfsv3err_mkdir,
550 1.25 fvdl nfsv3err_symlink,
551 1.25 fvdl nfsv3err_mknod,
552 1.25 fvdl nfsv3err_remove,
553 1.25 fvdl nfsv3err_rmdir,
554 1.25 fvdl nfsv3err_rename,
555 1.25 fvdl nfsv3err_link,
556 1.25 fvdl nfsv3err_readdir,
557 1.25 fvdl nfsv3err_readdirplus,
558 1.25 fvdl nfsv3err_fsstat,
559 1.25 fvdl nfsv3err_fsinfo,
560 1.25 fvdl nfsv3err_pathconf,
561 1.25 fvdl nfsv3err_commit,
562 1.25 fvdl };
563 1.25 fvdl
564 1.12 mycroft extern struct nfsrtt nfsrtt;
565 1.1 cgd
566 1.46 fvdl u_long nfsdirhashmask;
567 1.18 mycroft
568 1.213 dsl int nfs_webnamei(struct nameidata *, struct vnode *, struct proc *);
569 1.43 fvdl
570 1.1 cgd /*
571 1.1 cgd * Create the header for an rpc request packet
572 1.1 cgd * The hsiz is the size of the rest of the nfs request header.
573 1.1 cgd * (just used to decide if a cluster is a good idea)
574 1.1 cgd */
575 1.12 mycroft struct mbuf *
576 1.183 christos nfsm_reqh(struct nfsnode *np, u_long procid, int hsiz, char **bposp)
577 1.12 mycroft {
578 1.75 augustss struct mbuf *mb;
579 1.183 christos char *bpos;
580 1.12 mycroft
581 1.109 matt mb = m_get(M_WAIT, MT_DATA);
582 1.109 matt MCLAIM(mb, &nfs_mowner);
583 1.12 mycroft if (hsiz >= MINCLSIZE)
584 1.109 matt m_clget(mb, M_WAIT);
585 1.12 mycroft mb->m_len = 0;
586 1.183 christos bpos = mtod(mb, void *);
587 1.148 perry
588 1.12 mycroft /* Finally, return values */
589 1.12 mycroft *bposp = bpos;
590 1.12 mycroft return (mb);
591 1.12 mycroft }
592 1.12 mycroft
593 1.12 mycroft /*
594 1.12 mycroft * Build the RPC header and fill in the authorization info.
595 1.12 mycroft * The authorization string argument is only used when the credentials
596 1.12 mycroft * come from outside of the kernel.
597 1.12 mycroft * Returns the head of the mbuf list.
598 1.12 mycroft */
599 1.12 mycroft struct mbuf *
600 1.216 cegger nfsm_rpchead(kauth_cred_t cr, int nmflag, int procid,
601 1.216 cegger int auth_type, int auth_len, char *auth_str, int verf_len,
602 1.216 cegger char *verf_str, struct mbuf *mrest, int mrest_len,
603 1.216 cegger struct mbuf **mbp, uint32_t *xidp)
604 1.1 cgd {
605 1.75 augustss struct mbuf *mb;
606 1.75 augustss u_int32_t *tl;
607 1.183 christos char *bpos;
608 1.75 augustss int i;
609 1.109 matt struct mbuf *mreq;
610 1.12 mycroft int siz, grpsiz, authsiz;
611 1.1 cgd
612 1.12 mycroft authsiz = nfsm_rndup(auth_len);
613 1.109 matt mb = m_gethdr(M_WAIT, MT_DATA);
614 1.109 matt MCLAIM(mb, &nfs_mowner);
615 1.25 fvdl if ((authsiz + 10 * NFSX_UNSIGNED) >= MINCLSIZE) {
616 1.109 matt m_clget(mb, M_WAIT);
617 1.25 fvdl } else if ((authsiz + 10 * NFSX_UNSIGNED) < MHLEN) {
618 1.235 maxv m_align(mb, authsiz + 10 * NFSX_UNSIGNED);
619 1.12 mycroft } else {
620 1.235 maxv m_align(mb, 8 * NFSX_UNSIGNED);
621 1.1 cgd }
622 1.12 mycroft mb->m_len = 0;
623 1.12 mycroft mreq = mb;
624 1.183 christos bpos = mtod(mb, void *);
625 1.12 mycroft
626 1.12 mycroft /*
627 1.12 mycroft * First the RPC header.
628 1.12 mycroft */
629 1.25 fvdl nfsm_build(tl, u_int32_t *, 8 * NFSX_UNSIGNED);
630 1.30 fvdl
631 1.126 yamt *tl++ = *xidp = nfs_getxid();
632 1.1 cgd *tl++ = rpc_call;
633 1.1 cgd *tl++ = rpc_vers;
634 1.179 yamt *tl++ = txdr_unsigned(NFS_PROG);
635 1.179 yamt if (nmflag & NFSMNT_NFSV3)
636 1.179 yamt *tl++ = txdr_unsigned(NFS_VER3);
637 1.179 yamt else
638 1.179 yamt *tl++ = txdr_unsigned(NFS_VER2);
639 1.25 fvdl if (nmflag & NFSMNT_NFSV3)
640 1.25 fvdl *tl++ = txdr_unsigned(procid);
641 1.25 fvdl else
642 1.25 fvdl *tl++ = txdr_unsigned(nfsv2_procid[procid]);
643 1.12 mycroft
644 1.12 mycroft /*
645 1.12 mycroft * And then the authorization cred.
646 1.12 mycroft */
647 1.12 mycroft *tl++ = txdr_unsigned(auth_type);
648 1.12 mycroft *tl = txdr_unsigned(authsiz);
649 1.12 mycroft switch (auth_type) {
650 1.12 mycroft case RPCAUTH_UNIX:
651 1.22 cgd nfsm_build(tl, u_int32_t *, auth_len);
652 1.12 mycroft *tl++ = 0; /* stamp ?? */
653 1.12 mycroft *tl++ = 0; /* NULL hostname */
654 1.162 elad *tl++ = txdr_unsigned(kauth_cred_geteuid(cr));
655 1.162 elad *tl++ = txdr_unsigned(kauth_cred_getegid(cr));
656 1.12 mycroft grpsiz = (auth_len >> 2) - 5;
657 1.12 mycroft *tl++ = txdr_unsigned(grpsiz);
658 1.20 mycroft for (i = 0; i < grpsiz; i++)
659 1.162 elad *tl++ = txdr_unsigned(kauth_cred_group(cr, i)); /* XXX elad review */
660 1.12 mycroft break;
661 1.25 fvdl case RPCAUTH_KERB4:
662 1.12 mycroft siz = auth_len;
663 1.12 mycroft while (siz > 0) {
664 1.12 mycroft if (M_TRAILINGSPACE(mb) == 0) {
665 1.109 matt struct mbuf *mb2;
666 1.109 matt mb2 = m_get(M_WAIT, MT_DATA);
667 1.109 matt MCLAIM(mb2, &nfs_mowner);
668 1.12 mycroft if (siz >= MINCLSIZE)
669 1.109 matt m_clget(mb2, M_WAIT);
670 1.12 mycroft mb->m_next = mb2;
671 1.12 mycroft mb = mb2;
672 1.12 mycroft mb->m_len = 0;
673 1.183 christos bpos = mtod(mb, void *);
674 1.12 mycroft }
675 1.233 riastrad i = uimin(siz, M_TRAILINGSPACE(mb));
676 1.63 perry memcpy(bpos, auth_str, i);
677 1.12 mycroft mb->m_len += i;
678 1.12 mycroft auth_str += i;
679 1.12 mycroft bpos += i;
680 1.12 mycroft siz -= i;
681 1.12 mycroft }
682 1.12 mycroft if ((siz = (nfsm_rndup(auth_len) - auth_len)) > 0) {
683 1.12 mycroft for (i = 0; i < siz; i++)
684 1.12 mycroft *bpos++ = '\0';
685 1.12 mycroft mb->m_len += siz;
686 1.12 mycroft }
687 1.12 mycroft break;
688 1.12 mycroft };
689 1.25 fvdl
690 1.25 fvdl /*
691 1.25 fvdl * And the verifier...
692 1.25 fvdl */
693 1.25 fvdl nfsm_build(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
694 1.25 fvdl if (verf_str) {
695 1.25 fvdl *tl++ = txdr_unsigned(RPCAUTH_KERB4);
696 1.25 fvdl *tl = txdr_unsigned(verf_len);
697 1.25 fvdl siz = verf_len;
698 1.25 fvdl while (siz > 0) {
699 1.25 fvdl if (M_TRAILINGSPACE(mb) == 0) {
700 1.109 matt struct mbuf *mb2;
701 1.109 matt mb2 = m_get(M_WAIT, MT_DATA);
702 1.109 matt MCLAIM(mb2, &nfs_mowner);
703 1.25 fvdl if (siz >= MINCLSIZE)
704 1.109 matt m_clget(mb2, M_WAIT);
705 1.25 fvdl mb->m_next = mb2;
706 1.25 fvdl mb = mb2;
707 1.25 fvdl mb->m_len = 0;
708 1.183 christos bpos = mtod(mb, void *);
709 1.25 fvdl }
710 1.233 riastrad i = uimin(siz, M_TRAILINGSPACE(mb));
711 1.63 perry memcpy(bpos, verf_str, i);
712 1.25 fvdl mb->m_len += i;
713 1.25 fvdl verf_str += i;
714 1.25 fvdl bpos += i;
715 1.25 fvdl siz -= i;
716 1.25 fvdl }
717 1.25 fvdl if ((siz = (nfsm_rndup(verf_len) - verf_len)) > 0) {
718 1.25 fvdl for (i = 0; i < siz; i++)
719 1.25 fvdl *bpos++ = '\0';
720 1.25 fvdl mb->m_len += siz;
721 1.25 fvdl }
722 1.25 fvdl } else {
723 1.25 fvdl *tl++ = txdr_unsigned(RPCAUTH_NULL);
724 1.25 fvdl *tl = 0;
725 1.25 fvdl }
726 1.12 mycroft mb->m_next = mrest;
727 1.25 fvdl mreq->m_pkthdr.len = authsiz + 10 * NFSX_UNSIGNED + mrest_len;
728 1.228 ozaki m_reset_rcvif(mreq);
729 1.12 mycroft *mbp = mb;
730 1.1 cgd return (mreq);
731 1.1 cgd }
732 1.1 cgd
733 1.1 cgd /*
734 1.1 cgd * copies mbuf chain to the uio scatter/gather list
735 1.1 cgd */
736 1.24 christos int
737 1.214 dsl nfsm_mbuftouio(struct mbuf **mrep, struct uio *uiop, int siz, char **dpos)
738 1.1 cgd {
739 1.75 augustss char *mbufcp, *uiocp;
740 1.75 augustss int xfer, left, len;
741 1.75 augustss struct mbuf *mp;
742 1.1 cgd long uiosiz, rem;
743 1.1 cgd int error = 0;
744 1.1 cgd
745 1.1 cgd mp = *mrep;
746 1.1 cgd mbufcp = *dpos;
747 1.183 christos len = mtod(mp, char *) + mp->m_len - mbufcp;
748 1.1 cgd rem = nfsm_rndup(siz)-siz;
749 1.1 cgd while (siz > 0) {
750 1.1 cgd if (uiop->uio_iovcnt <= 0 || uiop->uio_iov == NULL)
751 1.1 cgd return (EFBIG);
752 1.1 cgd left = uiop->uio_iov->iov_len;
753 1.1 cgd uiocp = uiop->uio_iov->iov_base;
754 1.1 cgd if (left > siz)
755 1.1 cgd left = siz;
756 1.1 cgd uiosiz = left;
757 1.1 cgd while (left > 0) {
758 1.1 cgd while (len == 0) {
759 1.1 cgd mp = mp->m_next;
760 1.1 cgd if (mp == NULL)
761 1.1 cgd return (EBADRPC);
762 1.183 christos mbufcp = mtod(mp, void *);
763 1.1 cgd len = mp->m_len;
764 1.1 cgd }
765 1.1 cgd xfer = (left > len) ? len : left;
766 1.158 yamt error = copyout_vmspace(uiop->uio_vmspace, mbufcp,
767 1.158 yamt uiocp, xfer);
768 1.158 yamt if (error) {
769 1.158 yamt return error;
770 1.158 yamt }
771 1.1 cgd left -= xfer;
772 1.1 cgd len -= xfer;
773 1.1 cgd mbufcp += xfer;
774 1.1 cgd uiocp += xfer;
775 1.1 cgd uiop->uio_offset += xfer;
776 1.1 cgd uiop->uio_resid -= xfer;
777 1.1 cgd }
778 1.1 cgd if (uiop->uio_iov->iov_len <= siz) {
779 1.1 cgd uiop->uio_iovcnt--;
780 1.1 cgd uiop->uio_iov++;
781 1.1 cgd } else {
782 1.95 lukem uiop->uio_iov->iov_base =
783 1.183 christos (char *)uiop->uio_iov->iov_base + uiosiz;
784 1.1 cgd uiop->uio_iov->iov_len -= uiosiz;
785 1.1 cgd }
786 1.1 cgd siz -= uiosiz;
787 1.1 cgd }
788 1.1 cgd *dpos = mbufcp;
789 1.1 cgd *mrep = mp;
790 1.1 cgd if (rem > 0) {
791 1.1 cgd if (len < rem)
792 1.1 cgd error = nfs_adv(mrep, dpos, rem, len);
793 1.1 cgd else
794 1.1 cgd *dpos += rem;
795 1.1 cgd }
796 1.1 cgd return (error);
797 1.1 cgd }
798 1.1 cgd
799 1.1 cgd /*
800 1.29 fvdl * copies a uio scatter/gather list to an mbuf chain.
801 1.29 fvdl * NOTE: can ony handle iovcnt == 1
802 1.1 cgd */
803 1.24 christos int
804 1.214 dsl nfsm_uiotombuf(struct uio *uiop, struct mbuf **mq, int siz, char **bpos)
805 1.1 cgd {
806 1.75 augustss char *uiocp;
807 1.75 augustss struct mbuf *mp, *mp2;
808 1.75 augustss int xfer, left, mlen;
809 1.1 cgd int uiosiz, clflg, rem;
810 1.1 cgd char *cp;
811 1.158 yamt int error;
812 1.1 cgd
813 1.29 fvdl #ifdef DIAGNOSTIC
814 1.29 fvdl if (uiop->uio_iovcnt != 1)
815 1.29 fvdl panic("nfsm_uiotombuf: iovcnt != 1");
816 1.29 fvdl #endif
817 1.29 fvdl
818 1.1 cgd if (siz > MLEN) /* or should it >= MCLBYTES ?? */
819 1.1 cgd clflg = 1;
820 1.1 cgd else
821 1.1 cgd clflg = 0;
822 1.1 cgd rem = nfsm_rndup(siz)-siz;
823 1.12 mycroft mp = mp2 = *mq;
824 1.1 cgd while (siz > 0) {
825 1.1 cgd left = uiop->uio_iov->iov_len;
826 1.1 cgd uiocp = uiop->uio_iov->iov_base;
827 1.1 cgd if (left > siz)
828 1.1 cgd left = siz;
829 1.1 cgd uiosiz = left;
830 1.1 cgd while (left > 0) {
831 1.12 mycroft mlen = M_TRAILINGSPACE(mp);
832 1.12 mycroft if (mlen == 0) {
833 1.109 matt mp = m_get(M_WAIT, MT_DATA);
834 1.109 matt MCLAIM(mp, &nfs_mowner);
835 1.12 mycroft if (clflg)
836 1.109 matt m_clget(mp, M_WAIT);
837 1.12 mycroft mp->m_len = 0;
838 1.12 mycroft mp2->m_next = mp;
839 1.12 mycroft mp2 = mp;
840 1.12 mycroft mlen = M_TRAILINGSPACE(mp);
841 1.12 mycroft }
842 1.12 mycroft xfer = (left > mlen) ? mlen : left;
843 1.183 christos cp = mtod(mp, char *) + mp->m_len;
844 1.158 yamt error = copyin_vmspace(uiop->uio_vmspace, uiocp, cp,
845 1.158 yamt xfer);
846 1.158 yamt if (error) {
847 1.158 yamt /* XXX */
848 1.158 yamt }
849 1.12 mycroft mp->m_len += xfer;
850 1.1 cgd left -= xfer;
851 1.1 cgd uiocp += xfer;
852 1.1 cgd uiop->uio_offset += xfer;
853 1.1 cgd uiop->uio_resid -= xfer;
854 1.1 cgd }
855 1.183 christos uiop->uio_iov->iov_base = (char *)uiop->uio_iov->iov_base +
856 1.95 lukem uiosiz;
857 1.29 fvdl uiop->uio_iov->iov_len -= uiosiz;
858 1.1 cgd siz -= uiosiz;
859 1.1 cgd }
860 1.1 cgd if (rem > 0) {
861 1.12 mycroft if (rem > M_TRAILINGSPACE(mp)) {
862 1.109 matt mp = m_get(M_WAIT, MT_DATA);
863 1.109 matt MCLAIM(mp, &nfs_mowner);
864 1.1 cgd mp->m_len = 0;
865 1.1 cgd mp2->m_next = mp;
866 1.1 cgd }
867 1.183 christos cp = mtod(mp, char *) + mp->m_len;
868 1.1 cgd for (left = 0; left < rem; left++)
869 1.1 cgd *cp++ = '\0';
870 1.1 cgd mp->m_len += rem;
871 1.1 cgd *bpos = cp;
872 1.1 cgd } else
873 1.183 christos *bpos = mtod(mp, char *) + mp->m_len;
874 1.1 cgd *mq = mp;
875 1.1 cgd return (0);
876 1.1 cgd }
877 1.1 cgd
878 1.1 cgd /*
879 1.39 fvdl * Get at least "siz" bytes of correctly aligned data.
880 1.39 fvdl * When called the mbuf pointers are not necessarily correct,
881 1.39 fvdl * dsosp points to what ought to be in m_data and left contains
882 1.148 perry * what ought to be in m_len.
883 1.12 mycroft * This is used by the macros nfsm_dissect and nfsm_dissecton for tough
884 1.1 cgd * cases. (The macros use the vars. dpos and dpos2)
885 1.1 cgd */
886 1.24 christos int
887 1.214 dsl nfsm_disct(struct mbuf **mdp, char **dposp, int siz, int left, char **cp2)
888 1.1 cgd {
889 1.75 augustss struct mbuf *m1, *m2;
890 1.39 fvdl struct mbuf *havebuf = NULL;
891 1.183 christos char *src = *dposp;
892 1.183 christos char *dst;
893 1.39 fvdl int len;
894 1.39 fvdl
895 1.39 fvdl #ifdef DEBUG
896 1.39 fvdl if (left < 0)
897 1.148 perry panic("nfsm_disct: left < 0");
898 1.39 fvdl #endif
899 1.39 fvdl m1 = *mdp;
900 1.39 fvdl /*
901 1.39 fvdl * Skip through the mbuf chain looking for an mbuf with
902 1.39 fvdl * some data. If the first mbuf found has enough data
903 1.39 fvdl * and it is correctly aligned return it.
904 1.39 fvdl */
905 1.1 cgd while (left == 0) {
906 1.39 fvdl havebuf = m1;
907 1.39 fvdl *mdp = m1 = m1->m_next;
908 1.39 fvdl if (m1 == NULL)
909 1.1 cgd return (EBADRPC);
910 1.183 christos src = mtod(m1, void *);
911 1.39 fvdl left = m1->m_len;
912 1.39 fvdl /*
913 1.39 fvdl * If we start a new mbuf and it is big enough
914 1.39 fvdl * and correctly aligned just return it, don't
915 1.39 fvdl * do any pull up.
916 1.39 fvdl */
917 1.39 fvdl if (left >= siz && nfsm_aligned(src)) {
918 1.39 fvdl *cp2 = src;
919 1.39 fvdl *dposp = src + siz;
920 1.39 fvdl return (0);
921 1.39 fvdl }
922 1.1 cgd }
923 1.201 yamt if ((m1->m_flags & M_EXT) != 0) {
924 1.201 yamt if (havebuf && M_TRAILINGSPACE(havebuf) >= siz &&
925 1.201 yamt nfsm_aligned(mtod(havebuf, char *) + havebuf->m_len)) {
926 1.201 yamt /*
927 1.201 yamt * If the first mbuf with data has external data
928 1.201 yamt * and there is a previous mbuf with some trailing
929 1.201 yamt * space, use it to move the data into.
930 1.39 fvdl */
931 1.39 fvdl m2 = m1;
932 1.39 fvdl *mdp = m1 = havebuf;
933 1.201 yamt *cp2 = mtod(m1, char *) + m1->m_len;
934 1.201 yamt } else if (havebuf) {
935 1.39 fvdl /*
936 1.39 fvdl * If the first mbuf has a external data
937 1.39 fvdl * and there is no previous empty mbuf
938 1.39 fvdl * allocate a new mbuf and move the external
939 1.148 perry * data to the new mbuf. Also make the first
940 1.39 fvdl * mbuf look empty.
941 1.39 fvdl */
942 1.201 yamt m2 = m1;
943 1.201 yamt *mdp = m1 = m_get(M_WAIT, MT_DATA);
944 1.201 yamt MCLAIM(m1, m2->m_owner);
945 1.201 yamt if ((m2->m_flags & M_PKTHDR) != 0) {
946 1.234 maxv m_move_pkthdr(m1, m2);
947 1.201 yamt }
948 1.201 yamt if (havebuf) {
949 1.201 yamt havebuf->m_next = m1;
950 1.201 yamt }
951 1.201 yamt m1->m_next = m2;
952 1.201 yamt MRESETDATA(m1);
953 1.201 yamt m1->m_len = 0;
954 1.39 fvdl m2->m_data = src;
955 1.39 fvdl m2->m_len = left;
956 1.201 yamt *cp2 = mtod(m1, char *);
957 1.201 yamt } else {
958 1.201 yamt struct mbuf **nextp = &m1->m_next;
959 1.201 yamt
960 1.201 yamt m1->m_len -= left;
961 1.201 yamt do {
962 1.201 yamt m2 = m_get(M_WAIT, MT_DATA);
963 1.201 yamt MCLAIM(m2, m1->m_owner);
964 1.201 yamt if (left >= MINCLSIZE) {
965 1.201 yamt MCLGET(m2, M_WAIT);
966 1.201 yamt }
967 1.201 yamt m2->m_next = *nextp;
968 1.201 yamt *nextp = m2;
969 1.201 yamt nextp = &m2->m_next;
970 1.201 yamt len = (m2->m_flags & M_EXT) != 0 ?
971 1.201 yamt MCLBYTES : MLEN;
972 1.201 yamt if (len > left) {
973 1.201 yamt len = left;
974 1.201 yamt }
975 1.201 yamt memcpy(mtod(m2, char *), src, len);
976 1.201 yamt m2->m_len = len;
977 1.201 yamt src += len;
978 1.201 yamt left -= len;
979 1.201 yamt } while (left > 0);
980 1.201 yamt *mdp = m1 = m1->m_next;
981 1.201 yamt m2 = m1->m_next;
982 1.201 yamt *cp2 = mtod(m1, char *);
983 1.1 cgd }
984 1.39 fvdl } else {
985 1.39 fvdl /*
986 1.39 fvdl * If the first mbuf has no external data
987 1.39 fvdl * move the data to the front of the mbuf.
988 1.39 fvdl */
989 1.201 yamt MRESETDATA(m1);
990 1.201 yamt dst = mtod(m1, char *);
991 1.201 yamt if (dst != src) {
992 1.63 perry memmove(dst, src, left);
993 1.201 yamt }
994 1.39 fvdl m1->m_len = left;
995 1.39 fvdl m2 = m1->m_next;
996 1.201 yamt *cp2 = m1->m_data;
997 1.1 cgd }
998 1.201 yamt *dposp = *cp2 + siz;
999 1.39 fvdl /*
1000 1.39 fvdl * Loop through mbufs pulling data up into first mbuf until
1001 1.39 fvdl * the first mbuf is full or there is no more data to
1002 1.39 fvdl * pullup.
1003 1.39 fvdl */
1004 1.201 yamt dst = mtod(m1, char *) + m1->m_len;
1005 1.129 itojun while ((len = M_TRAILINGSPACE(m1)) != 0 && m2) {
1006 1.233 riastrad if ((len = uimin(len, m2->m_len)) != 0) {
1007 1.201 yamt memcpy(dst, mtod(m2, char *), len);
1008 1.201 yamt }
1009 1.39 fvdl m1->m_len += len;
1010 1.39 fvdl dst += len;
1011 1.39 fvdl m2->m_data += len;
1012 1.39 fvdl m2->m_len -= len;
1013 1.39 fvdl m2 = m2->m_next;
1014 1.39 fvdl }
1015 1.39 fvdl if (m1->m_len < siz)
1016 1.39 fvdl return (EBADRPC);
1017 1.1 cgd return (0);
1018 1.1 cgd }
1019 1.1 cgd
1020 1.1 cgd /*
1021 1.1 cgd * Advance the position in the mbuf chain.
1022 1.1 cgd */
1023 1.24 christos int
1024 1.214 dsl nfs_adv(struct mbuf **mdp, char **dposp, int offs, int left)
1025 1.1 cgd {
1026 1.75 augustss struct mbuf *m;
1027 1.75 augustss int s;
1028 1.1 cgd
1029 1.1 cgd m = *mdp;
1030 1.1 cgd s = left;
1031 1.1 cgd while (s < offs) {
1032 1.1 cgd offs -= s;
1033 1.1 cgd m = m->m_next;
1034 1.1 cgd if (m == NULL)
1035 1.1 cgd return (EBADRPC);
1036 1.1 cgd s = m->m_len;
1037 1.1 cgd }
1038 1.1 cgd *mdp = m;
1039 1.183 christos *dposp = mtod(m, char *) + offs;
1040 1.1 cgd return (0);
1041 1.1 cgd }
1042 1.1 cgd
1043 1.1 cgd /*
1044 1.1 cgd * Copy a string into mbufs for the hard cases...
1045 1.1 cgd */
1046 1.24 christos int
1047 1.214 dsl nfsm_strtmbuf(struct mbuf **mb, char **bpos, const char *cp, long siz)
1048 1.1 cgd {
1049 1.75 augustss struct mbuf *m1 = NULL, *m2;
1050 1.1 cgd long left, xfer, len, tlen;
1051 1.22 cgd u_int32_t *tl;
1052 1.1 cgd int putsize;
1053 1.1 cgd
1054 1.1 cgd putsize = 1;
1055 1.1 cgd m2 = *mb;
1056 1.12 mycroft left = M_TRAILINGSPACE(m2);
1057 1.1 cgd if (left > 0) {
1058 1.22 cgd tl = ((u_int32_t *)(*bpos));
1059 1.1 cgd *tl++ = txdr_unsigned(siz);
1060 1.1 cgd putsize = 0;
1061 1.1 cgd left -= NFSX_UNSIGNED;
1062 1.1 cgd m2->m_len += NFSX_UNSIGNED;
1063 1.1 cgd if (left > 0) {
1064 1.183 christos memcpy((void *) tl, cp, left);
1065 1.1 cgd siz -= left;
1066 1.1 cgd cp += left;
1067 1.1 cgd m2->m_len += left;
1068 1.1 cgd left = 0;
1069 1.1 cgd }
1070 1.1 cgd }
1071 1.12 mycroft /* Loop around adding mbufs */
1072 1.1 cgd while (siz > 0) {
1073 1.109 matt m1 = m_get(M_WAIT, MT_DATA);
1074 1.109 matt MCLAIM(m1, &nfs_mowner);
1075 1.1 cgd if (siz > MLEN)
1076 1.109 matt m_clget(m1, M_WAIT);
1077 1.1 cgd m1->m_len = NFSMSIZ(m1);
1078 1.1 cgd m2->m_next = m1;
1079 1.1 cgd m2 = m1;
1080 1.22 cgd tl = mtod(m1, u_int32_t *);
1081 1.1 cgd tlen = 0;
1082 1.1 cgd if (putsize) {
1083 1.1 cgd *tl++ = txdr_unsigned(siz);
1084 1.1 cgd m1->m_len -= NFSX_UNSIGNED;
1085 1.1 cgd tlen = NFSX_UNSIGNED;
1086 1.1 cgd putsize = 0;
1087 1.1 cgd }
1088 1.1 cgd if (siz < m1->m_len) {
1089 1.1 cgd len = nfsm_rndup(siz);
1090 1.1 cgd xfer = siz;
1091 1.1 cgd if (xfer < len)
1092 1.1 cgd *(tl+(xfer>>2)) = 0;
1093 1.1 cgd } else {
1094 1.1 cgd xfer = len = m1->m_len;
1095 1.1 cgd }
1096 1.183 christos memcpy((void *) tl, cp, xfer);
1097 1.1 cgd m1->m_len = len+tlen;
1098 1.1 cgd siz -= xfer;
1099 1.1 cgd cp += xfer;
1100 1.1 cgd }
1101 1.1 cgd *mb = m1;
1102 1.183 christos *bpos = mtod(m1, char *) + m1->m_len;
1103 1.1 cgd return (0);
1104 1.1 cgd }
1105 1.1 cgd
1106 1.49 fvdl /*
1107 1.49 fvdl * Directory caching routines. They work as follows:
1108 1.49 fvdl * - a cache is maintained per VDIR nfsnode.
1109 1.49 fvdl * - for each offset cookie that is exported to userspace, and can
1110 1.49 fvdl * thus be thrown back at us as an offset to VOP_READDIR, store
1111 1.49 fvdl * information in the cache.
1112 1.49 fvdl * - cached are:
1113 1.49 fvdl * - cookie itself
1114 1.49 fvdl * - blocknumber (essentially just a search key in the buffer cache)
1115 1.49 fvdl * - entry number in block.
1116 1.49 fvdl * - offset cookie of block in which this entry is stored
1117 1.49 fvdl * - 32 bit cookie if NFSMNT_XLATECOOKIE is used.
1118 1.49 fvdl * - entries are looked up in a hash table
1119 1.49 fvdl * - also maintained is an LRU list of entries, used to determine
1120 1.49 fvdl * which ones to delete if the cache grows too large.
1121 1.49 fvdl * - if 32 <-> 64 translation mode is requested for a filesystem,
1122 1.49 fvdl * the cache also functions as a translation table
1123 1.49 fvdl * - in the translation case, invalidating the cache does not mean
1124 1.49 fvdl * flushing it, but just marking entries as invalid, except for
1125 1.49 fvdl * the <64bit cookie, 32bitcookie> pair which is still valid, to
1126 1.49 fvdl * still be able to use the cache as a translation table.
1127 1.49 fvdl * - 32 bit cookies are uniquely created by combining the hash table
1128 1.49 fvdl * entry value, and one generation count per hash table entry,
1129 1.49 fvdl * incremented each time an entry is appended to the chain.
1130 1.49 fvdl * - the cache is invalidated each time a direcory is modified
1131 1.49 fvdl * - sanity checks are also done; if an entry in a block turns
1132 1.49 fvdl * out not to have a matching cookie, the cache is invalidated
1133 1.49 fvdl * and a new block starting from the wanted offset is fetched from
1134 1.49 fvdl * the server.
1135 1.49 fvdl * - directory entries as read from the server are extended to contain
1136 1.49 fvdl * the 64bit and, optionally, the 32bit cookies, for sanity checking
1137 1.49 fvdl * the cache and exporting them to userspace through the cookie
1138 1.49 fvdl * argument to VOP_READDIR.
1139 1.49 fvdl */
1140 1.49 fvdl
1141 1.46 fvdl u_long
1142 1.214 dsl nfs_dirhash(off_t off)
1143 1.46 fvdl {
1144 1.46 fvdl int i;
1145 1.46 fvdl char *cp = (char *)&off;
1146 1.46 fvdl u_long sum = 0L;
1147 1.46 fvdl
1148 1.46 fvdl for (i = 0 ; i < sizeof (off); i++)
1149 1.46 fvdl sum += *cp++;
1150 1.46 fvdl
1151 1.46 fvdl return sum;
1152 1.46 fvdl }
1153 1.46 fvdl
1154 1.221 rmind #define _NFSDC_MTX(np) (NFSTOV(np)->v_interlock)
1155 1.195 ad #define NFSDC_LOCK(np) mutex_enter(_NFSDC_MTX(np))
1156 1.195 ad #define NFSDC_UNLOCK(np) mutex_exit(_NFSDC_MTX(np))
1157 1.195 ad #define NFSDC_ASSERT_LOCKED(np) KASSERT(mutex_owned(_NFSDC_MTX(np)))
1158 1.135 yamt
1159 1.49 fvdl void
1160 1.214 dsl nfs_initdircache(struct vnode *vp)
1161 1.49 fvdl {
1162 1.49 fvdl struct nfsnode *np = VTONFS(vp);
1163 1.135 yamt struct nfsdirhashhead *dircache;
1164 1.120 yamt
1165 1.202 ad dircache = hashinit(NFS_DIRHASHSIZ, HASH_LIST, true,
1166 1.202 ad &nfsdirhashmask);
1167 1.49 fvdl
1168 1.135 yamt NFSDC_LOCK(np);
1169 1.135 yamt if (np->n_dircache == NULL) {
1170 1.135 yamt np->n_dircachesize = 0;
1171 1.135 yamt np->n_dircache = dircache;
1172 1.135 yamt dircache = NULL;
1173 1.135 yamt TAILQ_INIT(&np->n_dirchain);
1174 1.135 yamt }
1175 1.135 yamt NFSDC_UNLOCK(np);
1176 1.135 yamt if (dircache)
1177 1.202 ad hashdone(dircache, HASH_LIST, nfsdirhashmask);
1178 1.120 yamt }
1179 1.120 yamt
1180 1.120 yamt void
1181 1.214 dsl nfs_initdirxlatecookie(struct vnode *vp)
1182 1.120 yamt {
1183 1.120 yamt struct nfsnode *np = VTONFS(vp);
1184 1.135 yamt unsigned *dirgens;
1185 1.120 yamt
1186 1.120 yamt KASSERT(VFSTONFS(vp->v_mount)->nm_flag & NFSMNT_XLATECOOKIE);
1187 1.120 yamt
1188 1.196 yamt dirgens = kmem_zalloc(NFS_DIRHASHSIZ * sizeof(unsigned), KM_SLEEP);
1189 1.135 yamt NFSDC_LOCK(np);
1190 1.135 yamt if (np->n_dirgens == NULL) {
1191 1.135 yamt np->n_dirgens = dirgens;
1192 1.135 yamt dirgens = NULL;
1193 1.135 yamt }
1194 1.135 yamt NFSDC_UNLOCK(np);
1195 1.135 yamt if (dirgens)
1196 1.196 yamt kmem_free(dirgens, NFS_DIRHASHSIZ * sizeof(unsigned));
1197 1.135 yamt }
1198 1.135 yamt
1199 1.135 yamt static const struct nfsdircache dzero;
1200 1.135 yamt
1201 1.213 dsl static void nfs_unlinkdircache(struct nfsnode *np, struct nfsdircache *);
1202 1.213 dsl static void nfs_putdircache_unlocked(struct nfsnode *,
1203 1.213 dsl struct nfsdircache *);
1204 1.135 yamt
1205 1.135 yamt static void
1206 1.214 dsl nfs_unlinkdircache(struct nfsnode *np, struct nfsdircache *ndp)
1207 1.135 yamt {
1208 1.135 yamt
1209 1.135 yamt NFSDC_ASSERT_LOCKED(np);
1210 1.135 yamt KASSERT(ndp != &dzero);
1211 1.135 yamt
1212 1.135 yamt if (LIST_NEXT(ndp, dc_hash) == (void *)-1)
1213 1.135 yamt return;
1214 1.135 yamt
1215 1.135 yamt TAILQ_REMOVE(&np->n_dirchain, ndp, dc_chain);
1216 1.135 yamt LIST_REMOVE(ndp, dc_hash);
1217 1.135 yamt LIST_NEXT(ndp, dc_hash) = (void *)-1; /* mark as unlinked */
1218 1.135 yamt
1219 1.135 yamt nfs_putdircache_unlocked(np, ndp);
1220 1.135 yamt }
1221 1.135 yamt
1222 1.135 yamt void
1223 1.214 dsl nfs_putdircache(struct nfsnode *np, struct nfsdircache *ndp)
1224 1.135 yamt {
1225 1.135 yamt int ref;
1226 1.135 yamt
1227 1.135 yamt if (ndp == &dzero)
1228 1.135 yamt return;
1229 1.135 yamt
1230 1.135 yamt KASSERT(ndp->dc_refcnt > 0);
1231 1.135 yamt NFSDC_LOCK(np);
1232 1.135 yamt ref = --ndp->dc_refcnt;
1233 1.135 yamt NFSDC_UNLOCK(np);
1234 1.135 yamt
1235 1.135 yamt if (ref == 0)
1236 1.196 yamt kmem_free(ndp, sizeof(*ndp));
1237 1.49 fvdl }
1238 1.49 fvdl
1239 1.135 yamt static void
1240 1.177 yamt nfs_putdircache_unlocked(struct nfsnode *np, struct nfsdircache *ndp)
1241 1.135 yamt {
1242 1.135 yamt int ref;
1243 1.135 yamt
1244 1.135 yamt NFSDC_ASSERT_LOCKED(np);
1245 1.135 yamt
1246 1.135 yamt if (ndp == &dzero)
1247 1.135 yamt return;
1248 1.135 yamt
1249 1.135 yamt KASSERT(ndp->dc_refcnt > 0);
1250 1.135 yamt ref = --ndp->dc_refcnt;
1251 1.135 yamt if (ref == 0)
1252 1.196 yamt kmem_free(ndp, sizeof(*ndp));
1253 1.135 yamt }
1254 1.46 fvdl
1255 1.46 fvdl struct nfsdircache *
1256 1.214 dsl nfs_searchdircache(struct vnode *vp, off_t off, int do32, int *hashent)
1257 1.49 fvdl {
1258 1.49 fvdl struct nfsdirhashhead *ndhp;
1259 1.49 fvdl struct nfsdircache *ndp = NULL;
1260 1.49 fvdl struct nfsnode *np = VTONFS(vp);
1261 1.49 fvdl unsigned ent;
1262 1.49 fvdl
1263 1.49 fvdl /*
1264 1.49 fvdl * Zero is always a valid cookie.
1265 1.49 fvdl */
1266 1.49 fvdl if (off == 0)
1267 1.149 christos /* XXXUNCONST */
1268 1.149 christos return (struct nfsdircache *)__UNCONST(&dzero);
1269 1.49 fvdl
1270 1.134 yamt if (!np->n_dircache)
1271 1.134 yamt return NULL;
1272 1.134 yamt
1273 1.49 fvdl /*
1274 1.49 fvdl * We use a 32bit cookie as search key, directly reconstruct
1275 1.49 fvdl * the hashentry. Else use the hashfunction.
1276 1.49 fvdl */
1277 1.49 fvdl if (do32) {
1278 1.49 fvdl ent = (u_int32_t)off >> 24;
1279 1.49 fvdl if (ent >= NFS_DIRHASHSIZ)
1280 1.49 fvdl return NULL;
1281 1.49 fvdl ndhp = &np->n_dircache[ent];
1282 1.49 fvdl } else {
1283 1.49 fvdl ndhp = NFSDIRHASH(np, off);
1284 1.49 fvdl }
1285 1.49 fvdl
1286 1.49 fvdl if (hashent)
1287 1.49 fvdl *hashent = (int)(ndhp - np->n_dircache);
1288 1.135 yamt
1289 1.135 yamt NFSDC_LOCK(np);
1290 1.49 fvdl if (do32) {
1291 1.113 yamt LIST_FOREACH(ndp, ndhp, dc_hash) {
1292 1.49 fvdl if (ndp->dc_cookie32 == (u_int32_t)off) {
1293 1.49 fvdl /*
1294 1.49 fvdl * An invalidated entry will become the
1295 1.49 fvdl * start of a new block fetched from
1296 1.49 fvdl * the server.
1297 1.49 fvdl */
1298 1.135 yamt if (ndp->dc_flags & NFSDC_INVALID) {
1299 1.49 fvdl ndp->dc_blkcookie = ndp->dc_cookie;
1300 1.49 fvdl ndp->dc_entry = 0;
1301 1.135 yamt ndp->dc_flags &= ~NFSDC_INVALID;
1302 1.49 fvdl }
1303 1.49 fvdl break;
1304 1.49 fvdl }
1305 1.49 fvdl }
1306 1.49 fvdl } else {
1307 1.113 yamt LIST_FOREACH(ndp, ndhp, dc_hash) {
1308 1.49 fvdl if (ndp->dc_cookie == off)
1309 1.49 fvdl break;
1310 1.113 yamt }
1311 1.49 fvdl }
1312 1.135 yamt if (ndp != NULL)
1313 1.135 yamt ndp->dc_refcnt++;
1314 1.135 yamt NFSDC_UNLOCK(np);
1315 1.49 fvdl return ndp;
1316 1.49 fvdl }
1317 1.49 fvdl
1318 1.49 fvdl
1319 1.49 fvdl struct nfsdircache *
1320 1.171 christos nfs_enterdircache(struct vnode *vp, off_t off, off_t blkoff, int en,
1321 1.177 yamt daddr_t blkno)
1322 1.46 fvdl {
1323 1.46 fvdl struct nfsnode *np = VTONFS(vp);
1324 1.46 fvdl struct nfsdirhashhead *ndhp;
1325 1.135 yamt struct nfsdircache *ndp = NULL;
1326 1.135 yamt struct nfsdircache *newndp = NULL;
1327 1.49 fvdl struct nfsmount *nmp = VFSTONFS(vp->v_mount);
1328 1.161 christos int hashent = 0, gen, overwrite; /* XXX: GCC */
1329 1.46 fvdl
1330 1.135 yamt /*
1331 1.135 yamt * XXX refuse entries for offset 0. amd(8) erroneously sets
1332 1.135 yamt * cookie 0 for the '.' entry, making this necessary. This
1333 1.135 yamt * isn't so bad, as 0 is a special case anyway.
1334 1.135 yamt */
1335 1.135 yamt if (off == 0)
1336 1.149 christos /* XXXUNCONST */
1337 1.149 christos return (struct nfsdircache *)__UNCONST(&dzero);
1338 1.135 yamt
1339 1.49 fvdl if (!np->n_dircache)
1340 1.49 fvdl /*
1341 1.49 fvdl * XXX would like to do this in nfs_nget but vtype
1342 1.49 fvdl * isn't known at that time.
1343 1.49 fvdl */
1344 1.49 fvdl nfs_initdircache(vp);
1345 1.50 fvdl
1346 1.120 yamt if ((nmp->nm_flag & NFSMNT_XLATECOOKIE) && !np->n_dirgens)
1347 1.120 yamt nfs_initdirxlatecookie(vp);
1348 1.120 yamt
1349 1.135 yamt retry:
1350 1.49 fvdl ndp = nfs_searchdircache(vp, off, 0, &hashent);
1351 1.49 fvdl
1352 1.135 yamt NFSDC_LOCK(np);
1353 1.135 yamt if (ndp && (ndp->dc_flags & NFSDC_INVALID) == 0) {
1354 1.49 fvdl /*
1355 1.49 fvdl * Overwriting an old entry. Check if it's the same.
1356 1.49 fvdl * If so, just return. If not, remove the old entry.
1357 1.49 fvdl */
1358 1.49 fvdl if (ndp->dc_blkcookie == blkoff && ndp->dc_entry == en)
1359 1.135 yamt goto done;
1360 1.135 yamt nfs_unlinkdircache(np, ndp);
1361 1.135 yamt nfs_putdircache_unlocked(np, ndp);
1362 1.135 yamt ndp = NULL;
1363 1.46 fvdl }
1364 1.46 fvdl
1365 1.49 fvdl ndhp = &np->n_dircache[hashent];
1366 1.46 fvdl
1367 1.49 fvdl if (!ndp) {
1368 1.135 yamt if (newndp == NULL) {
1369 1.135 yamt NFSDC_UNLOCK(np);
1370 1.196 yamt newndp = kmem_alloc(sizeof(*newndp), KM_SLEEP);
1371 1.135 yamt newndp->dc_refcnt = 1;
1372 1.135 yamt LIST_NEXT(newndp, dc_hash) = (void *)-1;
1373 1.135 yamt goto retry;
1374 1.135 yamt }
1375 1.135 yamt ndp = newndp;
1376 1.135 yamt newndp = NULL;
1377 1.49 fvdl overwrite = 0;
1378 1.49 fvdl if (nmp->nm_flag & NFSMNT_XLATECOOKIE) {
1379 1.49 fvdl /*
1380 1.49 fvdl * We're allocating a new entry, so bump the
1381 1.49 fvdl * generation number.
1382 1.49 fvdl */
1383 1.160 christos KASSERT(np->n_dirgens);
1384 1.49 fvdl gen = ++np->n_dirgens[hashent];
1385 1.49 fvdl if (gen == 0) {
1386 1.49 fvdl np->n_dirgens[hashent]++;
1387 1.49 fvdl gen++;
1388 1.49 fvdl }
1389 1.49 fvdl ndp->dc_cookie32 = (hashent << 24) | (gen & 0xffffff);
1390 1.49 fvdl }
1391 1.49 fvdl } else
1392 1.49 fvdl overwrite = 1;
1393 1.46 fvdl
1394 1.49 fvdl ndp->dc_cookie = off;
1395 1.49 fvdl ndp->dc_blkcookie = blkoff;
1396 1.46 fvdl ndp->dc_entry = en;
1397 1.137 yamt ndp->dc_flags = 0;
1398 1.46 fvdl
1399 1.49 fvdl if (overwrite)
1400 1.135 yamt goto done;
1401 1.49 fvdl
1402 1.46 fvdl /*
1403 1.46 fvdl * If the maximum directory cookie cache size has been reached
1404 1.46 fvdl * for this node, take one off the front. The idea is that
1405 1.46 fvdl * directories are typically read front-to-back once, so that
1406 1.46 fvdl * the oldest entries can be thrown away without much performance
1407 1.46 fvdl * loss.
1408 1.46 fvdl */
1409 1.46 fvdl if (np->n_dircachesize == NFS_MAXDIRCACHE) {
1410 1.135 yamt nfs_unlinkdircache(np, TAILQ_FIRST(&np->n_dirchain));
1411 1.46 fvdl } else
1412 1.46 fvdl np->n_dircachesize++;
1413 1.148 perry
1414 1.135 yamt KASSERT(ndp->dc_refcnt == 1);
1415 1.46 fvdl LIST_INSERT_HEAD(ndhp, ndp, dc_hash);
1416 1.46 fvdl TAILQ_INSERT_TAIL(&np->n_dirchain, ndp, dc_chain);
1417 1.135 yamt ndp->dc_refcnt++;
1418 1.135 yamt done:
1419 1.135 yamt KASSERT(ndp->dc_refcnt > 0);
1420 1.135 yamt NFSDC_UNLOCK(np);
1421 1.135 yamt if (newndp)
1422 1.135 yamt nfs_putdircache(np, newndp);
1423 1.46 fvdl return ndp;
1424 1.46 fvdl }
1425 1.46 fvdl
1426 1.46 fvdl void
1427 1.214 dsl nfs_invaldircache(struct vnode *vp, int flags)
1428 1.46 fvdl {
1429 1.46 fvdl struct nfsnode *np = VTONFS(vp);
1430 1.46 fvdl struct nfsdircache *ndp = NULL;
1431 1.49 fvdl struct nfsmount *nmp = VFSTONFS(vp->v_mount);
1432 1.181 thorpej const bool forcefree = flags & NFS_INVALDIRCACHE_FORCE;
1433 1.46 fvdl
1434 1.46 fvdl #ifdef DIAGNOSTIC
1435 1.46 fvdl if (vp->v_type != VDIR)
1436 1.46 fvdl panic("nfs: invaldircache: not dir");
1437 1.46 fvdl #endif
1438 1.46 fvdl
1439 1.145 yamt if ((flags & NFS_INVALDIRCACHE_KEEPEOF) == 0)
1440 1.145 yamt np->n_flag &= ~NEOFVALID;
1441 1.144 yamt
1442 1.46 fvdl if (!np->n_dircache)
1443 1.46 fvdl return;
1444 1.46 fvdl
1445 1.135 yamt NFSDC_LOCK(np);
1446 1.49 fvdl if (!(nmp->nm_flag & NFSMNT_XLATECOOKIE) || forcefree) {
1447 1.135 yamt while ((ndp = TAILQ_FIRST(&np->n_dirchain)) != NULL) {
1448 1.135 yamt KASSERT(!forcefree || ndp->dc_refcnt == 1);
1449 1.135 yamt nfs_unlinkdircache(np, ndp);
1450 1.49 fvdl }
1451 1.49 fvdl np->n_dircachesize = 0;
1452 1.49 fvdl if (forcefree && np->n_dirgens) {
1453 1.196 yamt kmem_free(np->n_dirgens,
1454 1.196 yamt NFS_DIRHASHSIZ * sizeof(unsigned));
1455 1.120 yamt np->n_dirgens = NULL;
1456 1.49 fvdl }
1457 1.49 fvdl } else {
1458 1.135 yamt TAILQ_FOREACH(ndp, &np->n_dirchain, dc_chain)
1459 1.135 yamt ndp->dc_flags |= NFSDC_INVALID;
1460 1.46 fvdl }
1461 1.46 fvdl
1462 1.135 yamt NFSDC_UNLOCK(np);
1463 1.46 fvdl }
1464 1.46 fvdl
1465 1.1 cgd /*
1466 1.35 thorpej * Called once before VFS init to initialize shared and
1467 1.35 thorpej * server-specific data structures.
1468 1.1 cgd */
1469 1.157 yamt static int
1470 1.155 thorpej nfs_init0(void)
1471 1.1 cgd {
1472 1.189 ad
1473 1.12 mycroft nfsrtt.pos = 0;
1474 1.1 cgd rpc_vers = txdr_unsigned(RPC_VER2);
1475 1.1 cgd rpc_call = txdr_unsigned(RPC_CALL);
1476 1.1 cgd rpc_reply = txdr_unsigned(RPC_REPLY);
1477 1.1 cgd rpc_msgdenied = txdr_unsigned(RPC_MSGDENIED);
1478 1.1 cgd rpc_msgaccepted = txdr_unsigned(RPC_MSGACCEPTED);
1479 1.1 cgd rpc_mismatch = txdr_unsigned(RPC_MISMATCH);
1480 1.12 mycroft rpc_autherr = txdr_unsigned(RPC_AUTHERR);
1481 1.1 cgd rpc_auth_unix = txdr_unsigned(RPCAUTH_UNIX);
1482 1.25 fvdl rpc_auth_kerb = txdr_unsigned(RPCAUTH_KERB4);
1483 1.1 cgd nfs_prog = txdr_unsigned(NFS_PROG);
1484 1.182 thorpej nfs_true = txdr_unsigned(true);
1485 1.182 thorpej nfs_false = txdr_unsigned(false);
1486 1.12 mycroft nfs_xdrneg1 = txdr_unsigned(-1);
1487 1.25 fvdl nfs_ticks = (hz * NFS_TICKINTVL + 500) / 1000;
1488 1.25 fvdl if (nfs_ticks < 1)
1489 1.25 fvdl nfs_ticks = 1;
1490 1.164 yamt nfsdreq_init();
1491 1.164 yamt
1492 1.1 cgd /*
1493 1.1 cgd * Initialize reply list and start timer
1494 1.1 cgd */
1495 1.16 mycroft TAILQ_INIT(&nfs_reqq);
1496 1.230 christos mutex_init(&nfs_reqq_lock, MUTEX_DEFAULT, IPL_NONE);
1497 1.191 yamt nfs_timer_init();
1498 1.109 matt MOWNER_ATTACH(&nfs_mowner);
1499 1.106 jdolecek
1500 1.157 yamt return 0;
1501 1.1 cgd }
1502 1.1 cgd
1503 1.223 christos static volatile uint32_t nfs_mutex;
1504 1.223 christos static uint32_t nfs_refcount;
1505 1.223 christos
1506 1.223 christos #define nfs_p() while (atomic_cas_32(&nfs_mutex, 0, 1) == 0) continue;
1507 1.223 christos #define nfs_v() while (atomic_cas_32(&nfs_mutex, 1, 0) == 1) continue;
1508 1.223 christos
1509 1.210 ad /*
1510 1.210 ad * This is disgusting, but it must support both modular and monolothic
1511 1.223 christos * configurations, plus the code is shared between server and client.
1512 1.223 christos * For monolithic builds NFSSERVER may not imply NFS. Unfortunately we
1513 1.223 christos * can't use regular mutexes here that would require static initialization
1514 1.223 christos * and we can get initialized from multiple places, so we improvise.
1515 1.210 ad *
1516 1.210 ad * Yuck.
1517 1.210 ad */
1518 1.155 thorpej void
1519 1.155 thorpej nfs_init(void)
1520 1.155 thorpej {
1521 1.224 pgoyette
1522 1.223 christos nfs_p();
1523 1.223 christos if (nfs_refcount++ == 0)
1524 1.223 christos nfs_init0();
1525 1.223 christos nfs_v();
1526 1.155 thorpej }
1527 1.155 thorpej
1528 1.210 ad void
1529 1.210 ad nfs_fini(void)
1530 1.210 ad {
1531 1.224 pgoyette
1532 1.223 christos nfs_p();
1533 1.223 christos if (--nfs_refcount == 0) {
1534 1.223 christos MOWNER_DETACH(&nfs_mowner);
1535 1.223 christos nfs_timer_fini();
1536 1.230 christos mutex_destroy(&nfs_reqq_lock);
1537 1.223 christos nfsdreq_fini();
1538 1.223 christos }
1539 1.223 christos nfs_v();
1540 1.210 ad }
1541 1.210 ad
1542 1.1 cgd /*
1543 1.118 yamt * A fiddled version of m_adj() that ensures null fill to a 32-bit
1544 1.1 cgd * boundary and only trims off the back end
1545 1.122 yamt *
1546 1.122 yamt * 1. trim off 'len' bytes as m_adj(mp, -len).
1547 1.122 yamt * 2. add zero-padding 'nul' bytes at the end of the mbuf chain.
1548 1.1 cgd */
1549 1.12 mycroft void
1550 1.214 dsl nfs_zeropad(struct mbuf *mp, int len, int nul)
1551 1.1 cgd {
1552 1.75 augustss struct mbuf *m;
1553 1.130 yamt int count;
1554 1.1 cgd
1555 1.1 cgd /*
1556 1.1 cgd * Trim from tail. Scan the mbuf chain,
1557 1.1 cgd * calculating its length and finding the last mbuf.
1558 1.1 cgd * If the adjustment only affects this mbuf, then just
1559 1.1 cgd * adjust and return. Otherwise, rescan and truncate
1560 1.1 cgd * after the remaining size.
1561 1.1 cgd */
1562 1.1 cgd count = 0;
1563 1.1 cgd m = mp;
1564 1.1 cgd for (;;) {
1565 1.1 cgd count += m->m_len;
1566 1.122 yamt if (m->m_next == NULL)
1567 1.1 cgd break;
1568 1.1 cgd m = m->m_next;
1569 1.1 cgd }
1570 1.122 yamt
1571 1.122 yamt KDASSERT(count >= len);
1572 1.122 yamt
1573 1.122 yamt if (m->m_len >= len) {
1574 1.1 cgd m->m_len -= len;
1575 1.122 yamt } else {
1576 1.122 yamt count -= len;
1577 1.122 yamt /*
1578 1.122 yamt * Correct length for chain is "count".
1579 1.122 yamt * Find the mbuf with last data, adjust its length,
1580 1.122 yamt * and toss data from remaining mbufs on chain.
1581 1.122 yamt */
1582 1.122 yamt for (m = mp; m; m = m->m_next) {
1583 1.122 yamt if (m->m_len >= count) {
1584 1.122 yamt m->m_len = count;
1585 1.122 yamt break;
1586 1.118 yamt }
1587 1.122 yamt count -= m->m_len;
1588 1.1 cgd }
1589 1.159 christos KASSERT(m && m->m_next);
1590 1.122 yamt m_freem(m->m_next);
1591 1.122 yamt m->m_next = NULL;
1592 1.1 cgd }
1593 1.122 yamt
1594 1.130 yamt KDASSERT(m->m_next == NULL);
1595 1.130 yamt
1596 1.122 yamt /*
1597 1.122 yamt * zero-padding.
1598 1.122 yamt */
1599 1.122 yamt if (nul > 0) {
1600 1.130 yamt char *cp;
1601 1.130 yamt int i;
1602 1.130 yamt
1603 1.231 maxv if (M_READONLY(m) || M_TRAILINGSPACE(m) < nul) {
1604 1.122 yamt struct mbuf *n;
1605 1.122 yamt
1606 1.122 yamt KDASSERT(MLEN >= nul);
1607 1.122 yamt n = m_get(M_WAIT, MT_DATA);
1608 1.122 yamt MCLAIM(n, &nfs_mowner);
1609 1.122 yamt n->m_len = nul;
1610 1.130 yamt n->m_next = NULL;
1611 1.122 yamt m->m_next = n;
1612 1.183 christos cp = mtod(n, void *);
1613 1.122 yamt } else {
1614 1.183 christos cp = mtod(m, char *) + m->m_len;
1615 1.122 yamt m->m_len += nul;
1616 1.1 cgd }
1617 1.122 yamt for (i = 0; i < nul; i++)
1618 1.122 yamt *cp++ = '\0';
1619 1.1 cgd }
1620 1.122 yamt return;
1621 1.1 cgd }
1622 1.1 cgd
1623 1.1 cgd /*
1624 1.25 fvdl * Make these functions instead of macros, so that the kernel text size
1625 1.25 fvdl * doesn't get too big...
1626 1.25 fvdl */
1627 1.25 fvdl void
1628 1.214 dsl nfsm_srvwcc(struct nfsrv_descript *nfsd, int before_ret, struct vattr *before_vap, int after_ret, struct vattr *after_vap, struct mbuf **mbp, char **bposp)
1629 1.25 fvdl {
1630 1.109 matt struct mbuf *mb = *mbp;
1631 1.75 augustss char *bpos = *bposp;
1632 1.75 augustss u_int32_t *tl;
1633 1.25 fvdl
1634 1.25 fvdl if (before_ret) {
1635 1.25 fvdl nfsm_build(tl, u_int32_t *, NFSX_UNSIGNED);
1636 1.25 fvdl *tl = nfs_false;
1637 1.25 fvdl } else {
1638 1.25 fvdl nfsm_build(tl, u_int32_t *, 7 * NFSX_UNSIGNED);
1639 1.25 fvdl *tl++ = nfs_true;
1640 1.66 fair txdr_hyper(before_vap->va_size, tl);
1641 1.25 fvdl tl += 2;
1642 1.25 fvdl txdr_nfsv3time(&(before_vap->va_mtime), tl);
1643 1.25 fvdl tl += 2;
1644 1.25 fvdl txdr_nfsv3time(&(before_vap->va_ctime), tl);
1645 1.25 fvdl }
1646 1.25 fvdl *bposp = bpos;
1647 1.25 fvdl *mbp = mb;
1648 1.25 fvdl nfsm_srvpostopattr(nfsd, after_ret, after_vap, mbp, bposp);
1649 1.25 fvdl }
1650 1.25 fvdl
1651 1.25 fvdl void
1652 1.214 dsl nfsm_srvpostopattr(struct nfsrv_descript *nfsd, int after_ret, struct vattr *after_vap, struct mbuf **mbp, char **bposp)
1653 1.25 fvdl {
1654 1.109 matt struct mbuf *mb = *mbp;
1655 1.75 augustss char *bpos = *bposp;
1656 1.75 augustss u_int32_t *tl;
1657 1.75 augustss struct nfs_fattr *fp;
1658 1.25 fvdl
1659 1.25 fvdl if (after_ret) {
1660 1.25 fvdl nfsm_build(tl, u_int32_t *, NFSX_UNSIGNED);
1661 1.25 fvdl *tl = nfs_false;
1662 1.25 fvdl } else {
1663 1.25 fvdl nfsm_build(tl, u_int32_t *, NFSX_UNSIGNED + NFSX_V3FATTR);
1664 1.25 fvdl *tl++ = nfs_true;
1665 1.25 fvdl fp = (struct nfs_fattr *)tl;
1666 1.25 fvdl nfsm_srvfattr(nfsd, after_vap, fp);
1667 1.25 fvdl }
1668 1.25 fvdl *mbp = mb;
1669 1.25 fvdl *bposp = bpos;
1670 1.25 fvdl }
1671 1.25 fvdl
1672 1.25 fvdl void
1673 1.214 dsl nfsm_srvfattr(struct nfsrv_descript *nfsd, struct vattr *vap, struct nfs_fattr *fp)
1674 1.25 fvdl {
1675 1.25 fvdl
1676 1.25 fvdl fp->fa_nlink = txdr_unsigned(vap->va_nlink);
1677 1.25 fvdl fp->fa_uid = txdr_unsigned(vap->va_uid);
1678 1.25 fvdl fp->fa_gid = txdr_unsigned(vap->va_gid);
1679 1.25 fvdl if (nfsd->nd_flag & ND_NFSV3) {
1680 1.25 fvdl fp->fa_type = vtonfsv3_type(vap->va_type);
1681 1.25 fvdl fp->fa_mode = vtonfsv3_mode(vap->va_mode);
1682 1.66 fair txdr_hyper(vap->va_size, &fp->fa3_size);
1683 1.66 fair txdr_hyper(vap->va_bytes, &fp->fa3_used);
1684 1.25 fvdl fp->fa3_rdev.specdata1 = txdr_unsigned(major(vap->va_rdev));
1685 1.25 fvdl fp->fa3_rdev.specdata2 = txdr_unsigned(minor(vap->va_rdev));
1686 1.25 fvdl fp->fa3_fsid.nfsuquad[0] = 0;
1687 1.25 fvdl fp->fa3_fsid.nfsuquad[1] = txdr_unsigned(vap->va_fsid);
1688 1.151 yamt txdr_hyper(vap->va_fileid, &fp->fa3_fileid);
1689 1.25 fvdl txdr_nfsv3time(&vap->va_atime, &fp->fa3_atime);
1690 1.25 fvdl txdr_nfsv3time(&vap->va_mtime, &fp->fa3_mtime);
1691 1.25 fvdl txdr_nfsv3time(&vap->va_ctime, &fp->fa3_ctime);
1692 1.25 fvdl } else {
1693 1.25 fvdl fp->fa_type = vtonfsv2_type(vap->va_type);
1694 1.25 fvdl fp->fa_mode = vtonfsv2_mode(vap->va_type, vap->va_mode);
1695 1.25 fvdl fp->fa2_size = txdr_unsigned(vap->va_size);
1696 1.25 fvdl fp->fa2_blocksize = txdr_unsigned(vap->va_blocksize);
1697 1.25 fvdl if (vap->va_type == VFIFO)
1698 1.25 fvdl fp->fa2_rdev = 0xffffffff;
1699 1.25 fvdl else
1700 1.25 fvdl fp->fa2_rdev = txdr_unsigned(vap->va_rdev);
1701 1.25 fvdl fp->fa2_blocks = txdr_unsigned(vap->va_bytes / NFS_FABLKSIZE);
1702 1.25 fvdl fp->fa2_fsid = txdr_unsigned(vap->va_fsid);
1703 1.25 fvdl fp->fa2_fileid = txdr_unsigned(vap->va_fileid);
1704 1.25 fvdl txdr_nfsv2time(&vap->va_atime, &fp->fa2_atime);
1705 1.25 fvdl txdr_nfsv2time(&vap->va_mtime, &fp->fa2_mtime);
1706 1.25 fvdl txdr_nfsv2time(&vap->va_ctime, &fp->fa2_ctime);
1707 1.25 fvdl }
1708 1.25 fvdl }
1709 1.25 fvdl
1710 1.1 cgd /*
1711 1.182 thorpej * This function compares two net addresses by family and returns true
1712 1.12 mycroft * if they are the same host.
1713 1.182 thorpej * If there is any doubt, return false.
1714 1.12 mycroft * The AF_INET family is handled as a special case so that address mbufs
1715 1.12 mycroft * don't need to be saved to store "struct in_addr", which is only 4 bytes.
1716 1.1 cgd */
1717 1.24 christos int
1718 1.214 dsl netaddr_match(int family, union nethostaddr *haddr, struct mbuf *nam)
1719 1.1 cgd {
1720 1.75 augustss struct sockaddr_in *inetaddr;
1721 1.1 cgd
1722 1.12 mycroft switch (family) {
1723 1.12 mycroft case AF_INET:
1724 1.12 mycroft inetaddr = mtod(nam, struct sockaddr_in *);
1725 1.12 mycroft if (inetaddr->sin_family == AF_INET &&
1726 1.12 mycroft inetaddr->sin_addr.s_addr == haddr->had_inetaddr)
1727 1.12 mycroft return (1);
1728 1.12 mycroft break;
1729 1.76 fvdl case AF_INET6:
1730 1.76 fvdl {
1731 1.76 fvdl struct sockaddr_in6 *sin6_1, *sin6_2;
1732 1.76 fvdl
1733 1.76 fvdl sin6_1 = mtod(nam, struct sockaddr_in6 *);
1734 1.76 fvdl sin6_2 = mtod(haddr->had_nam, struct sockaddr_in6 *);
1735 1.76 fvdl if (sin6_1->sin6_family == AF_INET6 &&
1736 1.76 fvdl IN6_ARE_ADDR_EQUAL(&sin6_1->sin6_addr, &sin6_2->sin6_addr))
1737 1.76 fvdl return 1;
1738 1.76 fvdl }
1739 1.12 mycroft default:
1740 1.12 mycroft break;
1741 1.12 mycroft };
1742 1.12 mycroft return (0);
1743 1.25 fvdl }
1744 1.25 fvdl
1745 1.226 christos struct nfs_clearcommit_ctx {
1746 1.226 christos struct mount *mp;
1747 1.226 christos };
1748 1.226 christos
1749 1.226 christos static bool
1750 1.226 christos nfs_clearcommit_selector(void *cl, struct vnode *vp)
1751 1.226 christos {
1752 1.226 christos struct nfs_clearcommit_ctx *c = cl;
1753 1.226 christos struct nfsnode *np;
1754 1.226 christos struct vm_page *pg;
1755 1.236 ad struct uvm_page_array a;
1756 1.236 ad voff_t off;
1757 1.226 christos
1758 1.229 riastrad KASSERT(mutex_owned(vp->v_interlock));
1759 1.229 riastrad
1760 1.226 christos np = VTONFS(vp);
1761 1.226 christos if (vp->v_type != VREG || vp->v_mount != c->mp || np == NULL)
1762 1.226 christos return false;
1763 1.226 christos np->n_pushlo = np->n_pushhi = np->n_pushedlo =
1764 1.226 christos np->n_pushedhi = 0;
1765 1.226 christos np->n_commitflags &=
1766 1.226 christos ~(NFS_COMMIT_PUSH_VALID | NFS_COMMIT_PUSHED_VALID);
1767 1.236 ad uvm_page_array_init(&a);
1768 1.236 ad off = 0;
1769 1.236 ad while ((pg = uvm_page_array_fill_and_peek(&a, &vp->v_uobj, off,
1770 1.236 ad 0, 0)) != NULL) {
1771 1.226 christos pg->flags &= ~PG_NEEDCOMMIT;
1772 1.236 ad uvm_page_array_advance(&a);
1773 1.236 ad off = pg->offset + PAGE_SIZE;
1774 1.226 christos }
1775 1.236 ad uvm_page_array_fini(&a);
1776 1.226 christos return false;
1777 1.226 christos }
1778 1.226 christos
1779 1.25 fvdl /*
1780 1.25 fvdl * The write verifier has changed (probably due to a server reboot), so all
1781 1.114 yamt * PG_NEEDCOMMIT pages will have to be written again. Since they are marked
1782 1.117 yamt * as dirty or are being written out just now, all this takes is clearing
1783 1.117 yamt * the PG_NEEDCOMMIT flag. Once done the new write verifier can be set for
1784 1.117 yamt * the mount point.
1785 1.25 fvdl */
1786 1.25 fvdl void
1787 1.214 dsl nfs_clearcommit(struct mount *mp)
1788 1.25 fvdl {
1789 1.226 christos struct vnode *vp __diagused;
1790 1.225 hannken struct vnode_iterator *marker;
1791 1.116 yamt struct nfsmount *nmp = VFSTONFS(mp);
1792 1.226 christos struct nfs_clearcommit_ctx ctx;
1793 1.116 yamt
1794 1.180 yamt rw_enter(&nmp->nm_writeverflock, RW_WRITER);
1795 1.225 hannken vfs_vnode_iterator_init(mp, &marker);
1796 1.226 christos ctx.mp = mp;
1797 1.226 christos vp = vfs_vnode_iterator_next(marker, nfs_clearcommit_selector, &ctx);
1798 1.226 christos KASSERT(vp == NULL);
1799 1.225 hannken vfs_vnode_iterator_destroy(marker);
1800 1.186 yamt mutex_enter(&nmp->nm_lock);
1801 1.116 yamt nmp->nm_iflag &= ~NFSMNT_STALEWRITEVERF;
1802 1.186 yamt mutex_exit(&nmp->nm_lock);
1803 1.180 yamt rw_exit(&nmp->nm_writeverflock);
1804 1.83 fvdl }
1805 1.83 fvdl
1806 1.83 fvdl void
1807 1.214 dsl nfs_merge_commit_ranges(struct vnode *vp)
1808 1.83 fvdl {
1809 1.83 fvdl struct nfsnode *np = VTONFS(vp);
1810 1.112 yamt
1811 1.112 yamt KASSERT(np->n_commitflags & NFS_COMMIT_PUSH_VALID);
1812 1.83 fvdl
1813 1.83 fvdl if (!(np->n_commitflags & NFS_COMMIT_PUSHED_VALID)) {
1814 1.83 fvdl np->n_pushedlo = np->n_pushlo;
1815 1.83 fvdl np->n_pushedhi = np->n_pushhi;
1816 1.83 fvdl np->n_commitflags |= NFS_COMMIT_PUSHED_VALID;
1817 1.83 fvdl } else {
1818 1.83 fvdl if (np->n_pushlo < np->n_pushedlo)
1819 1.83 fvdl np->n_pushedlo = np->n_pushlo;
1820 1.83 fvdl if (np->n_pushhi > np->n_pushedhi)
1821 1.83 fvdl np->n_pushedhi = np->n_pushhi;
1822 1.83 fvdl }
1823 1.83 fvdl
1824 1.83 fvdl np->n_pushlo = np->n_pushhi = 0;
1825 1.83 fvdl np->n_commitflags &= ~NFS_COMMIT_PUSH_VALID;
1826 1.83 fvdl
1827 1.111 yamt #ifdef NFS_DEBUG_COMMIT
1828 1.83 fvdl printf("merge: committed: %u - %u\n", (unsigned)np->n_pushedlo,
1829 1.83 fvdl (unsigned)np->n_pushedhi);
1830 1.83 fvdl #endif
1831 1.83 fvdl }
1832 1.83 fvdl
1833 1.83 fvdl int
1834 1.215 dsl nfs_in_committed_range(struct vnode *vp, off_t off, off_t len)
1835 1.83 fvdl {
1836 1.83 fvdl struct nfsnode *np = VTONFS(vp);
1837 1.83 fvdl off_t lo, hi;
1838 1.83 fvdl
1839 1.83 fvdl if (!(np->n_commitflags & NFS_COMMIT_PUSHED_VALID))
1840 1.83 fvdl return 0;
1841 1.89 chs lo = off;
1842 1.89 chs hi = lo + len;
1843 1.83 fvdl
1844 1.83 fvdl return (lo >= np->n_pushedlo && hi <= np->n_pushedhi);
1845 1.83 fvdl }
1846 1.83 fvdl
1847 1.83 fvdl int
1848 1.215 dsl nfs_in_tobecommitted_range(struct vnode *vp, off_t off, off_t len)
1849 1.83 fvdl {
1850 1.83 fvdl struct nfsnode *np = VTONFS(vp);
1851 1.83 fvdl off_t lo, hi;
1852 1.83 fvdl
1853 1.83 fvdl if (!(np->n_commitflags & NFS_COMMIT_PUSH_VALID))
1854 1.83 fvdl return 0;
1855 1.89 chs lo = off;
1856 1.89 chs hi = lo + len;
1857 1.83 fvdl
1858 1.83 fvdl return (lo >= np->n_pushlo && hi <= np->n_pushhi);
1859 1.83 fvdl }
1860 1.83 fvdl
1861 1.83 fvdl void
1862 1.215 dsl nfs_add_committed_range(struct vnode *vp, off_t off, off_t len)
1863 1.83 fvdl {
1864 1.83 fvdl struct nfsnode *np = VTONFS(vp);
1865 1.83 fvdl off_t lo, hi;
1866 1.83 fvdl
1867 1.89 chs lo = off;
1868 1.89 chs hi = lo + len;
1869 1.83 fvdl
1870 1.83 fvdl if (!(np->n_commitflags & NFS_COMMIT_PUSHED_VALID)) {
1871 1.83 fvdl np->n_pushedlo = lo;
1872 1.83 fvdl np->n_pushedhi = hi;
1873 1.83 fvdl np->n_commitflags |= NFS_COMMIT_PUSHED_VALID;
1874 1.83 fvdl } else {
1875 1.83 fvdl if (hi > np->n_pushedhi)
1876 1.83 fvdl np->n_pushedhi = hi;
1877 1.83 fvdl if (lo < np->n_pushedlo)
1878 1.83 fvdl np->n_pushedlo = lo;
1879 1.83 fvdl }
1880 1.111 yamt #ifdef NFS_DEBUG_COMMIT
1881 1.83 fvdl printf("add: committed: %u - %u\n", (unsigned)np->n_pushedlo,
1882 1.83 fvdl (unsigned)np->n_pushedhi);
1883 1.83 fvdl #endif
1884 1.83 fvdl }
1885 1.83 fvdl
1886 1.83 fvdl void
1887 1.215 dsl nfs_del_committed_range(struct vnode *vp, off_t off, off_t len)
1888 1.83 fvdl {
1889 1.83 fvdl struct nfsnode *np = VTONFS(vp);
1890 1.83 fvdl off_t lo, hi;
1891 1.83 fvdl
1892 1.83 fvdl if (!(np->n_commitflags & NFS_COMMIT_PUSHED_VALID))
1893 1.83 fvdl return;
1894 1.83 fvdl
1895 1.89 chs lo = off;
1896 1.89 chs hi = lo + len;
1897 1.83 fvdl
1898 1.83 fvdl if (lo > np->n_pushedhi || hi < np->n_pushedlo)
1899 1.83 fvdl return;
1900 1.83 fvdl if (lo <= np->n_pushedlo)
1901 1.83 fvdl np->n_pushedlo = hi;
1902 1.83 fvdl else if (hi >= np->n_pushedhi)
1903 1.83 fvdl np->n_pushedhi = lo;
1904 1.83 fvdl else {
1905 1.83 fvdl /*
1906 1.83 fvdl * XXX There's only one range. If the deleted range
1907 1.83 fvdl * is in the middle, pick the largest of the
1908 1.83 fvdl * contiguous ranges that it leaves.
1909 1.83 fvdl */
1910 1.83 fvdl if ((np->n_pushedlo - lo) > (hi - np->n_pushedhi))
1911 1.83 fvdl np->n_pushedhi = lo;
1912 1.83 fvdl else
1913 1.83 fvdl np->n_pushedlo = hi;
1914 1.83 fvdl }
1915 1.111 yamt #ifdef NFS_DEBUG_COMMIT
1916 1.83 fvdl printf("del: committed: %u - %u\n", (unsigned)np->n_pushedlo,
1917 1.83 fvdl (unsigned)np->n_pushedhi);
1918 1.83 fvdl #endif
1919 1.83 fvdl }
1920 1.83 fvdl
1921 1.83 fvdl void
1922 1.215 dsl nfs_add_tobecommitted_range(struct vnode *vp, off_t off, off_t len)
1923 1.83 fvdl {
1924 1.83 fvdl struct nfsnode *np = VTONFS(vp);
1925 1.83 fvdl off_t lo, hi;
1926 1.83 fvdl
1927 1.89 chs lo = off;
1928 1.89 chs hi = lo + len;
1929 1.83 fvdl
1930 1.83 fvdl if (!(np->n_commitflags & NFS_COMMIT_PUSH_VALID)) {
1931 1.83 fvdl np->n_pushlo = lo;
1932 1.83 fvdl np->n_pushhi = hi;
1933 1.83 fvdl np->n_commitflags |= NFS_COMMIT_PUSH_VALID;
1934 1.83 fvdl } else {
1935 1.83 fvdl if (lo < np->n_pushlo)
1936 1.83 fvdl np->n_pushlo = lo;
1937 1.83 fvdl if (hi > np->n_pushhi)
1938 1.83 fvdl np->n_pushhi = hi;
1939 1.83 fvdl }
1940 1.111 yamt #ifdef NFS_DEBUG_COMMIT
1941 1.83 fvdl printf("add: tobecommitted: %u - %u\n", (unsigned)np->n_pushlo,
1942 1.83 fvdl (unsigned)np->n_pushhi);
1943 1.83 fvdl #endif
1944 1.83 fvdl }
1945 1.83 fvdl
1946 1.83 fvdl void
1947 1.215 dsl nfs_del_tobecommitted_range(struct vnode *vp, off_t off, off_t len)
1948 1.83 fvdl {
1949 1.83 fvdl struct nfsnode *np = VTONFS(vp);
1950 1.83 fvdl off_t lo, hi;
1951 1.83 fvdl
1952 1.83 fvdl if (!(np->n_commitflags & NFS_COMMIT_PUSH_VALID))
1953 1.83 fvdl return;
1954 1.83 fvdl
1955 1.89 chs lo = off;
1956 1.89 chs hi = lo + len;
1957 1.83 fvdl
1958 1.83 fvdl if (lo > np->n_pushhi || hi < np->n_pushlo)
1959 1.83 fvdl return;
1960 1.83 fvdl
1961 1.83 fvdl if (lo <= np->n_pushlo)
1962 1.83 fvdl np->n_pushlo = hi;
1963 1.83 fvdl else if (hi >= np->n_pushhi)
1964 1.83 fvdl np->n_pushhi = lo;
1965 1.83 fvdl else {
1966 1.83 fvdl /*
1967 1.83 fvdl * XXX There's only one range. If the deleted range
1968 1.83 fvdl * is in the middle, pick the largest of the
1969 1.83 fvdl * contiguous ranges that it leaves.
1970 1.83 fvdl */
1971 1.83 fvdl if ((np->n_pushlo - lo) > (hi - np->n_pushhi))
1972 1.83 fvdl np->n_pushhi = lo;
1973 1.83 fvdl else
1974 1.83 fvdl np->n_pushlo = hi;
1975 1.83 fvdl }
1976 1.111 yamt #ifdef NFS_DEBUG_COMMIT
1977 1.83 fvdl printf("del: tobecommitted: %u - %u\n", (unsigned)np->n_pushlo,
1978 1.83 fvdl (unsigned)np->n_pushhi);
1979 1.83 fvdl #endif
1980 1.25 fvdl }
1981 1.25 fvdl
1982 1.25 fvdl /*
1983 1.25 fvdl * Map errnos to NFS error numbers. For Version 3 also filter out error
1984 1.25 fvdl * numbers not specified for the associated procedure.
1985 1.25 fvdl */
1986 1.25 fvdl int
1987 1.214 dsl nfsrv_errmap(struct nfsrv_descript *nd, int err)
1988 1.25 fvdl {
1989 1.90 jdolecek const short *defaulterrp, *errp;
1990 1.25 fvdl
1991 1.25 fvdl if (nd->nd_flag & ND_NFSV3) {
1992 1.25 fvdl if (nd->nd_procnum <= NFSPROC_COMMIT) {
1993 1.25 fvdl errp = defaulterrp = nfsrv_v3errmap[nd->nd_procnum];
1994 1.25 fvdl while (*++errp) {
1995 1.25 fvdl if (*errp == err)
1996 1.25 fvdl return (err);
1997 1.25 fvdl else if (*errp > err)
1998 1.25 fvdl break;
1999 1.25 fvdl }
2000 1.25 fvdl return ((int)*defaulterrp);
2001 1.25 fvdl } else
2002 1.25 fvdl return (err & 0xffff);
2003 1.25 fvdl }
2004 1.25 fvdl if (err <= ELAST)
2005 1.25 fvdl return ((int)nfsrv_v2errmap[err - 1]);
2006 1.25 fvdl return (NFSERR_IO);
2007 1.25 fvdl }
2008 1.25 fvdl
2009 1.126 yamt u_int32_t
2010 1.216 cegger nfs_getxid(void)
2011 1.126 yamt {
2012 1.126 yamt u_int32_t newxid;
2013 1.126 yamt
2014 1.227 tls if (__predict_false(nfs_xid == 0)) {
2015 1.227 tls nfs_xid = cprng_fast32();
2016 1.227 tls }
2017 1.227 tls
2018 1.207 pooka /* get next xid. skip 0 */
2019 1.207 pooka do {
2020 1.207 pooka newxid = atomic_inc_32_nv(&nfs_xid);
2021 1.207 pooka } while (__predict_false(newxid == 0));
2022 1.126 yamt
2023 1.126 yamt return txdr_unsigned(newxid);
2024 1.126 yamt }
2025 1.126 yamt
2026 1.126 yamt /*
2027 1.126 yamt * assign a new xid for existing request.
2028 1.126 yamt * used for NFSERR_JUKEBOX handling.
2029 1.126 yamt */
2030 1.126 yamt void
2031 1.126 yamt nfs_renewxid(struct nfsreq *req)
2032 1.126 yamt {
2033 1.126 yamt u_int32_t xid;
2034 1.126 yamt int off;
2035 1.126 yamt
2036 1.126 yamt xid = nfs_getxid();
2037 1.126 yamt if (req->r_nmp->nm_sotype == SOCK_STREAM)
2038 1.126 yamt off = sizeof(u_int32_t); /* RPC record mark */
2039 1.126 yamt else
2040 1.126 yamt off = 0;
2041 1.126 yamt
2042 1.126 yamt m_copyback(req->r_mreq, off, sizeof(xid), (void *)&xid);
2043 1.126 yamt req->r_xid = xid;
2044 1.1 cgd }
2045