nfs_subs.c revision 1.241 1 1.241 riastrad /* $NetBSD: nfs_subs.c,v 1.241 2020/09/05 16:30:12 riastradh Exp $ */
2 1.14 cgd
3 1.1 cgd /*
4 1.12 mycroft * Copyright (c) 1989, 1993
5 1.12 mycroft * The Regents of the University of California. All rights reserved.
6 1.1 cgd *
7 1.1 cgd * This code is derived from software contributed to Berkeley by
8 1.1 cgd * Rick Macklem at The University of Guelph.
9 1.1 cgd *
10 1.1 cgd * Redistribution and use in source and binary forms, with or without
11 1.1 cgd * modification, are permitted provided that the following conditions
12 1.1 cgd * are met:
13 1.1 cgd * 1. Redistributions of source code must retain the above copyright
14 1.1 cgd * notice, this list of conditions and the following disclaimer.
15 1.1 cgd * 2. Redistributions in binary form must reproduce the above copyright
16 1.1 cgd * notice, this list of conditions and the following disclaimer in the
17 1.1 cgd * documentation and/or other materials provided with the distribution.
18 1.127 agc * 3. Neither the name of the University nor the names of its contributors
19 1.1 cgd * may be used to endorse or promote products derived from this software
20 1.1 cgd * without specific prior written permission.
21 1.1 cgd *
22 1.1 cgd * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
23 1.1 cgd * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
24 1.1 cgd * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
25 1.1 cgd * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
26 1.1 cgd * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
27 1.1 cgd * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
28 1.1 cgd * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
29 1.1 cgd * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
30 1.1 cgd * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
31 1.1 cgd * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
32 1.1 cgd * SUCH DAMAGE.
33 1.1 cgd *
34 1.25 fvdl * @(#)nfs_subs.c 8.8 (Berkeley) 5/22/95
35 1.1 cgd */
36 1.1 cgd
37 1.83 fvdl /*
38 1.83 fvdl * Copyright 2000 Wasabi Systems, Inc.
39 1.83 fvdl * All rights reserved.
40 1.83 fvdl *
41 1.83 fvdl * Written by Frank van der Linden for Wasabi Systems, Inc.
42 1.83 fvdl *
43 1.83 fvdl * Redistribution and use in source and binary forms, with or without
44 1.83 fvdl * modification, are permitted provided that the following conditions
45 1.83 fvdl * are met:
46 1.83 fvdl * 1. Redistributions of source code must retain the above copyright
47 1.83 fvdl * notice, this list of conditions and the following disclaimer.
48 1.83 fvdl * 2. Redistributions in binary form must reproduce the above copyright
49 1.83 fvdl * notice, this list of conditions and the following disclaimer in the
50 1.83 fvdl * documentation and/or other materials provided with the distribution.
51 1.83 fvdl * 3. All advertising materials mentioning features or use of this software
52 1.83 fvdl * must display the following acknowledgement:
53 1.83 fvdl * This product includes software developed for the NetBSD Project by
54 1.83 fvdl * Wasabi Systems, Inc.
55 1.83 fvdl * 4. The name of Wasabi Systems, Inc. may not be used to endorse
56 1.83 fvdl * or promote products derived from this software without specific prior
57 1.83 fvdl * written permission.
58 1.83 fvdl *
59 1.83 fvdl * THIS SOFTWARE IS PROVIDED BY WASABI SYSTEMS, INC. ``AS IS'' AND
60 1.83 fvdl * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
61 1.83 fvdl * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
62 1.83 fvdl * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL WASABI SYSTEMS, INC
63 1.83 fvdl * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
64 1.83 fvdl * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
65 1.83 fvdl * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
66 1.83 fvdl * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
67 1.83 fvdl * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
68 1.83 fvdl * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
69 1.83 fvdl * POSSIBILITY OF SUCH DAMAGE.
70 1.83 fvdl */
71 1.99 lukem
72 1.99 lukem #include <sys/cdefs.h>
73 1.241 riastrad __KERNEL_RCSID(0, "$NetBSD: nfs_subs.c,v 1.241 2020/09/05 16:30:12 riastradh Exp $");
74 1.83 fvdl
75 1.210 ad #ifdef _KERNEL_OPT
76 1.82 bjh21 #include "opt_nfs.h"
77 1.210 ad #endif
78 1.25 fvdl
79 1.1 cgd /*
80 1.1 cgd * These functions support the macros and help fiddle mbuf chains for
81 1.1 cgd * the nfs op functions. They do things like create the rpc header and
82 1.1 cgd * copy data between mbuf chains and uio lists.
83 1.1 cgd */
84 1.9 mycroft #include <sys/param.h>
85 1.9 mycroft #include <sys/proc.h>
86 1.9 mycroft #include <sys/systm.h>
87 1.9 mycroft #include <sys/kernel.h>
88 1.196 yamt #include <sys/kmem.h>
89 1.9 mycroft #include <sys/mount.h>
90 1.9 mycroft #include <sys/vnode.h>
91 1.9 mycroft #include <sys/namei.h>
92 1.9 mycroft #include <sys/mbuf.h>
93 1.12 mycroft #include <sys/socket.h>
94 1.12 mycroft #include <sys/stat.h>
95 1.98 fvdl #include <sys/filedesc.h>
96 1.30 fvdl #include <sys/time.h>
97 1.43 fvdl #include <sys/dirent.h>
98 1.155 thorpej #include <sys/once.h>
99 1.162 elad #include <sys/kauth.h>
100 1.207 pooka #include <sys/atomic.h>
101 1.222 tls #include <sys/cprng.h>
102 1.1 cgd
103 1.241 riastrad #include <uvm/uvm_page.h>
104 1.236 ad #include <uvm/uvm_page_array.h>
105 1.51 mrg
106 1.9 mycroft #include <nfs/rpcv2.h>
107 1.25 fvdl #include <nfs/nfsproto.h>
108 1.9 mycroft #include <nfs/nfsnode.h>
109 1.9 mycroft #include <nfs/nfs.h>
110 1.9 mycroft #include <nfs/xdr_subs.h>
111 1.9 mycroft #include <nfs/nfsm_subs.h>
112 1.12 mycroft #include <nfs/nfsmount.h>
113 1.12 mycroft #include <nfs/nfsrtt.h>
114 1.24 christos #include <nfs/nfs_var.h>
115 1.12 mycroft
116 1.12 mycroft #include <miscfs/specfs/specdev.h>
117 1.24 christos
118 1.12 mycroft #include <netinet/in.h>
119 1.1 cgd
120 1.207 pooka static u_int32_t nfs_xid;
121 1.207 pooka
122 1.218 christos int nuidhash_max = NFS_MAXUIDHASH;
123 1.1 cgd /*
124 1.1 cgd * Data items converted to xdr at startup, since they are constant
125 1.1 cgd * This is kinda hokey, but may save a little time doing byte swaps
126 1.1 cgd */
127 1.22 cgd u_int32_t nfs_xdrneg1;
128 1.22 cgd u_int32_t rpc_call, rpc_vers, rpc_reply, rpc_msgdenied, rpc_autherr,
129 1.25 fvdl rpc_mismatch, rpc_auth_unix, rpc_msgaccepted,
130 1.12 mycroft rpc_auth_kerb;
131 1.179 yamt u_int32_t nfs_prog, nfs_true, nfs_false;
132 1.12 mycroft
133 1.1 cgd /* And other global data */
134 1.90 jdolecek const nfstype nfsv2_type[9] =
135 1.90 jdolecek { NFNON, NFREG, NFDIR, NFBLK, NFCHR, NFLNK, NFNON, NFCHR, NFNON };
136 1.90 jdolecek const nfstype nfsv3_type[9] =
137 1.90 jdolecek { NFNON, NFREG, NFDIR, NFBLK, NFCHR, NFLNK, NFSOCK, NFFIFO, NFNON };
138 1.90 jdolecek const enum vtype nv2tov_type[8] =
139 1.90 jdolecek { VNON, VREG, VDIR, VBLK, VCHR, VLNK, VNON, VNON };
140 1.90 jdolecek const enum vtype nv3tov_type[8] =
141 1.90 jdolecek { VNON, VREG, VDIR, VBLK, VCHR, VLNK, VSOCK, VFIFO };
142 1.25 fvdl int nfs_ticks;
143 1.108 christos
144 1.35 thorpej /* NFS client/server stats. */
145 1.35 thorpej struct nfsstats nfsstats;
146 1.35 thorpej
147 1.25 fvdl /*
148 1.25 fvdl * Mapping of old NFS Version 2 RPC numbers to generic numbers.
149 1.25 fvdl */
150 1.90 jdolecek const int nfsv3_procid[NFS_NPROCS] = {
151 1.25 fvdl NFSPROC_NULL,
152 1.25 fvdl NFSPROC_GETATTR,
153 1.25 fvdl NFSPROC_SETATTR,
154 1.25 fvdl NFSPROC_NOOP,
155 1.25 fvdl NFSPROC_LOOKUP,
156 1.25 fvdl NFSPROC_READLINK,
157 1.25 fvdl NFSPROC_READ,
158 1.25 fvdl NFSPROC_NOOP,
159 1.25 fvdl NFSPROC_WRITE,
160 1.25 fvdl NFSPROC_CREATE,
161 1.25 fvdl NFSPROC_REMOVE,
162 1.25 fvdl NFSPROC_RENAME,
163 1.25 fvdl NFSPROC_LINK,
164 1.25 fvdl NFSPROC_SYMLINK,
165 1.25 fvdl NFSPROC_MKDIR,
166 1.25 fvdl NFSPROC_RMDIR,
167 1.25 fvdl NFSPROC_READDIR,
168 1.25 fvdl NFSPROC_FSSTAT,
169 1.25 fvdl NFSPROC_NOOP,
170 1.25 fvdl NFSPROC_NOOP,
171 1.25 fvdl NFSPROC_NOOP,
172 1.25 fvdl NFSPROC_NOOP,
173 1.25 fvdl NFSPROC_NOOP
174 1.25 fvdl };
175 1.25 fvdl
176 1.25 fvdl /*
177 1.25 fvdl * and the reverse mapping from generic to Version 2 procedure numbers
178 1.25 fvdl */
179 1.90 jdolecek const int nfsv2_procid[NFS_NPROCS] = {
180 1.25 fvdl NFSV2PROC_NULL,
181 1.25 fvdl NFSV2PROC_GETATTR,
182 1.25 fvdl NFSV2PROC_SETATTR,
183 1.25 fvdl NFSV2PROC_LOOKUP,
184 1.25 fvdl NFSV2PROC_NOOP,
185 1.25 fvdl NFSV2PROC_READLINK,
186 1.25 fvdl NFSV2PROC_READ,
187 1.25 fvdl NFSV2PROC_WRITE,
188 1.25 fvdl NFSV2PROC_CREATE,
189 1.25 fvdl NFSV2PROC_MKDIR,
190 1.25 fvdl NFSV2PROC_SYMLINK,
191 1.25 fvdl NFSV2PROC_CREATE,
192 1.25 fvdl NFSV2PROC_REMOVE,
193 1.25 fvdl NFSV2PROC_RMDIR,
194 1.25 fvdl NFSV2PROC_RENAME,
195 1.25 fvdl NFSV2PROC_LINK,
196 1.25 fvdl NFSV2PROC_READDIR,
197 1.25 fvdl NFSV2PROC_NOOP,
198 1.25 fvdl NFSV2PROC_STATFS,
199 1.25 fvdl NFSV2PROC_NOOP,
200 1.25 fvdl NFSV2PROC_NOOP,
201 1.25 fvdl NFSV2PROC_NOOP,
202 1.25 fvdl NFSV2PROC_NOOP,
203 1.25 fvdl };
204 1.25 fvdl
205 1.25 fvdl /*
206 1.25 fvdl * Maps errno values to nfs error numbers.
207 1.25 fvdl * Use NFSERR_IO as the catch all for ones not specifically defined in
208 1.25 fvdl * RFC 1094.
209 1.25 fvdl */
210 1.238 mgorny static const u_char nfsrv_v2errmap[] = {
211 1.25 fvdl NFSERR_PERM, NFSERR_NOENT, NFSERR_IO, NFSERR_IO, NFSERR_IO,
212 1.25 fvdl NFSERR_NXIO, NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO,
213 1.25 fvdl NFSERR_IO, NFSERR_IO, NFSERR_ACCES, NFSERR_IO, NFSERR_IO,
214 1.25 fvdl NFSERR_IO, NFSERR_EXIST, NFSERR_IO, NFSERR_NODEV, NFSERR_NOTDIR,
215 1.25 fvdl NFSERR_ISDIR, NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO,
216 1.25 fvdl NFSERR_IO, NFSERR_FBIG, NFSERR_NOSPC, NFSERR_IO, NFSERR_ROFS,
217 1.25 fvdl NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO,
218 1.25 fvdl NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO,
219 1.25 fvdl NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO,
220 1.25 fvdl NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO,
221 1.25 fvdl NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO,
222 1.25 fvdl NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO,
223 1.25 fvdl NFSERR_IO, NFSERR_IO, NFSERR_NAMETOL, NFSERR_IO, NFSERR_IO,
224 1.25 fvdl NFSERR_NOTEMPTY, NFSERR_IO, NFSERR_IO, NFSERR_DQUOT, NFSERR_STALE,
225 1.25 fvdl NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO,
226 1.25 fvdl NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO,
227 1.238 mgorny NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO,
228 1.238 mgorny NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO,
229 1.238 mgorny NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO, NFSERR_IO,
230 1.238 mgorny NFSERR_IO, NFSERR_IO, NFSERR_IO
231 1.25 fvdl };
232 1.238 mgorny __CTASSERT(__arraycount(nfsrv_v2errmap) == ELAST);
233 1.25 fvdl
234 1.25 fvdl /*
235 1.25 fvdl * Maps errno values to nfs error numbers.
236 1.25 fvdl * Although it is not obvious whether or not NFS clients really care if
237 1.25 fvdl * a returned error value is in the specified list for the procedure, the
238 1.25 fvdl * safest thing to do is filter them appropriately. For Version 2, the
239 1.25 fvdl * X/Open XNFS document is the only specification that defines error values
240 1.25 fvdl * for each RPC (The RFC simply lists all possible error values for all RPCs),
241 1.25 fvdl * so I have decided to not do this for Version 2.
242 1.25 fvdl * The first entry is the default error return and the rest are the valid
243 1.25 fvdl * errors for that RPC in increasing numeric order.
244 1.25 fvdl */
245 1.90 jdolecek static const short nfsv3err_null[] = {
246 1.25 fvdl 0,
247 1.25 fvdl 0,
248 1.25 fvdl };
249 1.25 fvdl
250 1.90 jdolecek static const short nfsv3err_getattr[] = {
251 1.25 fvdl NFSERR_IO,
252 1.25 fvdl NFSERR_IO,
253 1.25 fvdl NFSERR_STALE,
254 1.25 fvdl NFSERR_BADHANDLE,
255 1.25 fvdl NFSERR_SERVERFAULT,
256 1.25 fvdl 0,
257 1.25 fvdl };
258 1.25 fvdl
259 1.90 jdolecek static const short nfsv3err_setattr[] = {
260 1.25 fvdl NFSERR_IO,
261 1.25 fvdl NFSERR_PERM,
262 1.25 fvdl NFSERR_IO,
263 1.25 fvdl NFSERR_ACCES,
264 1.25 fvdl NFSERR_INVAL,
265 1.25 fvdl NFSERR_NOSPC,
266 1.25 fvdl NFSERR_ROFS,
267 1.25 fvdl NFSERR_DQUOT,
268 1.25 fvdl NFSERR_STALE,
269 1.25 fvdl NFSERR_BADHANDLE,
270 1.25 fvdl NFSERR_NOT_SYNC,
271 1.25 fvdl NFSERR_SERVERFAULT,
272 1.25 fvdl 0,
273 1.25 fvdl };
274 1.25 fvdl
275 1.90 jdolecek static const short nfsv3err_lookup[] = {
276 1.25 fvdl NFSERR_IO,
277 1.25 fvdl NFSERR_NOENT,
278 1.25 fvdl NFSERR_IO,
279 1.25 fvdl NFSERR_ACCES,
280 1.25 fvdl NFSERR_NOTDIR,
281 1.25 fvdl NFSERR_NAMETOL,
282 1.25 fvdl NFSERR_STALE,
283 1.25 fvdl NFSERR_BADHANDLE,
284 1.25 fvdl NFSERR_SERVERFAULT,
285 1.25 fvdl 0,
286 1.25 fvdl };
287 1.25 fvdl
288 1.90 jdolecek static const short nfsv3err_access[] = {
289 1.25 fvdl NFSERR_IO,
290 1.25 fvdl NFSERR_IO,
291 1.25 fvdl NFSERR_STALE,
292 1.25 fvdl NFSERR_BADHANDLE,
293 1.25 fvdl NFSERR_SERVERFAULT,
294 1.25 fvdl 0,
295 1.25 fvdl };
296 1.25 fvdl
297 1.90 jdolecek static const short nfsv3err_readlink[] = {
298 1.25 fvdl NFSERR_IO,
299 1.25 fvdl NFSERR_IO,
300 1.25 fvdl NFSERR_ACCES,
301 1.25 fvdl NFSERR_INVAL,
302 1.25 fvdl NFSERR_STALE,
303 1.25 fvdl NFSERR_BADHANDLE,
304 1.25 fvdl NFSERR_NOTSUPP,
305 1.25 fvdl NFSERR_SERVERFAULT,
306 1.25 fvdl 0,
307 1.25 fvdl };
308 1.25 fvdl
309 1.90 jdolecek static const short nfsv3err_read[] = {
310 1.25 fvdl NFSERR_IO,
311 1.25 fvdl NFSERR_IO,
312 1.25 fvdl NFSERR_NXIO,
313 1.25 fvdl NFSERR_ACCES,
314 1.25 fvdl NFSERR_INVAL,
315 1.25 fvdl NFSERR_STALE,
316 1.25 fvdl NFSERR_BADHANDLE,
317 1.25 fvdl NFSERR_SERVERFAULT,
318 1.67 fvdl NFSERR_JUKEBOX,
319 1.25 fvdl 0,
320 1.25 fvdl };
321 1.25 fvdl
322 1.90 jdolecek static const short nfsv3err_write[] = {
323 1.25 fvdl NFSERR_IO,
324 1.25 fvdl NFSERR_IO,
325 1.25 fvdl NFSERR_ACCES,
326 1.25 fvdl NFSERR_INVAL,
327 1.25 fvdl NFSERR_FBIG,
328 1.25 fvdl NFSERR_NOSPC,
329 1.25 fvdl NFSERR_ROFS,
330 1.25 fvdl NFSERR_DQUOT,
331 1.25 fvdl NFSERR_STALE,
332 1.25 fvdl NFSERR_BADHANDLE,
333 1.25 fvdl NFSERR_SERVERFAULT,
334 1.68 fvdl NFSERR_JUKEBOX,
335 1.25 fvdl 0,
336 1.25 fvdl };
337 1.25 fvdl
338 1.90 jdolecek static const short nfsv3err_create[] = {
339 1.25 fvdl NFSERR_IO,
340 1.25 fvdl NFSERR_IO,
341 1.25 fvdl NFSERR_ACCES,
342 1.25 fvdl NFSERR_EXIST,
343 1.25 fvdl NFSERR_NOTDIR,
344 1.25 fvdl NFSERR_NOSPC,
345 1.25 fvdl NFSERR_ROFS,
346 1.25 fvdl NFSERR_NAMETOL,
347 1.25 fvdl NFSERR_DQUOT,
348 1.25 fvdl NFSERR_STALE,
349 1.25 fvdl NFSERR_BADHANDLE,
350 1.25 fvdl NFSERR_NOTSUPP,
351 1.25 fvdl NFSERR_SERVERFAULT,
352 1.25 fvdl 0,
353 1.25 fvdl };
354 1.25 fvdl
355 1.90 jdolecek static const short nfsv3err_mkdir[] = {
356 1.25 fvdl NFSERR_IO,
357 1.25 fvdl NFSERR_IO,
358 1.25 fvdl NFSERR_ACCES,
359 1.25 fvdl NFSERR_EXIST,
360 1.25 fvdl NFSERR_NOTDIR,
361 1.25 fvdl NFSERR_NOSPC,
362 1.25 fvdl NFSERR_ROFS,
363 1.25 fvdl NFSERR_NAMETOL,
364 1.25 fvdl NFSERR_DQUOT,
365 1.25 fvdl NFSERR_STALE,
366 1.25 fvdl NFSERR_BADHANDLE,
367 1.25 fvdl NFSERR_NOTSUPP,
368 1.25 fvdl NFSERR_SERVERFAULT,
369 1.25 fvdl 0,
370 1.25 fvdl };
371 1.25 fvdl
372 1.90 jdolecek static const short nfsv3err_symlink[] = {
373 1.25 fvdl NFSERR_IO,
374 1.25 fvdl NFSERR_IO,
375 1.25 fvdl NFSERR_ACCES,
376 1.25 fvdl NFSERR_EXIST,
377 1.25 fvdl NFSERR_NOTDIR,
378 1.25 fvdl NFSERR_NOSPC,
379 1.25 fvdl NFSERR_ROFS,
380 1.25 fvdl NFSERR_NAMETOL,
381 1.25 fvdl NFSERR_DQUOT,
382 1.25 fvdl NFSERR_STALE,
383 1.25 fvdl NFSERR_BADHANDLE,
384 1.25 fvdl NFSERR_NOTSUPP,
385 1.25 fvdl NFSERR_SERVERFAULT,
386 1.25 fvdl 0,
387 1.25 fvdl };
388 1.25 fvdl
389 1.90 jdolecek static const short nfsv3err_mknod[] = {
390 1.25 fvdl NFSERR_IO,
391 1.25 fvdl NFSERR_IO,
392 1.25 fvdl NFSERR_ACCES,
393 1.25 fvdl NFSERR_EXIST,
394 1.25 fvdl NFSERR_NOTDIR,
395 1.25 fvdl NFSERR_NOSPC,
396 1.25 fvdl NFSERR_ROFS,
397 1.25 fvdl NFSERR_NAMETOL,
398 1.25 fvdl NFSERR_DQUOT,
399 1.25 fvdl NFSERR_STALE,
400 1.25 fvdl NFSERR_BADHANDLE,
401 1.25 fvdl NFSERR_NOTSUPP,
402 1.25 fvdl NFSERR_SERVERFAULT,
403 1.25 fvdl NFSERR_BADTYPE,
404 1.25 fvdl 0,
405 1.25 fvdl };
406 1.25 fvdl
407 1.90 jdolecek static const short nfsv3err_remove[] = {
408 1.25 fvdl NFSERR_IO,
409 1.25 fvdl NFSERR_NOENT,
410 1.25 fvdl NFSERR_IO,
411 1.25 fvdl NFSERR_ACCES,
412 1.25 fvdl NFSERR_NOTDIR,
413 1.25 fvdl NFSERR_ROFS,
414 1.25 fvdl NFSERR_NAMETOL,
415 1.25 fvdl NFSERR_STALE,
416 1.25 fvdl NFSERR_BADHANDLE,
417 1.25 fvdl NFSERR_SERVERFAULT,
418 1.25 fvdl 0,
419 1.25 fvdl };
420 1.25 fvdl
421 1.90 jdolecek static const short nfsv3err_rmdir[] = {
422 1.25 fvdl NFSERR_IO,
423 1.25 fvdl NFSERR_NOENT,
424 1.25 fvdl NFSERR_IO,
425 1.25 fvdl NFSERR_ACCES,
426 1.25 fvdl NFSERR_EXIST,
427 1.25 fvdl NFSERR_NOTDIR,
428 1.25 fvdl NFSERR_INVAL,
429 1.25 fvdl NFSERR_ROFS,
430 1.25 fvdl NFSERR_NAMETOL,
431 1.25 fvdl NFSERR_NOTEMPTY,
432 1.25 fvdl NFSERR_STALE,
433 1.25 fvdl NFSERR_BADHANDLE,
434 1.25 fvdl NFSERR_NOTSUPP,
435 1.25 fvdl NFSERR_SERVERFAULT,
436 1.25 fvdl 0,
437 1.25 fvdl };
438 1.25 fvdl
439 1.90 jdolecek static const short nfsv3err_rename[] = {
440 1.25 fvdl NFSERR_IO,
441 1.25 fvdl NFSERR_NOENT,
442 1.25 fvdl NFSERR_IO,
443 1.25 fvdl NFSERR_ACCES,
444 1.25 fvdl NFSERR_EXIST,
445 1.25 fvdl NFSERR_XDEV,
446 1.25 fvdl NFSERR_NOTDIR,
447 1.25 fvdl NFSERR_ISDIR,
448 1.25 fvdl NFSERR_INVAL,
449 1.25 fvdl NFSERR_NOSPC,
450 1.25 fvdl NFSERR_ROFS,
451 1.25 fvdl NFSERR_MLINK,
452 1.25 fvdl NFSERR_NAMETOL,
453 1.25 fvdl NFSERR_NOTEMPTY,
454 1.25 fvdl NFSERR_DQUOT,
455 1.25 fvdl NFSERR_STALE,
456 1.25 fvdl NFSERR_BADHANDLE,
457 1.25 fvdl NFSERR_NOTSUPP,
458 1.25 fvdl NFSERR_SERVERFAULT,
459 1.25 fvdl 0,
460 1.25 fvdl };
461 1.25 fvdl
462 1.90 jdolecek static const short nfsv3err_link[] = {
463 1.25 fvdl NFSERR_IO,
464 1.25 fvdl NFSERR_IO,
465 1.25 fvdl NFSERR_ACCES,
466 1.25 fvdl NFSERR_EXIST,
467 1.25 fvdl NFSERR_XDEV,
468 1.25 fvdl NFSERR_NOTDIR,
469 1.25 fvdl NFSERR_INVAL,
470 1.25 fvdl NFSERR_NOSPC,
471 1.25 fvdl NFSERR_ROFS,
472 1.25 fvdl NFSERR_MLINK,
473 1.25 fvdl NFSERR_NAMETOL,
474 1.25 fvdl NFSERR_DQUOT,
475 1.25 fvdl NFSERR_STALE,
476 1.25 fvdl NFSERR_BADHANDLE,
477 1.25 fvdl NFSERR_NOTSUPP,
478 1.25 fvdl NFSERR_SERVERFAULT,
479 1.25 fvdl 0,
480 1.25 fvdl };
481 1.25 fvdl
482 1.90 jdolecek static const short nfsv3err_readdir[] = {
483 1.25 fvdl NFSERR_IO,
484 1.25 fvdl NFSERR_IO,
485 1.25 fvdl NFSERR_ACCES,
486 1.25 fvdl NFSERR_NOTDIR,
487 1.25 fvdl NFSERR_STALE,
488 1.25 fvdl NFSERR_BADHANDLE,
489 1.25 fvdl NFSERR_BAD_COOKIE,
490 1.25 fvdl NFSERR_TOOSMALL,
491 1.25 fvdl NFSERR_SERVERFAULT,
492 1.25 fvdl 0,
493 1.25 fvdl };
494 1.25 fvdl
495 1.90 jdolecek static const short nfsv3err_readdirplus[] = {
496 1.25 fvdl NFSERR_IO,
497 1.25 fvdl NFSERR_IO,
498 1.25 fvdl NFSERR_ACCES,
499 1.25 fvdl NFSERR_NOTDIR,
500 1.25 fvdl NFSERR_STALE,
501 1.25 fvdl NFSERR_BADHANDLE,
502 1.25 fvdl NFSERR_BAD_COOKIE,
503 1.25 fvdl NFSERR_NOTSUPP,
504 1.25 fvdl NFSERR_TOOSMALL,
505 1.25 fvdl NFSERR_SERVERFAULT,
506 1.25 fvdl 0,
507 1.25 fvdl };
508 1.25 fvdl
509 1.90 jdolecek static const short nfsv3err_fsstat[] = {
510 1.25 fvdl NFSERR_IO,
511 1.25 fvdl NFSERR_IO,
512 1.25 fvdl NFSERR_STALE,
513 1.25 fvdl NFSERR_BADHANDLE,
514 1.25 fvdl NFSERR_SERVERFAULT,
515 1.25 fvdl 0,
516 1.25 fvdl };
517 1.25 fvdl
518 1.90 jdolecek static const short nfsv3err_fsinfo[] = {
519 1.25 fvdl NFSERR_STALE,
520 1.25 fvdl NFSERR_STALE,
521 1.25 fvdl NFSERR_BADHANDLE,
522 1.25 fvdl NFSERR_SERVERFAULT,
523 1.25 fvdl 0,
524 1.25 fvdl };
525 1.25 fvdl
526 1.90 jdolecek static const short nfsv3err_pathconf[] = {
527 1.25 fvdl NFSERR_STALE,
528 1.25 fvdl NFSERR_STALE,
529 1.25 fvdl NFSERR_BADHANDLE,
530 1.25 fvdl NFSERR_SERVERFAULT,
531 1.25 fvdl 0,
532 1.25 fvdl };
533 1.25 fvdl
534 1.90 jdolecek static const short nfsv3err_commit[] = {
535 1.25 fvdl NFSERR_IO,
536 1.25 fvdl NFSERR_IO,
537 1.25 fvdl NFSERR_STALE,
538 1.25 fvdl NFSERR_BADHANDLE,
539 1.25 fvdl NFSERR_SERVERFAULT,
540 1.25 fvdl 0,
541 1.25 fvdl };
542 1.25 fvdl
543 1.90 jdolecek static const short * const nfsrv_v3errmap[] = {
544 1.25 fvdl nfsv3err_null,
545 1.25 fvdl nfsv3err_getattr,
546 1.25 fvdl nfsv3err_setattr,
547 1.25 fvdl nfsv3err_lookup,
548 1.25 fvdl nfsv3err_access,
549 1.25 fvdl nfsv3err_readlink,
550 1.25 fvdl nfsv3err_read,
551 1.25 fvdl nfsv3err_write,
552 1.25 fvdl nfsv3err_create,
553 1.25 fvdl nfsv3err_mkdir,
554 1.25 fvdl nfsv3err_symlink,
555 1.25 fvdl nfsv3err_mknod,
556 1.25 fvdl nfsv3err_remove,
557 1.25 fvdl nfsv3err_rmdir,
558 1.25 fvdl nfsv3err_rename,
559 1.25 fvdl nfsv3err_link,
560 1.25 fvdl nfsv3err_readdir,
561 1.25 fvdl nfsv3err_readdirplus,
562 1.25 fvdl nfsv3err_fsstat,
563 1.25 fvdl nfsv3err_fsinfo,
564 1.25 fvdl nfsv3err_pathconf,
565 1.25 fvdl nfsv3err_commit,
566 1.25 fvdl };
567 1.25 fvdl
568 1.12 mycroft extern struct nfsrtt nfsrtt;
569 1.1 cgd
570 1.46 fvdl u_long nfsdirhashmask;
571 1.18 mycroft
572 1.213 dsl int nfs_webnamei(struct nameidata *, struct vnode *, struct proc *);
573 1.43 fvdl
574 1.1 cgd /*
575 1.1 cgd * Create the header for an rpc request packet
576 1.1 cgd * The hsiz is the size of the rest of the nfs request header.
577 1.1 cgd * (just used to decide if a cluster is a good idea)
578 1.1 cgd */
579 1.12 mycroft struct mbuf *
580 1.183 christos nfsm_reqh(struct nfsnode *np, u_long procid, int hsiz, char **bposp)
581 1.12 mycroft {
582 1.75 augustss struct mbuf *mb;
583 1.183 christos char *bpos;
584 1.12 mycroft
585 1.109 matt mb = m_get(M_WAIT, MT_DATA);
586 1.109 matt MCLAIM(mb, &nfs_mowner);
587 1.12 mycroft if (hsiz >= MINCLSIZE)
588 1.109 matt m_clget(mb, M_WAIT);
589 1.12 mycroft mb->m_len = 0;
590 1.183 christos bpos = mtod(mb, void *);
591 1.148 perry
592 1.12 mycroft /* Finally, return values */
593 1.12 mycroft *bposp = bpos;
594 1.12 mycroft return (mb);
595 1.12 mycroft }
596 1.12 mycroft
597 1.12 mycroft /*
598 1.12 mycroft * Build the RPC header and fill in the authorization info.
599 1.12 mycroft * The authorization string argument is only used when the credentials
600 1.12 mycroft * come from outside of the kernel.
601 1.12 mycroft * Returns the head of the mbuf list.
602 1.12 mycroft */
603 1.12 mycroft struct mbuf *
604 1.216 cegger nfsm_rpchead(kauth_cred_t cr, int nmflag, int procid,
605 1.216 cegger int auth_type, int auth_len, char *auth_str, int verf_len,
606 1.216 cegger char *verf_str, struct mbuf *mrest, int mrest_len,
607 1.216 cegger struct mbuf **mbp, uint32_t *xidp)
608 1.1 cgd {
609 1.75 augustss struct mbuf *mb;
610 1.75 augustss u_int32_t *tl;
611 1.183 christos char *bpos;
612 1.75 augustss int i;
613 1.109 matt struct mbuf *mreq;
614 1.12 mycroft int siz, grpsiz, authsiz;
615 1.1 cgd
616 1.12 mycroft authsiz = nfsm_rndup(auth_len);
617 1.109 matt mb = m_gethdr(M_WAIT, MT_DATA);
618 1.109 matt MCLAIM(mb, &nfs_mowner);
619 1.25 fvdl if ((authsiz + 10 * NFSX_UNSIGNED) >= MINCLSIZE) {
620 1.109 matt m_clget(mb, M_WAIT);
621 1.25 fvdl } else if ((authsiz + 10 * NFSX_UNSIGNED) < MHLEN) {
622 1.235 maxv m_align(mb, authsiz + 10 * NFSX_UNSIGNED);
623 1.12 mycroft } else {
624 1.235 maxv m_align(mb, 8 * NFSX_UNSIGNED);
625 1.1 cgd }
626 1.12 mycroft mb->m_len = 0;
627 1.12 mycroft mreq = mb;
628 1.183 christos bpos = mtod(mb, void *);
629 1.12 mycroft
630 1.12 mycroft /*
631 1.12 mycroft * First the RPC header.
632 1.12 mycroft */
633 1.25 fvdl nfsm_build(tl, u_int32_t *, 8 * NFSX_UNSIGNED);
634 1.30 fvdl
635 1.126 yamt *tl++ = *xidp = nfs_getxid();
636 1.1 cgd *tl++ = rpc_call;
637 1.1 cgd *tl++ = rpc_vers;
638 1.179 yamt *tl++ = txdr_unsigned(NFS_PROG);
639 1.179 yamt if (nmflag & NFSMNT_NFSV3)
640 1.179 yamt *tl++ = txdr_unsigned(NFS_VER3);
641 1.179 yamt else
642 1.179 yamt *tl++ = txdr_unsigned(NFS_VER2);
643 1.25 fvdl if (nmflag & NFSMNT_NFSV3)
644 1.25 fvdl *tl++ = txdr_unsigned(procid);
645 1.25 fvdl else
646 1.25 fvdl *tl++ = txdr_unsigned(nfsv2_procid[procid]);
647 1.12 mycroft
648 1.12 mycroft /*
649 1.12 mycroft * And then the authorization cred.
650 1.12 mycroft */
651 1.12 mycroft *tl++ = txdr_unsigned(auth_type);
652 1.12 mycroft *tl = txdr_unsigned(authsiz);
653 1.12 mycroft switch (auth_type) {
654 1.12 mycroft case RPCAUTH_UNIX:
655 1.22 cgd nfsm_build(tl, u_int32_t *, auth_len);
656 1.12 mycroft *tl++ = 0; /* stamp ?? */
657 1.12 mycroft *tl++ = 0; /* NULL hostname */
658 1.162 elad *tl++ = txdr_unsigned(kauth_cred_geteuid(cr));
659 1.162 elad *tl++ = txdr_unsigned(kauth_cred_getegid(cr));
660 1.12 mycroft grpsiz = (auth_len >> 2) - 5;
661 1.12 mycroft *tl++ = txdr_unsigned(grpsiz);
662 1.20 mycroft for (i = 0; i < grpsiz; i++)
663 1.162 elad *tl++ = txdr_unsigned(kauth_cred_group(cr, i)); /* XXX elad review */
664 1.12 mycroft break;
665 1.25 fvdl case RPCAUTH_KERB4:
666 1.12 mycroft siz = auth_len;
667 1.12 mycroft while (siz > 0) {
668 1.12 mycroft if (M_TRAILINGSPACE(mb) == 0) {
669 1.109 matt struct mbuf *mb2;
670 1.109 matt mb2 = m_get(M_WAIT, MT_DATA);
671 1.109 matt MCLAIM(mb2, &nfs_mowner);
672 1.12 mycroft if (siz >= MINCLSIZE)
673 1.109 matt m_clget(mb2, M_WAIT);
674 1.12 mycroft mb->m_next = mb2;
675 1.12 mycroft mb = mb2;
676 1.12 mycroft mb->m_len = 0;
677 1.183 christos bpos = mtod(mb, void *);
678 1.12 mycroft }
679 1.233 riastrad i = uimin(siz, M_TRAILINGSPACE(mb));
680 1.63 perry memcpy(bpos, auth_str, i);
681 1.12 mycroft mb->m_len += i;
682 1.12 mycroft auth_str += i;
683 1.12 mycroft bpos += i;
684 1.12 mycroft siz -= i;
685 1.12 mycroft }
686 1.12 mycroft if ((siz = (nfsm_rndup(auth_len) - auth_len)) > 0) {
687 1.12 mycroft for (i = 0; i < siz; i++)
688 1.12 mycroft *bpos++ = '\0';
689 1.12 mycroft mb->m_len += siz;
690 1.12 mycroft }
691 1.12 mycroft break;
692 1.12 mycroft };
693 1.25 fvdl
694 1.25 fvdl /*
695 1.25 fvdl * And the verifier...
696 1.25 fvdl */
697 1.25 fvdl nfsm_build(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
698 1.25 fvdl if (verf_str) {
699 1.25 fvdl *tl++ = txdr_unsigned(RPCAUTH_KERB4);
700 1.25 fvdl *tl = txdr_unsigned(verf_len);
701 1.25 fvdl siz = verf_len;
702 1.25 fvdl while (siz > 0) {
703 1.25 fvdl if (M_TRAILINGSPACE(mb) == 0) {
704 1.109 matt struct mbuf *mb2;
705 1.109 matt mb2 = m_get(M_WAIT, MT_DATA);
706 1.109 matt MCLAIM(mb2, &nfs_mowner);
707 1.25 fvdl if (siz >= MINCLSIZE)
708 1.109 matt m_clget(mb2, M_WAIT);
709 1.25 fvdl mb->m_next = mb2;
710 1.25 fvdl mb = mb2;
711 1.25 fvdl mb->m_len = 0;
712 1.183 christos bpos = mtod(mb, void *);
713 1.25 fvdl }
714 1.233 riastrad i = uimin(siz, M_TRAILINGSPACE(mb));
715 1.63 perry memcpy(bpos, verf_str, i);
716 1.25 fvdl mb->m_len += i;
717 1.25 fvdl verf_str += i;
718 1.25 fvdl bpos += i;
719 1.25 fvdl siz -= i;
720 1.25 fvdl }
721 1.25 fvdl if ((siz = (nfsm_rndup(verf_len) - verf_len)) > 0) {
722 1.25 fvdl for (i = 0; i < siz; i++)
723 1.25 fvdl *bpos++ = '\0';
724 1.25 fvdl mb->m_len += siz;
725 1.25 fvdl }
726 1.25 fvdl } else {
727 1.25 fvdl *tl++ = txdr_unsigned(RPCAUTH_NULL);
728 1.25 fvdl *tl = 0;
729 1.25 fvdl }
730 1.12 mycroft mb->m_next = mrest;
731 1.25 fvdl mreq->m_pkthdr.len = authsiz + 10 * NFSX_UNSIGNED + mrest_len;
732 1.228 ozaki m_reset_rcvif(mreq);
733 1.12 mycroft *mbp = mb;
734 1.1 cgd return (mreq);
735 1.1 cgd }
736 1.1 cgd
737 1.1 cgd /*
738 1.1 cgd * copies mbuf chain to the uio scatter/gather list
739 1.1 cgd */
740 1.24 christos int
741 1.214 dsl nfsm_mbuftouio(struct mbuf **mrep, struct uio *uiop, int siz, char **dpos)
742 1.1 cgd {
743 1.75 augustss char *mbufcp, *uiocp;
744 1.75 augustss int xfer, left, len;
745 1.75 augustss struct mbuf *mp;
746 1.1 cgd long uiosiz, rem;
747 1.1 cgd int error = 0;
748 1.1 cgd
749 1.1 cgd mp = *mrep;
750 1.1 cgd mbufcp = *dpos;
751 1.183 christos len = mtod(mp, char *) + mp->m_len - mbufcp;
752 1.1 cgd rem = nfsm_rndup(siz)-siz;
753 1.1 cgd while (siz > 0) {
754 1.1 cgd if (uiop->uio_iovcnt <= 0 || uiop->uio_iov == NULL)
755 1.1 cgd return (EFBIG);
756 1.1 cgd left = uiop->uio_iov->iov_len;
757 1.1 cgd uiocp = uiop->uio_iov->iov_base;
758 1.1 cgd if (left > siz)
759 1.1 cgd left = siz;
760 1.1 cgd uiosiz = left;
761 1.1 cgd while (left > 0) {
762 1.1 cgd while (len == 0) {
763 1.1 cgd mp = mp->m_next;
764 1.1 cgd if (mp == NULL)
765 1.1 cgd return (EBADRPC);
766 1.183 christos mbufcp = mtod(mp, void *);
767 1.1 cgd len = mp->m_len;
768 1.1 cgd }
769 1.1 cgd xfer = (left > len) ? len : left;
770 1.158 yamt error = copyout_vmspace(uiop->uio_vmspace, mbufcp,
771 1.158 yamt uiocp, xfer);
772 1.158 yamt if (error) {
773 1.158 yamt return error;
774 1.158 yamt }
775 1.1 cgd left -= xfer;
776 1.1 cgd len -= xfer;
777 1.1 cgd mbufcp += xfer;
778 1.1 cgd uiocp += xfer;
779 1.1 cgd uiop->uio_offset += xfer;
780 1.1 cgd uiop->uio_resid -= xfer;
781 1.1 cgd }
782 1.1 cgd if (uiop->uio_iov->iov_len <= siz) {
783 1.1 cgd uiop->uio_iovcnt--;
784 1.1 cgd uiop->uio_iov++;
785 1.1 cgd } else {
786 1.95 lukem uiop->uio_iov->iov_base =
787 1.183 christos (char *)uiop->uio_iov->iov_base + uiosiz;
788 1.1 cgd uiop->uio_iov->iov_len -= uiosiz;
789 1.1 cgd }
790 1.1 cgd siz -= uiosiz;
791 1.1 cgd }
792 1.1 cgd *dpos = mbufcp;
793 1.1 cgd *mrep = mp;
794 1.1 cgd if (rem > 0) {
795 1.1 cgd if (len < rem)
796 1.1 cgd error = nfs_adv(mrep, dpos, rem, len);
797 1.1 cgd else
798 1.1 cgd *dpos += rem;
799 1.1 cgd }
800 1.1 cgd return (error);
801 1.1 cgd }
802 1.1 cgd
803 1.1 cgd /*
804 1.29 fvdl * copies a uio scatter/gather list to an mbuf chain.
805 1.29 fvdl * NOTE: can ony handle iovcnt == 1
806 1.1 cgd */
807 1.24 christos int
808 1.214 dsl nfsm_uiotombuf(struct uio *uiop, struct mbuf **mq, int siz, char **bpos)
809 1.1 cgd {
810 1.75 augustss char *uiocp;
811 1.75 augustss struct mbuf *mp, *mp2;
812 1.75 augustss int xfer, left, mlen;
813 1.1 cgd int uiosiz, clflg, rem;
814 1.1 cgd char *cp;
815 1.158 yamt int error;
816 1.1 cgd
817 1.29 fvdl #ifdef DIAGNOSTIC
818 1.29 fvdl if (uiop->uio_iovcnt != 1)
819 1.29 fvdl panic("nfsm_uiotombuf: iovcnt != 1");
820 1.29 fvdl #endif
821 1.29 fvdl
822 1.1 cgd if (siz > MLEN) /* or should it >= MCLBYTES ?? */
823 1.1 cgd clflg = 1;
824 1.1 cgd else
825 1.1 cgd clflg = 0;
826 1.1 cgd rem = nfsm_rndup(siz)-siz;
827 1.12 mycroft mp = mp2 = *mq;
828 1.1 cgd while (siz > 0) {
829 1.1 cgd left = uiop->uio_iov->iov_len;
830 1.1 cgd uiocp = uiop->uio_iov->iov_base;
831 1.1 cgd if (left > siz)
832 1.1 cgd left = siz;
833 1.1 cgd uiosiz = left;
834 1.1 cgd while (left > 0) {
835 1.12 mycroft mlen = M_TRAILINGSPACE(mp);
836 1.12 mycroft if (mlen == 0) {
837 1.109 matt mp = m_get(M_WAIT, MT_DATA);
838 1.109 matt MCLAIM(mp, &nfs_mowner);
839 1.12 mycroft if (clflg)
840 1.109 matt m_clget(mp, M_WAIT);
841 1.12 mycroft mp->m_len = 0;
842 1.12 mycroft mp2->m_next = mp;
843 1.12 mycroft mp2 = mp;
844 1.12 mycroft mlen = M_TRAILINGSPACE(mp);
845 1.12 mycroft }
846 1.12 mycroft xfer = (left > mlen) ? mlen : left;
847 1.183 christos cp = mtod(mp, char *) + mp->m_len;
848 1.158 yamt error = copyin_vmspace(uiop->uio_vmspace, uiocp, cp,
849 1.158 yamt xfer);
850 1.158 yamt if (error) {
851 1.158 yamt /* XXX */
852 1.158 yamt }
853 1.12 mycroft mp->m_len += xfer;
854 1.1 cgd left -= xfer;
855 1.1 cgd uiocp += xfer;
856 1.1 cgd uiop->uio_offset += xfer;
857 1.1 cgd uiop->uio_resid -= xfer;
858 1.1 cgd }
859 1.183 christos uiop->uio_iov->iov_base = (char *)uiop->uio_iov->iov_base +
860 1.95 lukem uiosiz;
861 1.29 fvdl uiop->uio_iov->iov_len -= uiosiz;
862 1.1 cgd siz -= uiosiz;
863 1.1 cgd }
864 1.1 cgd if (rem > 0) {
865 1.12 mycroft if (rem > M_TRAILINGSPACE(mp)) {
866 1.109 matt mp = m_get(M_WAIT, MT_DATA);
867 1.109 matt MCLAIM(mp, &nfs_mowner);
868 1.1 cgd mp->m_len = 0;
869 1.1 cgd mp2->m_next = mp;
870 1.1 cgd }
871 1.183 christos cp = mtod(mp, char *) + mp->m_len;
872 1.1 cgd for (left = 0; left < rem; left++)
873 1.1 cgd *cp++ = '\0';
874 1.1 cgd mp->m_len += rem;
875 1.1 cgd *bpos = cp;
876 1.1 cgd } else
877 1.183 christos *bpos = mtod(mp, char *) + mp->m_len;
878 1.1 cgd *mq = mp;
879 1.1 cgd return (0);
880 1.1 cgd }
881 1.1 cgd
882 1.1 cgd /*
883 1.39 fvdl * Get at least "siz" bytes of correctly aligned data.
884 1.39 fvdl * When called the mbuf pointers are not necessarily correct,
885 1.39 fvdl * dsosp points to what ought to be in m_data and left contains
886 1.148 perry * what ought to be in m_len.
887 1.12 mycroft * This is used by the macros nfsm_dissect and nfsm_dissecton for tough
888 1.1 cgd * cases. (The macros use the vars. dpos and dpos2)
889 1.1 cgd */
890 1.24 christos int
891 1.214 dsl nfsm_disct(struct mbuf **mdp, char **dposp, int siz, int left, char **cp2)
892 1.1 cgd {
893 1.75 augustss struct mbuf *m1, *m2;
894 1.39 fvdl struct mbuf *havebuf = NULL;
895 1.183 christos char *src = *dposp;
896 1.183 christos char *dst;
897 1.39 fvdl int len;
898 1.39 fvdl
899 1.39 fvdl #ifdef DEBUG
900 1.39 fvdl if (left < 0)
901 1.148 perry panic("nfsm_disct: left < 0");
902 1.39 fvdl #endif
903 1.39 fvdl m1 = *mdp;
904 1.39 fvdl /*
905 1.39 fvdl * Skip through the mbuf chain looking for an mbuf with
906 1.39 fvdl * some data. If the first mbuf found has enough data
907 1.39 fvdl * and it is correctly aligned return it.
908 1.39 fvdl */
909 1.1 cgd while (left == 0) {
910 1.39 fvdl havebuf = m1;
911 1.39 fvdl *mdp = m1 = m1->m_next;
912 1.39 fvdl if (m1 == NULL)
913 1.1 cgd return (EBADRPC);
914 1.183 christos src = mtod(m1, void *);
915 1.39 fvdl left = m1->m_len;
916 1.39 fvdl /*
917 1.39 fvdl * If we start a new mbuf and it is big enough
918 1.39 fvdl * and correctly aligned just return it, don't
919 1.39 fvdl * do any pull up.
920 1.39 fvdl */
921 1.39 fvdl if (left >= siz && nfsm_aligned(src)) {
922 1.39 fvdl *cp2 = src;
923 1.39 fvdl *dposp = src + siz;
924 1.39 fvdl return (0);
925 1.39 fvdl }
926 1.1 cgd }
927 1.201 yamt if ((m1->m_flags & M_EXT) != 0) {
928 1.201 yamt if (havebuf && M_TRAILINGSPACE(havebuf) >= siz &&
929 1.201 yamt nfsm_aligned(mtod(havebuf, char *) + havebuf->m_len)) {
930 1.201 yamt /*
931 1.201 yamt * If the first mbuf with data has external data
932 1.201 yamt * and there is a previous mbuf with some trailing
933 1.201 yamt * space, use it to move the data into.
934 1.39 fvdl */
935 1.39 fvdl m2 = m1;
936 1.39 fvdl *mdp = m1 = havebuf;
937 1.201 yamt *cp2 = mtod(m1, char *) + m1->m_len;
938 1.201 yamt } else if (havebuf) {
939 1.39 fvdl /*
940 1.39 fvdl * If the first mbuf has a external data
941 1.39 fvdl * and there is no previous empty mbuf
942 1.39 fvdl * allocate a new mbuf and move the external
943 1.148 perry * data to the new mbuf. Also make the first
944 1.39 fvdl * mbuf look empty.
945 1.39 fvdl */
946 1.201 yamt m2 = m1;
947 1.201 yamt *mdp = m1 = m_get(M_WAIT, MT_DATA);
948 1.201 yamt MCLAIM(m1, m2->m_owner);
949 1.201 yamt if ((m2->m_flags & M_PKTHDR) != 0) {
950 1.234 maxv m_move_pkthdr(m1, m2);
951 1.201 yamt }
952 1.201 yamt if (havebuf) {
953 1.201 yamt havebuf->m_next = m1;
954 1.201 yamt }
955 1.201 yamt m1->m_next = m2;
956 1.201 yamt MRESETDATA(m1);
957 1.201 yamt m1->m_len = 0;
958 1.39 fvdl m2->m_data = src;
959 1.39 fvdl m2->m_len = left;
960 1.201 yamt *cp2 = mtod(m1, char *);
961 1.201 yamt } else {
962 1.201 yamt struct mbuf **nextp = &m1->m_next;
963 1.201 yamt
964 1.201 yamt m1->m_len -= left;
965 1.201 yamt do {
966 1.201 yamt m2 = m_get(M_WAIT, MT_DATA);
967 1.201 yamt MCLAIM(m2, m1->m_owner);
968 1.201 yamt if (left >= MINCLSIZE) {
969 1.201 yamt MCLGET(m2, M_WAIT);
970 1.201 yamt }
971 1.201 yamt m2->m_next = *nextp;
972 1.201 yamt *nextp = m2;
973 1.201 yamt nextp = &m2->m_next;
974 1.201 yamt len = (m2->m_flags & M_EXT) != 0 ?
975 1.201 yamt MCLBYTES : MLEN;
976 1.201 yamt if (len > left) {
977 1.201 yamt len = left;
978 1.201 yamt }
979 1.201 yamt memcpy(mtod(m2, char *), src, len);
980 1.201 yamt m2->m_len = len;
981 1.201 yamt src += len;
982 1.201 yamt left -= len;
983 1.201 yamt } while (left > 0);
984 1.201 yamt *mdp = m1 = m1->m_next;
985 1.201 yamt m2 = m1->m_next;
986 1.201 yamt *cp2 = mtod(m1, char *);
987 1.1 cgd }
988 1.39 fvdl } else {
989 1.39 fvdl /*
990 1.39 fvdl * If the first mbuf has no external data
991 1.39 fvdl * move the data to the front of the mbuf.
992 1.39 fvdl */
993 1.201 yamt MRESETDATA(m1);
994 1.201 yamt dst = mtod(m1, char *);
995 1.201 yamt if (dst != src) {
996 1.63 perry memmove(dst, src, left);
997 1.201 yamt }
998 1.39 fvdl m1->m_len = left;
999 1.39 fvdl m2 = m1->m_next;
1000 1.201 yamt *cp2 = m1->m_data;
1001 1.1 cgd }
1002 1.201 yamt *dposp = *cp2 + siz;
1003 1.39 fvdl /*
1004 1.39 fvdl * Loop through mbufs pulling data up into first mbuf until
1005 1.39 fvdl * the first mbuf is full or there is no more data to
1006 1.39 fvdl * pullup.
1007 1.39 fvdl */
1008 1.201 yamt dst = mtod(m1, char *) + m1->m_len;
1009 1.129 itojun while ((len = M_TRAILINGSPACE(m1)) != 0 && m2) {
1010 1.233 riastrad if ((len = uimin(len, m2->m_len)) != 0) {
1011 1.201 yamt memcpy(dst, mtod(m2, char *), len);
1012 1.201 yamt }
1013 1.39 fvdl m1->m_len += len;
1014 1.39 fvdl dst += len;
1015 1.39 fvdl m2->m_data += len;
1016 1.39 fvdl m2->m_len -= len;
1017 1.39 fvdl m2 = m2->m_next;
1018 1.39 fvdl }
1019 1.39 fvdl if (m1->m_len < siz)
1020 1.39 fvdl return (EBADRPC);
1021 1.1 cgd return (0);
1022 1.1 cgd }
1023 1.1 cgd
1024 1.1 cgd /*
1025 1.1 cgd * Advance the position in the mbuf chain.
1026 1.1 cgd */
1027 1.24 christos int
1028 1.214 dsl nfs_adv(struct mbuf **mdp, char **dposp, int offs, int left)
1029 1.1 cgd {
1030 1.75 augustss struct mbuf *m;
1031 1.75 augustss int s;
1032 1.1 cgd
1033 1.1 cgd m = *mdp;
1034 1.1 cgd s = left;
1035 1.1 cgd while (s < offs) {
1036 1.1 cgd offs -= s;
1037 1.1 cgd m = m->m_next;
1038 1.1 cgd if (m == NULL)
1039 1.1 cgd return (EBADRPC);
1040 1.1 cgd s = m->m_len;
1041 1.1 cgd }
1042 1.1 cgd *mdp = m;
1043 1.183 christos *dposp = mtod(m, char *) + offs;
1044 1.1 cgd return (0);
1045 1.1 cgd }
1046 1.1 cgd
1047 1.1 cgd /*
1048 1.1 cgd * Copy a string into mbufs for the hard cases...
1049 1.1 cgd */
1050 1.24 christos int
1051 1.214 dsl nfsm_strtmbuf(struct mbuf **mb, char **bpos, const char *cp, long siz)
1052 1.1 cgd {
1053 1.75 augustss struct mbuf *m1 = NULL, *m2;
1054 1.1 cgd long left, xfer, len, tlen;
1055 1.22 cgd u_int32_t *tl;
1056 1.1 cgd int putsize;
1057 1.1 cgd
1058 1.1 cgd putsize = 1;
1059 1.1 cgd m2 = *mb;
1060 1.12 mycroft left = M_TRAILINGSPACE(m2);
1061 1.1 cgd if (left > 0) {
1062 1.22 cgd tl = ((u_int32_t *)(*bpos));
1063 1.1 cgd *tl++ = txdr_unsigned(siz);
1064 1.1 cgd putsize = 0;
1065 1.1 cgd left -= NFSX_UNSIGNED;
1066 1.1 cgd m2->m_len += NFSX_UNSIGNED;
1067 1.1 cgd if (left > 0) {
1068 1.183 christos memcpy((void *) tl, cp, left);
1069 1.1 cgd siz -= left;
1070 1.1 cgd cp += left;
1071 1.1 cgd m2->m_len += left;
1072 1.1 cgd left = 0;
1073 1.1 cgd }
1074 1.1 cgd }
1075 1.12 mycroft /* Loop around adding mbufs */
1076 1.1 cgd while (siz > 0) {
1077 1.109 matt m1 = m_get(M_WAIT, MT_DATA);
1078 1.109 matt MCLAIM(m1, &nfs_mowner);
1079 1.1 cgd if (siz > MLEN)
1080 1.109 matt m_clget(m1, M_WAIT);
1081 1.1 cgd m1->m_len = NFSMSIZ(m1);
1082 1.1 cgd m2->m_next = m1;
1083 1.1 cgd m2 = m1;
1084 1.22 cgd tl = mtod(m1, u_int32_t *);
1085 1.1 cgd tlen = 0;
1086 1.1 cgd if (putsize) {
1087 1.1 cgd *tl++ = txdr_unsigned(siz);
1088 1.1 cgd m1->m_len -= NFSX_UNSIGNED;
1089 1.1 cgd tlen = NFSX_UNSIGNED;
1090 1.1 cgd putsize = 0;
1091 1.1 cgd }
1092 1.1 cgd if (siz < m1->m_len) {
1093 1.1 cgd len = nfsm_rndup(siz);
1094 1.1 cgd xfer = siz;
1095 1.1 cgd if (xfer < len)
1096 1.1 cgd *(tl+(xfer>>2)) = 0;
1097 1.1 cgd } else {
1098 1.1 cgd xfer = len = m1->m_len;
1099 1.1 cgd }
1100 1.183 christos memcpy((void *) tl, cp, xfer);
1101 1.1 cgd m1->m_len = len+tlen;
1102 1.1 cgd siz -= xfer;
1103 1.1 cgd cp += xfer;
1104 1.1 cgd }
1105 1.1 cgd *mb = m1;
1106 1.183 christos *bpos = mtod(m1, char *) + m1->m_len;
1107 1.1 cgd return (0);
1108 1.1 cgd }
1109 1.1 cgd
1110 1.49 fvdl /*
1111 1.49 fvdl * Directory caching routines. They work as follows:
1112 1.49 fvdl * - a cache is maintained per VDIR nfsnode.
1113 1.49 fvdl * - for each offset cookie that is exported to userspace, and can
1114 1.49 fvdl * thus be thrown back at us as an offset to VOP_READDIR, store
1115 1.49 fvdl * information in the cache.
1116 1.49 fvdl * - cached are:
1117 1.49 fvdl * - cookie itself
1118 1.49 fvdl * - blocknumber (essentially just a search key in the buffer cache)
1119 1.49 fvdl * - entry number in block.
1120 1.49 fvdl * - offset cookie of block in which this entry is stored
1121 1.49 fvdl * - 32 bit cookie if NFSMNT_XLATECOOKIE is used.
1122 1.49 fvdl * - entries are looked up in a hash table
1123 1.49 fvdl * - also maintained is an LRU list of entries, used to determine
1124 1.49 fvdl * which ones to delete if the cache grows too large.
1125 1.49 fvdl * - if 32 <-> 64 translation mode is requested for a filesystem,
1126 1.49 fvdl * the cache also functions as a translation table
1127 1.49 fvdl * - in the translation case, invalidating the cache does not mean
1128 1.49 fvdl * flushing it, but just marking entries as invalid, except for
1129 1.49 fvdl * the <64bit cookie, 32bitcookie> pair which is still valid, to
1130 1.49 fvdl * still be able to use the cache as a translation table.
1131 1.49 fvdl * - 32 bit cookies are uniquely created by combining the hash table
1132 1.49 fvdl * entry value, and one generation count per hash table entry,
1133 1.49 fvdl * incremented each time an entry is appended to the chain.
1134 1.49 fvdl * - the cache is invalidated each time a direcory is modified
1135 1.49 fvdl * - sanity checks are also done; if an entry in a block turns
1136 1.49 fvdl * out not to have a matching cookie, the cache is invalidated
1137 1.49 fvdl * and a new block starting from the wanted offset is fetched from
1138 1.49 fvdl * the server.
1139 1.49 fvdl * - directory entries as read from the server are extended to contain
1140 1.49 fvdl * the 64bit and, optionally, the 32bit cookies, for sanity checking
1141 1.49 fvdl * the cache and exporting them to userspace through the cookie
1142 1.49 fvdl * argument to VOP_READDIR.
1143 1.49 fvdl */
1144 1.49 fvdl
1145 1.46 fvdl u_long
1146 1.214 dsl nfs_dirhash(off_t off)
1147 1.46 fvdl {
1148 1.46 fvdl int i;
1149 1.46 fvdl char *cp = (char *)&off;
1150 1.46 fvdl u_long sum = 0L;
1151 1.46 fvdl
1152 1.46 fvdl for (i = 0 ; i < sizeof (off); i++)
1153 1.46 fvdl sum += *cp++;
1154 1.46 fvdl
1155 1.46 fvdl return sum;
1156 1.46 fvdl }
1157 1.46 fvdl
1158 1.221 rmind #define _NFSDC_MTX(np) (NFSTOV(np)->v_interlock)
1159 1.195 ad #define NFSDC_LOCK(np) mutex_enter(_NFSDC_MTX(np))
1160 1.195 ad #define NFSDC_UNLOCK(np) mutex_exit(_NFSDC_MTX(np))
1161 1.195 ad #define NFSDC_ASSERT_LOCKED(np) KASSERT(mutex_owned(_NFSDC_MTX(np)))
1162 1.135 yamt
1163 1.49 fvdl void
1164 1.214 dsl nfs_initdircache(struct vnode *vp)
1165 1.49 fvdl {
1166 1.49 fvdl struct nfsnode *np = VTONFS(vp);
1167 1.135 yamt struct nfsdirhashhead *dircache;
1168 1.120 yamt
1169 1.202 ad dircache = hashinit(NFS_DIRHASHSIZ, HASH_LIST, true,
1170 1.202 ad &nfsdirhashmask);
1171 1.49 fvdl
1172 1.135 yamt NFSDC_LOCK(np);
1173 1.135 yamt if (np->n_dircache == NULL) {
1174 1.135 yamt np->n_dircachesize = 0;
1175 1.135 yamt np->n_dircache = dircache;
1176 1.135 yamt dircache = NULL;
1177 1.135 yamt TAILQ_INIT(&np->n_dirchain);
1178 1.135 yamt }
1179 1.135 yamt NFSDC_UNLOCK(np);
1180 1.135 yamt if (dircache)
1181 1.202 ad hashdone(dircache, HASH_LIST, nfsdirhashmask);
1182 1.120 yamt }
1183 1.120 yamt
1184 1.120 yamt void
1185 1.214 dsl nfs_initdirxlatecookie(struct vnode *vp)
1186 1.120 yamt {
1187 1.120 yamt struct nfsnode *np = VTONFS(vp);
1188 1.135 yamt unsigned *dirgens;
1189 1.120 yamt
1190 1.120 yamt KASSERT(VFSTONFS(vp->v_mount)->nm_flag & NFSMNT_XLATECOOKIE);
1191 1.120 yamt
1192 1.196 yamt dirgens = kmem_zalloc(NFS_DIRHASHSIZ * sizeof(unsigned), KM_SLEEP);
1193 1.135 yamt NFSDC_LOCK(np);
1194 1.135 yamt if (np->n_dirgens == NULL) {
1195 1.135 yamt np->n_dirgens = dirgens;
1196 1.135 yamt dirgens = NULL;
1197 1.135 yamt }
1198 1.135 yamt NFSDC_UNLOCK(np);
1199 1.135 yamt if (dirgens)
1200 1.196 yamt kmem_free(dirgens, NFS_DIRHASHSIZ * sizeof(unsigned));
1201 1.135 yamt }
1202 1.135 yamt
1203 1.135 yamt static const struct nfsdircache dzero;
1204 1.135 yamt
1205 1.213 dsl static void nfs_unlinkdircache(struct nfsnode *np, struct nfsdircache *);
1206 1.213 dsl static void nfs_putdircache_unlocked(struct nfsnode *,
1207 1.213 dsl struct nfsdircache *);
1208 1.135 yamt
1209 1.135 yamt static void
1210 1.214 dsl nfs_unlinkdircache(struct nfsnode *np, struct nfsdircache *ndp)
1211 1.135 yamt {
1212 1.135 yamt
1213 1.135 yamt NFSDC_ASSERT_LOCKED(np);
1214 1.135 yamt KASSERT(ndp != &dzero);
1215 1.135 yamt
1216 1.135 yamt if (LIST_NEXT(ndp, dc_hash) == (void *)-1)
1217 1.135 yamt return;
1218 1.135 yamt
1219 1.135 yamt TAILQ_REMOVE(&np->n_dirchain, ndp, dc_chain);
1220 1.135 yamt LIST_REMOVE(ndp, dc_hash);
1221 1.135 yamt LIST_NEXT(ndp, dc_hash) = (void *)-1; /* mark as unlinked */
1222 1.135 yamt
1223 1.135 yamt nfs_putdircache_unlocked(np, ndp);
1224 1.135 yamt }
1225 1.135 yamt
1226 1.135 yamt void
1227 1.214 dsl nfs_putdircache(struct nfsnode *np, struct nfsdircache *ndp)
1228 1.135 yamt {
1229 1.135 yamt int ref;
1230 1.135 yamt
1231 1.135 yamt if (ndp == &dzero)
1232 1.135 yamt return;
1233 1.135 yamt
1234 1.135 yamt KASSERT(ndp->dc_refcnt > 0);
1235 1.135 yamt NFSDC_LOCK(np);
1236 1.135 yamt ref = --ndp->dc_refcnt;
1237 1.135 yamt NFSDC_UNLOCK(np);
1238 1.135 yamt
1239 1.135 yamt if (ref == 0)
1240 1.196 yamt kmem_free(ndp, sizeof(*ndp));
1241 1.49 fvdl }
1242 1.49 fvdl
1243 1.135 yamt static void
1244 1.177 yamt nfs_putdircache_unlocked(struct nfsnode *np, struct nfsdircache *ndp)
1245 1.135 yamt {
1246 1.135 yamt int ref;
1247 1.135 yamt
1248 1.135 yamt NFSDC_ASSERT_LOCKED(np);
1249 1.135 yamt
1250 1.135 yamt if (ndp == &dzero)
1251 1.135 yamt return;
1252 1.135 yamt
1253 1.135 yamt KASSERT(ndp->dc_refcnt > 0);
1254 1.135 yamt ref = --ndp->dc_refcnt;
1255 1.135 yamt if (ref == 0)
1256 1.196 yamt kmem_free(ndp, sizeof(*ndp));
1257 1.135 yamt }
1258 1.46 fvdl
1259 1.46 fvdl struct nfsdircache *
1260 1.214 dsl nfs_searchdircache(struct vnode *vp, off_t off, int do32, int *hashent)
1261 1.49 fvdl {
1262 1.49 fvdl struct nfsdirhashhead *ndhp;
1263 1.49 fvdl struct nfsdircache *ndp = NULL;
1264 1.49 fvdl struct nfsnode *np = VTONFS(vp);
1265 1.49 fvdl unsigned ent;
1266 1.49 fvdl
1267 1.49 fvdl /*
1268 1.49 fvdl * Zero is always a valid cookie.
1269 1.49 fvdl */
1270 1.49 fvdl if (off == 0)
1271 1.149 christos /* XXXUNCONST */
1272 1.149 christos return (struct nfsdircache *)__UNCONST(&dzero);
1273 1.49 fvdl
1274 1.134 yamt if (!np->n_dircache)
1275 1.134 yamt return NULL;
1276 1.134 yamt
1277 1.49 fvdl /*
1278 1.49 fvdl * We use a 32bit cookie as search key, directly reconstruct
1279 1.49 fvdl * the hashentry. Else use the hashfunction.
1280 1.49 fvdl */
1281 1.49 fvdl if (do32) {
1282 1.49 fvdl ent = (u_int32_t)off >> 24;
1283 1.49 fvdl if (ent >= NFS_DIRHASHSIZ)
1284 1.49 fvdl return NULL;
1285 1.49 fvdl ndhp = &np->n_dircache[ent];
1286 1.49 fvdl } else {
1287 1.49 fvdl ndhp = NFSDIRHASH(np, off);
1288 1.49 fvdl }
1289 1.49 fvdl
1290 1.49 fvdl if (hashent)
1291 1.49 fvdl *hashent = (int)(ndhp - np->n_dircache);
1292 1.135 yamt
1293 1.135 yamt NFSDC_LOCK(np);
1294 1.49 fvdl if (do32) {
1295 1.113 yamt LIST_FOREACH(ndp, ndhp, dc_hash) {
1296 1.49 fvdl if (ndp->dc_cookie32 == (u_int32_t)off) {
1297 1.49 fvdl /*
1298 1.49 fvdl * An invalidated entry will become the
1299 1.49 fvdl * start of a new block fetched from
1300 1.49 fvdl * the server.
1301 1.49 fvdl */
1302 1.135 yamt if (ndp->dc_flags & NFSDC_INVALID) {
1303 1.49 fvdl ndp->dc_blkcookie = ndp->dc_cookie;
1304 1.49 fvdl ndp->dc_entry = 0;
1305 1.135 yamt ndp->dc_flags &= ~NFSDC_INVALID;
1306 1.49 fvdl }
1307 1.49 fvdl break;
1308 1.49 fvdl }
1309 1.49 fvdl }
1310 1.49 fvdl } else {
1311 1.113 yamt LIST_FOREACH(ndp, ndhp, dc_hash) {
1312 1.49 fvdl if (ndp->dc_cookie == off)
1313 1.49 fvdl break;
1314 1.113 yamt }
1315 1.49 fvdl }
1316 1.135 yamt if (ndp != NULL)
1317 1.135 yamt ndp->dc_refcnt++;
1318 1.135 yamt NFSDC_UNLOCK(np);
1319 1.49 fvdl return ndp;
1320 1.49 fvdl }
1321 1.49 fvdl
1322 1.49 fvdl
1323 1.49 fvdl struct nfsdircache *
1324 1.171 christos nfs_enterdircache(struct vnode *vp, off_t off, off_t blkoff, int en,
1325 1.177 yamt daddr_t blkno)
1326 1.46 fvdl {
1327 1.46 fvdl struct nfsnode *np = VTONFS(vp);
1328 1.46 fvdl struct nfsdirhashhead *ndhp;
1329 1.135 yamt struct nfsdircache *ndp = NULL;
1330 1.135 yamt struct nfsdircache *newndp = NULL;
1331 1.49 fvdl struct nfsmount *nmp = VFSTONFS(vp->v_mount);
1332 1.161 christos int hashent = 0, gen, overwrite; /* XXX: GCC */
1333 1.46 fvdl
1334 1.135 yamt /*
1335 1.135 yamt * XXX refuse entries for offset 0. amd(8) erroneously sets
1336 1.135 yamt * cookie 0 for the '.' entry, making this necessary. This
1337 1.135 yamt * isn't so bad, as 0 is a special case anyway.
1338 1.135 yamt */
1339 1.135 yamt if (off == 0)
1340 1.149 christos /* XXXUNCONST */
1341 1.149 christos return (struct nfsdircache *)__UNCONST(&dzero);
1342 1.135 yamt
1343 1.49 fvdl if (!np->n_dircache)
1344 1.49 fvdl /*
1345 1.49 fvdl * XXX would like to do this in nfs_nget but vtype
1346 1.49 fvdl * isn't known at that time.
1347 1.49 fvdl */
1348 1.49 fvdl nfs_initdircache(vp);
1349 1.50 fvdl
1350 1.120 yamt if ((nmp->nm_flag & NFSMNT_XLATECOOKIE) && !np->n_dirgens)
1351 1.120 yamt nfs_initdirxlatecookie(vp);
1352 1.120 yamt
1353 1.135 yamt retry:
1354 1.49 fvdl ndp = nfs_searchdircache(vp, off, 0, &hashent);
1355 1.49 fvdl
1356 1.135 yamt NFSDC_LOCK(np);
1357 1.135 yamt if (ndp && (ndp->dc_flags & NFSDC_INVALID) == 0) {
1358 1.49 fvdl /*
1359 1.49 fvdl * Overwriting an old entry. Check if it's the same.
1360 1.49 fvdl * If so, just return. If not, remove the old entry.
1361 1.49 fvdl */
1362 1.49 fvdl if (ndp->dc_blkcookie == blkoff && ndp->dc_entry == en)
1363 1.135 yamt goto done;
1364 1.135 yamt nfs_unlinkdircache(np, ndp);
1365 1.135 yamt nfs_putdircache_unlocked(np, ndp);
1366 1.135 yamt ndp = NULL;
1367 1.46 fvdl }
1368 1.46 fvdl
1369 1.49 fvdl ndhp = &np->n_dircache[hashent];
1370 1.46 fvdl
1371 1.49 fvdl if (!ndp) {
1372 1.135 yamt if (newndp == NULL) {
1373 1.135 yamt NFSDC_UNLOCK(np);
1374 1.196 yamt newndp = kmem_alloc(sizeof(*newndp), KM_SLEEP);
1375 1.135 yamt newndp->dc_refcnt = 1;
1376 1.135 yamt LIST_NEXT(newndp, dc_hash) = (void *)-1;
1377 1.135 yamt goto retry;
1378 1.135 yamt }
1379 1.135 yamt ndp = newndp;
1380 1.135 yamt newndp = NULL;
1381 1.49 fvdl overwrite = 0;
1382 1.49 fvdl if (nmp->nm_flag & NFSMNT_XLATECOOKIE) {
1383 1.49 fvdl /*
1384 1.49 fvdl * We're allocating a new entry, so bump the
1385 1.49 fvdl * generation number.
1386 1.49 fvdl */
1387 1.160 christos KASSERT(np->n_dirgens);
1388 1.49 fvdl gen = ++np->n_dirgens[hashent];
1389 1.49 fvdl if (gen == 0) {
1390 1.49 fvdl np->n_dirgens[hashent]++;
1391 1.49 fvdl gen++;
1392 1.49 fvdl }
1393 1.49 fvdl ndp->dc_cookie32 = (hashent << 24) | (gen & 0xffffff);
1394 1.49 fvdl }
1395 1.49 fvdl } else
1396 1.49 fvdl overwrite = 1;
1397 1.46 fvdl
1398 1.49 fvdl ndp->dc_cookie = off;
1399 1.49 fvdl ndp->dc_blkcookie = blkoff;
1400 1.46 fvdl ndp->dc_entry = en;
1401 1.137 yamt ndp->dc_flags = 0;
1402 1.46 fvdl
1403 1.49 fvdl if (overwrite)
1404 1.135 yamt goto done;
1405 1.49 fvdl
1406 1.46 fvdl /*
1407 1.46 fvdl * If the maximum directory cookie cache size has been reached
1408 1.46 fvdl * for this node, take one off the front. The idea is that
1409 1.46 fvdl * directories are typically read front-to-back once, so that
1410 1.46 fvdl * the oldest entries can be thrown away without much performance
1411 1.46 fvdl * loss.
1412 1.46 fvdl */
1413 1.46 fvdl if (np->n_dircachesize == NFS_MAXDIRCACHE) {
1414 1.135 yamt nfs_unlinkdircache(np, TAILQ_FIRST(&np->n_dirchain));
1415 1.46 fvdl } else
1416 1.46 fvdl np->n_dircachesize++;
1417 1.148 perry
1418 1.135 yamt KASSERT(ndp->dc_refcnt == 1);
1419 1.46 fvdl LIST_INSERT_HEAD(ndhp, ndp, dc_hash);
1420 1.46 fvdl TAILQ_INSERT_TAIL(&np->n_dirchain, ndp, dc_chain);
1421 1.135 yamt ndp->dc_refcnt++;
1422 1.135 yamt done:
1423 1.135 yamt KASSERT(ndp->dc_refcnt > 0);
1424 1.135 yamt NFSDC_UNLOCK(np);
1425 1.135 yamt if (newndp)
1426 1.135 yamt nfs_putdircache(np, newndp);
1427 1.46 fvdl return ndp;
1428 1.46 fvdl }
1429 1.46 fvdl
1430 1.46 fvdl void
1431 1.214 dsl nfs_invaldircache(struct vnode *vp, int flags)
1432 1.46 fvdl {
1433 1.46 fvdl struct nfsnode *np = VTONFS(vp);
1434 1.46 fvdl struct nfsdircache *ndp = NULL;
1435 1.49 fvdl struct nfsmount *nmp = VFSTONFS(vp->v_mount);
1436 1.181 thorpej const bool forcefree = flags & NFS_INVALDIRCACHE_FORCE;
1437 1.46 fvdl
1438 1.46 fvdl #ifdef DIAGNOSTIC
1439 1.46 fvdl if (vp->v_type != VDIR)
1440 1.46 fvdl panic("nfs: invaldircache: not dir");
1441 1.46 fvdl #endif
1442 1.46 fvdl
1443 1.145 yamt if ((flags & NFS_INVALDIRCACHE_KEEPEOF) == 0)
1444 1.145 yamt np->n_flag &= ~NEOFVALID;
1445 1.144 yamt
1446 1.46 fvdl if (!np->n_dircache)
1447 1.46 fvdl return;
1448 1.46 fvdl
1449 1.135 yamt NFSDC_LOCK(np);
1450 1.49 fvdl if (!(nmp->nm_flag & NFSMNT_XLATECOOKIE) || forcefree) {
1451 1.135 yamt while ((ndp = TAILQ_FIRST(&np->n_dirchain)) != NULL) {
1452 1.135 yamt KASSERT(!forcefree || ndp->dc_refcnt == 1);
1453 1.135 yamt nfs_unlinkdircache(np, ndp);
1454 1.49 fvdl }
1455 1.49 fvdl np->n_dircachesize = 0;
1456 1.49 fvdl if (forcefree && np->n_dirgens) {
1457 1.196 yamt kmem_free(np->n_dirgens,
1458 1.196 yamt NFS_DIRHASHSIZ * sizeof(unsigned));
1459 1.120 yamt np->n_dirgens = NULL;
1460 1.49 fvdl }
1461 1.49 fvdl } else {
1462 1.135 yamt TAILQ_FOREACH(ndp, &np->n_dirchain, dc_chain)
1463 1.135 yamt ndp->dc_flags |= NFSDC_INVALID;
1464 1.46 fvdl }
1465 1.46 fvdl
1466 1.135 yamt NFSDC_UNLOCK(np);
1467 1.46 fvdl }
1468 1.46 fvdl
1469 1.1 cgd /*
1470 1.35 thorpej * Called once before VFS init to initialize shared and
1471 1.35 thorpej * server-specific data structures.
1472 1.1 cgd */
1473 1.157 yamt static int
1474 1.155 thorpej nfs_init0(void)
1475 1.1 cgd {
1476 1.189 ad
1477 1.12 mycroft nfsrtt.pos = 0;
1478 1.1 cgd rpc_vers = txdr_unsigned(RPC_VER2);
1479 1.1 cgd rpc_call = txdr_unsigned(RPC_CALL);
1480 1.1 cgd rpc_reply = txdr_unsigned(RPC_REPLY);
1481 1.1 cgd rpc_msgdenied = txdr_unsigned(RPC_MSGDENIED);
1482 1.1 cgd rpc_msgaccepted = txdr_unsigned(RPC_MSGACCEPTED);
1483 1.1 cgd rpc_mismatch = txdr_unsigned(RPC_MISMATCH);
1484 1.12 mycroft rpc_autherr = txdr_unsigned(RPC_AUTHERR);
1485 1.1 cgd rpc_auth_unix = txdr_unsigned(RPCAUTH_UNIX);
1486 1.25 fvdl rpc_auth_kerb = txdr_unsigned(RPCAUTH_KERB4);
1487 1.1 cgd nfs_prog = txdr_unsigned(NFS_PROG);
1488 1.182 thorpej nfs_true = txdr_unsigned(true);
1489 1.182 thorpej nfs_false = txdr_unsigned(false);
1490 1.12 mycroft nfs_xdrneg1 = txdr_unsigned(-1);
1491 1.25 fvdl nfs_ticks = (hz * NFS_TICKINTVL + 500) / 1000;
1492 1.25 fvdl if (nfs_ticks < 1)
1493 1.25 fvdl nfs_ticks = 1;
1494 1.164 yamt nfsdreq_init();
1495 1.164 yamt
1496 1.1 cgd /*
1497 1.1 cgd * Initialize reply list and start timer
1498 1.1 cgd */
1499 1.16 mycroft TAILQ_INIT(&nfs_reqq);
1500 1.230 christos mutex_init(&nfs_reqq_lock, MUTEX_DEFAULT, IPL_NONE);
1501 1.191 yamt nfs_timer_init();
1502 1.109 matt MOWNER_ATTACH(&nfs_mowner);
1503 1.106 jdolecek
1504 1.157 yamt return 0;
1505 1.1 cgd }
1506 1.1 cgd
1507 1.223 christos static volatile uint32_t nfs_mutex;
1508 1.223 christos static uint32_t nfs_refcount;
1509 1.223 christos
1510 1.223 christos #define nfs_p() while (atomic_cas_32(&nfs_mutex, 0, 1) == 0) continue;
1511 1.223 christos #define nfs_v() while (atomic_cas_32(&nfs_mutex, 1, 0) == 1) continue;
1512 1.223 christos
1513 1.210 ad /*
1514 1.210 ad * This is disgusting, but it must support both modular and monolothic
1515 1.223 christos * configurations, plus the code is shared between server and client.
1516 1.223 christos * For monolithic builds NFSSERVER may not imply NFS. Unfortunately we
1517 1.223 christos * can't use regular mutexes here that would require static initialization
1518 1.223 christos * and we can get initialized from multiple places, so we improvise.
1519 1.210 ad *
1520 1.210 ad * Yuck.
1521 1.210 ad */
1522 1.155 thorpej void
1523 1.155 thorpej nfs_init(void)
1524 1.155 thorpej {
1525 1.224 pgoyette
1526 1.223 christos nfs_p();
1527 1.223 christos if (nfs_refcount++ == 0)
1528 1.223 christos nfs_init0();
1529 1.223 christos nfs_v();
1530 1.155 thorpej }
1531 1.155 thorpej
1532 1.210 ad void
1533 1.210 ad nfs_fini(void)
1534 1.210 ad {
1535 1.224 pgoyette
1536 1.223 christos nfs_p();
1537 1.223 christos if (--nfs_refcount == 0) {
1538 1.223 christos MOWNER_DETACH(&nfs_mowner);
1539 1.223 christos nfs_timer_fini();
1540 1.230 christos mutex_destroy(&nfs_reqq_lock);
1541 1.223 christos nfsdreq_fini();
1542 1.223 christos }
1543 1.223 christos nfs_v();
1544 1.210 ad }
1545 1.210 ad
1546 1.1 cgd /*
1547 1.118 yamt * A fiddled version of m_adj() that ensures null fill to a 32-bit
1548 1.1 cgd * boundary and only trims off the back end
1549 1.122 yamt *
1550 1.122 yamt * 1. trim off 'len' bytes as m_adj(mp, -len).
1551 1.122 yamt * 2. add zero-padding 'nul' bytes at the end of the mbuf chain.
1552 1.1 cgd */
1553 1.12 mycroft void
1554 1.214 dsl nfs_zeropad(struct mbuf *mp, int len, int nul)
1555 1.1 cgd {
1556 1.75 augustss struct mbuf *m;
1557 1.130 yamt int count;
1558 1.1 cgd
1559 1.1 cgd /*
1560 1.1 cgd * Trim from tail. Scan the mbuf chain,
1561 1.1 cgd * calculating its length and finding the last mbuf.
1562 1.1 cgd * If the adjustment only affects this mbuf, then just
1563 1.1 cgd * adjust and return. Otherwise, rescan and truncate
1564 1.1 cgd * after the remaining size.
1565 1.1 cgd */
1566 1.1 cgd count = 0;
1567 1.1 cgd m = mp;
1568 1.1 cgd for (;;) {
1569 1.1 cgd count += m->m_len;
1570 1.122 yamt if (m->m_next == NULL)
1571 1.1 cgd break;
1572 1.1 cgd m = m->m_next;
1573 1.1 cgd }
1574 1.122 yamt
1575 1.122 yamt KDASSERT(count >= len);
1576 1.122 yamt
1577 1.122 yamt if (m->m_len >= len) {
1578 1.1 cgd m->m_len -= len;
1579 1.122 yamt } else {
1580 1.122 yamt count -= len;
1581 1.122 yamt /*
1582 1.122 yamt * Correct length for chain is "count".
1583 1.122 yamt * Find the mbuf with last data, adjust its length,
1584 1.122 yamt * and toss data from remaining mbufs on chain.
1585 1.122 yamt */
1586 1.122 yamt for (m = mp; m; m = m->m_next) {
1587 1.122 yamt if (m->m_len >= count) {
1588 1.122 yamt m->m_len = count;
1589 1.122 yamt break;
1590 1.118 yamt }
1591 1.122 yamt count -= m->m_len;
1592 1.1 cgd }
1593 1.159 christos KASSERT(m && m->m_next);
1594 1.122 yamt m_freem(m->m_next);
1595 1.122 yamt m->m_next = NULL;
1596 1.1 cgd }
1597 1.122 yamt
1598 1.130 yamt KDASSERT(m->m_next == NULL);
1599 1.130 yamt
1600 1.122 yamt /*
1601 1.122 yamt * zero-padding.
1602 1.122 yamt */
1603 1.122 yamt if (nul > 0) {
1604 1.130 yamt char *cp;
1605 1.130 yamt int i;
1606 1.130 yamt
1607 1.231 maxv if (M_READONLY(m) || M_TRAILINGSPACE(m) < nul) {
1608 1.122 yamt struct mbuf *n;
1609 1.122 yamt
1610 1.122 yamt KDASSERT(MLEN >= nul);
1611 1.122 yamt n = m_get(M_WAIT, MT_DATA);
1612 1.122 yamt MCLAIM(n, &nfs_mowner);
1613 1.122 yamt n->m_len = nul;
1614 1.130 yamt n->m_next = NULL;
1615 1.122 yamt m->m_next = n;
1616 1.183 christos cp = mtod(n, void *);
1617 1.122 yamt } else {
1618 1.183 christos cp = mtod(m, char *) + m->m_len;
1619 1.122 yamt m->m_len += nul;
1620 1.1 cgd }
1621 1.122 yamt for (i = 0; i < nul; i++)
1622 1.122 yamt *cp++ = '\0';
1623 1.1 cgd }
1624 1.122 yamt return;
1625 1.1 cgd }
1626 1.1 cgd
1627 1.1 cgd /*
1628 1.25 fvdl * Make these functions instead of macros, so that the kernel text size
1629 1.25 fvdl * doesn't get too big...
1630 1.25 fvdl */
1631 1.25 fvdl void
1632 1.214 dsl nfsm_srvwcc(struct nfsrv_descript *nfsd, int before_ret, struct vattr *before_vap, int after_ret, struct vattr *after_vap, struct mbuf **mbp, char **bposp)
1633 1.25 fvdl {
1634 1.109 matt struct mbuf *mb = *mbp;
1635 1.75 augustss char *bpos = *bposp;
1636 1.75 augustss u_int32_t *tl;
1637 1.25 fvdl
1638 1.25 fvdl if (before_ret) {
1639 1.25 fvdl nfsm_build(tl, u_int32_t *, NFSX_UNSIGNED);
1640 1.25 fvdl *tl = nfs_false;
1641 1.25 fvdl } else {
1642 1.25 fvdl nfsm_build(tl, u_int32_t *, 7 * NFSX_UNSIGNED);
1643 1.25 fvdl *tl++ = nfs_true;
1644 1.66 fair txdr_hyper(before_vap->va_size, tl);
1645 1.25 fvdl tl += 2;
1646 1.25 fvdl txdr_nfsv3time(&(before_vap->va_mtime), tl);
1647 1.25 fvdl tl += 2;
1648 1.25 fvdl txdr_nfsv3time(&(before_vap->va_ctime), tl);
1649 1.25 fvdl }
1650 1.25 fvdl *bposp = bpos;
1651 1.25 fvdl *mbp = mb;
1652 1.25 fvdl nfsm_srvpostopattr(nfsd, after_ret, after_vap, mbp, bposp);
1653 1.25 fvdl }
1654 1.25 fvdl
1655 1.25 fvdl void
1656 1.214 dsl nfsm_srvpostopattr(struct nfsrv_descript *nfsd, int after_ret, struct vattr *after_vap, struct mbuf **mbp, char **bposp)
1657 1.25 fvdl {
1658 1.109 matt struct mbuf *mb = *mbp;
1659 1.75 augustss char *bpos = *bposp;
1660 1.75 augustss u_int32_t *tl;
1661 1.75 augustss struct nfs_fattr *fp;
1662 1.25 fvdl
1663 1.25 fvdl if (after_ret) {
1664 1.25 fvdl nfsm_build(tl, u_int32_t *, NFSX_UNSIGNED);
1665 1.25 fvdl *tl = nfs_false;
1666 1.25 fvdl } else {
1667 1.25 fvdl nfsm_build(tl, u_int32_t *, NFSX_UNSIGNED + NFSX_V3FATTR);
1668 1.25 fvdl *tl++ = nfs_true;
1669 1.25 fvdl fp = (struct nfs_fattr *)tl;
1670 1.25 fvdl nfsm_srvfattr(nfsd, after_vap, fp);
1671 1.25 fvdl }
1672 1.25 fvdl *mbp = mb;
1673 1.25 fvdl *bposp = bpos;
1674 1.25 fvdl }
1675 1.25 fvdl
1676 1.25 fvdl void
1677 1.214 dsl nfsm_srvfattr(struct nfsrv_descript *nfsd, struct vattr *vap, struct nfs_fattr *fp)
1678 1.25 fvdl {
1679 1.25 fvdl
1680 1.25 fvdl fp->fa_nlink = txdr_unsigned(vap->va_nlink);
1681 1.25 fvdl fp->fa_uid = txdr_unsigned(vap->va_uid);
1682 1.25 fvdl fp->fa_gid = txdr_unsigned(vap->va_gid);
1683 1.25 fvdl if (nfsd->nd_flag & ND_NFSV3) {
1684 1.25 fvdl fp->fa_type = vtonfsv3_type(vap->va_type);
1685 1.25 fvdl fp->fa_mode = vtonfsv3_mode(vap->va_mode);
1686 1.66 fair txdr_hyper(vap->va_size, &fp->fa3_size);
1687 1.66 fair txdr_hyper(vap->va_bytes, &fp->fa3_used);
1688 1.25 fvdl fp->fa3_rdev.specdata1 = txdr_unsigned(major(vap->va_rdev));
1689 1.25 fvdl fp->fa3_rdev.specdata2 = txdr_unsigned(minor(vap->va_rdev));
1690 1.25 fvdl fp->fa3_fsid.nfsuquad[0] = 0;
1691 1.25 fvdl fp->fa3_fsid.nfsuquad[1] = txdr_unsigned(vap->va_fsid);
1692 1.151 yamt txdr_hyper(vap->va_fileid, &fp->fa3_fileid);
1693 1.25 fvdl txdr_nfsv3time(&vap->va_atime, &fp->fa3_atime);
1694 1.25 fvdl txdr_nfsv3time(&vap->va_mtime, &fp->fa3_mtime);
1695 1.25 fvdl txdr_nfsv3time(&vap->va_ctime, &fp->fa3_ctime);
1696 1.25 fvdl } else {
1697 1.25 fvdl fp->fa_type = vtonfsv2_type(vap->va_type);
1698 1.25 fvdl fp->fa_mode = vtonfsv2_mode(vap->va_type, vap->va_mode);
1699 1.239 mlelstv fp->fa2_size = txdr_unsigned(NFS_V2CLAMP32(vap->va_size));
1700 1.239 mlelstv fp->fa2_blocksize = txdr_unsigned(NFS_V2CLAMP16(vap->va_blocksize));
1701 1.25 fvdl if (vap->va_type == VFIFO)
1702 1.25 fvdl fp->fa2_rdev = 0xffffffff;
1703 1.25 fvdl else
1704 1.25 fvdl fp->fa2_rdev = txdr_unsigned(vap->va_rdev);
1705 1.25 fvdl fp->fa2_blocks = txdr_unsigned(vap->va_bytes / NFS_FABLKSIZE);
1706 1.25 fvdl fp->fa2_fsid = txdr_unsigned(vap->va_fsid);
1707 1.25 fvdl fp->fa2_fileid = txdr_unsigned(vap->va_fileid);
1708 1.25 fvdl txdr_nfsv2time(&vap->va_atime, &fp->fa2_atime);
1709 1.25 fvdl txdr_nfsv2time(&vap->va_mtime, &fp->fa2_mtime);
1710 1.25 fvdl txdr_nfsv2time(&vap->va_ctime, &fp->fa2_ctime);
1711 1.25 fvdl }
1712 1.25 fvdl }
1713 1.25 fvdl
1714 1.1 cgd /*
1715 1.182 thorpej * This function compares two net addresses by family and returns true
1716 1.12 mycroft * if they are the same host.
1717 1.182 thorpej * If there is any doubt, return false.
1718 1.12 mycroft * The AF_INET family is handled as a special case so that address mbufs
1719 1.12 mycroft * don't need to be saved to store "struct in_addr", which is only 4 bytes.
1720 1.1 cgd */
1721 1.24 christos int
1722 1.214 dsl netaddr_match(int family, union nethostaddr *haddr, struct mbuf *nam)
1723 1.1 cgd {
1724 1.75 augustss struct sockaddr_in *inetaddr;
1725 1.1 cgd
1726 1.12 mycroft switch (family) {
1727 1.12 mycroft case AF_INET:
1728 1.12 mycroft inetaddr = mtod(nam, struct sockaddr_in *);
1729 1.12 mycroft if (inetaddr->sin_family == AF_INET &&
1730 1.12 mycroft inetaddr->sin_addr.s_addr == haddr->had_inetaddr)
1731 1.12 mycroft return (1);
1732 1.12 mycroft break;
1733 1.76 fvdl case AF_INET6:
1734 1.76 fvdl {
1735 1.76 fvdl struct sockaddr_in6 *sin6_1, *sin6_2;
1736 1.76 fvdl
1737 1.76 fvdl sin6_1 = mtod(nam, struct sockaddr_in6 *);
1738 1.76 fvdl sin6_2 = mtod(haddr->had_nam, struct sockaddr_in6 *);
1739 1.76 fvdl if (sin6_1->sin6_family == AF_INET6 &&
1740 1.76 fvdl IN6_ARE_ADDR_EQUAL(&sin6_1->sin6_addr, &sin6_2->sin6_addr))
1741 1.76 fvdl return 1;
1742 1.76 fvdl }
1743 1.12 mycroft default:
1744 1.12 mycroft break;
1745 1.12 mycroft };
1746 1.12 mycroft return (0);
1747 1.25 fvdl }
1748 1.25 fvdl
1749 1.226 christos struct nfs_clearcommit_ctx {
1750 1.226 christos struct mount *mp;
1751 1.226 christos };
1752 1.226 christos
1753 1.226 christos static bool
1754 1.226 christos nfs_clearcommit_selector(void *cl, struct vnode *vp)
1755 1.226 christos {
1756 1.226 christos struct nfs_clearcommit_ctx *c = cl;
1757 1.226 christos struct nfsnode *np;
1758 1.226 christos
1759 1.229 riastrad KASSERT(mutex_owned(vp->v_interlock));
1760 1.229 riastrad
1761 1.237 ad /* XXXAD mountpoint check looks like nonsense to me */
1762 1.226 christos np = VTONFS(vp);
1763 1.226 christos if (vp->v_type != VREG || vp->v_mount != c->mp || np == NULL)
1764 1.226 christos return false;
1765 1.226 christos return false;
1766 1.226 christos }
1767 1.226 christos
1768 1.25 fvdl /*
1769 1.25 fvdl * The write verifier has changed (probably due to a server reboot), so all
1770 1.114 yamt * PG_NEEDCOMMIT pages will have to be written again. Since they are marked
1771 1.117 yamt * as dirty or are being written out just now, all this takes is clearing
1772 1.117 yamt * the PG_NEEDCOMMIT flag. Once done the new write verifier can be set for
1773 1.117 yamt * the mount point.
1774 1.25 fvdl */
1775 1.25 fvdl void
1776 1.214 dsl nfs_clearcommit(struct mount *mp)
1777 1.25 fvdl {
1778 1.237 ad struct vnode *vp;
1779 1.225 hannken struct vnode_iterator *marker;
1780 1.116 yamt struct nfsmount *nmp = VFSTONFS(mp);
1781 1.226 christos struct nfs_clearcommit_ctx ctx;
1782 1.237 ad struct nfsnode *np;
1783 1.237 ad struct vm_page *pg;
1784 1.237 ad struct uvm_page_array a;
1785 1.237 ad voff_t off;
1786 1.116 yamt
1787 1.180 yamt rw_enter(&nmp->nm_writeverflock, RW_WRITER);
1788 1.225 hannken vfs_vnode_iterator_init(mp, &marker);
1789 1.226 christos ctx.mp = mp;
1790 1.237 ad for (;;) {
1791 1.237 ad vp = vfs_vnode_iterator_next(marker, nfs_clearcommit_selector,
1792 1.237 ad &ctx);
1793 1.237 ad if (vp == NULL)
1794 1.237 ad break;
1795 1.237 ad rw_enter(vp->v_uobj.vmobjlock, RW_WRITER);
1796 1.237 ad np = VTONFS(vp);
1797 1.237 ad np->n_pushlo = np->n_pushhi = np->n_pushedlo =
1798 1.237 ad np->n_pushedhi = 0;
1799 1.237 ad np->n_commitflags &=
1800 1.237 ad ~(NFS_COMMIT_PUSH_VALID | NFS_COMMIT_PUSHED_VALID);
1801 1.240 ad uvm_page_array_init(&a, &vp->v_uobj, 0);
1802 1.237 ad off = 0;
1803 1.240 ad while ((pg = uvm_page_array_fill_and_peek(&a, off, 0)) !=
1804 1.240 ad NULL) {
1805 1.237 ad pg->flags &= ~PG_NEEDCOMMIT;
1806 1.237 ad uvm_page_array_advance(&a);
1807 1.237 ad off = pg->offset + PAGE_SIZE;
1808 1.237 ad }
1809 1.237 ad uvm_page_array_fini(&a);
1810 1.237 ad rw_exit(vp->v_uobj.vmobjlock);
1811 1.237 ad vrele(vp);
1812 1.237 ad }
1813 1.226 christos KASSERT(vp == NULL);
1814 1.225 hannken vfs_vnode_iterator_destroy(marker);
1815 1.186 yamt mutex_enter(&nmp->nm_lock);
1816 1.116 yamt nmp->nm_iflag &= ~NFSMNT_STALEWRITEVERF;
1817 1.186 yamt mutex_exit(&nmp->nm_lock);
1818 1.180 yamt rw_exit(&nmp->nm_writeverflock);
1819 1.83 fvdl }
1820 1.83 fvdl
1821 1.83 fvdl void
1822 1.214 dsl nfs_merge_commit_ranges(struct vnode *vp)
1823 1.83 fvdl {
1824 1.83 fvdl struct nfsnode *np = VTONFS(vp);
1825 1.112 yamt
1826 1.112 yamt KASSERT(np->n_commitflags & NFS_COMMIT_PUSH_VALID);
1827 1.83 fvdl
1828 1.83 fvdl if (!(np->n_commitflags & NFS_COMMIT_PUSHED_VALID)) {
1829 1.83 fvdl np->n_pushedlo = np->n_pushlo;
1830 1.83 fvdl np->n_pushedhi = np->n_pushhi;
1831 1.83 fvdl np->n_commitflags |= NFS_COMMIT_PUSHED_VALID;
1832 1.83 fvdl } else {
1833 1.83 fvdl if (np->n_pushlo < np->n_pushedlo)
1834 1.83 fvdl np->n_pushedlo = np->n_pushlo;
1835 1.83 fvdl if (np->n_pushhi > np->n_pushedhi)
1836 1.83 fvdl np->n_pushedhi = np->n_pushhi;
1837 1.83 fvdl }
1838 1.83 fvdl
1839 1.83 fvdl np->n_pushlo = np->n_pushhi = 0;
1840 1.83 fvdl np->n_commitflags &= ~NFS_COMMIT_PUSH_VALID;
1841 1.83 fvdl
1842 1.111 yamt #ifdef NFS_DEBUG_COMMIT
1843 1.83 fvdl printf("merge: committed: %u - %u\n", (unsigned)np->n_pushedlo,
1844 1.83 fvdl (unsigned)np->n_pushedhi);
1845 1.83 fvdl #endif
1846 1.83 fvdl }
1847 1.83 fvdl
1848 1.83 fvdl int
1849 1.215 dsl nfs_in_committed_range(struct vnode *vp, off_t off, off_t len)
1850 1.83 fvdl {
1851 1.83 fvdl struct nfsnode *np = VTONFS(vp);
1852 1.83 fvdl off_t lo, hi;
1853 1.83 fvdl
1854 1.83 fvdl if (!(np->n_commitflags & NFS_COMMIT_PUSHED_VALID))
1855 1.83 fvdl return 0;
1856 1.89 chs lo = off;
1857 1.89 chs hi = lo + len;
1858 1.83 fvdl
1859 1.83 fvdl return (lo >= np->n_pushedlo && hi <= np->n_pushedhi);
1860 1.83 fvdl }
1861 1.83 fvdl
1862 1.83 fvdl int
1863 1.215 dsl nfs_in_tobecommitted_range(struct vnode *vp, off_t off, off_t len)
1864 1.83 fvdl {
1865 1.83 fvdl struct nfsnode *np = VTONFS(vp);
1866 1.83 fvdl off_t lo, hi;
1867 1.83 fvdl
1868 1.83 fvdl if (!(np->n_commitflags & NFS_COMMIT_PUSH_VALID))
1869 1.83 fvdl return 0;
1870 1.89 chs lo = off;
1871 1.89 chs hi = lo + len;
1872 1.83 fvdl
1873 1.83 fvdl return (lo >= np->n_pushlo && hi <= np->n_pushhi);
1874 1.83 fvdl }
1875 1.83 fvdl
1876 1.83 fvdl void
1877 1.215 dsl nfs_add_committed_range(struct vnode *vp, off_t off, off_t len)
1878 1.83 fvdl {
1879 1.83 fvdl struct nfsnode *np = VTONFS(vp);
1880 1.83 fvdl off_t lo, hi;
1881 1.83 fvdl
1882 1.89 chs lo = off;
1883 1.89 chs hi = lo + len;
1884 1.83 fvdl
1885 1.83 fvdl if (!(np->n_commitflags & NFS_COMMIT_PUSHED_VALID)) {
1886 1.83 fvdl np->n_pushedlo = lo;
1887 1.83 fvdl np->n_pushedhi = hi;
1888 1.83 fvdl np->n_commitflags |= NFS_COMMIT_PUSHED_VALID;
1889 1.83 fvdl } else {
1890 1.83 fvdl if (hi > np->n_pushedhi)
1891 1.83 fvdl np->n_pushedhi = hi;
1892 1.83 fvdl if (lo < np->n_pushedlo)
1893 1.83 fvdl np->n_pushedlo = lo;
1894 1.83 fvdl }
1895 1.111 yamt #ifdef NFS_DEBUG_COMMIT
1896 1.83 fvdl printf("add: committed: %u - %u\n", (unsigned)np->n_pushedlo,
1897 1.83 fvdl (unsigned)np->n_pushedhi);
1898 1.83 fvdl #endif
1899 1.83 fvdl }
1900 1.83 fvdl
1901 1.83 fvdl void
1902 1.215 dsl nfs_del_committed_range(struct vnode *vp, off_t off, off_t len)
1903 1.83 fvdl {
1904 1.83 fvdl struct nfsnode *np = VTONFS(vp);
1905 1.83 fvdl off_t lo, hi;
1906 1.83 fvdl
1907 1.83 fvdl if (!(np->n_commitflags & NFS_COMMIT_PUSHED_VALID))
1908 1.83 fvdl return;
1909 1.83 fvdl
1910 1.89 chs lo = off;
1911 1.89 chs hi = lo + len;
1912 1.83 fvdl
1913 1.83 fvdl if (lo > np->n_pushedhi || hi < np->n_pushedlo)
1914 1.83 fvdl return;
1915 1.83 fvdl if (lo <= np->n_pushedlo)
1916 1.83 fvdl np->n_pushedlo = hi;
1917 1.83 fvdl else if (hi >= np->n_pushedhi)
1918 1.83 fvdl np->n_pushedhi = lo;
1919 1.83 fvdl else {
1920 1.83 fvdl /*
1921 1.83 fvdl * XXX There's only one range. If the deleted range
1922 1.83 fvdl * is in the middle, pick the largest of the
1923 1.83 fvdl * contiguous ranges that it leaves.
1924 1.83 fvdl */
1925 1.83 fvdl if ((np->n_pushedlo - lo) > (hi - np->n_pushedhi))
1926 1.83 fvdl np->n_pushedhi = lo;
1927 1.83 fvdl else
1928 1.83 fvdl np->n_pushedlo = hi;
1929 1.83 fvdl }
1930 1.111 yamt #ifdef NFS_DEBUG_COMMIT
1931 1.83 fvdl printf("del: committed: %u - %u\n", (unsigned)np->n_pushedlo,
1932 1.83 fvdl (unsigned)np->n_pushedhi);
1933 1.83 fvdl #endif
1934 1.83 fvdl }
1935 1.83 fvdl
1936 1.83 fvdl void
1937 1.215 dsl nfs_add_tobecommitted_range(struct vnode *vp, off_t off, off_t len)
1938 1.83 fvdl {
1939 1.83 fvdl struct nfsnode *np = VTONFS(vp);
1940 1.83 fvdl off_t lo, hi;
1941 1.83 fvdl
1942 1.89 chs lo = off;
1943 1.89 chs hi = lo + len;
1944 1.83 fvdl
1945 1.83 fvdl if (!(np->n_commitflags & NFS_COMMIT_PUSH_VALID)) {
1946 1.83 fvdl np->n_pushlo = lo;
1947 1.83 fvdl np->n_pushhi = hi;
1948 1.83 fvdl np->n_commitflags |= NFS_COMMIT_PUSH_VALID;
1949 1.83 fvdl } else {
1950 1.83 fvdl if (lo < np->n_pushlo)
1951 1.83 fvdl np->n_pushlo = lo;
1952 1.83 fvdl if (hi > np->n_pushhi)
1953 1.83 fvdl np->n_pushhi = hi;
1954 1.83 fvdl }
1955 1.111 yamt #ifdef NFS_DEBUG_COMMIT
1956 1.83 fvdl printf("add: tobecommitted: %u - %u\n", (unsigned)np->n_pushlo,
1957 1.83 fvdl (unsigned)np->n_pushhi);
1958 1.83 fvdl #endif
1959 1.83 fvdl }
1960 1.83 fvdl
1961 1.83 fvdl void
1962 1.215 dsl nfs_del_tobecommitted_range(struct vnode *vp, off_t off, off_t len)
1963 1.83 fvdl {
1964 1.83 fvdl struct nfsnode *np = VTONFS(vp);
1965 1.83 fvdl off_t lo, hi;
1966 1.83 fvdl
1967 1.83 fvdl if (!(np->n_commitflags & NFS_COMMIT_PUSH_VALID))
1968 1.83 fvdl return;
1969 1.83 fvdl
1970 1.89 chs lo = off;
1971 1.89 chs hi = lo + len;
1972 1.83 fvdl
1973 1.83 fvdl if (lo > np->n_pushhi || hi < np->n_pushlo)
1974 1.83 fvdl return;
1975 1.83 fvdl
1976 1.83 fvdl if (lo <= np->n_pushlo)
1977 1.83 fvdl np->n_pushlo = hi;
1978 1.83 fvdl else if (hi >= np->n_pushhi)
1979 1.83 fvdl np->n_pushhi = lo;
1980 1.83 fvdl else {
1981 1.83 fvdl /*
1982 1.83 fvdl * XXX There's only one range. If the deleted range
1983 1.83 fvdl * is in the middle, pick the largest of the
1984 1.83 fvdl * contiguous ranges that it leaves.
1985 1.83 fvdl */
1986 1.83 fvdl if ((np->n_pushlo - lo) > (hi - np->n_pushhi))
1987 1.83 fvdl np->n_pushhi = lo;
1988 1.83 fvdl else
1989 1.83 fvdl np->n_pushlo = hi;
1990 1.83 fvdl }
1991 1.111 yamt #ifdef NFS_DEBUG_COMMIT
1992 1.83 fvdl printf("del: tobecommitted: %u - %u\n", (unsigned)np->n_pushlo,
1993 1.83 fvdl (unsigned)np->n_pushhi);
1994 1.83 fvdl #endif
1995 1.25 fvdl }
1996 1.25 fvdl
1997 1.25 fvdl /*
1998 1.25 fvdl * Map errnos to NFS error numbers. For Version 3 also filter out error
1999 1.25 fvdl * numbers not specified for the associated procedure.
2000 1.25 fvdl */
2001 1.25 fvdl int
2002 1.214 dsl nfsrv_errmap(struct nfsrv_descript *nd, int err)
2003 1.25 fvdl {
2004 1.90 jdolecek const short *defaulterrp, *errp;
2005 1.25 fvdl
2006 1.25 fvdl if (nd->nd_flag & ND_NFSV3) {
2007 1.25 fvdl if (nd->nd_procnum <= NFSPROC_COMMIT) {
2008 1.25 fvdl errp = defaulterrp = nfsrv_v3errmap[nd->nd_procnum];
2009 1.25 fvdl while (*++errp) {
2010 1.25 fvdl if (*errp == err)
2011 1.25 fvdl return (err);
2012 1.25 fvdl else if (*errp > err)
2013 1.25 fvdl break;
2014 1.25 fvdl }
2015 1.25 fvdl return ((int)*defaulterrp);
2016 1.25 fvdl } else
2017 1.25 fvdl return (err & 0xffff);
2018 1.25 fvdl }
2019 1.25 fvdl if (err <= ELAST)
2020 1.25 fvdl return ((int)nfsrv_v2errmap[err - 1]);
2021 1.25 fvdl return (NFSERR_IO);
2022 1.25 fvdl }
2023 1.25 fvdl
2024 1.126 yamt u_int32_t
2025 1.216 cegger nfs_getxid(void)
2026 1.126 yamt {
2027 1.126 yamt u_int32_t newxid;
2028 1.126 yamt
2029 1.227 tls if (__predict_false(nfs_xid == 0)) {
2030 1.227 tls nfs_xid = cprng_fast32();
2031 1.227 tls }
2032 1.227 tls
2033 1.207 pooka /* get next xid. skip 0 */
2034 1.207 pooka do {
2035 1.207 pooka newxid = atomic_inc_32_nv(&nfs_xid);
2036 1.207 pooka } while (__predict_false(newxid == 0));
2037 1.126 yamt
2038 1.126 yamt return txdr_unsigned(newxid);
2039 1.126 yamt }
2040 1.126 yamt
2041 1.126 yamt /*
2042 1.126 yamt * assign a new xid for existing request.
2043 1.126 yamt * used for NFSERR_JUKEBOX handling.
2044 1.126 yamt */
2045 1.126 yamt void
2046 1.126 yamt nfs_renewxid(struct nfsreq *req)
2047 1.126 yamt {
2048 1.126 yamt u_int32_t xid;
2049 1.126 yamt int off;
2050 1.126 yamt
2051 1.126 yamt xid = nfs_getxid();
2052 1.126 yamt if (req->r_nmp->nm_sotype == SOCK_STREAM)
2053 1.126 yamt off = sizeof(u_int32_t); /* RPC record mark */
2054 1.126 yamt else
2055 1.126 yamt off = 0;
2056 1.126 yamt
2057 1.126 yamt m_copyback(req->r_mreq, off, sizeof(xid), (void *)&xid);
2058 1.126 yamt req->r_xid = xid;
2059 1.1 cgd }
2060