ops_nfs.c revision 1.1.1.1 1 /* $NetBSD: ops_nfs.c,v 1.1.1.1 2008/09/19 20:07:16 christos Exp $ */
2
3 /*
4 * Copyright (c) 1997-2007 Erez Zadok
5 * Copyright (c) 1990 Jan-Simon Pendry
6 * Copyright (c) 1990 Imperial College of Science, Technology & Medicine
7 * Copyright (c) 1990 The Regents of the University of California.
8 * All rights reserved.
9 *
10 * This code is derived from software contributed to Berkeley by
11 * Jan-Simon Pendry at Imperial College, London.
12 *
13 * Redistribution and use in source and binary forms, with or without
14 * modification, are permitted provided that the following conditions
15 * are met:
16 * 1. Redistributions of source code must retain the above copyright
17 * notice, this list of conditions and the following disclaimer.
18 * 2. Redistributions in binary form must reproduce the above copyright
19 * notice, this list of conditions and the following disclaimer in the
20 * documentation and/or other materials provided with the distribution.
21 * 3. All advertising materials mentioning features or use of this software
22 * must display the following acknowledgment:
23 * This product includes software developed by the University of
24 * California, Berkeley and its contributors.
25 * 4. Neither the name of the University nor the names of its contributors
26 * may be used to endorse or promote products derived from this software
27 * without specific prior written permission.
28 *
29 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
30 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
31 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
32 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
33 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
34 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
35 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
36 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
37 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
38 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
39 * SUCH DAMAGE.
40 *
41 *
42 * File: am-utils/amd/ops_nfs.c
43 *
44 */
45
46 /*
47 * Network file system
48 */
49
50 #ifdef HAVE_CONFIG_H
51 # include <config.h>
52 #endif /* HAVE_CONFIG_H */
53 #include <am_defs.h>
54 #include <amd.h>
55
56 /*
57 * Convert from nfsstat to UN*X error code
58 */
59 #define unx_error(e) ((int)(e))
60
61 /*
62 * FH_TTL is the time a file handle will remain in the cache since
63 * last being used. If the file handle becomes invalid, then it
64 * will be flushed anyway.
65 */
66 #define FH_TTL (5 * 60) /* five minutes */
67 #define FH_TTL_ERROR (30) /* 30 seconds */
68 #define FHID_ALLOC() (++fh_id)
69
70 /*
71 * The NFS layer maintains a cache of file handles.
72 * This is *fundamental* to the implementation and
73 * also allows quick remounting when a filesystem
74 * is accessed soon after timing out.
75 *
76 * The NFS server layer knows to flush this cache
77 * when a server goes down so avoiding stale handles.
78 *
79 * Each cache entry keeps a hard reference to
80 * the corresponding server. This ensures that
81 * the server keepalive information is maintained.
82 *
83 * The copy of the sockaddr_in here is taken so
84 * that the port can be twiddled to talk to mountd
85 * instead of portmap or the NFS server as used
86 * elsewhere.
87 * The port# is flushed if a server goes down.
88 * The IP address is never flushed - we assume
89 * that the address of a mounted machine never
90 * changes. If it does, then you have other
91 * problems...
92 */
93 typedef struct fh_cache fh_cache;
94 struct fh_cache {
95 qelem fh_q; /* List header */
96 wchan_t fh_wchan; /* Wait channel */
97 int fh_error; /* Valid data? */
98 int fh_id; /* Unique id */
99 int fh_cid; /* Callout id */
100 u_long fh_nfs_version; /* highest NFS version on host */
101 am_nfs_handle_t fh_nfs_handle; /* Handle on filesystem */
102 int fh_status; /* Status of last rpc */
103 struct sockaddr_in fh_sin; /* Address of mountd */
104 fserver *fh_fs; /* Server holding filesystem */
105 char *fh_path; /* Filesystem on host */
106 };
107
108 /* forward definitions */
109 static int nfs_init(mntfs *mf);
110 static char *nfs_match(am_opts *fo);
111 static int nfs_mount(am_node *am, mntfs *mf);
112 static int nfs_umount(am_node *am, mntfs *mf);
113 static void nfs_umounted(mntfs *mf);
114 static int call_mountd(fh_cache *fp, u_long proc, fwd_fun f, wchan_t wchan);
115 static int webnfs_lookup(fh_cache *fp, fwd_fun f, wchan_t wchan);
116 static int fh_id = 0;
117
118 /* globals */
119 AUTH *nfs_auth;
120 qelem fh_head = {&fh_head, &fh_head};
121
122 /*
123 * Network file system operations
124 */
125 am_ops nfs_ops =
126 {
127 "nfs",
128 nfs_match,
129 nfs_init,
130 nfs_mount,
131 nfs_umount,
132 amfs_error_lookup_child,
133 amfs_error_mount_child,
134 amfs_error_readdir,
135 0, /* nfs_readlink */
136 0, /* nfs_mounted */
137 nfs_umounted,
138 find_nfs_srvr,
139 0, /* nfs_get_wchan */
140 FS_MKMNT | FS_BACKGROUND | FS_AMQINFO, /* nfs_fs_flags */
141 #ifdef HAVE_FS_AUTOFS
142 AUTOFS_NFS_FS_FLAGS,
143 #endif /* HAVE_FS_AUTOFS */
144 };
145
146
147 static fh_cache *
148 find_nfs_fhandle_cache(opaque_t arg, int done)
149 {
150 fh_cache *fp, *fp2 = NULL;
151 int id = (long) arg; /* for 64-bit archs */
152
153 ITER(fp, fh_cache, &fh_head) {
154 if (fp->fh_id == id) {
155 fp2 = fp;
156 break;
157 }
158 }
159
160 if (fp2) {
161 dlog("fh cache gives fp %#lx, fs %s", (unsigned long) fp2, fp2->fh_path);
162 } else {
163 dlog("fh cache search failed");
164 }
165
166 if (fp2 && !done) {
167 fp2->fh_error = ETIMEDOUT;
168 return 0;
169 }
170
171 return fp2;
172 }
173
174
175 /*
176 * Called when a filehandle appears via the mount protocol
177 */
178 static void
179 got_nfs_fh_mount(voidp pkt, int len, struct sockaddr_in *sa, struct sockaddr_in *ia, opaque_t arg, int done)
180 {
181 fh_cache *fp;
182 struct fhstatus res;
183 #ifdef HAVE_FS_NFS3
184 struct am_mountres3 res3;
185 #endif /* HAVE_FS_NFS3 */
186
187 fp = find_nfs_fhandle_cache(arg, done);
188 if (!fp)
189 return;
190
191 /*
192 * retrieve the correct RPC reply for the file handle, based on the
193 * NFS protocol version.
194 */
195 #ifdef HAVE_FS_NFS3
196 if (fp->fh_nfs_version == NFS_VERSION3) {
197 memset(&res3, 0, sizeof(res3));
198 fp->fh_error = pickup_rpc_reply(pkt, len, (voidp) &res3,
199 (XDRPROC_T_TYPE) xdr_am_mountres3);
200 fp->fh_status = unx_error(res3.fhs_status);
201 memset(&fp->fh_nfs_handle.v3, 0, sizeof(am_nfs_fh3));
202 fp->fh_nfs_handle.v3.am_fh3_length = res3.mountres3_u.mountinfo.fhandle.fhandle3_len;
203 memmove(fp->fh_nfs_handle.v3.am_fh3_data,
204 res3.mountres3_u.mountinfo.fhandle.fhandle3_val,
205 fp->fh_nfs_handle.v3.am_fh3_length);
206 } else {
207 #endif /* HAVE_FS_NFS3 */
208 memset(&res, 0, sizeof(res));
209 fp->fh_error = pickup_rpc_reply(pkt, len, (voidp) &res,
210 (XDRPROC_T_TYPE) xdr_fhstatus);
211 fp->fh_status = unx_error(res.fhs_status);
212 memmove(&fp->fh_nfs_handle.v2, &res.fhs_fh, NFS_FHSIZE);
213 #ifdef HAVE_FS_NFS3
214 }
215 #endif /* HAVE_FS_NFS3 */
216
217 if (!fp->fh_error) {
218 dlog("got filehandle for %s:%s", fp->fh_fs->fs_host, fp->fh_path);
219 } else {
220 plog(XLOG_USER, "filehandle denied for %s:%s", fp->fh_fs->fs_host, fp->fh_path);
221 /*
222 * Force the error to be EACCES. It's debatable whether it should be
223 * ENOENT instead, but the server really doesn't give us any clues, and
224 * EACCES is more in line with the "filehandle denied" message.
225 */
226 fp->fh_error = EACCES;
227 }
228
229 /*
230 * Wakeup anything sleeping on this filehandle
231 */
232 if (fp->fh_wchan) {
233 dlog("Calling wakeup on %#lx", (unsigned long) fp->fh_wchan);
234 wakeup(fp->fh_wchan);
235 }
236 }
237
238
239 /*
240 * Called when a filehandle appears via WebNFS
241 */
242 static void
243 got_nfs_fh_webnfs(voidp pkt, int len, struct sockaddr_in *sa, struct sockaddr_in *ia, opaque_t arg, int done)
244 {
245 fh_cache *fp;
246 nfsdiropres res;
247 #ifdef HAVE_FS_NFS3
248 am_LOOKUP3res res3;
249 #endif /* HAVE_FS_NFS3 */
250
251 fp = find_nfs_fhandle_cache(arg, done);
252 if (!fp)
253 return;
254
255 /*
256 * retrieve the correct RPC reply for the file handle, based on the
257 * NFS protocol version.
258 */
259 #ifdef HAVE_FS_NFS3
260 if (fp->fh_nfs_version == NFS_VERSION3) {
261 memset(&res3, 0, sizeof(res3));
262 fp->fh_error = pickup_rpc_reply(pkt, len, (voidp) &res3,
263 (XDRPROC_T_TYPE) xdr_am_LOOKUP3res);
264 fp->fh_status = unx_error(res3.status);
265 memset(&fp->fh_nfs_handle.v3, 0, sizeof(am_nfs_fh3));
266 fp->fh_nfs_handle.v3.am_fh3_length = res3.res_u.ok.object.am_fh3_length;
267 memmove(fp->fh_nfs_handle.v3.am_fh3_data,
268 res3.res_u.ok.object.am_fh3_data,
269 fp->fh_nfs_handle.v3.am_fh3_length);
270 } else {
271 #endif /* HAVE_FS_NFS3 */
272 memset(&res, 0, sizeof(res));
273 fp->fh_error = pickup_rpc_reply(pkt, len, (voidp) &res,
274 (XDRPROC_T_TYPE) xdr_diropres);
275 fp->fh_status = unx_error(res.dr_status);
276 memmove(&fp->fh_nfs_handle.v2, &res.dr_u.dr_drok_u.drok_fhandle, NFS_FHSIZE);
277 #ifdef HAVE_FS_NFS3
278 }
279 #endif /* HAVE_FS_NFS3 */
280
281 if (!fp->fh_error) {
282 dlog("got filehandle for %s:%s", fp->fh_fs->fs_host, fp->fh_path);
283 } else {
284 plog(XLOG_USER, "filehandle denied for %s:%s", fp->fh_fs->fs_host, fp->fh_path);
285 /*
286 * Force the error to be EACCES. It's debatable whether it should be
287 * ENOENT instead, but the server really doesn't give us any clues, and
288 * EACCES is more in line with the "filehandle denied" message.
289 */
290 fp->fh_error = EACCES;
291 }
292
293 /*
294 * Wakeup anything sleeping on this filehandle
295 */
296 if (fp->fh_wchan) {
297 dlog("Calling wakeup on %#lx", (unsigned long) fp->fh_wchan);
298 wakeup(fp->fh_wchan);
299 }
300 }
301
302
303 void
304 flush_nfs_fhandle_cache(fserver *fs)
305 {
306 fh_cache *fp;
307
308 ITER(fp, fh_cache, &fh_head) {
309 if (fp->fh_fs == fs || fs == NULL) {
310 /*
311 * Only invalidate port info for non-WebNFS servers
312 */
313 if (!(fp->fh_fs->fs_flags & FSF_WEBNFS))
314 fp->fh_sin.sin_port = (u_short) 0;
315 fp->fh_error = -1;
316 }
317 }
318 }
319
320
321 static void
322 discard_fh(opaque_t arg)
323 {
324 fh_cache *fp = (fh_cache *) arg;
325
326 rem_que(&fp->fh_q);
327 if (fp->fh_fs) {
328 dlog("Discarding filehandle for %s:%s", fp->fh_fs->fs_host, fp->fh_path);
329 free_srvr(fp->fh_fs);
330 }
331 if (fp->fh_path)
332 XFREE(fp->fh_path);
333 XFREE(fp);
334 }
335
336
337 /*
338 * Determine the file handle for a node
339 */
340 static int
341 prime_nfs_fhandle_cache(char *path, fserver *fs, am_nfs_handle_t *fhbuf, mntfs *mf)
342 {
343 fh_cache *fp, *fp_save = NULL;
344 int error;
345 int reuse_id = FALSE;
346
347 dlog("Searching cache for %s:%s", fs->fs_host, path);
348
349 /*
350 * First search the cache
351 */
352 ITER(fp, fh_cache, &fh_head) {
353 if (fs != fp->fh_fs || !STREQ(path, fp->fh_path))
354 continue; /* skip to next ITER item */
355 /* else we got a match */
356 switch (fp->fh_error) {
357 case 0:
358 plog(XLOG_INFO, "prime_nfs_fhandle_cache: NFS version %d", (int) fp->fh_nfs_version);
359
360 error = fp->fh_error = fp->fh_status;
361
362 if (error == 0) {
363 if (mf->mf_flags & MFF_NFS_SCALEDOWN) {
364 fp_save = fp;
365 /* XXX: why reuse the ID? */
366 reuse_id = TRUE;
367 break;
368 }
369
370 if (fhbuf) {
371 #ifdef HAVE_FS_NFS3
372 if (fp->fh_nfs_version == NFS_VERSION3) {
373 memmove((voidp) &(fhbuf->v3), (voidp) &(fp->fh_nfs_handle.v3),
374 sizeof(fp->fh_nfs_handle.v3));
375 } else
376 #endif /* HAVE_FS_NFS3 */
377 {
378 memmove((voidp) &(fhbuf->v2), (voidp) &(fp->fh_nfs_handle.v2),
379 sizeof(fp->fh_nfs_handle.v2));
380 }
381 }
382 if (fp->fh_cid)
383 untimeout(fp->fh_cid);
384 fp->fh_cid = timeout(FH_TTL, discard_fh, (opaque_t) fp);
385 } else if (error == EACCES) {
386 /*
387 * Now decode the file handle return code.
388 */
389 plog(XLOG_INFO, "Filehandle denied for \"%s:%s\"",
390 fs->fs_host, path);
391 } else {
392 errno = error; /* XXX */
393 plog(XLOG_INFO, "Filehandle error for \"%s:%s\": %m",
394 fs->fs_host, path);
395 }
396
397 /*
398 * The error was returned from the remote mount daemon.
399 * Policy: this error will be cached for now...
400 */
401 return error;
402
403 case -1:
404 /*
405 * Still thinking about it, but we can re-use.
406 */
407 fp_save = fp;
408 reuse_id = TRUE;
409 break;
410
411 default:
412 /*
413 * Return the error.
414 * Policy: make sure we recompute if required again
415 * in case this was caused by a network failure.
416 * This can thrash mountd's though... If you find
417 * your mountd going slowly then:
418 * 1. Add a fork() loop to main.
419 * 2. Remove the call to innetgr() and don't use
420 * netgroups, especially if you don't use YP.
421 */
422 error = fp->fh_error;
423 fp->fh_error = -1;
424 return error;
425 } /* end of switch statement */
426 } /* end of ITER loop */
427
428 /*
429 * Not in cache
430 */
431 if (fp_save) {
432 fp = fp_save;
433 /*
434 * Re-use existing slot
435 */
436 untimeout(fp->fh_cid);
437 free_srvr(fp->fh_fs);
438 XFREE(fp->fh_path);
439 } else {
440 fp = ALLOC(struct fh_cache);
441 memset((voidp) fp, 0, sizeof(struct fh_cache));
442 ins_que(&fp->fh_q, &fh_head);
443 }
444 if (!reuse_id)
445 fp->fh_id = FHID_ALLOC();
446 fp->fh_wchan = get_mntfs_wchan(mf);
447 fp->fh_error = -1;
448 fp->fh_cid = timeout(FH_TTL, discard_fh, (opaque_t) fp);
449
450 /*
451 * If fs->fs_ip is null, remote server is probably down.
452 */
453 if (!fs->fs_ip) {
454 /* Mark the fileserver down and invalid again */
455 fs->fs_flags &= ~FSF_VALID;
456 fs->fs_flags |= FSF_DOWN;
457 error = AM_ERRNO_HOST_DOWN;
458 return error;
459 }
460
461 /*
462 * Either fp has been freshly allocated or the address has changed.
463 * Initialize address and nfs version. Don't try to re-use the port
464 * information unless using WebNFS where the port is fixed either by
465 * the spec or the "port" mount option.
466 */
467 if (fp->fh_sin.sin_addr.s_addr != fs->fs_ip->sin_addr.s_addr) {
468 fp->fh_sin = *fs->fs_ip;
469 if (!(mf->mf_flags & MFF_WEBNFS))
470 fp->fh_sin.sin_port = 0;
471 fp->fh_nfs_version = fs->fs_version;
472 }
473
474 fp->fh_fs = dup_srvr(fs);
475 fp->fh_path = strdup(path);
476
477 if (mf->mf_flags & MFF_WEBNFS)
478 error = webnfs_lookup(fp, got_nfs_fh_webnfs, get_mntfs_wchan(mf));
479 else
480 error = call_mountd(fp, MOUNTPROC_MNT, got_nfs_fh_mount, get_mntfs_wchan(mf));
481 if (error) {
482 /*
483 * Local error - cache for a short period
484 * just to prevent thrashing.
485 */
486 untimeout(fp->fh_cid);
487 fp->fh_cid = timeout(error < 0 ? 2 * ALLOWED_MOUNT_TIME : FH_TTL_ERROR,
488 discard_fh, (opaque_t) fp);
489 fp->fh_error = error;
490 } else {
491 error = fp->fh_error;
492 }
493
494 return error;
495 }
496
497
498 int
499 make_nfs_auth(void)
500 {
501 AUTH_CREATE_GIDLIST_TYPE group_wheel = 0;
502
503 /* Some NFS mounts (particularly cross-domain) require FQDNs to succeed */
504
505 #ifdef HAVE_TRANSPORT_TYPE_TLI
506 if (gopt.flags & CFM_FULLY_QUALIFIED_HOSTS) {
507 plog(XLOG_INFO, "Using NFS auth for FQHN \"%s\"", hostd);
508 nfs_auth = authsys_create(hostd, 0, 0, 1, &group_wheel);
509 } else {
510 nfs_auth = authsys_create_default();
511 }
512 #else /* not HAVE_TRANSPORT_TYPE_TLI */
513 if (gopt.flags & CFM_FULLY_QUALIFIED_HOSTS) {
514 plog(XLOG_INFO, "Using NFS auth for FQHN \"%s\"", hostd);
515 nfs_auth = authunix_create(hostd, 0, 0, 1, &group_wheel);
516 } else {
517 nfs_auth = authunix_create_default();
518 }
519 #endif /* not HAVE_TRANSPORT_TYPE_TLI */
520
521 if (!nfs_auth)
522 return ENOBUFS;
523
524 return 0;
525 }
526
527
528 static int
529 call_mountd(fh_cache *fp, u_long proc, fwd_fun fun, wchan_t wchan)
530 {
531 struct rpc_msg mnt_msg;
532 int len;
533 char iobuf[UDPMSGSIZE];
534 int error;
535 u_long mnt_version;
536
537 if (!nfs_auth) {
538 error = make_nfs_auth();
539 if (error)
540 return error;
541 }
542
543 if (fp->fh_sin.sin_port == 0) {
544 u_short mountd_port;
545 error = get_mountd_port(fp->fh_fs, &mountd_port, wchan);
546 if (error)
547 return error;
548 fp->fh_sin.sin_port = mountd_port;
549 }
550
551 /* find the right version of the mount protocol */
552 #ifdef HAVE_FS_NFS3
553 if (fp->fh_nfs_version == NFS_VERSION3)
554 mnt_version = AM_MOUNTVERS3;
555 else
556 #endif /* HAVE_FS_NFS3 */
557 mnt_version = MOUNTVERS;
558 plog(XLOG_INFO, "call_mountd: NFS version %d, mount version %d",
559 (int) fp->fh_nfs_version, (int) mnt_version);
560
561 rpc_msg_init(&mnt_msg, MOUNTPROG, mnt_version, MOUNTPROC_NULL);
562 len = make_rpc_packet(iobuf,
563 sizeof(iobuf),
564 proc,
565 &mnt_msg,
566 (voidp) &fp->fh_path,
567 (XDRPROC_T_TYPE) xdr_nfspath,
568 nfs_auth);
569
570 if (len > 0) {
571 error = fwd_packet(MK_RPC_XID(RPC_XID_MOUNTD, fp->fh_id),
572 iobuf,
573 len,
574 &fp->fh_sin,
575 &fp->fh_sin,
576 (opaque_t) ((long) fp->fh_id), /* cast to long needed for 64-bit archs */
577 fun);
578 } else {
579 error = -len;
580 }
581
582 /*
583 * It may be the case that we're sending to the wrong MOUNTD port. This
584 * occurs if mountd is restarted on the server after the port has been
585 * looked up and stored in the filehandle cache somewhere. The correct
586 * solution, if we're going to cache port numbers is to catch the ICMP
587 * port unreachable reply from the server and cause the portmap request
588 * to be redone. The quick solution here is to invalidate the MOUNTD
589 * port.
590 */
591 fp->fh_sin.sin_port = 0;
592
593 return error;
594 }
595
596
597 static int
598 webnfs_lookup(fh_cache *fp, fwd_fun fun, wchan_t wchan)
599 {
600 struct rpc_msg wnfs_msg;
601 int len;
602 char iobuf[UDPMSGSIZE];
603 int error;
604 u_long proc;
605 XDRPROC_T_TYPE xdr_fn;
606 voidp argp;
607 nfsdiropargs args;
608 #ifdef HAVE_FS_NFS3
609 am_LOOKUP3args args3;
610 #endif /* HAVE_FS_NFS3 */
611 char *wnfs_path;
612 size_t l;
613
614 if (!nfs_auth) {
615 error = make_nfs_auth();
616 if (error)
617 return error;
618 }
619
620 if (fp->fh_sin.sin_port == 0) {
621 /* FIXME: wrong, don't discard sin_port in the first place for WebNFS. */
622 plog(XLOG_WARNING, "webnfs_lookup: port == 0 for nfs on %s, fixed",
623 fp->fh_fs->fs_host);
624 fp->fh_sin.sin_port = htons(NFS_PORT);
625 }
626
627 /*
628 * Use native path like the rest of amd (cf. RFC 2054, 6.1).
629 */
630 l = strlen(fp->fh_path) + 2;
631 wnfs_path = (char *) xmalloc(l);
632 wnfs_path[0] = 0x80;
633 xstrlcpy(wnfs_path + 1, fp->fh_path, l - 1);
634
635 /* find the right program and lookup procedure */
636 #ifdef HAVE_FS_NFS3
637 if (fp->fh_nfs_version == NFS_VERSION3) {
638 proc = AM_NFSPROC3_LOOKUP;
639 xdr_fn = (XDRPROC_T_TYPE) xdr_am_LOOKUP3args;
640 argp = &args3;
641 /* WebNFS public file handle */
642 args3.what.dir.am_fh3_length = 0;
643 args3.what.name = wnfs_path;
644 } else {
645 #endif /* HAVE_FS_NFS3 */
646 proc = NFSPROC_LOOKUP;
647 xdr_fn = (XDRPROC_T_TYPE) xdr_diropargs;
648 argp = &args;
649 /* WebNFS public file handle */
650 memset(&args.da_fhandle, 0, NFS_FHSIZE);
651 args.da_name = wnfs_path;
652 #ifdef HAVE_FS_NFS3
653 }
654 #endif /* HAVE_FS_NFS3 */
655
656 plog(XLOG_INFO, "webnfs_lookup: NFS version %d", (int) fp->fh_nfs_version);
657
658 rpc_msg_init(&wnfs_msg, NFS_PROGRAM, fp->fh_nfs_version, proc);
659 len = make_rpc_packet(iobuf,
660 sizeof(iobuf),
661 proc,
662 &wnfs_msg,
663 argp,
664 (XDRPROC_T_TYPE) xdr_fn,
665 nfs_auth);
666
667 if (len > 0) {
668 error = fwd_packet(MK_RPC_XID(RPC_XID_WEBNFS, fp->fh_id),
669 iobuf,
670 len,
671 &fp->fh_sin,
672 &fp->fh_sin,
673 (opaque_t) ((long) fp->fh_id), /* cast to long needed for 64-bit archs */
674 fun);
675 } else {
676 error = -len;
677 }
678
679 XFREE(wnfs_path);
680 return error;
681 }
682
683
684 /*
685 * NFS needs the local filesystem, remote filesystem
686 * remote hostname.
687 * Local filesystem defaults to remote and vice-versa.
688 */
689 static char *
690 nfs_match(am_opts *fo)
691 {
692 char *xmtab;
693 size_t l;
694
695 if (fo->opt_fs && !fo->opt_rfs)
696 fo->opt_rfs = fo->opt_fs;
697 if (!fo->opt_rfs) {
698 plog(XLOG_USER, "nfs: no remote filesystem specified");
699 return NULL;
700 }
701 if (!fo->opt_rhost) {
702 plog(XLOG_USER, "nfs: no remote host specified");
703 return NULL;
704 }
705
706 /*
707 * Determine magic cookie to put in mtab
708 */
709 l = strlen(fo->opt_rhost) + strlen(fo->opt_rfs) + 2;
710 xmtab = (char *) xmalloc(l);
711 xsnprintf(xmtab, l, "%s:%s", fo->opt_rhost, fo->opt_rfs);
712 dlog("NFS: mounting remote server \"%s\", remote fs \"%s\" on \"%s\"",
713 fo->opt_rhost, fo->opt_rfs, fo->opt_fs);
714
715 return xmtab;
716 }
717
718
719 /*
720 * Initialize am structure for nfs
721 */
722 static int
723 nfs_init(mntfs *mf)
724 {
725 int error;
726 am_nfs_handle_t fhs;
727 char *colon;
728
729 if (mf->mf_private) {
730 if (mf->mf_flags & MFF_NFS_SCALEDOWN) {
731 fserver *fs;
732
733 /* tell remote mountd that we're done with this filehandle */
734 mf->mf_ops->umounted(mf);
735
736 mf->mf_prfree(mf->mf_private);
737 fs = mf->mf_ops->ffserver(mf);
738 free_srvr(mf->mf_server);
739 mf->mf_server = fs;
740 } else
741 return 0;
742 }
743
744 colon = strchr(mf->mf_info, ':');
745 if (colon == 0)
746 return ENOENT;
747
748 error = prime_nfs_fhandle_cache(colon + 1, mf->mf_server, &fhs, mf);
749 if (!error) {
750 mf->mf_private = (opaque_t) ALLOC(am_nfs_handle_t);
751 mf->mf_prfree = (void (*)(opaque_t)) free;
752 memmove(mf->mf_private, (voidp) &fhs, sizeof(fhs));
753 }
754 return error;
755 }
756
757
758 int
759 mount_nfs_fh(am_nfs_handle_t *fhp, char *mntdir, char *fs_name, mntfs *mf)
760 {
761 MTYPE_TYPE type;
762 char *colon;
763 char *xopts=NULL, transp_timeo_opts[40], transp_retrans_opts[40];
764 char host[MAXHOSTNAMELEN + MAXPATHLEN + 2];
765 fserver *fs = mf->mf_server;
766 u_long nfs_version = fs->fs_version;
767 char *nfs_proto = fs->fs_proto; /* "tcp" or "udp" */
768 int on_autofs = mf->mf_flags & MFF_ON_AUTOFS;
769 int error;
770 int genflags;
771 int retry;
772 int proto = AMU_TYPE_NONE;
773 mntent_t mnt;
774 nfs_args_t nfs_args;
775
776 /*
777 * Extract HOST name to give to kernel.
778 * Some systems like osf1/aix3/bsd44 variants may need old code
779 * for NFS_ARGS_NEEDS_PATH.
780 */
781 if (!(colon = strchr(fs_name, ':')))
782 return ENOENT;
783 #ifdef MOUNT_TABLE_ON_FILE
784 *colon = '\0';
785 #endif /* MOUNT_TABLE_ON_FILE */
786 xstrlcpy(host, fs_name, sizeof(host));
787 #ifdef MOUNT_TABLE_ON_FILE
788 *colon = ':';
789 #endif /* MOUNT_TABLE_ON_FILE */
790 #ifdef MAXHOSTNAMELEN
791 /* most kernels have a name length restriction */
792 if (strlen(host) >= MAXHOSTNAMELEN)
793 xstrlcpy(host + MAXHOSTNAMELEN - 3, "..",
794 sizeof(host) - MAXHOSTNAMELEN + 3);
795 #endif /* MAXHOSTNAMELEN */
796
797 /*
798 * Create option=VAL for udp/tcp specific timeouts and retrans values, but
799 * only if these options were specified.
800 */
801
802 transp_timeo_opts[0] = transp_retrans_opts[0] = '\0'; /* initialize */
803 if (STREQ(nfs_proto, "udp"))
804 proto = AMU_TYPE_UDP;
805 else if (STREQ(nfs_proto, "tcp"))
806 proto = AMU_TYPE_TCP;
807 if (proto != AMU_TYPE_NONE) {
808 if (gopt.amfs_auto_timeo[proto] > 0)
809 xsnprintf(transp_timeo_opts, sizeof(transp_timeo_opts), "%s=%d,",
810 MNTTAB_OPT_TIMEO, gopt.amfs_auto_timeo[proto]);
811 if (gopt.amfs_auto_retrans[proto] > 0)
812 xsnprintf(transp_retrans_opts, sizeof(transp_retrans_opts), "%s=%d,",
813 MNTTAB_OPT_RETRANS, gopt.amfs_auto_retrans[proto]);
814 }
815
816 if (mf->mf_remopts && *mf->mf_remopts &&
817 !islocalnet(fs->fs_ip->sin_addr.s_addr)) {
818 plog(XLOG_INFO, "Using remopts=\"%s\"", mf->mf_remopts);
819 /* use transp_opts first, so map-specific opts will override */
820 xopts = str3cat(xopts, transp_timeo_opts, transp_retrans_opts, mf->mf_remopts);
821 } else {
822 /* use transp_opts first, so map-specific opts will override */
823 xopts = str3cat(xopts, transp_timeo_opts, transp_retrans_opts, mf->mf_mopts);
824 }
825
826 memset((voidp) &mnt, 0, sizeof(mnt));
827 mnt.mnt_dir = mntdir;
828 mnt.mnt_fsname = fs_name;
829 mnt.mnt_opts = xopts;
830
831 /*
832 * Set mount types accordingly
833 */
834 #ifndef HAVE_FS_NFS3
835 type = MOUNT_TYPE_NFS;
836 mnt.mnt_type = MNTTAB_TYPE_NFS;
837 #else /* HAVE_FS_NFS3 */
838 if (nfs_version == NFS_VERSION3) {
839 type = MOUNT_TYPE_NFS3;
840 /*
841 * Systems that include the mount table "vers" option generally do not
842 * set the mnttab entry to "nfs3", but to "nfs" and then they set
843 * "vers=3". Setting it to "nfs3" works, but it may break some things
844 * like "df -t nfs" and the "quota" program (esp. on Solaris and Irix).
845 * So on those systems, set it to "nfs".
846 * Note: MNTTAB_OPT_VERS is always set for NFS3 (see am_compat.h).
847 */
848 # if defined(MNTTAB_OPT_VERS) && defined(MOUNT_TABLE_ON_FILE)
849 mnt.mnt_type = MNTTAB_TYPE_NFS;
850 # else /* defined(MNTTAB_OPT_VERS) && defined(MOUNT_TABLE_ON_FILE) */
851 mnt.mnt_type = MNTTAB_TYPE_NFS3;
852 # endif /* defined(MNTTAB_OPT_VERS) && defined(MOUNT_TABLE_ON_FILE) */
853 } else {
854 type = MOUNT_TYPE_NFS;
855 mnt.mnt_type = MNTTAB_TYPE_NFS;
856 }
857 #endif /* HAVE_FS_NFS3 */
858 plog(XLOG_INFO, "mount_nfs_fh: NFS version %d", (int) nfs_version);
859 plog(XLOG_INFO, "mount_nfs_fh: using NFS transport %s", nfs_proto);
860
861 retry = hasmntval(&mnt, MNTTAB_OPT_RETRY);
862 if (retry <= 0)
863 retry = 1; /* XXX */
864
865 genflags = compute_mount_flags(&mnt);
866 #ifdef HAVE_FS_AUTOFS
867 if (on_autofs)
868 genflags |= autofs_compute_mount_flags(&mnt);
869 #endif /* HAVE_FS_AUTOFS */
870
871 /* setup the many fields and flags within nfs_args */
872 compute_nfs_args(&nfs_args,
873 &mnt,
874 genflags,
875 NULL, /* struct netconfig *nfsncp */
876 fs->fs_ip,
877 nfs_version,
878 nfs_proto,
879 fhp,
880 host,
881 fs_name);
882
883 /* finally call the mounting function */
884 if (amuDebug(D_TRACE)) {
885 print_nfs_args(&nfs_args, nfs_version);
886 plog(XLOG_DEBUG, "Generic mount flags 0x%x used for NFS mount", genflags);
887 }
888 error = mount_fs(&mnt, genflags, (caddr_t) &nfs_args, retry, type,
889 nfs_version, nfs_proto, mnttab_file_name, on_autofs);
890 XFREE(xopts);
891
892 #ifdef HAVE_TRANSPORT_TYPE_TLI
893 free_knetconfig(nfs_args.knconf);
894 if (nfs_args.addr)
895 XFREE(nfs_args.addr); /* allocated in compute_nfs_args() */
896 #endif /* HAVE_TRANSPORT_TYPE_TLI */
897
898 return error;
899 }
900
901
902 static int
903 nfs_mount(am_node *am, mntfs *mf)
904 {
905 int error = 0;
906 mntent_t mnt;
907
908 if (!mf->mf_private) {
909 plog(XLOG_ERROR, "Missing filehandle for %s", mf->mf_info);
910 return EINVAL;
911 }
912
913 mnt.mnt_opts = mf->mf_mopts;
914 if (amu_hasmntopt(&mnt, "softlookup") ||
915 (amu_hasmntopt(&mnt, "soft") && !amu_hasmntopt(&mnt, "nosoftlookup")))
916 am->am_flags |= AMF_SOFTLOOKUP;
917
918 error = mount_nfs_fh((am_nfs_handle_t *) mf->mf_private,
919 mf->mf_mount,
920 mf->mf_info,
921 mf);
922
923 if (error) {
924 errno = error;
925 dlog("mount_nfs: %m");
926 }
927
928 return error;
929 }
930
931
932 static int
933 nfs_umount(am_node *am, mntfs *mf)
934 {
935 int unmount_flags, new_unmount_flags, error;
936
937 unmount_flags = (mf->mf_flags & MFF_ON_AUTOFS) ? AMU_UMOUNT_AUTOFS : 0;
938 error = UMOUNT_FS(mf->mf_mount, mnttab_file_name, unmount_flags);
939
940 #if defined(HAVE_UMOUNT2) && (defined(MNT2_GEN_OPT_FORCE) || defined(MNT2_GEN_OPT_DETACH))
941 /*
942 * If the attempt to unmount failed with EBUSY, and this fserver was
943 * marked for forced unmounts, then use forced/lazy unmounts.
944 */
945 if (error == EBUSY &&
946 gopt.flags & CFM_FORCED_UNMOUNTS &&
947 mf->mf_server->fs_flags & FSF_FORCE_UNMOUNT) {
948 plog(XLOG_INFO, "EZK: nfs_umount: trying forced/lazy unmounts");
949 /*
950 * XXX: turning off the FSF_FORCE_UNMOUNT may not be perfectly
951 * incorrect. Multiple nodes may need to be timed out and restarted for
952 * a single hung fserver.
953 */
954 mf->mf_server->fs_flags &= ~FSF_FORCE_UNMOUNT;
955 new_unmount_flags = unmount_flags | AMU_UMOUNT_FORCE | AMU_UMOUNT_DETACH;
956 error = UMOUNT_FS(mf->mf_mount, mnttab_file_name, new_unmount_flags);
957 }
958 #endif /* HAVE_UMOUNT2 && (MNT2_GEN_OPT_FORCE || MNT2_GEN_OPT_DETACH) */
959
960 /*
961 * Here is some code to unmount 'restarted' file systems.
962 * The restarted file systems are marked as 'nfs', not
963 * 'host', so we only have the map information for the
964 * the top-level mount. The unmount will fail (EBUSY)
965 * if there are anything else from the NFS server mounted
966 * below the mount-point. This code checks to see if there
967 * is anything mounted with the same prefix as the
968 * file system to be unmounted ("/a/b/c" when unmounting "/a/b").
969 * If there is, and it is a 'restarted' file system, we unmount
970 * it.
971 * Added by Mike Mitchell, mcm (at) unx.sas.com, 09/08/93
972 */
973 if (error == EBUSY) {
974 mntfs *new_mf;
975 int len = strlen(mf->mf_mount);
976 int didsome = 0;
977
978 ITER(new_mf, mntfs, &mfhead) {
979 if (new_mf->mf_ops != mf->mf_ops ||
980 new_mf->mf_refc > 1 ||
981 mf == new_mf ||
982 ((new_mf->mf_flags & (MFF_MOUNTED | MFF_UNMOUNTING | MFF_RESTART)) == (MFF_MOUNTED | MFF_RESTART)))
983 continue;
984
985 if (NSTREQ(mf->mf_mount, new_mf->mf_mount, len) &&
986 new_mf->mf_mount[len] == '/') {
987 new_unmount_flags =
988 (new_mf->mf_flags & MFF_ON_AUTOFS) ? AMU_UMOUNT_AUTOFS : 0;
989 UMOUNT_FS(new_mf->mf_mount, mnttab_file_name, new_unmount_flags);
990 didsome = 1;
991 }
992 }
993 if (didsome)
994 error = UMOUNT_FS(mf->mf_mount, mnttab_file_name, unmount_flags);
995 }
996 if (error)
997 return error;
998
999 return 0;
1000 }
1001
1002
1003 static void
1004 nfs_umounted(mntfs *mf)
1005 {
1006 fserver *fs;
1007 char *colon, *path;
1008
1009 if (mf->mf_error || mf->mf_refc > 1)
1010 return;
1011
1012 /*
1013 * No need to inform mountd when WebNFS is in use.
1014 */
1015 if (mf->mf_flags & MFF_WEBNFS)
1016 return;
1017
1018 /*
1019 * Call the mount daemon on the server to announce that we are not using
1020 * the fs any more.
1021 *
1022 * XXX: This is *wrong*. The mountd should be called when the fhandle is
1023 * flushed from the cache, and a reference held to the cached entry while
1024 * the fs is mounted...
1025 */
1026 fs = mf->mf_server;
1027 colon = path = strchr(mf->mf_info, ':');
1028 if (fs && colon) {
1029 fh_cache f;
1030
1031 dlog("calling mountd for %s", mf->mf_info);
1032 *path++ = '\0';
1033 f.fh_path = path;
1034 f.fh_sin = *fs->fs_ip;
1035 f.fh_sin.sin_port = (u_short) 0;
1036 f.fh_nfs_version = fs->fs_version;
1037 f.fh_fs = fs;
1038 f.fh_id = 0;
1039 f.fh_error = 0;
1040 prime_nfs_fhandle_cache(colon + 1, mf->mf_server, (am_nfs_handle_t *) NULL, mf);
1041 call_mountd(&f, MOUNTPROC_UMNT, (fwd_fun *) NULL, (wchan_t) NULL);
1042 *colon = ':';
1043 }
1044 }
1045