4 * The contents of this file are subject to the terms of the
5 * Common Development and Distribution License (the "License").
6 * You may not use this file except in compliance with the License.
8 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
9 * or http://www.opensolaris.org/os/licensing.
10 * See the License for the specific language governing permissions
11 * and limitations under the License.
13 * When distributing Covered Code, include this CDDL HEADER in each
14 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
15 * If applicable, add the following below this CDDL HEADER, with the
16 * fields enclosed by brackets "[]" replaced with your own identifying
17 * information: Portions Copyright [yyyy] [name of copyright owner]
22 * Copyright (c) 1986, 2010, Oracle and/or its affiliates. All rights reserved.
24 * Copyright (c) 1983,1984,1985,1986,1987,1988,1989 AT&T.
25 * All rights reserved.
28 #include <sys/param.h>
29 #include <sys/types.h>
30 #include <sys/systm.h>
33 #include <sys/vnode.h>
34 #include <sys/pathname.h>
35 #include <sys/sysmacros.h>
37 #include <sys/mkdev.h>
38 #include <sys/mount.h>
39 #include <sys/mntent.h>
40 #include <sys/statvfs.h>
41 #include <sys/errno.h>
42 #include <sys/debug.h>
43 #include <sys/cmn_err.h>
44 #include <sys/utsname.h>
45 #include <sys/bootconf.h>
46 #include <sys/modctl.h>
48 #include <sys/flock.h>
49 #include <sys/policy.h>
51 #include <sys/class.h>
52 #include <sys/socket.h>
53 #include <sys/netconfig.h>
54 #include <sys/mntent.h>
56 #include <rpc/types.h>
61 #include <nfs/nfs_clnt.h>
62 #include <nfs/rnode.h>
63 #include <nfs/mount.h>
64 #include <nfs/nfs_acl.h>
66 #include <sys/fs_subr.h>
69 * From rpcsec module (common/rpcsec).
71 extern int sec_clnt_loadinfo(struct sec_data
*, struct sec_data
**, model_t
);
72 extern void sec_clnt_freeinfo(struct sec_data
*);
/* Helpers for the static pathconf information kept per mount. */
static int	pathconf_copyin(struct nfs_args *args, struct pathcnf *pc);
static int	pathconf_get(struct mntinfo *mi, struct nfs_args *args);
static void	pathconf_rele(struct mntinfo *mi);
79 * The order and contents of this structure must be kept in sync with that of
80 * rfsreqcnt_v2_tmpl in nfs_stats.c
82 static char *rfsnames_v2
[] = {
83 "null", "getattr", "setattr", "unused", "lookup", "readlink", "read",
84 "unused", "write", "create", "remove", "rename", "link", "symlink",
85 "mkdir", "rmdir", "readdir", "fsstat"
89 * This table maps from NFS protocol number into call type.
90 * Zero means a "Lookup" type call
91 * One means a "Read" type call
92 * Two means a "Write" type call
93 * This is used to select a default time-out.
95 static uchar_t call_type_v2
[] = {
102 * Similar table, but to determine which timer to use
103 * (only real reads and writes!)
105 static uchar_t timer_type_v2
[] = {
112 * This table maps from NFS protocol number into a call type
113 * for the semisoft mount option.
114 * Zero means do not repeat operation.
117 static uchar_t ss_call_type_v2
[] = {
124 * nfs vfs operations.
126 static int nfs_mount(vfs_t
*, vnode_t
*, struct mounta
*, cred_t
*);
127 static int nfs_unmount(vfs_t
*, int, cred_t
*);
128 static int nfs_root(vfs_t
*, vnode_t
**);
129 static int nfs_statvfs(vfs_t
*, struct statvfs64
*);
130 static int nfs_sync(vfs_t
*, short, cred_t
*);
131 static int nfs_vget(vfs_t
*, vnode_t
**, fid_t
*);
132 static int nfs_mountroot(vfs_t
*, whymountroot_t
);
133 static void nfs_freevfs(vfs_t
*);
135 static int nfsrootvp(vnode_t
**, vfs_t
*, struct servinfo
*,
136 int, cred_t
*, zone_t
*);
139 * Initialize the vfs structure
145 * Debug variable to check for rdma based
146 * transport startup and cleanup. Controlled
147 * through /etc/system. Off by default.
151 const struct vfsops nfs_vfsops
= {
152 .vfs_mount
= nfs_mount
,
153 .vfs_unmount
= nfs_unmount
,
154 .vfs_root
= nfs_root
,
155 .vfs_statvfs
= nfs_statvfs
,
156 .vfs_sync
= nfs_sync
,
157 .vfs_vget
= nfs_vget
,
158 .vfs_mountroot
= nfs_mountroot
,
159 .vfs_freevfs
= nfs_freevfs
,
/*
 * nfsinit: passes the nfs_vfsops operations vector to vfs_setfsops() for
 * file system type fstyp and keeps the result in error.  The warning
 * "nfsinit: bad fstyp" is logged through zcmn_err() against GLOBAL_ZONEID.
 * NOTE(review): the test guarding that warning, the use of name and the
 * return statements are not visible in this extract -- presumably the
 * warning is issued when vfs_setfsops() returns nonzero; confirm.
 */
163 nfsinit(int fstyp
, char *name
)
167 error
= vfs_setfsops(fstyp
, &nfs_vfsops
);
169 zcmn_err(GLOBAL_ZONEID
, CE_WARN
,
170 "nfsinit: bad fstyp");
185 nfs_free_args(struct nfs_args
*nargs
, nfs_fhandle
*fh
)
189 kmem_free(fh
, sizeof (*fh
));
191 if (nargs
->pathconf
) {
192 kmem_free(nargs
->pathconf
, sizeof (struct pathcnf
));
193 nargs
->pathconf
= NULL
;
197 if (nargs
->knconf
->knc_protofmly
)
198 kmem_free(nargs
->knconf
->knc_protofmly
, KNC_STRSIZE
);
199 if (nargs
->knconf
->knc_proto
)
200 kmem_free(nargs
->knconf
->knc_proto
, KNC_STRSIZE
);
201 kmem_free(nargs
->knconf
, sizeof (*nargs
->knconf
));
202 nargs
->knconf
= NULL
;
206 kmem_free(nargs
->fh
, strlen(nargs
->fh
) + 1);
210 if (nargs
->hostname
) {
211 kmem_free(nargs
->hostname
, strlen(nargs
->hostname
) + 1);
212 nargs
->hostname
= NULL
;
216 if (nargs
->addr
->buf
) {
217 ASSERT(nargs
->addr
->len
);
218 kmem_free(nargs
->addr
->buf
, nargs
->addr
->len
);
220 kmem_free(nargs
->addr
, sizeof (struct netbuf
));
224 if (nargs
->syncaddr
) {
225 ASSERT(nargs
->syncaddr
->len
);
226 if (nargs
->syncaddr
->buf
) {
227 ASSERT(nargs
->syncaddr
->len
);
228 kmem_free(nargs
->syncaddr
->buf
, nargs
->syncaddr
->len
);
230 kmem_free(nargs
->syncaddr
, sizeof (struct netbuf
));
231 nargs
->syncaddr
= NULL
;
234 if (nargs
->netname
) {
235 kmem_free(nargs
->netname
, strlen(nargs
->netname
) + 1);
236 nargs
->netname
= NULL
;
239 if (nargs
->nfs_ext_u
.nfs_extA
.secdata
) {
240 sec_clnt_freeinfo(nargs
->nfs_ext_u
.nfs_extA
.secdata
);
241 nargs
->nfs_ext_u
.nfs_extA
.secdata
= NULL
;
246 nfs_copyin(char *data
, int datalen
, struct nfs_args
*nargs
, nfs_fhandle
*fh
)
250 size_t nlen
; /* length of netname */
251 size_t hlen
; /* length of hostname */
252 char netname
[MAXNETNAMELEN
+1]; /* server's netname */
253 struct netbuf addr
; /* server's address */
254 struct netbuf syncaddr
; /* AUTH_DES time sync addr */
255 struct knetconfig
*knconf
; /* transport knetconfig structure */
256 struct sec_data
*secdata
= NULL
; /* security data */
257 STRUCT_DECL(nfs_args
, args
); /* nfs mount arguments */
258 STRUCT_DECL(knetconfig
, knconf_tmp
);
259 STRUCT_DECL(netbuf
, addr_tmp
);
261 struct pathcnf
*pc
; /* Pathconf */
266 bzero(nargs
, sizeof (*nargs
));
268 STRUCT_INIT(args
, get_udatamodel());
269 bzero(STRUCT_BUF(args
), SIZEOF_STRUCT(nfs_args
, DATAMODEL_NATIVE
));
270 if (copyin(data
, STRUCT_BUF(args
), MIN(datalen
, STRUCT_SIZE(args
))))
273 nargs
->wsize
= STRUCT_FGET(args
, wsize
);
274 nargs
->rsize
= STRUCT_FGET(args
, rsize
);
275 nargs
->timeo
= STRUCT_FGET(args
, timeo
);
276 nargs
->retrans
= STRUCT_FGET(args
, retrans
);
277 nargs
->acregmin
= STRUCT_FGET(args
, acregmin
);
278 nargs
->acregmax
= STRUCT_FGET(args
, acregmax
);
279 nargs
->acdirmin
= STRUCT_FGET(args
, acdirmin
);
280 nargs
->acdirmax
= STRUCT_FGET(args
, acdirmax
);
282 flags
= STRUCT_FGET(args
, flags
);
283 nargs
->flags
= flags
;
290 * Allocate space for a knetconfig structure and
291 * its strings and copy in from user-land.
293 knconf
= kmem_zalloc(sizeof (*knconf
), KM_SLEEP
);
294 STRUCT_INIT(knconf_tmp
, get_udatamodel());
295 if (copyin(STRUCT_FGETP(args
, knconf
), STRUCT_BUF(knconf_tmp
),
296 STRUCT_SIZE(knconf_tmp
))) {
297 kmem_free(knconf
, sizeof (*knconf
));
301 knconf
->knc_semantics
= STRUCT_FGET(knconf_tmp
, knc_semantics
);
302 knconf
->knc_protofmly
= STRUCT_FGETP(knconf_tmp
, knc_protofmly
);
303 knconf
->knc_proto
= STRUCT_FGETP(knconf_tmp
, knc_proto
);
304 if (get_udatamodel() != DATAMODEL_LP64
) {
305 knconf
->knc_rdev
= expldev(STRUCT_FGET(knconf_tmp
, knc_rdev
));
307 knconf
->knc_rdev
= STRUCT_FGET(knconf_tmp
, knc_rdev
);
310 pf
= kmem_alloc(KNC_STRSIZE
, KM_SLEEP
);
311 p
= kmem_alloc(KNC_STRSIZE
, KM_SLEEP
);
312 error
= copyinstr(knconf
->knc_protofmly
, pf
, KNC_STRSIZE
, NULL
);
314 kmem_free(pf
, KNC_STRSIZE
);
315 kmem_free(p
, KNC_STRSIZE
);
316 kmem_free(knconf
, sizeof (*knconf
));
320 error
= copyinstr(knconf
->knc_proto
, p
, KNC_STRSIZE
, NULL
);
322 kmem_free(pf
, KNC_STRSIZE
);
323 kmem_free(p
, KNC_STRSIZE
);
324 kmem_free(knconf
, sizeof (*knconf
));
329 knconf
->knc_protofmly
= pf
;
330 knconf
->knc_proto
= p
;
332 nargs
->knconf
= knconf
;
334 /* Copyin pathconf if there is one */
335 if (STRUCT_FGETP(args
, pathconf
) != NULL
) {
336 pc
= kmem_alloc(sizeof (*pc
), KM_SLEEP
);
337 error
= pathconf_copyin(STRUCT_BUF(args
), pc
);
338 nargs
->pathconf
= pc
;
346 STRUCT_INIT(addr_tmp
, get_udatamodel());
347 if (copyin(STRUCT_FGETP(args
, addr
), STRUCT_BUF(addr_tmp
),
348 STRUCT_SIZE(addr_tmp
))) {
352 nargs
->addr
= kmem_alloc(sizeof (struct netbuf
), KM_SLEEP
);
353 userbufptr
= STRUCT_FGETP(addr_tmp
, buf
);
354 addr
.len
= STRUCT_FGET(addr_tmp
, len
);
355 addr
.buf
= kmem_alloc(addr
.len
, KM_SLEEP
);
356 addr
.maxlen
= addr
.len
;
357 if (copyin(userbufptr
, addr
.buf
, addr
.len
)) {
358 kmem_free(addr
.buf
, addr
.len
);
362 bcopy(&addr
, nargs
->addr
, sizeof (struct netbuf
));
365 * Get the root fhandle
368 if (copyin(STRUCT_FGETP(args
, fh
), &fh
->fh_buf
, NFS_FHSIZE
)) {
372 fh
->fh_len
= NFS_FHSIZE
;
375 * Get server's hostname
377 if (flags
& NFSMNT_HOSTNAME
) {
378 error
= copyinstr(STRUCT_FGETP(args
, hostname
), netname
,
379 sizeof (netname
), &hlen
);
382 nargs
->hostname
= kmem_zalloc(hlen
, KM_SLEEP
);
383 (void) strcpy(nargs
->hostname
, netname
);
386 nargs
->hostname
= NULL
;
391 * If there are syncaddr and netname data, load them in. This is
392 * to support data needed for NFSV4 when AUTH_DH is the negotiated
393 * flavor via SECINFO. (instead of using MOUNT protocol in V3).
396 if (flags
& NFSMNT_SECURE
) {
397 if (STRUCT_FGETP(args
, syncaddr
) == NULL
) {
402 STRUCT_INIT(addr_tmp
, get_udatamodel());
403 if (copyin(STRUCT_FGETP(args
, syncaddr
), STRUCT_BUF(addr_tmp
),
404 STRUCT_SIZE(addr_tmp
))) {
408 userbufptr
= STRUCT_FGETP(addr_tmp
, buf
);
409 syncaddr
.len
= STRUCT_FGET(addr_tmp
, len
);
410 syncaddr
.buf
= kmem_alloc(syncaddr
.len
, KM_SLEEP
);
411 syncaddr
.maxlen
= syncaddr
.len
;
412 if (copyin(userbufptr
, syncaddr
.buf
, syncaddr
.len
)) {
413 kmem_free(syncaddr
.buf
, syncaddr
.len
);
418 nargs
->syncaddr
= kmem_alloc(sizeof (struct netbuf
), KM_SLEEP
);
419 bcopy(&syncaddr
, nargs
->syncaddr
, sizeof (struct netbuf
));
421 ASSERT(STRUCT_FGETP(args
, netname
));
422 if (copyinstr(STRUCT_FGETP(args
, netname
), netname
,
423 sizeof (netname
), &nlen
)) {
428 netname
[nlen
] = '\0';
429 nargs
->netname
= kmem_zalloc(nlen
, KM_SLEEP
);
430 (void) strcpy(nargs
->netname
, netname
);
434 * Get the extension data which has the security data structure.
435 * This includes data for AUTH_SYS as well.
437 if (flags
& NFSMNT_NEWARGS
) {
438 nargs
->nfs_args_ext
= STRUCT_FGET(args
, nfs_args_ext
);
439 if (nargs
->nfs_args_ext
== NFS_ARGS_EXTA
||
440 nargs
->nfs_args_ext
== NFS_ARGS_EXTB
) {
442 * Indicating the application is using the new
443 * sec_data structure to pass in the security
446 if (STRUCT_FGETP(args
,
447 nfs_ext_u
.nfs_extA
.secdata
) != NULL
) {
448 error
= sec_clnt_loadinfo(
449 (struct sec_data
*)STRUCT_FGETP(args
,
450 nfs_ext_u
.nfs_extA
.secdata
), &secdata
,
453 nargs
->nfs_ext_u
.nfs_extA
.secdata
= secdata
;
463 * We may have a linked list of nfs_args structures,
464 * which means the user is looking for failover. If
465 * the mount is either not "read-only" or "soft",
466 * we want to bail out with EINVAL.
468 if (nargs
->nfs_args_ext
== NFS_ARGS_EXTB
)
469 nargs
->nfs_ext_u
.nfs_extB
.next
=
470 STRUCT_FGETP(args
, nfs_ext_u
.nfs_extB
.next
);
474 nfs_free_args(nargs
, fh
);
482 * Set up mount info record and attach it to vfs struct.
485 nfs_mount(vfs_t
*vfsp
, vnode_t
*mvp
, struct mounta
*uap
, cred_t
*cr
)
487 char *data
= uap
->dataptr
;
489 vnode_t
*rtvp
; /* the server's root */
490 mntinfo_t
*mi
; /* mount info, pointed at by vfs */
491 size_t nlen
; /* length of netname */
492 struct knetconfig
*knconf
; /* transport knetconfig structure */
493 struct knetconfig
*rdma_knconf
; /* rdma transport structure */
495 struct servinfo
*svp
; /* nfs server info */
496 struct servinfo
*svp_tail
= NULL
; /* previous nfs server info */
497 struct servinfo
*svp_head
; /* first nfs server info */
498 struct servinfo
*svp_2ndlast
; /* 2nd last in the server info list */
499 struct sec_data
*secdata
; /* security data */
500 struct nfs_args
*args
= NULL
;
501 int flags
, addr_type
;
502 zone_t
*zone
= nfs_zone();
503 zone_t
*mntzone
= NULL
;
504 nfs_fhandle
*fhandle
= NULL
;
506 if ((error
= secpolicy_fs_mount(cr
, mvp
, vfsp
)) != 0)
509 if (mvp
->v_type
!= VDIR
)
515 * nfs_args is now versioned and is extensible, so
516 * uap->datalen might be different from sizeof (args)
517 * in a compatible situation.
521 if (!(uap
->flags
& MS_SYSSPACE
)) {
523 args
= kmem_alloc(sizeof (struct nfs_args
), KM_SLEEP
);
525 nfs_free_args(args
, fhandle
);
529 fhandle
= kmem_zalloc(sizeof (nfs_fhandle
), KM_SLEEP
);
530 error
= nfs_copyin(data
, uap
->datalen
, args
, fhandle
);
533 kmem_free(args
, sizeof (*args
));
537 args
= (struct nfs_args
*)data
;
538 fhandle
= (nfs_fhandle
*)args
->fh
;
544 if (uap
->flags
& MS_REMOUNT
) {
548 if (uap
->flags
& MS_SYSSPACE
)
549 error
= copystr(uap
->fstype
, name
, FSTYPSZ
, &n
);
551 error
= copyinstr(uap
->fstype
, name
, FSTYPSZ
, &n
);
554 if (error
== ENAMETOOLONG
)
561 * This check is to ensure that the request is a
562 * genuine nfs remount request.
565 if (strncmp(name
, "nfs", 3) != 0)
569 * If the request changes the locking type, disallow the
571 * because it's questionable whether we can transfer the
572 * locking state correctly.
574 * Remounts need to save the pathconf information.
575 * Part of the infamous static kludge.
578 if ((mi
= VFTOMI(vfsp
)) != NULL
) {
582 new_mi_llock
= (flags
& NFSMNT_LLOCK
) ? 1 : 0;
583 old_mi_llock
= (mi
->mi_flags
& MI_LLOCK
) ? 1 : 0;
584 if (old_mi_llock
!= new_mi_llock
)
587 error
= pathconf_get((struct mntinfo
*)vfsp
->vfs_data
, args
);
589 if (!(uap
->flags
& MS_SYSSPACE
)) {
590 nfs_free_args(args
, fhandle
);
591 kmem_free(args
, sizeof (*args
));
597 mutex_enter(&mvp
->v_lock
);
598 if (!(uap
->flags
& MS_OVERLAY
) &&
599 (mvp
->v_count
!= 1 || (mvp
->v_flag
& VROOT
))) {
600 mutex_exit(&mvp
->v_lock
);
601 if (!(uap
->flags
& MS_SYSSPACE
)) {
602 nfs_free_args(args
, fhandle
);
603 kmem_free(args
, sizeof (*args
));
607 mutex_exit(&mvp
->v_lock
);
609 /* make sure things are zeroed for errout: */
615 * A valid knetconfig structure is required.
617 if (!(flags
& NFSMNT_KNCONF
)) {
618 if (!(uap
->flags
& MS_SYSSPACE
)) {
619 nfs_free_args(args
, fhandle
);
620 kmem_free(args
, sizeof (*args
));
625 if ((strlen(args
->knconf
->knc_protofmly
) >= KNC_STRSIZE
) ||
626 (strlen(args
->knconf
->knc_proto
) >= KNC_STRSIZE
)) {
627 if (!(uap
->flags
& MS_SYSSPACE
)) {
628 nfs_free_args(args
, fhandle
);
629 kmem_free(args
, sizeof (*args
));
636 * Allocate a servinfo struct.
638 svp
= kmem_zalloc(sizeof (*svp
), KM_SLEEP
);
639 mutex_init(&svp
->sv_lock
, NULL
, MUTEX_DEFAULT
, NULL
);
641 svp_2ndlast
= svp_tail
;
642 svp_tail
->sv_next
= svp
;
651 * Get knetconfig and server address
653 svp
->sv_knconf
= args
->knconf
;
656 if (args
->addr
== NULL
|| args
->addr
->buf
== NULL
) {
661 svp
->sv_addr
.maxlen
= args
->addr
->maxlen
;
662 svp
->sv_addr
.len
= args
->addr
->len
;
663 svp
->sv_addr
.buf
= args
->addr
->buf
;
664 args
->addr
->buf
= NULL
;
667 * Get the root fhandle
671 bcopy(&fhandle
->fh_buf
, &svp
->sv_fhandle
.fh_buf
, fhandle
->fh_len
);
672 svp
->sv_fhandle
.fh_len
= fhandle
->fh_len
;
675 * Get server's hostname
677 if (flags
& NFSMNT_HOSTNAME
) {
678 if (args
->hostname
== NULL
) {
682 svp
->sv_hostnamelen
= strlen(args
->hostname
) + 1;
683 svp
->sv_hostname
= args
->hostname
;
684 args
->hostname
= NULL
;
686 char *p
= "unknown-host";
687 svp
->sv_hostnamelen
= strlen(p
) + 1;
688 svp
->sv_hostname
= kmem_zalloc(svp
->sv_hostnamelen
, KM_SLEEP
);
689 (void) strcpy(svp
->sv_hostname
, p
);
694 * RDMA MOUNT SUPPORT FOR NFS v2:
695 * Establish, is it possible to use RDMA, if so overload the
696 * knconf with rdma specific knconf and free the original.
698 if ((flags
& NFSMNT_TRYRDMA
) || (flags
& NFSMNT_DORDMA
)) {
700 * Determine the addr type for RDMA, IPv4 or v6.
702 if (strcmp(svp
->sv_knconf
->knc_protofmly
, NC_INET
) == 0)
704 else if (strcmp(svp
->sv_knconf
->knc_protofmly
, NC_INET6
) == 0)
705 addr_type
= AF_INET6
;
707 if (rdma_reachable(addr_type
, &svp
->sv_addr
,
708 &rdma_knconf
) == 0) {
710 * If successful, hijack the original knconf and
711 * replace with a new one, depending on the flags.
713 svp
->sv_origknconf
= svp
->sv_knconf
;
714 svp
->sv_knconf
= rdma_knconf
;
715 knconf
= rdma_knconf
;
717 if (flags
& NFSMNT_TRYRDMA
) {
720 zcmn_err(getzoneid(), CE_WARN
,
721 "no RDMA onboard, revert\n");
725 if (flags
& NFSMNT_DORDMA
) {
727 * If proto=rdma is specified and no RDMA
728 * path to this server is available then
730 * This is not included in the mountable
731 * server list or the replica list.
732 * Check if more servers are specified;
733 * Failover case, otherwise bail out of mount.
735 if (args
->nfs_args_ext
== NFS_ARGS_EXTB
&&
736 args
->nfs_ext_u
.nfs_extB
.next
!= NULL
) {
738 args
->nfs_ext_u
.nfs_extB
.next
;
739 if (uap
->flags
& MS_RDONLY
&&
740 !(flags
& NFSMNT_SOFT
)) {
741 if (svp_head
->sv_next
== NULL
) {
747 svp_tail
= svp_2ndlast
;
748 svp_2ndlast
->sv_next
=
756 * This is the last server specified
757 * in the nfs_args list passed down
758 * and it's not rdma capable.
760 if (svp_head
->sv_next
== NULL
) {
762 * Is this the only one
767 zcmn_err(getzoneid(),
774 * There is a list, since some
775 * servers specified before
776 * this passed all requirements
778 svp_tail
= svp_2ndlast
;
779 svp_2ndlast
->sv_next
= NULL
;
789 * Get the extension data which has the new security data structure.
791 if (flags
& NFSMNT_NEWARGS
) {
792 switch (args
->nfs_args_ext
) {
796 * Indicating the application is using the new
797 * sec_data structure to pass in the security
800 secdata
= args
->nfs_ext_u
.nfs_extA
.secdata
;
801 if (secdata
== NULL
) {
805 * Need to validate the flavor here if
806 * sysspace; userspace was already
807 * validated by the nfs_copyin function.
809 switch (secdata
->rpcflavor
) {
821 args
->nfs_ext_u
.nfs_extA
.secdata
= NULL
;
828 } else if (flags
& NFSMNT_SECURE
) {
830 * Keep this for backward compatibility to support
831 * NFSMNT_SECURE/NFSMNT_RPCTIMESYNC flags.
833 if (args
->syncaddr
== NULL
|| args
->syncaddr
->buf
== NULL
) {
839 * get time sync address.
841 if (args
->syncaddr
== NULL
) {
847 * Move security related data to the sec_data structure.
850 dh_k4_clntdata_t
*data
;
853 secdata
= kmem_alloc(sizeof (*secdata
), KM_SLEEP
);
854 if (flags
& NFSMNT_RPCTIMESYNC
)
855 secdata
->flags
|= AUTH_F_RPCTIMESYNC
;
856 data
= kmem_alloc(sizeof (*data
), KM_SLEEP
);
857 bcopy(args
->syncaddr
, &data
->syncaddr
,
858 sizeof (*args
->syncaddr
));
862 * duplicate the knconf information for the
865 data
->knconf
= kmem_alloc(sizeof (*knconf
), KM_SLEEP
);
866 *data
->knconf
= *knconf
;
867 pf
= kmem_alloc(KNC_STRSIZE
, KM_SLEEP
);
868 p
= kmem_alloc(KNC_STRSIZE
, KM_SLEEP
);
869 bcopy(knconf
->knc_protofmly
, pf
, KNC_STRSIZE
);
870 bcopy(knconf
->knc_proto
, pf
, KNC_STRSIZE
);
871 data
->knconf
->knc_protofmly
= pf
;
872 data
->knconf
->knc_proto
= p
;
874 /* move server netname to the sec_data structure */
875 nlen
= strlen(args
->hostname
) + 1;
877 data
->netname
= kmem_alloc(nlen
, KM_SLEEP
);
878 bcopy(args
->hostname
, data
->netname
, nlen
);
879 data
->netnamelen
= (int)nlen
;
881 secdata
->secmod
= secdata
->rpcflavor
= AUTH_DES
;
882 secdata
->data
= (caddr_t
)data
;
885 secdata
= kmem_alloc(sizeof (*secdata
), KM_SLEEP
);
886 secdata
->secmod
= secdata
->rpcflavor
= AUTH_UNIX
;
887 secdata
->data
= NULL
;
889 svp
->sv_secdata
= secdata
;
893 * If mount secure failed, we will fall back to AUTH_NONE
894 * and try again. nfsrootvp() will turn this back off.
896 * The NFS Version 2 mount uses GETATTR and STATFS procedures.
897 * The server does not care if these procedures have the proper
898 * authentication flavor, so if mount retries using AUTH_NONE
899 * that does not require a credential setup for root then the
900 * automounter would work without requiring root to be
901 * keylogged into AUTH_DES.
903 if (secdata
->rpcflavor
!= AUTH_UNIX
&&
904 secdata
->rpcflavor
!= AUTH_LOOPBACK
)
905 secdata
->flags
|= AUTH_F_TRYNONE
;
910 * We may have a linked list of nfs_args structures,
911 * which means the user is looking for failover. If
912 * the mount is not "read-only", or is "soft",
913 * we want to bail out with EINVAL.
915 if (args
->nfs_args_ext
== NFS_ARGS_EXTB
&&
916 args
->nfs_ext_u
.nfs_extB
.next
!= NULL
) {
917 if (uap
->flags
& MS_RDONLY
&& !(flags
& NFSMNT_SOFT
)) {
918 data
= (char *)args
->nfs_ext_u
.nfs_extB
.next
;
926 * Determine the zone we're being mounted into.
928 zone_hold(mntzone
= zone
); /* start with this assumption */
929 if (getzoneid() == GLOBAL_ZONEID
) {
931 mntzone
= zone_find_by_path(refstr_value(vfsp
->vfs_mntpt
));
932 ASSERT(mntzone
!= NULL
);
933 if (mntzone
!= zone
) {
940 * Stop the mount from going any further if the zone is going away.
942 if (zone_status_get(mntzone
) >= ZONE_IS_SHUTTING_DOWN
) {
951 error
= nfsrootvp(&rtvp
, vfsp
, svp_head
, flags
, cr
, mntzone
);
957 * Set option fields in the mount info record
961 if (svp_head
->sv_next
)
962 mi
->mi_flags
|= MI_LLOCK
;
964 error
= nfs_setopts(rtvp
, DATAMODEL_NATIVE
, args
);
966 /* static pathconf kludge */
967 error
= pathconf_get(mi
, args
);
974 if (rp
->r_flags
& RHASHED
)
983 nfs_async_stop(vfsp
);
984 nfs_async_manager_stop(vfsp
);
985 if (mi
->mi_io_kstats
) {
986 kstat_delete(mi
->mi_io_kstats
);
987 mi
->mi_io_kstats
= NULL
;
989 if (mi
->mi_ro_kstats
) {
990 kstat_delete(mi
->mi_ro_kstats
);
991 mi
->mi_ro_kstats
= NULL
;
997 if (!(uap
->flags
& MS_SYSSPACE
)) {
998 nfs_free_args(args
, fhandle
);
999 kmem_free(args
, sizeof (*args
));
1002 if (mntzone
!= NULL
)
1009 * The pathconf information is kept on a linked list of kmem_alloc'ed
1010 * structs. We search the list & add a new struct iff there is no other
1011 * struct with the same information.
1012 * See sys/pathconf.h for ``the rest of the story.''
/*
 * Head of the list of pathcnf structs; entries are chained through
 * pc_next.  Static storage starts out NULL, i.e. an empty list.
 */
static struct pathcnf *allpc;
1017 pathconf_copyin(struct nfs_args
*args
, struct pathcnf
*pc
)
1019 STRUCT_DECL(pathcnf
, pc_tmp
);
1020 STRUCT_HANDLE(nfs_args
, ap
);
1024 model
= get_udatamodel();
1025 STRUCT_INIT(pc_tmp
, model
);
1026 STRUCT_SET_HANDLE(ap
, model
, args
);
1028 if ((STRUCT_FGET(ap
, flags
) & NFSMNT_POSIX
) &&
1029 STRUCT_FGETP(ap
, pathconf
) != NULL
) {
1030 if (copyin(STRUCT_FGETP(ap
, pathconf
), STRUCT_BUF(pc_tmp
),
1031 STRUCT_SIZE(pc_tmp
)))
1033 if (_PC_ISSET(_PC_ERROR
, STRUCT_FGET(pc_tmp
, pc_mask
)))
1036 pc
->pc_link_max
= STRUCT_FGET(pc_tmp
, pc_link_max
);
1037 pc
->pc_max_canon
= STRUCT_FGET(pc_tmp
, pc_max_canon
);
1038 pc
->pc_max_input
= STRUCT_FGET(pc_tmp
, pc_max_input
);
1039 pc
->pc_name_max
= STRUCT_FGET(pc_tmp
, pc_name_max
);
1040 pc
->pc_path_max
= STRUCT_FGET(pc_tmp
, pc_path_max
);
1041 pc
->pc_pipe_buf
= STRUCT_FGET(pc_tmp
, pc_pipe_buf
);
1042 pc
->pc_vdisable
= STRUCT_FGET(pc_tmp
, pc_vdisable
);
1043 pc
->pc_xxx
= STRUCT_FGET(pc_tmp
, pc_xxx
);
1044 for (i
= 0; i
< _PC_N
; i
++)
1045 pc
->pc_mask
[i
] = STRUCT_FGET(pc_tmp
, pc_mask
[i
]);
/*
 * pathconf_get: attach pathconf information from the mount arguments to
 * the mount info record.
 *
 * pc is taken from args->pathconf.  If mi already has mi_pathconf set,
 * the pointer is cleared (NOTE(review): the statement just before the
 * clear is missing from this extract -- presumably the old entry is
 * released first; confirm).  When args->flags has NFSMNT_POSIX and
 * args->pathconf is non-NULL, pc->pc_mask is tested for _PC_ERROR, then
 * the allpc list is walked looking for an entry for which PCCMP(p, pc)
 * is 0; mi->mi_pathconf is pointed at such an entry.  Otherwise a new
 * struct is allocated with KM_SLEEP, filled by bcopy() from pc, and
 * becomes both the new head of allpc and mi->mi_pathconf.
 * NOTE(review): reference-count updates, list linkage of the new entry
 * and return values are not visible here.
 */
1051 pathconf_get(struct mntinfo
*mi
, struct nfs_args
*args
)
1053 struct pathcnf
*p
, *pc
;
1055 pc
= args
->pathconf
;
1056 if (mi
->mi_pathconf
!= NULL
) {
1058 mi
->mi_pathconf
= NULL
;
1061 if (args
->flags
& NFSMNT_POSIX
&& args
->pathconf
!= NULL
) {
1062 if (_PC_ISSET(_PC_ERROR
, pc
->pc_mask
))
1065 for (p
= allpc
; p
!= NULL
; p
= p
->pc_next
) {
1066 if (PCCMP(p
, pc
) == 0)
1070 mi
->mi_pathconf
= p
;
1073 p
= kmem_alloc(sizeof (*p
), KM_SLEEP
);
1074 bcopy(pc
, p
, sizeof (struct pathcnf
));
1077 allpc
= mi
->mi_pathconf
= p
;
1084 * release the static pathconf information
/*
 * pathconf_rele: drop this mount's reference on its pathcnf entry.
 *
 * Does nothing unless mi->mi_pathconf is set.  The entry's pc_refcnt is
 * decremented; when it reaches zero the list is walked with p until p
 * is NULL or equals mi->mi_pathconf, the entry is unlinked by pointing
 * its predecessor p2 at p->pc_next, and the entry is freed.
 * mi->mi_pathconf is cleared afterwards.  panic("mi->pathconf") is in
 * the walk path -- NOTE(review): its guard is not visible in this
 * extract; presumably it fires when the entry is not found on the list.
 * The handling of the list head is likewise not visible.
 */
1087 pathconf_rele(struct mntinfo
*mi
)
1089 if (mi
->mi_pathconf
!= NULL
) {
1090 if (--mi
->mi_pathconf
->pc_refcnt
== 0) {
1095 while (p
!= NULL
&& p
!= mi
->mi_pathconf
) {
1100 panic("mi->pathconf");
1106 p2
->pc_next
= p
->pc_next
;
1107 kmem_free(p
, sizeof (*p
));
1108 mi
->mi_pathconf
= NULL
;
1113 static int nfs_dynamic
= 1; /* global variable to enable dynamic retrans. */
1114 static ushort_t nfs_max_threads
= 8; /* max number of active async threads */
1115 static uint_t nfs_async_clusters
= 1; /* # of reqs from each async queue */
1116 static uint_t nfs_cots_timeo
= NFS_COTS_TIMEO
;
1119 nfsrootvp(vnode_t
**rtvpp
, vfs_t
*vfsp
, struct servinfo
*svp
,
1120 int flags
, cred_t
*cr
, zone_t
*zone
)
1129 struct nfs_stats
*nfsstatsp
;
1130 cred_t
*lcr
= NULL
, *tcr
= cr
;
1132 nfsstatsp
= zone_getspecific(nfsstat_zone_key
, nfs_zone());
1133 ASSERT(nfsstatsp
!= NULL
);
1136 * Create a mount record and link it to the vfs struct.
1138 mi
= kmem_zalloc(sizeof (*mi
), KM_SLEEP
);
1139 mutex_init(&mi
->mi_lock
, NULL
, MUTEX_DEFAULT
, NULL
);
1140 mutex_init(&mi
->mi_remap_lock
, NULL
, MUTEX_DEFAULT
, NULL
);
1141 mi
->mi_flags
= MI_ACL
| MI_EXTATTR
;
1142 if (!(flags
& NFSMNT_SOFT
))
1143 mi
->mi_flags
|= MI_HARD
;
1144 if ((flags
& NFSMNT_SEMISOFT
))
1145 mi
->mi_flags
|= MI_SEMISOFT
;
1146 if ((flags
& NFSMNT_NOPRINT
))
1147 mi
->mi_flags
|= MI_NOPRINT
;
1148 if (flags
& NFSMNT_INT
)
1149 mi
->mi_flags
|= MI_INT
;
1150 mi
->mi_retrans
= NFS_RETRIES
;
1151 if (svp
->sv_knconf
->knc_semantics
== NC_TPI_COTS_ORD
||
1152 svp
->sv_knconf
->knc_semantics
== NC_TPI_COTS
)
1153 mi
->mi_timeo
= nfs_cots_timeo
;
1155 mi
->mi_timeo
= NFS_TIMEO
;
1156 mi
->mi_prog
= NFS_PROGRAM
;
1157 mi
->mi_vers
= NFS_VERSION
;
1158 mi
->mi_rfsnames
= rfsnames_v2
;
1159 mi
->mi_reqs
= nfsstatsp
->nfs_stats_v2
.rfsreqcnt_ptr
;
1160 mi
->mi_call_type
= call_type_v2
;
1161 mi
->mi_ss_call_type
= ss_call_type_v2
;
1162 mi
->mi_timer_type
= timer_type_v2
;
1163 mi
->mi_aclnames
= aclnames_v2
;
1164 mi
->mi_aclreqs
= nfsstatsp
->nfs_stats_v2
.aclreqcnt_ptr
;
1165 mi
->mi_acl_call_type
= acl_call_type_v2
;
1166 mi
->mi_acl_ss_call_type
= acl_ss_call_type_v2
;
1167 mi
->mi_acl_timer_type
= acl_timer_type_v2
;
1168 cv_init(&mi
->mi_failover_cv
, NULL
, CV_DEFAULT
, NULL
);
1169 mi
->mi_servers
= svp
;
1170 mi
->mi_curr_serv
= svp
;
1171 mi
->mi_acregmin
= SEC2HR(ACREGMIN
);
1172 mi
->mi_acregmax
= SEC2HR(ACREGMAX
);
1173 mi
->mi_acdirmin
= SEC2HR(ACDIRMIN
);
1174 mi
->mi_acdirmax
= SEC2HR(ACDIRMAX
);
1177 mi
->mi_flags
|= MI_DYNAMIC
;
1179 if (flags
& NFSMNT_DIRECTIO
)
1180 mi
->mi_flags
|= MI_DIRECTIO
;
1183 * Make a vfs struct for nfs. We do this here instead of below
1184 * because rtvp needs a vfs before we can do a getattr on it.
1186 * Assign a unique device id to the mount
1188 mutex_enter(&nfs_minor_lock
);
1190 nfs_minor
= (nfs_minor
+ 1) & MAXMIN32
;
1191 nfs_dev
= makedevice(nfs_major
, nfs_minor
);
1192 } while (vfs_devismounted(nfs_dev
));
1193 mutex_exit(&nfs_minor_lock
);
1195 vfsp
->vfs_dev
= nfs_dev
;
1196 vfs_make_fsid(&vfsp
->vfs_fsid
, nfs_dev
, nfsfstyp
);
1197 vfsp
->vfs_data
= (caddr_t
)mi
;
1198 vfsp
->vfs_fstype
= nfsfstyp
;
1199 vfsp
->vfs_bsize
= NFS_MAXDATA
;
1202 * Initialize fields used to support async putpage operations.
1204 for (i
= 0; i
< NFS_ASYNC_TYPES
; i
++)
1205 mi
->mi_async_clusters
[i
] = nfs_async_clusters
;
1206 mi
->mi_async_init_clusters
= nfs_async_clusters
;
1207 mi
->mi_async_curr
[NFS_ASYNC_QUEUE
] =
1208 mi
->mi_async_curr
[NFS_ASYNC_PGOPS_QUEUE
] = &mi
->mi_async_reqs
[0];
1209 mi
->mi_max_threads
= nfs_max_threads
;
1210 mutex_init(&mi
->mi_async_lock
, NULL
, MUTEX_DEFAULT
, NULL
);
1211 cv_init(&mi
->mi_async_reqs_cv
, NULL
, CV_DEFAULT
, NULL
);
1212 cv_init(&mi
->mi_async_work_cv
[NFS_ASYNC_QUEUE
], NULL
, CV_DEFAULT
, NULL
);
1213 cv_init(&mi
->mi_async_work_cv
[NFS_ASYNC_PGOPS_QUEUE
], NULL
,
1215 cv_init(&mi
->mi_async_cv
, NULL
, CV_DEFAULT
, NULL
);
1219 zone_init_ref(&mi
->mi_zone_ref
);
1220 zone_hold_ref(zone
, &mi
->mi_zone_ref
, ZONE_REF_NFS
);
1221 nfs_mi_zonelist_add(mi
);
1224 * Make the root vnode, use it to get attributes,
1225 * then remake it with the attributes.
1227 rtvp
= makenfsnode((fhandle_t
*)svp
->sv_fhandle
.fh_buf
,
1228 NULL
, vfsp
, gethrtime(), cr
, NULL
, NULL
);
1230 va
.va_mask
= AT_ALL
;
1233 * If the uid is set then set the creds for secure mounts
1234 * by proxy processes such as automountd.
1236 if (svp
->sv_secdata
->uid
!= 0 &&
1237 svp
->sv_secdata
->rpcflavor
== RPCSEC_GSS
) {
1239 (void) crsetugid(lcr
, svp
->sv_secdata
->uid
, crgetgid(cr
));
1243 error
= nfsgetattr(rtvp
, &va
, tcr
);
1246 rtvp
->v_type
= va
.va_type
;
1249 * Poll every server to get the filesystem stats; we're
1250 * only interested in the server's transfer size, and we
1253 * While we're looping, we'll turn off AUTH_F_TRYNONE,
1254 * which is only for the mount operation.
1257 mi
->mi_tsize
= MIN(NFS_MAXDATA
, nfstsize());
1258 mi
->mi_stsize
= MIN(NFS_MAXDATA
, nfstsize());
1260 for (svp
= mi
->mi_servers
; svp
!= NULL
; svp
= svp
->sv_next
) {
1261 struct nfsstatfs fs
;
1265 mi
->mi_curr_serv
= svp
;
1267 error
= rfs2call(mi
, RFS_STATFS
, xdr_fhandle
,
1268 (caddr_t
)svp
->sv_fhandle
.fh_buf
, xdr_statfs
, (caddr_t
)&fs
,
1269 tcr
, &douprintf
, &fs
.fs_status
, 0, NULL
);
1272 mi
->mi_stsize
= MIN(mi
->mi_stsize
, fs
.fs_tsize
);
1273 svp
->sv_secdata
->flags
&= ~AUTH_F_TRYNONE
;
1275 mi
->mi_curr_serv
= mi
->mi_servers
;
1276 mi
->mi_curread
= mi
->mi_tsize
;
1277 mi
->mi_curwrite
= mi
->mi_stsize
;
1280 * Start the manager thread responsible for handling async worker
1283 VFS_HOLD(vfsp
); /* add reference for thread */
1284 mi
->mi_manager_thread
= zthread_create(NULL
, 0, nfs_async_manager
,
1285 vfsp
, 0, minclsyspri
);
1286 ASSERT(mi
->mi_manager_thread
!= NULL
);
1291 nfs_mnt_kstat_init(vfsp
);
1293 mi
->mi_type
= rtvp
->v_type
;
1302 * An error occurred somewhere, need to clean up...
1303 * We need to release our reference to the root vnode and
1304 * destroy the mntinfo struct that we just created.
1309 if (rp
->r_flags
& RHASHED
)
1312 nfs_async_stop(vfsp
);
1313 nfs_async_manager_stop(vfsp
);
1314 if (mi
->mi_io_kstats
) {
1315 kstat_delete(mi
->mi_io_kstats
);
1316 mi
->mi_io_kstats
= NULL
;
1318 if (mi
->mi_ro_kstats
) {
1319 kstat_delete(mi
->mi_ro_kstats
);
1320 mi
->mi_ro_kstats
= NULL
;
1331 nfs_unmount(vfs_t
*vfsp
, int flag
, cred_t
*cr
)
1336 if (secpolicy_fs_unmount(cr
, vfsp
) != 0)
1340 if (flag
& MS_FORCE
) {
1342 vfsp
->vfs_flag
|= VFS_UNMOUNTED
;
1345 * We are about to stop the async manager.
1346 * Let every one know not to schedule any
1347 * more async requests.
1349 mutex_enter(&mi
->mi_async_lock
);
1350 mi
->mi_max_threads
= 0;
1351 NFS_WAKEALL_ASYNC_WORKERS(mi
->mi_async_work_cv
);
1352 mutex_exit(&mi
->mi_async_lock
);
1355 * We need to stop the manager thread explicitly; the worker
1356 * threads can time out and exit on their own.
1358 nfs_async_manager_stop(vfsp
);
1359 destroy_rtable(vfsp
, cr
);
1360 if (mi
->mi_io_kstats
) {
1361 kstat_delete(mi
->mi_io_kstats
);
1362 mi
->mi_io_kstats
= NULL
;
1364 if (mi
->mi_ro_kstats
) {
1365 kstat_delete(mi
->mi_ro_kstats
);
1366 mi
->mi_ro_kstats
= NULL
;
1371 * Wait until all asynchronous putpage operations on
1372 * this file system are complete before flushing rnodes
1375 omax
= mi
->mi_max_threads
;
1376 if (nfs_async_stop_sig(vfsp
)) {
1381 * If there are any active vnodes on this file system,
1382 * then the file system is busy and can't be umounted.
1384 if (check_rtable(vfsp
)) {
1385 mutex_enter(&mi
->mi_async_lock
);
1386 mi
->mi_max_threads
= omax
;
1387 mutex_exit(&mi
->mi_async_lock
);
1391 * The unmount can't fail from now on; stop the manager thread.
1393 nfs_async_manager_stop(vfsp
);
1395 * Destroy all rnodes belonging to this file system from the
1396 * rnode hash queues and purge any resources allocated to
1399 destroy_rtable(vfsp
, cr
);
1400 if (mi
->mi_io_kstats
) {
1401 kstat_delete(mi
->mi_io_kstats
);
1402 mi
->mi_io_kstats
= NULL
;
1404 if (mi
->mi_ro_kstats
) {
1405 kstat_delete(mi
->mi_ro_kstats
);
1406 mi
->mi_ro_kstats
= NULL
;
1415 nfs_root(vfs_t
*vfsp
, vnode_t
**vpp
)
1425 if (nfs_zone() != mi
->mi_zone
)
1428 svp
= mi
->mi_curr_serv
;
1429 if (svp
&& (svp
->sv_flags
& SV_ROOT_STALE
)) {
1430 mutex_enter(&svp
->sv_lock
);
1431 svp
->sv_flags
&= ~SV_ROOT_STALE
;
1432 mutex_exit(&svp
->sv_lock
);
1436 vp
= makenfsnode((fhandle_t
*)mi
->mi_curr_serv
->sv_fhandle
.fh_buf
,
1437 NULL
, vfsp
, gethrtime(), CRED(), NULL
, NULL
);
1440 * if the SV_ROOT_STALE flag was reset above, reset the
1441 * RSTALE flag if needed and return an error
1443 if (error
== ENOENT
) {
1445 if (svp
&& rp
->r_flags
& RSTALE
) {
1446 mutex_enter(&rp
->r_statelock
);
1447 rp
->r_flags
&= ~RSTALE
;
1448 mutex_exit(&rp
->r_statelock
);
1454 ASSERT(vp
->v_type
== VNON
|| vp
->v_type
== mi
->mi_type
);
1456 vp
->v_type
= mi
->mi_type
;
1464 * Get file system statistics.
1467 nfs_statvfs(vfs_t
*vfsp
, struct statvfs64
*sbp
)
1471 struct nfsstatfs fs
;
1476 error
= nfs_root(vfsp
, &vp
);
1483 fi
.fhp
= NULL
; /* no need to update, filehandle not copied */
1484 fi
.copyproc
= nfscopyfh
;
1485 fi
.lookupproc
= nfslookup
;
1486 fi
.xattrdirproc
= acl_getxattrdir2
;
1488 error
= rfs2call(mi
, RFS_STATFS
, xdr_fhandle
, (caddr_t
)VTOFH(vp
),
1489 xdr_statfs
, (caddr_t
)&fs
, CRED(), &douprintf
, &fs
.fs_status
, 0,
1493 error
= geterrno(fs
.fs_status
);
1495 mutex_enter(&mi
->mi_lock
);
1496 if (mi
->mi_stsize
) {
1497 mi
->mi_stsize
= MIN(mi
->mi_stsize
, fs
.fs_tsize
);
1499 mi
->mi_stsize
= fs
.fs_tsize
;
1500 mi
->mi_curwrite
= mi
->mi_stsize
;
1502 mutex_exit(&mi
->mi_lock
);
1503 sbp
->f_bsize
= fs
.fs_bsize
;
1504 sbp
->f_frsize
= fs
.fs_bsize
;
1505 sbp
->f_blocks
= (fsblkcnt64_t
)fs
.fs_blocks
;
1506 sbp
->f_bfree
= (fsblkcnt64_t
)fs
.fs_bfree
;
1508 * Some servers may return negative available
1509 * block counts. They may do this because they
1510 * calculate the number of available blocks by
1511 * subtracting the number of used blocks from
1512 * the total number of blocks modified by the
1513 * minimum free value. For example, if the
1514 * minimum free percentage is 10 and the file
1515 * system is greater than 90 percent full, then
1516 * 90 percent of the total blocks minus the
1517 * actual number of used blocks may be a
1520 * In this case, we need to sign extend the
1521 * negative number through the assignment from
1522 * the 32 bit bavail count to the 64 bit bavail
1525 * We need to be able to discern between there
1526 * just being a lot of available blocks on the
1527 * file system and the case described above.
1528 * We are making the assumption that it does
1529 * not make sense to have more available blocks
1530 * than there are free blocks. So, if there
1531 * are, then we treat the number as if it were
1532 * a negative number and arrange to have it
1533 * sign extended when it is converted from 32
1536 if (fs
.fs_bavail
<= fs
.fs_bfree
)
1537 sbp
->f_bavail
= (fsblkcnt64_t
)fs
.fs_bavail
;
1540 (fsblkcnt64_t
)((long)fs
.fs_bavail
);
1542 sbp
->f_files
= (fsfilcnt64_t
)-1;
1543 sbp
->f_ffree
= (fsfilcnt64_t
)-1;
1544 sbp
->f_favail
= (fsfilcnt64_t
)-1;
1545 sbp
->f_fsid
= (unsigned long)vfsp
->vfs_fsid
.val
[0];
1546 (void) strncpy(sbp
->f_basetype
,
1547 vfssw
[vfsp
->vfs_fstype
].vsw_name
, FSTYPSZ
);
1548 sbp
->f_flag
= vf_to_stf(vfsp
->vfs_flag
);
1549 sbp
->f_namemax
= (uint32_t)-1;
1551 PURGE_STALE_FH(error
, vp
, CRED());
1560 static kmutex_t nfs_syncbusy
;
1563 * Flush dirty nfs files for file system vfsp.
1564 * If vfsp == NULL, all nfs files are flushed.
1568 nfs_sync(vfs_t
*vfsp
, short flag
, cred_t
*cr
)
1571 * Cross-zone calls are OK here, since this translates to a
1572 * fop_putpage(B_ASYNC), which gets picked up by the right zone.
1574 if (!(flag
& SYNC_ATTR
) && mutex_tryenter(&nfs_syncbusy
) != 0) {
1576 mutex_exit(&nfs_syncbusy
);
1583 nfs_vget(vfs_t
*vfsp
, vnode_t
**vpp
, fid_t
*fidp
)
1588 struct nfs_fid
*nfsfidp
= (struct nfs_fid
*)fidp
;
1589 zoneid_t zoneid
= VFTOMI(vfsp
)->mi_zone
->zone_id
;
1591 if (nfs_zone() != VFTOMI(vfsp
)->mi_zone
)
1593 if (fidp
->fid_len
!= (sizeof (*nfsfidp
) - sizeof (short))) {
1595 zcmn_err(zoneid
, CE_WARN
,
1596 "nfs_vget: bad fid len, %d/%d", fidp
->fid_len
,
1597 (int)(sizeof (*nfsfidp
) - sizeof (short)));
1603 vp
= makenfsnode((fhandle_t
*)(nfsfidp
->nf_data
), NULL
, vfsp
,
1604 gethrtime(), CRED(), NULL
, NULL
);
1606 if (VTOR(vp
)->r_flags
& RSTALE
) {
1612 if (vp
->v_type
== VNON
) {
1613 va
.va_mask
= AT_ALL
;
1614 error
= nfsgetattr(vp
, &va
, CRED());
1620 vp
->v_type
= va
.va_type
;
1630 nfs_mountroot(vfs_t
*vfsp
, whymountroot_t why
)
1633 char root_hostname
[SYS_NMLN
+1];
1634 struct servinfo
*svp
;
1642 struct nfs_args args
; /* nfs mount arguments */
1643 static char token
[10];
1645 bzero(&args
, sizeof (args
));
1647 /* do this BEFORE getfile which causes xid stamps to be initialized */
1648 clkset(-1L); /* hack for now - until we get time svc? */
1650 if (why
== ROOT_REMOUNT
) {
1654 panic("nfs_mountroot: why == ROOT_REMOUNT");
1657 if (why
== ROOT_UNMOUNT
) {
1659 * Nothing to do for NFS.
1670 getfsname("root", name
, sizeof (token
));
1673 root_path
= pn
.pn_path
;
1675 svp
= kmem_zalloc(sizeof (*svp
), KM_SLEEP
);
1676 svp
->sv_knconf
= kmem_zalloc(sizeof (*svp
->sv_knconf
), KM_SLEEP
);
1677 svp
->sv_knconf
->knc_protofmly
= kmem_alloc(KNC_STRSIZE
, KM_SLEEP
);
1678 svp
->sv_knconf
->knc_proto
= kmem_alloc(KNC_STRSIZE
, KM_SLEEP
);
1681 * Get server address
1682 * Get the root fhandle
1683 * Get server's transport
1684 * Get server's hostname
1687 args
.addr
= &svp
->sv_addr
;
1688 args
.fh
= (char *)&svp
->sv_fhandle
.fh_buf
;
1689 args
.knconf
= svp
->sv_knconf
;
1690 args
.hostname
= root_hostname
;
1692 if (error
= mount_root(*name
? name
: "root", root_path
, NFS_VERSION
,
1693 &args
, &vfsflags
)) {
1694 nfs_cmn_err(error
, CE_WARN
,
1695 "nfs_mountroot: mount_root failed: %m");
1700 svp
->sv_fhandle
.fh_len
= NFS_FHSIZE
;
1701 svp
->sv_hostnamelen
= (int)(strlen(root_hostname
) + 1);
1702 svp
->sv_hostname
= kmem_alloc(svp
->sv_hostnamelen
, KM_SLEEP
);
1703 (void) strcpy(svp
->sv_hostname
, root_hostname
);
1706 * Force root partition to always be mounted with AUTH_UNIX for now
1708 svp
->sv_secdata
= kmem_alloc(sizeof (*svp
->sv_secdata
), KM_SLEEP
);
1709 svp
->sv_secdata
->secmod
= AUTH_UNIX
;
1710 svp
->sv_secdata
->rpcflavor
= AUTH_UNIX
;
1711 svp
->sv_secdata
->data
= NULL
;
1716 error
= nfsrootvp(&rtvp
, vfsp
, svp
, args
.flags
, cr
, global_zone
);
1726 error
= nfs_setopts(rtvp
, DATAMODEL_NATIVE
, &args
);
1728 nfs_cmn_err(error
, CE_WARN
,
1729 "nfs_mountroot: invalid root mount options");
1734 (void) vfs_lock_wait(vfsp
);
1735 vfs_add(NULL
, vfsp
, vfsflags
);
1738 size
= strlen(svp
->sv_hostname
);
1739 (void) strcpy(rootfs
.bo_name
, svp
->sv_hostname
);
1740 rootfs
.bo_name
[size
] = ':';
1741 (void) strcpy(&rootfs
.bo_name
[size
+ 1], root_path
);
1748 nfs_async_stop(vfsp
);
1749 nfs_async_manager_stop(vfsp
);
1759 * Initialization routine for VFS routines. Should only be called once
1764 mutex_init(&nfs_syncbusy
, NULL
, MUTEX_DEFAULT
, NULL
);
1771 mutex_destroy(&nfs_syncbusy
);
1775 nfs_freevfs(vfs_t
*vfsp
)
1780 /* free up the resources */
1783 svp
= mi
->mi_servers
;
1784 mi
->mi_servers
= mi
->mi_curr_serv
= NULL
;
1788 * By this time we should have already deleted the
1789 * mi kstats in the unmount code. If they are still around
1792 ASSERT(mi
->mi_io_kstats
== NULL
);