17c478bd9Sstevel@tonic-gate /* 27c478bd9Sstevel@tonic-gate * CDDL HEADER START 37c478bd9Sstevel@tonic-gate * 47c478bd9Sstevel@tonic-gate * The contents of this file are subject to the terms of the 5f86c6ccaSdm * Common Development and Distribution License (the "License"). 6f86c6ccaSdm * You may not use this file except in compliance with the License. 77c478bd9Sstevel@tonic-gate * 87c478bd9Sstevel@tonic-gate * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE 97c478bd9Sstevel@tonic-gate * or http://www.opensolaris.org/os/licensing. 107c478bd9Sstevel@tonic-gate * See the License for the specific language governing permissions 117c478bd9Sstevel@tonic-gate * and limitations under the License. 127c478bd9Sstevel@tonic-gate * 137c478bd9Sstevel@tonic-gate * When distributing Covered Code, include this CDDL HEADER in each 147c478bd9Sstevel@tonic-gate * file and include the License file at usr/src/OPENSOLARIS.LICENSE. 157c478bd9Sstevel@tonic-gate * If applicable, add the following below this CDDL HEADER, with the 167c478bd9Sstevel@tonic-gate * fields enclosed by brackets "[]" replaced with your own identifying 177c478bd9Sstevel@tonic-gate * information: Portions Copyright [yyyy] [name of copyright owner] 187c478bd9Sstevel@tonic-gate * 197c478bd9Sstevel@tonic-gate * CDDL HEADER END 207c478bd9Sstevel@tonic-gate */ 217c478bd9Sstevel@tonic-gate /* 22e557fb2cSDai Ngo * Copyright 2009 Sun Microsystems, Inc. All rights reserved. 237c478bd9Sstevel@tonic-gate * Use is subject to license terms. 247c478bd9Sstevel@tonic-gate */ 257c478bd9Sstevel@tonic-gate 267c478bd9Sstevel@tonic-gate /* 277c478bd9Sstevel@tonic-gate * Copyright (c) 1983,1984,1985,1986,1987,1988,1989 AT&T. 
287c478bd9Sstevel@tonic-gate * All Rights Reserved 297c478bd9Sstevel@tonic-gate */ 307c478bd9Sstevel@tonic-gate 317c478bd9Sstevel@tonic-gate #include <sys/param.h> 327c478bd9Sstevel@tonic-gate #include <sys/types.h> 337c478bd9Sstevel@tonic-gate #include <sys/systm.h> 347c478bd9Sstevel@tonic-gate #include <sys/cred.h> 357c478bd9Sstevel@tonic-gate #include <sys/vfs.h> 36aa59c4cbSrsb #include <sys/vfs_opreg.h> 377c478bd9Sstevel@tonic-gate #include <sys/vnode.h> 387c478bd9Sstevel@tonic-gate #include <sys/pathname.h> 397c478bd9Sstevel@tonic-gate #include <sys/sysmacros.h> 407c478bd9Sstevel@tonic-gate #include <sys/kmem.h> 417c478bd9Sstevel@tonic-gate #include <sys/mkdev.h> 427c478bd9Sstevel@tonic-gate #include <sys/mount.h> 437c478bd9Sstevel@tonic-gate #include <sys/statvfs.h> 447c478bd9Sstevel@tonic-gate #include <sys/errno.h> 457c478bd9Sstevel@tonic-gate #include <sys/debug.h> 467c478bd9Sstevel@tonic-gate #include <sys/cmn_err.h> 477c478bd9Sstevel@tonic-gate #include <sys/utsname.h> 487c478bd9Sstevel@tonic-gate #include <sys/bootconf.h> 497c478bd9Sstevel@tonic-gate #include <sys/modctl.h> 507c478bd9Sstevel@tonic-gate #include <sys/acl.h> 517c478bd9Sstevel@tonic-gate #include <sys/flock.h> 527c478bd9Sstevel@tonic-gate #include <sys/time.h> 537c478bd9Sstevel@tonic-gate #include <sys/disp.h> 547c478bd9Sstevel@tonic-gate #include <sys/policy.h> 557c478bd9Sstevel@tonic-gate #include <sys/socket.h> 567c478bd9Sstevel@tonic-gate #include <sys/netconfig.h> 577c478bd9Sstevel@tonic-gate #include <sys/dnlc.h> 587c478bd9Sstevel@tonic-gate #include <sys/list.h> 5945916cd2Sjpk #include <sys/mntent.h> 6045916cd2Sjpk #include <sys/tsol/label.h> 617c478bd9Sstevel@tonic-gate 627c478bd9Sstevel@tonic-gate #include <rpc/types.h> 637c478bd9Sstevel@tonic-gate #include <rpc/auth.h> 647c478bd9Sstevel@tonic-gate #include <rpc/rpcsec_gss.h> 657c478bd9Sstevel@tonic-gate #include <rpc/clnt.h> 667c478bd9Sstevel@tonic-gate 677c478bd9Sstevel@tonic-gate #include <nfs/nfs.h> 
687c478bd9Sstevel@tonic-gate #include <nfs/nfs_clnt.h> 697c478bd9Sstevel@tonic-gate #include <nfs/mount.h> 707c478bd9Sstevel@tonic-gate #include <nfs/nfs_acl.h> 717c478bd9Sstevel@tonic-gate 727c478bd9Sstevel@tonic-gate #include <fs/fs_subr.h> 737c478bd9Sstevel@tonic-gate 747c478bd9Sstevel@tonic-gate #include <nfs/nfs4.h> 757c478bd9Sstevel@tonic-gate #include <nfs/rnode4.h> 767c478bd9Sstevel@tonic-gate #include <nfs/nfs4_clnt.h> 7739d3e169Sevanl #include <sys/fs/autofs.h> 7839d3e169Sevanl 797c478bd9Sstevel@tonic-gate 807c478bd9Sstevel@tonic-gate /* 817c478bd9Sstevel@tonic-gate * Arguments passed to thread to free data structures from forced unmount. 827c478bd9Sstevel@tonic-gate */ 837c478bd9Sstevel@tonic-gate 847c478bd9Sstevel@tonic-gate typedef struct { 85b9238976Sth vfs_t *fm_vfsp; 86b9238976Sth int fm_flag; 87b9238976Sth cred_t *fm_cr; 887c478bd9Sstevel@tonic-gate } freemountargs_t; 897c478bd9Sstevel@tonic-gate 90b9238976Sth static void async_free_mount(vfs_t *, int, cred_t *); 91b9238976Sth static void nfs4_free_mount(vfs_t *, int, cred_t *); 927c478bd9Sstevel@tonic-gate static void nfs4_free_mount_thread(freemountargs_t *); 937c478bd9Sstevel@tonic-gate static int nfs4_chkdup_servinfo4(servinfo4_t *, servinfo4_t *); 947c478bd9Sstevel@tonic-gate 957c478bd9Sstevel@tonic-gate /* 967c478bd9Sstevel@tonic-gate * From rpcsec module (common/rpcsec). 
977c478bd9Sstevel@tonic-gate */ 987c478bd9Sstevel@tonic-gate extern int sec_clnt_loadinfo(struct sec_data *, struct sec_data **, model_t); 997c478bd9Sstevel@tonic-gate extern void sec_clnt_freeinfo(struct sec_data *); 1007c478bd9Sstevel@tonic-gate 1017c478bd9Sstevel@tonic-gate /* 1027c478bd9Sstevel@tonic-gate * The order and contents of this structure must be kept in sync with that of 1037c478bd9Sstevel@tonic-gate * rfsreqcnt_v4_tmpl in nfs_stats.c 1047c478bd9Sstevel@tonic-gate */ 1057c478bd9Sstevel@tonic-gate static char *rfsnames_v4[] = { 1067c478bd9Sstevel@tonic-gate "null", "compound", "reserved", "access", "close", "commit", "create", 1077c478bd9Sstevel@tonic-gate "delegpurge", "delegreturn", "getattr", "getfh", "link", "lock", 1087c478bd9Sstevel@tonic-gate "lockt", "locku", "lookup", "lookupp", "nverify", "open", "openattr", 1097c478bd9Sstevel@tonic-gate "open_confirm", "open_downgrade", "putfh", "putpubfh", "putrootfh", 1107c478bd9Sstevel@tonic-gate "read", "readdir", "readlink", "remove", "rename", "renew", 1117c478bd9Sstevel@tonic-gate "restorefh", "savefh", "secinfo", "setattr", "setclientid", 1127c478bd9Sstevel@tonic-gate "setclientid_confirm", "verify", "write" 1137c478bd9Sstevel@tonic-gate }; 1147c478bd9Sstevel@tonic-gate 1157c478bd9Sstevel@tonic-gate /* 1167c478bd9Sstevel@tonic-gate * nfs4_max_mount_retry is the number of times the client will redrive 1177c478bd9Sstevel@tonic-gate * a mount compound before giving up and returning failure. The intent 1187c478bd9Sstevel@tonic-gate * is to redrive mount compounds which fail NFS4ERR_STALE so that 1197c478bd9Sstevel@tonic-gate * if a component of the server path being mounted goes stale, it can 1207c478bd9Sstevel@tonic-gate * "recover" by redriving the mount compund (LOOKUP ops). This recovery 1217c478bd9Sstevel@tonic-gate * code is needed outside of the recovery framework because mount is a 1227c478bd9Sstevel@tonic-gate * special case. 
The client doesn't create vnodes/rnodes for components 1237c478bd9Sstevel@tonic-gate * of the server path being mounted. The recovery code recovers real 1247c478bd9Sstevel@tonic-gate * client objects, not STALE FHs which map to components of the server 1257c478bd9Sstevel@tonic-gate * path being mounted. 1267c478bd9Sstevel@tonic-gate * 1277c478bd9Sstevel@tonic-gate * We could just fail the mount on the first time, but that would 1287c478bd9Sstevel@tonic-gate * instantly trigger failover (from nfs4_mount), and the client should 1297c478bd9Sstevel@tonic-gate * try to re-lookup the STALE FH before doing failover. The easiest 1307c478bd9Sstevel@tonic-gate * way to "re-lookup" is to simply redrive the mount compound. 1317c478bd9Sstevel@tonic-gate */ 1327c478bd9Sstevel@tonic-gate static int nfs4_max_mount_retry = 2; 1337c478bd9Sstevel@tonic-gate 1347c478bd9Sstevel@tonic-gate /* 1357c478bd9Sstevel@tonic-gate * nfs4 vfs operations. 1367c478bd9Sstevel@tonic-gate */ 137b9238976Sth int nfs4_mount(vfs_t *, vnode_t *, struct mounta *, cred_t *); 1387c478bd9Sstevel@tonic-gate static int nfs4_unmount(vfs_t *, int, cred_t *); 1397c478bd9Sstevel@tonic-gate static int nfs4_root(vfs_t *, vnode_t **); 1407c478bd9Sstevel@tonic-gate static int nfs4_statvfs(vfs_t *, struct statvfs64 *); 1417c478bd9Sstevel@tonic-gate static int nfs4_sync(vfs_t *, short, cred_t *); 1427c478bd9Sstevel@tonic-gate static int nfs4_vget(vfs_t *, vnode_t **, fid_t *); 1437c478bd9Sstevel@tonic-gate static int nfs4_mountroot(vfs_t *, whymountroot_t); 1447c478bd9Sstevel@tonic-gate static void nfs4_freevfs(vfs_t *); 1457c478bd9Sstevel@tonic-gate 1467c478bd9Sstevel@tonic-gate static int nfs4rootvp(vnode_t **, vfs_t *, struct servinfo4 *, 1477c478bd9Sstevel@tonic-gate int, cred_t *, zone_t *); 1487c478bd9Sstevel@tonic-gate 1497c478bd9Sstevel@tonic-gate vfsops_t *nfs4_vfsops; 1507c478bd9Sstevel@tonic-gate 1517c478bd9Sstevel@tonic-gate int nfs4_vfsinit(void); 1527c478bd9Sstevel@tonic-gate void nfs4_vfsfini(void); 
1537c478bd9Sstevel@tonic-gate static void nfs4setclientid_init(void); 1547c478bd9Sstevel@tonic-gate static void nfs4setclientid_fini(void); 1557c478bd9Sstevel@tonic-gate static void nfs4setclientid_otw(mntinfo4_t *, servinfo4_t *, cred_t *, 1567c478bd9Sstevel@tonic-gate struct nfs4_server *, nfs4_error_t *, int *); 1577c478bd9Sstevel@tonic-gate static void destroy_nfs4_server(nfs4_server_t *); 1587c478bd9Sstevel@tonic-gate static void remove_mi(nfs4_server_t *, mntinfo4_t *); 1597c478bd9Sstevel@tonic-gate 160b9238976Sth extern void nfs4_ephemeral_init(void); 161b9238976Sth extern void nfs4_ephemeral_fini(void); 162b9238976Sth 1637c478bd9Sstevel@tonic-gate /* 1647c478bd9Sstevel@tonic-gate * Initialize the vfs structure 1657c478bd9Sstevel@tonic-gate */ 1667c478bd9Sstevel@tonic-gate 1677c478bd9Sstevel@tonic-gate static int nfs4fstyp; 1687c478bd9Sstevel@tonic-gate 1697c478bd9Sstevel@tonic-gate 1707c478bd9Sstevel@tonic-gate /* 1717c478bd9Sstevel@tonic-gate * Debug variable to check for rdma based 1727c478bd9Sstevel@tonic-gate * transport startup and cleanup. Controlled 1737c478bd9Sstevel@tonic-gate * through /etc/system. Off by default. 
1747c478bd9Sstevel@tonic-gate */ 1757c478bd9Sstevel@tonic-gate extern int rdma_debug; 1767c478bd9Sstevel@tonic-gate 1777c478bd9Sstevel@tonic-gate int 1787c478bd9Sstevel@tonic-gate nfs4init(int fstyp, char *name) 1797c478bd9Sstevel@tonic-gate { 1807c478bd9Sstevel@tonic-gate static const fs_operation_def_t nfs4_vfsops_template[] = { 181aa59c4cbSrsb VFSNAME_MOUNT, { .vfs_mount = nfs4_mount }, 182aa59c4cbSrsb VFSNAME_UNMOUNT, { .vfs_unmount = nfs4_unmount }, 183aa59c4cbSrsb VFSNAME_ROOT, { .vfs_root = nfs4_root }, 184aa59c4cbSrsb VFSNAME_STATVFS, { .vfs_statvfs = nfs4_statvfs }, 185aa59c4cbSrsb VFSNAME_SYNC, { .vfs_sync = nfs4_sync }, 186aa59c4cbSrsb VFSNAME_VGET, { .vfs_vget = nfs4_vget }, 187aa59c4cbSrsb VFSNAME_MOUNTROOT, { .vfs_mountroot = nfs4_mountroot }, 188aa59c4cbSrsb VFSNAME_FREEVFS, { .vfs_freevfs = nfs4_freevfs }, 189aa59c4cbSrsb NULL, NULL 1907c478bd9Sstevel@tonic-gate }; 1917c478bd9Sstevel@tonic-gate int error; 1927c478bd9Sstevel@tonic-gate 193b9238976Sth nfs4_vfsops = NULL; 194b9238976Sth nfs4_vnodeops = NULL; 195b9238976Sth nfs4_trigger_vnodeops = NULL; 196b9238976Sth 1977c478bd9Sstevel@tonic-gate error = vfs_setfsops(fstyp, nfs4_vfsops_template, &nfs4_vfsops); 1987c478bd9Sstevel@tonic-gate if (error != 0) { 1997c478bd9Sstevel@tonic-gate zcmn_err(GLOBAL_ZONEID, CE_WARN, 2007c478bd9Sstevel@tonic-gate "nfs4init: bad vfs ops template"); 201b9238976Sth goto out; 2027c478bd9Sstevel@tonic-gate } 2037c478bd9Sstevel@tonic-gate 2047c478bd9Sstevel@tonic-gate error = vn_make_ops(name, nfs4_vnodeops_template, &nfs4_vnodeops); 2057c478bd9Sstevel@tonic-gate if (error != 0) { 2067c478bd9Sstevel@tonic-gate zcmn_err(GLOBAL_ZONEID, CE_WARN, 2077c478bd9Sstevel@tonic-gate "nfs4init: bad vnode ops template"); 208b9238976Sth goto out; 2097c478bd9Sstevel@tonic-gate } 2107c478bd9Sstevel@tonic-gate 211b9238976Sth error = vn_make_ops("nfs4_trigger", nfs4_trigger_vnodeops_template, 212b9238976Sth &nfs4_trigger_vnodeops); 213b9238976Sth if (error != 0) { 214b9238976Sth 
zcmn_err(GLOBAL_ZONEID, CE_WARN, 215b9238976Sth "nfs4init: bad trigger vnode ops template"); 216b9238976Sth goto out; 217b9238976Sth } 2187c478bd9Sstevel@tonic-gate 219b9238976Sth nfs4fstyp = fstyp; 2207c478bd9Sstevel@tonic-gate (void) nfs4_vfsinit(); 2217c478bd9Sstevel@tonic-gate (void) nfs4_init_dot_entries(); 2227c478bd9Sstevel@tonic-gate 223b9238976Sth out: 224b9238976Sth if (error) { 225b9238976Sth if (nfs4_trigger_vnodeops != NULL) 226b9238976Sth vn_freevnodeops(nfs4_trigger_vnodeops); 227b9238976Sth 228b9238976Sth if (nfs4_vnodeops != NULL) 229b9238976Sth vn_freevnodeops(nfs4_vnodeops); 230b9238976Sth 231b9238976Sth (void) vfs_freevfsops_by_type(fstyp); 232b9238976Sth } 233b9238976Sth 234b9238976Sth return (error); 2357c478bd9Sstevel@tonic-gate } 2367c478bd9Sstevel@tonic-gate 2377c478bd9Sstevel@tonic-gate void 2387c478bd9Sstevel@tonic-gate nfs4fini(void) 2397c478bd9Sstevel@tonic-gate { 2407c478bd9Sstevel@tonic-gate (void) nfs4_destroy_dot_entries(); 2417c478bd9Sstevel@tonic-gate nfs4_vfsfini(); 2427c478bd9Sstevel@tonic-gate } 2437c478bd9Sstevel@tonic-gate 2447c478bd9Sstevel@tonic-gate /* 2457c478bd9Sstevel@tonic-gate * Create a new sec_data structure to store AUTH_DH related data: 2467c478bd9Sstevel@tonic-gate * netname, syncaddr, knetconfig. There is no AUTH_F_RPCTIMESYNC 2477c478bd9Sstevel@tonic-gate * flag set for NFS V4 since we are avoiding to contact the rpcbind 2487c478bd9Sstevel@tonic-gate * daemon and is using the IP time service (IPPORT_TIMESERVER). 2497c478bd9Sstevel@tonic-gate * 2507c478bd9Sstevel@tonic-gate * sec_data can be freed by sec_clnt_freeinfo(). 
2517c478bd9Sstevel@tonic-gate */ 252b9238976Sth static struct sec_data * 2537c478bd9Sstevel@tonic-gate create_authdh_data(char *netname, int nlen, struct netbuf *syncaddr, 2547c478bd9Sstevel@tonic-gate struct knetconfig *knconf) { 2557c478bd9Sstevel@tonic-gate struct sec_data *secdata; 2567c478bd9Sstevel@tonic-gate dh_k4_clntdata_t *data; 2577c478bd9Sstevel@tonic-gate char *pf, *p; 2587c478bd9Sstevel@tonic-gate 2597c478bd9Sstevel@tonic-gate if (syncaddr == NULL || syncaddr->buf == NULL || nlen == 0) 2607c478bd9Sstevel@tonic-gate return (NULL); 2617c478bd9Sstevel@tonic-gate 2627c478bd9Sstevel@tonic-gate secdata = kmem_alloc(sizeof (*secdata), KM_SLEEP); 2637c478bd9Sstevel@tonic-gate secdata->flags = 0; 2647c478bd9Sstevel@tonic-gate 2657c478bd9Sstevel@tonic-gate data = kmem_alloc(sizeof (*data), KM_SLEEP); 2667c478bd9Sstevel@tonic-gate 2677c478bd9Sstevel@tonic-gate data->syncaddr.maxlen = syncaddr->maxlen; 2687c478bd9Sstevel@tonic-gate data->syncaddr.len = syncaddr->len; 2697c478bd9Sstevel@tonic-gate data->syncaddr.buf = (char *)kmem_alloc(syncaddr->len, KM_SLEEP); 2707c478bd9Sstevel@tonic-gate bcopy(syncaddr->buf, data->syncaddr.buf, syncaddr->len); 2717c478bd9Sstevel@tonic-gate 2727c478bd9Sstevel@tonic-gate /* 2737c478bd9Sstevel@tonic-gate * duplicate the knconf information for the 2747c478bd9Sstevel@tonic-gate * new opaque data. 
2757c478bd9Sstevel@tonic-gate */ 2767c478bd9Sstevel@tonic-gate data->knconf = kmem_alloc(sizeof (*knconf), KM_SLEEP); 2777c478bd9Sstevel@tonic-gate *data->knconf = *knconf; 2787c478bd9Sstevel@tonic-gate pf = kmem_alloc(KNC_STRSIZE, KM_SLEEP); 2797c478bd9Sstevel@tonic-gate p = kmem_alloc(KNC_STRSIZE, KM_SLEEP); 2807c478bd9Sstevel@tonic-gate bcopy(knconf->knc_protofmly, pf, KNC_STRSIZE); 2817c478bd9Sstevel@tonic-gate bcopy(knconf->knc_proto, p, KNC_STRSIZE); 2827c478bd9Sstevel@tonic-gate data->knconf->knc_protofmly = pf; 2837c478bd9Sstevel@tonic-gate data->knconf->knc_proto = p; 2847c478bd9Sstevel@tonic-gate 2857c478bd9Sstevel@tonic-gate /* move server netname to the sec_data structure */ 2867c478bd9Sstevel@tonic-gate data->netname = kmem_alloc(nlen, KM_SLEEP); 2877c478bd9Sstevel@tonic-gate bcopy(netname, data->netname, nlen); 2887c478bd9Sstevel@tonic-gate data->netnamelen = (int)nlen; 2897c478bd9Sstevel@tonic-gate 2907c478bd9Sstevel@tonic-gate secdata->secmod = AUTH_DH; 2917c478bd9Sstevel@tonic-gate secdata->rpcflavor = AUTH_DH; 2927c478bd9Sstevel@tonic-gate secdata->data = (caddr_t)data; 2937c478bd9Sstevel@tonic-gate 2947c478bd9Sstevel@tonic-gate return (secdata); 2957c478bd9Sstevel@tonic-gate } 2967c478bd9Sstevel@tonic-gate 297b9238976Sth /* 298b9238976Sth * Returns (deep) copy of sec_data_t. Allocates all memory required; caller 299b9238976Sth * is responsible for freeing. 
300b9238976Sth */ 301b9238976Sth sec_data_t * 302b9238976Sth copy_sec_data(sec_data_t *fsecdata) { 303b9238976Sth sec_data_t *tsecdata; 304b9238976Sth 305b9238976Sth if (fsecdata == NULL) 306b9238976Sth return (NULL); 307b9238976Sth 308b9238976Sth if (fsecdata->rpcflavor == AUTH_DH) { 309b9238976Sth dh_k4_clntdata_t *fdata = (dh_k4_clntdata_t *)fsecdata->data; 310b9238976Sth 311b9238976Sth if (fdata == NULL) 312b9238976Sth return (NULL); 313b9238976Sth 314b9238976Sth tsecdata = (sec_data_t *)create_authdh_data(fdata->netname, 315b9238976Sth fdata->netnamelen, &fdata->syncaddr, fdata->knconf); 316b9238976Sth 317b9238976Sth return (tsecdata); 318b9238976Sth } 319b9238976Sth 320b9238976Sth tsecdata = kmem_zalloc(sizeof (sec_data_t), KM_SLEEP); 321b9238976Sth 322b9238976Sth tsecdata->secmod = fsecdata->secmod; 323b9238976Sth tsecdata->rpcflavor = fsecdata->rpcflavor; 324b9238976Sth tsecdata->flags = fsecdata->flags; 325b9238976Sth tsecdata->uid = fsecdata->uid; 326b9238976Sth 327b9238976Sth if (fsecdata->rpcflavor == RPCSEC_GSS) { 328b9238976Sth gss_clntdata_t *gcd = (gss_clntdata_t *)fsecdata->data; 329b9238976Sth 330b9238976Sth tsecdata->data = (caddr_t)copy_sec_data_gss(gcd); 331b9238976Sth } else { 332b9238976Sth tsecdata->data = NULL; 333b9238976Sth } 334b9238976Sth 335b9238976Sth return (tsecdata); 336b9238976Sth } 337b9238976Sth 338b9238976Sth gss_clntdata_t * 339b9238976Sth copy_sec_data_gss(gss_clntdata_t *fdata) 340b9238976Sth { 341b9238976Sth gss_clntdata_t *tdata; 342b9238976Sth 343b9238976Sth if (fdata == NULL) 344b9238976Sth return (NULL); 345b9238976Sth 346b9238976Sth tdata = kmem_zalloc(sizeof (gss_clntdata_t), KM_SLEEP); 347b9238976Sth 348b9238976Sth tdata->mechanism.length = fdata->mechanism.length; 349b9238976Sth tdata->mechanism.elements = kmem_zalloc(fdata->mechanism.length, 350b9238976Sth KM_SLEEP); 351b9238976Sth bcopy(fdata->mechanism.elements, tdata->mechanism.elements, 352b9238976Sth fdata->mechanism.length); 353b9238976Sth 354b9238976Sth 
tdata->service = fdata->service; 355b9238976Sth 356b9238976Sth (void) strcpy(tdata->uname, fdata->uname); 357b9238976Sth (void) strcpy(tdata->inst, fdata->inst); 358b9238976Sth (void) strcpy(tdata->realm, fdata->realm); 359b9238976Sth 360b9238976Sth tdata->qop = fdata->qop; 361b9238976Sth 362b9238976Sth return (tdata); 363b9238976Sth } 364b9238976Sth 3657c478bd9Sstevel@tonic-gate static int 3667c478bd9Sstevel@tonic-gate nfs4_chkdup_servinfo4(servinfo4_t *svp_head, servinfo4_t *svp) 3677c478bd9Sstevel@tonic-gate { 3687c478bd9Sstevel@tonic-gate servinfo4_t *si; 3697c478bd9Sstevel@tonic-gate 3707c478bd9Sstevel@tonic-gate /* 3717c478bd9Sstevel@tonic-gate * Iterate over the servinfo4 list to make sure 3727c478bd9Sstevel@tonic-gate * we do not have a duplicate. Skip any servinfo4 3737c478bd9Sstevel@tonic-gate * that has been marked "NOT IN USE" 3747c478bd9Sstevel@tonic-gate */ 3757c478bd9Sstevel@tonic-gate for (si = svp_head; si; si = si->sv_next) { 3767c478bd9Sstevel@tonic-gate (void) nfs_rw_enter_sig(&si->sv_lock, RW_READER, 0); 3777c478bd9Sstevel@tonic-gate if (si->sv_flags & SV4_NOTINUSE) { 3787c478bd9Sstevel@tonic-gate nfs_rw_exit(&si->sv_lock); 3797c478bd9Sstevel@tonic-gate continue; 3807c478bd9Sstevel@tonic-gate } 3817c478bd9Sstevel@tonic-gate nfs_rw_exit(&si->sv_lock); 3827c478bd9Sstevel@tonic-gate if (si == svp) 3837c478bd9Sstevel@tonic-gate continue; 3847c478bd9Sstevel@tonic-gate if (si->sv_addr.len == svp->sv_addr.len && 3857c478bd9Sstevel@tonic-gate strcmp(si->sv_knconf->knc_protofmly, 386b9238976Sth svp->sv_knconf->knc_protofmly) == 0 && 3877c478bd9Sstevel@tonic-gate bcmp(si->sv_addr.buf, svp->sv_addr.buf, 388b9238976Sth si->sv_addr.len) == 0) { 3897c478bd9Sstevel@tonic-gate /* it's a duplicate */ 3907c478bd9Sstevel@tonic-gate return (1); 3917c478bd9Sstevel@tonic-gate } 3927c478bd9Sstevel@tonic-gate } 3937c478bd9Sstevel@tonic-gate /* it's not a duplicate */ 3947c478bd9Sstevel@tonic-gate return (0); 3957c478bd9Sstevel@tonic-gate } 
3967c478bd9Sstevel@tonic-gate 39739d3e169Sevanl void 39839d3e169Sevanl nfs4_free_args(struct nfs_args *nargs) 39939d3e169Sevanl { 40039d3e169Sevanl if (nargs->knconf) { 40139d3e169Sevanl if (nargs->knconf->knc_protofmly) 40239d3e169Sevanl kmem_free(nargs->knconf->knc_protofmly, 403b9238976Sth KNC_STRSIZE); 40439d3e169Sevanl if (nargs->knconf->knc_proto) 40539d3e169Sevanl kmem_free(nargs->knconf->knc_proto, KNC_STRSIZE); 40639d3e169Sevanl kmem_free(nargs->knconf, sizeof (*nargs->knconf)); 40739d3e169Sevanl nargs->knconf = NULL; 40839d3e169Sevanl } 40939d3e169Sevanl 41039d3e169Sevanl if (nargs->fh) { 41139d3e169Sevanl kmem_free(nargs->fh, strlen(nargs->fh) + 1); 41239d3e169Sevanl nargs->fh = NULL; 41339d3e169Sevanl } 41439d3e169Sevanl 41539d3e169Sevanl if (nargs->hostname) { 41639d3e169Sevanl kmem_free(nargs->hostname, strlen(nargs->hostname) + 1); 41739d3e169Sevanl nargs->hostname = NULL; 41839d3e169Sevanl } 41939d3e169Sevanl 42039d3e169Sevanl if (nargs->addr) { 42139d3e169Sevanl if (nargs->addr->buf) { 42239d3e169Sevanl ASSERT(nargs->addr->len); 42339d3e169Sevanl kmem_free(nargs->addr->buf, nargs->addr->len); 42439d3e169Sevanl } 42539d3e169Sevanl kmem_free(nargs->addr, sizeof (struct netbuf)); 42639d3e169Sevanl nargs->addr = NULL; 42739d3e169Sevanl } 42839d3e169Sevanl 42939d3e169Sevanl if (nargs->syncaddr) { 43039d3e169Sevanl ASSERT(nargs->syncaddr->len); 43139d3e169Sevanl if (nargs->syncaddr->buf) { 43239d3e169Sevanl ASSERT(nargs->syncaddr->len); 43339d3e169Sevanl kmem_free(nargs->syncaddr->buf, nargs->syncaddr->len); 43439d3e169Sevanl } 43539d3e169Sevanl kmem_free(nargs->syncaddr, sizeof (struct netbuf)); 43639d3e169Sevanl nargs->syncaddr = NULL; 43739d3e169Sevanl } 43839d3e169Sevanl 43939d3e169Sevanl if (nargs->netname) { 44039d3e169Sevanl kmem_free(nargs->netname, strlen(nargs->netname) + 1); 44139d3e169Sevanl nargs->netname = NULL; 44239d3e169Sevanl } 44339d3e169Sevanl 44439d3e169Sevanl if (nargs->nfs_ext_u.nfs_extA.secdata) { 44539d3e169Sevanl 
sec_clnt_freeinfo( 446b9238976Sth nargs->nfs_ext_u.nfs_extA.secdata); 44739d3e169Sevanl nargs->nfs_ext_u.nfs_extA.secdata = NULL; 44839d3e169Sevanl } 44939d3e169Sevanl } 45039d3e169Sevanl 45139d3e169Sevanl 45239d3e169Sevanl int 45339d3e169Sevanl nfs4_copyin(char *data, int datalen, struct nfs_args *nargs) 45439d3e169Sevanl { 45539d3e169Sevanl 45639d3e169Sevanl int error; 45739d3e169Sevanl size_t hlen; /* length of hostname */ 45839d3e169Sevanl size_t nlen; /* length of netname */ 45939d3e169Sevanl char netname[MAXNETNAMELEN+1]; /* server's netname */ 46039d3e169Sevanl struct netbuf addr; /* server's address */ 46139d3e169Sevanl struct netbuf syncaddr; /* AUTH_DES time sync addr */ 46239d3e169Sevanl struct knetconfig *knconf; /* transport structure */ 46339d3e169Sevanl struct sec_data *secdata = NULL; /* security data */ 46439d3e169Sevanl STRUCT_DECL(nfs_args, args); /* nfs mount arguments */ 46539d3e169Sevanl STRUCT_DECL(knetconfig, knconf_tmp); 46639d3e169Sevanl STRUCT_DECL(netbuf, addr_tmp); 46739d3e169Sevanl int flags; 46839d3e169Sevanl char *p, *pf; 46939d3e169Sevanl struct pathname pn; 47039d3e169Sevanl char *userbufptr; 47139d3e169Sevanl 47239d3e169Sevanl 47339d3e169Sevanl bzero(nargs, sizeof (*nargs)); 47439d3e169Sevanl 47539d3e169Sevanl STRUCT_INIT(args, get_udatamodel()); 47639d3e169Sevanl bzero(STRUCT_BUF(args), SIZEOF_STRUCT(nfs_args, DATAMODEL_NATIVE)); 47739d3e169Sevanl if (copyin(data, STRUCT_BUF(args), MIN(datalen, 47839d3e169Sevanl STRUCT_SIZE(args)))) 47939d3e169Sevanl return (EFAULT); 48039d3e169Sevanl 48139d3e169Sevanl nargs->wsize = STRUCT_FGET(args, wsize); 48239d3e169Sevanl nargs->rsize = STRUCT_FGET(args, rsize); 48339d3e169Sevanl nargs->timeo = STRUCT_FGET(args, timeo); 48439d3e169Sevanl nargs->retrans = STRUCT_FGET(args, retrans); 48539d3e169Sevanl nargs->acregmin = STRUCT_FGET(args, acregmin); 48639d3e169Sevanl nargs->acregmax = STRUCT_FGET(args, acregmax); 48739d3e169Sevanl nargs->acdirmin = STRUCT_FGET(args, acdirmin); 48839d3e169Sevanl 
nargs->acdirmax = STRUCT_FGET(args, acdirmax); 48939d3e169Sevanl 49039d3e169Sevanl flags = STRUCT_FGET(args, flags); 49139d3e169Sevanl nargs->flags = flags; 49239d3e169Sevanl 49339d3e169Sevanl addr.buf = NULL; 49439d3e169Sevanl syncaddr.buf = NULL; 49539d3e169Sevanl 49639d3e169Sevanl 49739d3e169Sevanl /* 49839d3e169Sevanl * Allocate space for a knetconfig structure and 49939d3e169Sevanl * its strings and copy in from user-land. 50039d3e169Sevanl */ 50139d3e169Sevanl knconf = kmem_zalloc(sizeof (*knconf), KM_SLEEP); 50239d3e169Sevanl STRUCT_INIT(knconf_tmp, get_udatamodel()); 50339d3e169Sevanl if (copyin(STRUCT_FGETP(args, knconf), STRUCT_BUF(knconf_tmp), 50439d3e169Sevanl STRUCT_SIZE(knconf_tmp))) { 50539d3e169Sevanl kmem_free(knconf, sizeof (*knconf)); 50639d3e169Sevanl return (EFAULT); 50739d3e169Sevanl } 50839d3e169Sevanl 50939d3e169Sevanl knconf->knc_semantics = STRUCT_FGET(knconf_tmp, knc_semantics); 51039d3e169Sevanl knconf->knc_protofmly = STRUCT_FGETP(knconf_tmp, knc_protofmly); 51139d3e169Sevanl knconf->knc_proto = STRUCT_FGETP(knconf_tmp, knc_proto); 51239d3e169Sevanl if (get_udatamodel() != DATAMODEL_LP64) { 51339d3e169Sevanl knconf->knc_rdev = expldev(STRUCT_FGET(knconf_tmp, knc_rdev)); 51439d3e169Sevanl } else { 51539d3e169Sevanl knconf->knc_rdev = STRUCT_FGET(knconf_tmp, knc_rdev); 51639d3e169Sevanl } 51739d3e169Sevanl 51839d3e169Sevanl pf = kmem_alloc(KNC_STRSIZE, KM_SLEEP); 51939d3e169Sevanl p = kmem_alloc(KNC_STRSIZE, KM_SLEEP); 52039d3e169Sevanl error = copyinstr(knconf->knc_protofmly, pf, KNC_STRSIZE, NULL); 52139d3e169Sevanl if (error) { 52239d3e169Sevanl kmem_free(pf, KNC_STRSIZE); 52339d3e169Sevanl kmem_free(p, KNC_STRSIZE); 52439d3e169Sevanl kmem_free(knconf, sizeof (*knconf)); 52539d3e169Sevanl return (error); 52639d3e169Sevanl } 52739d3e169Sevanl 52839d3e169Sevanl error = copyinstr(knconf->knc_proto, p, KNC_STRSIZE, NULL); 52939d3e169Sevanl if (error) { 53039d3e169Sevanl kmem_free(pf, KNC_STRSIZE); 53139d3e169Sevanl kmem_free(p, 
KNC_STRSIZE); 53239d3e169Sevanl kmem_free(knconf, sizeof (*knconf)); 53339d3e169Sevanl return (error); 53439d3e169Sevanl } 53539d3e169Sevanl 53639d3e169Sevanl 53739d3e169Sevanl knconf->knc_protofmly = pf; 53839d3e169Sevanl knconf->knc_proto = p; 53939d3e169Sevanl 54039d3e169Sevanl nargs->knconf = knconf; 54139d3e169Sevanl 54239d3e169Sevanl /* 54339d3e169Sevanl * Get server address 54439d3e169Sevanl */ 54539d3e169Sevanl STRUCT_INIT(addr_tmp, get_udatamodel()); 54639d3e169Sevanl if (copyin(STRUCT_FGETP(args, addr), STRUCT_BUF(addr_tmp), 54739d3e169Sevanl STRUCT_SIZE(addr_tmp))) { 54839d3e169Sevanl error = EFAULT; 54939d3e169Sevanl goto errout; 55039d3e169Sevanl } 55139d3e169Sevanl 552*7e450cbcSJames Wahlig nargs->addr = kmem_zalloc(sizeof (struct netbuf), KM_SLEEP); 55339d3e169Sevanl userbufptr = STRUCT_FGETP(addr_tmp, buf); 55439d3e169Sevanl addr.len = STRUCT_FGET(addr_tmp, len); 55539d3e169Sevanl addr.buf = kmem_alloc(addr.len, KM_SLEEP); 55639d3e169Sevanl addr.maxlen = addr.len; 55739d3e169Sevanl if (copyin(userbufptr, addr.buf, addr.len)) { 55839d3e169Sevanl kmem_free(addr.buf, addr.len); 55939d3e169Sevanl error = EFAULT; 56039d3e169Sevanl goto errout; 56139d3e169Sevanl } 56239d3e169Sevanl bcopy(&addr, nargs->addr, sizeof (struct netbuf)); 56339d3e169Sevanl 56439d3e169Sevanl /* 56539d3e169Sevanl * Get the root fhandle 56639d3e169Sevanl */ 56739d3e169Sevanl error = pn_get(STRUCT_FGETP(args, fh), UIO_USERSPACE, &pn); 56839d3e169Sevanl if (error) 56939d3e169Sevanl goto errout; 57039d3e169Sevanl 57139d3e169Sevanl /* Volatile fh: keep server paths, so use actual-size strings */ 57239d3e169Sevanl nargs->fh = kmem_alloc(pn.pn_pathlen + 1, KM_SLEEP); 57339d3e169Sevanl bcopy(pn.pn_path, nargs->fh, pn.pn_pathlen); 57439d3e169Sevanl nargs->fh[pn.pn_pathlen] = '\0'; 57539d3e169Sevanl pn_free(&pn); 57639d3e169Sevanl 57739d3e169Sevanl 57839d3e169Sevanl /* 57939d3e169Sevanl * Get server's hostname 58039d3e169Sevanl */ 58139d3e169Sevanl if (flags & NFSMNT_HOSTNAME) { 
58239d3e169Sevanl error = copyinstr(STRUCT_FGETP(args, hostname), 583b9238976Sth netname, sizeof (netname), &hlen); 58439d3e169Sevanl if (error) 58539d3e169Sevanl goto errout; 58639d3e169Sevanl nargs->hostname = kmem_zalloc(hlen, KM_SLEEP); 58739d3e169Sevanl (void) strcpy(nargs->hostname, netname); 58839d3e169Sevanl 58939d3e169Sevanl } else { 59039d3e169Sevanl nargs->hostname = NULL; 59139d3e169Sevanl } 59239d3e169Sevanl 59339d3e169Sevanl 59439d3e169Sevanl /* 59539d3e169Sevanl * If there are syncaddr and netname data, load them in. This is 59639d3e169Sevanl * to support data needed for NFSV4 when AUTH_DH is the negotiated 59739d3e169Sevanl * flavor via SECINFO. (instead of using MOUNT protocol in V3). 59839d3e169Sevanl */ 59939d3e169Sevanl netname[0] = '\0'; 60039d3e169Sevanl if (flags & NFSMNT_SECURE) { 60139d3e169Sevanl 60239d3e169Sevanl /* get syncaddr */ 60339d3e169Sevanl STRUCT_INIT(addr_tmp, get_udatamodel()); 60439d3e169Sevanl if (copyin(STRUCT_FGETP(args, syncaddr), STRUCT_BUF(addr_tmp), 605b9238976Sth STRUCT_SIZE(addr_tmp))) { 60639d3e169Sevanl error = EINVAL; 60739d3e169Sevanl goto errout; 60839d3e169Sevanl } 60939d3e169Sevanl userbufptr = STRUCT_FGETP(addr_tmp, buf); 61039d3e169Sevanl syncaddr.len = STRUCT_FGET(addr_tmp, len); 61139d3e169Sevanl syncaddr.buf = kmem_alloc(syncaddr.len, KM_SLEEP); 61239d3e169Sevanl syncaddr.maxlen = syncaddr.len; 61339d3e169Sevanl if (copyin(userbufptr, syncaddr.buf, syncaddr.len)) { 61439d3e169Sevanl kmem_free(syncaddr.buf, syncaddr.len); 61539d3e169Sevanl error = EFAULT; 61639d3e169Sevanl goto errout; 61739d3e169Sevanl } 61839d3e169Sevanl 61939d3e169Sevanl nargs->syncaddr = kmem_alloc(sizeof (struct netbuf), KM_SLEEP); 62039d3e169Sevanl bcopy(&syncaddr, nargs->syncaddr, sizeof (struct netbuf)); 62139d3e169Sevanl 62222d5e933Skr /* get server's netname */ 62322d5e933Skr if (copyinstr(STRUCT_FGETP(args, netname), netname, 624b9238976Sth sizeof (netname), &nlen)) { 62522d5e933Skr error = EFAULT; 62622d5e933Skr goto errout; 
62722d5e933Skr } 62822d5e933Skr 62922d5e933Skr netname[nlen] = '\0'; 63022d5e933Skr nargs->netname = kmem_zalloc(nlen, KM_SLEEP); 63122d5e933Skr (void) strcpy(nargs->netname, netname); 63222d5e933Skr } 63339d3e169Sevanl 63439d3e169Sevanl /* 63539d3e169Sevanl * Get the extention data which has the security data structure. 63639d3e169Sevanl * This includes data for AUTH_SYS as well. 63739d3e169Sevanl */ 63839d3e169Sevanl if (flags & NFSMNT_NEWARGS) { 63939d3e169Sevanl nargs->nfs_args_ext = STRUCT_FGET(args, nfs_args_ext); 64039d3e169Sevanl if (nargs->nfs_args_ext == NFS_ARGS_EXTA || 641b9238976Sth nargs->nfs_args_ext == NFS_ARGS_EXTB) { 64239d3e169Sevanl /* 64339d3e169Sevanl * Indicating the application is using the new 64439d3e169Sevanl * sec_data structure to pass in the security 64539d3e169Sevanl * data. 64639d3e169Sevanl */ 64739d3e169Sevanl if (STRUCT_FGETP(args, 64839d3e169Sevanl nfs_ext_u.nfs_extA.secdata) != NULL) { 64939d3e169Sevanl error = sec_clnt_loadinfo( 65039d3e169Sevanl (struct sec_data *)STRUCT_FGETP(args, 651b9238976Sth nfs_ext_u.nfs_extA.secdata), 65239d3e169Sevanl &secdata, get_udatamodel()); 65339d3e169Sevanl } 65439d3e169Sevanl nargs->nfs_ext_u.nfs_extA.secdata = secdata; 65539d3e169Sevanl } 65639d3e169Sevanl } 65739d3e169Sevanl 65839d3e169Sevanl if (error) 65939d3e169Sevanl goto errout; 66039d3e169Sevanl 66139d3e169Sevanl /* 66239d3e169Sevanl * Failover support: 66339d3e169Sevanl * 66439d3e169Sevanl * We may have a linked list of nfs_args structures, 66539d3e169Sevanl * which means the user is looking for failover. If 66639d3e169Sevanl * the mount is either not "read-only" or "soft", 66739d3e169Sevanl * we want to bail out with EINVAL. 
66839d3e169Sevanl */ 66939d3e169Sevanl if (nargs->nfs_args_ext == NFS_ARGS_EXTB) 67039d3e169Sevanl nargs->nfs_ext_u.nfs_extB.next = 671b9238976Sth STRUCT_FGETP(args, nfs_ext_u.nfs_extB.next); 67239d3e169Sevanl 67339d3e169Sevanl errout: 67439d3e169Sevanl if (error) 67539d3e169Sevanl nfs4_free_args(nargs); 67639d3e169Sevanl 67739d3e169Sevanl return (error); 67839d3e169Sevanl } 67939d3e169Sevanl 68039d3e169Sevanl 6817c478bd9Sstevel@tonic-gate /* 6827c478bd9Sstevel@tonic-gate * nfs mount vfsop 6837c478bd9Sstevel@tonic-gate * Set up mount info record and attach it to vfs struct. 6847c478bd9Sstevel@tonic-gate */ 685b9238976Sth int 6867c478bd9Sstevel@tonic-gate nfs4_mount(vfs_t *vfsp, vnode_t *mvp, struct mounta *uap, cred_t *cr) 6877c478bd9Sstevel@tonic-gate { 6887c478bd9Sstevel@tonic-gate char *data = uap->dataptr; 6897c478bd9Sstevel@tonic-gate int error; 6907c478bd9Sstevel@tonic-gate vnode_t *rtvp; /* the server's root */ 6917c478bd9Sstevel@tonic-gate mntinfo4_t *mi; /* mount info, pointed at by vfs */ 6927c478bd9Sstevel@tonic-gate struct knetconfig *rdma_knconf; /* rdma transport structure */ 6937c478bd9Sstevel@tonic-gate rnode4_t *rp; 6947c478bd9Sstevel@tonic-gate struct servinfo4 *svp; /* nfs server info */ 6957c478bd9Sstevel@tonic-gate struct servinfo4 *svp_tail = NULL; /* previous nfs server info */ 6967c478bd9Sstevel@tonic-gate struct servinfo4 *svp_head; /* first nfs server info */ 6977c478bd9Sstevel@tonic-gate struct servinfo4 *svp_2ndlast; /* 2nd last in server info list */ 6987c478bd9Sstevel@tonic-gate struct sec_data *secdata; /* security data */ 69939d3e169Sevanl struct nfs_args *args = NULL; 70050a83466Sjwahlig int flags, addr_type, removed; 701108322fbScarlsonj zone_t *zone = nfs_zone(); 7027c478bd9Sstevel@tonic-gate nfs4_error_t n4e; 70345916cd2Sjpk zone_t *mntzone = NULL; 7047c478bd9Sstevel@tonic-gate 7057c478bd9Sstevel@tonic-gate if (secpolicy_fs_mount(cr, mvp, vfsp) != 0) 7067c478bd9Sstevel@tonic-gate return (EPERM); 7077c478bd9Sstevel@tonic-gate if 
(mvp->v_type != VDIR) 7087c478bd9Sstevel@tonic-gate return (ENOTDIR); 709b9238976Sth 7107c478bd9Sstevel@tonic-gate /* 7117c478bd9Sstevel@tonic-gate * get arguments 7127c478bd9Sstevel@tonic-gate * 7137c478bd9Sstevel@tonic-gate * nfs_args is now versioned and is extensible, so 7147c478bd9Sstevel@tonic-gate * uap->datalen might be different from sizeof (args) 7157c478bd9Sstevel@tonic-gate * in a compatible situation. 7167c478bd9Sstevel@tonic-gate */ 7177c478bd9Sstevel@tonic-gate more: 71839d3e169Sevanl if (!(uap->flags & MS_SYSSPACE)) { 71939d3e169Sevanl if (args == NULL) 72039d3e169Sevanl args = kmem_zalloc(sizeof (struct nfs_args), KM_SLEEP); 72139d3e169Sevanl else 72239d3e169Sevanl nfs4_free_args(args); 72339d3e169Sevanl error = nfs4_copyin(data, uap->datalen, args); 72439d3e169Sevanl if (error) { 72539d3e169Sevanl if (args) { 72639d3e169Sevanl kmem_free(args, sizeof (*args)); 72739d3e169Sevanl } 72839d3e169Sevanl return (error); 72939d3e169Sevanl } 73039d3e169Sevanl } else { 73139d3e169Sevanl args = (struct nfs_args *)data; 73239d3e169Sevanl } 7337c478bd9Sstevel@tonic-gate 73439d3e169Sevanl flags = args->flags; 7357c478bd9Sstevel@tonic-gate 7367c478bd9Sstevel@tonic-gate /* 7377c478bd9Sstevel@tonic-gate * If the request changes the locking type, disallow the remount, 7387c478bd9Sstevel@tonic-gate * because it's questionable whether we can transfer the 7397c478bd9Sstevel@tonic-gate * locking state correctly. 7407c478bd9Sstevel@tonic-gate */ 7417c478bd9Sstevel@tonic-gate if (uap->flags & MS_REMOUNT) { 74239d3e169Sevanl if (!(uap->flags & MS_SYSSPACE)) { 74339d3e169Sevanl nfs4_free_args(args); 74439d3e169Sevanl kmem_free(args, sizeof (*args)); 74539d3e169Sevanl } 7467c478bd9Sstevel@tonic-gate if ((mi = VFTOMI4(vfsp)) != NULL) { 7477c478bd9Sstevel@tonic-gate uint_t new_mi_llock; 7487c478bd9Sstevel@tonic-gate uint_t old_mi_llock; 7497c478bd9Sstevel@tonic-gate new_mi_llock = (flags & NFSMNT_LLOCK) ? 
1 : 0; 7507c478bd9Sstevel@tonic-gate old_mi_llock = (mi->mi_flags & MI4_LLOCK) ? 1 : 0; 7517c478bd9Sstevel@tonic-gate if (old_mi_llock != new_mi_llock) 7527c478bd9Sstevel@tonic-gate return (EBUSY); 7537c478bd9Sstevel@tonic-gate } 7547c478bd9Sstevel@tonic-gate return (0); 7557c478bd9Sstevel@tonic-gate } 7567c478bd9Sstevel@tonic-gate 757b9238976Sth /* 758b9238976Sth * For ephemeral mount trigger stub vnodes, we have two problems 759b9238976Sth * to solve: racing threads will likely fail the v_count check, and 760b9238976Sth * we want only one to proceed with the mount. 761b9238976Sth * 762b9238976Sth * For stubs, if the mount has already occurred (via a racing thread), 763b9238976Sth * just return success. If not, skip the v_count check and proceed. 764b9238976Sth * Note that we are already serialised at this point. 765b9238976Sth */ 7667c478bd9Sstevel@tonic-gate mutex_enter(&mvp->v_lock); 767b9238976Sth if (vn_matchops(mvp, nfs4_trigger_vnodeops)) { 768b9238976Sth /* mntpt is a v4 stub vnode */ 769b9238976Sth ASSERT(RP_ISSTUB(VTOR4(mvp))); 770b9238976Sth ASSERT(!(uap->flags & MS_OVERLAY)); 771b9238976Sth ASSERT(!(mvp->v_flag & VROOT)); 772b9238976Sth if (vn_mountedvfs(mvp) != NULL) { 773b9238976Sth /* ephemeral mount has already occurred */ 774b9238976Sth ASSERT(uap->flags & MS_SYSSPACE); 775b9238976Sth mutex_exit(&mvp->v_lock); 776b9238976Sth return (0); 777b9238976Sth } 778b9238976Sth } else { 779b9238976Sth /* mntpt is a non-v4 or v4 non-stub vnode */ 780b9238976Sth if (!(uap->flags & MS_OVERLAY) && 781b9238976Sth (mvp->v_count != 1 || (mvp->v_flag & VROOT))) { 782b9238976Sth mutex_exit(&mvp->v_lock); 783b9238976Sth if (!(uap->flags & MS_SYSSPACE)) { 784b9238976Sth nfs4_free_args(args); 785b9238976Sth kmem_free(args, sizeof (*args)); 786b9238976Sth } 787b9238976Sth return (EBUSY); 78839d3e169Sevanl } 7897c478bd9Sstevel@tonic-gate } 7907c478bd9Sstevel@tonic-gate mutex_exit(&mvp->v_lock); 7917c478bd9Sstevel@tonic-gate 7927c478bd9Sstevel@tonic-gate /* make sure 
things are zeroed for errout: */ 7937c478bd9Sstevel@tonic-gate rtvp = NULL; 7947c478bd9Sstevel@tonic-gate mi = NULL; 7957c478bd9Sstevel@tonic-gate secdata = NULL; 7967c478bd9Sstevel@tonic-gate 7977c478bd9Sstevel@tonic-gate /* 7987c478bd9Sstevel@tonic-gate * A valid knetconfig structure is required. 7997c478bd9Sstevel@tonic-gate */ 80039d3e169Sevanl if (!(flags & NFSMNT_KNCONF) || 801b9238976Sth args->knconf == NULL || args->knconf->knc_protofmly == NULL || 802b9238976Sth args->knconf->knc_proto == NULL || 803b9238976Sth (strcmp(args->knconf->knc_proto, NC_UDP) == 0)) { 80439d3e169Sevanl if (!(uap->flags & MS_SYSSPACE)) { 80539d3e169Sevanl nfs4_free_args(args); 80639d3e169Sevanl kmem_free(args, sizeof (*args)); 80739d3e169Sevanl } 8087c478bd9Sstevel@tonic-gate return (EINVAL); 80939d3e169Sevanl } 81039d3e169Sevanl 81139d3e169Sevanl if ((strlen(args->knconf->knc_protofmly) >= KNC_STRSIZE) || 812b9238976Sth (strlen(args->knconf->knc_proto) >= KNC_STRSIZE)) { 81339d3e169Sevanl if (!(uap->flags & MS_SYSSPACE)) { 81439d3e169Sevanl nfs4_free_args(args); 81539d3e169Sevanl kmem_free(args, sizeof (*args)); 81639d3e169Sevanl } 81739d3e169Sevanl return (EINVAL); 81839d3e169Sevanl } 81939d3e169Sevanl 8207c478bd9Sstevel@tonic-gate /* 8217c478bd9Sstevel@tonic-gate * Allocate a servinfo4 struct. 
8227c478bd9Sstevel@tonic-gate */ 8237c478bd9Sstevel@tonic-gate svp = kmem_zalloc(sizeof (*svp), KM_SLEEP); 8247c478bd9Sstevel@tonic-gate nfs_rw_init(&svp->sv_lock, NULL, RW_DEFAULT, NULL); 8257c478bd9Sstevel@tonic-gate if (svp_tail) { 8267c478bd9Sstevel@tonic-gate svp_2ndlast = svp_tail; 8277c478bd9Sstevel@tonic-gate svp_tail->sv_next = svp; 8287c478bd9Sstevel@tonic-gate } else { 8297c478bd9Sstevel@tonic-gate svp_head = svp; 8307c478bd9Sstevel@tonic-gate svp_2ndlast = svp; 8317c478bd9Sstevel@tonic-gate } 8327c478bd9Sstevel@tonic-gate 8337c478bd9Sstevel@tonic-gate svp_tail = svp; 83439d3e169Sevanl svp->sv_knconf = args->knconf; 83539d3e169Sevanl args->knconf = NULL; 8367c478bd9Sstevel@tonic-gate 8377c478bd9Sstevel@tonic-gate /* 8387c478bd9Sstevel@tonic-gate * Get server address 8397c478bd9Sstevel@tonic-gate */ 84039d3e169Sevanl if (args->addr == NULL || args->addr->buf == NULL) { 84139d3e169Sevanl error = EINVAL; 8427c478bd9Sstevel@tonic-gate goto errout; 8437c478bd9Sstevel@tonic-gate } 8447c478bd9Sstevel@tonic-gate 84539d3e169Sevanl svp->sv_addr.maxlen = args->addr->maxlen; 84639d3e169Sevanl svp->sv_addr.len = args->addr->len; 84739d3e169Sevanl svp->sv_addr.buf = args->addr->buf; 84839d3e169Sevanl args->addr->buf = NULL; 84939d3e169Sevanl 8507c478bd9Sstevel@tonic-gate /* 8517c478bd9Sstevel@tonic-gate * Get the root fhandle 8527c478bd9Sstevel@tonic-gate */ 85339d3e169Sevanl if (args->fh == NULL || (strlen(args->fh) >= MAXPATHLEN)) { 85439d3e169Sevanl error = EINVAL; 8557c478bd9Sstevel@tonic-gate goto errout; 85639d3e169Sevanl } 8577c478bd9Sstevel@tonic-gate 85839d3e169Sevanl svp->sv_path = args->fh; 85939d3e169Sevanl svp->sv_pathlen = strlen(args->fh) + 1; 86039d3e169Sevanl args->fh = NULL; 8617c478bd9Sstevel@tonic-gate 8627c478bd9Sstevel@tonic-gate /* 8637c478bd9Sstevel@tonic-gate * Get server's hostname 8647c478bd9Sstevel@tonic-gate */ 8657c478bd9Sstevel@tonic-gate if (flags & NFSMNT_HOSTNAME) { 86639d3e169Sevanl if (args->hostname == NULL || 
(strlen(args->hostname) > 867b9238976Sth MAXNETNAMELEN)) { 86839d3e169Sevanl error = EINVAL; 8697c478bd9Sstevel@tonic-gate goto errout; 87039d3e169Sevanl } 87139d3e169Sevanl svp->sv_hostnamelen = strlen(args->hostname) + 1; 87239d3e169Sevanl svp->sv_hostname = args->hostname; 87339d3e169Sevanl args->hostname = NULL; 8747c478bd9Sstevel@tonic-gate } else { 8757c478bd9Sstevel@tonic-gate char *p = "unknown-host"; 87639d3e169Sevanl svp->sv_hostnamelen = strlen(p) + 1; 87739d3e169Sevanl svp->sv_hostname = kmem_zalloc(svp->sv_hostnamelen, KM_SLEEP); 87839d3e169Sevanl (void) strcpy(svp->sv_hostname, p); 8797c478bd9Sstevel@tonic-gate } 8807c478bd9Sstevel@tonic-gate 8817c478bd9Sstevel@tonic-gate /* 8827c478bd9Sstevel@tonic-gate * RDMA MOUNT SUPPORT FOR NFS v4. 8837c478bd9Sstevel@tonic-gate * Establish, is it possible to use RDMA, if so overload the 8847c478bd9Sstevel@tonic-gate * knconf with rdma specific knconf and free the orignal knconf. 8857c478bd9Sstevel@tonic-gate */ 8867c478bd9Sstevel@tonic-gate if ((flags & NFSMNT_TRYRDMA) || (flags & NFSMNT_DORDMA)) { 8877c478bd9Sstevel@tonic-gate /* 8887c478bd9Sstevel@tonic-gate * Determine the addr type for RDMA, IPv4 or v6. 8897c478bd9Sstevel@tonic-gate */ 8907c478bd9Sstevel@tonic-gate if (strcmp(svp->sv_knconf->knc_protofmly, NC_INET) == 0) 8917c478bd9Sstevel@tonic-gate addr_type = AF_INET; 8927c478bd9Sstevel@tonic-gate else if (strcmp(svp->sv_knconf->knc_protofmly, NC_INET6) == 0) 8937c478bd9Sstevel@tonic-gate addr_type = AF_INET6; 8947c478bd9Sstevel@tonic-gate 8957c478bd9Sstevel@tonic-gate if (rdma_reachable(addr_type, &svp->sv_addr, 896b9238976Sth &rdma_knconf) == 0) { 8977c478bd9Sstevel@tonic-gate /* 8987c478bd9Sstevel@tonic-gate * If successful, hijack the orignal knconf and 8997c478bd9Sstevel@tonic-gate * replace with the new one, depending on the flags. 
9007c478bd9Sstevel@tonic-gate */ 9017c478bd9Sstevel@tonic-gate svp->sv_origknconf = svp->sv_knconf; 9027c478bd9Sstevel@tonic-gate svp->sv_knconf = rdma_knconf; 9037c478bd9Sstevel@tonic-gate } else { 9047c478bd9Sstevel@tonic-gate if (flags & NFSMNT_TRYRDMA) { 9057c478bd9Sstevel@tonic-gate #ifdef DEBUG 9067c478bd9Sstevel@tonic-gate if (rdma_debug) 9077c478bd9Sstevel@tonic-gate zcmn_err(getzoneid(), CE_WARN, 9087c478bd9Sstevel@tonic-gate "no RDMA onboard, revert\n"); 9097c478bd9Sstevel@tonic-gate #endif 9107c478bd9Sstevel@tonic-gate } 9117c478bd9Sstevel@tonic-gate 9127c478bd9Sstevel@tonic-gate if (flags & NFSMNT_DORDMA) { 9137c478bd9Sstevel@tonic-gate /* 9147c478bd9Sstevel@tonic-gate * If proto=rdma is specified and no RDMA 9157c478bd9Sstevel@tonic-gate * path to this server is avialable then 9167c478bd9Sstevel@tonic-gate * ditch this server. 9177c478bd9Sstevel@tonic-gate * This is not included in the mountable 9187c478bd9Sstevel@tonic-gate * server list or the replica list. 9197c478bd9Sstevel@tonic-gate * Check if more servers are specified; 9207c478bd9Sstevel@tonic-gate * Failover case, otherwise bail out of mount. 
9217c478bd9Sstevel@tonic-gate */ 922b9238976Sth if (args->nfs_args_ext == NFS_ARGS_EXTB && 923b9238976Sth args->nfs_ext_u.nfs_extB.next != NULL) { 92439d3e169Sevanl data = (char *) 925b9238976Sth args->nfs_ext_u.nfs_extB.next; 9267c478bd9Sstevel@tonic-gate if (uap->flags & MS_RDONLY && 9277c478bd9Sstevel@tonic-gate !(flags & NFSMNT_SOFT)) { 9287c478bd9Sstevel@tonic-gate if (svp_head->sv_next == NULL) { 9297c478bd9Sstevel@tonic-gate svp_tail = NULL; 9307c478bd9Sstevel@tonic-gate svp_2ndlast = NULL; 9317c478bd9Sstevel@tonic-gate sv4_free(svp_head); 9327c478bd9Sstevel@tonic-gate goto more; 9337c478bd9Sstevel@tonic-gate } else { 9347c478bd9Sstevel@tonic-gate svp_tail = svp_2ndlast; 9357c478bd9Sstevel@tonic-gate svp_2ndlast->sv_next = 9367c478bd9Sstevel@tonic-gate NULL; 9377c478bd9Sstevel@tonic-gate sv4_free(svp); 9387c478bd9Sstevel@tonic-gate goto more; 9397c478bd9Sstevel@tonic-gate } 9407c478bd9Sstevel@tonic-gate } 9417c478bd9Sstevel@tonic-gate } else { 9427c478bd9Sstevel@tonic-gate /* 9437c478bd9Sstevel@tonic-gate * This is the last server specified 9447c478bd9Sstevel@tonic-gate * in the nfs_args list passed down 9457c478bd9Sstevel@tonic-gate * and its not rdma capable. 
9467c478bd9Sstevel@tonic-gate */ 9477c478bd9Sstevel@tonic-gate if (svp_head->sv_next == NULL) { 9487c478bd9Sstevel@tonic-gate /* 9497c478bd9Sstevel@tonic-gate * Is this the only one 9507c478bd9Sstevel@tonic-gate */ 9517c478bd9Sstevel@tonic-gate error = EINVAL; 9527c478bd9Sstevel@tonic-gate #ifdef DEBUG 9537c478bd9Sstevel@tonic-gate if (rdma_debug) 9547c478bd9Sstevel@tonic-gate zcmn_err(getzoneid(), 9557c478bd9Sstevel@tonic-gate CE_WARN, 9567c478bd9Sstevel@tonic-gate "No RDMA srv"); 9577c478bd9Sstevel@tonic-gate #endif 9587c478bd9Sstevel@tonic-gate goto errout; 9597c478bd9Sstevel@tonic-gate } else { 9607c478bd9Sstevel@tonic-gate /* 9617c478bd9Sstevel@tonic-gate * There is list, since some 9627c478bd9Sstevel@tonic-gate * servers specified before 9637c478bd9Sstevel@tonic-gate * this passed all requirements 9647c478bd9Sstevel@tonic-gate */ 9657c478bd9Sstevel@tonic-gate svp_tail = svp_2ndlast; 9667c478bd9Sstevel@tonic-gate svp_2ndlast->sv_next = NULL; 9677c478bd9Sstevel@tonic-gate sv4_free(svp); 9687c478bd9Sstevel@tonic-gate goto proceed; 9697c478bd9Sstevel@tonic-gate } 9707c478bd9Sstevel@tonic-gate } 9717c478bd9Sstevel@tonic-gate } 9727c478bd9Sstevel@tonic-gate } 9737c478bd9Sstevel@tonic-gate } 9747c478bd9Sstevel@tonic-gate 9757c478bd9Sstevel@tonic-gate /* 9767c478bd9Sstevel@tonic-gate * If there are syncaddr and netname data, load them in. This is 9777c478bd9Sstevel@tonic-gate * to support data needed for NFSV4 when AUTH_DH is the negotiated 9787c478bd9Sstevel@tonic-gate * flavor via SECINFO. (instead of using MOUNT protocol in V3). 9797c478bd9Sstevel@tonic-gate */ 98039d3e169Sevanl if (args->flags & NFSMNT_SECURE) { 98139d3e169Sevanl svp->sv_dhsec = create_authdh_data(args->netname, 982b9238976Sth strlen(args->netname), 983b9238976Sth args->syncaddr, svp->sv_knconf); 9847c478bd9Sstevel@tonic-gate } 9857c478bd9Sstevel@tonic-gate 9867c478bd9Sstevel@tonic-gate /* 9877c478bd9Sstevel@tonic-gate * Get the extention data which has the security data structure. 
9887c478bd9Sstevel@tonic-gate * This includes data for AUTH_SYS as well. 9897c478bd9Sstevel@tonic-gate */ 9907c478bd9Sstevel@tonic-gate if (flags & NFSMNT_NEWARGS) { 99139d3e169Sevanl switch (args->nfs_args_ext) { 9927c478bd9Sstevel@tonic-gate case NFS_ARGS_EXTA: 9937c478bd9Sstevel@tonic-gate case NFS_ARGS_EXTB: 9947c478bd9Sstevel@tonic-gate /* 9957c478bd9Sstevel@tonic-gate * Indicating the application is using the new 9967c478bd9Sstevel@tonic-gate * sec_data structure to pass in the security 9977c478bd9Sstevel@tonic-gate * data. 9987c478bd9Sstevel@tonic-gate */ 99939d3e169Sevanl secdata = args->nfs_ext_u.nfs_extA.secdata; 100039d3e169Sevanl if (secdata == NULL) { 10017c478bd9Sstevel@tonic-gate error = EINVAL; 100239d3e169Sevanl } else if (uap->flags & MS_SYSSPACE) { 100339d3e169Sevanl /* 100439d3e169Sevanl * Need to validate the flavor here if 100539d3e169Sevanl * sysspace, userspace was already 100639d3e169Sevanl * validate from the nfs_copyin function. 100739d3e169Sevanl */ 100839d3e169Sevanl switch (secdata->rpcflavor) { 100939d3e169Sevanl case AUTH_NONE: 101039d3e169Sevanl case AUTH_UNIX: 101139d3e169Sevanl case AUTH_LOOPBACK: 101239d3e169Sevanl case AUTH_DES: 101339d3e169Sevanl case RPCSEC_GSS: 101439d3e169Sevanl break; 101539d3e169Sevanl default: 101639d3e169Sevanl error = EINVAL; 101739d3e169Sevanl goto errout; 101839d3e169Sevanl } 10197c478bd9Sstevel@tonic-gate } 102039d3e169Sevanl args->nfs_ext_u.nfs_extA.secdata = NULL; 10217c478bd9Sstevel@tonic-gate break; 10227c478bd9Sstevel@tonic-gate 10237c478bd9Sstevel@tonic-gate default: 10247c478bd9Sstevel@tonic-gate error = EINVAL; 10257c478bd9Sstevel@tonic-gate break; 10267c478bd9Sstevel@tonic-gate } 10277c478bd9Sstevel@tonic-gate 10287c478bd9Sstevel@tonic-gate } else if (flags & NFSMNT_SECURE) { 10297c478bd9Sstevel@tonic-gate /* 10307c478bd9Sstevel@tonic-gate * NFSMNT_SECURE is deprecated but we keep it 1031b9238976Sth * to support the rogue user-generated application 10327c478bd9Sstevel@tonic-gate * that may 
use this undocumented interface to do 1033b9238976Sth * AUTH_DH security, e.g. our own rexd. 1034b9238976Sth * 1035b9238976Sth * Also note that NFSMNT_SECURE is used for passing 1036b9238976Sth * AUTH_DH info to be used in negotiation. 10377c478bd9Sstevel@tonic-gate */ 103839d3e169Sevanl secdata = create_authdh_data(args->netname, 1039b9238976Sth strlen(args->netname), args->syncaddr, svp->sv_knconf); 10407c478bd9Sstevel@tonic-gate 10417c478bd9Sstevel@tonic-gate } else { 10427c478bd9Sstevel@tonic-gate secdata = kmem_alloc(sizeof (*secdata), KM_SLEEP); 10437c478bd9Sstevel@tonic-gate secdata->secmod = secdata->rpcflavor = AUTH_SYS; 10447c478bd9Sstevel@tonic-gate secdata->data = NULL; 10457c478bd9Sstevel@tonic-gate } 10467c478bd9Sstevel@tonic-gate 10477c478bd9Sstevel@tonic-gate svp->sv_secdata = secdata; 10487c478bd9Sstevel@tonic-gate 10497c478bd9Sstevel@tonic-gate /* 10507c478bd9Sstevel@tonic-gate * User does not explictly specify a flavor, and a user 10517c478bd9Sstevel@tonic-gate * defined default flavor is passed down. 10527c478bd9Sstevel@tonic-gate */ 10537c478bd9Sstevel@tonic-gate if (flags & NFSMNT_SECDEFAULT) { 10547c478bd9Sstevel@tonic-gate (void) nfs_rw_enter_sig(&svp->sv_lock, RW_WRITER, 0); 10557c478bd9Sstevel@tonic-gate svp->sv_flags |= SV4_TRYSECDEFAULT; 10567c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 10577c478bd9Sstevel@tonic-gate } 10587c478bd9Sstevel@tonic-gate 10597c478bd9Sstevel@tonic-gate /* 10607c478bd9Sstevel@tonic-gate * Failover support: 10617c478bd9Sstevel@tonic-gate * 10627c478bd9Sstevel@tonic-gate * We may have a linked list of nfs_args structures, 10637c478bd9Sstevel@tonic-gate * which means the user is looking for failover. If 10647c478bd9Sstevel@tonic-gate * the mount is either not "read-only" or "soft", 10657c478bd9Sstevel@tonic-gate * we want to bail out with EINVAL. 
10667c478bd9Sstevel@tonic-gate */ 106739d3e169Sevanl if (args->nfs_args_ext == NFS_ARGS_EXTB && 106839d3e169Sevanl args->nfs_ext_u.nfs_extB.next != NULL) { 10697c478bd9Sstevel@tonic-gate if (uap->flags & MS_RDONLY && !(flags & NFSMNT_SOFT)) { 107039d3e169Sevanl data = (char *)args->nfs_ext_u.nfs_extB.next; 10717c478bd9Sstevel@tonic-gate goto more; 10727c478bd9Sstevel@tonic-gate } 10737c478bd9Sstevel@tonic-gate error = EINVAL; 10747c478bd9Sstevel@tonic-gate goto errout; 10757c478bd9Sstevel@tonic-gate } 10767c478bd9Sstevel@tonic-gate 10777c478bd9Sstevel@tonic-gate /* 10787c478bd9Sstevel@tonic-gate * Determine the zone we're being mounted into. 10797c478bd9Sstevel@tonic-gate */ 108045916cd2Sjpk zone_hold(mntzone = zone); /* start with this assumption */ 10817c478bd9Sstevel@tonic-gate if (getzoneid() == GLOBAL_ZONEID) { 108245916cd2Sjpk zone_rele(mntzone); 10837c478bd9Sstevel@tonic-gate mntzone = zone_find_by_path(refstr_value(vfsp->vfs_mntpt)); 10847c478bd9Sstevel@tonic-gate ASSERT(mntzone != NULL); 10857c478bd9Sstevel@tonic-gate if (mntzone != zone) { 10867c478bd9Sstevel@tonic-gate error = EBUSY; 10877c478bd9Sstevel@tonic-gate goto errout; 10887c478bd9Sstevel@tonic-gate } 10897c478bd9Sstevel@tonic-gate } 10907c478bd9Sstevel@tonic-gate 109145916cd2Sjpk if (is_system_labeled()) { 109245916cd2Sjpk error = nfs_mount_label_policy(vfsp, &svp->sv_addr, 109345916cd2Sjpk svp->sv_knconf, cr); 109445916cd2Sjpk 109545916cd2Sjpk if (error > 0) 109645916cd2Sjpk goto errout; 109745916cd2Sjpk 109845916cd2Sjpk if (error == -1) { 109945916cd2Sjpk /* change mount to read-only to prevent write-down */ 110045916cd2Sjpk vfs_setmntopt(vfsp, MNTOPT_RO, NULL, 0); 110145916cd2Sjpk } 110245916cd2Sjpk } 110345916cd2Sjpk 11047c478bd9Sstevel@tonic-gate /* 11057c478bd9Sstevel@tonic-gate * Stop the mount from going any further if the zone is going away. 
11067c478bd9Sstevel@tonic-gate */ 110745916cd2Sjpk if (zone_status_get(mntzone) >= ZONE_IS_SHUTTING_DOWN) { 11087c478bd9Sstevel@tonic-gate error = EBUSY; 11097c478bd9Sstevel@tonic-gate goto errout; 11107c478bd9Sstevel@tonic-gate } 11117c478bd9Sstevel@tonic-gate 11127c478bd9Sstevel@tonic-gate /* 11137c478bd9Sstevel@tonic-gate * Get root vnode. 11147c478bd9Sstevel@tonic-gate */ 11157c478bd9Sstevel@tonic-gate proceed: 111645916cd2Sjpk error = nfs4rootvp(&rtvp, vfsp, svp_head, flags, cr, mntzone); 111750a83466Sjwahlig if (error) { 111850a83466Sjwahlig /* if nfs4rootvp failed, it will free svp_head */ 111950a83466Sjwahlig svp_head = NULL; 11207c478bd9Sstevel@tonic-gate goto errout; 112150a83466Sjwahlig } 11227c478bd9Sstevel@tonic-gate 11237c478bd9Sstevel@tonic-gate mi = VTOMI4(rtvp); 11247c478bd9Sstevel@tonic-gate 11257c478bd9Sstevel@tonic-gate /* 11267c478bd9Sstevel@tonic-gate * Send client id to the server, if necessary 11277c478bd9Sstevel@tonic-gate */ 11287c478bd9Sstevel@tonic-gate nfs4_error_zinit(&n4e); 11297c478bd9Sstevel@tonic-gate nfs4setclientid(mi, cr, FALSE, &n4e); 1130b9238976Sth 11317c478bd9Sstevel@tonic-gate error = n4e.error; 11327c478bd9Sstevel@tonic-gate 11337c478bd9Sstevel@tonic-gate if (error) 11347c478bd9Sstevel@tonic-gate goto errout; 11357c478bd9Sstevel@tonic-gate 11367c478bd9Sstevel@tonic-gate /* 11377c478bd9Sstevel@tonic-gate * Set option fields in the mount info record 11387c478bd9Sstevel@tonic-gate */ 11397c478bd9Sstevel@tonic-gate 11407c478bd9Sstevel@tonic-gate if (svp_head->sv_next) { 11417c478bd9Sstevel@tonic-gate mutex_enter(&mi->mi_lock); 11427c478bd9Sstevel@tonic-gate mi->mi_flags |= MI4_LLOCK; 11437c478bd9Sstevel@tonic-gate mutex_exit(&mi->mi_lock); 11447c478bd9Sstevel@tonic-gate } 114539d3e169Sevanl error = nfs4_setopts(rtvp, DATAMODEL_NATIVE, args); 1146b9238976Sth if (error) 1147b9238976Sth goto errout; 1148b9238976Sth 1149b9238976Sth /* 1150b9238976Sth * Time to tie in the mirror mount info at last! 
1151b9238976Sth */ 1152b9238976Sth if (flags & NFSMNT_EPHEMERAL) 1153d3a14591SThomas Haynes error = nfs4_record_ephemeral_mount(mi, mvp); 11547c478bd9Sstevel@tonic-gate 11557c478bd9Sstevel@tonic-gate errout: 11567c478bd9Sstevel@tonic-gate if (error) { 11577c478bd9Sstevel@tonic-gate if (rtvp != NULL) { 11587c478bd9Sstevel@tonic-gate rp = VTOR4(rtvp); 11597c478bd9Sstevel@tonic-gate if (rp->r_flags & R4HASHED) 11607c478bd9Sstevel@tonic-gate rp4_rmhash(rp); 11617c478bd9Sstevel@tonic-gate } 11627c478bd9Sstevel@tonic-gate if (mi != NULL) { 11637c478bd9Sstevel@tonic-gate nfs4_async_stop(vfsp); 11647c478bd9Sstevel@tonic-gate nfs4_async_manager_stop(vfsp); 11657c478bd9Sstevel@tonic-gate nfs4_remove_mi_from_server(mi, NULL); 116650a83466Sjwahlig if (rtvp != NULL) 11677c478bd9Sstevel@tonic-gate VN_RELE(rtvp); 116845916cd2Sjpk if (mntzone != NULL) 116945916cd2Sjpk zone_rele(mntzone); 117050a83466Sjwahlig /* need to remove it from the zone */ 117150a83466Sjwahlig removed = nfs4_mi_zonelist_remove(mi); 117250a83466Sjwahlig if (removed) 117350a83466Sjwahlig zone_rele(mi->mi_zone); 117450a83466Sjwahlig MI4_RELE(mi); 117539d3e169Sevanl if (!(uap->flags & MS_SYSSPACE) && args) { 117639d3e169Sevanl nfs4_free_args(args); 117739d3e169Sevanl kmem_free(args, sizeof (*args)); 117839d3e169Sevanl } 11797c478bd9Sstevel@tonic-gate return (error); 11807c478bd9Sstevel@tonic-gate } 118150a83466Sjwahlig if (svp_head) 118250a83466Sjwahlig sv4_free(svp_head); 11837c478bd9Sstevel@tonic-gate } 11847c478bd9Sstevel@tonic-gate 118539d3e169Sevanl if (!(uap->flags & MS_SYSSPACE) && args) { 118639d3e169Sevanl nfs4_free_args(args); 118739d3e169Sevanl kmem_free(args, sizeof (*args)); 118839d3e169Sevanl } 11897c478bd9Sstevel@tonic-gate if (rtvp != NULL) 11907c478bd9Sstevel@tonic-gate VN_RELE(rtvp); 11917c478bd9Sstevel@tonic-gate 119245916cd2Sjpk if (mntzone != NULL) 119345916cd2Sjpk zone_rele(mntzone); 119445916cd2Sjpk 11957c478bd9Sstevel@tonic-gate return (error); 11967c478bd9Sstevel@tonic-gate } 
11977c478bd9Sstevel@tonic-gate 119839d3e169Sevanl #ifdef DEBUG 11997c478bd9Sstevel@tonic-gate #define VERS_MSG "NFS4 server " 12007c478bd9Sstevel@tonic-gate #else 12017c478bd9Sstevel@tonic-gate #define VERS_MSG "NFS server " 12027c478bd9Sstevel@tonic-gate #endif 12037c478bd9Sstevel@tonic-gate 120439d3e169Sevanl #define READ_MSG \ 12057c478bd9Sstevel@tonic-gate VERS_MSG "%s returned 0 for read transfer size" 120639d3e169Sevanl #define WRITE_MSG \ 12077c478bd9Sstevel@tonic-gate VERS_MSG "%s returned 0 for write transfer size" 120839d3e169Sevanl #define SIZE_MSG \ 12097c478bd9Sstevel@tonic-gate VERS_MSG "%s returned 0 for maximum file size" 12107c478bd9Sstevel@tonic-gate 12117c478bd9Sstevel@tonic-gate /* 12127c478bd9Sstevel@tonic-gate * Get the symbolic link text from the server for a given filehandle 12137c478bd9Sstevel@tonic-gate * of that symlink. 12147c478bd9Sstevel@tonic-gate * 121539d3e169Sevanl * (get symlink text) PUTFH READLINK 12167c478bd9Sstevel@tonic-gate */ 12177c478bd9Sstevel@tonic-gate static int 12187c478bd9Sstevel@tonic-gate getlinktext_otw(mntinfo4_t *mi, nfs_fh4 *fh, char **linktextp, cred_t *cr, 1219b9238976Sth int flags) 12207c478bd9Sstevel@tonic-gate { 12217c478bd9Sstevel@tonic-gate COMPOUND4args_clnt args; 12227c478bd9Sstevel@tonic-gate COMPOUND4res_clnt res; 12237c478bd9Sstevel@tonic-gate int doqueue; 12247c478bd9Sstevel@tonic-gate nfs_argop4 argop[2]; 12257c478bd9Sstevel@tonic-gate nfs_resop4 *resop; 12267c478bd9Sstevel@tonic-gate READLINK4res *lr_res; 12277c478bd9Sstevel@tonic-gate uint_t len; 12287c478bd9Sstevel@tonic-gate bool_t needrecov = FALSE; 12297c478bd9Sstevel@tonic-gate nfs4_recov_state_t recov_state; 12307c478bd9Sstevel@tonic-gate nfs4_sharedfh_t *sfh; 12317c478bd9Sstevel@tonic-gate nfs4_error_t e; 12327c478bd9Sstevel@tonic-gate int num_retry = nfs4_max_mount_retry; 12337c478bd9Sstevel@tonic-gate int recovery = !(flags & NFS4_GETFH_NEEDSOP); 12347c478bd9Sstevel@tonic-gate 12357c478bd9Sstevel@tonic-gate sfh = sfh4_get(fh, mi); 
12367c478bd9Sstevel@tonic-gate recov_state.rs_flags = 0; 12377c478bd9Sstevel@tonic-gate recov_state.rs_num_retry_despite_err = 0; 12387c478bd9Sstevel@tonic-gate 12397c478bd9Sstevel@tonic-gate recov_retry: 12407c478bd9Sstevel@tonic-gate nfs4_error_zinit(&e); 12417c478bd9Sstevel@tonic-gate 12427c478bd9Sstevel@tonic-gate args.array_len = 2; 12437c478bd9Sstevel@tonic-gate args.array = argop; 12447c478bd9Sstevel@tonic-gate args.ctag = TAG_GET_SYMLINK; 12457c478bd9Sstevel@tonic-gate 12467c478bd9Sstevel@tonic-gate if (! recovery) { 12477c478bd9Sstevel@tonic-gate e.error = nfs4_start_op(mi, NULL, NULL, &recov_state); 12487c478bd9Sstevel@tonic-gate if (e.error) { 12497c478bd9Sstevel@tonic-gate sfh4_rele(&sfh); 12507c478bd9Sstevel@tonic-gate return (e.error); 12517c478bd9Sstevel@tonic-gate } 12527c478bd9Sstevel@tonic-gate } 12537c478bd9Sstevel@tonic-gate 12547c478bd9Sstevel@tonic-gate /* 0. putfh symlink fh */ 12557c478bd9Sstevel@tonic-gate argop[0].argop = OP_CPUTFH; 12567c478bd9Sstevel@tonic-gate argop[0].nfs_argop4_u.opcputfh.sfh = sfh; 12577c478bd9Sstevel@tonic-gate 12587c478bd9Sstevel@tonic-gate /* 1. 
readlink */ 12597c478bd9Sstevel@tonic-gate argop[1].argop = OP_READLINK; 12607c478bd9Sstevel@tonic-gate 12617c478bd9Sstevel@tonic-gate doqueue = 1; 12627c478bd9Sstevel@tonic-gate 12637c478bd9Sstevel@tonic-gate rfs4call(mi, &args, &res, cr, &doqueue, 0, &e); 12647c478bd9Sstevel@tonic-gate 12657c478bd9Sstevel@tonic-gate needrecov = nfs4_needs_recovery(&e, FALSE, mi->mi_vfsp); 12667c478bd9Sstevel@tonic-gate 12677c478bd9Sstevel@tonic-gate if (needrecov && !recovery && num_retry-- > 0) { 12687c478bd9Sstevel@tonic-gate 12697c478bd9Sstevel@tonic-gate NFS4_DEBUG(nfs4_client_recov_debug, (CE_NOTE, 1270b9238976Sth "getlinktext_otw: initiating recovery\n")); 12717c478bd9Sstevel@tonic-gate 12727c478bd9Sstevel@tonic-gate if (nfs4_start_recovery(&e, mi, NULL, NULL, NULL, NULL, 1273b9238976Sth OP_READLINK, NULL) == FALSE) { 1274b9238976Sth nfs4_end_op(mi, NULL, NULL, &recov_state, needrecov); 1275b9238976Sth if (!e.error) 1276b9238976Sth (void) xdr_free(xdr_COMPOUND4res_clnt, 1277b9238976Sth (caddr_t)&res); 12787c478bd9Sstevel@tonic-gate goto recov_retry; 12797c478bd9Sstevel@tonic-gate } 12807c478bd9Sstevel@tonic-gate } 12817c478bd9Sstevel@tonic-gate 12827c478bd9Sstevel@tonic-gate /* 12837c478bd9Sstevel@tonic-gate * If non-NFS4 pcol error and/or we weren't able to recover. 12847c478bd9Sstevel@tonic-gate */ 12857c478bd9Sstevel@tonic-gate if (e.error != 0) { 12867c478bd9Sstevel@tonic-gate if (! recovery) 12877c478bd9Sstevel@tonic-gate nfs4_end_op(mi, NULL, NULL, &recov_state, needrecov); 12887c478bd9Sstevel@tonic-gate sfh4_rele(&sfh); 12897c478bd9Sstevel@tonic-gate return (e.error); 12907c478bd9Sstevel@tonic-gate } 12917c478bd9Sstevel@tonic-gate 12927c478bd9Sstevel@tonic-gate if (res.status) { 12937c478bd9Sstevel@tonic-gate e.error = geterrno4(res.status); 12947c478bd9Sstevel@tonic-gate (void) xdr_free(xdr_COMPOUND4res_clnt, (caddr_t)&res); 12957c478bd9Sstevel@tonic-gate if (! 
recovery) 12967c478bd9Sstevel@tonic-gate nfs4_end_op(mi, NULL, NULL, &recov_state, needrecov); 12977c478bd9Sstevel@tonic-gate sfh4_rele(&sfh); 12987c478bd9Sstevel@tonic-gate return (e.error); 12997c478bd9Sstevel@tonic-gate } 13007c478bd9Sstevel@tonic-gate 13017c478bd9Sstevel@tonic-gate /* res.status == NFS4_OK */ 13027c478bd9Sstevel@tonic-gate ASSERT(res.status == NFS4_OK); 13037c478bd9Sstevel@tonic-gate 130439d3e169Sevanl resop = &res.array[1]; /* readlink res */ 13057c478bd9Sstevel@tonic-gate lr_res = &resop->nfs_resop4_u.opreadlink; 13067c478bd9Sstevel@tonic-gate 13077c478bd9Sstevel@tonic-gate /* treat symlink name as data */ 13087c478bd9Sstevel@tonic-gate *linktextp = utf8_to_str(&lr_res->link, &len, NULL); 13097c478bd9Sstevel@tonic-gate 13107c478bd9Sstevel@tonic-gate if (! recovery) 13117c478bd9Sstevel@tonic-gate nfs4_end_op(mi, NULL, NULL, &recov_state, needrecov); 13127c478bd9Sstevel@tonic-gate sfh4_rele(&sfh); 13137c478bd9Sstevel@tonic-gate (void) xdr_free(xdr_COMPOUND4res_clnt, (caddr_t)&res); 13147c478bd9Sstevel@tonic-gate return (0); 13157c478bd9Sstevel@tonic-gate } 13167c478bd9Sstevel@tonic-gate 13177c478bd9Sstevel@tonic-gate /* 13187c478bd9Sstevel@tonic-gate * Skip over consecutive slashes and "/./" in a pathname. 13197c478bd9Sstevel@tonic-gate */ 13207c478bd9Sstevel@tonic-gate void 13217c478bd9Sstevel@tonic-gate pathname_skipslashdot(struct pathname *pnp) 13227c478bd9Sstevel@tonic-gate { 13237c478bd9Sstevel@tonic-gate char *c1, *c2; 13247c478bd9Sstevel@tonic-gate 13257c478bd9Sstevel@tonic-gate while (pnp->pn_pathlen > 0 && *pnp->pn_path == '/') { 13267c478bd9Sstevel@tonic-gate 13277c478bd9Sstevel@tonic-gate c1 = pnp->pn_path + 1; 13287c478bd9Sstevel@tonic-gate c2 = pnp->pn_path + 2; 13297c478bd9Sstevel@tonic-gate 13307c478bd9Sstevel@tonic-gate if (*c1 == '.' && (*c2 == '/' || *c2 == '\0')) { 13317c478bd9Sstevel@tonic-gate pnp->pn_path = pnp->pn_path + 2; /* skip "/." 
*/ 13327c478bd9Sstevel@tonic-gate pnp->pn_pathlen = pnp->pn_pathlen - 2; 13337c478bd9Sstevel@tonic-gate } else { 13347c478bd9Sstevel@tonic-gate pnp->pn_path++; 13357c478bd9Sstevel@tonic-gate pnp->pn_pathlen--; 13367c478bd9Sstevel@tonic-gate } 13377c478bd9Sstevel@tonic-gate } 13387c478bd9Sstevel@tonic-gate } 13397c478bd9Sstevel@tonic-gate 13407c478bd9Sstevel@tonic-gate /* 13417c478bd9Sstevel@tonic-gate * Resolve a symbolic link path. The symlink is in the nth component of 13427c478bd9Sstevel@tonic-gate * svp->sv_path and has an nfs4 file handle "fh". 13437c478bd9Sstevel@tonic-gate * Upon return, the sv_path will point to the new path that has the nth 13447c478bd9Sstevel@tonic-gate * component resolved to its symlink text. 13457c478bd9Sstevel@tonic-gate */ 13467c478bd9Sstevel@tonic-gate int 13477c478bd9Sstevel@tonic-gate resolve_sympath(mntinfo4_t *mi, servinfo4_t *svp, int nth, nfs_fh4 *fh, 1348b9238976Sth cred_t *cr, int flags) 13497c478bd9Sstevel@tonic-gate { 13507c478bd9Sstevel@tonic-gate char *oldpath; 13517c478bd9Sstevel@tonic-gate char *symlink, *newpath; 13527c478bd9Sstevel@tonic-gate struct pathname oldpn, newpn; 13537c478bd9Sstevel@tonic-gate char component[MAXNAMELEN]; 13547c478bd9Sstevel@tonic-gate int i, addlen, error = 0; 13557c478bd9Sstevel@tonic-gate int oldpathlen; 13567c478bd9Sstevel@tonic-gate 13577c478bd9Sstevel@tonic-gate /* Get the symbolic link text over the wire. */ 13587c478bd9Sstevel@tonic-gate error = getlinktext_otw(mi, fh, &symlink, cr, flags); 13597c478bd9Sstevel@tonic-gate 13607c478bd9Sstevel@tonic-gate if (error || symlink == NULL || strlen(symlink) == 0) 13617c478bd9Sstevel@tonic-gate return (error); 13627c478bd9Sstevel@tonic-gate 13637c478bd9Sstevel@tonic-gate /* 13647c478bd9Sstevel@tonic-gate * Compose the new pathname. 13657c478bd9Sstevel@tonic-gate * Note: 13667c478bd9Sstevel@tonic-gate * - only the nth component is resolved for the pathname. 
13677c478bd9Sstevel@tonic-gate * - pathname.pn_pathlen does not count the ending null byte. 13687c478bd9Sstevel@tonic-gate */ 13697c478bd9Sstevel@tonic-gate (void) nfs_rw_enter_sig(&svp->sv_lock, RW_READER, 0); 13707c478bd9Sstevel@tonic-gate oldpath = svp->sv_path; 13717c478bd9Sstevel@tonic-gate oldpathlen = svp->sv_pathlen; 13727c478bd9Sstevel@tonic-gate if (error = pn_get(oldpath, UIO_SYSSPACE, &oldpn)) { 13737c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 13747c478bd9Sstevel@tonic-gate kmem_free(symlink, strlen(symlink) + 1); 13757c478bd9Sstevel@tonic-gate return (error); 13767c478bd9Sstevel@tonic-gate } 13777c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 13787c478bd9Sstevel@tonic-gate pn_alloc(&newpn); 13797c478bd9Sstevel@tonic-gate 13807c478bd9Sstevel@tonic-gate /* 13817c478bd9Sstevel@tonic-gate * Skip over previous components from the oldpath so that the 13827c478bd9Sstevel@tonic-gate * oldpn.pn_path will point to the symlink component. Skip 13837c478bd9Sstevel@tonic-gate * leading slashes and "/./" (no OP_LOOKUP on ".") so that 13847c478bd9Sstevel@tonic-gate * pn_getcompnent can get the component. 13857c478bd9Sstevel@tonic-gate */ 13867c478bd9Sstevel@tonic-gate for (i = 1; i < nth; i++) { 13877c478bd9Sstevel@tonic-gate pathname_skipslashdot(&oldpn); 13887c478bd9Sstevel@tonic-gate error = pn_getcomponent(&oldpn, component); 13897c478bd9Sstevel@tonic-gate if (error) 13907c478bd9Sstevel@tonic-gate goto out; 13917c478bd9Sstevel@tonic-gate } 13927c478bd9Sstevel@tonic-gate 13937c478bd9Sstevel@tonic-gate /* 13947c478bd9Sstevel@tonic-gate * Copy the old path upto the component right before the symlink 13957c478bd9Sstevel@tonic-gate * if the symlink is not an absolute path. 
13967c478bd9Sstevel@tonic-gate */ 13977c478bd9Sstevel@tonic-gate if (symlink[0] != '/') { 13987c478bd9Sstevel@tonic-gate addlen = oldpn.pn_path - oldpn.pn_buf; 13997c478bd9Sstevel@tonic-gate bcopy(oldpn.pn_buf, newpn.pn_path, addlen); 14007c478bd9Sstevel@tonic-gate newpn.pn_pathlen += addlen; 14017c478bd9Sstevel@tonic-gate newpn.pn_path += addlen; 14027c478bd9Sstevel@tonic-gate newpn.pn_buf[newpn.pn_pathlen] = '/'; 14037c478bd9Sstevel@tonic-gate newpn.pn_pathlen++; 14047c478bd9Sstevel@tonic-gate newpn.pn_path++; 14057c478bd9Sstevel@tonic-gate } 14067c478bd9Sstevel@tonic-gate 14077c478bd9Sstevel@tonic-gate /* copy the resolved symbolic link text */ 14087c478bd9Sstevel@tonic-gate addlen = strlen(symlink); 14097c478bd9Sstevel@tonic-gate if (newpn.pn_pathlen + addlen >= newpn.pn_bufsize) { 14107c478bd9Sstevel@tonic-gate error = ENAMETOOLONG; 14117c478bd9Sstevel@tonic-gate goto out; 14127c478bd9Sstevel@tonic-gate } 14137c478bd9Sstevel@tonic-gate bcopy(symlink, newpn.pn_path, addlen); 14147c478bd9Sstevel@tonic-gate newpn.pn_pathlen += addlen; 14157c478bd9Sstevel@tonic-gate newpn.pn_path += addlen; 14167c478bd9Sstevel@tonic-gate 14177c478bd9Sstevel@tonic-gate /* 14187c478bd9Sstevel@tonic-gate * Check if there is any remaining path after the symlink component. 14197c478bd9Sstevel@tonic-gate * First, skip the symlink component. 14207c478bd9Sstevel@tonic-gate */ 14217c478bd9Sstevel@tonic-gate pathname_skipslashdot(&oldpn); 14227c478bd9Sstevel@tonic-gate if (error = pn_getcomponent(&oldpn, component)) 14237c478bd9Sstevel@tonic-gate goto out; 14247c478bd9Sstevel@tonic-gate 14257c478bd9Sstevel@tonic-gate addlen = pn_pathleft(&oldpn); /* includes counting the slash */ 14267c478bd9Sstevel@tonic-gate 14277c478bd9Sstevel@tonic-gate /* 14287c478bd9Sstevel@tonic-gate * Copy the remaining path to the new pathname if there is any. 
14297c478bd9Sstevel@tonic-gate */ 14307c478bd9Sstevel@tonic-gate if (addlen > 0) { 14317c478bd9Sstevel@tonic-gate if (newpn.pn_pathlen + addlen >= newpn.pn_bufsize) { 14327c478bd9Sstevel@tonic-gate error = ENAMETOOLONG; 14337c478bd9Sstevel@tonic-gate goto out; 14347c478bd9Sstevel@tonic-gate } 14357c478bd9Sstevel@tonic-gate bcopy(oldpn.pn_path, newpn.pn_path, addlen); 14367c478bd9Sstevel@tonic-gate newpn.pn_pathlen += addlen; 14377c478bd9Sstevel@tonic-gate } 14387c478bd9Sstevel@tonic-gate newpn.pn_buf[newpn.pn_pathlen] = '\0'; 14397c478bd9Sstevel@tonic-gate 14407c478bd9Sstevel@tonic-gate /* get the newpath and store it in the servinfo4_t */ 14417c478bd9Sstevel@tonic-gate newpath = kmem_alloc(newpn.pn_pathlen + 1, KM_SLEEP); 14427c478bd9Sstevel@tonic-gate bcopy(newpn.pn_buf, newpath, newpn.pn_pathlen); 14437c478bd9Sstevel@tonic-gate newpath[newpn.pn_pathlen] = '\0'; 14447c478bd9Sstevel@tonic-gate 14457c478bd9Sstevel@tonic-gate (void) nfs_rw_enter_sig(&svp->sv_lock, RW_WRITER, 0); 14467c478bd9Sstevel@tonic-gate svp->sv_path = newpath; 14477c478bd9Sstevel@tonic-gate svp->sv_pathlen = strlen(newpath) + 1; 14487c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 14497c478bd9Sstevel@tonic-gate 14507c478bd9Sstevel@tonic-gate kmem_free(oldpath, oldpathlen); 14517c478bd9Sstevel@tonic-gate out: 14527c478bd9Sstevel@tonic-gate kmem_free(symlink, strlen(symlink) + 1); 14537c478bd9Sstevel@tonic-gate pn_free(&newpn); 14547c478bd9Sstevel@tonic-gate pn_free(&oldpn); 14557c478bd9Sstevel@tonic-gate 14567c478bd9Sstevel@tonic-gate return (error); 14577c478bd9Sstevel@tonic-gate } 14587c478bd9Sstevel@tonic-gate 14597c478bd9Sstevel@tonic-gate /* 14607c478bd9Sstevel@tonic-gate * Get the root filehandle for the given filesystem and server, and update 14617c478bd9Sstevel@tonic-gate * svp. 14627c478bd9Sstevel@tonic-gate * 14637c478bd9Sstevel@tonic-gate * If NFS4_GETFH_NEEDSOP is set, then use nfs4_start_fop and nfs4_end_fop 14647c478bd9Sstevel@tonic-gate * to coordinate with recovery. 
/*
 * Get the root filehandle for the given filesystem and server, and update
 * svp.
 *
 * A single compound is built from svp->sv_path by nfs4lookup_setup():
 * PUTROOTFH (or PUTPUBFH when NFS4_GETFH_PUBLIC is set), GETFH, then a
 * LOOKUP/GETFH/GETATTR triple per path component.  If the server reports
 * NFS4ERR_SYMLINK for an intermediate component, or the final object is
 * a symlink (VLNK), the link is expanded into svp->sv_path with
 * resolve_sympath() and the compound is rebuilt and re-sent.
 *
 * If NFS4_GETFH_NEEDSOP is set, then use nfs4_start_fop and nfs4_end_fop
 * to coordinate with recovery.  Otherwise, the caller is assumed to be
 * the recovery thread or have already done a start_fop.
 *
 * On success:
 *   - *vtp is set to the vnode type from the final GETATTR,
 *   - mi->mi_fh_expire_type, the MI4_LINK/MI4_SYMLINK/MI4_ACL flags,
 *     mi_tsize, mi_stsize and mi_maxfilesize are updated from the
 *     returned attributes,
 *   - svp->sv_fhandle (the object), svp->sv_pfhandle (its parent),
 *     sv_fsid and sv_supp_attrs are filled in under sv_lock.
 *
 * Errors are returned by the nfs4_error_t parameter.
 */

static void
nfs4getfh_otw(struct mntinfo4 *mi, servinfo4_t *svp, vtype_t *vtp,
    int flags, cred_t *cr, nfs4_error_t *ep)
{
	COMPOUND4args_clnt args;
	COMPOUND4res_clnt res;
	int doqueue = 1;
	nfs_argop4 *argop;
	nfs_resop4 *resop;
	nfs4_ga_res_t *garp;
	int num_argops;
	lookup4_param_t lookuparg;
	nfs_fh4 *tmpfhp;
	nfs_fh4 *resfhp;
	bool_t needrecov = FALSE;
	nfs4_recov_state_t recov_state;
	int llndx;
	int nthcomp;
	/* "recovery" means the caller already coordinates with recovery. */
	int recovery = !(flags & NFS4_GETFH_NEEDSOP);

	/* An empty server path cannot be looked up. */
	(void) nfs_rw_enter_sig(&svp->sv_lock, RW_READER, 0);
	ASSERT(svp->sv_path != NULL);
	if (svp->sv_path[0] == '\0') {
		nfs_rw_exit(&svp->sv_lock);
		nfs4_error_init(ep, EINVAL);
		return;
	}
	nfs_rw_exit(&svp->sv_lock);

	recov_state.rs_flags = 0;
	recov_state.rs_num_retry_despite_err = 0;
	/*
	 * Re-entered after recovery was started for a failed call and
	 * after a symlink in the path has been expanded.
	 */
recov_retry:
	nfs4_error_zinit(ep);

	if (!recovery) {
		ep->error = nfs4_start_fop(mi, NULL, NULL, OH_MOUNT,
		    &recov_state, NULL);

		/*
		 * If recovery has been started and this request was
		 * initiated by a mount, then we must wait for recovery
		 * to finish before proceeding, otherwise, the error
		 * cleanup would remove data structures needed by the
		 * recovery thread.
		 */
		if (ep->error) {
			mutex_enter(&mi->mi_lock);
			if (mi->mi_flags & MI4_MOUNTING) {
				mi->mi_flags |= MI4_RECOV_FAIL;
				mi->mi_error = EIO;

				NFS4_DEBUG(nfs4_client_recov_debug, (CE_NOTE,
				    "nfs4getfh_otw: waiting 4 recovery\n"));

				while (mi->mi_flags & MI4_RECOV_ACTIV)
					cv_wait(&mi->mi_failover_cv,
					    &mi->mi_lock);
			}
			mutex_exit(&mi->mi_lock);
			return;
		}

		/*
		 * If the client does not specify a specific flavor to use
		 * and has not gotten a secinfo list from the server yet,
		 * retrieve the secinfo list from the server and use a
		 * flavor from the list to mount.
		 *
		 * If fail to get the secinfo list from the server, then
		 * try the default flavor.
		 */
		if ((svp->sv_flags & SV4_TRYSECDEFAULT) &&
		    svp->sv_secinfo == NULL) {
			(void) nfs4_secinfo_path(mi, cr, FALSE);
		}
	}

	if (recovery)
		args.ctag = TAG_REMAP_MOUNT;
	else
		args.ctag = TAG_MOUNT;

	lookuparg.l4_getattrs = LKP4_ALL_ATTRIBUTES;
	lookuparg.argsp = &args;
	lookuparg.resp = &res;
	lookuparg.header_len = 2;	/* Putrootfh, getfh */
	lookuparg.trailer_len = 0;
	lookuparg.ga_bits = FATTR4_FSINFO_MASK;
	lookuparg.mi = mi;

	/*
	 * Build the compound from the current server path.  The argop
	 * array set up here is released with nfs4args_lookup_free() and
	 * kmem_free() on every exit path below.
	 */
	(void) nfs_rw_enter_sig(&svp->sv_lock, RW_READER, 0);
	ASSERT(svp->sv_path != NULL);
	llndx = nfs4lookup_setup(svp->sv_path, &lookuparg, 0);
	nfs_rw_exit(&svp->sv_lock);

	argop = args.array;
	num_argops = args.array_len;

	/* choose public or root filehandle */
	if (flags & NFS4_GETFH_PUBLIC)
		argop[0].argop = OP_PUTPUBFH;
	else
		argop[0].argop = OP_PUTROOTFH;

	/* get fh */
	argop[1].argop = OP_GETFH;

	NFS4_DEBUG(nfs4_client_call_debug, (CE_NOTE,
	    "nfs4getfh_otw: %s call, mi 0x%p",
	    needrecov ? "recov" : "first", (void *)mi));

	rfs4call(mi, &args, &res, cr, &doqueue, RFSCALL_SOFT, ep);

	needrecov = nfs4_needs_recovery(ep, FALSE, mi->mi_vfsp);

	if (needrecov) {
		bool_t abort;

		/*
		 * The caller is handling recovery itself: just clean up
		 * and hand the error back.  The results are only freed
		 * when ep->error is clear.
		 */
		if (recovery) {
			nfs4args_lookup_free(argop, num_argops);
			kmem_free(argop,
			    lookuparg.arglen * sizeof (nfs_argop4));
			if (!ep->error)
				(void) xdr_free(xdr_COMPOUND4res_clnt,
				    (caddr_t)&res);
			return;
		}

		NFS4_DEBUG(nfs4_client_recov_debug,
		    (CE_NOTE, "nfs4getfh_otw: initiating recovery\n"));

		abort = nfs4_start_recovery(ep, mi, NULL,
		    NULL, NULL, NULL, OP_GETFH, NULL);
		if (!ep->error) {
			ep->error = geterrno4(res.status);
			(void) xdr_free(xdr_COMPOUND4res_clnt, (caddr_t)&res);
		}
		nfs4args_lookup_free(argop, num_argops);
		kmem_free(argop, lookuparg.arglen * sizeof (nfs_argop4));
		nfs4_end_fop(mi, NULL, NULL, OH_MOUNT, &recov_state, needrecov);
		/* have another go? */
		if (abort == FALSE)
			goto recov_retry;
		return;
	}

	/*
	 * No recovery, but check if error is set.
	 */
	if (ep->error) {
		nfs4args_lookup_free(argop, num_argops);
		kmem_free(argop, lookuparg.arglen * sizeof (nfs_argop4));
		if (!recovery)
			nfs4_end_fop(mi, NULL, NULL, OH_MOUNT, &recov_state,
			    needrecov);
		return;
	}

	/*
	 * NOTE(review): no goto in this function targets is_link_err;
	 * the label looks vestigial -- confirm before removing.
	 */
is_link_err:

	/* for non-recovery errors */
	if (res.status && res.status != NFS4ERR_SYMLINK) {
		if (!recovery) {
			nfs4_end_fop(mi, NULL, NULL, OH_MOUNT, &recov_state,
			    needrecov);
		}
		nfs4args_lookup_free(argop, num_argops);
		kmem_free(argop, lookuparg.arglen * sizeof (nfs_argop4));
		(void) xdr_free(xdr_COMPOUND4res_clnt, (caddr_t)&res);
		return;
	}

	/*
	 * If any intermediate component in the path is a symbolic link,
	 * resolve the symlink, then try mount again using the new path.
	 */
	if (res.status == NFS4ERR_SYMLINK) {
		int where;

		/*
		 * This must be from OP_LOOKUP failure.  The (cfh) for this
		 * OP_LOOKUP is a symlink node.  Find out where the
		 * OP_GETFH is for the (cfh) that is a symlink node.
		 *
		 * Example:
		 * (mount) PUTROOTFH, GETFH, LOOKUP comp1, GETFH, GETATTR,
		 * LOOKUP comp2, GETFH, GETATTR, LOOKUP comp3, GETFH, GETATTR
		 *
		 * LOOKUP comp3 fails with SYMLINK because comp2 is a symlink.
		 * In this case, where = 7, nthcomp = 2.
		 */
		where = res.array_len - 2;
		ASSERT(where > 0);

		resop = &res.array[where - 1];
		ASSERT(resop->resop == OP_GETFH);
		tmpfhp = &resop->nfs_resop4_u.opgetfh.object;
		nthcomp = res.array_len/3 - 1;

		/*
		 * Need to call nfs4_end_op before resolve_sympath to avoid
		 * potential nfs4_start_op deadlock.
		 */
		if (!recovery)
			nfs4_end_fop(mi, NULL, NULL, OH_MOUNT, &recov_state,
			    needrecov);

		/*
		 * tmpfhp points into res, so the results are only freed
		 * after resolve_sympath() has used the file handle.
		 */
		ep->error = resolve_sympath(mi, svp, nthcomp, tmpfhp, cr,
		    flags);

		nfs4args_lookup_free(argop, num_argops);
		kmem_free(argop, lookuparg.arglen * sizeof (nfs_argop4));
		(void) xdr_free(xdr_COMPOUND4res_clnt, (caddr_t)&res);

		if (ep->error)
			return;

		goto recov_retry;
	}

	/* getfh */
	resop = &res.array[res.array_len - 2];
	ASSERT(resop->resop == OP_GETFH);
	resfhp = &resop->nfs_resop4_u.opgetfh.object;

	/* getattr fsinfo res */
	resop++;
	garp = &resop->nfs_resop4_u.opgetattr.ga_res;

	*vtp = garp->n4g_va.va_type;

	mi->mi_fh_expire_type = garp->n4g_ext_res->n4g_fet;

	mutex_enter(&mi->mi_lock);
	if (garp->n4g_ext_res->n4g_pc4.pc4_link_support)
		mi->mi_flags |= MI4_LINK;
	if (garp->n4g_ext_res->n4g_pc4.pc4_symlink_support)
		mi->mi_flags |= MI4_SYMLINK;
	if (garp->n4g_ext_res->n4g_suppattrs & FATTR4_ACL_MASK)
		mi->mi_flags |= MI4_ACL;
	mutex_exit(&mi->mi_lock);

	/*
	 * Clamp the transfer sizes and maximum file size to what the
	 * server reported.  A reported maxread/maxwrite of 0 is replaced
	 * by MAXBSIZE; a reported maxfilesize of 0 leaves the current
	 * value alone.
	 */
	if (garp->n4g_ext_res->n4g_maxread == 0)
		mi->mi_tsize =
		    MIN(MAXBSIZE, mi->mi_tsize);
	else
		mi->mi_tsize =
		    MIN(garp->n4g_ext_res->n4g_maxread,
		    mi->mi_tsize);

	if (garp->n4g_ext_res->n4g_maxwrite == 0)
		mi->mi_stsize =
		    MIN(MAXBSIZE, mi->mi_stsize);
	else
		mi->mi_stsize =
		    MIN(garp->n4g_ext_res->n4g_maxwrite,
		    mi->mi_stsize);

	if (garp->n4g_ext_res->n4g_maxfilesize != 0)
		mi->mi_maxfilesize =
		    MIN(garp->n4g_ext_res->n4g_maxfilesize,
		    mi->mi_maxfilesize);

	/*
	 * If the final component is a symbolic link, resolve the symlink,
	 * then try mount again using the new path.
	 *
	 * Assume no symbolic link for root filesystem "/".
	 */
	if (*vtp == VLNK) {
		/*
		 * nthcomp is the total result length minus
		 * the 1st 2 OPs (PUTROOTFH, GETFH),
		 * then divided by 3 (LOOKUP,GETFH,GETATTR)
		 *
		 * e.g. PUTROOTFH GETFH LOOKUP 1st-comp GETFH GETATTR
		 *	LOOKUP 2nd-comp GETFH GETATTR
		 *
		 *	(8 - 2)/3 = 2
		 */
		nthcomp = (res.array_len - 2)/3;

		/*
		 * Need to call nfs4_end_op before resolve_sympath to avoid
		 * potential nfs4_start_op deadlock. See RFE 4777612.
		 */
		if (!recovery)
			nfs4_end_fop(mi, NULL, NULL, OH_MOUNT, &recov_state,
			    needrecov);

		/* resfhp points into res; free res only afterwards. */
		ep->error = resolve_sympath(mi, svp, nthcomp, resfhp, cr,
		    flags);

		nfs4args_lookup_free(argop, num_argops);
		kmem_free(argop, lookuparg.arglen * sizeof (nfs_argop4));
		(void) xdr_free(xdr_COMPOUND4res_clnt, (caddr_t)&res);

		if (ep->error)
			return;

		goto recov_retry;
	}

	/*
	 * We need to figure out where in the compound the getfh
	 * for the parent directory is.  If the object to be mounted is
	 * the root, then there is no lookup at all:
	 * PUTROOTFH, GETFH.
	 * If the object to be mounted is in the root, then the compound is:
	 * PUTROOTFH, GETFH, LOOKUP, GETFH, GETATTR.
	 * In either of these cases, the index of the GETFH is 1.
	 * If it is not at the root, then it's something like:
	 * PUTROOTFH, GETFH, LOOKUP, GETFH, GETATTR,
	 * LOOKUP, GETFH, GETATTR
	 * In this case, the index is llndx (last lookup index) - 2.
	 */
	if (llndx == -1 || llndx == 2)
		resop = &res.array[1];
	else {
		ASSERT(llndx > 2);
		resop = &res.array[llndx-2];
	}

	ASSERT(resop->resop == OP_GETFH);
	tmpfhp = &resop->nfs_resop4_u.opgetfh.object;

	/* save the filehandles for the replica */
	(void) nfs_rw_enter_sig(&svp->sv_lock, RW_WRITER, 0);
	ASSERT(tmpfhp->nfs_fh4_len <= NFS4_FHSIZE);
	svp->sv_pfhandle.fh_len = tmpfhp->nfs_fh4_len;
	bcopy(tmpfhp->nfs_fh4_val, svp->sv_pfhandle.fh_buf,
	    tmpfhp->nfs_fh4_len);
	ASSERT(resfhp->nfs_fh4_len <= NFS4_FHSIZE);
	svp->sv_fhandle.fh_len = resfhp->nfs_fh4_len;
	bcopy(resfhp->nfs_fh4_val, svp->sv_fhandle.fh_buf, resfhp->nfs_fh4_len);

	/* initialize fsid and supp_attrs for server fs */
	svp->sv_fsid = garp->n4g_fsid;
	svp->sv_supp_attrs =
	    garp->n4g_ext_res->n4g_suppattrs | FATTR4_MANDATTR_MASK;

	nfs_rw_exit(&svp->sv_lock);

	/* Success: release the compound and end the operation. */
	nfs4args_lookup_free(argop, num_argops);
	kmem_free(argop, lookuparg.arglen * sizeof (nfs_argop4));
	(void) xdr_free(xdr_COMPOUND4res_clnt, (caddr_t)&res);
	if (!recovery)
		nfs4_end_fop(mi, NULL, NULL, OH_MOUNT, &recov_state, needrecov);
}
nfs_rw_exit(&svp->sv_lock); 18127c478bd9Sstevel@tonic-gate 18137c478bd9Sstevel@tonic-gate nfs4args_lookup_free(argop, num_argops); 18147c478bd9Sstevel@tonic-gate kmem_free(argop, lookuparg.arglen * sizeof (nfs_argop4)); 18157c478bd9Sstevel@tonic-gate (void) xdr_free(xdr_COMPOUND4res_clnt, (caddr_t)&res); 18167c478bd9Sstevel@tonic-gate if (!recovery) 18177c478bd9Sstevel@tonic-gate nfs4_end_fop(mi, NULL, NULL, OH_MOUNT, &recov_state, needrecov); 18187c478bd9Sstevel@tonic-gate } 18197c478bd9Sstevel@tonic-gate 18207c478bd9Sstevel@tonic-gate static ushort_t nfs4_max_threads = 8; /* max number of active async threads */ 18217c478bd9Sstevel@tonic-gate static uint_t nfs4_bsize = 32 * 1024; /* client `block' size */ 18227c478bd9Sstevel@tonic-gate static uint_t nfs4_async_clusters = 1; /* # of reqs from each async queue */ 18237c478bd9Sstevel@tonic-gate static uint_t nfs4_cots_timeo = NFS_COTS_TIMEO; 18247c478bd9Sstevel@tonic-gate 18257c478bd9Sstevel@tonic-gate /* 18267c478bd9Sstevel@tonic-gate * Remap the root filehandle for the given filesystem. 18277c478bd9Sstevel@tonic-gate * 18287c478bd9Sstevel@tonic-gate * results returned via the nfs4_error_t parameter. 18297c478bd9Sstevel@tonic-gate */ 18307c478bd9Sstevel@tonic-gate void 18317c478bd9Sstevel@tonic-gate nfs4_remap_root(mntinfo4_t *mi, nfs4_error_t *ep, int flags) 18327c478bd9Sstevel@tonic-gate { 18337c478bd9Sstevel@tonic-gate struct servinfo4 *svp; 18347c478bd9Sstevel@tonic-gate vtype_t vtype; 18357c478bd9Sstevel@tonic-gate nfs_fh4 rootfh; 18367c478bd9Sstevel@tonic-gate int getfh_flags; 18377c478bd9Sstevel@tonic-gate char *orig_sv_path; 18387c478bd9Sstevel@tonic-gate int orig_sv_pathlen, num_retry; 18397c478bd9Sstevel@tonic-gate 18407c478bd9Sstevel@tonic-gate mutex_enter(&mi->mi_lock); 18418c9e5ad2Saalok 18428c9e5ad2Saalok remap_retry: 18437c478bd9Sstevel@tonic-gate svp = mi->mi_curr_serv; 18447c478bd9Sstevel@tonic-gate getfh_flags = 1845b9238976Sth (flags & NFS4_REMAP_NEEDSOP) ? 
NFS4_GETFH_NEEDSOP : 0; 18467c478bd9Sstevel@tonic-gate getfh_flags |= 1847b9238976Sth (mi->mi_flags & MI4_PUBLIC) ? NFS4_GETFH_PUBLIC : 0; 18487c478bd9Sstevel@tonic-gate mutex_exit(&mi->mi_lock); 18497c478bd9Sstevel@tonic-gate 18507c478bd9Sstevel@tonic-gate /* 18517c478bd9Sstevel@tonic-gate * Just in case server path being mounted contains 18527c478bd9Sstevel@tonic-gate * symlinks and fails w/STALE, save the initial sv_path 18537c478bd9Sstevel@tonic-gate * so we can redrive the initial mount compound with the 18547c478bd9Sstevel@tonic-gate * initial sv_path -- not a symlink-expanded version. 18557c478bd9Sstevel@tonic-gate * 18567c478bd9Sstevel@tonic-gate * This could only happen if a symlink was expanded 18577c478bd9Sstevel@tonic-gate * and the expanded mount compound failed stale. Because 18587c478bd9Sstevel@tonic-gate * it could be the case that the symlink was removed at 18597c478bd9Sstevel@tonic-gate * the server (and replaced with another symlink/dir, 18607c478bd9Sstevel@tonic-gate * we need to use the initial sv_path when attempting 18617c478bd9Sstevel@tonic-gate * to re-lookup everything and recover. 18627c478bd9Sstevel@tonic-gate */ 18637c478bd9Sstevel@tonic-gate (void) nfs_rw_enter_sig(&svp->sv_lock, RW_READER, 0); 18647c478bd9Sstevel@tonic-gate orig_sv_pathlen = svp->sv_pathlen; 18657c478bd9Sstevel@tonic-gate orig_sv_path = kmem_alloc(orig_sv_pathlen, KM_SLEEP); 18667c478bd9Sstevel@tonic-gate bcopy(svp->sv_path, orig_sv_path, orig_sv_pathlen); 18677c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 18687c478bd9Sstevel@tonic-gate 18697c478bd9Sstevel@tonic-gate num_retry = nfs4_max_mount_retry; 18707c478bd9Sstevel@tonic-gate 18717c478bd9Sstevel@tonic-gate do { 18727c478bd9Sstevel@tonic-gate /* 18737c478bd9Sstevel@tonic-gate * Get the root fh from the server. 
Retry nfs4_max_mount_retry 18747c478bd9Sstevel@tonic-gate * (2) times if it fails with STALE since the recovery 18757c478bd9Sstevel@tonic-gate * infrastructure doesn't do STALE recovery for components 18767c478bd9Sstevel@tonic-gate * of the server path to the object being mounted. 18777c478bd9Sstevel@tonic-gate */ 18787c478bd9Sstevel@tonic-gate nfs4getfh_otw(mi, svp, &vtype, getfh_flags, CRED(), ep); 18797c478bd9Sstevel@tonic-gate 18807c478bd9Sstevel@tonic-gate if (ep->error == 0 && ep->stat == NFS4_OK) 18817c478bd9Sstevel@tonic-gate break; 18827c478bd9Sstevel@tonic-gate 18837c478bd9Sstevel@tonic-gate /* 18847c478bd9Sstevel@tonic-gate * For some reason, the mount compound failed. Before 18857c478bd9Sstevel@tonic-gate * retrying, we need to restore the original sv_path 18867c478bd9Sstevel@tonic-gate * because it might have contained symlinks that were 18877c478bd9Sstevel@tonic-gate * expanded by nfsgetfh_otw before the failure occurred. 18887c478bd9Sstevel@tonic-gate * replace current sv_path with orig sv_path -- just in case 18897c478bd9Sstevel@tonic-gate * it changed due to embedded symlinks. 
18907c478bd9Sstevel@tonic-gate */ 18917c478bd9Sstevel@tonic-gate (void) nfs_rw_enter_sig(&svp->sv_lock, RW_READER, 0); 18927c478bd9Sstevel@tonic-gate if (orig_sv_pathlen != svp->sv_pathlen) { 18937c478bd9Sstevel@tonic-gate kmem_free(svp->sv_path, svp->sv_pathlen); 18947c478bd9Sstevel@tonic-gate svp->sv_path = kmem_alloc(orig_sv_pathlen, KM_SLEEP); 18957c478bd9Sstevel@tonic-gate svp->sv_pathlen = orig_sv_pathlen; 18967c478bd9Sstevel@tonic-gate } 18977c478bd9Sstevel@tonic-gate bcopy(orig_sv_path, svp->sv_path, orig_sv_pathlen); 18987c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 18997c478bd9Sstevel@tonic-gate 19007c478bd9Sstevel@tonic-gate } while (num_retry-- > 0); 19017c478bd9Sstevel@tonic-gate 19027c478bd9Sstevel@tonic-gate kmem_free(orig_sv_path, orig_sv_pathlen); 19037c478bd9Sstevel@tonic-gate 19047c478bd9Sstevel@tonic-gate if (ep->error != 0 || ep->stat != 0) { 19057c478bd9Sstevel@tonic-gate return; 19067c478bd9Sstevel@tonic-gate } 19077c478bd9Sstevel@tonic-gate 19087c478bd9Sstevel@tonic-gate if (vtype != VNON && vtype != mi->mi_type) { 19097c478bd9Sstevel@tonic-gate /* shouldn't happen */ 19107c478bd9Sstevel@tonic-gate zcmn_err(mi->mi_zone->zone_id, CE_WARN, 1911b9238976Sth "nfs4_remap_root: server root vnode type (%d) doesn't " 1912b9238976Sth "match mount info (%d)", vtype, mi->mi_type); 19137c478bd9Sstevel@tonic-gate } 19147c478bd9Sstevel@tonic-gate 19157c478bd9Sstevel@tonic-gate (void) nfs_rw_enter_sig(&svp->sv_lock, RW_READER, 0); 19167c478bd9Sstevel@tonic-gate rootfh.nfs_fh4_val = svp->sv_fhandle.fh_buf; 19177c478bd9Sstevel@tonic-gate rootfh.nfs_fh4_len = svp->sv_fhandle.fh_len; 19187c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 19197c478bd9Sstevel@tonic-gate sfh4_update(mi->mi_rootfh, &rootfh); 19207c478bd9Sstevel@tonic-gate 19217c478bd9Sstevel@tonic-gate /* 19228c9e5ad2Saalok * It's possible that recovery took place on the filesystem 19238c9e5ad2Saalok * and the server has been updated between the time we did 19248c9e5ad2Saalok * the 
nfs4getfh_otw and now. Re-drive the otw operation 19258c9e5ad2Saalok * to make sure we have a good fh. 19267c478bd9Sstevel@tonic-gate */ 19277c478bd9Sstevel@tonic-gate mutex_enter(&mi->mi_lock); 19288c9e5ad2Saalok if (mi->mi_curr_serv != svp) 19298c9e5ad2Saalok goto remap_retry; 19308c9e5ad2Saalok 19317c478bd9Sstevel@tonic-gate mutex_exit(&mi->mi_lock); 19327c478bd9Sstevel@tonic-gate } 19337c478bd9Sstevel@tonic-gate 19347c478bd9Sstevel@tonic-gate static int 19357c478bd9Sstevel@tonic-gate nfs4rootvp(vnode_t **rtvpp, vfs_t *vfsp, struct servinfo4 *svp_head, 1936b9238976Sth int flags, cred_t *cr, zone_t *zone) 19377c478bd9Sstevel@tonic-gate { 19387c478bd9Sstevel@tonic-gate vnode_t *rtvp = NULL; 19397c478bd9Sstevel@tonic-gate mntinfo4_t *mi; 19407c478bd9Sstevel@tonic-gate dev_t nfs_dev; 19417c478bd9Sstevel@tonic-gate int error = 0; 19427c478bd9Sstevel@tonic-gate rnode4_t *rp; 19437c478bd9Sstevel@tonic-gate int i; 19447c478bd9Sstevel@tonic-gate struct vattr va; 19457c478bd9Sstevel@tonic-gate vtype_t vtype = VNON; 19467c478bd9Sstevel@tonic-gate vtype_t tmp_vtype = VNON; 19477c478bd9Sstevel@tonic-gate struct servinfo4 *firstsvp = NULL, *svp = svp_head; 19487c478bd9Sstevel@tonic-gate nfs4_oo_hash_bucket_t *bucketp; 19497c478bd9Sstevel@tonic-gate nfs_fh4 fh; 19507c478bd9Sstevel@tonic-gate char *droptext = ""; 19517c478bd9Sstevel@tonic-gate struct nfs_stats *nfsstatsp; 19527c478bd9Sstevel@tonic-gate nfs4_fname_t *mfname; 19537c478bd9Sstevel@tonic-gate nfs4_error_t e; 19547c478bd9Sstevel@tonic-gate char *orig_sv_path; 195550a83466Sjwahlig int orig_sv_pathlen, num_retry, removed; 19567c478bd9Sstevel@tonic-gate cred_t *lcr = NULL, *tcr = cr; 19577c478bd9Sstevel@tonic-gate 1958108322fbScarlsonj nfsstatsp = zone_getspecific(nfsstat_zone_key, nfs_zone()); 19597c478bd9Sstevel@tonic-gate ASSERT(nfsstatsp != NULL); 19607c478bd9Sstevel@tonic-gate 1961108322fbScarlsonj ASSERT(nfs_zone() == zone); 19627c478bd9Sstevel@tonic-gate ASSERT(crgetref(cr)); 19637c478bd9Sstevel@tonic-gate 
19647c478bd9Sstevel@tonic-gate /* 19657c478bd9Sstevel@tonic-gate * Create a mount record and link it to the vfs struct. 19667c478bd9Sstevel@tonic-gate */ 19677c478bd9Sstevel@tonic-gate mi = kmem_zalloc(sizeof (*mi), KM_SLEEP); 19687c478bd9Sstevel@tonic-gate mutex_init(&mi->mi_lock, NULL, MUTEX_DEFAULT, NULL); 19697c478bd9Sstevel@tonic-gate nfs_rw_init(&mi->mi_recovlock, NULL, RW_DEFAULT, NULL); 19707c478bd9Sstevel@tonic-gate nfs_rw_init(&mi->mi_rename_lock, NULL, RW_DEFAULT, NULL); 19717c478bd9Sstevel@tonic-gate nfs_rw_init(&mi->mi_fh_lock, NULL, RW_DEFAULT, NULL); 19727c478bd9Sstevel@tonic-gate 19737c478bd9Sstevel@tonic-gate if (!(flags & NFSMNT_SOFT)) 19747c478bd9Sstevel@tonic-gate mi->mi_flags |= MI4_HARD; 19757c478bd9Sstevel@tonic-gate if ((flags & NFSMNT_NOPRINT)) 19767c478bd9Sstevel@tonic-gate mi->mi_flags |= MI4_NOPRINT; 19777c478bd9Sstevel@tonic-gate if (flags & NFSMNT_INT) 19787c478bd9Sstevel@tonic-gate mi->mi_flags |= MI4_INT; 19797c478bd9Sstevel@tonic-gate if (flags & NFSMNT_PUBLIC) 19807c478bd9Sstevel@tonic-gate mi->mi_flags |= MI4_PUBLIC; 1981b9238976Sth if (flags & NFSMNT_MIRRORMOUNT) 1982b9238976Sth mi->mi_flags |= MI4_MIRRORMOUNT; 19837c478bd9Sstevel@tonic-gate mi->mi_retrans = NFS_RETRIES; 19847c478bd9Sstevel@tonic-gate if (svp->sv_knconf->knc_semantics == NC_TPI_COTS_ORD || 19857c478bd9Sstevel@tonic-gate svp->sv_knconf->knc_semantics == NC_TPI_COTS) 19867c478bd9Sstevel@tonic-gate mi->mi_timeo = nfs4_cots_timeo; 19877c478bd9Sstevel@tonic-gate else 19887c478bd9Sstevel@tonic-gate mi->mi_timeo = NFS_TIMEO; 19897c478bd9Sstevel@tonic-gate mi->mi_prog = NFS_PROGRAM; 19907c478bd9Sstevel@tonic-gate mi->mi_vers = NFS_V4; 19917c478bd9Sstevel@tonic-gate mi->mi_rfsnames = rfsnames_v4; 19927c478bd9Sstevel@tonic-gate mi->mi_reqs = nfsstatsp->nfs_stats_v4.rfsreqcnt_ptr; 19937c478bd9Sstevel@tonic-gate cv_init(&mi->mi_failover_cv, NULL, CV_DEFAULT, NULL); 19947c478bd9Sstevel@tonic-gate mi->mi_servers = svp; 19957c478bd9Sstevel@tonic-gate mi->mi_curr_serv = svp; 
19967c478bd9Sstevel@tonic-gate mi->mi_acregmin = SEC2HR(ACREGMIN); 19977c478bd9Sstevel@tonic-gate mi->mi_acregmax = SEC2HR(ACREGMAX); 19987c478bd9Sstevel@tonic-gate mi->mi_acdirmin = SEC2HR(ACDIRMIN); 19997c478bd9Sstevel@tonic-gate mi->mi_acdirmax = SEC2HR(ACDIRMAX); 20007c478bd9Sstevel@tonic-gate mi->mi_fh_expire_type = FH4_PERSISTENT; 20017c478bd9Sstevel@tonic-gate mi->mi_clientid_next = NULL; 20027c478bd9Sstevel@tonic-gate mi->mi_clientid_prev = NULL; 20033b895386SPavel Filipensky mi->mi_srv = NULL; 20047c478bd9Sstevel@tonic-gate mi->mi_grace_wait = 0; 20057c478bd9Sstevel@tonic-gate mi->mi_error = 0; 20067c478bd9Sstevel@tonic-gate mi->mi_srvsettime = 0; 20073b895386SPavel Filipensky mi->mi_srvset_cnt = 0; 20087c478bd9Sstevel@tonic-gate 200950a83466Sjwahlig mi->mi_count = 1; 201050a83466Sjwahlig 20117c478bd9Sstevel@tonic-gate mi->mi_tsize = nfs4_tsize(svp->sv_knconf); 20127c478bd9Sstevel@tonic-gate mi->mi_stsize = mi->mi_tsize; 20137c478bd9Sstevel@tonic-gate 20147c478bd9Sstevel@tonic-gate if (flags & NFSMNT_DIRECTIO) 20157c478bd9Sstevel@tonic-gate mi->mi_flags |= MI4_DIRECTIO; 20167c478bd9Sstevel@tonic-gate 20177c478bd9Sstevel@tonic-gate mi->mi_flags |= MI4_MOUNTING; 20187c478bd9Sstevel@tonic-gate 20197c478bd9Sstevel@tonic-gate /* 20207c478bd9Sstevel@tonic-gate * Make a vfs struct for nfs. We do this here instead of below 20217c478bd9Sstevel@tonic-gate * because rtvp needs a vfs before we can do a getattr on it. 
20227c478bd9Sstevel@tonic-gate * 20237c478bd9Sstevel@tonic-gate * Assign a unique device id to the mount 20247c478bd9Sstevel@tonic-gate */ 20257c478bd9Sstevel@tonic-gate mutex_enter(&nfs_minor_lock); 20267c478bd9Sstevel@tonic-gate do { 20277c478bd9Sstevel@tonic-gate nfs_minor = (nfs_minor + 1) & MAXMIN32; 20287c478bd9Sstevel@tonic-gate nfs_dev = makedevice(nfs_major, nfs_minor); 20297c478bd9Sstevel@tonic-gate } while (vfs_devismounted(nfs_dev)); 20307c478bd9Sstevel@tonic-gate mutex_exit(&nfs_minor_lock); 20317c478bd9Sstevel@tonic-gate 20327c478bd9Sstevel@tonic-gate vfsp->vfs_dev = nfs_dev; 20337c478bd9Sstevel@tonic-gate vfs_make_fsid(&vfsp->vfs_fsid, nfs_dev, nfs4fstyp); 20347c478bd9Sstevel@tonic-gate vfsp->vfs_data = (caddr_t)mi; 20357c478bd9Sstevel@tonic-gate vfsp->vfs_fstype = nfsfstyp; 20367c478bd9Sstevel@tonic-gate vfsp->vfs_bsize = nfs4_bsize; 20377c478bd9Sstevel@tonic-gate 20387c478bd9Sstevel@tonic-gate /* 20397c478bd9Sstevel@tonic-gate * Initialize fields used to support async putpage operations. 
20407c478bd9Sstevel@tonic-gate */ 20417c478bd9Sstevel@tonic-gate for (i = 0; i < NFS4_ASYNC_TYPES; i++) 20427c478bd9Sstevel@tonic-gate mi->mi_async_clusters[i] = nfs4_async_clusters; 20437c478bd9Sstevel@tonic-gate mi->mi_async_init_clusters = nfs4_async_clusters; 20447c478bd9Sstevel@tonic-gate mi->mi_async_curr = &mi->mi_async_reqs[0]; 20457c478bd9Sstevel@tonic-gate mi->mi_max_threads = nfs4_max_threads; 20467c478bd9Sstevel@tonic-gate mutex_init(&mi->mi_async_lock, NULL, MUTEX_DEFAULT, NULL); 20477c478bd9Sstevel@tonic-gate cv_init(&mi->mi_async_reqs_cv, NULL, CV_DEFAULT, NULL); 20487c478bd9Sstevel@tonic-gate cv_init(&mi->mi_async_work_cv, NULL, CV_DEFAULT, NULL); 20497c478bd9Sstevel@tonic-gate cv_init(&mi->mi_async_cv, NULL, CV_DEFAULT, NULL); 20507c478bd9Sstevel@tonic-gate cv_init(&mi->mi_inact_req_cv, NULL, CV_DEFAULT, NULL); 20517c478bd9Sstevel@tonic-gate 20527c478bd9Sstevel@tonic-gate mi->mi_vfsp = vfsp; 20537c478bd9Sstevel@tonic-gate zone_hold(mi->mi_zone = zone); 20547c478bd9Sstevel@tonic-gate nfs4_mi_zonelist_add(mi); 20557c478bd9Sstevel@tonic-gate 20567c478bd9Sstevel@tonic-gate /* 20577c478bd9Sstevel@tonic-gate * Initialize the <open owner/cred> hash table. 20587c478bd9Sstevel@tonic-gate */ 20597c478bd9Sstevel@tonic-gate for (i = 0; i < NFS4_NUM_OO_BUCKETS; i++) { 20607c478bd9Sstevel@tonic-gate bucketp = &(mi->mi_oo_list[i]); 20617c478bd9Sstevel@tonic-gate mutex_init(&bucketp->b_lock, NULL, MUTEX_DEFAULT, NULL); 20627c478bd9Sstevel@tonic-gate list_create(&bucketp->b_oo_hash_list, 20637c478bd9Sstevel@tonic-gate sizeof (nfs4_open_owner_t), 20647c478bd9Sstevel@tonic-gate offsetof(nfs4_open_owner_t, oo_hash_node)); 20657c478bd9Sstevel@tonic-gate } 20667c478bd9Sstevel@tonic-gate 20677c478bd9Sstevel@tonic-gate /* 20687c478bd9Sstevel@tonic-gate * Initialize the freed open owner list. 
20697c478bd9Sstevel@tonic-gate */ 20707c478bd9Sstevel@tonic-gate mi->mi_foo_num = 0; 20717c478bd9Sstevel@tonic-gate mi->mi_foo_max = NFS4_NUM_FREED_OPEN_OWNERS; 20727c478bd9Sstevel@tonic-gate list_create(&mi->mi_foo_list, sizeof (nfs4_open_owner_t), 20737c478bd9Sstevel@tonic-gate offsetof(nfs4_open_owner_t, oo_foo_node)); 20747c478bd9Sstevel@tonic-gate 20757c478bd9Sstevel@tonic-gate list_create(&mi->mi_lost_state, sizeof (nfs4_lost_rqst_t), 20767c478bd9Sstevel@tonic-gate offsetof(nfs4_lost_rqst_t, lr_node)); 20777c478bd9Sstevel@tonic-gate 20787c478bd9Sstevel@tonic-gate list_create(&mi->mi_bseqid_list, sizeof (nfs4_bseqid_entry_t), 20797c478bd9Sstevel@tonic-gate offsetof(nfs4_bseqid_entry_t, bs_node)); 20807c478bd9Sstevel@tonic-gate 20817c478bd9Sstevel@tonic-gate /* 20827c478bd9Sstevel@tonic-gate * Initialize the msg buffer. 20837c478bd9Sstevel@tonic-gate */ 20847c478bd9Sstevel@tonic-gate list_create(&mi->mi_msg_list, sizeof (nfs4_debug_msg_t), 20857c478bd9Sstevel@tonic-gate offsetof(nfs4_debug_msg_t, msg_node)); 20867c478bd9Sstevel@tonic-gate mi->mi_msg_count = 0; 20877c478bd9Sstevel@tonic-gate mutex_init(&mi->mi_msg_list_lock, NULL, MUTEX_DEFAULT, NULL); 20887c478bd9Sstevel@tonic-gate 20897c478bd9Sstevel@tonic-gate /* 20907c478bd9Sstevel@tonic-gate * Initialize kstats 20917c478bd9Sstevel@tonic-gate */ 20927c478bd9Sstevel@tonic-gate nfs4_mnt_kstat_init(vfsp); 20937c478bd9Sstevel@tonic-gate 20947c478bd9Sstevel@tonic-gate /* 2095bbf2a467SNagakiran Rajashekar * Initialize the shared filehandle pool. 20967c478bd9Sstevel@tonic-gate */ 20977c478bd9Sstevel@tonic-gate sfh4_createtab(&mi->mi_filehandles); 20987c478bd9Sstevel@tonic-gate 20997c478bd9Sstevel@tonic-gate /* 21007c478bd9Sstevel@tonic-gate * Save server path we're attempting to mount. 
21017c478bd9Sstevel@tonic-gate */ 21027c478bd9Sstevel@tonic-gate (void) nfs_rw_enter_sig(&svp->sv_lock, RW_WRITER, 0); 21037c478bd9Sstevel@tonic-gate orig_sv_pathlen = svp_head->sv_pathlen; 21047c478bd9Sstevel@tonic-gate orig_sv_path = kmem_alloc(svp_head->sv_pathlen, KM_SLEEP); 21057c478bd9Sstevel@tonic-gate bcopy(svp_head->sv_path, orig_sv_path, svp_head->sv_pathlen); 21067c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 21077c478bd9Sstevel@tonic-gate 21087c478bd9Sstevel@tonic-gate /* 21097c478bd9Sstevel@tonic-gate * Make the GETFH call to get root fh for each replica. 21107c478bd9Sstevel@tonic-gate */ 21117c478bd9Sstevel@tonic-gate if (svp_head->sv_next) 21127c478bd9Sstevel@tonic-gate droptext = ", dropping replica"; 21137c478bd9Sstevel@tonic-gate 21147c478bd9Sstevel@tonic-gate /* 21157c478bd9Sstevel@tonic-gate * If the uid is set then set the creds for secure mounts 21167c478bd9Sstevel@tonic-gate * by proxy processes such as automountd. 21177c478bd9Sstevel@tonic-gate */ 21187c478bd9Sstevel@tonic-gate (void) nfs_rw_enter_sig(&svp->sv_lock, RW_READER, 0); 2119f722863dSSiyamaladevi Santhana Krishnan if (svp->sv_secdata->uid != 0 && 2120f722863dSSiyamaladevi Santhana Krishnan svp->sv_secdata->rpcflavor == RPCSEC_GSS) { 21217c478bd9Sstevel@tonic-gate lcr = crdup(cr); 21227c478bd9Sstevel@tonic-gate (void) crsetugid(lcr, svp->sv_secdata->uid, crgetgid(cr)); 21237c478bd9Sstevel@tonic-gate tcr = lcr; 21247c478bd9Sstevel@tonic-gate } 21257c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 21267c478bd9Sstevel@tonic-gate for (svp = svp_head; svp; svp = svp->sv_next) { 21277c478bd9Sstevel@tonic-gate if (nfs4_chkdup_servinfo4(svp_head, svp)) { 21287c478bd9Sstevel@tonic-gate nfs_cmn_err(error, CE_WARN, 2129b9238976Sth VERS_MSG "Host %s is a duplicate%s", 2130b9238976Sth svp->sv_hostname, droptext); 21317c478bd9Sstevel@tonic-gate (void) nfs_rw_enter_sig(&svp->sv_lock, RW_WRITER, 0); 21327c478bd9Sstevel@tonic-gate svp->sv_flags |= SV4_NOTINUSE; 
21337c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 21347c478bd9Sstevel@tonic-gate continue; 21357c478bd9Sstevel@tonic-gate } 21367c478bd9Sstevel@tonic-gate mi->mi_curr_serv = svp; 21377c478bd9Sstevel@tonic-gate 21387c478bd9Sstevel@tonic-gate /* 21397c478bd9Sstevel@tonic-gate * Just in case server path being mounted contains 21407c478bd9Sstevel@tonic-gate * symlinks and fails w/STALE, save the initial sv_path 21417c478bd9Sstevel@tonic-gate * so we can redrive the initial mount compound with the 21427c478bd9Sstevel@tonic-gate * initial sv_path -- not a symlink-expanded version. 21437c478bd9Sstevel@tonic-gate * 21447c478bd9Sstevel@tonic-gate * This could only happen if a symlink was expanded 21457c478bd9Sstevel@tonic-gate * and the expanded mount compound failed stale. Because 21467c478bd9Sstevel@tonic-gate * it could be the case that the symlink was removed at 21477c478bd9Sstevel@tonic-gate * the server (and replaced with another symlink/dir, 21487c478bd9Sstevel@tonic-gate * we need to use the initial sv_path when attempting 21497c478bd9Sstevel@tonic-gate * to re-lookup everything and recover. 21507c478bd9Sstevel@tonic-gate * 21517c478bd9Sstevel@tonic-gate * Other mount errors should evenutally be handled here also 21527c478bd9Sstevel@tonic-gate * (NFS4ERR_DELAY, NFS4ERR_RESOURCE). For now, all mount 21537c478bd9Sstevel@tonic-gate * failures will result in mount being redriven a few times. 21547c478bd9Sstevel@tonic-gate */ 21557c478bd9Sstevel@tonic-gate num_retry = nfs4_max_mount_retry; 21567c478bd9Sstevel@tonic-gate do { 21577c478bd9Sstevel@tonic-gate nfs4getfh_otw(mi, svp, &tmp_vtype, 21587c478bd9Sstevel@tonic-gate ((flags & NFSMNT_PUBLIC) ? 
NFS4_GETFH_PUBLIC : 0) | 21597c478bd9Sstevel@tonic-gate NFS4_GETFH_NEEDSOP, tcr, &e); 21607c478bd9Sstevel@tonic-gate 21617c478bd9Sstevel@tonic-gate if (e.error == 0 && e.stat == NFS4_OK) 21627c478bd9Sstevel@tonic-gate break; 21637c478bd9Sstevel@tonic-gate 21647c478bd9Sstevel@tonic-gate /* 21657c478bd9Sstevel@tonic-gate * replace current sv_path with orig sv_path -- just in 21667c478bd9Sstevel@tonic-gate * case it changed due to embedded symlinks. 21677c478bd9Sstevel@tonic-gate */ 21687c478bd9Sstevel@tonic-gate (void) nfs_rw_enter_sig(&svp->sv_lock, RW_READER, 0); 21697c478bd9Sstevel@tonic-gate if (orig_sv_pathlen != svp->sv_pathlen) { 21707c478bd9Sstevel@tonic-gate kmem_free(svp->sv_path, svp->sv_pathlen); 21717c478bd9Sstevel@tonic-gate svp->sv_path = kmem_alloc(orig_sv_pathlen, 2172b9238976Sth KM_SLEEP); 21737c478bd9Sstevel@tonic-gate svp->sv_pathlen = orig_sv_pathlen; 21747c478bd9Sstevel@tonic-gate } 21757c478bd9Sstevel@tonic-gate bcopy(orig_sv_path, svp->sv_path, orig_sv_pathlen); 21767c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 21777c478bd9Sstevel@tonic-gate 21787c478bd9Sstevel@tonic-gate } while (num_retry-- > 0); 21797c478bd9Sstevel@tonic-gate 21807c478bd9Sstevel@tonic-gate error = e.error ? 
e.error : geterrno4(e.stat); 21817c478bd9Sstevel@tonic-gate if (error) { 21827c478bd9Sstevel@tonic-gate nfs_cmn_err(error, CE_WARN, 2183b9238976Sth VERS_MSG "initial call to %s failed%s: %m", 2184b9238976Sth svp->sv_hostname, droptext); 21857c478bd9Sstevel@tonic-gate (void) nfs_rw_enter_sig(&svp->sv_lock, RW_WRITER, 0); 21867c478bd9Sstevel@tonic-gate svp->sv_flags |= SV4_NOTINUSE; 21877c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 21887c478bd9Sstevel@tonic-gate mi->mi_flags &= ~MI4_RECOV_FAIL; 21897c478bd9Sstevel@tonic-gate mi->mi_error = 0; 21907c478bd9Sstevel@tonic-gate continue; 21917c478bd9Sstevel@tonic-gate } 21927c478bd9Sstevel@tonic-gate 21937c478bd9Sstevel@tonic-gate if (tmp_vtype == VBAD) { 21947c478bd9Sstevel@tonic-gate zcmn_err(mi->mi_zone->zone_id, CE_WARN, 2195b9238976Sth VERS_MSG "%s returned a bad file type for " 2196b9238976Sth "root%s", svp->sv_hostname, droptext); 21977c478bd9Sstevel@tonic-gate (void) nfs_rw_enter_sig(&svp->sv_lock, RW_WRITER, 0); 21987c478bd9Sstevel@tonic-gate svp->sv_flags |= SV4_NOTINUSE; 21997c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 22007c478bd9Sstevel@tonic-gate continue; 22017c478bd9Sstevel@tonic-gate } 22027c478bd9Sstevel@tonic-gate 22037c478bd9Sstevel@tonic-gate if (vtype == VNON) { 22047c478bd9Sstevel@tonic-gate vtype = tmp_vtype; 22057c478bd9Sstevel@tonic-gate } else if (vtype != tmp_vtype) { 22067c478bd9Sstevel@tonic-gate zcmn_err(mi->mi_zone->zone_id, CE_WARN, 2207b9238976Sth VERS_MSG "%s returned a different file type " 2208b9238976Sth "for root%s", svp->sv_hostname, droptext); 22097c478bd9Sstevel@tonic-gate (void) nfs_rw_enter_sig(&svp->sv_lock, RW_WRITER, 0); 22107c478bd9Sstevel@tonic-gate svp->sv_flags |= SV4_NOTINUSE; 22117c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 22127c478bd9Sstevel@tonic-gate continue; 22137c478bd9Sstevel@tonic-gate } 22147c478bd9Sstevel@tonic-gate if (firstsvp == NULL) 22157c478bd9Sstevel@tonic-gate firstsvp = svp; 22167c478bd9Sstevel@tonic-gate } 
22177c478bd9Sstevel@tonic-gate 22187c478bd9Sstevel@tonic-gate kmem_free(orig_sv_path, orig_sv_pathlen); 22197c478bd9Sstevel@tonic-gate 22207c478bd9Sstevel@tonic-gate if (firstsvp == NULL) { 22217c478bd9Sstevel@tonic-gate if (error == 0) 22227c478bd9Sstevel@tonic-gate error = ENOENT; 22237c478bd9Sstevel@tonic-gate goto bad; 22247c478bd9Sstevel@tonic-gate } 22257c478bd9Sstevel@tonic-gate 22267c478bd9Sstevel@tonic-gate mi->mi_curr_serv = svp = firstsvp; 22277c478bd9Sstevel@tonic-gate (void) nfs_rw_enter_sig(&svp->sv_lock, RW_READER, 0); 22287c478bd9Sstevel@tonic-gate ASSERT((mi->mi_curr_serv->sv_flags & SV4_NOTINUSE) == 0); 22297c478bd9Sstevel@tonic-gate fh.nfs_fh4_len = svp->sv_fhandle.fh_len; 22307c478bd9Sstevel@tonic-gate fh.nfs_fh4_val = svp->sv_fhandle.fh_buf; 22317c478bd9Sstevel@tonic-gate mi->mi_rootfh = sfh4_get(&fh, mi); 22327c478bd9Sstevel@tonic-gate fh.nfs_fh4_len = svp->sv_pfhandle.fh_len; 22337c478bd9Sstevel@tonic-gate fh.nfs_fh4_val = svp->sv_pfhandle.fh_buf; 22347c478bd9Sstevel@tonic-gate mi->mi_srvparentfh = sfh4_get(&fh, mi); 22357c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 22367c478bd9Sstevel@tonic-gate 22377c478bd9Sstevel@tonic-gate /* 2238bbf2a467SNagakiran Rajashekar * Get the fname for filesystem root. 22397c478bd9Sstevel@tonic-gate */ 2240bbf2a467SNagakiran Rajashekar mi->mi_fname = fn_get(NULL, ".", mi->mi_rootfh); 22417c478bd9Sstevel@tonic-gate mfname = mi->mi_fname; 22427c478bd9Sstevel@tonic-gate fn_hold(mfname); 2243bbf2a467SNagakiran Rajashekar 2244bbf2a467SNagakiran Rajashekar /* 2245bbf2a467SNagakiran Rajashekar * Make the root vnode without attributes. 
2246bbf2a467SNagakiran Rajashekar */ 22477c478bd9Sstevel@tonic-gate rtvp = makenfs4node_by_fh(mi->mi_rootfh, NULL, 22487c478bd9Sstevel@tonic-gate &mfname, NULL, mi, cr, gethrtime()); 22497c478bd9Sstevel@tonic-gate rtvp->v_type = vtype; 22507c478bd9Sstevel@tonic-gate 22517c478bd9Sstevel@tonic-gate mi->mi_curread = mi->mi_tsize; 22527c478bd9Sstevel@tonic-gate mi->mi_curwrite = mi->mi_stsize; 22537c478bd9Sstevel@tonic-gate 22547c478bd9Sstevel@tonic-gate /* 22557c478bd9Sstevel@tonic-gate * Start the manager thread responsible for handling async worker 22567c478bd9Sstevel@tonic-gate * threads. 22577c478bd9Sstevel@tonic-gate */ 225850a83466Sjwahlig MI4_HOLD(mi); 22597c478bd9Sstevel@tonic-gate VFS_HOLD(vfsp); /* add reference for thread */ 22607c478bd9Sstevel@tonic-gate mi->mi_manager_thread = zthread_create(NULL, 0, nfs4_async_manager, 2261b9238976Sth vfsp, 0, minclsyspri); 22627c478bd9Sstevel@tonic-gate ASSERT(mi->mi_manager_thread != NULL); 226350a83466Sjwahlig 22647c478bd9Sstevel@tonic-gate /* 22657c478bd9Sstevel@tonic-gate * Create the thread that handles over-the-wire calls for 22667c478bd9Sstevel@tonic-gate * VOP_INACTIVE. 22677c478bd9Sstevel@tonic-gate * This needs to happen after the manager thread is created. 
22687c478bd9Sstevel@tonic-gate */ 226950a83466Sjwahlig MI4_HOLD(mi); 22707c478bd9Sstevel@tonic-gate mi->mi_inactive_thread = zthread_create(NULL, 0, nfs4_inactive_thread, 2271b9238976Sth mi, 0, minclsyspri); 22727c478bd9Sstevel@tonic-gate ASSERT(mi->mi_inactive_thread != NULL); 22737c478bd9Sstevel@tonic-gate 22747c478bd9Sstevel@tonic-gate /* If we didn't get a type, get one now */ 22757c478bd9Sstevel@tonic-gate if (rtvp->v_type == VNON) { 22767c478bd9Sstevel@tonic-gate va.va_mask = AT_TYPE; 22777c478bd9Sstevel@tonic-gate error = nfs4getattr(rtvp, &va, tcr); 22787c478bd9Sstevel@tonic-gate if (error) 22797c478bd9Sstevel@tonic-gate goto bad; 22807c478bd9Sstevel@tonic-gate rtvp->v_type = va.va_type; 22817c478bd9Sstevel@tonic-gate } 22827c478bd9Sstevel@tonic-gate 22837c478bd9Sstevel@tonic-gate mi->mi_type = rtvp->v_type; 22847c478bd9Sstevel@tonic-gate 22857c478bd9Sstevel@tonic-gate mutex_enter(&mi->mi_lock); 22867c478bd9Sstevel@tonic-gate mi->mi_flags &= ~MI4_MOUNTING; 22877c478bd9Sstevel@tonic-gate mutex_exit(&mi->mi_lock); 22887c478bd9Sstevel@tonic-gate 22897c478bd9Sstevel@tonic-gate *rtvpp = rtvp; 22907c478bd9Sstevel@tonic-gate if (lcr != NULL) 22917c478bd9Sstevel@tonic-gate crfree(lcr); 22927c478bd9Sstevel@tonic-gate 22937c478bd9Sstevel@tonic-gate return (0); 22947c478bd9Sstevel@tonic-gate bad: 22957c478bd9Sstevel@tonic-gate /* 22967c478bd9Sstevel@tonic-gate * An error occurred somewhere, need to clean up... 22977c478bd9Sstevel@tonic-gate */ 22987c478bd9Sstevel@tonic-gate if (lcr != NULL) 22997c478bd9Sstevel@tonic-gate crfree(lcr); 2300b9238976Sth 23017c478bd9Sstevel@tonic-gate if (rtvp != NULL) { 23027c478bd9Sstevel@tonic-gate /* 23037c478bd9Sstevel@tonic-gate * We need to release our reference to the root vnode and 23047c478bd9Sstevel@tonic-gate * destroy the mntinfo4 struct that we just created. 
23057c478bd9Sstevel@tonic-gate */ 23067c478bd9Sstevel@tonic-gate rp = VTOR4(rtvp); 23077c478bd9Sstevel@tonic-gate if (rp->r_flags & R4HASHED) 23087c478bd9Sstevel@tonic-gate rp4_rmhash(rp); 23097c478bd9Sstevel@tonic-gate VN_RELE(rtvp); 23107c478bd9Sstevel@tonic-gate } 23117c478bd9Sstevel@tonic-gate nfs4_async_stop(vfsp); 23127c478bd9Sstevel@tonic-gate nfs4_async_manager_stop(vfsp); 231350a83466Sjwahlig removed = nfs4_mi_zonelist_remove(mi); 231450a83466Sjwahlig if (removed) 231550a83466Sjwahlig zone_rele(mi->mi_zone); 231650a83466Sjwahlig 231750a83466Sjwahlig /* 231850a83466Sjwahlig * This releases the initial "hold" of the mi since it will never 231950a83466Sjwahlig * be referenced by the vfsp. Also, when mount returns to vfs.c 232050a83466Sjwahlig * with an error, the vfsp will be destroyed, not rele'd. 232150a83466Sjwahlig */ 232250a83466Sjwahlig MI4_RELE(mi); 232350a83466Sjwahlig 23247c478bd9Sstevel@tonic-gate *rtvpp = NULL; 23257c478bd9Sstevel@tonic-gate return (error); 23267c478bd9Sstevel@tonic-gate } 23277c478bd9Sstevel@tonic-gate 23287c478bd9Sstevel@tonic-gate /* 23297c478bd9Sstevel@tonic-gate * vfs operations 23307c478bd9Sstevel@tonic-gate */ 23317c478bd9Sstevel@tonic-gate static int 23327c478bd9Sstevel@tonic-gate nfs4_unmount(vfs_t *vfsp, int flag, cred_t *cr) 23337c478bd9Sstevel@tonic-gate { 2334b9238976Sth mntinfo4_t *mi; 2335b9238976Sth ushort_t omax; 2336b9238976Sth int removed; 2337b9238976Sth 2338d3a14591SThomas Haynes bool_t must_unlock; 2339d708af74SThomas Haynes bool_t must_rele; 2340b9238976Sth 2341b9238976Sth nfs4_ephemeral_tree_t *eph_tree; 23427c478bd9Sstevel@tonic-gate 23437c478bd9Sstevel@tonic-gate if (secpolicy_fs_unmount(cr, vfsp) != 0) 23447c478bd9Sstevel@tonic-gate return (EPERM); 23457c478bd9Sstevel@tonic-gate 23467c478bd9Sstevel@tonic-gate mi = VFTOMI4(vfsp); 23477c478bd9Sstevel@tonic-gate 23487c478bd9Sstevel@tonic-gate if (flag & MS_FORCE) { 23497c478bd9Sstevel@tonic-gate vfsp->vfs_flag |= VFS_UNMOUNTED; 2350108322fbScarlsonj if 
(nfs_zone() != mi->mi_zone) { 23517c478bd9Sstevel@tonic-gate /* 23527c478bd9Sstevel@tonic-gate * If the request is coming from the wrong zone, 23537c478bd9Sstevel@tonic-gate * we don't want to create any new threads, and 23547c478bd9Sstevel@tonic-gate * performance is not a concern. Do everything 23557c478bd9Sstevel@tonic-gate * inline. 23567c478bd9Sstevel@tonic-gate */ 23577c478bd9Sstevel@tonic-gate NFS4_DEBUG(nfs4_client_zone_debug, (CE_NOTE, 23587c478bd9Sstevel@tonic-gate "nfs4_unmount x-zone forced unmount of vfs %p\n", 23597c478bd9Sstevel@tonic-gate (void *)vfsp)); 2360b9238976Sth nfs4_free_mount(vfsp, flag, cr); 23617c478bd9Sstevel@tonic-gate } else { 23627c478bd9Sstevel@tonic-gate /* 23637c478bd9Sstevel@tonic-gate * Free data structures asynchronously, to avoid 23647c478bd9Sstevel@tonic-gate * blocking the current thread (for performance 23657c478bd9Sstevel@tonic-gate * reasons only). 23667c478bd9Sstevel@tonic-gate */ 2367b9238976Sth async_free_mount(vfsp, flag, cr); 23687c478bd9Sstevel@tonic-gate } 2369b9238976Sth 23707c478bd9Sstevel@tonic-gate return (0); 23717c478bd9Sstevel@tonic-gate } 2372b9238976Sth 23737c478bd9Sstevel@tonic-gate /* 23747c478bd9Sstevel@tonic-gate * Wait until all asynchronous putpage operations on 23757c478bd9Sstevel@tonic-gate * this file system are complete before flushing rnodes 23767c478bd9Sstevel@tonic-gate * from the cache. 23777c478bd9Sstevel@tonic-gate */ 23787c478bd9Sstevel@tonic-gate omax = mi->mi_max_threads; 2379b9238976Sth if (nfs4_async_stop_sig(vfsp)) 23807c478bd9Sstevel@tonic-gate return (EINTR); 2381b9238976Sth 23827c478bd9Sstevel@tonic-gate r4flush(vfsp, cr); 2383b9238976Sth 2384eabd0450Sth /* 2385eabd0450Sth * About the only reason that this would fail would be 2386eabd0450Sth * that the harvester is already busy tearing down this 2387eabd0450Sth * node. So we fail back to the caller and let them try 2388eabd0450Sth * again when needed. 
2389eabd0450Sth */ 2390eabd0450Sth if (nfs4_ephemeral_umount(mi, flag, cr, 2391d708af74SThomas Haynes &must_unlock, &must_rele, &eph_tree)) { 2392d3a14591SThomas Haynes ASSERT(must_unlock == FALSE); 2393eabd0450Sth mutex_enter(&mi->mi_async_lock); 2394eabd0450Sth mi->mi_max_threads = omax; 2395eabd0450Sth mutex_exit(&mi->mi_async_lock); 2396eabd0450Sth 2397eabd0450Sth return (EBUSY); 2398eabd0450Sth } 2399b9238976Sth 24007c478bd9Sstevel@tonic-gate /* 24017c478bd9Sstevel@tonic-gate * If there are any active vnodes on this file system, 2402b9238976Sth * then the file system is busy and can't be unmounted. 24037c478bd9Sstevel@tonic-gate */ 24047c478bd9Sstevel@tonic-gate if (check_rtable4(vfsp)) { 2405d708af74SThomas Haynes nfs4_ephemeral_umount_unlock(&must_unlock, &must_rele, 2406d708af74SThomas Haynes &eph_tree); 2407b9238976Sth 24087c478bd9Sstevel@tonic-gate mutex_enter(&mi->mi_async_lock); 24097c478bd9Sstevel@tonic-gate mi->mi_max_threads = omax; 24107c478bd9Sstevel@tonic-gate mutex_exit(&mi->mi_async_lock); 2411b9238976Sth 24127c478bd9Sstevel@tonic-gate return (EBUSY); 24137c478bd9Sstevel@tonic-gate } 2414b9238976Sth 2415b9238976Sth /* 2416b9238976Sth * The unmount can't fail from now on, so record any 2417b9238976Sth * ephemeral changes. 2418b9238976Sth */ 2419d708af74SThomas Haynes nfs4_ephemeral_umount_activate(mi, &must_unlock, 2420d708af74SThomas Haynes &must_rele, &eph_tree); 2421b9238976Sth 24227c478bd9Sstevel@tonic-gate /* 2423b9238976Sth * There are no active files that could require over-the-wire 2424b9238976Sth * calls to the server, so stop the async manager and the 2425b9238976Sth * inactive thread. 
24267c478bd9Sstevel@tonic-gate */ 24277c478bd9Sstevel@tonic-gate nfs4_async_manager_stop(vfsp); 2428b9238976Sth 24297c478bd9Sstevel@tonic-gate /* 24307c478bd9Sstevel@tonic-gate * Destroy all rnodes belonging to this file system from the 24317c478bd9Sstevel@tonic-gate * rnode hash queues and purge any resources allocated to 24327c478bd9Sstevel@tonic-gate * them. 24337c478bd9Sstevel@tonic-gate */ 24347c478bd9Sstevel@tonic-gate destroy_rtable4(vfsp, cr); 24357c478bd9Sstevel@tonic-gate vfsp->vfs_flag |= VFS_UNMOUNTED; 243650a83466Sjwahlig 24377c478bd9Sstevel@tonic-gate nfs4_remove_mi_from_server(mi, NULL); 243850a83466Sjwahlig removed = nfs4_mi_zonelist_remove(mi); 243950a83466Sjwahlig if (removed) 244050a83466Sjwahlig zone_rele(mi->mi_zone); 244150a83466Sjwahlig 24427c478bd9Sstevel@tonic-gate return (0); 24437c478bd9Sstevel@tonic-gate } 24447c478bd9Sstevel@tonic-gate 24457c478bd9Sstevel@tonic-gate /* 24467c478bd9Sstevel@tonic-gate * find root of nfs 24477c478bd9Sstevel@tonic-gate */ 24487c478bd9Sstevel@tonic-gate static int 24497c478bd9Sstevel@tonic-gate nfs4_root(vfs_t *vfsp, vnode_t **vpp) 24507c478bd9Sstevel@tonic-gate { 24517c478bd9Sstevel@tonic-gate mntinfo4_t *mi; 24527c478bd9Sstevel@tonic-gate vnode_t *vp; 24537c478bd9Sstevel@tonic-gate nfs4_fname_t *mfname; 24547c478bd9Sstevel@tonic-gate servinfo4_t *svp; 24557c478bd9Sstevel@tonic-gate 24567c478bd9Sstevel@tonic-gate mi = VFTOMI4(vfsp); 24577c478bd9Sstevel@tonic-gate 2458108322fbScarlsonj if (nfs_zone() != mi->mi_zone) 24597c478bd9Sstevel@tonic-gate return (EPERM); 24607c478bd9Sstevel@tonic-gate 24617c478bd9Sstevel@tonic-gate svp = mi->mi_curr_serv; 24627c478bd9Sstevel@tonic-gate if (svp) { 24637c478bd9Sstevel@tonic-gate (void) nfs_rw_enter_sig(&svp->sv_lock, RW_READER, 0); 24647c478bd9Sstevel@tonic-gate if (svp->sv_flags & SV4_ROOT_STALE) { 24657c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 24667c478bd9Sstevel@tonic-gate 24677c478bd9Sstevel@tonic-gate (void) nfs_rw_enter_sig(&svp->sv_lock, RW_WRITER, 
0); 24687c478bd9Sstevel@tonic-gate if (svp->sv_flags & SV4_ROOT_STALE) { 24697c478bd9Sstevel@tonic-gate svp->sv_flags &= ~SV4_ROOT_STALE; 24707c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 24717c478bd9Sstevel@tonic-gate return (ENOENT); 24727c478bd9Sstevel@tonic-gate } 24737c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 24747c478bd9Sstevel@tonic-gate } else 24757c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 24767c478bd9Sstevel@tonic-gate } 24777c478bd9Sstevel@tonic-gate 24787c478bd9Sstevel@tonic-gate mfname = mi->mi_fname; 24797c478bd9Sstevel@tonic-gate fn_hold(mfname); 24807c478bd9Sstevel@tonic-gate vp = makenfs4node_by_fh(mi->mi_rootfh, NULL, &mfname, NULL, 24817c478bd9Sstevel@tonic-gate VFTOMI4(vfsp), CRED(), gethrtime()); 24827c478bd9Sstevel@tonic-gate 24837c478bd9Sstevel@tonic-gate if (VTOR4(vp)->r_flags & R4STALE) { 24847c478bd9Sstevel@tonic-gate VN_RELE(vp); 24857c478bd9Sstevel@tonic-gate return (ENOENT); 24867c478bd9Sstevel@tonic-gate } 24877c478bd9Sstevel@tonic-gate 24887c478bd9Sstevel@tonic-gate ASSERT(vp->v_type == VNON || vp->v_type == mi->mi_type); 24897c478bd9Sstevel@tonic-gate 24907c478bd9Sstevel@tonic-gate vp->v_type = mi->mi_type; 24917c478bd9Sstevel@tonic-gate 24927c478bd9Sstevel@tonic-gate *vpp = vp; 24937c478bd9Sstevel@tonic-gate 24947c478bd9Sstevel@tonic-gate return (0); 24957c478bd9Sstevel@tonic-gate } 24967c478bd9Sstevel@tonic-gate 24977c478bd9Sstevel@tonic-gate static int 24987c478bd9Sstevel@tonic-gate nfs4_statfs_otw(vnode_t *vp, struct statvfs64 *sbp, cred_t *cr) 24997c478bd9Sstevel@tonic-gate { 25007c478bd9Sstevel@tonic-gate int error; 25017c478bd9Sstevel@tonic-gate nfs4_ga_res_t gar; 25027c478bd9Sstevel@tonic-gate nfs4_ga_ext_res_t ger; 25037c478bd9Sstevel@tonic-gate 25047c478bd9Sstevel@tonic-gate gar.n4g_ext_res = &ger; 25057c478bd9Sstevel@tonic-gate 25067c478bd9Sstevel@tonic-gate if (error = nfs4_attr_otw(vp, TAG_FSINFO, &gar, 25077c478bd9Sstevel@tonic-gate NFS4_STATFS_ATTR_MASK, cr)) 
25087c478bd9Sstevel@tonic-gate return (error); 25097c478bd9Sstevel@tonic-gate 25107c478bd9Sstevel@tonic-gate *sbp = gar.n4g_ext_res->n4g_sb; 25117c478bd9Sstevel@tonic-gate 25127c478bd9Sstevel@tonic-gate return (0); 25137c478bd9Sstevel@tonic-gate } 25147c478bd9Sstevel@tonic-gate 25157c478bd9Sstevel@tonic-gate /* 25167c478bd9Sstevel@tonic-gate * Get file system statistics. 25177c478bd9Sstevel@tonic-gate */ 25187c478bd9Sstevel@tonic-gate static int 25197c478bd9Sstevel@tonic-gate nfs4_statvfs(vfs_t *vfsp, struct statvfs64 *sbp) 25207c478bd9Sstevel@tonic-gate { 25217c478bd9Sstevel@tonic-gate int error; 25227c478bd9Sstevel@tonic-gate vnode_t *vp; 25237c478bd9Sstevel@tonic-gate cred_t *cr; 25247c478bd9Sstevel@tonic-gate 25257c478bd9Sstevel@tonic-gate error = nfs4_root(vfsp, &vp); 25267c478bd9Sstevel@tonic-gate if (error) 25277c478bd9Sstevel@tonic-gate return (error); 25287c478bd9Sstevel@tonic-gate 25297c478bd9Sstevel@tonic-gate cr = CRED(); 25307c478bd9Sstevel@tonic-gate 25317c478bd9Sstevel@tonic-gate error = nfs4_statfs_otw(vp, sbp, cr); 25327c478bd9Sstevel@tonic-gate if (!error) { 25337c478bd9Sstevel@tonic-gate (void) strncpy(sbp->f_basetype, 2534b9238976Sth vfssw[vfsp->vfs_fstype].vsw_name, FSTYPSZ); 25357c478bd9Sstevel@tonic-gate sbp->f_flag = vf_to_stf(vfsp->vfs_flag); 25367c478bd9Sstevel@tonic-gate } else { 25377c478bd9Sstevel@tonic-gate nfs4_purge_stale_fh(error, vp, cr); 25387c478bd9Sstevel@tonic-gate } 25397c478bd9Sstevel@tonic-gate 25407c478bd9Sstevel@tonic-gate VN_RELE(vp); 25417c478bd9Sstevel@tonic-gate 25427c478bd9Sstevel@tonic-gate return (error); 25437c478bd9Sstevel@tonic-gate } 25447c478bd9Sstevel@tonic-gate 25457c478bd9Sstevel@tonic-gate static kmutex_t nfs4_syncbusy; 25467c478bd9Sstevel@tonic-gate 25477c478bd9Sstevel@tonic-gate /* 25487c478bd9Sstevel@tonic-gate * Flush dirty nfs files for file system vfsp. 25497c478bd9Sstevel@tonic-gate * If vfsp == NULL, all nfs files are flushed. 
25507c478bd9Sstevel@tonic-gate * 25517c478bd9Sstevel@tonic-gate * SYNC_CLOSE in flag is passed to us to 25527c478bd9Sstevel@tonic-gate * indicate that we are shutting down and or 25537c478bd9Sstevel@tonic-gate * rebooting. 25547c478bd9Sstevel@tonic-gate */ 25557c478bd9Sstevel@tonic-gate static int 25567c478bd9Sstevel@tonic-gate nfs4_sync(vfs_t *vfsp, short flag, cred_t *cr) 25577c478bd9Sstevel@tonic-gate { 25587c478bd9Sstevel@tonic-gate /* 25597c478bd9Sstevel@tonic-gate * Cross-zone calls are OK here, since this translates to a 25607c478bd9Sstevel@tonic-gate * VOP_PUTPAGE(B_ASYNC), which gets picked up by the right zone. 25617c478bd9Sstevel@tonic-gate */ 25627c478bd9Sstevel@tonic-gate if (!(flag & SYNC_ATTR) && mutex_tryenter(&nfs4_syncbusy) != 0) { 25637c478bd9Sstevel@tonic-gate r4flush(vfsp, cr); 25647c478bd9Sstevel@tonic-gate mutex_exit(&nfs4_syncbusy); 25657c478bd9Sstevel@tonic-gate } 25667c478bd9Sstevel@tonic-gate 25677c478bd9Sstevel@tonic-gate /* 25687c478bd9Sstevel@tonic-gate * if SYNC_CLOSE is set then we know that 25697c478bd9Sstevel@tonic-gate * the system is rebooting, mark the mntinfo 25707c478bd9Sstevel@tonic-gate * for later examination. 
25717c478bd9Sstevel@tonic-gate */ 25727c478bd9Sstevel@tonic-gate if (vfsp && (flag & SYNC_CLOSE)) { 25737c478bd9Sstevel@tonic-gate mntinfo4_t *mi; 25747c478bd9Sstevel@tonic-gate 25757c478bd9Sstevel@tonic-gate mi = VFTOMI4(vfsp); 25767c478bd9Sstevel@tonic-gate if (!(mi->mi_flags & MI4_SHUTDOWN)) { 25777c478bd9Sstevel@tonic-gate mutex_enter(&mi->mi_lock); 25787c478bd9Sstevel@tonic-gate mi->mi_flags |= MI4_SHUTDOWN; 25797c478bd9Sstevel@tonic-gate mutex_exit(&mi->mi_lock); 25807c478bd9Sstevel@tonic-gate } 25817c478bd9Sstevel@tonic-gate } 25827c478bd9Sstevel@tonic-gate return (0); 25837c478bd9Sstevel@tonic-gate } 25847c478bd9Sstevel@tonic-gate 25857c478bd9Sstevel@tonic-gate /* 25867c478bd9Sstevel@tonic-gate * vget is difficult, if not impossible, to support in v4 because we don't 25877c478bd9Sstevel@tonic-gate * know the parent directory or name, which makes it impossible to create a 25887c478bd9Sstevel@tonic-gate * useful shadow vnode. And we need the shadow vnode for things like 25897c478bd9Sstevel@tonic-gate * OPEN. 25907c478bd9Sstevel@tonic-gate */ 25917c478bd9Sstevel@tonic-gate 25927c478bd9Sstevel@tonic-gate /* ARGSUSED */ 25937c478bd9Sstevel@tonic-gate /* 25947c478bd9Sstevel@tonic-gate * XXX Check nfs4_vget_pseudo() for dependency. 25957c478bd9Sstevel@tonic-gate */ 25967c478bd9Sstevel@tonic-gate static int 25977c478bd9Sstevel@tonic-gate nfs4_vget(vfs_t *vfsp, vnode_t **vpp, fid_t *fidp) 25987c478bd9Sstevel@tonic-gate { 25997c478bd9Sstevel@tonic-gate return (EREMOTE); 26007c478bd9Sstevel@tonic-gate } 26017c478bd9Sstevel@tonic-gate 26027c478bd9Sstevel@tonic-gate /* 26037c478bd9Sstevel@tonic-gate * nfs4_mountroot get called in the case where we are diskless booting. All 26047c478bd9Sstevel@tonic-gate * we need from here is the ability to get the server info and from there we 26057c478bd9Sstevel@tonic-gate * can simply call nfs4_rootvp. 
26067c478bd9Sstevel@tonic-gate */ 26077c478bd9Sstevel@tonic-gate /* ARGSUSED */ 26087c478bd9Sstevel@tonic-gate static int 26097c478bd9Sstevel@tonic-gate nfs4_mountroot(vfs_t *vfsp, whymountroot_t why) 26107c478bd9Sstevel@tonic-gate { 26117c478bd9Sstevel@tonic-gate vnode_t *rtvp; 26127c478bd9Sstevel@tonic-gate char root_hostname[SYS_NMLN+1]; 26137c478bd9Sstevel@tonic-gate struct servinfo4 *svp; 26147c478bd9Sstevel@tonic-gate int error; 26157c478bd9Sstevel@tonic-gate int vfsflags; 26167c478bd9Sstevel@tonic-gate size_t size; 26177c478bd9Sstevel@tonic-gate char *root_path; 26187c478bd9Sstevel@tonic-gate struct pathname pn; 26197c478bd9Sstevel@tonic-gate char *name; 26207c478bd9Sstevel@tonic-gate cred_t *cr; 26217c478bd9Sstevel@tonic-gate mntinfo4_t *mi; 26227c478bd9Sstevel@tonic-gate struct nfs_args args; /* nfs mount arguments */ 26237c478bd9Sstevel@tonic-gate static char token[10]; 26247c478bd9Sstevel@tonic-gate nfs4_error_t n4e; 26257c478bd9Sstevel@tonic-gate 26267c478bd9Sstevel@tonic-gate bzero(&args, sizeof (args)); 26277c478bd9Sstevel@tonic-gate 26287c478bd9Sstevel@tonic-gate /* do this BEFORE getfile which causes xid stamps to be initialized */ 26297c478bd9Sstevel@tonic-gate clkset(-1L); /* hack for now - until we get time svc? */ 26307c478bd9Sstevel@tonic-gate 26317c478bd9Sstevel@tonic-gate if (why == ROOT_REMOUNT) { 26327c478bd9Sstevel@tonic-gate /* 26337c478bd9Sstevel@tonic-gate * Shouldn't happen. 26347c478bd9Sstevel@tonic-gate */ 26357c478bd9Sstevel@tonic-gate panic("nfs4_mountroot: why == ROOT_REMOUNT"); 26367c478bd9Sstevel@tonic-gate } 26377c478bd9Sstevel@tonic-gate 26387c478bd9Sstevel@tonic-gate if (why == ROOT_UNMOUNT) { 26397c478bd9Sstevel@tonic-gate /* 26407c478bd9Sstevel@tonic-gate * Nothing to do for NFS. 
26417c478bd9Sstevel@tonic-gate */ 26427c478bd9Sstevel@tonic-gate return (0); 26437c478bd9Sstevel@tonic-gate } 26447c478bd9Sstevel@tonic-gate 26457c478bd9Sstevel@tonic-gate /* 26467c478bd9Sstevel@tonic-gate * why == ROOT_INIT 26477c478bd9Sstevel@tonic-gate */ 26487c478bd9Sstevel@tonic-gate 26497c478bd9Sstevel@tonic-gate name = token; 26507c478bd9Sstevel@tonic-gate *name = 0; 26517c478bd9Sstevel@tonic-gate (void) getfsname("root", name, sizeof (token)); 26527c478bd9Sstevel@tonic-gate 26537c478bd9Sstevel@tonic-gate pn_alloc(&pn); 26547c478bd9Sstevel@tonic-gate root_path = pn.pn_path; 26557c478bd9Sstevel@tonic-gate 26567c478bd9Sstevel@tonic-gate svp = kmem_zalloc(sizeof (*svp), KM_SLEEP); 26577c478bd9Sstevel@tonic-gate nfs_rw_init(&svp->sv_lock, NULL, RW_DEFAULT, NULL); 26587c478bd9Sstevel@tonic-gate svp->sv_knconf = kmem_zalloc(sizeof (*svp->sv_knconf), KM_SLEEP); 26597c478bd9Sstevel@tonic-gate svp->sv_knconf->knc_protofmly = kmem_alloc(KNC_STRSIZE, KM_SLEEP); 26607c478bd9Sstevel@tonic-gate svp->sv_knconf->knc_proto = kmem_alloc(KNC_STRSIZE, KM_SLEEP); 26617c478bd9Sstevel@tonic-gate 26627c478bd9Sstevel@tonic-gate /* 26637c478bd9Sstevel@tonic-gate * Get server address 26647c478bd9Sstevel@tonic-gate * Get the root path 26657c478bd9Sstevel@tonic-gate * Get server's transport 26667c478bd9Sstevel@tonic-gate * Get server's hostname 26677c478bd9Sstevel@tonic-gate * Get options 26687c478bd9Sstevel@tonic-gate */ 26697c478bd9Sstevel@tonic-gate args.addr = &svp->sv_addr; 26707c478bd9Sstevel@tonic-gate (void) nfs_rw_enter_sig(&svp->sv_lock, RW_READER, 0); 26717c478bd9Sstevel@tonic-gate args.fh = (char *)&svp->sv_fhandle; 26727c478bd9Sstevel@tonic-gate args.knconf = svp->sv_knconf; 26737c478bd9Sstevel@tonic-gate args.hostname = root_hostname; 26747c478bd9Sstevel@tonic-gate vfsflags = 0; 26757c478bd9Sstevel@tonic-gate if (error = mount_root(*name ? 
name : "root", root_path, NFS_V4, 26767c478bd9Sstevel@tonic-gate &args, &vfsflags)) { 26777c478bd9Sstevel@tonic-gate if (error == EPROTONOSUPPORT) 26787c478bd9Sstevel@tonic-gate nfs_cmn_err(error, CE_WARN, "nfs4_mountroot: " 26797c478bd9Sstevel@tonic-gate "mount_root failed: server doesn't support NFS V4"); 26807c478bd9Sstevel@tonic-gate else 26817c478bd9Sstevel@tonic-gate nfs_cmn_err(error, CE_WARN, 26827c478bd9Sstevel@tonic-gate "nfs4_mountroot: mount_root failed: %m"); 26837c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 26847c478bd9Sstevel@tonic-gate sv4_free(svp); 26857c478bd9Sstevel@tonic-gate pn_free(&pn); 26867c478bd9Sstevel@tonic-gate return (error); 26877c478bd9Sstevel@tonic-gate } 26887c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 26897c478bd9Sstevel@tonic-gate svp->sv_hostnamelen = (int)(strlen(root_hostname) + 1); 26907c478bd9Sstevel@tonic-gate svp->sv_hostname = kmem_alloc(svp->sv_hostnamelen, KM_SLEEP); 26917c478bd9Sstevel@tonic-gate (void) strcpy(svp->sv_hostname, root_hostname); 26927c478bd9Sstevel@tonic-gate 26937c478bd9Sstevel@tonic-gate svp->sv_pathlen = (int)(strlen(root_path) + 1); 26947c478bd9Sstevel@tonic-gate svp->sv_path = kmem_alloc(svp->sv_pathlen, KM_SLEEP); 26957c478bd9Sstevel@tonic-gate (void) strcpy(svp->sv_path, root_path); 26967c478bd9Sstevel@tonic-gate 26977c478bd9Sstevel@tonic-gate /* 26987c478bd9Sstevel@tonic-gate * Force root partition to always be mounted with AUTH_UNIX for now 26997c478bd9Sstevel@tonic-gate */ 27007c478bd9Sstevel@tonic-gate svp->sv_secdata = kmem_alloc(sizeof (*svp->sv_secdata), KM_SLEEP); 27017c478bd9Sstevel@tonic-gate svp->sv_secdata->secmod = AUTH_UNIX; 27027c478bd9Sstevel@tonic-gate svp->sv_secdata->rpcflavor = AUTH_UNIX; 27037c478bd9Sstevel@tonic-gate svp->sv_secdata->data = NULL; 27047c478bd9Sstevel@tonic-gate 27057c478bd9Sstevel@tonic-gate cr = crgetcred(); 27067c478bd9Sstevel@tonic-gate rtvp = NULL; 27077c478bd9Sstevel@tonic-gate 27087c478bd9Sstevel@tonic-gate error = nfs4rootvp(&rtvp, 
vfsp, svp, args.flags, cr, global_zone); 27097c478bd9Sstevel@tonic-gate 27107c478bd9Sstevel@tonic-gate if (error) { 27117c478bd9Sstevel@tonic-gate crfree(cr); 27127c478bd9Sstevel@tonic-gate pn_free(&pn); 2713ab7762b6Smaheshvs sv4_free(svp); 2714ab7762b6Smaheshvs return (error); 27157c478bd9Sstevel@tonic-gate } 27167c478bd9Sstevel@tonic-gate 27177c478bd9Sstevel@tonic-gate mi = VTOMI4(rtvp); 27187c478bd9Sstevel@tonic-gate 27197c478bd9Sstevel@tonic-gate /* 27207c478bd9Sstevel@tonic-gate * Send client id to the server, if necessary 27217c478bd9Sstevel@tonic-gate */ 27227c478bd9Sstevel@tonic-gate nfs4_error_zinit(&n4e); 27237c478bd9Sstevel@tonic-gate nfs4setclientid(mi, cr, FALSE, &n4e); 27247c478bd9Sstevel@tonic-gate error = n4e.error; 27257c478bd9Sstevel@tonic-gate 27267c478bd9Sstevel@tonic-gate crfree(cr); 27277c478bd9Sstevel@tonic-gate 27287c478bd9Sstevel@tonic-gate if (error) { 27297c478bd9Sstevel@tonic-gate pn_free(&pn); 27307c478bd9Sstevel@tonic-gate goto errout; 27317c478bd9Sstevel@tonic-gate } 27327c478bd9Sstevel@tonic-gate 27337c478bd9Sstevel@tonic-gate error = nfs4_setopts(rtvp, DATAMODEL_NATIVE, &args); 27347c478bd9Sstevel@tonic-gate if (error) { 27357c478bd9Sstevel@tonic-gate nfs_cmn_err(error, CE_WARN, 27367c478bd9Sstevel@tonic-gate "nfs4_mountroot: invalid root mount options"); 27377c478bd9Sstevel@tonic-gate pn_free(&pn); 27387c478bd9Sstevel@tonic-gate goto errout; 27397c478bd9Sstevel@tonic-gate } 27407c478bd9Sstevel@tonic-gate 27417c478bd9Sstevel@tonic-gate (void) vfs_lock_wait(vfsp); 27427c478bd9Sstevel@tonic-gate vfs_add(NULL, vfsp, vfsflags); 27437c478bd9Sstevel@tonic-gate vfs_unlock(vfsp); 27447c478bd9Sstevel@tonic-gate 27457c478bd9Sstevel@tonic-gate size = strlen(svp->sv_hostname); 27467c478bd9Sstevel@tonic-gate (void) strcpy(rootfs.bo_name, svp->sv_hostname); 27477c478bd9Sstevel@tonic-gate rootfs.bo_name[size] = ':'; 27487c478bd9Sstevel@tonic-gate (void) strcpy(&rootfs.bo_name[size + 1], root_path); 27497c478bd9Sstevel@tonic-gate 
27507c478bd9Sstevel@tonic-gate pn_free(&pn); 27517c478bd9Sstevel@tonic-gate 27527c478bd9Sstevel@tonic-gate errout: 27537c478bd9Sstevel@tonic-gate if (error) { 27547c478bd9Sstevel@tonic-gate sv4_free(svp); 27557c478bd9Sstevel@tonic-gate nfs4_async_stop(vfsp); 27567c478bd9Sstevel@tonic-gate nfs4_async_manager_stop(vfsp); 27577c478bd9Sstevel@tonic-gate } 27587c478bd9Sstevel@tonic-gate 27597c478bd9Sstevel@tonic-gate if (rtvp != NULL) 27607c478bd9Sstevel@tonic-gate VN_RELE(rtvp); 27617c478bd9Sstevel@tonic-gate 27627c478bd9Sstevel@tonic-gate return (error); 27637c478bd9Sstevel@tonic-gate } 27647c478bd9Sstevel@tonic-gate 27657c478bd9Sstevel@tonic-gate /* 27667c478bd9Sstevel@tonic-gate * Initialization routine for VFS routines. Should only be called once 27677c478bd9Sstevel@tonic-gate */ 27687c478bd9Sstevel@tonic-gate int 27697c478bd9Sstevel@tonic-gate nfs4_vfsinit(void) 27707c478bd9Sstevel@tonic-gate { 27717c478bd9Sstevel@tonic-gate mutex_init(&nfs4_syncbusy, NULL, MUTEX_DEFAULT, NULL); 27727c478bd9Sstevel@tonic-gate nfs4setclientid_init(); 2773b9238976Sth nfs4_ephemeral_init(); 27747c478bd9Sstevel@tonic-gate return (0); 27757c478bd9Sstevel@tonic-gate } 27767c478bd9Sstevel@tonic-gate 27777c478bd9Sstevel@tonic-gate void 27787c478bd9Sstevel@tonic-gate nfs4_vfsfini(void) 27797c478bd9Sstevel@tonic-gate { 2780b9238976Sth nfs4_ephemeral_fini(); 27817c478bd9Sstevel@tonic-gate nfs4setclientid_fini(); 27827c478bd9Sstevel@tonic-gate mutex_destroy(&nfs4_syncbusy); 27837c478bd9Sstevel@tonic-gate } 27847c478bd9Sstevel@tonic-gate 27857c478bd9Sstevel@tonic-gate void 27867c478bd9Sstevel@tonic-gate nfs4_freevfs(vfs_t *vfsp) 27877c478bd9Sstevel@tonic-gate { 27887c478bd9Sstevel@tonic-gate mntinfo4_t *mi; 27897c478bd9Sstevel@tonic-gate 279050a83466Sjwahlig /* need to release the initial hold */ 27917c478bd9Sstevel@tonic-gate mi = VFTOMI4(vfsp); 279250a83466Sjwahlig MI4_RELE(mi); 27937c478bd9Sstevel@tonic-gate } 27947c478bd9Sstevel@tonic-gate 27957c478bd9Sstevel@tonic-gate /* 
27967c478bd9Sstevel@tonic-gate * Client side SETCLIENTID and SETCLIENTID_CONFIRM 27977c478bd9Sstevel@tonic-gate */ 27987c478bd9Sstevel@tonic-gate struct nfs4_server nfs4_server_lst = 27997c478bd9Sstevel@tonic-gate { &nfs4_server_lst, &nfs4_server_lst }; 28007c478bd9Sstevel@tonic-gate 28017c478bd9Sstevel@tonic-gate kmutex_t nfs4_server_lst_lock; 28027c478bd9Sstevel@tonic-gate 28037c478bd9Sstevel@tonic-gate static void 28047c478bd9Sstevel@tonic-gate nfs4setclientid_init(void) 28057c478bd9Sstevel@tonic-gate { 28067c478bd9Sstevel@tonic-gate mutex_init(&nfs4_server_lst_lock, NULL, MUTEX_DEFAULT, NULL); 28077c478bd9Sstevel@tonic-gate } 28087c478bd9Sstevel@tonic-gate 28097c478bd9Sstevel@tonic-gate static void 28107c478bd9Sstevel@tonic-gate nfs4setclientid_fini(void) 28117c478bd9Sstevel@tonic-gate { 28127c478bd9Sstevel@tonic-gate mutex_destroy(&nfs4_server_lst_lock); 28137c478bd9Sstevel@tonic-gate } 28147c478bd9Sstevel@tonic-gate 28157c478bd9Sstevel@tonic-gate int nfs4_retry_sclid_delay = NFS4_RETRY_SCLID_DELAY; 28167c478bd9Sstevel@tonic-gate int nfs4_num_sclid_retries = NFS4_NUM_SCLID_RETRIES; 28177c478bd9Sstevel@tonic-gate 28187c478bd9Sstevel@tonic-gate /* 28197c478bd9Sstevel@tonic-gate * Set the clientid for the server for "mi". No-op if the clientid is 28207c478bd9Sstevel@tonic-gate * already set. 28217c478bd9Sstevel@tonic-gate * 28227c478bd9Sstevel@tonic-gate * The recovery boolean should be set to TRUE if this function was called 2823a092743bSek * by the recovery code, and FALSE otherwise. This is used to determine 2824a092743bSek * if we need to call nfs4_start/end_op as well as grab the mi_recovlock 2825a092743bSek * for adding a mntinfo4_t to a nfs4_server_t. 28267c478bd9Sstevel@tonic-gate * 28277c478bd9Sstevel@tonic-gate * Error is returned via 'n4ep'. If there was a 'n4ep->stat' error, then 28287c478bd9Sstevel@tonic-gate * 'n4ep->error' is set to geterrno4(n4ep->stat). 
28297c478bd9Sstevel@tonic-gate */ 28307c478bd9Sstevel@tonic-gate void 28317c478bd9Sstevel@tonic-gate nfs4setclientid(mntinfo4_t *mi, cred_t *cr, bool_t recovery, nfs4_error_t *n4ep) 28327c478bd9Sstevel@tonic-gate { 28337c478bd9Sstevel@tonic-gate struct nfs4_server *np; 28347c478bd9Sstevel@tonic-gate struct servinfo4 *svp = mi->mi_curr_serv; 28357c478bd9Sstevel@tonic-gate nfs4_recov_state_t recov_state; 28367c478bd9Sstevel@tonic-gate int num_retries = 0; 2837f64c4ae1Sdm bool_t retry; 28387c478bd9Sstevel@tonic-gate cred_t *lcr = NULL; 28397c478bd9Sstevel@tonic-gate int retry_inuse = 1; /* only retry once on NFS4ERR_CLID_INUSE */ 28407c478bd9Sstevel@tonic-gate time_t lease_time = 0; 28417c478bd9Sstevel@tonic-gate 28427c478bd9Sstevel@tonic-gate recov_state.rs_flags = 0; 28437c478bd9Sstevel@tonic-gate recov_state.rs_num_retry_despite_err = 0; 28447c478bd9Sstevel@tonic-gate ASSERT(n4ep != NULL); 28457c478bd9Sstevel@tonic-gate 28467c478bd9Sstevel@tonic-gate recov_retry: 2847f64c4ae1Sdm retry = FALSE; 28487c478bd9Sstevel@tonic-gate nfs4_error_zinit(n4ep); 2849a092743bSek if (!recovery) 2850a092743bSek (void) nfs_rw_enter_sig(&mi->mi_recovlock, RW_READER, 0); 2851a092743bSek 2852f86c6ccaSdm mutex_enter(&nfs4_server_lst_lock); 2853f86c6ccaSdm np = servinfo4_to_nfs4_server(svp); /* This locks np if it is found */ 2854f86c6ccaSdm mutex_exit(&nfs4_server_lst_lock); 2855f86c6ccaSdm if (!np) { 2856f86c6ccaSdm struct nfs4_server *tnp; 2857f86c6ccaSdm np = new_nfs4_server(svp, cr); 285816237317Sdm mutex_enter(&np->s_lock); 28597c478bd9Sstevel@tonic-gate 2860f86c6ccaSdm mutex_enter(&nfs4_server_lst_lock); 2861f86c6ccaSdm tnp = servinfo4_to_nfs4_server(svp); 2862f86c6ccaSdm if (tnp) { 2863f86c6ccaSdm /* 2864f86c6ccaSdm * another thread snuck in and put server on list. 2865f86c6ccaSdm * since we aren't adding it to the nfs4_server_list 2866f86c6ccaSdm * we need to set the ref count to 0 and destroy it. 
2867f86c6ccaSdm */ 2868f86c6ccaSdm np->s_refcnt = 0; 2869f86c6ccaSdm destroy_nfs4_server(np); 2870f86c6ccaSdm np = tnp; 2871f86c6ccaSdm } else { 2872f86c6ccaSdm /* 2873f86c6ccaSdm * do not give list a reference until everything 2874f86c6ccaSdm * succeeds 2875f86c6ccaSdm */ 2876f86c6ccaSdm insque(np, &nfs4_server_lst); 2877f86c6ccaSdm } 2878f86c6ccaSdm mutex_exit(&nfs4_server_lst_lock); 2879f86c6ccaSdm } 2880f86c6ccaSdm ASSERT(MUTEX_HELD(&np->s_lock)); 28817c478bd9Sstevel@tonic-gate /* 2882f86c6ccaSdm * If we find the server already has N4S_CLIENTID_SET, then 2883f86c6ccaSdm * just return, we've already done SETCLIENTID to that server 28847c478bd9Sstevel@tonic-gate */ 2885f86c6ccaSdm if (np->s_flags & N4S_CLIENTID_SET) { 28867c478bd9Sstevel@tonic-gate /* add mi to np's mntinfo4_list */ 28877c478bd9Sstevel@tonic-gate nfs4_add_mi_to_server(np, mi); 2888a092743bSek if (!recovery) 2889a092743bSek nfs_rw_exit(&mi->mi_recovlock); 28907c478bd9Sstevel@tonic-gate mutex_exit(&np->s_lock); 28917c478bd9Sstevel@tonic-gate nfs4_server_rele(np); 28927c478bd9Sstevel@tonic-gate return; 28937c478bd9Sstevel@tonic-gate } 2894f86c6ccaSdm mutex_exit(&np->s_lock); 2895f86c6ccaSdm 28967c478bd9Sstevel@tonic-gate 2897a092743bSek /* 2898a092743bSek * Drop the mi_recovlock since nfs4_start_op will 2899a092743bSek * acquire it again for us. 
2900a092743bSek */ 2901f86c6ccaSdm if (!recovery) { 2902a092743bSek nfs_rw_exit(&mi->mi_recovlock); 2903a092743bSek 29047c478bd9Sstevel@tonic-gate n4ep->error = nfs4_start_op(mi, NULL, NULL, &recov_state); 29057c478bd9Sstevel@tonic-gate if (n4ep->error) { 29067c478bd9Sstevel@tonic-gate nfs4_server_rele(np); 29077c478bd9Sstevel@tonic-gate return; 29087c478bd9Sstevel@tonic-gate } 29097c478bd9Sstevel@tonic-gate } 29107c478bd9Sstevel@tonic-gate 29117c478bd9Sstevel@tonic-gate mutex_enter(&np->s_lock); 2912f86c6ccaSdm while (np->s_flags & N4S_CLIENTID_PEND) { 2913f86c6ccaSdm if (!cv_wait_sig(&np->s_clientid_pend, &np->s_lock)) { 2914f86c6ccaSdm mutex_exit(&np->s_lock); 2915f86c6ccaSdm nfs4_server_rele(np); 2916f86c6ccaSdm if (!recovery) 2917f86c6ccaSdm nfs4_end_op(mi, NULL, NULL, &recov_state, 2918f86c6ccaSdm recovery); 2919f86c6ccaSdm n4ep->error = EINTR; 2920f86c6ccaSdm return; 2921f86c6ccaSdm } 2922f86c6ccaSdm } 29237c478bd9Sstevel@tonic-gate 29247c478bd9Sstevel@tonic-gate if (np->s_flags & N4S_CLIENTID_SET) { 29257c478bd9Sstevel@tonic-gate /* XXX copied/pasted from above */ 29267c478bd9Sstevel@tonic-gate /* add mi to np's mntinfo4_list */ 29277c478bd9Sstevel@tonic-gate nfs4_add_mi_to_server(np, mi); 29287c478bd9Sstevel@tonic-gate mutex_exit(&np->s_lock); 29297c478bd9Sstevel@tonic-gate nfs4_server_rele(np); 29307c478bd9Sstevel@tonic-gate if (!recovery) 29317c478bd9Sstevel@tonic-gate nfs4_end_op(mi, NULL, NULL, &recov_state, recovery); 29327c478bd9Sstevel@tonic-gate return; 29337c478bd9Sstevel@tonic-gate } 29347c478bd9Sstevel@tonic-gate 2935f86c6ccaSdm /* 2936f86c6ccaSdm * Reset the N4S_CB_PINGED flag. This is used to 2937f86c6ccaSdm * indicate if we have received a CB_NULL from the 2938f86c6ccaSdm * server. Also we reset the waiter flag. 
2939f86c6ccaSdm */ 2940f86c6ccaSdm np->s_flags &= ~(N4S_CB_PINGED | N4S_CB_WAITER); 2941f86c6ccaSdm /* any failure must now clear this flag */ 2942f86c6ccaSdm np->s_flags |= N4S_CLIENTID_PEND; 2943f86c6ccaSdm mutex_exit(&np->s_lock); 29447c478bd9Sstevel@tonic-gate nfs4setclientid_otw(mi, svp, cr, np, n4ep, &retry_inuse); 29457c478bd9Sstevel@tonic-gate 29467c478bd9Sstevel@tonic-gate if (n4ep->error == EACCES) { 29477c478bd9Sstevel@tonic-gate /* 29487c478bd9Sstevel@tonic-gate * If the uid is set then set the creds for secure mounts 29497c478bd9Sstevel@tonic-gate * by proxy processes such as automountd. 29507c478bd9Sstevel@tonic-gate */ 29517c478bd9Sstevel@tonic-gate (void) nfs_rw_enter_sig(&svp->sv_lock, RW_READER, 0); 29527c478bd9Sstevel@tonic-gate if (svp->sv_secdata->uid != 0) { 29537c478bd9Sstevel@tonic-gate lcr = crdup(cr); 29547c478bd9Sstevel@tonic-gate (void) crsetugid(lcr, svp->sv_secdata->uid, 29557c478bd9Sstevel@tonic-gate crgetgid(cr)); 29567c478bd9Sstevel@tonic-gate } 29577c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 29587c478bd9Sstevel@tonic-gate 2959f86c6ccaSdm if (lcr != NULL) { 2960f86c6ccaSdm mutex_enter(&np->s_lock); 2961f86c6ccaSdm crfree(np->s_cred); 2962f86c6ccaSdm np->s_cred = lcr; 2963f86c6ccaSdm mutex_exit(&np->s_lock); 29647c478bd9Sstevel@tonic-gate nfs4setclientid_otw(mi, svp, lcr, np, n4ep, 2965b9238976Sth &retry_inuse); 2966f86c6ccaSdm } 29677c478bd9Sstevel@tonic-gate } 2968f86c6ccaSdm mutex_enter(&np->s_lock); 29697c478bd9Sstevel@tonic-gate lease_time = np->s_lease_time; 2970f86c6ccaSdm np->s_flags &= ~N4S_CLIENTID_PEND; 29717c478bd9Sstevel@tonic-gate mutex_exit(&np->s_lock); 29727c478bd9Sstevel@tonic-gate 29737c478bd9Sstevel@tonic-gate if (n4ep->error != 0 || n4ep->stat != NFS4_OK) { 29747c478bd9Sstevel@tonic-gate /* 29757c478bd9Sstevel@tonic-gate * Start recovery if failover is a possibility. 
If 29767c478bd9Sstevel@tonic-gate * invoked by the recovery thread itself, then just 29777c478bd9Sstevel@tonic-gate * return and let it handle the failover first. NB: 29787c478bd9Sstevel@tonic-gate * recovery is not allowed if the mount is in progress 29797c478bd9Sstevel@tonic-gate * since the infrastructure is not sufficiently setup 29807c478bd9Sstevel@tonic-gate * to allow it. Just return the error (after suitable 29817c478bd9Sstevel@tonic-gate * retries). 29827c478bd9Sstevel@tonic-gate */ 29837c478bd9Sstevel@tonic-gate if (FAILOVER_MOUNT4(mi) && nfs4_try_failover(n4ep)) { 29847c478bd9Sstevel@tonic-gate (void) nfs4_start_recovery(n4ep, mi, NULL, 2985b9238976Sth NULL, NULL, NULL, OP_SETCLIENTID, NULL); 29867c478bd9Sstevel@tonic-gate /* 29877c478bd9Sstevel@tonic-gate * Don't retry here, just return and let 29887c478bd9Sstevel@tonic-gate * recovery take over. 29897c478bd9Sstevel@tonic-gate */ 29907c478bd9Sstevel@tonic-gate if (recovery) 29917c478bd9Sstevel@tonic-gate retry = FALSE; 29927c478bd9Sstevel@tonic-gate } else if (nfs4_rpc_retry_error(n4ep->error) || 2993b9238976Sth n4ep->stat == NFS4ERR_RESOURCE || 2994b9238976Sth n4ep->stat == NFS4ERR_STALE_CLIENTID) { 29957c478bd9Sstevel@tonic-gate 2996b9238976Sth retry = TRUE; 2997b9238976Sth /* 2998b9238976Sth * Always retry if in recovery or once had 2999b9238976Sth * contact with the server (but now it's 3000b9238976Sth * overloaded). 
3001b9238976Sth */ 3002b9238976Sth if (recovery == TRUE || 3003b9238976Sth n4ep->error == ETIMEDOUT || 3004b9238976Sth n4ep->error == ECONNRESET) 30057c478bd9Sstevel@tonic-gate num_retries = 0; 3006b9238976Sth } else if (retry_inuse && n4ep->error == 0 && 3007b9238976Sth n4ep->stat == NFS4ERR_CLID_INUSE) { 3008b9238976Sth retry = TRUE; 3009b9238976Sth num_retries = 0; 30107c478bd9Sstevel@tonic-gate } 3011f86c6ccaSdm } else { 3012f64c4ae1Sdm /* 3013f64c4ae1Sdm * Since everything succeeded give the list a reference count if 3014f64c4ae1Sdm * it hasn't been given one by add_new_nfs4_server() or if this 3015f64c4ae1Sdm * is not a recovery situation in which case it is already on 3016f64c4ae1Sdm * the list. 3017f64c4ae1Sdm */ 3018f86c6ccaSdm mutex_enter(&np->s_lock); 3019f64c4ae1Sdm if ((np->s_flags & N4S_INSERTED) == 0) { 3020f64c4ae1Sdm np->s_refcnt++; 3021f64c4ae1Sdm np->s_flags |= N4S_INSERTED; 3022f64c4ae1Sdm } 3023f86c6ccaSdm mutex_exit(&np->s_lock); 30247c478bd9Sstevel@tonic-gate } 30257c478bd9Sstevel@tonic-gate 30267c478bd9Sstevel@tonic-gate if (!recovery) 30277c478bd9Sstevel@tonic-gate nfs4_end_op(mi, NULL, NULL, &recov_state, recovery); 3028f86c6ccaSdm 30297c478bd9Sstevel@tonic-gate 30307c478bd9Sstevel@tonic-gate if (retry && num_retries++ < nfs4_num_sclid_retries) { 30317c478bd9Sstevel@tonic-gate if (retry_inuse) { 30327c478bd9Sstevel@tonic-gate delay(SEC_TO_TICK(lease_time + nfs4_retry_sclid_delay)); 30337c478bd9Sstevel@tonic-gate retry_inuse = 0; 30347c478bd9Sstevel@tonic-gate } else 30357c478bd9Sstevel@tonic-gate delay(SEC_TO_TICK(nfs4_retry_sclid_delay)); 3036f86c6ccaSdm 3037f86c6ccaSdm nfs4_server_rele(np); 30387c478bd9Sstevel@tonic-gate goto recov_retry; 30397c478bd9Sstevel@tonic-gate } 30407c478bd9Sstevel@tonic-gate 3041f86c6ccaSdm 30427c478bd9Sstevel@tonic-gate if (n4ep->error == 0) 30437c478bd9Sstevel@tonic-gate n4ep->error = geterrno4(n4ep->stat); 3044f86c6ccaSdm 3045f86c6ccaSdm /* broadcast before release in case no other threads are waiting */ 
3046f86c6ccaSdm cv_broadcast(&np->s_clientid_pend); 3047f86c6ccaSdm nfs4_server_rele(np); 30487c478bd9Sstevel@tonic-gate } 30497c478bd9Sstevel@tonic-gate 30507c478bd9Sstevel@tonic-gate int nfs4setclientid_otw_debug = 0; 30517c478bd9Sstevel@tonic-gate 30527c478bd9Sstevel@tonic-gate /* 30537c478bd9Sstevel@tonic-gate * This function handles the recovery of STALE_CLIENTID for SETCLIENTID_CONFRIM, 30547c478bd9Sstevel@tonic-gate * but nothing else; the calling function must be designed to handle those 30557c478bd9Sstevel@tonic-gate * other errors. 30567c478bd9Sstevel@tonic-gate */ 30577c478bd9Sstevel@tonic-gate static void 30587c478bd9Sstevel@tonic-gate nfs4setclientid_otw(mntinfo4_t *mi, struct servinfo4 *svp, cred_t *cr, 3059b9238976Sth struct nfs4_server *np, nfs4_error_t *ep, int *retry_inusep) 30607c478bd9Sstevel@tonic-gate { 30617c478bd9Sstevel@tonic-gate COMPOUND4args_clnt args; 30627c478bd9Sstevel@tonic-gate COMPOUND4res_clnt res; 30637c478bd9Sstevel@tonic-gate nfs_argop4 argop[3]; 30647c478bd9Sstevel@tonic-gate SETCLIENTID4args *s_args; 30657c478bd9Sstevel@tonic-gate SETCLIENTID4resok *s_resok; 30667c478bd9Sstevel@tonic-gate int doqueue = 1; 30677c478bd9Sstevel@tonic-gate nfs4_ga_res_t *garp = NULL; 30687c478bd9Sstevel@tonic-gate timespec_t prop_time, after_time; 30697c478bd9Sstevel@tonic-gate verifier4 verf; 30707c478bd9Sstevel@tonic-gate clientid4 tmp_clientid; 30717c478bd9Sstevel@tonic-gate 3072f86c6ccaSdm ASSERT(!MUTEX_HELD(&np->s_lock)); 30737c478bd9Sstevel@tonic-gate 30747c478bd9Sstevel@tonic-gate args.ctag = TAG_SETCLIENTID; 30757c478bd9Sstevel@tonic-gate 30767c478bd9Sstevel@tonic-gate args.array = argop; 30777c478bd9Sstevel@tonic-gate args.array_len = 3; 30787c478bd9Sstevel@tonic-gate 30797c478bd9Sstevel@tonic-gate /* PUTROOTFH */ 30807c478bd9Sstevel@tonic-gate argop[0].argop = OP_PUTROOTFH; 30817c478bd9Sstevel@tonic-gate 30827c478bd9Sstevel@tonic-gate /* GETATTR */ 30837c478bd9Sstevel@tonic-gate argop[1].argop = OP_GETATTR; 
30847c478bd9Sstevel@tonic-gate argop[1].nfs_argop4_u.opgetattr.attr_request = FATTR4_LEASE_TIME_MASK; 30857c478bd9Sstevel@tonic-gate argop[1].nfs_argop4_u.opgetattr.mi = mi; 30867c478bd9Sstevel@tonic-gate 30877c478bd9Sstevel@tonic-gate /* SETCLIENTID */ 30887c478bd9Sstevel@tonic-gate argop[2].argop = OP_SETCLIENTID; 30897c478bd9Sstevel@tonic-gate 30907c478bd9Sstevel@tonic-gate s_args = &argop[2].nfs_argop4_u.opsetclientid; 30917c478bd9Sstevel@tonic-gate 3092f86c6ccaSdm mutex_enter(&np->s_lock); 3093f86c6ccaSdm 30947c478bd9Sstevel@tonic-gate s_args->client.verifier = np->clidtosend.verifier; 30957c478bd9Sstevel@tonic-gate s_args->client.id_len = np->clidtosend.id_len; 30967c478bd9Sstevel@tonic-gate ASSERT(s_args->client.id_len <= NFS4_OPAQUE_LIMIT); 30977c478bd9Sstevel@tonic-gate s_args->client.id_val = np->clidtosend.id_val; 30987c478bd9Sstevel@tonic-gate 30997c478bd9Sstevel@tonic-gate /* 31007c478bd9Sstevel@tonic-gate * Callback needs to happen on non-RDMA transport 31017c478bd9Sstevel@tonic-gate * Check if we have saved the original knetconfig 31027c478bd9Sstevel@tonic-gate * if so, use that instead. 
31037c478bd9Sstevel@tonic-gate */ 31047c478bd9Sstevel@tonic-gate if (svp->sv_origknconf != NULL) 31057c478bd9Sstevel@tonic-gate nfs4_cb_args(np, svp->sv_origknconf, s_args); 31067c478bd9Sstevel@tonic-gate else 31077c478bd9Sstevel@tonic-gate nfs4_cb_args(np, svp->sv_knconf, s_args); 31087c478bd9Sstevel@tonic-gate 3109f86c6ccaSdm mutex_exit(&np->s_lock); 3110f86c6ccaSdm 3111f86c6ccaSdm rfs4call(mi, &args, &res, cr, &doqueue, 0, ep); 31127c478bd9Sstevel@tonic-gate 31137c478bd9Sstevel@tonic-gate if (ep->error) 31147c478bd9Sstevel@tonic-gate return; 31157c478bd9Sstevel@tonic-gate 31167c478bd9Sstevel@tonic-gate /* getattr lease_time res */ 3117e557fb2cSDai Ngo if ((res.array_len >= 2) && 3118e557fb2cSDai Ngo (res.array[1].nfs_resop4_u.opgetattr.status == NFS4_OK)) { 31197c478bd9Sstevel@tonic-gate garp = &res.array[1].nfs_resop4_u.opgetattr.ga_res; 31207c478bd9Sstevel@tonic-gate 31217c478bd9Sstevel@tonic-gate #ifndef _LP64 31227c478bd9Sstevel@tonic-gate /* 31237c478bd9Sstevel@tonic-gate * The 32 bit client cannot handle a lease time greater than 31247c478bd9Sstevel@tonic-gate * (INT32_MAX/1000000). This is due to the use of the 31257c478bd9Sstevel@tonic-gate * lease_time in calls to drv_usectohz() in 31267c478bd9Sstevel@tonic-gate * nfs4_renew_lease_thread(). The problem is that 31277c478bd9Sstevel@tonic-gate * drv_usectohz() takes a time_t (which is just a long = 4 31287c478bd9Sstevel@tonic-gate * bytes) as its parameter. The lease_time is multiplied by 31297c478bd9Sstevel@tonic-gate * 1000000 to convert seconds to usecs for the parameter. If 31307c478bd9Sstevel@tonic-gate * a number bigger than (INT32_MAX/1000000) is used then we 31317c478bd9Sstevel@tonic-gate * overflow on the 32bit client. 
31327c478bd9Sstevel@tonic-gate */ 31337c478bd9Sstevel@tonic-gate if (garp->n4g_ext_res->n4g_leasetime > (INT32_MAX/1000000)) { 31347c478bd9Sstevel@tonic-gate garp->n4g_ext_res->n4g_leasetime = INT32_MAX/1000000; 31357c478bd9Sstevel@tonic-gate } 31367c478bd9Sstevel@tonic-gate #endif 31377c478bd9Sstevel@tonic-gate 3138f86c6ccaSdm mutex_enter(&np->s_lock); 31397c478bd9Sstevel@tonic-gate np->s_lease_time = garp->n4g_ext_res->n4g_leasetime; 31407c478bd9Sstevel@tonic-gate 31417c478bd9Sstevel@tonic-gate /* 31427c478bd9Sstevel@tonic-gate * Keep track of the lease period for the mi's 31437c478bd9Sstevel@tonic-gate * mi_msg_list. We need an appropiate time 31447c478bd9Sstevel@tonic-gate * bound to associate past facts with a current 31457c478bd9Sstevel@tonic-gate * event. The lease period is perfect for this. 31467c478bd9Sstevel@tonic-gate */ 31477c478bd9Sstevel@tonic-gate mutex_enter(&mi->mi_msg_list_lock); 31487c478bd9Sstevel@tonic-gate mi->mi_lease_period = np->s_lease_time; 31497c478bd9Sstevel@tonic-gate mutex_exit(&mi->mi_msg_list_lock); 3150f86c6ccaSdm mutex_exit(&np->s_lock); 31517c478bd9Sstevel@tonic-gate } 31527c478bd9Sstevel@tonic-gate 31537c478bd9Sstevel@tonic-gate 31547c478bd9Sstevel@tonic-gate if (res.status == NFS4ERR_CLID_INUSE) { 31557c478bd9Sstevel@tonic-gate clientaddr4 *clid_inuse; 31567c478bd9Sstevel@tonic-gate 31577c478bd9Sstevel@tonic-gate if (!(*retry_inusep)) { 31587c478bd9Sstevel@tonic-gate clid_inuse = &res.array->nfs_resop4_u. 3159b9238976Sth opsetclientid.SETCLIENTID4res_u.client_using; 31607c478bd9Sstevel@tonic-gate 31617c478bd9Sstevel@tonic-gate zcmn_err(mi->mi_zone->zone_id, CE_NOTE, 31627c478bd9Sstevel@tonic-gate "NFS4 mount (SETCLIENTID failed)." 
31637c478bd9Sstevel@tonic-gate " nfs4_client_id.id is in" 31647c478bd9Sstevel@tonic-gate "use already by: r_netid<%s> r_addr<%s>", 31657c478bd9Sstevel@tonic-gate clid_inuse->r_netid, clid_inuse->r_addr); 31667c478bd9Sstevel@tonic-gate } 31677c478bd9Sstevel@tonic-gate 31687c478bd9Sstevel@tonic-gate /* 31697c478bd9Sstevel@tonic-gate * XXX - The client should be more robust in its 31707c478bd9Sstevel@tonic-gate * handling of clientid in use errors (regen another 31717c478bd9Sstevel@tonic-gate * clientid and try again?) 31727c478bd9Sstevel@tonic-gate */ 31737c478bd9Sstevel@tonic-gate (void) xdr_free(xdr_COMPOUND4res_clnt, (caddr_t)&res); 31747c478bd9Sstevel@tonic-gate return; 31757c478bd9Sstevel@tonic-gate } 31767c478bd9Sstevel@tonic-gate 31777c478bd9Sstevel@tonic-gate if (res.status) { 31787c478bd9Sstevel@tonic-gate (void) xdr_free(xdr_COMPOUND4res_clnt, (caddr_t)&res); 31797c478bd9Sstevel@tonic-gate return; 31807c478bd9Sstevel@tonic-gate } 31817c478bd9Sstevel@tonic-gate 31827c478bd9Sstevel@tonic-gate s_resok = &res.array[2].nfs_resop4_u. 
3183b9238976Sth opsetclientid.SETCLIENTID4res_u.resok4; 31847c478bd9Sstevel@tonic-gate 31857c478bd9Sstevel@tonic-gate tmp_clientid = s_resok->clientid; 31867c478bd9Sstevel@tonic-gate 31877c478bd9Sstevel@tonic-gate verf = s_resok->setclientid_confirm; 31887c478bd9Sstevel@tonic-gate 31897c478bd9Sstevel@tonic-gate #ifdef DEBUG 31907c478bd9Sstevel@tonic-gate if (nfs4setclientid_otw_debug) { 31917c478bd9Sstevel@tonic-gate union { 31927c478bd9Sstevel@tonic-gate clientid4 clientid; 31937c478bd9Sstevel@tonic-gate int foo[2]; 31947c478bd9Sstevel@tonic-gate } cid; 31957c478bd9Sstevel@tonic-gate 31967c478bd9Sstevel@tonic-gate cid.clientid = s_resok->clientid; 31977c478bd9Sstevel@tonic-gate 31987c478bd9Sstevel@tonic-gate zcmn_err(mi->mi_zone->zone_id, CE_NOTE, 31997c478bd9Sstevel@tonic-gate "nfs4setclientid_otw: OK, clientid = %x,%x, " 32007c478bd9Sstevel@tonic-gate "verifier = %" PRIx64 "\n", cid.foo[0], cid.foo[1], verf); 32017c478bd9Sstevel@tonic-gate } 32027c478bd9Sstevel@tonic-gate #endif 32037c478bd9Sstevel@tonic-gate 32047c478bd9Sstevel@tonic-gate (void) xdr_free(xdr_COMPOUND4res_clnt, (caddr_t)&res); 32057c478bd9Sstevel@tonic-gate 32067c478bd9Sstevel@tonic-gate /* Confirm the client id and get the lease_time attribute */ 32077c478bd9Sstevel@tonic-gate 32087c478bd9Sstevel@tonic-gate args.ctag = TAG_SETCLIENTID_CF; 32097c478bd9Sstevel@tonic-gate 32107c478bd9Sstevel@tonic-gate args.array = argop; 32117c478bd9Sstevel@tonic-gate args.array_len = 1; 32127c478bd9Sstevel@tonic-gate 32137c478bd9Sstevel@tonic-gate argop[0].argop = OP_SETCLIENTID_CONFIRM; 32147c478bd9Sstevel@tonic-gate 32157c478bd9Sstevel@tonic-gate argop[0].nfs_argop4_u.opsetclientid_confirm.clientid = tmp_clientid; 32167c478bd9Sstevel@tonic-gate argop[0].nfs_argop4_u.opsetclientid_confirm.setclientid_confirm = verf; 32177c478bd9Sstevel@tonic-gate 32187c478bd9Sstevel@tonic-gate /* used to figure out RTT for np */ 32197c478bd9Sstevel@tonic-gate gethrestime(&prop_time); 32207c478bd9Sstevel@tonic-gate 
32217c478bd9Sstevel@tonic-gate NFS4_DEBUG(nfs4_client_lease_debug, (CE_NOTE, "nfs4setlientid_otw: " 3222b9238976Sth "start time: %ld sec %ld nsec", prop_time.tv_sec, 3223b9238976Sth prop_time.tv_nsec)); 32247c478bd9Sstevel@tonic-gate 32257c478bd9Sstevel@tonic-gate rfs4call(mi, &args, &res, cr, &doqueue, 0, ep); 32267c478bd9Sstevel@tonic-gate 32277c478bd9Sstevel@tonic-gate gethrestime(&after_time); 3228f86c6ccaSdm mutex_enter(&np->s_lock); 32297c478bd9Sstevel@tonic-gate np->propagation_delay.tv_sec = 3230b9238976Sth MAX(1, after_time.tv_sec - prop_time.tv_sec); 3231f86c6ccaSdm mutex_exit(&np->s_lock); 32327c478bd9Sstevel@tonic-gate 32337c478bd9Sstevel@tonic-gate NFS4_DEBUG(nfs4_client_lease_debug, (CE_NOTE, "nfs4setlcientid_otw: " 3234b9238976Sth "finish time: %ld sec ", after_time.tv_sec)); 32357c478bd9Sstevel@tonic-gate 32367c478bd9Sstevel@tonic-gate NFS4_DEBUG(nfs4_client_lease_debug, (CE_NOTE, "nfs4setclientid_otw: " 3237b9238976Sth "propagation delay set to %ld sec", 3238b9238976Sth np->propagation_delay.tv_sec)); 32397c478bd9Sstevel@tonic-gate 32407c478bd9Sstevel@tonic-gate if (ep->error) 32417c478bd9Sstevel@tonic-gate return; 32427c478bd9Sstevel@tonic-gate 32437c478bd9Sstevel@tonic-gate if (res.status == NFS4ERR_CLID_INUSE) { 32447c478bd9Sstevel@tonic-gate clientaddr4 *clid_inuse; 32457c478bd9Sstevel@tonic-gate 32467c478bd9Sstevel@tonic-gate if (!(*retry_inusep)) { 32477c478bd9Sstevel@tonic-gate clid_inuse = &res.array->nfs_resop4_u. 3248b9238976Sth opsetclientid.SETCLIENTID4res_u.client_using; 32497c478bd9Sstevel@tonic-gate 32507c478bd9Sstevel@tonic-gate zcmn_err(mi->mi_zone->zone_id, CE_NOTE, 32517c478bd9Sstevel@tonic-gate "SETCLIENTID_CONFIRM failed. 
" 32527c478bd9Sstevel@tonic-gate "nfs4_client_id.id is in use already by: " 32537c478bd9Sstevel@tonic-gate "r_netid<%s> r_addr<%s>", 32547c478bd9Sstevel@tonic-gate clid_inuse->r_netid, clid_inuse->r_addr); 32557c478bd9Sstevel@tonic-gate } 32567c478bd9Sstevel@tonic-gate 32577c478bd9Sstevel@tonic-gate (void) xdr_free(xdr_COMPOUND4res_clnt, (caddr_t)&res); 32587c478bd9Sstevel@tonic-gate return; 32597c478bd9Sstevel@tonic-gate } 32607c478bd9Sstevel@tonic-gate 32617c478bd9Sstevel@tonic-gate if (res.status) { 32627c478bd9Sstevel@tonic-gate (void) xdr_free(xdr_COMPOUND4res_clnt, (caddr_t)&res); 32637c478bd9Sstevel@tonic-gate return; 32647c478bd9Sstevel@tonic-gate } 32657c478bd9Sstevel@tonic-gate 3266f86c6ccaSdm mutex_enter(&np->s_lock); 32677c478bd9Sstevel@tonic-gate np->clientid = tmp_clientid; 32687c478bd9Sstevel@tonic-gate np->s_flags |= N4S_CLIENTID_SET; 32697c478bd9Sstevel@tonic-gate 32707c478bd9Sstevel@tonic-gate /* Add mi to np's mntinfo4 list */ 32717c478bd9Sstevel@tonic-gate nfs4_add_mi_to_server(np, mi); 32727c478bd9Sstevel@tonic-gate 32737c478bd9Sstevel@tonic-gate if (np->lease_valid == NFS4_LEASE_NOT_STARTED) { 32747c478bd9Sstevel@tonic-gate /* 32757c478bd9Sstevel@tonic-gate * Start lease management thread. 32767c478bd9Sstevel@tonic-gate * Keep trying until we succeed. 32777c478bd9Sstevel@tonic-gate */ 32787c478bd9Sstevel@tonic-gate 32797c478bd9Sstevel@tonic-gate np->s_refcnt++; /* pass reference to thread */ 32807c478bd9Sstevel@tonic-gate (void) zthread_create(NULL, 0, nfs4_renew_lease_thread, np, 0, 3281b9238976Sth minclsyspri); 32827c478bd9Sstevel@tonic-gate } 3283f86c6ccaSdm mutex_exit(&np->s_lock); 32847c478bd9Sstevel@tonic-gate 32857c478bd9Sstevel@tonic-gate (void) xdr_free(xdr_COMPOUND4res_clnt, (caddr_t)&res); 32867c478bd9Sstevel@tonic-gate } 32877c478bd9Sstevel@tonic-gate 32887c478bd9Sstevel@tonic-gate /* 32897c478bd9Sstevel@tonic-gate * Add mi to sp's mntinfo4_list if it isn't already in the list. 
Makes 32907c478bd9Sstevel@tonic-gate * mi's clientid the same as sp's. 32917c478bd9Sstevel@tonic-gate * Assumes sp is locked down. 32927c478bd9Sstevel@tonic-gate */ 32937c478bd9Sstevel@tonic-gate void 32947c478bd9Sstevel@tonic-gate nfs4_add_mi_to_server(nfs4_server_t *sp, mntinfo4_t *mi) 32957c478bd9Sstevel@tonic-gate { 32967c478bd9Sstevel@tonic-gate mntinfo4_t *tmi; 32977c478bd9Sstevel@tonic-gate int in_list = 0; 32987c478bd9Sstevel@tonic-gate 3299a092743bSek ASSERT(nfs_rw_lock_held(&mi->mi_recovlock, RW_READER) || 3300a092743bSek nfs_rw_lock_held(&mi->mi_recovlock, RW_WRITER)); 33017c478bd9Sstevel@tonic-gate ASSERT(sp != &nfs4_server_lst); 33027c478bd9Sstevel@tonic-gate ASSERT(MUTEX_HELD(&sp->s_lock)); 33037c478bd9Sstevel@tonic-gate 33047c478bd9Sstevel@tonic-gate NFS4_DEBUG(nfs4_client_lease_debug, (CE_NOTE, 3305b9238976Sth "nfs4_add_mi_to_server: add mi %p to sp %p", 3306b9238976Sth (void*)mi, (void*)sp)); 33077c478bd9Sstevel@tonic-gate 33087c478bd9Sstevel@tonic-gate for (tmi = sp->mntinfo4_list; 33097c478bd9Sstevel@tonic-gate tmi != NULL; 33107c478bd9Sstevel@tonic-gate tmi = tmi->mi_clientid_next) { 33117c478bd9Sstevel@tonic-gate if (tmi == mi) { 33127c478bd9Sstevel@tonic-gate NFS4_DEBUG(nfs4_client_lease_debug, 3313b9238976Sth (CE_NOTE, 3314b9238976Sth "nfs4_add_mi_to_server: mi in list")); 33157c478bd9Sstevel@tonic-gate in_list = 1; 33167c478bd9Sstevel@tonic-gate } 33177c478bd9Sstevel@tonic-gate } 33187c478bd9Sstevel@tonic-gate 33197c478bd9Sstevel@tonic-gate /* 33207c478bd9Sstevel@tonic-gate * First put a hold on the mntinfo4's vfsp so that references via 33217c478bd9Sstevel@tonic-gate * mntinfo4_list will be valid. 
33227c478bd9Sstevel@tonic-gate */ 33237c478bd9Sstevel@tonic-gate if (!in_list) 33247c478bd9Sstevel@tonic-gate VFS_HOLD(mi->mi_vfsp); 33257c478bd9Sstevel@tonic-gate 33267c478bd9Sstevel@tonic-gate NFS4_DEBUG(nfs4_client_lease_debug, (CE_NOTE, "nfs4_add_mi_to_server: " 3327b9238976Sth "hold vfs %p for mi: %p", (void*)mi->mi_vfsp, (void*)mi)); 33287c478bd9Sstevel@tonic-gate 33297c478bd9Sstevel@tonic-gate if (!in_list) { 33307c478bd9Sstevel@tonic-gate if (sp->mntinfo4_list) 33317c478bd9Sstevel@tonic-gate sp->mntinfo4_list->mi_clientid_prev = mi; 33327c478bd9Sstevel@tonic-gate mi->mi_clientid_next = sp->mntinfo4_list; 33333b895386SPavel Filipensky mi->mi_srv = sp; 33347c478bd9Sstevel@tonic-gate sp->mntinfo4_list = mi; 33357c478bd9Sstevel@tonic-gate mi->mi_srvsettime = gethrestime_sec(); 33363b895386SPavel Filipensky mi->mi_srvset_cnt++; 33377c478bd9Sstevel@tonic-gate } 33387c478bd9Sstevel@tonic-gate 33397c478bd9Sstevel@tonic-gate /* set mi's clientid to that of sp's for later matching */ 33407c478bd9Sstevel@tonic-gate mi->mi_clientid = sp->clientid; 33417c478bd9Sstevel@tonic-gate 33427c478bd9Sstevel@tonic-gate /* 33437c478bd9Sstevel@tonic-gate * Update the clientid for any other mi's belonging to sp. This 33447c478bd9Sstevel@tonic-gate * must be done here while we hold sp->s_lock, so that 33457c478bd9Sstevel@tonic-gate * find_nfs4_server() continues to work. 33467c478bd9Sstevel@tonic-gate */ 33477c478bd9Sstevel@tonic-gate 33487c478bd9Sstevel@tonic-gate for (tmi = sp->mntinfo4_list; 33497c478bd9Sstevel@tonic-gate tmi != NULL; 33507c478bd9Sstevel@tonic-gate tmi = tmi->mi_clientid_next) { 33517c478bd9Sstevel@tonic-gate if (tmi != mi) { 33527c478bd9Sstevel@tonic-gate tmi->mi_clientid = sp->clientid; 33537c478bd9Sstevel@tonic-gate } 33547c478bd9Sstevel@tonic-gate } 33557c478bd9Sstevel@tonic-gate } 33567c478bd9Sstevel@tonic-gate 33577c478bd9Sstevel@tonic-gate /* 33587c478bd9Sstevel@tonic-gate * Remove the mi from sp's mntinfo4_list and release its reference. 
33597c478bd9Sstevel@tonic-gate * Exception: if mi still has open files, flag it for later removal (when 33607c478bd9Sstevel@tonic-gate * all the files are closed). 33617c478bd9Sstevel@tonic-gate * 33627c478bd9Sstevel@tonic-gate * If this is the last mntinfo4 in sp's list then tell the lease renewal 33637c478bd9Sstevel@tonic-gate * thread to exit. 33647c478bd9Sstevel@tonic-gate */ 33657c478bd9Sstevel@tonic-gate static void 33667c478bd9Sstevel@tonic-gate nfs4_remove_mi_from_server_nolock(mntinfo4_t *mi, nfs4_server_t *sp) 33677c478bd9Sstevel@tonic-gate { 33687c478bd9Sstevel@tonic-gate NFS4_DEBUG(nfs4_client_lease_debug, (CE_NOTE, 3369b9238976Sth "nfs4_remove_mi_from_server_nolock: remove mi %p from sp %p", 3370b9238976Sth (void*)mi, (void*)sp)); 33717c478bd9Sstevel@tonic-gate 33727c478bd9Sstevel@tonic-gate ASSERT(sp != NULL); 33737c478bd9Sstevel@tonic-gate ASSERT(MUTEX_HELD(&sp->s_lock)); 33747c478bd9Sstevel@tonic-gate ASSERT(mi->mi_open_files >= 0); 33757c478bd9Sstevel@tonic-gate 33767c478bd9Sstevel@tonic-gate /* 33777c478bd9Sstevel@tonic-gate * First make sure this mntinfo4 can be taken off of the list, 33787c478bd9Sstevel@tonic-gate * ie: it doesn't have any open files remaining. 
33797c478bd9Sstevel@tonic-gate */ 33807c478bd9Sstevel@tonic-gate if (mi->mi_open_files > 0) { 33817c478bd9Sstevel@tonic-gate NFS4_DEBUG(nfs4_client_lease_debug, (CE_NOTE, 3382b9238976Sth "nfs4_remove_mi_from_server_nolock: don't " 3383b9238976Sth "remove mi since it still has files open")); 33847c478bd9Sstevel@tonic-gate 33857c478bd9Sstevel@tonic-gate mutex_enter(&mi->mi_lock); 33867c478bd9Sstevel@tonic-gate mi->mi_flags |= MI4_REMOVE_ON_LAST_CLOSE; 33877c478bd9Sstevel@tonic-gate mutex_exit(&mi->mi_lock); 33887c478bd9Sstevel@tonic-gate return; 33897c478bd9Sstevel@tonic-gate } 33907c478bd9Sstevel@tonic-gate 339150a83466Sjwahlig VFS_HOLD(mi->mi_vfsp); 33927c478bd9Sstevel@tonic-gate remove_mi(sp, mi); 339350a83466Sjwahlig VFS_RELE(mi->mi_vfsp); 33947c478bd9Sstevel@tonic-gate 33957c478bd9Sstevel@tonic-gate if (sp->mntinfo4_list == NULL) { 33967c478bd9Sstevel@tonic-gate /* last fs unmounted, kill the thread */ 33977c478bd9Sstevel@tonic-gate NFS4_DEBUG(nfs4_client_lease_debug, (CE_NOTE, 3398b9238976Sth "remove_mi_from_nfs4_server_nolock: kill the thread")); 33997c478bd9Sstevel@tonic-gate nfs4_mark_srv_dead(sp); 34007c478bd9Sstevel@tonic-gate } 34017c478bd9Sstevel@tonic-gate } 34027c478bd9Sstevel@tonic-gate 34037c478bd9Sstevel@tonic-gate /* 34047c478bd9Sstevel@tonic-gate * Remove mi from sp's mntinfo4_list and release the vfs reference. 34057c478bd9Sstevel@tonic-gate */ 34067c478bd9Sstevel@tonic-gate static void 34077c478bd9Sstevel@tonic-gate remove_mi(nfs4_server_t *sp, mntinfo4_t *mi) 34087c478bd9Sstevel@tonic-gate { 34097c478bd9Sstevel@tonic-gate ASSERT(MUTEX_HELD(&sp->s_lock)); 34107c478bd9Sstevel@tonic-gate 34117c478bd9Sstevel@tonic-gate /* 34127c478bd9Sstevel@tonic-gate * We release a reference, and the caller must still have a 34137c478bd9Sstevel@tonic-gate * reference. 
34147c478bd9Sstevel@tonic-gate */ 34157c478bd9Sstevel@tonic-gate ASSERT(mi->mi_vfsp->vfs_count >= 2); 34167c478bd9Sstevel@tonic-gate 34177c478bd9Sstevel@tonic-gate if (mi->mi_clientid_prev) { 34187c478bd9Sstevel@tonic-gate mi->mi_clientid_prev->mi_clientid_next = mi->mi_clientid_next; 34197c478bd9Sstevel@tonic-gate } else { 34207c478bd9Sstevel@tonic-gate /* This is the first mi in sp's mntinfo4_list */ 34217c478bd9Sstevel@tonic-gate /* 34227c478bd9Sstevel@tonic-gate * Make sure the first mntinfo4 in the list is the actual 34237c478bd9Sstevel@tonic-gate * mntinfo4 passed in. 34247c478bd9Sstevel@tonic-gate */ 34257c478bd9Sstevel@tonic-gate ASSERT(sp->mntinfo4_list == mi); 34267c478bd9Sstevel@tonic-gate 34277c478bd9Sstevel@tonic-gate sp->mntinfo4_list = mi->mi_clientid_next; 34287c478bd9Sstevel@tonic-gate } 34297c478bd9Sstevel@tonic-gate if (mi->mi_clientid_next) 34307c478bd9Sstevel@tonic-gate mi->mi_clientid_next->mi_clientid_prev = mi->mi_clientid_prev; 34317c478bd9Sstevel@tonic-gate 34327c478bd9Sstevel@tonic-gate /* Now mark the mntinfo4's links as being removed */ 34337c478bd9Sstevel@tonic-gate mi->mi_clientid_prev = mi->mi_clientid_next = NULL; 34343b895386SPavel Filipensky mi->mi_srv = NULL; 343522dc8f51SPavel Filipensky mi->mi_srvset_cnt++; 34367c478bd9Sstevel@tonic-gate 34377c478bd9Sstevel@tonic-gate VFS_RELE(mi->mi_vfsp); 34387c478bd9Sstevel@tonic-gate } 34397c478bd9Sstevel@tonic-gate 34407c478bd9Sstevel@tonic-gate /* 34417c478bd9Sstevel@tonic-gate * Free all the entries in sp's mntinfo4_list. 
34427c478bd9Sstevel@tonic-gate */ 34437c478bd9Sstevel@tonic-gate static void 34447c478bd9Sstevel@tonic-gate remove_all_mi(nfs4_server_t *sp) 34457c478bd9Sstevel@tonic-gate { 34467c478bd9Sstevel@tonic-gate mntinfo4_t *mi; 34477c478bd9Sstevel@tonic-gate 34487c478bd9Sstevel@tonic-gate ASSERT(MUTEX_HELD(&sp->s_lock)); 34497c478bd9Sstevel@tonic-gate 34507c478bd9Sstevel@tonic-gate while (sp->mntinfo4_list != NULL) { 34517c478bd9Sstevel@tonic-gate mi = sp->mntinfo4_list; 34527c478bd9Sstevel@tonic-gate /* 34537c478bd9Sstevel@tonic-gate * Grab a reference in case there is only one left (which 34547c478bd9Sstevel@tonic-gate * remove_mi() frees). 34557c478bd9Sstevel@tonic-gate */ 34567c478bd9Sstevel@tonic-gate VFS_HOLD(mi->mi_vfsp); 34577c478bd9Sstevel@tonic-gate remove_mi(sp, mi); 34587c478bd9Sstevel@tonic-gate VFS_RELE(mi->mi_vfsp); 34597c478bd9Sstevel@tonic-gate } 34607c478bd9Sstevel@tonic-gate } 34617c478bd9Sstevel@tonic-gate 34627c478bd9Sstevel@tonic-gate /* 34637c478bd9Sstevel@tonic-gate * Remove the mi from sp's mntinfo4_list as above, and rele the vfs. 34647c478bd9Sstevel@tonic-gate * 34657c478bd9Sstevel@tonic-gate * This version can be called with a null nfs4_server_t arg, 34667c478bd9Sstevel@tonic-gate * and will either find the right one and handle locking, or 34677c478bd9Sstevel@tonic-gate * do nothing because the mi wasn't added to an sp's mntinfo4_list. 
34687c478bd9Sstevel@tonic-gate */ 34697c478bd9Sstevel@tonic-gate void 34707c478bd9Sstevel@tonic-gate nfs4_remove_mi_from_server(mntinfo4_t *mi, nfs4_server_t *esp) 34717c478bd9Sstevel@tonic-gate { 34727c478bd9Sstevel@tonic-gate nfs4_server_t *sp; 34737c478bd9Sstevel@tonic-gate 34743b895386SPavel Filipensky if (esp) { 34753b895386SPavel Filipensky nfs4_remove_mi_from_server_nolock(mi, esp); 34763b895386SPavel Filipensky return; 34773b895386SPavel Filipensky } 34787c478bd9Sstevel@tonic-gate 34793b895386SPavel Filipensky (void) nfs_rw_enter_sig(&mi->mi_recovlock, RW_READER, 0); 348022dc8f51SPavel Filipensky if (sp = find_nfs4_server_all(mi, 1)) { 34817c478bd9Sstevel@tonic-gate nfs4_remove_mi_from_server_nolock(mi, sp); 34823b895386SPavel Filipensky mutex_exit(&sp->s_lock); 348322dc8f51SPavel Filipensky nfs4_server_rele(sp); 34847c478bd9Sstevel@tonic-gate } 34853b895386SPavel Filipensky nfs_rw_exit(&mi->mi_recovlock); 34867c478bd9Sstevel@tonic-gate } 34877c478bd9Sstevel@tonic-gate 34887c478bd9Sstevel@tonic-gate /* 34897c478bd9Sstevel@tonic-gate * Return TRUE if the given server has any non-unmounted filesystems. 
34907c478bd9Sstevel@tonic-gate */ 34917c478bd9Sstevel@tonic-gate 34927c478bd9Sstevel@tonic-gate bool_t 34937c478bd9Sstevel@tonic-gate nfs4_fs_active(nfs4_server_t *sp) 34947c478bd9Sstevel@tonic-gate { 34957c478bd9Sstevel@tonic-gate mntinfo4_t *mi; 34967c478bd9Sstevel@tonic-gate 34977c478bd9Sstevel@tonic-gate ASSERT(MUTEX_HELD(&sp->s_lock)); 34987c478bd9Sstevel@tonic-gate 34997c478bd9Sstevel@tonic-gate for (mi = sp->mntinfo4_list; mi != NULL; mi = mi->mi_clientid_next) { 35007c478bd9Sstevel@tonic-gate if (!(mi->mi_vfsp->vfs_flag & VFS_UNMOUNTED)) 35017c478bd9Sstevel@tonic-gate return (TRUE); 35027c478bd9Sstevel@tonic-gate } 35037c478bd9Sstevel@tonic-gate 35047c478bd9Sstevel@tonic-gate return (FALSE); 35057c478bd9Sstevel@tonic-gate } 35067c478bd9Sstevel@tonic-gate 35077c478bd9Sstevel@tonic-gate /* 35087c478bd9Sstevel@tonic-gate * Mark sp as finished and notify any waiters. 35097c478bd9Sstevel@tonic-gate */ 35107c478bd9Sstevel@tonic-gate 35117c478bd9Sstevel@tonic-gate void 35127c478bd9Sstevel@tonic-gate nfs4_mark_srv_dead(nfs4_server_t *sp) 35137c478bd9Sstevel@tonic-gate { 35147c478bd9Sstevel@tonic-gate ASSERT(MUTEX_HELD(&sp->s_lock)); 35157c478bd9Sstevel@tonic-gate 35167c478bd9Sstevel@tonic-gate sp->s_thread_exit = NFS4_THREAD_EXIT; 35177c478bd9Sstevel@tonic-gate cv_broadcast(&sp->cv_thread_exit); 35187c478bd9Sstevel@tonic-gate } 35197c478bd9Sstevel@tonic-gate 35207c478bd9Sstevel@tonic-gate /* 35217c478bd9Sstevel@tonic-gate * Create a new nfs4_server_t structure. 35227c478bd9Sstevel@tonic-gate * Returns new node unlocked and not in list, but with a reference count of 35237c478bd9Sstevel@tonic-gate * 1. 
35247c478bd9Sstevel@tonic-gate */ 35257c478bd9Sstevel@tonic-gate struct nfs4_server * 35267c478bd9Sstevel@tonic-gate new_nfs4_server(struct servinfo4 *svp, cred_t *cr) 35277c478bd9Sstevel@tonic-gate { 35287c478bd9Sstevel@tonic-gate struct nfs4_server *np; 35297c478bd9Sstevel@tonic-gate timespec_t tt; 35307c478bd9Sstevel@tonic-gate union { 35317c478bd9Sstevel@tonic-gate struct { 35327c478bd9Sstevel@tonic-gate uint32_t sec; 35337c478bd9Sstevel@tonic-gate uint32_t subsec; 35347c478bd9Sstevel@tonic-gate } un_curtime; 35357c478bd9Sstevel@tonic-gate verifier4 un_verifier; 35367c478bd9Sstevel@tonic-gate } nfs4clientid_verifier; 35377c478bd9Sstevel@tonic-gate char id_val[] = "Solaris: %s, NFSv4 kernel client"; 35387c478bd9Sstevel@tonic-gate int len; 35397c478bd9Sstevel@tonic-gate 35407c478bd9Sstevel@tonic-gate np = kmem_zalloc(sizeof (struct nfs4_server), KM_SLEEP); 35417c478bd9Sstevel@tonic-gate np->saddr.len = svp->sv_addr.len; 35427c478bd9Sstevel@tonic-gate np->saddr.maxlen = svp->sv_addr.maxlen; 35437c478bd9Sstevel@tonic-gate np->saddr.buf = kmem_alloc(svp->sv_addr.maxlen, KM_SLEEP); 35447c478bd9Sstevel@tonic-gate bcopy(svp->sv_addr.buf, np->saddr.buf, svp->sv_addr.len); 35457c478bd9Sstevel@tonic-gate np->s_refcnt = 1; 35467c478bd9Sstevel@tonic-gate 35477c478bd9Sstevel@tonic-gate /* 35487c478bd9Sstevel@tonic-gate * Build the nfs_client_id4 for this server mount. Ensure 35497c478bd9Sstevel@tonic-gate * the verifier is useful and that the identification is 35507c478bd9Sstevel@tonic-gate * somehow based on the server's address for the case of 35517c478bd9Sstevel@tonic-gate * multi-homed servers. 
35527c478bd9Sstevel@tonic-gate */ 35537c478bd9Sstevel@tonic-gate nfs4clientid_verifier.un_verifier = 0; 35547c478bd9Sstevel@tonic-gate gethrestime(&tt); 35557c478bd9Sstevel@tonic-gate nfs4clientid_verifier.un_curtime.sec = (uint32_t)tt.tv_sec; 35567c478bd9Sstevel@tonic-gate nfs4clientid_verifier.un_curtime.subsec = (uint32_t)tt.tv_nsec; 35577c478bd9Sstevel@tonic-gate np->clidtosend.verifier = nfs4clientid_verifier.un_verifier; 35587c478bd9Sstevel@tonic-gate 35597c478bd9Sstevel@tonic-gate /* 35607c478bd9Sstevel@tonic-gate * calculate the length of the opaque identifier. Subtract 2 35617c478bd9Sstevel@tonic-gate * for the "%s" and add the traditional +1 for null 35627c478bd9Sstevel@tonic-gate * termination. 35637c478bd9Sstevel@tonic-gate */ 35647c478bd9Sstevel@tonic-gate len = strlen(id_val) - 2 + strlen(uts_nodename()) + 1; 35657c478bd9Sstevel@tonic-gate np->clidtosend.id_len = len + np->saddr.maxlen; 35667c478bd9Sstevel@tonic-gate 35677c478bd9Sstevel@tonic-gate np->clidtosend.id_val = kmem_alloc(np->clidtosend.id_len, KM_SLEEP); 35687c478bd9Sstevel@tonic-gate (void) sprintf(np->clidtosend.id_val, id_val, uts_nodename()); 35697c478bd9Sstevel@tonic-gate bcopy(np->saddr.buf, &np->clidtosend.id_val[len], np->saddr.len); 35707c478bd9Sstevel@tonic-gate 35717c478bd9Sstevel@tonic-gate np->s_flags = 0; 35727c478bd9Sstevel@tonic-gate np->mntinfo4_list = NULL; 35737c478bd9Sstevel@tonic-gate /* save cred for issuing rfs4calls inside the renew thread */ 35747c478bd9Sstevel@tonic-gate crhold(cr); 35757c478bd9Sstevel@tonic-gate np->s_cred = cr; 35767c478bd9Sstevel@tonic-gate cv_init(&np->cv_thread_exit, NULL, CV_DEFAULT, NULL); 35777c478bd9Sstevel@tonic-gate mutex_init(&np->s_lock, NULL, MUTEX_DEFAULT, NULL); 35787c478bd9Sstevel@tonic-gate nfs_rw_init(&np->s_recovlock, NULL, RW_DEFAULT, NULL); 35797c478bd9Sstevel@tonic-gate list_create(&np->s_deleg_list, sizeof (rnode4_t), 35807c478bd9Sstevel@tonic-gate offsetof(rnode4_t, r_deleg_link)); 35817c478bd9Sstevel@tonic-gate 
np->s_thread_exit = 0; 35827c478bd9Sstevel@tonic-gate np->state_ref_count = 0; 35837c478bd9Sstevel@tonic-gate np->lease_valid = NFS4_LEASE_NOT_STARTED; 35847c478bd9Sstevel@tonic-gate cv_init(&np->s_cv_otw_count, NULL, CV_DEFAULT, NULL); 3585f86c6ccaSdm cv_init(&np->s_clientid_pend, NULL, CV_DEFAULT, NULL); 35867c478bd9Sstevel@tonic-gate np->s_otw_call_count = 0; 35877c478bd9Sstevel@tonic-gate cv_init(&np->wait_cb_null, NULL, CV_DEFAULT, NULL); 35887c478bd9Sstevel@tonic-gate np->zoneid = getzoneid(); 35897c478bd9Sstevel@tonic-gate np->zone_globals = nfs4_get_callback_globals(); 35907c478bd9Sstevel@tonic-gate ASSERT(np->zone_globals != NULL); 35917c478bd9Sstevel@tonic-gate return (np); 35927c478bd9Sstevel@tonic-gate } 35937c478bd9Sstevel@tonic-gate 35947c478bd9Sstevel@tonic-gate /* 35957c478bd9Sstevel@tonic-gate * Create a new nfs4_server_t structure and add it to the list. 35967c478bd9Sstevel@tonic-gate * Returns new node locked; reference must eventually be freed. 35977c478bd9Sstevel@tonic-gate */ 35987c478bd9Sstevel@tonic-gate static struct nfs4_server * 35997c478bd9Sstevel@tonic-gate add_new_nfs4_server(struct servinfo4 *svp, cred_t *cr) 36007c478bd9Sstevel@tonic-gate { 36017c478bd9Sstevel@tonic-gate nfs4_server_t *sp; 36027c478bd9Sstevel@tonic-gate 36037c478bd9Sstevel@tonic-gate ASSERT(MUTEX_HELD(&nfs4_server_lst_lock)); 36047c478bd9Sstevel@tonic-gate sp = new_nfs4_server(svp, cr); 36057c478bd9Sstevel@tonic-gate mutex_enter(&sp->s_lock); 36067c478bd9Sstevel@tonic-gate insque(sp, &nfs4_server_lst); 36077c478bd9Sstevel@tonic-gate sp->s_refcnt++; /* list gets a reference */ 3608f64c4ae1Sdm sp->s_flags |= N4S_INSERTED; 36097c478bd9Sstevel@tonic-gate sp->clientid = 0; 36107c478bd9Sstevel@tonic-gate return (sp); 36117c478bd9Sstevel@tonic-gate } 36127c478bd9Sstevel@tonic-gate 36137c478bd9Sstevel@tonic-gate int nfs4_server_t_debug = 0; 36147c478bd9Sstevel@tonic-gate 36157c478bd9Sstevel@tonic-gate #ifdef lint 36167c478bd9Sstevel@tonic-gate extern void 
36177c478bd9Sstevel@tonic-gate dumpnfs4slist(char *, mntinfo4_t *, clientid4, servinfo4_t *); 36187c478bd9Sstevel@tonic-gate #endif 36197c478bd9Sstevel@tonic-gate 36207c478bd9Sstevel@tonic-gate #ifndef lint 36217c478bd9Sstevel@tonic-gate #ifdef DEBUG 36227c478bd9Sstevel@tonic-gate void 36237c478bd9Sstevel@tonic-gate dumpnfs4slist(char *txt, mntinfo4_t *mi, clientid4 clientid, servinfo4_t *srv_p) 36247c478bd9Sstevel@tonic-gate { 36257c478bd9Sstevel@tonic-gate int hash16(void *p, int len); 36267c478bd9Sstevel@tonic-gate nfs4_server_t *np; 36277c478bd9Sstevel@tonic-gate 36287c478bd9Sstevel@tonic-gate NFS4_DEBUG(nfs4_server_t_debug, (CE_NOTE, 36297c478bd9Sstevel@tonic-gate "dumping nfs4_server_t list in %s", txt)); 36307c478bd9Sstevel@tonic-gate NFS4_DEBUG(nfs4_server_t_debug, (CE_CONT, 36317c478bd9Sstevel@tonic-gate "mi 0x%p, want clientid %llx, addr %d/%04X", 36327c478bd9Sstevel@tonic-gate mi, (longlong_t)clientid, srv_p->sv_addr.len, 36337c478bd9Sstevel@tonic-gate hash16((void *)srv_p->sv_addr.buf, srv_p->sv_addr.len))); 36347c478bd9Sstevel@tonic-gate for (np = nfs4_server_lst.forw; np != &nfs4_server_lst; 36357c478bd9Sstevel@tonic-gate np = np->forw) { 36367c478bd9Sstevel@tonic-gate NFS4_DEBUG(nfs4_server_t_debug, (CE_CONT, 36377c478bd9Sstevel@tonic-gate "node 0x%p, clientid %llx, addr %d/%04X, cnt %d", 36387c478bd9Sstevel@tonic-gate np, (longlong_t)np->clientid, np->saddr.len, 36397c478bd9Sstevel@tonic-gate hash16((void *)np->saddr.buf, np->saddr.len), 36407c478bd9Sstevel@tonic-gate np->state_ref_count)); 36417c478bd9Sstevel@tonic-gate if (np->saddr.len == srv_p->sv_addr.len && 36427c478bd9Sstevel@tonic-gate bcmp(np->saddr.buf, srv_p->sv_addr.buf, 36437c478bd9Sstevel@tonic-gate np->saddr.len) == 0) 36447c478bd9Sstevel@tonic-gate NFS4_DEBUG(nfs4_server_t_debug, (CE_CONT, 36457c478bd9Sstevel@tonic-gate " - address matches")); 36467c478bd9Sstevel@tonic-gate if (np->clientid == clientid || np->clientid == 0) 36477c478bd9Sstevel@tonic-gate 
NFS4_DEBUG(nfs4_server_t_debug, (CE_CONT, 36487c478bd9Sstevel@tonic-gate " - clientid matches")); 36497c478bd9Sstevel@tonic-gate if (np->s_thread_exit != NFS4_THREAD_EXIT) 36507c478bd9Sstevel@tonic-gate NFS4_DEBUG(nfs4_server_t_debug, (CE_CONT, 36517c478bd9Sstevel@tonic-gate " - thread not exiting")); 36527c478bd9Sstevel@tonic-gate } 36537c478bd9Sstevel@tonic-gate delay(hz); 36547c478bd9Sstevel@tonic-gate } 36557c478bd9Sstevel@tonic-gate #endif 36567c478bd9Sstevel@tonic-gate #endif 36577c478bd9Sstevel@tonic-gate 36587c478bd9Sstevel@tonic-gate 36597c478bd9Sstevel@tonic-gate /* 36607c478bd9Sstevel@tonic-gate * Move a mntinfo4_t from one server list to another. 36617c478bd9Sstevel@tonic-gate * Locking of the two nfs4_server_t nodes will be done in list order. 36627c478bd9Sstevel@tonic-gate * 36637c478bd9Sstevel@tonic-gate * Returns NULL if the current nfs4_server_t for the filesystem could not 36647c478bd9Sstevel@tonic-gate * be found (e.g., due to forced unmount). Otherwise returns a reference 36657c478bd9Sstevel@tonic-gate * to the new nfs4_server_t, which must eventually be freed. 
*/
nfs4_server_t *
nfs4_move_mi(mntinfo4_t *mi, servinfo4_t *old, servinfo4_t *new)
{
	nfs4_server_t *p, *op = NULL, *np = NULL;
	int num_open;
	zoneid_t zoneid = nfs_zoneid();

	ASSERT(nfs_zone() == mi->mi_zone);

	mutex_enter(&nfs4_server_lst_lock);
#ifdef DEBUG
	if (nfs4_server_t_debug)
		dumpnfs4slist("nfs4_move_mi", mi, (clientid4)0, new);
#endif
	/*
	 * One pass over the list finds both the old server (op) and the new
	 * server (np), matching on zone and address and skipping nodes whose
	 * renew thread is exiting.  Each match is locked as it is found, so
	 * the two s_locks are taken in list order.  op is referenced here;
	 * np is referenced after the loop.
	 *
	 * NOTE(review): a node whose address matches both old and new would
	 * have its s_lock entered twice here; presumably callers never pass
	 * the same address for both -- confirm.
	 */
	for (p = nfs4_server_lst.forw; p != &nfs4_server_lst; p = p->forw) {
		if (p->zoneid != zoneid)
			continue;
		if (p->saddr.len == old->sv_addr.len &&
		    bcmp(p->saddr.buf, old->sv_addr.buf, p->saddr.len) == 0 &&
		    p->s_thread_exit != NFS4_THREAD_EXIT) {
			op = p;
			mutex_enter(&op->s_lock);
			op->s_refcnt++;
		}
		if (p->saddr.len == new->sv_addr.len &&
		    bcmp(p->saddr.buf, new->sv_addr.buf, p->saddr.len) == 0 &&
		    p->s_thread_exit != NFS4_THREAD_EXIT) {
			np = p;
			mutex_enter(&np->s_lock);
		}
		if (op != NULL && np != NULL)
			break;
	}
	if (op == NULL) {
		/*
		 * Filesystem has been forcibly unmounted.  Bail out.
		 * np has only been locked so far (no reference taken), so
		 * unlocking it is all the cleanup that is needed.
		 */
		if (np != NULL)
			mutex_exit(&np->s_lock);
		mutex_exit(&nfs4_server_lst_lock);
		return (NULL);
	}
	if (np != NULL) {
		/* Existing target: take the reference handed to the caller. */
		np->s_refcnt++;
	} else {
#ifdef DEBUG
		NFS4_DEBUG(nfs4_client_failover_debug, (CE_NOTE,
		    "nfs4_move_mi: no target nfs4_server, will create."));
#endif
		/*
		 * No target yet: create one and insert it in the list.  It
		 * is returned locked, with references for both the list and
		 * this caller.
		 */
		np = add_new_nfs4_server(new, kcred);
	}
	mutex_exit(&nfs4_server_lst_lock);

	NFS4_DEBUG(nfs4_client_failover_debug, (CE_NOTE,
	    "nfs4_move_mi: for mi 0x%p, "
	    "old servinfo4 0x%p, new servinfo4 0x%p, "
	    "old nfs4_server 0x%p, new nfs4_server 0x%p, ",
	    (void*)mi, (void*)old, (void*)new,
	    (void*)op, (void*)np));
	ASSERT(op != NULL && np != NULL);

	/* discard any delegations */
	nfs4_deleg_discard(mi, op);

	/*
	 * Transfer mi's open-file count from op's state_ref_count to np's.
	 * mi_open_files is zeroed around the removal because
	 * nfs4_remove_mi_from_server_nolock() only flags the mi for later
	 * removal when it still shows open files; the real count is
	 * restored right after.
	 */
	num_open = mi->mi_open_files;
	mi->mi_open_files = 0;
	op->state_ref_count -= num_open;
	ASSERT(op->state_ref_count >= 0);
	np->state_ref_count += num_open;
	nfs4_remove_mi_from_server_nolock(mi, op);
	mi->mi_open_files = num_open;
	NFS4_DEBUG(nfs4_client_failover_debug, (CE_NOTE,
	    "nfs4_move_mi: mi_open_files %d, op->cnt %d, np->cnt %d",
	    mi->mi_open_files, op->state_ref_count, np->state_ref_count));

	/* Asserts that mi->mi_recovlock is held (reader or writer). */
	nfs4_add_mi_to_server(np, mi);

	/*
	 * Unlock both servers and drop the reference taken on op in the
	 * search loop.  np keeps its reference; it is returned to the caller.
	 */
	mutex_exit(&op->s_lock);
	mutex_exit(&np->s_lock);
	nfs4_server_rele(op);

	return (np);
}

/*
 * Need to have the nfs4_server_lst_lock.
 * Search the nfs4_server list to find a match on this servinfo4
 * based on its address.
 *
 * Returns NULL if no match is found.  Otherwise returns a reference (which
 * must eventually be freed) to a locked nfs4_server.
37587c478bd9Sstevel@tonic-gate */ 37597c478bd9Sstevel@tonic-gate nfs4_server_t * 37607c478bd9Sstevel@tonic-gate servinfo4_to_nfs4_server(servinfo4_t *srv_p) 37617c478bd9Sstevel@tonic-gate { 37627c478bd9Sstevel@tonic-gate nfs4_server_t *np; 3763108322fbScarlsonj zoneid_t zoneid = nfs_zoneid(); 37647c478bd9Sstevel@tonic-gate 3765f86c6ccaSdm ASSERT(MUTEX_HELD(&nfs4_server_lst_lock)); 37667c478bd9Sstevel@tonic-gate for (np = nfs4_server_lst.forw; np != &nfs4_server_lst; np = np->forw) { 37677c478bd9Sstevel@tonic-gate if (np->zoneid == zoneid && 37687c478bd9Sstevel@tonic-gate np->saddr.len == srv_p->sv_addr.len && 37697c478bd9Sstevel@tonic-gate bcmp(np->saddr.buf, srv_p->sv_addr.buf, 3770b9238976Sth np->saddr.len) == 0 && 37717c478bd9Sstevel@tonic-gate np->s_thread_exit != NFS4_THREAD_EXIT) { 37727c478bd9Sstevel@tonic-gate mutex_enter(&np->s_lock); 37737c478bd9Sstevel@tonic-gate np->s_refcnt++; 37747c478bd9Sstevel@tonic-gate return (np); 37757c478bd9Sstevel@tonic-gate } 37767c478bd9Sstevel@tonic-gate } 37777c478bd9Sstevel@tonic-gate return (NULL); 37787c478bd9Sstevel@tonic-gate } 37797c478bd9Sstevel@tonic-gate 37807c478bd9Sstevel@tonic-gate /* 37817c478bd9Sstevel@tonic-gate * Locks the nfs4_server down if it is found and returns a reference that 37827c478bd9Sstevel@tonic-gate * must eventually be freed. 
378322dc8f51SPavel Filipensky */ 378422dc8f51SPavel Filipensky static nfs4_server_t * 378522dc8f51SPavel Filipensky lookup_nfs4_server(nfs4_server_t *sp, int any_state) 378622dc8f51SPavel Filipensky { 378722dc8f51SPavel Filipensky nfs4_server_t *np; 378822dc8f51SPavel Filipensky 378922dc8f51SPavel Filipensky mutex_enter(&nfs4_server_lst_lock); 379022dc8f51SPavel Filipensky for (np = nfs4_server_lst.forw; np != &nfs4_server_lst; np = np->forw) { 379122dc8f51SPavel Filipensky mutex_enter(&np->s_lock); 379222dc8f51SPavel Filipensky if (np == sp && np->s_refcnt > 0 && 379322dc8f51SPavel Filipensky (np->s_thread_exit != NFS4_THREAD_EXIT || any_state)) { 379422dc8f51SPavel Filipensky mutex_exit(&nfs4_server_lst_lock); 379522dc8f51SPavel Filipensky np->s_refcnt++; 379622dc8f51SPavel Filipensky return (np); 379722dc8f51SPavel Filipensky } 379822dc8f51SPavel Filipensky mutex_exit(&np->s_lock); 379922dc8f51SPavel Filipensky } 380022dc8f51SPavel Filipensky mutex_exit(&nfs4_server_lst_lock); 380122dc8f51SPavel Filipensky 380222dc8f51SPavel Filipensky return (NULL); 380322dc8f51SPavel Filipensky } 380422dc8f51SPavel Filipensky 380522dc8f51SPavel Filipensky /* 38067c478bd9Sstevel@tonic-gate * The caller should be holding mi->mi_recovlock, and it should continue to 38077c478bd9Sstevel@tonic-gate * hold the lock until done with the returned nfs4_server_t. Once 38087c478bd9Sstevel@tonic-gate * mi->mi_recovlock is released, there is no guarantee that the returned 38097c478bd9Sstevel@tonic-gate * mi->nfs4_server_t will continue to correspond to mi. 
38107c478bd9Sstevel@tonic-gate */ 38117c478bd9Sstevel@tonic-gate nfs4_server_t * 38127c478bd9Sstevel@tonic-gate find_nfs4_server(mntinfo4_t *mi) 38137c478bd9Sstevel@tonic-gate { 381422dc8f51SPavel Filipensky ASSERT(nfs_rw_lock_held(&mi->mi_recovlock, RW_READER) || 381522dc8f51SPavel Filipensky nfs_rw_lock_held(&mi->mi_recovlock, RW_WRITER)); 381622dc8f51SPavel Filipensky 381722dc8f51SPavel Filipensky return (lookup_nfs4_server(mi->mi_srv, 0)); 38187c478bd9Sstevel@tonic-gate } 38197c478bd9Sstevel@tonic-gate 38207c478bd9Sstevel@tonic-gate /* 382122dc8f51SPavel Filipensky * Same as above, but takes an "any_state" parameter which can be 38227c478bd9Sstevel@tonic-gate * set to 1 if the caller wishes to find nfs4_server_t's which 38237c478bd9Sstevel@tonic-gate * have been marked for termination by the exit of the renew 38247c478bd9Sstevel@tonic-gate * thread. This should only be used by operations which are 38257c478bd9Sstevel@tonic-gate * cleaning up and will not cause an OTW op. 38267c478bd9Sstevel@tonic-gate */ 38277c478bd9Sstevel@tonic-gate nfs4_server_t * 382822dc8f51SPavel Filipensky find_nfs4_server_all(mntinfo4_t *mi, int any_state) 38297c478bd9Sstevel@tonic-gate { 38307c478bd9Sstevel@tonic-gate ASSERT(nfs_rw_lock_held(&mi->mi_recovlock, RW_READER) || 38317c478bd9Sstevel@tonic-gate nfs_rw_lock_held(&mi->mi_recovlock, RW_WRITER)); 38327c478bd9Sstevel@tonic-gate 383322dc8f51SPavel Filipensky return (lookup_nfs4_server(mi->mi_srv, any_state)); 383422dc8f51SPavel Filipensky } 383522dc8f51SPavel Filipensky 383622dc8f51SPavel Filipensky /* 383722dc8f51SPavel Filipensky * Lock sp, but only if it's still active (in the list and hasn't been 383822dc8f51SPavel Filipensky * flagged as exiting) or 'any_state' is non-zero. 383922dc8f51SPavel Filipensky * Returns TRUE if sp got locked and adds a reference to sp. 
384022dc8f51SPavel Filipensky */ 384122dc8f51SPavel Filipensky bool_t 384222dc8f51SPavel Filipensky nfs4_server_vlock(nfs4_server_t *sp, int any_state) 384322dc8f51SPavel Filipensky { 384422dc8f51SPavel Filipensky return (lookup_nfs4_server(sp, any_state) != NULL); 38457c478bd9Sstevel@tonic-gate } 38467c478bd9Sstevel@tonic-gate 38477c478bd9Sstevel@tonic-gate /* 38487c478bd9Sstevel@tonic-gate * Release the reference to sp and destroy it if that's the last one. 38497c478bd9Sstevel@tonic-gate */ 38507c478bd9Sstevel@tonic-gate 38517c478bd9Sstevel@tonic-gate void 38527c478bd9Sstevel@tonic-gate nfs4_server_rele(nfs4_server_t *sp) 38537c478bd9Sstevel@tonic-gate { 38547c478bd9Sstevel@tonic-gate mutex_enter(&sp->s_lock); 38557c478bd9Sstevel@tonic-gate ASSERT(sp->s_refcnt > 0); 38567c478bd9Sstevel@tonic-gate sp->s_refcnt--; 38577c478bd9Sstevel@tonic-gate if (sp->s_refcnt > 0) { 38587c478bd9Sstevel@tonic-gate mutex_exit(&sp->s_lock); 38597c478bd9Sstevel@tonic-gate return; 38607c478bd9Sstevel@tonic-gate } 38617c478bd9Sstevel@tonic-gate mutex_exit(&sp->s_lock); 3862f86c6ccaSdm 38637c478bd9Sstevel@tonic-gate mutex_enter(&nfs4_server_lst_lock); 38647c478bd9Sstevel@tonic-gate mutex_enter(&sp->s_lock); 38657c478bd9Sstevel@tonic-gate if (sp->s_refcnt > 0) { 38667c478bd9Sstevel@tonic-gate mutex_exit(&sp->s_lock); 38677c478bd9Sstevel@tonic-gate mutex_exit(&nfs4_server_lst_lock); 38687c478bd9Sstevel@tonic-gate return; 38697c478bd9Sstevel@tonic-gate } 3870f86c6ccaSdm remque(sp); 3871f86c6ccaSdm sp->forw = sp->back = NULL; 38727c478bd9Sstevel@tonic-gate mutex_exit(&nfs4_server_lst_lock); 38737c478bd9Sstevel@tonic-gate destroy_nfs4_server(sp); 38747c478bd9Sstevel@tonic-gate } 38757c478bd9Sstevel@tonic-gate 38767c478bd9Sstevel@tonic-gate static void 38777c478bd9Sstevel@tonic-gate destroy_nfs4_server(nfs4_server_t *sp) 38787c478bd9Sstevel@tonic-gate { 38797c478bd9Sstevel@tonic-gate ASSERT(MUTEX_HELD(&sp->s_lock)); 38807c478bd9Sstevel@tonic-gate ASSERT(sp->s_refcnt == 0); 
38817c478bd9Sstevel@tonic-gate ASSERT(sp->s_otw_call_count == 0); 38827c478bd9Sstevel@tonic-gate 38837c478bd9Sstevel@tonic-gate remove_all_mi(sp); 38847c478bd9Sstevel@tonic-gate 38857c478bd9Sstevel@tonic-gate crfree(sp->s_cred); 38867c478bd9Sstevel@tonic-gate kmem_free(sp->saddr.buf, sp->saddr.maxlen); 38877c478bd9Sstevel@tonic-gate kmem_free(sp->clidtosend.id_val, sp->clidtosend.id_len); 38887c478bd9Sstevel@tonic-gate mutex_exit(&sp->s_lock); 38897c478bd9Sstevel@tonic-gate 38907c478bd9Sstevel@tonic-gate /* destroy the nfs4_server */ 38917c478bd9Sstevel@tonic-gate nfs4callback_destroy(sp); 38927c478bd9Sstevel@tonic-gate list_destroy(&sp->s_deleg_list); 38937c478bd9Sstevel@tonic-gate mutex_destroy(&sp->s_lock); 38947c478bd9Sstevel@tonic-gate cv_destroy(&sp->cv_thread_exit); 38957c478bd9Sstevel@tonic-gate cv_destroy(&sp->s_cv_otw_count); 3896f86c6ccaSdm cv_destroy(&sp->s_clientid_pend); 38977c478bd9Sstevel@tonic-gate cv_destroy(&sp->wait_cb_null); 38987c478bd9Sstevel@tonic-gate nfs_rw_destroy(&sp->s_recovlock); 38997c478bd9Sstevel@tonic-gate kmem_free(sp, sizeof (*sp)); 39007c478bd9Sstevel@tonic-gate } 39017c478bd9Sstevel@tonic-gate 39027c478bd9Sstevel@tonic-gate /* 39037c478bd9Sstevel@tonic-gate * Fork off a thread to free the data structures for a mount. 
39047c478bd9Sstevel@tonic-gate */ 39057c478bd9Sstevel@tonic-gate 39067c478bd9Sstevel@tonic-gate static void 3907b9238976Sth async_free_mount(vfs_t *vfsp, int flag, cred_t *cr) 39087c478bd9Sstevel@tonic-gate { 39097c478bd9Sstevel@tonic-gate freemountargs_t *args; 39107c478bd9Sstevel@tonic-gate args = kmem_alloc(sizeof (freemountargs_t), KM_SLEEP); 39117c478bd9Sstevel@tonic-gate args->fm_vfsp = vfsp; 39127c478bd9Sstevel@tonic-gate VFS_HOLD(vfsp); 391350a83466Sjwahlig MI4_HOLD(VFTOMI4(vfsp)); 3914b9238976Sth args->fm_flag = flag; 39157c478bd9Sstevel@tonic-gate args->fm_cr = cr; 39167c478bd9Sstevel@tonic-gate crhold(cr); 39177c478bd9Sstevel@tonic-gate (void) zthread_create(NULL, 0, nfs4_free_mount_thread, args, 0, 39187c478bd9Sstevel@tonic-gate minclsyspri); 39197c478bd9Sstevel@tonic-gate } 39207c478bd9Sstevel@tonic-gate 39217c478bd9Sstevel@tonic-gate static void 39227c478bd9Sstevel@tonic-gate nfs4_free_mount_thread(freemountargs_t *args) 39237c478bd9Sstevel@tonic-gate { 392450a83466Sjwahlig mntinfo4_t *mi; 3925b9238976Sth nfs4_free_mount(args->fm_vfsp, args->fm_flag, args->fm_cr); 392650a83466Sjwahlig mi = VFTOMI4(args->fm_vfsp); 39277c478bd9Sstevel@tonic-gate crfree(args->fm_cr); 392850a83466Sjwahlig VFS_RELE(args->fm_vfsp); 392950a83466Sjwahlig MI4_RELE(mi); 39307c478bd9Sstevel@tonic-gate kmem_free(args, sizeof (freemountargs_t)); 39317c478bd9Sstevel@tonic-gate zthread_exit(); 39327c478bd9Sstevel@tonic-gate /* NOTREACHED */ 39337c478bd9Sstevel@tonic-gate } 39347c478bd9Sstevel@tonic-gate 39357c478bd9Sstevel@tonic-gate /* 39367c478bd9Sstevel@tonic-gate * Thread to free the data structures for a given filesystem. 
39377c478bd9Sstevel@tonic-gate */ 39387c478bd9Sstevel@tonic-gate static void 3939b9238976Sth nfs4_free_mount(vfs_t *vfsp, int flag, cred_t *cr) 39407c478bd9Sstevel@tonic-gate { 3941b9238976Sth mntinfo4_t *mi = VFTOMI4(vfsp); 3942b9238976Sth nfs4_server_t *sp; 3943b9238976Sth callb_cpr_t cpr_info; 3944b9238976Sth kmutex_t cpr_lock; 3945b9238976Sth boolean_t async_thread; 3946b9238976Sth int removed; 3947b9238976Sth 3948d3a14591SThomas Haynes bool_t must_unlock; 3949d708af74SThomas Haynes bool_t must_rele; 3950b9238976Sth nfs4_ephemeral_tree_t *eph_tree; 39517c478bd9Sstevel@tonic-gate 39527c478bd9Sstevel@tonic-gate /* 39537c478bd9Sstevel@tonic-gate * We need to participate in the CPR framework if this is a kernel 39547c478bd9Sstevel@tonic-gate * thread. 39557c478bd9Sstevel@tonic-gate */ 3956108322fbScarlsonj async_thread = (curproc == nfs_zone()->zone_zsched); 39577c478bd9Sstevel@tonic-gate if (async_thread) { 39587c478bd9Sstevel@tonic-gate mutex_init(&cpr_lock, NULL, MUTEX_DEFAULT, NULL); 39597c478bd9Sstevel@tonic-gate CALLB_CPR_INIT(&cpr_info, &cpr_lock, callb_generic_cpr, 39607c478bd9Sstevel@tonic-gate "nfsv4AsyncUnmount"); 39617c478bd9Sstevel@tonic-gate } 39627c478bd9Sstevel@tonic-gate 39637c478bd9Sstevel@tonic-gate /* 39647c478bd9Sstevel@tonic-gate * We need to wait for all outstanding OTW calls 39657c478bd9Sstevel@tonic-gate * and recovery to finish before we remove the mi 39667c478bd9Sstevel@tonic-gate * from the nfs4_server_t, as current pending 39677c478bd9Sstevel@tonic-gate * calls might still need this linkage (in order 39687c478bd9Sstevel@tonic-gate * to find a nfs4_server_t from a mntinfo4_t). 
39697c478bd9Sstevel@tonic-gate */ 39707c478bd9Sstevel@tonic-gate (void) nfs_rw_enter_sig(&mi->mi_recovlock, RW_READER, FALSE); 39717c478bd9Sstevel@tonic-gate sp = find_nfs4_server(mi); 39727c478bd9Sstevel@tonic-gate nfs_rw_exit(&mi->mi_recovlock); 39737c478bd9Sstevel@tonic-gate 39747c478bd9Sstevel@tonic-gate if (sp) { 39757c478bd9Sstevel@tonic-gate while (sp->s_otw_call_count != 0) { 39767c478bd9Sstevel@tonic-gate if (async_thread) { 39777c478bd9Sstevel@tonic-gate mutex_enter(&cpr_lock); 39787c478bd9Sstevel@tonic-gate CALLB_CPR_SAFE_BEGIN(&cpr_info); 39797c478bd9Sstevel@tonic-gate mutex_exit(&cpr_lock); 39807c478bd9Sstevel@tonic-gate } 39817c478bd9Sstevel@tonic-gate cv_wait(&sp->s_cv_otw_count, &sp->s_lock); 39827c478bd9Sstevel@tonic-gate if (async_thread) { 39837c478bd9Sstevel@tonic-gate mutex_enter(&cpr_lock); 39847c478bd9Sstevel@tonic-gate CALLB_CPR_SAFE_END(&cpr_info, &cpr_lock); 39857c478bd9Sstevel@tonic-gate mutex_exit(&cpr_lock); 39867c478bd9Sstevel@tonic-gate } 39877c478bd9Sstevel@tonic-gate } 39887c478bd9Sstevel@tonic-gate mutex_exit(&sp->s_lock); 39897c478bd9Sstevel@tonic-gate nfs4_server_rele(sp); 39907c478bd9Sstevel@tonic-gate sp = NULL; 39917c478bd9Sstevel@tonic-gate } 39927c478bd9Sstevel@tonic-gate 39937c478bd9Sstevel@tonic-gate mutex_enter(&mi->mi_lock); 39947c478bd9Sstevel@tonic-gate while (mi->mi_in_recovery != 0) { 39957c478bd9Sstevel@tonic-gate if (async_thread) { 39967c478bd9Sstevel@tonic-gate mutex_enter(&cpr_lock); 39977c478bd9Sstevel@tonic-gate CALLB_CPR_SAFE_BEGIN(&cpr_info); 39987c478bd9Sstevel@tonic-gate mutex_exit(&cpr_lock); 39997c478bd9Sstevel@tonic-gate } 40007c478bd9Sstevel@tonic-gate cv_wait(&mi->mi_cv_in_recov, &mi->mi_lock); 40017c478bd9Sstevel@tonic-gate if (async_thread) { 40027c478bd9Sstevel@tonic-gate mutex_enter(&cpr_lock); 40037c478bd9Sstevel@tonic-gate CALLB_CPR_SAFE_END(&cpr_info, &cpr_lock); 40047c478bd9Sstevel@tonic-gate mutex_exit(&cpr_lock); 40057c478bd9Sstevel@tonic-gate } 40067c478bd9Sstevel@tonic-gate } 
40077c478bd9Sstevel@tonic-gate mutex_exit(&mi->mi_lock); 40087c478bd9Sstevel@tonic-gate 4009eabd0450Sth /* 4010eabd0450Sth * If we got an error, then do not nuke the 4011eabd0450Sth * tree. Either the harvester is busy reclaiming 4012eabd0450Sth * this node or we ran into some busy condition. 4013eabd0450Sth * 4014eabd0450Sth * The harvester will eventually come along and cleanup. 4015eabd0450Sth * The only problem would be the root mount point. 4016eabd0450Sth * 4017eabd0450Sth * Since the busy node can occur for a variety 4018eabd0450Sth * of reasons and can result in an entry staying 4019eabd0450Sth * in df output but no longer accessible from the 4020eabd0450Sth * directory tree, we are okay. 4021eabd0450Sth */ 4022eabd0450Sth if (!nfs4_ephemeral_umount(mi, flag, cr, 4023d708af74SThomas Haynes &must_unlock, &must_rele, &eph_tree)) 4024eabd0450Sth nfs4_ephemeral_umount_activate(mi, &must_unlock, 4025d708af74SThomas Haynes &must_rele, &eph_tree); 4026b9238976Sth 40277c478bd9Sstevel@tonic-gate /* 40287c478bd9Sstevel@tonic-gate * The original purge of the dnlc via 'dounmount' 40297c478bd9Sstevel@tonic-gate * doesn't guarantee that another dnlc entry was not 40307c478bd9Sstevel@tonic-gate * added while we waitied for all outstanding OTW 40317c478bd9Sstevel@tonic-gate * and recovery calls to finish. So re-purge the 40327c478bd9Sstevel@tonic-gate * dnlc now. 40337c478bd9Sstevel@tonic-gate */ 40347c478bd9Sstevel@tonic-gate (void) dnlc_purge_vfsp(vfsp, 0); 40357c478bd9Sstevel@tonic-gate 40367c478bd9Sstevel@tonic-gate /* 40377c478bd9Sstevel@tonic-gate * We need to explicitly stop the manager thread; the asyc worker 40387c478bd9Sstevel@tonic-gate * threads can timeout and exit on their own. 
40397c478bd9Sstevel@tonic-gate */ 404050a83466Sjwahlig mutex_enter(&mi->mi_async_lock); 404150a83466Sjwahlig mi->mi_max_threads = 0; 404250a83466Sjwahlig cv_broadcast(&mi->mi_async_work_cv); 404350a83466Sjwahlig mutex_exit(&mi->mi_async_lock); 404450a83466Sjwahlig if (mi->mi_manager_thread) 404550a83466Sjwahlig nfs4_async_manager_stop(vfsp); 40467c478bd9Sstevel@tonic-gate 40477c478bd9Sstevel@tonic-gate destroy_rtable4(vfsp, cr); 40487c478bd9Sstevel@tonic-gate 40497c478bd9Sstevel@tonic-gate nfs4_remove_mi_from_server(mi, NULL); 40507c478bd9Sstevel@tonic-gate 40517c478bd9Sstevel@tonic-gate if (async_thread) { 40527c478bd9Sstevel@tonic-gate mutex_enter(&cpr_lock); 40537c478bd9Sstevel@tonic-gate CALLB_CPR_EXIT(&cpr_info); /* drops cpr_lock */ 40547c478bd9Sstevel@tonic-gate mutex_destroy(&cpr_lock); 40557c478bd9Sstevel@tonic-gate } 405650a83466Sjwahlig 405750a83466Sjwahlig removed = nfs4_mi_zonelist_remove(mi); 405850a83466Sjwahlig if (removed) 405950a83466Sjwahlig zone_rele(mi->mi_zone); 40607c478bd9Sstevel@tonic-gate } 4061