17c478bd9Sstevel@tonic-gate /* 27c478bd9Sstevel@tonic-gate * CDDL HEADER START 37c478bd9Sstevel@tonic-gate * 47c478bd9Sstevel@tonic-gate * The contents of this file are subject to the terms of the 57c478bd9Sstevel@tonic-gate * Common Development and Distribution License, Version 1.0 only 67c478bd9Sstevel@tonic-gate * (the "License"). You may not use this file except in compliance 77c478bd9Sstevel@tonic-gate * with the License. 87c478bd9Sstevel@tonic-gate * 97c478bd9Sstevel@tonic-gate * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE 107c478bd9Sstevel@tonic-gate * or http://www.opensolaris.org/os/licensing. 117c478bd9Sstevel@tonic-gate * See the License for the specific language governing permissions 127c478bd9Sstevel@tonic-gate * and limitations under the License. 137c478bd9Sstevel@tonic-gate * 147c478bd9Sstevel@tonic-gate * When distributing Covered Code, include this CDDL HEADER in each 157c478bd9Sstevel@tonic-gate * file and include the License file at usr/src/OPENSOLARIS.LICENSE. 167c478bd9Sstevel@tonic-gate * If applicable, add the following below this CDDL HEADER, with the 177c478bd9Sstevel@tonic-gate * fields enclosed by brackets "[]" replaced with your own identifying 187c478bd9Sstevel@tonic-gate * information: Portions Copyright [yyyy] [name of copyright owner] 197c478bd9Sstevel@tonic-gate * 207c478bd9Sstevel@tonic-gate * CDDL HEADER END 217c478bd9Sstevel@tonic-gate */ 227c478bd9Sstevel@tonic-gate /* 237c478bd9Sstevel@tonic-gate * Copyright 2005 Sun Microsystems, Inc. All rights reserved. 247c478bd9Sstevel@tonic-gate * Use is subject to license terms. 257c478bd9Sstevel@tonic-gate */ 267c478bd9Sstevel@tonic-gate 277c478bd9Sstevel@tonic-gate /* 287c478bd9Sstevel@tonic-gate * Copyright (c) 1983,1984,1985,1986,1987,1988,1989 AT&T. 
297c478bd9Sstevel@tonic-gate * All Rights Reserved 307c478bd9Sstevel@tonic-gate */ 317c478bd9Sstevel@tonic-gate 327c478bd9Sstevel@tonic-gate #pragma ident "%Z%%M% %I% %E% SMI" 337c478bd9Sstevel@tonic-gate 347c478bd9Sstevel@tonic-gate #include <sys/param.h> 357c478bd9Sstevel@tonic-gate #include <sys/types.h> 367c478bd9Sstevel@tonic-gate #include <sys/systm.h> 377c478bd9Sstevel@tonic-gate #include <sys/cred.h> 387c478bd9Sstevel@tonic-gate #include <sys/vfs.h> 397c478bd9Sstevel@tonic-gate #include <sys/vnode.h> 407c478bd9Sstevel@tonic-gate #include <sys/pathname.h> 417c478bd9Sstevel@tonic-gate #include <sys/sysmacros.h> 427c478bd9Sstevel@tonic-gate #include <sys/kmem.h> 437c478bd9Sstevel@tonic-gate #include <sys/mkdev.h> 447c478bd9Sstevel@tonic-gate #include <sys/mount.h> 457c478bd9Sstevel@tonic-gate #include <sys/statvfs.h> 467c478bd9Sstevel@tonic-gate #include <sys/errno.h> 477c478bd9Sstevel@tonic-gate #include <sys/debug.h> 487c478bd9Sstevel@tonic-gate #include <sys/cmn_err.h> 497c478bd9Sstevel@tonic-gate #include <sys/utsname.h> 507c478bd9Sstevel@tonic-gate #include <sys/bootconf.h> 517c478bd9Sstevel@tonic-gate #include <sys/modctl.h> 527c478bd9Sstevel@tonic-gate #include <sys/acl.h> 537c478bd9Sstevel@tonic-gate #include <sys/flock.h> 547c478bd9Sstevel@tonic-gate #include <sys/time.h> 557c478bd9Sstevel@tonic-gate #include <sys/disp.h> 567c478bd9Sstevel@tonic-gate #include <sys/policy.h> 577c478bd9Sstevel@tonic-gate #include <sys/socket.h> 587c478bd9Sstevel@tonic-gate #include <sys/netconfig.h> 597c478bd9Sstevel@tonic-gate #include <sys/dnlc.h> 607c478bd9Sstevel@tonic-gate #include <sys/list.h> 617c478bd9Sstevel@tonic-gate 627c478bd9Sstevel@tonic-gate #include <rpc/types.h> 637c478bd9Sstevel@tonic-gate #include <rpc/auth.h> 647c478bd9Sstevel@tonic-gate #include <rpc/rpcsec_gss.h> 657c478bd9Sstevel@tonic-gate #include <rpc/clnt.h> 667c478bd9Sstevel@tonic-gate 677c478bd9Sstevel@tonic-gate #include <nfs/nfs.h> 687c478bd9Sstevel@tonic-gate #include <nfs/nfs_clnt.h> 
697c478bd9Sstevel@tonic-gate #include <nfs/mount.h> 707c478bd9Sstevel@tonic-gate #include <nfs/nfs_acl.h> 717c478bd9Sstevel@tonic-gate 727c478bd9Sstevel@tonic-gate #include <fs/fs_subr.h> 737c478bd9Sstevel@tonic-gate 747c478bd9Sstevel@tonic-gate #include <nfs/nfs4.h> 757c478bd9Sstevel@tonic-gate #include <nfs/rnode4.h> 767c478bd9Sstevel@tonic-gate #include <nfs/nfs4_clnt.h> 777c478bd9Sstevel@tonic-gate 787c478bd9Sstevel@tonic-gate /* 797c478bd9Sstevel@tonic-gate * Arguments passed to thread to free data structures from forced unmount. 807c478bd9Sstevel@tonic-gate */ 817c478bd9Sstevel@tonic-gate 827c478bd9Sstevel@tonic-gate typedef struct { 837c478bd9Sstevel@tonic-gate vfs_t *fm_vfsp; 847c478bd9Sstevel@tonic-gate cred_t *fm_cr; 857c478bd9Sstevel@tonic-gate } freemountargs_t; 867c478bd9Sstevel@tonic-gate 877c478bd9Sstevel@tonic-gate static void async_free_mount(vfs_t *, cred_t *); 887c478bd9Sstevel@tonic-gate static void nfs4_free_mount(vfs_t *, cred_t *); 897c478bd9Sstevel@tonic-gate static void nfs4_free_mount_thread(freemountargs_t *); 907c478bd9Sstevel@tonic-gate static int nfs4_chkdup_servinfo4(servinfo4_t *, servinfo4_t *); 917c478bd9Sstevel@tonic-gate 927c478bd9Sstevel@tonic-gate /* 937c478bd9Sstevel@tonic-gate * From rpcsec module (common/rpcsec). 
947c478bd9Sstevel@tonic-gate */ 957c478bd9Sstevel@tonic-gate extern int sec_clnt_loadinfo(struct sec_data *, struct sec_data **, model_t); 967c478bd9Sstevel@tonic-gate extern void sec_clnt_freeinfo(struct sec_data *); 977c478bd9Sstevel@tonic-gate 987c478bd9Sstevel@tonic-gate /* 997c478bd9Sstevel@tonic-gate * The order and contents of this structure must be kept in sync with that of 1007c478bd9Sstevel@tonic-gate * rfsreqcnt_v4_tmpl in nfs_stats.c 1017c478bd9Sstevel@tonic-gate */ 1027c478bd9Sstevel@tonic-gate static char *rfsnames_v4[] = { 1037c478bd9Sstevel@tonic-gate "null", "compound", "reserved", "access", "close", "commit", "create", 1047c478bd9Sstevel@tonic-gate "delegpurge", "delegreturn", "getattr", "getfh", "link", "lock", 1057c478bd9Sstevel@tonic-gate "lockt", "locku", "lookup", "lookupp", "nverify", "open", "openattr", 1067c478bd9Sstevel@tonic-gate "open_confirm", "open_downgrade", "putfh", "putpubfh", "putrootfh", 1077c478bd9Sstevel@tonic-gate "read", "readdir", "readlink", "remove", "rename", "renew", 1087c478bd9Sstevel@tonic-gate "restorefh", "savefh", "secinfo", "setattr", "setclientid", 1097c478bd9Sstevel@tonic-gate "setclientid_confirm", "verify", "write" 1107c478bd9Sstevel@tonic-gate }; 1117c478bd9Sstevel@tonic-gate 1127c478bd9Sstevel@tonic-gate /* 1137c478bd9Sstevel@tonic-gate * nfs4_max_mount_retry is the number of times the client will redrive 1147c478bd9Sstevel@tonic-gate * a mount compound before giving up and returning failure. The intent 1157c478bd9Sstevel@tonic-gate * is to redrive mount compounds which fail NFS4ERR_STALE so that 1167c478bd9Sstevel@tonic-gate * if a component of the server path being mounted goes stale, it can 1177c478bd9Sstevel@tonic-gate * "recover" by redriving the mount compound (LOOKUP ops). This recovery 1187c478bd9Sstevel@tonic-gate * code is needed outside of the recovery framework because mount is a 1197c478bd9Sstevel@tonic-gate * special case. 
The client doesn't create vnodes/rnodes for components 1207c478bd9Sstevel@tonic-gate * of the server path being mounted. The recovery code recovers real 1217c478bd9Sstevel@tonic-gate * client objects, not STALE FHs which map to components of the server 1227c478bd9Sstevel@tonic-gate * path being mounted. 1237c478bd9Sstevel@tonic-gate * 1247c478bd9Sstevel@tonic-gate * We could just fail the mount on the first time, but that would 1257c478bd9Sstevel@tonic-gate * instantly trigger failover (from nfs4_mount), and the client should 1267c478bd9Sstevel@tonic-gate * try to re-lookup the STALE FH before doing failover. The easiest 1277c478bd9Sstevel@tonic-gate * way to "re-lookup" is to simply redrive the mount compound. 1287c478bd9Sstevel@tonic-gate */ 1297c478bd9Sstevel@tonic-gate static int nfs4_max_mount_retry = 2; 1307c478bd9Sstevel@tonic-gate 1317c478bd9Sstevel@tonic-gate /* 1327c478bd9Sstevel@tonic-gate * nfs4 vfs operations. 1337c478bd9Sstevel@tonic-gate */ 1347c478bd9Sstevel@tonic-gate static int nfs4_mount(vfs_t *, vnode_t *, struct mounta *, cred_t *); 1357c478bd9Sstevel@tonic-gate static int nfs4_unmount(vfs_t *, int, cred_t *); 1367c478bd9Sstevel@tonic-gate static int nfs4_root(vfs_t *, vnode_t **); 1377c478bd9Sstevel@tonic-gate static int nfs4_statvfs(vfs_t *, struct statvfs64 *); 1387c478bd9Sstevel@tonic-gate static int nfs4_sync(vfs_t *, short, cred_t *); 1397c478bd9Sstevel@tonic-gate static int nfs4_vget(vfs_t *, vnode_t **, fid_t *); 1407c478bd9Sstevel@tonic-gate static int nfs4_mountroot(vfs_t *, whymountroot_t); 1417c478bd9Sstevel@tonic-gate static void nfs4_freevfs(vfs_t *); 1427c478bd9Sstevel@tonic-gate 1437c478bd9Sstevel@tonic-gate static int nfs4rootvp(vnode_t **, vfs_t *, struct servinfo4 *, 1447c478bd9Sstevel@tonic-gate int, cred_t *, zone_t *); 1457c478bd9Sstevel@tonic-gate 1467c478bd9Sstevel@tonic-gate vfsops_t *nfs4_vfsops; 1477c478bd9Sstevel@tonic-gate 1487c478bd9Sstevel@tonic-gate int nfs4_vfsinit(void); 1497c478bd9Sstevel@tonic-gate void 
nfs4_vfsfini(void); 1507c478bd9Sstevel@tonic-gate static void nfs4setclientid_init(void); 1517c478bd9Sstevel@tonic-gate static void nfs4setclientid_fini(void); 1527c478bd9Sstevel@tonic-gate static void nfs4setclientid_otw(mntinfo4_t *, servinfo4_t *, cred_t *, 1537c478bd9Sstevel@tonic-gate struct nfs4_server *, nfs4_error_t *, int *); 1547c478bd9Sstevel@tonic-gate static void destroy_nfs4_server(nfs4_server_t *); 1557c478bd9Sstevel@tonic-gate static void remove_mi(nfs4_server_t *, mntinfo4_t *); 1567c478bd9Sstevel@tonic-gate 1577c478bd9Sstevel@tonic-gate /* 1587c478bd9Sstevel@tonic-gate * Initialize the vfs structure 1597c478bd9Sstevel@tonic-gate */ 1607c478bd9Sstevel@tonic-gate 1617c478bd9Sstevel@tonic-gate static int nfs4fstyp; 1627c478bd9Sstevel@tonic-gate 1637c478bd9Sstevel@tonic-gate 1647c478bd9Sstevel@tonic-gate /* 1657c478bd9Sstevel@tonic-gate * Debug variable to check for rdma based 1667c478bd9Sstevel@tonic-gate * transport startup and cleanup. Controlled 1677c478bd9Sstevel@tonic-gate * through /etc/system. Off by default. 
1687c478bd9Sstevel@tonic-gate */ 1697c478bd9Sstevel@tonic-gate extern int rdma_debug; 1707c478bd9Sstevel@tonic-gate 1717c478bd9Sstevel@tonic-gate int 1727c478bd9Sstevel@tonic-gate nfs4init(int fstyp, char *name) 1737c478bd9Sstevel@tonic-gate { 1747c478bd9Sstevel@tonic-gate static const fs_operation_def_t nfs4_vfsops_template[] = { 1757c478bd9Sstevel@tonic-gate VFSNAME_MOUNT, nfs4_mount, 1767c478bd9Sstevel@tonic-gate VFSNAME_UNMOUNT, nfs4_unmount, 1777c478bd9Sstevel@tonic-gate VFSNAME_ROOT, nfs4_root, 1787c478bd9Sstevel@tonic-gate VFSNAME_STATVFS, nfs4_statvfs, 1797c478bd9Sstevel@tonic-gate VFSNAME_SYNC, (fs_generic_func_p) nfs4_sync, 1807c478bd9Sstevel@tonic-gate VFSNAME_VGET, nfs4_vget, 1817c478bd9Sstevel@tonic-gate VFSNAME_MOUNTROOT, nfs4_mountroot, 1827c478bd9Sstevel@tonic-gate VFSNAME_FREEVFS, (fs_generic_func_p)nfs4_freevfs, 1837c478bd9Sstevel@tonic-gate NULL, NULL 1847c478bd9Sstevel@tonic-gate }; 1857c478bd9Sstevel@tonic-gate int error; 1867c478bd9Sstevel@tonic-gate 1877c478bd9Sstevel@tonic-gate error = vfs_setfsops(fstyp, nfs4_vfsops_template, &nfs4_vfsops); 1887c478bd9Sstevel@tonic-gate if (error != 0) { 1897c478bd9Sstevel@tonic-gate zcmn_err(GLOBAL_ZONEID, CE_WARN, 1907c478bd9Sstevel@tonic-gate "nfs4init: bad vfs ops template"); 1917c478bd9Sstevel@tonic-gate return (error); 1927c478bd9Sstevel@tonic-gate } 1937c478bd9Sstevel@tonic-gate 1947c478bd9Sstevel@tonic-gate error = vn_make_ops(name, nfs4_vnodeops_template, &nfs4_vnodeops); 1957c478bd9Sstevel@tonic-gate if (error != 0) { 1967c478bd9Sstevel@tonic-gate (void) vfs_freevfsops_by_type(fstyp); 1977c478bd9Sstevel@tonic-gate zcmn_err(GLOBAL_ZONEID, CE_WARN, 1987c478bd9Sstevel@tonic-gate "nfs4init: bad vnode ops template"); 1997c478bd9Sstevel@tonic-gate return (error); 2007c478bd9Sstevel@tonic-gate } 2017c478bd9Sstevel@tonic-gate 2027c478bd9Sstevel@tonic-gate nfs4fstyp = fstyp; 2037c478bd9Sstevel@tonic-gate 2047c478bd9Sstevel@tonic-gate (void) nfs4_vfsinit(); 2057c478bd9Sstevel@tonic-gate 
2067c478bd9Sstevel@tonic-gate (void) nfs4_init_dot_entries(); 2077c478bd9Sstevel@tonic-gate 2087c478bd9Sstevel@tonic-gate return (0); 2097c478bd9Sstevel@tonic-gate } 2107c478bd9Sstevel@tonic-gate 2117c478bd9Sstevel@tonic-gate void 2127c478bd9Sstevel@tonic-gate nfs4fini(void) 2137c478bd9Sstevel@tonic-gate { 2147c478bd9Sstevel@tonic-gate (void) nfs4_destroy_dot_entries(); 2157c478bd9Sstevel@tonic-gate nfs4_vfsfini(); 2167c478bd9Sstevel@tonic-gate } 2177c478bd9Sstevel@tonic-gate 2187c478bd9Sstevel@tonic-gate /* 2197c478bd9Sstevel@tonic-gate * Create a new sec_data structure to store AUTH_DH related data: 2207c478bd9Sstevel@tonic-gate * netname, syncaddr, knetconfig. There is no AUTH_F_RPCTIMESYNC 2217c478bd9Sstevel@tonic-gate * flag set for NFS V4 since we are avoiding to contact the rpcbind 2227c478bd9Sstevel@tonic-gate * daemon and is using the IP time service (IPPORT_TIMESERVER). 2237c478bd9Sstevel@tonic-gate * 2247c478bd9Sstevel@tonic-gate * sec_data can be freed by sec_clnt_freeinfo(). 
2257c478bd9Sstevel@tonic-gate */ 2267c478bd9Sstevel@tonic-gate struct sec_data * 2277c478bd9Sstevel@tonic-gate create_authdh_data(char *netname, int nlen, struct netbuf *syncaddr, 2287c478bd9Sstevel@tonic-gate struct knetconfig *knconf) { 2297c478bd9Sstevel@tonic-gate struct sec_data *secdata; 2307c478bd9Sstevel@tonic-gate dh_k4_clntdata_t *data; 2317c478bd9Sstevel@tonic-gate char *pf, *p; 2327c478bd9Sstevel@tonic-gate 2337c478bd9Sstevel@tonic-gate if (syncaddr == NULL || syncaddr->buf == NULL || nlen == 0) 2347c478bd9Sstevel@tonic-gate return (NULL); 2357c478bd9Sstevel@tonic-gate 2367c478bd9Sstevel@tonic-gate secdata = kmem_alloc(sizeof (*secdata), KM_SLEEP); 2377c478bd9Sstevel@tonic-gate secdata->flags = 0; 2387c478bd9Sstevel@tonic-gate 2397c478bd9Sstevel@tonic-gate data = kmem_alloc(sizeof (*data), KM_SLEEP); 2407c478bd9Sstevel@tonic-gate 2417c478bd9Sstevel@tonic-gate data->syncaddr.maxlen = syncaddr->maxlen; 2427c478bd9Sstevel@tonic-gate data->syncaddr.len = syncaddr->len; 2437c478bd9Sstevel@tonic-gate data->syncaddr.buf = (char *)kmem_alloc(syncaddr->len, KM_SLEEP); 2447c478bd9Sstevel@tonic-gate bcopy(syncaddr->buf, data->syncaddr.buf, syncaddr->len); 2457c478bd9Sstevel@tonic-gate 2467c478bd9Sstevel@tonic-gate /* 2477c478bd9Sstevel@tonic-gate * duplicate the knconf information for the 2487c478bd9Sstevel@tonic-gate * new opaque data. 
2497c478bd9Sstevel@tonic-gate */ 2507c478bd9Sstevel@tonic-gate data->knconf = kmem_alloc(sizeof (*knconf), KM_SLEEP); 2517c478bd9Sstevel@tonic-gate *data->knconf = *knconf; 2527c478bd9Sstevel@tonic-gate pf = kmem_alloc(KNC_STRSIZE, KM_SLEEP); 2537c478bd9Sstevel@tonic-gate p = kmem_alloc(KNC_STRSIZE, KM_SLEEP); 2547c478bd9Sstevel@tonic-gate bcopy(knconf->knc_protofmly, pf, KNC_STRSIZE); 2557c478bd9Sstevel@tonic-gate bcopy(knconf->knc_proto, p, KNC_STRSIZE); 2567c478bd9Sstevel@tonic-gate data->knconf->knc_protofmly = pf; 2577c478bd9Sstevel@tonic-gate data->knconf->knc_proto = p; 2587c478bd9Sstevel@tonic-gate 2597c478bd9Sstevel@tonic-gate /* move server netname to the sec_data structure */ 2607c478bd9Sstevel@tonic-gate data->netname = kmem_alloc(nlen, KM_SLEEP); 2617c478bd9Sstevel@tonic-gate bcopy(netname, data->netname, nlen); 2627c478bd9Sstevel@tonic-gate data->netnamelen = (int)nlen; 2637c478bd9Sstevel@tonic-gate 2647c478bd9Sstevel@tonic-gate secdata->secmod = AUTH_DH; 2657c478bd9Sstevel@tonic-gate secdata->rpcflavor = AUTH_DH; 2667c478bd9Sstevel@tonic-gate secdata->data = (caddr_t)data; 2677c478bd9Sstevel@tonic-gate 2687c478bd9Sstevel@tonic-gate return (secdata); 2697c478bd9Sstevel@tonic-gate } 2707c478bd9Sstevel@tonic-gate 2717c478bd9Sstevel@tonic-gate static int 2727c478bd9Sstevel@tonic-gate nfs4_chkdup_servinfo4(servinfo4_t *svp_head, servinfo4_t *svp) 2737c478bd9Sstevel@tonic-gate { 2747c478bd9Sstevel@tonic-gate servinfo4_t *si; 2757c478bd9Sstevel@tonic-gate 2767c478bd9Sstevel@tonic-gate /* 2777c478bd9Sstevel@tonic-gate * Iterate over the servinfo4 list to make sure 2787c478bd9Sstevel@tonic-gate * we do not have a duplicate. 
Skip any servinfo4 2797c478bd9Sstevel@tonic-gate * that has been marked "NOT IN USE" 2807c478bd9Sstevel@tonic-gate */ 2817c478bd9Sstevel@tonic-gate for (si = svp_head; si; si = si->sv_next) { 2827c478bd9Sstevel@tonic-gate (void) nfs_rw_enter_sig(&si->sv_lock, RW_READER, 0); 2837c478bd9Sstevel@tonic-gate if (si->sv_flags & SV4_NOTINUSE) { 2847c478bd9Sstevel@tonic-gate nfs_rw_exit(&si->sv_lock); 2857c478bd9Sstevel@tonic-gate continue; 2867c478bd9Sstevel@tonic-gate } 2877c478bd9Sstevel@tonic-gate nfs_rw_exit(&si->sv_lock); 2887c478bd9Sstevel@tonic-gate if (si == svp) 2897c478bd9Sstevel@tonic-gate continue; 2907c478bd9Sstevel@tonic-gate if (si->sv_addr.len == svp->sv_addr.len && 2917c478bd9Sstevel@tonic-gate strcmp(si->sv_knconf->knc_protofmly, 2927c478bd9Sstevel@tonic-gate svp->sv_knconf->knc_protofmly) == 0 && 2937c478bd9Sstevel@tonic-gate bcmp(si->sv_addr.buf, svp->sv_addr.buf, 2947c478bd9Sstevel@tonic-gate si->sv_addr.len) == 0) { 2957c478bd9Sstevel@tonic-gate /* it's a duplicate */ 2967c478bd9Sstevel@tonic-gate return (1); 2977c478bd9Sstevel@tonic-gate } 2987c478bd9Sstevel@tonic-gate } 2997c478bd9Sstevel@tonic-gate /* it's not a duplicate */ 3007c478bd9Sstevel@tonic-gate return (0); 3017c478bd9Sstevel@tonic-gate } 3027c478bd9Sstevel@tonic-gate 3037c478bd9Sstevel@tonic-gate /* 3047c478bd9Sstevel@tonic-gate * nfs mount vfsop 3057c478bd9Sstevel@tonic-gate * Set up mount info record and attach it to vfs struct. 
3067c478bd9Sstevel@tonic-gate */ 3077c478bd9Sstevel@tonic-gate static int 3087c478bd9Sstevel@tonic-gate nfs4_mount(vfs_t *vfsp, vnode_t *mvp, struct mounta *uap, cred_t *cr) 3097c478bd9Sstevel@tonic-gate { 3107c478bd9Sstevel@tonic-gate char *data = uap->dataptr; 3117c478bd9Sstevel@tonic-gate int error; 3127c478bd9Sstevel@tonic-gate vnode_t *rtvp; /* the server's root */ 3137c478bd9Sstevel@tonic-gate mntinfo4_t *mi; /* mount info, pointed at by vfs */ 3147c478bd9Sstevel@tonic-gate size_t hlen; /* length of hostname */ 3157c478bd9Sstevel@tonic-gate size_t nlen; /* length of netname */ 3167c478bd9Sstevel@tonic-gate char netname[MAXNETNAMELEN+1]; /* server's netname */ 3177c478bd9Sstevel@tonic-gate struct netbuf addr; /* server's address */ 3187c478bd9Sstevel@tonic-gate struct netbuf syncaddr; /* AUTH_DES time sync addr */ 3197c478bd9Sstevel@tonic-gate struct knetconfig *knconf; /* transport knetconfig structure */ 3207c478bd9Sstevel@tonic-gate struct knetconfig *rdma_knconf; /* rdma transport structure */ 3217c478bd9Sstevel@tonic-gate rnode4_t *rp; 3227c478bd9Sstevel@tonic-gate struct servinfo4 *svp; /* nfs server info */ 3237c478bd9Sstevel@tonic-gate struct servinfo4 *svp_tail = NULL; /* previous nfs server info */ 3247c478bd9Sstevel@tonic-gate struct servinfo4 *svp_head; /* first nfs server info */ 3257c478bd9Sstevel@tonic-gate struct servinfo4 *svp_2ndlast; /* 2nd last in server info list */ 3267c478bd9Sstevel@tonic-gate struct sec_data *secdata; /* security data */ 3277c478bd9Sstevel@tonic-gate STRUCT_DECL(nfs_args, args); /* nfs mount arguments */ 3287c478bd9Sstevel@tonic-gate STRUCT_DECL(knetconfig, knconf_tmp); 3297c478bd9Sstevel@tonic-gate STRUCT_DECL(netbuf, addr_tmp); 3307c478bd9Sstevel@tonic-gate int flags, addr_type; 3317c478bd9Sstevel@tonic-gate char *p, *pf; 3327c478bd9Sstevel@tonic-gate struct pathname pn; 3337c478bd9Sstevel@tonic-gate char *userbufptr; 334*108322fbScarlsonj zone_t *zone = nfs_zone(); 3357c478bd9Sstevel@tonic-gate nfs4_error_t n4e; 
3367c478bd9Sstevel@tonic-gate 3377c478bd9Sstevel@tonic-gate if (secpolicy_fs_mount(cr, mvp, vfsp) != 0) 3387c478bd9Sstevel@tonic-gate return (EPERM); 3397c478bd9Sstevel@tonic-gate if (mvp->v_type != VDIR) 3407c478bd9Sstevel@tonic-gate return (ENOTDIR); 3417c478bd9Sstevel@tonic-gate /* 3427c478bd9Sstevel@tonic-gate * get arguments 3437c478bd9Sstevel@tonic-gate * 3447c478bd9Sstevel@tonic-gate * nfs_args is now versioned and is extensible, so 3457c478bd9Sstevel@tonic-gate * uap->datalen might be different from sizeof (args) 3467c478bd9Sstevel@tonic-gate * in a compatible situation. 3477c478bd9Sstevel@tonic-gate */ 3487c478bd9Sstevel@tonic-gate more: 3497c478bd9Sstevel@tonic-gate STRUCT_INIT(args, get_udatamodel()); 3507c478bd9Sstevel@tonic-gate bzero(STRUCT_BUF(args), SIZEOF_STRUCT(nfs_args, DATAMODEL_NATIVE)); 3517c478bd9Sstevel@tonic-gate if (copyin(data, STRUCT_BUF(args), MIN(uap->datalen, 3527c478bd9Sstevel@tonic-gate STRUCT_SIZE(args)))) 3537c478bd9Sstevel@tonic-gate return (EFAULT); 3547c478bd9Sstevel@tonic-gate 3557c478bd9Sstevel@tonic-gate flags = STRUCT_FGET(args, flags); 3567c478bd9Sstevel@tonic-gate 3577c478bd9Sstevel@tonic-gate /* 3587c478bd9Sstevel@tonic-gate * If the request changes the locking type, disallow the remount, 3597c478bd9Sstevel@tonic-gate * because it's questionable whether we can transfer the 3607c478bd9Sstevel@tonic-gate * locking state correctly. 3617c478bd9Sstevel@tonic-gate */ 3627c478bd9Sstevel@tonic-gate if (uap->flags & MS_REMOUNT) { 3637c478bd9Sstevel@tonic-gate if ((mi = VFTOMI4(vfsp)) != NULL) { 3647c478bd9Sstevel@tonic-gate uint_t new_mi_llock; 3657c478bd9Sstevel@tonic-gate uint_t old_mi_llock; 3667c478bd9Sstevel@tonic-gate 3677c478bd9Sstevel@tonic-gate new_mi_llock = (flags & NFSMNT_LLOCK) ? 1 : 0; 3687c478bd9Sstevel@tonic-gate old_mi_llock = (mi->mi_flags & MI4_LLOCK) ? 
1 : 0; 3697c478bd9Sstevel@tonic-gate if (old_mi_llock != new_mi_llock) 3707c478bd9Sstevel@tonic-gate return (EBUSY); 3717c478bd9Sstevel@tonic-gate } 3727c478bd9Sstevel@tonic-gate return (0); 3737c478bd9Sstevel@tonic-gate } 3747c478bd9Sstevel@tonic-gate 3757c478bd9Sstevel@tonic-gate mutex_enter(&mvp->v_lock); 3767c478bd9Sstevel@tonic-gate if (!(uap->flags & MS_OVERLAY) && 3777c478bd9Sstevel@tonic-gate (mvp->v_count != 1 || (mvp->v_flag & VROOT))) { 3787c478bd9Sstevel@tonic-gate mutex_exit(&mvp->v_lock); 3797c478bd9Sstevel@tonic-gate return (EBUSY); 3807c478bd9Sstevel@tonic-gate } 3817c478bd9Sstevel@tonic-gate mutex_exit(&mvp->v_lock); 3827c478bd9Sstevel@tonic-gate 3837c478bd9Sstevel@tonic-gate /* make sure things are zeroed for errout: */ 3847c478bd9Sstevel@tonic-gate rtvp = NULL; 3857c478bd9Sstevel@tonic-gate mi = NULL; 3867c478bd9Sstevel@tonic-gate addr.buf = NULL; 3877c478bd9Sstevel@tonic-gate syncaddr.buf = NULL; 3887c478bd9Sstevel@tonic-gate secdata = NULL; 3897c478bd9Sstevel@tonic-gate 3907c478bd9Sstevel@tonic-gate /* 3917c478bd9Sstevel@tonic-gate * A valid knetconfig structure is required. 3927c478bd9Sstevel@tonic-gate */ 3937c478bd9Sstevel@tonic-gate if (!(flags & NFSMNT_KNCONF)) 3947c478bd9Sstevel@tonic-gate return (EINVAL); 3957c478bd9Sstevel@tonic-gate 3967c478bd9Sstevel@tonic-gate /* 3977c478bd9Sstevel@tonic-gate * Allocate a servinfo4 struct. 
3987c478bd9Sstevel@tonic-gate */ 3997c478bd9Sstevel@tonic-gate svp = kmem_zalloc(sizeof (*svp), KM_SLEEP); 4007c478bd9Sstevel@tonic-gate nfs_rw_init(&svp->sv_lock, NULL, RW_DEFAULT, NULL); 4017c478bd9Sstevel@tonic-gate if (svp_tail) { 4027c478bd9Sstevel@tonic-gate svp_2ndlast = svp_tail; 4037c478bd9Sstevel@tonic-gate svp_tail->sv_next = svp; 4047c478bd9Sstevel@tonic-gate } else { 4057c478bd9Sstevel@tonic-gate svp_head = svp; 4067c478bd9Sstevel@tonic-gate svp_2ndlast = svp; 4077c478bd9Sstevel@tonic-gate } 4087c478bd9Sstevel@tonic-gate 4097c478bd9Sstevel@tonic-gate svp_tail = svp; 4107c478bd9Sstevel@tonic-gate 4117c478bd9Sstevel@tonic-gate /* 4127c478bd9Sstevel@tonic-gate * Allocate space for a knetconfig structure and 4137c478bd9Sstevel@tonic-gate * its strings and copy in from user-land. 4147c478bd9Sstevel@tonic-gate */ 4157c478bd9Sstevel@tonic-gate knconf = kmem_zalloc(sizeof (*knconf), KM_SLEEP); 4167c478bd9Sstevel@tonic-gate svp->sv_knconf = knconf; 4177c478bd9Sstevel@tonic-gate STRUCT_INIT(knconf_tmp, get_udatamodel()); 4187c478bd9Sstevel@tonic-gate if (copyin(STRUCT_FGETP(args, knconf), STRUCT_BUF(knconf_tmp), 4197c478bd9Sstevel@tonic-gate STRUCT_SIZE(knconf_tmp))) { 4207c478bd9Sstevel@tonic-gate sv4_free(svp_head); 4217c478bd9Sstevel@tonic-gate return (EFAULT); 4227c478bd9Sstevel@tonic-gate } 4237c478bd9Sstevel@tonic-gate 4247c478bd9Sstevel@tonic-gate knconf->knc_semantics = STRUCT_FGET(knconf_tmp, knc_semantics); 4257c478bd9Sstevel@tonic-gate knconf->knc_protofmly = STRUCT_FGETP(knconf_tmp, knc_protofmly); 4267c478bd9Sstevel@tonic-gate knconf->knc_proto = STRUCT_FGETP(knconf_tmp, knc_proto); 4277c478bd9Sstevel@tonic-gate if (get_udatamodel() != DATAMODEL_LP64) { 4287c478bd9Sstevel@tonic-gate knconf->knc_rdev = expldev(STRUCT_FGET(knconf_tmp, knc_rdev)); 4297c478bd9Sstevel@tonic-gate } else { 4307c478bd9Sstevel@tonic-gate knconf->knc_rdev = STRUCT_FGET(knconf_tmp, knc_rdev); 4317c478bd9Sstevel@tonic-gate } 4327c478bd9Sstevel@tonic-gate 
4337c478bd9Sstevel@tonic-gate pf = kmem_alloc(KNC_STRSIZE, KM_SLEEP); 4347c478bd9Sstevel@tonic-gate p = kmem_alloc(KNC_STRSIZE, KM_SLEEP); 4357c478bd9Sstevel@tonic-gate error = copyinstr(knconf->knc_protofmly, pf, KNC_STRSIZE, NULL); 4367c478bd9Sstevel@tonic-gate if (error) { 4377c478bd9Sstevel@tonic-gate kmem_free(pf, KNC_STRSIZE); 4387c478bd9Sstevel@tonic-gate kmem_free(p, KNC_STRSIZE); 4397c478bd9Sstevel@tonic-gate sv4_free(svp_head); 4407c478bd9Sstevel@tonic-gate return (error); 4417c478bd9Sstevel@tonic-gate } 4427c478bd9Sstevel@tonic-gate error = copyinstr(knconf->knc_proto, p, KNC_STRSIZE, NULL); 4437c478bd9Sstevel@tonic-gate if (error) { 4447c478bd9Sstevel@tonic-gate kmem_free(pf, KNC_STRSIZE); 4457c478bd9Sstevel@tonic-gate kmem_free(p, KNC_STRSIZE); 4467c478bd9Sstevel@tonic-gate sv4_free(svp_head); 4477c478bd9Sstevel@tonic-gate return (error); 4487c478bd9Sstevel@tonic-gate } 4497c478bd9Sstevel@tonic-gate if (strcmp(p, NC_UDP) == 0) { 4507c478bd9Sstevel@tonic-gate kmem_free(pf, KNC_STRSIZE); 4517c478bd9Sstevel@tonic-gate kmem_free(p, KNC_STRSIZE); 4527c478bd9Sstevel@tonic-gate sv4_free(svp_head); 4537c478bd9Sstevel@tonic-gate return (ENOTSUP); 4547c478bd9Sstevel@tonic-gate } 4557c478bd9Sstevel@tonic-gate knconf->knc_protofmly = pf; 4567c478bd9Sstevel@tonic-gate knconf->knc_proto = p; 4577c478bd9Sstevel@tonic-gate 4587c478bd9Sstevel@tonic-gate /* 4597c478bd9Sstevel@tonic-gate * Get server address 4607c478bd9Sstevel@tonic-gate */ 4617c478bd9Sstevel@tonic-gate STRUCT_INIT(addr_tmp, get_udatamodel()); 4627c478bd9Sstevel@tonic-gate if (copyin(STRUCT_FGETP(args, addr), STRUCT_BUF(addr_tmp), 4637c478bd9Sstevel@tonic-gate STRUCT_SIZE(addr_tmp))) { 4647c478bd9Sstevel@tonic-gate error = EFAULT; 4657c478bd9Sstevel@tonic-gate goto errout; 4667c478bd9Sstevel@tonic-gate } 4677c478bd9Sstevel@tonic-gate 4687c478bd9Sstevel@tonic-gate userbufptr = addr.buf = STRUCT_FGETP(addr_tmp, buf); 4697c478bd9Sstevel@tonic-gate addr.len = STRUCT_FGET(addr_tmp, len); 
4707c478bd9Sstevel@tonic-gate addr.buf = kmem_alloc(addr.len, KM_SLEEP); 4717c478bd9Sstevel@tonic-gate addr.maxlen = addr.len; 4727c478bd9Sstevel@tonic-gate if (copyin(userbufptr, addr.buf, addr.len)) { 4737c478bd9Sstevel@tonic-gate kmem_free(addr.buf, addr.len); 4747c478bd9Sstevel@tonic-gate error = EFAULT; 4757c478bd9Sstevel@tonic-gate goto errout; 4767c478bd9Sstevel@tonic-gate } 4777c478bd9Sstevel@tonic-gate 4787c478bd9Sstevel@tonic-gate svp->sv_addr = addr; 4797c478bd9Sstevel@tonic-gate 4807c478bd9Sstevel@tonic-gate /* 4817c478bd9Sstevel@tonic-gate * Get the root fhandle 4827c478bd9Sstevel@tonic-gate */ 4837c478bd9Sstevel@tonic-gate error = pn_get(STRUCT_FGETP(args, fh), UIO_USERSPACE, &pn); 4847c478bd9Sstevel@tonic-gate 4857c478bd9Sstevel@tonic-gate if (error) 4867c478bd9Sstevel@tonic-gate goto errout; 4877c478bd9Sstevel@tonic-gate 4887c478bd9Sstevel@tonic-gate /* Volatile fh: keep server paths, so use actual-size strings */ 4897c478bd9Sstevel@tonic-gate svp->sv_path = kmem_alloc(pn.pn_pathlen + 1, KM_SLEEP); 4907c478bd9Sstevel@tonic-gate bcopy(pn.pn_path, svp->sv_path, pn.pn_pathlen); 4917c478bd9Sstevel@tonic-gate svp->sv_path[pn.pn_pathlen] = '\0'; 4927c478bd9Sstevel@tonic-gate svp->sv_pathlen = pn.pn_pathlen + 1; 4937c478bd9Sstevel@tonic-gate pn_free(&pn); 4947c478bd9Sstevel@tonic-gate 4957c478bd9Sstevel@tonic-gate /* 4967c478bd9Sstevel@tonic-gate * Get server's hostname 4977c478bd9Sstevel@tonic-gate */ 4987c478bd9Sstevel@tonic-gate if (flags & NFSMNT_HOSTNAME) { 4997c478bd9Sstevel@tonic-gate error = copyinstr(STRUCT_FGETP(args, hostname), 5007c478bd9Sstevel@tonic-gate netname, sizeof (netname), &hlen); 5017c478bd9Sstevel@tonic-gate if (error) 5027c478bd9Sstevel@tonic-gate goto errout; 5037c478bd9Sstevel@tonic-gate } else { 5047c478bd9Sstevel@tonic-gate char *p = "unknown-host"; 5057c478bd9Sstevel@tonic-gate hlen = strlen(p) + 1; 5067c478bd9Sstevel@tonic-gate (void) strcpy(netname, p); 5077c478bd9Sstevel@tonic-gate } 5087c478bd9Sstevel@tonic-gate 
svp->sv_hostnamelen = hlen; 5097c478bd9Sstevel@tonic-gate svp->sv_hostname = kmem_alloc(svp->sv_hostnamelen, KM_SLEEP); 5107c478bd9Sstevel@tonic-gate (void) strcpy(svp->sv_hostname, netname); 5117c478bd9Sstevel@tonic-gate 5127c478bd9Sstevel@tonic-gate /* 5137c478bd9Sstevel@tonic-gate * RDMA MOUNT SUPPORT FOR NFS v4. 5147c478bd9Sstevel@tonic-gate * Establish, is it possible to use RDMA, if so overload the 5157c478bd9Sstevel@tonic-gate * knconf with rdma specific knconf and free the orignal knconf. 5167c478bd9Sstevel@tonic-gate */ 5177c478bd9Sstevel@tonic-gate if ((flags & NFSMNT_TRYRDMA) || (flags & NFSMNT_DORDMA)) { 5187c478bd9Sstevel@tonic-gate /* 5197c478bd9Sstevel@tonic-gate * Determine the addr type for RDMA, IPv4 or v6. 5207c478bd9Sstevel@tonic-gate */ 5217c478bd9Sstevel@tonic-gate if (strcmp(svp->sv_knconf->knc_protofmly, NC_INET) == 0) 5227c478bd9Sstevel@tonic-gate addr_type = AF_INET; 5237c478bd9Sstevel@tonic-gate else if (strcmp(svp->sv_knconf->knc_protofmly, NC_INET6) == 0) 5247c478bd9Sstevel@tonic-gate addr_type = AF_INET6; 5257c478bd9Sstevel@tonic-gate 5267c478bd9Sstevel@tonic-gate if (rdma_reachable(addr_type, &svp->sv_addr, 5277c478bd9Sstevel@tonic-gate &rdma_knconf) == 0) { 5287c478bd9Sstevel@tonic-gate /* 5297c478bd9Sstevel@tonic-gate * If successful, hijack the orignal knconf and 5307c478bd9Sstevel@tonic-gate * replace with the new one, depending on the flags. 
5317c478bd9Sstevel@tonic-gate */ 5327c478bd9Sstevel@tonic-gate svp->sv_origknconf = svp->sv_knconf; 5337c478bd9Sstevel@tonic-gate svp->sv_knconf = rdma_knconf; 5347c478bd9Sstevel@tonic-gate knconf = rdma_knconf; 5357c478bd9Sstevel@tonic-gate } else { 5367c478bd9Sstevel@tonic-gate if (flags & NFSMNT_TRYRDMA) { 5377c478bd9Sstevel@tonic-gate #ifdef DEBUG 5387c478bd9Sstevel@tonic-gate if (rdma_debug) 5397c478bd9Sstevel@tonic-gate zcmn_err(getzoneid(), CE_WARN, 5407c478bd9Sstevel@tonic-gate "no RDMA onboard, revert\n"); 5417c478bd9Sstevel@tonic-gate #endif 5427c478bd9Sstevel@tonic-gate } 5437c478bd9Sstevel@tonic-gate 5447c478bd9Sstevel@tonic-gate if (flags & NFSMNT_DORDMA) { 5457c478bd9Sstevel@tonic-gate /* 5467c478bd9Sstevel@tonic-gate * If proto=rdma is specified and no RDMA 5477c478bd9Sstevel@tonic-gate * path to this server is avialable then 5487c478bd9Sstevel@tonic-gate * ditch this server. 5497c478bd9Sstevel@tonic-gate * This is not included in the mountable 5507c478bd9Sstevel@tonic-gate * server list or the replica list. 5517c478bd9Sstevel@tonic-gate * Check if more servers are specified; 5527c478bd9Sstevel@tonic-gate * Failover case, otherwise bail out of mount. 
5537c478bd9Sstevel@tonic-gate */ 5547c478bd9Sstevel@tonic-gate if (STRUCT_FGET(args, nfs_args_ext) == 5557c478bd9Sstevel@tonic-gate NFS_ARGS_EXTB && STRUCT_FGETP(args, 5567c478bd9Sstevel@tonic-gate nfs_ext_u.nfs_extB.next) != NULL) { 5577c478bd9Sstevel@tonic-gate if (uap->flags & MS_RDONLY && 5587c478bd9Sstevel@tonic-gate !(flags & NFSMNT_SOFT)) { 5597c478bd9Sstevel@tonic-gate data = (char *) 5607c478bd9Sstevel@tonic-gate STRUCT_FGETP(args, 5617c478bd9Sstevel@tonic-gate nfs_ext_u.nfs_extB.next); 5627c478bd9Sstevel@tonic-gate if (svp_head->sv_next == NULL) { 5637c478bd9Sstevel@tonic-gate svp_tail = NULL; 5647c478bd9Sstevel@tonic-gate svp_2ndlast = NULL; 5657c478bd9Sstevel@tonic-gate sv4_free(svp_head); 5667c478bd9Sstevel@tonic-gate goto more; 5677c478bd9Sstevel@tonic-gate } else { 5687c478bd9Sstevel@tonic-gate svp_tail = svp_2ndlast; 5697c478bd9Sstevel@tonic-gate svp_2ndlast->sv_next = 5707c478bd9Sstevel@tonic-gate NULL; 5717c478bd9Sstevel@tonic-gate sv4_free(svp); 5727c478bd9Sstevel@tonic-gate goto more; 5737c478bd9Sstevel@tonic-gate } 5747c478bd9Sstevel@tonic-gate } 5757c478bd9Sstevel@tonic-gate } else { 5767c478bd9Sstevel@tonic-gate /* 5777c478bd9Sstevel@tonic-gate * This is the last server specified 5787c478bd9Sstevel@tonic-gate * in the nfs_args list passed down 5797c478bd9Sstevel@tonic-gate * and its not rdma capable. 
5807c478bd9Sstevel@tonic-gate */ 5817c478bd9Sstevel@tonic-gate if (svp_head->sv_next == NULL) { 5827c478bd9Sstevel@tonic-gate /* 5837c478bd9Sstevel@tonic-gate * Is this the only one 5847c478bd9Sstevel@tonic-gate */ 5857c478bd9Sstevel@tonic-gate error = EINVAL; 5867c478bd9Sstevel@tonic-gate #ifdef DEBUG 5877c478bd9Sstevel@tonic-gate if (rdma_debug) 5887c478bd9Sstevel@tonic-gate zcmn_err(getzoneid(), 5897c478bd9Sstevel@tonic-gate CE_WARN, 5907c478bd9Sstevel@tonic-gate "No RDMA srv"); 5917c478bd9Sstevel@tonic-gate #endif 5927c478bd9Sstevel@tonic-gate goto errout; 5937c478bd9Sstevel@tonic-gate } else { 5947c478bd9Sstevel@tonic-gate /* 5957c478bd9Sstevel@tonic-gate * There is list, since some 5967c478bd9Sstevel@tonic-gate * servers specified before 5977c478bd9Sstevel@tonic-gate * this passed all requirements 5987c478bd9Sstevel@tonic-gate */ 5997c478bd9Sstevel@tonic-gate svp_tail = svp_2ndlast; 6007c478bd9Sstevel@tonic-gate svp_2ndlast->sv_next = NULL; 6017c478bd9Sstevel@tonic-gate sv4_free(svp); 6027c478bd9Sstevel@tonic-gate goto proceed; 6037c478bd9Sstevel@tonic-gate } 6047c478bd9Sstevel@tonic-gate } 6057c478bd9Sstevel@tonic-gate } 6067c478bd9Sstevel@tonic-gate } 6077c478bd9Sstevel@tonic-gate } 6087c478bd9Sstevel@tonic-gate 6097c478bd9Sstevel@tonic-gate /* 6107c478bd9Sstevel@tonic-gate * If there are syncaddr and netname data, load them in. This is 6117c478bd9Sstevel@tonic-gate * to support data needed for NFSV4 when AUTH_DH is the negotiated 6127c478bd9Sstevel@tonic-gate * flavor via SECINFO. (instead of using MOUNT protocol in V3). 
6137c478bd9Sstevel@tonic-gate */ 6147c478bd9Sstevel@tonic-gate netname[0] = '\0'; 6157c478bd9Sstevel@tonic-gate if (flags & NFSMNT_SECURE) { 6167c478bd9Sstevel@tonic-gate 6177c478bd9Sstevel@tonic-gate /* get syncaddr */ 6187c478bd9Sstevel@tonic-gate STRUCT_INIT(addr_tmp, get_udatamodel()); 6197c478bd9Sstevel@tonic-gate if (copyin(STRUCT_FGETP(args, syncaddr), STRUCT_BUF(addr_tmp), 6207c478bd9Sstevel@tonic-gate STRUCT_SIZE(addr_tmp))) { 6217c478bd9Sstevel@tonic-gate error = EINVAL; 6227c478bd9Sstevel@tonic-gate goto errout; 6237c478bd9Sstevel@tonic-gate } 6247c478bd9Sstevel@tonic-gate userbufptr = STRUCT_FGETP(addr_tmp, buf); 6257c478bd9Sstevel@tonic-gate syncaddr.len = STRUCT_FGET(addr_tmp, len); 6267c478bd9Sstevel@tonic-gate syncaddr.buf = kmem_alloc(syncaddr.len, KM_SLEEP); 6277c478bd9Sstevel@tonic-gate syncaddr.maxlen = syncaddr.len; 6287c478bd9Sstevel@tonic-gate if (copyin(userbufptr, syncaddr.buf, syncaddr.len)) { 6297c478bd9Sstevel@tonic-gate kmem_free(syncaddr.buf, syncaddr.len); 6307c478bd9Sstevel@tonic-gate error = EFAULT; 6317c478bd9Sstevel@tonic-gate goto errout; 6327c478bd9Sstevel@tonic-gate } 6337c478bd9Sstevel@tonic-gate 6347c478bd9Sstevel@tonic-gate /* get server's netname */ 6357c478bd9Sstevel@tonic-gate if (copyinstr(STRUCT_FGETP(args, netname), netname, 6367c478bd9Sstevel@tonic-gate sizeof (netname), &nlen)) { 6377c478bd9Sstevel@tonic-gate kmem_free(syncaddr.buf, syncaddr.len); 6387c478bd9Sstevel@tonic-gate error = EFAULT; 6397c478bd9Sstevel@tonic-gate goto errout; 6407c478bd9Sstevel@tonic-gate } 6417c478bd9Sstevel@tonic-gate netname[nlen] = '\0'; 6427c478bd9Sstevel@tonic-gate 6437c478bd9Sstevel@tonic-gate svp->sv_dhsec = create_authdh_data(netname, nlen, &syncaddr, 6447c478bd9Sstevel@tonic-gate knconf); 6457c478bd9Sstevel@tonic-gate } 6467c478bd9Sstevel@tonic-gate 6477c478bd9Sstevel@tonic-gate /* 6487c478bd9Sstevel@tonic-gate * Get the extention data which has the security data structure. 
6497c478bd9Sstevel@tonic-gate * This includes data for AUTH_SYS as well. 6507c478bd9Sstevel@tonic-gate */ 6517c478bd9Sstevel@tonic-gate if (flags & NFSMNT_NEWARGS) { 6527c478bd9Sstevel@tonic-gate switch (STRUCT_FGET(args, nfs_args_ext)) { 6537c478bd9Sstevel@tonic-gate case NFS_ARGS_EXTA: 6547c478bd9Sstevel@tonic-gate case NFS_ARGS_EXTB: 6557c478bd9Sstevel@tonic-gate /* 6567c478bd9Sstevel@tonic-gate * Indicating the application is using the new 6577c478bd9Sstevel@tonic-gate * sec_data structure to pass in the security 6587c478bd9Sstevel@tonic-gate * data. 6597c478bd9Sstevel@tonic-gate */ 6607c478bd9Sstevel@tonic-gate if (STRUCT_FGETP(args, 6617c478bd9Sstevel@tonic-gate nfs_ext_u.nfs_extA.secdata) == NULL) { 6627c478bd9Sstevel@tonic-gate error = EINVAL; 6637c478bd9Sstevel@tonic-gate } else { 6647c478bd9Sstevel@tonic-gate error = sec_clnt_loadinfo( 6657c478bd9Sstevel@tonic-gate (struct sec_data *)STRUCT_FGETP(args, 6667c478bd9Sstevel@tonic-gate nfs_ext_u.nfs_extA.secdata), 6677c478bd9Sstevel@tonic-gate &secdata, get_udatamodel()); 6687c478bd9Sstevel@tonic-gate } 6697c478bd9Sstevel@tonic-gate break; 6707c478bd9Sstevel@tonic-gate 6717c478bd9Sstevel@tonic-gate default: 6727c478bd9Sstevel@tonic-gate error = EINVAL; 6737c478bd9Sstevel@tonic-gate break; 6747c478bd9Sstevel@tonic-gate } 6757c478bd9Sstevel@tonic-gate 6767c478bd9Sstevel@tonic-gate } else if (flags & NFSMNT_SECURE) { 6777c478bd9Sstevel@tonic-gate /* 6787c478bd9Sstevel@tonic-gate * NFSMNT_SECURE is deprecated but we keep it 6797c478bd9Sstevel@tonic-gate * to support the rouge user generated application 6807c478bd9Sstevel@tonic-gate * that may use this undocumented interface to do 6817c478bd9Sstevel@tonic-gate * AUTH_DH security. 
6827c478bd9Sstevel@tonic-gate */ 6837c478bd9Sstevel@tonic-gate secdata = create_authdh_data(netname, nlen, &syncaddr, knconf); 6847c478bd9Sstevel@tonic-gate 6857c478bd9Sstevel@tonic-gate } else { 6867c478bd9Sstevel@tonic-gate secdata = kmem_alloc(sizeof (*secdata), KM_SLEEP); 6877c478bd9Sstevel@tonic-gate secdata->secmod = secdata->rpcflavor = AUTH_SYS; 6887c478bd9Sstevel@tonic-gate secdata->data = NULL; 6897c478bd9Sstevel@tonic-gate } 6907c478bd9Sstevel@tonic-gate 6917c478bd9Sstevel@tonic-gate svp->sv_secdata = secdata; 6927c478bd9Sstevel@tonic-gate 6937c478bd9Sstevel@tonic-gate /* syncaddr is no longer needed. */ 6947c478bd9Sstevel@tonic-gate if (syncaddr.buf != NULL) 6957c478bd9Sstevel@tonic-gate kmem_free(syncaddr.buf, syncaddr.len); 6967c478bd9Sstevel@tonic-gate 6977c478bd9Sstevel@tonic-gate /* 6987c478bd9Sstevel@tonic-gate * User does not explictly specify a flavor, and a user 6997c478bd9Sstevel@tonic-gate * defined default flavor is passed down. 7007c478bd9Sstevel@tonic-gate */ 7017c478bd9Sstevel@tonic-gate if (flags & NFSMNT_SECDEFAULT) { 7027c478bd9Sstevel@tonic-gate (void) nfs_rw_enter_sig(&svp->sv_lock, RW_WRITER, 0); 7037c478bd9Sstevel@tonic-gate svp->sv_flags |= SV4_TRYSECDEFAULT; 7047c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 7057c478bd9Sstevel@tonic-gate } 7067c478bd9Sstevel@tonic-gate 7077c478bd9Sstevel@tonic-gate /* 7087c478bd9Sstevel@tonic-gate * Failover support: 7097c478bd9Sstevel@tonic-gate * 7107c478bd9Sstevel@tonic-gate * We may have a linked list of nfs_args structures, 7117c478bd9Sstevel@tonic-gate * which means the user is looking for failover. If 7127c478bd9Sstevel@tonic-gate * the mount is either not "read-only" or "soft", 7137c478bd9Sstevel@tonic-gate * we want to bail out with EINVAL. 
7147c478bd9Sstevel@tonic-gate */ 7157c478bd9Sstevel@tonic-gate if (STRUCT_FGET(args, nfs_args_ext) == NFS_ARGS_EXTB && 7167c478bd9Sstevel@tonic-gate STRUCT_FGETP(args, nfs_ext_u.nfs_extB.next) != NULL) { 7177c478bd9Sstevel@tonic-gate if (uap->flags & MS_RDONLY && !(flags & NFSMNT_SOFT)) { 7187c478bd9Sstevel@tonic-gate data = (char *)STRUCT_FGETP(args, 7197c478bd9Sstevel@tonic-gate nfs_ext_u.nfs_extB.next); 7207c478bd9Sstevel@tonic-gate goto more; 7217c478bd9Sstevel@tonic-gate } 7227c478bd9Sstevel@tonic-gate error = EINVAL; 7237c478bd9Sstevel@tonic-gate goto errout; 7247c478bd9Sstevel@tonic-gate } 7257c478bd9Sstevel@tonic-gate 7267c478bd9Sstevel@tonic-gate /* 7277c478bd9Sstevel@tonic-gate * Determine the zone we're being mounted into. 7287c478bd9Sstevel@tonic-gate */ 7297c478bd9Sstevel@tonic-gate if (getzoneid() == GLOBAL_ZONEID) { 7307c478bd9Sstevel@tonic-gate zone_t *mntzone; 7317c478bd9Sstevel@tonic-gate 7327c478bd9Sstevel@tonic-gate mntzone = zone_find_by_path(refstr_value(vfsp->vfs_mntpt)); 7337c478bd9Sstevel@tonic-gate ASSERT(mntzone != NULL); 7347c478bd9Sstevel@tonic-gate zone_rele(mntzone); 7357c478bd9Sstevel@tonic-gate if (mntzone != zone) { 7367c478bd9Sstevel@tonic-gate error = EBUSY; 7377c478bd9Sstevel@tonic-gate goto errout; 7387c478bd9Sstevel@tonic-gate } 7397c478bd9Sstevel@tonic-gate } 7407c478bd9Sstevel@tonic-gate 7417c478bd9Sstevel@tonic-gate /* 7427c478bd9Sstevel@tonic-gate * Stop the mount from going any further if the zone is going away. 7437c478bd9Sstevel@tonic-gate */ 744*108322fbScarlsonj if (zone_status_get(curproc->p_zone) >= ZONE_IS_SHUTTING_DOWN) { 7457c478bd9Sstevel@tonic-gate error = EBUSY; 7467c478bd9Sstevel@tonic-gate goto errout; 7477c478bd9Sstevel@tonic-gate } 7487c478bd9Sstevel@tonic-gate 7497c478bd9Sstevel@tonic-gate /* 7507c478bd9Sstevel@tonic-gate * Get root vnode. 
7517c478bd9Sstevel@tonic-gate */ 7527c478bd9Sstevel@tonic-gate proceed: 7537c478bd9Sstevel@tonic-gate error = nfs4rootvp(&rtvp, vfsp, svp_head, flags, cr, zone); 7547c478bd9Sstevel@tonic-gate 7557c478bd9Sstevel@tonic-gate if (error) 7567c478bd9Sstevel@tonic-gate goto errout; 7577c478bd9Sstevel@tonic-gate 7587c478bd9Sstevel@tonic-gate mi = VTOMI4(rtvp); 7597c478bd9Sstevel@tonic-gate 7607c478bd9Sstevel@tonic-gate /* 7617c478bd9Sstevel@tonic-gate * Send client id to the server, if necessary 7627c478bd9Sstevel@tonic-gate */ 7637c478bd9Sstevel@tonic-gate nfs4_error_zinit(&n4e); 7647c478bd9Sstevel@tonic-gate nfs4setclientid(mi, cr, FALSE, &n4e); 7657c478bd9Sstevel@tonic-gate error = n4e.error; 7667c478bd9Sstevel@tonic-gate 7677c478bd9Sstevel@tonic-gate if (error) 7687c478bd9Sstevel@tonic-gate goto errout; 7697c478bd9Sstevel@tonic-gate 7707c478bd9Sstevel@tonic-gate /* 7717c478bd9Sstevel@tonic-gate * Set option fields in the mount info record 7727c478bd9Sstevel@tonic-gate */ 7737c478bd9Sstevel@tonic-gate 7747c478bd9Sstevel@tonic-gate if (svp_head->sv_next) { 7757c478bd9Sstevel@tonic-gate mutex_enter(&mi->mi_lock); 7767c478bd9Sstevel@tonic-gate mi->mi_flags |= MI4_LLOCK; 7777c478bd9Sstevel@tonic-gate mutex_exit(&mi->mi_lock); 7787c478bd9Sstevel@tonic-gate } 7797c478bd9Sstevel@tonic-gate 7807c478bd9Sstevel@tonic-gate error = nfs4_setopts(rtvp, get_udatamodel(), STRUCT_BUF(args)); 7817c478bd9Sstevel@tonic-gate 7827c478bd9Sstevel@tonic-gate errout: 7837c478bd9Sstevel@tonic-gate if (error) { 7847c478bd9Sstevel@tonic-gate if (rtvp != NULL) { 7857c478bd9Sstevel@tonic-gate rp = VTOR4(rtvp); 7867c478bd9Sstevel@tonic-gate if (rp->r_flags & R4HASHED) 7877c478bd9Sstevel@tonic-gate rp4_rmhash(rp); 7887c478bd9Sstevel@tonic-gate } 7897c478bd9Sstevel@tonic-gate if (mi != NULL) { 7907c478bd9Sstevel@tonic-gate nfs4_async_stop(vfsp); 7917c478bd9Sstevel@tonic-gate nfs4_async_manager_stop(vfsp); 7927c478bd9Sstevel@tonic-gate nfs4_remove_mi_from_server(mi, NULL); 7937c478bd9Sstevel@tonic-gate 
/* 7947c478bd9Sstevel@tonic-gate * In this error path we need to sfh4_rele() before 7957c478bd9Sstevel@tonic-gate * we free the mntinfo4_t as sfh4_rele() has a 7967c478bd9Sstevel@tonic-gate * dependancy on mi_fh_lock. 7977c478bd9Sstevel@tonic-gate */ 7987c478bd9Sstevel@tonic-gate if (rtvp != NULL) 7997c478bd9Sstevel@tonic-gate VN_RELE(rtvp); 8007c478bd9Sstevel@tonic-gate if (mi->mi_io_kstats) { 8017c478bd9Sstevel@tonic-gate kstat_delete(mi->mi_io_kstats); 8027c478bd9Sstevel@tonic-gate mi->mi_io_kstats = NULL; 8037c478bd9Sstevel@tonic-gate } 8047c478bd9Sstevel@tonic-gate if (mi->mi_ro_kstats) { 8057c478bd9Sstevel@tonic-gate kstat_delete(mi->mi_ro_kstats); 8067c478bd9Sstevel@tonic-gate mi->mi_ro_kstats = NULL; 8077c478bd9Sstevel@tonic-gate } 8087c478bd9Sstevel@tonic-gate if (mi->mi_recov_ksp) { 8097c478bd9Sstevel@tonic-gate kstat_delete(mi->mi_recov_ksp); 8107c478bd9Sstevel@tonic-gate mi->mi_recov_ksp = NULL; 8117c478bd9Sstevel@tonic-gate } 8127c478bd9Sstevel@tonic-gate nfs_free_mi4(mi); 8137c478bd9Sstevel@tonic-gate return (error); 8147c478bd9Sstevel@tonic-gate } 8157c478bd9Sstevel@tonic-gate sv4_free(svp_head); 8167c478bd9Sstevel@tonic-gate } 8177c478bd9Sstevel@tonic-gate 8187c478bd9Sstevel@tonic-gate if (rtvp != NULL) 8197c478bd9Sstevel@tonic-gate VN_RELE(rtvp); 8207c478bd9Sstevel@tonic-gate 8217c478bd9Sstevel@tonic-gate return (error); 8227c478bd9Sstevel@tonic-gate } 8237c478bd9Sstevel@tonic-gate 8247c478bd9Sstevel@tonic-gate #ifdef DEBUG 8257c478bd9Sstevel@tonic-gate #define VERS_MSG "NFS4 server " 8267c478bd9Sstevel@tonic-gate #else 8277c478bd9Sstevel@tonic-gate #define VERS_MSG "NFS server " 8287c478bd9Sstevel@tonic-gate #endif 8297c478bd9Sstevel@tonic-gate 8307c478bd9Sstevel@tonic-gate #define READ_MSG \ 8317c478bd9Sstevel@tonic-gate VERS_MSG "%s returned 0 for read transfer size" 8327c478bd9Sstevel@tonic-gate #define WRITE_MSG \ 8337c478bd9Sstevel@tonic-gate VERS_MSG "%s returned 0 for write transfer size" 8347c478bd9Sstevel@tonic-gate #define SIZE_MSG \ 
8357c478bd9Sstevel@tonic-gate VERS_MSG "%s returned 0 for maximum file size" 8367c478bd9Sstevel@tonic-gate 8377c478bd9Sstevel@tonic-gate /* 8387c478bd9Sstevel@tonic-gate * Get the symbolic link text from the server for a given filehandle 8397c478bd9Sstevel@tonic-gate * of that symlink. 8407c478bd9Sstevel@tonic-gate * 8417c478bd9Sstevel@tonic-gate * (get symlink text) PUTFH READLINK 8427c478bd9Sstevel@tonic-gate */ 8437c478bd9Sstevel@tonic-gate static int 8447c478bd9Sstevel@tonic-gate getlinktext_otw(mntinfo4_t *mi, nfs_fh4 *fh, char **linktextp, cred_t *cr, 8457c478bd9Sstevel@tonic-gate int flags) 8467c478bd9Sstevel@tonic-gate { 8477c478bd9Sstevel@tonic-gate COMPOUND4args_clnt args; 8487c478bd9Sstevel@tonic-gate COMPOUND4res_clnt res; 8497c478bd9Sstevel@tonic-gate int doqueue; 8507c478bd9Sstevel@tonic-gate nfs_argop4 argop[2]; 8517c478bd9Sstevel@tonic-gate nfs_resop4 *resop; 8527c478bd9Sstevel@tonic-gate READLINK4res *lr_res; 8537c478bd9Sstevel@tonic-gate uint_t len; 8547c478bd9Sstevel@tonic-gate bool_t needrecov = FALSE; 8557c478bd9Sstevel@tonic-gate nfs4_recov_state_t recov_state; 8567c478bd9Sstevel@tonic-gate nfs4_sharedfh_t *sfh; 8577c478bd9Sstevel@tonic-gate nfs4_error_t e; 8587c478bd9Sstevel@tonic-gate int num_retry = nfs4_max_mount_retry; 8597c478bd9Sstevel@tonic-gate int recovery = !(flags & NFS4_GETFH_NEEDSOP); 8607c478bd9Sstevel@tonic-gate 8617c478bd9Sstevel@tonic-gate sfh = sfh4_get(fh, mi); 8627c478bd9Sstevel@tonic-gate recov_state.rs_flags = 0; 8637c478bd9Sstevel@tonic-gate recov_state.rs_num_retry_despite_err = 0; 8647c478bd9Sstevel@tonic-gate 8657c478bd9Sstevel@tonic-gate recov_retry: 8667c478bd9Sstevel@tonic-gate nfs4_error_zinit(&e); 8677c478bd9Sstevel@tonic-gate 8687c478bd9Sstevel@tonic-gate args.array_len = 2; 8697c478bd9Sstevel@tonic-gate args.array = argop; 8707c478bd9Sstevel@tonic-gate args.ctag = TAG_GET_SYMLINK; 8717c478bd9Sstevel@tonic-gate 8727c478bd9Sstevel@tonic-gate if (! 
recovery) { 8737c478bd9Sstevel@tonic-gate e.error = nfs4_start_op(mi, NULL, NULL, &recov_state); 8747c478bd9Sstevel@tonic-gate if (e.error) { 8757c478bd9Sstevel@tonic-gate sfh4_rele(&sfh); 8767c478bd9Sstevel@tonic-gate return (e.error); 8777c478bd9Sstevel@tonic-gate } 8787c478bd9Sstevel@tonic-gate } 8797c478bd9Sstevel@tonic-gate 8807c478bd9Sstevel@tonic-gate /* 0. putfh symlink fh */ 8817c478bd9Sstevel@tonic-gate argop[0].argop = OP_CPUTFH; 8827c478bd9Sstevel@tonic-gate argop[0].nfs_argop4_u.opcputfh.sfh = sfh; 8837c478bd9Sstevel@tonic-gate 8847c478bd9Sstevel@tonic-gate /* 1. readlink */ 8857c478bd9Sstevel@tonic-gate argop[1].argop = OP_READLINK; 8867c478bd9Sstevel@tonic-gate 8877c478bd9Sstevel@tonic-gate doqueue = 1; 8887c478bd9Sstevel@tonic-gate 8897c478bd9Sstevel@tonic-gate rfs4call(mi, &args, &res, cr, &doqueue, 0, &e); 8907c478bd9Sstevel@tonic-gate 8917c478bd9Sstevel@tonic-gate needrecov = nfs4_needs_recovery(&e, FALSE, mi->mi_vfsp); 8927c478bd9Sstevel@tonic-gate 8937c478bd9Sstevel@tonic-gate if (needrecov && !recovery && num_retry-- > 0) { 8947c478bd9Sstevel@tonic-gate 8957c478bd9Sstevel@tonic-gate NFS4_DEBUG(nfs4_client_recov_debug, (CE_NOTE, 8967c478bd9Sstevel@tonic-gate "getlinktext_otw: initiating recovery\n")); 8977c478bd9Sstevel@tonic-gate 8987c478bd9Sstevel@tonic-gate if (nfs4_start_recovery(&e, mi, NULL, NULL, NULL, NULL, 8997c478bd9Sstevel@tonic-gate OP_READLINK, NULL) == FALSE) { 9007c478bd9Sstevel@tonic-gate nfs4_end_op(mi, NULL, NULL, &recov_state, needrecov); 9017c478bd9Sstevel@tonic-gate if (!e.error) 9027c478bd9Sstevel@tonic-gate (void) xdr_free(xdr_COMPOUND4res_clnt, 9037c478bd9Sstevel@tonic-gate (caddr_t)&res); 9047c478bd9Sstevel@tonic-gate goto recov_retry; 9057c478bd9Sstevel@tonic-gate } 9067c478bd9Sstevel@tonic-gate } 9077c478bd9Sstevel@tonic-gate 9087c478bd9Sstevel@tonic-gate /* 9097c478bd9Sstevel@tonic-gate * If non-NFS4 pcol error and/or we weren't able to recover. 
9107c478bd9Sstevel@tonic-gate */ 9117c478bd9Sstevel@tonic-gate if (e.error != 0) { 9127c478bd9Sstevel@tonic-gate if (! recovery) 9137c478bd9Sstevel@tonic-gate nfs4_end_op(mi, NULL, NULL, &recov_state, needrecov); 9147c478bd9Sstevel@tonic-gate sfh4_rele(&sfh); 9157c478bd9Sstevel@tonic-gate return (e.error); 9167c478bd9Sstevel@tonic-gate } 9177c478bd9Sstevel@tonic-gate 9187c478bd9Sstevel@tonic-gate if (res.status) { 9197c478bd9Sstevel@tonic-gate e.error = geterrno4(res.status); 9207c478bd9Sstevel@tonic-gate (void) xdr_free(xdr_COMPOUND4res_clnt, (caddr_t)&res); 9217c478bd9Sstevel@tonic-gate if (! recovery) 9227c478bd9Sstevel@tonic-gate nfs4_end_op(mi, NULL, NULL, &recov_state, needrecov); 9237c478bd9Sstevel@tonic-gate sfh4_rele(&sfh); 9247c478bd9Sstevel@tonic-gate return (e.error); 9257c478bd9Sstevel@tonic-gate } 9267c478bd9Sstevel@tonic-gate 9277c478bd9Sstevel@tonic-gate /* res.status == NFS4_OK */ 9287c478bd9Sstevel@tonic-gate ASSERT(res.status == NFS4_OK); 9297c478bd9Sstevel@tonic-gate 9307c478bd9Sstevel@tonic-gate resop = &res.array[1]; /* readlink res */ 9317c478bd9Sstevel@tonic-gate lr_res = &resop->nfs_resop4_u.opreadlink; 9327c478bd9Sstevel@tonic-gate 9337c478bd9Sstevel@tonic-gate /* treat symlink name as data */ 9347c478bd9Sstevel@tonic-gate *linktextp = utf8_to_str(&lr_res->link, &len, NULL); 9357c478bd9Sstevel@tonic-gate 9367c478bd9Sstevel@tonic-gate if (! recovery) 9377c478bd9Sstevel@tonic-gate nfs4_end_op(mi, NULL, NULL, &recov_state, needrecov); 9387c478bd9Sstevel@tonic-gate sfh4_rele(&sfh); 9397c478bd9Sstevel@tonic-gate (void) xdr_free(xdr_COMPOUND4res_clnt, (caddr_t)&res); 9407c478bd9Sstevel@tonic-gate 9417c478bd9Sstevel@tonic-gate return (0); 9427c478bd9Sstevel@tonic-gate } 9437c478bd9Sstevel@tonic-gate 9447c478bd9Sstevel@tonic-gate /* 9457c478bd9Sstevel@tonic-gate * Skip over consecutive slashes and "/./" in a pathname. 
9467c478bd9Sstevel@tonic-gate */ 9477c478bd9Sstevel@tonic-gate void 9487c478bd9Sstevel@tonic-gate pathname_skipslashdot(struct pathname *pnp) 9497c478bd9Sstevel@tonic-gate { 9507c478bd9Sstevel@tonic-gate char *c1, *c2; 9517c478bd9Sstevel@tonic-gate 9527c478bd9Sstevel@tonic-gate while (pnp->pn_pathlen > 0 && *pnp->pn_path == '/') { 9537c478bd9Sstevel@tonic-gate 9547c478bd9Sstevel@tonic-gate c1 = pnp->pn_path + 1; 9557c478bd9Sstevel@tonic-gate c2 = pnp->pn_path + 2; 9567c478bd9Sstevel@tonic-gate 9577c478bd9Sstevel@tonic-gate if (*c1 == '.' && (*c2 == '/' || *c2 == '\0')) { 9587c478bd9Sstevel@tonic-gate pnp->pn_path = pnp->pn_path + 2; /* skip "/." */ 9597c478bd9Sstevel@tonic-gate pnp->pn_pathlen = pnp->pn_pathlen - 2; 9607c478bd9Sstevel@tonic-gate } else { 9617c478bd9Sstevel@tonic-gate pnp->pn_path++; 9627c478bd9Sstevel@tonic-gate pnp->pn_pathlen--; 9637c478bd9Sstevel@tonic-gate } 9647c478bd9Sstevel@tonic-gate } 9657c478bd9Sstevel@tonic-gate } 9667c478bd9Sstevel@tonic-gate 9677c478bd9Sstevel@tonic-gate /* 9687c478bd9Sstevel@tonic-gate * Resolve a symbolic link path. The symlink is in the nth component of 9697c478bd9Sstevel@tonic-gate * svp->sv_path and has an nfs4 file handle "fh". 9707c478bd9Sstevel@tonic-gate * Upon return, the sv_path will point to the new path that has the nth 9717c478bd9Sstevel@tonic-gate * component resolved to its symlink text. 
9727c478bd9Sstevel@tonic-gate */ 9737c478bd9Sstevel@tonic-gate int 9747c478bd9Sstevel@tonic-gate resolve_sympath(mntinfo4_t *mi, servinfo4_t *svp, int nth, nfs_fh4 *fh, 9757c478bd9Sstevel@tonic-gate cred_t *cr, int flags) 9767c478bd9Sstevel@tonic-gate { 9777c478bd9Sstevel@tonic-gate char *oldpath; 9787c478bd9Sstevel@tonic-gate char *symlink, *newpath; 9797c478bd9Sstevel@tonic-gate struct pathname oldpn, newpn; 9807c478bd9Sstevel@tonic-gate char component[MAXNAMELEN]; 9817c478bd9Sstevel@tonic-gate int i, addlen, error = 0; 9827c478bd9Sstevel@tonic-gate int oldpathlen; 9837c478bd9Sstevel@tonic-gate 9847c478bd9Sstevel@tonic-gate /* Get the symbolic link text over the wire. */ 9857c478bd9Sstevel@tonic-gate error = getlinktext_otw(mi, fh, &symlink, cr, flags); 9867c478bd9Sstevel@tonic-gate 9877c478bd9Sstevel@tonic-gate if (error || symlink == NULL || strlen(symlink) == 0) 9887c478bd9Sstevel@tonic-gate return (error); 9897c478bd9Sstevel@tonic-gate 9907c478bd9Sstevel@tonic-gate /* 9917c478bd9Sstevel@tonic-gate * Compose the new pathname. 9927c478bd9Sstevel@tonic-gate * Note: 9937c478bd9Sstevel@tonic-gate * - only the nth component is resolved for the pathname. 9947c478bd9Sstevel@tonic-gate * - pathname.pn_pathlen does not count the ending null byte. 
9957c478bd9Sstevel@tonic-gate */ 9967c478bd9Sstevel@tonic-gate (void) nfs_rw_enter_sig(&svp->sv_lock, RW_READER, 0); 9977c478bd9Sstevel@tonic-gate oldpath = svp->sv_path; 9987c478bd9Sstevel@tonic-gate oldpathlen = svp->sv_pathlen; 9997c478bd9Sstevel@tonic-gate if (error = pn_get(oldpath, UIO_SYSSPACE, &oldpn)) { 10007c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 10017c478bd9Sstevel@tonic-gate kmem_free(symlink, strlen(symlink) + 1); 10027c478bd9Sstevel@tonic-gate return (error); 10037c478bd9Sstevel@tonic-gate } 10047c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 10057c478bd9Sstevel@tonic-gate pn_alloc(&newpn); 10067c478bd9Sstevel@tonic-gate 10077c478bd9Sstevel@tonic-gate /* 10087c478bd9Sstevel@tonic-gate * Skip over previous components from the oldpath so that the 10097c478bd9Sstevel@tonic-gate * oldpn.pn_path will point to the symlink component. Skip 10107c478bd9Sstevel@tonic-gate * leading slashes and "/./" (no OP_LOOKUP on ".") so that 10117c478bd9Sstevel@tonic-gate * pn_getcompnent can get the component. 10127c478bd9Sstevel@tonic-gate */ 10137c478bd9Sstevel@tonic-gate for (i = 1; i < nth; i++) { 10147c478bd9Sstevel@tonic-gate pathname_skipslashdot(&oldpn); 10157c478bd9Sstevel@tonic-gate error = pn_getcomponent(&oldpn, component); 10167c478bd9Sstevel@tonic-gate if (error) 10177c478bd9Sstevel@tonic-gate goto out; 10187c478bd9Sstevel@tonic-gate } 10197c478bd9Sstevel@tonic-gate 10207c478bd9Sstevel@tonic-gate /* 10217c478bd9Sstevel@tonic-gate * Copy the old path upto the component right before the symlink 10227c478bd9Sstevel@tonic-gate * if the symlink is not an absolute path. 
10237c478bd9Sstevel@tonic-gate */ 10247c478bd9Sstevel@tonic-gate if (symlink[0] != '/') { 10257c478bd9Sstevel@tonic-gate addlen = oldpn.pn_path - oldpn.pn_buf; 10267c478bd9Sstevel@tonic-gate bcopy(oldpn.pn_buf, newpn.pn_path, addlen); 10277c478bd9Sstevel@tonic-gate newpn.pn_pathlen += addlen; 10287c478bd9Sstevel@tonic-gate newpn.pn_path += addlen; 10297c478bd9Sstevel@tonic-gate newpn.pn_buf[newpn.pn_pathlen] = '/'; 10307c478bd9Sstevel@tonic-gate newpn.pn_pathlen++; 10317c478bd9Sstevel@tonic-gate newpn.pn_path++; 10327c478bd9Sstevel@tonic-gate } 10337c478bd9Sstevel@tonic-gate 10347c478bd9Sstevel@tonic-gate /* copy the resolved symbolic link text */ 10357c478bd9Sstevel@tonic-gate addlen = strlen(symlink); 10367c478bd9Sstevel@tonic-gate if (newpn.pn_pathlen + addlen >= newpn.pn_bufsize) { 10377c478bd9Sstevel@tonic-gate error = ENAMETOOLONG; 10387c478bd9Sstevel@tonic-gate goto out; 10397c478bd9Sstevel@tonic-gate } 10407c478bd9Sstevel@tonic-gate bcopy(symlink, newpn.pn_path, addlen); 10417c478bd9Sstevel@tonic-gate newpn.pn_pathlen += addlen; 10427c478bd9Sstevel@tonic-gate newpn.pn_path += addlen; 10437c478bd9Sstevel@tonic-gate 10447c478bd9Sstevel@tonic-gate /* 10457c478bd9Sstevel@tonic-gate * Check if there is any remaining path after the symlink component. 10467c478bd9Sstevel@tonic-gate * First, skip the symlink component. 10477c478bd9Sstevel@tonic-gate */ 10487c478bd9Sstevel@tonic-gate pathname_skipslashdot(&oldpn); 10497c478bd9Sstevel@tonic-gate if (error = pn_getcomponent(&oldpn, component)) 10507c478bd9Sstevel@tonic-gate goto out; 10517c478bd9Sstevel@tonic-gate 10527c478bd9Sstevel@tonic-gate addlen = pn_pathleft(&oldpn); /* includes counting the slash */ 10537c478bd9Sstevel@tonic-gate 10547c478bd9Sstevel@tonic-gate /* 10557c478bd9Sstevel@tonic-gate * Copy the remaining path to the new pathname if there is any. 
10567c478bd9Sstevel@tonic-gate */ 10577c478bd9Sstevel@tonic-gate if (addlen > 0) { 10587c478bd9Sstevel@tonic-gate if (newpn.pn_pathlen + addlen >= newpn.pn_bufsize) { 10597c478bd9Sstevel@tonic-gate error = ENAMETOOLONG; 10607c478bd9Sstevel@tonic-gate goto out; 10617c478bd9Sstevel@tonic-gate } 10627c478bd9Sstevel@tonic-gate bcopy(oldpn.pn_path, newpn.pn_path, addlen); 10637c478bd9Sstevel@tonic-gate newpn.pn_pathlen += addlen; 10647c478bd9Sstevel@tonic-gate } 10657c478bd9Sstevel@tonic-gate newpn.pn_buf[newpn.pn_pathlen] = '\0'; 10667c478bd9Sstevel@tonic-gate 10677c478bd9Sstevel@tonic-gate /* get the newpath and store it in the servinfo4_t */ 10687c478bd9Sstevel@tonic-gate newpath = kmem_alloc(newpn.pn_pathlen + 1, KM_SLEEP); 10697c478bd9Sstevel@tonic-gate bcopy(newpn.pn_buf, newpath, newpn.pn_pathlen); 10707c478bd9Sstevel@tonic-gate newpath[newpn.pn_pathlen] = '\0'; 10717c478bd9Sstevel@tonic-gate 10727c478bd9Sstevel@tonic-gate (void) nfs_rw_enter_sig(&svp->sv_lock, RW_WRITER, 0); 10737c478bd9Sstevel@tonic-gate svp->sv_path = newpath; 10747c478bd9Sstevel@tonic-gate svp->sv_pathlen = strlen(newpath) + 1; 10757c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 10767c478bd9Sstevel@tonic-gate 10777c478bd9Sstevel@tonic-gate kmem_free(oldpath, oldpathlen); 10787c478bd9Sstevel@tonic-gate out: 10797c478bd9Sstevel@tonic-gate kmem_free(symlink, strlen(symlink) + 1); 10807c478bd9Sstevel@tonic-gate pn_free(&newpn); 10817c478bd9Sstevel@tonic-gate pn_free(&oldpn); 10827c478bd9Sstevel@tonic-gate 10837c478bd9Sstevel@tonic-gate return (error); 10847c478bd9Sstevel@tonic-gate } 10857c478bd9Sstevel@tonic-gate 10867c478bd9Sstevel@tonic-gate /* 10877c478bd9Sstevel@tonic-gate * Get the root filehandle for the given filesystem and server, and update 10887c478bd9Sstevel@tonic-gate * svp. 10897c478bd9Sstevel@tonic-gate * 10907c478bd9Sstevel@tonic-gate * If NFS4_GETFH_NEEDSOP is set, then use nfs4_start_fop and nfs4_end_fop 10917c478bd9Sstevel@tonic-gate * to coordinate with recovery. 
Otherwise, the caller is assumed to be 10927c478bd9Sstevel@tonic-gate * the recovery thread or have already done a start_fop. 10937c478bd9Sstevel@tonic-gate * 10947c478bd9Sstevel@tonic-gate * Errors are returned by the nfs4_error_t parameter. 10957c478bd9Sstevel@tonic-gate */ 10967c478bd9Sstevel@tonic-gate 10977c478bd9Sstevel@tonic-gate static void 10987c478bd9Sstevel@tonic-gate nfs4getfh_otw(struct mntinfo4 *mi, servinfo4_t *svp, vtype_t *vtp, 10997c478bd9Sstevel@tonic-gate int flags, cred_t *cr, nfs4_error_t *ep) 11007c478bd9Sstevel@tonic-gate { 11017c478bd9Sstevel@tonic-gate COMPOUND4args_clnt args; 11027c478bd9Sstevel@tonic-gate COMPOUND4res_clnt res; 11037c478bd9Sstevel@tonic-gate int doqueue = 1; 11047c478bd9Sstevel@tonic-gate nfs_argop4 *argop; 11057c478bd9Sstevel@tonic-gate nfs_resop4 *resop; 11067c478bd9Sstevel@tonic-gate nfs4_ga_res_t *garp; 11077c478bd9Sstevel@tonic-gate int num_argops; 11087c478bd9Sstevel@tonic-gate lookup4_param_t lookuparg; 11097c478bd9Sstevel@tonic-gate nfs_fh4 *tmpfhp; 11107c478bd9Sstevel@tonic-gate nfs_fh4 *resfhp; 11117c478bd9Sstevel@tonic-gate bool_t needrecov = FALSE; 11127c478bd9Sstevel@tonic-gate nfs4_recov_state_t recov_state; 11137c478bd9Sstevel@tonic-gate int llndx; 11147c478bd9Sstevel@tonic-gate int nthcomp; 11157c478bd9Sstevel@tonic-gate int recovery = !(flags & NFS4_GETFH_NEEDSOP); 11167c478bd9Sstevel@tonic-gate 11177c478bd9Sstevel@tonic-gate (void) nfs_rw_enter_sig(&svp->sv_lock, RW_READER, 0); 11187c478bd9Sstevel@tonic-gate ASSERT(svp->sv_path != NULL); 11197c478bd9Sstevel@tonic-gate if (svp->sv_path[0] == '\0') { 11207c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 11217c478bd9Sstevel@tonic-gate nfs4_error_init(ep, EINVAL); 11227c478bd9Sstevel@tonic-gate return; 11237c478bd9Sstevel@tonic-gate } 11247c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 11257c478bd9Sstevel@tonic-gate 11267c478bd9Sstevel@tonic-gate recov_state.rs_flags = 0; 11277c478bd9Sstevel@tonic-gate recov_state.rs_num_retry_despite_err = 0; 
11287c478bd9Sstevel@tonic-gate recov_retry: 11297c478bd9Sstevel@tonic-gate nfs4_error_zinit(ep); 11307c478bd9Sstevel@tonic-gate 11317c478bd9Sstevel@tonic-gate if (!recovery) { 11327c478bd9Sstevel@tonic-gate ep->error = nfs4_start_fop(mi, NULL, NULL, OH_MOUNT, 11337c478bd9Sstevel@tonic-gate &recov_state, NULL); 11347c478bd9Sstevel@tonic-gate 11357c478bd9Sstevel@tonic-gate /* 11367c478bd9Sstevel@tonic-gate * If recovery has been started and this request as 11377c478bd9Sstevel@tonic-gate * initiated by a mount, then we must wait for recovery 11387c478bd9Sstevel@tonic-gate * to finish before proceeding, otherwise, the error 11397c478bd9Sstevel@tonic-gate * cleanup would remove data structures needed by the 11407c478bd9Sstevel@tonic-gate * recovery thread. 11417c478bd9Sstevel@tonic-gate */ 11427c478bd9Sstevel@tonic-gate if (ep->error) { 11437c478bd9Sstevel@tonic-gate mutex_enter(&mi->mi_lock); 11447c478bd9Sstevel@tonic-gate if (mi->mi_flags & MI4_MOUNTING) { 11457c478bd9Sstevel@tonic-gate mi->mi_flags |= MI4_RECOV_FAIL; 11467c478bd9Sstevel@tonic-gate mi->mi_error = EIO; 11477c478bd9Sstevel@tonic-gate 11487c478bd9Sstevel@tonic-gate NFS4_DEBUG(nfs4_client_recov_debug, (CE_NOTE, 11497c478bd9Sstevel@tonic-gate "nfs4getfh_otw: waiting 4 recovery\n")); 11507c478bd9Sstevel@tonic-gate 11517c478bd9Sstevel@tonic-gate while (mi->mi_flags & MI4_RECOV_ACTIV) 11527c478bd9Sstevel@tonic-gate cv_wait(&mi->mi_failover_cv, 11537c478bd9Sstevel@tonic-gate &mi->mi_lock); 11547c478bd9Sstevel@tonic-gate } 11557c478bd9Sstevel@tonic-gate mutex_exit(&mi->mi_lock); 11567c478bd9Sstevel@tonic-gate return; 11577c478bd9Sstevel@tonic-gate } 11587c478bd9Sstevel@tonic-gate 11597c478bd9Sstevel@tonic-gate /* 11607c478bd9Sstevel@tonic-gate * If the client does not specify a specific flavor to use 11617c478bd9Sstevel@tonic-gate * and has not gotten a secinfo list from the server yet, 11627c478bd9Sstevel@tonic-gate * retrieve the secinfo list from the server and use a 11637c478bd9Sstevel@tonic-gate * flavor 
from the list to mount. 11647c478bd9Sstevel@tonic-gate * 11657c478bd9Sstevel@tonic-gate * If fail to get the secinfo list from the server, then 11667c478bd9Sstevel@tonic-gate * try the default flavor. 11677c478bd9Sstevel@tonic-gate */ 11687c478bd9Sstevel@tonic-gate if ((svp->sv_flags & SV4_TRYSECDEFAULT) && 11697c478bd9Sstevel@tonic-gate svp->sv_secinfo == NULL) { 11707c478bd9Sstevel@tonic-gate (void) nfs4_secinfo_path(mi, cr, FALSE); 11717c478bd9Sstevel@tonic-gate } 11727c478bd9Sstevel@tonic-gate } 11737c478bd9Sstevel@tonic-gate 11747c478bd9Sstevel@tonic-gate if (recovery) 11757c478bd9Sstevel@tonic-gate args.ctag = TAG_REMAP_MOUNT; 11767c478bd9Sstevel@tonic-gate else 11777c478bd9Sstevel@tonic-gate args.ctag = TAG_MOUNT; 11787c478bd9Sstevel@tonic-gate 11797c478bd9Sstevel@tonic-gate lookuparg.l4_getattrs = LKP4_ALL_ATTRIBUTES; 11807c478bd9Sstevel@tonic-gate lookuparg.argsp = &args; 11817c478bd9Sstevel@tonic-gate lookuparg.resp = &res; 11827c478bd9Sstevel@tonic-gate lookuparg.header_len = 2; /* Putrootfh, getfh */ 11837c478bd9Sstevel@tonic-gate lookuparg.trailer_len = 0; 11847c478bd9Sstevel@tonic-gate lookuparg.ga_bits = FATTR4_FSINFO_MASK; 11857c478bd9Sstevel@tonic-gate lookuparg.mi = mi; 11867c478bd9Sstevel@tonic-gate 11877c478bd9Sstevel@tonic-gate (void) nfs_rw_enter_sig(&svp->sv_lock, RW_READER, 0); 11887c478bd9Sstevel@tonic-gate ASSERT(svp->sv_path != NULL); 11897c478bd9Sstevel@tonic-gate llndx = nfs4lookup_setup(svp->sv_path, &lookuparg, 0); 11907c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 11917c478bd9Sstevel@tonic-gate 11927c478bd9Sstevel@tonic-gate argop = args.array; 11937c478bd9Sstevel@tonic-gate num_argops = args.array_len; 11947c478bd9Sstevel@tonic-gate 11957c478bd9Sstevel@tonic-gate /* choose public or root filehandle */ 11967c478bd9Sstevel@tonic-gate if (flags & NFS4_GETFH_PUBLIC) 11977c478bd9Sstevel@tonic-gate argop[0].argop = OP_PUTPUBFH; 11987c478bd9Sstevel@tonic-gate else 11997c478bd9Sstevel@tonic-gate argop[0].argop = OP_PUTROOTFH; 
12007c478bd9Sstevel@tonic-gate 12017c478bd9Sstevel@tonic-gate /* get fh */ 12027c478bd9Sstevel@tonic-gate argop[1].argop = OP_GETFH; 12037c478bd9Sstevel@tonic-gate 12047c478bd9Sstevel@tonic-gate NFS4_DEBUG(nfs4_client_call_debug, (CE_NOTE, 12057c478bd9Sstevel@tonic-gate "nfs4getfh_otw: %s call, mi 0x%p", 12067c478bd9Sstevel@tonic-gate needrecov ? "recov" : "first", (void *)mi)); 12077c478bd9Sstevel@tonic-gate 12087c478bd9Sstevel@tonic-gate rfs4call(mi, &args, &res, cr, &doqueue, RFSCALL_SOFT, ep); 12097c478bd9Sstevel@tonic-gate 12107c478bd9Sstevel@tonic-gate needrecov = nfs4_needs_recovery(ep, FALSE, mi->mi_vfsp); 12117c478bd9Sstevel@tonic-gate 12127c478bd9Sstevel@tonic-gate if (needrecov) { 12137c478bd9Sstevel@tonic-gate bool_t abort; 12147c478bd9Sstevel@tonic-gate 12157c478bd9Sstevel@tonic-gate if (recovery) { 12167c478bd9Sstevel@tonic-gate nfs4args_lookup_free(argop, num_argops); 12177c478bd9Sstevel@tonic-gate kmem_free(argop, 12187c478bd9Sstevel@tonic-gate lookuparg.arglen * sizeof (nfs_argop4)); 12197c478bd9Sstevel@tonic-gate if (!ep->error) 12207c478bd9Sstevel@tonic-gate (void) xdr_free(xdr_COMPOUND4res_clnt, 12217c478bd9Sstevel@tonic-gate (caddr_t)&res); 12227c478bd9Sstevel@tonic-gate return; 12237c478bd9Sstevel@tonic-gate } 12247c478bd9Sstevel@tonic-gate 12257c478bd9Sstevel@tonic-gate NFS4_DEBUG(nfs4_client_recov_debug, 12267c478bd9Sstevel@tonic-gate (CE_NOTE, "nfs4getfh_otw: initiating recovery\n")); 12277c478bd9Sstevel@tonic-gate 12287c478bd9Sstevel@tonic-gate abort = nfs4_start_recovery(ep, mi, NULL, 12297c478bd9Sstevel@tonic-gate NULL, NULL, NULL, OP_GETFH, NULL); 12307c478bd9Sstevel@tonic-gate if (!ep->error) { 12317c478bd9Sstevel@tonic-gate ep->error = geterrno4(res.status); 12327c478bd9Sstevel@tonic-gate (void) xdr_free(xdr_COMPOUND4res_clnt, (caddr_t)&res); 12337c478bd9Sstevel@tonic-gate } 12347c478bd9Sstevel@tonic-gate nfs4args_lookup_free(argop, num_argops); 12357c478bd9Sstevel@tonic-gate kmem_free(argop, lookuparg.arglen * sizeof (nfs_argop4)); 
12367c478bd9Sstevel@tonic-gate nfs4_end_fop(mi, NULL, NULL, OH_MOUNT, &recov_state, needrecov); 12377c478bd9Sstevel@tonic-gate /* have another go? */ 12387c478bd9Sstevel@tonic-gate if (abort == FALSE) 12397c478bd9Sstevel@tonic-gate goto recov_retry; 12407c478bd9Sstevel@tonic-gate return; 12417c478bd9Sstevel@tonic-gate } 12427c478bd9Sstevel@tonic-gate 12437c478bd9Sstevel@tonic-gate /* 12447c478bd9Sstevel@tonic-gate * No recovery, but check if error is set. 12457c478bd9Sstevel@tonic-gate */ 12467c478bd9Sstevel@tonic-gate if (ep->error) { 12477c478bd9Sstevel@tonic-gate nfs4args_lookup_free(argop, num_argops); 12487c478bd9Sstevel@tonic-gate kmem_free(argop, lookuparg.arglen * sizeof (nfs_argop4)); 12497c478bd9Sstevel@tonic-gate if (!recovery) 12507c478bd9Sstevel@tonic-gate nfs4_end_fop(mi, NULL, NULL, OH_MOUNT, &recov_state, 12517c478bd9Sstevel@tonic-gate needrecov); 12527c478bd9Sstevel@tonic-gate return; 12537c478bd9Sstevel@tonic-gate } 12547c478bd9Sstevel@tonic-gate 12557c478bd9Sstevel@tonic-gate is_link_err: 12567c478bd9Sstevel@tonic-gate 12577c478bd9Sstevel@tonic-gate /* for non-recovery errors */ 12587c478bd9Sstevel@tonic-gate if (res.status && res.status != NFS4ERR_SYMLINK) { 12597c478bd9Sstevel@tonic-gate if (!recovery) { 12607c478bd9Sstevel@tonic-gate nfs4_end_fop(mi, NULL, NULL, OH_MOUNT, &recov_state, 12617c478bd9Sstevel@tonic-gate needrecov); 12627c478bd9Sstevel@tonic-gate } 12637c478bd9Sstevel@tonic-gate nfs4args_lookup_free(argop, num_argops); 12647c478bd9Sstevel@tonic-gate kmem_free(argop, lookuparg.arglen * sizeof (nfs_argop4)); 12657c478bd9Sstevel@tonic-gate (void) xdr_free(xdr_COMPOUND4res_clnt, (caddr_t)&res); 12667c478bd9Sstevel@tonic-gate return; 12677c478bd9Sstevel@tonic-gate } 12687c478bd9Sstevel@tonic-gate 12697c478bd9Sstevel@tonic-gate /* 12707c478bd9Sstevel@tonic-gate * If any intermediate component in the path is a symbolic link, 12717c478bd9Sstevel@tonic-gate * resolve the symlink, then try mount again using the new path. 
12727c478bd9Sstevel@tonic-gate */ 12737c478bd9Sstevel@tonic-gate if (res.status == NFS4ERR_SYMLINK) { 12747c478bd9Sstevel@tonic-gate int where; 12757c478bd9Sstevel@tonic-gate 12767c478bd9Sstevel@tonic-gate /* 12777c478bd9Sstevel@tonic-gate * This must be from OP_LOOKUP failure. The (cfh) for this 12787c478bd9Sstevel@tonic-gate * OP_LOOKUP is a symlink node. Found out where the 12797c478bd9Sstevel@tonic-gate * OP_GETFH is for the (cfh) that is a symlink node. 12807c478bd9Sstevel@tonic-gate * 12817c478bd9Sstevel@tonic-gate * Example: 12827c478bd9Sstevel@tonic-gate * (mount) PUTROOTFH, GETFH, LOOKUP comp1, GETFH, GETATTR, 12837c478bd9Sstevel@tonic-gate * LOOKUP comp2, GETFH, GETATTR, LOOKUP comp3, GETFH, GETATTR 12847c478bd9Sstevel@tonic-gate * 12857c478bd9Sstevel@tonic-gate * LOOKUP comp3 fails with SYMLINK because comp2 is a symlink. 12867c478bd9Sstevel@tonic-gate * In this case, where = 7, nthcomp = 2. 12877c478bd9Sstevel@tonic-gate */ 12887c478bd9Sstevel@tonic-gate where = res.array_len - 2; 12897c478bd9Sstevel@tonic-gate ASSERT(where > 0); 12907c478bd9Sstevel@tonic-gate 12917c478bd9Sstevel@tonic-gate resop = &res.array[where - 1]; 12927c478bd9Sstevel@tonic-gate ASSERT(resop->resop == OP_GETFH); 12937c478bd9Sstevel@tonic-gate tmpfhp = &resop->nfs_resop4_u.opgetfh.object; 12947c478bd9Sstevel@tonic-gate nthcomp = res.array_len/3 - 1; 12957c478bd9Sstevel@tonic-gate 12967c478bd9Sstevel@tonic-gate /* 12977c478bd9Sstevel@tonic-gate * Need to call nfs4_end_op before resolve_sympath to avoid 12987c478bd9Sstevel@tonic-gate * potential nfs4_start_op deadlock. 
12997c478bd9Sstevel@tonic-gate */ 13007c478bd9Sstevel@tonic-gate if (!recovery) 13017c478bd9Sstevel@tonic-gate nfs4_end_fop(mi, NULL, NULL, OH_MOUNT, &recov_state, 13027c478bd9Sstevel@tonic-gate needrecov); 13037c478bd9Sstevel@tonic-gate 13047c478bd9Sstevel@tonic-gate ep->error = resolve_sympath(mi, svp, nthcomp, tmpfhp, cr, 13057c478bd9Sstevel@tonic-gate flags); 13067c478bd9Sstevel@tonic-gate 13077c478bd9Sstevel@tonic-gate nfs4args_lookup_free(argop, num_argops); 13087c478bd9Sstevel@tonic-gate kmem_free(argop, lookuparg.arglen * sizeof (nfs_argop4)); 13097c478bd9Sstevel@tonic-gate (void) xdr_free(xdr_COMPOUND4res_clnt, (caddr_t)&res); 13107c478bd9Sstevel@tonic-gate 13117c478bd9Sstevel@tonic-gate if (ep->error) 13127c478bd9Sstevel@tonic-gate return; 13137c478bd9Sstevel@tonic-gate 13147c478bd9Sstevel@tonic-gate goto recov_retry; 13157c478bd9Sstevel@tonic-gate } 13167c478bd9Sstevel@tonic-gate 13177c478bd9Sstevel@tonic-gate /* getfh */ 13187c478bd9Sstevel@tonic-gate resop = &res.array[res.array_len - 2]; 13197c478bd9Sstevel@tonic-gate ASSERT(resop->resop == OP_GETFH); 13207c478bd9Sstevel@tonic-gate resfhp = &resop->nfs_resop4_u.opgetfh.object; 13217c478bd9Sstevel@tonic-gate 13227c478bd9Sstevel@tonic-gate /* getattr fsinfo res */ 13237c478bd9Sstevel@tonic-gate resop++; 13247c478bd9Sstevel@tonic-gate garp = &resop->nfs_resop4_u.opgetattr.ga_res; 13257c478bd9Sstevel@tonic-gate 13267c478bd9Sstevel@tonic-gate *vtp = garp->n4g_va.va_type; 13277c478bd9Sstevel@tonic-gate 13287c478bd9Sstevel@tonic-gate mi->mi_fh_expire_type = garp->n4g_ext_res->n4g_fet; 13297c478bd9Sstevel@tonic-gate 13307c478bd9Sstevel@tonic-gate mutex_enter(&mi->mi_lock); 13317c478bd9Sstevel@tonic-gate if (garp->n4g_ext_res->n4g_pc4.pc4_link_support) 13327c478bd9Sstevel@tonic-gate mi->mi_flags |= MI4_LINK; 13337c478bd9Sstevel@tonic-gate if (garp->n4g_ext_res->n4g_pc4.pc4_symlink_support) 13347c478bd9Sstevel@tonic-gate mi->mi_flags |= MI4_SYMLINK; 13357c478bd9Sstevel@tonic-gate if 
(garp->n4g_ext_res->n4g_suppattrs & FATTR4_ACL_MASK) 13367c478bd9Sstevel@tonic-gate mi->mi_flags |= MI4_ACL; 13377c478bd9Sstevel@tonic-gate mutex_exit(&mi->mi_lock); 13387c478bd9Sstevel@tonic-gate 13397c478bd9Sstevel@tonic-gate if (garp->n4g_ext_res->n4g_maxread == 0) 13407c478bd9Sstevel@tonic-gate mi->mi_tsize = 13417c478bd9Sstevel@tonic-gate MIN(MAXBSIZE, mi->mi_tsize); 13427c478bd9Sstevel@tonic-gate else 13437c478bd9Sstevel@tonic-gate mi->mi_tsize = 13447c478bd9Sstevel@tonic-gate MIN(garp->n4g_ext_res->n4g_maxread, 13457c478bd9Sstevel@tonic-gate mi->mi_tsize); 13467c478bd9Sstevel@tonic-gate 13477c478bd9Sstevel@tonic-gate if (garp->n4g_ext_res->n4g_maxwrite == 0) 13487c478bd9Sstevel@tonic-gate mi->mi_stsize = 13497c478bd9Sstevel@tonic-gate MIN(MAXBSIZE, mi->mi_stsize); 13507c478bd9Sstevel@tonic-gate else 13517c478bd9Sstevel@tonic-gate mi->mi_stsize = 13527c478bd9Sstevel@tonic-gate MIN(garp->n4g_ext_res->n4g_maxwrite, 13537c478bd9Sstevel@tonic-gate mi->mi_stsize); 13547c478bd9Sstevel@tonic-gate 13557c478bd9Sstevel@tonic-gate if (garp->n4g_ext_res->n4g_maxfilesize != 0) 13567c478bd9Sstevel@tonic-gate mi->mi_maxfilesize = 13577c478bd9Sstevel@tonic-gate MIN(garp->n4g_ext_res->n4g_maxfilesize, 13587c478bd9Sstevel@tonic-gate mi->mi_maxfilesize); 13597c478bd9Sstevel@tonic-gate 13607c478bd9Sstevel@tonic-gate /* 13617c478bd9Sstevel@tonic-gate * If the final component is a a symbolic link, resolve the symlink, 13627c478bd9Sstevel@tonic-gate * then try mount again using the new path. 13637c478bd9Sstevel@tonic-gate * 13647c478bd9Sstevel@tonic-gate * Assume no symbolic link for root filesysm "/". 
13657c478bd9Sstevel@tonic-gate */ 13667c478bd9Sstevel@tonic-gate if (*vtp == VLNK) { 13677c478bd9Sstevel@tonic-gate /* 13687c478bd9Sstevel@tonic-gate * nthcomp is the total result length minus 13697c478bd9Sstevel@tonic-gate * the 1st 2 OPs (PUTROOTFH, GETFH), 13707c478bd9Sstevel@tonic-gate * then divided by 3 (LOOKUP,GETFH,GETATTR) 13717c478bd9Sstevel@tonic-gate * 13727c478bd9Sstevel@tonic-gate * e.g. PUTROOTFH GETFH LOOKUP 1st-comp GETFH GETATTR 13737c478bd9Sstevel@tonic-gate * LOOKUP 2nd-comp GETFH GETATTR 13747c478bd9Sstevel@tonic-gate * 13757c478bd9Sstevel@tonic-gate * (8 - 2)/3 = 2 13767c478bd9Sstevel@tonic-gate */ 13777c478bd9Sstevel@tonic-gate nthcomp = (res.array_len - 2)/3; 13787c478bd9Sstevel@tonic-gate 13797c478bd9Sstevel@tonic-gate /* 13807c478bd9Sstevel@tonic-gate * Need to call nfs4_end_op before resolve_sympath to avoid 13817c478bd9Sstevel@tonic-gate * potential nfs4_start_op deadlock. See RFE 4777612. 13827c478bd9Sstevel@tonic-gate */ 13837c478bd9Sstevel@tonic-gate if (!recovery) 13847c478bd9Sstevel@tonic-gate nfs4_end_fop(mi, NULL, NULL, OH_MOUNT, &recov_state, 13857c478bd9Sstevel@tonic-gate needrecov); 13867c478bd9Sstevel@tonic-gate 13877c478bd9Sstevel@tonic-gate ep->error = resolve_sympath(mi, svp, nthcomp, resfhp, cr, 13887c478bd9Sstevel@tonic-gate flags); 13897c478bd9Sstevel@tonic-gate 13907c478bd9Sstevel@tonic-gate nfs4args_lookup_free(argop, num_argops); 13917c478bd9Sstevel@tonic-gate kmem_free(argop, lookuparg.arglen * sizeof (nfs_argop4)); 13927c478bd9Sstevel@tonic-gate (void) xdr_free(xdr_COMPOUND4res_clnt, (caddr_t)&res); 13937c478bd9Sstevel@tonic-gate 13947c478bd9Sstevel@tonic-gate if (ep->error) 13957c478bd9Sstevel@tonic-gate return; 13967c478bd9Sstevel@tonic-gate 13977c478bd9Sstevel@tonic-gate goto recov_retry; 13987c478bd9Sstevel@tonic-gate } 13997c478bd9Sstevel@tonic-gate 14007c478bd9Sstevel@tonic-gate /* 14017c478bd9Sstevel@tonic-gate * We need to figure out where in the compound the getfh 14027c478bd9Sstevel@tonic-gate * for the 
parent directory is. If the object to be mounted is 14037c478bd9Sstevel@tonic-gate * the root, then there is no lookup at all: 14047c478bd9Sstevel@tonic-gate * PUTROOTFH, GETFH. 14057c478bd9Sstevel@tonic-gate * If the object to be mounted is in the root, then the compound is: 14067c478bd9Sstevel@tonic-gate * PUTROOTFH, GETFH, LOOKUP, GETFH, GETATTR. 14077c478bd9Sstevel@tonic-gate * In either of these cases, the index of the GETFH is 1. 14087c478bd9Sstevel@tonic-gate * If it is not at the root, then it's something like: 14097c478bd9Sstevel@tonic-gate * PUTROOTFH, GETFH, LOOKUP, GETFH, GETATTR, 14107c478bd9Sstevel@tonic-gate * LOOKUP, GETFH, GETATTR 14117c478bd9Sstevel@tonic-gate * In this case, the index is llndx (last lookup index) - 2. 14127c478bd9Sstevel@tonic-gate */ 14137c478bd9Sstevel@tonic-gate if (llndx == -1 || llndx == 2) 14147c478bd9Sstevel@tonic-gate resop = &res.array[1]; 14157c478bd9Sstevel@tonic-gate else { 14167c478bd9Sstevel@tonic-gate ASSERT(llndx > 2); 14177c478bd9Sstevel@tonic-gate resop = &res.array[llndx-2]; 14187c478bd9Sstevel@tonic-gate } 14197c478bd9Sstevel@tonic-gate 14207c478bd9Sstevel@tonic-gate ASSERT(resop->resop == OP_GETFH); 14217c478bd9Sstevel@tonic-gate tmpfhp = &resop->nfs_resop4_u.opgetfh.object; 14227c478bd9Sstevel@tonic-gate 14237c478bd9Sstevel@tonic-gate /* save the filehandles for the replica */ 14247c478bd9Sstevel@tonic-gate (void) nfs_rw_enter_sig(&svp->sv_lock, RW_WRITER, 0); 14257c478bd9Sstevel@tonic-gate ASSERT(tmpfhp->nfs_fh4_len <= NFS4_FHSIZE); 14267c478bd9Sstevel@tonic-gate svp->sv_pfhandle.fh_len = tmpfhp->nfs_fh4_len; 14277c478bd9Sstevel@tonic-gate bcopy(tmpfhp->nfs_fh4_val, svp->sv_pfhandle.fh_buf, 14287c478bd9Sstevel@tonic-gate tmpfhp->nfs_fh4_len); 14297c478bd9Sstevel@tonic-gate ASSERT(resfhp->nfs_fh4_len <= NFS4_FHSIZE); 14307c478bd9Sstevel@tonic-gate svp->sv_fhandle.fh_len = resfhp->nfs_fh4_len; 14317c478bd9Sstevel@tonic-gate bcopy(resfhp->nfs_fh4_val, svp->sv_fhandle.fh_buf, resfhp->nfs_fh4_len); 
14327c478bd9Sstevel@tonic-gate 14337c478bd9Sstevel@tonic-gate /* initialize fsid and supp_attrs for server fs */ 14347c478bd9Sstevel@tonic-gate svp->sv_fsid = garp->n4g_fsid; 14357c478bd9Sstevel@tonic-gate svp->sv_supp_attrs = 14367c478bd9Sstevel@tonic-gate garp->n4g_ext_res->n4g_suppattrs | FATTR4_MANDATTR_MASK; 14377c478bd9Sstevel@tonic-gate 14387c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 14397c478bd9Sstevel@tonic-gate 14407c478bd9Sstevel@tonic-gate nfs4args_lookup_free(argop, num_argops); 14417c478bd9Sstevel@tonic-gate kmem_free(argop, lookuparg.arglen * sizeof (nfs_argop4)); 14427c478bd9Sstevel@tonic-gate (void) xdr_free(xdr_COMPOUND4res_clnt, (caddr_t)&res); 14437c478bd9Sstevel@tonic-gate if (!recovery) 14447c478bd9Sstevel@tonic-gate nfs4_end_fop(mi, NULL, NULL, OH_MOUNT, &recov_state, needrecov); 14457c478bd9Sstevel@tonic-gate } 14467c478bd9Sstevel@tonic-gate 14477c478bd9Sstevel@tonic-gate static ushort_t nfs4_max_threads = 8; /* max number of active async threads */ 14487c478bd9Sstevel@tonic-gate static uint_t nfs4_bsize = 32 * 1024; /* client `block' size */ 14497c478bd9Sstevel@tonic-gate static uint_t nfs4_async_clusters = 1; /* # of reqs from each async queue */ 14507c478bd9Sstevel@tonic-gate static uint_t nfs4_cots_timeo = NFS_COTS_TIMEO; 14517c478bd9Sstevel@tonic-gate 14527c478bd9Sstevel@tonic-gate /* 14537c478bd9Sstevel@tonic-gate * Remap the root filehandle for the given filesystem. 14547c478bd9Sstevel@tonic-gate * 14557c478bd9Sstevel@tonic-gate * results returned via the nfs4_error_t parameter. 
14567c478bd9Sstevel@tonic-gate */ 14577c478bd9Sstevel@tonic-gate void 14587c478bd9Sstevel@tonic-gate nfs4_remap_root(mntinfo4_t *mi, nfs4_error_t *ep, int flags) 14597c478bd9Sstevel@tonic-gate { 14607c478bd9Sstevel@tonic-gate struct servinfo4 *svp; 14617c478bd9Sstevel@tonic-gate vtype_t vtype; 14627c478bd9Sstevel@tonic-gate nfs_fh4 rootfh; 14637c478bd9Sstevel@tonic-gate int getfh_flags; 14647c478bd9Sstevel@tonic-gate char *orig_sv_path; 14657c478bd9Sstevel@tonic-gate int orig_sv_pathlen, num_retry; 14667c478bd9Sstevel@tonic-gate 14677c478bd9Sstevel@tonic-gate mutex_enter(&mi->mi_lock); 14687c478bd9Sstevel@tonic-gate svp = mi->mi_curr_serv; 14697c478bd9Sstevel@tonic-gate getfh_flags = 14707c478bd9Sstevel@tonic-gate (flags & NFS4_REMAP_NEEDSOP) ? NFS4_GETFH_NEEDSOP : 0; 14717c478bd9Sstevel@tonic-gate getfh_flags |= 14727c478bd9Sstevel@tonic-gate (mi->mi_flags & MI4_PUBLIC) ? NFS4_GETFH_PUBLIC : 0; 14737c478bd9Sstevel@tonic-gate mutex_exit(&mi->mi_lock); 14747c478bd9Sstevel@tonic-gate 14757c478bd9Sstevel@tonic-gate /* 14767c478bd9Sstevel@tonic-gate * Just in case server path being mounted contains 14777c478bd9Sstevel@tonic-gate * symlinks and fails w/STALE, save the initial sv_path 14787c478bd9Sstevel@tonic-gate * so we can redrive the initial mount compound with the 14797c478bd9Sstevel@tonic-gate * initial sv_path -- not a symlink-expanded version. 14807c478bd9Sstevel@tonic-gate * 14817c478bd9Sstevel@tonic-gate * This could only happen if a symlink was expanded 14827c478bd9Sstevel@tonic-gate * and the expanded mount compound failed stale. Because 14837c478bd9Sstevel@tonic-gate * it could be the case that the symlink was removed at 14847c478bd9Sstevel@tonic-gate * the server (and replaced with another symlink/dir, 14857c478bd9Sstevel@tonic-gate * we need to use the initial sv_path when attempting 14867c478bd9Sstevel@tonic-gate * to re-lookup everything and recover. 
14877c478bd9Sstevel@tonic-gate */ 14887c478bd9Sstevel@tonic-gate (void) nfs_rw_enter_sig(&svp->sv_lock, RW_READER, 0); 14897c478bd9Sstevel@tonic-gate orig_sv_pathlen = svp->sv_pathlen; 14907c478bd9Sstevel@tonic-gate orig_sv_path = kmem_alloc(orig_sv_pathlen, KM_SLEEP); 14917c478bd9Sstevel@tonic-gate bcopy(svp->sv_path, orig_sv_path, orig_sv_pathlen); 14927c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 14937c478bd9Sstevel@tonic-gate 14947c478bd9Sstevel@tonic-gate num_retry = nfs4_max_mount_retry; 14957c478bd9Sstevel@tonic-gate 14967c478bd9Sstevel@tonic-gate do { 14977c478bd9Sstevel@tonic-gate /* 14987c478bd9Sstevel@tonic-gate * Get the root fh from the server. Retry nfs4_max_mount_retry 14997c478bd9Sstevel@tonic-gate * (2) times if it fails with STALE since the recovery 15007c478bd9Sstevel@tonic-gate * infrastructure doesn't do STALE recovery for components 15017c478bd9Sstevel@tonic-gate * of the server path to the object being mounted. 15027c478bd9Sstevel@tonic-gate */ 15037c478bd9Sstevel@tonic-gate nfs4getfh_otw(mi, svp, &vtype, getfh_flags, CRED(), ep); 15047c478bd9Sstevel@tonic-gate 15057c478bd9Sstevel@tonic-gate if (ep->error == 0 && ep->stat == NFS4_OK) 15067c478bd9Sstevel@tonic-gate break; 15077c478bd9Sstevel@tonic-gate 15087c478bd9Sstevel@tonic-gate /* 15097c478bd9Sstevel@tonic-gate * For some reason, the mount compound failed. Before 15107c478bd9Sstevel@tonic-gate * retrying, we need to restore the original sv_path 15117c478bd9Sstevel@tonic-gate * because it might have contained symlinks that were 15127c478bd9Sstevel@tonic-gate * expanded by nfsgetfh_otw before the failure occurred. 15137c478bd9Sstevel@tonic-gate * replace current sv_path with orig sv_path -- just in case 15147c478bd9Sstevel@tonic-gate * it changed due to embedded symlinks. 
15157c478bd9Sstevel@tonic-gate */ 15167c478bd9Sstevel@tonic-gate (void) nfs_rw_enter_sig(&svp->sv_lock, RW_READER, 0); 15177c478bd9Sstevel@tonic-gate if (orig_sv_pathlen != svp->sv_pathlen) { 15187c478bd9Sstevel@tonic-gate kmem_free(svp->sv_path, svp->sv_pathlen); 15197c478bd9Sstevel@tonic-gate svp->sv_path = kmem_alloc(orig_sv_pathlen, KM_SLEEP); 15207c478bd9Sstevel@tonic-gate svp->sv_pathlen = orig_sv_pathlen; 15217c478bd9Sstevel@tonic-gate 15227c478bd9Sstevel@tonic-gate } 15237c478bd9Sstevel@tonic-gate bcopy(orig_sv_path, svp->sv_path, orig_sv_pathlen); 15247c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 15257c478bd9Sstevel@tonic-gate 15267c478bd9Sstevel@tonic-gate } while (num_retry-- > 0); 15277c478bd9Sstevel@tonic-gate 15287c478bd9Sstevel@tonic-gate kmem_free(orig_sv_path, orig_sv_pathlen); 15297c478bd9Sstevel@tonic-gate 15307c478bd9Sstevel@tonic-gate if (ep->error != 0 || ep->stat != 0) { 15317c478bd9Sstevel@tonic-gate return; 15327c478bd9Sstevel@tonic-gate } 15337c478bd9Sstevel@tonic-gate 15347c478bd9Sstevel@tonic-gate if (vtype != VNON && vtype != mi->mi_type) { 15357c478bd9Sstevel@tonic-gate /* shouldn't happen */ 15367c478bd9Sstevel@tonic-gate zcmn_err(mi->mi_zone->zone_id, CE_WARN, 15377c478bd9Sstevel@tonic-gate "nfs4_remap_root: server root vnode type (%d) doesn't " 15387c478bd9Sstevel@tonic-gate "match mount info (%d)", vtype, mi->mi_type); 15397c478bd9Sstevel@tonic-gate } 15407c478bd9Sstevel@tonic-gate 15417c478bd9Sstevel@tonic-gate (void) nfs_rw_enter_sig(&svp->sv_lock, RW_READER, 0); 15427c478bd9Sstevel@tonic-gate rootfh.nfs_fh4_val = svp->sv_fhandle.fh_buf; 15437c478bd9Sstevel@tonic-gate rootfh.nfs_fh4_len = svp->sv_fhandle.fh_len; 15447c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 15457c478bd9Sstevel@tonic-gate sfh4_update(mi->mi_rootfh, &rootfh); 15467c478bd9Sstevel@tonic-gate 15477c478bd9Sstevel@tonic-gate #ifdef DEBUG 15487c478bd9Sstevel@tonic-gate /* 15497c478bd9Sstevel@tonic-gate * There shouldn't have been any other recovery 
activity on the 15507c478bd9Sstevel@tonic-gate * filesystem. 15517c478bd9Sstevel@tonic-gate */ 15527c478bd9Sstevel@tonic-gate mutex_enter(&mi->mi_lock); 15537c478bd9Sstevel@tonic-gate ASSERT(mi->mi_curr_serv == svp); 15547c478bd9Sstevel@tonic-gate mutex_exit(&mi->mi_lock); 15557c478bd9Sstevel@tonic-gate #endif 15567c478bd9Sstevel@tonic-gate } 15577c478bd9Sstevel@tonic-gate 15587c478bd9Sstevel@tonic-gate static int 15597c478bd9Sstevel@tonic-gate nfs4rootvp(vnode_t **rtvpp, vfs_t *vfsp, struct servinfo4 *svp_head, 15607c478bd9Sstevel@tonic-gate int flags, cred_t *cr, zone_t *zone) 15617c478bd9Sstevel@tonic-gate { 15627c478bd9Sstevel@tonic-gate vnode_t *rtvp = NULL; 15637c478bd9Sstevel@tonic-gate mntinfo4_t *mi; 15647c478bd9Sstevel@tonic-gate dev_t nfs_dev; 15657c478bd9Sstevel@tonic-gate int error = 0; 15667c478bd9Sstevel@tonic-gate rnode4_t *rp; 15677c478bd9Sstevel@tonic-gate int i; 15687c478bd9Sstevel@tonic-gate struct vattr va; 15697c478bd9Sstevel@tonic-gate vtype_t vtype = VNON; 15707c478bd9Sstevel@tonic-gate vtype_t tmp_vtype = VNON; 15717c478bd9Sstevel@tonic-gate struct servinfo4 *firstsvp = NULL, *svp = svp_head; 15727c478bd9Sstevel@tonic-gate nfs4_oo_hash_bucket_t *bucketp; 15737c478bd9Sstevel@tonic-gate nfs_fh4 fh; 15747c478bd9Sstevel@tonic-gate char *droptext = ""; 15757c478bd9Sstevel@tonic-gate struct nfs_stats *nfsstatsp; 15767c478bd9Sstevel@tonic-gate nfs4_fname_t *mfname; 15777c478bd9Sstevel@tonic-gate nfs4_error_t e; 15787c478bd9Sstevel@tonic-gate char *orig_sv_path; 15797c478bd9Sstevel@tonic-gate int orig_sv_pathlen, num_retry; 15807c478bd9Sstevel@tonic-gate cred_t *lcr = NULL, *tcr = cr; 15817c478bd9Sstevel@tonic-gate 1582*108322fbScarlsonj nfsstatsp = zone_getspecific(nfsstat_zone_key, nfs_zone()); 15837c478bd9Sstevel@tonic-gate ASSERT(nfsstatsp != NULL); 15847c478bd9Sstevel@tonic-gate 1585*108322fbScarlsonj ASSERT(nfs_zone() == zone); 15867c478bd9Sstevel@tonic-gate ASSERT(crgetref(cr)); 15877c478bd9Sstevel@tonic-gate 15887c478bd9Sstevel@tonic-gate 
/* 15897c478bd9Sstevel@tonic-gate * Create a mount record and link it to the vfs struct. 15907c478bd9Sstevel@tonic-gate */ 15917c478bd9Sstevel@tonic-gate mi = kmem_zalloc(sizeof (*mi), KM_SLEEP); 15927c478bd9Sstevel@tonic-gate mutex_init(&mi->mi_lock, NULL, MUTEX_DEFAULT, NULL); 15937c478bd9Sstevel@tonic-gate nfs_rw_init(&mi->mi_recovlock, NULL, RW_DEFAULT, NULL); 15947c478bd9Sstevel@tonic-gate nfs_rw_init(&mi->mi_rename_lock, NULL, RW_DEFAULT, NULL); 15957c478bd9Sstevel@tonic-gate nfs_rw_init(&mi->mi_fh_lock, NULL, RW_DEFAULT, NULL); 15967c478bd9Sstevel@tonic-gate 15977c478bd9Sstevel@tonic-gate if (!(flags & NFSMNT_SOFT)) 15987c478bd9Sstevel@tonic-gate mi->mi_flags |= MI4_HARD; 15997c478bd9Sstevel@tonic-gate if ((flags & NFSMNT_NOPRINT)) 16007c478bd9Sstevel@tonic-gate mi->mi_flags |= MI4_NOPRINT; 16017c478bd9Sstevel@tonic-gate if (flags & NFSMNT_INT) 16027c478bd9Sstevel@tonic-gate mi->mi_flags |= MI4_INT; 16037c478bd9Sstevel@tonic-gate if (flags & NFSMNT_PUBLIC) 16047c478bd9Sstevel@tonic-gate mi->mi_flags |= MI4_PUBLIC; 16057c478bd9Sstevel@tonic-gate mi->mi_retrans = NFS_RETRIES; 16067c478bd9Sstevel@tonic-gate if (svp->sv_knconf->knc_semantics == NC_TPI_COTS_ORD || 16077c478bd9Sstevel@tonic-gate svp->sv_knconf->knc_semantics == NC_TPI_COTS) 16087c478bd9Sstevel@tonic-gate mi->mi_timeo = nfs4_cots_timeo; 16097c478bd9Sstevel@tonic-gate else 16107c478bd9Sstevel@tonic-gate mi->mi_timeo = NFS_TIMEO; 16117c478bd9Sstevel@tonic-gate mi->mi_prog = NFS_PROGRAM; 16127c478bd9Sstevel@tonic-gate mi->mi_vers = NFS_V4; 16137c478bd9Sstevel@tonic-gate mi->mi_rfsnames = rfsnames_v4; 16147c478bd9Sstevel@tonic-gate mi->mi_reqs = nfsstatsp->nfs_stats_v4.rfsreqcnt_ptr; 16157c478bd9Sstevel@tonic-gate cv_init(&mi->mi_failover_cv, NULL, CV_DEFAULT, NULL); 16167c478bd9Sstevel@tonic-gate mi->mi_servers = svp; 16177c478bd9Sstevel@tonic-gate mi->mi_curr_serv = svp; 16187c478bd9Sstevel@tonic-gate mi->mi_acregmin = SEC2HR(ACREGMIN); 16197c478bd9Sstevel@tonic-gate mi->mi_acregmax = 
SEC2HR(ACREGMAX); 16207c478bd9Sstevel@tonic-gate mi->mi_acdirmin = SEC2HR(ACDIRMIN); 16217c478bd9Sstevel@tonic-gate mi->mi_acdirmax = SEC2HR(ACDIRMAX); 16227c478bd9Sstevel@tonic-gate mi->mi_fh_expire_type = FH4_PERSISTENT; 16237c478bd9Sstevel@tonic-gate mi->mi_clientid_next = NULL; 16247c478bd9Sstevel@tonic-gate mi->mi_clientid_prev = NULL; 16257c478bd9Sstevel@tonic-gate mi->mi_grace_wait = 0; 16267c478bd9Sstevel@tonic-gate mi->mi_error = 0; 16277c478bd9Sstevel@tonic-gate mi->mi_srvsettime = 0; 16287c478bd9Sstevel@tonic-gate 16297c478bd9Sstevel@tonic-gate mi->mi_tsize = nfs4_tsize(svp->sv_knconf); 16307c478bd9Sstevel@tonic-gate mi->mi_stsize = mi->mi_tsize; 16317c478bd9Sstevel@tonic-gate 16327c478bd9Sstevel@tonic-gate if (flags & NFSMNT_DIRECTIO) 16337c478bd9Sstevel@tonic-gate mi->mi_flags |= MI4_DIRECTIO; 16347c478bd9Sstevel@tonic-gate 16357c478bd9Sstevel@tonic-gate mi->mi_flags |= MI4_MOUNTING; 16367c478bd9Sstevel@tonic-gate 16377c478bd9Sstevel@tonic-gate /* 16387c478bd9Sstevel@tonic-gate * Make a vfs struct for nfs. We do this here instead of below 16397c478bd9Sstevel@tonic-gate * because rtvp needs a vfs before we can do a getattr on it. 
16407c478bd9Sstevel@tonic-gate * 16417c478bd9Sstevel@tonic-gate * Assign a unique device id to the mount 16427c478bd9Sstevel@tonic-gate */ 16437c478bd9Sstevel@tonic-gate mutex_enter(&nfs_minor_lock); 16447c478bd9Sstevel@tonic-gate do { 16457c478bd9Sstevel@tonic-gate nfs_minor = (nfs_minor + 1) & MAXMIN32; 16467c478bd9Sstevel@tonic-gate nfs_dev = makedevice(nfs_major, nfs_minor); 16477c478bd9Sstevel@tonic-gate } while (vfs_devismounted(nfs_dev)); 16487c478bd9Sstevel@tonic-gate mutex_exit(&nfs_minor_lock); 16497c478bd9Sstevel@tonic-gate 16507c478bd9Sstevel@tonic-gate vfsp->vfs_dev = nfs_dev; 16517c478bd9Sstevel@tonic-gate vfs_make_fsid(&vfsp->vfs_fsid, nfs_dev, nfs4fstyp); 16527c478bd9Sstevel@tonic-gate vfsp->vfs_data = (caddr_t)mi; 16537c478bd9Sstevel@tonic-gate vfsp->vfs_fstype = nfsfstyp; 16547c478bd9Sstevel@tonic-gate vfsp->vfs_bsize = nfs4_bsize; 16557c478bd9Sstevel@tonic-gate 16567c478bd9Sstevel@tonic-gate /* 16577c478bd9Sstevel@tonic-gate * Initialize fields used to support async putpage operations. 
16587c478bd9Sstevel@tonic-gate */ 16597c478bd9Sstevel@tonic-gate for (i = 0; i < NFS4_ASYNC_TYPES; i++) 16607c478bd9Sstevel@tonic-gate mi->mi_async_clusters[i] = nfs4_async_clusters; 16617c478bd9Sstevel@tonic-gate mi->mi_async_init_clusters = nfs4_async_clusters; 16627c478bd9Sstevel@tonic-gate mi->mi_async_curr = &mi->mi_async_reqs[0]; 16637c478bd9Sstevel@tonic-gate mi->mi_max_threads = nfs4_max_threads; 16647c478bd9Sstevel@tonic-gate mutex_init(&mi->mi_async_lock, NULL, MUTEX_DEFAULT, NULL); 16657c478bd9Sstevel@tonic-gate cv_init(&mi->mi_async_reqs_cv, NULL, CV_DEFAULT, NULL); 16667c478bd9Sstevel@tonic-gate cv_init(&mi->mi_async_work_cv, NULL, CV_DEFAULT, NULL); 16677c478bd9Sstevel@tonic-gate cv_init(&mi->mi_async_cv, NULL, CV_DEFAULT, NULL); 16687c478bd9Sstevel@tonic-gate cv_init(&mi->mi_inact_req_cv, NULL, CV_DEFAULT, NULL); 16697c478bd9Sstevel@tonic-gate 16707c478bd9Sstevel@tonic-gate mi->mi_vfsp = vfsp; 16717c478bd9Sstevel@tonic-gate zone_hold(mi->mi_zone = zone); 16727c478bd9Sstevel@tonic-gate nfs4_mi_zonelist_add(mi); 16737c478bd9Sstevel@tonic-gate 16747c478bd9Sstevel@tonic-gate /* 16757c478bd9Sstevel@tonic-gate * Initialize the <open owner/cred> hash table. 16767c478bd9Sstevel@tonic-gate */ 16777c478bd9Sstevel@tonic-gate for (i = 0; i < NFS4_NUM_OO_BUCKETS; i++) { 16787c478bd9Sstevel@tonic-gate bucketp = &(mi->mi_oo_list[i]); 16797c478bd9Sstevel@tonic-gate mutex_init(&bucketp->b_lock, NULL, MUTEX_DEFAULT, NULL); 16807c478bd9Sstevel@tonic-gate list_create(&bucketp->b_oo_hash_list, 16817c478bd9Sstevel@tonic-gate sizeof (nfs4_open_owner_t), 16827c478bd9Sstevel@tonic-gate offsetof(nfs4_open_owner_t, oo_hash_node)); 16837c478bd9Sstevel@tonic-gate } 16847c478bd9Sstevel@tonic-gate 16857c478bd9Sstevel@tonic-gate /* 16867c478bd9Sstevel@tonic-gate * Initialize the freed open owner list. 
16877c478bd9Sstevel@tonic-gate */ 16887c478bd9Sstevel@tonic-gate mi->mi_foo_num = 0; 16897c478bd9Sstevel@tonic-gate mi->mi_foo_max = NFS4_NUM_FREED_OPEN_OWNERS; 16907c478bd9Sstevel@tonic-gate list_create(&mi->mi_foo_list, sizeof (nfs4_open_owner_t), 16917c478bd9Sstevel@tonic-gate offsetof(nfs4_open_owner_t, oo_foo_node)); 16927c478bd9Sstevel@tonic-gate 16937c478bd9Sstevel@tonic-gate list_create(&mi->mi_lost_state, sizeof (nfs4_lost_rqst_t), 16947c478bd9Sstevel@tonic-gate offsetof(nfs4_lost_rqst_t, lr_node)); 16957c478bd9Sstevel@tonic-gate 16967c478bd9Sstevel@tonic-gate list_create(&mi->mi_bseqid_list, sizeof (nfs4_bseqid_entry_t), 16977c478bd9Sstevel@tonic-gate offsetof(nfs4_bseqid_entry_t, bs_node)); 16987c478bd9Sstevel@tonic-gate 16997c478bd9Sstevel@tonic-gate /* 17007c478bd9Sstevel@tonic-gate * Initialize the msg buffer. 17017c478bd9Sstevel@tonic-gate */ 17027c478bd9Sstevel@tonic-gate list_create(&mi->mi_msg_list, sizeof (nfs4_debug_msg_t), 17037c478bd9Sstevel@tonic-gate offsetof(nfs4_debug_msg_t, msg_node)); 17047c478bd9Sstevel@tonic-gate mi->mi_msg_count = 0; 17057c478bd9Sstevel@tonic-gate mutex_init(&mi->mi_msg_list_lock, NULL, MUTEX_DEFAULT, NULL); 17067c478bd9Sstevel@tonic-gate 17077c478bd9Sstevel@tonic-gate /* 17087c478bd9Sstevel@tonic-gate * Initialize kstats 17097c478bd9Sstevel@tonic-gate */ 17107c478bd9Sstevel@tonic-gate nfs4_mnt_kstat_init(vfsp); 17117c478bd9Sstevel@tonic-gate 17127c478bd9Sstevel@tonic-gate /* 17137c478bd9Sstevel@tonic-gate * Initialize the shared filehandle pool, and get the fname for 17147c478bd9Sstevel@tonic-gate * the filesystem root. 17157c478bd9Sstevel@tonic-gate */ 17167c478bd9Sstevel@tonic-gate sfh4_createtab(&mi->mi_filehandles); 17177c478bd9Sstevel@tonic-gate mi->mi_fname = fn_get(NULL, "."); 17187c478bd9Sstevel@tonic-gate 17197c478bd9Sstevel@tonic-gate /* 17207c478bd9Sstevel@tonic-gate * Save server path we're attempting to mount. 
17217c478bd9Sstevel@tonic-gate */ 17227c478bd9Sstevel@tonic-gate (void) nfs_rw_enter_sig(&svp->sv_lock, RW_WRITER, 0); 17237c478bd9Sstevel@tonic-gate orig_sv_pathlen = svp_head->sv_pathlen; 17247c478bd9Sstevel@tonic-gate orig_sv_path = kmem_alloc(svp_head->sv_pathlen, KM_SLEEP); 17257c478bd9Sstevel@tonic-gate bcopy(svp_head->sv_path, orig_sv_path, svp_head->sv_pathlen); 17267c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 17277c478bd9Sstevel@tonic-gate 17287c478bd9Sstevel@tonic-gate /* 17297c478bd9Sstevel@tonic-gate * Make the GETFH call to get root fh for each replica. 17307c478bd9Sstevel@tonic-gate */ 17317c478bd9Sstevel@tonic-gate if (svp_head->sv_next) 17327c478bd9Sstevel@tonic-gate droptext = ", dropping replica"; 17337c478bd9Sstevel@tonic-gate 17347c478bd9Sstevel@tonic-gate /* 17357c478bd9Sstevel@tonic-gate * If the uid is set then set the creds for secure mounts 17367c478bd9Sstevel@tonic-gate * by proxy processes such as automountd. 17377c478bd9Sstevel@tonic-gate */ 17387c478bd9Sstevel@tonic-gate (void) nfs_rw_enter_sig(&svp->sv_lock, RW_READER, 0); 17397c478bd9Sstevel@tonic-gate if (svp->sv_secdata->uid != 0) { 17407c478bd9Sstevel@tonic-gate lcr = crdup(cr); 17417c478bd9Sstevel@tonic-gate (void) crsetugid(lcr, svp->sv_secdata->uid, crgetgid(cr)); 17427c478bd9Sstevel@tonic-gate tcr = lcr; 17437c478bd9Sstevel@tonic-gate } 17447c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 17457c478bd9Sstevel@tonic-gate for (svp = svp_head; svp; svp = svp->sv_next) { 17467c478bd9Sstevel@tonic-gate if (nfs4_chkdup_servinfo4(svp_head, svp)) { 17477c478bd9Sstevel@tonic-gate nfs_cmn_err(error, CE_WARN, 17487c478bd9Sstevel@tonic-gate VERS_MSG "Host %s is a duplicate%s", 17497c478bd9Sstevel@tonic-gate svp->sv_hostname, droptext); 17507c478bd9Sstevel@tonic-gate (void) nfs_rw_enter_sig(&svp->sv_lock, RW_WRITER, 0); 17517c478bd9Sstevel@tonic-gate svp->sv_flags |= SV4_NOTINUSE; 17527c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 17537c478bd9Sstevel@tonic-gate 
continue; 17547c478bd9Sstevel@tonic-gate } 17557c478bd9Sstevel@tonic-gate mi->mi_curr_serv = svp; 17567c478bd9Sstevel@tonic-gate 17577c478bd9Sstevel@tonic-gate /* 17587c478bd9Sstevel@tonic-gate * Just in case server path being mounted contains 17597c478bd9Sstevel@tonic-gate * symlinks and fails w/STALE, save the initial sv_path 17607c478bd9Sstevel@tonic-gate * so we can redrive the initial mount compound with the 17617c478bd9Sstevel@tonic-gate * initial sv_path -- not a symlink-expanded version. 17627c478bd9Sstevel@tonic-gate * 17637c478bd9Sstevel@tonic-gate * This could only happen if a symlink was expanded 17647c478bd9Sstevel@tonic-gate * and the expanded mount compound failed stale. Because 17657c478bd9Sstevel@tonic-gate * it could be the case that the symlink was removed at 17667c478bd9Sstevel@tonic-gate * the server (and replaced with another symlink/dir, 17677c478bd9Sstevel@tonic-gate * we need to use the initial sv_path when attempting 17687c478bd9Sstevel@tonic-gate * to re-lookup everything and recover. 17697c478bd9Sstevel@tonic-gate * 17707c478bd9Sstevel@tonic-gate * Other mount errors should evenutally be handled here also 17717c478bd9Sstevel@tonic-gate * (NFS4ERR_DELAY, NFS4ERR_RESOURCE). For now, all mount 17727c478bd9Sstevel@tonic-gate * failures will result in mount being redriven a few times. 17737c478bd9Sstevel@tonic-gate */ 17747c478bd9Sstevel@tonic-gate num_retry = nfs4_max_mount_retry; 17757c478bd9Sstevel@tonic-gate do { 17767c478bd9Sstevel@tonic-gate nfs4getfh_otw(mi, svp, &tmp_vtype, 17777c478bd9Sstevel@tonic-gate ((flags & NFSMNT_PUBLIC) ? 
NFS4_GETFH_PUBLIC : 0) | 17787c478bd9Sstevel@tonic-gate NFS4_GETFH_NEEDSOP, tcr, &e); 17797c478bd9Sstevel@tonic-gate 17807c478bd9Sstevel@tonic-gate if (e.error == 0 && e.stat == NFS4_OK) 17817c478bd9Sstevel@tonic-gate break; 17827c478bd9Sstevel@tonic-gate 17837c478bd9Sstevel@tonic-gate /* 17847c478bd9Sstevel@tonic-gate * replace current sv_path with orig sv_path -- just in 17857c478bd9Sstevel@tonic-gate * case it changed due to embedded symlinks. 17867c478bd9Sstevel@tonic-gate */ 17877c478bd9Sstevel@tonic-gate (void) nfs_rw_enter_sig(&svp->sv_lock, RW_READER, 0); 17887c478bd9Sstevel@tonic-gate if (orig_sv_pathlen != svp->sv_pathlen) { 17897c478bd9Sstevel@tonic-gate kmem_free(svp->sv_path, svp->sv_pathlen); 17907c478bd9Sstevel@tonic-gate svp->sv_path = kmem_alloc(orig_sv_pathlen, 17917c478bd9Sstevel@tonic-gate KM_SLEEP); 17927c478bd9Sstevel@tonic-gate svp->sv_pathlen = orig_sv_pathlen; 17937c478bd9Sstevel@tonic-gate } 17947c478bd9Sstevel@tonic-gate bcopy(orig_sv_path, svp->sv_path, orig_sv_pathlen); 17957c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 17967c478bd9Sstevel@tonic-gate 17977c478bd9Sstevel@tonic-gate } while (num_retry-- > 0); 17987c478bd9Sstevel@tonic-gate 17997c478bd9Sstevel@tonic-gate error = e.error ? 
e.error : geterrno4(e.stat); 18007c478bd9Sstevel@tonic-gate if (error) { 18017c478bd9Sstevel@tonic-gate nfs_cmn_err(error, CE_WARN, 18027c478bd9Sstevel@tonic-gate VERS_MSG "initial call to %s failed%s: %m", 18037c478bd9Sstevel@tonic-gate svp->sv_hostname, droptext); 18047c478bd9Sstevel@tonic-gate (void) nfs_rw_enter_sig(&svp->sv_lock, RW_WRITER, 0); 18057c478bd9Sstevel@tonic-gate svp->sv_flags |= SV4_NOTINUSE; 18067c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 18077c478bd9Sstevel@tonic-gate mi->mi_flags &= ~MI4_RECOV_FAIL; 18087c478bd9Sstevel@tonic-gate mi->mi_error = 0; 18097c478bd9Sstevel@tonic-gate continue; 18107c478bd9Sstevel@tonic-gate } 18117c478bd9Sstevel@tonic-gate 18127c478bd9Sstevel@tonic-gate if (tmp_vtype == VBAD) { 18137c478bd9Sstevel@tonic-gate zcmn_err(mi->mi_zone->zone_id, CE_WARN, 18147c478bd9Sstevel@tonic-gate VERS_MSG "%s returned a bad file type for " 18157c478bd9Sstevel@tonic-gate "root%s", svp->sv_hostname, droptext); 18167c478bd9Sstevel@tonic-gate (void) nfs_rw_enter_sig(&svp->sv_lock, RW_WRITER, 0); 18177c478bd9Sstevel@tonic-gate svp->sv_flags |= SV4_NOTINUSE; 18187c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 18197c478bd9Sstevel@tonic-gate continue; 18207c478bd9Sstevel@tonic-gate } 18217c478bd9Sstevel@tonic-gate 18227c478bd9Sstevel@tonic-gate if (vtype == VNON) { 18237c478bd9Sstevel@tonic-gate vtype = tmp_vtype; 18247c478bd9Sstevel@tonic-gate } else if (vtype != tmp_vtype) { 18257c478bd9Sstevel@tonic-gate zcmn_err(mi->mi_zone->zone_id, CE_WARN, 18267c478bd9Sstevel@tonic-gate VERS_MSG "%s returned a different file type " 18277c478bd9Sstevel@tonic-gate "for root%s", svp->sv_hostname, droptext); 18287c478bd9Sstevel@tonic-gate (void) nfs_rw_enter_sig(&svp->sv_lock, RW_WRITER, 0); 18297c478bd9Sstevel@tonic-gate svp->sv_flags |= SV4_NOTINUSE; 18307c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 18317c478bd9Sstevel@tonic-gate continue; 18327c478bd9Sstevel@tonic-gate } 18337c478bd9Sstevel@tonic-gate if (firstsvp == NULL) 
18347c478bd9Sstevel@tonic-gate firstsvp = svp; 18357c478bd9Sstevel@tonic-gate } 18367c478bd9Sstevel@tonic-gate 18377c478bd9Sstevel@tonic-gate kmem_free(orig_sv_path, orig_sv_pathlen); 18387c478bd9Sstevel@tonic-gate 18397c478bd9Sstevel@tonic-gate if (firstsvp == NULL) { 18407c478bd9Sstevel@tonic-gate if (error == 0) 18417c478bd9Sstevel@tonic-gate error = ENOENT; 18427c478bd9Sstevel@tonic-gate goto bad; 18437c478bd9Sstevel@tonic-gate } 18447c478bd9Sstevel@tonic-gate 18457c478bd9Sstevel@tonic-gate mi->mi_curr_serv = svp = firstsvp; 18467c478bd9Sstevel@tonic-gate (void) nfs_rw_enter_sig(&svp->sv_lock, RW_READER, 0); 18477c478bd9Sstevel@tonic-gate ASSERT((mi->mi_curr_serv->sv_flags & SV4_NOTINUSE) == 0); 18487c478bd9Sstevel@tonic-gate fh.nfs_fh4_len = svp->sv_fhandle.fh_len; 18497c478bd9Sstevel@tonic-gate fh.nfs_fh4_val = svp->sv_fhandle.fh_buf; 18507c478bd9Sstevel@tonic-gate mi->mi_rootfh = sfh4_get(&fh, mi); 18517c478bd9Sstevel@tonic-gate fh.nfs_fh4_len = svp->sv_pfhandle.fh_len; 18527c478bd9Sstevel@tonic-gate fh.nfs_fh4_val = svp->sv_pfhandle.fh_buf; 18537c478bd9Sstevel@tonic-gate mi->mi_srvparentfh = sfh4_get(&fh, mi); 18547c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 18557c478bd9Sstevel@tonic-gate 18567c478bd9Sstevel@tonic-gate /* 18577c478bd9Sstevel@tonic-gate * Make the root vnode without attributes. 
18587c478bd9Sstevel@tonic-gate */ 18597c478bd9Sstevel@tonic-gate mfname = mi->mi_fname; 18607c478bd9Sstevel@tonic-gate fn_hold(mfname); 18617c478bd9Sstevel@tonic-gate rtvp = makenfs4node_by_fh(mi->mi_rootfh, NULL, 18627c478bd9Sstevel@tonic-gate &mfname, NULL, mi, cr, gethrtime()); 18637c478bd9Sstevel@tonic-gate rtvp->v_type = vtype; 18647c478bd9Sstevel@tonic-gate 18657c478bd9Sstevel@tonic-gate mi->mi_curread = mi->mi_tsize; 18667c478bd9Sstevel@tonic-gate mi->mi_curwrite = mi->mi_stsize; 18677c478bd9Sstevel@tonic-gate 18687c478bd9Sstevel@tonic-gate /* 18697c478bd9Sstevel@tonic-gate * Start the manager thread responsible for handling async worker 18707c478bd9Sstevel@tonic-gate * threads. 18717c478bd9Sstevel@tonic-gate */ 18727c478bd9Sstevel@tonic-gate VFS_HOLD(vfsp); /* add reference for thread */ 18737c478bd9Sstevel@tonic-gate mi->mi_manager_thread = zthread_create(NULL, 0, nfs4_async_manager, 18747c478bd9Sstevel@tonic-gate vfsp, 0, minclsyspri); 18757c478bd9Sstevel@tonic-gate ASSERT(mi->mi_manager_thread != NULL); 18767c478bd9Sstevel@tonic-gate /* 18777c478bd9Sstevel@tonic-gate * Create the thread that handles over-the-wire calls for 18787c478bd9Sstevel@tonic-gate * VOP_INACTIVE. 18797c478bd9Sstevel@tonic-gate * This needs to happen after the manager thread is created. 
18807c478bd9Sstevel@tonic-gate */ 18817c478bd9Sstevel@tonic-gate mi->mi_inactive_thread = zthread_create(NULL, 0, nfs4_inactive_thread, 18827c478bd9Sstevel@tonic-gate mi, 0, minclsyspri); 18837c478bd9Sstevel@tonic-gate ASSERT(mi->mi_inactive_thread != NULL); 18847c478bd9Sstevel@tonic-gate 18857c478bd9Sstevel@tonic-gate /* If we didn't get a type, get one now */ 18867c478bd9Sstevel@tonic-gate if (rtvp->v_type == VNON) { 18877c478bd9Sstevel@tonic-gate va.va_mask = AT_TYPE; 18887c478bd9Sstevel@tonic-gate error = nfs4getattr(rtvp, &va, tcr); 18897c478bd9Sstevel@tonic-gate if (error) 18907c478bd9Sstevel@tonic-gate goto bad; 18917c478bd9Sstevel@tonic-gate rtvp->v_type = va.va_type; 18927c478bd9Sstevel@tonic-gate } 18937c478bd9Sstevel@tonic-gate 18947c478bd9Sstevel@tonic-gate mi->mi_type = rtvp->v_type; 18957c478bd9Sstevel@tonic-gate 18967c478bd9Sstevel@tonic-gate mutex_enter(&mi->mi_lock); 18977c478bd9Sstevel@tonic-gate mi->mi_flags &= ~MI4_MOUNTING; 18987c478bd9Sstevel@tonic-gate mutex_exit(&mi->mi_lock); 18997c478bd9Sstevel@tonic-gate 19007c478bd9Sstevel@tonic-gate *rtvpp = rtvp; 19017c478bd9Sstevel@tonic-gate if (lcr != NULL) 19027c478bd9Sstevel@tonic-gate crfree(lcr); 19037c478bd9Sstevel@tonic-gate 19047c478bd9Sstevel@tonic-gate return (0); 19057c478bd9Sstevel@tonic-gate bad: 19067c478bd9Sstevel@tonic-gate /* 19077c478bd9Sstevel@tonic-gate * An error occurred somewhere, need to clean up... 19087c478bd9Sstevel@tonic-gate * 19097c478bd9Sstevel@tonic-gate * XXX Should not svp be cleaned too? 19107c478bd9Sstevel@tonic-gate */ 19117c478bd9Sstevel@tonic-gate if (lcr != NULL) 19127c478bd9Sstevel@tonic-gate crfree(lcr); 19137c478bd9Sstevel@tonic-gate if (rtvp != NULL) { 19147c478bd9Sstevel@tonic-gate /* 19157c478bd9Sstevel@tonic-gate * We need to release our reference to the root vnode and 19167c478bd9Sstevel@tonic-gate * destroy the mntinfo4 struct that we just created. 
19177c478bd9Sstevel@tonic-gate */ 19187c478bd9Sstevel@tonic-gate rp = VTOR4(rtvp); 19197c478bd9Sstevel@tonic-gate if (rp->r_flags & R4HASHED) 19207c478bd9Sstevel@tonic-gate rp4_rmhash(rp); 19217c478bd9Sstevel@tonic-gate VN_RELE(rtvp); 19227c478bd9Sstevel@tonic-gate } 19237c478bd9Sstevel@tonic-gate nfs4_async_stop(vfsp); 19247c478bd9Sstevel@tonic-gate nfs4_async_manager_stop(vfsp); 19257c478bd9Sstevel@tonic-gate if (mi->mi_io_kstats) { 19267c478bd9Sstevel@tonic-gate kstat_delete(mi->mi_io_kstats); 19277c478bd9Sstevel@tonic-gate mi->mi_io_kstats = NULL; 19287c478bd9Sstevel@tonic-gate } 19297c478bd9Sstevel@tonic-gate if (mi->mi_ro_kstats) { 19307c478bd9Sstevel@tonic-gate kstat_delete(mi->mi_ro_kstats); 19317c478bd9Sstevel@tonic-gate mi->mi_ro_kstats = NULL; 19327c478bd9Sstevel@tonic-gate } 19337c478bd9Sstevel@tonic-gate if (mi->mi_recov_ksp) { 19347c478bd9Sstevel@tonic-gate kstat_delete(mi->mi_recov_ksp); 19357c478bd9Sstevel@tonic-gate mi->mi_recov_ksp = NULL; 19367c478bd9Sstevel@tonic-gate } 19377c478bd9Sstevel@tonic-gate nfs_free_mi4(mi); 19387c478bd9Sstevel@tonic-gate *rtvpp = NULL; 19397c478bd9Sstevel@tonic-gate return (error); 19407c478bd9Sstevel@tonic-gate } 19417c478bd9Sstevel@tonic-gate 19427c478bd9Sstevel@tonic-gate /* 19437c478bd9Sstevel@tonic-gate * vfs operations 19447c478bd9Sstevel@tonic-gate */ 19457c478bd9Sstevel@tonic-gate static int 19467c478bd9Sstevel@tonic-gate nfs4_unmount(vfs_t *vfsp, int flag, cred_t *cr) 19477c478bd9Sstevel@tonic-gate { 19487c478bd9Sstevel@tonic-gate mntinfo4_t *mi; 19497c478bd9Sstevel@tonic-gate ushort_t omax; 19507c478bd9Sstevel@tonic-gate 19517c478bd9Sstevel@tonic-gate if (secpolicy_fs_unmount(cr, vfsp) != 0) 19527c478bd9Sstevel@tonic-gate return (EPERM); 19537c478bd9Sstevel@tonic-gate 19547c478bd9Sstevel@tonic-gate mi = VFTOMI4(vfsp); 19557c478bd9Sstevel@tonic-gate 19567c478bd9Sstevel@tonic-gate if (flag & MS_FORCE) { 19577c478bd9Sstevel@tonic-gate vfsp->vfs_flag |= VFS_UNMOUNTED; 1958*108322fbScarlsonj if (nfs_zone() != 
mi->mi_zone) { 19597c478bd9Sstevel@tonic-gate /* 19607c478bd9Sstevel@tonic-gate * If the request is coming from the wrong zone, 19617c478bd9Sstevel@tonic-gate * we don't want to create any new threads, and 19627c478bd9Sstevel@tonic-gate * performance is not a concern. Do everything 19637c478bd9Sstevel@tonic-gate * inline. 19647c478bd9Sstevel@tonic-gate */ 19657c478bd9Sstevel@tonic-gate NFS4_DEBUG(nfs4_client_zone_debug, (CE_NOTE, 19667c478bd9Sstevel@tonic-gate "nfs4_unmount x-zone forced unmount of vfs %p\n", 19677c478bd9Sstevel@tonic-gate (void *)vfsp)); 19687c478bd9Sstevel@tonic-gate nfs4_free_mount(vfsp, cr); 19697c478bd9Sstevel@tonic-gate } else { 19707c478bd9Sstevel@tonic-gate /* 19717c478bd9Sstevel@tonic-gate * Free data structures asynchronously, to avoid 19727c478bd9Sstevel@tonic-gate * blocking the current thread (for performance 19737c478bd9Sstevel@tonic-gate * reasons only). 19747c478bd9Sstevel@tonic-gate */ 19757c478bd9Sstevel@tonic-gate async_free_mount(vfsp, cr); 19767c478bd9Sstevel@tonic-gate } 19777c478bd9Sstevel@tonic-gate return (0); 19787c478bd9Sstevel@tonic-gate } 19797c478bd9Sstevel@tonic-gate /* 19807c478bd9Sstevel@tonic-gate * Wait until all asynchronous putpage operations on 19817c478bd9Sstevel@tonic-gate * this file system are complete before flushing rnodes 19827c478bd9Sstevel@tonic-gate * from the cache. 19837c478bd9Sstevel@tonic-gate */ 19847c478bd9Sstevel@tonic-gate omax = mi->mi_max_threads; 19857c478bd9Sstevel@tonic-gate if (nfs4_async_stop_sig(vfsp)) { 19867c478bd9Sstevel@tonic-gate return (EINTR); 19877c478bd9Sstevel@tonic-gate } 19887c478bd9Sstevel@tonic-gate r4flush(vfsp, cr); 19897c478bd9Sstevel@tonic-gate /* 19907c478bd9Sstevel@tonic-gate * If there are any active vnodes on this file system, 19917c478bd9Sstevel@tonic-gate * then the file system is busy and can't be umounted. 
19927c478bd9Sstevel@tonic-gate */ 19937c478bd9Sstevel@tonic-gate if (check_rtable4(vfsp)) { 19947c478bd9Sstevel@tonic-gate mutex_enter(&mi->mi_async_lock); 19957c478bd9Sstevel@tonic-gate mi->mi_max_threads = omax; 19967c478bd9Sstevel@tonic-gate mutex_exit(&mi->mi_async_lock); 19977c478bd9Sstevel@tonic-gate return (EBUSY); 19987c478bd9Sstevel@tonic-gate } 19997c478bd9Sstevel@tonic-gate /* 20007c478bd9Sstevel@tonic-gate * The unmount can't fail from now on, and there are no active 20017c478bd9Sstevel@tonic-gate * files that could require over-the-wire calls to the server, 20027c478bd9Sstevel@tonic-gate * so stop the async manager and the inactive thread. 20037c478bd9Sstevel@tonic-gate */ 20047c478bd9Sstevel@tonic-gate nfs4_async_manager_stop(vfsp); 20057c478bd9Sstevel@tonic-gate /* 20067c478bd9Sstevel@tonic-gate * Destroy all rnodes belonging to this file system from the 20077c478bd9Sstevel@tonic-gate * rnode hash queues and purge any resources allocated to 20087c478bd9Sstevel@tonic-gate * them. 
20097c478bd9Sstevel@tonic-gate */ 20107c478bd9Sstevel@tonic-gate destroy_rtable4(vfsp, cr); 20117c478bd9Sstevel@tonic-gate vfsp->vfs_flag |= VFS_UNMOUNTED; 20127c478bd9Sstevel@tonic-gate nfs4_remove_mi_from_server(mi, NULL); 20137c478bd9Sstevel@tonic-gate if (mi->mi_io_kstats) { 20147c478bd9Sstevel@tonic-gate kstat_delete(mi->mi_io_kstats); 20157c478bd9Sstevel@tonic-gate mi->mi_io_kstats = NULL; 20167c478bd9Sstevel@tonic-gate } 20177c478bd9Sstevel@tonic-gate if (mi->mi_ro_kstats) { 20187c478bd9Sstevel@tonic-gate kstat_delete(mi->mi_ro_kstats); 20197c478bd9Sstevel@tonic-gate mi->mi_ro_kstats = NULL; 20207c478bd9Sstevel@tonic-gate } 20217c478bd9Sstevel@tonic-gate if (mi->mi_recov_ksp) { 20227c478bd9Sstevel@tonic-gate kstat_delete(mi->mi_recov_ksp); 20237c478bd9Sstevel@tonic-gate mi->mi_recov_ksp = NULL; 20247c478bd9Sstevel@tonic-gate } 20257c478bd9Sstevel@tonic-gate return (0); 20267c478bd9Sstevel@tonic-gate } 20277c478bd9Sstevel@tonic-gate 20287c478bd9Sstevel@tonic-gate /* 20297c478bd9Sstevel@tonic-gate * find root of nfs 20307c478bd9Sstevel@tonic-gate */ 20317c478bd9Sstevel@tonic-gate static int 20327c478bd9Sstevel@tonic-gate nfs4_root(vfs_t *vfsp, vnode_t **vpp) 20337c478bd9Sstevel@tonic-gate { 20347c478bd9Sstevel@tonic-gate mntinfo4_t *mi; 20357c478bd9Sstevel@tonic-gate vnode_t *vp; 20367c478bd9Sstevel@tonic-gate nfs4_fname_t *mfname; 20377c478bd9Sstevel@tonic-gate servinfo4_t *svp; 20387c478bd9Sstevel@tonic-gate 20397c478bd9Sstevel@tonic-gate mi = VFTOMI4(vfsp); 20407c478bd9Sstevel@tonic-gate 2041*108322fbScarlsonj if (nfs_zone() != mi->mi_zone) 20427c478bd9Sstevel@tonic-gate return (EPERM); 20437c478bd9Sstevel@tonic-gate 20447c478bd9Sstevel@tonic-gate svp = mi->mi_curr_serv; 20457c478bd9Sstevel@tonic-gate if (svp) { 20467c478bd9Sstevel@tonic-gate (void) nfs_rw_enter_sig(&svp->sv_lock, RW_READER, 0); 20477c478bd9Sstevel@tonic-gate if (svp->sv_flags & SV4_ROOT_STALE) { 20487c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 20497c478bd9Sstevel@tonic-gate 
20507c478bd9Sstevel@tonic-gate (void) nfs_rw_enter_sig(&svp->sv_lock, RW_WRITER, 0); 20517c478bd9Sstevel@tonic-gate if (svp->sv_flags & SV4_ROOT_STALE) { 20527c478bd9Sstevel@tonic-gate svp->sv_flags &= ~SV4_ROOT_STALE; 20537c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 20547c478bd9Sstevel@tonic-gate return (ENOENT); 20557c478bd9Sstevel@tonic-gate } 20567c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 20577c478bd9Sstevel@tonic-gate } else 20587c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 20597c478bd9Sstevel@tonic-gate } 20607c478bd9Sstevel@tonic-gate 20617c478bd9Sstevel@tonic-gate mfname = mi->mi_fname; 20627c478bd9Sstevel@tonic-gate fn_hold(mfname); 20637c478bd9Sstevel@tonic-gate vp = makenfs4node_by_fh(mi->mi_rootfh, NULL, &mfname, NULL, 20647c478bd9Sstevel@tonic-gate VFTOMI4(vfsp), CRED(), gethrtime()); 20657c478bd9Sstevel@tonic-gate 20667c478bd9Sstevel@tonic-gate if (VTOR4(vp)->r_flags & R4STALE) { 20677c478bd9Sstevel@tonic-gate VN_RELE(vp); 20687c478bd9Sstevel@tonic-gate return (ENOENT); 20697c478bd9Sstevel@tonic-gate } 20707c478bd9Sstevel@tonic-gate 20717c478bd9Sstevel@tonic-gate ASSERT(vp->v_type == VNON || vp->v_type == mi->mi_type); 20727c478bd9Sstevel@tonic-gate 20737c478bd9Sstevel@tonic-gate vp->v_type = mi->mi_type; 20747c478bd9Sstevel@tonic-gate 20757c478bd9Sstevel@tonic-gate *vpp = vp; 20767c478bd9Sstevel@tonic-gate 20777c478bd9Sstevel@tonic-gate return (0); 20787c478bd9Sstevel@tonic-gate } 20797c478bd9Sstevel@tonic-gate 20807c478bd9Sstevel@tonic-gate static int 20817c478bd9Sstevel@tonic-gate nfs4_statfs_otw(vnode_t *vp, struct statvfs64 *sbp, cred_t *cr) 20827c478bd9Sstevel@tonic-gate { 20837c478bd9Sstevel@tonic-gate int error; 20847c478bd9Sstevel@tonic-gate nfs4_ga_res_t gar; 20857c478bd9Sstevel@tonic-gate nfs4_ga_ext_res_t ger; 20867c478bd9Sstevel@tonic-gate 20877c478bd9Sstevel@tonic-gate gar.n4g_ext_res = &ger; 20887c478bd9Sstevel@tonic-gate 20897c478bd9Sstevel@tonic-gate if (error = nfs4_attr_otw(vp, TAG_FSINFO, &gar, 
20907c478bd9Sstevel@tonic-gate NFS4_STATFS_ATTR_MASK, cr)) 20917c478bd9Sstevel@tonic-gate return (error); 20927c478bd9Sstevel@tonic-gate 20937c478bd9Sstevel@tonic-gate *sbp = gar.n4g_ext_res->n4g_sb; 20947c478bd9Sstevel@tonic-gate 20957c478bd9Sstevel@tonic-gate return (0); 20967c478bd9Sstevel@tonic-gate } 20977c478bd9Sstevel@tonic-gate 20987c478bd9Sstevel@tonic-gate /* 20997c478bd9Sstevel@tonic-gate * Get file system statistics. 21007c478bd9Sstevel@tonic-gate */ 21017c478bd9Sstevel@tonic-gate static int 21027c478bd9Sstevel@tonic-gate nfs4_statvfs(vfs_t *vfsp, struct statvfs64 *sbp) 21037c478bd9Sstevel@tonic-gate { 21047c478bd9Sstevel@tonic-gate int error; 21057c478bd9Sstevel@tonic-gate vnode_t *vp; 21067c478bd9Sstevel@tonic-gate cred_t *cr; 21077c478bd9Sstevel@tonic-gate 21087c478bd9Sstevel@tonic-gate error = nfs4_root(vfsp, &vp); 21097c478bd9Sstevel@tonic-gate if (error) 21107c478bd9Sstevel@tonic-gate return (error); 21117c478bd9Sstevel@tonic-gate 21127c478bd9Sstevel@tonic-gate cr = CRED(); 21137c478bd9Sstevel@tonic-gate 21147c478bd9Sstevel@tonic-gate error = nfs4_statfs_otw(vp, sbp, cr); 21157c478bd9Sstevel@tonic-gate if (!error) { 21167c478bd9Sstevel@tonic-gate (void) strncpy(sbp->f_basetype, 21177c478bd9Sstevel@tonic-gate vfssw[vfsp->vfs_fstype].vsw_name, FSTYPSZ); 21187c478bd9Sstevel@tonic-gate sbp->f_flag = vf_to_stf(vfsp->vfs_flag); 21197c478bd9Sstevel@tonic-gate } else { 21207c478bd9Sstevel@tonic-gate nfs4_purge_stale_fh(error, vp, cr); 21217c478bd9Sstevel@tonic-gate } 21227c478bd9Sstevel@tonic-gate 21237c478bd9Sstevel@tonic-gate VN_RELE(vp); 21247c478bd9Sstevel@tonic-gate 21257c478bd9Sstevel@tonic-gate return (error); 21267c478bd9Sstevel@tonic-gate } 21277c478bd9Sstevel@tonic-gate 21287c478bd9Sstevel@tonic-gate static kmutex_t nfs4_syncbusy; 21297c478bd9Sstevel@tonic-gate 21307c478bd9Sstevel@tonic-gate /* 21317c478bd9Sstevel@tonic-gate * Flush dirty nfs files for file system vfsp. 21327c478bd9Sstevel@tonic-gate * If vfsp == NULL, all nfs files are flushed. 
21337c478bd9Sstevel@tonic-gate * 21347c478bd9Sstevel@tonic-gate * SYNC_CLOSE in flag is passed to us to 21357c478bd9Sstevel@tonic-gate * indicate that we are shutting down and or 21367c478bd9Sstevel@tonic-gate * rebooting. 21377c478bd9Sstevel@tonic-gate */ 21387c478bd9Sstevel@tonic-gate static int 21397c478bd9Sstevel@tonic-gate nfs4_sync(vfs_t *vfsp, short flag, cred_t *cr) 21407c478bd9Sstevel@tonic-gate { 21417c478bd9Sstevel@tonic-gate /* 21427c478bd9Sstevel@tonic-gate * Cross-zone calls are OK here, since this translates to a 21437c478bd9Sstevel@tonic-gate * VOP_PUTPAGE(B_ASYNC), which gets picked up by the right zone. 21447c478bd9Sstevel@tonic-gate */ 21457c478bd9Sstevel@tonic-gate if (!(flag & SYNC_ATTR) && mutex_tryenter(&nfs4_syncbusy) != 0) { 21467c478bd9Sstevel@tonic-gate r4flush(vfsp, cr); 21477c478bd9Sstevel@tonic-gate mutex_exit(&nfs4_syncbusy); 21487c478bd9Sstevel@tonic-gate } 21497c478bd9Sstevel@tonic-gate 21507c478bd9Sstevel@tonic-gate /* 21517c478bd9Sstevel@tonic-gate * if SYNC_CLOSE is set then we know that 21527c478bd9Sstevel@tonic-gate * the system is rebooting, mark the mntinfo 21537c478bd9Sstevel@tonic-gate * for later examination. 
21547c478bd9Sstevel@tonic-gate */ 21557c478bd9Sstevel@tonic-gate if (vfsp && (flag & SYNC_CLOSE)) { 21567c478bd9Sstevel@tonic-gate mntinfo4_t *mi; 21577c478bd9Sstevel@tonic-gate 21587c478bd9Sstevel@tonic-gate mi = VFTOMI4(vfsp); 21597c478bd9Sstevel@tonic-gate if (!(mi->mi_flags & MI4_SHUTDOWN)) { 21607c478bd9Sstevel@tonic-gate mutex_enter(&mi->mi_lock); 21617c478bd9Sstevel@tonic-gate mi->mi_flags |= MI4_SHUTDOWN; 21627c478bd9Sstevel@tonic-gate mutex_exit(&mi->mi_lock); 21637c478bd9Sstevel@tonic-gate } 21647c478bd9Sstevel@tonic-gate } 21657c478bd9Sstevel@tonic-gate return (0); 21667c478bd9Sstevel@tonic-gate } 21677c478bd9Sstevel@tonic-gate 21687c478bd9Sstevel@tonic-gate /* 21697c478bd9Sstevel@tonic-gate * vget is difficult, if not impossible, to support in v4 because we don't 21707c478bd9Sstevel@tonic-gate * know the parent directory or name, which makes it impossible to create a 21717c478bd9Sstevel@tonic-gate * useful shadow vnode. And we need the shadow vnode for things like 21727c478bd9Sstevel@tonic-gate * OPEN. 21737c478bd9Sstevel@tonic-gate */ 21747c478bd9Sstevel@tonic-gate 21757c478bd9Sstevel@tonic-gate /* ARGSUSED */ 21767c478bd9Sstevel@tonic-gate /* 21777c478bd9Sstevel@tonic-gate * XXX Check nfs4_vget_pseudo() for dependency. 21787c478bd9Sstevel@tonic-gate */ 21797c478bd9Sstevel@tonic-gate static int 21807c478bd9Sstevel@tonic-gate nfs4_vget(vfs_t *vfsp, vnode_t **vpp, fid_t *fidp) 21817c478bd9Sstevel@tonic-gate { 21827c478bd9Sstevel@tonic-gate return (EREMOTE); 21837c478bd9Sstevel@tonic-gate } 21847c478bd9Sstevel@tonic-gate 21857c478bd9Sstevel@tonic-gate /* 21867c478bd9Sstevel@tonic-gate * nfs4_mountroot get called in the case where we are diskless booting. All 21877c478bd9Sstevel@tonic-gate * we need from here is the ability to get the server info and from there we 21887c478bd9Sstevel@tonic-gate * can simply call nfs4_rootvp. 
21897c478bd9Sstevel@tonic-gate */ 21907c478bd9Sstevel@tonic-gate /* ARGSUSED */ 21917c478bd9Sstevel@tonic-gate static int 21927c478bd9Sstevel@tonic-gate nfs4_mountroot(vfs_t *vfsp, whymountroot_t why) 21937c478bd9Sstevel@tonic-gate { 21947c478bd9Sstevel@tonic-gate vnode_t *rtvp; 21957c478bd9Sstevel@tonic-gate char root_hostname[SYS_NMLN+1]; 21967c478bd9Sstevel@tonic-gate struct servinfo4 *svp; 21977c478bd9Sstevel@tonic-gate int error; 21987c478bd9Sstevel@tonic-gate int vfsflags; 21997c478bd9Sstevel@tonic-gate size_t size; 22007c478bd9Sstevel@tonic-gate char *root_path; 22017c478bd9Sstevel@tonic-gate struct pathname pn; 22027c478bd9Sstevel@tonic-gate char *name; 22037c478bd9Sstevel@tonic-gate cred_t *cr; 22047c478bd9Sstevel@tonic-gate mntinfo4_t *mi; 22057c478bd9Sstevel@tonic-gate struct nfs_args args; /* nfs mount arguments */ 22067c478bd9Sstevel@tonic-gate static char token[10]; 22077c478bd9Sstevel@tonic-gate nfs4_error_t n4e; 22087c478bd9Sstevel@tonic-gate 22097c478bd9Sstevel@tonic-gate bzero(&args, sizeof (args)); 22107c478bd9Sstevel@tonic-gate 22117c478bd9Sstevel@tonic-gate /* do this BEFORE getfile which causes xid stamps to be initialized */ 22127c478bd9Sstevel@tonic-gate clkset(-1L); /* hack for now - until we get time svc? */ 22137c478bd9Sstevel@tonic-gate 22147c478bd9Sstevel@tonic-gate if (why == ROOT_REMOUNT) { 22157c478bd9Sstevel@tonic-gate /* 22167c478bd9Sstevel@tonic-gate * Shouldn't happen. 22177c478bd9Sstevel@tonic-gate */ 22187c478bd9Sstevel@tonic-gate panic("nfs4_mountroot: why == ROOT_REMOUNT"); 22197c478bd9Sstevel@tonic-gate } 22207c478bd9Sstevel@tonic-gate 22217c478bd9Sstevel@tonic-gate if (why == ROOT_UNMOUNT) { 22227c478bd9Sstevel@tonic-gate /* 22237c478bd9Sstevel@tonic-gate * Nothing to do for NFS. 
22247c478bd9Sstevel@tonic-gate */ 22257c478bd9Sstevel@tonic-gate return (0); 22267c478bd9Sstevel@tonic-gate } 22277c478bd9Sstevel@tonic-gate 22287c478bd9Sstevel@tonic-gate /* 22297c478bd9Sstevel@tonic-gate * why == ROOT_INIT 22307c478bd9Sstevel@tonic-gate */ 22317c478bd9Sstevel@tonic-gate 22327c478bd9Sstevel@tonic-gate name = token; 22337c478bd9Sstevel@tonic-gate *name = 0; 22347c478bd9Sstevel@tonic-gate (void) getfsname("root", name, sizeof (token)); 22357c478bd9Sstevel@tonic-gate 22367c478bd9Sstevel@tonic-gate pn_alloc(&pn); 22377c478bd9Sstevel@tonic-gate root_path = pn.pn_path; 22387c478bd9Sstevel@tonic-gate 22397c478bd9Sstevel@tonic-gate svp = kmem_zalloc(sizeof (*svp), KM_SLEEP); 22407c478bd9Sstevel@tonic-gate nfs_rw_init(&svp->sv_lock, NULL, RW_DEFAULT, NULL); 22417c478bd9Sstevel@tonic-gate svp->sv_knconf = kmem_zalloc(sizeof (*svp->sv_knconf), KM_SLEEP); 22427c478bd9Sstevel@tonic-gate svp->sv_knconf->knc_protofmly = kmem_alloc(KNC_STRSIZE, KM_SLEEP); 22437c478bd9Sstevel@tonic-gate svp->sv_knconf->knc_proto = kmem_alloc(KNC_STRSIZE, KM_SLEEP); 22447c478bd9Sstevel@tonic-gate 22457c478bd9Sstevel@tonic-gate /* 22467c478bd9Sstevel@tonic-gate * Get server address 22477c478bd9Sstevel@tonic-gate * Get the root path 22487c478bd9Sstevel@tonic-gate * Get server's transport 22497c478bd9Sstevel@tonic-gate * Get server's hostname 22507c478bd9Sstevel@tonic-gate * Get options 22517c478bd9Sstevel@tonic-gate */ 22527c478bd9Sstevel@tonic-gate args.addr = &svp->sv_addr; 22537c478bd9Sstevel@tonic-gate (void) nfs_rw_enter_sig(&svp->sv_lock, RW_READER, 0); 22547c478bd9Sstevel@tonic-gate args.fh = (char *)&svp->sv_fhandle; 22557c478bd9Sstevel@tonic-gate args.knconf = svp->sv_knconf; 22567c478bd9Sstevel@tonic-gate args.hostname = root_hostname; 22577c478bd9Sstevel@tonic-gate vfsflags = 0; 22587c478bd9Sstevel@tonic-gate if (error = mount_root(*name ? 
name : "root", root_path, NFS_V4, 22597c478bd9Sstevel@tonic-gate &args, &vfsflags)) { 22607c478bd9Sstevel@tonic-gate if (error == EPROTONOSUPPORT) 22617c478bd9Sstevel@tonic-gate nfs_cmn_err(error, CE_WARN, "nfs4_mountroot: " 22627c478bd9Sstevel@tonic-gate "mount_root failed: server doesn't support NFS V4"); 22637c478bd9Sstevel@tonic-gate else 22647c478bd9Sstevel@tonic-gate nfs_cmn_err(error, CE_WARN, 22657c478bd9Sstevel@tonic-gate "nfs4_mountroot: mount_root failed: %m"); 22667c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 22677c478bd9Sstevel@tonic-gate sv4_free(svp); 22687c478bd9Sstevel@tonic-gate pn_free(&pn); 22697c478bd9Sstevel@tonic-gate return (error); 22707c478bd9Sstevel@tonic-gate } 22717c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 22727c478bd9Sstevel@tonic-gate svp->sv_hostnamelen = (int)(strlen(root_hostname) + 1); 22737c478bd9Sstevel@tonic-gate svp->sv_hostname = kmem_alloc(svp->sv_hostnamelen, KM_SLEEP); 22747c478bd9Sstevel@tonic-gate (void) strcpy(svp->sv_hostname, root_hostname); 22757c478bd9Sstevel@tonic-gate 22767c478bd9Sstevel@tonic-gate svp->sv_pathlen = (int)(strlen(root_path) + 1); 22777c478bd9Sstevel@tonic-gate svp->sv_path = kmem_alloc(svp->sv_pathlen, KM_SLEEP); 22787c478bd9Sstevel@tonic-gate (void) strcpy(svp->sv_path, root_path); 22797c478bd9Sstevel@tonic-gate 22807c478bd9Sstevel@tonic-gate /* 22817c478bd9Sstevel@tonic-gate * Force root partition to always be mounted with AUTH_UNIX for now 22827c478bd9Sstevel@tonic-gate */ 22837c478bd9Sstevel@tonic-gate svp->sv_secdata = kmem_alloc(sizeof (*svp->sv_secdata), KM_SLEEP); 22847c478bd9Sstevel@tonic-gate svp->sv_secdata->secmod = AUTH_UNIX; 22857c478bd9Sstevel@tonic-gate svp->sv_secdata->rpcflavor = AUTH_UNIX; 22867c478bd9Sstevel@tonic-gate svp->sv_secdata->data = NULL; 22877c478bd9Sstevel@tonic-gate 22887c478bd9Sstevel@tonic-gate cr = crgetcred(); 22897c478bd9Sstevel@tonic-gate rtvp = NULL; 22907c478bd9Sstevel@tonic-gate 22917c478bd9Sstevel@tonic-gate error = nfs4rootvp(&rtvp, 
vfsp, svp, args.flags, cr, global_zone); 22927c478bd9Sstevel@tonic-gate 22937c478bd9Sstevel@tonic-gate if (error) { 22947c478bd9Sstevel@tonic-gate crfree(cr); 22957c478bd9Sstevel@tonic-gate pn_free(&pn); 22967c478bd9Sstevel@tonic-gate goto errout; 22977c478bd9Sstevel@tonic-gate } 22987c478bd9Sstevel@tonic-gate 22997c478bd9Sstevel@tonic-gate mi = VTOMI4(rtvp); 23007c478bd9Sstevel@tonic-gate 23017c478bd9Sstevel@tonic-gate /* 23027c478bd9Sstevel@tonic-gate * Send client id to the server, if necessary 23037c478bd9Sstevel@tonic-gate */ 23047c478bd9Sstevel@tonic-gate nfs4_error_zinit(&n4e); 23057c478bd9Sstevel@tonic-gate nfs4setclientid(mi, cr, FALSE, &n4e); 23067c478bd9Sstevel@tonic-gate error = n4e.error; 23077c478bd9Sstevel@tonic-gate 23087c478bd9Sstevel@tonic-gate crfree(cr); 23097c478bd9Sstevel@tonic-gate 23107c478bd9Sstevel@tonic-gate if (error) { 23117c478bd9Sstevel@tonic-gate pn_free(&pn); 23127c478bd9Sstevel@tonic-gate goto errout; 23137c478bd9Sstevel@tonic-gate } 23147c478bd9Sstevel@tonic-gate 23157c478bd9Sstevel@tonic-gate error = nfs4_setopts(rtvp, DATAMODEL_NATIVE, &args); 23167c478bd9Sstevel@tonic-gate if (error) { 23177c478bd9Sstevel@tonic-gate nfs_cmn_err(error, CE_WARN, 23187c478bd9Sstevel@tonic-gate "nfs4_mountroot: invalid root mount options"); 23197c478bd9Sstevel@tonic-gate pn_free(&pn); 23207c478bd9Sstevel@tonic-gate goto errout; 23217c478bd9Sstevel@tonic-gate } 23227c478bd9Sstevel@tonic-gate 23237c478bd9Sstevel@tonic-gate (void) vfs_lock_wait(vfsp); 23247c478bd9Sstevel@tonic-gate vfs_add(NULL, vfsp, vfsflags); 23257c478bd9Sstevel@tonic-gate vfs_unlock(vfsp); 23267c478bd9Sstevel@tonic-gate 23277c478bd9Sstevel@tonic-gate size = strlen(svp->sv_hostname); 23287c478bd9Sstevel@tonic-gate (void) strcpy(rootfs.bo_name, svp->sv_hostname); 23297c478bd9Sstevel@tonic-gate rootfs.bo_name[size] = ':'; 23307c478bd9Sstevel@tonic-gate (void) strcpy(&rootfs.bo_name[size + 1], root_path); 23317c478bd9Sstevel@tonic-gate 23327c478bd9Sstevel@tonic-gate pn_free(&pn); 
23337c478bd9Sstevel@tonic-gate 23347c478bd9Sstevel@tonic-gate errout: 23357c478bd9Sstevel@tonic-gate if (error) { 23367c478bd9Sstevel@tonic-gate sv4_free(svp); 23377c478bd9Sstevel@tonic-gate nfs4_async_stop(vfsp); 23387c478bd9Sstevel@tonic-gate nfs4_async_manager_stop(vfsp); 23397c478bd9Sstevel@tonic-gate } 23407c478bd9Sstevel@tonic-gate 23417c478bd9Sstevel@tonic-gate if (rtvp != NULL) 23427c478bd9Sstevel@tonic-gate VN_RELE(rtvp); 23437c478bd9Sstevel@tonic-gate 23447c478bd9Sstevel@tonic-gate return (error); 23457c478bd9Sstevel@tonic-gate } 23467c478bd9Sstevel@tonic-gate 23477c478bd9Sstevel@tonic-gate /* 23487c478bd9Sstevel@tonic-gate * Initialization routine for VFS routines. Should only be called once 23497c478bd9Sstevel@tonic-gate */ 23507c478bd9Sstevel@tonic-gate int 23517c478bd9Sstevel@tonic-gate nfs4_vfsinit(void) 23527c478bd9Sstevel@tonic-gate { 23537c478bd9Sstevel@tonic-gate mutex_init(&nfs4_syncbusy, NULL, MUTEX_DEFAULT, NULL); 23547c478bd9Sstevel@tonic-gate nfs4setclientid_init(); 23557c478bd9Sstevel@tonic-gate return (0); 23567c478bd9Sstevel@tonic-gate } 23577c478bd9Sstevel@tonic-gate 23587c478bd9Sstevel@tonic-gate void 23597c478bd9Sstevel@tonic-gate nfs4_vfsfini(void) 23607c478bd9Sstevel@tonic-gate { 23617c478bd9Sstevel@tonic-gate nfs4setclientid_fini(); 23627c478bd9Sstevel@tonic-gate mutex_destroy(&nfs4_syncbusy); 23637c478bd9Sstevel@tonic-gate } 23647c478bd9Sstevel@tonic-gate 23657c478bd9Sstevel@tonic-gate void 23667c478bd9Sstevel@tonic-gate nfs4_freevfs(vfs_t *vfsp) 23677c478bd9Sstevel@tonic-gate { 23687c478bd9Sstevel@tonic-gate mntinfo4_t *mi; 23697c478bd9Sstevel@tonic-gate servinfo4_t *svp; 23707c478bd9Sstevel@tonic-gate 23717c478bd9Sstevel@tonic-gate /* free up the resources */ 23727c478bd9Sstevel@tonic-gate mi = VFTOMI4(vfsp); 23737c478bd9Sstevel@tonic-gate svp = mi->mi_servers; 23747c478bd9Sstevel@tonic-gate mi->mi_servers = mi->mi_curr_serv = NULL; 23757c478bd9Sstevel@tonic-gate sv4_free(svp); 23767c478bd9Sstevel@tonic-gate 
NFS4_DEBUG(nfs4_client_lease_debug, (CE_NOTE, "nfs4_freevfs: " 23777c478bd9Sstevel@tonic-gate "free mi %p", (void *)mi)); 23787c478bd9Sstevel@tonic-gate 23797c478bd9Sstevel@tonic-gate /* 23807c478bd9Sstevel@tonic-gate * By this time we should have already deleted the 23817c478bd9Sstevel@tonic-gate * mi kstats in the unmount code. If they are still around 23827c478bd9Sstevel@tonic-gate * somethings wrong 23837c478bd9Sstevel@tonic-gate */ 23847c478bd9Sstevel@tonic-gate ASSERT(mi->mi_io_kstats == NULL); 23857c478bd9Sstevel@tonic-gate 23867c478bd9Sstevel@tonic-gate nfs_free_mi4(mi); 23877c478bd9Sstevel@tonic-gate } 23887c478bd9Sstevel@tonic-gate 23897c478bd9Sstevel@tonic-gate /* 23907c478bd9Sstevel@tonic-gate * Client side SETCLIENTID and SETCLIENTID_CONFIRM 23917c478bd9Sstevel@tonic-gate */ 23927c478bd9Sstevel@tonic-gate struct nfs4_server nfs4_server_lst = 23937c478bd9Sstevel@tonic-gate { &nfs4_server_lst, &nfs4_server_lst }; 23947c478bd9Sstevel@tonic-gate 23957c478bd9Sstevel@tonic-gate kmutex_t nfs4_server_lst_lock; 23967c478bd9Sstevel@tonic-gate 23977c478bd9Sstevel@tonic-gate static void 23987c478bd9Sstevel@tonic-gate nfs4setclientid_init(void) 23997c478bd9Sstevel@tonic-gate { 24007c478bd9Sstevel@tonic-gate mutex_init(&nfs4_server_lst_lock, NULL, MUTEX_DEFAULT, NULL); 24017c478bd9Sstevel@tonic-gate } 24027c478bd9Sstevel@tonic-gate 24037c478bd9Sstevel@tonic-gate static void 24047c478bd9Sstevel@tonic-gate nfs4setclientid_fini(void) 24057c478bd9Sstevel@tonic-gate { 24067c478bd9Sstevel@tonic-gate mutex_destroy(&nfs4_server_lst_lock); 24077c478bd9Sstevel@tonic-gate } 24087c478bd9Sstevel@tonic-gate 24097c478bd9Sstevel@tonic-gate int nfs4_retry_sclid_delay = NFS4_RETRY_SCLID_DELAY; 24107c478bd9Sstevel@tonic-gate int nfs4_num_sclid_retries = NFS4_NUM_SCLID_RETRIES; 24117c478bd9Sstevel@tonic-gate 24127c478bd9Sstevel@tonic-gate /* 24137c478bd9Sstevel@tonic-gate * Set the clientid for the server for "mi". No-op if the clientid is 24147c478bd9Sstevel@tonic-gate * already set. 
24157c478bd9Sstevel@tonic-gate * 24167c478bd9Sstevel@tonic-gate * The recovery boolean should be set to TRUE if this function was called 2417a092743bSek * by the recovery code, and FALSE otherwise. This is used to determine 2418a092743bSek * if we need to call nfs4_start/end_op as well as grab the mi_recovlock 2419a092743bSek * for adding a mntinfo4_t to a nfs4_server_t. 24207c478bd9Sstevel@tonic-gate * 24217c478bd9Sstevel@tonic-gate * Error is returned via 'n4ep'. If there was a 'n4ep->stat' error, then 24227c478bd9Sstevel@tonic-gate * 'n4ep->error' is set to geterrno4(n4ep->stat). 24237c478bd9Sstevel@tonic-gate */ 24247c478bd9Sstevel@tonic-gate void 24257c478bd9Sstevel@tonic-gate nfs4setclientid(mntinfo4_t *mi, cred_t *cr, bool_t recovery, nfs4_error_t *n4ep) 24267c478bd9Sstevel@tonic-gate { 24277c478bd9Sstevel@tonic-gate struct nfs4_server *np; 24287c478bd9Sstevel@tonic-gate struct servinfo4 *svp = mi->mi_curr_serv; 24297c478bd9Sstevel@tonic-gate nfs4_recov_state_t recov_state; 24307c478bd9Sstevel@tonic-gate int num_retries = 0; 24317c478bd9Sstevel@tonic-gate bool_t retry = FALSE; 24327c478bd9Sstevel@tonic-gate cred_t *lcr = NULL; 24337c478bd9Sstevel@tonic-gate int retry_inuse = 1; /* only retry once on NFS4ERR_CLID_INUSE */ 24347c478bd9Sstevel@tonic-gate time_t lease_time = 0; 24357c478bd9Sstevel@tonic-gate 24367c478bd9Sstevel@tonic-gate recov_state.rs_flags = 0; 24377c478bd9Sstevel@tonic-gate recov_state.rs_num_retry_despite_err = 0; 24387c478bd9Sstevel@tonic-gate ASSERT(n4ep != NULL); 24397c478bd9Sstevel@tonic-gate 24407c478bd9Sstevel@tonic-gate recov_retry: 24417c478bd9Sstevel@tonic-gate nfs4_error_zinit(n4ep); 2442a092743bSek if (!recovery) 2443a092743bSek (void) nfs_rw_enter_sig(&mi->mi_recovlock, RW_READER, 0); 2444a092743bSek 24457c478bd9Sstevel@tonic-gate /* This locks np if it is found */ 24467c478bd9Sstevel@tonic-gate np = servinfo4_to_nfs4_server(svp); 24477c478bd9Sstevel@tonic-gate ASSERT(np == NULL || MUTEX_HELD(&np->s_lock)); 
24487c478bd9Sstevel@tonic-gate 24497c478bd9Sstevel@tonic-gate /* 24507c478bd9Sstevel@tonic-gate * If we find the server already in the list, then just 24517c478bd9Sstevel@tonic-gate * return, we've already done SETCLIENTID to that server 24527c478bd9Sstevel@tonic-gate */ 24537c478bd9Sstevel@tonic-gate 24547c478bd9Sstevel@tonic-gate if (np && (np->s_flags & N4S_CLIENTID_SET)) { 24557c478bd9Sstevel@tonic-gate /* 24567c478bd9Sstevel@tonic-gate * XXX - more is needed here. SETCLIENTID may not 24577c478bd9Sstevel@tonic-gate * be completed. A VFS lock may prevent multiple 24587c478bd9Sstevel@tonic-gate * mounts and provide needed serialization. 24597c478bd9Sstevel@tonic-gate */ 24607c478bd9Sstevel@tonic-gate /* add mi to np's mntinfo4_list */ 24617c478bd9Sstevel@tonic-gate nfs4_add_mi_to_server(np, mi); 2462a092743bSek if (!recovery) 2463a092743bSek nfs_rw_exit(&mi->mi_recovlock); 24647c478bd9Sstevel@tonic-gate mutex_exit(&np->s_lock); 24657c478bd9Sstevel@tonic-gate nfs4_server_rele(np); 24667c478bd9Sstevel@tonic-gate return; 24677c478bd9Sstevel@tonic-gate } 24687c478bd9Sstevel@tonic-gate 2469a092743bSek /* 2470a092743bSek * Drop the mi_recovlock since nfs4_start_op will 2471a092743bSek * acquire it again for us. 
2472a092743bSek */ 2473a092743bSek if (!recovery) 2474a092743bSek nfs_rw_exit(&mi->mi_recovlock); 2475a092743bSek 24767c478bd9Sstevel@tonic-gate if (!np) 24777c478bd9Sstevel@tonic-gate np = new_nfs4_server(svp, cr); 24787c478bd9Sstevel@tonic-gate else 24797c478bd9Sstevel@tonic-gate mutex_exit(&np->s_lock); 24807c478bd9Sstevel@tonic-gate 24817c478bd9Sstevel@tonic-gate if (!recovery) { 24827c478bd9Sstevel@tonic-gate n4ep->error = nfs4_start_op(mi, NULL, NULL, &recov_state); 24837c478bd9Sstevel@tonic-gate if (n4ep->error) { 24847c478bd9Sstevel@tonic-gate nfs4_server_rele(np); 24857c478bd9Sstevel@tonic-gate return; 24867c478bd9Sstevel@tonic-gate } 24877c478bd9Sstevel@tonic-gate } 24887c478bd9Sstevel@tonic-gate 24897c478bd9Sstevel@tonic-gate /* 24907c478bd9Sstevel@tonic-gate * Will potentially add np to global list, which transfers 24917c478bd9Sstevel@tonic-gate * ownership of the reference to the list. 24927c478bd9Sstevel@tonic-gate */ 24937c478bd9Sstevel@tonic-gate mutex_enter(&nfs4_server_lst_lock); 24947c478bd9Sstevel@tonic-gate mutex_enter(&np->s_lock); 24957c478bd9Sstevel@tonic-gate 24967c478bd9Sstevel@tonic-gate /* 24977c478bd9Sstevel@tonic-gate * Reset the N4S_CB_PINGED flag. This is used to 24987c478bd9Sstevel@tonic-gate * indicate if we have received a CB_NULL from the 24997c478bd9Sstevel@tonic-gate * server. Also we reset the waiter flag. 25007c478bd9Sstevel@tonic-gate */ 25017c478bd9Sstevel@tonic-gate np->s_flags &= ~(N4S_CB_PINGED | N4S_CB_WAITER); 25027c478bd9Sstevel@tonic-gate 25037c478bd9Sstevel@tonic-gate if (np->s_flags & N4S_CLIENTID_SET) { 25047c478bd9Sstevel@tonic-gate /* XXX copied/pasted from above */ 25057c478bd9Sstevel@tonic-gate /* 25067c478bd9Sstevel@tonic-gate * XXX - more is needed here. SETCLIENTID may not 25077c478bd9Sstevel@tonic-gate * be completed. A VFS lock may prevent multiple 25087c478bd9Sstevel@tonic-gate * mounts and provide needed serialization. 
25097c478bd9Sstevel@tonic-gate */ 25107c478bd9Sstevel@tonic-gate /* add mi to np's mntinfo4_list */ 25117c478bd9Sstevel@tonic-gate nfs4_add_mi_to_server(np, mi); 25127c478bd9Sstevel@tonic-gate mutex_exit(&np->s_lock); 25137c478bd9Sstevel@tonic-gate mutex_exit(&nfs4_server_lst_lock); 25147c478bd9Sstevel@tonic-gate nfs4_server_rele(np); 25157c478bd9Sstevel@tonic-gate if (!recovery) 25167c478bd9Sstevel@tonic-gate nfs4_end_op(mi, NULL, NULL, &recov_state, recovery); 25177c478bd9Sstevel@tonic-gate return; 25187c478bd9Sstevel@tonic-gate } 25197c478bd9Sstevel@tonic-gate 25207c478bd9Sstevel@tonic-gate nfs4setclientid_otw(mi, svp, cr, np, n4ep, &retry_inuse); 25217c478bd9Sstevel@tonic-gate 25227c478bd9Sstevel@tonic-gate if (n4ep->error == EACCES) { 25237c478bd9Sstevel@tonic-gate /* 25247c478bd9Sstevel@tonic-gate * If the uid is set then set the creds for secure mounts 25257c478bd9Sstevel@tonic-gate * by proxy processes such as automountd. 25267c478bd9Sstevel@tonic-gate */ 25277c478bd9Sstevel@tonic-gate (void) nfs_rw_enter_sig(&svp->sv_lock, RW_READER, 0); 25287c478bd9Sstevel@tonic-gate if (svp->sv_secdata->uid != 0) { 25297c478bd9Sstevel@tonic-gate lcr = crdup(cr); 25307c478bd9Sstevel@tonic-gate (void) crsetugid(lcr, svp->sv_secdata->uid, 25317c478bd9Sstevel@tonic-gate crgetgid(cr)); 25327c478bd9Sstevel@tonic-gate crfree(np->s_cred); 25337c478bd9Sstevel@tonic-gate np->s_cred = lcr; 25347c478bd9Sstevel@tonic-gate } 25357c478bd9Sstevel@tonic-gate nfs_rw_exit(&svp->sv_lock); 25367c478bd9Sstevel@tonic-gate 25377c478bd9Sstevel@tonic-gate if (lcr != NULL) 25387c478bd9Sstevel@tonic-gate nfs4setclientid_otw(mi, svp, lcr, np, n4ep, 25397c478bd9Sstevel@tonic-gate &retry_inuse); 25407c478bd9Sstevel@tonic-gate } 25417c478bd9Sstevel@tonic-gate lease_time = np->s_lease_time; 25427c478bd9Sstevel@tonic-gate mutex_exit(&np->s_lock); 25437c478bd9Sstevel@tonic-gate mutex_exit(&nfs4_server_lst_lock); 25447c478bd9Sstevel@tonic-gate 25457c478bd9Sstevel@tonic-gate if (n4ep->error != 0 || 
n4ep->stat != NFS4_OK) { 25467c478bd9Sstevel@tonic-gate /* 25477c478bd9Sstevel@tonic-gate * Start recovery if failover is a possibility. If 25487c478bd9Sstevel@tonic-gate * invoked by the recovery thread itself, then just 25497c478bd9Sstevel@tonic-gate * return and let it handle the failover first. NB: 25507c478bd9Sstevel@tonic-gate * recovery is not allowed if the mount is in progress 25517c478bd9Sstevel@tonic-gate * since the infrastructure is not sufficiently setup 25527c478bd9Sstevel@tonic-gate * to allow it. Just return the error (after suitable 25537c478bd9Sstevel@tonic-gate * retries). 25547c478bd9Sstevel@tonic-gate */ 25557c478bd9Sstevel@tonic-gate if (FAILOVER_MOUNT4(mi) && nfs4_try_failover(n4ep)) { 25567c478bd9Sstevel@tonic-gate (void) nfs4_start_recovery(n4ep, mi, NULL, 25577c478bd9Sstevel@tonic-gate NULL, NULL, NULL, OP_SETCLIENTID, NULL); 25587c478bd9Sstevel@tonic-gate /* 25597c478bd9Sstevel@tonic-gate * Don't retry here, just return and let 25607c478bd9Sstevel@tonic-gate * recovery take over. 25617c478bd9Sstevel@tonic-gate */ 25627c478bd9Sstevel@tonic-gate if (recovery) 25637c478bd9Sstevel@tonic-gate retry = FALSE; 25647c478bd9Sstevel@tonic-gate } else if (nfs4_rpc_retry_error(n4ep->error) || 25657c478bd9Sstevel@tonic-gate n4ep->stat == NFS4ERR_RESOURCE || 25667c478bd9Sstevel@tonic-gate n4ep->stat == NFS4ERR_STALE_CLIENTID) { 25677c478bd9Sstevel@tonic-gate 25687c478bd9Sstevel@tonic-gate retry = TRUE; 25697c478bd9Sstevel@tonic-gate /* 25707c478bd9Sstevel@tonic-gate * Always retry if in recovery or once had 25717c478bd9Sstevel@tonic-gate * contact with the server (but now it's 25727c478bd9Sstevel@tonic-gate * overloaded). 
25737c478bd9Sstevel@tonic-gate */ 25747c478bd9Sstevel@tonic-gate if (recovery == TRUE || 25757c478bd9Sstevel@tonic-gate n4ep->error == ETIMEDOUT || 25767c478bd9Sstevel@tonic-gate n4ep->error == ECONNRESET) 25777c478bd9Sstevel@tonic-gate num_retries = 0; 25787c478bd9Sstevel@tonic-gate } else if (retry_inuse && n4ep->error == 0 && 25797c478bd9Sstevel@tonic-gate n4ep->stat == NFS4ERR_CLID_INUSE) { 25807c478bd9Sstevel@tonic-gate retry = TRUE; 25817c478bd9Sstevel@tonic-gate num_retries = 0; 25827c478bd9Sstevel@tonic-gate } 25837c478bd9Sstevel@tonic-gate } 25847c478bd9Sstevel@tonic-gate 25857c478bd9Sstevel@tonic-gate if (!recovery) 25867c478bd9Sstevel@tonic-gate nfs4_end_op(mi, NULL, NULL, &recov_state, recovery); 25877c478bd9Sstevel@tonic-gate nfs4_server_rele(np); 25887c478bd9Sstevel@tonic-gate 25897c478bd9Sstevel@tonic-gate if (retry && num_retries++ < nfs4_num_sclid_retries) { 25907c478bd9Sstevel@tonic-gate if (retry_inuse) { 25917c478bd9Sstevel@tonic-gate delay(SEC_TO_TICK(lease_time + nfs4_retry_sclid_delay)); 25927c478bd9Sstevel@tonic-gate retry_inuse = 0; 25937c478bd9Sstevel@tonic-gate } else 25947c478bd9Sstevel@tonic-gate delay(SEC_TO_TICK(nfs4_retry_sclid_delay)); 25957c478bd9Sstevel@tonic-gate goto recov_retry; 25967c478bd9Sstevel@tonic-gate } 25977c478bd9Sstevel@tonic-gate 25987c478bd9Sstevel@tonic-gate if (n4ep->error == 0) 25997c478bd9Sstevel@tonic-gate n4ep->error = geterrno4(n4ep->stat); 26007c478bd9Sstevel@tonic-gate } 26017c478bd9Sstevel@tonic-gate 26027c478bd9Sstevel@tonic-gate int nfs4setclientid_otw_debug = 0; 26037c478bd9Sstevel@tonic-gate 26047c478bd9Sstevel@tonic-gate /* 26057c478bd9Sstevel@tonic-gate * This assumes np is locked down. 26067c478bd9Sstevel@tonic-gate * This function handles the recovery of STALE_CLIENTID for SETCLIENTID_CONFRIM, 26077c478bd9Sstevel@tonic-gate * but nothing else; the calling function must be designed to handle those 26087c478bd9Sstevel@tonic-gate * other errors. 
26097c478bd9Sstevel@tonic-gate */ 26107c478bd9Sstevel@tonic-gate static void 26117c478bd9Sstevel@tonic-gate nfs4setclientid_otw(mntinfo4_t *mi, struct servinfo4 *svp, cred_t *cr, 26127c478bd9Sstevel@tonic-gate struct nfs4_server *np, nfs4_error_t *ep, int *retry_inusep) 26137c478bd9Sstevel@tonic-gate { 26147c478bd9Sstevel@tonic-gate COMPOUND4args_clnt args; 26157c478bd9Sstevel@tonic-gate COMPOUND4res_clnt res; 26167c478bd9Sstevel@tonic-gate nfs_argop4 argop[3]; 26177c478bd9Sstevel@tonic-gate SETCLIENTID4args *s_args; 26187c478bd9Sstevel@tonic-gate SETCLIENTID4resok *s_resok; 26197c478bd9Sstevel@tonic-gate int doqueue = 1; 26207c478bd9Sstevel@tonic-gate nfs4_ga_res_t *garp = NULL; 26217c478bd9Sstevel@tonic-gate timespec_t prop_time, after_time; 26227c478bd9Sstevel@tonic-gate verifier4 verf; 26237c478bd9Sstevel@tonic-gate clientid4 tmp_clientid; 26247c478bd9Sstevel@tonic-gate 26257c478bd9Sstevel@tonic-gate ASSERT(MUTEX_HELD(&np->s_lock)); 26267c478bd9Sstevel@tonic-gate 26277c478bd9Sstevel@tonic-gate args.ctag = TAG_SETCLIENTID; 26287c478bd9Sstevel@tonic-gate 26297c478bd9Sstevel@tonic-gate args.array = argop; 26307c478bd9Sstevel@tonic-gate args.array_len = 3; 26317c478bd9Sstevel@tonic-gate 26327c478bd9Sstevel@tonic-gate /* PUTROOTFH */ 26337c478bd9Sstevel@tonic-gate argop[0].argop = OP_PUTROOTFH; 26347c478bd9Sstevel@tonic-gate 26357c478bd9Sstevel@tonic-gate /* GETATTR */ 26367c478bd9Sstevel@tonic-gate argop[1].argop = OP_GETATTR; 26377c478bd9Sstevel@tonic-gate argop[1].nfs_argop4_u.opgetattr.attr_request = FATTR4_LEASE_TIME_MASK; 26387c478bd9Sstevel@tonic-gate argop[1].nfs_argop4_u.opgetattr.mi = mi; 26397c478bd9Sstevel@tonic-gate 26407c478bd9Sstevel@tonic-gate /* SETCLIENTID */ 26417c478bd9Sstevel@tonic-gate argop[2].argop = OP_SETCLIENTID; 26427c478bd9Sstevel@tonic-gate 26437c478bd9Sstevel@tonic-gate s_args = &argop[2].nfs_argop4_u.opsetclientid; 26447c478bd9Sstevel@tonic-gate 26457c478bd9Sstevel@tonic-gate s_args->client.verifier = np->clidtosend.verifier; 
26467c478bd9Sstevel@tonic-gate s_args->client.id_len = np->clidtosend.id_len; 26477c478bd9Sstevel@tonic-gate ASSERT(s_args->client.id_len <= NFS4_OPAQUE_LIMIT); 26487c478bd9Sstevel@tonic-gate s_args->client.id_val = np->clidtosend.id_val; 26497c478bd9Sstevel@tonic-gate 26507c478bd9Sstevel@tonic-gate /* 26517c478bd9Sstevel@tonic-gate * Callback needs to happen on non-RDMA transport 26527c478bd9Sstevel@tonic-gate * Check if we have saved the original knetconfig 26537c478bd9Sstevel@tonic-gate * if so, use that instead. 26547c478bd9Sstevel@tonic-gate */ 26557c478bd9Sstevel@tonic-gate if (svp->sv_origknconf != NULL) 26567c478bd9Sstevel@tonic-gate nfs4_cb_args(np, svp->sv_origknconf, s_args); 26577c478bd9Sstevel@tonic-gate else 26587c478bd9Sstevel@tonic-gate nfs4_cb_args(np, svp->sv_knconf, s_args); 26597c478bd9Sstevel@tonic-gate 26607c478bd9Sstevel@tonic-gate rfs4call(mi, &args, &res, cr, &doqueue, RFSCALL_SOFT, ep); 26617c478bd9Sstevel@tonic-gate 26627c478bd9Sstevel@tonic-gate if (ep->error) 26637c478bd9Sstevel@tonic-gate return; 26647c478bd9Sstevel@tonic-gate 26657c478bd9Sstevel@tonic-gate /* getattr lease_time res */ 26667c478bd9Sstevel@tonic-gate if (res.array_len >= 2) { 26677c478bd9Sstevel@tonic-gate garp = &res.array[1].nfs_resop4_u.opgetattr.ga_res; 26687c478bd9Sstevel@tonic-gate 26697c478bd9Sstevel@tonic-gate #ifndef _LP64 26707c478bd9Sstevel@tonic-gate /* 26717c478bd9Sstevel@tonic-gate * The 32 bit client cannot handle a lease time greater than 26727c478bd9Sstevel@tonic-gate * (INT32_MAX/1000000). This is due to the use of the 26737c478bd9Sstevel@tonic-gate * lease_time in calls to drv_usectohz() in 26747c478bd9Sstevel@tonic-gate * nfs4_renew_lease_thread(). The problem is that 26757c478bd9Sstevel@tonic-gate * drv_usectohz() takes a time_t (which is just a long = 4 26767c478bd9Sstevel@tonic-gate * bytes) as its parameter. The lease_time is multiplied by 26777c478bd9Sstevel@tonic-gate * 1000000 to convert seconds to usecs for the parameter. 
If 26787c478bd9Sstevel@tonic-gate * a number bigger than (INT32_MAX/1000000) is used then we 26797c478bd9Sstevel@tonic-gate * overflow on the 32bit client. 26807c478bd9Sstevel@tonic-gate */ 26817c478bd9Sstevel@tonic-gate if (garp->n4g_ext_res->n4g_leasetime > (INT32_MAX/1000000)) { 26827c478bd9Sstevel@tonic-gate garp->n4g_ext_res->n4g_leasetime = INT32_MAX/1000000; 26837c478bd9Sstevel@tonic-gate } 26847c478bd9Sstevel@tonic-gate #endif 26857c478bd9Sstevel@tonic-gate 26867c478bd9Sstevel@tonic-gate np->s_lease_time = garp->n4g_ext_res->n4g_leasetime; 26877c478bd9Sstevel@tonic-gate 26887c478bd9Sstevel@tonic-gate /* 26897c478bd9Sstevel@tonic-gate * Keep track of the lease period for the mi's 26907c478bd9Sstevel@tonic-gate * mi_msg_list. We need an appropiate time 26917c478bd9Sstevel@tonic-gate * bound to associate past facts with a current 26927c478bd9Sstevel@tonic-gate * event. The lease period is perfect for this. 26937c478bd9Sstevel@tonic-gate */ 26947c478bd9Sstevel@tonic-gate mutex_enter(&mi->mi_msg_list_lock); 26957c478bd9Sstevel@tonic-gate mi->mi_lease_period = np->s_lease_time; 26967c478bd9Sstevel@tonic-gate mutex_exit(&mi->mi_msg_list_lock); 26977c478bd9Sstevel@tonic-gate } 26987c478bd9Sstevel@tonic-gate 26997c478bd9Sstevel@tonic-gate 27007c478bd9Sstevel@tonic-gate if (res.status == NFS4ERR_CLID_INUSE) { 27017c478bd9Sstevel@tonic-gate clientaddr4 *clid_inuse; 27027c478bd9Sstevel@tonic-gate 27037c478bd9Sstevel@tonic-gate if (!(*retry_inusep)) { 27047c478bd9Sstevel@tonic-gate clid_inuse = &res.array->nfs_resop4_u. 27057c478bd9Sstevel@tonic-gate opsetclientid.SETCLIENTID4res_u.client_using; 27067c478bd9Sstevel@tonic-gate 27077c478bd9Sstevel@tonic-gate zcmn_err(mi->mi_zone->zone_id, CE_NOTE, 27087c478bd9Sstevel@tonic-gate "NFS4 mount (SETCLIENTID failed)." 
27097c478bd9Sstevel@tonic-gate " nfs4_client_id.id is in" 27107c478bd9Sstevel@tonic-gate "use already by: r_netid<%s> r_addr<%s>", 27117c478bd9Sstevel@tonic-gate clid_inuse->r_netid, clid_inuse->r_addr); 27127c478bd9Sstevel@tonic-gate } 27137c478bd9Sstevel@tonic-gate 27147c478bd9Sstevel@tonic-gate /* 27157c478bd9Sstevel@tonic-gate * XXX - The client should be more robust in its 27167c478bd9Sstevel@tonic-gate * handling of clientid in use errors (regen another 27177c478bd9Sstevel@tonic-gate * clientid and try again?) 27187c478bd9Sstevel@tonic-gate */ 27197c478bd9Sstevel@tonic-gate (void) xdr_free(xdr_COMPOUND4res_clnt, (caddr_t)&res); 27207c478bd9Sstevel@tonic-gate return; 27217c478bd9Sstevel@tonic-gate } 27227c478bd9Sstevel@tonic-gate 27237c478bd9Sstevel@tonic-gate if (res.status) { 27247c478bd9Sstevel@tonic-gate (void) xdr_free(xdr_COMPOUND4res_clnt, (caddr_t)&res); 27257c478bd9Sstevel@tonic-gate return; 27267c478bd9Sstevel@tonic-gate } 27277c478bd9Sstevel@tonic-gate 27287c478bd9Sstevel@tonic-gate s_resok = &res.array[2].nfs_resop4_u. 
27297c478bd9Sstevel@tonic-gate opsetclientid.SETCLIENTID4res_u.resok4; 27307c478bd9Sstevel@tonic-gate 27317c478bd9Sstevel@tonic-gate tmp_clientid = s_resok->clientid; 27327c478bd9Sstevel@tonic-gate 27337c478bd9Sstevel@tonic-gate verf = s_resok->setclientid_confirm; 27347c478bd9Sstevel@tonic-gate 27357c478bd9Sstevel@tonic-gate #ifdef DEBUG 27367c478bd9Sstevel@tonic-gate if (nfs4setclientid_otw_debug) { 27377c478bd9Sstevel@tonic-gate union { 27387c478bd9Sstevel@tonic-gate clientid4 clientid; 27397c478bd9Sstevel@tonic-gate int foo[2]; 27407c478bd9Sstevel@tonic-gate } cid; 27417c478bd9Sstevel@tonic-gate 27427c478bd9Sstevel@tonic-gate cid.clientid = s_resok->clientid; 27437c478bd9Sstevel@tonic-gate 27447c478bd9Sstevel@tonic-gate zcmn_err(mi->mi_zone->zone_id, CE_NOTE, 27457c478bd9Sstevel@tonic-gate "nfs4setclientid_otw: OK, clientid = %x,%x, " 27467c478bd9Sstevel@tonic-gate "verifier = %" PRIx64 "\n", cid.foo[0], cid.foo[1], verf); 27477c478bd9Sstevel@tonic-gate } 27487c478bd9Sstevel@tonic-gate #endif 27497c478bd9Sstevel@tonic-gate 27507c478bd9Sstevel@tonic-gate (void) xdr_free(xdr_COMPOUND4res_clnt, (caddr_t)&res); 27517c478bd9Sstevel@tonic-gate 27527c478bd9Sstevel@tonic-gate /* Confirm the client id and get the lease_time attribute */ 27537c478bd9Sstevel@tonic-gate 27547c478bd9Sstevel@tonic-gate args.ctag = TAG_SETCLIENTID_CF; 27557c478bd9Sstevel@tonic-gate 27567c478bd9Sstevel@tonic-gate args.array = argop; 27577c478bd9Sstevel@tonic-gate args.array_len = 1; 27587c478bd9Sstevel@tonic-gate 27597c478bd9Sstevel@tonic-gate argop[0].argop = OP_SETCLIENTID_CONFIRM; 27607c478bd9Sstevel@tonic-gate 27617c478bd9Sstevel@tonic-gate argop[0].nfs_argop4_u.opsetclientid_confirm.clientid = tmp_clientid; 27627c478bd9Sstevel@tonic-gate argop[0].nfs_argop4_u.opsetclientid_confirm.setclientid_confirm = verf; 27637c478bd9Sstevel@tonic-gate 27647c478bd9Sstevel@tonic-gate /* used to figure out RTT for np */ 27657c478bd9Sstevel@tonic-gate gethrestime(&prop_time); 
27667c478bd9Sstevel@tonic-gate 27677c478bd9Sstevel@tonic-gate NFS4_DEBUG(nfs4_client_lease_debug, (CE_NOTE, "nfs4setlientid_otw: " 27687c478bd9Sstevel@tonic-gate "start time: %ld sec %ld nsec", prop_time.tv_sec, 27697c478bd9Sstevel@tonic-gate prop_time.tv_nsec)); 27707c478bd9Sstevel@tonic-gate 27717c478bd9Sstevel@tonic-gate rfs4call(mi, &args, &res, cr, &doqueue, 0, ep); 27727c478bd9Sstevel@tonic-gate 27737c478bd9Sstevel@tonic-gate gethrestime(&after_time); 27747c478bd9Sstevel@tonic-gate np->propagation_delay.tv_sec = 27757c478bd9Sstevel@tonic-gate MAX(1, after_time.tv_sec - prop_time.tv_sec); 27767c478bd9Sstevel@tonic-gate 27777c478bd9Sstevel@tonic-gate NFS4_DEBUG(nfs4_client_lease_debug, (CE_NOTE, "nfs4setlcientid_otw: " 27787c478bd9Sstevel@tonic-gate "finish time: %ld sec ", after_time.tv_sec)); 27797c478bd9Sstevel@tonic-gate 27807c478bd9Sstevel@tonic-gate NFS4_DEBUG(nfs4_client_lease_debug, (CE_NOTE, "nfs4setclientid_otw: " 27817c478bd9Sstevel@tonic-gate "propagation delay set to %ld sec", 27827c478bd9Sstevel@tonic-gate np->propagation_delay.tv_sec)); 27837c478bd9Sstevel@tonic-gate 27847c478bd9Sstevel@tonic-gate if (ep->error) 27857c478bd9Sstevel@tonic-gate return; 27867c478bd9Sstevel@tonic-gate 27877c478bd9Sstevel@tonic-gate if (res.status == NFS4ERR_CLID_INUSE) { 27887c478bd9Sstevel@tonic-gate clientaddr4 *clid_inuse; 27897c478bd9Sstevel@tonic-gate 27907c478bd9Sstevel@tonic-gate if (!(*retry_inusep)) { 27917c478bd9Sstevel@tonic-gate clid_inuse = &res.array->nfs_resop4_u. 27927c478bd9Sstevel@tonic-gate opsetclientid.SETCLIENTID4res_u.client_using; 27937c478bd9Sstevel@tonic-gate 27947c478bd9Sstevel@tonic-gate zcmn_err(mi->mi_zone->zone_id, CE_NOTE, 27957c478bd9Sstevel@tonic-gate "SETCLIENTID_CONFIRM failed. 
" 27967c478bd9Sstevel@tonic-gate "nfs4_client_id.id is in use already by: " 27977c478bd9Sstevel@tonic-gate "r_netid<%s> r_addr<%s>", 27987c478bd9Sstevel@tonic-gate clid_inuse->r_netid, clid_inuse->r_addr); 27997c478bd9Sstevel@tonic-gate } 28007c478bd9Sstevel@tonic-gate 28017c478bd9Sstevel@tonic-gate (void) xdr_free(xdr_COMPOUND4res_clnt, (caddr_t)&res); 28027c478bd9Sstevel@tonic-gate return; 28037c478bd9Sstevel@tonic-gate } 28047c478bd9Sstevel@tonic-gate 28057c478bd9Sstevel@tonic-gate if (res.status) { 28067c478bd9Sstevel@tonic-gate (void) xdr_free(xdr_COMPOUND4res_clnt, (caddr_t)&res); 28077c478bd9Sstevel@tonic-gate return; 28087c478bd9Sstevel@tonic-gate } 28097c478bd9Sstevel@tonic-gate 28107c478bd9Sstevel@tonic-gate if (!(np->s_flags & N4S_INSERTED)) { 28117c478bd9Sstevel@tonic-gate ASSERT(MUTEX_HELD(&nfs4_server_lst_lock)); 28127c478bd9Sstevel@tonic-gate insque(np, &nfs4_server_lst); 28137c478bd9Sstevel@tonic-gate ASSERT(MUTEX_HELD(&np->s_lock)); 28147c478bd9Sstevel@tonic-gate np->s_flags |= N4S_INSERTED; 28157c478bd9Sstevel@tonic-gate np->s_refcnt++; /* list gets a reference */ 28167c478bd9Sstevel@tonic-gate } 28177c478bd9Sstevel@tonic-gate 28187c478bd9Sstevel@tonic-gate np->clientid = tmp_clientid; 28197c478bd9Sstevel@tonic-gate np->s_flags |= N4S_CLIENTID_SET; 28207c478bd9Sstevel@tonic-gate 28217c478bd9Sstevel@tonic-gate /* Add mi to np's mntinfo4 list */ 28227c478bd9Sstevel@tonic-gate nfs4_add_mi_to_server(np, mi); 28237c478bd9Sstevel@tonic-gate 28247c478bd9Sstevel@tonic-gate if (np->lease_valid == NFS4_LEASE_NOT_STARTED) { 28257c478bd9Sstevel@tonic-gate /* 28267c478bd9Sstevel@tonic-gate * Start lease management thread. 28277c478bd9Sstevel@tonic-gate * Keep trying until we succeed. 
28287c478bd9Sstevel@tonic-gate */ 28297c478bd9Sstevel@tonic-gate 28307c478bd9Sstevel@tonic-gate np->s_refcnt++; /* pass reference to thread */ 28317c478bd9Sstevel@tonic-gate (void) zthread_create(NULL, 0, nfs4_renew_lease_thread, np, 0, 28327c478bd9Sstevel@tonic-gate minclsyspri); 28337c478bd9Sstevel@tonic-gate } 28347c478bd9Sstevel@tonic-gate 28357c478bd9Sstevel@tonic-gate (void) xdr_free(xdr_COMPOUND4res_clnt, (caddr_t)&res); 28367c478bd9Sstevel@tonic-gate } 28377c478bd9Sstevel@tonic-gate 28387c478bd9Sstevel@tonic-gate /* 28397c478bd9Sstevel@tonic-gate * Add mi to sp's mntinfo4_list if it isn't already in the list. Makes 28407c478bd9Sstevel@tonic-gate * mi's clientid the same as sp's. 28417c478bd9Sstevel@tonic-gate * Assumes sp is locked down. 28427c478bd9Sstevel@tonic-gate */ 28437c478bd9Sstevel@tonic-gate void 28447c478bd9Sstevel@tonic-gate nfs4_add_mi_to_server(nfs4_server_t *sp, mntinfo4_t *mi) 28457c478bd9Sstevel@tonic-gate { 28467c478bd9Sstevel@tonic-gate mntinfo4_t *tmi; 28477c478bd9Sstevel@tonic-gate int in_list = 0; 28487c478bd9Sstevel@tonic-gate 2849a092743bSek ASSERT(nfs_rw_lock_held(&mi->mi_recovlock, RW_READER) || 2850a092743bSek nfs_rw_lock_held(&mi->mi_recovlock, RW_WRITER)); 28517c478bd9Sstevel@tonic-gate ASSERT(sp != &nfs4_server_lst); 28527c478bd9Sstevel@tonic-gate ASSERT(MUTEX_HELD(&sp->s_lock)); 28537c478bd9Sstevel@tonic-gate 28547c478bd9Sstevel@tonic-gate NFS4_DEBUG(nfs4_client_lease_debug, (CE_NOTE, 28557c478bd9Sstevel@tonic-gate "nfs4_add_mi_to_server: add mi %p to sp %p", 28567c478bd9Sstevel@tonic-gate (void*)mi, (void*)sp)); 28577c478bd9Sstevel@tonic-gate 28587c478bd9Sstevel@tonic-gate for (tmi = sp->mntinfo4_list; 28597c478bd9Sstevel@tonic-gate tmi != NULL; 28607c478bd9Sstevel@tonic-gate tmi = tmi->mi_clientid_next) { 28617c478bd9Sstevel@tonic-gate if (tmi == mi) { 28627c478bd9Sstevel@tonic-gate NFS4_DEBUG(nfs4_client_lease_debug, 28637c478bd9Sstevel@tonic-gate (CE_NOTE, 28647c478bd9Sstevel@tonic-gate "nfs4_add_mi_to_server: mi in 
list")); 28657c478bd9Sstevel@tonic-gate in_list = 1; 28667c478bd9Sstevel@tonic-gate } 28677c478bd9Sstevel@tonic-gate } 28687c478bd9Sstevel@tonic-gate 28697c478bd9Sstevel@tonic-gate /* 28707c478bd9Sstevel@tonic-gate * First put a hold on the mntinfo4's vfsp so that references via 28717c478bd9Sstevel@tonic-gate * mntinfo4_list will be valid. 28727c478bd9Sstevel@tonic-gate */ 28737c478bd9Sstevel@tonic-gate if (!in_list) 28747c478bd9Sstevel@tonic-gate VFS_HOLD(mi->mi_vfsp); 28757c478bd9Sstevel@tonic-gate 28767c478bd9Sstevel@tonic-gate NFS4_DEBUG(nfs4_client_lease_debug, (CE_NOTE, "nfs4_add_mi_to_server: " 28777c478bd9Sstevel@tonic-gate "hold vfs %p for mi: %p", (void*)mi->mi_vfsp, (void*)mi)); 28787c478bd9Sstevel@tonic-gate 28797c478bd9Sstevel@tonic-gate if (!in_list) { 28807c478bd9Sstevel@tonic-gate if (sp->mntinfo4_list) 28817c478bd9Sstevel@tonic-gate sp->mntinfo4_list->mi_clientid_prev = mi; 28827c478bd9Sstevel@tonic-gate mi->mi_clientid_next = sp->mntinfo4_list; 28837c478bd9Sstevel@tonic-gate sp->mntinfo4_list = mi; 28847c478bd9Sstevel@tonic-gate mi->mi_srvsettime = gethrestime_sec(); 28857c478bd9Sstevel@tonic-gate } 28867c478bd9Sstevel@tonic-gate 28877c478bd9Sstevel@tonic-gate /* set mi's clientid to that of sp's for later matching */ 28887c478bd9Sstevel@tonic-gate mi->mi_clientid = sp->clientid; 28897c478bd9Sstevel@tonic-gate 28907c478bd9Sstevel@tonic-gate /* 28917c478bd9Sstevel@tonic-gate * Update the clientid for any other mi's belonging to sp. This 28927c478bd9Sstevel@tonic-gate * must be done here while we hold sp->s_lock, so that 28937c478bd9Sstevel@tonic-gate * find_nfs4_server() continues to work. 
28947c478bd9Sstevel@tonic-gate */ 28957c478bd9Sstevel@tonic-gate 28967c478bd9Sstevel@tonic-gate for (tmi = sp->mntinfo4_list; 28977c478bd9Sstevel@tonic-gate tmi != NULL; 28987c478bd9Sstevel@tonic-gate tmi = tmi->mi_clientid_next) { 28997c478bd9Sstevel@tonic-gate if (tmi != mi) { 29007c478bd9Sstevel@tonic-gate tmi->mi_clientid = sp->clientid; 29017c478bd9Sstevel@tonic-gate } 29027c478bd9Sstevel@tonic-gate } 29037c478bd9Sstevel@tonic-gate } 29047c478bd9Sstevel@tonic-gate 29057c478bd9Sstevel@tonic-gate /* 29067c478bd9Sstevel@tonic-gate * Remove the mi from sp's mntinfo4_list and release its reference. 29077c478bd9Sstevel@tonic-gate * Exception: if mi still has open files, flag it for later removal (when 29087c478bd9Sstevel@tonic-gate * all the files are closed). 29097c478bd9Sstevel@tonic-gate * 29107c478bd9Sstevel@tonic-gate * If this is the last mntinfo4 in sp's list then tell the lease renewal 29117c478bd9Sstevel@tonic-gate * thread to exit. 29127c478bd9Sstevel@tonic-gate */ 29137c478bd9Sstevel@tonic-gate static void 29147c478bd9Sstevel@tonic-gate nfs4_remove_mi_from_server_nolock(mntinfo4_t *mi, nfs4_server_t *sp) 29157c478bd9Sstevel@tonic-gate { 29167c478bd9Sstevel@tonic-gate NFS4_DEBUG(nfs4_client_lease_debug, (CE_NOTE, 29177c478bd9Sstevel@tonic-gate "nfs4_remove_mi_from_server_nolock: remove mi %p from sp %p", 29187c478bd9Sstevel@tonic-gate (void*)mi, (void*)sp)); 29197c478bd9Sstevel@tonic-gate 29207c478bd9Sstevel@tonic-gate ASSERT(sp != NULL); 29217c478bd9Sstevel@tonic-gate ASSERT(MUTEX_HELD(&sp->s_lock)); 29227c478bd9Sstevel@tonic-gate ASSERT(mi->mi_open_files >= 0); 29237c478bd9Sstevel@tonic-gate 29247c478bd9Sstevel@tonic-gate /* 29257c478bd9Sstevel@tonic-gate * First make sure this mntinfo4 can be taken off of the list, 29267c478bd9Sstevel@tonic-gate * ie: it doesn't have any open files remaining. 
29277c478bd9Sstevel@tonic-gate */ 29287c478bd9Sstevel@tonic-gate if (mi->mi_open_files > 0) { 29297c478bd9Sstevel@tonic-gate NFS4_DEBUG(nfs4_client_lease_debug, (CE_NOTE, 29307c478bd9Sstevel@tonic-gate "nfs4_remove_mi_from_server_nolock: don't " 29317c478bd9Sstevel@tonic-gate "remove mi since it still has files open")); 29327c478bd9Sstevel@tonic-gate 29337c478bd9Sstevel@tonic-gate mutex_enter(&mi->mi_lock); 29347c478bd9Sstevel@tonic-gate mi->mi_flags |= MI4_REMOVE_ON_LAST_CLOSE; 29357c478bd9Sstevel@tonic-gate mutex_exit(&mi->mi_lock); 29367c478bd9Sstevel@tonic-gate return; 29377c478bd9Sstevel@tonic-gate } 29387c478bd9Sstevel@tonic-gate 29397c478bd9Sstevel@tonic-gate remove_mi(sp, mi); 29407c478bd9Sstevel@tonic-gate 29417c478bd9Sstevel@tonic-gate if (sp->mntinfo4_list == NULL) { 29427c478bd9Sstevel@tonic-gate /* last fs unmounted, kill the thread */ 29437c478bd9Sstevel@tonic-gate NFS4_DEBUG(nfs4_client_lease_debug, (CE_NOTE, 29447c478bd9Sstevel@tonic-gate "remove_mi_from_nfs4_server_nolock: kill the thread")); 29457c478bd9Sstevel@tonic-gate nfs4_mark_srv_dead(sp); 29467c478bd9Sstevel@tonic-gate } 29477c478bd9Sstevel@tonic-gate } 29487c478bd9Sstevel@tonic-gate 29497c478bd9Sstevel@tonic-gate /* 29507c478bd9Sstevel@tonic-gate * Remove mi from sp's mntinfo4_list and release the vfs reference. 29517c478bd9Sstevel@tonic-gate */ 29527c478bd9Sstevel@tonic-gate static void 29537c478bd9Sstevel@tonic-gate remove_mi(nfs4_server_t *sp, mntinfo4_t *mi) 29547c478bd9Sstevel@tonic-gate { 29557c478bd9Sstevel@tonic-gate ASSERT(MUTEX_HELD(&sp->s_lock)); 29567c478bd9Sstevel@tonic-gate 29577c478bd9Sstevel@tonic-gate /* 29587c478bd9Sstevel@tonic-gate * We release a reference, and the caller must still have a 29597c478bd9Sstevel@tonic-gate * reference. 
29607c478bd9Sstevel@tonic-gate */ 29617c478bd9Sstevel@tonic-gate ASSERT(mi->mi_vfsp->vfs_count >= 2); 29627c478bd9Sstevel@tonic-gate 29637c478bd9Sstevel@tonic-gate if (mi->mi_clientid_prev) { 29647c478bd9Sstevel@tonic-gate mi->mi_clientid_prev->mi_clientid_next = mi->mi_clientid_next; 29657c478bd9Sstevel@tonic-gate } else { 29667c478bd9Sstevel@tonic-gate /* This is the first mi in sp's mntinfo4_list */ 29677c478bd9Sstevel@tonic-gate /* 29687c478bd9Sstevel@tonic-gate * Make sure the first mntinfo4 in the list is the actual 29697c478bd9Sstevel@tonic-gate * mntinfo4 passed in. 29707c478bd9Sstevel@tonic-gate */ 29717c478bd9Sstevel@tonic-gate ASSERT(sp->mntinfo4_list == mi); 29727c478bd9Sstevel@tonic-gate 29737c478bd9Sstevel@tonic-gate sp->mntinfo4_list = mi->mi_clientid_next; 29747c478bd9Sstevel@tonic-gate } 29757c478bd9Sstevel@tonic-gate if (mi->mi_clientid_next) 29767c478bd9Sstevel@tonic-gate mi->mi_clientid_next->mi_clientid_prev = mi->mi_clientid_prev; 29777c478bd9Sstevel@tonic-gate 29787c478bd9Sstevel@tonic-gate /* Now mark the mntinfo4's links as being removed */ 29797c478bd9Sstevel@tonic-gate mi->mi_clientid_prev = mi->mi_clientid_next = NULL; 29807c478bd9Sstevel@tonic-gate 29817c478bd9Sstevel@tonic-gate VFS_RELE(mi->mi_vfsp); 29827c478bd9Sstevel@tonic-gate } 29837c478bd9Sstevel@tonic-gate 29847c478bd9Sstevel@tonic-gate /* 29857c478bd9Sstevel@tonic-gate * Free all the entries in sp's mntinfo4_list. 
29867c478bd9Sstevel@tonic-gate */ 29877c478bd9Sstevel@tonic-gate static void 29887c478bd9Sstevel@tonic-gate remove_all_mi(nfs4_server_t *sp) 29897c478bd9Sstevel@tonic-gate { 29907c478bd9Sstevel@tonic-gate mntinfo4_t *mi; 29917c478bd9Sstevel@tonic-gate 29927c478bd9Sstevel@tonic-gate ASSERT(MUTEX_HELD(&sp->s_lock)); 29937c478bd9Sstevel@tonic-gate 29947c478bd9Sstevel@tonic-gate while (sp->mntinfo4_list != NULL) { 29957c478bd9Sstevel@tonic-gate mi = sp->mntinfo4_list; 29967c478bd9Sstevel@tonic-gate /* 29977c478bd9Sstevel@tonic-gate * Grab a reference in case there is only one left (which 29987c478bd9Sstevel@tonic-gate * remove_mi() frees). 29997c478bd9Sstevel@tonic-gate */ 30007c478bd9Sstevel@tonic-gate VFS_HOLD(mi->mi_vfsp); 30017c478bd9Sstevel@tonic-gate remove_mi(sp, mi); 30027c478bd9Sstevel@tonic-gate VFS_RELE(mi->mi_vfsp); 30037c478bd9Sstevel@tonic-gate } 30047c478bd9Sstevel@tonic-gate } 30057c478bd9Sstevel@tonic-gate 30067c478bd9Sstevel@tonic-gate /* 30077c478bd9Sstevel@tonic-gate * Remove the mi from sp's mntinfo4_list as above, and rele the vfs. 30087c478bd9Sstevel@tonic-gate * 30097c478bd9Sstevel@tonic-gate * This version can be called with a null nfs4_server_t arg, 30107c478bd9Sstevel@tonic-gate * and will either find the right one and handle locking, or 30117c478bd9Sstevel@tonic-gate * do nothing because the mi wasn't added to an sp's mntinfo4_list. 
30127c478bd9Sstevel@tonic-gate */ 30137c478bd9Sstevel@tonic-gate void 30147c478bd9Sstevel@tonic-gate nfs4_remove_mi_from_server(mntinfo4_t *mi, nfs4_server_t *esp) 30157c478bd9Sstevel@tonic-gate { 30167c478bd9Sstevel@tonic-gate nfs4_server_t *sp; 30177c478bd9Sstevel@tonic-gate 30187c478bd9Sstevel@tonic-gate if (esp == NULL) { 30197c478bd9Sstevel@tonic-gate (void) nfs_rw_enter_sig(&mi->mi_recovlock, RW_READER, 0); 30207c478bd9Sstevel@tonic-gate sp = find_nfs4_server_all(mi, 1); 30217c478bd9Sstevel@tonic-gate } else 30227c478bd9Sstevel@tonic-gate sp = esp; 30237c478bd9Sstevel@tonic-gate 30247c478bd9Sstevel@tonic-gate if (sp != NULL) 30257c478bd9Sstevel@tonic-gate nfs4_remove_mi_from_server_nolock(mi, sp); 30267c478bd9Sstevel@tonic-gate 30277c478bd9Sstevel@tonic-gate /* 30287c478bd9Sstevel@tonic-gate * If we had a valid esp as input, the calling function will be 30297c478bd9Sstevel@tonic-gate * responsible for unlocking the esp nfs4_server. 30307c478bd9Sstevel@tonic-gate */ 30317c478bd9Sstevel@tonic-gate if (esp == NULL) { 30327c478bd9Sstevel@tonic-gate if (sp != NULL) 30337c478bd9Sstevel@tonic-gate mutex_exit(&sp->s_lock); 30347c478bd9Sstevel@tonic-gate nfs_rw_exit(&mi->mi_recovlock); 30357c478bd9Sstevel@tonic-gate if (sp != NULL) 30367c478bd9Sstevel@tonic-gate nfs4_server_rele(sp); 30377c478bd9Sstevel@tonic-gate } 30387c478bd9Sstevel@tonic-gate } 30397c478bd9Sstevel@tonic-gate 30407c478bd9Sstevel@tonic-gate /* 30417c478bd9Sstevel@tonic-gate * Return TRUE if the given server has any non-unmounted filesystems. 
30427c478bd9Sstevel@tonic-gate */ 30437c478bd9Sstevel@tonic-gate 30447c478bd9Sstevel@tonic-gate bool_t 30457c478bd9Sstevel@tonic-gate nfs4_fs_active(nfs4_server_t *sp) 30467c478bd9Sstevel@tonic-gate { 30477c478bd9Sstevel@tonic-gate mntinfo4_t *mi; 30487c478bd9Sstevel@tonic-gate 30497c478bd9Sstevel@tonic-gate ASSERT(MUTEX_HELD(&sp->s_lock)); 30507c478bd9Sstevel@tonic-gate 30517c478bd9Sstevel@tonic-gate for (mi = sp->mntinfo4_list; mi != NULL; mi = mi->mi_clientid_next) { 30527c478bd9Sstevel@tonic-gate if (!(mi->mi_vfsp->vfs_flag & VFS_UNMOUNTED)) 30537c478bd9Sstevel@tonic-gate return (TRUE); 30547c478bd9Sstevel@tonic-gate } 30557c478bd9Sstevel@tonic-gate 30567c478bd9Sstevel@tonic-gate return (FALSE); 30577c478bd9Sstevel@tonic-gate } 30587c478bd9Sstevel@tonic-gate 30597c478bd9Sstevel@tonic-gate /* 30607c478bd9Sstevel@tonic-gate * Mark sp as finished and notify any waiters. 30617c478bd9Sstevel@tonic-gate */ 30627c478bd9Sstevel@tonic-gate 30637c478bd9Sstevel@tonic-gate void 30647c478bd9Sstevel@tonic-gate nfs4_mark_srv_dead(nfs4_server_t *sp) 30657c478bd9Sstevel@tonic-gate { 30667c478bd9Sstevel@tonic-gate ASSERT(MUTEX_HELD(&sp->s_lock)); 30677c478bd9Sstevel@tonic-gate 30687c478bd9Sstevel@tonic-gate sp->s_thread_exit = NFS4_THREAD_EXIT; 30697c478bd9Sstevel@tonic-gate cv_broadcast(&sp->cv_thread_exit); 30707c478bd9Sstevel@tonic-gate } 30717c478bd9Sstevel@tonic-gate 30727c478bd9Sstevel@tonic-gate /* 30737c478bd9Sstevel@tonic-gate * Create a new nfs4_server_t structure. 30747c478bd9Sstevel@tonic-gate * Returns new node unlocked and not in list, but with a reference count of 30757c478bd9Sstevel@tonic-gate * 1. 
30767c478bd9Sstevel@tonic-gate */ 30777c478bd9Sstevel@tonic-gate struct nfs4_server * 30787c478bd9Sstevel@tonic-gate new_nfs4_server(struct servinfo4 *svp, cred_t *cr) 30797c478bd9Sstevel@tonic-gate { 30807c478bd9Sstevel@tonic-gate struct nfs4_server *np; 30817c478bd9Sstevel@tonic-gate timespec_t tt; 30827c478bd9Sstevel@tonic-gate union { 30837c478bd9Sstevel@tonic-gate struct { 30847c478bd9Sstevel@tonic-gate uint32_t sec; 30857c478bd9Sstevel@tonic-gate uint32_t subsec; 30867c478bd9Sstevel@tonic-gate } un_curtime; 30877c478bd9Sstevel@tonic-gate verifier4 un_verifier; 30887c478bd9Sstevel@tonic-gate } nfs4clientid_verifier; 30897c478bd9Sstevel@tonic-gate char id_val[] = "Solaris: %s, NFSv4 kernel client"; 30907c478bd9Sstevel@tonic-gate int len; 30917c478bd9Sstevel@tonic-gate 30927c478bd9Sstevel@tonic-gate np = kmem_zalloc(sizeof (struct nfs4_server), KM_SLEEP); 30937c478bd9Sstevel@tonic-gate np->saddr.len = svp->sv_addr.len; 30947c478bd9Sstevel@tonic-gate np->saddr.maxlen = svp->sv_addr.maxlen; 30957c478bd9Sstevel@tonic-gate np->saddr.buf = kmem_alloc(svp->sv_addr.maxlen, KM_SLEEP); 30967c478bd9Sstevel@tonic-gate bcopy(svp->sv_addr.buf, np->saddr.buf, svp->sv_addr.len); 30977c478bd9Sstevel@tonic-gate np->s_refcnt = 1; 30987c478bd9Sstevel@tonic-gate 30997c478bd9Sstevel@tonic-gate /* 31007c478bd9Sstevel@tonic-gate * Build the nfs_client_id4 for this server mount. Ensure 31017c478bd9Sstevel@tonic-gate * the verifier is useful and that the identification is 31027c478bd9Sstevel@tonic-gate * somehow based on the server's address for the case of 31037c478bd9Sstevel@tonic-gate * multi-homed servers. 
31047c478bd9Sstevel@tonic-gate */ 31057c478bd9Sstevel@tonic-gate nfs4clientid_verifier.un_verifier = 0; 31067c478bd9Sstevel@tonic-gate gethrestime(&tt); 31077c478bd9Sstevel@tonic-gate nfs4clientid_verifier.un_curtime.sec = (uint32_t)tt.tv_sec; 31087c478bd9Sstevel@tonic-gate nfs4clientid_verifier.un_curtime.subsec = (uint32_t)tt.tv_nsec; 31097c478bd9Sstevel@tonic-gate np->clidtosend.verifier = nfs4clientid_verifier.un_verifier; 31107c478bd9Sstevel@tonic-gate 31117c478bd9Sstevel@tonic-gate /* 31127c478bd9Sstevel@tonic-gate * calculate the length of the opaque identifier. Subtract 2 31137c478bd9Sstevel@tonic-gate * for the "%s" and add the traditional +1 for null 31147c478bd9Sstevel@tonic-gate * termination. 31157c478bd9Sstevel@tonic-gate */ 31167c478bd9Sstevel@tonic-gate len = strlen(id_val) - 2 + strlen(uts_nodename()) + 1; 31177c478bd9Sstevel@tonic-gate np->clidtosend.id_len = len + np->saddr.maxlen; 31187c478bd9Sstevel@tonic-gate 31197c478bd9Sstevel@tonic-gate np->clidtosend.id_val = kmem_alloc(np->clidtosend.id_len, KM_SLEEP); 31207c478bd9Sstevel@tonic-gate (void) sprintf(np->clidtosend.id_val, id_val, uts_nodename()); 31217c478bd9Sstevel@tonic-gate bcopy(np->saddr.buf, &np->clidtosend.id_val[len], np->saddr.len); 31227c478bd9Sstevel@tonic-gate 31237c478bd9Sstevel@tonic-gate np->s_flags = 0; 31247c478bd9Sstevel@tonic-gate np->mntinfo4_list = NULL; 31257c478bd9Sstevel@tonic-gate /* save cred for issuing rfs4calls inside the renew thread */ 31267c478bd9Sstevel@tonic-gate crhold(cr); 31277c478bd9Sstevel@tonic-gate np->s_cred = cr; 31287c478bd9Sstevel@tonic-gate cv_init(&np->cv_thread_exit, NULL, CV_DEFAULT, NULL); 31297c478bd9Sstevel@tonic-gate mutex_init(&np->s_lock, NULL, MUTEX_DEFAULT, NULL); 31307c478bd9Sstevel@tonic-gate nfs_rw_init(&np->s_recovlock, NULL, RW_DEFAULT, NULL); 31317c478bd9Sstevel@tonic-gate list_create(&np->s_deleg_list, sizeof (rnode4_t), 31327c478bd9Sstevel@tonic-gate offsetof(rnode4_t, r_deleg_link)); 31337c478bd9Sstevel@tonic-gate 
np->s_thread_exit = 0; 31347c478bd9Sstevel@tonic-gate np->state_ref_count = 0; 31357c478bd9Sstevel@tonic-gate np->lease_valid = NFS4_LEASE_NOT_STARTED; 31367c478bd9Sstevel@tonic-gate cv_init(&np->s_cv_otw_count, NULL, CV_DEFAULT, NULL); 31377c478bd9Sstevel@tonic-gate np->s_otw_call_count = 0; 31387c478bd9Sstevel@tonic-gate cv_init(&np->wait_cb_null, NULL, CV_DEFAULT, NULL); 31397c478bd9Sstevel@tonic-gate np->zoneid = getzoneid(); 31407c478bd9Sstevel@tonic-gate np->zone_globals = nfs4_get_callback_globals(); 31417c478bd9Sstevel@tonic-gate ASSERT(np->zone_globals != NULL); 31427c478bd9Sstevel@tonic-gate return (np); 31437c478bd9Sstevel@tonic-gate } 31447c478bd9Sstevel@tonic-gate 31457c478bd9Sstevel@tonic-gate /* 31467c478bd9Sstevel@tonic-gate * Create a new nfs4_server_t structure and add it to the list. 31477c478bd9Sstevel@tonic-gate * Returns new node locked; reference must eventually be freed. 31487c478bd9Sstevel@tonic-gate */ 31497c478bd9Sstevel@tonic-gate static struct nfs4_server * 31507c478bd9Sstevel@tonic-gate add_new_nfs4_server(struct servinfo4 *svp, cred_t *cr) 31517c478bd9Sstevel@tonic-gate { 31527c478bd9Sstevel@tonic-gate nfs4_server_t *sp; 31537c478bd9Sstevel@tonic-gate 31547c478bd9Sstevel@tonic-gate ASSERT(MUTEX_HELD(&nfs4_server_lst_lock)); 31557c478bd9Sstevel@tonic-gate sp = new_nfs4_server(svp, cr); 31567c478bd9Sstevel@tonic-gate mutex_enter(&sp->s_lock); 31577c478bd9Sstevel@tonic-gate insque(sp, &nfs4_server_lst); 31587c478bd9Sstevel@tonic-gate sp->s_refcnt++; /* list gets a reference */ 31597c478bd9Sstevel@tonic-gate sp->clientid = 0; 31607c478bd9Sstevel@tonic-gate sp->s_flags |= N4S_INSERTED; 31617c478bd9Sstevel@tonic-gate return (sp); 31627c478bd9Sstevel@tonic-gate } 31637c478bd9Sstevel@tonic-gate 31647c478bd9Sstevel@tonic-gate int nfs4_server_t_debug = 0; 31657c478bd9Sstevel@tonic-gate 31667c478bd9Sstevel@tonic-gate #ifdef lint 31677c478bd9Sstevel@tonic-gate extern void 31687c478bd9Sstevel@tonic-gate dumpnfs4slist(char *, mntinfo4_t *, 
clientid4, servinfo4_t *); 31697c478bd9Sstevel@tonic-gate #endif 31707c478bd9Sstevel@tonic-gate 31717c478bd9Sstevel@tonic-gate #ifndef lint 31727c478bd9Sstevel@tonic-gate #ifdef DEBUG 31737c478bd9Sstevel@tonic-gate void 31747c478bd9Sstevel@tonic-gate dumpnfs4slist(char *txt, mntinfo4_t *mi, clientid4 clientid, servinfo4_t *srv_p) 31757c478bd9Sstevel@tonic-gate { 31767c478bd9Sstevel@tonic-gate int hash16(void *p, int len); 31777c478bd9Sstevel@tonic-gate nfs4_server_t *np; 31787c478bd9Sstevel@tonic-gate 31797c478bd9Sstevel@tonic-gate NFS4_DEBUG(nfs4_server_t_debug, (CE_NOTE, 31807c478bd9Sstevel@tonic-gate "dumping nfs4_server_t list in %s", txt)); 31817c478bd9Sstevel@tonic-gate NFS4_DEBUG(nfs4_server_t_debug, (CE_CONT, 31827c478bd9Sstevel@tonic-gate "mi 0x%p, want clientid %llx, addr %d/%04X", 31837c478bd9Sstevel@tonic-gate mi, (longlong_t)clientid, srv_p->sv_addr.len, 31847c478bd9Sstevel@tonic-gate hash16((void *)srv_p->sv_addr.buf, srv_p->sv_addr.len))); 31857c478bd9Sstevel@tonic-gate for (np = nfs4_server_lst.forw; np != &nfs4_server_lst; 31867c478bd9Sstevel@tonic-gate np = np->forw) { 31877c478bd9Sstevel@tonic-gate NFS4_DEBUG(nfs4_server_t_debug, (CE_CONT, 31887c478bd9Sstevel@tonic-gate "node 0x%p, clientid %llx, addr %d/%04X, cnt %d", 31897c478bd9Sstevel@tonic-gate np, (longlong_t)np->clientid, np->saddr.len, 31907c478bd9Sstevel@tonic-gate hash16((void *)np->saddr.buf, np->saddr.len), 31917c478bd9Sstevel@tonic-gate np->state_ref_count)); 31927c478bd9Sstevel@tonic-gate if (np->saddr.len == srv_p->sv_addr.len && 31937c478bd9Sstevel@tonic-gate bcmp(np->saddr.buf, srv_p->sv_addr.buf, 31947c478bd9Sstevel@tonic-gate np->saddr.len) == 0) 31957c478bd9Sstevel@tonic-gate NFS4_DEBUG(nfs4_server_t_debug, (CE_CONT, 31967c478bd9Sstevel@tonic-gate " - address matches")); 31977c478bd9Sstevel@tonic-gate if (np->clientid == clientid || np->clientid == 0) 31987c478bd9Sstevel@tonic-gate NFS4_DEBUG(nfs4_server_t_debug, (CE_CONT, 31997c478bd9Sstevel@tonic-gate " - clientid 
matches")); 32007c478bd9Sstevel@tonic-gate if (np->s_thread_exit != NFS4_THREAD_EXIT) 32017c478bd9Sstevel@tonic-gate NFS4_DEBUG(nfs4_server_t_debug, (CE_CONT, 32027c478bd9Sstevel@tonic-gate " - thread not exiting")); 32037c478bd9Sstevel@tonic-gate } 32047c478bd9Sstevel@tonic-gate delay(hz); 32057c478bd9Sstevel@tonic-gate } 32067c478bd9Sstevel@tonic-gate #endif 32077c478bd9Sstevel@tonic-gate #endif 32087c478bd9Sstevel@tonic-gate 32097c478bd9Sstevel@tonic-gate 32107c478bd9Sstevel@tonic-gate /* 32117c478bd9Sstevel@tonic-gate * Move a mntinfo4_t from one server list to another. 32127c478bd9Sstevel@tonic-gate * Locking of the two nfs4_server_t nodes will be done in list order. 32137c478bd9Sstevel@tonic-gate * 32147c478bd9Sstevel@tonic-gate * Returns NULL if the current nfs4_server_t for the filesystem could not 32157c478bd9Sstevel@tonic-gate * be found (e.g., due to forced unmount). Otherwise returns a reference 32167c478bd9Sstevel@tonic-gate * to the new nfs4_server_t, which must eventually be freed. 
32177c478bd9Sstevel@tonic-gate */ 32187c478bd9Sstevel@tonic-gate nfs4_server_t * 32197c478bd9Sstevel@tonic-gate nfs4_move_mi(mntinfo4_t *mi, servinfo4_t *old, servinfo4_t *new) 32207c478bd9Sstevel@tonic-gate { 32217c478bd9Sstevel@tonic-gate nfs4_server_t *p, *op = NULL, *np = NULL; 32227c478bd9Sstevel@tonic-gate int num_open; 3223*108322fbScarlsonj zoneid_t zoneid = nfs_zoneid(); 32247c478bd9Sstevel@tonic-gate 3225*108322fbScarlsonj ASSERT(nfs_zone() == mi->mi_zone); 32267c478bd9Sstevel@tonic-gate 32277c478bd9Sstevel@tonic-gate mutex_enter(&nfs4_server_lst_lock); 32287c478bd9Sstevel@tonic-gate #ifdef DEBUG 32297c478bd9Sstevel@tonic-gate if (nfs4_server_t_debug) 32307c478bd9Sstevel@tonic-gate dumpnfs4slist("nfs4_move_mi", mi, (clientid4)0, new); 32317c478bd9Sstevel@tonic-gate #endif 32327c478bd9Sstevel@tonic-gate for (p = nfs4_server_lst.forw; p != &nfs4_server_lst; p = p->forw) { 32337c478bd9Sstevel@tonic-gate if (p->zoneid != zoneid) 32347c478bd9Sstevel@tonic-gate continue; 32357c478bd9Sstevel@tonic-gate if (p->saddr.len == old->sv_addr.len && 32367c478bd9Sstevel@tonic-gate bcmp(p->saddr.buf, old->sv_addr.buf, p->saddr.len) == 0 && 32377c478bd9Sstevel@tonic-gate p->s_thread_exit != NFS4_THREAD_EXIT) { 32387c478bd9Sstevel@tonic-gate op = p; 32397c478bd9Sstevel@tonic-gate mutex_enter(&op->s_lock); 32407c478bd9Sstevel@tonic-gate op->s_refcnt++; 32417c478bd9Sstevel@tonic-gate } 32427c478bd9Sstevel@tonic-gate if (p->saddr.len == new->sv_addr.len && 32437c478bd9Sstevel@tonic-gate bcmp(p->saddr.buf, new->sv_addr.buf, p->saddr.len) == 0 && 32447c478bd9Sstevel@tonic-gate p->s_thread_exit != NFS4_THREAD_EXIT) { 32457c478bd9Sstevel@tonic-gate np = p; 32467c478bd9Sstevel@tonic-gate mutex_enter(&np->s_lock); 32477c478bd9Sstevel@tonic-gate } 32487c478bd9Sstevel@tonic-gate if (op != NULL && np != NULL) 32497c478bd9Sstevel@tonic-gate break; 32507c478bd9Sstevel@tonic-gate } 32517c478bd9Sstevel@tonic-gate if (op == NULL) { 32527c478bd9Sstevel@tonic-gate /* 
32537c478bd9Sstevel@tonic-gate * Filesystem has been forcibly unmounted. Bail out. 32547c478bd9Sstevel@tonic-gate */ 32557c478bd9Sstevel@tonic-gate if (np != NULL) 32567c478bd9Sstevel@tonic-gate mutex_exit(&np->s_lock); 32577c478bd9Sstevel@tonic-gate mutex_exit(&nfs4_server_lst_lock); 32587c478bd9Sstevel@tonic-gate return (NULL); 32597c478bd9Sstevel@tonic-gate } 32607c478bd9Sstevel@tonic-gate if (np != NULL) { 32617c478bd9Sstevel@tonic-gate np->s_refcnt++; 32627c478bd9Sstevel@tonic-gate } else { 32637c478bd9Sstevel@tonic-gate #ifdef DEBUG 32647c478bd9Sstevel@tonic-gate NFS4_DEBUG(nfs4_client_failover_debug, (CE_NOTE, 32657c478bd9Sstevel@tonic-gate "nfs4_move_mi: no target nfs4_server, will create.")); 32667c478bd9Sstevel@tonic-gate #endif 32677c478bd9Sstevel@tonic-gate np = add_new_nfs4_server(new, kcred); 32687c478bd9Sstevel@tonic-gate } 32697c478bd9Sstevel@tonic-gate mutex_exit(&nfs4_server_lst_lock); 32707c478bd9Sstevel@tonic-gate 32717c478bd9Sstevel@tonic-gate NFS4_DEBUG(nfs4_client_failover_debug, (CE_NOTE, 32727c478bd9Sstevel@tonic-gate "nfs4_move_mi: for mi 0x%p, " 32737c478bd9Sstevel@tonic-gate "old servinfo4 0x%p, new servinfo4 0x%p, " 32747c478bd9Sstevel@tonic-gate "old nfs4_server 0x%p, new nfs4_server 0x%p, ", 32757c478bd9Sstevel@tonic-gate (void*)mi, (void*)old, (void*)new, 32767c478bd9Sstevel@tonic-gate (void*)op, (void*)np)); 32777c478bd9Sstevel@tonic-gate ASSERT(op != NULL && np != NULL); 32787c478bd9Sstevel@tonic-gate 32797c478bd9Sstevel@tonic-gate /* discard any delegations */ 32807c478bd9Sstevel@tonic-gate nfs4_deleg_discard(mi, op); 32817c478bd9Sstevel@tonic-gate 32827c478bd9Sstevel@tonic-gate num_open = mi->mi_open_files; 32837c478bd9Sstevel@tonic-gate mi->mi_open_files = 0; 32847c478bd9Sstevel@tonic-gate op->state_ref_count -= num_open; 32857c478bd9Sstevel@tonic-gate ASSERT(op->state_ref_count >= 0); 32867c478bd9Sstevel@tonic-gate np->state_ref_count += num_open; 32877c478bd9Sstevel@tonic-gate nfs4_remove_mi_from_server_nolock(mi, op); 
32887c478bd9Sstevel@tonic-gate mi->mi_open_files = num_open; 32897c478bd9Sstevel@tonic-gate NFS4_DEBUG(nfs4_client_failover_debug, (CE_NOTE, 32907c478bd9Sstevel@tonic-gate "nfs4_move_mi: mi_open_files %d, op->cnt %d, np->cnt %d", 32917c478bd9Sstevel@tonic-gate mi->mi_open_files, op->state_ref_count, np->state_ref_count)); 32927c478bd9Sstevel@tonic-gate 32937c478bd9Sstevel@tonic-gate nfs4_add_mi_to_server(np, mi); 32947c478bd9Sstevel@tonic-gate 32957c478bd9Sstevel@tonic-gate mutex_exit(&op->s_lock); 32967c478bd9Sstevel@tonic-gate nfs4_server_rele(op); 32977c478bd9Sstevel@tonic-gate mutex_exit(&np->s_lock); 32987c478bd9Sstevel@tonic-gate 32997c478bd9Sstevel@tonic-gate return (np); 33007c478bd9Sstevel@tonic-gate } 33017c478bd9Sstevel@tonic-gate 33027c478bd9Sstevel@tonic-gate /* 33037c478bd9Sstevel@tonic-gate * Search the nfs4_server list to find a match on this servinfo4 33047c478bd9Sstevel@tonic-gate * based on its address. 33057c478bd9Sstevel@tonic-gate * 33067c478bd9Sstevel@tonic-gate * Returns NULL if no match is found. Otherwise returns a reference (which 33077c478bd9Sstevel@tonic-gate * must eventually be freed) to a locked nfs4_server. 
33087c478bd9Sstevel@tonic-gate */ 33097c478bd9Sstevel@tonic-gate nfs4_server_t * 33107c478bd9Sstevel@tonic-gate servinfo4_to_nfs4_server(servinfo4_t *srv_p) 33117c478bd9Sstevel@tonic-gate { 33127c478bd9Sstevel@tonic-gate nfs4_server_t *np; 3313*108322fbScarlsonj zoneid_t zoneid = nfs_zoneid(); 33147c478bd9Sstevel@tonic-gate 33157c478bd9Sstevel@tonic-gate mutex_enter(&nfs4_server_lst_lock); 33167c478bd9Sstevel@tonic-gate for (np = nfs4_server_lst.forw; np != &nfs4_server_lst; np = np->forw) { 33177c478bd9Sstevel@tonic-gate if (np->zoneid == zoneid && 33187c478bd9Sstevel@tonic-gate np->saddr.len == srv_p->sv_addr.len && 33197c478bd9Sstevel@tonic-gate bcmp(np->saddr.buf, srv_p->sv_addr.buf, 33207c478bd9Sstevel@tonic-gate np->saddr.len) == 0 && 33217c478bd9Sstevel@tonic-gate np->s_thread_exit != NFS4_THREAD_EXIT) { 33227c478bd9Sstevel@tonic-gate mutex_enter(&np->s_lock); 33237c478bd9Sstevel@tonic-gate np->s_refcnt++; 33247c478bd9Sstevel@tonic-gate mutex_exit(&nfs4_server_lst_lock); 33257c478bd9Sstevel@tonic-gate return (np); 33267c478bd9Sstevel@tonic-gate } 33277c478bd9Sstevel@tonic-gate } 33287c478bd9Sstevel@tonic-gate mutex_exit(&nfs4_server_lst_lock); 33297c478bd9Sstevel@tonic-gate return (NULL); 33307c478bd9Sstevel@tonic-gate } 33317c478bd9Sstevel@tonic-gate 33327c478bd9Sstevel@tonic-gate /* 33337c478bd9Sstevel@tonic-gate * Search the nfs4_server_lst to find a match based on clientid and 33347c478bd9Sstevel@tonic-gate * addr. 33357c478bd9Sstevel@tonic-gate * Locks the nfs4_server down if it is found and returns a reference that 33367c478bd9Sstevel@tonic-gate * must eventually be freed. 33377c478bd9Sstevel@tonic-gate * 33387c478bd9Sstevel@tonic-gate * Returns NULL it no match is found. This means one of two things: either 33397c478bd9Sstevel@tonic-gate * mi is in the process of being mounted, or mi has been unmounted. 
33407c478bd9Sstevel@tonic-gate * 33417c478bd9Sstevel@tonic-gate * The caller should be holding mi->mi_recovlock, and it should continue to 33427c478bd9Sstevel@tonic-gate * hold the lock until done with the returned nfs4_server_t. Once 33437c478bd9Sstevel@tonic-gate * mi->mi_recovlock is released, there is no guarantee that the returned 33447c478bd9Sstevel@tonic-gate * mi->nfs4_server_t will continue to correspond to mi. 33457c478bd9Sstevel@tonic-gate */ 33467c478bd9Sstevel@tonic-gate nfs4_server_t * 33477c478bd9Sstevel@tonic-gate find_nfs4_server(mntinfo4_t *mi) 33487c478bd9Sstevel@tonic-gate { 33497c478bd9Sstevel@tonic-gate return (find_nfs4_server_all(mi, 0)); 33507c478bd9Sstevel@tonic-gate } 33517c478bd9Sstevel@tonic-gate 33527c478bd9Sstevel@tonic-gate /* 33537c478bd9Sstevel@tonic-gate * Same as above, but takes an "all" parameter which can be 33547c478bd9Sstevel@tonic-gate * set to 1 if the caller wishes to find nfs4_server_t's which 33557c478bd9Sstevel@tonic-gate * have been marked for termination by the exit of the renew 33567c478bd9Sstevel@tonic-gate * thread. This should only be used by operations which are 33577c478bd9Sstevel@tonic-gate * cleaning up and will not cause an OTW op. 
33587c478bd9Sstevel@tonic-gate */ 33597c478bd9Sstevel@tonic-gate nfs4_server_t * 33607c478bd9Sstevel@tonic-gate find_nfs4_server_all(mntinfo4_t *mi, int all) 33617c478bd9Sstevel@tonic-gate { 33627c478bd9Sstevel@tonic-gate nfs4_server_t *np; 33637c478bd9Sstevel@tonic-gate servinfo4_t *svp; 33647c478bd9Sstevel@tonic-gate zoneid_t zoneid = mi->mi_zone->zone_id; 33657c478bd9Sstevel@tonic-gate 33667c478bd9Sstevel@tonic-gate ASSERT(nfs_rw_lock_held(&mi->mi_recovlock, RW_READER) || 33677c478bd9Sstevel@tonic-gate nfs_rw_lock_held(&mi->mi_recovlock, RW_WRITER)); 33687c478bd9Sstevel@tonic-gate /* 33697c478bd9Sstevel@tonic-gate * This can be called from nfs4_unmount() which can be called from the 33707c478bd9Sstevel@tonic-gate * global zone, hence it's legal for the global zone to muck with 33717c478bd9Sstevel@tonic-gate * another zone's server list, as long as it doesn't try to contact 33727c478bd9Sstevel@tonic-gate * them. 33737c478bd9Sstevel@tonic-gate */ 3374*108322fbScarlsonj ASSERT(zoneid == getzoneid() || getzoneid() == GLOBAL_ZONEID || 3375*108322fbScarlsonj nfs_global_client_only != 0); 33767c478bd9Sstevel@tonic-gate 33777c478bd9Sstevel@tonic-gate /* 33787c478bd9Sstevel@tonic-gate * The nfs4_server_lst_lock global lock is held when we get a new 33797c478bd9Sstevel@tonic-gate * clientid (via SETCLIENTID OTW). Holding this global lock and 33807c478bd9Sstevel@tonic-gate * mi_recovlock (READER is fine) ensures that the nfs4_server 33817c478bd9Sstevel@tonic-gate * and this mntinfo4 can't get out of sync, so the following search is 33827c478bd9Sstevel@tonic-gate * always valid. 
33837c478bd9Sstevel@tonic-gate */ 33847c478bd9Sstevel@tonic-gate mutex_enter(&nfs4_server_lst_lock); 33857c478bd9Sstevel@tonic-gate #ifdef DEBUG 33867c478bd9Sstevel@tonic-gate if (nfs4_server_t_debug) { 33877c478bd9Sstevel@tonic-gate /* mi->mi_clientid is unprotected, ok for debug output */ 33887c478bd9Sstevel@tonic-gate dumpnfs4slist("find_nfs4_server", mi, mi->mi_clientid, 33897c478bd9Sstevel@tonic-gate mi->mi_curr_serv); 33907c478bd9Sstevel@tonic-gate } 33917c478bd9Sstevel@tonic-gate #endif 33927c478bd9Sstevel@tonic-gate for (np = nfs4_server_lst.forw; np != &nfs4_server_lst; np = np->forw) { 33937c478bd9Sstevel@tonic-gate mutex_enter(&np->s_lock); 33947c478bd9Sstevel@tonic-gate svp = mi->mi_curr_serv; 33957c478bd9Sstevel@tonic-gate 33967c478bd9Sstevel@tonic-gate if (np->zoneid == zoneid && 33977c478bd9Sstevel@tonic-gate np->clientid == mi->mi_clientid && 33987c478bd9Sstevel@tonic-gate np->saddr.len == svp->sv_addr.len && 33997c478bd9Sstevel@tonic-gate bcmp(np->saddr.buf, svp->sv_addr.buf, np->saddr.len) == 0 && 34007c478bd9Sstevel@tonic-gate (np->s_thread_exit != NFS4_THREAD_EXIT || all != 0)) { 34017c478bd9Sstevel@tonic-gate mutex_exit(&nfs4_server_lst_lock); 34027c478bd9Sstevel@tonic-gate np->s_refcnt++; 34037c478bd9Sstevel@tonic-gate return (np); 34047c478bd9Sstevel@tonic-gate } 34057c478bd9Sstevel@tonic-gate mutex_exit(&np->s_lock); 34067c478bd9Sstevel@tonic-gate } 34077c478bd9Sstevel@tonic-gate mutex_exit(&nfs4_server_lst_lock); 34087c478bd9Sstevel@tonic-gate 34097c478bd9Sstevel@tonic-gate return (NULL); 34107c478bd9Sstevel@tonic-gate } 34117c478bd9Sstevel@tonic-gate 34127c478bd9Sstevel@tonic-gate /* 34137c478bd9Sstevel@tonic-gate * Release the reference to sp and destroy it if that's the last one. 
34147c478bd9Sstevel@tonic-gate */ 34157c478bd9Sstevel@tonic-gate 34167c478bd9Sstevel@tonic-gate void 34177c478bd9Sstevel@tonic-gate nfs4_server_rele(nfs4_server_t *sp) 34187c478bd9Sstevel@tonic-gate { 34197c478bd9Sstevel@tonic-gate mutex_enter(&sp->s_lock); 34207c478bd9Sstevel@tonic-gate ASSERT(sp->s_refcnt > 0); 34217c478bd9Sstevel@tonic-gate sp->s_refcnt--; 34227c478bd9Sstevel@tonic-gate if (sp->s_refcnt > 0) { 34237c478bd9Sstevel@tonic-gate mutex_exit(&sp->s_lock); 34247c478bd9Sstevel@tonic-gate return; 34257c478bd9Sstevel@tonic-gate } 34267c478bd9Sstevel@tonic-gate if (!(sp->s_flags & N4S_INSERTED)) { 34277c478bd9Sstevel@tonic-gate destroy_nfs4_server(sp); 34287c478bd9Sstevel@tonic-gate return; 34297c478bd9Sstevel@tonic-gate } 34307c478bd9Sstevel@tonic-gate mutex_exit(&sp->s_lock); 34317c478bd9Sstevel@tonic-gate mutex_enter(&nfs4_server_lst_lock); 34327c478bd9Sstevel@tonic-gate mutex_enter(&sp->s_lock); 34337c478bd9Sstevel@tonic-gate if (sp->s_refcnt > 0) { 34347c478bd9Sstevel@tonic-gate mutex_exit(&sp->s_lock); 34357c478bd9Sstevel@tonic-gate mutex_exit(&nfs4_server_lst_lock); 34367c478bd9Sstevel@tonic-gate return; 34377c478bd9Sstevel@tonic-gate } 34387c478bd9Sstevel@tonic-gate if (sp->s_flags & N4S_INSERTED) { 34397c478bd9Sstevel@tonic-gate remque(sp); 34407c478bd9Sstevel@tonic-gate sp->forw = sp->back = NULL; 34417c478bd9Sstevel@tonic-gate sp->s_flags &= ~N4S_INSERTED; 34427c478bd9Sstevel@tonic-gate } 34437c478bd9Sstevel@tonic-gate mutex_exit(&nfs4_server_lst_lock); 34447c478bd9Sstevel@tonic-gate destroy_nfs4_server(sp); 34457c478bd9Sstevel@tonic-gate } 34467c478bd9Sstevel@tonic-gate 34477c478bd9Sstevel@tonic-gate static void 34487c478bd9Sstevel@tonic-gate destroy_nfs4_server(nfs4_server_t *sp) 34497c478bd9Sstevel@tonic-gate { 34507c478bd9Sstevel@tonic-gate ASSERT(MUTEX_HELD(&sp->s_lock)); 34517c478bd9Sstevel@tonic-gate ASSERT(!(sp->s_flags & N4S_INSERTED)); 34527c478bd9Sstevel@tonic-gate ASSERT(sp->s_refcnt == 0); 34537c478bd9Sstevel@tonic-gate 
ASSERT(sp->s_otw_call_count == 0); 34547c478bd9Sstevel@tonic-gate 34557c478bd9Sstevel@tonic-gate remove_all_mi(sp); 34567c478bd9Sstevel@tonic-gate 34577c478bd9Sstevel@tonic-gate crfree(sp->s_cred); 34587c478bd9Sstevel@tonic-gate kmem_free(sp->saddr.buf, sp->saddr.maxlen); 34597c478bd9Sstevel@tonic-gate kmem_free(sp->clidtosend.id_val, sp->clidtosend.id_len); 34607c478bd9Sstevel@tonic-gate mutex_exit(&sp->s_lock); 34617c478bd9Sstevel@tonic-gate 34627c478bd9Sstevel@tonic-gate /* destroy the nfs4_server */ 34637c478bd9Sstevel@tonic-gate nfs4callback_destroy(sp); 34647c478bd9Sstevel@tonic-gate list_destroy(&sp->s_deleg_list); 34657c478bd9Sstevel@tonic-gate mutex_destroy(&sp->s_lock); 34667c478bd9Sstevel@tonic-gate cv_destroy(&sp->cv_thread_exit); 34677c478bd9Sstevel@tonic-gate cv_destroy(&sp->s_cv_otw_count); 34687c478bd9Sstevel@tonic-gate cv_destroy(&sp->wait_cb_null); 34697c478bd9Sstevel@tonic-gate nfs_rw_destroy(&sp->s_recovlock); 34707c478bd9Sstevel@tonic-gate kmem_free(sp, sizeof (*sp)); 34717c478bd9Sstevel@tonic-gate } 34727c478bd9Sstevel@tonic-gate 34737c478bd9Sstevel@tonic-gate /* 34747c478bd9Sstevel@tonic-gate * Lock sp, but only if it's still active (in the list and hasn't been 34757c478bd9Sstevel@tonic-gate * flagged as exiting) or 'all' is non-zero. 34767c478bd9Sstevel@tonic-gate * Returns TRUE if sp got locked and adds a reference to sp. 
34777c478bd9Sstevel@tonic-gate */ 34787c478bd9Sstevel@tonic-gate bool_t 34797c478bd9Sstevel@tonic-gate nfs4_server_vlock(nfs4_server_t *sp, int all) 34807c478bd9Sstevel@tonic-gate { 34817c478bd9Sstevel@tonic-gate nfs4_server_t *np; 34827c478bd9Sstevel@tonic-gate 34837c478bd9Sstevel@tonic-gate mutex_enter(&nfs4_server_lst_lock); 34847c478bd9Sstevel@tonic-gate for (np = nfs4_server_lst.forw; np != &nfs4_server_lst; np = np->forw) { 34857c478bd9Sstevel@tonic-gate if (sp == np && (np->s_thread_exit != NFS4_THREAD_EXIT || 34867c478bd9Sstevel@tonic-gate all != 0)) { 34877c478bd9Sstevel@tonic-gate mutex_enter(&np->s_lock); 34887c478bd9Sstevel@tonic-gate np->s_refcnt++; 34897c478bd9Sstevel@tonic-gate mutex_exit(&nfs4_server_lst_lock); 34907c478bd9Sstevel@tonic-gate return (TRUE); 34917c478bd9Sstevel@tonic-gate } 34927c478bd9Sstevel@tonic-gate } 34937c478bd9Sstevel@tonic-gate mutex_exit(&nfs4_server_lst_lock); 34947c478bd9Sstevel@tonic-gate return (FALSE); 34957c478bd9Sstevel@tonic-gate } 34967c478bd9Sstevel@tonic-gate 34977c478bd9Sstevel@tonic-gate /* 34987c478bd9Sstevel@tonic-gate * Fork off a thread to free the data structures for a mount. 
34997c478bd9Sstevel@tonic-gate */ 35007c478bd9Sstevel@tonic-gate 35017c478bd9Sstevel@tonic-gate static void 35027c478bd9Sstevel@tonic-gate async_free_mount(vfs_t *vfsp, cred_t *cr) 35037c478bd9Sstevel@tonic-gate { 35047c478bd9Sstevel@tonic-gate freemountargs_t *args; 35057c478bd9Sstevel@tonic-gate 35067c478bd9Sstevel@tonic-gate args = kmem_alloc(sizeof (freemountargs_t), KM_SLEEP); 35077c478bd9Sstevel@tonic-gate args->fm_vfsp = vfsp; 35087c478bd9Sstevel@tonic-gate VFS_HOLD(vfsp); 35097c478bd9Sstevel@tonic-gate args->fm_cr = cr; 35107c478bd9Sstevel@tonic-gate crhold(cr); 35117c478bd9Sstevel@tonic-gate 35127c478bd9Sstevel@tonic-gate (void) zthread_create(NULL, 0, nfs4_free_mount_thread, args, 0, 35137c478bd9Sstevel@tonic-gate minclsyspri); 35147c478bd9Sstevel@tonic-gate } 35157c478bd9Sstevel@tonic-gate 35167c478bd9Sstevel@tonic-gate static void 35177c478bd9Sstevel@tonic-gate nfs4_free_mount_thread(freemountargs_t *args) 35187c478bd9Sstevel@tonic-gate { 35197c478bd9Sstevel@tonic-gate nfs4_free_mount(args->fm_vfsp, args->fm_cr); 35207c478bd9Sstevel@tonic-gate VFS_RELE(args->fm_vfsp); 35217c478bd9Sstevel@tonic-gate crfree(args->fm_cr); 35227c478bd9Sstevel@tonic-gate kmem_free(args, sizeof (freemountargs_t)); 35237c478bd9Sstevel@tonic-gate zthread_exit(); 35247c478bd9Sstevel@tonic-gate /* NOTREACHED */ 35257c478bd9Sstevel@tonic-gate } 35267c478bd9Sstevel@tonic-gate 35277c478bd9Sstevel@tonic-gate /* 35287c478bd9Sstevel@tonic-gate * Thread to free the data structures for a given filesystem. 
35297c478bd9Sstevel@tonic-gate */ 35307c478bd9Sstevel@tonic-gate static void 35317c478bd9Sstevel@tonic-gate nfs4_free_mount(vfs_t *vfsp, cred_t *cr) 35327c478bd9Sstevel@tonic-gate { 35337c478bd9Sstevel@tonic-gate mntinfo4_t *mi = VFTOMI4(vfsp); 35347c478bd9Sstevel@tonic-gate nfs4_server_t *sp; 35357c478bd9Sstevel@tonic-gate callb_cpr_t cpr_info; 35367c478bd9Sstevel@tonic-gate kmutex_t cpr_lock; 35377c478bd9Sstevel@tonic-gate boolean_t async_thread; 35387c478bd9Sstevel@tonic-gate 35397c478bd9Sstevel@tonic-gate /* 35407c478bd9Sstevel@tonic-gate * We need to participate in the CPR framework if this is a kernel 35417c478bd9Sstevel@tonic-gate * thread. 35427c478bd9Sstevel@tonic-gate */ 3543*108322fbScarlsonj async_thread = (curproc == nfs_zone()->zone_zsched); 35447c478bd9Sstevel@tonic-gate if (async_thread) { 35457c478bd9Sstevel@tonic-gate mutex_init(&cpr_lock, NULL, MUTEX_DEFAULT, NULL); 35467c478bd9Sstevel@tonic-gate CALLB_CPR_INIT(&cpr_info, &cpr_lock, callb_generic_cpr, 35477c478bd9Sstevel@tonic-gate "nfsv4AsyncUnmount"); 35487c478bd9Sstevel@tonic-gate } 35497c478bd9Sstevel@tonic-gate 35507c478bd9Sstevel@tonic-gate /* 35517c478bd9Sstevel@tonic-gate * We need to wait for all outstanding OTW calls 35527c478bd9Sstevel@tonic-gate * and recovery to finish before we remove the mi 35537c478bd9Sstevel@tonic-gate * from the nfs4_server_t, as current pending 35547c478bd9Sstevel@tonic-gate * calls might still need this linkage (in order 35557c478bd9Sstevel@tonic-gate * to find a nfs4_server_t from a mntinfo4_t). 
35567c478bd9Sstevel@tonic-gate */ 35577c478bd9Sstevel@tonic-gate (void) nfs_rw_enter_sig(&mi->mi_recovlock, RW_READER, FALSE); 35587c478bd9Sstevel@tonic-gate sp = find_nfs4_server(mi); 35597c478bd9Sstevel@tonic-gate nfs_rw_exit(&mi->mi_recovlock); 35607c478bd9Sstevel@tonic-gate 35617c478bd9Sstevel@tonic-gate if (sp) { 35627c478bd9Sstevel@tonic-gate while (sp->s_otw_call_count != 0) { 35637c478bd9Sstevel@tonic-gate if (async_thread) { 35647c478bd9Sstevel@tonic-gate mutex_enter(&cpr_lock); 35657c478bd9Sstevel@tonic-gate CALLB_CPR_SAFE_BEGIN(&cpr_info); 35667c478bd9Sstevel@tonic-gate mutex_exit(&cpr_lock); 35677c478bd9Sstevel@tonic-gate } 35687c478bd9Sstevel@tonic-gate cv_wait(&sp->s_cv_otw_count, &sp->s_lock); 35697c478bd9Sstevel@tonic-gate if (async_thread) { 35707c478bd9Sstevel@tonic-gate mutex_enter(&cpr_lock); 35717c478bd9Sstevel@tonic-gate CALLB_CPR_SAFE_END(&cpr_info, &cpr_lock); 35727c478bd9Sstevel@tonic-gate mutex_exit(&cpr_lock); 35737c478bd9Sstevel@tonic-gate } 35747c478bd9Sstevel@tonic-gate } 35757c478bd9Sstevel@tonic-gate mutex_exit(&sp->s_lock); 35767c478bd9Sstevel@tonic-gate nfs4_server_rele(sp); 35777c478bd9Sstevel@tonic-gate sp = NULL; 35787c478bd9Sstevel@tonic-gate } 35797c478bd9Sstevel@tonic-gate 35807c478bd9Sstevel@tonic-gate 35817c478bd9Sstevel@tonic-gate mutex_enter(&mi->mi_lock); 35827c478bd9Sstevel@tonic-gate while (mi->mi_in_recovery != 0) { 35837c478bd9Sstevel@tonic-gate if (async_thread) { 35847c478bd9Sstevel@tonic-gate mutex_enter(&cpr_lock); 35857c478bd9Sstevel@tonic-gate CALLB_CPR_SAFE_BEGIN(&cpr_info); 35867c478bd9Sstevel@tonic-gate mutex_exit(&cpr_lock); 35877c478bd9Sstevel@tonic-gate } 35887c478bd9Sstevel@tonic-gate cv_wait(&mi->mi_cv_in_recov, &mi->mi_lock); 35897c478bd9Sstevel@tonic-gate if (async_thread) { 35907c478bd9Sstevel@tonic-gate mutex_enter(&cpr_lock); 35917c478bd9Sstevel@tonic-gate CALLB_CPR_SAFE_END(&cpr_info, &cpr_lock); 35927c478bd9Sstevel@tonic-gate mutex_exit(&cpr_lock); 35937c478bd9Sstevel@tonic-gate } 
35947c478bd9Sstevel@tonic-gate } 35957c478bd9Sstevel@tonic-gate mutex_exit(&mi->mi_lock); 35967c478bd9Sstevel@tonic-gate 35977c478bd9Sstevel@tonic-gate /* 35987c478bd9Sstevel@tonic-gate * The original purge of the dnlc via 'dounmount' 35997c478bd9Sstevel@tonic-gate * doesn't guarantee that another dnlc entry was not 36007c478bd9Sstevel@tonic-gate * added while we waitied for all outstanding OTW 36017c478bd9Sstevel@tonic-gate * and recovery calls to finish. So re-purge the 36027c478bd9Sstevel@tonic-gate * dnlc now. 36037c478bd9Sstevel@tonic-gate */ 36047c478bd9Sstevel@tonic-gate (void) dnlc_purge_vfsp(vfsp, 0); 36057c478bd9Sstevel@tonic-gate 36067c478bd9Sstevel@tonic-gate /* 36077c478bd9Sstevel@tonic-gate * We need to explicitly stop the manager thread; the asyc worker 36087c478bd9Sstevel@tonic-gate * threads can timeout and exit on their own. 36097c478bd9Sstevel@tonic-gate */ 36107c478bd9Sstevel@tonic-gate nfs4_async_manager_stop(vfsp); 36117c478bd9Sstevel@tonic-gate 36127c478bd9Sstevel@tonic-gate destroy_rtable4(vfsp, cr); 36137c478bd9Sstevel@tonic-gate 36147c478bd9Sstevel@tonic-gate nfs4_remove_mi_from_server(mi, NULL); 36157c478bd9Sstevel@tonic-gate 36167c478bd9Sstevel@tonic-gate if (mi->mi_io_kstats) { 36177c478bd9Sstevel@tonic-gate kstat_delete(mi->mi_io_kstats); 36187c478bd9Sstevel@tonic-gate mi->mi_io_kstats = NULL; 36197c478bd9Sstevel@tonic-gate } 36207c478bd9Sstevel@tonic-gate if (mi->mi_ro_kstats) { 36217c478bd9Sstevel@tonic-gate kstat_delete(mi->mi_ro_kstats); 36227c478bd9Sstevel@tonic-gate mi->mi_ro_kstats = NULL; 36237c478bd9Sstevel@tonic-gate } 36247c478bd9Sstevel@tonic-gate if (mi->mi_recov_ksp) { 36257c478bd9Sstevel@tonic-gate kstat_delete(mi->mi_recov_ksp); 36267c478bd9Sstevel@tonic-gate mi->mi_recov_ksp = NULL; 36277c478bd9Sstevel@tonic-gate } 36287c478bd9Sstevel@tonic-gate 36297c478bd9Sstevel@tonic-gate if (async_thread) { 36307c478bd9Sstevel@tonic-gate mutex_enter(&cpr_lock); 36317c478bd9Sstevel@tonic-gate CALLB_CPR_EXIT(&cpr_info); /* drops 
cpr_lock */ 36327c478bd9Sstevel@tonic-gate mutex_destroy(&cpr_lock); 36337c478bd9Sstevel@tonic-gate } 36347c478bd9Sstevel@tonic-gate } 3635