/*
 * Copyright (c) 2000-2001 Boris Popov
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 * 3. All advertising materials mentioning features or use of this software
 *    must display the following acknowledgement:
 *    This product includes software developed by Boris Popov.
 * 4. Neither the name of the author nor the names of any co-contributors
 *    may be used to endorse or promote products derived from this software
 *    without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 *
 * $Id: smbfs_vnops.c,v 1.128.36.1 2005/05/27 02:35:28 lindak Exp $
 */

/*
 * Copyright (c) 2008, 2010, Oracle and/or its affiliates. All rights reserved.
 * Copyright 2021 Tintri by DDN, Inc.  All rights reserved.
 */

/*
 * Vnode operations
 *
 * This file is similar to nfs3_vnops.c
 */

#include <sys/param.h>
#include <sys/systm.h>
#include <sys/cred.h>
#include <sys/vnode.h>
#include <sys/vfs.h>
#include <sys/filio.h>
#include <sys/uio.h>
#include <sys/dirent.h>
#include <sys/errno.h>
#include <sys/sunddi.h>
#include <sys/sysmacros.h>
#include <sys/kmem.h>
#include <sys/cmn_err.h>
#include <sys/vfs_opreg.h>
#include <sys/policy.h>
#include <sys/sdt.h>
#include <sys/taskq_impl.h>
#include <sys/zone.h>

#ifdef	_KERNEL
#include <sys/vmsystm.h>	// for desfree
#include <vm/hat.h>
#include <vm/as.h>
#include <vm/page.h>
#include <vm/pvn.h>
#include <vm/seg.h>
#include <vm/seg_map.h>
#include <vm/seg_kpm.h>
#include <vm/seg_vn.h>
#endif	// _KERNEL

#include <netsmb/smb_osdep.h>
#include <netsmb/smb.h>
#include <netsmb/smb_conn.h>
#include <netsmb/smb_subr.h>

#include <smbfs/smbfs.h>
#include <smbfs/smbfs_node.h>
#include <smbfs/smbfs_subr.h>

#include <sys/fs/smbfs_ioctl.h>
#include <fs/fs_subr.h>

#ifndef	MAXOFF32_T
#define	MAXOFF32_T	0x7fffffff
#endif

/*
 * We assign directory offsets like the NFS client, where the
 * offset increments by _one_ after each directory entry.
 * Further, the entries "." and ".." are always at offsets
 * zero and one (respectively) and the "real" entries from
 * the server appear at offsets starting with two.  This
 * macro is used to initialize the n_dirofs field after
 * setting n_dirseq with a _findopen call.
 */
#define	FIRST_DIROFS	2
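/*
 * For example, after a fresh _findopen a reader of this
 * directory sees:
 *	offset 0: "."
 *	offset 1: ".."
 *	offset 2: first entry returned by the server
 */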

/*
 * These characters are illegal in NTFS file names.
 * ref: http://support.microsoft.com/kb/147438
 *
 * Careful!  The check in the XATTR case skips the
 * first character to allow colon in XATTR names.
 */
static const char illegal_chars[] = {
	':',	/* colon - keep this first! */
	'\\',	/* back slash */
	'/',	/* slash */
	'*',	/* asterisk */
	'?',	/* question mark */
	'"',	/* double quote */
	'<',	/* less than sign */
	'>',	/* greater than sign */
	'|',	/* vertical bar */
	0
};
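/*
 * Illustrative sketch (not the actual call sites): a name
 * check along these lines would skip the leading ':' when
 * validating XATTR names:
 *
 *	const char *ic = xattr ? illegal_chars + 1 : illegal_chars;
 *	if (strpbrk(name, ic) != NULL)
 *		return (EINVAL);
 */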

/*
 * Turning this on causes nodes to be created in the cache
 * during directory listings, normally avoiding a second
 * OtW attribute fetch just after a readdir.
 */
int smbfs_fastlookup = 1;
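/* (left as a global so it can be tuned, e.g. patched with mdb -kw) */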

struct vnodeops *smbfs_vnodeops = NULL;

/* local static function defines */

static int	smbfslookup_cache(vnode_t *, char *, int, vnode_t **,
			cred_t *);
static int	smbfslookup(vnode_t *dvp, char *nm, vnode_t **vpp, cred_t *cr,
			int cache_ok, caller_context_t *);
static int	smbfsremove(vnode_t *dvp, vnode_t *vp, struct smb_cred *scred,
			int flags);
static int	smbfsrename(vnode_t *odvp, vnode_t *ovp, vnode_t *ndvp,
			char *nnm, struct smb_cred *scred, int flags);
static int	smbfssetattr(vnode_t *, struct vattr *, int, cred_t *);
static int	smbfs_accessx(void *, int, cred_t *);
static int	smbfs_readvdir(vnode_t *vp, uio_t *uio, cred_t *cr, int *eofp,
			caller_context_t *);
static int	smbfsflush(smbnode_t *, struct smb_cred *);
static void	smbfs_rele_fid(smbnode_t *, struct smb_cred *);
static uint32_t xvattr_to_dosattr(smbnode_t *, struct vattr *);

static int	smbfs_fsync(vnode_t *, int, cred_t *, caller_context_t *);

static int	smbfs_putpage(vnode_t *, offset_t, size_t, int, cred_t *,
			caller_context_t *);
#ifdef	_KERNEL
static int	smbfs_getapage(vnode_t *, u_offset_t, size_t, uint_t *,
			page_t *[], size_t, struct seg *, caddr_t,
			enum seg_rw, cred_t *);
static int	smbfs_putapage(vnode_t *, page_t *, u_offset_t *, size_t *,
			int, cred_t *);
static void	smbfs_delmap_async(void *);

static int	smbfs_rdwrlbn(vnode_t *, page_t *, u_offset_t, size_t, int,
			cred_t *);
static int	smbfs_bio(struct buf *, int, cred_t *);
static int	smbfs_writenp(smbnode_t *np, caddr_t base, int tcount,
			struct uio *uiop, int pgcreated);
#endif	// _KERNEL

/*
 * Error flags used to pass information about certain special errors
 * which need to be handled specially.
 */
#define	SMBFS_EOF			-98
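/* (negative on purpose, so it can never collide with a real errno value) */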

/* When implementing OtW locks, make this a real function. */
#define	smbfs_lm_has_sleep(vp) 0
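/* (cf. lm_has_sleep(), which the NFS client consults in its lockrelease path) */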

/*
 * These are the vnode ops routines which implement the vnode interface to
 * the networked file system.  These routines just take their parameters,
 * make them look networkish by putting the right info into interface structs,
 * and then calling the appropriate remote routine(s) to do the work.
 *
 * Note on directory name lookup cacheing:  If we detect a stale fhandle,
 * we purge the directory cache relative to that vnode.  This way, the
 * user won't get burned by the cache repeatedly.  See <smbfs/smbnode.h> for
 * more details on smbnode locking.
 */


/*
 * XXX
 * When new and relevant functionality is enabled, we should be
 * calling vfs_set_feature() to inform callers that pieces of
 * functionality are available, per PSARC 2007/227.
 */
/* ARGSUSED */
static int
smbfs_open(vnode_t **vpp, int flag, cred_t *cr, caller_context_t *ct)
{
	smbnode_t	*np;
	vnode_t		*vp;
	smbfattr_t	fa;
	smb_fh_t	*fid = NULL;
	smb_fh_t	*oldfid;
	uint32_t	rights;
	struct smb_cred scred;
	smbmntinfo_t	*smi;
	smb_share_t	*ssp;
	cred_t		*oldcr;
	int		error = 0;

	vp = *vpp;
	np = VTOSMB(vp);
	smi = VTOSMI(vp);
	ssp = smi->smi_share;

	if (curproc->p_zone != smi->smi_zone_ref.zref_zone)
		return (EIO);

	if (smi->smi_flags & SMI_DEAD || vp->v_vfsp->vfs_flag & VFS_UNMOUNTED)
		return (EIO);

	if (vp->v_type != VREG && vp->v_type != VDIR) { /* XXX VLNK? */
		SMBVDEBUG("open eacces vtype=%d\n", vp->v_type);
		return (EACCES);
	}

	/*
	 * Get exclusive access to n_fid and related stuff.
	 * No returns after this until out.
	 */
	if (smbfs_rw_enter_sig(&np->r_lkserlock, RW_WRITER, SMBINTR(vp)))
		return (EINTR);
	smb_credinit(&scred, cr);

	/*
	 * Keep track of the vnode type at first open.
	 * It may change later, and we need close to do
	 * cleanup for the type we opened.  Also deny
	 * open of new types until old type is closed.
	 */
	if (np->n_ovtype == VNON) {
		ASSERT(np->n_dirrefs == 0);
		ASSERT(np->n_fidrefs == 0);
	} else if (np->n_ovtype != vp->v_type) {
		SMBVDEBUG("open n_ovtype=%d v_type=%d\n",
		    np->n_ovtype, vp->v_type);
		error = EACCES;
		goto out;
	}

	/*
	 * Directory open.  See smbfs_readvdir()
	 */
	if (vp->v_type == VDIR) {
		if (np->n_dirseq == NULL) {
			/* first open */
			error = smbfs_smb_findopen(np, "*", 1,
			    SMB_FA_SYSTEM | SMB_FA_HIDDEN | SMB_FA_DIR,
			    &scred, &np->n_dirseq);
			if (error != 0)
				goto out;
		}
		np->n_dirofs = FIRST_DIROFS;
		np->n_dirrefs++;
		goto have_fid;
	}

	/*
	 * If caller specified O_TRUNC/FTRUNC, then be sure to set
	 * FWRITE (to drive successful setattr(size=0) after open)
	 */
	if (flag & FTRUNC)
		flag |= FWRITE;

	/*
	 * If we already have it open, and the FID is still valid,
	 * check whether the rights are sufficient for FID reuse.
	 */
	if (np->n_fidrefs > 0 &&
	    (fid = np->n_fid) != NULL &&
	    fid->fh_vcgenid == ssp->ss_vcgenid) {
		int upgrade = 0;

		if ((flag & FWRITE) &&
		    !(fid->fh_rights & SA_RIGHT_FILE_WRITE_DATA))
			upgrade = 1;
		if ((flag & FREAD) &&
		    !(fid->fh_rights & SA_RIGHT_FILE_READ_DATA))
			upgrade = 1;
		if (!upgrade) {
			/*
			 *  the existing open is good enough
			 */
			np->n_fidrefs++;
			goto have_fid;
		}
		fid = NULL;
	}
	rights = (fid != NULL) ? fid->fh_rights : 0;

	/*
	 * we always ask for READ_CONTROL so we can always get the
	 * owner/group IDs to satisfy a stat.  Ditto attributes.
	 */
	rights |= (STD_RIGHT_READ_CONTROL_ACCESS |
	    SA_RIGHT_FILE_READ_ATTRIBUTES);
	if ((flag & FREAD))
		rights |= SA_RIGHT_FILE_READ_DATA;
	if ((flag & FWRITE))
		rights |= SA_RIGHT_FILE_WRITE_DATA |
		    SA_RIGHT_FILE_APPEND_DATA |
		    SA_RIGHT_FILE_WRITE_ATTRIBUTES;

	bzero(&fa, sizeof (fa));
	error = smbfs_smb_open(np,
	    NULL, 0, 0, /* name nmlen xattr */
	    rights, &scred,
	    &fid, &fa);
	if (error)
		goto out;
	smbfs_attrcache_fa(vp, &fa);

	/*
	 * We have a new FID and access rights.
	 */
	VERIFY(fid != NULL);
	oldfid = np->n_fid;
	np->n_fid = fid;
	np->n_fidrefs++;
	if (oldfid != NULL)
		smb_fh_rele(oldfid);

	/*
	 * This thread did the open.
	 * Save our credentials too.
	 */
	mutex_enter(&np->r_statelock);
	oldcr = np->r_cred;
	np->r_cred = cr;
	crhold(cr);
	if (oldcr)
		crfree(oldcr);
	mutex_exit(&np->r_statelock);

have_fid:
	/*
	 * Keep track of the vnode type at first open.
	 * (see comments above)
	 */
	if (np->n_ovtype == VNON)
		np->n_ovtype = vp->v_type;

out:
	smb_credrele(&scred);
	smbfs_rw_exit(&np->r_lkserlock);
	return (error);
}

/*ARGSUSED*/
static int
smbfs_close(vnode_t *vp, int flag, int count, offset_t offset, cred_t *cr,
	caller_context_t *ct)
{
	smbnode_t	*np;
	smbmntinfo_t	*smi;
	struct smb_cred scred;
	int error = 0;

	np = VTOSMB(vp);
	smi = VTOSMI(vp);

	/*
	 * Don't "bail out" for VFS_UNMOUNTED here,
	 * as we want to do cleanup, etc.
	 */

	/*
	 * zone_enter(2) prevents processes from changing zones with SMBFS files
	 * open; if we happen to get here from the wrong zone we can't do
	 * anything over the wire.
	 */
	if (smi->smi_zone_ref.zref_zone != curproc->p_zone) {
		/*
		 * We could attempt to clean up locks, except we're sure
		 * that the current process didn't acquire any locks on
		 * the file: any attempt to lock a file belonging to another zone
		 * will fail, and one can't lock an SMBFS file and then change
		 * zones, as that fails too.
		 *
		 * Returning an error here is the sane thing to do.  A
		 * subsequent call to VN_RELE() which translates to a
		 * smbfs_inactive() will clean up state: if the zone of the
		 * vnode's origin is still alive and kicking, an async worker
		 * thread will handle the request (from the correct zone), and
		 * everything (minus the final smbfs_getattr_otw() call) should
		 * be OK. If the zone is going away smbfs_async_inactive() will
		 * throw away cached pages inline.
		 */
		return (EIO);
	}

	/*
	 * If we are using local locking for this filesystem, then
	 * release all of the SYSV style record locks.  Otherwise,
	 * we are doing network locking and we need to release all
	 * of the network locks.  All of the locks held by this
	 * process on this file are released no matter what the
	 * incoming reference count is.
	 */
	if (smi->smi_flags & SMI_LLOCK) {
		pid_t pid = ddi_get_pid();
		cleanlocks(vp, pid, 0);
		cleanshares(vp, pid);
	}
	/*
	 * else doing OtW locking.  SMB servers drop all locks
	 * on the file ID we close here, so no _lockrelease()
	 */

	/*
	 * This (passed in) count is the ref. count from the
	 * user's file_t before the closef call (fio.c).
	 * The rest happens only on last close.
	 */
	if (count > 1)
		return (0);

	/* NFS has DNLC purge here. */

	/*
	 * If the file was open for write and there are pages,
	 * then make sure dirty pages written back.
	 *
	 * NFS does this async when "close-to-open" is off
	 * (MI_NOCTO flag is set) to avoid blocking the caller.
	 * For now, always do this synchronously (no B_ASYNC).
	 */
	if ((flag & FWRITE) && vn_has_cached_data(vp)) {
		error = smbfs_putpage(vp, (offset_t)0, 0, 0, cr, ct);
		if (error == EAGAIN)
			error = 0;
	}
	if (error == 0) {
		mutex_enter(&np->r_statelock);
		np->r_flags &= ~RSTALE;
		np->r_error = 0;
		mutex_exit(&np->r_statelock);
	}

	/*
	 * Decrement the reference count for the FID
	 * and possibly do the OtW close.
	 *
	 * Exclusive lock for modifying n_fid stuff.
	 * Don't want this one ever interruptible.
	 */
	(void) smbfs_rw_enter_sig(&np->r_lkserlock, RW_WRITER, 0);
	smb_credinit(&scred, cr);

	smbfs_rele_fid(np, &scred);

	smb_credrele(&scred);
	smbfs_rw_exit(&np->r_lkserlock);

	return (0);
}

/*
 * Helper for smbfs_close.  Decrement the reference count
 * for an SMB-level file or directory ID, and when the last
 * reference for the fid goes away, do the OtW close.
 * Also called in smbfs_inactive (defensive cleanup).
 */
static void
smbfs_rele_fid(smbnode_t *np, struct smb_cred *scred)
{
	cred_t		*oldcr;
	struct smbfs_fctx *fctx;
	int		error;
	smb_fh_t	*ofid;

	error = 0;

	/* Make sure we serialize for n_dirseq use. */
	ASSERT(smbfs_rw_lock_held(&np->r_lkserlock, RW_WRITER));

	/*
	 * Note that vp->v_type may change if a remote node
	 * is deleted and recreated as a different type, and
	 * our getattr may change v_type accordingly.
	 * Now use n_ovtype to keep track of the v_type
	 * we had during open (see comments above).
	 */
	switch (np->n_ovtype) {
	case VDIR:
		ASSERT(np->n_dirrefs > 0);
		if (--np->n_dirrefs)
			return;
		if ((fctx = np->n_dirseq) != NULL) {
			np->n_dirseq = NULL;
			np->n_dirofs = 0;
			error = smbfs_smb_findclose(fctx, scred);
		}
		break;

	case VREG:
		ASSERT(np->n_fidrefs > 0);
		if (--np->n_fidrefs)
			return;
		if ((ofid = np->n_fid) != NULL) {
			np->n_fid = NULL;
			smb_fh_rele(ofid);
		}
		break;

	default:
		SMBVDEBUG("bad n_ovtype %d\n", np->n_ovtype);
		break;
	}
	if (error) {
		SMBVDEBUG("error %d closing %s\n",
		    error, np->n_rpath);
	}

	/* Allow next open to use any v_type. */
	np->n_ovtype = VNON;

	/*
	 * Other "last close" stuff.
	 */
	mutex_enter(&np->r_statelock);
	if (np->n_flag & NATTRCHANGED)
		smbfs_attrcache_rm_locked(np);
	oldcr = np->r_cred;
	np->r_cred = NULL;
	mutex_exit(&np->r_statelock);
	if (oldcr != NULL)
		crfree(oldcr);
}

/* ARGSUSED */
static int
smbfs_read(vnode_t *vp, struct uio *uiop, int ioflag, cred_t *cr,
	caller_context_t *ct)
{
	struct smb_cred scred;
	struct vattr	va;
	smbnode_t	*np;
	smbmntinfo_t	*smi;
	offset_t	endoff;
	ssize_t		past_eof;
	int		error;

	np = VTOSMB(vp);
	smi = VTOSMI(vp);

	if (curproc->p_zone != smi->smi_zone_ref.zref_zone)
		return (EIO);

	if (smi->smi_flags & SMI_DEAD || vp->v_vfsp->vfs_flag & VFS_UNMOUNTED)
		return (EIO);

	/* Sanity check: should have a valid open */
	if (np->n_fid == NULL)
		return (EIO);

	ASSERT(smbfs_rw_lock_held(&np->r_rwlock, RW_READER));

	if (vp->v_type != VREG)
		return (EISDIR);

	if (uiop->uio_resid == 0)
		return (0);

	/*
	 * Like NFS3, just check for 63-bit overflow.
	 * Our SMB layer takes care to return EFBIG
	 * when it has to fall back to a 32-bit call.
	 */
	endoff = uiop->uio_loffset + uiop->uio_resid;
	if (uiop->uio_loffset < 0 || endoff < 0)
		return (EINVAL);

	/* get vnode attributes from server */
	va.va_mask = AT_SIZE | AT_MTIME;
	if (error = smbfsgetattr(vp, &va, cr))
		return (error);

	/* Update mtime with mtime from server here? */

	/* if offset is beyond EOF, read nothing */
	if (uiop->uio_loffset >= va.va_size)
		return (0);

	/*
	 * Limit the read to the remaining file size.
	 * Do this by temporarily reducing uio_resid
	 * by the amount that lies beyond the EOF.
	 */
	if (endoff > va.va_size) {
		past_eof = (ssize_t)(endoff - va.va_size);
		uiop->uio_resid -= past_eof;
	} else
		past_eof = 0;
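	/*
	 * For example: with va_size == 100, a 40-byte read at
	 * offset 80 trims resid by past_eof == 20, transfers the
	 * 20 bytes that exist, and the "+= past_eof" below restores
	 * resid so the caller sees normal short-read accounting.
	 */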

	/*
	 * Bypass VM if caching has been disabled (e.g., locking) or if
	 * using client-side direct I/O and the file is not mmap'd and
	 * there are no cached pages.
	 */
	if ((vp->v_flag & VNOCACHE) ||
	    (((np->r_flags & RDIRECTIO) || (smi->smi_flags & SMI_DIRECTIO)) &&
	    np->r_mapcnt == 0 && np->r_inmap == 0 &&
	    !vn_has_cached_data(vp))) {

		/* Shared lock for n_fid use in smb_rwuio */
		if (smbfs_rw_enter_sig(&np->r_lkserlock, RW_READER, SMBINTR(vp)))
			return (EINTR);
		smb_credinit(&scred, cr);

		error = smb_rwuio(np->n_fid, UIO_READ,
		    uiop, &scred, smb_timo_read);

		smb_credrele(&scred);
		smbfs_rw_exit(&np->r_lkserlock);

		/* undo adjustment of resid */
		uiop->uio_resid += past_eof;

		return (error);
	}

#ifdef	_KERNEL
	/* (else) Do I/O through segmap. */
	do {
		caddr_t		base;
		u_offset_t	off;
		size_t		n;
		int		on;
		uint_t		flags;

		off = uiop->uio_loffset & MAXBMASK; /* mapping offset */
		on = uiop->uio_loffset & MAXBOFFSET; /* Relative offset */
		n = MIN(MAXBSIZE - on, uiop->uio_resid);

		error = smbfs_validate_caches(vp, cr);
		if (error)
			break;

		/* NFS waits for RINCACHEPURGE here. */

		if (vpm_enable) {
			/*
			 * Copy data.
			 */
			error = vpm_data_copy(vp, off + on, n, uiop,
			    1, NULL, 0, S_READ);
		} else {
			base = segmap_getmapflt(segkmap, vp, off + on, n, 1,
			    S_READ);

			error = uiomove(base + on, n, UIO_READ, uiop);
		}

		if (!error) {
			/*
			 * If read a whole block or read to eof,
			 * won't need this buffer again soon.
			 */
			mutex_enter(&np->r_statelock);
			if (n + on == MAXBSIZE ||
			    uiop->uio_loffset == np->r_size)
				flags = SM_DONTNEED;
			else
				flags = 0;
			mutex_exit(&np->r_statelock);
			if (vpm_enable) {
				error = vpm_sync_pages(vp, off, n, flags);
			} else {
				error = segmap_release(segkmap, base, flags);
			}
		} else {
			if (vpm_enable) {
				(void) vpm_sync_pages(vp, off, n, 0);
			} else {
				(void) segmap_release(segkmap, base, 0);
			}
		}
	} while (!error && uiop->uio_resid > 0);
#else	// _KERNEL
	error = ENOSYS;
#endif	// _KERNEL

	/* undo adjustment of resid */
	uiop->uio_resid += past_eof;

	return (error);
}


/* ARGSUSED */
static int
smbfs_write(vnode_t *vp, struct uio *uiop, int ioflag, cred_t *cr,
	caller_context_t *ct)
{
	struct smb_cred scred;
	struct vattr    va;
	smbnode_t	*np;
	smbmntinfo_t	*smi;
	offset_t	endoff, limit;
	ssize_t		past_limit;
	int		error, timo;
	u_offset_t	last_off;
	size_t		last_resid;
#ifdef	_KERNEL
	uint_t		bsize;
#endif

	np = VTOSMB(vp);
	smi = VTOSMI(vp);

	if (curproc->p_zone != smi->smi_zone_ref.zref_zone)
		return (EIO);

	if (smi->smi_flags & SMI_DEAD || vp->v_vfsp->vfs_flag & VFS_UNMOUNTED)
		return (EIO);

	/* Sanity check: should have a valid open */
	if (np->n_fid == NULL)
		return (EIO);

	ASSERT(smbfs_rw_lock_held(&np->r_rwlock, RW_WRITER));

	if (vp->v_type != VREG)
		return (EISDIR);

	if (uiop->uio_resid == 0)
		return (0);

	/*
	 * Handle ioflag bits: (FAPPEND|FSYNC|FDSYNC)
	 */
	if (ioflag & (FAPPEND | FSYNC)) {
		if (np->n_flag & NMODIFIED) {
			smbfs_attrcache_remove(np);
		}
	}
	if (ioflag & FAPPEND) {
		/*
		 * File size can be changed by another client
		 *
		 * Todo: Consider redesigning this to use a
		 * handle opened for append instead.
		 */
		va.va_mask = AT_SIZE;
		if (error = smbfsgetattr(vp, &va, cr))
			return (error);
		uiop->uio_loffset = va.va_size;
	}

	/*
	 * Like NFS3, just check for 63-bit overflow.
	 */
	endoff = uiop->uio_loffset + uiop->uio_resid;
	if (uiop->uio_loffset < 0 || endoff < 0)
		return (EINVAL);

	/*
	 * Check to make sure that the process will not exceed
	 * its limit on file size.  It is okay to write up to
	 * the limit, but not beyond.  Thus, the write which
	 * reaches the limit will be short and the next write
	 * will return an error.
	 *
	 * So if we're starting at or beyond the limit, EFBIG.
	 * Otherwise, temporarily reduce resid by the amount
	 * that lies beyond the limit.
	 */
	limit = uiop->uio_llimit;
	if (limit == RLIM64_INFINITY || limit > MAXOFFSET_T)
		limit = MAXOFFSET_T;
	if (uiop->uio_loffset >= limit) {
#ifdef	_KERNEL
		proc_t *p = ttoproc(curthread);

		mutex_enter(&p->p_lock);
		(void) rctl_action(rctlproc_legacy[RLIMIT_FSIZE],
		    p->p_rctls, p, RCA_UNSAFE_SIGINFO);
		mutex_exit(&p->p_lock);
#endif	// _KERNEL
		return (EFBIG);
	}
	if (endoff > limit) {
		past_limit = (ssize_t)(endoff - limit);
		uiop->uio_resid -= past_limit;
	} else
		past_limit = 0;
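	/*
	 * Same resid trick as in smbfs_read above: trim resid here,
	 * then restore it at "bottom" so the caller's short-write
	 * accounting comes out right.
	 */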

	/*
	 * Bypass VM if caching has been disabled (e.g., locking) or if
	 * using client-side direct I/O and the file is not mmap'd and
	 * there are no cached pages.
	 */
	if ((vp->v_flag & VNOCACHE) ||
	    (((np->r_flags & RDIRECTIO) || (smi->smi_flags & SMI_DIRECTIO)) &&
	    np->r_mapcnt == 0 && np->r_inmap == 0 &&
	    !vn_has_cached_data(vp))) {

#ifdef	_KERNEL
smbfs_fwrite:
#endif	// _KERNEL
		if (np->r_flags & RSTALE) {
			last_resid = uiop->uio_resid;
			last_off = uiop->uio_loffset;
			error = np->r_error;
			/*
			 * A close may have cleared r_error, if so,
			 * propagate ESTALE error return properly
			 */
			if (error == 0)
				error = ESTALE;
			goto bottom;
		}

		/* Timeout: longer for append. */
		timo = smb_timo_write;
		if (endoff > np->r_size)
			timo = smb_timo_append;

		/* Shared lock for n_fid use in smb_rwuio */
		if (smbfs_rw_enter_sig(&np->r_lkserlock, RW_READER, SMBINTR(vp)))
			return (EINTR);
		smb_credinit(&scred, cr);

		error = smb_rwuio(np->n_fid, UIO_WRITE,
		    uiop, &scred, timo);

		if (error == 0) {
			mutex_enter(&np->r_statelock);
			np->n_flag |= (NFLUSHWIRE | NATTRCHANGED);
			if (uiop->uio_loffset > (offset_t)np->r_size)
				np->r_size = (len_t)uiop->uio_loffset;
			mutex_exit(&np->r_statelock);
			if (ioflag & (FSYNC | FDSYNC)) {
				/* Don't error the I/O if this fails. */
				(void) smbfsflush(np, &scred);
			}
		}

		smb_credrele(&scred);
		smbfs_rw_exit(&np->r_lkserlock);

		/* undo adjustment of resid */
		uiop->uio_resid += past_limit;

		return (error);
	}

#ifdef	_KERNEL
	/* (else) Do I/O through segmap. */
	bsize = vp->v_vfsp->vfs_bsize;

	do {
		caddr_t		base;
		u_offset_t	off;
		size_t		n;
		int		on;
		uint_t		flags;

		off = uiop->uio_loffset & MAXBMASK; /* mapping offset */
		on = uiop->uio_loffset & MAXBOFFSET; /* Relative offset */
		n = MIN(MAXBSIZE - on, uiop->uio_resid);

		last_resid = uiop->uio_resid;
		last_off = uiop->uio_loffset;

		if (np->r_flags & RSTALE) {
			error = np->r_error;
			/*
			 * A close may have cleared r_error, if so,
			 * propagate ESTALE error return properly
			 */
			if (error == 0)
				error = ESTALE;
			break;
		}

		/*
		 * From NFS: Don't create dirty pages faster than they
		 * can be cleaned.
		 *
		 * Here NFS also checks for async writes (np->r_awcount)
		 */
		mutex_enter(&np->r_statelock);
		while (np->r_gcount > 0) {
			if (SMBINTR(vp)) {
				klwp_t *lwp = ttolwp(curthread);

				if (lwp != NULL)
					lwp->lwp_nostop++;
				if (!cv_wait_sig(&np->r_cv, &np->r_statelock)) {
					mutex_exit(&np->r_statelock);
					if (lwp != NULL)
						lwp->lwp_nostop--;
					error = EINTR;
					goto bottom;
				}
				if (lwp != NULL)
					lwp->lwp_nostop--;
			} else
				cv_wait(&np->r_cv, &np->r_statelock);
		}
		mutex_exit(&np->r_statelock);

		/*
		 * Touch the page and fault it in if it is not in core
		 * before segmap_getmapflt or vpm_data_copy can lock it.
		 * This is to avoid the deadlock if the buffer is mapped
		 * to the same file through mmap which we want to write.
		 */
		uio_prefaultpages((long)n, uiop);

		if (vpm_enable) {
			/*
			 * It will use kpm mappings, so no need to
			 * pass an address.
			 */
			error = smbfs_writenp(np, NULL, n, uiop, 0);
		} else {
			if (segmap_kpm) {
				int pon = uiop->uio_loffset & PAGEOFFSET;
				size_t pn = MIN(PAGESIZE - pon,
				    uiop->uio_resid);
				int pagecreate;

				mutex_enter(&np->r_statelock);
				pagecreate = (pon == 0) && (pn == PAGESIZE ||
				    uiop->uio_loffset + pn >= np->r_size);
				mutex_exit(&np->r_statelock);

				base = segmap_getmapflt(segkmap, vp, off + on,
				    pn, !pagecreate, S_WRITE);

				error = smbfs_writenp(np, base + pon, n, uiop,
				    pagecreate);

			} else {
				base = segmap_getmapflt(segkmap, vp, off + on,
				    n, 0, S_READ);
				error = smbfs_writenp(np, base + on, n, uiop, 0);
			}
		}

		if (!error) {
			if (smi->smi_flags & SMI_NOAC)
				flags = SM_WRITE;
			else if ((uiop->uio_loffset % bsize) == 0 ||
			    IS_SWAPVP(vp)) {
				/*
				 * Have written a whole block.
				 * Start an asynchronous write
				 * and mark the buffer to
				 * indicate that it won't be
				 * needed again soon.
				 */
				flags = SM_WRITE | SM_ASYNC | SM_DONTNEED;
			} else
				flags = 0;
			if ((ioflag & (FSYNC|FDSYNC)) ||
			    (np->r_flags & ROUTOFSPACE)) {
				flags &= ~SM_ASYNC;
				flags |= SM_WRITE;
			}
			if (vpm_enable) {
				error = vpm_sync_pages(vp, off, n, flags);
			} else {
				error = segmap_release(segkmap, base, flags);
			}
		} else {
			if (vpm_enable) {
				(void) vpm_sync_pages(vp, off, n, 0);
			} else {
				(void) segmap_release(segkmap, base, 0);
			}
			/*
			 * In the event that we got an access error while
			 * faulting in a page for a write-only file just
			 * force a write.
			 */
			if (error == EACCES)
				goto smbfs_fwrite;
		}
	} while (!error && uiop->uio_resid > 0);
#else	// _KERNEL
	last_resid = uiop->uio_resid;
	last_off = uiop->uio_loffset;
	error = ENOSYS;
#endif	// _KERNEL

bottom:
	/* undo adjustment of resid */
	if (error) {
		uiop->uio_resid = last_resid + past_limit;
		uiop->uio_loffset = last_off;
	} else {
		uiop->uio_resid += past_limit;
	}

	return (error);
}

#ifdef	_KERNEL

/*
 * Like nfs_client.c: writerp()
 *
 * Write by creating pages and uiomove data onto them.
 */

int
smbfs_writenp(smbnode_t *np, caddr_t base, int tcount, struct uio *uio,
    int pgcreated)
{
	int		pagecreate;
	int		n;
	int		saved_n;
	caddr_t		saved_base;
	u_offset_t	offset;
	int		error;
	int		sm_error;
	vnode_t		*vp = SMBTOV(np);

	ASSERT(tcount <= MAXBSIZE && tcount <= uio->uio_resid);
	ASSERT(smbfs_rw_lock_held(&np->r_rwlock, RW_WRITER));
	if (!vpm_enable) {
		ASSERT(((uintptr_t)base & MAXBOFFSET) + tcount <= MAXBSIZE);
	}

	/*
	 * Move bytes in at most PAGESIZE chunks. We must avoid
	 * spanning pages in uiomove() because page faults may cause
	 * the cache to be invalidated out from under us. The r_size is not
	 * updated until after the uiomove. If we push the last page of a
	 * file before r_size is correct, we will lose the data written past
	 * the current (and invalid) r_size.
	 */
	do {
		offset = uio->uio_loffset;
		pagecreate = 0;

		/*
		 * n is the number of bytes required to satisfy the request
		 *   or the number of bytes to fill out the page.
		 */
		n = (int)MIN((PAGESIZE - (offset & PAGEOFFSET)), tcount);

		/*
		 * Check to see if we can skip reading in the page
		 * and just allocate the memory.  We can do this
		 * if we are going to rewrite the entire mapping
		 * or if we are going to write to or beyond the current
		 * end of file from the beginning of the mapping.
		 *
		 * The read of r_size is now protected by r_statelock.
		 */
		mutex_enter(&np->r_statelock);
		/*
		 * When pgcreated is nonzero the caller has already done
		 * a segmap_getmapflt with forcefault 0 and S_WRITE. With
		 * segkpm this means we already have at least one page
		 * created and mapped at base.
		 */
		pagecreate = pgcreated ||
		    ((offset & PAGEOFFSET) == 0 &&
		    (n == PAGESIZE || ((offset + n) >= np->r_size)));

		mutex_exit(&np->r_statelock);
		if (!vpm_enable && pagecreate) {
			/*
			 * The last argument tells segmap_pagecreate() to
			 * always lock the page, as opposed to sometimes
			 * returning with the page locked. This way we avoid a
			 * fault on the ensuing uiomove(), but also
			 * more importantly (to fix bug 1094402) we can
			 * call segmap_fault() to unlock the page in all
			 * cases. An alternative would be to modify
			 * segmap_pagecreate() to tell us when it is
			 * locking a page, but that's a fairly major
			 * interface change.
			 */
			if (pgcreated == 0)
				(void) segmap_pagecreate(segkmap, base,
				    (uint_t)n, 1);
			saved_base = base;
			saved_n = n;
		}

		/*
		 * The number of bytes of data in the last page cannot
		 * be accurately determined while the page is being
		 * uiomove'd to and the size of the file is being updated.
		 * Thus, inform threads which need to know accurately
		 * how much data is in the last page of the file.  They
		 * will not do the i/o immediately, but will arrange for
		 * the i/o to happen later when this modify operation
		 * will have finished.
		 */
		ASSERT(!(np->r_flags & RMODINPROGRESS));
		mutex_enter(&np->r_statelock);
		np->r_flags |= RMODINPROGRESS;
		np->r_modaddr = (offset & MAXBMASK);
		mutex_exit(&np->r_statelock);

		if (vpm_enable) {
			/*
			 * Copy data. If new pages are created, part of
			 * the page that is not written will be initialized
			 * with zeros.
			 */
			error = vpm_data_copy(vp, offset, n, uio,
			    !pagecreate, NULL, 0, S_WRITE);
		} else {
			error = uiomove(base, n, UIO_WRITE, uio);
		}

		/*
		 * r_size is the maximum number of
		 * bytes known to be in the file.
		 * Make sure it is at least as high as the
		 * first unwritten byte pointed to by uio_loffset.
		 */
		mutex_enter(&np->r_statelock);
		if (np->r_size < uio->uio_loffset)
			np->r_size = uio->uio_loffset;
		np->r_flags &= ~RMODINPROGRESS;
		np->r_flags |= RDIRTY;
		mutex_exit(&np->r_statelock);

		/* n = # of bytes written */
		n = (int)(uio->uio_loffset - offset);

		if (!vpm_enable) {
			base += n;
		}
		tcount -= n;
		/*
		 * If we created pages w/o initializing them completely,
		 * we need to zero the part that wasn't set up.
		 * This happens in most EOF write cases and when
11535f4fc069Sjilinxpd 		 * we had some sort of error during the uiomove.
11545f4fc069Sjilinxpd 		 */
11555f4fc069Sjilinxpd 		if (!vpm_enable && pagecreate) {
11565f4fc069Sjilinxpd 			if ((uio->uio_loffset & PAGEOFFSET) || n == 0)
11575f4fc069Sjilinxpd 				(void) kzero(base, PAGESIZE - n);
11585f4fc069Sjilinxpd 
11595f4fc069Sjilinxpd 			if (pgcreated) {
11605f4fc069Sjilinxpd 				/*
11615f4fc069Sjilinxpd 				 * Caller is responsible for this page,
11625f4fc069Sjilinxpd 				 * it was not created in this loop.
11635f4fc069Sjilinxpd 				 */
11645f4fc069Sjilinxpd 				pgcreated = 0;
11655f4fc069Sjilinxpd 			} else {
11665f4fc069Sjilinxpd 				/*
11675f4fc069Sjilinxpd 				 * For bug 1094402: segmap_pagecreate locks
11685f4fc069Sjilinxpd 				 * page. Unlock it. This also unlocks the
11695f4fc069Sjilinxpd 				 * pages allocated by page_create_va() in
11705f4fc069Sjilinxpd 				 * segmap_pagecreate().
11715f4fc069Sjilinxpd 				 */
11725f4fc069Sjilinxpd 				sm_error = segmap_fault(kas.a_hat, segkmap,
11735f4fc069Sjilinxpd 				    saved_base, saved_n,
11745f4fc069Sjilinxpd 				    F_SOFTUNLOCK, S_WRITE);
11755f4fc069Sjilinxpd 				if (error == 0)
11765f4fc069Sjilinxpd 					error = sm_error;
11775f4fc069Sjilinxpd 			}
11785f4fc069Sjilinxpd 		}
11795f4fc069Sjilinxpd 	} while (tcount > 0 && error == 0);
11807568150aSgwr 
11817568150aSgwr 	return (error);
11827568150aSgwr }
11837568150aSgwr 
11844bff34e3Sthurlow /*
11855f4fc069Sjilinxpd  * Flags are composed of {B_ASYNC, B_INVAL, B_FREE, B_DONTNEED}
11865f4fc069Sjilinxpd  * Like nfs3_rdwrlbn()
11874bff34e3Sthurlow  */
11884bff34e3Sthurlow static int
smbfs_rdwrlbn(vnode_t * vp,page_t * pp,u_offset_t off,size_t len,int flags,cred_t * cr)11895f4fc069Sjilinxpd smbfs_rdwrlbn(vnode_t *vp, page_t *pp, u_offset_t off, size_t len,
11905f4fc069Sjilinxpd 	int flags, cred_t *cr)
11914bff34e3Sthurlow {
11925f4fc069Sjilinxpd 	smbmntinfo_t	*smi = VTOSMI(vp);
11935f4fc069Sjilinxpd 	struct buf *bp;
11945f4fc069Sjilinxpd 	int error;
11955f4fc069Sjilinxpd 	int sync;
11964bff34e3Sthurlow 
1197a19609f8Sjv 	if (curproc->p_zone != smi->smi_zone_ref.zref_zone)
11984bff34e3Sthurlow 		return (EIO);
11994bff34e3Sthurlow 
12004bff34e3Sthurlow 	if (smi->smi_flags & SMI_DEAD || vp->v_vfsp->vfs_flag & VFS_UNMOUNTED)
12014bff34e3Sthurlow 		return (EIO);
12024bff34e3Sthurlow 
12035f4fc069Sjilinxpd 	bp = pageio_setup(pp, len, vp, flags);
12045f4fc069Sjilinxpd 	ASSERT(bp != NULL);
12055f4fc069Sjilinxpd 
12064bff34e3Sthurlow 	/*
12075f4fc069Sjilinxpd 	 * pageio_setup should have set b_addr to 0.  This
12085f4fc069Sjilinxpd 	 * is correct since we want to do I/O on a page
12095f4fc069Sjilinxpd 	 * boundary.  bp_mapin will use this addr to calculate
12105f4fc069Sjilinxpd 	 * an offset, and then set b_addr to the kernel virtual
12115f4fc069Sjilinxpd 	 * address it allocated for us.
12124bff34e3Sthurlow 	 */
12135f4fc069Sjilinxpd 	ASSERT(bp->b_un.b_addr == 0);
12144bff34e3Sthurlow 
12155f4fc069Sjilinxpd 	bp->b_edev = 0;
12165f4fc069Sjilinxpd 	bp->b_dev = 0;
12175f4fc069Sjilinxpd 	bp->b_lblkno = lbtodb(off);
12185f4fc069Sjilinxpd 	bp->b_file = vp;
12195f4fc069Sjilinxpd 	bp->b_offset = (offset_t)off;
12205f4fc069Sjilinxpd 	bp_mapin(bp);
12215f4fc069Sjilinxpd 
12225f4fc069Sjilinxpd 	/*
12235f4fc069Sjilinxpd 	 * Calculate the desired level of stability for writing the data.
12245f4fc069Sjilinxpd 	 */
12255f4fc069Sjilinxpd 	if ((flags & (B_WRITE|B_ASYNC)) == (B_WRITE|B_ASYNC) &&
12265f4fc069Sjilinxpd 	    freemem > desfree) {
12275f4fc069Sjilinxpd 		sync = 0;
12285f4fc069Sjilinxpd 	} else {
12295f4fc069Sjilinxpd 		sync = 1;
12305f4fc069Sjilinxpd 	}
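	/*
	 * When sync is set, smbfs_bio will also flush the file
	 * handle after the write (see smbfsflush); async writes
	 * skip that while free memory is plentiful.
	 */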
12315f4fc069Sjilinxpd 
12325f4fc069Sjilinxpd 	error = smbfs_bio(bp, sync, cr);
12335f4fc069Sjilinxpd 
12345f4fc069Sjilinxpd 	bp_mapout(bp);
12355f4fc069Sjilinxpd 	pageio_done(bp);
12365f4fc069Sjilinxpd 
12375f4fc069Sjilinxpd 	return (error);
12385f4fc069Sjilinxpd }
12395f4fc069Sjilinxpd 
12405f4fc069Sjilinxpd 
12415f4fc069Sjilinxpd /*
12425f4fc069Sjilinxpd  * Corresponds to nfs3_vnops.c : nfs3_bio(), though the NFS code
12435f4fc069Sjilinxpd  * uses nfs3read()/nfs3write() where we use smb_rwuio().  Also,
12445f4fc069Sjilinxpd  * NFS has this later in the file.  Move it up here closer to
12455f4fc069Sjilinxpd  * the one call site just above.
12465f4fc069Sjilinxpd  */
12475f4fc069Sjilinxpd 
12485f4fc069Sjilinxpd static int
12495f4fc069Sjilinxpd smbfs_bio(struct buf *bp, int sync, cred_t *cr)
12505f4fc069Sjilinxpd {
12515f4fc069Sjilinxpd 	struct iovec aiov[1];
12525f4fc069Sjilinxpd 	struct uio  auio;
12535f4fc069Sjilinxpd 	struct smb_cred scred;
12545f4fc069Sjilinxpd 	smbnode_t *np = VTOSMB(bp->b_vp);
12555f4fc069Sjilinxpd 	smbmntinfo_t *smi = np->n_mount;
12565f4fc069Sjilinxpd 	offset_t offset;
12575f4fc069Sjilinxpd 	offset_t endoff;
12585f4fc069Sjilinxpd 	size_t count;
12595f4fc069Sjilinxpd 	size_t past_eof;
12605f4fc069Sjilinxpd 	int error;
12615f4fc069Sjilinxpd 
12625f4fc069Sjilinxpd 	ASSERT(curproc->p_zone == smi->smi_zone_ref.zref_zone);
12635f4fc069Sjilinxpd 
12645f4fc069Sjilinxpd 	offset = ldbtob(bp->b_lblkno);
12655f4fc069Sjilinxpd 	count = bp->b_bcount;
12665f4fc069Sjilinxpd 	endoff = offset + count;
12675f4fc069Sjilinxpd 	if (offset < 0 || endoff < 0)
12685f4fc069Sjilinxpd 		return (EINVAL);
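	/*
	 * Negative values mean the byte offset derived from
	 * b_lblkno overflowed; reject it rather than wrap.
	 */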
12695f4fc069Sjilinxpd 
12705f4fc069Sjilinxpd 	/*
12715f4fc069Sjilinxpd 	 * Limit file I/O to the remaining file size, but see
12725f4fc069Sjilinxpd 	 * the notes in smbfs_getpage about SMBFS_EOF.
12735f4fc069Sjilinxpd 	 */
12745f4fc069Sjilinxpd 	mutex_enter(&np->r_statelock);
12755f4fc069Sjilinxpd 	if (offset >= np->r_size) {
12765f4fc069Sjilinxpd 		mutex_exit(&np->r_statelock);
12775f4fc069Sjilinxpd 		if (bp->b_flags & B_READ) {
12785f4fc069Sjilinxpd 			return (SMBFS_EOF);
12795f4fc069Sjilinxpd 		} else {
12805f4fc069Sjilinxpd 			return (EINVAL);
12815f4fc069Sjilinxpd 		}
12825f4fc069Sjilinxpd 	}
12835f4fc069Sjilinxpd 	if (endoff > np->r_size) {
12845f4fc069Sjilinxpd 		past_eof = (size_t)(endoff - np->r_size);
12855f4fc069Sjilinxpd 		count -= past_eof;
12865f4fc069Sjilinxpd 	} else
12875f4fc069Sjilinxpd 		past_eof = 0;
12885f4fc069Sjilinxpd 	mutex_exit(&np->r_statelock);
12895f4fc069Sjilinxpd 	ASSERT(count > 0);
12905f4fc069Sjilinxpd 
12915f4fc069Sjilinxpd 	/* Caller did bp_mapin().  Mapped address is... */
12925f4fc069Sjilinxpd 	aiov[0].iov_base = bp->b_un.b_addr;
12935f4fc069Sjilinxpd 	aiov[0].iov_len = count;
12945f4fc069Sjilinxpd 	auio.uio_iov = aiov;
12955f4fc069Sjilinxpd 	auio.uio_iovcnt = 1;
12965f4fc069Sjilinxpd 	auio.uio_loffset = offset;
12975f4fc069Sjilinxpd 	auio.uio_segflg = UIO_SYSSPACE;
12985f4fc069Sjilinxpd 	auio.uio_fmode = 0;
12995f4fc069Sjilinxpd 	auio.uio_resid = count;
13005f4fc069Sjilinxpd 
13015f4fc069Sjilinxpd 	/* Shared lock for n_fid use in smb_rwuio */
13025f4fc069Sjilinxpd 	if (smbfs_rw_enter_sig(&np->r_lkserlock, RW_READER,
13035f4fc069Sjilinxpd 	    smi->smi_flags & SMI_INT))
13045f4fc069Sjilinxpd 		return (EINTR);
13055f4fc069Sjilinxpd 	smb_credinit(&scred, cr);
13065f4fc069Sjilinxpd 
13075f4fc069Sjilinxpd 	DTRACE_IO1(start, struct buf *, bp);
13085f4fc069Sjilinxpd 
13095f4fc069Sjilinxpd 	if (bp->b_flags & B_READ) {
13105f4fc069Sjilinxpd 
1311adee6784SGordon Ross 		error = smb_rwuio(np->n_fid, UIO_READ,
1312adee6784SGordon Ross 		    &auio, &scred, smb_timo_read);
13135f4fc069Sjilinxpd 
13145f4fc069Sjilinxpd 		/* Like NFS, only set b_error here. */
13155f4fc069Sjilinxpd 		bp->b_error = error;
13165f4fc069Sjilinxpd 		bp->b_resid = auio.uio_resid;
13175f4fc069Sjilinxpd 
13185f4fc069Sjilinxpd 		if (!error && auio.uio_resid != 0)
13195f4fc069Sjilinxpd 			error = EIO;
13205f4fc069Sjilinxpd 		if (!error && past_eof != 0) {
13215f4fc069Sjilinxpd 			/* Zero the memory beyond EOF. */
13225f4fc069Sjilinxpd 			bzero(bp->b_un.b_addr + count, past_eof);
13235f4fc069Sjilinxpd 		}
13245f4fc069Sjilinxpd 	} else {
13255f4fc069Sjilinxpd 
1326adee6784SGordon Ross 		error = smb_rwuio(np->n_fid, UIO_WRITE,
1327adee6784SGordon Ross 		    &auio, &scred, smb_timo_write);
13285f4fc069Sjilinxpd 
13295f4fc069Sjilinxpd 		/* Like NFS, only set b_error here. */
13305f4fc069Sjilinxpd 		bp->b_error = error;
13315f4fc069Sjilinxpd 		bp->b_resid = auio.uio_resid;
13325f4fc069Sjilinxpd 
13335f4fc069Sjilinxpd 		if (!error && auio.uio_resid != 0)
13345f4fc069Sjilinxpd 			error = EIO;
13355f4fc069Sjilinxpd 		if (!error && sync) {
1336adee6784SGordon Ross 			(void) smbfsflush(np, &scred);
13375f4fc069Sjilinxpd 		}
13385f4fc069Sjilinxpd 	}
13395f4fc069Sjilinxpd 
13405f4fc069Sjilinxpd 	/*
13415f4fc069Sjilinxpd 	 * This comes from nfs3_commit()
13425f4fc069Sjilinxpd 	 */
13435f4fc069Sjilinxpd 	if (error != 0) {
13445f4fc069Sjilinxpd 		mutex_enter(&np->r_statelock);
13455f4fc069Sjilinxpd 		if (error == ESTALE)
13465f4fc069Sjilinxpd 			np->r_flags |= RSTALE;
13475f4fc069Sjilinxpd 		if (!np->r_error)
13485f4fc069Sjilinxpd 			np->r_error = error;
13495f4fc069Sjilinxpd 		mutex_exit(&np->r_statelock);
13505f4fc069Sjilinxpd 		bp->b_flags |= B_ERROR;
13515f4fc069Sjilinxpd 	}
13525f4fc069Sjilinxpd 
13535f4fc069Sjilinxpd 	DTRACE_IO1(done, struct buf *, bp);
13545f4fc069Sjilinxpd 
13555f4fc069Sjilinxpd 	smb_credrele(&scred);
13565f4fc069Sjilinxpd 	smbfs_rw_exit(&np->r_lkserlock);
13575f4fc069Sjilinxpd 
13585f4fc069Sjilinxpd 	if (error == ESTALE)
13595f4fc069Sjilinxpd 		smbfs_attrcache_remove(np);
13605f4fc069Sjilinxpd 
13615f4fc069Sjilinxpd 	return (error);
13625f4fc069Sjilinxpd }
13638329232eSGordon Ross #endif	// _KERNEL
13645f4fc069Sjilinxpd 
13655f4fc069Sjilinxpd /*
13665f4fc069Sjilinxpd  * Here NFS has: nfs3write, nfs3read
13675f4fc069Sjilinxpd  * We use smb_rwuio instead.
13685f4fc069Sjilinxpd  */
13695f4fc069Sjilinxpd 
13705f4fc069Sjilinxpd /* ARGSUSED */
13715f4fc069Sjilinxpd static int
13725f4fc069Sjilinxpd smbfs_ioctl(vnode_t *vp, int cmd, intptr_t arg, int flag,
13735f4fc069Sjilinxpd 	cred_t *cr, int *rvalp,	caller_context_t *ct)
13745f4fc069Sjilinxpd {
13755f4fc069Sjilinxpd 	int		error;
13765f4fc069Sjilinxpd 	smbmntinfo_t	*smi;
13775f4fc069Sjilinxpd 
13785f4fc069Sjilinxpd 	smi = VTOSMI(vp);
13795f4fc069Sjilinxpd 
13805f4fc069Sjilinxpd 	if (curproc->p_zone != smi->smi_zone_ref.zref_zone)
13815f4fc069Sjilinxpd 		return (EIO);
13825f4fc069Sjilinxpd 
13835f4fc069Sjilinxpd 	if (smi->smi_flags & SMI_DEAD || vp->v_vfsp->vfs_flag & VFS_UNMOUNTED)
13845f4fc069Sjilinxpd 		return (EIO);
13855f4fc069Sjilinxpd 
13865f4fc069Sjilinxpd 	switch (cmd) {
13875f4fc069Sjilinxpd 
13885f4fc069Sjilinxpd 	case _FIOFFS:
13895f4fc069Sjilinxpd 		error = smbfs_fsync(vp, 0, cr, ct);
13905f4fc069Sjilinxpd 		break;
13915f4fc069Sjilinxpd 
13925f4fc069Sjilinxpd 		/*
13935f4fc069Sjilinxpd 		 * The following two ioctls are used by bfu.
13945f4fc069Sjilinxpd 		 * Silently ignore to avoid bfu errors.
13955f4fc069Sjilinxpd 		 */
13965f4fc069Sjilinxpd 	case _FIOGDIO:
13975f4fc069Sjilinxpd 	case _FIOSDIO:
13985f4fc069Sjilinxpd 		error = 0;
13995f4fc069Sjilinxpd 		break;
14005f4fc069Sjilinxpd 
14015f4fc069Sjilinxpd #if 0	/* Todo - SMB ioctl query regions */
14025f4fc069Sjilinxpd 	case _FIO_SEEK_DATA:
14035f4fc069Sjilinxpd 	case _FIO_SEEK_HOLE:
14045f4fc069Sjilinxpd #endif
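	/*
	 * While the seek data/hole cases above are compiled out,
	 * those requests fall to the default (ENOTTY) case below.
	 */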
14055f4fc069Sjilinxpd 
14065f4fc069Sjilinxpd 	case _FIODIRECTIO:
14075f4fc069Sjilinxpd 		error = smbfs_directio(vp, (int)arg, cr);
14085f4fc069Sjilinxpd 		break;
14095f4fc069Sjilinxpd 
14105f4fc069Sjilinxpd 		/*
14115f4fc069Sjilinxpd 		 * Allow get/set with "raw" security descriptor (SD) data.
14125f4fc069Sjilinxpd 		 * Useful for testing, diagnosing idmap problems, etc.
14135f4fc069Sjilinxpd 		 */
14145f4fc069Sjilinxpd 	case SMBFSIO_GETSD:
14155f4fc069Sjilinxpd 		error = smbfs_acl_iocget(vp, arg, flag, cr);
14165f4fc069Sjilinxpd 		break;
14175f4fc069Sjilinxpd 
14185f4fc069Sjilinxpd 	case SMBFSIO_SETSD:
14195f4fc069Sjilinxpd 		error = smbfs_acl_iocset(vp, arg, flag, cr);
14205f4fc069Sjilinxpd 		break;
14215f4fc069Sjilinxpd 
14225f4fc069Sjilinxpd 	default:
14235f4fc069Sjilinxpd 		error = ENOTTY;
14245f4fc069Sjilinxpd 		break;
14255f4fc069Sjilinxpd 	}
14265f4fc069Sjilinxpd 
14275f4fc069Sjilinxpd 	return (error);
14285f4fc069Sjilinxpd }
14295f4fc069Sjilinxpd 
14305f4fc069Sjilinxpd 
14315f4fc069Sjilinxpd /*
14325f4fc069Sjilinxpd  * Return either cached or remote attributes.  If we fetch remote attrs,
14335f4fc069Sjilinxpd  * use them to check and invalidate caches, then cache the new attributes.
14345f4fc069Sjilinxpd  */
14355f4fc069Sjilinxpd /* ARGSUSED */
14365f4fc069Sjilinxpd static int
14375f4fc069Sjilinxpd smbfs_getattr(vnode_t *vp, struct vattr *vap, int flags, cred_t *cr,
14385f4fc069Sjilinxpd 	caller_context_t *ct)
14395f4fc069Sjilinxpd {
14405f4fc069Sjilinxpd 	smbnode_t *np;
14415f4fc069Sjilinxpd 	smbmntinfo_t *smi;
14425f4fc069Sjilinxpd 	int error;
14435f4fc069Sjilinxpd 
14445f4fc069Sjilinxpd 	smi = VTOSMI(vp);
14455f4fc069Sjilinxpd 
14465f4fc069Sjilinxpd 	if (curproc->p_zone != smi->smi_zone_ref.zref_zone)
14475f4fc069Sjilinxpd 		return (EIO);
14485f4fc069Sjilinxpd 
14495f4fc069Sjilinxpd 	if (smi->smi_flags & SMI_DEAD || vp->v_vfsp->vfs_flag & VFS_UNMOUNTED)
14505f4fc069Sjilinxpd 		return (EIO);
14515f4fc069Sjilinxpd 
14525f4fc069Sjilinxpd 	/*
14535f4fc069Sjilinxpd 	 * If it has been specified that the return value will
14545f4fc069Sjilinxpd 	 * just be used as a hint, and we are only being asked
14555f4fc069Sjilinxpd 	 * for size, fsid or rdevid, then return the client's
14565f4fc069Sjilinxpd 	 * notion of these values without checking to make sure
14575f4fc069Sjilinxpd 	 * that the attribute cache is up to date.
14585f4fc069Sjilinxpd 	 * The whole point is to avoid an over the wire GETATTR
14595f4fc069Sjilinxpd 	 * call.
14605f4fc069Sjilinxpd 	 */
14615f4fc069Sjilinxpd 	np = VTOSMB(vp);
14625f4fc069Sjilinxpd 	if (flags & ATTR_HINT) {
14635f4fc069Sjilinxpd 		if (vap->va_mask ==
14645f4fc069Sjilinxpd 		    (vap->va_mask & (AT_SIZE | AT_FSID | AT_RDEV))) {
14655f4fc069Sjilinxpd 			mutex_enter(&np->r_statelock);
14665f4fc069Sjilinxpd 			if (vap->va_mask & AT_SIZE)
14675f4fc069Sjilinxpd 				vap->va_size = np->r_size;
14685f4fc069Sjilinxpd 			if (vap->va_mask & AT_FSID)
14695f4fc069Sjilinxpd 				vap->va_fsid = vp->v_vfsp->vfs_dev;
14705f4fc069Sjilinxpd 			if (vap->va_mask & AT_RDEV)
14715f4fc069Sjilinxpd 				vap->va_rdev = vp->v_rdev;
14725f4fc069Sjilinxpd 			mutex_exit(&np->r_statelock);
14735f4fc069Sjilinxpd 			return (0);
14745f4fc069Sjilinxpd 		}
14755f4fc069Sjilinxpd 	}
14765f4fc069Sjilinxpd 
14775f4fc069Sjilinxpd 	/*
14785f4fc069Sjilinxpd 	 * Only need to flush pages if asking for the mtime
14795f4fc069Sjilinxpd 	 * and if there are any dirty pages.
14805f4fc069Sjilinxpd 	 *
14815f4fc069Sjilinxpd 	 * Here NFS also checks for async writes (np->r_awcount)
14825f4fc069Sjilinxpd 	 */
14835f4fc069Sjilinxpd 	if (vap->va_mask & AT_MTIME) {
14845f4fc069Sjilinxpd 		if (vn_has_cached_data(vp) &&
14855f4fc069Sjilinxpd 		    ((np->r_flags & RDIRTY) != 0)) {
14865f4fc069Sjilinxpd 			mutex_enter(&np->r_statelock);
14875f4fc069Sjilinxpd 			np->r_gcount++;
14885f4fc069Sjilinxpd 			mutex_exit(&np->r_statelock);
14895f4fc069Sjilinxpd 			error = smbfs_putpage(vp, (offset_t)0, 0, 0, cr, ct);
14905f4fc069Sjilinxpd 			mutex_enter(&np->r_statelock);
14915f4fc069Sjilinxpd 			if (error && (error == ENOSPC || error == EDQUOT)) {
14925f4fc069Sjilinxpd 				if (!np->r_error)
14935f4fc069Sjilinxpd 					np->r_error = error;
14945f4fc069Sjilinxpd 			}
14955f4fc069Sjilinxpd 			if (--np->r_gcount == 0)
14965f4fc069Sjilinxpd 				cv_broadcast(&np->r_cv);
14975f4fc069Sjilinxpd 			mutex_exit(&np->r_statelock);
14985f4fc069Sjilinxpd 		}
14995f4fc069Sjilinxpd 	}
15005f4fc069Sjilinxpd 
15015f4fc069Sjilinxpd 	return (smbfsgetattr(vp, vap, cr));
15025f4fc069Sjilinxpd }
15034bff34e3Sthurlow 
150402d09e03SGordon Ross /* smbfsgetattr() in smbfs_client.c */
15054bff34e3Sthurlow 
15064bff34e3Sthurlow /*ARGSUSED4*/
15074bff34e3Sthurlow static int
15084bff34e3Sthurlow smbfs_setattr(vnode_t *vp, struct vattr *vap, int flags, cred_t *cr,
15094bff34e3Sthurlow 		caller_context_t *ct)
15104bff34e3Sthurlow {
151102d09e03SGordon Ross 	vfs_t		*vfsp;
151202d09e03SGordon Ross 	smbmntinfo_t	*smi;
15134bff34e3Sthurlow 	int		error;
15144bff34e3Sthurlow 	uint_t		mask;
15154bff34e3Sthurlow 	struct vattr	oldva;
15164bff34e3Sthurlow 
151702d09e03SGordon Ross 	vfsp = vp->v_vfsp;
151802d09e03SGordon Ross 	smi = VFTOSMI(vfsp);
15194bff34e3Sthurlow 
1520a19609f8Sjv 	if (curproc->p_zone != smi->smi_zone_ref.zref_zone)
15214bff34e3Sthurlow 		return (EIO);
15224bff34e3Sthurlow 
152302d09e03SGordon Ross 	if (smi->smi_flags & SMI_DEAD || vfsp->vfs_flag & VFS_UNMOUNTED)
15244bff34e3Sthurlow 		return (EIO);
15254bff34e3Sthurlow 
15264bff34e3Sthurlow 	mask = vap->va_mask;
15274bff34e3Sthurlow 	if (mask & AT_NOSET)
15284bff34e3Sthurlow 		return (EINVAL);
15294bff34e3Sthurlow 
153002d09e03SGordon Ross 	if (vfsp->vfs_flag & VFS_RDONLY)
153102d09e03SGordon Ross 		return (EROFS);
153202d09e03SGordon Ross 
1533bd7c6f51SGordon Ross 	/*
1534bd7c6f51SGordon Ross 	 * This is a _local_ access check so that only the owner of
1535bd7c6f51SGordon Ross 	 * this mount can set attributes.  With ACLs enabled, the
1536bd7c6f51SGordon Ross 	 * file owner can be different from the mount owner, and we
1537bd7c6f51SGordon Ross 	 * need to check the _mount_ owner here.  See _access_rwx
1538bd7c6f51SGordon Ross 	 */
153902d09e03SGordon Ross 	bzero(&oldva, sizeof (oldva));
1540bd7c6f51SGordon Ross 	oldva.va_mask = AT_TYPE | AT_MODE;
15414bff34e3Sthurlow 	error = smbfsgetattr(vp, &oldva, cr);
15424bff34e3Sthurlow 	if (error)
15434bff34e3Sthurlow 		return (error);
1544bd7c6f51SGordon Ross 	oldva.va_mask |= AT_UID | AT_GID;
1545bd7c6f51SGordon Ross 	oldva.va_uid = smi->smi_uid;
1546bd7c6f51SGordon Ross 	oldva.va_gid = smi->smi_gid;
15474bff34e3Sthurlow 
15484bff34e3Sthurlow 	error = secpolicy_vnode_setattr(cr, vp, vap, &oldva, flags,
15494bff34e3Sthurlow 	    smbfs_accessx, vp);
15504bff34e3Sthurlow 	if (error)
15514bff34e3Sthurlow 		return (error);
15524bff34e3Sthurlow 
1553bd7c6f51SGordon Ross 	if (mask & (AT_UID | AT_GID)) {
1554bd7c6f51SGordon Ross 		if (smi->smi_flags & SMI_ACL)
1555bd7c6f51SGordon Ross 			error = smbfs_acl_setids(vp, vap, cr);
1556bd7c6f51SGordon Ross 		else
1557bd7c6f51SGordon Ross 			error = ENOSYS;
1558bd7c6f51SGordon Ross 		if (error != 0) {
1559bd7c6f51SGordon Ross 			SMBVDEBUG("error %d setting UID/GID on %s\n",
1560bd7c6f51SGordon Ross 			    error, VTOSMB(vp)->n_rpath);
1561bd7c6f51SGordon Ross 			/*
1562bd7c6f51SGordon Ross 			 * It might be more correct to return the
1563bd7c6f51SGordon Ross 			 * error here, but that causes complaints
1564bd7c6f51SGordon Ross 			 * when root extracts a cpio archive, etc.
1565bd7c6f51SGordon Ross 			 * So ignore this error, and go ahead with
1566bd7c6f51SGordon Ross 			 * the rest of the setattr work.
1567bd7c6f51SGordon Ross 			 */
1568bd7c6f51SGordon Ross 		}
1569bd7c6f51SGordon Ross 	}
1570bd7c6f51SGordon Ross 
15715f4fc069Sjilinxpd 	error = smbfssetattr(vp, vap, flags, cr);
15725f4fc069Sjilinxpd 
15735f4fc069Sjilinxpd #ifdef	SMBFS_VNEVENT
15745f4fc069Sjilinxpd 	if (error == 0 && (vap->va_mask & AT_SIZE) && vap->va_size == 0)
15755f4fc069Sjilinxpd 		vnevent_truncate(vp, ct);
15765f4fc069Sjilinxpd #endif
15775f4fc069Sjilinxpd 
15785f4fc069Sjilinxpd 	return (error);
15794bff34e3Sthurlow }
15804bff34e3Sthurlow 
15814bff34e3Sthurlow /*
15824bff34e3Sthurlow  * Mostly from Darwin smbfs_setattr()
15834bff34e3Sthurlow  * but then modified a lot.
15844bff34e3Sthurlow  */
15854bff34e3Sthurlow /* ARGSUSED */
15864bff34e3Sthurlow static int
15874bff34e3Sthurlow smbfssetattr(vnode_t *vp, struct vattr *vap, int flags, cred_t *cr)
15884bff34e3Sthurlow {
15894bff34e3Sthurlow 	int		error = 0;
15904bff34e3Sthurlow 	smbnode_t	*np = VTOSMB(vp);
1591adee6784SGordon Ross 	smbmntinfo_t	*smi = np->n_mount;
15924bff34e3Sthurlow 	uint_t		mask = vap->va_mask;
15934bff34e3Sthurlow 	struct timespec	*mtime, *atime;
15944bff34e3Sthurlow 	struct smb_cred	scred;
1595adee6784SGordon Ross 	int		modified = 0;
1596adee6784SGordon Ross 	smb_fh_t	*fid = NULL;
15974bff34e3Sthurlow 	uint32_t rights = 0;
159828162916SGordon Ross 	uint32_t dosattr = 0;
15994bff34e3Sthurlow 
1600a19609f8Sjv 	ASSERT(curproc->p_zone == VTOSMI(vp)->smi_zone_ref.zref_zone);
16014bff34e3Sthurlow 
160291d632c8Sgwr 	/*
160391d632c8Sgwr 	 * There are no settable attributes on the XATTR dir,
160491d632c8Sgwr 	 * so just silently ignore these.  On XATTR files,
160591d632c8Sgwr 	 * you can set the size but nothing else.
160691d632c8Sgwr 	 */
160791d632c8Sgwr 	if (vp->v_flag & V_XATTRDIR)
160891d632c8Sgwr 		return (0);
160991d632c8Sgwr 	if (np->n_flag & N_XATTR) {
161091d632c8Sgwr 		if (mask & AT_TIMES)
161191d632c8Sgwr 			SMBVDEBUG("ignore set time on xattr\n");
161291d632c8Sgwr 		mask &= AT_SIZE;
161391d632c8Sgwr 	}
161491d632c8Sgwr 
16155f4fc069Sjilinxpd 	/*
16165f4fc069Sjilinxpd 	 * Only need to flush pages if there are any pages and
16175f4fc069Sjilinxpd 	 * if the file is marked as dirty in some fashion.  The
16185f4fc069Sjilinxpd 	 * file must be flushed so that we can accurately
16195f4fc069Sjilinxpd 	 * determine the size of the file and the cached data
16205f4fc069Sjilinxpd 	 * after the SETATTR returns.  A file is considered to
16215f4fc069Sjilinxpd 	 * be dirty if it is either marked with RDIRTY, has
16225f4fc069Sjilinxpd 	 * outstanding i/o's active, or is mmap'd.  In this
16235f4fc069Sjilinxpd 	 * last case, we can't tell whether there are dirty
16245f4fc069Sjilinxpd 	 * pages, so we flush just to be sure.
16255f4fc069Sjilinxpd 	 */
16265f4fc069Sjilinxpd 	if (vn_has_cached_data(vp) &&
16275f4fc069Sjilinxpd 	    ((np->r_flags & RDIRTY) ||
16285f4fc069Sjilinxpd 	    np->r_count > 0 ||
16295f4fc069Sjilinxpd 	    np->r_mapcnt > 0)) {
16305f4fc069Sjilinxpd 		ASSERT(vp->v_type != VCHR);
16315f4fc069Sjilinxpd 		error = smbfs_putpage(vp, (offset_t)0, 0, 0, cr, NULL);
16325f4fc069Sjilinxpd 		if (error && (error == ENOSPC || error == EDQUOT)) {
16335f4fc069Sjilinxpd 			mutex_enter(&np->r_statelock);
16345f4fc069Sjilinxpd 			if (!np->r_error)
16355f4fc069Sjilinxpd 				np->r_error = error;
16365f4fc069Sjilinxpd 			mutex_exit(&np->r_statelock);
16375f4fc069Sjilinxpd 		}
16385f4fc069Sjilinxpd 	}
16395f4fc069Sjilinxpd 
16404bff34e3Sthurlow 	/*
16414bff34e3Sthurlow 	 * If our caller is trying to set multiple attributes, they
16424bff34e3Sthurlow 	 * can make no assumption about what order they are done in.
16434bff34e3Sthurlow 	 * Here we try to do them in order of decreasing likelihood
16444bff34e3Sthurlow 	 * of failure, just to minimize the chance we'll wind up
16454bff34e3Sthurlow 	 * with a partially complete request.
16464bff34e3Sthurlow 	 */
16474bff34e3Sthurlow 
1648613a2f6bSGordon Ross 	smb_credinit(&scred, cr);
16494bff34e3Sthurlow 
165028162916SGordon Ross 	/*
165128162916SGordon Ross 	 * If the caller has provided extensible attributes,
165228162916SGordon Ross 	 * map those into DOS attributes supported by SMB.
165328162916SGordon Ross 	 * Note: zero means "no change".
165428162916SGordon Ross 	 */
165528162916SGordon Ross 	if (mask & AT_XVATTR)
165628162916SGordon Ross 		dosattr = xvattr_to_dosattr(np, vap);
165728162916SGordon Ross 
16584bff34e3Sthurlow 	/*
16594bff34e3Sthurlow 	 * Will we need an open handle for this setattr?
16604bff34e3Sthurlow 	 * If so, what rights will we need?
16614bff34e3Sthurlow 	 */
166228162916SGordon Ross 	if (dosattr || (mask & (AT_ATIME | AT_MTIME))) {
16634bff34e3Sthurlow 		rights |=
166402d09e03SGordon Ross 		    SA_RIGHT_FILE_WRITE_ATTRIBUTES;
16654bff34e3Sthurlow 	}
16664bff34e3Sthurlow 	if (mask & AT_SIZE) {
16674bff34e3Sthurlow 		rights |=
16684bff34e3Sthurlow 		    SA_RIGHT_FILE_WRITE_DATA |
16694bff34e3Sthurlow 		    SA_RIGHT_FILE_APPEND_DATA;
167002d09e03SGordon Ross 	}
167102d09e03SGordon Ross 
167202d09e03SGordon Ross 	/*
167302d09e03SGordon Ross 	 * Only SIZE really requires a handle, but it's
167402d09e03SGordon Ross 	 * simpler and more reliable to set via a handle.
167502d09e03SGordon Ross 	 * Some servers like NT4 won't set times by path.
167602d09e03SGordon Ross 	 * Also, we're usually setting everything anyway.
167702d09e03SGordon Ross 	 */
167828162916SGordon Ross 	if (rights != 0) {
16794bff34e3Sthurlow 		error = smbfs_smb_tmpopen(np, rights, &scred, &fid);
16804bff34e3Sthurlow 		if (error) {
16814bff34e3Sthurlow 			SMBVDEBUG("error %d opening %s\n",
16824bff34e3Sthurlow 			    error, np->n_rpath);
16834bff34e3Sthurlow 			goto out;
16844bff34e3Sthurlow 		}
1685adee6784SGordon Ross 		ASSERT(fid != NULL);
16864bff34e3Sthurlow 	}
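	/*
	 * From here on, fid is non-NULL exactly when some
	 * attribute change (size, times, or DOS attributes)
	 * was requested; the ASSERTs below depend on that.
	 */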
16874bff34e3Sthurlow 
16884bff34e3Sthurlow 	/*
16894bff34e3Sthurlow 	 * If the server supports the UNIX extensions, right here is where
16904bff34e3Sthurlow 	 * we'd support changes to uid, gid, mode, and possibly va_flags.
16914bff34e3Sthurlow 	 * For now we claim to have made any such changes.
16924bff34e3Sthurlow 	 */
16934bff34e3Sthurlow 
16944bff34e3Sthurlow 	if (mask & AT_SIZE) {
16954bff34e3Sthurlow 		/*
16964bff34e3Sthurlow 		 * If the new file size is less than what the client sees as
16974bff34e3Sthurlow 		 * the file size, then just change the size and invalidate
16984bff34e3Sthurlow 		 * the pages.
16994bff34e3Sthurlow 		 */
17004bff34e3Sthurlow 
17014bff34e3Sthurlow 		/*
17024bff34e3Sthurlow 		 * Set the file size to vap->va_size.
17034bff34e3Sthurlow 		 */
1704adee6784SGordon Ross 		ASSERT(fid != NULL);
1705adee6784SGordon Ross 		error = smbfs_smb_setfsize(smi->smi_share, fid,
1706adee6784SGordon Ross 		    vap->va_size, &scred);
17074bff34e3Sthurlow 		if (error) {
17084bff34e3Sthurlow 			SMBVDEBUG("setsize error %d file %s\n",
17094bff34e3Sthurlow 			    error, np->n_rpath);
17104bff34e3Sthurlow 		} else {
17114bff34e3Sthurlow 			/*
17124bff34e3Sthurlow 			 * Darwin had code here to zero-extend.
17134bff34e3Sthurlow 			 * Tests indicate the server will zero-fill,
17145f4fc069Sjilinxpd 			 * so it looks like we don't need to do that.
17154bff34e3Sthurlow 			 */
17164bff34e3Sthurlow 			mutex_enter(&np->r_statelock);
17174bff34e3Sthurlow 			np->r_size = vap->va_size;
1718adee6784SGordon Ross 			np->n_flag |= (NFLUSHWIRE | NATTRCHANGED);
17194bff34e3Sthurlow 			mutex_exit(&np->r_statelock);
17204bff34e3Sthurlow 			modified = 1;
17214bff34e3Sthurlow 		}
17224bff34e3Sthurlow 	}
17234bff34e3Sthurlow 
17244bff34e3Sthurlow 	/*
17255f4fc069Sjilinxpd 	 * Todo: Implement setting create_time (which is
17265f4fc069Sjilinxpd 	 * different from ctime).
17274bff34e3Sthurlow 	 */
17284bff34e3Sthurlow 	mtime = ((mask & AT_MTIME) ? &vap->va_mtime : 0);
17294bff34e3Sthurlow 	atime = ((mask & AT_ATIME) ? &vap->va_atime : 0);
17304bff34e3Sthurlow 
173128162916SGordon Ross 	if (dosattr || mtime || atime) {
17324bff34e3Sthurlow 		/*
173302d09e03SGordon Ross 		 * Always use the handle-based set attr call now.
17344bff34e3Sthurlow 		 */
1735adee6784SGordon Ross 		ASSERT(fid != NULL);
1736adee6784SGordon Ross 		error = smbfs_smb_setfattr(smi->smi_share, fid,
173728162916SGordon Ross 		    dosattr, mtime, atime, &scred);
17384bff34e3Sthurlow 		if (error) {
17394bff34e3Sthurlow 			SMBVDEBUG("set times error %d file %s\n",
17404bff34e3Sthurlow 			    error, np->n_rpath);
17414bff34e3Sthurlow 		} else {
17424bff34e3Sthurlow 			modified = 1;
17434bff34e3Sthurlow 		}
17444bff34e3Sthurlow 	}
17454bff34e3Sthurlow 
17464bff34e3Sthurlow out:
1747adee6784SGordon Ross 	if (fid != NULL)
1748adee6784SGordon Ross 		smbfs_smb_tmpclose(np, fid);
17494bff34e3Sthurlow 
17504bff34e3Sthurlow 	smb_credrele(&scred);
17514bff34e3Sthurlow 
17525f4fc069Sjilinxpd 	if (modified) {
17535f4fc069Sjilinxpd 		/*
17545f4fc069Sjilinxpd 		 * Invalidate attribute cache in case the server
17555f4fc069Sjilinxpd 		 * doesn't set exactly the attributes we asked.
17565f4fc069Sjilinxpd 		 */
17575f4fc069Sjilinxpd 		smbfs_attrcache_remove(np);
17585f4fc069Sjilinxpd 
17595f4fc069Sjilinxpd 		/*
17605f4fc069Sjilinxpd 		 * If changing the size of the file, invalidate
17615f4fc069Sjilinxpd 		 * any local cached data which is no longer part
17625f4fc069Sjilinxpd 		 * of the file.  We also possibly invalidate the
17635f4fc069Sjilinxpd 		 * last page in the file.  We could use
17645f4fc069Sjilinxpd 		 * pvn_vpzero(), but this would mark the page as
17655f4fc069Sjilinxpd 		 * modified and require it to be written back to
17665f4fc069Sjilinxpd 		 * the server for no particularly good reason.
17675f4fc069Sjilinxpd 		 * This way, if we access it, then we bring it
17685f4fc069Sjilinxpd 		 * back in.  A read should be cheaper than a
17695f4fc069Sjilinxpd 		 * write.
17705f4fc069Sjilinxpd 		 */
17715f4fc069Sjilinxpd 		if (mask & AT_SIZE) {
17725f4fc069Sjilinxpd 			smbfs_invalidate_pages(vp,
17735f4fc069Sjilinxpd 			    (vap->va_size & PAGEMASK), cr);
17745f4fc069Sjilinxpd 		}
17755f4fc069Sjilinxpd 	}
17765f4fc069Sjilinxpd 
17774bff34e3Sthurlow 	return (error);
17784bff34e3Sthurlow }
17794bff34e3Sthurlow 
178028162916SGordon Ross /*
178128162916SGordon Ross  * Helper function for extensible system attributes (PSARC 2007/315)
178228162916SGordon Ross  * Compute the DOS attribute word to pass to _setfattr (see above).
178328162916SGordon Ross  * This returns zero IFF no change is being made to attributes.
178428162916SGordon Ross  * Otherwise return the new attributes or SMB_EFA_NORMAL.
178528162916SGordon Ross  */
178628162916SGordon Ross static uint32_t
178728162916SGordon Ross xvattr_to_dosattr(smbnode_t *np, struct vattr *vap)
178828162916SGordon Ross {
178928162916SGordon Ross 	xvattr_t *xvap = (xvattr_t *)vap;
179028162916SGordon Ross 	xoptattr_t *xoap = NULL;
179128162916SGordon Ross 	uint32_t attr = np->r_attr.fa_attr;
179228162916SGordon Ross 	boolean_t anyset = B_FALSE;
179328162916SGordon Ross 
179428162916SGordon Ross 	if ((xoap = xva_getxoptattr(xvap)) == NULL)
179528162916SGordon Ross 		return (0);
179628162916SGordon Ross 
179728162916SGordon Ross 	if (XVA_ISSET_REQ(xvap, XAT_ARCHIVE)) {
179828162916SGordon Ross 		if (xoap->xoa_archive)
179928162916SGordon Ross 			attr |= SMB_FA_ARCHIVE;
180028162916SGordon Ross 		else
180128162916SGordon Ross 			attr &= ~SMB_FA_ARCHIVE;
180228162916SGordon Ross 		XVA_SET_RTN(xvap, XAT_ARCHIVE);
180328162916SGordon Ross 		anyset = B_TRUE;
180428162916SGordon Ross 	}
180528162916SGordon Ross 	if (XVA_ISSET_REQ(xvap, XAT_SYSTEM)) {
180628162916SGordon Ross 		if (xoap->xoa_system)
180728162916SGordon Ross 			attr |= SMB_FA_SYSTEM;
180828162916SGordon Ross 		else
180928162916SGordon Ross 			attr &= ~SMB_FA_SYSTEM;
181028162916SGordon Ross 		XVA_SET_RTN(xvap, XAT_SYSTEM);
181128162916SGordon Ross 		anyset = B_TRUE;
181228162916SGordon Ross 	}
181328162916SGordon Ross 	if (XVA_ISSET_REQ(xvap, XAT_READONLY)) {
181428162916SGordon Ross 		if (xoap->xoa_readonly)
181528162916SGordon Ross 			attr |= SMB_FA_RDONLY;
181628162916SGordon Ross 		else
181728162916SGordon Ross 			attr &= ~SMB_FA_RDONLY;
181828162916SGordon Ross 		XVA_SET_RTN(xvap, XAT_READONLY);
181928162916SGordon Ross 		anyset = B_TRUE;
182028162916SGordon Ross 	}
182128162916SGordon Ross 	if (XVA_ISSET_REQ(xvap, XAT_HIDDEN)) {
182228162916SGordon Ross 		if (xoap->xoa_hidden)
182328162916SGordon Ross 			attr |= SMB_FA_HIDDEN;
182428162916SGordon Ross 		else
182528162916SGordon Ross 			attr &= ~SMB_FA_HIDDEN;
182628162916SGordon Ross 		XVA_SET_RTN(xvap, XAT_HIDDEN);
182728162916SGordon Ross 		anyset = B_TRUE;
182828162916SGordon Ross 	}
182928162916SGordon Ross 
183028162916SGordon Ross 	if (anyset == B_FALSE)
183128162916SGordon Ross 		return (0);	/* no change */
183228162916SGordon Ross 	if (attr == 0)
183328162916SGordon Ross 		attr = SMB_EFA_NORMAL;
183428162916SGordon Ross 
183528162916SGordon Ross 	return (attr);
183628162916SGordon Ross }
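
/*
 * Illustrative example: if a node's current fa_attr is just
 * SMB_FA_ARCHIVE and the caller requests XAT_READONLY=1, this
 * returns SMB_FA_ARCHIVE|SMB_FA_RDONLY.  Clearing the last
 * remaining bit returns SMB_EFA_NORMAL rather than zero,
 * because zero means "no change" to the caller.
 */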
183728162916SGordon Ross 
18384bff34e3Sthurlow /*
18394bff34e3Sthurlow  * smbfs_access_rwx()
18404bff34e3Sthurlow  * Common function for smbfs_access, etc.
18414bff34e3Sthurlow  *
18424bff34e3Sthurlow  * The security model implemented by the FS is unusual
1843bd7c6f51SGordon Ross  * due to the current "single user mounts" restriction:
18444bff34e3Sthurlow  * All access under a given mount point uses the CIFS
18454bff34e3Sthurlow  * credentials established by the owner of the mount.
18464bff34e3Sthurlow  *
18474bff34e3Sthurlow  * Most access checking is handled by the CIFS server,
18484bff34e3Sthurlow  * but we need sufficient Unix access checks here to
18494bff34e3Sthurlow  * prevent other local Unix users from having access
18504bff34e3Sthurlow  * to objects under this mount that the uid/gid/mode
18514bff34e3Sthurlow  * settings in the mount would not allow.
18524bff34e3Sthurlow  *
18534bff34e3Sthurlow  * With this model, there is a case where we need the
18544bff34e3Sthurlow  * ability to do an access check before we have the
18554bff34e3Sthurlow  * vnode for an object.  This function takes advantage
18564bff34e3Sthurlow  * of the fact that the uid/gid/mode is per mount, and
18574bff34e3Sthurlow  * avoids the need for a vnode.
18584bff34e3Sthurlow  *
18594bff34e3Sthurlow  * We still (sort of) need a vnode when we call
18604bff34e3Sthurlow  * secpolicy_vnode_access, but that only uses
18614bff34e3Sthurlow  * the vtype field, so we can use a pair of fake
18624bff34e3Sthurlow  * vnodes that have only v_type filled in.
18634bff34e3Sthurlow  */
18644bff34e3Sthurlow static int
18654bff34e3Sthurlow smbfs_access_rwx(vfs_t *vfsp, int vtype, int mode, cred_t *cr)
18664bff34e3Sthurlow {
18674bff34e3Sthurlow 	/* See the secpolicy call below. */
18684bff34e3Sthurlow 	static const vnode_t tmpl_vdir = { .v_type = VDIR };
18694bff34e3Sthurlow 	static const vnode_t tmpl_vreg = { .v_type = VREG };
18704bff34e3Sthurlow 	vattr_t		va;
18714bff34e3Sthurlow 	vnode_t		*tvp;
18724bff34e3Sthurlow 	struct smbmntinfo *smi = VFTOSMI(vfsp);
18734bff34e3Sthurlow 	int shift = 0;
18744bff34e3Sthurlow 
18754bff34e3Sthurlow 	/*
18764bff34e3Sthurlow 	 * Build our (fabricated) vnode attributes.
18774bff34e3Sthurlow 	 */
18784bff34e3Sthurlow 	bzero(&va, sizeof (va));
18794bff34e3Sthurlow 	va.va_mask = AT_TYPE | AT_MODE | AT_UID | AT_GID;
18804bff34e3Sthurlow 	va.va_type = vtype;
18814bff34e3Sthurlow 	va.va_mode = (vtype == VDIR) ?
188202d09e03SGordon Ross 	    smi->smi_dmode : smi->smi_fmode;
188302d09e03SGordon Ross 	va.va_uid = smi->smi_uid;
188402d09e03SGordon Ross 	va.va_gid = smi->smi_gid;
18854bff34e3Sthurlow 
18864bff34e3Sthurlow 	/*
18874bff34e3Sthurlow 	 * Disallow write attempts on read-only file systems,
18884bff34e3Sthurlow 	 * unless the file is a device or fifo node.  Note:
18894bff34e3Sthurlow 	 * Inline vn_is_readonly and IS_DEVVP here because
18904bff34e3Sthurlow 	 * we may not have a vnode ptr.  Original expr. was:
18914bff34e3Sthurlow 	 * (mode & VWRITE) && vn_is_readonly(vp) && !IS_DEVVP(vp))
18924bff34e3Sthurlow 	 */
18934bff34e3Sthurlow 	if ((mode & VWRITE) &&
18944bff34e3Sthurlow 	    (vfsp->vfs_flag & VFS_RDONLY) &&
18954bff34e3Sthurlow 	    !(vtype == VCHR || vtype == VBLK || vtype == VFIFO))
18964bff34e3Sthurlow 		return (EROFS);
18974bff34e3Sthurlow 
18984bff34e3Sthurlow 	/*
18994bff34e3Sthurlow 	 * Disallow attempts to access mandatory lock files.
19004bff34e3Sthurlow 	 * Similarly, expand MANDLOCK here.
19014bff34e3Sthurlow 	 */
19024bff34e3Sthurlow 	if ((mode & (VWRITE | VREAD | VEXEC)) &&
19034bff34e3Sthurlow 	    va.va_type == VREG && MANDMODE(va.va_mode))
19044bff34e3Sthurlow 		return (EACCES);
19054bff34e3Sthurlow 
19064bff34e3Sthurlow 	/*
19074bff34e3Sthurlow 	 * Access check is based on only
19084bff34e3Sthurlow 	 * one of owner, group, public.
19094bff34e3Sthurlow 	 * If not owner, then check group.
19104bff34e3Sthurlow 	 * If not a member of the group,
19114bff34e3Sthurlow 	 * then check public access.
19124bff34e3Sthurlow 	 */
19134bff34e3Sthurlow 	if (crgetuid(cr) != va.va_uid) {
19144bff34e3Sthurlow 		shift += 3;
19154bff34e3Sthurlow 		if (!groupmember(va.va_gid, cr))
19164bff34e3Sthurlow 			shift += 3;
19174bff34e3Sthurlow 	}
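	/*
	 * The shift (0, 3, or 6 bits) moves the group or "other"
	 * rwx triple into the owner position before va_mode is
	 * handed to secpolicy_vnode_access2() below.
	 */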
19184bff34e3Sthurlow 
19194bff34e3Sthurlow 	/*
19204bff34e3Sthurlow 	 * We need a vnode for secpolicy_vnode_access,
19214bff34e3Sthurlow 	 * but the only thing it looks at is v_type,
19224bff34e3Sthurlow 	 * so pass one of the templates above.
19234bff34e3Sthurlow 	 */
19244bff34e3Sthurlow 	tvp = (va.va_type == VDIR) ?
19254bff34e3Sthurlow 	    (vnode_t *)&tmpl_vdir :
19264bff34e3Sthurlow 	    (vnode_t *)&tmpl_vreg;
1927134a1f4eSCasper H.S. Dik 
1928134a1f4eSCasper H.S. Dik 	return (secpolicy_vnode_access2(cr, tvp, va.va_uid,
1929134a1f4eSCasper H.S. Dik 	    va.va_mode << shift, mode));
19304bff34e3Sthurlow }
19314bff34e3Sthurlow 
19324bff34e3Sthurlow /*
19334bff34e3Sthurlow  * See smbfs_setattr
19344bff34e3Sthurlow  */
19354bff34e3Sthurlow static int
19364bff34e3Sthurlow smbfs_accessx(void *arg, int mode, cred_t *cr)
19374bff34e3Sthurlow {
19384bff34e3Sthurlow 	vnode_t *vp = arg;
19394bff34e3Sthurlow 	/*
19404bff34e3Sthurlow 	 * Note: The caller has checked the current zone,
19414bff34e3Sthurlow 	 * the SMI_DEAD and VFS_UNMOUNTED flags, etc.
19424bff34e3Sthurlow 	 */
19434bff34e3Sthurlow 	return (smbfs_access_rwx(vp->v_vfsp, vp->v_type, mode, cr));
19444bff34e3Sthurlow }
19454bff34e3Sthurlow 
19464bff34e3Sthurlow /*
19474bff34e3Sthurlow  * XXX
19484bff34e3Sthurlow  * This op should support PSARC 2007/403, Modified Access Checks for CIFS
19494bff34e3Sthurlow  */
19504bff34e3Sthurlow /* ARGSUSED */
19514bff34e3Sthurlow static int
19524bff34e3Sthurlow smbfs_access(vnode_t *vp, int mode, int flags, cred_t *cr, caller_context_t *ct)
19534bff34e3Sthurlow {
19544bff34e3Sthurlow 	vfs_t		*vfsp;
19554bff34e3Sthurlow 	smbmntinfo_t	*smi;
19564bff34e3Sthurlow 
19574bff34e3Sthurlow 	vfsp = vp->v_vfsp;
19584bff34e3Sthurlow 	smi = VFTOSMI(vfsp);
19594bff34e3Sthurlow 
1960a19609f8Sjv 	if (curproc->p_zone != smi->smi_zone_ref.zref_zone)
19614bff34e3Sthurlow 		return (EIO);
19624bff34e3Sthurlow 
19634bff34e3Sthurlow 	if (smi->smi_flags & SMI_DEAD || vfsp->vfs_flag & VFS_UNMOUNTED)
19644bff34e3Sthurlow 		return (EIO);
19654bff34e3Sthurlow 
19664bff34e3Sthurlow 	return (smbfs_access_rwx(vfsp, vp->v_type, mode, cr));
19674bff34e3Sthurlow }
19684bff34e3Sthurlow 
19694bff34e3Sthurlow 
19705f4fc069Sjilinxpd /* ARGSUSED */
19715f4fc069Sjilinxpd static int
19725f4fc069Sjilinxpd smbfs_readlink(vnode_t *vp, struct uio *uiop, cred_t *cr, caller_context_t *ct)
19735f4fc069Sjilinxpd {
19745f4fc069Sjilinxpd 	/* Not yet... */
19755f4fc069Sjilinxpd 	return (ENOSYS);
19765f4fc069Sjilinxpd }
19775f4fc069Sjilinxpd 
19785f4fc069Sjilinxpd 
19794bff34e3Sthurlow /*
19804bff34e3Sthurlow  * Flush local dirty pages to stable storage on the server.
19814bff34e3Sthurlow  *
19824bff34e3Sthurlow  * If FNODSYNC is specified, then there is nothing to do because
19834bff34e3Sthurlow  * metadata changes are not cached on the client before being
19844bff34e3Sthurlow  * sent to the server.
19854bff34e3Sthurlow  */
19864bff34e3Sthurlow /* ARGSUSED */
19874bff34e3Sthurlow static int
19884bff34e3Sthurlow smbfs_fsync(vnode_t *vp, int syncflag, cred_t *cr, caller_context_t *ct)
19894bff34e3Sthurlow {
19904bff34e3Sthurlow 	int		error = 0;
19914bff34e3Sthurlow 	smbmntinfo_t	*smi;
19925f4fc069Sjilinxpd 	smbnode_t	*np;
19932f5e3e91SGordon Ross 	struct smb_cred scred;
19944bff34e3Sthurlow 
19952f5e3e91SGordon Ross 	np = VTOSMB(vp);
19964bff34e3Sthurlow 	smi = VTOSMI(vp);
19974bff34e3Sthurlow 
1998a19609f8Sjv 	if (curproc->p_zone != smi->smi_zone_ref.zref_zone)
19994bff34e3Sthurlow 		return (EIO);
20004bff34e3Sthurlow 
20014bff34e3Sthurlow 	if (smi->smi_flags & SMI_DEAD || vp->v_vfsp->vfs_flag & VFS_UNMOUNTED)
20024bff34e3Sthurlow 		return (EIO);
20034bff34e3Sthurlow 
20044bff34e3Sthurlow 	if ((syncflag & FNODSYNC) || IS_SWAPVP(vp))
20054bff34e3Sthurlow 		return (0);
20064bff34e3Sthurlow 
20072f5e3e91SGordon Ross 	if ((syncflag & (FSYNC|FDSYNC)) == 0)
20082f5e3e91SGordon Ross 		return (0);
20092f5e3e91SGordon Ross 
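	/* Push dirty pages to the server, then flush the file handle. */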
20105f4fc069Sjilinxpd 	error = smbfs_putpage(vp, (offset_t)0, 0, 0, cr, ct);
20115f4fc069Sjilinxpd 	if (error)
20125f4fc069Sjilinxpd 		return (error);
20135f4fc069Sjilinxpd 
20142f5e3e91SGordon Ross 	/* Shared lock for n_fid use in _flush */
20152f5e3e91SGordon Ross 	if (smbfs_rw_enter_sig(&np->r_lkserlock, RW_READER, SMBINTR(vp)))
20162f5e3e91SGordon Ross 		return (EINTR);
2017613a2f6bSGordon Ross 	smb_credinit(&scred, cr);
20182f5e3e91SGordon Ross 
2019adee6784SGordon Ross 	error = smbfsflush(np, &scred);
20202f5e3e91SGordon Ross 
20212f5e3e91SGordon Ross 	smb_credrele(&scred);
20222f5e3e91SGordon Ross 	smbfs_rw_exit(&np->r_lkserlock);
20232f5e3e91SGordon Ross 
20244bff34e3Sthurlow 	return (error);
20254bff34e3Sthurlow }
20264bff34e3Sthurlow 
2027adee6784SGordon Ross static int
2028adee6784SGordon Ross smbfsflush(smbnode_t *np, struct smb_cred *scrp)
2029adee6784SGordon Ross {
2030adee6784SGordon Ross 	struct smb_share *ssp = np->n_mount->smi_share;
2031adee6784SGordon Ross 	smb_fh_t *fhp;
2032adee6784SGordon Ross 	int error;
2033adee6784SGordon Ross 
2034adee6784SGordon Ross 	/* Shared lock for n_fid use below. */
2035adee6784SGordon Ross 	ASSERT(smbfs_rw_lock_held(&np->r_lkserlock, RW_READER));
2036adee6784SGordon Ross 
2037adee6784SGordon Ross 	if (!(np->n_flag & NFLUSHWIRE))
2038adee6784SGordon Ross 		return (0);
2039adee6784SGordon Ross 	if (np->n_fidrefs == 0)
2040adee6784SGordon Ross 		return (0); /* not open */
2041adee6784SGordon Ross 	if ((fhp = np->n_fid) == NULL)
2042adee6784SGordon Ross 		return (0);
2043adee6784SGordon Ross 
2044adee6784SGordon Ross 	/* After reconnect, n_fid is invalid */
2045adee6784SGordon Ross 	if (fhp->fh_vcgenid != ssp->ss_vcgenid)
2046adee6784SGordon Ross 		return (ESTALE);
2047adee6784SGordon Ross 
2048adee6784SGordon Ross 	error = smbfs_smb_flush(ssp, fhp, scrp);
2049adee6784SGordon Ross 
2050adee6784SGordon Ross 	if (!error) {
2051adee6784SGordon Ross 		mutex_enter(&np->r_statelock);
2052adee6784SGordon Ross 		np->n_flag &= ~NFLUSHWIRE;
2053adee6784SGordon Ross 		mutex_exit(&np->r_statelock);
2054adee6784SGordon Ross 	}
2055adee6784SGordon Ross 	return (error);
2056adee6784SGordon Ross }
2057adee6784SGordon Ross 
20584bff34e3Sthurlow /*
20594bff34e3Sthurlow  * Last reference to vnode went away.
20604bff34e3Sthurlow  */
20614bff34e3Sthurlow /* ARGSUSED */
20624bff34e3Sthurlow static void
20634bff34e3Sthurlow smbfs_inactive(vnode_t *vp, cred_t *cr, caller_context_t *ct)
20644bff34e3Sthurlow {
206542d15982SGordon Ross 	struct smb_cred scred;
20665f4fc069Sjilinxpd 	smbnode_t	*np = VTOSMB(vp);
20675f4fc069Sjilinxpd 	int error;
20684bff34e3Sthurlow 
20694bff34e3Sthurlow 	/*
20704bff34e3Sthurlow 	 * Don't "bail out" for VFS_UNMOUNTED here,
20714bff34e3Sthurlow 	 * as we want to do cleanup, etc.
20724bff34e3Sthurlow 	 * See also pcfs_inactive
20734bff34e3Sthurlow 	 */
20744bff34e3Sthurlow 
20754bff34e3Sthurlow 	/*
20764bff34e3Sthurlow 	 * If this is coming from the wrong zone, we let someone in the right
20774bff34e3Sthurlow 	 * zone take care of it asynchronously.  We can get here due to
20784bff34e3Sthurlow 	 * VN_RELE() being called from pageout() or fsflush().  This call may
20794bff34e3Sthurlow 	 * potentially turn into an expensive no-op if, for instance, v_count
20804bff34e3Sthurlow 	 * gets incremented in the meantime, but it's still correct.
20814bff34e3Sthurlow 	 */
20824bff34e3Sthurlow 
20835f4fc069Sjilinxpd 	/*
20845f4fc069Sjilinxpd 	 * From NFS:rinactive()
20855f4fc069Sjilinxpd 	 *
20865f4fc069Sjilinxpd 	 * Before freeing anything, wait until all asynchronous
20875f4fc069Sjilinxpd 	 * activity is done on this rnode.  This will allow all
20885f4fc069Sjilinxpd 	 * asynchronous read ahead and write behind i/o's to
20895f4fc069Sjilinxpd 	 * finish.
20905f4fc069Sjilinxpd 	 */
20915f4fc069Sjilinxpd 	mutex_enter(&np->r_statelock);
20925f4fc069Sjilinxpd 	while (np->r_count > 0)
20935f4fc069Sjilinxpd 		cv_wait(&np->r_cv, &np->r_statelock);
20945f4fc069Sjilinxpd 	mutex_exit(&np->r_statelock);
20955f4fc069Sjilinxpd 
20965f4fc069Sjilinxpd 	/*
20975f4fc069Sjilinxpd 	 * Flush and invalidate all pages associated with the vnode.
20985f4fc069Sjilinxpd 	 */
20995f4fc069Sjilinxpd 	if (vn_has_cached_data(vp)) {
21005f4fc069Sjilinxpd 		if ((np->r_flags & RDIRTY) && !np->r_error) {
21015f4fc069Sjilinxpd 			error = smbfs_putpage(vp, (u_offset_t)0, 0, 0, cr, ct);
21025f4fc069Sjilinxpd 			if (error && (error == ENOSPC || error == EDQUOT)) {
21035f4fc069Sjilinxpd 				mutex_enter(&np->r_statelock);
21045f4fc069Sjilinxpd 				if (!np->r_error)
21055f4fc069Sjilinxpd 					np->r_error = error;
21065f4fc069Sjilinxpd 				mutex_exit(&np->r_statelock);
21075f4fc069Sjilinxpd 			}
21085f4fc069Sjilinxpd 		}
21095f4fc069Sjilinxpd 		smbfs_invalidate_pages(vp, (u_offset_t)0, cr);
21105f4fc069Sjilinxpd 	}
21115f4fc069Sjilinxpd 	/*
21125f4fc069Sjilinxpd 	 * This vnode should have lost all cached data.
21135f4fc069Sjilinxpd 	 */
21145f4fc069Sjilinxpd 	ASSERT(vn_has_cached_data(vp) == 0);
21155f4fc069Sjilinxpd 
21164bff34e3Sthurlow 	/*
211742d15982SGordon Ross 	 * Defend against the possibility that higher-level callers
211842d15982SGordon Ross 	 * might not correctly balance open and close calls.  If we
211942d15982SGordon Ross 	 * get here with open references remaining, it means there
212042d15982SGordon Ross 	 * was a missing VOP_CLOSE somewhere.  If that happens, do
212142d15982SGordon Ross 	 * the close here so we don't "leak" FIDs on the server.
21224bff34e3Sthurlow 	 *
212342d15982SGordon Ross 	 * Exclusive lock for modifying n_fid stuff.
212442d15982SGordon Ross 	 * Don't want this one ever interruptible.
21254bff34e3Sthurlow 	 */
212642d15982SGordon Ross 	(void) smbfs_rw_enter_sig(&np->r_lkserlock, RW_WRITER, 0);
212742d15982SGordon Ross 	smb_credinit(&scred, cr);
212842d15982SGordon Ross 
212942d15982SGordon Ross 	switch (np->n_ovtype) {
213042d15982SGordon Ross 	case VNON:
213142d15982SGordon Ross 		/* not open (OK) */
213242d15982SGordon Ross 		break;
213342d15982SGordon Ross 
213442d15982SGordon Ross 	case VDIR:
213542d15982SGordon Ross 		if (np->n_dirrefs == 0)
213642d15982SGordon Ross 			break;
213742d15982SGordon Ross 		SMBVDEBUG("open dir: refs %d path %s\n",
213842d15982SGordon Ross 		    np->n_dirrefs, np->n_rpath);
213942d15982SGordon Ross 		/* Force last close. */
214042d15982SGordon Ross 		np->n_dirrefs = 1;
214142d15982SGordon Ross 		smbfs_rele_fid(np, &scred);
214242d15982SGordon Ross 		break;
214342d15982SGordon Ross 
214442d15982SGordon Ross 	case VREG:
214542d15982SGordon Ross 		if (np->n_fidrefs == 0)
214642d15982SGordon Ross 			break;
2147adee6784SGordon Ross 		SMBVDEBUG("open file: refs %d path %s\n",
2148adee6784SGordon Ross 		    np->n_fidrefs, np->n_rpath);
214942d15982SGordon Ross 		/* Force last close. */
215042d15982SGordon Ross 		np->n_fidrefs = 1;
215142d15982SGordon Ross 		smbfs_rele_fid(np, &scred);
215242d15982SGordon Ross 		break;
215342d15982SGordon Ross 
215442d15982SGordon Ross 	default:
215542d15982SGordon Ross 		SMBVDEBUG("bad n_ovtype %d\n", np->n_ovtype);
215642d15982SGordon Ross 		np->n_ovtype = VNON;
215742d15982SGordon Ross 		break;
21584bff34e3Sthurlow 	}
215942d15982SGordon Ross 
216042d15982SGordon Ross 	smb_credrele(&scred);
216142d15982SGordon Ross 	smbfs_rw_exit(&np->r_lkserlock);
21624bff34e3Sthurlow 
2163ff1e230cSjilinxpd 	/*
2164ff1e230cSjilinxpd 	 * XATTR directories (and the files under them) have
2165ff1e230cSjilinxpd 	 * little value for reclaim, so just remove them from
2166ff1e230cSjilinxpd 	 * the "hash" (AVL) as soon as they go inactive.
2167ff1e230cSjilinxpd 	 * Note that the node may already have been removed
2168ff1e230cSjilinxpd 	 * from the hash by smbfsremove.
2169ff1e230cSjilinxpd 	 */
2170ff1e230cSjilinxpd 	if ((np->n_flag & N_XATTR) != 0 &&
2171ff1e230cSjilinxpd 	    (np->r_flags & RHASHED) != 0)
2172ff1e230cSjilinxpd 		smbfs_rmhash(np);
2173ff1e230cSjilinxpd 
217402d09e03SGordon Ross 	smbfs_addfree(np);
21754bff34e3Sthurlow }
21764bff34e3Sthurlow 
21774bff34e3Sthurlow /*
21784bff34e3Sthurlow  * Remote file system operations having to do with directory manipulation.
21794bff34e3Sthurlow  */
21804bff34e3Sthurlow /* ARGSUSED */
21814bff34e3Sthurlow static int
21824bff34e3Sthurlow smbfs_lookup(vnode_t *dvp, char *nm, vnode_t **vpp, struct pathname *pnp,
21834bff34e3Sthurlow 	int flags, vnode_t *rdir, cred_t *cr, caller_context_t *ct,
21844bff34e3Sthurlow 	int *direntflags, pathname_t *realpnp)
21854bff34e3Sthurlow {
218691d632c8Sgwr 	vfs_t		*vfs;
21874bff34e3Sthurlow 	smbmntinfo_t	*smi;
218891d632c8Sgwr 	smbnode_t	*dnp;
218991d632c8Sgwr 	int		error;
21904bff34e3Sthurlow 
219191d632c8Sgwr 	vfs = dvp->v_vfsp;
219291d632c8Sgwr 	smi = VFTOSMI(vfs);
21934bff34e3Sthurlow 
2194a19609f8Sjv 	if (curproc->p_zone != smi->smi_zone_ref.zref_zone)
21954bff34e3Sthurlow 		return (EPERM);
21964bff34e3Sthurlow 
219791d632c8Sgwr 	if (smi->smi_flags & SMI_DEAD || vfs->vfs_flag & VFS_UNMOUNTED)
21984bff34e3Sthurlow 		return (EIO);
21994bff34e3Sthurlow 
22004bff34e3Sthurlow 	dnp = VTOSMB(dvp);
220191d632c8Sgwr 
220291d632c8Sgwr 	/*
220391d632c8Sgwr 	 * Are we looking up extended attributes?  If so, "dvp" is
220491d632c8Sgwr 	 * the file or directory for which we want attributes, and
220591d632c8Sgwr 	 * we need a lookup of the (faked up) attribute directory
220691d632c8Sgwr 	 * before we lookup the rest of the path.
220791d632c8Sgwr 	 */
220891d632c8Sgwr 	if (flags & LOOKUP_XATTR) {
220991d632c8Sgwr 		/*
221091d632c8Sgwr 		 * Require the xattr mount option.
221191d632c8Sgwr 		 */
221291d632c8Sgwr 		if ((vfs->vfs_flag & VFS_XATTR) == 0)
221391d632c8Sgwr 			return (EINVAL);
221491d632c8Sgwr 
221591d632c8Sgwr 		error = smbfs_get_xattrdir(dvp, vpp, cr, flags);
221691d632c8Sgwr 		return (error);
221791d632c8Sgwr 	}
221891d632c8Sgwr 
221902d09e03SGordon Ross 	if (smbfs_rw_enter_sig(&dnp->r_rwlock, RW_READER, SMBINTR(dvp)))
222002d09e03SGordon Ross 		return (EINTR);
22214bff34e3Sthurlow 
22224bff34e3Sthurlow 	error = smbfslookup(dvp, nm, vpp, cr, 1, ct);
22234bff34e3Sthurlow 
22244bff34e3Sthurlow 	smbfs_rw_exit(&dnp->r_rwlock);
22254bff34e3Sthurlow 
2226adee6784SGordon Ross 	/*
2227adee6784SGordon Ross 	 * If the caller passes an invalid name here, we'll have
2228adee6784SGordon Ross 	 * error == EINVAL but want to return ENOENT.  This is
2229adee6784SGordon Ross 	 * common with things like "ls foo*" with no matches.
2230adee6784SGordon Ross 	 */
2231adee6784SGordon Ross 	if (error == EINVAL)
2232adee6784SGordon Ross 		error = ENOENT;
2233adee6784SGordon Ross 
22344bff34e3Sthurlow 	return (error);
22354bff34e3Sthurlow }
22364bff34e3Sthurlow 
22374bff34e3Sthurlow /* ARGSUSED */
22384bff34e3Sthurlow static int
223902d09e03SGordon Ross smbfslookup(vnode_t *dvp, char *nm, vnode_t **vpp, cred_t *cr,
224002d09e03SGordon Ross 	int cache_ok, caller_context_t *ct)
22414bff34e3Sthurlow {
22424bff34e3Sthurlow 	int		error;
22434bff34e3Sthurlow 	int		supplen; /* supported length */
22444bff34e3Sthurlow 	vnode_t		*vp;
224502d09e03SGordon Ross 	smbnode_t	*np;
22464bff34e3Sthurlow 	smbnode_t	*dnp;
22474bff34e3Sthurlow 	smbmntinfo_t	*smi;
22484bff34e3Sthurlow 	/* struct smb_vc	*vcp; */
224991d632c8Sgwr 	const char	*ill;
22504bff34e3Sthurlow 	const char	*name = (const char *)nm;
22515f4fc069Sjilinxpd 	int		nmlen = strlen(nm);
22525f4fc069Sjilinxpd 	int		rplen;
22534bff34e3Sthurlow 	struct smb_cred scred;
22544bff34e3Sthurlow 	struct smbfattr fa;
22554bff34e3Sthurlow 
22564bff34e3Sthurlow 	smi = VTOSMI(dvp);
22574bff34e3Sthurlow 	dnp = VTOSMB(dvp);
22584bff34e3Sthurlow 
2259a19609f8Sjv 	ASSERT(curproc->p_zone == smi->smi_zone_ref.zref_zone);
22604bff34e3Sthurlow 
22614bff34e3Sthurlow 	supplen = 255;
22624bff34e3Sthurlow 
22634bff34e3Sthurlow 	/*
22644bff34e3Sthurlow 	 * RWlock must be held, either reader or writer.
22654bff34e3Sthurlow 	 */
22664bff34e3Sthurlow 	ASSERT(dnp->r_rwlock.count != 0);
22674bff34e3Sthurlow 
22684bff34e3Sthurlow 	/*
226902d09e03SGordon Ross 	 * If lookup is for "", just return dvp.
227002d09e03SGordon Ross 	 * No need to perform any access checks.
22714bff34e3Sthurlow 	 */
22724bff34e3Sthurlow 	if (nmlen == 0) {
22734bff34e3Sthurlow 		VN_HOLD(dvp);
22744bff34e3Sthurlow 		*vpp = dvp;
22754bff34e3Sthurlow 		return (0);
22764bff34e3Sthurlow 	}
22774bff34e3Sthurlow 
22784bff34e3Sthurlow 	/*
227991d632c8Sgwr 	 * Can't do lookups in non-directories.
22804bff34e3Sthurlow 	 */
22814bff34e3Sthurlow 	if (dvp->v_type != VDIR)
22824bff34e3Sthurlow 		return (ENOTDIR);
22834bff34e3Sthurlow 
228491d632c8Sgwr 	/*
228591d632c8Sgwr 	 * Need search permission in the directory.
228691d632c8Sgwr 	 */
22874bff34e3Sthurlow 	error = smbfs_access(dvp, VEXEC, 0, cr, ct);
22884bff34e3Sthurlow 	if (error)
22894bff34e3Sthurlow 		return (error);
22904bff34e3Sthurlow 
22914bff34e3Sthurlow 	/*
229202d09e03SGordon Ross 	 * If lookup is for ".", just return dvp.
229302d09e03SGordon Ross 	 * Access check was done above.
22944bff34e3Sthurlow 	 */
22954bff34e3Sthurlow 	if (nmlen == 1 && name[0] == '.') {
22964bff34e3Sthurlow 		VN_HOLD(dvp);
22974bff34e3Sthurlow 		*vpp = dvp;
22984bff34e3Sthurlow 		return (0);
22994bff34e3Sthurlow 	}
23004bff34e3Sthurlow 
23014bff34e3Sthurlow 	/*
230291d632c8Sgwr 	 * Now some sanity checks on the name.
230391d632c8Sgwr 	 * First check the length.
23044bff34e3Sthurlow 	 */
230591d632c8Sgwr 	if (nmlen > supplen)
230691d632c8Sgwr 		return (ENAMETOOLONG);
230791d632c8Sgwr 
230891d632c8Sgwr 	/*
230991d632c8Sgwr 	 * Avoid surprises with characters that are
231091d632c8Sgwr 	 * illegal in Windows file names.
23115f4fc069Sjilinxpd 	 * Todo: CATIA mappings?
231291d632c8Sgwr 	 */
231391d632c8Sgwr 	ill = illegal_chars;
231491d632c8Sgwr 	if (dnp->n_flag & N_XATTR)
231591d632c8Sgwr 		ill++; /* allow colon */
231691d632c8Sgwr 	if (strpbrk(nm, ill))
231791d632c8Sgwr 		return (EINVAL);
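	/*
	 * (The ill++ above assumes the colon is the first entry in
	 * illegal_chars, so names under the XATTR dir may contain
	 * a ':'.)
	 */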
231891d632c8Sgwr 
23194bff34e3Sthurlow 	/*
232002d09e03SGordon Ross 	 * Special handling for lookup of ".."
23214bff34e3Sthurlow 	 *
23224bff34e3Sthurlow 	 * We keep full pathnames (as seen on the server)
23234bff34e3Sthurlow 	 * so we can just trim off the last component to
23244bff34e3Sthurlow 	 * get the full pathname of the parent.  Note:
23254bff34e3Sthurlow 	 * We don't actually copy and modify, but just
23264bff34e3Sthurlow 	 * compute the trimmed length and pass that with
23274bff34e3Sthurlow 	 * the current dir path (not null terminated).
23284bff34e3Sthurlow 	 *
23294bff34e3Sthurlow 	 * We don't go over-the-wire to get attributes
23304bff34e3Sthurlow 	 * for ".." because we know it's a directory,
23314bff34e3Sthurlow 	 * and we can just leave the rest "stale"
23324bff34e3Sthurlow 	 * until someone does a getattr.
23334bff34e3Sthurlow 	 */
23344bff34e3Sthurlow 	if (nmlen == 2 && name[0] == '.' && name[1] == '.') {
23354bff34e3Sthurlow 		if (dvp->v_flag & VROOT) {
23364bff34e3Sthurlow 			/*
23374bff34e3Sthurlow 			 * Already at the root.  This can happen
23384bff34e3Sthurlow 			 * with directory listings at the root,
23394bff34e3Sthurlow 			 * which lookup "." and ".." to get the
23404bff34e3Sthurlow 			 * inode numbers.  Let ".." be the same
23414bff34e3Sthurlow 			 * as "." in the FS root.
23424bff34e3Sthurlow 			 */
23434bff34e3Sthurlow 			VN_HOLD(dvp);
23444bff34e3Sthurlow 			*vpp = dvp;
23454bff34e3Sthurlow 			return (0);
23464bff34e3Sthurlow 		}
23474bff34e3Sthurlow 
234891d632c8Sgwr 		/*
234991d632c8Sgwr 		 * Special case for XATTR directory
235091d632c8Sgwr 		 */
235191d632c8Sgwr 		if (dvp->v_flag & V_XATTRDIR) {
235291d632c8Sgwr 			error = smbfs_xa_parent(dvp, vpp);
235391d632c8Sgwr 			return (error);
235491d632c8Sgwr 		}
235591d632c8Sgwr 
23564bff34e3Sthurlow 		/*
23574bff34e3Sthurlow 		 * Find the parent path length.
23584bff34e3Sthurlow 		 */
23594bff34e3Sthurlow 		rplen = dnp->n_rplen;
23604bff34e3Sthurlow 		ASSERT(rplen > 0);
23614bff34e3Sthurlow 		while (--rplen >= 0) {
23624bff34e3Sthurlow 			if (dnp->n_rpath[rplen] == '\\')
23634bff34e3Sthurlow 				break;
23644bff34e3Sthurlow 		}
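		/*
		 * dnp->n_rpath[0 .. rplen-1] (length rplen, which
		 * excludes the '\\' found above) is now the
		 * parent's remote path.
		 */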
236502d09e03SGordon Ross 		if (rplen <= 0) {
23664bff34e3Sthurlow 			/* Found our way to the root. */
23674bff34e3Sthurlow 			vp = SMBTOV(smi->smi_root);
23684bff34e3Sthurlow 			VN_HOLD(vp);
23694bff34e3Sthurlow 			*vpp = vp;
23704bff34e3Sthurlow 			return (0);
23714bff34e3Sthurlow 		}
237202d09e03SGordon Ross 		np = smbfs_node_findcreate(smi,
237302d09e03SGordon Ross 		    dnp->n_rpath, rplen, NULL, 0, 0,
237402d09e03SGordon Ross 		    &smbfs_fattr0); /* force create */
237502d09e03SGordon Ross 		ASSERT(np != NULL);
237602d09e03SGordon Ross 		vp = SMBTOV(np);
23774bff34e3Sthurlow 		vp->v_type = VDIR;
23784bff34e3Sthurlow 
23794bff34e3Sthurlow 		/* Success! */
23804bff34e3Sthurlow 		*vpp = vp;
23814bff34e3Sthurlow 		return (0);
23824bff34e3Sthurlow 	}
23834bff34e3Sthurlow 
23844bff34e3Sthurlow 	/*
238502d09e03SGordon Ross 	 * Normal lookup of a name under this directory.
238602d09e03SGordon Ross 	 * Note we handled "", ".", ".." above.
238702d09e03SGordon Ross 	 */
238802d09e03SGordon Ross 	if (cache_ok) {
238902d09e03SGordon Ross 		/*
239002d09e03SGordon Ross 		 * The caller indicated that it's OK to use a
239102d09e03SGordon Ross 		 * cached result for this lookup, so try to
239202d09e03SGordon Ross 		 * reclaim a node from the smbfs node cache.
239302d09e03SGordon Ross 		 */
239402d09e03SGordon Ross 		error = smbfslookup_cache(dvp, nm, nmlen, &vp, cr);
239502d09e03SGordon Ross 		if (error)
239602d09e03SGordon Ross 			return (error);
239702d09e03SGordon Ross 		if (vp != NULL) {
239802d09e03SGordon Ross 			/* hold taken in lookup_cache */
239902d09e03SGordon Ross 			*vpp = vp;
240002d09e03SGordon Ross 			return (0);
240102d09e03SGordon Ross 		}
240202d09e03SGordon Ross 	}
240302d09e03SGordon Ross 
240402d09e03SGordon Ross 	/*
240502d09e03SGordon Ross 	 * OK, go over-the-wire to get the attributes,
240602d09e03SGordon Ross 	 * then create the node.
24074bff34e3Sthurlow 	 */
2408613a2f6bSGordon Ross 	smb_credinit(&scred, cr);
24094bff34e3Sthurlow 	/* Note: this can allocate a new "name" */
24104bff34e3Sthurlow 	error = smbfs_smb_lookup(dnp, &name, &nmlen, &fa, &scred);
24114bff34e3Sthurlow 	smb_credrele(&scred);
241202d09e03SGordon Ross 	if (error == ENOTDIR) {
241302d09e03SGordon Ross 		/*
241402d09e03SGordon Ross 		 * Lookup failed because this directory was
241502d09e03SGordon Ross 		 * removed or renamed by another client.
241602d09e03SGordon Ross 		 * Remove any cached attributes under it.
241702d09e03SGordon Ross 		 */
241802d09e03SGordon Ross 		smbfs_attrcache_remove(dnp);
241902d09e03SGordon Ross 		smbfs_attrcache_prune(dnp);
242002d09e03SGordon Ross 	}
24214bff34e3Sthurlow 	if (error)
24224bff34e3Sthurlow 		goto out;
24234bff34e3Sthurlow 
24244bff34e3Sthurlow 	error = smbfs_nget(dvp, name, nmlen, &fa, &vp);
24254bff34e3Sthurlow 	if (error)
24264bff34e3Sthurlow 		goto out;
24274bff34e3Sthurlow 
24284bff34e3Sthurlow 	/* Success! */
24294bff34e3Sthurlow 	*vpp = vp;
24304bff34e3Sthurlow 
24314bff34e3Sthurlow out:
24324bff34e3Sthurlow 	/* smbfs_smb_lookup may have allocated name. */
24334bff34e3Sthurlow 	if (name != nm)
24344bff34e3Sthurlow 		smbfs_name_free(name, nmlen);
24354bff34e3Sthurlow 
24364bff34e3Sthurlow 	return (error);
24374bff34e3Sthurlow }
24384bff34e3Sthurlow 
243902d09e03SGordon Ross /*
244002d09e03SGordon Ross  * smbfslookup_cache
244102d09e03SGordon Ross  *
244202d09e03SGordon Ross  * Try to reclaim a node from the smbfs node cache.
244302d09e03SGordon Ross  * Some statistics for DEBUG.
244402d09e03SGordon Ross  *
244502d09e03SGordon Ross  * This mechanism lets us avoid many of the five (or more)
244602d09e03SGordon Ross  * OtW lookup calls per file seen with "ls -l" if we search
244702d09e03SGordon Ross  * the smbfs node cache for recently inactive(ated) nodes.
244802d09e03SGordon Ross  */
244991d632c8Sgwr #ifdef DEBUG
245002d09e03SGordon Ross int smbfs_lookup_cache_calls = 0;
245102d09e03SGordon Ross int smbfs_lookup_cache_error = 0;
245202d09e03SGordon Ross int smbfs_lookup_cache_miss = 0;
245302d09e03SGordon Ross int smbfs_lookup_cache_stale = 0;
245402d09e03SGordon Ross int smbfs_lookup_cache_hits = 0;
245502d09e03SGordon Ross #endif /* DEBUG */
245691d632c8Sgwr 
245791d632c8Sgwr /* ARGSUSED */
245891d632c8Sgwr static int
245902d09e03SGordon Ross smbfslookup_cache(vnode_t *dvp, char *nm, int nmlen,
246002d09e03SGordon Ross 	vnode_t **vpp, cred_t *cr)
246191d632c8Sgwr {
246291d632c8Sgwr 	struct vattr va;
246391d632c8Sgwr 	smbnode_t *dnp;
246402d09e03SGordon Ross 	smbnode_t *np;
246502d09e03SGordon Ross 	vnode_t *vp;
246602d09e03SGordon Ross 	int error;
246702d09e03SGordon Ross 	char sep;
246891d632c8Sgwr 
246991d632c8Sgwr 	dnp = VTOSMB(dvp);
247002d09e03SGordon Ross 	*vpp = NULL;
247191d632c8Sgwr 
247202d09e03SGordon Ross #ifdef DEBUG
247302d09e03SGordon Ross 	smbfs_lookup_cache_calls++;
247402d09e03SGordon Ross #endif
247591d632c8Sgwr 
247691d632c8Sgwr 	/*
247702d09e03SGordon Ross 	 * First make sure we can get attributes for the
247802d09e03SGordon Ross 	 * directory.  Cached attributes are OK here.
247902d09e03SGordon Ross 	 * If we removed or renamed the directory, this
248002d09e03SGordon Ross 	 * will return ENOENT.  If someone else removed
248102d09e03SGordon Ross 	 * this directory or file, we'll find out when we
248202d09e03SGordon Ross 	 * try to open or get attributes.
248391d632c8Sgwr 	 */
248402d09e03SGordon Ross 	va.va_mask = AT_TYPE | AT_MODE;
248502d09e03SGordon Ross 	error = smbfsgetattr(dvp, &va, cr);
248602d09e03SGordon Ross 	if (error) {
248791d632c8Sgwr #ifdef DEBUG
248802d09e03SGordon Ross 		smbfs_lookup_cache_error++;
248991d632c8Sgwr #endif
249002d09e03SGordon Ross 		return (error);
249102d09e03SGordon Ross 	}
249202d09e03SGordon Ross 
249302d09e03SGordon Ross 	/*
249402d09e03SGordon Ross 	 * Passing NULL smbfattr here so we will
249502d09e03SGordon Ross 	 * just look, not create.
249602d09e03SGordon Ross 	 */
249702d09e03SGordon Ross 	sep = SMBFS_DNP_SEP(dnp);
249802d09e03SGordon Ross 	np = smbfs_node_findcreate(dnp->n_mount,
249902d09e03SGordon Ross 	    dnp->n_rpath, dnp->n_rplen,
250002d09e03SGordon Ross 	    nm, nmlen, sep, NULL);
250102d09e03SGordon Ross 	if (np == NULL) {
250291d632c8Sgwr #ifdef DEBUG
250302d09e03SGordon Ross 		smbfs_lookup_cache_miss++;
250491d632c8Sgwr #endif
250502d09e03SGordon Ross 		return (0);
250602d09e03SGordon Ross 	}
250702d09e03SGordon Ross 
250802d09e03SGordon Ross 	/*
250902d09e03SGordon Ross 	 * Found it.  Attributes still valid?
251002d09e03SGordon Ross 	 */
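	/*
	 * r_attrtime is the absolute time at which the cached
	 * attributes expire; once gethrtime() passes it, this
	 * cached node is stale.
	 */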
251102d09e03SGordon Ross 	vp = SMBTOV(np);
251202d09e03SGordon Ross 	if (np->r_attrtime <= gethrtime()) {
251302d09e03SGordon Ross 		/* stale */
251491d632c8Sgwr #ifdef DEBUG
251502d09e03SGordon Ross 		smbfs_lookup_cache_stale++;
251691d632c8Sgwr #endif
251702d09e03SGordon Ross 		VN_RELE(vp);
251802d09e03SGordon Ross 		return (0);
251991d632c8Sgwr 	}
252002d09e03SGordon Ross 
252102d09e03SGordon Ross 	/*
252202d09e03SGordon Ross 	 * Success!
252302d09e03SGordon Ross 	 * Caller gets hold from smbfs_node_findcreate
252402d09e03SGordon Ross 	 */
252591d632c8Sgwr #ifdef DEBUG
252602d09e03SGordon Ross 	smbfs_lookup_cache_hits++;
252791d632c8Sgwr #endif
252802d09e03SGordon Ross 	*vpp = vp;
252991d632c8Sgwr 	return (0);
253091d632c8Sgwr }
253191d632c8Sgwr 
25325f4fc069Sjilinxpd 
25334bff34e3Sthurlow /*
25344bff34e3Sthurlow  * XXX
25354bff34e3Sthurlow  * vsecattr_t is new to build 77, and we need to eventually support
25364bff34e3Sthurlow  * it in order to create an ACL when an object is created.
25374bff34e3Sthurlow  *
25384bff34e3Sthurlow  * This op should support the new FIGNORECASE flag for case-insensitive
25394bff34e3Sthurlow  * lookups, per PSARC 2007/244.
25404bff34e3Sthurlow  */
25414bff34e3Sthurlow /* ARGSUSED */
25424bff34e3Sthurlow static int
25434bff34e3Sthurlow smbfs_create(vnode_t *dvp, char *nm, struct vattr *va, enum vcexcl exclusive,
25444bff34e3Sthurlow 	int mode, vnode_t **vpp, cred_t *cr, int lfaware, caller_context_t *ct,
25454bff34e3Sthurlow 	vsecattr_t *vsecp)
25464bff34e3Sthurlow {
25474bff34e3Sthurlow 	int		error;
25484bff34e3Sthurlow 	vfs_t		*vfsp;
25494bff34e3Sthurlow 	vnode_t		*vp;
25504bff34e3Sthurlow 	smbnode_t	*np;
25514bff34e3Sthurlow 	smbnode_t	*dnp;
25524bff34e3Sthurlow 	smbmntinfo_t	*smi;
25534bff34e3Sthurlow 	struct vattr	vattr;
25544bff34e3Sthurlow 	struct smbfattr	fattr;
25554bff34e3Sthurlow 	struct smb_cred	scred;
25564bff34e3Sthurlow 	const char *name = (const char *)nm;
25574bff34e3Sthurlow 	int		nmlen = strlen(nm);
25584bff34e3Sthurlow 	uint32_t	disp;
2559adee6784SGordon Ross 	smb_fh_t	*fid = NULL;
256091d632c8Sgwr 	int		xattr;
25614bff34e3Sthurlow 
25624bff34e3Sthurlow 	vfsp = dvp->v_vfsp;
25634bff34e3Sthurlow 	smi = VFTOSMI(vfsp);
25644bff34e3Sthurlow 	dnp = VTOSMB(dvp);
25654bff34e3Sthurlow 	vp = NULL;
25664bff34e3Sthurlow 
2567a19609f8Sjv 	if (curproc->p_zone != smi->smi_zone_ref.zref_zone)
25684bff34e3Sthurlow 		return (EPERM);
25694bff34e3Sthurlow 
25704bff34e3Sthurlow 	if (smi->smi_flags & SMI_DEAD || vfsp->vfs_flag & VFS_UNMOUNTED)
25714bff34e3Sthurlow 		return (EIO);
25724bff34e3Sthurlow 
25734bff34e3Sthurlow 	/*
25744bff34e3Sthurlow 	 * Note: this may break mknod(2) calls to create a directory,
25754bff34e3Sthurlow 	 * but that's an obscure use.  Some other filesystems do this.
25765f4fc069Sjilinxpd 	 * Todo: redirect VDIR type here to _mkdir.
25774bff34e3Sthurlow 	 */
25784bff34e3Sthurlow 	if (va->va_type != VREG)
25794bff34e3Sthurlow 		return (EINVAL);
25804bff34e3Sthurlow 
25814bff34e3Sthurlow 	/*
25824bff34e3Sthurlow 	 * If the pathname is "", just use dvp, no checks.
25834bff34e3Sthurlow 	 * Do this outside of the rwlock (like zfs).
25844bff34e3Sthurlow 	 */
25854bff34e3Sthurlow 	if (nmlen == 0) {
25864bff34e3Sthurlow 		VN_HOLD(dvp);
25874bff34e3Sthurlow 		*vpp = dvp;
25884bff34e3Sthurlow 		return (0);
25894bff34e3Sthurlow 	}
25904bff34e3Sthurlow 
25914bff34e3Sthurlow 	/* Don't allow "." or ".." through here. */
25924bff34e3Sthurlow 	if ((nmlen == 1 && name[0] == '.') ||
25934bff34e3Sthurlow 	    (nmlen == 2 && name[0] == '.' && name[1] == '.'))
25944bff34e3Sthurlow 		return (EISDIR);
25954bff34e3Sthurlow 
25964bff34e3Sthurlow 	/*
25974bff34e3Sthurlow 	 * We make a copy of the attributes because the caller does not
25984bff34e3Sthurlow 	 * expect us to change what va points to.
25994bff34e3Sthurlow 	 */
26004bff34e3Sthurlow 	vattr = *va;
26014bff34e3Sthurlow 
26024bff34e3Sthurlow 	if (smbfs_rw_enter_sig(&dnp->r_rwlock, RW_WRITER, SMBINTR(dvp)))
26034bff34e3Sthurlow 		return (EINTR);
2604613a2f6bSGordon Ross 	smb_credinit(&scred, cr);
26054bff34e3Sthurlow 
26064bff34e3Sthurlow 	/*
26074bff34e3Sthurlow 	 * NFS needs to go over the wire, just to be sure whether the
260802d09e03SGordon Ross 	 * file exists or not.  Using a cached result is dangerous in
26094bff34e3Sthurlow 	 * this case when making a decision regarding existence.
26104bff34e3Sthurlow 	 *
26114bff34e3Sthurlow 	 * The SMB protocol does NOT really need to go OTW here
26124bff34e3Sthurlow 	 * thanks to the expressive NTCREATE disposition values.
26134bff34e3Sthurlow 	 * Unfortunately, to do Unix access checks correctly,
26144bff34e3Sthurlow 	 * we need to know if the object already exists.
26154bff34e3Sthurlow 	 * When the object does not exist, we need VWRITE on
26164bff34e3Sthurlow 	 * the directory.  Note: smbfslookup() checks VEXEC.
26174bff34e3Sthurlow 	 */
26184bff34e3Sthurlow 	error = smbfslookup(dvp, nm, &vp, cr, 0, ct);
26194bff34e3Sthurlow 	if (error == 0) {
26204bff34e3Sthurlow 		/*
262142645588SGordon Ross 		 * The file already exists.  Error?
262242645588SGordon Ross 		 * NB: have a hold from smbfslookup
26234bff34e3Sthurlow 		 */
26244bff34e3Sthurlow 		if (exclusive == EXCL) {
26254bff34e3Sthurlow 			error = EEXIST;
262642645588SGordon Ross 			VN_RELE(vp);
26274bff34e3Sthurlow 			goto out;
26284bff34e3Sthurlow 		}
26294bff34e3Sthurlow 		/*
26304bff34e3Sthurlow 		 * Verify requested access.
26314bff34e3Sthurlow 		 */
26324bff34e3Sthurlow 		error = smbfs_access(vp, mode, 0, cr, ct);
263342645588SGordon Ross 		if (error) {
263442645588SGordon Ross 			VN_RELE(vp);
26354bff34e3Sthurlow 			goto out;
263642645588SGordon Ross 		}
26374bff34e3Sthurlow 
26384bff34e3Sthurlow 		/*
26394bff34e3Sthurlow 		 * Truncate (if requested).
26404bff34e3Sthurlow 		 */
26415f4fc069Sjilinxpd 		if ((vattr.va_mask & AT_SIZE) && vp->v_type == VREG) {
26425f4fc069Sjilinxpd 			np = VTOSMB(vp);
26435f4fc069Sjilinxpd 			/*
26445f4fc069Sjilinxpd 			 * Check here for large file truncation by
26455f4fc069Sjilinxpd 			 * LF-unaware process, like ufs_create().
26465f4fc069Sjilinxpd 			 */
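			/*
			 * An LF-unaware process (no FOFFMAX from
			 * O_LARGEFILE) must get EOVERFLOW when the
			 * existing file is larger than MAXOFF32_T,
			 * rather than silently truncating it.
			 */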
26475f4fc069Sjilinxpd 			if (!(lfaware & FOFFMAX)) {
26485f4fc069Sjilinxpd 				mutex_enter(&np->r_statelock);
26495f4fc069Sjilinxpd 				if (np->r_size > MAXOFF32_T)
26505f4fc069Sjilinxpd 					error = EOVERFLOW;
26515f4fc069Sjilinxpd 				mutex_exit(&np->r_statelock);
26525f4fc069Sjilinxpd 			}
26535f4fc069Sjilinxpd 			if (error) {
26545f4fc069Sjilinxpd 				VN_RELE(vp);
26555f4fc069Sjilinxpd 				goto out;
26565f4fc069Sjilinxpd 			}
26575f4fc069Sjilinxpd 			vattr.va_mask = AT_SIZE;
26585f4fc069Sjilinxpd 			error = smbfssetattr(vp, &vattr, 0, cr);
265942645588SGordon Ross 			if (error) {
266042645588SGordon Ross 				VN_RELE(vp);
26614bff34e3Sthurlow 				goto out;
266242645588SGordon Ross 			}
26635f4fc069Sjilinxpd #ifdef	SMBFS_VNEVENT
26645f4fc069Sjilinxpd 			/* Existing file was truncated */
26655f4fc069Sjilinxpd 			vnevent_create(vp, ct);
26665f4fc069Sjilinxpd #endif
26675f4fc069Sjilinxpd 			/* invalidate pages done in smbfssetattr() */
26684bff34e3Sthurlow 		}
26694bff34e3Sthurlow 		/* Success! */
26704bff34e3Sthurlow 		*vpp = vp;
26714bff34e3Sthurlow 		goto out;
26724bff34e3Sthurlow 	}
26734bff34e3Sthurlow 
26744bff34e3Sthurlow 	/*
26754bff34e3Sthurlow 	 * The file did not exist.  Need VWRITE in the directory.
26764bff34e3Sthurlow 	 */
26774bff34e3Sthurlow 	error = smbfs_access(dvp, VWRITE, 0, cr, ct);
26784bff34e3Sthurlow 	if (error)
26794bff34e3Sthurlow 		goto out;
26804bff34e3Sthurlow 
26814bff34e3Sthurlow 	/*
26824bff34e3Sthurlow 	 * Now things get tricky.  We also need to check the
26834bff34e3Sthurlow 	 * requested open mode against the file we may create.
26844bff34e3Sthurlow 	 * See comments at smbfs_access_rwx
26854bff34e3Sthurlow 	 */
26864bff34e3Sthurlow 	error = smbfs_access_rwx(vfsp, VREG, mode, cr);
26874bff34e3Sthurlow 	if (error)
26884bff34e3Sthurlow 		goto out;
26894bff34e3Sthurlow 
26904bff34e3Sthurlow 	/*
26914bff34e3Sthurlow 	 * Now the code derived from Darwin,
26924bff34e3Sthurlow 	 * but with greater use of NT_CREATE
26934bff34e3Sthurlow 	 * disposition options.  Much changed.
26944bff34e3Sthurlow 	 *
26954bff34e3Sthurlow 	 * Create (or open) a new child node.
26964bff34e3Sthurlow 	 * Note we handled "." and ".." above.
26974bff34e3Sthurlow 	 */
26984bff34e3Sthurlow 
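	/*
	 * Choose the NTCREATE disposition: NTCREATEX_DISP_CREATE
	 * fails if the object already exists, _DISP_OVERWRITE_IF
	 * truncates an existing file (or creates one), and
	 * _DISP_OPEN_IF opens an existing file as-is (or creates
	 * one).
	 */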
26994bff34e3Sthurlow 	if (exclusive == EXCL)
27004bff34e3Sthurlow 		disp = NTCREATEX_DISP_CREATE;
27014bff34e3Sthurlow 	else {
27024bff34e3Sthurlow 		/* Truncate regular files if requested. */
27034bff34e3Sthurlow 		if ((va->va_type == VREG) &&
27044bff34e3Sthurlow 		    (va->va_mask & AT_SIZE) &&
27054bff34e3Sthurlow 		    (va->va_size == 0))
27064bff34e3Sthurlow 			disp = NTCREATEX_DISP_OVERWRITE_IF;
27074bff34e3Sthurlow 		else
27084bff34e3Sthurlow 			disp = NTCREATEX_DISP_OPEN_IF;
27094bff34e3Sthurlow 	}
271091d632c8Sgwr 	xattr = (dnp->n_flag & N_XATTR) ? 1 : 0;
271102d09e03SGordon Ross 	error = smbfs_smb_create(dnp,
271202d09e03SGordon Ross 	    name, nmlen, xattr,
271302d09e03SGordon Ross 	    disp, &scred, &fid);
27144bff34e3Sthurlow 	if (error)
27154bff34e3Sthurlow 		goto out;
27164bff34e3Sthurlow 
27174bff34e3Sthurlow 	/*
27184bff34e3Sthurlow 	 * Should use the fid to get/set the size
27194bff34e3Sthurlow 	 * while we have it opened here.  See above.
27204bff34e3Sthurlow 	 */
2721adee6784SGordon Ross 	smbfs_smb_close(fid);
27224bff34e3Sthurlow 
27234bff34e3Sthurlow 	/*
27244bff34e3Sthurlow 	 * In the open case, the name may differ a little
27254bff34e3Sthurlow 	 * from what we passed to create (case, etc.)
27264bff34e3Sthurlow 	 * so call lookup to get the (opened) name.
27274bff34e3Sthurlow 	 *
27284bff34e3Sthurlow 	 * XXX: Could avoid this extra lookup if the
27294bff34e3Sthurlow 	 * "createact" result from NT_CREATE says we
27304bff34e3Sthurlow 	 * created the object.
27314bff34e3Sthurlow 	 */
27324bff34e3Sthurlow 	error = smbfs_smb_lookup(dnp, &name, &nmlen, &fattr, &scred);
27334bff34e3Sthurlow 	if (error)
27344bff34e3Sthurlow 		goto out;
27354bff34e3Sthurlow 
27364bff34e3Sthurlow 	/* update attr and directory cache */
27374bff34e3Sthurlow 	smbfs_attr_touchdir(dnp);
27384bff34e3Sthurlow 
27394bff34e3Sthurlow 	error = smbfs_nget(dvp, name, nmlen, &fattr, &vp);
27404bff34e3Sthurlow 	if (error)
27414bff34e3Sthurlow 		goto out;
27424bff34e3Sthurlow 
27434bff34e3Sthurlow 	/* Success! */
27444bff34e3Sthurlow 	*vpp = vp;
27454bff34e3Sthurlow 	error = 0;
27464bff34e3Sthurlow 
27474bff34e3Sthurlow out:
27484bff34e3Sthurlow 	smb_credrele(&scred);
274902d09e03SGordon Ross 	smbfs_rw_exit(&dnp->r_rwlock);
27504bff34e3Sthurlow 	if (name != nm)
27514bff34e3Sthurlow 		smbfs_name_free(name, nmlen);
27524bff34e3Sthurlow 	return (error);
27534bff34e3Sthurlow }
27544bff34e3Sthurlow 
27554bff34e3Sthurlow /*
27564bff34e3Sthurlow  * XXX
27574bff34e3Sthurlow  * This op should support the new FIGNORECASE flag for case-insensitive
27584bff34e3Sthurlow  * lookups, per PSARC 2007/244.
27594bff34e3Sthurlow  */
27604bff34e3Sthurlow /* ARGSUSED */
27614bff34e3Sthurlow static int
27624bff34e3Sthurlow smbfs_remove(vnode_t *dvp, char *nm, cred_t *cr, caller_context_t *ct,
27634bff34e3Sthurlow 	int flags)
27644bff34e3Sthurlow {
27654bff34e3Sthurlow 	struct smb_cred	scred;
2766ff1e230cSjilinxpd 	vnode_t		*vp = NULL;
2767ff1e230cSjilinxpd 	smbnode_t	*dnp = VTOSMB(dvp);
2768ff1e230cSjilinxpd 	smbmntinfo_t	*smi = VTOSMI(dvp);
2769ff1e230cSjilinxpd 	int		error;
27704bff34e3Sthurlow 
2771a19609f8Sjv 	if (curproc->p_zone != smi->smi_zone_ref.zref_zone)
27724bff34e3Sthurlow 		return (EPERM);
27734bff34e3Sthurlow 
27744bff34e3Sthurlow 	if (smi->smi_flags & SMI_DEAD || dvp->v_vfsp->vfs_flag & VFS_UNMOUNTED)
27754bff34e3Sthurlow 		return (EIO);
27764bff34e3Sthurlow 
27774bff34e3Sthurlow 	/*
27784bff34e3Sthurlow 	 * Verify access to the directory.
27794bff34e3Sthurlow 	 */
27804bff34e3Sthurlow 	error = smbfs_access(dvp, VWRITE|VEXEC, 0, cr, ct);
27814bff34e3Sthurlow 	if (error)
2782ff1e230cSjilinxpd 		return (error);
2783ff1e230cSjilinxpd 
2784ff1e230cSjilinxpd 	if (smbfs_rw_enter_sig(&dnp->r_rwlock, RW_WRITER, SMBINTR(dvp)))
2785ff1e230cSjilinxpd 		return (EINTR);
2786ff1e230cSjilinxpd 	smb_credinit(&scred, cr);
2787ff1e230cSjilinxpd 
2788ff1e230cSjilinxpd 	/* Lookup the file to remove. */
2789ff1e230cSjilinxpd 	error = smbfslookup(dvp, nm, &vp, cr, 0, ct);
2790adee6784SGordon Ross 	if (error != 0)
2791adee6784SGordon Ross 		goto out;
2792adee6784SGordon Ross 
2793adee6784SGordon Ross 	/* Don't allow unlink of a directory. */
2794adee6784SGordon Ross 	if (vp->v_type == VDIR) {
2795adee6784SGordon Ross 		error = EPERM;
2796adee6784SGordon Ross 		goto out;
2797ff1e230cSjilinxpd 	}
2798ff1e230cSjilinxpd 
2799adee6784SGordon Ross 	/*
2800adee6784SGordon Ross 	 * Do the real remove work
2801adee6784SGordon Ross 	 */
2802adee6784SGordon Ross 	error = smbfsremove(dvp, vp, &scred, flags);
2803adee6784SGordon Ross 	if (error != 0)
2804adee6784SGordon Ross 		goto out;
2805adee6784SGordon Ross 
2806adee6784SGordon Ross #ifdef	SMBFS_VNEVENT
2807adee6784SGordon Ross 	vnevent_remove(vp, dvp, nm, ct);
2808adee6784SGordon Ross #endif
2809adee6784SGordon Ross 
2810adee6784SGordon Ross out:
2811adee6784SGordon Ross 	if (vp != NULL)
2812adee6784SGordon Ross 		VN_RELE(vp);
2813adee6784SGordon Ross 
2814ff1e230cSjilinxpd 	smb_credrele(&scred);
2815ff1e230cSjilinxpd 	smbfs_rw_exit(&dnp->r_rwlock);
2816ff1e230cSjilinxpd 
2817ff1e230cSjilinxpd 	return (error);
2818ff1e230cSjilinxpd }
2819ff1e230cSjilinxpd 
2820ff1e230cSjilinxpd /*
2821ff1e230cSjilinxpd  * smbfsremove does the real work of removing in SMBFS
2822ff1e230cSjilinxpd  * Caller has done dir access checks etc.
2823ff1e230cSjilinxpd  *
2824ff1e230cSjilinxpd  * The normal way to delete a file over SMB is open it (with DELETE access),
2825ff1e230cSjilinxpd  * set the "delete-on-close" flag, and close the file.  The problem for Unix
2826ff1e230cSjilinxpd  * applications is that they expect the file name to be gone once the unlink
2827ff1e230cSjilinxpd  * completes, and the SMB server does not actually delete the file until ALL
2828ff1e230cSjilinxpd  * opens of that file are closed.  We can't assume our open handles are the
2829ff1e230cSjilinxpd  * only open handles on a file we're deleting, so to be safe we'll try to
2830ff1e230cSjilinxpd  * rename the file to a temporary name and then set delete-on-close.  If we
2831ff1e230cSjilinxpd  * fail to set delete-on-close (i.e. because other opens prevent it) then
2832ff1e230cSjilinxpd  * undo the changes we made and give up with EBUSY.  Note that we might have
2833ff1e230cSjilinxpd  * permission to delete a file but lack permission to rename, so we want to
2834ff1e230cSjilinxpd  * continue in cases where rename fails.  As an optimization, only do the
2835ff1e230cSjilinxpd  * rename when we have the file open.
2836ff1e230cSjilinxpd  *
2837ff1e230cSjilinxpd  * This is similar to what NFS does when deleting a file that has local opens,
2838ff1e230cSjilinxpd  * but thanks to SMB delete-on-close, we don't need to keep track of when the
2839ff1e230cSjilinxpd  * last local open goes away and send a delete.  The server does that for us.
2840ff1e230cSjilinxpd  */
2841ff1e230cSjilinxpd /* ARGSUSED */
2842ff1e230cSjilinxpd static int
2843ff1e230cSjilinxpd smbfsremove(vnode_t *dvp, vnode_t *vp, struct smb_cred *scred,
2844ff1e230cSjilinxpd     int flags)
2845ff1e230cSjilinxpd {
2846ff1e230cSjilinxpd 	smbnode_t	*dnp = VTOSMB(dvp);
2847ff1e230cSjilinxpd 	smbnode_t	*np = VTOSMB(vp);
2848adee6784SGordon Ross 	smbmntinfo_t	*smi = np->n_mount;
2849ff1e230cSjilinxpd 	char		*tmpname = NULL;
2850ff1e230cSjilinxpd 	int		tnlen;
2851ff1e230cSjilinxpd 	int		error;
2852adee6784SGordon Ross 	smb_fh_t	*fid = NULL;
2853ff1e230cSjilinxpd 	boolean_t	renamed = B_FALSE;
28544bff34e3Sthurlow 
28554bff34e3Sthurlow 	/*
2856ff1e230cSjilinxpd 	 * The dvp RWlock must be held as writer.
28574bff34e3Sthurlow 	 */
2858ff1e230cSjilinxpd 	ASSERT(dnp->r_rwlock.owner == curthread);
28594bff34e3Sthurlow 
28605f4fc069Sjilinxpd 	/*
28615f4fc069Sjilinxpd 	 * We need to flush any dirty pages which happen to
28625f4fc069Sjilinxpd 	 * be hanging around before removing the file.  This
28635f4fc069Sjilinxpd 	 * shouldn't happen very often and mostly on file
28645f4fc069Sjilinxpd 	 * systems mounted "nocto".
28655f4fc069Sjilinxpd 	 */
28665f4fc069Sjilinxpd 	if (vn_has_cached_data(vp) &&
28675f4fc069Sjilinxpd 	    ((np->r_flags & RDIRTY) || np->r_count > 0)) {
28685f4fc069Sjilinxpd 		error = smbfs_putpage(vp, (offset_t)0, 0, 0,
28695f4fc069Sjilinxpd 		    scred->scr_cred, NULL);
28705f4fc069Sjilinxpd 		if (error && (error == ENOSPC || error == EDQUOT)) {
28715f4fc069Sjilinxpd 			mutex_enter(&np->r_statelock);
28725f4fc069Sjilinxpd 			if (!np->r_error)
28735f4fc069Sjilinxpd 				np->r_error = error;
28745f4fc069Sjilinxpd 			mutex_exit(&np->r_statelock);
28755f4fc069Sjilinxpd 		}
28765f4fc069Sjilinxpd 	}
28775f4fc069Sjilinxpd 
2878ff1e230cSjilinxpd 	/*
2879ff1e230cSjilinxpd 	 * Get a file handle with delete access.
2880ff1e230cSjilinxpd 	 * Close this FID before return.
2881ff1e230cSjilinxpd 	 */
2882ff1e230cSjilinxpd 	error = smbfs_smb_tmpopen(np, STD_RIGHT_DELETE_ACCESS,
2883ff1e230cSjilinxpd 	    scred, &fid);
2884ff1e230cSjilinxpd 	if (error) {
2885ff1e230cSjilinxpd 		SMBVDEBUG("error %d opening %s\n",
2886ff1e230cSjilinxpd 		    error, np->n_rpath);
28874bff34e3Sthurlow 		goto out;
28884bff34e3Sthurlow 	}
2889adee6784SGordon Ross 	ASSERT(fid != NULL);
28904bff34e3Sthurlow 
28914bff34e3Sthurlow 	/*
2892ff1e230cSjilinxpd 	 * If we have the file open, try to rename it to a temporary name.
2893ff1e230cSjilinxpd 	 * If we can't rename, continue on and try setting DoC anyway.
2894adee6784SGordon Ross 	 * Unnecessary for directories.
28954bff34e3Sthurlow 	 */
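	/*
	 * v_count > 1 means someone else also holds this vnode,
	 * and n_fidrefs > 0 means we have it open, so the rename
	 * optimization described above applies.
	 */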
2896adee6784SGordon Ross 	if (vp->v_type != VDIR && vp->v_count > 1 && np->n_fidrefs > 0) {
2897ff1e230cSjilinxpd 		tmpname = kmem_alloc(MAXNAMELEN, KM_SLEEP);
2898ff1e230cSjilinxpd 		tnlen = smbfs_newname(tmpname, MAXNAMELEN);
2899adee6784SGordon Ross 		error = smbfs_smb_rename(dnp, np, dnp, tmpname, tnlen,
2900adee6784SGordon Ross 		    fid, scred);
2901ff1e230cSjilinxpd 		if (error != 0) {
2902ff1e230cSjilinxpd 			SMBVDEBUG("error %d renaming %s -> %s\n",
29035f4fc069Sjilinxpd 			    error, np->n_rpath, tmpname);
2904ff1e230cSjilinxpd 			/* Keep going without the rename. */
2905ff1e230cSjilinxpd 		} else {
2906ff1e230cSjilinxpd 			renamed = B_TRUE;
2907ff1e230cSjilinxpd 		}
2908ff1e230cSjilinxpd 	}
29094bff34e3Sthurlow 
2910ff1e230cSjilinxpd 	/*
2911ff1e230cSjilinxpd 	 * Mark the file as delete-on-close.  If we can't,
2912ff1e230cSjilinxpd 	 * undo what we did and err out.
2913ff1e230cSjilinxpd 	 */
2914adee6784SGordon Ross 	error = smbfs_smb_setdisp(smi->smi_share, fid, 1, scred);
2915ff1e230cSjilinxpd 	if (error != 0) {
2916ff1e230cSjilinxpd 		SMBVDEBUG("error %d setting DoC on %s\n",
2917ff1e230cSjilinxpd 		    error, np->n_rpath);
291802d09e03SGordon Ross 		/*
2919ff1e230cSjilinxpd 		 * Failed to set DoC. If we renamed, undo that.
2920ff1e230cSjilinxpd 		 * Need np->n_rpath relative to parent (dnp).
2921ff1e230cSjilinxpd 		 * Use parent path name length plus one for
2922ff1e230cSjilinxpd 		 * the separator ('/' or ':')
292302d09e03SGordon Ross 		 */
2924ff1e230cSjilinxpd 		if (renamed) {
2925ff1e230cSjilinxpd 			char *oldname;
2926ff1e230cSjilinxpd 			int oldnlen;
2927ff1e230cSjilinxpd 			int err2;
2928ff1e230cSjilinxpd 
2929ff1e230cSjilinxpd 			oldname = np->n_rpath + (dnp->n_rplen + 1);
2930ff1e230cSjilinxpd 			oldnlen = np->n_rplen - (dnp->n_rplen + 1);
2931adee6784SGordon Ross 			err2 = smbfs_smb_rename(dnp, np, dnp, oldname, oldnlen,
2932adee6784SGordon Ross 			    fid, scred);
2933ff1e230cSjilinxpd 			SMBVDEBUG("error %d un-renaming %s -> %s\n",
29345f4fc069Sjilinxpd 			    err2, tmpname, np->n_rpath);
293502d09e03SGordon Ross 		}
2936ff1e230cSjilinxpd 		error = EBUSY;
2937ff1e230cSjilinxpd 		goto out;
29384bff34e3Sthurlow 	}
2939ff1e230cSjilinxpd 	/* Done! */
2940adee6784SGordon Ross 	smbfs_attrcache_remove(np);
2941ff1e230cSjilinxpd 	smbfs_attrcache_prune(np);
29424bff34e3Sthurlow 
29434bff34e3Sthurlow out:
2944ff1e230cSjilinxpd 	if (tmpname != NULL)
2945ff1e230cSjilinxpd 		kmem_free(tmpname, MAXNAMELEN);
2946adee6784SGordon Ross 	if (fid != NULL)
2947adee6784SGordon Ross 		smbfs_smb_tmpclose(np, fid);
2948ff1e230cSjilinxpd 
2949ff1e230cSjilinxpd 	if (error == 0) {
2950ff1e230cSjilinxpd 		/* Keep lookup from finding this node anymore. */
2951ff1e230cSjilinxpd 		smbfs_rmhash(np);
2952ff1e230cSjilinxpd 	}
29534bff34e3Sthurlow 
29544bff34e3Sthurlow 	return (error);
29554bff34e3Sthurlow }
29564bff34e3Sthurlow 
29574bff34e3Sthurlow 
29585f4fc069Sjilinxpd /* ARGSUSED */
29595f4fc069Sjilinxpd static int
29605f4fc069Sjilinxpd smbfs_link(vnode_t *tdvp, vnode_t *svp, char *tnm, cred_t *cr,
29615f4fc069Sjilinxpd 	caller_context_t *ct, int flags)
29625f4fc069Sjilinxpd {
29635f4fc069Sjilinxpd 	/* Not yet... */
29645f4fc069Sjilinxpd 	return (ENOSYS);
29655f4fc069Sjilinxpd }
29665f4fc069Sjilinxpd 
29675f4fc069Sjilinxpd 
29684bff34e3Sthurlow /*
29694bff34e3Sthurlow  * XXX
29704bff34e3Sthurlow  * This op should support the new FIGNORECASE flag for case-insensitive
29714bff34e3Sthurlow  * lookups, per PSARC 2007/244.
29724bff34e3Sthurlow  */
29734bff34e3Sthurlow /* ARGSUSED */
29744bff34e3Sthurlow static int
29754bff34e3Sthurlow smbfs_rename(vnode_t *odvp, char *onm, vnode_t *ndvp, char *nnm, cred_t *cr,
29764bff34e3Sthurlow 	caller_context_t *ct, int flags)
29774bff34e3Sthurlow {
2978ff1e230cSjilinxpd 	struct smb_cred	scred;
2979ff1e230cSjilinxpd 	smbnode_t	*odnp = VTOSMB(odvp);
2980ff1e230cSjilinxpd 	smbnode_t	*ndnp = VTOSMB(ndvp);
2981ff1e230cSjilinxpd 	vnode_t		*ovp;
2982ff1e230cSjilinxpd 	int error;
29834bff34e3Sthurlow 
2984a19609f8Sjv 	if (curproc->p_zone != VTOSMI(odvp)->smi_zone_ref.zref_zone ||
2985a19609f8Sjv 	    curproc->p_zone != VTOSMI(ndvp)->smi_zone_ref.zref_zone)
29864bff34e3Sthurlow 		return (EPERM);
29874bff34e3Sthurlow 
29884bff34e3Sthurlow 	if (VTOSMI(odvp)->smi_flags & SMI_DEAD ||
29894bff34e3Sthurlow 	    VTOSMI(ndvp)->smi_flags & SMI_DEAD ||
29904bff34e3Sthurlow 	    odvp->v_vfsp->vfs_flag & VFS_UNMOUNTED ||
29914bff34e3Sthurlow 	    ndvp->v_vfsp->vfs_flag & VFS_UNMOUNTED)
29924bff34e3Sthurlow 		return (EIO);
29934bff34e3Sthurlow 
29944bff34e3Sthurlow 	if (strcmp(onm, ".") == 0 || strcmp(onm, "..") == 0 ||
29954bff34e3Sthurlow 	    strcmp(nnm, ".") == 0 || strcmp(nnm, "..") == 0)
29964bff34e3Sthurlow 		return (EINVAL);
29974bff34e3Sthurlow 
29984bff34e3Sthurlow 	/*
29994bff34e3Sthurlow 	 * Check that everything is on the same filesystem.
30004bff34e3Sthurlow 	 * vn_rename checks the fsid's, but in case we don't
30014bff34e3Sthurlow 	 * fill those in correctly, check here too.
30024bff34e3Sthurlow 	 */
30034bff34e3Sthurlow 	if (odvp->v_vfsp != ndvp->v_vfsp)
30044bff34e3Sthurlow 		return (EXDEV);
30054bff34e3Sthurlow 
3006ff1e230cSjilinxpd 	/*
3007ff1e230cSjilinxpd 	 * Need write access on source and target.
3008ff1e230cSjilinxpd 	 * Server takes care of most checks.
3009ff1e230cSjilinxpd 	 */
3010ff1e230cSjilinxpd 	error = smbfs_access(odvp, VWRITE|VEXEC, 0, cr, ct);
3011ff1e230cSjilinxpd 	if (error)
3012ff1e230cSjilinxpd 		return (error);
3013ff1e230cSjilinxpd 	if (odvp != ndvp) {
3014ff1e230cSjilinxpd 		error = smbfs_access(ndvp, VWRITE, 0, cr, ct);
3015ff1e230cSjilinxpd 		if (error)
3016ff1e230cSjilinxpd 			return (error);
3017ff1e230cSjilinxpd 	}
30184bff34e3Sthurlow 
30194bff34e3Sthurlow 	/*
3020ff1e230cSjilinxpd 	 * Need to lock both old/new dirs as writer.
3021ff1e230cSjilinxpd 	 *
30224bff34e3Sthurlow 	 * Avoid deadlock here on old vs new directory nodes
30234bff34e3Sthurlow 	 * by always taking the locks in order of address.
30244bff34e3Sthurlow 	 * The order is arbitrary, but must be consistent.
30254bff34e3Sthurlow 	 */
30264bff34e3Sthurlow 	if (odnp < ndnp) {
30274bff34e3Sthurlow 		if (smbfs_rw_enter_sig(&odnp->r_rwlock, RW_WRITER,
30284bff34e3Sthurlow 		    SMBINTR(odvp)))
30294bff34e3Sthurlow 			return (EINTR);
30304bff34e3Sthurlow 		if (smbfs_rw_enter_sig(&ndnp->r_rwlock, RW_WRITER,
30314bff34e3Sthurlow 		    SMBINTR(ndvp))) {
30324bff34e3Sthurlow 			smbfs_rw_exit(&odnp->r_rwlock);
30334bff34e3Sthurlow 			return (EINTR);
30344bff34e3Sthurlow 		}
30354bff34e3Sthurlow 	} else {
30364bff34e3Sthurlow 		if (smbfs_rw_enter_sig(&ndnp->r_rwlock, RW_WRITER,
30374bff34e3Sthurlow 		    SMBINTR(ndvp)))
30384bff34e3Sthurlow 			return (EINTR);
30394bff34e3Sthurlow 		if (smbfs_rw_enter_sig(&odnp->r_rwlock, RW_WRITER,
30404bff34e3Sthurlow 		    SMBINTR(odvp))) {
30414bff34e3Sthurlow 			smbfs_rw_exit(&ndnp->r_rwlock);
30424bff34e3Sthurlow 			return (EINTR);
30434bff34e3Sthurlow 		}
30444bff34e3Sthurlow 	}
304502d09e03SGordon Ross 	smb_credinit(&scred, cr);
30464bff34e3Sthurlow 
3047ff1e230cSjilinxpd 	/* Lookup the "old" name */
3048ff1e230cSjilinxpd 	error = smbfslookup(odvp, onm, &ovp, cr, 0, ct);
3049ff1e230cSjilinxpd 	if (error == 0) {
3050ff1e230cSjilinxpd 		/*
3051ff1e230cSjilinxpd 		 * Do the real rename work
3052ff1e230cSjilinxpd 		 */
3053ff1e230cSjilinxpd 		error = smbfsrename(odvp, ovp, ndvp, nnm, &scred, flags);
3054ff1e230cSjilinxpd 		VN_RELE(ovp);
30554bff34e3Sthurlow 	}
30564bff34e3Sthurlow 
3057ff1e230cSjilinxpd 	smb_credrele(&scred);
3058ff1e230cSjilinxpd 	smbfs_rw_exit(&odnp->r_rwlock);
3059ff1e230cSjilinxpd 	smbfs_rw_exit(&ndnp->r_rwlock);
3060ff1e230cSjilinxpd 
3061ff1e230cSjilinxpd 	return (error);
3062ff1e230cSjilinxpd }
3063ff1e230cSjilinxpd 
3064ff1e230cSjilinxpd /*
3065ff1e230cSjilinxpd  * smbfsrename does the real work of renaming in SMBFS
3066ff1e230cSjilinxpd  * Caller has done dir access checks etc.
3067ff1e230cSjilinxpd  */
3068ff1e230cSjilinxpd /* ARGSUSED */
3069ff1e230cSjilinxpd static int
3070ff1e230cSjilinxpd smbfsrename(vnode_t *odvp, vnode_t *ovp, vnode_t *ndvp, char *nnm,
3071ff1e230cSjilinxpd     struct smb_cred *scred, int flags)
3072ff1e230cSjilinxpd {
3073ff1e230cSjilinxpd 	smbnode_t	*odnp = VTOSMB(odvp);
3074ff1e230cSjilinxpd 	smbnode_t	*onp = VTOSMB(ovp);
3075ff1e230cSjilinxpd 	smbnode_t	*ndnp = VTOSMB(ndvp);
3076ff1e230cSjilinxpd 	vnode_t		*nvp = NULL;
3077ff1e230cSjilinxpd 	int		error;
3078ff1e230cSjilinxpd 	int		nvp_locked = 0;
3079adee6784SGordon Ross 	smb_fh_t	*fid = NULL;
3080ff1e230cSjilinxpd 
3081ff1e230cSjilinxpd 	/* Things our caller should have checked. */
3082ff1e230cSjilinxpd 	ASSERT(curproc->p_zone == VTOSMI(odvp)->smi_zone_ref.zref_zone);
3083ff1e230cSjilinxpd 	ASSERT(odvp->v_vfsp == ndvp->v_vfsp);
3084ff1e230cSjilinxpd 	ASSERT(odnp->r_rwlock.owner == curthread);
3085ff1e230cSjilinxpd 	ASSERT(ndnp->r_rwlock.owner == curthread);
30864bff34e3Sthurlow 
30874bff34e3Sthurlow 	/*
30884bff34e3Sthurlow 	 * Lookup the target file.  If it exists, it needs to be
30894bff34e3Sthurlow 	 * checked to see whether it is a mount point and whether
30904bff34e3Sthurlow 	 * it is active (open).
30914bff34e3Sthurlow 	 */
3092ff1e230cSjilinxpd 	error = smbfslookup(ndvp, nnm, &nvp, scred->scr_cred, 0, NULL);
30934bff34e3Sthurlow 	if (!error) {
30944bff34e3Sthurlow 		/*
30954bff34e3Sthurlow 		 * Target (nvp) already exists.  Check that it
30964bff34e3Sthurlow 		 * has the same type as the source.  The server
30974bff34e3Sthurlow 		 * will check this also, (and more reliably) but
30984bff34e3Sthurlow 		 * this lets us return the correct error codes.
30994bff34e3Sthurlow 		 */
31004bff34e3Sthurlow 		if (ovp->v_type == VDIR) {
31014bff34e3Sthurlow 			if (nvp->v_type != VDIR) {
31024bff34e3Sthurlow 				error = ENOTDIR;
31034bff34e3Sthurlow 				goto out;
31044bff34e3Sthurlow 			}
31054bff34e3Sthurlow 		} else {
31064bff34e3Sthurlow 			if (nvp->v_type == VDIR) {
31074bff34e3Sthurlow 				error = EISDIR;
31084bff34e3Sthurlow 				goto out;
31094bff34e3Sthurlow 			}
31104bff34e3Sthurlow 		}
31114bff34e3Sthurlow 
31124bff34e3Sthurlow 		/*
31134bff34e3Sthurlow 		 * POSIX dictates that when the source and target
31144bff34e3Sthurlow 		 * entries refer to the same file object, rename
31154bff34e3Sthurlow 		 * must do nothing and exit without error.
31164bff34e3Sthurlow 		 */
31174bff34e3Sthurlow 		if (ovp == nvp) {
31184bff34e3Sthurlow 			error = 0;
31194bff34e3Sthurlow 			goto out;
31204bff34e3Sthurlow 		}
31214bff34e3Sthurlow 
31224bff34e3Sthurlow 		/*
31234bff34e3Sthurlow 		 * Also must ensure the target is not a mount point,
31244bff34e3Sthurlow 		 * and keep mount/umount away until we're done.
31254bff34e3Sthurlow 		 */
31264bff34e3Sthurlow 		if (vn_vfsrlock(nvp)) {
31274bff34e3Sthurlow 			error = EBUSY;
31284bff34e3Sthurlow 			goto out;
31294bff34e3Sthurlow 		}
31304bff34e3Sthurlow 		nvp_locked = 1;
31314bff34e3Sthurlow 		if (vn_mountedvfs(nvp) != NULL) {
31324bff34e3Sthurlow 			error = EBUSY;
31334bff34e3Sthurlow 			goto out;
31344bff34e3Sthurlow 		}
31354bff34e3Sthurlow 
313691d632c8Sgwr 		/*
3137ff1e230cSjilinxpd 		 * CIFS may give a SHARING_VIOLATION error when
313891d632c8Sgwr 		 * trying to rename onto an existing object,
313991d632c8Sgwr 		 * so try to remove the target first.
314091d632c8Sgwr 		 * (Only for files, not directories.)
314191d632c8Sgwr 		 */
314291d632c8Sgwr 		if (nvp->v_type == VDIR) {
314391d632c8Sgwr 			error = EEXIST;
314491d632c8Sgwr 			goto out;
314591d632c8Sgwr 		}
3146ff1e230cSjilinxpd 		error = smbfsremove(ndvp, nvp, scred, flags);
3147ff1e230cSjilinxpd 		if (error != 0)
31484bff34e3Sthurlow 			goto out;
314902d09e03SGordon Ross 
315091d632c8Sgwr 		/*
315191d632c8Sgwr 		 * OK, removed the target file.  Continue as if
315291d632c8Sgwr 		 * lookup target had failed (nvp == NULL).
315391d632c8Sgwr 		 */
315491d632c8Sgwr 		vn_vfsunlock(nvp);
315591d632c8Sgwr 		nvp_locked = 0;
315691d632c8Sgwr 		VN_RELE(nvp);
315791d632c8Sgwr 		nvp = NULL;
31584bff34e3Sthurlow 	} /* nvp */
31594bff34e3Sthurlow 
3160adee6784SGordon Ross 	/*
3161adee6784SGordon Ross 	 * Get a file handle with delete access.
3162adee6784SGordon Ross 	 * Close this FID before return.
3163adee6784SGordon Ross 	 */
3164adee6784SGordon Ross 	error = smbfs_smb_tmpopen(onp, STD_RIGHT_DELETE_ACCESS,
3165adee6784SGordon Ross 	    scred, &fid);
3166adee6784SGordon Ross 	if (error) {
3167adee6784SGordon Ross 		SMBVDEBUG("error %d opening %s\n",
3168adee6784SGordon Ross 		    error, onp->n_rpath);
3169adee6784SGordon Ross 		goto out;
3170adee6784SGordon Ross 	}
3171adee6784SGordon Ross 
317202d09e03SGordon Ross 	smbfs_attrcache_remove(onp);
3173adee6784SGordon Ross 	error = smbfs_smb_rename(odnp, onp, ndnp, nnm, strlen(nnm),
3174adee6784SGordon Ross 	    fid, scred);
3175adee6784SGordon Ross 
3176adee6784SGordon Ross 	smbfs_smb_tmpclose(onp, fid);
31774bff34e3Sthurlow 
317802d09e03SGordon Ross 	/*
317902d09e03SGordon Ross 	 * If the old name should no longer exist,
318002d09e03SGordon Ross 	 * discard any cached attributes under it.
318102d09e03SGordon Ross 	 */
31825f4fc069Sjilinxpd 	if (error == 0) {
318302d09e03SGordon Ross 		smbfs_attrcache_prune(onp);
31845f4fc069Sjilinxpd 		/* SMBFS_VNEVENT... */
31855f4fc069Sjilinxpd 	}
31864bff34e3Sthurlow 
31874bff34e3Sthurlow out:
31884bff34e3Sthurlow 	if (nvp) {
31894bff34e3Sthurlow 		if (nvp_locked)
31904bff34e3Sthurlow 			vn_vfsunlock(nvp);
31914bff34e3Sthurlow 		VN_RELE(nvp);
31924bff34e3Sthurlow 	}
31934bff34e3Sthurlow 
31944bff34e3Sthurlow 	return (error);
31954bff34e3Sthurlow }
31964bff34e3Sthurlow 
31974bff34e3Sthurlow /*
31984bff34e3Sthurlow  * XXX
31994bff34e3Sthurlow  * vsecattr_t is new to build 77, and we need to eventually support
32004bff34e3Sthurlow  * it in order to create an ACL when an object is created.
32014bff34e3Sthurlow  *
32024bff34e3Sthurlow  * This op should support the new FIGNORECASE flag for case-insensitive
32034bff34e3Sthurlow  * lookups, per PSARC 2007/244.
32044bff34e3Sthurlow  */
32054bff34e3Sthurlow /* ARGSUSED */
32064bff34e3Sthurlow static int
32074bff34e3Sthurlow smbfs_mkdir(vnode_t *dvp, char *nm, struct vattr *va, vnode_t **vpp,
32084bff34e3Sthurlow 	cred_t *cr, caller_context_t *ct, int flags, vsecattr_t *vsecp)
32094bff34e3Sthurlow {
32104bff34e3Sthurlow 	vnode_t		*vp;
32114bff34e3Sthurlow 	struct smbnode	*dnp = VTOSMB(dvp);
32124bff34e3Sthurlow 	struct smbmntinfo *smi = VTOSMI(dvp);
32134bff34e3Sthurlow 	struct smb_cred	scred;
32144bff34e3Sthurlow 	struct smbfattr	fattr;
32154bff34e3Sthurlow 	const char		*name = (const char *) nm;
32164bff34e3Sthurlow 	int		nmlen = strlen(name);
3217adee6784SGordon Ross 	int		error;
32184bff34e3Sthurlow 
3219a19609f8Sjv 	if (curproc->p_zone != smi->smi_zone_ref.zref_zone)
32204bff34e3Sthurlow 		return (EPERM);
32214bff34e3Sthurlow 
32224bff34e3Sthurlow 	if (smi->smi_flags & SMI_DEAD || dvp->v_vfsp->vfs_flag & VFS_UNMOUNTED)
32234bff34e3Sthurlow 		return (EIO);
32244bff34e3Sthurlow 
32254bff34e3Sthurlow 	if ((nmlen == 1 && name[0] == '.') ||
32264bff34e3Sthurlow 	    (nmlen == 2 && name[0] == '.' && name[1] == '.'))
32274bff34e3Sthurlow 		return (EEXIST);
32284bff34e3Sthurlow 
322991d632c8Sgwr 	/* Only plain files are allowed in V_XATTRDIR. */
323091d632c8Sgwr 	if (dvp->v_flag & V_XATTRDIR)
323191d632c8Sgwr 		return (EINVAL);
323291d632c8Sgwr 
32334bff34e3Sthurlow 	if (smbfs_rw_enter_sig(&dnp->r_rwlock, RW_WRITER, SMBINTR(dvp)))
32344bff34e3Sthurlow 		return (EINTR);
3235613a2f6bSGordon Ross 	smb_credinit(&scred, cr);
32364bff34e3Sthurlow 
32374bff34e3Sthurlow 	/*
32384bff34e3Sthurlow 	 * Require write access in the containing directory.
32394bff34e3Sthurlow 	 */
32404bff34e3Sthurlow 	error = smbfs_access(dvp, VWRITE, 0, cr, ct);
32414bff34e3Sthurlow 	if (error)
32424bff34e3Sthurlow 		goto out;
32434bff34e3Sthurlow 
32444bff34e3Sthurlow 	error = smbfs_smb_mkdir(dnp, name, nmlen, &scred);
32454bff34e3Sthurlow 	if (error)
32464bff34e3Sthurlow 		goto out;
32474bff34e3Sthurlow 
32484bff34e3Sthurlow 	error = smbfs_smb_lookup(dnp, &name, &nmlen, &fattr, &scred);
32494bff34e3Sthurlow 	if (error)
32504bff34e3Sthurlow 		goto out;
32514bff34e3Sthurlow 
32524bff34e3Sthurlow 	smbfs_attr_touchdir(dnp);
32534bff34e3Sthurlow 
32544bff34e3Sthurlow 	error = smbfs_nget(dvp, name, nmlen, &fattr, &vp);
32554bff34e3Sthurlow 	if (error)
32564bff34e3Sthurlow 		goto out;
32574bff34e3Sthurlow 
32584bff34e3Sthurlow 	/* Success! */
32594bff34e3Sthurlow 	*vpp = vp;
32604bff34e3Sthurlow 	error = 0;
32614bff34e3Sthurlow out:
32624bff34e3Sthurlow 	smb_credrele(&scred);
32634bff34e3Sthurlow 	smbfs_rw_exit(&dnp->r_rwlock);
32644bff34e3Sthurlow 
32654bff34e3Sthurlow 	if (name != nm)
32664bff34e3Sthurlow 		smbfs_name_free(name, nmlen);
32674bff34e3Sthurlow 
32684bff34e3Sthurlow 	return (error);
32694bff34e3Sthurlow }
32704bff34e3Sthurlow 
32714bff34e3Sthurlow /*
32724bff34e3Sthurlow  * XXX
32734bff34e3Sthurlow  * This op should support the new FIGNORECASE flag for case-insensitive
32744bff34e3Sthurlow  * lookups, per PSARC 2007/244.
32754bff34e3Sthurlow  */
32764bff34e3Sthurlow /* ARGSUSED */
32774bff34e3Sthurlow static int
32784bff34e3Sthurlow smbfs_rmdir(vnode_t *dvp, char *nm, vnode_t *cdir, cred_t *cr,
32794bff34e3Sthurlow 	caller_context_t *ct, int flags)
32804bff34e3Sthurlow {
3281adee6784SGordon Ross 	struct smb_cred	scred;
32824bff34e3Sthurlow 	vnode_t		*vp = NULL;
32834bff34e3Sthurlow 	int		vp_locked = 0;
32844bff34e3Sthurlow 	struct smbmntinfo *smi = VTOSMI(dvp);
32854bff34e3Sthurlow 	struct smbnode	*dnp = VTOSMB(dvp);
32864bff34e3Sthurlow 	struct smbnode	*np;
32874bff34e3Sthurlow 	int		error;
32884bff34e3Sthurlow 
3289a19609f8Sjv 	if (curproc->p_zone != smi->smi_zone_ref.zref_zone)
32904bff34e3Sthurlow 		return (EPERM);
32914bff34e3Sthurlow 
32924bff34e3Sthurlow 	if (smi->smi_flags & SMI_DEAD || dvp->v_vfsp->vfs_flag & VFS_UNMOUNTED)
32934bff34e3Sthurlow 		return (EIO);
32944bff34e3Sthurlow 
32954bff34e3Sthurlow 	/*
3296adee6784SGordon Ross 	 * Verify access to the directory.
32974bff34e3Sthurlow 	 */
3298adee6784SGordon Ross 	error = smbfs_access(dvp, VWRITE|VEXEC, 0, cr, ct);
32994bff34e3Sthurlow 	if (error)
3300adee6784SGordon Ross 		return (error);
3301adee6784SGordon Ross 
3302adee6784SGordon Ross 	if (smbfs_rw_enter_sig(&dnp->r_rwlock, RW_WRITER, SMBINTR(dvp)))
3303adee6784SGordon Ross 		return (EINTR);
3304adee6784SGordon Ross 	smb_credinit(&scred, cr);
33054bff34e3Sthurlow 
33064bff34e3Sthurlow 	/*
33074bff34e3Sthurlow 	 * First lookup the entry to be removed.
33084bff34e3Sthurlow 	 */
33094bff34e3Sthurlow 	error = smbfslookup(dvp, nm, &vp, cr, 0, ct);
33104bff34e3Sthurlow 	if (error)
33114bff34e3Sthurlow 		goto out;
33124bff34e3Sthurlow 	np = VTOSMB(vp);
33134bff34e3Sthurlow 
33144bff34e3Sthurlow 	/*
33154bff34e3Sthurlow 	 * Disallow rmdir of "." or current dir, or the FS root.
33164bff34e3Sthurlow 	 * Also make sure it's a directory, not a mount point,
33174bff34e3Sthurlow 	 * and lock to keep mount/umount away until we're done.
33184bff34e3Sthurlow 	 */
33194bff34e3Sthurlow 	if ((vp == dvp) || (vp == cdir) || (vp->v_flag & VROOT)) {
33204bff34e3Sthurlow 		error = EINVAL;
33214bff34e3Sthurlow 		goto out;
33224bff34e3Sthurlow 	}
33234bff34e3Sthurlow 	if (vp->v_type != VDIR) {
33244bff34e3Sthurlow 		error = ENOTDIR;
33254bff34e3Sthurlow 		goto out;
33264bff34e3Sthurlow 	}
33274bff34e3Sthurlow 	if (vn_vfsrlock(vp)) {
33284bff34e3Sthurlow 		error = EBUSY;
33294bff34e3Sthurlow 		goto out;
33304bff34e3Sthurlow 	}
33314bff34e3Sthurlow 	vp_locked = 1;
33324bff34e3Sthurlow 	if (vn_mountedvfs(vp) != NULL) {
33334bff34e3Sthurlow 		error = EBUSY;
33344bff34e3Sthurlow 		goto out;
33354bff34e3Sthurlow 	}
33364bff34e3Sthurlow 
333791d632c8Sgwr 	/*
3338adee6784SGordon Ross 	 * Do the real rmdir work
333991d632c8Sgwr 	 */
3340adee6784SGordon Ross 	error = smbfsremove(dvp, vp, &scred, flags);
33414bff34e3Sthurlow 	if (error)
33424bff34e3Sthurlow 		goto out;
33434bff34e3Sthurlow 
3344adee6784SGordon Ross #ifdef	SMBFS_VNEVENT
3345adee6784SGordon Ross 	vnevent_rmdir(vp, dvp, nm, ct);
3346adee6784SGordon Ross #endif
3347adee6784SGordon Ross 
33484bff34e3Sthurlow 	mutex_enter(&dnp->r_statelock);
33494bff34e3Sthurlow 	dnp->n_flag |= NMODIFIED;
33504bff34e3Sthurlow 	mutex_exit(&dnp->r_statelock);
33514bff34e3Sthurlow 	smbfs_attr_touchdir(dnp);
335202d09e03SGordon Ross 	smbfs_rmhash(np);
33534bff34e3Sthurlow 
33544bff34e3Sthurlow out:
33554bff34e3Sthurlow 	if (vp) {
33564bff34e3Sthurlow 		if (vp_locked)
33574bff34e3Sthurlow 			vn_vfsunlock(vp);
33584bff34e3Sthurlow 		VN_RELE(vp);
33594bff34e3Sthurlow 	}
33604bff34e3Sthurlow 	smb_credrele(&scred);
33614bff34e3Sthurlow 	smbfs_rw_exit(&dnp->r_rwlock);
33624bff34e3Sthurlow 
33634bff34e3Sthurlow 	return (error);
33644bff34e3Sthurlow }
33654bff34e3Sthurlow 
33664bff34e3Sthurlow 
33675f4fc069Sjilinxpd /* ARGSUSED */
33685f4fc069Sjilinxpd static int
33695f4fc069Sjilinxpd smbfs_symlink(vnode_t *dvp, char *lnm, struct vattr *tva, char *tnm, cred_t *cr,
33705f4fc069Sjilinxpd 	caller_context_t *ct, int flags)
33715f4fc069Sjilinxpd {
33725f4fc069Sjilinxpd 	/* Not yet... */
33735f4fc069Sjilinxpd 	return (ENOSYS);
33745f4fc069Sjilinxpd }
33755f4fc069Sjilinxpd 
33765f4fc069Sjilinxpd 
33774bff34e3Sthurlow /* ARGSUSED */
33784bff34e3Sthurlow static int
33794bff34e3Sthurlow smbfs_readdir(vnode_t *vp, struct uio *uiop, cred_t *cr, int *eofp,
33804bff34e3Sthurlow 	caller_context_t *ct, int flags)
33814bff34e3Sthurlow {
33824bff34e3Sthurlow 	struct smbnode	*np = VTOSMB(vp);
33834bff34e3Sthurlow 	int		error = 0;
33844bff34e3Sthurlow 	smbmntinfo_t	*smi;
33854bff34e3Sthurlow 
33864bff34e3Sthurlow 	smi = VTOSMI(vp);
33874bff34e3Sthurlow 
3388a19609f8Sjv 	if (curproc->p_zone != smi->smi_zone_ref.zref_zone)
33894bff34e3Sthurlow 		return (EIO);
33904bff34e3Sthurlow 
33914bff34e3Sthurlow 	if (smi->smi_flags & SMI_DEAD || vp->v_vfsp->vfs_flag & VFS_UNMOUNTED)
33924bff34e3Sthurlow 		return (EIO);
33934bff34e3Sthurlow 
33944bff34e3Sthurlow 	/*
33954bff34e3Sthurlow 	 * Require read access in the directory.
33964bff34e3Sthurlow 	 */
33974bff34e3Sthurlow 	error = smbfs_access(vp, VREAD, 0, cr, ct);
33984bff34e3Sthurlow 	if (error)
33994bff34e3Sthurlow 		return (error);
34004bff34e3Sthurlow 
34014bff34e3Sthurlow 	ASSERT(smbfs_rw_lock_held(&np->r_rwlock, RW_READER));
34024bff34e3Sthurlow 
34034bff34e3Sthurlow 	/*
34045f4fc069Sjilinxpd 	 * Todo: readdir cache here
34054bff34e3Sthurlow 	 *
34064bff34e3Sthurlow 	 * I am serializing the entire readdir operation
34074bff34e3Sthurlow 	 * now since we have not yet implemented readdir
34084bff34e3Sthurlow 	 * cache. This fix needs to be revisited once
34094bff34e3Sthurlow 	 * we implement readdir cache.
34104bff34e3Sthurlow 	 */
34114bff34e3Sthurlow 	if (smbfs_rw_enter_sig(&np->r_lkserlock, RW_WRITER, SMBINTR(vp)))
34124bff34e3Sthurlow 		return (EINTR);
34134bff34e3Sthurlow 
34144bff34e3Sthurlow 	error = smbfs_readvdir(vp, uiop, cr, eofp, ct);
34154bff34e3Sthurlow 
34164bff34e3Sthurlow 	smbfs_rw_exit(&np->r_lkserlock);
34174bff34e3Sthurlow 
34184bff34e3Sthurlow 	return (error);
34194bff34e3Sthurlow }
34204bff34e3Sthurlow 
34214bff34e3Sthurlow /* ARGSUSED */
34224bff34e3Sthurlow static int
34234bff34e3Sthurlow smbfs_readvdir(vnode_t *vp, uio_t *uio, cred_t *cr, int *eofp,
34244bff34e3Sthurlow 	caller_context_t *ct)
34254bff34e3Sthurlow {
34265ecede33SGordon Ross 	/*
34275ecede33SGordon Ross 	 * Note: "limit" tells the SMB-level FindFirst/FindNext
34285ecede33SGordon Ross 	 * functions how many directory entries to request in
34295ecede33SGordon Ross 	 * each OtW call.  It needs to be large enough so that
34305ecede33SGordon Ross 	 * we don't make lots of tiny OtW requests, but there's
34315ecede33SGordon Ross 	 * no point making it larger than the maximum number of
34325ecede33SGordon Ross 	 * OtW entries that would fit in a maximum sized trans2
34335ecede33SGordon Ross 	 * response (64k / 48, about 1365).  Beyond that, it's just tuning.
34345ecede33SGordon Ross 	 * WinNT used 512, Win2k used 1366.  We use 1000.
34355ecede33SGordon Ross 	 */
34365ecede33SGordon Ross 	static const int limit = 1000;
34375ecede33SGordon Ross 	/* Largest possible dirent size. */
34385ecede33SGordon Ross 	static const size_t dbufsiz = DIRENT64_RECLEN(SMB_MAXFNAMELEN);
34394bff34e3Sthurlow 	struct smb_cred scred;
34404bff34e3Sthurlow 	vnode_t		*newvp;
34414bff34e3Sthurlow 	struct smbnode	*np = VTOSMB(vp);
34424bff34e3Sthurlow 	struct smbfs_fctx *ctx;
34435ecede33SGordon Ross 	struct dirent64 *dp;
34445ecede33SGordon Ross 	ssize_t		save_resid;
34455ecede33SGordon Ross 	offset_t	save_offset; /* 64 bits */
34465ecede33SGordon Ross 	int		offset; /* yes, 32 bits */
34475ecede33SGordon Ross 	int		nmlen, error;
34485ecede33SGordon Ross 	ushort_t	reclen;
34494bff34e3Sthurlow 
3450a19609f8Sjv 	ASSERT(curproc->p_zone == VTOSMI(vp)->smi_zone_ref.zref_zone);
34514bff34e3Sthurlow 
34524bff34e3Sthurlow 	/* Make sure we serialize for n_dirseq use. */
34534bff34e3Sthurlow 	ASSERT(smbfs_rw_lock_held(&np->r_lkserlock, RW_WRITER));
34544bff34e3Sthurlow 
34555ecede33SGordon Ross 	/*
34565ecede33SGordon Ross 	 * Make sure smbfs_open filled in n_dirseq
34575ecede33SGordon Ross 	 */
34585ecede33SGordon Ross 	if (np->n_dirseq == NULL)
34595ecede33SGordon Ross 		return (EBADF);
34605ecede33SGordon Ross 
34615ecede33SGordon Ross 	/* Check for overflow of (32-bit) directory offset. */
34625ecede33SGordon Ross 	if (uio->uio_loffset < 0 || uio->uio_loffset > INT32_MAX ||
34635ecede33SGordon Ross 	    (uio->uio_loffset + uio->uio_resid) > INT32_MAX)
34645ecede33SGordon Ross 		return (EINVAL);
34655ecede33SGordon Ross 
34665ecede33SGordon Ross 	/* Require space for at least one dirent. */
34675ecede33SGordon Ross 	if (uio->uio_resid < dbufsiz)
34684bff34e3Sthurlow 		return (EINVAL);
34694bff34e3Sthurlow 
34704bff34e3Sthurlow 	SMBVDEBUG("dirname='%s'\n", np->n_rpath);
3471613a2f6bSGordon Ross 	smb_credinit(&scred, cr);
34724bff34e3Sthurlow 	dp = kmem_alloc(dbufsiz, KM_SLEEP);
34734bff34e3Sthurlow 
34745ecede33SGordon Ross 	save_resid = uio->uio_resid;
34755ecede33SGordon Ross 	save_offset = uio->uio_loffset;
34765ecede33SGordon Ross 	offset = uio->uio_offset;
34775ecede33SGordon Ross 	SMBVDEBUG("in: offset=%d, resid=%d\n",
34785ecede33SGordon Ross 	    (int)uio->uio_offset, (int)uio->uio_resid);
34795ecede33SGordon Ross 	error = 0;
34804bff34e3Sthurlow 
34814bff34e3Sthurlow 	/*
34824bff34e3Sthurlow 	 * Generate the "." and ".." entries here so we can
34834bff34e3Sthurlow 	 * (1) make sure they appear (but only once), and
34844bff34e3Sthurlow 	 * (2) deal with getting their I numbers which the
34854bff34e3Sthurlow 	 * findnext below does only for normal names.
34864bff34e3Sthurlow 	 */
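	/* FIRST_DIROFS is 2: the first offset past "." and ".." */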
34875ecede33SGordon Ross 	while (offset < FIRST_DIROFS) {
34885ecede33SGordon Ross 		/*
34895ecede33SGordon Ross 		 * Tricky bit filling in the first two:
34905ecede33SGordon Ross 		 * offset 0 is ".", offset 1 is ".."
34915ecede33SGordon Ross 		 * so strlen of these is offset+1.
34925ecede33SGordon Ross 		 */
34934bff34e3Sthurlow 		reclen = DIRENT64_RECLEN(offset + 1);
34945ecede33SGordon Ross 		if (uio->uio_resid < reclen)
34955ecede33SGordon Ross 			goto out;
34964bff34e3Sthurlow 		bzero(dp, reclen);
34974bff34e3Sthurlow 		dp->d_reclen = reclen;
34984bff34e3Sthurlow 		dp->d_name[0] = '.';
34994bff34e3Sthurlow 		dp->d_name[1] = '.';
35004bff34e3Sthurlow 		dp->d_name[offset + 1] = '\0';
35014bff34e3Sthurlow 		/*
35024bff34e3Sthurlow 		 * Want the real I-numbers for the "." and ".."
35034bff34e3Sthurlow 		 * entries.  For these two names, we know that
35045ecede33SGordon Ross 		 * smbfslookup can get the nodes efficiently.
35054bff34e3Sthurlow 		 */
35064bff34e3Sthurlow 		error = smbfslookup(vp, dp->d_name, &newvp, cr, 1, ct);
35074bff34e3Sthurlow 		if (error) {
35084bff34e3Sthurlow 			dp->d_ino = np->n_ino + offset; /* fiction */
35094bff34e3Sthurlow 		} else {
35104bff34e3Sthurlow 			dp->d_ino = VTOSMB(newvp)->n_ino;
35114bff34e3Sthurlow 			VN_RELE(newvp);
35124bff34e3Sthurlow 		}
35135ecede33SGordon Ross 		/*
35145ecede33SGordon Ross 		 * Note: d_off is the offset that a user-level program
35155ecede33SGordon Ross 		 * should seek to for reading the NEXT directory entry.
35165ecede33SGordon Ross 		 * See libc: readdir, telldir, seekdir
35175ecede33SGordon Ross 		 */
35185ecede33SGordon Ross 		dp->d_off = offset + 1;
35195ecede33SGordon Ross 		error = uiomove(dp, reclen, UIO_READ, uio);
35204bff34e3Sthurlow 		if (error)
35214bff34e3Sthurlow 			goto out;
35225ecede33SGordon Ross 		/*
35235ecede33SGordon Ross 		 * Note: uiomove updates uio->uio_offset,
35245ecede33SGordon Ross 		 * but we want it to be our "cookie" value,
35255ecede33SGordon Ross 		 * which just counts dirents ignoring size.
35265ecede33SGordon Ross 		 */
35274bff34e3Sthurlow 		uio->uio_offset = ++offset;
35284bff34e3Sthurlow 	}
35295ecede33SGordon Ross 
35305ecede33SGordon Ross 	/*
35315ecede33SGordon Ross 	 * If there was a backward seek, we have to reopen.
35325ecede33SGordon Ross 	 */
35335ecede33SGordon Ross 	if (offset < np->n_dirofs) {
35345ecede33SGordon Ross 		SMBVDEBUG("Reopening search %d:%d\n",
35355ecede33SGordon Ross 		    offset, np->n_dirofs);
35364bff34e3Sthurlow 		error = smbfs_smb_findopen(np, "*", 1,
35374bff34e3Sthurlow 		    SMB_FA_SYSTEM | SMB_FA_HIDDEN | SMB_FA_DIR,
35384bff34e3Sthurlow 		    &scred, &ctx);
35394bff34e3Sthurlow 		if (error) {
35404bff34e3Sthurlow 			SMBVDEBUG("cannot open search, error = %d\n", error);
35414bff34e3Sthurlow 			goto out;
35424bff34e3Sthurlow 		}
35435ecede33SGordon Ross 		/* free the old one */
35445ecede33SGordon Ross 		(void) smbfs_smb_findclose(np->n_dirseq, &scred);
35455ecede33SGordon Ross 		/* save the new one */
35464bff34e3Sthurlow 		np->n_dirseq = ctx;
35475ecede33SGordon Ross 		np->n_dirofs = FIRST_DIROFS;
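		/* The new search is positioned at the first real entry. */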
35485ecede33SGordon Ross 	} else {
35494bff34e3Sthurlow 		ctx = np->n_dirseq;
35505ecede33SGordon Ross 	}
35515ecede33SGordon Ross 
35525ecede33SGordon Ross 	/*
35535ecede33SGordon Ross 	 * Skip entries before the requested offset.
35545ecede33SGordon Ross 	 */
35554bff34e3Sthurlow 	while (np->n_dirofs < offset) {
35565ecede33SGordon Ross 		error = smbfs_smb_findnext(ctx, limit, &scred);
35575ecede33SGordon Ross 		if (error != 0)
35584bff34e3Sthurlow 			goto out;
35595ecede33SGordon Ross 		np->n_dirofs++;
35604bff34e3Sthurlow 	}
35615ecede33SGordon Ross 
35625ecede33SGordon Ross 	/*
35635ecede33SGordon Ross 	 * While there's room in the caller's buffer:
35645ecede33SGordon Ross 	 *	get a directory entry from SMB,
35655ecede33SGordon Ross 	 *	convert to a dirent, copyout.
35665ecede33SGordon Ross 	 * We stop when there is no longer room for a
35675ecede33SGordon Ross 	 * maximum sized dirent because we must decide
35685ecede33SGordon Ross 	 * before we know anything about the next entry.
35695ecede33SGordon Ross 	 */
35705ecede33SGordon Ross 	while (uio->uio_resid >= dbufsiz) {
35714bff34e3Sthurlow 		error = smbfs_smb_findnext(ctx, limit, &scred);
35725ecede33SGordon Ross 		if (error != 0)
35735ecede33SGordon Ross 			goto out;
35744bff34e3Sthurlow 		np->n_dirofs++;
35755ecede33SGordon Ross 
35764bff34e3Sthurlow 		/* Sanity check the name length. */
35774bff34e3Sthurlow 		nmlen = ctx->f_nmlen;
3578613a2f6bSGordon Ross 		if (nmlen > SMB_MAXFNAMELEN) {
3579613a2f6bSGordon Ross 			nmlen = SMB_MAXFNAMELEN;
35804bff34e3Sthurlow 			SMBVDEBUG("Truncating name: %s\n", ctx->f_name);
35814bff34e3Sthurlow 		}
35824bff34e3Sthurlow 		if (smbfs_fastlookup) {
358302d09e03SGordon Ross 			/* See comment at smbfs_fastlookup above. */
35845ecede33SGordon Ross 			if (smbfs_nget(vp, ctx->f_name, nmlen,
35855ecede33SGordon Ross 			    &ctx->f_attr, &newvp) == 0)
35864bff34e3Sthurlow 				VN_RELE(newvp);
35874bff34e3Sthurlow 		}
35885ecede33SGordon Ross 
35895ecede33SGordon Ross 		reclen = DIRENT64_RECLEN(nmlen);
35905ecede33SGordon Ross 		bzero(dp, reclen);
35915ecede33SGordon Ross 		dp->d_reclen = reclen;
35925ecede33SGordon Ross 		bcopy(ctx->f_name, dp->d_name, nmlen);
35935ecede33SGordon Ross 		dp->d_name[nmlen] = '\0';
359402d09e03SGordon Ross 		dp->d_ino = ctx->f_inum;
35955ecede33SGordon Ross 		dp->d_off = offset + 1;	/* See d_off comment above */
35965ecede33SGordon Ross 		error = uiomove(dp, reclen, UIO_READ, uio);
35974bff34e3Sthurlow 		if (error)
35985ecede33SGordon Ross 			goto out;
35995ecede33SGordon Ross 		/* See comment re. uio_offset above. */
36004bff34e3Sthurlow 		uio->uio_offset = ++offset;
36014bff34e3Sthurlow 	}
36025ecede33SGordon Ross 
36034bff34e3Sthurlow out:
36045ecede33SGordon Ross 	/*
36055ecede33SGordon Ross 	 * When we come to the end of a directory, the
36065ecede33SGordon Ross 	 * SMB-level functions return ENOENT, but the
36075ecede33SGordon Ross 	 * caller is not expecting an error return.
36085ecede33SGordon Ross 	 *
36095ecede33SGordon Ross 	 * Also note that we must delay the call to
36105ecede33SGordon Ross 	 * smbfs_smb_findclose(np->n_dirseq, ...)
36115ecede33SGordon Ross 	 * until smbfs_close so that all reads at the
36125ecede33SGordon Ross 	 * end of the directory will return no data.
36135ecede33SGordon Ross 	 */
36145ecede33SGordon Ross 	if (error == ENOENT) {
36155ecede33SGordon Ross 		error = 0;
36165ecede33SGordon Ross 		if (eofp)
36175ecede33SGordon Ross 			*eofp = 1;
36185ecede33SGordon Ross 	}
36195ecede33SGordon Ross 	/*
36205ecede33SGordon Ross 	 * If we encountered an error (e.g. "access denied")
36215ecede33SGordon Ross 	 * from the FindFirst call, we will have copied out
36225ecede33SGordon Ross 	 * the "." and ".." entries leaving offset == 2.
36235ecede33SGordon Ross 	 * In that case, restore the original offset/resid
36245ecede33SGordon Ross 	 * so the caller gets no data with the error.
36255ecede33SGordon Ross 	 */
36265ecede33SGordon Ross 	if (error != 0 && offset == FIRST_DIROFS) {
36275ecede33SGordon Ross 		uio->uio_loffset = save_offset;
36285ecede33SGordon Ross 		uio->uio_resid = save_resid;
36295ecede33SGordon Ross 	}
36305ecede33SGordon Ross 	SMBVDEBUG("out: offset=%d, resid=%d\n",
36315ecede33SGordon Ross 	    (int)uio->uio_offset, (int)uio->uio_resid);
36325ecede33SGordon Ross 
36334bff34e3Sthurlow 	kmem_free(dp, dbufsiz);
36344bff34e3Sthurlow 	smb_credrele(&scred);
36354bff34e3Sthurlow 	return (error);
36364bff34e3Sthurlow }
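
/*
 * Sketch of one dirent64 as filled in by the copyout loop above,
 * with assumed example values (real values come from the SMB find
 * context):
 *
 *	d_ino    = ctx->f_inum			(inode number from SMB)
 *	d_name   = "foo.txt"			(NUL-terminated)
 *	d_reclen = DIRENT64_RECLEN(nmlen)	(nmlen <= SMB_MAXFNAMELEN)
 *	d_off    = offset + 1			(cookie of the next entry)
 */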
36374bff34e3Sthurlow 
36385f4fc069Sjilinxpd /*
36395f4fc069Sjilinxpd  * Here NFS has: nfs3_bio
36405f4fc069Sjilinxpd  * See smbfs_bio above.
36415f4fc069Sjilinxpd  */
36425f4fc069Sjilinxpd 
36435f4fc069Sjilinxpd /* ARGSUSED */
36445f4fc069Sjilinxpd static int
36455f4fc069Sjilinxpd smbfs_fid(vnode_t *vp, fid_t *fidp, caller_context_t *ct)
36465f4fc069Sjilinxpd {
36475f4fc069Sjilinxpd 	return (ENOSYS);
36485f4fc069Sjilinxpd }
36495f4fc069Sjilinxpd 
36504bff34e3Sthurlow 
36514bff34e3Sthurlow /*
36524bff34e3Sthurlow  * The pair of functions VOP_RWLOCK, VOP_RWUNLOCK
36534bff34e3Sthurlow  * are optional functions that are called by:
36544bff34e3Sthurlow  *    getdents, before/after VOP_READDIR
36554bff34e3Sthurlow  *    pread, before/after ... VOP_READ
36564bff34e3Sthurlow  *    pwrite, before/after ... VOP_WRITE
36574bff34e3Sthurlow  *    (other places)
36584bff34e3Sthurlow  *
36594bff34e3Sthurlow  * Careful here: None of the above check for any
36604bff34e3Sthurlow  * error returns from VOP_RWLOCK / VOP_RWUNLOCK!
36614bff34e3Sthurlow  * In fact, the return value from _rwlock is NOT
36624bff34e3Sthurlow  * an error code, but V_WRITELOCK_TRUE / _FALSE.
36634bff34e3Sthurlow  *
36644bff34e3Sthurlow  * Therefore, it's up to _this_ code to make sure
36654bff34e3Sthurlow  * the lock state remains balanced, which means
36664bff34e3Sthurlow  * we can't "bail out" on interrupts, etc.
36674bff34e3Sthurlow  */
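
/*
 * A minimal sketch of the caller pattern described above, e.g. in
 * the pread path (simplified; details omitted):
 *
 *	(void) VOP_RWLOCK(vp, V_WRITELOCK_FALSE, NULL);
 *	error = VOP_READ(vp, &auio, ioflag, cr, NULL);
 *	VOP_RWUNLOCK(vp, V_WRITELOCK_FALSE, NULL);
 *
 * Callers ignore the VOP_RWLOCK return value, which is why the
 * lock state must stay balanced in the functions below.
 */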
36684bff34e3Sthurlow 
36694bff34e3Sthurlow /* ARGSUSED2 */
36704bff34e3Sthurlow static int
36714bff34e3Sthurlow smbfs_rwlock(vnode_t *vp, int write_lock, caller_context_t *ctp)
36724bff34e3Sthurlow {
36734bff34e3Sthurlow 	smbnode_t	*np = VTOSMB(vp);
36744bff34e3Sthurlow 
36754bff34e3Sthurlow 	if (!write_lock) {
36764bff34e3Sthurlow 		(void) smbfs_rw_enter_sig(&np->r_rwlock, RW_READER, FALSE);
36774bff34e3Sthurlow 		return (V_WRITELOCK_FALSE);
36784bff34e3Sthurlow 	}
36794bff34e3Sthurlow 
36814bff34e3Sthurlow 	(void) smbfs_rw_enter_sig(&np->r_rwlock, RW_WRITER, FALSE);
36824bff34e3Sthurlow 	return (V_WRITELOCK_TRUE);
36834bff34e3Sthurlow }
36844bff34e3Sthurlow 
36854bff34e3Sthurlow /* ARGSUSED */
36864bff34e3Sthurlow static void
36874bff34e3Sthurlow smbfs_rwunlock(vnode_t *vp, int write_lock, caller_context_t *ctp)
36884bff34e3Sthurlow {
36894bff34e3Sthurlow 	smbnode_t	*np = VTOSMB(vp);
36904bff34e3Sthurlow 
36914bff34e3Sthurlow 	smbfs_rw_exit(&np->r_rwlock);
36924bff34e3Sthurlow }
36934bff34e3Sthurlow 
36944bff34e3Sthurlow 
36954bff34e3Sthurlow /* ARGSUSED */
36964bff34e3Sthurlow static int
36974bff34e3Sthurlow smbfs_seek(vnode_t *vp, offset_t ooff, offset_t *noffp, caller_context_t *ct)
36984bff34e3Sthurlow {
36994bff34e3Sthurlow 	smbmntinfo_t	*smi;
37004bff34e3Sthurlow 
37014bff34e3Sthurlow 	smi = VTOSMI(vp);
37024bff34e3Sthurlow 
3703a19609f8Sjv 	if (curproc->p_zone != smi->smi_zone_ref.zref_zone)
37044bff34e3Sthurlow 		return (EPERM);
37054bff34e3Sthurlow 
37064bff34e3Sthurlow 	if (smi->smi_flags & SMI_DEAD || vp->v_vfsp->vfs_flag & VFS_UNMOUNTED)
37074bff34e3Sthurlow 		return (EIO);
37084bff34e3Sthurlow 
37094bff34e3Sthurlow 	/*
37104bff34e3Sthurlow 	 * Because we stuff the readdir cookie into the offset field
37114bff34e3Sthurlow 	 * someone may attempt to do an lseek with the cookie which
37124bff34e3Sthurlow 	 * we want to succeed.
37134bff34e3Sthurlow 	 */
37144bff34e3Sthurlow 	if (vp->v_type == VDIR)
37154bff34e3Sthurlow 		return (0);
37164bff34e3Sthurlow 
37174bff34e3Sthurlow 	/* Like NFS3, just check for 63-bit overflow. */
37184bff34e3Sthurlow 	if (*noffp < 0)
37194bff34e3Sthurlow 		return (EINVAL);
37204bff34e3Sthurlow 
37214bff34e3Sthurlow 	return (0);
37224bff34e3Sthurlow }
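
/*
 * Example of the directory lseek case above (a userland sketch):
 * a caller may save a readdir cookie and seek back to it later,
 * e.g. via telldir(3C)/seekdir(3C):
 *
 *	long pos = telldir(dirp);	// a d_off cookie from readdir
 *	...
 *	seekdir(dirp, pos);		// reaches smbfs_seek(); succeeds
 */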
37234bff34e3Sthurlow 
37245f4fc069Sjilinxpd /* mmap support ******************************************************** */
37255f4fc069Sjilinxpd 
37268329232eSGordon Ross #ifdef	_KERNEL
37278329232eSGordon Ross 
37285f4fc069Sjilinxpd #ifdef DEBUG
37295f4fc069Sjilinxpd static int smbfs_lostpage = 0;	/* number of times we lost original page */
37305f4fc069Sjilinxpd #endif
37315f4fc069Sjilinxpd 
37325f4fc069Sjilinxpd /*
37335f4fc069Sjilinxpd  * Return all the pages from [off..off+len) in file
37345f4fc069Sjilinxpd  * Like nfs3_getpage
37355f4fc069Sjilinxpd  */
37365f4fc069Sjilinxpd /* ARGSUSED */
37375f4fc069Sjilinxpd static int
37385f4fc069Sjilinxpd smbfs_getpage(vnode_t *vp, offset_t off, size_t len, uint_t *protp,
37395f4fc069Sjilinxpd 	page_t *pl[], size_t plsz, struct seg *seg, caddr_t addr,
37405f4fc069Sjilinxpd 	enum seg_rw rw, cred_t *cr, caller_context_t *ct)
37415f4fc069Sjilinxpd {
37425f4fc069Sjilinxpd 	smbnode_t	*np;
37435f4fc069Sjilinxpd 	smbmntinfo_t	*smi;
37445f4fc069Sjilinxpd 	int		error;
37455f4fc069Sjilinxpd 
37465f4fc069Sjilinxpd 	np = VTOSMB(vp);
37475f4fc069Sjilinxpd 	smi = VTOSMI(vp);
37485f4fc069Sjilinxpd 
37495f4fc069Sjilinxpd 	if (curproc->p_zone != smi->smi_zone_ref.zref_zone)
37505f4fc069Sjilinxpd 		return (EIO);
37515f4fc069Sjilinxpd 
37525f4fc069Sjilinxpd 	if (smi->smi_flags & SMI_DEAD || vp->v_vfsp->vfs_flag & VFS_UNMOUNTED)
37535f4fc069Sjilinxpd 		return (EIO);
37545f4fc069Sjilinxpd 
37555f4fc069Sjilinxpd 	if (vp->v_flag & VNOMAP)
37565f4fc069Sjilinxpd 		return (ENOSYS);
37575f4fc069Sjilinxpd 
37585f4fc069Sjilinxpd 	if (protp != NULL)
37595f4fc069Sjilinxpd 		*protp = PROT_ALL;
37605f4fc069Sjilinxpd 
37615f4fc069Sjilinxpd 	/*
37625f4fc069Sjilinxpd 	 * Now validate that the caches are up to date.
37635f4fc069Sjilinxpd 	 */
37645f4fc069Sjilinxpd 	error = smbfs_validate_caches(vp, cr);
37655f4fc069Sjilinxpd 	if (error)
37665f4fc069Sjilinxpd 		return (error);
37675f4fc069Sjilinxpd 
37685f4fc069Sjilinxpd retry:
37695f4fc069Sjilinxpd 	mutex_enter(&np->r_statelock);
37705f4fc069Sjilinxpd 
37715f4fc069Sjilinxpd 	/*
37725f4fc069Sjilinxpd 	 * Don't create dirty pages faster than they
37735f4fc069Sjilinxpd 	 * can be cleaned ... (etc. see nfs)
37745f4fc069Sjilinxpd 	 *
37755f4fc069Sjilinxpd 	 * Here NFS also tests:
37765f4fc069Sjilinxpd 	 *  (mi->mi_max_threads != 0 &&
37775f4fc069Sjilinxpd 	 *  rp->r_awcount > 2 * mi->mi_max_threads)
37785f4fc069Sjilinxpd 	 */
37795f4fc069Sjilinxpd 	if (rw == S_CREATE) {
37805f4fc069Sjilinxpd 		while (np->r_gcount > 0)
37815f4fc069Sjilinxpd 			cv_wait(&np->r_cv, &np->r_statelock);
37825f4fc069Sjilinxpd 	}
37835f4fc069Sjilinxpd 
37845f4fc069Sjilinxpd 	/*
37855f4fc069Sjilinxpd 	 * If we are getting called as a side effect of a write
37865f4fc069Sjilinxpd 	 * operation the local file size might not be extended yet.
37875f4fc069Sjilinxpd 	 * In this case we want to be able to return pages of zeroes.
37885f4fc069Sjilinxpd 	 */
37895f4fc069Sjilinxpd 	if (off + len > np->r_size + PAGEOFFSET && seg != segkmap) {
37905f4fc069Sjilinxpd 		mutex_exit(&np->r_statelock);
37915f4fc069Sjilinxpd 		return (EFAULT);		/* beyond EOF */
37925f4fc069Sjilinxpd 	}
37935f4fc069Sjilinxpd 
37945f4fc069Sjilinxpd 	mutex_exit(&np->r_statelock);
37955f4fc069Sjilinxpd 
37965f4fc069Sjilinxpd 	error = pvn_getpages(smbfs_getapage, vp, off, len, protp,
37975f4fc069Sjilinxpd 	    pl, plsz, seg, addr, rw, cr);
37985f4fc069Sjilinxpd 
37995f4fc069Sjilinxpd 	switch (error) {
38005f4fc069Sjilinxpd 	case SMBFS_EOF:
38015f4fc069Sjilinxpd 		smbfs_purge_caches(vp, cr);
38025f4fc069Sjilinxpd 		goto retry;
38035f4fc069Sjilinxpd 	case ESTALE:
38045f4fc069Sjilinxpd 		/*
38055f4fc069Sjilinxpd 		 * Here NFS has: PURGE_STALE_FH(error, vp, cr);
38065f4fc069Sjilinxpd 		 * In-line here as we only use it once.
38075f4fc069Sjilinxpd 		 */
38085f4fc069Sjilinxpd 		mutex_enter(&np->r_statelock);
38095f4fc069Sjilinxpd 		np->r_flags |= RSTALE;
38105f4fc069Sjilinxpd 		if (!np->r_error)
38115f4fc069Sjilinxpd 			np->r_error = (error);
38125f4fc069Sjilinxpd 		mutex_exit(&np->r_statelock);
38135f4fc069Sjilinxpd 		if (vn_has_cached_data(vp))
38145f4fc069Sjilinxpd 			smbfs_invalidate_pages(vp, (u_offset_t)0, cr);
38155f4fc069Sjilinxpd 		smbfs_purge_caches(vp, cr);
38165f4fc069Sjilinxpd 		break;
38175f4fc069Sjilinxpd 	default:
38185f4fc069Sjilinxpd 		break;
38195f4fc069Sjilinxpd 	}
38205f4fc069Sjilinxpd 
38215f4fc069Sjilinxpd 	return (error);
38225f4fc069Sjilinxpd }
38235f4fc069Sjilinxpd 
38245f4fc069Sjilinxpd /*
38255f4fc069Sjilinxpd  * Called from pvn_getpages to get a particular page.
38265f4fc069Sjilinxpd  * Like nfs3_getapage
38275f4fc069Sjilinxpd  */
38285f4fc069Sjilinxpd /* ARGSUSED */
38295f4fc069Sjilinxpd static int
38305f4fc069Sjilinxpd smbfs_getapage(vnode_t *vp, u_offset_t off, size_t len, uint_t *protp,
38315f4fc069Sjilinxpd 	page_t *pl[], size_t plsz, struct seg *seg, caddr_t addr,
38325f4fc069Sjilinxpd 	enum seg_rw rw, cred_t *cr)
38335f4fc069Sjilinxpd {
38345f4fc069Sjilinxpd 	smbnode_t	*np;
38355f4fc069Sjilinxpd 	smbmntinfo_t   *smi;
38365f4fc069Sjilinxpd 
38375f4fc069Sjilinxpd 	uint_t		bsize;
38385f4fc069Sjilinxpd 	struct buf	*bp;
38395f4fc069Sjilinxpd 	page_t		*pp;
38405f4fc069Sjilinxpd 	u_offset_t	lbn;
38415f4fc069Sjilinxpd 	u_offset_t	io_off;
38425f4fc069Sjilinxpd 	u_offset_t	blkoff;
38435f4fc069Sjilinxpd 	size_t		io_len;
38445f4fc069Sjilinxpd 	uint_t		blksize;
38455f4fc069Sjilinxpd 	int		error;
38465f4fc069Sjilinxpd 	/* int readahead; */
38475f4fc069Sjilinxpd 	int readahead_issued = 0;
38485f4fc069Sjilinxpd 	/* int ra_window; * readahead window */
38495f4fc069Sjilinxpd 	page_t *pagefound;
38505f4fc069Sjilinxpd 
38515f4fc069Sjilinxpd 	np = VTOSMB(vp);
38525f4fc069Sjilinxpd 	smi = VTOSMI(vp);
38535f4fc069Sjilinxpd 
38545f4fc069Sjilinxpd 	if (curproc->p_zone != smi->smi_zone_ref.zref_zone)
38555f4fc069Sjilinxpd 		return (EIO);
38565f4fc069Sjilinxpd 
38575f4fc069Sjilinxpd 	if (smi->smi_flags & SMI_DEAD || vp->v_vfsp->vfs_flag & VFS_UNMOUNTED)
38585f4fc069Sjilinxpd 		return (EIO);
38595f4fc069Sjilinxpd 
38605f4fc069Sjilinxpd 	bsize = MAX(vp->v_vfsp->vfs_bsize, PAGESIZE);
38615f4fc069Sjilinxpd 
38625f4fc069Sjilinxpd reread:
38635f4fc069Sjilinxpd 	bp = NULL;
38645f4fc069Sjilinxpd 	pp = NULL;
38655f4fc069Sjilinxpd 	pagefound = NULL;
38665f4fc069Sjilinxpd 
38675f4fc069Sjilinxpd 	if (pl != NULL)
38685f4fc069Sjilinxpd 		pl[0] = NULL;
38695f4fc069Sjilinxpd 
38705f4fc069Sjilinxpd 	error = 0;
38715f4fc069Sjilinxpd 	lbn = off / bsize;
38725f4fc069Sjilinxpd 	blkoff = lbn * bsize;
38735f4fc069Sjilinxpd 
38745f4fc069Sjilinxpd 	/*
38755f4fc069Sjilinxpd 	 * NFS queues up readahead work here.
38765f4fc069Sjilinxpd 	 */
38775f4fc069Sjilinxpd 
38785f4fc069Sjilinxpd again:
38795f4fc069Sjilinxpd 	if ((pagefound = page_exists(vp, off)) == NULL) {
38805f4fc069Sjilinxpd 		if (pl == NULL) {
38815f4fc069Sjilinxpd 			(void) 0; /* Todo: smbfs_async_readahead(); */
38825f4fc069Sjilinxpd 		} else if (rw == S_CREATE) {
38835f4fc069Sjilinxpd 			/*
38845f4fc069Sjilinxpd 			 * Block for this page is not allocated, or the offset
38855f4fc069Sjilinxpd 			 * is beyond the current allocation size, or we're
38865f4fc069Sjilinxpd 			 * allocating a swap slot and the page was not found,
38875f4fc069Sjilinxpd 			 * so allocate it and return a zero page.
38885f4fc069Sjilinxpd 			 */
38895f4fc069Sjilinxpd 			if ((pp = page_create_va(vp, off,
38905f4fc069Sjilinxpd 			    PAGESIZE, PG_WAIT, seg, addr)) == NULL)
38915f4fc069Sjilinxpd 				cmn_err(CE_PANIC, "smbfs_getapage: page_create");
38925f4fc069Sjilinxpd 			io_len = PAGESIZE;
38935f4fc069Sjilinxpd 			mutex_enter(&np->r_statelock);
38945f4fc069Sjilinxpd 			np->r_nextr = off + PAGESIZE;
38955f4fc069Sjilinxpd 			mutex_exit(&np->r_statelock);
38965f4fc069Sjilinxpd 		} else {
38975f4fc069Sjilinxpd 			/*
38985f4fc069Sjilinxpd 			 * Need to go to the server to get a BLOCK; the
38995f4fc069Sjilinxpd 			 * exceptions are reading at offset zero or doing
39005f4fc069Sjilinxpd 			 * random i/o, in which case we read only a PAGE.
39015f4fc069Sjilinxpd 			 */
39025f4fc069Sjilinxpd 			mutex_enter(&np->r_statelock);
39035f4fc069Sjilinxpd 			if (blkoff < np->r_size &&
39045f4fc069Sjilinxpd 			    blkoff + bsize >= np->r_size) {
39055f4fc069Sjilinxpd 				/*
39065f4fc069Sjilinxpd 				 * If only a block or less is left in
39075f4fc069Sjilinxpd 				 * the file, read all that is remaining.
39085f4fc069Sjilinxpd 				 */
39095f4fc069Sjilinxpd 				if (np->r_size <= off) {
39105f4fc069Sjilinxpd 					/*
39115f4fc069Sjilinxpd 					 * Trying to access beyond EOF,
39125f4fc069Sjilinxpd 					 * set up to get at least one page.
39135f4fc069Sjilinxpd 					 */
39145f4fc069Sjilinxpd 					blksize = off + PAGESIZE - blkoff;
39155f4fc069Sjilinxpd 				} else
39165f4fc069Sjilinxpd 					blksize = np->r_size - blkoff;
39175f4fc069Sjilinxpd 			} else if ((off == 0) ||
39185f4fc069Sjilinxpd 			    (off != np->r_nextr && !readahead_issued)) {
39195f4fc069Sjilinxpd 				blksize = PAGESIZE;
39205f4fc069Sjilinxpd 				blkoff = off; /* block = page here */
39215f4fc069Sjilinxpd 			} else
39225f4fc069Sjilinxpd 				blksize = bsize;
39235f4fc069Sjilinxpd 			mutex_exit(&np->r_statelock);
39245f4fc069Sjilinxpd 
39255f4fc069Sjilinxpd 			pp = pvn_read_kluster(vp, off, seg, addr, &io_off,
39265f4fc069Sjilinxpd 			    &io_len, blkoff, blksize, 0);
39275f4fc069Sjilinxpd 
39285f4fc069Sjilinxpd 			/*
39295f4fc069Sjilinxpd 			 * Some other thread has entered the page,
39305f4fc069Sjilinxpd 			 * so just use it.
39315f4fc069Sjilinxpd 			 */
39325f4fc069Sjilinxpd 			if (pp == NULL)
39335f4fc069Sjilinxpd 				goto again;
39345f4fc069Sjilinxpd 
39355f4fc069Sjilinxpd 			/*
39365f4fc069Sjilinxpd 			 * Now round the request size up to page boundaries.
39375f4fc069Sjilinxpd 			 * This ensures that the entire page will be
39385f4fc069Sjilinxpd 			 * initialized to zeroes if EOF is encountered.
39395f4fc069Sjilinxpd 			 */
39405f4fc069Sjilinxpd 			io_len = ptob(btopr(io_len));
39415f4fc069Sjilinxpd 
39425f4fc069Sjilinxpd 			bp = pageio_setup(pp, io_len, vp, B_READ);
39435f4fc069Sjilinxpd 			ASSERT(bp != NULL);
39445f4fc069Sjilinxpd 
39455f4fc069Sjilinxpd 			/*
39465f4fc069Sjilinxpd 			 * pageio_setup should have set b_addr to 0.  This
39475f4fc069Sjilinxpd 			 * is correct since we want to do I/O on a page
39485f4fc069Sjilinxpd 			 * boundary.  bp_mapin will use this addr to calculate
39495f4fc069Sjilinxpd 			 * an offset, and then set b_addr to the kernel virtual
39505f4fc069Sjilinxpd 			 * address it allocated for us.
39515f4fc069Sjilinxpd 			 */
39525f4fc069Sjilinxpd 			ASSERT(bp->b_un.b_addr == 0);
39535f4fc069Sjilinxpd 
39545f4fc069Sjilinxpd 			bp->b_edev = 0;
39555f4fc069Sjilinxpd 			bp->b_dev = 0;
39565f4fc069Sjilinxpd 			bp->b_lblkno = lbtodb(io_off);
39575f4fc069Sjilinxpd 			bp->b_file = vp;
39585f4fc069Sjilinxpd 			bp->b_offset = (offset_t)off;
39595f4fc069Sjilinxpd 			bp_mapin(bp);
39605f4fc069Sjilinxpd 
39615f4fc069Sjilinxpd 			/*
39625f4fc069Sjilinxpd 			 * If doing a write beyond what we believe is EOF,
39635f4fc069Sjilinxpd 			 * don't bother trying to read the pages from the
39645f4fc069Sjilinxpd 			 * server, we'll just zero the pages here.  We
39655f4fc069Sjilinxpd 			 * don't check that the rw flag is S_WRITE here
39665f4fc069Sjilinxpd 			 * because some implementations may attempt a
39675f4fc069Sjilinxpd 			 * read access to the buffer before copying data.
39685f4fc069Sjilinxpd 			 */
39695f4fc069Sjilinxpd 			mutex_enter(&np->r_statelock);
39705f4fc069Sjilinxpd 			if (io_off >= np->r_size && seg == segkmap) {
39715f4fc069Sjilinxpd 				mutex_exit(&np->r_statelock);
39725f4fc069Sjilinxpd 				bzero(bp->b_un.b_addr, io_len);
39735f4fc069Sjilinxpd 			} else {
39745f4fc069Sjilinxpd 				mutex_exit(&np->r_statelock);
39755f4fc069Sjilinxpd 				error = smbfs_bio(bp, 0, cr);
39765f4fc069Sjilinxpd 			}
39775f4fc069Sjilinxpd 
39785f4fc069Sjilinxpd 			/*
39795f4fc069Sjilinxpd 			 * Unmap the buffer before freeing it.
39805f4fc069Sjilinxpd 			 */
39815f4fc069Sjilinxpd 			bp_mapout(bp);
39825f4fc069Sjilinxpd 			pageio_done(bp);
39835f4fc069Sjilinxpd 
39845f4fc069Sjilinxpd 			/* Here NFS3 updates all pp->p_fsdata */
39855f4fc069Sjilinxpd 
39865f4fc069Sjilinxpd 			if (error == SMBFS_EOF) {
39875f4fc069Sjilinxpd 				/*
39885f4fc069Sjilinxpd 				 * If doing a write system call just return
39895f4fc069Sjilinxpd 				 * zeroed pages, else user tried to get pages
39905f4fc069Sjilinxpd 				 * beyond EOF, return error.  We don't check
39915f4fc069Sjilinxpd 				 * that the rw flag is S_WRITE here because
39925f4fc069Sjilinxpd 				 * some implementations may attempt a read
39935f4fc069Sjilinxpd 				 * access to the buffer before copying data.
39945f4fc069Sjilinxpd 				 */
39955f4fc069Sjilinxpd 				if (seg == segkmap)
39965f4fc069Sjilinxpd 					error = 0;
39975f4fc069Sjilinxpd 				else
39985f4fc069Sjilinxpd 					error = EFAULT;
39995f4fc069Sjilinxpd 			}
40005f4fc069Sjilinxpd 
40015f4fc069Sjilinxpd 			if (!readahead_issued && !error) {
40025f4fc069Sjilinxpd 				mutex_enter(&np->r_statelock);
40035f4fc069Sjilinxpd 				np->r_nextr = io_off + io_len;
40045f4fc069Sjilinxpd 				mutex_exit(&np->r_statelock);
40055f4fc069Sjilinxpd 			}
40065f4fc069Sjilinxpd 		}
40075f4fc069Sjilinxpd 	}
40085f4fc069Sjilinxpd 
40095f4fc069Sjilinxpd 	if (pl == NULL)
40105f4fc069Sjilinxpd 		return (error);
40115f4fc069Sjilinxpd 
40125f4fc069Sjilinxpd 	if (error) {
40135f4fc069Sjilinxpd 		if (pp != NULL)
40145f4fc069Sjilinxpd 			pvn_read_done(pp, B_ERROR);
40155f4fc069Sjilinxpd 		return (error);
40165f4fc069Sjilinxpd 	}
40175f4fc069Sjilinxpd 
40185f4fc069Sjilinxpd 	if (pagefound) {
40195f4fc069Sjilinxpd 		se_t se = (rw == S_CREATE ? SE_EXCL : SE_SHARED);
40205f4fc069Sjilinxpd 
40215f4fc069Sjilinxpd 		/*
40225f4fc069Sjilinxpd 		 * Page exists in the cache, acquire the appropriate lock.
40235f4fc069Sjilinxpd 		 * If this fails, start all over again.
40245f4fc069Sjilinxpd 		 */
40255f4fc069Sjilinxpd 		if ((pp = page_lookup(vp, off, se)) == NULL) {
40265f4fc069Sjilinxpd #ifdef DEBUG
40275f4fc069Sjilinxpd 			smbfs_lostpage++;
40285f4fc069Sjilinxpd #endif
40295f4fc069Sjilinxpd 			goto reread;
40305f4fc069Sjilinxpd 		}
40315f4fc069Sjilinxpd 		pl[0] = pp;
40325f4fc069Sjilinxpd 		pl[1] = NULL;
40335f4fc069Sjilinxpd 		return (0);
40345f4fc069Sjilinxpd 	}
40355f4fc069Sjilinxpd 
40365f4fc069Sjilinxpd 	if (pp != NULL)
40375f4fc069Sjilinxpd 		pvn_plist_init(pp, pl, plsz, off, io_len, rw);
40385f4fc069Sjilinxpd 
40395f4fc069Sjilinxpd 	return (error);
40405f4fc069Sjilinxpd }
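
/*
 * Flow summary for the uncached case in smbfs_getapage above (sketch):
 *
 *	pvn_read_kluster()	build a page list for the chosen block
 *	pageio_setup()		wrap those pages in a buf for paged i/o
 *	bp_mapin()		map the pages into kernel VA
 *	smbfs_bio()		read from the server (or bzero instead,
 *				for a write entirely past known EOF)
 *	bp_mapout(), pageio_done()  tear the buf down again
 */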
40415f4fc069Sjilinxpd 
40425f4fc069Sjilinxpd /*
40435f4fc069Sjilinxpd  * Here NFS has: nfs3_readahead
40445f4fc069Sjilinxpd  * No read-ahead in smbfs yet.
40455f4fc069Sjilinxpd  */
40465f4fc069Sjilinxpd 
40478329232eSGordon Ross #endif	// _KERNEL
40488329232eSGordon Ross 
40495f4fc069Sjilinxpd /*
40505f4fc069Sjilinxpd  * Flags are composed of {B_INVAL, B_FREE, B_DONTNEED, B_FORCE}
40515f4fc069Sjilinxpd  * If len == 0, do from off to EOF.
40525f4fc069Sjilinxpd  *
40535f4fc069Sjilinxpd  * The normal cases should be len == 0 && off == 0 (entire vp list),
40545f4fc069Sjilinxpd  * len == MAXBSIZE (from segmap_release actions), and len == PAGESIZE
40555f4fc069Sjilinxpd  * (from pageout).
40565f4fc069Sjilinxpd  *
40575f4fc069Sjilinxpd  * Like nfs3_putpage + nfs_putpages
40585f4fc069Sjilinxpd  */
40595f4fc069Sjilinxpd /* ARGSUSED */
40605f4fc069Sjilinxpd static int
40615f4fc069Sjilinxpd smbfs_putpage(vnode_t *vp, offset_t off, size_t len, int flags, cred_t *cr,
40625f4fc069Sjilinxpd 	caller_context_t *ct)
40635f4fc069Sjilinxpd {
40648329232eSGordon Ross #ifdef	_KERNEL
40655f4fc069Sjilinxpd 	smbnode_t *np;
40665f4fc069Sjilinxpd 	smbmntinfo_t *smi;
40675f4fc069Sjilinxpd 	page_t *pp;
40685f4fc069Sjilinxpd 	u_offset_t eoff;
40695f4fc069Sjilinxpd 	u_offset_t io_off;
40705f4fc069Sjilinxpd 	size_t io_len;
40715f4fc069Sjilinxpd 	int error;
40725f4fc069Sjilinxpd 	int rdirty;
40735f4fc069Sjilinxpd 	int err;
40745f4fc069Sjilinxpd 
40755f4fc069Sjilinxpd 	np = VTOSMB(vp);
40765f4fc069Sjilinxpd 	smi = VTOSMI(vp);
40775f4fc069Sjilinxpd 
40785f4fc069Sjilinxpd 	if (curproc->p_zone != smi->smi_zone_ref.zref_zone)
40795f4fc069Sjilinxpd 		return (EIO);
40805f4fc069Sjilinxpd 
40815f4fc069Sjilinxpd 	if (smi->smi_flags & SMI_DEAD || vp->v_vfsp->vfs_flag & VFS_UNMOUNTED)
40825f4fc069Sjilinxpd 		return (EIO);
40835f4fc069Sjilinxpd 
40845f4fc069Sjilinxpd 	if (vp->v_flag & VNOMAP)
40855f4fc069Sjilinxpd 		return (ENOSYS);
40865f4fc069Sjilinxpd 
40875f4fc069Sjilinxpd 	/* Here NFS does rp->r_count (++/--) stuff. */
40885f4fc069Sjilinxpd 
40895f4fc069Sjilinxpd 	/* Beginning of code from nfs_putpages. */
40905f4fc069Sjilinxpd 
40915f4fc069Sjilinxpd 	if (!vn_has_cached_data(vp))
40925f4fc069Sjilinxpd 		return (0);
40935f4fc069Sjilinxpd 
40945f4fc069Sjilinxpd 	/*
40955f4fc069Sjilinxpd 	 * If ROUTOFSPACE is set, then all writes turn into B_INVAL
40965f4fc069Sjilinxpd 	 * writes.  B_FORCE is set to force the VM system to actually
40975f4fc069Sjilinxpd 	 * invalidate the pages, even if the i/o failed.  The pages
40985f4fc069Sjilinxpd 	 * need to get invalidated because they can't be written out
40995f4fc069Sjilinxpd 	 * because there isn't any space left on either the server's
41005f4fc069Sjilinxpd 	 * file system or in the user's disk quota.  The B_FREE bit
41015f4fc069Sjilinxpd 	 * is cleared to avoid confusion as to whether this is a
41025f4fc069Sjilinxpd 	 * request to place the page on the freelist or to destroy
41035f4fc069Sjilinxpd 	 * it.
41045f4fc069Sjilinxpd 	 */
41055f4fc069Sjilinxpd 	if ((np->r_flags & ROUTOFSPACE) ||
41065f4fc069Sjilinxpd 	    (vp->v_vfsp->vfs_flag & VFS_UNMOUNTED))
41075f4fc069Sjilinxpd 		flags = (flags & ~B_FREE) | B_INVAL | B_FORCE;
41085f4fc069Sjilinxpd 
41095f4fc069Sjilinxpd 	if (len == 0) {
41105f4fc069Sjilinxpd 		/*
41115f4fc069Sjilinxpd 		 * If doing a full file synchronous operation, then clear
41125f4fc069Sjilinxpd 		 * the RDIRTY bit.  If a page gets dirtied while the flush
41135f4fc069Sjilinxpd 		 * is happening, then RDIRTY will get set again.  The
41145f4fc069Sjilinxpd 		 * RDIRTY bit must get cleared before the flush so that
41155f4fc069Sjilinxpd 		 * we don't lose this information.
41165f4fc069Sjilinxpd 		 *
41175f4fc069Sjilinxpd 		 * NFS has B_ASYNC vs sync stuff here.
41185f4fc069Sjilinxpd 		 */
41195f4fc069Sjilinxpd 		if (off == (u_offset_t)0 &&
41205f4fc069Sjilinxpd 		    (np->r_flags & RDIRTY)) {
41215f4fc069Sjilinxpd 			mutex_enter(&np->r_statelock);
41225f4fc069Sjilinxpd 			rdirty = (np->r_flags & RDIRTY);
41235f4fc069Sjilinxpd 			np->r_flags &= ~RDIRTY;
41245f4fc069Sjilinxpd 			mutex_exit(&np->r_statelock);
41255f4fc069Sjilinxpd 		} else
41265f4fc069Sjilinxpd 			rdirty = 0;
41275f4fc069Sjilinxpd 
41285f4fc069Sjilinxpd 		/*
41295f4fc069Sjilinxpd 		 * Search the entire vp list for pages >= off, and flush
41305f4fc069Sjilinxpd 		 * the dirty pages.
41315f4fc069Sjilinxpd 		 */
41325f4fc069Sjilinxpd 		error = pvn_vplist_dirty(vp, off, smbfs_putapage,
41335f4fc069Sjilinxpd 		    flags, cr);
41345f4fc069Sjilinxpd 
41355f4fc069Sjilinxpd 		/*
41365f4fc069Sjilinxpd 		 * If an error occurred and the file was marked as dirty
41375f4fc069Sjilinxpd 		 * before and we aren't forcibly invalidating pages, then
41385f4fc069Sjilinxpd 		 * reset the RDIRTY flag.
41395f4fc069Sjilinxpd 		 */
41405f4fc069Sjilinxpd 		if (error && rdirty &&
41415f4fc069Sjilinxpd 		    (flags & (B_INVAL | B_FORCE)) != (B_INVAL | B_FORCE)) {
41425f4fc069Sjilinxpd 			mutex_enter(&np->r_statelock);
41435f4fc069Sjilinxpd 			np->r_flags |= RDIRTY;
41445f4fc069Sjilinxpd 			mutex_exit(&np->r_statelock);
41455f4fc069Sjilinxpd 		}
41465f4fc069Sjilinxpd 	} else {
41475f4fc069Sjilinxpd 		/*
41485f4fc069Sjilinxpd 		 * Do a range from [off...off + len) looking for pages
41495f4fc069Sjilinxpd 		 * to deal with.
41505f4fc069Sjilinxpd 		 */
41515f4fc069Sjilinxpd 		error = 0;
41525f4fc069Sjilinxpd 		io_len = 1; /* quiet warnings */
41535f4fc069Sjilinxpd 		eoff = off + len;
41545f4fc069Sjilinxpd 
41555f4fc069Sjilinxpd 		for (io_off = off; io_off < eoff; io_off += io_len) {
41565f4fc069Sjilinxpd 			mutex_enter(&np->r_statelock);
41575f4fc069Sjilinxpd 			if (io_off >= np->r_size) {
41585f4fc069Sjilinxpd 				mutex_exit(&np->r_statelock);
41595f4fc069Sjilinxpd 				break;
41605f4fc069Sjilinxpd 			}
41615f4fc069Sjilinxpd 			mutex_exit(&np->r_statelock);
41625f4fc069Sjilinxpd 			/*
41635f4fc069Sjilinxpd 			 * If we are not invalidating, synchronously
41645f4fc069Sjilinxpd 			 * freeing or writing pages use the routine
41655f4fc069Sjilinxpd 			 * page_lookup_nowait() to prevent reclaiming
41665f4fc069Sjilinxpd 			 * them from the free list.
41675f4fc069Sjilinxpd 			 */
41685f4fc069Sjilinxpd 			if ((flags & B_INVAL) || !(flags & B_ASYNC)) {
41695f4fc069Sjilinxpd 				pp = page_lookup(vp, io_off,
41705f4fc069Sjilinxpd 				    (flags & (B_INVAL | B_FREE)) ?
41715f4fc069Sjilinxpd 				    SE_EXCL : SE_SHARED);
41725f4fc069Sjilinxpd 			} else {
41735f4fc069Sjilinxpd 				pp = page_lookup_nowait(vp, io_off,
41745f4fc069Sjilinxpd 				    (flags & B_FREE) ? SE_EXCL : SE_SHARED);
41755f4fc069Sjilinxpd 			}
41765f4fc069Sjilinxpd 
41775f4fc069Sjilinxpd 			if (pp == NULL || !pvn_getdirty(pp, flags))
41785f4fc069Sjilinxpd 				io_len = PAGESIZE;
41795f4fc069Sjilinxpd 			else {
41805f4fc069Sjilinxpd 				err = smbfs_putapage(vp, pp, &io_off,
41815f4fc069Sjilinxpd 				    &io_len, flags, cr);
41825f4fc069Sjilinxpd 				if (!error)
41835f4fc069Sjilinxpd 					error = err;
41845f4fc069Sjilinxpd 				/*
41855f4fc069Sjilinxpd 				 * "io_off" and "io_len" are returned as
41865f4fc069Sjilinxpd 				 * the range of pages we actually wrote.
41875f4fc069Sjilinxpd 				 * This allows us to skip ahead more quickly
41885f4fc069Sjilinxpd 				 * since several pages may have been dealt
41895f4fc069Sjilinxpd 				 * with by this iteration of the loop.
41905f4fc069Sjilinxpd 				 */
41915f4fc069Sjilinxpd 			}
41925f4fc069Sjilinxpd 		}
41935f4fc069Sjilinxpd 	}
41945f4fc069Sjilinxpd 
41955f4fc069Sjilinxpd 	return (error);
41968329232eSGordon Ross 
41978329232eSGordon Ross #else	// _KERNEL
41988329232eSGordon Ross 	return (ENOSYS);
41998329232eSGordon Ross #endif	// _KERNEL
42005f4fc069Sjilinxpd }
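
/*
 * Summary of the two cases above (sketch):
 *	len == 0: pvn_vplist_dirty() walks every page of the vnode
 *	len != 0: page_lookup()/pvn_getdirty() walk [off, off+len)
 * with smbfs_putapage() doing the actual write-back either way.
 */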
42015f4fc069Sjilinxpd 
42028329232eSGordon Ross #ifdef	_KERNEL
42038329232eSGordon Ross 
42045f4fc069Sjilinxpd /*
42055f4fc069Sjilinxpd  * Write out a single page, possibly klustering adjacent dirty pages.
42065f4fc069Sjilinxpd  *
42075f4fc069Sjilinxpd  * Like nfs3_putapage / nfs3_sync_putapage
42085f4fc069Sjilinxpd  */
42095f4fc069Sjilinxpd static int
42105f4fc069Sjilinxpd smbfs_putapage(vnode_t *vp, page_t *pp, u_offset_t *offp, size_t *lenp,
42115f4fc069Sjilinxpd 	int flags, cred_t *cr)
42125f4fc069Sjilinxpd {
42135f4fc069Sjilinxpd 	smbnode_t *np;
42145f4fc069Sjilinxpd 	u_offset_t io_off;
42155f4fc069Sjilinxpd 	u_offset_t lbn_off;
42165f4fc069Sjilinxpd 	u_offset_t lbn;
42175f4fc069Sjilinxpd 	size_t io_len;
42185f4fc069Sjilinxpd 	uint_t bsize;
42195f4fc069Sjilinxpd 	int error;
42205f4fc069Sjilinxpd 
42215f4fc069Sjilinxpd 	np = VTOSMB(vp);
42225f4fc069Sjilinxpd 
42235f4fc069Sjilinxpd 	ASSERT(!vn_is_readonly(vp));
42245f4fc069Sjilinxpd 
42255f4fc069Sjilinxpd 	bsize = MAX(vp->v_vfsp->vfs_bsize, PAGESIZE);
42265f4fc069Sjilinxpd 	lbn = pp->p_offset / bsize;
42275f4fc069Sjilinxpd 	lbn_off = lbn * bsize;
42285f4fc069Sjilinxpd 
42295f4fc069Sjilinxpd 	/*
42305f4fc069Sjilinxpd 	 * Find a kluster that fits in one block, or in
42315f4fc069Sjilinxpd 	 * one page if pages are bigger than blocks.  If
42325f4fc069Sjilinxpd 	 * there is less file space allocated than a whole
42335f4fc069Sjilinxpd 	 * page, we'll shorten the i/o request below.
42345f4fc069Sjilinxpd 	 */
42355f4fc069Sjilinxpd 	pp = pvn_write_kluster(vp, pp, &io_off, &io_len, lbn_off,
42365f4fc069Sjilinxpd 	    roundup(bsize, PAGESIZE), flags);
42375f4fc069Sjilinxpd 
42385f4fc069Sjilinxpd 	/*
42395f4fc069Sjilinxpd 	 * pvn_write_kluster shouldn't have returned a page with offset
42405f4fc069Sjilinxpd 	 * behind the original page we were given.  Verify that.
42415f4fc069Sjilinxpd 	 */
42425f4fc069Sjilinxpd 	ASSERT((pp->p_offset / bsize) >= lbn);
42435f4fc069Sjilinxpd 
42445f4fc069Sjilinxpd 	/*
42455f4fc069Sjilinxpd 	 * Now pp will have the list of kept dirty pages marked for
42465f4fc069Sjilinxpd 	 * write back.  It will also handle invalidation and freeing
42475f4fc069Sjilinxpd 	 * of pages that are not dirty.  Check for page length rounding
42485f4fc069Sjilinxpd 	 * problems.
42495f4fc069Sjilinxpd 	 */
42505f4fc069Sjilinxpd 	if (io_off + io_len > lbn_off + bsize) {
42515f4fc069Sjilinxpd 		ASSERT((io_off + io_len) - (lbn_off + bsize) < PAGESIZE);
42525f4fc069Sjilinxpd 		io_len = lbn_off + bsize - io_off;
42535f4fc069Sjilinxpd 	}
42545f4fc069Sjilinxpd 	/*
42555f4fc069Sjilinxpd 	 * The RMODINPROGRESS flag makes sure that smbfs_bio() sees a
42565f4fc069Sjilinxpd 	 * consistent value of r_size.  RMODINPROGRESS is set in writerp().
42575f4fc069Sjilinxpd 	 * When set, it indicates that a uiomove() is in progress and that
42585f4fc069Sjilinxpd 	 * r_size has not yet been made consistent with the new size of
42595f4fc069Sjilinxpd 	 * the file.  When the uiomove() completes, r_size is updated and
42605f4fc069Sjilinxpd 	 * the RMODINPROGRESS flag is cleared.
42615f4fc069Sjilinxpd 	 *
42625f4fc069Sjilinxpd 	 * Without this handshaking, smbfs_bio() could pick up the old
42635f4fc069Sjilinxpd 	 * value of r_size before the uiomove() in writerp() completes,
42645f4fc069Sjilinxpd 	 * and the write through smbfs_bio() would be dropped.
42675f4fc069Sjilinxpd 	 *
42685f4fc069Sjilinxpd 	 * More precisely, there is a window between the time the uiomove()
42695f4fc069Sjilinxpd 	 * completes and the time the r_size is updated. If a VOP_PUTPAGE()
42705f4fc069Sjilinxpd 	 * operation intervenes in this window, the page will be picked up,
42715f4fc069Sjilinxpd 	 * because it is dirty (it will be unlocked, unless it was
42725f4fc069Sjilinxpd 	 * pagecreate'd). When the page is picked up as dirty, the dirty
42735f4fc069Sjilinxpd 	 * bit is reset (pvn_getdirty()). In smbfs_write(), r_size is
42745f4fc069Sjilinxpd 	 * checked. This will still be the old size. Therefore the page will
42755f4fc069Sjilinxpd 	 * not be written out. When segmap_release() calls VOP_PUTPAGE(),
42765f4fc069Sjilinxpd 	 * the page will be found to be clean and the write will be dropped.
42775f4fc069Sjilinxpd 	 */
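	/*
	 * Timeline sketch of the race described above (one assumed
	 * interleaving of a writer thread and this putpage path):
	 *
	 *	writer:  uiomove() fills the page   (r_size still old)
	 *	putpage: pvn_getdirty() clears the dirty bit
	 *	putpage: checks the old r_size, skips the new data
	 *	writer:  updates r_size             (too late; data lost)
	 */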
42785f4fc069Sjilinxpd 	if (np->r_flags & RMODINPROGRESS) {
42795f4fc069Sjilinxpd 		mutex_enter(&np->r_statelock);
42805f4fc069Sjilinxpd 		if ((np->r_flags & RMODINPROGRESS) &&
42815f4fc069Sjilinxpd 		    np->r_modaddr + MAXBSIZE > io_off &&
42825f4fc069Sjilinxpd 		    np->r_modaddr < io_off + io_len) {
42835f4fc069Sjilinxpd 			page_t *plist;
42845f4fc069Sjilinxpd 			/*
42855f4fc069Sjilinxpd 			 * A write is in progress for this region of the file.
42865f4fc069Sjilinxpd 			 * If we did not detect RMODINPROGRESS here then this
42875f4fc069Sjilinxpd 			 * path through smbfs_putapage() would eventually go to
42885f4fc069Sjilinxpd 			 * smbfs_bio() and may not write out all of the data
42895f4fc069Sjilinxpd 			 * in the pages. We end up losing data. So we decide
42905f4fc069Sjilinxpd 			 * to set the modified bit on each page in the page
42915f4fc069Sjilinxpd 			 * list and mark the rnode with RDIRTY. This write
42925f4fc069Sjilinxpd 			 * will be restarted at some later time.
42935f4fc069Sjilinxpd 			 */
42945f4fc069Sjilinxpd 			plist = pp;
42955f4fc069Sjilinxpd 			while (plist != NULL) {
42965f4fc069Sjilinxpd 				pp = plist;
42975f4fc069Sjilinxpd 				page_sub(&plist, pp);
42985f4fc069Sjilinxpd 				hat_setmod(pp);
42995f4fc069Sjilinxpd 				page_io_unlock(pp);
43005f4fc069Sjilinxpd 				page_unlock(pp);
43015f4fc069Sjilinxpd 			}
43025f4fc069Sjilinxpd 			np->r_flags |= RDIRTY;
43035f4fc069Sjilinxpd 			mutex_exit(&np->r_statelock);
43045f4fc069Sjilinxpd 			if (offp)
43055f4fc069Sjilinxpd 				*offp = io_off;
43065f4fc069Sjilinxpd 			if (lenp)
43075f4fc069Sjilinxpd 				*lenp = io_len;
43085f4fc069Sjilinxpd 			return (0);
43095f4fc069Sjilinxpd 		}
43105f4fc069Sjilinxpd 		mutex_exit(&np->r_statelock);
43115f4fc069Sjilinxpd 	}
43125f4fc069Sjilinxpd 
43135f4fc069Sjilinxpd 	/*
43145f4fc069Sjilinxpd 	 * NFS handles (flags & B_ASYNC) here...
43155f4fc069Sjilinxpd 	 * (See nfs_async_putapage())
43165f4fc069Sjilinxpd 	 *
43175f4fc069Sjilinxpd 	 * This code section from: nfs3_sync_putapage()
43185f4fc069Sjilinxpd 	 */
43195f4fc069Sjilinxpd 
43205f4fc069Sjilinxpd 	flags |= B_WRITE;
43215f4fc069Sjilinxpd 
43225f4fc069Sjilinxpd 	error = smbfs_rdwrlbn(vp, pp, io_off, io_len, flags, cr);
43235f4fc069Sjilinxpd 
43245f4fc069Sjilinxpd 	if ((error == ENOSPC || error == EDQUOT || error == EFBIG ||
43255f4fc069Sjilinxpd 	    error == EACCES) &&
43265f4fc069Sjilinxpd 	    (flags & (B_INVAL|B_FORCE)) != (B_INVAL|B_FORCE)) {
43275f4fc069Sjilinxpd 		if (!(np->r_flags & ROUTOFSPACE)) {
43285f4fc069Sjilinxpd 			mutex_enter(&np->r_statelock);
43295f4fc069Sjilinxpd 			np->r_flags |= ROUTOFSPACE;
43305f4fc069Sjilinxpd 			mutex_exit(&np->r_statelock);
43315f4fc069Sjilinxpd 		}
43325f4fc069Sjilinxpd 		flags |= B_ERROR;
43335f4fc069Sjilinxpd 		pvn_write_done(pp, flags);
43345f4fc069Sjilinxpd 		/*
43355f4fc069Sjilinxpd 		 * If this was not an async thread, then try again to
43365f4fc069Sjilinxpd 		 * write out the pages, but this time, also destroy
43375f4fc069Sjilinxpd 		 * them whether or not the write is successful.  This
43385f4fc069Sjilinxpd 		 * will prevent memory from filling up with these
43395f4fc069Sjilinxpd 		 * pages and destroying them is the only alternative
43405f4fc069Sjilinxpd 		 * if they can't be written out.
43415f4fc069Sjilinxpd 		 *
43425f4fc069Sjilinxpd 		 * Don't do this if this is an async thread because
43435f4fc069Sjilinxpd 		 * when the pages are unlocked in pvn_write_done,
43445f4fc069Sjilinxpd 		 * some other thread could have come along, locked
43455f4fc069Sjilinxpd 		 * them, and queued them for an async thread.  It would be
43465f4fc069Sjilinxpd 		 * possible for all of the async threads to be tied
43475f4fc069Sjilinxpd 		 * up waiting to lock the pages again and they would
43485f4fc069Sjilinxpd 		 * all already be locked and waiting for an async
43495f4fc069Sjilinxpd 		 * thread to handle them.  Deadlock.
43505f4fc069Sjilinxpd 		 */
43515f4fc069Sjilinxpd 		if (!(flags & B_ASYNC)) {
43525f4fc069Sjilinxpd 			error = smbfs_putpage(vp, io_off, io_len,
43535f4fc069Sjilinxpd 			    B_INVAL | B_FORCE, cr, NULL);
43545f4fc069Sjilinxpd 		}
43555f4fc069Sjilinxpd 	} else {
43565f4fc069Sjilinxpd 		if (error)
43575f4fc069Sjilinxpd 			flags |= B_ERROR;
43585f4fc069Sjilinxpd 		else if (np->r_flags & ROUTOFSPACE) {
43595f4fc069Sjilinxpd 			mutex_enter(&np->r_statelock);
43605f4fc069Sjilinxpd 			np->r_flags &= ~ROUTOFSPACE;
43615f4fc069Sjilinxpd 			mutex_exit(&np->r_statelock);
43625f4fc069Sjilinxpd 		}
43635f4fc069Sjilinxpd 		pvn_write_done(pp, flags);
43645f4fc069Sjilinxpd 	}
43655f4fc069Sjilinxpd 
43665f4fc069Sjilinxpd 	/* Now more code from: nfs3_putapage */
43675f4fc069Sjilinxpd 
43685f4fc069Sjilinxpd 	if (offp)
43695f4fc069Sjilinxpd 		*offp = io_off;
43705f4fc069Sjilinxpd 	if (lenp)
43715f4fc069Sjilinxpd 		*lenp = io_len;
43725f4fc069Sjilinxpd 
43735f4fc069Sjilinxpd 	return (error);
43745f4fc069Sjilinxpd }
43755f4fc069Sjilinxpd 
43768329232eSGordon Ross #endif	// _KERNEL
43778329232eSGordon Ross 
43788329232eSGordon Ross 
43795f4fc069Sjilinxpd /*
43805f4fc069Sjilinxpd  * NFS has this in nfs_client.c (shared by v2,v3,...)
43815f4fc069Sjilinxpd  * We have it here so smbfs_putapage can be file scope.
43825f4fc069Sjilinxpd  */
43835f4fc069Sjilinxpd void
43845f4fc069Sjilinxpd smbfs_invalidate_pages(vnode_t *vp, u_offset_t off, cred_t *cr)
43855f4fc069Sjilinxpd {
43865f4fc069Sjilinxpd 	smbnode_t *np;
43875f4fc069Sjilinxpd 
43885f4fc069Sjilinxpd 	np = VTOSMB(vp);
43895f4fc069Sjilinxpd 
43905f4fc069Sjilinxpd 	mutex_enter(&np->r_statelock);
43915f4fc069Sjilinxpd 	while (np->r_flags & RTRUNCATE)
43925f4fc069Sjilinxpd 		cv_wait(&np->r_cv, &np->r_statelock);
43935f4fc069Sjilinxpd 	np->r_flags |= RTRUNCATE;
43945f4fc069Sjilinxpd 
43955f4fc069Sjilinxpd 	if (off == (u_offset_t)0) {
43965f4fc069Sjilinxpd 		np->r_flags &= ~RDIRTY;
43975f4fc069Sjilinxpd 		if (!(np->r_flags & RSTALE))
43985f4fc069Sjilinxpd 			np->r_error = 0;
43995f4fc069Sjilinxpd 	}
44005f4fc069Sjilinxpd 	/* Here NFSv3 has np->r_truncaddr = off; */
44015f4fc069Sjilinxpd 	mutex_exit(&np->r_statelock);
44025f4fc069Sjilinxpd 
44038329232eSGordon Ross #ifdef	_KERNEL
44045f4fc069Sjilinxpd 	(void) pvn_vplist_dirty(vp, off, smbfs_putapage,
44055f4fc069Sjilinxpd 	    B_INVAL | B_TRUNC, cr);
44068329232eSGordon Ross #endif	// _KERNEL
44075f4fc069Sjilinxpd 
44085f4fc069Sjilinxpd 	mutex_enter(&np->r_statelock);
44095f4fc069Sjilinxpd 	np->r_flags &= ~RTRUNCATE;
44105f4fc069Sjilinxpd 	cv_broadcast(&np->r_cv);
44115f4fc069Sjilinxpd 	mutex_exit(&np->r_statelock);
44125f4fc069Sjilinxpd }
44135f4fc069Sjilinxpd 
44148329232eSGordon Ross #ifdef	_KERNEL
44158329232eSGordon Ross 
44165f4fc069Sjilinxpd /* Like nfs3_map */
44175f4fc069Sjilinxpd 
44185f4fc069Sjilinxpd /* ARGSUSED */
44195f4fc069Sjilinxpd static int
44205f4fc069Sjilinxpd smbfs_map(vnode_t *vp, offset_t off, struct as *as, caddr_t *addrp,
44215f4fc069Sjilinxpd 	size_t len, uchar_t prot, uchar_t maxprot, uint_t flags,
44225f4fc069Sjilinxpd 	cred_t *cr, caller_context_t *ct)
44235f4fc069Sjilinxpd {
44245f4fc069Sjilinxpd 	segvn_crargs_t	vn_a;
44255f4fc069Sjilinxpd 	struct vattr	va;
44265f4fc069Sjilinxpd 	smbnode_t	*np;
44275f4fc069Sjilinxpd 	smbmntinfo_t	*smi;
44285f4fc069Sjilinxpd 	int		error;
44295f4fc069Sjilinxpd 
44305f4fc069Sjilinxpd 	np = VTOSMB(vp);
44315f4fc069Sjilinxpd 	smi = VTOSMI(vp);
44325f4fc069Sjilinxpd 
44335f4fc069Sjilinxpd 	if (curproc->p_zone != smi->smi_zone_ref.zref_zone)
44345f4fc069Sjilinxpd 		return (EIO);
44355f4fc069Sjilinxpd 
44365f4fc069Sjilinxpd 	if (smi->smi_flags & SMI_DEAD || vp->v_vfsp->vfs_flag & VFS_UNMOUNTED)
44375f4fc069Sjilinxpd 		return (EIO);
44385f4fc069Sjilinxpd 
4439*168091e5SGordon Ross 	/* Sanity check: should have a valid open */
4440*168091e5SGordon Ross 	if (np->n_fid == NULL)
4441*168091e5SGordon Ross 		return (EIO);
4442*168091e5SGordon Ross 
44435f4fc069Sjilinxpd 	if (vp->v_flag & VNOMAP)
44445f4fc069Sjilinxpd 		return (ENOSYS);
44455f4fc069Sjilinxpd 
44465f4fc069Sjilinxpd 	if (off < 0 || off + (ssize_t)len < 0)
44475f4fc069Sjilinxpd 		return (ENXIO);
44485f4fc069Sjilinxpd 
44495f4fc069Sjilinxpd 	if (vp->v_type != VREG)
44505f4fc069Sjilinxpd 		return (ENODEV);
44515f4fc069Sjilinxpd 
44525f4fc069Sjilinxpd 	/*
44535f4fc069Sjilinxpd 	 * NFS does close-to-open consistency stuff here.
44545f4fc069Sjilinxpd 	 * Just get (possibly cached) attributes.
44555f4fc069Sjilinxpd 	 */
44565f4fc069Sjilinxpd 	va.va_mask = AT_ALL;
44575f4fc069Sjilinxpd 	if ((error = smbfsgetattr(vp, &va, cr)) != 0)
44585f4fc069Sjilinxpd 		return (error);
44595f4fc069Sjilinxpd 
44605f4fc069Sjilinxpd 	/*
44615f4fc069Sjilinxpd 	 * Check to see if the vnode is currently marked as not cachable.
44625f4fc069Sjilinxpd 	 * This means portions of the file are locked (through VOP_FRLOCK).
44635f4fc069Sjilinxpd 	 * In this case the map request must be refused.  We use
44645f4fc069Sjilinxpd 	 * rp->r_lkserlock to avoid a race with concurrent lock requests.
44655f4fc069Sjilinxpd 	 */
44665f4fc069Sjilinxpd 	/*
44675f4fc069Sjilinxpd 	 * Atomically increment r_inmap after acquiring r_rwlock. The
44685f4fc069Sjilinxpd 	 * idea here is to acquire r_rwlock to block read/write and
44695f4fc069Sjilinxpd 	 * not to protect r_inmap. r_inmap will inform smbfs_read/write()
44705f4fc069Sjilinxpd 	 * that we are in smbfs_map(). Now, r_rwlock is acquired in order
44715f4fc069Sjilinxpd 	 * and we can prevent the deadlock that would have occurred
44725f4fc069Sjilinxpd 	 * when smbfs_addmap() would have acquired it out of order.
44735f4fc069Sjilinxpd 	 *
44745f4fc069Sjilinxpd 	 * Since we are not protecting r_inmap by any lock, we do not
44755f4fc069Sjilinxpd 	 * hold any lock when we decrement it. We atomically decrement
44765f4fc069Sjilinxpd 	 * r_inmap after we release r_lkserlock.  Note that rwlock is
44775f4fc069Sjilinxpd 	 * re-entered as writer in smbfs_addmap (called via as_map).
44785f4fc069Sjilinxpd 	 */
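	/*
	 * Ordering sketch of the protocol described above:
	 *
	 *	smbfs_map:	enter r_rwlock(W); r_inmap++; exit r_rwlock;
	 *			enter r_lkserlock(W); as_map(); ...
	 *	smbfs_addmap:	(via as_map) re-enters r_rwlock as writer
	 *	smbfs_read/write: consult r_inmap so they don't deadlock
	 *			against a thread inside smbfs_map()
	 */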
44795f4fc069Sjilinxpd 
44805f4fc069Sjilinxpd 	if (smbfs_rw_enter_sig(&np->r_rwlock, RW_WRITER, SMBINTR(vp)))
44815f4fc069Sjilinxpd 		return (EINTR);
44825f4fc069Sjilinxpd 	atomic_inc_uint(&np->r_inmap);
44835f4fc069Sjilinxpd 	smbfs_rw_exit(&np->r_rwlock);
44845f4fc069Sjilinxpd 
44855f4fc069Sjilinxpd 	if (smbfs_rw_enter_sig(&np->r_lkserlock, RW_WRITER, SMBINTR(vp))) {
44865f4fc069Sjilinxpd 		atomic_dec_uint(&np->r_inmap);
44875f4fc069Sjilinxpd 		return (EINTR);
44885f4fc069Sjilinxpd 	}
44895f4fc069Sjilinxpd 
44905f4fc069Sjilinxpd 	if (vp->v_flag & VNOCACHE) {
44915f4fc069Sjilinxpd 		error = EAGAIN;
44925f4fc069Sjilinxpd 		goto done;
44935f4fc069Sjilinxpd 	}
44945f4fc069Sjilinxpd 
44955f4fc069Sjilinxpd 	/*
44965f4fc069Sjilinxpd 	 * Don't allow concurrent locks and mapping if mandatory locking is
44975f4fc069Sjilinxpd 	 * enabled.
44985f4fc069Sjilinxpd 	 */
44995f4fc069Sjilinxpd 	if ((flk_has_remote_locks(vp) || smbfs_lm_has_sleep(vp)) &&
45005f4fc069Sjilinxpd 	    MANDLOCK(vp, va.va_mode)) {
45015f4fc069Sjilinxpd 		error = EAGAIN;
45025f4fc069Sjilinxpd 		goto done;
45035f4fc069Sjilinxpd 	}
45045f4fc069Sjilinxpd 
45055f4fc069Sjilinxpd 	as_rangelock(as);
45065f4fc069Sjilinxpd 	error = choose_addr(as, addrp, len, off, ADDR_VACALIGN, flags);
45075f4fc069Sjilinxpd 	if (error != 0) {
45085f4fc069Sjilinxpd 		as_rangeunlock(as);
45095f4fc069Sjilinxpd 		goto done;
45105f4fc069Sjilinxpd 	}
45115f4fc069Sjilinxpd 
45125f4fc069Sjilinxpd 	vn_a.vp = vp;
45135f4fc069Sjilinxpd 	vn_a.offset = off;
45145f4fc069Sjilinxpd 	vn_a.type = (flags & MAP_TYPE);
45155f4fc069Sjilinxpd 	vn_a.prot = (uchar_t)prot;
45165f4fc069Sjilinxpd 	vn_a.maxprot = (uchar_t)maxprot;
45175f4fc069Sjilinxpd 	vn_a.flags = (flags & ~MAP_TYPE);
45185f4fc069Sjilinxpd 	vn_a.cred = cr;
45195f4fc069Sjilinxpd 	vn_a.amp = NULL;
45205f4fc069Sjilinxpd 	vn_a.szc = 0;
45215f4fc069Sjilinxpd 	vn_a.lgrp_mem_policy_flags = 0;
45225f4fc069Sjilinxpd 
45235f4fc069Sjilinxpd 	error = as_map(as, *addrp, len, segvn_create, &vn_a);
45245f4fc069Sjilinxpd 	as_rangeunlock(as);
45255f4fc069Sjilinxpd 
45265f4fc069Sjilinxpd done:
45275f4fc069Sjilinxpd 	smbfs_rw_exit(&np->r_lkserlock);
45285f4fc069Sjilinxpd 	atomic_dec_uint(&np->r_inmap);
45295f4fc069Sjilinxpd 	return (error);
45305f4fc069Sjilinxpd }
45315f4fc069Sjilinxpd 
45324e72ade1SGordon Ross /*
45334e72ade1SGordon Ross  * This uses the addmap/delmap functions to hold the SMB FID open as long
45344e72ade1SGordon Ross  * as there are pages mapped in this as/seg.  Increment the FID refs when
45354e72ade1SGordon Ross  * the mapping count goes from zero to non-zero, and release the FID ref
45364e72ade1SGordon Ross  * when the mapping count goes from non-zero to zero.
45374e72ade1SGordon Ross  */
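
/*
 * Lifetime sketch (refs managed in smbfs_addmap below and in
 * smbfs_delmap / smbfs_delmap_async):
 *
 *	mmap():   r_mapcnt 0 -> N  =>  n_fidrefs++ (hold the OtW FID)
 *	munmap(): r_mapcnt N -> 0  =>  smbfs_rele_fid() via taskq
 */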
45384e72ade1SGordon Ross 
45395f4fc069Sjilinxpd /* ARGSUSED */
45405f4fc069Sjilinxpd static int
45415f4fc069Sjilinxpd smbfs_addmap(vnode_t *vp, offset_t off, struct as *as, caddr_t addr,
45425f4fc069Sjilinxpd 	size_t len, uchar_t prot, uchar_t maxprot, uint_t flags,
45435f4fc069Sjilinxpd 	cred_t *cr, caller_context_t *ct)
45445f4fc069Sjilinxpd {
45455f4fc069Sjilinxpd 	smbnode_t *np = VTOSMB(vp);
45465f4fc069Sjilinxpd 	boolean_t inc_fidrefs = B_FALSE;
45475f4fc069Sjilinxpd 
45485f4fc069Sjilinxpd 	/*
45495f4fc069Sjilinxpd 	 * When r_mapcnt goes from zero to non-zero,
45505f4fc069Sjilinxpd 	 * increment n_fidrefs
45515f4fc069Sjilinxpd 	 */
45525f4fc069Sjilinxpd 	mutex_enter(&np->r_statelock);
45535f4fc069Sjilinxpd 	if (np->r_mapcnt == 0)
45545f4fc069Sjilinxpd 		inc_fidrefs = B_TRUE;
45555f4fc069Sjilinxpd 	np->r_mapcnt += btopr(len);
45565f4fc069Sjilinxpd 	mutex_exit(&np->r_statelock);
45575f4fc069Sjilinxpd 
45585f4fc069Sjilinxpd 	if (inc_fidrefs) {
45595f4fc069Sjilinxpd 		(void) smbfs_rw_enter_sig(&np->r_lkserlock, RW_WRITER, 0);
45605f4fc069Sjilinxpd 		np->n_fidrefs++;
45615f4fc069Sjilinxpd 		smbfs_rw_exit(&np->r_lkserlock);
45625f4fc069Sjilinxpd 	}
45635f4fc069Sjilinxpd 
45645f4fc069Sjilinxpd 	return (0);
45655f4fc069Sjilinxpd }
45665f4fc069Sjilinxpd 
45675f4fc069Sjilinxpd /*
45684e72ade1SGordon Ross  * Args passed to smbfs_delmap_async
45695f4fc069Sjilinxpd  */
45705f4fc069Sjilinxpd typedef struct smbfs_delmap_args {
45714e72ade1SGordon Ross 	taskq_ent_t		dm_tqent;
45724e72ade1SGordon Ross 	cred_t			*dm_cr;
45734e72ade1SGordon Ross 	vnode_t			*dm_vp;
45744e72ade1SGordon Ross 	offset_t		dm_off;
45754e72ade1SGordon Ross 	caddr_t			dm_addr;
45764e72ade1SGordon Ross 	size_t			dm_len;
45774e72ade1SGordon Ross 	uint_t			dm_prot;
45784e72ade1SGordon Ross 	uint_t			dm_maxprot;
45794e72ade1SGordon Ross 	uint_t			dm_flags;
45804e72ade1SGordon Ross 	boolean_t		dm_rele_fid;
45815f4fc069Sjilinxpd } smbfs_delmap_args_t;
45825f4fc069Sjilinxpd 
45834e72ade1SGordon Ross /*
45844e72ade1SGordon Ross  * Using delmap not only to release the SMB FID (as described above)
45854e72ade1SGordon Ross  * but to flush dirty pages as needed.  Both of those do the actual
45864e72ade1SGordon Ross  * work in an async taskq job to avoid interfering with locks held
45874e72ade1SGordon Ross  * in the VM layer when this is called.
45884e72ade1SGordon Ross  */
45894e72ade1SGordon Ross 
45905f4fc069Sjilinxpd /* ARGSUSED */
45915f4fc069Sjilinxpd static int
45925f4fc069Sjilinxpd smbfs_delmap(vnode_t *vp, offset_t off, struct as *as, caddr_t addr,
45935f4fc069Sjilinxpd 	size_t len, uint_t prot, uint_t maxprot, uint_t flags,
45945f4fc069Sjilinxpd 	cred_t *cr, caller_context_t *ct)
45955f4fc069Sjilinxpd {
45964e72ade1SGordon Ross 	smbnode_t		*np = VTOSMB(vp);
45974e72ade1SGordon Ross 	smbmntinfo_t		*smi = VTOSMI(vp);
45985f4fc069Sjilinxpd 	smbfs_delmap_args_t	*dmapp;
45995f4fc069Sjilinxpd 
46005f4fc069Sjilinxpd 	dmapp = kmem_zalloc(sizeof (*dmapp), KM_SLEEP);
46015f4fc069Sjilinxpd 
46024e72ade1SGordon Ross 	/*
46034e72ade1SGordon Ross 	 * The VM layer may segvn_free the seg holding this vnode
46044e72ade1SGordon Ross 	 * before our callback has a chance to run, so take a hold on
46054e72ade1SGordon Ross 	 * the vnode here and release it in the callback.
46064e72ade1SGordon Ross 	 * (same for the cred)
46074e72ade1SGordon Ross 	 */
46084e72ade1SGordon Ross 	crhold(cr);
46094e72ade1SGordon Ross 	VN_HOLD(vp);
46104e72ade1SGordon Ross 
46114e72ade1SGordon Ross 	dmapp->dm_vp = vp;
46124e72ade1SGordon Ross 	dmapp->dm_cr = cr;
46134e72ade1SGordon Ross 	dmapp->dm_off = off;
46144e72ade1SGordon Ross 	dmapp->dm_addr = addr;
46154e72ade1SGordon Ross 	dmapp->dm_len = len;
46164e72ade1SGordon Ross 	dmapp->dm_prot = prot;
46174e72ade1SGordon Ross 	dmapp->dm_maxprot = maxprot;
46184e72ade1SGordon Ross 	dmapp->dm_flags = flags;
46194e72ade1SGordon Ross 	dmapp->dm_rele_fid = B_FALSE;
46205f4fc069Sjilinxpd 
46215f4fc069Sjilinxpd 	/*
46224e72ade1SGordon Ross 	 * Go ahead and decrement r_mapcnt now, which is
46234e72ade1SGordon Ross 	 * the primary purpose of this function.
46244e72ade1SGordon Ross 	 *
46254e72ade1SGordon Ross 	 * When r_mapcnt goes to zero, we need to call
46264e72ade1SGordon Ross 	 * smbfs_rele_fid, but can't do that here, so
46274e72ade1SGordon Ross 	 * set a flag telling the async task to do it.
46285f4fc069Sjilinxpd 	 */
46295f4fc069Sjilinxpd 	mutex_enter(&np->r_statelock);
46305f4fc069Sjilinxpd 	np->r_mapcnt -= btopr(len);
46315f4fc069Sjilinxpd 	ASSERT(np->r_mapcnt >= 0);
46325f4fc069Sjilinxpd 	if (np->r_mapcnt == 0)
46334e72ade1SGordon Ross 		dmapp->dm_rele_fid = B_TRUE;
46345f4fc069Sjilinxpd 	mutex_exit(&np->r_statelock);
46355f4fc069Sjilinxpd 
46364e72ade1SGordon Ross 	taskq_dispatch_ent(smi->smi_taskq, smbfs_delmap_async, dmapp, 0,
46374e72ade1SGordon Ross 	    &dmapp->dm_tqent);
46385f4fc069Sjilinxpd 
46395f4fc069Sjilinxpd 	return (0);
46405f4fc069Sjilinxpd }
46415f4fc069Sjilinxpd 
46425f4fc069Sjilinxpd /*
46435f4fc069Sjilinxpd  * Remove some pages from an mmap'd vnode.  Flush any
46445f4fc069Sjilinxpd  * dirty pages in the unmapped range.
46455f4fc069Sjilinxpd  */
46465f4fc069Sjilinxpd /* ARGSUSED */
46475f4fc069Sjilinxpd static void
46484e72ade1SGordon Ross smbfs_delmap_async(void *varg)
46495f4fc069Sjilinxpd {
46504e72ade1SGordon Ross 	smbfs_delmap_args_t	*dmapp = varg;
46514e72ade1SGordon Ross 	cred_t			*cr;
46525f4fc069Sjilinxpd 	vnode_t			*vp;
46535f4fc069Sjilinxpd 	smbnode_t		*np;
46545f4fc069Sjilinxpd 	smbmntinfo_t		*smi;
46555f4fc069Sjilinxpd 
46564e72ade1SGordon Ross 	cr = dmapp->dm_cr;
46574e72ade1SGordon Ross 	vp = dmapp->dm_vp;
46585f4fc069Sjilinxpd 	np = VTOSMB(vp);
46595f4fc069Sjilinxpd 	smi = VTOSMI(vp);
46605f4fc069Sjilinxpd 
46615f4fc069Sjilinxpd 	/* Decremented r_mapcnt in smbfs_delmap */
46625f4fc069Sjilinxpd 
46635f4fc069Sjilinxpd 	/*
46645f4fc069Sjilinxpd 	 * Initiate a page flush and potential commit if there are
46655f4fc069Sjilinxpd 	 * pages, the file system was not mounted readonly, the segment
46665f4fc069Sjilinxpd 	 * was mapped shared, and the pages themselves were writeable.
46675f4fc069Sjilinxpd 	 *
46685f4fc069Sjilinxpd 	 * Mark RDIRTY here; it will be used to check whether the file
46695f4fc069Sjilinxpd 	 * is dirty when unmounting smbfs.
46705f4fc069Sjilinxpd 	 */
46715f4fc069Sjilinxpd 	if (vn_has_cached_data(vp) && !vn_is_readonly(vp) &&
46724e72ade1SGordon Ross 	    dmapp->dm_flags == MAP_SHARED &&
46734e72ade1SGordon Ross 	    (dmapp->dm_maxprot & PROT_WRITE) != 0) {
46745f4fc069Sjilinxpd 		mutex_enter(&np->r_statelock);
46755f4fc069Sjilinxpd 		np->r_flags |= RDIRTY;
46765f4fc069Sjilinxpd 		mutex_exit(&np->r_statelock);
46775f4fc069Sjilinxpd 
46785f4fc069Sjilinxpd 		/*
46795f4fc069Sjilinxpd 		 * Need to finish the putpage before we
46805f4fc069Sjilinxpd 		 * close the OtW FID needed for I/O.
46815f4fc069Sjilinxpd 		 */
46824e72ade1SGordon Ross 		(void) smbfs_putpage(vp, dmapp->dm_off, dmapp->dm_len, 0,
46834e72ade1SGordon Ross 		    dmapp->dm_cr, NULL);
46845f4fc069Sjilinxpd 	}
46855f4fc069Sjilinxpd 
46865f4fc069Sjilinxpd 	if ((np->r_flags & RDIRECTIO) || (smi->smi_flags & SMI_DIRECTIO))
46874e72ade1SGordon Ross 		(void) smbfs_putpage(vp, dmapp->dm_off, dmapp->dm_len,
46884e72ade1SGordon Ross 		    B_INVAL, dmapp->dm_cr, NULL);
46895f4fc069Sjilinxpd 
46905f4fc069Sjilinxpd 	/*
46915f4fc069Sjilinxpd 	 * If r_mapcnt went to zero, drop our FID ref now.
46925f4fc069Sjilinxpd 	 * On the last fidref, this does an OtW close.
46935f4fc069Sjilinxpd 	 */
46944e72ade1SGordon Ross 	if (dmapp->dm_rele_fid) {
46955f4fc069Sjilinxpd 		struct smb_cred scred;
46965f4fc069Sjilinxpd 
46975f4fc069Sjilinxpd 		(void) smbfs_rw_enter_sig(&np->r_lkserlock, RW_WRITER, 0);
46984e72ade1SGordon Ross 		smb_credinit(&scred, dmapp->dm_cr);
46995f4fc069Sjilinxpd 
47005f4fc069Sjilinxpd 		smbfs_rele_fid(np, &scred);
47015f4fc069Sjilinxpd 
47025f4fc069Sjilinxpd 		smb_credrele(&scred);
47035f4fc069Sjilinxpd 		smbfs_rw_exit(&np->r_lkserlock);
47045f4fc069Sjilinxpd 	}
47055f4fc069Sjilinxpd 
47064e72ade1SGordon Ross 	/* Release holds taken in smbfs_delmap */
47074e72ade1SGordon Ross 	VN_RELE(vp);
47084e72ade1SGordon Ross 	crfree(cr);
47094e72ade1SGordon Ross 
47105f4fc069Sjilinxpd 	kmem_free(dmapp, sizeof (*dmapp));
47115f4fc069Sjilinxpd }
47125f4fc069Sjilinxpd 
47135f4fc069Sjilinxpd /* No smbfs_pageio() or smbfs_dispose() ops. */
47145f4fc069Sjilinxpd 
47158329232eSGordon Ross #endif	// _KERNEL
47168329232eSGordon Ross 
47175f4fc069Sjilinxpd /* misc. ******************************************************** */
47185f4fc069Sjilinxpd 
47194bff34e3Sthurlow 
47204bff34e3Sthurlow /*
47214bff34e3Sthurlow  * XXX
47224bff34e3Sthurlow  * This op may need to support PSARC 2007/440, nbmand changes for CIFS Service.
47234bff34e3Sthurlow  */
47244bff34e3Sthurlow static int
47254bff34e3Sthurlow smbfs_frlock(vnode_t *vp, int cmd, struct flock64 *bfp, int flag,
47264bff34e3Sthurlow 	offset_t offset, struct flk_callback *flk_cbp, cred_t *cr,
47274bff34e3Sthurlow 	caller_context_t *ct)
47284bff34e3Sthurlow {
4729a19609f8Sjv 	if (curproc->p_zone != VTOSMI(vp)->smi_zone_ref.zref_zone)
47304bff34e3Sthurlow 		return (EIO);
47314bff34e3Sthurlow 
47324bff34e3Sthurlow 	if (VTOSMI(vp)->smi_flags & SMI_LLOCK)
47334bff34e3Sthurlow 		return (fs_frlock(vp, cmd, bfp, flag, offset, flk_cbp, cr, ct));
47344bff34e3Sthurlow 	else
47354bff34e3Sthurlow 		return (ENOSYS);
47364bff34e3Sthurlow }
47374bff34e3Sthurlow 
47384bff34e3Sthurlow /*
47394bff34e3Sthurlow  * Free storage space associated with the specified vnode.  The portion
47404bff34e3Sthurlow  * to be freed is specified by bfp->l_start and bfp->l_len (already
47414bff34e3Sthurlow  * normalized to a "whence" of 0).
47424bff34e3Sthurlow  *
47434bff34e3Sthurlow  * Called by fcntl(fd, F_FREESP, lkp) for libc:ftruncate, etc.
47444bff34e3Sthurlow  */
47454bff34e3Sthurlow /* ARGSUSED */
47464bff34e3Sthurlow static int
47474bff34e3Sthurlow smbfs_space(vnode_t *vp, int cmd, struct flock64 *bfp, int flag,
47484bff34e3Sthurlow 	offset_t offset, cred_t *cr, caller_context_t *ct)
47494bff34e3Sthurlow {
47504bff34e3Sthurlow 	int		error;
47514bff34e3Sthurlow 	smbmntinfo_t	*smi;
47524bff34e3Sthurlow 
47534bff34e3Sthurlow 	smi = VTOSMI(vp);
47544bff34e3Sthurlow 
4755a19609f8Sjv 	if (curproc->p_zone != smi->smi_zone_ref.zref_zone)
47564bff34e3Sthurlow 		return (EIO);
47574bff34e3Sthurlow 
47584bff34e3Sthurlow 	if (smi->smi_flags & SMI_DEAD || vp->v_vfsp->vfs_flag & VFS_UNMOUNTED)
47594bff34e3Sthurlow 		return (EIO);
47604bff34e3Sthurlow 
476191d632c8Sgwr 	/* Caller (fcntl) has checked v_type */
47624bff34e3Sthurlow 	ASSERT(vp->v_type == VREG);
47634bff34e3Sthurlow 	if (cmd != F_FREESP)
47644bff34e3Sthurlow 		return (EINVAL);
47654bff34e3Sthurlow 
47664bff34e3Sthurlow 	/*
47674bff34e3Sthurlow 	 * Like NFS3, no 32-bit offset checks here.
47684bff34e3Sthurlow 	 * Our SMB layer takes care to return EFBIG
47694bff34e3Sthurlow 	 * when it has to fallback to a 32-bit call.
47704bff34e3Sthurlow 	 */
47714bff34e3Sthurlow 
47724bff34e3Sthurlow 	error = convoff(vp, bfp, 0, offset);
47734bff34e3Sthurlow 	if (!error) {
47744bff34e3Sthurlow 		ASSERT(bfp->l_start >= 0);
47754bff34e3Sthurlow 		if (bfp->l_len == 0) {
47764bff34e3Sthurlow 			struct vattr va;
47774bff34e3Sthurlow 
47784bff34e3Sthurlow 			/*
47794bff34e3Sthurlow 			 * ftruncate should not change the ctime and
47804bff34e3Sthurlow 			 * mtime if we truncate the file to its
47814bff34e3Sthurlow 			 * previous size.
47824bff34e3Sthurlow 			 */
47834bff34e3Sthurlow 			va.va_mask = AT_SIZE;
47844bff34e3Sthurlow 			error = smbfsgetattr(vp, &va, cr);
47854bff34e3Sthurlow 			if (error || va.va_size == bfp->l_start)
47864bff34e3Sthurlow 				return (error);
47874bff34e3Sthurlow 			va.va_mask = AT_SIZE;
47884bff34e3Sthurlow 			va.va_size = bfp->l_start;
47894bff34e3Sthurlow 			error = smbfssetattr(vp, &va, 0, cr);
47905f4fc069Sjilinxpd 			/* SMBFS_VNEVENT... */
47914bff34e3Sthurlow 		} else
47924bff34e3Sthurlow 			error = EINVAL;
47934bff34e3Sthurlow 	}
47944bff34e3Sthurlow 
47954bff34e3Sthurlow 	return (error);
47964bff34e3Sthurlow }
47974bff34e3Sthurlow 
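/*
 * Example (illustrative, hypothetical userland code): the kind of
 * call that reaches smbfs_space().  With l_len == 0, the file is
 * truncated to l_start bytes, which is how libc implements
 * ftruncate(fd, newsize) on this platform.
 *
 *	struct flock fl;
 *
 *	fl.l_whence = SEEK_SET;	// l_start is an absolute offset
 *	fl.l_start = newsize;	// free everything from here on
 *	fl.l_len = 0;		// zero length means "to EOF"
 *	if (fcntl(fd, F_FREESP, &fl) == -1)
 *		perror("fcntl(F_FREESP)");
 */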

/* ARGSUSED */
static int
smbfs_realvp(vnode_t *vp, vnode_t **vpp, caller_context_t *ct)
{
	return (ENOSYS);
}


/* ARGSUSED */
static int
smbfs_pathconf(vnode_t *vp, int cmd, ulong_t *valp, cred_t *cr,
	caller_context_t *ct)
{
	vfs_t *vfs;
	smbmntinfo_t *smi;
	struct smb_share *ssp;

	vfs = vp->v_vfsp;
	smi = VFTOSMI(vfs);

	if (curproc->p_zone != smi->smi_zone_ref.zref_zone)
		return (EIO);

	if (smi->smi_flags & SMI_DEAD || vp->v_vfsp->vfs_flag & VFS_UNMOUNTED)
		return (EIO);

	switch (cmd) {
	case _PC_FILESIZEBITS:
		ssp = smi->smi_share;
		if (SSTOVC(ssp)->vc_sopt.sv_caps & SMB_CAP_LARGE_FILES)
			*valp = 64;
		else
			*valp = 32;
		break;

	case _PC_LINK_MAX:
		/* We only ever report one link to an object */
		*valp = 1;
		break;

	case _PC_ACL_ENABLED:
		/*
		 * Always indicate that ACLs are enabled and
		 * that we support ACE_T format, otherwise
		 * libsec will ask for ACLENT_T format data
		 * which we don't support.
		 */
		*valp = _ACL_ACE_ENABLED;
		break;

	case _PC_SYMLINK_MAX:	/* No symlinks until we do Unix extensions */
		*valp = 0;
		break;

	case _PC_XATTR_EXISTS:
		if (vfs->vfs_flag & VFS_XATTR) {
			*valp = smbfs_xa_exists(vp, cr);
			break;
		}
		return (EINVAL);

	case _PC_SATTR_ENABLED:
	case _PC_SATTR_EXISTS:
		*valp = 1;
		break;

	case _PC_TIMESTAMP_RESOLUTION:
		/*
		 * Windows times are tenths of microseconds
		 * (multiples of 100 nanoseconds).
		 */
		*valp = 100L;
		break;

	default:
		return (fs_pathconf(vp, cmd, valp, cr, ct));
	}
	return (0);
}

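/*
 * Example (illustrative, hypothetical userland code): querying the
 * values reported above.  fpathconf(3C) returns -1 without changing
 * errno when a limit is indeterminate, so errno must be cleared
 * first to distinguish that case from an error.
 *
 *	long bits;
 *
 *	errno = 0;
 *	bits = fpathconf(fd, _PC_FILESIZEBITS);
 *	if (bits == -1 && errno != 0)
 *		perror("fpathconf");
 *	else
 *		printf("file size bits: %ld\n", bits);	// 64 or 32
 */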
/* ARGSUSED */
static int
smbfs_getsecattr(vnode_t *vp, vsecattr_t *vsa, int flag, cred_t *cr,
	caller_context_t *ct)
{
	vfs_t *vfsp;
	smbmntinfo_t *smi;
	int	error;
	uint_t	mask;

	vfsp = vp->v_vfsp;
	smi = VFTOSMI(vfsp);

	if (curproc->p_zone != smi->smi_zone_ref.zref_zone)
		return (EIO);

	if (smi->smi_flags & SMI_DEAD || vfsp->vfs_flag & VFS_UNMOUNTED)
		return (EIO);

	/*
	 * Our _pathconf indicates _ACL_ACE_ENABLED,
	 * so we should only see VSA_ACE, etc here.
	 * Note: vn_create asks for VSA_DFACLCNT,
	 * and it expects ENOSYS and empty data.
	 */
	mask = vsa->vsa_mask & (VSA_ACE | VSA_ACECNT |
	    VSA_ACE_ACLFLAGS | VSA_ACE_ALLTYPES);
	if (mask == 0)
		return (ENOSYS);

	if (smi->smi_flags & SMI_ACL)
		error = smbfs_acl_getvsa(vp, vsa, flag, cr);
	else
		error = ENOSYS;

	if (error == ENOSYS)
		error = fs_fab_acl(vp, vsa, flag, cr, ct);

	return (error);
}

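/*
 * Example (illustrative, hypothetical userland code): libsec drives
 * this op when reading an ACL.  Because _pathconf reports
 * _ACL_ACE_ENABLED, acl_get(3SEC) asks for ACE (NFSv4/ZFS style)
 * entries, which arrive here as a VSA_ACE request.
 *
 *	acl_t *aclp = NULL;
 *	char *text;
 *
 *	if (acl_get("/mnt/smb/file", 0, &aclp) == 0) {
 *		text = acl_totext(aclp, 0);
 *		printf("%s\n", text);
 *		free(text);
 *		acl_free(aclp);
 *	}
 */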
/* ARGSUSED */
static int
smbfs_setsecattr(vnode_t *vp, vsecattr_t *vsa, int flag, cred_t *cr,
	caller_context_t *ct)
{
	vfs_t *vfsp;
	smbmntinfo_t *smi;
	int	error;
	uint_t	mask;

	vfsp = vp->v_vfsp;
	smi = VFTOSMI(vfsp);

	if (curproc->p_zone != smi->smi_zone_ref.zref_zone)
		return (EIO);

	if (smi->smi_flags & SMI_DEAD || vfsp->vfs_flag & VFS_UNMOUNTED)
		return (EIO);

	/*
	 * Our _pathconf indicates _ACL_ACE_ENABLED,
	 * so we should only see VSA_ACE, etc here.
	 */
	mask = vsa->vsa_mask & (VSA_ACE | VSA_ACECNT);
	if (mask == 0)
		return (ENOSYS);

	if (vfsp->vfs_flag & VFS_RDONLY)
		return (EROFS);

	/*
	 * Allow only the mount owner to do this.
	 * See comments at smbfs_access_rwx.
	 */
	error = secpolicy_vnode_setdac(cr, smi->smi_uid);
	if (error != 0)
		return (error);

	if (smi->smi_flags & SMI_ACL)
		error = smbfs_acl_setvsa(vp, vsa, flag, cr);
	else
		error = ENOSYS;

	return (error);
}
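
/*
 * Example (illustrative, hypothetical userland code): the write-side
 * counterpart.  An ACL update via acl_set(3SEC) lands here as a
 * VSA_ACE request, and is rejected unless the caller passes the
 * mount-owner check above.  The ACE text below is just a sample.
 *
 *	acl_t *aclp = NULL;
 *
 *	if (acl_fromtext("owner@:read_data/write_data:allow",
 *	    &aclp) == 0) {
 *		if (acl_set("/mnt/smb/file", aclp) == -1)
 *			perror("acl_set");	// e.g. EPERM for non-owner
 *		acl_free(aclp);
 *	}
 */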

/*
 * XXX
 * This op should eventually support PSARC 2007/268.
 */
static int
smbfs_shrlock(vnode_t *vp, int cmd, struct shrlock *shr, int flag, cred_t *cr,
	caller_context_t *ct)
{
	if (curproc->p_zone != VTOSMI(vp)->smi_zone_ref.zref_zone)
		return (EIO);

	if (VTOSMI(vp)->smi_flags & SMI_LLOCK)
		return (fs_shrlock(vp, cmd, shr, flag, cr, ct));
	else
		return (ENOSYS);
}


/*
 * Most unimplemented ops will return ENOSYS because of fs_nosys().
 * The only ops where that won't work are ACCESS (due to open(2)
 * failures) and ... (anything else left?)
 */
const fs_operation_def_t smbfs_vnodeops_template[] = {
	VOPNAME_OPEN,		{ .vop_open = smbfs_open },
	VOPNAME_CLOSE,		{ .vop_close = smbfs_close },
	VOPNAME_READ,		{ .vop_read = smbfs_read },
	VOPNAME_WRITE,		{ .vop_write = smbfs_write },
	VOPNAME_IOCTL,		{ .vop_ioctl = smbfs_ioctl },
	VOPNAME_GETATTR,	{ .vop_getattr = smbfs_getattr },
	VOPNAME_SETATTR,	{ .vop_setattr = smbfs_setattr },
	VOPNAME_ACCESS,		{ .vop_access = smbfs_access },
	VOPNAME_LOOKUP,		{ .vop_lookup = smbfs_lookup },
	VOPNAME_CREATE,		{ .vop_create = smbfs_create },
	VOPNAME_REMOVE,		{ .vop_remove = smbfs_remove },
	VOPNAME_LINK,		{ .vop_link = smbfs_link },
	VOPNAME_RENAME,		{ .vop_rename = smbfs_rename },
	VOPNAME_MKDIR,		{ .vop_mkdir = smbfs_mkdir },
	VOPNAME_RMDIR,		{ .vop_rmdir = smbfs_rmdir },
	VOPNAME_READDIR,	{ .vop_readdir = smbfs_readdir },
	VOPNAME_SYMLINK,	{ .vop_symlink = smbfs_symlink },
	VOPNAME_READLINK,	{ .vop_readlink = smbfs_readlink },
	VOPNAME_FSYNC,		{ .vop_fsync = smbfs_fsync },
	VOPNAME_INACTIVE,	{ .vop_inactive = smbfs_inactive },
	VOPNAME_FID,		{ .vop_fid = smbfs_fid },
	VOPNAME_RWLOCK,		{ .vop_rwlock = smbfs_rwlock },
	VOPNAME_RWUNLOCK,	{ .vop_rwunlock = smbfs_rwunlock },
	VOPNAME_SEEK,		{ .vop_seek = smbfs_seek },
	VOPNAME_FRLOCK,		{ .vop_frlock = smbfs_frlock },
	VOPNAME_SPACE,		{ .vop_space = smbfs_space },
	VOPNAME_REALVP,		{ .vop_realvp = smbfs_realvp },
#ifdef	_KERNEL
	VOPNAME_GETPAGE,	{ .vop_getpage = smbfs_getpage },
	VOPNAME_PUTPAGE,	{ .vop_putpage = smbfs_putpage },
	VOPNAME_MAP,		{ .vop_map = smbfs_map },
	VOPNAME_ADDMAP,		{ .vop_addmap = smbfs_addmap },
	VOPNAME_DELMAP,		{ .vop_delmap = smbfs_delmap },
#endif	// _KERNEL
	VOPNAME_PATHCONF,	{ .vop_pathconf = smbfs_pathconf },
	VOPNAME_SETSECATTR,	{ .vop_setsecattr = smbfs_setsecattr },
	VOPNAME_GETSECATTR,	{ .vop_getsecattr = smbfs_getsecattr },
	VOPNAME_SHRLOCK,	{ .vop_shrlock = smbfs_shrlock },
#ifdef	SMBFS_VNEVENT
	VOPNAME_VNEVENT,	{ .vop_vnevent = fs_vnevent_support },
#endif
	{ NULL, NULL }
};
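
/*
 * Example (illustrative sketch): how a template like the one above
 * is turned into a usable vnodeops_t at module initialization time.
 * The real call for smbfs lives in the vfs init code, not here.
 *
 *	vnodeops_t *smbfs_vnodeops;
 *
 *	error = vn_make_ops("smbfs", smbfs_vnodeops_template,
 *	    &smbfs_vnodeops);
 *	if (error != 0)
 *		cmn_err(CE_WARN, "smbfs: bad vnode ops template");
 */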