1 /*
   2  * Copyright (c) 2000-2001, Boris Popov
   3  * All rights reserved.
   4  *
   5  * Redistribution and use in source and binary forms, with or without
   6  * modification, are permitted provided that the following conditions
   7  * are met:
   8  * 1. Redistributions of source code must retain the above copyright
   9  *    notice, this list of conditions and the following disclaimer.
  10  * 2. Redistributions in binary form must reproduce the above copyright
  11  *    notice, this list of conditions and the following disclaimer in the
  12  *    documentation and/or other materials provided with the distribution.
  13  * 3. All advertising materials mentioning features or use of this software
  14  *    must display the following acknowledgement:
  15  *    This product includes software developed by Boris Popov.
  16  * 4. Neither the name of the author nor the names of any co-contributors
  17  *    may be used to endorse or promote products derived from this software
  18  *    without specific prior written permission.
  19  *
  20  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
  21  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  22  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  23  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
  24  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  25  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  26  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  27  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  28  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  29  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  30  * SUCH DAMAGE.
  31  *
  32  * $Id: smbfs_node.h,v 1.31.52.1 2005/05/27 02:35:28 lindak Exp $
  33  */
  34 
  35 /*
  36  * Copyright 2011 Nexenta Systems, Inc.  All rights reserved.
  37  * Copyright 2010 Sun Microsystems, Inc.  All rights reserved.
  38  * Use is subject to license terms.
  39  */
  40 
  41 #ifndef _FS_SMBFS_NODE_H_
  42 #define _FS_SMBFS_NODE_H_
  43 
  44 /*
  45  * Much code copied into here from Sun NFS.
  46  * Compare with nfs_clnt.h
  47  */
  48 
  49 #include <sys/avl.h>
  50 #include <sys/list.h>
  51 #include <netsmb/smb_subr.h>
  52 
  53 #ifdef __cplusplus
  54 extern "C" {
  55 #endif
  56 
  57 /*
  58  * Cache whole directories (not yet)
  59  */
  60 typedef struct rddir_cache {
  61         lloff_t _cookie;        /* cookie used to find this cache entry */
  62         lloff_t _ncookie;       /* cookie used to find the next cache entry */
  63         char *entries;          /* buffer containing dirent entries */
  64         int eof;                /* EOF reached after this request */
  65         int entlen;             /* size of dirent entries in buf */
  66         int buflen;             /* size of the buffer used to store entries */
  67         int flags;              /* control flags, see below */
  68         kcondvar_t cv;          /* cv for blocking */
  69         int error;              /* error from RPC operation */
  70         kmutex_t lock;
  71         uint_t count;           /* reference count */
  72         avl_node_t tree;        /* AVL tree links */
  73 } rddir_cache;
  74 
  75 #define smbfs_cookie    _cookie._p._l
  76 #define smbfs_ncookie   _ncookie._p._l
  77 #define smbfs3_cookie   _cookie._f
  78 #define smbfs3_ncookie  _ncookie._f
  79 
  80 #define RDDIR           0x1     /* readdir operation in progress */
  81 #define RDDIRWAIT       0x2     /* waiting on readdir in progress */
  82 #define RDDIRREQ        0x4     /* a new readdir is required */
  83 #define RDDIRCACHED     0x8     /* entry is in the cache */
  84 
  85 #define HAVE_RDDIR_CACHE(rp)    (avl_numnodes(&(rp)->r_dir) > 0)
  86 
  87 /*
  88  * A homegrown reader/writer lock implementation.  It addresses
  89  * two requirements not addressed by the system primitives.  They
  90  * are that the `enter" operation is optionally interruptible and
  91  * that that they can be re`enter'ed by writers without deadlock.
  92  */
  93 typedef struct smbfs_rwlock {
  94         int count;
  95         int waiters;
  96         kthread_t *owner;
  97         kmutex_t lock;
  98         kcondvar_t cv;
  99 } smbfs_rwlock_t;
 100 
 101 /*
 102  * The format of the smbfs node header, which contains the
 103  * fields used to link nodes in the AVL tree, and those
 104  * fields needed by the AVL node comparison functions.
 105  * It's a separate struct so we can call avl_find with
 106  * this relatively small struct as a stack local.
 107  *
 108  * The AVL tree is mntinfo.smi_hash_avl,
 109  * and its lock is mntinfo.smi_hash_lk.
 110  */
 111 typedef struct smbfs_node_hdr {
 112         /*
 113          * Our linkage in the node cache AVL tree.
 114          */
 115         avl_node_t      hdr_avl_node;
 116 
 117         /*
 118          * Identity of this node:  The full path name,
 119          * in server form, relative to the share root.
 120          */
 121         char            *hdr_n_rpath;
 122         int             hdr_n_rplen;
 123 } smbfs_node_hdr_t;
 124 
 125 /*
 126  * Below is the SMBFS-specific representation of a "node".
 127  * This struct is a mixture of Sun NFS and Darwin code.
 128  * Fields starting with "r_" came from NFS struct "rnode"
 129  * and fields starting with "n_" came from Darwin, or
 130  * were added during the Solaris port.  We have avoided
 131  * renaming fields so we would not cause excessive
 132  * changes in the code using this struct.
 133  *
 134  * Now using an AVL tree instead of hash lists, but kept the
 135  * "hash" in some member names and functions to reduce churn.
 136  * One AVL tree per mount replaces the global hash buckets.
 137  *
 138  * Notes carried over from the NFS code:
 139  *
 140  * The smbnode is the "inode" for remote files.  It contains all the
 141  * information necessary to handle remote file on the client side.
 142  *
 143  * Note on file sizes:  we keep two file sizes in the smbnode: the size
 144  * according to the client (r_size) and the size according to the server
 145  * (r_attr.fa_size).  They can differ because we modify r_size during a
 146  * write system call (smbfs_rdwr), before the write request goes over the
 147  * wire (before the file is actually modified on the server).  If an OTW
 148  * request occurs before the cached data is written to the server the file
 149  * size returned from the server (r_attr.fa_size) may not match r_size.
 150  * r_size is the one we use, in general.  r_attr.fa_size is only used to
 151  * determine whether or not our cached data is valid.
 152  *
 153  * Each smbnode has 3 locks associated with it (not including the smbnode
 154  * "hash" AVL tree and free list locks):
 155  *
 156  *      r_rwlock:       Serializes smbfs_write and smbfs_setattr requests
 157  *                      and allows smbfs_read requests to proceed in parallel.
 158  *                      Serializes reads/updates to directories.
 159  *
 160  *      r_lkserlock:    Serializes lock requests with map, write, and
 161  *                      readahead operations.
 162  *
 163  *      r_statelock:    Protects all fields in the smbnode except for
 164  *                      those listed below.  This lock is intented
 165  *                      to be held for relatively short periods of
 166  *                      time (not accross entire putpage operations,
 167  *                      for example).
 168  *
 169  * The following members are protected by the mutex smbfreelist_lock:
 170  *      r_freef
 171  *      r_freeb
 172  *
 173  * The following members are protected by the AVL tree rwlock:
 174  *      r_avl_node      (r__hdr.hdr_avl_node)
 175  *
 176  * Note: r_modaddr is only accessed when the r_statelock mutex is held.
 177  *      Its value is also controlled via r_rwlock.  It is assumed that
 178  *      there will be only 1 writer active at a time, so it safe to
 179  *      set r_modaddr and release r_statelock as long as the r_rwlock
 180  *      writer lock is held.
 181  *
 182  * 64-bit offsets: the code formerly assumed that atomic reads of
 183  * r_size were safe and reliable; on 32-bit architectures, this is
 184  * not true since an intervening bus cycle from another processor
 185  * could update half of the size field.  The r_statelock must now
 186  * be held whenever any kind of access of r_size is made.
 187  *
 188  * Lock ordering:
 189  *      r_rwlock > r_lkserlock > r_statelock
 190  */
 191 
 192 typedef struct smbnode {
 193         /* Our linkage in the node cache AVL tree (see above). */
 194         smbfs_node_hdr_t        r__hdr;
 195 
 196         /* short-hand names for r__hdr members */
 197 #define r_avl_node      r__hdr.hdr_avl_node
 198 #define n_rpath         r__hdr.hdr_n_rpath
 199 #define n_rplen         r__hdr.hdr_n_rplen
 200 
 201         smbmntinfo_t    *n_mount;       /* VFS data */
 202         vnode_t         *r_vnode;       /* associated vnode */
 203 
 204         /*
 205          * Linkage in smbfreelist, for reclaiming nodes.
 206          * Lock for the free list is: smbfreelist_lock
 207          */
 208         struct smbnode  *r_freef;       /* free list forward pointer */
 209         struct smbnode  *r_freeb;       /* free list back pointer */
 210 
 211         smbfs_rwlock_t  r_rwlock;       /* serialize write/setattr requests */
 212         smbfs_rwlock_t  r_lkserlock;    /* serialize lock with other ops */
 213         kmutex_t        r_statelock;    /* protect (most) smbnode fields */
 214 
 215         /*
 216          * File handle, directory search handle,
 217          * and reference counts for them, etc.
 218          * Lock for these is: r_lkserlock
 219          */
 220         int             n_dirrefs;
 221         struct smbfs_fctx       *n_dirseq;      /* ff context */
 222         int             n_dirofs;       /* last ff offset */
 223         int             n_fidrefs;
 224         uint16_t        n_fid;          /* file handle */
 225         enum vtype      n_ovtype;       /* vnode type opened */
 226         uint32_t        n_rights;       /* granted rights */
 227         int             n_vcgenid;      /* gereration no. (reconnect) */
 228 
 229         /*
 230          * Misc. bookkeeping
 231          */
 232         cred_t          *r_cred;        /* current credentials */
 233         u_offset_t      r_nextr;        /* next read offset (read-ahead) */
 234         long            r_mapcnt;       /* count of mmapped pages */
 235         uint_t          r_inmap;        /* to serialize read/write and mmap */
 236         uint_t          r_count;        /* # of refs not reflect in v_count */
 237         uint_t          r_awcount;      /* # of outstanding async write */
 238         uint_t          r_gcount;       /* getattrs waiting to flush pages */
 239         uint_t          r_flags;        /* flags, see below */
 240         uint32_t        n_flag;         /* N--- flags below */
 241         uint_t          r_error;        /* async write error */
 242         kcondvar_t      r_cv;           /* condvar for blocked threads */
 243         avl_tree_t      r_dir;          /* cache of readdir responses */
 244         rddir_cache     *r_direof;      /* pointer to the EOF entry */
 245         u_offset_t      r_modaddr;      /* address for page in writenp */
 246         kthread_t       *r_serial;      /* id of purging thread */
 247         list_t          r_indelmap;     /* list of delmap callers */
 248 
 249         /*
 250          * Attributes: local, and as last seen on the server.
 251          * See notes above re: r_size vs r_attr.fa_size, etc.
 252          */
 253         smbfattr_t      r_attr;         /* attributes from the server */
 254         hrtime_t        r_attrtime;     /* time attributes become invalid */
 255         hrtime_t        r_mtime;        /* client time file last modified */
 256         len_t           r_size;         /* client's view of file size */
 257 
 258         /*
 259          * Security attributes.
 260          */
 261         vsecattr_t      r_secattr;
 262         hrtime_t        r_sectime;
 263 
 264         /*
 265          * Other attributes, not carried in smbfattr_t
 266          */
 267         u_longlong_t    n_ino;
 268         uid_t           n_uid;
 269         gid_t           n_gid;
 270         mode_t          n_mode;
 271 } smbnode_t;
 272 
 273 /*
 274  * Flag bits in: smbnode_t .n_flag
 275  */
 276 #define NFLUSHINPROG    0x00001
 277 #define NFLUSHWANT      0x00002 /* they should gone ... */
 278 #define NMODIFIED       0x00004 /* bogus, until async IO implemented */
 279 #define NREFPARENT      0x00010 /* node holds parent from recycling */
 280 #define NGOTIDS         0x00020
 281 #define NRDIRSERIAL     0x00080 /* serialize readdir operation */
 282 #define NISMAPPED       0x00800
 283 #define NFLUSHWIRE      0x01000
 284 #define NATTRCHANGED    0x02000 /* kill cached attributes at close */
 285 #define NALLOC          0x04000 /* being created */
 286 #define NWALLOC         0x08000 /* awaiting creation */
 287 #define N_XATTR         0x10000 /* extended attribute (dir or file) */
 288 
 289 /*
 290  * Flag bits in: smbnode_t .r_flags
 291  */
 292 #define RREADDIRPLUS    0x1     /* issue a READDIRPLUS instead of READDIR */
 293 #define RDIRTY          0x2     /* dirty pages from write operation */
 294 #define RSTALE          0x4     /* file handle is stale */
 295 #define RMODINPROGRESS  0x8     /* page modification happening */
 296 #define RTRUNCATE       0x10    /* truncating, don't commit */
 297 #define RHAVEVERF       0x20    /* have a write verifier to compare against */
 298 #define RCOMMIT         0x40    /* commit in progress */
 299 #define RCOMMITWAIT     0x80    /* someone is waiting to do a commit */
 300 #define RHASHED         0x100   /* smbnode is in the "hash" AVL tree */
 301 #define ROUTOFSPACE     0x200   /* an out of space error has happened */
 302 #define RDIRECTIO       0x400   /* bypass the buffer cache */
 303 #define RLOOKUP         0x800   /* a lookup has been performed */
 304 #define RWRITEATTR      0x1000  /* attributes came from WRITE */
 305 #define RINDNLCPURGE    0x2000  /* in the process of purging DNLC references */
 306 #define RDELMAPLIST     0x4000  /* delmap callers tracking for as callback */
 307 
 308 /*
 309  * Convert between vnode and smbnode
 310  */
 311 #define VTOSMB(vp)      ((smbnode_t *)((vp)->v_data))
 312 #define SMBTOV(np)      ((np)->r_vnode)
 313 
 314 /*
 315  * A macro to compute the separator that should be used for
 316  * names under some directory.  See smbfs_fullpath().
 317  */
 318 #define SMBFS_DNP_SEP(dnp) \
 319         (((dnp->n_flag & N_XATTR) == 0 && dnp->n_rplen > 1) ? '\\' : '\0')
 320 
 321 #ifdef __cplusplus
 322 }
 323 #endif
 324 
 325 #endif /* _FS_SMBFS_NODE_H_ */