1 /*
   2  * CDDL HEADER START
   3  *
   4  * The contents of this file are subject to the terms of the
   5  * Common Development and Distribution License (the "License").
   6  * You may not use this file except in compliance with the License.
   7  *
   8  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
   9  * or http://www.opensolaris.org/os/licensing.
  10  * See the License for the specific language governing permissions
  11  * and limitations under the License.
  12  *
  13  * When distributing Covered Code, include this CDDL HEADER in each
  14  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
  15  * If applicable, add the following below this CDDL HEADER, with the
  16  * fields enclosed by brackets "[]" replaced with your own identifying
  17  * information: Portions Copyright [yyyy] [name of copyright owner]
  18  *
  19  * CDDL HEADER END
  20  */
  21 
  22 /*
  23  * Copyright (c) 2008, 2010, Oracle and/or its affiliates. All rights reserved.
  24  * Copyright 2013 Nexenta Systems, Inc. All rights reserved.
  25  * Copyright (c) 2013 by Delphix. All rights reserved.
  26  */
  27 
  28 #include <sys/sysmacros.h>
  29 #include <sys/conf.h>
  30 #include <sys/file.h>
  31 #include <sys/ddi.h>
  32 #include <sys/sunddi.h>
  33 #include <sys/modctl.h>
  34 #include <sys/scsi/scsi.h>
  35 #include <sys/scsi/impl/scsi_reset_notify.h>
  36 #include <sys/disp.h>
  37 #include <sys/byteorder.h>
  38 #include <sys/pathname.h>
  39 #include <sys/atomic.h>
  40 #include <sys/nvpair.h>
  41 #include <sys/fs/zfs.h>
  42 #include <sys/sdt.h>
  43 #include <sys/dkio.h>
  44 #include <sys/zfs_ioctl.h>
  45 
  46 #include <sys/stmf.h>
  47 #include <sys/lpif.h>
  48 #include <sys/stmf_ioctl.h>
  49 #include <sys/stmf_sbd_ioctl.h>
  50 
  51 #include "stmf_sbd.h"
  52 #include "sbd_impl.h"
  53 
  54 #define SBD_IS_ZVOL(zvol)       (strncmp("/dev/zvol", zvol, 9))
  55 
  56 extern sbd_status_t sbd_pgr_meta_init(sbd_lu_t *sl);
  57 extern sbd_status_t sbd_pgr_meta_load(sbd_lu_t *sl);
  58 extern void sbd_pgr_reset(sbd_lu_t *sl);
  59 
  60 static int sbd_getinfo(dev_info_t *dip, ddi_info_cmd_t cmd, void *arg,
  61     void **result);
  62 static int sbd_attach(dev_info_t *dip, ddi_attach_cmd_t cmd);
  63 static int sbd_detach(dev_info_t *dip, ddi_detach_cmd_t cmd);
  64 static int sbd_open(dev_t *devp, int flag, int otype, cred_t *credp);
  65 static int sbd_close(dev_t dev, int flag, int otype, cred_t *credp);
  66 static int stmf_sbd_ioctl(dev_t dev, int cmd, intptr_t data, int mode,
  67     cred_t *credp, int *rval);
  68 void sbd_lp_cb(stmf_lu_provider_t *lp, int cmd, void *arg, uint32_t flags);
  69 stmf_status_t sbd_proxy_reg_lu(uint8_t *luid, void *proxy_reg_arg,
  70     uint32_t proxy_reg_arg_len);
  71 stmf_status_t sbd_proxy_dereg_lu(uint8_t *luid, void *proxy_reg_arg,
  72     uint32_t proxy_reg_arg_len);
  73 stmf_status_t sbd_proxy_msg(uint8_t *luid, void *proxy_arg,
  74     uint32_t proxy_arg_len, uint32_t type);
  75 int sbd_create_register_lu(sbd_create_and_reg_lu_t *slu, int struct_sz,
  76     uint32_t *err_ret);
  77 int sbd_create_standby_lu(sbd_create_standby_lu_t *slu, uint32_t *err_ret);
  78 int sbd_set_lu_standby(sbd_set_lu_standby_t *stlu, uint32_t *err_ret);
  79 int sbd_import_lu(sbd_import_lu_t *ilu, int struct_sz, uint32_t *err_ret,
  80     int no_register, sbd_lu_t **slr);
  81 int sbd_import_active_lu(sbd_import_lu_t *ilu, sbd_lu_t *sl, uint32_t *err_ret);
  82 int sbd_delete_lu(sbd_delete_lu_t *dlu, int struct_sz, uint32_t *err_ret);
  83 int sbd_modify_lu(sbd_modify_lu_t *mlu, int struct_sz, uint32_t *err_ret);
  84 int sbd_set_global_props(sbd_global_props_t *mlu, int struct_sz,
  85     uint32_t *err_ret);
  86 int sbd_get_global_props(sbd_global_props_t *oslp, uint32_t oslp_sz,
  87     uint32_t *err_ret);
  88 int sbd_get_lu_props(sbd_lu_props_t *islp, uint32_t islp_sz,
  89     sbd_lu_props_t *oslp, uint32_t oslp_sz, uint32_t *err_ret);
  90 static char *sbd_get_zvol_name(sbd_lu_t *);
  91 static int sbd_get_unmap_props(sbd_unmap_props_t *sup, sbd_unmap_props_t *osup,
  92     uint32_t *err_ret);
  93 sbd_status_t sbd_create_zfs_meta_object(sbd_lu_t *sl);
  94 sbd_status_t sbd_open_zfs_meta(sbd_lu_t *sl);
  95 sbd_status_t sbd_read_zfs_meta(sbd_lu_t *sl, uint8_t *buf, uint64_t sz,
  96     uint64_t off);
  97 sbd_status_t sbd_write_zfs_meta(sbd_lu_t *sl, uint8_t *buf, uint64_t sz,
  98     uint64_t off);
  99 sbd_status_t sbd_update_zfs_prop(sbd_lu_t *sl);
 100 int sbd_is_zvol(char *path);
 101 int sbd_zvolget(char *zvol_name, char **comstarprop);
 102 int sbd_zvolset(char *zvol_name, char *comstarprop);
 103 char sbd_ctoi(char c);
 104 void sbd_close_lu(sbd_lu_t *sl);
 105 
 106 static ldi_ident_t      sbd_zfs_ident;
 107 static stmf_lu_provider_t *sbd_lp;
 108 static sbd_lu_t         *sbd_lu_list = NULL;
 109 static kmutex_t         sbd_lock;
 110 static dev_info_t       *sbd_dip;
 111 static uint32_t         sbd_lu_count = 0;
 112 
 113 /* Global property settings for the logical unit */
 114 char sbd_vendor_id[]    = "SUN     ";
 115 char sbd_product_id[]   = "COMSTAR         ";
 116 char sbd_revision[]     = "1.0 ";
 117 char *sbd_mgmt_url = NULL;
 118 uint16_t sbd_mgmt_url_alloc_size = 0;
 119 krwlock_t sbd_global_prop_lock;
 120 
 121 static char sbd_name[] = "sbd";
 122 
 123 static struct cb_ops sbd_cb_ops = {
 124         sbd_open,                       /* open */
 125         sbd_close,                      /* close */
 126         nodev,                          /* strategy */
 127         nodev,                          /* print */
 128         nodev,                          /* dump */
 129         nodev,                          /* read */
 130         nodev,                          /* write */
 131         stmf_sbd_ioctl,                 /* ioctl */
 132         nodev,                          /* devmap */
 133         nodev,                          /* mmap */
 134         nodev,                          /* segmap */
 135         nochpoll,                       /* chpoll */
 136         ddi_prop_op,                    /* cb_prop_op */
 137         0,                              /* streamtab */
 138         D_NEW | D_MP,                   /* cb_flag */
 139         CB_REV,                         /* rev */
 140         nodev,                          /* aread */
 141         nodev                           /* awrite */
 142 };
 143 
 144 static struct dev_ops sbd_ops = {
 145         DEVO_REV,
 146         0,
 147         sbd_getinfo,
 148         nulldev,                /* identify */
 149         nulldev,                /* probe */
 150         sbd_attach,
 151         sbd_detach,
 152         nodev,                  /* reset */
 153         &sbd_cb_ops,
 154         NULL,                   /* bus_ops */
 155         NULL                    /* power */
 156 };
 157 
 158 #define SBD_NAME        "COMSTAR SBD"
 159 
 160 static struct modldrv modldrv = {
 161         &mod_driverops,
 162         SBD_NAME,
 163         &sbd_ops
 164 };
 165 
 166 static struct modlinkage modlinkage = {
 167         MODREV_1,
 168         &modldrv,
 169         NULL
 170 };
 171 
 172 int
 173 _init(void)
 174 {
 175         int ret;
 176 
 177         ret = mod_install(&modlinkage);
 178         if (ret)
 179                 return (ret);
 180         sbd_lp = (stmf_lu_provider_t *)stmf_alloc(STMF_STRUCT_LU_PROVIDER,
 181             0, 0);
 182         sbd_lp->lp_lpif_rev = LPIF_REV_2;
 183         sbd_lp->lp_instance = 0;
 184         sbd_lp->lp_name = sbd_name;
 185         sbd_lp->lp_cb = sbd_lp_cb;
 186         sbd_lp->lp_alua_support = 1;
 187         sbd_lp->lp_proxy_msg = sbd_proxy_msg;
 188         sbd_zfs_ident = ldi_ident_from_anon();
 189 
 190         if (stmf_register_lu_provider(sbd_lp) != STMF_SUCCESS) {
 191                 (void) mod_remove(&modlinkage);
 192                 stmf_free(sbd_lp);
 193                 return (EINVAL);
 194         }
 195         mutex_init(&sbd_lock, NULL, MUTEX_DRIVER, NULL);
 196         rw_init(&sbd_global_prop_lock, NULL, RW_DRIVER, NULL);
 197         return (0);
 198 }
 199 
 200 int
 201 _fini(void)
 202 {
 203         int ret;
 204 
 205         /*
 206          * If we have registered lus, then make sure they are all offline
 207          * if so then deregister them. This should drop the sbd_lu_count
 208          * to zero.
 209          */
 210         if (sbd_lu_count) {
 211                 sbd_lu_t *slu;
 212 
 213                 /* See if all of them are offline */
 214                 mutex_enter(&sbd_lock);
 215                 for (slu = sbd_lu_list; slu != NULL; slu = slu->sl_next) {
 216                         if ((slu->sl_state != STMF_STATE_OFFLINE) ||
 217                             slu->sl_state_not_acked) {
 218                                 mutex_exit(&sbd_lock);
 219                                 return (EBUSY);
 220                         }
 221                 }
 222                 mutex_exit(&sbd_lock);
 223 
 224 #if 0
 225                 /* ok start deregistering them */
 226                 while (sbd_lu_list) {
 227                         sbd_store_t *sst = sbd_lu_list->sl_sst;
 228                         if (sst->sst_deregister_lu(sst) != STMF_SUCCESS)
 229                                 return (EBUSY);
 230                 }
 231 #endif
 232                 return (EBUSY);
 233         }
 234         if (stmf_deregister_lu_provider(sbd_lp) != STMF_SUCCESS)
 235                 return (EBUSY);
 236         ret = mod_remove(&modlinkage);
 237         if (ret != 0) {
 238                 (void) stmf_register_lu_provider(sbd_lp);
 239                 return (ret);
 240         }
 241         stmf_free(sbd_lp);
 242         mutex_destroy(&sbd_lock);
 243         rw_destroy(&sbd_global_prop_lock);
 244         ldi_ident_release(sbd_zfs_ident);
 245         return (0);
 246 }
 247 
 248 int
 249 _info(struct modinfo *modinfop)
 250 {
 251         return (mod_info(&modlinkage, modinfop));
 252 }
 253 
 254 /* ARGSUSED */
 255 static int
 256 sbd_getinfo(dev_info_t *dip, ddi_info_cmd_t cmd, void *arg, void **result)
 257 {
 258         switch (cmd) {
 259         case DDI_INFO_DEVT2DEVINFO:
 260                 *result = sbd_dip;
 261                 break;
 262         case DDI_INFO_DEVT2INSTANCE:
 263                 *result = (void *)(uintptr_t)ddi_get_instance(sbd_dip);
 264                 break;
 265         default:
 266                 return (DDI_FAILURE);
 267         }
 268 
 269         return (DDI_SUCCESS);
 270 }
 271 
 272 static int
 273 sbd_attach(dev_info_t *dip, ddi_attach_cmd_t cmd)
 274 {
 275         switch (cmd) {
 276         case DDI_ATTACH:
 277                 sbd_dip = dip;
 278 
 279                 if (ddi_create_minor_node(dip, "admin", S_IFCHR, 0,
 280                     DDI_NT_STMF_LP, 0) != DDI_SUCCESS) {
 281                         break;
 282                 }
 283                 ddi_report_dev(dip);
 284                 return (DDI_SUCCESS);
 285         }
 286 
 287         return (DDI_FAILURE);
 288 }
 289 
 290 static int
 291 sbd_detach(dev_info_t *dip, ddi_detach_cmd_t cmd)
 292 {
 293         switch (cmd) {
 294         case DDI_DETACH:
 295                 ddi_remove_minor_node(dip, 0);
 296                 return (DDI_SUCCESS);
 297         }
 298 
 299         return (DDI_FAILURE);
 300 }
 301 
 302 /* ARGSUSED */
 303 static int
 304 sbd_open(dev_t *devp, int flag, int otype, cred_t *credp)
 305 {
 306         if (otype != OTYP_CHR)
 307                 return (EINVAL);
 308         return (0);
 309 }
 310 
 311 /* ARGSUSED */
 312 static int
 313 sbd_close(dev_t dev, int flag, int otype, cred_t *credp)
 314 {
 315         return (0);
 316 }
 317 
 318 /* ARGSUSED */
 319 static int
 320 stmf_sbd_ioctl(dev_t dev, int cmd, intptr_t data, int mode,
 321         cred_t *credp, int *rval)
 322 {
 323         stmf_iocdata_t          *iocd;
 324         void                    *ibuf   = NULL;
 325         void                    *obuf   = NULL;
 326         sbd_lu_t                *nsl;
 327         int                     i;
 328         int                     ret;
 329 
 330         if (drv_priv(credp) != 0) {
 331                 return (EPERM);
 332         }
 333 
 334         ret = stmf_copyin_iocdata(data, mode, &iocd, &ibuf, &obuf);
 335         if (ret)
 336                 return (ret);
 337         iocd->stmf_error = 0;
 338 
 339         switch (cmd) {
 340         case SBD_IOCTL_CREATE_AND_REGISTER_LU:
 341                 if (iocd->stmf_ibuf_size <
 342                     (sizeof (sbd_create_and_reg_lu_t) - 8)) {
 343                         ret = EFAULT;
 344                         break;
 345                 }
 346                 if ((iocd->stmf_obuf_size == 0) ||
 347                     (iocd->stmf_obuf_size > iocd->stmf_ibuf_size)) {
 348                         ret = EINVAL;
 349                         break;
 350                 }
 351                 ret = sbd_create_register_lu((sbd_create_and_reg_lu_t *)
 352                     ibuf, iocd->stmf_ibuf_size, &iocd->stmf_error);
 353                 bcopy(ibuf, obuf, iocd->stmf_obuf_size);
 354                 break;
 355         case SBD_IOCTL_SET_LU_STANDBY:
 356                 if (iocd->stmf_ibuf_size < sizeof (sbd_set_lu_standby_t)) {
 357                         ret = EFAULT;
 358                         break;
 359                 }
 360                 if (iocd->stmf_obuf_size) {
 361                         ret = EINVAL;
 362                         break;
 363                 }
 364                 ret = sbd_set_lu_standby((sbd_set_lu_standby_t *)ibuf,
 365                     &iocd->stmf_error);
 366                 break;
 367         case SBD_IOCTL_IMPORT_LU:
 368                 if (iocd->stmf_ibuf_size <
 369                     (sizeof (sbd_import_lu_t) - 8)) {
 370                         ret = EFAULT;
 371                         break;
 372                 }
 373                 if ((iocd->stmf_obuf_size == 0) ||
 374                     (iocd->stmf_obuf_size > iocd->stmf_ibuf_size)) {
 375                         ret = EINVAL;
 376                         break;
 377                 }
 378                 ret = sbd_import_lu((sbd_import_lu_t *)ibuf,
 379                     iocd->stmf_ibuf_size, &iocd->stmf_error, 0, NULL);
 380                 bcopy(ibuf, obuf, iocd->stmf_obuf_size);
 381                 break;
 382         case SBD_IOCTL_DELETE_LU:
 383                 if (iocd->stmf_ibuf_size < (sizeof (sbd_delete_lu_t) - 8)) {
 384                         ret = EFAULT;
 385                         break;
 386                 }
 387                 if (iocd->stmf_obuf_size) {
 388                         ret = EINVAL;
 389                         break;
 390                 }
 391                 ret = sbd_delete_lu((sbd_delete_lu_t *)ibuf,
 392                     iocd->stmf_ibuf_size, &iocd->stmf_error);
 393                 break;
 394         case SBD_IOCTL_MODIFY_LU:
 395                 if (iocd->stmf_ibuf_size < (sizeof (sbd_modify_lu_t) - 8)) {
 396                         ret = EFAULT;
 397                         break;
 398                 }
 399                 if (iocd->stmf_obuf_size) {
 400                         ret = EINVAL;
 401                         break;
 402                 }
 403                 ret = sbd_modify_lu((sbd_modify_lu_t *)ibuf,
 404                     iocd->stmf_ibuf_size, &iocd->stmf_error);
 405                 break;
 406         case SBD_IOCTL_SET_GLOBAL_LU:
 407                 if (iocd->stmf_ibuf_size < (sizeof (sbd_global_props_t) - 8)) {
 408                         ret = EFAULT;
 409                         break;
 410                 }
 411                 if (iocd->stmf_obuf_size) {
 412                         ret = EINVAL;
 413                         break;
 414                 }
 415                 ret = sbd_set_global_props((sbd_global_props_t *)ibuf,
 416                     iocd->stmf_ibuf_size, &iocd->stmf_error);
 417                 break;
 418         case SBD_IOCTL_GET_GLOBAL_LU:
 419                 if (iocd->stmf_ibuf_size) {
 420                         ret = EINVAL;
 421                         break;
 422                 }
 423                 if (iocd->stmf_obuf_size < sizeof (sbd_global_props_t)) {
 424                         ret = EINVAL;
 425                         break;
 426                 }
 427                 ret = sbd_get_global_props((sbd_global_props_t *)obuf,
 428                     iocd->stmf_obuf_size, &iocd->stmf_error);
 429                 break;
 430         case SBD_IOCTL_GET_LU_PROPS:
 431                 if (iocd->stmf_ibuf_size < (sizeof (sbd_lu_props_t) - 8)) {
 432                         ret = EFAULT;
 433                         break;
 434                 }
 435                 if (iocd->stmf_obuf_size < sizeof (sbd_lu_props_t)) {
 436                         ret = EINVAL;
 437                         break;
 438                 }
 439                 ret = sbd_get_lu_props((sbd_lu_props_t *)ibuf,
 440                     iocd->stmf_ibuf_size, (sbd_lu_props_t *)obuf,
 441                     iocd->stmf_obuf_size, &iocd->stmf_error);
 442                 break;
 443         case SBD_IOCTL_GET_LU_LIST:
 444                 mutex_enter(&sbd_lock);
 445                 iocd->stmf_obuf_max_nentries = sbd_lu_count;
 446                 iocd->stmf_obuf_nentries = min((iocd->stmf_obuf_size >> 4),
 447                     sbd_lu_count);
 448                 for (nsl = sbd_lu_list, i = 0; nsl &&
 449                     (i < iocd->stmf_obuf_nentries); i++, nsl = nsl->sl_next) {
 450                         bcopy(nsl->sl_device_id + 4,
 451                             &(((uint8_t *)obuf)[i << 4]), 16);
 452                 }
 453                 mutex_exit(&sbd_lock);
 454                 ret = 0;
 455                 iocd->stmf_error = 0;
 456                 break;
 457         case SBD_IOCTL_GET_UNMAP_PROPS:
 458                 if (iocd->stmf_ibuf_size < sizeof (sbd_unmap_props_t)) {
 459                         ret = EFAULT;
 460                         break;
 461                 }
 462                 if (iocd->stmf_obuf_size < sizeof (sbd_unmap_props_t)) {
 463                         ret = EINVAL;
 464                         break;
 465                 }
 466                 ret = sbd_get_unmap_props((sbd_unmap_props_t *)ibuf,
 467                     (sbd_unmap_props_t *)obuf, &iocd->stmf_error);
 468                 break;
 469         default:
 470                 ret = ENOTTY;
 471         }
 472 
 473         if (ret == 0) {
 474                 ret = stmf_copyout_iocdata(data, mode, iocd, obuf);
 475         } else if (iocd->stmf_error) {
 476                 (void) stmf_copyout_iocdata(data, mode, iocd, obuf);
 477         }
 478         if (obuf) {
 479                 kmem_free(obuf, iocd->stmf_obuf_size);
 480                 obuf = NULL;
 481         }
 482         if (ibuf) {
 483                 kmem_free(ibuf, iocd->stmf_ibuf_size);
 484                 ibuf = NULL;
 485         }
 486         kmem_free(iocd, sizeof (stmf_iocdata_t));
 487         return (ret);
 488 }
 489 
 490 /* ARGSUSED */
 491 void
 492 sbd_lp_cb(stmf_lu_provider_t *lp, int cmd, void *arg, uint32_t flags)
 493 {
 494         nvpair_t        *np;
 495         char            *s;
 496         sbd_import_lu_t *ilu;
 497         uint32_t        ilu_sz;
 498         uint32_t        struct_sz;
 499         uint32_t        err_ret;
 500         int             iret;
 501 
 502         if ((cmd != STMF_PROVIDER_DATA_UPDATED) || (arg == NULL)) {
 503                 return;
 504         }
 505 
 506         if ((flags & (STMF_PCB_STMF_ONLINING | STMF_PCB_PREG_COMPLETE)) == 0) {
 507                 return;
 508         }
 509 
 510         np = NULL;
 511         ilu_sz = 1024;
 512         ilu = (sbd_import_lu_t *)kmem_zalloc(ilu_sz, KM_SLEEP);
 513         while ((np = nvlist_next_nvpair((nvlist_t *)arg, np)) != NULL) {
 514                 if (nvpair_type(np) != DATA_TYPE_STRING) {
 515                         continue;
 516                 }
 517                 if (nvpair_value_string(np, &s) != 0) {
 518                         continue;
 519                 }
 520                 struct_sz = max(8, strlen(s) + 1);
 521                 struct_sz += sizeof (sbd_import_lu_t) - 8;
 522                 if (struct_sz > ilu_sz) {
 523                         kmem_free(ilu, ilu_sz);
 524                         ilu_sz = struct_sz + 32;
 525                         ilu = (sbd_import_lu_t *)kmem_zalloc(ilu_sz, KM_SLEEP);
 526                 }
 527                 ilu->ilu_struct_size = struct_sz;
 528                 (void) strcpy(ilu->ilu_meta_fname, s);
 529                 iret = sbd_import_lu(ilu, struct_sz, &err_ret, 0, NULL);
 530                 if (iret) {
 531                         stmf_trace(0, "sbd_lp_cb: import_lu failed, ret = %d, "
 532                             "err_ret = %d", iret, err_ret);
 533                 } else {
 534                         stmf_trace(0, "Imported the LU %s", nvpair_name(np));
 535                 }
 536         }
 537 
 538         if (ilu) {
 539                 kmem_free(ilu, ilu_sz);
 540                 ilu = NULL;
 541         }
 542 }
 543 
 544 sbd_status_t
 545 sbd_link_lu(sbd_lu_t *sl)
 546 {
 547         sbd_lu_t *nsl;
 548 
 549         mutex_enter(&sbd_lock);
 550         mutex_enter(&sl->sl_lock);
 551         ASSERT(sl->sl_trans_op != SL_OP_NONE);
 552 
 553         if (sl->sl_flags & SL_LINKED) {
 554                 mutex_exit(&sbd_lock);
 555                 mutex_exit(&sl->sl_lock);
 556                 return (SBD_ALREADY);
 557         }
 558         for (nsl = sbd_lu_list; nsl; nsl = nsl->sl_next) {
 559                 if (strcmp(nsl->sl_name, sl->sl_name) == 0)
 560                         break;
 561         }
 562         if (nsl) {
 563                 mutex_exit(&sbd_lock);
 564                 mutex_exit(&sl->sl_lock);
 565                 return (SBD_ALREADY);
 566         }
 567         sl->sl_next = sbd_lu_list;
 568         sbd_lu_list = sl;
 569         sl->sl_flags |= SL_LINKED;
 570         mutex_exit(&sbd_lock);
 571         mutex_exit(&sl->sl_lock);
 572         return (SBD_SUCCESS);
 573 }
 574 
 575 void
 576 sbd_unlink_lu(sbd_lu_t *sl)
 577 {
 578         sbd_lu_t **ppnsl;
 579 
 580         mutex_enter(&sbd_lock);
 581         mutex_enter(&sl->sl_lock);
 582         ASSERT(sl->sl_trans_op != SL_OP_NONE);
 583 
 584         ASSERT(sl->sl_flags & SL_LINKED);
 585         for (ppnsl = &sbd_lu_list; *ppnsl; ppnsl = &((*ppnsl)->sl_next)) {
 586                 if (*ppnsl == sl)
 587                         break;
 588         }
 589         ASSERT(*ppnsl);
 590         *ppnsl = (*ppnsl)->sl_next;
 591         sl->sl_flags &= ~SL_LINKED;
 592         mutex_exit(&sbd_lock);
 593         mutex_exit(&sl->sl_lock);
 594 }
 595 
 596 sbd_status_t
 597 sbd_find_and_lock_lu(uint8_t *guid, uint8_t *meta_name, uint8_t op,
 598     sbd_lu_t **ppsl)
 599 {
 600         sbd_lu_t *sl;
 601         int found = 0;
 602         sbd_status_t sret;
 603 
 604         mutex_enter(&sbd_lock);
 605         for (sl = sbd_lu_list; sl; sl = sl->sl_next) {
 606                 if (guid) {
 607                         found = bcmp(sl->sl_device_id + 4, guid, 16) == 0;
 608                 } else {
 609                         found = strcmp(sl->sl_name, (char *)meta_name) == 0;
 610                 }
 611                 if (found)
 612                         break;
 613         }
 614         if (!found) {
 615                 mutex_exit(&sbd_lock);
 616                 return (SBD_NOT_FOUND);
 617         }
 618         mutex_enter(&sl->sl_lock);
 619         if (sl->sl_trans_op == SL_OP_NONE) {
 620                 sl->sl_trans_op = op;
 621                 *ppsl = sl;
 622                 sret = SBD_SUCCESS;
 623         } else {
 624                 sret = SBD_BUSY;
 625         }
 626         mutex_exit(&sl->sl_lock);
 627         mutex_exit(&sbd_lock);
 628         return (sret);
 629 }
 630 
 631 sbd_status_t
 632 sbd_read_meta(sbd_lu_t *sl, uint64_t offset, uint64_t size, uint8_t *buf)
 633 {
 634         uint64_t        meta_align;
 635         uint64_t        starting_off;
 636         uint64_t        data_off;
 637         uint64_t        ending_off;
 638         uint64_t        io_size;
 639         uint8_t         *io_buf;
 640         vnode_t         *vp;
 641         sbd_status_t    ret;
 642         ssize_t         resid;
 643         int             vret;
 644 
 645         ASSERT(sl->sl_flags & SL_META_OPENED);
 646         if (sl->sl_flags & SL_SHARED_META) {
 647                 meta_align = (((uint64_t)1) << sl->sl_data_blocksize_shift) - 1;
 648                 vp = sl->sl_data_vp;
 649                 ASSERT(vp);
 650         } else {
 651                 meta_align = (((uint64_t)1) << sl->sl_meta_blocksize_shift) - 1;
 652                 if ((sl->sl_flags & SL_ZFS_META) == 0) {
 653                         vp = sl->sl_meta_vp;
 654                         ASSERT(vp);
 655                 }
 656         }
 657         starting_off = offset & ~(meta_align);
 658         data_off = offset & meta_align;
 659         ending_off = (offset + size + meta_align) & (~meta_align);
 660         if (ending_off > sl->sl_meta_size_used) {
 661                 bzero(buf, size);
 662                 if (starting_off >= sl->sl_meta_size_used) {
 663                         return (SBD_SUCCESS);
 664                 }
 665                 ending_off = (sl->sl_meta_size_used + meta_align) &
 666                     (~meta_align);
 667                 if (size > (ending_off - (starting_off + data_off))) {
 668                         size = ending_off - (starting_off + data_off);
 669                 }
 670         }
 671         io_size = ending_off - starting_off;
 672         io_buf = (uint8_t *)kmem_zalloc(io_size, KM_SLEEP);
 673         ASSERT((starting_off + io_size) <= sl->sl_total_meta_size);
 674 
 675         /*
 676          * Don't proceed if the device has been closed
 677          * This can occur on an access state change to standby or
 678          * a delete. The writer lock is acquired before closing the
 679          * lu. If importing, reading the metadata is valid, hence
 680          * the check on SL_OP_IMPORT_LU.
 681          */
 682         rw_enter(&sl->sl_access_state_lock, RW_READER);
 683         if ((sl->sl_flags & SL_MEDIA_LOADED) == 0 &&
 684             sl->sl_trans_op != SL_OP_IMPORT_LU) {
 685                 rw_exit(&sl->sl_access_state_lock);
 686                 ret = SBD_FILEIO_FAILURE;
 687                 goto sbd_read_meta_failure;
 688         }
 689         if (sl->sl_flags & SL_ZFS_META) {
 690                 if ((ret = sbd_read_zfs_meta(sl, io_buf, io_size,
 691                     starting_off)) != SBD_SUCCESS) {
 692                         rw_exit(&sl->sl_access_state_lock);
 693                         goto sbd_read_meta_failure;
 694                 }
 695         } else {
 696                 vret = vn_rdwr(UIO_READ, vp, (caddr_t)io_buf, (ssize_t)io_size,
 697                     (offset_t)starting_off, UIO_SYSSPACE, FRSYNC,
 698                     RLIM64_INFINITY, CRED(), &resid);
 699 
 700                 if (vret || resid) {
 701                         ret = SBD_FILEIO_FAILURE | vret;
 702                         rw_exit(&sl->sl_access_state_lock);
 703                         goto sbd_read_meta_failure;
 704                 }
 705         }
 706         rw_exit(&sl->sl_access_state_lock);
 707 
 708         bcopy(io_buf + data_off, buf, size);
 709         ret = SBD_SUCCESS;
 710 
 711 sbd_read_meta_failure:
 712         kmem_free(io_buf, io_size);
 713         return (ret);
 714 }
 715 
 716 sbd_status_t
 717 sbd_write_meta(sbd_lu_t *sl, uint64_t offset, uint64_t size, uint8_t *buf)
 718 {
 719         uint64_t        meta_align;
 720         uint64_t        starting_off;
 721         uint64_t        data_off;
 722         uint64_t        ending_off;
 723         uint64_t        io_size;
 724         uint8_t         *io_buf;
 725         vnode_t         *vp;
 726         sbd_status_t    ret;
 727         ssize_t         resid;
 728         int             vret;
 729 
 730         ASSERT(sl->sl_flags & SL_META_OPENED);
 731         if (sl->sl_flags & SL_SHARED_META) {
 732                 meta_align = (((uint64_t)1) << sl->sl_data_blocksize_shift) - 1;
 733                 vp = sl->sl_data_vp;
 734                 ASSERT(vp);
 735         } else {
 736                 meta_align = (((uint64_t)1) << sl->sl_meta_blocksize_shift) - 1;
 737                 if ((sl->sl_flags & SL_ZFS_META) == 0) {
 738                         vp = sl->sl_meta_vp;
 739                         ASSERT(vp);
 740                 }
 741         }
 742         starting_off = offset & ~(meta_align);
 743         data_off = offset & meta_align;
 744         ending_off = (offset + size + meta_align) & (~meta_align);
 745         io_size = ending_off - starting_off;
 746         io_buf = (uint8_t *)kmem_zalloc(io_size, KM_SLEEP);
 747         ret = sbd_read_meta(sl, starting_off, io_size, io_buf);
 748         if (ret != SBD_SUCCESS) {
 749                 goto sbd_write_meta_failure;
 750         }
 751         bcopy(buf, io_buf + data_off, size);
 752         /*
 753          * Don't proceed if the device has been closed
 754          * This can occur on an access state change to standby or
 755          * a delete. The writer lock is acquired before closing the
 756          * lu. If importing, reading the metadata is valid, hence
 757          * the check on SL_OP_IMPORT_LU.
 758          */
 759         rw_enter(&sl->sl_access_state_lock, RW_READER);
 760         if ((sl->sl_flags & SL_MEDIA_LOADED) == 0 &&
 761             sl->sl_trans_op != SL_OP_IMPORT_LU) {
 762                 rw_exit(&sl->sl_access_state_lock);
 763                 ret = SBD_FILEIO_FAILURE;
 764                 goto sbd_write_meta_failure;
 765         }
 766         if (sl->sl_flags & SL_ZFS_META) {
 767                 if ((ret = sbd_write_zfs_meta(sl, io_buf, io_size,
 768                     starting_off)) != SBD_SUCCESS) {
 769                         rw_exit(&sl->sl_access_state_lock);
 770                         goto sbd_write_meta_failure;
 771                 }
 772         } else {
 773                 vret = vn_rdwr(UIO_WRITE, vp, (caddr_t)io_buf, (ssize_t)io_size,
 774                     (offset_t)starting_off, UIO_SYSSPACE, FDSYNC,
 775                     RLIM64_INFINITY, CRED(), &resid);
 776 
 777                 if (vret || resid) {
 778                         ret = SBD_FILEIO_FAILURE | vret;
 779                         rw_exit(&sl->sl_access_state_lock);
 780                         goto sbd_write_meta_failure;
 781                 }
 782         }
 783         rw_exit(&sl->sl_access_state_lock);
 784 
 785         ret = SBD_SUCCESS;
 786 
 787 sbd_write_meta_failure:
 788         kmem_free(io_buf, io_size);
 789         return (ret);
 790 }
 791 
 792 uint8_t
 793 sbd_calc_sum(uint8_t *buf, int size)
 794 {
 795         uint8_t s = 0;
 796 
 797         while (size > 0)
 798                 s += buf[--size];
 799 
 800         return (s);
 801 }
 802 
 803 uint8_t
 804 sbd_calc_section_sum(sm_section_hdr_t *sm, uint32_t sz)
 805 {
 806         uint8_t s, o;
 807 
 808         o = sm->sms_chksum;
 809         sm->sms_chksum = 0;
 810         s = sbd_calc_sum((uint8_t *)sm, sz);
 811         sm->sms_chksum = o;
 812 
 813         return (s);
 814 }
 815 
 816 uint32_t
 817 sbd_strlen(char *str, uint32_t maxlen)
 818 {
 819         uint32_t i;
 820 
 821         for (i = 0; i < maxlen; i++) {
 822                 if (str[i] == 0)
 823                         return (i);
 824         }
 825         return (i);
 826 }
 827 
 828 void
 829 sbd_swap_meta_start(sbd_meta_start_t *sm)
 830 {
 831         if (sm->sm_magic == SBD_MAGIC)
 832                 return;
 833         sm->sm_magic         = BSWAP_64(sm->sm_magic);
 834         sm->sm_meta_size     = BSWAP_64(sm->sm_meta_size);
 835         sm->sm_meta_size_used        = BSWAP_64(sm->sm_meta_size_used);
 836         sm->sm_ver_major     = BSWAP_16(sm->sm_ver_major);
 837         sm->sm_ver_minor     = BSWAP_16(sm->sm_ver_minor);
 838         sm->sm_ver_subminor  = BSWAP_16(sm->sm_ver_subminor);
 839 }
 840 
 841 void
 842 sbd_swap_section_hdr(sm_section_hdr_t *sm)
 843 {
 844         if (sm->sms_data_order == SMS_DATA_ORDER)
 845                 return;
 846         sm->sms_offset               = BSWAP_64(sm->sms_offset);
 847         sm->sms_size         = BSWAP_32(sm->sms_size);
 848         sm->sms_id           = BSWAP_16(sm->sms_id);
 849         sm->sms_chksum               += SMS_DATA_ORDER - sm->sms_data_order;
 850         sm->sms_data_order   = SMS_DATA_ORDER;
 851 }
 852 
 853 void
 854 sbd_swap_lu_info_1_0(sbd_lu_info_1_0_t *sli)
 855 {
 856         sbd_swap_section_hdr(&sli->sli_sms_header);
 857         if (sli->sli_data_order == SMS_DATA_ORDER)
 858                 return;
 859         sli->sli_sms_header.sms_chksum       += SMS_DATA_ORDER - sli->sli_data_order;
 860         sli->sli_data_order          = SMS_DATA_ORDER;
 861         sli->sli_total_store_size    = BSWAP_64(sli->sli_total_store_size);
 862         sli->sli_total_meta_size     = BSWAP_64(sli->sli_total_meta_size);
 863         sli->sli_lu_data_offset              = BSWAP_64(sli->sli_lu_data_offset);
 864         sli->sli_lu_data_size                = BSWAP_64(sli->sli_lu_data_size);
 865         sli->sli_flags                       = BSWAP_32(sli->sli_flags);
 866         sli->sli_blocksize           = BSWAP_16(sli->sli_blocksize);
 867 }
 868 
 869 void
 870 sbd_swap_lu_info_1_1(sbd_lu_info_1_1_t *sli)
 871 {
 872         sbd_swap_section_hdr(&sli->sli_sms_header);
 873         if (sli->sli_data_order == SMS_DATA_ORDER)
 874                 return;
 875         sli->sli_sms_header.sms_chksum       += SMS_DATA_ORDER - sli->sli_data_order;
 876         sli->sli_data_order          = SMS_DATA_ORDER;
 877         sli->sli_flags                       = BSWAP_32(sli->sli_flags);
 878         sli->sli_lu_size             = BSWAP_64(sli->sli_lu_size);
 879         sli->sli_meta_fname_offset   = BSWAP_64(sli->sli_meta_fname_offset);
 880         sli->sli_data_fname_offset   = BSWAP_64(sli->sli_data_fname_offset);
 881         sli->sli_serial_offset               = BSWAP_64(sli->sli_serial_offset);
 882         sli->sli_alias_offset                = BSWAP_64(sli->sli_alias_offset);
 883         sli->sli_mgmt_url_offset     = BSWAP_64(sli->sli_mgmt_url_offset);
 884 }
 885 
 886 sbd_status_t
 887 sbd_load_section_hdr(sbd_lu_t *sl, sm_section_hdr_t *sms)
 888 {
 889         sm_section_hdr_t        h;
 890         uint64_t                st;
 891         sbd_status_t            ret;
 892 
 893         for (st = sl->sl_meta_offset + sizeof (sbd_meta_start_t);
 894             st < sl->sl_meta_size_used; st += h.sms_size) {
 895                 if ((ret = sbd_read_meta(sl, st, sizeof (sm_section_hdr_t),
 896                     (uint8_t *)&h)) != SBD_SUCCESS) {
 897                         return (ret);
 898                 }
 899                 if (h.sms_data_order != SMS_DATA_ORDER) {
 900                         sbd_swap_section_hdr(&h);
 901                 }
 902                 if ((h.sms_data_order != SMS_DATA_ORDER) ||
 903                     (h.sms_offset != st) || (h.sms_size < sizeof (h)) ||
 904                     ((st + h.sms_size) > sl->sl_meta_size_used)) {
 905                         return (SBD_META_CORRUPTED);
 906                 }
 907                 if (h.sms_id == sms->sms_id) {
 908                         bcopy(&h, sms, sizeof (h));
 909                         return (SBD_SUCCESS);
 910                 }
 911         }
 912 
 913         return (SBD_NOT_FOUND);
 914 }
 915 
 916 sbd_status_t
 917 sbd_load_meta_start(sbd_lu_t *sl)
 918 {
 919         sbd_meta_start_t *sm;
 920         sbd_status_t ret;
 921 
 922         /* Fake meta params initially */
 923         sl->sl_total_meta_size = (uint64_t)-1;
 924         sl->sl_meta_size_used = sl->sl_meta_offset + sizeof (sbd_meta_start_t);
 925 
 926         sm = kmem_zalloc(sizeof (*sm), KM_SLEEP);
 927         ret = sbd_read_meta(sl, sl->sl_meta_offset, sizeof (*sm),
 928             (uint8_t *)sm);
 929         if (ret != SBD_SUCCESS) {
 930                 goto load_meta_start_failed;
 931         }
 932 
 933         if (sm->sm_magic != SBD_MAGIC) {
 934                 sbd_swap_meta_start(sm);
 935         }
 936 
 937         if ((sm->sm_magic != SBD_MAGIC) || (sbd_calc_sum((uint8_t *)sm,
 938             sizeof (*sm) - 1) != sm->sm_chksum)) {
 939                 ret = SBD_META_CORRUPTED;
 940                 goto load_meta_start_failed;
 941         }
 942 
 943         if (sm->sm_ver_major != SBD_VER_MAJOR) {
 944                 ret = SBD_NOT_SUPPORTED;
 945                 goto load_meta_start_failed;
 946         }
 947 
 948         sl->sl_total_meta_size = sm->sm_meta_size;
 949         sl->sl_meta_size_used = sm->sm_meta_size_used;
 950         ret = SBD_SUCCESS;
 951 
 952 load_meta_start_failed:
 953         kmem_free(sm, sizeof (*sm));
 954         return (ret);
 955 }
 956 
 957 sbd_status_t
 958 sbd_write_meta_start(sbd_lu_t *sl, uint64_t meta_size, uint64_t meta_size_used)
 959 {
 960         sbd_meta_start_t *sm;
 961         sbd_status_t ret;
 962 
 963         sm = (sbd_meta_start_t *)kmem_zalloc(sizeof (sbd_meta_start_t),
 964             KM_SLEEP);
 965 
 966         sm->sm_magic = SBD_MAGIC;
 967         sm->sm_meta_size = meta_size;
 968         sm->sm_meta_size_used = meta_size_used;
 969         sm->sm_ver_major = SBD_VER_MAJOR;
 970         sm->sm_ver_minor = SBD_VER_MINOR;
 971         sm->sm_ver_subminor = SBD_VER_SUBMINOR;
 972         sm->sm_chksum = sbd_calc_sum((uint8_t *)sm, sizeof (*sm) - 1);
 973 
 974         ret = sbd_write_meta(sl, sl->sl_meta_offset, sizeof (*sm),
 975             (uint8_t *)sm);
 976         kmem_free(sm, sizeof (*sm));
 977 
 978         return (ret);
 979 }
 980 
 981 sbd_status_t
 982 sbd_read_meta_section(sbd_lu_t *sl, sm_section_hdr_t **ppsms, uint16_t sms_id)
 983 {
 984         sbd_status_t ret;
 985         sm_section_hdr_t sms;
 986         int alloced = 0;
 987 
 988         mutex_enter(&sl->sl_metadata_lock);
 989         if (((*ppsms) == NULL) || ((*ppsms)->sms_offset == 0)) {
 990                 bzero(&sms, sizeof (sm_section_hdr_t));
 991                 sms.sms_id = sms_id;
 992                 if ((ret = sbd_load_section_hdr(sl, &sms)) != SBD_SUCCESS) {
 993                         mutex_exit(&sl->sl_metadata_lock);
 994                         return (ret);
 995                 } else {
 996                         if ((*ppsms) == NULL) {
 997                                 *ppsms = (sm_section_hdr_t *)kmem_zalloc(
 998                                     sms.sms_size, KM_SLEEP);
 999                                 alloced = 1;
1000                         }
1001                         bcopy(&sms, *ppsms, sizeof (sm_section_hdr_t));
1002                 }
1003         }
1004 
1005         ret = sbd_read_meta(sl, (*ppsms)->sms_offset, (*ppsms)->sms_size,
1006             (uint8_t *)(*ppsms));
1007         if (ret == SBD_SUCCESS) {
1008                 uint8_t s;
1009                 if ((*ppsms)->sms_data_order != SMS_DATA_ORDER)
1010                         sbd_swap_section_hdr(*ppsms);
1011                 if ((*ppsms)->sms_id != SMS_ID_UNUSED) {
1012                         s = sbd_calc_section_sum(*ppsms, (*ppsms)->sms_size);
1013                         if (s != (*ppsms)->sms_chksum)
1014                                 ret = SBD_META_CORRUPTED;
1015                 }
1016         }
1017         mutex_exit(&sl->sl_metadata_lock);
1018 
1019         if ((ret != SBD_SUCCESS) && alloced)
1020                 kmem_free(*ppsms, sms.sms_size);
1021         return (ret);
1022 }
1023 
1024 sbd_status_t
1025 sbd_load_section_hdr_unbuffered(sbd_lu_t *sl, sm_section_hdr_t *sms)
1026 {
1027         sbd_status_t    ret;
1028 
1029         /*
1030          * Bypass buffering and re-read the meta data from permanent storage.
1031          */
1032         if (sl->sl_flags & SL_ZFS_META) {
1033                 if ((ret = sbd_open_zfs_meta(sl)) != SBD_SUCCESS) {
1034                         return (ret);
1035                 }
1036         }
1037         /* Re-get the meta sizes into sl */
1038         if ((ret = sbd_load_meta_start(sl)) != SBD_SUCCESS) {
1039                 return (ret);
1040         }
1041         return (sbd_load_section_hdr(sl, sms));
1042 }
1043 
1044 sbd_status_t
1045 sbd_write_meta_section(sbd_lu_t *sl, sm_section_hdr_t *sms)
1046 {
1047         sm_section_hdr_t t;
1048         uint64_t off, s;
1049         uint64_t unused_start;
1050         sbd_status_t ret;
1051         sbd_status_t write_meta_ret = SBD_SUCCESS;
1052         uint8_t *cb;
1053         int meta_size_changed = 0;
1054         sm_section_hdr_t sms_before_unused = {0};
1055 
1056         mutex_enter(&sl->sl_metadata_lock);
1057 write_meta_section_again:
1058         if (sms->sms_offset) {
1059                 /*
1060                  * If the section already exists and the size is the
1061                  * same as this new data then overwrite in place. If
1062                  * the sizes are different then mark the existing as
1063                  * unused and look for free space.
1064                  */
1065                 ret = sbd_read_meta(sl, sms->sms_offset, sizeof (t),
1066                     (uint8_t *)&t);
1067                 if (ret != SBD_SUCCESS) {
1068                         mutex_exit(&sl->sl_metadata_lock);
1069                         return (ret);
1070                 }
1071                 if (t.sms_data_order != SMS_DATA_ORDER) {
1072                         sbd_swap_section_hdr(&t);
1073                 }
1074                 if (t.sms_id != sms->sms_id) {
1075                         mutex_exit(&sl->sl_metadata_lock);
1076                         return (SBD_INVALID_ARG);
1077                 }
1078                 if (t.sms_size == sms->sms_size) {
1079                         ret = sbd_write_meta(sl, sms->sms_offset,
1080                             sms->sms_size, (uint8_t *)sms);
1081                         mutex_exit(&sl->sl_metadata_lock);
1082                         return (ret);
1083                 }
1084                 sms_before_unused = t;
1085 
1086                 t.sms_id = SMS_ID_UNUSED;
1087                 /*
1088                  * For unused sections we only use chksum of the header. for
1089                  * all other sections, the chksum is for the entire section.
1090                  */
1091                 t.sms_chksum = sbd_calc_section_sum(&t, sizeof (t));
1092                 ret = sbd_write_meta(sl, t.sms_offset, sizeof (t),
1093                     (uint8_t *)&t);
1094                 if (ret != SBD_SUCCESS) {
1095                         mutex_exit(&sl->sl_metadata_lock);
1096                         return (ret);
1097                 }
1098                 sms->sms_offset = 0;
1099         } else {
1100                 /* Section location is unknown, search for it. */
1101                 t.sms_id = sms->sms_id;
1102                 t.sms_data_order = SMS_DATA_ORDER;
1103                 ret = sbd_load_section_hdr(sl, &t);
1104                 if (ret == SBD_SUCCESS) {
1105                         sms->sms_offset = t.sms_offset;
1106                         sms->sms_chksum =
1107                             sbd_calc_section_sum(sms, sms->sms_size);
1108                         goto write_meta_section_again;
1109                 } else if (ret != SBD_NOT_FOUND) {
1110                         mutex_exit(&sl->sl_metadata_lock);
1111                         return (ret);
1112                 }
1113         }
1114 
1115         /*
1116          * At this point we know that section does not already exist.
1117          * Find space large enough to hold the section or grow meta if
1118          * possible.
1119          */
1120         unused_start = 0;
1121         s = 0;  /* size of space found */
1122 
1123         /*
1124          * Search all sections for unused space of sufficient size.
1125          * The first one found is taken. Contiguous unused sections
1126          * will be combined.
1127          */
1128         for (off = sl->sl_meta_offset + sizeof (sbd_meta_start_t);
1129             off < sl->sl_meta_size_used; off += t.sms_size) {
1130                 ret = sbd_read_meta(sl, off, sizeof (t), (uint8_t *)&t);
1131                 if (ret != SBD_SUCCESS) {
1132                         mutex_exit(&sl->sl_metadata_lock);
1133                         return (ret);
1134                 }
1135                 if (t.sms_data_order != SMS_DATA_ORDER)
1136                         sbd_swap_section_hdr(&t);
1137                 if (t.sms_size == 0) {
1138                         mutex_exit(&sl->sl_metadata_lock);
1139                         return (SBD_META_CORRUPTED);
1140                 }
1141                 if (t.sms_id == SMS_ID_UNUSED) {
1142                         if (unused_start == 0)
1143                                 unused_start = off;
1144                         /*
1145                          * Calculate size of the unused space, break out
1146                          * if it satisfies the requirement.
1147                          */
1148                         s = t.sms_size - unused_start + off;
1149                         if ((s == sms->sms_size) || (s >= (sms->sms_size +
1150                             sizeof (t)))) {
1151                                 break;
1152                         } else {
1153                                 s = 0;
1154                         }
1155                 } else {
1156                         unused_start = 0;
1157                 }
1158         }
1159 
1160         off = (unused_start == 0) ? sl->sl_meta_size_used : unused_start;
1161         /*
1162          * If none found, how much room is at the end?
1163          * See if the data can be expanded.
1164          */
1165         if (s == 0) {
1166                 s = sl->sl_total_meta_size - off;
1167                 if (s >= sms->sms_size || !(sl->sl_flags & SL_SHARED_META)) {
1168                         s = sms->sms_size;
1169                         meta_size_changed = 1;
1170                 } else {
1171                         s = 0;
1172                 }
1173         }
1174 
1175         if (s == 0) {
1176                 mutex_exit(&sl->sl_metadata_lock);
1177                 return (SBD_ALLOC_FAILURE);
1178         }
1179 
1180         sms->sms_offset = off;
1181         sms->sms_chksum = sbd_calc_section_sum(sms, sms->sms_size);
1182         /*
1183          * Since we may have to write more than one section (current +
1184          * any unused), use a combined buffer.
1185          */
1186         cb = kmem_zalloc(s, KM_SLEEP);
1187         bcopy(sms, cb, sms->sms_size);
1188         if (s > sms->sms_size) {
1189                 t.sms_offset = off + sms->sms_size;
1190                 t.sms_size = s - sms->sms_size;
1191                 t.sms_id = SMS_ID_UNUSED;
1192                 t.sms_data_order = SMS_DATA_ORDER;
1193                 t.sms_chksum = sbd_calc_section_sum(&t, sizeof (t));
1194                 bcopy(&t, cb + sms->sms_size, sizeof (t));
1195         }
1196         /*
1197          * Two write events & statuses take place. Failure writing the
1198          * meta section takes precedence, can possibly be rolled back,
1199          * & gets reported. Else return status from writing the meta start.
1200          */
1201         ret = SBD_SUCCESS; /* Set a default, it's not always loaded below. */
1202         if (meta_size_changed) {
1203                 uint64_t old_meta_size;
1204                 uint64_t old_sz_used = sl->sl_meta_size_used; /* save a copy */
1205                 old_meta_size = sl->sl_total_meta_size; /* save a copy */
1206 
1207                 write_meta_ret = sbd_write_meta(sl, off, s, cb);
1208                 if (write_meta_ret == SBD_SUCCESS) {
1209                         sl->sl_meta_size_used = off + s;
1210                         if (sl->sl_total_meta_size < sl->sl_meta_size_used) {
1211                                 uint64_t meta_align =
1212                                     (((uint64_t)1) <<
1213                                     sl->sl_meta_blocksize_shift) - 1;
1214                                 sl->sl_total_meta_size =
1215                                     (sl->sl_meta_size_used + meta_align) &
1216                                     (~meta_align);
1217                         }
1218                         ret = sbd_write_meta_start(sl, sl->sl_total_meta_size,
1219                             sl->sl_meta_size_used);
1220                         if (ret != SBD_SUCCESS) {
1221                                 sl->sl_meta_size_used = old_sz_used;
1222                                 sl->sl_total_meta_size = old_meta_size;
1223                         }
1224                 } else {
1225                         sl->sl_meta_size_used = old_sz_used;
1226                         sl->sl_total_meta_size = old_meta_size;
1227                 }
1228         } else {
1229                 write_meta_ret = sbd_write_meta(sl, off, s, cb);
1230         }
1231         if ((write_meta_ret != SBD_SUCCESS) &&
1232             (sms_before_unused.sms_offset != 0)) {
1233                 sm_section_hdr_t new_sms;
1234                 sm_section_hdr_t *unused_sms;
1235                 /*
1236                  * On failure writing the meta section attempt to undo
1237                  * the change to unused.
1238                  * Re-read the meta data from permanent storage.
1239                  * The section id can't exist for undo to be possible.
1240                  * Read what should be the entire old section data and
1241                  * insure the old data's still present by validating
1242                  * against it's old checksum.
1243                  */
1244                 new_sms.sms_id = sms->sms_id;
1245                 new_sms.sms_data_order = SMS_DATA_ORDER;
1246                 if (sbd_load_section_hdr_unbuffered(sl, &new_sms) !=
1247                     SBD_NOT_FOUND) {
1248                         goto done;
1249                 }
1250                 unused_sms = kmem_zalloc(sms_before_unused.sms_size, KM_SLEEP);
1251                 if (sbd_read_meta(sl, sms_before_unused.sms_offset,
1252                     sms_before_unused.sms_size,
1253                     (uint8_t *)unused_sms) != SBD_SUCCESS) {
1254                         goto done;
1255                 }
1256                 if (unused_sms->sms_data_order != SMS_DATA_ORDER) {
1257                         sbd_swap_section_hdr(unused_sms);
1258                 }
1259                 if (unused_sms->sms_id != SMS_ID_UNUSED) {
1260                         goto done;
1261                 }
1262                 if (unused_sms->sms_offset != sms_before_unused.sms_offset) {
1263                         goto done;
1264                 }
1265                 if (unused_sms->sms_size != sms_before_unused.sms_size) {
1266                         goto done;
1267                 }
1268                 unused_sms->sms_id = sms_before_unused.sms_id;
1269                 if (sbd_calc_section_sum(unused_sms,
1270                     sizeof (sm_section_hdr_t)) !=
1271                     sbd_calc_section_sum(&sms_before_unused,
1272                     sizeof (sm_section_hdr_t))) {
1273                         goto done;
1274                 }
1275                 unused_sms->sms_chksum =
1276                     sbd_calc_section_sum(unused_sms, unused_sms->sms_size);
1277                 if (unused_sms->sms_chksum != sms_before_unused.sms_chksum) {
1278                         goto done;
1279                 }
1280                 (void) sbd_write_meta(sl, unused_sms->sms_offset,
1281                     sizeof (sm_section_hdr_t), (uint8_t *)unused_sms);
1282         }
1283 done:
1284         mutex_exit(&sl->sl_metadata_lock);
1285         kmem_free(cb, s);
1286         if (write_meta_ret != SBD_SUCCESS) {
1287                 return (write_meta_ret);
1288         }
1289         return (ret);
1290 }
1291 
1292 sbd_status_t
1293 sbd_write_lu_info(sbd_lu_t *sl)
1294 {
1295         sbd_lu_info_1_1_t *sli;
1296         int s;
1297         uint8_t *p;
1298         char *zvol_name = NULL;
1299         sbd_status_t ret;
1300 
1301         mutex_enter(&sl->sl_lock);
1302 
1303         s = sl->sl_serial_no_size;
1304         if ((sl->sl_flags & (SL_SHARED_META | SL_ZFS_META)) == 0) {
1305                 if (sl->sl_data_filename) {
1306                         s += strlen(sl->sl_data_filename) + 1;
1307                 }
1308         }
1309         if (sl->sl_flags & SL_ZFS_META) {
1310                 zvol_name = sbd_get_zvol_name(sl);
1311                 s += strlen(zvol_name) + 1;
1312         }
1313         if (sl->sl_alias) {
1314                 s += strlen(sl->sl_alias) + 1;
1315         }
1316         if (sl->sl_mgmt_url) {
1317                 s += strlen(sl->sl_mgmt_url) + 1;
1318         }
1319         sli = (sbd_lu_info_1_1_t *)kmem_zalloc(sizeof (*sli) + s, KM_SLEEP);
1320         p = sli->sli_buf;
1321         if ((sl->sl_flags & (SL_SHARED_META | SL_ZFS_META)) == 0) {
1322                 sli->sli_flags |= SLI_SEPARATE_META;
1323                 (void) strcpy((char *)p, sl->sl_data_filename);
1324                 sli->sli_data_fname_offset =
1325                     (uintptr_t)p - (uintptr_t)sli->sli_buf;
1326                 sli->sli_flags |= SLI_DATA_FNAME_VALID;
1327                 p += strlen(sl->sl_data_filename) + 1;
1328         }
1329         if (sl->sl_flags & SL_ZFS_META) {
1330                 (void) strcpy((char *)p, zvol_name);
1331                 sli->sli_meta_fname_offset =
1332                     (uintptr_t)p - (uintptr_t)sli->sli_buf;
1333                 sli->sli_flags |= SLI_META_FNAME_VALID | SLI_ZFS_META;
1334                 p += strlen(zvol_name) + 1;
1335                 kmem_free(zvol_name, strlen(zvol_name) + 1);
1336                 zvol_name = NULL;
1337         }
1338         if (sl->sl_alias) {
1339                 (void) strcpy((char *)p, sl->sl_alias);
1340                 sli->sli_alias_offset =
1341                     (uintptr_t)p - (uintptr_t)sli->sli_buf;
1342                 sli->sli_flags |= SLI_ALIAS_VALID;
1343                 p += strlen(sl->sl_alias) + 1;
1344         }
1345         if (sl->sl_mgmt_url) {
1346                 (void) strcpy((char *)p, sl->sl_mgmt_url);
1347                 sli->sli_mgmt_url_offset =
1348                     (uintptr_t)p - (uintptr_t)sli->sli_buf;
1349                 sli->sli_flags |= SLI_MGMT_URL_VALID;
1350                 p += strlen(sl->sl_mgmt_url) + 1;
1351         }
1352         if (sl->sl_flags & SL_WRITE_PROTECTED) {
1353                 sli->sli_flags |= SLI_WRITE_PROTECTED;
1354         }
1355         if (sl->sl_flags & SL_SAVED_WRITE_CACHE_DISABLE) {
1356                 sli->sli_flags |= SLI_WRITEBACK_CACHE_DISABLE;
1357         }
1358         if (sl->sl_flags & SL_VID_VALID) {
1359                 bcopy(sl->sl_vendor_id, sli->sli_vid, 8);
1360                 sli->sli_flags |= SLI_VID_VALID;
1361         }
1362         if (sl->sl_flags & SL_PID_VALID) {
1363                 bcopy(sl->sl_product_id, sli->sli_pid, 16);
1364                 sli->sli_flags |= SLI_PID_VALID;
1365         }
1366         if (sl->sl_flags & SL_REV_VALID) {
1367                 bcopy(sl->sl_revision, sli->sli_rev, 4);
1368                 sli->sli_flags |= SLI_REV_VALID;
1369         }
1370         if (sl->sl_serial_no_size) {
1371                 bcopy(sl->sl_serial_no, p, sl->sl_serial_no_size);
1372                 sli->sli_serial_size = sl->sl_serial_no_size;
1373                 sli->sli_serial_offset =
1374                     (uintptr_t)p - (uintptr_t)sli->sli_buf;
1375                 sli->sli_flags |= SLI_SERIAL_VALID;
1376                 p += sli->sli_serial_size;
1377         }
1378         sli->sli_lu_size = sl->sl_lu_size;
1379         sli->sli_data_blocksize_shift = sl->sl_data_blocksize_shift;
1380         sli->sli_data_order = SMS_DATA_ORDER;
1381         bcopy(sl->sl_device_id, sli->sli_device_id, 20);
1382 
1383         sli->sli_sms_header.sms_size = sizeof (*sli) + s;
1384         sli->sli_sms_header.sms_id = SMS_ID_LU_INFO_1_1;
1385         sli->sli_sms_header.sms_data_order = SMS_DATA_ORDER;
1386 
1387         mutex_exit(&sl->sl_lock);
1388         ret = sbd_write_meta_section(sl, (sm_section_hdr_t *)sli);
1389         kmem_free(sli, sizeof (*sli) + s);
1390         return (ret);
1391 }
1392 
1393 /*
1394  * Will scribble SL_UNMAP_ENABLED into sl_flags if we succeed.
1395  */
1396 static void
1397 do_unmap_setup(sbd_lu_t *sl)
1398 {
1399         ASSERT((sl->sl_flags & SL_UNMAP_ENABLED) == 0);
1400 
1401         if ((sl->sl_flags & SL_ZFS_META) == 0)
1402                 return; /* No UNMAP for you. */
1403 
1404         sl->sl_flags |= SL_UNMAP_ENABLED;
1405 }
1406 
1407 int
1408 sbd_populate_and_register_lu(sbd_lu_t *sl, uint32_t *err_ret)
1409 {
1410         stmf_lu_t *lu = sl->sl_lu;
1411         stmf_status_t ret;
1412 
1413         do_unmap_setup(sl);
1414 
1415         lu->lu_id = (scsi_devid_desc_t *)sl->sl_device_id;
1416         if (sl->sl_alias) {
1417                 lu->lu_alias = sl->sl_alias;
1418         } else {
1419                 lu->lu_alias = sl->sl_name;
1420         }
1421         if (sl->sl_access_state == SBD_LU_STANDBY) {
1422                 /* call set access state */
1423                 ret = stmf_set_lu_access(lu, STMF_LU_STANDBY);
1424                 if (ret != STMF_SUCCESS) {
1425                         *err_ret = SBD_RET_ACCESS_STATE_FAILED;
1426                         return (EIO);
1427                 }
1428         }
1429         /* set proxy_reg_cb_arg to meta filename */
1430         if (sl->sl_meta_filename) {
1431                 lu->lu_proxy_reg_arg = sl->sl_meta_filename;
1432                 lu->lu_proxy_reg_arg_len = strlen(sl->sl_meta_filename) + 1;
1433         } else {
1434                 lu->lu_proxy_reg_arg = sl->sl_data_filename;
1435                 lu->lu_proxy_reg_arg_len = strlen(sl->sl_data_filename) + 1;
1436         }
1437         lu->lu_lp = sbd_lp;
1438         lu->lu_task_alloc = sbd_task_alloc;
1439         lu->lu_new_task = sbd_new_task;
1440         lu->lu_dbuf_xfer_done = sbd_dbuf_xfer_done;
1441         lu->lu_send_status_done = sbd_send_status_done;
1442         lu->lu_task_free = sbd_task_free;
1443         lu->lu_abort = sbd_abort;
1444         lu->lu_dbuf_free = sbd_dbuf_free;
1445         lu->lu_ctl = sbd_ctl;
1446         lu->lu_info = sbd_info;
1447         sl->sl_state = STMF_STATE_OFFLINE;
1448 
1449         if ((ret = stmf_register_lu(lu)) != STMF_SUCCESS) {
1450                 stmf_trace(0, "Failed to register with framework, ret=%llx",
1451                     ret);
1452                 if (ret == STMF_ALREADY) {
1453                         *err_ret = SBD_RET_GUID_ALREADY_REGISTERED;
1454                 }
1455                 return (EIO);
1456         }
1457 
1458         *err_ret = 0;
1459         return (0);
1460 }
1461 
1462 int
1463 sbd_open_data_file(sbd_lu_t *sl, uint32_t *err_ret, int lu_size_valid,
1464     int vp_valid, int keep_open)
1465 {
1466         int ret;
1467         int flag;
1468         ulong_t nbits;
1469         uint64_t supported_size;
1470         vattr_t vattr;
1471         enum vtype vt;
1472         struct dk_cinfo dki;
1473         int unused;
1474 
1475         mutex_enter(&sl->sl_lock);
1476         if (vp_valid) {
1477                 goto odf_over_open;
1478         }
1479         if (sl->sl_data_filename[0] != '/') {
1480                 *err_ret = SBD_RET_DATA_PATH_NOT_ABSOLUTE;
1481                 mutex_exit(&sl->sl_lock);
1482                 return (EINVAL);
1483         }
1484         if ((ret = lookupname(sl->sl_data_filename, UIO_SYSSPACE, FOLLOW,
1485             NULLVPP, &sl->sl_data_vp)) != 0) {
1486                 *err_ret = SBD_RET_DATA_FILE_LOOKUP_FAILED;
1487                 mutex_exit(&sl->sl_lock);
1488                 return (ret);
1489         }
1490         sl->sl_data_vtype = vt = sl->sl_data_vp->v_type;
1491         VN_RELE(sl->sl_data_vp);
1492         if ((vt != VREG) && (vt != VCHR) && (vt != VBLK)) {
1493                 *err_ret = SBD_RET_WRONG_DATA_FILE_TYPE;
1494                 mutex_exit(&sl->sl_lock);
1495                 return (EINVAL);
1496         }
1497         if (sl->sl_flags & SL_WRITE_PROTECTED) {
1498                 flag = FREAD | FOFFMAX;
1499         } else {
1500                 flag = FREAD | FWRITE | FOFFMAX | FEXCL;
1501         }
1502         if ((ret = vn_open(sl->sl_data_filename, UIO_SYSSPACE, flag, 0,
1503             &sl->sl_data_vp, 0, 0)) != 0) {
1504                 *err_ret = SBD_RET_DATA_FILE_OPEN_FAILED;
1505                 mutex_exit(&sl->sl_lock);
1506                 return (ret);
1507         }
1508 odf_over_open:
1509         vattr.va_mask = AT_SIZE;
1510         if ((ret = VOP_GETATTR(sl->sl_data_vp, &vattr, 0, CRED(), NULL)) != 0) {
1511                 *err_ret = SBD_RET_DATA_FILE_GETATTR_FAILED;
1512                 goto odf_close_data_and_exit;
1513         }
1514         if ((vt != VREG) && (vattr.va_size == 0)) {
1515                 /*
1516                  * Its a zero byte block or char device. This cannot be
1517                  * a raw disk.
1518                  */
1519                 *err_ret = SBD_RET_WRONG_DATA_FILE_TYPE;
1520                 ret = EINVAL;
1521                 goto odf_close_data_and_exit;
1522         }
1523         /* sl_data_readable size includes any metadata. */
1524         sl->sl_data_readable_size = vattr.va_size;
1525 
1526         if (VOP_PATHCONF(sl->sl_data_vp, _PC_FILESIZEBITS, &nbits,
1527             CRED(), NULL) != 0) {
1528                 nbits = 0;
1529         }
1530         /* nbits cannot be greater than 64 */
1531         sl->sl_data_fs_nbits = (uint8_t)nbits;
1532         if (lu_size_valid) {
1533                 sl->sl_total_data_size = sl->sl_lu_size;
1534                 if (sl->sl_flags & SL_SHARED_META) {
1535                         sl->sl_total_data_size += SHARED_META_DATA_SIZE;
1536                 }
1537                 if ((nbits > 0) && (nbits < 64)) {
1538                         /*
1539                          * The expression below is correct only if nbits is
1540                          * positive and less than 64.
1541                          */
1542                         supported_size = (((uint64_t)1) << nbits) - 1;
1543                         if (sl->sl_total_data_size > supported_size) {
1544                                 *err_ret = SBD_RET_SIZE_NOT_SUPPORTED_BY_FS;
1545                                 ret = EINVAL;
1546                                 goto odf_close_data_and_exit;
1547                         }
1548                 }
1549         } else {
1550                 sl->sl_total_data_size = vattr.va_size;
1551                 if (sl->sl_flags & SL_SHARED_META) {
1552                         if (vattr.va_size > SHARED_META_DATA_SIZE) {
1553                                 sl->sl_lu_size = vattr.va_size -
1554                                     SHARED_META_DATA_SIZE;
1555                         } else {
1556                                 *err_ret = SBD_RET_FILE_SIZE_ERROR;
1557                                 ret = EINVAL;
1558                                 goto odf_close_data_and_exit;
1559                         }
1560                 } else {
1561                         sl->sl_lu_size = vattr.va_size;
1562                 }
1563         }
1564         if (sl->sl_lu_size < SBD_MIN_LU_SIZE) {
1565                 *err_ret = SBD_RET_FILE_SIZE_ERROR;
1566                 ret = EINVAL;
1567                 goto odf_close_data_and_exit;
1568         }
1569         if (sl->sl_lu_size &
1570             ((((uint64_t)1) << sl->sl_data_blocksize_shift) - 1)) {
1571                 *err_ret = SBD_RET_FILE_ALIGN_ERROR;
1572                 ret = EINVAL;
1573                 goto odf_close_data_and_exit;
1574         }
1575         /*
1576          * Get the minor device for direct zvol access
1577          */
1578         if (sl->sl_flags & SL_ZFS_META) {
1579                 if ((ret = VOP_IOCTL(sl->sl_data_vp, DKIOCINFO, (intptr_t)&dki,
1580                     FKIOCTL, kcred, &unused, NULL)) != 0) {
1581                         cmn_err(CE_WARN, "ioctl(DKIOCINFO) failed %d", ret);
1582                         /* zvol reserves 0, so this would fail later */
1583                         sl->sl_zvol_minor = 0;
1584                 } else {
1585                         sl->sl_zvol_minor = dki.dki_unit;
1586                         if (sbd_zvol_get_volume_params(sl) == 0)
1587                                 sl->sl_flags |= SL_CALL_ZVOL;
1588                 }
1589         }
1590         sl->sl_flags |= SL_MEDIA_LOADED;
1591         mutex_exit(&sl->sl_lock);
1592         return (0);
1593 
1594 odf_close_data_and_exit:
1595         if (!keep_open) {
1596                 (void) VOP_CLOSE(sl->sl_data_vp, flag, 1, 0, CRED(), NULL);
1597                 VN_RELE(sl->sl_data_vp);
1598         }
1599         mutex_exit(&sl->sl_lock);
1600         return (ret);
1601 }
1602 
1603 void
1604 sbd_close_lu(sbd_lu_t *sl)
1605 {
1606         int flag;
1607 
1608         if (((sl->sl_flags & SL_SHARED_META) == 0) &&
1609             (sl->sl_flags & SL_META_OPENED)) {
1610                 if (sl->sl_flags & SL_ZFS_META) {
1611                         rw_destroy(&sl->sl_zfs_meta_lock);
1612                         if (sl->sl_zfs_meta) {
1613                                 kmem_free(sl->sl_zfs_meta, ZAP_MAXVALUELEN / 2);
1614                                 sl->sl_zfs_meta = NULL;
1615                         }
1616                 } else {
1617                         flag = FREAD | FWRITE | FOFFMAX | FEXCL;
1618                         (void) VOP_CLOSE(sl->sl_meta_vp, flag, 1, 0,
1619                             CRED(), NULL);
1620                         VN_RELE(sl->sl_meta_vp);
1621                 }
1622                 sl->sl_flags &= ~SL_META_OPENED;
1623         }
1624         if (sl->sl_flags & SL_MEDIA_LOADED) {
1625                 if (sl->sl_flags & SL_WRITE_PROTECTED) {
1626                         flag = FREAD | FOFFMAX;
1627                 } else {
1628                         flag = FREAD | FWRITE | FOFFMAX | FEXCL;
1629                 }
1630                 (void) VOP_CLOSE(sl->sl_data_vp, flag, 1, 0, CRED(), NULL);
1631                 VN_RELE(sl->sl_data_vp);
1632                 sl->sl_flags &= ~SL_MEDIA_LOADED;
1633                 if (sl->sl_flags & SL_SHARED_META) {
1634                         sl->sl_flags &= ~SL_META_OPENED;
1635                 }
1636         }
1637 }
1638 
1639 int
1640 sbd_set_lu_standby(sbd_set_lu_standby_t *stlu, uint32_t *err_ret)
1641 {
1642         sbd_lu_t *sl;
1643         sbd_status_t sret;
1644         stmf_status_t stret;
1645         uint8_t old_access_state;
1646 
1647         sret = sbd_find_and_lock_lu(stlu->stlu_guid, NULL,
1648             SL_OP_MODIFY_LU, &sl);
1649         if (sret != SBD_SUCCESS) {
1650                 if (sret == SBD_BUSY) {
1651                         *err_ret = SBD_RET_LU_BUSY;
1652                         return (EBUSY);
1653                 } else if (sret == SBD_NOT_FOUND) {
1654                         *err_ret = SBD_RET_NOT_FOUND;
1655                         return (ENOENT);
1656                 }
1657                 *err_ret = SBD_RET_ACCESS_STATE_FAILED;
1658                 return (EIO);
1659         }
1660 
1661         old_access_state = sl->sl_access_state;
1662         sl->sl_access_state = SBD_LU_TRANSITION_TO_STANDBY;
1663         stret = stmf_set_lu_access((stmf_lu_t *)sl->sl_lu, STMF_LU_STANDBY);
1664         if (stret != STMF_SUCCESS) {
1665                 sl->sl_trans_op = SL_OP_NONE;
1666                 *err_ret = SBD_RET_ACCESS_STATE_FAILED;
1667                 sl->sl_access_state = old_access_state;
1668                 return (EIO);
1669         }
1670 
1671         /*
1672          * acquire the writer lock here to ensure we're not pulling
1673          * the rug from the vn_rdwr to the backing store
1674          */
1675         rw_enter(&sl->sl_access_state_lock, RW_WRITER);
1676         sbd_close_lu(sl);
1677         rw_exit(&sl->sl_access_state_lock);
1678 
1679         sl->sl_trans_op = SL_OP_NONE;
1680         return (0);
1681 }
1682 
1683 int
1684 sbd_close_delete_lu(sbd_lu_t *sl, int ret)
1685 {
1686 
1687         /*
1688          * acquire the writer lock here to ensure we're not pulling
1689          * the rug from the vn_rdwr to the backing store
1690          */
1691         rw_enter(&sl->sl_access_state_lock, RW_WRITER);
1692         sbd_close_lu(sl);
1693         rw_exit(&sl->sl_access_state_lock);
1694 
1695         if (sl->sl_flags & SL_LINKED)
1696                 sbd_unlink_lu(sl);
1697         mutex_destroy(&sl->sl_metadata_lock);
1698         mutex_destroy(&sl->sl_lock);
1699         rw_destroy(&sl->sl_pgr->pgr_lock);
1700         rw_destroy(&sl->sl_access_state_lock);
1701         if (sl->sl_serial_no_alloc_size) {
1702                 kmem_free(sl->sl_serial_no, sl->sl_serial_no_alloc_size);
1703         }
1704         if (sl->sl_data_fname_alloc_size) {
1705                 kmem_free(sl->sl_data_filename, sl->sl_data_fname_alloc_size);
1706         }
1707         if (sl->sl_alias_alloc_size) {
1708                 kmem_free(sl->sl_alias, sl->sl_alias_alloc_size);
1709         }
1710         if (sl->sl_mgmt_url_alloc_size) {
1711                 kmem_free(sl->sl_mgmt_url, sl->sl_mgmt_url_alloc_size);
1712         }
1713         stmf_free(sl->sl_lu);
1714         return (ret);
1715 }
1716 
1717 int
1718 sbd_create_register_lu(sbd_create_and_reg_lu_t *slu, int struct_sz,
1719     uint32_t *err_ret)
1720 {
1721         char *namebuf;
1722         sbd_lu_t *sl;
1723         stmf_lu_t *lu;
1724         char *p;
1725         int sz;
1726         int alloc_sz;
1727         int ret = EIO;
1728         int flag;
1729         int wcd = 0;
1730         uint32_t hid = 0;
1731         enum vtype vt;
1732 
1733         sz = struct_sz - sizeof (sbd_create_and_reg_lu_t) + 8 + 1;
1734 
1735         *err_ret = 0;
1736 
1737         /* Lets validate various offsets */
1738         if (((slu->slu_meta_fname_valid) &&
1739             (slu->slu_meta_fname_off >= sz)) ||
1740             (slu->slu_data_fname_off >= sz) ||
1741             ((slu->slu_alias_valid) &&
1742             (slu->slu_alias_off >= sz)) ||
1743             ((slu->slu_mgmt_url_valid) &&
1744             (slu->slu_mgmt_url_off >= sz)) ||
1745             ((slu->slu_serial_valid) &&
1746             ((slu->slu_serial_off + slu->slu_serial_size) >= sz))) {
1747                 return (EINVAL);
1748         }
1749 
1750         namebuf = kmem_zalloc(sz, KM_SLEEP);
1751         bcopy(slu->slu_buf, namebuf, sz - 1);
1752         namebuf[sz - 1] = 0;
1753 
1754         alloc_sz = sizeof (sbd_lu_t) + sizeof (sbd_pgr_t);
1755         if (slu->slu_meta_fname_valid) {
1756                 alloc_sz += strlen(namebuf + slu->slu_meta_fname_off) + 1;
1757         }
1758         alloc_sz += strlen(namebuf + slu->slu_data_fname_off) + 1;
1759         if (slu->slu_alias_valid) {
1760                 alloc_sz += strlen(namebuf + slu->slu_alias_off) + 1;
1761         }
1762         if (slu->slu_mgmt_url_valid) {
1763                 alloc_sz += strlen(namebuf + slu->slu_mgmt_url_off) + 1;
1764         }
1765         if (slu->slu_serial_valid) {
1766                 alloc_sz += slu->slu_serial_size;
1767         }
1768 
1769         lu = (stmf_lu_t *)stmf_alloc(STMF_STRUCT_STMF_LU, alloc_sz, 0);
1770         if (lu == NULL) {
1771                 kmem_free(namebuf, sz);
1772                 return (ENOMEM);
1773         }
1774         sl = (sbd_lu_t *)lu->lu_provider_private;
1775         bzero(sl, alloc_sz);
1776         sl->sl_lu = lu;
1777         sl->sl_alloc_size = alloc_sz;
1778         sl->sl_pgr = (sbd_pgr_t *)(sl + 1);
1779         rw_init(&sl->sl_pgr->pgr_lock, NULL, RW_DRIVER, NULL);
1780         mutex_init(&sl->sl_lock, NULL, MUTEX_DRIVER, NULL);
1781         mutex_init(&sl->sl_metadata_lock, NULL, MUTEX_DRIVER, NULL);
1782         rw_init(&sl->sl_access_state_lock, NULL, RW_DRIVER, NULL);
1783         p = ((char *)sl) + sizeof (sbd_lu_t) + sizeof (sbd_pgr_t);
1784         sl->sl_data_filename = p;
1785         (void) strcpy(sl->sl_data_filename, namebuf + slu->slu_data_fname_off);
1786         p += strlen(sl->sl_data_filename) + 1;
1787         sl->sl_meta_offset = SBD_META_OFFSET;
1788         sl->sl_access_state = SBD_LU_ACTIVE;
1789         if (slu->slu_meta_fname_valid) {
1790                 sl->sl_alias = sl->sl_name = sl->sl_meta_filename = p;
1791                 (void) strcpy(sl->sl_meta_filename, namebuf +
1792                     slu->slu_meta_fname_off);
1793                 p += strlen(sl->sl_meta_filename) + 1;
1794         } else {
1795                 sl->sl_alias = sl->sl_name = sl->sl_data_filename;
1796                 if (sbd_is_zvol(sl->sl_data_filename)) {
1797                         sl->sl_flags |= SL_ZFS_META;
1798                         sl->sl_meta_offset = 0;
1799                 } else {
1800                         sl->sl_flags |= SL_SHARED_META;
1801                         sl->sl_data_offset = SHARED_META_DATA_SIZE;
1802                         sl->sl_total_meta_size = SHARED_META_DATA_SIZE;
1803                         sl->sl_meta_size_used = 0;
1804                 }
1805         }
1806         if (slu->slu_alias_valid) {
1807                 sl->sl_alias = p;
1808                 (void) strcpy(p, namebuf + slu->slu_alias_off);
1809                 p += strlen(sl->sl_alias) + 1;
1810         }
1811         if (slu->slu_mgmt_url_valid) {
1812                 sl->sl_mgmt_url = p;
1813                 (void) strcpy(p, namebuf + slu->slu_mgmt_url_off);
1814                 p += strlen(sl->sl_mgmt_url) + 1;
1815         }
1816         if (slu->slu_serial_valid) {
1817                 sl->sl_serial_no = (uint8_t *)p;
1818                 bcopy(namebuf + slu->slu_serial_off, sl->sl_serial_no,
1819                     slu->slu_serial_size);
1820                 sl->sl_serial_no_size = slu->slu_serial_size;
1821                 p += slu->slu_serial_size;
1822         }
1823         kmem_free(namebuf, sz);
1824         if (slu->slu_vid_valid) {
1825                 bcopy(slu->slu_vid, sl->sl_vendor_id, 8);
1826                 sl->sl_flags |= SL_VID_VALID;
1827         }
1828         if (slu->slu_pid_valid) {
1829                 bcopy(slu->slu_pid, sl->sl_product_id, 16);
1830                 sl->sl_flags |= SL_PID_VALID;
1831         }
1832         if (slu->slu_rev_valid) {
1833                 bcopy(slu->slu_rev, sl->sl_revision, 4);
1834                 sl->sl_flags |= SL_REV_VALID;
1835         }
1836         if (slu->slu_write_protected) {
1837                 sl->sl_flags |= SL_WRITE_PROTECTED;
1838         }
1839         if (slu->slu_blksize_valid) {
1840                 if (!ISP2(slu->slu_blksize) ||
1841                     (slu->slu_blksize > (32 * 1024)) ||
1842                     (slu->slu_blksize == 0)) {
1843                         *err_ret = SBD_RET_INVALID_BLKSIZE;
1844                         ret = EINVAL;
1845                         goto scm_err_out;
1846                 }
1847                 while ((1 << sl->sl_data_blocksize_shift) != slu->slu_blksize) {
1848                         sl->sl_data_blocksize_shift++;
1849                 }
1850         } else {
1851                 sl->sl_data_blocksize_shift = 9;     /* 512 by default */
1852                 slu->slu_blksize = 512;
1853         }
1854 
1855         /* Now lets start creating meta */
1856         sl->sl_trans_op = SL_OP_CREATE_REGISTER_LU;
1857         if (sbd_link_lu(sl) != SBD_SUCCESS) {
1858                 *err_ret = SBD_RET_FILE_ALREADY_REGISTERED;
1859                 ret = EALREADY;
1860                 goto scm_err_out;
1861         }
1862 
1863         /* 1st focus on the data store */
1864         if (slu->slu_lu_size_valid) {
1865                 sl->sl_lu_size = slu->slu_lu_size;
1866         }
1867         ret = sbd_open_data_file(sl, err_ret, slu->slu_lu_size_valid, 0, 0);
1868         slu->slu_ret_filesize_nbits = sl->sl_data_fs_nbits;
1869         slu->slu_lu_size = sl->sl_lu_size;
1870         if (ret) {
1871                 goto scm_err_out;
1872         }
1873 
1874         /*
1875          * Check if we were explicitly asked to disable/enable write
1876          * cache on the device, otherwise get current device setting.
1877          */
1878         if (slu->slu_writeback_cache_disable_valid) {
1879                 if (slu->slu_writeback_cache_disable) {
1880                         /*
1881                          * Set write cache disable on the device. If it fails,
1882                          * we'll support it using sync/flush.
1883                          */
1884                         (void) sbd_wcd_set(1, sl);
1885                         wcd = 1;
1886                 } else {
1887                         /*
1888                          * Set write cache enable on the device. If it fails,
1889                          * return an error.
1890                          */
1891                         if (sbd_wcd_set(0, sl) != SBD_SUCCESS) {
1892                                 *err_ret = SBD_RET_WRITE_CACHE_SET_FAILED;
1893                                 ret = EFAULT;
1894                                 goto scm_err_out;
1895                         }
1896                 }
1897         } else {
1898                 sbd_wcd_get(&wcd, sl);
1899         }
1900 
1901         if (wcd) {
1902                 sl->sl_flags |= SL_WRITEBACK_CACHE_DISABLE |
1903                     SL_SAVED_WRITE_CACHE_DISABLE;
1904         }
1905 
1906         if (sl->sl_flags & SL_SHARED_META) {
1907                 goto over_meta_open;
1908         }
1909         if (sl->sl_flags & SL_ZFS_META) {
1910                 if (sbd_create_zfs_meta_object(sl) != SBD_SUCCESS) {
1911                         *err_ret = SBD_RET_ZFS_META_CREATE_FAILED;
1912                         ret = ENOMEM;
1913                         goto scm_err_out;
1914                 }
1915                 sl->sl_meta_blocksize_shift = 0;
1916                 goto over_meta_create;
1917         }
1918         if ((ret = lookupname(sl->sl_meta_filename, UIO_SYSSPACE, FOLLOW,
1919             NULLVPP, &sl->sl_meta_vp)) != 0) {
1920                 *err_ret = SBD_RET_META_FILE_LOOKUP_FAILED;
1921                 goto scm_err_out;
1922         }
1923         sl->sl_meta_vtype = vt = sl->sl_meta_vp->v_type;
1924         VN_RELE(sl->sl_meta_vp);
1925         if ((vt != VREG) && (vt != VCHR) && (vt != VBLK)) {
1926                 *err_ret = SBD_RET_WRONG_META_FILE_TYPE;
1927                 ret = EINVAL;
1928                 goto scm_err_out;
1929         }
1930         if (vt == VREG) {
1931                 sl->sl_meta_blocksize_shift = 0;
1932         } else {
1933                 sl->sl_meta_blocksize_shift = 9;
1934         }
1935         flag = FREAD | FWRITE | FOFFMAX | FEXCL;
1936         if ((ret = vn_open(sl->sl_meta_filename, UIO_SYSSPACE, flag, 0,
1937             &sl->sl_meta_vp, 0, 0)) != 0) {
1938                 *err_ret = SBD_RET_META_FILE_OPEN_FAILED;
1939                 goto scm_err_out;
1940         }
1941 over_meta_create:
1942         sl->sl_total_meta_size = sl->sl_meta_offset + sizeof (sbd_meta_start_t);
1943         sl->sl_total_meta_size +=
1944             (((uint64_t)1) << sl->sl_meta_blocksize_shift) - 1;
1945         sl->sl_total_meta_size &=
1946             ~((((uint64_t)1) << sl->sl_meta_blocksize_shift) - 1);
1947         sl->sl_meta_size_used = 0;
1948 over_meta_open:
1949         sl->sl_flags |= SL_META_OPENED;
1950 
1951         sl->sl_device_id[3] = 16;
1952         if (slu->slu_guid_valid) {
1953                 sl->sl_device_id[0] = 0xf1;
1954                 sl->sl_device_id[1] = 3;
1955                 sl->sl_device_id[2] = 0;
1956                 bcopy(slu->slu_guid, sl->sl_device_id + 4, 16);
1957         } else {
1958                 if (slu->slu_host_id_valid)
1959                         hid = slu->slu_host_id;
1960                 if (!slu->slu_company_id_valid)
1961                         slu->slu_company_id = COMPANY_ID_SUN;
1962                 if (stmf_scsilib_uniq_lu_id2(slu->slu_company_id, hid,
1963                     (scsi_devid_desc_t *)&sl->sl_device_id[0]) !=
1964                     STMF_SUCCESS) {
1965                         *err_ret = SBD_RET_META_CREATION_FAILED;
1966                         ret = EIO;
1967                         goto scm_err_out;
1968                 }
1969                 bcopy(sl->sl_device_id + 4, slu->slu_guid, 16);
1970         }
1971 
1972         /* Lets create the meta now */
1973         mutex_enter(&sl->sl_metadata_lock);
1974         if (sbd_write_meta_start(sl, sl->sl_total_meta_size,
1975             sizeof (sbd_meta_start_t)) != SBD_SUCCESS) {
1976                 mutex_exit(&sl->sl_metadata_lock);
1977                 *err_ret = SBD_RET_META_CREATION_FAILED;
1978                 ret = EIO;
1979                 goto scm_err_out;
1980         }
1981         mutex_exit(&sl->sl_metadata_lock);
1982         sl->sl_meta_size_used = sl->sl_meta_offset + sizeof (sbd_meta_start_t);
1983 
1984         if (sbd_write_lu_info(sl) != SBD_SUCCESS) {
1985                 *err_ret = SBD_RET_META_CREATION_FAILED;
1986                 ret = EIO;
1987                 goto scm_err_out;
1988         }
1989 
1990         if (sbd_pgr_meta_init(sl) != SBD_SUCCESS) {
1991                 *err_ret = SBD_RET_META_CREATION_FAILED;
1992                 ret = EIO;
1993                 goto scm_err_out;
1994         }
1995 
1996         /*
1997          * Update the zvol separately as this need only be called upon
1998          * completion of the metadata initialization.
1999          */
2000         if (sl->sl_flags & SL_ZFS_META) {
2001                 if (sbd_update_zfs_prop(sl) != SBD_SUCCESS) {
2002                         *err_ret = SBD_RET_META_CREATION_FAILED;
2003                         ret = EIO;
2004                         goto scm_err_out;
2005                 }
2006         }
2007 
2008         ret = sbd_populate_and_register_lu(sl, err_ret);
2009         if (ret) {
2010                 goto scm_err_out;
2011         }
2012 
2013         sl->sl_trans_op = SL_OP_NONE;
2014         atomic_inc_32(&sbd_lu_count);
2015         return (0);
2016 
2017 scm_err_out:
2018         return (sbd_close_delete_lu(sl, ret));
2019 }
2020 
2021 stmf_status_t
2022 sbd_proxy_msg(uint8_t *luid, void *proxy_arg, uint32_t proxy_arg_len,
2023     uint32_t type)
2024 {
2025         switch (type) {
2026                 case STMF_MSG_LU_ACTIVE:
2027                         return (sbd_proxy_reg_lu(luid, proxy_arg,
2028                             proxy_arg_len));
2029                 case STMF_MSG_LU_REGISTER:
2030                         return (sbd_proxy_reg_lu(luid, proxy_arg,
2031                             proxy_arg_len));
2032                 case STMF_MSG_LU_DEREGISTER:
2033                         return (sbd_proxy_dereg_lu(luid, proxy_arg,
2034                             proxy_arg_len));
2035                 default:
2036                         return (STMF_INVALID_ARG);
2037         }
2038 }
2039 
2040 
2041 /*
2042  * register a standby logical unit
2043  * proxy_reg_arg contains the meta filename
2044  */
2045 stmf_status_t
2046 sbd_proxy_reg_lu(uint8_t *luid, void *proxy_reg_arg, uint32_t proxy_reg_arg_len)
2047 {
2048         sbd_lu_t *sl;
2049         sbd_status_t sret;
2050         sbd_create_standby_lu_t *stlu;
2051         int alloc_sz;
2052         uint32_t err_ret = 0;
2053         stmf_status_t stret = STMF_SUCCESS;
2054 
2055         if (luid == NULL) {
2056                 return (STMF_INVALID_ARG);
2057         }
2058 
2059         do {
2060                 sret = sbd_find_and_lock_lu(luid, NULL, SL_OP_MODIFY_LU, &sl);
2061         } while (sret == SBD_BUSY);
2062 
2063         if (sret == SBD_NOT_FOUND) {
2064                 alloc_sz = sizeof (*stlu) + proxy_reg_arg_len - 8;
2065                 stlu = (sbd_create_standby_lu_t *)kmem_zalloc(alloc_sz,
2066                     KM_SLEEP);
2067                 bcopy(luid, stlu->stlu_guid, 16);
2068                 if (proxy_reg_arg_len) {
2069                         bcopy(proxy_reg_arg, stlu->stlu_meta_fname,
2070                             proxy_reg_arg_len);
2071                         stlu->stlu_meta_fname_size = proxy_reg_arg_len;
2072                 }
2073                 if (sbd_create_standby_lu(stlu, &err_ret) != 0) {
2074                         cmn_err(CE_WARN,
2075                             "Unable to create standby logical unit for %s",
2076                             stlu->stlu_meta_fname);
2077                         stret = STMF_FAILURE;
2078                 }
2079                 kmem_free(stlu, alloc_sz);
2080                 return (stret);
2081         } else if (sret == SBD_SUCCESS) {
2082                 /*
2083                  * if the lu is already registered, then the lu should now
2084                  * be in standby mode
2085                  */
2086                 sbd_it_data_t *it;
2087                 if (sl->sl_access_state != SBD_LU_STANDBY) {
2088                         mutex_enter(&sl->sl_lock);
2089                         sl->sl_access_state = SBD_LU_STANDBY;
2090                         for (it = sl->sl_it_list; it != NULL;
2091                             it = it->sbd_it_next) {
2092                                 it->sbd_it_ua_conditions |=
2093                                     SBD_UA_ASYMMETRIC_ACCESS_CHANGED;
2094                                 it->sbd_it_flags &=
2095                                     ~SBD_IT_HAS_SCSI2_RESERVATION;
2096                                 sl->sl_flags &= ~SL_LU_HAS_SCSI2_RESERVATION;
2097                         }
2098                         mutex_exit(&sl->sl_lock);
2099                         sbd_pgr_reset(sl);
2100                 }
2101                 sl->sl_trans_op = SL_OP_NONE;
2102         } else {
2103                 cmn_err(CE_WARN, "could not find and lock logical unit");
2104                 stret = STMF_FAILURE;
2105         }
2106 out:
2107         return (stret);
2108 }
2109 
2110 /* ARGSUSED */
2111 stmf_status_t
2112 sbd_proxy_dereg_lu(uint8_t *luid, void *proxy_reg_arg,
2113     uint32_t proxy_reg_arg_len)
2114 {
2115         sbd_delete_lu_t dlu = {0};
2116         uint32_t err_ret;
2117 
2118         if (luid == NULL) {
2119                 cmn_err(CE_WARN, "de-register lu request had null luid");
2120                 return (STMF_INVALID_ARG);
2121         }
2122 
2123         bcopy(luid, &dlu.dlu_guid, 16);
2124 
2125         if (sbd_delete_lu(&dlu, (int)sizeof (dlu), &err_ret) != 0) {
2126                 cmn_err(CE_WARN, "failed to delete de-register lu request");
2127                 return (STMF_FAILURE);
2128         }
2129 
2130         return (STMF_SUCCESS);
2131 }
2132 
2133 int
2134 sbd_create_standby_lu(sbd_create_standby_lu_t *slu, uint32_t *err_ret)
2135 {
2136         sbd_lu_t *sl;
2137         stmf_lu_t *lu;
2138         int ret = EIO;
2139         int alloc_sz;
2140 
2141         alloc_sz = sizeof (sbd_lu_t) + sizeof (sbd_pgr_t) +
2142             slu->stlu_meta_fname_size;
2143         lu = (stmf_lu_t *)stmf_alloc(STMF_STRUCT_STMF_LU, alloc_sz, 0);
2144         if (lu == NULL) {
2145                 return (ENOMEM);
2146         }
2147         sl = (sbd_lu_t *)lu->lu_provider_private;
2148         bzero(sl, alloc_sz);
2149         sl->sl_lu = lu;
2150         sl->sl_alloc_size = alloc_sz;
2151 
2152         sl->sl_pgr = (sbd_pgr_t *)(sl + 1);
2153         sl->sl_meta_filename = ((char *)sl) + sizeof (sbd_lu_t) +
2154             sizeof (sbd_pgr_t);
2155 
2156         if (slu->stlu_meta_fname_size > 0) {
2157                 (void) strcpy(sl->sl_meta_filename, slu->stlu_meta_fname);
2158         }
2159         sl->sl_name = sl->sl_meta_filename;
2160 
2161         sl->sl_device_id[3] = 16;
2162         sl->sl_device_id[0] = 0xf1;
2163         sl->sl_device_id[1] = 3;
2164         sl->sl_device_id[2] = 0;
2165         bcopy(slu->stlu_guid, sl->sl_device_id + 4, 16);
2166         lu->lu_id = (scsi_devid_desc_t *)sl->sl_device_id;
2167         sl->sl_access_state = SBD_LU_STANDBY;
2168 
2169         rw_init(&sl->sl_pgr->pgr_lock, NULL, RW_DRIVER, NULL);
2170         mutex_init(&sl->sl_lock, NULL, MUTEX_DRIVER, NULL);
2171         mutex_init(&sl->sl_metadata_lock, NULL, MUTEX_DRIVER, NULL);
2172         rw_init(&sl->sl_access_state_lock, NULL, RW_DRIVER, NULL);
2173 
2174         sl->sl_trans_op = SL_OP_CREATE_REGISTER_LU;
2175 
2176         if (sbd_link_lu(sl) != SBD_SUCCESS) {
2177                 *err_ret = SBD_RET_FILE_ALREADY_REGISTERED;
2178                 ret = EALREADY;
2179                 goto scs_err_out;
2180         }
2181 
2182         ret = sbd_populate_and_register_lu(sl, err_ret);
2183         if (ret) {
2184                 goto scs_err_out;
2185         }
2186 
2187         sl->sl_trans_op = SL_OP_NONE;
2188         atomic_inc_32(&sbd_lu_count);
2189         return (0);
2190 
2191 scs_err_out:
2192         return (sbd_close_delete_lu(sl, ret));
2193 }
2194 
2195 int
2196 sbd_load_sli_1_0(sbd_lu_t *sl, uint32_t *err_ret)
2197 {
2198         sbd_lu_info_1_0_t *sli = NULL;
2199         sbd_status_t sret;
2200 
2201         sret = sbd_read_meta_section(sl, (sm_section_hdr_t **)&sli,
2202             SMS_ID_LU_INFO_1_0);
2203 
2204         if (sret != SBD_SUCCESS) {
2205                 *err_ret = SBD_RET_NO_META;
2206                 return (EIO);
2207         }
2208         if (sli->sli_data_order != SMS_DATA_ORDER) {
2209                 sbd_swap_lu_info_1_0(sli);
2210                 if (sli->sli_data_order != SMS_DATA_ORDER) {
2211                         kmem_free(sli, sli->sli_sms_header.sms_size);
2212                         *err_ret = SBD_RET_NO_META;
2213                         return (EIO);
2214                 }
2215         }
2216 
2217         sl->sl_flags |= SL_SHARED_META;
2218         sl->sl_data_blocksize_shift = 9;
2219         sl->sl_data_offset = SHARED_META_DATA_SIZE;
2220         sl->sl_lu_size = sli->sli_total_store_size - SHARED_META_DATA_SIZE;
2221         sl->sl_total_data_size = SHARED_META_DATA_SIZE + sl->sl_lu_size;
2222         bcopy(sli->sli_lu_devid, sl->sl_device_id, 20);
2223 
2224         kmem_free(sli, sli->sli_sms_header.sms_size);
2225         return (0);
2226 }
2227 
2228 int
2229 sbd_import_lu(sbd_import_lu_t *ilu, int struct_sz, uint32_t *err_ret,
2230     int no_register, sbd_lu_t **slr)
2231 {
2232         stmf_lu_t *lu;
2233         sbd_lu_t *sl;
2234         sbd_lu_info_1_1_t *sli = NULL;
2235         int asz;
2236         int ret = 0;
2237         stmf_status_t stret;
2238         int flag;
2239         int wcd = 0;
2240         int data_opened;
2241         uint16_t sli_buf_sz;
2242         uint8_t *sli_buf_copy = NULL;
2243         enum vtype vt;
2244         int standby = 0;
2245         sbd_status_t sret;
2246 
2247         if (no_register && slr == NULL) {
2248                 return (EINVAL);
2249         }
2250         ilu->ilu_meta_fname[struct_sz - sizeof (*ilu) + 8 - 1] = 0;
2251         /*
2252          * check whether logical unit is already registered ALUA
2253          * For a standby logical unit, the meta filename is set. Use
2254          * that to search for an existing logical unit.
2255          */
2256         sret = sbd_find_and_lock_lu(NULL, (uint8_t *)&(ilu->ilu_meta_fname),
2257             SL_OP_IMPORT_LU, &sl);
2258 
2259         if (sret == SBD_SUCCESS) {
2260                 if (sl->sl_access_state != SBD_LU_ACTIVE) {
2261                         no_register = 1;
2262                         standby = 1;
2263                         lu = sl->sl_lu;
2264                         if (sl->sl_alias_alloc_size) {
2265                                 kmem_free(sl->sl_alias,
2266                                     sl->sl_alias_alloc_size);
2267                                 sl->sl_alias_alloc_size = 0;
2268                                 sl->sl_alias = NULL;
2269                                 lu->lu_alias = NULL;
2270                         }
2271                         if (sl->sl_meta_filename == NULL) {
2272                                 sl->sl_meta_filename = sl->sl_data_filename;
2273                         } else if (sl->sl_data_fname_alloc_size) {
2274                                 kmem_free(sl->sl_data_filename,
2275                                     sl->sl_data_fname_alloc_size);
2276                                 sl->sl_data_fname_alloc_size = 0;
2277                         }
2278                         if (sl->sl_serial_no_alloc_size) {
2279                                 kmem_free(sl->sl_serial_no,
2280                                     sl->sl_serial_no_alloc_size);
2281                                 sl->sl_serial_no_alloc_size = 0;
2282                         }
2283                         if (sl->sl_mgmt_url_alloc_size) {
2284                                 kmem_free(sl->sl_mgmt_url,
2285                                     sl->sl_mgmt_url_alloc_size);
2286                                 sl->sl_mgmt_url_alloc_size = 0;
2287                         }
2288                 } else {
2289                         *err_ret = SBD_RET_FILE_ALREADY_REGISTERED;
2290                         bcopy(sl->sl_device_id + 4, ilu->ilu_ret_guid, 16);
2291                         sl->sl_trans_op = SL_OP_NONE;
2292                         return (EALREADY);
2293                 }
2294         } else if (sret == SBD_NOT_FOUND) {
2295                 asz = strlen(ilu->ilu_meta_fname) + 1;
2296 
2297                 lu = (stmf_lu_t *)stmf_alloc(STMF_STRUCT_STMF_LU,
2298                     sizeof (sbd_lu_t) + sizeof (sbd_pgr_t) + asz, 0);
2299                 if (lu == NULL) {
2300                         return (ENOMEM);
2301                 }
2302                 sl = (sbd_lu_t *)lu->lu_provider_private;
2303                 bzero(sl, sizeof (*sl));
2304                 sl->sl_lu = lu;
2305                 sl->sl_pgr = (sbd_pgr_t *)(sl + 1);
2306                 sl->sl_meta_filename = ((char *)sl) + sizeof (*sl) +
2307                     sizeof (sbd_pgr_t);
2308                 (void) strcpy(sl->sl_meta_filename, ilu->ilu_meta_fname);
2309                 sl->sl_name = sl->sl_meta_filename;
2310                 rw_init(&sl->sl_pgr->pgr_lock, NULL, RW_DRIVER, NULL);
2311                 rw_init(&sl->sl_access_state_lock, NULL, RW_DRIVER, NULL);
2312                 mutex_init(&sl->sl_lock, NULL, MUTEX_DRIVER, NULL);
2313                 mutex_init(&sl->sl_metadata_lock, NULL, MUTEX_DRIVER, NULL);
2314                 sl->sl_trans_op = SL_OP_IMPORT_LU;
2315         } else {
2316                 *err_ret = SBD_RET_META_FILE_LOOKUP_FAILED;
2317                 return (EIO);
2318         }
2319 
2320         /* we're only loading the metadata */
2321         if (!no_register) {
2322                 if (sbd_link_lu(sl) != SBD_SUCCESS) {
2323                         *err_ret = SBD_RET_FILE_ALREADY_REGISTERED;
2324                         bcopy(sl->sl_device_id + 4, ilu->ilu_ret_guid, 16);
2325                         ret = EALREADY;
2326                         goto sim_err_out;
2327                 }
2328         }
2329         if ((ret = lookupname(sl->sl_meta_filename, UIO_SYSSPACE, FOLLOW,
2330             NULLVPP, &sl->sl_meta_vp)) != 0) {
2331                 *err_ret = SBD_RET_META_FILE_LOOKUP_FAILED;
2332                 goto sim_err_out;
2333         }
2334         if (sbd_is_zvol(sl->sl_meta_filename)) {
2335                 sl->sl_flags |= SL_ZFS_META;
2336                 sl->sl_data_filename = sl->sl_meta_filename;
2337         }
2338         sl->sl_meta_vtype = vt = sl->sl_meta_vp->v_type;
2339         VN_RELE(sl->sl_meta_vp);
2340         if ((vt != VREG) && (vt != VCHR) && (vt != VBLK)) {
2341                 *err_ret = SBD_RET_WRONG_META_FILE_TYPE;
2342                 ret = EINVAL;
2343                 goto sim_err_out;
2344         }
2345         if (sl->sl_flags & SL_ZFS_META) {
2346                 if (sbd_open_zfs_meta(sl) != SBD_SUCCESS) {
2347                         /* let see if metadata is in the 64k block */
2348                         sl->sl_flags &= ~SL_ZFS_META;
2349                 }
2350         }
2351         if (!(sl->sl_flags & SL_ZFS_META)) {
2352                 /* metadata is always writable */
2353                 flag = FREAD | FWRITE | FOFFMAX | FEXCL;
2354                 if ((ret = vn_open(sl->sl_meta_filename, UIO_SYSSPACE, flag, 0,
2355                     &sl->sl_meta_vp, 0, 0)) != 0) {
2356                         *err_ret = SBD_RET_META_FILE_OPEN_FAILED;
2357                         goto sim_err_out;
2358                 }
2359         }
2360         if ((sl->sl_flags & SL_ZFS_META) || (vt == VREG)) {
2361                 sl->sl_meta_blocksize_shift = 0;
2362         } else {
2363                 sl->sl_meta_blocksize_shift = 9;
2364         }
2365         sl->sl_meta_offset = (sl->sl_flags & SL_ZFS_META) ? 0 : SBD_META_OFFSET;
2366         sl->sl_flags |= SL_META_OPENED;
2367 
2368         mutex_enter(&sl->sl_metadata_lock);
2369         sret = sbd_load_meta_start(sl);
2370         mutex_exit(&sl->sl_metadata_lock);
2371         if (sret != SBD_SUCCESS) {
2372                 if (sret == SBD_META_CORRUPTED) {
2373                         *err_ret = SBD_RET_NO_META;
2374                 } else if (sret == SBD_NOT_SUPPORTED) {
2375                         *err_ret = SBD_RET_VERSION_NOT_SUPPORTED;
2376                 } else {
2377                         *err_ret = SBD_RET_NO_META;
2378                 }
2379                 ret = EINVAL;
2380                 goto sim_err_out;
2381         }
2382 
2383         /* Now lets see if we can read the most recent LU info */
2384         sret = sbd_read_meta_section(sl, (sm_section_hdr_t **)&sli,
2385             SMS_ID_LU_INFO_1_1);
2386         if ((sret == SBD_NOT_FOUND) && ((sl->sl_flags & SL_ZFS_META) == 0)) {
2387                 ret = sbd_load_sli_1_0(sl, err_ret);
2388                 if (ret) {
2389                         goto sim_err_out;
2390                 }
2391                 goto sim_sli_loaded;
2392         }
2393         if (sret != SBD_SUCCESS) {
2394                 *err_ret = SBD_RET_NO_META;
2395                 ret = EIO;
2396                 goto sim_err_out;
2397         }
2398         /* load sli 1.1 */
2399         if (sli->sli_data_order != SMS_DATA_ORDER) {
2400                 sbd_swap_lu_info_1_1(sli);
2401                 if (sli->sli_data_order != SMS_DATA_ORDER) {
2402                         *err_ret = SBD_RET_NO_META;
2403                         ret = EIO;
2404                         goto sim_err_out;
2405                 }
2406         }
2407 
2408         sli_buf_sz = sli->sli_sms_header.sms_size -
2409             sizeof (sbd_lu_info_1_1_t) + 8;
2410         sli_buf_copy = kmem_alloc(sli_buf_sz + 1, KM_SLEEP);
2411         bcopy(sli->sli_buf, sli_buf_copy, sli_buf_sz);
2412         sli_buf_copy[sli_buf_sz] = 0;
2413 
2414         /* Make sure all the offsets are within limits */
2415         if (((sli->sli_flags & SLI_META_FNAME_VALID) &&
2416             (sli->sli_meta_fname_offset > sli_buf_sz)) ||
2417             ((sli->sli_flags & SLI_DATA_FNAME_VALID) &&
2418             (sli->sli_data_fname_offset > sli_buf_sz)) ||
2419             ((sli->sli_flags & SLI_MGMT_URL_VALID) &&
2420             (sli->sli_mgmt_url_offset > sli_buf_sz)) ||
2421             ((sli->sli_flags & SLI_SERIAL_VALID) &&
2422             ((sli->sli_serial_offset + sli->sli_serial_size) > sli_buf_sz)) ||
2423             ((sli->sli_flags & SLI_ALIAS_VALID) &&
2424             (sli->sli_alias_offset > sli_buf_sz))) {
2425                 *err_ret = SBD_RET_NO_META;
2426                 ret = EIO;
2427                 goto sim_err_out;
2428         }
2429 
2430         sl->sl_lu_size = sli->sli_lu_size;
2431         sl->sl_data_blocksize_shift = sli->sli_data_blocksize_shift;
2432         bcopy(sli->sli_device_id, sl->sl_device_id, 20);
2433         if (sli->sli_flags & SLI_SERIAL_VALID) {
2434                 sl->sl_serial_no_size = sl->sl_serial_no_alloc_size =
2435                     sli->sli_serial_size;
2436                 sl->sl_serial_no = kmem_zalloc(sli->sli_serial_size, KM_SLEEP);
2437                 bcopy(sli_buf_copy + sli->sli_serial_offset, sl->sl_serial_no,
2438                     sl->sl_serial_no_size);
2439         }
2440         if (sli->sli_flags & SLI_SEPARATE_META) {
2441                 sl->sl_total_data_size = sl->sl_lu_size;
2442                 if (sli->sli_flags & SLI_DATA_FNAME_VALID) {
2443                         sl->sl_data_fname_alloc_size = strlen((char *)
2444                             sli_buf_copy + sli->sli_data_fname_offset) + 1;
2445                         sl->sl_data_filename = kmem_zalloc(
2446                             sl->sl_data_fname_alloc_size, KM_SLEEP);
2447                         (void) strcpy(sl->sl_data_filename,
2448                             (char *)sli_buf_copy + sli->sli_data_fname_offset);
2449                 }
2450         } else {
2451                 if (sl->sl_flags & SL_ZFS_META) {
2452                         sl->sl_total_data_size = sl->sl_lu_size;
2453                         sl->sl_data_offset = 0;
2454                 } else {
2455                         sl->sl_total_data_size =
2456                             sl->sl_lu_size + SHARED_META_DATA_SIZE;
2457                         sl->sl_data_offset = SHARED_META_DATA_SIZE;
2458                         sl->sl_flags |= SL_SHARED_META;
2459                 }
2460         }
2461         if (sli->sli_flags & SLI_ALIAS_VALID) {
2462                 sl->sl_alias_alloc_size = strlen((char *)sli_buf_copy +
2463                     sli->sli_alias_offset) + 1;
2464                 sl->sl_alias = kmem_alloc(sl->sl_alias_alloc_size, KM_SLEEP);
2465                 (void) strcpy(sl->sl_alias, (char *)sli_buf_copy +
2466                     sli->sli_alias_offset);
2467         }
2468         if (sli->sli_flags & SLI_MGMT_URL_VALID) {
2469                 sl->sl_mgmt_url_alloc_size = strlen((char *)sli_buf_copy +
2470                     sli->sli_mgmt_url_offset) + 1;
2471                 sl->sl_mgmt_url = kmem_alloc(sl->sl_mgmt_url_alloc_size,
2472                     KM_SLEEP);
2473                 (void) strcpy(sl->sl_mgmt_url, (char *)sli_buf_copy +
2474                     sli->sli_mgmt_url_offset);
2475         }
2476         if (sli->sli_flags & SLI_WRITE_PROTECTED) {
2477                 sl->sl_flags |= SL_WRITE_PROTECTED;
2478         }
2479         if (sli->sli_flags & SLI_VID_VALID) {
2480                 sl->sl_flags |= SL_VID_VALID;
2481                 bcopy(sli->sli_vid, sl->sl_vendor_id, 8);
2482         }
2483         if (sli->sli_flags & SLI_PID_VALID) {
2484                 sl->sl_flags |= SL_PID_VALID;
2485                 bcopy(sli->sli_pid, sl->sl_product_id, 16);
2486         }
2487         if (sli->sli_flags & SLI_REV_VALID) {
2488                 sl->sl_flags |= SL_REV_VALID;
2489                 bcopy(sli->sli_rev, sl->sl_revision, 4);
2490         }
2491         if (sli->sli_flags & SLI_WRITEBACK_CACHE_DISABLE) {
2492                 sl->sl_flags |= SL_WRITEBACK_CACHE_DISABLE;
2493         }
2494 sim_sli_loaded:
2495         if ((sl->sl_flags & SL_SHARED_META) == 0) {
2496                 data_opened = 0;
2497         } else {
2498                 data_opened = 1;
2499                 sl->sl_data_filename = sl->sl_meta_filename;
2500                 sl->sl_data_vp = sl->sl_meta_vp;
2501                 sl->sl_data_vtype = sl->sl_meta_vtype;
2502         }
2503 
2504         sret = sbd_pgr_meta_load(sl);
2505         if (sret != SBD_SUCCESS) {
2506                 *err_ret = SBD_RET_NO_META;
2507                 ret = EIO;
2508                 goto sim_err_out;
2509         }
2510 
2511         ret = sbd_open_data_file(sl, err_ret, 1, data_opened, 0);
2512         if (ret) {
2513                 goto sim_err_out;
2514         }
2515 
2516         /*
2517          * set write cache disable on the device
2518          * Note: this shouldn't fail on import unless the cache capabilities
2519          * of the device changed. If that happened, modify will need to
2520          * be used to set the cache flag appropriately after import is done.
2521          */
2522         if (sl->sl_flags & SL_WRITEBACK_CACHE_DISABLE) {
2523                 (void) sbd_wcd_set(1, sl);
2524                 wcd = 1;
2525         /*
2526          * if not explicitly set, attempt to set it to enable, if that fails
2527          * get the current setting and use that
2528          */
2529         } else {
2530                 sret = sbd_wcd_set(0, sl);
2531                 if (sret != SBD_SUCCESS) {
2532                         sbd_wcd_get(&wcd, sl);
2533                 }
2534         }
2535 
2536         if (wcd) {
2537                 sl->sl_flags |= SL_WRITEBACK_CACHE_DISABLE |
2538                     SL_SAVED_WRITE_CACHE_DISABLE;
2539         }
2540 
2541         /* we're only loading the metadata */
2542         if (!no_register) {
2543                 ret = sbd_populate_and_register_lu(sl, err_ret);
2544                 if (ret) {
2545                         goto sim_err_out;
2546                 }
2547                 atomic_inc_32(&sbd_lu_count);
2548         }
2549 
2550         bcopy(sl->sl_device_id + 4, ilu->ilu_ret_guid, 16);
2551         sl->sl_trans_op = SL_OP_NONE;
2552 
2553         if (sli) {
2554                 kmem_free(sli, sli->sli_sms_header.sms_size);
2555                 sli = NULL;
2556         }
2557         if (sli_buf_copy) {
2558                 kmem_free(sli_buf_copy, sli_buf_sz + 1);
2559                 sli_buf_copy = NULL;
2560         }
2561         if (no_register && !standby) {
2562                 *slr = sl;
2563         }
2564 
2565         /*
2566          * if this was imported from standby, set the access state
2567          * to active.
2568          */
2569         if (standby) {
2570                 sbd_it_data_t *it;
2571                 mutex_enter(&sl->sl_lock);
2572                 sl->sl_access_state = SBD_LU_ACTIVE;
2573                 for (it = sl->sl_it_list; it != NULL;
2574                     it = it->sbd_it_next) {
2575                         it->sbd_it_ua_conditions |=
2576                             SBD_UA_ASYMMETRIC_ACCESS_CHANGED;
2577                         it->sbd_it_ua_conditions |= SBD_UA_POR;
2578                         it->sbd_it_flags |=  SBD_IT_PGR_CHECK_FLAG;
2579                 }
2580                 mutex_exit(&sl->sl_lock);
2581                 /* call set access state */
2582                 stret = stmf_set_lu_access(lu, STMF_LU_ACTIVE);
2583                 if (stret != STMF_SUCCESS) {
2584                         *err_ret = SBD_RET_ACCESS_STATE_FAILED;
2585                         sl->sl_access_state = SBD_LU_STANDBY;
2586                         goto sim_err_out;
2587                 }
2588                 if (sl->sl_alias) {
2589                         lu->lu_alias = sl->sl_alias;
2590                 } else {
2591                         lu->lu_alias = sl->sl_name;
2592                 }
2593         }
2594         sl->sl_access_state = SBD_LU_ACTIVE;
2595         return (0);
2596 
2597 sim_err_out:
2598         if (sli) {
2599                 kmem_free(sli, sli->sli_sms_header.sms_size);
2600                 sli = NULL;
2601         }
2602         if (sli_buf_copy) {
2603                 kmem_free(sli_buf_copy, sli_buf_sz + 1);
2604                 sli_buf_copy = NULL;
2605         }
2606 
2607         if (standby) {
2608                 *err_ret = SBD_RET_ACCESS_STATE_FAILED;
2609                 sl->sl_trans_op = SL_OP_NONE;
2610                 return (EIO);
2611         } else {
2612                 return (sbd_close_delete_lu(sl, ret));
2613         }
2614 }
2615 
2616 int
2617 sbd_modify_lu(sbd_modify_lu_t *mlu, int struct_sz, uint32_t *err_ret)
2618 {
2619         sbd_lu_t *sl = NULL;
2620         uint16_t alias_sz;
2621         int ret = 0;
2622         sbd_it_data_t *it;
2623         sbd_status_t sret;
2624         uint64_t old_size;
2625         int modify_unregistered = 0;
2626         int ua = 0;
2627         sbd_import_lu_t *ilu;
2628         stmf_lu_t *lu;
2629         uint32_t ilu_sz;
2630         uint32_t sz;
2631 
2632         sz = struct_sz - sizeof (*mlu) + 8 + 1;
2633 
2634         /* if there is data in the buf, null terminate it */
2635         if (struct_sz > sizeof (*mlu)) {
2636                 mlu->mlu_buf[struct_sz - sizeof (*mlu) + 8 - 1] = 0;
2637         }
2638 
2639         *err_ret = 0;
2640 
2641         /* Lets validate offsets */
2642         if (((mlu->mlu_alias_valid) &&
2643             (mlu->mlu_alias_off >= sz)) ||
2644             ((mlu->mlu_mgmt_url_valid) &&
2645             (mlu->mlu_mgmt_url_off >= sz)) ||
2646             (mlu->mlu_by_fname) &&
2647             (mlu->mlu_fname_off >= sz)) {
2648                 return (EINVAL);
2649         }
2650 
2651         /*
2652          * We'll look for the device but if we don't find it registered,
2653          * we'll still try to modify the unregistered device.
2654          */
2655         if (mlu->mlu_by_guid) {
2656                 sret = sbd_find_and_lock_lu(mlu->mlu_input_guid, NULL,
2657                     SL_OP_MODIFY_LU, &sl);
2658         } else if (mlu->mlu_by_fname) {
2659                 sret = sbd_find_and_lock_lu(NULL,
2660                     (uint8_t *)&(mlu->mlu_buf[mlu->mlu_fname_off]),
2661                     SL_OP_MODIFY_LU, &sl);
2662         } else {
2663                 return (EINVAL);
2664         }
2665 
2666 
2667         if (sret != SBD_SUCCESS) {
2668                 if (sret == SBD_BUSY) {
2669                         *err_ret = SBD_RET_LU_BUSY;
2670                         return (EBUSY);
2671                 } else if (sret != SBD_NOT_FOUND) {
2672                         return (EIO);
2673                 } else if (!mlu->mlu_by_fname) {
2674                         return (EINVAL);
2675                 }
2676                 /* Okay, try to import the device */
2677                 struct_sz = max(8, strlen(&(mlu->mlu_buf[mlu->mlu_fname_off]))
2678                     + 1);
2679                 struct_sz += sizeof (sbd_import_lu_t) - 8;
2680                 ilu_sz = struct_sz;
2681                 ilu = (sbd_import_lu_t *)kmem_zalloc(ilu_sz, KM_SLEEP);
2682                 ilu->ilu_struct_size = struct_sz;
2683                 (void) strcpy(ilu->ilu_meta_fname,
2684                     &(mlu->mlu_buf[mlu->mlu_fname_off]));
2685                 ret = sbd_import_lu(ilu, struct_sz, err_ret, 1, &sl);
2686                 kmem_free(ilu, ilu_sz);
2687                 if (ret != SBD_SUCCESS) {
2688                         return (ENOENT);
2689                 }
2690                 modify_unregistered = 1;
2691         }
2692 
2693         if (sl->sl_access_state != SBD_LU_ACTIVE) {
2694                 *err_ret = SBD_RET_ACCESS_STATE_FAILED;
2695                 ret = EINVAL;
2696                 goto smm_err_out;
2697         }
2698 
2699         /* check for write cache change */
2700         if (mlu->mlu_writeback_cache_disable_valid) {
2701                 /* set wce on device */
2702                 sret = sbd_wcd_set(mlu->mlu_writeback_cache_disable, sl);
2703                 if (!mlu->mlu_writeback_cache_disable && sret != SBD_SUCCESS) {
2704                         *err_ret = SBD_RET_WRITE_CACHE_SET_FAILED;
2705                         ret = EFAULT;
2706                         goto smm_err_out;
2707                 }
2708                 mutex_enter(&sl->sl_lock);
2709                 if (!mlu->mlu_writeback_cache_disable) {
2710                         if (sl->sl_flags & SL_WRITEBACK_CACHE_DISABLE) {
2711                                 ua = 1;
2712                                 sl->sl_flags &= ~SL_WRITEBACK_CACHE_DISABLE;
2713                                 sl->sl_flags &= ~SL_SAVED_WRITE_CACHE_DISABLE;
2714                         }
2715                 } else {
2716                         if ((sl->sl_flags & SL_WRITEBACK_CACHE_DISABLE) == 0) {
2717                                 ua = 1;
2718                                 sl->sl_flags |= SL_WRITEBACK_CACHE_DISABLE;
2719                                 sl->sl_flags |= SL_SAVED_WRITE_CACHE_DISABLE;
2720                         }
2721                 }
2722                 for (it = sl->sl_it_list; ua && it != NULL;
2723                     it = it->sbd_it_next) {
2724                         it->sbd_it_ua_conditions |=
2725                             SBD_UA_MODE_PARAMETERS_CHANGED;
2726                 }
2727                 mutex_exit(&sl->sl_lock);
2728         }
2729         ua = 0;
2730 
2731         if (mlu->mlu_alias_valid) {
2732                 alias_sz = strlen((char *)mlu->mlu_buf +
2733                     mlu->mlu_alias_off) + 1;
2734                 /*
2735                  * Use the allocated buffer or alloc a new one.
2736                  * Don't copy into sl_alias if sl_alias_alloc_size is 0
2737                  * otherwise or you'll be writing over the data/metadata
2738                  * filename.
2739                  */
2740                 mutex_enter(&sl->sl_lock);
2741                 if (sl->sl_alias_alloc_size > 0 &&
2742                     sl->sl_alias_alloc_size < alias_sz) {
2743                         kmem_free(sl->sl_alias,
2744                             sl->sl_alias_alloc_size);
2745                         sl->sl_alias_alloc_size = 0;
2746                 }
2747                 if (sl->sl_alias_alloc_size == 0) {
2748                         sl->sl_alias = kmem_alloc(alias_sz, KM_SLEEP);
2749                         sl->sl_alias_alloc_size = alias_sz;
2750                 }
2751                 (void) strcpy(sl->sl_alias, (char *)mlu->mlu_buf +
2752                     mlu->mlu_alias_off);
2753                 lu = sl->sl_lu;
2754                 lu->lu_alias = sl->sl_alias;
2755                 mutex_exit(&sl->sl_lock);
2756         }
2757 
2758         if (mlu->mlu_mgmt_url_valid) {
2759                 uint16_t url_sz;
2760 
2761                 url_sz = strlen((char *)mlu->mlu_buf + mlu->mlu_mgmt_url_off);
2762                 if (url_sz > 0)
2763                         url_sz++;
2764 
2765                 mutex_enter(&sl->sl_lock);
2766                 if (sl->sl_mgmt_url_alloc_size > 0 &&
2767                     (url_sz == 0 || sl->sl_mgmt_url_alloc_size < url_sz)) {
2768                         kmem_free(sl->sl_mgmt_url, sl->sl_mgmt_url_alloc_size);
2769                         sl->sl_mgmt_url = NULL;
2770                         sl->sl_mgmt_url_alloc_size = 0;
2771                 }
2772                 if (url_sz > 0) {
2773                         if (sl->sl_mgmt_url_alloc_size == 0) {
2774                                 sl->sl_mgmt_url = kmem_alloc(url_sz, KM_SLEEP);
2775                                 sl->sl_mgmt_url_alloc_size = url_sz;
2776                         }
2777                         (void) strcpy(sl->sl_mgmt_url, (char *)mlu->mlu_buf +
2778                             mlu->mlu_mgmt_url_off);
2779                 }
2780                 for (it = sl->sl_it_list; it != NULL;
2781                     it = it->sbd_it_next) {
2782                         it->sbd_it_ua_conditions |=
2783                             SBD_UA_MODE_PARAMETERS_CHANGED;
2784                 }
2785                 mutex_exit(&sl->sl_lock);
2786         }
2787 
2788         if (mlu->mlu_write_protected_valid) {
2789                 mutex_enter(&sl->sl_lock);
2790                 if (mlu->mlu_write_protected) {
2791                         if ((sl->sl_flags & SL_WRITE_PROTECTED) == 0) {
2792                                 ua = 1;
2793                                 sl->sl_flags |= SL_WRITE_PROTECTED;
2794                         }
2795                 } else {
2796                         if (sl->sl_flags & SL_WRITE_PROTECTED) {
2797                                 ua = 1;
2798                                 sl->sl_flags &= ~SL_WRITE_PROTECTED;
2799                         }
2800                 }
2801                 for (it = sl->sl_it_list; ua && it != NULL;
2802                     it = it->sbd_it_next) {
2803                         it->sbd_it_ua_conditions |=
2804                             SBD_UA_MODE_PARAMETERS_CHANGED;
2805                 }
2806                 mutex_exit(&sl->sl_lock);
2807         }
2808 
2809         if (mlu->mlu_lu_size_valid) {
2810                 /*
2811                  * validate lu size and set
2812                  * For open file only (registered lu)
2813                  */
2814                 mutex_enter(&sl->sl_lock);
2815                 old_size = sl->sl_lu_size;
2816                 sl->sl_lu_size = mlu->mlu_lu_size;
2817                 mutex_exit(&sl->sl_lock);
2818                 ret = sbd_open_data_file(sl, err_ret, 1, 1, 1);
2819                 if (ret) {
2820                         mutex_enter(&sl->sl_lock);
2821                         sl->sl_lu_size = old_size;
2822                         mutex_exit(&sl->sl_lock);
2823                         goto smm_err_out;
2824                 }
2825                 if (old_size != mlu->mlu_lu_size) {
2826                         mutex_enter(&sl->sl_lock);
2827                         for (it = sl->sl_it_list; it != NULL;
2828                             it = it->sbd_it_next) {
2829                                 it->sbd_it_ua_conditions |=
2830                                     SBD_UA_CAPACITY_CHANGED;
2831                         }
2832                         mutex_exit(&sl->sl_lock);
2833                 }
2834         }
2835 
2836         if (sbd_write_lu_info(sl) != SBD_SUCCESS) {
2837                 *err_ret = SBD_RET_META_CREATION_FAILED;
2838                 ret = EIO;
2839         }
2840 
2841 smm_err_out:
2842         if (modify_unregistered) {
2843                 (void) sbd_close_delete_lu(sl, 0);
2844         } else {
2845                 sl->sl_trans_op = SL_OP_NONE;
2846         }
2847         return (ret);
2848 }
2849 
2850 int
2851 sbd_set_global_props(sbd_global_props_t *mlu, int struct_sz,
2852     uint32_t *err_ret)
2853 {
2854         sbd_lu_t *sl = NULL;
2855         int ret = 0;
2856         sbd_it_data_t *it;
2857         uint32_t sz;
2858 
2859         sz = struct_sz - sizeof (*mlu) + 8 + 1;
2860 
2861         /* if there is data in the buf, null terminate it */
2862         if (struct_sz > sizeof (*mlu)) {
2863                 mlu->mlu_buf[struct_sz - sizeof (*mlu) + 8 - 1] = 0;
2864         }
2865 
2866         *err_ret = 0;
2867 
2868         /* Lets validate offsets */
2869         if (((mlu->mlu_mgmt_url_valid) &&
2870             (mlu->mlu_mgmt_url_off >= sz))) {
2871                 return (EINVAL);
2872         }
2873 
2874         if (mlu->mlu_mgmt_url_valid) {
2875                 uint16_t url_sz;
2876 
2877                 url_sz = strlen((char *)mlu->mlu_buf + mlu->mlu_mgmt_url_off);
2878                 if (url_sz > 0)
2879                         url_sz++;
2880 
2881                 rw_enter(&sbd_global_prop_lock, RW_WRITER);
2882                 if (sbd_mgmt_url_alloc_size > 0 &&
2883                     (url_sz == 0 || sbd_mgmt_url_alloc_size < url_sz)) {
2884                         kmem_free(sbd_mgmt_url, sbd_mgmt_url_alloc_size);
2885                         sbd_mgmt_url = NULL;
2886                         sbd_mgmt_url_alloc_size = 0;
2887                 }
2888                 if (url_sz > 0) {
2889                         if (sbd_mgmt_url_alloc_size == 0) {
2890                                 sbd_mgmt_url = kmem_alloc(url_sz, KM_SLEEP);
2891                                 sbd_mgmt_url_alloc_size = url_sz;
2892                         }
2893                         (void) strcpy(sbd_mgmt_url, (char *)mlu->mlu_buf +
2894                             mlu->mlu_mgmt_url_off);
2895                 }
2896                 /*
2897                  * check each lu to determine whether a UA is needed.
2898                  */
2899                 mutex_enter(&sbd_lock);
2900                 for (sl = sbd_lu_list; sl; sl = sl->sl_next) {
2901                         if (sl->sl_mgmt_url) {
2902                                 continue;
2903                         }
2904                         mutex_enter(&sl->sl_lock);
2905                         for (it = sl->sl_it_list; it != NULL;
2906                             it = it->sbd_it_next) {
2907                                 it->sbd_it_ua_conditions |=
2908                                     SBD_UA_MODE_PARAMETERS_CHANGED;
2909                         }
2910                         mutex_exit(&sl->sl_lock);
2911                 }
2912                 mutex_exit(&sbd_lock);
2913                 rw_exit(&sbd_global_prop_lock);
2914         }
2915         return (ret);
2916 }
2917 
2918 /* ARGSUSED */
2919 int
2920 sbd_delete_locked_lu(sbd_lu_t *sl, uint32_t *err_ret,
2921     stmf_state_change_info_t *ssi)
2922 {
2923         int i;
2924         stmf_status_t ret;
2925 
2926         if ((sl->sl_state == STMF_STATE_OFFLINE) &&
2927             !sl->sl_state_not_acked) {
2928                 goto sdl_do_dereg;
2929         }
2930 
2931         if ((sl->sl_state != STMF_STATE_ONLINE) ||
2932             sl->sl_state_not_acked) {
2933                 return (EBUSY);
2934         }
2935 
2936         ret = stmf_ctl(STMF_CMD_LU_OFFLINE, sl->sl_lu, ssi);
2937         if ((ret != STMF_SUCCESS) && (ret != STMF_ALREADY)) {
2938                 return (EBUSY);
2939         }
2940 
2941         for (i = 0; i < 500; i++) {
2942                 if ((sl->sl_state == STMF_STATE_OFFLINE) &&
2943                     !sl->sl_state_not_acked) {
2944                         goto sdl_do_dereg;
2945                 }
2946                 delay(drv_usectohz(10000));
2947         }
2948         return (EBUSY);
2949 
2950 sdl_do_dereg:;
2951         if (stmf_deregister_lu(sl->sl_lu) != STMF_SUCCESS)
2952                 return (EBUSY);
2953         atomic_dec_32(&sbd_lu_count);
2954 
2955         return (sbd_close_delete_lu(sl, 0));
2956 }
2957 
2958 int
2959 sbd_delete_lu(sbd_delete_lu_t *dlu, int struct_sz, uint32_t *err_ret)
2960 {
2961         sbd_lu_t *sl;
2962         sbd_status_t sret;
2963         stmf_state_change_info_t ssi;
2964         int ret;
2965 
2966         if (dlu->dlu_by_meta_name) {
2967                 ((char *)dlu)[struct_sz - 1] = 0;
2968                 sret = sbd_find_and_lock_lu(NULL, dlu->dlu_meta_name,
2969                     SL_OP_DELETE_LU, &sl);
2970         } else {
2971                 sret = sbd_find_and_lock_lu(dlu->dlu_guid, NULL,
2972                     SL_OP_DELETE_LU, &sl);
2973         }
2974         if (sret != SBD_SUCCESS) {
2975                 if (sret == SBD_BUSY) {
2976                         *err_ret = SBD_RET_LU_BUSY;
2977                         return (EBUSY);
2978                 } else if (sret == SBD_NOT_FOUND) {
2979                         *err_ret = SBD_RET_NOT_FOUND;
2980                         return (ENOENT);
2981                 }
2982                 return (EIO);
2983         }
2984 
2985         ssi.st_rflags = STMF_RFLAG_USER_REQUEST;
2986         ssi.st_additional_info = "sbd_delete_lu call (ioctl)";
2987         ret = sbd_delete_locked_lu(sl, err_ret, &ssi);
2988 
2989         if (ret) {
2990                 /* Once its locked, no need to grab mutex again */
2991                 sl->sl_trans_op = SL_OP_NONE;
2992         }
2993         return (ret);
2994 }
2995 
2996 sbd_status_t
2997 sbd_data_read(sbd_lu_t *sl, struct scsi_task *task,
2998     uint64_t offset, uint64_t size, uint8_t *buf)
2999 {
3000         int ret;
3001         long resid;
3002 
3003         if ((offset + size) > sl->sl_lu_size) {
3004                 return (SBD_IO_PAST_EOF);
3005         }
3006 
3007         offset += sl->sl_data_offset;
3008 
3009         if ((offset + size) > sl->sl_data_readable_size) {
3010                 uint64_t store_end;
3011                 if (offset > sl->sl_data_readable_size) {
3012                         bzero(buf, size);
3013                         return (SBD_SUCCESS);
3014                 }
3015                 store_end = sl->sl_data_readable_size - offset;
3016                 bzero(buf + store_end, size - store_end);
3017                 size = store_end;
3018         }
3019 
3020         DTRACE_PROBE5(backing__store__read__start, sbd_lu_t *, sl,
3021             uint8_t *, buf, uint64_t, size, uint64_t, offset,
3022             scsi_task_t *, task);
3023 
3024         /*
3025          * Don't proceed if the device has been closed
3026          * This can occur on an access state change to standby or
3027          * a delete. The writer lock is acquired before closing the
3028          * lu.
3029          */
3030         rw_enter(&sl->sl_access_state_lock, RW_READER);
3031         if ((sl->sl_flags & SL_MEDIA_LOADED) == 0) {
3032                 rw_exit(&sl->sl_access_state_lock);
3033                 return (SBD_FAILURE);
3034         }
3035         ret = vn_rdwr(UIO_READ, sl->sl_data_vp, (caddr_t)buf, (ssize_t)size,
3036             (offset_t)offset, UIO_SYSSPACE, 0, RLIM64_INFINITY, CRED(),
3037             &resid);
3038         rw_exit(&sl->sl_access_state_lock);
3039 
3040         DTRACE_PROBE6(backing__store__read__end, sbd_lu_t *, sl,
3041             uint8_t *, buf, uint64_t, size, uint64_t, offset,
3042             int, ret, scsi_task_t *, task);
3043 
3044 over_sl_data_read:
3045         if (ret || resid) {
3046                 stmf_trace(0, "UIO_READ failed, ret = %d, resid = %d", ret,
3047                     resid);
3048                 return (SBD_FAILURE);
3049         }
3050 
3051         return (SBD_SUCCESS);
3052 }
3053 
3054 sbd_status_t
3055 sbd_data_write(sbd_lu_t *sl, struct scsi_task *task,
3056     uint64_t offset, uint64_t size, uint8_t *buf)
3057 {
3058         int ret;
3059         long resid;
3060         sbd_status_t sret = SBD_SUCCESS;
3061         int ioflag;
3062 
3063         if ((offset + size) > sl->sl_lu_size) {
3064                 return (SBD_IO_PAST_EOF);
3065         }
3066 
3067         offset += sl->sl_data_offset;
3068 
3069         if ((sl->sl_flags & SL_WRITEBACK_CACHE_DISABLE) &&
3070             (sl->sl_flags & SL_FLUSH_ON_DISABLED_WRITECACHE)) {
3071                 ioflag = FSYNC;
3072         } else {
3073                 ioflag = 0;
3074         }
3075 
3076         DTRACE_PROBE5(backing__store__write__start, sbd_lu_t *, sl,
3077             uint8_t *, buf, uint64_t, size, uint64_t, offset,
3078             scsi_task_t *, task);
3079 
3080         /*
3081          * Don't proceed if the device has been closed
3082          * This can occur on an access state change to standby or
3083          * a delete. The writer lock is acquired before closing the
3084          * lu.
3085          */
3086         rw_enter(&sl->sl_access_state_lock, RW_READER);
3087         if ((sl->sl_flags & SL_MEDIA_LOADED) == 0) {
3088                 rw_exit(&sl->sl_access_state_lock);
3089                 return (SBD_FAILURE);
3090         }
3091         ret = vn_rdwr(UIO_WRITE, sl->sl_data_vp, (caddr_t)buf, (ssize_t)size,
3092             (offset_t)offset, UIO_SYSSPACE, ioflag, RLIM64_INFINITY, CRED(),
3093             &resid);
3094         rw_exit(&sl->sl_access_state_lock);
3095 
3096         DTRACE_PROBE6(backing__store__write__end, sbd_lu_t *, sl,
3097             uint8_t *, buf, uint64_t, size, uint64_t, offset,
3098             int, ret, scsi_task_t *, task);
3099 
3100         if ((ret == 0) && (resid == 0) &&
3101             (sl->sl_flags & SL_WRITEBACK_CACHE_DISABLE) &&
3102             (sl->sl_flags & SL_FLUSH_ON_DISABLED_WRITECACHE)) {
3103                 sret = sbd_flush_data_cache(sl, 1);
3104         }
3105 over_sl_data_write:
3106 
3107         if ((ret || resid) || (sret != SBD_SUCCESS)) {
3108                 return (SBD_FAILURE);
3109         } else if ((offset + size) > sl->sl_data_readable_size) {
3110                 uint64_t old_size, new_size;
3111 
3112                 do {
3113                         old_size = sl->sl_data_readable_size;
3114                         if ((offset + size) <= old_size)
3115                                 break;
3116                         new_size = offset + size;
3117                 } while (atomic_cas_64(&sl->sl_data_readable_size, old_size,
3118                     new_size) != old_size);
3119         }
3120 
3121         return (SBD_SUCCESS);
3122 }
3123 
3124 int
3125 sbd_get_global_props(sbd_global_props_t *oslp, uint32_t oslp_sz,
3126     uint32_t *err_ret)
3127 {
3128         uint32_t sz = 0;
3129         uint16_t off;
3130 
3131         rw_enter(&sbd_global_prop_lock, RW_READER);
3132         if (sbd_mgmt_url) {
3133                 sz += strlen(sbd_mgmt_url) + 1;
3134         }
3135         bzero(oslp, sizeof (*oslp) - 8);
3136         oslp->mlu_buf_size_needed = sz;
3137 
3138         if (sz > (oslp_sz - sizeof (*oslp) + 8)) {
3139                 *err_ret = SBD_RET_INSUFFICIENT_BUF_SPACE;
3140                 rw_exit(&sbd_global_prop_lock);
3141                 return (ENOMEM);
3142         }
3143 
3144         off = 0;
3145         if (sbd_mgmt_url) {
3146                 oslp->mlu_mgmt_url_valid = 1;
3147                 oslp->mlu_mgmt_url_off = off;
3148                 (void) strcpy((char *)&oslp->mlu_buf[off], sbd_mgmt_url);
3149                 off += strlen(sbd_mgmt_url) + 1;
3150         }
3151 
3152         rw_exit(&sbd_global_prop_lock);
3153         return (0);
3154 }
3155 
3156 static int
3157 sbd_get_unmap_props(sbd_unmap_props_t *sup,
3158     sbd_unmap_props_t *osup, uint32_t *err_ret)
3159 {
3160         sbd_status_t sret;
3161         sbd_lu_t *sl = NULL;
3162 
3163         if (sup->sup_guid_valid) {
3164                 sret = sbd_find_and_lock_lu(sup->sup_guid,
3165                     NULL, SL_OP_LU_PROPS, &sl);
3166         } else {
3167                 sret = sbd_find_and_lock_lu(NULL,
3168                     (uint8_t *)sup->sup_zvol_path, SL_OP_LU_PROPS,
3169                     &sl);
3170         }
3171         if (sret != SBD_SUCCESS) {
3172                 if (sret == SBD_BUSY) {
3173                         *err_ret = SBD_RET_LU_BUSY;
3174                         return (EBUSY);
3175                 } else if (sret == SBD_NOT_FOUND) {
3176                         *err_ret = SBD_RET_NOT_FOUND;
3177                         return (ENOENT);
3178                 }
3179                 return (EIO);
3180         }
3181 
3182         sup->sup_found_lu = 1;
3183         sup->sup_guid_valid = 1;
3184         bcopy(sl->sl_device_id + 4, sup->sup_guid, 16);
3185         if (sl->sl_flags & SL_UNMAP_ENABLED)
3186                 sup->sup_unmap_enabled = 1;
3187         else
3188                 sup->sup_unmap_enabled = 0;
3189 
3190         *osup = *sup;
3191         sl->sl_trans_op = SL_OP_NONE;
3192 
3193         return (0);
3194 }
3195 
3196 int
3197 sbd_get_lu_props(sbd_lu_props_t *islp, uint32_t islp_sz,
3198     sbd_lu_props_t *oslp, uint32_t oslp_sz, uint32_t *err_ret)
3199 {
3200         sbd_status_t sret;
3201         sbd_lu_t *sl = NULL;
3202         uint32_t sz;
3203         uint16_t off;
3204 
3205         if (islp->slp_input_guid) {
3206                 sret = sbd_find_and_lock_lu(islp->slp_guid, NULL,
3207                     SL_OP_LU_PROPS, &sl);
3208         } else {
3209                 ((char *)islp)[islp_sz - 1] = 0;
3210                 sret = sbd_find_and_lock_lu(NULL, islp->slp_buf,
3211                     SL_OP_LU_PROPS, &sl);
3212         }
3213         if (sret != SBD_SUCCESS) {
3214                 if (sret == SBD_BUSY) {
3215                         *err_ret = SBD_RET_LU_BUSY;
3216                         return (EBUSY);
3217                 } else if (sret == SBD_NOT_FOUND) {
3218                         *err_ret = SBD_RET_NOT_FOUND;
3219                         return (ENOENT);
3220                 }
3221                 return (EIO);
3222         }
3223 
3224         sz = strlen(sl->sl_name) + 1;
3225         if ((sl->sl_flags & (SL_ZFS_META | SL_SHARED_META)) == 0) {
3226                 if (sl->sl_data_filename) {
3227                         sz += strlen(sl->sl_data_filename) + 1;
3228                 }
3229         }
3230         sz += sl->sl_serial_no_size;
3231         if (sl->sl_alias) {
3232                 sz += strlen(sl->sl_alias) + 1;
3233         }
3234 
3235         rw_enter(&sbd_global_prop_lock, RW_READER);
3236         if (sl->sl_mgmt_url) {
3237                 sz += strlen(sl->sl_mgmt_url) + 1;
3238         } else if (sbd_mgmt_url) {
3239                 sz += strlen(sbd_mgmt_url) + 1;
3240         }
3241         bzero(oslp, sizeof (*oslp) - 8);
3242         oslp->slp_buf_size_needed = sz;
3243 
3244         if (sz > (oslp_sz - sizeof (*oslp) + 8)) {
3245                 sl->sl_trans_op = SL_OP_NONE;
3246                 *err_ret = SBD_RET_INSUFFICIENT_BUF_SPACE;
3247                 rw_exit(&sbd_global_prop_lock);
3248                 return (ENOMEM);
3249         }
3250 
3251         off = 0;
3252         (void) strcpy((char *)oslp->slp_buf, sl->sl_name);
3253         oslp->slp_meta_fname_off = off;
3254         off += strlen(sl->sl_name) + 1;
3255         if ((sl->sl_flags & (SL_ZFS_META | SL_SHARED_META)) == 0) {
3256                 oslp->slp_meta_fname_valid = 1;
3257                 oslp->slp_separate_meta = 1;
3258                 if (sl->sl_data_filename) {
3259                         oslp->slp_data_fname_valid = 1;
3260                         oslp->slp_data_fname_off = off;
3261                         (void) strcpy((char *)&oslp->slp_buf[off],
3262                             sl->sl_data_filename);
3263                         off += strlen(sl->sl_data_filename) + 1;
3264                 }
3265         } else {
3266                 oslp->slp_data_fname_valid = 1;
3267                 oslp->slp_data_fname_off = oslp->slp_meta_fname_off;
3268                 if (sl->sl_flags & SL_ZFS_META) {
3269                         oslp->slp_zfs_meta = 1;
3270                 }
3271         }
3272         if (sl->sl_alias) {
3273                 oslp->slp_alias_valid = 1;
3274                 oslp->slp_alias_off = off;
3275                 (void) strcpy((char *)&oslp->slp_buf[off], sl->sl_alias);
3276                 off += strlen(sl->sl_alias) + 1;
3277         }
3278         if (sl->sl_mgmt_url) {
3279                 oslp->slp_mgmt_url_valid = 1;
3280                 oslp->slp_mgmt_url_off = off;
3281                 (void) strcpy((char *)&oslp->slp_buf[off], sl->sl_mgmt_url);
3282                 off += strlen(sl->sl_mgmt_url) + 1;
3283         } else if (sbd_mgmt_url) {
3284                 oslp->slp_mgmt_url_valid = 1;
3285                 oslp->slp_mgmt_url_off = off;
3286                 (void) strcpy((char *)&oslp->slp_buf[off], sbd_mgmt_url);
3287                 off += strlen(sbd_mgmt_url) + 1;
3288         }
3289         if (sl->sl_serial_no_size) {
3290                 oslp->slp_serial_off = off;
3291                 bcopy(sl->sl_serial_no, &oslp->slp_buf[off],
3292                     sl->sl_serial_no_size);
3293                 oslp->slp_serial_size = sl->sl_serial_no_size;
3294                 oslp->slp_serial_valid = 1;
3295                 off += sl->sl_serial_no_size;
3296         }
3297 
3298         oslp->slp_lu_size = sl->sl_lu_size;
3299         oslp->slp_blksize = ((uint16_t)1) << sl->sl_data_blocksize_shift;
3300 
3301         oslp->slp_access_state = sl->sl_access_state;
3302 
3303         if (sl->sl_flags & SL_VID_VALID) {
3304                 oslp->slp_lu_vid = 1;
3305                 bcopy(sl->sl_vendor_id, oslp->slp_vid, 8);
3306         } else {
3307                 bcopy(sbd_vendor_id, oslp->slp_vid, 8);
3308         }
3309         if (sl->sl_flags & SL_PID_VALID) {
3310                 oslp->slp_lu_pid = 1;
3311                 bcopy(sl->sl_product_id, oslp->slp_pid, 16);
3312         } else {
3313                 bcopy(sbd_product_id, oslp->slp_pid, 16);
3314         }
3315         if (sl->sl_flags & SL_REV_VALID) {
3316                 oslp->slp_lu_rev = 1;
3317                 bcopy(sl->sl_revision, oslp->slp_rev, 4);
3318         } else {
3319                 bcopy(sbd_revision, oslp->slp_rev, 4);
3320         }
3321         bcopy(sl->sl_device_id + 4, oslp->slp_guid, 16);
3322 
3323         if (sl->sl_flags & SL_WRITEBACK_CACHE_DISABLE)
3324                 oslp->slp_writeback_cache_disable_cur = 1;
3325         if (sl->sl_flags & SL_SAVED_WRITE_CACHE_DISABLE)
3326                 oslp->slp_writeback_cache_disable_saved = 1;
3327         if (sl->sl_flags & SL_WRITE_PROTECTED)
3328                 oslp->slp_write_protected = 1;
3329 
3330         sl->sl_trans_op = SL_OP_NONE;
3331 
3332         rw_exit(&sbd_global_prop_lock);
3333         return (0);
3334 }
3335 
3336 /*
3337  * Returns an allocated string with the "<pool>/..." form of the zvol name.
3338  */
3339 static char *
3340 sbd_get_zvol_name(sbd_lu_t *sl)
3341 {
3342         char *src;
3343         char *p;
3344 
3345         if (sl->sl_data_filename)
3346                 src = sl->sl_data_filename;
3347         else
3348                 src = sl->sl_meta_filename;
3349         /* There has to be a better way */
3350         if (SBD_IS_ZVOL(src) != 0) {
3351                 ASSERT(0);
3352         }
3353         src += 14;      /* Past /dev/zvol/dsk/ */
3354         if (*src == '/')
3355                 src++;  /* or /dev/zvol/rdsk/ */
3356         p = (char *)kmem_alloc(strlen(src) + 1, KM_SLEEP);
3357         (void) strcpy(p, src);
3358         return (p);
3359 }
3360 
3361 /*
3362  * this function creates a local metadata zvol property
3363  */
3364 sbd_status_t
3365 sbd_create_zfs_meta_object(sbd_lu_t *sl)
3366 {
3367         /*
3368          * -allocate 1/2 the property size, the zfs property
3369          *  is 8k in size and stored as ascii hex string, all
3370          *  we needed is 4k buffer to store the binary data.
3371          * -initialize reader/write lock
3372          */
3373         if ((sl->sl_zfs_meta = kmem_zalloc(ZAP_MAXVALUELEN / 2, KM_SLEEP))
3374             == NULL)
3375                 return (SBD_FAILURE);
3376         rw_init(&sl->sl_zfs_meta_lock, NULL, RW_DRIVER, NULL);
3377         return (SBD_SUCCESS);
3378 }
3379 
3380 char
3381 sbd_ctoi(char c)
3382 {
3383         if ((c >= '0') && (c <= '9'))
3384                 c -= '0';
3385         else if ((c >= 'A') && (c <= 'F'))
3386                 c = c - 'A' + 10;
3387         else if ((c >= 'a') && (c <= 'f'))
3388                 c = c - 'a' + 10;
3389         else
3390                 c = -1;
3391         return (c);
3392 }
3393 
3394 /*
3395  * read zvol property and convert to binary
3396  */
3397 sbd_status_t
3398 sbd_open_zfs_meta(sbd_lu_t *sl)
3399 {
3400         char            *meta = NULL, cl, ch;
3401         int             i;
3402         char            *tmp, *ptr;
3403         uint64_t        rc = SBD_SUCCESS;
3404         int             len;
3405         char            *file;
3406 
3407         if (sl->sl_zfs_meta == NULL) {
3408                 if (sbd_create_zfs_meta_object(sl) == SBD_FAILURE)
3409                         return (SBD_FAILURE);
3410         } else {
3411                 bzero(sl->sl_zfs_meta, (ZAP_MAXVALUELEN / 2));
3412         }
3413 
3414         rw_enter(&sl->sl_zfs_meta_lock, RW_WRITER);
3415         file = sbd_get_zvol_name(sl);
3416         if (sbd_zvolget(file, &meta)) {
3417                 rc = SBD_FAILURE;
3418                 goto done;
3419         }
3420         tmp = meta;
3421         /* convert ascii hex to binary meta */
3422         len = strlen(meta);
3423         ptr = sl->sl_zfs_meta;
3424         for (i = 0; i < len; i += 2) {
3425                 ch = sbd_ctoi(*tmp++);
3426                 cl = sbd_ctoi(*tmp++);
3427                 if (ch == -1 || cl == -1) {
3428                         rc = SBD_FAILURE;
3429                         break;
3430                 }
3431                 *ptr++ = (ch << 4) + cl;
3432         }
3433 done:
3434         rw_exit(&sl->sl_zfs_meta_lock);
3435         if (meta)
3436                 kmem_free(meta, len + 1);
3437         kmem_free(file, strlen(file) + 1);
3438         return (rc);
3439 }
3440 
3441 sbd_status_t
3442 sbd_read_zfs_meta(sbd_lu_t *sl, uint8_t *buf, uint64_t sz, uint64_t off)
3443 {
3444         ASSERT(sl->sl_zfs_meta);
3445         rw_enter(&sl->sl_zfs_meta_lock, RW_READER);
3446         bcopy(&sl->sl_zfs_meta[off], buf, sz);
3447         rw_exit(&sl->sl_zfs_meta_lock);
3448         return (SBD_SUCCESS);
3449 }
3450 
3451 sbd_status_t
3452 sbd_write_zfs_meta(sbd_lu_t *sl, uint8_t *buf, uint64_t sz, uint64_t off)
3453 {
3454         ASSERT(sl->sl_zfs_meta);
3455         if ((off + sz) > (ZAP_MAXVALUELEN / 2 - 1)) {
3456                 return (SBD_META_CORRUPTED);
3457         }
3458         if ((off + sz) > sl->sl_meta_size_used) {
3459                 sl->sl_meta_size_used = off + sz;
3460                 if (sl->sl_total_meta_size < sl->sl_meta_size_used) {
3461                         uint64_t meta_align =
3462                             (((uint64_t)1) << sl->sl_meta_blocksize_shift) - 1;
3463                         sl->sl_total_meta_size = (sl->sl_meta_size_used +
3464                             meta_align) & (~meta_align);
3465                 }
3466         }
3467         rw_enter(&sl->sl_zfs_meta_lock, RW_WRITER);
3468         bcopy(buf, &sl->sl_zfs_meta[off], sz);
3469         rw_exit(&sl->sl_zfs_meta_lock);
3470         /*
3471          * During creation of a logical unit, sbd_update_zfs_prop will be
3472          * called separately to avoid multiple calls as each meta section
3473          * create/update will result in a call to sbd_write_zfs_meta().
3474          * We only need to update the zvol once during create.
3475          */
3476         mutex_enter(&sl->sl_lock);
3477         if (sl->sl_trans_op != SL_OP_CREATE_REGISTER_LU) {
3478                 mutex_exit(&sl->sl_lock);
3479                 return (sbd_update_zfs_prop(sl));
3480         }
3481         mutex_exit(&sl->sl_lock);
3482         return (SBD_SUCCESS);
3483 }
3484 
3485 sbd_status_t
3486 sbd_update_zfs_prop(sbd_lu_t *sl)
3487 {
3488         char    *ptr, *ah_meta;
3489         char    *dp = NULL;
3490         int     i, num;
3491         char    *file;
3492         sbd_status_t ret = SBD_SUCCESS;
3493 
3494         ASSERT(sl->sl_zfs_meta);
3495         ptr = ah_meta = kmem_zalloc(ZAP_MAXVALUELEN, KM_SLEEP);
3496         rw_enter(&sl->sl_zfs_meta_lock, RW_READER);
3497         /* convert local copy to ascii hex */
3498         dp = sl->sl_zfs_meta;
3499         for (i = 0; i < sl->sl_total_meta_size; i++, dp++) {
3500                 num = ((*dp) >> 4) & 0xF;
3501                 *ah_meta++ = (num < 10) ? (num + '0') : (num + ('a' - 10));
3502                 num = (*dp) & 0xF;
3503                 *ah_meta++ = (num < 10) ? (num + '0') : (num + ('a' - 10));
3504         }
3505         *ah_meta = NULL;
3506         file = sbd_get_zvol_name(sl);
3507         if (sbd_zvolset(file, (char *)ptr)) {
3508                 ret = SBD_META_CORRUPTED;
3509         }
3510         rw_exit(&sl->sl_zfs_meta_lock);
3511         kmem_free(ptr, ZAP_MAXVALUELEN);
3512         kmem_free(file, strlen(file) + 1);
3513         return (ret);
3514 }
3515 
3516 int
3517 sbd_is_zvol(char *path)
3518 {
3519         int is_zfs = 0;
3520 
3521         if (SBD_IS_ZVOL(path) == 0)
3522                 is_zfs = 1;
3523 
3524         return (is_zfs);
3525 }
3526 
3527 /*
3528  * set write cache disable
3529  * wcd - 1 = disable, 0 = enable
3530  */
3531 sbd_status_t
3532 sbd_wcd_set(int wcd, sbd_lu_t *sl)
3533 {
3534         /* translate to wce bit */
3535         int wce = wcd ? 0 : 1;
3536         int ret;
3537         sbd_status_t sret = SBD_SUCCESS;
3538 
3539         mutex_enter(&sl->sl_lock);
3540         sl->sl_flags &= ~SL_WRITEBACK_CACHE_SET_UNSUPPORTED;
3541 
3542         if (sl->sl_data_vp->v_type == VREG) {
3543                 sl->sl_flags |= SL_FLUSH_ON_DISABLED_WRITECACHE;
3544                 goto done;
3545         }
3546 
3547         ret = VOP_IOCTL(sl->sl_data_vp, DKIOCSETWCE, (intptr_t)&wce, FKIOCTL,
3548             kcred, NULL, NULL);
3549         if (ret == 0) {
3550                 sl->sl_flags &= ~SL_WRITEBACK_CACHE_SET_UNSUPPORTED;
3551                 sl->sl_flags &= ~SL_FLUSH_ON_DISABLED_WRITECACHE;
3552         } else {
3553                 sl->sl_flags |= SL_WRITEBACK_CACHE_SET_UNSUPPORTED;
3554                 sl->sl_flags |= SL_FLUSH_ON_DISABLED_WRITECACHE;
3555                 sret = SBD_FAILURE;
3556                 goto done;
3557         }
3558 
3559 done:
3560         mutex_exit(&sl->sl_lock);
3561         return (sret);
3562 }
3563 
3564 /*
3565  * get write cache disable
3566  * wcd - 1 = disable, 0 = enable
3567  */
3568 void
3569 sbd_wcd_get(int *wcd, sbd_lu_t *sl)
3570 {
3571         int wce;
3572         int ret;
3573 
3574         if (sl->sl_data_vp->v_type == VREG) {
3575                 *wcd = 0;
3576                 return;
3577         }
3578 
3579         ret = VOP_IOCTL(sl->sl_data_vp, DKIOCGETWCE, (intptr_t)&wce, FKIOCTL,
3580             kcred, NULL, NULL);
3581         /* if write cache get failed, assume disabled */
3582         if (ret) {
3583                 *wcd = 1;
3584         } else {
3585                 /* translate to wcd bit */
3586                 *wcd = wce ? 0 : 1;
3587         }
3588 }
3589 
3590 int
3591 sbd_zvolget(char *zvol_name, char **comstarprop)
3592 {
3593         ldi_handle_t    zfs_lh;
3594         nvlist_t        *nv = NULL, *nv2;
3595         zfs_cmd_t       *zc;
3596         char            *ptr;
3597         int size = 1024;
3598         int unused;
3599         int rc;
3600 
3601         if ((rc = ldi_open_by_name("/dev/zfs", FREAD | FWRITE, kcred,
3602             &zfs_lh, sbd_zfs_ident)) != 0) {
3603                 cmn_err(CE_WARN, "ldi_open %d", rc);
3604                 return (ENXIO);
3605         }
3606 
3607         zc = kmem_zalloc(sizeof (zfs_cmd_t), KM_SLEEP);
3608         (void) strlcpy(zc->zc_name, zvol_name, sizeof (zc->zc_name));
3609 again:
3610         zc->zc_nvlist_dst = (uint64_t)(intptr_t)kmem_alloc(size,
3611             KM_SLEEP);
3612         zc->zc_nvlist_dst_size = size;
3613         rc = ldi_ioctl(zfs_lh, ZFS_IOC_OBJSET_STATS, (intptr_t)zc,
3614             FKIOCTL, kcred, &unused);
3615         /*
3616          * ENOMEM means the list is larger than what we've allocated
3617          * ldi_ioctl will fail with ENOMEM only once
3618          */
3619         if (rc == ENOMEM) {
3620                 int newsize;
3621                 newsize = zc->zc_nvlist_dst_size;
3622                 kmem_free((void *)(uintptr_t)zc->zc_nvlist_dst, size);
3623                 size = newsize;
3624                 goto again;
3625         } else if (rc != 0) {
3626                 goto out;
3627         }
3628         rc = nvlist_unpack((char *)(uintptr_t)zc->zc_nvlist_dst,
3629             zc->zc_nvlist_dst_size, &nv, 0);
3630         ASSERT(rc == 0);        /* nvlist_unpack should not fail */
3631         if ((rc = nvlist_lookup_nvlist(nv, "stmf_sbd_lu", &nv2)) == 0) {
3632                 rc = nvlist_lookup_string(nv2, ZPROP_VALUE, &ptr);
3633                 if (rc != 0) {
3634                         cmn_err(CE_WARN, "couldn't get value");
3635                 } else {
3636                         *comstarprop = kmem_alloc(strlen(ptr) + 1,
3637                             KM_SLEEP);
3638                         (void) strcpy(*comstarprop, ptr);
3639                 }
3640         }
3641 out:
3642         nvlist_free(nv);
3643         kmem_free((void *)(uintptr_t)zc->zc_nvlist_dst, size);
3644         kmem_free(zc, sizeof (zfs_cmd_t));
3645         (void) ldi_close(zfs_lh, FREAD|FWRITE, kcred);
3646 
3647         return (rc);
3648 }
3649 
3650 int
3651 sbd_zvolset(char *zvol_name, char *comstarprop)
3652 {
3653         ldi_handle_t    zfs_lh;
3654         nvlist_t        *nv;
3655         char            *packed = NULL;
3656         size_t          len;
3657         zfs_cmd_t       *zc;
3658         int unused;
3659         int rc;
3660 
3661         if ((rc = ldi_open_by_name("/dev/zfs", FREAD | FWRITE, kcred,
3662             &zfs_lh, sbd_zfs_ident)) != 0) {
3663                 cmn_err(CE_WARN, "ldi_open %d", rc);
3664                 return (ENXIO);
3665         }
3666         (void) nvlist_alloc(&nv, NV_UNIQUE_NAME, KM_SLEEP);
3667         (void) nvlist_add_string(nv, "stmf_sbd_lu", comstarprop);
3668         if ((rc = nvlist_pack(nv, &packed, &len, NV_ENCODE_NATIVE, KM_SLEEP))) {
3669                 goto out;
3670         }
3671 
3672         zc = kmem_zalloc(sizeof (zfs_cmd_t), KM_SLEEP);
3673         (void) strlcpy(zc->zc_name, zvol_name, sizeof (zc->zc_name));
3674         zc->zc_nvlist_src = (uint64_t)(intptr_t)packed;
3675         zc->zc_nvlist_src_size = len;
3676         rc = ldi_ioctl(zfs_lh, ZFS_IOC_SET_PROP, (intptr_t)zc,
3677             FKIOCTL, kcred, &unused);
3678         if (rc != 0) {
3679                 cmn_err(CE_NOTE, "ioctl failed %d", rc);
3680         }
3681         kmem_free(zc, sizeof (zfs_cmd_t));
3682         if (packed)
3683                 kmem_free(packed, len);
3684 out:
3685         nvlist_free(nv);
3686         (void) ldi_close(zfs_lh, FREAD|FWRITE, kcred);
3687         return (rc);
3688 }
3689 
3690 /*
3691  * Unmap a region in a volume.  Currently only supported for zvols.
3692  */
3693 int
3694 sbd_unmap(sbd_lu_t *sl, uint64_t offset, uint64_t length)
3695 {
3696         vnode_t *vp;
3697         int unused;
3698         dkioc_free_t df;
3699 
3700         /* Right now, we only support UNMAP on zvols. */
3701         if (!(sl->sl_flags & SL_ZFS_META))
3702                 return (EIO);
3703 
3704         df.df_flags = (sl->sl_flags & SL_WRITEBACK_CACHE_DISABLE) ?
3705             DF_WAIT_SYNC : 0;
3706         df.df_start = offset;
3707         df.df_length = length;
3708 
3709         /* Use the data vnode we have to send a fop_ioctl(). */
3710         vp = sl->sl_data_vp;
3711         if (vp == NULL) {
3712                 cmn_err(CE_WARN, "Cannot unmap - no vnode pointer.");
3713                 return (EIO);
3714         }
3715 
3716         return (VOP_IOCTL(vp, DKIOCFREE, (intptr_t)(&df), FKIOCTL, kcred,
3717             &unused, NULL));
3718 }