1 /* 2 * CDDL HEADER START 3 * 4 * The contents of this file are subject to the terms of the 5 * Common Development and Distribution License (the "License"). 6 * You may not use this file except in compliance with the License. 7 * 8 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE 9 * or http://www.opensolaris.org/os/licensing. 10 * See the License for the specific language governing permissions 11 * and limitations under the License. 12 * 13 * When distributing Covered Code, include this CDDL HEADER in each 14 * file and include the License file at usr/src/OPENSOLARIS.LICENSE. 15 * If applicable, add the following below this CDDL HEADER, with the 16 * fields enclosed by brackets "[]" replaced with your own identifying 17 * information: Portions Copyright [yyyy] [name of copyright owner] 18 * 19 * CDDL HEADER END 20 */ 21 22 /* 23 * Copyright (c) 2008, 2010, Oracle and/or its affiliates. All rights reserved. 24 * Copyright 2013 Nexenta Systems, Inc. All rights reserved. 25 * Copyright (c) 2013 by Delphix. All rights reserved. 26 */ 27 28 #include <sys/sysmacros.h> 29 #include <sys/conf.h> 30 #include <sys/file.h> 31 #include <sys/ddi.h> 32 #include <sys/sunddi.h> 33 #include <sys/modctl.h> 34 #include <sys/scsi/scsi.h> 35 #include <sys/scsi/impl/scsi_reset_notify.h> 36 #include <sys/disp.h> 37 #include <sys/byteorder.h> 38 #include <sys/pathname.h> 39 #include <sys/atomic.h> 40 #include <sys/nvpair.h> 41 #include <sys/fs/zfs.h> 42 #include <sys/sdt.h> 43 #include <sys/dkio.h> 44 #include <sys/zfs_ioctl.h> 45 46 #include <sys/stmf.h> 47 #include <sys/lpif.h> 48 #include <sys/stmf_ioctl.h> 49 #include <sys/stmf_sbd_ioctl.h> 50 51 #include "stmf_sbd.h" 52 #include "sbd_impl.h" 53 54 #define SBD_IS_ZVOL(zvol) (strncmp("/dev/zvol", zvol, 9)) 55 56 extern sbd_status_t sbd_pgr_meta_init(sbd_lu_t *sl); 57 extern sbd_status_t sbd_pgr_meta_load(sbd_lu_t *sl); 58 extern void sbd_pgr_reset(sbd_lu_t *sl); 59 60 static int sbd_getinfo(dev_info_t *dip, ddi_info_cmd_t cmd, void *arg, 61 void **result); 62 static int sbd_attach(dev_info_t *dip, ddi_attach_cmd_t cmd); 63 static int sbd_detach(dev_info_t *dip, ddi_detach_cmd_t cmd); 64 static int sbd_open(dev_t *devp, int flag, int otype, cred_t *credp); 65 static int sbd_close(dev_t dev, int flag, int otype, cred_t *credp); 66 static int stmf_sbd_ioctl(dev_t dev, int cmd, intptr_t data, int mode, 67 cred_t *credp, int *rval); 68 void sbd_lp_cb(stmf_lu_provider_t *lp, int cmd, void *arg, uint32_t flags); 69 stmf_status_t sbd_proxy_reg_lu(uint8_t *luid, void *proxy_reg_arg, 70 uint32_t proxy_reg_arg_len); 71 stmf_status_t sbd_proxy_dereg_lu(uint8_t *luid, void *proxy_reg_arg, 72 uint32_t proxy_reg_arg_len); 73 stmf_status_t sbd_proxy_msg(uint8_t *luid, void *proxy_arg, 74 uint32_t proxy_arg_len, uint32_t type); 75 int sbd_create_register_lu(sbd_create_and_reg_lu_t *slu, int struct_sz, 76 uint32_t *err_ret); 77 int sbd_create_standby_lu(sbd_create_standby_lu_t *slu, uint32_t *err_ret); 78 int sbd_set_lu_standby(sbd_set_lu_standby_t *stlu, uint32_t *err_ret); 79 int sbd_import_lu(sbd_import_lu_t *ilu, int struct_sz, uint32_t *err_ret, 80 int no_register, sbd_lu_t **slr); 81 int sbd_import_active_lu(sbd_import_lu_t *ilu, sbd_lu_t *sl, uint32_t *err_ret); 82 int sbd_delete_lu(sbd_delete_lu_t *dlu, int struct_sz, uint32_t *err_ret); 83 int sbd_modify_lu(sbd_modify_lu_t *mlu, int struct_sz, uint32_t *err_ret); 84 int sbd_set_global_props(sbd_global_props_t *mlu, int struct_sz, 85 uint32_t *err_ret); 86 int sbd_get_global_props(sbd_global_props_t *oslp, uint32_t oslp_sz, 87 uint32_t *err_ret); 88 int sbd_get_lu_props(sbd_lu_props_t *islp, uint32_t islp_sz, 89 sbd_lu_props_t *oslp, uint32_t oslp_sz, uint32_t *err_ret); 90 static char *sbd_get_zvol_name(sbd_lu_t *); 91 static int sbd_get_unmap_props(sbd_unmap_props_t *sup, sbd_unmap_props_t *osup, 92 uint32_t *err_ret); 93 sbd_status_t sbd_create_zfs_meta_object(sbd_lu_t *sl); 94 sbd_status_t sbd_open_zfs_meta(sbd_lu_t *sl); 95 sbd_status_t sbd_read_zfs_meta(sbd_lu_t *sl, uint8_t *buf, uint64_t sz, 96 uint64_t off); 97 sbd_status_t sbd_write_zfs_meta(sbd_lu_t *sl, uint8_t *buf, uint64_t sz, 98 uint64_t off); 99 sbd_status_t sbd_update_zfs_prop(sbd_lu_t *sl); 100 int sbd_is_zvol(char *path); 101 int sbd_zvolget(char *zvol_name, char **comstarprop); 102 int sbd_zvolset(char *zvol_name, char *comstarprop); 103 char sbd_ctoi(char c); 104 void sbd_close_lu(sbd_lu_t *sl); 105 106 static ldi_ident_t sbd_zfs_ident; 107 static stmf_lu_provider_t *sbd_lp; 108 static sbd_lu_t *sbd_lu_list = NULL; 109 static kmutex_t sbd_lock; 110 static dev_info_t *sbd_dip; 111 static uint32_t sbd_lu_count = 0; 112 113 /* Global property settings for the logical unit */ 114 char sbd_vendor_id[] = "SUN "; 115 char sbd_product_id[] = "COMSTAR "; 116 char sbd_revision[] = "1.0 "; 117 char *sbd_mgmt_url = NULL; 118 uint16_t sbd_mgmt_url_alloc_size = 0; 119 krwlock_t sbd_global_prop_lock; 120 121 static char sbd_name[] = "sbd"; 122 123 static struct cb_ops sbd_cb_ops = { 124 sbd_open, /* open */ 125 sbd_close, /* close */ 126 nodev, /* strategy */ 127 nodev, /* print */ 128 nodev, /* dump */ 129 nodev, /* read */ 130 nodev, /* write */ 131 stmf_sbd_ioctl, /* ioctl */ 132 nodev, /* devmap */ 133 nodev, /* mmap */ 134 nodev, /* segmap */ 135 nochpoll, /* chpoll */ 136 ddi_prop_op, /* cb_prop_op */ 137 0, /* streamtab */ 138 D_NEW | D_MP, /* cb_flag */ 139 CB_REV, /* rev */ 140 nodev, /* aread */ 141 nodev /* awrite */ 142 }; 143 144 static struct dev_ops sbd_ops = { 145 DEVO_REV, 146 0, 147 sbd_getinfo, 148 nulldev, /* identify */ 149 nulldev, /* probe */ 150 sbd_attach, 151 sbd_detach, 152 nodev, /* reset */ 153 &sbd_cb_ops, 154 NULL, /* bus_ops */ 155 NULL /* power */ 156 }; 157 158 #define SBD_NAME "COMSTAR SBD" 159 160 static struct modldrv modldrv = { 161 &mod_driverops, 162 SBD_NAME, 163 &sbd_ops 164 }; 165 166 static struct modlinkage modlinkage = { 167 MODREV_1, 168 &modldrv, 169 NULL 170 }; 171 172 int 173 _init(void) 174 { 175 int ret; 176 177 ret = mod_install(&modlinkage); 178 if (ret) 179 return (ret); 180 sbd_lp = (stmf_lu_provider_t *)stmf_alloc(STMF_STRUCT_LU_PROVIDER, 181 0, 0); 182 sbd_lp->lp_lpif_rev = LPIF_REV_2; 183 sbd_lp->lp_instance = 0; 184 sbd_lp->lp_name = sbd_name; 185 sbd_lp->lp_cb = sbd_lp_cb; 186 sbd_lp->lp_alua_support = 1; 187 sbd_lp->lp_proxy_msg = sbd_proxy_msg; 188 sbd_zfs_ident = ldi_ident_from_anon(); 189 190 if (stmf_register_lu_provider(sbd_lp) != STMF_SUCCESS) { 191 (void) mod_remove(&modlinkage); 192 stmf_free(sbd_lp); 193 return (EINVAL); 194 } 195 mutex_init(&sbd_lock, NULL, MUTEX_DRIVER, NULL); 196 rw_init(&sbd_global_prop_lock, NULL, RW_DRIVER, NULL); 197 return (0); 198 } 199 200 int 201 _fini(void) 202 { 203 int ret; 204 205 /* 206 * If we have registered lus, then make sure they are all offline 207 * if so then deregister them. This should drop the sbd_lu_count 208 * to zero. 209 */ 210 if (sbd_lu_count) { 211 sbd_lu_t *slu; 212 213 /* See if all of them are offline */ 214 mutex_enter(&sbd_lock); 215 for (slu = sbd_lu_list; slu != NULL; slu = slu->sl_next) { 216 if ((slu->sl_state != STMF_STATE_OFFLINE) || 217 slu->sl_state_not_acked) { 218 mutex_exit(&sbd_lock); 219 return (EBUSY); 220 } 221 } 222 mutex_exit(&sbd_lock); 223 224 #if 0 225 /* ok start deregistering them */ 226 while (sbd_lu_list) { 227 sbd_store_t *sst = sbd_lu_list->sl_sst; 228 if (sst->sst_deregister_lu(sst) != STMF_SUCCESS) 229 return (EBUSY); 230 } 231 #endif 232 return (EBUSY); 233 } 234 if (stmf_deregister_lu_provider(sbd_lp) != STMF_SUCCESS) 235 return (EBUSY); 236 ret = mod_remove(&modlinkage); 237 if (ret != 0) { 238 (void) stmf_register_lu_provider(sbd_lp); 239 return (ret); 240 } 241 stmf_free(sbd_lp); 242 mutex_destroy(&sbd_lock); 243 rw_destroy(&sbd_global_prop_lock); 244 ldi_ident_release(sbd_zfs_ident); 245 return (0); 246 } 247 248 int 249 _info(struct modinfo *modinfop) 250 { 251 return (mod_info(&modlinkage, modinfop)); 252 } 253 254 /* ARGSUSED */ 255 static int 256 sbd_getinfo(dev_info_t *dip, ddi_info_cmd_t cmd, void *arg, void **result) 257 { 258 switch (cmd) { 259 case DDI_INFO_DEVT2DEVINFO: 260 *result = sbd_dip; 261 break; 262 case DDI_INFO_DEVT2INSTANCE: 263 *result = (void *)(uintptr_t)ddi_get_instance(sbd_dip); 264 break; 265 default: 266 return (DDI_FAILURE); 267 } 268 269 return (DDI_SUCCESS); 270 } 271 272 static int 273 sbd_attach(dev_info_t *dip, ddi_attach_cmd_t cmd) 274 { 275 switch (cmd) { 276 case DDI_ATTACH: 277 sbd_dip = dip; 278 279 if (ddi_create_minor_node(dip, "admin", S_IFCHR, 0, 280 DDI_NT_STMF_LP, 0) != DDI_SUCCESS) { 281 break; 282 } 283 ddi_report_dev(dip); 284 return (DDI_SUCCESS); 285 } 286 287 return (DDI_FAILURE); 288 } 289 290 static int 291 sbd_detach(dev_info_t *dip, ddi_detach_cmd_t cmd) 292 { 293 switch (cmd) { 294 case DDI_DETACH: 295 ddi_remove_minor_node(dip, 0); 296 return (DDI_SUCCESS); 297 } 298 299 return (DDI_FAILURE); 300 } 301 302 /* ARGSUSED */ 303 static int 304 sbd_open(dev_t *devp, int flag, int otype, cred_t *credp) 305 { 306 if (otype != OTYP_CHR) 307 return (EINVAL); 308 return (0); 309 } 310 311 /* ARGSUSED */ 312 static int 313 sbd_close(dev_t dev, int flag, int otype, cred_t *credp) 314 { 315 return (0); 316 } 317 318 /* ARGSUSED */ 319 static int 320 stmf_sbd_ioctl(dev_t dev, int cmd, intptr_t data, int mode, 321 cred_t *credp, int *rval) 322 { 323 stmf_iocdata_t *iocd; 324 void *ibuf = NULL; 325 void *obuf = NULL; 326 sbd_lu_t *nsl; 327 int i; 328 int ret; 329 330 if (drv_priv(credp) != 0) { 331 return (EPERM); 332 } 333 334 ret = stmf_copyin_iocdata(data, mode, &iocd, &ibuf, &obuf); 335 if (ret) 336 return (ret); 337 iocd->stmf_error = 0; 338 339 switch (cmd) { 340 case SBD_IOCTL_CREATE_AND_REGISTER_LU: 341 if (iocd->stmf_ibuf_size < 342 (sizeof (sbd_create_and_reg_lu_t) - 8)) { 343 ret = EFAULT; 344 break; 345 } 346 if ((iocd->stmf_obuf_size == 0) || 347 (iocd->stmf_obuf_size > iocd->stmf_ibuf_size)) { 348 ret = EINVAL; 349 break; 350 } 351 ret = sbd_create_register_lu((sbd_create_and_reg_lu_t *) 352 ibuf, iocd->stmf_ibuf_size, &iocd->stmf_error); 353 bcopy(ibuf, obuf, iocd->stmf_obuf_size); 354 break; 355 case SBD_IOCTL_SET_LU_STANDBY: 356 if (iocd->stmf_ibuf_size < sizeof (sbd_set_lu_standby_t)) { 357 ret = EFAULT; 358 break; 359 } 360 if (iocd->stmf_obuf_size) { 361 ret = EINVAL; 362 break; 363 } 364 ret = sbd_set_lu_standby((sbd_set_lu_standby_t *)ibuf, 365 &iocd->stmf_error); 366 break; 367 case SBD_IOCTL_IMPORT_LU: 368 if (iocd->stmf_ibuf_size < 369 (sizeof (sbd_import_lu_t) - 8)) { 370 ret = EFAULT; 371 break; 372 } 373 if ((iocd->stmf_obuf_size == 0) || 374 (iocd->stmf_obuf_size > iocd->stmf_ibuf_size)) { 375 ret = EINVAL; 376 break; 377 } 378 ret = sbd_import_lu((sbd_import_lu_t *)ibuf, 379 iocd->stmf_ibuf_size, &iocd->stmf_error, 0, NULL); 380 bcopy(ibuf, obuf, iocd->stmf_obuf_size); 381 break; 382 case SBD_IOCTL_DELETE_LU: 383 if (iocd->stmf_ibuf_size < (sizeof (sbd_delete_lu_t) - 8)) { 384 ret = EFAULT; 385 break; 386 } 387 if (iocd->stmf_obuf_size) { 388 ret = EINVAL; 389 break; 390 } 391 ret = sbd_delete_lu((sbd_delete_lu_t *)ibuf, 392 iocd->stmf_ibuf_size, &iocd->stmf_error); 393 break; 394 case SBD_IOCTL_MODIFY_LU: 395 if (iocd->stmf_ibuf_size < (sizeof (sbd_modify_lu_t) - 8)) { 396 ret = EFAULT; 397 break; 398 } 399 if (iocd->stmf_obuf_size) { 400 ret = EINVAL; 401 break; 402 } 403 ret = sbd_modify_lu((sbd_modify_lu_t *)ibuf, 404 iocd->stmf_ibuf_size, &iocd->stmf_error); 405 break; 406 case SBD_IOCTL_SET_GLOBAL_LU: 407 if (iocd->stmf_ibuf_size < (sizeof (sbd_global_props_t) - 8)) { 408 ret = EFAULT; 409 break; 410 } 411 if (iocd->stmf_obuf_size) { 412 ret = EINVAL; 413 break; 414 } 415 ret = sbd_set_global_props((sbd_global_props_t *)ibuf, 416 iocd->stmf_ibuf_size, &iocd->stmf_error); 417 break; 418 case SBD_IOCTL_GET_GLOBAL_LU: 419 if (iocd->stmf_ibuf_size) { 420 ret = EINVAL; 421 break; 422 } 423 if (iocd->stmf_obuf_size < sizeof (sbd_global_props_t)) { 424 ret = EINVAL; 425 break; 426 } 427 ret = sbd_get_global_props((sbd_global_props_t *)obuf, 428 iocd->stmf_obuf_size, &iocd->stmf_error); 429 break; 430 case SBD_IOCTL_GET_LU_PROPS: 431 if (iocd->stmf_ibuf_size < (sizeof (sbd_lu_props_t) - 8)) { 432 ret = EFAULT; 433 break; 434 } 435 if (iocd->stmf_obuf_size < sizeof (sbd_lu_props_t)) { 436 ret = EINVAL; 437 break; 438 } 439 ret = sbd_get_lu_props((sbd_lu_props_t *)ibuf, 440 iocd->stmf_ibuf_size, (sbd_lu_props_t *)obuf, 441 iocd->stmf_obuf_size, &iocd->stmf_error); 442 break; 443 case SBD_IOCTL_GET_LU_LIST: 444 mutex_enter(&sbd_lock); 445 iocd->stmf_obuf_max_nentries = sbd_lu_count; 446 iocd->stmf_obuf_nentries = min((iocd->stmf_obuf_size >> 4), 447 sbd_lu_count); 448 for (nsl = sbd_lu_list, i = 0; nsl && 449 (i < iocd->stmf_obuf_nentries); i++, nsl = nsl->sl_next) { 450 bcopy(nsl->sl_device_id + 4, 451 &(((uint8_t *)obuf)[i << 4]), 16); 452 } 453 mutex_exit(&sbd_lock); 454 ret = 0; 455 iocd->stmf_error = 0; 456 break; 457 case SBD_IOCTL_GET_UNMAP_PROPS: 458 if (iocd->stmf_ibuf_size < sizeof (sbd_unmap_props_t)) { 459 ret = EFAULT; 460 break; 461 } 462 if (iocd->stmf_obuf_size < sizeof (sbd_unmap_props_t)) { 463 ret = EINVAL; 464 break; 465 } 466 ret = sbd_get_unmap_props((sbd_unmap_props_t *)ibuf, 467 (sbd_unmap_props_t *)obuf, &iocd->stmf_error); 468 break; 469 default: 470 ret = ENOTTY; 471 } 472 473 if (ret == 0) { 474 ret = stmf_copyout_iocdata(data, mode, iocd, obuf); 475 } else if (iocd->stmf_error) { 476 (void) stmf_copyout_iocdata(data, mode, iocd, obuf); 477 } 478 if (obuf) { 479 kmem_free(obuf, iocd->stmf_obuf_size); 480 obuf = NULL; 481 } 482 if (ibuf) { 483 kmem_free(ibuf, iocd->stmf_ibuf_size); 484 ibuf = NULL; 485 } 486 kmem_free(iocd, sizeof (stmf_iocdata_t)); 487 return (ret); 488 } 489 490 /* ARGSUSED */ 491 void 492 sbd_lp_cb(stmf_lu_provider_t *lp, int cmd, void *arg, uint32_t flags) 493 { 494 nvpair_t *np; 495 char *s; 496 sbd_import_lu_t *ilu; 497 uint32_t ilu_sz; 498 uint32_t struct_sz; 499 uint32_t err_ret; 500 int iret; 501 502 if ((cmd != STMF_PROVIDER_DATA_UPDATED) || (arg == NULL)) { 503 return; 504 } 505 506 if ((flags & (STMF_PCB_STMF_ONLINING | STMF_PCB_PREG_COMPLETE)) == 0) { 507 return; 508 } 509 510 np = NULL; 511 ilu_sz = 1024; 512 ilu = (sbd_import_lu_t *)kmem_zalloc(ilu_sz, KM_SLEEP); 513 while ((np = nvlist_next_nvpair((nvlist_t *)arg, np)) != NULL) { 514 if (nvpair_type(np) != DATA_TYPE_STRING) { 515 continue; 516 } 517 if (nvpair_value_string(np, &s) != 0) { 518 continue; 519 } 520 struct_sz = max(8, strlen(s) + 1); 521 struct_sz += sizeof (sbd_import_lu_t) - 8; 522 if (struct_sz > ilu_sz) { 523 kmem_free(ilu, ilu_sz); 524 ilu_sz = struct_sz + 32; 525 ilu = (sbd_import_lu_t *)kmem_zalloc(ilu_sz, KM_SLEEP); 526 } 527 ilu->ilu_struct_size = struct_sz; 528 (void) strcpy(ilu->ilu_meta_fname, s); 529 iret = sbd_import_lu(ilu, struct_sz, &err_ret, 0, NULL); 530 if (iret) { 531 stmf_trace(0, "sbd_lp_cb: import_lu failed, ret = %d, " 532 "err_ret = %d", iret, err_ret); 533 } else { 534 stmf_trace(0, "Imported the LU %s", nvpair_name(np)); 535 } 536 } 537 538 if (ilu) { 539 kmem_free(ilu, ilu_sz); 540 ilu = NULL; 541 } 542 } 543 544 sbd_status_t 545 sbd_link_lu(sbd_lu_t *sl) 546 { 547 sbd_lu_t *nsl; 548 549 mutex_enter(&sbd_lock); 550 mutex_enter(&sl->sl_lock); 551 ASSERT(sl->sl_trans_op != SL_OP_NONE); 552 553 if (sl->sl_flags & SL_LINKED) { 554 mutex_exit(&sbd_lock); 555 mutex_exit(&sl->sl_lock); 556 return (SBD_ALREADY); 557 } 558 for (nsl = sbd_lu_list; nsl; nsl = nsl->sl_next) { 559 if (strcmp(nsl->sl_name, sl->sl_name) == 0) 560 break; 561 } 562 if (nsl) { 563 mutex_exit(&sbd_lock); 564 mutex_exit(&sl->sl_lock); 565 return (SBD_ALREADY); 566 } 567 sl->sl_next = sbd_lu_list; 568 sbd_lu_list = sl; 569 sl->sl_flags |= SL_LINKED; 570 mutex_exit(&sbd_lock); 571 mutex_exit(&sl->sl_lock); 572 return (SBD_SUCCESS); 573 } 574 575 void 576 sbd_unlink_lu(sbd_lu_t *sl) 577 { 578 sbd_lu_t **ppnsl; 579 580 mutex_enter(&sbd_lock); 581 mutex_enter(&sl->sl_lock); 582 ASSERT(sl->sl_trans_op != SL_OP_NONE); 583 584 ASSERT(sl->sl_flags & SL_LINKED); 585 for (ppnsl = &sbd_lu_list; *ppnsl; ppnsl = &((*ppnsl)->sl_next)) { 586 if (*ppnsl == sl) 587 break; 588 } 589 ASSERT(*ppnsl); 590 *ppnsl = (*ppnsl)->sl_next; 591 sl->sl_flags &= ~SL_LINKED; 592 mutex_exit(&sbd_lock); 593 mutex_exit(&sl->sl_lock); 594 } 595 596 sbd_status_t 597 sbd_find_and_lock_lu(uint8_t *guid, uint8_t *meta_name, uint8_t op, 598 sbd_lu_t **ppsl) 599 { 600 sbd_lu_t *sl; 601 int found = 0; 602 sbd_status_t sret; 603 604 mutex_enter(&sbd_lock); 605 for (sl = sbd_lu_list; sl; sl = sl->sl_next) { 606 if (guid) { 607 found = bcmp(sl->sl_device_id + 4, guid, 16) == 0; 608 } else { 609 found = strcmp(sl->sl_name, (char *)meta_name) == 0; 610 } 611 if (found) 612 break; 613 } 614 if (!found) { 615 mutex_exit(&sbd_lock); 616 return (SBD_NOT_FOUND); 617 } 618 mutex_enter(&sl->sl_lock); 619 if (sl->sl_trans_op == SL_OP_NONE) { 620 sl->sl_trans_op = op; 621 *ppsl = sl; 622 sret = SBD_SUCCESS; 623 } else { 624 sret = SBD_BUSY; 625 } 626 mutex_exit(&sl->sl_lock); 627 mutex_exit(&sbd_lock); 628 return (sret); 629 } 630 631 sbd_status_t 632 sbd_read_meta(sbd_lu_t *sl, uint64_t offset, uint64_t size, uint8_t *buf) 633 { 634 uint64_t meta_align; 635 uint64_t starting_off; 636 uint64_t data_off; 637 uint64_t ending_off; 638 uint64_t io_size; 639 uint8_t *io_buf; 640 vnode_t *vp; 641 sbd_status_t ret; 642 ssize_t resid; 643 int vret; 644 645 ASSERT(sl->sl_flags & SL_META_OPENED); 646 if (sl->sl_flags & SL_SHARED_META) { 647 meta_align = (((uint64_t)1) << sl->sl_data_blocksize_shift) - 1; 648 vp = sl->sl_data_vp; 649 ASSERT(vp); 650 } else { 651 meta_align = (((uint64_t)1) << sl->sl_meta_blocksize_shift) - 1; 652 if ((sl->sl_flags & SL_ZFS_META) == 0) { 653 vp = sl->sl_meta_vp; 654 ASSERT(vp); 655 } 656 } 657 starting_off = offset & ~(meta_align); 658 data_off = offset & meta_align; 659 ending_off = (offset + size + meta_align) & (~meta_align); 660 if (ending_off > sl->sl_meta_size_used) { 661 bzero(buf, size); 662 if (starting_off >= sl->sl_meta_size_used) { 663 return (SBD_SUCCESS); 664 } 665 ending_off = (sl->sl_meta_size_used + meta_align) & 666 (~meta_align); 667 if (size > (ending_off - (starting_off + data_off))) { 668 size = ending_off - (starting_off + data_off); 669 } 670 } 671 io_size = ending_off - starting_off; 672 io_buf = (uint8_t *)kmem_zalloc(io_size, KM_SLEEP); 673 ASSERT((starting_off + io_size) <= sl->sl_total_meta_size); 674 675 /* 676 * Don't proceed if the device has been closed 677 * This can occur on an access state change to standby or 678 * a delete. The writer lock is acquired before closing the 679 * lu. If importing, reading the metadata is valid, hence 680 * the check on SL_OP_IMPORT_LU. 681 */ 682 rw_enter(&sl->sl_access_state_lock, RW_READER); 683 if ((sl->sl_flags & SL_MEDIA_LOADED) == 0 && 684 sl->sl_trans_op != SL_OP_IMPORT_LU) { 685 rw_exit(&sl->sl_access_state_lock); 686 ret = SBD_FILEIO_FAILURE; 687 goto sbd_read_meta_failure; 688 } 689 if (sl->sl_flags & SL_ZFS_META) { 690 if ((ret = sbd_read_zfs_meta(sl, io_buf, io_size, 691 starting_off)) != SBD_SUCCESS) { 692 rw_exit(&sl->sl_access_state_lock); 693 goto sbd_read_meta_failure; 694 } 695 } else { 696 vret = vn_rdwr(UIO_READ, vp, (caddr_t)io_buf, (ssize_t)io_size, 697 (offset_t)starting_off, UIO_SYSSPACE, FRSYNC, 698 RLIM64_INFINITY, CRED(), &resid); 699 700 if (vret || resid) { 701 ret = SBD_FILEIO_FAILURE | vret; 702 rw_exit(&sl->sl_access_state_lock); 703 goto sbd_read_meta_failure; 704 } 705 } 706 rw_exit(&sl->sl_access_state_lock); 707 708 bcopy(io_buf + data_off, buf, size); 709 ret = SBD_SUCCESS; 710 711 sbd_read_meta_failure: 712 kmem_free(io_buf, io_size); 713 return (ret); 714 } 715 716 sbd_status_t 717 sbd_write_meta(sbd_lu_t *sl, uint64_t offset, uint64_t size, uint8_t *buf) 718 { 719 uint64_t meta_align; 720 uint64_t starting_off; 721 uint64_t data_off; 722 uint64_t ending_off; 723 uint64_t io_size; 724 uint8_t *io_buf; 725 vnode_t *vp; 726 sbd_status_t ret; 727 ssize_t resid; 728 int vret; 729 730 ASSERT(sl->sl_flags & SL_META_OPENED); 731 if (sl->sl_flags & SL_SHARED_META) { 732 meta_align = (((uint64_t)1) << sl->sl_data_blocksize_shift) - 1; 733 vp = sl->sl_data_vp; 734 ASSERT(vp); 735 } else { 736 meta_align = (((uint64_t)1) << sl->sl_meta_blocksize_shift) - 1; 737 if ((sl->sl_flags & SL_ZFS_META) == 0) { 738 vp = sl->sl_meta_vp; 739 ASSERT(vp); 740 } 741 } 742 starting_off = offset & ~(meta_align); 743 data_off = offset & meta_align; 744 ending_off = (offset + size + meta_align) & (~meta_align); 745 io_size = ending_off - starting_off; 746 io_buf = (uint8_t *)kmem_zalloc(io_size, KM_SLEEP); 747 ret = sbd_read_meta(sl, starting_off, io_size, io_buf); 748 if (ret != SBD_SUCCESS) { 749 goto sbd_write_meta_failure; 750 } 751 bcopy(buf, io_buf + data_off, size); 752 /* 753 * Don't proceed if the device has been closed 754 * This can occur on an access state change to standby or 755 * a delete. The writer lock is acquired before closing the 756 * lu. If importing, reading the metadata is valid, hence 757 * the check on SL_OP_IMPORT_LU. 758 */ 759 rw_enter(&sl->sl_access_state_lock, RW_READER); 760 if ((sl->sl_flags & SL_MEDIA_LOADED) == 0 && 761 sl->sl_trans_op != SL_OP_IMPORT_LU) { 762 rw_exit(&sl->sl_access_state_lock); 763 ret = SBD_FILEIO_FAILURE; 764 goto sbd_write_meta_failure; 765 } 766 if (sl->sl_flags & SL_ZFS_META) { 767 if ((ret = sbd_write_zfs_meta(sl, io_buf, io_size, 768 starting_off)) != SBD_SUCCESS) { 769 rw_exit(&sl->sl_access_state_lock); 770 goto sbd_write_meta_failure; 771 } 772 } else { 773 vret = vn_rdwr(UIO_WRITE, vp, (caddr_t)io_buf, (ssize_t)io_size, 774 (offset_t)starting_off, UIO_SYSSPACE, FDSYNC, 775 RLIM64_INFINITY, CRED(), &resid); 776 777 if (vret || resid) { 778 ret = SBD_FILEIO_FAILURE | vret; 779 rw_exit(&sl->sl_access_state_lock); 780 goto sbd_write_meta_failure; 781 } 782 } 783 rw_exit(&sl->sl_access_state_lock); 784 785 ret = SBD_SUCCESS; 786 787 sbd_write_meta_failure: 788 kmem_free(io_buf, io_size); 789 return (ret); 790 } 791 792 uint8_t 793 sbd_calc_sum(uint8_t *buf, int size) 794 { 795 uint8_t s = 0; 796 797 while (size > 0) 798 s += buf[--size]; 799 800 return (s); 801 } 802 803 uint8_t 804 sbd_calc_section_sum(sm_section_hdr_t *sm, uint32_t sz) 805 { 806 uint8_t s, o; 807 808 o = sm->sms_chksum; 809 sm->sms_chksum = 0; 810 s = sbd_calc_sum((uint8_t *)sm, sz); 811 sm->sms_chksum = o; 812 813 return (s); 814 } 815 816 uint32_t 817 sbd_strlen(char *str, uint32_t maxlen) 818 { 819 uint32_t i; 820 821 for (i = 0; i < maxlen; i++) { 822 if (str[i] == 0) 823 return (i); 824 } 825 return (i); 826 } 827 828 void 829 sbd_swap_meta_start(sbd_meta_start_t *sm) 830 { 831 if (sm->sm_magic == SBD_MAGIC) 832 return; 833 sm->sm_magic = BSWAP_64(sm->sm_magic); 834 sm->sm_meta_size = BSWAP_64(sm->sm_meta_size); 835 sm->sm_meta_size_used = BSWAP_64(sm->sm_meta_size_used); 836 sm->sm_ver_major = BSWAP_16(sm->sm_ver_major); 837 sm->sm_ver_minor = BSWAP_16(sm->sm_ver_minor); 838 sm->sm_ver_subminor = BSWAP_16(sm->sm_ver_subminor); 839 } 840 841 void 842 sbd_swap_section_hdr(sm_section_hdr_t *sm) 843 { 844 if (sm->sms_data_order == SMS_DATA_ORDER) 845 return; 846 sm->sms_offset = BSWAP_64(sm->sms_offset); 847 sm->sms_size = BSWAP_32(sm->sms_size); 848 sm->sms_id = BSWAP_16(sm->sms_id); 849 sm->sms_chksum += SMS_DATA_ORDER - sm->sms_data_order; 850 sm->sms_data_order = SMS_DATA_ORDER; 851 } 852 853 void 854 sbd_swap_lu_info_1_0(sbd_lu_info_1_0_t *sli) 855 { 856 sbd_swap_section_hdr(&sli->sli_sms_header); 857 if (sli->sli_data_order == SMS_DATA_ORDER) 858 return; 859 sli->sli_sms_header.sms_chksum += SMS_DATA_ORDER - sli->sli_data_order; 860 sli->sli_data_order = SMS_DATA_ORDER; 861 sli->sli_total_store_size = BSWAP_64(sli->sli_total_store_size); 862 sli->sli_total_meta_size = BSWAP_64(sli->sli_total_meta_size); 863 sli->sli_lu_data_offset = BSWAP_64(sli->sli_lu_data_offset); 864 sli->sli_lu_data_size = BSWAP_64(sli->sli_lu_data_size); 865 sli->sli_flags = BSWAP_32(sli->sli_flags); 866 sli->sli_blocksize = BSWAP_16(sli->sli_blocksize); 867 } 868 869 void 870 sbd_swap_lu_info_1_1(sbd_lu_info_1_1_t *sli) 871 { 872 sbd_swap_section_hdr(&sli->sli_sms_header); 873 if (sli->sli_data_order == SMS_DATA_ORDER) 874 return; 875 sli->sli_sms_header.sms_chksum += SMS_DATA_ORDER - sli->sli_data_order; 876 sli->sli_data_order = SMS_DATA_ORDER; 877 sli->sli_flags = BSWAP_32(sli->sli_flags); 878 sli->sli_lu_size = BSWAP_64(sli->sli_lu_size); 879 sli->sli_meta_fname_offset = BSWAP_64(sli->sli_meta_fname_offset); 880 sli->sli_data_fname_offset = BSWAP_64(sli->sli_data_fname_offset); 881 sli->sli_serial_offset = BSWAP_64(sli->sli_serial_offset); 882 sli->sli_alias_offset = BSWAP_64(sli->sli_alias_offset); 883 sli->sli_mgmt_url_offset = BSWAP_64(sli->sli_mgmt_url_offset); 884 } 885 886 sbd_status_t 887 sbd_load_section_hdr(sbd_lu_t *sl, sm_section_hdr_t *sms) 888 { 889 sm_section_hdr_t h; 890 uint64_t st; 891 sbd_status_t ret; 892 893 for (st = sl->sl_meta_offset + sizeof (sbd_meta_start_t); 894 st < sl->sl_meta_size_used; st += h.sms_size) { 895 if ((ret = sbd_read_meta(sl, st, sizeof (sm_section_hdr_t), 896 (uint8_t *)&h)) != SBD_SUCCESS) { 897 return (ret); 898 } 899 if (h.sms_data_order != SMS_DATA_ORDER) { 900 sbd_swap_section_hdr(&h); 901 } 902 if ((h.sms_data_order != SMS_DATA_ORDER) || 903 (h.sms_offset != st) || (h.sms_size < sizeof (h)) || 904 ((st + h.sms_size) > sl->sl_meta_size_used)) { 905 return (SBD_META_CORRUPTED); 906 } 907 if (h.sms_id == sms->sms_id) { 908 bcopy(&h, sms, sizeof (h)); 909 return (SBD_SUCCESS); 910 } 911 } 912 913 return (SBD_NOT_FOUND); 914 } 915 916 sbd_status_t 917 sbd_load_meta_start(sbd_lu_t *sl) 918 { 919 sbd_meta_start_t *sm; 920 sbd_status_t ret; 921 922 /* Fake meta params initially */ 923 sl->sl_total_meta_size = (uint64_t)-1; 924 sl->sl_meta_size_used = sl->sl_meta_offset + sizeof (sbd_meta_start_t); 925 926 sm = kmem_zalloc(sizeof (*sm), KM_SLEEP); 927 ret = sbd_read_meta(sl, sl->sl_meta_offset, sizeof (*sm), 928 (uint8_t *)sm); 929 if (ret != SBD_SUCCESS) { 930 goto load_meta_start_failed; 931 } 932 933 if (sm->sm_magic != SBD_MAGIC) { 934 sbd_swap_meta_start(sm); 935 } 936 937 if ((sm->sm_magic != SBD_MAGIC) || (sbd_calc_sum((uint8_t *)sm, 938 sizeof (*sm) - 1) != sm->sm_chksum)) { 939 ret = SBD_META_CORRUPTED; 940 goto load_meta_start_failed; 941 } 942 943 if (sm->sm_ver_major != SBD_VER_MAJOR) { 944 ret = SBD_NOT_SUPPORTED; 945 goto load_meta_start_failed; 946 } 947 948 sl->sl_total_meta_size = sm->sm_meta_size; 949 sl->sl_meta_size_used = sm->sm_meta_size_used; 950 ret = SBD_SUCCESS; 951 952 load_meta_start_failed: 953 kmem_free(sm, sizeof (*sm)); 954 return (ret); 955 } 956 957 sbd_status_t 958 sbd_write_meta_start(sbd_lu_t *sl, uint64_t meta_size, uint64_t meta_size_used) 959 { 960 sbd_meta_start_t *sm; 961 sbd_status_t ret; 962 963 sm = (sbd_meta_start_t *)kmem_zalloc(sizeof (sbd_meta_start_t), 964 KM_SLEEP); 965 966 sm->sm_magic = SBD_MAGIC; 967 sm->sm_meta_size = meta_size; 968 sm->sm_meta_size_used = meta_size_used; 969 sm->sm_ver_major = SBD_VER_MAJOR; 970 sm->sm_ver_minor = SBD_VER_MINOR; 971 sm->sm_ver_subminor = SBD_VER_SUBMINOR; 972 sm->sm_chksum = sbd_calc_sum((uint8_t *)sm, sizeof (*sm) - 1); 973 974 ret = sbd_write_meta(sl, sl->sl_meta_offset, sizeof (*sm), 975 (uint8_t *)sm); 976 kmem_free(sm, sizeof (*sm)); 977 978 return (ret); 979 } 980 981 sbd_status_t 982 sbd_read_meta_section(sbd_lu_t *sl, sm_section_hdr_t **ppsms, uint16_t sms_id) 983 { 984 sbd_status_t ret; 985 sm_section_hdr_t sms; 986 int alloced = 0; 987 988 mutex_enter(&sl->sl_metadata_lock); 989 if (((*ppsms) == NULL) || ((*ppsms)->sms_offset == 0)) { 990 bzero(&sms, sizeof (sm_section_hdr_t)); 991 sms.sms_id = sms_id; 992 if ((ret = sbd_load_section_hdr(sl, &sms)) != SBD_SUCCESS) { 993 mutex_exit(&sl->sl_metadata_lock); 994 return (ret); 995 } else { 996 if ((*ppsms) == NULL) { 997 *ppsms = (sm_section_hdr_t *)kmem_zalloc( 998 sms.sms_size, KM_SLEEP); 999 alloced = 1; 1000 } 1001 bcopy(&sms, *ppsms, sizeof (sm_section_hdr_t)); 1002 } 1003 } 1004 1005 ret = sbd_read_meta(sl, (*ppsms)->sms_offset, (*ppsms)->sms_size, 1006 (uint8_t *)(*ppsms)); 1007 if (ret == SBD_SUCCESS) { 1008 uint8_t s; 1009 if ((*ppsms)->sms_data_order != SMS_DATA_ORDER) 1010 sbd_swap_section_hdr(*ppsms); 1011 if ((*ppsms)->sms_id != SMS_ID_UNUSED) { 1012 s = sbd_calc_section_sum(*ppsms, (*ppsms)->sms_size); 1013 if (s != (*ppsms)->sms_chksum) 1014 ret = SBD_META_CORRUPTED; 1015 } 1016 } 1017 mutex_exit(&sl->sl_metadata_lock); 1018 1019 if ((ret != SBD_SUCCESS) && alloced) 1020 kmem_free(*ppsms, sms.sms_size); 1021 return (ret); 1022 } 1023 1024 sbd_status_t 1025 sbd_load_section_hdr_unbuffered(sbd_lu_t *sl, sm_section_hdr_t *sms) 1026 { 1027 sbd_status_t ret; 1028 1029 /* 1030 * Bypass buffering and re-read the meta data from permanent storage. 1031 */ 1032 if (sl->sl_flags & SL_ZFS_META) { 1033 if ((ret = sbd_open_zfs_meta(sl)) != SBD_SUCCESS) { 1034 return (ret); 1035 } 1036 } 1037 /* Re-get the meta sizes into sl */ 1038 if ((ret = sbd_load_meta_start(sl)) != SBD_SUCCESS) { 1039 return (ret); 1040 } 1041 return (sbd_load_section_hdr(sl, sms)); 1042 } 1043 1044 sbd_status_t 1045 sbd_write_meta_section(sbd_lu_t *sl, sm_section_hdr_t *sms) 1046 { 1047 sm_section_hdr_t t; 1048 uint64_t off, s; 1049 uint64_t unused_start; 1050 sbd_status_t ret; 1051 sbd_status_t write_meta_ret = SBD_SUCCESS; 1052 uint8_t *cb; 1053 int meta_size_changed = 0; 1054 sm_section_hdr_t sms_before_unused = {0}; 1055 1056 mutex_enter(&sl->sl_metadata_lock); 1057 write_meta_section_again: 1058 if (sms->sms_offset) { 1059 /* 1060 * If the section already exists and the size is the 1061 * same as this new data then overwrite in place. If 1062 * the sizes are different then mark the existing as 1063 * unused and look for free space. 1064 */ 1065 ret = sbd_read_meta(sl, sms->sms_offset, sizeof (t), 1066 (uint8_t *)&t); 1067 if (ret != SBD_SUCCESS) { 1068 mutex_exit(&sl->sl_metadata_lock); 1069 return (ret); 1070 } 1071 if (t.sms_data_order != SMS_DATA_ORDER) { 1072 sbd_swap_section_hdr(&t); 1073 } 1074 if (t.sms_id != sms->sms_id) { 1075 mutex_exit(&sl->sl_metadata_lock); 1076 return (SBD_INVALID_ARG); 1077 } 1078 if (t.sms_size == sms->sms_size) { 1079 ret = sbd_write_meta(sl, sms->sms_offset, 1080 sms->sms_size, (uint8_t *)sms); 1081 mutex_exit(&sl->sl_metadata_lock); 1082 return (ret); 1083 } 1084 sms_before_unused = t; 1085 1086 t.sms_id = SMS_ID_UNUSED; 1087 /* 1088 * For unused sections we only use chksum of the header. for 1089 * all other sections, the chksum is for the entire section. 1090 */ 1091 t.sms_chksum = sbd_calc_section_sum(&t, sizeof (t)); 1092 ret = sbd_write_meta(sl, t.sms_offset, sizeof (t), 1093 (uint8_t *)&t); 1094 if (ret != SBD_SUCCESS) { 1095 mutex_exit(&sl->sl_metadata_lock); 1096 return (ret); 1097 } 1098 sms->sms_offset = 0; 1099 } else { 1100 /* Section location is unknown, search for it. */ 1101 t.sms_id = sms->sms_id; 1102 t.sms_data_order = SMS_DATA_ORDER; 1103 ret = sbd_load_section_hdr(sl, &t); 1104 if (ret == SBD_SUCCESS) { 1105 sms->sms_offset = t.sms_offset; 1106 sms->sms_chksum = 1107 sbd_calc_section_sum(sms, sms->sms_size); 1108 goto write_meta_section_again; 1109 } else if (ret != SBD_NOT_FOUND) { 1110 mutex_exit(&sl->sl_metadata_lock); 1111 return (ret); 1112 } 1113 } 1114 1115 /* 1116 * At this point we know that section does not already exist. 1117 * Find space large enough to hold the section or grow meta if 1118 * possible. 1119 */ 1120 unused_start = 0; 1121 s = 0; /* size of space found */ 1122 1123 /* 1124 * Search all sections for unused space of sufficient size. 1125 * The first one found is taken. Contiguous unused sections 1126 * will be combined. 1127 */ 1128 for (off = sl->sl_meta_offset + sizeof (sbd_meta_start_t); 1129 off < sl->sl_meta_size_used; off += t.sms_size) { 1130 ret = sbd_read_meta(sl, off, sizeof (t), (uint8_t *)&t); 1131 if (ret != SBD_SUCCESS) { 1132 mutex_exit(&sl->sl_metadata_lock); 1133 return (ret); 1134 } 1135 if (t.sms_data_order != SMS_DATA_ORDER) 1136 sbd_swap_section_hdr(&t); 1137 if (t.sms_size == 0) { 1138 mutex_exit(&sl->sl_metadata_lock); 1139 return (SBD_META_CORRUPTED); 1140 } 1141 if (t.sms_id == SMS_ID_UNUSED) { 1142 if (unused_start == 0) 1143 unused_start = off; 1144 /* 1145 * Calculate size of the unused space, break out 1146 * if it satisfies the requirement. 1147 */ 1148 s = t.sms_size - unused_start + off; 1149 if ((s == sms->sms_size) || (s >= (sms->sms_size + 1150 sizeof (t)))) { 1151 break; 1152 } else { 1153 s = 0; 1154 } 1155 } else { 1156 unused_start = 0; 1157 } 1158 } 1159 1160 off = (unused_start == 0) ? sl->sl_meta_size_used : unused_start; 1161 /* 1162 * If none found, how much room is at the end? 1163 * See if the data can be expanded. 1164 */ 1165 if (s == 0) { 1166 s = sl->sl_total_meta_size - off; 1167 if (s >= sms->sms_size || !(sl->sl_flags & SL_SHARED_META)) { 1168 s = sms->sms_size; 1169 meta_size_changed = 1; 1170 } else { 1171 s = 0; 1172 } 1173 } 1174 1175 if (s == 0) { 1176 mutex_exit(&sl->sl_metadata_lock); 1177 return (SBD_ALLOC_FAILURE); 1178 } 1179 1180 sms->sms_offset = off; 1181 sms->sms_chksum = sbd_calc_section_sum(sms, sms->sms_size); 1182 /* 1183 * Since we may have to write more than one section (current + 1184 * any unused), use a combined buffer. 1185 */ 1186 cb = kmem_zalloc(s, KM_SLEEP); 1187 bcopy(sms, cb, sms->sms_size); 1188 if (s > sms->sms_size) { 1189 t.sms_offset = off + sms->sms_size; 1190 t.sms_size = s - sms->sms_size; 1191 t.sms_id = SMS_ID_UNUSED; 1192 t.sms_data_order = SMS_DATA_ORDER; 1193 t.sms_chksum = sbd_calc_section_sum(&t, sizeof (t)); 1194 bcopy(&t, cb + sms->sms_size, sizeof (t)); 1195 } 1196 /* 1197 * Two write events & statuses take place. Failure writing the 1198 * meta section takes precedence, can possibly be rolled back, 1199 * & gets reported. Else return status from writing the meta start. 1200 */ 1201 ret = SBD_SUCCESS; /* Set a default, it's not always loaded below. */ 1202 if (meta_size_changed) { 1203 uint64_t old_meta_size; 1204 uint64_t old_sz_used = sl->sl_meta_size_used; /* save a copy */ 1205 old_meta_size = sl->sl_total_meta_size; /* save a copy */ 1206 1207 write_meta_ret = sbd_write_meta(sl, off, s, cb); 1208 if (write_meta_ret == SBD_SUCCESS) { 1209 sl->sl_meta_size_used = off + s; 1210 if (sl->sl_total_meta_size < sl->sl_meta_size_used) { 1211 uint64_t meta_align = 1212 (((uint64_t)1) << 1213 sl->sl_meta_blocksize_shift) - 1; 1214 sl->sl_total_meta_size = 1215 (sl->sl_meta_size_used + meta_align) & 1216 (~meta_align); 1217 } 1218 ret = sbd_write_meta_start(sl, sl->sl_total_meta_size, 1219 sl->sl_meta_size_used); 1220 if (ret != SBD_SUCCESS) { 1221 sl->sl_meta_size_used = old_sz_used; 1222 sl->sl_total_meta_size = old_meta_size; 1223 } 1224 } else { 1225 sl->sl_meta_size_used = old_sz_used; 1226 sl->sl_total_meta_size = old_meta_size; 1227 } 1228 } else { 1229 write_meta_ret = sbd_write_meta(sl, off, s, cb); 1230 } 1231 if ((write_meta_ret != SBD_SUCCESS) && 1232 (sms_before_unused.sms_offset != 0)) { 1233 sm_section_hdr_t new_sms; 1234 sm_section_hdr_t *unused_sms; 1235 /* 1236 * On failure writing the meta section attempt to undo 1237 * the change to unused. 1238 * Re-read the meta data from permanent storage. 1239 * The section id can't exist for undo to be possible. 1240 * Read what should be the entire old section data and 1241 * insure the old data's still present by validating 1242 * against it's old checksum. 1243 */ 1244 new_sms.sms_id = sms->sms_id; 1245 new_sms.sms_data_order = SMS_DATA_ORDER; 1246 if (sbd_load_section_hdr_unbuffered(sl, &new_sms) != 1247 SBD_NOT_FOUND) { 1248 goto done; 1249 } 1250 unused_sms = kmem_zalloc(sms_before_unused.sms_size, KM_SLEEP); 1251 if (sbd_read_meta(sl, sms_before_unused.sms_offset, 1252 sms_before_unused.sms_size, 1253 (uint8_t *)unused_sms) != SBD_SUCCESS) { 1254 goto done; 1255 } 1256 if (unused_sms->sms_data_order != SMS_DATA_ORDER) { 1257 sbd_swap_section_hdr(unused_sms); 1258 } 1259 if (unused_sms->sms_id != SMS_ID_UNUSED) { 1260 goto done; 1261 } 1262 if (unused_sms->sms_offset != sms_before_unused.sms_offset) { 1263 goto done; 1264 } 1265 if (unused_sms->sms_size != sms_before_unused.sms_size) { 1266 goto done; 1267 } 1268 unused_sms->sms_id = sms_before_unused.sms_id; 1269 if (sbd_calc_section_sum(unused_sms, 1270 sizeof (sm_section_hdr_t)) != 1271 sbd_calc_section_sum(&sms_before_unused, 1272 sizeof (sm_section_hdr_t))) { 1273 goto done; 1274 } 1275 unused_sms->sms_chksum = 1276 sbd_calc_section_sum(unused_sms, unused_sms->sms_size); 1277 if (unused_sms->sms_chksum != sms_before_unused.sms_chksum) { 1278 goto done; 1279 } 1280 (void) sbd_write_meta(sl, unused_sms->sms_offset, 1281 sizeof (sm_section_hdr_t), (uint8_t *)unused_sms); 1282 } 1283 done: 1284 mutex_exit(&sl->sl_metadata_lock); 1285 kmem_free(cb, s); 1286 if (write_meta_ret != SBD_SUCCESS) { 1287 return (write_meta_ret); 1288 } 1289 return (ret); 1290 } 1291 1292 sbd_status_t 1293 sbd_write_lu_info(sbd_lu_t *sl) 1294 { 1295 sbd_lu_info_1_1_t *sli; 1296 int s; 1297 uint8_t *p; 1298 char *zvol_name = NULL; 1299 sbd_status_t ret; 1300 1301 mutex_enter(&sl->sl_lock); 1302 1303 s = sl->sl_serial_no_size; 1304 if ((sl->sl_flags & (SL_SHARED_META | SL_ZFS_META)) == 0) { 1305 if (sl->sl_data_filename) { 1306 s += strlen(sl->sl_data_filename) + 1; 1307 } 1308 } 1309 if (sl->sl_flags & SL_ZFS_META) { 1310 zvol_name = sbd_get_zvol_name(sl); 1311 s += strlen(zvol_name) + 1; 1312 } 1313 if (sl->sl_alias) { 1314 s += strlen(sl->sl_alias) + 1; 1315 } 1316 if (sl->sl_mgmt_url) { 1317 s += strlen(sl->sl_mgmt_url) + 1; 1318 } 1319 sli = (sbd_lu_info_1_1_t *)kmem_zalloc(sizeof (*sli) + s, KM_SLEEP); 1320 p = sli->sli_buf; 1321 if ((sl->sl_flags & (SL_SHARED_META | SL_ZFS_META)) == 0) { 1322 sli->sli_flags |= SLI_SEPARATE_META; 1323 (void) strcpy((char *)p, sl->sl_data_filename); 1324 sli->sli_data_fname_offset = 1325 (uintptr_t)p - (uintptr_t)sli->sli_buf; 1326 sli->sli_flags |= SLI_DATA_FNAME_VALID; 1327 p += strlen(sl->sl_data_filename) + 1; 1328 } 1329 if (sl->sl_flags & SL_ZFS_META) { 1330 (void) strcpy((char *)p, zvol_name); 1331 sli->sli_meta_fname_offset = 1332 (uintptr_t)p - (uintptr_t)sli->sli_buf; 1333 sli->sli_flags |= SLI_META_FNAME_VALID | SLI_ZFS_META; 1334 p += strlen(zvol_name) + 1; 1335 kmem_free(zvol_name, strlen(zvol_name) + 1); 1336 zvol_name = NULL; 1337 } 1338 if (sl->sl_alias) { 1339 (void) strcpy((char *)p, sl->sl_alias); 1340 sli->sli_alias_offset = 1341 (uintptr_t)p - (uintptr_t)sli->sli_buf; 1342 sli->sli_flags |= SLI_ALIAS_VALID; 1343 p += strlen(sl->sl_alias) + 1; 1344 } 1345 if (sl->sl_mgmt_url) { 1346 (void) strcpy((char *)p, sl->sl_mgmt_url); 1347 sli->sli_mgmt_url_offset = 1348 (uintptr_t)p - (uintptr_t)sli->sli_buf; 1349 sli->sli_flags |= SLI_MGMT_URL_VALID; 1350 p += strlen(sl->sl_mgmt_url) + 1; 1351 } 1352 if (sl->sl_flags & SL_WRITE_PROTECTED) { 1353 sli->sli_flags |= SLI_WRITE_PROTECTED; 1354 } 1355 if (sl->sl_flags & SL_SAVED_WRITE_CACHE_DISABLE) { 1356 sli->sli_flags |= SLI_WRITEBACK_CACHE_DISABLE; 1357 } 1358 if (sl->sl_flags & SL_VID_VALID) { 1359 bcopy(sl->sl_vendor_id, sli->sli_vid, 8); 1360 sli->sli_flags |= SLI_VID_VALID; 1361 } 1362 if (sl->sl_flags & SL_PID_VALID) { 1363 bcopy(sl->sl_product_id, sli->sli_pid, 16); 1364 sli->sli_flags |= SLI_PID_VALID; 1365 } 1366 if (sl->sl_flags & SL_REV_VALID) { 1367 bcopy(sl->sl_revision, sli->sli_rev, 4); 1368 sli->sli_flags |= SLI_REV_VALID; 1369 } 1370 if (sl->sl_serial_no_size) { 1371 bcopy(sl->sl_serial_no, p, sl->sl_serial_no_size); 1372 sli->sli_serial_size = sl->sl_serial_no_size; 1373 sli->sli_serial_offset = 1374 (uintptr_t)p - (uintptr_t)sli->sli_buf; 1375 sli->sli_flags |= SLI_SERIAL_VALID; 1376 p += sli->sli_serial_size; 1377 } 1378 sli->sli_lu_size = sl->sl_lu_size; 1379 sli->sli_data_blocksize_shift = sl->sl_data_blocksize_shift; 1380 sli->sli_data_order = SMS_DATA_ORDER; 1381 bcopy(sl->sl_device_id, sli->sli_device_id, 20); 1382 1383 sli->sli_sms_header.sms_size = sizeof (*sli) + s; 1384 sli->sli_sms_header.sms_id = SMS_ID_LU_INFO_1_1; 1385 sli->sli_sms_header.sms_data_order = SMS_DATA_ORDER; 1386 1387 mutex_exit(&sl->sl_lock); 1388 ret = sbd_write_meta_section(sl, (sm_section_hdr_t *)sli); 1389 kmem_free(sli, sizeof (*sli) + s); 1390 return (ret); 1391 } 1392 1393 /* 1394 * Will scribble SL_UNMAP_ENABLED into sl_flags if we succeed. 1395 */ 1396 static void 1397 do_unmap_setup(sbd_lu_t *sl) 1398 { 1399 ASSERT((sl->sl_flags & SL_UNMAP_ENABLED) == 0); 1400 1401 if ((sl->sl_flags & SL_ZFS_META) == 0) 1402 return; /* No UNMAP for you. */ 1403 1404 sl->sl_flags |= SL_UNMAP_ENABLED; 1405 } 1406 1407 int 1408 sbd_populate_and_register_lu(sbd_lu_t *sl, uint32_t *err_ret) 1409 { 1410 stmf_lu_t *lu = sl->sl_lu; 1411 stmf_status_t ret; 1412 1413 do_unmap_setup(sl); 1414 1415 lu->lu_id = (scsi_devid_desc_t *)sl->sl_device_id; 1416 if (sl->sl_alias) { 1417 lu->lu_alias = sl->sl_alias; 1418 } else { 1419 lu->lu_alias = sl->sl_name; 1420 } 1421 if (sl->sl_access_state == SBD_LU_STANDBY) { 1422 /* call set access state */ 1423 ret = stmf_set_lu_access(lu, STMF_LU_STANDBY); 1424 if (ret != STMF_SUCCESS) { 1425 *err_ret = SBD_RET_ACCESS_STATE_FAILED; 1426 return (EIO); 1427 } 1428 } 1429 /* set proxy_reg_cb_arg to meta filename */ 1430 if (sl->sl_meta_filename) { 1431 lu->lu_proxy_reg_arg = sl->sl_meta_filename; 1432 lu->lu_proxy_reg_arg_len = strlen(sl->sl_meta_filename) + 1; 1433 } else { 1434 lu->lu_proxy_reg_arg = sl->sl_data_filename; 1435 lu->lu_proxy_reg_arg_len = strlen(sl->sl_data_filename) + 1; 1436 } 1437 lu->lu_lp = sbd_lp; 1438 lu->lu_task_alloc = sbd_task_alloc; 1439 lu->lu_new_task = sbd_new_task; 1440 lu->lu_dbuf_xfer_done = sbd_dbuf_xfer_done; 1441 lu->lu_send_status_done = sbd_send_status_done; 1442 lu->lu_task_free = sbd_task_free; 1443 lu->lu_abort = sbd_abort; 1444 lu->lu_dbuf_free = sbd_dbuf_free; 1445 lu->lu_ctl = sbd_ctl; 1446 lu->lu_info = sbd_info; 1447 sl->sl_state = STMF_STATE_OFFLINE; 1448 1449 if ((ret = stmf_register_lu(lu)) != STMF_SUCCESS) { 1450 stmf_trace(0, "Failed to register with framework, ret=%llx", 1451 ret); 1452 if (ret == STMF_ALREADY) { 1453 *err_ret = SBD_RET_GUID_ALREADY_REGISTERED; 1454 } 1455 return (EIO); 1456 } 1457 1458 *err_ret = 0; 1459 return (0); 1460 } 1461 1462 int 1463 sbd_open_data_file(sbd_lu_t *sl, uint32_t *err_ret, int lu_size_valid, 1464 int vp_valid, int keep_open) 1465 { 1466 int ret; 1467 int flag; 1468 ulong_t nbits; 1469 uint64_t supported_size; 1470 vattr_t vattr; 1471 enum vtype vt; 1472 struct dk_cinfo dki; 1473 int unused; 1474 1475 mutex_enter(&sl->sl_lock); 1476 if (vp_valid) { 1477 goto odf_over_open; 1478 } 1479 if (sl->sl_data_filename[0] != '/') { 1480 *err_ret = SBD_RET_DATA_PATH_NOT_ABSOLUTE; 1481 mutex_exit(&sl->sl_lock); 1482 return (EINVAL); 1483 } 1484 if ((ret = lookupname(sl->sl_data_filename, UIO_SYSSPACE, FOLLOW, 1485 NULLVPP, &sl->sl_data_vp)) != 0) { 1486 *err_ret = SBD_RET_DATA_FILE_LOOKUP_FAILED; 1487 mutex_exit(&sl->sl_lock); 1488 return (ret); 1489 } 1490 sl->sl_data_vtype = vt = sl->sl_data_vp->v_type; 1491 VN_RELE(sl->sl_data_vp); 1492 if ((vt != VREG) && (vt != VCHR) && (vt != VBLK)) { 1493 *err_ret = SBD_RET_WRONG_DATA_FILE_TYPE; 1494 mutex_exit(&sl->sl_lock); 1495 return (EINVAL); 1496 } 1497 if (sl->sl_flags & SL_WRITE_PROTECTED) { 1498 flag = FREAD | FOFFMAX; 1499 } else { 1500 flag = FREAD | FWRITE | FOFFMAX | FEXCL; 1501 } 1502 if ((ret = vn_open(sl->sl_data_filename, UIO_SYSSPACE, flag, 0, 1503 &sl->sl_data_vp, 0, 0)) != 0) { 1504 *err_ret = SBD_RET_DATA_FILE_OPEN_FAILED; 1505 mutex_exit(&sl->sl_lock); 1506 return (ret); 1507 } 1508 odf_over_open: 1509 vattr.va_mask = AT_SIZE; 1510 if ((ret = VOP_GETATTR(sl->sl_data_vp, &vattr, 0, CRED(), NULL)) != 0) { 1511 *err_ret = SBD_RET_DATA_FILE_GETATTR_FAILED; 1512 goto odf_close_data_and_exit; 1513 } 1514 if ((vt != VREG) && (vattr.va_size == 0)) { 1515 /* 1516 * Its a zero byte block or char device. This cannot be 1517 * a raw disk. 1518 */ 1519 *err_ret = SBD_RET_WRONG_DATA_FILE_TYPE; 1520 ret = EINVAL; 1521 goto odf_close_data_and_exit; 1522 } 1523 /* sl_data_readable size includes any metadata. */ 1524 sl->sl_data_readable_size = vattr.va_size; 1525 1526 if (VOP_PATHCONF(sl->sl_data_vp, _PC_FILESIZEBITS, &nbits, 1527 CRED(), NULL) != 0) { 1528 nbits = 0; 1529 } 1530 /* nbits cannot be greater than 64 */ 1531 sl->sl_data_fs_nbits = (uint8_t)nbits; 1532 if (lu_size_valid) { 1533 sl->sl_total_data_size = sl->sl_lu_size; 1534 if (sl->sl_flags & SL_SHARED_META) { 1535 sl->sl_total_data_size += SHARED_META_DATA_SIZE; 1536 } 1537 if ((nbits > 0) && (nbits < 64)) { 1538 /* 1539 * The expression below is correct only if nbits is 1540 * positive and less than 64. 1541 */ 1542 supported_size = (((uint64_t)1) << nbits) - 1; 1543 if (sl->sl_total_data_size > supported_size) { 1544 *err_ret = SBD_RET_SIZE_NOT_SUPPORTED_BY_FS; 1545 ret = EINVAL; 1546 goto odf_close_data_and_exit; 1547 } 1548 } 1549 } else { 1550 sl->sl_total_data_size = vattr.va_size; 1551 if (sl->sl_flags & SL_SHARED_META) { 1552 if (vattr.va_size > SHARED_META_DATA_SIZE) { 1553 sl->sl_lu_size = vattr.va_size - 1554 SHARED_META_DATA_SIZE; 1555 } else { 1556 *err_ret = SBD_RET_FILE_SIZE_ERROR; 1557 ret = EINVAL; 1558 goto odf_close_data_and_exit; 1559 } 1560 } else { 1561 sl->sl_lu_size = vattr.va_size; 1562 } 1563 } 1564 if (sl->sl_lu_size < SBD_MIN_LU_SIZE) { 1565 *err_ret = SBD_RET_FILE_SIZE_ERROR; 1566 ret = EINVAL; 1567 goto odf_close_data_and_exit; 1568 } 1569 if (sl->sl_lu_size & 1570 ((((uint64_t)1) << sl->sl_data_blocksize_shift) - 1)) { 1571 *err_ret = SBD_RET_FILE_ALIGN_ERROR; 1572 ret = EINVAL; 1573 goto odf_close_data_and_exit; 1574 } 1575 /* 1576 * Get the minor device for direct zvol access 1577 */ 1578 if (sl->sl_flags & SL_ZFS_META) { 1579 if ((ret = VOP_IOCTL(sl->sl_data_vp, DKIOCINFO, (intptr_t)&dki, 1580 FKIOCTL, kcred, &unused, NULL)) != 0) { 1581 cmn_err(CE_WARN, "ioctl(DKIOCINFO) failed %d", ret); 1582 /* zvol reserves 0, so this would fail later */ 1583 sl->sl_zvol_minor = 0; 1584 } else { 1585 sl->sl_zvol_minor = dki.dki_unit; 1586 if (sbd_zvol_get_volume_params(sl) == 0) 1587 sl->sl_flags |= SL_CALL_ZVOL; 1588 } 1589 } 1590 sl->sl_flags |= SL_MEDIA_LOADED; 1591 mutex_exit(&sl->sl_lock); 1592 return (0); 1593 1594 odf_close_data_and_exit: 1595 if (!keep_open) { 1596 (void) VOP_CLOSE(sl->sl_data_vp, flag, 1, 0, CRED(), NULL); 1597 VN_RELE(sl->sl_data_vp); 1598 } 1599 mutex_exit(&sl->sl_lock); 1600 return (ret); 1601 } 1602 1603 void 1604 sbd_close_lu(sbd_lu_t *sl) 1605 { 1606 int flag; 1607 1608 if (((sl->sl_flags & SL_SHARED_META) == 0) && 1609 (sl->sl_flags & SL_META_OPENED)) { 1610 if (sl->sl_flags & SL_ZFS_META) { 1611 rw_destroy(&sl->sl_zfs_meta_lock); 1612 if (sl->sl_zfs_meta) { 1613 kmem_free(sl->sl_zfs_meta, ZAP_MAXVALUELEN / 2); 1614 sl->sl_zfs_meta = NULL; 1615 } 1616 } else { 1617 flag = FREAD | FWRITE | FOFFMAX | FEXCL; 1618 (void) VOP_CLOSE(sl->sl_meta_vp, flag, 1, 0, 1619 CRED(), NULL); 1620 VN_RELE(sl->sl_meta_vp); 1621 } 1622 sl->sl_flags &= ~SL_META_OPENED; 1623 } 1624 if (sl->sl_flags & SL_MEDIA_LOADED) { 1625 if (sl->sl_flags & SL_WRITE_PROTECTED) { 1626 flag = FREAD | FOFFMAX; 1627 } else { 1628 flag = FREAD | FWRITE | FOFFMAX | FEXCL; 1629 } 1630 (void) VOP_CLOSE(sl->sl_data_vp, flag, 1, 0, CRED(), NULL); 1631 VN_RELE(sl->sl_data_vp); 1632 sl->sl_flags &= ~SL_MEDIA_LOADED; 1633 if (sl->sl_flags & SL_SHARED_META) { 1634 sl->sl_flags &= ~SL_META_OPENED; 1635 } 1636 } 1637 } 1638 1639 int 1640 sbd_set_lu_standby(sbd_set_lu_standby_t *stlu, uint32_t *err_ret) 1641 { 1642 sbd_lu_t *sl; 1643 sbd_status_t sret; 1644 stmf_status_t stret; 1645 uint8_t old_access_state; 1646 1647 sret = sbd_find_and_lock_lu(stlu->stlu_guid, NULL, 1648 SL_OP_MODIFY_LU, &sl); 1649 if (sret != SBD_SUCCESS) { 1650 if (sret == SBD_BUSY) { 1651 *err_ret = SBD_RET_LU_BUSY; 1652 return (EBUSY); 1653 } else if (sret == SBD_NOT_FOUND) { 1654 *err_ret = SBD_RET_NOT_FOUND; 1655 return (ENOENT); 1656 } 1657 *err_ret = SBD_RET_ACCESS_STATE_FAILED; 1658 return (EIO); 1659 } 1660 1661 old_access_state = sl->sl_access_state; 1662 sl->sl_access_state = SBD_LU_TRANSITION_TO_STANDBY; 1663 stret = stmf_set_lu_access((stmf_lu_t *)sl->sl_lu, STMF_LU_STANDBY); 1664 if (stret != STMF_SUCCESS) { 1665 sl->sl_trans_op = SL_OP_NONE; 1666 *err_ret = SBD_RET_ACCESS_STATE_FAILED; 1667 sl->sl_access_state = old_access_state; 1668 return (EIO); 1669 } 1670 1671 /* 1672 * acquire the writer lock here to ensure we're not pulling 1673 * the rug from the vn_rdwr to the backing store 1674 */ 1675 rw_enter(&sl->sl_access_state_lock, RW_WRITER); 1676 sbd_close_lu(sl); 1677 rw_exit(&sl->sl_access_state_lock); 1678 1679 sl->sl_trans_op = SL_OP_NONE; 1680 return (0); 1681 } 1682 1683 int 1684 sbd_close_delete_lu(sbd_lu_t *sl, int ret) 1685 { 1686 1687 /* 1688 * acquire the writer lock here to ensure we're not pulling 1689 * the rug from the vn_rdwr to the backing store 1690 */ 1691 rw_enter(&sl->sl_access_state_lock, RW_WRITER); 1692 sbd_close_lu(sl); 1693 rw_exit(&sl->sl_access_state_lock); 1694 1695 if (sl->sl_flags & SL_LINKED) 1696 sbd_unlink_lu(sl); 1697 mutex_destroy(&sl->sl_metadata_lock); 1698 mutex_destroy(&sl->sl_lock); 1699 rw_destroy(&sl->sl_pgr->pgr_lock); 1700 rw_destroy(&sl->sl_access_state_lock); 1701 if (sl->sl_serial_no_alloc_size) { 1702 kmem_free(sl->sl_serial_no, sl->sl_serial_no_alloc_size); 1703 } 1704 if (sl->sl_data_fname_alloc_size) { 1705 kmem_free(sl->sl_data_filename, sl->sl_data_fname_alloc_size); 1706 } 1707 if (sl->sl_alias_alloc_size) { 1708 kmem_free(sl->sl_alias, sl->sl_alias_alloc_size); 1709 } 1710 if (sl->sl_mgmt_url_alloc_size) { 1711 kmem_free(sl->sl_mgmt_url, sl->sl_mgmt_url_alloc_size); 1712 } 1713 stmf_free(sl->sl_lu); 1714 return (ret); 1715 } 1716 1717 int 1718 sbd_create_register_lu(sbd_create_and_reg_lu_t *slu, int struct_sz, 1719 uint32_t *err_ret) 1720 { 1721 char *namebuf; 1722 sbd_lu_t *sl; 1723 stmf_lu_t *lu; 1724 char *p; 1725 int sz; 1726 int alloc_sz; 1727 int ret = EIO; 1728 int flag; 1729 int wcd = 0; 1730 uint32_t hid = 0; 1731 enum vtype vt; 1732 1733 sz = struct_sz - sizeof (sbd_create_and_reg_lu_t) + 8 + 1; 1734 1735 *err_ret = 0; 1736 1737 /* Lets validate various offsets */ 1738 if (((slu->slu_meta_fname_valid) && 1739 (slu->slu_meta_fname_off >= sz)) || 1740 (slu->slu_data_fname_off >= sz) || 1741 ((slu->slu_alias_valid) && 1742 (slu->slu_alias_off >= sz)) || 1743 ((slu->slu_mgmt_url_valid) && 1744 (slu->slu_mgmt_url_off >= sz)) || 1745 ((slu->slu_serial_valid) && 1746 ((slu->slu_serial_off + slu->slu_serial_size) >= sz))) { 1747 return (EINVAL); 1748 } 1749 1750 namebuf = kmem_zalloc(sz, KM_SLEEP); 1751 bcopy(slu->slu_buf, namebuf, sz - 1); 1752 namebuf[sz - 1] = 0; 1753 1754 alloc_sz = sizeof (sbd_lu_t) + sizeof (sbd_pgr_t); 1755 if (slu->slu_meta_fname_valid) { 1756 alloc_sz += strlen(namebuf + slu->slu_meta_fname_off) + 1; 1757 } 1758 alloc_sz += strlen(namebuf + slu->slu_data_fname_off) + 1; 1759 if (slu->slu_alias_valid) { 1760 alloc_sz += strlen(namebuf + slu->slu_alias_off) + 1; 1761 } 1762 if (slu->slu_mgmt_url_valid) { 1763 alloc_sz += strlen(namebuf + slu->slu_mgmt_url_off) + 1; 1764 } 1765 if (slu->slu_serial_valid) { 1766 alloc_sz += slu->slu_serial_size; 1767 } 1768 1769 lu = (stmf_lu_t *)stmf_alloc(STMF_STRUCT_STMF_LU, alloc_sz, 0); 1770 if (lu == NULL) { 1771 kmem_free(namebuf, sz); 1772 return (ENOMEM); 1773 } 1774 sl = (sbd_lu_t *)lu->lu_provider_private; 1775 bzero(sl, alloc_sz); 1776 sl->sl_lu = lu; 1777 sl->sl_alloc_size = alloc_sz; 1778 sl->sl_pgr = (sbd_pgr_t *)(sl + 1); 1779 rw_init(&sl->sl_pgr->pgr_lock, NULL, RW_DRIVER, NULL); 1780 mutex_init(&sl->sl_lock, NULL, MUTEX_DRIVER, NULL); 1781 mutex_init(&sl->sl_metadata_lock, NULL, MUTEX_DRIVER, NULL); 1782 rw_init(&sl->sl_access_state_lock, NULL, RW_DRIVER, NULL); 1783 p = ((char *)sl) + sizeof (sbd_lu_t) + sizeof (sbd_pgr_t); 1784 sl->sl_data_filename = p; 1785 (void) strcpy(sl->sl_data_filename, namebuf + slu->slu_data_fname_off); 1786 p += strlen(sl->sl_data_filename) + 1; 1787 sl->sl_meta_offset = SBD_META_OFFSET; 1788 sl->sl_access_state = SBD_LU_ACTIVE; 1789 if (slu->slu_meta_fname_valid) { 1790 sl->sl_alias = sl->sl_name = sl->sl_meta_filename = p; 1791 (void) strcpy(sl->sl_meta_filename, namebuf + 1792 slu->slu_meta_fname_off); 1793 p += strlen(sl->sl_meta_filename) + 1; 1794 } else { 1795 sl->sl_alias = sl->sl_name = sl->sl_data_filename; 1796 if (sbd_is_zvol(sl->sl_data_filename)) { 1797 sl->sl_flags |= SL_ZFS_META; 1798 sl->sl_meta_offset = 0; 1799 } else { 1800 sl->sl_flags |= SL_SHARED_META; 1801 sl->sl_data_offset = SHARED_META_DATA_SIZE; 1802 sl->sl_total_meta_size = SHARED_META_DATA_SIZE; 1803 sl->sl_meta_size_used = 0; 1804 } 1805 } 1806 if (slu->slu_alias_valid) { 1807 sl->sl_alias = p; 1808 (void) strcpy(p, namebuf + slu->slu_alias_off); 1809 p += strlen(sl->sl_alias) + 1; 1810 } 1811 if (slu->slu_mgmt_url_valid) { 1812 sl->sl_mgmt_url = p; 1813 (void) strcpy(p, namebuf + slu->slu_mgmt_url_off); 1814 p += strlen(sl->sl_mgmt_url) + 1; 1815 } 1816 if (slu->slu_serial_valid) { 1817 sl->sl_serial_no = (uint8_t *)p; 1818 bcopy(namebuf + slu->slu_serial_off, sl->sl_serial_no, 1819 slu->slu_serial_size); 1820 sl->sl_serial_no_size = slu->slu_serial_size; 1821 p += slu->slu_serial_size; 1822 } 1823 kmem_free(namebuf, sz); 1824 if (slu->slu_vid_valid) { 1825 bcopy(slu->slu_vid, sl->sl_vendor_id, 8); 1826 sl->sl_flags |= SL_VID_VALID; 1827 } 1828 if (slu->slu_pid_valid) { 1829 bcopy(slu->slu_pid, sl->sl_product_id, 16); 1830 sl->sl_flags |= SL_PID_VALID; 1831 } 1832 if (slu->slu_rev_valid) { 1833 bcopy(slu->slu_rev, sl->sl_revision, 4); 1834 sl->sl_flags |= SL_REV_VALID; 1835 } 1836 if (slu->slu_write_protected) { 1837 sl->sl_flags |= SL_WRITE_PROTECTED; 1838 } 1839 if (slu->slu_blksize_valid) { 1840 if (!ISP2(slu->slu_blksize) || 1841 (slu->slu_blksize > (32 * 1024)) || 1842 (slu->slu_blksize == 0)) { 1843 *err_ret = SBD_RET_INVALID_BLKSIZE; 1844 ret = EINVAL; 1845 goto scm_err_out; 1846 } 1847 while ((1 << sl->sl_data_blocksize_shift) != slu->slu_blksize) { 1848 sl->sl_data_blocksize_shift++; 1849 } 1850 } else { 1851 sl->sl_data_blocksize_shift = 9; /* 512 by default */ 1852 slu->slu_blksize = 512; 1853 } 1854 1855 /* Now lets start creating meta */ 1856 sl->sl_trans_op = SL_OP_CREATE_REGISTER_LU; 1857 if (sbd_link_lu(sl) != SBD_SUCCESS) { 1858 *err_ret = SBD_RET_FILE_ALREADY_REGISTERED; 1859 ret = EALREADY; 1860 goto scm_err_out; 1861 } 1862 1863 /* 1st focus on the data store */ 1864 if (slu->slu_lu_size_valid) { 1865 sl->sl_lu_size = slu->slu_lu_size; 1866 } 1867 ret = sbd_open_data_file(sl, err_ret, slu->slu_lu_size_valid, 0, 0); 1868 slu->slu_ret_filesize_nbits = sl->sl_data_fs_nbits; 1869 slu->slu_lu_size = sl->sl_lu_size; 1870 if (ret) { 1871 goto scm_err_out; 1872 } 1873 1874 /* 1875 * Check if we were explicitly asked to disable/enable write 1876 * cache on the device, otherwise get current device setting. 1877 */ 1878 if (slu->slu_writeback_cache_disable_valid) { 1879 if (slu->slu_writeback_cache_disable) { 1880 /* 1881 * Set write cache disable on the device. If it fails, 1882 * we'll support it using sync/flush. 1883 */ 1884 (void) sbd_wcd_set(1, sl); 1885 wcd = 1; 1886 } else { 1887 /* 1888 * Set write cache enable on the device. If it fails, 1889 * return an error. 1890 */ 1891 if (sbd_wcd_set(0, sl) != SBD_SUCCESS) { 1892 *err_ret = SBD_RET_WRITE_CACHE_SET_FAILED; 1893 ret = EFAULT; 1894 goto scm_err_out; 1895 } 1896 } 1897 } else { 1898 sbd_wcd_get(&wcd, sl); 1899 } 1900 1901 if (wcd) { 1902 sl->sl_flags |= SL_WRITEBACK_CACHE_DISABLE | 1903 SL_SAVED_WRITE_CACHE_DISABLE; 1904 } 1905 1906 if (sl->sl_flags & SL_SHARED_META) { 1907 goto over_meta_open; 1908 } 1909 if (sl->sl_flags & SL_ZFS_META) { 1910 if (sbd_create_zfs_meta_object(sl) != SBD_SUCCESS) { 1911 *err_ret = SBD_RET_ZFS_META_CREATE_FAILED; 1912 ret = ENOMEM; 1913 goto scm_err_out; 1914 } 1915 sl->sl_meta_blocksize_shift = 0; 1916 goto over_meta_create; 1917 } 1918 if ((ret = lookupname(sl->sl_meta_filename, UIO_SYSSPACE, FOLLOW, 1919 NULLVPP, &sl->sl_meta_vp)) != 0) { 1920 *err_ret = SBD_RET_META_FILE_LOOKUP_FAILED; 1921 goto scm_err_out; 1922 } 1923 sl->sl_meta_vtype = vt = sl->sl_meta_vp->v_type; 1924 VN_RELE(sl->sl_meta_vp); 1925 if ((vt != VREG) && (vt != VCHR) && (vt != VBLK)) { 1926 *err_ret = SBD_RET_WRONG_META_FILE_TYPE; 1927 ret = EINVAL; 1928 goto scm_err_out; 1929 } 1930 if (vt == VREG) { 1931 sl->sl_meta_blocksize_shift = 0; 1932 } else { 1933 sl->sl_meta_blocksize_shift = 9; 1934 } 1935 flag = FREAD | FWRITE | FOFFMAX | FEXCL; 1936 if ((ret = vn_open(sl->sl_meta_filename, UIO_SYSSPACE, flag, 0, 1937 &sl->sl_meta_vp, 0, 0)) != 0) { 1938 *err_ret = SBD_RET_META_FILE_OPEN_FAILED; 1939 goto scm_err_out; 1940 } 1941 over_meta_create: 1942 sl->sl_total_meta_size = sl->sl_meta_offset + sizeof (sbd_meta_start_t); 1943 sl->sl_total_meta_size += 1944 (((uint64_t)1) << sl->sl_meta_blocksize_shift) - 1; 1945 sl->sl_total_meta_size &= 1946 ~((((uint64_t)1) << sl->sl_meta_blocksize_shift) - 1); 1947 sl->sl_meta_size_used = 0; 1948 over_meta_open: 1949 sl->sl_flags |= SL_META_OPENED; 1950 1951 sl->sl_device_id[3] = 16; 1952 if (slu->slu_guid_valid) { 1953 sl->sl_device_id[0] = 0xf1; 1954 sl->sl_device_id[1] = 3; 1955 sl->sl_device_id[2] = 0; 1956 bcopy(slu->slu_guid, sl->sl_device_id + 4, 16); 1957 } else { 1958 if (slu->slu_host_id_valid) 1959 hid = slu->slu_host_id; 1960 if (!slu->slu_company_id_valid) 1961 slu->slu_company_id = COMPANY_ID_SUN; 1962 if (stmf_scsilib_uniq_lu_id2(slu->slu_company_id, hid, 1963 (scsi_devid_desc_t *)&sl->sl_device_id[0]) != 1964 STMF_SUCCESS) { 1965 *err_ret = SBD_RET_META_CREATION_FAILED; 1966 ret = EIO; 1967 goto scm_err_out; 1968 } 1969 bcopy(sl->sl_device_id + 4, slu->slu_guid, 16); 1970 } 1971 1972 /* Lets create the meta now */ 1973 mutex_enter(&sl->sl_metadata_lock); 1974 if (sbd_write_meta_start(sl, sl->sl_total_meta_size, 1975 sizeof (sbd_meta_start_t)) != SBD_SUCCESS) { 1976 mutex_exit(&sl->sl_metadata_lock); 1977 *err_ret = SBD_RET_META_CREATION_FAILED; 1978 ret = EIO; 1979 goto scm_err_out; 1980 } 1981 mutex_exit(&sl->sl_metadata_lock); 1982 sl->sl_meta_size_used = sl->sl_meta_offset + sizeof (sbd_meta_start_t); 1983 1984 if (sbd_write_lu_info(sl) != SBD_SUCCESS) { 1985 *err_ret = SBD_RET_META_CREATION_FAILED; 1986 ret = EIO; 1987 goto scm_err_out; 1988 } 1989 1990 if (sbd_pgr_meta_init(sl) != SBD_SUCCESS) { 1991 *err_ret = SBD_RET_META_CREATION_FAILED; 1992 ret = EIO; 1993 goto scm_err_out; 1994 } 1995 1996 /* 1997 * Update the zvol separately as this need only be called upon 1998 * completion of the metadata initialization. 1999 */ 2000 if (sl->sl_flags & SL_ZFS_META) { 2001 if (sbd_update_zfs_prop(sl) != SBD_SUCCESS) { 2002 *err_ret = SBD_RET_META_CREATION_FAILED; 2003 ret = EIO; 2004 goto scm_err_out; 2005 } 2006 } 2007 2008 ret = sbd_populate_and_register_lu(sl, err_ret); 2009 if (ret) { 2010 goto scm_err_out; 2011 } 2012 2013 sl->sl_trans_op = SL_OP_NONE; 2014 atomic_inc_32(&sbd_lu_count); 2015 return (0); 2016 2017 scm_err_out: 2018 return (sbd_close_delete_lu(sl, ret)); 2019 } 2020 2021 stmf_status_t 2022 sbd_proxy_msg(uint8_t *luid, void *proxy_arg, uint32_t proxy_arg_len, 2023 uint32_t type) 2024 { 2025 switch (type) { 2026 case STMF_MSG_LU_ACTIVE: 2027 return (sbd_proxy_reg_lu(luid, proxy_arg, 2028 proxy_arg_len)); 2029 case STMF_MSG_LU_REGISTER: 2030 return (sbd_proxy_reg_lu(luid, proxy_arg, 2031 proxy_arg_len)); 2032 case STMF_MSG_LU_DEREGISTER: 2033 return (sbd_proxy_dereg_lu(luid, proxy_arg, 2034 proxy_arg_len)); 2035 default: 2036 return (STMF_INVALID_ARG); 2037 } 2038 } 2039 2040 2041 /* 2042 * register a standby logical unit 2043 * proxy_reg_arg contains the meta filename 2044 */ 2045 stmf_status_t 2046 sbd_proxy_reg_lu(uint8_t *luid, void *proxy_reg_arg, uint32_t proxy_reg_arg_len) 2047 { 2048 sbd_lu_t *sl; 2049 sbd_status_t sret; 2050 sbd_create_standby_lu_t *stlu; 2051 int alloc_sz; 2052 uint32_t err_ret = 0; 2053 stmf_status_t stret = STMF_SUCCESS; 2054 2055 if (luid == NULL) { 2056 return (STMF_INVALID_ARG); 2057 } 2058 2059 do { 2060 sret = sbd_find_and_lock_lu(luid, NULL, SL_OP_MODIFY_LU, &sl); 2061 } while (sret == SBD_BUSY); 2062 2063 if (sret == SBD_NOT_FOUND) { 2064 alloc_sz = sizeof (*stlu) + proxy_reg_arg_len - 8; 2065 stlu = (sbd_create_standby_lu_t *)kmem_zalloc(alloc_sz, 2066 KM_SLEEP); 2067 bcopy(luid, stlu->stlu_guid, 16); 2068 if (proxy_reg_arg_len) { 2069 bcopy(proxy_reg_arg, stlu->stlu_meta_fname, 2070 proxy_reg_arg_len); 2071 stlu->stlu_meta_fname_size = proxy_reg_arg_len; 2072 } 2073 if (sbd_create_standby_lu(stlu, &err_ret) != 0) { 2074 cmn_err(CE_WARN, 2075 "Unable to create standby logical unit for %s", 2076 stlu->stlu_meta_fname); 2077 stret = STMF_FAILURE; 2078 } 2079 kmem_free(stlu, alloc_sz); 2080 return (stret); 2081 } else if (sret == SBD_SUCCESS) { 2082 /* 2083 * if the lu is already registered, then the lu should now 2084 * be in standby mode 2085 */ 2086 sbd_it_data_t *it; 2087 if (sl->sl_access_state != SBD_LU_STANDBY) { 2088 mutex_enter(&sl->sl_lock); 2089 sl->sl_access_state = SBD_LU_STANDBY; 2090 for (it = sl->sl_it_list; it != NULL; 2091 it = it->sbd_it_next) { 2092 it->sbd_it_ua_conditions |= 2093 SBD_UA_ASYMMETRIC_ACCESS_CHANGED; 2094 it->sbd_it_flags &= 2095 ~SBD_IT_HAS_SCSI2_RESERVATION; 2096 sl->sl_flags &= ~SL_LU_HAS_SCSI2_RESERVATION; 2097 } 2098 mutex_exit(&sl->sl_lock); 2099 sbd_pgr_reset(sl); 2100 } 2101 sl->sl_trans_op = SL_OP_NONE; 2102 } else { 2103 cmn_err(CE_WARN, "could not find and lock logical unit"); 2104 stret = STMF_FAILURE; 2105 } 2106 out: 2107 return (stret); 2108 } 2109 2110 /* ARGSUSED */ 2111 stmf_status_t 2112 sbd_proxy_dereg_lu(uint8_t *luid, void *proxy_reg_arg, 2113 uint32_t proxy_reg_arg_len) 2114 { 2115 sbd_delete_lu_t dlu = {0}; 2116 uint32_t err_ret; 2117 2118 if (luid == NULL) { 2119 cmn_err(CE_WARN, "de-register lu request had null luid"); 2120 return (STMF_INVALID_ARG); 2121 } 2122 2123 bcopy(luid, &dlu.dlu_guid, 16); 2124 2125 if (sbd_delete_lu(&dlu, (int)sizeof (dlu), &err_ret) != 0) { 2126 cmn_err(CE_WARN, "failed to delete de-register lu request"); 2127 return (STMF_FAILURE); 2128 } 2129 2130 return (STMF_SUCCESS); 2131 } 2132 2133 int 2134 sbd_create_standby_lu(sbd_create_standby_lu_t *slu, uint32_t *err_ret) 2135 { 2136 sbd_lu_t *sl; 2137 stmf_lu_t *lu; 2138 int ret = EIO; 2139 int alloc_sz; 2140 2141 alloc_sz = sizeof (sbd_lu_t) + sizeof (sbd_pgr_t) + 2142 slu->stlu_meta_fname_size; 2143 lu = (stmf_lu_t *)stmf_alloc(STMF_STRUCT_STMF_LU, alloc_sz, 0); 2144 if (lu == NULL) { 2145 return (ENOMEM); 2146 } 2147 sl = (sbd_lu_t *)lu->lu_provider_private; 2148 bzero(sl, alloc_sz); 2149 sl->sl_lu = lu; 2150 sl->sl_alloc_size = alloc_sz; 2151 2152 sl->sl_pgr = (sbd_pgr_t *)(sl + 1); 2153 sl->sl_meta_filename = ((char *)sl) + sizeof (sbd_lu_t) + 2154 sizeof (sbd_pgr_t); 2155 2156 if (slu->stlu_meta_fname_size > 0) { 2157 (void) strcpy(sl->sl_meta_filename, slu->stlu_meta_fname); 2158 } 2159 sl->sl_name = sl->sl_meta_filename; 2160 2161 sl->sl_device_id[3] = 16; 2162 sl->sl_device_id[0] = 0xf1; 2163 sl->sl_device_id[1] = 3; 2164 sl->sl_device_id[2] = 0; 2165 bcopy(slu->stlu_guid, sl->sl_device_id + 4, 16); 2166 lu->lu_id = (scsi_devid_desc_t *)sl->sl_device_id; 2167 sl->sl_access_state = SBD_LU_STANDBY; 2168 2169 rw_init(&sl->sl_pgr->pgr_lock, NULL, RW_DRIVER, NULL); 2170 mutex_init(&sl->sl_lock, NULL, MUTEX_DRIVER, NULL); 2171 mutex_init(&sl->sl_metadata_lock, NULL, MUTEX_DRIVER, NULL); 2172 rw_init(&sl->sl_access_state_lock, NULL, RW_DRIVER, NULL); 2173 2174 sl->sl_trans_op = SL_OP_CREATE_REGISTER_LU; 2175 2176 if (sbd_link_lu(sl) != SBD_SUCCESS) { 2177 *err_ret = SBD_RET_FILE_ALREADY_REGISTERED; 2178 ret = EALREADY; 2179 goto scs_err_out; 2180 } 2181 2182 ret = sbd_populate_and_register_lu(sl, err_ret); 2183 if (ret) { 2184 goto scs_err_out; 2185 } 2186 2187 sl->sl_trans_op = SL_OP_NONE; 2188 atomic_inc_32(&sbd_lu_count); 2189 return (0); 2190 2191 scs_err_out: 2192 return (sbd_close_delete_lu(sl, ret)); 2193 } 2194 2195 int 2196 sbd_load_sli_1_0(sbd_lu_t *sl, uint32_t *err_ret) 2197 { 2198 sbd_lu_info_1_0_t *sli = NULL; 2199 sbd_status_t sret; 2200 2201 sret = sbd_read_meta_section(sl, (sm_section_hdr_t **)&sli, 2202 SMS_ID_LU_INFO_1_0); 2203 2204 if (sret != SBD_SUCCESS) { 2205 *err_ret = SBD_RET_NO_META; 2206 return (EIO); 2207 } 2208 if (sli->sli_data_order != SMS_DATA_ORDER) { 2209 sbd_swap_lu_info_1_0(sli); 2210 if (sli->sli_data_order != SMS_DATA_ORDER) { 2211 kmem_free(sli, sli->sli_sms_header.sms_size); 2212 *err_ret = SBD_RET_NO_META; 2213 return (EIO); 2214 } 2215 } 2216 2217 sl->sl_flags |= SL_SHARED_META; 2218 sl->sl_data_blocksize_shift = 9; 2219 sl->sl_data_offset = SHARED_META_DATA_SIZE; 2220 sl->sl_lu_size = sli->sli_total_store_size - SHARED_META_DATA_SIZE; 2221 sl->sl_total_data_size = SHARED_META_DATA_SIZE + sl->sl_lu_size; 2222 bcopy(sli->sli_lu_devid, sl->sl_device_id, 20); 2223 2224 kmem_free(sli, sli->sli_sms_header.sms_size); 2225 return (0); 2226 } 2227 2228 int 2229 sbd_import_lu(sbd_import_lu_t *ilu, int struct_sz, uint32_t *err_ret, 2230 int no_register, sbd_lu_t **slr) 2231 { 2232 stmf_lu_t *lu; 2233 sbd_lu_t *sl; 2234 sbd_lu_info_1_1_t *sli = NULL; 2235 int asz; 2236 int ret = 0; 2237 stmf_status_t stret; 2238 int flag; 2239 int wcd = 0; 2240 int data_opened; 2241 uint16_t sli_buf_sz; 2242 uint8_t *sli_buf_copy = NULL; 2243 enum vtype vt; 2244 int standby = 0; 2245 sbd_status_t sret; 2246 2247 if (no_register && slr == NULL) { 2248 return (EINVAL); 2249 } 2250 ilu->ilu_meta_fname[struct_sz - sizeof (*ilu) + 8 - 1] = 0; 2251 /* 2252 * check whether logical unit is already registered ALUA 2253 * For a standby logical unit, the meta filename is set. Use 2254 * that to search for an existing logical unit. 2255 */ 2256 sret = sbd_find_and_lock_lu(NULL, (uint8_t *)&(ilu->ilu_meta_fname), 2257 SL_OP_IMPORT_LU, &sl); 2258 2259 if (sret == SBD_SUCCESS) { 2260 if (sl->sl_access_state != SBD_LU_ACTIVE) { 2261 no_register = 1; 2262 standby = 1; 2263 lu = sl->sl_lu; 2264 if (sl->sl_alias_alloc_size) { 2265 kmem_free(sl->sl_alias, 2266 sl->sl_alias_alloc_size); 2267 sl->sl_alias_alloc_size = 0; 2268 sl->sl_alias = NULL; 2269 lu->lu_alias = NULL; 2270 } 2271 if (sl->sl_meta_filename == NULL) { 2272 sl->sl_meta_filename = sl->sl_data_filename; 2273 } else if (sl->sl_data_fname_alloc_size) { 2274 kmem_free(sl->sl_data_filename, 2275 sl->sl_data_fname_alloc_size); 2276 sl->sl_data_fname_alloc_size = 0; 2277 } 2278 if (sl->sl_serial_no_alloc_size) { 2279 kmem_free(sl->sl_serial_no, 2280 sl->sl_serial_no_alloc_size); 2281 sl->sl_serial_no_alloc_size = 0; 2282 } 2283 if (sl->sl_mgmt_url_alloc_size) { 2284 kmem_free(sl->sl_mgmt_url, 2285 sl->sl_mgmt_url_alloc_size); 2286 sl->sl_mgmt_url_alloc_size = 0; 2287 } 2288 } else { 2289 *err_ret = SBD_RET_FILE_ALREADY_REGISTERED; 2290 bcopy(sl->sl_device_id + 4, ilu->ilu_ret_guid, 16); 2291 sl->sl_trans_op = SL_OP_NONE; 2292 return (EALREADY); 2293 } 2294 } else if (sret == SBD_NOT_FOUND) { 2295 asz = strlen(ilu->ilu_meta_fname) + 1; 2296 2297 lu = (stmf_lu_t *)stmf_alloc(STMF_STRUCT_STMF_LU, 2298 sizeof (sbd_lu_t) + sizeof (sbd_pgr_t) + asz, 0); 2299 if (lu == NULL) { 2300 return (ENOMEM); 2301 } 2302 sl = (sbd_lu_t *)lu->lu_provider_private; 2303 bzero(sl, sizeof (*sl)); 2304 sl->sl_lu = lu; 2305 sl->sl_pgr = (sbd_pgr_t *)(sl + 1); 2306 sl->sl_meta_filename = ((char *)sl) + sizeof (*sl) + 2307 sizeof (sbd_pgr_t); 2308 (void) strcpy(sl->sl_meta_filename, ilu->ilu_meta_fname); 2309 sl->sl_name = sl->sl_meta_filename; 2310 rw_init(&sl->sl_pgr->pgr_lock, NULL, RW_DRIVER, NULL); 2311 rw_init(&sl->sl_access_state_lock, NULL, RW_DRIVER, NULL); 2312 mutex_init(&sl->sl_lock, NULL, MUTEX_DRIVER, NULL); 2313 mutex_init(&sl->sl_metadata_lock, NULL, MUTEX_DRIVER, NULL); 2314 sl->sl_trans_op = SL_OP_IMPORT_LU; 2315 } else { 2316 *err_ret = SBD_RET_META_FILE_LOOKUP_FAILED; 2317 return (EIO); 2318 } 2319 2320 /* we're only loading the metadata */ 2321 if (!no_register) { 2322 if (sbd_link_lu(sl) != SBD_SUCCESS) { 2323 *err_ret = SBD_RET_FILE_ALREADY_REGISTERED; 2324 bcopy(sl->sl_device_id + 4, ilu->ilu_ret_guid, 16); 2325 ret = EALREADY; 2326 goto sim_err_out; 2327 } 2328 } 2329 if ((ret = lookupname(sl->sl_meta_filename, UIO_SYSSPACE, FOLLOW, 2330 NULLVPP, &sl->sl_meta_vp)) != 0) { 2331 *err_ret = SBD_RET_META_FILE_LOOKUP_FAILED; 2332 goto sim_err_out; 2333 } 2334 if (sbd_is_zvol(sl->sl_meta_filename)) { 2335 sl->sl_flags |= SL_ZFS_META; 2336 sl->sl_data_filename = sl->sl_meta_filename; 2337 } 2338 sl->sl_meta_vtype = vt = sl->sl_meta_vp->v_type; 2339 VN_RELE(sl->sl_meta_vp); 2340 if ((vt != VREG) && (vt != VCHR) && (vt != VBLK)) { 2341 *err_ret = SBD_RET_WRONG_META_FILE_TYPE; 2342 ret = EINVAL; 2343 goto sim_err_out; 2344 } 2345 if (sl->sl_flags & SL_ZFS_META) { 2346 if (sbd_open_zfs_meta(sl) != SBD_SUCCESS) { 2347 /* let see if metadata is in the 64k block */ 2348 sl->sl_flags &= ~SL_ZFS_META; 2349 } 2350 } 2351 if (!(sl->sl_flags & SL_ZFS_META)) { 2352 /* metadata is always writable */ 2353 flag = FREAD | FWRITE | FOFFMAX | FEXCL; 2354 if ((ret = vn_open(sl->sl_meta_filename, UIO_SYSSPACE, flag, 0, 2355 &sl->sl_meta_vp, 0, 0)) != 0) { 2356 *err_ret = SBD_RET_META_FILE_OPEN_FAILED; 2357 goto sim_err_out; 2358 } 2359 } 2360 if ((sl->sl_flags & SL_ZFS_META) || (vt == VREG)) { 2361 sl->sl_meta_blocksize_shift = 0; 2362 } else { 2363 sl->sl_meta_blocksize_shift = 9; 2364 } 2365 sl->sl_meta_offset = (sl->sl_flags & SL_ZFS_META) ? 0 : SBD_META_OFFSET; 2366 sl->sl_flags |= SL_META_OPENED; 2367 2368 mutex_enter(&sl->sl_metadata_lock); 2369 sret = sbd_load_meta_start(sl); 2370 mutex_exit(&sl->sl_metadata_lock); 2371 if (sret != SBD_SUCCESS) { 2372 if (sret == SBD_META_CORRUPTED) { 2373 *err_ret = SBD_RET_NO_META; 2374 } else if (sret == SBD_NOT_SUPPORTED) { 2375 *err_ret = SBD_RET_VERSION_NOT_SUPPORTED; 2376 } else { 2377 *err_ret = SBD_RET_NO_META; 2378 } 2379 ret = EINVAL; 2380 goto sim_err_out; 2381 } 2382 2383 /* Now lets see if we can read the most recent LU info */ 2384 sret = sbd_read_meta_section(sl, (sm_section_hdr_t **)&sli, 2385 SMS_ID_LU_INFO_1_1); 2386 if ((sret == SBD_NOT_FOUND) && ((sl->sl_flags & SL_ZFS_META) == 0)) { 2387 ret = sbd_load_sli_1_0(sl, err_ret); 2388 if (ret) { 2389 goto sim_err_out; 2390 } 2391 goto sim_sli_loaded; 2392 } 2393 if (sret != SBD_SUCCESS) { 2394 *err_ret = SBD_RET_NO_META; 2395 ret = EIO; 2396 goto sim_err_out; 2397 } 2398 /* load sli 1.1 */ 2399 if (sli->sli_data_order != SMS_DATA_ORDER) { 2400 sbd_swap_lu_info_1_1(sli); 2401 if (sli->sli_data_order != SMS_DATA_ORDER) { 2402 *err_ret = SBD_RET_NO_META; 2403 ret = EIO; 2404 goto sim_err_out; 2405 } 2406 } 2407 2408 sli_buf_sz = sli->sli_sms_header.sms_size - 2409 sizeof (sbd_lu_info_1_1_t) + 8; 2410 sli_buf_copy = kmem_alloc(sli_buf_sz + 1, KM_SLEEP); 2411 bcopy(sli->sli_buf, sli_buf_copy, sli_buf_sz); 2412 sli_buf_copy[sli_buf_sz] = 0; 2413 2414 /* Make sure all the offsets are within limits */ 2415 if (((sli->sli_flags & SLI_META_FNAME_VALID) && 2416 (sli->sli_meta_fname_offset > sli_buf_sz)) || 2417 ((sli->sli_flags & SLI_DATA_FNAME_VALID) && 2418 (sli->sli_data_fname_offset > sli_buf_sz)) || 2419 ((sli->sli_flags & SLI_MGMT_URL_VALID) && 2420 (sli->sli_mgmt_url_offset > sli_buf_sz)) || 2421 ((sli->sli_flags & SLI_SERIAL_VALID) && 2422 ((sli->sli_serial_offset + sli->sli_serial_size) > sli_buf_sz)) || 2423 ((sli->sli_flags & SLI_ALIAS_VALID) && 2424 (sli->sli_alias_offset > sli_buf_sz))) { 2425 *err_ret = SBD_RET_NO_META; 2426 ret = EIO; 2427 goto sim_err_out; 2428 } 2429 2430 sl->sl_lu_size = sli->sli_lu_size; 2431 sl->sl_data_blocksize_shift = sli->sli_data_blocksize_shift; 2432 bcopy(sli->sli_device_id, sl->sl_device_id, 20); 2433 if (sli->sli_flags & SLI_SERIAL_VALID) { 2434 sl->sl_serial_no_size = sl->sl_serial_no_alloc_size = 2435 sli->sli_serial_size; 2436 sl->sl_serial_no = kmem_zalloc(sli->sli_serial_size, KM_SLEEP); 2437 bcopy(sli_buf_copy + sli->sli_serial_offset, sl->sl_serial_no, 2438 sl->sl_serial_no_size); 2439 } 2440 if (sli->sli_flags & SLI_SEPARATE_META) { 2441 sl->sl_total_data_size = sl->sl_lu_size; 2442 if (sli->sli_flags & SLI_DATA_FNAME_VALID) { 2443 sl->sl_data_fname_alloc_size = strlen((char *) 2444 sli_buf_copy + sli->sli_data_fname_offset) + 1; 2445 sl->sl_data_filename = kmem_zalloc( 2446 sl->sl_data_fname_alloc_size, KM_SLEEP); 2447 (void) strcpy(sl->sl_data_filename, 2448 (char *)sli_buf_copy + sli->sli_data_fname_offset); 2449 } 2450 } else { 2451 if (sl->sl_flags & SL_ZFS_META) { 2452 sl->sl_total_data_size = sl->sl_lu_size; 2453 sl->sl_data_offset = 0; 2454 } else { 2455 sl->sl_total_data_size = 2456 sl->sl_lu_size + SHARED_META_DATA_SIZE; 2457 sl->sl_data_offset = SHARED_META_DATA_SIZE; 2458 sl->sl_flags |= SL_SHARED_META; 2459 } 2460 } 2461 if (sli->sli_flags & SLI_ALIAS_VALID) { 2462 sl->sl_alias_alloc_size = strlen((char *)sli_buf_copy + 2463 sli->sli_alias_offset) + 1; 2464 sl->sl_alias = kmem_alloc(sl->sl_alias_alloc_size, KM_SLEEP); 2465 (void) strcpy(sl->sl_alias, (char *)sli_buf_copy + 2466 sli->sli_alias_offset); 2467 } 2468 if (sli->sli_flags & SLI_MGMT_URL_VALID) { 2469 sl->sl_mgmt_url_alloc_size = strlen((char *)sli_buf_copy + 2470 sli->sli_mgmt_url_offset) + 1; 2471 sl->sl_mgmt_url = kmem_alloc(sl->sl_mgmt_url_alloc_size, 2472 KM_SLEEP); 2473 (void) strcpy(sl->sl_mgmt_url, (char *)sli_buf_copy + 2474 sli->sli_mgmt_url_offset); 2475 } 2476 if (sli->sli_flags & SLI_WRITE_PROTECTED) { 2477 sl->sl_flags |= SL_WRITE_PROTECTED; 2478 } 2479 if (sli->sli_flags & SLI_VID_VALID) { 2480 sl->sl_flags |= SL_VID_VALID; 2481 bcopy(sli->sli_vid, sl->sl_vendor_id, 8); 2482 } 2483 if (sli->sli_flags & SLI_PID_VALID) { 2484 sl->sl_flags |= SL_PID_VALID; 2485 bcopy(sli->sli_pid, sl->sl_product_id, 16); 2486 } 2487 if (sli->sli_flags & SLI_REV_VALID) { 2488 sl->sl_flags |= SL_REV_VALID; 2489 bcopy(sli->sli_rev, sl->sl_revision, 4); 2490 } 2491 if (sli->sli_flags & SLI_WRITEBACK_CACHE_DISABLE) { 2492 sl->sl_flags |= SL_WRITEBACK_CACHE_DISABLE; 2493 } 2494 sim_sli_loaded: 2495 if ((sl->sl_flags & SL_SHARED_META) == 0) { 2496 data_opened = 0; 2497 } else { 2498 data_opened = 1; 2499 sl->sl_data_filename = sl->sl_meta_filename; 2500 sl->sl_data_vp = sl->sl_meta_vp; 2501 sl->sl_data_vtype = sl->sl_meta_vtype; 2502 } 2503 2504 sret = sbd_pgr_meta_load(sl); 2505 if (sret != SBD_SUCCESS) { 2506 *err_ret = SBD_RET_NO_META; 2507 ret = EIO; 2508 goto sim_err_out; 2509 } 2510 2511 ret = sbd_open_data_file(sl, err_ret, 1, data_opened, 0); 2512 if (ret) { 2513 goto sim_err_out; 2514 } 2515 2516 /* 2517 * set write cache disable on the device 2518 * Note: this shouldn't fail on import unless the cache capabilities 2519 * of the device changed. If that happened, modify will need to 2520 * be used to set the cache flag appropriately after import is done. 2521 */ 2522 if (sl->sl_flags & SL_WRITEBACK_CACHE_DISABLE) { 2523 (void) sbd_wcd_set(1, sl); 2524 wcd = 1; 2525 /* 2526 * if not explicitly set, attempt to set it to enable, if that fails 2527 * get the current setting and use that 2528 */ 2529 } else { 2530 sret = sbd_wcd_set(0, sl); 2531 if (sret != SBD_SUCCESS) { 2532 sbd_wcd_get(&wcd, sl); 2533 } 2534 } 2535 2536 if (wcd) { 2537 sl->sl_flags |= SL_WRITEBACK_CACHE_DISABLE | 2538 SL_SAVED_WRITE_CACHE_DISABLE; 2539 } 2540 2541 /* we're only loading the metadata */ 2542 if (!no_register) { 2543 ret = sbd_populate_and_register_lu(sl, err_ret); 2544 if (ret) { 2545 goto sim_err_out; 2546 } 2547 atomic_inc_32(&sbd_lu_count); 2548 } 2549 2550 bcopy(sl->sl_device_id + 4, ilu->ilu_ret_guid, 16); 2551 sl->sl_trans_op = SL_OP_NONE; 2552 2553 if (sli) { 2554 kmem_free(sli, sli->sli_sms_header.sms_size); 2555 sli = NULL; 2556 } 2557 if (sli_buf_copy) { 2558 kmem_free(sli_buf_copy, sli_buf_sz + 1); 2559 sli_buf_copy = NULL; 2560 } 2561 if (no_register && !standby) { 2562 *slr = sl; 2563 } 2564 2565 /* 2566 * if this was imported from standby, set the access state 2567 * to active. 2568 */ 2569 if (standby) { 2570 sbd_it_data_t *it; 2571 mutex_enter(&sl->sl_lock); 2572 sl->sl_access_state = SBD_LU_ACTIVE; 2573 for (it = sl->sl_it_list; it != NULL; 2574 it = it->sbd_it_next) { 2575 it->sbd_it_ua_conditions |= 2576 SBD_UA_ASYMMETRIC_ACCESS_CHANGED; 2577 it->sbd_it_ua_conditions |= SBD_UA_POR; 2578 it->sbd_it_flags |= SBD_IT_PGR_CHECK_FLAG; 2579 } 2580 mutex_exit(&sl->sl_lock); 2581 /* call set access state */ 2582 stret = stmf_set_lu_access(lu, STMF_LU_ACTIVE); 2583 if (stret != STMF_SUCCESS) { 2584 *err_ret = SBD_RET_ACCESS_STATE_FAILED; 2585 sl->sl_access_state = SBD_LU_STANDBY; 2586 goto sim_err_out; 2587 } 2588 if (sl->sl_alias) { 2589 lu->lu_alias = sl->sl_alias; 2590 } else { 2591 lu->lu_alias = sl->sl_name; 2592 } 2593 } 2594 sl->sl_access_state = SBD_LU_ACTIVE; 2595 return (0); 2596 2597 sim_err_out: 2598 if (sli) { 2599 kmem_free(sli, sli->sli_sms_header.sms_size); 2600 sli = NULL; 2601 } 2602 if (sli_buf_copy) { 2603 kmem_free(sli_buf_copy, sli_buf_sz + 1); 2604 sli_buf_copy = NULL; 2605 } 2606 2607 if (standby) { 2608 *err_ret = SBD_RET_ACCESS_STATE_FAILED; 2609 sl->sl_trans_op = SL_OP_NONE; 2610 return (EIO); 2611 } else { 2612 return (sbd_close_delete_lu(sl, ret)); 2613 } 2614 } 2615 2616 int 2617 sbd_modify_lu(sbd_modify_lu_t *mlu, int struct_sz, uint32_t *err_ret) 2618 { 2619 sbd_lu_t *sl = NULL; 2620 uint16_t alias_sz; 2621 int ret = 0; 2622 sbd_it_data_t *it; 2623 sbd_status_t sret; 2624 uint64_t old_size; 2625 int modify_unregistered = 0; 2626 int ua = 0; 2627 sbd_import_lu_t *ilu; 2628 stmf_lu_t *lu; 2629 uint32_t ilu_sz; 2630 uint32_t sz; 2631 2632 sz = struct_sz - sizeof (*mlu) + 8 + 1; 2633 2634 /* if there is data in the buf, null terminate it */ 2635 if (struct_sz > sizeof (*mlu)) { 2636 mlu->mlu_buf[struct_sz - sizeof (*mlu) + 8 - 1] = 0; 2637 } 2638 2639 *err_ret = 0; 2640 2641 /* Lets validate offsets */ 2642 if (((mlu->mlu_alias_valid) && 2643 (mlu->mlu_alias_off >= sz)) || 2644 ((mlu->mlu_mgmt_url_valid) && 2645 (mlu->mlu_mgmt_url_off >= sz)) || 2646 (mlu->mlu_by_fname) && 2647 (mlu->mlu_fname_off >= sz)) { 2648 return (EINVAL); 2649 } 2650 2651 /* 2652 * We'll look for the device but if we don't find it registered, 2653 * we'll still try to modify the unregistered device. 2654 */ 2655 if (mlu->mlu_by_guid) { 2656 sret = sbd_find_and_lock_lu(mlu->mlu_input_guid, NULL, 2657 SL_OP_MODIFY_LU, &sl); 2658 } else if (mlu->mlu_by_fname) { 2659 sret = sbd_find_and_lock_lu(NULL, 2660 (uint8_t *)&(mlu->mlu_buf[mlu->mlu_fname_off]), 2661 SL_OP_MODIFY_LU, &sl); 2662 } else { 2663 return (EINVAL); 2664 } 2665 2666 2667 if (sret != SBD_SUCCESS) { 2668 if (sret == SBD_BUSY) { 2669 *err_ret = SBD_RET_LU_BUSY; 2670 return (EBUSY); 2671 } else if (sret != SBD_NOT_FOUND) { 2672 return (EIO); 2673 } else if (!mlu->mlu_by_fname) { 2674 return (EINVAL); 2675 } 2676 /* Okay, try to import the device */ 2677 struct_sz = max(8, strlen(&(mlu->mlu_buf[mlu->mlu_fname_off])) 2678 + 1); 2679 struct_sz += sizeof (sbd_import_lu_t) - 8; 2680 ilu_sz = struct_sz; 2681 ilu = (sbd_import_lu_t *)kmem_zalloc(ilu_sz, KM_SLEEP); 2682 ilu->ilu_struct_size = struct_sz; 2683 (void) strcpy(ilu->ilu_meta_fname, 2684 &(mlu->mlu_buf[mlu->mlu_fname_off])); 2685 ret = sbd_import_lu(ilu, struct_sz, err_ret, 1, &sl); 2686 kmem_free(ilu, ilu_sz); 2687 if (ret != SBD_SUCCESS) { 2688 return (ENOENT); 2689 } 2690 modify_unregistered = 1; 2691 } 2692 2693 if (sl->sl_access_state != SBD_LU_ACTIVE) { 2694 *err_ret = SBD_RET_ACCESS_STATE_FAILED; 2695 ret = EINVAL; 2696 goto smm_err_out; 2697 } 2698 2699 /* check for write cache change */ 2700 if (mlu->mlu_writeback_cache_disable_valid) { 2701 /* set wce on device */ 2702 sret = sbd_wcd_set(mlu->mlu_writeback_cache_disable, sl); 2703 if (!mlu->mlu_writeback_cache_disable && sret != SBD_SUCCESS) { 2704 *err_ret = SBD_RET_WRITE_CACHE_SET_FAILED; 2705 ret = EFAULT; 2706 goto smm_err_out; 2707 } 2708 mutex_enter(&sl->sl_lock); 2709 if (!mlu->mlu_writeback_cache_disable) { 2710 if (sl->sl_flags & SL_WRITEBACK_CACHE_DISABLE) { 2711 ua = 1; 2712 sl->sl_flags &= ~SL_WRITEBACK_CACHE_DISABLE; 2713 sl->sl_flags &= ~SL_SAVED_WRITE_CACHE_DISABLE; 2714 } 2715 } else { 2716 if ((sl->sl_flags & SL_WRITEBACK_CACHE_DISABLE) == 0) { 2717 ua = 1; 2718 sl->sl_flags |= SL_WRITEBACK_CACHE_DISABLE; 2719 sl->sl_flags |= SL_SAVED_WRITE_CACHE_DISABLE; 2720 } 2721 } 2722 for (it = sl->sl_it_list; ua && it != NULL; 2723 it = it->sbd_it_next) { 2724 it->sbd_it_ua_conditions |= 2725 SBD_UA_MODE_PARAMETERS_CHANGED; 2726 } 2727 mutex_exit(&sl->sl_lock); 2728 } 2729 ua = 0; 2730 2731 if (mlu->mlu_alias_valid) { 2732 alias_sz = strlen((char *)mlu->mlu_buf + 2733 mlu->mlu_alias_off) + 1; 2734 /* 2735 * Use the allocated buffer or alloc a new one. 2736 * Don't copy into sl_alias if sl_alias_alloc_size is 0 2737 * otherwise or you'll be writing over the data/metadata 2738 * filename. 2739 */ 2740 mutex_enter(&sl->sl_lock); 2741 if (sl->sl_alias_alloc_size > 0 && 2742 sl->sl_alias_alloc_size < alias_sz) { 2743 kmem_free(sl->sl_alias, 2744 sl->sl_alias_alloc_size); 2745 sl->sl_alias_alloc_size = 0; 2746 } 2747 if (sl->sl_alias_alloc_size == 0) { 2748 sl->sl_alias = kmem_alloc(alias_sz, KM_SLEEP); 2749 sl->sl_alias_alloc_size = alias_sz; 2750 } 2751 (void) strcpy(sl->sl_alias, (char *)mlu->mlu_buf + 2752 mlu->mlu_alias_off); 2753 lu = sl->sl_lu; 2754 lu->lu_alias = sl->sl_alias; 2755 mutex_exit(&sl->sl_lock); 2756 } 2757 2758 if (mlu->mlu_mgmt_url_valid) { 2759 uint16_t url_sz; 2760 2761 url_sz = strlen((char *)mlu->mlu_buf + mlu->mlu_mgmt_url_off); 2762 if (url_sz > 0) 2763 url_sz++; 2764 2765 mutex_enter(&sl->sl_lock); 2766 if (sl->sl_mgmt_url_alloc_size > 0 && 2767 (url_sz == 0 || sl->sl_mgmt_url_alloc_size < url_sz)) { 2768 kmem_free(sl->sl_mgmt_url, sl->sl_mgmt_url_alloc_size); 2769 sl->sl_mgmt_url = NULL; 2770 sl->sl_mgmt_url_alloc_size = 0; 2771 } 2772 if (url_sz > 0) { 2773 if (sl->sl_mgmt_url_alloc_size == 0) { 2774 sl->sl_mgmt_url = kmem_alloc(url_sz, KM_SLEEP); 2775 sl->sl_mgmt_url_alloc_size = url_sz; 2776 } 2777 (void) strcpy(sl->sl_mgmt_url, (char *)mlu->mlu_buf + 2778 mlu->mlu_mgmt_url_off); 2779 } 2780 for (it = sl->sl_it_list; it != NULL; 2781 it = it->sbd_it_next) { 2782 it->sbd_it_ua_conditions |= 2783 SBD_UA_MODE_PARAMETERS_CHANGED; 2784 } 2785 mutex_exit(&sl->sl_lock); 2786 } 2787 2788 if (mlu->mlu_write_protected_valid) { 2789 mutex_enter(&sl->sl_lock); 2790 if (mlu->mlu_write_protected) { 2791 if ((sl->sl_flags & SL_WRITE_PROTECTED) == 0) { 2792 ua = 1; 2793 sl->sl_flags |= SL_WRITE_PROTECTED; 2794 } 2795 } else { 2796 if (sl->sl_flags & SL_WRITE_PROTECTED) { 2797 ua = 1; 2798 sl->sl_flags &= ~SL_WRITE_PROTECTED; 2799 } 2800 } 2801 for (it = sl->sl_it_list; ua && it != NULL; 2802 it = it->sbd_it_next) { 2803 it->sbd_it_ua_conditions |= 2804 SBD_UA_MODE_PARAMETERS_CHANGED; 2805 } 2806 mutex_exit(&sl->sl_lock); 2807 } 2808 2809 if (mlu->mlu_lu_size_valid) { 2810 /* 2811 * validate lu size and set 2812 * For open file only (registered lu) 2813 */ 2814 mutex_enter(&sl->sl_lock); 2815 old_size = sl->sl_lu_size; 2816 sl->sl_lu_size = mlu->mlu_lu_size; 2817 mutex_exit(&sl->sl_lock); 2818 ret = sbd_open_data_file(sl, err_ret, 1, 1, 1); 2819 if (ret) { 2820 mutex_enter(&sl->sl_lock); 2821 sl->sl_lu_size = old_size; 2822 mutex_exit(&sl->sl_lock); 2823 goto smm_err_out; 2824 } 2825 if (old_size != mlu->mlu_lu_size) { 2826 mutex_enter(&sl->sl_lock); 2827 for (it = sl->sl_it_list; it != NULL; 2828 it = it->sbd_it_next) { 2829 it->sbd_it_ua_conditions |= 2830 SBD_UA_CAPACITY_CHANGED; 2831 } 2832 mutex_exit(&sl->sl_lock); 2833 } 2834 } 2835 2836 if (sbd_write_lu_info(sl) != SBD_SUCCESS) { 2837 *err_ret = SBD_RET_META_CREATION_FAILED; 2838 ret = EIO; 2839 } 2840 2841 smm_err_out: 2842 if (modify_unregistered) { 2843 (void) sbd_close_delete_lu(sl, 0); 2844 } else { 2845 sl->sl_trans_op = SL_OP_NONE; 2846 } 2847 return (ret); 2848 } 2849 2850 int 2851 sbd_set_global_props(sbd_global_props_t *mlu, int struct_sz, 2852 uint32_t *err_ret) 2853 { 2854 sbd_lu_t *sl = NULL; 2855 int ret = 0; 2856 sbd_it_data_t *it; 2857 uint32_t sz; 2858 2859 sz = struct_sz - sizeof (*mlu) + 8 + 1; 2860 2861 /* if there is data in the buf, null terminate it */ 2862 if (struct_sz > sizeof (*mlu)) { 2863 mlu->mlu_buf[struct_sz - sizeof (*mlu) + 8 - 1] = 0; 2864 } 2865 2866 *err_ret = 0; 2867 2868 /* Lets validate offsets */ 2869 if (((mlu->mlu_mgmt_url_valid) && 2870 (mlu->mlu_mgmt_url_off >= sz))) { 2871 return (EINVAL); 2872 } 2873 2874 if (mlu->mlu_mgmt_url_valid) { 2875 uint16_t url_sz; 2876 2877 url_sz = strlen((char *)mlu->mlu_buf + mlu->mlu_mgmt_url_off); 2878 if (url_sz > 0) 2879 url_sz++; 2880 2881 rw_enter(&sbd_global_prop_lock, RW_WRITER); 2882 if (sbd_mgmt_url_alloc_size > 0 && 2883 (url_sz == 0 || sbd_mgmt_url_alloc_size < url_sz)) { 2884 kmem_free(sbd_mgmt_url, sbd_mgmt_url_alloc_size); 2885 sbd_mgmt_url = NULL; 2886 sbd_mgmt_url_alloc_size = 0; 2887 } 2888 if (url_sz > 0) { 2889 if (sbd_mgmt_url_alloc_size == 0) { 2890 sbd_mgmt_url = kmem_alloc(url_sz, KM_SLEEP); 2891 sbd_mgmt_url_alloc_size = url_sz; 2892 } 2893 (void) strcpy(sbd_mgmt_url, (char *)mlu->mlu_buf + 2894 mlu->mlu_mgmt_url_off); 2895 } 2896 /* 2897 * check each lu to determine whether a UA is needed. 2898 */ 2899 mutex_enter(&sbd_lock); 2900 for (sl = sbd_lu_list; sl; sl = sl->sl_next) { 2901 if (sl->sl_mgmt_url) { 2902 continue; 2903 } 2904 mutex_enter(&sl->sl_lock); 2905 for (it = sl->sl_it_list; it != NULL; 2906 it = it->sbd_it_next) { 2907 it->sbd_it_ua_conditions |= 2908 SBD_UA_MODE_PARAMETERS_CHANGED; 2909 } 2910 mutex_exit(&sl->sl_lock); 2911 } 2912 mutex_exit(&sbd_lock); 2913 rw_exit(&sbd_global_prop_lock); 2914 } 2915 return (ret); 2916 } 2917 2918 /* ARGSUSED */ 2919 int 2920 sbd_delete_locked_lu(sbd_lu_t *sl, uint32_t *err_ret, 2921 stmf_state_change_info_t *ssi) 2922 { 2923 int i; 2924 stmf_status_t ret; 2925 2926 if ((sl->sl_state == STMF_STATE_OFFLINE) && 2927 !sl->sl_state_not_acked) { 2928 goto sdl_do_dereg; 2929 } 2930 2931 if ((sl->sl_state != STMF_STATE_ONLINE) || 2932 sl->sl_state_not_acked) { 2933 return (EBUSY); 2934 } 2935 2936 ret = stmf_ctl(STMF_CMD_LU_OFFLINE, sl->sl_lu, ssi); 2937 if ((ret != STMF_SUCCESS) && (ret != STMF_ALREADY)) { 2938 return (EBUSY); 2939 } 2940 2941 for (i = 0; i < 500; i++) { 2942 if ((sl->sl_state == STMF_STATE_OFFLINE) && 2943 !sl->sl_state_not_acked) { 2944 goto sdl_do_dereg; 2945 } 2946 delay(drv_usectohz(10000)); 2947 } 2948 return (EBUSY); 2949 2950 sdl_do_dereg:; 2951 if (stmf_deregister_lu(sl->sl_lu) != STMF_SUCCESS) 2952 return (EBUSY); 2953 atomic_dec_32(&sbd_lu_count); 2954 2955 return (sbd_close_delete_lu(sl, 0)); 2956 } 2957 2958 int 2959 sbd_delete_lu(sbd_delete_lu_t *dlu, int struct_sz, uint32_t *err_ret) 2960 { 2961 sbd_lu_t *sl; 2962 sbd_status_t sret; 2963 stmf_state_change_info_t ssi; 2964 int ret; 2965 2966 if (dlu->dlu_by_meta_name) { 2967 ((char *)dlu)[struct_sz - 1] = 0; 2968 sret = sbd_find_and_lock_lu(NULL, dlu->dlu_meta_name, 2969 SL_OP_DELETE_LU, &sl); 2970 } else { 2971 sret = sbd_find_and_lock_lu(dlu->dlu_guid, NULL, 2972 SL_OP_DELETE_LU, &sl); 2973 } 2974 if (sret != SBD_SUCCESS) { 2975 if (sret == SBD_BUSY) { 2976 *err_ret = SBD_RET_LU_BUSY; 2977 return (EBUSY); 2978 } else if (sret == SBD_NOT_FOUND) { 2979 *err_ret = SBD_RET_NOT_FOUND; 2980 return (ENOENT); 2981 } 2982 return (EIO); 2983 } 2984 2985 ssi.st_rflags = STMF_RFLAG_USER_REQUEST; 2986 ssi.st_additional_info = "sbd_delete_lu call (ioctl)"; 2987 ret = sbd_delete_locked_lu(sl, err_ret, &ssi); 2988 2989 if (ret) { 2990 /* Once its locked, no need to grab mutex again */ 2991 sl->sl_trans_op = SL_OP_NONE; 2992 } 2993 return (ret); 2994 } 2995 2996 sbd_status_t 2997 sbd_data_read(sbd_lu_t *sl, struct scsi_task *task, 2998 uint64_t offset, uint64_t size, uint8_t *buf) 2999 { 3000 int ret; 3001 long resid; 3002 3003 if ((offset + size) > sl->sl_lu_size) { 3004 return (SBD_IO_PAST_EOF); 3005 } 3006 3007 offset += sl->sl_data_offset; 3008 3009 if ((offset + size) > sl->sl_data_readable_size) { 3010 uint64_t store_end; 3011 if (offset > sl->sl_data_readable_size) { 3012 bzero(buf, size); 3013 return (SBD_SUCCESS); 3014 } 3015 store_end = sl->sl_data_readable_size - offset; 3016 bzero(buf + store_end, size - store_end); 3017 size = store_end; 3018 } 3019 3020 DTRACE_PROBE5(backing__store__read__start, sbd_lu_t *, sl, 3021 uint8_t *, buf, uint64_t, size, uint64_t, offset, 3022 scsi_task_t *, task); 3023 3024 /* 3025 * Don't proceed if the device has been closed 3026 * This can occur on an access state change to standby or 3027 * a delete. The writer lock is acquired before closing the 3028 * lu. 3029 */ 3030 rw_enter(&sl->sl_access_state_lock, RW_READER); 3031 if ((sl->sl_flags & SL_MEDIA_LOADED) == 0) { 3032 rw_exit(&sl->sl_access_state_lock); 3033 return (SBD_FAILURE); 3034 } 3035 ret = vn_rdwr(UIO_READ, sl->sl_data_vp, (caddr_t)buf, (ssize_t)size, 3036 (offset_t)offset, UIO_SYSSPACE, 0, RLIM64_INFINITY, CRED(), 3037 &resid); 3038 rw_exit(&sl->sl_access_state_lock); 3039 3040 DTRACE_PROBE6(backing__store__read__end, sbd_lu_t *, sl, 3041 uint8_t *, buf, uint64_t, size, uint64_t, offset, 3042 int, ret, scsi_task_t *, task); 3043 3044 over_sl_data_read: 3045 if (ret || resid) { 3046 stmf_trace(0, "UIO_READ failed, ret = %d, resid = %d", ret, 3047 resid); 3048 return (SBD_FAILURE); 3049 } 3050 3051 return (SBD_SUCCESS); 3052 } 3053 3054 sbd_status_t 3055 sbd_data_write(sbd_lu_t *sl, struct scsi_task *task, 3056 uint64_t offset, uint64_t size, uint8_t *buf) 3057 { 3058 int ret; 3059 long resid; 3060 sbd_status_t sret = SBD_SUCCESS; 3061 int ioflag; 3062 3063 if ((offset + size) > sl->sl_lu_size) { 3064 return (SBD_IO_PAST_EOF); 3065 } 3066 3067 offset += sl->sl_data_offset; 3068 3069 if ((sl->sl_flags & SL_WRITEBACK_CACHE_DISABLE) && 3070 (sl->sl_flags & SL_FLUSH_ON_DISABLED_WRITECACHE)) { 3071 ioflag = FSYNC; 3072 } else { 3073 ioflag = 0; 3074 } 3075 3076 DTRACE_PROBE5(backing__store__write__start, sbd_lu_t *, sl, 3077 uint8_t *, buf, uint64_t, size, uint64_t, offset, 3078 scsi_task_t *, task); 3079 3080 /* 3081 * Don't proceed if the device has been closed 3082 * This can occur on an access state change to standby or 3083 * a delete. The writer lock is acquired before closing the 3084 * lu. 3085 */ 3086 rw_enter(&sl->sl_access_state_lock, RW_READER); 3087 if ((sl->sl_flags & SL_MEDIA_LOADED) == 0) { 3088 rw_exit(&sl->sl_access_state_lock); 3089 return (SBD_FAILURE); 3090 } 3091 ret = vn_rdwr(UIO_WRITE, sl->sl_data_vp, (caddr_t)buf, (ssize_t)size, 3092 (offset_t)offset, UIO_SYSSPACE, ioflag, RLIM64_INFINITY, CRED(), 3093 &resid); 3094 rw_exit(&sl->sl_access_state_lock); 3095 3096 DTRACE_PROBE6(backing__store__write__end, sbd_lu_t *, sl, 3097 uint8_t *, buf, uint64_t, size, uint64_t, offset, 3098 int, ret, scsi_task_t *, task); 3099 3100 if ((ret == 0) && (resid == 0) && 3101 (sl->sl_flags & SL_WRITEBACK_CACHE_DISABLE) && 3102 (sl->sl_flags & SL_FLUSH_ON_DISABLED_WRITECACHE)) { 3103 sret = sbd_flush_data_cache(sl, 1); 3104 } 3105 over_sl_data_write: 3106 3107 if ((ret || resid) || (sret != SBD_SUCCESS)) { 3108 return (SBD_FAILURE); 3109 } else if ((offset + size) > sl->sl_data_readable_size) { 3110 uint64_t old_size, new_size; 3111 3112 do { 3113 old_size = sl->sl_data_readable_size; 3114 if ((offset + size) <= old_size) 3115 break; 3116 new_size = offset + size; 3117 } while (atomic_cas_64(&sl->sl_data_readable_size, old_size, 3118 new_size) != old_size); 3119 } 3120 3121 return (SBD_SUCCESS); 3122 } 3123 3124 int 3125 sbd_get_global_props(sbd_global_props_t *oslp, uint32_t oslp_sz, 3126 uint32_t *err_ret) 3127 { 3128 uint32_t sz = 0; 3129 uint16_t off; 3130 3131 rw_enter(&sbd_global_prop_lock, RW_READER); 3132 if (sbd_mgmt_url) { 3133 sz += strlen(sbd_mgmt_url) + 1; 3134 } 3135 bzero(oslp, sizeof (*oslp) - 8); 3136 oslp->mlu_buf_size_needed = sz; 3137 3138 if (sz > (oslp_sz - sizeof (*oslp) + 8)) { 3139 *err_ret = SBD_RET_INSUFFICIENT_BUF_SPACE; 3140 rw_exit(&sbd_global_prop_lock); 3141 return (ENOMEM); 3142 } 3143 3144 off = 0; 3145 if (sbd_mgmt_url) { 3146 oslp->mlu_mgmt_url_valid = 1; 3147 oslp->mlu_mgmt_url_off = off; 3148 (void) strcpy((char *)&oslp->mlu_buf[off], sbd_mgmt_url); 3149 off += strlen(sbd_mgmt_url) + 1; 3150 } 3151 3152 rw_exit(&sbd_global_prop_lock); 3153 return (0); 3154 } 3155 3156 static int 3157 sbd_get_unmap_props(sbd_unmap_props_t *sup, 3158 sbd_unmap_props_t *osup, uint32_t *err_ret) 3159 { 3160 sbd_status_t sret; 3161 sbd_lu_t *sl = NULL; 3162 3163 if (sup->sup_guid_valid) { 3164 sret = sbd_find_and_lock_lu(sup->sup_guid, 3165 NULL, SL_OP_LU_PROPS, &sl); 3166 } else { 3167 sret = sbd_find_and_lock_lu(NULL, 3168 (uint8_t *)sup->sup_zvol_path, SL_OP_LU_PROPS, 3169 &sl); 3170 } 3171 if (sret != SBD_SUCCESS) { 3172 if (sret == SBD_BUSY) { 3173 *err_ret = SBD_RET_LU_BUSY; 3174 return (EBUSY); 3175 } else if (sret == SBD_NOT_FOUND) { 3176 *err_ret = SBD_RET_NOT_FOUND; 3177 return (ENOENT); 3178 } 3179 return (EIO); 3180 } 3181 3182 sup->sup_found_lu = 1; 3183 sup->sup_guid_valid = 1; 3184 bcopy(sl->sl_device_id + 4, sup->sup_guid, 16); 3185 if (sl->sl_flags & SL_UNMAP_ENABLED) 3186 sup->sup_unmap_enabled = 1; 3187 else 3188 sup->sup_unmap_enabled = 0; 3189 3190 *osup = *sup; 3191 sl->sl_trans_op = SL_OP_NONE; 3192 3193 return (0); 3194 } 3195 3196 int 3197 sbd_get_lu_props(sbd_lu_props_t *islp, uint32_t islp_sz, 3198 sbd_lu_props_t *oslp, uint32_t oslp_sz, uint32_t *err_ret) 3199 { 3200 sbd_status_t sret; 3201 sbd_lu_t *sl = NULL; 3202 uint32_t sz; 3203 uint16_t off; 3204 3205 if (islp->slp_input_guid) { 3206 sret = sbd_find_and_lock_lu(islp->slp_guid, NULL, 3207 SL_OP_LU_PROPS, &sl); 3208 } else { 3209 ((char *)islp)[islp_sz - 1] = 0; 3210 sret = sbd_find_and_lock_lu(NULL, islp->slp_buf, 3211 SL_OP_LU_PROPS, &sl); 3212 } 3213 if (sret != SBD_SUCCESS) { 3214 if (sret == SBD_BUSY) { 3215 *err_ret = SBD_RET_LU_BUSY; 3216 return (EBUSY); 3217 } else if (sret == SBD_NOT_FOUND) { 3218 *err_ret = SBD_RET_NOT_FOUND; 3219 return (ENOENT); 3220 } 3221 return (EIO); 3222 } 3223 3224 sz = strlen(sl->sl_name) + 1; 3225 if ((sl->sl_flags & (SL_ZFS_META | SL_SHARED_META)) == 0) { 3226 if (sl->sl_data_filename) { 3227 sz += strlen(sl->sl_data_filename) + 1; 3228 } 3229 } 3230 sz += sl->sl_serial_no_size; 3231 if (sl->sl_alias) { 3232 sz += strlen(sl->sl_alias) + 1; 3233 } 3234 3235 rw_enter(&sbd_global_prop_lock, RW_READER); 3236 if (sl->sl_mgmt_url) { 3237 sz += strlen(sl->sl_mgmt_url) + 1; 3238 } else if (sbd_mgmt_url) { 3239 sz += strlen(sbd_mgmt_url) + 1; 3240 } 3241 bzero(oslp, sizeof (*oslp) - 8); 3242 oslp->slp_buf_size_needed = sz; 3243 3244 if (sz > (oslp_sz - sizeof (*oslp) + 8)) { 3245 sl->sl_trans_op = SL_OP_NONE; 3246 *err_ret = SBD_RET_INSUFFICIENT_BUF_SPACE; 3247 rw_exit(&sbd_global_prop_lock); 3248 return (ENOMEM); 3249 } 3250 3251 off = 0; 3252 (void) strcpy((char *)oslp->slp_buf, sl->sl_name); 3253 oslp->slp_meta_fname_off = off; 3254 off += strlen(sl->sl_name) + 1; 3255 if ((sl->sl_flags & (SL_ZFS_META | SL_SHARED_META)) == 0) { 3256 oslp->slp_meta_fname_valid = 1; 3257 oslp->slp_separate_meta = 1; 3258 if (sl->sl_data_filename) { 3259 oslp->slp_data_fname_valid = 1; 3260 oslp->slp_data_fname_off = off; 3261 (void) strcpy((char *)&oslp->slp_buf[off], 3262 sl->sl_data_filename); 3263 off += strlen(sl->sl_data_filename) + 1; 3264 } 3265 } else { 3266 oslp->slp_data_fname_valid = 1; 3267 oslp->slp_data_fname_off = oslp->slp_meta_fname_off; 3268 if (sl->sl_flags & SL_ZFS_META) { 3269 oslp->slp_zfs_meta = 1; 3270 } 3271 } 3272 if (sl->sl_alias) { 3273 oslp->slp_alias_valid = 1; 3274 oslp->slp_alias_off = off; 3275 (void) strcpy((char *)&oslp->slp_buf[off], sl->sl_alias); 3276 off += strlen(sl->sl_alias) + 1; 3277 } 3278 if (sl->sl_mgmt_url) { 3279 oslp->slp_mgmt_url_valid = 1; 3280 oslp->slp_mgmt_url_off = off; 3281 (void) strcpy((char *)&oslp->slp_buf[off], sl->sl_mgmt_url); 3282 off += strlen(sl->sl_mgmt_url) + 1; 3283 } else if (sbd_mgmt_url) { 3284 oslp->slp_mgmt_url_valid = 1; 3285 oslp->slp_mgmt_url_off = off; 3286 (void) strcpy((char *)&oslp->slp_buf[off], sbd_mgmt_url); 3287 off += strlen(sbd_mgmt_url) + 1; 3288 } 3289 if (sl->sl_serial_no_size) { 3290 oslp->slp_serial_off = off; 3291 bcopy(sl->sl_serial_no, &oslp->slp_buf[off], 3292 sl->sl_serial_no_size); 3293 oslp->slp_serial_size = sl->sl_serial_no_size; 3294 oslp->slp_serial_valid = 1; 3295 off += sl->sl_serial_no_size; 3296 } 3297 3298 oslp->slp_lu_size = sl->sl_lu_size; 3299 oslp->slp_blksize = ((uint16_t)1) << sl->sl_data_blocksize_shift; 3300 3301 oslp->slp_access_state = sl->sl_access_state; 3302 3303 if (sl->sl_flags & SL_VID_VALID) { 3304 oslp->slp_lu_vid = 1; 3305 bcopy(sl->sl_vendor_id, oslp->slp_vid, 8); 3306 } else { 3307 bcopy(sbd_vendor_id, oslp->slp_vid, 8); 3308 } 3309 if (sl->sl_flags & SL_PID_VALID) { 3310 oslp->slp_lu_pid = 1; 3311 bcopy(sl->sl_product_id, oslp->slp_pid, 16); 3312 } else { 3313 bcopy(sbd_product_id, oslp->slp_pid, 16); 3314 } 3315 if (sl->sl_flags & SL_REV_VALID) { 3316 oslp->slp_lu_rev = 1; 3317 bcopy(sl->sl_revision, oslp->slp_rev, 4); 3318 } else { 3319 bcopy(sbd_revision, oslp->slp_rev, 4); 3320 } 3321 bcopy(sl->sl_device_id + 4, oslp->slp_guid, 16); 3322 3323 if (sl->sl_flags & SL_WRITEBACK_CACHE_DISABLE) 3324 oslp->slp_writeback_cache_disable_cur = 1; 3325 if (sl->sl_flags & SL_SAVED_WRITE_CACHE_DISABLE) 3326 oslp->slp_writeback_cache_disable_saved = 1; 3327 if (sl->sl_flags & SL_WRITE_PROTECTED) 3328 oslp->slp_write_protected = 1; 3329 3330 sl->sl_trans_op = SL_OP_NONE; 3331 3332 rw_exit(&sbd_global_prop_lock); 3333 return (0); 3334 } 3335 3336 /* 3337 * Returns an allocated string with the "<pool>/..." form of the zvol name. 3338 */ 3339 static char * 3340 sbd_get_zvol_name(sbd_lu_t *sl) 3341 { 3342 char *src; 3343 char *p; 3344 3345 if (sl->sl_data_filename) 3346 src = sl->sl_data_filename; 3347 else 3348 src = sl->sl_meta_filename; 3349 /* There has to be a better way */ 3350 if (SBD_IS_ZVOL(src) != 0) { 3351 ASSERT(0); 3352 } 3353 src += 14; /* Past /dev/zvol/dsk/ */ 3354 if (*src == '/') 3355 src++; /* or /dev/zvol/rdsk/ */ 3356 p = (char *)kmem_alloc(strlen(src) + 1, KM_SLEEP); 3357 (void) strcpy(p, src); 3358 return (p); 3359 } 3360 3361 /* 3362 * this function creates a local metadata zvol property 3363 */ 3364 sbd_status_t 3365 sbd_create_zfs_meta_object(sbd_lu_t *sl) 3366 { 3367 /* 3368 * -allocate 1/2 the property size, the zfs property 3369 * is 8k in size and stored as ascii hex string, all 3370 * we needed is 4k buffer to store the binary data. 3371 * -initialize reader/write lock 3372 */ 3373 if ((sl->sl_zfs_meta = kmem_zalloc(ZAP_MAXVALUELEN / 2, KM_SLEEP)) 3374 == NULL) 3375 return (SBD_FAILURE); 3376 rw_init(&sl->sl_zfs_meta_lock, NULL, RW_DRIVER, NULL); 3377 return (SBD_SUCCESS); 3378 } 3379 3380 char 3381 sbd_ctoi(char c) 3382 { 3383 if ((c >= '0') && (c <= '9')) 3384 c -= '0'; 3385 else if ((c >= 'A') && (c <= 'F')) 3386 c = c - 'A' + 10; 3387 else if ((c >= 'a') && (c <= 'f')) 3388 c = c - 'a' + 10; 3389 else 3390 c = -1; 3391 return (c); 3392 } 3393 3394 /* 3395 * read zvol property and convert to binary 3396 */ 3397 sbd_status_t 3398 sbd_open_zfs_meta(sbd_lu_t *sl) 3399 { 3400 char *meta = NULL, cl, ch; 3401 int i; 3402 char *tmp, *ptr; 3403 uint64_t rc = SBD_SUCCESS; 3404 int len; 3405 char *file; 3406 3407 if (sl->sl_zfs_meta == NULL) { 3408 if (sbd_create_zfs_meta_object(sl) == SBD_FAILURE) 3409 return (SBD_FAILURE); 3410 } else { 3411 bzero(sl->sl_zfs_meta, (ZAP_MAXVALUELEN / 2)); 3412 } 3413 3414 rw_enter(&sl->sl_zfs_meta_lock, RW_WRITER); 3415 file = sbd_get_zvol_name(sl); 3416 if (sbd_zvolget(file, &meta)) { 3417 rc = SBD_FAILURE; 3418 goto done; 3419 } 3420 tmp = meta; 3421 /* convert ascii hex to binary meta */ 3422 len = strlen(meta); 3423 ptr = sl->sl_zfs_meta; 3424 for (i = 0; i < len; i += 2) { 3425 ch = sbd_ctoi(*tmp++); 3426 cl = sbd_ctoi(*tmp++); 3427 if (ch == -1 || cl == -1) { 3428 rc = SBD_FAILURE; 3429 break; 3430 } 3431 *ptr++ = (ch << 4) + cl; 3432 } 3433 done: 3434 rw_exit(&sl->sl_zfs_meta_lock); 3435 if (meta) 3436 kmem_free(meta, len + 1); 3437 kmem_free(file, strlen(file) + 1); 3438 return (rc); 3439 } 3440 3441 sbd_status_t 3442 sbd_read_zfs_meta(sbd_lu_t *sl, uint8_t *buf, uint64_t sz, uint64_t off) 3443 { 3444 ASSERT(sl->sl_zfs_meta); 3445 rw_enter(&sl->sl_zfs_meta_lock, RW_READER); 3446 bcopy(&sl->sl_zfs_meta[off], buf, sz); 3447 rw_exit(&sl->sl_zfs_meta_lock); 3448 return (SBD_SUCCESS); 3449 } 3450 3451 sbd_status_t 3452 sbd_write_zfs_meta(sbd_lu_t *sl, uint8_t *buf, uint64_t sz, uint64_t off) 3453 { 3454 ASSERT(sl->sl_zfs_meta); 3455 if ((off + sz) > (ZAP_MAXVALUELEN / 2 - 1)) { 3456 return (SBD_META_CORRUPTED); 3457 } 3458 if ((off + sz) > sl->sl_meta_size_used) { 3459 sl->sl_meta_size_used = off + sz; 3460 if (sl->sl_total_meta_size < sl->sl_meta_size_used) { 3461 uint64_t meta_align = 3462 (((uint64_t)1) << sl->sl_meta_blocksize_shift) - 1; 3463 sl->sl_total_meta_size = (sl->sl_meta_size_used + 3464 meta_align) & (~meta_align); 3465 } 3466 } 3467 rw_enter(&sl->sl_zfs_meta_lock, RW_WRITER); 3468 bcopy(buf, &sl->sl_zfs_meta[off], sz); 3469 rw_exit(&sl->sl_zfs_meta_lock); 3470 /* 3471 * During creation of a logical unit, sbd_update_zfs_prop will be 3472 * called separately to avoid multiple calls as each meta section 3473 * create/update will result in a call to sbd_write_zfs_meta(). 3474 * We only need to update the zvol once during create. 3475 */ 3476 mutex_enter(&sl->sl_lock); 3477 if (sl->sl_trans_op != SL_OP_CREATE_REGISTER_LU) { 3478 mutex_exit(&sl->sl_lock); 3479 return (sbd_update_zfs_prop(sl)); 3480 } 3481 mutex_exit(&sl->sl_lock); 3482 return (SBD_SUCCESS); 3483 } 3484 3485 sbd_status_t 3486 sbd_update_zfs_prop(sbd_lu_t *sl) 3487 { 3488 char *ptr, *ah_meta; 3489 char *dp = NULL; 3490 int i, num; 3491 char *file; 3492 sbd_status_t ret = SBD_SUCCESS; 3493 3494 ASSERT(sl->sl_zfs_meta); 3495 ptr = ah_meta = kmem_zalloc(ZAP_MAXVALUELEN, KM_SLEEP); 3496 rw_enter(&sl->sl_zfs_meta_lock, RW_READER); 3497 /* convert local copy to ascii hex */ 3498 dp = sl->sl_zfs_meta; 3499 for (i = 0; i < sl->sl_total_meta_size; i++, dp++) { 3500 num = ((*dp) >> 4) & 0xF; 3501 *ah_meta++ = (num < 10) ? (num + '0') : (num + ('a' - 10)); 3502 num = (*dp) & 0xF; 3503 *ah_meta++ = (num < 10) ? (num + '0') : (num + ('a' - 10)); 3504 } 3505 *ah_meta = NULL; 3506 file = sbd_get_zvol_name(sl); 3507 if (sbd_zvolset(file, (char *)ptr)) { 3508 ret = SBD_META_CORRUPTED; 3509 } 3510 rw_exit(&sl->sl_zfs_meta_lock); 3511 kmem_free(ptr, ZAP_MAXVALUELEN); 3512 kmem_free(file, strlen(file) + 1); 3513 return (ret); 3514 } 3515 3516 int 3517 sbd_is_zvol(char *path) 3518 { 3519 int is_zfs = 0; 3520 3521 if (SBD_IS_ZVOL(path) == 0) 3522 is_zfs = 1; 3523 3524 return (is_zfs); 3525 } 3526 3527 /* 3528 * set write cache disable 3529 * wcd - 1 = disable, 0 = enable 3530 */ 3531 sbd_status_t 3532 sbd_wcd_set(int wcd, sbd_lu_t *sl) 3533 { 3534 /* translate to wce bit */ 3535 int wce = wcd ? 0 : 1; 3536 int ret; 3537 sbd_status_t sret = SBD_SUCCESS; 3538 3539 mutex_enter(&sl->sl_lock); 3540 sl->sl_flags &= ~SL_WRITEBACK_CACHE_SET_UNSUPPORTED; 3541 3542 if (sl->sl_data_vp->v_type == VREG) { 3543 sl->sl_flags |= SL_FLUSH_ON_DISABLED_WRITECACHE; 3544 goto done; 3545 } 3546 3547 ret = VOP_IOCTL(sl->sl_data_vp, DKIOCSETWCE, (intptr_t)&wce, FKIOCTL, 3548 kcred, NULL, NULL); 3549 if (ret == 0) { 3550 sl->sl_flags &= ~SL_WRITEBACK_CACHE_SET_UNSUPPORTED; 3551 sl->sl_flags &= ~SL_FLUSH_ON_DISABLED_WRITECACHE; 3552 } else { 3553 sl->sl_flags |= SL_WRITEBACK_CACHE_SET_UNSUPPORTED; 3554 sl->sl_flags |= SL_FLUSH_ON_DISABLED_WRITECACHE; 3555 sret = SBD_FAILURE; 3556 goto done; 3557 } 3558 3559 done: 3560 mutex_exit(&sl->sl_lock); 3561 return (sret); 3562 } 3563 3564 /* 3565 * get write cache disable 3566 * wcd - 1 = disable, 0 = enable 3567 */ 3568 void 3569 sbd_wcd_get(int *wcd, sbd_lu_t *sl) 3570 { 3571 int wce; 3572 int ret; 3573 3574 if (sl->sl_data_vp->v_type == VREG) { 3575 *wcd = 0; 3576 return; 3577 } 3578 3579 ret = VOP_IOCTL(sl->sl_data_vp, DKIOCGETWCE, (intptr_t)&wce, FKIOCTL, 3580 kcred, NULL, NULL); 3581 /* if write cache get failed, assume disabled */ 3582 if (ret) { 3583 *wcd = 1; 3584 } else { 3585 /* translate to wcd bit */ 3586 *wcd = wce ? 0 : 1; 3587 } 3588 } 3589 3590 int 3591 sbd_zvolget(char *zvol_name, char **comstarprop) 3592 { 3593 ldi_handle_t zfs_lh; 3594 nvlist_t *nv = NULL, *nv2; 3595 zfs_cmd_t *zc; 3596 char *ptr; 3597 int size = 1024; 3598 int unused; 3599 int rc; 3600 3601 if ((rc = ldi_open_by_name("/dev/zfs", FREAD | FWRITE, kcred, 3602 &zfs_lh, sbd_zfs_ident)) != 0) { 3603 cmn_err(CE_WARN, "ldi_open %d", rc); 3604 return (ENXIO); 3605 } 3606 3607 zc = kmem_zalloc(sizeof (zfs_cmd_t), KM_SLEEP); 3608 (void) strlcpy(zc->zc_name, zvol_name, sizeof (zc->zc_name)); 3609 again: 3610 zc->zc_nvlist_dst = (uint64_t)(intptr_t)kmem_alloc(size, 3611 KM_SLEEP); 3612 zc->zc_nvlist_dst_size = size; 3613 rc = ldi_ioctl(zfs_lh, ZFS_IOC_OBJSET_STATS, (intptr_t)zc, 3614 FKIOCTL, kcred, &unused); 3615 /* 3616 * ENOMEM means the list is larger than what we've allocated 3617 * ldi_ioctl will fail with ENOMEM only once 3618 */ 3619 if (rc == ENOMEM) { 3620 int newsize; 3621 newsize = zc->zc_nvlist_dst_size; 3622 kmem_free((void *)(uintptr_t)zc->zc_nvlist_dst, size); 3623 size = newsize; 3624 goto again; 3625 } else if (rc != 0) { 3626 goto out; 3627 } 3628 rc = nvlist_unpack((char *)(uintptr_t)zc->zc_nvlist_dst, 3629 zc->zc_nvlist_dst_size, &nv, 0); 3630 ASSERT(rc == 0); /* nvlist_unpack should not fail */ 3631 if ((rc = nvlist_lookup_nvlist(nv, "stmf_sbd_lu", &nv2)) == 0) { 3632 rc = nvlist_lookup_string(nv2, ZPROP_VALUE, &ptr); 3633 if (rc != 0) { 3634 cmn_err(CE_WARN, "couldn't get value"); 3635 } else { 3636 *comstarprop = kmem_alloc(strlen(ptr) + 1, 3637 KM_SLEEP); 3638 (void) strcpy(*comstarprop, ptr); 3639 } 3640 } 3641 out: 3642 nvlist_free(nv); 3643 kmem_free((void *)(uintptr_t)zc->zc_nvlist_dst, size); 3644 kmem_free(zc, sizeof (zfs_cmd_t)); 3645 (void) ldi_close(zfs_lh, FREAD|FWRITE, kcred); 3646 3647 return (rc); 3648 } 3649 3650 int 3651 sbd_zvolset(char *zvol_name, char *comstarprop) 3652 { 3653 ldi_handle_t zfs_lh; 3654 nvlist_t *nv; 3655 char *packed = NULL; 3656 size_t len; 3657 zfs_cmd_t *zc; 3658 int unused; 3659 int rc; 3660 3661 if ((rc = ldi_open_by_name("/dev/zfs", FREAD | FWRITE, kcred, 3662 &zfs_lh, sbd_zfs_ident)) != 0) { 3663 cmn_err(CE_WARN, "ldi_open %d", rc); 3664 return (ENXIO); 3665 } 3666 (void) nvlist_alloc(&nv, NV_UNIQUE_NAME, KM_SLEEP); 3667 (void) nvlist_add_string(nv, "stmf_sbd_lu", comstarprop); 3668 if ((rc = nvlist_pack(nv, &packed, &len, NV_ENCODE_NATIVE, KM_SLEEP))) { 3669 goto out; 3670 } 3671 3672 zc = kmem_zalloc(sizeof (zfs_cmd_t), KM_SLEEP); 3673 (void) strlcpy(zc->zc_name, zvol_name, sizeof (zc->zc_name)); 3674 zc->zc_nvlist_src = (uint64_t)(intptr_t)packed; 3675 zc->zc_nvlist_src_size = len; 3676 rc = ldi_ioctl(zfs_lh, ZFS_IOC_SET_PROP, (intptr_t)zc, 3677 FKIOCTL, kcred, &unused); 3678 if (rc != 0) { 3679 cmn_err(CE_NOTE, "ioctl failed %d", rc); 3680 } 3681 kmem_free(zc, sizeof (zfs_cmd_t)); 3682 if (packed) 3683 kmem_free(packed, len); 3684 out: 3685 nvlist_free(nv); 3686 (void) ldi_close(zfs_lh, FREAD|FWRITE, kcred); 3687 return (rc); 3688 } 3689 3690 /* 3691 * Unmap a region in a volume. Currently only supported for zvols. 3692 */ 3693 int 3694 sbd_unmap(sbd_lu_t *sl, uint64_t offset, uint64_t length) 3695 { 3696 vnode_t *vp; 3697 int unused; 3698 dkioc_free_t df; 3699 3700 /* Right now, we only support UNMAP on zvols. */ 3701 if (!(sl->sl_flags & SL_ZFS_META)) 3702 return (EIO); 3703 3704 df.df_flags = (sl->sl_flags & SL_WRITEBACK_CACHE_DISABLE) ? 3705 DF_WAIT_SYNC : 0; 3706 df.df_start = offset; 3707 df.df_length = length; 3708 3709 /* Use the data vnode we have to send a fop_ioctl(). */ 3710 vp = sl->sl_data_vp; 3711 if (vp == NULL) { 3712 cmn_err(CE_WARN, "Cannot unmap - no vnode pointer."); 3713 return (EIO); 3714 } 3715 3716 return (VOP_IOCTL(vp, DKIOCFREE, (intptr_t)(&df), FKIOCTL, kcred, 3717 &unused, NULL)); 3718 }