Print this page
cstyle fixes
dsl_dataset_set_fsid_guid should use ZFS_SPACE_CHECK_RESERVED
dsl_dataset_set_fsid_guid _check and _sync func declared static,
removed from dsl_dataset.h
rewrite unique_valid
6333 ZFS should let the user specify or modify the fsid_guid of a dataset
Split |
Close |
Expand all |
Collapse all |
--- old/usr/src/uts/common/fs/zfs/zfs_ioctl.c
+++ new/usr/src/uts/common/fs/zfs/zfs_ioctl.c
1 1 /*
2 2 * CDDL HEADER START
3 3 *
4 4 * The contents of this file are subject to the terms of the
5 5 * Common Development and Distribution License (the "License").
6 6 * You may not use this file except in compliance with the License.
7 7 *
8 8 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
9 9 * or http://www.opensolaris.org/os/licensing.
10 10 * See the License for the specific language governing permissions
11 11 * and limitations under the License.
12 12 *
13 13 * When distributing Covered Code, include this CDDL HEADER in each
14 14 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
15 15 * If applicable, add the following below this CDDL HEADER, with the
16 16 * fields enclosed by brackets "[]" replaced with your own identifying
17 17 * information: Portions Copyright [yyyy] [name of copyright owner]
18 18 *
19 19 * CDDL HEADER END
20 20 */
21 21
22 22 /*
23 23 * Copyright (c) 2005, 2010, Oracle and/or its affiliates. All rights reserved.
24 24 * Portions Copyright 2011 Martin Matuska
25 25 * Copyright 2015 Nexenta Systems, Inc. All rights reserved.
26 26 * Copyright (c) 2014, Joyent, Inc. All rights reserved.
27 27 * Copyright (c) 2011, 2015 by Delphix. All rights reserved.
28 28 * Copyright (c) 2013 by Saso Kiselkov. All rights reserved.
29 29 * Copyright (c) 2013 Steven Hartland. All rights reserved.
30 30 */
31 31
32 32 /*
33 33 * ZFS ioctls.
34 34 *
35 35 * This file handles the ioctls to /dev/zfs, used for configuring ZFS storage
36 36 * pools and filesystems, e.g. with /sbin/zfs and /sbin/zpool.
37 37 *
38 38 * There are two ways that we handle ioctls: the legacy way where almost
39 39 * all of the logic is in the ioctl callback, and the new way where most
40 40 * of the marshalling is handled in the common entry point, zfsdev_ioctl().
41 41 *
42 42 * Non-legacy ioctls should be registered by calling
43 43 * zfs_ioctl_register() from zfs_ioctl_init(). The ioctl is invoked
44 44 * from userland by lzc_ioctl().
45 45 *
46 46 * The registration arguments are as follows:
47 47 *
48 48 * const char *name
49 49 * The name of the ioctl. This is used for history logging. If the
50 50 * ioctl returns successfully (the callback returns 0), and allow_log
51 51 * is true, then a history log entry will be recorded with the input &
52 52 * output nvlists. The log entry can be printed with "zpool history -i".
53 53 *
54 54 * zfs_ioc_t ioc
55 55 * The ioctl request number, which userland will pass to ioctl(2).
56 56 * The ioctl numbers can change from release to release, because
57 57 * the caller (libzfs) must be matched to the kernel.
58 58 *
59 59 * zfs_secpolicy_func_t *secpolicy
60 60 * This function will be called before the zfs_ioc_func_t, to
61 61 * determine if this operation is permitted. It should return EPERM
62 62 * on failure, and 0 on success. Checks include determining if the
63 63 * dataset is visible in this zone, and if the user has either all
64 64 * zfs privileges in the zone (SYS_MOUNT), or has been granted permission
65 65 * to do this operation on this dataset with "zfs allow".
66 66 *
67 67 * zfs_ioc_namecheck_t namecheck
68 68 * This specifies what to expect in the zfs_cmd_t:zc_name -- a pool
69 69 * name, a dataset name, or nothing. If the name is not well-formed,
70 70 * the ioctl will fail and the callback will not be called.
71 71 * Therefore, the callback can assume that the name is well-formed
72 72 * (e.g. is null-terminated, doesn't have more than one '@' character,
73 73 * doesn't have invalid characters).
74 74 *
75 75 * zfs_ioc_poolcheck_t pool_check
76 76 * This specifies requirements on the pool state. If the pool does
77 77 * not meet them (is suspended or is readonly), the ioctl will fail
78 78 * and the callback will not be called. If any checks are specified
79 79 * (i.e. it is not POOL_CHECK_NONE), namecheck must not be NO_NAME.
80 80 * Multiple checks can be or-ed together (e.g. POOL_CHECK_SUSPENDED |
81 81 * POOL_CHECK_READONLY).
82 82 *
83 83 * boolean_t smush_outnvlist
84 84 * If smush_outnvlist is true, then the output is presumed to be a
85 85 * list of errors, and it will be "smushed" down to fit into the
86 86 * caller's buffer, by removing some entries and replacing them with a
87 87 * single "N_MORE_ERRORS" entry indicating how many were removed. See
88 88 * nvlist_smush() for details. If smush_outnvlist is false, and the
89 89 * outnvlist does not fit into the userland-provided buffer, then the
90 90 * ioctl will fail with ENOMEM.
91 91 *
92 92 * zfs_ioc_func_t *func
93 93 * The callback function that will perform the operation.
94 94 *
95 95 * The callback should return 0 on success, or an error number on
96 96 * failure. If the function fails, the userland ioctl will return -1,
97 97 * and errno will be set to the callback's return value. The callback
98 98 * will be called with the following arguments:
99 99 *
100 100 * const char *name
101 101 * The name of the pool or dataset to operate on, from
102 102 * zfs_cmd_t:zc_name. The 'namecheck' argument specifies the
103 103 * expected type (pool, dataset, or none).
104 104 *
105 105 * nvlist_t *innvl
106 106 * The input nvlist, deserialized from zfs_cmd_t:zc_nvlist_src. Or
107 107 * NULL if no input nvlist was provided. Changes to this nvlist are
108 108 * ignored. If the input nvlist could not be deserialized, the
109 109 * ioctl will fail and the callback will not be called.
110 110 *
111 111 * nvlist_t *outnvl
112 112 * The output nvlist, initially empty. The callback can fill it in,
113 113 * and it will be returned to userland by serializing it into
114 114 * zfs_cmd_t:zc_nvlist_dst. If it is non-empty, and serialization
115 115 * fails (e.g. because the caller didn't supply a large enough
116 116 * buffer), then the overall ioctl will fail. See the
117 117 * 'smush_outnvlist' argument above for additional behaviors.
118 118 *
119 119 * There are two typical uses of the output nvlist:
120 120 * - To return state, e.g. property values. In this case,
121 121 * smush_outnvlist should be false. If the buffer was not large
122 122 * enough, the caller will reallocate a larger buffer and try
123 123 * the ioctl again.
124 124 *
125 125 * - To return multiple errors from an ioctl which makes on-disk
126 126 * changes. In this case, smush_outnvlist should be true.
127 127 * Ioctls which make on-disk modifications should generally not
128 128 * use the outnvl if they succeed, because the caller can not
129 129 * distinguish between the operation failing, and
130 130 * deserialization failing.
131 131 */
132 132
133 133 #include <sys/types.h>
134 134 #include <sys/param.h>
135 135 #include <sys/errno.h>
136 136 #include <sys/uio.h>
137 137 #include <sys/buf.h>
138 138 #include <sys/modctl.h>
139 139 #include <sys/open.h>
140 140 #include <sys/file.h>
141 141 #include <sys/kmem.h>
142 142 #include <sys/conf.h>
143 143 #include <sys/cmn_err.h>
144 144 #include <sys/stat.h>
145 145 #include <sys/zfs_ioctl.h>
146 146 #include <sys/zfs_vfsops.h>
147 147 #include <sys/zfs_znode.h>
148 148 #include <sys/zap.h>
149 149 #include <sys/spa.h>
150 150 #include <sys/spa_impl.h>
151 151 #include <sys/vdev.h>
152 152 #include <sys/priv_impl.h>
153 153 #include <sys/dmu.h>
154 154 #include <sys/dsl_dir.h>
155 155 #include <sys/dsl_dataset.h>
156 156 #include <sys/dsl_prop.h>
157 157 #include <sys/dsl_deleg.h>
158 158 #include <sys/dmu_objset.h>
159 159 #include <sys/dmu_impl.h>
160 160 #include <sys/dmu_tx.h>
161 161 #include <sys/ddi.h>
162 162 #include <sys/sunddi.h>
163 163 #include <sys/sunldi.h>
164 164 #include <sys/policy.h>
165 165 #include <sys/zone.h>
166 166 #include <sys/nvpair.h>
167 167 #include <sys/pathname.h>
168 168 #include <sys/mount.h>
169 169 #include <sys/sdt.h>
170 170 #include <sys/fs/zfs.h>
171 171 #include <sys/zfs_ctldir.h>
172 172 #include <sys/zfs_dir.h>
173 173 #include <sys/zfs_onexit.h>
174 174 #include <sys/zvol.h>
175 175 #include <sys/dsl_scan.h>
176 176 #include <sharefs/share.h>
177 177 #include <sys/dmu_objset.h>
178 178 #include <sys/dmu_send.h>
179 179 #include <sys/dsl_destroy.h>
180 180 #include <sys/dsl_bookmark.h>
181 181 #include <sys/dsl_userhold.h>
182 182 #include <sys/zfeature.h>
183 183 #include <sys/zio_checksum.h>
184 184
185 185 #include "zfs_namecheck.h"
186 186 #include "zfs_prop.h"
187 187 #include "zfs_deleg.h"
188 188 #include "zfs_comutil.h"
189 189
190 190 extern struct modlfs zfs_modlfs;
191 191
192 192 extern void zfs_init(void);
193 193 extern void zfs_fini(void);
194 194
195 195 ldi_ident_t zfs_li = NULL;
196 196 dev_info_t *zfs_dip;
197 197
198 198 uint_t zfs_fsyncer_key;
199 199 extern uint_t rrw_tsd_key;
200 200 static uint_t zfs_allow_log_key;
201 201
/* Legacy-style ioctl callback: operates directly on the zfs_cmd_t. */
typedef int zfs_ioc_legacy_func_t(zfs_cmd_t *);
/* New-style ioctl callback: (name, input nvlist, output nvlist). */
typedef int zfs_ioc_func_t(const char *, nvlist_t *, nvlist_t *);
/* Permission check that is called before the ioctl callback. */
typedef int zfs_secpolicy_func_t(zfs_cmd_t *, nvlist_t *, cred_t *);

/* What kind of name, if any, is expected in zfs_cmd_t:zc_name. */
typedef enum {
	NO_NAME,
	POOL_NAME,
	DATASET_NAME
} zfs_ioc_namecheck_t;

/*
 * Requirements on the pool state; values are bit flags so that several
 * checks can be or-ed together.
 */
typedef enum {
	POOL_CHECK_NONE		= 1 << 0,
	POOL_CHECK_SUSPENDED	= 1 << 1,
	POOL_CHECK_READONLY	= 1 << 2,
} zfs_ioc_poolcheck_t;

/*
 * Per-ioctl registration record; see the block comment at the top of this
 * file for the meaning of the registration arguments.
 */
typedef struct zfs_ioc_vec {
	zfs_ioc_legacy_func_t	*zvec_legacy_func;	/* legacy callback */
	zfs_ioc_func_t		*zvec_func;		/* new-style callback */
	zfs_secpolicy_func_t	*zvec_secpolicy;	/* permission check */
	zfs_ioc_namecheck_t	zvec_namecheck;		/* expected zc_name */
	boolean_t		zvec_allow_log;		/* history logging */
	zfs_ioc_poolcheck_t	zvec_pool_check;	/* pool state checks */
	boolean_t		zvec_smush_outnvlist;	/* shrink error list */
	const char		*zvec_name;		/* name used for logging */
} zfs_ioc_vec_t;

/* This array is indexed by zfs_userquota_prop_t */
static const char *userquota_perms[] = {
	ZFS_DELEG_PERM_USERUSED,
	ZFS_DELEG_PERM_USERQUOTA,
	ZFS_DELEG_PERM_GROUPUSED,
	ZFS_DELEG_PERM_GROUPQUOTA,
};
236 236
237 237 static int zfs_ioc_userspace_upgrade(zfs_cmd_t *zc);
238 238 static int zfs_check_settable(const char *name, nvpair_t *property,
239 239 cred_t *cr);
240 240 static int zfs_check_clearable(char *dataset, nvlist_t *props,
241 241 nvlist_t **errors);
242 242 static int zfs_fill_zplprops_root(uint64_t, nvlist_t *, nvlist_t *,
243 243 boolean_t *);
244 244 int zfs_set_prop_nvlist(const char *, zprop_source_t, nvlist_t *, nvlist_t *);
245 245 static int get_nvlist(uint64_t nvl, uint64_t size, int iflag, nvlist_t **nvp);
246 246
247 247 static int zfs_prop_activate_feature(spa_t *spa, spa_feature_t feature);
248 248
249 249 /* _NOTE(PRINTFLIKE(4)) - this is printf-like, but lint is too whiney */
250 250 void
251 251 __dprintf(const char *file, const char *func, int line, const char *fmt, ...)
252 252 {
253 253 const char *newfile;
254 254 char buf[512];
255 255 va_list adx;
256 256
257 257 /*
258 258 * Get rid of annoying "../common/" prefix to filename.
259 259 */
260 260 newfile = strrchr(file, '/');
261 261 if (newfile != NULL) {
262 262 newfile = newfile + 1; /* Get rid of leading / */
263 263 } else {
264 264 newfile = file;
265 265 }
266 266
267 267 va_start(adx, fmt);
268 268 (void) vsnprintf(buf, sizeof (buf), fmt, adx);
269 269 va_end(adx);
270 270
271 271 /*
272 272 * To get this data, use the zfs-dprintf probe as so:
273 273 * dtrace -q -n 'zfs-dprintf \
274 274 * /stringof(arg0) == "dbuf.c"/ \
275 275 * {printf("%s: %s", stringof(arg1), stringof(arg3))}'
276 276 * arg0 = file name
277 277 * arg1 = function name
278 278 * arg2 = line number
279 279 * arg3 = message
280 280 */
281 281 DTRACE_PROBE4(zfs__dprintf,
282 282 char *, newfile, char *, func, int, line, char *, buf);
283 283 }
284 284
285 285 static void
286 286 history_str_free(char *buf)
287 287 {
288 288 kmem_free(buf, HIS_MAX_RECORD_LEN);
289 289 }
290 290
291 291 static char *
292 292 history_str_get(zfs_cmd_t *zc)
293 293 {
294 294 char *buf;
295 295
296 296 if (zc->zc_history == NULL)
297 297 return (NULL);
298 298
299 299 buf = kmem_alloc(HIS_MAX_RECORD_LEN, KM_SLEEP);
300 300 if (copyinstr((void *)(uintptr_t)zc->zc_history,
301 301 buf, HIS_MAX_RECORD_LEN, NULL) != 0) {
302 302 history_str_free(buf);
303 303 return (NULL);
304 304 }
305 305
306 306 buf[HIS_MAX_RECORD_LEN -1] = '\0';
307 307
308 308 return (buf);
309 309 }
310 310
311 311 /*
312 312 * Check to see if the named dataset is currently defined as bootable
313 313 */
314 314 static boolean_t
315 315 zfs_is_bootfs(const char *name)
316 316 {
317 317 objset_t *os;
318 318
319 319 if (dmu_objset_hold(name, FTAG, &os) == 0) {
320 320 boolean_t ret;
321 321 ret = (dmu_objset_id(os) == spa_bootfs(dmu_objset_spa(os)));
322 322 dmu_objset_rele(os, FTAG);
323 323 return (ret);
324 324 }
325 325 return (B_FALSE);
326 326 }
327 327
328 328 /*
329 329 * Return non-zero if the spa version is less than requested version.
330 330 */
331 331 static int
332 332 zfs_earlier_version(const char *name, int version)
333 333 {
334 334 spa_t *spa;
335 335
336 336 if (spa_open(name, &spa, FTAG) == 0) {
337 337 if (spa_version(spa) < version) {
338 338 spa_close(spa, FTAG);
339 339 return (1);
340 340 }
341 341 spa_close(spa, FTAG);
342 342 }
343 343 return (0);
344 344 }
345 345
346 346 /*
347 347 * Return TRUE if the ZPL version is less than requested version.
348 348 */
349 349 static boolean_t
350 350 zpl_earlier_version(const char *name, int version)
351 351 {
352 352 objset_t *os;
353 353 boolean_t rc = B_TRUE;
354 354
355 355 if (dmu_objset_hold(name, FTAG, &os) == 0) {
356 356 uint64_t zplversion;
357 357
358 358 if (dmu_objset_type(os) != DMU_OST_ZFS) {
359 359 dmu_objset_rele(os, FTAG);
360 360 return (B_TRUE);
361 361 }
362 362 /* XXX reading from non-owned objset */
363 363 if (zfs_get_zplprop(os, ZFS_PROP_VERSION, &zplversion) == 0)
364 364 rc = zplversion < version;
365 365 dmu_objset_rele(os, FTAG);
366 366 }
367 367 return (rc);
368 368 }
369 369
370 370 static void
371 371 zfs_log_history(zfs_cmd_t *zc)
372 372 {
373 373 spa_t *spa;
374 374 char *buf;
375 375
376 376 if ((buf = history_str_get(zc)) == NULL)
377 377 return;
378 378
379 379 if (spa_open(zc->zc_name, &spa, FTAG) == 0) {
380 380 if (spa_version(spa) >= SPA_VERSION_ZPOOL_HISTORY)
381 381 (void) spa_history_log(spa, buf);
382 382 spa_close(spa, FTAG);
383 383 }
384 384 history_str_free(buf);
385 385 }
386 386
387 387 /*
388 388 * Policy for top-level read operations (list pools). Requires no privileges,
389 389 * and can be used in the local zone, as there is no associated dataset.
390 390 */
391 391 /* ARGSUSED */
392 392 static int
393 393 zfs_secpolicy_none(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
394 394 {
395 395 return (0);
396 396 }
397 397
398 398 /*
399 399 * Policy for dataset read operations (list children, get statistics). Requires
400 400 * no privileges, but must be visible in the local zone.
401 401 */
402 402 /* ARGSUSED */
403 403 static int
404 404 zfs_secpolicy_read(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
405 405 {
406 406 if (INGLOBALZONE(curproc) ||
407 407 zone_dataset_visible(zc->zc_name, NULL))
408 408 return (0);
409 409
410 410 return (SET_ERROR(ENOENT));
411 411 }
412 412
413 413 static int
414 414 zfs_dozonecheck_impl(const char *dataset, uint64_t zoned, cred_t *cr)
415 415 {
416 416 int writable = 1;
417 417
418 418 /*
419 419 * The dataset must be visible by this zone -- check this first
420 420 * so they don't see EPERM on something they shouldn't know about.
421 421 */
422 422 if (!INGLOBALZONE(curproc) &&
423 423 !zone_dataset_visible(dataset, &writable))
424 424 return (SET_ERROR(ENOENT));
425 425
426 426 if (INGLOBALZONE(curproc)) {
427 427 /*
428 428 * If the fs is zoned, only root can access it from the
429 429 * global zone.
430 430 */
431 431 if (secpolicy_zfs(cr) && zoned)
432 432 return (SET_ERROR(EPERM));
433 433 } else {
434 434 /*
435 435 * If we are in a local zone, the 'zoned' property must be set.
436 436 */
437 437 if (!zoned)
438 438 return (SET_ERROR(EPERM));
439 439
440 440 /* must be writable by this zone */
441 441 if (!writable)
442 442 return (SET_ERROR(EPERM));
443 443 }
444 444 return (0);
445 445 }
446 446
447 447 static int
448 448 zfs_dozonecheck(const char *dataset, cred_t *cr)
449 449 {
450 450 uint64_t zoned;
451 451
452 452 if (dsl_prop_get_integer(dataset, "zoned", &zoned, NULL))
453 453 return (SET_ERROR(ENOENT));
454 454
455 455 return (zfs_dozonecheck_impl(dataset, zoned, cr));
456 456 }
457 457
458 458 static int
459 459 zfs_dozonecheck_ds(const char *dataset, dsl_dataset_t *ds, cred_t *cr)
460 460 {
461 461 uint64_t zoned;
462 462
463 463 if (dsl_prop_get_int_ds(ds, "zoned", &zoned))
464 464 return (SET_ERROR(ENOENT));
465 465
466 466 return (zfs_dozonecheck_impl(dataset, zoned, cr));
467 467 }
468 468
469 469 static int
470 470 zfs_secpolicy_write_perms_ds(const char *name, dsl_dataset_t *ds,
471 471 const char *perm, cred_t *cr)
472 472 {
473 473 int error;
474 474
475 475 error = zfs_dozonecheck_ds(name, ds, cr);
476 476 if (error == 0) {
477 477 error = secpolicy_zfs(cr);
478 478 if (error != 0)
479 479 error = dsl_deleg_access_impl(ds, perm, cr);
480 480 }
481 481 return (error);
482 482 }
483 483
484 484 static int
485 485 zfs_secpolicy_write_perms(const char *name, const char *perm, cred_t *cr)
486 486 {
487 487 int error;
488 488 dsl_dataset_t *ds;
489 489 dsl_pool_t *dp;
490 490
491 491 error = dsl_pool_hold(name, FTAG, &dp);
492 492 if (error != 0)
493 493 return (error);
494 494
495 495 error = dsl_dataset_hold(dp, name, FTAG, &ds);
496 496 if (error != 0) {
497 497 dsl_pool_rele(dp, FTAG);
498 498 return (error);
499 499 }
500 500
501 501 error = zfs_secpolicy_write_perms_ds(name, ds, perm, cr);
502 502
503 503 dsl_dataset_rele(ds, FTAG);
504 504 dsl_pool_rele(dp, FTAG);
505 505 return (error);
506 506 }
507 507
508 508 /*
509 509 * Policy for setting the security label property.
510 510 *
511 511 * Returns 0 for success, non-zero for access and other errors.
512 512 */
513 513 static int
514 514 zfs_set_slabel_policy(const char *name, char *strval, cred_t *cr)
515 515 {
516 516 char ds_hexsl[MAXNAMELEN];
517 517 bslabel_t ds_sl, new_sl;
518 518 boolean_t new_default = FALSE;
519 519 uint64_t zoned;
520 520 int needed_priv = -1;
521 521 int error;
522 522
523 523 /* First get the existing dataset label. */
524 524 error = dsl_prop_get(name, zfs_prop_to_name(ZFS_PROP_MLSLABEL),
525 525 1, sizeof (ds_hexsl), &ds_hexsl, NULL);
526 526 if (error != 0)
527 527 return (SET_ERROR(EPERM));
528 528
529 529 if (strcasecmp(strval, ZFS_MLSLABEL_DEFAULT) == 0)
530 530 new_default = TRUE;
531 531
532 532 /* The label must be translatable */
533 533 if (!new_default && (hexstr_to_label(strval, &new_sl) != 0))
534 534 return (SET_ERROR(EINVAL));
535 535
536 536 /*
537 537 * In a non-global zone, disallow attempts to set a label that
538 538 * doesn't match that of the zone; otherwise no other checks
539 539 * are needed.
540 540 */
541 541 if (!INGLOBALZONE(curproc)) {
542 542 if (new_default || !blequal(&new_sl, CR_SL(CRED())))
543 543 return (SET_ERROR(EPERM));
544 544 return (0);
545 545 }
546 546
547 547 /*
548 548 * For global-zone datasets (i.e., those whose zoned property is
549 549 * "off", verify that the specified new label is valid for the
550 550 * global zone.
551 551 */
552 552 if (dsl_prop_get_integer(name,
553 553 zfs_prop_to_name(ZFS_PROP_ZONED), &zoned, NULL))
554 554 return (SET_ERROR(EPERM));
555 555 if (!zoned) {
556 556 if (zfs_check_global_label(name, strval) != 0)
557 557 return (SET_ERROR(EPERM));
558 558 }
559 559
560 560 /*
561 561 * If the existing dataset label is nondefault, check if the
562 562 * dataset is mounted (label cannot be changed while mounted).
563 563 * Get the zfsvfs; if there isn't one, then the dataset isn't
564 564 * mounted (or isn't a dataset, doesn't exist, ...).
565 565 */
566 566 if (strcasecmp(ds_hexsl, ZFS_MLSLABEL_DEFAULT) != 0) {
567 567 objset_t *os;
568 568 static char *setsl_tag = "setsl_tag";
569 569
570 570 /*
571 571 * Try to own the dataset; abort if there is any error,
572 572 * (e.g., already mounted, in use, or other error).
573 573 */
574 574 error = dmu_objset_own(name, DMU_OST_ZFS, B_TRUE,
575 575 setsl_tag, &os);
576 576 if (error != 0)
577 577 return (SET_ERROR(EPERM));
578 578
579 579 dmu_objset_disown(os, setsl_tag);
580 580
581 581 if (new_default) {
582 582 needed_priv = PRIV_FILE_DOWNGRADE_SL;
583 583 goto out_check;
584 584 }
585 585
586 586 if (hexstr_to_label(strval, &new_sl) != 0)
587 587 return (SET_ERROR(EPERM));
588 588
589 589 if (blstrictdom(&ds_sl, &new_sl))
590 590 needed_priv = PRIV_FILE_DOWNGRADE_SL;
591 591 else if (blstrictdom(&new_sl, &ds_sl))
592 592 needed_priv = PRIV_FILE_UPGRADE_SL;
593 593 } else {
594 594 /* dataset currently has a default label */
595 595 if (!new_default)
596 596 needed_priv = PRIV_FILE_UPGRADE_SL;
597 597 }
598 598
599 599 out_check:
600 600 if (needed_priv != -1)
601 601 return (PRIV_POLICY(cr, needed_priv, B_FALSE, EPERM, NULL));
602 602 return (0);
603 603 }
604 604
605 605 static int
606 606 zfs_secpolicy_setprop(const char *dsname, zfs_prop_t prop, nvpair_t *propval,
607 607 cred_t *cr)
608 608 {
609 609 char *strval;
610 610
611 611 /*
612 612 * Check permissions for special properties.
613 613 */
614 614 switch (prop) {
615 615 case ZFS_PROP_ZONED:
616 616 /*
617 617 * Disallow setting of 'zoned' from within a local zone.
618 618 */
619 619 if (!INGLOBALZONE(curproc))
620 620 return (SET_ERROR(EPERM));
621 621 break;
622 622
623 623 case ZFS_PROP_QUOTA:
624 624 case ZFS_PROP_FILESYSTEM_LIMIT:
625 625 case ZFS_PROP_SNAPSHOT_LIMIT:
626 626 if (!INGLOBALZONE(curproc)) {
627 627 uint64_t zoned;
628 628 char setpoint[MAXNAMELEN];
629 629 /*
630 630 * Unprivileged users are allowed to modify the
631 631 * limit on things *under* (ie. contained by)
632 632 * the thing they own.
633 633 */
634 634 if (dsl_prop_get_integer(dsname, "zoned", &zoned,
635 635 setpoint))
636 636 return (SET_ERROR(EPERM));
637 637 if (!zoned || strlen(dsname) <= strlen(setpoint))
638 638 return (SET_ERROR(EPERM));
639 639 }
640 640 break;
641 641
642 642 case ZFS_PROP_MLSLABEL:
643 643 if (!is_system_labeled())
644 644 return (SET_ERROR(EPERM));
645 645
646 646 if (nvpair_value_string(propval, &strval) == 0) {
647 647 int err;
648 648
649 649 err = zfs_set_slabel_policy(dsname, strval, CRED());
650 650 if (err != 0)
651 651 return (err);
652 652 }
653 653 break;
654 654 }
655 655
656 656 return (zfs_secpolicy_write_perms(dsname, zfs_prop_to_name(prop), cr));
657 657 }
658 658
659 659 /* ARGSUSED */
660 660 static int
661 661 zfs_secpolicy_set_fsacl(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
662 662 {
663 663 int error;
664 664
665 665 error = zfs_dozonecheck(zc->zc_name, cr);
666 666 if (error != 0)
667 667 return (error);
668 668
669 669 /*
670 670 * permission to set permissions will be evaluated later in
671 671 * dsl_deleg_can_allow()
672 672 */
673 673 return (0);
674 674 }
675 675
676 676 /* ARGSUSED */
677 677 static int
678 678 zfs_secpolicy_rollback(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
679 679 {
680 680 return (zfs_secpolicy_write_perms(zc->zc_name,
681 681 ZFS_DELEG_PERM_ROLLBACK, cr));
682 682 }
683 683
684 684 /* ARGSUSED */
685 685 static int
686 686 zfs_secpolicy_send(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
687 687 {
688 688 dsl_pool_t *dp;
689 689 dsl_dataset_t *ds;
690 690 char *cp;
691 691 int error;
692 692
693 693 /*
694 694 * Generate the current snapshot name from the given objsetid, then
695 695 * use that name for the secpolicy/zone checks.
696 696 */
697 697 cp = strchr(zc->zc_name, '@');
698 698 if (cp == NULL)
699 699 return (SET_ERROR(EINVAL));
700 700 error = dsl_pool_hold(zc->zc_name, FTAG, &dp);
701 701 if (error != 0)
702 702 return (error);
703 703
704 704 error = dsl_dataset_hold_obj(dp, zc->zc_sendobj, FTAG, &ds);
705 705 if (error != 0) {
706 706 dsl_pool_rele(dp, FTAG);
707 707 return (error);
708 708 }
709 709
710 710 dsl_dataset_name(ds, zc->zc_name);
711 711
712 712 error = zfs_secpolicy_write_perms_ds(zc->zc_name, ds,
713 713 ZFS_DELEG_PERM_SEND, cr);
714 714 dsl_dataset_rele(ds, FTAG);
715 715 dsl_pool_rele(dp, FTAG);
716 716
717 717 return (error);
718 718 }
719 719
720 720 /* ARGSUSED */
721 721 static int
722 722 zfs_secpolicy_send_new(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
723 723 {
724 724 return (zfs_secpolicy_write_perms(zc->zc_name,
725 725 ZFS_DELEG_PERM_SEND, cr));
726 726 }
727 727
728 728 /* ARGSUSED */
729 729 static int
730 730 zfs_secpolicy_deleg_share(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
731 731 {
732 732 vnode_t *vp;
733 733 int error;
734 734
735 735 if ((error = lookupname(zc->zc_value, UIO_SYSSPACE,
736 736 NO_FOLLOW, NULL, &vp)) != 0)
737 737 return (error);
738 738
739 739 /* Now make sure mntpnt and dataset are ZFS */
740 740
741 741 if (vp->v_vfsp->vfs_fstype != zfsfstype ||
742 742 (strcmp((char *)refstr_value(vp->v_vfsp->vfs_resource),
743 743 zc->zc_name) != 0)) {
744 744 VN_RELE(vp);
745 745 return (SET_ERROR(EPERM));
746 746 }
747 747
748 748 VN_RELE(vp);
749 749 return (dsl_deleg_access(zc->zc_name,
750 750 ZFS_DELEG_PERM_SHARE, cr));
751 751 }
752 752
753 753 int
754 754 zfs_secpolicy_share(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
755 755 {
756 756 if (!INGLOBALZONE(curproc))
757 757 return (SET_ERROR(EPERM));
758 758
759 759 if (secpolicy_nfs(cr) == 0) {
760 760 return (0);
761 761 } else {
762 762 return (zfs_secpolicy_deleg_share(zc, innvl, cr));
763 763 }
764 764 }
765 765
766 766 int
767 767 zfs_secpolicy_smb_acl(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
768 768 {
769 769 if (!INGLOBALZONE(curproc))
770 770 return (SET_ERROR(EPERM));
771 771
772 772 if (secpolicy_smb(cr) == 0) {
773 773 return (0);
774 774 } else {
775 775 return (zfs_secpolicy_deleg_share(zc, innvl, cr));
776 776 }
777 777 }
778 778
/*
 * Compute the parent of 'datasetname' by stripping the trailing "@bla" or
 * "/bla" component, and store it in 'parent'.
 *
 * datasetname - NUL-terminated dataset or snapshot name
 * parent      - output buffer
 * parentsize  - size of 'parent' in bytes
 *
 * Returns 0 on success, ENOENT if the name has neither an '@' nor a '/'
 * (i.e. it has no parent), EINVAL if parentsize is not positive, and
 * ENAMETOOLONG if the name does not fit in 'parent'.
 */
static int
zfs_get_parent(const char *datasetname, char *parent, int parentsize)
{
	char *cp;

	if (parentsize <= 0)
		return (SET_ERROR(EINVAL));

	/*
	 * strncpy() does not NUL-terminate when the source fills the
	 * destination, which would let the strrchr() calls below run off
	 * the end of 'parent'.  Refuse names that do not fit instead of
	 * silently working on a truncated (and therefore wrong) name.
	 */
	if (strlen(datasetname) >= (size_t)parentsize)
		return (SET_ERROR(ENAMETOOLONG));

	/*
	 * Remove the @bla or /bla from the end of the name to get the parent.
	 */
	(void) strncpy(parent, datasetname, parentsize);
	cp = strrchr(parent, '@');
	if (cp != NULL) {
		cp[0] = '\0';
	} else {
		cp = strrchr(parent, '/');
		if (cp == NULL)
			return (SET_ERROR(ENOENT));
		cp[0] = '\0';
	}

	return (0);
}
800 800
801 801 int
802 802 zfs_secpolicy_destroy_perms(const char *name, cred_t *cr)
803 803 {
804 804 int error;
805 805
806 806 if ((error = zfs_secpolicy_write_perms(name,
807 807 ZFS_DELEG_PERM_MOUNT, cr)) != 0)
808 808 return (error);
809 809
810 810 return (zfs_secpolicy_write_perms(name, ZFS_DELEG_PERM_DESTROY, cr));
811 811 }
812 812
813 813 /* ARGSUSED */
814 814 static int
815 815 zfs_secpolicy_destroy(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
816 816 {
817 817 return (zfs_secpolicy_destroy_perms(zc->zc_name, cr));
818 818 }
819 819
820 820 /*
821 821 * Destroying snapshots with delegated permissions requires
822 822 * descendant mount and destroy permissions.
823 823 */
824 824 /* ARGSUSED */
825 825 static int
826 826 zfs_secpolicy_destroy_snaps(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
827 827 {
828 828 nvlist_t *snaps;
829 829 nvpair_t *pair, *nextpair;
830 830 int error = 0;
831 831
832 832 if (nvlist_lookup_nvlist(innvl, "snaps", &snaps) != 0)
833 833 return (SET_ERROR(EINVAL));
834 834 for (pair = nvlist_next_nvpair(snaps, NULL); pair != NULL;
835 835 pair = nextpair) {
836 836 nextpair = nvlist_next_nvpair(snaps, pair);
837 837 error = zfs_secpolicy_destroy_perms(nvpair_name(pair), cr);
838 838 if (error == ENOENT) {
839 839 /*
840 840 * Ignore any snapshots that don't exist (we consider
841 841 * them "already destroyed"). Remove the name from the
842 842 * nvl here in case the snapshot is created between
843 843 * now and when we try to destroy it (in which case
844 844 * we don't want to destroy it since we haven't
845 845 * checked for permission).
846 846 */
847 847 fnvlist_remove_nvpair(snaps, pair);
848 848 error = 0;
849 849 }
850 850 if (error != 0)
851 851 break;
852 852 }
853 853
854 854 return (error);
855 855 }
856 856
857 857 int
858 858 zfs_secpolicy_rename_perms(const char *from, const char *to, cred_t *cr)
859 859 {
860 860 char parentname[MAXNAMELEN];
861 861 int error;
862 862
863 863 if ((error = zfs_secpolicy_write_perms(from,
864 864 ZFS_DELEG_PERM_RENAME, cr)) != 0)
865 865 return (error);
866 866
867 867 if ((error = zfs_secpolicy_write_perms(from,
868 868 ZFS_DELEG_PERM_MOUNT, cr)) != 0)
869 869 return (error);
870 870
871 871 if ((error = zfs_get_parent(to, parentname,
872 872 sizeof (parentname))) != 0)
873 873 return (error);
874 874
875 875 if ((error = zfs_secpolicy_write_perms(parentname,
876 876 ZFS_DELEG_PERM_CREATE, cr)) != 0)
877 877 return (error);
878 878
879 879 if ((error = zfs_secpolicy_write_perms(parentname,
880 880 ZFS_DELEG_PERM_MOUNT, cr)) != 0)
881 881 return (error);
882 882
883 883 return (error);
884 884 }
885 885
886 886 /* ARGSUSED */
887 887 static int
888 888 zfs_secpolicy_rename(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
889 889 {
890 890 return (zfs_secpolicy_rename_perms(zc->zc_name, zc->zc_value, cr));
891 891 }
892 892
893 893 /* ARGSUSED */
894 894 static int
895 895 zfs_secpolicy_promote(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
896 896 {
897 897 dsl_pool_t *dp;
898 898 dsl_dataset_t *clone;
899 899 int error;
900 900
901 901 error = zfs_secpolicy_write_perms(zc->zc_name,
902 902 ZFS_DELEG_PERM_PROMOTE, cr);
903 903 if (error != 0)
904 904 return (error);
905 905
906 906 error = dsl_pool_hold(zc->zc_name, FTAG, &dp);
907 907 if (error != 0)
908 908 return (error);
909 909
910 910 error = dsl_dataset_hold(dp, zc->zc_name, FTAG, &clone);
911 911
912 912 if (error == 0) {
913 913 char parentname[MAXNAMELEN];
914 914 dsl_dataset_t *origin = NULL;
915 915 dsl_dir_t *dd;
916 916 dd = clone->ds_dir;
917 917
918 918 error = dsl_dataset_hold_obj(dd->dd_pool,
919 919 dsl_dir_phys(dd)->dd_origin_obj, FTAG, &origin);
920 920 if (error != 0) {
921 921 dsl_dataset_rele(clone, FTAG);
922 922 dsl_pool_rele(dp, FTAG);
923 923 return (error);
924 924 }
925 925
926 926 error = zfs_secpolicy_write_perms_ds(zc->zc_name, clone,
927 927 ZFS_DELEG_PERM_MOUNT, cr);
928 928
929 929 dsl_dataset_name(origin, parentname);
930 930 if (error == 0) {
931 931 error = zfs_secpolicy_write_perms_ds(parentname, origin,
932 932 ZFS_DELEG_PERM_PROMOTE, cr);
933 933 }
934 934 dsl_dataset_rele(clone, FTAG);
935 935 dsl_dataset_rele(origin, FTAG);
936 936 }
937 937 dsl_pool_rele(dp, FTAG);
938 938 return (error);
939 939 }
940 940
941 941 /* ARGSUSED */
942 942 static int
943 943 zfs_secpolicy_recv(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
944 944 {
945 945 int error;
946 946
947 947 if ((error = zfs_secpolicy_write_perms(zc->zc_name,
948 948 ZFS_DELEG_PERM_RECEIVE, cr)) != 0)
949 949 return (error);
950 950
951 951 if ((error = zfs_secpolicy_write_perms(zc->zc_name,
952 952 ZFS_DELEG_PERM_MOUNT, cr)) != 0)
953 953 return (error);
954 954
955 955 return (zfs_secpolicy_write_perms(zc->zc_name,
956 956 ZFS_DELEG_PERM_CREATE, cr));
957 957 }
958 958
959 959 int
960 960 zfs_secpolicy_snapshot_perms(const char *name, cred_t *cr)
961 961 {
962 962 return (zfs_secpolicy_write_perms(name,
963 963 ZFS_DELEG_PERM_SNAPSHOT, cr));
964 964 }
965 965
966 966 /*
967 967 * Check for permission to create each snapshot in the nvlist.
968 968 */
969 969 /* ARGSUSED */
970 970 static int
971 971 zfs_secpolicy_snapshot(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
972 972 {
973 973 nvlist_t *snaps;
974 974 int error = 0;
975 975 nvpair_t *pair;
976 976
977 977 if (nvlist_lookup_nvlist(innvl, "snaps", &snaps) != 0)
978 978 return (SET_ERROR(EINVAL));
979 979 for (pair = nvlist_next_nvpair(snaps, NULL); pair != NULL;
980 980 pair = nvlist_next_nvpair(snaps, pair)) {
981 981 char *name = nvpair_name(pair);
982 982 char *atp = strchr(name, '@');
983 983
984 984 if (atp == NULL) {
985 985 error = SET_ERROR(EINVAL);
986 986 break;
987 987 }
988 988 *atp = '\0';
989 989 error = zfs_secpolicy_snapshot_perms(name, cr);
990 990 *atp = '@';
991 991 if (error != 0)
992 992 break;
993 993 }
994 994 return (error);
995 995 }
996 996
997 997 /*
998 998 * Check for permission to create each snapshot in the nvlist.
999 999 */
1000 1000 /* ARGSUSED */
1001 1001 static int
1002 1002 zfs_secpolicy_bookmark(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
1003 1003 {
1004 1004 int error = 0;
1005 1005
1006 1006 for (nvpair_t *pair = nvlist_next_nvpair(innvl, NULL);
1007 1007 pair != NULL; pair = nvlist_next_nvpair(innvl, pair)) {
1008 1008 char *name = nvpair_name(pair);
1009 1009 char *hashp = strchr(name, '#');
1010 1010
1011 1011 if (hashp == NULL) {
1012 1012 error = SET_ERROR(EINVAL);
1013 1013 break;
1014 1014 }
1015 1015 *hashp = '\0';
1016 1016 error = zfs_secpolicy_write_perms(name,
1017 1017 ZFS_DELEG_PERM_BOOKMARK, cr);
1018 1018 *hashp = '#';
1019 1019 if (error != 0)
1020 1020 break;
1021 1021 }
1022 1022 return (error);
1023 1023 }
1024 1024
1025 1025 /* ARGSUSED */
1026 1026 static int
1027 1027 zfs_secpolicy_destroy_bookmarks(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
1028 1028 {
1029 1029 nvpair_t *pair, *nextpair;
1030 1030 int error = 0;
1031 1031
1032 1032 for (pair = nvlist_next_nvpair(innvl, NULL); pair != NULL;
1033 1033 pair = nextpair) {
1034 1034 char *name = nvpair_name(pair);
1035 1035 char *hashp = strchr(name, '#');
1036 1036 nextpair = nvlist_next_nvpair(innvl, pair);
1037 1037
1038 1038 if (hashp == NULL) {
1039 1039 error = SET_ERROR(EINVAL);
1040 1040 break;
1041 1041 }
1042 1042
1043 1043 *hashp = '\0';
1044 1044 error = zfs_secpolicy_write_perms(name,
1045 1045 ZFS_DELEG_PERM_DESTROY, cr);
1046 1046 *hashp = '#';
1047 1047 if (error == ENOENT) {
1048 1048 /*
1049 1049 * Ignore any filesystems that don't exist (we consider
1050 1050 * their bookmarks "already destroyed"). Remove
1051 1051 * the name from the nvl here in case the filesystem
1052 1052 * is created between now and when we try to destroy
1053 1053 * the bookmark (in which case we don't want to
1054 1054 * destroy it since we haven't checked for permission).
1055 1055 */
1056 1056 fnvlist_remove_nvpair(innvl, pair);
1057 1057 error = 0;
1058 1058 }
1059 1059 if (error != 0)
1060 1060 break;
1061 1061 }
1062 1062
1063 1063 return (error);
1064 1064 }
1065 1065
1066 1066 /* ARGSUSED */
1067 1067 static int
1068 1068 zfs_secpolicy_log_history(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
1069 1069 {
1070 1070 /*
1071 1071 * Even root must have a proper TSD so that we know what pool
1072 1072 * to log to.
1073 1073 */
1074 1074 if (tsd_get(zfs_allow_log_key) == NULL)
1075 1075 return (SET_ERROR(EPERM));
1076 1076 return (0);
1077 1077 }
1078 1078
1079 1079 static int
1080 1080 zfs_secpolicy_create_clone(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
1081 1081 {
1082 1082 char parentname[MAXNAMELEN];
1083 1083 int error;
1084 1084 char *origin;
1085 1085
1086 1086 if ((error = zfs_get_parent(zc->zc_name, parentname,
1087 1087 sizeof (parentname))) != 0)
1088 1088 return (error);
1089 1089
1090 1090 if (nvlist_lookup_string(innvl, "origin", &origin) == 0 &&
1091 1091 (error = zfs_secpolicy_write_perms(origin,
1092 1092 ZFS_DELEG_PERM_CLONE, cr)) != 0)
1093 1093 return (error);
1094 1094
1095 1095 if ((error = zfs_secpolicy_write_perms(parentname,
1096 1096 ZFS_DELEG_PERM_CREATE, cr)) != 0)
1097 1097 return (error);
1098 1098
1099 1099 return (zfs_secpolicy_write_perms(parentname,
1100 1100 ZFS_DELEG_PERM_MOUNT, cr));
1101 1101 }
1102 1102
1103 1103 /*
1104 1104 * Policy for pool operations - create/destroy pools, add vdevs, etc. Requires
1105 1105 * SYS_CONFIG privilege, which is not available in a local zone.
1106 1106 */
1107 1107 /* ARGSUSED */
1108 1108 static int
1109 1109 zfs_secpolicy_config(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
1110 1110 {
1111 1111 if (secpolicy_sys_config(cr, B_FALSE) != 0)
1112 1112 return (SET_ERROR(EPERM));
1113 1113
1114 1114 return (0);
1115 1115 }
1116 1116
1117 1117 /*
1118 1118 * Policy for object to name lookups.
1119 1119 */
1120 1120 /* ARGSUSED */
1121 1121 static int
1122 1122 zfs_secpolicy_diff(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
1123 1123 {
1124 1124 int error;
1125 1125
1126 1126 if ((error = secpolicy_sys_config(cr, B_FALSE)) == 0)
1127 1127 return (0);
1128 1128
1129 1129 error = zfs_secpolicy_write_perms(zc->zc_name, ZFS_DELEG_PERM_DIFF, cr);
1130 1130 return (error);
1131 1131 }
1132 1132
1133 1133 /*
1134 1134 * Policy for fault injection. Requires all privileges.
1135 1135 */
1136 1136 /* ARGSUSED */
1137 1137 static int
1138 1138 zfs_secpolicy_inject(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
1139 1139 {
1140 1140 return (secpolicy_zinject(cr));
1141 1141 }
1142 1142
1143 1143 /* ARGSUSED */
1144 1144 static int
1145 1145 zfs_secpolicy_inherit_prop(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
1146 1146 {
1147 1147 zfs_prop_t prop = zfs_name_to_prop(zc->zc_value);
1148 1148
1149 1149 if (prop == ZPROP_INVAL) {
1150 1150 if (!zfs_prop_user(zc->zc_value))
1151 1151 return (SET_ERROR(EINVAL));
1152 1152 return (zfs_secpolicy_write_perms(zc->zc_name,
1153 1153 ZFS_DELEG_PERM_USERPROP, cr));
1154 1154 } else {
1155 1155 return (zfs_secpolicy_setprop(zc->zc_name, prop,
1156 1156 NULL, cr));
1157 1157 }
1158 1158 }
1159 1159
1160 1160 static int
1161 1161 zfs_secpolicy_userspace_one(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
1162 1162 {
1163 1163 int err = zfs_secpolicy_read(zc, innvl, cr);
1164 1164 if (err)
1165 1165 return (err);
1166 1166
1167 1167 if (zc->zc_objset_type >= ZFS_NUM_USERQUOTA_PROPS)
1168 1168 return (SET_ERROR(EINVAL));
1169 1169
1170 1170 if (zc->zc_value[0] == 0) {
1171 1171 /*
1172 1172 * They are asking about a posix uid/gid. If it's
1173 1173 * themself, allow it.
1174 1174 */
1175 1175 if (zc->zc_objset_type == ZFS_PROP_USERUSED ||
1176 1176 zc->zc_objset_type == ZFS_PROP_USERQUOTA) {
1177 1177 if (zc->zc_guid == crgetuid(cr))
1178 1178 return (0);
1179 1179 } else {
1180 1180 if (groupmember(zc->zc_guid, cr))
1181 1181 return (0);
1182 1182 }
1183 1183 }
1184 1184
1185 1185 return (zfs_secpolicy_write_perms(zc->zc_name,
1186 1186 userquota_perms[zc->zc_objset_type], cr));
1187 1187 }
1188 1188
1189 1189 static int
1190 1190 zfs_secpolicy_userspace_many(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
1191 1191 {
1192 1192 int err = zfs_secpolicy_read(zc, innvl, cr);
1193 1193 if (err)
1194 1194 return (err);
1195 1195
1196 1196 if (zc->zc_objset_type >= ZFS_NUM_USERQUOTA_PROPS)
1197 1197 return (SET_ERROR(EINVAL));
1198 1198
1199 1199 return (zfs_secpolicy_write_perms(zc->zc_name,
1200 1200 userquota_perms[zc->zc_objset_type], cr));
1201 1201 }
1202 1202
1203 1203 /* ARGSUSED */
1204 1204 static int
1205 1205 zfs_secpolicy_userspace_upgrade(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
1206 1206 {
1207 1207 return (zfs_secpolicy_setprop(zc->zc_name, ZFS_PROP_VERSION,
1208 1208 NULL, cr));
1209 1209 }
1210 1210
1211 1211 /* ARGSUSED */
1212 1212 static int
1213 1213 zfs_secpolicy_hold(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
1214 1214 {
1215 1215 nvpair_t *pair;
1216 1216 nvlist_t *holds;
1217 1217 int error;
1218 1218
1219 1219 error = nvlist_lookup_nvlist(innvl, "holds", &holds);
1220 1220 if (error != 0)
1221 1221 return (SET_ERROR(EINVAL));
1222 1222
1223 1223 for (pair = nvlist_next_nvpair(holds, NULL); pair != NULL;
1224 1224 pair = nvlist_next_nvpair(holds, pair)) {
1225 1225 char fsname[MAXNAMELEN];
1226 1226 error = dmu_fsname(nvpair_name(pair), fsname);
1227 1227 if (error != 0)
1228 1228 return (error);
1229 1229 error = zfs_secpolicy_write_perms(fsname,
1230 1230 ZFS_DELEG_PERM_HOLD, cr);
1231 1231 if (error != 0)
1232 1232 return (error);
1233 1233 }
1234 1234 return (0);
1235 1235 }
1236 1236
1237 1237 /* ARGSUSED */
1238 1238 static int
1239 1239 zfs_secpolicy_release(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
1240 1240 {
1241 1241 nvpair_t *pair;
1242 1242 int error;
1243 1243
1244 1244 for (pair = nvlist_next_nvpair(innvl, NULL); pair != NULL;
1245 1245 pair = nvlist_next_nvpair(innvl, pair)) {
1246 1246 char fsname[MAXNAMELEN];
1247 1247 error = dmu_fsname(nvpair_name(pair), fsname);
1248 1248 if (error != 0)
1249 1249 return (error);
1250 1250 error = zfs_secpolicy_write_perms(fsname,
1251 1251 ZFS_DELEG_PERM_RELEASE, cr);
1252 1252 if (error != 0)
1253 1253 return (error);
1254 1254 }
1255 1255 return (0);
1256 1256 }
1257 1257
1258 1258 /*
1259 1259 * Policy for allowing temporary snapshots to be taken or released
1260 1260 */
1261 1261 static int
1262 1262 zfs_secpolicy_tmp_snapshot(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
1263 1263 {
1264 1264 /*
1265 1265 * A temporary snapshot is the same as a snapshot,
1266 1266 * hold, destroy and release all rolled into one.
1267 1267 * Delegated diff alone is sufficient that we allow this.
1268 1268 */
1269 1269 int error;
1270 1270
1271 1271 if ((error = zfs_secpolicy_write_perms(zc->zc_name,
1272 1272 ZFS_DELEG_PERM_DIFF, cr)) == 0)
1273 1273 return (0);
1274 1274
1275 1275 error = zfs_secpolicy_snapshot_perms(zc->zc_name, cr);
1276 1276 if (error == 0)
1277 1277 error = zfs_secpolicy_hold(zc, innvl, cr);
1278 1278 if (error == 0)
1279 1279 error = zfs_secpolicy_release(zc, innvl, cr);
1280 1280 if (error == 0)
1281 1281 error = zfs_secpolicy_destroy(zc, innvl, cr);
1282 1282 return (error);
1283 1283 }
1284 1284
1285 1285 /*
1286 1286 * Returns the nvlist as specified by the user in the zfs_cmd_t.
1287 1287 */
1288 1288 static int
1289 1289 get_nvlist(uint64_t nvl, uint64_t size, int iflag, nvlist_t **nvp)
1290 1290 {
1291 1291 char *packed;
1292 1292 int error;
1293 1293 nvlist_t *list = NULL;
1294 1294
1295 1295 /*
1296 1296 * Read in and unpack the user-supplied nvlist.
1297 1297 */
1298 1298 if (size == 0)
1299 1299 return (SET_ERROR(EINVAL));
1300 1300
1301 1301 packed = kmem_alloc(size, KM_SLEEP);
1302 1302
1303 1303 if ((error = ddi_copyin((void *)(uintptr_t)nvl, packed, size,
1304 1304 iflag)) != 0) {
1305 1305 kmem_free(packed, size);
1306 1306 return (error);
1307 1307 }
1308 1308
1309 1309 if ((error = nvlist_unpack(packed, size, &list, 0)) != 0) {
1310 1310 kmem_free(packed, size);
1311 1311 return (error);
1312 1312 }
1313 1313
1314 1314 kmem_free(packed, size);
1315 1315
1316 1316 *nvp = list;
1317 1317 return (0);
1318 1318 }
1319 1319
1320 1320 /*
1321 1321 * Reduce the size of this nvlist until it can be serialized in 'max' bytes.
1322 1322 * Entries will be removed from the end of the nvlist, and one int32 entry
1323 1323 * named "N_MORE_ERRORS" will be added indicating how many entries were
1324 1324 * removed.
1325 1325 */
1326 1326 static int
1327 1327 nvlist_smush(nvlist_t *errors, size_t max)
1328 1328 {
1329 1329 size_t size;
1330 1330
1331 1331 size = fnvlist_size(errors);
1332 1332
1333 1333 if (size > max) {
1334 1334 nvpair_t *more_errors;
1335 1335 int n = 0;
1336 1336
1337 1337 if (max < 1024)
1338 1338 return (SET_ERROR(ENOMEM));
1339 1339
1340 1340 fnvlist_add_int32(errors, ZPROP_N_MORE_ERRORS, 0);
1341 1341 more_errors = nvlist_prev_nvpair(errors, NULL);
1342 1342
1343 1343 do {
1344 1344 nvpair_t *pair = nvlist_prev_nvpair(errors,
1345 1345 more_errors);
1346 1346 fnvlist_remove_nvpair(errors, pair);
1347 1347 n++;
1348 1348 size = fnvlist_size(errors);
1349 1349 } while (size > max);
1350 1350
1351 1351 fnvlist_remove_nvpair(errors, more_errors);
1352 1352 fnvlist_add_int32(errors, ZPROP_N_MORE_ERRORS, n);
1353 1353 ASSERT3U(fnvlist_size(errors), <=, max);
1354 1354 }
1355 1355
1356 1356 return (0);
1357 1357 }
1358 1358
1359 1359 static int
1360 1360 put_nvlist(zfs_cmd_t *zc, nvlist_t *nvl)
1361 1361 {
1362 1362 char *packed = NULL;
1363 1363 int error = 0;
1364 1364 size_t size;
1365 1365
1366 1366 size = fnvlist_size(nvl);
1367 1367
1368 1368 if (size > zc->zc_nvlist_dst_size) {
1369 1369 error = SET_ERROR(ENOMEM);
1370 1370 } else {
1371 1371 packed = fnvlist_pack(nvl, &size);
1372 1372 if (ddi_copyout(packed, (void *)(uintptr_t)zc->zc_nvlist_dst,
1373 1373 size, zc->zc_iflags) != 0)
1374 1374 error = SET_ERROR(EFAULT);
1375 1375 fnvlist_pack_free(packed, size);
1376 1376 }
1377 1377
1378 1378 zc->zc_nvlist_dst_size = size;
1379 1379 zc->zc_nvlist_dst_filled = B_TRUE;
1380 1380 return (error);
1381 1381 }
1382 1382
1383 1383 static int
1384 1384 getzfsvfs(const char *dsname, zfsvfs_t **zfvp)
1385 1385 {
1386 1386 objset_t *os;
1387 1387 int error;
1388 1388
1389 1389 error = dmu_objset_hold(dsname, FTAG, &os);
1390 1390 if (error != 0)
1391 1391 return (error);
1392 1392 if (dmu_objset_type(os) != DMU_OST_ZFS) {
1393 1393 dmu_objset_rele(os, FTAG);
1394 1394 return (SET_ERROR(EINVAL));
1395 1395 }
1396 1396
1397 1397 mutex_enter(&os->os_user_ptr_lock);
1398 1398 *zfvp = dmu_objset_get_user(os);
1399 1399 if (*zfvp) {
1400 1400 VFS_HOLD((*zfvp)->z_vfs);
1401 1401 } else {
1402 1402 error = SET_ERROR(ESRCH);
1403 1403 }
1404 1404 mutex_exit(&os->os_user_ptr_lock);
1405 1405 dmu_objset_rele(os, FTAG);
1406 1406 return (error);
1407 1407 }
1408 1408
1409 1409 /*
1410 1410 * Find a zfsvfs_t for a mounted filesystem, or create our own, in which
1411 1411 * case its z_vfs will be NULL, and it will be opened as the owner.
1412 1412 * If 'writer' is set, the z_teardown_lock will be held for RW_WRITER,
1413 1413 * which prevents all vnode ops from running.
1414 1414 */
1415 1415 static int
1416 1416 zfsvfs_hold(const char *name, void *tag, zfsvfs_t **zfvp, boolean_t writer)
1417 1417 {
1418 1418 int error = 0;
1419 1419
1420 1420 if (getzfsvfs(name, zfvp) != 0)
1421 1421 error = zfsvfs_create(name, zfvp);
1422 1422 if (error == 0) {
1423 1423 rrm_enter(&(*zfvp)->z_teardown_lock, (writer) ? RW_WRITER :
1424 1424 RW_READER, tag);
1425 1425 if ((*zfvp)->z_unmounted) {
1426 1426 /*
1427 1427 * XXX we could probably try again, since the unmounting
1428 1428 * thread should be just about to disassociate the
1429 1429 * objset from the zfsvfs.
1430 1430 */
1431 1431 rrm_exit(&(*zfvp)->z_teardown_lock, tag);
1432 1432 return (SET_ERROR(EBUSY));
1433 1433 }
1434 1434 }
1435 1435 return (error);
1436 1436 }
1437 1437
1438 1438 static void
1439 1439 zfsvfs_rele(zfsvfs_t *zfsvfs, void *tag)
1440 1440 {
1441 1441 rrm_exit(&zfsvfs->z_teardown_lock, tag);
1442 1442
1443 1443 if (zfsvfs->z_vfs) {
1444 1444 VFS_RELE(zfsvfs->z_vfs);
1445 1445 } else {
1446 1446 dmu_objset_disown(zfsvfs->z_os, zfsvfs);
1447 1447 zfsvfs_free(zfsvfs);
1448 1448 }
1449 1449 }
1450 1450
1451 1451 static int
1452 1452 zfs_ioc_pool_create(zfs_cmd_t *zc)
1453 1453 {
1454 1454 int error;
1455 1455 nvlist_t *config, *props = NULL;
1456 1456 nvlist_t *rootprops = NULL;
1457 1457 nvlist_t *zplprops = NULL;
1458 1458
1459 1459 if (error = get_nvlist(zc->zc_nvlist_conf, zc->zc_nvlist_conf_size,
1460 1460 zc->zc_iflags, &config))
1461 1461 return (error);
1462 1462
1463 1463 if (zc->zc_nvlist_src_size != 0 && (error =
1464 1464 get_nvlist(zc->zc_nvlist_src, zc->zc_nvlist_src_size,
1465 1465 zc->zc_iflags, &props))) {
1466 1466 nvlist_free(config);
1467 1467 return (error);
1468 1468 }
1469 1469
1470 1470 if (props) {
1471 1471 nvlist_t *nvl = NULL;
1472 1472 uint64_t version = SPA_VERSION;
1473 1473
1474 1474 (void) nvlist_lookup_uint64(props,
1475 1475 zpool_prop_to_name(ZPOOL_PROP_VERSION), &version);
1476 1476 if (!SPA_VERSION_IS_SUPPORTED(version)) {
1477 1477 error = SET_ERROR(EINVAL);
1478 1478 goto pool_props_bad;
1479 1479 }
1480 1480 (void) nvlist_lookup_nvlist(props, ZPOOL_ROOTFS_PROPS, &nvl);
1481 1481 if (nvl) {
1482 1482 error = nvlist_dup(nvl, &rootprops, KM_SLEEP);
1483 1483 if (error != 0) {
1484 1484 nvlist_free(config);
1485 1485 nvlist_free(props);
1486 1486 return (error);
1487 1487 }
1488 1488 (void) nvlist_remove_all(props, ZPOOL_ROOTFS_PROPS);
1489 1489 }
1490 1490 VERIFY(nvlist_alloc(&zplprops, NV_UNIQUE_NAME, KM_SLEEP) == 0);
1491 1491 error = zfs_fill_zplprops_root(version, rootprops,
1492 1492 zplprops, NULL);
1493 1493 if (error != 0)
1494 1494 goto pool_props_bad;
1495 1495 }
1496 1496
1497 1497 error = spa_create(zc->zc_name, config, props, zplprops);
1498 1498
1499 1499 /*
1500 1500 * Set the remaining root properties
1501 1501 */
1502 1502 if (!error && (error = zfs_set_prop_nvlist(zc->zc_name,
1503 1503 ZPROP_SRC_LOCAL, rootprops, NULL)) != 0)
1504 1504 (void) spa_destroy(zc->zc_name);
1505 1505
1506 1506 pool_props_bad:
1507 1507 nvlist_free(rootprops);
1508 1508 nvlist_free(zplprops);
1509 1509 nvlist_free(config);
1510 1510 nvlist_free(props);
1511 1511
1512 1512 return (error);
1513 1513 }
1514 1514
1515 1515 static int
1516 1516 zfs_ioc_pool_destroy(zfs_cmd_t *zc)
1517 1517 {
1518 1518 int error;
1519 1519 zfs_log_history(zc);
1520 1520 error = spa_destroy(zc->zc_name);
1521 1521 if (error == 0)
1522 1522 zvol_remove_minors(zc->zc_name);
1523 1523 return (error);
1524 1524 }
1525 1525
1526 1526 static int
1527 1527 zfs_ioc_pool_import(zfs_cmd_t *zc)
1528 1528 {
1529 1529 nvlist_t *config, *props = NULL;
1530 1530 uint64_t guid;
1531 1531 int error;
1532 1532
1533 1533 if ((error = get_nvlist(zc->zc_nvlist_conf, zc->zc_nvlist_conf_size,
1534 1534 zc->zc_iflags, &config)) != 0)
1535 1535 return (error);
1536 1536
1537 1537 if (zc->zc_nvlist_src_size != 0 && (error =
1538 1538 get_nvlist(zc->zc_nvlist_src, zc->zc_nvlist_src_size,
1539 1539 zc->zc_iflags, &props))) {
1540 1540 nvlist_free(config);
1541 1541 return (error);
1542 1542 }
1543 1543
1544 1544 if (nvlist_lookup_uint64(config, ZPOOL_CONFIG_POOL_GUID, &guid) != 0 ||
1545 1545 guid != zc->zc_guid)
1546 1546 error = SET_ERROR(EINVAL);
1547 1547 else
1548 1548 error = spa_import(zc->zc_name, config, props, zc->zc_cookie);
1549 1549
1550 1550 if (zc->zc_nvlist_dst != 0) {
1551 1551 int err;
1552 1552
1553 1553 if ((err = put_nvlist(zc, config)) != 0)
1554 1554 error = err;
1555 1555 }
1556 1556
1557 1557 nvlist_free(config);
1558 1558
1559 1559 if (props)
1560 1560 nvlist_free(props);
1561 1561
1562 1562 return (error);
1563 1563 }
1564 1564
1565 1565 static int
1566 1566 zfs_ioc_pool_export(zfs_cmd_t *zc)
1567 1567 {
1568 1568 int error;
1569 1569 boolean_t force = (boolean_t)zc->zc_cookie;
1570 1570 boolean_t hardforce = (boolean_t)zc->zc_guid;
1571 1571
1572 1572 zfs_log_history(zc);
1573 1573 error = spa_export(zc->zc_name, NULL, force, hardforce);
1574 1574 if (error == 0)
1575 1575 zvol_remove_minors(zc->zc_name);
1576 1576 return (error);
1577 1577 }
1578 1578
1579 1579 static int
1580 1580 zfs_ioc_pool_configs(zfs_cmd_t *zc)
1581 1581 {
1582 1582 nvlist_t *configs;
1583 1583 int error;
1584 1584
1585 1585 if ((configs = spa_all_configs(&zc->zc_cookie)) == NULL)
1586 1586 return (SET_ERROR(EEXIST));
1587 1587
1588 1588 error = put_nvlist(zc, configs);
1589 1589
1590 1590 nvlist_free(configs);
1591 1591
1592 1592 return (error);
1593 1593 }
1594 1594
1595 1595 /*
1596 1596 * inputs:
1597 1597 * zc_name name of the pool
1598 1598 *
1599 1599 * outputs:
1600 1600 * zc_cookie real errno
1601 1601 * zc_nvlist_dst config nvlist
1602 1602 * zc_nvlist_dst_size size of config nvlist
1603 1603 */
1604 1604 static int
1605 1605 zfs_ioc_pool_stats(zfs_cmd_t *zc)
1606 1606 {
1607 1607 nvlist_t *config;
1608 1608 int error;
1609 1609 int ret = 0;
1610 1610
1611 1611 error = spa_get_stats(zc->zc_name, &config, zc->zc_value,
1612 1612 sizeof (zc->zc_value));
1613 1613
1614 1614 if (config != NULL) {
1615 1615 ret = put_nvlist(zc, config);
1616 1616 nvlist_free(config);
1617 1617
1618 1618 /*
1619 1619 * The config may be present even if 'error' is non-zero.
1620 1620 * In this case we return success, and preserve the real errno
1621 1621 * in 'zc_cookie'.
1622 1622 */
1623 1623 zc->zc_cookie = error;
1624 1624 } else {
1625 1625 ret = error;
1626 1626 }
1627 1627
1628 1628 return (ret);
1629 1629 }
1630 1630
1631 1631 /*
1632 1632 * Try to import the given pool, returning pool stats as appropriate so that
1633 1633 * user land knows which devices are available and overall pool health.
1634 1634 */
1635 1635 static int
1636 1636 zfs_ioc_pool_tryimport(zfs_cmd_t *zc)
1637 1637 {
1638 1638 nvlist_t *tryconfig, *config;
1639 1639 int error;
1640 1640
1641 1641 if ((error = get_nvlist(zc->zc_nvlist_conf, zc->zc_nvlist_conf_size,
1642 1642 zc->zc_iflags, &tryconfig)) != 0)
1643 1643 return (error);
1644 1644
1645 1645 config = spa_tryimport(tryconfig);
1646 1646
1647 1647 nvlist_free(tryconfig);
1648 1648
1649 1649 if (config == NULL)
1650 1650 return (SET_ERROR(EINVAL));
1651 1651
1652 1652 error = put_nvlist(zc, config);
1653 1653 nvlist_free(config);
1654 1654
1655 1655 return (error);
1656 1656 }
1657 1657
1658 1658 /*
1659 1659 * inputs:
1660 1660 * zc_name name of the pool
1661 1661 * zc_cookie scan func (pool_scan_func_t)
1662 1662 */
1663 1663 static int
1664 1664 zfs_ioc_pool_scan(zfs_cmd_t *zc)
1665 1665 {
1666 1666 spa_t *spa;
1667 1667 int error;
1668 1668
1669 1669 if ((error = spa_open(zc->zc_name, &spa, FTAG)) != 0)
1670 1670 return (error);
1671 1671
1672 1672 if (zc->zc_cookie == POOL_SCAN_NONE)
1673 1673 error = spa_scan_stop(spa);
1674 1674 else
1675 1675 error = spa_scan(spa, zc->zc_cookie);
1676 1676
1677 1677 spa_close(spa, FTAG);
1678 1678
1679 1679 return (error);
1680 1680 }
1681 1681
1682 1682 static int
1683 1683 zfs_ioc_pool_freeze(zfs_cmd_t *zc)
1684 1684 {
1685 1685 spa_t *spa;
1686 1686 int error;
1687 1687
1688 1688 error = spa_open(zc->zc_name, &spa, FTAG);
1689 1689 if (error == 0) {
1690 1690 spa_freeze(spa);
1691 1691 spa_close(spa, FTAG);
1692 1692 }
1693 1693 return (error);
1694 1694 }
1695 1695
1696 1696 static int
1697 1697 zfs_ioc_pool_upgrade(zfs_cmd_t *zc)
1698 1698 {
1699 1699 spa_t *spa;
1700 1700 int error;
1701 1701
1702 1702 if ((error = spa_open(zc->zc_name, &spa, FTAG)) != 0)
1703 1703 return (error);
1704 1704
1705 1705 if (zc->zc_cookie < spa_version(spa) ||
1706 1706 !SPA_VERSION_IS_SUPPORTED(zc->zc_cookie)) {
1707 1707 spa_close(spa, FTAG);
1708 1708 return (SET_ERROR(EINVAL));
1709 1709 }
1710 1710
1711 1711 spa_upgrade(spa, zc->zc_cookie);
1712 1712 spa_close(spa, FTAG);
1713 1713
1714 1714 return (error);
1715 1715 }
1716 1716
1717 1717 static int
1718 1718 zfs_ioc_pool_get_history(zfs_cmd_t *zc)
1719 1719 {
1720 1720 spa_t *spa;
1721 1721 char *hist_buf;
1722 1722 uint64_t size;
1723 1723 int error;
1724 1724
1725 1725 if ((size = zc->zc_history_len) == 0)
1726 1726 return (SET_ERROR(EINVAL));
1727 1727
1728 1728 if ((error = spa_open(zc->zc_name, &spa, FTAG)) != 0)
1729 1729 return (error);
1730 1730
1731 1731 if (spa_version(spa) < SPA_VERSION_ZPOOL_HISTORY) {
1732 1732 spa_close(spa, FTAG);
1733 1733 return (SET_ERROR(ENOTSUP));
1734 1734 }
1735 1735
1736 1736 hist_buf = kmem_alloc(size, KM_SLEEP);
1737 1737 if ((error = spa_history_get(spa, &zc->zc_history_offset,
1738 1738 &zc->zc_history_len, hist_buf)) == 0) {
1739 1739 error = ddi_copyout(hist_buf,
1740 1740 (void *)(uintptr_t)zc->zc_history,
1741 1741 zc->zc_history_len, zc->zc_iflags);
1742 1742 }
1743 1743
1744 1744 spa_close(spa, FTAG);
1745 1745 kmem_free(hist_buf, size);
1746 1746 return (error);
1747 1747 }
1748 1748
1749 1749 static int
1750 1750 zfs_ioc_pool_reguid(zfs_cmd_t *zc)
1751 1751 {
1752 1752 spa_t *spa;
1753 1753 int error;
1754 1754
1755 1755 error = spa_open(zc->zc_name, &spa, FTAG);
1756 1756 if (error == 0) {
1757 1757 error = spa_change_guid(spa);
1758 1758 spa_close(spa, FTAG);
1759 1759 }
1760 1760 return (error);
1761 1761 }
1762 1762
1763 1763 static int
1764 1764 zfs_ioc_dsobj_to_dsname(zfs_cmd_t *zc)
1765 1765 {
1766 1766 return (dsl_dsobj_to_dsname(zc->zc_name, zc->zc_obj, zc->zc_value));
1767 1767 }
1768 1768
1769 1769 /*
1770 1770 * inputs:
1771 1771 * zc_name name of filesystem
1772 1772 * zc_obj object to find
1773 1773 *
1774 1774 * outputs:
1775 1775 * zc_value name of object
1776 1776 */
1777 1777 static int
1778 1778 zfs_ioc_obj_to_path(zfs_cmd_t *zc)
1779 1779 {
1780 1780 objset_t *os;
1781 1781 int error;
1782 1782
1783 1783 /* XXX reading from objset not owned */
1784 1784 if ((error = dmu_objset_hold(zc->zc_name, FTAG, &os)) != 0)
1785 1785 return (error);
1786 1786 if (dmu_objset_type(os) != DMU_OST_ZFS) {
1787 1787 dmu_objset_rele(os, FTAG);
1788 1788 return (SET_ERROR(EINVAL));
1789 1789 }
1790 1790 error = zfs_obj_to_path(os, zc->zc_obj, zc->zc_value,
1791 1791 sizeof (zc->zc_value));
1792 1792 dmu_objset_rele(os, FTAG);
1793 1793
1794 1794 return (error);
1795 1795 }
1796 1796
1797 1797 /*
1798 1798 * inputs:
1799 1799 * zc_name name of filesystem
1800 1800 * zc_obj object to find
1801 1801 *
1802 1802 * outputs:
1803 1803 * zc_stat stats on object
1804 1804 * zc_value path to object
1805 1805 */
1806 1806 static int
1807 1807 zfs_ioc_obj_to_stats(zfs_cmd_t *zc)
1808 1808 {
1809 1809 objset_t *os;
1810 1810 int error;
1811 1811
1812 1812 /* XXX reading from objset not owned */
1813 1813 if ((error = dmu_objset_hold(zc->zc_name, FTAG, &os)) != 0)
1814 1814 return (error);
1815 1815 if (dmu_objset_type(os) != DMU_OST_ZFS) {
1816 1816 dmu_objset_rele(os, FTAG);
1817 1817 return (SET_ERROR(EINVAL));
1818 1818 }
1819 1819 error = zfs_obj_to_stats(os, zc->zc_obj, &zc->zc_stat, zc->zc_value,
1820 1820 sizeof (zc->zc_value));
1821 1821 dmu_objset_rele(os, FTAG);
1822 1822
1823 1823 return (error);
1824 1824 }
1825 1825
1826 1826 static int
1827 1827 zfs_ioc_vdev_add(zfs_cmd_t *zc)
1828 1828 {
1829 1829 spa_t *spa;
1830 1830 int error;
1831 1831 nvlist_t *config, **l2cache, **spares;
1832 1832 uint_t nl2cache = 0, nspares = 0;
1833 1833
1834 1834 error = spa_open(zc->zc_name, &spa, FTAG);
1835 1835 if (error != 0)
1836 1836 return (error);
1837 1837
1838 1838 error = get_nvlist(zc->zc_nvlist_conf, zc->zc_nvlist_conf_size,
1839 1839 zc->zc_iflags, &config);
1840 1840 (void) nvlist_lookup_nvlist_array(config, ZPOOL_CONFIG_L2CACHE,
1841 1841 &l2cache, &nl2cache);
1842 1842
1843 1843 (void) nvlist_lookup_nvlist_array(config, ZPOOL_CONFIG_SPARES,
1844 1844 &spares, &nspares);
1845 1845
1846 1846 /*
1847 1847 * A root pool with concatenated devices is not supported.
1848 1848 * Thus, can not add a device to a root pool.
1849 1849 *
1850 1850 * Intent log device can not be added to a rootpool because
1851 1851 * during mountroot, zil is replayed, a seperated log device
1852 1852 * can not be accessed during the mountroot time.
1853 1853 *
1854 1854 * l2cache and spare devices are ok to be added to a rootpool.
1855 1855 */
1856 1856 if (spa_bootfs(spa) != 0 && nl2cache == 0 && nspares == 0) {
1857 1857 nvlist_free(config);
1858 1858 spa_close(spa, FTAG);
1859 1859 return (SET_ERROR(EDOM));
1860 1860 }
1861 1861
1862 1862 if (error == 0) {
1863 1863 error = spa_vdev_add(spa, config);
1864 1864 nvlist_free(config);
1865 1865 }
1866 1866 spa_close(spa, FTAG);
1867 1867 return (error);
1868 1868 }
1869 1869
1870 1870 /*
1871 1871 * inputs:
1872 1872 * zc_name name of the pool
1873 1873 * zc_nvlist_conf nvlist of devices to remove
1874 1874 * zc_cookie to stop the remove?
1875 1875 */
1876 1876 static int
1877 1877 zfs_ioc_vdev_remove(zfs_cmd_t *zc)
1878 1878 {
1879 1879 spa_t *spa;
1880 1880 int error;
1881 1881
1882 1882 error = spa_open(zc->zc_name, &spa, FTAG);
1883 1883 if (error != 0)
1884 1884 return (error);
1885 1885 error = spa_vdev_remove(spa, zc->zc_guid, B_FALSE);
1886 1886 spa_close(spa, FTAG);
1887 1887 return (error);
1888 1888 }
1889 1889
1890 1890 static int
1891 1891 zfs_ioc_vdev_set_state(zfs_cmd_t *zc)
1892 1892 {
1893 1893 spa_t *spa;
1894 1894 int error;
1895 1895 vdev_state_t newstate = VDEV_STATE_UNKNOWN;
1896 1896
1897 1897 if ((error = spa_open(zc->zc_name, &spa, FTAG)) != 0)
1898 1898 return (error);
1899 1899 switch (zc->zc_cookie) {
1900 1900 case VDEV_STATE_ONLINE:
1901 1901 error = vdev_online(spa, zc->zc_guid, zc->zc_obj, &newstate);
1902 1902 break;
1903 1903
1904 1904 case VDEV_STATE_OFFLINE:
1905 1905 error = vdev_offline(spa, zc->zc_guid, zc->zc_obj);
1906 1906 break;
1907 1907
1908 1908 case VDEV_STATE_FAULTED:
1909 1909 if (zc->zc_obj != VDEV_AUX_ERR_EXCEEDED &&
1910 1910 zc->zc_obj != VDEV_AUX_EXTERNAL)
1911 1911 zc->zc_obj = VDEV_AUX_ERR_EXCEEDED;
1912 1912
1913 1913 error = vdev_fault(spa, zc->zc_guid, zc->zc_obj);
1914 1914 break;
1915 1915
1916 1916 case VDEV_STATE_DEGRADED:
1917 1917 if (zc->zc_obj != VDEV_AUX_ERR_EXCEEDED &&
1918 1918 zc->zc_obj != VDEV_AUX_EXTERNAL)
1919 1919 zc->zc_obj = VDEV_AUX_ERR_EXCEEDED;
1920 1920
1921 1921 error = vdev_degrade(spa, zc->zc_guid, zc->zc_obj);
1922 1922 break;
1923 1923
1924 1924 default:
1925 1925 error = SET_ERROR(EINVAL);
1926 1926 }
1927 1927 zc->zc_cookie = newstate;
1928 1928 spa_close(spa, FTAG);
1929 1929 return (error);
1930 1930 }
1931 1931
1932 1932 static int
1933 1933 zfs_ioc_vdev_attach(zfs_cmd_t *zc)
1934 1934 {
1935 1935 spa_t *spa;
1936 1936 int replacing = zc->zc_cookie;
1937 1937 nvlist_t *config;
1938 1938 int error;
1939 1939
1940 1940 if ((error = spa_open(zc->zc_name, &spa, FTAG)) != 0)
1941 1941 return (error);
1942 1942
1943 1943 if ((error = get_nvlist(zc->zc_nvlist_conf, zc->zc_nvlist_conf_size,
1944 1944 zc->zc_iflags, &config)) == 0) {
1945 1945 error = spa_vdev_attach(spa, zc->zc_guid, config, replacing);
1946 1946 nvlist_free(config);
1947 1947 }
1948 1948
1949 1949 spa_close(spa, FTAG);
1950 1950 return (error);
1951 1951 }
1952 1952
1953 1953 static int
1954 1954 zfs_ioc_vdev_detach(zfs_cmd_t *zc)
1955 1955 {
1956 1956 spa_t *spa;
1957 1957 int error;
1958 1958
1959 1959 if ((error = spa_open(zc->zc_name, &spa, FTAG)) != 0)
1960 1960 return (error);
1961 1961
1962 1962 error = spa_vdev_detach(spa, zc->zc_guid, 0, B_FALSE);
1963 1963
1964 1964 spa_close(spa, FTAG);
1965 1965 return (error);
1966 1966 }
1967 1967
1968 1968 static int
1969 1969 zfs_ioc_vdev_split(zfs_cmd_t *zc)
1970 1970 {
1971 1971 spa_t *spa;
1972 1972 nvlist_t *config, *props = NULL;
1973 1973 int error;
1974 1974 boolean_t exp = !!(zc->zc_cookie & ZPOOL_EXPORT_AFTER_SPLIT);
1975 1975
1976 1976 if ((error = spa_open(zc->zc_name, &spa, FTAG)) != 0)
1977 1977 return (error);
1978 1978
1979 1979 if (error = get_nvlist(zc->zc_nvlist_conf, zc->zc_nvlist_conf_size,
1980 1980 zc->zc_iflags, &config)) {
1981 1981 spa_close(spa, FTAG);
1982 1982 return (error);
1983 1983 }
1984 1984
1985 1985 if (zc->zc_nvlist_src_size != 0 && (error =
1986 1986 get_nvlist(zc->zc_nvlist_src, zc->zc_nvlist_src_size,
1987 1987 zc->zc_iflags, &props))) {
1988 1988 spa_close(spa, FTAG);
1989 1989 nvlist_free(config);
1990 1990 return (error);
1991 1991 }
1992 1992
1993 1993 error = spa_vdev_split_mirror(spa, zc->zc_string, config, props, exp);
1994 1994
1995 1995 spa_close(spa, FTAG);
1996 1996
1997 1997 nvlist_free(config);
1998 1998 nvlist_free(props);
1999 1999
2000 2000 return (error);
2001 2001 }
2002 2002
2003 2003 static int
2004 2004 zfs_ioc_vdev_setpath(zfs_cmd_t *zc)
2005 2005 {
2006 2006 spa_t *spa;
2007 2007 char *path = zc->zc_value;
2008 2008 uint64_t guid = zc->zc_guid;
2009 2009 int error;
2010 2010
2011 2011 error = spa_open(zc->zc_name, &spa, FTAG);
2012 2012 if (error != 0)
2013 2013 return (error);
2014 2014
2015 2015 error = spa_vdev_setpath(spa, guid, path);
2016 2016 spa_close(spa, FTAG);
2017 2017 return (error);
2018 2018 }
2019 2019
2020 2020 static int
2021 2021 zfs_ioc_vdev_setfru(zfs_cmd_t *zc)
2022 2022 {
2023 2023 spa_t *spa;
2024 2024 char *fru = zc->zc_value;
2025 2025 uint64_t guid = zc->zc_guid;
2026 2026 int error;
2027 2027
2028 2028 error = spa_open(zc->zc_name, &spa, FTAG);
2029 2029 if (error != 0)
2030 2030 return (error);
2031 2031
2032 2032 error = spa_vdev_setfru(spa, guid, fru);
2033 2033 spa_close(spa, FTAG);
2034 2034 return (error);
2035 2035 }
2036 2036
2037 2037 static int
2038 2038 zfs_ioc_objset_stats_impl(zfs_cmd_t *zc, objset_t *os)
2039 2039 {
2040 2040 int error = 0;
2041 2041 nvlist_t *nv;
2042 2042
2043 2043 dmu_objset_fast_stat(os, &zc->zc_objset_stats);
2044 2044
2045 2045 if (zc->zc_nvlist_dst != 0 &&
2046 2046 (error = dsl_prop_get_all(os, &nv)) == 0) {
2047 2047 dmu_objset_stats(os, nv);
2048 2048 /*
2049 2049 * NB: zvol_get_stats() will read the objset contents,
2050 2050 * which we aren't supposed to do with a
2051 2051 * DS_MODE_USER hold, because it could be
2052 2052 * inconsistent. So this is a bit of a workaround...
2053 2053 * XXX reading with out owning
2054 2054 */
2055 2055 if (!zc->zc_objset_stats.dds_inconsistent &&
2056 2056 dmu_objset_type(os) == DMU_OST_ZVOL) {
2057 2057 error = zvol_get_stats(os, nv);
2058 2058 if (error == EIO)
2059 2059 return (error);
2060 2060 VERIFY0(error);
2061 2061 }
2062 2062 error = put_nvlist(zc, nv);
2063 2063 nvlist_free(nv);
2064 2064 }
2065 2065
2066 2066 return (error);
2067 2067 }
2068 2068
2069 2069 /*
2070 2070 * inputs:
2071 2071 * zc_name name of filesystem
2072 2072 * zc_nvlist_dst_size size of buffer for property nvlist
2073 2073 *
2074 2074 * outputs:
2075 2075 * zc_objset_stats stats
2076 2076 * zc_nvlist_dst property nvlist
2077 2077 * zc_nvlist_dst_size size of property nvlist
2078 2078 */
2079 2079 static int
2080 2080 zfs_ioc_objset_stats(zfs_cmd_t *zc)
2081 2081 {
2082 2082 objset_t *os;
2083 2083 int error;
2084 2084
2085 2085 error = dmu_objset_hold(zc->zc_name, FTAG, &os);
2086 2086 if (error == 0) {
2087 2087 error = zfs_ioc_objset_stats_impl(zc, os);
2088 2088 dmu_objset_rele(os, FTAG);
2089 2089 }
2090 2090
2091 2091 return (error);
2092 2092 }
2093 2093
2094 2094 /*
2095 2095 * inputs:
2096 2096 * zc_name name of filesystem
2097 2097 * zc_nvlist_dst_size size of buffer for property nvlist
2098 2098 *
2099 2099 * outputs:
2100 2100 * zc_nvlist_dst received property nvlist
2101 2101 * zc_nvlist_dst_size size of received property nvlist
2102 2102 *
2103 2103 * Gets received properties (distinct from local properties on or after
2104 2104 * SPA_VERSION_RECVD_PROPS) for callers who want to differentiate received from
2105 2105 * local property values.
2106 2106 */
2107 2107 static int
2108 2108 zfs_ioc_objset_recvd_props(zfs_cmd_t *zc)
2109 2109 {
2110 2110 int error = 0;
2111 2111 nvlist_t *nv;
2112 2112
2113 2113 /*
2114 2114 * Without this check, we would return local property values if the
2115 2115 * caller has not already received properties on or after
2116 2116 * SPA_VERSION_RECVD_PROPS.
2117 2117 */
2118 2118 if (!dsl_prop_get_hasrecvd(zc->zc_name))
2119 2119 return (SET_ERROR(ENOTSUP));
2120 2120
2121 2121 if (zc->zc_nvlist_dst != 0 &&
2122 2122 (error = dsl_prop_get_received(zc->zc_name, &nv)) == 0) {
2123 2123 error = put_nvlist(zc, nv);
2124 2124 nvlist_free(nv);
2125 2125 }
2126 2126
2127 2127 return (error);
2128 2128 }
2129 2129
2130 2130 static int
2131 2131 nvl_add_zplprop(objset_t *os, nvlist_t *props, zfs_prop_t prop)
2132 2132 {
2133 2133 uint64_t value;
2134 2134 int error;
2135 2135
2136 2136 /*
2137 2137 * zfs_get_zplprop() will either find a value or give us
2138 2138 * the default value (if there is one).
2139 2139 */
2140 2140 if ((error = zfs_get_zplprop(os, prop, &value)) != 0)
2141 2141 return (error);
2142 2142 VERIFY(nvlist_add_uint64(props, zfs_prop_to_name(prop), value) == 0);
2143 2143 return (0);
2144 2144 }
2145 2145
2146 2146 /*
2147 2147 * inputs:
2148 2148 * zc_name name of filesystem
2149 2149 * zc_nvlist_dst_size size of buffer for zpl property nvlist
2150 2150 *
2151 2151 * outputs:
2152 2152 * zc_nvlist_dst zpl property nvlist
2153 2153 * zc_nvlist_dst_size size of zpl property nvlist
2154 2154 */
2155 2155 static int
2156 2156 zfs_ioc_objset_zplprops(zfs_cmd_t *zc)
2157 2157 {
2158 2158 objset_t *os;
2159 2159 int err;
2160 2160
2161 2161 /* XXX reading without owning */
2162 2162 if (err = dmu_objset_hold(zc->zc_name, FTAG, &os))
2163 2163 return (err);
2164 2164
2165 2165 dmu_objset_fast_stat(os, &zc->zc_objset_stats);
2166 2166
2167 2167 /*
2168 2168 * NB: nvl_add_zplprop() will read the objset contents,
2169 2169 * which we aren't supposed to do with a DS_MODE_USER
2170 2170 * hold, because it could be inconsistent.
2171 2171 */
2172 2172 if (zc->zc_nvlist_dst != NULL &&
2173 2173 !zc->zc_objset_stats.dds_inconsistent &&
2174 2174 dmu_objset_type(os) == DMU_OST_ZFS) {
2175 2175 nvlist_t *nv;
2176 2176
2177 2177 VERIFY(nvlist_alloc(&nv, NV_UNIQUE_NAME, KM_SLEEP) == 0);
2178 2178 if ((err = nvl_add_zplprop(os, nv, ZFS_PROP_VERSION)) == 0 &&
2179 2179 (err = nvl_add_zplprop(os, nv, ZFS_PROP_NORMALIZE)) == 0 &&
2180 2180 (err = nvl_add_zplprop(os, nv, ZFS_PROP_UTF8ONLY)) == 0 &&
2181 2181 (err = nvl_add_zplprop(os, nv, ZFS_PROP_CASE)) == 0)
2182 2182 err = put_nvlist(zc, nv);
2183 2183 nvlist_free(nv);
2184 2184 } else {
2185 2185 err = SET_ERROR(ENOENT);
2186 2186 }
2187 2187 dmu_objset_rele(os, FTAG);
2188 2188 return (err);
2189 2189 }
2190 2190
2191 2191 static boolean_t
2192 2192 dataset_name_hidden(const char *name)
2193 2193 {
2194 2194 /*
2195 2195 * Skip over datasets that are not visible in this zone,
2196 2196 * internal datasets (which have a $ in their name), and
2197 2197 * temporary datasets (which have a % in their name).
2198 2198 */
2199 2199 if (strchr(name, '$') != NULL)
2200 2200 return (B_TRUE);
2201 2201 if (strchr(name, '%') != NULL)
2202 2202 return (B_TRUE);
2203 2203 if (!INGLOBALZONE(curproc) && !zone_dataset_visible(name, NULL))
2204 2204 return (B_TRUE);
2205 2205 return (B_FALSE);
2206 2206 }
2207 2207
2208 2208 /*
2209 2209 * inputs:
2210 2210 * zc_name name of filesystem
2211 2211 * zc_cookie zap cursor
2212 2212 * zc_nvlist_dst_size size of buffer for property nvlist
2213 2213 *
2214 2214 * outputs:
2215 2215 * zc_name name of next filesystem
2216 2216 * zc_cookie zap cursor
2217 2217 * zc_objset_stats stats
2218 2218 * zc_nvlist_dst property nvlist
2219 2219 * zc_nvlist_dst_size size of property nvlist
2220 2220 */
2221 2221 static int
2222 2222 zfs_ioc_dataset_list_next(zfs_cmd_t *zc)
2223 2223 {
2224 2224 objset_t *os;
2225 2225 int error;
2226 2226 char *p;
2227 2227 size_t orig_len = strlen(zc->zc_name);
2228 2228
2229 2229 top:
2230 2230 if (error = dmu_objset_hold(zc->zc_name, FTAG, &os)) {
2231 2231 if (error == ENOENT)
2232 2232 error = SET_ERROR(ESRCH);
2233 2233 return (error);
2234 2234 }
2235 2235
2236 2236 p = strrchr(zc->zc_name, '/');
2237 2237 if (p == NULL || p[1] != '\0')
2238 2238 (void) strlcat(zc->zc_name, "/", sizeof (zc->zc_name));
2239 2239 p = zc->zc_name + strlen(zc->zc_name);
2240 2240
2241 2241 do {
2242 2242 error = dmu_dir_list_next(os,
2243 2243 sizeof (zc->zc_name) - (p - zc->zc_name), p,
2244 2244 NULL, &zc->zc_cookie);
2245 2245 if (error == ENOENT)
2246 2246 error = SET_ERROR(ESRCH);
2247 2247 } while (error == 0 && dataset_name_hidden(zc->zc_name));
2248 2248 dmu_objset_rele(os, FTAG);
2249 2249
2250 2250 /*
2251 2251 * If it's an internal dataset (ie. with a '$' in its name),
2252 2252 * don't try to get stats for it, otherwise we'll return ENOENT.
2253 2253 */
2254 2254 if (error == 0 && strchr(zc->zc_name, '$') == NULL) {
2255 2255 error = zfs_ioc_objset_stats(zc); /* fill in the stats */
2256 2256 if (error == ENOENT) {
2257 2257 /* We lost a race with destroy, get the next one. */
2258 2258 zc->zc_name[orig_len] = '\0';
2259 2259 goto top;
2260 2260 }
2261 2261 }
2262 2262 return (error);
2263 2263 }
2264 2264
2265 2265 /*
2266 2266 * inputs:
2267 2267 * zc_name name of filesystem
2268 2268 * zc_cookie zap cursor
2269 2269 * zc_nvlist_dst_size size of buffer for property nvlist
2270 2270 *
2271 2271 * outputs:
2272 2272 * zc_name name of next snapshot
2273 2273 * zc_objset_stats stats
2274 2274 * zc_nvlist_dst property nvlist
2275 2275 * zc_nvlist_dst_size size of property nvlist
2276 2276 */
2277 2277 static int
2278 2278 zfs_ioc_snapshot_list_next(zfs_cmd_t *zc)
2279 2279 {
2280 2280 objset_t *os;
2281 2281 int error;
2282 2282
2283 2283 error = dmu_objset_hold(zc->zc_name, FTAG, &os);
2284 2284 if (error != 0) {
2285 2285 return (error == ENOENT ? ESRCH : error);
2286 2286 }
2287 2287
2288 2288 /*
2289 2289 * A dataset name of maximum length cannot have any snapshots,
2290 2290 * so exit immediately.
2291 2291 */
2292 2292 if (strlcat(zc->zc_name, "@", sizeof (zc->zc_name)) >= MAXNAMELEN) {
2293 2293 dmu_objset_rele(os, FTAG);
2294 2294 return (SET_ERROR(ESRCH));
2295 2295 }
2296 2296
2297 2297 error = dmu_snapshot_list_next(os,
2298 2298 sizeof (zc->zc_name) - strlen(zc->zc_name),
2299 2299 zc->zc_name + strlen(zc->zc_name), &zc->zc_obj, &zc->zc_cookie,
2300 2300 NULL);
2301 2301
2302 2302 if (error == 0) {
2303 2303 dsl_dataset_t *ds;
2304 2304 dsl_pool_t *dp = os->os_dsl_dataset->ds_dir->dd_pool;
2305 2305
2306 2306 error = dsl_dataset_hold_obj(dp, zc->zc_obj, FTAG, &ds);
2307 2307 if (error == 0) {
2308 2308 objset_t *ossnap;
2309 2309
2310 2310 error = dmu_objset_from_ds(ds, &ossnap);
2311 2311 if (error == 0)
2312 2312 error = zfs_ioc_objset_stats_impl(zc, ossnap);
2313 2313 dsl_dataset_rele(ds, FTAG);
2314 2314 }
2315 2315 } else if (error == ENOENT) {
2316 2316 error = SET_ERROR(ESRCH);
2317 2317 }
2318 2318
2319 2319 dmu_objset_rele(os, FTAG);
2320 2320 /* if we failed, undo the @ that we tacked on to zc_name */
2321 2321 if (error != 0)
2322 2322 *strchr(zc->zc_name, '@') = '\0';
2323 2323 return (error);
2324 2324 }
2325 2325
2326 2326 static int
2327 2327 zfs_prop_set_userquota(const char *dsname, nvpair_t *pair)
2328 2328 {
2329 2329 const char *propname = nvpair_name(pair);
2330 2330 uint64_t *valary;
2331 2331 unsigned int vallen;
2332 2332 const char *domain;
2333 2333 char *dash;
2334 2334 zfs_userquota_prop_t type;
2335 2335 uint64_t rid;
2336 2336 uint64_t quota;
2337 2337 zfsvfs_t *zfsvfs;
2338 2338 int err;
2339 2339
2340 2340 if (nvpair_type(pair) == DATA_TYPE_NVLIST) {
2341 2341 nvlist_t *attrs;
2342 2342 VERIFY(nvpair_value_nvlist(pair, &attrs) == 0);
2343 2343 if (nvlist_lookup_nvpair(attrs, ZPROP_VALUE,
2344 2344 &pair) != 0)
2345 2345 return (SET_ERROR(EINVAL));
2346 2346 }
2347 2347
2348 2348 /*
2349 2349 * A correctly constructed propname is encoded as
2350 2350 * userquota@<rid>-<domain>.
2351 2351 */
2352 2352 if ((dash = strchr(propname, '-')) == NULL ||
2353 2353 nvpair_value_uint64_array(pair, &valary, &vallen) != 0 ||
2354 2354 vallen != 3)
2355 2355 return (SET_ERROR(EINVAL));
2356 2356
2357 2357 domain = dash + 1;
2358 2358 type = valary[0];
2359 2359 rid = valary[1];
2360 2360 quota = valary[2];
2361 2361
2362 2362 err = zfsvfs_hold(dsname, FTAG, &zfsvfs, B_FALSE);
2363 2363 if (err == 0) {
2364 2364 err = zfs_set_userquota(zfsvfs, type, domain, rid, quota);
2365 2365 zfsvfs_rele(zfsvfs, FTAG);
2366 2366 }
2367 2367
2368 2368 return (err);
2369 2369 }
2370 2370
2371 2371 /*
2372 2372 * If the named property is one that has a special function to set its value,
2373 2373 * return 0 on success and a positive error code on failure; otherwise if it is
2374 2374 * not one of the special properties handled by this function, return -1.
2375 2375 *
2376 2376 * XXX: It would be better for callers of the property interface if we handled
2377 2377 * these special cases in dsl_prop.c (in the dsl layer).
2378 2378 */
2379 2379 static int
2380 2380 zfs_prop_set_special(const char *dsname, zprop_source_t source,
2381 2381 nvpair_t *pair)
2382 2382 {
2383 2383 const char *propname = nvpair_name(pair);
2384 2384 zfs_prop_t prop = zfs_name_to_prop(propname);
2385 2385 uint64_t intval;
2386 2386 int err = -1;
2387 2387
2388 2388 if (prop == ZPROP_INVAL) {
2389 2389 if (zfs_prop_userquota(propname))
2390 2390 return (zfs_prop_set_userquota(dsname, pair));
2391 2391 return (-1);
2392 2392 }
2393 2393
2394 2394 if (nvpair_type(pair) == DATA_TYPE_NVLIST) {
2395 2395 nvlist_t *attrs;
2396 2396 VERIFY(nvpair_value_nvlist(pair, &attrs) == 0);
↓ open down ↓ |
2396 lines elided |
↑ open up ↑ |
2397 2397 VERIFY(nvlist_lookup_nvpair(attrs, ZPROP_VALUE,
2398 2398 &pair) == 0);
2399 2399 }
2400 2400
2401 2401 if (zfs_prop_get_type(prop) == PROP_TYPE_STRING)
2402 2402 return (-1);
2403 2403
2404 2404 VERIFY(0 == nvpair_value_uint64(pair, &intval));
2405 2405
2406 2406 switch (prop) {
2407 + case ZFS_PROP_FSID_GUID:
2408 + err = dsl_dataset_set_fsid_guid(dsname, source, intval);
2409 + break;
2407 2410 case ZFS_PROP_QUOTA:
2408 2411 err = dsl_dir_set_quota(dsname, source, intval);
2409 2412 break;
2410 2413 case ZFS_PROP_REFQUOTA:
2411 2414 err = dsl_dataset_set_refquota(dsname, source, intval);
2412 2415 break;
2413 2416 case ZFS_PROP_FILESYSTEM_LIMIT:
2414 2417 case ZFS_PROP_SNAPSHOT_LIMIT:
2415 2418 if (intval == UINT64_MAX) {
2416 2419 /* clearing the limit, just do it */
2417 2420 err = 0;
2418 2421 } else {
2419 2422 err = dsl_dir_activate_fs_ss_limit(dsname);
2420 2423 }
2421 2424 /*
2422 2425 * Set err to -1 to force the zfs_set_prop_nvlist code down the
2423 2426 * default path to set the value in the nvlist.
2424 2427 */
2425 2428 if (err == 0)
2426 2429 err = -1;
2427 2430 break;
2428 2431 case ZFS_PROP_RESERVATION:
2429 2432 err = dsl_dir_set_reservation(dsname, source, intval);
2430 2433 break;
2431 2434 case ZFS_PROP_REFRESERVATION:
2432 2435 err = dsl_dataset_set_refreservation(dsname, source, intval);
2433 2436 break;
2434 2437 case ZFS_PROP_VOLSIZE:
2435 2438 err = zvol_set_volsize(dsname, intval);
2436 2439 break;
2437 2440 case ZFS_PROP_VERSION:
2438 2441 {
2439 2442 zfsvfs_t *zfsvfs;
2440 2443
2441 2444 if ((err = zfsvfs_hold(dsname, FTAG, &zfsvfs, B_TRUE)) != 0)
2442 2445 break;
2443 2446
2444 2447 err = zfs_set_version(zfsvfs, intval);
2445 2448 zfsvfs_rele(zfsvfs, FTAG);
2446 2449
2447 2450 if (err == 0 && intval >= ZPL_VERSION_USERSPACE) {
2448 2451 zfs_cmd_t *zc;
2449 2452
2450 2453 zc = kmem_zalloc(sizeof (zfs_cmd_t), KM_SLEEP);
2451 2454 (void) strcpy(zc->zc_name, dsname);
2452 2455 (void) zfs_ioc_userspace_upgrade(zc);
2453 2456 kmem_free(zc, sizeof (zfs_cmd_t));
2454 2457 }
2455 2458 break;
2456 2459 }
2457 2460 default:
2458 2461 err = -1;
2459 2462 }
2460 2463
2461 2464 return (err);
2462 2465 }
2463 2466
2464 2467 /*
2465 2468 * This function is best effort. If it fails to set any of the given properties,
2466 2469 * it continues to set as many as it can and returns the last error
2467 2470 * encountered. If the caller provides a non-NULL errlist, it will be filled in
2468 2471 * with the list of names of all the properties that failed along with the
2469 2472 * corresponding error numbers.
2470 2473 *
2471 2474 * If every property is set successfully, zero is returned and errlist is not
2472 2475 * modified.
2473 2476 */
2474 2477 int
2475 2478 zfs_set_prop_nvlist(const char *dsname, zprop_source_t source, nvlist_t *nvl,
2476 2479 nvlist_t *errlist)
2477 2480 {
2478 2481 nvpair_t *pair;
2479 2482 nvpair_t *propval;
2480 2483 int rv = 0;
2481 2484 uint64_t intval;
2482 2485 char *strval;
2483 2486 nvlist_t *genericnvl = fnvlist_alloc();
2484 2487 nvlist_t *retrynvl = fnvlist_alloc();
2485 2488
2486 2489 retry:
2487 2490 pair = NULL;
2488 2491 while ((pair = nvlist_next_nvpair(nvl, pair)) != NULL) {
2489 2492 const char *propname = nvpair_name(pair);
2490 2493 zfs_prop_t prop = zfs_name_to_prop(propname);
2491 2494 int err = 0;
2492 2495
2493 2496 /* decode the property value */
2494 2497 propval = pair;
2495 2498 if (nvpair_type(pair) == DATA_TYPE_NVLIST) {
2496 2499 nvlist_t *attrs;
2497 2500 attrs = fnvpair_value_nvlist(pair);
2498 2501 if (nvlist_lookup_nvpair(attrs, ZPROP_VALUE,
2499 2502 &propval) != 0)
2500 2503 err = SET_ERROR(EINVAL);
2501 2504 }
2502 2505
2503 2506 /* Validate value type */
2504 2507 if (err == 0 && prop == ZPROP_INVAL) {
2505 2508 if (zfs_prop_user(propname)) {
2506 2509 if (nvpair_type(propval) != DATA_TYPE_STRING)
2507 2510 err = SET_ERROR(EINVAL);
2508 2511 } else if (zfs_prop_userquota(propname)) {
2509 2512 if (nvpair_type(propval) !=
2510 2513 DATA_TYPE_UINT64_ARRAY)
2511 2514 err = SET_ERROR(EINVAL);
2512 2515 } else {
2513 2516 err = SET_ERROR(EINVAL);
2514 2517 }
2515 2518 } else if (err == 0) {
2516 2519 if (nvpair_type(propval) == DATA_TYPE_STRING) {
2517 2520 if (zfs_prop_get_type(prop) != PROP_TYPE_STRING)
2518 2521 err = SET_ERROR(EINVAL);
2519 2522 } else if (nvpair_type(propval) == DATA_TYPE_UINT64) {
2520 2523 const char *unused;
2521 2524
2522 2525 intval = fnvpair_value_uint64(propval);
2523 2526
2524 2527 switch (zfs_prop_get_type(prop)) {
2525 2528 case PROP_TYPE_NUMBER:
2526 2529 break;
2527 2530 case PROP_TYPE_STRING:
2528 2531 err = SET_ERROR(EINVAL);
2529 2532 break;
2530 2533 case PROP_TYPE_INDEX:
2531 2534 if (zfs_prop_index_to_string(prop,
2532 2535 intval, &unused) != 0)
2533 2536 err = SET_ERROR(EINVAL);
2534 2537 break;
2535 2538 default:
2536 2539 cmn_err(CE_PANIC,
2537 2540 "unknown property type");
2538 2541 }
2539 2542 } else {
2540 2543 err = SET_ERROR(EINVAL);
2541 2544 }
2542 2545 }
2543 2546
2544 2547 /* Validate permissions */
2545 2548 if (err == 0)
2546 2549 err = zfs_check_settable(dsname, pair, CRED());
2547 2550
2548 2551 if (err == 0) {
2549 2552 err = zfs_prop_set_special(dsname, source, pair);
2550 2553 if (err == -1) {
2551 2554 /*
2552 2555 * For better performance we build up a list of
2553 2556 * properties to set in a single transaction.
2554 2557 */
2555 2558 err = nvlist_add_nvpair(genericnvl, pair);
2556 2559 } else if (err != 0 && nvl != retrynvl) {
2557 2560 /*
2558 2561 * This may be a spurious error caused by
2559 2562 * receiving quota and reservation out of order.
2560 2563 * Try again in a second pass.
2561 2564 */
2562 2565 err = nvlist_add_nvpair(retrynvl, pair);
2563 2566 }
2564 2567 }
2565 2568
2566 2569 if (err != 0) {
2567 2570 if (errlist != NULL)
2568 2571 fnvlist_add_int32(errlist, propname, err);
2569 2572 rv = err;
2570 2573 }
2571 2574 }
2572 2575
2573 2576 if (nvl != retrynvl && !nvlist_empty(retrynvl)) {
2574 2577 nvl = retrynvl;
2575 2578 goto retry;
2576 2579 }
2577 2580
2578 2581 if (!nvlist_empty(genericnvl) &&
2579 2582 dsl_props_set(dsname, source, genericnvl) != 0) {
2580 2583 /*
2581 2584 * If this fails, we still want to set as many properties as we
2582 2585 * can, so try setting them individually.
2583 2586 */
2584 2587 pair = NULL;
2585 2588 while ((pair = nvlist_next_nvpair(genericnvl, pair)) != NULL) {
2586 2589 const char *propname = nvpair_name(pair);
2587 2590 int err = 0;
2588 2591
2589 2592 propval = pair;
2590 2593 if (nvpair_type(pair) == DATA_TYPE_NVLIST) {
2591 2594 nvlist_t *attrs;
2592 2595 attrs = fnvpair_value_nvlist(pair);
2593 2596 propval = fnvlist_lookup_nvpair(attrs,
2594 2597 ZPROP_VALUE);
2595 2598 }
2596 2599
2597 2600 if (nvpair_type(propval) == DATA_TYPE_STRING) {
2598 2601 strval = fnvpair_value_string(propval);
2599 2602 err = dsl_prop_set_string(dsname, propname,
2600 2603 source, strval);
2601 2604 } else {
2602 2605 intval = fnvpair_value_uint64(propval);
2603 2606 err = dsl_prop_set_int(dsname, propname, source,
2604 2607 intval);
2605 2608 }
2606 2609
2607 2610 if (err != 0) {
2608 2611 if (errlist != NULL) {
2609 2612 fnvlist_add_int32(errlist, propname,
2610 2613 err);
2611 2614 }
2612 2615 rv = err;
2613 2616 }
2614 2617 }
2615 2618 }
2616 2619 nvlist_free(genericnvl);
2617 2620 nvlist_free(retrynvl);
2618 2621
2619 2622 return (rv);
2620 2623 }
2621 2624
2622 2625 /*
2623 2626 * Check that all the properties are valid user properties.
2624 2627 */
2625 2628 static int
2626 2629 zfs_check_userprops(const char *fsname, nvlist_t *nvl)
2627 2630 {
2628 2631 nvpair_t *pair = NULL;
2629 2632 int error = 0;
2630 2633
2631 2634 while ((pair = nvlist_next_nvpair(nvl, pair)) != NULL) {
2632 2635 const char *propname = nvpair_name(pair);
2633 2636
2634 2637 if (!zfs_prop_user(propname) ||
2635 2638 nvpair_type(pair) != DATA_TYPE_STRING)
2636 2639 return (SET_ERROR(EINVAL));
2637 2640
2638 2641 if (error = zfs_secpolicy_write_perms(fsname,
2639 2642 ZFS_DELEG_PERM_USERPROP, CRED()))
2640 2643 return (error);
2641 2644
2642 2645 if (strlen(propname) >= ZAP_MAXNAMELEN)
2643 2646 return (SET_ERROR(ENAMETOOLONG));
2644 2647
2645 2648 if (strlen(fnvpair_value_string(pair)) >= ZAP_MAXVALUELEN)
2646 2649 return (E2BIG);
2647 2650 }
2648 2651 return (0);
2649 2652 }
2650 2653
2651 2654 static void
2652 2655 props_skip(nvlist_t *props, nvlist_t *skipped, nvlist_t **newprops)
2653 2656 {
2654 2657 nvpair_t *pair;
2655 2658
2656 2659 VERIFY(nvlist_alloc(newprops, NV_UNIQUE_NAME, KM_SLEEP) == 0);
2657 2660
2658 2661 pair = NULL;
2659 2662 while ((pair = nvlist_next_nvpair(props, pair)) != NULL) {
2660 2663 if (nvlist_exists(skipped, nvpair_name(pair)))
2661 2664 continue;
2662 2665
2663 2666 VERIFY(nvlist_add_nvpair(*newprops, pair) == 0);
2664 2667 }
2665 2668 }
2666 2669
2667 2670 static int
2668 2671 clear_received_props(const char *dsname, nvlist_t *props,
2669 2672 nvlist_t *skipped)
2670 2673 {
2671 2674 int err = 0;
2672 2675 nvlist_t *cleared_props = NULL;
2673 2676 props_skip(props, skipped, &cleared_props);
2674 2677 if (!nvlist_empty(cleared_props)) {
2675 2678 /*
2676 2679 * Acts on local properties until the dataset has received
2677 2680 * properties at least once on or after SPA_VERSION_RECVD_PROPS.
2678 2681 */
2679 2682 zprop_source_t flags = (ZPROP_SRC_NONE |
2680 2683 (dsl_prop_get_hasrecvd(dsname) ? ZPROP_SRC_RECEIVED : 0));
2681 2684 err = zfs_set_prop_nvlist(dsname, flags, cleared_props, NULL);
2682 2685 }
2683 2686 nvlist_free(cleared_props);
2684 2687 return (err);
2685 2688 }
2686 2689
2687 2690 /*
2688 2691 * inputs:
2689 2692 * zc_name name of filesystem
2690 2693 * zc_value name of property to set
2691 2694 * zc_nvlist_src{_size} nvlist of properties to apply
2692 2695 * zc_cookie received properties flag
2693 2696 *
2694 2697 * outputs:
2695 2698 * zc_nvlist_dst{_size} error for each unapplied received property
2696 2699 */
2697 2700 static int
2698 2701 zfs_ioc_set_prop(zfs_cmd_t *zc)
2699 2702 {
2700 2703 nvlist_t *nvl;
2701 2704 boolean_t received = zc->zc_cookie;
2702 2705 zprop_source_t source = (received ? ZPROP_SRC_RECEIVED :
2703 2706 ZPROP_SRC_LOCAL);
2704 2707 nvlist_t *errors;
2705 2708 int error;
2706 2709
2707 2710 if ((error = get_nvlist(zc->zc_nvlist_src, zc->zc_nvlist_src_size,
2708 2711 zc->zc_iflags, &nvl)) != 0)
2709 2712 return (error);
2710 2713
2711 2714 if (received) {
2712 2715 nvlist_t *origprops;
2713 2716
2714 2717 if (dsl_prop_get_received(zc->zc_name, &origprops) == 0) {
2715 2718 (void) clear_received_props(zc->zc_name,
2716 2719 origprops, nvl);
2717 2720 nvlist_free(origprops);
2718 2721 }
2719 2722
2720 2723 error = dsl_prop_set_hasrecvd(zc->zc_name);
2721 2724 }
2722 2725
2723 2726 errors = fnvlist_alloc();
2724 2727 if (error == 0)
2725 2728 error = zfs_set_prop_nvlist(zc->zc_name, source, nvl, errors);
2726 2729
2727 2730 if (zc->zc_nvlist_dst != NULL && errors != NULL) {
2728 2731 (void) put_nvlist(zc, errors);
2729 2732 }
2730 2733
2731 2734 nvlist_free(errors);
2732 2735 nvlist_free(nvl);
2733 2736 return (error);
2734 2737 }
2735 2738
2736 2739 /*
2737 2740 * inputs:
2738 2741 * zc_name name of filesystem
2739 2742 * zc_value name of property to inherit
2740 2743 * zc_cookie revert to received value if TRUE
2741 2744 *
2742 2745 * outputs: none
2743 2746 */
2744 2747 static int
2745 2748 zfs_ioc_inherit_prop(zfs_cmd_t *zc)
2746 2749 {
2747 2750 const char *propname = zc->zc_value;
2748 2751 zfs_prop_t prop = zfs_name_to_prop(propname);
2749 2752 boolean_t received = zc->zc_cookie;
2750 2753 zprop_source_t source = (received
2751 2754 ? ZPROP_SRC_NONE /* revert to received value, if any */
2752 2755 : ZPROP_SRC_INHERITED); /* explicitly inherit */
2753 2756
2754 2757 if (received) {
2755 2758 nvlist_t *dummy;
2756 2759 nvpair_t *pair;
2757 2760 zprop_type_t type;
2758 2761 int err;
2759 2762
2760 2763 /*
2761 2764 * zfs_prop_set_special() expects properties in the form of an
2762 2765 * nvpair with type info.
2763 2766 */
2764 2767 if (prop == ZPROP_INVAL) {
2765 2768 if (!zfs_prop_user(propname))
2766 2769 return (SET_ERROR(EINVAL));
2767 2770
2768 2771 type = PROP_TYPE_STRING;
2769 2772 } else if (prop == ZFS_PROP_VOLSIZE ||
2770 2773 prop == ZFS_PROP_VERSION) {
2771 2774 return (SET_ERROR(EINVAL));
2772 2775 } else {
2773 2776 type = zfs_prop_get_type(prop);
2774 2777 }
2775 2778
2776 2779 VERIFY(nvlist_alloc(&dummy, NV_UNIQUE_NAME, KM_SLEEP) == 0);
2777 2780
2778 2781 switch (type) {
2779 2782 case PROP_TYPE_STRING:
2780 2783 VERIFY(0 == nvlist_add_string(dummy, propname, ""));
2781 2784 break;
2782 2785 case PROP_TYPE_NUMBER:
2783 2786 case PROP_TYPE_INDEX:
2784 2787 VERIFY(0 == nvlist_add_uint64(dummy, propname, 0));
2785 2788 break;
2786 2789 default:
2787 2790 nvlist_free(dummy);
2788 2791 return (SET_ERROR(EINVAL));
2789 2792 }
2790 2793
2791 2794 pair = nvlist_next_nvpair(dummy, NULL);
2792 2795 err = zfs_prop_set_special(zc->zc_name, source, pair);
2793 2796 nvlist_free(dummy);
2794 2797 if (err != -1)
2795 2798 return (err); /* special property already handled */
2796 2799 } else {
2797 2800 /*
2798 2801 * Only check this in the non-received case. We want to allow
2799 2802 * 'inherit -S' to revert non-inheritable properties like quota
2800 2803 * and reservation to the received or default values even though
2801 2804 * they are not considered inheritable.
2802 2805 */
2803 2806 if (prop != ZPROP_INVAL && !zfs_prop_inheritable(prop))
2804 2807 return (SET_ERROR(EINVAL));
2805 2808 }
2806 2809
2807 2810 /* property name has been validated by zfs_secpolicy_inherit_prop() */
2808 2811 return (dsl_prop_inherit(zc->zc_name, zc->zc_value, source));
2809 2812 }
2810 2813
2811 2814 static int
2812 2815 zfs_ioc_pool_set_props(zfs_cmd_t *zc)
2813 2816 {
2814 2817 nvlist_t *props;
2815 2818 spa_t *spa;
2816 2819 int error;
2817 2820 nvpair_t *pair;
2818 2821
2819 2822 if (error = get_nvlist(zc->zc_nvlist_src, zc->zc_nvlist_src_size,
2820 2823 zc->zc_iflags, &props))
2821 2824 return (error);
2822 2825
2823 2826 /*
2824 2827 * If the only property is the configfile, then just do a spa_lookup()
2825 2828 * to handle the faulted case.
2826 2829 */
2827 2830 pair = nvlist_next_nvpair(props, NULL);
2828 2831 if (pair != NULL && strcmp(nvpair_name(pair),
2829 2832 zpool_prop_to_name(ZPOOL_PROP_CACHEFILE)) == 0 &&
2830 2833 nvlist_next_nvpair(props, pair) == NULL) {
2831 2834 mutex_enter(&spa_namespace_lock);
2832 2835 if ((spa = spa_lookup(zc->zc_name)) != NULL) {
2833 2836 spa_configfile_set(spa, props, B_FALSE);
2834 2837 spa_config_sync(spa, B_FALSE, B_TRUE);
2835 2838 }
2836 2839 mutex_exit(&spa_namespace_lock);
2837 2840 if (spa != NULL) {
2838 2841 nvlist_free(props);
2839 2842 return (0);
2840 2843 }
2841 2844 }
2842 2845
2843 2846 if ((error = spa_open(zc->zc_name, &spa, FTAG)) != 0) {
2844 2847 nvlist_free(props);
2845 2848 return (error);
2846 2849 }
2847 2850
2848 2851 error = spa_prop_set(spa, props);
2849 2852
2850 2853 nvlist_free(props);
2851 2854 spa_close(spa, FTAG);
2852 2855
2853 2856 return (error);
2854 2857 }
2855 2858
2856 2859 static int
2857 2860 zfs_ioc_pool_get_props(zfs_cmd_t *zc)
2858 2861 {
2859 2862 spa_t *spa;
2860 2863 int error;
2861 2864 nvlist_t *nvp = NULL;
2862 2865
2863 2866 if ((error = spa_open(zc->zc_name, &spa, FTAG)) != 0) {
2864 2867 /*
2865 2868 * If the pool is faulted, there may be properties we can still
2866 2869 * get (such as altroot and cachefile), so attempt to get them
2867 2870 * anyway.
2868 2871 */
2869 2872 mutex_enter(&spa_namespace_lock);
2870 2873 if ((spa = spa_lookup(zc->zc_name)) != NULL)
2871 2874 error = spa_prop_get(spa, &nvp);
2872 2875 mutex_exit(&spa_namespace_lock);
2873 2876 } else {
2874 2877 error = spa_prop_get(spa, &nvp);
2875 2878 spa_close(spa, FTAG);
2876 2879 }
2877 2880
2878 2881 if (error == 0 && zc->zc_nvlist_dst != NULL)
2879 2882 error = put_nvlist(zc, nvp);
2880 2883 else
2881 2884 error = SET_ERROR(EFAULT);
2882 2885
2883 2886 nvlist_free(nvp);
2884 2887 return (error);
2885 2888 }
2886 2889
2887 2890 /*
2888 2891 * inputs:
2889 2892 * zc_name name of filesystem
2890 2893 * zc_nvlist_src{_size} nvlist of delegated permissions
2891 2894 * zc_perm_action allow/unallow flag
2892 2895 *
2893 2896 * outputs: none
2894 2897 */
2895 2898 static int
2896 2899 zfs_ioc_set_fsacl(zfs_cmd_t *zc)
2897 2900 {
2898 2901 int error;
2899 2902 nvlist_t *fsaclnv = NULL;
2900 2903
2901 2904 if ((error = get_nvlist(zc->zc_nvlist_src, zc->zc_nvlist_src_size,
2902 2905 zc->zc_iflags, &fsaclnv)) != 0)
2903 2906 return (error);
2904 2907
2905 2908 /*
2906 2909 * Verify nvlist is constructed correctly
2907 2910 */
2908 2911 if ((error = zfs_deleg_verify_nvlist(fsaclnv)) != 0) {
2909 2912 nvlist_free(fsaclnv);
2910 2913 return (SET_ERROR(EINVAL));
2911 2914 }
2912 2915
2913 2916 /*
2914 2917 * If we don't have PRIV_SYS_MOUNT, then validate
2915 2918 * that user is allowed to hand out each permission in
2916 2919 * the nvlist(s)
2917 2920 */
2918 2921
2919 2922 error = secpolicy_zfs(CRED());
2920 2923 if (error != 0) {
2921 2924 if (zc->zc_perm_action == B_FALSE) {
2922 2925 error = dsl_deleg_can_allow(zc->zc_name,
2923 2926 fsaclnv, CRED());
2924 2927 } else {
2925 2928 error = dsl_deleg_can_unallow(zc->zc_name,
2926 2929 fsaclnv, CRED());
2927 2930 }
2928 2931 }
2929 2932
2930 2933 if (error == 0)
2931 2934 error = dsl_deleg_set(zc->zc_name, fsaclnv, zc->zc_perm_action);
2932 2935
2933 2936 nvlist_free(fsaclnv);
2934 2937 return (error);
2935 2938 }
2936 2939
2937 2940 /*
2938 2941 * inputs:
2939 2942 * zc_name name of filesystem
2940 2943 *
2941 2944 * outputs:
2942 2945 * zc_nvlist_src{_size} nvlist of delegated permissions
2943 2946 */
2944 2947 static int
2945 2948 zfs_ioc_get_fsacl(zfs_cmd_t *zc)
2946 2949 {
2947 2950 nvlist_t *nvp;
2948 2951 int error;
2949 2952
2950 2953 if ((error = dsl_deleg_get(zc->zc_name, &nvp)) == 0) {
2951 2954 error = put_nvlist(zc, nvp);
2952 2955 nvlist_free(nvp);
2953 2956 }
2954 2957
2955 2958 return (error);
2956 2959 }
2957 2960
2958 2961 /*
2959 2962 * Search the vfs list for a specified resource. Returns a pointer to it
2960 2963 * or NULL if no suitable entry is found. The caller of this routine
2961 2964 * is responsible for releasing the returned vfs pointer.
2962 2965 */
2963 2966 static vfs_t *
2964 2967 zfs_get_vfs(const char *resource)
2965 2968 {
2966 2969 struct vfs *vfsp;
2967 2970 struct vfs *vfs_found = NULL;
2968 2971
2969 2972 vfs_list_read_lock();
2970 2973 vfsp = rootvfs;
2971 2974 do {
2972 2975 if (strcmp(refstr_value(vfsp->vfs_resource), resource) == 0) {
2973 2976 VFS_HOLD(vfsp);
2974 2977 vfs_found = vfsp;
2975 2978 break;
2976 2979 }
2977 2980 vfsp = vfsp->vfs_next;
2978 2981 } while (vfsp != rootvfs);
2979 2982 vfs_list_unlock();
2980 2983 return (vfs_found);
2981 2984 }
2982 2985
2983 2986 /* ARGSUSED */
2984 2987 static void
2985 2988 zfs_create_cb(objset_t *os, void *arg, cred_t *cr, dmu_tx_t *tx)
2986 2989 {
2987 2990 zfs_creat_t *zct = arg;
2988 2991
2989 2992 zfs_create_fs(os, cr, zct->zct_zplprops, tx);
2990 2993 }
2991 2994
2992 2995 #define ZFS_PROP_UNDEFINED ((uint64_t)-1)
2993 2996
2994 2997 /*
2995 2998 * inputs:
2996 2999 * os parent objset pointer (NULL if root fs)
2997 3000 * fuids_ok fuids allowed in this version of the spa?
2998 3001 * sa_ok SAs allowed in this version of the spa?
2999 3002 * createprops list of properties requested by creator
3000 3003 *
3001 3004 * outputs:
3002 3005 * zplprops values for the zplprops we attach to the master node object
3003 3006 * is_ci true if requested file system will be purely case-insensitive
3004 3007 *
3005 3008 * Determine the settings for utf8only, normalization and
3006 3009 * casesensitivity. Specific values may have been requested by the
3007 3010 * creator and/or we can inherit values from the parent dataset. If
3008 3011 * the file system is of too early a vintage, a creator can not
3009 3012 * request settings for these properties, even if the requested
3010 3013 * setting is the default value. We don't actually want to create dsl
3011 3014 * properties for these, so remove them from the source nvlist after
3012 3015 * processing.
3013 3016 */
3014 3017 static int
3015 3018 zfs_fill_zplprops_impl(objset_t *os, uint64_t zplver,
3016 3019 boolean_t fuids_ok, boolean_t sa_ok, nvlist_t *createprops,
3017 3020 nvlist_t *zplprops, boolean_t *is_ci)
3018 3021 {
3019 3022 uint64_t sense = ZFS_PROP_UNDEFINED;
3020 3023 uint64_t norm = ZFS_PROP_UNDEFINED;
3021 3024 uint64_t u8 = ZFS_PROP_UNDEFINED;
3022 3025
3023 3026 ASSERT(zplprops != NULL);
3024 3027
3025 3028 /*
3026 3029 * Pull out creator prop choices, if any.
3027 3030 */
3028 3031 if (createprops) {
3029 3032 (void) nvlist_lookup_uint64(createprops,
3030 3033 zfs_prop_to_name(ZFS_PROP_VERSION), &zplver);
3031 3034 (void) nvlist_lookup_uint64(createprops,
3032 3035 zfs_prop_to_name(ZFS_PROP_NORMALIZE), &norm);
3033 3036 (void) nvlist_remove_all(createprops,
3034 3037 zfs_prop_to_name(ZFS_PROP_NORMALIZE));
3035 3038 (void) nvlist_lookup_uint64(createprops,
3036 3039 zfs_prop_to_name(ZFS_PROP_UTF8ONLY), &u8);
3037 3040 (void) nvlist_remove_all(createprops,
3038 3041 zfs_prop_to_name(ZFS_PROP_UTF8ONLY));
3039 3042 (void) nvlist_lookup_uint64(createprops,
3040 3043 zfs_prop_to_name(ZFS_PROP_CASE), &sense);
3041 3044 (void) nvlist_remove_all(createprops,
3042 3045 zfs_prop_to_name(ZFS_PROP_CASE));
3043 3046 }
3044 3047
3045 3048 /*
3046 3049 * If the zpl version requested is whacky or the file system
3047 3050 * or pool is version is too "young" to support normalization
3048 3051 * and the creator tried to set a value for one of the props,
3049 3052 * error out.
3050 3053 */
3051 3054 if ((zplver < ZPL_VERSION_INITIAL || zplver > ZPL_VERSION) ||
3052 3055 (zplver >= ZPL_VERSION_FUID && !fuids_ok) ||
3053 3056 (zplver >= ZPL_VERSION_SA && !sa_ok) ||
3054 3057 (zplver < ZPL_VERSION_NORMALIZATION &&
3055 3058 (norm != ZFS_PROP_UNDEFINED || u8 != ZFS_PROP_UNDEFINED ||
3056 3059 sense != ZFS_PROP_UNDEFINED)))
3057 3060 return (SET_ERROR(ENOTSUP));
3058 3061
3059 3062 /*
3060 3063 * Put the version in the zplprops
3061 3064 */
3062 3065 VERIFY(nvlist_add_uint64(zplprops,
3063 3066 zfs_prop_to_name(ZFS_PROP_VERSION), zplver) == 0);
3064 3067
3065 3068 if (norm == ZFS_PROP_UNDEFINED)
3066 3069 VERIFY(zfs_get_zplprop(os, ZFS_PROP_NORMALIZE, &norm) == 0);
3067 3070 VERIFY(nvlist_add_uint64(zplprops,
3068 3071 zfs_prop_to_name(ZFS_PROP_NORMALIZE), norm) == 0);
3069 3072
3070 3073 /*
3071 3074 * If we're normalizing, names must always be valid UTF-8 strings.
3072 3075 */
3073 3076 if (norm)
3074 3077 u8 = 1;
3075 3078 if (u8 == ZFS_PROP_UNDEFINED)
3076 3079 VERIFY(zfs_get_zplprop(os, ZFS_PROP_UTF8ONLY, &u8) == 0);
3077 3080 VERIFY(nvlist_add_uint64(zplprops,
3078 3081 zfs_prop_to_name(ZFS_PROP_UTF8ONLY), u8) == 0);
3079 3082
3080 3083 if (sense == ZFS_PROP_UNDEFINED)
3081 3084 VERIFY(zfs_get_zplprop(os, ZFS_PROP_CASE, &sense) == 0);
3082 3085 VERIFY(nvlist_add_uint64(zplprops,
3083 3086 zfs_prop_to_name(ZFS_PROP_CASE), sense) == 0);
3084 3087
3085 3088 if (is_ci)
3086 3089 *is_ci = (sense == ZFS_CASE_INSENSITIVE);
3087 3090
3088 3091 return (0);
3089 3092 }
3090 3093
3091 3094 static int
3092 3095 zfs_fill_zplprops(const char *dataset, nvlist_t *createprops,
3093 3096 nvlist_t *zplprops, boolean_t *is_ci)
3094 3097 {
3095 3098 boolean_t fuids_ok, sa_ok;
3096 3099 uint64_t zplver = ZPL_VERSION;
3097 3100 objset_t *os = NULL;
3098 3101 char parentname[MAXNAMELEN];
3099 3102 char *cp;
3100 3103 spa_t *spa;
3101 3104 uint64_t spa_vers;
3102 3105 int error;
3103 3106
3104 3107 (void) strlcpy(parentname, dataset, sizeof (parentname));
3105 3108 cp = strrchr(parentname, '/');
3106 3109 ASSERT(cp != NULL);
3107 3110 cp[0] = '\0';
3108 3111
3109 3112 if ((error = spa_open(dataset, &spa, FTAG)) != 0)
3110 3113 return (error);
3111 3114
3112 3115 spa_vers = spa_version(spa);
3113 3116 spa_close(spa, FTAG);
3114 3117
3115 3118 zplver = zfs_zpl_version_map(spa_vers);
3116 3119 fuids_ok = (zplver >= ZPL_VERSION_FUID);
3117 3120 sa_ok = (zplver >= ZPL_VERSION_SA);
3118 3121
3119 3122 /*
3120 3123 * Open parent object set so we can inherit zplprop values.
3121 3124 */
3122 3125 if ((error = dmu_objset_hold(parentname, FTAG, &os)) != 0)
3123 3126 return (error);
3124 3127
3125 3128 error = zfs_fill_zplprops_impl(os, zplver, fuids_ok, sa_ok, createprops,
3126 3129 zplprops, is_ci);
3127 3130 dmu_objset_rele(os, FTAG);
3128 3131 return (error);
3129 3132 }
3130 3133
3131 3134 static int
3132 3135 zfs_fill_zplprops_root(uint64_t spa_vers, nvlist_t *createprops,
3133 3136 nvlist_t *zplprops, boolean_t *is_ci)
3134 3137 {
3135 3138 boolean_t fuids_ok;
3136 3139 boolean_t sa_ok;
3137 3140 uint64_t zplver = ZPL_VERSION;
3138 3141 int error;
3139 3142
3140 3143 zplver = zfs_zpl_version_map(spa_vers);
3141 3144 fuids_ok = (zplver >= ZPL_VERSION_FUID);
3142 3145 sa_ok = (zplver >= ZPL_VERSION_SA);
3143 3146
3144 3147 error = zfs_fill_zplprops_impl(NULL, zplver, fuids_ok, sa_ok,
3145 3148 createprops, zplprops, is_ci);
3146 3149 return (error);
3147 3150 }
3148 3151
3149 3152 /*
3150 3153 * innvl: {
3151 3154 * "type" -> dmu_objset_type_t (int32)
3152 3155 * (optional) "props" -> { prop -> value }
3153 3156 * }
3154 3157 *
3155 3158 * outnvl: propname -> error code (int32)
3156 3159 */
3157 3160 static int
3158 3161 zfs_ioc_create(const char *fsname, nvlist_t *innvl, nvlist_t *outnvl)
3159 3162 {
3160 3163 int error = 0;
3161 3164 zfs_creat_t zct = { 0 };
3162 3165 nvlist_t *nvprops = NULL;
3163 3166 void (*cbfunc)(objset_t *os, void *arg, cred_t *cr, dmu_tx_t *tx);
3164 3167 int32_t type32;
3165 3168 dmu_objset_type_t type;
3166 3169 boolean_t is_insensitive = B_FALSE;
3167 3170
3168 3171 if (nvlist_lookup_int32(innvl, "type", &type32) != 0)
3169 3172 return (SET_ERROR(EINVAL));
3170 3173 type = type32;
3171 3174 (void) nvlist_lookup_nvlist(innvl, "props", &nvprops);
3172 3175
3173 3176 switch (type) {
3174 3177 case DMU_OST_ZFS:
3175 3178 cbfunc = zfs_create_cb;
3176 3179 break;
3177 3180
3178 3181 case DMU_OST_ZVOL:
3179 3182 cbfunc = zvol_create_cb;
3180 3183 break;
3181 3184
3182 3185 default:
3183 3186 cbfunc = NULL;
3184 3187 break;
3185 3188 }
3186 3189 if (strchr(fsname, '@') ||
3187 3190 strchr(fsname, '%'))
3188 3191 return (SET_ERROR(EINVAL));
3189 3192
3190 3193 zct.zct_props = nvprops;
3191 3194
3192 3195 if (cbfunc == NULL)
3193 3196 return (SET_ERROR(EINVAL));
3194 3197
3195 3198 if (type == DMU_OST_ZVOL) {
3196 3199 uint64_t volsize, volblocksize;
3197 3200
3198 3201 if (nvprops == NULL)
3199 3202 return (SET_ERROR(EINVAL));
3200 3203 if (nvlist_lookup_uint64(nvprops,
3201 3204 zfs_prop_to_name(ZFS_PROP_VOLSIZE), &volsize) != 0)
3202 3205 return (SET_ERROR(EINVAL));
3203 3206
3204 3207 if ((error = nvlist_lookup_uint64(nvprops,
3205 3208 zfs_prop_to_name(ZFS_PROP_VOLBLOCKSIZE),
3206 3209 &volblocksize)) != 0 && error != ENOENT)
3207 3210 return (SET_ERROR(EINVAL));
3208 3211
3209 3212 if (error != 0)
3210 3213 volblocksize = zfs_prop_default_numeric(
3211 3214 ZFS_PROP_VOLBLOCKSIZE);
3212 3215
3213 3216 if ((error = zvol_check_volblocksize(
3214 3217 volblocksize)) != 0 ||
3215 3218 (error = zvol_check_volsize(volsize,
3216 3219 volblocksize)) != 0)
3217 3220 return (error);
3218 3221 } else if (type == DMU_OST_ZFS) {
3219 3222 int error;
3220 3223
3221 3224 /*
3222 3225 * We have to have normalization and
3223 3226 * case-folding flags correct when we do the
3224 3227 * file system creation, so go figure them out
3225 3228 * now.
3226 3229 */
3227 3230 VERIFY(nvlist_alloc(&zct.zct_zplprops,
3228 3231 NV_UNIQUE_NAME, KM_SLEEP) == 0);
3229 3232 error = zfs_fill_zplprops(fsname, nvprops,
3230 3233 zct.zct_zplprops, &is_insensitive);
3231 3234 if (error != 0) {
3232 3235 nvlist_free(zct.zct_zplprops);
3233 3236 return (error);
3234 3237 }
3235 3238 }
3236 3239
3237 3240 error = dmu_objset_create(fsname, type,
3238 3241 is_insensitive ? DS_FLAG_CI_DATASET : 0, cbfunc, &zct);
3239 3242 nvlist_free(zct.zct_zplprops);
3240 3243
3241 3244 /*
3242 3245 * It would be nice to do this atomically.
3243 3246 */
3244 3247 if (error == 0) {
3245 3248 error = zfs_set_prop_nvlist(fsname, ZPROP_SRC_LOCAL,
3246 3249 nvprops, outnvl);
3247 3250 if (error != 0)
3248 3251 (void) dsl_destroy_head(fsname);
3249 3252 }
3250 3253 return (error);
3251 3254 }
3252 3255
3253 3256 /*
3254 3257 * innvl: {
3255 3258 * "origin" -> name of origin snapshot
3256 3259 * (optional) "props" -> { prop -> value }
3257 3260 * }
3258 3261 *
3259 3262 * outnvl: propname -> error code (int32)
3260 3263 */
3261 3264 static int
3262 3265 zfs_ioc_clone(const char *fsname, nvlist_t *innvl, nvlist_t *outnvl)
3263 3266 {
3264 3267 int error = 0;
3265 3268 nvlist_t *nvprops = NULL;
3266 3269 char *origin_name;
3267 3270
3268 3271 if (nvlist_lookup_string(innvl, "origin", &origin_name) != 0)
3269 3272 return (SET_ERROR(EINVAL));
3270 3273 (void) nvlist_lookup_nvlist(innvl, "props", &nvprops);
3271 3274
3272 3275 if (strchr(fsname, '@') ||
3273 3276 strchr(fsname, '%'))
3274 3277 return (SET_ERROR(EINVAL));
3275 3278
3276 3279 if (dataset_namecheck(origin_name, NULL, NULL) != 0)
3277 3280 return (SET_ERROR(EINVAL));
3278 3281 error = dmu_objset_clone(fsname, origin_name);
3279 3282 if (error != 0)
3280 3283 return (error);
3281 3284
3282 3285 /*
3283 3286 * It would be nice to do this atomically.
3284 3287 */
3285 3288 if (error == 0) {
3286 3289 error = zfs_set_prop_nvlist(fsname, ZPROP_SRC_LOCAL,
3287 3290 nvprops, outnvl);
3288 3291 if (error != 0)
3289 3292 (void) dsl_destroy_head(fsname);
3290 3293 }
3291 3294 return (error);
3292 3295 }
3293 3296
3294 3297 /*
3295 3298 * innvl: {
3296 3299 * "snaps" -> { snapshot1, snapshot2 }
3297 3300 * (optional) "props" -> { prop -> value (string) }
3298 3301 * }
3299 3302 *
3300 3303 * outnvl: snapshot -> error code (int32)
3301 3304 */
3302 3305 static int
3303 3306 zfs_ioc_snapshot(const char *poolname, nvlist_t *innvl, nvlist_t *outnvl)
3304 3307 {
3305 3308 nvlist_t *snaps;
3306 3309 nvlist_t *props = NULL;
3307 3310 int error, poollen;
3308 3311 nvpair_t *pair;
3309 3312
3310 3313 (void) nvlist_lookup_nvlist(innvl, "props", &props);
3311 3314 if ((error = zfs_check_userprops(poolname, props)) != 0)
3312 3315 return (error);
3313 3316
3314 3317 if (!nvlist_empty(props) &&
3315 3318 zfs_earlier_version(poolname, SPA_VERSION_SNAP_PROPS))
3316 3319 return (SET_ERROR(ENOTSUP));
3317 3320
3318 3321 if (nvlist_lookup_nvlist(innvl, "snaps", &snaps) != 0)
3319 3322 return (SET_ERROR(EINVAL));
3320 3323 poollen = strlen(poolname);
3321 3324 for (pair = nvlist_next_nvpair(snaps, NULL); pair != NULL;
3322 3325 pair = nvlist_next_nvpair(snaps, pair)) {
3323 3326 const char *name = nvpair_name(pair);
3324 3327 const char *cp = strchr(name, '@');
3325 3328
3326 3329 /*
3327 3330 * The snap name must contain an @, and the part after it must
3328 3331 * contain only valid characters.
3329 3332 */
3330 3333 if (cp == NULL ||
3331 3334 zfs_component_namecheck(cp + 1, NULL, NULL) != 0)
3332 3335 return (SET_ERROR(EINVAL));
3333 3336
3334 3337 /*
3335 3338 * The snap must be in the specified pool.
3336 3339 */
3337 3340 if (strncmp(name, poolname, poollen) != 0 ||
3338 3341 (name[poollen] != '/' && name[poollen] != '@'))
3339 3342 return (SET_ERROR(EXDEV));
3340 3343
3341 3344 /* This must be the only snap of this fs. */
3342 3345 for (nvpair_t *pair2 = nvlist_next_nvpair(snaps, pair);
3343 3346 pair2 != NULL; pair2 = nvlist_next_nvpair(snaps, pair2)) {
3344 3347 if (strncmp(name, nvpair_name(pair2), cp - name + 1)
3345 3348 == 0) {
3346 3349 return (SET_ERROR(EXDEV));
3347 3350 }
3348 3351 }
3349 3352 }
3350 3353
3351 3354 error = dsl_dataset_snapshot(snaps, props, outnvl);
3352 3355 return (error);
3353 3356 }
3354 3357
3355 3358 /*
3356 3359 * innvl: "message" -> string
3357 3360 */
3358 3361 /* ARGSUSED */
3359 3362 static int
3360 3363 zfs_ioc_log_history(const char *unused, nvlist_t *innvl, nvlist_t *outnvl)
3361 3364 {
3362 3365 char *message;
3363 3366 spa_t *spa;
3364 3367 int error;
3365 3368 char *poolname;
3366 3369
3367 3370 /*
3368 3371 * The poolname in the ioctl is not set, we get it from the TSD,
3369 3372 * which was set at the end of the last successful ioctl that allows
3370 3373 * logging. The secpolicy func already checked that it is set.
3371 3374 * Only one log ioctl is allowed after each successful ioctl, so
3372 3375 * we clear the TSD here.
3373 3376 */
3374 3377 poolname = tsd_get(zfs_allow_log_key);
3375 3378 (void) tsd_set(zfs_allow_log_key, NULL);
3376 3379 error = spa_open(poolname, &spa, FTAG);
3377 3380 strfree(poolname);
3378 3381 if (error != 0)
3379 3382 return (error);
3380 3383
3381 3384 if (nvlist_lookup_string(innvl, "message", &message) != 0) {
3382 3385 spa_close(spa, FTAG);
3383 3386 return (SET_ERROR(EINVAL));
3384 3387 }
3385 3388
3386 3389 if (spa_version(spa) < SPA_VERSION_ZPOOL_HISTORY) {
3387 3390 spa_close(spa, FTAG);
3388 3391 return (SET_ERROR(ENOTSUP));
3389 3392 }
3390 3393
3391 3394 error = spa_history_log(spa, message);
3392 3395 spa_close(spa, FTAG);
3393 3396 return (error);
3394 3397 }
3395 3398
3396 3399 /*
3397 3400 * The dp_config_rwlock must not be held when calling this, because the
3398 3401 * unmount may need to write out data.
3399 3402 *
3400 3403 * This function is best-effort. Callers must deal gracefully if it
3401 3404 * remains mounted (or is remounted after this call).
3402 3405 *
3403 3406 * Returns 0 if the argument is not a snapshot, or it is not currently a
3404 3407 * filesystem, or we were able to unmount it. Returns error code otherwise.
3405 3408 */
3406 3409 int
3407 3410 zfs_unmount_snap(const char *snapname)
3408 3411 {
3409 3412 vfs_t *vfsp;
3410 3413 zfsvfs_t *zfsvfs;
3411 3414 int err;
3412 3415
3413 3416 if (strchr(snapname, '@') == NULL)
3414 3417 return (0);
3415 3418
3416 3419 vfsp = zfs_get_vfs(snapname);
3417 3420 if (vfsp == NULL)
3418 3421 return (0);
3419 3422
3420 3423 zfsvfs = vfsp->vfs_data;
3421 3424 ASSERT(!dsl_pool_config_held(dmu_objset_pool(zfsvfs->z_os)));
3422 3425
3423 3426 err = vn_vfswlock(vfsp->vfs_vnodecovered);
3424 3427 VFS_RELE(vfsp);
3425 3428 if (err != 0)
3426 3429 return (SET_ERROR(err));
3427 3430
3428 3431 /*
3429 3432 * Always force the unmount for snapshots.
3430 3433 */
3431 3434 (void) dounmount(vfsp, MS_FORCE, kcred);
3432 3435 return (0);
3433 3436 }
3434 3437
/*
 * Callback-shaped wrapper around zfs_unmount_snap(); 'arg' is ignored.
 */
/* ARGSUSED */
static int
zfs_unmount_snap_cb(const char *snapname, void *arg)
{
	int err = zfs_unmount_snap(snapname);

	return (err);
}
3441 3444
3442 3445 /*
3443 3446 * When a clone is destroyed, its origin may also need to be destroyed,
3444 3447 * in which case it must be unmounted. This routine will do that unmount
3445 3448 * if necessary.
3446 3449 */
3447 3450 void
3448 3451 zfs_destroy_unmount_origin(const char *fsname)
3449 3452 {
3450 3453 int error;
3451 3454 objset_t *os;
3452 3455 dsl_dataset_t *ds;
3453 3456
3454 3457 error = dmu_objset_hold(fsname, FTAG, &os);
3455 3458 if (error != 0)
3456 3459 return;
3457 3460 ds = dmu_objset_ds(os);
3458 3461 if (dsl_dir_is_clone(ds->ds_dir) && DS_IS_DEFER_DESTROY(ds->ds_prev)) {
3459 3462 char originname[MAXNAMELEN];
3460 3463 dsl_dataset_name(ds->ds_prev, originname);
3461 3464 dmu_objset_rele(os, FTAG);
3462 3465 (void) zfs_unmount_snap(originname);
3463 3466 } else {
3464 3467 dmu_objset_rele(os, FTAG);
3465 3468 }
3466 3469 }
3467 3470
3468 3471 /*
3469 3472 * innvl: {
3470 3473 * "snaps" -> { snapshot1, snapshot2 }
3471 3474 * (optional boolean) "defer"
3472 3475 * }
3473 3476 *
3474 3477 * outnvl: snapshot -> error code (int32)
3475 3478 *
3476 3479 */
3477 3480 /* ARGSUSED */
3478 3481 static int
3479 3482 zfs_ioc_destroy_snaps(const char *poolname, nvlist_t *innvl, nvlist_t *outnvl)
3480 3483 {
3481 3484 nvlist_t *snaps;
3482 3485 nvpair_t *pair;
3483 3486 boolean_t defer;
3484 3487
3485 3488 if (nvlist_lookup_nvlist(innvl, "snaps", &snaps) != 0)
3486 3489 return (SET_ERROR(EINVAL));
3487 3490 defer = nvlist_exists(innvl, "defer");
3488 3491
3489 3492 for (pair = nvlist_next_nvpair(snaps, NULL); pair != NULL;
3490 3493 pair = nvlist_next_nvpair(snaps, pair)) {
3491 3494 (void) zfs_unmount_snap(nvpair_name(pair));
3492 3495 }
3493 3496
3494 3497 return (dsl_destroy_snapshots_nvl(snaps, defer, outnvl));
3495 3498 }
3496 3499
3497 3500 /*
3498 3501 * Create bookmarks. Bookmark names are of the form <fs>#<bmark>.
3499 3502 * All bookmarks must be in the same pool.
3500 3503 *
3501 3504 * innvl: {
3502 3505 * bookmark1 -> snapshot1, bookmark2 -> snapshot2
3503 3506 * }
3504 3507 *
3505 3508 * outnvl: bookmark -> error code (int32)
3506 3509 *
3507 3510 */
3508 3511 /* ARGSUSED */
3509 3512 static int
3510 3513 zfs_ioc_bookmark(const char *poolname, nvlist_t *innvl, nvlist_t *outnvl)
3511 3514 {
3512 3515 for (nvpair_t *pair = nvlist_next_nvpair(innvl, NULL);
3513 3516 pair != NULL; pair = nvlist_next_nvpair(innvl, pair)) {
3514 3517 char *snap_name;
3515 3518
3516 3519 /*
3517 3520 * Verify the snapshot argument.
3518 3521 */
3519 3522 if (nvpair_value_string(pair, &snap_name) != 0)
3520 3523 return (SET_ERROR(EINVAL));
3521 3524
3522 3525
3523 3526 /* Verify that the keys (bookmarks) are unique */
3524 3527 for (nvpair_t *pair2 = nvlist_next_nvpair(innvl, pair);
3525 3528 pair2 != NULL; pair2 = nvlist_next_nvpair(innvl, pair2)) {
3526 3529 if (strcmp(nvpair_name(pair), nvpair_name(pair2)) == 0)
3527 3530 return (SET_ERROR(EINVAL));
3528 3531 }
3529 3532 }
3530 3533
3531 3534 return (dsl_bookmark_create(innvl, outnvl));
3532 3535 }
3533 3536
3534 3537 /*
3535 3538 * innvl: {
3536 3539 * property 1, property 2, ...
3537 3540 * }
3538 3541 *
3539 3542 * outnvl: {
3540 3543 * bookmark name 1 -> { property 1, property 2, ... },
3541 3544 * bookmark name 2 -> { property 1, property 2, ... }
3542 3545 * }
3543 3546 *
3544 3547 */
3545 3548 static int
3546 3549 zfs_ioc_get_bookmarks(const char *fsname, nvlist_t *innvl, nvlist_t *outnvl)
3547 3550 {
3548 3551 return (dsl_get_bookmarks(fsname, innvl, outnvl));
3549 3552 }
3550 3553
3551 3554 /*
3552 3555 * innvl: {
3553 3556 * bookmark name 1, bookmark name 2
3554 3557 * }
3555 3558 *
3556 3559 * outnvl: bookmark -> error code (int32)
3557 3560 *
3558 3561 */
3559 3562 static int
3560 3563 zfs_ioc_destroy_bookmarks(const char *poolname, nvlist_t *innvl,
3561 3564 nvlist_t *outnvl)
3562 3565 {
3563 3566 int error, poollen;
3564 3567
3565 3568 poollen = strlen(poolname);
3566 3569 for (nvpair_t *pair = nvlist_next_nvpair(innvl, NULL);
3567 3570 pair != NULL; pair = nvlist_next_nvpair(innvl, pair)) {
3568 3571 const char *name = nvpair_name(pair);
3569 3572 const char *cp = strchr(name, '#');
3570 3573
3571 3574 /*
3572 3575 * The bookmark name must contain an #, and the part after it
3573 3576 * must contain only valid characters.
3574 3577 */
3575 3578 if (cp == NULL ||
3576 3579 zfs_component_namecheck(cp + 1, NULL, NULL) != 0)
3577 3580 return (SET_ERROR(EINVAL));
3578 3581
3579 3582 /*
3580 3583 * The bookmark must be in the specified pool.
3581 3584 */
3582 3585 if (strncmp(name, poolname, poollen) != 0 ||
3583 3586 (name[poollen] != '/' && name[poollen] != '#'))
3584 3587 return (SET_ERROR(EXDEV));
3585 3588 }
3586 3589
3587 3590 error = dsl_bookmark_destroy(innvl, outnvl);
3588 3591 return (error);
3589 3592 }
3590 3593
3591 3594 /*
3592 3595 * inputs:
3593 3596 * zc_name name of dataset to destroy
3594 3597 * zc_objset_type type of objset
3595 3598 * zc_defer_destroy mark for deferred destroy
3596 3599 *
3597 3600 * outputs: none
3598 3601 */
3599 3602 static int
3600 3603 zfs_ioc_destroy(zfs_cmd_t *zc)
3601 3604 {
3602 3605 int err;
3603 3606
3604 3607 if (zc->zc_objset_type == DMU_OST_ZFS) {
3605 3608 err = zfs_unmount_snap(zc->zc_name);
3606 3609 if (err != 0)
3607 3610 return (err);
3608 3611 }
3609 3612
3610 3613 if (strchr(zc->zc_name, '@'))
3611 3614 err = dsl_destroy_snapshot(zc->zc_name, zc->zc_defer_destroy);
3612 3615 else
3613 3616 err = dsl_destroy_head(zc->zc_name);
3614 3617 if (zc->zc_objset_type == DMU_OST_ZVOL && err == 0)
3615 3618 (void) zvol_remove_minor(zc->zc_name);
3616 3619 return (err);
3617 3620 }
3618 3621
3619 3622 /*
3620 3623 * fsname is name of dataset to rollback (to most recent snapshot)
3621 3624 *
3622 3625 * innvl is not used.
3623 3626 *
3624 3627 * outnvl: "target" -> name of most recent snapshot
3625 3628 * }
3626 3629 */
3627 3630 /* ARGSUSED */
3628 3631 static int
3629 3632 zfs_ioc_rollback(const char *fsname, nvlist_t *args, nvlist_t *outnvl)
3630 3633 {
3631 3634 zfsvfs_t *zfsvfs;
3632 3635 int error;
3633 3636
3634 3637 if (getzfsvfs(fsname, &zfsvfs) == 0) {
3635 3638 error = zfs_suspend_fs(zfsvfs);
3636 3639 if (error == 0) {
3637 3640 int resume_err;
3638 3641
3639 3642 error = dsl_dataset_rollback(fsname, zfsvfs, outnvl);
3640 3643 resume_err = zfs_resume_fs(zfsvfs, fsname);
3641 3644 error = error ? error : resume_err;
3642 3645 }
3643 3646 VFS_RELE(zfsvfs->z_vfs);
3644 3647 } else {
3645 3648 error = dsl_dataset_rollback(fsname, NULL, outnvl);
3646 3649 }
3647 3650 return (error);
3648 3651 }
3649 3652
3650 3653 static int
3651 3654 recursive_unmount(const char *fsname, void *arg)
3652 3655 {
3653 3656 const char *snapname = arg;
3654 3657 char fullname[MAXNAMELEN];
3655 3658
3656 3659 (void) snprintf(fullname, sizeof (fullname), "%s@%s", fsname, snapname);
3657 3660 return (zfs_unmount_snap(fullname));
3658 3661 }
3659 3662
3660 3663 /*
3661 3664 * inputs:
3662 3665 * zc_name old name of dataset
3663 3666 * zc_value new name of dataset
3664 3667 * zc_cookie recursive flag (only valid for snapshots)
3665 3668 *
3666 3669 * outputs: none
3667 3670 */
3668 3671 static int
3669 3672 zfs_ioc_rename(zfs_cmd_t *zc)
3670 3673 {
3671 3674 boolean_t recursive = zc->zc_cookie & 1;
3672 3675 char *at;
3673 3676
3674 3677 zc->zc_value[sizeof (zc->zc_value) - 1] = '\0';
3675 3678 if (dataset_namecheck(zc->zc_value, NULL, NULL) != 0 ||
3676 3679 strchr(zc->zc_value, '%'))
3677 3680 return (SET_ERROR(EINVAL));
3678 3681
3679 3682 at = strchr(zc->zc_name, '@');
3680 3683 if (at != NULL) {
3681 3684 /* snaps must be in same fs */
3682 3685 int error;
3683 3686
3684 3687 if (strncmp(zc->zc_name, zc->zc_value, at - zc->zc_name + 1))
3685 3688 return (SET_ERROR(EXDEV));
3686 3689 *at = '\0';
3687 3690 if (zc->zc_objset_type == DMU_OST_ZFS) {
3688 3691 error = dmu_objset_find(zc->zc_name,
3689 3692 recursive_unmount, at + 1,
3690 3693 recursive ? DS_FIND_CHILDREN : 0);
3691 3694 if (error != 0) {
3692 3695 *at = '@';
3693 3696 return (error);
3694 3697 }
3695 3698 }
3696 3699 error = dsl_dataset_rename_snapshot(zc->zc_name,
3697 3700 at + 1, strchr(zc->zc_value, '@') + 1, recursive);
3698 3701 *at = '@';
3699 3702
3700 3703 return (error);
3701 3704 } else {
3702 3705 if (zc->zc_objset_type == DMU_OST_ZVOL)
3703 3706 (void) zvol_remove_minor(zc->zc_name);
3704 3707 return (dsl_dir_rename(zc->zc_name, zc->zc_value));
3705 3708 }
3706 3709 }
3707 3710
3708 3711 static int
3709 3712 zfs_check_settable(const char *dsname, nvpair_t *pair, cred_t *cr)
3710 3713 {
3711 3714 const char *propname = nvpair_name(pair);
3712 3715 boolean_t issnap = (strchr(dsname, '@') != NULL);
3713 3716 zfs_prop_t prop = zfs_name_to_prop(propname);
3714 3717 uint64_t intval;
3715 3718 int err;
3716 3719
3717 3720 if (prop == ZPROP_INVAL) {
3718 3721 if (zfs_prop_user(propname)) {
3719 3722 if (err = zfs_secpolicy_write_perms(dsname,
3720 3723 ZFS_DELEG_PERM_USERPROP, cr))
3721 3724 return (err);
3722 3725 return (0);
3723 3726 }
3724 3727
3725 3728 if (!issnap && zfs_prop_userquota(propname)) {
3726 3729 const char *perm = NULL;
3727 3730 const char *uq_prefix =
3728 3731 zfs_userquota_prop_prefixes[ZFS_PROP_USERQUOTA];
3729 3732 const char *gq_prefix =
3730 3733 zfs_userquota_prop_prefixes[ZFS_PROP_GROUPQUOTA];
3731 3734
3732 3735 if (strncmp(propname, uq_prefix,
3733 3736 strlen(uq_prefix)) == 0) {
3734 3737 perm = ZFS_DELEG_PERM_USERQUOTA;
3735 3738 } else if (strncmp(propname, gq_prefix,
3736 3739 strlen(gq_prefix)) == 0) {
3737 3740 perm = ZFS_DELEG_PERM_GROUPQUOTA;
3738 3741 } else {
3739 3742 /* USERUSED and GROUPUSED are read-only */
3740 3743 return (SET_ERROR(EINVAL));
3741 3744 }
3742 3745
3743 3746 if (err = zfs_secpolicy_write_perms(dsname, perm, cr))
3744 3747 return (err);
3745 3748 return (0);
3746 3749 }
3747 3750
3748 3751 return (SET_ERROR(EINVAL));
3749 3752 }
3750 3753
3751 3754 if (issnap)
3752 3755 return (SET_ERROR(EINVAL));
3753 3756
3754 3757 if (nvpair_type(pair) == DATA_TYPE_NVLIST) {
3755 3758 /*
3756 3759 * dsl_prop_get_all_impl() returns properties in this
3757 3760 * format.
3758 3761 */
3759 3762 nvlist_t *attrs;
3760 3763 VERIFY(nvpair_value_nvlist(pair, &attrs) == 0);
3761 3764 VERIFY(nvlist_lookup_nvpair(attrs, ZPROP_VALUE,
3762 3765 &pair) == 0);
3763 3766 }
3764 3767
3765 3768 /*
3766 3769 * Check that this value is valid for this pool version
3767 3770 */
3768 3771 switch (prop) {
3769 3772 case ZFS_PROP_COMPRESSION:
3770 3773 /*
3771 3774 * If the user specified gzip compression, make sure
3772 3775 * the SPA supports it. We ignore any errors here since
3773 3776 * we'll catch them later.
3774 3777 */
3775 3778 if (nvpair_value_uint64(pair, &intval) == 0) {
3776 3779 if (intval >= ZIO_COMPRESS_GZIP_1 &&
3777 3780 intval <= ZIO_COMPRESS_GZIP_9 &&
3778 3781 zfs_earlier_version(dsname,
3779 3782 SPA_VERSION_GZIP_COMPRESSION)) {
3780 3783 return (SET_ERROR(ENOTSUP));
3781 3784 }
3782 3785
3783 3786 if (intval == ZIO_COMPRESS_ZLE &&
3784 3787 zfs_earlier_version(dsname,
3785 3788 SPA_VERSION_ZLE_COMPRESSION))
3786 3789 return (SET_ERROR(ENOTSUP));
3787 3790
3788 3791 if (intval == ZIO_COMPRESS_LZ4) {
3789 3792 spa_t *spa;
3790 3793
3791 3794 if ((err = spa_open(dsname, &spa, FTAG)) != 0)
3792 3795 return (err);
3793 3796
3794 3797 if (!spa_feature_is_enabled(spa,
3795 3798 SPA_FEATURE_LZ4_COMPRESS)) {
3796 3799 spa_close(spa, FTAG);
3797 3800 return (SET_ERROR(ENOTSUP));
3798 3801 }
3799 3802 spa_close(spa, FTAG);
3800 3803 }
3801 3804
3802 3805 /*
3803 3806 * If this is a bootable dataset then
3804 3807 * verify that the compression algorithm
3805 3808 * is supported for booting. We must return
3806 3809 * something other than ENOTSUP since it
3807 3810 * implies a downrev pool version.
3808 3811 */
3809 3812 if (zfs_is_bootfs(dsname) &&
3810 3813 !BOOTFS_COMPRESS_VALID(intval)) {
3811 3814 return (SET_ERROR(ERANGE));
3812 3815 }
3813 3816 }
3814 3817 break;
3815 3818
3816 3819 case ZFS_PROP_COPIES:
3817 3820 if (zfs_earlier_version(dsname, SPA_VERSION_DITTO_BLOCKS))
3818 3821 return (SET_ERROR(ENOTSUP));
3819 3822 break;
3820 3823
3821 3824 case ZFS_PROP_RECORDSIZE:
3822 3825 /* Record sizes above 128k need the feature to be enabled */
3823 3826 if (nvpair_value_uint64(pair, &intval) == 0 &&
3824 3827 intval > SPA_OLD_MAXBLOCKSIZE) {
3825 3828 spa_t *spa;
3826 3829
3827 3830 /*
3828 3831 * If this is a bootable dataset then
3829 3832 * the we don't allow large (>128K) blocks,
3830 3833 * because GRUB doesn't support them.
3831 3834 */
3832 3835 if (zfs_is_bootfs(dsname) &&
3833 3836 intval > SPA_OLD_MAXBLOCKSIZE) {
3834 3837 return (SET_ERROR(ERANGE));
3835 3838 }
3836 3839
3837 3840 /*
3838 3841 * We don't allow setting the property above 1MB,
3839 3842 * unless the tunable has been changed.
3840 3843 */
3841 3844 if (intval > zfs_max_recordsize ||
3842 3845 intval > SPA_MAXBLOCKSIZE)
3843 3846 return (SET_ERROR(ERANGE));
3844 3847
3845 3848 if ((err = spa_open(dsname, &spa, FTAG)) != 0)
3846 3849 return (err);
3847 3850
3848 3851 if (!spa_feature_is_enabled(spa,
3849 3852 SPA_FEATURE_LARGE_BLOCKS)) {
3850 3853 spa_close(spa, FTAG);
3851 3854 return (SET_ERROR(ENOTSUP));
3852 3855 }
3853 3856 spa_close(spa, FTAG);
3854 3857 }
3855 3858 break;
3856 3859
3857 3860 case ZFS_PROP_SHARESMB:
3858 3861 if (zpl_earlier_version(dsname, ZPL_VERSION_FUID))
3859 3862 return (SET_ERROR(ENOTSUP));
3860 3863 break;
3861 3864
3862 3865 case ZFS_PROP_ACLINHERIT:
3863 3866 if (nvpair_type(pair) == DATA_TYPE_UINT64 &&
3864 3867 nvpair_value_uint64(pair, &intval) == 0) {
3865 3868 if (intval == ZFS_ACL_PASSTHROUGH_X &&
3866 3869 zfs_earlier_version(dsname,
3867 3870 SPA_VERSION_PASSTHROUGH_X))
3868 3871 return (SET_ERROR(ENOTSUP));
3869 3872 }
3870 3873 break;
3871 3874
3872 3875 case ZFS_PROP_CHECKSUM:
3873 3876 case ZFS_PROP_DEDUP:
3874 3877 {
3875 3878 spa_feature_t feature;
3876 3879 spa_t *spa;
3877 3880
3878 3881 /* dedup feature version checks */
3879 3882 if (prop == ZFS_PROP_DEDUP &&
3880 3883 zfs_earlier_version(dsname, SPA_VERSION_DEDUP))
3881 3884 return (SET_ERROR(ENOTSUP));
3882 3885
3883 3886 if (nvpair_value_uint64(pair, &intval) != 0)
3884 3887 return (SET_ERROR(EINVAL));
3885 3888
3886 3889 /* check prop value is enabled in features */
3887 3890 feature = zio_checksum_to_feature(intval);
3888 3891 if (feature == SPA_FEATURE_NONE)
3889 3892 break;
3890 3893
3891 3894 if ((err = spa_open(dsname, &spa, FTAG)) != 0)
3892 3895 return (err);
3893 3896 /*
3894 3897 * Salted checksums are not supported on root pools.
3895 3898 */
3896 3899 if (spa_bootfs(spa) != 0 &&
3897 3900 intval < ZIO_CHECKSUM_FUNCTIONS &&
3898 3901 (zio_checksum_table[intval].ci_flags &
3899 3902 ZCHECKSUM_FLAG_SALTED)) {
3900 3903 spa_close(spa, FTAG);
3901 3904 return (SET_ERROR(ERANGE));
3902 3905 }
3903 3906 if (!spa_feature_is_enabled(spa, feature)) {
3904 3907 spa_close(spa, FTAG);
3905 3908 return (SET_ERROR(ENOTSUP));
3906 3909 }
3907 3910 spa_close(spa, FTAG);
3908 3911 break;
3909 3912 }
3910 3913 }
3911 3914
3912 3915 return (zfs_secpolicy_setprop(dsname, prop, pair, CRED()));
3913 3916 }
3914 3917
3915 3918 /*
3916 3919 * Checks for a race condition to make sure we don't increment a feature flag
3917 3920 * multiple times.
3918 3921 */
3919 3922 static int
3920 3923 zfs_prop_activate_feature_check(void *arg, dmu_tx_t *tx)
3921 3924 {
3922 3925 spa_t *spa = dmu_tx_pool(tx)->dp_spa;
3923 3926 spa_feature_t *featurep = arg;
3924 3927
3925 3928 if (!spa_feature_is_active(spa, *featurep))
3926 3929 return (0);
3927 3930 else
3928 3931 return (SET_ERROR(EBUSY));
3929 3932 }
3930 3933
3931 3934 /*
3932 3935 * The callback invoked on feature activation in the sync task caused by
3933 3936 * zfs_prop_activate_feature.
3934 3937 */
3935 3938 static void
3936 3939 zfs_prop_activate_feature_sync(void *arg, dmu_tx_t *tx)
3937 3940 {
3938 3941 spa_t *spa = dmu_tx_pool(tx)->dp_spa;
3939 3942 spa_feature_t *featurep = arg;
3940 3943
3941 3944 spa_feature_incr(spa, *featurep, tx);
3942 3945 }
3943 3946
3944 3947 /*
3945 3948 * Activates a feature on a pool in response to a property setting. This
3946 3949 * creates a new sync task which modifies the pool to reflect the feature
3947 3950 * as being active.
3948 3951 */
3949 3952 static int
3950 3953 zfs_prop_activate_feature(spa_t *spa, spa_feature_t feature)
3951 3954 {
3952 3955 int err;
3953 3956
3954 3957 /* EBUSY here indicates that the feature is already active */
3955 3958 err = dsl_sync_task(spa_name(spa),
3956 3959 zfs_prop_activate_feature_check, zfs_prop_activate_feature_sync,
3957 3960 &feature, 2, ZFS_SPACE_CHECK_RESERVED);
3958 3961
3959 3962 if (err != 0 && err != EBUSY)
3960 3963 return (err);
3961 3964 else
3962 3965 return (0);
3963 3966 }
3964 3967
3965 3968 /*
3966 3969 * Removes properties from the given props list that fail permission checks
3967 3970 * needed to clear them and to restore them in case of a receive error. For each
3968 3971 * property, make sure we have both set and inherit permissions.
3969 3972 *
3970 3973 * Returns the first error encountered if any permission checks fail. If the
3971 3974 * caller provides a non-NULL errlist, it also gives the complete list of names
3972 3975 * of all the properties that failed a permission check along with the
3973 3976 * corresponding error numbers. The caller is responsible for freeing the
3974 3977 * returned errlist.
3975 3978 *
3976 3979 * If every property checks out successfully, zero is returned and the list
3977 3980 * pointed at by errlist is NULL.
3978 3981 */
3979 3982 static int
3980 3983 zfs_check_clearable(char *dataset, nvlist_t *props, nvlist_t **errlist)
3981 3984 {
3982 3985 zfs_cmd_t *zc;
3983 3986 nvpair_t *pair, *next_pair;
3984 3987 nvlist_t *errors;
3985 3988 int err, rv = 0;
3986 3989
3987 3990 if (props == NULL)
3988 3991 return (0);
3989 3992
3990 3993 VERIFY(nvlist_alloc(&errors, NV_UNIQUE_NAME, KM_SLEEP) == 0);
3991 3994
3992 3995 zc = kmem_alloc(sizeof (zfs_cmd_t), KM_SLEEP);
3993 3996 (void) strcpy(zc->zc_name, dataset);
3994 3997 pair = nvlist_next_nvpair(props, NULL);
3995 3998 while (pair != NULL) {
3996 3999 next_pair = nvlist_next_nvpair(props, pair);
3997 4000
3998 4001 (void) strcpy(zc->zc_value, nvpair_name(pair));
3999 4002 if ((err = zfs_check_settable(dataset, pair, CRED())) != 0 ||
4000 4003 (err = zfs_secpolicy_inherit_prop(zc, NULL, CRED())) != 0) {
4001 4004 VERIFY(nvlist_remove_nvpair(props, pair) == 0);
4002 4005 VERIFY(nvlist_add_int32(errors,
4003 4006 zc->zc_value, err) == 0);
4004 4007 }
4005 4008 pair = next_pair;
4006 4009 }
4007 4010 kmem_free(zc, sizeof (zfs_cmd_t));
4008 4011
4009 4012 if ((pair = nvlist_next_nvpair(errors, NULL)) == NULL) {
4010 4013 nvlist_free(errors);
4011 4014 errors = NULL;
4012 4015 } else {
4013 4016 VERIFY(nvpair_value_int32(pair, &rv) == 0);
4014 4017 }
4015 4018
4016 4019 if (errlist == NULL)
4017 4020 nvlist_free(errors);
4018 4021 else
4019 4022 *errlist = errors;
4020 4023
4021 4024 return (rv);
4022 4025 }
4023 4026
4024 4027 static boolean_t
4025 4028 propval_equals(nvpair_t *p1, nvpair_t *p2)
4026 4029 {
4027 4030 if (nvpair_type(p1) == DATA_TYPE_NVLIST) {
4028 4031 /* dsl_prop_get_all_impl() format */
4029 4032 nvlist_t *attrs;
4030 4033 VERIFY(nvpair_value_nvlist(p1, &attrs) == 0);
4031 4034 VERIFY(nvlist_lookup_nvpair(attrs, ZPROP_VALUE,
4032 4035 &p1) == 0);
4033 4036 }
4034 4037
4035 4038 if (nvpair_type(p2) == DATA_TYPE_NVLIST) {
4036 4039 nvlist_t *attrs;
4037 4040 VERIFY(nvpair_value_nvlist(p2, &attrs) == 0);
4038 4041 VERIFY(nvlist_lookup_nvpair(attrs, ZPROP_VALUE,
4039 4042 &p2) == 0);
4040 4043 }
4041 4044
4042 4045 if (nvpair_type(p1) != nvpair_type(p2))
4043 4046 return (B_FALSE);
4044 4047
4045 4048 if (nvpair_type(p1) == DATA_TYPE_STRING) {
4046 4049 char *valstr1, *valstr2;
4047 4050
4048 4051 VERIFY(nvpair_value_string(p1, (char **)&valstr1) == 0);
4049 4052 VERIFY(nvpair_value_string(p2, (char **)&valstr2) == 0);
4050 4053 return (strcmp(valstr1, valstr2) == 0);
4051 4054 } else {
4052 4055 uint64_t intval1, intval2;
4053 4056
4054 4057 VERIFY(nvpair_value_uint64(p1, &intval1) == 0);
4055 4058 VERIFY(nvpair_value_uint64(p2, &intval2) == 0);
4056 4059 return (intval1 == intval2);
4057 4060 }
4058 4061 }
4059 4062
4060 4063 /*
4061 4064 * Remove properties from props if they are not going to change (as determined
4062 4065 * by comparison with origprops). Remove them from origprops as well, since we
4063 4066 * do not need to clear or restore properties that won't change.
4064 4067 */
4065 4068 static void
4066 4069 props_reduce(nvlist_t *props, nvlist_t *origprops)
4067 4070 {
4068 4071 nvpair_t *pair, *next_pair;
4069 4072
4070 4073 if (origprops == NULL)
4071 4074 return; /* all props need to be received */
4072 4075
4073 4076 pair = nvlist_next_nvpair(props, NULL);
4074 4077 while (pair != NULL) {
4075 4078 const char *propname = nvpair_name(pair);
4076 4079 nvpair_t *match;
4077 4080
4078 4081 next_pair = nvlist_next_nvpair(props, pair);
4079 4082
4080 4083 if ((nvlist_lookup_nvpair(origprops, propname,
4081 4084 &match) != 0) || !propval_equals(pair, match))
4082 4085 goto next; /* need to set received value */
4083 4086
4084 4087 /* don't clear the existing received value */
4085 4088 (void) nvlist_remove_nvpair(origprops, match);
4086 4089 /* don't bother receiving the property */
4087 4090 (void) nvlist_remove_nvpair(props, pair);
4088 4091 next:
4089 4092 pair = next_pair;
4090 4093 }
4091 4094 }
4092 4095
4093 4096 #ifdef DEBUG
4094 4097 static boolean_t zfs_ioc_recv_inject_err;
4095 4098 #endif
4096 4099
4097 4100 /*
 * Receive a send stream into a new snapshot, optionally replacing the
 * dataset's received properties with the ones supplied by the caller.
 * If the receive fails, an attempt is made to put the original received
 * properties back.
 *
4098 4101 * inputs:
4099 4102 * zc_name name of containing filesystem
4100 4103 * zc_nvlist_src{_size} nvlist of properties to apply
4101 4104 * zc_value name of snapshot to create
4102 4105 * zc_string name of clone origin (if DRR_FLAG_CLONE)
4103 4106 * zc_cookie file descriptor to recv from
4104 4107 * zc_begin_record the BEGIN record of the stream (not byteswapped)
4105 4108 * zc_guid force flag
4106 4109 * zc_cleanup_fd cleanup-on-exit file descriptor
4107 4110 * zc_action_handle handle for this guid/ds mapping (or zero on first call)
4108 4111 * zc_resumable if data is incomplete assume sender will resume
4109 4112 *
4110 4113 * outputs:
4111 4114 * zc_cookie number of bytes read
4112 4115 * zc_nvlist_dst{_size} error for each unapplied received property
4113 4116 * zc_obj zprop_errflags_t
4114 4117 * zc_action_handle handle for this guid/ds mapping
4115 4118 */
4116 4119 static int
4117 4120 zfs_ioc_recv(zfs_cmd_t *zc)
4118 4121 {
4119 4122 file_t *fp;
4120 4123 dmu_recv_cookie_t drc;
4121 4124 boolean_t force = (boolean_t)zc->zc_guid;
4122 4125 int fd;
4123 4126 int error = 0;
4124 4127 int props_error = 0;
4125 4128 nvlist_t *errors;
4126 4129 offset_t off;
4127 4130 nvlist_t *props = NULL; /* sent properties */
4128 4131 nvlist_t *origprops = NULL; /* existing properties */
4129 4132 char *origin = NULL;
4130 4133 char *tosnap;
4131 4134 char tofs[ZFS_MAXNAMELEN];
4132 4135 boolean_t first_recvd_props = B_FALSE;
4133 4136
/* zc_value must be a valid "fs@snap" name that does not contain '%'. */
4134 4137 if (dataset_namecheck(zc->zc_value, NULL, NULL) != 0 ||
4135 4138 strchr(zc->zc_value, '@') == NULL ||
4136 4139 strchr(zc->zc_value, '%'))
4137 4140 return (SET_ERROR(EINVAL));
4138 4141
/* Split the name at '@' into the filesystem (tofs) and snapshot (tosnap). */
4139 4142 (void) strcpy(tofs, zc->zc_value);
4140 4143 tosnap = strchr(tofs, '@');
4141 4144 *tosnap++ = '\0';
4142 4145
4143 4146 if (zc->zc_nvlist_src != NULL &&
4144 4147 (error = get_nvlist(zc->zc_nvlist_src, zc->zc_nvlist_src_size,
4145 4148 zc->zc_iflags, &props)) != 0)
4146 4149 return (error);
4147 4150
/* Hold the stream's file descriptor; it is released at "out". */
4148 4151 fd = zc->zc_cookie;
4149 4152 fp = getf(fd);
4150 4153 if (fp == NULL) {
4151 4154 nvlist_free(props);
4152 4155 return (SET_ERROR(EBADF));
4153 4156 }
4154 4157
/* Collects per-property errors; copied out through zc_nvlist_dst below. */
4155 4158 errors = fnvlist_alloc();
4156 4159
/* A non-empty zc_string names the clone origin. */
4157 4160 if (zc->zc_string[0])
4158 4161 origin = zc->zc_string;
4159 4162
4160 4163 error = dmu_recv_begin(tofs, tosnap,
4161 4164 &zc->zc_begin_record, force, zc->zc_resumable, origin, &drc);
4162 4165 if (error != 0)
4163 4166 goto out;
4164 4167
4165 4168 /*
4166 4169 * Set properties before we receive the stream so that they are applied
4167 4170 * to the new data. Note that we must call dmu_recv_stream() if
4168 4171 * dmu_recv_begin() succeeds.
4169 4172 */
4170 4173 if (props != NULL && !drc.drc_newfs) {
4171 4174 if (spa_version(dsl_dataset_get_spa(drc.drc_ds)) >=
4172 4175 SPA_VERSION_RECVD_PROPS &&
4173 4176 !dsl_prop_get_hasrecvd(tofs))
4174 4177 first_recvd_props = B_TRUE;
4175 4178
4176 4179 /*
4177 4180 * If new received properties are supplied, they are to
4178 4181 * completely replace the existing received properties, so stash
4179 4182 * away the existing ones.
4180 4183 */
4181 4184 if (dsl_prop_get_received(tofs, &origprops) == 0) {
4182 4185 nvlist_t *errlist = NULL;
4183 4186 /*
4184 4187 * Don't bother writing a property if its value won't
4185 4188 * change (and avoid the unnecessary security checks).
4186 4189 *
4187 4190 * The first receive after SPA_VERSION_RECVD_PROPS is a
4188 4191 * special case where we blow away all local properties
4189 4192 * regardless.
4190 4193 */
4191 4194 if (!first_recvd_props)
4192 4195 props_reduce(props, origprops);
/* Properties we may not clear are dropped from origprops and reported. */
4193 4196 if (zfs_check_clearable(tofs, origprops, &errlist) != 0)
4194 4197 (void) nvlist_merge(errors, errlist, 0);
4195 4198 nvlist_free(errlist);
4196 4199
4197 4200 if (clear_received_props(tofs, origprops,
4198 4201 first_recvd_props ? NULL : props) != 0)
4199 4202 zc->zc_obj |= ZPROP_ERR_NOCLEAR;
4200 4203 } else {
/* Could not read the existing received properties. */
4201 4204 zc->zc_obj |= ZPROP_ERR_NOCLEAR;
4202 4205 }
4203 4206 }
4204 4207
/* Apply the sent properties only if dsl_prop_set_hasrecvd() succeeded. */
4205 4208 if (props != NULL) {
4206 4209 props_error = dsl_prop_set_hasrecvd(tofs);
4207 4210
4208 4211 if (props_error == 0) {
4209 4212 (void) zfs_set_prop_nvlist(tofs, ZPROP_SRC_RECEIVED,
4210 4213 props, errors);
4211 4214 }
4212 4215 }
4213 4216
/* Hand the property errors back when a destination buffer was supplied. */
4214 4217 if (zc->zc_nvlist_dst_size != 0 &&
4215 4218 (nvlist_smush(errors, zc->zc_nvlist_dst_size) != 0 ||
4216 4219 put_nvlist(zc, errors) != 0)) {
4217 4220 /*
4218 4221 * Caller made zc->zc_nvlist_dst less than the minimum expected
4219 4222 * size or supplied an invalid address.
4220 4223 */
4221 4224 props_error = SET_ERROR(EINVAL);
4222 4225 }
4223 4226
/* Receive starting at the file's current offset. */
4224 4227 off = fp->f_offset;
4225 4228 error = dmu_recv_stream(&drc, fp->f_vnode, &off, zc->zc_cleanup_fd,
4226 4229 &zc->zc_action_handle);
4227 4230
4228 4231 if (error == 0) {
4229 4232 zfsvfs_t *zfsvfs = NULL;
4230 4233
4231 4234 if (getzfsvfs(tofs, &zfsvfs) == 0) {
4232 4235 /* online recv */
4233 4236 int end_err;
4234 4237
4235 4238 error = zfs_suspend_fs(zfsvfs);
4236 4239 /*
4237 4240 * If the suspend fails, then the recv_end will
4238 4241 * likely also fail, and clean up after itself.
4239 4242 */
4240 4243 end_err = dmu_recv_end(&drc, zfsvfs);
4241 4244 if (error == 0)
4242 4245 error = zfs_resume_fs(zfsvfs, tofs);
/* A suspend/resume error takes precedence over the recv_end error. */
4243 4246 error = error ? error : end_err;
4244 4247 VFS_RELE(zfsvfs->z_vfs);
4245 4248 } else {
4246 4249 error = dmu_recv_end(&drc, NULL);
4247 4250 }
4248 4251 }
4249 4252
/* Report how far "off" advanced, then seek the file to the new offset. */
4250 4253 zc->zc_cookie = off - fp->f_offset;
4251 4254 if (VOP_SEEK(fp->f_vnode, fp->f_offset, &off, NULL) == 0)
4252 4255 fp->f_offset = off;
4253 4256
4254 4257 #ifdef DEBUG
/* One-shot debug hook: force the error path below, then disarm itself. */
4255 4258 if (zfs_ioc_recv_inject_err) {
4256 4259 zfs_ioc_recv_inject_err = B_FALSE;
4257 4260 error = 1;
4258 4261 }
4259 4262 #endif
4260 4263 /*
4261 4264 * On error, restore the original props.
4262 4265 */
4263 4266 if (error != 0 && props != NULL && !drc.drc_newfs) {
4264 4267 if (clear_received_props(tofs, props, NULL) != 0) {
4265 4268 /*
4266 4269 * We failed to clear the received properties.
4267 4270 * Since we may have left a $recvd value on the
4268 4271 * system, we can't clear the $hasrecvd flag.
4269 4272 */
4270 4273 zc->zc_obj |= ZPROP_ERR_NORESTORE;
4271 4274 } else if (first_recvd_props) {
4272 4275 dsl_prop_unset_hasrecvd(tofs);
4273 4276 }
4274 4277
4275 4278 if (origprops == NULL && !drc.drc_newfs) {
4276 4279 /* We failed to stash the original properties. */
4277 4280 zc->zc_obj |= ZPROP_ERR_NORESTORE;
4278 4281 }
4279 4282
4280 4283 /*
4281 4284 * dsl_props_set() will not convert RECEIVED to LOCAL on or
4282 4285 * after SPA_VERSION_RECVD_PROPS, so we need to specify LOCAL
4283 4286 * explicitly if we're restoring local properties cleared in the
4284 4287 * first new-style receive.
4285 4288 */
4286 4289 if (origprops != NULL &&
4287 4290 zfs_set_prop_nvlist(tofs, (first_recvd_props ?
4288 4291 ZPROP_SRC_LOCAL : ZPROP_SRC_RECEIVED),
4289 4292 origprops, NULL) != 0) {
4290 4293 /*
4291 4294 * We stashed the original properties but failed to
4292 4295 * restore them.
4293 4296 */
4294 4297 zc->zc_obj |= ZPROP_ERR_NORESTORE;
4295 4298 }
4296 4299 }
4297 4300 out:
4298 4301 nvlist_free(props);
4299 4302 nvlist_free(origprops);
4300 4303 nvlist_free(errors);
4301 4304 releasef(fd);
4302 4305
/* A property error is reported only when the receive itself succeeded. */
4303 4306 if (error == 0)
4304 4307 error = props_error;
4305 4308
4306 4309 return (error);
4307 4310 }
4308 4311
4309 4312 /*
4310 4313 * inputs:
4311 4314 * zc_name name of snapshot to send
4312 4315 * zc_cookie file descriptor to send stream to
4313 4316 * zc_obj fromorigin flag (mutually exclusive with zc_fromobj)
4314 4317 * zc_sendobj objsetid of snapshot to send
4315 4318 * zc_fromobj objsetid of incremental fromsnap (may be zero)
4316 4319 * zc_guid if set, estimate size of stream only. zc_cookie is ignored.
4317 4320 * output size in zc_objset_type.
4318 4321 * zc_flags lzc_send_flags
4319 4322 *
4320 4323 * outputs:
4321 4324 * zc_objset_type estimated size, if zc_guid is set
4322 4325 */
4323 4326 static int
4324 4327 zfs_ioc_send(zfs_cmd_t *zc)
4325 4328 {
4326 4329 int error;
4327 4330 offset_t off;
4328 4331 boolean_t estimate = (zc->zc_guid != 0);
4329 4332 boolean_t embedok = (zc->zc_flags & 0x1);
4330 4333 boolean_t large_block_ok = (zc->zc_flags & 0x2);
4331 4334
4332 4335 if (zc->zc_obj != 0) {
4333 4336 dsl_pool_t *dp;
4334 4337 dsl_dataset_t *tosnap;
4335 4338
4336 4339 error = dsl_pool_hold(zc->zc_name, FTAG, &dp);
4337 4340 if (error != 0)
4338 4341 return (error);
4339 4342
4340 4343 error = dsl_dataset_hold_obj(dp, zc->zc_sendobj, FTAG, &tosnap);
4341 4344 if (error != 0) {
4342 4345 dsl_pool_rele(dp, FTAG);
4343 4346 return (error);
4344 4347 }
4345 4348
4346 4349 if (dsl_dir_is_clone(tosnap->ds_dir))
4347 4350 zc->zc_fromobj =
4348 4351 dsl_dir_phys(tosnap->ds_dir)->dd_origin_obj;
4349 4352 dsl_dataset_rele(tosnap, FTAG);
4350 4353 dsl_pool_rele(dp, FTAG);
4351 4354 }
4352 4355
4353 4356 if (estimate) {
4354 4357 dsl_pool_t *dp;
4355 4358 dsl_dataset_t *tosnap;
4356 4359 dsl_dataset_t *fromsnap = NULL;
4357 4360
4358 4361 error = dsl_pool_hold(zc->zc_name, FTAG, &dp);
4359 4362 if (error != 0)
4360 4363 return (error);
4361 4364
4362 4365 error = dsl_dataset_hold_obj(dp, zc->zc_sendobj, FTAG, &tosnap);
4363 4366 if (error != 0) {
4364 4367 dsl_pool_rele(dp, FTAG);
4365 4368 return (error);
4366 4369 }
4367 4370
4368 4371 if (zc->zc_fromobj != 0) {
4369 4372 error = dsl_dataset_hold_obj(dp, zc->zc_fromobj,
4370 4373 FTAG, &fromsnap);
4371 4374 if (error != 0) {
4372 4375 dsl_dataset_rele(tosnap, FTAG);
4373 4376 dsl_pool_rele(dp, FTAG);
4374 4377 return (error);
4375 4378 }
4376 4379 }
4377 4380
4378 4381 error = dmu_send_estimate(tosnap, fromsnap,
4379 4382 &zc->zc_objset_type);
4380 4383
4381 4384 if (fromsnap != NULL)
4382 4385 dsl_dataset_rele(fromsnap, FTAG);
4383 4386 dsl_dataset_rele(tosnap, FTAG);
4384 4387 dsl_pool_rele(dp, FTAG);
4385 4388 } else {
4386 4389 file_t *fp = getf(zc->zc_cookie);
4387 4390 if (fp == NULL)
4388 4391 return (SET_ERROR(EBADF));
4389 4392
4390 4393 off = fp->f_offset;
4391 4394 error = dmu_send_obj(zc->zc_name, zc->zc_sendobj,
4392 4395 zc->zc_fromobj, embedok, large_block_ok,
4393 4396 zc->zc_cookie, fp->f_vnode, &off);
4394 4397
4395 4398 if (VOP_SEEK(fp->f_vnode, fp->f_offset, &off, NULL) == 0)
4396 4399 fp->f_offset = off;
4397 4400 releasef(zc->zc_cookie);
4398 4401 }
4399 4402 return (error);
4400 4403 }
4401 4404
4402 4405 /*
4403 4406 * inputs:
4404 4407 * zc_name name of snapshot on which to report progress
4405 4408 * zc_cookie file descriptor of send stream
4406 4409 *
4407 4410 * outputs:
4408 4411 * zc_cookie number of bytes written in send stream thus far
4409 4412 */
4410 4413 static int
4411 4414 zfs_ioc_send_progress(zfs_cmd_t *zc)
4412 4415 {
4413 4416 dsl_pool_t *dp;
4414 4417 dsl_dataset_t *ds;
4415 4418 dmu_sendarg_t *dsp = NULL;
4416 4419 int error;
4417 4420
4418 4421 error = dsl_pool_hold(zc->zc_name, FTAG, &dp);
4419 4422 if (error != 0)
4420 4423 return (error);
4421 4424
4422 4425 error = dsl_dataset_hold(dp, zc->zc_name, FTAG, &ds);
4423 4426 if (error != 0) {
4424 4427 dsl_pool_rele(dp, FTAG);
4425 4428 return (error);
4426 4429 }
4427 4430
4428 4431 mutex_enter(&ds->ds_sendstream_lock);
4429 4432
4430 4433 /*
4431 4434 * Iterate over all the send streams currently active on this dataset.
4432 4435 * If there's one which matches the specified file descriptor _and_ the
4433 4436 * stream was started by the current process, return the progress of
4434 4437 * that stream.
4435 4438 */
4436 4439 for (dsp = list_head(&ds->ds_sendstreams); dsp != NULL;
4437 4440 dsp = list_next(&ds->ds_sendstreams, dsp)) {
4438 4441 if (dsp->dsa_outfd == zc->zc_cookie &&
4439 4442 dsp->dsa_proc == curproc)
4440 4443 break;
4441 4444 }
4442 4445
4443 4446 if (dsp != NULL)
4444 4447 zc->zc_cookie = *(dsp->dsa_off);
4445 4448 else
4446 4449 error = SET_ERROR(ENOENT);
4447 4450
4448 4451 mutex_exit(&ds->ds_sendstream_lock);
4449 4452 dsl_dataset_rele(ds, FTAG);
4450 4453 dsl_pool_rele(dp, FTAG);
4451 4454 return (error);
4452 4455 }
4453 4456
4454 4457 static int
4455 4458 zfs_ioc_inject_fault(zfs_cmd_t *zc)
4456 4459 {
4457 4460 int id, error;
4458 4461
4459 4462 error = zio_inject_fault(zc->zc_name, (int)zc->zc_guid, &id,
4460 4463 &zc->zc_inject_record);
4461 4464
4462 4465 if (error == 0)
4463 4466 zc->zc_guid = (uint64_t)id;
4464 4467
4465 4468 return (error);
4466 4469 }
4467 4470
4468 4471 static int
4469 4472 zfs_ioc_clear_fault(zfs_cmd_t *zc)
4470 4473 {
4471 4474 return (zio_clear_fault((int)zc->zc_guid));
4472 4475 }
4473 4476
4474 4477 static int
4475 4478 zfs_ioc_inject_list_next(zfs_cmd_t *zc)
4476 4479 {
4477 4480 int id = (int)zc->zc_guid;
4478 4481 int error;
4479 4482
4480 4483 error = zio_inject_list_next(&id, zc->zc_name, sizeof (zc->zc_name),
4481 4484 &zc->zc_inject_record);
4482 4485
4483 4486 zc->zc_guid = id;
4484 4487
4485 4488 return (error);
4486 4489 }
4487 4490
4488 4491 static int
4489 4492 zfs_ioc_error_log(zfs_cmd_t *zc)
4490 4493 {
4491 4494 spa_t *spa;
4492 4495 int error;
4493 4496 size_t count = (size_t)zc->zc_nvlist_dst_size;
4494 4497
4495 4498 if ((error = spa_open(zc->zc_name, &spa, FTAG)) != 0)
4496 4499 return (error);
4497 4500
4498 4501 error = spa_get_errlog(spa, (void *)(uintptr_t)zc->zc_nvlist_dst,
4499 4502 &count);
4500 4503 if (error == 0)
4501 4504 zc->zc_nvlist_dst_size = count;
4502 4505 else
4503 4506 zc->zc_nvlist_dst_size = spa_get_errlog_size(spa);
4504 4507
4505 4508 spa_close(spa, FTAG);
4506 4509
4507 4510 return (error);
4508 4511 }
4509 4512
4510 4513 static int
4511 4514 zfs_ioc_clear(zfs_cmd_t *zc)
4512 4515 {
4513 4516 spa_t *spa;
4514 4517 vdev_t *vd;
4515 4518 int error;
4516 4519
4517 4520 /*
4518 4521 * On zpool clear we also fix up missing slogs
4519 4522 */
4520 4523 mutex_enter(&spa_namespace_lock);
4521 4524 spa = spa_lookup(zc->zc_name);
4522 4525 if (spa == NULL) {
4523 4526 mutex_exit(&spa_namespace_lock);
4524 4527 return (SET_ERROR(EIO));
4525 4528 }
4526 4529 if (spa_get_log_state(spa) == SPA_LOG_MISSING) {
4527 4530 /* we need to let spa_open/spa_load clear the chains */
4528 4531 spa_set_log_state(spa, SPA_LOG_CLEAR);
4529 4532 }
4530 4533 spa->spa_last_open_failed = 0;
4531 4534 mutex_exit(&spa_namespace_lock);
4532 4535
4533 4536 if (zc->zc_cookie & ZPOOL_NO_REWIND) {
4534 4537 error = spa_open(zc->zc_name, &spa, FTAG);
4535 4538 } else {
4536 4539 nvlist_t *policy;
4537 4540 nvlist_t *config = NULL;
4538 4541
4539 4542 if (zc->zc_nvlist_src == NULL)
4540 4543 return (SET_ERROR(EINVAL));
4541 4544
4542 4545 if ((error = get_nvlist(zc->zc_nvlist_src,
4543 4546 zc->zc_nvlist_src_size, zc->zc_iflags, &policy)) == 0) {
4544 4547 error = spa_open_rewind(zc->zc_name, &spa, FTAG,
4545 4548 policy, &config);
4546 4549 if (config != NULL) {
4547 4550 int err;
4548 4551
4549 4552 if ((err = put_nvlist(zc, config)) != 0)
4550 4553 error = err;
4551 4554 nvlist_free(config);
4552 4555 }
4553 4556 nvlist_free(policy);
4554 4557 }
4555 4558 }
4556 4559
4557 4560 if (error != 0)
4558 4561 return (error);
4559 4562
4560 4563 spa_vdev_state_enter(spa, SCL_NONE);
4561 4564
4562 4565 if (zc->zc_guid == 0) {
4563 4566 vd = NULL;
4564 4567 } else {
4565 4568 vd = spa_lookup_by_guid(spa, zc->zc_guid, B_TRUE);
4566 4569 if (vd == NULL) {
4567 4570 (void) spa_vdev_state_exit(spa, NULL, ENODEV);
4568 4571 spa_close(spa, FTAG);
4569 4572 return (SET_ERROR(ENODEV));
4570 4573 }
4571 4574 }
4572 4575
4573 4576 vdev_clear(spa, vd);
4574 4577
4575 4578 (void) spa_vdev_state_exit(spa, NULL, 0);
4576 4579
4577 4580 /*
4578 4581 * Resume any suspended I/Os.
4579 4582 */
4580 4583 if (zio_resume(spa) != 0)
4581 4584 error = SET_ERROR(EIO);
4582 4585
4583 4586 spa_close(spa, FTAG);
4584 4587
4585 4588 return (error);
4586 4589 }
4587 4590
4588 4591 static int
4589 4592 zfs_ioc_pool_reopen(zfs_cmd_t *zc)
4590 4593 {
4591 4594 spa_t *spa;
4592 4595 int error;
4593 4596
4594 4597 error = spa_open(zc->zc_name, &spa, FTAG);
4595 4598 if (error != 0)
4596 4599 return (error);
4597 4600
4598 4601 spa_vdev_state_enter(spa, SCL_NONE);
4599 4602
4600 4603 /*
4601 4604 * If a resilver is already in progress then set the
4602 4605 * spa_scrub_reopen flag to B_TRUE so that we don't restart
4603 4606 * the scan as a side effect of the reopen. Otherwise, let
4604 4607 * vdev_open() decided if a resilver is required.
4605 4608 */
4606 4609 spa->spa_scrub_reopen = dsl_scan_resilvering(spa->spa_dsl_pool);
4607 4610 vdev_reopen(spa->spa_root_vdev);
4608 4611 spa->spa_scrub_reopen = B_FALSE;
4609 4612
4610 4613 (void) spa_vdev_state_exit(spa, NULL, 0);
4611 4614 spa_close(spa, FTAG);
4612 4615 return (0);
4613 4616 }
4614 4617 /*
4615 4618 * inputs:
4616 4619 * zc_name name of filesystem
4617 4620 * zc_value name of origin snapshot
4618 4621 *
4619 4622 * outputs:
4620 4623 * zc_string name of conflicting snapshot, if there is one
4621 4624 */
4622 4625 static int
4623 4626 zfs_ioc_promote(zfs_cmd_t *zc)
4624 4627 {
4625 4628 char *cp;
4626 4629
4627 4630 /*
4628 4631 * We don't need to unmount *all* the origin fs's snapshots, but
4629 4632 * it's easier.
4630 4633 */
4631 4634 cp = strchr(zc->zc_value, '@');
4632 4635 if (cp)
4633 4636 *cp = '\0';
4634 4637 (void) dmu_objset_find(zc->zc_value,
4635 4638 zfs_unmount_snap_cb, NULL, DS_FIND_SNAPSHOTS);
4636 4639 return (dsl_dataset_promote(zc->zc_name, zc->zc_string));
4637 4640 }
4638 4641
4639 4642 /*
4640 4643 * Retrieve a single {user|group}{used|quota}@... property.
4641 4644 *
4642 4645 * inputs:
4643 4646 * zc_name name of filesystem
4644 4647 * zc_objset_type zfs_userquota_prop_t
4645 4648 * zc_value domain name (eg. "S-1-234-567-89")
4646 4649 * zc_guid RID/UID/GID
4647 4650 *
4648 4651 * outputs:
4649 4652 * zc_cookie property value
4650 4653 */
4651 4654 static int
4652 4655 zfs_ioc_userspace_one(zfs_cmd_t *zc)
4653 4656 {
4654 4657 zfsvfs_t *zfsvfs;
4655 4658 int error;
4656 4659
4657 4660 if (zc->zc_objset_type >= ZFS_NUM_USERQUOTA_PROPS)
4658 4661 return (SET_ERROR(EINVAL));
4659 4662
4660 4663 error = zfsvfs_hold(zc->zc_name, FTAG, &zfsvfs, B_FALSE);
4661 4664 if (error != 0)
4662 4665 return (error);
4663 4666
4664 4667 error = zfs_userspace_one(zfsvfs,
4665 4668 zc->zc_objset_type, zc->zc_value, zc->zc_guid, &zc->zc_cookie);
4666 4669 zfsvfs_rele(zfsvfs, FTAG);
4667 4670
4668 4671 return (error);
4669 4672 }
4670 4673
4671 4674 /*
4672 4675 * inputs:
4673 4676 * zc_name name of filesystem
4674 4677 * zc_cookie zap cursor
4675 4678 * zc_objset_type zfs_userquota_prop_t
4676 4679 * zc_nvlist_dst[_size] buffer to fill (not really an nvlist)
4677 4680 *
4678 4681 * outputs:
4679 4682 * zc_nvlist_dst[_size] data buffer (array of zfs_useracct_t)
4680 4683 * zc_cookie zap cursor
4681 4684 */
4682 4685 static int
4683 4686 zfs_ioc_userspace_many(zfs_cmd_t *zc)
4684 4687 {
4685 4688 zfsvfs_t *zfsvfs;
4686 4689 int bufsize = zc->zc_nvlist_dst_size;
4687 4690
4688 4691 if (bufsize <= 0)
4689 4692 return (SET_ERROR(ENOMEM));
4690 4693
4691 4694 int error = zfsvfs_hold(zc->zc_name, FTAG, &zfsvfs, B_FALSE);
4692 4695 if (error != 0)
4693 4696 return (error);
4694 4697
4695 4698 void *buf = kmem_alloc(bufsize, KM_SLEEP);
4696 4699
4697 4700 error = zfs_userspace_many(zfsvfs, zc->zc_objset_type, &zc->zc_cookie,
4698 4701 buf, &zc->zc_nvlist_dst_size);
4699 4702
4700 4703 if (error == 0) {
4701 4704 error = xcopyout(buf,
4702 4705 (void *)(uintptr_t)zc->zc_nvlist_dst,
4703 4706 zc->zc_nvlist_dst_size);
4704 4707 }
4705 4708 kmem_free(buf, bufsize);
4706 4709 zfsvfs_rele(zfsvfs, FTAG);
4707 4710
4708 4711 return (error);
4709 4712 }
4710 4713
4711 4714 /*
4712 4715 * inputs:
4713 4716 * zc_name name of filesystem
4714 4717 *
4715 4718 * outputs:
4716 4719 * none
4717 4720 */
4718 4721 static int
4719 4722 zfs_ioc_userspace_upgrade(zfs_cmd_t *zc)
4720 4723 {
4721 4724 objset_t *os;
4722 4725 int error = 0;
4723 4726 zfsvfs_t *zfsvfs;
4724 4727
4725 4728 if (getzfsvfs(zc->zc_name, &zfsvfs) == 0) {
4726 4729 if (!dmu_objset_userused_enabled(zfsvfs->z_os)) {
4727 4730 /*
4728 4731 * If userused is not enabled, it may be because the
4729 4732 * objset needs to be closed & reopened (to grow the
4730 4733 * objset_phys_t). Suspend/resume the fs will do that.
4731 4734 */
4732 4735 error = zfs_suspend_fs(zfsvfs);
4733 4736 if (error == 0) {
4734 4737 dmu_objset_refresh_ownership(zfsvfs->z_os,
4735 4738 zfsvfs);
4736 4739 error = zfs_resume_fs(zfsvfs, zc->zc_name);
4737 4740 }
4738 4741 }
4739 4742 if (error == 0)
4740 4743 error = dmu_objset_userspace_upgrade(zfsvfs->z_os);
4741 4744 VFS_RELE(zfsvfs->z_vfs);
4742 4745 } else {
4743 4746 /* XXX kind of reading contents without owning */
4744 4747 error = dmu_objset_hold(zc->zc_name, FTAG, &os);
4745 4748 if (error != 0)
4746 4749 return (error);
4747 4750
4748 4751 error = dmu_objset_userspace_upgrade(os);
4749 4752 dmu_objset_rele(os, FTAG);
4750 4753 }
4751 4754
4752 4755 return (error);
4753 4756 }
4754 4757
4755 4758 /*
4756 4759 * We don't want to have a hard dependency
4757 4760 * against some special symbols in sharefs
4758 4761 * nfs, and smbsrv. Determine them if needed when
4759 4762 * the first file system is shared.
4760 4763 * Neither sharefs, nfs nor smbsrv are unloadable modules.
4761 4764 */
/* Entry points resolved at run time with ddi_modsym(); NULL until then. */
4762 4765 int (*znfsexport_fs)(void *arg);
4763 4766 int (*zshare_fs)(enum sharefs_sys_op, share_t *, uint32_t);
4764 4767 int (*zsmbexport_fs)(void *arg, boolean_t add_share);
4765 4768
/* Set to 1 once the NFS / SMB entry points above have been resolved. */
4766 4769 int zfs_nfsshare_inited;
4767 4770 int zfs_smbshare_inited;
4768 4771
/* Module handles returned by ddi_modopen(). */
4769 4772 ddi_modhandle_t nfs_mod;
4770 4773 ddi_modhandle_t sharefs_mod;
4771 4774 ddi_modhandle_t smbsrv_mod;
/* Held while the module handles and entry points above are initialized. */
4772 4775 kmutex_t zfs_share_lock;
4773 4776
4774 4777 static int
4775 4778 zfs_init_sharefs()
4776 4779 {
4777 4780 int error;
4778 4781
4779 4782 ASSERT(MUTEX_HELD(&zfs_share_lock));
4780 4783 /* Both NFS and SMB shares also require sharetab support. */
4781 4784 if (sharefs_mod == NULL && ((sharefs_mod =
4782 4785 ddi_modopen("fs/sharefs",
4783 4786 KRTLD_MODE_FIRST, &error)) == NULL)) {
4784 4787 return (SET_ERROR(ENOSYS));
4785 4788 }
4786 4789 if (zshare_fs == NULL && ((zshare_fs =
4787 4790 (int (*)(enum sharefs_sys_op, share_t *, uint32_t))
4788 4791 ddi_modsym(sharefs_mod, "sharefs_impl", &error)) == NULL)) {
4789 4792 return (SET_ERROR(ENOSYS));
4790 4793 }
4791 4794 return (0);
4792 4795 }
4793 4796
/*
 * Share or unshare a filesystem over NFS or SMB, as selected by
 * zc_share.z_sharetype, and then add or remove the matching sharetab entry.
 *
 * The first request for each protocol opens the required kernel modules and
 * resolves their entry points while holding zfs_share_lock.
 *
 * Returns EINVAL for an unknown share type, ENOSYS if a module or symbol
 * cannot be obtained, otherwise the error from the protocol's export
 * function or from the sharetab update.
 */
4794 4797 static int
4795 4798 zfs_ioc_share(zfs_cmd_t *zc)
4796 4799 {
4797 4800 int error;
4798 4801 int opcode;
4799 4802
/* First switch: one-time setup of the entry points for this protocol. */
4800 4803 switch (zc->zc_share.z_sharetype) {
4801 4804 case ZFS_SHARE_NFS:
4802 4805 case ZFS_UNSHARE_NFS:
4803 4806 if (zfs_nfsshare_inited == 0) {
4804 4807 mutex_enter(&zfs_share_lock);
4805 4808 if (nfs_mod == NULL && ((nfs_mod = ddi_modopen("fs/nfs",
4806 4809 KRTLD_MODE_FIRST, &error)) == NULL)) {
4807 4810 mutex_exit(&zfs_share_lock);
4808 4811 return (SET_ERROR(ENOSYS));
4809 4812 }
4810 4813 if (znfsexport_fs == NULL &&
4811 4814 ((znfsexport_fs = (int (*)(void *))
4812 4815 ddi_modsym(nfs_mod,
4813 4816 "nfs_export", &error)) == NULL)) {
4814 4817 mutex_exit(&zfs_share_lock);
4815 4818 return (SET_ERROR(ENOSYS));
4816 4819 }
4817 4820 error = zfs_init_sharefs();
4818 4821 if (error != 0) {
4819 4822 mutex_exit(&zfs_share_lock);
4820 4823 return (SET_ERROR(ENOSYS));
4821 4824 }
4822 4825 zfs_nfsshare_inited = 1;
4823 4826 mutex_exit(&zfs_share_lock);
4824 4827 }
4825 4828 break;
4826 4829 case ZFS_SHARE_SMB:
4827 4830 case ZFS_UNSHARE_SMB:
4828 4831 if (zfs_smbshare_inited == 0) {
4829 4832 mutex_enter(&zfs_share_lock);
4830 4833 if (smbsrv_mod == NULL && ((smbsrv_mod =
4831 4834 ddi_modopen("drv/smbsrv",
4832 4835 KRTLD_MODE_FIRST, &error)) == NULL)) {
4833 4836 mutex_exit(&zfs_share_lock);
4834 4837 return (SET_ERROR(ENOSYS));
4835 4838 }
4836 4839 if (zsmbexport_fs == NULL && ((zsmbexport_fs =
4837 4840 (int (*)(void *, boolean_t))ddi_modsym(smbsrv_mod,
4838 4841 "smb_server_share", &error)) == NULL)) {
4839 4842 mutex_exit(&zfs_share_lock);
4840 4843 return (SET_ERROR(ENOSYS));
4841 4844 }
4842 4845 error = zfs_init_sharefs();
4843 4846 if (error != 0) {
4844 4847 mutex_exit(&zfs_share_lock);
4845 4848 return (SET_ERROR(ENOSYS));
4846 4849 }
4847 4850 zfs_smbshare_inited = 1;
4848 4851 mutex_exit(&zfs_share_lock);
4849 4852 }
4850 4853 break;
4851 4854 default:
4852 4855 return (SET_ERROR(EINVAL));
4853 4856 }
4854 4857
/*
 * Second switch: call the protocol's export entry point.  No default case
 * is needed because unknown share types were rejected above.
 */
4855 4858 switch (zc->zc_share.z_sharetype) {
4856 4859 case ZFS_SHARE_NFS:
4857 4860 case ZFS_UNSHARE_NFS:
4858 4861 if (error =
4859 4862 znfsexport_fs((void *)
4860 4863 (uintptr_t)zc->zc_share.z_exportdata))
4861 4864 return (error);
4862 4865 break;
4863 4866 case ZFS_SHARE_SMB:
4864 4867 case ZFS_UNSHARE_SMB:
/* The boolean argument is B_TRUE when sharing, B_FALSE when unsharing. */
4865 4868 if (error = zsmbexport_fs((void *)
4866 4869 (uintptr_t)zc->zc_share.z_exportdata,
4867 4870 zc->zc_share.z_sharetype == ZFS_SHARE_SMB ?
4868 4871 B_TRUE: B_FALSE)) {
4869 4872 return (error);
4870 4873 }
4871 4874 break;
4872 4875 }
4873 4876
/* Share requests add a sharetab entry; unshare requests remove one. */
4874 4877 opcode = (zc->zc_share.z_sharetype == ZFS_SHARE_NFS ||
4875 4878 zc->zc_share.z_sharetype == ZFS_SHARE_SMB) ?
4876 4879 SHAREFS_ADD : SHAREFS_REMOVE;
4877 4880
4878 4881 /*
4879 4882 * Add or remove share from sharetab
4880 4883 */
4881 4884 error = zshare_fs(opcode,
4882 4885 (void *)(uintptr_t)zc->zc_share.z_sharedata,
4883 4886 zc->zc_share.z_sharemax);
4884 4887
4885 4888 return (error);
4886 4889
4887 4890 }
4888 4891
4889 4892 ace_t full_access[] = {
4890 4893 {(uid_t)-1, ACE_ALL_PERMS, ACE_EVERYONE, 0}
4891 4894 };
4892 4895
4893 4896 /*
4894 4897 * inputs:
4895 4898 * zc_name name of containing filesystem
4896 4899 * zc_obj object # beyond which we want next in-use object #
4897 4900 *
4898 4901 * outputs:
4899 4902 * zc_obj next in-use object #
4900 4903 */
4901 4904 static int
4902 4905 zfs_ioc_next_obj(zfs_cmd_t *zc)
4903 4906 {
4904 4907 objset_t *os = NULL;
4905 4908 int error;
4906 4909
4907 4910 error = dmu_objset_hold(zc->zc_name, FTAG, &os);
4908 4911 if (error != 0)
4909 4912 return (error);
4910 4913
4911 4914 error = dmu_object_next(os, &zc->zc_obj, B_FALSE,
4912 4915 dsl_dataset_phys(os->os_dsl_dataset)->ds_prev_snap_txg);
4913 4916
4914 4917 dmu_objset_rele(os, FTAG);
4915 4918 return (error);
4916 4919 }
4917 4920
4918 4921 /*
4919 4922 * inputs:
4920 4923 * zc_name name of filesystem
4921 4924 * zc_value prefix name for snapshot
4922 4925 * zc_cleanup_fd cleanup-on-exit file descriptor for calling process
4923 4926 *
4924 4927 * outputs:
4925 4928 * zc_value short name of new snapshot
4926 4929 */
4927 4930 static int
4928 4931 zfs_ioc_tmp_snapshot(zfs_cmd_t *zc)
4929 4932 {
4930 4933 char *snap_name;
4931 4934 char *hold_name;
4932 4935 int error;
4933 4936 minor_t minor;
4934 4937
4935 4938 error = zfs_onexit_fd_hold(zc->zc_cleanup_fd, &minor);
4936 4939 if (error != 0)
4937 4940 return (error);
4938 4941
4939 4942 snap_name = kmem_asprintf("%s-%016llx", zc->zc_value,
4940 4943 (u_longlong_t)ddi_get_lbolt64());
4941 4944 hold_name = kmem_asprintf("%%%s", zc->zc_value);
4942 4945
4943 4946 error = dsl_dataset_snapshot_tmp(zc->zc_name, snap_name, minor,
4944 4947 hold_name);
4945 4948 if (error == 0)
4946 4949 (void) strcpy(zc->zc_value, snap_name);
4947 4950 strfree(snap_name);
4948 4951 strfree(hold_name);
4949 4952 zfs_onexit_fd_rele(zc->zc_cleanup_fd);
4950 4953 return (error);
4951 4954 }
4952 4955
4953 4956 /*
4954 4957 * inputs:
4955 4958 * zc_name name of "to" snapshot
4956 4959 * zc_value name of "from" snapshot
4957 4960 * zc_cookie file descriptor to write diff data on
4958 4961 *
4959 4962 * outputs:
4960 4963 * dmu_diff_record_t's to the file descriptor
4961 4964 */
4962 4965 static int
4963 4966 zfs_ioc_diff(zfs_cmd_t *zc)
4964 4967 {
4965 4968 file_t *fp;
4966 4969 offset_t off;
4967 4970 int error;
4968 4971
4969 4972 fp = getf(zc->zc_cookie);
4970 4973 if (fp == NULL)
4971 4974 return (SET_ERROR(EBADF));
4972 4975
4973 4976 off = fp->f_offset;
4974 4977
4975 4978 error = dmu_diff(zc->zc_name, zc->zc_value, fp->f_vnode, &off);
4976 4979
4977 4980 if (VOP_SEEK(fp->f_vnode, fp->f_offset, &off, NULL) == 0)
4978 4981 fp->f_offset = off;
4979 4982 releasef(zc->zc_cookie);
4980 4983
4981 4984 return (error);
4982 4985 }
4983 4986
4984 4987 /*
4985 4988 * Remove all ACL files in shares dir
4986 4989 */
4987 4990 static int
4988 4991 zfs_smb_acl_purge(znode_t *dzp)
4989 4992 {
4990 4993 zap_cursor_t zc;
4991 4994 zap_attribute_t zap;
4992 4995 zfsvfs_t *zfsvfs = dzp->z_zfsvfs;
4993 4996 int error;
4994 4997
4995 4998 for (zap_cursor_init(&zc, zfsvfs->z_os, dzp->z_id);
4996 4999 (error = zap_cursor_retrieve(&zc, &zap)) == 0;
4997 5000 zap_cursor_advance(&zc)) {
4998 5001 if ((error = VOP_REMOVE(ZTOV(dzp), zap.za_name, kcred,
4999 5002 NULL, 0)) != 0)
5000 5003 break;
5001 5004 }
5002 5005 zap_cursor_fini(&zc);
5003 5006 return (error);
5004 5007 }
5005 5008
5006 5009 static int
5007 5010 zfs_ioc_smb_acl(zfs_cmd_t *zc)
5008 5011 {
5009 5012 vnode_t *vp;
5010 5013 znode_t *dzp;
5011 5014 vnode_t *resourcevp = NULL;
5012 5015 znode_t *sharedir;
5013 5016 zfsvfs_t *zfsvfs;
5014 5017 nvlist_t *nvlist;
5015 5018 char *src, *target;
5016 5019 vattr_t vattr;
5017 5020 vsecattr_t vsec;
5018 5021 int error = 0;
5019 5022
5020 5023 if ((error = lookupname(zc->zc_value, UIO_SYSSPACE,
5021 5024 NO_FOLLOW, NULL, &vp)) != 0)
5022 5025 return (error);
5023 5026
5024 5027 /* Now make sure mntpnt and dataset are ZFS */
5025 5028
5026 5029 if (vp->v_vfsp->vfs_fstype != zfsfstype ||
5027 5030 (strcmp((char *)refstr_value(vp->v_vfsp->vfs_resource),
5028 5031 zc->zc_name) != 0)) {
5029 5032 VN_RELE(vp);
5030 5033 return (SET_ERROR(EINVAL));
5031 5034 }
5032 5035
5033 5036 dzp = VTOZ(vp);
5034 5037 zfsvfs = dzp->z_zfsvfs;
5035 5038 ZFS_ENTER(zfsvfs);
5036 5039
5037 5040 /*
5038 5041 * Create share dir if its missing.
5039 5042 */
5040 5043 mutex_enter(&zfsvfs->z_lock);
5041 5044 if (zfsvfs->z_shares_dir == 0) {
5042 5045 dmu_tx_t *tx;
5043 5046
5044 5047 tx = dmu_tx_create(zfsvfs->z_os);
5045 5048 dmu_tx_hold_zap(tx, MASTER_NODE_OBJ, TRUE,
5046 5049 ZFS_SHARES_DIR);
5047 5050 dmu_tx_hold_zap(tx, DMU_NEW_OBJECT, FALSE, NULL);
5048 5051 error = dmu_tx_assign(tx, TXG_WAIT);
5049 5052 if (error != 0) {
5050 5053 dmu_tx_abort(tx);
5051 5054 } else {
5052 5055 error = zfs_create_share_dir(zfsvfs, tx);
5053 5056 dmu_tx_commit(tx);
5054 5057 }
5055 5058 if (error != 0) {
5056 5059 mutex_exit(&zfsvfs->z_lock);
5057 5060 VN_RELE(vp);
5058 5061 ZFS_EXIT(zfsvfs);
5059 5062 return (error);
5060 5063 }
5061 5064 }
5062 5065 mutex_exit(&zfsvfs->z_lock);
5063 5066
5064 5067 ASSERT(zfsvfs->z_shares_dir);
5065 5068 if ((error = zfs_zget(zfsvfs, zfsvfs->z_shares_dir, &sharedir)) != 0) {
5066 5069 VN_RELE(vp);
5067 5070 ZFS_EXIT(zfsvfs);
5068 5071 return (error);
5069 5072 }
5070 5073
5071 5074 switch (zc->zc_cookie) {
5072 5075 case ZFS_SMB_ACL_ADD:
5073 5076 vattr.va_mask = AT_MODE|AT_UID|AT_GID|AT_TYPE;
5074 5077 vattr.va_type = VREG;
5075 5078 vattr.va_mode = S_IFREG|0777;
5076 5079 vattr.va_uid = 0;
5077 5080 vattr.va_gid = 0;
5078 5081
5079 5082 vsec.vsa_mask = VSA_ACE;
5080 5083 vsec.vsa_aclentp = &full_access;
5081 5084 vsec.vsa_aclentsz = sizeof (full_access);
5082 5085 vsec.vsa_aclcnt = 1;
5083 5086
5084 5087 error = VOP_CREATE(ZTOV(sharedir), zc->zc_string,
5085 5088 &vattr, EXCL, 0, &resourcevp, kcred, 0, NULL, &vsec);
5086 5089 if (resourcevp)
5087 5090 VN_RELE(resourcevp);
5088 5091 break;
5089 5092
5090 5093 case ZFS_SMB_ACL_REMOVE:
5091 5094 error = VOP_REMOVE(ZTOV(sharedir), zc->zc_string, kcred,
5092 5095 NULL, 0);
5093 5096 break;
5094 5097
5095 5098 case ZFS_SMB_ACL_RENAME:
5096 5099 if ((error = get_nvlist(zc->zc_nvlist_src,
5097 5100 zc->zc_nvlist_src_size, zc->zc_iflags, &nvlist)) != 0) {
5098 5101 VN_RELE(vp);
5099 5102 VN_RELE(ZTOV(sharedir));
5100 5103 ZFS_EXIT(zfsvfs);
5101 5104 return (error);
5102 5105 }
5103 5106 if (nvlist_lookup_string(nvlist, ZFS_SMB_ACL_SRC, &src) ||
5104 5107 nvlist_lookup_string(nvlist, ZFS_SMB_ACL_TARGET,
5105 5108 &target)) {
5106 5109 VN_RELE(vp);
5107 5110 VN_RELE(ZTOV(sharedir));
5108 5111 ZFS_EXIT(zfsvfs);
5109 5112 nvlist_free(nvlist);
5110 5113 return (error);
5111 5114 }
5112 5115 error = VOP_RENAME(ZTOV(sharedir), src, ZTOV(sharedir), target,
5113 5116 kcred, NULL, 0);
5114 5117 nvlist_free(nvlist);
5115 5118 break;
5116 5119
5117 5120 case ZFS_SMB_ACL_PURGE:
5118 5121 error = zfs_smb_acl_purge(sharedir);
5119 5122 break;
5120 5123
5121 5124 default:
5122 5125 error = SET_ERROR(EINVAL);
5123 5126 break;
5124 5127 }
5125 5128
5126 5129 VN_RELE(vp);
5127 5130 VN_RELE(ZTOV(sharedir));
5128 5131
5129 5132 ZFS_EXIT(zfsvfs);
5130 5133
5131 5134 return (error);
5132 5135 }
5133 5136
5134 5137 /*
5135 5138 * innvl: {
5136 5139 * "holds" -> { snapname -> holdname (string), ... }
5137 5140 * (optional) "cleanup_fd" -> fd (int32)
5138 5141 * }
5139 5142 *
5140 5143 * outnvl: {
5141 5144 * snapname -> error value (int32)
5142 5145 * ...
5143 5146 * }
5144 5147 */
5145 5148 /* ARGSUSED */
5146 5149 static int
5147 5150 zfs_ioc_hold(const char *pool, nvlist_t *args, nvlist_t *errlist)
5148 5151 {
5149 5152 nvpair_t *pair;
5150 5153 nvlist_t *holds;
5151 5154 int cleanup_fd = -1;
5152 5155 int error;
5153 5156 minor_t minor = 0;
5154 5157
5155 5158 error = nvlist_lookup_nvlist(args, "holds", &holds);
5156 5159 if (error != 0)
5157 5160 return (SET_ERROR(EINVAL));
5158 5161
5159 5162 /* make sure the user didn't pass us any invalid (empty) tags */
5160 5163 for (pair = nvlist_next_nvpair(holds, NULL); pair != NULL;
5161 5164 pair = nvlist_next_nvpair(holds, pair)) {
5162 5165 char *htag;
5163 5166
5164 5167 error = nvpair_value_string(pair, &htag);
5165 5168 if (error != 0)
5166 5169 return (SET_ERROR(error));
5167 5170
5168 5171 if (strlen(htag) == 0)
5169 5172 return (SET_ERROR(EINVAL));
5170 5173 }
5171 5174
5172 5175 if (nvlist_lookup_int32(args, "cleanup_fd", &cleanup_fd) == 0) {
5173 5176 error = zfs_onexit_fd_hold(cleanup_fd, &minor);
5174 5177 if (error != 0)
5175 5178 return (error);
5176 5179 }
5177 5180
5178 5181 error = dsl_dataset_user_hold(holds, minor, errlist);
5179 5182 if (minor != 0)
5180 5183 zfs_onexit_fd_rele(cleanup_fd);
5181 5184 return (error);
5182 5185 }
5183 5186
5184 5187 /*
5185 5188 * innvl is not used.
5186 5189 *
5187 5190 * outnvl: {
5188 5191 * holdname -> time added (uint64 seconds since epoch)
5189 5192 * ...
5190 5193 * }
5191 5194 */
5192 5195 /* ARGSUSED */
5193 5196 static int
5194 5197 zfs_ioc_get_holds(const char *snapname, nvlist_t *args, nvlist_t *outnvl)
5195 5198 {
5196 5199 return (dsl_dataset_get_holds(snapname, outnvl));
5197 5200 }
5198 5201
5199 5202 /*
5200 5203 * innvl: {
5201 5204 * snapname -> { holdname, ... }
5202 5205 * ...
5203 5206 * }
5204 5207 *
5205 5208 * outnvl: {
5206 5209 * snapname -> error value (int32)
5207 5210 * ...
5208 5211 * }
5209 5212 */
5210 5213 /* ARGSUSED */
5211 5214 static int
5212 5215 zfs_ioc_release(const char *pool, nvlist_t *holds, nvlist_t *errlist)
5213 5216 {
5214 5217 return (dsl_dataset_user_release(holds, errlist));
5215 5218 }
5216 5219
5217 5220 /*
5218 5221 * inputs:
5219 5222 * zc_name name of new filesystem or snapshot
5220 5223 * zc_value full name of old snapshot
5221 5224 *
5222 5225 * outputs:
5223 5226 * zc_cookie space in bytes
5224 5227 * zc_objset_type compressed space in bytes
5225 5228 * zc_perm_action uncompressed space in bytes
5226 5229 */
5227 5230 static int
5228 5231 zfs_ioc_space_written(zfs_cmd_t *zc)
5229 5232 {
5230 5233 int error;
5231 5234 dsl_pool_t *dp;
5232 5235 dsl_dataset_t *new, *old;
5233 5236
5234 5237 error = dsl_pool_hold(zc->zc_name, FTAG, &dp);
5235 5238 if (error != 0)
5236 5239 return (error);
5237 5240 error = dsl_dataset_hold(dp, zc->zc_name, FTAG, &new);
5238 5241 if (error != 0) {
5239 5242 dsl_pool_rele(dp, FTAG);
5240 5243 return (error);
5241 5244 }
5242 5245 error = dsl_dataset_hold(dp, zc->zc_value, FTAG, &old);
5243 5246 if (error != 0) {
5244 5247 dsl_dataset_rele(new, FTAG);
5245 5248 dsl_pool_rele(dp, FTAG);
5246 5249 return (error);
5247 5250 }
5248 5251
5249 5252 error = dsl_dataset_space_written(old, new, &zc->zc_cookie,
5250 5253 &zc->zc_objset_type, &zc->zc_perm_action);
5251 5254 dsl_dataset_rele(old, FTAG);
5252 5255 dsl_dataset_rele(new, FTAG);
5253 5256 dsl_pool_rele(dp, FTAG);
5254 5257 return (error);
5255 5258 }
5256 5259
5257 5260 /*
5258 5261 * innvl: {
5259 5262 * "firstsnap" -> snapshot name
5260 5263 * }
5261 5264 *
5262 5265 * outnvl: {
5263 5266 * "used" -> space in bytes
5264 5267 * "compressed" -> compressed space in bytes
5265 5268 * "uncompressed" -> uncompressed space in bytes
5266 5269 * }
5267 5270 */
5268 5271 static int
5269 5272 zfs_ioc_space_snaps(const char *lastsnap, nvlist_t *innvl, nvlist_t *outnvl)
5270 5273 {
5271 5274 int error;
5272 5275 dsl_pool_t *dp;
5273 5276 dsl_dataset_t *new, *old;
5274 5277 char *firstsnap;
5275 5278 uint64_t used, comp, uncomp;
5276 5279
5277 5280 if (nvlist_lookup_string(innvl, "firstsnap", &firstsnap) != 0)
5278 5281 return (SET_ERROR(EINVAL));
5279 5282
5280 5283 error = dsl_pool_hold(lastsnap, FTAG, &dp);
5281 5284 if (error != 0)
5282 5285 return (error);
5283 5286
5284 5287 error = dsl_dataset_hold(dp, lastsnap, FTAG, &new);
5285 5288 if (error == 0 && !new->ds_is_snapshot) {
5286 5289 dsl_dataset_rele(new, FTAG);
5287 5290 error = SET_ERROR(EINVAL);
5288 5291 }
5289 5292 if (error != 0) {
5290 5293 dsl_pool_rele(dp, FTAG);
5291 5294 return (error);
5292 5295 }
5293 5296 error = dsl_dataset_hold(dp, firstsnap, FTAG, &old);
5294 5297 if (error == 0 && !old->ds_is_snapshot) {
5295 5298 dsl_dataset_rele(old, FTAG);
5296 5299 error = SET_ERROR(EINVAL);
5297 5300 }
5298 5301 if (error != 0) {
5299 5302 dsl_dataset_rele(new, FTAG);
5300 5303 dsl_pool_rele(dp, FTAG);
5301 5304 return (error);
5302 5305 }
5303 5306
5304 5307 error = dsl_dataset_space_wouldfree(old, new, &used, &comp, &uncomp);
5305 5308 dsl_dataset_rele(old, FTAG);
5306 5309 dsl_dataset_rele(new, FTAG);
5307 5310 dsl_pool_rele(dp, FTAG);
5308 5311 fnvlist_add_uint64(outnvl, "used", used);
5309 5312 fnvlist_add_uint64(outnvl, "compressed", comp);
5310 5313 fnvlist_add_uint64(outnvl, "uncompressed", uncomp);
5311 5314 return (error);
5312 5315 }
5313 5316
5314 5317 /*
5315 5318 * innvl: {
5316 5319 * "fd" -> file descriptor to write stream to (int32)
5317 5320 * (optional) "fromsnap" -> full snap name to send an incremental from
5318 5321 * (optional) "largeblockok" -> (value ignored)
5319 5322 * indicates that blocks > 128KB are permitted
5320 5323 * (optional) "embedok" -> (value ignored)
5321 5324 * presence indicates DRR_WRITE_EMBEDDED records are permitted
5322 5325 * (optional) "resume_object" and "resume_offset" -> (uint64)
5323 5326 * if present, resume send stream from specified object and offset.
5324 5327 * }
5325 5328 *
5326 5329 * outnvl is unused
5327 5330 */
5328 5331 /* ARGSUSED */
5329 5332 static int
5330 5333 zfs_ioc_send_new(const char *snapname, nvlist_t *innvl, nvlist_t *outnvl)
5331 5334 {
5332 5335 int error;
5333 5336 offset_t off;
5334 5337 char *fromname = NULL;
5335 5338 int fd;
5336 5339 boolean_t largeblockok;
5337 5340 boolean_t embedok;
5338 5341 uint64_t resumeobj = 0;
5339 5342 uint64_t resumeoff = 0;
5340 5343
5341 5344 error = nvlist_lookup_int32(innvl, "fd", &fd);
5342 5345 if (error != 0)
5343 5346 return (SET_ERROR(EINVAL));
5344 5347
5345 5348 (void) nvlist_lookup_string(innvl, "fromsnap", &fromname);
5346 5349
5347 5350 largeblockok = nvlist_exists(innvl, "largeblockok");
5348 5351 embedok = nvlist_exists(innvl, "embedok");
5349 5352
5350 5353 (void) nvlist_lookup_uint64(innvl, "resume_object", &resumeobj);
5351 5354 (void) nvlist_lookup_uint64(innvl, "resume_offset", &resumeoff);
5352 5355
5353 5356 file_t *fp = getf(fd);
5354 5357 if (fp == NULL)
5355 5358 return (SET_ERROR(EBADF));
5356 5359
5357 5360 off = fp->f_offset;
5358 5361 error = dmu_send(snapname, fromname, embedok, largeblockok, fd,
5359 5362 resumeobj, resumeoff, fp->f_vnode, &off);
5360 5363
5361 5364 if (VOP_SEEK(fp->f_vnode, fp->f_offset, &off, NULL) == 0)
5362 5365 fp->f_offset = off;
5363 5366 releasef(fd);
5364 5367 return (error);
5365 5368 }
5366 5369
5367 5370 /*
5368 5371 * Determine approximately how large a zfs send stream will be -- the number
5369 5372 * of bytes that will be written to the fd supplied to zfs_ioc_send_new().
5370 5373 *
5371 5374 * innvl: {
5372 5375 * (optional) "from" -> full snap or bookmark name to send an incremental
5373 5376 * from
5374 5377 * }
5375 5378 *
5376 5379 * outnvl: {
5377 5380 * "space" -> bytes of space (uint64)
5378 5381 * }
5379 5382 */
5380 5383 static int
5381 5384 zfs_ioc_send_space(const char *snapname, nvlist_t *innvl, nvlist_t *outnvl)
5382 5385 {
5383 5386 dsl_pool_t *dp;
5384 5387 dsl_dataset_t *tosnap;
5385 5388 int error;
5386 5389 char *fromname;
5387 5390 uint64_t space;
5388 5391
5389 5392 error = dsl_pool_hold(snapname, FTAG, &dp);
5390 5393 if (error != 0)
5391 5394 return (error);
5392 5395
5393 5396 error = dsl_dataset_hold(dp, snapname, FTAG, &tosnap);
5394 5397 if (error != 0) {
5395 5398 dsl_pool_rele(dp, FTAG);
5396 5399 return (error);
5397 5400 }
5398 5401
5399 5402 error = nvlist_lookup_string(innvl, "from", &fromname);
5400 5403 if (error == 0) {
5401 5404 if (strchr(fromname, '@') != NULL) {
5402 5405 /*
5403 5406 * If from is a snapshot, hold it and use the more
5404 5407 * efficient dmu_send_estimate to estimate send space
5405 5408 * size using deadlists.
5406 5409 */
5407 5410 dsl_dataset_t *fromsnap;
5408 5411 error = dsl_dataset_hold(dp, fromname, FTAG, &fromsnap);
5409 5412 if (error != 0)
5410 5413 goto out;
5411 5414 error = dmu_send_estimate(tosnap, fromsnap, &space);
5412 5415 dsl_dataset_rele(fromsnap, FTAG);
5413 5416 } else if (strchr(fromname, '#') != NULL) {
5414 5417 /*
5415 5418 * If from is a bookmark, fetch the creation TXG of the
5416 5419 * snapshot it was created from and use that to find
5417 5420 * blocks that were born after it.
5418 5421 */
5419 5422 zfs_bookmark_phys_t frombm;
5420 5423
5421 5424 error = dsl_bookmark_lookup(dp, fromname, tosnap,
5422 5425 &frombm);
5423 5426 if (error != 0)
5424 5427 goto out;
5425 5428 error = dmu_send_estimate_from_txg(tosnap,
5426 5429 frombm.zbm_creation_txg, &space);
5427 5430 } else {
5428 5431 /*
5429 5432 * from is not properly formatted as a snapshot or
5430 5433 * bookmark
5431 5434 */
5432 5435 error = SET_ERROR(EINVAL);
5433 5436 goto out;
5434 5437 }
5435 5438 } else {
5436 5439 // If estimating the size of a full send, use dmu_send_estimate
5437 5440 error = dmu_send_estimate(tosnap, NULL, &space);
5438 5441 }
5439 5442
5440 5443 fnvlist_add_uint64(outnvl, "space", space);
5441 5444
5442 5445 out:
5443 5446 dsl_dataset_rele(tosnap, FTAG);
5444 5447 dsl_pool_rele(dp, FTAG);
5445 5448 return (error);
5446 5449 }
5447 5450
/*
 * Dispatch table for the control-device ioctls, indexed by
 * (ioc - ZFS_IOC_FIRST).  Entries are filled in by the
 * zfs_ioctl_register*() functions and read by zfsdev_ioctl().
 */
static zfs_ioc_vec_t zfs_ioc_vec[ZFS_IOC_LAST - ZFS_IOC_FIRST];
5449 5452
5450 5453 static void
5451 5454 zfs_ioctl_register_legacy(zfs_ioc_t ioc, zfs_ioc_legacy_func_t *func,
5452 5455 zfs_secpolicy_func_t *secpolicy, zfs_ioc_namecheck_t namecheck,
5453 5456 boolean_t log_history, zfs_ioc_poolcheck_t pool_check)
5454 5457 {
5455 5458 zfs_ioc_vec_t *vec = &zfs_ioc_vec[ioc - ZFS_IOC_FIRST];
5456 5459
5457 5460 ASSERT3U(ioc, >=, ZFS_IOC_FIRST);
5458 5461 ASSERT3U(ioc, <, ZFS_IOC_LAST);
5459 5462 ASSERT3P(vec->zvec_legacy_func, ==, NULL);
5460 5463 ASSERT3P(vec->zvec_func, ==, NULL);
5461 5464
5462 5465 vec->zvec_legacy_func = func;
5463 5466 vec->zvec_secpolicy = secpolicy;
5464 5467 vec->zvec_namecheck = namecheck;
5465 5468 vec->zvec_allow_log = log_history;
5466 5469 vec->zvec_pool_check = pool_check;
5467 5470 }
5468 5471
5469 5472 /*
5470 5473 * See the block comment at the beginning of this file for details on
5471 5474 * each argument to this function.
5472 5475 */
5473 5476 static void
5474 5477 zfs_ioctl_register(const char *name, zfs_ioc_t ioc, zfs_ioc_func_t *func,
5475 5478 zfs_secpolicy_func_t *secpolicy, zfs_ioc_namecheck_t namecheck,
5476 5479 zfs_ioc_poolcheck_t pool_check, boolean_t smush_outnvlist,
5477 5480 boolean_t allow_log)
5478 5481 {
5479 5482 zfs_ioc_vec_t *vec = &zfs_ioc_vec[ioc - ZFS_IOC_FIRST];
5480 5483
5481 5484 ASSERT3U(ioc, >=, ZFS_IOC_FIRST);
5482 5485 ASSERT3U(ioc, <, ZFS_IOC_LAST);
5483 5486 ASSERT3P(vec->zvec_legacy_func, ==, NULL);
5484 5487 ASSERT3P(vec->zvec_func, ==, NULL);
5485 5488
5486 5489 /* if we are logging, the name must be valid */
5487 5490 ASSERT(!allow_log || namecheck != NO_NAME);
5488 5491
5489 5492 vec->zvec_name = name;
5490 5493 vec->zvec_func = func;
5491 5494 vec->zvec_secpolicy = secpolicy;
5492 5495 vec->zvec_namecheck = namecheck;
5493 5496 vec->zvec_pool_check = pool_check;
5494 5497 vec->zvec_smush_outnvlist = smush_outnvlist;
5495 5498 vec->zvec_allow_log = allow_log;
5496 5499 }
5497 5500
5498 5501 static void
5499 5502 zfs_ioctl_register_pool(zfs_ioc_t ioc, zfs_ioc_legacy_func_t *func,
5500 5503 zfs_secpolicy_func_t *secpolicy, boolean_t log_history,
5501 5504 zfs_ioc_poolcheck_t pool_check)
5502 5505 {
5503 5506 zfs_ioctl_register_legacy(ioc, func, secpolicy,
5504 5507 POOL_NAME, log_history, pool_check);
5505 5508 }
5506 5509
5507 5510 static void
5508 5511 zfs_ioctl_register_dataset_nolog(zfs_ioc_t ioc, zfs_ioc_legacy_func_t *func,
5509 5512 zfs_secpolicy_func_t *secpolicy, zfs_ioc_poolcheck_t pool_check)
5510 5513 {
5511 5514 zfs_ioctl_register_legacy(ioc, func, secpolicy,
5512 5515 DATASET_NAME, B_FALSE, pool_check);
5513 5516 }
5514 5517
5515 5518 static void
5516 5519 zfs_ioctl_register_pool_modify(zfs_ioc_t ioc, zfs_ioc_legacy_func_t *func)
5517 5520 {
5518 5521 zfs_ioctl_register_legacy(ioc, func, zfs_secpolicy_config,
5519 5522 POOL_NAME, B_TRUE, POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY);
5520 5523 }
5521 5524
5522 5525 static void
5523 5526 zfs_ioctl_register_pool_meta(zfs_ioc_t ioc, zfs_ioc_legacy_func_t *func,
5524 5527 zfs_secpolicy_func_t *secpolicy)
5525 5528 {
5526 5529 zfs_ioctl_register_legacy(ioc, func, secpolicy,
5527 5530 NO_NAME, B_FALSE, POOL_CHECK_NONE);
5528 5531 }
5529 5532
5530 5533 static void
5531 5534 zfs_ioctl_register_dataset_read_secpolicy(zfs_ioc_t ioc,
5532 5535 zfs_ioc_legacy_func_t *func, zfs_secpolicy_func_t *secpolicy)
5533 5536 {
5534 5537 zfs_ioctl_register_legacy(ioc, func, secpolicy,
5535 5538 DATASET_NAME, B_FALSE, POOL_CHECK_SUSPENDED);
5536 5539 }
5537 5540
5538 5541 static void
5539 5542 zfs_ioctl_register_dataset_read(zfs_ioc_t ioc, zfs_ioc_legacy_func_t *func)
5540 5543 {
5541 5544 zfs_ioctl_register_dataset_read_secpolicy(ioc, func,
5542 5545 zfs_secpolicy_read);
5543 5546 }
5544 5547
5545 5548 static void
5546 5549 zfs_ioctl_register_dataset_modify(zfs_ioc_t ioc, zfs_ioc_legacy_func_t *func,
5547 5550 zfs_secpolicy_func_t *secpolicy)
5548 5551 {
5549 5552 zfs_ioctl_register_legacy(ioc, func, secpolicy,
5550 5553 DATASET_NAME, B_TRUE, POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY);
5551 5554 }
5552 5555
/*
 * Populate zfs_ioc_vec with every supported ioctl.  Each call below fills
 * exactly one slot; the register functions assert (on DEBUG builds) that
 * a slot is not registered twice.
 */
static void
zfs_ioctl_init(void)
{
	/*
	 * IOCTLS that use the nvlist-based function signature.  The
	 * trailing arguments are: name check, pool check, smush_outnvlist,
	 * allow_log.
	 */
	zfs_ioctl_register("snapshot", ZFS_IOC_SNAPSHOT,
	    zfs_ioc_snapshot, zfs_secpolicy_snapshot, POOL_NAME,
	    POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY, B_TRUE, B_TRUE);

	zfs_ioctl_register("log_history", ZFS_IOC_LOG_HISTORY,
	    zfs_ioc_log_history, zfs_secpolicy_log_history, NO_NAME,
	    POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY, B_FALSE, B_FALSE);

	zfs_ioctl_register("space_snaps", ZFS_IOC_SPACE_SNAPS,
	    zfs_ioc_space_snaps, zfs_secpolicy_read, DATASET_NAME,
	    POOL_CHECK_SUSPENDED, B_FALSE, B_FALSE);

	zfs_ioctl_register("send", ZFS_IOC_SEND_NEW,
	    zfs_ioc_send_new, zfs_secpolicy_send_new, DATASET_NAME,
	    POOL_CHECK_SUSPENDED, B_FALSE, B_FALSE);

	zfs_ioctl_register("send_space", ZFS_IOC_SEND_SPACE,
	    zfs_ioc_send_space, zfs_secpolicy_read, DATASET_NAME,
	    POOL_CHECK_SUSPENDED, B_FALSE, B_FALSE);

	zfs_ioctl_register("create", ZFS_IOC_CREATE,
	    zfs_ioc_create, zfs_secpolicy_create_clone, DATASET_NAME,
	    POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY, B_TRUE, B_TRUE);

	zfs_ioctl_register("clone", ZFS_IOC_CLONE,
	    zfs_ioc_clone, zfs_secpolicy_create_clone, DATASET_NAME,
	    POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY, B_TRUE, B_TRUE);

	zfs_ioctl_register("destroy_snaps", ZFS_IOC_DESTROY_SNAPS,
	    zfs_ioc_destroy_snaps, zfs_secpolicy_destroy_snaps, POOL_NAME,
	    POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY, B_TRUE, B_TRUE);

	zfs_ioctl_register("hold", ZFS_IOC_HOLD,
	    zfs_ioc_hold, zfs_secpolicy_hold, POOL_NAME,
	    POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY, B_TRUE, B_TRUE);
	zfs_ioctl_register("release", ZFS_IOC_RELEASE,
	    zfs_ioc_release, zfs_secpolicy_release, POOL_NAME,
	    POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY, B_TRUE, B_TRUE);

	zfs_ioctl_register("get_holds", ZFS_IOC_GET_HOLDS,
	    zfs_ioc_get_holds, zfs_secpolicy_read, DATASET_NAME,
	    POOL_CHECK_SUSPENDED, B_FALSE, B_FALSE);

	zfs_ioctl_register("rollback", ZFS_IOC_ROLLBACK,
	    zfs_ioc_rollback, zfs_secpolicy_rollback, DATASET_NAME,
	    POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY, B_FALSE, B_TRUE);

	zfs_ioctl_register("bookmark", ZFS_IOC_BOOKMARK,
	    zfs_ioc_bookmark, zfs_secpolicy_bookmark, POOL_NAME,
	    POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY, B_TRUE, B_TRUE);

	zfs_ioctl_register("get_bookmarks", ZFS_IOC_GET_BOOKMARKS,
	    zfs_ioc_get_bookmarks, zfs_secpolicy_read, DATASET_NAME,
	    POOL_CHECK_SUSPENDED, B_FALSE, B_FALSE);

	zfs_ioctl_register("destroy_bookmarks", ZFS_IOC_DESTROY_BOOKMARKS,
	    zfs_ioc_destroy_bookmarks, zfs_secpolicy_destroy_bookmarks,
	    POOL_NAME,
	    POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY, B_TRUE, B_TRUE);

	/* IOCTLS that use the legacy function signature */

	zfs_ioctl_register_legacy(ZFS_IOC_POOL_FREEZE, zfs_ioc_pool_freeze,
	    zfs_secpolicy_config, NO_NAME, B_FALSE, POOL_CHECK_READONLY);

	/*
	 * Pool-named ioctls.  The pool_modify variants all use
	 * zfs_secpolicy_config, are logged, and check for a suspended or
	 * read-only pool.
	 */
	zfs_ioctl_register_pool(ZFS_IOC_POOL_CREATE, zfs_ioc_pool_create,
	    zfs_secpolicy_config, B_TRUE, POOL_CHECK_NONE);
	zfs_ioctl_register_pool_modify(ZFS_IOC_POOL_SCAN,
	    zfs_ioc_pool_scan);
	zfs_ioctl_register_pool_modify(ZFS_IOC_POOL_UPGRADE,
	    zfs_ioc_pool_upgrade);
	zfs_ioctl_register_pool_modify(ZFS_IOC_VDEV_ADD,
	    zfs_ioc_vdev_add);
	zfs_ioctl_register_pool_modify(ZFS_IOC_VDEV_REMOVE,
	    zfs_ioc_vdev_remove);
	zfs_ioctl_register_pool_modify(ZFS_IOC_VDEV_SET_STATE,
	    zfs_ioc_vdev_set_state);
	zfs_ioctl_register_pool_modify(ZFS_IOC_VDEV_ATTACH,
	    zfs_ioc_vdev_attach);
	zfs_ioctl_register_pool_modify(ZFS_IOC_VDEV_DETACH,
	    zfs_ioc_vdev_detach);
	zfs_ioctl_register_pool_modify(ZFS_IOC_VDEV_SETPATH,
	    zfs_ioc_vdev_setpath);
	zfs_ioctl_register_pool_modify(ZFS_IOC_VDEV_SETFRU,
	    zfs_ioc_vdev_setfru);
	zfs_ioctl_register_pool_modify(ZFS_IOC_POOL_SET_PROPS,
	    zfs_ioc_pool_set_props);
	zfs_ioctl_register_pool_modify(ZFS_IOC_VDEV_SPLIT,
	    zfs_ioc_vdev_split);
	zfs_ioctl_register_pool_modify(ZFS_IOC_POOL_REGUID,
	    zfs_ioc_pool_reguid);

	/* Ioctls with no name to validate, no logging and no pool check. */
	zfs_ioctl_register_pool_meta(ZFS_IOC_POOL_CONFIGS,
	    zfs_ioc_pool_configs, zfs_secpolicy_none);
	zfs_ioctl_register_pool_meta(ZFS_IOC_POOL_TRYIMPORT,
	    zfs_ioc_pool_tryimport, zfs_secpolicy_config);
	zfs_ioctl_register_pool_meta(ZFS_IOC_INJECT_FAULT,
	    zfs_ioc_inject_fault, zfs_secpolicy_inject);
	zfs_ioctl_register_pool_meta(ZFS_IOC_CLEAR_FAULT,
	    zfs_ioc_clear_fault, zfs_secpolicy_inject);
	zfs_ioctl_register_pool_meta(ZFS_IOC_INJECT_LIST_NEXT,
	    zfs_ioc_inject_list_next, zfs_secpolicy_inject);

	/*
	 * pool destroy, and export don't log the history as part of
	 * zfsdev_ioctl, but rather zfs_ioc_pool_export
	 * does the logging of those commands.
	 */
	zfs_ioctl_register_pool(ZFS_IOC_POOL_DESTROY, zfs_ioc_pool_destroy,
	    zfs_secpolicy_config, B_FALSE, POOL_CHECK_NONE);
	zfs_ioctl_register_pool(ZFS_IOC_POOL_EXPORT, zfs_ioc_pool_export,
	    zfs_secpolicy_config, B_FALSE, POOL_CHECK_NONE);

	zfs_ioctl_register_pool(ZFS_IOC_POOL_STATS, zfs_ioc_pool_stats,
	    zfs_secpolicy_read, B_FALSE, POOL_CHECK_NONE);
	zfs_ioctl_register_pool(ZFS_IOC_POOL_GET_PROPS, zfs_ioc_pool_get_props,
	    zfs_secpolicy_read, B_FALSE, POOL_CHECK_NONE);

	zfs_ioctl_register_pool(ZFS_IOC_ERROR_LOG, zfs_ioc_error_log,
	    zfs_secpolicy_inject, B_FALSE, POOL_CHECK_SUSPENDED);
	zfs_ioctl_register_pool(ZFS_IOC_DSOBJ_TO_DSNAME,
	    zfs_ioc_dsobj_to_dsname,
	    zfs_secpolicy_diff, B_FALSE, POOL_CHECK_SUSPENDED);
	zfs_ioctl_register_pool(ZFS_IOC_POOL_GET_HISTORY,
	    zfs_ioc_pool_get_history,
	    zfs_secpolicy_config, B_FALSE, POOL_CHECK_SUSPENDED);

	zfs_ioctl_register_pool(ZFS_IOC_POOL_IMPORT, zfs_ioc_pool_import,
	    zfs_secpolicy_config, B_TRUE, POOL_CHECK_NONE);

	zfs_ioctl_register_pool(ZFS_IOC_CLEAR, zfs_ioc_clear,
	    zfs_secpolicy_config, B_TRUE, POOL_CHECK_NONE);
	zfs_ioctl_register_pool(ZFS_IOC_POOL_REOPEN, zfs_ioc_pool_reopen,
	    zfs_secpolicy_config, B_TRUE, POOL_CHECK_SUSPENDED);

	/*
	 * Dataset-named ioctls using zfs_secpolicy_read; not logged, and
	 * only the suspended-pool check applies.
	 */
	zfs_ioctl_register_dataset_read(ZFS_IOC_SPACE_WRITTEN,
	    zfs_ioc_space_written);
	zfs_ioctl_register_dataset_read(ZFS_IOC_OBJSET_RECVD_PROPS,
	    zfs_ioc_objset_recvd_props);
	zfs_ioctl_register_dataset_read(ZFS_IOC_NEXT_OBJ,
	    zfs_ioc_next_obj);
	zfs_ioctl_register_dataset_read(ZFS_IOC_GET_FSACL,
	    zfs_ioc_get_fsacl);
	zfs_ioctl_register_dataset_read(ZFS_IOC_OBJSET_STATS,
	    zfs_ioc_objset_stats);
	zfs_ioctl_register_dataset_read(ZFS_IOC_OBJSET_ZPLPROPS,
	    zfs_ioc_objset_zplprops);
	zfs_ioctl_register_dataset_read(ZFS_IOC_DATASET_LIST_NEXT,
	    zfs_ioc_dataset_list_next);
	zfs_ioctl_register_dataset_read(ZFS_IOC_SNAPSHOT_LIST_NEXT,
	    zfs_ioc_snapshot_list_next);
	zfs_ioctl_register_dataset_read(ZFS_IOC_SEND_PROGRESS,
	    zfs_ioc_send_progress);

	/* As above, but each with its own security policy. */
	zfs_ioctl_register_dataset_read_secpolicy(ZFS_IOC_DIFF,
	    zfs_ioc_diff, zfs_secpolicy_diff);
	zfs_ioctl_register_dataset_read_secpolicy(ZFS_IOC_OBJ_TO_STATS,
	    zfs_ioc_obj_to_stats, zfs_secpolicy_diff);
	zfs_ioctl_register_dataset_read_secpolicy(ZFS_IOC_OBJ_TO_PATH,
	    zfs_ioc_obj_to_path, zfs_secpolicy_diff);
	zfs_ioctl_register_dataset_read_secpolicy(ZFS_IOC_USERSPACE_ONE,
	    zfs_ioc_userspace_one, zfs_secpolicy_userspace_one);
	zfs_ioctl_register_dataset_read_secpolicy(ZFS_IOC_USERSPACE_MANY,
	    zfs_ioc_userspace_many, zfs_secpolicy_userspace_many);
	zfs_ioctl_register_dataset_read_secpolicy(ZFS_IOC_SEND,
	    zfs_ioc_send, zfs_secpolicy_send);

	/*
	 * Dataset-named ioctls that are logged and check for a suspended
	 * or read-only pool.
	 */
	zfs_ioctl_register_dataset_modify(ZFS_IOC_SET_PROP, zfs_ioc_set_prop,
	    zfs_secpolicy_none);
	zfs_ioctl_register_dataset_modify(ZFS_IOC_DESTROY, zfs_ioc_destroy,
	    zfs_secpolicy_destroy);
	zfs_ioctl_register_dataset_modify(ZFS_IOC_RENAME, zfs_ioc_rename,
	    zfs_secpolicy_rename);
	zfs_ioctl_register_dataset_modify(ZFS_IOC_RECV, zfs_ioc_recv,
	    zfs_secpolicy_recv);
	zfs_ioctl_register_dataset_modify(ZFS_IOC_PROMOTE, zfs_ioc_promote,
	    zfs_secpolicy_promote);
	zfs_ioctl_register_dataset_modify(ZFS_IOC_INHERIT_PROP,
	    zfs_ioc_inherit_prop, zfs_secpolicy_inherit_prop);
	zfs_ioctl_register_dataset_modify(ZFS_IOC_SET_FSACL, zfs_ioc_set_fsacl,
	    zfs_secpolicy_set_fsacl);

	/* Dataset-named ioctls that are never logged. */
	zfs_ioctl_register_dataset_nolog(ZFS_IOC_SHARE, zfs_ioc_share,
	    zfs_secpolicy_share, POOL_CHECK_NONE);
	zfs_ioctl_register_dataset_nolog(ZFS_IOC_SMB_ACL, zfs_ioc_smb_acl,
	    zfs_secpolicy_smb_acl, POOL_CHECK_NONE);
	zfs_ioctl_register_dataset_nolog(ZFS_IOC_USERSPACE_UPGRADE,
	    zfs_ioc_userspace_upgrade, zfs_secpolicy_userspace_upgrade,
	    POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY);
	zfs_ioctl_register_dataset_nolog(ZFS_IOC_TMP_SNAPSHOT,
	    zfs_ioc_tmp_snapshot, zfs_secpolicy_tmp_snapshot,
	    POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY);
}
5749 5752
5750 5753 int
5751 5754 pool_status_check(const char *name, zfs_ioc_namecheck_t type,
5752 5755 zfs_ioc_poolcheck_t check)
5753 5756 {
5754 5757 spa_t *spa;
5755 5758 int error;
5756 5759
5757 5760 ASSERT(type == POOL_NAME || type == DATASET_NAME);
5758 5761
5759 5762 if (check & POOL_CHECK_NONE)
5760 5763 return (0);
5761 5764
5762 5765 error = spa_open(name, &spa, FTAG);
5763 5766 if (error == 0) {
5764 5767 if ((check & POOL_CHECK_SUSPENDED) && spa_suspended(spa))
5765 5768 error = SET_ERROR(EAGAIN);
5766 5769 else if ((check & POOL_CHECK_READONLY) && !spa_writeable(spa))
5767 5770 error = SET_ERROR(EROFS);
5768 5771 spa_close(spa, FTAG);
5769 5772 }
5770 5773 return (error);
5771 5774 }
5772 5775
5773 5776 /*
5774 5777 * Find a free minor number.
5775 5778 */
5776 5779 minor_t
5777 5780 zfsdev_minor_alloc(void)
5778 5781 {
5779 5782 static minor_t last_minor;
5780 5783 minor_t m;
5781 5784
5782 5785 ASSERT(MUTEX_HELD(&zfsdev_state_lock));
5783 5786
5784 5787 for (m = last_minor + 1; m != last_minor; m++) {
5785 5788 if (m > ZFSDEV_MAX_MINOR)
5786 5789 m = 1;
5787 5790 if (ddi_get_soft_state(zfsdev_state, m) == NULL) {
5788 5791 last_minor = m;
5789 5792 return (m);
5790 5793 }
5791 5794 }
5792 5795
5793 5796 return (0);
5794 5797 }
5795 5798
5796 5799 static int
5797 5800 zfs_ctldev_init(dev_t *devp)
5798 5801 {
5799 5802 minor_t minor;
5800 5803 zfs_soft_state_t *zs;
5801 5804
5802 5805 ASSERT(MUTEX_HELD(&zfsdev_state_lock));
5803 5806 ASSERT(getminor(*devp) == 0);
5804 5807
5805 5808 minor = zfsdev_minor_alloc();
5806 5809 if (minor == 0)
5807 5810 return (SET_ERROR(ENXIO));
5808 5811
5809 5812 if (ddi_soft_state_zalloc(zfsdev_state, minor) != DDI_SUCCESS)
5810 5813 return (SET_ERROR(EAGAIN));
5811 5814
5812 5815 *devp = makedevice(getemajor(*devp), minor);
5813 5816
5814 5817 zs = ddi_get_soft_state(zfsdev_state, minor);
5815 5818 zs->zss_type = ZSST_CTLDEV;
5816 5819 zfs_onexit_init((zfs_onexit_t **)&zs->zss_data);
5817 5820
5818 5821 return (0);
5819 5822 }
5820 5823
5821 5824 static void
5822 5825 zfs_ctldev_destroy(zfs_onexit_t *zo, minor_t minor)
5823 5826 {
5824 5827 ASSERT(MUTEX_HELD(&zfsdev_state_lock));
5825 5828
5826 5829 zfs_onexit_destroy(zo);
5827 5830 ddi_soft_state_free(zfsdev_state, minor);
5828 5831 }
5829 5832
5830 5833 void *
5831 5834 zfsdev_get_soft_state(minor_t minor, enum zfs_soft_state_type which)
5832 5835 {
5833 5836 zfs_soft_state_t *zp;
5834 5837
5835 5838 zp = ddi_get_soft_state(zfsdev_state, minor);
5836 5839 if (zp == NULL || zp->zss_type != which)
5837 5840 return (NULL);
5838 5841
5839 5842 return (zp->zss_data);
5840 5843 }
5841 5844
5842 5845 static int
5843 5846 zfsdev_open(dev_t *devp, int flag, int otyp, cred_t *cr)
5844 5847 {
5845 5848 int error = 0;
5846 5849
5847 5850 if (getminor(*devp) != 0)
5848 5851 return (zvol_open(devp, flag, otyp, cr));
5849 5852
5850 5853 /* This is the control device. Allocate a new minor if requested. */
5851 5854 if (flag & FEXCL) {
5852 5855 mutex_enter(&zfsdev_state_lock);
5853 5856 error = zfs_ctldev_init(devp);
5854 5857 mutex_exit(&zfsdev_state_lock);
5855 5858 }
5856 5859
5857 5860 return (error);
5858 5861 }
5859 5862
5860 5863 static int
5861 5864 zfsdev_close(dev_t dev, int flag, int otyp, cred_t *cr)
5862 5865 {
5863 5866 zfs_onexit_t *zo;
5864 5867 minor_t minor = getminor(dev);
5865 5868
5866 5869 if (minor == 0)
5867 5870 return (0);
5868 5871
5869 5872 mutex_enter(&zfsdev_state_lock);
5870 5873 zo = zfsdev_get_soft_state(minor, ZSST_CTLDEV);
5871 5874 if (zo == NULL) {
5872 5875 mutex_exit(&zfsdev_state_lock);
5873 5876 return (zvol_close(dev, flag, otyp, cr));
5874 5877 }
5875 5878 zfs_ctldev_destroy(zo, minor);
5876 5879 mutex_exit(&zfsdev_state_lock);
5877 5880
5878 5881 return (0);
5879 5882 }
5880 5883
/*
 * ioctl(9E) entry point for the zfs driver.
 *
 * A request on a non-zero minor that has no ZSST_CTLDEV soft state is
 * handed to zvol_ioctl().  Otherwise cmd is converted to an index into
 * zfs_ioc_vec[], the caller's zfs_cmd_t is copied in, the optional input
 * nvlist is unpacked, zc_name is validated according to the vector's
 * zvec_namecheck, the vector's security policy is run (skipped when
 * FKIOCTL is set in flag), and finally either the nvlist-based zvec_func
 * or the zvec_legacy_func handler is invoked.  Every path that reaches
 * the "out" label copies the zfs_cmd_t back to the caller.
 *
 * Returns 0 on success or an errno value.
 */
5881 5884 static int
5882 5885 zfsdev_ioctl(dev_t dev, int cmd, intptr_t arg, int flag, cred_t *cr, int *rvalp)
5883 5886 {
5884 5887 zfs_cmd_t *zc;
5885 5888 uint_t vecnum;
5886 5889 int error, rc, len;
5887 5890 minor_t minor = getminor(dev);
5888 5891 const zfs_ioc_vec_t *vec;
5889 5892 char *saved_poolname = NULL;
5890 5893 nvlist_t *innvl = NULL;
5891 5894
5892 5895 if (minor != 0 &&
5893 5896 zfsdev_get_soft_state(minor, ZSST_CTLDEV) == NULL)
5894 5897 return (zvol_ioctl(dev, cmd, arg, flag, cr, rvalp));
5895 5898
/*
 * vecnum is unsigned, so a cmd below ZFS_IOC_FIRST wraps to a large value
 * and is rejected by the bounds check below as well.
 */
5896 5899 vecnum = cmd - ZFS_IOC_FIRST;
5897 5900 ASSERT3U(getmajor(dev), ==, ddi_driver_major(zfs_dip));
5898 5901
5899 5902 if (vecnum >= sizeof (zfs_ioc_vec) / sizeof (zfs_ioc_vec[0]))
5900 5903 return (SET_ERROR(EINVAL));
5901 5904 vec = &zfs_ioc_vec[vecnum];
5902 5905
5903 5906 zc = kmem_zalloc(sizeof (zfs_cmd_t), KM_SLEEP);
5904 5907
5905 5908 error = ddi_copyin((void *)arg, zc, sizeof (zfs_cmd_t), flag);
5906 5909 if (error != 0) {
5907 5910 error = SET_ERROR(EFAULT);
5908 5911 goto out;
5909 5912 }
5910 5913
/* Only the FKIOCTL bit of flag is kept in zc_iflags. */
5911 5914 zc->zc_iflags = flag & FKIOCTL;
5912 5915 if (zc->zc_nvlist_src_size != 0) {
5913 5916 error = get_nvlist(zc->zc_nvlist_src, zc->zc_nvlist_src_size,
5914 5917 zc->zc_iflags, &innvl);
5915 5918 if (error != 0)
5916 5919 goto out;
5917 5920 }
5918 5921
5919 5922 /*
5920 5923 * Ensure that all pool/dataset names are valid before we pass down to
5921 5924 * the lower layers.
5922 5925 */
/* Force NUL termination of the copied-in name before it is checked. */
5923 5926 zc->zc_name[sizeof (zc->zc_name) - 1] = '\0';
5924 5927 switch (vec->zvec_namecheck) {
5925 5928 case POOL_NAME:
5926 5929 if (pool_namecheck(zc->zc_name, NULL, NULL) != 0)
5927 5930 error = SET_ERROR(EINVAL);
5928 5931 else
5929 5932 error = pool_status_check(zc->zc_name,
5930 5933 vec->zvec_namecheck, vec->zvec_pool_check);
5931 5934 break;
5932 5935
5933 5936 case DATASET_NAME:
5934 5937 if (dataset_namecheck(zc->zc_name, NULL, NULL) != 0)
5935 5938 error = SET_ERROR(EINVAL);
5936 5939 else
5937 5940 error = pool_status_check(zc->zc_name,
5938 5941 vec->zvec_namecheck, vec->zvec_pool_check);
5939 5942 break;
5940 5943
5941 5944 case NO_NAME:
5942 5945 break;
5943 5946 }
5944 5947
5945 5948
/* The security policy is not consulted when FKIOCTL is set in flag. */
5946 5949 if (error == 0 && !(flag & FKIOCTL))
5947 5950 error = vec->zvec_secpolicy(zc, innvl, cr);
5948 5951
5949 5952 if (error != 0)
5950 5953 goto out;
5951 5954
5952 5955 /* legacy ioctls can modify zc_name */
/*
 * Save the leading component of zc_name (everything before the first
 * '/', '@' or '#'); len includes room for the terminating NUL.
 */
5953 5956 len = strcspn(zc->zc_name, "/@#") + 1;
5954 5957 saved_poolname = kmem_alloc(len, KM_SLEEP);
5955 5958 (void) strlcpy(saved_poolname, zc->zc_name, len);
5956 5959
5957 5960 if (vec->zvec_func != NULL) {
5958 5961 nvlist_t *outnvl;
5959 5962 int puterror = 0;
5960 5963 spa_t *spa;
5961 5964 nvlist_t *lognv = NULL;
5962 5965
5963 5966 ASSERT(vec->zvec_legacy_func == NULL);
5964 5967
5965 5968 /*
5966 5969 * Add the innvl to the lognv before calling the func,
5967 5970 * in case the func changes the innvl.
5968 5971 */
5969 5972 if (vec->zvec_allow_log) {
5970 5973 lognv = fnvlist_alloc();
5971 5974 fnvlist_add_string(lognv, ZPOOL_HIST_IOCTL,
5972 5975 vec->zvec_name);
5973 5976 if (!nvlist_empty(innvl)) {
5974 5977 fnvlist_add_nvlist(lognv, ZPOOL_HIST_INPUT_NVL,
5975 5978 innvl);
5976 5979 }
5977 5980 }
5978 5981
5979 5982 outnvl = fnvlist_alloc();
5980 5983 error = vec->zvec_func(zc->zc_name, innvl, outnvl);
5981 5984
/*
 * The history record is written only when the handler succeeded, the
 * vector allows logging, and the pool named by zc_name can be opened.
 */
5982 5985 if (error == 0 && vec->zvec_allow_log &&
5983 5986 spa_open(zc->zc_name, &spa, FTAG) == 0) {
5984 5987 if (!nvlist_empty(outnvl)) {
5985 5988 fnvlist_add_nvlist(lognv, ZPOOL_HIST_OUTPUT_NVL,
5986 5989 outnvl);
5987 5990 }
5988 5991 (void) spa_history_log_nvl(spa, lognv);
5989 5992 spa_close(spa, FTAG);
5990 5993 }
5991 5994 fnvlist_free(lognv);
5992 5995
/*
 * If nvlist_smush() fails, outnvl is not handed to put_nvlist() and the
 * smush error itself is not propagated into error.
 */
5993 5996 if (!nvlist_empty(outnvl) || zc->zc_nvlist_dst_size != 0) {
5994 5997 int smusherror = 0;
5995 5998 if (vec->zvec_smush_outnvlist) {
5996 5999 smusherror = nvlist_smush(outnvl,
5997 6000 zc->zc_nvlist_dst_size);
5998 6001 }
5999 6002 if (smusherror == 0)
6000 6003 puterror = put_nvlist(zc, outnvl);
6001 6004 }
6002 6005
/* A failure to return outnvl overrides the handler's own result. */
6003 6006 if (puterror != 0)
6004 6007 error = puterror;
6005 6008
6006 6009 nvlist_free(outnvl);
6007 6010 } else {
6008 6011 error = vec->zvec_legacy_func(zc);
6009 6012 }
6010 6013
6011 6014 out:
6012 6015 nvlist_free(innvl);
6013 6016 rc = ddi_copyout(zc, (void *)arg, sizeof (zfs_cmd_t), flag);
6014 6017 if (error == 0 && rc != 0)
6015 6018 error = SET_ERROR(EFAULT);
/*
 * On success of a loggable ioctl, saved_poolname is stored in
 * thread-specific data under zfs_allow_log_key (any previous value is
 * freed first); in every other case it is freed here.
 */
6016 6019 if (error == 0 && vec->zvec_allow_log) {
6017 6020 char *s = tsd_get(zfs_allow_log_key);
6018 6021 if (s != NULL)
6019 6022 strfree(s);
6020 6023 (void) tsd_set(zfs_allow_log_key, saved_poolname);
6021 6024 } else {
6022 6025 if (saved_poolname != NULL)
6023 6026 strfree(saved_poolname);
6024 6027 }
6025 6028
6026 6029 kmem_free(zc, sizeof (zfs_cmd_t));
6027 6030 return (error);
6028 6031 }
6029 6032
6030 6033 static int
6031 6034 zfs_attach(dev_info_t *dip, ddi_attach_cmd_t cmd)
6032 6035 {
6033 6036 if (cmd != DDI_ATTACH)
6034 6037 return (DDI_FAILURE);
6035 6038
6036 6039 if (ddi_create_minor_node(dip, "zfs", S_IFCHR, 0,
6037 6040 DDI_PSEUDO, 0) == DDI_FAILURE)
6038 6041 return (DDI_FAILURE);
6039 6042
6040 6043 zfs_dip = dip;
6041 6044
6042 6045 ddi_report_dev(dip);
6043 6046
6044 6047 return (DDI_SUCCESS);
6045 6048 }
6046 6049
6047 6050 static int
6048 6051 zfs_detach(dev_info_t *dip, ddi_detach_cmd_t cmd)
6049 6052 {
6050 6053 if (spa_busy() || zfs_busy() || zvol_busy())
6051 6054 return (DDI_FAILURE);
6052 6055
6053 6056 if (cmd != DDI_DETACH)
6054 6057 return (DDI_FAILURE);
6055 6058
6056 6059 zfs_dip = NULL;
6057 6060
6058 6061 ddi_prop_remove_all(dip);
6059 6062 ddi_remove_minor_node(dip, NULL);
6060 6063
6061 6064 return (DDI_SUCCESS);
6062 6065 }
6063 6066
6064 6067 /*ARGSUSED*/
6065 6068 static int
6066 6069 zfs_info(dev_info_t *dip, ddi_info_cmd_t infocmd, void *arg, void **result)
6067 6070 {
6068 6071 switch (infocmd) {
6069 6072 case DDI_INFO_DEVT2DEVINFO:
6070 6073 *result = zfs_dip;
6071 6074 return (DDI_SUCCESS);
6072 6075
6073 6076 case DDI_INFO_DEVT2INSTANCE:
6074 6077 *result = (void *)0;
6075 6078 return (DDI_SUCCESS);
6076 6079 }
6077 6080
6078 6081 return (DDI_FAILURE);
6079 6082 }
6080 6083
6081 6084 /*
6082 6085 * OK, so this is a little weird.
6083 6086 *
6084 6087 * /dev/zfs is the control node, i.e. minor 0.
6085 6088 * /dev/zvol/[r]dsk/pool/dataset are the zvols, minor > 0.
6086 6089 *
6087 6090 * /dev/zfs has basically nothing to do except serve up ioctls,
6088 6091 * so most of the standard driver entry points are in zvol.c.
6089 6092 */
/*
 * Character/block entry points.  open, close and ioctl are the zfsdev_*
 * routines in this file; strategy, dump, read and write point directly at
 * the zvol routines.  The initializer is positional, so entry order matters.
 */
6090 6093 static struct cb_ops zfs_cb_ops = {
6091 6094 zfsdev_open, /* open */
6092 6095 zfsdev_close, /* close */
6093 6096 zvol_strategy, /* strategy */
6094 6097 nodev, /* print */
6095 6098 zvol_dump, /* dump */
6096 6099 zvol_read, /* read */
6097 6100 zvol_write, /* write */
6098 6101 zfsdev_ioctl, /* ioctl */
6099 6102 nodev, /* devmap */
6100 6103 nodev, /* mmap */
6101 6104 nodev, /* segmap */
6102 6105 nochpoll, /* poll */
6103 6106 ddi_prop_op, /* prop_op */
6104 6107 NULL, /* streamtab */
6105 6108 D_NEW | D_MP | D_64BIT, /* Driver compatibility flag */
6106 6109 CB_REV, /* version */
6107 6110 nodev, /* async read */
6108 6111 nodev, /* async write */
6109 6112 };
6110 6113
/*
 * Device operations.  Autoconfiguration goes through zfs_info, zfs_attach
 * and zfs_detach; the cb entry points come from zfs_cb_ops.  The
 * initializer is positional, so entry order matters.
 */
6111 6114 static struct dev_ops zfs_dev_ops = {
6112 6115 DEVO_REV, /* version */
6113 6116 0, /* refcnt */
6114 6117 zfs_info, /* info */
6115 6118 nulldev, /* identify */
6116 6119 nulldev, /* probe */
6117 6120 zfs_attach, /* attach */
6118 6121 zfs_detach, /* detach */
6119 6122 nodev, /* reset */
6120 6123 &zfs_cb_ops, /* driver operations */
6121 6124 NULL, /* no bus operations */
6122 6125 NULL, /* power */
6123 6126 ddi_quiesce_not_needed, /* quiesce */
6124 6127 };
6125 6128
/*
 * Driver linkage: pairs the "ZFS storage pool" description string with
 * zfs_dev_ops under mod_driverops.
 */
6126 6129 static struct modldrv zfs_modldrv = {
6127 6130 &mod_driverops,
6128 6131 "ZFS storage pool",
6129 6132 &zfs_dev_ops
6130 6133 };
6131 6134
/*
 * Module linkage handed to mod_install(), mod_remove() and mod_info().
 * It lists two linkage entries, zfs_modlfs and zfs_modldrv, followed by a
 * NULL terminator.
 */
6132 6135 static struct modlinkage modlinkage = {
6133 6136 MODREV_1,
6134 6137 (void *)&zfs_modlfs,
6135 6138 (void *)&zfs_modldrv,
6136 6139 NULL
6137 6140 };
6138 6141
/*
 * Destructor registered for zfs_allow_log_key: the stored value is a pool
 * name string, which is released with strfree().
 */
static void
zfs_allow_log_destroy(void *arg)
{
	strfree((char *)arg);
}
6145 6148
6146 6149 int
6147 6150 _init(void)
6148 6151 {
6149 6152 int error;
6150 6153
6151 6154 spa_init(FREAD | FWRITE);
6152 6155 zfs_init();
6153 6156 zvol_init();
6154 6157 zfs_ioctl_init();
6155 6158
6156 6159 if ((error = mod_install(&modlinkage)) != 0) {
6157 6160 zvol_fini();
6158 6161 zfs_fini();
6159 6162 spa_fini();
6160 6163 return (error);
6161 6164 }
6162 6165
6163 6166 tsd_create(&zfs_fsyncer_key, NULL);
6164 6167 tsd_create(&rrw_tsd_key, rrw_tsd_destroy);
6165 6168 tsd_create(&zfs_allow_log_key, zfs_allow_log_destroy);
6166 6169
6167 6170 error = ldi_ident_from_mod(&modlinkage, &zfs_li);
6168 6171 ASSERT(error == 0);
6169 6172 mutex_init(&zfs_share_lock, NULL, MUTEX_DEFAULT, NULL);
6170 6173
6171 6174 return (0);
6172 6175 }
6173 6176
6174 6177 int
6175 6178 _fini(void)
6176 6179 {
6177 6180 int error;
6178 6181
6179 6182 if (spa_busy() || zfs_busy() || zvol_busy() || zio_injection_enabled)
6180 6183 return (SET_ERROR(EBUSY));
6181 6184
6182 6185 if ((error = mod_remove(&modlinkage)) != 0)
6183 6186 return (error);
6184 6187
6185 6188 zvol_fini();
6186 6189 zfs_fini();
6187 6190 spa_fini();
6188 6191 if (zfs_nfsshare_inited)
6189 6192 (void) ddi_modclose(nfs_mod);
6190 6193 if (zfs_smbshare_inited)
6191 6194 (void) ddi_modclose(smbsrv_mod);
6192 6195 if (zfs_nfsshare_inited || zfs_smbshare_inited)
6193 6196 (void) ddi_modclose(sharefs_mod);
6194 6197
6195 6198 tsd_destroy(&zfs_fsyncer_key);
6196 6199 ldi_ident_release(zfs_li);
6197 6200 zfs_li = NULL;
6198 6201 mutex_destroy(&zfs_share_lock);
6199 6202
6200 6203 return (error);
6201 6204 }
6202 6205
6203 6206 int
6204 6207 _info(struct modinfo *modinfop)
6205 6208 {
6206 6209 return (mod_info(&modlinkage, modinfop));
6207 6210 }
↓ open down ↓ |
3791 lines elided |
↑ open up ↑ |
XXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXX