Print this page
Matt's code review fixes
| Split |
Close |
| Expand all |
| Collapse all |
--- old/usr/src/uts/common/fs/zfs/zfs_ioctl.c
+++ new/usr/src/uts/common/fs/zfs/zfs_ioctl.c
1 1 /*
2 2 * CDDL HEADER START
3 3 *
4 4 * The contents of this file are subject to the terms of the
5 5 * Common Development and Distribution License (the "License").
6 6 * You may not use this file except in compliance with the License.
7 7 *
8 8 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
9 9 * or http://www.opensolaris.org/os/licensing.
10 10 * See the License for the specific language governing permissions
11 11 * and limitations under the License.
12 12 *
13 13 * When distributing Covered Code, include this CDDL HEADER in each
14 14 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
15 15 * If applicable, add the following below this CDDL HEADER, with the
16 16 * fields enclosed by brackets "[]" replaced with your own identifying
17 17 * information: Portions Copyright [yyyy] [name of copyright owner]
18 18 *
19 19 * CDDL HEADER END
20 20 */
21 21
22 22 /*
23 23 * Copyright (c) 2005, 2010, Oracle and/or its affiliates. All rights reserved.
24 24 * Portions Copyright 2011 Martin Matuska
25 25 * Copyright 2015 Nexenta Systems, Inc. All rights reserved.
26 26 * Copyright (c) 2014, Joyent, Inc. All rights reserved.
27 27 * Copyright (c) 2011, 2015 by Delphix. All rights reserved.
28 28 * Copyright (c) 2013 by Saso Kiselkov. All rights reserved.
29 29 * Copyright (c) 2013 Steven Hartland. All rights reserved.
30 30 */
31 31
32 32 /*
33 33 * ZFS ioctls.
34 34 *
35 35 * This file handles the ioctls to /dev/zfs, used for configuring ZFS storage
36 36 * pools and filesystems, e.g. with /sbin/zfs and /sbin/zpool.
37 37 *
38 38 * There are two ways that we handle ioctls: the legacy way where almost
39 39 * all of the logic is in the ioctl callback, and the new way where most
40 40 * of the marshalling is handled in the common entry point, zfsdev_ioctl().
41 41 *
42 42 * Non-legacy ioctls should be registered by calling
43 43 * zfs_ioctl_register() from zfs_ioctl_init(). The ioctl is invoked
44 44 * from userland by lzc_ioctl().
45 45 *
46 46 * The registration arguments are as follows:
47 47 *
48 48 * const char *name
49 49 * The name of the ioctl. This is used for history logging. If the
50 50 * ioctl returns successfully (the callback returns 0), and allow_log
51 51 * is true, then a history log entry will be recorded with the input &
52 52 * output nvlists. The log entry can be printed with "zpool history -i".
53 53 *
54 54 * zfs_ioc_t ioc
55 55 * The ioctl request number, which userland will pass to ioctl(2).
56 56 * The ioctl numbers can change from release to release, because
57 57 * the caller (libzfs) must be matched to the kernel.
58 58 *
59 59 * zfs_secpolicy_func_t *secpolicy
60 60 * This function will be called before the zfs_ioc_func_t, to
61 61 * determine if this operation is permitted. It should return EPERM
62 62 * on failure, and 0 on success. Checks include determining if the
63 63 * dataset is visible in this zone, and if the user has either all
64 64 * zfs privileges in the zone (SYS_MOUNT), or has been granted permission
65 65 * to do this operation on this dataset with "zfs allow".
66 66 *
67 67 * zfs_ioc_namecheck_t namecheck
68 68 * This specifies what to expect in the zfs_cmd_t:zc_name -- a pool
69 69 * name, a dataset name, or nothing. If the name is not well-formed,
70 70 * the ioctl will fail and the callback will not be called.
71 71 * Therefore, the callback can assume that the name is well-formed
72 72 * (e.g. is null-terminated, doesn't have more than one '@' character,
73 73 * doesn't have invalid characters).
74 74 *
75 75 * zfs_ioc_poolcheck_t pool_check
76 76 * This specifies requirements on the pool state. If the pool does
77 77 * not meet them (is suspended or is readonly), the ioctl will fail
78 78 * and the callback will not be called. If any checks are specified
79 79 * (i.e. it is not POOL_CHECK_NONE), namecheck must not be NO_NAME.
80 80 * Multiple checks can be or-ed together (e.g. POOL_CHECK_SUSPENDED |
81 81 * POOL_CHECK_READONLY).
82 82 *
83 83 * boolean_t smush_outnvlist
84 84 * If smush_outnvlist is true, then the output is presumed to be a
85 85 * list of errors, and it will be "smushed" down to fit into the
86 86 * caller's buffer, by removing some entries and replacing them with a
87 87 * single "N_MORE_ERRORS" entry indicating how many were removed. See
88 88 * nvlist_smush() for details. If smush_outnvlist is false, and the
89 89 * outnvlist does not fit into the userland-provided buffer, then the
90 90 * ioctl will fail with ENOMEM.
91 91 *
92 92 * zfs_ioc_func_t *func
93 93 * The callback function that will perform the operation.
94 94 *
95 95 * The callback should return 0 on success, or an error number on
96 96 * failure. If the function fails, the userland ioctl will return -1,
97 97 * and errno will be set to the callback's return value. The callback
98 98 * will be called with the following arguments:
99 99 *
100 100 * const char *name
101 101 * The name of the pool or dataset to operate on, from
102 102 * zfs_cmd_t:zc_name. The 'namecheck' argument specifies the
103 103 * expected type (pool, dataset, or none).
104 104 *
105 105 * nvlist_t *innvl
106 106 * The input nvlist, deserialized from zfs_cmd_t:zc_nvlist_src. Or
107 107 * NULL if no input nvlist was provided. Changes to this nvlist are
108 108 * ignored. If the input nvlist could not be deserialized, the
109 109 * ioctl will fail and the callback will not be called.
110 110 *
111 111 * nvlist_t *outnvl
112 112 * The output nvlist, initially empty. The callback can fill it in,
113 113 * and it will be returned to userland by serializing it into
114 114 * zfs_cmd_t:zc_nvlist_dst. If it is non-empty, and serialization
115 115 * fails (e.g. because the caller didn't supply a large enough
116 116 * buffer), then the overall ioctl will fail. See the
117 117 * 'smush_nvlist' argument above for additional behaviors.
118 118 *
119 119 * There are two typical uses of the output nvlist:
120 120 * - To return state, e.g. property values. In this case,
121 121 * smush_outnvlist should be false. If the buffer was not large
122 122 * enough, the caller will reallocate a larger buffer and try
123 123 * the ioctl again.
124 124 *
125 125 * - To return multiple errors from an ioctl which makes on-disk
126 126 * changes. In this case, smush_outnvlist should be true.
127 127 * Ioctls which make on-disk modifications should generally not
128 128 * use the outnvl if they succeed, because the caller can not
129 129 * distinguish between the operation failing, and
130 130 * deserialization failing.
131 131 */
132 132
133 133 #include <sys/types.h>
134 134 #include <sys/param.h>
135 135 #include <sys/errno.h>
136 136 #include <sys/uio.h>
137 137 #include <sys/buf.h>
138 138 #include <sys/modctl.h>
139 139 #include <sys/open.h>
140 140 #include <sys/file.h>
141 141 #include <sys/kmem.h>
142 142 #include <sys/conf.h>
143 143 #include <sys/cmn_err.h>
144 144 #include <sys/stat.h>
145 145 #include <sys/zfs_ioctl.h>
146 146 #include <sys/zfs_vfsops.h>
147 147 #include <sys/zfs_znode.h>
148 148 #include <sys/zap.h>
149 149 #include <sys/spa.h>
150 150 #include <sys/spa_impl.h>
151 151 #include <sys/vdev.h>
152 152 #include <sys/priv_impl.h>
153 153 #include <sys/dmu.h>
154 154 #include <sys/dsl_dir.h>
155 155 #include <sys/dsl_dataset.h>
156 156 #include <sys/dsl_prop.h>
157 157 #include <sys/dsl_deleg.h>
158 158 #include <sys/dmu_objset.h>
159 159 #include <sys/dmu_impl.h>
160 160 #include <sys/dmu_tx.h>
161 161 #include <sys/ddi.h>
162 162 #include <sys/sunddi.h>
163 163 #include <sys/sunldi.h>
164 164 #include <sys/policy.h>
165 165 #include <sys/zone.h>
166 166 #include <sys/nvpair.h>
167 167 #include <sys/pathname.h>
168 168 #include <sys/mount.h>
169 169 #include <sys/sdt.h>
170 170 #include <sys/fs/zfs.h>
171 171 #include <sys/zfs_ctldir.h>
172 172 #include <sys/zfs_dir.h>
173 173 #include <sys/zfs_onexit.h>
174 174 #include <sys/zvol.h>
175 175 #include <sys/dsl_scan.h>
176 176 #include <sharefs/share.h>
177 177 #include <sys/dmu_objset.h>
178 178 #include <sys/dmu_send.h>
179 179 #include <sys/dsl_destroy.h>
180 180 #include <sys/dsl_bookmark.h>
181 181 #include <sys/dsl_userhold.h>
182 182 #include <sys/zfeature.h>
183 183 #include <sys/zio_checksum.h>
184 184
185 185 #include "zfs_namecheck.h"
186 186 #include "zfs_prop.h"
187 187 #include "zfs_deleg.h"
188 188 #include "zfs_comutil.h"
189 189
190 190 extern struct modlfs zfs_modlfs;
191 191
192 192 extern void zfs_init(void);
193 193 extern void zfs_fini(void);
194 194
195 195 ldi_ident_t zfs_li = NULL;
196 196 dev_info_t *zfs_dip;
197 197
198 198 uint_t zfs_fsyncer_key;
199 199 extern uint_t rrw_tsd_key;
200 200 static uint_t zfs_allow_log_key;
201 201
202 202 typedef int zfs_ioc_legacy_func_t(zfs_cmd_t *);
203 203 typedef int zfs_ioc_func_t(const char *, nvlist_t *, nvlist_t *);
204 204 typedef int zfs_secpolicy_func_t(zfs_cmd_t *, nvlist_t *, cred_t *);
205 205
206 206 typedef enum {
207 207 NO_NAME,
208 208 POOL_NAME,
209 209 DATASET_NAME
210 210 } zfs_ioc_namecheck_t;
211 211
212 212 typedef enum {
213 213 POOL_CHECK_NONE = 1 << 0,
214 214 POOL_CHECK_SUSPENDED = 1 << 1,
215 215 POOL_CHECK_READONLY = 1 << 2,
216 216 } zfs_ioc_poolcheck_t;
217 217
218 218 typedef struct zfs_ioc_vec {
219 219 zfs_ioc_legacy_func_t *zvec_legacy_func;
220 220 zfs_ioc_func_t *zvec_func;
221 221 zfs_secpolicy_func_t *zvec_secpolicy;
222 222 zfs_ioc_namecheck_t zvec_namecheck;
223 223 boolean_t zvec_allow_log;
224 224 zfs_ioc_poolcheck_t zvec_pool_check;
225 225 boolean_t zvec_smush_outnvlist;
226 226 const char *zvec_name;
227 227 } zfs_ioc_vec_t;
228 228
229 229 /* This array is indexed by zfs_userquota_prop_t */
230 230 static const char *userquota_perms[] = {
231 231 ZFS_DELEG_PERM_USERUSED,
232 232 ZFS_DELEG_PERM_USERQUOTA,
233 233 ZFS_DELEG_PERM_GROUPUSED,
234 234 ZFS_DELEG_PERM_GROUPQUOTA,
235 235 };
236 236
237 237 static int zfs_ioc_userspace_upgrade(zfs_cmd_t *zc);
238 238 static int zfs_check_settable(const char *name, nvpair_t *property,
239 239 cred_t *cr);
240 240 static int zfs_check_clearable(char *dataset, nvlist_t *props,
241 241 nvlist_t **errors);
242 242 static int zfs_fill_zplprops_root(uint64_t, nvlist_t *, nvlist_t *,
243 243 boolean_t *);
244 244 int zfs_set_prop_nvlist(const char *, zprop_source_t, nvlist_t *, nvlist_t *);
245 245 static int get_nvlist(uint64_t nvl, uint64_t size, int iflag, nvlist_t **nvp);
246 246
247 247 static int zfs_prop_activate_feature(spa_t *spa, spa_feature_t feature);
248 248
249 249 /* _NOTE(PRINTFLIKE(4)) - this is printf-like, but lint is too whiney */
250 250 void
251 251 __dprintf(const char *file, const char *func, int line, const char *fmt, ...)
252 252 {
253 253 const char *newfile;
254 254 char buf[512];
255 255 va_list adx;
256 256
257 257 /*
258 258 * Get rid of annoying "../common/" prefix to filename.
259 259 */
260 260 newfile = strrchr(file, '/');
261 261 if (newfile != NULL) {
262 262 newfile = newfile + 1; /* Get rid of leading / */
263 263 } else {
264 264 newfile = file;
265 265 }
266 266
267 267 va_start(adx, fmt);
268 268 (void) vsnprintf(buf, sizeof (buf), fmt, adx);
269 269 va_end(adx);
270 270
271 271 /*
272 272 * To get this data, use the zfs-dprintf probe as so:
273 273 * dtrace -q -n 'zfs-dprintf \
274 274 * /stringof(arg0) == "dbuf.c"/ \
275 275 * {printf("%s: %s", stringof(arg1), stringof(arg3))}'
276 276 * arg0 = file name
277 277 * arg1 = function name
278 278 * arg2 = line number
279 279 * arg3 = message
280 280 */
281 281 DTRACE_PROBE4(zfs__dprintf,
282 282 char *, newfile, char *, func, int, line, char *, buf);
283 283 }
284 284
285 285 static void
286 286 history_str_free(char *buf)
287 287 {
288 288 kmem_free(buf, HIS_MAX_RECORD_LEN);
289 289 }
290 290
291 291 static char *
292 292 history_str_get(zfs_cmd_t *zc)
293 293 {
294 294 char *buf;
295 295
296 296 if (zc->zc_history == NULL)
297 297 return (NULL);
298 298
299 299 buf = kmem_alloc(HIS_MAX_RECORD_LEN, KM_SLEEP);
300 300 if (copyinstr((void *)(uintptr_t)zc->zc_history,
301 301 buf, HIS_MAX_RECORD_LEN, NULL) != 0) {
302 302 history_str_free(buf);
303 303 return (NULL);
304 304 }
305 305
306 306 buf[HIS_MAX_RECORD_LEN -1] = '\0';
307 307
308 308 return (buf);
309 309 }
310 310
311 311 /*
312 312 * Check to see if the named dataset is currently defined as bootable
313 313 */
314 314 static boolean_t
315 315 zfs_is_bootfs(const char *name)
316 316 {
317 317 objset_t *os;
318 318
319 319 if (dmu_objset_hold(name, FTAG, &os) == 0) {
320 320 boolean_t ret;
321 321 ret = (dmu_objset_id(os) == spa_bootfs(dmu_objset_spa(os)));
322 322 dmu_objset_rele(os, FTAG);
323 323 return (ret);
324 324 }
325 325 return (B_FALSE);
326 326 }
327 327
328 328 /*
329 329 * Return non-zero if the spa version is less than requested version.
330 330 */
331 331 static int
332 332 zfs_earlier_version(const char *name, int version)
333 333 {
334 334 spa_t *spa;
335 335
336 336 if (spa_open(name, &spa, FTAG) == 0) {
337 337 if (spa_version(spa) < version) {
338 338 spa_close(spa, FTAG);
339 339 return (1);
340 340 }
341 341 spa_close(spa, FTAG);
342 342 }
343 343 return (0);
344 344 }
345 345
346 346 /*
347 347 * Return TRUE if the ZPL version is less than requested version.
348 348 */
349 349 static boolean_t
350 350 zpl_earlier_version(const char *name, int version)
351 351 {
352 352 objset_t *os;
353 353 boolean_t rc = B_TRUE;
354 354
355 355 if (dmu_objset_hold(name, FTAG, &os) == 0) {
356 356 uint64_t zplversion;
357 357
358 358 if (dmu_objset_type(os) != DMU_OST_ZFS) {
359 359 dmu_objset_rele(os, FTAG);
360 360 return (B_TRUE);
361 361 }
362 362 /* XXX reading from non-owned objset */
363 363 if (zfs_get_zplprop(os, ZFS_PROP_VERSION, &zplversion) == 0)
364 364 rc = zplversion < version;
365 365 dmu_objset_rele(os, FTAG);
366 366 }
367 367 return (rc);
368 368 }
369 369
370 370 static void
371 371 zfs_log_history(zfs_cmd_t *zc)
372 372 {
373 373 spa_t *spa;
374 374 char *buf;
375 375
376 376 if ((buf = history_str_get(zc)) == NULL)
377 377 return;
378 378
379 379 if (spa_open(zc->zc_name, &spa, FTAG) == 0) {
380 380 if (spa_version(spa) >= SPA_VERSION_ZPOOL_HISTORY)
381 381 (void) spa_history_log(spa, buf);
382 382 spa_close(spa, FTAG);
383 383 }
384 384 history_str_free(buf);
385 385 }
386 386
387 387 /*
388 388 * Policy for top-level read operations (list pools). Requires no privileges,
389 389 * and can be used in the local zone, as there is no associated dataset.
390 390 */
391 391 /* ARGSUSED */
392 392 static int
393 393 zfs_secpolicy_none(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
394 394 {
395 395 return (0);
396 396 }
397 397
398 398 /*
399 399 * Policy for dataset read operations (list children, get statistics). Requires
400 400 * no privileges, but must be visible in the local zone.
401 401 */
402 402 /* ARGSUSED */
403 403 static int
404 404 zfs_secpolicy_read(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
405 405 {
406 406 if (INGLOBALZONE(curproc) ||
407 407 zone_dataset_visible(zc->zc_name, NULL))
408 408 return (0);
409 409
410 410 return (SET_ERROR(ENOENT));
411 411 }
412 412
413 413 static int
414 414 zfs_dozonecheck_impl(const char *dataset, uint64_t zoned, cred_t *cr)
415 415 {
416 416 int writable = 1;
417 417
418 418 /*
419 419 * The dataset must be visible by this zone -- check this first
420 420 * so they don't see EPERM on something they shouldn't know about.
421 421 */
422 422 if (!INGLOBALZONE(curproc) &&
423 423 !zone_dataset_visible(dataset, &writable))
424 424 return (SET_ERROR(ENOENT));
425 425
426 426 if (INGLOBALZONE(curproc)) {
427 427 /*
428 428 * If the fs is zoned, only root can access it from the
429 429 * global zone.
430 430 */
431 431 if (secpolicy_zfs(cr) && zoned)
432 432 return (SET_ERROR(EPERM));
433 433 } else {
434 434 /*
435 435 * If we are in a local zone, the 'zoned' property must be set.
436 436 */
437 437 if (!zoned)
438 438 return (SET_ERROR(EPERM));
439 439
440 440 /* must be writable by this zone */
441 441 if (!writable)
442 442 return (SET_ERROR(EPERM));
443 443 }
444 444 return (0);
445 445 }
446 446
447 447 static int
448 448 zfs_dozonecheck(const char *dataset, cred_t *cr)
449 449 {
450 450 uint64_t zoned;
451 451
452 452 if (dsl_prop_get_integer(dataset, "zoned", &zoned, NULL))
453 453 return (SET_ERROR(ENOENT));
454 454
455 455 return (zfs_dozonecheck_impl(dataset, zoned, cr));
456 456 }
457 457
458 458 static int
459 459 zfs_dozonecheck_ds(const char *dataset, dsl_dataset_t *ds, cred_t *cr)
460 460 {
461 461 uint64_t zoned;
462 462
463 463 if (dsl_prop_get_int_ds(ds, "zoned", &zoned))
464 464 return (SET_ERROR(ENOENT));
465 465
466 466 return (zfs_dozonecheck_impl(dataset, zoned, cr));
467 467 }
468 468
469 469 static int
470 470 zfs_secpolicy_write_perms_ds(const char *name, dsl_dataset_t *ds,
471 471 const char *perm, cred_t *cr)
472 472 {
473 473 int error;
474 474
475 475 error = zfs_dozonecheck_ds(name, ds, cr);
476 476 if (error == 0) {
477 477 error = secpolicy_zfs(cr);
478 478 if (error != 0)
479 479 error = dsl_deleg_access_impl(ds, perm, cr);
480 480 }
481 481 return (error);
482 482 }
483 483
484 484 static int
485 485 zfs_secpolicy_write_perms(const char *name, const char *perm, cred_t *cr)
486 486 {
487 487 int error;
488 488 dsl_dataset_t *ds;
489 489 dsl_pool_t *dp;
490 490
491 491 error = dsl_pool_hold(name, FTAG, &dp);
492 492 if (error != 0)
493 493 return (error);
494 494
495 495 error = dsl_dataset_hold(dp, name, FTAG, &ds);
496 496 if (error != 0) {
497 497 dsl_pool_rele(dp, FTAG);
498 498 return (error);
499 499 }
500 500
501 501 error = zfs_secpolicy_write_perms_ds(name, ds, perm, cr);
502 502
503 503 dsl_dataset_rele(ds, FTAG);
504 504 dsl_pool_rele(dp, FTAG);
505 505 return (error);
506 506 }
507 507
508 508 /*
509 509 * Policy for setting the security label property.
510 510 *
511 511 * Returns 0 for success, non-zero for access and other errors.
512 512 */
513 513 static int
514 514 zfs_set_slabel_policy(const char *name, char *strval, cred_t *cr)
515 515 {
516 516 char ds_hexsl[MAXNAMELEN];
517 517 bslabel_t ds_sl, new_sl;
518 518 boolean_t new_default = FALSE;
519 519 uint64_t zoned;
520 520 int needed_priv = -1;
521 521 int error;
522 522
523 523 /* First get the existing dataset label. */
524 524 error = dsl_prop_get(name, zfs_prop_to_name(ZFS_PROP_MLSLABEL),
525 525 1, sizeof (ds_hexsl), &ds_hexsl, NULL);
526 526 if (error != 0)
527 527 return (SET_ERROR(EPERM));
528 528
529 529 if (strcasecmp(strval, ZFS_MLSLABEL_DEFAULT) == 0)
530 530 new_default = TRUE;
531 531
532 532 /* The label must be translatable */
533 533 if (!new_default && (hexstr_to_label(strval, &new_sl) != 0))
534 534 return (SET_ERROR(EINVAL));
535 535
536 536 /*
537 537 * In a non-global zone, disallow attempts to set a label that
538 538 * doesn't match that of the zone; otherwise no other checks
539 539 * are needed.
540 540 */
541 541 if (!INGLOBALZONE(curproc)) {
542 542 if (new_default || !blequal(&new_sl, CR_SL(CRED())))
543 543 return (SET_ERROR(EPERM));
544 544 return (0);
545 545 }
546 546
547 547 /*
548 548 * For global-zone datasets (i.e., those whose zoned property is
549 549 * "off", verify that the specified new label is valid for the
550 550 * global zone.
551 551 */
552 552 if (dsl_prop_get_integer(name,
553 553 zfs_prop_to_name(ZFS_PROP_ZONED), &zoned, NULL))
554 554 return (SET_ERROR(EPERM));
555 555 if (!zoned) {
556 556 if (zfs_check_global_label(name, strval) != 0)
557 557 return (SET_ERROR(EPERM));
558 558 }
559 559
560 560 /*
561 561 * If the existing dataset label is nondefault, check if the
562 562 * dataset is mounted (label cannot be changed while mounted).
563 563 * Get the zfsvfs; if there isn't one, then the dataset isn't
564 564 * mounted (or isn't a dataset, doesn't exist, ...).
565 565 */
566 566 if (strcasecmp(ds_hexsl, ZFS_MLSLABEL_DEFAULT) != 0) {
567 567 objset_t *os;
568 568 static char *setsl_tag = "setsl_tag";
569 569
570 570 /*
571 571 * Try to own the dataset; abort if there is any error,
572 572 * (e.g., already mounted, in use, or other error).
573 573 */
574 574 error = dmu_objset_own(name, DMU_OST_ZFS, B_TRUE,
575 575 setsl_tag, &os);
576 576 if (error != 0)
577 577 return (SET_ERROR(EPERM));
578 578
579 579 dmu_objset_disown(os, setsl_tag);
580 580
581 581 if (new_default) {
582 582 needed_priv = PRIV_FILE_DOWNGRADE_SL;
583 583 goto out_check;
584 584 }
585 585
586 586 if (hexstr_to_label(strval, &new_sl) != 0)
587 587 return (SET_ERROR(EPERM));
588 588
589 589 if (blstrictdom(&ds_sl, &new_sl))
590 590 needed_priv = PRIV_FILE_DOWNGRADE_SL;
591 591 else if (blstrictdom(&new_sl, &ds_sl))
592 592 needed_priv = PRIV_FILE_UPGRADE_SL;
593 593 } else {
594 594 /* dataset currently has a default label */
595 595 if (!new_default)
596 596 needed_priv = PRIV_FILE_UPGRADE_SL;
597 597 }
598 598
599 599 out_check:
600 600 if (needed_priv != -1)
601 601 return (PRIV_POLICY(cr, needed_priv, B_FALSE, EPERM, NULL));
602 602 return (0);
603 603 }
604 604
605 605 static int
606 606 zfs_secpolicy_setprop(const char *dsname, zfs_prop_t prop, nvpair_t *propval,
607 607 cred_t *cr)
608 608 {
609 609 char *strval;
610 610
611 611 /*
612 612 * Check permissions for special properties.
613 613 */
614 614 switch (prop) {
615 615 case ZFS_PROP_ZONED:
616 616 /*
617 617 * Disallow setting of 'zoned' from within a local zone.
618 618 */
619 619 if (!INGLOBALZONE(curproc))
620 620 return (SET_ERROR(EPERM));
621 621 break;
622 622
623 623 case ZFS_PROP_QUOTA:
624 624 case ZFS_PROP_FILESYSTEM_LIMIT:
625 625 case ZFS_PROP_SNAPSHOT_LIMIT:
626 626 if (!INGLOBALZONE(curproc)) {
627 627 uint64_t zoned;
628 628 char setpoint[MAXNAMELEN];
629 629 /*
630 630 * Unprivileged users are allowed to modify the
631 631 * limit on things *under* (ie. contained by)
632 632 * the thing they own.
633 633 */
634 634 if (dsl_prop_get_integer(dsname, "zoned", &zoned,
635 635 setpoint))
636 636 return (SET_ERROR(EPERM));
637 637 if (!zoned || strlen(dsname) <= strlen(setpoint))
638 638 return (SET_ERROR(EPERM));
639 639 }
640 640 break;
641 641
642 642 case ZFS_PROP_MLSLABEL:
643 643 if (!is_system_labeled())
644 644 return (SET_ERROR(EPERM));
645 645
646 646 if (nvpair_value_string(propval, &strval) == 0) {
647 647 int err;
648 648
649 649 err = zfs_set_slabel_policy(dsname, strval, CRED());
650 650 if (err != 0)
651 651 return (err);
652 652 }
653 653 break;
654 654 }
655 655
656 656 return (zfs_secpolicy_write_perms(dsname, zfs_prop_to_name(prop), cr));
657 657 }
658 658
659 659 /* ARGSUSED */
660 660 static int
661 661 zfs_secpolicy_set_fsacl(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
662 662 {
663 663 int error;
664 664
665 665 error = zfs_dozonecheck(zc->zc_name, cr);
666 666 if (error != 0)
667 667 return (error);
668 668
669 669 /*
670 670 * permission to set permissions will be evaluated later in
671 671 * dsl_deleg_can_allow()
672 672 */
673 673 return (0);
674 674 }
675 675
676 676 /* ARGSUSED */
677 677 static int
678 678 zfs_secpolicy_rollback(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
679 679 {
680 680 return (zfs_secpolicy_write_perms(zc->zc_name,
681 681 ZFS_DELEG_PERM_ROLLBACK, cr));
682 682 }
683 683
684 684 /* ARGSUSED */
685 685 static int
686 686 zfs_secpolicy_send(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
687 687 {
688 688 dsl_pool_t *dp;
689 689 dsl_dataset_t *ds;
690 690 char *cp;
691 691 int error;
692 692
693 693 /*
694 694 * Generate the current snapshot name from the given objsetid, then
695 695 * use that name for the secpolicy/zone checks.
696 696 */
697 697 cp = strchr(zc->zc_name, '@');
698 698 if (cp == NULL)
699 699 return (SET_ERROR(EINVAL));
700 700 error = dsl_pool_hold(zc->zc_name, FTAG, &dp);
701 701 if (error != 0)
702 702 return (error);
703 703
704 704 error = dsl_dataset_hold_obj(dp, zc->zc_sendobj, FTAG, &ds);
705 705 if (error != 0) {
706 706 dsl_pool_rele(dp, FTAG);
707 707 return (error);
708 708 }
709 709
710 710 dsl_dataset_name(ds, zc->zc_name);
711 711
712 712 error = zfs_secpolicy_write_perms_ds(zc->zc_name, ds,
713 713 ZFS_DELEG_PERM_SEND, cr);
714 714 dsl_dataset_rele(ds, FTAG);
715 715 dsl_pool_rele(dp, FTAG);
716 716
717 717 return (error);
718 718 }
719 719
720 720 /* ARGSUSED */
721 721 static int
722 722 zfs_secpolicy_send_new(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
723 723 {
724 724 return (zfs_secpolicy_write_perms(zc->zc_name,
725 725 ZFS_DELEG_PERM_SEND, cr));
726 726 }
727 727
728 728 /* ARGSUSED */
729 729 static int
730 730 zfs_secpolicy_deleg_share(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
731 731 {
732 732 vnode_t *vp;
733 733 int error;
734 734
735 735 if ((error = lookupname(zc->zc_value, UIO_SYSSPACE,
736 736 NO_FOLLOW, NULL, &vp)) != 0)
737 737 return (error);
738 738
739 739 /* Now make sure mntpnt and dataset are ZFS */
740 740
741 741 if (vp->v_vfsp->vfs_fstype != zfsfstype ||
742 742 (strcmp((char *)refstr_value(vp->v_vfsp->vfs_resource),
743 743 zc->zc_name) != 0)) {
744 744 VN_RELE(vp);
745 745 return (SET_ERROR(EPERM));
746 746 }
747 747
748 748 VN_RELE(vp);
749 749 return (dsl_deleg_access(zc->zc_name,
750 750 ZFS_DELEG_PERM_SHARE, cr));
751 751 }
752 752
753 753 int
754 754 zfs_secpolicy_share(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
755 755 {
756 756 if (!INGLOBALZONE(curproc))
757 757 return (SET_ERROR(EPERM));
758 758
759 759 if (secpolicy_nfs(cr) == 0) {
760 760 return (0);
761 761 } else {
762 762 return (zfs_secpolicy_deleg_share(zc, innvl, cr));
763 763 }
764 764 }
765 765
766 766 int
767 767 zfs_secpolicy_smb_acl(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
768 768 {
769 769 if (!INGLOBALZONE(curproc))
770 770 return (SET_ERROR(EPERM));
771 771
772 772 if (secpolicy_smb(cr) == 0) {
773 773 return (0);
774 774 } else {
775 775 return (zfs_secpolicy_deleg_share(zc, innvl, cr));
776 776 }
777 777 }
778 778
779 779 static int
780 780 zfs_get_parent(const char *datasetname, char *parent, int parentsize)
781 781 {
782 782 char *cp;
783 783
784 784 /*
785 785 * Remove the @bla or /bla from the end of the name to get the parent.
786 786 */
787 787 (void) strncpy(parent, datasetname, parentsize);
788 788 cp = strrchr(parent, '@');
789 789 if (cp != NULL) {
790 790 cp[0] = '\0';
791 791 } else {
792 792 cp = strrchr(parent, '/');
793 793 if (cp == NULL)
794 794 return (SET_ERROR(ENOENT));
795 795 cp[0] = '\0';
796 796 }
797 797
798 798 return (0);
799 799 }
800 800
801 801 int
802 802 zfs_secpolicy_destroy_perms(const char *name, cred_t *cr)
803 803 {
804 804 int error;
805 805
806 806 if ((error = zfs_secpolicy_write_perms(name,
807 807 ZFS_DELEG_PERM_MOUNT, cr)) != 0)
808 808 return (error);
809 809
810 810 return (zfs_secpolicy_write_perms(name, ZFS_DELEG_PERM_DESTROY, cr));
811 811 }
812 812
813 813 /* ARGSUSED */
814 814 static int
815 815 zfs_secpolicy_destroy(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
816 816 {
817 817 return (zfs_secpolicy_destroy_perms(zc->zc_name, cr));
818 818 }
819 819
820 820 /*
821 821 * Destroying snapshots with delegated permissions requires
822 822 * descendant mount and destroy permissions.
823 823 */
824 824 /* ARGSUSED */
825 825 static int
826 826 zfs_secpolicy_destroy_snaps(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
827 827 {
828 828 nvlist_t *snaps;
829 829 nvpair_t *pair, *nextpair;
830 830 int error = 0;
831 831
832 832 if (nvlist_lookup_nvlist(innvl, "snaps", &snaps) != 0)
833 833 return (SET_ERROR(EINVAL));
834 834 for (pair = nvlist_next_nvpair(snaps, NULL); pair != NULL;
835 835 pair = nextpair) {
836 836 nextpair = nvlist_next_nvpair(snaps, pair);
837 837 error = zfs_secpolicy_destroy_perms(nvpair_name(pair), cr);
838 838 if (error == ENOENT) {
839 839 /*
840 840 * Ignore any snapshots that don't exist (we consider
841 841 * them "already destroyed"). Remove the name from the
842 842 * nvl here in case the snapshot is created between
843 843 * now and when we try to destroy it (in which case
844 844 * we don't want to destroy it since we haven't
845 845 * checked for permission).
846 846 */
847 847 fnvlist_remove_nvpair(snaps, pair);
848 848 error = 0;
849 849 }
850 850 if (error != 0)
851 851 break;
852 852 }
853 853
854 854 return (error);
855 855 }
856 856
857 857 int
858 858 zfs_secpolicy_rename_perms(const char *from, const char *to, cred_t *cr)
859 859 {
860 860 char parentname[MAXNAMELEN];
861 861 int error;
862 862
863 863 if ((error = zfs_secpolicy_write_perms(from,
864 864 ZFS_DELEG_PERM_RENAME, cr)) != 0)
865 865 return (error);
866 866
867 867 if ((error = zfs_secpolicy_write_perms(from,
868 868 ZFS_DELEG_PERM_MOUNT, cr)) != 0)
869 869 return (error);
870 870
871 871 if ((error = zfs_get_parent(to, parentname,
872 872 sizeof (parentname))) != 0)
873 873 return (error);
874 874
875 875 if ((error = zfs_secpolicy_write_perms(parentname,
876 876 ZFS_DELEG_PERM_CREATE, cr)) != 0)
877 877 return (error);
878 878
879 879 if ((error = zfs_secpolicy_write_perms(parentname,
880 880 ZFS_DELEG_PERM_MOUNT, cr)) != 0)
881 881 return (error);
882 882
883 883 return (error);
884 884 }
885 885
886 886 /* ARGSUSED */
887 887 static int
888 888 zfs_secpolicy_rename(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
889 889 {
890 890 return (zfs_secpolicy_rename_perms(zc->zc_name, zc->zc_value, cr));
891 891 }
892 892
893 893 /* ARGSUSED */
894 894 static int
895 895 zfs_secpolicy_promote(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
896 896 {
897 897 dsl_pool_t *dp;
898 898 dsl_dataset_t *clone;
899 899 int error;
900 900
901 901 error = zfs_secpolicy_write_perms(zc->zc_name,
902 902 ZFS_DELEG_PERM_PROMOTE, cr);
903 903 if (error != 0)
904 904 return (error);
905 905
906 906 error = dsl_pool_hold(zc->zc_name, FTAG, &dp);
907 907 if (error != 0)
908 908 return (error);
909 909
910 910 error = dsl_dataset_hold(dp, zc->zc_name, FTAG, &clone);
911 911
912 912 if (error == 0) {
913 913 char parentname[MAXNAMELEN];
914 914 dsl_dataset_t *origin = NULL;
915 915 dsl_dir_t *dd;
916 916 dd = clone->ds_dir;
917 917
918 918 error = dsl_dataset_hold_obj(dd->dd_pool,
919 919 dsl_dir_phys(dd)->dd_origin_obj, FTAG, &origin);
920 920 if (error != 0) {
921 921 dsl_dataset_rele(clone, FTAG);
922 922 dsl_pool_rele(dp, FTAG);
923 923 return (error);
924 924 }
925 925
926 926 error = zfs_secpolicy_write_perms_ds(zc->zc_name, clone,
927 927 ZFS_DELEG_PERM_MOUNT, cr);
928 928
929 929 dsl_dataset_name(origin, parentname);
930 930 if (error == 0) {
931 931 error = zfs_secpolicy_write_perms_ds(parentname, origin,
932 932 ZFS_DELEG_PERM_PROMOTE, cr);
933 933 }
934 934 dsl_dataset_rele(clone, FTAG);
935 935 dsl_dataset_rele(origin, FTAG);
936 936 }
937 937 dsl_pool_rele(dp, FTAG);
938 938 return (error);
939 939 }
940 940
941 941 /* ARGSUSED */
942 942 static int
943 943 zfs_secpolicy_recv(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
944 944 {
945 945 int error;
946 946
947 947 if ((error = zfs_secpolicy_write_perms(zc->zc_name,
948 948 ZFS_DELEG_PERM_RECEIVE, cr)) != 0)
949 949 return (error);
950 950
951 951 if ((error = zfs_secpolicy_write_perms(zc->zc_name,
952 952 ZFS_DELEG_PERM_MOUNT, cr)) != 0)
953 953 return (error);
954 954
955 955 return (zfs_secpolicy_write_perms(zc->zc_name,
956 956 ZFS_DELEG_PERM_CREATE, cr));
957 957 }
958 958
959 959 int
960 960 zfs_secpolicy_snapshot_perms(const char *name, cred_t *cr)
961 961 {
962 962 return (zfs_secpolicy_write_perms(name,
963 963 ZFS_DELEG_PERM_SNAPSHOT, cr));
964 964 }
965 965
966 966 /*
967 967 * Check for permission to create each snapshot in the nvlist.
968 968 */
969 969 /* ARGSUSED */
970 970 static int
971 971 zfs_secpolicy_snapshot(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
972 972 {
973 973 nvlist_t *snaps;
974 974 int error = 0;
975 975 nvpair_t *pair;
976 976
977 977 if (nvlist_lookup_nvlist(innvl, "snaps", &snaps) != 0)
978 978 return (SET_ERROR(EINVAL));
979 979 for (pair = nvlist_next_nvpair(snaps, NULL); pair != NULL;
980 980 pair = nvlist_next_nvpair(snaps, pair)) {
981 981 char *name = nvpair_name(pair);
982 982 char *atp = strchr(name, '@');
983 983
984 984 if (atp == NULL) {
985 985 error = SET_ERROR(EINVAL);
986 986 break;
987 987 }
988 988 *atp = '\0';
989 989 error = zfs_secpolicy_snapshot_perms(name, cr);
990 990 *atp = '@';
991 991 if (error != 0)
992 992 break;
993 993 }
994 994 return (error);
995 995 }
996 996
997 997 /*
998 998 * Check for permission to create each snapshot in the nvlist.
999 999 */
1000 1000 /* ARGSUSED */
1001 1001 static int
1002 1002 zfs_secpolicy_bookmark(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
1003 1003 {
1004 1004 int error = 0;
1005 1005
1006 1006 for (nvpair_t *pair = nvlist_next_nvpair(innvl, NULL);
1007 1007 pair != NULL; pair = nvlist_next_nvpair(innvl, pair)) {
1008 1008 char *name = nvpair_name(pair);
1009 1009 char *hashp = strchr(name, '#');
1010 1010
1011 1011 if (hashp == NULL) {
1012 1012 error = SET_ERROR(EINVAL);
1013 1013 break;
1014 1014 }
1015 1015 *hashp = '\0';
1016 1016 error = zfs_secpolicy_write_perms(name,
1017 1017 ZFS_DELEG_PERM_BOOKMARK, cr);
1018 1018 *hashp = '#';
1019 1019 if (error != 0)
1020 1020 break;
1021 1021 }
1022 1022 return (error);
1023 1023 }
1024 1024
1025 1025 /* ARGSUSED */
1026 1026 static int
1027 1027 zfs_secpolicy_destroy_bookmarks(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
1028 1028 {
1029 1029 nvpair_t *pair, *nextpair;
1030 1030 int error = 0;
1031 1031
1032 1032 for (pair = nvlist_next_nvpair(innvl, NULL); pair != NULL;
1033 1033 pair = nextpair) {
1034 1034 char *name = nvpair_name(pair);
1035 1035 char *hashp = strchr(name, '#');
1036 1036 nextpair = nvlist_next_nvpair(innvl, pair);
1037 1037
1038 1038 if (hashp == NULL) {
1039 1039 error = SET_ERROR(EINVAL);
1040 1040 break;
1041 1041 }
1042 1042
1043 1043 *hashp = '\0';
1044 1044 error = zfs_secpolicy_write_perms(name,
1045 1045 ZFS_DELEG_PERM_DESTROY, cr);
1046 1046 *hashp = '#';
1047 1047 if (error == ENOENT) {
1048 1048 /*
1049 1049 * Ignore any filesystems that don't exist (we consider
1050 1050 * their bookmarks "already destroyed"). Remove
1051 1051 * the name from the nvl here in case the filesystem
1052 1052 * is created between now and when we try to destroy
1053 1053 * the bookmark (in which case we don't want to
1054 1054 * destroy it since we haven't checked for permission).
1055 1055 */
1056 1056 fnvlist_remove_nvpair(innvl, pair);
1057 1057 error = 0;
1058 1058 }
1059 1059 if (error != 0)
1060 1060 break;
1061 1061 }
1062 1062
1063 1063 return (error);
1064 1064 }
1065 1065
1066 1066 /* ARGSUSED */
1067 1067 static int
1068 1068 zfs_secpolicy_log_history(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
1069 1069 {
1070 1070 /*
1071 1071 * Even root must have a proper TSD so that we know what pool
1072 1072 * to log to.
1073 1073 */
1074 1074 if (tsd_get(zfs_allow_log_key) == NULL)
1075 1075 return (SET_ERROR(EPERM));
1076 1076 return (0);
1077 1077 }
1078 1078
1079 1079 static int
1080 1080 zfs_secpolicy_create_clone(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
1081 1081 {
1082 1082 char parentname[MAXNAMELEN];
1083 1083 int error;
1084 1084 char *origin;
1085 1085
1086 1086 if ((error = zfs_get_parent(zc->zc_name, parentname,
1087 1087 sizeof (parentname))) != 0)
1088 1088 return (error);
1089 1089
1090 1090 if (nvlist_lookup_string(innvl, "origin", &origin) == 0 &&
1091 1091 (error = zfs_secpolicy_write_perms(origin,
1092 1092 ZFS_DELEG_PERM_CLONE, cr)) != 0)
1093 1093 return (error);
1094 1094
1095 1095 if ((error = zfs_secpolicy_write_perms(parentname,
1096 1096 ZFS_DELEG_PERM_CREATE, cr)) != 0)
1097 1097 return (error);
1098 1098
1099 1099 return (zfs_secpolicy_write_perms(parentname,
1100 1100 ZFS_DELEG_PERM_MOUNT, cr));
1101 1101 }
1102 1102
1103 1103 /*
1104 1104 * Policy for pool operations - create/destroy pools, add vdevs, etc. Requires
1105 1105 * SYS_CONFIG privilege, which is not available in a local zone.
1106 1106 */
1107 1107 /* ARGSUSED */
1108 1108 static int
1109 1109 zfs_secpolicy_config(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
1110 1110 {
1111 1111 if (secpolicy_sys_config(cr, B_FALSE) != 0)
1112 1112 return (SET_ERROR(EPERM));
1113 1113
1114 1114 return (0);
1115 1115 }
1116 1116
1117 1117 /*
1118 1118 * Policy for object to name lookups.
1119 1119 */
1120 1120 /* ARGSUSED */
1121 1121 static int
1122 1122 zfs_secpolicy_diff(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
1123 1123 {
1124 1124 int error;
1125 1125
1126 1126 if ((error = secpolicy_sys_config(cr, B_FALSE)) == 0)
1127 1127 return (0);
1128 1128
1129 1129 error = zfs_secpolicy_write_perms(zc->zc_name, ZFS_DELEG_PERM_DIFF, cr);
1130 1130 return (error);
1131 1131 }
1132 1132
1133 1133 /*
1134 1134 * Policy for fault injection. Requires all privileges.
1135 1135 */
1136 1136 /* ARGSUSED */
1137 1137 static int
1138 1138 zfs_secpolicy_inject(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
1139 1139 {
1140 1140 return (secpolicy_zinject(cr));
1141 1141 }
1142 1142
1143 1143 /* ARGSUSED */
1144 1144 static int
1145 1145 zfs_secpolicy_inherit_prop(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
1146 1146 {
1147 1147 zfs_prop_t prop = zfs_name_to_prop(zc->zc_value);
1148 1148
1149 1149 if (prop == ZPROP_INVAL) {
1150 1150 if (!zfs_prop_user(zc->zc_value))
1151 1151 return (SET_ERROR(EINVAL));
1152 1152 return (zfs_secpolicy_write_perms(zc->zc_name,
1153 1153 ZFS_DELEG_PERM_USERPROP, cr));
1154 1154 } else {
1155 1155 return (zfs_secpolicy_setprop(zc->zc_name, prop,
1156 1156 NULL, cr));
1157 1157 }
1158 1158 }
1159 1159
1160 1160 static int
1161 1161 zfs_secpolicy_userspace_one(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
1162 1162 {
1163 1163 int err = zfs_secpolicy_read(zc, innvl, cr);
1164 1164 if (err)
1165 1165 return (err);
1166 1166
1167 1167 if (zc->zc_objset_type >= ZFS_NUM_USERQUOTA_PROPS)
1168 1168 return (SET_ERROR(EINVAL));
1169 1169
1170 1170 if (zc->zc_value[0] == 0) {
1171 1171 /*
1172 1172 * They are asking about a posix uid/gid. If it's
1173 1173 * themself, allow it.
1174 1174 */
1175 1175 if (zc->zc_objset_type == ZFS_PROP_USERUSED ||
1176 1176 zc->zc_objset_type == ZFS_PROP_USERQUOTA) {
1177 1177 if (zc->zc_guid == crgetuid(cr))
1178 1178 return (0);
1179 1179 } else {
1180 1180 if (groupmember(zc->zc_guid, cr))
1181 1181 return (0);
1182 1182 }
1183 1183 }
1184 1184
1185 1185 return (zfs_secpolicy_write_perms(zc->zc_name,
1186 1186 userquota_perms[zc->zc_objset_type], cr));
1187 1187 }
1188 1188
1189 1189 static int
1190 1190 zfs_secpolicy_userspace_many(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
1191 1191 {
1192 1192 int err = zfs_secpolicy_read(zc, innvl, cr);
1193 1193 if (err)
1194 1194 return (err);
1195 1195
1196 1196 if (zc->zc_objset_type >= ZFS_NUM_USERQUOTA_PROPS)
1197 1197 return (SET_ERROR(EINVAL));
1198 1198
1199 1199 return (zfs_secpolicy_write_perms(zc->zc_name,
1200 1200 userquota_perms[zc->zc_objset_type], cr));
1201 1201 }
1202 1202
1203 1203 /* ARGSUSED */
1204 1204 static int
1205 1205 zfs_secpolicy_userspace_upgrade(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
1206 1206 {
1207 1207 return (zfs_secpolicy_setprop(zc->zc_name, ZFS_PROP_VERSION,
1208 1208 NULL, cr));
1209 1209 }
1210 1210
1211 1211 /* ARGSUSED */
1212 1212 static int
1213 1213 zfs_secpolicy_hold(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
1214 1214 {
1215 1215 nvpair_t *pair;
1216 1216 nvlist_t *holds;
1217 1217 int error;
1218 1218
1219 1219 error = nvlist_lookup_nvlist(innvl, "holds", &holds);
1220 1220 if (error != 0)
1221 1221 return (SET_ERROR(EINVAL));
1222 1222
1223 1223 for (pair = nvlist_next_nvpair(holds, NULL); pair != NULL;
1224 1224 pair = nvlist_next_nvpair(holds, pair)) {
1225 1225 char fsname[MAXNAMELEN];
1226 1226 error = dmu_fsname(nvpair_name(pair), fsname);
1227 1227 if (error != 0)
1228 1228 return (error);
1229 1229 error = zfs_secpolicy_write_perms(fsname,
1230 1230 ZFS_DELEG_PERM_HOLD, cr);
1231 1231 if (error != 0)
1232 1232 return (error);
1233 1233 }
1234 1234 return (0);
1235 1235 }
1236 1236
1237 1237 /* ARGSUSED */
1238 1238 static int
1239 1239 zfs_secpolicy_release(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
1240 1240 {
1241 1241 nvpair_t *pair;
1242 1242 int error;
1243 1243
1244 1244 for (pair = nvlist_next_nvpair(innvl, NULL); pair != NULL;
1245 1245 pair = nvlist_next_nvpair(innvl, pair)) {
1246 1246 char fsname[MAXNAMELEN];
1247 1247 error = dmu_fsname(nvpair_name(pair), fsname);
1248 1248 if (error != 0)
1249 1249 return (error);
1250 1250 error = zfs_secpolicy_write_perms(fsname,
1251 1251 ZFS_DELEG_PERM_RELEASE, cr);
1252 1252 if (error != 0)
1253 1253 return (error);
1254 1254 }
1255 1255 return (0);
1256 1256 }
1257 1257
1258 1258 /*
1259 1259 * Policy for allowing temporary snapshots to be taken or released
1260 1260 */
1261 1261 static int
1262 1262 zfs_secpolicy_tmp_snapshot(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
1263 1263 {
1264 1264 /*
1265 1265 * A temporary snapshot is the same as a snapshot,
1266 1266 * hold, destroy and release all rolled into one.
1267 1267 * Delegated diff alone is sufficient that we allow this.
1268 1268 */
1269 1269 int error;
1270 1270
1271 1271 if ((error = zfs_secpolicy_write_perms(zc->zc_name,
1272 1272 ZFS_DELEG_PERM_DIFF, cr)) == 0)
1273 1273 return (0);
1274 1274
1275 1275 error = zfs_secpolicy_snapshot_perms(zc->zc_name, cr);
1276 1276 if (error == 0)
1277 1277 error = zfs_secpolicy_hold(zc, innvl, cr);
1278 1278 if (error == 0)
1279 1279 error = zfs_secpolicy_release(zc, innvl, cr);
1280 1280 if (error == 0)
1281 1281 error = zfs_secpolicy_destroy(zc, innvl, cr);
1282 1282 return (error);
1283 1283 }
1284 1284
1285 1285 /*
1286 1286 * Returns the nvlist as specified by the user in the zfs_cmd_t.
1287 1287 */
1288 1288 static int
1289 1289 get_nvlist(uint64_t nvl, uint64_t size, int iflag, nvlist_t **nvp)
1290 1290 {
1291 1291 char *packed;
1292 1292 int error;
1293 1293 nvlist_t *list = NULL;
1294 1294
1295 1295 /*
1296 1296 * Read in and unpack the user-supplied nvlist.
1297 1297 */
1298 1298 if (size == 0)
1299 1299 return (SET_ERROR(EINVAL));
1300 1300
1301 1301 packed = kmem_alloc(size, KM_SLEEP);
1302 1302
1303 1303 if ((error = ddi_copyin((void *)(uintptr_t)nvl, packed, size,
1304 1304 iflag)) != 0) {
1305 1305 kmem_free(packed, size);
1306 1306 return (SET_ERROR(EFAULT));
1307 1307 }
1308 1308
1309 1309 if ((error = nvlist_unpack(packed, size, &list, 0)) != 0) {
1310 1310 kmem_free(packed, size);
1311 1311 return (error);
1312 1312 }
1313 1313
1314 1314 kmem_free(packed, size);
1315 1315
1316 1316 *nvp = list;
1317 1317 return (0);
1318 1318 }
1319 1319
1320 1320 /*
1321 1321 * Reduce the size of this nvlist until it can be serialized in 'max' bytes.
1322 1322 * Entries will be removed from the end of the nvlist, and one int32 entry
1323 1323 * named "N_MORE_ERRORS" will be added indicating how many entries were
1324 1324 * removed.
1325 1325 */
1326 1326 static int
1327 1327 nvlist_smush(nvlist_t *errors, size_t max)
1328 1328 {
1329 1329 size_t size;
1330 1330
1331 1331 size = fnvlist_size(errors);
1332 1332
1333 1333 if (size > max) {
1334 1334 nvpair_t *more_errors;
1335 1335 int n = 0;
1336 1336
1337 1337 if (max < 1024)
1338 1338 return (SET_ERROR(ENOMEM));
1339 1339
1340 1340 fnvlist_add_int32(errors, ZPROP_N_MORE_ERRORS, 0);
1341 1341 more_errors = nvlist_prev_nvpair(errors, NULL);
1342 1342
1343 1343 do {
1344 1344 nvpair_t *pair = nvlist_prev_nvpair(errors,
1345 1345 more_errors);
1346 1346 fnvlist_remove_nvpair(errors, pair);
1347 1347 n++;
1348 1348 size = fnvlist_size(errors);
1349 1349 } while (size > max);
1350 1350
1351 1351 fnvlist_remove_nvpair(errors, more_errors);
1352 1352 fnvlist_add_int32(errors, ZPROP_N_MORE_ERRORS, n);
1353 1353 ASSERT3U(fnvlist_size(errors), <=, max);
1354 1354 }
1355 1355
1356 1356 return (0);
1357 1357 }
1358 1358
1359 1359 static int
1360 1360 put_nvlist(zfs_cmd_t *zc, nvlist_t *nvl)
1361 1361 {
1362 1362 char *packed = NULL;
1363 1363 int error = 0;
1364 1364 size_t size;
1365 1365
1366 1366 size = fnvlist_size(nvl);
1367 1367
1368 1368 if (size > zc->zc_nvlist_dst_size) {
1369 1369 error = SET_ERROR(ENOMEM);
1370 1370 } else {
1371 1371 packed = fnvlist_pack(nvl, &size);
1372 1372 if (ddi_copyout(packed, (void *)(uintptr_t)zc->zc_nvlist_dst,
1373 1373 size, zc->zc_iflags) != 0)
1374 1374 error = SET_ERROR(EFAULT);
1375 1375 fnvlist_pack_free(packed, size);
1376 1376 }
1377 1377
1378 1378 zc->zc_nvlist_dst_size = size;
1379 1379 zc->zc_nvlist_dst_filled = B_TRUE;
1380 1380 return (error);
1381 1381 }
1382 1382
1383 1383 static int
1384 1384 getzfsvfs(const char *dsname, zfsvfs_t **zfvp)
1385 1385 {
1386 1386 objset_t *os;
1387 1387 int error;
1388 1388
1389 1389 error = dmu_objset_hold(dsname, FTAG, &os);
1390 1390 if (error != 0)
1391 1391 return (error);
1392 1392 if (dmu_objset_type(os) != DMU_OST_ZFS) {
1393 1393 dmu_objset_rele(os, FTAG);
1394 1394 return (SET_ERROR(EINVAL));
1395 1395 }
1396 1396
1397 1397 mutex_enter(&os->os_user_ptr_lock);
1398 1398 *zfvp = dmu_objset_get_user(os);
1399 1399 if (*zfvp) {
1400 1400 VFS_HOLD((*zfvp)->z_vfs);
1401 1401 } else {
1402 1402 error = SET_ERROR(ESRCH);
1403 1403 }
1404 1404 mutex_exit(&os->os_user_ptr_lock);
1405 1405 dmu_objset_rele(os, FTAG);
1406 1406 return (error);
1407 1407 }
1408 1408
1409 1409 /*
1410 1410 * Find a zfsvfs_t for a mounted filesystem, or create our own, in which
1411 1411 * case its z_vfs will be NULL, and it will be opened as the owner.
1412 1412 * If 'writer' is set, the z_teardown_lock will be held for RW_WRITER,
1413 1413 * which prevents all vnode ops from running.
1414 1414 */
1415 1415 static int
1416 1416 zfsvfs_hold(const char *name, void *tag, zfsvfs_t **zfvp, boolean_t writer)
1417 1417 {
1418 1418 int error = 0;
1419 1419
1420 1420 if (getzfsvfs(name, zfvp) != 0)
1421 1421 error = zfsvfs_create(name, zfvp);
1422 1422 if (error == 0) {
1423 1423 rrm_enter(&(*zfvp)->z_teardown_lock, (writer) ? RW_WRITER :
1424 1424 RW_READER, tag);
1425 1425 if ((*zfvp)->z_unmounted) {
1426 1426 /*
1427 1427 * XXX we could probably try again, since the unmounting
1428 1428 * thread should be just about to disassociate the
1429 1429 * objset from the zfsvfs.
1430 1430 */
1431 1431 rrm_exit(&(*zfvp)->z_teardown_lock, tag);
1432 1432 return (SET_ERROR(EBUSY));
1433 1433 }
1434 1434 }
1435 1435 return (error);
1436 1436 }
1437 1437
1438 1438 static void
1439 1439 zfsvfs_rele(zfsvfs_t *zfsvfs, void *tag)
1440 1440 {
1441 1441 rrm_exit(&zfsvfs->z_teardown_lock, tag);
1442 1442
1443 1443 if (zfsvfs->z_vfs) {
1444 1444 VFS_RELE(zfsvfs->z_vfs);
1445 1445 } else {
1446 1446 dmu_objset_disown(zfsvfs->z_os, zfsvfs);
1447 1447 zfsvfs_free(zfsvfs);
1448 1448 }
1449 1449 }
1450 1450
1451 1451 static int
1452 1452 zfs_ioc_pool_create(zfs_cmd_t *zc)
1453 1453 {
1454 1454 int error;
1455 1455 nvlist_t *config, *props = NULL;
1456 1456 nvlist_t *rootprops = NULL;
1457 1457 nvlist_t *zplprops = NULL;
1458 1458
1459 1459 if (error = get_nvlist(zc->zc_nvlist_conf, zc->zc_nvlist_conf_size,
1460 1460 zc->zc_iflags, &config))
1461 1461 return (error);
1462 1462
1463 1463 if (zc->zc_nvlist_src_size != 0 && (error =
1464 1464 get_nvlist(zc->zc_nvlist_src, zc->zc_nvlist_src_size,
1465 1465 zc->zc_iflags, &props))) {
1466 1466 nvlist_free(config);
1467 1467 return (error);
1468 1468 }
1469 1469
1470 1470 if (props) {
1471 1471 nvlist_t *nvl = NULL;
1472 1472 uint64_t version = SPA_VERSION;
1473 1473
1474 1474 (void) nvlist_lookup_uint64(props,
1475 1475 zpool_prop_to_name(ZPOOL_PROP_VERSION), &version);
1476 1476 if (!SPA_VERSION_IS_SUPPORTED(version)) {
1477 1477 error = SET_ERROR(EINVAL);
1478 1478 goto pool_props_bad;
1479 1479 }
1480 1480 (void) nvlist_lookup_nvlist(props, ZPOOL_ROOTFS_PROPS, &nvl);
1481 1481 if (nvl) {
1482 1482 error = nvlist_dup(nvl, &rootprops, KM_SLEEP);
1483 1483 if (error != 0) {
1484 1484 nvlist_free(config);
1485 1485 nvlist_free(props);
1486 1486 return (error);
1487 1487 }
1488 1488 (void) nvlist_remove_all(props, ZPOOL_ROOTFS_PROPS);
1489 1489 }
1490 1490 VERIFY(nvlist_alloc(&zplprops, NV_UNIQUE_NAME, KM_SLEEP) == 0);
1491 1491 error = zfs_fill_zplprops_root(version, rootprops,
1492 1492 zplprops, NULL);
1493 1493 if (error != 0)
1494 1494 goto pool_props_bad;
1495 1495 }
1496 1496
1497 1497 error = spa_create(zc->zc_name, config, props, zplprops);
1498 1498
1499 1499 /*
1500 1500 * Set the remaining root properties
1501 1501 */
1502 1502 if (!error && (error = zfs_set_prop_nvlist(zc->zc_name,
1503 1503 ZPROP_SRC_LOCAL, rootprops, NULL)) != 0)
1504 1504 (void) spa_destroy(zc->zc_name);
1505 1505
1506 1506 pool_props_bad:
1507 1507 nvlist_free(rootprops);
1508 1508 nvlist_free(zplprops);
1509 1509 nvlist_free(config);
1510 1510 nvlist_free(props);
1511 1511
1512 1512 return (error);
1513 1513 }
1514 1514
1515 1515 static int
1516 1516 zfs_ioc_pool_destroy(zfs_cmd_t *zc)
1517 1517 {
1518 1518 int error;
1519 1519 zfs_log_history(zc);
1520 1520 error = spa_destroy(zc->zc_name);
1521 1521 if (error == 0)
1522 1522 zvol_remove_minors(zc->zc_name);
1523 1523 return (error);
1524 1524 }
1525 1525
1526 1526 static int
1527 1527 zfs_ioc_pool_import(zfs_cmd_t *zc)
1528 1528 {
1529 1529 nvlist_t *config, *props = NULL;
1530 1530 uint64_t guid;
1531 1531 int error;
1532 1532
1533 1533 if ((error = get_nvlist(zc->zc_nvlist_conf, zc->zc_nvlist_conf_size,
1534 1534 zc->zc_iflags, &config)) != 0)
1535 1535 return (error);
1536 1536
1537 1537 if (zc->zc_nvlist_src_size != 0 && (error =
1538 1538 get_nvlist(zc->zc_nvlist_src, zc->zc_nvlist_src_size,
1539 1539 zc->zc_iflags, &props))) {
1540 1540 nvlist_free(config);
1541 1541 return (error);
1542 1542 }
1543 1543
1544 1544 if (nvlist_lookup_uint64(config, ZPOOL_CONFIG_POOL_GUID, &guid) != 0 ||
1545 1545 guid != zc->zc_guid)
1546 1546 error = SET_ERROR(EINVAL);
1547 1547 else
1548 1548 error = spa_import(zc->zc_name, config, props, zc->zc_cookie);
1549 1549
1550 1550 if (zc->zc_nvlist_dst != 0) {
1551 1551 int err;
1552 1552
1553 1553 if ((err = put_nvlist(zc, config)) != 0)
1554 1554 error = err;
1555 1555 }
1556 1556
1557 1557 nvlist_free(config);
1558 1558
1559 1559 if (props)
1560 1560 nvlist_free(props);
1561 1561
1562 1562 return (error);
1563 1563 }
1564 1564
1565 1565 static int
1566 1566 zfs_ioc_pool_export(zfs_cmd_t *zc)
1567 1567 {
1568 1568 int error;
1569 1569 boolean_t force = (boolean_t)zc->zc_cookie;
1570 1570 boolean_t hardforce = (boolean_t)zc->zc_guid;
1571 1571
1572 1572 zfs_log_history(zc);
1573 1573 error = spa_export(zc->zc_name, NULL, force, hardforce);
1574 1574 if (error == 0)
1575 1575 zvol_remove_minors(zc->zc_name);
1576 1576 return (error);
1577 1577 }
1578 1578
1579 1579 static int
1580 1580 zfs_ioc_pool_configs(zfs_cmd_t *zc)
1581 1581 {
1582 1582 nvlist_t *configs;
1583 1583 int error;
1584 1584
1585 1585 if ((configs = spa_all_configs(&zc->zc_cookie)) == NULL)
1586 1586 return (SET_ERROR(EEXIST));
1587 1587
1588 1588 error = put_nvlist(zc, configs);
1589 1589
1590 1590 nvlist_free(configs);
1591 1591
1592 1592 return (error);
1593 1593 }
1594 1594
1595 1595 /*
1596 1596 * inputs:
1597 1597 * zc_name name of the pool
1598 1598 *
1599 1599 * outputs:
1600 1600 * zc_cookie real errno
1601 1601 * zc_nvlist_dst config nvlist
1602 1602 * zc_nvlist_dst_size size of config nvlist
1603 1603 */
1604 1604 static int
1605 1605 zfs_ioc_pool_stats(zfs_cmd_t *zc)
1606 1606 {
1607 1607 nvlist_t *config;
1608 1608 int error;
1609 1609 int ret = 0;
1610 1610
1611 1611 error = spa_get_stats(zc->zc_name, &config, zc->zc_value,
1612 1612 sizeof (zc->zc_value));
1613 1613
1614 1614 if (config != NULL) {
1615 1615 ret = put_nvlist(zc, config);
1616 1616 nvlist_free(config);
1617 1617
1618 1618 /*
1619 1619 * The config may be present even if 'error' is non-zero.
1620 1620 * In this case we return success, and preserve the real errno
1621 1621 * in 'zc_cookie'.
1622 1622 */
1623 1623 zc->zc_cookie = error;
1624 1624 } else {
1625 1625 ret = error;
1626 1626 }
1627 1627
1628 1628 return (ret);
1629 1629 }
1630 1630
1631 1631 /*
1632 1632 * Try to import the given pool, returning pool stats as appropriate so that
1633 1633 * user land knows which devices are available and overall pool health.
1634 1634 */
1635 1635 static int
1636 1636 zfs_ioc_pool_tryimport(zfs_cmd_t *zc)
1637 1637 {
1638 1638 nvlist_t *tryconfig, *config;
1639 1639 int error;
1640 1640
1641 1641 if ((error = get_nvlist(zc->zc_nvlist_conf, zc->zc_nvlist_conf_size,
1642 1642 zc->zc_iflags, &tryconfig)) != 0)
1643 1643 return (error);
1644 1644
1645 1645 config = spa_tryimport(tryconfig);
1646 1646
1647 1647 nvlist_free(tryconfig);
1648 1648
1649 1649 if (config == NULL)
1650 1650 return (SET_ERROR(EINVAL));
1651 1651
1652 1652 error = put_nvlist(zc, config);
1653 1653 nvlist_free(config);
1654 1654
1655 1655 return (error);
1656 1656 }
1657 1657
1658 1658 /*
1659 1659 * inputs:
1660 1660 * zc_name name of the pool
1661 1661 * zc_cookie scan func (pool_scan_func_t)
1662 1662 */
1663 1663 static int
1664 1664 zfs_ioc_pool_scan(zfs_cmd_t *zc)
1665 1665 {
1666 1666 spa_t *spa;
1667 1667 int error;
1668 1668
1669 1669 if ((error = spa_open(zc->zc_name, &spa, FTAG)) != 0)
1670 1670 return (error);
1671 1671
1672 1672 if (zc->zc_cookie == POOL_SCAN_NONE)
1673 1673 error = spa_scan_stop(spa);
1674 1674 else
1675 1675 error = spa_scan(spa, zc->zc_cookie);
1676 1676
1677 1677 spa_close(spa, FTAG);
1678 1678
1679 1679 return (error);
1680 1680 }
1681 1681
1682 1682 static int
1683 1683 zfs_ioc_pool_freeze(zfs_cmd_t *zc)
1684 1684 {
1685 1685 spa_t *spa;
1686 1686 int error;
1687 1687
1688 1688 error = spa_open(zc->zc_name, &spa, FTAG);
1689 1689 if (error == 0) {
1690 1690 spa_freeze(spa);
1691 1691 spa_close(spa, FTAG);
1692 1692 }
1693 1693 return (error);
1694 1694 }
1695 1695
1696 1696 static int
1697 1697 zfs_ioc_pool_upgrade(zfs_cmd_t *zc)
1698 1698 {
1699 1699 spa_t *spa;
1700 1700 int error;
1701 1701
1702 1702 if ((error = spa_open(zc->zc_name, &spa, FTAG)) != 0)
1703 1703 return (error);
1704 1704
1705 1705 if (zc->zc_cookie < spa_version(spa) ||
1706 1706 !SPA_VERSION_IS_SUPPORTED(zc->zc_cookie)) {
1707 1707 spa_close(spa, FTAG);
1708 1708 return (SET_ERROR(EINVAL));
1709 1709 }
1710 1710
1711 1711 spa_upgrade(spa, zc->zc_cookie);
1712 1712 spa_close(spa, FTAG);
1713 1713
1714 1714 return (error);
1715 1715 }
1716 1716
1717 1717 static int
1718 1718 zfs_ioc_pool_get_history(zfs_cmd_t *zc)
1719 1719 {
1720 1720 spa_t *spa;
1721 1721 char *hist_buf;
1722 1722 uint64_t size;
1723 1723 int error;
1724 1724
1725 1725 if ((size = zc->zc_history_len) == 0)
1726 1726 return (SET_ERROR(EINVAL));
1727 1727
1728 1728 if ((error = spa_open(zc->zc_name, &spa, FTAG)) != 0)
1729 1729 return (error);
1730 1730
1731 1731 if (spa_version(spa) < SPA_VERSION_ZPOOL_HISTORY) {
1732 1732 spa_close(spa, FTAG);
1733 1733 return (SET_ERROR(ENOTSUP));
1734 1734 }
1735 1735
1736 1736 hist_buf = kmem_alloc(size, KM_SLEEP);
1737 1737 if ((error = spa_history_get(spa, &zc->zc_history_offset,
1738 1738 &zc->zc_history_len, hist_buf)) == 0) {
1739 1739 error = ddi_copyout(hist_buf,
1740 1740 (void *)(uintptr_t)zc->zc_history,
1741 1741 zc->zc_history_len, zc->zc_iflags);
1742 1742 }
1743 1743
1744 1744 spa_close(spa, FTAG);
1745 1745 kmem_free(hist_buf, size);
1746 1746 return (error);
1747 1747 }
1748 1748
1749 1749 static int
1750 1750 zfs_ioc_pool_reguid(zfs_cmd_t *zc)
1751 1751 {
1752 1752 spa_t *spa;
1753 1753 int error;
1754 1754
1755 1755 error = spa_open(zc->zc_name, &spa, FTAG);
1756 1756 if (error == 0) {
1757 1757 error = spa_change_guid(spa);
1758 1758 spa_close(spa, FTAG);
1759 1759 }
1760 1760 return (error);
1761 1761 }
1762 1762
1763 1763 static int
1764 1764 zfs_ioc_dsobj_to_dsname(zfs_cmd_t *zc)
1765 1765 {
1766 1766 return (dsl_dsobj_to_dsname(zc->zc_name, zc->zc_obj, zc->zc_value));
1767 1767 }
1768 1768
1769 1769 /*
1770 1770 * inputs:
1771 1771 * zc_name name of filesystem
1772 1772 * zc_obj object to find
1773 1773 *
1774 1774 * outputs:
1775 1775 * zc_value name of object
1776 1776 */
1777 1777 static int
1778 1778 zfs_ioc_obj_to_path(zfs_cmd_t *zc)
1779 1779 {
1780 1780 objset_t *os;
1781 1781 int error;
1782 1782
1783 1783 /* XXX reading from objset not owned */
1784 1784 if ((error = dmu_objset_hold(zc->zc_name, FTAG, &os)) != 0)
1785 1785 return (error);
1786 1786 if (dmu_objset_type(os) != DMU_OST_ZFS) {
1787 1787 dmu_objset_rele(os, FTAG);
1788 1788 return (SET_ERROR(EINVAL));
1789 1789 }
1790 1790 error = zfs_obj_to_path(os, zc->zc_obj, zc->zc_value,
1791 1791 sizeof (zc->zc_value));
1792 1792 dmu_objset_rele(os, FTAG);
1793 1793
1794 1794 return (error);
1795 1795 }
1796 1796
1797 1797 /*
1798 1798 * inputs:
1799 1799 * zc_name name of filesystem
1800 1800 * zc_obj object to find
1801 1801 *
1802 1802 * outputs:
1803 1803 * zc_stat stats on object
1804 1804 * zc_value path to object
1805 1805 */
1806 1806 static int
1807 1807 zfs_ioc_obj_to_stats(zfs_cmd_t *zc)
1808 1808 {
1809 1809 objset_t *os;
1810 1810 int error;
1811 1811
1812 1812 /* XXX reading from objset not owned */
1813 1813 if ((error = dmu_objset_hold(zc->zc_name, FTAG, &os)) != 0)
1814 1814 return (error);
1815 1815 if (dmu_objset_type(os) != DMU_OST_ZFS) {
1816 1816 dmu_objset_rele(os, FTAG);
1817 1817 return (SET_ERROR(EINVAL));
1818 1818 }
1819 1819 error = zfs_obj_to_stats(os, zc->zc_obj, &zc->zc_stat, zc->zc_value,
1820 1820 sizeof (zc->zc_value));
1821 1821 dmu_objset_rele(os, FTAG);
1822 1822
1823 1823 return (error);
1824 1824 }
1825 1825
1826 1826 static int
1827 1827 zfs_ioc_vdev_add(zfs_cmd_t *zc)
1828 1828 {
1829 1829 spa_t *spa;
1830 1830 int error;
1831 1831 nvlist_t *config, **l2cache, **spares;
1832 1832 uint_t nl2cache = 0, nspares = 0;
1833 1833
1834 1834 error = spa_open(zc->zc_name, &spa, FTAG);
1835 1835 if (error != 0)
1836 1836 return (error);
1837 1837
1838 1838 error = get_nvlist(zc->zc_nvlist_conf, zc->zc_nvlist_conf_size,
1839 1839 zc->zc_iflags, &config);
1840 1840 (void) nvlist_lookup_nvlist_array(config, ZPOOL_CONFIG_L2CACHE,
1841 1841 &l2cache, &nl2cache);
1842 1842
1843 1843 (void) nvlist_lookup_nvlist_array(config, ZPOOL_CONFIG_SPARES,
1844 1844 &spares, &nspares);
1845 1845
1846 1846 /*
1847 1847 * A root pool with concatenated devices is not supported.
1848 1848 * Thus, can not add a device to a root pool.
1849 1849 *
1850 1850 * Intent log device can not be added to a rootpool because
1851 1851 * during mountroot, zil is replayed, a seperated log device
1852 1852 * can not be accessed during the mountroot time.
1853 1853 *
1854 1854 * l2cache and spare devices are ok to be added to a rootpool.
1855 1855 */
1856 1856 if (spa_bootfs(spa) != 0 && nl2cache == 0 && nspares == 0) {
1857 1857 nvlist_free(config);
1858 1858 spa_close(spa, FTAG);
1859 1859 return (SET_ERROR(EDOM));
1860 1860 }
1861 1861
1862 1862 if (error == 0) {
1863 1863 error = spa_vdev_add(spa, config);
1864 1864 nvlist_free(config);
1865 1865 }
1866 1866 spa_close(spa, FTAG);
1867 1867 return (error);
1868 1868 }
1869 1869
1870 1870 /*
1871 1871 * inputs:
1872 1872 * zc_name name of the pool
1873 1873 * zc_nvlist_conf nvlist of devices to remove
1874 1874 * zc_cookie to stop the remove?
1875 1875 */
1876 1876 static int
1877 1877 zfs_ioc_vdev_remove(zfs_cmd_t *zc)
1878 1878 {
1879 1879 spa_t *spa;
1880 1880 int error;
1881 1881
1882 1882 error = spa_open(zc->zc_name, &spa, FTAG);
1883 1883 if (error != 0)
1884 1884 return (error);
1885 1885 error = spa_vdev_remove(spa, zc->zc_guid, B_FALSE);
1886 1886 spa_close(spa, FTAG);
1887 1887 return (error);
1888 1888 }
1889 1889
1890 1890 static int
1891 1891 zfs_ioc_vdev_set_state(zfs_cmd_t *zc)
1892 1892 {
1893 1893 spa_t *spa;
1894 1894 int error;
1895 1895 vdev_state_t newstate = VDEV_STATE_UNKNOWN;
1896 1896
1897 1897 if ((error = spa_open(zc->zc_name, &spa, FTAG)) != 0)
1898 1898 return (error);
1899 1899 switch (zc->zc_cookie) {
1900 1900 case VDEV_STATE_ONLINE:
1901 1901 error = vdev_online(spa, zc->zc_guid, zc->zc_obj, &newstate);
1902 1902 break;
1903 1903
1904 1904 case VDEV_STATE_OFFLINE:
1905 1905 error = vdev_offline(spa, zc->zc_guid, zc->zc_obj);
1906 1906 break;
1907 1907
1908 1908 case VDEV_STATE_FAULTED:
1909 1909 if (zc->zc_obj != VDEV_AUX_ERR_EXCEEDED &&
1910 1910 zc->zc_obj != VDEV_AUX_EXTERNAL)
1911 1911 zc->zc_obj = VDEV_AUX_ERR_EXCEEDED;
1912 1912
1913 1913 error = vdev_fault(spa, zc->zc_guid, zc->zc_obj);
1914 1914 break;
1915 1915
1916 1916 case VDEV_STATE_DEGRADED:
1917 1917 if (zc->zc_obj != VDEV_AUX_ERR_EXCEEDED &&
1918 1918 zc->zc_obj != VDEV_AUX_EXTERNAL)
1919 1919 zc->zc_obj = VDEV_AUX_ERR_EXCEEDED;
1920 1920
1921 1921 error = vdev_degrade(spa, zc->zc_guid, zc->zc_obj);
1922 1922 break;
1923 1923
1924 1924 default:
1925 1925 error = SET_ERROR(EINVAL);
1926 1926 }
1927 1927 zc->zc_cookie = newstate;
1928 1928 spa_close(spa, FTAG);
1929 1929 return (error);
1930 1930 }
1931 1931
1932 1932 static int
1933 1933 zfs_ioc_vdev_attach(zfs_cmd_t *zc)
1934 1934 {
1935 1935 spa_t *spa;
1936 1936 int replacing = zc->zc_cookie;
1937 1937 nvlist_t *config;
1938 1938 int error;
1939 1939
1940 1940 if ((error = spa_open(zc->zc_name, &spa, FTAG)) != 0)
1941 1941 return (error);
1942 1942
1943 1943 if ((error = get_nvlist(zc->zc_nvlist_conf, zc->zc_nvlist_conf_size,
1944 1944 zc->zc_iflags, &config)) == 0) {
1945 1945 error = spa_vdev_attach(spa, zc->zc_guid, config, replacing);
1946 1946 nvlist_free(config);
1947 1947 }
1948 1948
1949 1949 spa_close(spa, FTAG);
1950 1950 return (error);
1951 1951 }
1952 1952
1953 1953 static int
1954 1954 zfs_ioc_vdev_detach(zfs_cmd_t *zc)
1955 1955 {
1956 1956 spa_t *spa;
1957 1957 int error;
1958 1958
1959 1959 if ((error = spa_open(zc->zc_name, &spa, FTAG)) != 0)
1960 1960 return (error);
1961 1961
1962 1962 error = spa_vdev_detach(spa, zc->zc_guid, 0, B_FALSE);
1963 1963
1964 1964 spa_close(spa, FTAG);
1965 1965 return (error);
1966 1966 }
1967 1967
1968 1968 static int
1969 1969 zfs_ioc_vdev_split(zfs_cmd_t *zc)
1970 1970 {
1971 1971 spa_t *spa;
1972 1972 nvlist_t *config, *props = NULL;
1973 1973 int error;
1974 1974 boolean_t exp = !!(zc->zc_cookie & ZPOOL_EXPORT_AFTER_SPLIT);
1975 1975
1976 1976 if ((error = spa_open(zc->zc_name, &spa, FTAG)) != 0)
1977 1977 return (error);
1978 1978
1979 1979 if (error = get_nvlist(zc->zc_nvlist_conf, zc->zc_nvlist_conf_size,
1980 1980 zc->zc_iflags, &config)) {
1981 1981 spa_close(spa, FTAG);
1982 1982 return (error);
1983 1983 }
1984 1984
1985 1985 if (zc->zc_nvlist_src_size != 0 && (error =
1986 1986 get_nvlist(zc->zc_nvlist_src, zc->zc_nvlist_src_size,
1987 1987 zc->zc_iflags, &props))) {
1988 1988 spa_close(spa, FTAG);
1989 1989 nvlist_free(config);
1990 1990 return (error);
1991 1991 }
1992 1992
1993 1993 error = spa_vdev_split_mirror(spa, zc->zc_string, config, props, exp);
1994 1994
1995 1995 spa_close(spa, FTAG);
1996 1996
1997 1997 nvlist_free(config);
1998 1998 nvlist_free(props);
1999 1999
2000 2000 return (error);
2001 2001 }
2002 2002
2003 2003 static int
2004 2004 zfs_ioc_vdev_setpath(zfs_cmd_t *zc)
2005 2005 {
2006 2006 spa_t *spa;
2007 2007 char *path = zc->zc_value;
2008 2008 uint64_t guid = zc->zc_guid;
2009 2009 int error;
2010 2010
2011 2011 error = spa_open(zc->zc_name, &spa, FTAG);
2012 2012 if (error != 0)
2013 2013 return (error);
2014 2014
2015 2015 error = spa_vdev_setpath(spa, guid, path);
2016 2016 spa_close(spa, FTAG);
2017 2017 return (error);
2018 2018 }
2019 2019
2020 2020 static int
2021 2021 zfs_ioc_vdev_setfru(zfs_cmd_t *zc)
2022 2022 {
2023 2023 spa_t *spa;
2024 2024 char *fru = zc->zc_value;
2025 2025 uint64_t guid = zc->zc_guid;
2026 2026 int error;
2027 2027
2028 2028 error = spa_open(zc->zc_name, &spa, FTAG);
2029 2029 if (error != 0)
2030 2030 return (error);
2031 2031
2032 2032 error = spa_vdev_setfru(spa, guid, fru);
2033 2033 spa_close(spa, FTAG);
2034 2034 return (error);
2035 2035 }
2036 2036
2037 2037 static int
2038 2038 zfs_ioc_objset_stats_impl(zfs_cmd_t *zc, objset_t *os)
2039 2039 {
2040 2040 int error = 0;
2041 2041 nvlist_t *nv;
2042 2042
2043 2043 dmu_objset_fast_stat(os, &zc->zc_objset_stats);
2044 2044
2045 2045 if (zc->zc_nvlist_dst != 0 &&
2046 2046 (error = dsl_prop_get_all(os, &nv)) == 0) {
2047 2047 dmu_objset_stats(os, nv);
2048 2048 /*
2049 2049 * NB: zvol_get_stats() will read the objset contents,
2050 2050 * which we aren't supposed to do with a
2051 2051 * DS_MODE_USER hold, because it could be
2052 2052 * inconsistent. So this is a bit of a workaround...
2053 2053 * XXX reading with out owning
2054 2054 */
2055 2055 if (!zc->zc_objset_stats.dds_inconsistent &&
2056 2056 dmu_objset_type(os) == DMU_OST_ZVOL) {
2057 2057 error = zvol_get_stats(os, nv);
2058 2058 if (error == EIO)
2059 2059 return (error);
2060 2060 VERIFY0(error);
2061 2061 }
2062 2062 error = put_nvlist(zc, nv);
2063 2063 nvlist_free(nv);
2064 2064 }
2065 2065
2066 2066 return (error);
2067 2067 }
2068 2068
2069 2069 /*
2070 2070 * inputs:
2071 2071 * zc_name name of filesystem
2072 2072 * zc_nvlist_dst_size size of buffer for property nvlist
2073 2073 *
2074 2074 * outputs:
2075 2075 * zc_objset_stats stats
2076 2076 * zc_nvlist_dst property nvlist
2077 2077 * zc_nvlist_dst_size size of property nvlist
2078 2078 */
2079 2079 static int
2080 2080 zfs_ioc_objset_stats(zfs_cmd_t *zc)
2081 2081 {
2082 2082 objset_t *os;
2083 2083 int error;
2084 2084
2085 2085 error = dmu_objset_hold(zc->zc_name, FTAG, &os);
2086 2086 if (error == 0) {
2087 2087 error = zfs_ioc_objset_stats_impl(zc, os);
2088 2088 dmu_objset_rele(os, FTAG);
2089 2089 }
2090 2090
2091 2091 return (error);
2092 2092 }
2093 2093
2094 2094 /*
2095 2095 * inputs:
2096 2096 * zc_name name of filesystem
2097 2097 * zc_nvlist_dst_size size of buffer for property nvlist
2098 2098 *
2099 2099 * outputs:
2100 2100 * zc_nvlist_dst received property nvlist
2101 2101 * zc_nvlist_dst_size size of received property nvlist
2102 2102 *
2103 2103 * Gets received properties (distinct from local properties on or after
2104 2104 * SPA_VERSION_RECVD_PROPS) for callers who want to differentiate received from
2105 2105 * local property values.
2106 2106 */
2107 2107 static int
2108 2108 zfs_ioc_objset_recvd_props(zfs_cmd_t *zc)
2109 2109 {
2110 2110 int error = 0;
2111 2111 nvlist_t *nv;
2112 2112
2113 2113 /*
2114 2114 * Without this check, we would return local property values if the
2115 2115 * caller has not already received properties on or after
2116 2116 * SPA_VERSION_RECVD_PROPS.
2117 2117 */
2118 2118 if (!dsl_prop_get_hasrecvd(zc->zc_name))
2119 2119 return (SET_ERROR(ENOTSUP));
2120 2120
2121 2121 if (zc->zc_nvlist_dst != 0 &&
2122 2122 (error = dsl_prop_get_received(zc->zc_name, &nv)) == 0) {
2123 2123 error = put_nvlist(zc, nv);
2124 2124 nvlist_free(nv);
2125 2125 }
2126 2126
2127 2127 return (error);
2128 2128 }
2129 2129
2130 2130 static int
2131 2131 nvl_add_zplprop(objset_t *os, nvlist_t *props, zfs_prop_t prop)
2132 2132 {
2133 2133 uint64_t value;
2134 2134 int error;
2135 2135
2136 2136 /*
2137 2137 * zfs_get_zplprop() will either find a value or give us
2138 2138 * the default value (if there is one).
2139 2139 */
2140 2140 if ((error = zfs_get_zplprop(os, prop, &value)) != 0)
2141 2141 return (error);
2142 2142 VERIFY(nvlist_add_uint64(props, zfs_prop_to_name(prop), value) == 0);
2143 2143 return (0);
2144 2144 }
2145 2145
2146 2146 /*
2147 2147 * inputs:
2148 2148 * zc_name name of filesystem
2149 2149 * zc_nvlist_dst_size size of buffer for zpl property nvlist
2150 2150 *
2151 2151 * outputs:
2152 2152 * zc_nvlist_dst zpl property nvlist
2153 2153 * zc_nvlist_dst_size size of zpl property nvlist
2154 2154 */
2155 2155 static int
2156 2156 zfs_ioc_objset_zplprops(zfs_cmd_t *zc)
2157 2157 {
2158 2158 objset_t *os;
2159 2159 int err;
2160 2160
2161 2161 /* XXX reading without owning */
2162 2162 if (err = dmu_objset_hold(zc->zc_name, FTAG, &os))
2163 2163 return (err);
2164 2164
2165 2165 dmu_objset_fast_stat(os, &zc->zc_objset_stats);
2166 2166
2167 2167 /*
2168 2168 * NB: nvl_add_zplprop() will read the objset contents,
2169 2169 * which we aren't supposed to do with a DS_MODE_USER
2170 2170 * hold, because it could be inconsistent.
2171 2171 */
2172 2172 if (zc->zc_nvlist_dst != NULL &&
2173 2173 !zc->zc_objset_stats.dds_inconsistent &&
2174 2174 dmu_objset_type(os) == DMU_OST_ZFS) {
2175 2175 nvlist_t *nv;
2176 2176
2177 2177 VERIFY(nvlist_alloc(&nv, NV_UNIQUE_NAME, KM_SLEEP) == 0);
2178 2178 if ((err = nvl_add_zplprop(os, nv, ZFS_PROP_VERSION)) == 0 &&
2179 2179 (err = nvl_add_zplprop(os, nv, ZFS_PROP_NORMALIZE)) == 0 &&
2180 2180 (err = nvl_add_zplprop(os, nv, ZFS_PROP_UTF8ONLY)) == 0 &&
2181 2181 (err = nvl_add_zplprop(os, nv, ZFS_PROP_CASE)) == 0)
2182 2182 err = put_nvlist(zc, nv);
2183 2183 nvlist_free(nv);
2184 2184 } else {
2185 2185 err = SET_ERROR(ENOENT);
2186 2186 }
2187 2187 dmu_objset_rele(os, FTAG);
2188 2188 return (err);
2189 2189 }
2190 2190
2191 2191 static boolean_t
2192 2192 dataset_name_hidden(const char *name)
2193 2193 {
2194 2194 /*
2195 2195 * Skip over datasets that are not visible in this zone,
2196 2196 * internal datasets (which have a $ in their name), and
2197 2197 * temporary datasets (which have a % in their name).
2198 2198 */
2199 2199 if (strchr(name, '$') != NULL)
2200 2200 return (B_TRUE);
2201 2201 if (strchr(name, '%') != NULL)
2202 2202 return (B_TRUE);
2203 2203 if (!INGLOBALZONE(curproc) && !zone_dataset_visible(name, NULL))
2204 2204 return (B_TRUE);
2205 2205 return (B_FALSE);
2206 2206 }
2207 2207
2208 2208 /*
2209 2209 * inputs:
2210 2210 * zc_name name of filesystem
2211 2211 * zc_cookie zap cursor
2212 2212 * zc_nvlist_dst_size size of buffer for property nvlist
2213 2213 *
2214 2214 * outputs:
2215 2215 * zc_name name of next filesystem
2216 2216 * zc_cookie zap cursor
2217 2217 * zc_objset_stats stats
2218 2218 * zc_nvlist_dst property nvlist
2219 2219 * zc_nvlist_dst_size size of property nvlist
2220 2220 */
2221 2221 static int
2222 2222 zfs_ioc_dataset_list_next(zfs_cmd_t *zc)
2223 2223 {
2224 2224 objset_t *os;
2225 2225 int error;
2226 2226 char *p;
2227 2227 size_t orig_len = strlen(zc->zc_name);
2228 2228
2229 2229 top:
2230 2230 if (error = dmu_objset_hold(zc->zc_name, FTAG, &os)) {
2231 2231 if (error == ENOENT)
2232 2232 error = SET_ERROR(ESRCH);
2233 2233 return (error);
2234 2234 }
2235 2235
2236 2236 p = strrchr(zc->zc_name, '/');
2237 2237 if (p == NULL || p[1] != '\0')
2238 2238 (void) strlcat(zc->zc_name, "/", sizeof (zc->zc_name));
2239 2239 p = zc->zc_name + strlen(zc->zc_name);
2240 2240
2241 2241 do {
2242 2242 error = dmu_dir_list_next(os,
2243 2243 sizeof (zc->zc_name) - (p - zc->zc_name), p,
2244 2244 NULL, &zc->zc_cookie);
2245 2245 if (error == ENOENT)
2246 2246 error = SET_ERROR(ESRCH);
2247 2247 } while (error == 0 && dataset_name_hidden(zc->zc_name));
2248 2248 dmu_objset_rele(os, FTAG);
2249 2249
2250 2250 /*
2251 2251 * If it's an internal dataset (ie. with a '$' in its name),
2252 2252 * don't try to get stats for it, otherwise we'll return ENOENT.
2253 2253 */
2254 2254 if (error == 0 && strchr(zc->zc_name, '$') == NULL) {
2255 2255 error = zfs_ioc_objset_stats(zc); /* fill in the stats */
2256 2256 if (error == ENOENT) {
2257 2257 /* We lost a race with destroy, get the next one. */
2258 2258 zc->zc_name[orig_len] = '\0';
2259 2259 goto top;
2260 2260 }
2261 2261 }
2262 2262 return (error);
2263 2263 }
2264 2264
2265 2265 /*
2266 2266 * inputs:
2267 2267 * zc_name name of filesystem
2268 2268 * zc_cookie zap cursor
2269 2269 * zc_nvlist_dst_size size of buffer for property nvlist
2270 2270 *
2271 2271 * outputs:
2272 2272 * zc_name name of next snapshot
2273 2273 * zc_objset_stats stats
2274 2274 * zc_nvlist_dst property nvlist
2275 2275 * zc_nvlist_dst_size size of property nvlist
2276 2276 */
2277 2277 static int
2278 2278 zfs_ioc_snapshot_list_next(zfs_cmd_t *zc)
2279 2279 {
2280 2280 objset_t *os;
2281 2281 int error;
2282 2282
2283 2283 error = dmu_objset_hold(zc->zc_name, FTAG, &os);
2284 2284 if (error != 0) {
2285 2285 return (error == ENOENT ? ESRCH : error);
2286 2286 }
2287 2287
2288 2288 /*
2289 2289 * A dataset name of maximum length cannot have any snapshots,
2290 2290 * so exit immediately.
2291 2291 */
2292 2292 if (strlcat(zc->zc_name, "@", sizeof (zc->zc_name)) >= MAXNAMELEN) {
2293 2293 dmu_objset_rele(os, FTAG);
2294 2294 return (SET_ERROR(ESRCH));
2295 2295 }
2296 2296
2297 2297 error = dmu_snapshot_list_next(os,
2298 2298 sizeof (zc->zc_name) - strlen(zc->zc_name),
2299 2299 zc->zc_name + strlen(zc->zc_name), &zc->zc_obj, &zc->zc_cookie,
2300 2300 NULL);
2301 2301
2302 2302 if (error == 0) {
2303 2303 dsl_dataset_t *ds;
2304 2304 dsl_pool_t *dp = os->os_dsl_dataset->ds_dir->dd_pool;
2305 2305
2306 2306 error = dsl_dataset_hold_obj(dp, zc->zc_obj, FTAG, &ds);
2307 2307 if (error == 0) {
2308 2308 objset_t *ossnap;
2309 2309
2310 2310 error = dmu_objset_from_ds(ds, &ossnap);
2311 2311 if (error == 0)
2312 2312 error = zfs_ioc_objset_stats_impl(zc, ossnap);
2313 2313 dsl_dataset_rele(ds, FTAG);
2314 2314 }
2315 2315 } else if (error == ENOENT) {
2316 2316 error = SET_ERROR(ESRCH);
2317 2317 }
2318 2318
2319 2319 dmu_objset_rele(os, FTAG);
2320 2320 /* if we failed, undo the @ that we tacked on to zc_name */
2321 2321 if (error != 0)
2322 2322 *strchr(zc->zc_name, '@') = '\0';
2323 2323 return (error);
2324 2324 }
2325 2325
2326 2326 static int
2327 2327 zfs_prop_set_userquota(const char *dsname, nvpair_t *pair)
2328 2328 {
2329 2329 const char *propname = nvpair_name(pair);
2330 2330 uint64_t *valary;
2331 2331 unsigned int vallen;
2332 2332 const char *domain;
2333 2333 char *dash;
2334 2334 zfs_userquota_prop_t type;
2335 2335 uint64_t rid;
2336 2336 uint64_t quota;
2337 2337 zfsvfs_t *zfsvfs;
2338 2338 int err;
2339 2339
2340 2340 if (nvpair_type(pair) == DATA_TYPE_NVLIST) {
2341 2341 nvlist_t *attrs;
2342 2342 VERIFY(nvpair_value_nvlist(pair, &attrs) == 0);
2343 2343 if (nvlist_lookup_nvpair(attrs, ZPROP_VALUE,
2344 2344 &pair) != 0)
2345 2345 return (SET_ERROR(EINVAL));
2346 2346 }
2347 2347
2348 2348 /*
2349 2349 * A correctly constructed propname is encoded as
2350 2350 * userquota@<rid>-<domain>.
2351 2351 */
2352 2352 if ((dash = strchr(propname, '-')) == NULL ||
2353 2353 nvpair_value_uint64_array(pair, &valary, &vallen) != 0 ||
2354 2354 vallen != 3)
2355 2355 return (SET_ERROR(EINVAL));
2356 2356
2357 2357 domain = dash + 1;
2358 2358 type = valary[0];
2359 2359 rid = valary[1];
2360 2360 quota = valary[2];
2361 2361
2362 2362 err = zfsvfs_hold(dsname, FTAG, &zfsvfs, B_FALSE);
2363 2363 if (err == 0) {
2364 2364 err = zfs_set_userquota(zfsvfs, type, domain, rid, quota);
2365 2365 zfsvfs_rele(zfsvfs, FTAG);
2366 2366 }
2367 2367
2368 2368 return (err);
2369 2369 }
2370 2370
2371 2371 /*
2372 2372 * If the named property is one that has a special function to set its value,
2373 2373 * return 0 on success and a positive error code on failure; otherwise if it is
2374 2374 * not one of the special properties handled by this function, return -1.
2375 2375 *
2376 2376 * XXX: It would be better for callers of the property interface if we handled
2377 2377 * these special cases in dsl_prop.c (in the dsl layer).
2378 2378 */
2379 2379 static int
2380 2380 zfs_prop_set_special(const char *dsname, zprop_source_t source,
2381 2381 nvpair_t *pair)
2382 2382 {
2383 2383 const char *propname = nvpair_name(pair);
2384 2384 zfs_prop_t prop = zfs_name_to_prop(propname);
2385 2385 uint64_t intval;
2386 2386 int err = -1;
2387 2387
2388 2388 if (prop == ZPROP_INVAL) {
2389 2389 if (zfs_prop_userquota(propname))
2390 2390 return (zfs_prop_set_userquota(dsname, pair));
2391 2391 return (-1);
2392 2392 }
2393 2393
2394 2394 if (nvpair_type(pair) == DATA_TYPE_NVLIST) {
2395 2395 nvlist_t *attrs;
2396 2396 VERIFY(nvpair_value_nvlist(pair, &attrs) == 0);
2397 2397 VERIFY(nvlist_lookup_nvpair(attrs, ZPROP_VALUE,
2398 2398 &pair) == 0);
2399 2399 }
2400 2400
2401 2401 if (zfs_prop_get_type(prop) == PROP_TYPE_STRING)
2402 2402 return (-1);
2403 2403
2404 2404 VERIFY(0 == nvpair_value_uint64(pair, &intval));
2405 2405
2406 2406 switch (prop) {
2407 2407 case ZFS_PROP_QUOTA:
2408 2408 err = dsl_dir_set_quota(dsname, source, intval);
2409 2409 break;
2410 2410 case ZFS_PROP_REFQUOTA:
2411 2411 err = dsl_dataset_set_refquota(dsname, source, intval);
2412 2412 break;
2413 2413 case ZFS_PROP_FILESYSTEM_LIMIT:
2414 2414 case ZFS_PROP_SNAPSHOT_LIMIT:
2415 2415 if (intval == UINT64_MAX) {
2416 2416 /* clearing the limit, just do it */
2417 2417 err = 0;
2418 2418 } else {
2419 2419 err = dsl_dir_activate_fs_ss_limit(dsname);
2420 2420 }
2421 2421 /*
2422 2422 * Set err to -1 to force the zfs_set_prop_nvlist code down the
2423 2423 * default path to set the value in the nvlist.
2424 2424 */
2425 2425 if (err == 0)
2426 2426 err = -1;
2427 2427 break;
2428 2428 case ZFS_PROP_RESERVATION:
2429 2429 err = dsl_dir_set_reservation(dsname, source, intval);
2430 2430 break;
2431 2431 case ZFS_PROP_REFRESERVATION:
2432 2432 err = dsl_dataset_set_refreservation(dsname, source, intval);
2433 2433 break;
2434 2434 case ZFS_PROP_VOLSIZE:
2435 2435 err = zvol_set_volsize(dsname, intval);
2436 2436 break;
2437 2437 case ZFS_PROP_VERSION:
2438 2438 {
2439 2439 zfsvfs_t *zfsvfs;
2440 2440
2441 2441 if ((err = zfsvfs_hold(dsname, FTAG, &zfsvfs, B_TRUE)) != 0)
2442 2442 break;
2443 2443
2444 2444 err = zfs_set_version(zfsvfs, intval);
2445 2445 zfsvfs_rele(zfsvfs, FTAG);
2446 2446
2447 2447 if (err == 0 && intval >= ZPL_VERSION_USERSPACE) {
2448 2448 zfs_cmd_t *zc;
2449 2449
2450 2450 zc = kmem_zalloc(sizeof (zfs_cmd_t), KM_SLEEP);
2451 2451 (void) strcpy(zc->zc_name, dsname);
2452 2452 (void) zfs_ioc_userspace_upgrade(zc);
2453 2453 kmem_free(zc, sizeof (zfs_cmd_t));
2454 2454 }
2455 2455 break;
2456 2456 }
2457 2457 default:
2458 2458 err = -1;
2459 2459 }
2460 2460
2461 2461 return (err);
2462 2462 }
2463 2463
2464 2464 /*
2465 2465 * This function is best effort. If it fails to set any of the given properties,
2466 2466 * it continues to set as many as it can and returns the last error
2467 2467 * encountered. If the caller provides a non-NULL errlist, it will be filled in
2468 2468 * with the list of names of all the properties that failed along with the
2469 2469 * corresponding error numbers.
2470 2470 *
2471 2471 * If every property is set successfully, zero is returned and errlist is not
2472 2472 * modified.
2473 2473 */
2474 2474 int
2475 2475 zfs_set_prop_nvlist(const char *dsname, zprop_source_t source, nvlist_t *nvl,
2476 2476 nvlist_t *errlist)
2477 2477 {
2478 2478 nvpair_t *pair;
2479 2479 nvpair_t *propval;
2480 2480 int rv = 0;
2481 2481 uint64_t intval;
2482 2482 char *strval;
2483 2483 nvlist_t *genericnvl = fnvlist_alloc();
2484 2484 nvlist_t *retrynvl = fnvlist_alloc();
2485 2485
2486 2486 retry:
2487 2487 pair = NULL;
2488 2488 while ((pair = nvlist_next_nvpair(nvl, pair)) != NULL) {
2489 2489 const char *propname = nvpair_name(pair);
2490 2490 zfs_prop_t prop = zfs_name_to_prop(propname);
2491 2491 int err = 0;
2492 2492
2493 2493 /* decode the property value */
2494 2494 propval = pair;
2495 2495 if (nvpair_type(pair) == DATA_TYPE_NVLIST) {
2496 2496 nvlist_t *attrs;
2497 2497 attrs = fnvpair_value_nvlist(pair);
2498 2498 if (nvlist_lookup_nvpair(attrs, ZPROP_VALUE,
2499 2499 &propval) != 0)
2500 2500 err = SET_ERROR(EINVAL);
2501 2501 }
2502 2502
2503 2503 /* Validate value type */
2504 2504 if (err == 0 && prop == ZPROP_INVAL) {
2505 2505 if (zfs_prop_user(propname)) {
2506 2506 if (nvpair_type(propval) != DATA_TYPE_STRING)
2507 2507 err = SET_ERROR(EINVAL);
2508 2508 } else if (zfs_prop_userquota(propname)) {
2509 2509 if (nvpair_type(propval) !=
2510 2510 DATA_TYPE_UINT64_ARRAY)
2511 2511 err = SET_ERROR(EINVAL);
2512 2512 } else {
2513 2513 err = SET_ERROR(EINVAL);
2514 2514 }
2515 2515 } else if (err == 0) {
2516 2516 if (nvpair_type(propval) == DATA_TYPE_STRING) {
2517 2517 if (zfs_prop_get_type(prop) != PROP_TYPE_STRING)
2518 2518 err = SET_ERROR(EINVAL);
2519 2519 } else if (nvpair_type(propval) == DATA_TYPE_UINT64) {
2520 2520 const char *unused;
2521 2521
2522 2522 intval = fnvpair_value_uint64(propval);
2523 2523
2524 2524 switch (zfs_prop_get_type(prop)) {
2525 2525 case PROP_TYPE_NUMBER:
2526 2526 break;
2527 2527 case PROP_TYPE_STRING:
2528 2528 err = SET_ERROR(EINVAL);
2529 2529 break;
2530 2530 case PROP_TYPE_INDEX:
2531 2531 if (zfs_prop_index_to_string(prop,
2532 2532 intval, &unused) != 0)
2533 2533 err = SET_ERROR(EINVAL);
2534 2534 break;
2535 2535 default:
2536 2536 cmn_err(CE_PANIC,
2537 2537 "unknown property type");
2538 2538 }
2539 2539 } else {
2540 2540 err = SET_ERROR(EINVAL);
2541 2541 }
2542 2542 }
2543 2543
2544 2544 /* Validate permissions */
2545 2545 if (err == 0)
2546 2546 err = zfs_check_settable(dsname, pair, CRED());
2547 2547
2548 2548 if (err == 0) {
2549 2549 err = zfs_prop_set_special(dsname, source, pair);
2550 2550 if (err == -1) {
2551 2551 /*
2552 2552 * For better performance we build up a list of
2553 2553 * properties to set in a single transaction.
2554 2554 */
2555 2555 err = nvlist_add_nvpair(genericnvl, pair);
2556 2556 } else if (err != 0 && nvl != retrynvl) {
2557 2557 /*
2558 2558 * This may be a spurious error caused by
2559 2559 * receiving quota and reservation out of order.
2560 2560 * Try again in a second pass.
2561 2561 */
2562 2562 err = nvlist_add_nvpair(retrynvl, pair);
2563 2563 }
2564 2564 }
2565 2565
2566 2566 if (err != 0) {
2567 2567 if (errlist != NULL)
2568 2568 fnvlist_add_int32(errlist, propname, err);
2569 2569 rv = err;
2570 2570 }
2571 2571 }
2572 2572
2573 2573 if (nvl != retrynvl && !nvlist_empty(retrynvl)) {
2574 2574 nvl = retrynvl;
2575 2575 goto retry;
2576 2576 }
2577 2577
2578 2578 if (!nvlist_empty(genericnvl) &&
2579 2579 dsl_props_set(dsname, source, genericnvl) != 0) {
2580 2580 /*
2581 2581 * If this fails, we still want to set as many properties as we
2582 2582 * can, so try setting them individually.
2583 2583 */
2584 2584 pair = NULL;
2585 2585 while ((pair = nvlist_next_nvpair(genericnvl, pair)) != NULL) {
2586 2586 const char *propname = nvpair_name(pair);
2587 2587 int err = 0;
2588 2588
2589 2589 propval = pair;
2590 2590 if (nvpair_type(pair) == DATA_TYPE_NVLIST) {
2591 2591 nvlist_t *attrs;
2592 2592 attrs = fnvpair_value_nvlist(pair);
2593 2593 propval = fnvlist_lookup_nvpair(attrs,
2594 2594 ZPROP_VALUE);
2595 2595 }
2596 2596
2597 2597 if (nvpair_type(propval) == DATA_TYPE_STRING) {
2598 2598 strval = fnvpair_value_string(propval);
2599 2599 err = dsl_prop_set_string(dsname, propname,
2600 2600 source, strval);
2601 2601 } else {
2602 2602 intval = fnvpair_value_uint64(propval);
2603 2603 err = dsl_prop_set_int(dsname, propname, source,
2604 2604 intval);
2605 2605 }
2606 2606
2607 2607 if (err != 0) {
2608 2608 if (errlist != NULL) {
2609 2609 fnvlist_add_int32(errlist, propname,
2610 2610 err);
2611 2611 }
2612 2612 rv = err;
2613 2613 }
2614 2614 }
2615 2615 }
2616 2616 nvlist_free(genericnvl);
2617 2617 nvlist_free(retrynvl);
2618 2618
2619 2619 return (rv);
2620 2620 }
2621 2621
2622 2622 /*
2623 2623 * Check that all the properties are valid user properties.
2624 2624 */
2625 2625 static int
2626 2626 zfs_check_userprops(const char *fsname, nvlist_t *nvl)
2627 2627 {
2628 2628 nvpair_t *pair = NULL;
2629 2629 int error = 0;
2630 2630
2631 2631 while ((pair = nvlist_next_nvpair(nvl, pair)) != NULL) {
2632 2632 const char *propname = nvpair_name(pair);
2633 2633
2634 2634 if (!zfs_prop_user(propname) ||
2635 2635 nvpair_type(pair) != DATA_TYPE_STRING)
2636 2636 return (SET_ERROR(EINVAL));
2637 2637
2638 2638 if (error = zfs_secpolicy_write_perms(fsname,
2639 2639 ZFS_DELEG_PERM_USERPROP, CRED()))
2640 2640 return (error);
2641 2641
2642 2642 if (strlen(propname) >= ZAP_MAXNAMELEN)
2643 2643 return (SET_ERROR(ENAMETOOLONG));
2644 2644
2645 2645 if (strlen(fnvpair_value_string(pair)) >= ZAP_MAXVALUELEN)
2646 2646 return (E2BIG);
2647 2647 }
2648 2648 return (0);
2649 2649 }
2650 2650
2651 2651 static void
2652 2652 props_skip(nvlist_t *props, nvlist_t *skipped, nvlist_t **newprops)
2653 2653 {
2654 2654 nvpair_t *pair;
2655 2655
2656 2656 VERIFY(nvlist_alloc(newprops, NV_UNIQUE_NAME, KM_SLEEP) == 0);
2657 2657
2658 2658 pair = NULL;
2659 2659 while ((pair = nvlist_next_nvpair(props, pair)) != NULL) {
2660 2660 if (nvlist_exists(skipped, nvpair_name(pair)))
2661 2661 continue;
2662 2662
2663 2663 VERIFY(nvlist_add_nvpair(*newprops, pair) == 0);
2664 2664 }
2665 2665 }
2666 2666
2667 2667 static int
2668 2668 clear_received_props(const char *dsname, nvlist_t *props,
2669 2669 nvlist_t *skipped)
2670 2670 {
2671 2671 int err = 0;
2672 2672 nvlist_t *cleared_props = NULL;
2673 2673 props_skip(props, skipped, &cleared_props);
2674 2674 if (!nvlist_empty(cleared_props)) {
2675 2675 /*
2676 2676 * Acts on local properties until the dataset has received
2677 2677 * properties at least once on or after SPA_VERSION_RECVD_PROPS.
2678 2678 */
2679 2679 zprop_source_t flags = (ZPROP_SRC_NONE |
2680 2680 (dsl_prop_get_hasrecvd(dsname) ? ZPROP_SRC_RECEIVED : 0));
2681 2681 err = zfs_set_prop_nvlist(dsname, flags, cleared_props, NULL);
2682 2682 }
2683 2683 nvlist_free(cleared_props);
2684 2684 return (err);
2685 2685 }
2686 2686
2687 2687 /*
2688 2688 * inputs:
2689 2689 * zc_name name of filesystem
2690 2690 * zc_value name of property to set
2691 2691 * zc_nvlist_src{_size} nvlist of properties to apply
2692 2692 * zc_cookie received properties flag
2693 2693 *
2694 2694 * outputs:
2695 2695 * zc_nvlist_dst{_size} error for each unapplied received property
2696 2696 */
2697 2697 static int
2698 2698 zfs_ioc_set_prop(zfs_cmd_t *zc)
2699 2699 {
2700 2700 nvlist_t *nvl;
2701 2701 boolean_t received = zc->zc_cookie;
2702 2702 zprop_source_t source = (received ? ZPROP_SRC_RECEIVED :
2703 2703 ZPROP_SRC_LOCAL);
2704 2704 nvlist_t *errors;
2705 2705 int error;
2706 2706
2707 2707 if ((error = get_nvlist(zc->zc_nvlist_src, zc->zc_nvlist_src_size,
2708 2708 zc->zc_iflags, &nvl)) != 0)
2709 2709 return (error);
2710 2710
2711 2711 if (received) {
2712 2712 nvlist_t *origprops;
2713 2713
2714 2714 if (dsl_prop_get_received(zc->zc_name, &origprops) == 0) {
2715 2715 (void) clear_received_props(zc->zc_name,
2716 2716 origprops, nvl);
2717 2717 nvlist_free(origprops);
2718 2718 }
2719 2719
2720 2720 error = dsl_prop_set_hasrecvd(zc->zc_name);
2721 2721 }
2722 2722
2723 2723 errors = fnvlist_alloc();
2724 2724 if (error == 0)
2725 2725 error = zfs_set_prop_nvlist(zc->zc_name, source, nvl, errors);
2726 2726
2727 2727 if (zc->zc_nvlist_dst != NULL && errors != NULL) {
2728 2728 (void) put_nvlist(zc, errors);
2729 2729 }
2730 2730
2731 2731 nvlist_free(errors);
2732 2732 nvlist_free(nvl);
2733 2733 return (error);
2734 2734 }
2735 2735
2736 2736 /*
2737 2737 * inputs:
2738 2738 * zc_name name of filesystem
2739 2739 * zc_value name of property to inherit
2740 2740 * zc_cookie revert to received value if TRUE
2741 2741 *
2742 2742 * outputs: none
2743 2743 */
2744 2744 static int
2745 2745 zfs_ioc_inherit_prop(zfs_cmd_t *zc)
2746 2746 {
2747 2747 const char *propname = zc->zc_value;
2748 2748 zfs_prop_t prop = zfs_name_to_prop(propname);
2749 2749 boolean_t received = zc->zc_cookie;
2750 2750 zprop_source_t source = (received
2751 2751 ? ZPROP_SRC_NONE /* revert to received value, if any */
2752 2752 : ZPROP_SRC_INHERITED); /* explicitly inherit */
2753 2753
2754 2754 if (received) {
2755 2755 nvlist_t *dummy;
2756 2756 nvpair_t *pair;
2757 2757 zprop_type_t type;
2758 2758 int err;
2759 2759
2760 2760 /*
2761 2761 * zfs_prop_set_special() expects properties in the form of an
2762 2762 * nvpair with type info.
2763 2763 */
2764 2764 if (prop == ZPROP_INVAL) {
2765 2765 if (!zfs_prop_user(propname))
2766 2766 return (SET_ERROR(EINVAL));
2767 2767
2768 2768 type = PROP_TYPE_STRING;
2769 2769 } else if (prop == ZFS_PROP_VOLSIZE ||
2770 2770 prop == ZFS_PROP_VERSION) {
2771 2771 return (SET_ERROR(EINVAL));
2772 2772 } else {
2773 2773 type = zfs_prop_get_type(prop);
2774 2774 }
2775 2775
2776 2776 VERIFY(nvlist_alloc(&dummy, NV_UNIQUE_NAME, KM_SLEEP) == 0);
2777 2777
2778 2778 switch (type) {
2779 2779 case PROP_TYPE_STRING:
2780 2780 VERIFY(0 == nvlist_add_string(dummy, propname, ""));
2781 2781 break;
2782 2782 case PROP_TYPE_NUMBER:
2783 2783 case PROP_TYPE_INDEX:
2784 2784 VERIFY(0 == nvlist_add_uint64(dummy, propname, 0));
2785 2785 break;
2786 2786 default:
2787 2787 nvlist_free(dummy);
2788 2788 return (SET_ERROR(EINVAL));
2789 2789 }
2790 2790
2791 2791 pair = nvlist_next_nvpair(dummy, NULL);
2792 2792 err = zfs_prop_set_special(zc->zc_name, source, pair);
2793 2793 nvlist_free(dummy);
2794 2794 if (err != -1)
2795 2795 return (err); /* special property already handled */
2796 2796 } else {
2797 2797 /*
2798 2798 * Only check this in the non-received case. We want to allow
2799 2799 * 'inherit -S' to revert non-inheritable properties like quota
2800 2800 * and reservation to the received or default values even though
2801 2801 * they are not considered inheritable.
2802 2802 */
2803 2803 if (prop != ZPROP_INVAL && !zfs_prop_inheritable(prop))
2804 2804 return (SET_ERROR(EINVAL));
2805 2805 }
2806 2806
2807 2807 /* property name has been validated by zfs_secpolicy_inherit_prop() */
2808 2808 return (dsl_prop_inherit(zc->zc_name, zc->zc_value, source));
2809 2809 }
2810 2810
2811 2811 static int
2812 2812 zfs_ioc_pool_set_props(zfs_cmd_t *zc)
2813 2813 {
2814 2814 nvlist_t *props;
2815 2815 spa_t *spa;
2816 2816 int error;
2817 2817 nvpair_t *pair;
2818 2818
2819 2819 if (error = get_nvlist(zc->zc_nvlist_src, zc->zc_nvlist_src_size,
2820 2820 zc->zc_iflags, &props))
2821 2821 return (error);
2822 2822
2823 2823 /*
2824 2824 * If the only property is the configfile, then just do a spa_lookup()
2825 2825 * to handle the faulted case.
2826 2826 */
2827 2827 pair = nvlist_next_nvpair(props, NULL);
2828 2828 if (pair != NULL && strcmp(nvpair_name(pair),
2829 2829 zpool_prop_to_name(ZPOOL_PROP_CACHEFILE)) == 0 &&
2830 2830 nvlist_next_nvpair(props, pair) == NULL) {
2831 2831 mutex_enter(&spa_namespace_lock);
2832 2832 if ((spa = spa_lookup(zc->zc_name)) != NULL) {
2833 2833 spa_configfile_set(spa, props, B_FALSE);
2834 2834 spa_config_sync(spa, B_FALSE, B_TRUE);
2835 2835 }
2836 2836 mutex_exit(&spa_namespace_lock);
2837 2837 if (spa != NULL) {
2838 2838 nvlist_free(props);
2839 2839 return (0);
2840 2840 }
2841 2841 }
2842 2842
2843 2843 if ((error = spa_open(zc->zc_name, &spa, FTAG)) != 0) {
2844 2844 nvlist_free(props);
2845 2845 return (error);
2846 2846 }
2847 2847
2848 2848 error = spa_prop_set(spa, props);
2849 2849
2850 2850 nvlist_free(props);
2851 2851 spa_close(spa, FTAG);
2852 2852
2853 2853 return (error);
2854 2854 }
2855 2855
2856 2856 static int
2857 2857 zfs_ioc_pool_get_props(zfs_cmd_t *zc)
2858 2858 {
2859 2859 spa_t *spa;
2860 2860 int error;
2861 2861 nvlist_t *nvp = NULL;
2862 2862
2863 2863 if ((error = spa_open(zc->zc_name, &spa, FTAG)) != 0) {
2864 2864 /*
2865 2865 * If the pool is faulted, there may be properties we can still
2866 2866 * get (such as altroot and cachefile), so attempt to get them
2867 2867 * anyway.
2868 2868 */
2869 2869 mutex_enter(&spa_namespace_lock);
2870 2870 if ((spa = spa_lookup(zc->zc_name)) != NULL)
2871 2871 error = spa_prop_get(spa, &nvp);
2872 2872 mutex_exit(&spa_namespace_lock);
2873 2873 } else {
2874 2874 error = spa_prop_get(spa, &nvp);
2875 2875 spa_close(spa, FTAG);
2876 2876 }
2877 2877
2878 2878 if (error == 0 && zc->zc_nvlist_dst != NULL)
2879 2879 error = put_nvlist(zc, nvp);
2880 2880 else
2881 2881 error = SET_ERROR(EFAULT);
2882 2882
2883 2883 nvlist_free(nvp);
2884 2884 return (error);
2885 2885 }
2886 2886
2887 2887 /*
2888 2888 * inputs:
2889 2889 * zc_name name of filesystem
2890 2890 * zc_nvlist_src{_size} nvlist of delegated permissions
2891 2891 * zc_perm_action allow/unallow flag
2892 2892 *
2893 2893 * outputs: none
2894 2894 */
2895 2895 static int
2896 2896 zfs_ioc_set_fsacl(zfs_cmd_t *zc)
2897 2897 {
2898 2898 int error;
2899 2899 nvlist_t *fsaclnv = NULL;
2900 2900
2901 2901 if ((error = get_nvlist(zc->zc_nvlist_src, zc->zc_nvlist_src_size,
2902 2902 zc->zc_iflags, &fsaclnv)) != 0)
2903 2903 return (error);
2904 2904
2905 2905 /*
2906 2906 * Verify nvlist is constructed correctly
2907 2907 */
2908 2908 if ((error = zfs_deleg_verify_nvlist(fsaclnv)) != 0) {
2909 2909 nvlist_free(fsaclnv);
2910 2910 return (SET_ERROR(EINVAL));
2911 2911 }
2912 2912
2913 2913 /*
2914 2914 * If we don't have PRIV_SYS_MOUNT, then validate
2915 2915 * that user is allowed to hand out each permission in
2916 2916 * the nvlist(s)
2917 2917 */
2918 2918
2919 2919 error = secpolicy_zfs(CRED());
2920 2920 if (error != 0) {
2921 2921 if (zc->zc_perm_action == B_FALSE) {
2922 2922 error = dsl_deleg_can_allow(zc->zc_name,
2923 2923 fsaclnv, CRED());
2924 2924 } else {
2925 2925 error = dsl_deleg_can_unallow(zc->zc_name,
2926 2926 fsaclnv, CRED());
2927 2927 }
2928 2928 }
2929 2929
2930 2930 if (error == 0)
2931 2931 error = dsl_deleg_set(zc->zc_name, fsaclnv, zc->zc_perm_action);
2932 2932
2933 2933 nvlist_free(fsaclnv);
2934 2934 return (error);
2935 2935 }
2936 2936
2937 2937 /*
2938 2938 * inputs:
2939 2939 * zc_name name of filesystem
2940 2940 *
2941 2941 * outputs:
2942 2942 * zc_nvlist_src{_size} nvlist of delegated permissions
2943 2943 */
2944 2944 static int
2945 2945 zfs_ioc_get_fsacl(zfs_cmd_t *zc)
2946 2946 {
2947 2947 nvlist_t *nvp;
2948 2948 int error;
2949 2949
2950 2950 if ((error = dsl_deleg_get(zc->zc_name, &nvp)) == 0) {
2951 2951 error = put_nvlist(zc, nvp);
2952 2952 nvlist_free(nvp);
2953 2953 }
2954 2954
2955 2955 return (error);
2956 2956 }
2957 2957
2958 2958 /*
2959 2959 * Search the vfs list for a specified resource. Returns a pointer to it
2960 2960 * or NULL if no suitable entry is found. The caller of this routine
2961 2961 * is responsible for releasing the returned vfs pointer.
2962 2962 */
2963 2963 static vfs_t *
2964 2964 zfs_get_vfs(const char *resource)
2965 2965 {
2966 2966 struct vfs *vfsp;
2967 2967 struct vfs *vfs_found = NULL;
2968 2968
2969 2969 vfs_list_read_lock();
2970 2970 vfsp = rootvfs;
2971 2971 do {
2972 2972 if (strcmp(refstr_value(vfsp->vfs_resource), resource) == 0) {
2973 2973 VFS_HOLD(vfsp);
2974 2974 vfs_found = vfsp;
2975 2975 break;
2976 2976 }
2977 2977 vfsp = vfsp->vfs_next;
2978 2978 } while (vfsp != rootvfs);
2979 2979 vfs_list_unlock();
2980 2980 return (vfs_found);
2981 2981 }
2982 2982
2983 2983 /* ARGSUSED */
2984 2984 static void
2985 2985 zfs_create_cb(objset_t *os, void *arg, cred_t *cr, dmu_tx_t *tx)
2986 2986 {
2987 2987 zfs_creat_t *zct = arg;
2988 2988
2989 2989 zfs_create_fs(os, cr, zct->zct_zplprops, tx);
2990 2990 }
2991 2991
2992 2992 #define ZFS_PROP_UNDEFINED ((uint64_t)-1)
2993 2993
2994 2994 /*
2995 2995 * inputs:
2996 2996 * os parent objset pointer (NULL if root fs)
2997 2997 * fuids_ok fuids allowed in this version of the spa?
2998 2998 * sa_ok SAs allowed in this version of the spa?
2999 2999 * createprops list of properties requested by creator
3000 3000 *
3001 3001 * outputs:
3002 3002 * zplprops values for the zplprops we attach to the master node object
3003 3003 * is_ci true if requested file system will be purely case-insensitive
3004 3004 *
3005 3005 * Determine the settings for utf8only, normalization and
3006 3006 * casesensitivity. Specific values may have been requested by the
3007 3007 * creator and/or we can inherit values from the parent dataset. If
3008 3008 * the file system is of too early a vintage, a creator can not
3009 3009 * request settings for these properties, even if the requested
3010 3010 * setting is the default value. We don't actually want to create dsl
3011 3011 * properties for these, so remove them from the source nvlist after
3012 3012 * processing.
3013 3013 */
3014 3014 static int
3015 3015 zfs_fill_zplprops_impl(objset_t *os, uint64_t zplver,
3016 3016 boolean_t fuids_ok, boolean_t sa_ok, nvlist_t *createprops,
3017 3017 nvlist_t *zplprops, boolean_t *is_ci)
3018 3018 {
3019 3019 uint64_t sense = ZFS_PROP_UNDEFINED;
3020 3020 uint64_t norm = ZFS_PROP_UNDEFINED;
3021 3021 uint64_t u8 = ZFS_PROP_UNDEFINED;
3022 3022
3023 3023 ASSERT(zplprops != NULL);
3024 3024
3025 3025 /*
3026 3026 * Pull out creator prop choices, if any.
3027 3027 */
3028 3028 if (createprops) {
3029 3029 (void) nvlist_lookup_uint64(createprops,
3030 3030 zfs_prop_to_name(ZFS_PROP_VERSION), &zplver);
3031 3031 (void) nvlist_lookup_uint64(createprops,
3032 3032 zfs_prop_to_name(ZFS_PROP_NORMALIZE), &norm);
3033 3033 (void) nvlist_remove_all(createprops,
3034 3034 zfs_prop_to_name(ZFS_PROP_NORMALIZE));
3035 3035 (void) nvlist_lookup_uint64(createprops,
3036 3036 zfs_prop_to_name(ZFS_PROP_UTF8ONLY), &u8);
3037 3037 (void) nvlist_remove_all(createprops,
3038 3038 zfs_prop_to_name(ZFS_PROP_UTF8ONLY));
3039 3039 (void) nvlist_lookup_uint64(createprops,
3040 3040 zfs_prop_to_name(ZFS_PROP_CASE), &sense);
3041 3041 (void) nvlist_remove_all(createprops,
3042 3042 zfs_prop_to_name(ZFS_PROP_CASE));
3043 3043 }
3044 3044
3045 3045 /*
3046 3046 * If the zpl version requested is whacky or the file system
3047 3047 * or pool is version is too "young" to support normalization
3048 3048 * and the creator tried to set a value for one of the props,
3049 3049 * error out.
3050 3050 */
3051 3051 if ((zplver < ZPL_VERSION_INITIAL || zplver > ZPL_VERSION) ||
3052 3052 (zplver >= ZPL_VERSION_FUID && !fuids_ok) ||
3053 3053 (zplver >= ZPL_VERSION_SA && !sa_ok) ||
3054 3054 (zplver < ZPL_VERSION_NORMALIZATION &&
3055 3055 (norm != ZFS_PROP_UNDEFINED || u8 != ZFS_PROP_UNDEFINED ||
3056 3056 sense != ZFS_PROP_UNDEFINED)))
3057 3057 return (SET_ERROR(ENOTSUP));
3058 3058
3059 3059 /*
3060 3060 * Put the version in the zplprops
3061 3061 */
3062 3062 VERIFY(nvlist_add_uint64(zplprops,
3063 3063 zfs_prop_to_name(ZFS_PROP_VERSION), zplver) == 0);
3064 3064
3065 3065 if (norm == ZFS_PROP_UNDEFINED)
3066 3066 VERIFY(zfs_get_zplprop(os, ZFS_PROP_NORMALIZE, &norm) == 0);
3067 3067 VERIFY(nvlist_add_uint64(zplprops,
3068 3068 zfs_prop_to_name(ZFS_PROP_NORMALIZE), norm) == 0);
3069 3069
3070 3070 /*
3071 3071 * If we're normalizing, names must always be valid UTF-8 strings.
3072 3072 */
3073 3073 if (norm)
3074 3074 u8 = 1;
3075 3075 if (u8 == ZFS_PROP_UNDEFINED)
3076 3076 VERIFY(zfs_get_zplprop(os, ZFS_PROP_UTF8ONLY, &u8) == 0);
3077 3077 VERIFY(nvlist_add_uint64(zplprops,
3078 3078 zfs_prop_to_name(ZFS_PROP_UTF8ONLY), u8) == 0);
3079 3079
3080 3080 if (sense == ZFS_PROP_UNDEFINED)
3081 3081 VERIFY(zfs_get_zplprop(os, ZFS_PROP_CASE, &sense) == 0);
3082 3082 VERIFY(nvlist_add_uint64(zplprops,
3083 3083 zfs_prop_to_name(ZFS_PROP_CASE), sense) == 0);
3084 3084
3085 3085 if (is_ci)
3086 3086 *is_ci = (sense == ZFS_CASE_INSENSITIVE);
3087 3087
3088 3088 return (0);
3089 3089 }
3090 3090
3091 3091 static int
3092 3092 zfs_fill_zplprops(const char *dataset, nvlist_t *createprops,
3093 3093 nvlist_t *zplprops, boolean_t *is_ci)
3094 3094 {
3095 3095 boolean_t fuids_ok, sa_ok;
3096 3096 uint64_t zplver = ZPL_VERSION;
3097 3097 objset_t *os = NULL;
3098 3098 char parentname[MAXNAMELEN];
3099 3099 char *cp;
3100 3100 spa_t *spa;
3101 3101 uint64_t spa_vers;
3102 3102 int error;
3103 3103
3104 3104 (void) strlcpy(parentname, dataset, sizeof (parentname));
3105 3105 cp = strrchr(parentname, '/');
3106 3106 ASSERT(cp != NULL);
3107 3107 cp[0] = '\0';
3108 3108
3109 3109 if ((error = spa_open(dataset, &spa, FTAG)) != 0)
3110 3110 return (error);
3111 3111
3112 3112 spa_vers = spa_version(spa);
3113 3113 spa_close(spa, FTAG);
3114 3114
3115 3115 zplver = zfs_zpl_version_map(spa_vers);
3116 3116 fuids_ok = (zplver >= ZPL_VERSION_FUID);
3117 3117 sa_ok = (zplver >= ZPL_VERSION_SA);
3118 3118
3119 3119 /*
3120 3120 * Open parent object set so we can inherit zplprop values.
3121 3121 */
3122 3122 if ((error = dmu_objset_hold(parentname, FTAG, &os)) != 0)
3123 3123 return (error);
3124 3124
3125 3125 error = zfs_fill_zplprops_impl(os, zplver, fuids_ok, sa_ok, createprops,
3126 3126 zplprops, is_ci);
3127 3127 dmu_objset_rele(os, FTAG);
3128 3128 return (error);
3129 3129 }
3130 3130
3131 3131 static int
3132 3132 zfs_fill_zplprops_root(uint64_t spa_vers, nvlist_t *createprops,
3133 3133 nvlist_t *zplprops, boolean_t *is_ci)
3134 3134 {
3135 3135 boolean_t fuids_ok;
3136 3136 boolean_t sa_ok;
3137 3137 uint64_t zplver = ZPL_VERSION;
3138 3138 int error;
3139 3139
3140 3140 zplver = zfs_zpl_version_map(spa_vers);
3141 3141 fuids_ok = (zplver >= ZPL_VERSION_FUID);
3142 3142 sa_ok = (zplver >= ZPL_VERSION_SA);
3143 3143
3144 3144 error = zfs_fill_zplprops_impl(NULL, zplver, fuids_ok, sa_ok,
3145 3145 createprops, zplprops, is_ci);
3146 3146 return (error);
3147 3147 }
3148 3148
3149 3149 /*
3150 3150 * innvl: {
3151 3151 * "type" -> dmu_objset_type_t (int32)
3152 3152 * (optional) "props" -> { prop -> value }
3153 3153 * }
3154 3154 *
3155 3155 * outnvl: propname -> error code (int32)
3156 3156 */
3157 3157 static int
3158 3158 zfs_ioc_create(const char *fsname, nvlist_t *innvl, nvlist_t *outnvl)
3159 3159 {
3160 3160 int error = 0;
3161 3161 zfs_creat_t zct = { 0 };
3162 3162 nvlist_t *nvprops = NULL;
3163 3163 void (*cbfunc)(objset_t *os, void *arg, cred_t *cr, dmu_tx_t *tx);
3164 3164 int32_t type32;
3165 3165 dmu_objset_type_t type;
3166 3166 boolean_t is_insensitive = B_FALSE;
3167 3167
3168 3168 if (nvlist_lookup_int32(innvl, "type", &type32) != 0)
3169 3169 return (SET_ERROR(EINVAL));
3170 3170 type = type32;
3171 3171 (void) nvlist_lookup_nvlist(innvl, "props", &nvprops);
3172 3172
3173 3173 switch (type) {
3174 3174 case DMU_OST_ZFS:
3175 3175 cbfunc = zfs_create_cb;
3176 3176 break;
3177 3177
3178 3178 case DMU_OST_ZVOL:
3179 3179 cbfunc = zvol_create_cb;
3180 3180 break;
3181 3181
3182 3182 default:
3183 3183 cbfunc = NULL;
3184 3184 break;
3185 3185 }
3186 3186 if (strchr(fsname, '@') ||
3187 3187 strchr(fsname, '%'))
3188 3188 return (SET_ERROR(EINVAL));
3189 3189
3190 3190 zct.zct_props = nvprops;
3191 3191
3192 3192 if (cbfunc == NULL)
3193 3193 return (SET_ERROR(EINVAL));
3194 3194
3195 3195 if (type == DMU_OST_ZVOL) {
3196 3196 uint64_t volsize, volblocksize;
3197 3197
3198 3198 if (nvprops == NULL)
3199 3199 return (SET_ERROR(EINVAL));
3200 3200 if (nvlist_lookup_uint64(nvprops,
3201 3201 zfs_prop_to_name(ZFS_PROP_VOLSIZE), &volsize) != 0)
3202 3202 return (SET_ERROR(EINVAL));
3203 3203
3204 3204 if ((error = nvlist_lookup_uint64(nvprops,
3205 3205 zfs_prop_to_name(ZFS_PROP_VOLBLOCKSIZE),
3206 3206 &volblocksize)) != 0 && error != ENOENT)
3207 3207 return (SET_ERROR(EINVAL));
3208 3208
3209 3209 if (error != 0)
3210 3210 volblocksize = zfs_prop_default_numeric(
3211 3211 ZFS_PROP_VOLBLOCKSIZE);
3212 3212
3213 3213 if ((error = zvol_check_volblocksize(
3214 3214 volblocksize)) != 0 ||
3215 3215 (error = zvol_check_volsize(volsize,
3216 3216 volblocksize)) != 0)
3217 3217 return (error);
3218 3218 } else if (type == DMU_OST_ZFS) {
3219 3219 int error;
3220 3220
3221 3221 /*
3222 3222 * We have to have normalization and
3223 3223 * case-folding flags correct when we do the
3224 3224 * file system creation, so go figure them out
3225 3225 * now.
3226 3226 */
3227 3227 VERIFY(nvlist_alloc(&zct.zct_zplprops,
3228 3228 NV_UNIQUE_NAME, KM_SLEEP) == 0);
3229 3229 error = zfs_fill_zplprops(fsname, nvprops,
3230 3230 zct.zct_zplprops, &is_insensitive);
3231 3231 if (error != 0) {
3232 3232 nvlist_free(zct.zct_zplprops);
3233 3233 return (error);
3234 3234 }
3235 3235 }
3236 3236
3237 3237 error = dmu_objset_create(fsname, type,
3238 3238 is_insensitive ? DS_FLAG_CI_DATASET : 0, cbfunc, &zct);
3239 3239 nvlist_free(zct.zct_zplprops);
3240 3240
3241 3241 /*
3242 3242 * It would be nice to do this atomically.
3243 3243 */
3244 3244 if (error == 0) {
3245 3245 error = zfs_set_prop_nvlist(fsname, ZPROP_SRC_LOCAL,
3246 3246 nvprops, outnvl);
3247 3247 if (error != 0)
3248 3248 (void) dsl_destroy_head(fsname);
3249 3249 }
3250 3250 return (error);
3251 3251 }
3252 3252
3253 3253 /*
3254 3254 * innvl: {
3255 3255 * "origin" -> name of origin snapshot
3256 3256 * (optional) "props" -> { prop -> value }
3257 3257 * }
3258 3258 *
3259 3259 * outnvl: propname -> error code (int32)
3260 3260 */
3261 3261 static int
3262 3262 zfs_ioc_clone(const char *fsname, nvlist_t *innvl, nvlist_t *outnvl)
3263 3263 {
3264 3264 int error = 0;
3265 3265 nvlist_t *nvprops = NULL;
3266 3266 char *origin_name;
3267 3267
3268 3268 if (nvlist_lookup_string(innvl, "origin", &origin_name) != 0)
3269 3269 return (SET_ERROR(EINVAL));
3270 3270 (void) nvlist_lookup_nvlist(innvl, "props", &nvprops);
3271 3271
3272 3272 if (strchr(fsname, '@') ||
3273 3273 strchr(fsname, '%'))
3274 3274 return (SET_ERROR(EINVAL));
3275 3275
3276 3276 if (dataset_namecheck(origin_name, NULL, NULL) != 0)
3277 3277 return (SET_ERROR(EINVAL));
3278 3278 error = dmu_objset_clone(fsname, origin_name);
3279 3279 if (error != 0)
3280 3280 return (error);
3281 3281
3282 3282 /*
3283 3283 * It would be nice to do this atomically.
3284 3284 */
3285 3285 if (error == 0) {
3286 3286 error = zfs_set_prop_nvlist(fsname, ZPROP_SRC_LOCAL,
3287 3287 nvprops, outnvl);
3288 3288 if (error != 0)
3289 3289 (void) dsl_destroy_head(fsname);
3290 3290 }
3291 3291 return (error);
3292 3292 }
3293 3293
3294 3294 /*
3295 3295 * innvl: {
3296 3296 * "snaps" -> { snapshot1, snapshot2 }
3297 3297 * (optional) "props" -> { prop -> value (string) }
3298 3298 * }
3299 3299 *
3300 3300 * outnvl: snapshot -> error code (int32)
3301 3301 */
3302 3302 static int
3303 3303 zfs_ioc_snapshot(const char *poolname, nvlist_t *innvl, nvlist_t *outnvl)
3304 3304 {
3305 3305 nvlist_t *snaps;
3306 3306 nvlist_t *props = NULL;
3307 3307 int error, poollen;
3308 3308 nvpair_t *pair;
3309 3309
3310 3310 (void) nvlist_lookup_nvlist(innvl, "props", &props);
3311 3311 if ((error = zfs_check_userprops(poolname, props)) != 0)
3312 3312 return (error);
3313 3313
3314 3314 if (!nvlist_empty(props) &&
3315 3315 zfs_earlier_version(poolname, SPA_VERSION_SNAP_PROPS))
3316 3316 return (SET_ERROR(ENOTSUP));
3317 3317
3318 3318 if (nvlist_lookup_nvlist(innvl, "snaps", &snaps) != 0)
3319 3319 return (SET_ERROR(EINVAL));
3320 3320 poollen = strlen(poolname);
3321 3321 for (pair = nvlist_next_nvpair(snaps, NULL); pair != NULL;
3322 3322 pair = nvlist_next_nvpair(snaps, pair)) {
3323 3323 const char *name = nvpair_name(pair);
3324 3324 const char *cp = strchr(name, '@');
3325 3325
3326 3326 /*
3327 3327 * The snap name must contain an @, and the part after it must
3328 3328 * contain only valid characters.
3329 3329 */
3330 3330 if (cp == NULL ||
3331 3331 zfs_component_namecheck(cp + 1, NULL, NULL) != 0)
3332 3332 return (SET_ERROR(EINVAL));
3333 3333
3334 3334 /*
3335 3335 * The snap must be in the specified pool.
3336 3336 */
3337 3337 if (strncmp(name, poolname, poollen) != 0 ||
3338 3338 (name[poollen] != '/' && name[poollen] != '@'))
3339 3339 return (SET_ERROR(EXDEV));
3340 3340
3341 3341 /* This must be the only snap of this fs. */
3342 3342 for (nvpair_t *pair2 = nvlist_next_nvpair(snaps, pair);
3343 3343 pair2 != NULL; pair2 = nvlist_next_nvpair(snaps, pair2)) {
3344 3344 if (strncmp(name, nvpair_name(pair2), cp - name + 1)
3345 3345 == 0) {
3346 3346 return (SET_ERROR(EXDEV));
3347 3347 }
3348 3348 }
3349 3349 }
3350 3350
3351 3351 error = dsl_dataset_snapshot(snaps, props, outnvl);
3352 3352 return (error);
3353 3353 }
3354 3354
3355 3355 /*
3356 3356 * innvl: "message" -> string
3357 3357 */
3358 3358 /* ARGSUSED */
3359 3359 static int
3360 3360 zfs_ioc_log_history(const char *unused, nvlist_t *innvl, nvlist_t *outnvl)
3361 3361 {
3362 3362 char *message;
3363 3363 spa_t *spa;
3364 3364 int error;
3365 3365 char *poolname;
3366 3366
3367 3367 /*
3368 3368 * The poolname in the ioctl is not set, we get it from the TSD,
3369 3369 * which was set at the end of the last successful ioctl that allows
3370 3370 * logging. The secpolicy func already checked that it is set.
3371 3371 * Only one log ioctl is allowed after each successful ioctl, so
3372 3372 * we clear the TSD here.
3373 3373 */
3374 3374 poolname = tsd_get(zfs_allow_log_key);
3375 3375 (void) tsd_set(zfs_allow_log_key, NULL);
3376 3376 error = spa_open(poolname, &spa, FTAG);
3377 3377 strfree(poolname);
3378 3378 if (error != 0)
3379 3379 return (error);
3380 3380
3381 3381 if (nvlist_lookup_string(innvl, "message", &message) != 0) {
3382 3382 spa_close(spa, FTAG);
3383 3383 return (SET_ERROR(EINVAL));
3384 3384 }
3385 3385
3386 3386 if (spa_version(spa) < SPA_VERSION_ZPOOL_HISTORY) {
3387 3387 spa_close(spa, FTAG);
3388 3388 return (SET_ERROR(ENOTSUP));
3389 3389 }
3390 3390
3391 3391 error = spa_history_log(spa, message);
3392 3392 spa_close(spa, FTAG);
3393 3393 return (error);
3394 3394 }
3395 3395
3396 3396 /*
3397 3397 * The dp_config_rwlock must not be held when calling this, because the
3398 3398 * unmount may need to write out data.
3399 3399 *
3400 3400 * This function is best-effort. Callers must deal gracefully if it
3401 3401 * remains mounted (or is remounted after this call).
3402 3402 *
3403 3403 * Returns 0 if the argument is not a snapshot, or it is not currently a
3404 3404 * filesystem, or we were able to unmount it. Returns error code otherwise.
3405 3405 */
3406 3406 int
3407 3407 zfs_unmount_snap(const char *snapname)
3408 3408 {
3409 3409 vfs_t *vfsp;
3410 3410 zfsvfs_t *zfsvfs;
3411 3411 int err;
3412 3412
3413 3413 if (strchr(snapname, '@') == NULL)
3414 3414 return (0);
3415 3415
3416 3416 vfsp = zfs_get_vfs(snapname);
3417 3417 if (vfsp == NULL)
3418 3418 return (0);
3419 3419
3420 3420 zfsvfs = vfsp->vfs_data;
3421 3421 ASSERT(!dsl_pool_config_held(dmu_objset_pool(zfsvfs->z_os)));
3422 3422
3423 3423 err = vn_vfswlock(vfsp->vfs_vnodecovered);
3424 3424 VFS_RELE(vfsp);
3425 3425 if (err != 0)
3426 3426 return (SET_ERROR(err));
3427 3427
3428 3428 /*
3429 3429 * Always force the unmount for snapshots.
3430 3430 */
3431 3431 (void) dounmount(vfsp, MS_FORCE, kcred);
3432 3432 return (0);
3433 3433 }
3434 3434
3435 3435 /* ARGSUSED */
3436 3436 static int
3437 3437 zfs_unmount_snap_cb(const char *snapname, void *arg)
3438 3438 {
3439 3439 return (zfs_unmount_snap(snapname));
3440 3440 }
3441 3441
3442 3442 /*
3443 3443 * When a clone is destroyed, its origin may also need to be destroyed,
3444 3444 * in which case it must be unmounted. This routine will do that unmount
3445 3445 * if necessary.
3446 3446 */
3447 3447 void
3448 3448 zfs_destroy_unmount_origin(const char *fsname)
3449 3449 {
3450 3450 int error;
3451 3451 objset_t *os;
3452 3452 dsl_dataset_t *ds;
3453 3453
3454 3454 error = dmu_objset_hold(fsname, FTAG, &os);
3455 3455 if (error != 0)
3456 3456 return;
3457 3457 ds = dmu_objset_ds(os);
3458 3458 if (dsl_dir_is_clone(ds->ds_dir) && DS_IS_DEFER_DESTROY(ds->ds_prev)) {
3459 3459 char originname[MAXNAMELEN];
3460 3460 dsl_dataset_name(ds->ds_prev, originname);
3461 3461 dmu_objset_rele(os, FTAG);
3462 3462 (void) zfs_unmount_snap(originname);
3463 3463 } else {
3464 3464 dmu_objset_rele(os, FTAG);
3465 3465 }
3466 3466 }
3467 3467
3468 3468 /*
3469 3469 * innvl: {
3470 3470 * "snaps" -> { snapshot1, snapshot2 }
3471 3471 * (optional boolean) "defer"
3472 3472 * }
3473 3473 *
3474 3474 * outnvl: snapshot -> error code (int32)
3475 3475 *
3476 3476 */
3477 3477 /* ARGSUSED */
3478 3478 static int
3479 3479 zfs_ioc_destroy_snaps(const char *poolname, nvlist_t *innvl, nvlist_t *outnvl)
3480 3480 {
3481 3481 nvlist_t *snaps;
3482 3482 nvpair_t *pair;
3483 3483 boolean_t defer;
3484 3484
3485 3485 if (nvlist_lookup_nvlist(innvl, "snaps", &snaps) != 0)
3486 3486 return (SET_ERROR(EINVAL));
3487 3487 defer = nvlist_exists(innvl, "defer");
3488 3488
3489 3489 for (pair = nvlist_next_nvpair(snaps, NULL); pair != NULL;
3490 3490 pair = nvlist_next_nvpair(snaps, pair)) {
3491 3491 (void) zfs_unmount_snap(nvpair_name(pair));
3492 3492 }
3493 3493
3494 3494 return (dsl_destroy_snapshots_nvl(snaps, defer, outnvl));
3495 3495 }
3496 3496
3497 3497 /*
3498 3498 * Create bookmarks. Bookmark names are of the form <fs>#<bmark>.
3499 3499 * All bookmarks must be in the same pool.
3500 3500 *
3501 3501 * innvl: {
3502 3502 * bookmark1 -> snapshot1, bookmark2 -> snapshot2
3503 3503 * }
3504 3504 *
3505 3505 * outnvl: bookmark -> error code (int32)
3506 3506 *
3507 3507 */
3508 3508 /* ARGSUSED */
3509 3509 static int
3510 3510 zfs_ioc_bookmark(const char *poolname, nvlist_t *innvl, nvlist_t *outnvl)
3511 3511 {
3512 3512 for (nvpair_t *pair = nvlist_next_nvpair(innvl, NULL);
3513 3513 pair != NULL; pair = nvlist_next_nvpair(innvl, pair)) {
3514 3514 char *snap_name;
3515 3515
3516 3516 /*
3517 3517 * Verify the snapshot argument.
3518 3518 */
3519 3519 if (nvpair_value_string(pair, &snap_name) != 0)
3520 3520 return (SET_ERROR(EINVAL));
3521 3521
3522 3522
3523 3523 /* Verify that the keys (bookmarks) are unique */
3524 3524 for (nvpair_t *pair2 = nvlist_next_nvpair(innvl, pair);
3525 3525 pair2 != NULL; pair2 = nvlist_next_nvpair(innvl, pair2)) {
3526 3526 if (strcmp(nvpair_name(pair), nvpair_name(pair2)) == 0)
3527 3527 return (SET_ERROR(EINVAL));
3528 3528 }
3529 3529 }
3530 3530
3531 3531 return (dsl_bookmark_create(innvl, outnvl));
3532 3532 }
3533 3533
3534 3534 /*
3535 3535 * innvl: {
3536 3536 * property 1, property 2, ...
3537 3537 * }
3538 3538 *
3539 3539 * outnvl: {
3540 3540 * bookmark name 1 -> { property 1, property 2, ... },
3541 3541 * bookmark name 2 -> { property 1, property 2, ... }
3542 3542 * }
3543 3543 *
3544 3544 */
3545 3545 static int
3546 3546 zfs_ioc_get_bookmarks(const char *fsname, nvlist_t *innvl, nvlist_t *outnvl)
3547 3547 {
3548 3548 return (dsl_get_bookmarks(fsname, innvl, outnvl));
3549 3549 }
3550 3550
3551 3551 /*
3552 3552 * innvl: {
3553 3553 * bookmark name 1, bookmark name 2
3554 3554 * }
3555 3555 *
3556 3556 * outnvl: bookmark -> error code (int32)
3557 3557 *
3558 3558 */
3559 3559 static int
3560 3560 zfs_ioc_destroy_bookmarks(const char *poolname, nvlist_t *innvl,
3561 3561 nvlist_t *outnvl)
3562 3562 {
3563 3563 int error, poollen;
3564 3564
3565 3565 poollen = strlen(poolname);
3566 3566 for (nvpair_t *pair = nvlist_next_nvpair(innvl, NULL);
3567 3567 pair != NULL; pair = nvlist_next_nvpair(innvl, pair)) {
3568 3568 const char *name = nvpair_name(pair);
3569 3569 const char *cp = strchr(name, '#');
3570 3570
3571 3571 /*
3572 3572 * The bookmark name must contain an #, and the part after it
3573 3573 * must contain only valid characters.
3574 3574 */
3575 3575 if (cp == NULL ||
3576 3576 zfs_component_namecheck(cp + 1, NULL, NULL) != 0)
3577 3577 return (SET_ERROR(EINVAL));
3578 3578
3579 3579 /*
3580 3580 * The bookmark must be in the specified pool.
3581 3581 */
3582 3582 if (strncmp(name, poolname, poollen) != 0 ||
3583 3583 (name[poollen] != '/' && name[poollen] != '#'))
3584 3584 return (SET_ERROR(EXDEV));
3585 3585 }
3586 3586
3587 3587 error = dsl_bookmark_destroy(innvl, outnvl);
3588 3588 return (error);
3589 3589 }
3590 3590
3591 3591 /*
3592 3592 * inputs:
3593 3593 * zc_name name of dataset to destroy
3594 3594 * zc_objset_type type of objset
3595 3595 * zc_defer_destroy mark for deferred destroy
3596 3596 *
3597 3597 * outputs: none
3598 3598 */
3599 3599 static int
3600 3600 zfs_ioc_destroy(zfs_cmd_t *zc)
3601 3601 {
3602 3602 int err;
3603 3603
3604 3604 if (zc->zc_objset_type == DMU_OST_ZFS) {
3605 3605 err = zfs_unmount_snap(zc->zc_name);
3606 3606 if (err != 0)
3607 3607 return (err);
3608 3608 }
3609 3609
3610 3610 if (strchr(zc->zc_name, '@'))
3611 3611 err = dsl_destroy_snapshot(zc->zc_name, zc->zc_defer_destroy);
3612 3612 else
3613 3613 err = dsl_destroy_head(zc->zc_name);
3614 3614 if (zc->zc_objset_type == DMU_OST_ZVOL && err == 0)
3615 3615 (void) zvol_remove_minor(zc->zc_name);
3616 3616 return (err);
3617 3617 }
3618 3618
3619 3619 /*
3620 3620 * fsname is name of dataset to rollback (to most recent snapshot)
3621 3621 *
3622 3622 * innvl is not used.
3623 3623 *
3624 3624 * outnvl: "target" -> name of most recent snapshot
3625 3625 * }
3626 3626 */
3627 3627 /* ARGSUSED */
3628 3628 static int
3629 3629 zfs_ioc_rollback(const char *fsname, nvlist_t *args, nvlist_t *outnvl)
3630 3630 {
3631 3631 zfsvfs_t *zfsvfs;
3632 3632 int error;
3633 3633
3634 3634 if (getzfsvfs(fsname, &zfsvfs) == 0) {
3635 3635 error = zfs_suspend_fs(zfsvfs);
3636 3636 if (error == 0) {
3637 3637 int resume_err;
3638 3638
3639 3639 error = dsl_dataset_rollback(fsname, zfsvfs, outnvl);
3640 3640 resume_err = zfs_resume_fs(zfsvfs, fsname);
3641 3641 error = error ? error : resume_err;
3642 3642 }
3643 3643 VFS_RELE(zfsvfs->z_vfs);
3644 3644 } else {
3645 3645 error = dsl_dataset_rollback(fsname, NULL, outnvl);
3646 3646 }
3647 3647 return (error);
3648 3648 }
3649 3649
3650 3650 static int
3651 3651 recursive_unmount(const char *fsname, void *arg)
3652 3652 {
3653 3653 const char *snapname = arg;
3654 3654 char fullname[MAXNAMELEN];
3655 3655
3656 3656 (void) snprintf(fullname, sizeof (fullname), "%s@%s", fsname, snapname);
3657 3657 return (zfs_unmount_snap(fullname));
3658 3658 }
3659 3659
3660 3660 /*
3661 3661 * inputs:
3662 3662 * zc_name old name of dataset
3663 3663 * zc_value new name of dataset
3664 3664 * zc_cookie recursive flag (only valid for snapshots)
3665 3665 *
3666 3666 * outputs: none
3667 3667 */
3668 3668 static int
3669 3669 zfs_ioc_rename(zfs_cmd_t *zc)
3670 3670 {
3671 3671 boolean_t recursive = zc->zc_cookie & 1;
3672 3672 char *at;
3673 3673
3674 3674 zc->zc_value[sizeof (zc->zc_value) - 1] = '\0';
3675 3675 if (dataset_namecheck(zc->zc_value, NULL, NULL) != 0 ||
3676 3676 strchr(zc->zc_value, '%'))
3677 3677 return (SET_ERROR(EINVAL));
3678 3678
3679 3679 at = strchr(zc->zc_name, '@');
3680 3680 if (at != NULL) {
3681 3681 /* snaps must be in same fs */
3682 3682 int error;
3683 3683
3684 3684 if (strncmp(zc->zc_name, zc->zc_value, at - zc->zc_name + 1))
3685 3685 return (SET_ERROR(EXDEV));
3686 3686 *at = '\0';
3687 3687 if (zc->zc_objset_type == DMU_OST_ZFS) {
3688 3688 error = dmu_objset_find(zc->zc_name,
3689 3689 recursive_unmount, at + 1,
3690 3690 recursive ? DS_FIND_CHILDREN : 0);
3691 3691 if (error != 0) {
3692 3692 *at = '@';
3693 3693 return (error);
3694 3694 }
3695 3695 }
3696 3696 error = dsl_dataset_rename_snapshot(zc->zc_name,
3697 3697 at + 1, strchr(zc->zc_value, '@') + 1, recursive);
3698 3698 *at = '@';
3699 3699
3700 3700 return (error);
3701 3701 } else {
3702 3702 if (zc->zc_objset_type == DMU_OST_ZVOL)
3703 3703 (void) zvol_remove_minor(zc->zc_name);
3704 3704 return (dsl_dir_rename(zc->zc_name, zc->zc_value));
3705 3705 }
3706 3706 }
3707 3707
3708 3708 static int
3709 3709 zfs_check_settable(const char *dsname, nvpair_t *pair, cred_t *cr)
3710 3710 {
3711 3711 const char *propname = nvpair_name(pair);
3712 3712 boolean_t issnap = (strchr(dsname, '@') != NULL);
3713 3713 zfs_prop_t prop = zfs_name_to_prop(propname);
3714 3714 uint64_t intval;
3715 3715 int err;
3716 3716
3717 3717 if (prop == ZPROP_INVAL) {
3718 3718 if (zfs_prop_user(propname)) {
3719 3719 if (err = zfs_secpolicy_write_perms(dsname,
3720 3720 ZFS_DELEG_PERM_USERPROP, cr))
3721 3721 return (err);
3722 3722 return (0);
3723 3723 }
3724 3724
3725 3725 if (!issnap && zfs_prop_userquota(propname)) {
3726 3726 const char *perm = NULL;
3727 3727 const char *uq_prefix =
3728 3728 zfs_userquota_prop_prefixes[ZFS_PROP_USERQUOTA];
3729 3729 const char *gq_prefix =
3730 3730 zfs_userquota_prop_prefixes[ZFS_PROP_GROUPQUOTA];
3731 3731
3732 3732 if (strncmp(propname, uq_prefix,
3733 3733 strlen(uq_prefix)) == 0) {
3734 3734 perm = ZFS_DELEG_PERM_USERQUOTA;
3735 3735 } else if (strncmp(propname, gq_prefix,
3736 3736 strlen(gq_prefix)) == 0) {
3737 3737 perm = ZFS_DELEG_PERM_GROUPQUOTA;
3738 3738 } else {
3739 3739 /* USERUSED and GROUPUSED are read-only */
3740 3740 return (SET_ERROR(EINVAL));
3741 3741 }
3742 3742
3743 3743 if (err = zfs_secpolicy_write_perms(dsname, perm, cr))
3744 3744 return (err);
3745 3745 return (0);
3746 3746 }
3747 3747
3748 3748 return (SET_ERROR(EINVAL));
3749 3749 }
3750 3750
3751 3751 if (issnap)
3752 3752 return (SET_ERROR(EINVAL));
3753 3753
3754 3754 if (nvpair_type(pair) == DATA_TYPE_NVLIST) {
3755 3755 /*
3756 3756 * dsl_prop_get_all_impl() returns properties in this
3757 3757 * format.
3758 3758 */
3759 3759 nvlist_t *attrs;
3760 3760 VERIFY(nvpair_value_nvlist(pair, &attrs) == 0);
3761 3761 VERIFY(nvlist_lookup_nvpair(attrs, ZPROP_VALUE,
3762 3762 &pair) == 0);
3763 3763 }
3764 3764
3765 3765 /*
3766 3766 * Check that this value is valid for this pool version
3767 3767 */
3768 3768 switch (prop) {
3769 3769 case ZFS_PROP_COMPRESSION:
3770 3770 /*
3771 3771 * If the user specified gzip compression, make sure
3772 3772 * the SPA supports it. We ignore any errors here since
3773 3773 * we'll catch them later.
3774 3774 */
3775 3775 if (nvpair_value_uint64(pair, &intval) == 0) {
3776 3776 if (intval >= ZIO_COMPRESS_GZIP_1 &&
3777 3777 intval <= ZIO_COMPRESS_GZIP_9 &&
3778 3778 zfs_earlier_version(dsname,
3779 3779 SPA_VERSION_GZIP_COMPRESSION)) {
3780 3780 return (SET_ERROR(ENOTSUP));
3781 3781 }
3782 3782
3783 3783 if (intval == ZIO_COMPRESS_ZLE &&
3784 3784 zfs_earlier_version(dsname,
3785 3785 SPA_VERSION_ZLE_COMPRESSION))
3786 3786 return (SET_ERROR(ENOTSUP));
3787 3787
3788 3788 if (intval == ZIO_COMPRESS_LZ4) {
3789 3789 spa_t *spa;
3790 3790
3791 3791 if ((err = spa_open(dsname, &spa, FTAG)) != 0)
3792 3792 return (err);
3793 3793
3794 3794 if (!spa_feature_is_enabled(spa,
3795 3795 SPA_FEATURE_LZ4_COMPRESS)) {
3796 3796 spa_close(spa, FTAG);
3797 3797 return (SET_ERROR(ENOTSUP));
3798 3798 }
3799 3799 spa_close(spa, FTAG);
3800 3800 }
3801 3801
3802 3802 /*
3803 3803 * If this is a bootable dataset then
3804 3804 * verify that the compression algorithm
3805 3805 * is supported for booting. We must return
3806 3806 * something other than ENOTSUP since it
3807 3807 * implies a downrev pool version.
3808 3808 */
3809 3809 if (zfs_is_bootfs(dsname) &&
3810 3810 !BOOTFS_COMPRESS_VALID(intval)) {
3811 3811 return (SET_ERROR(ERANGE));
3812 3812 }
3813 3813 }
3814 3814 break;
3815 3815
3816 3816 case ZFS_PROP_COPIES:
3817 3817 if (zfs_earlier_version(dsname, SPA_VERSION_DITTO_BLOCKS))
3818 3818 return (SET_ERROR(ENOTSUP));
3819 3819 break;
3820 3820
3821 3821 case ZFS_PROP_RECORDSIZE:
3822 3822 /* Record sizes above 128k need the feature to be enabled */
3823 3823 if (nvpair_value_uint64(pair, &intval) == 0 &&
3824 3824 intval > SPA_OLD_MAXBLOCKSIZE) {
3825 3825 spa_t *spa;
3826 3826
3827 3827 /*
3828 3828 * If this is a bootable dataset then
3829 3829 * the we don't allow large (>128K) blocks,
3830 3830 * because GRUB doesn't support them.
3831 3831 */
3832 3832 if (zfs_is_bootfs(dsname) &&
3833 3833 intval > SPA_OLD_MAXBLOCKSIZE) {
3834 3834 return (SET_ERROR(ERANGE));
3835 3835 }
3836 3836
3837 3837 /*
3838 3838 * We don't allow setting the property above 1MB,
3839 3839 * unless the tunable has been changed.
3840 3840 */
3841 3841 if (intval > zfs_max_recordsize ||
3842 3842 intval > SPA_MAXBLOCKSIZE)
3843 3843 return (SET_ERROR(ERANGE));
3844 3844
3845 3845 if ((err = spa_open(dsname, &spa, FTAG)) != 0)
3846 3846 return (err);
3847 3847
3848 3848 if (!spa_feature_is_enabled(spa,
3849 3849 SPA_FEATURE_LARGE_BLOCKS)) {
3850 3850 spa_close(spa, FTAG);
3851 3851 return (SET_ERROR(ENOTSUP));
3852 3852 }
3853 3853 spa_close(spa, FTAG);
3854 3854 }
3855 3855 break;
3856 3856
3857 3857 case ZFS_PROP_SHARESMB:
3858 3858 if (zpl_earlier_version(dsname, ZPL_VERSION_FUID))
3859 3859 return (SET_ERROR(ENOTSUP));
3860 3860 break;
3861 3861
3862 3862 case ZFS_PROP_ACLINHERIT:
3863 3863 if (nvpair_type(pair) == DATA_TYPE_UINT64 &&
3864 3864 nvpair_value_uint64(pair, &intval) == 0) {
3865 3865 if (intval == ZFS_ACL_PASSTHROUGH_X &&
3866 3866 zfs_earlier_version(dsname,
3867 3867 SPA_VERSION_PASSTHROUGH_X))
3868 3868 return (SET_ERROR(ENOTSUP));
3869 3869 }
3870 3870 break;
3871 3871
3872 3872 case ZFS_PROP_CHECKSUM:
3873 3873 case ZFS_PROP_DEDUP:
3874 3874 {
3875 3875 spa_feature_t feature;
3876 3876 spa_t *spa;
3877 3877
3878 3878 /* dedup feature version checks */
3879 3879 if (prop == ZFS_PROP_DEDUP &&
3880 3880 zfs_earlier_version(dsname, SPA_VERSION_DEDUP))
3881 3881 return (SET_ERROR(ENOTSUP));
3882 3882
3883 3883 if (nvpair_value_uint64(pair, &intval) != 0)
3884 3884 return (SET_ERROR(EINVAL));
3885 3885
3886 3886 /* check prop value is enabled in features */
3887 3887 feature = zio_checksum_to_feature(intval);
3888 3888 if (feature == SPA_FEATURE_NONE)
3889 3889 break;
3890 3890
3891 3891 if ((err = spa_open(dsname, &spa, FTAG)) != 0)
3892 3892 return (err);
3893 3893 /*
3894 3894 * Salted checksums are not supported on root pools.
3895 3895 */
3896 3896 if (spa_bootfs(spa) != 0 &&
3897 3897 intval < ZIO_CHECKSUM_FUNCTIONS &&
3898 3898 (zio_checksum_table[intval].ci_flags &
3899 3899 ZCHECKSUM_FLAG_SALTED)) {
3900 3900 spa_close(spa, FTAG);
3901 3901 return (SET_ERROR(ERANGE));
3902 3902 }
3903 3903 if (!spa_feature_is_enabled(spa, feature)) {
3904 3904 spa_close(spa, FTAG);
3905 3905 return (SET_ERROR(ENOTSUP));
3906 3906 }
3907 3907 spa_close(spa, FTAG);
3908 3908 break;
3909 3909 }
3910 3910 }
3911 3911
3912 3912 return (zfs_secpolicy_setprop(dsname, prop, pair, CRED()));
3913 3913 }
3914 3914
3915 3915 /*
3916 3916 * Checks for a race condition to make sure we don't increment a feature flag
3917 3917 * multiple times.
3918 3918 */
3919 3919 static int
3920 3920 zfs_prop_activate_feature_check(void *arg, dmu_tx_t *tx)
3921 3921 {
3922 3922 spa_t *spa = dmu_tx_pool(tx)->dp_spa;
3923 3923 spa_feature_t *featurep = arg;
3924 3924
3925 3925 if (!spa_feature_is_active(spa, *featurep))
3926 3926 return (0);
3927 3927 else
3928 3928 return (SET_ERROR(EBUSY));
3929 3929 }
3930 3930
3931 3931 /*
3932 3932 * The callback invoked on feature activation in the sync task caused by
3933 3933 * zfs_prop_activate_feature.
3934 3934 */
3935 3935 static void
3936 3936 zfs_prop_activate_feature_sync(void *arg, dmu_tx_t *tx)
3937 3937 {
3938 3938 spa_t *spa = dmu_tx_pool(tx)->dp_spa;
3939 3939 spa_feature_t *featurep = arg;
3940 3940
3941 3941 spa_feature_incr(spa, *featurep, tx);
3942 3942 }
3943 3943
3944 3944 /*
3945 3945 * Activates a feature on a pool in response to a property setting. This
3946 3946 * creates a new sync task which modifies the pool to reflect the feature
3947 3947 * as being active.
3948 3948 */
3949 3949 static int
3950 3950 zfs_prop_activate_feature(spa_t *spa, spa_feature_t feature)
3951 3951 {
3952 3952 int err;
3953 3953
3954 3954 /* EBUSY here indicates that the feature is already active */
3955 3955 err = dsl_sync_task(spa_name(spa),
3956 3956 zfs_prop_activate_feature_check, zfs_prop_activate_feature_sync,
3957 3957 &feature, 2, ZFS_SPACE_CHECK_RESERVED);
3958 3958
3959 3959 if (err != 0 && err != EBUSY)
3960 3960 return (err);
3961 3961 else
3962 3962 return (0);
3963 3963 }
3964 3964
3965 3965 /*
3966 3966 * Removes properties from the given props list that fail permission checks
3967 3967 * needed to clear them and to restore them in case of a receive error. For each
3968 3968 * property, make sure we have both set and inherit permissions.
3969 3969 *
3970 3970 * Returns the first error encountered if any permission checks fail. If the
3971 3971 * caller provides a non-NULL errlist, it also gives the complete list of names
3972 3972 * of all the properties that failed a permission check along with the
3973 3973 * corresponding error numbers. The caller is responsible for freeing the
3974 3974 * returned errlist.
3975 3975 *
3976 3976 * If every property checks out successfully, zero is returned and the list
3977 3977 * pointed at by errlist is NULL.
3978 3978 */
3979 3979 static int
3980 3980 zfs_check_clearable(char *dataset, nvlist_t *props, nvlist_t **errlist)
3981 3981 {
3982 3982 zfs_cmd_t *zc;
3983 3983 nvpair_t *pair, *next_pair;
3984 3984 nvlist_t *errors;
3985 3985 int err, rv = 0;
3986 3986
3987 3987 if (props == NULL)
3988 3988 return (0);
3989 3989
3990 3990 VERIFY(nvlist_alloc(&errors, NV_UNIQUE_NAME, KM_SLEEP) == 0);
3991 3991
3992 3992 zc = kmem_alloc(sizeof (zfs_cmd_t), KM_SLEEP);
3993 3993 (void) strcpy(zc->zc_name, dataset);
3994 3994 pair = nvlist_next_nvpair(props, NULL);
3995 3995 while (pair != NULL) {
3996 3996 next_pair = nvlist_next_nvpair(props, pair);
3997 3997
3998 3998 (void) strcpy(zc->zc_value, nvpair_name(pair));
3999 3999 if ((err = zfs_check_settable(dataset, pair, CRED())) != 0 ||
4000 4000 (err = zfs_secpolicy_inherit_prop(zc, NULL, CRED())) != 0) {
4001 4001 VERIFY(nvlist_remove_nvpair(props, pair) == 0);
4002 4002 VERIFY(nvlist_add_int32(errors,
4003 4003 zc->zc_value, err) == 0);
4004 4004 }
4005 4005 pair = next_pair;
4006 4006 }
4007 4007 kmem_free(zc, sizeof (zfs_cmd_t));
4008 4008
4009 4009 if ((pair = nvlist_next_nvpair(errors, NULL)) == NULL) {
4010 4010 nvlist_free(errors);
4011 4011 errors = NULL;
4012 4012 } else {
4013 4013 VERIFY(nvpair_value_int32(pair, &rv) == 0);
4014 4014 }
4015 4015
4016 4016 if (errlist == NULL)
4017 4017 nvlist_free(errors);
4018 4018 else
4019 4019 *errlist = errors;
4020 4020
4021 4021 return (rv);
4022 4022 }
4023 4023
4024 4024 static boolean_t
4025 4025 propval_equals(nvpair_t *p1, nvpair_t *p2)
4026 4026 {
4027 4027 if (nvpair_type(p1) == DATA_TYPE_NVLIST) {
4028 4028 /* dsl_prop_get_all_impl() format */
4029 4029 nvlist_t *attrs;
4030 4030 VERIFY(nvpair_value_nvlist(p1, &attrs) == 0);
4031 4031 VERIFY(nvlist_lookup_nvpair(attrs, ZPROP_VALUE,
4032 4032 &p1) == 0);
4033 4033 }
4034 4034
4035 4035 if (nvpair_type(p2) == DATA_TYPE_NVLIST) {
4036 4036 nvlist_t *attrs;
4037 4037 VERIFY(nvpair_value_nvlist(p2, &attrs) == 0);
4038 4038 VERIFY(nvlist_lookup_nvpair(attrs, ZPROP_VALUE,
4039 4039 &p2) == 0);
4040 4040 }
4041 4041
4042 4042 if (nvpair_type(p1) != nvpair_type(p2))
4043 4043 return (B_FALSE);
4044 4044
4045 4045 if (nvpair_type(p1) == DATA_TYPE_STRING) {
4046 4046 char *valstr1, *valstr2;
4047 4047
4048 4048 VERIFY(nvpair_value_string(p1, (char **)&valstr1) == 0);
4049 4049 VERIFY(nvpair_value_string(p2, (char **)&valstr2) == 0);
4050 4050 return (strcmp(valstr1, valstr2) == 0);
4051 4051 } else {
4052 4052 uint64_t intval1, intval2;
4053 4053
4054 4054 VERIFY(nvpair_value_uint64(p1, &intval1) == 0);
4055 4055 VERIFY(nvpair_value_uint64(p2, &intval2) == 0);
4056 4056 return (intval1 == intval2);
4057 4057 }
4058 4058 }
4059 4059
4060 4060 /*
4061 4061 * Remove properties from props if they are not going to change (as determined
4062 4062 * by comparison with origprops). Remove them from origprops as well, since we
4063 4063 * do not need to clear or restore properties that won't change.
4064 4064 */
4065 4065 static void
4066 4066 props_reduce(nvlist_t *props, nvlist_t *origprops)
4067 4067 {
4068 4068 nvpair_t *pair, *next_pair;
4069 4069
4070 4070 if (origprops == NULL)
4071 4071 return; /* all props need to be received */
4072 4072
4073 4073 pair = nvlist_next_nvpair(props, NULL);
4074 4074 while (pair != NULL) {
4075 4075 const char *propname = nvpair_name(pair);
4076 4076 nvpair_t *match;
4077 4077
4078 4078 next_pair = nvlist_next_nvpair(props, pair);
4079 4079
4080 4080 if ((nvlist_lookup_nvpair(origprops, propname,
4081 4081 &match) != 0) || !propval_equals(pair, match))
4082 4082 goto next; /* need to set received value */
4083 4083
4084 4084 /* don't clear the existing received value */
4085 4085 (void) nvlist_remove_nvpair(origprops, match);
|
↓ open down ↓ |
4085 lines elided |
↑ open up ↑ |
4086 4086 /* don't bother receiving the property */
4087 4087 (void) nvlist_remove_nvpair(props, pair);
4088 4088 next:
4089 4089 pair = next_pair;
4090 4090 }
4091 4091 }
4092 4092
4093 4093 /*
4094 4094 * Extract properties that cannot be set PRIOR to the receipt of a dataset.
4095 4095 * For example, refquota cannot be set until after the receipt of a dataset,
4096 - * because a prior snapshot may exceed the refquota, and refquotas only apply
4097 - * to the current dataset. The caller (libzfs) will manage these properties
4098 - * somewhat as well to make sure they only come down with the last dataset in
4099 - * a replication stream, but we still need to be safe about it here in
4100 - * kernel-land.
4096 + * because in replication streams, an older/earlier snapshot may exceed the
4097 + * refquota. We want to receive the older/earlier snapshot, but setting
4098 + * refquota pre-receipt will set the dsl's ACTUAL quota, which will prevent
4099 + * the older/earlier snapshot from being received (with EDQUOT).
4100 + *
4101 + * The ZFS test "zfs_receive_011_pos" demonstrates such a scenario.
4102 + *
4103 + * libzfs will need to be judicious handling errors encountered by props
4104 + * extracted by this function.
4101 4105 */
4102 4106 static nvlist_t *
4103 4107 extract_delay_props(nvlist_t *props)
4104 4108 {
4105 4109 nvlist_t *delayprops;
4106 4110 nvpair_t *nvp, *tmp;
4107 4111 static const zfs_prop_t delayable[] = { ZFS_PROP_REFQUOTA, 0 };
4108 - boolean_t dontbother = B_TRUE;
4109 4112 int i;
4110 4113
4111 4114 VERIFY(nvlist_alloc(&delayprops, NV_UNIQUE_NAME, KM_SLEEP) == 0);
4112 4115
4113 4116 for (nvp = nvlist_next_nvpair(props, NULL); nvp != NULL;
4114 4117 nvp = nvlist_next_nvpair(props, nvp)) {
4115 4118 /*
4116 4119 * strcmp() is safe because zfs_prop_to_name() always returns
4117 4120 * a bounded string.
4118 4121 */
4119 4122 for (i = 0; delayable[i] != 0; i++) {
|
↓ open down ↓ |
1 lines elided |
↑ open up ↑ |
4120 4123 if (strcmp(zfs_prop_to_name(delayable[i]),
4121 4124 nvpair_name(nvp)) == 0) {
4122 4125 break;
4123 4126 }
4124 4127 }
4125 4128 if (delayable[i] != 0) {
4126 4129 tmp = nvlist_prev_nvpair(props, nvp);
4127 4130 VERIFY(nvlist_add_nvpair(delayprops, nvp) == 0);
4128 4131 VERIFY(nvlist_remove_nvpair(props, nvp) == 0);
4129 4132 nvp = tmp;
4130 - dontbother = B_FALSE; /* Actually, do bother! */
4131 4133 }
4132 4134 }
4133 4135
4134 - if (dontbother) {
4136 + if (nvlist_empty(delayprops)) {
4135 4137 nvlist_free(delayprops);
4136 4138 delayprops = NULL;
4137 4139 }
4138 4140 return (delayprops);
4139 4141 }
4140 4142
4141 4143 #ifdef DEBUG
4142 4144 static boolean_t zfs_ioc_recv_inject_err;
4143 4145 #endif
4144 4146
4145 4147 /*
4146 4148 * inputs:
4147 4149 * zc_name name of containing filesystem
4148 4150 * zc_nvlist_src{_size} nvlist of properties to apply
4149 4151 * zc_value name of snapshot to create
4150 4152 * zc_string name of clone origin (if DRR_FLAG_CLONE)
4151 4153 * zc_cookie file descriptor to recv from
4152 4154 * zc_begin_record the BEGIN record of the stream (not byteswapped)
4153 4155 * zc_guid force flag
4154 4156 * zc_cleanup_fd cleanup-on-exit file descriptor
4155 4157 * zc_action_handle handle for this guid/ds mapping (or zero on first call)
4156 4158 * zc_resumable if data is incomplete assume sender will resume
4157 4159 *
4158 4160 * outputs:
4159 4161 * zc_cookie number of bytes read
4160 4162 * zc_nvlist_dst{_size} error for each unapplied received property
4161 4163 * zc_obj zprop_errflags_t
4162 4164 * zc_action_handle handle for this guid/ds mapping
4163 4165 */
4164 4166 static int
4165 4167 zfs_ioc_recv(zfs_cmd_t *zc)
4166 4168 {
4167 4169 file_t *fp;
4168 4170 dmu_recv_cookie_t drc;
4169 4171 boolean_t force = (boolean_t)zc->zc_guid;
4170 4172 int fd;
4171 4173 int error = 0;
4172 4174 int props_error = 0;
4173 4175 nvlist_t *errors;
4174 4176 offset_t off;
4175 4177 nvlist_t *props = NULL; /* sent properties */
4176 4178 nvlist_t *origprops = NULL; /* existing properties */
4177 4179 nvlist_t *delayprops = NULL; /* sent properties applied post-receive */
4178 4180 char *origin = NULL;
4179 4181 char *tosnap;
4180 4182 char tofs[ZFS_MAXNAMELEN];
4181 4183 boolean_t first_recvd_props = B_FALSE;
4182 4184
4183 4185 if (dataset_namecheck(zc->zc_value, NULL, NULL) != 0 ||
4184 4186 strchr(zc->zc_value, '@') == NULL ||
4185 4187 strchr(zc->zc_value, '%'))
4186 4188 return (SET_ERROR(EINVAL));
4187 4189
4188 4190 (void) strcpy(tofs, zc->zc_value);
4189 4191 tosnap = strchr(tofs, '@');
4190 4192 *tosnap++ = '\0';
4191 4193
4192 4194 if (zc->zc_nvlist_src != NULL &&
4193 4195 (error = get_nvlist(zc->zc_nvlist_src, zc->zc_nvlist_src_size,
4194 4196 zc->zc_iflags, &props)) != 0)
4195 4197 return (error);
4196 4198
4197 4199 fd = zc->zc_cookie;
4198 4200 fp = getf(fd);
4199 4201 if (fp == NULL) {
4200 4202 nvlist_free(props);
4201 4203 return (SET_ERROR(EBADF));
4202 4204 }
4203 4205
4204 4206 errors = fnvlist_alloc();
4205 4207
4206 4208 if (zc->zc_string[0])
4207 4209 origin = zc->zc_string;
4208 4210
4209 4211 error = dmu_recv_begin(tofs, tosnap,
4210 4212 &zc->zc_begin_record, force, zc->zc_resumable, origin, &drc);
4211 4213 if (error != 0)
4212 4214 goto out;
4213 4215
4214 4216 /*
4215 4217 * Set properties before we receive the stream so that they are applied
4216 4218 * to the new data. Note that we must call dmu_recv_stream() if
4217 4219 * dmu_recv_begin() succeeds.
4218 4220 */
4219 4221 if (props != NULL && !drc.drc_newfs) {
4220 4222 if (spa_version(dsl_dataset_get_spa(drc.drc_ds)) >=
4221 4223 SPA_VERSION_RECVD_PROPS &&
4222 4224 !dsl_prop_get_hasrecvd(tofs))
4223 4225 first_recvd_props = B_TRUE;
4224 4226
4225 4227 /*
4226 4228 * If new received properties are supplied, they are to
4227 4229 * completely replace the existing received properties, so stash
4228 4230 * away the existing ones.
4229 4231 */
4230 4232 if (dsl_prop_get_received(tofs, &origprops) == 0) {
4231 4233 nvlist_t *errlist = NULL;
4232 4234 /*
4233 4235 * Don't bother writing a property if its value won't
4234 4236 * change (and avoid the unnecessary security checks).
4235 4237 *
4236 4238 * The first receive after SPA_VERSION_RECVD_PROPS is a
4237 4239 * special case where we blow away all local properties
4238 4240 * regardless.
4239 4241 */
4240 4242 if (!first_recvd_props)
4241 4243 props_reduce(props, origprops);
4242 4244 if (zfs_check_clearable(tofs, origprops, &errlist) != 0)
4243 4245 (void) nvlist_merge(errors, errlist, 0);
4244 4246 nvlist_free(errlist);
4245 4247
4246 4248 if (clear_received_props(tofs, origprops,
4247 4249 first_recvd_props ? NULL : props) != 0)
4248 4250 zc->zc_obj |= ZPROP_ERR_NOCLEAR;
4249 4251 } else {
4250 4252 zc->zc_obj |= ZPROP_ERR_NOCLEAR;
4251 4253 }
4252 4254 }
4253 4255
4254 4256 if (props != NULL) {
4255 4257 props_error = dsl_prop_set_hasrecvd(tofs);
4256 4258
4257 4259 if (props_error == 0) {
4258 4260 delayprops = extract_delay_props(props);
4259 4261 (void) zfs_set_prop_nvlist(tofs, ZPROP_SRC_RECEIVED,
4260 4262 props, errors);
4261 4263 }
4262 4264 }
4263 4265
4264 4266 off = fp->f_offset;
4265 4267 error = dmu_recv_stream(&drc, fp->f_vnode, &off, zc->zc_cleanup_fd,
4266 4268 &zc->zc_action_handle);
4267 4269
4268 4270 if (error == 0) {
4269 4271 zfsvfs_t *zfsvfs = NULL;
4270 4272
4271 4273 if (getzfsvfs(tofs, &zfsvfs) == 0) {
4272 4274 /* online recv */
4273 4275 int end_err;
4274 4276
4275 4277 error = zfs_suspend_fs(zfsvfs);
4276 4278 /*
4277 4279 * If the suspend fails, then the recv_end will
4278 4280 * likely also fail, and clean up after itself.
4279 4281 */
4280 4282 end_err = dmu_recv_end(&drc, zfsvfs);
4281 4283 if (error == 0)
4282 4284 error = zfs_resume_fs(zfsvfs, tofs);
4283 4285 error = error ? error : end_err;
4284 4286 VFS_RELE(zfsvfs->z_vfs);
4285 4287 } else {
|
↓ open down ↓ |
141 lines elided |
↑ open up ↑ |
4286 4288 error = dmu_recv_end(&drc, NULL);
4287 4289 }
4288 4290
4289 4291 /* Set delayed properties now, after we're done receiving. */
4290 4292 if (delayprops != NULL) {
4291 4293 (void) zfs_set_prop_nvlist(tofs, ZPROP_SRC_RECEIVED,
4292 4294 delayprops, errors);
4293 4295 }
4294 4296 }
4295 4297
4296 - /* Merge delayprops back in with regular props, in case of errors. */
4298 + /*
4299 + * Merge delayed props back in with initial props, so errors (which is
4300 + * one list) can match up with the order in which props were set.
4301 + * Also, the error cleanup code only deals with the unsplit props
4302 + * list.
4303 + */
4297 4304 if (delayprops != NULL) {
4298 4305 VERIFY(nvlist_merge(props, delayprops, 0) == 0);
4299 4306 nvlist_free(delayprops);
4300 4307 }
4301 4308
4302 - /* Put the props error list into zc AFTER the delayprops. */
4309 + /*
4310 + * Now that all props, initial and delayed, are set, report the prop
4311 + * errors to the caller.
4312 + */
4303 4313 if (zc->zc_nvlist_dst_size != 0 &&
4304 4314 (nvlist_smush(errors, zc->zc_nvlist_dst_size) != 0 ||
4305 4315 put_nvlist(zc, errors) != 0)) {
4306 4316 /*
4307 4317 * Caller made zc->zc_nvlist_dst less than the minimum expected
4308 4318 * size or supplied an invalid address.
4309 4319 */
4310 4320 props_error = SET_ERROR(EINVAL);
4311 4321 }
4312 4322
4313 4323 zc->zc_cookie = off - fp->f_offset;
4314 4324 if (VOP_SEEK(fp->f_vnode, fp->f_offset, &off, NULL) == 0)
4315 4325 fp->f_offset = off;
4316 4326
4317 4327 #ifdef DEBUG
4318 4328 if (zfs_ioc_recv_inject_err) {
4319 4329 zfs_ioc_recv_inject_err = B_FALSE;
4320 4330 error = 1;
4321 4331 }
4322 4332 #endif
4323 4333 /*
4324 4334 * On error, restore the original props.
4325 4335 */
4326 4336 if (error != 0 && props != NULL && !drc.drc_newfs) {
4327 4337 if (clear_received_props(tofs, props, NULL) != 0) {
4328 4338 /*
4329 4339 * We failed to clear the received properties.
4330 4340 * Since we may have left a $recvd value on the
4331 4341 * system, we can't clear the $hasrecvd flag.
4332 4342 */
4333 4343 zc->zc_obj |= ZPROP_ERR_NORESTORE;
4334 4344 } else if (first_recvd_props) {
4335 4345 dsl_prop_unset_hasrecvd(tofs);
4336 4346 }
4337 4347
4338 4348 if (origprops == NULL && !drc.drc_newfs) {
4339 4349 /* We failed to stash the original properties. */
4340 4350 zc->zc_obj |= ZPROP_ERR_NORESTORE;
4341 4351 }
4342 4352
4343 4353 /*
4344 4354 * dsl_props_set() will not convert RECEIVED to LOCAL on or
4345 4355 * after SPA_VERSION_RECVD_PROPS, so we need to specify LOCAL
4346 4356 * explictly if we're restoring local properties cleared in the
4347 4357 * first new-style receive.
4348 4358 */
4349 4359 if (origprops != NULL &&
4350 4360 zfs_set_prop_nvlist(tofs, (first_recvd_props ?
4351 4361 ZPROP_SRC_LOCAL : ZPROP_SRC_RECEIVED),
4352 4362 origprops, NULL) != 0) {
4353 4363 /*
4354 4364 * We stashed the original properties but failed to
4355 4365 * restore them.
4356 4366 */
4357 4367 zc->zc_obj |= ZPROP_ERR_NORESTORE;
4358 4368 }
4359 4369 }
4360 4370 out:
4361 4371 nvlist_free(props);
4362 4372 nvlist_free(origprops);
4363 4373 nvlist_free(errors);
4364 4374 releasef(fd);
4365 4375
4366 4376 if (error == 0)
4367 4377 error = props_error;
4368 4378
4369 4379 return (error);
4370 4380 }
4371 4381
4372 4382 /*
4373 4383 * inputs:
4374 4384 * zc_name name of snapshot to send
4375 4385 * zc_cookie file descriptor to send stream to
4376 4386 * zc_obj fromorigin flag (mutually exclusive with zc_fromobj)
4377 4387 * zc_sendobj objsetid of snapshot to send
4378 4388 * zc_fromobj objsetid of incremental fromsnap (may be zero)
4379 4389 * zc_guid if set, estimate size of stream only. zc_cookie is ignored.
4380 4390 * output size in zc_objset_type.
4381 4391 * zc_flags lzc_send_flags
4382 4392 *
4383 4393 * outputs:
4384 4394 * zc_objset_type estimated size, if zc_guid is set
4385 4395 */
4386 4396 static int
4387 4397 zfs_ioc_send(zfs_cmd_t *zc)
4388 4398 {
4389 4399 int error;
4390 4400 offset_t off;
4391 4401 boolean_t estimate = (zc->zc_guid != 0);
4392 4402 boolean_t embedok = (zc->zc_flags & 0x1);
4393 4403 boolean_t large_block_ok = (zc->zc_flags & 0x2);
4394 4404
4395 4405 if (zc->zc_obj != 0) {
4396 4406 dsl_pool_t *dp;
4397 4407 dsl_dataset_t *tosnap;
4398 4408
4399 4409 error = dsl_pool_hold(zc->zc_name, FTAG, &dp);
4400 4410 if (error != 0)
4401 4411 return (error);
4402 4412
4403 4413 error = dsl_dataset_hold_obj(dp, zc->zc_sendobj, FTAG, &tosnap);
4404 4414 if (error != 0) {
4405 4415 dsl_pool_rele(dp, FTAG);
4406 4416 return (error);
4407 4417 }
4408 4418
4409 4419 if (dsl_dir_is_clone(tosnap->ds_dir))
4410 4420 zc->zc_fromobj =
4411 4421 dsl_dir_phys(tosnap->ds_dir)->dd_origin_obj;
4412 4422 dsl_dataset_rele(tosnap, FTAG);
4413 4423 dsl_pool_rele(dp, FTAG);
4414 4424 }
4415 4425
4416 4426 if (estimate) {
4417 4427 dsl_pool_t *dp;
4418 4428 dsl_dataset_t *tosnap;
4419 4429 dsl_dataset_t *fromsnap = NULL;
4420 4430
4421 4431 error = dsl_pool_hold(zc->zc_name, FTAG, &dp);
4422 4432 if (error != 0)
4423 4433 return (error);
4424 4434
4425 4435 error = dsl_dataset_hold_obj(dp, zc->zc_sendobj, FTAG, &tosnap);
4426 4436 if (error != 0) {
4427 4437 dsl_pool_rele(dp, FTAG);
4428 4438 return (error);
4429 4439 }
4430 4440
4431 4441 if (zc->zc_fromobj != 0) {
4432 4442 error = dsl_dataset_hold_obj(dp, zc->zc_fromobj,
4433 4443 FTAG, &fromsnap);
4434 4444 if (error != 0) {
4435 4445 dsl_dataset_rele(tosnap, FTAG);
4436 4446 dsl_pool_rele(dp, FTAG);
4437 4447 return (error);
4438 4448 }
4439 4449 }
4440 4450
4441 4451 error = dmu_send_estimate(tosnap, fromsnap,
4442 4452 &zc->zc_objset_type);
4443 4453
4444 4454 if (fromsnap != NULL)
4445 4455 dsl_dataset_rele(fromsnap, FTAG);
4446 4456 dsl_dataset_rele(tosnap, FTAG);
4447 4457 dsl_pool_rele(dp, FTAG);
4448 4458 } else {
4449 4459 file_t *fp = getf(zc->zc_cookie);
4450 4460 if (fp == NULL)
4451 4461 return (SET_ERROR(EBADF));
4452 4462
4453 4463 off = fp->f_offset;
4454 4464 error = dmu_send_obj(zc->zc_name, zc->zc_sendobj,
4455 4465 zc->zc_fromobj, embedok, large_block_ok,
4456 4466 zc->zc_cookie, fp->f_vnode, &off);
4457 4467
4458 4468 if (VOP_SEEK(fp->f_vnode, fp->f_offset, &off, NULL) == 0)
4459 4469 fp->f_offset = off;
4460 4470 releasef(zc->zc_cookie);
4461 4471 }
4462 4472 return (error);
4463 4473 }
4464 4474
4465 4475 /*
4466 4476 * inputs:
4467 4477 * zc_name name of snapshot on which to report progress
4468 4478 * zc_cookie file descriptor of send stream
4469 4479 *
4470 4480 * outputs:
4471 4481 * zc_cookie number of bytes written in send stream thus far
4472 4482 */
4473 4483 static int
4474 4484 zfs_ioc_send_progress(zfs_cmd_t *zc)
4475 4485 {
4476 4486 dsl_pool_t *dp;
4477 4487 dsl_dataset_t *ds;
4478 4488 dmu_sendarg_t *dsp = NULL;
4479 4489 int error;
4480 4490
4481 4491 error = dsl_pool_hold(zc->zc_name, FTAG, &dp);
4482 4492 if (error != 0)
4483 4493 return (error);
4484 4494
4485 4495 error = dsl_dataset_hold(dp, zc->zc_name, FTAG, &ds);
4486 4496 if (error != 0) {
4487 4497 dsl_pool_rele(dp, FTAG);
4488 4498 return (error);
4489 4499 }
4490 4500
4491 4501 mutex_enter(&ds->ds_sendstream_lock);
4492 4502
4493 4503 /*
4494 4504 * Iterate over all the send streams currently active on this dataset.
4495 4505 * If there's one which matches the specified file descriptor _and_ the
4496 4506 * stream was started by the current process, return the progress of
4497 4507 * that stream.
4498 4508 */
4499 4509 for (dsp = list_head(&ds->ds_sendstreams); dsp != NULL;
4500 4510 dsp = list_next(&ds->ds_sendstreams, dsp)) {
4501 4511 if (dsp->dsa_outfd == zc->zc_cookie &&
4502 4512 dsp->dsa_proc == curproc)
4503 4513 break;
4504 4514 }
4505 4515
4506 4516 if (dsp != NULL)
4507 4517 zc->zc_cookie = *(dsp->dsa_off);
4508 4518 else
4509 4519 error = SET_ERROR(ENOENT);
4510 4520
4511 4521 mutex_exit(&ds->ds_sendstream_lock);
4512 4522 dsl_dataset_rele(ds, FTAG);
4513 4523 dsl_pool_rele(dp, FTAG);
4514 4524 return (error);
4515 4525 }
4516 4526
4517 4527 static int
4518 4528 zfs_ioc_inject_fault(zfs_cmd_t *zc)
4519 4529 {
4520 4530 int id, error;
4521 4531
4522 4532 error = zio_inject_fault(zc->zc_name, (int)zc->zc_guid, &id,
4523 4533 &zc->zc_inject_record);
4524 4534
4525 4535 if (error == 0)
4526 4536 zc->zc_guid = (uint64_t)id;
4527 4537
4528 4538 return (error);
4529 4539 }
4530 4540
4531 4541 static int
4532 4542 zfs_ioc_clear_fault(zfs_cmd_t *zc)
4533 4543 {
4534 4544 return (zio_clear_fault((int)zc->zc_guid));
4535 4545 }
4536 4546
4537 4547 static int
4538 4548 zfs_ioc_inject_list_next(zfs_cmd_t *zc)
4539 4549 {
4540 4550 int id = (int)zc->zc_guid;
4541 4551 int error;
4542 4552
4543 4553 error = zio_inject_list_next(&id, zc->zc_name, sizeof (zc->zc_name),
4544 4554 &zc->zc_inject_record);
4545 4555
4546 4556 zc->zc_guid = id;
4547 4557
4548 4558 return (error);
4549 4559 }
4550 4560
4551 4561 static int
4552 4562 zfs_ioc_error_log(zfs_cmd_t *zc)
4553 4563 {
4554 4564 spa_t *spa;
4555 4565 int error;
4556 4566 size_t count = (size_t)zc->zc_nvlist_dst_size;
4557 4567
4558 4568 if ((error = spa_open(zc->zc_name, &spa, FTAG)) != 0)
4559 4569 return (error);
4560 4570
4561 4571 error = spa_get_errlog(spa, (void *)(uintptr_t)zc->zc_nvlist_dst,
4562 4572 &count);
4563 4573 if (error == 0)
4564 4574 zc->zc_nvlist_dst_size = count;
4565 4575 else
4566 4576 zc->zc_nvlist_dst_size = spa_get_errlog_size(spa);
4567 4577
4568 4578 spa_close(spa, FTAG);
4569 4579
4570 4580 return (error);
4571 4581 }
4572 4582
4573 4583 static int
4574 4584 zfs_ioc_clear(zfs_cmd_t *zc)
4575 4585 {
4576 4586 spa_t *spa;
4577 4587 vdev_t *vd;
4578 4588 int error;
4579 4589
4580 4590 /*
4581 4591 * On zpool clear we also fix up missing slogs
4582 4592 */
4583 4593 mutex_enter(&spa_namespace_lock);
4584 4594 spa = spa_lookup(zc->zc_name);
4585 4595 if (spa == NULL) {
4586 4596 mutex_exit(&spa_namespace_lock);
4587 4597 return (SET_ERROR(EIO));
4588 4598 }
4589 4599 if (spa_get_log_state(spa) == SPA_LOG_MISSING) {
4590 4600 /* we need to let spa_open/spa_load clear the chains */
4591 4601 spa_set_log_state(spa, SPA_LOG_CLEAR);
4592 4602 }
4593 4603 spa->spa_last_open_failed = 0;
4594 4604 mutex_exit(&spa_namespace_lock);
4595 4605
4596 4606 if (zc->zc_cookie & ZPOOL_NO_REWIND) {
4597 4607 error = spa_open(zc->zc_name, &spa, FTAG);
4598 4608 } else {
4599 4609 nvlist_t *policy;
4600 4610 nvlist_t *config = NULL;
4601 4611
4602 4612 if (zc->zc_nvlist_src == NULL)
4603 4613 return (SET_ERROR(EINVAL));
4604 4614
4605 4615 if ((error = get_nvlist(zc->zc_nvlist_src,
4606 4616 zc->zc_nvlist_src_size, zc->zc_iflags, &policy)) == 0) {
4607 4617 error = spa_open_rewind(zc->zc_name, &spa, FTAG,
4608 4618 policy, &config);
4609 4619 if (config != NULL) {
4610 4620 int err;
4611 4621
4612 4622 if ((err = put_nvlist(zc, config)) != 0)
4613 4623 error = err;
4614 4624 nvlist_free(config);
4615 4625 }
4616 4626 nvlist_free(policy);
4617 4627 }
4618 4628 }
4619 4629
4620 4630 if (error != 0)
4621 4631 return (error);
4622 4632
4623 4633 spa_vdev_state_enter(spa, SCL_NONE);
4624 4634
4625 4635 if (zc->zc_guid == 0) {
4626 4636 vd = NULL;
4627 4637 } else {
4628 4638 vd = spa_lookup_by_guid(spa, zc->zc_guid, B_TRUE);
4629 4639 if (vd == NULL) {
4630 4640 (void) spa_vdev_state_exit(spa, NULL, ENODEV);
4631 4641 spa_close(spa, FTAG);
4632 4642 return (SET_ERROR(ENODEV));
4633 4643 }
4634 4644 }
4635 4645
4636 4646 vdev_clear(spa, vd);
4637 4647
4638 4648 (void) spa_vdev_state_exit(spa, NULL, 0);
4639 4649
4640 4650 /*
4641 4651 * Resume any suspended I/Os.
4642 4652 */
4643 4653 if (zio_resume(spa) != 0)
4644 4654 error = SET_ERROR(EIO);
4645 4655
4646 4656 spa_close(spa, FTAG);
4647 4657
4648 4658 return (error);
4649 4659 }
4650 4660
4651 4661 static int
4652 4662 zfs_ioc_pool_reopen(zfs_cmd_t *zc)
4653 4663 {
4654 4664 spa_t *spa;
4655 4665 int error;
4656 4666
4657 4667 error = spa_open(zc->zc_name, &spa, FTAG);
4658 4668 if (error != 0)
4659 4669 return (error);
4660 4670
4661 4671 spa_vdev_state_enter(spa, SCL_NONE);
4662 4672
4663 4673 /*
4664 4674 * If a resilver is already in progress then set the
4665 4675 * spa_scrub_reopen flag to B_TRUE so that we don't restart
4666 4676 * the scan as a side effect of the reopen. Otherwise, let
4667 4677 * vdev_open() decided if a resilver is required.
4668 4678 */
4669 4679 spa->spa_scrub_reopen = dsl_scan_resilvering(spa->spa_dsl_pool);
4670 4680 vdev_reopen(spa->spa_root_vdev);
4671 4681 spa->spa_scrub_reopen = B_FALSE;
4672 4682
4673 4683 (void) spa_vdev_state_exit(spa, NULL, 0);
4674 4684 spa_close(spa, FTAG);
4675 4685 return (0);
4676 4686 }
4677 4687 /*
4678 4688 * inputs:
4679 4689 * zc_name name of filesystem
4680 4690 * zc_value name of origin snapshot
4681 4691 *
4682 4692 * outputs:
4683 4693 * zc_string name of conflicting snapshot, if there is one
4684 4694 */
4685 4695 static int
4686 4696 zfs_ioc_promote(zfs_cmd_t *zc)
4687 4697 {
4688 4698 char *cp;
4689 4699
4690 4700 /*
4691 4701 * We don't need to unmount *all* the origin fs's snapshots, but
4692 4702 * it's easier.
4693 4703 */
4694 4704 cp = strchr(zc->zc_value, '@');
4695 4705 if (cp)
4696 4706 *cp = '\0';
4697 4707 (void) dmu_objset_find(zc->zc_value,
4698 4708 zfs_unmount_snap_cb, NULL, DS_FIND_SNAPSHOTS);
4699 4709 return (dsl_dataset_promote(zc->zc_name, zc->zc_string));
4700 4710 }
4701 4711
4702 4712 /*
4703 4713 * Retrieve a single {user|group}{used|quota}@... property.
4704 4714 *
4705 4715 * inputs:
4706 4716 * zc_name name of filesystem
4707 4717 * zc_objset_type zfs_userquota_prop_t
4708 4718 * zc_value domain name (eg. "S-1-234-567-89")
4709 4719 * zc_guid RID/UID/GID
4710 4720 *
4711 4721 * outputs:
4712 4722 * zc_cookie property value
4713 4723 */
4714 4724 static int
4715 4725 zfs_ioc_userspace_one(zfs_cmd_t *zc)
4716 4726 {
4717 4727 zfsvfs_t *zfsvfs;
4718 4728 int error;
4719 4729
4720 4730 if (zc->zc_objset_type >= ZFS_NUM_USERQUOTA_PROPS)
4721 4731 return (SET_ERROR(EINVAL));
4722 4732
4723 4733 error = zfsvfs_hold(zc->zc_name, FTAG, &zfsvfs, B_FALSE);
4724 4734 if (error != 0)
4725 4735 return (error);
4726 4736
4727 4737 error = zfs_userspace_one(zfsvfs,
4728 4738 zc->zc_objset_type, zc->zc_value, zc->zc_guid, &zc->zc_cookie);
4729 4739 zfsvfs_rele(zfsvfs, FTAG);
4730 4740
4731 4741 return (error);
4732 4742 }
4733 4743
4734 4744 /*
4735 4745 * inputs:
4736 4746 * zc_name name of filesystem
4737 4747 * zc_cookie zap cursor
4738 4748 * zc_objset_type zfs_userquota_prop_t
4739 4749 * zc_nvlist_dst[_size] buffer to fill (not really an nvlist)
4740 4750 *
4741 4751 * outputs:
4742 4752 * zc_nvlist_dst[_size] data buffer (array of zfs_useracct_t)
4743 4753 * zc_cookie zap cursor
4744 4754 */
4745 4755 static int
4746 4756 zfs_ioc_userspace_many(zfs_cmd_t *zc)
4747 4757 {
4748 4758 zfsvfs_t *zfsvfs;
4749 4759 int bufsize = zc->zc_nvlist_dst_size;
4750 4760
4751 4761 if (bufsize <= 0)
4752 4762 return (SET_ERROR(ENOMEM));
4753 4763
4754 4764 int error = zfsvfs_hold(zc->zc_name, FTAG, &zfsvfs, B_FALSE);
4755 4765 if (error != 0)
4756 4766 return (error);
4757 4767
4758 4768 void *buf = kmem_alloc(bufsize, KM_SLEEP);
4759 4769
4760 4770 error = zfs_userspace_many(zfsvfs, zc->zc_objset_type, &zc->zc_cookie,
4761 4771 buf, &zc->zc_nvlist_dst_size);
4762 4772
4763 4773 if (error == 0) {
4764 4774 error = xcopyout(buf,
4765 4775 (void *)(uintptr_t)zc->zc_nvlist_dst,
4766 4776 zc->zc_nvlist_dst_size);
4767 4777 }
4768 4778 kmem_free(buf, bufsize);
4769 4779 zfsvfs_rele(zfsvfs, FTAG);
4770 4780
4771 4781 return (error);
4772 4782 }
4773 4783
4774 4784 /*
4775 4785 * inputs:
4776 4786 * zc_name name of filesystem
4777 4787 *
4778 4788 * outputs:
4779 4789 * none
4780 4790 */
4781 4791 static int
4782 4792 zfs_ioc_userspace_upgrade(zfs_cmd_t *zc)
4783 4793 {
4784 4794 objset_t *os;
4785 4795 int error = 0;
4786 4796 zfsvfs_t *zfsvfs;
4787 4797
4788 4798 if (getzfsvfs(zc->zc_name, &zfsvfs) == 0) {
4789 4799 if (!dmu_objset_userused_enabled(zfsvfs->z_os)) {
4790 4800 /*
4791 4801 * If userused is not enabled, it may be because the
4792 4802 * objset needs to be closed & reopened (to grow the
4793 4803 * objset_phys_t). Suspend/resume the fs will do that.
4794 4804 */
4795 4805 error = zfs_suspend_fs(zfsvfs);
4796 4806 if (error == 0) {
4797 4807 dmu_objset_refresh_ownership(zfsvfs->z_os,
4798 4808 zfsvfs);
4799 4809 error = zfs_resume_fs(zfsvfs, zc->zc_name);
4800 4810 }
4801 4811 }
4802 4812 if (error == 0)
4803 4813 error = dmu_objset_userspace_upgrade(zfsvfs->z_os);
4804 4814 VFS_RELE(zfsvfs->z_vfs);
4805 4815 } else {
4806 4816 /* XXX kind of reading contents without owning */
4807 4817 error = dmu_objset_hold(zc->zc_name, FTAG, &os);
4808 4818 if (error != 0)
4809 4819 return (error);
4810 4820
4811 4821 error = dmu_objset_userspace_upgrade(os);
4812 4822 dmu_objset_rele(os, FTAG);
4813 4823 }
4814 4824
4815 4825 return (error);
4816 4826 }
4817 4827
4818 4828 /*
4819 4829 * We don't want to have a hard dependency
4820 4830 * against some special symbols in sharefs
4821 4831 * nfs, and smbsrv. Determine them if needed when
4822 4832 * the first file system is shared.
4823 4833 * Neither sharefs, nfs or smbsrv are unloadable modules.
4824 4834 */
4825 4835 int (*znfsexport_fs)(void *arg);
4826 4836 int (*zshare_fs)(enum sharefs_sys_op, share_t *, uint32_t);
4827 4837 int (*zsmbexport_fs)(void *arg, boolean_t add_share);
4828 4838
4829 4839 int zfs_nfsshare_inited;
4830 4840 int zfs_smbshare_inited;
4831 4841
4832 4842 ddi_modhandle_t nfs_mod;
4833 4843 ddi_modhandle_t sharefs_mod;
4834 4844 ddi_modhandle_t smbsrv_mod;
4835 4845 kmutex_t zfs_share_lock;
4836 4846
4837 4847 static int
4838 4848 zfs_init_sharefs()
4839 4849 {
4840 4850 int error;
4841 4851
4842 4852 ASSERT(MUTEX_HELD(&zfs_share_lock));
4843 4853 /* Both NFS and SMB shares also require sharetab support. */
4844 4854 if (sharefs_mod == NULL && ((sharefs_mod =
4845 4855 ddi_modopen("fs/sharefs",
4846 4856 KRTLD_MODE_FIRST, &error)) == NULL)) {
4847 4857 return (SET_ERROR(ENOSYS));
4848 4858 }
4849 4859 if (zshare_fs == NULL && ((zshare_fs =
4850 4860 (int (*)(enum sharefs_sys_op, share_t *, uint32_t))
4851 4861 ddi_modsym(sharefs_mod, "sharefs_impl", &error)) == NULL)) {
4852 4862 return (SET_ERROR(ENOSYS));
4853 4863 }
4854 4864 return (0);
4855 4865 }
4856 4866
4857 4867 static int
4858 4868 zfs_ioc_share(zfs_cmd_t *zc)
4859 4869 {
4860 4870 int error;
4861 4871 int opcode;
4862 4872
4863 4873 switch (zc->zc_share.z_sharetype) {
4864 4874 case ZFS_SHARE_NFS:
4865 4875 case ZFS_UNSHARE_NFS:
4866 4876 if (zfs_nfsshare_inited == 0) {
4867 4877 mutex_enter(&zfs_share_lock);
4868 4878 if (nfs_mod == NULL && ((nfs_mod = ddi_modopen("fs/nfs",
4869 4879 KRTLD_MODE_FIRST, &error)) == NULL)) {
4870 4880 mutex_exit(&zfs_share_lock);
4871 4881 return (SET_ERROR(ENOSYS));
4872 4882 }
4873 4883 if (znfsexport_fs == NULL &&
4874 4884 ((znfsexport_fs = (int (*)(void *))
4875 4885 ddi_modsym(nfs_mod,
4876 4886 "nfs_export", &error)) == NULL)) {
4877 4887 mutex_exit(&zfs_share_lock);
4878 4888 return (SET_ERROR(ENOSYS));
4879 4889 }
4880 4890 error = zfs_init_sharefs();
4881 4891 if (error != 0) {
4882 4892 mutex_exit(&zfs_share_lock);
4883 4893 return (SET_ERROR(ENOSYS));
4884 4894 }
4885 4895 zfs_nfsshare_inited = 1;
4886 4896 mutex_exit(&zfs_share_lock);
4887 4897 }
4888 4898 break;
4889 4899 case ZFS_SHARE_SMB:
4890 4900 case ZFS_UNSHARE_SMB:
4891 4901 if (zfs_smbshare_inited == 0) {
4892 4902 mutex_enter(&zfs_share_lock);
4893 4903 if (smbsrv_mod == NULL && ((smbsrv_mod =
4894 4904 ddi_modopen("drv/smbsrv",
4895 4905 KRTLD_MODE_FIRST, &error)) == NULL)) {
4896 4906 mutex_exit(&zfs_share_lock);
4897 4907 return (SET_ERROR(ENOSYS));
4898 4908 }
4899 4909 if (zsmbexport_fs == NULL && ((zsmbexport_fs =
4900 4910 (int (*)(void *, boolean_t))ddi_modsym(smbsrv_mod,
4901 4911 "smb_server_share", &error)) == NULL)) {
4902 4912 mutex_exit(&zfs_share_lock);
4903 4913 return (SET_ERROR(ENOSYS));
4904 4914 }
4905 4915 error = zfs_init_sharefs();
4906 4916 if (error != 0) {
4907 4917 mutex_exit(&zfs_share_lock);
4908 4918 return (SET_ERROR(ENOSYS));
4909 4919 }
4910 4920 zfs_smbshare_inited = 1;
4911 4921 mutex_exit(&zfs_share_lock);
4912 4922 }
4913 4923 break;
4914 4924 default:
4915 4925 return (SET_ERROR(EINVAL));
4916 4926 }
4917 4927
4918 4928 switch (zc->zc_share.z_sharetype) {
4919 4929 case ZFS_SHARE_NFS:
4920 4930 case ZFS_UNSHARE_NFS:
4921 4931 if (error =
4922 4932 znfsexport_fs((void *)
4923 4933 (uintptr_t)zc->zc_share.z_exportdata))
4924 4934 return (error);
4925 4935 break;
4926 4936 case ZFS_SHARE_SMB:
4927 4937 case ZFS_UNSHARE_SMB:
4928 4938 if (error = zsmbexport_fs((void *)
4929 4939 (uintptr_t)zc->zc_share.z_exportdata,
4930 4940 zc->zc_share.z_sharetype == ZFS_SHARE_SMB ?
4931 4941 B_TRUE: B_FALSE)) {
4932 4942 return (error);
4933 4943 }
4934 4944 break;
4935 4945 }
4936 4946
4937 4947 opcode = (zc->zc_share.z_sharetype == ZFS_SHARE_NFS ||
4938 4948 zc->zc_share.z_sharetype == ZFS_SHARE_SMB) ?
4939 4949 SHAREFS_ADD : SHAREFS_REMOVE;
4940 4950
4941 4951 /*
4942 4952 * Add or remove share from sharetab
4943 4953 */
4944 4954 error = zshare_fs(opcode,
4945 4955 (void *)(uintptr_t)zc->zc_share.z_sharedata,
4946 4956 zc->zc_share.z_sharemax);
4947 4957
4948 4958 return (error);
4949 4959
4950 4960 }
4951 4961
4952 4962 ace_t full_access[] = {
4953 4963 {(uid_t)-1, ACE_ALL_PERMS, ACE_EVERYONE, 0}
4954 4964 };
4955 4965
4956 4966 /*
4957 4967 * inputs:
4958 4968 * zc_name name of containing filesystem
4959 4969 * zc_obj object # beyond which we want next in-use object #
4960 4970 *
4961 4971 * outputs:
4962 4972 * zc_obj next in-use object #
4963 4973 */
4964 4974 static int
4965 4975 zfs_ioc_next_obj(zfs_cmd_t *zc)
4966 4976 {
4967 4977 objset_t *os = NULL;
4968 4978 int error;
4969 4979
4970 4980 error = dmu_objset_hold(zc->zc_name, FTAG, &os);
4971 4981 if (error != 0)
4972 4982 return (error);
4973 4983
4974 4984 error = dmu_object_next(os, &zc->zc_obj, B_FALSE,
4975 4985 dsl_dataset_phys(os->os_dsl_dataset)->ds_prev_snap_txg);
4976 4986
4977 4987 dmu_objset_rele(os, FTAG);
4978 4988 return (error);
4979 4989 }
4980 4990
4981 4991 /*
4982 4992 * inputs:
4983 4993 * zc_name name of filesystem
4984 4994 * zc_value prefix name for snapshot
4985 4995 * zc_cleanup_fd cleanup-on-exit file descriptor for calling process
4986 4996 *
4987 4997 * outputs:
4988 4998 * zc_value short name of new snapshot
4989 4999 */
4990 5000 static int
4991 5001 zfs_ioc_tmp_snapshot(zfs_cmd_t *zc)
4992 5002 {
4993 5003 char *snap_name;
4994 5004 char *hold_name;
4995 5005 int error;
4996 5006 minor_t minor;
4997 5007
4998 5008 error = zfs_onexit_fd_hold(zc->zc_cleanup_fd, &minor);
4999 5009 if (error != 0)
5000 5010 return (error);
5001 5011
5002 5012 snap_name = kmem_asprintf("%s-%016llx", zc->zc_value,
5003 5013 (u_longlong_t)ddi_get_lbolt64());
5004 5014 hold_name = kmem_asprintf("%%%s", zc->zc_value);
5005 5015
5006 5016 error = dsl_dataset_snapshot_tmp(zc->zc_name, snap_name, minor,
5007 5017 hold_name);
5008 5018 if (error == 0)
5009 5019 (void) strcpy(zc->zc_value, snap_name);
5010 5020 strfree(snap_name);
5011 5021 strfree(hold_name);
5012 5022 zfs_onexit_fd_rele(zc->zc_cleanup_fd);
5013 5023 return (error);
5014 5024 }
5015 5025
5016 5026 /*
5017 5027 * inputs:
5018 5028 * zc_name name of "to" snapshot
5019 5029 * zc_value name of "from" snapshot
5020 5030 * zc_cookie file descriptor to write diff data on
5021 5031 *
5022 5032 * outputs:
5023 5033 * dmu_diff_record_t's to the file descriptor
5024 5034 */
5025 5035 static int
5026 5036 zfs_ioc_diff(zfs_cmd_t *zc)
5027 5037 {
5028 5038 file_t *fp;
5029 5039 offset_t off;
5030 5040 int error;
5031 5041
5032 5042 fp = getf(zc->zc_cookie);
5033 5043 if (fp == NULL)
5034 5044 return (SET_ERROR(EBADF));
5035 5045
5036 5046 off = fp->f_offset;
5037 5047
5038 5048 error = dmu_diff(zc->zc_name, zc->zc_value, fp->f_vnode, &off);
5039 5049
5040 5050 if (VOP_SEEK(fp->f_vnode, fp->f_offset, &off, NULL) == 0)
5041 5051 fp->f_offset = off;
5042 5052 releasef(zc->zc_cookie);
5043 5053
5044 5054 return (error);
5045 5055 }
5046 5056
5047 5057 /*
5048 5058 * Remove all ACL files in shares dir
5049 5059 */
5050 5060 static int
5051 5061 zfs_smb_acl_purge(znode_t *dzp)
5052 5062 {
5053 5063 zap_cursor_t zc;
5054 5064 zap_attribute_t zap;
5055 5065 zfsvfs_t *zfsvfs = dzp->z_zfsvfs;
5056 5066 int error;
5057 5067
5058 5068 for (zap_cursor_init(&zc, zfsvfs->z_os, dzp->z_id);
5059 5069 (error = zap_cursor_retrieve(&zc, &zap)) == 0;
5060 5070 zap_cursor_advance(&zc)) {
5061 5071 if ((error = VOP_REMOVE(ZTOV(dzp), zap.za_name, kcred,
5062 5072 NULL, 0)) != 0)
5063 5073 break;
5064 5074 }
5065 5075 zap_cursor_fini(&zc);
5066 5076 return (error);
5067 5077 }
5068 5078
5069 5079 static int
5070 5080 zfs_ioc_smb_acl(zfs_cmd_t *zc)
5071 5081 {
5072 5082 vnode_t *vp;
5073 5083 znode_t *dzp;
5074 5084 vnode_t *resourcevp = NULL;
5075 5085 znode_t *sharedir;
5076 5086 zfsvfs_t *zfsvfs;
5077 5087 nvlist_t *nvlist;
5078 5088 char *src, *target;
5079 5089 vattr_t vattr;
5080 5090 vsecattr_t vsec;
5081 5091 int error = 0;
5082 5092
5083 5093 if ((error = lookupname(zc->zc_value, UIO_SYSSPACE,
5084 5094 NO_FOLLOW, NULL, &vp)) != 0)
5085 5095 return (error);
5086 5096
5087 5097 /* Now make sure mntpnt and dataset are ZFS */
5088 5098
5089 5099 if (vp->v_vfsp->vfs_fstype != zfsfstype ||
5090 5100 (strcmp((char *)refstr_value(vp->v_vfsp->vfs_resource),
5091 5101 zc->zc_name) != 0)) {
5092 5102 VN_RELE(vp);
5093 5103 return (SET_ERROR(EINVAL));
5094 5104 }
5095 5105
5096 5106 dzp = VTOZ(vp);
5097 5107 zfsvfs = dzp->z_zfsvfs;
5098 5108 ZFS_ENTER(zfsvfs);
5099 5109
5100 5110 /*
5101 5111 * Create share dir if its missing.
5102 5112 */
5103 5113 mutex_enter(&zfsvfs->z_lock);
5104 5114 if (zfsvfs->z_shares_dir == 0) {
5105 5115 dmu_tx_t *tx;
5106 5116
5107 5117 tx = dmu_tx_create(zfsvfs->z_os);
5108 5118 dmu_tx_hold_zap(tx, MASTER_NODE_OBJ, TRUE,
5109 5119 ZFS_SHARES_DIR);
5110 5120 dmu_tx_hold_zap(tx, DMU_NEW_OBJECT, FALSE, NULL);
5111 5121 error = dmu_tx_assign(tx, TXG_WAIT);
5112 5122 if (error != 0) {
5113 5123 dmu_tx_abort(tx);
5114 5124 } else {
5115 5125 error = zfs_create_share_dir(zfsvfs, tx);
5116 5126 dmu_tx_commit(tx);
5117 5127 }
5118 5128 if (error != 0) {
5119 5129 mutex_exit(&zfsvfs->z_lock);
5120 5130 VN_RELE(vp);
5121 5131 ZFS_EXIT(zfsvfs);
5122 5132 return (error);
5123 5133 }
5124 5134 }
5125 5135 mutex_exit(&zfsvfs->z_lock);
5126 5136
5127 5137 ASSERT(zfsvfs->z_shares_dir);
5128 5138 if ((error = zfs_zget(zfsvfs, zfsvfs->z_shares_dir, &sharedir)) != 0) {
5129 5139 VN_RELE(vp);
5130 5140 ZFS_EXIT(zfsvfs);
5131 5141 return (error);
5132 5142 }
5133 5143
5134 5144 switch (zc->zc_cookie) {
5135 5145 case ZFS_SMB_ACL_ADD:
5136 5146 vattr.va_mask = AT_MODE|AT_UID|AT_GID|AT_TYPE;
5137 5147 vattr.va_type = VREG;
5138 5148 vattr.va_mode = S_IFREG|0777;
5139 5149 vattr.va_uid = 0;
5140 5150 vattr.va_gid = 0;
5141 5151
5142 5152 vsec.vsa_mask = VSA_ACE;
5143 5153 vsec.vsa_aclentp = &full_access;
5144 5154 vsec.vsa_aclentsz = sizeof (full_access);
5145 5155 vsec.vsa_aclcnt = 1;
5146 5156
5147 5157 error = VOP_CREATE(ZTOV(sharedir), zc->zc_string,
5148 5158 &vattr, EXCL, 0, &resourcevp, kcred, 0, NULL, &vsec);
5149 5159 if (resourcevp)
5150 5160 VN_RELE(resourcevp);
5151 5161 break;
5152 5162
5153 5163 case ZFS_SMB_ACL_REMOVE:
5154 5164 error = VOP_REMOVE(ZTOV(sharedir), zc->zc_string, kcred,
5155 5165 NULL, 0);
5156 5166 break;
5157 5167
5158 5168 case ZFS_SMB_ACL_RENAME:
5159 5169 if ((error = get_nvlist(zc->zc_nvlist_src,
5160 5170 zc->zc_nvlist_src_size, zc->zc_iflags, &nvlist)) != 0) {
5161 5171 VN_RELE(vp);
5162 5172 VN_RELE(ZTOV(sharedir));
5163 5173 ZFS_EXIT(zfsvfs);
5164 5174 return (error);
5165 5175 }
5166 5176 if (nvlist_lookup_string(nvlist, ZFS_SMB_ACL_SRC, &src) ||
5167 5177 nvlist_lookup_string(nvlist, ZFS_SMB_ACL_TARGET,
5168 5178 &target)) {
5169 5179 VN_RELE(vp);
5170 5180 VN_RELE(ZTOV(sharedir));
5171 5181 ZFS_EXIT(zfsvfs);
5172 5182 nvlist_free(nvlist);
5173 5183 return (error);
5174 5184 }
5175 5185 error = VOP_RENAME(ZTOV(sharedir), src, ZTOV(sharedir), target,
5176 5186 kcred, NULL, 0);
5177 5187 nvlist_free(nvlist);
5178 5188 break;
5179 5189
5180 5190 case ZFS_SMB_ACL_PURGE:
5181 5191 error = zfs_smb_acl_purge(sharedir);
5182 5192 break;
5183 5193
5184 5194 default:
5185 5195 error = SET_ERROR(EINVAL);
5186 5196 break;
5187 5197 }
5188 5198
5189 5199 VN_RELE(vp);
5190 5200 VN_RELE(ZTOV(sharedir));
5191 5201
5192 5202 ZFS_EXIT(zfsvfs);
5193 5203
5194 5204 return (error);
5195 5205 }
5196 5206
5197 5207 /*
5198 5208 * innvl: {
5199 5209 * "holds" -> { snapname -> holdname (string), ... }
5200 5210 * (optional) "cleanup_fd" -> fd (int32)
5201 5211 * }
5202 5212 *
5203 5213 * outnvl: {
5204 5214 * snapname -> error value (int32)
5205 5215 * ...
5206 5216 * }
5207 5217 */
5208 5218 /* ARGSUSED */
5209 5219 static int
5210 5220 zfs_ioc_hold(const char *pool, nvlist_t *args, nvlist_t *errlist)
5211 5221 {
5212 5222 nvpair_t *pair;
5213 5223 nvlist_t *holds;
5214 5224 int cleanup_fd = -1;
5215 5225 int error;
5216 5226 minor_t minor = 0;
5217 5227
5218 5228 error = nvlist_lookup_nvlist(args, "holds", &holds);
5219 5229 if (error != 0)
5220 5230 return (SET_ERROR(EINVAL));
5221 5231
5222 5232 /* make sure the user didn't pass us any invalid (empty) tags */
5223 5233 for (pair = nvlist_next_nvpair(holds, NULL); pair != NULL;
5224 5234 pair = nvlist_next_nvpair(holds, pair)) {
5225 5235 char *htag;
5226 5236
5227 5237 error = nvpair_value_string(pair, &htag);
5228 5238 if (error != 0)
5229 5239 return (SET_ERROR(error));
5230 5240
5231 5241 if (strlen(htag) == 0)
5232 5242 return (SET_ERROR(EINVAL));
5233 5243 }
5234 5244
5235 5245 if (nvlist_lookup_int32(args, "cleanup_fd", &cleanup_fd) == 0) {
5236 5246 error = zfs_onexit_fd_hold(cleanup_fd, &minor);
5237 5247 if (error != 0)
5238 5248 return (error);
5239 5249 }
5240 5250
5241 5251 error = dsl_dataset_user_hold(holds, minor, errlist);
5242 5252 if (minor != 0)
5243 5253 zfs_onexit_fd_rele(cleanup_fd);
5244 5254 return (error);
5245 5255 }
5246 5256
5247 5257 /*
5248 5258 * innvl is not used.
5249 5259 *
5250 5260 * outnvl: {
5251 5261 * holdname -> time added (uint64 seconds since epoch)
5252 5262 * ...
5253 5263 * }
5254 5264 */
5255 5265 /* ARGSUSED */
5256 5266 static int
5257 5267 zfs_ioc_get_holds(const char *snapname, nvlist_t *args, nvlist_t *outnvl)
5258 5268 {
5259 5269 return (dsl_dataset_get_holds(snapname, outnvl));
5260 5270 }
5261 5271
5262 5272 /*
5263 5273 * innvl: {
5264 5274 * snapname -> { holdname, ... }
5265 5275 * ...
5266 5276 * }
5267 5277 *
5268 5278 * outnvl: {
5269 5279 * snapname -> error value (int32)
5270 5280 * ...
5271 5281 * }
5272 5282 */
5273 5283 /* ARGSUSED */
5274 5284 static int
5275 5285 zfs_ioc_release(const char *pool, nvlist_t *holds, nvlist_t *errlist)
5276 5286 {
5277 5287 return (dsl_dataset_user_release(holds, errlist));
5278 5288 }
5279 5289
5280 5290 /*
5281 5291 * inputs:
5282 5292 * zc_name name of new filesystem or snapshot
5283 5293 * zc_value full name of old snapshot
5284 5294 *
5285 5295 * outputs:
5286 5296 * zc_cookie space in bytes
5287 5297 * zc_objset_type compressed space in bytes
5288 5298 * zc_perm_action uncompressed space in bytes
5289 5299 */
5290 5300 static int
5291 5301 zfs_ioc_space_written(zfs_cmd_t *zc)
5292 5302 {
5293 5303 int error;
5294 5304 dsl_pool_t *dp;
5295 5305 dsl_dataset_t *new, *old;
5296 5306
5297 5307 error = dsl_pool_hold(zc->zc_name, FTAG, &dp);
5298 5308 if (error != 0)
5299 5309 return (error);
5300 5310 error = dsl_dataset_hold(dp, zc->zc_name, FTAG, &new);
5301 5311 if (error != 0) {
5302 5312 dsl_pool_rele(dp, FTAG);
5303 5313 return (error);
5304 5314 }
5305 5315 error = dsl_dataset_hold(dp, zc->zc_value, FTAG, &old);
5306 5316 if (error != 0) {
5307 5317 dsl_dataset_rele(new, FTAG);
5308 5318 dsl_pool_rele(dp, FTAG);
5309 5319 return (error);
5310 5320 }
5311 5321
5312 5322 error = dsl_dataset_space_written(old, new, &zc->zc_cookie,
5313 5323 &zc->zc_objset_type, &zc->zc_perm_action);
5314 5324 dsl_dataset_rele(old, FTAG);
5315 5325 dsl_dataset_rele(new, FTAG);
5316 5326 dsl_pool_rele(dp, FTAG);
5317 5327 return (error);
5318 5328 }
5319 5329
5320 5330 /*
5321 5331 * innvl: {
5322 5332 * "firstsnap" -> snapshot name
5323 5333 * }
5324 5334 *
5325 5335 * outnvl: {
5326 5336 * "used" -> space in bytes
5327 5337 * "compressed" -> compressed space in bytes
5328 5338 * "uncompressed" -> uncompressed space in bytes
5329 5339 * }
5330 5340 */
5331 5341 static int
5332 5342 zfs_ioc_space_snaps(const char *lastsnap, nvlist_t *innvl, nvlist_t *outnvl)
5333 5343 {
5334 5344 int error;
5335 5345 dsl_pool_t *dp;
5336 5346 dsl_dataset_t *new, *old;
5337 5347 char *firstsnap;
5338 5348 uint64_t used, comp, uncomp;
5339 5349
5340 5350 if (nvlist_lookup_string(innvl, "firstsnap", &firstsnap) != 0)
5341 5351 return (SET_ERROR(EINVAL));
5342 5352
5343 5353 error = dsl_pool_hold(lastsnap, FTAG, &dp);
5344 5354 if (error != 0)
5345 5355 return (error);
5346 5356
5347 5357 error = dsl_dataset_hold(dp, lastsnap, FTAG, &new);
5348 5358 if (error == 0 && !new->ds_is_snapshot) {
5349 5359 dsl_dataset_rele(new, FTAG);
5350 5360 error = SET_ERROR(EINVAL);
5351 5361 }
5352 5362 if (error != 0) {
5353 5363 dsl_pool_rele(dp, FTAG);
5354 5364 return (error);
5355 5365 }
5356 5366 error = dsl_dataset_hold(dp, firstsnap, FTAG, &old);
5357 5367 if (error == 0 && !old->ds_is_snapshot) {
5358 5368 dsl_dataset_rele(old, FTAG);
5359 5369 error = SET_ERROR(EINVAL);
5360 5370 }
5361 5371 if (error != 0) {
5362 5372 dsl_dataset_rele(new, FTAG);
5363 5373 dsl_pool_rele(dp, FTAG);
5364 5374 return (error);
5365 5375 }
5366 5376
5367 5377 error = dsl_dataset_space_wouldfree(old, new, &used, &comp, &uncomp);
5368 5378 dsl_dataset_rele(old, FTAG);
5369 5379 dsl_dataset_rele(new, FTAG);
5370 5380 dsl_pool_rele(dp, FTAG);
5371 5381 fnvlist_add_uint64(outnvl, "used", used);
5372 5382 fnvlist_add_uint64(outnvl, "compressed", comp);
5373 5383 fnvlist_add_uint64(outnvl, "uncompressed", uncomp);
5374 5384 return (error);
5375 5385 }
5376 5386
5377 5387 /*
5378 5388 * innvl: {
5379 5389 * "fd" -> file descriptor to write stream to (int32)
5380 5390 * (optional) "fromsnap" -> full snap name to send an incremental from
5381 5391 * (optional) "largeblockok" -> (value ignored)
5382 5392 * indicates that blocks > 128KB are permitted
5383 5393 * (optional) "embedok" -> (value ignored)
5384 5394 * presence indicates DRR_WRITE_EMBEDDED records are permitted
5385 5395 * (optional) "resume_object" and "resume_offset" -> (uint64)
5386 5396 * if present, resume send stream from specified object and offset.
5387 5397 * }
5388 5398 *
5389 5399 * outnvl is unused
5390 5400 */
5391 5401 /* ARGSUSED */
5392 5402 static int
5393 5403 zfs_ioc_send_new(const char *snapname, nvlist_t *innvl, nvlist_t *outnvl)
5394 5404 {
5395 5405 int error;
5396 5406 offset_t off;
5397 5407 char *fromname = NULL;
5398 5408 int fd;
5399 5409 boolean_t largeblockok;
5400 5410 boolean_t embedok;
5401 5411 uint64_t resumeobj = 0;
5402 5412 uint64_t resumeoff = 0;
5403 5413
5404 5414 error = nvlist_lookup_int32(innvl, "fd", &fd);
5405 5415 if (error != 0)
5406 5416 return (SET_ERROR(EINVAL));
5407 5417
5408 5418 (void) nvlist_lookup_string(innvl, "fromsnap", &fromname);
5409 5419
5410 5420 largeblockok = nvlist_exists(innvl, "largeblockok");
5411 5421 embedok = nvlist_exists(innvl, "embedok");
5412 5422
5413 5423 (void) nvlist_lookup_uint64(innvl, "resume_object", &resumeobj);
5414 5424 (void) nvlist_lookup_uint64(innvl, "resume_offset", &resumeoff);
5415 5425
5416 5426 file_t *fp = getf(fd);
5417 5427 if (fp == NULL)
5418 5428 return (SET_ERROR(EBADF));
5419 5429
5420 5430 off = fp->f_offset;
5421 5431 error = dmu_send(snapname, fromname, embedok, largeblockok, fd,
5422 5432 resumeobj, resumeoff, fp->f_vnode, &off);
5423 5433
5424 5434 if (VOP_SEEK(fp->f_vnode, fp->f_offset, &off, NULL) == 0)
5425 5435 fp->f_offset = off;
5426 5436 releasef(fd);
5427 5437 return (error);
5428 5438 }
5429 5439
5430 5440 /*
5431 5441 * Determine approximately how large a zfs send stream will be -- the number
5432 5442 * of bytes that will be written to the fd supplied to zfs_ioc_send_new().
5433 5443 *
5434 5444 * innvl: {
5435 5445 * (optional) "from" -> full snap or bookmark name to send an incremental
5436 5446 * from
5437 5447 * }
5438 5448 *
5439 5449 * outnvl: {
5440 5450 * "space" -> bytes of space (uint64)
5441 5451 * }
5442 5452 */
5443 5453 static int
5444 5454 zfs_ioc_send_space(const char *snapname, nvlist_t *innvl, nvlist_t *outnvl)
5445 5455 {
5446 5456 dsl_pool_t *dp;
5447 5457 dsl_dataset_t *tosnap;
5448 5458 int error;
5449 5459 char *fromname;
5450 5460 uint64_t space;
5451 5461
5452 5462 error = dsl_pool_hold(snapname, FTAG, &dp);
5453 5463 if (error != 0)
5454 5464 return (error);
5455 5465
5456 5466 error = dsl_dataset_hold(dp, snapname, FTAG, &tosnap);
5457 5467 if (error != 0) {
5458 5468 dsl_pool_rele(dp, FTAG);
5459 5469 return (error);
5460 5470 }
5461 5471
5462 5472 error = nvlist_lookup_string(innvl, "from", &fromname);
5463 5473 if (error == 0) {
5464 5474 if (strchr(fromname, '@') != NULL) {
5465 5475 /*
5466 5476 * If from is a snapshot, hold it and use the more
5467 5477 * efficient dmu_send_estimate to estimate send space
5468 5478 * size using deadlists.
5469 5479 */
5470 5480 dsl_dataset_t *fromsnap;
5471 5481 error = dsl_dataset_hold(dp, fromname, FTAG, &fromsnap);
5472 5482 if (error != 0)
5473 5483 goto out;
5474 5484 error = dmu_send_estimate(tosnap, fromsnap, &space);
5475 5485 dsl_dataset_rele(fromsnap, FTAG);
5476 5486 } else if (strchr(fromname, '#') != NULL) {
5477 5487 /*
5478 5488 * If from is a bookmark, fetch the creation TXG of the
5479 5489 * snapshot it was created from and use that to find
5480 5490 * blocks that were born after it.
5481 5491 */
5482 5492 zfs_bookmark_phys_t frombm;
5483 5493
5484 5494 error = dsl_bookmark_lookup(dp, fromname, tosnap,
5485 5495 &frombm);
5486 5496 if (error != 0)
5487 5497 goto out;
5488 5498 error = dmu_send_estimate_from_txg(tosnap,
5489 5499 frombm.zbm_creation_txg, &space);
5490 5500 } else {
5491 5501 /*
5492 5502 * from is not properly formatted as a snapshot or
5493 5503 * bookmark
5494 5504 */
5495 5505 error = SET_ERROR(EINVAL);
5496 5506 goto out;
5497 5507 }
5498 5508 } else {
5499 5509 // If estimating the size of a full send, use dmu_send_estimate
5500 5510 error = dmu_send_estimate(tosnap, NULL, &space);
5501 5511 }
5502 5512
5503 5513 fnvlist_add_uint64(outnvl, "space", space);
5504 5514
5505 5515 out:
5506 5516 dsl_dataset_rele(tosnap, FTAG);
5507 5517 dsl_pool_rele(dp, FTAG);
5508 5518 return (error);
5509 5519 }
5510 5520
5511 5521 static zfs_ioc_vec_t zfs_ioc_vec[ZFS_IOC_LAST - ZFS_IOC_FIRST];
5512 5522
5513 5523 static void
5514 5524 zfs_ioctl_register_legacy(zfs_ioc_t ioc, zfs_ioc_legacy_func_t *func,
5515 5525 zfs_secpolicy_func_t *secpolicy, zfs_ioc_namecheck_t namecheck,
5516 5526 boolean_t log_history, zfs_ioc_poolcheck_t pool_check)
5517 5527 {
5518 5528 zfs_ioc_vec_t *vec = &zfs_ioc_vec[ioc - ZFS_IOC_FIRST];
5519 5529
5520 5530 ASSERT3U(ioc, >=, ZFS_IOC_FIRST);
5521 5531 ASSERT3U(ioc, <, ZFS_IOC_LAST);
5522 5532 ASSERT3P(vec->zvec_legacy_func, ==, NULL);
5523 5533 ASSERT3P(vec->zvec_func, ==, NULL);
5524 5534
5525 5535 vec->zvec_legacy_func = func;
5526 5536 vec->zvec_secpolicy = secpolicy;
5527 5537 vec->zvec_namecheck = namecheck;
5528 5538 vec->zvec_allow_log = log_history;
5529 5539 vec->zvec_pool_check = pool_check;
5530 5540 }
5531 5541
5532 5542 /*
5533 5543 * See the block comment at the beginning of this file for details on
5534 5544 * each argument to this function.
5535 5545 */
5536 5546 static void
5537 5547 zfs_ioctl_register(const char *name, zfs_ioc_t ioc, zfs_ioc_func_t *func,
5538 5548 zfs_secpolicy_func_t *secpolicy, zfs_ioc_namecheck_t namecheck,
5539 5549 zfs_ioc_poolcheck_t pool_check, boolean_t smush_outnvlist,
5540 5550 boolean_t allow_log)
5541 5551 {
5542 5552 zfs_ioc_vec_t *vec = &zfs_ioc_vec[ioc - ZFS_IOC_FIRST];
5543 5553
5544 5554 ASSERT3U(ioc, >=, ZFS_IOC_FIRST);
5545 5555 ASSERT3U(ioc, <, ZFS_IOC_LAST);
5546 5556 ASSERT3P(vec->zvec_legacy_func, ==, NULL);
5547 5557 ASSERT3P(vec->zvec_func, ==, NULL);
5548 5558
5549 5559 /* if we are logging, the name must be valid */
5550 5560 ASSERT(!allow_log || namecheck != NO_NAME);
5551 5561
5552 5562 vec->zvec_name = name;
5553 5563 vec->zvec_func = func;
5554 5564 vec->zvec_secpolicy = secpolicy;
5555 5565 vec->zvec_namecheck = namecheck;
5556 5566 vec->zvec_pool_check = pool_check;
5557 5567 vec->zvec_smush_outnvlist = smush_outnvlist;
5558 5568 vec->zvec_allow_log = allow_log;
5559 5569 }
5560 5570
5561 5571 static void
5562 5572 zfs_ioctl_register_pool(zfs_ioc_t ioc, zfs_ioc_legacy_func_t *func,
5563 5573 zfs_secpolicy_func_t *secpolicy, boolean_t log_history,
5564 5574 zfs_ioc_poolcheck_t pool_check)
5565 5575 {
5566 5576 zfs_ioctl_register_legacy(ioc, func, secpolicy,
5567 5577 POOL_NAME, log_history, pool_check);
5568 5578 }
5569 5579
5570 5580 static void
5571 5581 zfs_ioctl_register_dataset_nolog(zfs_ioc_t ioc, zfs_ioc_legacy_func_t *func,
5572 5582 zfs_secpolicy_func_t *secpolicy, zfs_ioc_poolcheck_t pool_check)
5573 5583 {
5574 5584 zfs_ioctl_register_legacy(ioc, func, secpolicy,
5575 5585 DATASET_NAME, B_FALSE, pool_check);
5576 5586 }
5577 5587
5578 5588 static void
5579 5589 zfs_ioctl_register_pool_modify(zfs_ioc_t ioc, zfs_ioc_legacy_func_t *func)
5580 5590 {
5581 5591 zfs_ioctl_register_legacy(ioc, func, zfs_secpolicy_config,
5582 5592 POOL_NAME, B_TRUE, POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY);
5583 5593 }
5584 5594
5585 5595 static void
5586 5596 zfs_ioctl_register_pool_meta(zfs_ioc_t ioc, zfs_ioc_legacy_func_t *func,
5587 5597 zfs_secpolicy_func_t *secpolicy)
5588 5598 {
5589 5599 zfs_ioctl_register_legacy(ioc, func, secpolicy,
5590 5600 NO_NAME, B_FALSE, POOL_CHECK_NONE);
5591 5601 }
5592 5602
5593 5603 static void
5594 5604 zfs_ioctl_register_dataset_read_secpolicy(zfs_ioc_t ioc,
5595 5605 zfs_ioc_legacy_func_t *func, zfs_secpolicy_func_t *secpolicy)
5596 5606 {
5597 5607 zfs_ioctl_register_legacy(ioc, func, secpolicy,
5598 5608 DATASET_NAME, B_FALSE, POOL_CHECK_SUSPENDED);
5599 5609 }
5600 5610
5601 5611 static void
5602 5612 zfs_ioctl_register_dataset_read(zfs_ioc_t ioc, zfs_ioc_legacy_func_t *func)
5603 5613 {
5604 5614 zfs_ioctl_register_dataset_read_secpolicy(ioc, func,
5605 5615 zfs_secpolicy_read);
5606 5616 }
5607 5617
5608 5618 static void
5609 5619 zfs_ioctl_register_dataset_modify(zfs_ioc_t ioc, zfs_ioc_legacy_func_t *func,
5610 5620 zfs_secpolicy_func_t *secpolicy)
5611 5621 {
5612 5622 zfs_ioctl_register_legacy(ioc, func, secpolicy,
5613 5623 DATASET_NAME, B_TRUE, POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY);
5614 5624 }
5615 5625
5616 5626 static void
5617 5627 zfs_ioctl_init(void)
5618 5628 {
5619 5629 zfs_ioctl_register("snapshot", ZFS_IOC_SNAPSHOT,
5620 5630 zfs_ioc_snapshot, zfs_secpolicy_snapshot, POOL_NAME,
5621 5631 POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY, B_TRUE, B_TRUE);
5622 5632
5623 5633 zfs_ioctl_register("log_history", ZFS_IOC_LOG_HISTORY,
5624 5634 zfs_ioc_log_history, zfs_secpolicy_log_history, NO_NAME,
5625 5635 POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY, B_FALSE, B_FALSE);
5626 5636
5627 5637 zfs_ioctl_register("space_snaps", ZFS_IOC_SPACE_SNAPS,
5628 5638 zfs_ioc_space_snaps, zfs_secpolicy_read, DATASET_NAME,
5629 5639 POOL_CHECK_SUSPENDED, B_FALSE, B_FALSE);
5630 5640
5631 5641 zfs_ioctl_register("send", ZFS_IOC_SEND_NEW,
5632 5642 zfs_ioc_send_new, zfs_secpolicy_send_new, DATASET_NAME,
5633 5643 POOL_CHECK_SUSPENDED, B_FALSE, B_FALSE);
5634 5644
5635 5645 zfs_ioctl_register("send_space", ZFS_IOC_SEND_SPACE,
5636 5646 zfs_ioc_send_space, zfs_secpolicy_read, DATASET_NAME,
5637 5647 POOL_CHECK_SUSPENDED, B_FALSE, B_FALSE);
5638 5648
5639 5649 zfs_ioctl_register("create", ZFS_IOC_CREATE,
5640 5650 zfs_ioc_create, zfs_secpolicy_create_clone, DATASET_NAME,
5641 5651 POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY, B_TRUE, B_TRUE);
5642 5652
5643 5653 zfs_ioctl_register("clone", ZFS_IOC_CLONE,
5644 5654 zfs_ioc_clone, zfs_secpolicy_create_clone, DATASET_NAME,
5645 5655 POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY, B_TRUE, B_TRUE);
5646 5656
5647 5657 zfs_ioctl_register("destroy_snaps", ZFS_IOC_DESTROY_SNAPS,
5648 5658 zfs_ioc_destroy_snaps, zfs_secpolicy_destroy_snaps, POOL_NAME,
5649 5659 POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY, B_TRUE, B_TRUE);
5650 5660
5651 5661 zfs_ioctl_register("hold", ZFS_IOC_HOLD,
5652 5662 zfs_ioc_hold, zfs_secpolicy_hold, POOL_NAME,
5653 5663 POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY, B_TRUE, B_TRUE);
5654 5664 zfs_ioctl_register("release", ZFS_IOC_RELEASE,
5655 5665 zfs_ioc_release, zfs_secpolicy_release, POOL_NAME,
5656 5666 POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY, B_TRUE, B_TRUE);
5657 5667
5658 5668 zfs_ioctl_register("get_holds", ZFS_IOC_GET_HOLDS,
5659 5669 zfs_ioc_get_holds, zfs_secpolicy_read, DATASET_NAME,
5660 5670 POOL_CHECK_SUSPENDED, B_FALSE, B_FALSE);
5661 5671
5662 5672 zfs_ioctl_register("rollback", ZFS_IOC_ROLLBACK,
5663 5673 zfs_ioc_rollback, zfs_secpolicy_rollback, DATASET_NAME,
5664 5674 POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY, B_FALSE, B_TRUE);
5665 5675
5666 5676 zfs_ioctl_register("bookmark", ZFS_IOC_BOOKMARK,
5667 5677 zfs_ioc_bookmark, zfs_secpolicy_bookmark, POOL_NAME,
5668 5678 POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY, B_TRUE, B_TRUE);
5669 5679
5670 5680 zfs_ioctl_register("get_bookmarks", ZFS_IOC_GET_BOOKMARKS,
5671 5681 zfs_ioc_get_bookmarks, zfs_secpolicy_read, DATASET_NAME,
5672 5682 POOL_CHECK_SUSPENDED, B_FALSE, B_FALSE);
5673 5683
5674 5684 zfs_ioctl_register("destroy_bookmarks", ZFS_IOC_DESTROY_BOOKMARKS,
5675 5685 zfs_ioc_destroy_bookmarks, zfs_secpolicy_destroy_bookmarks,
5676 5686 POOL_NAME,
5677 5687 POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY, B_TRUE, B_TRUE);
5678 5688
5679 5689 /* IOCTLS that use the legacy function signature */
5680 5690
5681 5691 zfs_ioctl_register_legacy(ZFS_IOC_POOL_FREEZE, zfs_ioc_pool_freeze,
5682 5692 zfs_secpolicy_config, NO_NAME, B_FALSE, POOL_CHECK_READONLY);
5683 5693
5684 5694 zfs_ioctl_register_pool(ZFS_IOC_POOL_CREATE, zfs_ioc_pool_create,
5685 5695 zfs_secpolicy_config, B_TRUE, POOL_CHECK_NONE);
5686 5696 zfs_ioctl_register_pool_modify(ZFS_IOC_POOL_SCAN,
5687 5697 zfs_ioc_pool_scan);
5688 5698 zfs_ioctl_register_pool_modify(ZFS_IOC_POOL_UPGRADE,
5689 5699 zfs_ioc_pool_upgrade);
5690 5700 zfs_ioctl_register_pool_modify(ZFS_IOC_VDEV_ADD,
5691 5701 zfs_ioc_vdev_add);
5692 5702 zfs_ioctl_register_pool_modify(ZFS_IOC_VDEV_REMOVE,
5693 5703 zfs_ioc_vdev_remove);
5694 5704 zfs_ioctl_register_pool_modify(ZFS_IOC_VDEV_SET_STATE,
5695 5705 zfs_ioc_vdev_set_state);
5696 5706 zfs_ioctl_register_pool_modify(ZFS_IOC_VDEV_ATTACH,
5697 5707 zfs_ioc_vdev_attach);
5698 5708 zfs_ioctl_register_pool_modify(ZFS_IOC_VDEV_DETACH,
5699 5709 zfs_ioc_vdev_detach);
5700 5710 zfs_ioctl_register_pool_modify(ZFS_IOC_VDEV_SETPATH,
5701 5711 zfs_ioc_vdev_setpath);
5702 5712 zfs_ioctl_register_pool_modify(ZFS_IOC_VDEV_SETFRU,
5703 5713 zfs_ioc_vdev_setfru);
5704 5714 zfs_ioctl_register_pool_modify(ZFS_IOC_POOL_SET_PROPS,
5705 5715 zfs_ioc_pool_set_props);
5706 5716 zfs_ioctl_register_pool_modify(ZFS_IOC_VDEV_SPLIT,
5707 5717 zfs_ioc_vdev_split);
5708 5718 zfs_ioctl_register_pool_modify(ZFS_IOC_POOL_REGUID,
5709 5719 zfs_ioc_pool_reguid);
5710 5720
5711 5721 zfs_ioctl_register_pool_meta(ZFS_IOC_POOL_CONFIGS,
5712 5722 zfs_ioc_pool_configs, zfs_secpolicy_none);
5713 5723 zfs_ioctl_register_pool_meta(ZFS_IOC_POOL_TRYIMPORT,
5714 5724 zfs_ioc_pool_tryimport, zfs_secpolicy_config);
5715 5725 zfs_ioctl_register_pool_meta(ZFS_IOC_INJECT_FAULT,
5716 5726 zfs_ioc_inject_fault, zfs_secpolicy_inject);
5717 5727 zfs_ioctl_register_pool_meta(ZFS_IOC_CLEAR_FAULT,
5718 5728 zfs_ioc_clear_fault, zfs_secpolicy_inject);
5719 5729 zfs_ioctl_register_pool_meta(ZFS_IOC_INJECT_LIST_NEXT,
5720 5730 zfs_ioc_inject_list_next, zfs_secpolicy_inject);
5721 5731
5722 5732 /*
5723 5733 * pool destroy, and export don't log the history as part of
5724 5734 * zfsdev_ioctl, but rather zfs_ioc_pool_export
5725 5735 * does the logging of those commands.
5726 5736 */
5727 5737 zfs_ioctl_register_pool(ZFS_IOC_POOL_DESTROY, zfs_ioc_pool_destroy,
5728 5738 zfs_secpolicy_config, B_FALSE, POOL_CHECK_NONE);
5729 5739 zfs_ioctl_register_pool(ZFS_IOC_POOL_EXPORT, zfs_ioc_pool_export,
5730 5740 zfs_secpolicy_config, B_FALSE, POOL_CHECK_NONE);
5731 5741
5732 5742 zfs_ioctl_register_pool(ZFS_IOC_POOL_STATS, zfs_ioc_pool_stats,
5733 5743 zfs_secpolicy_read, B_FALSE, POOL_CHECK_NONE);
5734 5744 zfs_ioctl_register_pool(ZFS_IOC_POOL_GET_PROPS, zfs_ioc_pool_get_props,
5735 5745 zfs_secpolicy_read, B_FALSE, POOL_CHECK_NONE);
5736 5746
5737 5747 zfs_ioctl_register_pool(ZFS_IOC_ERROR_LOG, zfs_ioc_error_log,
5738 5748 zfs_secpolicy_inject, B_FALSE, POOL_CHECK_SUSPENDED);
5739 5749 zfs_ioctl_register_pool(ZFS_IOC_DSOBJ_TO_DSNAME,
5740 5750 zfs_ioc_dsobj_to_dsname,
5741 5751 zfs_secpolicy_diff, B_FALSE, POOL_CHECK_SUSPENDED);
5742 5752 zfs_ioctl_register_pool(ZFS_IOC_POOL_GET_HISTORY,
5743 5753 zfs_ioc_pool_get_history,
5744 5754 zfs_secpolicy_config, B_FALSE, POOL_CHECK_SUSPENDED);
5745 5755
5746 5756 zfs_ioctl_register_pool(ZFS_IOC_POOL_IMPORT, zfs_ioc_pool_import,
5747 5757 zfs_secpolicy_config, B_TRUE, POOL_CHECK_NONE);
5748 5758
5749 5759 zfs_ioctl_register_pool(ZFS_IOC_CLEAR, zfs_ioc_clear,
5750 5760 zfs_secpolicy_config, B_TRUE, POOL_CHECK_NONE);
5751 5761 zfs_ioctl_register_pool(ZFS_IOC_POOL_REOPEN, zfs_ioc_pool_reopen,
5752 5762 zfs_secpolicy_config, B_TRUE, POOL_CHECK_SUSPENDED);
5753 5763
5754 5764 zfs_ioctl_register_dataset_read(ZFS_IOC_SPACE_WRITTEN,
5755 5765 zfs_ioc_space_written);
5756 5766 zfs_ioctl_register_dataset_read(ZFS_IOC_OBJSET_RECVD_PROPS,
5757 5767 zfs_ioc_objset_recvd_props);
5758 5768 zfs_ioctl_register_dataset_read(ZFS_IOC_NEXT_OBJ,
5759 5769 zfs_ioc_next_obj);
5760 5770 zfs_ioctl_register_dataset_read(ZFS_IOC_GET_FSACL,
5761 5771 zfs_ioc_get_fsacl);
5762 5772 zfs_ioctl_register_dataset_read(ZFS_IOC_OBJSET_STATS,
5763 5773 zfs_ioc_objset_stats);
5764 5774 zfs_ioctl_register_dataset_read(ZFS_IOC_OBJSET_ZPLPROPS,
5765 5775 zfs_ioc_objset_zplprops);
5766 5776 zfs_ioctl_register_dataset_read(ZFS_IOC_DATASET_LIST_NEXT,
5767 5777 zfs_ioc_dataset_list_next);
5768 5778 zfs_ioctl_register_dataset_read(ZFS_IOC_SNAPSHOT_LIST_NEXT,
5769 5779 zfs_ioc_snapshot_list_next);
5770 5780 zfs_ioctl_register_dataset_read(ZFS_IOC_SEND_PROGRESS,
5771 5781 zfs_ioc_send_progress);
5772 5782
5773 5783 zfs_ioctl_register_dataset_read_secpolicy(ZFS_IOC_DIFF,
5774 5784 zfs_ioc_diff, zfs_secpolicy_diff);
5775 5785 zfs_ioctl_register_dataset_read_secpolicy(ZFS_IOC_OBJ_TO_STATS,
5776 5786 zfs_ioc_obj_to_stats, zfs_secpolicy_diff);
5777 5787 zfs_ioctl_register_dataset_read_secpolicy(ZFS_IOC_OBJ_TO_PATH,
5778 5788 zfs_ioc_obj_to_path, zfs_secpolicy_diff);
5779 5789 zfs_ioctl_register_dataset_read_secpolicy(ZFS_IOC_USERSPACE_ONE,
5780 5790 zfs_ioc_userspace_one, zfs_secpolicy_userspace_one);
5781 5791 zfs_ioctl_register_dataset_read_secpolicy(ZFS_IOC_USERSPACE_MANY,
5782 5792 zfs_ioc_userspace_many, zfs_secpolicy_userspace_many);
5783 5793 zfs_ioctl_register_dataset_read_secpolicy(ZFS_IOC_SEND,
5784 5794 zfs_ioc_send, zfs_secpolicy_send);
5785 5795
5786 5796 zfs_ioctl_register_dataset_modify(ZFS_IOC_SET_PROP, zfs_ioc_set_prop,
5787 5797 zfs_secpolicy_none);
5788 5798 zfs_ioctl_register_dataset_modify(ZFS_IOC_DESTROY, zfs_ioc_destroy,
5789 5799 zfs_secpolicy_destroy);
5790 5800 zfs_ioctl_register_dataset_modify(ZFS_IOC_RENAME, zfs_ioc_rename,
5791 5801 zfs_secpolicy_rename);
5792 5802 zfs_ioctl_register_dataset_modify(ZFS_IOC_RECV, zfs_ioc_recv,
5793 5803 zfs_secpolicy_recv);
5794 5804 zfs_ioctl_register_dataset_modify(ZFS_IOC_PROMOTE, zfs_ioc_promote,
5795 5805 zfs_secpolicy_promote);
5796 5806 zfs_ioctl_register_dataset_modify(ZFS_IOC_INHERIT_PROP,
5797 5807 zfs_ioc_inherit_prop, zfs_secpolicy_inherit_prop);
5798 5808 zfs_ioctl_register_dataset_modify(ZFS_IOC_SET_FSACL, zfs_ioc_set_fsacl,
5799 5809 zfs_secpolicy_set_fsacl);
5800 5810
5801 5811 zfs_ioctl_register_dataset_nolog(ZFS_IOC_SHARE, zfs_ioc_share,
5802 5812 zfs_secpolicy_share, POOL_CHECK_NONE);
5803 5813 zfs_ioctl_register_dataset_nolog(ZFS_IOC_SMB_ACL, zfs_ioc_smb_acl,
5804 5814 zfs_secpolicy_smb_acl, POOL_CHECK_NONE);
5805 5815 zfs_ioctl_register_dataset_nolog(ZFS_IOC_USERSPACE_UPGRADE,
5806 5816 zfs_ioc_userspace_upgrade, zfs_secpolicy_userspace_upgrade,
5807 5817 POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY);
5808 5818 zfs_ioctl_register_dataset_nolog(ZFS_IOC_TMP_SNAPSHOT,
5809 5819 zfs_ioc_tmp_snapshot, zfs_secpolicy_tmp_snapshot,
5810 5820 POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY);
5811 5821 }
5812 5822
5813 5823 int
5814 5824 pool_status_check(const char *name, zfs_ioc_namecheck_t type,
5815 5825 zfs_ioc_poolcheck_t check)
5816 5826 {
5817 5827 spa_t *spa;
5818 5828 int error;
5819 5829
5820 5830 ASSERT(type == POOL_NAME || type == DATASET_NAME);
5821 5831
5822 5832 if (check & POOL_CHECK_NONE)
5823 5833 return (0);
5824 5834
5825 5835 error = spa_open(name, &spa, FTAG);
5826 5836 if (error == 0) {
5827 5837 if ((check & POOL_CHECK_SUSPENDED) && spa_suspended(spa))
5828 5838 error = SET_ERROR(EAGAIN);
5829 5839 else if ((check & POOL_CHECK_READONLY) && !spa_writeable(spa))
5830 5840 error = SET_ERROR(EROFS);
5831 5841 spa_close(spa, FTAG);
5832 5842 }
5833 5843 return (error);
5834 5844 }
5835 5845
5836 5846 /*
5837 5847 * Find a free minor number.
5838 5848 */
5839 5849 minor_t
5840 5850 zfsdev_minor_alloc(void)
5841 5851 {
5842 5852 static minor_t last_minor;
5843 5853 minor_t m;
5844 5854
5845 5855 ASSERT(MUTEX_HELD(&zfsdev_state_lock));
5846 5856
5847 5857 for (m = last_minor + 1; m != last_minor; m++) {
5848 5858 if (m > ZFSDEV_MAX_MINOR)
5849 5859 m = 1;
5850 5860 if (ddi_get_soft_state(zfsdev_state, m) == NULL) {
5851 5861 last_minor = m;
5852 5862 return (m);
5853 5863 }
5854 5864 }
5855 5865
5856 5866 return (0);
5857 5867 }
5858 5868
5859 5869 static int
5860 5870 zfs_ctldev_init(dev_t *devp)
5861 5871 {
5862 5872 minor_t minor;
5863 5873 zfs_soft_state_t *zs;
5864 5874
5865 5875 ASSERT(MUTEX_HELD(&zfsdev_state_lock));
5866 5876 ASSERT(getminor(*devp) == 0);
5867 5877
5868 5878 minor = zfsdev_minor_alloc();
5869 5879 if (minor == 0)
5870 5880 return (SET_ERROR(ENXIO));
5871 5881
5872 5882 if (ddi_soft_state_zalloc(zfsdev_state, minor) != DDI_SUCCESS)
5873 5883 return (SET_ERROR(EAGAIN));
5874 5884
5875 5885 *devp = makedevice(getemajor(*devp), minor);
5876 5886
5877 5887 zs = ddi_get_soft_state(zfsdev_state, minor);
5878 5888 zs->zss_type = ZSST_CTLDEV;
5879 5889 zfs_onexit_init((zfs_onexit_t **)&zs->zss_data);
5880 5890
5881 5891 return (0);
5882 5892 }
5883 5893
5884 5894 static void
5885 5895 zfs_ctldev_destroy(zfs_onexit_t *zo, minor_t minor)
5886 5896 {
5887 5897 ASSERT(MUTEX_HELD(&zfsdev_state_lock));
5888 5898
5889 5899 zfs_onexit_destroy(zo);
5890 5900 ddi_soft_state_free(zfsdev_state, minor);
5891 5901 }
5892 5902
5893 5903 void *
5894 5904 zfsdev_get_soft_state(minor_t minor, enum zfs_soft_state_type which)
5895 5905 {
5896 5906 zfs_soft_state_t *zp;
5897 5907
5898 5908 zp = ddi_get_soft_state(zfsdev_state, minor);
5899 5909 if (zp == NULL || zp->zss_type != which)
5900 5910 return (NULL);
5901 5911
5902 5912 return (zp->zss_data);
5903 5913 }
5904 5914
5905 5915 static int
5906 5916 zfsdev_open(dev_t *devp, int flag, int otyp, cred_t *cr)
5907 5917 {
5908 5918 int error = 0;
5909 5919
5910 5920 if (getminor(*devp) != 0)
5911 5921 return (zvol_open(devp, flag, otyp, cr));
5912 5922
5913 5923 /* This is the control device. Allocate a new minor if requested. */
5914 5924 if (flag & FEXCL) {
5915 5925 mutex_enter(&zfsdev_state_lock);
5916 5926 error = zfs_ctldev_init(devp);
5917 5927 mutex_exit(&zfsdev_state_lock);
5918 5928 }
5919 5929
5920 5930 return (error);
5921 5931 }
5922 5932
5923 5933 static int
5924 5934 zfsdev_close(dev_t dev, int flag, int otyp, cred_t *cr)
5925 5935 {
5926 5936 zfs_onexit_t *zo;
5927 5937 minor_t minor = getminor(dev);
5928 5938
5929 5939 if (minor == 0)
5930 5940 return (0);
5931 5941
5932 5942 mutex_enter(&zfsdev_state_lock);
5933 5943 zo = zfsdev_get_soft_state(minor, ZSST_CTLDEV);
5934 5944 if (zo == NULL) {
5935 5945 mutex_exit(&zfsdev_state_lock);
5936 5946 return (zvol_close(dev, flag, otyp, cr));
5937 5947 }
5938 5948 zfs_ctldev_destroy(zo, minor);
5939 5949 mutex_exit(&zfsdev_state_lock);
5940 5950
5941 5951 return (0);
5942 5952 }
5943 5953
5944 5954 static int
5945 5955 zfsdev_ioctl(dev_t dev, int cmd, intptr_t arg, int flag, cred_t *cr, int *rvalp)
5946 5956 {
5947 5957 zfs_cmd_t *zc;
5948 5958 uint_t vecnum;
5949 5959 int error, rc, len;
5950 5960 minor_t minor = getminor(dev);
5951 5961 const zfs_ioc_vec_t *vec;
5952 5962 char *saved_poolname = NULL;
5953 5963 nvlist_t *innvl = NULL;
5954 5964
5955 5965 if (minor != 0 &&
5956 5966 zfsdev_get_soft_state(minor, ZSST_CTLDEV) == NULL)
5957 5967 return (zvol_ioctl(dev, cmd, arg, flag, cr, rvalp));
5958 5968
5959 5969 vecnum = cmd - ZFS_IOC_FIRST;
5960 5970 ASSERT3U(getmajor(dev), ==, ddi_driver_major(zfs_dip));
5961 5971
5962 5972 if (vecnum >= sizeof (zfs_ioc_vec) / sizeof (zfs_ioc_vec[0]))
5963 5973 return (SET_ERROR(EINVAL));
5964 5974 vec = &zfs_ioc_vec[vecnum];
5965 5975
5966 5976 zc = kmem_zalloc(sizeof (zfs_cmd_t), KM_SLEEP);
5967 5977
5968 5978 error = ddi_copyin((void *)arg, zc, sizeof (zfs_cmd_t), flag);
5969 5979 if (error != 0) {
5970 5980 error = SET_ERROR(EFAULT);
5971 5981 goto out;
5972 5982 }
5973 5983
5974 5984 zc->zc_iflags = flag & FKIOCTL;
5975 5985 if (zc->zc_nvlist_src_size != 0) {
5976 5986 error = get_nvlist(zc->zc_nvlist_src, zc->zc_nvlist_src_size,
5977 5987 zc->zc_iflags, &innvl);
5978 5988 if (error != 0)
5979 5989 goto out;
5980 5990 }
5981 5991
5982 5992 /*
5983 5993 * Ensure that all pool/dataset names are valid before we pass down to
5984 5994 * the lower layers.
5985 5995 */
5986 5996 zc->zc_name[sizeof (zc->zc_name) - 1] = '\0';
5987 5997 switch (vec->zvec_namecheck) {
5988 5998 case POOL_NAME:
5989 5999 if (pool_namecheck(zc->zc_name, NULL, NULL) != 0)
5990 6000 error = SET_ERROR(EINVAL);
5991 6001 else
5992 6002 error = pool_status_check(zc->zc_name,
5993 6003 vec->zvec_namecheck, vec->zvec_pool_check);
5994 6004 break;
5995 6005
5996 6006 case DATASET_NAME:
5997 6007 if (dataset_namecheck(zc->zc_name, NULL, NULL) != 0)
5998 6008 error = SET_ERROR(EINVAL);
5999 6009 else
6000 6010 error = pool_status_check(zc->zc_name,
6001 6011 vec->zvec_namecheck, vec->zvec_pool_check);
6002 6012 break;
6003 6013
6004 6014 case NO_NAME:
6005 6015 break;
6006 6016 }
6007 6017
6008 6018
6009 6019 if (error == 0 && !(flag & FKIOCTL))
6010 6020 error = vec->zvec_secpolicy(zc, innvl, cr);
6011 6021
6012 6022 if (error != 0)
6013 6023 goto out;
6014 6024
6015 6025 /* legacy ioctls can modify zc_name */
6016 6026 len = strcspn(zc->zc_name, "/@#") + 1;
6017 6027 saved_poolname = kmem_alloc(len, KM_SLEEP);
6018 6028 (void) strlcpy(saved_poolname, zc->zc_name, len);
6019 6029
6020 6030 if (vec->zvec_func != NULL) {
6021 6031 nvlist_t *outnvl;
6022 6032 int puterror = 0;
6023 6033 spa_t *spa;
6024 6034 nvlist_t *lognv = NULL;
6025 6035
6026 6036 ASSERT(vec->zvec_legacy_func == NULL);
6027 6037
6028 6038 /*
6029 6039 * Add the innvl to the lognv before calling the func,
6030 6040 * in case the func changes the innvl.
6031 6041 */
6032 6042 if (vec->zvec_allow_log) {
6033 6043 lognv = fnvlist_alloc();
6034 6044 fnvlist_add_string(lognv, ZPOOL_HIST_IOCTL,
6035 6045 vec->zvec_name);
6036 6046 if (!nvlist_empty(innvl)) {
6037 6047 fnvlist_add_nvlist(lognv, ZPOOL_HIST_INPUT_NVL,
6038 6048 innvl);
6039 6049 }
6040 6050 }
6041 6051
6042 6052 outnvl = fnvlist_alloc();
6043 6053 error = vec->zvec_func(zc->zc_name, innvl, outnvl);
6044 6054
6045 6055 if (error == 0 && vec->zvec_allow_log &&
6046 6056 spa_open(zc->zc_name, &spa, FTAG) == 0) {
6047 6057 if (!nvlist_empty(outnvl)) {
6048 6058 fnvlist_add_nvlist(lognv, ZPOOL_HIST_OUTPUT_NVL,
6049 6059 outnvl);
6050 6060 }
6051 6061 (void) spa_history_log_nvl(spa, lognv);
6052 6062 spa_close(spa, FTAG);
6053 6063 }
6054 6064 fnvlist_free(lognv);
6055 6065
6056 6066 if (!nvlist_empty(outnvl) || zc->zc_nvlist_dst_size != 0) {
6057 6067 int smusherror = 0;
6058 6068 if (vec->zvec_smush_outnvlist) {
6059 6069 smusherror = nvlist_smush(outnvl,
6060 6070 zc->zc_nvlist_dst_size);
6061 6071 }
6062 6072 if (smusherror == 0)
6063 6073 puterror = put_nvlist(zc, outnvl);
6064 6074 }
6065 6075
6066 6076 if (puterror != 0)
6067 6077 error = puterror;
6068 6078
6069 6079 nvlist_free(outnvl);
6070 6080 } else {
6071 6081 error = vec->zvec_legacy_func(zc);
6072 6082 }
6073 6083
6074 6084 out:
6075 6085 nvlist_free(innvl);
6076 6086 rc = ddi_copyout(zc, (void *)arg, sizeof (zfs_cmd_t), flag);
6077 6087 if (error == 0 && rc != 0)
6078 6088 error = SET_ERROR(EFAULT);
6079 6089 if (error == 0 && vec->zvec_allow_log) {
6080 6090 char *s = tsd_get(zfs_allow_log_key);
6081 6091 if (s != NULL)
6082 6092 strfree(s);
6083 6093 (void) tsd_set(zfs_allow_log_key, saved_poolname);
6084 6094 } else {
6085 6095 if (saved_poolname != NULL)
6086 6096 strfree(saved_poolname);
6087 6097 }
6088 6098
6089 6099 kmem_free(zc, sizeof (zfs_cmd_t));
6090 6100 return (error);
6091 6101 }
6092 6102
6093 6103 static int
6094 6104 zfs_attach(dev_info_t *dip, ddi_attach_cmd_t cmd)
6095 6105 {
6096 6106 if (cmd != DDI_ATTACH)
6097 6107 return (DDI_FAILURE);
6098 6108
6099 6109 if (ddi_create_minor_node(dip, "zfs", S_IFCHR, 0,
6100 6110 DDI_PSEUDO, 0) == DDI_FAILURE)
6101 6111 return (DDI_FAILURE);
6102 6112
6103 6113 zfs_dip = dip;
6104 6114
6105 6115 ddi_report_dev(dip);
6106 6116
6107 6117 return (DDI_SUCCESS);
6108 6118 }
6109 6119
6110 6120 static int
6111 6121 zfs_detach(dev_info_t *dip, ddi_detach_cmd_t cmd)
6112 6122 {
6113 6123 if (spa_busy() || zfs_busy() || zvol_busy())
6114 6124 return (DDI_FAILURE);
6115 6125
6116 6126 if (cmd != DDI_DETACH)
6117 6127 return (DDI_FAILURE);
6118 6128
6119 6129 zfs_dip = NULL;
6120 6130
6121 6131 ddi_prop_remove_all(dip);
6122 6132 ddi_remove_minor_node(dip, NULL);
6123 6133
6124 6134 return (DDI_SUCCESS);
6125 6135 }
6126 6136
6127 6137 /*ARGSUSED*/
6128 6138 static int
6129 6139 zfs_info(dev_info_t *dip, ddi_info_cmd_t infocmd, void *arg, void **result)
6130 6140 {
6131 6141 switch (infocmd) {
6132 6142 case DDI_INFO_DEVT2DEVINFO:
6133 6143 *result = zfs_dip;
6134 6144 return (DDI_SUCCESS);
6135 6145
6136 6146 case DDI_INFO_DEVT2INSTANCE:
6137 6147 *result = (void *)0;
6138 6148 return (DDI_SUCCESS);
6139 6149 }
6140 6150
6141 6151 return (DDI_FAILURE);
6142 6152 }
6143 6153
6144 6154 /*
6145 6155 * OK, so this is a little weird.
6146 6156 *
6147 6157 * /dev/zfs is the control node, i.e. minor 0.
6148 6158 * /dev/zvol/[r]dsk/pool/dataset are the zvols, minor > 0.
6149 6159 *
6150 6160 * /dev/zfs has basically nothing to do except serve up ioctls,
6151 6161 * so most of the standard driver entry points are in zvol.c.
6152 6162 */
6153 6163 static struct cb_ops zfs_cb_ops = {
6154 6164 zfsdev_open, /* open */
6155 6165 zfsdev_close, /* close */
6156 6166 zvol_strategy, /* strategy */
6157 6167 nodev, /* print */
6158 6168 zvol_dump, /* dump */
6159 6169 zvol_read, /* read */
6160 6170 zvol_write, /* write */
6161 6171 zfsdev_ioctl, /* ioctl */
6162 6172 nodev, /* devmap */
6163 6173 nodev, /* mmap */
6164 6174 nodev, /* segmap */
6165 6175 nochpoll, /* poll */
6166 6176 ddi_prop_op, /* prop_op */
6167 6177 NULL, /* streamtab */
6168 6178 D_NEW | D_MP | D_64BIT, /* Driver compatibility flag */
6169 6179 CB_REV, /* version */
6170 6180 nodev, /* async read */
6171 6181 nodev, /* async write */
6172 6182 };
6173 6183
6174 6184 static struct dev_ops zfs_dev_ops = {
6175 6185 DEVO_REV, /* version */
6176 6186 0, /* refcnt */
6177 6187 zfs_info, /* info */
6178 6188 nulldev, /* identify */
6179 6189 nulldev, /* probe */
6180 6190 zfs_attach, /* attach */
6181 6191 zfs_detach, /* detach */
6182 6192 nodev, /* reset */
6183 6193 &zfs_cb_ops, /* driver operations */
6184 6194 NULL, /* no bus operations */
6185 6195 NULL, /* power */
6186 6196 ddi_quiesce_not_needed, /* quiesce */
6187 6197 };
6188 6198
6189 6199 static struct modldrv zfs_modldrv = {
6190 6200 &mod_driverops,
6191 6201 "ZFS storage pool",
6192 6202 &zfs_dev_ops
6193 6203 };
6194 6204
6195 6205 static struct modlinkage modlinkage = {
6196 6206 MODREV_1,
6197 6207 (void *)&zfs_modlfs,
6198 6208 (void *)&zfs_modldrv,
6199 6209 NULL
6200 6210 };
6201 6211
6202 6212 static void
6203 6213 zfs_allow_log_destroy(void *arg)
6204 6214 {
6205 6215 char *poolname = arg;
6206 6216 strfree(poolname);
6207 6217 }
6208 6218
6209 6219 int
6210 6220 _init(void)
6211 6221 {
6212 6222 int error;
6213 6223
6214 6224 spa_init(FREAD | FWRITE);
6215 6225 zfs_init();
6216 6226 zvol_init();
6217 6227 zfs_ioctl_init();
6218 6228
6219 6229 if ((error = mod_install(&modlinkage)) != 0) {
6220 6230 zvol_fini();
6221 6231 zfs_fini();
6222 6232 spa_fini();
6223 6233 return (error);
6224 6234 }
6225 6235
6226 6236 tsd_create(&zfs_fsyncer_key, NULL);
6227 6237 tsd_create(&rrw_tsd_key, rrw_tsd_destroy);
6228 6238 tsd_create(&zfs_allow_log_key, zfs_allow_log_destroy);
6229 6239
6230 6240 error = ldi_ident_from_mod(&modlinkage, &zfs_li);
6231 6241 ASSERT(error == 0);
6232 6242 mutex_init(&zfs_share_lock, NULL, MUTEX_DEFAULT, NULL);
6233 6243
6234 6244 return (0);
6235 6245 }
6236 6246
6237 6247 int
6238 6248 _fini(void)
6239 6249 {
6240 6250 int error;
6241 6251
6242 6252 if (spa_busy() || zfs_busy() || zvol_busy() || zio_injection_enabled)
6243 6253 return (SET_ERROR(EBUSY));
6244 6254
6245 6255 if ((error = mod_remove(&modlinkage)) != 0)
6246 6256 return (error);
6247 6257
6248 6258 zvol_fini();
6249 6259 zfs_fini();
6250 6260 spa_fini();
6251 6261 if (zfs_nfsshare_inited)
6252 6262 (void) ddi_modclose(nfs_mod);
6253 6263 if (zfs_smbshare_inited)
6254 6264 (void) ddi_modclose(smbsrv_mod);
6255 6265 if (zfs_nfsshare_inited || zfs_smbshare_inited)
6256 6266 (void) ddi_modclose(sharefs_mod);
6257 6267
6258 6268 tsd_destroy(&zfs_fsyncer_key);
6259 6269 ldi_ident_release(zfs_li);
6260 6270 zfs_li = NULL;
6261 6271 mutex_destroy(&zfs_share_lock);
6262 6272
6263 6273 return (error);
6264 6274 }
6265 6275
6266 6276 int
6267 6277 _info(struct modinfo *modinfop)
6268 6278 {
6269 6279 return (mod_info(&modlinkage, modinfop));
6270 6280 }
|
↓ open down ↓ |
1958 lines elided |
↑ open up ↑ |
XXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXX