Merge commit 'dc97a43d4a70c8773a619f11b95b07a787f6f5b7' into merges
[unleashed.git] / kernel / fs / zfs / zcp.c
blob04c3d309f6bc8a2f4b890cb649ebbbf3b7c35851
1 /*
2 * CDDL HEADER START
4 * This file and its contents are supplied under the terms of the
5 * Common Development and Distribution License ("CDDL"), version 1.0.
6 * You may only use this file in accordance with the terms of version
7 * 1.0 of the CDDL.
9 * A full copy of the text of the CDDL should have accompanied this
10 * source. A copy of the CDDL is also available via the Internet at
11 * http://www.illumos.org/license/CDDL.
13 * CDDL HEADER END
17 * Copyright (c) 2016 by Delphix. All rights reserved.
21 * ZFS Channel Programs (ZCP)
23 * The ZCP interface allows various ZFS commands and administrative
24 * operations (e.g. creating and destroying snapshots, typically
25 * performed via an ioctl to /dev/zfs by the zfs(8) command and
26 * libzfs/libzfs_core) to be run programmatically as a Lua script. A ZCP
27 * script is run as a dsl_sync_task and fully executed during one transaction
28 * group sync. This ensures that no other changes can be written concurrently
29 * with a running Lua script. Combining multiple calls to the exposed ZFS
30 * functions into one script gives a number of benefits:
32 * 1. Atomicity. For some compound or iterative operations, it's useful to be
33 * able to guarantee that the state of a pool has not changed between calls to
34 * ZFS.
36 * 2. Performance. If a large number of changes need to be made (e.g. deleting
37 * many filesystems), there can be a significant performance penalty as a
38 * result of the need to wait for a transaction group sync to pass for every
39 * single operation. When expressed as a single ZCP script, all these changes
40 * can be performed at once in one txg sync.
42 * A modified version of the Lua 5.2 interpreter is used to run channel program
43 * scripts. The Lua 5.2 manual can be found at:
45 * http://www.lua.org/manual/5.2/
47 * If being run by a user (via an ioctl syscall), executing a ZCP script
48 * requires root privileges in the global zone.
50 * Scripts are passed to zcp_eval() as a string, then run in a synctask by
51 * zcp_eval_sync(). Arguments can be passed into the Lua script as an nvlist,
52 * which will be converted to a Lua table. Similarly, values returned from
53 * a ZCP script will be converted to an nvlist. See zcp_lua_to_nvlist_impl()
54 * for details on exact allowed types and conversion.
56 * ZFS functionality is exposed to a ZCP script as a library of function calls.
57 * These calls are sorted into submodules, such as zfs.list and zfs.sync, for
58 * iterators and synctasks, respectively. Each of these submodules resides in
59 * its own source file, with a zcp_*_info structure describing each library
60 * call in the submodule.
62 * Error handling in ZCP scripts is handled by a number of different methods
63 * based on severity:
65 * 1. Memory and time limits are in place to prevent a channel program from
66 * consuming excessive system resources or running forever. If one of these
67 * limits is hit, the channel program will be stopped immediately and return
68 * from zcp_eval() with an error code. No attempt will be made to roll back
69 * or undo any changes made by the channel program before the error occurred.
70 * Consumers invoking zcp_eval() from elsewhere in the kernel may pass a time
71 * limit of 0, disabling the time limit.
73 * 2. Internal Lua errors can occur as a result of a syntax error, calling a
74 * library function with incorrect arguments, invoking the error() function,
75 * failing an assert(), or other runtime errors. In these cases the channel
76 * program will stop executing and return from zcp_eval() with an error code.
77 * In place of a return value, an error message will also be returned in the
78 * 'result' nvlist containing information about the error. No attempt will be
79 * made to roll back or undo any changes made by the channel program before the
80 * error occurred.
82 * 3. If an error occurs inside a ZFS library call which returns an error code,
83 * the error is returned to the Lua script to be handled as desired.
85 * In the first two cases, Lua's error-throwing mechanism is used, which
86 * longjumps out of the script execution with luaL_error() and returns with the
87 * error.
89 * See zfs-program(8) for more information on high level usage.
92 #include "lua.h"
93 #include "lualib.h"
94 #include "lauxlib.h"
96 #include <sys/dsl_prop.h>
97 #include <sys/dsl_synctask.h>
98 #include <sys/dsl_dataset.h>
99 #include <sys/zcp.h>
100 #include <sys/zcp_iter.h>
101 #include <sys/zcp_prop.h>
102 #include <sys/zcp_global.h>
103 #include <util/sscanf.h>
105 uint64_t zfs_lua_check_instrlimit_interval = 100;
106 uint64_t zfs_lua_max_instrlimit = ZCP_MAX_INSTRLIMIT;
107 uint64_t zfs_lua_max_memlimit = ZCP_MAX_MEMLIMIT;
109 static int zcp_nvpair_value_to_lua(lua_State *, nvpair_t *, char *, int);
110 static int zcp_lua_to_nvlist_impl(lua_State *, int, nvlist_t *, const char *,
111 int);
113 typedef struct zcp_alloc_arg {
114 boolean_t aa_must_succeed;
115 int64_t aa_alloc_remaining;
116 int64_t aa_alloc_limit;
117 } zcp_alloc_arg_t;
119 typedef struct zcp_eval_arg {
120 lua_State *ea_state;
121 zcp_alloc_arg_t *ea_allocargs;
122 cred_t *ea_cred;
123 nvlist_t *ea_outnvl;
124 int ea_result;
125 uint64_t ea_instrlimit;
126 } zcp_eval_arg_t;
128 /*ARGSUSED*/
129 static int
130 zcp_eval_check(void *arg, dmu_tx_t *tx)
132 return (0);
136 * The outer-most error callback handler for use with lua_pcall(). On
137 * error Lua will call this callback with a single argument that
138 * represents the error value. In most cases this will be a string
139 * containing an error message, but channel programs can use Lua's
140 * error() function to return arbitrary objects as errors. This callback
141 * returns (on the Lua stack) the original error object along with a traceback.
143 * Fatal Lua errors can occur while resources are held, so we also call any
144 * registered cleanup function here.
146 static int
147 zcp_error_handler(lua_State *state)
149 const char *msg;
151 zcp_cleanup(state);
153 VERIFY3U(1, ==, lua_gettop(state));
154 msg = lua_tostring(state, 1);
155 luaL_traceback(state, state, msg, 1);
156 return (1);
160 zcp_argerror(lua_State *state, int narg, const char *msg, ...)
162 va_list alist;
164 va_start(alist, msg);
165 const char *buf = lua_pushvfstring(state, msg, alist);
166 va_end(alist);
168 return (luaL_argerror(state, narg, buf));
172 * Install a new cleanup function, which will be invoked with the given
173 * opaque argument if a fatal error causes the Lua interpreter to longjump out
174 * of a function call.
176 * If an error occurs, the cleanup function will be invoked exactly once and
177 * then unreigstered.
179 void
180 zcp_register_cleanup(lua_State *state, zcp_cleanup_t cleanfunc, void *cleanarg)
182 zcp_run_info_t *ri = zcp_run_info(state);
184 * A cleanup function should always be explicitly removed before
185 * installing a new one to avoid accidental clobbering.
187 ASSERT3P(ri->zri_cleanup, ==, NULL);
189 ri->zri_cleanup = cleanfunc;
190 ri->zri_cleanup_arg = cleanarg;
193 void
194 zcp_clear_cleanup(lua_State *state)
196 zcp_run_info_t *ri = zcp_run_info(state);
198 ri->zri_cleanup = NULL;
199 ri->zri_cleanup_arg = NULL;
203 * If it exists, execute the currently set cleanup function then unregister it.
205 void
206 zcp_cleanup(lua_State *state)
208 zcp_run_info_t *ri = zcp_run_info(state);
210 if (ri->zri_cleanup != NULL) {
211 ri->zri_cleanup(ri->zri_cleanup_arg);
212 zcp_clear_cleanup(state);
216 #define ZCP_NVLIST_MAX_DEPTH 20
219 * Convert the lua table at the given index on the Lua stack to an nvlist
220 * and return it.
222 * If the table can not be converted for any reason, NULL is returned and
223 * an error message is pushed onto the Lua stack.
225 static nvlist_t *
226 zcp_table_to_nvlist(lua_State *state, int index, int depth)
228 nvlist_t *nvl;
230 * Converting a Lua table to an nvlist with key uniqueness checking is
231 * O(n^2) in the number of keys in the nvlist, which can take a long
232 * time when we return a large table from a channel program.
233 * Furthermore, Lua's table interface *almost* guarantees unique keys
234 * on its own (details below). Therefore, we don't use fnvlist_alloc()
235 * here to avoid the built-in uniqueness checking.
237 * The *almost* is because it's possible to have key collisions between
238 * e.g. the string "1" and the number 1, or the string "true" and the
239 * boolean true, so we explicitly check that when we're looking at a
240 * key which is an integer / boolean or a string that can be parsed as
241 * one of those types. In the worst case this could still devolve into
242 * O(n^2), so we only start doing these checks on boolean/integer keys
243 * once we've seen a string key which fits this weird usage pattern.
245 * Ultimately, we still want callers to know that the keys in this
246 * nvlist are unique, so before we return this we set the nvlist's
247 * flags to reflect that.
249 VERIFY0(nvlist_alloc(&nvl, 0, KM_SLEEP));
252 * Push an empty stack slot where lua_next() will store each
253 * table key.
255 lua_pushnil(state);
256 boolean_t saw_str_could_collide = B_FALSE;
257 while (lua_next(state, index) != 0) {
259 * The next key-value pair from the table at index is
260 * now on the stack, with the key at stack slot -2 and
261 * the value at slot -1.
263 int err = 0;
264 char buf[32];
265 const char *key = NULL;
266 boolean_t key_could_collide = B_FALSE;
268 switch (lua_type(state, -2)) {
269 case LUA_TSTRING:
270 key = lua_tostring(state, -2);
272 /* check if this could collide with a number or bool */
273 long long tmp;
274 int parselen;
275 if ((sscanf(key, "%lld%n", &tmp, &parselen) > 0 &&
276 parselen == strlen(key)) ||
277 strcmp(key, "true") == 0 ||
278 strcmp(key, "false") == 0) {
279 key_could_collide = B_TRUE;
280 saw_str_could_collide = B_TRUE;
282 break;
283 case LUA_TBOOLEAN:
284 key = (lua_toboolean(state, -2) == B_TRUE ?
285 "true" : "false");
286 if (saw_str_could_collide) {
287 key_could_collide = B_TRUE;
289 break;
290 case LUA_TNUMBER:
291 VERIFY3U(sizeof (buf), >,
292 snprintf(buf, sizeof (buf), "%lld",
293 (longlong_t)lua_tonumber(state, -2)));
294 key = buf;
295 if (saw_str_could_collide) {
296 key_could_collide = B_TRUE;
298 break;
299 default:
300 fnvlist_free(nvl);
301 (void) lua_pushfstring(state, "Invalid key "
302 "type '%s' in table",
303 lua_typename(state, lua_type(state, -2)));
304 return (NULL);
307 * Check for type-mismatched key collisions, and throw an error.
309 if (key_could_collide && nvlist_exists(nvl, key)) {
310 fnvlist_free(nvl);
311 (void) lua_pushfstring(state, "Collision of "
312 "key '%s' in table", key);
313 return (NULL);
316 * Recursively convert the table value and insert into
317 * the new nvlist with the parsed key. To prevent
318 * stack overflow on circular or heavily nested tables,
319 * we track the current nvlist depth.
321 if (depth >= ZCP_NVLIST_MAX_DEPTH) {
322 fnvlist_free(nvl);
323 (void) lua_pushfstring(state, "Maximum table "
324 "depth (%d) exceeded for table",
325 ZCP_NVLIST_MAX_DEPTH);
326 return (NULL);
328 err = zcp_lua_to_nvlist_impl(state, -1, nvl, key,
329 depth + 1);
330 if (err != 0) {
331 fnvlist_free(nvl);
333 * Error message has been pushed to the lua
334 * stack by the recursive call.
336 return (NULL);
339 * Pop the value pushed by lua_next().
341 lua_pop(state, 1);
345 * Mark the nvlist as having unique keys. This is a little ugly, but we
346 * ensured above that there are no duplicate keys in the nvlist.
348 nvl->nvl_nvflag |= NV_UNIQUE_NAME;
350 return (nvl);
354 * Convert a value from the given index into the lua stack to an nvpair, adding
355 * it to an nvlist with the given key.
357 * Values are converted as follows:
359 * string -> string
360 * number -> int64
361 * boolean -> boolean
362 * nil -> boolean (no value)
364 * Lua tables are converted to nvlists and then inserted. The table's keys
365 * are converted to strings then used as keys in the nvlist to store each table
366 * element. Keys are converted as follows:
368 * string -> no change
369 * number -> "%lld"
370 * boolean -> "true" | "false"
371 * nil -> error
373 * In the case of a key collision, an error is thrown.
375 * If an error is encountered, a nonzero error code is returned, and an error
376 * string will be pushed onto the Lua stack.
378 static int
379 zcp_lua_to_nvlist_impl(lua_State *state, int index, nvlist_t *nvl,
380 const char *key, int depth)
383 * Verify that we have enough remaining space in the lua stack to parse
384 * a key-value pair and push an error.
386 if (!lua_checkstack(state, 3)) {
387 (void) lua_pushstring(state, "Lua stack overflow");
388 return (1);
391 index = lua_absindex(state, index);
393 switch (lua_type(state, index)) {
394 case LUA_TNIL:
395 fnvlist_add_boolean(nvl, key);
396 break;
397 case LUA_TBOOLEAN:
398 fnvlist_add_boolean_value(nvl, key,
399 lua_toboolean(state, index));
400 break;
401 case LUA_TNUMBER:
402 fnvlist_add_int64(nvl, key, lua_tonumber(state, index));
403 break;
404 case LUA_TSTRING:
405 fnvlist_add_string(nvl, key, lua_tostring(state, index));
406 break;
407 case LUA_TTABLE: {
408 nvlist_t *value_nvl = zcp_table_to_nvlist(state, index, depth);
409 if (value_nvl == NULL)
410 return (EINVAL);
412 fnvlist_add_nvlist(nvl, key, value_nvl);
413 fnvlist_free(value_nvl);
414 break;
416 default:
417 (void) lua_pushfstring(state,
418 "Invalid value type '%s' for key '%s'",
419 lua_typename(state, lua_type(state, index)), key);
420 return (EINVAL);
423 return (0);
427 * Convert a lua value to an nvpair, adding it to an nvlist with the given key.
429 void
430 zcp_lua_to_nvlist(lua_State *state, int index, nvlist_t *nvl, const char *key)
433 * On error, zcp_lua_to_nvlist_impl pushes an error string onto the Lua
434 * stack before returning with a nonzero error code. If an error is
435 * returned, throw a fatal lua error with the given string.
437 if (zcp_lua_to_nvlist_impl(state, index, nvl, key, 0) != 0)
438 (void) lua_error(state);
442 zcp_lua_to_nvlist_helper(lua_State *state)
444 nvlist_t *nv = (nvlist_t *)lua_touserdata(state, 2);
445 const char *key = (const char *)lua_touserdata(state, 1);
446 zcp_lua_to_nvlist(state, 3, nv, key);
447 return (0);
450 void
451 zcp_convert_return_values(lua_State *state, nvlist_t *nvl,
452 const char *key, zcp_eval_arg_t *evalargs)
454 int err;
455 lua_pushcfunction(state, zcp_lua_to_nvlist_helper);
456 lua_pushlightuserdata(state, (char *)key);
457 lua_pushlightuserdata(state, nvl);
458 lua_pushvalue(state, 1);
459 lua_remove(state, 1);
460 err = lua_pcall(state, 3, 0, 0); /* zcp_lua_to_nvlist_helper */
461 if (err != 0) {
462 zcp_lua_to_nvlist(state, 1, nvl, ZCP_RET_ERROR);
463 evalargs->ea_result = SET_ERROR(ECHRNG);
468 * Push a Lua table representing nvl onto the stack. If it can't be
469 * converted, return EINVAL, fill in errbuf, and push nothing. errbuf may
470 * be specified as NULL, in which case no error string will be output.
472 * Most nvlists are converted as simple key->value Lua tables, but we make
473 * an exception for the case where all nvlist entries are BOOLEANs (a string
474 * key without a value). In Lua, a table key pointing to a value of Nil
475 * (no value) is equivalent to the key not existing, so a BOOLEAN nvlist
476 * entry can't be directly converted to a Lua table entry. Nvlists of entirely
477 * BOOLEAN entries are frequently used to pass around lists of datasets, so for
478 * convenience we check for this case, and convert it to a simple Lua array of
479 * strings.
482 zcp_nvlist_to_lua(lua_State *state, nvlist_t *nvl,
483 char *errbuf, int errbuf_len)
485 nvpair_t *pair;
486 lua_newtable(state);
487 boolean_t has_values = B_FALSE;
489 * If the list doesn't have any values, just convert it to a string
490 * array.
492 for (pair = nvlist_next_nvpair(nvl, NULL);
493 pair != NULL; pair = nvlist_next_nvpair(nvl, pair)) {
494 if (nvpair_type(pair) != DATA_TYPE_BOOLEAN) {
495 has_values = B_TRUE;
496 break;
499 if (!has_values) {
500 int i = 1;
501 for (pair = nvlist_next_nvpair(nvl, NULL);
502 pair != NULL; pair = nvlist_next_nvpair(nvl, pair)) {
503 (void) lua_pushinteger(state, i);
504 (void) lua_pushstring(state, nvpair_name(pair));
505 (void) lua_settable(state, -3);
506 i++;
508 } else {
509 for (pair = nvlist_next_nvpair(nvl, NULL);
510 pair != NULL; pair = nvlist_next_nvpair(nvl, pair)) {
511 int err = zcp_nvpair_value_to_lua(state, pair,
512 errbuf, errbuf_len);
513 if (err != 0) {
514 lua_pop(state, 1);
515 return (err);
517 (void) lua_setfield(state, -2, nvpair_name(pair));
520 return (0);
524 * Push a Lua object representing the value of "pair" onto the stack.
526 * Only understands boolean_value, string, int64, nvlist,
527 * string_array, and int64_array type values. For other
528 * types, returns EINVAL, fills in errbuf, and pushes nothing.
530 static int
531 zcp_nvpair_value_to_lua(lua_State *state, nvpair_t *pair,
532 char *errbuf, int errbuf_len)
534 int err = 0;
536 if (pair == NULL) {
537 lua_pushnil(state);
538 return (0);
541 switch (nvpair_type(pair)) {
542 case DATA_TYPE_BOOLEAN_VALUE:
543 (void) lua_pushboolean(state,
544 fnvpair_value_boolean_value(pair));
545 break;
546 case DATA_TYPE_STRING:
547 (void) lua_pushstring(state, fnvpair_value_string(pair));
548 break;
549 case DATA_TYPE_INT64:
550 (void) lua_pushinteger(state, fnvpair_value_int64(pair));
551 break;
552 case DATA_TYPE_NVLIST:
553 err = zcp_nvlist_to_lua(state,
554 fnvpair_value_nvlist(pair), errbuf, errbuf_len);
555 break;
556 case DATA_TYPE_STRING_ARRAY: {
557 char **strarr;
558 uint_t nelem;
559 (void) nvpair_value_string_array(pair, &strarr, &nelem);
560 lua_newtable(state);
561 for (int i = 0; i < nelem; i++) {
562 (void) lua_pushinteger(state, i + 1);
563 (void) lua_pushstring(state, strarr[i]);
564 (void) lua_settable(state, -3);
566 break;
568 case DATA_TYPE_UINT64_ARRAY: {
569 uint64_t *intarr;
570 uint_t nelem;
571 (void) nvpair_value_uint64_array(pair, &intarr, &nelem);
572 lua_newtable(state);
573 for (int i = 0; i < nelem; i++) {
574 (void) lua_pushinteger(state, i + 1);
575 (void) lua_pushinteger(state, intarr[i]);
576 (void) lua_settable(state, -3);
578 break;
580 case DATA_TYPE_INT64_ARRAY: {
581 int64_t *intarr;
582 uint_t nelem;
583 (void) nvpair_value_int64_array(pair, &intarr, &nelem);
584 lua_newtable(state);
585 for (int i = 0; i < nelem; i++) {
586 (void) lua_pushinteger(state, i + 1);
587 (void) lua_pushinteger(state, intarr[i]);
588 (void) lua_settable(state, -3);
590 break;
592 default: {
593 if (errbuf != NULL) {
594 (void) snprintf(errbuf, errbuf_len,
595 "Unhandled nvpair type %d for key '%s'",
596 nvpair_type(pair), nvpair_name(pair));
598 return (EINVAL);
601 return (err);
605 zcp_dataset_hold_error(lua_State *state, dsl_pool_t *dp, const char *dsname,
606 int error)
608 if (error == ENOENT) {
609 (void) zcp_argerror(state, 1, "no such dataset '%s'", dsname);
610 return (0); /* not reached; zcp_argerror will longjmp */
611 } else if (error == EXDEV) {
612 (void) zcp_argerror(state, 1,
613 "dataset '%s' is not in the target pool '%s'",
614 dsname, spa_name(dp->dp_spa));
615 return (0); /* not reached; zcp_argerror will longjmp */
616 } else if (error == EIO) {
617 (void) luaL_error(state,
618 "I/O error while accessing dataset '%s'", dsname);
619 return (0); /* not reached; luaL_error will longjmp */
620 } else if (error != 0) {
621 (void) luaL_error(state,
622 "unexpected error %d while accessing dataset '%s'",
623 error, dsname);
624 return (0); /* not reached; luaL_error will longjmp */
626 return (0);
630 * Note: will longjmp (via lua_error()) on error.
631 * Assumes that the dsname is argument #1 (for error reporting purposes).
633 dsl_dataset_t *
634 zcp_dataset_hold(lua_State *state, dsl_pool_t *dp, const char *dsname,
635 void *tag)
637 dsl_dataset_t *ds;
638 int error = dsl_dataset_hold(dp, dsname, tag, &ds);
639 (void) zcp_dataset_hold_error(state, dp, dsname, error);
640 return (ds);
643 static int zcp_debug(lua_State *);
644 static zcp_lib_info_t zcp_debug_info = {
645 .name = "debug",
646 .func = zcp_debug,
647 .pargs = {
648 { .za_name = "debug string", .za_lua_type = LUA_TSTRING},
649 {NULL, 0}
651 .kwargs = {
652 {NULL, 0}
656 static int
657 zcp_debug(lua_State *state)
659 const char *dbgstring;
660 zcp_run_info_t *ri = zcp_run_info(state);
661 zcp_lib_info_t *libinfo = &zcp_debug_info;
663 zcp_parse_args(state, libinfo->name, libinfo->pargs, libinfo->kwargs);
665 dbgstring = lua_tostring(state, 1);
667 zfs_dbgmsg("txg %lld ZCP: %s", ri->zri_tx->tx_txg, dbgstring);
669 return (0);
672 static int zcp_exists(lua_State *);
673 static zcp_lib_info_t zcp_exists_info = {
674 .name = "exists",
675 .func = zcp_exists,
676 .pargs = {
677 { .za_name = "dataset", .za_lua_type = LUA_TSTRING},
678 {NULL, 0}
680 .kwargs = {
681 {NULL, 0}
685 static int
686 zcp_exists(lua_State *state)
688 zcp_run_info_t *ri = zcp_run_info(state);
689 dsl_pool_t *dp = ri->zri_pool;
690 zcp_lib_info_t *libinfo = &zcp_exists_info;
692 zcp_parse_args(state, libinfo->name, libinfo->pargs, libinfo->kwargs);
694 const char *dsname = lua_tostring(state, 1);
696 dsl_dataset_t *ds;
697 int error = dsl_dataset_hold(dp, dsname, FTAG, &ds);
698 if (error == 0) {
699 dsl_dataset_rele(ds, FTAG);
700 lua_pushboolean(state, B_TRUE);
701 } else if (error == ENOENT) {
702 lua_pushboolean(state, B_FALSE);
703 } else if (error == EXDEV) {
704 return (luaL_error(state, "dataset '%s' is not in the "
705 "target pool", dsname));
706 } else if (error == EIO) {
707 return (luaL_error(state, "I/O error opening dataset '%s'",
708 dsname));
709 } else if (error != 0) {
710 return (luaL_error(state, "unexpected error %d", error));
713 return (0);
717 * Allocate/realloc/free a buffer for the lua interpreter.
719 * When nsize is 0, behaves as free() and returns NULL.
721 * If ptr is NULL, behaves as malloc() and returns an allocated buffer of size
722 * at least nsize.
724 * Otherwise, behaves as realloc(), changing the allocation from osize to nsize.
725 * Shrinking the buffer size never fails.
727 * The original allocated buffer size is stored as a uint64 at the beginning of
728 * the buffer to avoid actually reallocating when shrinking a buffer, since lua
729 * requires that this operation never fail.
731 static void *
732 zcp_lua_alloc(void *ud, void *ptr, size_t osize, size_t nsize)
734 zcp_alloc_arg_t *allocargs = ud;
735 int flags = (allocargs->aa_must_succeed) ?
736 KM_SLEEP : (KM_NOSLEEP | KM_NORMALPRI);
738 if (nsize == 0) {
739 if (ptr != NULL) {
740 int64_t *allocbuf = (int64_t *)ptr - 1;
741 int64_t allocsize = *allocbuf;
742 ASSERT3S(allocsize, >, 0);
743 ASSERT3S(allocargs->aa_alloc_remaining + allocsize, <=,
744 allocargs->aa_alloc_limit);
745 allocargs->aa_alloc_remaining += allocsize;
746 kmem_free(allocbuf, allocsize);
748 return (NULL);
749 } else if (ptr == NULL) {
750 int64_t *allocbuf;
751 int64_t allocsize = nsize + sizeof (int64_t);
753 if (!allocargs->aa_must_succeed &&
754 (allocsize <= 0 ||
755 allocsize > allocargs->aa_alloc_remaining)) {
756 return (NULL);
759 allocbuf = kmem_alloc(allocsize, flags);
760 if (allocbuf == NULL) {
761 return (NULL);
763 allocargs->aa_alloc_remaining -= allocsize;
765 *allocbuf = allocsize;
766 return (allocbuf + 1);
767 } else if (nsize <= osize) {
769 * If shrinking the buffer, lua requires that the reallocation
770 * never fail.
772 return (ptr);
773 } else {
774 ASSERT3U(nsize, >, osize);
776 uint64_t *luabuf = zcp_lua_alloc(ud, NULL, 0, nsize);
777 if (luabuf == NULL) {
778 return (NULL);
780 (void) memcpy(luabuf, ptr, osize);
781 VERIFY3P(zcp_lua_alloc(ud, ptr, osize, 0), ==, NULL);
782 return (luabuf);
786 /* ARGSUSED */
787 static void
788 zcp_lua_counthook(lua_State *state, lua_Debug *ar)
791 * If we're called, check how many instructions the channel program has
792 * executed so far, and compare against the limit.
794 lua_getfield(state, LUA_REGISTRYINDEX, ZCP_RUN_INFO_KEY);
795 zcp_run_info_t *ri = lua_touserdata(state, -1);
797 ri->zri_curinstrs += zfs_lua_check_instrlimit_interval;
798 if (ri->zri_maxinstrs != 0 && ri->zri_curinstrs > ri->zri_maxinstrs) {
799 ri->zri_timed_out = B_TRUE;
800 (void) lua_pushstring(state,
801 "Channel program timed out.");
802 (void) lua_error(state);
806 static int
807 zcp_panic_cb(lua_State *state)
809 panic("unprotected error in call to Lua API (%s)\n",
810 lua_tostring(state, -1));
811 return (0);
814 static void
815 zcp_eval_sync(void *arg, dmu_tx_t *tx)
817 int err;
818 zcp_run_info_t ri;
819 zcp_eval_arg_t *evalargs = arg;
820 lua_State *state = evalargs->ea_state;
823 * Open context should have setup the stack to contain:
824 * 1: Error handler callback
825 * 2: Script to run (converted to a Lua function)
826 * 3: nvlist input to function (converted to Lua table or nil)
828 VERIFY3U(3, ==, lua_gettop(state));
831 * Store the zcp_run_info_t struct for this run in the Lua registry.
832 * Registry entries are not directly accessible by the Lua scripts but
833 * can be accessed by our callbacks.
835 ri.zri_space_used = 0;
836 ri.zri_pool = dmu_tx_pool(tx);
837 ri.zri_cred = evalargs->ea_cred;
838 ri.zri_tx = tx;
839 ri.zri_timed_out = B_FALSE;
840 ri.zri_cleanup = NULL;
841 ri.zri_cleanup_arg = NULL;
842 ri.zri_curinstrs = 0;
843 ri.zri_maxinstrs = evalargs->ea_instrlimit;
845 lua_pushlightuserdata(state, &ri);
846 lua_setfield(state, LUA_REGISTRYINDEX, ZCP_RUN_INFO_KEY);
847 VERIFY3U(3, ==, lua_gettop(state));
850 * Tell the Lua interpreter to call our handler every count
851 * instructions. Channel programs that execute too many instructions
852 * should die with ETIME.
854 (void) lua_sethook(state, zcp_lua_counthook, LUA_MASKCOUNT,
855 zfs_lua_check_instrlimit_interval);
858 * Tell the Lua memory allocator to stop using KM_SLEEP before handing
859 * off control to the channel program. Channel programs that use too
860 * much memory should die with ENOSPC.
862 evalargs->ea_allocargs->aa_must_succeed = B_FALSE;
865 * Call the Lua function that open-context passed us. This pops the
866 * function and its input from the stack and pushes any return
867 * or error values.
869 err = lua_pcall(state, 1, LUA_MULTRET, 1);
872 * Let Lua use KM_SLEEP while we interpret the return values.
874 evalargs->ea_allocargs->aa_must_succeed = B_TRUE;
877 * Remove the error handler callback from the stack. At this point,
878 * if there is a cleanup function registered, then it was registered
879 * but never run or removed, which should never occur.
881 ASSERT3P(ri.zri_cleanup, ==, NULL);
882 lua_remove(state, 1);
884 switch (err) {
885 case LUA_OK: {
887 * Lua supports returning multiple values in a single return
888 * statement. Return values will have been pushed onto the
889 * stack:
890 * 1: Return value 1
891 * 2: Return value 2
892 * 3: etc...
893 * To simplify the process of retrieving a return value from a
894 * channel program, we disallow returning more than one value
895 * to ZFS from the Lua script, yielding a singleton return
896 * nvlist of the form { "return": Return value 1 }.
898 int return_count = lua_gettop(state);
900 if (return_count == 1) {
901 evalargs->ea_result = 0;
902 zcp_convert_return_values(state, evalargs->ea_outnvl,
903 ZCP_RET_RETURN, evalargs);
904 } else if (return_count > 1) {
905 evalargs->ea_result = SET_ERROR(ECHRNG);
906 (void) lua_pushfstring(state, "Multiple return "
907 "values not supported");
908 zcp_convert_return_values(state, evalargs->ea_outnvl,
909 ZCP_RET_ERROR, evalargs);
911 break;
913 case LUA_ERRRUN:
914 case LUA_ERRGCMM: {
916 * The channel program encountered a fatal error within the
917 * script, such as failing an assertion, or calling a function
918 * with incompatible arguments. The error value and the
919 * traceback generated by zcp_error_handler() should be on the
920 * stack.
922 VERIFY3U(1, ==, lua_gettop(state));
923 if (ri.zri_timed_out) {
924 evalargs->ea_result = SET_ERROR(ETIME);
925 } else {
926 evalargs->ea_result = SET_ERROR(ECHRNG);
929 zcp_convert_return_values(state, evalargs->ea_outnvl,
930 ZCP_RET_ERROR, evalargs);
931 break;
933 case LUA_ERRERR: {
935 * The channel program encountered a fatal error within the
936 * script, and we encountered another error while trying to
937 * compute the traceback in zcp_error_handler(). We can only
938 * return the error message.
940 VERIFY3U(1, ==, lua_gettop(state));
941 if (ri.zri_timed_out) {
942 evalargs->ea_result = SET_ERROR(ETIME);
943 } else {
944 evalargs->ea_result = SET_ERROR(ECHRNG);
947 zcp_convert_return_values(state, evalargs->ea_outnvl,
948 ZCP_RET_ERROR, evalargs);
949 break;
951 case LUA_ERRMEM:
953 * Lua ran out of memory while running the channel program.
954 * There's not much we can do.
956 evalargs->ea_result = SET_ERROR(ENOSPC);
957 break;
958 default:
959 VERIFY0(err);
964 zcp_eval(const char *poolname, const char *program, uint64_t instrlimit,
965 uint64_t memlimit, nvpair_t *nvarg, nvlist_t *outnvl)
967 int err;
968 lua_State *state;
969 zcp_eval_arg_t evalargs;
971 if (instrlimit > zfs_lua_max_instrlimit)
972 return (SET_ERROR(EINVAL));
973 if (memlimit == 0 || memlimit > zfs_lua_max_memlimit)
974 return (SET_ERROR(EINVAL));
976 zcp_alloc_arg_t allocargs = {
977 .aa_must_succeed = B_TRUE,
978 .aa_alloc_remaining = (int64_t)memlimit,
979 .aa_alloc_limit = (int64_t)memlimit,
983 * Creates a Lua state with a memory allocator that uses KM_SLEEP.
984 * This should never fail.
986 state = lua_newstate(zcp_lua_alloc, &allocargs);
987 VERIFY(state != NULL);
988 (void) lua_atpanic(state, zcp_panic_cb);
991 * Load core Lua libraries we want access to.
993 VERIFY3U(1, ==, luaopen_base(state));
994 lua_pop(state, 1);
995 VERIFY3U(1, ==, luaopen_coroutine(state));
996 lua_setglobal(state, LUA_COLIBNAME);
997 VERIFY0(lua_gettop(state));
998 VERIFY3U(1, ==, luaopen_string(state));
999 lua_setglobal(state, LUA_STRLIBNAME);
1000 VERIFY0(lua_gettop(state));
1001 VERIFY3U(1, ==, luaopen_table(state));
1002 lua_setglobal(state, LUA_TABLIBNAME);
1003 VERIFY0(lua_gettop(state));
1006 * Load globally visible variables such as errno aliases.
1008 zcp_load_globals(state);
1009 VERIFY0(lua_gettop(state));
1012 * Load ZFS-specific modules.
1014 lua_newtable(state);
1015 VERIFY3U(1, ==, zcp_load_list_lib(state));
1016 lua_setfield(state, -2, "list");
1017 VERIFY3U(1, ==, zcp_load_synctask_lib(state, B_FALSE));
1018 lua_setfield(state, -2, "check");
1019 VERIFY3U(1, ==, zcp_load_synctask_lib(state, B_TRUE));
1020 lua_setfield(state, -2, "sync");
1021 VERIFY3U(1, ==, zcp_load_get_lib(state));
1022 lua_pushcclosure(state, zcp_debug_info.func, 0);
1023 lua_setfield(state, -2, zcp_debug_info.name);
1024 lua_pushcclosure(state, zcp_exists_info.func, 0);
1025 lua_setfield(state, -2, zcp_exists_info.name);
1026 lua_setglobal(state, "zfs");
1027 VERIFY0(lua_gettop(state));
1030 * Push the error-callback that calculates Lua stack traces on
1031 * unexpected failures.
1033 lua_pushcfunction(state, zcp_error_handler);
1034 VERIFY3U(1, ==, lua_gettop(state));
1037 * Load the actual script as a function onto the stack as text ("t").
1038 * The only valid error condition is a syntax error in the script.
1039 * ERRMEM should not be possible because our allocator is using
1040 * KM_SLEEP. ERRGCMM should not be possible because we have not added
1041 * any objects with __gc metamethods to the interpreter that could
1042 * fail.
1044 err = luaL_loadbufferx(state, program, strlen(program),
1045 "channel program", "t");
1046 if (err == LUA_ERRSYNTAX) {
1047 fnvlist_add_string(outnvl, ZCP_RET_ERROR,
1048 lua_tostring(state, -1));
1049 lua_close(state);
1050 return (SET_ERROR(EINVAL));
1052 VERIFY0(err);
1053 VERIFY3U(2, ==, lua_gettop(state));
1056 * Convert the input nvlist to a Lua object and put it on top of the
1057 * stack.
1059 char errmsg[128];
1060 err = zcp_nvpair_value_to_lua(state, nvarg,
1061 errmsg, sizeof (errmsg));
1062 if (err != 0) {
1063 fnvlist_add_string(outnvl, ZCP_RET_ERROR, errmsg);
1064 lua_close(state);
1065 return (SET_ERROR(EINVAL));
1067 VERIFY3U(3, ==, lua_gettop(state));
1069 evalargs.ea_state = state;
1070 evalargs.ea_allocargs = &allocargs;
1071 evalargs.ea_instrlimit = instrlimit;
1072 evalargs.ea_cred = CRED();
1073 evalargs.ea_outnvl = outnvl;
1074 evalargs.ea_result = 0;
1076 VERIFY0(dsl_sync_task(poolname, zcp_eval_check,
1077 zcp_eval_sync, &evalargs, 0, ZFS_SPACE_CHECK_NONE));
1079 lua_close(state);
1081 return (evalargs.ea_result);
1085 * Retrieve metadata about the currently running channel program.
1087 zcp_run_info_t *
1088 zcp_run_info(lua_State *state)
1090 zcp_run_info_t *ri;
1092 lua_getfield(state, LUA_REGISTRYINDEX, ZCP_RUN_INFO_KEY);
1093 ri = lua_touserdata(state, -1);
1094 lua_pop(state, 1);
1095 return (ri);
1099 * Argument Parsing
1100 * ================
1102 * The Lua language allows methods to be called with any number
1103 * of arguments of any type. When calling back into ZFS we need to sanitize
1104 * arguments from channel programs to make sure unexpected arguments or
1105 * arguments of the wrong type result in clear error messages. To do this
1106 * in a uniform way all callbacks from channel programs should use the
1107 * zcp_parse_args() function to interpret inputs.
1109 * Positional vs Keyword Arguments
1110 * ===============================
1112 * Every callback function takes a fixed set of required positional arguments
1113 * and optional keyword arguments. For example, the destroy function takes
1114 * a single positional string argument (the name of the dataset to destroy)
1115 * and an optional "defer" keyword boolean argument. When calling lua functions
1116 * with parentheses, only positional arguments can be used:
1118 * zfs.sync.snapshot("rpool@snap")
1120 * To use keyword arguments functions should be called with a single argument
1121 * that is a lua table containing mappings of integer -> positional arguments
1122 * and string -> keyword arguments:
1124 * zfs.sync.snapshot({[1]="rpool@snap", defer=true})
1126 * The lua language allows curly braces to be used in place of parentheses as
1127 * syntactic sugar for this calling convention:
1129 * zfs.sync.snapshot{"rpool@snap", defer=true}
1133 * Throw an error and print the given arguments. If there are too many
1134 * arguments to fit in the output buffer, only the error format string is
1135 * output.
1137 static void
1138 zcp_args_error(lua_State *state, const char *fname, const zcp_arg_t *pargs,
1139 const zcp_arg_t *kwargs, const char *fmt, ...)
1141 int i;
1142 char errmsg[512];
1143 size_t len = sizeof (errmsg);
1144 size_t msglen = 0;
1145 va_list argp;
1147 va_start(argp, fmt);
1148 VERIFY3U(len, >, vsnprintf(errmsg, len, fmt, argp));
1149 va_end(argp);
1152 * Calculate the total length of the final string, including extra
1153 * formatting characters. If the argument dump would be too large,
1154 * only print the error string.
1156 msglen = strlen(errmsg);
1157 msglen += strlen(fname) + 4; /* : + {} + null terminator */
1158 for (i = 0; pargs[i].za_name != NULL; i++) {
1159 msglen += strlen(pargs[i].za_name);
1160 msglen += strlen(lua_typename(state, pargs[i].za_lua_type));
1161 if (pargs[i + 1].za_name != NULL || kwargs[0].za_name != NULL)
1162 msglen += 5; /* < + ( + )> + , */
1163 else
1164 msglen += 4; /* < + ( + )> */
1166 for (i = 0; kwargs[i].za_name != NULL; i++) {
1167 msglen += strlen(kwargs[i].za_name);
1168 msglen += strlen(lua_typename(state, kwargs[i].za_lua_type));
1169 if (kwargs[i + 1].za_name != NULL)
1170 msglen += 4; /* =( + ) + , */
1171 else
1172 msglen += 3; /* =( + ) */
1175 if (msglen >= len)
1176 (void) luaL_error(state, errmsg);
1178 VERIFY3U(len, >, strlcat(errmsg, ": ", len));
1179 VERIFY3U(len, >, strlcat(errmsg, fname, len));
1180 VERIFY3U(len, >, strlcat(errmsg, "{", len));
1181 for (i = 0; pargs[i].za_name != NULL; i++) {
1182 VERIFY3U(len, >, strlcat(errmsg, "<", len));
1183 VERIFY3U(len, >, strlcat(errmsg, pargs[i].za_name, len));
1184 VERIFY3U(len, >, strlcat(errmsg, "(", len));
1185 VERIFY3U(len, >, strlcat(errmsg,
1186 lua_typename(state, pargs[i].za_lua_type), len));
1187 VERIFY3U(len, >, strlcat(errmsg, ")>", len));
1188 if (pargs[i + 1].za_name != NULL || kwargs[0].za_name != NULL) {
1189 VERIFY3U(len, >, strlcat(errmsg, ", ", len));
1192 for (i = 0; kwargs[i].za_name != NULL; i++) {
1193 VERIFY3U(len, >, strlcat(errmsg, kwargs[i].za_name, len));
1194 VERIFY3U(len, >, strlcat(errmsg, "=(", len));
1195 VERIFY3U(len, >, strlcat(errmsg,
1196 lua_typename(state, kwargs[i].za_lua_type), len));
1197 VERIFY3U(len, >, strlcat(errmsg, ")", len));
1198 if (kwargs[i + 1].za_name != NULL) {
1199 VERIFY3U(len, >, strlcat(errmsg, ", ", len));
1202 VERIFY3U(len, >, strlcat(errmsg, "}", len));
1204 (void) luaL_error(state, errmsg);
1205 panic("unreachable code");
1208 static void
1209 zcp_parse_table_args(lua_State *state, const char *fname,
1210 const zcp_arg_t *pargs, const zcp_arg_t *kwargs)
1212 int i;
1213 int type;
1215 for (i = 0; pargs[i].za_name != NULL; i++) {
1217 * Check the table for this positional argument, leaving it
1218 * on the top of the stack once we finish validating it.
1220 lua_pushinteger(state, i + 1);
1221 lua_gettable(state, 1);
1223 type = lua_type(state, -1);
1224 if (type == LUA_TNIL) {
1225 zcp_args_error(state, fname, pargs, kwargs,
1226 "too few arguments");
1227 panic("unreachable code");
1228 } else if (type != pargs[i].za_lua_type) {
1229 zcp_args_error(state, fname, pargs, kwargs,
1230 "arg %d wrong type (is '%s', expected '%s')",
1231 i + 1, lua_typename(state, type),
1232 lua_typename(state, pargs[i].za_lua_type));
1233 panic("unreachable code");
1237 * Remove the positional argument from the table.
1239 lua_pushinteger(state, i + 1);
1240 lua_pushnil(state);
1241 lua_settable(state, 1);
1244 for (i = 0; kwargs[i].za_name != NULL; i++) {
1246 * Check the table for this keyword argument, which may be
1247 * nil if it was omitted. Leave the value on the top of
1248 * the stack after validating it.
1250 lua_getfield(state, 1, kwargs[i].za_name);
1252 type = lua_type(state, -1);
1253 if (type != LUA_TNIL && type != kwargs[i].za_lua_type) {
1254 zcp_args_error(state, fname, pargs, kwargs,
1255 "kwarg '%s' wrong type (is '%s', expected '%s')",
1256 kwargs[i].za_name, lua_typename(state, type),
1257 lua_typename(state, kwargs[i].za_lua_type));
1258 panic("unreachable code");
1262 * Remove the keyword argument from the table.
1264 lua_pushnil(state);
1265 lua_setfield(state, 1, kwargs[i].za_name);
1269 * Any entries remaining in the table are invalid inputs, print
1270 * an error message based on what the entry is.
1272 lua_pushnil(state);
1273 if (lua_next(state, 1)) {
1274 if (lua_isnumber(state, -2) && lua_tointeger(state, -2) > 0) {
1275 zcp_args_error(state, fname, pargs, kwargs,
1276 "too many positional arguments");
1277 } else if (lua_isstring(state, -2)) {
1278 zcp_args_error(state, fname, pargs, kwargs,
1279 "invalid kwarg '%s'", lua_tostring(state, -2));
1280 } else {
1281 zcp_args_error(state, fname, pargs, kwargs,
1282 "kwarg keys must be strings");
1284 panic("unreachable code");
1287 lua_remove(state, 1);
1290 static void
1291 zcp_parse_pos_args(lua_State *state, const char *fname, const zcp_arg_t *pargs,
1292 const zcp_arg_t *kwargs)
1294 int i;
1295 int type;
1297 for (i = 0; pargs[i].za_name != NULL; i++) {
1298 type = lua_type(state, i + 1);
1299 if (type == LUA_TNONE) {
1300 zcp_args_error(state, fname, pargs, kwargs,
1301 "too few arguments");
1302 panic("unreachable code");
1303 } else if (type != pargs[i].za_lua_type) {
1304 zcp_args_error(state, fname, pargs, kwargs,
1305 "arg %d wrong type (is '%s', expected '%s')",
1306 i + 1, lua_typename(state, type),
1307 lua_typename(state, pargs[i].za_lua_type));
1308 panic("unreachable code");
1311 if (lua_gettop(state) != i) {
1312 zcp_args_error(state, fname, pargs, kwargs,
1313 "too many positional arguments");
1314 panic("unreachable code");
1317 for (i = 0; kwargs[i].za_name != NULL; i++) {
1318 lua_pushnil(state);
1323 * Checks the current Lua stack against an expected set of positional and
1324 * keyword arguments. If the stack does not match the expected arguments
1325 * aborts the current channel program with a useful error message, otherwise
1326 * it re-arranges the stack so that it contains the positional arguments
1327 * followed by the keyword argument values in declaration order. Any missing
1328 * keyword argument will be represented by a nil value on the stack.
1330 * If the stack contains exactly one argument of type LUA_TTABLE the curly
1331 * braces calling convention is assumed, otherwise the stack is parsed for
1332 * positional arguments only.
1334 * This function should be used by every function callback. It should be called
1335 * before the callback manipulates the Lua stack as it assumes the stack
1336 * represents the function arguments.
1338 void
1339 zcp_parse_args(lua_State *state, const char *fname, const zcp_arg_t *pargs,
1340 const zcp_arg_t *kwargs)
1342 if (lua_gettop(state) == 1 && lua_istable(state, 1)) {
1343 zcp_parse_table_args(state, fname, pargs, kwargs);
1344 } else {
1345 zcp_parse_pos_args(state, fname, pargs, kwargs);