block: Mark bdrv_refresh_filename() and callers GRAPH_RDLOCK
[qemu/kevin.git] / qemu-img.c
blob3ecbc375b06be833b4cb03d041c4fd5a89d7a301
/*
 * QEMU disk image utility
 *
 * Copyright (c) 2003-2008 Fabrice Bellard
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 */
25 #include "qemu/osdep.h"
26 #include <getopt.h>
28 #include "qemu/help-texts.h"
29 #include "qemu/qemu-progress.h"
30 #include "qemu-version.h"
31 #include "qapi/error.h"
32 #include "qapi/qapi-commands-block-core.h"
33 #include "qapi/qapi-visit-block-core.h"
34 #include "qapi/qobject-output-visitor.h"
35 #include "qapi/qmp/qjson.h"
36 #include "qapi/qmp/qdict.h"
37 #include "qemu/cutils.h"
38 #include "qemu/config-file.h"
39 #include "qemu/option.h"
40 #include "qemu/error-report.h"
41 #include "qemu/log.h"
42 #include "qemu/main-loop.h"
43 #include "qemu/module.h"
44 #include "qemu/sockets.h"
45 #include "qemu/units.h"
46 #include "qemu/memalign.h"
47 #include "qom/object_interfaces.h"
48 #include "sysemu/block-backend.h"
49 #include "block/block_int.h"
50 #include "block/blockjob.h"
51 #include "block/dirty-bitmap.h"
52 #include "block/qapi.h"
53 #include "crypto/init.h"
54 #include "trace/control.h"
55 #include "qemu/throttle.h"
56 #include "block/throttle-groups.h"
/*
 * Version banner: program name and full version on the first line, the
 * copyright notice on the second. help() prints it ahead of the usage text.
 */
#define QEMU_IMG_VERSION \
    "qemu-img version " QEMU_FULL_VERSION "\n" \
    QEMU_COPYRIGHT "\n"
/* Pairs a subcommand name with the function that implements it. */
typedef struct img_cmd_t {
    /* Subcommand name */
    const char *name;
    /* Entry point; receives an argc/argv pair and returns an int status */
    int (*handler)(int argc, char **argv);
} img_cmd_t;
/*
 * Return codes used for long-only options in the getopt_long() tables.
 * Numbering starts at 256, i.e. above every value a single-character
 * option such as 'h' or 'f' can take, and each following enumerator is
 * one greater than the previous one (256 .. 277).
 */
enum {
    OPTION_OUTPUT = 256,
    OPTION_BACKING_CHAIN,       /* 257 */
    OPTION_OBJECT,              /* 258 */
    OPTION_IMAGE_OPTS,          /* 259 */
    OPTION_PATTERN,             /* 260 */
    OPTION_FLUSH_INTERVAL,      /* 261 */
    OPTION_NO_DRAIN,            /* 262 */
    OPTION_TARGET_IMAGE_OPTS,   /* 263 */
    OPTION_SIZE,                /* 264 */
    OPTION_PREALLOCATION,       /* 265 */
    OPTION_SHRINK,              /* 266 */
    OPTION_SALVAGE,             /* 267 */
    OPTION_TARGET_IS_ZERO,      /* 268 */
    OPTION_ADD,                 /* 269 */
    OPTION_REMOVE,              /* 270 */
    OPTION_CLEAR,               /* 271 */
    OPTION_ENABLE,              /* 272 */
    OPTION_DISABLE,             /* 273 */
    OPTION_MERGE,               /* 274 */
    OPTION_BITMAPS,             /* 275 */
    OPTION_FORCE,               /* 276 */
    OPTION_SKIP_BROKEN,         /* 277 */
};
/* Output styles selectable with --output ("json" or "human"). */
typedef enum OutputFormat {
    OFORMAT_JSON = 0,
    OFORMAT_HUMAN = 1,
} OutputFormat;
/*
 * Cache mode used when none is given on the command line. qemu-img does
 * not consider data integrity important, so it defaults to cache=writeback.
 */
#define BDRV_DEFAULT_CACHE "writeback"
/*
 * Callback handed to bdrv_iterate_format() by help(): writes @name to
 * stdout preceded by a single space. @opaque is not used.
 */
static void format_print(void *opaque, const char *name)
{
    printf(" %s", name);
}
104 static G_NORETURN G_GNUC_PRINTF(1, 2)
105 void error_exit(const char *fmt, ...)
107 va_list ap;
109 va_start(ap, fmt);
110 error_vreport(fmt, ap);
111 va_end(ap);
113 error_printf("Try 'qemu-img --help' for more information\n");
114 exit(EXIT_FAILURE);
117 static G_NORETURN
118 void missing_argument(const char *option)
120 error_exit("missing argument for option '%s'", option);
123 static G_NORETURN
124 void unrecognized_option(const char *option)
126 error_exit("unrecognized option '%s'", option);
129 /* Please keep in synch with docs/tools/qemu-img.rst */
130 static G_NORETURN
131 void help(void)
133 const char *help_msg =
134 QEMU_IMG_VERSION
135 "usage: qemu-img [standard options] command [command options]\n"
136 "QEMU disk image utility\n"
137 "\n"
138 " '-h', '--help' display this help and exit\n"
139 " '-V', '--version' output version information and exit\n"
140 " '-T', '--trace' [[enable=]<pattern>][,events=<file>][,file=<file>]\n"
141 " specify tracing options\n"
142 "\n"
143 "Command syntax:\n"
144 #define DEF(option, callback, arg_string) \
145 " " arg_string "\n"
146 #include "qemu-img-cmds.h"
147 #undef DEF
148 "\n"
149 "Command parameters:\n"
150 " 'filename' is a disk image filename\n"
151 " 'objectdef' is a QEMU user creatable object definition. See the qemu(1)\n"
152 " manual page for a description of the object properties. The most common\n"
153 " object type is a 'secret', which is used to supply passwords and/or\n"
154 " encryption keys.\n"
155 " 'fmt' is the disk image format. It is guessed automatically in most cases\n"
156 " 'cache' is the cache mode used to write the output disk image, the valid\n"
157 " options are: 'none', 'writeback' (default, except for convert), 'writethrough',\n"
158 " 'directsync' and 'unsafe' (default for convert)\n"
159 " 'src_cache' is the cache mode used to read input disk images, the valid\n"
160 " options are the same as for the 'cache' option\n"
161 " 'size' is the disk image size in bytes. Optional suffixes\n"
162 " 'k' or 'K' (kilobyte, 1024), 'M' (megabyte, 1024k), 'G' (gigabyte, 1024M),\n"
163 " 'T' (terabyte, 1024G), 'P' (petabyte, 1024T) and 'E' (exabyte, 1024P) are\n"
164 " supported. 'b' is ignored.\n"
165 " 'output_filename' is the destination disk image filename\n"
166 " 'output_fmt' is the destination format\n"
167 " 'options' is a comma separated list of format specific options in a\n"
168 " name=value format. Use -o help for an overview of the options supported by\n"
169 " the used format\n"
170 " 'snapshot_param' is param used for internal snapshot, format\n"
171 " is 'snapshot.id=[ID],snapshot.name=[NAME]', or\n"
172 " '[ID_OR_NAME]'\n"
173 " '-c' indicates that target image must be compressed (qcow format only)\n"
174 " '-u' allows unsafe backing chains. For rebasing, it is assumed that old and\n"
175 " new backing file match exactly. The image doesn't need a working\n"
176 " backing file before rebasing in this case (useful for renaming the\n"
177 " backing file). For image creation, allow creating without attempting\n"
178 " to open the backing file.\n"
179 " '-h' with or without a command shows this help and lists the supported formats\n"
180 " '-p' show progress of command (only certain commands)\n"
181 " '-q' use Quiet mode - do not print any output (except errors)\n"
182 " '-S' indicates the consecutive number of bytes (defaults to 4k) that must\n"
183 " contain only zeros for qemu-img to create a sparse image during\n"
184 " conversion. If the number of bytes is 0, the source will not be scanned for\n"
185 " unallocated or zero sectors, and the destination image will always be\n"
186 " fully allocated\n"
187 " '--output' takes the format in which the output must be done (human or json)\n"
188 " '-n' skips the target volume creation (useful if the volume is created\n"
189 " prior to running qemu-img)\n"
190 "\n"
191 "Parameters to bitmap subcommand:\n"
192 " 'bitmap' is the name of the bitmap to manipulate, through one or more\n"
193 " actions from '--add', '--remove', '--clear', '--enable', '--disable',\n"
194 " or '--merge source'\n"
195 " '-g granularity' sets the granularity for '--add' actions\n"
196 " '-b source' and '-F src_fmt' tell '--merge' actions to find the source\n"
197 " bitmaps from an alternative file\n"
198 "\n"
199 "Parameters to check subcommand:\n"
200 " '-r' tries to repair any inconsistencies that are found during the check.\n"
201 " '-r leaks' repairs only cluster leaks, whereas '-r all' fixes all\n"
202 " kinds of errors, with a higher risk of choosing the wrong fix or\n"
203 " hiding corruption that has already occurred.\n"
204 "\n"
205 "Parameters to convert subcommand:\n"
206 " '--bitmaps' copies all top-level persistent bitmaps to destination\n"
207 " '-m' specifies how many coroutines work in parallel during the convert\n"
208 " process (defaults to 8)\n"
209 " '-W' allow to write to the target out of order rather than sequential\n"
210 "\n"
211 "Parameters to snapshot subcommand:\n"
212 " 'snapshot' is the name of the snapshot to create, apply or delete\n"
213 " '-a' applies a snapshot (revert disk to saved state)\n"
214 " '-c' creates a snapshot\n"
215 " '-d' deletes a snapshot\n"
216 " '-l' lists all snapshots in the given image\n"
217 "\n"
218 "Parameters to compare subcommand:\n"
219 " '-f' first image format\n"
220 " '-F' second image format\n"
221 " '-s' run in Strict mode - fail on different image size or sector allocation\n"
222 "\n"
223 "Parameters to dd subcommand:\n"
224 " 'bs=BYTES' read and write up to BYTES bytes at a time "
225 "(default: 512)\n"
226 " 'count=N' copy only N input blocks\n"
227 " 'if=FILE' read from FILE\n"
228 " 'of=FILE' write to FILE\n"
229 " 'skip=N' skip N bs-sized blocks at the start of input\n";
231 printf("%s\nSupported formats:", help_msg);
232 bdrv_iterate_format(format_print, NULL, false);
233 printf("\n\n" QEMU_HELP_BOTTOM "\n");
234 exit(EXIT_SUCCESS);
/*
 * Is @list safe for accumulate_options()?
 *
 * It is when several such lists can be joined with ',' separators without
 * any separator being swallowed by ',,' escaping. That requires that @list
 *  - is not empty (otherwise the separator before it could escape the
 *    separator after it),
 *  - does not start with ',' (otherwise the separator before it would be
 *    escaped), and
 *  - does not end with an odd number of ',' (otherwise the separator after
 *    it would be escaped).
 *
 * Returns true when @list satisfies all three conditions.
 */
static bool is_valid_option_list(const char *list)
{
    size_t trailing_commas = 0;
    size_t end;

    if (list[0] == '\0' || list[0] == ',') {
        return false;
    }

    /* Count the run of ',' characters at the very end of the string */
    end = strlen(list);
    while (end > 0 && list[end - 1] == ',') {
        end--;
        trailing_commas++;
    }

    return trailing_commas % 2 == 0;
}
265 static int accumulate_options(char **options, char *list)
267 char *new_options;
269 if (!is_valid_option_list(list)) {
270 error_report("Invalid option list: %s", list);
271 return -1;
274 if (!*options) {
275 *options = g_strdup(list);
276 } else {
277 new_options = g_strdup_printf("%s,%s", *options, list);
278 g_free(*options);
279 *options = new_options;
281 return 0;
284 static QemuOptsList qemu_source_opts = {
285 .name = "source",
286 .implied_opt_name = "file",
287 .head = QTAILQ_HEAD_INITIALIZER(qemu_source_opts.head),
288 .desc = {
293 static int G_GNUC_PRINTF(2, 3) qprintf(bool quiet, const char *fmt, ...)
295 int ret = 0;
296 if (!quiet) {
297 va_list args;
298 va_start(args, fmt);
299 ret = vprintf(fmt, args);
300 va_end(args);
302 return ret;
306 static int print_block_option_help(const char *filename, const char *fmt)
308 BlockDriver *drv, *proto_drv;
309 QemuOptsList *create_opts = NULL;
310 Error *local_err = NULL;
312 /* Find driver and parse its options */
313 drv = bdrv_find_format(fmt);
314 if (!drv) {
315 error_report("Unknown file format '%s'", fmt);
316 return 1;
319 if (!drv->create_opts) {
320 error_report("Format driver '%s' does not support image creation", fmt);
321 return 1;
324 create_opts = qemu_opts_append(create_opts, drv->create_opts);
325 if (filename) {
326 proto_drv = bdrv_find_protocol(filename, true, &local_err);
327 if (!proto_drv) {
328 error_report_err(local_err);
329 qemu_opts_free(create_opts);
330 return 1;
332 if (!proto_drv->create_opts) {
333 error_report("Protocol driver '%s' does not support image creation",
334 proto_drv->format_name);
335 qemu_opts_free(create_opts);
336 return 1;
338 create_opts = qemu_opts_append(create_opts, proto_drv->create_opts);
341 if (filename) {
342 printf("Supported options:\n");
343 } else {
344 printf("Supported %s options:\n", fmt);
346 qemu_opts_print_help(create_opts, false);
347 qemu_opts_free(create_opts);
349 if (!filename) {
350 printf("\n"
351 "The protocol level may support further options.\n"
352 "Specify the target filename to include those options.\n");
355 return 0;
359 static BlockBackend *img_open_opts(const char *optstr,
360 QemuOpts *opts, int flags, bool writethrough,
361 bool quiet, bool force_share)
363 QDict *options;
364 Error *local_err = NULL;
365 BlockBackend *blk;
366 options = qemu_opts_to_qdict(opts, NULL);
367 if (force_share) {
368 if (qdict_haskey(options, BDRV_OPT_FORCE_SHARE)
369 && strcmp(qdict_get_str(options, BDRV_OPT_FORCE_SHARE), "on")) {
370 error_report("--force-share/-U conflicts with image options");
371 qobject_unref(options);
372 return NULL;
374 qdict_put_str(options, BDRV_OPT_FORCE_SHARE, "on");
376 blk = blk_new_open(NULL, NULL, options, flags, &local_err);
377 if (!blk) {
378 error_reportf_err(local_err, "Could not open '%s': ", optstr);
379 return NULL;
381 blk_set_enable_write_cache(blk, !writethrough);
383 return blk;
386 static BlockBackend *img_open_file(const char *filename,
387 QDict *options,
388 const char *fmt, int flags,
389 bool writethrough, bool quiet,
390 bool force_share)
392 BlockBackend *blk;
393 Error *local_err = NULL;
395 if (!options) {
396 options = qdict_new();
398 if (fmt) {
399 qdict_put_str(options, "driver", fmt);
402 if (force_share) {
403 qdict_put_bool(options, BDRV_OPT_FORCE_SHARE, true);
405 blk = blk_new_open(filename, NULL, options, flags, &local_err);
406 if (!blk) {
407 error_reportf_err(local_err, "Could not open '%s': ", filename);
408 return NULL;
410 blk_set_enable_write_cache(blk, !writethrough);
412 return blk;
416 static int img_add_key_secrets(void *opaque,
417 const char *name, const char *value,
418 Error **errp)
420 QDict *options = opaque;
422 if (g_str_has_suffix(name, "key-secret")) {
423 qdict_put_str(options, name, value);
426 return 0;
430 static BlockBackend *img_open(bool image_opts,
431 const char *filename,
432 const char *fmt, int flags, bool writethrough,
433 bool quiet, bool force_share)
435 BlockBackend *blk;
436 if (image_opts) {
437 QemuOpts *opts;
438 if (fmt) {
439 error_report("--image-opts and --format are mutually exclusive");
440 return NULL;
442 opts = qemu_opts_parse_noisily(qemu_find_opts("source"),
443 filename, true);
444 if (!opts) {
445 return NULL;
447 blk = img_open_opts(filename, opts, flags, writethrough, quiet,
448 force_share);
449 } else {
450 blk = img_open_file(filename, NULL, fmt, flags, writethrough, quiet,
451 force_share);
454 if (blk) {
455 blk_set_force_allow_inactivate(blk);
458 return blk;
462 static int add_old_style_options(const char *fmt, QemuOpts *opts,
463 const char *base_filename,
464 const char *base_fmt)
466 if (base_filename) {
467 if (!qemu_opt_set(opts, BLOCK_OPT_BACKING_FILE, base_filename,
468 NULL)) {
469 error_report("Backing file not supported for file format '%s'",
470 fmt);
471 return -1;
474 if (base_fmt) {
475 if (!qemu_opt_set(opts, BLOCK_OPT_BACKING_FMT, base_fmt, NULL)) {
476 error_report("Backing file format not supported for file "
477 "format '%s'", fmt);
478 return -1;
481 return 0;
484 static int64_t cvtnum_full(const char *name, const char *value, int64_t min,
485 int64_t max)
487 int err;
488 uint64_t res;
490 err = qemu_strtosz(value, NULL, &res);
491 if (err < 0 && err != -ERANGE) {
492 error_report("Invalid %s specified. You may use "
493 "k, M, G, T, P or E suffixes for", name);
494 error_report("kilobytes, megabytes, gigabytes, terabytes, "
495 "petabytes and exabytes.");
496 return err;
498 if (err == -ERANGE || res > max || res < min) {
499 error_report("Invalid %s specified. Must be between %" PRId64
500 " and %" PRId64 ".", name, min, max);
501 return -ERANGE;
503 return res;
/*
 * Parse @value as a non-negative size: cvtnum_full() with the range
 * [0, INT64_MAX]. Returns the size, or a negative value after reporting
 * an error.
 */
static int64_t cvtnum(const char *name, const char *value)
{
    const int64_t lowest = 0;
    const int64_t highest = INT64_MAX;

    return cvtnum_full(name, value, lowest, highest);
}
511 static int img_create(int argc, char **argv)
513 int c;
514 uint64_t img_size = -1;
515 const char *fmt = "raw";
516 const char *base_fmt = NULL;
517 const char *filename;
518 const char *base_filename = NULL;
519 char *options = NULL;
520 Error *local_err = NULL;
521 bool quiet = false;
522 int flags = 0;
524 for(;;) {
525 static const struct option long_options[] = {
526 {"help", no_argument, 0, 'h'},
527 {"object", required_argument, 0, OPTION_OBJECT},
528 {0, 0, 0, 0}
530 c = getopt_long(argc, argv, ":F:b:f:ho:qu",
531 long_options, NULL);
532 if (c == -1) {
533 break;
535 switch(c) {
536 case ':':
537 missing_argument(argv[optind - 1]);
538 break;
539 case '?':
540 unrecognized_option(argv[optind - 1]);
541 break;
542 case 'h':
543 help();
544 break;
545 case 'F':
546 base_fmt = optarg;
547 break;
548 case 'b':
549 base_filename = optarg;
550 break;
551 case 'f':
552 fmt = optarg;
553 break;
554 case 'o':
555 if (accumulate_options(&options, optarg) < 0) {
556 goto fail;
558 break;
559 case 'q':
560 quiet = true;
561 break;
562 case 'u':
563 flags |= BDRV_O_NO_BACKING;
564 break;
565 case OPTION_OBJECT:
566 user_creatable_process_cmdline(optarg);
567 break;
571 /* Get the filename */
572 filename = (optind < argc) ? argv[optind] : NULL;
573 if (options && has_help_option(options)) {
574 g_free(options);
575 return print_block_option_help(filename, fmt);
578 if (optind >= argc) {
579 error_exit("Expecting image file name");
581 optind++;
583 /* Get image size, if specified */
584 if (optind < argc) {
585 int64_t sval;
587 sval = cvtnum("image size", argv[optind++]);
588 if (sval < 0) {
589 goto fail;
591 img_size = (uint64_t)sval;
593 if (optind != argc) {
594 error_exit("Unexpected argument: %s", argv[optind]);
597 bdrv_img_create(filename, fmt, base_filename, base_fmt,
598 options, img_size, flags, quiet, &local_err);
599 if (local_err) {
600 error_reportf_err(local_err, "%s: ", filename);
601 goto fail;
604 g_free(options);
605 return 0;
607 fail:
608 g_free(options);
609 return 1;
612 static void dump_json_image_check(ImageCheck *check, bool quiet)
614 GString *str;
615 QObject *obj;
616 Visitor *v = qobject_output_visitor_new(&obj);
618 visit_type_ImageCheck(v, NULL, &check, &error_abort);
619 visit_complete(v, &obj);
620 str = qobject_to_json_pretty(obj, true);
621 assert(str != NULL);
622 qprintf(quiet, "%s\n", str->str);
623 qobject_unref(obj);
624 visit_free(v);
625 g_string_free(str, true);
628 static void dump_human_image_check(ImageCheck *check, bool quiet)
630 if (!(check->corruptions || check->leaks || check->check_errors)) {
631 qprintf(quiet, "No errors were found on the image.\n");
632 } else {
633 if (check->corruptions) {
634 qprintf(quiet, "\n%" PRId64 " errors were found on the image.\n"
635 "Data may be corrupted, or further writes to the image "
636 "may corrupt it.\n",
637 check->corruptions);
640 if (check->leaks) {
641 qprintf(quiet,
642 "\n%" PRId64 " leaked clusters were found on the image.\n"
643 "This means waste of disk space, but no harm to data.\n",
644 check->leaks);
647 if (check->check_errors) {
648 qprintf(quiet,
649 "\n%" PRId64
650 " internal errors have occurred during the check.\n",
651 check->check_errors);
655 if (check->total_clusters != 0 && check->allocated_clusters != 0) {
656 qprintf(quiet, "%" PRId64 "/%" PRId64 " = %0.2f%% allocated, "
657 "%0.2f%% fragmented, %0.2f%% compressed clusters\n",
658 check->allocated_clusters, check->total_clusters,
659 check->allocated_clusters * 100.0 / check->total_clusters,
660 check->fragmented_clusters * 100.0 / check->allocated_clusters,
661 check->compressed_clusters * 100.0 /
662 check->allocated_clusters);
665 if (check->image_end_offset) {
666 qprintf(quiet,
667 "Image end offset: %" PRId64 "\n", check->image_end_offset);
671 static int collect_image_check(BlockDriverState *bs,
672 ImageCheck *check,
673 const char *filename,
674 const char *fmt,
675 int fix)
677 int ret;
678 BdrvCheckResult result;
680 ret = bdrv_check(bs, &result, fix);
681 if (ret < 0) {
682 return ret;
685 check->filename = g_strdup(filename);
686 check->format = g_strdup(bdrv_get_format_name(bs));
687 check->check_errors = result.check_errors;
688 check->corruptions = result.corruptions;
689 check->has_corruptions = result.corruptions != 0;
690 check->leaks = result.leaks;
691 check->has_leaks = result.leaks != 0;
692 check->corruptions_fixed = result.corruptions_fixed;
693 check->has_corruptions_fixed = result.corruptions_fixed != 0;
694 check->leaks_fixed = result.leaks_fixed;
695 check->has_leaks_fixed = result.leaks_fixed != 0;
696 check->image_end_offset = result.image_end_offset;
697 check->has_image_end_offset = result.image_end_offset != 0;
698 check->total_clusters = result.bfi.total_clusters;
699 check->has_total_clusters = result.bfi.total_clusters != 0;
700 check->allocated_clusters = result.bfi.allocated_clusters;
701 check->has_allocated_clusters = result.bfi.allocated_clusters != 0;
702 check->fragmented_clusters = result.bfi.fragmented_clusters;
703 check->has_fragmented_clusters = result.bfi.fragmented_clusters != 0;
704 check->compressed_clusters = result.bfi.compressed_clusters;
705 check->has_compressed_clusters = result.bfi.compressed_clusters != 0;
707 return 0;
711 * Checks an image for consistency. Exit codes:
713 * 0 - Check completed, image is good
714 * 1 - Check not completed because of internal errors
715 * 2 - Check completed, image is corrupted
716 * 3 - Check completed, image has leaked clusters, but is good otherwise
717 * 63 - Checks are not supported by the image format
719 static int img_check(int argc, char **argv)
721 int c, ret;
722 OutputFormat output_format = OFORMAT_HUMAN;
723 const char *filename, *fmt, *output, *cache;
724 BlockBackend *blk;
725 BlockDriverState *bs;
726 int fix = 0;
727 int flags = BDRV_O_CHECK;
728 bool writethrough;
729 ImageCheck *check;
730 bool quiet = false;
731 bool image_opts = false;
732 bool force_share = false;
734 fmt = NULL;
735 output = NULL;
736 cache = BDRV_DEFAULT_CACHE;
738 for(;;) {
739 int option_index = 0;
740 static const struct option long_options[] = {
741 {"help", no_argument, 0, 'h'},
742 {"format", required_argument, 0, 'f'},
743 {"repair", required_argument, 0, 'r'},
744 {"output", required_argument, 0, OPTION_OUTPUT},
745 {"object", required_argument, 0, OPTION_OBJECT},
746 {"image-opts", no_argument, 0, OPTION_IMAGE_OPTS},
747 {"force-share", no_argument, 0, 'U'},
748 {0, 0, 0, 0}
750 c = getopt_long(argc, argv, ":hf:r:T:qU",
751 long_options, &option_index);
752 if (c == -1) {
753 break;
755 switch(c) {
756 case ':':
757 missing_argument(argv[optind - 1]);
758 break;
759 case '?':
760 unrecognized_option(argv[optind - 1]);
761 break;
762 case 'h':
763 help();
764 break;
765 case 'f':
766 fmt = optarg;
767 break;
768 case 'r':
769 flags |= BDRV_O_RDWR;
771 if (!strcmp(optarg, "leaks")) {
772 fix = BDRV_FIX_LEAKS;
773 } else if (!strcmp(optarg, "all")) {
774 fix = BDRV_FIX_LEAKS | BDRV_FIX_ERRORS;
775 } else {
776 error_exit("Unknown option value for -r "
777 "(expecting 'leaks' or 'all'): %s", optarg);
779 break;
780 case OPTION_OUTPUT:
781 output = optarg;
782 break;
783 case 'T':
784 cache = optarg;
785 break;
786 case 'q':
787 quiet = true;
788 break;
789 case 'U':
790 force_share = true;
791 break;
792 case OPTION_OBJECT:
793 user_creatable_process_cmdline(optarg);
794 break;
795 case OPTION_IMAGE_OPTS:
796 image_opts = true;
797 break;
800 if (optind != argc - 1) {
801 error_exit("Expecting one image file name");
803 filename = argv[optind++];
805 if (output && !strcmp(output, "json")) {
806 output_format = OFORMAT_JSON;
807 } else if (output && !strcmp(output, "human")) {
808 output_format = OFORMAT_HUMAN;
809 } else if (output) {
810 error_report("--output must be used with human or json as argument.");
811 return 1;
814 ret = bdrv_parse_cache_mode(cache, &flags, &writethrough);
815 if (ret < 0) {
816 error_report("Invalid source cache option: %s", cache);
817 return 1;
820 blk = img_open(image_opts, filename, fmt, flags, writethrough, quiet,
821 force_share);
822 if (!blk) {
823 return 1;
825 bs = blk_bs(blk);
827 check = g_new0(ImageCheck, 1);
828 ret = collect_image_check(bs, check, filename, fmt, fix);
830 if (ret == -ENOTSUP) {
831 error_report("This image format does not support checks");
832 ret = 63;
833 goto fail;
836 if (check->corruptions_fixed || check->leaks_fixed) {
837 int corruptions_fixed, leaks_fixed;
838 bool has_leaks_fixed, has_corruptions_fixed;
840 leaks_fixed = check->leaks_fixed;
841 has_leaks_fixed = check->has_leaks_fixed;
842 corruptions_fixed = check->corruptions_fixed;
843 has_corruptions_fixed = check->has_corruptions_fixed;
845 if (output_format == OFORMAT_HUMAN) {
846 qprintf(quiet,
847 "The following inconsistencies were found and repaired:\n\n"
848 " %" PRId64 " leaked clusters\n"
849 " %" PRId64 " corruptions\n\n"
850 "Double checking the fixed image now...\n",
851 check->leaks_fixed,
852 check->corruptions_fixed);
855 qapi_free_ImageCheck(check);
856 check = g_new0(ImageCheck, 1);
857 ret = collect_image_check(bs, check, filename, fmt, 0);
859 check->leaks_fixed = leaks_fixed;
860 check->has_leaks_fixed = has_leaks_fixed;
861 check->corruptions_fixed = corruptions_fixed;
862 check->has_corruptions_fixed = has_corruptions_fixed;
865 if (!ret) {
866 switch (output_format) {
867 case OFORMAT_HUMAN:
868 dump_human_image_check(check, quiet);
869 break;
870 case OFORMAT_JSON:
871 dump_json_image_check(check, quiet);
872 break;
876 if (ret || check->check_errors) {
877 if (ret) {
878 error_report("Check failed: %s", strerror(-ret));
879 } else {
880 error_report("Check failed");
882 ret = 1;
883 goto fail;
886 if (check->corruptions) {
887 ret = 2;
888 } else if (check->leaks) {
889 ret = 3;
890 } else {
891 ret = 0;
894 fail:
895 qapi_free_ImageCheck(check);
896 blk_unref(blk);
897 return ret;
900 typedef struct CommonBlockJobCBInfo {
901 BlockDriverState *bs;
902 Error **errp;
903 } CommonBlockJobCBInfo;
905 static void common_block_job_cb(void *opaque, int ret)
907 CommonBlockJobCBInfo *cbi = opaque;
909 if (ret < 0) {
910 error_setg_errno(cbi->errp, -ret, "Block job failed");
914 static void run_block_job(BlockJob *job, Error **errp)
916 uint64_t progress_current, progress_total;
917 AioContext *aio_context = block_job_get_aio_context(job);
918 int ret = 0;
920 job_lock();
921 job_ref_locked(&job->job);
922 do {
923 float progress = 0.0f;
924 job_unlock();
925 aio_poll(aio_context, true);
927 progress_get_snapshot(&job->job.progress, &progress_current,
928 &progress_total);
929 if (progress_total) {
930 progress = (float)progress_current / progress_total * 100.f;
932 qemu_progress_print(progress, 0);
933 job_lock();
934 } while (!job_is_ready_locked(&job->job) &&
935 !job_is_completed_locked(&job->job));
937 if (!job_is_completed_locked(&job->job)) {
938 ret = job_complete_sync_locked(&job->job, errp);
939 } else {
940 ret = job->job.ret;
942 job_unref_locked(&job->job);
943 job_unlock();
945 /* publish completion progress only when success */
946 if (!ret) {
947 qemu_progress_print(100.f, 0);
951 static int img_commit(int argc, char **argv)
953 int c, ret, flags;
954 const char *filename, *fmt, *cache, *base;
955 BlockBackend *blk;
956 BlockDriverState *bs, *base_bs;
957 BlockJob *job;
958 bool progress = false, quiet = false, drop = false;
959 bool writethrough;
960 Error *local_err = NULL;
961 CommonBlockJobCBInfo cbi;
962 bool image_opts = false;
963 AioContext *aio_context;
964 int64_t rate_limit = 0;
966 fmt = NULL;
967 cache = BDRV_DEFAULT_CACHE;
968 base = NULL;
969 for(;;) {
970 static const struct option long_options[] = {
971 {"help", no_argument, 0, 'h'},
972 {"object", required_argument, 0, OPTION_OBJECT},
973 {"image-opts", no_argument, 0, OPTION_IMAGE_OPTS},
974 {0, 0, 0, 0}
976 c = getopt_long(argc, argv, ":f:ht:b:dpqr:",
977 long_options, NULL);
978 if (c == -1) {
979 break;
981 switch(c) {
982 case ':':
983 missing_argument(argv[optind - 1]);
984 break;
985 case '?':
986 unrecognized_option(argv[optind - 1]);
987 break;
988 case 'h':
989 help();
990 break;
991 case 'f':
992 fmt = optarg;
993 break;
994 case 't':
995 cache = optarg;
996 break;
997 case 'b':
998 base = optarg;
999 /* -b implies -d */
1000 drop = true;
1001 break;
1002 case 'd':
1003 drop = true;
1004 break;
1005 case 'p':
1006 progress = true;
1007 break;
1008 case 'q':
1009 quiet = true;
1010 break;
1011 case 'r':
1012 rate_limit = cvtnum("rate limit", optarg);
1013 if (rate_limit < 0) {
1014 return 1;
1016 break;
1017 case OPTION_OBJECT:
1018 user_creatable_process_cmdline(optarg);
1019 break;
1020 case OPTION_IMAGE_OPTS:
1021 image_opts = true;
1022 break;
1026 /* Progress is not shown in Quiet mode */
1027 if (quiet) {
1028 progress = false;
1031 if (optind != argc - 1) {
1032 error_exit("Expecting one image file name");
1034 filename = argv[optind++];
1036 flags = BDRV_O_RDWR | BDRV_O_UNMAP;
1037 ret = bdrv_parse_cache_mode(cache, &flags, &writethrough);
1038 if (ret < 0) {
1039 error_report("Invalid cache option: %s", cache);
1040 return 1;
1043 blk = img_open(image_opts, filename, fmt, flags, writethrough, quiet,
1044 false);
1045 if (!blk) {
1046 return 1;
1048 bs = blk_bs(blk);
1050 qemu_progress_init(progress, 1.f);
1051 qemu_progress_print(0.f, 100);
1053 if (base) {
1054 base_bs = bdrv_find_backing_image(bs, base);
1055 if (!base_bs) {
1056 error_setg(&local_err,
1057 "Did not find '%s' in the backing chain of '%s'",
1058 base, filename);
1059 goto done;
1061 } else {
1062 /* This is different from QMP, which by default uses the deepest file in
1063 * the backing chain (i.e., the very base); however, the traditional
1064 * behavior of qemu-img commit is using the immediate backing file. */
1065 base_bs = bdrv_backing_chain_next(bs);
1066 if (!base_bs) {
1067 error_setg(&local_err, "Image does not have a backing file");
1068 goto done;
1072 cbi = (CommonBlockJobCBInfo){
1073 .errp = &local_err,
1074 .bs = bs,
1077 aio_context = bdrv_get_aio_context(bs);
1078 aio_context_acquire(aio_context);
1079 commit_active_start("commit", bs, base_bs, JOB_DEFAULT, rate_limit,
1080 BLOCKDEV_ON_ERROR_REPORT, NULL, common_block_job_cb,
1081 &cbi, false, &local_err);
1082 aio_context_release(aio_context);
1083 if (local_err) {
1084 goto done;
1087 /* When the block job completes, the BlockBackend reference will point to
1088 * the old backing file. In order to avoid that the top image is already
1089 * deleted, so we can still empty it afterwards, increment the reference
1090 * counter here preemptively. */
1091 if (!drop) {
1092 bdrv_ref(bs);
1095 job = block_job_get("commit");
1096 assert(job);
1097 run_block_job(job, &local_err);
1098 if (local_err) {
1099 goto unref_backing;
1102 if (!drop) {
1103 BlockBackend *old_backing_blk;
1105 old_backing_blk = blk_new_with_bs(bs, BLK_PERM_WRITE, BLK_PERM_ALL,
1106 &local_err);
1107 if (!old_backing_blk) {
1108 goto unref_backing;
1110 ret = blk_make_empty(old_backing_blk, &local_err);
1111 blk_unref(old_backing_blk);
1112 if (ret == -ENOTSUP) {
1113 error_free(local_err);
1114 local_err = NULL;
1115 } else if (ret < 0) {
1116 goto unref_backing;
1120 unref_backing:
1121 if (!drop) {
1122 bdrv_unref(bs);
1125 done:
1126 qemu_progress_end();
1129 * Manually inactivate the image first because this way we can know whether
1130 * an error occurred. blk_unref() doesn't tell us about failures.
1132 ret = bdrv_inactivate_all();
1133 if (ret < 0 && !local_err) {
1134 error_setg_errno(&local_err, -ret, "Error while closing the image");
1136 blk_unref(blk);
1138 if (local_err) {
1139 error_report_err(local_err);
1140 return 1;
1143 qprintf(quiet, "Image committed.\n");
1144 return 0;
1148 * Returns -1 if 'buf' contains only zeroes, otherwise the byte index
1149 * of the first sector boundary within buf where the sector contains a
1150 * non-zero byte. This function is robust to a buffer that is not
1151 * sector-aligned.
1153 static int64_t find_nonzero(const uint8_t *buf, int64_t n)
1155 int64_t i;
1156 int64_t end = QEMU_ALIGN_DOWN(n, BDRV_SECTOR_SIZE);
1158 for (i = 0; i < end; i += BDRV_SECTOR_SIZE) {
1159 if (!buffer_is_zero(buf + i, BDRV_SECTOR_SIZE)) {
1160 return i;
1163 if (i < n && !buffer_is_zero(buf + i, n - end)) {
1164 return i;
1166 return -1;
1170 * Returns true iff the first sector pointed to by 'buf' contains at least
1171 * a non-NUL byte.
1173 * 'pnum' is set to the number of sectors (including and immediately following
1174 * the first one) that are known to be in the same allocated/unallocated state.
1175 * The function will try to align the end offset to alignment boundaries so
1176 * that the request will at least end aligned and consecutive requests will
1177 * also start at an aligned offset.
1179 static int is_allocated_sectors(const uint8_t *buf, int n, int *pnum,
1180 int64_t sector_num, int alignment)
1182 bool is_zero;
1183 int i, tail;
1185 if (n <= 0) {
1186 *pnum = 0;
1187 return 0;
1189 is_zero = buffer_is_zero(buf, BDRV_SECTOR_SIZE);
1190 for(i = 1; i < n; i++) {
1191 buf += BDRV_SECTOR_SIZE;
1192 if (is_zero != buffer_is_zero(buf, BDRV_SECTOR_SIZE)) {
1193 break;
1197 if (i == n) {
1199 * The whole buf is the same.
1200 * No reason to split it into chunks, so return now.
1202 *pnum = i;
1203 return !is_zero;
1206 tail = (sector_num + i) & (alignment - 1);
1207 if (tail) {
1208 if (is_zero && i <= tail) {
1210 * For sure next sector after i is data, and it will rewrite this
1211 * tail anyway due to RMW. So, let's just write data now.
1213 is_zero = false;
1215 if (!is_zero) {
1216 /* If possible, align up end offset of allocated areas. */
1217 i += alignment - tail;
1218 i = MIN(i, n);
1219 } else {
1221 * For sure next sector after i is data, and it will rewrite this
1222 * tail anyway due to RMW. Better is avoid RMW and write zeroes up
1223 * to aligned bound.
1225 i -= tail;
1228 *pnum = i;
1229 return !is_zero;
1233 * Like is_allocated_sectors, but if the buffer starts with a used sector,
1234 * up to 'min' consecutive sectors containing zeros are ignored. This avoids
1235 * breaking up write requests for only small sparse areas.
1237 static int is_allocated_sectors_min(const uint8_t *buf, int n, int *pnum,
1238 int min, int64_t sector_num, int alignment)
1240 int ret;
1241 int num_checked, num_used;
1243 if (n < min) {
1244 min = n;
1247 ret = is_allocated_sectors(buf, n, pnum, sector_num, alignment);
1248 if (!ret) {
1249 return ret;
1252 num_used = *pnum;
1253 buf += BDRV_SECTOR_SIZE * *pnum;
1254 n -= *pnum;
1255 sector_num += *pnum;
1256 num_checked = num_used;
1258 while (n > 0) {
1259 ret = is_allocated_sectors(buf, n, pnum, sector_num, alignment);
1261 buf += BDRV_SECTOR_SIZE * *pnum;
1262 n -= *pnum;
1263 sector_num += *pnum;
1264 num_checked += *pnum;
1265 if (ret) {
1266 num_used = num_checked;
1267 } else if (*pnum >= min) {
1268 break;
1272 *pnum = num_used;
1273 return 1;
1277 * Compares two buffers sector by sector. Returns 0 if the first
1278 * sector of each buffer matches, non-zero otherwise.
1280 * pnum is set to the sector-aligned size of the buffer prefix that
1281 * has the same matching status as the first sector.
1283 static int compare_buffers(const uint8_t *buf1, const uint8_t *buf2,
1284 int64_t bytes, int64_t *pnum)
1286 bool res;
1287 int64_t i = MIN(bytes, BDRV_SECTOR_SIZE);
1289 assert(bytes > 0);
1291 res = !!memcmp(buf1, buf2, i);
1292 while (i < bytes) {
1293 int64_t len = MIN(bytes - i, BDRV_SECTOR_SIZE);
1295 if (!!memcmp(buf1 + i, buf2 + i, len) != res) {
1296 break;
1298 i += len;
1301 *pnum = i;
1302 return res;
/*
 * Size in bytes of the I/O buffers allocated by img_compare(); also the
 * basis for the default ImgConvertState.buf_sectors in img_convert().
 */
1305 #define IO_BUF_SIZE (2 * MiB)
1308 * Check if passed sectors are empty (not allocated or contain only 0 bytes)
1310 * Intended for use by 'qemu-img compare': Returns 0 in case sectors are
1311 * filled with 0, 1 if sectors contain non-zero data (this is a comparison
1312 * failure), and 4 on error (the exit status for read errors), after emitting
1313 * an error message.
1315 * @param blk: BlockBackend for the image
1316 * @param offset: Starting offset to check
1317 * @param bytes: Number of bytes to check
1318 * @param filename: Name of disk file we are checking (logging purpose)
1319 * @param buffer: Allocated buffer for storing read data
1320 * @param quiet: Flag for quiet mode
1322 static int check_empty_sectors(BlockBackend *blk, int64_t offset,
1323 int64_t bytes, const char *filename,
1324 uint8_t *buffer, bool quiet)
1326 int ret = 0;
1327 int64_t idx;
1329 ret = blk_pread(blk, offset, bytes, buffer, 0);
1330 if (ret < 0) {
1331 error_report("Error while reading offset %" PRId64 " of %s: %s",
1332 offset, filename, strerror(-ret));
1333 return 4;
1335 idx = find_nonzero(buffer, bytes);
1336 if (idx >= 0) {
1337 qprintf(quiet, "Content mismatch at offset %" PRId64 "!\n",
1338 offset + idx);
1339 return 1;
1342 return 0;
1346 * Compares two images. Exit codes:
1348 * 0 - Images are identical or the requested help was printed
1349 * 1 - Images differ
1350 * >1 - Error occurred
/*
 * Implementation of 'qemu-img compare'.
 *
 * Parses the command line, opens the two images named by the last two
 * arguments and compares their guest-visible contents.
 *
 * Return value as set in this function: 0 when the images are identical,
 * 1 when they differ, 2 for an invalid cache mode or an image that could
 * not be opened, 3 when a block status query fails, 4 when a read or a
 * size query fails.
 */
1352 static int img_compare(int argc, char **argv)
1354 const char *fmt1 = NULL, *fmt2 = NULL, *cache, *filename1, *filename2;
1355 BlockBackend *blk1, *blk2;
1356 BlockDriverState *bs1, *bs2;
1357 int64_t total_size1, total_size2;
1358 uint8_t *buf1 = NULL, *buf2 = NULL;
1359 int64_t pnum1, pnum2;
1360 int allocated1, allocated2;
1361 int ret = 0; /* return value - 0 Ident, 1 Different, >1 Error */
1362 bool progress = false, quiet = false, strict = false;
1363 int flags;
1364 bool writethrough;
1365 int64_t total_size;
1366 int64_t offset = 0;
1367 int64_t chunk;
1368 int c;
1369 uint64_t progress_base;
1370 bool image_opts = false;
1371 bool force_share = false;
1373 cache = BDRV_DEFAULT_CACHE;
/* Option parsing; the leading ':' in the optstring makes getopt return ':' for a missing argument */
1374 for (;;) {
1375 static const struct option long_options[] = {
1376 {"help", no_argument, 0, 'h'},
1377 {"object", required_argument, 0, OPTION_OBJECT},
1378 {"image-opts", no_argument, 0, OPTION_IMAGE_OPTS},
1379 {"force-share", no_argument, 0, 'U'},
1380 {0, 0, 0, 0}
1382 c = getopt_long(argc, argv, ":hf:F:T:pqsU",
1383 long_options, NULL);
1384 if (c == -1) {
1385 break;
1387 switch (c) {
1388 case ':':
1389 missing_argument(argv[optind - 1]);
1390 break;
1391 case '?':
1392 unrecognized_option(argv[optind - 1]);
1393 break;
1394 case 'h':
1395 help();
1396 break;
/* -f / -F: format of the first / second image */
1397 case 'f':
1398 fmt1 = optarg;
1399 break;
1400 case 'F':
1401 fmt2 = optarg;
1402 break;
/* -T: cache mode, applied to both images */
1403 case 'T':
1404 cache = optarg;
1405 break;
1406 case 'p':
1407 progress = true;
1408 break;
1409 case 'q':
1410 quiet = true;
1411 break;
1412 case 's':
1413 strict = true;
1414 break;
1415 case 'U':
1416 force_share = true;
1417 break;
1418 case OPTION_OBJECT:
1420 Error *local_err = NULL;
/* A false return with no error set means help text was printed */
1422 if (!user_creatable_add_from_str(optarg, &local_err)) {
1423 if (local_err) {
1424 error_report_err(local_err);
1425 exit(2);
1426 } else {
1427 /* Help was printed */
1428 exit(EXIT_SUCCESS);
1431 break;
1433 case OPTION_IMAGE_OPTS:
1434 image_opts = true;
1435 break;
1439 /* Progress is not shown in Quiet mode */
1440 if (quiet) {
1441 progress = false;
/* Exactly two positional arguments (the image names) must remain */
1445 if (optind != argc - 2) {
1446 error_exit("Expecting two image file names");
1448 filename1 = argv[optind++];
1449 filename2 = argv[optind++];
1451 /* Initialize before goto out */
1452 qemu_progress_init(progress, 2.0);
1454 flags = 0;
1455 ret = bdrv_parse_cache_mode(cache, &flags, &writethrough);
1456 if (ret < 0) {
1457 error_report("Invalid source cache option: %s", cache);
1458 ret = 2;
1459 goto out3;
/* Open both images; the exit labels release only what has been acquired so far */
1462 blk1 = img_open(image_opts, filename1, fmt1, flags, writethrough, quiet,
1463 force_share);
1464 if (!blk1) {
1465 ret = 2;
1466 goto out3;
1469 blk2 = img_open(image_opts, filename2, fmt2, flags, writethrough, quiet,
1470 force_share);
1471 if (!blk2) {
1472 ret = 2;
1473 goto out2;
1475 bs1 = blk_bs(blk1);
1476 bs2 = blk_bs(blk2);
1478 buf1 = blk_blockalign(blk1, IO_BUF_SIZE);
1479 buf2 = blk_blockalign(blk2, IO_BUF_SIZE);
1480 total_size1 = blk_getlength(blk1);
1481 if (total_size1 < 0) {
1482 error_report("Can't get size of %s: %s",
1483 filename1, strerror(-total_size1));
1484 ret = 4;
1485 goto out;
1487 total_size2 = blk_getlength(blk2);
1488 if (total_size2 < 0) {
1489 error_report("Can't get size of %s: %s",
1490 filename2, strerror(-total_size2));
1491 ret = 4;
1492 goto out;
/* total_size is the range common to both images; progress is scaled to the larger one */
1494 total_size = MIN(total_size1, total_size2);
1495 progress_base = MAX(total_size1, total_size2);
1497 qemu_progress_print(0, 100);
1499 if (strict && total_size1 != total_size2) {
1500 ret = 1;
1501 qprintf(quiet, "Strict mode: Image size mismatch!\n");
1502 goto out;
/* Walk the common range; each step covers at most the shorter of the two status extents */
1505 while (offset < total_size) {
1506 int status1, status2;
1508 status1 = bdrv_block_status_above(bs1, NULL, offset,
1509 total_size1 - offset, &pnum1, NULL,
1510 NULL);
1511 if (status1 < 0) {
1512 ret = 3;
1513 error_report("Sector allocation test failed for %s", filename1);
1514 goto out;
1516 allocated1 = status1 & BDRV_BLOCK_ALLOCATED;
1518 status2 = bdrv_block_status_above(bs2, NULL, offset,
1519 total_size2 - offset, &pnum2, NULL,
1520 NULL);
1521 if (status2 < 0) {
1522 ret = 3;
1523 error_report("Sector allocation test failed for %s", filename2);
1524 goto out;
1526 allocated2 = status2 & BDRV_BLOCK_ALLOCATED;
1528 assert(pnum1 && pnum2);
1529 chunk = MIN(pnum1, pnum2);
/* Strict mode additionally requires the raw block status values to match */
1531 if (strict) {
1532 if (status1 != status2) {
1533 ret = 1;
1534 qprintf(quiet, "Strict mode: Offset %" PRId64
1535 " block status mismatch!\n", offset);
1536 goto out;
1539 if ((status1 & BDRV_BLOCK_ZERO) && (status2 & BDRV_BLOCK_ZERO)) {
1540 /* nothing to do */
1541 } else if (allocated1 == allocated2) {
/* Same allocation state: only when both are allocated is data read and compared */
1542 if (allocated1) {
1543 int64_t pnum;
1545 chunk = MIN(chunk, IO_BUF_SIZE);
1546 ret = blk_pread(blk1, offset, chunk, buf1, 0);
1547 if (ret < 0) {
1548 error_report("Error while reading offset %" PRId64
1549 " of %s: %s",
1550 offset, filename1, strerror(-ret));
1551 ret = 4;
1552 goto out;
1554 ret = blk_pread(blk2, offset, chunk, buf2, 0);
1555 if (ret < 0) {
1556 error_report("Error while reading offset %" PRId64
1557 " of %s: %s",
1558 offset, filename2, strerror(-ret));
1559 ret = 4;
1560 goto out;
/* A mismatch is reported at the chunk start if the first sector differs, else at the first differing sector */
1562 ret = compare_buffers(buf1, buf2, chunk, &pnum);
1563 if (ret || pnum != chunk) {
1564 qprintf(quiet, "Content mismatch at offset %" PRId64 "!\n",
1565 offset + (ret ? 0 : pnum));
1566 ret = 1;
1567 goto out;
1570 } else {
/* Only one side is allocated: that side must read as zeroes (buf1 is the scratch buffer in both cases) */
1571 chunk = MIN(chunk, IO_BUF_SIZE);
1572 if (allocated1) {
1573 ret = check_empty_sectors(blk1, offset, chunk,
1574 filename1, buf1, quiet);
1575 } else {
1576 ret = check_empty_sectors(blk2, offset, chunk,
1577 filename2, buf1, quiet);
1579 if (ret) {
1580 goto out;
1583 offset += chunk;
1584 qemu_progress_print(((float) chunk / progress_base) * 100, 100);
/* Sizes differ (non-strict mode): the part of the larger image beyond the common range must be zero */
1587 if (total_size1 != total_size2) {
1588 BlockBackend *blk_over;
1589 const char *filename_over;
1591 qprintf(quiet, "Warning: Image size mismatch!\n");
1592 if (total_size1 > total_size2) {
1593 blk_over = blk1;
1594 filename_over = filename1;
1595 } else {
1596 blk_over = blk2;
1597 filename_over = filename2;
1600 while (offset < progress_base) {
1601 ret = bdrv_block_status_above(blk_bs(blk_over), NULL, offset,
1602 progress_base - offset, &chunk,
1603 NULL, NULL);
1604 if (ret < 0) {
1605 ret = 3;
1606 error_report("Sector allocation test failed for %s",
1607 filename_over);
1608 goto out;
/* Data is read only for ranges that are allocated and not already flagged as zero */
1611 if (ret & BDRV_BLOCK_ALLOCATED && !(ret & BDRV_BLOCK_ZERO)) {
1612 chunk = MIN(chunk, IO_BUF_SIZE);
1613 ret = check_empty_sectors(blk_over, offset, chunk,
1614 filename_over, buf1, quiet);
1615 if (ret) {
1616 goto out;
1619 offset += chunk;
1620 qemu_progress_print(((float) chunk / progress_base) * 100, 100);
1624 qprintf(quiet, "Images are identical.\n");
1625 ret = 0;
/* Cleanup: out frees both buffers and blk2, out2 releases blk1, out3 only ends progress reporting */
1627 out:
1628 qemu_vfree(buf1);
1629 qemu_vfree(buf2);
1630 blk_unref(blk2);
1631 out2:
1632 blk_unref(blk1);
1633 out3:
1634 qemu_progress_end();
1635 return ret;
1638 /* Convenience wrapper around qmp_block_dirty_bitmap_merge */
1639 static void do_dirty_bitmap_merge(const char *dst_node, const char *dst_name,
1640 const char *src_node, const char *src_name,
1641 Error **errp)
1643 BlockDirtyBitmapOrStr *merge_src;
1644 BlockDirtyBitmapOrStrList *list = NULL;
1646 merge_src = g_new0(BlockDirtyBitmapOrStr, 1);
1647 merge_src->type = QTYPE_QDICT;
1648 merge_src->u.external.node = g_strdup(src_node);
1649 merge_src->u.external.name = g_strdup(src_name);
1650 QAPI_LIST_PREPEND(list, merge_src);
1651 qmp_block_dirty_bitmap_merge(dst_node, dst_name, list, errp);
1652 qapi_free_BlockDirtyBitmapOrStrList(list);
/* How convert treats a range of source sectors; set by convert_iteration_sectors() */
1655 enum ImgConvertBlockStatus {
/* Range is read from the source and handed to the write path */
1656 BLK_DATA,
/* Range reads as zeroes */
1657 BLK_ZERO,
/* Range is left unallocated in the target so its backing file stays visible */
1658 BLK_BACKING_FILE,
/* Size of the per-coroutine arrays in ImgConvertState and upper limit for -m */
1661 #define MAX_COROUTINES 16
/* Throttle group name used by set_rate_limit() */
1662 #define CONVERT_THROTTLE_GROUP "img_convert"
/* State shared by img_convert(), convert_do_copy() and the copy coroutines */
1664 typedef struct ImgConvertState {
/* Source images: src_num entries, with per-source length and alignment in sectors */
1665 BlockBackend **src;
1666 int64_t *src_sectors;
1667 int *src_alignment;
1668 int src_num;
1669 int64_t total_sectors;
/* Progress accounting: allocated_sectors is summed up front in convert_do_copy(), allocated_done while copying */
1670 int64_t allocated_sectors;
1671 int64_t allocated_done;
/* Next sector to be handed out to a copy coroutine (advanced under 'lock') */
1672 int64_t sector_num;
/* With wr_in_order: the sector the next write has to start at */
1673 int64_t wr_offs;
/* Status of the most recently queried range; valid up to (excluding) sector_next_status */
1674 enum ImgConvertBlockStatus status;
1675 int64_t sector_next_status;
1676 BlockBackend *target;
/* When set, BLK_ZERO ranges are not written to the target */
1677 bool has_zero_init;
1678 bool compressed;
1679 bool target_is_new;
1680 bool target_has_backing;
1681 int64_t target_backing_sectors; /* negative if unknown */
1682 bool wr_in_order;
1683 bool copy_range;
/* With salvage, read and block-status errors are worked around instead of failing the conversion */
1684 bool salvage;
1685 bool quiet;
/* In sectors; 0 turns sparse detection off */
1686 int min_sparse;
1687 int alignment;
1688 size_t cluster_sectors;
/* Size in sectors of each coroutine's data buffer */
1689 size_t buf_sectors;
1690 long num_coroutines;
1691 int running_coroutines;
1692 Coroutine *co[MAX_COROUTINES];
/* Per coroutine: sector it is waiting to write, or -1 when not waiting */
1693 int64_t wait_sector_num[MAX_COROUTINES];
1694 CoMutex lock;
/* -EINPROGRESS while the copy is running, then 0 or a negative errno */
1695 int ret;
1696 } ImgConvertState;
1698 static void convert_select_part(ImgConvertState *s, int64_t sector_num,
1699 int *src_cur, int64_t *src_cur_offset)
1701 *src_cur = 0;
1702 *src_cur_offset = 0;
1703 while (sector_num - *src_cur_offset >= s->src_sectors[*src_cur]) {
1704 *src_cur_offset += s->src_sectors[*src_cur];
1705 (*src_cur)++;
1706 assert(*src_cur < s->src_num);
/*
 * Work out how many sectors starting at 'sector_num' can be handled in
 * one step and which ImgConvertBlockStatus applies to them.
 *
 * When the cached status does not cover 'sector_num' any more, the block
 * status of the source is queried and s->status / s->sector_next_status
 * are refreshed.  Returns the number of sectors, or the negative error
 * from the block status query (only when not salvaging).
 */
1710 static int convert_iteration_sectors(ImgConvertState *s, int64_t sector_num)
1712 int64_t src_cur_offset;
1713 int ret, n, src_cur;
1714 bool post_backing_zero = false;
1716 convert_select_part(s, sector_num, &src_cur, &src_cur_offset);
1718 assert(s->total_sectors > sector_num);
1719 n = MIN(s->total_sectors - sector_num, BDRV_REQUEST_MAX_SECTORS);
1721 if (s->target_backing_sectors >= 0) {
1722 if (sector_num >= s->target_backing_sectors) {
1723 post_backing_zero = true;
1724 } else if (sector_num + n > s->target_backing_sectors) {
1725 /* Split requests around target_backing_sectors (because
1726 * starting from there, zeros are handled differently) */
1727 n = s->target_backing_sectors - sector_num;
/* Cached status is exhausted: query the source again */
1731 if (s->sector_next_status <= sector_num) {
1732 uint64_t offset = (sector_num - src_cur_offset) * BDRV_SECTOR_SIZE;
1733 int64_t count;
1734 int tail;
1735 BlockDriverState *src_bs = blk_bs(s->src[src_cur]);
1736 BlockDriverState *base;
/* 'base' is passed to bdrv_block_status_above(); NULL when the target has no backing file */
1738 if (s->target_has_backing) {
1739 base = bdrv_cow_bs(bdrv_skip_filters(src_bs));
1740 } else {
1741 base = NULL;
/* Loop until the query succeeds; only the salvage path shrinks n and retries */
1744 do {
1745 count = n * BDRV_SECTOR_SIZE;
1747 ret = bdrv_block_status_above(src_bs, base, offset, count, &count,
1748 NULL, NULL);
1750 if (ret < 0) {
1751 if (s->salvage) {
1752 if (n == 1) {
1753 if (!s->quiet) {
1754 warn_report("error while reading block status at "
1755 "offset %" PRIu64 ": %s", offset,
1756 strerror(-ret));
1758 /* Just try to read the data, then */
1759 ret = BDRV_BLOCK_DATA;
1760 count = BDRV_SECTOR_SIZE;
1761 } else {
1762 /* Retry on a shorter range */
1763 n = DIV_ROUND_UP(n, 4);
1765 } else {
1766 error_report("error while reading block status at offset "
1767 "%" PRIu64 ": %s", offset, strerror(-ret));
1768 return ret;
1771 } while (ret < 0);
1773 n = DIV_ROUND_UP(count, BDRV_SECTOR_SIZE);
1776 * Avoid that s->sector_next_status becomes unaligned to the source
1777 * request alignment and/or cluster size to avoid unnecessary read
1778 * cycles.
1780 tail = (sector_num - src_cur_offset + n) % s->src_alignment[src_cur];
1781 if (n > tail) {
1782 n -= tail;
/* Translate the block status flags into an ImgConvertBlockStatus */
1785 if (ret & BDRV_BLOCK_ZERO) {
1786 s->status = post_backing_zero ? BLK_BACKING_FILE : BLK_ZERO;
1787 } else if (ret & BDRV_BLOCK_DATA) {
1788 s->status = BLK_DATA;
1789 } else {
1790 s->status = s->target_has_backing ? BLK_BACKING_FILE : BLK_DATA;
1793 s->sector_next_status = sector_num + n;
/* Never go past the range the cached status is valid for; data is further limited to one buffer */
1796 n = MIN(n, s->sector_next_status - sector_num);
1797 if (s->status == BLK_DATA) {
1798 n = MIN(n, s->buf_sectors);
1801 /* We need to write complete clusters for compressed images, so if an
1802 * unallocated area is shorter than that, we must consider the whole
1803 * cluster allocated. */
1804 if (s->compressed) {
1805 if (n < s->cluster_sectors) {
1806 n = MIN(s->cluster_sectors, s->total_sectors - sector_num);
1807 s->status = BLK_DATA;
1808 } else {
1809 n = QEMU_ALIGN_DOWN(n, s->cluster_sectors);
1813 return n;
1816 static int coroutine_fn convert_co_read(ImgConvertState *s, int64_t sector_num,
1817 int nb_sectors, uint8_t *buf)
1819 uint64_t single_read_until = 0;
1820 int n, ret;
1822 assert(nb_sectors <= s->buf_sectors);
1823 while (nb_sectors > 0) {
1824 BlockBackend *blk;
1825 int src_cur;
1826 int64_t bs_sectors, src_cur_offset;
1827 uint64_t offset;
1829 /* In the case of compression with multiple source files, we can get a
1830 * nb_sectors that spreads into the next part. So we must be able to
1831 * read across multiple BDSes for one convert_read() call. */
1832 convert_select_part(s, sector_num, &src_cur, &src_cur_offset);
1833 blk = s->src[src_cur];
1834 bs_sectors = s->src_sectors[src_cur];
1836 offset = (sector_num - src_cur_offset) << BDRV_SECTOR_BITS;
1838 n = MIN(nb_sectors, bs_sectors - (sector_num - src_cur_offset));
1839 if (single_read_until > offset) {
1840 n = 1;
1843 ret = blk_co_pread(blk, offset, n << BDRV_SECTOR_BITS, buf, 0);
1844 if (ret < 0) {
1845 if (s->salvage) {
1846 if (n > 1) {
1847 single_read_until = offset + (n << BDRV_SECTOR_BITS);
1848 continue;
1849 } else {
1850 if (!s->quiet) {
1851 warn_report("error while reading offset %" PRIu64
1852 ": %s", offset, strerror(-ret));
1854 memset(buf, 0, BDRV_SECTOR_SIZE);
1856 } else {
1857 return ret;
1861 sector_num += n;
1862 nb_sectors -= n;
1863 buf += n * BDRV_SECTOR_SIZE;
1866 return 0;
/*
 * Write 'nb_sectors' sectors starting at 'sector_num' to the target
 * according to 'status'.  'buf' holds the data for BLK_DATA ranges.
 * Returns 0 on success or the negative error of the failed write.
 */
1870 static int coroutine_fn convert_co_write(ImgConvertState *s, int64_t sector_num,
1871 int nb_sectors, uint8_t *buf,
1872 enum ImgConvertBlockStatus status)
1874 int ret;
/* Each pass handles n sectors; n may be shortened by is_allocated_sectors_min() below */
1876 while (nb_sectors > 0) {
1877 int n = nb_sectors;
1878 BdrvRequestFlags flags = s->compressed ? BDRV_REQ_WRITE_COMPRESSED : 0;
1880 switch (status) {
1881 case BLK_BACKING_FILE:
1882 /* If we have a backing file, leave clusters unallocated that are
1883 * unallocated in the source image, so that the backing file is
1884 * visible at the respective offset. */
1885 assert(s->target_has_backing);
1886 break;
1888 case BLK_DATA:
1889 /* If we're told to keep the target fully allocated (-S 0) or there
1890 * is real non-zero data, we must write it. Otherwise we can treat
1891 * it as zero sectors.
1892 * Compressed clusters need to be written as a whole, so in that
1893 * case we can only save the write if the buffer is completely
1894 * zeroed. */
/* Note: the is_allocated_sectors_min() call in this condition updates n as a side effect */
1895 if (!s->min_sparse ||
1896 (!s->compressed &&
1897 is_allocated_sectors_min(buf, n, &n, s->min_sparse,
1898 sector_num, s->alignment)) ||
1899 (s->compressed &&
1900 !buffer_is_zero(buf, n * BDRV_SECTOR_SIZE)))
1902 ret = blk_co_pwrite(s->target, sector_num << BDRV_SECTOR_BITS,
1903 n << BDRV_SECTOR_BITS, buf, flags);
1904 if (ret < 0) {
1905 return ret;
1907 break;
1909 /* fall-through */
1911 case BLK_ZERO:
/* With has_zero_init nothing is written for a zero range */
1912 if (s->has_zero_init) {
1913 assert(!s->target_has_backing);
1914 break;
1916 ret = blk_co_pwrite_zeroes(s->target,
1917 sector_num << BDRV_SECTOR_BITS,
1918 n << BDRV_SECTOR_BITS,
1919 BDRV_REQ_MAY_UNMAP);
1920 if (ret < 0) {
1921 return ret;
1923 break;
1926 sector_num += n;
1927 nb_sectors -= n;
1928 buf += n * BDRV_SECTOR_SIZE;
1931 return 0;
1934 static int coroutine_fn convert_co_copy_range(ImgConvertState *s, int64_t sector_num,
1935 int nb_sectors)
1937 int n, ret;
1939 while (nb_sectors > 0) {
1940 BlockBackend *blk;
1941 int src_cur;
1942 int64_t bs_sectors, src_cur_offset;
1943 int64_t offset;
1945 convert_select_part(s, sector_num, &src_cur, &src_cur_offset);
1946 offset = (sector_num - src_cur_offset) << BDRV_SECTOR_BITS;
1947 blk = s->src[src_cur];
1948 bs_sectors = s->src_sectors[src_cur];
1950 n = MIN(nb_sectors, bs_sectors - (sector_num - src_cur_offset));
1952 ret = blk_co_copy_range(blk, offset, s->target,
1953 sector_num << BDRV_SECTOR_BITS,
1954 n << BDRV_SECTOR_BITS, 0, 0);
1955 if (ret < 0) {
1956 return ret;
1959 sector_num += n;
1960 nb_sectors -= n;
1962 return 0;
/*
 * Coroutine body of the conversion; 'opaque' is the shared
 * ImgConvertState.  Each coroutine repeatedly claims the next range of
 * sectors under s->lock, reads it (or prepares zeroes) and writes it to
 * the target.  The first error is stored in s->ret; the last coroutine
 * to finish turns -EINPROGRESS into 0.
 */
1965 static void coroutine_fn convert_co_do_copy(void *opaque)
1967 ImgConvertState *s = opaque;
1968 uint8_t *buf = NULL;
1969 int ret, i;
1970 int index = -1;
/* Find this coroutine's slot in s->co[] */
1972 for (i = 0; i < s->num_coroutines; i++) {
1973 if (s->co[i] == qemu_coroutine_self()) {
1974 index = i;
1975 break;
1978 assert(index >= 0);
1980 s->running_coroutines++;
1981 buf = blk_blockalign(s->target, s->buf_sectors * BDRV_SECTOR_SIZE);
1983 while (1) {
1984 int n;
1985 int64_t sector_num;
1986 enum ImgConvertBlockStatus status;
1987 bool copy_range;
/* Claim the next range under the lock; stop on error or when everything has been handed out */
1989 qemu_co_mutex_lock(&s->lock);
1990 if (s->ret != -EINPROGRESS || s->sector_num >= s->total_sectors) {
1991 qemu_co_mutex_unlock(&s->lock);
1992 break;
1994 WITH_GRAPH_RDLOCK_GUARD() {
1995 n = convert_iteration_sectors(s, s->sector_num);
1997 if (n < 0) {
1998 qemu_co_mutex_unlock(&s->lock);
1999 s->ret = n;
2000 break;
2002 /* save current sector and allocation status to local variables */
2003 sector_num = s->sector_num;
2004 status = s->status;
/* Without sparse detection zero ranges are written from buf, so they must fit into it */
2005 if (!s->min_sparse && s->status == BLK_ZERO) {
2006 n = MIN(n, s->buf_sectors);
2008 /* increment global sector counter so that other coroutines can
2009 * already continue reading beyond this request */
2010 s->sector_num += n;
2011 qemu_co_mutex_unlock(&s->lock);
2013 if (status == BLK_DATA || (!s->min_sparse && status == BLK_ZERO)) {
2014 s->allocated_done += n;
2015 qemu_progress_print(100.0 * s->allocated_done /
2016 s->allocated_sectors, 0);
/* Re-entered via goto after a failed copy_range attempt, with s->copy_range cleared */
2019 retry:
/* NOTE(review): this reads the shared s->status rather than the local 'status' snapshot - confirm that is intended */
2020 copy_range = s->copy_range && s->status == BLK_DATA;
2021 if (status == BLK_DATA && !copy_range) {
2022 ret = convert_co_read(s, sector_num, n, buf);
2023 if (ret < 0) {
2024 error_report("error while reading at byte %lld: %s",
2025 sector_num * BDRV_SECTOR_SIZE, strerror(-ret));
2026 s->ret = ret;
2028 } else if (!s->min_sparse && status == BLK_ZERO) {
/* Sparse detection is off: write the zero range out as ordinary data */
2029 status = BLK_DATA;
2030 memset(buf, 0x00, n * BDRV_SECTOR_SIZE);
2033 if (s->wr_in_order) {
2034 /* keep writes in order */
2035 while (s->wr_offs != sector_num && s->ret == -EINPROGRESS) {
2036 s->wait_sector_num[index] = sector_num;
2037 qemu_coroutine_yield();
2039 s->wait_sector_num[index] = -1;
2042 if (s->ret == -EINPROGRESS) {
2043 if (copy_range) {
2044 WITH_GRAPH_RDLOCK_GUARD() {
2045 ret = convert_co_copy_range(s, sector_num, n);
/* Any copy_range failure disables it for the rest of the job and retries this range with read + write */
2047 if (ret) {
2048 s->copy_range = false;
2049 goto retry;
2051 } else {
2052 ret = convert_co_write(s, sector_num, n, buf, status);
2054 if (ret < 0) {
2055 error_report("error while writing at byte %lld: %s",
2056 sector_num * BDRV_SECTOR_SIZE, strerror(-ret));
2057 s->ret = ret;
2061 if (s->wr_in_order) {
2062 /* reenter the coroutine that might have waited
2063 * for this write to complete */
2064 s->wr_offs = sector_num + n;
2065 for (i = 0; i < s->num_coroutines; i++) {
2066 if (s->co[i] && s->wait_sector_num[i] == s->wr_offs) {
2068 * A -> B -> A cannot occur because A has
2069 * s->wait_sector_num[i] == -1 during A -> B. Therefore
2070 * B will never enter A during this time window.
2072 qemu_coroutine_enter(s->co[i]);
2073 break;
/* Teardown: release the buffer and the slot in s->co[] */
2079 qemu_vfree(buf);
2080 s->co[index] = NULL;
2081 s->running_coroutines--;
2082 if (!s->running_coroutines && s->ret == -EINPROGRESS) {
2083 /* the convert job finished successfully */
2084 s->ret = 0;
2088 static int convert_do_copy(ImgConvertState *s)
2090 int ret, i, n;
2091 int64_t sector_num = 0;
2093 /* Check whether we have zero initialisation or can get it efficiently */
2094 if (!s->has_zero_init && s->target_is_new && s->min_sparse &&
2095 !s->target_has_backing) {
2096 s->has_zero_init = bdrv_has_zero_init(blk_bs(s->target));
2099 /* Allocate buffer for copied data. For compressed images, only one cluster
2100 * can be copied at a time. */
2101 if (s->compressed) {
2102 if (s->cluster_sectors <= 0 || s->cluster_sectors > s->buf_sectors) {
2103 error_report("invalid cluster size");
2104 return -EINVAL;
2106 s->buf_sectors = s->cluster_sectors;
2109 while (sector_num < s->total_sectors) {
2110 n = convert_iteration_sectors(s, sector_num);
2111 if (n < 0) {
2112 return n;
2114 if (s->status == BLK_DATA || (!s->min_sparse && s->status == BLK_ZERO))
2116 s->allocated_sectors += n;
2118 sector_num += n;
2121 /* Do the copy */
2122 s->sector_next_status = 0;
2123 s->ret = -EINPROGRESS;
2125 qemu_co_mutex_init(&s->lock);
2126 for (i = 0; i < s->num_coroutines; i++) {
2127 s->co[i] = qemu_coroutine_create(convert_co_do_copy, s);
2128 s->wait_sector_num[i] = -1;
2129 qemu_coroutine_enter(s->co[i]);
2132 while (s->running_coroutines) {
2133 main_loop_wait(false);
2136 if (s->compressed && !s->ret) {
2137 /* signal EOF to align */
2138 ret = blk_pwrite_compressed(s->target, 0, 0, NULL);
2139 if (ret < 0) {
2140 return ret;
2144 return s->ret;
2147 /* Check that bitmaps can be copied, or output an error */
2148 static int convert_check_bitmaps(BlockDriverState *src, bool skip_broken)
2150 BdrvDirtyBitmap *bm;
2152 if (!bdrv_supports_persistent_dirty_bitmap(src)) {
2153 error_report("Source lacks bitmap support");
2154 return -1;
2156 FOR_EACH_DIRTY_BITMAP(src, bm) {
2157 if (!bdrv_dirty_bitmap_get_persistence(bm)) {
2158 continue;
2160 if (!skip_broken && bdrv_dirty_bitmap_inconsistent(bm)) {
2161 error_report("Cannot copy inconsistent bitmap '%s'",
2162 bdrv_dirty_bitmap_name(bm));
2163 error_printf("Try --skip-broken-bitmaps, or "
2164 "use 'qemu-img bitmap --remove' to delete it\n");
2165 return -1;
2168 return 0;
2171 static int convert_copy_bitmaps(BlockDriverState *src, BlockDriverState *dst,
2172 bool skip_broken)
2174 BdrvDirtyBitmap *bm;
2175 Error *err = NULL;
2177 FOR_EACH_DIRTY_BITMAP(src, bm) {
2178 const char *name;
2180 if (!bdrv_dirty_bitmap_get_persistence(bm)) {
2181 continue;
2183 name = bdrv_dirty_bitmap_name(bm);
2184 if (skip_broken && bdrv_dirty_bitmap_inconsistent(bm)) {
2185 warn_report("Skipping inconsistent bitmap '%s'", name);
2186 continue;
2188 qmp_block_dirty_bitmap_add(dst->node_name, name,
2189 true, bdrv_dirty_bitmap_granularity(bm),
2190 true, true,
2191 true, !bdrv_dirty_bitmap_enabled(bm),
2192 &err);
2193 if (err) {
2194 error_reportf_err(err, "Failed to create bitmap %s: ", name);
2195 return -1;
2198 do_dirty_bitmap_merge(dst->node_name, name, src->node_name, name,
2199 &err);
2200 if (err) {
2201 error_reportf_err(err, "Failed to populate bitmap %s: ", name);
2202 qmp_block_dirty_bitmap_remove(dst->node_name, name, NULL);
2203 return -1;
2207 return 0;
/* Largest value, in sectors, that img_convert() accepts for the -S sparse-detection size */
2210 #define MAX_BUF_SECTORS 32768
2212 static void set_rate_limit(BlockBackend *blk, int64_t rate_limit)
2214 ThrottleConfig cfg;
2216 throttle_config_init(&cfg);
2217 cfg.buckets[THROTTLE_BPS_WRITE].avg = rate_limit;
2219 blk_io_limits_enable(blk, CONVERT_THROTTLE_GROUP);
2220 blk_set_io_limits(blk, &cfg);
2223 static int img_convert(int argc, char **argv)
2225 int c, bs_i, flags, src_flags = BDRV_O_NO_SHARE;
2226 const char *fmt = NULL, *out_fmt = NULL, *cache = "unsafe",
2227 *src_cache = BDRV_DEFAULT_CACHE, *out_baseimg = NULL,
2228 *out_filename, *out_baseimg_param, *snapshot_name = NULL,
2229 *backing_fmt = NULL;
2230 BlockDriver *drv = NULL, *proto_drv = NULL;
2231 BlockDriverInfo bdi;
2232 BlockDriverState *out_bs;
2233 QemuOpts *opts = NULL, *sn_opts = NULL;
2234 QemuOptsList *create_opts = NULL;
2235 QDict *open_opts = NULL;
2236 char *options = NULL;
2237 Error *local_err = NULL;
2238 bool writethrough, src_writethrough, image_opts = false,
2239 skip_create = false, progress = false, tgt_image_opts = false;
2240 int64_t ret = -EINVAL;
2241 bool force_share = false;
2242 bool explict_min_sparse = false;
2243 bool bitmaps = false;
2244 bool skip_broken = false;
2245 int64_t rate_limit = 0;
2247 ImgConvertState s = (ImgConvertState) {
2248 /* Need at least 4k of zeros for sparse detection */
2249 .min_sparse = 8,
2250 .copy_range = false,
2251 .buf_sectors = IO_BUF_SIZE / BDRV_SECTOR_SIZE,
2252 .wr_in_order = true,
2253 .num_coroutines = 8,
2256 for(;;) {
2257 static const struct option long_options[] = {
2258 {"help", no_argument, 0, 'h'},
2259 {"object", required_argument, 0, OPTION_OBJECT},
2260 {"image-opts", no_argument, 0, OPTION_IMAGE_OPTS},
2261 {"force-share", no_argument, 0, 'U'},
2262 {"target-image-opts", no_argument, 0, OPTION_TARGET_IMAGE_OPTS},
2263 {"salvage", no_argument, 0, OPTION_SALVAGE},
2264 {"target-is-zero", no_argument, 0, OPTION_TARGET_IS_ZERO},
2265 {"bitmaps", no_argument, 0, OPTION_BITMAPS},
2266 {"skip-broken-bitmaps", no_argument, 0, OPTION_SKIP_BROKEN},
2267 {0, 0, 0, 0}
2269 c = getopt_long(argc, argv, ":hf:O:B:CcF:o:l:S:pt:T:qnm:WUr:",
2270 long_options, NULL);
2271 if (c == -1) {
2272 break;
2274 switch(c) {
2275 case ':':
2276 missing_argument(argv[optind - 1]);
2277 break;
2278 case '?':
2279 unrecognized_option(argv[optind - 1]);
2280 break;
2281 case 'h':
2282 help();
2283 break;
2284 case 'f':
2285 fmt = optarg;
2286 break;
2287 case 'O':
2288 out_fmt = optarg;
2289 break;
2290 case 'B':
2291 out_baseimg = optarg;
2292 break;
2293 case 'C':
2294 s.copy_range = true;
2295 break;
2296 case 'c':
2297 s.compressed = true;
2298 break;
2299 case 'F':
2300 backing_fmt = optarg;
2301 break;
2302 case 'o':
2303 if (accumulate_options(&options, optarg) < 0) {
2304 goto fail_getopt;
2306 break;
2307 case 'l':
2308 if (strstart(optarg, SNAPSHOT_OPT_BASE, NULL)) {
2309 sn_opts = qemu_opts_parse_noisily(&internal_snapshot_opts,
2310 optarg, false);
2311 if (!sn_opts) {
2312 error_report("Failed in parsing snapshot param '%s'",
2313 optarg);
2314 goto fail_getopt;
2316 } else {
2317 snapshot_name = optarg;
2319 break;
2320 case 'S':
2322 int64_t sval;
2324 sval = cvtnum("buffer size for sparse output", optarg);
2325 if (sval < 0) {
2326 goto fail_getopt;
2327 } else if (!QEMU_IS_ALIGNED(sval, BDRV_SECTOR_SIZE) ||
2328 sval / BDRV_SECTOR_SIZE > MAX_BUF_SECTORS) {
2329 error_report("Invalid buffer size for sparse output specified. "
2330 "Valid sizes are multiples of %llu up to %llu. Select "
2331 "0 to disable sparse detection (fully allocates output).",
2332 BDRV_SECTOR_SIZE, MAX_BUF_SECTORS * BDRV_SECTOR_SIZE);
2333 goto fail_getopt;
2336 s.min_sparse = sval / BDRV_SECTOR_SIZE;
2337 explict_min_sparse = true;
2338 break;
2340 case 'p':
2341 progress = true;
2342 break;
2343 case 't':
2344 cache = optarg;
2345 break;
2346 case 'T':
2347 src_cache = optarg;
2348 break;
2349 case 'q':
2350 s.quiet = true;
2351 break;
2352 case 'n':
2353 skip_create = true;
2354 break;
2355 case 'm':
2356 if (qemu_strtol(optarg, NULL, 0, &s.num_coroutines) ||
2357 s.num_coroutines < 1 || s.num_coroutines > MAX_COROUTINES) {
2358 error_report("Invalid number of coroutines. Allowed number of"
2359 " coroutines is between 1 and %d", MAX_COROUTINES);
2360 goto fail_getopt;
2362 break;
2363 case 'W':
2364 s.wr_in_order = false;
2365 break;
2366 case 'U':
2367 force_share = true;
2368 break;
2369 case 'r':
2370 rate_limit = cvtnum("rate limit", optarg);
2371 if (rate_limit < 0) {
2372 goto fail_getopt;
2374 break;
2375 case OPTION_OBJECT:
2376 user_creatable_process_cmdline(optarg);
2377 break;
2378 case OPTION_IMAGE_OPTS:
2379 image_opts = true;
2380 break;
2381 case OPTION_SALVAGE:
2382 s.salvage = true;
2383 break;
2384 case OPTION_TARGET_IMAGE_OPTS:
2385 tgt_image_opts = true;
2386 break;
2387 case OPTION_TARGET_IS_ZERO:
2389 * The user asserting that the target is blank has the
2390 * same effect as the target driver supporting zero
2391 * initialisation.
2393 s.has_zero_init = true;
2394 break;
2395 case OPTION_BITMAPS:
2396 bitmaps = true;
2397 break;
2398 case OPTION_SKIP_BROKEN:
2399 skip_broken = true;
2400 break;
2404 if (!out_fmt && !tgt_image_opts) {
2405 out_fmt = "raw";
2408 if (skip_broken && !bitmaps) {
2409 error_report("Use of --skip-broken-bitmaps requires --bitmaps");
2410 goto fail_getopt;
2413 if (s.compressed && s.copy_range) {
2414 error_report("Cannot enable copy offloading when -c is used");
2415 goto fail_getopt;
2418 if (explict_min_sparse && s.copy_range) {
2419 error_report("Cannot enable copy offloading when -S is used");
2420 goto fail_getopt;
2423 if (s.copy_range && s.salvage) {
2424 error_report("Cannot use copy offloading in salvaging mode");
2425 goto fail_getopt;
2428 if (tgt_image_opts && !skip_create) {
2429 error_report("--target-image-opts requires use of -n flag");
2430 goto fail_getopt;
2433 if (skip_create && options) {
2434 error_report("-o has no effect when skipping image creation");
2435 goto fail_getopt;
2438 if (s.has_zero_init && !skip_create) {
2439 error_report("--target-is-zero requires use of -n flag");
2440 goto fail_getopt;
2443 s.src_num = argc - optind - 1;
2444 out_filename = s.src_num >= 1 ? argv[argc - 1] : NULL;
2446 if (options && has_help_option(options)) {
2447 if (out_fmt) {
2448 ret = print_block_option_help(out_filename, out_fmt);
2449 goto fail_getopt;
2450 } else {
2451 error_report("Option help requires a format be specified");
2452 goto fail_getopt;
2456 if (s.src_num < 1) {
2457 error_report("Must specify image file name");
2458 goto fail_getopt;
2461 /* ret is still -EINVAL until here */
2462 ret = bdrv_parse_cache_mode(src_cache, &src_flags, &src_writethrough);
2463 if (ret < 0) {
2464 error_report("Invalid source cache option: %s", src_cache);
2465 goto fail_getopt;
2468 /* Initialize before goto out */
2469 if (s.quiet) {
2470 progress = false;
2472 qemu_progress_init(progress, 1.0);
2473 qemu_progress_print(0, 100);
2475 s.src = g_new0(BlockBackend *, s.src_num);
2476 s.src_sectors = g_new(int64_t, s.src_num);
2477 s.src_alignment = g_new(int, s.src_num);
2479 for (bs_i = 0; bs_i < s.src_num; bs_i++) {
2480 BlockDriverState *src_bs;
2481 s.src[bs_i] = img_open(image_opts, argv[optind + bs_i],
2482 fmt, src_flags, src_writethrough, s.quiet,
2483 force_share);
2484 if (!s.src[bs_i]) {
2485 ret = -1;
2486 goto out;
2488 s.src_sectors[bs_i] = blk_nb_sectors(s.src[bs_i]);
2489 if (s.src_sectors[bs_i] < 0) {
2490 error_report("Could not get size of %s: %s",
2491 argv[optind + bs_i], strerror(-s.src_sectors[bs_i]));
2492 ret = -1;
2493 goto out;
2495 src_bs = blk_bs(s.src[bs_i]);
2496 s.src_alignment[bs_i] = DIV_ROUND_UP(src_bs->bl.request_alignment,
2497 BDRV_SECTOR_SIZE);
2498 if (!bdrv_get_info(src_bs, &bdi)) {
2499 s.src_alignment[bs_i] = MAX(s.src_alignment[bs_i],
2500 bdi.cluster_size / BDRV_SECTOR_SIZE);
2502 s.total_sectors += s.src_sectors[bs_i];
2505 if (sn_opts) {
2506 bdrv_snapshot_load_tmp(blk_bs(s.src[0]),
2507 qemu_opt_get(sn_opts, SNAPSHOT_OPT_ID),
2508 qemu_opt_get(sn_opts, SNAPSHOT_OPT_NAME),
2509 &local_err);
2510 } else if (snapshot_name != NULL) {
2511 if (s.src_num > 1) {
2512 error_report("No support for concatenating multiple snapshot");
2513 ret = -1;
2514 goto out;
2517 bdrv_snapshot_load_tmp_by_id_or_name(blk_bs(s.src[0]), snapshot_name,
2518 &local_err);
2520 if (local_err) {
2521 error_reportf_err(local_err, "Failed to load snapshot: ");
2522 ret = -1;
2523 goto out;
2526 if (!skip_create) {
2527 /* Find driver and parse its options */
2528 drv = bdrv_find_format(out_fmt);
2529 if (!drv) {
2530 error_report("Unknown file format '%s'", out_fmt);
2531 ret = -1;
2532 goto out;
2535 proto_drv = bdrv_find_protocol(out_filename, true, &local_err);
2536 if (!proto_drv) {
2537 error_report_err(local_err);
2538 ret = -1;
2539 goto out;
2542 if (!drv->create_opts) {
2543 error_report("Format driver '%s' does not support image creation",
2544 drv->format_name);
2545 ret = -1;
2546 goto out;
2549 if (!proto_drv->create_opts) {
2550 error_report("Protocol driver '%s' does not support image creation",
2551 proto_drv->format_name);
2552 ret = -1;
2553 goto out;
2556 create_opts = qemu_opts_append(create_opts, drv->create_opts);
2557 create_opts = qemu_opts_append(create_opts, proto_drv->create_opts);
2559 opts = qemu_opts_create(create_opts, NULL, 0, &error_abort);
2560 if (options) {
2561 if (!qemu_opts_do_parse(opts, options, NULL, &local_err)) {
2562 error_report_err(local_err);
2563 ret = -1;
2564 goto out;
2568 qemu_opt_set_number(opts, BLOCK_OPT_SIZE,
2569 s.total_sectors * BDRV_SECTOR_SIZE, &error_abort);
2570 ret = add_old_style_options(out_fmt, opts, out_baseimg, backing_fmt);
2571 if (ret < 0) {
2572 goto out;
2576 /* Get backing file name if -o backing_file was used */
2577 out_baseimg_param = qemu_opt_get(opts, BLOCK_OPT_BACKING_FILE);
2578 if (out_baseimg_param) {
2579 out_baseimg = out_baseimg_param;
2581 s.target_has_backing = (bool) out_baseimg;
2583 if (s.has_zero_init && s.target_has_backing) {
2584 error_report("Cannot use --target-is-zero when the destination "
2585 "image has a backing file");
2586 goto out;
2589 if (s.src_num > 1 && out_baseimg) {
2590 error_report("Having a backing file for the target makes no sense when "
2591 "concatenating multiple input images");
2592 ret = -1;
2593 goto out;
2596 if (out_baseimg_param) {
2597 if (!qemu_opt_get(opts, BLOCK_OPT_BACKING_FMT)) {
2598 error_report("Use of backing file requires explicit "
2599 "backing format");
2600 ret = -1;
2601 goto out;
2605 /* Check if compression is supported */
2606 if (s.compressed) {
2607 bool encryption =
2608 qemu_opt_get_bool(opts, BLOCK_OPT_ENCRYPT, false);
2609 const char *encryptfmt =
2610 qemu_opt_get(opts, BLOCK_OPT_ENCRYPT_FORMAT);
2611 const char *preallocation =
2612 qemu_opt_get(opts, BLOCK_OPT_PREALLOC);
2614 if (drv && !block_driver_can_compress(drv)) {
2615 error_report("Compression not supported for this file format");
2616 ret = -1;
2617 goto out;
2620 if (encryption || encryptfmt) {
2621 error_report("Compression and encryption not supported at "
2622 "the same time");
2623 ret = -1;
2624 goto out;
2627 if (preallocation
2628 && strcmp(preallocation, "off"))
2630 error_report("Compression and preallocation not supported at "
2631 "the same time");
2632 ret = -1;
2633 goto out;
2637 /* Determine if bitmaps need copying */
2638 if (bitmaps) {
2639 if (s.src_num > 1) {
2640 error_report("Copying bitmaps only possible with single source");
2641 ret = -1;
2642 goto out;
2644 ret = convert_check_bitmaps(blk_bs(s.src[0]), skip_broken);
2645 if (ret < 0) {
2646 goto out;
2651 * The later open call will need any decryption secrets, and
2652 * bdrv_create() will purge "opts", so extract them now before
2653 * they are lost.
2655 if (!skip_create) {
2656 open_opts = qdict_new();
2657 qemu_opt_foreach(opts, img_add_key_secrets, open_opts, &error_abort);
2659 /* Create the new image */
2660 ret = bdrv_create(drv, out_filename, opts, &local_err);
2661 if (ret < 0) {
2662 error_reportf_err(local_err, "%s: error while converting %s: ",
2663 out_filename, out_fmt);
2664 goto out;
2668 s.target_is_new = !skip_create;
2670 flags = s.min_sparse ? (BDRV_O_RDWR | BDRV_O_UNMAP) : BDRV_O_RDWR;
2671 ret = bdrv_parse_cache_mode(cache, &flags, &writethrough);
2672 if (ret < 0) {
2673 error_report("Invalid cache option: %s", cache);
2674 goto out;
2677 if (flags & BDRV_O_NOCACHE) {
2679 * If we open the target with O_DIRECT, it may be necessary to
2680 * extend its size to align to the physical sector size.
2682 flags |= BDRV_O_RESIZE;
2685 if (skip_create) {
2686 s.target = img_open(tgt_image_opts, out_filename, out_fmt,
2687 flags, writethrough, s.quiet, false);
2688 } else {
2689 /* TODO ultimately we should allow --target-image-opts
2690 * to be used even when -n is not given.
2691 * That has to wait for bdrv_create to be improved
2692 * to allow filenames in option syntax
2694 s.target = img_open_file(out_filename, open_opts, out_fmt,
2695 flags, writethrough, s.quiet, false);
2696 open_opts = NULL; /* blk_new_open will have freed it */
2698 if (!s.target) {
2699 ret = -1;
2700 goto out;
2702 out_bs = blk_bs(s.target);
2704 if (bitmaps && !bdrv_supports_persistent_dirty_bitmap(out_bs)) {
2705 error_report("Format driver '%s' does not support bitmaps",
2706 out_bs->drv->format_name);
2707 ret = -1;
2708 goto out;
2711 if (s.compressed && !block_driver_can_compress(out_bs->drv)) {
2712 error_report("Compression not supported for this file format");
2713 ret = -1;
2714 goto out;
2717 /* increase bufsectors from the default 4096 (2M) if opt_transfer
2718 * or discard_alignment of the out_bs is greater. Limit to
2719 * MAX_BUF_SECTORS as maximum which is currently 32768 (16MB). */
2720 s.buf_sectors = MIN(MAX_BUF_SECTORS,
2721 MAX(s.buf_sectors,
2722 MAX(out_bs->bl.opt_transfer >> BDRV_SECTOR_BITS,
2723 out_bs->bl.pdiscard_alignment >>
2724 BDRV_SECTOR_BITS)));
2726 /* try to align the write requests to the destination to avoid unnecessary
2727 * RMW cycles. */
2728 s.alignment = MAX(pow2floor(s.min_sparse),
2729 DIV_ROUND_UP(out_bs->bl.request_alignment,
2730 BDRV_SECTOR_SIZE));
2731 assert(is_power_of_2(s.alignment));
2733 if (skip_create) {
2734 int64_t output_sectors = blk_nb_sectors(s.target);
2735 if (output_sectors < 0) {
2736 error_report("unable to get output image length: %s",
2737 strerror(-output_sectors));
2738 ret = -1;
2739 goto out;
2740 } else if (output_sectors < s.total_sectors) {
2741 error_report("output file is smaller than input file");
2742 ret = -1;
2743 goto out;
2747 if (s.target_has_backing && s.target_is_new) {
2748 /* Errors are treated as "backing length unknown" (which means
2749 * s.target_backing_sectors has to be negative, which it will
2750 * be automatically). The backing file length is used only
2751 * for optimizations, so such a case is not fatal. */
2752 s.target_backing_sectors =
2753 bdrv_nb_sectors(bdrv_backing_chain_next(out_bs));
2754 } else {
2755 s.target_backing_sectors = -1;
2758 ret = bdrv_get_info(out_bs, &bdi);
2759 if (ret < 0) {
2760 if (s.compressed) {
2761 error_report("could not get block driver info");
2762 goto out;
2764 } else {
2765 s.compressed = s.compressed || bdi.needs_compressed_writes;
2766 s.cluster_sectors = bdi.cluster_size / BDRV_SECTOR_SIZE;
2769 if (rate_limit) {
2770 set_rate_limit(s.target, rate_limit);
2773 ret = convert_do_copy(&s);
2775 /* Now copy the bitmaps */
2776 if (bitmaps && ret == 0) {
2777 ret = convert_copy_bitmaps(blk_bs(s.src[0]), out_bs, skip_broken);
2780 out:
2781 if (!ret) {
2782 qemu_progress_print(100, 0);
2784 qemu_progress_end();
2785 qemu_opts_del(opts);
2786 qemu_opts_free(create_opts);
2787 qobject_unref(open_opts);
2788 blk_unref(s.target);
2789 if (s.src) {
2790 for (bs_i = 0; bs_i < s.src_num; bs_i++) {
2791 blk_unref(s.src[bs_i]);
2793 g_free(s.src);
2795 g_free(s.src_sectors);
2796 g_free(s.src_alignment);
2797 fail_getopt:
2798 qemu_opts_del(sn_opts);
2799 g_free(options);
2801 return !!ret;
2805 static void dump_snapshots(BlockDriverState *bs)
2807 QEMUSnapshotInfo *sn_tab, *sn;
2808 int nb_sns, i;
2810 nb_sns = bdrv_snapshot_list(bs, &sn_tab);
2811 if (nb_sns <= 0)
2812 return;
2813 printf("Snapshot list:\n");
2814 bdrv_snapshot_dump(NULL);
2815 printf("\n");
2816 for(i = 0; i < nb_sns; i++) {
2817 sn = &sn_tab[i];
2818 bdrv_snapshot_dump(sn);
2819 printf("\n");
2821 g_free(sn_tab);
2824 static void dump_json_block_graph_info_list(BlockGraphInfoList *list)
2826 GString *str;
2827 QObject *obj;
2828 Visitor *v = qobject_output_visitor_new(&obj);
2830 visit_type_BlockGraphInfoList(v, NULL, &list, &error_abort);
2831 visit_complete(v, &obj);
2832 str = qobject_to_json_pretty(obj, true);
2833 assert(str != NULL);
2834 printf("%s\n", str->str);
2835 qobject_unref(obj);
2836 visit_free(v);
2837 g_string_free(str, true);
2840 static void dump_json_block_graph_info(BlockGraphInfo *info)
2842 GString *str;
2843 QObject *obj;
2844 Visitor *v = qobject_output_visitor_new(&obj);
2846 visit_type_BlockGraphInfo(v, NULL, &info, &error_abort);
2847 visit_complete(v, &obj);
2848 str = qobject_to_json_pretty(obj, true);
2849 assert(str != NULL);
2850 printf("%s\n", str->str);
2851 qobject_unref(obj);
2852 visit_free(v);
2853 g_string_free(str, true);
2856 static void dump_human_image_info(BlockGraphInfo *info, int indentation,
2857 const char *path)
2859 BlockChildInfoList *children_list;
2861 bdrv_node_info_dump(qapi_BlockGraphInfo_base(info), indentation,
2862 info->children == NULL);
2864 for (children_list = info->children; children_list;
2865 children_list = children_list->next)
2867 BlockChildInfo *child = children_list->value;
2868 g_autofree char *child_path = NULL;
2870 printf("%*sChild node '%s%s':\n",
2871 indentation * 4, "", path, child->name);
2872 child_path = g_strdup_printf("%s%s/", path, child->name);
2873 dump_human_image_info(child->info, indentation + 1, child_path);
2877 static void dump_human_image_info_list(BlockGraphInfoList *list)
2879 BlockGraphInfoList *elem;
2880 bool delim = false;
2882 for (elem = list; elem; elem = elem->next) {
2883 if (delim) {
2884 printf("\n");
2886 delim = true;
2888 dump_human_image_info(elem->value, 0, "/");
2892 static gboolean str_equal_func(gconstpointer a, gconstpointer b)
2894 return strcmp(a, b) == 0;
2898 * Open an image file chain and return an BlockGraphInfoList
2900 * @filename: topmost image filename
2901 * @fmt: topmost image format (may be NULL to autodetect)
2902 * @chain: true - enumerate entire backing file chain
2903 * false - only topmost image file
2905 * Returns a list of BlockNodeInfo objects or NULL if there was an error
2906 * opening an image file. If there was an error a message will have been
2907 * printed to stderr.
2909 static BlockGraphInfoList *collect_image_info_list(bool image_opts,
2910 const char *filename,
2911 const char *fmt,
2912 bool chain, bool force_share)
2914 BlockGraphInfoList *head = NULL;
2915 BlockGraphInfoList **tail = &head;
2916 GHashTable *filenames;
2917 Error *err = NULL;
2919 filenames = g_hash_table_new_full(g_str_hash, str_equal_func, NULL, NULL);
2921 while (filename) {
2922 BlockBackend *blk;
2923 BlockDriverState *bs;
2924 BlockGraphInfo *info;
2926 if (g_hash_table_lookup_extended(filenames, filename, NULL, NULL)) {
2927 error_report("Backing file '%s' creates an infinite loop.",
2928 filename);
2929 goto err;
2931 g_hash_table_insert(filenames, (gpointer)filename, NULL);
2933 blk = img_open(image_opts, filename, fmt,
2934 BDRV_O_NO_BACKING | BDRV_O_NO_IO, false, false,
2935 force_share);
2936 if (!blk) {
2937 goto err;
2939 bs = blk_bs(blk);
2942 * Note that the returned BlockGraphInfo object will not have
2943 * information about this image's backing node, because we have opened
2944 * it with BDRV_O_NO_BACKING. Printing this object will therefore not
2945 * duplicate the backing chain information that we obtain by walking
2946 * the chain manually here.
2948 bdrv_graph_rdlock_main_loop();
2949 bdrv_query_block_graph_info(bs, &info, &err);
2950 bdrv_graph_rdunlock_main_loop();
2952 if (err) {
2953 error_report_err(err);
2954 blk_unref(blk);
2955 goto err;
2958 QAPI_LIST_APPEND(tail, info);
2960 blk_unref(blk);
2962 /* Clear parameters that only apply to the topmost image */
2963 filename = fmt = NULL;
2964 image_opts = false;
2966 if (chain) {
2967 if (info->full_backing_filename) {
2968 filename = info->full_backing_filename;
2969 } else if (info->backing_filename) {
2970 error_report("Could not determine absolute backing filename,"
2971 " but backing filename '%s' present",
2972 info->backing_filename);
2973 goto err;
2975 if (info->backing_filename_format) {
2976 fmt = info->backing_filename_format;
2980 g_hash_table_destroy(filenames);
2981 return head;
2983 err:
2984 qapi_free_BlockGraphInfoList(head);
2985 g_hash_table_destroy(filenames);
2986 return NULL;
2989 static int img_info(int argc, char **argv)
2991 int c;
2992 OutputFormat output_format = OFORMAT_HUMAN;
2993 bool chain = false;
2994 const char *filename, *fmt, *output;
2995 BlockGraphInfoList *list;
2996 bool image_opts = false;
2997 bool force_share = false;
2999 fmt = NULL;
3000 output = NULL;
3001 for(;;) {
3002 int option_index = 0;
3003 static const struct option long_options[] = {
3004 {"help", no_argument, 0, 'h'},
3005 {"format", required_argument, 0, 'f'},
3006 {"output", required_argument, 0, OPTION_OUTPUT},
3007 {"backing-chain", no_argument, 0, OPTION_BACKING_CHAIN},
3008 {"object", required_argument, 0, OPTION_OBJECT},
3009 {"image-opts", no_argument, 0, OPTION_IMAGE_OPTS},
3010 {"force-share", no_argument, 0, 'U'},
3011 {0, 0, 0, 0}
3013 c = getopt_long(argc, argv, ":f:hU",
3014 long_options, &option_index);
3015 if (c == -1) {
3016 break;
3018 switch(c) {
3019 case ':':
3020 missing_argument(argv[optind - 1]);
3021 break;
3022 case '?':
3023 unrecognized_option(argv[optind - 1]);
3024 break;
3025 case 'h':
3026 help();
3027 break;
3028 case 'f':
3029 fmt = optarg;
3030 break;
3031 case 'U':
3032 force_share = true;
3033 break;
3034 case OPTION_OUTPUT:
3035 output = optarg;
3036 break;
3037 case OPTION_BACKING_CHAIN:
3038 chain = true;
3039 break;
3040 case OPTION_OBJECT:
3041 user_creatable_process_cmdline(optarg);
3042 break;
3043 case OPTION_IMAGE_OPTS:
3044 image_opts = true;
3045 break;
3048 if (optind != argc - 1) {
3049 error_exit("Expecting one image file name");
3051 filename = argv[optind++];
3053 if (output && !strcmp(output, "json")) {
3054 output_format = OFORMAT_JSON;
3055 } else if (output && !strcmp(output, "human")) {
3056 output_format = OFORMAT_HUMAN;
3057 } else if (output) {
3058 error_report("--output must be used with human or json as argument.");
3059 return 1;
3062 list = collect_image_info_list(image_opts, filename, fmt, chain,
3063 force_share);
3064 if (!list) {
3065 return 1;
3068 switch (output_format) {
3069 case OFORMAT_HUMAN:
3070 dump_human_image_info_list(list);
3071 break;
3072 case OFORMAT_JSON:
3073 if (chain) {
3074 dump_json_block_graph_info_list(list);
3075 } else {
3076 dump_json_block_graph_info(list->value);
3078 break;
3081 qapi_free_BlockGraphInfoList(list);
3082 return 0;
3085 static int dump_map_entry(OutputFormat output_format, MapEntry *e,
3086 MapEntry *next)
3088 switch (output_format) {
3089 case OFORMAT_HUMAN:
3090 if (e->data && !e->has_offset) {
3091 error_report("File contains external, encrypted or compressed clusters.");
3092 return -1;
3094 if (e->data && !e->zero) {
3095 printf("%#-16"PRIx64"%#-16"PRIx64"%#-16"PRIx64"%s\n",
3096 e->start, e->length,
3097 e->has_offset ? e->offset : 0,
3098 e->filename ?: "");
3100 /* This format ignores the distinction between 0, ZERO and ZERO|DATA.
3101 * Modify the flags here to allow more coalescing.
3103 if (next && (!next->data || next->zero)) {
3104 next->data = false;
3105 next->zero = true;
3107 break;
3108 case OFORMAT_JSON:
3109 printf("{ \"start\": %"PRId64", \"length\": %"PRId64","
3110 " \"depth\": %"PRId64", \"present\": %s, \"zero\": %s,"
3111 " \"data\": %s, \"compressed\": %s",
3112 e->start, e->length, e->depth,
3113 e->present ? "true" : "false",
3114 e->zero ? "true" : "false",
3115 e->data ? "true" : "false",
3116 e->compressed ? "true" : "false");
3117 if (e->has_offset) {
3118 printf(", \"offset\": %"PRId64"", e->offset);
3120 putchar('}');
3122 if (next) {
3123 puts(",");
3125 break;
3127 return 0;
3130 static int get_block_status(BlockDriverState *bs, int64_t offset,
3131 int64_t bytes, MapEntry *e)
3133 int ret;
3134 int depth;
3135 BlockDriverState *file;
3136 bool has_offset;
3137 int64_t map;
3138 char *filename = NULL;
3140 /* As an optimization, we could cache the current range of unallocated
3141 * clusters in each file of the chain, and avoid querying the same
3142 * range repeatedly.
3145 depth = 0;
3146 for (;;) {
3147 bs = bdrv_skip_filters(bs);
3148 ret = bdrv_block_status(bs, offset, bytes, &bytes, &map, &file);
3149 if (ret < 0) {
3150 return ret;
3152 assert(bytes);
3153 if (ret & (BDRV_BLOCK_ZERO|BDRV_BLOCK_DATA)) {
3154 break;
3156 bs = bdrv_cow_bs(bs);
3157 if (bs == NULL) {
3158 ret = 0;
3159 break;
3162 depth++;
3165 has_offset = !!(ret & BDRV_BLOCK_OFFSET_VALID);
3167 if (file && has_offset) {
3168 bdrv_graph_rdlock_main_loop();
3169 bdrv_refresh_filename(file);
3170 bdrv_graph_rdunlock_main_loop();
3171 filename = file->filename;
3174 *e = (MapEntry) {
3175 .start = offset,
3176 .length = bytes,
3177 .data = !!(ret & BDRV_BLOCK_DATA),
3178 .zero = !!(ret & BDRV_BLOCK_ZERO),
3179 .compressed = !!(ret & BDRV_BLOCK_COMPRESSED),
3180 .offset = map,
3181 .has_offset = has_offset,
3182 .depth = depth,
3183 .present = !!(ret & BDRV_BLOCK_ALLOCATED),
3184 .filename = filename,
3187 return 0;
3190 static inline bool entry_mergeable(const MapEntry *curr, const MapEntry *next)
3192 if (curr->length == 0) {
3193 return false;
3195 if (curr->zero != next->zero ||
3196 curr->data != next->data ||
3197 curr->compressed != next->compressed ||
3198 curr->depth != next->depth ||
3199 curr->present != next->present ||
3200 !curr->filename != !next->filename ||
3201 curr->has_offset != next->has_offset) {
3202 return false;
3204 if (curr->filename && strcmp(curr->filename, next->filename)) {
3205 return false;
3207 if (curr->has_offset && curr->offset + curr->length != next->offset) {
3208 return false;
3210 return true;
3213 static int img_map(int argc, char **argv)
3215 int c;
3216 OutputFormat output_format = OFORMAT_HUMAN;
3217 BlockBackend *blk;
3218 BlockDriverState *bs;
3219 const char *filename, *fmt, *output;
3220 int64_t length;
3221 MapEntry curr = { .length = 0 }, next;
3222 int ret = 0;
3223 bool image_opts = false;
3224 bool force_share = false;
3225 int64_t start_offset = 0;
3226 int64_t max_length = -1;
3228 fmt = NULL;
3229 output = NULL;
3230 for (;;) {
3231 int option_index = 0;
3232 static const struct option long_options[] = {
3233 {"help", no_argument, 0, 'h'},
3234 {"format", required_argument, 0, 'f'},
3235 {"output", required_argument, 0, OPTION_OUTPUT},
3236 {"object", required_argument, 0, OPTION_OBJECT},
3237 {"image-opts", no_argument, 0, OPTION_IMAGE_OPTS},
3238 {"force-share", no_argument, 0, 'U'},
3239 {"start-offset", required_argument, 0, 's'},
3240 {"max-length", required_argument, 0, 'l'},
3241 {0, 0, 0, 0}
3243 c = getopt_long(argc, argv, ":f:s:l:hU",
3244 long_options, &option_index);
3245 if (c == -1) {
3246 break;
3248 switch (c) {
3249 case ':':
3250 missing_argument(argv[optind - 1]);
3251 break;
3252 case '?':
3253 unrecognized_option(argv[optind - 1]);
3254 break;
3255 case 'h':
3256 help();
3257 break;
3258 case 'f':
3259 fmt = optarg;
3260 break;
3261 case 'U':
3262 force_share = true;
3263 break;
3264 case OPTION_OUTPUT:
3265 output = optarg;
3266 break;
3267 case 's':
3268 start_offset = cvtnum("start offset", optarg);
3269 if (start_offset < 0) {
3270 return 1;
3272 break;
3273 case 'l':
3274 max_length = cvtnum("max length", optarg);
3275 if (max_length < 0) {
3276 return 1;
3278 break;
3279 case OPTION_OBJECT:
3280 user_creatable_process_cmdline(optarg);
3281 break;
3282 case OPTION_IMAGE_OPTS:
3283 image_opts = true;
3284 break;
3287 if (optind != argc - 1) {
3288 error_exit("Expecting one image file name");
3290 filename = argv[optind];
3292 if (output && !strcmp(output, "json")) {
3293 output_format = OFORMAT_JSON;
3294 } else if (output && !strcmp(output, "human")) {
3295 output_format = OFORMAT_HUMAN;
3296 } else if (output) {
3297 error_report("--output must be used with human or json as argument.");
3298 return 1;
3301 blk = img_open(image_opts, filename, fmt, 0, false, false, force_share);
3302 if (!blk) {
3303 return 1;
3305 bs = blk_bs(blk);
3307 if (output_format == OFORMAT_HUMAN) {
3308 printf("%-16s%-16s%-16s%s\n", "Offset", "Length", "Mapped to", "File");
3309 } else if (output_format == OFORMAT_JSON) {
3310 putchar('[');
3313 length = blk_getlength(blk);
3314 if (length < 0) {
3315 error_report("Failed to get size for '%s'", filename);
3316 return 1;
3318 if (max_length != -1) {
3319 length = MIN(start_offset + max_length, length);
3322 curr.start = start_offset;
3323 while (curr.start + curr.length < length) {
3324 int64_t offset = curr.start + curr.length;
3325 int64_t n = length - offset;
3327 ret = get_block_status(bs, offset, n, &next);
3328 if (ret < 0) {
3329 error_report("Could not read file metadata: %s", strerror(-ret));
3330 goto out;
3333 if (entry_mergeable(&curr, &next)) {
3334 curr.length += next.length;
3335 continue;
3338 if (curr.length > 0) {
3339 ret = dump_map_entry(output_format, &curr, &next);
3340 if (ret < 0) {
3341 goto out;
3344 curr = next;
3347 ret = dump_map_entry(output_format, &curr, NULL);
3348 if (output_format == OFORMAT_JSON) {
3349 puts("]");
3352 out:
3353 blk_unref(blk);
3354 return ret < 0;
3357 #define SNAPSHOT_LIST 1
3358 #define SNAPSHOT_CREATE 2
3359 #define SNAPSHOT_APPLY 3
3360 #define SNAPSHOT_DELETE 4
3362 static int img_snapshot(int argc, char **argv)
3364 BlockBackend *blk;
3365 BlockDriverState *bs;
3366 QEMUSnapshotInfo sn;
3367 char *filename, *snapshot_name = NULL;
3368 int c, ret = 0, bdrv_oflags;
3369 int action = 0;
3370 bool quiet = false;
3371 Error *err = NULL;
3372 bool image_opts = false;
3373 bool force_share = false;
3374 int64_t rt;
3376 bdrv_oflags = BDRV_O_RDWR;
3377 /* Parse commandline parameters */
3378 for(;;) {
3379 static const struct option long_options[] = {
3380 {"help", no_argument, 0, 'h'},
3381 {"object", required_argument, 0, OPTION_OBJECT},
3382 {"image-opts", no_argument, 0, OPTION_IMAGE_OPTS},
3383 {"force-share", no_argument, 0, 'U'},
3384 {0, 0, 0, 0}
3386 c = getopt_long(argc, argv, ":la:c:d:hqU",
3387 long_options, NULL);
3388 if (c == -1) {
3389 break;
3391 switch(c) {
3392 case ':':
3393 missing_argument(argv[optind - 1]);
3394 break;
3395 case '?':
3396 unrecognized_option(argv[optind - 1]);
3397 break;
3398 case 'h':
3399 help();
3400 return 0;
3401 case 'l':
3402 if (action) {
3403 error_exit("Cannot mix '-l', '-a', '-c', '-d'");
3404 return 0;
3406 action = SNAPSHOT_LIST;
3407 bdrv_oflags &= ~BDRV_O_RDWR; /* no need for RW */
3408 break;
3409 case 'a':
3410 if (action) {
3411 error_exit("Cannot mix '-l', '-a', '-c', '-d'");
3412 return 0;
3414 action = SNAPSHOT_APPLY;
3415 snapshot_name = optarg;
3416 break;
3417 case 'c':
3418 if (action) {
3419 error_exit("Cannot mix '-l', '-a', '-c', '-d'");
3420 return 0;
3422 action = SNAPSHOT_CREATE;
3423 snapshot_name = optarg;
3424 break;
3425 case 'd':
3426 if (action) {
3427 error_exit("Cannot mix '-l', '-a', '-c', '-d'");
3428 return 0;
3430 action = SNAPSHOT_DELETE;
3431 snapshot_name = optarg;
3432 break;
3433 case 'q':
3434 quiet = true;
3435 break;
3436 case 'U':
3437 force_share = true;
3438 break;
3439 case OPTION_OBJECT:
3440 user_creatable_process_cmdline(optarg);
3441 break;
3442 case OPTION_IMAGE_OPTS:
3443 image_opts = true;
3444 break;
3448 if (optind != argc - 1) {
3449 error_exit("Expecting one image file name");
3451 filename = argv[optind++];
3453 /* Open the image */
3454 blk = img_open(image_opts, filename, NULL, bdrv_oflags, false, quiet,
3455 force_share);
3456 if (!blk) {
3457 return 1;
3459 bs = blk_bs(blk);
3461 /* Perform the requested action */
3462 switch(action) {
3463 case SNAPSHOT_LIST:
3464 dump_snapshots(bs);
3465 break;
3467 case SNAPSHOT_CREATE:
3468 memset(&sn, 0, sizeof(sn));
3469 pstrcpy(sn.name, sizeof(sn.name), snapshot_name);
3471 rt = g_get_real_time();
3472 sn.date_sec = rt / G_USEC_PER_SEC;
3473 sn.date_nsec = (rt % G_USEC_PER_SEC) * 1000;
3475 bdrv_graph_rdlock_main_loop();
3476 ret = bdrv_snapshot_create(bs, &sn);
3477 bdrv_graph_rdunlock_main_loop();
3479 if (ret) {
3480 error_report("Could not create snapshot '%s': %s",
3481 snapshot_name, strerror(-ret));
3483 break;
3485 case SNAPSHOT_APPLY:
3486 ret = bdrv_snapshot_goto(bs, snapshot_name, &err);
3487 if (ret) {
3488 error_reportf_err(err, "Could not apply snapshot '%s': ",
3489 snapshot_name);
3491 break;
3493 case SNAPSHOT_DELETE:
3494 bdrv_graph_rdlock_main_loop();
3495 ret = bdrv_snapshot_find(bs, &sn, snapshot_name);
3496 if (ret < 0) {
3497 error_report("Could not delete snapshot '%s': snapshot not "
3498 "found", snapshot_name);
3499 ret = 1;
3500 } else {
3501 ret = bdrv_snapshot_delete(bs, sn.id_str, sn.name, &err);
3502 if (ret < 0) {
3503 error_reportf_err(err, "Could not delete snapshot '%s': ",
3504 snapshot_name);
3505 ret = 1;
3508 bdrv_graph_rdunlock_main_loop();
3509 break;
3512 /* Cleanup */
3513 blk_unref(blk);
3514 if (ret) {
3515 return 1;
3517 return 0;
3520 static int img_rebase(int argc, char **argv)
3522 BlockBackend *blk = NULL, *blk_old_backing = NULL, *blk_new_backing = NULL;
3523 uint8_t *buf_old = NULL;
3524 uint8_t *buf_new = NULL;
3525 BlockDriverState *bs = NULL, *prefix_chain_bs = NULL;
3526 BlockDriverState *unfiltered_bs;
3527 char *filename;
3528 const char *fmt, *cache, *src_cache, *out_basefmt, *out_baseimg;
3529 int c, flags, src_flags, ret;
3530 bool writethrough, src_writethrough;
3531 int unsafe = 0;
3532 bool force_share = false;
3533 int progress = 0;
3534 bool quiet = false;
3535 Error *local_err = NULL;
3536 bool image_opts = false;
3538 /* Parse commandline parameters */
3539 fmt = NULL;
3540 cache = BDRV_DEFAULT_CACHE;
3541 src_cache = BDRV_DEFAULT_CACHE;
3542 out_baseimg = NULL;
3543 out_basefmt = NULL;
3544 for(;;) {
3545 static const struct option long_options[] = {
3546 {"help", no_argument, 0, 'h'},
3547 {"object", required_argument, 0, OPTION_OBJECT},
3548 {"image-opts", no_argument, 0, OPTION_IMAGE_OPTS},
3549 {"force-share", no_argument, 0, 'U'},
3550 {0, 0, 0, 0}
3552 c = getopt_long(argc, argv, ":hf:F:b:upt:T:qU",
3553 long_options, NULL);
3554 if (c == -1) {
3555 break;
3557 switch(c) {
3558 case ':':
3559 missing_argument(argv[optind - 1]);
3560 break;
3561 case '?':
3562 unrecognized_option(argv[optind - 1]);
3563 break;
3564 case 'h':
3565 help();
3566 return 0;
3567 case 'f':
3568 fmt = optarg;
3569 break;
3570 case 'F':
3571 out_basefmt = optarg;
3572 break;
3573 case 'b':
3574 out_baseimg = optarg;
3575 break;
3576 case 'u':
3577 unsafe = 1;
3578 break;
3579 case 'p':
3580 progress = 1;
3581 break;
3582 case 't':
3583 cache = optarg;
3584 break;
3585 case 'T':
3586 src_cache = optarg;
3587 break;
3588 case 'q':
3589 quiet = true;
3590 break;
3591 case OPTION_OBJECT:
3592 user_creatable_process_cmdline(optarg);
3593 break;
3594 case OPTION_IMAGE_OPTS:
3595 image_opts = true;
3596 break;
3597 case 'U':
3598 force_share = true;
3599 break;
3603 if (quiet) {
3604 progress = 0;
3607 if (optind != argc - 1) {
3608 error_exit("Expecting one image file name");
3610 if (!unsafe && !out_baseimg) {
3611 error_exit("Must specify backing file (-b) or use unsafe mode (-u)");
3613 filename = argv[optind++];
3615 qemu_progress_init(progress, 2.0);
3616 qemu_progress_print(0, 100);
3618 flags = BDRV_O_RDWR | (unsafe ? BDRV_O_NO_BACKING : 0);
3619 ret = bdrv_parse_cache_mode(cache, &flags, &writethrough);
3620 if (ret < 0) {
3621 error_report("Invalid cache option: %s", cache);
3622 goto out;
3625 src_flags = 0;
3626 ret = bdrv_parse_cache_mode(src_cache, &src_flags, &src_writethrough);
3627 if (ret < 0) {
3628 error_report("Invalid source cache option: %s", src_cache);
3629 goto out;
3632 /* The source files are opened read-only, don't care about WCE */
3633 assert((src_flags & BDRV_O_RDWR) == 0);
3634 (void) src_writethrough;
3637 * Open the images.
3639 * Ignore the old backing file for unsafe rebase in case we want to correct
3640 * the reference to a renamed or moved backing file.
3642 blk = img_open(image_opts, filename, fmt, flags, writethrough, quiet,
3643 false);
3644 if (!blk) {
3645 ret = -1;
3646 goto out;
3648 bs = blk_bs(blk);
3650 unfiltered_bs = bdrv_skip_filters(bs);
3652 if (out_basefmt != NULL) {
3653 if (bdrv_find_format(out_basefmt) == NULL) {
3654 error_report("Invalid format name: '%s'", out_basefmt);
3655 ret = -1;
3656 goto out;
3660 /* For safe rebasing we need to compare old and new backing file */
3661 if (!unsafe) {
3662 QDict *options = NULL;
3663 BlockDriverState *base_bs = bdrv_cow_bs(unfiltered_bs);
3665 if (base_bs) {
3666 blk_old_backing = blk_new(qemu_get_aio_context(),
3667 BLK_PERM_CONSISTENT_READ,
3668 BLK_PERM_ALL);
3669 ret = blk_insert_bs(blk_old_backing, base_bs,
3670 &local_err);
3671 if (ret < 0) {
3672 error_reportf_err(local_err,
3673 "Could not reuse old backing file '%s': ",
3674 base_bs->filename);
3675 goto out;
3677 } else {
3678 blk_old_backing = NULL;
3681 if (out_baseimg[0]) {
3682 const char *overlay_filename;
3683 char *out_real_path;
3685 options = qdict_new();
3686 if (out_basefmt) {
3687 qdict_put_str(options, "driver", out_basefmt);
3689 if (force_share) {
3690 qdict_put_bool(options, BDRV_OPT_FORCE_SHARE, true);
3693 bdrv_graph_rdlock_main_loop();
3694 bdrv_refresh_filename(bs);
3695 bdrv_graph_rdunlock_main_loop();
3696 overlay_filename = bs->exact_filename[0] ? bs->exact_filename
3697 : bs->filename;
3698 out_real_path =
3699 bdrv_get_full_backing_filename_from_filename(overlay_filename,
3700 out_baseimg,
3701 &local_err);
3702 if (local_err) {
3703 qobject_unref(options);
3704 error_reportf_err(local_err,
3705 "Could not resolve backing filename: ");
3706 ret = -1;
3707 goto out;
3711 * Find out whether we rebase an image on top of a previous image
3712 * in its chain.
3714 prefix_chain_bs = bdrv_find_backing_image(bs, out_real_path);
3715 if (prefix_chain_bs) {
3716 qobject_unref(options);
3717 g_free(out_real_path);
3719 blk_new_backing = blk_new(qemu_get_aio_context(),
3720 BLK_PERM_CONSISTENT_READ,
3721 BLK_PERM_ALL);
3722 ret = blk_insert_bs(blk_new_backing, prefix_chain_bs,
3723 &local_err);
3724 if (ret < 0) {
3725 error_reportf_err(local_err,
3726 "Could not reuse backing file '%s': ",
3727 out_baseimg);
3728 goto out;
3730 } else {
3731 blk_new_backing = blk_new_open(out_real_path, NULL,
3732 options, src_flags, &local_err);
3733 g_free(out_real_path);
3734 if (!blk_new_backing) {
3735 error_reportf_err(local_err,
3736 "Could not open new backing file '%s': ",
3737 out_baseimg);
3738 ret = -1;
3739 goto out;
3746 * Check each unallocated cluster in the COW file. If it is unallocated,
3747 * accesses go to the backing file. We must therefore compare this cluster
3748 * in the old and new backing file, and if they differ we need to copy it
3749 * from the old backing file into the COW file.
3751 * If qemu-img crashes during this step, no harm is done. The content of
3752 * the image is the same as the original one at any time.
3754 if (!unsafe) {
3755 int64_t size;
3756 int64_t old_backing_size = 0;
3757 int64_t new_backing_size = 0;
3758 uint64_t offset;
3759 int64_t n;
3760 float local_progress = 0;
3762 buf_old = blk_blockalign(blk, IO_BUF_SIZE);
3763 buf_new = blk_blockalign(blk, IO_BUF_SIZE);
3765 size = blk_getlength(blk);
3766 if (size < 0) {
3767 error_report("Could not get size of '%s': %s",
3768 filename, strerror(-size));
3769 ret = -1;
3770 goto out;
3772 if (blk_old_backing) {
3773 old_backing_size = blk_getlength(blk_old_backing);
3774 if (old_backing_size < 0) {
3775 char backing_name[PATH_MAX];
3777 bdrv_get_backing_filename(bs, backing_name,
3778 sizeof(backing_name));
3779 error_report("Could not get size of '%s': %s",
3780 backing_name, strerror(-old_backing_size));
3781 ret = -1;
3782 goto out;
3785 if (blk_new_backing) {
3786 new_backing_size = blk_getlength(blk_new_backing);
3787 if (new_backing_size < 0) {
3788 error_report("Could not get size of '%s': %s",
3789 out_baseimg, strerror(-new_backing_size));
3790 ret = -1;
3791 goto out;
3795 if (size != 0) {
3796 local_progress = (float)100 / (size / MIN(size, IO_BUF_SIZE));
3799 for (offset = 0; offset < size; offset += n) {
3800 bool buf_old_is_zero = false;
3802 /* How many bytes can we handle with the next read? */
3803 n = MIN(IO_BUF_SIZE, size - offset);
3805 /* If the cluster is allocated, we don't need to take action */
3806 ret = bdrv_is_allocated(unfiltered_bs, offset, n, &n);
3807 if (ret < 0) {
3808 error_report("error while reading image metadata: %s",
3809 strerror(-ret));
3810 goto out;
3812 if (ret) {
3813 continue;
3816 if (prefix_chain_bs) {
3818 * If cluster wasn't changed since prefix_chain, we don't need
3819 * to take action
3821 ret = bdrv_is_allocated_above(bdrv_cow_bs(unfiltered_bs),
3822 prefix_chain_bs, false,
3823 offset, n, &n);
3824 if (ret < 0) {
3825 error_report("error while reading image metadata: %s",
3826 strerror(-ret));
3827 goto out;
3829 if (!ret) {
3830 continue;
3835 * Read old and new backing file and take into consideration that
3836 * backing files may be smaller than the COW image.
3838 if (offset >= old_backing_size) {
3839 memset(buf_old, 0, n);
3840 buf_old_is_zero = true;
3841 } else {
3842 if (offset + n > old_backing_size) {
3843 n = old_backing_size - offset;
3846 ret = blk_pread(blk_old_backing, offset, n, buf_old, 0);
3847 if (ret < 0) {
3848 error_report("error while reading from old backing file");
3849 goto out;
3853 if (offset >= new_backing_size || !blk_new_backing) {
3854 memset(buf_new, 0, n);
3855 } else {
3856 if (offset + n > new_backing_size) {
3857 n = new_backing_size - offset;
3860 ret = blk_pread(blk_new_backing, offset, n, buf_new, 0);
3861 if (ret < 0) {
3862 error_report("error while reading from new backing file");
3863 goto out;
3867 /* If they differ, we need to write to the COW file */
3868 uint64_t written = 0;
3870 while (written < n) {
3871 int64_t pnum;
3873 if (compare_buffers(buf_old + written, buf_new + written,
3874 n - written, &pnum))
3876 if (buf_old_is_zero) {
3877 ret = blk_pwrite_zeroes(blk, offset + written, pnum, 0);
3878 } else {
3879 ret = blk_pwrite(blk, offset + written, pnum,
3880 buf_old + written, 0);
3882 if (ret < 0) {
3883 error_report("Error while writing to COW image: %s",
3884 strerror(-ret));
3885 goto out;
3889 written += pnum;
3891 qemu_progress_print(local_progress, 100);
3896 * Change the backing file. All clusters that are different from the old
3897 * backing file are overwritten in the COW file now, so the visible content
3898 * doesn't change when we switch the backing file.
3900 if (out_baseimg && *out_baseimg) {
3901 ret = bdrv_change_backing_file(unfiltered_bs, out_baseimg, out_basefmt,
3902 true);
3903 } else {
3904 ret = bdrv_change_backing_file(unfiltered_bs, NULL, NULL, false);
3907 if (ret == -ENOSPC) {
3908 error_report("Could not change the backing file to '%s': No "
3909 "space left in the file header", out_baseimg);
3910 } else if (ret == -EINVAL && out_baseimg && !out_basefmt) {
3911 error_report("Could not change the backing file to '%s': backing "
3912 "format must be specified", out_baseimg);
3913 } else if (ret < 0) {
3914 error_report("Could not change the backing file to '%s': %s",
3915 out_baseimg, strerror(-ret));
3918 qemu_progress_print(100, 0);
3920 * TODO At this point it is possible to check if any clusters that are
3921 * allocated in the COW file are the same in the backing file. If so, they
3922 * could be dropped from the COW file. Don't do this before switching the
3923 * backing file, in case of a crash this would lead to corruption.
3925 out:
3926 qemu_progress_end();
3927 /* Cleanup */
3928 if (!unsafe) {
3929 blk_unref(blk_old_backing);
3930 blk_unref(blk_new_backing);
3932 qemu_vfree(buf_old);
3933 qemu_vfree(buf_new);
3935 blk_unref(blk);
3936 if (ret) {
3937 return 1;
3939 return 0;
3942 static int img_resize(int argc, char **argv)
3944 Error *err = NULL;
3945 int c, ret, relative;
3946 const char *filename, *fmt, *size;
3947 int64_t n, total_size, current_size;
3948 bool quiet = false;
3949 BlockBackend *blk = NULL;
3950 PreallocMode prealloc = PREALLOC_MODE_OFF;
3951 QemuOpts *param;
3953 static QemuOptsList resize_options = {
3954 .name = "resize_options",
3955 .head = QTAILQ_HEAD_INITIALIZER(resize_options.head),
3956 .desc = {
3958 .name = BLOCK_OPT_SIZE,
3959 .type = QEMU_OPT_SIZE,
3960 .help = "Virtual disk size"
3961 }, {
3962 /* end of list */
3966 bool image_opts = false;
3967 bool shrink = false;
3969 /* Remove size from argv manually so that negative numbers are not treated
3970 * as options by getopt. */
3971 if (argc < 3) {
3972 error_exit("Not enough arguments");
3973 return 1;
3976 size = argv[--argc];
3978 /* Parse getopt arguments */
3979 fmt = NULL;
3980 for(;;) {
3981 static const struct option long_options[] = {
3982 {"help", no_argument, 0, 'h'},
3983 {"object", required_argument, 0, OPTION_OBJECT},
3984 {"image-opts", no_argument, 0, OPTION_IMAGE_OPTS},
3985 {"preallocation", required_argument, 0, OPTION_PREALLOCATION},
3986 {"shrink", no_argument, 0, OPTION_SHRINK},
3987 {0, 0, 0, 0}
3989 c = getopt_long(argc, argv, ":f:hq",
3990 long_options, NULL);
3991 if (c == -1) {
3992 break;
3994 switch(c) {
3995 case ':':
3996 missing_argument(argv[optind - 1]);
3997 break;
3998 case '?':
3999 unrecognized_option(argv[optind - 1]);
4000 break;
4001 case 'h':
4002 help();
4003 break;
4004 case 'f':
4005 fmt = optarg;
4006 break;
4007 case 'q':
4008 quiet = true;
4009 break;
4010 case OPTION_OBJECT:
4011 user_creatable_process_cmdline(optarg);
4012 break;
4013 case OPTION_IMAGE_OPTS:
4014 image_opts = true;
4015 break;
4016 case OPTION_PREALLOCATION:
4017 prealloc = qapi_enum_parse(&PreallocMode_lookup, optarg,
4018 PREALLOC_MODE__MAX, NULL);
4019 if (prealloc == PREALLOC_MODE__MAX) {
4020 error_report("Invalid preallocation mode '%s'", optarg);
4021 return 1;
4023 break;
4024 case OPTION_SHRINK:
4025 shrink = true;
4026 break;
4029 if (optind != argc - 1) {
4030 error_exit("Expecting image file name and size");
4032 filename = argv[optind++];
4034 /* Choose grow, shrink, or absolute resize mode */
4035 switch (size[0]) {
4036 case '+':
4037 relative = 1;
4038 size++;
4039 break;
4040 case '-':
4041 relative = -1;
4042 size++;
4043 break;
4044 default:
4045 relative = 0;
4046 break;
4049 /* Parse size */
4050 param = qemu_opts_create(&resize_options, NULL, 0, &error_abort);
4051 if (!qemu_opt_set(param, BLOCK_OPT_SIZE, size, &err)) {
4052 error_report_err(err);
4053 ret = -1;
4054 qemu_opts_del(param);
4055 goto out;
4057 n = qemu_opt_get_size(param, BLOCK_OPT_SIZE, 0);
4058 qemu_opts_del(param);
4060 blk = img_open(image_opts, filename, fmt,
4061 BDRV_O_RDWR | BDRV_O_RESIZE, false, quiet,
4062 false);
4063 if (!blk) {
4064 ret = -1;
4065 goto out;
4068 current_size = blk_getlength(blk);
4069 if (current_size < 0) {
4070 error_report("Failed to inquire current image length: %s",
4071 strerror(-current_size));
4072 ret = -1;
4073 goto out;
4076 if (relative) {
4077 total_size = current_size + n * relative;
4078 } else {
4079 total_size = n;
4081 if (total_size <= 0) {
4082 error_report("New image size must be positive");
4083 ret = -1;
4084 goto out;
4087 if (total_size <= current_size && prealloc != PREALLOC_MODE_OFF) {
4088 error_report("Preallocation can only be used for growing images");
4089 ret = -1;
4090 goto out;
4093 if (total_size < current_size && !shrink) {
4094 error_report("Use the --shrink option to perform a shrink operation.");
4095 warn_report("Shrinking an image will delete all data beyond the "
4096 "shrunken image's end. Before performing such an "
4097 "operation, make sure there is no important data there.");
4098 ret = -1;
4099 goto out;
4103 * The user expects the image to have the desired size after
4104 * resizing, so pass @exact=true. It is of no use to report
4105 * success when the image has not actually been resized.
4107 ret = blk_truncate(blk, total_size, true, prealloc, 0, &err);
4108 if (!ret) {
4109 qprintf(quiet, "Image resized.\n");
4110 } else {
4111 error_report_err(err);
4113 out:
4114 blk_unref(blk);
4115 if (ret) {
4116 return 1;
4118 return 0;
4121 static void amend_status_cb(BlockDriverState *bs,
4122 int64_t offset, int64_t total_work_size,
4123 void *opaque)
4125 qemu_progress_print(100.f * offset / total_work_size, 0);
4128 static int print_amend_option_help(const char *format)
4130 BlockDriver *drv;
4132 /* Find driver and parse its options */
4133 drv = bdrv_find_format(format);
4134 if (!drv) {
4135 error_report("Unknown file format '%s'", format);
4136 return 1;
4139 if (!drv->bdrv_amend_options) {
4140 error_report("Format driver '%s' does not support option amendment",
4141 format);
4142 return 1;
4145 /* Every driver supporting amendment must have amend_opts */
4146 assert(drv->amend_opts);
4148 printf("Amend options for '%s':\n", format);
4149 qemu_opts_print_help(drv->amend_opts, false);
4150 return 0;
4153 static int img_amend(int argc, char **argv)
4155 Error *err = NULL;
4156 int c, ret = 0;
4157 char *options = NULL;
4158 QemuOptsList *amend_opts = NULL;
4159 QemuOpts *opts = NULL;
4160 const char *fmt = NULL, *filename, *cache;
4161 int flags;
4162 bool writethrough;
4163 bool quiet = false, progress = false;
4164 BlockBackend *blk = NULL;
4165 BlockDriverState *bs = NULL;
4166 bool image_opts = false;
4167 bool force = false;
4169 cache = BDRV_DEFAULT_CACHE;
4170 for (;;) {
4171 static const struct option long_options[] = {
4172 {"help", no_argument, 0, 'h'},
4173 {"object", required_argument, 0, OPTION_OBJECT},
4174 {"image-opts", no_argument, 0, OPTION_IMAGE_OPTS},
4175 {"force", no_argument, 0, OPTION_FORCE},
4176 {0, 0, 0, 0}
4178 c = getopt_long(argc, argv, ":ho:f:t:pq",
4179 long_options, NULL);
4180 if (c == -1) {
4181 break;
4184 switch (c) {
4185 case ':':
4186 missing_argument(argv[optind - 1]);
4187 break;
4188 case '?':
4189 unrecognized_option(argv[optind - 1]);
4190 break;
4191 case 'h':
4192 help();
4193 break;
4194 case 'o':
4195 if (accumulate_options(&options, optarg) < 0) {
4196 ret = -1;
4197 goto out_no_progress;
4199 break;
4200 case 'f':
4201 fmt = optarg;
4202 break;
4203 case 't':
4204 cache = optarg;
4205 break;
4206 case 'p':
4207 progress = true;
4208 break;
4209 case 'q':
4210 quiet = true;
4211 break;
4212 case OPTION_OBJECT:
4213 user_creatable_process_cmdline(optarg);
4214 break;
4215 case OPTION_IMAGE_OPTS:
4216 image_opts = true;
4217 break;
4218 case OPTION_FORCE:
4219 force = true;
4220 break;
4224 if (!options) {
4225 error_exit("Must specify options (-o)");
4228 if (quiet) {
4229 progress = false;
4231 qemu_progress_init(progress, 1.0);
4233 filename = (optind == argc - 1) ? argv[argc - 1] : NULL;
4234 if (fmt && has_help_option(options)) {
4235 /* If a format is explicitly specified (and possibly no filename is
4236 * given), print option help here */
4237 ret = print_amend_option_help(fmt);
4238 goto out;
4241 if (optind != argc - 1) {
4242 error_report("Expecting one image file name");
4243 ret = -1;
4244 goto out;
4247 flags = BDRV_O_RDWR;
4248 ret = bdrv_parse_cache_mode(cache, &flags, &writethrough);
4249 if (ret < 0) {
4250 error_report("Invalid cache option: %s", cache);
4251 goto out;
4254 blk = img_open(image_opts, filename, fmt, flags, writethrough, quiet,
4255 false);
4256 if (!blk) {
4257 ret = -1;
4258 goto out;
4260 bs = blk_bs(blk);
4262 fmt = bs->drv->format_name;
4264 if (has_help_option(options)) {
4265 /* If the format was auto-detected, print option help here */
4266 ret = print_amend_option_help(fmt);
4267 goto out;
4270 if (!bs->drv->bdrv_amend_options) {
4271 error_report("Format driver '%s' does not support option amendment",
4272 fmt);
4273 ret = -1;
4274 goto out;
4277 /* Every driver supporting amendment must have amend_opts */
4278 assert(bs->drv->amend_opts);
4280 amend_opts = qemu_opts_append(amend_opts, bs->drv->amend_opts);
4281 opts = qemu_opts_create(amend_opts, NULL, 0, &error_abort);
4282 if (!qemu_opts_do_parse(opts, options, NULL, &err)) {
4283 /* Try to parse options using the create options */
4284 amend_opts = qemu_opts_append(amend_opts, bs->drv->create_opts);
4285 qemu_opts_del(opts);
4286 opts = qemu_opts_create(amend_opts, NULL, 0, &error_abort);
4287 if (qemu_opts_do_parse(opts, options, NULL, NULL)) {
4288 error_append_hint(&err,
4289 "This option is only supported for image creation\n");
4292 error_report_err(err);
4293 ret = -1;
4294 goto out;
4297 /* In case the driver does not call amend_status_cb() */
4298 qemu_progress_print(0.f, 0);
4299 ret = bdrv_amend_options(bs, opts, &amend_status_cb, NULL, force, &err);
4300 qemu_progress_print(100.f, 0);
4301 if (ret < 0) {
4302 error_report_err(err);
4303 goto out;
4306 out:
4307 qemu_progress_end();
4309 out_no_progress:
4310 blk_unref(blk);
4311 qemu_opts_del(opts);
4312 qemu_opts_free(amend_opts);
4313 g_free(options);
4315 if (ret) {
4316 return 1;
4318 return 0;
4321 typedef struct BenchData {
4322 BlockBackend *blk;
4323 uint64_t image_size;
4324 bool write;
4325 int bufsize;
4326 int step;
4327 int nrreq;
4328 int n;
4329 int flush_interval;
4330 bool drain_on_flush;
4331 uint8_t *buf;
4332 QEMUIOVector *qiov;
4334 int in_flight;
4335 bool in_flush;
4336 uint64_t offset;
4337 } BenchData;
/*
 * Completion callback for flushes issued without draining the queue: a
 * failed flush is reported and terminates the process, a successful one
 * needs no further action.
 */
static void bench_undrained_flush_cb(void *opaque, int ret)
{
    if (ret < 0) {
        error_report("Failed flush request: %s", strerror(-ret));
        exit(EXIT_FAILURE);
    }
}
4347 static void bench_cb(void *opaque, int ret)
4349 BenchData *b = opaque;
4350 BlockAIOCB *acb;
4352 if (ret < 0) {
4353 error_report("Failed request: %s", strerror(-ret));
4354 exit(EXIT_FAILURE);
4357 if (b->in_flush) {
4358 /* Just finished a flush with drained queue: Start next requests */
4359 assert(b->in_flight == 0);
4360 b->in_flush = false;
4361 } else if (b->in_flight > 0) {
4362 int remaining = b->n - b->in_flight;
4364 b->n--;
4365 b->in_flight--;
4367 /* Time for flush? Drain queue if requested, then flush */
4368 if (b->flush_interval && remaining % b->flush_interval == 0) {
4369 if (!b->in_flight || !b->drain_on_flush) {
4370 BlockCompletionFunc *cb;
4372 if (b->drain_on_flush) {
4373 b->in_flush = true;
4374 cb = bench_cb;
4375 } else {
4376 cb = bench_undrained_flush_cb;
4379 acb = blk_aio_flush(b->blk, cb, b);
4380 if (!acb) {
4381 error_report("Failed to issue flush request");
4382 exit(EXIT_FAILURE);
4385 if (b->drain_on_flush) {
4386 return;
4391 while (b->n > b->in_flight && b->in_flight < b->nrreq) {
4392 int64_t offset = b->offset;
4393 /* blk_aio_* might look for completed I/Os and kick bench_cb
4394 * again, so make sure this operation is counted by in_flight
4395 * and b->offset is ready for the next submission.
4397 b->in_flight++;
4398 b->offset += b->step;
4399 b->offset %= b->image_size;
4400 if (b->write) {
4401 acb = blk_aio_pwritev(b->blk, offset, b->qiov, 0, bench_cb, b);
4402 } else {
4403 acb = blk_aio_preadv(b->blk, offset, b->qiov, 0, bench_cb, b);
4405 if (!acb) {
4406 error_report("Failed to issue request");
4407 exit(EXIT_FAILURE);
4412 static int img_bench(int argc, char **argv)
4414 int c, ret = 0;
4415 const char *fmt = NULL, *filename;
4416 bool quiet = false;
4417 bool image_opts = false;
4418 bool is_write = false;
4419 int count = 75000;
4420 int depth = 64;
4421 int64_t offset = 0;
4422 size_t bufsize = 4096;
4423 int pattern = 0;
4424 size_t step = 0;
4425 int flush_interval = 0;
4426 bool drain_on_flush = true;
4427 int64_t image_size;
4428 BlockBackend *blk = NULL;
4429 BenchData data = {};
4430 int flags = 0;
4431 bool writethrough = false;
4432 struct timeval t1, t2;
4433 int i;
4434 bool force_share = false;
4435 size_t buf_size = 0;
4437 for (;;) {
4438 static const struct option long_options[] = {
4439 {"help", no_argument, 0, 'h'},
4440 {"flush-interval", required_argument, 0, OPTION_FLUSH_INTERVAL},
4441 {"image-opts", no_argument, 0, OPTION_IMAGE_OPTS},
4442 {"pattern", required_argument, 0, OPTION_PATTERN},
4443 {"no-drain", no_argument, 0, OPTION_NO_DRAIN},
4444 {"force-share", no_argument, 0, 'U'},
4445 {0, 0, 0, 0}
4447 c = getopt_long(argc, argv, ":hc:d:f:ni:o:qs:S:t:wU", long_options,
4448 NULL);
4449 if (c == -1) {
4450 break;
4453 switch (c) {
4454 case ':':
4455 missing_argument(argv[optind - 1]);
4456 break;
4457 case '?':
4458 unrecognized_option(argv[optind - 1]);
4459 break;
4460 case 'h':
4461 help();
4462 break;
4463 case 'c':
4465 unsigned long res;
4467 if (qemu_strtoul(optarg, NULL, 0, &res) < 0 || res > INT_MAX) {
4468 error_report("Invalid request count specified");
4469 return 1;
4471 count = res;
4472 break;
4474 case 'd':
4476 unsigned long res;
4478 if (qemu_strtoul(optarg, NULL, 0, &res) < 0 || res > INT_MAX) {
4479 error_report("Invalid queue depth specified");
4480 return 1;
4482 depth = res;
4483 break;
4485 case 'f':
4486 fmt = optarg;
4487 break;
4488 case 'n':
4489 flags |= BDRV_O_NATIVE_AIO;
4490 break;
4491 case 'i':
4492 ret = bdrv_parse_aio(optarg, &flags);
4493 if (ret < 0) {
4494 error_report("Invalid aio option: %s", optarg);
4495 ret = -1;
4496 goto out;
4498 break;
4499 case 'o':
4501 offset = cvtnum("offset", optarg);
4502 if (offset < 0) {
4503 return 1;
4505 break;
4507 break;
4508 case 'q':
4509 quiet = true;
4510 break;
4511 case 's':
4513 int64_t sval;
4515 sval = cvtnum_full("buffer size", optarg, 0, INT_MAX);
4516 if (sval < 0) {
4517 return 1;
4520 bufsize = sval;
4521 break;
4523 case 'S':
4525 int64_t sval;
4527 sval = cvtnum_full("step_size", optarg, 0, INT_MAX);
4528 if (sval < 0) {
4529 return 1;
4532 step = sval;
4533 break;
4535 case 't':
4536 ret = bdrv_parse_cache_mode(optarg, &flags, &writethrough);
4537 if (ret < 0) {
4538 error_report("Invalid cache mode");
4539 ret = -1;
4540 goto out;
4542 break;
4543 case 'w':
4544 flags |= BDRV_O_RDWR;
4545 is_write = true;
4546 break;
4547 case 'U':
4548 force_share = true;
4549 break;
4550 case OPTION_PATTERN:
4552 unsigned long res;
4554 if (qemu_strtoul(optarg, NULL, 0, &res) < 0 || res > 0xff) {
4555 error_report("Invalid pattern byte specified");
4556 return 1;
4558 pattern = res;
4559 break;
4561 case OPTION_FLUSH_INTERVAL:
4563 unsigned long res;
4565 if (qemu_strtoul(optarg, NULL, 0, &res) < 0 || res > INT_MAX) {
4566 error_report("Invalid flush interval specified");
4567 return 1;
4569 flush_interval = res;
4570 break;
4572 case OPTION_NO_DRAIN:
4573 drain_on_flush = false;
4574 break;
4575 case OPTION_IMAGE_OPTS:
4576 image_opts = true;
4577 break;
4581 if (optind != argc - 1) {
4582 error_exit("Expecting one image file name");
4584 filename = argv[argc - 1];
4586 if (!is_write && flush_interval) {
4587 error_report("--flush-interval is only available in write tests");
4588 ret = -1;
4589 goto out;
4591 if (flush_interval && flush_interval < depth) {
4592 error_report("Flush interval can't be smaller than depth");
4593 ret = -1;
4594 goto out;
4597 blk = img_open(image_opts, filename, fmt, flags, writethrough, quiet,
4598 force_share);
4599 if (!blk) {
4600 ret = -1;
4601 goto out;
4604 image_size = blk_getlength(blk);
4605 if (image_size < 0) {
4606 ret = image_size;
4607 goto out;
4610 data = (BenchData) {
4611 .blk = blk,
4612 .image_size = image_size,
4613 .bufsize = bufsize,
4614 .step = step ?: bufsize,
4615 .nrreq = depth,
4616 .n = count,
4617 .offset = offset,
4618 .write = is_write,
4619 .flush_interval = flush_interval,
4620 .drain_on_flush = drain_on_flush,
4622 printf("Sending %d %s requests, %d bytes each, %d in parallel "
4623 "(starting at offset %" PRId64 ", step size %d)\n",
4624 data.n, data.write ? "write" : "read", data.bufsize, data.nrreq,
4625 data.offset, data.step);
4626 if (flush_interval) {
4627 printf("Sending flush every %d requests\n", flush_interval);
4630 buf_size = data.nrreq * data.bufsize;
4631 data.buf = blk_blockalign(blk, buf_size);
4632 memset(data.buf, pattern, data.nrreq * data.bufsize);
4634 blk_register_buf(blk, data.buf, buf_size, &error_fatal);
4636 data.qiov = g_new(QEMUIOVector, data.nrreq);
4637 for (i = 0; i < data.nrreq; i++) {
4638 qemu_iovec_init(&data.qiov[i], 1);
4639 qemu_iovec_add(&data.qiov[i],
4640 data.buf + i * data.bufsize, data.bufsize);
4643 gettimeofday(&t1, NULL);
4644 bench_cb(&data, 0);
4646 while (data.n > 0) {
4647 main_loop_wait(false);
4649 gettimeofday(&t2, NULL);
4651 printf("Run completed in %3.3f seconds.\n",
4652 (t2.tv_sec - t1.tv_sec)
4653 + ((double)(t2.tv_usec - t1.tv_usec) / 1000000));
4655 out:
4656 if (data.buf) {
4657 blk_unregister_buf(blk, data.buf, buf_size);
4659 qemu_vfree(data.buf);
4660 blk_unref(blk);
4662 if (ret) {
4663 return 1;
4665 return 0;
/* Operations that qemu-img bitmap can apply to a dirty bitmap */
enum ImgBitmapAct {
    BITMAP_ADD,
    BITMAP_REMOVE,
    BITMAP_CLEAR,
    BITMAP_ENABLE,
    BITMAP_DISABLE,
    BITMAP_MERGE,
};
4676 typedef struct ImgBitmapAction {
4677 enum ImgBitmapAct act;
4678 const char *src; /* only used for merge */
4679 QSIMPLEQ_ENTRY(ImgBitmapAction) next;
4680 } ImgBitmapAction;
4682 static int img_bitmap(int argc, char **argv)
4684 Error *err = NULL;
4685 int c, ret = 1;
4686 QemuOpts *opts = NULL;
4687 const char *fmt = NULL, *src_fmt = NULL, *src_filename = NULL;
4688 const char *filename, *bitmap;
4689 BlockBackend *blk = NULL, *src = NULL;
4690 BlockDriverState *bs = NULL, *src_bs = NULL;
4691 bool image_opts = false;
4692 int64_t granularity = 0;
4693 bool add = false, merge = false;
4694 QSIMPLEQ_HEAD(, ImgBitmapAction) actions;
4695 ImgBitmapAction *act, *act_next;
4696 const char *op;
4697 int inactivate_ret;
4699 QSIMPLEQ_INIT(&actions);
4701 for (;;) {
4702 static const struct option long_options[] = {
4703 {"help", no_argument, 0, 'h'},
4704 {"object", required_argument, 0, OPTION_OBJECT},
4705 {"image-opts", no_argument, 0, OPTION_IMAGE_OPTS},
4706 {"add", no_argument, 0, OPTION_ADD},
4707 {"remove", no_argument, 0, OPTION_REMOVE},
4708 {"clear", no_argument, 0, OPTION_CLEAR},
4709 {"enable", no_argument, 0, OPTION_ENABLE},
4710 {"disable", no_argument, 0, OPTION_DISABLE},
4711 {"merge", required_argument, 0, OPTION_MERGE},
4712 {"granularity", required_argument, 0, 'g'},
4713 {"source-file", required_argument, 0, 'b'},
4714 {"source-format", required_argument, 0, 'F'},
4715 {0, 0, 0, 0}
4717 c = getopt_long(argc, argv, ":b:f:F:g:h", long_options, NULL);
4718 if (c == -1) {
4719 break;
4722 switch (c) {
4723 case ':':
4724 missing_argument(argv[optind - 1]);
4725 break;
4726 case '?':
4727 unrecognized_option(argv[optind - 1]);
4728 break;
4729 case 'h':
4730 help();
4731 break;
4732 case 'b':
4733 src_filename = optarg;
4734 break;
4735 case 'f':
4736 fmt = optarg;
4737 break;
4738 case 'F':
4739 src_fmt = optarg;
4740 break;
4741 case 'g':
4742 granularity = cvtnum("granularity", optarg);
4743 if (granularity < 0) {
4744 return 1;
4746 break;
4747 case OPTION_ADD:
4748 act = g_new0(ImgBitmapAction, 1);
4749 act->act = BITMAP_ADD;
4750 QSIMPLEQ_INSERT_TAIL(&actions, act, next);
4751 add = true;
4752 break;
4753 case OPTION_REMOVE:
4754 act = g_new0(ImgBitmapAction, 1);
4755 act->act = BITMAP_REMOVE;
4756 QSIMPLEQ_INSERT_TAIL(&actions, act, next);
4757 break;
4758 case OPTION_CLEAR:
4759 act = g_new0(ImgBitmapAction, 1);
4760 act->act = BITMAP_CLEAR;
4761 QSIMPLEQ_INSERT_TAIL(&actions, act, next);
4762 break;
4763 case OPTION_ENABLE:
4764 act = g_new0(ImgBitmapAction, 1);
4765 act->act = BITMAP_ENABLE;
4766 QSIMPLEQ_INSERT_TAIL(&actions, act, next);
4767 break;
4768 case OPTION_DISABLE:
4769 act = g_new0(ImgBitmapAction, 1);
4770 act->act = BITMAP_DISABLE;
4771 QSIMPLEQ_INSERT_TAIL(&actions, act, next);
4772 break;
4773 case OPTION_MERGE:
4774 act = g_new0(ImgBitmapAction, 1);
4775 act->act = BITMAP_MERGE;
4776 act->src = optarg;
4777 QSIMPLEQ_INSERT_TAIL(&actions, act, next);
4778 merge = true;
4779 break;
4780 case OPTION_OBJECT:
4781 user_creatable_process_cmdline(optarg);
4782 break;
4783 case OPTION_IMAGE_OPTS:
4784 image_opts = true;
4785 break;
4789 if (QSIMPLEQ_EMPTY(&actions)) {
4790 error_report("Need at least one of --add, --remove, --clear, "
4791 "--enable, --disable, or --merge");
4792 goto out;
4795 if (granularity && !add) {
4796 error_report("granularity only supported with --add");
4797 goto out;
4799 if (src_fmt && !src_filename) {
4800 error_report("-F only supported with -b");
4801 goto out;
4803 if (src_filename && !merge) {
4804 error_report("Merge bitmap source file only supported with "
4805 "--merge");
4806 goto out;
4809 if (optind != argc - 2) {
4810 error_report("Expecting filename and bitmap name");
4811 goto out;
4814 filename = argv[optind];
4815 bitmap = argv[optind + 1];
4818 * No need to open backing chains; we will be manipulating bitmaps
4819 * directly in this image without reference to image contents.
4821 blk = img_open(image_opts, filename, fmt, BDRV_O_RDWR | BDRV_O_NO_BACKING,
4822 false, false, false);
4823 if (!blk) {
4824 goto out;
4826 bs = blk_bs(blk);
4827 if (src_filename) {
4828 src = img_open(false, src_filename, src_fmt, BDRV_O_NO_BACKING,
4829 false, false, false);
4830 if (!src) {
4831 goto out;
4833 src_bs = blk_bs(src);
4834 } else {
4835 src_bs = bs;
4838 QSIMPLEQ_FOREACH_SAFE(act, &actions, next, act_next) {
4839 switch (act->act) {
4840 case BITMAP_ADD:
4841 qmp_block_dirty_bitmap_add(bs->node_name, bitmap,
4842 !!granularity, granularity, true, true,
4843 false, false, &err);
4844 op = "add";
4845 break;
4846 case BITMAP_REMOVE:
4847 qmp_block_dirty_bitmap_remove(bs->node_name, bitmap, &err);
4848 op = "remove";
4849 break;
4850 case BITMAP_CLEAR:
4851 qmp_block_dirty_bitmap_clear(bs->node_name, bitmap, &err);
4852 op = "clear";
4853 break;
4854 case BITMAP_ENABLE:
4855 qmp_block_dirty_bitmap_enable(bs->node_name, bitmap, &err);
4856 op = "enable";
4857 break;
4858 case BITMAP_DISABLE:
4859 qmp_block_dirty_bitmap_disable(bs->node_name, bitmap, &err);
4860 op = "disable";
4861 break;
4862 case BITMAP_MERGE:
4863 do_dirty_bitmap_merge(bs->node_name, bitmap, src_bs->node_name,
4864 act->src, &err);
4865 op = "merge";
4866 break;
4867 default:
4868 g_assert_not_reached();
4871 if (err) {
4872 error_reportf_err(err, "Operation %s on bitmap %s failed: ",
4873 op, bitmap);
4874 goto out;
4876 g_free(act);
4879 ret = 0;
4881 out:
4883 * Manually inactivate the images first because this way we can know whether
4884 * an error occurred. blk_unref() doesn't tell us about failures.
4886 inactivate_ret = bdrv_inactivate_all();
4887 if (inactivate_ret < 0) {
4888 error_report("Error while closing the image: %s", strerror(-inactivate_ret));
4889 ret = 1;
4892 blk_unref(src);
4893 blk_unref(blk);
4894 qemu_opts_del(opts);
4895 return ret;
/* Bits of DdInfo.flags recording which dd operands were given */
#define C_BS      01
#define C_COUNT   02
#define C_IF      04
#define C_OF      010
#define C_SKIP    020
/* Settings of a dd run that do not belong to a single input/output side */
struct DdInfo {
    unsigned int flags; /* OR of the C_* bits for the operands seen */
    int64_t count;      /* value of the count= operand */
};
/* Per-side (input or output) parameters of a dd run */
struct DdIo {
    int bsz;    /* Block size */
    char *filename;
    uint8_t *buf;
    int64_t offset;
};
/* Table entry mapping a dd operand name to its parser and its C_* flag */
struct DdOpts {
    const char *name;
    /* Parses the operand value; the visible handlers return 0 or 1 */
    int (*f)(const char *, struct DdIo *, struct DdIo *, struct DdInfo *);
    unsigned int flag;
};
4922 static int img_dd_bs(const char *arg,
4923 struct DdIo *in, struct DdIo *out,
4924 struct DdInfo *dd)
4926 int64_t res;
4928 res = cvtnum_full("bs", arg, 1, INT_MAX);
4930 if (res < 0) {
4931 return 1;
4933 in->bsz = out->bsz = res;
4935 return 0;
4938 static int img_dd_count(const char *arg,
4939 struct DdIo *in, struct DdIo *out,
4940 struct DdInfo *dd)
4942 dd->count = cvtnum("count", arg);
4944 if (dd->count < 0) {
4945 return 1;
4948 return 0;
4951 static int img_dd_if(const char *arg,
4952 struct DdIo *in, struct DdIo *out,
4953 struct DdInfo *dd)
4955 in->filename = g_strdup(arg);
4957 return 0;
4960 static int img_dd_of(const char *arg,
4961 struct DdIo *in, struct DdIo *out,
4962 struct DdInfo *dd)
4964 out->filename = g_strdup(arg);
4966 return 0;
4969 static int img_dd_skip(const char *arg,
4970 struct DdIo *in, struct DdIo *out,
4971 struct DdInfo *dd)
4973 in->offset = cvtnum("skip", arg);
4975 if (in->offset < 0) {
4976 return 1;
4979 return 0;
4982 static int img_dd(int argc, char **argv)
4984 int ret = 0;
4985 char *arg = NULL;
4986 char *tmp;
4987 BlockDriver *drv = NULL, *proto_drv = NULL;
4988 BlockBackend *blk1 = NULL, *blk2 = NULL;
4989 QemuOpts *opts = NULL;
4990 QemuOptsList *create_opts = NULL;
4991 Error *local_err = NULL;
4992 bool image_opts = false;
4993 int c, i;
4994 const char *out_fmt = "raw";
4995 const char *fmt = NULL;
4996 int64_t size = 0;
4997 int64_t out_pos, in_pos;
4998 bool force_share = false;
4999 struct DdInfo dd = {
5000 .flags = 0,
5001 .count = 0,
5003 struct DdIo in = {
5004 .bsz = 512, /* Block size is by default 512 bytes */
5005 .filename = NULL,
5006 .buf = NULL,
5007 .offset = 0
5009 struct DdIo out = {
5010 .bsz = 512,
5011 .filename = NULL,
5012 .buf = NULL,
5013 .offset = 0
5016 const struct DdOpts options[] = {
5017 { "bs", img_dd_bs, C_BS },
5018 { "count", img_dd_count, C_COUNT },
5019 { "if", img_dd_if, C_IF },
5020 { "of", img_dd_of, C_OF },
5021 { "skip", img_dd_skip, C_SKIP },
5022 { NULL, NULL, 0 }
5024 const struct option long_options[] = {
5025 { "help", no_argument, 0, 'h'},
5026 { "object", required_argument, 0, OPTION_OBJECT},
5027 { "image-opts", no_argument, 0, OPTION_IMAGE_OPTS},
5028 { "force-share", no_argument, 0, 'U'},
5029 { 0, 0, 0, 0 }
5032 while ((c = getopt_long(argc, argv, ":hf:O:U", long_options, NULL))) {
5033 if (c == EOF) {
5034 break;
5036 switch (c) {
5037 case 'O':
5038 out_fmt = optarg;
5039 break;
5040 case 'f':
5041 fmt = optarg;
5042 break;
5043 case ':':
5044 missing_argument(argv[optind - 1]);
5045 break;
5046 case '?':
5047 unrecognized_option(argv[optind - 1]);
5048 break;
5049 case 'h':
5050 help();
5051 break;
5052 case 'U':
5053 force_share = true;
5054 break;
5055 case OPTION_OBJECT:
5056 user_creatable_process_cmdline(optarg);
5057 break;
5058 case OPTION_IMAGE_OPTS:
5059 image_opts = true;
5060 break;
5064 for (i = optind; i < argc; i++) {
5065 int j;
5066 arg = g_strdup(argv[i]);
5068 tmp = strchr(arg, '=');
5069 if (tmp == NULL) {
5070 error_report("unrecognized operand %s", arg);
5071 ret = -1;
5072 goto out;
5075 *tmp++ = '\0';
5077 for (j = 0; options[j].name != NULL; j++) {
5078 if (!strcmp(arg, options[j].name)) {
5079 break;
5082 if (options[j].name == NULL) {
5083 error_report("unrecognized operand %s", arg);
5084 ret = -1;
5085 goto out;
5088 if (options[j].f(tmp, &in, &out, &dd) != 0) {
5089 ret = -1;
5090 goto out;
5092 dd.flags |= options[j].flag;
5093 g_free(arg);
5094 arg = NULL;
5097 if (!(dd.flags & C_IF && dd.flags & C_OF)) {
5098 error_report("Must specify both input and output files");
5099 ret = -1;
5100 goto out;
5103 blk1 = img_open(image_opts, in.filename, fmt, 0, false, false,
5104 force_share);
5106 if (!blk1) {
5107 ret = -1;
5108 goto out;
5111 drv = bdrv_find_format(out_fmt);
5112 if (!drv) {
5113 error_report("Unknown file format");
5114 ret = -1;
5115 goto out;
5117 proto_drv = bdrv_find_protocol(out.filename, true, &local_err);
5119 if (!proto_drv) {
5120 error_report_err(local_err);
5121 ret = -1;
5122 goto out;
5124 if (!drv->create_opts) {
5125 error_report("Format driver '%s' does not support image creation",
5126 drv->format_name);
5127 ret = -1;
5128 goto out;
5130 if (!proto_drv->create_opts) {
5131 error_report("Protocol driver '%s' does not support image creation",
5132 proto_drv->format_name);
5133 ret = -1;
5134 goto out;
5136 create_opts = qemu_opts_append(create_opts, drv->create_opts);
5137 create_opts = qemu_opts_append(create_opts, proto_drv->create_opts);
5139 opts = qemu_opts_create(create_opts, NULL, 0, &error_abort);
5141 size = blk_getlength(blk1);
5142 if (size < 0) {
5143 error_report("Failed to get size for '%s'", in.filename);
5144 ret = -1;
5145 goto out;
5148 if (dd.flags & C_COUNT && dd.count <= INT64_MAX / in.bsz &&
5149 dd.count * in.bsz < size) {
5150 size = dd.count * in.bsz;
5153 /* Overflow means the specified offset is beyond input image's size */
5154 if (dd.flags & C_SKIP && (in.offset > INT64_MAX / in.bsz ||
5155 size < in.bsz * in.offset)) {
5156 qemu_opt_set_number(opts, BLOCK_OPT_SIZE, 0, &error_abort);
5157 } else {
5158 qemu_opt_set_number(opts, BLOCK_OPT_SIZE,
5159 size - in.bsz * in.offset, &error_abort);
5162 ret = bdrv_create(drv, out.filename, opts, &local_err);
5163 if (ret < 0) {
5164 error_reportf_err(local_err,
5165 "%s: error while creating output image: ",
5166 out.filename);
5167 ret = -1;
5168 goto out;
5171 /* TODO, we can't honour --image-opts for the target,
5172 * since it needs to be given in a format compatible
5173 * with the bdrv_create() call above which does not
5174 * support image-opts style.
5176 blk2 = img_open_file(out.filename, NULL, out_fmt, BDRV_O_RDWR,
5177 false, false, false);
5179 if (!blk2) {
5180 ret = -1;
5181 goto out;
5184 if (dd.flags & C_SKIP && (in.offset > INT64_MAX / in.bsz ||
5185 size < in.offset * in.bsz)) {
5186 /* We give a warning if the skip option is bigger than the input
5187 * size and create an empty output disk image (i.e. like dd(1)).
5189 error_report("%s: cannot skip to specified offset", in.filename);
5190 in_pos = size;
5191 } else {
5192 in_pos = in.offset * in.bsz;
5195 in.buf = g_new(uint8_t, in.bsz);
5197 for (out_pos = 0; in_pos < size; ) {
5198 int bytes = (in_pos + in.bsz > size) ? size - in_pos : in.bsz;
5200 ret = blk_pread(blk1, in_pos, bytes, in.buf, 0);
5201 if (ret < 0) {
5202 error_report("error while reading from input image file: %s",
5203 strerror(-ret));
5204 goto out;
5206 in_pos += bytes;
5208 ret = blk_pwrite(blk2, out_pos, bytes, in.buf, 0);
5209 if (ret < 0) {
5210 error_report("error while writing to output image file: %s",
5211 strerror(-ret));
5212 goto out;
5214 out_pos += bytes;
5217 out:
5218 g_free(arg);
5219 qemu_opts_del(opts);
5220 qemu_opts_free(create_opts);
5221 blk_unref(blk1);
5222 blk_unref(blk2);
5223 g_free(in.filename);
5224 g_free(out.filename);
5225 g_free(in.buf);
5226 g_free(out.buf);
5228 if (ret) {
5229 return 1;
5231 return 0;
5234 static void dump_json_block_measure_info(BlockMeasureInfo *info)
5236 GString *str;
5237 QObject *obj;
5238 Visitor *v = qobject_output_visitor_new(&obj);
5240 visit_type_BlockMeasureInfo(v, NULL, &info, &error_abort);
5241 visit_complete(v, &obj);
5242 str = qobject_to_json_pretty(obj, true);
5243 assert(str != NULL);
5244 printf("%s\n", str->str);
5245 qobject_unref(obj);
5246 visit_free(v);
5247 g_string_free(str, true);
5250 static int img_measure(int argc, char **argv)
5252 static const struct option long_options[] = {
5253 {"help", no_argument, 0, 'h'},
5254 {"image-opts", no_argument, 0, OPTION_IMAGE_OPTS},
5255 {"object", required_argument, 0, OPTION_OBJECT},
5256 {"output", required_argument, 0, OPTION_OUTPUT},
5257 {"size", required_argument, 0, OPTION_SIZE},
5258 {"force-share", no_argument, 0, 'U'},
5259 {0, 0, 0, 0}
5261 OutputFormat output_format = OFORMAT_HUMAN;
5262 BlockBackend *in_blk = NULL;
5263 BlockDriver *drv;
5264 const char *filename = NULL;
5265 const char *fmt = NULL;
5266 const char *out_fmt = "raw";
5267 char *options = NULL;
5268 char *snapshot_name = NULL;
5269 bool force_share = false;
5270 QemuOpts *opts = NULL;
5271 QemuOpts *object_opts = NULL;
5272 QemuOpts *sn_opts = NULL;
5273 QemuOptsList *create_opts = NULL;
5274 bool image_opts = false;
5275 uint64_t img_size = UINT64_MAX;
5276 BlockMeasureInfo *info = NULL;
5277 Error *local_err = NULL;
5278 int ret = 1;
5279 int c;
5281 while ((c = getopt_long(argc, argv, "hf:O:o:l:U",
5282 long_options, NULL)) != -1) {
5283 switch (c) {
5284 case '?':
5285 case 'h':
5286 help();
5287 break;
5288 case 'f':
5289 fmt = optarg;
5290 break;
5291 case 'O':
5292 out_fmt = optarg;
5293 break;
5294 case 'o':
5295 if (accumulate_options(&options, optarg) < 0) {
5296 goto out;
5298 break;
5299 case 'l':
5300 if (strstart(optarg, SNAPSHOT_OPT_BASE, NULL)) {
5301 sn_opts = qemu_opts_parse_noisily(&internal_snapshot_opts,
5302 optarg, false);
5303 if (!sn_opts) {
5304 error_report("Failed in parsing snapshot param '%s'",
5305 optarg);
5306 goto out;
5308 } else {
5309 snapshot_name = optarg;
5311 break;
5312 case 'U':
5313 force_share = true;
5314 break;
5315 case OPTION_OBJECT:
5316 user_creatable_process_cmdline(optarg);
5317 break;
5318 case OPTION_IMAGE_OPTS:
5319 image_opts = true;
5320 break;
5321 case OPTION_OUTPUT:
5322 if (!strcmp(optarg, "json")) {
5323 output_format = OFORMAT_JSON;
5324 } else if (!strcmp(optarg, "human")) {
5325 output_format = OFORMAT_HUMAN;
5326 } else {
5327 error_report("--output must be used with human or json "
5328 "as argument.");
5329 goto out;
5331 break;
5332 case OPTION_SIZE:
5334 int64_t sval;
5336 sval = cvtnum("image size", optarg);
5337 if (sval < 0) {
5338 goto out;
5340 img_size = (uint64_t)sval;
5342 break;
5346 if (argc - optind > 1) {
5347 error_report("At most one filename argument is allowed.");
5348 goto out;
5349 } else if (argc - optind == 1) {
5350 filename = argv[optind];
5353 if (!filename && (image_opts || fmt || snapshot_name || sn_opts)) {
5354 error_report("--image-opts, -f, and -l require a filename argument.");
5355 goto out;
5357 if (filename && img_size != UINT64_MAX) {
5358 error_report("--size N cannot be used together with a filename.");
5359 goto out;
5361 if (!filename && img_size == UINT64_MAX) {
5362 error_report("Either --size N or one filename must be specified.");
5363 goto out;
5366 if (filename) {
5367 in_blk = img_open(image_opts, filename, fmt, 0,
5368 false, false, force_share);
5369 if (!in_blk) {
5370 goto out;
5373 if (sn_opts) {
5374 bdrv_snapshot_load_tmp(blk_bs(in_blk),
5375 qemu_opt_get(sn_opts, SNAPSHOT_OPT_ID),
5376 qemu_opt_get(sn_opts, SNAPSHOT_OPT_NAME),
5377 &local_err);
5378 } else if (snapshot_name != NULL) {
5379 bdrv_snapshot_load_tmp_by_id_or_name(blk_bs(in_blk),
5380 snapshot_name, &local_err);
5382 if (local_err) {
5383 error_reportf_err(local_err, "Failed to load snapshot: ");
5384 goto out;
5388 drv = bdrv_find_format(out_fmt);
5389 if (!drv) {
5390 error_report("Unknown file format '%s'", out_fmt);
5391 goto out;
5393 if (!drv->create_opts) {
5394 error_report("Format driver '%s' does not support image creation",
5395 drv->format_name);
5396 goto out;
5399 create_opts = qemu_opts_append(create_opts, drv->create_opts);
5400 create_opts = qemu_opts_append(create_opts, bdrv_file.create_opts);
5401 opts = qemu_opts_create(create_opts, NULL, 0, &error_abort);
5402 if (options) {
5403 if (!qemu_opts_do_parse(opts, options, NULL, &local_err)) {
5404 error_report_err(local_err);
5405 error_report("Invalid options for file format '%s'", out_fmt);
5406 goto out;
5409 if (img_size != UINT64_MAX) {
5410 qemu_opt_set_number(opts, BLOCK_OPT_SIZE, img_size, &error_abort);
5413 info = bdrv_measure(drv, opts, in_blk ? blk_bs(in_blk) : NULL, &local_err);
5414 if (local_err) {
5415 error_report_err(local_err);
5416 goto out;
5419 if (output_format == OFORMAT_HUMAN) {
5420 printf("required size: %" PRIu64 "\n", info->required);
5421 printf("fully allocated size: %" PRIu64 "\n", info->fully_allocated);
5422 if (info->has_bitmaps) {
5423 printf("bitmaps size: %" PRIu64 "\n", info->bitmaps);
5425 } else {
5426 dump_json_block_measure_info(info);
5429 ret = 0;
5431 out:
5432 qapi_free_BlockMeasureInfo(info);
5433 qemu_opts_del(object_opts);
5434 qemu_opts_del(opts);
5435 qemu_opts_del(sn_opts);
5436 qemu_opts_free(create_opts);
5437 g_free(options);
5438 blk_unref(in_blk);
5439 return ret;
5442 static const img_cmd_t img_cmds[] = {
5443 #define DEF(option, callback, arg_string) \
5444 { option, callback },
5445 #include "qemu-img-cmds.h"
5446 #undef DEF
5447 { NULL, NULL, },
5450 int main(int argc, char **argv)
5452 const img_cmd_t *cmd;
5453 const char *cmdname;
5454 int c;
5455 static const struct option long_options[] = {
5456 {"help", no_argument, 0, 'h'},
5457 {"version", no_argument, 0, 'V'},
5458 {"trace", required_argument, NULL, 'T'},
5459 {0, 0, 0, 0}
5462 #ifdef CONFIG_POSIX
5463 signal(SIGPIPE, SIG_IGN);
5464 #endif
5466 socket_init();
5467 error_init(argv[0]);
5468 module_call_init(MODULE_INIT_TRACE);
5469 qemu_init_exec_dir(argv[0]);
5471 qemu_init_main_loop(&error_fatal);
5473 qcrypto_init(&error_fatal);
5475 module_call_init(MODULE_INIT_QOM);
5476 bdrv_init();
5477 if (argc < 2) {
5478 error_exit("Not enough arguments");
5481 qemu_add_opts(&qemu_source_opts);
5482 qemu_add_opts(&qemu_trace_opts);
5484 while ((c = getopt_long(argc, argv, "+:hVT:", long_options, NULL)) != -1) {
5485 switch (c) {
5486 case ':':
5487 missing_argument(argv[optind - 1]);
5488 return 0;
5489 case '?':
5490 unrecognized_option(argv[optind - 1]);
5491 return 0;
5492 case 'h':
5493 help();
5494 return 0;
5495 case 'V':
5496 printf(QEMU_IMG_VERSION);
5497 return 0;
5498 case 'T':
5499 trace_opt_parse(optarg);
5500 break;
5504 cmdname = argv[optind];
5506 /* reset getopt_long scanning */
5507 argc -= optind;
5508 if (argc < 1) {
5509 return 0;
5511 argv += optind;
5512 qemu_reset_optind();
5514 if (!trace_init_backends()) {
5515 exit(1);
5517 trace_init_file();
5518 qemu_set_log(LOG_TRACE, &error_fatal);
5520 /* find the command */
5521 for (cmd = img_cmds; cmd->name != NULL; cmd++) {
5522 if (!strcmp(cmdname, cmd->name)) {
5523 return cmd->handler(argc, argv);
5527 /* not found */
5528 error_exit("Command not found: %s", cmdname);