qemu
/
blockdev.c
3649 строк · 108.5 Кб
1/*
2* QEMU host block devices
3*
4* Copyright (c) 2003-2008 Fabrice Bellard
5*
6* This work is licensed under the terms of the GNU GPL, version 2 or
7* later. See the COPYING file in the top-level directory.
8*
9* This file incorporates work covered by the following copyright and
10* permission notice:
11*
12* Copyright (c) 2003-2008 Fabrice Bellard
13*
14* Permission is hereby granted, free of charge, to any person obtaining a copy
15* of this software and associated documentation files (the "Software"), to deal
16* in the Software without restriction, including without limitation the rights
17* to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
18* copies of the Software, and to permit persons to whom the Software is
19* furnished to do so, subject to the following conditions:
20*
21* The above copyright notice and this permission notice shall be included in
22* all copies or substantial portions of the Software.
23*
24* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
25* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
26* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
27* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
28* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
29* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
30* THE SOFTWARE.
31*/
32
33#include "qemu/osdep.h"34#include "sysemu/block-backend.h"35#include "sysemu/blockdev.h"36#include "hw/block/block.h"37#include "block/blockjob.h"38#include "block/dirty-bitmap.h"39#include "block/qdict.h"40#include "block/throttle-groups.h"41#include "monitor/monitor.h"42#include "qemu/error-report.h"43#include "qemu/option.h"44#include "qemu/qemu-print.h"45#include "qemu/config-file.h"46#include "qapi/qapi-commands-block.h"47#include "qapi/qapi-commands-transaction.h"48#include "qapi/qapi-visit-block-core.h"49#include "qapi/qmp/qdict.h"50#include "qapi/qmp/qnum.h"51#include "qapi/qmp/qstring.h"52#include "qapi/error.h"53#include "qapi/qmp/qerror.h"54#include "qapi/qmp/qlist.h"55#include "qapi/qobject-output-visitor.h"56#include "sysemu/sysemu.h"57#include "sysemu/iothread.h"58#include "block/block_int.h"59#include "block/trace.h"60#include "sysemu/runstate.h"61#include "sysemu/replay.h"62#include "qemu/cutils.h"63#include "qemu/help_option.h"64#include "qemu/main-loop.h"65#include "qemu/throttle-options.h"66
67/* Protected by BQL */
68QTAILQ_HEAD(, BlockDriverState) monitor_bdrv_states =69QTAILQ_HEAD_INITIALIZER(monitor_bdrv_states);70
71void bdrv_set_monitor_owned(BlockDriverState *bs)72{
73GLOBAL_STATE_CODE();74QTAILQ_INSERT_TAIL(&monitor_bdrv_states, bs, monitor_list);75}
76
77static const char *const if_name[IF_COUNT] = {78[IF_NONE] = "none",79[IF_IDE] = "ide",80[IF_SCSI] = "scsi",81[IF_FLOPPY] = "floppy",82[IF_PFLASH] = "pflash",83[IF_MTD] = "mtd",84[IF_SD] = "sd",85[IF_VIRTIO] = "virtio",86[IF_XEN] = "xen",87};88
89static int if_max_devs[IF_COUNT] = {90/*91* Do not change these numbers! They govern how drive option
92* index maps to unit and bus. That mapping is ABI.
93*
94* All controllers used to implement if=T drives need to support
95* if_max_devs[T] units, for any T with if_max_devs[T] != 0.
96* Otherwise, some index values map to "impossible" bus, unit
97* values.
98*
99* For instance, if you change [IF_SCSI] to 255, -drive
100* if=scsi,index=12 no longer means bus=1,unit=5, but
101* bus=0,unit=12. With an lsi53c895a controller (7 units max),
102* the drive can't be set up. Regression.
103*/
104[IF_IDE] = 2,105[IF_SCSI] = 7,106};107
108/**
109* Boards may call this to offer board-by-board overrides
110* of the default, global values.
111*/
112void override_max_devs(BlockInterfaceType type, int max_devs)113{
114BlockBackend *blk;115DriveInfo *dinfo;116
117GLOBAL_STATE_CODE();118
119if (max_devs <= 0) {120return;121}122
123for (blk = blk_next(NULL); blk; blk = blk_next(blk)) {124dinfo = blk_legacy_dinfo(blk);125if (dinfo->type == type) {126fprintf(stderr, "Cannot override units-per-bus property of"127" the %s interface, because a drive of that type has"128" already been added.\n", if_name[type]);129g_assert_not_reached();130}131}132
133if_max_devs[type] = max_devs;134}
135
136/*
137* We automatically delete the drive when a device using it gets
138* unplugged. Questionable feature, but we can't just drop it.
139* Device models call blockdev_mark_auto_del() to schedule the
140* automatic deletion, and generic qdev code calls blockdev_auto_del()
141* when deletion is actually safe.
142*/
143void blockdev_mark_auto_del(BlockBackend *blk)144{
145DriveInfo *dinfo = blk_legacy_dinfo(blk);146BlockJob *job;147
148GLOBAL_STATE_CODE();149
150if (!dinfo) {151return;152}153
154JOB_LOCK_GUARD();155
156do {157job = block_job_next_locked(NULL);158while (job && (job->job.cancelled ||159job->job.deferred_to_main_loop ||160!block_job_has_bdrv(job, blk_bs(blk))))161{162job = block_job_next_locked(job);163}164if (job) {165/*166* This drops the job lock temporarily and polls, so we need to
167* restart processing the list from the start after this.
168*/
169job_cancel_locked(&job->job, false);170}171} while (job);172
173dinfo->auto_del = 1;174}
175
176void blockdev_auto_del(BlockBackend *blk)177{
178DriveInfo *dinfo = blk_legacy_dinfo(blk);179GLOBAL_STATE_CODE();180
181if (dinfo && dinfo->auto_del) {182monitor_remove_blk(blk);183blk_unref(blk);184}185}
186
187static int drive_index_to_bus_id(BlockInterfaceType type, int index)188{
189int max_devs = if_max_devs[type];190return max_devs ? index / max_devs : 0;191}
192
193static int drive_index_to_unit_id(BlockInterfaceType type, int index)194{
195int max_devs = if_max_devs[type];196return max_devs ? index % max_devs : index;197}
198
199QemuOpts *drive_add(BlockInterfaceType type, int index, const char *file,200const char *optstr)201{
202QemuOpts *opts;203
204GLOBAL_STATE_CODE();205
206opts = qemu_opts_parse_noisily(qemu_find_opts("drive"), optstr, false);207if (!opts) {208return NULL;209}210if (type != IF_DEFAULT) {211qemu_opt_set(opts, "if", if_name[type], &error_abort);212}213if (index >= 0) {214qemu_opt_set_number(opts, "index", index, &error_abort);215}216if (file)217qemu_opt_set(opts, "file", file, &error_abort);218return opts;219}
220
221DriveInfo *drive_get(BlockInterfaceType type, int bus, int unit)222{
223BlockBackend *blk;224DriveInfo *dinfo;225
226GLOBAL_STATE_CODE();227
228for (blk = blk_next(NULL); blk; blk = blk_next(blk)) {229dinfo = blk_legacy_dinfo(blk);230if (dinfo && dinfo->type == type231&& dinfo->bus == bus && dinfo->unit == unit) {232return dinfo;233}234}235
236return NULL;237}
238
239/*
240* Check board claimed all -drive that are meant to be claimed.
241* Fatal error if any remain unclaimed.
242*/
243void drive_check_orphaned(void)244{
245BlockBackend *blk;246DriveInfo *dinfo;247Location loc;248bool orphans = false;249
250GLOBAL_STATE_CODE();251
252for (blk = blk_next(NULL); blk; blk = blk_next(blk)) {253dinfo = blk_legacy_dinfo(blk);254/*255* Ignore default drives, because we create certain default
256* drives unconditionally, then leave them unclaimed. Not the
257* users fault.
258* Ignore IF_VIRTIO or IF_XEN, because it gets desugared into
259* -device, so we can leave failing to -device.
260* Ignore IF_NONE, because leaving unclaimed IF_NONE remains
261* available for device_add is a feature.
262*/
263if (dinfo->is_default || dinfo->type == IF_VIRTIO264|| dinfo->type == IF_XEN || dinfo->type == IF_NONE) {265continue;266}267if (!blk_get_attached_dev(blk)) {268loc_push_none(&loc);269qemu_opts_loc_restore(dinfo->opts);270error_report("machine type does not support"271" if=%s,bus=%d,unit=%d",272if_name[dinfo->type], dinfo->bus, dinfo->unit);273loc_pop(&loc);274orphans = true;275}276}277
278if (orphans) {279exit(1);280}281}
282
283DriveInfo *drive_get_by_index(BlockInterfaceType type, int index)284{
285GLOBAL_STATE_CODE();286return drive_get(type,287drive_index_to_bus_id(type, index),288drive_index_to_unit_id(type, index));289}
290
291int drive_get_max_bus(BlockInterfaceType type)292{
293int max_bus;294BlockBackend *blk;295DriveInfo *dinfo;296
297GLOBAL_STATE_CODE();298
299max_bus = -1;300for (blk = blk_next(NULL); blk; blk = blk_next(blk)) {301dinfo = blk_legacy_dinfo(blk);302if (dinfo && dinfo->type == type && dinfo->bus > max_bus) {303max_bus = dinfo->bus;304}305}306return max_bus;307}
308
/*
 * Callback for bdrv_iterate_format(): print one format @name preceded
 * by a space.  @opaque is not used.
 */
static void bdrv_format_print(void *opaque, const char *name)
{
    qemu_printf(" %s", name);
}
313
314typedef struct {315QEMUBH *bh;316BlockDriverState *bs;317} BDRVPutRefBH;318
319static int parse_block_error_action(const char *buf, bool is_read, Error **errp)320{
321if (!strcmp(buf, "ignore")) {322return BLOCKDEV_ON_ERROR_IGNORE;323} else if (!is_read && !strcmp(buf, "enospc")) {324return BLOCKDEV_ON_ERROR_ENOSPC;325} else if (!strcmp(buf, "stop")) {326return BLOCKDEV_ON_ERROR_STOP;327} else if (!strcmp(buf, "report")) {328return BLOCKDEV_ON_ERROR_REPORT;329} else {330error_setg(errp, "'%s' invalid %s error action",331buf, is_read ? "read" : "write");332return -1;333}334}
335
336static bool parse_stats_intervals(BlockAcctStats *stats, QList *intervals,337Error **errp)338{
339const QListEntry *entry;340for (entry = qlist_first(intervals); entry; entry = qlist_next(entry)) {341switch (qobject_type(entry->value)) {342
343case QTYPE_QSTRING: {344uint64_t length;345const char *str = qstring_get_str(qobject_to(QString,346entry->value));347if (parse_uint_full(str, 10, &length) == 0 &&348length > 0 && length <= UINT_MAX) {349block_acct_add_interval(stats, (unsigned) length);350} else {351error_setg(errp, "Invalid interval length: %s", str);352return false;353}354break;355}356
357case QTYPE_QNUM: {358int64_t length = qnum_get_int(qobject_to(QNum, entry->value));359
360if (length > 0 && length <= UINT_MAX) {361block_acct_add_interval(stats, (unsigned) length);362} else {363error_setg(errp, "Invalid interval length: %" PRId64, length);364return false;365}366break;367}368
369default:370error_setg(errp, "The specification of stats-intervals is invalid");371return false;372}373}374return true;375}
376
/* Media kinds selectable with the "media" drive option. */
typedef enum {
    MEDIA_DISK,
    MEDIA_CDROM,
} DriveMediaType;

379/* All parameters but @opts are optional and may be set to NULL. */
380static void extract_common_blockdev_options(QemuOpts *opts, int *bdrv_flags,381const char **throttling_group, ThrottleConfig *throttle_cfg,382BlockdevDetectZeroesOptions *detect_zeroes, Error **errp)383{
384Error *local_error = NULL;385const char *aio;386
387if (bdrv_flags) {388if (qemu_opt_get_bool(opts, "copy-on-read", false)) {389*bdrv_flags |= BDRV_O_COPY_ON_READ;390}391
392if ((aio = qemu_opt_get(opts, "aio")) != NULL) {393if (bdrv_parse_aio(aio, bdrv_flags) < 0) {394error_setg(errp, "invalid aio option");395return;396}397}398}399
400/* disk I/O throttling */401if (throttling_group) {402*throttling_group = qemu_opt_get(opts, "throttling.group");403}404
405if (throttle_cfg) {406throttle_config_init(throttle_cfg);407throttle_cfg->buckets[THROTTLE_BPS_TOTAL].avg =408qemu_opt_get_number(opts, "throttling.bps-total", 0);409throttle_cfg->buckets[THROTTLE_BPS_READ].avg =410qemu_opt_get_number(opts, "throttling.bps-read", 0);411throttle_cfg->buckets[THROTTLE_BPS_WRITE].avg =412qemu_opt_get_number(opts, "throttling.bps-write", 0);413throttle_cfg->buckets[THROTTLE_OPS_TOTAL].avg =414qemu_opt_get_number(opts, "throttling.iops-total", 0);415throttle_cfg->buckets[THROTTLE_OPS_READ].avg =416qemu_opt_get_number(opts, "throttling.iops-read", 0);417throttle_cfg->buckets[THROTTLE_OPS_WRITE].avg =418qemu_opt_get_number(opts, "throttling.iops-write", 0);419
420throttle_cfg->buckets[THROTTLE_BPS_TOTAL].max =421qemu_opt_get_number(opts, "throttling.bps-total-max", 0);422throttle_cfg->buckets[THROTTLE_BPS_READ].max =423qemu_opt_get_number(opts, "throttling.bps-read-max", 0);424throttle_cfg->buckets[THROTTLE_BPS_WRITE].max =425qemu_opt_get_number(opts, "throttling.bps-write-max", 0);426throttle_cfg->buckets[THROTTLE_OPS_TOTAL].max =427qemu_opt_get_number(opts, "throttling.iops-total-max", 0);428throttle_cfg->buckets[THROTTLE_OPS_READ].max =429qemu_opt_get_number(opts, "throttling.iops-read-max", 0);430throttle_cfg->buckets[THROTTLE_OPS_WRITE].max =431qemu_opt_get_number(opts, "throttling.iops-write-max", 0);432
433throttle_cfg->buckets[THROTTLE_BPS_TOTAL].burst_length =434qemu_opt_get_number(opts, "throttling.bps-total-max-length", 1);435throttle_cfg->buckets[THROTTLE_BPS_READ].burst_length =436qemu_opt_get_number(opts, "throttling.bps-read-max-length", 1);437throttle_cfg->buckets[THROTTLE_BPS_WRITE].burst_length =438qemu_opt_get_number(opts, "throttling.bps-write-max-length", 1);439throttle_cfg->buckets[THROTTLE_OPS_TOTAL].burst_length =440qemu_opt_get_number(opts, "throttling.iops-total-max-length", 1);441throttle_cfg->buckets[THROTTLE_OPS_READ].burst_length =442qemu_opt_get_number(opts, "throttling.iops-read-max-length", 1);443throttle_cfg->buckets[THROTTLE_OPS_WRITE].burst_length =444qemu_opt_get_number(opts, "throttling.iops-write-max-length", 1);445
446throttle_cfg->op_size =447qemu_opt_get_number(opts, "throttling.iops-size", 0);448
449if (!throttle_is_valid(throttle_cfg, errp)) {450return;451}452}453
454if (detect_zeroes) {455*detect_zeroes =456qapi_enum_parse(&BlockdevDetectZeroesOptions_lookup,457qemu_opt_get(opts, "detect-zeroes"),458BLOCKDEV_DETECT_ZEROES_OPTIONS_OFF,459&local_error);460if (local_error) {461error_propagate(errp, local_error);462return;463}464}465}
466
467static OnOffAuto account_get_opt(QemuOpts *opts, const char *name)468{
469if (!qemu_opt_find(opts, name)) {470return ON_OFF_AUTO_AUTO;471}472if (qemu_opt_get_bool(opts, name, true)) {473return ON_OFF_AUTO_ON;474}475return ON_OFF_AUTO_OFF;476}
477
478/* Takes the ownership of bs_opts */
479static BlockBackend *blockdev_init(const char *file, QDict *bs_opts,480Error **errp)481{
482const char *buf;483int bdrv_flags = 0;484int on_read_error, on_write_error;485OnOffAuto account_invalid, account_failed;486bool writethrough, read_only;487BlockBackend *blk;488BlockDriverState *bs;489ThrottleConfig cfg;490int snapshot = 0;491Error *error = NULL;492QemuOpts *opts;493QDict *interval_dict = NULL;494QList *interval_list = NULL;495const char *id;496BlockdevDetectZeroesOptions detect_zeroes =497BLOCKDEV_DETECT_ZEROES_OPTIONS_OFF;498const char *throttling_group = NULL;499
500/* Check common options by copying from bs_opts to opts, all other options501* stay in bs_opts for processing by bdrv_open(). */
502id = qdict_get_try_str(bs_opts, "id");503opts = qemu_opts_create(&qemu_common_drive_opts, id, 1, errp);504if (!opts) {505goto err_no_opts;506}507
508if (!qemu_opts_absorb_qdict(opts, bs_opts, errp)) {509goto early_err;510}511
512if (id) {513qdict_del(bs_opts, "id");514}515
516/* extract parameters */517snapshot = qemu_opt_get_bool(opts, "snapshot", 0);518
519account_invalid = account_get_opt(opts, "stats-account-invalid");520account_failed = account_get_opt(opts, "stats-account-failed");521
522writethrough = !qemu_opt_get_bool(opts, BDRV_OPT_CACHE_WB, true);523
524id = qemu_opts_id(opts);525
526qdict_extract_subqdict(bs_opts, &interval_dict, "stats-intervals.");527qdict_array_split(interval_dict, &interval_list);528
529if (qdict_size(interval_dict) != 0) {530error_setg(errp, "Invalid option stats-intervals.%s",531qdict_first(interval_dict)->key);532goto early_err;533}534
535extract_common_blockdev_options(opts, &bdrv_flags, &throttling_group, &cfg,536&detect_zeroes, &error);537if (error) {538error_propagate(errp, error);539goto early_err;540}541
542if ((buf = qemu_opt_get(opts, "format")) != NULL) {543if (is_help_option(buf)) {544qemu_printf("Supported formats:");545bdrv_iterate_format(bdrv_format_print, NULL, false);546qemu_printf("\nSupported formats (read-only):");547bdrv_iterate_format(bdrv_format_print, NULL, true);548qemu_printf("\n");549goto early_err;550}551
552if (qdict_haskey(bs_opts, "driver")) {553error_setg(errp, "Cannot specify both 'driver' and 'format'");554goto early_err;555}556qdict_put_str(bs_opts, "driver", buf);557}558
559on_write_error = BLOCKDEV_ON_ERROR_ENOSPC;560if ((buf = qemu_opt_get(opts, "werror")) != NULL) {561on_write_error = parse_block_error_action(buf, 0, &error);562if (error) {563error_propagate(errp, error);564goto early_err;565}566}567
568on_read_error = BLOCKDEV_ON_ERROR_REPORT;569if ((buf = qemu_opt_get(opts, "rerror")) != NULL) {570on_read_error = parse_block_error_action(buf, 1, &error);571if (error) {572error_propagate(errp, error);573goto early_err;574}575}576
577if (snapshot) {578bdrv_flags |= BDRV_O_SNAPSHOT;579}580
581read_only = qemu_opt_get_bool(opts, BDRV_OPT_READ_ONLY, false);582
583/* init */584if ((!file || !*file) && !qdict_size(bs_opts)) {585BlockBackendRootState *blk_rs;586
587blk = blk_new(qemu_get_aio_context(), 0, BLK_PERM_ALL);588blk_rs = blk_get_root_state(blk);589blk_rs->open_flags = bdrv_flags | (read_only ? 0 : BDRV_O_RDWR);590blk_rs->detect_zeroes = detect_zeroes;591
592qobject_unref(bs_opts);593} else {594if (file && !*file) {595file = NULL;596}597
598/* bdrv_open() defaults to the values in bdrv_flags (for compatibility599* with other callers) rather than what we want as the real defaults.
600* Apply the defaults here instead. */
601qdict_set_default_str(bs_opts, BDRV_OPT_CACHE_DIRECT, "off");602qdict_set_default_str(bs_opts, BDRV_OPT_CACHE_NO_FLUSH, "off");603qdict_set_default_str(bs_opts, BDRV_OPT_READ_ONLY,604read_only ? "on" : "off");605qdict_set_default_str(bs_opts, BDRV_OPT_AUTO_READ_ONLY, "on");606assert((bdrv_flags & BDRV_O_CACHE_MASK) == 0);607
608if (runstate_check(RUN_STATE_INMIGRATE)) {609bdrv_flags |= BDRV_O_INACTIVE;610}611
612blk = blk_new_open(file, NULL, bs_opts, bdrv_flags, errp);613if (!blk) {614goto err_no_bs_opts;615}616bs = blk_bs(blk);617
618bs->detect_zeroes = detect_zeroes;619
620block_acct_setup(blk_get_stats(blk), account_invalid, account_failed);621
622if (!parse_stats_intervals(blk_get_stats(blk), interval_list, errp)) {623blk_unref(blk);624blk = NULL;625goto err_no_bs_opts;626}627}628
629/* disk I/O throttling */630if (throttle_enabled(&cfg)) {631if (!throttling_group) {632throttling_group = id;633}634blk_io_limits_enable(blk, throttling_group);635blk_set_io_limits(blk, &cfg);636}637
638blk_set_enable_write_cache(blk, !writethrough);639blk_set_on_error(blk, on_read_error, on_write_error);640
641if (!monitor_add_blk(blk, id, errp)) {642blk_unref(blk);643blk = NULL;644goto err_no_bs_opts;645}646
647err_no_bs_opts:648qemu_opts_del(opts);649qobject_unref(interval_dict);650qobject_unref(interval_list);651return blk;652
653early_err:654qemu_opts_del(opts);655qobject_unref(interval_dict);656qobject_unref(interval_list);657err_no_opts:658qobject_unref(bs_opts);659return NULL;660}
661
662/* Takes the ownership of bs_opts */
663BlockDriverState *bds_tree_init(QDict *bs_opts, Error **errp)664{
665int bdrv_flags = 0;666
667GLOBAL_STATE_CODE();668/* bdrv_open() defaults to the values in bdrv_flags (for compatibility669* with other callers) rather than what we want as the real defaults.
670* Apply the defaults here instead. */
671qdict_set_default_str(bs_opts, BDRV_OPT_CACHE_DIRECT, "off");672qdict_set_default_str(bs_opts, BDRV_OPT_CACHE_NO_FLUSH, "off");673qdict_set_default_str(bs_opts, BDRV_OPT_READ_ONLY, "off");674
675if (runstate_check(RUN_STATE_INMIGRATE)) {676bdrv_flags |= BDRV_O_INACTIVE;677}678
679return bdrv_open(NULL, NULL, bs_opts, bdrv_flags, errp);680}
681
682void blockdev_close_all_bdrv_states(void)683{
684BlockDriverState *bs, *next_bs;685
686GLOBAL_STATE_CODE();687QTAILQ_FOREACH_SAFE(bs, &monitor_bdrv_states, monitor_list, next_bs) {688bdrv_unref(bs);689}690}
691
692/* Iterates over the list of monitor-owned BlockDriverStates */
693BlockDriverState *bdrv_next_monitor_owned(BlockDriverState *bs)694{
695GLOBAL_STATE_CODE();696return bs ? QTAILQ_NEXT(bs, monitor_list)697: QTAILQ_FIRST(&monitor_bdrv_states);698}
699
700static bool qemu_opt_rename(QemuOpts *opts, const char *from, const char *to,701Error **errp)702{
703const char *value;704
705value = qemu_opt_get(opts, from);706if (value) {707if (qemu_opt_find(opts, to)) {708error_setg(errp, "'%s' and its alias '%s' can't be used at the "709"same time", to, from);710return false;711}712}713
714/* rename all items in opts */715while ((value = qemu_opt_get(opts, from))) {716qemu_opt_set(opts, to, value, &error_abort);717qemu_opt_unset(opts, from);718}719return true;720}
721
722QemuOptsList qemu_legacy_drive_opts = {723.name = "drive",724.head = QTAILQ_HEAD_INITIALIZER(qemu_legacy_drive_opts.head),725.desc = {726{727.name = "bus",728.type = QEMU_OPT_NUMBER,729.help = "bus number",730},{731.name = "unit",732.type = QEMU_OPT_NUMBER,733.help = "unit number (i.e. lun for scsi)",734},{735.name = "index",736.type = QEMU_OPT_NUMBER,737.help = "index number",738},{739.name = "media",740.type = QEMU_OPT_STRING,741.help = "media type (disk, cdrom)",742},{743.name = "if",744.type = QEMU_OPT_STRING,745.help = "interface (ide, scsi, sd, mtd, floppy, pflash, virtio)",746},{747.name = "file",748.type = QEMU_OPT_STRING,749.help = "file name",750},751
752/* Options that are passed on, but have special semantics with -drive */753{754.name = BDRV_OPT_READ_ONLY,755.type = QEMU_OPT_BOOL,756.help = "open drive file as read-only",757},{758.name = "rerror",759.type = QEMU_OPT_STRING,760.help = "read error action",761},{762.name = "werror",763.type = QEMU_OPT_STRING,764.help = "write error action",765},{766.name = "copy-on-read",767.type = QEMU_OPT_BOOL,768.help = "copy read data from backing file into image file",769},770
771{ /* end of list */ }772},773};774
775DriveInfo *drive_new(QemuOpts *all_opts, BlockInterfaceType block_default_type,776Error **errp)777{
778const char *value;779BlockBackend *blk;780DriveInfo *dinfo = NULL;781QDict *bs_opts;782QemuOpts *legacy_opts;783DriveMediaType media = MEDIA_DISK;784BlockInterfaceType type;785int max_devs, bus_id, unit_id, index;786const char *werror, *rerror;787bool read_only = false;788bool copy_on_read;789const char *filename;790int i;791
792GLOBAL_STATE_CODE();793
794/* Change legacy command line options into QMP ones */795static const struct {796const char *from;797const char *to;798} opt_renames[] = {799{ "iops", "throttling.iops-total" },800{ "iops_rd", "throttling.iops-read" },801{ "iops_wr", "throttling.iops-write" },802
803{ "bps", "throttling.bps-total" },804{ "bps_rd", "throttling.bps-read" },805{ "bps_wr", "throttling.bps-write" },806
807{ "iops_max", "throttling.iops-total-max" },808{ "iops_rd_max", "throttling.iops-read-max" },809{ "iops_wr_max", "throttling.iops-write-max" },810
811{ "bps_max", "throttling.bps-total-max" },812{ "bps_rd_max", "throttling.bps-read-max" },813{ "bps_wr_max", "throttling.bps-write-max" },814
815{ "iops_size", "throttling.iops-size" },816
817{ "group", "throttling.group" },818
819{ "readonly", BDRV_OPT_READ_ONLY },820};821
822for (i = 0; i < ARRAY_SIZE(opt_renames); i++) {823if (!qemu_opt_rename(all_opts, opt_renames[i].from,824opt_renames[i].to, errp)) {825return NULL;826}827}828
829value = qemu_opt_get(all_opts, "cache");830if (value) {831int flags = 0;832bool writethrough;833
834if (bdrv_parse_cache_mode(value, &flags, &writethrough) != 0) {835error_setg(errp, "invalid cache option");836return NULL;837}838
839/* Specific options take precedence */840if (!qemu_opt_get(all_opts, BDRV_OPT_CACHE_WB)) {841qemu_opt_set_bool(all_opts, BDRV_OPT_CACHE_WB,842!writethrough, &error_abort);843}844if (!qemu_opt_get(all_opts, BDRV_OPT_CACHE_DIRECT)) {845qemu_opt_set_bool(all_opts, BDRV_OPT_CACHE_DIRECT,846!!(flags & BDRV_O_NOCACHE), &error_abort);847}848if (!qemu_opt_get(all_opts, BDRV_OPT_CACHE_NO_FLUSH)) {849qemu_opt_set_bool(all_opts, BDRV_OPT_CACHE_NO_FLUSH,850!!(flags & BDRV_O_NO_FLUSH), &error_abort);851}852qemu_opt_unset(all_opts, "cache");853}854
855/* Get a QDict for processing the options */856bs_opts = qdict_new();857qemu_opts_to_qdict(all_opts, bs_opts);858
859legacy_opts = qemu_opts_create(&qemu_legacy_drive_opts, NULL, 0,860&error_abort);861if (!qemu_opts_absorb_qdict(legacy_opts, bs_opts, errp)) {862goto fail;863}864
865/* Media type */866value = qemu_opt_get(legacy_opts, "media");867if (value) {868if (!strcmp(value, "disk")) {869media = MEDIA_DISK;870} else if (!strcmp(value, "cdrom")) {871media = MEDIA_CDROM;872read_only = true;873} else {874error_setg(errp, "'%s' invalid media", value);875goto fail;876}877}878
879/* copy-on-read is disabled with a warning for read-only devices */880read_only |= qemu_opt_get_bool(legacy_opts, BDRV_OPT_READ_ONLY, false);881copy_on_read = qemu_opt_get_bool(legacy_opts, "copy-on-read", false);882
883if (read_only && copy_on_read) {884warn_report("disabling copy-on-read on read-only drive");885copy_on_read = false;886}887
888qdict_put_str(bs_opts, BDRV_OPT_READ_ONLY, read_only ? "on" : "off");889qdict_put_str(bs_opts, "copy-on-read", copy_on_read ? "on" : "off");890
891/* Controller type */892value = qemu_opt_get(legacy_opts, "if");893if (value) {894for (type = 0;895type < IF_COUNT && strcmp(value, if_name[type]);896type++) {897}898if (type == IF_COUNT) {899error_setg(errp, "unsupported bus type '%s'", value);900goto fail;901}902} else {903type = block_default_type;904}905
906/* Device address specified by bus/unit or index.907* If none was specified, try to find the first free one. */
908bus_id = qemu_opt_get_number(legacy_opts, "bus", 0);909unit_id = qemu_opt_get_number(legacy_opts, "unit", -1);910index = qemu_opt_get_number(legacy_opts, "index", -1);911
912max_devs = if_max_devs[type];913
914if (index != -1) {915if (bus_id != 0 || unit_id != -1) {916error_setg(errp, "index cannot be used with bus and unit");917goto fail;918}919bus_id = drive_index_to_bus_id(type, index);920unit_id = drive_index_to_unit_id(type, index);921}922
923if (unit_id == -1) {924unit_id = 0;925while (drive_get(type, bus_id, unit_id) != NULL) {926unit_id++;927if (max_devs && unit_id >= max_devs) {928unit_id -= max_devs;929bus_id++;930}931}932}933
934if (max_devs && unit_id >= max_devs) {935error_setg(errp, "unit %d too big (max is %d)", unit_id, max_devs - 1);936goto fail;937}938
939if (drive_get(type, bus_id, unit_id) != NULL) {940error_setg(errp, "drive with bus=%d, unit=%d (index=%d) exists",941bus_id, unit_id, index);942goto fail;943}944
945/* no id supplied -> create one */946if (qemu_opts_id(all_opts) == NULL) {947char *new_id;948const char *mediastr = "";949if (type == IF_IDE || type == IF_SCSI) {950mediastr = (media == MEDIA_CDROM) ? "-cd" : "-hd";951}952if (max_devs) {953new_id = g_strdup_printf("%s%i%s%i", if_name[type], bus_id,954mediastr, unit_id);955} else {956new_id = g_strdup_printf("%s%s%i", if_name[type],957mediastr, unit_id);958}959qdict_put_str(bs_opts, "id", new_id);960g_free(new_id);961}962
963/* Add virtio block device */964if (type == IF_VIRTIO) {965QemuOpts *devopts;966devopts = qemu_opts_create(qemu_find_opts("device"), NULL, 0,967&error_abort);968qemu_opt_set(devopts, "driver", "virtio-blk", &error_abort);969qemu_opt_set(devopts, "drive", qdict_get_str(bs_opts, "id"),970&error_abort);971} else if (type == IF_XEN) {972QemuOpts *devopts;973devopts = qemu_opts_create(qemu_find_opts("device"), NULL, 0,974&error_abort);975qemu_opt_set(devopts, "driver",976(media == MEDIA_CDROM) ? "xen-cdrom" : "xen-disk",977&error_abort);978qemu_opt_set(devopts, "drive", qdict_get_str(bs_opts, "id"),979&error_abort);980}981
982filename = qemu_opt_get(legacy_opts, "file");983
984/* Check werror/rerror compatibility with if=... */985werror = qemu_opt_get(legacy_opts, "werror");986if (werror != NULL) {987if (type != IF_IDE && type != IF_SCSI && type != IF_VIRTIO &&988type != IF_NONE) {989error_setg(errp, "werror is not supported by this bus type");990goto fail;991}992qdict_put_str(bs_opts, "werror", werror);993}994
995rerror = qemu_opt_get(legacy_opts, "rerror");996if (rerror != NULL) {997if (type != IF_IDE && type != IF_VIRTIO && type != IF_SCSI &&998type != IF_NONE) {999error_setg(errp, "rerror is not supported by this bus type");1000goto fail;1001}1002qdict_put_str(bs_opts, "rerror", rerror);1003}1004
1005/* Actual block device init: Functionality shared with blockdev-add */1006blk = blockdev_init(filename, bs_opts, errp);1007bs_opts = NULL;1008if (!blk) {1009goto fail;1010}1011
1012/* Create legacy DriveInfo */1013dinfo = g_malloc0(sizeof(*dinfo));1014dinfo->opts = all_opts;1015
1016dinfo->type = type;1017dinfo->bus = bus_id;1018dinfo->unit = unit_id;1019
1020blk_set_legacy_dinfo(blk, dinfo);1021
1022switch(type) {1023case IF_IDE:1024case IF_SCSI:1025case IF_XEN:1026case IF_NONE:1027dinfo->media_cd = media == MEDIA_CDROM;1028break;1029default:1030break;1031}1032
1033fail:1034qemu_opts_del(legacy_opts);1035qobject_unref(bs_opts);1036return dinfo;1037}
1038
1039static BlockDriverState *qmp_get_root_bs(const char *name, Error **errp)1040{
1041BlockDriverState *bs;1042
1043GRAPH_RDLOCK_GUARD_MAINLOOP();1044
1045bs = bdrv_lookup_bs(name, name, errp);1046if (bs == NULL) {1047return NULL;1048}1049
1050if (!bdrv_is_root_node(bs)) {1051error_setg(errp, "Need a root block node");1052return NULL;1053}1054
1055if (!bdrv_is_inserted(bs)) {1056error_setg(errp, "Device has no medium");1057bs = NULL;1058}1059
1060return bs;1061}
1062
1063static void blockdev_do_action(TransactionAction *action, Error **errp)1064{
1065TransactionActionList list;1066
1067list.value = action;1068list.next = NULL;1069qmp_transaction(&list, NULL, errp);1070}
1071
1072void qmp_blockdev_snapshot_sync(const char *device, const char *node_name,1073const char *snapshot_file,1074const char *snapshot_node_name,1075const char *format,1076bool has_mode, NewImageMode mode, Error **errp)1077{
1078BlockdevSnapshotSync snapshot = {1079.device = (char *) device,1080.node_name = (char *) node_name,1081.snapshot_file = (char *) snapshot_file,1082.snapshot_node_name = (char *) snapshot_node_name,1083.format = (char *) format,1084.has_mode = has_mode,1085.mode = mode,1086};1087TransactionAction action = {1088.type = TRANSACTION_ACTION_KIND_BLOCKDEV_SNAPSHOT_SYNC,1089.u.blockdev_snapshot_sync.data = &snapshot,1090};1091blockdev_do_action(&action, errp);1092}
1093
1094void qmp_blockdev_snapshot(const char *node, const char *overlay,1095Error **errp)1096{
1097BlockdevSnapshot snapshot_data = {1098.node = (char *) node,1099.overlay = (char *) overlay1100};1101TransactionAction action = {1102.type = TRANSACTION_ACTION_KIND_BLOCKDEV_SNAPSHOT,1103.u.blockdev_snapshot.data = &snapshot_data,1104};1105blockdev_do_action(&action, errp);1106}
1107
1108void qmp_blockdev_snapshot_internal_sync(const char *device,1109const char *name,1110Error **errp)1111{
1112BlockdevSnapshotInternal snapshot = {1113.device = (char *) device,1114.name = (char *) name1115};1116TransactionAction action = {1117.type = TRANSACTION_ACTION_KIND_BLOCKDEV_SNAPSHOT_INTERNAL_SYNC,1118.u.blockdev_snapshot_internal_sync.data = &snapshot,1119};1120blockdev_do_action(&action, errp);1121}
1122
1123SnapshotInfo *qmp_blockdev_snapshot_delete_internal_sync(const char *device,1124const char *id,1125const char *name,1126Error **errp)1127{
1128BlockDriverState *bs;1129QEMUSnapshotInfo sn;1130Error *local_err = NULL;1131SnapshotInfo *info = NULL;1132int ret;1133
1134GLOBAL_STATE_CODE();1135GRAPH_RDLOCK_GUARD_MAINLOOP();1136
1137bs = qmp_get_root_bs(device, errp);1138if (!bs) {1139return NULL;1140}1141
1142if (!id && !name) {1143error_setg(errp, "Name or id must be provided");1144return NULL;1145}1146
1147if (bdrv_op_is_blocked(bs, BLOCK_OP_TYPE_INTERNAL_SNAPSHOT_DELETE, errp)) {1148return NULL;1149}1150
1151ret = bdrv_snapshot_find_by_id_and_name(bs, id, name, &sn, &local_err);1152if (local_err) {1153error_propagate(errp, local_err);1154return NULL;1155}1156if (!ret) {1157error_setg(errp,1158"Snapshot with id '%s' and name '%s' does not exist on "1159"device '%s'",1160STR_OR_NULL(id), STR_OR_NULL(name), device);1161return NULL;1162}1163
1164bdrv_snapshot_delete(bs, id, name, &local_err);1165if (local_err) {1166error_propagate(errp, local_err);1167return NULL;1168}1169
1170info = g_new0(SnapshotInfo, 1);1171info->id = g_strdup(sn.id_str);1172info->name = g_strdup(sn.name);1173info->date_nsec = sn.date_nsec;1174info->date_sec = sn.date_sec;1175info->vm_state_size = sn.vm_state_size;1176info->vm_clock_nsec = sn.vm_clock_nsec % 1000000000;1177info->vm_clock_sec = sn.vm_clock_nsec / 1000000000;1178if (sn.icount != -1ULL) {1179info->icount = sn.icount;1180info->has_icount = true;1181}1182
1183return info;1184}
1185
1186/* internal snapshot private data */
1187typedef struct InternalSnapshotState {1188BlockDriverState *bs;1189QEMUSnapshotInfo sn;1190bool created;1191} InternalSnapshotState;1192
1193static void internal_snapshot_abort(void *opaque);1194static void internal_snapshot_clean(void *opaque);1195TransactionActionDrv internal_snapshot_drv = {1196.abort = internal_snapshot_abort,1197.clean = internal_snapshot_clean,1198};1199
1200static void internal_snapshot_action(BlockdevSnapshotInternal *internal,1201Transaction *tran, Error **errp)1202{
1203Error *local_err = NULL;1204const char *device;1205const char *name;1206BlockDriverState *bs;1207QEMUSnapshotInfo old_sn, *sn;1208bool ret;1209int64_t rt;1210InternalSnapshotState *state = g_new0(InternalSnapshotState, 1);1211int ret1;1212
1213GLOBAL_STATE_CODE();1214GRAPH_RDLOCK_GUARD_MAINLOOP();1215
1216tran_add(tran, &internal_snapshot_drv, state);1217
1218device = internal->device;1219name = internal->name;1220
1221bs = qmp_get_root_bs(device, errp);1222if (!bs) {1223return;1224}1225
1226state->bs = bs;1227
1228/* Paired with .clean() */1229bdrv_drained_begin(bs);1230
1231if (bdrv_op_is_blocked(bs, BLOCK_OP_TYPE_INTERNAL_SNAPSHOT, errp)) {1232return;1233}1234
1235if (bdrv_is_read_only(bs)) {1236error_setg(errp, "Device '%s' is read only", device);1237return;1238}1239
1240if (!bdrv_can_snapshot(bs)) {1241error_setg(errp, "Block format '%s' used by device '%s' "1242"does not support internal snapshots",1243bs->drv->format_name, device);1244return;1245}1246
1247if (!strlen(name)) {1248error_setg(errp, "Name is empty");1249return;1250}1251
1252/* check whether a snapshot with name exist */1253ret = bdrv_snapshot_find_by_id_and_name(bs, NULL, name, &old_sn,1254&local_err);1255if (local_err) {1256error_propagate(errp, local_err);1257return;1258} else if (ret) {1259error_setg(errp,1260"Snapshot with name '%s' already exists on device '%s'",1261name, device);1262return;1263}1264
1265/* 3. take the snapshot */1266sn = &state->sn;1267pstrcpy(sn->name, sizeof(sn->name), name);1268rt = g_get_real_time();1269sn->date_sec = rt / G_USEC_PER_SEC;1270sn->date_nsec = (rt % G_USEC_PER_SEC) * 1000;1271sn->vm_clock_nsec = qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL);1272if (replay_mode != REPLAY_MODE_NONE) {1273sn->icount = replay_get_current_icount();1274} else {1275sn->icount = -1ULL;1276}1277
1278ret1 = bdrv_snapshot_create(bs, sn);1279if (ret1 < 0) {1280error_setg_errno(errp, -ret1,1281"Failed to create snapshot '%s' on device '%s'",1282name, device);1283return;1284}1285
1286/* 4. succeed, mark a snapshot is created */1287state->created = true;1288}
1289
1290static void internal_snapshot_abort(void *opaque)1291{
1292InternalSnapshotState *state = opaque;1293BlockDriverState *bs = state->bs;1294QEMUSnapshotInfo *sn = &state->sn;1295Error *local_error = NULL;1296
1297GLOBAL_STATE_CODE();1298GRAPH_RDLOCK_GUARD_MAINLOOP();1299
1300if (!state->created) {1301return;1302}1303
1304if (bdrv_snapshot_delete(bs, sn->id_str, sn->name, &local_error) < 0) {1305error_reportf_err(local_error,1306"Failed to delete snapshot with id '%s' and "1307"name '%s' on device '%s' in abort: ",1308sn->id_str, sn->name,1309bdrv_get_device_name(bs));1310}1311}
1312
1313static void internal_snapshot_clean(void *opaque)1314{
1315g_autofree InternalSnapshotState *state = opaque;1316
1317if (!state->bs) {1318return;1319}1320
1321bdrv_drained_end(state->bs);1322}
1323
1324/* external snapshot private data */
1325typedef struct ExternalSnapshotState {1326BlockDriverState *old_bs;1327BlockDriverState *new_bs;1328bool overlay_appended;1329} ExternalSnapshotState;1330
1331static void external_snapshot_commit(void *opaque);1332static void external_snapshot_abort(void *opaque);1333static void external_snapshot_clean(void *opaque);1334TransactionActionDrv external_snapshot_drv = {1335.commit = external_snapshot_commit,1336.abort = external_snapshot_abort,1337.clean = external_snapshot_clean,1338};1339
1340static void external_snapshot_action(TransactionAction *action,1341Transaction *tran, Error **errp)1342{
1343int ret;1344int flags = 0;1345QDict *options = NULL;1346Error *local_err = NULL;1347/* Device and node name of the image to generate the snapshot from */1348const char *device;1349const char *node_name;1350/* Reference to the new image (for 'blockdev-snapshot') */1351const char *snapshot_ref;1352/* File name of the new image (for 'blockdev-snapshot-sync') */1353const char *new_image_file;1354ExternalSnapshotState *state = g_new0(ExternalSnapshotState, 1);1355uint64_t perm, shared;1356
1357/* TODO We'll eventually have to take a writer lock in this function */1358GRAPH_RDLOCK_GUARD_MAINLOOP();1359
1360tran_add(tran, &external_snapshot_drv, state);1361
1362/* 'blockdev-snapshot' and 'blockdev-snapshot-sync' have similar1363* purpose but a different set of parameters */
1364switch (action->type) {1365case TRANSACTION_ACTION_KIND_BLOCKDEV_SNAPSHOT:1366{1367BlockdevSnapshot *s = action->u.blockdev_snapshot.data;1368device = s->node;1369node_name = s->node;1370new_image_file = NULL;1371snapshot_ref = s->overlay;1372}1373break;1374case TRANSACTION_ACTION_KIND_BLOCKDEV_SNAPSHOT_SYNC:1375{1376BlockdevSnapshotSync *s = action->u.blockdev_snapshot_sync.data;1377device = s->device;1378node_name = s->node_name;1379new_image_file = s->snapshot_file;1380snapshot_ref = NULL;1381}1382break;1383default:1384g_assert_not_reached();1385}1386
1387/* start processing */1388
1389state->old_bs = bdrv_lookup_bs(device, node_name, errp);1390if (!state->old_bs) {1391return;1392}1393
1394/* Paired with .clean() */1395bdrv_drained_begin(state->old_bs);1396
1397if (!bdrv_is_inserted(state->old_bs)) {1398error_setg(errp, "Device '%s' has no medium",1399bdrv_get_device_or_node_name(state->old_bs));1400return;1401}1402
1403if (bdrv_op_is_blocked(state->old_bs,1404BLOCK_OP_TYPE_EXTERNAL_SNAPSHOT, errp)) {1405return;1406}1407
1408if (!bdrv_is_read_only(state->old_bs)) {1409ret = bdrv_flush(state->old_bs);1410if (ret < 0) {1411error_setg_errno(errp, -ret, "Write to node '%s' failed",1412bdrv_get_device_or_node_name(state->old_bs));1413return;1414}1415}1416
1417if (action->type == TRANSACTION_ACTION_KIND_BLOCKDEV_SNAPSHOT_SYNC) {1418BlockdevSnapshotSync *s = action->u.blockdev_snapshot_sync.data;1419const char *format = s->format ?: "qcow2";1420enum NewImageMode mode;1421const char *snapshot_node_name = s->snapshot_node_name;1422
1423if (node_name && !snapshot_node_name) {1424error_setg(errp, "New overlay node-name missing");1425return;1426}1427
1428if (snapshot_node_name &&1429bdrv_lookup_bs(snapshot_node_name, snapshot_node_name, NULL)) {1430error_setg(errp, "New overlay node-name already in use");1431return;1432}1433
1434flags = state->old_bs->open_flags;1435flags &= ~(BDRV_O_SNAPSHOT | BDRV_O_COPY_ON_READ);1436flags |= BDRV_O_NO_BACKING;1437
1438/* create new image w/backing file */1439mode = s->has_mode ? s->mode : NEW_IMAGE_MODE_ABSOLUTE_PATHS;1440if (mode != NEW_IMAGE_MODE_EXISTING) {1441int64_t size = bdrv_getlength(state->old_bs);1442if (size < 0) {1443error_setg_errno(errp, -size, "bdrv_getlength failed");1444return;1445}1446bdrv_refresh_filename(state->old_bs);1447
1448bdrv_img_create(new_image_file, format,1449state->old_bs->filename,1450state->old_bs->drv->format_name,1451NULL, size, flags, false, &local_err);1452
1453if (local_err) {1454error_propagate(errp, local_err);1455return;1456}1457}1458
1459options = qdict_new();1460if (snapshot_node_name) {1461qdict_put_str(options, "node-name", snapshot_node_name);1462}1463qdict_put_str(options, "driver", format);1464}1465
1466state->new_bs = bdrv_open(new_image_file, snapshot_ref, options, flags,1467errp);1468
1469/* We will manually add the backing_hd field to the bs later */1470if (!state->new_bs) {1471return;1472}1473
1474/*1475* Allow attaching a backing file to an overlay that's already in use only
1476* if the parents don't assume that they are already seeing a valid image.
1477* (Specifically, allow it as a mirror target, which is write-only access.)
1478*/
1479bdrv_get_cumulative_perm(state->new_bs, &perm, &shared);1480if (perm & BLK_PERM_CONSISTENT_READ) {1481error_setg(errp, "The overlay is already in use");1482return;1483}1484
1485if (state->new_bs->drv->is_filter) {1486error_setg(errp, "Filters cannot be used as overlays");1487return;1488}1489
1490if (bdrv_cow_child(state->new_bs)) {1491error_setg(errp, "The overlay already has a backing image");1492return;1493}1494
1495if (!state->new_bs->drv->supports_backing) {1496error_setg(errp, "The overlay does not support backing images");1497return;1498}1499
1500ret = bdrv_append(state->new_bs, state->old_bs, errp);1501if (ret < 0) {1502return;1503}1504state->overlay_appended = true;1505}
1506
1507static void external_snapshot_commit(void *opaque)1508{
1509ExternalSnapshotState *state = opaque;1510
1511/* We don't need (or want) to use the transactional1512* bdrv_reopen_multiple() across all the entries at once, because we
1513* don't want to abort all of them if one of them fails the reopen */
1514if (!qatomic_read(&state->old_bs->copy_on_read)) {1515bdrv_reopen_set_read_only(state->old_bs, true, NULL);1516}1517}
1518
1519static void external_snapshot_abort(void *opaque)1520{
1521ExternalSnapshotState *state = opaque;1522if (state->new_bs) {1523if (state->overlay_appended) {1524AioContext *aio_context;1525AioContext *tmp_context;1526int ret;1527
1528aio_context = bdrv_get_aio_context(state->old_bs);1529
1530bdrv_ref(state->old_bs); /* we can't let bdrv_set_backind_hd()1531close state->old_bs; we need it */
1532bdrv_set_backing_hd(state->new_bs, NULL, &error_abort);1533
1534/*1535* The call to bdrv_set_backing_hd() above returns state->old_bs to
1536* the main AioContext. As we're still going to be using it, return
1537* it to the AioContext it was before.
1538*/
1539tmp_context = bdrv_get_aio_context(state->old_bs);1540if (aio_context != tmp_context) {1541ret = bdrv_try_change_aio_context(state->old_bs,1542aio_context, NULL, NULL);1543assert(ret == 0);1544}1545
1546bdrv_drained_begin(state->new_bs);1547bdrv_graph_wrlock();1548bdrv_replace_node(state->new_bs, state->old_bs, &error_abort);1549bdrv_graph_wrunlock();1550bdrv_drained_end(state->new_bs);1551
1552bdrv_unref(state->old_bs); /* bdrv_replace_node() ref'ed old_bs */1553}1554}1555}
1556
1557static void external_snapshot_clean(void *opaque)1558{
1559g_autofree ExternalSnapshotState *state = opaque;1560
1561if (!state->old_bs) {1562return;1563}1564
1565bdrv_drained_end(state->old_bs);1566bdrv_unref(state->new_bs);1567}
1568
1569typedef struct DriveBackupState {1570BlockDriverState *bs;1571BlockJob *job;1572} DriveBackupState;1573
1574static BlockJob *do_backup_common(BackupCommon *backup,1575BlockDriverState *bs,1576BlockDriverState *target_bs,1577AioContext *aio_context,1578JobTxn *txn, Error **errp);1579
1580static void drive_backup_commit(void *opaque);1581static void drive_backup_abort(void *opaque);1582static void drive_backup_clean(void *opaque);1583TransactionActionDrv drive_backup_drv = {1584.commit = drive_backup_commit,1585.abort = drive_backup_abort,1586.clean = drive_backup_clean,1587};1588
1589static void drive_backup_action(DriveBackup *backup,1590JobTxn *block_job_txn,1591Transaction *tran, Error **errp)1592{
1593DriveBackupState *state = g_new0(DriveBackupState, 1);1594BlockDriverState *bs;1595BlockDriverState *target_bs;1596BlockDriverState *source = NULL;1597AioContext *aio_context;1598const char *format;1599QDict *options;1600Error *local_err = NULL;1601int flags;1602int64_t size;1603bool set_backing_hd = false;1604int ret;1605
1606GLOBAL_STATE_CODE();1607
1608tran_add(tran, &drive_backup_drv, state);1609
1610if (!backup->has_mode) {1611backup->mode = NEW_IMAGE_MODE_ABSOLUTE_PATHS;1612}1613
1614bs = bdrv_lookup_bs(backup->device, backup->device, errp);1615if (!bs) {1616return;1617}1618
1619if (!bs->drv) {1620error_setg(errp, "Device has no medium");1621return;1622}1623
1624aio_context = bdrv_get_aio_context(bs);1625
1626state->bs = bs;1627/* Paired with .clean() */1628bdrv_drained_begin(bs);1629
1630format = backup->format;1631if (!format && backup->mode != NEW_IMAGE_MODE_EXISTING) {1632format = bs->drv->format_name;1633}1634
1635/* Early check to avoid creating target */1636bdrv_graph_rdlock_main_loop();1637if (bdrv_op_is_blocked(bs, BLOCK_OP_TYPE_BACKUP_SOURCE, errp)) {1638bdrv_graph_rdunlock_main_loop();1639return;1640}1641
1642flags = bs->open_flags | BDRV_O_RDWR;1643
1644/*1645* See if we have a backing HD we can use to create our new image
1646* on top of.
1647*/
1648if (backup->sync == MIRROR_SYNC_MODE_TOP) {1649/*1650* Backup will not replace the source by the target, so none
1651* of the filters skipped here will be removed (in contrast to
1652* mirror). Therefore, we can skip all of them when looking
1653* for the first COW relationship.
1654*/
1655source = bdrv_cow_bs(bdrv_skip_filters(bs));1656if (!source) {1657backup->sync = MIRROR_SYNC_MODE_FULL;1658}1659}1660if (backup->sync == MIRROR_SYNC_MODE_NONE) {1661source = bs;1662flags |= BDRV_O_NO_BACKING;1663set_backing_hd = true;1664}1665bdrv_graph_rdunlock_main_loop();1666
1667size = bdrv_getlength(bs);1668if (size < 0) {1669error_setg_errno(errp, -size, "bdrv_getlength failed");1670return;1671}1672
1673if (backup->mode != NEW_IMAGE_MODE_EXISTING) {1674assert(format);1675if (source) {1676/* Implicit filters should not appear in the filename */1677BlockDriverState *explicit_backing;1678
1679bdrv_graph_rdlock_main_loop();1680explicit_backing = bdrv_skip_implicit_filters(source);1681bdrv_refresh_filename(explicit_backing);1682bdrv_graph_rdunlock_main_loop();1683
1684bdrv_img_create(backup->target, format,1685explicit_backing->filename,1686explicit_backing->drv->format_name, NULL,1687size, flags, false, &local_err);1688} else {1689bdrv_img_create(backup->target, format, NULL, NULL, NULL,1690size, flags, false, &local_err);1691}1692}1693
1694if (local_err) {1695error_propagate(errp, local_err);1696return;1697}1698
1699options = qdict_new();1700qdict_put_str(options, "discard", "unmap");1701qdict_put_str(options, "detect-zeroes", "unmap");1702if (format) {1703qdict_put_str(options, "driver", format);1704}1705
1706target_bs = bdrv_open(backup->target, NULL, options, flags, errp);1707if (!target_bs) {1708return;1709}1710
1711ret = bdrv_try_change_aio_context(target_bs, aio_context, NULL, errp);1712if (ret < 0) {1713bdrv_unref(target_bs);1714return;1715}1716
1717if (set_backing_hd) {1718if (bdrv_set_backing_hd(target_bs, source, errp) < 0) {1719goto unref;1720}1721}1722
1723state->job = do_backup_common(qapi_DriveBackup_base(backup),1724bs, target_bs, aio_context,1725block_job_txn, errp);1726
1727unref:1728bdrv_unref(target_bs);1729}
1730
1731static void drive_backup_commit(void *opaque)1732{
1733DriveBackupState *state = opaque;1734
1735assert(state->job);1736job_start(&state->job->job);1737}
1738
1739static void drive_backup_abort(void *opaque)1740{
1741DriveBackupState *state = opaque;1742
1743if (state->job) {1744job_cancel_sync(&state->job->job, true);1745}1746}
1747
1748static void drive_backup_clean(void *opaque)1749{
1750g_autofree DriveBackupState *state = opaque;1751
1752if (!state->bs) {1753return;1754}1755
1756bdrv_drained_end(state->bs);1757}
1758
1759typedef struct BlockdevBackupState {1760BlockDriverState *bs;1761BlockJob *job;1762} BlockdevBackupState;1763
1764static void blockdev_backup_commit(void *opaque);1765static void blockdev_backup_abort(void *opaque);1766static void blockdev_backup_clean(void *opaque);1767TransactionActionDrv blockdev_backup_drv = {1768.commit = blockdev_backup_commit,1769.abort = blockdev_backup_abort,1770.clean = blockdev_backup_clean,1771};1772
1773static void blockdev_backup_action(BlockdevBackup *backup,1774JobTxn *block_job_txn,1775Transaction *tran, Error **errp)1776{
1777BlockdevBackupState *state = g_new0(BlockdevBackupState, 1);1778BlockDriverState *bs;1779BlockDriverState *target_bs;1780AioContext *aio_context;1781int ret;1782
1783tran_add(tran, &blockdev_backup_drv, state);1784
1785bs = bdrv_lookup_bs(backup->device, backup->device, errp);1786if (!bs) {1787return;1788}1789
1790target_bs = bdrv_lookup_bs(backup->target, backup->target, errp);1791if (!target_bs) {1792return;1793}1794
1795/* Honor bdrv_try_change_aio_context() context acquisition requirements. */1796aio_context = bdrv_get_aio_context(bs);1797
1798ret = bdrv_try_change_aio_context(target_bs, aio_context, NULL, errp);1799if (ret < 0) {1800return;1801}1802
1803state->bs = bs;1804
1805/* Paired with .clean() */1806bdrv_drained_begin(state->bs);1807
1808state->job = do_backup_common(qapi_BlockdevBackup_base(backup),1809bs, target_bs, aio_context,1810block_job_txn, errp);1811}
1812
1813static void blockdev_backup_commit(void *opaque)1814{
1815BlockdevBackupState *state = opaque;1816
1817assert(state->job);1818job_start(&state->job->job);1819}
1820
1821static void blockdev_backup_abort(void *opaque)1822{
1823BlockdevBackupState *state = opaque;1824
1825if (state->job) {1826job_cancel_sync(&state->job->job, true);1827}1828}
1829
1830static void blockdev_backup_clean(void *opaque)1831{
1832g_autofree BlockdevBackupState *state = opaque;1833
1834if (!state->bs) {1835return;1836}1837
1838bdrv_drained_end(state->bs);1839}
1840
1841typedef struct BlockDirtyBitmapState {1842BdrvDirtyBitmap *bitmap;1843BlockDriverState *bs;1844HBitmap *backup;1845bool was_enabled;1846} BlockDirtyBitmapState;1847
1848static void block_dirty_bitmap_add_abort(void *opaque);1849TransactionActionDrv block_dirty_bitmap_add_drv = {1850.abort = block_dirty_bitmap_add_abort,1851.clean = g_free,1852};1853
1854static void block_dirty_bitmap_add_action(BlockDirtyBitmapAdd *action,1855Transaction *tran, Error **errp)1856{
1857Error *local_err = NULL;1858BlockDirtyBitmapState *state = g_new0(BlockDirtyBitmapState, 1);1859
1860tran_add(tran, &block_dirty_bitmap_add_drv, state);1861
1862/* AIO context taken and released within qmp_block_dirty_bitmap_add */1863qmp_block_dirty_bitmap_add(action->node, action->name,1864action->has_granularity, action->granularity,1865action->has_persistent, action->persistent,1866action->has_disabled, action->disabled,1867&local_err);1868
1869if (!local_err) {1870state->bitmap = block_dirty_bitmap_lookup(action->node, action->name,1871NULL, &error_abort);1872} else {1873error_propagate(errp, local_err);1874}1875}
1876
1877static void block_dirty_bitmap_add_abort(void *opaque)1878{
1879BlockDirtyBitmapState *state = opaque;1880
1881if (state->bitmap) {1882bdrv_release_dirty_bitmap(state->bitmap);1883}1884}
1885
1886static void block_dirty_bitmap_restore(void *opaque);1887static void block_dirty_bitmap_free_backup(void *opaque);1888TransactionActionDrv block_dirty_bitmap_clear_drv = {1889.abort = block_dirty_bitmap_restore,1890.commit = block_dirty_bitmap_free_backup,1891.clean = g_free,1892};1893
1894static void block_dirty_bitmap_clear_action(BlockDirtyBitmap *action,1895Transaction *tran, Error **errp)1896{
1897BlockDirtyBitmapState *state = g_new0(BlockDirtyBitmapState, 1);1898
1899tran_add(tran, &block_dirty_bitmap_clear_drv, state);1900
1901state->bitmap = block_dirty_bitmap_lookup(action->node,1902action->name,1903&state->bs,1904errp);1905if (!state->bitmap) {1906return;1907}1908
1909if (bdrv_dirty_bitmap_check(state->bitmap, BDRV_BITMAP_DEFAULT, errp)) {1910return;1911}1912
1913bdrv_clear_dirty_bitmap(state->bitmap, &state->backup);1914}
1915
1916static void block_dirty_bitmap_restore(void *opaque)1917{
1918BlockDirtyBitmapState *state = opaque;1919
1920if (state->backup) {1921bdrv_restore_dirty_bitmap(state->bitmap, state->backup);1922}1923}
1924
1925static void block_dirty_bitmap_free_backup(void *opaque)1926{
1927BlockDirtyBitmapState *state = opaque;1928
1929hbitmap_free(state->backup);1930}
1931
1932static void block_dirty_bitmap_enable_abort(void *opaque);1933TransactionActionDrv block_dirty_bitmap_enable_drv = {1934.abort = block_dirty_bitmap_enable_abort,1935.clean = g_free,1936};1937
1938static void block_dirty_bitmap_enable_action(BlockDirtyBitmap *action,1939Transaction *tran, Error **errp)1940{
1941BlockDirtyBitmapState *state = g_new0(BlockDirtyBitmapState, 1);1942
1943tran_add(tran, &block_dirty_bitmap_enable_drv, state);1944
1945state->bitmap = block_dirty_bitmap_lookup(action->node,1946action->name,1947NULL,1948errp);1949if (!state->bitmap) {1950return;1951}1952
1953if (bdrv_dirty_bitmap_check(state->bitmap, BDRV_BITMAP_ALLOW_RO, errp)) {1954return;1955}1956
1957state->was_enabled = bdrv_dirty_bitmap_enabled(state->bitmap);1958bdrv_enable_dirty_bitmap(state->bitmap);1959}
1960
1961static void block_dirty_bitmap_enable_abort(void *opaque)1962{
1963BlockDirtyBitmapState *state = opaque;1964
1965if (!state->was_enabled) {1966bdrv_disable_dirty_bitmap(state->bitmap);1967}1968}
1969
1970static void block_dirty_bitmap_disable_abort(void *opaque);1971TransactionActionDrv block_dirty_bitmap_disable_drv = {1972.abort = block_dirty_bitmap_disable_abort,1973.clean = g_free,1974};1975
1976static void block_dirty_bitmap_disable_action(BlockDirtyBitmap *action,1977Transaction *tran, Error **errp)1978{
1979BlockDirtyBitmapState *state = g_new0(BlockDirtyBitmapState, 1);1980
1981tran_add(tran, &block_dirty_bitmap_disable_drv, state);1982
1983state->bitmap = block_dirty_bitmap_lookup(action->node,1984action->name,1985NULL,1986errp);1987if (!state->bitmap) {1988return;1989}1990
1991if (bdrv_dirty_bitmap_check(state->bitmap, BDRV_BITMAP_ALLOW_RO, errp)) {1992return;1993}1994
1995state->was_enabled = bdrv_dirty_bitmap_enabled(state->bitmap);1996bdrv_disable_dirty_bitmap(state->bitmap);1997}
1998
1999static void block_dirty_bitmap_disable_abort(void *opaque)2000{
2001BlockDirtyBitmapState *state = opaque;2002
2003if (state->was_enabled) {2004bdrv_enable_dirty_bitmap(state->bitmap);2005}2006}
2007
2008TransactionActionDrv block_dirty_bitmap_merge_drv = {2009.commit = block_dirty_bitmap_free_backup,2010.abort = block_dirty_bitmap_restore,2011.clean = g_free,2012};2013
2014static void block_dirty_bitmap_merge_action(BlockDirtyBitmapMerge *action,2015Transaction *tran, Error **errp)2016{
2017BlockDirtyBitmapState *state = g_new0(BlockDirtyBitmapState, 1);2018
2019tran_add(tran, &block_dirty_bitmap_merge_drv, state);2020
2021state->bitmap = block_dirty_bitmap_merge(action->node, action->target,2022action->bitmaps, &state->backup,2023errp);2024}
2025
2026static void block_dirty_bitmap_remove_commit(void *opaque);2027static void block_dirty_bitmap_remove_abort(void *opaque);2028TransactionActionDrv block_dirty_bitmap_remove_drv = {2029.commit = block_dirty_bitmap_remove_commit,2030.abort = block_dirty_bitmap_remove_abort,2031.clean = g_free,2032};2033
2034static void block_dirty_bitmap_remove_action(BlockDirtyBitmap *action,2035Transaction *tran, Error **errp)2036{
2037BlockDirtyBitmapState *state = g_new0(BlockDirtyBitmapState, 1);2038
2039tran_add(tran, &block_dirty_bitmap_remove_drv, state);2040
2041
2042state->bitmap = block_dirty_bitmap_remove(action->node, action->name,2043false, &state->bs, errp);2044if (state->bitmap) {2045bdrv_dirty_bitmap_skip_store(state->bitmap, true);2046bdrv_dirty_bitmap_set_busy(state->bitmap, true);2047}2048}
2049
2050static void block_dirty_bitmap_remove_abort(void *opaque)2051{
2052BlockDirtyBitmapState *state = opaque;2053
2054if (state->bitmap) {2055bdrv_dirty_bitmap_skip_store(state->bitmap, false);2056bdrv_dirty_bitmap_set_busy(state->bitmap, false);2057}2058}
2059
2060static void block_dirty_bitmap_remove_commit(void *opaque)2061{
2062BlockDirtyBitmapState *state = opaque;2063
2064bdrv_dirty_bitmap_set_busy(state->bitmap, false);2065bdrv_release_dirty_bitmap(state->bitmap);2066}
2067
2068static void abort_commit(void *opaque);2069TransactionActionDrv abort_drv = {2070.commit = abort_commit,2071};2072
2073static void abort_action(Transaction *tran, Error **errp)2074{
2075tran_add(tran, &abort_drv, NULL);2076error_setg(errp, "Transaction aborted using Abort action");2077}
2078
/* Commit callback for the 'abort' action; must never be reached. */
static void abort_commit(void *opaque)
{
    g_assert_not_reached(); /* this action never succeeds */
}
2083
2084static void transaction_action(TransactionAction *act, JobTxn *block_job_txn,2085Transaction *tran, Error **errp)2086{
2087switch (act->type) {2088case TRANSACTION_ACTION_KIND_BLOCKDEV_SNAPSHOT:2089case TRANSACTION_ACTION_KIND_BLOCKDEV_SNAPSHOT_SYNC:2090external_snapshot_action(act, tran, errp);2091return;2092case TRANSACTION_ACTION_KIND_DRIVE_BACKUP:2093drive_backup_action(act->u.drive_backup.data,2094block_job_txn, tran, errp);2095return;2096case TRANSACTION_ACTION_KIND_BLOCKDEV_BACKUP:2097blockdev_backup_action(act->u.blockdev_backup.data,2098block_job_txn, tran, errp);2099return;2100case TRANSACTION_ACTION_KIND_ABORT:2101abort_action(tran, errp);2102return;2103case TRANSACTION_ACTION_KIND_BLOCKDEV_SNAPSHOT_INTERNAL_SYNC:2104internal_snapshot_action(act->u.blockdev_snapshot_internal_sync.data,2105tran, errp);2106return;2107case TRANSACTION_ACTION_KIND_BLOCK_DIRTY_BITMAP_ADD:2108block_dirty_bitmap_add_action(act->u.block_dirty_bitmap_add.data,2109tran, errp);2110return;2111case TRANSACTION_ACTION_KIND_BLOCK_DIRTY_BITMAP_CLEAR:2112block_dirty_bitmap_clear_action(act->u.block_dirty_bitmap_clear.data,2113tran, errp);2114return;2115case TRANSACTION_ACTION_KIND_BLOCK_DIRTY_BITMAP_ENABLE:2116block_dirty_bitmap_enable_action(act->u.block_dirty_bitmap_enable.data,2117tran, errp);2118return;2119case TRANSACTION_ACTION_KIND_BLOCK_DIRTY_BITMAP_DISABLE:2120block_dirty_bitmap_disable_action(2121act->u.block_dirty_bitmap_disable.data, tran, errp);2122return;2123case TRANSACTION_ACTION_KIND_BLOCK_DIRTY_BITMAP_MERGE:2124block_dirty_bitmap_merge_action(act->u.block_dirty_bitmap_merge.data,2125tran, errp);2126return;2127case TRANSACTION_ACTION_KIND_BLOCK_DIRTY_BITMAP_REMOVE:2128block_dirty_bitmap_remove_action(act->u.block_dirty_bitmap_remove.data,2129tran, errp);2130return;2131/*2132* Where are transactions for MIRROR, COMMIT and STREAM?
2133* Although these blockjobs use transaction callbacks like the backup job,
2134* these jobs do not necessarily adhere to transaction semantics.
2135* These jobs may not fully undo all of their actions on abort, nor do they
2136* necessarily work in transactions with more than one job in them.
2137*/
2138case TRANSACTION_ACTION_KIND__MAX:2139default:2140g_assert_not_reached();2141};2142}
2143
2144
2145/*
2146* 'Atomic' group operations. The operations are performed as a set, and if
2147* any fail then we roll back all operations in the group.
2148*
2149* Always run under BQL.
2150*/
2151void qmp_transaction(TransactionActionList *actions,2152struct TransactionProperties *properties,2153Error **errp)2154{
2155TransactionActionList *act;2156JobTxn *block_job_txn = NULL;2157Error *local_err = NULL;2158Transaction *tran;2159ActionCompletionMode comp_mode =2160properties ? properties->completion_mode :2161ACTION_COMPLETION_MODE_INDIVIDUAL;2162
2163GLOBAL_STATE_CODE();2164
2165/* Does this transaction get canceled as a group on failure?2166* If not, we don't really need to make a JobTxn.
2167*/
2168if (comp_mode != ACTION_COMPLETION_MODE_INDIVIDUAL) {2169for (act = actions; act; act = act->next) {2170TransactionActionKind type = act->value->type;2171
2172if (type != TRANSACTION_ACTION_KIND_BLOCKDEV_BACKUP &&2173type != TRANSACTION_ACTION_KIND_DRIVE_BACKUP)2174{2175error_setg(errp,2176"Action '%s' does not support transaction property "2177"completion-mode = %s",2178TransactionActionKind_str(type),2179ActionCompletionMode_str(comp_mode));2180return;2181}2182}2183
2184block_job_txn = job_txn_new();2185}2186
2187/* drain all i/o before any operations */2188bdrv_drain_all();2189
2190tran = tran_new();2191
2192/* We don't do anything in this loop that commits us to the operations */2193for (act = actions; act; act = act->next) {2194transaction_action(act->value, block_job_txn, tran, &local_err);2195if (local_err) {2196error_propagate(errp, local_err);2197goto delete_and_fail;2198}2199}2200
2201tran_commit(tran);2202
2203/* success */2204goto exit;2205
2206delete_and_fail:2207/* failure, and it is all-or-none; roll back all operations */2208tran_abort(tran);2209exit:2210job_txn_unref(block_job_txn);2211}
2212
2213BlockDirtyBitmapSha256 *qmp_x_debug_block_dirty_bitmap_sha256(const char *node,2214const char *name,2215Error **errp)2216{
2217BdrvDirtyBitmap *bitmap;2218BlockDriverState *bs;2219BlockDirtyBitmapSha256 *ret = NULL;2220char *sha256;2221
2222bitmap = block_dirty_bitmap_lookup(node, name, &bs, errp);2223if (!bitmap || !bs) {2224return NULL;2225}2226
2227sha256 = bdrv_dirty_bitmap_sha256(bitmap, errp);2228if (sha256 == NULL) {2229return NULL;2230}2231
2232ret = g_new(BlockDirtyBitmapSha256, 1);2233ret->sha256 = sha256;2234
2235return ret;2236}
2237
2238void coroutine_fn qmp_block_resize(const char *device, const char *node_name,2239int64_t size, Error **errp)2240{
2241Error *local_err = NULL;2242BlockBackend *blk;2243BlockDriverState *bs;2244AioContext *old_ctx;2245
2246bs = bdrv_lookup_bs(device, node_name, &local_err);2247if (local_err) {2248error_propagate(errp, local_err);2249return;2250}2251
2252if (size < 0) {2253error_setg(errp, QERR_INVALID_PARAMETER_VALUE, "size", "a >0 size");2254return;2255}2256
2257bdrv_graph_co_rdlock();2258if (bdrv_op_is_blocked(bs, BLOCK_OP_TYPE_RESIZE, errp)) {2259bdrv_graph_co_rdunlock();2260return;2261}2262bdrv_graph_co_rdunlock();2263
2264blk = blk_co_new_with_bs(bs, BLK_PERM_RESIZE, BLK_PERM_ALL, errp);2265if (!blk) {2266return;2267}2268
2269bdrv_drained_begin(bs);2270
2271old_ctx = bdrv_co_enter(bs);2272blk_co_truncate(blk, size, false, PREALLOC_MODE_OFF, 0, errp);2273bdrv_co_leave(bs, old_ctx);2274
2275bdrv_drained_end(bs);2276blk_co_unref(blk);2277}
2278
2279void qmp_block_stream(const char *job_id, const char *device,2280const char *base,2281const char *base_node,2282const char *backing_file,2283bool has_backing_mask_protocol,2284bool backing_mask_protocol,2285const char *bottom,2286bool has_speed, int64_t speed,2287bool has_on_error, BlockdevOnError on_error,2288const char *filter_node_name,2289bool has_auto_finalize, bool auto_finalize,2290bool has_auto_dismiss, bool auto_dismiss,2291Error **errp)2292{
2293BlockDriverState *bs, *iter, *iter_end;2294BlockDriverState *base_bs = NULL;2295BlockDriverState *bottom_bs = NULL;2296AioContext *aio_context;2297Error *local_err = NULL;2298int job_flags = JOB_DEFAULT;2299
2300GLOBAL_STATE_CODE();2301
2302if (base && base_node) {2303error_setg(errp, "'base' and 'base-node' cannot be specified "2304"at the same time");2305return;2306}2307
2308if (base && bottom) {2309error_setg(errp, "'base' and 'bottom' cannot be specified "2310"at the same time");2311return;2312}2313
2314if (bottom && base_node) {2315error_setg(errp, "'bottom' and 'base-node' cannot be specified "2316"at the same time");2317return;2318}2319
2320if (!has_backing_mask_protocol) {2321backing_mask_protocol = false;2322}2323
2324if (!has_on_error) {2325on_error = BLOCKDEV_ON_ERROR_REPORT;2326}2327
2328bs = bdrv_lookup_bs(device, device, errp);2329if (!bs) {2330return;2331}2332
2333aio_context = bdrv_get_aio_context(bs);2334
2335bdrv_graph_rdlock_main_loop();2336if (base) {2337base_bs = bdrv_find_backing_image(bs, base);2338if (base_bs == NULL) {2339error_setg(errp, "Can't find '%s' in the backing chain", base);2340goto out_rdlock;2341}2342assert(bdrv_get_aio_context(base_bs) == aio_context);2343}2344
2345if (base_node) {2346base_bs = bdrv_lookup_bs(NULL, base_node, errp);2347if (!base_bs) {2348goto out_rdlock;2349}2350if (bs == base_bs || !bdrv_chain_contains(bs, base_bs)) {2351error_setg(errp, "Node '%s' is not a backing image of '%s'",2352base_node, device);2353goto out_rdlock;2354}2355assert(bdrv_get_aio_context(base_bs) == aio_context);2356
2357bdrv_refresh_filename(base_bs);2358}2359
2360if (bottom) {2361bottom_bs = bdrv_lookup_bs(NULL, bottom, errp);2362if (!bottom_bs) {2363goto out_rdlock;2364}2365if (!bottom_bs->drv) {2366error_setg(errp, "Node '%s' is not open", bottom);2367goto out_rdlock;2368}2369if (bottom_bs->drv->is_filter) {2370error_setg(errp, "Node '%s' is a filter, use a non-filter node "2371"as 'bottom'", bottom);2372goto out_rdlock;2373}2374if (!bdrv_chain_contains(bs, bottom_bs)) {2375error_setg(errp, "Node '%s' is not in a chain starting from '%s'",2376bottom, device);2377goto out_rdlock;2378}2379assert(bdrv_get_aio_context(bottom_bs) == aio_context);2380}2381
2382/*2383* Check for op blockers in the whole chain between bs and base (or bottom)
2384*/
2385iter_end = bottom ? bdrv_filter_or_cow_bs(bottom_bs) : base_bs;2386for (iter = bs; iter && iter != iter_end;2387iter = bdrv_filter_or_cow_bs(iter))2388{2389if (bdrv_op_is_blocked(iter, BLOCK_OP_TYPE_STREAM, errp)) {2390goto out_rdlock;2391}2392}2393bdrv_graph_rdunlock_main_loop();2394
2395/* if we are streaming the entire chain, the result will have no backing2396* file, and specifying one is therefore an error */
2397if (!base_bs && backing_file) {2398error_setg(errp, "backing file specified, but streaming the "2399"entire chain");2400return;2401}2402
2403if (has_auto_finalize && !auto_finalize) {2404job_flags |= JOB_MANUAL_FINALIZE;2405}2406if (has_auto_dismiss && !auto_dismiss) {2407job_flags |= JOB_MANUAL_DISMISS;2408}2409
2410stream_start(job_id, bs, base_bs, backing_file,2411backing_mask_protocol,2412bottom_bs, job_flags, has_speed ? speed : 0, on_error,2413filter_node_name, &local_err);2414if (local_err) {2415error_propagate(errp, local_err);2416return;2417}2418
2419trace_qmp_block_stream(bs);2420return;2421
2422out_rdlock:2423bdrv_graph_rdunlock_main_loop();2424}
2425
2426void qmp_block_commit(const char *job_id, const char *device,2427const char *base_node,2428const char *base,2429const char *top_node,2430const char *top,2431const char *backing_file,2432bool has_backing_mask_protocol,2433bool backing_mask_protocol,2434bool has_speed, int64_t speed,2435bool has_on_error, BlockdevOnError on_error,2436const char *filter_node_name,2437bool has_auto_finalize, bool auto_finalize,2438bool has_auto_dismiss, bool auto_dismiss,2439Error **errp)2440{
2441BlockDriverState *bs;2442BlockDriverState *iter;2443BlockDriverState *base_bs, *top_bs;2444AioContext *aio_context;2445Error *local_err = NULL;2446int job_flags = JOB_DEFAULT;2447uint64_t top_perm, top_shared;2448
2449/* TODO We'll eventually have to take a writer lock in this function */2450GRAPH_RDLOCK_GUARD_MAINLOOP();2451
2452if (!has_speed) {2453speed = 0;2454}2455if (!has_on_error) {2456on_error = BLOCKDEV_ON_ERROR_REPORT;2457}2458if (has_auto_finalize && !auto_finalize) {2459job_flags |= JOB_MANUAL_FINALIZE;2460}2461if (has_auto_dismiss && !auto_dismiss) {2462job_flags |= JOB_MANUAL_DISMISS;2463}2464if (!has_backing_mask_protocol) {2465backing_mask_protocol = false;2466}2467
2468/* Important Note:2469* libvirt relies on the DeviceNotFound error class in order to probe for
2470* live commit feature versions; for this to work, we must make sure to
2471* perform the device lookup before any generic errors that may occur in a
2472* scenario in which all optional arguments are omitted. */
2473bs = qmp_get_root_bs(device, &local_err);2474if (!bs) {2475bs = bdrv_lookup_bs(device, device, NULL);2476if (!bs) {2477error_free(local_err);2478error_set(errp, ERROR_CLASS_DEVICE_NOT_FOUND,2479"Device '%s' not found", device);2480} else {2481error_propagate(errp, local_err);2482}2483return;2484}2485
2486aio_context = bdrv_get_aio_context(bs);2487
2488if (bdrv_op_is_blocked(bs, BLOCK_OP_TYPE_COMMIT_SOURCE, errp)) {2489return;2490}2491
2492/* default top_bs is the active layer */2493top_bs = bs;2494
2495if (top_node && top) {2496error_setg(errp, "'top-node' and 'top' are mutually exclusive");2497return;2498} else if (top_node) {2499top_bs = bdrv_lookup_bs(NULL, top_node, errp);2500if (top_bs == NULL) {2501return;2502}2503if (!bdrv_chain_contains(bs, top_bs)) {2504error_setg(errp, "'%s' is not in this backing file chain",2505top_node);2506return;2507}2508} else if (top) {2509/* This strcmp() is just a shortcut, there is no need to2510* refresh @bs's filename. If it mismatches,
2511* bdrv_find_backing_image() will do the refresh and may still
2512* return @bs. */
2513if (strcmp(bs->filename, top) != 0) {2514top_bs = bdrv_find_backing_image(bs, top);2515}2516}2517
2518if (top_bs == NULL) {2519error_setg(errp, "Top image file %s not found", top ? top : "NULL");2520return;2521}2522
2523assert(bdrv_get_aio_context(top_bs) == aio_context);2524
2525if (base_node && base) {2526error_setg(errp, "'base-node' and 'base' are mutually exclusive");2527return;2528} else if (base_node) {2529base_bs = bdrv_lookup_bs(NULL, base_node, errp);2530if (base_bs == NULL) {2531return;2532}2533if (!bdrv_chain_contains(top_bs, base_bs)) {2534error_setg(errp, "'%s' is not in this backing file chain",2535base_node);2536return;2537}2538} else if (base) {2539base_bs = bdrv_find_backing_image(top_bs, base);2540if (base_bs == NULL) {2541error_setg(errp, "Can't find '%s' in the backing chain", base);2542return;2543}2544} else {2545base_bs = bdrv_find_base(top_bs);2546if (base_bs == NULL) {2547error_setg(errp, "There is no backimg image");2548return;2549}2550}2551
2552assert(bdrv_get_aio_context(base_bs) == aio_context);2553
2554for (iter = top_bs; iter != bdrv_filter_or_cow_bs(base_bs);2555iter = bdrv_filter_or_cow_bs(iter))2556{2557if (bdrv_op_is_blocked(iter, BLOCK_OP_TYPE_COMMIT_TARGET, errp)) {2558return;2559}2560}2561
2562/* Do not allow attempts to commit an image into itself */2563if (top_bs == base_bs) {2564error_setg(errp, "cannot commit an image into itself");2565return;2566}2567
2568/*2569* Active commit is required if and only if someone has taken a
2570* WRITE permission on the top node. Historically, we have always
2571* used active commit for top nodes, so continue that practice
2572* lest we possibly break clients that rely on this behavior, e.g.
2573* to later attach this node to a writing parent.
2574* (Active commit is never really wrong.)
2575*/
2576bdrv_get_cumulative_perm(top_bs, &top_perm, &top_shared);2577if (top_perm & BLK_PERM_WRITE ||2578bdrv_skip_filters(top_bs) == bdrv_skip_filters(bs))2579{2580if (backing_file) {2581if (bdrv_skip_filters(top_bs) == bdrv_skip_filters(bs)) {2582error_setg(errp, "'backing-file' specified,"2583" but 'top' is the active layer");2584} else {2585error_setg(errp, "'backing-file' specified, but 'top' has a "2586"writer on it");2587}2588return;2589}2590if (!job_id) {2591/*2592* Emulate here what block_job_create() does, because it
2593* is possible that @bs != @top_bs (the block job should
2594* be named after @bs, even if @top_bs is the actual
2595* source)
2596*/
2597job_id = bdrv_get_device_name(bs);2598}2599commit_active_start(job_id, top_bs, base_bs, job_flags, speed, on_error,2600filter_node_name, NULL, NULL, false, &local_err);2601} else {2602BlockDriverState *overlay_bs = bdrv_find_overlay(bs, top_bs);2603if (bdrv_op_is_blocked(overlay_bs, BLOCK_OP_TYPE_COMMIT_TARGET, errp)) {2604return;2605}2606commit_start(job_id, bs, base_bs, top_bs, job_flags,2607speed, on_error, backing_file,2608backing_mask_protocol,2609filter_node_name, &local_err);2610}2611if (local_err != NULL) {2612error_propagate(errp, local_err);2613return;2614}2615}
2616
2617/* Common QMP interface for drive-backup and blockdev-backup */
2618static BlockJob *do_backup_common(BackupCommon *backup,2619BlockDriverState *bs,2620BlockDriverState *target_bs,2621AioContext *aio_context,2622JobTxn *txn, Error **errp)2623{
2624BlockJob *job = NULL;2625BdrvDirtyBitmap *bmap = NULL;2626BackupPerf perf = { .max_workers = 64 };2627int job_flags = JOB_DEFAULT;2628
2629if (!backup->has_speed) {2630backup->speed = 0;2631}2632if (!backup->has_on_source_error) {2633backup->on_source_error = BLOCKDEV_ON_ERROR_REPORT;2634}2635if (!backup->has_on_target_error) {2636backup->on_target_error = BLOCKDEV_ON_ERROR_REPORT;2637}2638if (!backup->has_auto_finalize) {2639backup->auto_finalize = true;2640}2641if (!backup->has_auto_dismiss) {2642backup->auto_dismiss = true;2643}2644if (!backup->has_compress) {2645backup->compress = false;2646}2647
2648if (backup->x_perf) {2649if (backup->x_perf->has_use_copy_range) {2650perf.use_copy_range = backup->x_perf->use_copy_range;2651}2652if (backup->x_perf->has_max_workers) {2653perf.max_workers = backup->x_perf->max_workers;2654}2655if (backup->x_perf->has_max_chunk) {2656perf.max_chunk = backup->x_perf->max_chunk;2657}2658}2659
2660if ((backup->sync == MIRROR_SYNC_MODE_BITMAP) ||2661(backup->sync == MIRROR_SYNC_MODE_INCREMENTAL)) {2662/* done before desugaring 'incremental' to print the right message */2663if (!backup->bitmap) {2664error_setg(errp, "must provide a valid bitmap name for "2665"'%s' sync mode", MirrorSyncMode_str(backup->sync));2666return NULL;2667}2668}2669
2670if (backup->sync == MIRROR_SYNC_MODE_INCREMENTAL) {2671if (backup->has_bitmap_mode &&2672backup->bitmap_mode != BITMAP_SYNC_MODE_ON_SUCCESS) {2673error_setg(errp, "Bitmap sync mode must be '%s' "2674"when using sync mode '%s'",2675BitmapSyncMode_str(BITMAP_SYNC_MODE_ON_SUCCESS),2676MirrorSyncMode_str(backup->sync));2677return NULL;2678}2679backup->has_bitmap_mode = true;2680backup->sync = MIRROR_SYNC_MODE_BITMAP;2681backup->bitmap_mode = BITMAP_SYNC_MODE_ON_SUCCESS;2682}2683
2684if (backup->bitmap) {2685bmap = bdrv_find_dirty_bitmap(bs, backup->bitmap);2686if (!bmap) {2687error_setg(errp, "Bitmap '%s' could not be found", backup->bitmap);2688return NULL;2689}2690if (!backup->has_bitmap_mode) {2691error_setg(errp, "Bitmap sync mode must be given "2692"when providing a bitmap");2693return NULL;2694}2695if (bdrv_dirty_bitmap_check(bmap, BDRV_BITMAP_ALLOW_RO, errp)) {2696return NULL;2697}2698
2699/* This does not produce a useful bitmap artifact: */2700if (backup->sync == MIRROR_SYNC_MODE_NONE) {2701error_setg(errp, "sync mode '%s' does not produce meaningful bitmap"2702" outputs", MirrorSyncMode_str(backup->sync));2703return NULL;2704}2705
2706/* If the bitmap isn't used for input or output, this is useless: */2707if (backup->bitmap_mode == BITMAP_SYNC_MODE_NEVER &&2708backup->sync != MIRROR_SYNC_MODE_BITMAP) {2709error_setg(errp, "Bitmap sync mode '%s' has no meaningful effect"2710" when combined with sync mode '%s'",2711BitmapSyncMode_str(backup->bitmap_mode),2712MirrorSyncMode_str(backup->sync));2713return NULL;2714}2715}2716
2717if (!backup->bitmap && backup->has_bitmap_mode) {2718error_setg(errp, "Cannot specify bitmap sync mode without a bitmap");2719return NULL;2720}2721
2722if (!backup->auto_finalize) {2723job_flags |= JOB_MANUAL_FINALIZE;2724}2725if (!backup->auto_dismiss) {2726job_flags |= JOB_MANUAL_DISMISS;2727}2728
2729job = backup_job_create(backup->job_id, bs, target_bs, backup->speed,2730backup->sync, bmap, backup->bitmap_mode,2731backup->compress, backup->discard_source,2732backup->filter_node_name,2733&perf,2734backup->on_source_error,2735backup->on_target_error,2736job_flags, NULL, NULL, txn, errp);2737return job;2738}
2739
2740void qmp_drive_backup(DriveBackup *backup, Error **errp)2741{
2742TransactionAction action = {2743.type = TRANSACTION_ACTION_KIND_DRIVE_BACKUP,2744.u.drive_backup.data = backup,2745};2746blockdev_do_action(&action, errp);2747}
2748
2749BlockDeviceInfoList *qmp_query_named_block_nodes(bool has_flat,2750bool flat,2751Error **errp)2752{
2753bool return_flat = has_flat && flat;2754
2755return bdrv_named_nodes_list(return_flat, errp);2756}
2757
2758XDbgBlockGraph *qmp_x_debug_query_block_graph(Error **errp)2759{
2760GRAPH_RDLOCK_GUARD_MAINLOOP();2761
2762return bdrv_get_xdbg_block_graph(errp);2763}
2764
2765void qmp_blockdev_backup(BlockdevBackup *backup, Error **errp)2766{
2767TransactionAction action = {2768.type = TRANSACTION_ACTION_KIND_BLOCKDEV_BACKUP,2769.u.blockdev_backup.data = backup,2770};2771blockdev_do_action(&action, errp);2772}
2773
2774/* Parameter check and block job starting for drive mirroring.
2775* Caller should hold @device and @target's aio context (must be the same).
2776**/
2777static void blockdev_mirror_common(const char *job_id, BlockDriverState *bs,2778BlockDriverState *target,2779const char *replaces,2780enum MirrorSyncMode sync,2781BlockMirrorBackingMode backing_mode,2782bool zero_target,2783bool has_speed, int64_t speed,2784bool has_granularity, uint32_t granularity,2785bool has_buf_size, int64_t buf_size,2786bool has_on_source_error,2787BlockdevOnError on_source_error,2788bool has_on_target_error,2789BlockdevOnError on_target_error,2790bool has_unmap, bool unmap,2791const char *filter_node_name,2792bool has_copy_mode, MirrorCopyMode copy_mode,2793bool has_auto_finalize, bool auto_finalize,2794bool has_auto_dismiss, bool auto_dismiss,2795Error **errp)2796{
2797BlockDriverState *unfiltered_bs;2798int job_flags = JOB_DEFAULT;2799
2800GLOBAL_STATE_CODE();2801GRAPH_RDLOCK_GUARD_MAINLOOP();2802
2803if (!has_speed) {2804speed = 0;2805}2806if (!has_on_source_error) {2807on_source_error = BLOCKDEV_ON_ERROR_REPORT;2808}2809if (!has_on_target_error) {2810on_target_error = BLOCKDEV_ON_ERROR_REPORT;2811}2812if (!has_granularity) {2813granularity = 0;2814}2815if (!has_buf_size) {2816buf_size = 0;2817}2818if (!has_unmap) {2819unmap = true;2820}2821if (!has_copy_mode) {2822copy_mode = MIRROR_COPY_MODE_BACKGROUND;2823}2824if (has_auto_finalize && !auto_finalize) {2825job_flags |= JOB_MANUAL_FINALIZE;2826}2827if (has_auto_dismiss && !auto_dismiss) {2828job_flags |= JOB_MANUAL_DISMISS;2829}2830
2831if (granularity != 0 && (granularity < 512 || granularity > 1048576 * 64)) {2832error_setg(errp, QERR_INVALID_PARAMETER_VALUE, "granularity",2833"a value in range [512B, 64MB]");2834return;2835}2836if (granularity & (granularity - 1)) {2837error_setg(errp, QERR_INVALID_PARAMETER_VALUE, "granularity",2838"a power of 2");2839return;2840}2841
2842if (bdrv_op_is_blocked(bs, BLOCK_OP_TYPE_MIRROR_SOURCE, errp)) {2843return;2844}2845if (bdrv_op_is_blocked(target, BLOCK_OP_TYPE_MIRROR_TARGET, errp)) {2846return;2847}2848
2849if (!bdrv_backing_chain_next(bs) && sync == MIRROR_SYNC_MODE_TOP) {2850sync = MIRROR_SYNC_MODE_FULL;2851}2852
2853if (!replaces) {2854/* We want to mirror from @bs, but keep implicit filters on top */2855unfiltered_bs = bdrv_skip_implicit_filters(bs);2856if (unfiltered_bs != bs) {2857replaces = unfiltered_bs->node_name;2858}2859}2860
2861if (replaces) {2862BlockDriverState *to_replace_bs;2863int64_t bs_size, replace_size;2864
2865bs_size = bdrv_getlength(bs);2866if (bs_size < 0) {2867error_setg_errno(errp, -bs_size, "Failed to query device's size");2868return;2869}2870
2871to_replace_bs = check_to_replace_node(bs, replaces, errp);2872if (!to_replace_bs) {2873return;2874}2875
2876replace_size = bdrv_getlength(to_replace_bs);2877
2878if (replace_size < 0) {2879error_setg_errno(errp, -replace_size,2880"Failed to query the replacement node's size");2881return;2882}2883if (bs_size != replace_size) {2884error_setg(errp, "cannot replace image with a mirror image of "2885"different size");2886return;2887}2888}2889
2890/* pass the node name to replace to mirror start since it's loose coupling2891* and will allow to check whether the node still exist at mirror completion
2892*/
2893mirror_start(job_id, bs, target,2894replaces, job_flags,2895speed, granularity, buf_size, sync, backing_mode, zero_target,2896on_source_error, on_target_error, unmap, filter_node_name,2897copy_mode, errp);2898}
2899
2900void qmp_drive_mirror(DriveMirror *arg, Error **errp)2901{
2902BlockDriverState *bs;2903BlockDriverState *target_backing_bs, *target_bs;2904AioContext *aio_context;2905BlockMirrorBackingMode backing_mode;2906Error *local_err = NULL;2907QDict *options = NULL;2908int flags;2909int64_t size;2910const char *format = arg->format;2911bool zero_target;2912int ret;2913
2914bs = qmp_get_root_bs(arg->device, errp);2915if (!bs) {2916return;2917}2918
2919/* Early check to avoid creating target */2920bdrv_graph_rdlock_main_loop();2921if (bdrv_op_is_blocked(bs, BLOCK_OP_TYPE_MIRROR_SOURCE, errp)) {2922bdrv_graph_rdunlock_main_loop();2923return;2924}2925
2926aio_context = bdrv_get_aio_context(bs);2927
2928if (!arg->has_mode) {2929arg->mode = NEW_IMAGE_MODE_ABSOLUTE_PATHS;2930}2931
2932if (!arg->format) {2933format = (arg->mode == NEW_IMAGE_MODE_EXISTING2934? NULL : bs->drv->format_name);2935}2936
2937flags = bs->open_flags | BDRV_O_RDWR;2938target_backing_bs = bdrv_cow_bs(bdrv_skip_filters(bs));2939if (!target_backing_bs && arg->sync == MIRROR_SYNC_MODE_TOP) {2940arg->sync = MIRROR_SYNC_MODE_FULL;2941}2942if (arg->sync == MIRROR_SYNC_MODE_NONE) {2943target_backing_bs = bs;2944}2945bdrv_graph_rdunlock_main_loop();2946
2947size = bdrv_getlength(bs);2948if (size < 0) {2949error_setg_errno(errp, -size, "bdrv_getlength failed");2950return;2951}2952
2953if (arg->replaces) {2954if (!arg->node_name) {2955error_setg(errp, "a node-name must be provided when replacing a"2956" named node of the graph");2957return;2958}2959}2960
2961if (arg->mode == NEW_IMAGE_MODE_ABSOLUTE_PATHS) {2962backing_mode = MIRROR_SOURCE_BACKING_CHAIN;2963} else {2964backing_mode = MIRROR_OPEN_BACKING_CHAIN;2965}2966
2967/* Don't open backing image in create() */2968flags |= BDRV_O_NO_BACKING;2969
2970if ((arg->sync == MIRROR_SYNC_MODE_FULL || !target_backing_bs)2971&& arg->mode != NEW_IMAGE_MODE_EXISTING)2972{2973/* create new image w/o backing file */2974assert(format);2975bdrv_img_create(arg->target, format,2976NULL, NULL, NULL, size, flags, false, &local_err);2977} else {2978BlockDriverState *explicit_backing;2979
2980switch (arg->mode) {2981case NEW_IMAGE_MODE_EXISTING:2982break;2983case NEW_IMAGE_MODE_ABSOLUTE_PATHS:2984/*2985* Create new image with backing file.
2986* Implicit filters should not appear in the filename.
2987*/
2988bdrv_graph_rdlock_main_loop();2989explicit_backing = bdrv_skip_implicit_filters(target_backing_bs);2990bdrv_refresh_filename(explicit_backing);2991bdrv_graph_rdunlock_main_loop();2992
2993bdrv_img_create(arg->target, format,2994explicit_backing->filename,2995explicit_backing->drv->format_name,2996NULL, size, flags, false, &local_err);2997break;2998default:2999abort();3000}3001}3002
3003if (local_err) {3004error_propagate(errp, local_err);3005return;3006}3007
3008options = qdict_new();3009if (arg->node_name) {3010qdict_put_str(options, "node-name", arg->node_name);3011}3012if (format) {3013qdict_put_str(options, "driver", format);3014}3015
3016/* Mirroring takes care of copy-on-write using the source's backing3017* file.
3018*/
3019target_bs = bdrv_open(arg->target, NULL, options, flags, errp);3020if (!target_bs) {3021return;3022}3023
3024bdrv_graph_rdlock_main_loop();3025zero_target = (arg->sync == MIRROR_SYNC_MODE_FULL &&3026(arg->mode == NEW_IMAGE_MODE_EXISTING ||3027!bdrv_has_zero_init(target_bs)));3028bdrv_graph_rdunlock_main_loop();3029
3030
3031ret = bdrv_try_change_aio_context(target_bs, aio_context, NULL, errp);3032if (ret < 0) {3033bdrv_unref(target_bs);3034return;3035}3036
3037blockdev_mirror_common(arg->job_id, bs, target_bs,3038arg->replaces, arg->sync,3039backing_mode, zero_target,3040arg->has_speed, arg->speed,3041arg->has_granularity, arg->granularity,3042arg->has_buf_size, arg->buf_size,3043arg->has_on_source_error, arg->on_source_error,3044arg->has_on_target_error, arg->on_target_error,3045arg->has_unmap, arg->unmap,3046NULL,3047arg->has_copy_mode, arg->copy_mode,3048arg->has_auto_finalize, arg->auto_finalize,3049arg->has_auto_dismiss, arg->auto_dismiss,3050errp);3051bdrv_unref(target_bs);3052}
3053
3054void qmp_blockdev_mirror(const char *job_id,3055const char *device, const char *target,3056const char *replaces,3057MirrorSyncMode sync,3058bool has_speed, int64_t speed,3059bool has_granularity, uint32_t granularity,3060bool has_buf_size, int64_t buf_size,3061bool has_on_source_error,3062BlockdevOnError on_source_error,3063bool has_on_target_error,3064BlockdevOnError on_target_error,3065const char *filter_node_name,3066bool has_copy_mode, MirrorCopyMode copy_mode,3067bool has_auto_finalize, bool auto_finalize,3068bool has_auto_dismiss, bool auto_dismiss,3069Error **errp)3070{
3071BlockDriverState *bs;3072BlockDriverState *target_bs;3073AioContext *aio_context;3074BlockMirrorBackingMode backing_mode = MIRROR_LEAVE_BACKING_CHAIN;3075bool zero_target;3076int ret;3077
3078bs = qmp_get_root_bs(device, errp);3079if (!bs) {3080return;3081}3082
3083target_bs = bdrv_lookup_bs(target, target, errp);3084if (!target_bs) {3085return;3086}3087
3088zero_target = (sync == MIRROR_SYNC_MODE_FULL);3089
3090aio_context = bdrv_get_aio_context(bs);3091
3092ret = bdrv_try_change_aio_context(target_bs, aio_context, NULL, errp);3093if (ret < 0) {3094return;3095}3096
3097blockdev_mirror_common(job_id, bs, target_bs,3098replaces, sync, backing_mode,3099zero_target, has_speed, speed,3100has_granularity, granularity,3101has_buf_size, buf_size,3102has_on_source_error, on_source_error,3103has_on_target_error, on_target_error,3104true, true, filter_node_name,3105has_copy_mode, copy_mode,3106has_auto_finalize, auto_finalize,3107has_auto_dismiss, auto_dismiss,3108errp);3109}
3110
3111/*
3112* Get a block job using its ID. Called with job_mutex held.
3113*/
3114static BlockJob *find_block_job_locked(const char *id, Error **errp)3115{
3116BlockJob *job;3117
3118assert(id != NULL);3119
3120job = block_job_get_locked(id);3121
3122if (!job) {3123error_set(errp, ERROR_CLASS_DEVICE_NOT_ACTIVE,3124"Block job '%s' not found", id);3125return NULL;3126}3127
3128return job;3129}
3130
3131void qmp_block_job_set_speed(const char *device, int64_t speed, Error **errp)3132{
3133BlockJob *job;3134
3135JOB_LOCK_GUARD();3136job = find_block_job_locked(device, errp);3137
3138if (!job) {3139return;3140}3141
3142block_job_set_speed_locked(job, speed, errp);3143}
3144
3145void qmp_block_job_cancel(const char *device,3146bool has_force, bool force, Error **errp)3147{
3148BlockJob *job;3149
3150JOB_LOCK_GUARD();3151job = find_block_job_locked(device, errp);3152
3153if (!job) {3154return;3155}3156
3157if (!has_force) {3158force = false;3159}3160
3161if (job_user_paused_locked(&job->job) && !force) {3162error_setg(errp, "The block job for device '%s' is currently paused",3163device);3164return;3165}3166
3167trace_qmp_block_job_cancel(job);3168job_user_cancel_locked(&job->job, force, errp);3169}
3170
3171void qmp_block_job_pause(const char *device, Error **errp)3172{
3173BlockJob *job;3174
3175JOB_LOCK_GUARD();3176job = find_block_job_locked(device, errp);3177
3178if (!job) {3179return;3180}3181
3182trace_qmp_block_job_pause(job);3183job_user_pause_locked(&job->job, errp);3184}
3185
3186void qmp_block_job_resume(const char *device, Error **errp)3187{
3188BlockJob *job;3189
3190JOB_LOCK_GUARD();3191job = find_block_job_locked(device, errp);3192
3193if (!job) {3194return;3195}3196
3197trace_qmp_block_job_resume(job);3198job_user_resume_locked(&job->job, errp);3199}
3200
3201void qmp_block_job_complete(const char *device, Error **errp)3202{
3203BlockJob *job;3204
3205JOB_LOCK_GUARD();3206job = find_block_job_locked(device, errp);3207
3208if (!job) {3209return;3210}3211
3212trace_qmp_block_job_complete(job);3213job_complete_locked(&job->job, errp);3214}
3215
3216void qmp_block_job_finalize(const char *id, Error **errp)3217{
3218BlockJob *job;3219
3220JOB_LOCK_GUARD();3221job = find_block_job_locked(id, errp);3222
3223if (!job) {3224return;3225}3226
3227trace_qmp_block_job_finalize(job);3228job_ref_locked(&job->job);3229job_finalize_locked(&job->job, errp);3230
3231job_unref_locked(&job->job);3232}
3233
3234void qmp_block_job_dismiss(const char *id, Error **errp)3235{
3236BlockJob *bjob;3237Job *job;3238
3239JOB_LOCK_GUARD();3240bjob = find_block_job_locked(id, errp);3241
3242if (!bjob) {3243return;3244}3245
3246trace_qmp_block_job_dismiss(bjob);3247job = &bjob->job;3248job_dismiss_locked(&job, errp);3249}
3250
3251void qmp_block_job_change(BlockJobChangeOptions *opts, Error **errp)3252{
3253BlockJob *job;3254
3255JOB_LOCK_GUARD();3256job = find_block_job_locked(opts->id, errp);3257
3258if (!job) {3259return;3260}3261
3262block_job_change_locked(job, opts, errp);3263}
3264
3265void qmp_change_backing_file(const char *device,3266const char *image_node_name,3267const char *backing_file,3268Error **errp)3269{
3270BlockDriverState *bs = NULL;3271BlockDriverState *image_bs = NULL;3272Error *local_err = NULL;3273bool ro;3274int ret;3275
3276bs = qmp_get_root_bs(device, errp);3277if (!bs) {3278return;3279}3280
3281bdrv_graph_rdlock_main_loop();3282
3283image_bs = bdrv_lookup_bs(NULL, image_node_name, &local_err);3284if (local_err) {3285error_propagate(errp, local_err);3286goto out_rdlock;3287}3288
3289if (!image_bs) {3290error_setg(errp, "image file not found");3291goto out_rdlock;3292}3293
3294if (bdrv_find_base(image_bs) == image_bs) {3295error_setg(errp, "not allowing backing file change on an image "3296"without a backing file");3297goto out_rdlock;3298}3299
3300/* even though we are not necessarily operating on bs, we need it to3301* determine if block ops are currently prohibited on the chain */
3302if (bdrv_op_is_blocked(bs, BLOCK_OP_TYPE_CHANGE, errp)) {3303goto out_rdlock;3304}3305
3306/* final sanity check */3307if (!bdrv_chain_contains(bs, image_bs)) {3308error_setg(errp, "'%s' and image file are not in the same chain",3309device);3310goto out_rdlock;3311}3312bdrv_graph_rdunlock_main_loop();3313
3314/* if not r/w, reopen to make r/w */3315ro = bdrv_is_read_only(image_bs);3316
3317if (ro) {3318if (bdrv_reopen_set_read_only(image_bs, false, errp) != 0) {3319return;3320}3321}3322
3323ret = bdrv_change_backing_file(image_bs, backing_file,3324image_bs->drv ? image_bs->drv->format_name : "",3325false);3326
3327if (ret < 0) {3328error_setg_errno(errp, -ret, "Could not change backing file to '%s'",3329backing_file);3330/* don't exit here, so we can try to restore open flags if3331* appropriate */
3332}3333
3334if (ro) {3335bdrv_reopen_set_read_only(image_bs, true, errp);3336}3337return;3338
3339out_rdlock:3340bdrv_graph_rdunlock_main_loop();3341}
3342
3343void qmp_blockdev_add(BlockdevOptions *options, Error **errp)3344{
3345BlockDriverState *bs;3346QObject *obj;3347Visitor *v = qobject_output_visitor_new(&obj);3348QDict *qdict;3349
3350visit_type_BlockdevOptions(v, NULL, &options, &error_abort);3351visit_complete(v, &obj);3352qdict = qobject_to(QDict, obj);3353
3354qdict_flatten(qdict);3355
3356if (!qdict_get_try_str(qdict, "node-name")) {3357error_setg(errp, "'node-name' must be specified for the root node");3358goto fail;3359}3360
3361bs = bds_tree_init(qdict, errp);3362if (!bs) {3363goto fail;3364}3365
3366bdrv_set_monitor_owned(bs);3367
3368fail:3369visit_free(v);3370}
3371
3372void qmp_blockdev_reopen(BlockdevOptionsList *reopen_list, Error **errp)3373{
3374BlockReopenQueue *queue = NULL;3375
3376/* Add each one of the BDS that we want to reopen to the queue */3377for (; reopen_list != NULL; reopen_list = reopen_list->next) {3378BlockdevOptions *options = reopen_list->value;3379BlockDriverState *bs;3380QObject *obj;3381Visitor *v;3382QDict *qdict;3383
3384/* Check for the selected node name */3385if (!options->node_name) {3386error_setg(errp, "node-name not specified");3387goto fail;3388}3389
3390bs = bdrv_find_node(options->node_name);3391if (!bs) {3392error_setg(errp, "Failed to find node with node-name='%s'",3393options->node_name);3394goto fail;3395}3396
3397/* Put all options in a QDict and flatten it */3398v = qobject_output_visitor_new(&obj);3399visit_type_BlockdevOptions(v, NULL, &options, &error_abort);3400visit_complete(v, &obj);3401visit_free(v);3402
3403qdict = qobject_to(QDict, obj);3404
3405qdict_flatten(qdict);3406
3407queue = bdrv_reopen_queue(queue, bs, qdict, false);3408}3409
3410/* Perform the reopen operation */3411bdrv_reopen_multiple(queue, errp);3412queue = NULL;3413
3414fail:3415bdrv_reopen_queue_free(queue);3416}
3417
3418void qmp_blockdev_del(const char *node_name, Error **errp)3419{
3420BlockDriverState *bs;3421
3422GLOBAL_STATE_CODE();3423GRAPH_RDLOCK_GUARD_MAINLOOP();3424
3425bs = bdrv_find_node(node_name);3426if (!bs) {3427error_setg(errp, "Failed to find node with node-name='%s'", node_name);3428return;3429}3430if (bdrv_has_blk(bs)) {3431error_setg(errp, "Node %s is in use", node_name);3432return;3433}3434
3435if (bdrv_op_is_blocked(bs, BLOCK_OP_TYPE_DRIVE_DEL, errp)) {3436return;3437}3438
3439if (!QTAILQ_IN_USE(bs, monitor_list)) {3440error_setg(errp, "Node %s is not owned by the monitor",3441bs->node_name);3442return;3443}3444
3445if (bs->refcnt > 1) {3446error_setg(errp, "Block device %s is in use",3447bdrv_get_device_or_node_name(bs));3448return;3449}3450
3451QTAILQ_REMOVE(&monitor_bdrv_states, bs, monitor_list);3452bdrv_unref(bs);3453}
3454
3455static BdrvChild * GRAPH_RDLOCK3456bdrv_find_child(BlockDriverState *parent_bs, const char *child_name)3457{
3458BdrvChild *child;3459
3460QLIST_FOREACH(child, &parent_bs->children, next) {3461if (strcmp(child->name, child_name) == 0) {3462return child;3463}3464}3465
3466return NULL;3467}
3468
3469void qmp_x_blockdev_change(const char *parent, const char *child,3470const char *node, Error **errp)3471{
3472BlockDriverState *parent_bs, *new_bs = NULL;3473BdrvChild *p_child;3474
3475bdrv_graph_wrlock();3476
3477parent_bs = bdrv_lookup_bs(parent, parent, errp);3478if (!parent_bs) {3479goto out;3480}3481
3482if (!child == !node) {3483if (child) {3484error_setg(errp, "The parameters child and node are in conflict");3485} else {3486error_setg(errp, "Either child or node must be specified");3487}3488goto out;3489}3490
3491if (child) {3492p_child = bdrv_find_child(parent_bs, child);3493if (!p_child) {3494error_setg(errp, "Node '%s' does not have child '%s'",3495parent, child);3496goto out;3497}3498bdrv_del_child(parent_bs, p_child, errp);3499}3500
3501if (node) {3502new_bs = bdrv_find_node(node);3503if (!new_bs) {3504error_setg(errp, "Node '%s' not found", node);3505goto out;3506}3507bdrv_add_child(parent_bs, new_bs, errp);3508}3509
3510out:3511bdrv_graph_wrunlock();3512}
3513
3514BlockJobInfoList *qmp_query_block_jobs(Error **errp)3515{
3516BlockJobInfoList *head = NULL, **tail = &head;3517BlockJob *job;3518
3519JOB_LOCK_GUARD();3520
3521for (job = block_job_next_locked(NULL); job;3522job = block_job_next_locked(job)) {3523BlockJobInfo *value;3524
3525if (block_job_is_internal(job)) {3526continue;3527}3528value = block_job_query_locked(job, errp);3529if (!value) {3530qapi_free_BlockJobInfoList(head);3531return NULL;3532}3533QAPI_LIST_APPEND(tail, value);3534}3535
3536return head;3537}
3538
3539void qmp_x_blockdev_set_iothread(const char *node_name, StrOrNull *iothread,3540bool has_force, bool force, Error **errp)3541{
3542AioContext *new_context;3543BlockDriverState *bs;3544
3545GRAPH_RDLOCK_GUARD_MAINLOOP();3546
3547bs = bdrv_find_node(node_name);3548if (!bs) {3549error_setg(errp, "Failed to find node with node-name='%s'", node_name);3550return;3551}3552
3553/* Protects against accidents. */3554if (!(has_force && force) && bdrv_has_blk(bs)) {3555error_setg(errp, "Node %s is associated with a BlockBackend and could "3556"be in use (use force=true to override this check)",3557node_name);3558return;3559}3560
3561if (iothread->type == QTYPE_QSTRING) {3562IOThread *obj = iothread_by_id(iothread->u.s);3563if (!obj) {3564error_setg(errp, "Cannot find iothread %s", iothread->u.s);3565return;3566}3567
3568new_context = iothread_get_aio_context(obj);3569} else {3570new_context = qemu_get_aio_context();3571}3572
3573bdrv_try_change_aio_context(bs, new_context, NULL, errp);3574}
3575
3576QemuOptsList qemu_common_drive_opts = {3577.name = "drive",3578.head = QTAILQ_HEAD_INITIALIZER(qemu_common_drive_opts.head),3579.desc = {3580{3581.name = "snapshot",3582.type = QEMU_OPT_BOOL,3583.help = "enable/disable snapshot mode",3584},{3585.name = "aio",3586.type = QEMU_OPT_STRING,3587.help = "host AIO implementation (threads, native, io_uring)",3588},{3589.name = BDRV_OPT_CACHE_WB,3590.type = QEMU_OPT_BOOL,3591.help = "Enable writeback mode",3592},{3593.name = "format",3594.type = QEMU_OPT_STRING,3595.help = "disk format (raw, qcow2, ...)",3596},{3597.name = "rerror",3598.type = QEMU_OPT_STRING,3599.help = "read error action",3600},{3601.name = "werror",3602.type = QEMU_OPT_STRING,3603.help = "write error action",3604},{3605.name = BDRV_OPT_READ_ONLY,3606.type = QEMU_OPT_BOOL,3607.help = "open drive file as read-only",3608},3609
3610THROTTLE_OPTS,3611
3612{3613.name = "throttling.group",3614.type = QEMU_OPT_STRING,3615.help = "name of the block throttling group",3616},{3617.name = "copy-on-read",3618.type = QEMU_OPT_BOOL,3619.help = "copy read data from backing file into image file",3620},{3621.name = "detect-zeroes",3622.type = QEMU_OPT_STRING,3623.help = "try to optimize zero writes (off, on, unmap)",3624},{3625.name = "stats-account-invalid",3626.type = QEMU_OPT_BOOL,3627.help = "whether to account for invalid I/O operations "3628"in the statistics",3629},{3630.name = "stats-account-failed",3631.type = QEMU_OPT_BOOL,3632.help = "whether to account for failed I/O operations "3633"in the statistics",3634},3635{ /* end of list */ }3636},3637};3638
3639QemuOptsList qemu_drive_opts = {3640.name = "drive",3641.head = QTAILQ_HEAD_INITIALIZER(qemu_drive_opts.head),3642.desc = {3643/*3644* no elements => accept any params
3645* validation will happen later
3646*/
3647{ /* end of list */ }3648},3649};3650