cachepc-qemu

Fork of AMDESE/qemu with changes for cachepc side-channel attack
git clone https://git.sinitax.com/sinitax/cachepc-qemu
Log | Files | Refs | Submodules | LICENSE | sfeed.txt

blockdev.c (120109B)


      1/*
      2 * QEMU host block devices
      3 *
      4 * Copyright (c) 2003-2008 Fabrice Bellard
      5 *
      6 * This work is licensed under the terms of the GNU GPL, version 2 or
      7 * later.  See the COPYING file in the top-level directory.
      8 *
      9 * This file incorporates work covered by the following copyright and
     10 * permission notice:
     11 *
     12 * Copyright (c) 2003-2008 Fabrice Bellard
     13 *
     14 * Permission is hereby granted, free of charge, to any person obtaining a copy
     15 * of this software and associated documentation files (the "Software"), to deal
     16 * in the Software without restriction, including without limitation the rights
     17 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
     18 * copies of the Software, and to permit persons to whom the Software is
     19 * furnished to do so, subject to the following conditions:
     20 *
     21 * The above copyright notice and this permission notice shall be included in
     22 * all copies or substantial portions of the Software.
     23 *
     24 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
     25 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
     26 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
     27 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
     28 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
     29 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
     30 * THE SOFTWARE.
     31 */
     32
     33#include "qemu/osdep.h"
     34#include "sysemu/block-backend.h"
     35#include "sysemu/blockdev.h"
     36#include "hw/block/block.h"
     37#include "block/blockjob.h"
     38#include "block/qdict.h"
     39#include "block/throttle-groups.h"
     40#include "monitor/monitor.h"
     41#include "qemu/error-report.h"
     42#include "qemu/option.h"
     43#include "qemu/qemu-print.h"
     44#include "qemu/config-file.h"
     45#include "qapi/qapi-commands-block.h"
     46#include "qapi/qapi-commands-transaction.h"
     47#include "qapi/qapi-visit-block-core.h"
     48#include "qapi/qmp/qdict.h"
     49#include "qapi/qmp/qnum.h"
     50#include "qapi/qmp/qstring.h"
     51#include "qapi/error.h"
     52#include "qapi/qmp/qerror.h"
     53#include "qapi/qmp/qlist.h"
     54#include "qapi/qobject-output-visitor.h"
     55#include "sysemu/sysemu.h"
     56#include "sysemu/iothread.h"
     57#include "block/block_int.h"
     58#include "block/trace.h"
     59#include "sysemu/runstate.h"
     60#include "sysemu/replay.h"
     61#include "qemu/cutils.h"
     62#include "qemu/help_option.h"
     63#include "qemu/main-loop.h"
     64#include "qemu/throttle-options.h"
     65
/*
 * List of BlockDriverStates registered through bdrv_set_monitor_owned().
 * Elements are linked through their monitor_list field.
 */
QTAILQ_HEAD(, BlockDriverState) monitor_bdrv_states =
    QTAILQ_HEAD_INITIALIZER(monitor_bdrv_states);
     68
/* Append @bs to the tail of the monitor_bdrv_states list. */
void bdrv_set_monitor_owned(BlockDriverState *bs)
{
    QTAILQ_INSERT_TAIL(&monitor_bdrv_states, bs, monitor_list);
}
     73
/*
 * Textual name of each block interface type, indexed by
 * BlockInterfaceType.  Used as the value of the "if" drive option and
 * in diagnostics.
 */
static const char *const if_name[IF_COUNT] = {
    [IF_NONE] = "none",
    [IF_IDE] = "ide",
    [IF_SCSI] = "scsi",
    [IF_FLOPPY] = "floppy",
    [IF_PFLASH] = "pflash",
    [IF_MTD] = "mtd",
    [IF_SD] = "sd",
    [IF_VIRTIO] = "virtio",
    [IF_XEN] = "xen",
};
     85
/*
 * Units per bus for each interface type, indexed by BlockInterfaceType.
 * Entries not listed here are zero, which the index-to-bus/unit helpers
 * treat as "everything lives on bus 0".  Boards may change entries with
 * override_max_devs().
 */
static int if_max_devs[IF_COUNT] = {
    /*
     * Do not change these numbers!  They govern how drive option
     * index maps to unit and bus.  That mapping is ABI.
     *
     * All controllers used to implement if=T drives need to support
     * if_max_devs[T] units, for any T with if_max_devs[T] != 0.
     * Otherwise, some index values map to "impossible" bus, unit
     * values.
     *
     * For instance, if you change [IF_SCSI] to 255, -drive
     * if=scsi,index=12 no longer means bus=1,unit=5, but
     * bus=0,unit=12.  With an lsi53c895a controller (7 units max),
     * the drive can't be set up.  Regression.
     */
    [IF_IDE] = 2,
    [IF_SCSI] = 7,
};
    104
    105/**
    106 * Boards may call this to offer board-by-board overrides
    107 * of the default, global values.
    108 */
    109void override_max_devs(BlockInterfaceType type, int max_devs)
    110{
    111    BlockBackend *blk;
    112    DriveInfo *dinfo;
    113
    114    if (max_devs <= 0) {
    115        return;
    116    }
    117
    118    for (blk = blk_next(NULL); blk; blk = blk_next(blk)) {
    119        dinfo = blk_legacy_dinfo(blk);
    120        if (dinfo->type == type) {
    121            fprintf(stderr, "Cannot override units-per-bus property of"
    122                    " the %s interface, because a drive of that type has"
    123                    " already been added.\n", if_name[type]);
    124            g_assert_not_reached();
    125        }
    126    }
    127
    128    if_max_devs[type] = max_devs;
    129}
    130
    131/*
    132 * We automatically delete the drive when a device using it gets
    133 * unplugged.  Questionable feature, but we can't just drop it.
    134 * Device models call blockdev_mark_auto_del() to schedule the
    135 * automatic deletion, and generic qdev code calls blockdev_auto_del()
    136 * when deletion is actually safe.
    137 */
    138void blockdev_mark_auto_del(BlockBackend *blk)
    139{
    140    DriveInfo *dinfo = blk_legacy_dinfo(blk);
    141    BlockJob *job;
    142
    143    if (!dinfo) {
    144        return;
    145    }
    146
    147    for (job = block_job_next(NULL); job; job = block_job_next(job)) {
    148        if (block_job_has_bdrv(job, blk_bs(blk))) {
    149            AioContext *aio_context = job->job.aio_context;
    150            aio_context_acquire(aio_context);
    151
    152            job_cancel(&job->job, false);
    153
    154            aio_context_release(aio_context);
    155        }
    156    }
    157
    158    dinfo->auto_del = 1;
    159}
    160
    161void blockdev_auto_del(BlockBackend *blk)
    162{
    163    DriveInfo *dinfo = blk_legacy_dinfo(blk);
    164
    165    if (dinfo && dinfo->auto_del) {
    166        monitor_remove_blk(blk);
    167        blk_unref(blk);
    168    }
    169}
    170
    171/**
    172 * Returns the current mapping of how many units per bus
    173 * a particular interface can support.
    174 *
    175 *  A positive integer indicates n units per bus.
    176 *  0 implies the mapping has not been established.
    177 * -1 indicates an invalid BlockInterfaceType was given.
    178 */
    179int drive_get_max_devs(BlockInterfaceType type)
    180{
    181    if (type >= IF_IDE && type < IF_COUNT) {
    182        return if_max_devs[type];
    183    }
    184
    185    return -1;
    186}
    187
    188static int drive_index_to_bus_id(BlockInterfaceType type, int index)
    189{
    190    int max_devs = if_max_devs[type];
    191    return max_devs ? index / max_devs : 0;
    192}
    193
    194static int drive_index_to_unit_id(BlockInterfaceType type, int index)
    195{
    196    int max_devs = if_max_devs[type];
    197    return max_devs ? index % max_devs : index;
    198}
    199
/*
 * Parse @optstr against the "drive" option group using
 * qemu_opts_parse_noisily() and return its result.  Callers in this
 * file treat a NULL return as failure.
 */
QemuOpts *drive_def(const char *optstr)
{
    return qemu_opts_parse_noisily(qemu_find_opts("drive"), optstr, false);
}
    204
    205QemuOpts *drive_add(BlockInterfaceType type, int index, const char *file,
    206                    const char *optstr)
    207{
    208    QemuOpts *opts;
    209
    210    opts = drive_def(optstr);
    211    if (!opts) {
    212        return NULL;
    213    }
    214    if (type != IF_DEFAULT) {
    215        qemu_opt_set(opts, "if", if_name[type], &error_abort);
    216    }
    217    if (index >= 0) {
    218        qemu_opt_set_number(opts, "index", index, &error_abort);
    219    }
    220    if (file)
    221        qemu_opt_set(opts, "file", file, &error_abort);
    222    return opts;
    223}
    224
    225DriveInfo *drive_get(BlockInterfaceType type, int bus, int unit)
    226{
    227    BlockBackend *blk;
    228    DriveInfo *dinfo;
    229
    230    for (blk = blk_next(NULL); blk; blk = blk_next(blk)) {
    231        dinfo = blk_legacy_dinfo(blk);
    232        if (dinfo && dinfo->type == type
    233            && dinfo->bus == bus && dinfo->unit == unit) {
    234            return dinfo;
    235        }
    236    }
    237
    238    return NULL;
    239}
    240
    241/*
    242 * Check board claimed all -drive that are meant to be claimed.
    243 * Fatal error if any remain unclaimed.
    244 */
    245void drive_check_orphaned(void)
    246{
    247    BlockBackend *blk;
    248    DriveInfo *dinfo;
    249    Location loc;
    250    bool orphans = false;
    251
    252    for (blk = blk_next(NULL); blk; blk = blk_next(blk)) {
    253        dinfo = blk_legacy_dinfo(blk);
    254        /*
    255         * Ignore default drives, because we create certain default
    256         * drives unconditionally, then leave them unclaimed.  Not the
    257         * users fault.
    258         * Ignore IF_VIRTIO, because it gets desugared into -device,
    259         * so we can leave failing to -device.
    260         * Ignore IF_NONE, because leaving unclaimed IF_NONE remains
    261         * available for device_add is a feature.
    262         */
    263        if (dinfo->is_default || dinfo->type == IF_VIRTIO
    264            || dinfo->type == IF_NONE) {
    265            continue;
    266        }
    267        if (!blk_get_attached_dev(blk)) {
    268            loc_push_none(&loc);
    269            qemu_opts_loc_restore(dinfo->opts);
    270            error_report("machine type does not support"
    271                         " if=%s,bus=%d,unit=%d",
    272                         if_name[dinfo->type], dinfo->bus, dinfo->unit);
    273            loc_pop(&loc);
    274            orphans = true;
    275        }
    276    }
    277
    278    if (orphans) {
    279        exit(1);
    280    }
    281}
    282
    283DriveInfo *drive_get_by_index(BlockInterfaceType type, int index)
    284{
    285    return drive_get(type,
    286                     drive_index_to_bus_id(type, index),
    287                     drive_index_to_unit_id(type, index));
    288}
    289
    290int drive_get_max_bus(BlockInterfaceType type)
    291{
    292    int max_bus;
    293    BlockBackend *blk;
    294    DriveInfo *dinfo;
    295
    296    max_bus = -1;
    297    for (blk = blk_next(NULL); blk; blk = blk_next(blk)) {
    298        dinfo = blk_legacy_dinfo(blk);
    299        if (dinfo && dinfo->type == type && dinfo->bus > max_bus) {
    300            max_bus = dinfo->bus;
    301        }
    302    }
    303    return max_bus;
    304}
    305
    306/* Get a block device.  This should only be used for single-drive devices
    307   (e.g. SD/Floppy/MTD).  Multi-disk devices (scsi/ide) should use the
    308   appropriate bus.  */
    309DriveInfo *drive_get_next(BlockInterfaceType type)
    310{
    311    static int next_block_unit[IF_COUNT];
    312
    313    return drive_get(type, 0, next_block_unit[type]++);
    314}
    315
/*
 * Callback passed to bdrv_iterate_format(): print one format @name
 * preceded by a space.  @opaque is unused.
 */
static void bdrv_format_print(void *opaque, const char *name)
{
    qemu_printf(" %s", name);
}
    320
/*
 * Pairs a bottom half with a BlockDriverState.
 * NOTE(review): not referenced in the visible part of this file;
 * presumably used to drop a BDS reference from a bottom half - confirm.
 */
typedef struct {
    QEMUBH *bh;
    BlockDriverState *bs;
} BDRVPutRefBH;
    325
    326static int parse_block_error_action(const char *buf, bool is_read, Error **errp)
    327{
    328    if (!strcmp(buf, "ignore")) {
    329        return BLOCKDEV_ON_ERROR_IGNORE;
    330    } else if (!is_read && !strcmp(buf, "enospc")) {
    331        return BLOCKDEV_ON_ERROR_ENOSPC;
    332    } else if (!strcmp(buf, "stop")) {
    333        return BLOCKDEV_ON_ERROR_STOP;
    334    } else if (!strcmp(buf, "report")) {
    335        return BLOCKDEV_ON_ERROR_REPORT;
    336    } else {
    337        error_setg(errp, "'%s' invalid %s error action",
    338                   buf, is_read ? "read" : "write");
    339        return -1;
    340    }
    341}
    342
    343static bool parse_stats_intervals(BlockAcctStats *stats, QList *intervals,
    344                                  Error **errp)
    345{
    346    const QListEntry *entry;
    347    for (entry = qlist_first(intervals); entry; entry = qlist_next(entry)) {
    348        switch (qobject_type(entry->value)) {
    349
    350        case QTYPE_QSTRING: {
    351            unsigned long long length;
    352            const char *str = qstring_get_str(qobject_to(QString,
    353                                                         entry->value));
    354            if (parse_uint_full(str, &length, 10) == 0 &&
    355                length > 0 && length <= UINT_MAX) {
    356                block_acct_add_interval(stats, (unsigned) length);
    357            } else {
    358                error_setg(errp, "Invalid interval length: %s", str);
    359                return false;
    360            }
    361            break;
    362        }
    363
    364        case QTYPE_QNUM: {
    365            int64_t length = qnum_get_int(qobject_to(QNum, entry->value));
    366
    367            if (length > 0 && length <= UINT_MAX) {
    368                block_acct_add_interval(stats, (unsigned) length);
    369            } else {
    370                error_setg(errp, "Invalid interval length: %" PRId64, length);
    371                return false;
    372            }
    373            break;
    374        }
    375
    376        default:
    377            error_setg(errp, "The specification of stats-intervals is invalid");
    378            return false;
    379        }
    380    }
    381    return true;
    382}
    383
/* Media kind selected by the legacy "media" drive option (disk or cdrom). */
typedef enum { MEDIA_DISK, MEDIA_CDROM } DriveMediaType;
    385
    386/* All parameters but @opts are optional and may be set to NULL. */
    387static void extract_common_blockdev_options(QemuOpts *opts, int *bdrv_flags,
    388    const char **throttling_group, ThrottleConfig *throttle_cfg,
    389    BlockdevDetectZeroesOptions *detect_zeroes, Error **errp)
    390{
    391    Error *local_error = NULL;
    392    const char *aio;
    393
    394    if (bdrv_flags) {
    395        if (qemu_opt_get_bool(opts, "copy-on-read", false)) {
    396            *bdrv_flags |= BDRV_O_COPY_ON_READ;
    397        }
    398
    399        if ((aio = qemu_opt_get(opts, "aio")) != NULL) {
    400            if (bdrv_parse_aio(aio, bdrv_flags) < 0) {
    401                error_setg(errp, "invalid aio option");
    402                return;
    403            }
    404        }
    405    }
    406
    407    /* disk I/O throttling */
    408    if (throttling_group) {
    409        *throttling_group = qemu_opt_get(opts, "throttling.group");
    410    }
    411
    412    if (throttle_cfg) {
    413        throttle_config_init(throttle_cfg);
    414        throttle_cfg->buckets[THROTTLE_BPS_TOTAL].avg =
    415            qemu_opt_get_number(opts, "throttling.bps-total", 0);
    416        throttle_cfg->buckets[THROTTLE_BPS_READ].avg  =
    417            qemu_opt_get_number(opts, "throttling.bps-read", 0);
    418        throttle_cfg->buckets[THROTTLE_BPS_WRITE].avg =
    419            qemu_opt_get_number(opts, "throttling.bps-write", 0);
    420        throttle_cfg->buckets[THROTTLE_OPS_TOTAL].avg =
    421            qemu_opt_get_number(opts, "throttling.iops-total", 0);
    422        throttle_cfg->buckets[THROTTLE_OPS_READ].avg =
    423            qemu_opt_get_number(opts, "throttling.iops-read", 0);
    424        throttle_cfg->buckets[THROTTLE_OPS_WRITE].avg =
    425            qemu_opt_get_number(opts, "throttling.iops-write", 0);
    426
    427        throttle_cfg->buckets[THROTTLE_BPS_TOTAL].max =
    428            qemu_opt_get_number(opts, "throttling.bps-total-max", 0);
    429        throttle_cfg->buckets[THROTTLE_BPS_READ].max  =
    430            qemu_opt_get_number(opts, "throttling.bps-read-max", 0);
    431        throttle_cfg->buckets[THROTTLE_BPS_WRITE].max =
    432            qemu_opt_get_number(opts, "throttling.bps-write-max", 0);
    433        throttle_cfg->buckets[THROTTLE_OPS_TOTAL].max =
    434            qemu_opt_get_number(opts, "throttling.iops-total-max", 0);
    435        throttle_cfg->buckets[THROTTLE_OPS_READ].max =
    436            qemu_opt_get_number(opts, "throttling.iops-read-max", 0);
    437        throttle_cfg->buckets[THROTTLE_OPS_WRITE].max =
    438            qemu_opt_get_number(opts, "throttling.iops-write-max", 0);
    439
    440        throttle_cfg->buckets[THROTTLE_BPS_TOTAL].burst_length =
    441            qemu_opt_get_number(opts, "throttling.bps-total-max-length", 1);
    442        throttle_cfg->buckets[THROTTLE_BPS_READ].burst_length  =
    443            qemu_opt_get_number(opts, "throttling.bps-read-max-length", 1);
    444        throttle_cfg->buckets[THROTTLE_BPS_WRITE].burst_length =
    445            qemu_opt_get_number(opts, "throttling.bps-write-max-length", 1);
    446        throttle_cfg->buckets[THROTTLE_OPS_TOTAL].burst_length =
    447            qemu_opt_get_number(opts, "throttling.iops-total-max-length", 1);
    448        throttle_cfg->buckets[THROTTLE_OPS_READ].burst_length =
    449            qemu_opt_get_number(opts, "throttling.iops-read-max-length", 1);
    450        throttle_cfg->buckets[THROTTLE_OPS_WRITE].burst_length =
    451            qemu_opt_get_number(opts, "throttling.iops-write-max-length", 1);
    452
    453        throttle_cfg->op_size =
    454            qemu_opt_get_number(opts, "throttling.iops-size", 0);
    455
    456        if (!throttle_is_valid(throttle_cfg, errp)) {
    457            return;
    458        }
    459    }
    460
    461    if (detect_zeroes) {
    462        *detect_zeroes =
    463            qapi_enum_parse(&BlockdevDetectZeroesOptions_lookup,
    464                            qemu_opt_get(opts, "detect-zeroes"),
    465                            BLOCKDEV_DETECT_ZEROES_OPTIONS_OFF,
    466                            &local_error);
    467        if (local_error) {
    468            error_propagate(errp, local_error);
    469            return;
    470        }
    471    }
    472}
    473
/*
 * Create a BlockBackend from @file and the options in @bs_opts, and
 * register it with the monitor under the "id" found in @bs_opts.
 *
 * Options known to qemu_common_drive_opts are absorbed from @bs_opts and
 * handled here; whatever remains in @bs_opts is passed to blk_new_open().
 * If neither a non-empty @file nor any remaining option is given, an
 * empty BlockBackend is created and only its root state is set up.
 *
 * Returns the new BlockBackend, or NULL on failure.  Note that the
 * format=help path prints the list of formats and returns NULL without
 * setting @errp.
 *
 * Takes the ownership of bs_opts
 */
static BlockBackend *blockdev_init(const char *file, QDict *bs_opts,
                                   Error **errp)
{
    const char *buf;
    int bdrv_flags = 0;
    int on_read_error, on_write_error;
    bool account_invalid, account_failed;
    bool writethrough, read_only;
    BlockBackend *blk;
    BlockDriverState *bs;
    ThrottleConfig cfg;
    int snapshot = 0;
    Error *error = NULL;
    QemuOpts *opts;
    QDict *interval_dict = NULL;
    QList *interval_list = NULL;
    const char *id;
    BlockdevDetectZeroesOptions detect_zeroes =
        BLOCKDEV_DETECT_ZEROES_OPTIONS_OFF;
    const char *throttling_group = NULL;

    /* Check common options by copying from bs_opts to opts, all other options
     * stay in bs_opts for processing by bdrv_open(). */
    id = qdict_get_try_str(bs_opts, "id");
    opts = qemu_opts_create(&qemu_common_drive_opts, id, 1, errp);
    if (!opts) {
        goto err_no_opts;
    }

    if (!qemu_opts_absorb_qdict(opts, bs_opts, errp)) {
        goto early_err;
    }

    if (id) {
        qdict_del(bs_opts, "id");
    }

    /* extract parameters */
    snapshot = qemu_opt_get_bool(opts, "snapshot", 0);

    account_invalid = qemu_opt_get_bool(opts, "stats-account-invalid", true);
    account_failed = qemu_opt_get_bool(opts, "stats-account-failed", true);

    writethrough = !qemu_opt_get_bool(opts, BDRV_OPT_CACHE_WB, true);

    /* From here on, use the ID as stored in opts rather than in bs_opts */
    id = qemu_opts_id(opts);

    /* Split "stats-intervals.*" into a list; leftovers are invalid keys */
    qdict_extract_subqdict(bs_opts, &interval_dict, "stats-intervals.");
    qdict_array_split(interval_dict, &interval_list);

    if (qdict_size(interval_dict) != 0) {
        error_setg(errp, "Invalid option stats-intervals.%s",
                   qdict_first(interval_dict)->key);
        goto early_err;
    }

    extract_common_blockdev_options(opts, &bdrv_flags, &throttling_group, &cfg,
                                    &detect_zeroes, &error);
    if (error) {
        error_propagate(errp, error);
        goto early_err;
    }

    if ((buf = qemu_opt_get(opts, "format")) != NULL) {
        if (is_help_option(buf)) {
            qemu_printf("Supported formats:");
            bdrv_iterate_format(bdrv_format_print, NULL, false);
            qemu_printf("\nSupported formats (read-only):");
            bdrv_iterate_format(bdrv_format_print, NULL, true);
            qemu_printf("\n");
            /* Leaves with NULL but without setting errp */
            goto early_err;
        }

        if (qdict_haskey(bs_opts, "driver")) {
            error_setg(errp, "Cannot specify both 'driver' and 'format'");
            goto early_err;
        }
        qdict_put_str(bs_opts, "driver", buf);
    }

    /* Default write error action is enospc, overridable with werror= */
    on_write_error = BLOCKDEV_ON_ERROR_ENOSPC;
    if ((buf = qemu_opt_get(opts, "werror")) != NULL) {
        on_write_error = parse_block_error_action(buf, 0, &error);
        if (error) {
            error_propagate(errp, error);
            goto early_err;
        }
    }

    /* Default read error action is report, overridable with rerror= */
    on_read_error = BLOCKDEV_ON_ERROR_REPORT;
    if ((buf = qemu_opt_get(opts, "rerror")) != NULL) {
        on_read_error = parse_block_error_action(buf, 1, &error);
        if (error) {
            error_propagate(errp, error);
            goto early_err;
        }
    }

    if (snapshot) {
        bdrv_flags |= BDRV_O_SNAPSHOT;
    }

    read_only = qemu_opt_get_bool(opts, BDRV_OPT_READ_ONLY, false);

    /* init */
    if ((!file || !*file) && !qdict_size(bs_opts)) {
        /* No file and no remaining options: create an empty backend */
        BlockBackendRootState *blk_rs;

        blk = blk_new(qemu_get_aio_context(), 0, BLK_PERM_ALL);
        blk_rs = blk_get_root_state(blk);
        blk_rs->open_flags    = bdrv_flags | (read_only ? 0 : BDRV_O_RDWR);
        blk_rs->detect_zeroes = detect_zeroes;

        /* bs_opts is not passed on in this branch, so release it here */
        qobject_unref(bs_opts);
    } else {
        if (file && !*file) {
            file = NULL;
        }

        /* bdrv_open() defaults to the values in bdrv_flags (for compatibility
         * with other callers) rather than what we want as the real defaults.
         * Apply the defaults here instead. */
        qdict_set_default_str(bs_opts, BDRV_OPT_CACHE_DIRECT, "off");
        qdict_set_default_str(bs_opts, BDRV_OPT_CACHE_NO_FLUSH, "off");
        qdict_set_default_str(bs_opts, BDRV_OPT_READ_ONLY,
                              read_only ? "on" : "off");
        qdict_set_default_str(bs_opts, BDRV_OPT_AUTO_READ_ONLY, "on");
        assert((bdrv_flags & BDRV_O_CACHE_MASK) == 0);

        if (runstate_check(RUN_STATE_INMIGRATE)) {
            bdrv_flags |= BDRV_O_INACTIVE;
        }

        /*
         * bs_opts is not released by this function past this point;
         * presumably blk_new_open() consumes it - confirm.
         */
        blk = blk_new_open(file, NULL, bs_opts, bdrv_flags, errp);
        if (!blk) {
            goto err_no_bs_opts;
        }
        bs = blk_bs(blk);

        bs->detect_zeroes = detect_zeroes;

        block_acct_setup(blk_get_stats(blk), account_invalid, account_failed);

        if (!parse_stats_intervals(blk_get_stats(blk), interval_list, errp)) {
            blk_unref(blk);
            blk = NULL;
            goto err_no_bs_opts;
        }
    }

    /* disk I/O throttling */
    if (throttle_enabled(&cfg)) {
        /* Without an explicit group, the drive ID names the group */
        if (!throttling_group) {
            throttling_group = id;
        }
        blk_io_limits_enable(blk, throttling_group);
        blk_set_io_limits(blk, &cfg);
    }

    blk_set_enable_write_cache(blk, !writethrough);
    blk_set_on_error(blk, on_read_error, on_write_error);

    if (!monitor_add_blk(blk, id, errp)) {
        blk_unref(blk);
        blk = NULL;
        goto err_no_bs_opts;
    }

    /*
     * Common exit for success and for failures after bs_opts has been
     * dealt with: blk is either the new backend or NULL.
     */
err_no_bs_opts:
    qemu_opts_del(opts);
    qobject_unref(interval_dict);
    qobject_unref(interval_list);
    return blk;

    /* Failures while this function still holds bs_opts */
early_err:
    qemu_opts_del(opts);
    qobject_unref(interval_dict);
    qobject_unref(interval_list);
err_no_opts:
    qobject_unref(bs_opts);
    return NULL;
}
    657
    658/* Takes the ownership of bs_opts */
    659BlockDriverState *bds_tree_init(QDict *bs_opts, Error **errp)
    660{
    661    int bdrv_flags = 0;
    662
    663    /* bdrv_open() defaults to the values in bdrv_flags (for compatibility
    664     * with other callers) rather than what we want as the real defaults.
    665     * Apply the defaults here instead. */
    666    qdict_set_default_str(bs_opts, BDRV_OPT_CACHE_DIRECT, "off");
    667    qdict_set_default_str(bs_opts, BDRV_OPT_CACHE_NO_FLUSH, "off");
    668    qdict_set_default_str(bs_opts, BDRV_OPT_READ_ONLY, "off");
    669
    670    if (runstate_check(RUN_STATE_INMIGRATE)) {
    671        bdrv_flags |= BDRV_O_INACTIVE;
    672    }
    673
    674    return bdrv_open(NULL, NULL, bs_opts, bdrv_flags, errp);
    675}
    676
    677void blockdev_close_all_bdrv_states(void)
    678{
    679    BlockDriverState *bs, *next_bs;
    680
    681    QTAILQ_FOREACH_SAFE(bs, &monitor_bdrv_states, monitor_list, next_bs) {
    682        AioContext *ctx = bdrv_get_aio_context(bs);
    683
    684        aio_context_acquire(ctx);
    685        bdrv_unref(bs);
    686        aio_context_release(ctx);
    687    }
    688}
    689
    690/* Iterates over the list of monitor-owned BlockDriverStates */
    691BlockDriverState *bdrv_next_monitor_owned(BlockDriverState *bs)
    692{
    693    return bs ? QTAILQ_NEXT(bs, monitor_list)
    694              : QTAILQ_FIRST(&monitor_bdrv_states);
    695}
    696
    697static bool qemu_opt_rename(QemuOpts *opts, const char *from, const char *to,
    698                            Error **errp)
    699{
    700    const char *value;
    701
    702    value = qemu_opt_get(opts, from);
    703    if (value) {
    704        if (qemu_opt_find(opts, to)) {
    705            error_setg(errp, "'%s' and its alias '%s' can't be used at the "
    706                       "same time", to, from);
    707            return false;
    708        }
    709    }
    710
    711    /* rename all items in opts */
    712    while ((value = qemu_opt_get(opts, from))) {
    713        qemu_opt_set(opts, to, value, &error_abort);
    714        qemu_opt_unset(opts, from);
    715    }
    716    return true;
    717}
    718
/*
 * Descriptors for the legacy -drive options: the first group exists only
 * for -drive (addressing, media, interface, file), the second group is
 * passed on but has special semantics with -drive.
 */
QemuOptsList qemu_legacy_drive_opts = {
    .name = "drive",
    .head = QTAILQ_HEAD_INITIALIZER(qemu_legacy_drive_opts.head),
    .desc = {
        {
            .name = "bus",
            .type = QEMU_OPT_NUMBER,
            .help = "bus number",
        },{
            .name = "unit",
            .type = QEMU_OPT_NUMBER,
            .help = "unit number (i.e. lun for scsi)",
        },{
            .name = "index",
            .type = QEMU_OPT_NUMBER,
            .help = "index number",
        },{
            .name = "media",
            .type = QEMU_OPT_STRING,
            .help = "media type (disk, cdrom)",
        },{
            .name = "if",
            .type = QEMU_OPT_STRING,
            .help = "interface (ide, scsi, sd, mtd, floppy, pflash, virtio)",
        },{
            .name = "file",
            .type = QEMU_OPT_STRING,
            .help = "file name",
        },

        /* Options that are passed on, but have special semantics with -drive */
        {
            .name = BDRV_OPT_READ_ONLY,
            .type = QEMU_OPT_BOOL,
            .help = "open drive file as read-only",
        },{
            .name = "rerror",
            .type = QEMU_OPT_STRING,
            .help = "read error action",
        },{
            .name = "werror",
            .type = QEMU_OPT_STRING,
            .help = "write error action",
        },{
            .name = "copy-on-read",
            .type = QEMU_OPT_BOOL,
            .help = "copy read data from backing file into image file",
        },

        { /* end of list */ }
    },
};
    771
    772DriveInfo *drive_new(QemuOpts *all_opts, BlockInterfaceType block_default_type,
    773                     Error **errp)
    774{
    775    const char *value;
    776    BlockBackend *blk;
    777    DriveInfo *dinfo = NULL;
    778    QDict *bs_opts;
    779    QemuOpts *legacy_opts;
    780    DriveMediaType media = MEDIA_DISK;
    781    BlockInterfaceType type;
    782    int max_devs, bus_id, unit_id, index;
    783    const char *werror, *rerror;
    784    bool read_only = false;
    785    bool copy_on_read;
    786    const char *filename;
    787    int i;
    788
    789    /* Change legacy command line options into QMP ones */
    790    static const struct {
    791        const char *from;
    792        const char *to;
    793    } opt_renames[] = {
    794        { "iops",           "throttling.iops-total" },
    795        { "iops_rd",        "throttling.iops-read" },
    796        { "iops_wr",        "throttling.iops-write" },
    797
    798        { "bps",            "throttling.bps-total" },
    799        { "bps_rd",         "throttling.bps-read" },
    800        { "bps_wr",         "throttling.bps-write" },
    801
    802        { "iops_max",       "throttling.iops-total-max" },
    803        { "iops_rd_max",    "throttling.iops-read-max" },
    804        { "iops_wr_max",    "throttling.iops-write-max" },
    805
    806        { "bps_max",        "throttling.bps-total-max" },
    807        { "bps_rd_max",     "throttling.bps-read-max" },
    808        { "bps_wr_max",     "throttling.bps-write-max" },
    809
    810        { "iops_size",      "throttling.iops-size" },
    811
    812        { "group",          "throttling.group" },
    813
    814        { "readonly",       BDRV_OPT_READ_ONLY },
    815    };
    816
    817    for (i = 0; i < ARRAY_SIZE(opt_renames); i++) {
    818        if (!qemu_opt_rename(all_opts, opt_renames[i].from,
    819                             opt_renames[i].to, errp)) {
    820            return NULL;
    821        }
    822    }
    823
    824    value = qemu_opt_get(all_opts, "cache");
    825    if (value) {
    826        int flags = 0;
    827        bool writethrough;
    828
    829        if (bdrv_parse_cache_mode(value, &flags, &writethrough) != 0) {
    830            error_setg(errp, "invalid cache option");
    831            return NULL;
    832        }
    833
    834        /* Specific options take precedence */
    835        if (!qemu_opt_get(all_opts, BDRV_OPT_CACHE_WB)) {
    836            qemu_opt_set_bool(all_opts, BDRV_OPT_CACHE_WB,
    837                              !writethrough, &error_abort);
    838        }
    839        if (!qemu_opt_get(all_opts, BDRV_OPT_CACHE_DIRECT)) {
    840            qemu_opt_set_bool(all_opts, BDRV_OPT_CACHE_DIRECT,
    841                              !!(flags & BDRV_O_NOCACHE), &error_abort);
    842        }
    843        if (!qemu_opt_get(all_opts, BDRV_OPT_CACHE_NO_FLUSH)) {
    844            qemu_opt_set_bool(all_opts, BDRV_OPT_CACHE_NO_FLUSH,
    845                              !!(flags & BDRV_O_NO_FLUSH), &error_abort);
    846        }
    847        qemu_opt_unset(all_opts, "cache");
    848    }
    849
    850    /* Get a QDict for processing the options */
    851    bs_opts = qdict_new();
    852    qemu_opts_to_qdict(all_opts, bs_opts);
    853
    854    legacy_opts = qemu_opts_create(&qemu_legacy_drive_opts, NULL, 0,
    855                                   &error_abort);
    856    if (!qemu_opts_absorb_qdict(legacy_opts, bs_opts, errp)) {
    857        goto fail;
    858    }
    859
    860    /* Media type */
    861    value = qemu_opt_get(legacy_opts, "media");
    862    if (value) {
    863        if (!strcmp(value, "disk")) {
    864            media = MEDIA_DISK;
    865        } else if (!strcmp(value, "cdrom")) {
    866            media = MEDIA_CDROM;
    867            read_only = true;
    868        } else {
    869            error_setg(errp, "'%s' invalid media", value);
    870            goto fail;
    871        }
    872    }
    873
    874    /* copy-on-read is disabled with a warning for read-only devices */
    875    read_only |= qemu_opt_get_bool(legacy_opts, BDRV_OPT_READ_ONLY, false);
    876    copy_on_read = qemu_opt_get_bool(legacy_opts, "copy-on-read", false);
    877
    878    if (read_only && copy_on_read) {
    879        warn_report("disabling copy-on-read on read-only drive");
    880        copy_on_read = false;
    881    }
    882
    883    qdict_put_str(bs_opts, BDRV_OPT_READ_ONLY, read_only ? "on" : "off");
    884    qdict_put_str(bs_opts, "copy-on-read", copy_on_read ? "on" : "off");
    885
    886    /* Controller type */
    887    value = qemu_opt_get(legacy_opts, "if");
    888    if (value) {
    889        for (type = 0;
    890             type < IF_COUNT && strcmp(value, if_name[type]);
    891             type++) {
    892        }
    893        if (type == IF_COUNT) {
    894            error_setg(errp, "unsupported bus type '%s'", value);
    895            goto fail;
    896        }
    897    } else {
    898        type = block_default_type;
    899    }
    900
    901    /* Device address specified by bus/unit or index.
    902     * If none was specified, try to find the first free one. */
    903    bus_id  = qemu_opt_get_number(legacy_opts, "bus", 0);
    904    unit_id = qemu_opt_get_number(legacy_opts, "unit", -1);
    905    index   = qemu_opt_get_number(legacy_opts, "index", -1);
    906
    907    max_devs = if_max_devs[type];
    908
    909    if (index != -1) {
    910        if (bus_id != 0 || unit_id != -1) {
    911            error_setg(errp, "index cannot be used with bus and unit");
    912            goto fail;
    913        }
    914        bus_id = drive_index_to_bus_id(type, index);
    915        unit_id = drive_index_to_unit_id(type, index);
    916    }
    917
    918    if (unit_id == -1) {
    919       unit_id = 0;
    920       while (drive_get(type, bus_id, unit_id) != NULL) {
    921           unit_id++;
    922           if (max_devs && unit_id >= max_devs) {
    923               unit_id -= max_devs;
    924               bus_id++;
    925           }
    926       }
    927    }
    928
    929    if (max_devs && unit_id >= max_devs) {
    930        error_setg(errp, "unit %d too big (max is %d)", unit_id, max_devs - 1);
    931        goto fail;
    932    }
    933
    934    if (drive_get(type, bus_id, unit_id) != NULL) {
    935        error_setg(errp, "drive with bus=%d, unit=%d (index=%d) exists",
    936                   bus_id, unit_id, index);
    937        goto fail;
    938    }
    939
    940    /* no id supplied -> create one */
    941    if (qemu_opts_id(all_opts) == NULL) {
    942        char *new_id;
    943        const char *mediastr = "";
    944        if (type == IF_IDE || type == IF_SCSI) {
    945            mediastr = (media == MEDIA_CDROM) ? "-cd" : "-hd";
    946        }
    947        if (max_devs) {
    948            new_id = g_strdup_printf("%s%i%s%i", if_name[type], bus_id,
    949                                     mediastr, unit_id);
    950        } else {
    951            new_id = g_strdup_printf("%s%s%i", if_name[type],
    952                                     mediastr, unit_id);
    953        }
    954        qdict_put_str(bs_opts, "id", new_id);
    955        g_free(new_id);
    956    }
    957
    958    /* Add virtio block device */
    959    if (type == IF_VIRTIO) {
    960        QemuOpts *devopts;
    961        devopts = qemu_opts_create(qemu_find_opts("device"), NULL, 0,
    962                                   &error_abort);
    963        qemu_opt_set(devopts, "driver", "virtio-blk", &error_abort);
    964        qemu_opt_set(devopts, "drive", qdict_get_str(bs_opts, "id"),
    965                     &error_abort);
    966    }
    967
    968    filename = qemu_opt_get(legacy_opts, "file");
    969
    970    /* Check werror/rerror compatibility with if=... */
    971    werror = qemu_opt_get(legacy_opts, "werror");
    972    if (werror != NULL) {
    973        if (type != IF_IDE && type != IF_SCSI && type != IF_VIRTIO &&
    974            type != IF_NONE) {
    975            error_setg(errp, "werror is not supported by this bus type");
    976            goto fail;
    977        }
    978        qdict_put_str(bs_opts, "werror", werror);
    979    }
    980
    981    rerror = qemu_opt_get(legacy_opts, "rerror");
    982    if (rerror != NULL) {
    983        if (type != IF_IDE && type != IF_VIRTIO && type != IF_SCSI &&
    984            type != IF_NONE) {
    985            error_setg(errp, "rerror is not supported by this bus type");
    986            goto fail;
    987        }
    988        qdict_put_str(bs_opts, "rerror", rerror);
    989    }
    990
    991    /* Actual block device init: Functionality shared with blockdev-add */
    992    blk = blockdev_init(filename, bs_opts, errp);
    993    bs_opts = NULL;
    994    if (!blk) {
    995        goto fail;
    996    }
    997
    998    /* Create legacy DriveInfo */
    999    dinfo = g_malloc0(sizeof(*dinfo));
   1000    dinfo->opts = all_opts;
   1001
   1002    dinfo->type = type;
   1003    dinfo->bus = bus_id;
   1004    dinfo->unit = unit_id;
   1005
   1006    blk_set_legacy_dinfo(blk, dinfo);
   1007
   1008    switch(type) {
   1009    case IF_IDE:
   1010    case IF_SCSI:
   1011    case IF_XEN:
   1012    case IF_NONE:
   1013        dinfo->media_cd = media == MEDIA_CDROM;
   1014        break;
   1015    default:
   1016        break;
   1017    }
   1018
   1019fail:
   1020    qemu_opts_del(legacy_opts);
   1021    qobject_unref(bs_opts);
   1022    return dinfo;
   1023}
   1024
   1025static BlockDriverState *qmp_get_root_bs(const char *name, Error **errp)
   1026{
   1027    BlockDriverState *bs;
   1028
   1029    bs = bdrv_lookup_bs(name, name, errp);
   1030    if (bs == NULL) {
   1031        return NULL;
   1032    }
   1033
   1034    if (!bdrv_is_root_node(bs)) {
   1035        error_setg(errp, "Need a root block node");
   1036        return NULL;
   1037    }
   1038
   1039    if (!bdrv_is_inserted(bs)) {
   1040        error_setg(errp, "Device has no medium");
   1041        return NULL;
   1042    }
   1043
   1044    return bs;
   1045}
   1046
   1047static void blockdev_do_action(TransactionAction *action, Error **errp)
   1048{
   1049    TransactionActionList list;
   1050
   1051    list.value = action;
   1052    list.next = NULL;
   1053    qmp_transaction(&list, false, NULL, errp);
   1054}
   1055
   1056void qmp_blockdev_snapshot_sync(bool has_device, const char *device,
   1057                                bool has_node_name, const char *node_name,
   1058                                const char *snapshot_file,
   1059                                bool has_snapshot_node_name,
   1060                                const char *snapshot_node_name,
   1061                                bool has_format, const char *format,
   1062                                bool has_mode, NewImageMode mode, Error **errp)
   1063{
   1064    BlockdevSnapshotSync snapshot = {
   1065        .has_device = has_device,
   1066        .device = (char *) device,
   1067        .has_node_name = has_node_name,
   1068        .node_name = (char *) node_name,
   1069        .snapshot_file = (char *) snapshot_file,
   1070        .has_snapshot_node_name = has_snapshot_node_name,
   1071        .snapshot_node_name = (char *) snapshot_node_name,
   1072        .has_format = has_format,
   1073        .format = (char *) format,
   1074        .has_mode = has_mode,
   1075        .mode = mode,
   1076    };
   1077    TransactionAction action = {
   1078        .type = TRANSACTION_ACTION_KIND_BLOCKDEV_SNAPSHOT_SYNC,
   1079        .u.blockdev_snapshot_sync.data = &snapshot,
   1080    };
   1081    blockdev_do_action(&action, errp);
   1082}
   1083
   1084void qmp_blockdev_snapshot(const char *node, const char *overlay,
   1085                           Error **errp)
   1086{
   1087    BlockdevSnapshot snapshot_data = {
   1088        .node = (char *) node,
   1089        .overlay = (char *) overlay
   1090    };
   1091    TransactionAction action = {
   1092        .type = TRANSACTION_ACTION_KIND_BLOCKDEV_SNAPSHOT,
   1093        .u.blockdev_snapshot.data = &snapshot_data,
   1094    };
   1095    blockdev_do_action(&action, errp);
   1096}
   1097
   1098void qmp_blockdev_snapshot_internal_sync(const char *device,
   1099                                         const char *name,
   1100                                         Error **errp)
   1101{
   1102    BlockdevSnapshotInternal snapshot = {
   1103        .device = (char *) device,
   1104        .name = (char *) name
   1105    };
   1106    TransactionAction action = {
   1107        .type = TRANSACTION_ACTION_KIND_BLOCKDEV_SNAPSHOT_INTERNAL_SYNC,
   1108        .u.blockdev_snapshot_internal_sync.data = &snapshot,
   1109    };
   1110    blockdev_do_action(&action, errp);
   1111}
   1112
   1113SnapshotInfo *qmp_blockdev_snapshot_delete_internal_sync(const char *device,
   1114                                                         bool has_id,
   1115                                                         const char *id,
   1116                                                         bool has_name,
   1117                                                         const char *name,
   1118                                                         Error **errp)
   1119{
   1120    BlockDriverState *bs;
   1121    AioContext *aio_context;
   1122    QEMUSnapshotInfo sn;
   1123    Error *local_err = NULL;
   1124    SnapshotInfo *info = NULL;
   1125    int ret;
   1126
   1127    bs = qmp_get_root_bs(device, errp);
   1128    if (!bs) {
   1129        return NULL;
   1130    }
   1131    aio_context = bdrv_get_aio_context(bs);
   1132    aio_context_acquire(aio_context);
   1133
   1134    if (!has_id) {
   1135        id = NULL;
   1136    }
   1137
   1138    if (!has_name) {
   1139        name = NULL;
   1140    }
   1141
   1142    if (!id && !name) {
   1143        error_setg(errp, "Name or id must be provided");
   1144        goto out_aio_context;
   1145    }
   1146
   1147    if (bdrv_op_is_blocked(bs, BLOCK_OP_TYPE_INTERNAL_SNAPSHOT_DELETE, errp)) {
   1148        goto out_aio_context;
   1149    }
   1150
   1151    ret = bdrv_snapshot_find_by_id_and_name(bs, id, name, &sn, &local_err);
   1152    if (local_err) {
   1153        error_propagate(errp, local_err);
   1154        goto out_aio_context;
   1155    }
   1156    if (!ret) {
   1157        error_setg(errp,
   1158                   "Snapshot with id '%s' and name '%s' does not exist on "
   1159                   "device '%s'",
   1160                   STR_OR_NULL(id), STR_OR_NULL(name), device);
   1161        goto out_aio_context;
   1162    }
   1163
   1164    bdrv_snapshot_delete(bs, id, name, &local_err);
   1165    if (local_err) {
   1166        error_propagate(errp, local_err);
   1167        goto out_aio_context;
   1168    }
   1169
   1170    aio_context_release(aio_context);
   1171
   1172    info = g_new0(SnapshotInfo, 1);
   1173    info->id = g_strdup(sn.id_str);
   1174    info->name = g_strdup(sn.name);
   1175    info->date_nsec = sn.date_nsec;
   1176    info->date_sec = sn.date_sec;
   1177    info->vm_state_size = sn.vm_state_size;
   1178    info->vm_clock_nsec = sn.vm_clock_nsec % 1000000000;
   1179    info->vm_clock_sec = sn.vm_clock_nsec / 1000000000;
   1180    if (sn.icount != -1ULL) {
   1181        info->icount = sn.icount;
   1182        info->has_icount = true;
   1183    }
   1184
   1185    return info;
   1186
   1187out_aio_context:
   1188    aio_context_release(aio_context);
   1189    return NULL;
   1190}
   1191
   1192/* New and old BlockDriverState structs for atomic group operations */
   1193
   1194typedef struct BlkActionState BlkActionState;
   1195
   1196/**
   1197 * BlkActionOps:
   1198 * Table of operations that define an Action.
   1199 *
   1200 * @instance_size: Size of state struct, in bytes.
   1201 * @prepare: Prepare the work, must NOT be NULL.
   1202 * @commit: Commit the changes, can be NULL.
   1203 * @abort: Abort the changes on fail, can be NULL.
   1204 * @clean: Clean up resources after all transaction actions have called
   1205 *         commit() or abort(). Can be NULL.
   1206 *
   1207 * Only prepare() may fail. In a single transaction, only one of commit() or
   1208 * abort() will be called. clean() will always be called if it is present.
   1209 */
   1210typedef struct BlkActionOps {
   1211    size_t instance_size;
   1212    void (*prepare)(BlkActionState *common, Error **errp);
   1213    void (*commit)(BlkActionState *common);
   1214    void (*abort)(BlkActionState *common);
   1215    void (*clean)(BlkActionState *common);
   1216} BlkActionOps;
   1217
   1218/**
   1219 * BlkActionState:
   1220 * Describes one Action's state within a Transaction.
   1221 *
   1222 * @action: QAPI-defined enum identifying which Action to perform.
   1223 * @ops: Table of ActionOps this Action can perform.
   1224 * @block_job_txn: Transaction which this action belongs to.
   1225 * @entry: List membership for all Actions in this Transaction.
   1226 *
   1227 * This structure must be arranged as first member in a subclassed type,
   1228 * assuming that the compiler will also arrange it to the same offsets as the
   1229 * base class.
   1230 */
   1231struct BlkActionState {
   1232    TransactionAction *action;
   1233    const BlkActionOps *ops;
   1234    JobTxn *block_job_txn;
   1235    TransactionProperties *txn_props;
   1236    QTAILQ_ENTRY(BlkActionState) entry;
   1237};
   1238
   1239/* internal snapshot private data */
   1240typedef struct InternalSnapshotState {
   1241    BlkActionState common;
   1242    BlockDriverState *bs;
   1243    QEMUSnapshotInfo sn;
   1244    bool created;
   1245} InternalSnapshotState;
   1246
   1247
   1248static int action_check_completion_mode(BlkActionState *s, Error **errp)
   1249{
   1250    if (s->txn_props->completion_mode != ACTION_COMPLETION_MODE_INDIVIDUAL) {
   1251        error_setg(errp,
   1252                   "Action '%s' does not support Transaction property "
   1253                   "completion-mode = %s",
   1254                   TransactionActionKind_str(s->action->type),
   1255                   ActionCompletionMode_str(s->txn_props->completion_mode));
   1256        return -1;
   1257    }
   1258    return 0;
   1259}
   1260
   1261static void internal_snapshot_prepare(BlkActionState *common,
   1262                                      Error **errp)
   1263{
   1264    Error *local_err = NULL;
   1265    const char *device;
   1266    const char *name;
   1267    BlockDriverState *bs;
   1268    QEMUSnapshotInfo old_sn, *sn;
   1269    bool ret;
   1270    qemu_timeval tv;
   1271    BlockdevSnapshotInternal *internal;
   1272    InternalSnapshotState *state;
   1273    AioContext *aio_context;
   1274    int ret1;
   1275
   1276    g_assert(common->action->type ==
   1277             TRANSACTION_ACTION_KIND_BLOCKDEV_SNAPSHOT_INTERNAL_SYNC);
   1278    internal = common->action->u.blockdev_snapshot_internal_sync.data;
   1279    state = DO_UPCAST(InternalSnapshotState, common, common);
   1280
   1281    /* 1. parse input */
   1282    device = internal->device;
   1283    name = internal->name;
   1284
   1285    /* 2. check for validation */
   1286    if (action_check_completion_mode(common, errp) < 0) {
   1287        return;
   1288    }
   1289
   1290    bs = qmp_get_root_bs(device, errp);
   1291    if (!bs) {
   1292        return;
   1293    }
   1294
   1295    aio_context = bdrv_get_aio_context(bs);
   1296    aio_context_acquire(aio_context);
   1297
   1298    state->bs = bs;
   1299
   1300    /* Paired with .clean() */
   1301    bdrv_drained_begin(bs);
   1302
   1303    if (bdrv_op_is_blocked(bs, BLOCK_OP_TYPE_INTERNAL_SNAPSHOT, errp)) {
   1304        goto out;
   1305    }
   1306
   1307    if (bdrv_is_read_only(bs)) {
   1308        error_setg(errp, "Device '%s' is read only", device);
   1309        goto out;
   1310    }
   1311
   1312    if (!bdrv_can_snapshot(bs)) {
   1313        error_setg(errp, "Block format '%s' used by device '%s' "
   1314                   "does not support internal snapshots",
   1315                   bs->drv->format_name, device);
   1316        goto out;
   1317    }
   1318
   1319    if (!strlen(name)) {
   1320        error_setg(errp, "Name is empty");
   1321        goto out;
   1322    }
   1323
   1324    /* check whether a snapshot with name exist */
   1325    ret = bdrv_snapshot_find_by_id_and_name(bs, NULL, name, &old_sn,
   1326                                            &local_err);
   1327    if (local_err) {
   1328        error_propagate(errp, local_err);
   1329        goto out;
   1330    } else if (ret) {
   1331        error_setg(errp,
   1332                   "Snapshot with name '%s' already exists on device '%s'",
   1333                   name, device);
   1334        goto out;
   1335    }
   1336
   1337    /* 3. take the snapshot */
   1338    sn = &state->sn;
   1339    pstrcpy(sn->name, sizeof(sn->name), name);
   1340    qemu_gettimeofday(&tv);
   1341    sn->date_sec = tv.tv_sec;
   1342    sn->date_nsec = tv.tv_usec * 1000;
   1343    sn->vm_clock_nsec = qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL);
   1344    if (replay_mode != REPLAY_MODE_NONE) {
   1345        sn->icount = replay_get_current_icount();
   1346    } else {
   1347        sn->icount = -1ULL;
   1348    }
   1349
   1350    ret1 = bdrv_snapshot_create(bs, sn);
   1351    if (ret1 < 0) {
   1352        error_setg_errno(errp, -ret1,
   1353                         "Failed to create snapshot '%s' on device '%s'",
   1354                         name, device);
   1355        goto out;
   1356    }
   1357
   1358    /* 4. succeed, mark a snapshot is created */
   1359    state->created = true;
   1360
   1361out:
   1362    aio_context_release(aio_context);
   1363}
   1364
   1365static void internal_snapshot_abort(BlkActionState *common)
   1366{
   1367    InternalSnapshotState *state =
   1368                             DO_UPCAST(InternalSnapshotState, common, common);
   1369    BlockDriverState *bs = state->bs;
   1370    QEMUSnapshotInfo *sn = &state->sn;
   1371    AioContext *aio_context;
   1372    Error *local_error = NULL;
   1373
   1374    if (!state->created) {
   1375        return;
   1376    }
   1377
   1378    aio_context = bdrv_get_aio_context(state->bs);
   1379    aio_context_acquire(aio_context);
   1380
   1381    if (bdrv_snapshot_delete(bs, sn->id_str, sn->name, &local_error) < 0) {
   1382        error_reportf_err(local_error,
   1383                          "Failed to delete snapshot with id '%s' and "
   1384                          "name '%s' on device '%s' in abort: ",
   1385                          sn->id_str, sn->name,
   1386                          bdrv_get_device_name(bs));
   1387    }
   1388
   1389    aio_context_release(aio_context);
   1390}
   1391
   1392static void internal_snapshot_clean(BlkActionState *common)
   1393{
   1394    InternalSnapshotState *state = DO_UPCAST(InternalSnapshotState,
   1395                                             common, common);
   1396    AioContext *aio_context;
   1397
   1398    if (!state->bs) {
   1399        return;
   1400    }
   1401
   1402    aio_context = bdrv_get_aio_context(state->bs);
   1403    aio_context_acquire(aio_context);
   1404
   1405    bdrv_drained_end(state->bs);
   1406
   1407    aio_context_release(aio_context);
   1408}
   1409
   1410/* external snapshot private data */
   1411typedef struct ExternalSnapshotState {
   1412    BlkActionState common;
   1413    BlockDriverState *old_bs;
   1414    BlockDriverState *new_bs;
   1415    bool overlay_appended;
   1416} ExternalSnapshotState;
   1417
   1418static void external_snapshot_prepare(BlkActionState *common,
   1419                                      Error **errp)
   1420{
   1421    int ret;
   1422    int flags = 0;
   1423    QDict *options = NULL;
   1424    Error *local_err = NULL;
   1425    /* Device and node name of the image to generate the snapshot from */
   1426    const char *device;
   1427    const char *node_name;
   1428    /* Reference to the new image (for 'blockdev-snapshot') */
   1429    const char *snapshot_ref;
   1430    /* File name of the new image (for 'blockdev-snapshot-sync') */
   1431    const char *new_image_file;
   1432    ExternalSnapshotState *state =
   1433                             DO_UPCAST(ExternalSnapshotState, common, common);
   1434    TransactionAction *action = common->action;
   1435    AioContext *aio_context;
   1436    uint64_t perm, shared;
   1437
   1438    /* 'blockdev-snapshot' and 'blockdev-snapshot-sync' have similar
   1439     * purpose but a different set of parameters */
   1440    switch (action->type) {
   1441    case TRANSACTION_ACTION_KIND_BLOCKDEV_SNAPSHOT:
   1442        {
   1443            BlockdevSnapshot *s = action->u.blockdev_snapshot.data;
   1444            device = s->node;
   1445            node_name = s->node;
   1446            new_image_file = NULL;
   1447            snapshot_ref = s->overlay;
   1448        }
   1449        break;
   1450    case TRANSACTION_ACTION_KIND_BLOCKDEV_SNAPSHOT_SYNC:
   1451        {
   1452            BlockdevSnapshotSync *s = action->u.blockdev_snapshot_sync.data;
   1453            device = s->has_device ? s->device : NULL;
   1454            node_name = s->has_node_name ? s->node_name : NULL;
   1455            new_image_file = s->snapshot_file;
   1456            snapshot_ref = NULL;
   1457        }
   1458        break;
   1459    default:
   1460        g_assert_not_reached();
   1461    }
   1462
   1463    /* start processing */
   1464    if (action_check_completion_mode(common, errp) < 0) {
   1465        return;
   1466    }
   1467
   1468    state->old_bs = bdrv_lookup_bs(device, node_name, errp);
   1469    if (!state->old_bs) {
   1470        return;
   1471    }
   1472
   1473    aio_context = bdrv_get_aio_context(state->old_bs);
   1474    aio_context_acquire(aio_context);
   1475
   1476    /* Paired with .clean() */
   1477    bdrv_drained_begin(state->old_bs);
   1478
   1479    if (!bdrv_is_inserted(state->old_bs)) {
   1480        error_setg(errp, QERR_DEVICE_HAS_NO_MEDIUM, device);
   1481        goto out;
   1482    }
   1483
   1484    if (bdrv_op_is_blocked(state->old_bs,
   1485                           BLOCK_OP_TYPE_EXTERNAL_SNAPSHOT, errp)) {
   1486        goto out;
   1487    }
   1488
   1489    if (!bdrv_is_read_only(state->old_bs)) {
   1490        if (bdrv_flush(state->old_bs)) {
   1491            error_setg(errp, QERR_IO_ERROR);
   1492            goto out;
   1493        }
   1494    }
   1495
   1496    if (action->type == TRANSACTION_ACTION_KIND_BLOCKDEV_SNAPSHOT_SYNC) {
   1497        BlockdevSnapshotSync *s = action->u.blockdev_snapshot_sync.data;
   1498        const char *format = s->has_format ? s->format : "qcow2";
   1499        enum NewImageMode mode;
   1500        const char *snapshot_node_name =
   1501            s->has_snapshot_node_name ? s->snapshot_node_name : NULL;
   1502
   1503        if (node_name && !snapshot_node_name) {
   1504            error_setg(errp, "New overlay node-name missing");
   1505            goto out;
   1506        }
   1507
   1508        if (snapshot_node_name &&
   1509            bdrv_lookup_bs(snapshot_node_name, snapshot_node_name, NULL)) {
   1510            error_setg(errp, "New overlay node-name already in use");
   1511            goto out;
   1512        }
   1513
   1514        flags = state->old_bs->open_flags;
   1515        flags &= ~(BDRV_O_SNAPSHOT | BDRV_O_COPY_ON_READ);
   1516        flags |= BDRV_O_NO_BACKING;
   1517
   1518        /* create new image w/backing file */
   1519        mode = s->has_mode ? s->mode : NEW_IMAGE_MODE_ABSOLUTE_PATHS;
   1520        if (mode != NEW_IMAGE_MODE_EXISTING) {
   1521            int64_t size = bdrv_getlength(state->old_bs);
   1522            if (size < 0) {
   1523                error_setg_errno(errp, -size, "bdrv_getlength failed");
   1524                goto out;
   1525            }
   1526            bdrv_refresh_filename(state->old_bs);
   1527            bdrv_img_create(new_image_file, format,
   1528                            state->old_bs->filename,
   1529                            state->old_bs->drv->format_name,
   1530                            NULL, size, flags, false, &local_err);
   1531            if (local_err) {
   1532                error_propagate(errp, local_err);
   1533                goto out;
   1534            }
   1535        }
   1536
   1537        options = qdict_new();
   1538        if (snapshot_node_name) {
   1539            qdict_put_str(options, "node-name", snapshot_node_name);
   1540        }
   1541        qdict_put_str(options, "driver", format);
   1542    }
   1543
   1544    state->new_bs = bdrv_open(new_image_file, snapshot_ref, options, flags,
   1545                              errp);
   1546    /* We will manually add the backing_hd field to the bs later */
   1547    if (!state->new_bs) {
   1548        goto out;
   1549    }
   1550
   1551    /*
   1552     * Allow attaching a backing file to an overlay that's already in use only
   1553     * if the parents don't assume that they are already seeing a valid image.
   1554     * (Specifically, allow it as a mirror target, which is write-only access.)
   1555     */
   1556    bdrv_get_cumulative_perm(state->new_bs, &perm, &shared);
   1557    if (perm & BLK_PERM_CONSISTENT_READ) {
   1558        error_setg(errp, "The overlay is already in use");
   1559        goto out;
   1560    }
   1561
   1562    if (state->new_bs->drv->is_filter) {
   1563        error_setg(errp, "Filters cannot be used as overlays");
   1564        goto out;
   1565    }
   1566
   1567    if (bdrv_cow_child(state->new_bs)) {
   1568        error_setg(errp, "The overlay already has a backing image");
   1569        goto out;
   1570    }
   1571
   1572    if (!state->new_bs->drv->supports_backing) {
   1573        error_setg(errp, "The overlay does not support backing images");
   1574        goto out;
   1575    }
   1576
   1577    ret = bdrv_append(state->new_bs, state->old_bs, errp);
   1578    if (ret < 0) {
   1579        goto out;
   1580    }
   1581    state->overlay_appended = true;
   1582
   1583out:
   1584    aio_context_release(aio_context);
   1585}
   1586
   1587static void external_snapshot_commit(BlkActionState *common)
   1588{
   1589    ExternalSnapshotState *state =
   1590                             DO_UPCAST(ExternalSnapshotState, common, common);
   1591    AioContext *aio_context;
   1592
   1593    aio_context = bdrv_get_aio_context(state->old_bs);
   1594    aio_context_acquire(aio_context);
   1595
   1596    /* We don't need (or want) to use the transactional
   1597     * bdrv_reopen_multiple() across all the entries at once, because we
   1598     * don't want to abort all of them if one of them fails the reopen */
   1599    if (!qatomic_read(&state->old_bs->copy_on_read)) {
   1600        bdrv_reopen_set_read_only(state->old_bs, true, NULL);
   1601    }
   1602
   1603    aio_context_release(aio_context);
   1604}
   1605
   1606static void external_snapshot_abort(BlkActionState *common)
   1607{
   1608    ExternalSnapshotState *state =
   1609                             DO_UPCAST(ExternalSnapshotState, common, common);
   1610    if (state->new_bs) {
   1611        if (state->overlay_appended) {
   1612            AioContext *aio_context;
   1613            AioContext *tmp_context;
   1614            int ret;
   1615
   1616            aio_context = bdrv_get_aio_context(state->old_bs);
   1617            aio_context_acquire(aio_context);
   1618
   1619            bdrv_ref(state->old_bs);   /* we can't let bdrv_set_backind_hd()
   1620                                          close state->old_bs; we need it */
   1621            bdrv_set_backing_hd(state->new_bs, NULL, &error_abort);
   1622
   1623            /*
   1624             * The call to bdrv_set_backing_hd() above returns state->old_bs to
   1625             * the main AioContext. As we're still going to be using it, return
   1626             * it to the AioContext it was before.
   1627             */
   1628            tmp_context = bdrv_get_aio_context(state->old_bs);
   1629            if (aio_context != tmp_context) {
   1630                aio_context_release(aio_context);
   1631                aio_context_acquire(tmp_context);
   1632
   1633                ret = bdrv_try_set_aio_context(state->old_bs,
   1634                                               aio_context, NULL);
   1635                assert(ret == 0);
   1636
   1637                aio_context_release(tmp_context);
   1638                aio_context_acquire(aio_context);
   1639            }
   1640
   1641            bdrv_replace_node(state->new_bs, state->old_bs, &error_abort);
   1642            bdrv_unref(state->old_bs); /* bdrv_replace_node() ref'ed old_bs */
   1643
   1644            aio_context_release(aio_context);
   1645        }
   1646    }
   1647}
   1648
   1649static void external_snapshot_clean(BlkActionState *common)
   1650{
   1651    ExternalSnapshotState *state =
   1652                             DO_UPCAST(ExternalSnapshotState, common, common);
   1653    AioContext *aio_context;
   1654
   1655    if (!state->old_bs) {
   1656        return;
   1657    }
   1658
   1659    aio_context = bdrv_get_aio_context(state->old_bs);
   1660    aio_context_acquire(aio_context);
   1661
   1662    bdrv_drained_end(state->old_bs);
   1663    bdrv_unref(state->new_bs);
   1664
   1665    aio_context_release(aio_context);
   1666}
   1667
   1668typedef struct DriveBackupState {
   1669    BlkActionState common;
   1670    BlockDriverState *bs;
   1671    BlockJob *job;
   1672} DriveBackupState;
   1673
   1674static BlockJob *do_backup_common(BackupCommon *backup,
   1675                                  BlockDriverState *bs,
   1676                                  BlockDriverState *target_bs,
   1677                                  AioContext *aio_context,
   1678                                  JobTxn *txn, Error **errp);
   1679
   1680static void drive_backup_prepare(BlkActionState *common, Error **errp)
   1681{
   1682    DriveBackupState *state = DO_UPCAST(DriveBackupState, common, common);
   1683    DriveBackup *backup;
   1684    BlockDriverState *bs;
   1685    BlockDriverState *target_bs;
   1686    BlockDriverState *source = NULL;
   1687    AioContext *aio_context;
   1688    AioContext *old_context;
   1689    QDict *options;
   1690    Error *local_err = NULL;
   1691    int flags;
   1692    int64_t size;
   1693    bool set_backing_hd = false;
   1694    int ret;
   1695
   1696    assert(common->action->type == TRANSACTION_ACTION_KIND_DRIVE_BACKUP);
   1697    backup = common->action->u.drive_backup.data;
   1698
   1699    if (!backup->has_mode) {
   1700        backup->mode = NEW_IMAGE_MODE_ABSOLUTE_PATHS;
   1701    }
   1702
   1703    bs = bdrv_lookup_bs(backup->device, backup->device, errp);
   1704    if (!bs) {
   1705        return;
   1706    }
   1707
   1708    if (!bs->drv) {
   1709        error_setg(errp, "Device has no medium");
   1710        return;
   1711    }
   1712
   1713    aio_context = bdrv_get_aio_context(bs);
   1714    aio_context_acquire(aio_context);
   1715
   1716    state->bs = bs;
   1717    /* Paired with .clean() */
   1718    bdrv_drained_begin(bs);
   1719
   1720    if (!backup->has_format) {
   1721        backup->format = backup->mode == NEW_IMAGE_MODE_EXISTING ?
   1722                         NULL : (char *) bs->drv->format_name;
   1723    }
   1724
   1725    /* Early check to avoid creating target */
   1726    if (bdrv_op_is_blocked(bs, BLOCK_OP_TYPE_BACKUP_SOURCE, errp)) {
   1727        goto out;
   1728    }
   1729
   1730    flags = bs->open_flags | BDRV_O_RDWR;
   1731
   1732    /*
   1733     * See if we have a backing HD we can use to create our new image
   1734     * on top of.
   1735     */
   1736    if (backup->sync == MIRROR_SYNC_MODE_TOP) {
   1737        /*
   1738         * Backup will not replace the source by the target, so none
   1739         * of the filters skipped here will be removed (in contrast to
   1740         * mirror).  Therefore, we can skip all of them when looking
   1741         * for the first COW relationship.
   1742         */
   1743        source = bdrv_cow_bs(bdrv_skip_filters(bs));
   1744        if (!source) {
   1745            backup->sync = MIRROR_SYNC_MODE_FULL;
   1746        }
   1747    }
   1748    if (backup->sync == MIRROR_SYNC_MODE_NONE) {
   1749        source = bs;
   1750        flags |= BDRV_O_NO_BACKING;
   1751        set_backing_hd = true;
   1752    }
   1753
   1754    size = bdrv_getlength(bs);
   1755    if (size < 0) {
   1756        error_setg_errno(errp, -size, "bdrv_getlength failed");
   1757        goto out;
   1758    }
   1759
   1760    if (backup->mode != NEW_IMAGE_MODE_EXISTING) {
   1761        assert(backup->format);
   1762        if (source) {
   1763            /* Implicit filters should not appear in the filename */
   1764            BlockDriverState *explicit_backing =
   1765                bdrv_skip_implicit_filters(source);
   1766
   1767            bdrv_refresh_filename(explicit_backing);
   1768            bdrv_img_create(backup->target, backup->format,
   1769                            explicit_backing->filename,
   1770                            explicit_backing->drv->format_name, NULL,
   1771                            size, flags, false, &local_err);
   1772        } else {
   1773            bdrv_img_create(backup->target, backup->format, NULL, NULL, NULL,
   1774                            size, flags, false, &local_err);
   1775        }
   1776    }
   1777
   1778    if (local_err) {
   1779        error_propagate(errp, local_err);
   1780        goto out;
   1781    }
   1782
   1783    options = qdict_new();
   1784    qdict_put_str(options, "discard", "unmap");
   1785    qdict_put_str(options, "detect-zeroes", "unmap");
   1786    if (backup->format) {
   1787        qdict_put_str(options, "driver", backup->format);
   1788    }
   1789
   1790    target_bs = bdrv_open(backup->target, NULL, options, flags, errp);
   1791    if (!target_bs) {
   1792        goto out;
   1793    }
   1794
   1795    /* Honor bdrv_try_set_aio_context() context acquisition requirements. */
   1796    old_context = bdrv_get_aio_context(target_bs);
   1797    aio_context_release(aio_context);
   1798    aio_context_acquire(old_context);
   1799
   1800    ret = bdrv_try_set_aio_context(target_bs, aio_context, errp);
   1801    if (ret < 0) {
   1802        bdrv_unref(target_bs);
   1803        aio_context_release(old_context);
   1804        return;
   1805    }
   1806
   1807    aio_context_release(old_context);
   1808    aio_context_acquire(aio_context);
   1809
   1810    if (set_backing_hd) {
   1811        if (bdrv_set_backing_hd(target_bs, source, errp) < 0) {
   1812            goto unref;
   1813        }
   1814    }
   1815
   1816    state->job = do_backup_common(qapi_DriveBackup_base(backup),
   1817                                  bs, target_bs, aio_context,
   1818                                  common->block_job_txn, errp);
   1819
   1820unref:
   1821    bdrv_unref(target_bs);
   1822out:
   1823    aio_context_release(aio_context);
   1824}
   1825
   1826static void drive_backup_commit(BlkActionState *common)
   1827{
   1828    DriveBackupState *state = DO_UPCAST(DriveBackupState, common, common);
   1829    AioContext *aio_context;
   1830
   1831    aio_context = bdrv_get_aio_context(state->bs);
   1832    aio_context_acquire(aio_context);
   1833
   1834    assert(state->job);
   1835    job_start(&state->job->job);
   1836
   1837    aio_context_release(aio_context);
   1838}
   1839
   1840static void drive_backup_abort(BlkActionState *common)
   1841{
   1842    DriveBackupState *state = DO_UPCAST(DriveBackupState, common, common);
   1843
   1844    if (state->job) {
   1845        AioContext *aio_context;
   1846
   1847        aio_context = bdrv_get_aio_context(state->bs);
   1848        aio_context_acquire(aio_context);
   1849
   1850        job_cancel_sync(&state->job->job, true);
   1851
   1852        aio_context_release(aio_context);
   1853    }
   1854}
   1855
   1856static void drive_backup_clean(BlkActionState *common)
   1857{
   1858    DriveBackupState *state = DO_UPCAST(DriveBackupState, common, common);
   1859    AioContext *aio_context;
   1860
   1861    if (!state->bs) {
   1862        return;
   1863    }
   1864
   1865    aio_context = bdrv_get_aio_context(state->bs);
   1866    aio_context_acquire(aio_context);
   1867
   1868    bdrv_drained_end(state->bs);
   1869
   1870    aio_context_release(aio_context);
   1871}
   1872
   1873typedef struct BlockdevBackupState {
   1874    BlkActionState common;
   1875    BlockDriverState *bs;
   1876    BlockJob *job;
   1877} BlockdevBackupState;
   1878
   1879static void blockdev_backup_prepare(BlkActionState *common, Error **errp)
   1880{
   1881    BlockdevBackupState *state = DO_UPCAST(BlockdevBackupState, common, common);
   1882    BlockdevBackup *backup;
   1883    BlockDriverState *bs;
   1884    BlockDriverState *target_bs;
   1885    AioContext *aio_context;
   1886    AioContext *old_context;
   1887    int ret;
   1888
   1889    assert(common->action->type == TRANSACTION_ACTION_KIND_BLOCKDEV_BACKUP);
   1890    backup = common->action->u.blockdev_backup.data;
   1891
   1892    bs = bdrv_lookup_bs(backup->device, backup->device, errp);
   1893    if (!bs) {
   1894        return;
   1895    }
   1896
   1897    target_bs = bdrv_lookup_bs(backup->target, backup->target, errp);
   1898    if (!target_bs) {
   1899        return;
   1900    }
   1901
   1902    /* Honor bdrv_try_set_aio_context() context acquisition requirements. */
   1903    aio_context = bdrv_get_aio_context(bs);
   1904    old_context = bdrv_get_aio_context(target_bs);
   1905    aio_context_acquire(old_context);
   1906
   1907    ret = bdrv_try_set_aio_context(target_bs, aio_context, errp);
   1908    if (ret < 0) {
   1909        aio_context_release(old_context);
   1910        return;
   1911    }
   1912
   1913    aio_context_release(old_context);
   1914    aio_context_acquire(aio_context);
   1915    state->bs = bs;
   1916
   1917    /* Paired with .clean() */
   1918    bdrv_drained_begin(state->bs);
   1919
   1920    state->job = do_backup_common(qapi_BlockdevBackup_base(backup),
   1921                                  bs, target_bs, aio_context,
   1922                                  common->block_job_txn, errp);
   1923
   1924    aio_context_release(aio_context);
   1925}
   1926
   1927static void blockdev_backup_commit(BlkActionState *common)
   1928{
   1929    BlockdevBackupState *state = DO_UPCAST(BlockdevBackupState, common, common);
   1930    AioContext *aio_context;
   1931
   1932    aio_context = bdrv_get_aio_context(state->bs);
   1933    aio_context_acquire(aio_context);
   1934
   1935    assert(state->job);
   1936    job_start(&state->job->job);
   1937
   1938    aio_context_release(aio_context);
   1939}
   1940
   1941static void blockdev_backup_abort(BlkActionState *common)
   1942{
   1943    BlockdevBackupState *state = DO_UPCAST(BlockdevBackupState, common, common);
   1944
   1945    if (state->job) {
   1946        AioContext *aio_context;
   1947
   1948        aio_context = bdrv_get_aio_context(state->bs);
   1949        aio_context_acquire(aio_context);
   1950
   1951        job_cancel_sync(&state->job->job, true);
   1952
   1953        aio_context_release(aio_context);
   1954    }
   1955}
   1956
   1957static void blockdev_backup_clean(BlkActionState *common)
   1958{
   1959    BlockdevBackupState *state = DO_UPCAST(BlockdevBackupState, common, common);
   1960    AioContext *aio_context;
   1961
   1962    if (!state->bs) {
   1963        return;
   1964    }
   1965
   1966    aio_context = bdrv_get_aio_context(state->bs);
   1967    aio_context_acquire(aio_context);
   1968
   1969    bdrv_drained_end(state->bs);
   1970
   1971    aio_context_release(aio_context);
   1972}
   1973
   1974typedef struct BlockDirtyBitmapState {
   1975    BlkActionState common;
   1976    BdrvDirtyBitmap *bitmap;
   1977    BlockDriverState *bs;
   1978    HBitmap *backup;
   1979    bool prepared;
   1980    bool was_enabled;
   1981} BlockDirtyBitmapState;
   1982
   1983static void block_dirty_bitmap_add_prepare(BlkActionState *common,
   1984                                           Error **errp)
   1985{
   1986    Error *local_err = NULL;
   1987    BlockDirtyBitmapAdd *action;
   1988    BlockDirtyBitmapState *state = DO_UPCAST(BlockDirtyBitmapState,
   1989                                             common, common);
   1990
   1991    if (action_check_completion_mode(common, errp) < 0) {
   1992        return;
   1993    }
   1994
   1995    action = common->action->u.block_dirty_bitmap_add.data;
   1996    /* AIO context taken and released within qmp_block_dirty_bitmap_add */
   1997    qmp_block_dirty_bitmap_add(action->node, action->name,
   1998                               action->has_granularity, action->granularity,
   1999                               action->has_persistent, action->persistent,
   2000                               action->has_disabled, action->disabled,
   2001                               &local_err);
   2002
   2003    if (!local_err) {
   2004        state->prepared = true;
   2005    } else {
   2006        error_propagate(errp, local_err);
   2007    }
   2008}
   2009
   2010static void block_dirty_bitmap_add_abort(BlkActionState *common)
   2011{
   2012    BlockDirtyBitmapAdd *action;
   2013    BlockDirtyBitmapState *state = DO_UPCAST(BlockDirtyBitmapState,
   2014                                             common, common);
   2015
   2016    action = common->action->u.block_dirty_bitmap_add.data;
   2017    /* Should not be able to fail: IF the bitmap was added via .prepare(),
   2018     * then the node reference and bitmap name must have been valid.
   2019     */
   2020    if (state->prepared) {
   2021        qmp_block_dirty_bitmap_remove(action->node, action->name, &error_abort);
   2022    }
   2023}
   2024
   2025static void block_dirty_bitmap_clear_prepare(BlkActionState *common,
   2026                                             Error **errp)
   2027{
   2028    BlockDirtyBitmapState *state = DO_UPCAST(BlockDirtyBitmapState,
   2029                                             common, common);
   2030    BlockDirtyBitmap *action;
   2031
   2032    if (action_check_completion_mode(common, errp) < 0) {
   2033        return;
   2034    }
   2035
   2036    action = common->action->u.block_dirty_bitmap_clear.data;
   2037    state->bitmap = block_dirty_bitmap_lookup(action->node,
   2038                                              action->name,
   2039                                              &state->bs,
   2040                                              errp);
   2041    if (!state->bitmap) {
   2042        return;
   2043    }
   2044
   2045    if (bdrv_dirty_bitmap_check(state->bitmap, BDRV_BITMAP_DEFAULT, errp)) {
   2046        return;
   2047    }
   2048
   2049    bdrv_clear_dirty_bitmap(state->bitmap, &state->backup);
   2050}
   2051
   2052static void block_dirty_bitmap_restore(BlkActionState *common)
   2053{
   2054    BlockDirtyBitmapState *state = DO_UPCAST(BlockDirtyBitmapState,
   2055                                             common, common);
   2056
   2057    if (state->backup) {
   2058        bdrv_restore_dirty_bitmap(state->bitmap, state->backup);
   2059    }
   2060}
   2061
   2062static void block_dirty_bitmap_free_backup(BlkActionState *common)
   2063{
   2064    BlockDirtyBitmapState *state = DO_UPCAST(BlockDirtyBitmapState,
   2065                                             common, common);
   2066
   2067    hbitmap_free(state->backup);
   2068}
   2069
   2070static void block_dirty_bitmap_enable_prepare(BlkActionState *common,
   2071                                              Error **errp)
   2072{
   2073    BlockDirtyBitmap *action;
   2074    BlockDirtyBitmapState *state = DO_UPCAST(BlockDirtyBitmapState,
   2075                                             common, common);
   2076
   2077    if (action_check_completion_mode(common, errp) < 0) {
   2078        return;
   2079    }
   2080
   2081    action = common->action->u.block_dirty_bitmap_enable.data;
   2082    state->bitmap = block_dirty_bitmap_lookup(action->node,
   2083                                              action->name,
   2084                                              NULL,
   2085                                              errp);
   2086    if (!state->bitmap) {
   2087        return;
   2088    }
   2089
   2090    if (bdrv_dirty_bitmap_check(state->bitmap, BDRV_BITMAP_ALLOW_RO, errp)) {
   2091        return;
   2092    }
   2093
   2094    state->was_enabled = bdrv_dirty_bitmap_enabled(state->bitmap);
   2095    bdrv_enable_dirty_bitmap(state->bitmap);
   2096}
   2097
   2098static void block_dirty_bitmap_enable_abort(BlkActionState *common)
   2099{
   2100    BlockDirtyBitmapState *state = DO_UPCAST(BlockDirtyBitmapState,
   2101                                             common, common);
   2102
   2103    if (!state->was_enabled) {
   2104        bdrv_disable_dirty_bitmap(state->bitmap);
   2105    }
   2106}
   2107
   2108static void block_dirty_bitmap_disable_prepare(BlkActionState *common,
   2109                                               Error **errp)
   2110{
   2111    BlockDirtyBitmap *action;
   2112    BlockDirtyBitmapState *state = DO_UPCAST(BlockDirtyBitmapState,
   2113                                             common, common);
   2114
   2115    if (action_check_completion_mode(common, errp) < 0) {
   2116        return;
   2117    }
   2118
   2119    action = common->action->u.block_dirty_bitmap_disable.data;
   2120    state->bitmap = block_dirty_bitmap_lookup(action->node,
   2121                                              action->name,
   2122                                              NULL,
   2123                                              errp);
   2124    if (!state->bitmap) {
   2125        return;
   2126    }
   2127
   2128    if (bdrv_dirty_bitmap_check(state->bitmap, BDRV_BITMAP_ALLOW_RO, errp)) {
   2129        return;
   2130    }
   2131
   2132    state->was_enabled = bdrv_dirty_bitmap_enabled(state->bitmap);
   2133    bdrv_disable_dirty_bitmap(state->bitmap);
   2134}
   2135
   2136static void block_dirty_bitmap_disable_abort(BlkActionState *common)
   2137{
   2138    BlockDirtyBitmapState *state = DO_UPCAST(BlockDirtyBitmapState,
   2139                                             common, common);
   2140
   2141    if (state->was_enabled) {
   2142        bdrv_enable_dirty_bitmap(state->bitmap);
   2143    }
   2144}
   2145
   2146static void block_dirty_bitmap_merge_prepare(BlkActionState *common,
   2147                                             Error **errp)
   2148{
   2149    BlockDirtyBitmapMerge *action;
   2150    BlockDirtyBitmapState *state = DO_UPCAST(BlockDirtyBitmapState,
   2151                                             common, common);
   2152
   2153    if (action_check_completion_mode(common, errp) < 0) {
   2154        return;
   2155    }
   2156
   2157    action = common->action->u.block_dirty_bitmap_merge.data;
   2158
   2159    state->bitmap = block_dirty_bitmap_merge(action->node, action->target,
   2160                                             action->bitmaps, &state->backup,
   2161                                             errp);
   2162}
   2163
   2164static void block_dirty_bitmap_remove_prepare(BlkActionState *common,
   2165                                              Error **errp)
   2166{
   2167    BlockDirtyBitmap *action;
   2168    BlockDirtyBitmapState *state = DO_UPCAST(BlockDirtyBitmapState,
   2169                                             common, common);
   2170
   2171    if (action_check_completion_mode(common, errp) < 0) {
   2172        return;
   2173    }
   2174
   2175    action = common->action->u.block_dirty_bitmap_remove.data;
   2176
   2177    state->bitmap = block_dirty_bitmap_remove(action->node, action->name,
   2178                                              false, &state->bs, errp);
   2179    if (state->bitmap) {
   2180        bdrv_dirty_bitmap_skip_store(state->bitmap, true);
   2181        bdrv_dirty_bitmap_set_busy(state->bitmap, true);
   2182    }
   2183}
   2184
   2185static void block_dirty_bitmap_remove_abort(BlkActionState *common)
   2186{
   2187    BlockDirtyBitmapState *state = DO_UPCAST(BlockDirtyBitmapState,
   2188                                             common, common);
   2189
   2190    if (state->bitmap) {
   2191        bdrv_dirty_bitmap_skip_store(state->bitmap, false);
   2192        bdrv_dirty_bitmap_set_busy(state->bitmap, false);
   2193    }
   2194}
   2195
   2196static void block_dirty_bitmap_remove_commit(BlkActionState *common)
   2197{
   2198    BlockDirtyBitmapState *state = DO_UPCAST(BlockDirtyBitmapState,
   2199                                             common, common);
   2200
   2201    bdrv_dirty_bitmap_set_busy(state->bitmap, false);
   2202    bdrv_release_dirty_bitmap(state->bitmap);
   2203}
   2204
   2205static void abort_prepare(BlkActionState *common, Error **errp)
   2206{
   2207    error_setg(errp, "Transaction aborted using Abort action");
   2208}
   2209
   2210static void abort_commit(BlkActionState *common)
   2211{
   2212    g_assert_not_reached(); /* this action never succeeds */
   2213}
   2214
   2215static const BlkActionOps actions[] = {
   2216    [TRANSACTION_ACTION_KIND_BLOCKDEV_SNAPSHOT] = {
   2217        .instance_size = sizeof(ExternalSnapshotState),
   2218        .prepare  = external_snapshot_prepare,
   2219        .commit   = external_snapshot_commit,
   2220        .abort = external_snapshot_abort,
   2221        .clean = external_snapshot_clean,
   2222    },
   2223    [TRANSACTION_ACTION_KIND_BLOCKDEV_SNAPSHOT_SYNC] = {
   2224        .instance_size = sizeof(ExternalSnapshotState),
   2225        .prepare  = external_snapshot_prepare,
   2226        .commit   = external_snapshot_commit,
   2227        .abort = external_snapshot_abort,
   2228        .clean = external_snapshot_clean,
   2229    },
   2230    [TRANSACTION_ACTION_KIND_DRIVE_BACKUP] = {
   2231        .instance_size = sizeof(DriveBackupState),
   2232        .prepare = drive_backup_prepare,
   2233        .commit = drive_backup_commit,
   2234        .abort = drive_backup_abort,
   2235        .clean = drive_backup_clean,
   2236    },
   2237    [TRANSACTION_ACTION_KIND_BLOCKDEV_BACKUP] = {
   2238        .instance_size = sizeof(BlockdevBackupState),
   2239        .prepare = blockdev_backup_prepare,
   2240        .commit = blockdev_backup_commit,
   2241        .abort = blockdev_backup_abort,
   2242        .clean = blockdev_backup_clean,
   2243    },
   2244    [TRANSACTION_ACTION_KIND_ABORT] = {
   2245        .instance_size = sizeof(BlkActionState),
   2246        .prepare = abort_prepare,
   2247        .commit = abort_commit,
   2248    },
   2249    [TRANSACTION_ACTION_KIND_BLOCKDEV_SNAPSHOT_INTERNAL_SYNC] = {
   2250        .instance_size = sizeof(InternalSnapshotState),
   2251        .prepare  = internal_snapshot_prepare,
   2252        .abort = internal_snapshot_abort,
   2253        .clean = internal_snapshot_clean,
   2254    },
   2255    [TRANSACTION_ACTION_KIND_BLOCK_DIRTY_BITMAP_ADD] = {
   2256        .instance_size = sizeof(BlockDirtyBitmapState),
   2257        .prepare = block_dirty_bitmap_add_prepare,
   2258        .abort = block_dirty_bitmap_add_abort,
   2259    },
   2260    [TRANSACTION_ACTION_KIND_BLOCK_DIRTY_BITMAP_CLEAR] = {
   2261        .instance_size = sizeof(BlockDirtyBitmapState),
   2262        .prepare = block_dirty_bitmap_clear_prepare,
   2263        .commit = block_dirty_bitmap_free_backup,
   2264        .abort = block_dirty_bitmap_restore,
   2265    },
   2266    [TRANSACTION_ACTION_KIND_BLOCK_DIRTY_BITMAP_ENABLE] = {
   2267        .instance_size = sizeof(BlockDirtyBitmapState),
   2268        .prepare = block_dirty_bitmap_enable_prepare,
   2269        .abort = block_dirty_bitmap_enable_abort,
   2270    },
   2271    [TRANSACTION_ACTION_KIND_BLOCK_DIRTY_BITMAP_DISABLE] = {
   2272        .instance_size = sizeof(BlockDirtyBitmapState),
   2273        .prepare = block_dirty_bitmap_disable_prepare,
   2274        .abort = block_dirty_bitmap_disable_abort,
   2275    },
   2276    [TRANSACTION_ACTION_KIND_BLOCK_DIRTY_BITMAP_MERGE] = {
   2277        .instance_size = sizeof(BlockDirtyBitmapState),
   2278        .prepare = block_dirty_bitmap_merge_prepare,
   2279        .commit = block_dirty_bitmap_free_backup,
   2280        .abort = block_dirty_bitmap_restore,
   2281    },
   2282    [TRANSACTION_ACTION_KIND_BLOCK_DIRTY_BITMAP_REMOVE] = {
   2283        .instance_size = sizeof(BlockDirtyBitmapState),
   2284        .prepare = block_dirty_bitmap_remove_prepare,
   2285        .commit = block_dirty_bitmap_remove_commit,
   2286        .abort = block_dirty_bitmap_remove_abort,
   2287    },
   2288    /* Where are transactions for MIRROR, COMMIT and STREAM?
   2289     * Although these blockjobs use transaction callbacks like the backup job,
   2290     * these jobs do not necessarily adhere to transaction semantics.
   2291     * These jobs may not fully undo all of their actions on abort, nor do they
   2292     * necessarily work in transactions with more than one job in them.
   2293     */
   2294};
   2295
   2296/**
   2297 * Allocate a TransactionProperties structure if necessary, and fill
   2298 * that structure with desired defaults if they are unset.
   2299 */
   2300static TransactionProperties *get_transaction_properties(
   2301    TransactionProperties *props)
   2302{
   2303    if (!props) {
   2304        props = g_new0(TransactionProperties, 1);
   2305    }
   2306
   2307    if (!props->has_completion_mode) {
   2308        props->has_completion_mode = true;
   2309        props->completion_mode = ACTION_COMPLETION_MODE_INDIVIDUAL;
   2310    }
   2311
   2312    return props;
   2313}
   2314
   2315/*
   2316 * 'Atomic' group operations.  The operations are performed as a set, and if
   2317 * any fail then we roll back all operations in the group.
   2318 */
   2319void qmp_transaction(TransactionActionList *dev_list,
   2320                     bool has_props,
   2321                     struct TransactionProperties *props,
   2322                     Error **errp)
   2323{
   2324    TransactionActionList *dev_entry = dev_list;
   2325    JobTxn *block_job_txn = NULL;
   2326    BlkActionState *state, *next;
   2327    Error *local_err = NULL;
   2328
   2329    QTAILQ_HEAD(, BlkActionState) snap_bdrv_states;
   2330    QTAILQ_INIT(&snap_bdrv_states);
   2331
   2332    /* Does this transaction get canceled as a group on failure?
   2333     * If not, we don't really need to make a JobTxn.
   2334     */
   2335    props = get_transaction_properties(props);
   2336    if (props->completion_mode != ACTION_COMPLETION_MODE_INDIVIDUAL) {
   2337        block_job_txn = job_txn_new();
   2338    }
   2339
   2340    /* drain all i/o before any operations */
   2341    bdrv_drain_all();
   2342
   2343    /* We don't do anything in this loop that commits us to the operations */
   2344    while (NULL != dev_entry) {
   2345        TransactionAction *dev_info = NULL;
   2346        const BlkActionOps *ops;
   2347
   2348        dev_info = dev_entry->value;
   2349        dev_entry = dev_entry->next;
   2350
   2351        assert(dev_info->type < ARRAY_SIZE(actions));
   2352
   2353        ops = &actions[dev_info->type];
   2354        assert(ops->instance_size > 0);
   2355
   2356        state = g_malloc0(ops->instance_size);
   2357        state->ops = ops;
   2358        state->action = dev_info;
   2359        state->block_job_txn = block_job_txn;
   2360        state->txn_props = props;
   2361        QTAILQ_INSERT_TAIL(&snap_bdrv_states, state, entry);
   2362
   2363        state->ops->prepare(state, &local_err);
   2364        if (local_err) {
   2365            error_propagate(errp, local_err);
   2366            goto delete_and_fail;
   2367        }
   2368    }
   2369
   2370    QTAILQ_FOREACH(state, &snap_bdrv_states, entry) {
   2371        if (state->ops->commit) {
   2372            state->ops->commit(state);
   2373        }
   2374    }
   2375
   2376    /* success */
   2377    goto exit;
   2378
   2379delete_and_fail:
   2380    /* failure, and it is all-or-none; roll back all operations */
   2381    QTAILQ_FOREACH_REVERSE(state, &snap_bdrv_states, entry) {
   2382        if (state->ops->abort) {
   2383            state->ops->abort(state);
   2384        }
   2385    }
   2386exit:
   2387    QTAILQ_FOREACH_SAFE(state, &snap_bdrv_states, entry, next) {
   2388        if (state->ops->clean) {
   2389            state->ops->clean(state);
   2390        }
   2391        g_free(state);
   2392    }
   2393    if (!has_props) {
   2394        qapi_free_TransactionProperties(props);
   2395    }
   2396    job_txn_unref(block_job_txn);
   2397}
   2398
   2399BlockDirtyBitmapSha256 *qmp_x_debug_block_dirty_bitmap_sha256(const char *node,
   2400                                                              const char *name,
   2401                                                              Error **errp)
   2402{
   2403    BdrvDirtyBitmap *bitmap;
   2404    BlockDriverState *bs;
   2405    BlockDirtyBitmapSha256 *ret = NULL;
   2406    char *sha256;
   2407
   2408    bitmap = block_dirty_bitmap_lookup(node, name, &bs, errp);
   2409    if (!bitmap || !bs) {
   2410        return NULL;
   2411    }
   2412
   2413    sha256 = bdrv_dirty_bitmap_sha256(bitmap, errp);
   2414    if (sha256 == NULL) {
   2415        return NULL;
   2416    }
   2417
   2418    ret = g_new(BlockDirtyBitmapSha256, 1);
   2419    ret->sha256 = sha256;
   2420
   2421    return ret;
   2422}
   2423
   2424void coroutine_fn qmp_block_resize(bool has_device, const char *device,
   2425                                   bool has_node_name, const char *node_name,
   2426                                   int64_t size, Error **errp)
   2427{
   2428    Error *local_err = NULL;
   2429    BlockBackend *blk;
   2430    BlockDriverState *bs;
   2431    AioContext *old_ctx;
   2432
   2433    bs = bdrv_lookup_bs(has_device ? device : NULL,
   2434                        has_node_name ? node_name : NULL,
   2435                        &local_err);
   2436    if (local_err) {
   2437        error_propagate(errp, local_err);
   2438        return;
   2439    }
   2440
   2441    if (size < 0) {
   2442        error_setg(errp, QERR_INVALID_PARAMETER_VALUE, "size", "a >0 size");
   2443        return;
   2444    }
   2445
   2446    if (bdrv_op_is_blocked(bs, BLOCK_OP_TYPE_RESIZE, NULL)) {
   2447        error_setg(errp, QERR_DEVICE_IN_USE, device);
   2448        return;
   2449    }
   2450
   2451    blk = blk_new_with_bs(bs, BLK_PERM_RESIZE, BLK_PERM_ALL, errp);
   2452    if (!blk) {
   2453        return;
   2454    }
   2455
   2456    bdrv_co_lock(bs);
   2457    bdrv_drained_begin(bs);
   2458    bdrv_co_unlock(bs);
   2459
   2460    old_ctx = bdrv_co_enter(bs);
   2461    blk_truncate(blk, size, false, PREALLOC_MODE_OFF, 0, errp);
   2462    bdrv_co_leave(bs, old_ctx);
   2463
   2464    bdrv_co_lock(bs);
   2465    bdrv_drained_end(bs);
   2466    blk_unref(blk);
   2467    bdrv_co_unlock(bs);
   2468}
   2469
   2470void qmp_block_stream(bool has_job_id, const char *job_id, const char *device,
   2471                      bool has_base, const char *base,
   2472                      bool has_base_node, const char *base_node,
   2473                      bool has_backing_file, const char *backing_file,
   2474                      bool has_bottom, const char *bottom,
   2475                      bool has_speed, int64_t speed,
   2476                      bool has_on_error, BlockdevOnError on_error,
   2477                      bool has_filter_node_name, const char *filter_node_name,
   2478                      bool has_auto_finalize, bool auto_finalize,
   2479                      bool has_auto_dismiss, bool auto_dismiss,
   2480                      Error **errp)
   2481{
   2482    BlockDriverState *bs, *iter, *iter_end;
   2483    BlockDriverState *base_bs = NULL;
   2484    BlockDriverState *bottom_bs = NULL;
   2485    AioContext *aio_context;
   2486    Error *local_err = NULL;
   2487    int job_flags = JOB_DEFAULT;
   2488
   2489    if (has_base && has_base_node) {
   2490        error_setg(errp, "'base' and 'base-node' cannot be specified "
   2491                   "at the same time");
   2492        return;
   2493    }
   2494
   2495    if (has_base && has_bottom) {
   2496        error_setg(errp, "'base' and 'bottom' cannot be specified "
   2497                   "at the same time");
   2498        return;
   2499    }
   2500
   2501    if (has_bottom && has_base_node) {
   2502        error_setg(errp, "'bottom' and 'base-node' cannot be specified "
   2503                   "at the same time");
   2504        return;
   2505    }
   2506
   2507    if (!has_on_error) {
   2508        on_error = BLOCKDEV_ON_ERROR_REPORT;
   2509    }
   2510
   2511    bs = bdrv_lookup_bs(device, device, errp);
   2512    if (!bs) {
   2513        return;
   2514    }
   2515
   2516    aio_context = bdrv_get_aio_context(bs);
   2517    aio_context_acquire(aio_context);
   2518
   2519    if (has_base) {
   2520        base_bs = bdrv_find_backing_image(bs, base);
   2521        if (base_bs == NULL) {
   2522            error_setg(errp, "Can't find '%s' in the backing chain", base);
   2523            goto out;
   2524        }
   2525        assert(bdrv_get_aio_context(base_bs) == aio_context);
   2526    }
   2527
   2528    if (has_base_node) {
   2529        base_bs = bdrv_lookup_bs(NULL, base_node, errp);
   2530        if (!base_bs) {
   2531            goto out;
   2532        }
   2533        if (bs == base_bs || !bdrv_chain_contains(bs, base_bs)) {
   2534            error_setg(errp, "Node '%s' is not a backing image of '%s'",
   2535                       base_node, device);
   2536            goto out;
   2537        }
   2538        assert(bdrv_get_aio_context(base_bs) == aio_context);
   2539        bdrv_refresh_filename(base_bs);
   2540    }
   2541
   2542    if (has_bottom) {
   2543        bottom_bs = bdrv_lookup_bs(NULL, bottom, errp);
   2544        if (!bottom_bs) {
   2545            goto out;
   2546        }
   2547        if (!bottom_bs->drv) {
   2548            error_setg(errp, "Node '%s' is not open", bottom);
   2549            goto out;
   2550        }
   2551        if (bottom_bs->drv->is_filter) {
   2552            error_setg(errp, "Node '%s' is a filter, use a non-filter node "
   2553                       "as 'bottom'", bottom);
   2554            goto out;
   2555        }
   2556        if (!bdrv_chain_contains(bs, bottom_bs)) {
   2557            error_setg(errp, "Node '%s' is not in a chain starting from '%s'",
   2558                       bottom, device);
   2559            goto out;
   2560        }
   2561        assert(bdrv_get_aio_context(bottom_bs) == aio_context);
   2562    }
   2563
   2564    /*
   2565     * Check for op blockers in the whole chain between bs and base (or bottom)
   2566     */
   2567    iter_end = has_bottom ? bdrv_filter_or_cow_bs(bottom_bs) : base_bs;
   2568    for (iter = bs; iter && iter != iter_end;
   2569         iter = bdrv_filter_or_cow_bs(iter))
   2570    {
   2571        if (bdrv_op_is_blocked(iter, BLOCK_OP_TYPE_STREAM, errp)) {
   2572            goto out;
   2573        }
   2574    }
   2575
   2576    /* if we are streaming the entire chain, the result will have no backing
   2577     * file, and specifying one is therefore an error */
   2578    if (base_bs == NULL && has_backing_file) {
   2579        error_setg(errp, "backing file specified, but streaming the "
   2580                         "entire chain");
   2581        goto out;
   2582    }
   2583
   2584    if (has_auto_finalize && !auto_finalize) {
   2585        job_flags |= JOB_MANUAL_FINALIZE;
   2586    }
   2587    if (has_auto_dismiss && !auto_dismiss) {
   2588        job_flags |= JOB_MANUAL_DISMISS;
   2589    }
   2590
   2591    stream_start(has_job_id ? job_id : NULL, bs, base_bs, backing_file,
   2592                 bottom_bs, job_flags, has_speed ? speed : 0, on_error,
   2593                 filter_node_name, &local_err);
   2594    if (local_err) {
   2595        error_propagate(errp, local_err);
   2596        goto out;
   2597    }
   2598
   2599    trace_qmp_block_stream(bs);
   2600
   2601out:
   2602    aio_context_release(aio_context);
   2603}
   2604
   2605void qmp_block_commit(bool has_job_id, const char *job_id, const char *device,
   2606                      bool has_base_node, const char *base_node,
   2607                      bool has_base, const char *base,
   2608                      bool has_top_node, const char *top_node,
   2609                      bool has_top, const char *top,
   2610                      bool has_backing_file, const char *backing_file,
   2611                      bool has_speed, int64_t speed,
   2612                      bool has_on_error, BlockdevOnError on_error,
   2613                      bool has_filter_node_name, const char *filter_node_name,
   2614                      bool has_auto_finalize, bool auto_finalize,
   2615                      bool has_auto_dismiss, bool auto_dismiss,
   2616                      Error **errp)
   2617{
   2618    BlockDriverState *bs;
   2619    BlockDriverState *iter;
   2620    BlockDriverState *base_bs, *top_bs;
   2621    AioContext *aio_context;
   2622    Error *local_err = NULL;
   2623    int job_flags = JOB_DEFAULT;
   2624    uint64_t top_perm, top_shared;
   2625
   2626    if (!has_speed) {
   2627        speed = 0;
   2628    }
   2629    if (!has_on_error) {
   2630        on_error = BLOCKDEV_ON_ERROR_REPORT;
   2631    }
   2632    if (!has_filter_node_name) {
   2633        filter_node_name = NULL;
   2634    }
   2635    if (has_auto_finalize && !auto_finalize) {
   2636        job_flags |= JOB_MANUAL_FINALIZE;
   2637    }
   2638    if (has_auto_dismiss && !auto_dismiss) {
   2639        job_flags |= JOB_MANUAL_DISMISS;
   2640    }
   2641
   2642    /* Important Note:
   2643     *  libvirt relies on the DeviceNotFound error class in order to probe for
   2644     *  live commit feature versions; for this to work, we must make sure to
   2645     *  perform the device lookup before any generic errors that may occur in a
   2646     *  scenario in which all optional arguments are omitted. */
   2647    bs = qmp_get_root_bs(device, &local_err);
   2648    if (!bs) {
   2649        bs = bdrv_lookup_bs(device, device, NULL);
   2650        if (!bs) {
   2651            error_free(local_err);
   2652            error_set(errp, ERROR_CLASS_DEVICE_NOT_FOUND,
   2653                      "Device '%s' not found", device);
   2654        } else {
   2655            error_propagate(errp, local_err);
   2656        }
   2657        return;
   2658    }
   2659
   2660    aio_context = bdrv_get_aio_context(bs);
   2661    aio_context_acquire(aio_context);
   2662
   2663    if (bdrv_op_is_blocked(bs, BLOCK_OP_TYPE_COMMIT_SOURCE, errp)) {
   2664        goto out;
   2665    }
   2666
   2667    /* default top_bs is the active layer */
   2668    top_bs = bs;
   2669
   2670    if (has_top_node && has_top) {
   2671        error_setg(errp, "'top-node' and 'top' are mutually exclusive");
   2672        goto out;
   2673    } else if (has_top_node) {
   2674        top_bs = bdrv_lookup_bs(NULL, top_node, errp);
   2675        if (top_bs == NULL) {
   2676            goto out;
   2677        }
   2678        if (!bdrv_chain_contains(bs, top_bs)) {
   2679            error_setg(errp, "'%s' is not in this backing file chain",
   2680                       top_node);
   2681            goto out;
   2682        }
   2683    } else if (has_top && top) {
   2684        /* This strcmp() is just a shortcut, there is no need to
   2685         * refresh @bs's filename.  If it mismatches,
   2686         * bdrv_find_backing_image() will do the refresh and may still
   2687         * return @bs. */
   2688        if (strcmp(bs->filename, top) != 0) {
   2689            top_bs = bdrv_find_backing_image(bs, top);
   2690        }
   2691    }
   2692
   2693    if (top_bs == NULL) {
   2694        error_setg(errp, "Top image file %s not found", top ? top : "NULL");
   2695        goto out;
   2696    }
   2697
   2698    assert(bdrv_get_aio_context(top_bs) == aio_context);
   2699
   2700    if (has_base_node && has_base) {
   2701        error_setg(errp, "'base-node' and 'base' are mutually exclusive");
   2702        goto out;
   2703    } else if (has_base_node) {
   2704        base_bs = bdrv_lookup_bs(NULL, base_node, errp);
   2705        if (base_bs == NULL) {
   2706            goto out;
   2707        }
   2708        if (!bdrv_chain_contains(top_bs, base_bs)) {
   2709            error_setg(errp, "'%s' is not in this backing file chain",
   2710                       base_node);
   2711            goto out;
   2712        }
   2713    } else if (has_base && base) {
   2714        base_bs = bdrv_find_backing_image(top_bs, base);
   2715        if (base_bs == NULL) {
   2716            error_setg(errp, "Can't find '%s' in the backing chain", base);
   2717            goto out;
   2718        }
   2719    } else {
   2720        base_bs = bdrv_find_base(top_bs);
   2721        if (base_bs == NULL) {
   2722            error_setg(errp, "There is no backimg image");
   2723            goto out;
   2724        }
   2725    }
   2726
   2727    assert(bdrv_get_aio_context(base_bs) == aio_context);
   2728
   2729    for (iter = top_bs; iter != bdrv_filter_or_cow_bs(base_bs);
   2730         iter = bdrv_filter_or_cow_bs(iter))
   2731    {
   2732        if (bdrv_op_is_blocked(iter, BLOCK_OP_TYPE_COMMIT_TARGET, errp)) {
   2733            goto out;
   2734        }
   2735    }
   2736
   2737    /* Do not allow attempts to commit an image into itself */
   2738    if (top_bs == base_bs) {
   2739        error_setg(errp, "cannot commit an image into itself");
   2740        goto out;
   2741    }
   2742
   2743    /*
   2744     * Active commit is required if and only if someone has taken a
   2745     * WRITE permission on the top node.  Historically, we have always
   2746     * used active commit for top nodes, so continue that practice
   2747     * lest we possibly break clients that rely on this behavior, e.g.
   2748     * to later attach this node to a writing parent.
   2749     * (Active commit is never really wrong.)
   2750     */
   2751    bdrv_get_cumulative_perm(top_bs, &top_perm, &top_shared);
   2752    if (top_perm & BLK_PERM_WRITE ||
   2753        bdrv_skip_filters(top_bs) == bdrv_skip_filters(bs))
   2754    {
   2755        if (has_backing_file) {
   2756            if (bdrv_skip_filters(top_bs) == bdrv_skip_filters(bs)) {
   2757                error_setg(errp, "'backing-file' specified,"
   2758                                 " but 'top' is the active layer");
   2759            } else {
   2760                error_setg(errp, "'backing-file' specified, but 'top' has a "
   2761                                 "writer on it");
   2762            }
   2763            goto out;
   2764        }
   2765        if (!has_job_id) {
   2766            /*
   2767             * Emulate here what block_job_create() does, because it
   2768             * is possible that @bs != @top_bs (the block job should
   2769             * be named after @bs, even if @top_bs is the actual
   2770             * source)
   2771             */
   2772            job_id = bdrv_get_device_name(bs);
   2773        }
   2774        commit_active_start(job_id, top_bs, base_bs, job_flags, speed, on_error,
   2775                            filter_node_name, NULL, NULL, false, &local_err);
   2776    } else {
   2777        BlockDriverState *overlay_bs = bdrv_find_overlay(bs, top_bs);
   2778        if (bdrv_op_is_blocked(overlay_bs, BLOCK_OP_TYPE_COMMIT_TARGET, errp)) {
   2779            goto out;
   2780        }
   2781        commit_start(has_job_id ? job_id : NULL, bs, base_bs, top_bs, job_flags,
   2782                     speed, on_error, has_backing_file ? backing_file : NULL,
   2783                     filter_node_name, &local_err);
   2784    }
   2785    if (local_err != NULL) {
   2786        error_propagate(errp, local_err);
   2787        goto out;
   2788    }
   2789
   2790out:
   2791    aio_context_release(aio_context);
   2792}
   2793
   2794/* Common QMP interface for drive-backup and blockdev-backup */
   2795static BlockJob *do_backup_common(BackupCommon *backup,
   2796                                  BlockDriverState *bs,
   2797                                  BlockDriverState *target_bs,
   2798                                  AioContext *aio_context,
   2799                                  JobTxn *txn, Error **errp)
   2800{
   2801    BlockJob *job = NULL;
   2802    BdrvDirtyBitmap *bmap = NULL;
   2803    BackupPerf perf = { .max_workers = 64 };
   2804    int job_flags = JOB_DEFAULT;
   2805
   2806    if (!backup->has_speed) {
   2807        backup->speed = 0;
   2808    }
   2809    if (!backup->has_on_source_error) {
   2810        backup->on_source_error = BLOCKDEV_ON_ERROR_REPORT;
   2811    }
   2812    if (!backup->has_on_target_error) {
   2813        backup->on_target_error = BLOCKDEV_ON_ERROR_REPORT;
   2814    }
   2815    if (!backup->has_job_id) {
   2816        backup->job_id = NULL;
   2817    }
   2818    if (!backup->has_auto_finalize) {
   2819        backup->auto_finalize = true;
   2820    }
   2821    if (!backup->has_auto_dismiss) {
   2822        backup->auto_dismiss = true;
   2823    }
   2824    if (!backup->has_compress) {
   2825        backup->compress = false;
   2826    }
   2827
   2828    if (backup->x_perf) {
   2829        if (backup->x_perf->has_use_copy_range) {
   2830            perf.use_copy_range = backup->x_perf->use_copy_range;
   2831        }
   2832        if (backup->x_perf->has_max_workers) {
   2833            perf.max_workers = backup->x_perf->max_workers;
   2834        }
   2835        if (backup->x_perf->has_max_chunk) {
   2836            perf.max_chunk = backup->x_perf->max_chunk;
   2837        }
   2838    }
   2839
   2840    if ((backup->sync == MIRROR_SYNC_MODE_BITMAP) ||
   2841        (backup->sync == MIRROR_SYNC_MODE_INCREMENTAL)) {
   2842        /* done before desugaring 'incremental' to print the right message */
   2843        if (!backup->has_bitmap) {
   2844            error_setg(errp, "must provide a valid bitmap name for "
   2845                       "'%s' sync mode", MirrorSyncMode_str(backup->sync));
   2846            return NULL;
   2847        }
   2848    }
   2849
   2850    if (backup->sync == MIRROR_SYNC_MODE_INCREMENTAL) {
   2851        if (backup->has_bitmap_mode &&
   2852            backup->bitmap_mode != BITMAP_SYNC_MODE_ON_SUCCESS) {
   2853            error_setg(errp, "Bitmap sync mode must be '%s' "
   2854                       "when using sync mode '%s'",
   2855                       BitmapSyncMode_str(BITMAP_SYNC_MODE_ON_SUCCESS),
   2856                       MirrorSyncMode_str(backup->sync));
   2857            return NULL;
   2858        }
   2859        backup->has_bitmap_mode = true;
   2860        backup->sync = MIRROR_SYNC_MODE_BITMAP;
   2861        backup->bitmap_mode = BITMAP_SYNC_MODE_ON_SUCCESS;
   2862    }
   2863
   2864    if (backup->has_bitmap) {
   2865        bmap = bdrv_find_dirty_bitmap(bs, backup->bitmap);
   2866        if (!bmap) {
   2867            error_setg(errp, "Bitmap '%s' could not be found", backup->bitmap);
   2868            return NULL;
   2869        }
   2870        if (!backup->has_bitmap_mode) {
   2871            error_setg(errp, "Bitmap sync mode must be given "
   2872                       "when providing a bitmap");
   2873            return NULL;
   2874        }
   2875        if (bdrv_dirty_bitmap_check(bmap, BDRV_BITMAP_ALLOW_RO, errp)) {
   2876            return NULL;
   2877        }
   2878
   2879        /* This does not produce a useful bitmap artifact: */
   2880        if (backup->sync == MIRROR_SYNC_MODE_NONE) {
   2881            error_setg(errp, "sync mode '%s' does not produce meaningful bitmap"
   2882                       " outputs", MirrorSyncMode_str(backup->sync));
   2883            return NULL;
   2884        }
   2885
   2886        /* If the bitmap isn't used for input or output, this is useless: */
   2887        if (backup->bitmap_mode == BITMAP_SYNC_MODE_NEVER &&
   2888            backup->sync != MIRROR_SYNC_MODE_BITMAP) {
   2889            error_setg(errp, "Bitmap sync mode '%s' has no meaningful effect"
   2890                       " when combined with sync mode '%s'",
   2891                       BitmapSyncMode_str(backup->bitmap_mode),
   2892                       MirrorSyncMode_str(backup->sync));
   2893            return NULL;
   2894        }
   2895    }
   2896
   2897    if (!backup->has_bitmap && backup->has_bitmap_mode) {
   2898        error_setg(errp, "Cannot specify bitmap sync mode without a bitmap");
   2899        return NULL;
   2900    }
   2901
   2902    if (!backup->auto_finalize) {
   2903        job_flags |= JOB_MANUAL_FINALIZE;
   2904    }
   2905    if (!backup->auto_dismiss) {
   2906        job_flags |= JOB_MANUAL_DISMISS;
   2907    }
   2908
   2909    job = backup_job_create(backup->job_id, bs, target_bs, backup->speed,
   2910                            backup->sync, bmap, backup->bitmap_mode,
   2911                            backup->compress,
   2912                            backup->filter_node_name,
   2913                            &perf,
   2914                            backup->on_source_error,
   2915                            backup->on_target_error,
   2916                            job_flags, NULL, NULL, txn, errp);
   2917    return job;
   2918}
   2919
   2920void qmp_drive_backup(DriveBackup *backup, Error **errp)
   2921{
   2922    TransactionAction action = {
   2923        .type = TRANSACTION_ACTION_KIND_DRIVE_BACKUP,
   2924        .u.drive_backup.data = backup,
   2925    };
   2926    blockdev_do_action(&action, errp);
   2927}
   2928
   2929BlockDeviceInfoList *qmp_query_named_block_nodes(bool has_flat,
   2930                                                 bool flat,
   2931                                                 Error **errp)
   2932{
   2933    bool return_flat = has_flat && flat;
   2934
   2935    return bdrv_named_nodes_list(return_flat, errp);
   2936}
   2937
   2938XDbgBlockGraph *qmp_x_debug_query_block_graph(Error **errp)
   2939{
   2940    return bdrv_get_xdbg_block_graph(errp);
   2941}
   2942
   2943void qmp_blockdev_backup(BlockdevBackup *backup, Error **errp)
   2944{
   2945    TransactionAction action = {
   2946        .type = TRANSACTION_ACTION_KIND_BLOCKDEV_BACKUP,
   2947        .u.blockdev_backup.data = backup,
   2948    };
   2949    blockdev_do_action(&action, errp);
   2950}
   2951
   2952/* Parameter check and block job starting for drive mirroring.
   2953 * Caller should hold @device and @target's aio context (must be the same).
   2954 **/
   2955static void blockdev_mirror_common(const char *job_id, BlockDriverState *bs,
   2956                                   BlockDriverState *target,
   2957                                   bool has_replaces, const char *replaces,
   2958                                   enum MirrorSyncMode sync,
   2959                                   BlockMirrorBackingMode backing_mode,
   2960                                   bool zero_target,
   2961                                   bool has_speed, int64_t speed,
   2962                                   bool has_granularity, uint32_t granularity,
   2963                                   bool has_buf_size, int64_t buf_size,
   2964                                   bool has_on_source_error,
   2965                                   BlockdevOnError on_source_error,
   2966                                   bool has_on_target_error,
   2967                                   BlockdevOnError on_target_error,
   2968                                   bool has_unmap, bool unmap,
   2969                                   bool has_filter_node_name,
   2970                                   const char *filter_node_name,
   2971                                   bool has_copy_mode, MirrorCopyMode copy_mode,
   2972                                   bool has_auto_finalize, bool auto_finalize,
   2973                                   bool has_auto_dismiss, bool auto_dismiss,
   2974                                   Error **errp)
   2975{
   2976    BlockDriverState *unfiltered_bs;
   2977    int job_flags = JOB_DEFAULT;
   2978
   2979    if (!has_speed) {
   2980        speed = 0;
   2981    }
   2982    if (!has_on_source_error) {
   2983        on_source_error = BLOCKDEV_ON_ERROR_REPORT;
   2984    }
   2985    if (!has_on_target_error) {
   2986        on_target_error = BLOCKDEV_ON_ERROR_REPORT;
   2987    }
   2988    if (!has_granularity) {
   2989        granularity = 0;
   2990    }
   2991    if (!has_buf_size) {
   2992        buf_size = 0;
   2993    }
   2994    if (!has_unmap) {
   2995        unmap = true;
   2996    }
   2997    if (!has_filter_node_name) {
   2998        filter_node_name = NULL;
   2999    }
   3000    if (!has_copy_mode) {
   3001        copy_mode = MIRROR_COPY_MODE_BACKGROUND;
   3002    }
   3003    if (has_auto_finalize && !auto_finalize) {
   3004        job_flags |= JOB_MANUAL_FINALIZE;
   3005    }
   3006    if (has_auto_dismiss && !auto_dismiss) {
   3007        job_flags |= JOB_MANUAL_DISMISS;
   3008    }
   3009
   3010    if (granularity != 0 && (granularity < 512 || granularity > 1048576 * 64)) {
   3011        error_setg(errp, QERR_INVALID_PARAMETER_VALUE, "granularity",
   3012                   "a value in range [512B, 64MB]");
   3013        return;
   3014    }
   3015    if (granularity & (granularity - 1)) {
   3016        error_setg(errp, QERR_INVALID_PARAMETER_VALUE, "granularity",
   3017                   "a power of 2");
   3018        return;
   3019    }
   3020
   3021    if (bdrv_op_is_blocked(bs, BLOCK_OP_TYPE_MIRROR_SOURCE, errp)) {
   3022        return;
   3023    }
   3024    if (bdrv_op_is_blocked(target, BLOCK_OP_TYPE_MIRROR_TARGET, errp)) {
   3025        return;
   3026    }
   3027
   3028    if (!bdrv_backing_chain_next(bs) && sync == MIRROR_SYNC_MODE_TOP) {
   3029        sync = MIRROR_SYNC_MODE_FULL;
   3030    }
   3031
   3032    if (!has_replaces) {
   3033        /* We want to mirror from @bs, but keep implicit filters on top */
   3034        unfiltered_bs = bdrv_skip_implicit_filters(bs);
   3035        if (unfiltered_bs != bs) {
   3036            replaces = unfiltered_bs->node_name;
   3037            has_replaces = true;
   3038        }
   3039    }
   3040
   3041    if (has_replaces) {
   3042        BlockDriverState *to_replace_bs;
   3043        AioContext *replace_aio_context;
   3044        int64_t bs_size, replace_size;
   3045
   3046        bs_size = bdrv_getlength(bs);
   3047        if (bs_size < 0) {
   3048            error_setg_errno(errp, -bs_size, "Failed to query device's size");
   3049            return;
   3050        }
   3051
   3052        to_replace_bs = check_to_replace_node(bs, replaces, errp);
   3053        if (!to_replace_bs) {
   3054            return;
   3055        }
   3056
   3057        replace_aio_context = bdrv_get_aio_context(to_replace_bs);
   3058        aio_context_acquire(replace_aio_context);
   3059        replace_size = bdrv_getlength(to_replace_bs);
   3060        aio_context_release(replace_aio_context);
   3061
   3062        if (replace_size < 0) {
   3063            error_setg_errno(errp, -replace_size,
   3064                             "Failed to query the replacement node's size");
   3065            return;
   3066        }
   3067        if (bs_size != replace_size) {
   3068            error_setg(errp, "cannot replace image with a mirror image of "
   3069                             "different size");
   3070            return;
   3071        }
   3072    }
   3073
   3074    /* pass the node name to replace to mirror start since it's loose coupling
   3075     * and will allow to check whether the node still exist at mirror completion
   3076     */
   3077    mirror_start(job_id, bs, target,
   3078                 has_replaces ? replaces : NULL, job_flags,
   3079                 speed, granularity, buf_size, sync, backing_mode, zero_target,
   3080                 on_source_error, on_target_error, unmap, filter_node_name,
   3081                 copy_mode, errp);
   3082}
   3083
   3084void qmp_drive_mirror(DriveMirror *arg, Error **errp)
   3085{
   3086    BlockDriverState *bs;
   3087    BlockDriverState *target_backing_bs, *target_bs;
   3088    AioContext *aio_context;
   3089    AioContext *old_context;
   3090    BlockMirrorBackingMode backing_mode;
   3091    Error *local_err = NULL;
   3092    QDict *options = NULL;
   3093    int flags;
   3094    int64_t size;
   3095    const char *format = arg->format;
   3096    bool zero_target;
   3097    int ret;
   3098
   3099    bs = qmp_get_root_bs(arg->device, errp);
   3100    if (!bs) {
   3101        return;
   3102    }
   3103
   3104    /* Early check to avoid creating target */
   3105    if (bdrv_op_is_blocked(bs, BLOCK_OP_TYPE_MIRROR_SOURCE, errp)) {
   3106        return;
   3107    }
   3108
   3109    aio_context = bdrv_get_aio_context(bs);
   3110    aio_context_acquire(aio_context);
   3111
   3112    if (!arg->has_mode) {
   3113        arg->mode = NEW_IMAGE_MODE_ABSOLUTE_PATHS;
   3114    }
   3115
   3116    if (!arg->has_format) {
   3117        format = (arg->mode == NEW_IMAGE_MODE_EXISTING
   3118                  ? NULL : bs->drv->format_name);
   3119    }
   3120
   3121    flags = bs->open_flags | BDRV_O_RDWR;
   3122    target_backing_bs = bdrv_cow_bs(bdrv_skip_filters(bs));
   3123    if (!target_backing_bs && arg->sync == MIRROR_SYNC_MODE_TOP) {
   3124        arg->sync = MIRROR_SYNC_MODE_FULL;
   3125    }
   3126    if (arg->sync == MIRROR_SYNC_MODE_NONE) {
   3127        target_backing_bs = bs;
   3128    }
   3129
   3130    size = bdrv_getlength(bs);
   3131    if (size < 0) {
   3132        error_setg_errno(errp, -size, "bdrv_getlength failed");
   3133        goto out;
   3134    }
   3135
   3136    if (arg->has_replaces) {
   3137        if (!arg->has_node_name) {
   3138            error_setg(errp, "a node-name must be provided when replacing a"
   3139                             " named node of the graph");
   3140            goto out;
   3141        }
   3142    }
   3143
   3144    if (arg->mode == NEW_IMAGE_MODE_ABSOLUTE_PATHS) {
   3145        backing_mode = MIRROR_SOURCE_BACKING_CHAIN;
   3146    } else {
   3147        backing_mode = MIRROR_OPEN_BACKING_CHAIN;
   3148    }
   3149
   3150    /* Don't open backing image in create() */
   3151    flags |= BDRV_O_NO_BACKING;
   3152
   3153    if ((arg->sync == MIRROR_SYNC_MODE_FULL || !target_backing_bs)
   3154        && arg->mode != NEW_IMAGE_MODE_EXISTING)
   3155    {
   3156        /* create new image w/o backing file */
   3157        assert(format);
   3158        bdrv_img_create(arg->target, format,
   3159                        NULL, NULL, NULL, size, flags, false, &local_err);
   3160    } else {
   3161        /* Implicit filters should not appear in the filename */
   3162        BlockDriverState *explicit_backing =
   3163            bdrv_skip_implicit_filters(target_backing_bs);
   3164
   3165        switch (arg->mode) {
   3166        case NEW_IMAGE_MODE_EXISTING:
   3167            break;
   3168        case NEW_IMAGE_MODE_ABSOLUTE_PATHS:
   3169            /* create new image with backing file */
   3170            bdrv_refresh_filename(explicit_backing);
   3171            bdrv_img_create(arg->target, format,
   3172                            explicit_backing->filename,
   3173                            explicit_backing->drv->format_name,
   3174                            NULL, size, flags, false, &local_err);
   3175            break;
   3176        default:
   3177            abort();
   3178        }
   3179    }
   3180
   3181    if (local_err) {
   3182        error_propagate(errp, local_err);
   3183        goto out;
   3184    }
   3185
   3186    options = qdict_new();
   3187    if (arg->has_node_name) {
   3188        qdict_put_str(options, "node-name", arg->node_name);
   3189    }
   3190    if (format) {
   3191        qdict_put_str(options, "driver", format);
   3192    }
   3193
   3194    /* Mirroring takes care of copy-on-write using the source's backing
   3195     * file.
   3196     */
   3197    target_bs = bdrv_open(arg->target, NULL, options, flags, errp);
   3198    if (!target_bs) {
   3199        goto out;
   3200    }
   3201
   3202    zero_target = (arg->sync == MIRROR_SYNC_MODE_FULL &&
   3203                   (arg->mode == NEW_IMAGE_MODE_EXISTING ||
   3204                    !bdrv_has_zero_init(target_bs)));
   3205
   3206
   3207    /* Honor bdrv_try_set_aio_context() context acquisition requirements. */
   3208    old_context = bdrv_get_aio_context(target_bs);
   3209    aio_context_release(aio_context);
   3210    aio_context_acquire(old_context);
   3211
   3212    ret = bdrv_try_set_aio_context(target_bs, aio_context, errp);
   3213    if (ret < 0) {
   3214        bdrv_unref(target_bs);
   3215        aio_context_release(old_context);
   3216        return;
   3217    }
   3218
   3219    aio_context_release(old_context);
   3220    aio_context_acquire(aio_context);
   3221
   3222    blockdev_mirror_common(arg->has_job_id ? arg->job_id : NULL, bs, target_bs,
   3223                           arg->has_replaces, arg->replaces, arg->sync,
   3224                           backing_mode, zero_target,
   3225                           arg->has_speed, arg->speed,
   3226                           arg->has_granularity, arg->granularity,
   3227                           arg->has_buf_size, arg->buf_size,
   3228                           arg->has_on_source_error, arg->on_source_error,
   3229                           arg->has_on_target_error, arg->on_target_error,
   3230                           arg->has_unmap, arg->unmap,
   3231                           false, NULL,
   3232                           arg->has_copy_mode, arg->copy_mode,
   3233                           arg->has_auto_finalize, arg->auto_finalize,
   3234                           arg->has_auto_dismiss, arg->auto_dismiss,
   3235                           errp);
   3236    bdrv_unref(target_bs);
   3237out:
   3238    aio_context_release(aio_context);
   3239}
   3240
   3241void qmp_blockdev_mirror(bool has_job_id, const char *job_id,
   3242                         const char *device, const char *target,
   3243                         bool has_replaces, const char *replaces,
   3244                         MirrorSyncMode sync,
   3245                         bool has_speed, int64_t speed,
   3246                         bool has_granularity, uint32_t granularity,
   3247                         bool has_buf_size, int64_t buf_size,
   3248                         bool has_on_source_error,
   3249                         BlockdevOnError on_source_error,
   3250                         bool has_on_target_error,
   3251                         BlockdevOnError on_target_error,
   3252                         bool has_filter_node_name,
   3253                         const char *filter_node_name,
   3254                         bool has_copy_mode, MirrorCopyMode copy_mode,
   3255                         bool has_auto_finalize, bool auto_finalize,
   3256                         bool has_auto_dismiss, bool auto_dismiss,
   3257                         Error **errp)
   3258{
   3259    BlockDriverState *bs;
   3260    BlockDriverState *target_bs;
   3261    AioContext *aio_context;
   3262    AioContext *old_context;
   3263    BlockMirrorBackingMode backing_mode = MIRROR_LEAVE_BACKING_CHAIN;
   3264    bool zero_target;
   3265    int ret;
   3266
   3267    bs = qmp_get_root_bs(device, errp);
   3268    if (!bs) {
   3269        return;
   3270    }
   3271
   3272    target_bs = bdrv_lookup_bs(target, target, errp);
   3273    if (!target_bs) {
   3274        return;
   3275    }
   3276
   3277    zero_target = (sync == MIRROR_SYNC_MODE_FULL);
   3278
   3279    /* Honor bdrv_try_set_aio_context() context acquisition requirements. */
   3280    old_context = bdrv_get_aio_context(target_bs);
   3281    aio_context = bdrv_get_aio_context(bs);
   3282    aio_context_acquire(old_context);
   3283
   3284    ret = bdrv_try_set_aio_context(target_bs, aio_context, errp);
   3285
   3286    aio_context_release(old_context);
   3287    aio_context_acquire(aio_context);
   3288
   3289    if (ret < 0) {
   3290        goto out;
   3291    }
   3292
   3293    blockdev_mirror_common(has_job_id ? job_id : NULL, bs, target_bs,
   3294                           has_replaces, replaces, sync, backing_mode,
   3295                           zero_target, has_speed, speed,
   3296                           has_granularity, granularity,
   3297                           has_buf_size, buf_size,
   3298                           has_on_source_error, on_source_error,
   3299                           has_on_target_error, on_target_error,
   3300                           true, true,
   3301                           has_filter_node_name, filter_node_name,
   3302                           has_copy_mode, copy_mode,
   3303                           has_auto_finalize, auto_finalize,
   3304                           has_auto_dismiss, auto_dismiss,
   3305                           errp);
   3306out:
   3307    aio_context_release(aio_context);
   3308}
   3309
   3310/* Get a block job using its ID and acquire its AioContext */
   3311static BlockJob *find_block_job(const char *id, AioContext **aio_context,
   3312                                Error **errp)
   3313{
   3314    BlockJob *job;
   3315
   3316    assert(id != NULL);
   3317
   3318    *aio_context = NULL;
   3319
   3320    job = block_job_get(id);
   3321
   3322    if (!job) {
   3323        error_set(errp, ERROR_CLASS_DEVICE_NOT_ACTIVE,
   3324                  "Block job '%s' not found", id);
   3325        return NULL;
   3326    }
   3327
   3328    *aio_context = blk_get_aio_context(job->blk);
   3329    aio_context_acquire(*aio_context);
   3330
   3331    return job;
   3332}
   3333
   3334void qmp_block_job_set_speed(const char *device, int64_t speed, Error **errp)
   3335{
   3336    AioContext *aio_context;
   3337    BlockJob *job = find_block_job(device, &aio_context, errp);
   3338
   3339    if (!job) {
   3340        return;
   3341    }
   3342
   3343    block_job_set_speed(job, speed, errp);
   3344    aio_context_release(aio_context);
   3345}
   3346
   3347void qmp_block_job_cancel(const char *device,
   3348                          bool has_force, bool force, Error **errp)
   3349{
   3350    AioContext *aio_context;
   3351    BlockJob *job = find_block_job(device, &aio_context, errp);
   3352
   3353    if (!job) {
   3354        return;
   3355    }
   3356
   3357    if (!has_force) {
   3358        force = false;
   3359    }
   3360
   3361    if (job_user_paused(&job->job) && !force) {
   3362        error_setg(errp, "The block job for device '%s' is currently paused",
   3363                   device);
   3364        goto out;
   3365    }
   3366
   3367    trace_qmp_block_job_cancel(job);
   3368    job_user_cancel(&job->job, force, errp);
   3369out:
   3370    aio_context_release(aio_context);
   3371}
   3372
   3373void qmp_block_job_pause(const char *device, Error **errp)
   3374{
   3375    AioContext *aio_context;
   3376    BlockJob *job = find_block_job(device, &aio_context, errp);
   3377
   3378    if (!job) {
   3379        return;
   3380    }
   3381
   3382    trace_qmp_block_job_pause(job);
   3383    job_user_pause(&job->job, errp);
   3384    aio_context_release(aio_context);
   3385}
   3386
   3387void qmp_block_job_resume(const char *device, Error **errp)
   3388{
   3389    AioContext *aio_context;
   3390    BlockJob *job = find_block_job(device, &aio_context, errp);
   3391
   3392    if (!job) {
   3393        return;
   3394    }
   3395
   3396    trace_qmp_block_job_resume(job);
   3397    job_user_resume(&job->job, errp);
   3398    aio_context_release(aio_context);
   3399}
   3400
   3401void qmp_block_job_complete(const char *device, Error **errp)
   3402{
   3403    AioContext *aio_context;
   3404    BlockJob *job = find_block_job(device, &aio_context, errp);
   3405
   3406    if (!job) {
   3407        return;
   3408    }
   3409
   3410    trace_qmp_block_job_complete(job);
   3411    job_complete(&job->job, errp);
   3412    aio_context_release(aio_context);
   3413}
   3414
   3415void qmp_block_job_finalize(const char *id, Error **errp)
   3416{
   3417    AioContext *aio_context;
   3418    BlockJob *job = find_block_job(id, &aio_context, errp);
   3419
   3420    if (!job) {
   3421        return;
   3422    }
   3423
   3424    trace_qmp_block_job_finalize(job);
   3425    job_ref(&job->job);
   3426    job_finalize(&job->job, errp);
   3427
   3428    /*
   3429     * Job's context might have changed via job_finalize (and job_txn_apply
   3430     * automatically acquires the new one), so make sure we release the correct
   3431     * one.
   3432     */
   3433    aio_context = blk_get_aio_context(job->blk);
   3434    job_unref(&job->job);
   3435    aio_context_release(aio_context);
   3436}
   3437
   3438void qmp_block_job_dismiss(const char *id, Error **errp)
   3439{
   3440    AioContext *aio_context;
   3441    BlockJob *bjob = find_block_job(id, &aio_context, errp);
   3442    Job *job;
   3443
   3444    if (!bjob) {
   3445        return;
   3446    }
   3447
   3448    trace_qmp_block_job_dismiss(bjob);
   3449    job = &bjob->job;
   3450    job_dismiss(&job, errp);
   3451    aio_context_release(aio_context);
   3452}
   3453
   3454void qmp_change_backing_file(const char *device,
   3455                             const char *image_node_name,
   3456                             const char *backing_file,
   3457                             Error **errp)
   3458{
   3459    BlockDriverState *bs = NULL;
   3460    AioContext *aio_context;
   3461    BlockDriverState *image_bs = NULL;
   3462    Error *local_err = NULL;
   3463    bool ro;
   3464    int ret;
   3465
   3466    bs = qmp_get_root_bs(device, errp);
   3467    if (!bs) {
   3468        return;
   3469    }
   3470
   3471    aio_context = bdrv_get_aio_context(bs);
   3472    aio_context_acquire(aio_context);
   3473
   3474    image_bs = bdrv_lookup_bs(NULL, image_node_name, &local_err);
   3475    if (local_err) {
   3476        error_propagate(errp, local_err);
   3477        goto out;
   3478    }
   3479
   3480    if (!image_bs) {
   3481        error_setg(errp, "image file not found");
   3482        goto out;
   3483    }
   3484
   3485    if (bdrv_find_base(image_bs) == image_bs) {
   3486        error_setg(errp, "not allowing backing file change on an image "
   3487                         "without a backing file");
   3488        goto out;
   3489    }
   3490
   3491    /* even though we are not necessarily operating on bs, we need it to
   3492     * determine if block ops are currently prohibited on the chain */
   3493    if (bdrv_op_is_blocked(bs, BLOCK_OP_TYPE_CHANGE, errp)) {
   3494        goto out;
   3495    }
   3496
   3497    /* final sanity check */
   3498    if (!bdrv_chain_contains(bs, image_bs)) {
   3499        error_setg(errp, "'%s' and image file are not in the same chain",
   3500                   device);
   3501        goto out;
   3502    }
   3503
   3504    /* if not r/w, reopen to make r/w */
   3505    ro = bdrv_is_read_only(image_bs);
   3506
   3507    if (ro) {
   3508        if (bdrv_reopen_set_read_only(image_bs, false, errp) != 0) {
   3509            goto out;
   3510        }
   3511    }
   3512
   3513    ret = bdrv_change_backing_file(image_bs, backing_file,
   3514                                   image_bs->drv ? image_bs->drv->format_name : "",
   3515                                   false);
   3516
   3517    if (ret < 0) {
   3518        error_setg_errno(errp, -ret, "Could not change backing file to '%s'",
   3519                         backing_file);
   3520        /* don't exit here, so we can try to restore open flags if
   3521         * appropriate */
   3522    }
   3523
   3524    if (ro) {
   3525        bdrv_reopen_set_read_only(image_bs, true, errp);
   3526    }
   3527
   3528out:
   3529    aio_context_release(aio_context);
   3530}
   3531
   3532void qmp_blockdev_add(BlockdevOptions *options, Error **errp)
   3533{
   3534    BlockDriverState *bs;
   3535    QObject *obj;
   3536    Visitor *v = qobject_output_visitor_new(&obj);
   3537    QDict *qdict;
   3538
   3539    visit_type_BlockdevOptions(v, NULL, &options, &error_abort);
   3540    visit_complete(v, &obj);
   3541    qdict = qobject_to(QDict, obj);
   3542
   3543    qdict_flatten(qdict);
   3544
   3545    if (!qdict_get_try_str(qdict, "node-name")) {
   3546        error_setg(errp, "'node-name' must be specified for the root node");
   3547        goto fail;
   3548    }
   3549
   3550    bs = bds_tree_init(qdict, errp);
   3551    if (!bs) {
   3552        goto fail;
   3553    }
   3554
   3555    bdrv_set_monitor_owned(bs);
   3556
   3557fail:
   3558    visit_free(v);
   3559}
   3560
   3561void qmp_blockdev_reopen(BlockdevOptionsList *reopen_list, Error **errp)
   3562{
   3563    BlockReopenQueue *queue = NULL;
   3564    GSList *drained = NULL;
   3565
   3566    /* Add each one of the BDS that we want to reopen to the queue */
   3567    for (; reopen_list != NULL; reopen_list = reopen_list->next) {
   3568        BlockdevOptions *options = reopen_list->value;
   3569        BlockDriverState *bs;
   3570        AioContext *ctx;
   3571        QObject *obj;
   3572        Visitor *v;
   3573        QDict *qdict;
   3574
   3575        /* Check for the selected node name */
   3576        if (!options->has_node_name) {
   3577            error_setg(errp, "node-name not specified");
   3578            goto fail;
   3579        }
   3580
   3581        bs = bdrv_find_node(options->node_name);
   3582        if (!bs) {
   3583            error_setg(errp, "Failed to find node with node-name='%s'",
   3584                       options->node_name);
   3585            goto fail;
   3586        }
   3587
   3588        /* Put all options in a QDict and flatten it */
   3589        v = qobject_output_visitor_new(&obj);
   3590        visit_type_BlockdevOptions(v, NULL, &options, &error_abort);
   3591        visit_complete(v, &obj);
   3592        visit_free(v);
   3593
   3594        qdict = qobject_to(QDict, obj);
   3595
   3596        qdict_flatten(qdict);
   3597
   3598        ctx = bdrv_get_aio_context(bs);
   3599        aio_context_acquire(ctx);
   3600
   3601        bdrv_subtree_drained_begin(bs);
   3602        queue = bdrv_reopen_queue(queue, bs, qdict, false);
   3603        drained = g_slist_prepend(drained, bs);
   3604
   3605        aio_context_release(ctx);
   3606    }
   3607
   3608    /* Perform the reopen operation */
   3609    bdrv_reopen_multiple(queue, errp);
   3610    queue = NULL;
   3611
   3612fail:
   3613    bdrv_reopen_queue_free(queue);
   3614    g_slist_free_full(drained, (GDestroyNotify) bdrv_subtree_drained_end);
   3615}
   3616
   3617void qmp_blockdev_del(const char *node_name, Error **errp)
   3618{
   3619    AioContext *aio_context;
   3620    BlockDriverState *bs;
   3621
   3622    bs = bdrv_find_node(node_name);
   3623    if (!bs) {
   3624        error_setg(errp, "Failed to find node with node-name='%s'", node_name);
   3625        return;
   3626    }
   3627    if (bdrv_has_blk(bs)) {
   3628        error_setg(errp, "Node %s is in use", node_name);
   3629        return;
   3630    }
   3631    aio_context = bdrv_get_aio_context(bs);
   3632    aio_context_acquire(aio_context);
   3633
   3634    if (bdrv_op_is_blocked(bs, BLOCK_OP_TYPE_DRIVE_DEL, errp)) {
   3635        goto out;
   3636    }
   3637
   3638    if (!QTAILQ_IN_USE(bs, monitor_list)) {
   3639        error_setg(errp, "Node %s is not owned by the monitor",
   3640                   bs->node_name);
   3641        goto out;
   3642    }
   3643
   3644    if (bs->refcnt > 1) {
   3645        error_setg(errp, "Block device %s is in use",
   3646                   bdrv_get_device_or_node_name(bs));
   3647        goto out;
   3648    }
   3649
   3650    QTAILQ_REMOVE(&monitor_bdrv_states, bs, monitor_list);
   3651    bdrv_unref(bs);
   3652
   3653out:
   3654    aio_context_release(aio_context);
   3655}
   3656
   3657static BdrvChild *bdrv_find_child(BlockDriverState *parent_bs,
   3658                                  const char *child_name)
   3659{
   3660    BdrvChild *child;
   3661
   3662    QLIST_FOREACH(child, &parent_bs->children, next) {
   3663        if (strcmp(child->name, child_name) == 0) {
   3664            return child;
   3665        }
   3666    }
   3667
   3668    return NULL;
   3669}
   3670
   3671void qmp_x_blockdev_change(const char *parent, bool has_child,
   3672                           const char *child, bool has_node,
   3673                           const char *node, Error **errp)
   3674{
   3675    BlockDriverState *parent_bs, *new_bs = NULL;
   3676    BdrvChild *p_child;
   3677
   3678    parent_bs = bdrv_lookup_bs(parent, parent, errp);
   3679    if (!parent_bs) {
   3680        return;
   3681    }
   3682
   3683    if (has_child == has_node) {
   3684        if (has_child) {
   3685            error_setg(errp, "The parameters child and node are in conflict");
   3686        } else {
   3687            error_setg(errp, "Either child or node must be specified");
   3688        }
   3689        return;
   3690    }
   3691
   3692    if (has_child) {
   3693        p_child = bdrv_find_child(parent_bs, child);
   3694        if (!p_child) {
   3695            error_setg(errp, "Node '%s' does not have child '%s'",
   3696                       parent, child);
   3697            return;
   3698        }
   3699        bdrv_del_child(parent_bs, p_child, errp);
   3700    }
   3701
   3702    if (has_node) {
   3703        new_bs = bdrv_find_node(node);
   3704        if (!new_bs) {
   3705            error_setg(errp, "Node '%s' not found", node);
   3706            return;
   3707        }
   3708        bdrv_add_child(parent_bs, new_bs, errp);
   3709    }
   3710}
   3711
   3712BlockJobInfoList *qmp_query_block_jobs(Error **errp)
   3713{
   3714    BlockJobInfoList *head = NULL, **tail = &head;
   3715    BlockJob *job;
   3716
   3717    for (job = block_job_next(NULL); job; job = block_job_next(job)) {
   3718        BlockJobInfo *value;
   3719        AioContext *aio_context;
   3720
   3721        if (block_job_is_internal(job)) {
   3722            continue;
   3723        }
   3724        aio_context = blk_get_aio_context(job->blk);
   3725        aio_context_acquire(aio_context);
   3726        value = block_job_query(job, errp);
   3727        aio_context_release(aio_context);
   3728        if (!value) {
   3729            qapi_free_BlockJobInfoList(head);
   3730            return NULL;
   3731        }
   3732        QAPI_LIST_APPEND(tail, value);
   3733    }
   3734
   3735    return head;
   3736}
   3737
   3738void qmp_x_blockdev_set_iothread(const char *node_name, StrOrNull *iothread,
   3739                                 bool has_force, bool force, Error **errp)
   3740{
   3741    AioContext *old_context;
   3742    AioContext *new_context;
   3743    BlockDriverState *bs;
   3744
   3745    bs = bdrv_find_node(node_name);
   3746    if (!bs) {
   3747        error_setg(errp, "Failed to find node with node-name='%s'", node_name);
   3748        return;
   3749    }
   3750
   3751    /* Protects against accidents. */
   3752    if (!(has_force && force) && bdrv_has_blk(bs)) {
   3753        error_setg(errp, "Node %s is associated with a BlockBackend and could "
   3754                         "be in use (use force=true to override this check)",
   3755                         node_name);
   3756        return;
   3757    }
   3758
   3759    if (iothread->type == QTYPE_QSTRING) {
   3760        IOThread *obj = iothread_by_id(iothread->u.s);
   3761        if (!obj) {
   3762            error_setg(errp, "Cannot find iothread %s", iothread->u.s);
   3763            return;
   3764        }
   3765
   3766        new_context = iothread_get_aio_context(obj);
   3767    } else {
   3768        new_context = qemu_get_aio_context();
   3769    }
   3770
   3771    old_context = bdrv_get_aio_context(bs);
   3772    aio_context_acquire(old_context);
   3773
   3774    bdrv_try_set_aio_context(bs, new_context, errp);
   3775
   3776    aio_context_release(old_context);
   3777}
   3778
   3779QemuOptsList qemu_common_drive_opts = {
   3780    .name = "drive",
   3781    .head = QTAILQ_HEAD_INITIALIZER(qemu_common_drive_opts.head),
   3782    .desc = {
   3783        {
   3784            .name = "snapshot",
   3785            .type = QEMU_OPT_BOOL,
   3786            .help = "enable/disable snapshot mode",
   3787        },{
   3788            .name = "aio",
   3789            .type = QEMU_OPT_STRING,
   3790            .help = "host AIO implementation (threads, native, io_uring)",
   3791        },{
   3792            .name = BDRV_OPT_CACHE_WB,
   3793            .type = QEMU_OPT_BOOL,
   3794            .help = "Enable writeback mode",
   3795        },{
   3796            .name = "format",
   3797            .type = QEMU_OPT_STRING,
   3798            .help = "disk format (raw, qcow2, ...)",
   3799        },{
   3800            .name = "rerror",
   3801            .type = QEMU_OPT_STRING,
   3802            .help = "read error action",
   3803        },{
   3804            .name = "werror",
   3805            .type = QEMU_OPT_STRING,
   3806            .help = "write error action",
   3807        },{
   3808            .name = BDRV_OPT_READ_ONLY,
   3809            .type = QEMU_OPT_BOOL,
   3810            .help = "open drive file as read-only",
   3811        },
   3812
   3813        THROTTLE_OPTS,
   3814
   3815        {
   3816            .name = "throttling.group",
   3817            .type = QEMU_OPT_STRING,
   3818            .help = "name of the block throttling group",
   3819        },{
   3820            .name = "copy-on-read",
   3821            .type = QEMU_OPT_BOOL,
   3822            .help = "copy read data from backing file into image file",
   3823        },{
   3824            .name = "detect-zeroes",
   3825            .type = QEMU_OPT_STRING,
   3826            .help = "try to optimize zero writes (off, on, unmap)",
   3827        },{
   3828            .name = "stats-account-invalid",
   3829            .type = QEMU_OPT_BOOL,
   3830            .help = "whether to account for invalid I/O operations "
   3831                    "in the statistics",
   3832        },{
   3833            .name = "stats-account-failed",
   3834            .type = QEMU_OPT_BOOL,
   3835            .help = "whether to account for failed I/O operations "
   3836                    "in the statistics",
   3837        },
   3838        { /* end of list */ }
   3839    },
   3840};
   3841
   3842QemuOptsList qemu_drive_opts = {
   3843    .name = "drive",
   3844    .head = QTAILQ_HEAD_INITIALIZER(qemu_drive_opts.head),
   3845    .desc = {
   3846        /*
   3847         * no elements => accept any params
   3848         * validation will happen later
   3849         */
   3850        { /* end of list */ }
   3851    },
   3852};