Jeff Cody | 747ff60 | 2012-09-27 13:29:13 -0400 | [diff] [blame] | 1 | /* |
| 2 | * Live block commit |
| 3 | * |
| 4 | * Copyright Red Hat, Inc. 2012 |
| 5 | * |
| 6 | * Authors: |
| 7 | * Jeff Cody <jcody@redhat.com> |
| 8 | * Based on stream.c by Stefan Hajnoczi |
| 9 | * |
| 10 | * This work is licensed under the terms of the GNU LGPL, version 2 or later. |
| 11 | * See the COPYING.LIB file in the top-level directory. |
| 12 | * |
| 13 | */ |
| 14 | |
Peter Maydell | 80c71a2 | 2016-01-18 18:01:42 +0000 | [diff] [blame] | 15 | #include "qemu/osdep.h" |
Kevin Wolf | dcbf37c | 2017-03-09 11:49:16 +0100 | [diff] [blame] | 16 | #include "qemu/cutils.h" |
Jeff Cody | 747ff60 | 2012-09-27 13:29:13 -0400 | [diff] [blame] | 17 | #include "trace.h" |
Paolo Bonzini | 737e150 | 2012-12-17 18:19:44 +0100 | [diff] [blame] | 18 | #include "block/block_int.h" |
John Snow | c87621e | 2016-10-27 12:07:00 -0400 | [diff] [blame] | 19 | #include "block/blockjob_int.h" |
Markus Armbruster | da34e65 | 2016-03-14 09:01:28 +0100 | [diff] [blame] | 20 | #include "qapi/error.h" |
Markus Armbruster | cc7a8ea | 2015-03-17 17:22:46 +0100 | [diff] [blame] | 21 | #include "qapi/qmp/qerror.h" |
Jeff Cody | 747ff60 | 2012-09-27 13:29:13 -0400 | [diff] [blame] | 22 | #include "qemu/ratelimit.h" |
Max Reitz | 373340b | 2015-10-19 17:53:22 +0200 | [diff] [blame] | 23 | #include "sysemu/block-backend.h" |
Jeff Cody | 747ff60 | 2012-09-27 13:29:13 -0400 | [diff] [blame] | 24 | |
/*
 * Size, in bytes, of the bounce buffer the commit job copies data through.
 * It is also the largest range examined per loop iteration.  Keep it big
 * enough to cover several clusters at once so that contiguous regions of
 * the image are populated efficiently.
 */
enum {
    COMMIT_BUFFER_SIZE = 512 * 1024,
};
| 33 | |
Jeff Cody | 747ff60 | 2012-09-27 13:29:13 -0400 | [diff] [blame] | 34 | typedef struct CommitBlockJob { |
| 35 | BlockJob common; |
Kevin Wolf | 8dfba27 | 2017-01-16 16:22:34 +0100 | [diff] [blame] | 36 | BlockDriverState *commit_top_bs; |
Kevin Wolf | 4653456 | 2016-04-14 13:09:53 +0200 | [diff] [blame] | 37 | BlockBackend *top; |
| 38 | BlockBackend *base; |
John Snow | 22dffcb | 2018-09-06 09:02:13 -0400 | [diff] [blame] | 39 | BlockDriverState *base_bs; |
Paolo Bonzini | 92aa5c6 | 2012-09-28 17:22:55 +0200 | [diff] [blame] | 40 | BlockdevOnError on_error; |
Alberto Garcia | e70cdc5 | 2018-11-12 16:00:35 +0200 | [diff] [blame] | 41 | bool base_read_only; |
Alberto Garcia | df82733 | 2019-03-12 18:48:41 +0200 | [diff] [blame] | 42 | bool chain_frozen; |
Jeff Cody | 54e2690 | 2014-06-25 15:40:10 -0400 | [diff] [blame] | 43 | char *backing_file_str; |
Jeff Cody | 747ff60 | 2012-09-27 13:29:13 -0400 | [diff] [blame] | 44 | } CommitBlockJob; |
| 45 | |
Kevin Wolf | 4653456 | 2016-04-14 13:09:53 +0200 | [diff] [blame] | 46 | static int coroutine_fn commit_populate(BlockBackend *bs, BlockBackend *base, |
Eric Blake | d8a9858 | 2017-07-07 07:44:44 -0500 | [diff] [blame] | 47 | int64_t offset, uint64_t bytes, |
Jeff Cody | 747ff60 | 2012-09-27 13:29:13 -0400 | [diff] [blame] | 48 | void *buf) |
| 49 | { |
| 50 | int ret = 0; |
| 51 | |
Eric Blake | d8a9858 | 2017-07-07 07:44:44 -0500 | [diff] [blame] | 52 | assert(bytes < SIZE_MAX); |
Kevin Wolf | 4653456 | 2016-04-14 13:09:53 +0200 | [diff] [blame] | 53 | |
Vladimir Sementsov-Ogievskiy | 08b6261 | 2019-04-22 17:58:36 +0300 | [diff] [blame] | 54 | ret = blk_co_pread(bs, offset, bytes, buf, 0); |
Kevin Wolf | 4653456 | 2016-04-14 13:09:53 +0200 | [diff] [blame] | 55 | if (ret < 0) { |
Jeff Cody | 747ff60 | 2012-09-27 13:29:13 -0400 | [diff] [blame] | 56 | return ret; |
| 57 | } |
| 58 | |
Vladimir Sementsov-Ogievskiy | 08b6261 | 2019-04-22 17:58:36 +0300 | [diff] [blame] | 59 | ret = blk_co_pwrite(base, offset, bytes, buf, 0); |
Kevin Wolf | 4653456 | 2016-04-14 13:09:53 +0200 | [diff] [blame] | 60 | if (ret < 0) { |
Jeff Cody | 747ff60 | 2012-09-27 13:29:13 -0400 | [diff] [blame] | 61 | return ret; |
| 62 | } |
| 63 | |
| 64 | return 0; |
| 65 | } |
| 66 | |
John Snow | 22dffcb | 2018-09-06 09:02:13 -0400 | [diff] [blame] | 67 | static int commit_prepare(Job *job) |
Jeff Cody | 747ff60 | 2012-09-27 13:29:13 -0400 | [diff] [blame] | 68 | { |
Kevin Wolf | 1908a55 | 2018-04-17 16:41:17 +0200 | [diff] [blame] | 69 | CommitBlockJob *s = container_of(job, CommitBlockJob, common.job); |
Kevin Wolf | 19ebd13 | 2017-06-02 23:04:55 +0200 | [diff] [blame] | 70 | |
Alberto Garcia | df82733 | 2019-03-12 18:48:41 +0200 | [diff] [blame] | 71 | bdrv_unfreeze_backing_chain(s->commit_top_bs, s->base_bs); |
| 72 | s->chain_frozen = false; |
| 73 | |
Kevin Wolf | 8dfba27 | 2017-01-16 16:22:34 +0100 | [diff] [blame] | 74 | /* Remove base node parent that still uses BLK_PERM_WRITE/RESIZE before |
| 75 | * the normal backing chain can be restored. */ |
| 76 | blk_unref(s->base); |
John Snow | 22dffcb | 2018-09-06 09:02:13 -0400 | [diff] [blame] | 77 | s->base = NULL; |
Stefan Hajnoczi | 9e85cd5 | 2014-10-21 12:03:59 +0100 | [diff] [blame] | 78 | |
John Snow | 22dffcb | 2018-09-06 09:02:13 -0400 | [diff] [blame] | 79 | /* FIXME: bdrv_drop_intermediate treats total failures and partial failures |
| 80 | * identically. Further work is needed to disambiguate these cases. */ |
| 81 | return bdrv_drop_intermediate(s->commit_top_bs, s->base_bs, |
| 82 | s->backing_file_str); |
| 83 | } |
| 84 | |
| 85 | static void commit_abort(Job *job) |
| 86 | { |
| 87 | CommitBlockJob *s = container_of(job, CommitBlockJob, common.job); |
| 88 | BlockDriverState *top_bs = blk_bs(s->top); |
| 89 | |
Alberto Garcia | df82733 | 2019-03-12 18:48:41 +0200 | [diff] [blame] | 90 | if (s->chain_frozen) { |
| 91 | bdrv_unfreeze_backing_chain(s->commit_top_bs, s->base_bs); |
| 92 | } |
| 93 | |
John Snow | 22dffcb | 2018-09-06 09:02:13 -0400 | [diff] [blame] | 94 | /* Make sure commit_top_bs and top stay around until bdrv_replace_node() */ |
| 95 | bdrv_ref(top_bs); |
| 96 | bdrv_ref(s->commit_top_bs); |
| 97 | |
| 98 | if (s->base) { |
| 99 | blk_unref(s->base); |
Stefan Hajnoczi | 9e85cd5 | 2014-10-21 12:03:59 +0100 | [diff] [blame] | 100 | } |
| 101 | |
John Snow | 22dffcb | 2018-09-06 09:02:13 -0400 | [diff] [blame] | 102 | /* free the blockers on the intermediate nodes so that bdrv_replace_nodes |
| 103 | * can succeed */ |
| 104 | block_job_remove_all_bdrv(&s->common); |
| 105 | |
| 106 | /* If bdrv_drop_intermediate() failed (or was not invoked), remove the |
| 107 | * commit filter driver from the backing chain now. Do this as the final |
| 108 | * step so that the 'consistent read' permission can be granted. |
| 109 | * |
| 110 | * XXX Can (or should) we somehow keep 'consistent read' blocked even |
| 111 | * after the failed/cancelled commit job is gone? If we already wrote |
| 112 | * something to base, the intermediate images aren't valid any more. */ |
| 113 | bdrv_child_try_set_perm(s->commit_top_bs->backing, 0, BLK_PERM_ALL, |
| 114 | &error_abort); |
| 115 | bdrv_replace_node(s->commit_top_bs, backing_bs(s->commit_top_bs), |
| 116 | &error_abort); |
| 117 | |
| 118 | bdrv_unref(s->commit_top_bs); |
| 119 | bdrv_unref(top_bs); |
| 120 | } |
| 121 | |
| 122 | static void commit_clean(Job *job) |
| 123 | { |
| 124 | CommitBlockJob *s = container_of(job, CommitBlockJob, common.job); |
| 125 | |
Stefan Hajnoczi | 9e85cd5 | 2014-10-21 12:03:59 +0100 | [diff] [blame] | 126 | /* restore base open flags here if appropriate (e.g., change the base back |
| 127 | * to r/o). These reopens do not need to be atomic, since we won't abort |
| 128 | * even on failure here */ |
Alberto Garcia | e70cdc5 | 2018-11-12 16:00:35 +0200 | [diff] [blame] | 129 | if (s->base_read_only) { |
| 130 | bdrv_reopen_set_read_only(s->base_bs, true, NULL); |
Stefan Hajnoczi | 9e85cd5 | 2014-10-21 12:03:59 +0100 | [diff] [blame] | 131 | } |
John Snow | 22dffcb | 2018-09-06 09:02:13 -0400 | [diff] [blame] | 132 | |
Stefan Hajnoczi | 9e85cd5 | 2014-10-21 12:03:59 +0100 | [diff] [blame] | 133 | g_free(s->backing_file_str); |
Kevin Wolf | 4653456 | 2016-04-14 13:09:53 +0200 | [diff] [blame] | 134 | blk_unref(s->top); |
Stefan Hajnoczi | 9e85cd5 | 2014-10-21 12:03:59 +0100 | [diff] [blame] | 135 | } |
| 136 | |
John Snow | f67432a | 2018-08-29 21:57:26 -0400 | [diff] [blame] | 137 | static int coroutine_fn commit_run(Job *job, Error **errp) |
Stefan Hajnoczi | 9e85cd5 | 2014-10-21 12:03:59 +0100 | [diff] [blame] | 138 | { |
John Snow | f67432a | 2018-08-29 21:57:26 -0400 | [diff] [blame] | 139 | CommitBlockJob *s = container_of(job, CommitBlockJob, common.job); |
Eric Blake | 317a667 | 2017-07-07 07:44:45 -0500 | [diff] [blame] | 140 | int64_t offset; |
Sascha Silbe | f14a39c | 2016-06-28 17:28:41 +0200 | [diff] [blame] | 141 | uint64_t delay_ns = 0; |
Jeff Cody | 747ff60 | 2012-09-27 13:29:13 -0400 | [diff] [blame] | 142 | int ret = 0; |
Eric Blake | 51b0a48 | 2017-07-07 07:44:59 -0500 | [diff] [blame] | 143 | int64_t n = 0; /* bytes */ |
Stefan Hajnoczi | 9e85cd5 | 2014-10-21 12:03:59 +0100 | [diff] [blame] | 144 | void *buf = NULL; |
Jeff Cody | 747ff60 | 2012-09-27 13:29:13 -0400 | [diff] [blame] | 145 | int bytes_written = 0; |
Kevin Wolf | 05df8a6 | 2018-01-18 18:08:22 +0100 | [diff] [blame] | 146 | int64_t len, base_len; |
Jeff Cody | 747ff60 | 2012-09-27 13:29:13 -0400 | [diff] [blame] | 147 | |
Kevin Wolf | 05df8a6 | 2018-01-18 18:08:22 +0100 | [diff] [blame] | 148 | ret = len = blk_getlength(s->top); |
| 149 | if (len < 0) { |
Stefan Hajnoczi | 9e85cd5 | 2014-10-21 12:03:59 +0100 | [diff] [blame] | 150 | goto out; |
Jeff Cody | 747ff60 | 2012-09-27 13:29:13 -0400 | [diff] [blame] | 151 | } |
Kevin Wolf | 30a5c88 | 2018-05-04 12:17:20 +0200 | [diff] [blame] | 152 | job_progress_set_remaining(&s->common.job, len); |
Jeff Cody | 747ff60 | 2012-09-27 13:29:13 -0400 | [diff] [blame] | 153 | |
Kevin Wolf | 4653456 | 2016-04-14 13:09:53 +0200 | [diff] [blame] | 154 | ret = base_len = blk_getlength(s->base); |
Jeff Cody | 747ff60 | 2012-09-27 13:29:13 -0400 | [diff] [blame] | 155 | if (base_len < 0) { |
Stefan Hajnoczi | 9e85cd5 | 2014-10-21 12:03:59 +0100 | [diff] [blame] | 156 | goto out; |
Jeff Cody | 747ff60 | 2012-09-27 13:29:13 -0400 | [diff] [blame] | 157 | } |
| 158 | |
Kevin Wolf | 05df8a6 | 2018-01-18 18:08:22 +0100 | [diff] [blame] | 159 | if (base_len < len) { |
| 160 | ret = blk_truncate(s->base, len, PREALLOC_MODE_OFF, NULL); |
Jeff Cody | 747ff60 | 2012-09-27 13:29:13 -0400 | [diff] [blame] | 161 | if (ret) { |
Stefan Hajnoczi | 9e85cd5 | 2014-10-21 12:03:59 +0100 | [diff] [blame] | 162 | goto out; |
Jeff Cody | 747ff60 | 2012-09-27 13:29:13 -0400 | [diff] [blame] | 163 | } |
| 164 | } |
| 165 | |
Kevin Wolf | 4653456 | 2016-04-14 13:09:53 +0200 | [diff] [blame] | 166 | buf = blk_blockalign(s->top, COMMIT_BUFFER_SIZE); |
Jeff Cody | 747ff60 | 2012-09-27 13:29:13 -0400 | [diff] [blame] | 167 | |
Kevin Wolf | 05df8a6 | 2018-01-18 18:08:22 +0100 | [diff] [blame] | 168 | for (offset = 0; offset < len; offset += n) { |
Jeff Cody | 747ff60 | 2012-09-27 13:29:13 -0400 | [diff] [blame] | 169 | bool copy; |
| 170 | |
Jeff Cody | 747ff60 | 2012-09-27 13:29:13 -0400 | [diff] [blame] | 171 | /* Note that even when no rate limit is applied we need to yield |
Kevin Wolf | c57b665 | 2012-11-13 16:35:13 +0100 | [diff] [blame] | 172 | * with no pending I/O here so that bdrv_drain_all() returns. |
Jeff Cody | 747ff60 | 2012-09-27 13:29:13 -0400 | [diff] [blame] | 173 | */ |
Kevin Wolf | 5d43e86 | 2018-04-18 16:32:20 +0200 | [diff] [blame] | 174 | job_sleep_ns(&s->common.job, delay_ns); |
Kevin Wolf | daa7f2f | 2018-04-17 12:56:07 +0200 | [diff] [blame] | 175 | if (job_is_cancelled(&s->common.job)) { |
Jeff Cody | 747ff60 | 2012-09-27 13:29:13 -0400 | [diff] [blame] | 176 | break; |
| 177 | } |
| 178 | /* Copy if allocated above the base */ |
Kevin Wolf | 4653456 | 2016-04-14 13:09:53 +0200 | [diff] [blame] | 179 | ret = bdrv_is_allocated_above(blk_bs(s->top), blk_bs(s->base), |
Eric Blake | 51b0a48 | 2017-07-07 07:44:59 -0500 | [diff] [blame] | 180 | offset, COMMIT_BUFFER_SIZE, &n); |
Jeff Cody | 747ff60 | 2012-09-27 13:29:13 -0400 | [diff] [blame] | 181 | copy = (ret == 1); |
Eric Blake | 51b0a48 | 2017-07-07 07:44:59 -0500 | [diff] [blame] | 182 | trace_commit_one_iteration(s, offset, n, ret); |
Jeff Cody | 747ff60 | 2012-09-27 13:29:13 -0400 | [diff] [blame] | 183 | if (copy) { |
Eric Blake | 51b0a48 | 2017-07-07 07:44:59 -0500 | [diff] [blame] | 184 | ret = commit_populate(s->top, s->base, offset, n, buf); |
| 185 | bytes_written += n; |
Jeff Cody | 747ff60 | 2012-09-27 13:29:13 -0400 | [diff] [blame] | 186 | } |
| 187 | if (ret < 0) { |
Kevin Wolf | 1e8fb7f | 2016-06-29 17:38:57 +0200 | [diff] [blame] | 188 | BlockErrorAction action = |
| 189 | block_job_error_action(&s->common, false, s->on_error, -ret); |
| 190 | if (action == BLOCK_ERROR_ACTION_REPORT) { |
Stefan Hajnoczi | 9e85cd5 | 2014-10-21 12:03:59 +0100 | [diff] [blame] | 191 | goto out; |
Jeff Cody | 747ff60 | 2012-09-27 13:29:13 -0400 | [diff] [blame] | 192 | } else { |
| 193 | n = 0; |
| 194 | continue; |
| 195 | } |
| 196 | } |
| 197 | /* Publish progress */ |
Kevin Wolf | 30a5c88 | 2018-05-04 12:17:20 +0200 | [diff] [blame] | 198 | job_progress_update(&s->common.job, n); |
Sascha Silbe | f14a39c | 2016-06-28 17:28:41 +0200 | [diff] [blame] | 199 | |
Kevin Wolf | dee81d5 | 2018-01-18 21:19:38 +0100 | [diff] [blame] | 200 | if (copy) { |
| 201 | delay_ns = block_job_ratelimit_get_delay(&s->common, n); |
Kevin Wolf | 2fe4bba | 2018-01-18 21:23:52 +0100 | [diff] [blame] | 202 | } else { |
| 203 | delay_ns = 0; |
Sascha Silbe | f14a39c | 2016-06-28 17:28:41 +0200 | [diff] [blame] | 204 | } |
Jeff Cody | 747ff60 | 2012-09-27 13:29:13 -0400 | [diff] [blame] | 205 | } |
| 206 | |
| 207 | ret = 0; |
| 208 | |
Stefan Hajnoczi | 9e85cd5 | 2014-10-21 12:03:59 +0100 | [diff] [blame] | 209 | out: |
Jeff Cody | 747ff60 | 2012-09-27 13:29:13 -0400 | [diff] [blame] | 210 | qemu_vfree(buf); |
| 211 | |
John Snow | f67432a | 2018-08-29 21:57:26 -0400 | [diff] [blame] | 212 | return ret; |
Jeff Cody | 747ff60 | 2012-09-27 13:29:13 -0400 | [diff] [blame] | 213 | } |
| 214 | |
Fam Zheng | 3fc4b10 | 2013-10-08 17:29:38 +0800 | [diff] [blame] | 215 | static const BlockJobDriver commit_job_driver = { |
Kevin Wolf | 33e9e9b | 2018-04-12 17:29:59 +0200 | [diff] [blame] | 216 | .job_driver = { |
| 217 | .instance_size = sizeof(CommitBlockJob), |
Kevin Wolf | 252291e | 2018-04-12 17:57:08 +0200 | [diff] [blame] | 218 | .job_type = JOB_TYPE_COMMIT, |
Kevin Wolf | 80fa2c7 | 2018-04-13 18:50:05 +0200 | [diff] [blame] | 219 | .free = block_job_free, |
Kevin Wolf | b15de82 | 2018-04-18 17:10:26 +0200 | [diff] [blame] | 220 | .user_resume = block_job_user_resume, |
Kevin Wolf | b69f777 | 2018-04-20 17:00:29 +0200 | [diff] [blame] | 221 | .drain = block_job_drain, |
John Snow | f67432a | 2018-08-29 21:57:26 -0400 | [diff] [blame] | 222 | .run = commit_run, |
John Snow | 22dffcb | 2018-09-06 09:02:13 -0400 | [diff] [blame] | 223 | .prepare = commit_prepare, |
| 224 | .abort = commit_abort, |
| 225 | .clean = commit_clean |
Kevin Wolf | 33e9e9b | 2018-04-12 17:29:59 +0200 | [diff] [blame] | 226 | }, |
Jeff Cody | 747ff60 | 2012-09-27 13:29:13 -0400 | [diff] [blame] | 227 | }; |
| 228 | |
Kevin Wolf | 8dfba27 | 2017-01-16 16:22:34 +0100 | [diff] [blame] | 229 | static int coroutine_fn bdrv_commit_top_preadv(BlockDriverState *bs, |
| 230 | uint64_t offset, uint64_t bytes, QEMUIOVector *qiov, int flags) |
| 231 | { |
| 232 | return bdrv_co_preadv(bs->backing, offset, bytes, qiov, flags); |
| 233 | } |
| 234 | |
Max Reitz | 998b3a1 | 2019-02-01 20:29:28 +0100 | [diff] [blame] | 235 | static void bdrv_commit_top_refresh_filename(BlockDriverState *bs) |
Kevin Wolf | dcbf37c | 2017-03-09 11:49:16 +0100 | [diff] [blame] | 236 | { |
Kevin Wolf | dcbf37c | 2017-03-09 11:49:16 +0100 | [diff] [blame] | 237 | pstrcpy(bs->exact_filename, sizeof(bs->exact_filename), |
| 238 | bs->backing->bs->filename); |
| 239 | } |
Kevin Wolf | 9196565 | 2017-03-08 15:07:12 +0100 | [diff] [blame] | 240 | |
Kevin Wolf | 8dfba27 | 2017-01-16 16:22:34 +0100 | [diff] [blame] | 241 | static void bdrv_commit_top_child_perm(BlockDriverState *bs, BdrvChild *c, |
| 242 | const BdrvChildRole *role, |
Kevin Wolf | e0995dc | 2017-09-14 12:47:11 +0200 | [diff] [blame] | 243 | BlockReopenQueue *reopen_queue, |
Kevin Wolf | 8dfba27 | 2017-01-16 16:22:34 +0100 | [diff] [blame] | 244 | uint64_t perm, uint64_t shared, |
| 245 | uint64_t *nperm, uint64_t *nshared) |
| 246 | { |
| 247 | *nperm = 0; |
| 248 | *nshared = BLK_PERM_ALL; |
| 249 | } |
| 250 | |
| 251 | /* Dummy node that provides consistent read to its users without requiring it |
| 252 | * from its backing file and that allows writes on the backing file chain. */ |
| 253 | static BlockDriver bdrv_commit_top = { |
Kevin Wolf | 9196565 | 2017-03-08 15:07:12 +0100 | [diff] [blame] | 254 | .format_name = "commit_top", |
| 255 | .bdrv_co_preadv = bdrv_commit_top_preadv, |
Eric Blake | 3e4d0e7 | 2018-02-13 14:26:43 -0600 | [diff] [blame] | 256 | .bdrv_co_block_status = bdrv_co_block_status_from_backing, |
Kevin Wolf | dcbf37c | 2017-03-09 11:49:16 +0100 | [diff] [blame] | 257 | .bdrv_refresh_filename = bdrv_commit_top_refresh_filename, |
Kevin Wolf | 9196565 | 2017-03-08 15:07:12 +0100 | [diff] [blame] | 258 | .bdrv_child_perm = bdrv_commit_top_child_perm, |
Kevin Wolf | 8dfba27 | 2017-01-16 16:22:34 +0100 | [diff] [blame] | 259 | }; |
| 260 | |
Alberto Garcia | fd62c60 | 2016-07-05 17:29:00 +0300 | [diff] [blame] | 261 | void commit_start(const char *job_id, BlockDriverState *bs, |
John Snow | 5360782 | 2018-09-06 09:02:10 -0400 | [diff] [blame] | 262 | BlockDriverState *base, BlockDriverState *top, |
| 263 | int creation_flags, int64_t speed, |
John Snow | 8254b6d | 2016-10-27 12:06:58 -0400 | [diff] [blame] | 264 | BlockdevOnError on_error, const char *backing_file_str, |
Kevin Wolf | 0db832f | 2017-02-20 18:10:05 +0100 | [diff] [blame] | 265 | const char *filter_node_name, Error **errp) |
Jeff Cody | 747ff60 | 2012-09-27 13:29:13 -0400 | [diff] [blame] | 266 | { |
| 267 | CommitBlockJob *s; |
Alberto Garcia | 3e4c512 | 2016-10-28 10:08:08 +0300 | [diff] [blame] | 268 | BlockDriverState *iter; |
Kevin Wolf | 8dfba27 | 2017-01-16 16:22:34 +0100 | [diff] [blame] | 269 | BlockDriverState *commit_top_bs = NULL; |
Jeff Cody | 747ff60 | 2012-09-27 13:29:13 -0400 | [diff] [blame] | 270 | Error *local_err = NULL; |
Kevin Wolf | d708642 | 2017-01-13 19:02:32 +0100 | [diff] [blame] | 271 | int ret; |
Jeff Cody | 747ff60 | 2012-09-27 13:29:13 -0400 | [diff] [blame] | 272 | |
Fam Zheng | 18da7f9 | 2013-12-16 14:45:33 +0800 | [diff] [blame] | 273 | assert(top != bs); |
Jeff Cody | 747ff60 | 2012-09-27 13:29:13 -0400 | [diff] [blame] | 274 | if (top == base) { |
| 275 | error_setg(errp, "Invalid files for merge: top and base are the same"); |
| 276 | return; |
| 277 | } |
| 278 | |
John Snow | 75859b9 | 2018-03-10 03:27:27 -0500 | [diff] [blame] | 279 | s = block_job_create(job_id, &commit_job_driver, NULL, bs, 0, BLK_PERM_ALL, |
John Snow | 5360782 | 2018-09-06 09:02:10 -0400 | [diff] [blame] | 280 | speed, creation_flags, NULL, NULL, errp); |
Alberto Garcia | 834fe28 | 2016-05-27 12:53:39 +0200 | [diff] [blame] | 281 | if (!s) { |
| 282 | return; |
| 283 | } |
| 284 | |
Kevin Wolf | bde7071 | 2017-06-27 20:36:18 +0200 | [diff] [blame] | 285 | /* convert base to r/w, if necessary */ |
Alberto Garcia | e70cdc5 | 2018-11-12 16:00:35 +0200 | [diff] [blame] | 286 | s->base_read_only = bdrv_is_read_only(base); |
| 287 | if (s->base_read_only) { |
| 288 | if (bdrv_reopen_set_read_only(base, false, errp) != 0) { |
Kevin Wolf | d708642 | 2017-01-13 19:02:32 +0100 | [diff] [blame] | 289 | goto fail; |
Jeff Cody | 747ff60 | 2012-09-27 13:29:13 -0400 | [diff] [blame] | 290 | } |
| 291 | } |
| 292 | |
Kevin Wolf | 8dfba27 | 2017-01-16 16:22:34 +0100 | [diff] [blame] | 293 | /* Insert commit_top block node above top, so we can block consistent read |
| 294 | * on the backing chain below it */ |
Kevin Wolf | 0db832f | 2017-02-20 18:10:05 +0100 | [diff] [blame] | 295 | commit_top_bs = bdrv_new_open_driver(&bdrv_commit_top, filter_node_name, 0, |
| 296 | errp); |
Kevin Wolf | 8dfba27 | 2017-01-16 16:22:34 +0100 | [diff] [blame] | 297 | if (commit_top_bs == NULL) { |
| 298 | goto fail; |
| 299 | } |
Kevin Wolf | d3c8c67 | 2017-07-18 17:24:05 +0200 | [diff] [blame] | 300 | if (!filter_node_name) { |
| 301 | commit_top_bs->implicit = true; |
| 302 | } |
Kevin Wolf | 0d0676a | 2017-04-06 19:07:14 +0200 | [diff] [blame] | 303 | commit_top_bs->total_sectors = top->total_sectors; |
Kevin Wolf | 8dfba27 | 2017-01-16 16:22:34 +0100 | [diff] [blame] | 304 | |
Alberto Garcia | 6a63419 | 2019-04-03 17:37:48 +0300 | [diff] [blame] | 305 | bdrv_append(commit_top_bs, top, &local_err); |
Fam Zheng | b69f00d | 2017-03-07 19:07:22 +0800 | [diff] [blame] | 306 | if (local_err) { |
Fam Zheng | b69f00d | 2017-03-07 19:07:22 +0800 | [diff] [blame] | 307 | commit_top_bs = NULL; |
| 308 | error_propagate(errp, local_err); |
| 309 | goto fail; |
| 310 | } |
Kevin Wolf | 8dfba27 | 2017-01-16 16:22:34 +0100 | [diff] [blame] | 311 | |
| 312 | s->commit_top_bs = commit_top_bs; |
Jeff Cody | 747ff60 | 2012-09-27 13:29:13 -0400 | [diff] [blame] | 313 | |
Alberto Garcia | 3e4c512 | 2016-10-28 10:08:08 +0300 | [diff] [blame] | 314 | /* Block all nodes between top and base, because they will |
| 315 | * disappear from the chain after this operation. */ |
| 316 | assert(bdrv_chain_contains(top, base)); |
Kevin Wolf | 8dfba27 | 2017-01-16 16:22:34 +0100 | [diff] [blame] | 317 | for (iter = top; iter != base; iter = backing_bs(iter)) { |
| 318 | /* XXX BLK_PERM_WRITE needs to be allowed so we don't block ourselves |
| 319 | * at s->base (if writes are blocked for a node, they are also blocked |
| 320 | * for its backing file). The other options would be a second filter |
| 321 | * driver above s->base. */ |
| 322 | ret = block_job_add_bdrv(&s->common, "intermediate node", iter, 0, |
| 323 | BLK_PERM_WRITE_UNCHANGED | BLK_PERM_WRITE, |
| 324 | errp); |
| 325 | if (ret < 0) { |
| 326 | goto fail; |
| 327 | } |
Alberto Garcia | 3e4c512 | 2016-10-28 10:08:08 +0300 | [diff] [blame] | 328 | } |
| 329 | |
Alberto Garcia | df82733 | 2019-03-12 18:48:41 +0200 | [diff] [blame] | 330 | if (bdrv_freeze_backing_chain(commit_top_bs, base, errp) < 0) { |
| 331 | goto fail; |
| 332 | } |
| 333 | s->chain_frozen = true; |
| 334 | |
Kevin Wolf | 8dfba27 | 2017-01-16 16:22:34 +0100 | [diff] [blame] | 335 | ret = block_job_add_bdrv(&s->common, "base", base, 0, BLK_PERM_ALL, errp); |
| 336 | if (ret < 0) { |
| 337 | goto fail; |
| 338 | } |
| 339 | |
Kevin Wolf | d861ab3 | 2019-04-25 14:25:10 +0200 | [diff] [blame] | 340 | s->base = blk_new(s->common.job.aio_context, |
| 341 | BLK_PERM_CONSISTENT_READ |
Kevin Wolf | 8dfba27 | 2017-01-16 16:22:34 +0100 | [diff] [blame] | 342 | | BLK_PERM_WRITE |
| 343 | | BLK_PERM_RESIZE, |
| 344 | BLK_PERM_CONSISTENT_READ |
| 345 | | BLK_PERM_GRAPH_MOD |
| 346 | | BLK_PERM_WRITE_UNCHANGED); |
Kevin Wolf | d708642 | 2017-01-13 19:02:32 +0100 | [diff] [blame] | 347 | ret = blk_insert_bs(s->base, base, errp); |
| 348 | if (ret < 0) { |
| 349 | goto fail; |
| 350 | } |
John Snow | 22dffcb | 2018-09-06 09:02:13 -0400 | [diff] [blame] | 351 | s->base_bs = base; |
Kevin Wolf | 4653456 | 2016-04-14 13:09:53 +0200 | [diff] [blame] | 352 | |
Kevin Wolf | 8dfba27 | 2017-01-16 16:22:34 +0100 | [diff] [blame] | 353 | /* Required permissions are already taken with block_job_add_bdrv() */ |
Kevin Wolf | d861ab3 | 2019-04-25 14:25:10 +0200 | [diff] [blame] | 354 | s->top = blk_new(s->common.job.aio_context, 0, BLK_PERM_ALL); |
Kevin Wolf | b247767 | 2017-03-03 16:54:21 +0100 | [diff] [blame] | 355 | ret = blk_insert_bs(s->top, top, errp); |
Kevin Wolf | d708642 | 2017-01-13 19:02:32 +0100 | [diff] [blame] | 356 | if (ret < 0) { |
| 357 | goto fail; |
| 358 | } |
Kevin Wolf | 4653456 | 2016-04-14 13:09:53 +0200 | [diff] [blame] | 359 | |
Jeff Cody | 54e2690 | 2014-06-25 15:40:10 -0400 | [diff] [blame] | 360 | s->backing_file_str = g_strdup(backing_file_str); |
Jeff Cody | 747ff60 | 2012-09-27 13:29:13 -0400 | [diff] [blame] | 361 | s->on_error = on_error; |
Jeff Cody | 747ff60 | 2012-09-27 13:29:13 -0400 | [diff] [blame] | 362 | |
John Snow | 5ccac6f | 2016-11-08 01:50:37 -0500 | [diff] [blame] | 363 | trace_commit_start(bs, base, top, s); |
Kevin Wolf | da01ff7 | 2018-04-13 17:31:02 +0200 | [diff] [blame] | 364 | job_start(&s->common.job); |
Kevin Wolf | d708642 | 2017-01-13 19:02:32 +0100 | [diff] [blame] | 365 | return; |
| 366 | |
| 367 | fail: |
Alberto Garcia | df82733 | 2019-03-12 18:48:41 +0200 | [diff] [blame] | 368 | if (s->chain_frozen) { |
| 369 | bdrv_unfreeze_backing_chain(commit_top_bs, base); |
| 370 | } |
Kevin Wolf | d708642 | 2017-01-13 19:02:32 +0100 | [diff] [blame] | 371 | if (s->base) { |
| 372 | blk_unref(s->base); |
| 373 | } |
| 374 | if (s->top) { |
| 375 | blk_unref(s->top); |
| 376 | } |
Alberto Garcia | 065abf9 | 2019-04-29 15:51:08 +0200 | [diff] [blame] | 377 | if (s->base_read_only) { |
| 378 | bdrv_reopen_set_read_only(base, true, NULL); |
| 379 | } |
Alberto Garcia | 2468eed | 2019-02-15 15:49:32 +0200 | [diff] [blame] | 380 | job_early_fail(&s->common.job); |
| 381 | /* commit_top_bs has to be replaced after deleting the block job, |
| 382 | * otherwise this would fail because of lack of permissions. */ |
Kevin Wolf | 8dfba27 | 2017-01-16 16:22:34 +0100 | [diff] [blame] | 383 | if (commit_top_bs) { |
Kevin Wolf | bde7071 | 2017-06-27 20:36:18 +0200 | [diff] [blame] | 384 | bdrv_replace_node(commit_top_bs, top, &error_abort); |
Kevin Wolf | 8dfba27 | 2017-01-16 16:22:34 +0100 | [diff] [blame] | 385 | } |
Jeff Cody | 747ff60 | 2012-09-27 13:29:13 -0400 | [diff] [blame] | 386 | } |
Kevin Wolf | 83fd6dd | 2016-05-30 15:53:15 +0200 | [diff] [blame] | 387 | |
| 388 | |
Eric Blake | d6a644b | 2017-07-07 07:44:57 -0500 | [diff] [blame] | 389 | #define COMMIT_BUF_SIZE (2048 * BDRV_SECTOR_SIZE) |
Kevin Wolf | 83fd6dd | 2016-05-30 15:53:15 +0200 | [diff] [blame] | 390 | |
| 391 | /* commit COW file into the raw image */ |
| 392 | int bdrv_commit(BlockDriverState *bs) |
| 393 | { |
Kevin Wolf | f8e2bd5 | 2016-05-30 16:29:47 +0200 | [diff] [blame] | 394 | BlockBackend *src, *backing; |
Kevin Wolf | d3f0675 | 2017-01-19 18:16:03 +0100 | [diff] [blame] | 395 | BlockDriverState *backing_file_bs = NULL; |
| 396 | BlockDriverState *commit_top_bs = NULL; |
Kevin Wolf | 83fd6dd | 2016-05-30 15:53:15 +0200 | [diff] [blame] | 397 | BlockDriver *drv = bs->drv; |
Kevin Wolf | d861ab3 | 2019-04-25 14:25:10 +0200 | [diff] [blame] | 398 | AioContext *ctx; |
Eric Blake | d6a644b | 2017-07-07 07:44:57 -0500 | [diff] [blame] | 399 | int64_t offset, length, backing_length; |
Alberto Garcia | c742a36 | 2018-11-12 16:00:36 +0200 | [diff] [blame] | 400 | int ro; |
Eric Blake | d6a644b | 2017-07-07 07:44:57 -0500 | [diff] [blame] | 401 | int64_t n; |
Kevin Wolf | 83fd6dd | 2016-05-30 15:53:15 +0200 | [diff] [blame] | 402 | int ret = 0; |
| 403 | uint8_t *buf = NULL; |
Kevin Wolf | d3f0675 | 2017-01-19 18:16:03 +0100 | [diff] [blame] | 404 | Error *local_err = NULL; |
Kevin Wolf | 83fd6dd | 2016-05-30 15:53:15 +0200 | [diff] [blame] | 405 | |
| 406 | if (!drv) |
| 407 | return -ENOMEDIUM; |
| 408 | |
| 409 | if (!bs->backing) { |
| 410 | return -ENOTSUP; |
| 411 | } |
| 412 | |
| 413 | if (bdrv_op_is_blocked(bs, BLOCK_OP_TYPE_COMMIT_SOURCE, NULL) || |
| 414 | bdrv_op_is_blocked(bs->backing->bs, BLOCK_OP_TYPE_COMMIT_TARGET, NULL)) { |
| 415 | return -EBUSY; |
| 416 | } |
| 417 | |
| 418 | ro = bs->backing->bs->read_only; |
Kevin Wolf | 83fd6dd | 2016-05-30 15:53:15 +0200 | [diff] [blame] | 419 | |
| 420 | if (ro) { |
Alberto Garcia | c742a36 | 2018-11-12 16:00:36 +0200 | [diff] [blame] | 421 | if (bdrv_reopen_set_read_only(bs->backing->bs, false, NULL)) { |
Kevin Wolf | 83fd6dd | 2016-05-30 15:53:15 +0200 | [diff] [blame] | 422 | return -EACCES; |
| 423 | } |
| 424 | } |
| 425 | |
Kevin Wolf | d861ab3 | 2019-04-25 14:25:10 +0200 | [diff] [blame] | 426 | ctx = bdrv_get_aio_context(bs); |
| 427 | src = blk_new(ctx, BLK_PERM_CONSISTENT_READ, BLK_PERM_ALL); |
| 428 | backing = blk_new(ctx, BLK_PERM_WRITE | BLK_PERM_RESIZE, BLK_PERM_ALL); |
Kevin Wolf | d708642 | 2017-01-13 19:02:32 +0100 | [diff] [blame] | 429 | |
Kevin Wolf | d3f0675 | 2017-01-19 18:16:03 +0100 | [diff] [blame] | 430 | ret = blk_insert_bs(src, bs, &local_err); |
Kevin Wolf | d708642 | 2017-01-13 19:02:32 +0100 | [diff] [blame] | 431 | if (ret < 0) { |
Kevin Wolf | d3f0675 | 2017-01-19 18:16:03 +0100 | [diff] [blame] | 432 | error_report_err(local_err); |
Kevin Wolf | d708642 | 2017-01-13 19:02:32 +0100 | [diff] [blame] | 433 | goto ro_cleanup; |
| 434 | } |
| 435 | |
Kevin Wolf | d3f0675 | 2017-01-19 18:16:03 +0100 | [diff] [blame] | 436 | /* Insert commit_top block node above backing, so we can write to it */ |
| 437 | backing_file_bs = backing_bs(bs); |
| 438 | |
| 439 | commit_top_bs = bdrv_new_open_driver(&bdrv_commit_top, NULL, BDRV_O_RDWR, |
| 440 | &local_err); |
| 441 | if (commit_top_bs == NULL) { |
| 442 | error_report_err(local_err); |
| 443 | goto ro_cleanup; |
| 444 | } |
| 445 | |
Kevin Wolf | 12fa4af | 2017-02-17 20:42:32 +0100 | [diff] [blame] | 446 | bdrv_set_backing_hd(commit_top_bs, backing_file_bs, &error_abort); |
| 447 | bdrv_set_backing_hd(bs, commit_top_bs, &error_abort); |
Kevin Wolf | d3f0675 | 2017-01-19 18:16:03 +0100 | [diff] [blame] | 448 | |
| 449 | ret = blk_insert_bs(backing, backing_file_bs, &local_err); |
Kevin Wolf | d708642 | 2017-01-13 19:02:32 +0100 | [diff] [blame] | 450 | if (ret < 0) { |
Kevin Wolf | d3f0675 | 2017-01-19 18:16:03 +0100 | [diff] [blame] | 451 | error_report_err(local_err); |
Kevin Wolf | d708642 | 2017-01-13 19:02:32 +0100 | [diff] [blame] | 452 | goto ro_cleanup; |
| 453 | } |
Kevin Wolf | f8e2bd5 | 2016-05-30 16:29:47 +0200 | [diff] [blame] | 454 | |
| 455 | length = blk_getlength(src); |
Kevin Wolf | 83fd6dd | 2016-05-30 15:53:15 +0200 | [diff] [blame] | 456 | if (length < 0) { |
| 457 | ret = length; |
| 458 | goto ro_cleanup; |
| 459 | } |
| 460 | |
Kevin Wolf | f8e2bd5 | 2016-05-30 16:29:47 +0200 | [diff] [blame] | 461 | backing_length = blk_getlength(backing); |
Kevin Wolf | 83fd6dd | 2016-05-30 15:53:15 +0200 | [diff] [blame] | 462 | if (backing_length < 0) { |
| 463 | ret = backing_length; |
| 464 | goto ro_cleanup; |
| 465 | } |
| 466 | |
| 467 | /* If our top snapshot is larger than the backing file image, |
| 468 | * grow the backing file image if possible. If not possible, |
| 469 | * we must return an error */ |
| 470 | if (length > backing_length) { |
Max Reitz | 3a691c5 | 2017-06-13 22:20:54 +0200 | [diff] [blame] | 471 | ret = blk_truncate(backing, length, PREALLOC_MODE_OFF, &local_err); |
Kevin Wolf | 83fd6dd | 2016-05-30 15:53:15 +0200 | [diff] [blame] | 472 | if (ret < 0) { |
Max Reitz | ed3d2ec | 2017-03-28 22:51:27 +0200 | [diff] [blame] | 473 | error_report_err(local_err); |
Kevin Wolf | 83fd6dd | 2016-05-30 15:53:15 +0200 | [diff] [blame] | 474 | goto ro_cleanup; |
| 475 | } |
| 476 | } |
| 477 | |
Kevin Wolf | f8e2bd5 | 2016-05-30 16:29:47 +0200 | [diff] [blame] | 478 | /* blk_try_blockalign() for src will choose an alignment that works for |
| 479 | * backing as well, so no need to compare the alignment manually. */ |
Eric Blake | d6a644b | 2017-07-07 07:44:57 -0500 | [diff] [blame] | 480 | buf = blk_try_blockalign(src, COMMIT_BUF_SIZE); |
Kevin Wolf | 83fd6dd | 2016-05-30 15:53:15 +0200 | [diff] [blame] | 481 | if (buf == NULL) { |
| 482 | ret = -ENOMEM; |
| 483 | goto ro_cleanup; |
| 484 | } |
| 485 | |
Eric Blake | d6a644b | 2017-07-07 07:44:57 -0500 | [diff] [blame] | 486 | for (offset = 0; offset < length; offset += n) { |
| 487 | ret = bdrv_is_allocated(bs, offset, COMMIT_BUF_SIZE, &n); |
Kevin Wolf | 83fd6dd | 2016-05-30 15:53:15 +0200 | [diff] [blame] | 488 | if (ret < 0) { |
| 489 | goto ro_cleanup; |
| 490 | } |
| 491 | if (ret) { |
Eric Blake | d6a644b | 2017-07-07 07:44:57 -0500 | [diff] [blame] | 492 | ret = blk_pread(src, offset, buf, n); |
Kevin Wolf | 83fd6dd | 2016-05-30 15:53:15 +0200 | [diff] [blame] | 493 | if (ret < 0) { |
| 494 | goto ro_cleanup; |
| 495 | } |
| 496 | |
Eric Blake | d6a644b | 2017-07-07 07:44:57 -0500 | [diff] [blame] | 497 | ret = blk_pwrite(backing, offset, buf, n, 0); |
Kevin Wolf | 83fd6dd | 2016-05-30 15:53:15 +0200 | [diff] [blame] | 498 | if (ret < 0) { |
| 499 | goto ro_cleanup; |
| 500 | } |
| 501 | } |
| 502 | } |
| 503 | |
| 504 | if (drv->bdrv_make_empty) { |
| 505 | ret = drv->bdrv_make_empty(bs); |
| 506 | if (ret < 0) { |
| 507 | goto ro_cleanup; |
| 508 | } |
Kevin Wolf | f8e2bd5 | 2016-05-30 16:29:47 +0200 | [diff] [blame] | 509 | blk_flush(src); |
Kevin Wolf | 83fd6dd | 2016-05-30 15:53:15 +0200 | [diff] [blame] | 510 | } |
| 511 | |
| 512 | /* |
| 513 | * Make sure all data we wrote to the backing device is actually |
| 514 | * stable on disk. |
| 515 | */ |
Kevin Wolf | f8e2bd5 | 2016-05-30 16:29:47 +0200 | [diff] [blame] | 516 | blk_flush(backing); |
Kevin Wolf | 83fd6dd | 2016-05-30 15:53:15 +0200 | [diff] [blame] | 517 | |
| 518 | ret = 0; |
| 519 | ro_cleanup: |
| 520 | qemu_vfree(buf); |
| 521 | |
Kevin Wolf | f8e2bd5 | 2016-05-30 16:29:47 +0200 | [diff] [blame] | 522 | blk_unref(backing); |
Kevin Wolf | d3f0675 | 2017-01-19 18:16:03 +0100 | [diff] [blame] | 523 | if (backing_file_bs) { |
Kevin Wolf | 12fa4af | 2017-02-17 20:42:32 +0100 | [diff] [blame] | 524 | bdrv_set_backing_hd(bs, backing_file_bs, &error_abort); |
Kevin Wolf | d3f0675 | 2017-01-19 18:16:03 +0100 | [diff] [blame] | 525 | } |
| 526 | bdrv_unref(commit_top_bs); |
| 527 | blk_unref(src); |
Kevin Wolf | f8e2bd5 | 2016-05-30 16:29:47 +0200 | [diff] [blame] | 528 | |
Kevin Wolf | 83fd6dd | 2016-05-30 15:53:15 +0200 | [diff] [blame] | 529 | if (ro) { |
| 530 | /* ignoring error return here */ |
Alberto Garcia | c742a36 | 2018-11-12 16:00:36 +0200 | [diff] [blame] | 531 | bdrv_reopen_set_read_only(bs->backing->bs, true, NULL); |
Kevin Wolf | 83fd6dd | 2016-05-30 15:53:15 +0200 | [diff] [blame] | 532 | } |
| 533 | |
| 534 | return ret; |
| 535 | } |