/*
 * Copy-on-read filter block driver
 *
 * Copyright (c) 2018 Red Hat, Inc.
 *
 * Author:
 *   Max Reitz <mreitz@redhat.com>
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License as
 * published by the Free Software Foundation; either version 2 or
 * (at your option) version 3 of the License.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, see <http://www.gnu.org/licenses/>.
 */
#include "qemu/osdep.h"
#include "block/block_int.h"
#include "qemu/module.h"
#include "qapi/error.h"
#include "qapi/qmp/qdict.h"
#include "block/copy-on-read.h"
31 typedef struct BDRVStateCOR
{
33 BlockDriverState
*bottom_bs
;
38 static int cor_open(BlockDriverState
*bs
, QDict
*options
, int flags
,
41 BlockDriverState
*bottom_bs
= NULL
;
42 BDRVStateCOR
*state
= bs
->opaque
;
43 /* Find a bottom node name, if any */
44 const char *bottom_node
= qdict_get_try_str(options
, "bottom");
46 bs
->file
= bdrv_open_child(NULL
, options
, "file", bs
, &child_of_bds
,
47 BDRV_CHILD_FILTERED
| BDRV_CHILD_PRIMARY
,
53 bs
->supported_read_flags
= BDRV_REQ_PREFETCH
;
55 bs
->supported_write_flags
= BDRV_REQ_WRITE_UNCHANGED
|
56 (BDRV_REQ_FUA
& bs
->file
->bs
->supported_write_flags
);
58 bs
->supported_zero_flags
= BDRV_REQ_WRITE_UNCHANGED
|
59 ((BDRV_REQ_FUA
| BDRV_REQ_MAY_UNMAP
| BDRV_REQ_NO_FALLBACK
) &
60 bs
->file
->bs
->supported_zero_flags
);
63 bottom_bs
= bdrv_find_node(bottom_node
);
65 error_setg(errp
, "Bottom node '%s' not found", bottom_node
);
66 qdict_del(options
, "bottom");
69 qdict_del(options
, "bottom");
71 if (!bottom_bs
->drv
) {
72 error_setg(errp
, "Bottom node '%s' not opened", bottom_node
);
76 if (bottom_bs
->drv
->is_filter
) {
77 error_setg(errp
, "Bottom node '%s' is a filter", bottom_node
);
81 if (bdrv_freeze_backing_chain(bs
, bottom_bs
, errp
) < 0) {
84 state
->chain_frozen
= true;
87 * We do freeze the chain, so it shouldn't be removed. Still, storing a
88 * pointer worth bdrv_ref().
93 state
->bottom_bs
= bottom_bs
;
96 * We don't need to call bdrv_child_refresh_perms() now as the permissions
97 * will be updated later when the filter node gets its parent.
/*
 * PERM_PASSTHROUGH: permissions that cor_child_perm() forwards unchanged
 * between the filter's parents and its child.
 * PERM_UNCHANGED: every other permission; always offered as shared.
 *
 * NOTE(review): the operands after BLK_PERM_CONSISTENT_READ should be
 * confirmed against the definition of record.
 */
#define PERM_PASSTHROUGH (BLK_PERM_CONSISTENT_READ \
                          | BLK_PERM_WRITE \
                          | BLK_PERM_RESIZE)
#define PERM_UNCHANGED (BLK_PERM_ALL & ~PERM_PASSTHROUGH)
109 static void cor_child_perm(BlockDriverState
*bs
, BdrvChild
*c
,
111 BlockReopenQueue
*reopen_queue
,
112 uint64_t perm
, uint64_t shared
,
113 uint64_t *nperm
, uint64_t *nshared
)
115 BDRVStateCOR
*s
= bs
->opaque
;
119 * While the filter is being removed
122 *nshared
= BLK_PERM_ALL
;
126 *nperm
= perm
& PERM_PASSTHROUGH
;
127 *nshared
= (shared
& PERM_PASSTHROUGH
) | PERM_UNCHANGED
;
129 /* We must not request write permissions for an inactive node, the child
130 * cannot provide it. */
131 if (!(bs
->open_flags
& BDRV_O_INACTIVE
)) {
132 *nperm
|= BLK_PERM_WRITE_UNCHANGED
;
137 static int64_t cor_getlength(BlockDriverState
*bs
)
139 return bdrv_getlength(bs
->file
->bs
);
143 static int coroutine_fn
cor_co_preadv_part(BlockDriverState
*bs
,
144 uint64_t offset
, uint64_t bytes
,
152 BDRVStateCOR
*state
= bs
->opaque
;
154 if (!state
->bottom_bs
) {
155 return bdrv_co_preadv_part(bs
->file
, offset
, bytes
, qiov
, qiov_offset
,
156 flags
| BDRV_REQ_COPY_ON_READ
);
162 /* In case of failure, try to copy-on-read anyway */
163 ret
= bdrv_is_allocated(bs
->file
->bs
, offset
, bytes
, &n
);
165 ret
= bdrv_is_allocated_above(bdrv_backing_chain_next(bs
->file
->bs
),
166 state
->bottom_bs
, true, offset
,
168 if (ret
> 0 || ret
< 0) {
169 local_flags
|= BDRV_REQ_COPY_ON_READ
;
171 /* Finish earlier if the end of a backing file has been reached */
177 /* Skip if neither read nor write are needed */
178 if ((local_flags
& (BDRV_REQ_PREFETCH
| BDRV_REQ_COPY_ON_READ
)) !=
180 ret
= bdrv_co_preadv_part(bs
->file
, offset
, n
, qiov
, qiov_offset
,
196 static int coroutine_fn
cor_co_pwritev_part(BlockDriverState
*bs
,
200 size_t qiov_offset
, int flags
)
202 return bdrv_co_pwritev_part(bs
->file
, offset
, bytes
, qiov
, qiov_offset
,
207 static int coroutine_fn
cor_co_pwrite_zeroes(BlockDriverState
*bs
,
208 int64_t offset
, int bytes
,
209 BdrvRequestFlags flags
)
211 return bdrv_co_pwrite_zeroes(bs
->file
, offset
, bytes
, flags
);
215 static int coroutine_fn
cor_co_pdiscard(BlockDriverState
*bs
,
216 int64_t offset
, int bytes
)
218 return bdrv_co_pdiscard(bs
->file
, offset
, bytes
);
222 static int coroutine_fn
cor_co_pwritev_compressed(BlockDriverState
*bs
,
227 return bdrv_co_pwritev(bs
->file
, offset
, bytes
, qiov
,
228 BDRV_REQ_WRITE_COMPRESSED
);
232 static void cor_eject(BlockDriverState
*bs
, bool eject_flag
)
234 bdrv_eject(bs
->file
->bs
, eject_flag
);
238 static void cor_lock_medium(BlockDriverState
*bs
, bool locked
)
240 bdrv_lock_medium(bs
->file
->bs
, locked
);
244 static void cor_close(BlockDriverState
*bs
)
246 BDRVStateCOR
*s
= bs
->opaque
;
248 if (s
->chain_frozen
) {
249 s
->chain_frozen
= false;
250 bdrv_unfreeze_backing_chain(bs
, s
->bottom_bs
);
253 bdrv_unref(s
->bottom_bs
);
257 static BlockDriver bdrv_copy_on_read
= {
258 .format_name
= "copy-on-read",
259 .instance_size
= sizeof(BDRVStateCOR
),
261 .bdrv_open
= cor_open
,
262 .bdrv_close
= cor_close
,
263 .bdrv_child_perm
= cor_child_perm
,
265 .bdrv_getlength
= cor_getlength
,
267 .bdrv_co_preadv_part
= cor_co_preadv_part
,
268 .bdrv_co_pwritev_part
= cor_co_pwritev_part
,
269 .bdrv_co_pwrite_zeroes
= cor_co_pwrite_zeroes
,
270 .bdrv_co_pdiscard
= cor_co_pdiscard
,
271 .bdrv_co_pwritev_compressed
= cor_co_pwritev_compressed
,
273 .bdrv_eject
= cor_eject
,
274 .bdrv_lock_medium
= cor_lock_medium
,
276 .has_variable_length
= true,
281 void bdrv_cor_filter_drop(BlockDriverState
*cor_filter_bs
)
284 BlockDriverState
*bs
;
285 BDRVStateCOR
*s
= cor_filter_bs
->opaque
;
287 child
= bdrv_filter_child(cor_filter_bs
);
293 /* Retain the BDS until we complete the graph change. */
295 /* Hold a guest back from writing while permissions are being reset. */
296 bdrv_drained_begin(bs
);
297 /* Drop permissions before the graph change. */
299 /* unfreeze, as otherwise bdrv_replace_node() will fail */
300 if (s
->chain_frozen
) {
301 s
->chain_frozen
= false;
302 bdrv_unfreeze_backing_chain(cor_filter_bs
, s
->bottom_bs
);
304 bdrv_child_refresh_perms(cor_filter_bs
, child
, &error_abort
);
305 bdrv_replace_node(cor_filter_bs
, bs
, &error_abort
);
307 bdrv_drained_end(bs
);
309 bdrv_unref(cor_filter_bs
);
313 static void bdrv_copy_on_read_init(void)
315 bdrv_register(&bdrv_copy_on_read
);
/* Hook the registration function into block-module initialisation. */
block_init(bdrv_copy_on_read_init);