[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]
Re: [Qemu-block] [PATCH 13/21] qcow2: add .bdrv_store_persistent_dirty_b
From: |
Max Reitz |
Subject: |
Re: [Qemu-block] [PATCH 13/21] qcow2: add .bdrv_store_persistent_dirty_bitmaps() |
Date: |
Fri, 9 Dec 2016 18:05:27 +0100 |
User-agent: |
Mozilla/5.0 (X11; Linux x86_64; rv:45.0) Gecko/20100101 Thunderbird/45.5.1 |
On 22.11.2016 18:26, Vladimir Sementsov-Ogievskiy wrote:
> Realize block bitmap storing interface, to allow qcow2 images store
> persistent bitmaps.
>
> Signed-off-by: Vladimir Sementsov-Ogievskiy <address@hidden>
> ---
> block/qcow2-bitmap.c | 451
> +++++++++++++++++++++++++++++++++++++++++++++++++++
> block/qcow2.c | 1 +
> block/qcow2.h | 1 +
> 3 files changed, 453 insertions(+)
>
> diff --git a/block/qcow2-bitmap.c b/block/qcow2-bitmap.c
> index 81be1ca..a975388 100644
> --- a/block/qcow2-bitmap.c
> +++ b/block/qcow2-bitmap.c
> @@ -28,6 +28,7 @@
> #include "qemu/osdep.h"
> #include "qapi/error.h"
> #include "exec/log.h"
> +#include "qemu/cutils.h"
>
> #include "block/block_int.h"
> #include "block/qcow2.h"
> @@ -43,6 +44,10 @@
> #define BME_MIN_GRANULARITY_BITS 9
> #define BME_MAX_NAME_SIZE 1023
>
> +#if BME_MAX_TABLE_SIZE * 8ULL > INT_MAX
> +#error In the code bitmap table physical size assumed to fit into int
> +#endif
> +
> /* Bitmap directory entry flags */
> #define BME_RESERVED_FLAGS 0xfffffffcU
> #define BME_FLAG_IN_USE 1
> @@ -74,6 +79,8 @@ typedef struct Qcow2Bitmap {
> uint8_t granularity_bits;
> char *name;
>
> + BdrvDirtyBitmap *dirty_bitmap;
(I'm not quite happy with the asymmetry of this field (it isn't set by
load_bitmap(), but it is required by store_bitmap()), but making it
symmetric either by making load_bitmap() set it or by store_bitmap() not
reading it (but getting the value through an explicit parameter) makes
the code needlessly more complicated, so I guess I'll have to stay
not-quite-happy.)
> +
> QSIMPLEQ_ENTRY(Qcow2Bitmap) entry;
> } Qcow2Bitmap;
> typedef QSIMPLEQ_HEAD(Qcow2BitmapList, Qcow2Bitmap) Qcow2BitmapList;
> @@ -87,6 +94,27 @@ static inline bool can_write(BlockDriverState *bs)
> return !bdrv_is_read_only(bs) && !(bdrv_get_flags(bs) & BDRV_O_INACTIVE);
> }
>
> +static int update_header_sync(BlockDriverState *bs)
> +{
> + int ret;
> +
> + ret = qcow2_update_header(bs);
> + if (ret < 0) {
> + return ret;
> + }
> +
> + /* We doesn't return bdrv_flush error code. Even if it fails, write was
s/doesn't/don't/
(Also, there's a double space after return.)
> + * successful and it is more logical to consider that header is in the
> new
> + * state than in the old.
> + */
> + ret = bdrv_flush(bs);
> + if (ret < 0) {
> + fprintf(stderr, "Failed to flush qcow2 header");
> + }
> +
> + return 0;
> +}
> +
> static inline void bitmap_table_to_cpu(uint64_t *bitmap_table, size_t size)
> {
> size_t i;
> @@ -96,6 +124,15 @@ static inline void bitmap_table_to_cpu(uint64_t
> *bitmap_table, size_t size)
> }
> }
>
> +static inline void bitmap_table_to_be(uint64_t *bitmap_table, size_t size)
> +{
> + size_t i;
> +
> + for (i = 0; i < size; ++i) {
> + cpu_to_be64s(&bitmap_table[i]);
> + }
> +}
> +
> /* Check table entry specification constraints. If cluster_size is 0, offset
> * alignment is not checked. */
> static int check_table_entry(uint64_t entry, int cluster_size)
> @@ -121,6 +158,51 @@ static int check_table_entry(uint64_t entry, int
> cluster_size)
> return 0;
> }
>
> +static int check_constraints_on_bitmap(BlockDriverState *bs,
> + const char *name,
> + uint32_t granularity)
> +{
> + BDRVQcow2State *s = bs->opaque;
> + int granularity_bits = ctz32(granularity);
> +
> + int64_t nb_sectors = bdrv_nb_sectors(bs);
> +
> + if (nb_sectors < 0) {
> + return nb_sectors;
> + }
> +
> + uint64_t phys_bitmap_bytes = (nb_sectors << BDRV_SECTOR_BITS) >>
Using bdrv_getlength() would be simpler.
> + granularity_bits;
> + uint64_t bitmap_table_size = phys_bitmap_bytes / s->cluster_size;
Should be a DIV_ROUND_UP().
> + size_t name_size = strlen(name);
> +
> + int fail =
I'd personally like a bool more.
> + (bitmap_table_size > BME_MAX_TABLE_SIZE) ||
> + (phys_bitmap_bytes > BME_MAX_PHYS_SIZE) ||
> + (granularity_bits > BME_MAX_GRANULARITY_BITS) ||
> + (granularity_bits < BME_MIN_GRANULARITY_BITS) ||
> + (name_size > BME_MAX_NAME_SIZE);
> +
> + return fail ? -EINVAL : 0;
> +}
> +
> +static void clear_bitmap_table(BlockDriverState *bs, uint64_t *bitmap_table,
> + uint32_t bitmap_table_size)
> +{
> + BDRVQcow2State *s = bs->opaque;
> + int i;
> +
> + for (i = 0; i < bitmap_table_size; ++i) {
> + uint64_t addr = bitmap_table[i] & BME_TABLE_ENTRY_OFFSET_MASK;
> + if (!addr) {
> + continue;
> + }
> +
> + qcow2_free_clusters(bs, addr, s->cluster_size, QCOW2_DISCARD_OTHER);
> + bitmap_table[i] = 0;
> + }
> +}
> +
> static int bitmap_table_load(BlockDriverState *bs, Qcow2Bitmap *bm,
> uint64_t **bitmap_table)
> {
> @@ -159,6 +241,28 @@ fail:
> return ret;
> }
>
> +static int free_bitmap_clusters(BlockDriverState *bs, Qcow2Bitmap *bm)
> +{
> + int ret;
> + uint64_t *bitmap_table;
> +
> + ret = bitmap_table_load(bs, bm, &bitmap_table);
> + if (ret < 0) {
> + assert(bitmap_table == NULL);
> + return ret;
> + }
> +
> + clear_bitmap_table(bs, bitmap_table, bm->table_size);
> + qcow2_free_clusters(bs, bm->table_offset, bm->table_size *
> sizeof(uint64_t),
> + QCOW2_DISCARD_OTHER);
> + g_free(bitmap_table);
> +
> + bm->table_offset = 0;
> + bm->table_size = 0;
> +
> + return 0;
> +}
> +
> /* This function returns the number of disk sectors covered by a single
> cluster
> * of bitmap data. */
> static uint64_t disk_sectors_in_bitmap_cluster(const BDRVQcow2State *s,
> @@ -603,6 +707,72 @@ fail:
> * Bitmap List end
> */
>
> +static int update_ext_header_and_dir(BlockDriverState *bs,
> + Qcow2BitmapList *bm_list)
> +{
> + BDRVQcow2State *s = bs->opaque;
> + int ret;
> + Qcow2Bitmap *bm;
> + uint64_t new_offset = 0;
> + uint64_t new_size = 0;
> + uint32_t new_nb_bitmaps = 0;
> + uint64_t old_offset = s->bitmap_directory_offset;
> + uint64_t old_size = s->bitmap_directory_size;
> + uint32_t old_nb_bitmaps = s->nb_bitmaps;
> + uint64_t old_autocl = s->autoclear_features;
> +
> + if (bm_list != NULL && !QSIMPLEQ_EMPTY(bm_list)) {
> + QSIMPLEQ_FOREACH(bm, bm_list, entry) {
> + new_nb_bitmaps++;
> + }
> +
> + if (new_nb_bitmaps > QCOW2_MAX_BITMAPS) {
> + return -EINVAL;
> + }
> +
> + ret = bitmap_list_store(bs, bm_list, &new_offset, &new_size, false);
> + if (ret < 0) {
> + return ret;
> + }
> +
> + ret = bdrv_flush(bs);
> + if (ret < 0) {
> + goto fail;
> + }
I think this only needs to flush bs->file, not bs itself. Alternatively,
bitmap_list_store() could just use bdrv_pwrite_sync().
> +
> + s->autoclear_features |= QCOW2_AUTOCLEAR_BITMAPS;
> + } else {
> + s->autoclear_features &= ~(uint64_t)QCOW2_AUTOCLEAR_BITMAPS;
> + }
> +
> + s->bitmap_directory_offset = new_offset;
> + s->bitmap_directory_size = new_size;
> + s->nb_bitmaps = new_nb_bitmaps;
> +
> + ret = update_header_sync(bs);
> + if (ret < 0) {
> + goto fail;
> + }
> +
> + if (old_size > 0) {
> + qcow2_free_clusters(bs, old_offset, old_size, QCOW2_DISCARD_OTHER);
> + }
> +
> + return 0;
> +
> +fail:
> + if (new_offset > 0) {
> + qcow2_free_clusters(bs, new_offset, new_size, QCOW2_DISCARD_OTHER);
> + }
> +
> + s->bitmap_directory_offset = old_offset;
> + s->bitmap_directory_size = old_size;
> + s->nb_bitmaps = old_nb_bitmaps;
> + s->autoclear_features = old_autocl;
> +
> + return ret;
> +}
> +
> /* for g_slist_foreach for GSList of BdrvDirtyBitmap* elements */
> static void release_dirty_bitmap_helper(gpointer bitmap,
> gpointer bs)
> @@ -664,3 +834,284 @@ fail:
> g_slist_free(created_dirty_bitmaps);
> bitmap_list_free(bm_list);
> }
> +
> +/* store_bitmap_data()
> + * Store bitmap to image, filling bitmap table accordingly.
> + */
> +static uint64_t *store_bitmap_data(BlockDriverState *bs,
> + BdrvDirtyBitmap *bitmap,
> + uint32_t *bitmap_table_size, Error **errp)
> +{
> + int ret;
> + BDRVQcow2State *s = bs->opaque;
> + int64_t sector;
> + uint64_t dsc;
> + uint64_t bm_size = bdrv_dirty_bitmap_size(bitmap);
> + const char *bm_name = bdrv_dirty_bitmap_name(bitmap);
> + uint8_t *buf = NULL;
> + BdrvDirtyBitmapIter *dbi;
> + uint64_t *tb;
> + uint64_t tb_size =
> + size_to_clusters(s,
> + bdrv_dirty_bitmap_serialization_size(bitmap, 0, bm_size));
> +
> + if (tb_size > BME_MAX_TABLE_SIZE ||
> + tb_size * s->cluster_size > BME_MAX_PHYS_SIZE) {
Alignment to the opening parenthesis, please.
> + error_setg(errp, "Bitmap '%s' is too big", bm_name);
> + return NULL;
> + }
> +
> + tb = g_try_new0(uint64_t, tb_size);
> + if (tb == NULL) {
> + error_setg(errp, "No memory");
> + return NULL;
> + }
> +
> + dbi = bdrv_dirty_iter_new(bitmap, 0);
> + buf = g_malloc(s->cluster_size);
> + dsc = disk_sectors_in_bitmap_cluster(s, bitmap);
> +
> + while ((sector = bdrv_dirty_iter_next(dbi)) != -1) {
> + uint64_t cluster = sector / dsc;
> + uint64_t end, write_size;
> + int64_t off;
> +
> + sector = cluster * dsc;
> + end = MIN(bm_size, sector + dsc);
> + write_size =
> + bdrv_dirty_bitmap_serialization_size(bitmap, sector, end -
> sector);
> +
> + off = qcow2_alloc_clusters(bs, s->cluster_size);
> + if (off < 0) {
> + error_setg_errno(errp, -off,
> + "Failed to allocate clusters for bitmap '%s'",
> + bm_name);
> + goto fail;
> + }
> + tb[cluster] = off;
Somehow I would feel better with either an assert(cluster < tb_size);
here or an assert(bdrv_nb_sectors(bs) / dsc == tb_size); (plus the error
handling for bdrv_nb_sectors()) above the loop.
> +
> + bdrv_dirty_bitmap_serialize_part(bitmap, buf, sector, end - sector);
> + if (write_size < s->cluster_size) {
> + memset(buf + write_size, 0, s->cluster_size - write_size);
> + }
Should we assert that write_size <= s->cluster_size?
> +
> + ret = qcow2_pre_write_overlap_check(bs, 0, off, s->cluster_size);
> + if (ret < 0) {
> + error_setg_errno(errp, -ret, "Qcow2 overlap check failed");
> + goto fail;
> + }
> +
> + ret = bdrv_pwrite(bs->file, off, buf, s->cluster_size);
> + if (ret < 0) {
> + error_setg_errno(errp, -ret, "Failed to write bitmap '%s' to
> file",
> + bm_name);
> + goto fail;
> + }
> +
> + if (end >= bm_size) {
> + break;
> + }
> +
> + bdrv_set_dirty_iter(dbi, end);
> + }
> +
> + *bitmap_table_size = tb_size;
> + g_free(buf);
> + bdrv_dirty_iter_free(dbi);
> +
> + return tb;
> +
> +fail:
> + clear_bitmap_table(bs, tb, tb_size);
> + g_free(buf);
> + bdrv_dirty_iter_free(dbi);
> + g_free(tb);
> +
> + return NULL;
> +}
> +
> +/* store_bitmap()
> + * Store bm->dirty_bitmap to qcow2.
> + * Set bm->table_offset and bm->table_size accordingly.
> + */
> +static int store_bitmap(BlockDriverState *bs, Qcow2Bitmap *bm, Error **errp)
> +{
> + int ret;
> + uint64_t *tb;
> + int64_t tb_offset;
> + uint32_t tb_size;
> + BdrvDirtyBitmap *bitmap = bm->dirty_bitmap;
> + const char *bm_name;
> +
> + assert(bitmap != NULL);
> +
> + bm_name = bdrv_dirty_bitmap_name(bitmap);
> +
> + tb = store_bitmap_data(bs, bitmap, &tb_size, errp);
> + if (tb == NULL) {
> + g_free(tb);
> + return -EINVAL;
> + }
> +
> + assert(tb_size <= BME_MAX_TABLE_SIZE);
> + tb_offset = qcow2_alloc_clusters(bs, tb_size * sizeof(tb[0]));
> + if (tb_offset < 0) {
> + error_setg_errno(errp, -tb_offset,
> + "Failed to allocate clusters for bitmap '%s'",
> + bm_name);
> + goto fail;
> + }
> +
> + ret = qcow2_pre_write_overlap_check(bs, 0, tb_offset,
> + tb_size * sizeof(tb[0]));
> + if (ret < 0) {
> + error_setg_errno(errp, -ret, "Qcow2 overlap check failed");
> + goto fail;
> + }
> +
> + bitmap_table_to_be(tb, tb_size);
> + ret = bdrv_pwrite(bs->file, tb_offset, tb, tb_size * sizeof(tb[0]));
> + if (ret < 0) {
> + error_setg_errno(errp, -ret, "Failed to write bitmap '%s' to file",
> + bm_name);
> + goto fail;
> + }
> +
> + g_free(tb);
> +
> + bm->table_offset = tb_offset;
> + bm->table_size = tb_size;
> +
> + return 0;
> +
> +fail:
> + clear_bitmap_table(bs, tb, tb_size);
> +
> + if (tb_offset > 0) {
> + qcow2_free_clusters(bs, tb_offset, tb_size, QCOW2_DISCARD_OTHER);
tb_size should be tb_size * sizeof(uint64_t) (or sizeof(tb[0])).
> + }
> +
> + g_free(tb);
> +
> + return ret;
> +}
> +
> +static Qcow2Bitmap *find_bitmap_by_name(Qcow2BitmapList *bm_list,
> + const char *name)
> +{
> + Qcow2Bitmap *bm;
> +
> + QSIMPLEQ_FOREACH(bm, bm_list, entry) {
> + if (strcmp(name, bm->name) == 0) {
> + return bm;
> + }
> + }
> +
> + return NULL;
> +}
> +
> +void qcow2_store_persistent_dirty_bitmaps(BlockDriverState *bs, Error **errp)
> +{
> + BdrvDirtyBitmap *bitmap;
> + BDRVQcow2State *s = bs->opaque;
> + uint32_t new_nb_bitmaps = s->nb_bitmaps;
> + uint64_t new_dir_size = s->bitmap_directory_size;
> + int ret;
> + Qcow2BitmapList *bm_list;
> + Qcow2Bitmap *bm;
> +
> + if (!bdrv_has_persistent_bitmaps(bs)) {
> + /* nothing to do */
> + return;
Maybe there is something to do. See [1].
> + }
> +
> + if (s->nb_bitmaps == 0) {
> + bm_list = bitmap_list_new();
> + } else {
> + bm_list = bitmap_list_load(bs, s->bitmap_directory_offset,
> + s->bitmap_directory_size, errp);
> + if (bm_list == NULL) {
> + /* errp is already set */
> + return;
> + }
> + }
> +
> + /* check constraints and names */
> + for (bitmap = bdrv_dirty_bitmap_next(bs, NULL); bitmap != NULL;
> + bitmap = bdrv_dirty_bitmap_next(bs, bitmap)) {
Alignment to the opening parenthesis, please.
> + const char *name = bdrv_dirty_bitmap_name(bitmap);
> + uint32_t granularity = bdrv_dirty_bitmap_granularity(bitmap);
> + Qcow2Bitmap *bm;
> +
> + if (!bdrv_dirty_bitmap_get_persistance(bitmap)) {
> + continue;
> + }
> +
> + if (++new_nb_bitmaps > QCOW2_MAX_BITMAPS) {
> + error_setg(errp, "Too many persistent bitmaps");
> + goto fail;
> + }
> +
> + new_dir_size += calc_dir_entry_size(strlen(name), 0);
> + if (new_dir_size > QCOW2_MAX_BITMAP_DIRECTORY_SIZE) {
> + error_setg(errp, "Too large bitmap directory");
> + goto fail;
> + }
You only need to increment new_nb_bitmaps and increase new_dir_size if
the bitmap does not already exist in the image (i.e. if
find_bitmap_by_name() below returns NULL).
> +
> + if (check_constraints_on_bitmap(bs, name, granularity) < 0) {
> + error_setg(errp, "Bitmap '%s' doesn't satisfy the constraints",
> + name);
> + goto fail;
> + }
> +
> + bm = find_bitmap_by_name(bm_list, name);
> + if (bm == NULL) {
> + bm = g_new0(Qcow2Bitmap, 1);
> + bm->name = g_strdup(name);
> + QSIMPLEQ_INSERT_TAIL(bm_list, bm, entry);
> + } else {
> + if (!(bm->flags & BME_FLAG_IN_USE) && can_write(bs)) {
Shouldn't we error out right at the beginning of this function if
can_write(bs) is false?
> + error_setg(errp, "Bitmap '%s' is already exists in the
> image",
> + name);
> + goto fail;
> + }
> + free_bitmap_clusters(bs, bm);
These clusters should not be freed until the new data has been written
successfully.
> + /* TODO it is better to reuse these clusters */
> + }
> + bm->flags = bdrv_dirty_bitmap_get_autoload(bitmap) ? BME_FLAG_AUTO :
> 0;
> + bm->granularity_bits = ctz32(bdrv_dirty_bitmap_granularity(bitmap));
> + bm->dirty_bitmap = bitmap;
> + }
[1] What about bitmaps that have BME_FLAG_IN_USE set but do not have a
corresponding BDS bitmap?
If such a bitmap does not have BME_FLAG_AUTO set, we didn't set the
flag, so we should keep it unchanged. That's what this function is
currently doing.
However, if such a bitmap does have BME_FLAG_AUTO set, it was definitely
us who set the IN_USE flag (because otherwise we would have aborted
loading the bitmaps, and thus also aborted bdrv_open_common()).
Therefore, the only explanation is that the bitmap was deleted in the
meantime, and that means we should also delete it in the qcow2 file.
Max
> +
> + /* allocate clusters and store bitmaps */
> + QSIMPLEQ_FOREACH(bm, bm_list, entry) {
> + if (bm->dirty_bitmap == NULL) {
> + continue;
> + }
> +
> + ret = store_bitmap(bs, bm, errp);
> + if (ret < 0) {
> + goto fail;
> + }
> + }
> +
> + ret = update_ext_header_and_dir(bs, bm_list);
> + if (ret < 0) {
> + error_setg_errno(errp, -ret, "Failed to update bitmap extension");
> + goto fail;
> + }
> +
> + bitmap_list_free(bm_list);
> + return;
> +
> +fail:
> + QSIMPLEQ_FOREACH(bm, bm_list, entry) {
> + if (bm->dirty_bitmap == NULL || bm->table_offset == 0) {
> + continue;
> + }
> +
> + free_bitmap_clusters(bs, bm);
> + }
> +
> + bitmap_list_free(bm_list);
> +}
> diff --git a/block/qcow2.c b/block/qcow2.c
> index 443be0e..66c7f74 100644
> --- a/block/qcow2.c
> +++ b/block/qcow2.c
> @@ -3515,6 +3515,7 @@ BlockDriver bdrv_qcow2 = {
> .bdrv_attach_aio_context = qcow2_attach_aio_context,
>
> .bdrv_load_autoloading_dirty_bitmaps =
> qcow2_load_autoloading_dirty_bitmaps,
> + .bdrv_store_persistent_dirty_bitmaps =
> qcow2_store_persistent_dirty_bitmaps,
> };
>
> static void bdrv_qcow2_init(void)
> diff --git a/block/qcow2.h b/block/qcow2.h
> index bcedf5b..d9a7643 100644
> --- a/block/qcow2.h
> +++ b/block/qcow2.h
> @@ -615,5 +615,6 @@ void qcow2_cache_put(BlockDriverState *bs, Qcow2Cache *c,
> void **table);
>
> /* qcow2-bitmap.c functions */
> void qcow2_load_autoloading_dirty_bitmaps(BlockDriverState *bs, Error
> **errp);
> +void qcow2_store_persistent_dirty_bitmaps(BlockDriverState *bs, Error
> **errp);
>
> #endif
>
signature.asc
Description: OpenPGP digital signature
- Re: [Qemu-block] [PATCH 13/21] qcow2: add .bdrv_store_persistent_dirty_bitmaps(),
Max Reitz <=