mirror of https://gitee.com/openkylin/qemu.git
block-migration: efficiently encode zero blocks
this patch adds a efficient encoding for zero blocks by adding a new flag indicating a block is completely zero. additionally bdrv_write_zeros() is used at the destination to efficiently write these zeroes. depending on the implementation this avoids that the destination target gets fully provisioned. Signed-off-by: Peter Lieven <pl@kamp.de> Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
This commit is contained in:
parent
8bf9344ad6
commit
323004a39d
|
@ -29,6 +29,7 @@
|
||||||
#define BLK_MIG_FLAG_DEVICE_BLOCK 0x01
|
#define BLK_MIG_FLAG_DEVICE_BLOCK 0x01
|
||||||
#define BLK_MIG_FLAG_EOS 0x02
|
#define BLK_MIG_FLAG_EOS 0x02
|
||||||
#define BLK_MIG_FLAG_PROGRESS 0x04
|
#define BLK_MIG_FLAG_PROGRESS 0x04
|
||||||
|
#define BLK_MIG_FLAG_ZERO_BLOCK 0x08
|
||||||
|
|
||||||
#define MAX_IS_ALLOCATED_SEARCH 65536
|
#define MAX_IS_ALLOCATED_SEARCH 65536
|
||||||
|
|
||||||
|
@ -80,6 +81,7 @@ typedef struct BlkMigState {
|
||||||
int shared_base;
|
int shared_base;
|
||||||
QSIMPLEQ_HEAD(bmds_list, BlkMigDevState) bmds_list;
|
QSIMPLEQ_HEAD(bmds_list, BlkMigDevState) bmds_list;
|
||||||
int64_t total_sector_sum;
|
int64_t total_sector_sum;
|
||||||
|
bool zero_blocks;
|
||||||
|
|
||||||
/* Protected by lock. */
|
/* Protected by lock. */
|
||||||
QSIMPLEQ_HEAD(blk_list, BlkMigBlock) blk_list;
|
QSIMPLEQ_HEAD(blk_list, BlkMigBlock) blk_list;
|
||||||
|
@ -114,16 +116,30 @@ static void blk_mig_unlock(void)
|
||||||
static void blk_send(QEMUFile *f, BlkMigBlock * blk)
|
static void blk_send(QEMUFile *f, BlkMigBlock * blk)
|
||||||
{
|
{
|
||||||
int len;
|
int len;
|
||||||
|
uint64_t flags = BLK_MIG_FLAG_DEVICE_BLOCK;
|
||||||
|
|
||||||
|
if (block_mig_state.zero_blocks &&
|
||||||
|
buffer_is_zero(blk->buf, BLOCK_SIZE)) {
|
||||||
|
flags |= BLK_MIG_FLAG_ZERO_BLOCK;
|
||||||
|
}
|
||||||
|
|
||||||
/* sector number and flags */
|
/* sector number and flags */
|
||||||
qemu_put_be64(f, (blk->sector << BDRV_SECTOR_BITS)
|
qemu_put_be64(f, (blk->sector << BDRV_SECTOR_BITS)
|
||||||
| BLK_MIG_FLAG_DEVICE_BLOCK);
|
| flags);
|
||||||
|
|
||||||
/* device name */
|
/* device name */
|
||||||
len = strlen(blk->bmds->bs->device_name);
|
len = strlen(blk->bmds->bs->device_name);
|
||||||
qemu_put_byte(f, len);
|
qemu_put_byte(f, len);
|
||||||
qemu_put_buffer(f, (uint8_t *)blk->bmds->bs->device_name, len);
|
qemu_put_buffer(f, (uint8_t *)blk->bmds->bs->device_name, len);
|
||||||
|
|
||||||
|
/* if a block is zero we need to flush here since the network
|
||||||
|
* bandwidth is now a lot higher than the storage device bandwidth.
|
||||||
|
* thus if we queue zero blocks we slow down the migration */
|
||||||
|
if (flags & BLK_MIG_FLAG_ZERO_BLOCK) {
|
||||||
|
qemu_fflush(f);
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
|
||||||
qemu_put_buffer(f, blk->buf, BLOCK_SIZE);
|
qemu_put_buffer(f, blk->buf, BLOCK_SIZE);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -344,6 +360,7 @@ static void init_blk_migration(QEMUFile *f)
|
||||||
block_mig_state.total_sector_sum = 0;
|
block_mig_state.total_sector_sum = 0;
|
||||||
block_mig_state.prev_progress = -1;
|
block_mig_state.prev_progress = -1;
|
||||||
block_mig_state.bulk_completed = 0;
|
block_mig_state.bulk_completed = 0;
|
||||||
|
block_mig_state.zero_blocks = migrate_zero_blocks();
|
||||||
|
|
||||||
bdrv_iterate(init_blk_migration_it, NULL);
|
bdrv_iterate(init_blk_migration_it, NULL);
|
||||||
}
|
}
|
||||||
|
@ -762,12 +779,15 @@ static int block_load(QEMUFile *f, void *opaque, int version_id)
|
||||||
nr_sectors = BDRV_SECTORS_PER_DIRTY_CHUNK;
|
nr_sectors = BDRV_SECTORS_PER_DIRTY_CHUNK;
|
||||||
}
|
}
|
||||||
|
|
||||||
buf = g_malloc(BLOCK_SIZE);
|
if (flags & BLK_MIG_FLAG_ZERO_BLOCK) {
|
||||||
|
ret = bdrv_write_zeroes(bs, addr, nr_sectors);
|
||||||
|
} else {
|
||||||
|
buf = g_malloc(BLOCK_SIZE);
|
||||||
|
qemu_get_buffer(f, buf, BLOCK_SIZE);
|
||||||
|
ret = bdrv_write(bs, addr, buf, nr_sectors);
|
||||||
|
g_free(buf);
|
||||||
|
}
|
||||||
|
|
||||||
qemu_get_buffer(f, buf, BLOCK_SIZE);
|
|
||||||
ret = bdrv_write(bs, addr, buf, nr_sectors);
|
|
||||||
|
|
||||||
g_free(buf);
|
|
||||||
if (ret < 0) {
|
if (ret < 0) {
|
||||||
return ret;
|
return ret;
|
||||||
}
|
}
|
||||||
|
|
|
@ -124,6 +124,7 @@ void migrate_add_blocker(Error *reason);
|
||||||
void migrate_del_blocker(Error *reason);
|
void migrate_del_blocker(Error *reason);
|
||||||
|
|
||||||
bool migrate_rdma_pin_all(void);
|
bool migrate_rdma_pin_all(void);
|
||||||
|
bool migrate_zero_blocks(void);
|
||||||
|
|
||||||
bool migrate_auto_converge(void);
|
bool migrate_auto_converge(void);
|
||||||
|
|
||||||
|
|
|
@ -493,6 +493,15 @@ bool migrate_auto_converge(void)
|
||||||
return s->enabled_capabilities[MIGRATION_CAPABILITY_AUTO_CONVERGE];
|
return s->enabled_capabilities[MIGRATION_CAPABILITY_AUTO_CONVERGE];
|
||||||
}
|
}
|
||||||
|
|
||||||
|
bool migrate_zero_blocks(void)
|
||||||
|
{
|
||||||
|
MigrationState *s;
|
||||||
|
|
||||||
|
s = migrate_get_current();
|
||||||
|
|
||||||
|
return s->enabled_capabilities[MIGRATION_CAPABILITY_ZERO_BLOCKS];
|
||||||
|
}
|
||||||
|
|
||||||
int migrate_use_xbzrle(void)
|
int migrate_use_xbzrle(void)
|
||||||
{
|
{
|
||||||
MigrationState *s;
|
MigrationState *s;
|
||||||
|
|
|
@ -613,10 +613,16 @@
|
||||||
# Disabled by default. Experimental: may (or may not) be renamed after
|
# Disabled by default. Experimental: may (or may not) be renamed after
|
||||||
# further testing is complete. (since 1.6)
|
# further testing is complete. (since 1.6)
|
||||||
#
|
#
|
||||||
|
# @zero-blocks: During storage migration encode blocks of zeroes efficiently. This
|
||||||
|
# essentially saves 1MB of zeroes per block on the wire. Enabling requires
|
||||||
|
# source and target VM to support this feature. To enable it is sufficient
|
||||||
|
# to enable the capability on the source VM. The feature is disabled by
|
||||||
|
# default. (since 1.6)
|
||||||
|
#
|
||||||
# Since: 1.2
|
# Since: 1.2
|
||||||
##
|
##
|
||||||
{ 'enum': 'MigrationCapability',
|
{ 'enum': 'MigrationCapability',
|
||||||
'data': ['xbzrle', 'x-rdma-pin-all', 'auto-converge'] }
|
'data': ['xbzrle', 'x-rdma-pin-all', 'auto-converge', 'zero-blocks'] }
|
||||||
|
|
||||||
##
|
##
|
||||||
# @MigrationCapabilityStatus
|
# @MigrationCapabilityStatus
|
||||||
|
|
Loading…
Reference in New Issue