2004-08-02 05:59:26 +08:00
|
|
|
/*
|
|
|
|
* QEMU System Emulator block driver
|
2007-09-17 05:08:06 +08:00
|
|
|
*
|
2004-08-02 05:59:26 +08:00
|
|
|
* Copyright (c) 2003 Fabrice Bellard
|
2007-09-17 05:08:06 +08:00
|
|
|
*
|
2004-08-02 05:59:26 +08:00
|
|
|
* Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
|
|
* of this software and associated documentation files (the "Software"), to deal
|
|
|
|
* in the Software without restriction, including without limitation the rights
|
|
|
|
* to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
|
|
* copies of the Software, and to permit persons to whom the Software is
|
|
|
|
* furnished to do so, subject to the following conditions:
|
|
|
|
*
|
|
|
|
* The above copyright notice and this permission notice shall be included in
|
|
|
|
* all copies or substantial portions of the Software.
|
|
|
|
*
|
|
|
|
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
|
|
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
|
|
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
|
|
|
|
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
|
|
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
|
|
* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
|
|
|
|
* THE SOFTWARE.
|
|
|
|
*/
|
|
|
|
#ifndef BLOCK_INT_H
|
|
|
|
#define BLOCK_INT_H
|
|
|
|
|
2007-11-11 10:51:17 +08:00
|
|
|
#include "block.h"
|
2009-05-18 22:42:10 +08:00
|
|
|
#include "qemu-option.h"
|
2010-04-10 14:02:42 +08:00
|
|
|
#include "qemu-queue.h"
|
2007-11-11 10:51:17 +08:00
|
|
|
|
2007-09-17 05:59:02 +08:00
|
|
|
/*
 * Image flag bits.  Each value is a distinct power of two, so the flags
 * can be OR-ed together into a single int.
 */
#define BLOCK_FLAG_ENCRYPT      1
#define BLOCK_FLAG_COMPRESS     2
#define BLOCK_FLAG_COMPAT6      4

/*
 * Option name strings.
 * NOTE(review): presumably these are the names looked up in a driver's
 * QEMUOptionParameter create_options list -- confirm against the callers.
 */
#define BLOCK_OPT_SIZE          "size"
#define BLOCK_OPT_ENCRYPT       "encryption"
#define BLOCK_OPT_COMPAT6       "compat6"
#define BLOCK_OPT_BACKING_FILE  "backing_file"
#define BLOCK_OPT_BACKING_FMT   "backing_fmt"
#define BLOCK_OPT_CLUSTER_SIZE  "cluster_size"
#define BLOCK_OPT_PREALLOC      "preallocation"
|
2009-05-18 22:42:10 +08:00
|
|
|
|
2009-03-21 02:25:59 +08:00
|
|
|
typedef struct AIOPool {
|
|
|
|
void (*cancel)(BlockDriverAIOCB *acb);
|
|
|
|
int aiocb_size;
|
|
|
|
BlockDriverAIOCB *free_aiocb;
|
|
|
|
} AIOPool;
|
|
|
|
|
2004-08-02 05:59:26 +08:00
|
|
|
struct BlockDriver {
|
|
|
|
const char *format_name;
|
|
|
|
int instance_size;
|
|
|
|
int (*bdrv_probe)(const uint8_t *buf, int buf_size, const char *filename);
|
2009-06-15 20:04:22 +08:00
|
|
|
int (*bdrv_probe_device)(const char *filename);
|
2010-04-14 20:17:38 +08:00
|
|
|
int (*bdrv_open)(BlockDriverState *bs, int flags);
|
|
|
|
int (*bdrv_file_open)(BlockDriverState *bs, const char *filename, int flags);
|
2007-09-17 05:08:06 +08:00
|
|
|
int (*bdrv_read)(BlockDriverState *bs, int64_t sector_num,
|
2004-08-02 05:59:26 +08:00
|
|
|
uint8_t *buf, int nb_sectors);
|
2007-09-17 05:08:06 +08:00
|
|
|
int (*bdrv_write)(BlockDriverState *bs, int64_t sector_num,
|
2004-08-02 05:59:26 +08:00
|
|
|
const uint8_t *buf, int nb_sectors);
|
2004-09-19 03:32:11 +08:00
|
|
|
void (*bdrv_close)(BlockDriverState *bs);
|
2009-05-18 22:42:10 +08:00
|
|
|
int (*bdrv_create)(const char *filename, QEMUOptionParameter *options);
|
2010-10-21 22:43:43 +08:00
|
|
|
int (*bdrv_flush)(BlockDriverState *bs);
|
2004-08-02 05:59:26 +08:00
|
|
|
int (*bdrv_is_allocated)(BlockDriverState *bs, int64_t sector_num,
|
|
|
|
int nb_sectors, int *pnum);
|
|
|
|
int (*bdrv_set_key)(BlockDriverState *bs, const char *key);
|
2005-12-19 02:28:15 +08:00
|
|
|
int (*bdrv_make_empty)(BlockDriverState *bs);
|
2006-08-02 00:21:11 +08:00
|
|
|
/* aio */
|
2009-04-08 02:43:24 +08:00
|
|
|
BlockDriverAIOCB *(*bdrv_aio_readv)(BlockDriverState *bs,
|
|
|
|
int64_t sector_num, QEMUIOVector *qiov, int nb_sectors,
|
2006-08-07 10:38:06 +08:00
|
|
|
BlockDriverCompletionFunc *cb, void *opaque);
|
2009-04-08 02:43:24 +08:00
|
|
|
BlockDriverAIOCB *(*bdrv_aio_writev)(BlockDriverState *bs,
|
|
|
|
int64_t sector_num, QEMUIOVector *qiov, int nb_sectors,
|
2006-08-07 10:38:06 +08:00
|
|
|
BlockDriverCompletionFunc *cb, void *opaque);
|
2009-09-05 01:01:49 +08:00
|
|
|
BlockDriverAIOCB *(*bdrv_aio_flush)(BlockDriverState *bs,
|
|
|
|
BlockDriverCompletionFunc *cb, void *opaque);
|
2006-08-02 00:21:11 +08:00
|
|
|
|
2009-09-09 23:53:37 +08:00
|
|
|
int (*bdrv_aio_multiwrite)(BlockDriverState *bs, BlockRequest *reqs,
|
|
|
|
int num_reqs);
|
|
|
|
int (*bdrv_merge_requests)(BlockDriverState *bs, BlockRequest* a,
|
|
|
|
BlockRequest *b);
|
|
|
|
|
|
|
|
|
2006-08-02 00:21:11 +08:00
|
|
|
const char *protocol_name;
|
|
|
|
int (*bdrv_truncate)(BlockDriverState *bs, int64_t offset);
|
|
|
|
int64_t (*bdrv_getlength)(BlockDriverState *bs);
|
2007-09-17 05:08:06 +08:00
|
|
|
int (*bdrv_write_compressed)(BlockDriverState *bs, int64_t sector_num,
|
2006-08-06 05:31:00 +08:00
|
|
|
const uint8_t *buf, int nb_sectors);
|
|
|
|
|
2007-09-17 05:08:06 +08:00
|
|
|
int (*bdrv_snapshot_create)(BlockDriverState *bs,
|
2006-08-06 05:31:00 +08:00
|
|
|
QEMUSnapshotInfo *sn_info);
|
2007-09-17 05:08:06 +08:00
|
|
|
int (*bdrv_snapshot_goto)(BlockDriverState *bs,
|
2006-08-06 05:31:00 +08:00
|
|
|
const char *snapshot_id);
|
|
|
|
int (*bdrv_snapshot_delete)(BlockDriverState *bs, const char *snapshot_id);
|
2007-09-17 05:08:06 +08:00
|
|
|
int (*bdrv_snapshot_list)(BlockDriverState *bs,
|
2006-08-06 05:31:00 +08:00
|
|
|
QEMUSnapshotInfo **psn_info);
|
2010-09-22 10:58:41 +08:00
|
|
|
int (*bdrv_snapshot_load_tmp)(BlockDriverState *bs,
|
|
|
|
const char *snapshot_name);
|
2006-08-06 05:31:00 +08:00
|
|
|
int (*bdrv_get_info)(BlockDriverState *bs, BlockDriverInfo *bdi);
|
2006-08-02 00:21:11 +08:00
|
|
|
|
2009-07-11 05:11:57 +08:00
|
|
|
int (*bdrv_save_vmstate)(BlockDriverState *bs, const uint8_t *buf,
|
|
|
|
int64_t pos, int size);
|
|
|
|
int (*bdrv_load_vmstate)(BlockDriverState *bs, uint8_t *buf,
|
|
|
|
int64_t pos, int size);
|
2009-04-06 03:10:55 +08:00
|
|
|
|
2010-01-12 19:55:17 +08:00
|
|
|
int (*bdrv_change_backing_file)(BlockDriverState *bs,
|
|
|
|
const char *backing_file, const char *backing_fmt);
|
|
|
|
|
2006-08-19 19:45:59 +08:00
|
|
|
/* removable device specific */
|
|
|
|
int (*bdrv_is_inserted)(BlockDriverState *bs);
|
|
|
|
int (*bdrv_media_changed)(BlockDriverState *bs);
|
|
|
|
int (*bdrv_eject)(BlockDriverState *bs, int eject_flag);
|
|
|
|
int (*bdrv_set_locked)(BlockDriverState *bs, int locked);
|
2007-09-17 16:09:54 +08:00
|
|
|
|
2007-12-25 00:10:43 +08:00
|
|
|
/* to control generic scsi devices */
|
|
|
|
int (*bdrv_ioctl)(BlockDriverState *bs, unsigned long int req, void *buf);
|
2009-03-29 01:28:41 +08:00
|
|
|
BlockDriverAIOCB *(*bdrv_aio_ioctl)(BlockDriverState *bs,
|
|
|
|
unsigned long int req, void *buf,
|
|
|
|
BlockDriverCompletionFunc *cb, void *opaque);
|
2007-12-25 00:10:43 +08:00
|
|
|
|
2009-05-18 22:42:10 +08:00
|
|
|
/* List of options for creating images, terminated by name == NULL */
|
|
|
|
QEMUOptionParameter *create_options;
|
|
|
|
|
2009-03-29 01:55:10 +08:00
|
|
|
|
2010-06-29 18:37:54 +08:00
|
|
|
/*
|
|
|
|
* Returns 0 for completed check, -errno for internal errors.
|
|
|
|
* The check results are stored in result.
|
|
|
|
*/
|
|
|
|
int (*bdrv_check)(BlockDriverState* bs, BdrvCheckResult *result);
|
2009-04-22 07:11:50 +08:00
|
|
|
|
2010-03-16 00:27:00 +08:00
|
|
|
void (*bdrv_debug_event)(BlockDriverState *bs, BlkDebugEvent event);
|
|
|
|
|
2010-07-28 17:26:29 +08:00
|
|
|
/*
|
|
|
|
* Returns 1 if newly created images are guaranteed to contain only
|
|
|
|
* zeros, 0 otherwise.
|
|
|
|
*/
|
|
|
|
int (*bdrv_has_zero_init)(BlockDriverState *bs);
|
2009-11-30 23:54:15 +08:00
|
|
|
|
2010-04-13 17:29:33 +08:00
|
|
|
QLIST_ENTRY(BlockDriver) list;
|
2004-08-02 05:59:26 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
struct BlockDriverState {
|
2006-08-06 21:35:09 +08:00
|
|
|
int64_t total_sectors; /* if we are reading a disk image, give its
|
|
|
|
size in sectors */
|
2004-08-02 05:59:26 +08:00
|
|
|
int read_only; /* if true, the media is read only */
|
2010-02-14 19:39:18 +08:00
|
|
|
int keep_read_only; /* if true, the media was requested to stay read only */
|
|
|
|
int open_flags; /* flags used to open the file, re-used for re-open */
|
2004-08-02 05:59:26 +08:00
|
|
|
int removable; /* if true, the media can be removed */
|
|
|
|
int locked; /* if true, the media cannot temporarily be ejected */
|
block: Change bdrv_eject() not to drop the image
bdrv_eject() gets called when a device model opens or closes the tray.
If the block driver implements method bdrv_eject(), that method gets
called. Drivers host_cdrom implements it, and it opens and closes the
physical tray, and nothing else. When a device model opens, then
closes the tray, media changes only if the user actively changes the
physical media while the tray is open. This is matches how physical
hardware behaves.
If the block driver doesn't implement method bdrv_eject(), we do
something quite different: opening the tray severs the connection to
the image by calling bdrv_close(), and closing the tray does nothing.
When the device model opens, then closes the tray, media is gone,
unless the user actively inserts another one while the tray is open,
with a suitable change command in the monitor. This isn't how
physical hardware behaves. Rather inconvenient when programs
"helpfully" eject media to give you a chance to change it. The way
bdrv_eject() behaves here turns that chance into a must, which is not
what these programs or their users expect.
Change the default action not to call bdrv_close(). Instead, note the
tray status in new BlockDriverState member tray_open. Use it in
bdrv_is_inserted().
Arguably, the device models should keep track of tray status
themselves. But this is less invasive.
Signed-off-by: Markus Armbruster <armbru@redhat.com>
Signed-off-by: Kevin Wolf <kwolf@redhat.com>
2010-07-27 20:02:01 +08:00
|
|
|
int tray_open; /* if true, the virtual tray is open */
|
2004-08-02 05:59:26 +08:00
|
|
|
int encrypted; /* if true, the media is encrypted */
|
2009-03-06 07:01:01 +08:00
|
|
|
int valid_key; /* if true, a valid encryption key has been set */
|
2007-12-25 00:10:43 +08:00
|
|
|
int sg; /* if true, the device is a /dev/sg* */
|
2004-08-02 05:59:26 +08:00
|
|
|
/* event callback when inserting/removing */
|
|
|
|
void (*change_cb)(void *opaque);
|
|
|
|
void *change_opaque;
|
|
|
|
|
2006-08-19 19:45:59 +08:00
|
|
|
BlockDriver *drv; /* NULL means no media */
|
2004-08-02 05:59:26 +08:00
|
|
|
void *opaque;
|
|
|
|
|
2010-06-29 22:58:30 +08:00
|
|
|
DeviceState *peer;
|
|
|
|
|
2004-08-02 05:59:26 +08:00
|
|
|
char filename[1024];
|
|
|
|
char backing_file[1024]; /* if non zero, the image is a diff of
|
|
|
|
this file image */
|
2009-03-29 01:55:10 +08:00
|
|
|
char backing_format[16]; /* if non-zero and backing_file exists */
|
2004-08-02 05:59:26 +08:00
|
|
|
int is_temporary;
|
2006-08-19 19:45:59 +08:00
|
|
|
int media_changed;
|
|
|
|
|
2004-08-02 05:59:26 +08:00
|
|
|
BlockDriverState *backing_hd;
|
2010-04-14 20:17:38 +08:00
|
|
|
BlockDriverState *file;
|
|
|
|
|
2006-08-07 10:38:06 +08:00
|
|
|
/* async read/write emulation */
|
2006-08-02 00:21:11 +08:00
|
|
|
|
2006-08-07 10:38:06 +08:00
|
|
|
void *sync_aiocb;
|
2007-09-17 16:09:54 +08:00
|
|
|
|
2007-12-02 13:18:19 +08:00
|
|
|
/* I/O stats (display with "info blockstats"). */
|
|
|
|
uint64_t rd_bytes;
|
|
|
|
uint64_t wr_bytes;
|
|
|
|
uint64_t rd_ops;
|
|
|
|
uint64_t wr_ops;
|
2010-04-28 20:34:01 +08:00
|
|
|
uint64_t wr_highest_sector;
|
2007-12-02 13:18:19 +08:00
|
|
|
|
2009-03-04 01:37:16 +08:00
|
|
|
/* Whether the disk can expand beyond total_sectors */
|
|
|
|
int growable;
|
|
|
|
|
2009-04-23 04:20:00 +08:00
|
|
|
/* the memory alignment required for the buffers handled by this driver */
|
|
|
|
int buffer_alignment;
|
|
|
|
|
2009-09-05 01:01:15 +08:00
|
|
|
/* do we need to tell the quest if we have a volatile write cache? */
|
|
|
|
int enable_write_cache;
|
|
|
|
|
2004-08-02 05:59:26 +08:00
|
|
|
/* NOTE: the following infos are only hints for real hardware
|
|
|
|
drivers. They are not used by the block driver */
|
2004-11-16 09:45:27 +08:00
|
|
|
int cyls, heads, secs, translation;
|
2004-08-02 05:59:26 +08:00
|
|
|
int type;
|
2010-06-03 00:55:17 +08:00
|
|
|
BlockErrorAction on_read_error, on_write_error;
|
2004-08-02 05:59:26 +08:00
|
|
|
char device_name[32];
|
2009-12-01 01:21:20 +08:00
|
|
|
unsigned long *dirty_bitmap;
|
2010-01-26 16:31:48 +08:00
|
|
|
int64_t dirty_count;
|
2010-04-10 14:02:42 +08:00
|
|
|
QTAILQ_ENTRY(BlockDriverState) list;
|
2009-02-11 23:20:29 +08:00
|
|
|
void *private;
|
2004-08-02 05:59:26 +08:00
|
|
|
};
|
|
|
|
|
2006-08-02 00:21:11 +08:00
|
|
|
struct BlockDriverAIOCB {
|
2009-03-21 02:25:59 +08:00
|
|
|
AIOPool *pool;
|
2006-08-02 00:21:11 +08:00
|
|
|
BlockDriverState *bs;
|
|
|
|
BlockDriverCompletionFunc *cb;
|
2006-08-07 10:38:06 +08:00
|
|
|
void *opaque;
|
|
|
|
BlockDriverAIOCB *next;
|
2006-08-02 00:21:11 +08:00
|
|
|
};
|
|
|
|
|
2005-12-19 02:28:15 +08:00
|
|
|
void get_tmp_filename(char *filename, int size);
|
|
|
|
|
2009-05-25 18:37:32 +08:00
|
|
|
void *qemu_aio_get(AIOPool *pool, BlockDriverState *bs,
|
|
|
|
BlockDriverCompletionFunc *cb, void *opaque);
|
2006-08-07 10:38:06 +08:00
|
|
|
void qemu_aio_release(void *p);
|
|
|
|
|
2009-04-23 04:20:00 +08:00
|
|
|
void *qemu_blockalign(BlockDriverState *bs, size_t size);
|
|
|
|
|
2009-06-15 20:04:22 +08:00
|
|
|
#ifdef _WIN32
|
|
|
|
int is_windows_drive(const char *filename);
|
|
|
|
#endif
|
|
|
|
|
block: add topology qdev properties
Add three new qdev properties to export block topology information to
the guest. This is needed to get optimal I/O alignment for RAID arrays
or SSDs.
The options are:
- physical_block_size to specify the physical block size of the device,
this is going to increase from 512 bytes to 4096 bytes for many
modern storage devices
- min_io_size to specify the minimal I/O size without performance impact,
this is typically set to the RAID chunk size for arrays.
- opt_io_size to specify the optimal sustained I/O size, this is
typically the RAID stripe width for arrays.
I decided to not auto-probe these values from blkid which might easily
be possible as I don't know how to deal with these issues on migration.
Note that we specifically only set the physical_block_size, and not the
logical one which is the unit all I/O is described in. The reason for
that is that IDE does not support increasing the logical block size and
at least for now I want to stick to one mechanism in queue and allow
for easy switching of transports for a given backing image which would
not be possible if scsi and virtio use real 4k sectors, while ide only
uses the physical block exponent.
To make this more common for the different block drivers introduce a
new BlockConf structure holding all common block properties and a
DEFINE_BLOCK_PROPERTIES macro to add them all together, mirroring
what is done for network drivers. Also switch over all block drivers
to use it, except for the floppy driver which has weird driveA/driveB
properties and probably won't require any advanced block options ever.
Example usage for a virtio device with 4k physical block size and
8k optimal I/O size:
-drive file=scratch.img,media=disk,cache=none,id=scratch \
-device virtio-blk-pci,drive=scratch,physical_block_size=4096,opt_io_size=8192
aliguori: updated patch to take into account BLOCK events
Signed-off-by: Christoph Hellwig <hch@lst.de>
Signed-off-by: Anthony Liguori <aliguori@us.ibm.com>
2010-02-11 06:37:09 +08:00
|
|
|
typedef struct BlockConf {
|
2010-05-05 22:36:52 +08:00
|
|
|
BlockDriverState *bs;
|
block: add topology qdev properties
Add three new qdev properties to export block topology information to
the guest. This is needed to get optimal I/O alignment for RAID arrays
or SSDs.
The options are:
- physical_block_size to specify the physical block size of the device,
this is going to increase from 512 bytes to 4096 kilobytes for many
modern storage devices
- min_io_size to specify the minimal I/O size without performance impact,
this is typically set to the RAID chunk size for arrays.
- opt_io_size to specify the optimal sustained I/O size, this is
typically the RAID stripe width for arrays.
I decided to not auto-probe these values from blkid which might easily
be possible as I don't know how to deal with these issues on migration.
Note that we specificly only set the physical_block_size, and not the
logial one which is the unit all I/O is described in. The reason for
that is that IDE does not support increasing the logical block size and
at last for now I want to stick to one meachnisms in queue and allow
for easy switching of transports for a given backing image which would
not be possible if scsi and virtio use real 4k sectors, while ide only
uses the physical block exponent.
To make this more common for the different block drivers introduce a
new BlockConf structure holding all common block properties and a
DEFINE_BLOCK_PROPERTIES macro to add them all together, mirroring
what is done for network drivers. Also switch over all block drivers
to use it, except for the floppy driver which has weird driveA/driveB
properties and probably won't require any advanced block options ever.
Example usage for a virtio device with 4k physical block size and
8k optimal I/O size:
-drive file=scratch.img,media=disk,cache=none,id=scratch \
-device virtio-blk-pci,drive=scratch,physical_block_size=4096,opt_io_size=8192
aliguori: updated patch to take into account BLOCK events
Signed-off-by: Christoph Hellwig <hch@lst.de>
Signed-off-by: Anthony Liguori <aliguori@us.ibm.com>
2010-02-11 06:37:09 +08:00
|
|
|
uint16_t physical_block_size;
|
2010-03-04 21:20:17 +08:00
|
|
|
uint16_t logical_block_size;
|
block: add topology qdev properties
Add three new qdev properties to export block topology information to
the guest. This is needed to get optimal I/O alignment for RAID arrays
or SSDs.
The options are:
- physical_block_size to specify the physical block size of the device,
this is going to increase from 512 bytes to 4096 kilobytes for many
modern storage devices
- min_io_size to specify the minimal I/O size without performance impact,
this is typically set to the RAID chunk size for arrays.
- opt_io_size to specify the optimal sustained I/O size, this is
typically the RAID stripe width for arrays.
I decided to not auto-probe these values from blkid which might easily
be possible as I don't know how to deal with these issues on migration.
Note that we specificly only set the physical_block_size, and not the
logial one which is the unit all I/O is described in. The reason for
that is that IDE does not support increasing the logical block size and
at last for now I want to stick to one meachnisms in queue and allow
for easy switching of transports for a given backing image which would
not be possible if scsi and virtio use real 4k sectors, while ide only
uses the physical block exponent.
To make this more common for the different block drivers introduce a
new BlockConf structure holding all common block properties and a
DEFINE_BLOCK_PROPERTIES macro to add them all together, mirroring
what is done for network drivers. Also switch over all block drivers
to use it, except for the floppy driver which has weird driveA/driveB
properties and probably won't require any advanced block options ever.
Example usage for a virtio device with 4k physical block size and
8k optimal I/O size:
-drive file=scratch.img,media=disk,cache=none,id=scratch \
-device virtio-blk-pci,drive=scratch,physical_block_size=4096,opt_io_size=8192
aliguori: updated patch to take into account BLOCK events
Signed-off-by: Christoph Hellwig <hch@lst.de>
Signed-off-by: Anthony Liguori <aliguori@us.ibm.com>
2010-02-11 06:37:09 +08:00
|
|
|
uint16_t min_io_size;
|
|
|
|
uint32_t opt_io_size;
|
|
|
|
} BlockConf;
|
|
|
|
|
|
|
|
/*
 * Compute the physical block exponent of a block configuration.
 *
 * Counts how many times conf->physical_block_size has to be halved until
 * it is no longer greater than conf->logical_block_size.  When both sizes
 * are powers of two this is log2(physical_block_size / logical_block_size).
 *
 * Returns 0 when the physical block size does not exceed the logical one.
 */
static inline unsigned int get_physical_block_exp(BlockConf *conf)
{
    /* named 'exponent' rather than 'exp' to avoid shadowing exp() from
       <math.h> */
    unsigned int exponent = 0;
    unsigned int size;

    for (size = conf->physical_block_size;
         size > conf->logical_block_size;
         size >>= 1) {
        exponent++;
    }

    return exponent;
}
|
|
|
|
|
|
|
|
/*
 * Expands to the qdev property entries shared by the block device models:
 * "drive", "logical_block_size" (default 512), "physical_block_size"
 * (default 512), "min_io_size" (default 0) and "opt_io_size" (default 0).
 *
 * _state is the device state type and _conf the name of its BlockConf
 * member.  The expansion has no trailing comma, so it can be followed by
 * further entries in a property list.
 *
 * Example usage for a virtio device with 4k physical block size and
 * 8k optimal I/O size:
 *   -drive file=scratch.img,media=disk,cache=none,id=scratch
 *   -device virtio-blk-pci,drive=scratch,physical_block_size=4096,opt_io_size=8192
 */
#define DEFINE_BLOCK_PROPERTIES(_state, _conf)                          \
    DEFINE_PROP_DRIVE("drive", _state, _conf.bs),                       \
    DEFINE_PROP_UINT16("logical_block_size", _state,                    \
                       _conf.logical_block_size, 512),                  \
    DEFINE_PROP_UINT16("physical_block_size", _state,                   \
                       _conf.physical_block_size, 512),                 \
    DEFINE_PROP_UINT16("min_io_size", _state, _conf.min_io_size, 0),    \
    DEFINE_PROP_UINT32("opt_io_size", _state, _conf.opt_io_size, 0)
|
block: add topology qdev properties
Add three new qdev properties to export block topology information to
the guest. This is needed to get optimal I/O alignment for RAID arrays
or SSDs.
The options are:
- physical_block_size to specify the physical block size of the device,
this is going to increase from 512 bytes to 4096 bytes for many
modern storage devices
- min_io_size to specify the minimal I/O size without performance impact,
this is typically set to the RAID chunk size for arrays.
- opt_io_size to specify the optimal sustained I/O size, this is
typically the RAID stripe width for arrays.
I decided to not auto-probe these values from blkid which might easily
be possible as I don't know how to deal with these issues on migration.
Note that we specifically only set the physical_block_size, and not the
logical one which is the unit all I/O is described in. The reason for
that is that IDE does not support increasing the logical block size and
at least for now I want to stick to one mechanism in queue and allow
for easy switching of transports for a given backing image which would
not be possible if scsi and virtio use real 4k sectors, while ide only
uses the physical block exponent.
To make this more common for the different block drivers introduce a
new BlockConf structure holding all common block properties and a
DEFINE_BLOCK_PROPERTIES macro to add them all together, mirroring
what is done for network drivers. Also switch over all block drivers
to use it, except for the floppy driver which has weird driveA/driveB
properties and probably won't require any advanced block options ever.
Example usage for a virtio device with 4k physical block size and
8k optimal I/O size:
-drive file=scratch.img,media=disk,cache=none,id=scratch \
-device virtio-blk-pci,drive=scratch,physical_block_size=4096,opt_io_size=8192
aliguori: updated patch to take into account BLOCK events
Signed-off-by: Christoph Hellwig <hch@lst.de>
Signed-off-by: Anthony Liguori <aliguori@us.ibm.com>
2010-02-11 06:37:09 +08:00
|
|
|
|
2004-08-02 05:59:26 +08:00
|
|
|
#endif /* BLOCK_INT_H */
|