2008-12-05 04:33:06 +08:00
|
|
|
/*
|
|
|
|
* Virtio Balloon Device
|
|
|
|
*
|
|
|
|
* Copyright IBM, Corp. 2008
|
|
|
|
*
|
|
|
|
* Authors:
|
|
|
|
* Anthony Liguori <aliguori@us.ibm.com>
|
|
|
|
*
|
|
|
|
* This work is licensed under the terms of the GNU GPL, version 2. See
|
|
|
|
* the COPYING file in the top-level directory.
|
|
|
|
*
|
|
|
|
*/
|
|
|
|
|
2010-04-27 20:34:06 +08:00
|
|
|
#include "iov.h"
|
2008-12-05 04:33:06 +08:00
|
|
|
#include "qemu-common.h"
|
|
|
|
#include "virtio.h"
|
|
|
|
#include "pc.h"
|
|
|
|
#include "cpu.h"
|
2010-01-27 04:17:35 +08:00
|
|
|
#include "monitor.h"
|
2008-12-05 04:33:06 +08:00
|
|
|
#include "balloon.h"
|
|
|
|
#include "virtio-balloon.h"
|
|
|
|
#include "kvm.h"
|
2010-01-27 04:17:35 +08:00
|
|
|
#include "qlist.h"
|
|
|
|
#include "qint.h"
|
|
|
|
#include "qstring.h"
|
2008-12-05 04:33:06 +08:00
|
|
|
|
|
|
|
#if defined(__linux__)
|
|
|
|
#include <sys/mman.h>
|
|
|
|
#endif
|
|
|
|
|
2010-09-15 00:43:39 +08:00
|
|
|
/* Disable guest-provided stats for now (https://bugzilla.redhat.com/show_bug.cgi?id=623903) */
|
|
|
|
#define ENABLE_GUEST_STATS 0
|
|
|
|
|
|
|
|
|
2008-12-05 04:33:06 +08:00
|
|
|
typedef struct VirtIOBalloon
|
|
|
|
{
|
|
|
|
VirtIODevice vdev;
|
2010-01-27 04:17:35 +08:00
|
|
|
VirtQueue *ivq, *dvq, *svq;
|
2008-12-05 04:33:06 +08:00
|
|
|
uint32_t num_pages;
|
|
|
|
uint32_t actual;
|
2010-01-27 04:17:35 +08:00
|
|
|
uint64_t stats[VIRTIO_BALLOON_S_NR];
|
|
|
|
VirtQueueElement stats_vq_elem;
|
|
|
|
size_t stats_vq_offset;
|
|
|
|
MonitorCompletion *stats_callback;
|
|
|
|
void *stats_opaque_callback_data;
|
2008-12-05 04:33:06 +08:00
|
|
|
} VirtIOBalloon;
|
|
|
|
|
|
|
|
/*
 * Convert a generic virtio device pointer into the balloon device that
 * embeds it.  This is a plain cast, valid because 'vdev' is the first
 * member of VirtIOBalloon.
 */
static VirtIOBalloon *to_virtio_balloon(VirtIODevice *vdev)
{
    VirtIOBalloon *balloon = (VirtIOBalloon *)vdev;

    return balloon;
}
|
|
|
|
|
|
|
|
static void balloon_page(void *addr, int deflate)
|
|
|
|
{
|
|
|
|
#if defined(__linux__)
|
|
|
|
if (!kvm_enabled() || kvm_has_sync_mmu())
|
2010-09-25 19:26:05 +08:00
|
|
|
qemu_madvise(addr, TARGET_PAGE_SIZE,
|
|
|
|
deflate ? QEMU_MADV_WILLNEED : QEMU_MADV_DONTNEED);
|
2008-12-05 04:33:06 +08:00
|
|
|
#endif
|
|
|
|
}
|
|
|
|
|
2010-01-27 04:17:35 +08:00
|
|
|
/*
|
|
|
|
* reset_stats - Mark all items in the stats array as unset
|
|
|
|
*
|
|
|
|
* This function needs to be called at device intialization and before
|
|
|
|
* before updating to a set of newly-generated stats. This will ensure that no
|
|
|
|
* stale values stick around in case the guest reports a subset of the supported
|
|
|
|
* statistics.
|
|
|
|
*/
|
|
|
|
static inline void reset_stats(VirtIOBalloon *dev)
|
|
|
|
{
|
|
|
|
int i;
|
|
|
|
for (i = 0; i < VIRTIO_BALLOON_S_NR; dev->stats[i++] = -1);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
 * Add one statistic to @dict under key @label, unless @val carries the
 * "unset" marker (all bits set, i.e. (uint64_t)-1), in which case the
 * dictionary is left untouched.
 */
static void stat_put(QDict *dict, const char *label, uint64_t val)
{
    if (val == (uint64_t)-1) {
        return;
    }

    qdict_put(dict, label, qint_from_int(val));
}
|
|
|
|
|
|
|
|
/*
 * Build a new QDict describing the balloon state and return it as a QObject.
 *
 * "actual" is always present: ram_size minus the ballooned amount, where the
 * ballooned amount is dev->actual shifted by VIRTIO_BALLOON_PFN_SHIFT.
 * The guest-provided statistics are added only when ENABLE_GUEST_STATS is
 * non-zero, and only for entries that are not marked unset.
 *
 * The dictionary comes from qdict_new(); this function does not release it.
 */
static QObject *get_stats_qobject(VirtIOBalloon *dev)
{
#if ENABLE_GUEST_STATS
    /* Dictionary key for each guest statistic, in emission order. */
    static const struct {
        const char *label;
        int tag;
    } guest_stats[] = {
        { "mem_swapped_in",    VIRTIO_BALLOON_S_SWAP_IN },
        { "mem_swapped_out",   VIRTIO_BALLOON_S_SWAP_OUT },
        { "major_page_faults", VIRTIO_BALLOON_S_MAJFLT },
        { "minor_page_faults", VIRTIO_BALLOON_S_MINFLT },
        { "free_mem",          VIRTIO_BALLOON_S_MEMFREE },
        { "total_mem",         VIRTIO_BALLOON_S_MEMTOT },
    };
    size_t i;
#endif
    QDict *dict = qdict_new();
    /* Widen before shifting so the byte count cannot overflow 32 bits. */
    uint64_t ballooned = (uint64_t) dev->actual << VIRTIO_BALLOON_PFN_SHIFT;
    uint64_t actual = ram_size - ballooned;

    stat_put(dict, "actual", actual);

#if ENABLE_GUEST_STATS
    for (i = 0; i < sizeof(guest_stats) / sizeof(guest_stats[0]); i++) {
        stat_put(dict, guest_stats[i].label, dev->stats[guest_stats[i].tag]);
    }
#endif

    return QOBJECT(dict);
}
|
|
|
|
|
2008-12-05 04:33:06 +08:00
|
|
|
/*
 * Queue handler shared by the ivq and dvq page-list queues.
 *
 * Each popped element is read as a packed array of 32-bit page frame
 * numbers.  Every PFN is turned into a physical address, looked up with
 * cpu_get_physical_page_desc(), and, if the descriptor says plain RAM,
 * handed to balloon_page().  Pages arriving on dvq are deflated; pages on
 * any other queue are inflated.  The element is then pushed back with the
 * number of bytes consumed and the guest is notified.
 */
static void virtio_balloon_handle_output(VirtIODevice *vdev, VirtQueue *vq)
{
    VirtIOBalloon *s = to_virtio_balloon(vdev);
    /* The queue identity, not the payload, selects the direction. */
    const int deflate = (vq == s->dvq);
    VirtQueueElement elem;

    while (virtqueue_pop(vq, &elem)) {
        size_t consumed = 0;
        uint32_t pfn;

        for (;;) {
            ram_addr_t guest_pa;
            ram_addr_t page_desc;

            /* Stop at the first short read: no complete PFN is left. */
            if (iov_to_buf(elem.out_sg, elem.out_num, &pfn, consumed,
                           sizeof(pfn)) != sizeof(pfn)) {
                break;
            }
            consumed += sizeof(pfn);

            guest_pa = (ram_addr_t)ldl_p(&pfn) << VIRTIO_BALLOON_PFN_SHIFT;
            page_desc = cpu_get_physical_page_desc(guest_pa);

            /* Only pages whose descriptor marks them as RAM are ballooned. */
            if ((page_desc & ~TARGET_PAGE_MASK) == IO_MEM_RAM) {
                /* Using qemu_get_ram_ptr is bending the rules a bit, but
                   should be OK because we only want a single page.  */
                balloon_page(qemu_get_ram_ptr(page_desc), deflate);
            }
        }

        virtqueue_push(vq, &elem, consumed);
        virtio_notify(vdev, vq);
    }
}
|
|
|
|
|
2010-01-27 04:17:35 +08:00
|
|
|
/*
 * Finish the pending stats request, if there is one.
 *
 * Builds the stats object, hands it to the registered completion callback,
 * drops the local reference and clears the pending-request state so that a
 * new request can be accepted.
 *
 * A request is considered pending when stats_callback is set.  That is the
 * same field virtio_balloon_stat() tests before accepting a new request, so
 * a request registered with a NULL opaque pointer is still completed rather
 * than blocking every later request, and a NULL callback is never invoked.
 */
static void complete_stats_request(VirtIOBalloon *vb)
{
    QObject *stats;

    if (vb->stats_callback == NULL) {
        return;
    }

    stats = get_stats_qobject(vb);
    vb->stats_callback(vb->stats_opaque_callback_data, stats);
    qobject_decref(stats);

    vb->stats_opaque_callback_data = NULL;
    vb->stats_callback = NULL;
}
|
|
|
|
|
|
|
|
/*
 * Queue handler for the stats virtqueue.
 *
 * Pops one element into s->stats_vq_elem, clears the cached statistics and
 * refills them from the (tag, value) records in the element.  Records whose
 * tag is out of range are ignored.  The number of bytes consumed is stored
 * in s->stats_vq_offset and any pending stats request is completed.  The
 * element is not pushed back here; virtio_balloon_stat() does that.
 */
static void virtio_balloon_receive_stats(VirtIODevice *vdev, VirtQueue *vq)
{
    VirtIOBalloon *s = DO_UPCAST(VirtIOBalloon, vdev, vdev);
    VirtQueueElement *elem = &s->stats_vq_elem;
    VirtIOBalloonStat record;
    size_t consumed;

    if (!virtqueue_pop(vq, elem)) {
        return;
    }

    /* Initialize the stats to get rid of any stale values.  This is only
     * needed to handle the case where a guest supports fewer stats than it
     * used to (ie. it has booted into an old kernel).
     */
    reset_stats(s);

    for (consumed = 0;
         iov_to_buf(elem->out_sg, elem->out_num, &record, consumed,
                    sizeof(record)) == sizeof(record);
         consumed += sizeof(record)) {
        uint16_t tag = tswap16(record.tag);
        uint64_t val = tswap64(record.val);

        if (tag >= VIRTIO_BALLOON_S_NR) {
            continue;
        }
        s->stats[tag] = val;
    }

    s->stats_vq_offset = consumed;

    complete_stats_request(s);
}
|
|
|
|
|
2008-12-05 04:33:06 +08:00
|
|
|
/*
 * Fill @config_data with the device config space: num_pages followed by
 * actual, both converted from host order to little-endian.  Exactly 8 bytes
 * are written.
 */
static void virtio_balloon_get_config(VirtIODevice *vdev, uint8_t *config_data)
{
    VirtIOBalloon *dev = to_virtio_balloon(vdev);
    struct virtio_balloon_config config = {
        .num_pages = cpu_to_le32(dev->num_pages),
        .actual = cpu_to_le32(dev->actual),
    };

    memcpy(config_data, &config, 8);
}
|
|
|
|
|
|
|
|
/*
 * Accept a config space write.
 *
 * Only the 'actual' field is taken from @config_data; it is converted from
 * little-endian to host order before being stored.  Exactly 8 bytes are
 * read from @config_data.
 */
static void virtio_balloon_set_config(VirtIODevice *vdev,
                                      const uint8_t *config_data)
{
    struct virtio_balloon_config guest_config;
    VirtIOBalloon *dev;

    memcpy(&guest_config, config_data, 8);

    dev = to_virtio_balloon(vdev);
    dev->actual = le32_to_cpu(guest_config.actual);
}
|
|
|
|
|
2010-01-10 19:52:53 +08:00
|
|
|
/*
 * Return the feature bits in @f with VIRTIO_BALLOON_F_STATS_VQ added.
 * @vdev is not consulted.
 */
static uint32_t virtio_balloon_get_features(VirtIODevice *vdev, uint32_t f)
{
    return f | (1 << VIRTIO_BALLOON_F_STATS_VQ);
}
|
|
|
|
|
2011-07-20 15:49:07 +08:00
|
|
|
/*
 * Start a stats request on behalf of the monitor.
 *
 * @opaque:  the VirtIOBalloon device
 * @cb:      completion callback invoked once stats are available
 * @cb_data: opaque argument for @cb
 *
 * If a request is already pending the new one is dropped silently and @cb is
 * not called.  If guest stats are compiled in and the guest negotiated
 * VIRTIO_BALLOON_F_STATS_VQ, the retained stats element is pushed back to
 * the guest and the request completes later from
 * virtio_balloon_receive_stats().  Otherwise the request is completed
 * immediately, with the cached guest stats cleared.
 */
static void virtio_balloon_stat(void *opaque, MonitorCompletion cb,
                                void *cb_data)
{
    VirtIOBalloon *dev = opaque;
    int ask_guest;

    /* For now, only allow one request at a time.  This restriction can be
     * removed later by queueing callback and data pairs.
     */
    if (dev->stats_callback != NULL) {
        return;
    }

    dev->stats_callback = cb;
    dev->stats_opaque_callback_data = cb_data;

    ask_guest = ENABLE_GUEST_STATS
        && (dev->vdev.guest_features & (1 << VIRTIO_BALLOON_F_STATS_VQ));

    if (!ask_guest) {
        /* Stats are not supported.  Clear out any stale values that might
         * have been set by a more featureful guest kernel.
         */
        reset_stats(dev);
        complete_stats_request(dev);
        return;
    }

    virtqueue_push(dev->svq, &dev->stats_vq_elem, dev->stats_vq_offset);
    virtio_notify(&dev->vdev, dev->svq);
}
|
|
|
|
|
2010-01-27 04:17:35 +08:00
|
|
|
static void virtio_balloon_to_target(void *opaque, ram_addr_t target,
|
|
|
|
MonitorCompletion cb, void *cb_data)
|
2008-12-05 04:33:06 +08:00
|
|
|
{
|
|
|
|
VirtIOBalloon *dev = opaque;
|
|
|
|
|
2011-07-20 15:49:07 +08:00
|
|
|
if (target > ram_size) {
|
2008-12-05 04:33:06 +08:00
|
|
|
target = ram_size;
|
2011-07-20 15:49:07 +08:00
|
|
|
}
|
2008-12-05 04:33:06 +08:00
|
|
|
if (target) {
|
|
|
|
dev->num_pages = (ram_size - target) >> VIRTIO_BALLOON_PFN_SHIFT;
|
|
|
|
virtio_notify_config(&dev->vdev);
|
2010-01-27 04:17:35 +08:00
|
|
|
} else {
|
2011-07-20 15:49:07 +08:00
|
|
|
virtio_balloon_stat(opaque, cb, cb_data);
|
2008-12-05 04:33:06 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
 * savevm handler: write the common virtio state followed by num_pages and
 * actual, each as a big-endian 32-bit value.  The order must match
 * virtio_balloon_load().
 */
static void virtio_balloon_save(QEMUFile *f, void *opaque)
{
    VirtIOBalloon *balloon = opaque;

    /* Common virtio state goes first. */
    virtio_save(&balloon->vdev, f);

    /* Balloon-specific fields. */
    qemu_put_be32(f, balloon->num_pages);
    qemu_put_be32(f, balloon->actual);
}
|
|
|
|
|
|
|
|
/*
 * loadvm handler: restore the state written by virtio_balloon_save().
 *
 * @f:          migration stream to read from
 * @opaque:     the VirtIOBalloon device
 * @version_id: stream format version; only version 1 is accepted
 *
 * Returns 0 on success, -EINVAL for an unsupported version, or the non-zero
 * value reported by virtio_load() when restoring the common virtio state
 * fails.  In the latter case the balloon-specific fields are left untouched
 * rather than being filled from a stream the common code already rejected.
 */
static int virtio_balloon_load(QEMUFile *f, void *opaque, int version_id)
{
    VirtIOBalloon *s = opaque;
    int ret;

    if (version_id != 1) {
        return -EINVAL;
    }

    /* Do not ignore a failed load of the common state. */
    ret = virtio_load(&s->vdev, f);
    if (ret) {
        return ret;
    }

    s->num_pages = qemu_get_be32(f);
    s->actual = qemu_get_be32(f);

    return 0;
}
|
|
|
|
|
2009-05-18 21:51:59 +08:00
|
|
|
/*
 * Create and register a virtio balloon device.
 *
 * Allocates the device through virtio_common_init() with an 8-byte config
 * space, installs the config/feature callbacks, creates the three queues
 * (ivq, dvq, svq, in that order, 128 entries each), marks all stats as
 * unset, registers the balloon handler and the savevm handlers (version 1).
 *
 * Returns the embedded VirtIODevice.
 */
VirtIODevice *virtio_balloon_init(DeviceState *dev)
{
    VirtIODevice *vdev;
    VirtIOBalloon *s;

    vdev = virtio_common_init("virtio-balloon", VIRTIO_ID_BALLOON,
                              8, sizeof(VirtIOBalloon));
    /* vdev is the first member of VirtIOBalloon, so this is the same object. */
    s = (VirtIOBalloon *)vdev;

    vdev->get_config = virtio_balloon_get_config;
    vdev->set_config = virtio_balloon_set_config;
    vdev->get_features = virtio_balloon_get_features;

    /* Queue creation order is kept exactly as before. */
    s->ivq = virtio_add_queue(vdev, 128, virtio_balloon_handle_output);
    s->dvq = virtio_add_queue(vdev, 128, virtio_balloon_handle_output);
    s->svq = virtio_add_queue(vdev, 128, virtio_balloon_receive_stats);

    reset_stats(s);
    qemu_add_balloon_handler(virtio_balloon_to_target, s);

    register_savevm(dev, "virtio-balloon", -1, 1,
                    virtio_balloon_save, virtio_balloon_load, s);

    return vdev;
}
|