eda7362af9
Pre-copy support allows the VFIO device data to be transferred while the VM is running. This helps to accommodate VFIO devices that have a large amount of data that needs to be transferred, and it can reduce migration downtime. Pre-copy support is optional in VFIO migration protocol v2. Implement pre-copy of VFIO migration protocol v2 and use it for devices that support it. Full description of it can be found in the following Linux commit: 4db52602a607 ("vfio: Extend the device migration protocol with PRE_COPY"). Signed-off-by: Avihai Horon <avihaih@nvidia.com> Reviewed-by: Cédric Le Goater <clg@redhat.com> Tested-by: YangHang Liu <yanghliu@redhat.com> Acked-by: Alex Williamson <alex.williamson@redhat.com> Signed-off-by: Cédric Le Goater <clg@redhat.com>
257 lines
7.9 KiB
C
257 lines
7.9 KiB
C
/*
|
|
* common header for vfio based device assignment support
|
|
*
|
|
* Copyright Red Hat, Inc. 2012
|
|
*
|
|
* Authors:
|
|
* Alex Williamson <alex.williamson@redhat.com>
|
|
*
|
|
* This work is licensed under the terms of the GNU GPL, version 2. See
|
|
* the COPYING file in the top-level directory.
|
|
*
|
|
* Based on qemu-kvm device-assignment:
|
|
* Adapted for KVM by Qumranet.
|
|
* Copyright (c) 2007, Neocleus, Alex Novik (alex@neocleus.com)
|
|
* Copyright (c) 2007, Neocleus, Guy Zana (guy@neocleus.com)
|
|
* Copyright (C) 2008, Qumranet, Amit Shah (amit.shah@qumranet.com)
|
|
* Copyright (C) 2008, Red Hat, Amit Shah (amit.shah@redhat.com)
|
|
* Copyright (C) 2008, IBM, Muli Ben-Yehuda (muli@il.ibm.com)
|
|
*/
|
|
|
|
#ifndef HW_VFIO_VFIO_COMMON_H
|
|
#define HW_VFIO_VFIO_COMMON_H
|
|
|
|
#include "exec/memory.h"
|
|
#include "qemu/queue.h"
|
|
#include "qemu/notify.h"
|
|
#include "ui/console.h"
|
|
#include "hw/display/ramfb.h"
|
|
#ifdef CONFIG_LINUX
|
|
#include <linux/vfio.h>
|
|
#endif
|
|
#include "sysemu/sysemu.h"
|
|
|
|
#define VFIO_MSG_PREFIX "vfio %s: "
|
|
|
|
enum {
|
|
VFIO_DEVICE_TYPE_PCI = 0,
|
|
VFIO_DEVICE_TYPE_PLATFORM = 1,
|
|
VFIO_DEVICE_TYPE_CCW = 2,
|
|
VFIO_DEVICE_TYPE_AP = 3,
|
|
};
|
|
|
|
typedef struct VFIOMmap {
|
|
MemoryRegion mem;
|
|
void *mmap;
|
|
off_t offset;
|
|
size_t size;
|
|
} VFIOMmap;
|
|
|
|
typedef struct VFIORegion {
|
|
struct VFIODevice *vbasedev;
|
|
off_t fd_offset; /* offset of region within device fd */
|
|
MemoryRegion *mem; /* slow, read/write access */
|
|
size_t size;
|
|
uint32_t flags; /* VFIO region flags (rd/wr/mmap) */
|
|
uint32_t nr_mmaps;
|
|
VFIOMmap *mmaps;
|
|
uint8_t nr; /* cache the region number for debug */
|
|
} VFIORegion;
|
|
|
|
typedef struct VFIOMigration {
|
|
struct VFIODevice *vbasedev;
|
|
VMChangeStateEntry *vm_state;
|
|
Notifier migration_state;
|
|
uint32_t device_state;
|
|
int data_fd;
|
|
void *data_buffer;
|
|
size_t data_buffer_size;
|
|
uint64_t mig_flags;
|
|
uint64_t precopy_init_size;
|
|
uint64_t precopy_dirty_size;
|
|
} VFIOMigration;
|
|
|
|
typedef struct VFIOAddressSpace {
|
|
AddressSpace *as;
|
|
QLIST_HEAD(, VFIOContainer) containers;
|
|
QLIST_ENTRY(VFIOAddressSpace) list;
|
|
} VFIOAddressSpace;
|
|
|
|
struct VFIOGroup;
|
|
|
|
typedef struct VFIOContainer {
|
|
VFIOAddressSpace *space;
|
|
int fd; /* /dev/vfio/vfio, empowered by the attached groups */
|
|
MemoryListener listener;
|
|
MemoryListener prereg_listener;
|
|
unsigned iommu_type;
|
|
Error *error;
|
|
bool initialized;
|
|
bool dirty_pages_supported;
|
|
uint64_t dirty_pgsizes;
|
|
uint64_t max_dirty_bitmap_size;
|
|
unsigned long pgsizes;
|
|
unsigned int dma_max_mappings;
|
|
QLIST_HEAD(, VFIOGuestIOMMU) giommu_list;
|
|
QLIST_HEAD(, VFIOHostDMAWindow) hostwin_list;
|
|
QLIST_HEAD(, VFIOGroup) group_list;
|
|
QLIST_HEAD(, VFIORamDiscardListener) vrdl_list;
|
|
QLIST_ENTRY(VFIOContainer) next;
|
|
} VFIOContainer;
|
|
|
|
typedef struct VFIOGuestIOMMU {
|
|
VFIOContainer *container;
|
|
IOMMUMemoryRegion *iommu_mr;
|
|
hwaddr iommu_offset;
|
|
IOMMUNotifier n;
|
|
QLIST_ENTRY(VFIOGuestIOMMU) giommu_next;
|
|
} VFIOGuestIOMMU;
|
|
|
|
typedef struct VFIORamDiscardListener {
|
|
VFIOContainer *container;
|
|
MemoryRegion *mr;
|
|
hwaddr offset_within_address_space;
|
|
hwaddr size;
|
|
uint64_t granularity;
|
|
RamDiscardListener listener;
|
|
QLIST_ENTRY(VFIORamDiscardListener) next;
|
|
} VFIORamDiscardListener;
|
|
|
|
typedef struct VFIOHostDMAWindow {
|
|
hwaddr min_iova;
|
|
hwaddr max_iova;
|
|
uint64_t iova_pgsizes;
|
|
QLIST_ENTRY(VFIOHostDMAWindow) hostwin_next;
|
|
} VFIOHostDMAWindow;
|
|
|
|
typedef struct VFIODeviceOps VFIODeviceOps;
|
|
|
|
typedef struct VFIODevice {
|
|
QLIST_ENTRY(VFIODevice) next;
|
|
struct VFIOGroup *group;
|
|
char *sysfsdev;
|
|
char *name;
|
|
DeviceState *dev;
|
|
int fd;
|
|
int type;
|
|
bool reset_works;
|
|
bool needs_reset;
|
|
bool no_mmap;
|
|
bool ram_block_discard_allowed;
|
|
bool enable_migration;
|
|
VFIODeviceOps *ops;
|
|
unsigned int num_irqs;
|
|
unsigned int num_regions;
|
|
unsigned int flags;
|
|
VFIOMigration *migration;
|
|
Error *migration_blocker;
|
|
OnOffAuto pre_copy_dirty_page_tracking;
|
|
bool dirty_pages_supported;
|
|
bool dirty_tracking;
|
|
} VFIODevice;
|
|
|
|
struct VFIODeviceOps {
|
|
void (*vfio_compute_needs_reset)(VFIODevice *vdev);
|
|
int (*vfio_hot_reset_multi)(VFIODevice *vdev);
|
|
void (*vfio_eoi)(VFIODevice *vdev);
|
|
Object *(*vfio_get_object)(VFIODevice *vdev);
|
|
void (*vfio_save_config)(VFIODevice *vdev, QEMUFile *f);
|
|
int (*vfio_load_config)(VFIODevice *vdev, QEMUFile *f);
|
|
};
|
|
|
|
typedef struct VFIOGroup {
|
|
int fd;
|
|
int groupid;
|
|
VFIOContainer *container;
|
|
QLIST_HEAD(, VFIODevice) device_list;
|
|
QLIST_ENTRY(VFIOGroup) next;
|
|
QLIST_ENTRY(VFIOGroup) container_next;
|
|
bool ram_block_discard_allowed;
|
|
} VFIOGroup;
|
|
|
|
typedef struct VFIODMABuf {
|
|
QemuDmaBuf buf;
|
|
uint32_t pos_x, pos_y, pos_updates;
|
|
uint32_t hot_x, hot_y, hot_updates;
|
|
int dmabuf_id;
|
|
QTAILQ_ENTRY(VFIODMABuf) next;
|
|
} VFIODMABuf;
|
|
|
|
typedef struct VFIODisplay {
|
|
QemuConsole *con;
|
|
RAMFBState *ramfb;
|
|
struct vfio_region_info *edid_info;
|
|
struct vfio_region_gfx_edid *edid_regs;
|
|
uint8_t *edid_blob;
|
|
QEMUTimer *edid_link_timer;
|
|
struct {
|
|
VFIORegion buffer;
|
|
DisplaySurface *surface;
|
|
} region;
|
|
struct {
|
|
QTAILQ_HEAD(, VFIODMABuf) bufs;
|
|
VFIODMABuf *primary;
|
|
VFIODMABuf *cursor;
|
|
} dmabuf;
|
|
} VFIODisplay;
|
|
|
|
void vfio_put_base_device(VFIODevice *vbasedev);
|
|
void vfio_disable_irqindex(VFIODevice *vbasedev, int index);
|
|
void vfio_unmask_single_irqindex(VFIODevice *vbasedev, int index);
|
|
void vfio_mask_single_irqindex(VFIODevice *vbasedev, int index);
|
|
int vfio_set_irq_signaling(VFIODevice *vbasedev, int index, int subindex,
|
|
int action, int fd, Error **errp);
|
|
void vfio_region_write(void *opaque, hwaddr addr,
|
|
uint64_t data, unsigned size);
|
|
uint64_t vfio_region_read(void *opaque,
|
|
hwaddr addr, unsigned size);
|
|
int vfio_region_setup(Object *obj, VFIODevice *vbasedev, VFIORegion *region,
|
|
int index, const char *name);
|
|
int vfio_region_mmap(VFIORegion *region);
|
|
void vfio_region_mmaps_set_enabled(VFIORegion *region, bool enabled);
|
|
void vfio_region_unmap(VFIORegion *region);
|
|
void vfio_region_exit(VFIORegion *region);
|
|
void vfio_region_finalize(VFIORegion *region);
|
|
void vfio_reset_handler(void *opaque);
|
|
VFIOGroup *vfio_get_group(int groupid, AddressSpace *as, Error **errp);
|
|
void vfio_put_group(VFIOGroup *group);
|
|
int vfio_get_device(VFIOGroup *group, const char *name,
|
|
VFIODevice *vbasedev, Error **errp);
|
|
|
|
extern const MemoryRegionOps vfio_region_ops;
|
|
typedef QLIST_HEAD(VFIOGroupList, VFIOGroup) VFIOGroupList;
|
|
extern VFIOGroupList vfio_group_list;
|
|
|
|
bool vfio_mig_active(void);
|
|
int vfio_block_multiple_devices_migration(Error **errp);
|
|
void vfio_unblock_multiple_devices_migration(void);
|
|
int vfio_block_giommu_migration(Error **errp);
|
|
int64_t vfio_mig_bytes_transferred(void);
|
|
|
|
#ifdef CONFIG_LINUX
|
|
int vfio_get_region_info(VFIODevice *vbasedev, int index,
|
|
struct vfio_region_info **info);
|
|
int vfio_get_dev_region_info(VFIODevice *vbasedev, uint32_t type,
|
|
uint32_t subtype, struct vfio_region_info **info);
|
|
bool vfio_has_region_cap(VFIODevice *vbasedev, int region, uint16_t cap_type);
|
|
struct vfio_info_cap_header *
|
|
vfio_get_region_info_cap(struct vfio_region_info *info, uint16_t id);
|
|
bool vfio_get_info_dma_avail(struct vfio_iommu_type1_info *info,
|
|
unsigned int *avail);
|
|
struct vfio_info_cap_header *
|
|
vfio_get_device_info_cap(struct vfio_device_info *info, uint16_t id);
|
|
#endif
|
|
extern const MemoryListener vfio_prereg_listener;
|
|
|
|
int vfio_spapr_create_window(VFIOContainer *container,
|
|
MemoryRegionSection *section,
|
|
hwaddr *pgsize);
|
|
int vfio_spapr_remove_window(VFIOContainer *container,
|
|
hwaddr offset_within_address_space);
|
|
|
|
int vfio_migration_realize(VFIODevice *vbasedev, Error **errp);
|
|
void vfio_migration_exit(VFIODevice *vbasedev);
|
|
void vfio_migration_finalize(void);
|
|
|
|
#endif /* HW_VFIO_VFIO_COMMON_H */
|