- hw/arm/fsl-imx: Do not ignore Error argument - hw/net/cadence_gem.c: spelling fixes: Octects - tests/qtest: check the return value - libvhost-user: Fix VHOST_USER_GET_MAX_MEM_SLOTS reply mainline inclusion commit 69a5daec06f423843ce1bb9be5fb049314996f78 category: bugfix - io_uring: fix short read slow path mainline inclusion commit c06fc7ce147e57ab493bad9263f1601b8298484b category: bugfix - libvhost-user: Fix VHOST_USER_ADD_MEM_REG reply mainline inclusion commit 7f27d20ded2f480f3e66d03f90ea71507b834276 category: bugfix - qsd: Unlink absolute PID file path mainline inclusion commit 9d8f8233b9fa525a7e37350fbc18877051128c5d category: bugfix - net: Fix a misleading error message - vdpa: stop all svq on device deletion - vhost: release virtqueue objects in error path - vhost: fix the fd leak - virtio: i2c: Check notifier helpers for VIRTIO_CONFIG_IRQ_IDX - hw/virtio: fix typo in VIRTIO_CONFIG_IRQ_IDX comments - virtio-net: clear guest_announce feature if no cvq backend - vdpa: fix VHOST_BACKEND_F_IOTLB_ASID flag check - vdpa: do not block migration if device has cvq and x-svq=on - vdpa net: block migration if the device has CVQ - vdpa: Return -EIO if device ack is VIRTIO_NET_ERR in _load_mq() - vdpa: Return -EIO if device ack is VIRTIO_NET_ERR in _load_mac() - vdpa: fix not using CVQ buffer in case of error - vdpa: Fix possible use-after-free for VirtQueueElement - hw/virtio: fix vhost_user_read tracepoint - vhost: Fix false positive out-of-bounds - vhost: fix possible wrap in SVQ descriptor ring - vhost: move iova_tree set to vhost_svq_start - vhost: Always store new kick fd on vhost_svq_set_svq_kick_fd - virtio-crypto: verify src&dst buffer length for sym request - vdpa: commit all host notifier MRs in a single MR transaction - vdpa: harden the error path if get_iova_range failed - vdpa-dev: get iova range explicitly - virtio-pci: add support for configure interrupt - virtio-mmio: add support for configure interrupt - virtio-net: add support for configure interrupt 
- vhost: add support for configure interrupt - virtio: add support for configure interrupt - vhost-vdpa: add support for config interrupt - vhost: introduce new VhostOps vhost_set_config_call - virtio-pci: decouple the single vector from the interrupt process - virtio-pci: decouple notifier from interrupt process - virtio: introduce macro VIRTIO_CONFIG_IRQ_IDX - vdpa: do not handle VIRTIO_NET_F_GUEST_ANNOUNCE in vhost-vdpa - vdpa: handle VIRTIO_NET_CTRL_ANNOUNCE in vhost_vdpa_net_handle_ctrl_avail - vhost: fix vq dirty bitmap syncing when vIOMMU is enabled - hw/virtio: gracefully handle unset vhost_dev vdev - hw/virtio/vhost: Fix typo in comment. - vdpa: always start CVQ in SVQ mode if possible - vdpa: add shadow_data to vhost_vdpa - vdpa: store x-svq parameter in VhostVDPAState - vdpa: add asid parameter to vhost_vdpa_dma_map/unmap - vdpa: allocate SVQ array unconditionally - vdpa: move SVQ vring features check to net/ - vdpa: request iova_range only once - vdpa: add vhost_vdpa_net_valid_svq_features - vhost: allocate SVQ device file descriptors at device start - vhost: set SVQ device call handler at SVQ start - vdpa: use v->shadow_vqs_enabled in vhost_vdpa_svqs_start & stop - vhost: enable vrings in vhost_dev_start() for vhost-user devices - vhost-vdpa: fix assert !virtio_net_get_subqueue(nc)->async_tx.elem in virtio_net_reset - net/vhost-vdpa.c: Fix clang compilation failure - vhost-vdpa: allow passing opened vhostfd to vhost-vdpa - vdpa: Remove shadow CVQ command check - vdpa: Delete duplicated vdpa_feature_bits entry - hw/virtio: add some vhost-user trace events - vdpa: Allow MQ feature in SVQ - virtio-net: Update virtio-net curr_queue_pairs in vdpa backends - vdpa: validate MQ CVQ commands - vdpa: Add vhost_vdpa_net_load_mq - vdpa: extract vhost_vdpa_net_load_mac from vhost_vdpa_net_load - vdpa: Make VhostVDPAState cvq_cmd_in_buffer control ack type - vdpa: Delete CVQ migration blocker - vdpa: Add virtio-net mac address via CVQ at start - vhost_net: add 
NetClientState->load() callback - vdpa: extract vhost_vdpa_net_cvq_add from vhost_vdpa_net_handle_ctrl_avail - vdpa: Move command buffers map to start of net device - vdpa: add net_vhost_vdpa_cvq_info NetClientInfo - vhost_net: Add NetClientInfo stop callback - vhost_net: Add NetClientInfo start callback - vdpa: Use ring hwaddr at vhost_vdpa_svq_unmap_ring - vdpa: Make SVQ vring unmapping return void - vdpa: Remove SVQ vring from iova_tree at shutdown - util: accept iova_tree_remove_parameter by value - vdpa: do not save failed dma maps in SVQ iova tree - vdpa: Skip the maps not in the iova tree - vdpa: Fix file descriptor leak on get features error - vdpa: Fix memory listener deletions of iova tree - vhost: Get vring base from vq, not svq - vdpa: Add x-svq to NetdevVhostVDPAOptions - vdpa: Add device migration blocker - vdpa: Extract get features part from vhost_vdpa_get_max_queue_pairs - vdpa: Buffer CVQ support on shadow virtqueue - vdpa: manual forward CVQ buffers - vdpa: Export vhost_vdpa_dma_map and unmap calls - vhost: Add svq avail_handler callback - vhost: add vhost_svq_poll - vhost: Expose vhost_svq_add - vhost: add vhost_svq_push_elem - vhost: Track number of descs in SVQDescState - vhost: Add SVQDescState - vhost: Decouple vhost_svq_add from VirtQueueElement - vhost: Check for queue full at vhost_svq_add - vhost: Move vhost_svq_kick call to vhost_svq_add - vhost: Reorder vhost_svq_kick - vdpa: Avoid compiler to squash reads to used idx - virtio-net: Expose ctrl virtqueue logic - virtio-net: Expose MAC_TABLE_ENTRIES - vhost: move descriptor translation to vhost_svq_vring_write_descs - util: Return void on iova_tree_remove - virtio-net: don't handle mq request in userspace handler for vhost-vdpa - vhost-vdpa: change name and polarity for vhost_vdpa_one_time_request() - vhost-vdpa: backend feature should set only once - vhost-vdpa: fix improper cleanup in net_init_vhost_vdpa - virtio-net: align ctrl_vq index for non-mq guest for vhost_vdpa - virtio: add 
vhost support for virtio devices - include/hw: start documenting the vhost API - hw/virtio: add vhost_user_[read|write] trace points - vhost: Fix element in vhost_svq_add failure - vdpa: Fix index calculus at vhost_vdpa_svqs_start - vdpa: Fix bad index calculus at vhost_vdpa_get_vring_base - vhost: Fix device's used descriptor dequeue - vhost: Track descriptor chain in private at SVQ - vdpa: Add missing tracing to batch mapping functions - vhost-vdpa: fix typo in a comment - virtio: fix --enable-vhost-user build on non-Linux - vdpa: Expose VHOST_F_LOG_ALL on SVQ - vdpa: Never set log_base addr if SVQ is enabled - vdpa: Adapt vhost_vdpa_get_vring_base to SVQ - vdpa: Add custom IOTLB translations to SVQ - vhost: Add VhostIOVATree - util: add iova_tree_find_iova - util: Add iova_tree_alloc_map - vhost: Shadow virtqueue buffers forwarding - vdpa: adapt vhost_ops callbacks to svq - virtio: Add vhost_svq_get_vring_addr - vhost: Add vhost_svq_valid_features to shadow vq - vhost: Add Shadow VirtQueue call forwarding capabilities - vhost: Add Shadow VirtQueue kick forwarding capabilities - vhost: Add VhostShadowVirtqueue - vdpa: Make ncs autofree - Revert "virtio: introduce macro IRTIO_CONFIG_IRQ_IDX" - Revert "virtio-pci: decouple notifier from interrupt process" - Revert "virtio-pci: decouple the single vector from the interrupt process" - Revert "vhost-vdpa: add support for config interrupt" - Revert "virtio: add support for configure interrupt" - Revert "vhost: add support for configure interrupt" - Revert "virtio-net: add support for configure interrupt" - Revert "virtio-mmio: add support for configure interrupt" - Revert "virtio-pci: add support for configure interrupt" - Revert "vhost: introduce new VhostOps vhost_set_config_call" - virtio: signal after wrapping packed used_idx - target/i386: Adjust feature level according to FEAT_7_1_EDX - target/i386: Add new CPU model GraniteRapids - target/i386: Add support for PREFETCHIT0/1 in CPUID enumeration - target/i386: 
Add support for AVX-NE-CONVERT in CPUID enumeration - target/i386: Add support for AVX-VNNI-INT8 in CPUID enumeration - target/i386: Add support for AVX-IFMA in CPUID enumeration - target/i386: Add support for AMX-FP16 in CPUID enumeration - target/i386: Add support for CMPCCXADD in CPUID enumeration - tracetool: avoid invalid escape in Python string - hw/pvrdma: Protect against buggy or malicious guest driver - vga: avoid crash if no default vga card mainline inclusion commit 6985d8ede92494f3b791de01e8ee9306eb6d5e4a category: bugfix - qom/object: Remove circular include dependency mainline inclusion commit 5bba9bcfbb42e7c016626420e148a1bf1b080835 category: bugfix - artist: set memory region owners for buffers to the artist device mainline inclusion commit 39fbaeca096a9bf6cbe2af88572c1cb2aa62aa8c category: bugfix - virtio-iommu: Fix the partial copy of probe request mainline inclusion commit 45461aace83d961e933b27519b81d17b4c690514 category: bugfix - e1000: set RX descriptor status in a separate operation mainline inclusion commit 034d00d4858161e1d4cff82d8d230bce874a04d3 category: bugfix - vhost: introduce new VhostOps vhost_set_config_call - vhost: stick to -errno error return convention - vhost-user: stick to -errno error return convention - vhost-vdpa: stick to -errno error return convention - virtio-pci: add support for configure interrupt - virtio-mmio: add support for configure interrupt - virtio-net: add support for configure interrupt - vhost: add support for configure interrupt - virtio: add support for configure interrupt - vhost-vdpa: add support for config interrupt - virtio-pci: decouple the single vector from the interrupt process - virtio-pci: decouple notifier from interrupt process - virtio: introduce macro IRTIO_CONFIG_IRQ_IDX - pci: Fix the update of interrupt disable bit in PCI_COMMAND register - hw/timer/npcm7xx_timer: Prevent timer from counting down past zero - tpm_crb: mark command buffer as dirty on request completion mainline inclusion 
commit e37a0ef4605e5d2041785ff3fc89ca6021faf7a0 category: bugfix - pci: fix overflow in snprintf string formatting mainline inclusion commit 36f18c6989a3d1ff1d7a0e50b0868ef3958299b4 category: bugfix - hw/usb/hcd-ehci: fix writeback order mainline inclusion commit f471e8b060798f26a7fc339c6152f82f22a7b33d category: bugfix - qemu-timer: Skip empty timer lists before locking in qemu_clock_deadline_ns_all mainline inclusion commit 3f42906c9ab2c777a895b48b87b8107167e4a275 category: bugfix - semihosting/config: Merge --semihosting-config option groups mainline inclusion commit 90c072e063737e9e8f431489bbd334452f89056e category: bugfix - semihosting: fix memleak at semihosting_arg_fallback - target/i386: Export GDS_NO bit to guests Signed-off-by: Jiabo Feng <fengjiabo1@huawei.com>
225 lines
7.7 KiB
Diff
225 lines
7.7 KiB
Diff
From e2e9aeaacdb28b6c2a1bfcfef09113dc9b26a420 Mon Sep 17 00:00:00 2001
|
|
From: =?UTF-8?q?Eugenio=20P=C3=A9rez?= <eperezma@redhat.com>
|
|
Date: Thu, 15 Dec 2022 12:31:44 +0100
|
|
Subject: [PATCH] vdpa: always start CVQ in SVQ mode if possible
|
|
MIME-Version: 1.0
|
|
Content-Type: text/plain; charset=UTF-8
|
|
Content-Transfer-Encoding: 8bit
|
|
|
|
Isolate the control virtqueue in its own group, which allows intercepting control
|
|
commands while letting the dataplane run in full passthrough to the guest.
|
|
|
|
Signed-off-by: Eugenio Pérez <eperezma@redhat.com>
|
|
Message-Id: <20221215113144.322011-13-eperezma@redhat.com>
|
|
Reviewed-by: Michael S. Tsirkin <mst@redhat.com>
|
|
Signed-off-by: Michael S. Tsirkin <mst@redhat.com>
|
|
Acked-by: Jason Wang <jasowang@redhat.com>
|
|
Signed-off-by: fangyi <eric.fangyi@huawei.com>
|
|
---
|
|
hw/virtio/vhost-vdpa.c | 3 +-
|
|
include/standard-headers/linux/vhost_types.h | 5 +
|
|
linux-headers/linux/vhost.h | 14 +++
|
|
net/vhost-vdpa.c | 110 ++++++++++++++++++-
|
|
4 files changed, 130 insertions(+), 2 deletions(-)
|
|
|
|
diff --git a/hw/virtio/vhost-vdpa.c b/hw/virtio/vhost-vdpa.c
|
|
index 6d0d85b733..8b44f5a7b8 100644
|
|
--- a/hw/virtio/vhost-vdpa.c
|
|
+++ b/hw/virtio/vhost-vdpa.c
|
|
@@ -641,7 +641,8 @@ static int vhost_vdpa_set_backend_cap(struct vhost_dev *dev)
|
|
{
|
|
uint64_t features;
|
|
uint64_t f = 0x1ULL << VHOST_BACKEND_F_IOTLB_MSG_V2 |
|
|
- 0x1ULL << VHOST_BACKEND_F_IOTLB_BATCH;
|
|
+ 0x1ULL << VHOST_BACKEND_F_IOTLB_BATCH |
|
|
+ 0x1ULL << VHOST_BACKEND_F_IOTLB_ASID;
|
|
int r;
|
|
|
|
if (vhost_vdpa_call(dev, VHOST_GET_BACKEND_FEATURES, &features)) {
|
|
diff --git a/include/standard-headers/linux/vhost_types.h b/include/standard-headers/linux/vhost_types.h
|
|
index fa267e39d4..17833e320e 100644
|
|
--- a/include/standard-headers/linux/vhost_types.h
|
|
+++ b/include/standard-headers/linux/vhost_types.h
|
|
@@ -153,4 +153,9 @@ struct vhost_vdpa_iova_range {
|
|
/* vhost-net should add virtio_net_hdr for RX, and strip for TX packets. */
|
|
#define VHOST_NET_F_VIRTIO_NET_HDR 27
|
|
|
|
+/* IOTLB can accept address space identifier through V2 type of IOTLB
|
|
+ * message
|
|
+ */
|
|
+#define VHOST_BACKEND_F_IOTLB_ASID 0x3
|
|
+
|
|
#endif
|
|
diff --git a/linux-headers/linux/vhost.h b/linux-headers/linux/vhost.h
|
|
index 5d99e7c242..b6ded7f831 100644
|
|
--- a/linux-headers/linux/vhost.h
|
|
+++ b/linux-headers/linux/vhost.h
|
|
@@ -157,4 +157,18 @@
|
|
/* Get the count of all virtqueues */
|
|
#define VHOST_VDPA_GET_VQS_COUNT _IOR(VHOST_VIRTIO, 0x80, __u32)
|
|
|
|
+/* Get the group for a virtqueue: read index, write group in num,
|
|
+ * The virtqueue index is stored in the index field of
|
|
+ * vhost_vring_state. The group for this specific virtqueue is
|
|
+ * returned via num field of vhost_vring_state.
|
|
+ */
|
|
+#define VHOST_VDPA_GET_VRING_GROUP _IOWR(VHOST_VIRTIO, 0x7B, \
|
|
+ struct vhost_vring_state)
|
|
+/* Set the ASID for a virtqueue group. The group index is stored in
|
|
+ * the index field of vhost_vring_state, the ASID associated with this
|
|
+ * group is stored at num field of vhost_vring_state.
|
|
+ */
|
|
+#define VHOST_VDPA_SET_GROUP_ASID _IOW(VHOST_VIRTIO, 0x7C, \
|
|
+ struct vhost_vring_state)
|
|
+
|
|
#endif
|
|
diff --git a/net/vhost-vdpa.c b/net/vhost-vdpa.c
|
|
index 21fb89bb6b..24c4c2ef51 100644
|
|
--- a/net/vhost-vdpa.c
|
|
+++ b/net/vhost-vdpa.c
|
|
@@ -100,6 +100,8 @@ static const uint64_t vdpa_svq_device_features =
|
|
BIT_ULL(VIRTIO_NET_F_RSC_EXT) |
|
|
BIT_ULL(VIRTIO_NET_F_STANDBY);
|
|
|
|
+#define VHOST_VDPA_NET_CVQ_ASID 1
|
|
+
|
|
VHostNetState *vhost_vdpa_get_vhost_net(NetClientState *nc)
|
|
{
|
|
VhostVDPAState *s = DO_UPCAST(VhostVDPAState, nc, nc);
|
|
@@ -250,6 +252,40 @@ static NetClientInfo net_vhost_vdpa_info = {
|
|
.check_peer_type = vhost_vdpa_check_peer_type,
|
|
};
|
|
|
|
+static int64_t vhost_vdpa_get_vring_group(int device_fd, unsigned vq_index)
|
|
+{
|
|
+ struct vhost_vring_state state = {
|
|
+ .index = vq_index,
|
|
+ };
|
|
+ int r = ioctl(device_fd, VHOST_VDPA_GET_VRING_GROUP, &state);
|
|
+
|
|
+ if (unlikely(r < 0)) {
|
|
+ error_report("Cannot get VQ %u group: %s", vq_index,
|
|
+ g_strerror(errno));
|
|
+ return r;
|
|
+ }
|
|
+
|
|
+ return state.num;
|
|
+}
|
|
+
|
|
+static int vhost_vdpa_set_address_space_id(struct vhost_vdpa *v,
|
|
+ unsigned vq_group,
|
|
+ unsigned asid_num)
|
|
+{
|
|
+ struct vhost_vring_state asid = {
|
|
+ .index = vq_group,
|
|
+ .num = asid_num,
|
|
+ };
|
|
+ int r;
|
|
+
|
|
+ r = ioctl(v->device_fd, VHOST_VDPA_SET_GROUP_ASID, &asid);
|
|
+ if (unlikely(r < 0)) {
|
|
+ error_report("Can't set vq group %u asid %u, errno=%d (%s)",
|
|
+ asid.index, asid.num, errno, g_strerror(errno));
|
|
+ }
|
|
+ return r;
|
|
+}
|
|
+
|
|
static void vhost_vdpa_cvq_unmap_buf(struct vhost_vdpa *v, void *addr)
|
|
{
|
|
VhostIOVATree *tree = v->iova_tree;
|
|
@@ -324,11 +360,75 @@ dma_map_err:
|
|
static int vhost_vdpa_net_cvq_start(NetClientState *nc)
|
|
{
|
|
VhostVDPAState *s;
|
|
- int r;
|
|
+ struct vhost_vdpa *v;
|
|
+ uint64_t backend_features;
|
|
+ int64_t cvq_group;
|
|
+ int cvq_index, r;
|
|
|
|
assert(nc->info->type == NET_CLIENT_DRIVER_VHOST_VDPA);
|
|
|
|
s = DO_UPCAST(VhostVDPAState, nc, nc);
|
|
+ v = &s->vhost_vdpa;
|
|
+
|
|
+ v->shadow_data = s->always_svq;
|
|
+ v->shadow_vqs_enabled = s->always_svq;
|
|
+ s->vhost_vdpa.address_space_id = VHOST_VDPA_GUEST_PA_ASID;
|
|
+
|
|
+ if (s->always_svq) {
|
|
+ /* SVQ is already configured for all virtqueues */
|
|
+ goto out;
|
|
+ }
|
|
+
|
|
+ /*
|
|
+ * If we early return in these cases SVQ will not be enabled. The migration
|
|
+ * will be blocked as long as vhost-vdpa backends do not offer _F_LOG.
|
|
+ *
|
|
+ * Calling VHOST_GET_BACKEND_FEATURES as they are not available in v->dev
|
|
+ * yet.
|
|
+ */
|
|
+ r = ioctl(v->device_fd, VHOST_GET_BACKEND_FEATURES, &backend_features);
|
|
+ if (unlikely(r < 0)) {
|
|
+ error_report("Cannot get vdpa backend_features: %s(%d)",
|
|
+ g_strerror(errno), errno);
|
|
+ return -1;
|
|
+ }
|
|
+ if (!(backend_features & VHOST_BACKEND_F_IOTLB_ASID) ||
|
|
+ !vhost_vdpa_net_valid_svq_features(v->dev->features, NULL)) {
|
|
+ return 0;
|
|
+ }
|
|
+
|
|
+ /*
|
|
+ * Check if all the virtqueues of the virtio device are in a different vq
|
|
+ * group than the last vq. The VQ group of the last vq is kept in cvq_group.
|
|
+ */
|
|
+ cvq_index = v->dev->vq_index_end - 1;
|
|
+ cvq_group = vhost_vdpa_get_vring_group(v->device_fd, cvq_index);
|
|
+ if (unlikely(cvq_group < 0)) {
|
|
+ return cvq_group;
|
|
+ }
|
|
+ for (int i = 0; i < cvq_index; ++i) {
|
|
+ int64_t group = vhost_vdpa_get_vring_group(v->device_fd, i);
|
|
+
|
|
+ if (unlikely(group < 0)) {
|
|
+ return group;
|
|
+ }
|
|
+
|
|
+ if (group == cvq_group) {
|
|
+ return 0;
|
|
+ }
|
|
+ }
|
|
+
|
|
+ r = vhost_vdpa_set_address_space_id(v, cvq_group, VHOST_VDPA_NET_CVQ_ASID);
|
|
+ if (unlikely(r < 0)) {
|
|
+ return r;
|
|
+ }
|
|
+
|
|
+ v->iova_tree = vhost_iova_tree_new(v->iova_range.first,
|
|
+ v->iova_range.last);
|
|
+ v->shadow_vqs_enabled = true;
|
|
+ s->vhost_vdpa.address_space_id = VHOST_VDPA_NET_CVQ_ASID;
|
|
+
|
|
+out:
|
|
if (!s->vhost_vdpa.shadow_vqs_enabled) {
|
|
return 0;
|
|
}
|
|
@@ -357,6 +457,14 @@ static void vhost_vdpa_net_cvq_stop(NetClientState *nc)
|
|
if (s->vhost_vdpa.shadow_vqs_enabled) {
|
|
vhost_vdpa_cvq_unmap_buf(&s->vhost_vdpa, s->cvq_cmd_out_buffer);
|
|
vhost_vdpa_cvq_unmap_buf(&s->vhost_vdpa, s->status);
|
|
+ if (!s->always_svq) {
|
|
+ /*
|
|
+ * If only the CVQ is shadowed we can delete this safely.
|
|
+ * If all the VQs are shadowed this will be needed by the time the
|
|
+ * device is started again to register SVQ vrings and similar.
|
|
+ */
|
|
+ g_clear_pointer(&s->vhost_vdpa.iova_tree, vhost_iova_tree_delete);
|
|
+ }
|
|
}
|
|
}
|
|
|
|
--
|
|
2.27.0
|
|
|