From: "Eugenio Pérez" <eperezma@redhat.com>
To: qemu-devel@nongnu.org
Cc: kvm@vger.kernel.org, "Michael S. Tsirkin" <mst@redhat.com>,
Jason Wang <jasowang@redhat.com>,
Daniel Daly <dandaly0@gmail.com>,
virtualization@lists.linux-foundation.org,
Liran Alon <liralon@gmail.com>, Eli Cohen <eli@mellanox.com>,
Nitin Shrivastav <nitin.shrivastav@broadcom.com>,
Alex Barba <alex.barba@broadcom.com>,
Christophe Fontaine <cfontain@redhat.com>,
Juan Quintela <quintela@redhat.com>,
Lee Ballard <ballle98@gmail.com>,
Lars Ganrot <lars.ganrot@gmail.com>,
Rob Miller <rob.miller@broadcom.com>,
Stefano Garzarella <sgarzare@redhat.com>,
Howard Cai <howard.cai@gmail.com>,
Parav Pandit <parav@mellanox.com>, vm <vmireyno@marvell.com>,
Salil Mehta <mehta.salil.lnk@gmail.com>,
Stephen Finucane <stephenfin@redhat.com>,
Xiao W Wang <xiao.w.wang@intel.com>,
Sean Mooney <smooney@redhat.com>,
Stefan Hajnoczi <stefanha@redhat.com>,
Jim Harford <jim.harford@broadcom.com>,
Dmytro Kazantsev <dmytro.kazantsev@gmail.com>,
Siwei Liu <loseweigh@gmail.com>,
Harpreet Singh Anand <hanand@xilinx.com>,
Michael Lilja <ml@napatech.com>, Max Gurtovoy <maxgu14@gmail.com>
Subject: [RFC PATCH 13/27] vhost: Send buffers to device
Date: Fri, 20 Nov 2020 19:50:51 +0100 [thread overview]
Message-ID: <20201120185105.279030-14-eperezma@redhat.com> (raw)
In-Reply-To: <20201120185105.279030-1-eperezma@redhat.com>
Signed-off-by: Eugenio Pérez <eperezma@redhat.com>
---
hw/virtio/vhost-sw-lm-ring.h | 3 +
hw/virtio/vhost-sw-lm-ring.c | 134 +++++++++++++++++++++++++++++++++--
hw/virtio/vhost.c | 59 ++++++++++++++-
3 files changed, 189 insertions(+), 7 deletions(-)
diff --git a/hw/virtio/vhost-sw-lm-ring.h b/hw/virtio/vhost-sw-lm-ring.h
index 86dc081b93..29d21feaf4 100644
--- a/hw/virtio/vhost-sw-lm-ring.h
+++ b/hw/virtio/vhost-sw-lm-ring.h
@@ -18,6 +18,9 @@
typedef struct VhostShadowVirtqueue VhostShadowVirtqueue;
bool vhost_vring_kick(VhostShadowVirtqueue *vq);
+int vhost_vring_add(VhostShadowVirtqueue *vq, VirtQueueElement *elem);
+void vhost_vring_write_addr(const VhostShadowVirtqueue *vq,
+ struct vhost_vring_addr *addr);
VhostShadowVirtqueue *vhost_sw_lm_shadow_vq(struct vhost_dev *dev, int idx);
diff --git a/hw/virtio/vhost-sw-lm-ring.c b/hw/virtio/vhost-sw-lm-ring.c
index cd7b5ba772..aed005c2d9 100644
--- a/hw/virtio/vhost-sw-lm-ring.c
+++ b/hw/virtio/vhost-sw-lm-ring.c
@@ -9,6 +9,7 @@
#include "hw/virtio/vhost-sw-lm-ring.h"
#include "hw/virtio/vhost.h"
+#include "hw/virtio/virtio-access.h"
#include "standard-headers/linux/vhost_types.h"
#include "standard-headers/linux/virtio_ring.h"
@@ -19,21 +20,140 @@ typedef struct VhostShadowVirtqueue {
struct vring vring;
EventNotifier hdev_notifier;
VirtQueue *vq;
+ VirtIODevice *vdev;
+
+ /* Map for returning guest's descriptors */
+ VirtQueueElement **ring_id_maps;
+
+ /* Next head to expose to device */
+ uint16_t avail_idx_shadow;
+
+ /* Number of descriptors added since last notification */
+ uint16_t num_added;
+
+ /* Next free descriptor */
+ uint16_t free_head;
vring_desc_t descs[];
} VhostShadowVirtqueue;
-static inline bool vhost_vring_should_kick(VhostShadowVirtqueue *vq)
+static bool vhost_vring_should_kick_rcu(VhostShadowVirtqueue *vq)
{
- return virtio_queue_get_used_notify_split(vq->vq);
+ VirtIODevice *vdev = vq->vdev;
+ vq->num_added = 0;
+
+ smp_rmb();
+ return !(vq->vring.used->flags
+ & virtio_tswap16(vdev, VRING_USED_F_NO_NOTIFY));
}
+static bool vhost_vring_should_kick(VhostShadowVirtqueue *vq)
+{
+ RCU_READ_LOCK_GUARD(); /* presumably held until this function returns */
+ return vhost_vring_should_kick_rcu(vq); /* note: also resets vq->num_added */
+}
+
+
bool vhost_vring_kick(VhostShadowVirtqueue *vq)
{
return vhost_vring_should_kick(vq) ? event_notifier_set(&vq->hdev_notifier)
: true;
}
+/*
+ * Fill shadow vring descriptors from an iovec array, walking the free list.
+ *
+ * @vq: shadow virtqueue whose descriptor table is written
+ * @iovec: buffers to describe; iov_base is stored as the descriptor address
+ * @num: number of entries in @iovec; nothing is written when it is 0
+ * @more_descs: true if the caller chains further descriptors after these, so
+ *              the last one written here also gets VRING_DESC_F_NEXT
+ * @write: true to flag every descriptor with VRING_DESC_F_WRITE
+ *
+ * Writing starts at vq->free_head; on return vq->free_head is the "next"
+ * field of the last descriptor written.
+ */
+static void vhost_vring_write_descs(VhostShadowVirtqueue *vq,
+                                    const struct iovec *iovec,
+                                    size_t num, bool more_descs, bool write)
+{
+    uint16_t i = vq->free_head, last = vq->free_head;
+    size_t n;
+    const VirtIODevice *vdev = vq->vdev;
+    uint16_t flags = write ? virtio_tswap16(vdev, VRING_DESC_F_WRITE) : 0;
+    vring_desc_t *descs = vq->vring.desc;
+
+    if (num == 0) {
+        return;
+    }
+
+    for (n = 0; n < num; n++) {
+        if (more_descs || (n + 1 < num)) {
+            descs[i].flags = flags | virtio_tswap16(vdev, VRING_DESC_F_NEXT);
+        } else {
+            descs[i].flags = flags;
+        }
+        /* Cast through uintptr_t: pointer and hwaddr widths may differ */
+        descs[i].addr = virtio_tswap64(vdev,
+                                       (hwaddr)(uintptr_t)iovec[n].iov_base);
+        descs[i].len = virtio_tswap32(vdev, iovec[n].iov_len);
+
+        last = i;
+        i = virtio_tswap16(vdev, descs[i].next);
+    }
+
+    vq->free_head = virtio_tswap16(vdev, descs[last].next);
+}
+
+/* vhost_vring_add_split:
+ * @vq: The #VhostShadowVirtqueue
+ * @elem: The #VirtQueueElement
+ *
+ * Add an avail element to the shadow split vring.
+ *
+ * The out_sg buffers are written first, then the in_sg buffers flagged as
+ * writable. Returns the index of the head descriptor used for @elem.
+ */
+static int vhost_vring_add_split(VhostShadowVirtqueue *vq,
+ const VirtQueueElement *elem)
+{
+ int head;
+ unsigned avail_idx;
+ const VirtIODevice *vdev;
+ vring_avail_t *avail;
+
+ RCU_READ_LOCK_GUARD();
+ vdev = vq->vdev;
+ avail = vq->vring.avail;
+
+ head = vq->free_head;
+
+ /* We need some descriptors here */
+ assert(elem->out_num || elem->in_num);
+
+ vhost_vring_write_descs(vq, elem->out_sg, elem->out_num,
+ elem->in_num > 0, false);
+ vhost_vring_write_descs(vq, elem->in_sg, elem->in_num, false, true);
+
+ /* Put entry in available array; avail->idx itself is only updated after
+ * the write barrier below. */
+ avail_idx = vq->avail_idx_shadow & (vq->vring.num - 1);
+ avail->ring[avail_idx] = virtio_tswap16(vdev, head);
+ vq->avail_idx_shadow++;
+
+ /* Expose descriptors to device */
+ smp_wmb();
+ avail->idx = virtio_tswap16(vdev, vq->avail_idx_shadow);
+
+ /* Theoretically possible: num_added is about to wrap. Kick just in case */
+ if (unlikely(vq->num_added++ == (uint16_t)-1)) {
+ vhost_vring_kick(vq);
+ }
+
+ return head;
+}
+
+/*
+ * Expose @elem to the device through the shadow vring and record it in
+ * vq->ring_id_maps under the head descriptor index that was used.
+ *
+ * Any element previously stored in that slot is freed. Always returns 0.
+ */
+int vhost_vring_add(VhostShadowVirtqueue *vq, VirtQueueElement *elem)
+{
+    int host_head = vhost_vring_add_split(vq, elem);
+
+    /* g_free() accepts NULL, so an empty slot needs no special casing */
+    g_free(vq->ring_id_maps[host_head]);
+    vq->ring_id_maps[host_head] = elem;
+    return 0;
+}
+
+/*
+ * Store the addresses of the shadow vring's descriptor table, avail ring and
+ * used ring into the matching *_user_addr fields of @addr. No other field
+ * of @addr is written.
+ */
+void vhost_vring_write_addr(const VhostShadowVirtqueue *vq,
+                            struct vhost_vring_addr *addr)
+{
+    /* Cast through uintptr_t: pointers may be narrower than 64 bits */
+    addr->desc_user_addr = (uint64_t)(uintptr_t)vq->vring.desc;
+    addr->avail_user_addr = (uint64_t)(uintptr_t)vq->vring.avail;
+    addr->used_user_addr = (uint64_t)(uintptr_t)vq->vring.used;
+}
+
VhostShadowVirtqueue *vhost_sw_lm_shadow_vq(struct vhost_dev *dev, int idx)
{
struct vhost_vring_file file = {
@@ -43,9 +163,11 @@ VhostShadowVirtqueue *vhost_sw_lm_shadow_vq(struct vhost_dev *dev, int idx)
unsigned num = virtio_queue_get_num(dev->vdev, idx);
size_t ring_size = vring_size(num, VRING_DESC_ALIGN_SIZE);
VhostShadowVirtqueue *svq;
- int r;
+ int r, i;
svq = g_malloc0(sizeof(*svq) + ring_size);
+ svq->ring_id_maps = g_new0(VirtQueueElement *, num);
+ svq->vdev = dev->vdev;
svq->vq = vq;
r = event_notifier_init(&svq->hdev_notifier, 0);
@@ -55,8 +177,9 @@ VhostShadowVirtqueue *vhost_sw_lm_shadow_vq(struct vhost_dev *dev, int idx)
r = dev->vhost_ops->vhost_set_vring_kick(dev, &file);
assert(r == 0);
- vhost_virtqueue_mask(dev, dev->vdev, idx, true);
- vhost_virtqueue_pending(dev, idx);
+ vring_init(&svq->vring, num, svq->descs, VRING_DESC_ALIGN_SIZE);
+ for (i = 0; i < num - 1; i++)
+ svq->descs[i].next = virtio_tswap16(dev->vdev, i + 1);
return svq;
}
@@ -64,5 +187,6 @@ VhostShadowVirtqueue *vhost_sw_lm_shadow_vq(struct vhost_dev *dev, int idx)
void vhost_sw_lm_shadow_vq_free(VhostShadowVirtqueue *vq)
{
event_notifier_cleanup(&vq->hdev_notifier);
+ g_free(vq->ring_id_maps);
g_free(vq);
}
diff --git a/hw/virtio/vhost.c b/hw/virtio/vhost.c
index 9352c56bfa..304e0baa61 100644
--- a/hw/virtio/vhost.c
+++ b/hw/virtio/vhost.c
@@ -956,8 +956,34 @@ static void handle_sw_lm_vq(VirtIODevice *vdev, VirtQueue *vq)
uint16_t idx = virtio_get_queue_index(vq);
VhostShadowVirtqueue *svq = hdev->sw_lm_shadow_vq[idx];
+ VirtQueueElement *elem;
- vhost_vring_kick(svq);
+ /*
+ * Make as many buffers as possible available to the device.
+ */
+ do {
+ if (virtio_queue_get_notification(vq)) {
+ virtio_queue_set_notification(vq, false);
+ }
+
+ while (true) {
+ int r;
+ if (virtio_queue_full(vq)) {
+ break;
+ }
+
+ elem = virtqueue_pop(vq, sizeof(*elem));
+ if (!elem) {
+ break;
+ }
+
+ r = vhost_vring_add(svq, elem);
+ assert(r >= 0);
+ vhost_vring_kick(svq);
+ }
+
+ virtio_queue_set_notification(vq, true);
+ } while(!virtio_queue_empty(vq));
}
static void vhost_handle_call(EventNotifier *n)
@@ -975,6 +1001,11 @@ static void vhost_handle_call(EventNotifier *n)
}
}
+static void vhost_virtqueue_stop(struct vhost_dev *dev,
+ struct VirtIODevice *vdev,
+ struct vhost_virtqueue *vq,
+ unsigned idx);
+
static int vhost_sw_live_migration_stop(struct vhost_dev *dev)
{
int idx;
@@ -991,17 +1022,41 @@ static int vhost_sw_live_migration_stop(struct vhost_dev *dev)
static int vhost_sw_live_migration_start(struct vhost_dev *dev)
{
- int idx;
+ int idx, r;
+
+ assert(dev->vhost_ops->vhost_set_vring_enable);
+ dev->vhost_ops->vhost_set_vring_enable(dev, false);
for (idx = 0; idx < dev->nvqs; ++idx) {
struct vhost_virtqueue *vq = &dev->vqs[idx];
+ struct vhost_vring_addr addr = {
+ .index = idx,
+ };
+ struct vhost_vring_state s = {
+ .index = idx,
+ };
+
+ vhost_virtqueue_stop(dev, dev->vdev, &dev->vqs[idx], idx);
dev->sw_lm_shadow_vq[idx] = vhost_sw_lm_shadow_vq(dev, idx);
event_notifier_set_handler(&vq->masked_notifier, vhost_handle_call);
+
+ vhost_vring_write_addr(dev->sw_lm_shadow_vq[idx], &addr);
+ r = dev->vhost_ops->vhost_set_vring_addr(dev, &addr);
+ assert(r == 0);
+
+ r = dev->vhost_ops->vhost_set_vring_base(dev, &s);
+ assert(r == 0);
}
+ dev->vhost_ops->vhost_set_vring_enable(dev, true);
vhost_dev_disable_notifiers(dev, dev->vdev);
+ for (idx = 0; idx < dev->nvqs; ++idx) {
+ vhost_virtqueue_mask(dev, dev->vdev, idx, true);
+ vhost_virtqueue_pending(dev, idx);
+ }
+
return 0;
}
--
2.18.4
next prev parent reply other threads:[~2020-11-20 19:02 UTC|newest]
Thread overview: 81+ messages / expand[flat|nested] mbox.gz Atom feed top
2020-11-20 18:50 [RFC PATCH 00/27] vDPA software assisted live migration Eugenio Pérez
2020-11-20 18:50 ` [RFC PATCH 01/27] vhost: Add vhost_dev_can_log Eugenio Pérez
2020-11-20 18:50 ` [RFC PATCH 02/27] vhost: Add device callback in vhost_migration_log Eugenio Pérez
2020-12-07 16:19 ` Stefan Hajnoczi
2020-12-09 12:20 ` Eugenio Perez Martin
2020-11-20 18:50 ` [RFC PATCH 03/27] vhost: Move log resize/put to vhost_dev_set_log Eugenio Pérez
2020-11-20 18:50 ` [RFC PATCH 04/27] vhost: add vhost_kernel_set_vring_enable Eugenio Pérez
2020-12-07 16:43 ` Stefan Hajnoczi
2020-12-09 12:00 ` Eugenio Perez Martin
2020-12-09 16:08 ` Stefan Hajnoczi
2020-11-20 18:50 ` [RFC PATCH 05/27] vhost: Add hdev->dev.sw_lm_vq_handler Eugenio Pérez
2020-12-07 16:52 ` Stefan Hajnoczi
2020-12-09 15:02 ` Eugenio Perez Martin
2020-12-10 11:30 ` Stefan Hajnoczi
2020-11-20 18:50 ` [RFC PATCH 06/27] virtio: Add virtio_queue_get_used_notify_split Eugenio Pérez
2020-12-07 16:58 ` Stefan Hajnoczi
2021-01-12 18:21 ` Eugenio Perez Martin
2021-03-02 11:22 ` Stefan Hajnoczi
2021-03-02 18:34 ` Eugenio Perez Martin
2021-03-08 10:46 ` Stefan Hajnoczi
2020-11-20 18:50 ` [RFC PATCH 07/27] vhost: Route guest->host notification through qemu Eugenio Pérez
2020-12-07 17:42 ` Stefan Hajnoczi
2020-12-09 17:08 ` Eugenio Perez Martin
2020-12-10 11:50 ` Stefan Hajnoczi
2021-01-21 20:10 ` Eugenio Perez Martin
2020-11-20 18:50 ` [RFC PATCH 08/27] vhost: Add a flag for software assisted Live Migration Eugenio Pérez
2020-12-08 7:20 ` Stefan Hajnoczi
2020-12-09 17:57 ` Eugenio Perez Martin
2020-11-20 18:50 ` [RFC PATCH 09/27] vhost: Route host->guest notification through qemu Eugenio Pérez
2020-12-08 7:34 ` Stefan Hajnoczi
2020-11-20 18:50 ` [RFC PATCH 10/27] vhost: Allocate shadow vring Eugenio Pérez
2020-12-08 7:49 ` Stefan Hajnoczi
2020-12-08 8:17 ` Stefan Hajnoczi
2020-12-09 18:15 ` Eugenio Perez Martin
2020-11-20 18:50 ` [RFC PATCH 11/27] virtio: const-ify all virtio_tswap* functions Eugenio Pérez
2020-11-20 18:50 ` [RFC PATCH 12/27] virtio: Add virtio_queue_full Eugenio Pérez
2020-11-20 18:50 ` Eugenio Pérez [this message]
2020-12-08 8:16 ` [RFC PATCH 13/27] vhost: Send buffers to device Stefan Hajnoczi
2020-12-09 18:41 ` Eugenio Perez Martin
2020-12-10 11:55 ` Stefan Hajnoczi
2021-01-22 18:18 ` Eugenio Perez Martin
[not found] ` <CAJaqyWdNeaboGaSsXPA8r=mUsbctFLzACFKLX55yRQpTvjqxJw@mail.gmail.com>
2021-03-22 10:51 ` Stefan Hajnoczi
2021-03-22 15:55 ` Eugenio Perez Martin
2021-03-22 17:40 ` Stefan Hajnoczi
2021-03-24 19:04 ` Eugenio Perez Martin
2021-03-24 19:56 ` Stefan Hajnoczi
2020-11-20 18:50 ` [RFC PATCH 14/27] virtio: Remove virtio_queue_get_used_notify_split Eugenio Pérez
2020-11-20 18:50 ` [RFC PATCH 15/27] vhost: Do not invalidate signalled used Eugenio Pérez
2020-11-20 18:50 ` [RFC PATCH 16/27] virtio: Expose virtqueue_alloc_element Eugenio Pérez
2020-12-08 8:25 ` Stefan Hajnoczi
2020-12-09 18:46 ` Eugenio Perez Martin
2020-12-10 11:57 ` Stefan Hajnoczi
2020-11-20 18:50 ` [RFC PATCH 17/27] vhost: add vhost_vring_set_notification_rcu Eugenio Pérez
2020-11-20 18:50 ` [RFC PATCH 18/27] vhost: add vhost_vring_poll_rcu Eugenio Pérez
2020-12-08 8:41 ` Stefan Hajnoczi
2020-12-09 18:48 ` Eugenio Perez Martin
2020-11-20 18:50 ` [RFC PATCH 19/27] vhost: add vhost_vring_get_buf_rcu Eugenio Pérez
2020-11-20 18:50 ` [RFC PATCH 20/27] vhost: Return used buffers Eugenio Pérez
2020-12-08 8:50 ` Stefan Hajnoczi
2020-11-20 18:50 ` [RFC PATCH 21/27] vhost: Add vhost_virtqueue_memory_unmap Eugenio Pérez
2020-11-20 18:51 ` [RFC PATCH 22/27] vhost: Add vhost_virtqueue_memory_map Eugenio Pérez
2020-11-20 18:51 ` [RFC PATCH 23/27] vhost: unmap qemu's shadow virtqueues on sw live migration Eugenio Pérez
2020-11-27 15:29 ` Stefano Garzarella
2020-11-30 7:54 ` Eugenio Perez Martin
2020-11-20 18:51 ` [RFC PATCH 24/27] vhost: iommu changes Eugenio Pérez
2020-12-08 9:02 ` Stefan Hajnoczi
2020-11-20 18:51 ` [RFC PATCH 25/27] vhost: Do not commit vhost used idx on vhost_virtqueue_stop Eugenio Pérez
2020-11-20 19:35 ` Eugenio Perez Martin
2020-11-20 18:51 ` [RFC PATCH 26/27] vhost: Add vhost_hdev_can_sw_lm Eugenio Pérez
2020-11-20 18:51 ` [RFC PATCH 27/27] vhost: forbid vhost devices logging Eugenio Pérez
2020-11-20 19:03 ` [RFC PATCH 00/27] vDPA software assisted live migration Eugenio Perez Martin
2020-11-20 19:30 ` no-reply
2020-11-25 7:08 ` Jason Wang
2020-11-25 12:03 ` Eugenio Perez Martin
2020-11-25 12:14 ` Eugenio Perez Martin
2020-11-26 3:07 ` Jason Wang
2020-11-27 15:44 ` Stefano Garzarella
2020-12-08 9:37 ` Stefan Hajnoczi
2020-12-09 9:26 ` Jason Wang
2020-12-09 15:57 ` Stefan Hajnoczi
2020-12-10 9:12 ` Jason Wang
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=20201120185105.279030-14-eperezma@redhat.com \
--to=eperezma@redhat.com \
--cc=alex.barba@broadcom.com \
--cc=ballle98@gmail.com \
--cc=cfontain@redhat.com \
--cc=dandaly0@gmail.com \
--cc=dmytro.kazantsev@gmail.com \
--cc=eli@mellanox.com \
--cc=hanand@xilinx.com \
--cc=howard.cai@gmail.com \
--cc=jasowang@redhat.com \
--cc=jim.harford@broadcom.com \
--cc=kvm@vger.kernel.org \
--cc=lars.ganrot@gmail.com \
--cc=liralon@gmail.com \
--cc=loseweigh@gmail.com \
--cc=maxgu14@gmail.com \
--cc=mehta.salil.lnk@gmail.com \
--cc=ml@napatech.com \
--cc=mst@redhat.com \
--cc=nitin.shrivastav@broadcom.com \
--cc=parav@mellanox.com \
--cc=qemu-devel@nongnu.org \
--cc=quintela@redhat.com \
--cc=rob.miller@broadcom.com \
--cc=sgarzare@redhat.com \
--cc=smooney@redhat.com \
--cc=stefanha@redhat.com \
--cc=stephenfin@redhat.com \
--cc=virtualization@lists.linux-foundation.org \
--cc=vmireyno@marvell.com \
--cc=xiao.w.wang@intel.com \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for NNTP newsgroup(s).