[<prev] [next>] [<thread-prev] [thread-next>] [day] [month] [year] [list]
Message-ID: <CACGkMEumFkT=Cu3dY1Vv1-1O5tyGa7uh+_nS=icA0uUx-MCx_w@mail.gmail.com>
Date: Mon, 29 Dec 2025 15:16:16 +0800
From: Jason Wang <jasowang@...hat.com>
To: "Michael S. Tsirkin" <mst@...hat.com>
Cc: xuanzhuo@...ux.alibaba.com, eperezma@...hat.com,
virtualization@...ts.linux.dev, linux-kernel@...r.kernel.org
Subject: Re: [PATCH V11 13/19] virtio_ring: introduce virtqueue ops
On Sat, Dec 27, 2025 at 3:45 AM Michael S. Tsirkin <mst@...hat.com> wrote:
>
> On Thu, Dec 25, 2025 at 12:26:02PM +0800, Jason Wang wrote:
> > This patch introduces virtqueue ops which is a set of callbacks
> > that will be called for different queue layout or features. This would
> > help to avoid branches for split/packed and will ease the future
> > implementation like in order.
> >
> > Note that in order to eliminate the indirect calls this patch uses
> > global array of const ops to allow compiler to avoid indirect
> > branches.
> >
> > Tested with CONFIG_MITIGATION_RETPOLINE, no performance differences
> > were noticed.
> >
> > Acked-by: Eugenio Pérez <eperezma@...hat.com>
> > Suggested-by: Michael S. Tsirkin <mst@...hat.com>
> > Signed-off-by: Jason Wang <jasowang@...hat.com>
> > ---
> > drivers/virtio/virtio_ring.c | 173 ++++++++++++++++++++++++++---------
> > 1 file changed, 130 insertions(+), 43 deletions(-)
> >
> > diff --git a/drivers/virtio/virtio_ring.c b/drivers/virtio/virtio_ring.c
> > index f804c5c6975a..4e905dc7b6cb 100644
> > --- a/drivers/virtio/virtio_ring.c
> > +++ b/drivers/virtio/virtio_ring.c
> > @@ -67,6 +67,12 @@
> > #define LAST_ADD_TIME_INVALID(vq)
> > #endif
> >
> > +enum vq_layout {
> > + SPLIT = 0,
> > + PACKED,
> > + VQ_TYPE_MAX,
> > +};
> > +
> > struct vring_desc_state_split {
> > void *data; /* Data for callback. */
> >
> > @@ -159,12 +165,29 @@ struct vring_virtqueue_packed {
> > size_t event_size_in_bytes;
> > };
> >
> > +struct vring_virtqueue;
> > +
> > +struct virtqueue_ops {
> > + int (*add)(struct vring_virtqueue *vq, struct scatterlist *sgs[],
> > + unsigned int total_sg, unsigned int out_sgs,
> > + unsigned int in_sgs, void *data,
> > + void *ctx, bool premapped, gfp_t gfp);
> > + void *(*get)(struct vring_virtqueue *vq, unsigned int *len, void **ctx);
> > + bool (*kick_prepare)(struct vring_virtqueue *vq);
> > + void (*disable_cb)(struct vring_virtqueue *vq);
> > + bool (*enable_cb_delayed)(struct vring_virtqueue *vq);
> > + unsigned int (*enable_cb_prepare)(struct vring_virtqueue *vq);
> > + bool (*poll)(const struct vring_virtqueue *vq,
> > + unsigned int last_used_idx);
> > + void *(*detach_unused_buf)(struct vring_virtqueue *vq);
> > + bool (*more_used)(const struct vring_virtqueue *vq);
> > + int (*resize)(struct vring_virtqueue *vq, u32 num);
> > + void (*reset)(struct vring_virtqueue *vq);
> > +};
> > +
> > struct vring_virtqueue {
> > struct virtqueue vq;
> >
> > - /* Is this a packed ring? */
> > - bool packed_ring;
> > -
> > /* Is DMA API used? */
> > bool use_map_api;
> >
> > @@ -180,6 +203,8 @@ struct vring_virtqueue {
> > /* Host publishes avail event idx */
> > bool event;
> >
> > + enum vq_layout layout;
> > +
> > /* Head of free buffer list. */
> > unsigned int free_head;
> > /* Number we've added since last sync. */
> > @@ -231,6 +256,12 @@ static void vring_free(struct virtqueue *_vq);
> >
> > #define to_vvq(_vq) container_of_const(_vq, struct vring_virtqueue, vq)
> >
> > +
> > +static inline bool virtqueue_is_packed(const struct vring_virtqueue *vq)
> > +{
> > + return vq->layout == PACKED;
> > +}
> > +
> > static bool virtqueue_use_indirect(const struct vring_virtqueue *vq,
> > unsigned int total_sg)
> > {
> > @@ -433,7 +464,7 @@ static void virtqueue_init(struct vring_virtqueue *vq, u32 num)
> > {
> > vq->vq.num_free = num;
> >
> > - if (vq->packed_ring)
> > + if (virtqueue_is_packed(vq))
> > vq->last_used_idx = 0 | (1 << VRING_PACKED_EVENT_F_WRAP_CTR);
> > else
> > vq->last_used_idx = 0;
> > @@ -1122,6 +1153,8 @@ static int vring_alloc_queue_split(struct vring_virtqueue_split *vring_split,
> > return 0;
> > }
> >
> > +static const struct virtqueue_ops split_ops;
> > +
> > static struct virtqueue *__vring_new_virtqueue_split(unsigned int index,
> > struct vring_virtqueue_split *vring_split,
> > struct virtio_device *vdev,
> > @@ -1139,7 +1172,7 @@ static struct virtqueue *__vring_new_virtqueue_split(unsigned int index,
> > if (!vq)
> > return NULL;
> >
> > - vq->packed_ring = false;
> > + vq->layout = SPLIT;
> > vq->vq.callback = callback;
> > vq->vq.vdev = vdev;
> > vq->vq.name = name;
> > @@ -2077,6 +2110,8 @@ static void virtqueue_reset_packed(struct vring_virtqueue *vq)
> > virtqueue_vring_init_packed(&vq->packed, !!vq->vq.callback);
> > }
> >
> > +static const struct virtqueue_ops packed_ops;
> > +
> > static struct virtqueue *__vring_new_virtqueue_packed(unsigned int index,
> > struct vring_virtqueue_packed *vring_packed,
> > struct virtio_device *vdev,
> > @@ -2107,7 +2142,7 @@ static struct virtqueue *__vring_new_virtqueue_packed(unsigned int index,
> > #else
> > vq->broken = false;
> > #endif
> > - vq->packed_ring = true;
> > + vq->layout = PACKED;
> > vq->map = map;
> > vq->use_map_api = vring_use_map_api(vdev);
> >
> > @@ -2195,6 +2230,39 @@ static int virtqueue_resize_packed(struct vring_virtqueue *vq, u32 num)
> > return -ENOMEM;
> > }
> >
> > +static const struct virtqueue_ops split_ops = {
> > + .add = virtqueue_add_split,
> > + .get = virtqueue_get_buf_ctx_split,
> > + .kick_prepare = virtqueue_kick_prepare_split,
> > + .disable_cb = virtqueue_disable_cb_split,
> > + .enable_cb_delayed = virtqueue_enable_cb_delayed_split,
> > + .enable_cb_prepare = virtqueue_enable_cb_prepare_split,
> > + .poll = virtqueue_poll_split,
> > + .detach_unused_buf = virtqueue_detach_unused_buf_split,
> > + .more_used = more_used_split,
> > + .resize = virtqueue_resize_split,
> > + .reset = virtqueue_reset_split,
> > +};
> > +
> > +static const struct virtqueue_ops packed_ops = {
> > + .add = virtqueue_add_packed,
> > + .get = virtqueue_get_buf_ctx_packed,
> > + .kick_prepare = virtqueue_kick_prepare_packed,
> > + .disable_cb = virtqueue_disable_cb_packed,
> > + .enable_cb_delayed = virtqueue_enable_cb_delayed_packed,
> > + .enable_cb_prepare = virtqueue_enable_cb_prepare_packed,
> > + .poll = virtqueue_poll_packed,
> > + .detach_unused_buf = virtqueue_detach_unused_buf_packed,
> > + .more_used = more_used_packed,
> > + .resize = virtqueue_resize_packed,
> > + .reset = virtqueue_reset_packed,
> > +};
> > +
> > +static const struct virtqueue_ops *const all_ops[VQ_TYPE_MAX] = {
> > + [SPLIT] = &split_ops,
> > + [PACKED] = &packed_ops
> > +};
> > +
> > static int virtqueue_disable_and_recycle(struct virtqueue *_vq,
> > void (*recycle)(struct virtqueue *vq, void *buf))
> > {
>
> Actually:
>
> > @@ -2237,6 +2305,39 @@ static int virtqueue_enable_after_reset(struct virtqueue *_vq)
> > * Generic functions and exported symbols.
> > */
> >
> > +#define VIRTQUEUE_CALL(vq, op, ...) \
> > + ({ \
>
> this macro evaluates vq many times.
> You can use a temporary
>
> struct vring_virtqueue *__VIRTQUEUE_CALL_vq = (vq);
>
> to avoid the issue.
>
>
> > + typeof(all_ops[SPLIT]->op(vq, ##__VA_ARGS__)) ret; \
> > + \
> > + switch (vq->layout) { \
>
> Should probably be (vq)->layout like in VOID_VIRTQUEUE_CALL,
> unless you use a temporary.
>
>
>
>
> > + case SPLIT: \
> > + ret = all_ops[SPLIT]->op(vq, ##__VA_ARGS__); \
>
> and (vq) here, too.
> unless you use a temporary.
>
>
>
> > + break; \
> > + case PACKED: \
> > + ret = all_ops[PACKED]->op(vq, ##__VA_ARGS__); \
> > + break; \
> > + default: \
> > + BUG(); \
> > + break; \
> > + } \
> > + ret; \
> > +})
> > +
> > +#define VOID_VIRTQUEUE_CALL(vq, op, ...) \
> > + ({ \
> > + switch ((vq)->layout) { \
> > + case SPLIT: \
> > + all_ops[SPLIT]->op(vq, ##__VA_ARGS__); \
> > + break; \
> > + case PACKED: \
> > + all_ops[PACKED]->op(vq, ##__VA_ARGS__); \
> > + break; \
> > + default: \
> > + BUG(); \
> > + break; \
> > + } \
> > +})
> > +
>
>
> we can just open-code here and drop all_ops completely?
>
> #define VOID_VIRTQUEUE_CALL(vq, op, ...) \
> ({ \
> switch ((vq)->layout) { \
> case SPLIT: \
> split_ops->op(vq, ##__VA_ARGS__); \
> break; \
> case PACKED: \
> packed_ops->op(vq, ##__VA_ARGS__); \
> break; \
> default: \
> BUG(); \
> break; \
> } \
> })
>
>
>
> then we do not need VQ_TYPE_MAX either.
Exactly, I've modified the code this way in the new version.
>
> I did not check this generates same code, pls do.
Will do.
Thanks
>
>
>
> > static inline int virtqueue_add(struct virtqueue *_vq,
> > struct scatterlist *sgs[],
> > unsigned int total_sg,
> > @@ -2249,10 +2350,9 @@ static inline int virtqueue_add(struct virtqueue *_vq,
> > {
> > struct vring_virtqueue *vq = to_vvq(_vq);
> >
> > - return vq->packed_ring ? virtqueue_add_packed(vq, sgs, total_sg,
> > - out_sgs, in_sgs, data, ctx, premapped, gfp) :
> > - virtqueue_add_split(vq, sgs, total_sg,
> > - out_sgs, in_sgs, data, ctx, premapped, gfp);
> > + return VIRTQUEUE_CALL(vq, add, sgs, total_sg,
> > + out_sgs, in_sgs, data,
> > + ctx, premapped, gfp);
> > }
> >
> > /**
> > @@ -2442,8 +2542,7 @@ bool virtqueue_kick_prepare(struct virtqueue *_vq)
> > {
> > struct vring_virtqueue *vq = to_vvq(_vq);
> >
> > - return vq->packed_ring ? virtqueue_kick_prepare_packed(vq) :
> > - virtqueue_kick_prepare_split(vq);
> > + return VIRTQUEUE_CALL(vq, kick_prepare);
> > }
> > EXPORT_SYMBOL_GPL(virtqueue_kick_prepare);
> >
> > @@ -2513,8 +2612,7 @@ void *virtqueue_get_buf_ctx(struct virtqueue *_vq, unsigned int *len,
> > {
> > struct vring_virtqueue *vq = to_vvq(_vq);
> >
> > - return vq->packed_ring ? virtqueue_get_buf_ctx_packed(vq, len, ctx) :
> > - virtqueue_get_buf_ctx_split(vq, len, ctx);
> > + return VIRTQUEUE_CALL(vq, get, len, ctx);
> > }
> > EXPORT_SYMBOL_GPL(virtqueue_get_buf_ctx);
> >
> > @@ -2536,10 +2634,7 @@ void virtqueue_disable_cb(struct virtqueue *_vq)
> > {
> > struct vring_virtqueue *vq = to_vvq(_vq);
> >
> > - if (vq->packed_ring)
> > - virtqueue_disable_cb_packed(vq);
> > - else
> > - virtqueue_disable_cb_split(vq);
> > + VOID_VIRTQUEUE_CALL(vq, disable_cb);
> > }
> > EXPORT_SYMBOL_GPL(virtqueue_disable_cb);
> >
> > @@ -2562,8 +2657,7 @@ unsigned int virtqueue_enable_cb_prepare(struct virtqueue *_vq)
> > if (vq->event_triggered)
> > vq->event_triggered = false;
> >
> > - return vq->packed_ring ? virtqueue_enable_cb_prepare_packed(vq) :
> > - virtqueue_enable_cb_prepare_split(vq);
> > + return VIRTQUEUE_CALL(vq, enable_cb_prepare);
> > }
> > EXPORT_SYMBOL_GPL(virtqueue_enable_cb_prepare);
> >
> > @@ -2584,8 +2678,8 @@ bool virtqueue_poll(struct virtqueue *_vq, unsigned int last_used_idx)
> > return false;
> >
> > virtio_mb(vq->weak_barriers);
> > - return vq->packed_ring ? virtqueue_poll_packed(vq, last_used_idx) :
> > - virtqueue_poll_split(vq, last_used_idx);
> > +
> > + return VIRTQUEUE_CALL(vq, poll, last_used_idx);
> > }
> > EXPORT_SYMBOL_GPL(virtqueue_poll);
> >
> > @@ -2628,8 +2722,7 @@ bool virtqueue_enable_cb_delayed(struct virtqueue *_vq)
> > if (vq->event_triggered)
> > data_race(vq->event_triggered = false);
> >
> > - return vq->packed_ring ? virtqueue_enable_cb_delayed_packed(vq) :
> > - virtqueue_enable_cb_delayed_split(vq);
> > + return VIRTQUEUE_CALL(vq, enable_cb_delayed);
> > }
> > EXPORT_SYMBOL_GPL(virtqueue_enable_cb_delayed);
> >
> > @@ -2645,14 +2738,13 @@ void *virtqueue_detach_unused_buf(struct virtqueue *_vq)
> > {
> > struct vring_virtqueue *vq = to_vvq(_vq);
> >
> > - return vq->packed_ring ? virtqueue_detach_unused_buf_packed(vq) :
> > - virtqueue_detach_unused_buf_split(vq);
> > + return VIRTQUEUE_CALL(vq, detach_unused_buf);
> > }
> > EXPORT_SYMBOL_GPL(virtqueue_detach_unused_buf);
> >
> > static inline bool more_used(const struct vring_virtqueue *vq)
> > {
> > - return vq->packed_ring ? more_used_packed(vq) : more_used_split(vq);
> > + return VIRTQUEUE_CALL(vq, more_used);
> > }
> >
> > /**
> > @@ -2782,7 +2874,7 @@ int virtqueue_resize(struct virtqueue *_vq, u32 num,
> > if (!num)
> > return -EINVAL;
> >
> > - if ((vq->packed_ring ? vq->packed.vring.num : vq->split.vring.num) == num)
> > + if (virtqueue_get_vring_size(_vq) == num)
> > return 0;
> >
> > err = virtqueue_disable_and_recycle(_vq, recycle);
> > @@ -2791,10 +2883,7 @@ int virtqueue_resize(struct virtqueue *_vq, u32 num,
> > if (recycle_done)
> > recycle_done(_vq);
> >
> > - if (vq->packed_ring)
> > - err = virtqueue_resize_packed(vq, num);
> > - else
> > - err = virtqueue_resize_split(vq, num);
> > + err = VIRTQUEUE_CALL(vq, resize, num);
> >
> > err_reset = virtqueue_enable_after_reset(_vq);
> > if (err_reset)
> > @@ -2832,10 +2921,7 @@ int virtqueue_reset(struct virtqueue *_vq,
> > if (recycle_done)
> > recycle_done(_vq);
> >
> > - if (vq->packed_ring)
> > - virtqueue_reset_packed(vq);
> > - else
> > - virtqueue_reset_split(vq);
> > + VOID_VIRTQUEUE_CALL(vq, reset);
> >
> > return virtqueue_enable_after_reset(_vq);
> > }
> > @@ -2878,7 +2964,7 @@ static void vring_free(struct virtqueue *_vq)
> > struct vring_virtqueue *vq = to_vvq(_vq);
> >
> > if (vq->we_own_ring) {
> > - if (vq->packed_ring) {
> > + if (virtqueue_is_packed(vq)) {
> > vring_free_queue(vq->vq.vdev,
> > vq->packed.ring_size_in_bytes,
> > vq->packed.vring.desc,
> > @@ -2907,7 +2993,7 @@ static void vring_free(struct virtqueue *_vq)
> > vq->map);
> > }
> > }
> > - if (!vq->packed_ring) {
> > + if (!virtqueue_is_packed(vq)) {
> > kfree(vq->split.desc_state);
> > kfree(vq->split.desc_extra);
> > }
> > @@ -2932,7 +3018,7 @@ u32 vring_notification_data(struct virtqueue *_vq)
> > struct vring_virtqueue *vq = to_vvq(_vq);
> > u16 next;
> >
> > - if (vq->packed_ring)
> > + if (virtqueue_is_packed(vq))
> > next = (vq->packed.next_avail_idx &
> > ~(-(1 << VRING_PACKED_EVENT_F_WRAP_CTR))) |
> > vq->packed.avail_wrap_counter <<
> > @@ -2985,7 +3071,8 @@ unsigned int virtqueue_get_vring_size(const struct virtqueue *_vq)
> >
> > const struct vring_virtqueue *vq = to_vvq(_vq);
> >
> > - return vq->packed_ring ? vq->packed.vring.num : vq->split.vring.num;
> > + return virtqueue_is_packed(vq) ? vq->packed.vring.num :
> > + vq->split.vring.num;
> > }
> > EXPORT_SYMBOL_GPL(virtqueue_get_vring_size);
> >
> > @@ -3068,7 +3155,7 @@ dma_addr_t virtqueue_get_desc_addr(const struct virtqueue *_vq)
> >
> > BUG_ON(!vq->we_own_ring);
> >
> > - if (vq->packed_ring)
> > + if (virtqueue_is_packed(vq))
> > return vq->packed.ring_dma_addr;
> >
> > return vq->split.queue_dma_addr;
> > @@ -3081,7 +3168,7 @@ dma_addr_t virtqueue_get_avail_addr(const struct virtqueue *_vq)
> >
> > BUG_ON(!vq->we_own_ring);
> >
> > - if (vq->packed_ring)
> > + if (virtqueue_is_packed(vq))
> > return vq->packed.driver_event_dma_addr;
> >
> > return vq->split.queue_dma_addr +
> > @@ -3095,7 +3182,7 @@ dma_addr_t virtqueue_get_used_addr(const struct virtqueue *_vq)
> >
> > BUG_ON(!vq->we_own_ring);
> >
> > - if (vq->packed_ring)
> > + if (virtqueue_is_packed(vq))
> > return vq->packed.device_event_dma_addr;
> >
> > return vq->split.queue_dma_addr +
> > --
> > 2.31.1
>
Powered by blists - more mailing lists