On Fri, Sep 19, 2025 at 03:31:48PM +0800, Jason Wang wrote:
> This patch introduces virtqueue ops, a set of callbacks that will be
> called for different queue layouts or features. This helps to avoid
> branches for split/packed and will ease future implementations such as
> in-order.
> 
> Note that in order to eliminate the indirect calls, this patch uses a
> global array of const ops to allow the compiler to avoid indirect
> branches.
> 
> Tested with CONFIG_MITIGATION_RETPOLINE; no performance differences
> were noticed.
> 
> Acked-by: Eugenio Pérez <epere...@redhat.com>
> Suggested-by: Michael S. Tsirkin <m...@redhat.com>
> Signed-off-by: Jason Wang <jasow...@redhat.com>
> ---
>  drivers/virtio/virtio_ring.c | 173 ++++++++++++++++++++++++++---------
>  1 file changed, 130 insertions(+), 43 deletions(-)
> 
> diff --git a/drivers/virtio/virtio_ring.c b/drivers/virtio/virtio_ring.c
> index b1b6af297061..1045c553ee65 100644
> --- a/drivers/virtio/virtio_ring.c
> +++ b/drivers/virtio/virtio_ring.c
> @@ -67,6 +67,12 @@
>  #define LAST_ADD_TIME_INVALID(vq)
>  #endif
>  
> +enum vq_layout {
> +     SPLIT = 0,
> +     PACKED,
> +     VQ_TYPE_MAX,
> +};
> +
>  struct vring_desc_state_split {
>       void *data;                     /* Data for callback. */
>  
> @@ -159,12 +165,28 @@ struct vring_virtqueue_packed {
>       size_t event_size_in_bytes;
>  };
>  
> +struct vring_virtqueue;
> +
> +struct virtqueue_ops {
> +     int (*add)(struct vring_virtqueue *_vq, struct scatterlist *sgs[],
> +                unsigned int total_sg, unsigned int out_sgs,
> +                unsigned int in_sgs, void *data,
> +                void *ctx, bool premapped, gfp_t gfp);

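Why is the parameter named _vq here? All the other ops name it vq, and
_vq is otherwise used in this file for the struct virtqueue * argument.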


> +     void *(*get)(struct vring_virtqueue *vq, unsigned int *len, void **ctx);
> +     bool (*kick_prepare)(struct vring_virtqueue *vq);
> +     void (*disable_cb)(struct vring_virtqueue *vq);
> +     bool (*enable_cb_delayed)(struct vring_virtqueue *vq);
> +     unsigned int (*enable_cb_prepare)(struct vring_virtqueue *vq);
> +     bool (*poll)(const struct vring_virtqueue *vq, u16 last_used_idx);
> +     void *(*detach_unused_buf)(struct vring_virtqueue *vq);
> +     bool (*more_used)(const struct vring_virtqueue *vq);
> +     int (*resize)(struct vring_virtqueue *vq, u32 num);
> +     void (*reset)(struct vring_virtqueue *vq);
> +};
> +
>  struct vring_virtqueue {
>       struct virtqueue vq;
>  
> -     /* Is this a packed ring? */
> -     bool packed_ring;
> -
>       /* Is DMA API used? */
>       bool use_map_api;
>  
> @@ -180,6 +202,8 @@ struct vring_virtqueue {
>       /* Host publishes avail event idx */
>       bool event;
>  
> +     enum vq_layout layout;
> +
>       /* Head of free buffer list. */
>       unsigned int free_head;
>       /* Number we've added since last sync. */
> @@ -231,6 +255,12 @@ static void vring_free(struct virtqueue *_vq);
>  
>  #define to_vvq(_vq) container_of_const(_vq, struct vring_virtqueue, vq)
>  
> +

Why the extra empty line here? There is already a blank line after the
to_vvq() definition.


> +static inline bool virtqueue_is_packed(const struct vring_virtqueue *vq)
> +{
> +     return vq->layout == PACKED;
> +}
> +
>  static bool virtqueue_use_indirect(const struct vring_virtqueue *vq,
>                                  unsigned int total_sg)
>  {
> @@ -433,7 +463,7 @@ static void virtqueue_init(struct vring_virtqueue *vq, 
> u32 num)
>  {
>       vq->vq.num_free = num;
>  
> -     if (vq->packed_ring)
> +     if (virtqueue_is_packed(vq))
>               vq->last_used_idx = 0 | (1 << VRING_PACKED_EVENT_F_WRAP_CTR);
>       else
>               vq->last_used_idx = 0;
> @@ -1121,6 +1151,8 @@ static int vring_alloc_queue_split(struct 
> vring_virtqueue_split *vring_split,
>       return 0;
>  }
>  
> +static const struct virtqueue_ops split_ops;
> +
>  static struct virtqueue *__vring_new_virtqueue_split(unsigned int index,
>                                              struct vring_virtqueue_split 
> *vring_split,
>                                              struct virtio_device *vdev,
> @@ -1138,7 +1170,7 @@ static struct virtqueue 
> *__vring_new_virtqueue_split(unsigned int index,
>       if (!vq)
>               return NULL;
>  
> -     vq->packed_ring = false;
> +     vq->layout = SPLIT;
>       vq->vq.callback = callback;
>       vq->vq.vdev = vdev;
>       vq->vq.name = name;
> @@ -2075,6 +2107,8 @@ static void virtqueue_reset_packed(struct 
> vring_virtqueue *vq)
>       virtqueue_vring_init_packed(&vq->packed, !!vq->vq.callback);
>  }
>  
> +static const struct virtqueue_ops packed_ops;
> +
>  static struct virtqueue *__vring_new_virtqueue_packed(unsigned int index,
>                                              struct vring_virtqueue_packed 
> *vring_packed,
>                                              struct virtio_device *vdev,
> @@ -2105,7 +2139,7 @@ static struct virtqueue 
> *__vring_new_virtqueue_packed(unsigned int index,
>  #else
>       vq->broken = false;
>  #endif
> -     vq->packed_ring = true;
> +     vq->layout = PACKED;
>       vq->map = map;
>       vq->use_map_api = vring_use_map_api(vdev);
>  
> @@ -2193,6 +2227,39 @@ static int virtqueue_resize_packed(struct 
> vring_virtqueue *vq, u32 num)
>       return -ENOMEM;
>  }
>  
> +static const struct virtqueue_ops split_ops = {
> +     .add = virtqueue_add_split,
> +     .get = virtqueue_get_buf_ctx_split,
> +     .kick_prepare = virtqueue_kick_prepare_split,
> +     .disable_cb = virtqueue_disable_cb_split,
> +     .enable_cb_delayed = virtqueue_enable_cb_delayed_split,
> +     .enable_cb_prepare = virtqueue_enable_cb_prepare_split,
> +     .poll = virtqueue_poll_split,
> +     .detach_unused_buf = virtqueue_detach_unused_buf_split,
> +     .more_used = more_used_split,
> +     .resize = virtqueue_resize_split,
> +     .reset = virtqueue_reset_split,
> +};
> +
> +static const struct virtqueue_ops packed_ops = {
> +     .add = virtqueue_add_packed,
> +     .get = virtqueue_get_buf_ctx_packed,
> +     .kick_prepare = virtqueue_kick_prepare_packed,
> +     .disable_cb = virtqueue_disable_cb_packed,
> +     .enable_cb_delayed = virtqueue_enable_cb_delayed_packed,
> +     .enable_cb_prepare = virtqueue_enable_cb_prepare_packed,
> +     .poll = virtqueue_poll_packed,
> +     .detach_unused_buf = virtqueue_detach_unused_buf_packed,
> +     .more_used = more_used_packed,
> +     .resize = virtqueue_resize_packed,
> +     .reset = virtqueue_reset_packed,
> +};
> +
> +static const struct virtqueue_ops *const all_ops[VQ_TYPE_MAX] = {
> +     [SPLIT] = &split_ops,
> +     [PACKED] = &packed_ops
> +};
> +
>  static int virtqueue_disable_and_recycle(struct virtqueue *_vq,
>                                        void (*recycle)(struct virtqueue *vq, 
> void *buf))
>  {
> @@ -2235,6 +2302,39 @@ static int virtqueue_enable_after_reset(struct 
> virtqueue *_vq)
>   * Generic functions and exported symbols.
>   */
>  
> +#define VIRTQUEUE_CALL(vq, op, ...)                                  \
> +     ({                                                              \
> +     typeof(all_ops[SPLIT]->op(vq, ##__VA_ARGS__)) ret;              \
> +                                                                     \
> +     switch (vq->layout) {                                           \
> +     case SPLIT:                                                     \
> +             ret = all_ops[SPLIT]->op(vq, ##__VA_ARGS__);            \
> +             break;                                                  \
> +     case PACKED:                                                    \
> +             ret = all_ops[PACKED]->op(vq, ##__VA_ARGS__);           \
> +             break;                                                  \
> +     default:                                                        \
> +             BUG();                                                  \
> +             break;                                                  \
> +     }                                                               \
> +     ret;                                                            \
> +})
> +
> +#define VOID_VIRTQUEUE_CALL(vq, op, ...)             \
> +     ({                                              \
> +     switch ((vq)->layout) {                 \
> +     case SPLIT:                                     \
> +             all_ops[SPLIT]->op(vq, ##__VA_ARGS__);  \
> +             break;                                  \
> +     case PACKED:                                    \
> +             all_ops[PACKED]->op(vq, ##__VA_ARGS__); \
> +             break;                                  \
> +     default:                                        \
> +             BUG();                                  \
> +             break;                                  \
> +     }                                               \
> +})
> +
>  static inline int virtqueue_add(struct virtqueue *_vq,
>                               struct scatterlist *sgs[],
>                               unsigned int total_sg,
> @@ -2247,10 +2347,9 @@ static inline int virtqueue_add(struct virtqueue *_vq,
>  {
>       struct vring_virtqueue *vq = to_vvq(_vq);
>  
> -     return vq->packed_ring ? virtqueue_add_packed(vq, sgs, total_sg,
> -                                     out_sgs, in_sgs, data, ctx, premapped, 
> gfp) :
> -                              virtqueue_add_split(vq, sgs, total_sg,
> -                                     out_sgs, in_sgs, data, ctx, premapped, 
> gfp);
> +     return VIRTQUEUE_CALL(vq, add, sgs, total_sg,
> +                           out_sgs, in_sgs, data,
> +                           ctx, premapped, gfp);
>  }
>  
>  /**
> @@ -2440,8 +2539,7 @@ bool virtqueue_kick_prepare(struct virtqueue *_vq)
>  {
>       struct vring_virtqueue *vq = to_vvq(_vq);
>  
> -     return vq->packed_ring ? virtqueue_kick_prepare_packed(vq) :
> -                              virtqueue_kick_prepare_split(vq);
> +     return VIRTQUEUE_CALL(vq, kick_prepare);
>  }
>  EXPORT_SYMBOL_GPL(virtqueue_kick_prepare);
>  
> @@ -2511,8 +2609,7 @@ void *virtqueue_get_buf_ctx(struct virtqueue *_vq, 
> unsigned int *len,
>  {
>       struct vring_virtqueue *vq = to_vvq(_vq);
>  
> -     return vq->packed_ring ? virtqueue_get_buf_ctx_packed(vq, len, ctx) :
> -                              virtqueue_get_buf_ctx_split(vq, len, ctx);
> +     return VIRTQUEUE_CALL(vq, get, len, ctx);
>  }
>  EXPORT_SYMBOL_GPL(virtqueue_get_buf_ctx);
>  
> @@ -2534,10 +2631,7 @@ void virtqueue_disable_cb(struct virtqueue *_vq)
>  {
>       struct vring_virtqueue *vq = to_vvq(_vq);
>  
> -     if (vq->packed_ring)
> -             virtqueue_disable_cb_packed(vq);
> -     else
> -             virtqueue_disable_cb_split(vq);
> +     VOID_VIRTQUEUE_CALL(vq, disable_cb);
>  }
>  EXPORT_SYMBOL_GPL(virtqueue_disable_cb);
>  
> @@ -2560,8 +2654,7 @@ unsigned int virtqueue_enable_cb_prepare(struct 
> virtqueue *_vq)
>       if (vq->event_triggered)
>               vq->event_triggered = false;
>  
> -     return vq->packed_ring ? virtqueue_enable_cb_prepare_packed(vq) :
> -                              virtqueue_enable_cb_prepare_split(vq);
> +     return VIRTQUEUE_CALL(vq, enable_cb_prepare);
>  }
>  EXPORT_SYMBOL_GPL(virtqueue_enable_cb_prepare);
>  
> @@ -2582,8 +2675,8 @@ bool virtqueue_poll(struct virtqueue *_vq, unsigned int 
> last_used_idx)
>               return false;
>  
>       virtio_mb(vq->weak_barriers);
> -     return vq->packed_ring ? virtqueue_poll_packed(vq, last_used_idx) :
> -                              virtqueue_poll_split(vq, last_used_idx);
> +
> +     return VIRTQUEUE_CALL(vq, poll, last_used_idx);
>  }
>  EXPORT_SYMBOL_GPL(virtqueue_poll);
>  
> @@ -2626,8 +2719,7 @@ bool virtqueue_enable_cb_delayed(struct virtqueue *_vq)
>       if (vq->event_triggered)
>               data_race(vq->event_triggered = false);
>  
> -     return vq->packed_ring ? virtqueue_enable_cb_delayed_packed(vq) :
> -                              virtqueue_enable_cb_delayed_split(vq);
> +     return VIRTQUEUE_CALL(vq, enable_cb_delayed);
>  }
>  EXPORT_SYMBOL_GPL(virtqueue_enable_cb_delayed);
>  
> @@ -2643,14 +2735,13 @@ void *virtqueue_detach_unused_buf(struct virtqueue 
> *_vq)
>  {
>       struct vring_virtqueue *vq = to_vvq(_vq);
>  
> -     return vq->packed_ring ? virtqueue_detach_unused_buf_packed(vq) :
> -                              virtqueue_detach_unused_buf_split(vq);
> +     return VIRTQUEUE_CALL(vq, detach_unused_buf);
>  }
>  EXPORT_SYMBOL_GPL(virtqueue_detach_unused_buf);
>  
>  static inline bool more_used(const struct vring_virtqueue *vq)
>  {
> -     return vq->packed_ring ? more_used_packed(vq) : more_used_split(vq);
> +     return VIRTQUEUE_CALL(vq, more_used);
>  }
>  
>  /**
> @@ -2780,7 +2871,8 @@ int virtqueue_resize(struct virtqueue *_vq, u32 num,
>       if (!num)
>               return -EINVAL;
>  
> -     if ((vq->packed_ring ? vq->packed.vring.num : vq->split.vring.num) == 
> num)
> +     if ((virtqueue_is_packed(vq) ? vq->packed.vring.num :
> +                                    vq->split.vring.num) == num)
>               return 0;
>  
>       err = virtqueue_disable_and_recycle(_vq, recycle);
> @@ -2789,10 +2881,7 @@ int virtqueue_resize(struct virtqueue *_vq, u32 num,
>       if (recycle_done)
>               recycle_done(_vq);
>  
> -     if (vq->packed_ring)
> -             err = virtqueue_resize_packed(vq, num);
> -     else
> -             err = virtqueue_resize_split(vq, num);
> +     err = VIRTQUEUE_CALL(vq, resize, num);
>  
>       err_reset = virtqueue_enable_after_reset(_vq);
>       if (err_reset)
> @@ -2830,10 +2919,7 @@ int virtqueue_reset(struct virtqueue *_vq,
>       if (recycle_done)
>               recycle_done(_vq);
>  
> -     if (vq->packed_ring)
> -             virtqueue_reset_packed(vq);
> -     else
> -             virtqueue_reset_split(vq);
> +     VOID_VIRTQUEUE_CALL(vq, reset);
>  
>       return virtqueue_enable_after_reset(_vq);
>  }
> @@ -2876,7 +2962,7 @@ static void vring_free(struct virtqueue *_vq)
>       struct vring_virtqueue *vq = to_vvq(_vq);
>  
>       if (vq->we_own_ring) {
> -             if (vq->packed_ring) {
> +             if (virtqueue_is_packed(vq)) {
>                       vring_free_queue(vq->vq.vdev,
>                                        vq->packed.ring_size_in_bytes,
>                                        vq->packed.vring.desc,
> @@ -2905,7 +2991,7 @@ static void vring_free(struct virtqueue *_vq)
>                                        vq->map);
>               }
>       }
> -     if (!vq->packed_ring) {
> +     if (!virtqueue_is_packed(vq)) {
>               kfree(vq->split.desc_state);
>               kfree(vq->split.desc_extra);
>       }
> @@ -2930,7 +3016,7 @@ u32 vring_notification_data(struct virtqueue *_vq)
>       struct vring_virtqueue *vq = to_vvq(_vq);
>       u16 next;
>  
> -     if (vq->packed_ring)
> +     if (virtqueue_is_packed(vq))
>               next = (vq->packed.next_avail_idx &
>                               ~(-(1 << VRING_PACKED_EVENT_F_WRAP_CTR))) |
>                       vq->packed.avail_wrap_counter <<
> @@ -2983,7 +3069,8 @@ unsigned int virtqueue_get_vring_size(const struct 
> virtqueue *_vq)
>  
>       const struct vring_virtqueue *vq = to_vvq(_vq);
>  
> -     return vq->packed_ring ? vq->packed.vring.num : vq->split.vring.num;
> +     return virtqueue_is_packed(vq) ? vq->packed.vring.num :
> +                                   vq->split.vring.num;
>  }
>  EXPORT_SYMBOL_GPL(virtqueue_get_vring_size);
>  
> @@ -3066,7 +3153,7 @@ dma_addr_t virtqueue_get_desc_addr(const struct 
> virtqueue *_vq)
>  
>       BUG_ON(!vq->we_own_ring);
>  
> -     if (vq->packed_ring)
> +     if (virtqueue_is_packed(vq))
>               return vq->packed.ring_dma_addr;
>  
>       return vq->split.queue_dma_addr;
> @@ -3079,7 +3166,7 @@ dma_addr_t virtqueue_get_avail_addr(const struct 
> virtqueue *_vq)
>  
>       BUG_ON(!vq->we_own_ring);
>  
> -     if (vq->packed_ring)
> +     if (virtqueue_is_packed(vq))
>               return vq->packed.driver_event_dma_addr;
>  
>       return vq->split.queue_dma_addr +
> @@ -3093,7 +3180,7 @@ dma_addr_t virtqueue_get_used_addr(const struct 
> virtqueue *_vq)
>  
>       BUG_ON(!vq->we_own_ring);
>  
> -     if (vq->packed_ring)
> +     if (virtqueue_is_packed(vq))
>               return vq->packed.device_event_dma_addr;
>  
>       return vq->split.queue_dma_addr +
> -- 
> 2.31.1


Reply via email to