qemu-devel
[Top][All Lists]
Advanced

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]

Re: [PATCH v4 6/6] vdpa: Always start CVQ in SVQ mode


From: Jason Wang
Subject: Re: [PATCH v4 6/6] vdpa: Always start CVQ in SVQ mode
Date: Fri, 19 Aug 2022 14:18:06 +0800

On Tue, Aug 9, 2022 at 3:54 PM Eugenio Perez Martin <eperezma@redhat.com> wrote:
>
> On Tue, Aug 9, 2022 at 9:36 AM Jason Wang <jasowang@redhat.com> wrote:
> >
> > On Sat, Aug 6, 2022 at 12:39 AM Eugenio Pérez <eperezma@redhat.com> wrote:
> > >
> > > Isolate control virtqueue in its own group, allowing to intercept control
> > > commands but letting dataplane run totally passthrough to the guest.
> > >
> > > Signed-off-by: Eugenio Pérez <eperezma@redhat.com>
> > > ---
> > > v4:
> > > * Squash vhost_vdpa_cvq_group_is_independent.
> > > * Rebased on last CVQ start series, that allocated CVQ cmd bufs at load
> > > * Do not check for cvq index on vhost_vdpa_net_prepare, we only have one
> > >   that callback registered in that NetClientInfo.
> > >
> > > v3:
> > > * Make asid related queries print a warning instead of returning an
> > >   error and stop the start of qemu.
> > > ---
> > >  hw/virtio/vhost-vdpa.c |   3 +-
> > >  net/vhost-vdpa.c       | 124 +++++++++++++++++++++++++++++++++++++++--
> > >  2 files changed, 122 insertions(+), 5 deletions(-)
> > >
> > > diff --git a/hw/virtio/vhost-vdpa.c b/hw/virtio/vhost-vdpa.c
> > > index 3eb67b27b7..69f34f4cc5 100644
> > > --- a/hw/virtio/vhost-vdpa.c
> > > +++ b/hw/virtio/vhost-vdpa.c
> > > @@ -678,7 +678,8 @@ static int vhost_vdpa_set_backend_cap(struct 
> > > vhost_dev *dev)
> > >  {
> > >      uint64_t features;
> > >      uint64_t f = 0x1ULL << VHOST_BACKEND_F_IOTLB_MSG_V2 |
> > > -        0x1ULL << VHOST_BACKEND_F_IOTLB_BATCH;
> > > +        0x1ULL << VHOST_BACKEND_F_IOTLB_BATCH |
> > > +        0x1ULL << VHOST_BACKEND_F_IOTLB_ASID;
> > >      int r;
> > >
> > >      if (vhost_vdpa_call(dev, VHOST_GET_BACKEND_FEATURES, &features)) {
> > > diff --git a/net/vhost-vdpa.c b/net/vhost-vdpa.c
> > > index bf78b1332f..c820a5fd9f 100644
> > > --- a/net/vhost-vdpa.c
> > > +++ b/net/vhost-vdpa.c
> > > @@ -37,6 +37,9 @@ typedef struct VhostVDPAState {
> > >      /* Control commands shadow buffers */
> > >      void *cvq_cmd_out_buffer, *cvq_cmd_in_buffer;
> > >
> > > +    /* Number of address spaces supported by the device */
> > > +    unsigned address_space_num;
> > > +
> > >      /* The device always have SVQ enabled */
> > >      bool always_svq;
> > >      bool started;
> > > @@ -100,6 +103,9 @@ static const uint64_t vdpa_svq_device_features =
> > >      BIT_ULL(VIRTIO_NET_F_RSC_EXT) |
> > >      BIT_ULL(VIRTIO_NET_F_STANDBY);
> > >
> > > +#define VHOST_VDPA_NET_CVQ_PASSTHROUGH 0
> >
> > We need a better name for the macro since it's not easy to see it's an asid.
> >
>
> VHOST_VDPA_NET_DATA_ASID?

Looks fine.

>
> > > +#define VHOST_VDPA_NET_CVQ_ASID 1
> > > +
> > >  VHostNetState *vhost_vdpa_get_vhost_net(NetClientState *nc)
> > >  {
> > >      VhostVDPAState *s = DO_UPCAST(VhostVDPAState, nc, nc);
> > > @@ -224,6 +230,37 @@ static NetClientInfo net_vhost_vdpa_info = {
> > >          .check_peer_type = vhost_vdpa_check_peer_type,
> > >  };
> > >
> > > +static void vhost_vdpa_get_vring_group(int device_fd,
> > > +                                       struct vhost_vring_state *state)
> > > +{
> > > +    int r = ioctl(device_fd, VHOST_VDPA_GET_VRING_GROUP, state);
> >
> > Let's hide vhost_vring_state from the caller and simply accept a vq
> > index parameter (as the below function did) then we can return the
> > group id.
> >
> > The hides low level ABI and simplify the caller's code.
> >
>
> We need to return an error.
>
> The example is a little bit pathological, but if we get that CVQ is on
> vq group != 0, and all data vqs returns an error reading the vq group,
> I think we shouldn't assume they belong to the asid 0. Some of them
> could be on the same vq group as cvq, making all of this fail.
>
> Can we assume the vq group is an uint32_t? Would it work to return an
> int64_t with the possibility of errors?

Yes, or I think a simple int should be fine, I can't image we will
make use of the full 32 bit in near future.

>
> > > +    if (unlikely(r < 0)) {
> > > +        /*
> > > +         * Assume all groups are 0, the consequences are the same and we 
> > > will
> > > +         * not abort device creation
> > > +         */
> > > +        state->num = 0;
> > > +    }
> > > +}
> > > +
> > > +static int vhost_vdpa_set_address_space_id(struct vhost_vdpa *v,
> > > +                                           unsigned vq_group,
> > > +                                           unsigned asid_num)
> > > +{
> > > +    struct vhost_vring_state asid = {
> > > +        .index = vq_group,
> > > +        .num = asid_num,
> > > +    };
> > > +    int ret;
> > > +
> > > +    ret = ioctl(v->device_fd, VHOST_VDPA_SET_GROUP_ASID, &asid);
> > > +    if (unlikely(ret < 0)) {
> > > +        warn_report("Can't set vq group %u asid %u, errno=%d (%s)",
> > > +            asid.index, asid.num, errno, g_strerror(errno));
> > > +    }
> > > +    return ret;
> > > +}
> > > +
> > >  static void vhost_vdpa_cvq_unmap_buf(struct vhost_vdpa *v, void *addr)
> > >  {
> > >      VhostIOVATree *tree = v->iova_tree;
> > > @@ -298,11 +335,55 @@ dma_map_err:
> > >  static int vhost_vdpa_net_cvq_prepare(NetClientState *nc)
> > >  {
> > >      VhostVDPAState *s;
> > > +    struct vhost_vdpa *v;
> > > +    struct vhost_vring_state cvq_group = {};
> > >      int r;
> > >
> > >      assert(nc->info->type == NET_CLIENT_DRIVER_VHOST_VDPA);
> > >
> > >      s = DO_UPCAST(VhostVDPAState, nc, nc);
> > > +    v = &s->vhost_vdpa;
> > > +    cvq_group.index = v->dev->vq_index_end - 1;
> > > +
> > > +    /* Default values */
> >
> > Code can explain itself so this comment is probably useless.
> >
>
> I'll delete.
>
> > > +    v->shadow_vqs_enabled = false;
> > > +    s->vhost_vdpa.address_space_id = VHOST_VDPA_NET_CVQ_PASSTHROUGH;
> > > +
> > > +    if (s->always_svq) {
> > > +        v->shadow_vqs_enabled = true;
> >
> > The name of the variable is suboptimal.
> >
> > I think we need to differ:
> >
> > 1) shadow all virtqueues
> >
> > from
> >
> > 2) shadow cvq only
> >
>
> Note that shadow_vqs_enabled is per vhost_vdpa, so
> v->shadow_vqs_enabled means that vqs of *v* are shadowed.
>
> Data vhost_vdpa can have a different value than CVQ vhost_vdpa.
>
> Having said that, I'm ok with changing the name of the variable, but I
> cannot come with a better one.

Ok, let's leave it as is.

Thanks

>
> Thanks!
>
> > Thanks
> >
> > > +        goto out;
> > > +    }
> > > +
> > > +    if (s->address_space_num < 2) {
> > > +        return 0;
> > > +    }
> > > +
> > > +    /**
> > > +     * Check if all the virtqueues of the virtio device are in a 
> > > different vq
> > > +     * than the last vq. VQ group of last group passed in cvq_group.
> > > +     */
> > > +    vhost_vdpa_get_vring_group(v->device_fd, &cvq_group);
> > > +    for (int i = 0; i < (v->dev->vq_index_end - 1); ++i) {
> > > +        struct vhost_vring_state vq_group = {
> > > +            .index = i,
> > > +        };
> > > +
> > > +        vhost_vdpa_get_vring_group(v->device_fd, &vq_group);
> > > +        if (unlikely(vq_group.num == cvq_group.num)) {
> > > +            warn_report("CVQ %u group is the same as VQ %u one (%u)",
> > > +                         cvq_group.index, vq_group.index, cvq_group.num);
> > > +            return 0;
> > > +        }
> > > +    }
> > > +
> > > +    r = vhost_vdpa_set_address_space_id(v, cvq_group.num,
> > > +                                        VHOST_VDPA_NET_CVQ_ASID);
> > > +    if (r == 0) {
> > > +        v->shadow_vqs_enabled = true;
> > > +        s->vhost_vdpa.address_space_id = VHOST_VDPA_NET_CVQ_ASID;
> > > +    }
> > > +
> > > +out:
> > >      if (!s->vhost_vdpa.shadow_vqs_enabled) {
> > >          return 0;
> > >      }
> > > @@ -523,12 +604,38 @@ static const VhostShadowVirtqueueOps 
> > > vhost_vdpa_net_svq_ops = {
> > >      .avail_handler = vhost_vdpa_net_handle_ctrl_avail,
> > >  };
> > >
> > > +static uint32_t vhost_vdpa_get_as_num(int vdpa_device_fd)
> > > +{
> > > +    uint64_t features;
> > > +    unsigned num_as;
> > > +    int r;
> > > +
> > > +    r = ioctl(vdpa_device_fd, VHOST_GET_BACKEND_FEATURES, &features);
> > > +    if (unlikely(r < 0)) {
> > > +        warn_report("Cannot get backend features");
> > > +        return 1;
> > > +    }
> > > +
> > > +    if (!(features & BIT_ULL(VHOST_BACKEND_F_IOTLB_ASID))) {
> > > +        return 1;
> > > +    }
> > > +
> > > +    r = ioctl(vdpa_device_fd, VHOST_VDPA_GET_AS_NUM, &num_as);
> > > +    if (unlikely(r < 0)) {
> > > +        warn_report("Cannot retrieve number of supported ASs");
> > > +        return 1;
> > > +    }
> > > +
> > > +    return num_as;
> > > +}
> > > +
> > >  static NetClientState *net_vhost_vdpa_init(NetClientState *peer,
> > >                                             const char *device,
> > >                                             const char *name,
> > >                                             int vdpa_device_fd,
> > >                                             int queue_pair_index,
> > >                                             int nvqs,
> > > +                                           unsigned nas,
> > >                                             bool is_datapath,
> > >                                             bool svq,
> > >                                             VhostIOVATree *iova_tree)
> > > @@ -547,6 +654,7 @@ static NetClientState 
> > > *net_vhost_vdpa_init(NetClientState *peer,
> > >      snprintf(nc->info_str, sizeof(nc->info_str), TYPE_VHOST_VDPA);
> > >      s = DO_UPCAST(VhostVDPAState, nc, nc);
> > >
> > > +    s->address_space_num = nas;
> > >      s->vhost_vdpa.device_fd = vdpa_device_fd;
> > >      s->vhost_vdpa.index = queue_pair_index;
> > >      s->always_svq = svq;
> > > @@ -632,6 +740,8 @@ int net_init_vhost_vdpa(const Netdev *netdev, const 
> > > char *name,
> > >      g_autoptr(VhostIOVATree) iova_tree = NULL;
> > >      NetClientState *nc;
> > >      int queue_pairs, r, i = 0, has_cvq = 0;
> > > +    unsigned num_as = 1;
> > > +    bool svq_cvq;
> > >
> > >      assert(netdev->type == NET_CLIENT_DRIVER_VHOST_VDPA);
> > >      opts = &netdev->u.vhost_vdpa;
> > > @@ -656,7 +766,13 @@ int net_init_vhost_vdpa(const Netdev *netdev, const 
> > > char *name,
> > >          goto err;
> > >      }
> > >
> > > -    if (opts->x_svq) {
> > > +    svq_cvq = opts->x_svq;
> > > +    if (has_cvq && !opts->x_svq) {
> > > +        num_as = vhost_vdpa_get_as_num(vdpa_device_fd);
> > > +        svq_cvq = num_as > 1;
> > > +    }
> > > +
> > > +    if (opts->x_svq || svq_cvq) {
> > >          struct vhost_vdpa_iova_range iova_range;
> > >
> > >          uint64_t invalid_dev_features =
> > > @@ -679,15 +795,15 @@ int net_init_vhost_vdpa(const Netdev *netdev, const 
> > > char *name,
> > >
> > >      for (i = 0; i < queue_pairs; i++) {
> > >          ncs[i] = net_vhost_vdpa_init(peer, TYPE_VHOST_VDPA, name,
> > > -                                     vdpa_device_fd, i, 2, true, 
> > > opts->x_svq,
> > > -                                     iova_tree);
> > > +                                     vdpa_device_fd, i, 2, num_as, true,
> > > +                                     opts->x_svq, iova_tree);
> > >          if (!ncs[i])
> > >              goto err;
> > >      }
> > >
> > >      if (has_cvq) {
> > >          nc = net_vhost_vdpa_init(peer, TYPE_VHOST_VDPA, name,
> > > -                                 vdpa_device_fd, i, 1, false,
> > > +                                 vdpa_device_fd, i, 1, num_as, false,
> > >                                   opts->x_svq, iova_tree);
> > >          if (!nc)
> > >              goto err;
> > > --
> > > 2.31.1
> > >
> >
>




reply via email to

[Prev in Thread] Current Thread [Next in Thread]