Re: [PATCH vhost v4 12/16] vdpa/mlx5: Improve mr update flow

From: Dragos Tatulea
Date: Mon Oct 23 2023 - 04:07:10 EST


On Fri, 2023-10-20 at 18:01 +0200, Eugenio Perez Martin wrote:
> On Wed, Oct 18, 2023 at 7:21 PM Dragos Tatulea <dtatulea@xxxxxxxxxx> wrote:
> >
> > On Wed, 2023-10-18 at 20:14 +0300, Dragos Tatulea wrote:
> > > The current flow for updating an mr works directly on mvdev->mr which
> > > makes it cumbersome to handle multiple new mr structs.
> > >
> > > This patch makes the flow more straightforward by having
> > > mlx5_vdpa_create_mr return a new mr which will update the old mr (if
> > > any). The old mr will be deleted and unlinked from mvdev. For the case
> > > when the iotlb is empty (not NULL), the old mr will be cleared.
> > >
> > > This change paves the way for adding mrs for different ASIDs.
> > >
> > > The initialized bool is no longer needed as mr is now a pointer in the
> > > mlx5_vdpa_dev struct which will be NULL when not initialized.
> > >
> > > Acked-by: Eugenio Pérez <eperezma@xxxxxxxxxx>
> > > Acked-by: Jason Wang <jasowang@xxxxxxxxxx>
> > > Signed-off-by: Dragos Tatulea <dtatulea@xxxxxxxxxx>
> > > ---
> > >  drivers/vdpa/mlx5/core/mlx5_vdpa.h | 14 +++--
> > >  drivers/vdpa/mlx5/core/mr.c        | 87 ++++++++++++++++--------------
> > >  drivers/vdpa/mlx5/net/mlx5_vnet.c  | 53 +++++++++---------
> > >  3 files changed, 82 insertions(+), 72 deletions(-)
> > >
> > > diff --git a/drivers/vdpa/mlx5/core/mlx5_vdpa.h
> > > b/drivers/vdpa/mlx5/core/mlx5_vdpa.h
> > > index 9c6ac42c21e1..bbe4335106bd 100644
> > > --- a/drivers/vdpa/mlx5/core/mlx5_vdpa.h
> > > +++ b/drivers/vdpa/mlx5/core/mlx5_vdpa.h
> > > @@ -31,8 +31,6 @@ struct mlx5_vdpa_mr {
> > >         struct list_head head;
> > >         unsigned long num_directs;
> > >         unsigned long num_klms;
> > > -       /* state of dvq mr */
> > > -       bool initialized;
> > >
> > >         bool user_mr;
> > >  };
> > > @@ -91,7 +89,7 @@ struct mlx5_vdpa_dev {
> > >         u16 max_idx;
> > >         u32 generation;
> > >
> > > -       struct mlx5_vdpa_mr mr;
> > > +       struct mlx5_vdpa_mr *mr;
> > >         /* serialize mr access */
> > >         struct mutex mr_mtx;
> > >         struct mlx5_control_vq cvq;
> > > @@ -114,14 +112,14 @@ void mlx5_vdpa_free_resources(struct mlx5_vdpa_dev
> > > *mvdev);
> > >  int mlx5_vdpa_create_mkey(struct mlx5_vdpa_dev *mvdev, u32 *mkey, u32
> > > *in,
> > >                           int inlen);
> > >  int mlx5_vdpa_destroy_mkey(struct mlx5_vdpa_dev *mvdev, u32 mkey);
> > > -int mlx5_vdpa_handle_set_map(struct mlx5_vdpa_dev *mvdev, struct
> > > vhost_iotlb
> > > *iotlb,
> > > -                            bool *change_map, unsigned int asid);
> > > -int mlx5_vdpa_create_mr(struct mlx5_vdpa_dev *mvdev,
> > > -                       struct mlx5_vdpa_mr *mr,
> > > -                       struct vhost_iotlb *iotlb);
> > > +struct mlx5_vdpa_mr *mlx5_vdpa_create_mr(struct mlx5_vdpa_dev *mvdev,
> > > +                                        struct vhost_iotlb *iotlb);
> > >  void mlx5_vdpa_destroy_mr_resources(struct mlx5_vdpa_dev *mvdev);
> > >  void mlx5_vdpa_destroy_mr(struct mlx5_vdpa_dev *mvdev,
> > >                           struct mlx5_vdpa_mr *mr);
> > > +void mlx5_vdpa_update_mr(struct mlx5_vdpa_dev *mvdev,
> > > +                        struct mlx5_vdpa_mr *mr,
> > > +                        unsigned int asid);
> > >  int mlx5_vdpa_update_cvq_iotlb(struct mlx5_vdpa_dev *mvdev,
> > >                                 struct vhost_iotlb *iotlb,
> > >                                 unsigned int asid);
> > > diff --git a/drivers/vdpa/mlx5/core/mr.c b/drivers/vdpa/mlx5/core/mr.c
> > > index abd6a6fb122f..00eff5a07152 100644
> > > --- a/drivers/vdpa/mlx5/core/mr.c
> > > +++ b/drivers/vdpa/mlx5/core/mr.c
> > > @@ -495,30 +495,51 @@ static void destroy_user_mr(struct mlx5_vdpa_dev
> > > *mvdev,
> > > struct mlx5_vdpa_mr *mr
> > >
> > >  static void _mlx5_vdpa_destroy_mr(struct mlx5_vdpa_dev *mvdev, struct
> > > mlx5_vdpa_mr *mr)
> > >  {
> > > -       if (!mr->initialized)
> > > -               return;
> > > -
> > >         if (mr->user_mr)
> > >                 destroy_user_mr(mvdev, mr);
> > >         else
> > >                 destroy_dma_mr(mvdev, mr);
> > > -
> > > -       mr->initialized = false;
> > >  }
> > >
> > >  void mlx5_vdpa_destroy_mr(struct mlx5_vdpa_dev *mvdev,
> > >                           struct mlx5_vdpa_mr *mr)
> > >  {
> > > +       if (!mr)
> > > +               return;
> > > +
> > >         mutex_lock(&mvdev->mr_mtx);
> > >
> > >         _mlx5_vdpa_destroy_mr(mvdev, mr);
> > >
> > > +       if (mvdev->mr == mr)
> > > +               mvdev->mr = NULL;
> > > +
> > > +       mutex_unlock(&mvdev->mr_mtx);
> > > +
> > > +       kfree(mr);
> > > +}
> > > +
> > > +void mlx5_vdpa_update_mr(struct mlx5_vdpa_dev *mvdev,
> > > +                        struct mlx5_vdpa_mr *new_mr,
> > > +                        unsigned int asid)
> > > +{
> > > +       struct mlx5_vdpa_mr *old_mr = mvdev->mr;
> > > +
> > > +       mutex_lock(&mvdev->mr_mtx);
> > > +
> > > +       mvdev->mr = new_mr;
> > > +       if (old_mr) {
> > > +               _mlx5_vdpa_destroy_mr(mvdev, old_mr);
> > > +               kfree(old_mr);
> > > +       }
> > > +
> > >         mutex_unlock(&mvdev->mr_mtx);
> > > +
> > >  }
> > >
> > >  void mlx5_vdpa_destroy_mr_resources(struct mlx5_vdpa_dev *mvdev)
> > >  {
> > > -       mlx5_vdpa_destroy_mr(mvdev, &mvdev->mr);
> > > +       mlx5_vdpa_destroy_mr(mvdev, mvdev->mr);
> > >         prune_iotlb(mvdev);
> > >  }
> > >
> > > @@ -528,52 +549,36 @@ static int _mlx5_vdpa_create_mr(struct mlx5_vdpa_dev
> > > *mvdev,
> > >  {
> > >         int err;
> > >
> > > -       if (mr->initialized)
> > > -               return 0;
> > > -
> > >         if (iotlb)
> > >                 err = create_user_mr(mvdev, mr, iotlb);
> > >         else
> > >                 err = create_dma_mr(mvdev, mr);
> > >
> > > -       if (err)
> > > -               return err;
> > > -
> > > -       mr->initialized = true;
> > > -
> > > -       return 0;
> > > +       return err;
> > >  }
> > >
> > > -int mlx5_vdpa_create_mr(struct mlx5_vdpa_dev *mvdev,
> > > -                       struct mlx5_vdpa_mr *mr,
> > > -                       struct vhost_iotlb *iotlb)
> > > +struct mlx5_vdpa_mr *mlx5_vdpa_create_mr(struct mlx5_vdpa_dev *mvdev,
> > > +                                        struct vhost_iotlb *iotlb)
> > >  {
> > > +       struct mlx5_vdpa_mr *mr;
> > >         int err;
> > >
> > > +       mr = kzalloc(sizeof(*mr), GFP_KERNEL);
> > > +       if (!mr)
> > > +               return ERR_PTR(-ENOMEM);
> > > +
> > >         mutex_lock(&mvdev->mr_mtx);
> > >         err = _mlx5_vdpa_create_mr(mvdev, mr, iotlb);
> > >         mutex_unlock(&mvdev->mr_mtx);
> > >
> > > -       return err;
> > > -}
> > > -
> > > -int mlx5_vdpa_handle_set_map(struct mlx5_vdpa_dev *mvdev, struct
> > > vhost_iotlb
> > > *iotlb,
> > > -                            bool *change_map, unsigned int asid)
> > > -{
> > > -       struct mlx5_vdpa_mr *mr = &mvdev->mr;
> > > -       int err = 0;
> > > +       if (err)
> > > +               goto out_err;
> > >
> > > -       *change_map = false;
> > > -       mutex_lock(&mvdev->mr_mtx);
> > > -       if (mr->initialized) {
> > > -               mlx5_vdpa_info(mvdev, "memory map update\n");
> > > -               *change_map = true;
> > > -       }
> > > -       if (!*change_map)
> > > -               err = _mlx5_vdpa_create_mr(mvdev, mr, iotlb);
> > > -       mutex_unlock(&mvdev->mr_mtx);
> > > +       return mr;
> > >
> > > -       return err;
> > > +out_err:
> > > +       kfree(mr);
> > > +       return ERR_PTR(err);
> > >  }
> > >
> > >  int mlx5_vdpa_update_cvq_iotlb(struct mlx5_vdpa_dev *mvdev,
> > > @@ -597,11 +602,13 @@ int mlx5_vdpa_update_cvq_iotlb(struct mlx5_vdpa_dev
> > > *mvdev,
> > >
> > >  int mlx5_vdpa_create_dma_mr(struct mlx5_vdpa_dev *mvdev)
> > >  {
> > > -       int err;
> > > +       struct mlx5_vdpa_mr *mr;
> > >
> > > -       err = mlx5_vdpa_create_mr(mvdev, &mvdev->mr, NULL);
> > > -       if (err)
> > > -               return err;
> > > +       mr = mlx5_vdpa_create_mr(mvdev, NULL);
> > > +       if (IS_ERR(mr))
> > > +               return PTR_ERR(mr);
> > > +
> > > +       mlx5_vdpa_update_mr(mvdev, mr, 0);
> > >
> > >         return mlx5_vdpa_update_cvq_iotlb(mvdev, NULL, 0);
> > >  }
> > > diff --git a/drivers/vdpa/mlx5/net/mlx5_vnet.c
> > > b/drivers/vdpa/mlx5/net/mlx5_vnet.c
> > > index 256fdd80c321..7b878995b6aa 100644
> > > --- a/drivers/vdpa/mlx5/net/mlx5_vnet.c
> > > +++ b/drivers/vdpa/mlx5/net/mlx5_vnet.c
> > > @@ -873,7 +873,7 @@ static int create_virtqueue(struct mlx5_vdpa_net
> > > *ndev,
> > > struct mlx5_vdpa_virtque
> > >         MLX5_SET64(virtio_q, vq_ctx, desc_addr, mvq->desc_addr);
> > >         MLX5_SET64(virtio_q, vq_ctx, used_addr, mvq->device_addr);
> > >         MLX5_SET64(virtio_q, vq_ctx, available_addr, mvq->driver_addr);
> > > -       MLX5_SET(virtio_q, vq_ctx, virtio_q_mkey, ndev->mvdev.mr.mkey);
> > > +       MLX5_SET(virtio_q, vq_ctx, virtio_q_mkey, ndev->mvdev.mr->mkey);
> > >         MLX5_SET(virtio_q, vq_ctx, umem_1_id, mvq->umem1.id);
> > >         MLX5_SET(virtio_q, vq_ctx, umem_1_size, mvq->umem1.size);
> > >         MLX5_SET(virtio_q, vq_ctx, umem_2_id, mvq->umem2.id);
> > > @@ -2633,7 +2633,7 @@ static void restore_channels_info(struct
> > > mlx5_vdpa_net
> > > *ndev)
> > >  }
> > >
> > >  static int mlx5_vdpa_change_map(struct mlx5_vdpa_dev *mvdev,
> > > -                               struct vhost_iotlb *iotlb, unsigned int
> > > asid)
> > > +                               struct mlx5_vdpa_mr *new_mr, unsigned int
> > > asid)
> > >  {
> > >         struct mlx5_vdpa_net *ndev = to_mlx5_vdpa_ndev(mvdev);
> > >         int err;
> > > @@ -2641,27 +2641,18 @@ static int mlx5_vdpa_change_map(struct
> > > mlx5_vdpa_dev
> > > *mvdev,
> > >         suspend_vqs(ndev);
> > >         err = save_channels_info(ndev);
> > >         if (err)
> > > -               goto err_mr;
> > > +               return err;
> > >
> > >         teardown_driver(ndev);
> > > -       mlx5_vdpa_destroy_mr(mvdev, &mvdev->mr);
> > > -       err = mlx5_vdpa_create_mr(mvdev, &mvdev->mr, iotlb);
> > > -       if (err)
> > > -               goto err_mr;
> > > +
> > > +       mlx5_vdpa_update_mr(mvdev, new_mr, asid);
> > >
> > > >         if (!(mvdev->status & VIRTIO_CONFIG_S_DRIVER_OK) || mvdev->suspended)
> > > -               goto err_mr;
> > > +               return 0;
> > >
> > >         restore_channels_info(ndev);
> > >         err = setup_driver(mvdev);
> > > -       if (err)
> > > -               goto err_setup;
> > > -
> > > -       return 0;
> > >
> > > -err_setup:
> > > -       mlx5_vdpa_destroy_mr(mvdev, &mvdev->mr);
> > > -err_mr:
> > >         return err;
> > >  }
> > >
> > > @@ -2875,26 +2866,40 @@ static u32 mlx5_vdpa_get_generation(struct
> > > vdpa_device
> > > *vdev)
> > >  static int set_map_data(struct mlx5_vdpa_dev *mvdev, struct vhost_iotlb
> > > *iotlb,
> > >                         unsigned int asid)
> > >  {
> > > -       bool change_map;
> > > +       struct mlx5_vdpa_mr *new_mr;
> > >         int err;
> > >
> > >         if (mvdev->group2asid[MLX5_VDPA_DATAVQ_GROUP] != asid)
> > >                 goto end;
> > >
> > > -       err = mlx5_vdpa_handle_set_map(mvdev, iotlb, &change_map, asid);
> > > -       if (err) {
> > > -               mlx5_vdpa_warn(mvdev, "set map failed(%d)\n", err);
> > > -               return err;
> > > +       if (vhost_iotlb_itree_first(iotlb, 0, U64_MAX)) {
> > > +               new_mr = mlx5_vdpa_create_mr(mvdev, iotlb);
> > > +               if (IS_ERR(new_mr)) {
> > > +                       err = PTR_ERR(new_mr);
> > > +                       mlx5_vdpa_warn(mvdev, "create map failed(%d)\n",
> > > err);
> > > +                       return err;
> > > +               }
> > > +       } else {
> > > +               /* Empty iotlbs don't have an mr but will clear the
> > > previous
> > > mr. */
> > > +               new_mr = NULL;
> > >         }
> > Hi Jason and/or Eugenio, could you please have a quick look at the part of
> > this patch that changed?
> >
> > Thanks,
> > Dragos
> > >
> > > -       if (change_map) {
> > > -               err = mlx5_vdpa_change_map(mvdev, iotlb, asid);
> > > -               if (err)
> > > -                       return err;
> > > +       if (!mvdev->mr) {
> > > +               mlx5_vdpa_update_mr(mvdev, new_mr, asid);
> > > +       } else {
> > > +               err = mlx5_vdpa_change_map(mvdev, new_mr, asid);
> > > +               if (err) {
> > > +                       mlx5_vdpa_warn(mvdev, "change map failed(%d)\n",
> > > err);
> > > +                       goto out_err;
> > > +               }
> > >         }
> > >
> > >  end:
> > >         return mlx5_vdpa_update_cvq_iotlb(mvdev, iotlb, asid);
> > > +
> > > +out_err:
> > > +       mlx5_vdpa_destroy_mr(mvdev, new_mr);
>
> Is it possible to reach this mlx5_vdpa_destroy_mr call with new_mr ==
> NULL? Like:
> * iotlb does not have any entries
> * mvdev already has an mr
> * mlx5_vdpa_change_map fails
>
It could happen.

> If I'm not wrong, mlx5_vdpa_destroy_mr may dereference new_mr through
> _mlx5_vdpa_destroy_mr -> vhost_iotlb_free(mr->iotlb).
>
mlx5_vdpa_destroy_mr checks for mr being NULL first.

The only other place where _mlx5_vdpa_destroy_mr gets called is
mlx5_vdpa_update_mr, and there it is called on the old mr only if that mr
exists (i.e. it is not NULL).

This looks safe to me.

Thanks,
Dragos

> Am I missing something?
>
> Thanks!
>
>
>
>
> > > +       return err;
> > >  }
> > >
> > >  static int mlx5_vdpa_set_map(struct vdpa_device *vdev, unsigned int asid,
> >
>