Re: [PATCH for-rc] RDMA/rxe: Fix QP cleanup flow

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]

 



On Fri, Jun 12, 2020 at 04:32:51PM +0800, Zhu Yanjun wrote:
> On Fri, Jun 12, 2020 at 4:31 PM Yanjun Zhu <yanjunz@xxxxxxxxxxxx> wrote:
> >
> >
> >
> > -----Original Message-----
> > From: Kamal Heib <kamalheib1@xxxxxxxxx>
> > Sent: Wednesday, June 3, 2020 6:18 PM
> > To: linux-rdma@xxxxxxxxxxxxxxx
> > Cc: Doug Ledford <dledford@xxxxxxxxxx>; Jason Gunthorpe <jgg@xxxxxxxx>; Yanjun Zhu <yanjunz@xxxxxxxxxxxx>; Kamal Heib <kamalheib1@xxxxxxxxx>
> > Subject: [PATCH for-rc] RDMA/rxe: Fix QP cleanup flow
> >
> > Avoid releasing the socket associated with each QP in rxe_qp_cleanup(), which can sleep, and move it to rxe_destroy_qp() instead. After doing this, there is no need for the execute_work that was used to avoid calling
> > rxe_qp_cleanup() directly. Also check that the socket is valid in
> > rxe_skb_tx_dtor() to avoid use-after-free.
> >
> > Fixes: 8700e3e7c485 ("Soft RoCE driver")
> > Fixes: bb3ffb7ad48a ("RDMA/rxe: Fix rxe_qp_cleanup()")
> > Signed-off-by: Kamal Heib <kamalheib1@xxxxxxxxx>
> > ---
> >  drivers/infiniband/sw/rxe/rxe_net.c   | 14 ++++++++++++--
> >  drivers/infiniband/sw/rxe/rxe_qp.c    | 22 ++++++----------------
> >  drivers/infiniband/sw/rxe/rxe_verbs.h |  3 ---
> >  3 files changed, 18 insertions(+), 21 deletions(-)
> >
> > diff --git a/drivers/infiniband/sw/rxe/rxe_net.c b/drivers/infiniband/sw/rxe/rxe_net.c
> > index 312c2fc961c0..298ccd3fd3e2 100644
> > --- a/drivers/infiniband/sw/rxe/rxe_net.c
> > +++ b/drivers/infiniband/sw/rxe/rxe_net.c
> > @@ -411,8 +411,18 @@ int rxe_prepare(struct rxe_pkt_info *pkt, struct sk_buff *skb, u32 *crc)  static void rxe_skb_tx_dtor(struct sk_buff *skb)  {
> >         struct sock *sk = skb->sk;
> > -       struct rxe_qp *qp = sk->sk_user_data;
> > -       int skb_out = atomic_dec_return(&qp->skb_out);
> > +       struct rxe_qp *qp;
> > +       int skb_out;
> > +
> > +       if (!sk)
> 
> When does sk become NULL?
>
It looks like the sk isn't set to NULL when it gets released. This change
will require more work; please drop this patch.

Thanks,
Kamal

> > +               return;
> > +
> > +       qp = sk->sk_user_data;
> > +
> > +       if (!qp)
> 
> When does qp become NULL?
> 
> > +               return;
> > +
> > +       skb_out = atomic_dec_return(&qp->skb_out);
> >
> >         if (unlikely(qp->need_req_skb &&
> >                      skb_out < RXE_INFLIGHT_SKBS_PER_QP_LOW)) diff --git a/drivers/infiniband/sw/rxe/rxe_qp.c b/drivers/infiniband/sw/rxe/rxe_qp.c
> > index 6c11c3aeeca6..89dac6c1111c 100644
> > --- a/drivers/infiniband/sw/rxe/rxe_qp.c
> > +++ b/drivers/infiniband/sw/rxe/rxe_qp.c
> > @@ -787,6 +787,7 @@ void rxe_qp_destroy(struct rxe_qp *qp)
> >         if (qp_type(qp) == IB_QPT_RC) {
> >                 del_timer_sync(&qp->retrans_timer);
> >                 del_timer_sync(&qp->rnr_nak_timer);
> > +               sk_dst_reset(qp->sk->sk);
> >         }
> >
> >         rxe_cleanup_task(&qp->req.task);
> > @@ -798,12 +799,15 @@ void rxe_qp_destroy(struct rxe_qp *qp)
> >                 __rxe_do_task(&qp->comp.task);
> >                 __rxe_do_task(&qp->req.task);
> >         }
> > +
> > +       kernel_sock_shutdown(qp->sk, SHUT_RDWR);
> > +       sock_release(qp->sk);
> >  }
> >
> >  /* called when the last reference to the qp is dropped */ -static void rxe_qp_do_cleanup(struct work_struct *work)
> > +void rxe_qp_cleanup(struct rxe_pool_entry *arg)
> >  {
> > -       struct rxe_qp *qp = container_of(work, typeof(*qp), cleanup_work.work);
> > +       struct rxe_qp *qp = container_of(arg, typeof(*qp), pelem);
> >
> >         rxe_drop_all_mcast_groups(qp);
> >
> > @@ -828,19 +832,5 @@ static void rxe_qp_do_cleanup(struct work_struct *work)
> >                 qp->resp.mr = NULL;
> >         }
> >
> > -       if (qp_type(qp) == IB_QPT_RC)
> > -               sk_dst_reset(qp->sk->sk);
> > -
> >         free_rd_atomic_resources(qp);
> > -
> > -       kernel_sock_shutdown(qp->sk, SHUT_RDWR);
> > -       sock_release(qp->sk);
> > -}
> > -
> > -/* called when the last reference to the qp is dropped */ -void rxe_qp_cleanup(struct rxe_pool_entry *arg) -{
> > -       struct rxe_qp *qp = container_of(arg, typeof(*qp), pelem);
> > -
> > -       execute_in_process_context(rxe_qp_do_cleanup, &qp->cleanup_work);
> >  }
> > diff --git a/drivers/infiniband/sw/rxe/rxe_verbs.h b/drivers/infiniband/sw/rxe/rxe_verbs.h
> > index 92de39c4a7c1..339debaf095f 100644
> > --- a/drivers/infiniband/sw/rxe/rxe_verbs.h
> > +++ b/drivers/infiniband/sw/rxe/rxe_verbs.h
> > @@ -35,7 +35,6 @@
> >  #define RXE_VERBS_H
> >
> >  #include <linux/interrupt.h>
> > -#include <linux/workqueue.h>
> >  #include <rdma/rdma_user_rxe.h>
> >  #include "rxe_pool.h"
> >  #include "rxe_task.h"
> > @@ -285,8 +284,6 @@ struct rxe_qp {
> >         struct timer_list rnr_nak_timer;
> >
> >         spinlock_t              state_lock; /* guard requester and completer */
> > -
> > -       struct execute_work     cleanup_work;
> >  };
> >
> >  enum rxe_mem_state {
> > --
> > 2.25.4
> >



[Index of Archives]     [Linux USB Devel]     [Video for Linux]     [Linux Audio Users]     [Photo]     [Yosemite News]     [Yosemite Photos]     [Linux Kernel]     [Linux SCSI]     [XFree86]

  Powered by Linux