RDMA/mlx5: Move all WR logic from qp.c to separate file
author    Leon Romanovsky <leonro@mellanox.com>    Wed, 6 May 2020 06:55:13 +0000 (09:55 +0300)
committer Jason Gunthorpe <jgg@mellanox.com>       Wed, 6 May 2020 20:42:45 +0000 (17:42 -0300)
Split qp.c by moving all WR logic to a separate file.
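
The callers visible in this diff imply a wr.h interface along the
following lines. This is a sketch inferred from the names in the patch,
not the contents of the new wr.h; mlx5_ib_post_recv_drain in particular
is assumed by symmetry with the send-side drain helper shown below:

#ifndef _MLX5_IB_WR_H
#define _MLX5_IB_WR_H

#include <rdma/ib_verbs.h>

/* ib_device_ops callbacks wired up in the main.c hunk below */
int mlx5_ib_post_send_nodrain(struct ib_qp *ibqp, const struct ib_send_wr *wr,
			      const struct ib_send_wr **bad_wr);
int mlx5_ib_post_recv_nodrain(struct ib_qp *ibqp, const struct ib_recv_wr *wr,
			      const struct ib_recv_wr **bad_wr);

/* drain variants called by mlx5_ib_drain_sq()/mlx5_ib_drain_rq(); they
 * keep posting even when the device is in internal-error state.
 */
int mlx5_ib_post_send_drain(struct ib_qp *ibqp, const struct ib_send_wr *wr,
			    const struct ib_send_wr **bad_wr);
int mlx5_ib_post_recv_drain(struct ib_qp *ibqp, const struct ib_recv_wr *wr,
			    const struct ib_recv_wr **bad_wr);

#endif /* _MLX5_IB_WR_H */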

Link: https://lore.kernel.org/r/20200506065513.4668-4-leon@kernel.org
Signed-off-by: Leon Romanovsky <leonro@mellanox.com>
Signed-off-by: Jason Gunthorpe <jgg@mellanox.com>
drivers/infiniband/hw/mlx5/Makefile
drivers/infiniband/hw/mlx5/main.c
drivers/infiniband/hw/mlx5/mlx5_ib.h
drivers/infiniband/hw/mlx5/qp.c
drivers/infiniband/hw/mlx5/wr.c [new file with mode: 0644]
drivers/infiniband/hw/mlx5/wr.h [new file with mode: 0644]

diff --git a/drivers/infiniband/hw/mlx5/Makefile b/drivers/infiniband/hw/mlx5/Makefile
index 228be05..8cca61c 100644
--- a/drivers/infiniband/hw/mlx5/Makefile
+++ b/drivers/infiniband/hw/mlx5/Makefile
@@ -16,7 +16,8 @@ mlx5_ib-y := ah.o \
             qpc.o \
             restrack.o \
             srq.o \
-            srq_cmd.o
+            srq_cmd.o \
+            wr.o
 
 mlx5_ib-$(CONFIG_INFINIBAND_ON_DEMAND_PAGING) += odp.o
 mlx5_ib-$(CONFIG_MLX5_ESWITCH) += ib_rep.o
diff --git a/drivers/infiniband/hw/mlx5/main.c b/drivers/infiniband/hw/mlx5/main.c
index 0c0fbf4..40bf71e 100644
--- a/drivers/infiniband/hw/mlx5/main.c
+++ b/drivers/infiniband/hw/mlx5/main.c
@@ -61,6 +61,7 @@
 #include "cmd.h"
 #include "srq.h"
 #include "qp.h"
+#include "wr.h"
 #include <linux/mlx5/fs_helpers.h>
 #include <linux/mlx5/accel.h>
 #include <rdma/uverbs_std_types.h>
@@ -6657,8 +6658,8 @@ static const struct ib_device_ops mlx5_ib_dev_ops = {
        .modify_qp = mlx5_ib_modify_qp,
        .modify_srq = mlx5_ib_modify_srq,
        .poll_cq = mlx5_ib_poll_cq,
-       .post_recv = mlx5_ib_post_recv,
-       .post_send = mlx5_ib_post_send,
+       .post_recv = mlx5_ib_post_recv_nodrain,
+       .post_send = mlx5_ib_post_send_nodrain,
        .post_srq_recv = mlx5_ib_post_srq_recv,
        .process_mad = mlx5_ib_process_mad,
        .query_ah = mlx5_ib_query_ah,
diff --git a/drivers/infiniband/hw/mlx5/mlx5_ib.h b/drivers/infiniband/hw/mlx5/mlx5_ib.h
index 3041808..482b54e 100644
--- a/drivers/infiniband/hw/mlx5/mlx5_ib.h
+++ b/drivers/infiniband/hw/mlx5/mlx5_ib.h
@@ -1178,10 +1178,6 @@ int mlx5_ib_query_qp(struct ib_qp *ibqp, struct ib_qp_attr *qp_attr, int qp_attr
 int mlx5_ib_destroy_qp(struct ib_qp *qp, struct ib_udata *udata);
 void mlx5_ib_drain_sq(struct ib_qp *qp);
 void mlx5_ib_drain_rq(struct ib_qp *qp);
-int mlx5_ib_post_send(struct ib_qp *ibqp, const struct ib_send_wr *wr,
-                     const struct ib_send_wr **bad_wr);
-int mlx5_ib_post_recv(struct ib_qp *ibqp, const struct ib_recv_wr *wr,
-                     const struct ib_recv_wr **bad_wr);
 int mlx5_ib_read_wqe_sq(struct mlx5_ib_qp *qp, int wqe_index, void *buffer,
                        size_t buflen, size_t *bc);
 int mlx5_ib_read_wqe_rq(struct mlx5_ib_qp *qp, int wqe_index, void *buffer,
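
The removed qp.c code below shows the pattern wr.c presumably keeps: one
worker taking a drain flag, fronted by thin wrappers. The nodrain body is
taken from the removed mlx5_ib_post_send(); the drain body is the natural
reading of the drain_sq hunk at the end of this diff (a sketch, not the
actual wr.c contents):

#include <rdma/ib_verbs.h>

/* the worker is the removed _mlx5_ib_post_send(), moved as-is */
int _mlx5_ib_post_send(struct ib_qp *ibqp, const struct ib_send_wr *wr,
		       const struct ib_send_wr **bad_wr, bool drain);

/* The drain flag lets mlx5_ib_drain_sq()/drain_rq() keep posting WRs after
 * the device enters MLX5_DEVICE_STATE_INTERNAL_ERROR; the nodrain wrapper,
 * used as the ib_device_ops callback, fails such posts with -EIO (see the
 * check at the top of _mlx5_ib_post_send() in the removed code below).
 */
int mlx5_ib_post_send_nodrain(struct ib_qp *ibqp, const struct ib_send_wr *wr,
			      const struct ib_send_wr **bad_wr)
{
	return _mlx5_ib_post_send(ibqp, wr, bad_wr, false);
}

int mlx5_ib_post_send_drain(struct ib_qp *ibqp, const struct ib_send_wr *wr,
			    const struct ib_send_wr **bad_wr)
{
	return _mlx5_ib_post_send(ibqp, wr, bad_wr, true);
}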
diff --git a/drivers/infiniband/hw/mlx5/qp.c b/drivers/infiniband/hw/mlx5/qp.c
index 1e3dcfd..fb2ea3b 100644
--- a/drivers/infiniband/hw/mlx5/qp.c
+++ b/drivers/infiniband/hw/mlx5/qp.c
@@ -40,6 +40,7 @@
 #include "ib_rep.h"
 #include "cmd.h"
 #include "qp.h"
+#include "wr.h"
 
 enum {
        MLX5_IB_ACK_REQ_FREQ    = 8,
@@ -52,32 +53,6 @@ enum {
        MLX5_IB_LINK_TYPE_ETH           = 1
 };
 
-enum {
-       MLX5_IB_SQ_STRIDE       = 6,
-       MLX5_IB_SQ_UMR_INLINE_THRESHOLD = 64,
-};
-
-static const u32 mlx5_ib_opcode[] = {
-       [IB_WR_SEND]                            = MLX5_OPCODE_SEND,
-       [IB_WR_LSO]                             = MLX5_OPCODE_LSO,
-       [IB_WR_SEND_WITH_IMM]                   = MLX5_OPCODE_SEND_IMM,
-       [IB_WR_RDMA_WRITE]                      = MLX5_OPCODE_RDMA_WRITE,
-       [IB_WR_RDMA_WRITE_WITH_IMM]             = MLX5_OPCODE_RDMA_WRITE_IMM,
-       [IB_WR_RDMA_READ]                       = MLX5_OPCODE_RDMA_READ,
-       [IB_WR_ATOMIC_CMP_AND_SWP]              = MLX5_OPCODE_ATOMIC_CS,
-       [IB_WR_ATOMIC_FETCH_AND_ADD]            = MLX5_OPCODE_ATOMIC_FA,
-       [IB_WR_SEND_WITH_INV]                   = MLX5_OPCODE_SEND_INVAL,
-       [IB_WR_LOCAL_INV]                       = MLX5_OPCODE_UMR,
-       [IB_WR_REG_MR]                          = MLX5_OPCODE_UMR,
-       [IB_WR_MASKED_ATOMIC_CMP_AND_SWP]       = MLX5_OPCODE_ATOMIC_MASKED_CS,
-       [IB_WR_MASKED_ATOMIC_FETCH_AND_ADD]     = MLX5_OPCODE_ATOMIC_MASKED_FA,
-       [MLX5_IB_WR_UMR]                        = MLX5_OPCODE_UMR,
-};
-
-struct mlx5_wqe_eth_pad {
-       u8 rsvd0[16];
-};
-
 enum raw_qp_set_mask_map {
        MLX5_RAW_QP_MOD_SET_RQ_Q_CTR_ID         = 1UL << 0,
        MLX5_RAW_QP_RATE_LIMIT                  = 1UL << 1,
@@ -1061,30 +1036,6 @@ static void destroy_qp(struct mlx5_ib_dev *dev, struct mlx5_ib_qp *qp,
                mlx5_frag_buf_free(dev->mdev, &qp->buf);
 }
 
-/* get_sq_edge - Get the next nearby edge.
- *
- * An 'edge' is defined as the first following address after the end
- * of the fragment or the SQ. Accordingly, during the WQE construction
- * which repetitively increases the pointer to write the next data, it
- * simply should check if it gets to an edge.
- *
- * @sq - SQ buffer.
- * @idx - Stride index in the SQ buffer.
- *
- * Return:
- *     The new edge.
- */
-static void *get_sq_edge(struct mlx5_ib_wq *sq, u32 idx)
-{
-       void *fragment_end;
-
-       fragment_end = mlx5_frag_buf_get_wqe
-               (&sq->fbc,
-                mlx5_frag_buf_get_idx_last_contig_stride(&sq->fbc, idx));
-
-       return fragment_end + MLX5_SEND_WQE_BB;
-}
-
 static int _create_kernel_qp(struct mlx5_ib_dev *dev,
                             struct ib_qp_init_attr *init_attr,
                             struct mlx5_ib_qp *qp, u32 **in, int *inlen,
@@ -2335,11 +2286,6 @@ static void mlx5_ib_unlock_cqs(struct mlx5_ib_cq *send_cq, struct mlx5_ib_cq *re
        }
 }
 
-static struct mlx5_ib_pd *get_pd(struct mlx5_ib_qp *qp)
-{
-       return to_mpd(qp->ibqp.pd);
-}
-
 static void get_cqs(enum ib_qp_type qp_type,
                    struct ib_cq *ib_send_cq, struct ib_cq *ib_recv_cq,
                    struct mlx5_ib_cq **send_cq, struct mlx5_ib_cq **recv_cq)
@@ -3758,7 +3704,7 @@ static int __mlx5_ib_modify_qp(struct ib_qp *ibqp,
        if (!context)
                return -ENOMEM;
 
-       pd = get_pd(qp);
+       pd = to_mpd(qp->ibqp.pd);
        context->flags = cpu_to_be32(mlx5_st << 16);
 
        if (!(attr_mask & IB_QP_PATH_MIG_STATE)) {
@@ -4286,1494 +4232,6 @@ out:
        return err;
 }
 
-static void _handle_post_send_edge(struct mlx5_ib_wq *sq, void **seg,
-                                  u32 wqe_sz, void **cur_edge)
-{
-       u32 idx;
-
-       idx = (sq->cur_post + (wqe_sz >> 2)) & (sq->wqe_cnt - 1);
-       *cur_edge = get_sq_edge(sq, idx);
-
-       *seg = mlx5_frag_buf_get_wqe(&sq->fbc, idx);
-}
-
-/* handle_post_send_edge - Check if we get to SQ edge. If yes, update to the
- * next nearby edge and get new address translation for current WQE position.
- * @sq - SQ buffer.
- * @seg: Current WQE position (16B aligned).
- * @wqe_sz: Total current WQE size [16B].
- * @cur_edge: Updated current edge.
- */
-static inline void handle_post_send_edge(struct mlx5_ib_wq *sq, void **seg,
-                                        u32 wqe_sz, void **cur_edge)
-{
-       if (likely(*seg != *cur_edge))
-               return;
-
-       _handle_post_send_edge(sq, seg, wqe_sz, cur_edge);
-}
-
-/* memcpy_send_wqe - copy data from src to WQE and update the relevant WQ's
- * pointers. At the end @seg is aligned to 16B regardless the copied size.
- * @sq - SQ buffer.
- * @cur_edge: Updated current edge.
- * @seg: Current WQE position (16B aligned).
- * @wqe_sz: Total current WQE size [16B].
- * @src: Pointer to copy from.
- * @n: Number of bytes to copy.
- */
-static inline void memcpy_send_wqe(struct mlx5_ib_wq *sq, void **cur_edge,
-                                  void **seg, u32 *wqe_sz, const void *src,
-                                  size_t n)
-{
-       while (likely(n)) {
-               size_t leftlen = *cur_edge - *seg;
-               size_t copysz = min_t(size_t, leftlen, n);
-               size_t stride;
-
-               memcpy(*seg, src, copysz);
-
-               n -= copysz;
-               src += copysz;
-               stride = !n ? ALIGN(copysz, 16) : copysz;
-               *seg += stride;
-               *wqe_sz += stride >> 4;
-               handle_post_send_edge(sq, seg, *wqe_sz, cur_edge);
-       }
-}
-
-static int mlx5_wq_overflow(struct mlx5_ib_wq *wq, int nreq, struct ib_cq *ib_cq)
-{
-       struct mlx5_ib_cq *cq;
-       unsigned cur;
-
-       cur = wq->head - wq->tail;
-       if (likely(cur + nreq < wq->max_post))
-               return 0;
-
-       cq = to_mcq(ib_cq);
-       spin_lock(&cq->lock);
-       cur = wq->head - wq->tail;
-       spin_unlock(&cq->lock);
-
-       return cur + nreq >= wq->max_post;
-}
-
-static __always_inline void set_raddr_seg(struct mlx5_wqe_raddr_seg *rseg,
-                                         u64 remote_addr, u32 rkey)
-{
-       rseg->raddr    = cpu_to_be64(remote_addr);
-       rseg->rkey     = cpu_to_be32(rkey);
-       rseg->reserved = 0;
-}
-
-static void set_eth_seg(const struct ib_send_wr *wr, struct mlx5_ib_qp *qp,
-                       void **seg, int *size, void **cur_edge)
-{
-       struct mlx5_wqe_eth_seg *eseg = *seg;
-
-       memset(eseg, 0, sizeof(struct mlx5_wqe_eth_seg));
-
-       if (wr->send_flags & IB_SEND_IP_CSUM)
-               eseg->cs_flags = MLX5_ETH_WQE_L3_CSUM |
-                                MLX5_ETH_WQE_L4_CSUM;
-
-       if (wr->opcode == IB_WR_LSO) {
-               struct ib_ud_wr *ud_wr = container_of(wr, struct ib_ud_wr, wr);
-               size_t left, copysz;
-               void *pdata = ud_wr->header;
-               size_t stride;
-
-               left = ud_wr->hlen;
-               eseg->mss = cpu_to_be16(ud_wr->mss);
-               eseg->inline_hdr.sz = cpu_to_be16(left);
-
-               /* memcpy_send_wqe should get a 16B align address. Hence, we
-                * first copy up to the current edge and then, if needed,
-                * fall-through to memcpy_send_wqe.
-                */
-               copysz = min_t(u64, *cur_edge - (void *)eseg->inline_hdr.start,
-                              left);
-               memcpy(eseg->inline_hdr.start, pdata, copysz);
-               stride = ALIGN(sizeof(struct mlx5_wqe_eth_seg) -
-                              sizeof(eseg->inline_hdr.start) + copysz, 16);
-               *size += stride / 16;
-               *seg += stride;
-
-               if (copysz < left) {
-                       handle_post_send_edge(&qp->sq, seg, *size, cur_edge);
-                       left -= copysz;
-                       pdata += copysz;
-                       memcpy_send_wqe(&qp->sq, cur_edge, seg, size, pdata,
-                                       left);
-               }
-
-               return;
-       }
-
-       *seg += sizeof(struct mlx5_wqe_eth_seg);
-       *size += sizeof(struct mlx5_wqe_eth_seg) / 16;
-}
-
-static void set_datagram_seg(struct mlx5_wqe_datagram_seg *dseg,
-                            const struct ib_send_wr *wr)
-{
-       memcpy(&dseg->av, &to_mah(ud_wr(wr)->ah)->av, sizeof(struct mlx5_av));
-       dseg->av.dqp_dct = cpu_to_be32(ud_wr(wr)->remote_qpn | MLX5_EXTENDED_UD_AV);
-       dseg->av.key.qkey.qkey = cpu_to_be32(ud_wr(wr)->remote_qkey);
-}
-
-static void set_data_ptr_seg(struct mlx5_wqe_data_seg *dseg, struct ib_sge *sg)
-{
-       dseg->byte_count = cpu_to_be32(sg->length);
-       dseg->lkey       = cpu_to_be32(sg->lkey);
-       dseg->addr       = cpu_to_be64(sg->addr);
-}
-
-static u64 get_xlt_octo(u64 bytes)
-{
-       return ALIGN(bytes, MLX5_IB_UMR_XLT_ALIGNMENT) /
-              MLX5_IB_UMR_OCTOWORD;
-}
-
-static __be64 frwr_mkey_mask(bool atomic)
-{
-       u64 result;
-
-       result = MLX5_MKEY_MASK_LEN             |
-               MLX5_MKEY_MASK_PAGE_SIZE        |
-               MLX5_MKEY_MASK_START_ADDR       |
-               MLX5_MKEY_MASK_EN_RINVAL        |
-               MLX5_MKEY_MASK_KEY              |
-               MLX5_MKEY_MASK_LR               |
-               MLX5_MKEY_MASK_LW               |
-               MLX5_MKEY_MASK_RR               |
-               MLX5_MKEY_MASK_RW               |
-               MLX5_MKEY_MASK_SMALL_FENCE      |
-               MLX5_MKEY_MASK_FREE;
-
-       if (atomic)
-               result |= MLX5_MKEY_MASK_A;
-
-       return cpu_to_be64(result);
-}
-
-static __be64 sig_mkey_mask(void)
-{
-       u64 result;
-
-       result = MLX5_MKEY_MASK_LEN             |
-               MLX5_MKEY_MASK_PAGE_SIZE        |
-               MLX5_MKEY_MASK_START_ADDR       |
-               MLX5_MKEY_MASK_EN_SIGERR        |
-               MLX5_MKEY_MASK_EN_RINVAL        |
-               MLX5_MKEY_MASK_KEY              |
-               MLX5_MKEY_MASK_LR               |
-               MLX5_MKEY_MASK_LW               |
-               MLX5_MKEY_MASK_RR               |
-               MLX5_MKEY_MASK_RW               |
-               MLX5_MKEY_MASK_SMALL_FENCE      |
-               MLX5_MKEY_MASK_FREE             |
-               MLX5_MKEY_MASK_BSF_EN;
-
-       return cpu_to_be64(result);
-}
-
-static void set_reg_umr_seg(struct mlx5_wqe_umr_ctrl_seg *umr,
-                           struct mlx5_ib_mr *mr, u8 flags, bool atomic)
-{
-       int size = (mr->ndescs + mr->meta_ndescs) * mr->desc_size;
-
-       memset(umr, 0, sizeof(*umr));
-
-       umr->flags = flags;
-       umr->xlt_octowords = cpu_to_be16(get_xlt_octo(size));
-       umr->mkey_mask = frwr_mkey_mask(atomic);
-}
-
-static void set_linv_umr_seg(struct mlx5_wqe_umr_ctrl_seg *umr)
-{
-       memset(umr, 0, sizeof(*umr));
-       umr->mkey_mask = cpu_to_be64(MLX5_MKEY_MASK_FREE);
-       umr->flags = MLX5_UMR_INLINE;
-}
-
-static __be64 get_umr_enable_mr_mask(void)
-{
-       u64 result;
-
-       result = MLX5_MKEY_MASK_KEY |
-                MLX5_MKEY_MASK_FREE;
-
-       return cpu_to_be64(result);
-}
-
-static __be64 get_umr_disable_mr_mask(void)
-{
-       u64 result;
-
-       result = MLX5_MKEY_MASK_FREE;
-
-       return cpu_to_be64(result);
-}
-
-static __be64 get_umr_update_translation_mask(void)
-{
-       u64 result;
-
-       result = MLX5_MKEY_MASK_LEN |
-                MLX5_MKEY_MASK_PAGE_SIZE |
-                MLX5_MKEY_MASK_START_ADDR;
-
-       return cpu_to_be64(result);
-}
-
-static __be64 get_umr_update_access_mask(int atomic)
-{
-       u64 result;
-
-       result = MLX5_MKEY_MASK_LR |
-                MLX5_MKEY_MASK_LW |
-                MLX5_MKEY_MASK_RR |
-                MLX5_MKEY_MASK_RW;
-
-       if (atomic)
-               result |= MLX5_MKEY_MASK_A;
-
-       return cpu_to_be64(result);
-}
-
-static __be64 get_umr_update_pd_mask(void)
-{
-       u64 result;
-
-       result = MLX5_MKEY_MASK_PD;
-
-       return cpu_to_be64(result);
-}
-
-static int umr_check_mkey_mask(struct mlx5_ib_dev *dev, u64 mask)
-{
-       if ((mask & MLX5_MKEY_MASK_PAGE_SIZE &&
-            MLX5_CAP_GEN(dev->mdev, umr_modify_entity_size_disabled)) ||
-           (mask & MLX5_MKEY_MASK_A &&
-            MLX5_CAP_GEN(dev->mdev, umr_modify_atomic_disabled)))
-               return -EPERM;
-       return 0;
-}
-
-static int set_reg_umr_segment(struct mlx5_ib_dev *dev,
-                              struct mlx5_wqe_umr_ctrl_seg *umr,
-                              const struct ib_send_wr *wr, int atomic)
-{
-       const struct mlx5_umr_wr *umrwr = umr_wr(wr);
-
-       memset(umr, 0, sizeof(*umr));
-
-       if (!umrwr->ignore_free_state) {
-               if (wr->send_flags & MLX5_IB_SEND_UMR_FAIL_IF_FREE)
-                        /* fail if free */
-                       umr->flags = MLX5_UMR_CHECK_FREE;
-               else
-                       /* fail if not free */
-                       umr->flags = MLX5_UMR_CHECK_NOT_FREE;
-       }
-
-       umr->xlt_octowords = cpu_to_be16(get_xlt_octo(umrwr->xlt_size));
-       if (wr->send_flags & MLX5_IB_SEND_UMR_UPDATE_XLT) {
-               u64 offset = get_xlt_octo(umrwr->offset);
-
-               umr->xlt_offset = cpu_to_be16(offset & 0xffff);
-               umr->xlt_offset_47_16 = cpu_to_be32(offset >> 16);
-               umr->flags |= MLX5_UMR_TRANSLATION_OFFSET_EN;
-       }
-       if (wr->send_flags & MLX5_IB_SEND_UMR_UPDATE_TRANSLATION)
-               umr->mkey_mask |= get_umr_update_translation_mask();
-       if (wr->send_flags & MLX5_IB_SEND_UMR_UPDATE_PD_ACCESS) {
-               umr->mkey_mask |= get_umr_update_access_mask(atomic);
-               umr->mkey_mask |= get_umr_update_pd_mask();
-       }
-       if (wr->send_flags & MLX5_IB_SEND_UMR_ENABLE_MR)
-               umr->mkey_mask |= get_umr_enable_mr_mask();
-       if (wr->send_flags & MLX5_IB_SEND_UMR_DISABLE_MR)
-               umr->mkey_mask |= get_umr_disable_mr_mask();
-
-       if (!wr->num_sge)
-               umr->flags |= MLX5_UMR_INLINE;
-
-       return umr_check_mkey_mask(dev, be64_to_cpu(umr->mkey_mask));
-}
-
-static u8 get_umr_flags(int acc)
-{
-       return (acc & IB_ACCESS_REMOTE_ATOMIC ? MLX5_PERM_ATOMIC       : 0) |
-              (acc & IB_ACCESS_REMOTE_WRITE  ? MLX5_PERM_REMOTE_WRITE : 0) |
-              (acc & IB_ACCESS_REMOTE_READ   ? MLX5_PERM_REMOTE_READ  : 0) |
-              (acc & IB_ACCESS_LOCAL_WRITE   ? MLX5_PERM_LOCAL_WRITE  : 0) |
-               MLX5_PERM_LOCAL_READ | MLX5_PERM_UMR_EN;
-}
-
-static void set_reg_mkey_seg(struct mlx5_mkey_seg *seg,
-                            struct mlx5_ib_mr *mr,
-                            u32 key, int access)
-{
-       int ndescs = ALIGN(mr->ndescs + mr->meta_ndescs, 8) >> 1;
-
-       memset(seg, 0, sizeof(*seg));
-
-       if (mr->access_mode == MLX5_MKC_ACCESS_MODE_MTT)
-               seg->log2_page_size = ilog2(mr->ibmr.page_size);
-       else if (mr->access_mode == MLX5_MKC_ACCESS_MODE_KLMS)
-               /* KLMs take twice the size of MTTs */
-               ndescs *= 2;
-
-       seg->flags = get_umr_flags(access) | mr->access_mode;
-       seg->qpn_mkey7_0 = cpu_to_be32((key & 0xff) | 0xffffff00);
-       seg->flags_pd = cpu_to_be32(MLX5_MKEY_REMOTE_INVAL);
-       seg->start_addr = cpu_to_be64(mr->ibmr.iova);
-       seg->len = cpu_to_be64(mr->ibmr.length);
-       seg->xlt_oct_size = cpu_to_be32(ndescs);
-}
-
-static void set_linv_mkey_seg(struct mlx5_mkey_seg *seg)
-{
-       memset(seg, 0, sizeof(*seg));
-       seg->status = MLX5_MKEY_STATUS_FREE;
-}
-
-static void set_reg_mkey_segment(struct mlx5_mkey_seg *seg,
-                                const struct ib_send_wr *wr)
-{
-       const struct mlx5_umr_wr *umrwr = umr_wr(wr);
-
-       memset(seg, 0, sizeof(*seg));
-       if (wr->send_flags & MLX5_IB_SEND_UMR_DISABLE_MR)
-               seg->status = MLX5_MKEY_STATUS_FREE;
-
-       seg->flags = convert_access(umrwr->access_flags);
-       if (umrwr->pd)
-               seg->flags_pd = cpu_to_be32(to_mpd(umrwr->pd)->pdn);
-       if (wr->send_flags & MLX5_IB_SEND_UMR_UPDATE_TRANSLATION &&
-           !umrwr->length)
-               seg->flags_pd |= cpu_to_be32(MLX5_MKEY_LEN64);
-
-       seg->start_addr = cpu_to_be64(umrwr->virt_addr);
-       seg->len = cpu_to_be64(umrwr->length);
-       seg->log2_page_size = umrwr->page_shift;
-       seg->qpn_mkey7_0 = cpu_to_be32(0xffffff00 |
-                                      mlx5_mkey_variant(umrwr->mkey));
-}
-
-static void set_reg_data_seg(struct mlx5_wqe_data_seg *dseg,
-                            struct mlx5_ib_mr *mr,
-                            struct mlx5_ib_pd *pd)
-{
-       int bcount = mr->desc_size * (mr->ndescs + mr->meta_ndescs);
-
-       dseg->addr = cpu_to_be64(mr->desc_map);
-       dseg->byte_count = cpu_to_be32(ALIGN(bcount, 64));
-       dseg->lkey = cpu_to_be32(pd->ibpd.local_dma_lkey);
-}
-
-static __be32 send_ieth(const struct ib_send_wr *wr)
-{
-       switch (wr->opcode) {
-       case IB_WR_SEND_WITH_IMM:
-       case IB_WR_RDMA_WRITE_WITH_IMM:
-               return wr->ex.imm_data;
-
-       case IB_WR_SEND_WITH_INV:
-               return cpu_to_be32(wr->ex.invalidate_rkey);
-
-       default:
-               return 0;
-       }
-}
-
-static u8 calc_sig(void *wqe, int size)
-{
-       u8 *p = wqe;
-       u8 res = 0;
-       int i;
-
-       for (i = 0; i < size; i++)
-               res ^= p[i];
-
-       return ~res;
-}
-
-static u8 wq_sig(void *wqe)
-{
-       return calc_sig(wqe, (*((u8 *)wqe + 8) & 0x3f) << 4);
-}
-
-static int set_data_inl_seg(struct mlx5_ib_qp *qp, const struct ib_send_wr *wr,
-                           void **wqe, int *wqe_sz, void **cur_edge)
-{
-       struct mlx5_wqe_inline_seg *seg;
-       size_t offset;
-       int inl = 0;
-       int i;
-
-       seg = *wqe;
-       *wqe += sizeof(*seg);
-       offset = sizeof(*seg);
-
-       for (i = 0; i < wr->num_sge; i++) {
-               size_t len  = wr->sg_list[i].length;
-               void *addr = (void *)(unsigned long)(wr->sg_list[i].addr);
-
-               inl += len;
-
-               if (unlikely(inl > qp->max_inline_data))
-                       return -ENOMEM;
-
-               while (likely(len)) {
-                       size_t leftlen;
-                       size_t copysz;
-
-                       handle_post_send_edge(&qp->sq, wqe,
-                                             *wqe_sz + (offset >> 4),
-                                             cur_edge);
-
-                       leftlen = *cur_edge - *wqe;
-                       copysz = min_t(size_t, leftlen, len);
-
-                       memcpy(*wqe, addr, copysz);
-                       len -= copysz;
-                       addr += copysz;
-                       *wqe += copysz;
-                       offset += copysz;
-               }
-       }
-
-       seg->byte_count = cpu_to_be32(inl | MLX5_INLINE_SEG);
-
-       *wqe_sz +=  ALIGN(inl + sizeof(seg->byte_count), 16) / 16;
-
-       return 0;
-}
-
-static u16 prot_field_size(enum ib_signature_type type)
-{
-       switch (type) {
-       case IB_SIG_TYPE_T10_DIF:
-               return MLX5_DIF_SIZE;
-       default:
-               return 0;
-       }
-}
-
-static u8 bs_selector(int block_size)
-{
-       switch (block_size) {
-       case 512:           return 0x1;
-       case 520:           return 0x2;
-       case 4096:          return 0x3;
-       case 4160:          return 0x4;
-       case 1073741824:    return 0x5;
-       default:            return 0;
-       }
-}
-
-static void mlx5_fill_inl_bsf(struct ib_sig_domain *domain,
-                             struct mlx5_bsf_inl *inl)
-{
-       /* Valid inline section and allow BSF refresh */
-       inl->vld_refresh = cpu_to_be16(MLX5_BSF_INL_VALID |
-                                      MLX5_BSF_REFRESH_DIF);
-       inl->dif_apptag = cpu_to_be16(domain->sig.dif.app_tag);
-       inl->dif_reftag = cpu_to_be32(domain->sig.dif.ref_tag);
-       /* repeating block */
-       inl->rp_inv_seed = MLX5_BSF_REPEAT_BLOCK;
-       inl->sig_type = domain->sig.dif.bg_type == IB_T10DIF_CRC ?
-                       MLX5_DIF_CRC : MLX5_DIF_IPCS;
-
-       if (domain->sig.dif.ref_remap)
-               inl->dif_inc_ref_guard_check |= MLX5_BSF_INC_REFTAG;
-
-       if (domain->sig.dif.app_escape) {
-               if (domain->sig.dif.ref_escape)
-                       inl->dif_inc_ref_guard_check |= MLX5_BSF_APPREF_ESCAPE;
-               else
-                       inl->dif_inc_ref_guard_check |= MLX5_BSF_APPTAG_ESCAPE;
-       }
-
-       inl->dif_app_bitmask_check =
-               cpu_to_be16(domain->sig.dif.apptag_check_mask);
-}
-
-static int mlx5_set_bsf(struct ib_mr *sig_mr,
-                       struct ib_sig_attrs *sig_attrs,
-                       struct mlx5_bsf *bsf, u32 data_size)
-{
-       struct mlx5_core_sig_ctx *msig = to_mmr(sig_mr)->sig;
-       struct mlx5_bsf_basic *basic = &bsf->basic;
-       struct ib_sig_domain *mem = &sig_attrs->mem;
-       struct ib_sig_domain *wire = &sig_attrs->wire;
-
-       memset(bsf, 0, sizeof(*bsf));
-
-       /* Basic + Extended + Inline */
-       basic->bsf_size_sbs = 1 << 7;
-       /* Input domain check byte mask */
-       basic->check_byte_mask = sig_attrs->check_mask;
-       basic->raw_data_size = cpu_to_be32(data_size);
-
-       /* Memory domain */
-       switch (sig_attrs->mem.sig_type) {
-       case IB_SIG_TYPE_NONE:
-               break;
-       case IB_SIG_TYPE_T10_DIF:
-               basic->mem.bs_selector = bs_selector(mem->sig.dif.pi_interval);
-               basic->m_bfs_psv = cpu_to_be32(msig->psv_memory.psv_idx);
-               mlx5_fill_inl_bsf(mem, &bsf->m_inl);
-               break;
-       default:
-               return -EINVAL;
-       }
-
-       /* Wire domain */
-       switch (sig_attrs->wire.sig_type) {
-       case IB_SIG_TYPE_NONE:
-               break;
-       case IB_SIG_TYPE_T10_DIF:
-               if (mem->sig.dif.pi_interval == wire->sig.dif.pi_interval &&
-                   mem->sig_type == wire->sig_type) {
-                       /* Same block structure */
-                       basic->bsf_size_sbs |= 1 << 4;
-                       if (mem->sig.dif.bg_type == wire->sig.dif.bg_type)
-                               basic->wire.copy_byte_mask |= MLX5_CPY_GRD_MASK;
-                       if (mem->sig.dif.app_tag == wire->sig.dif.app_tag)
-                               basic->wire.copy_byte_mask |= MLX5_CPY_APP_MASK;
-                       if (mem->sig.dif.ref_tag == wire->sig.dif.ref_tag)
-                               basic->wire.copy_byte_mask |= MLX5_CPY_REF_MASK;
-               } else
-                       basic->wire.bs_selector = bs_selector(wire->sig.dif.pi_interval);
-
-               basic->w_bfs_psv = cpu_to_be32(msig->psv_wire.psv_idx);
-               mlx5_fill_inl_bsf(wire, &bsf->w_inl);
-               break;
-       default:
-               return -EINVAL;
-       }
-
-       return 0;
-}
-
-static int set_sig_data_segment(const struct ib_send_wr *send_wr,
-                               struct ib_mr *sig_mr,
-                               struct ib_sig_attrs *sig_attrs,
-                               struct mlx5_ib_qp *qp, void **seg, int *size,
-                               void **cur_edge)
-{
-       struct mlx5_bsf *bsf;
-       u32 data_len;
-       u32 data_key;
-       u64 data_va;
-       u32 prot_len = 0;
-       u32 prot_key = 0;
-       u64 prot_va = 0;
-       bool prot = false;
-       int ret;
-       int wqe_size;
-       struct mlx5_ib_mr *mr = to_mmr(sig_mr);
-       struct mlx5_ib_mr *pi_mr = mr->pi_mr;
-
-       data_len = pi_mr->data_length;
-       data_key = pi_mr->ibmr.lkey;
-       data_va = pi_mr->data_iova;
-       if (pi_mr->meta_ndescs) {
-               prot_len = pi_mr->meta_length;
-               prot_key = pi_mr->ibmr.lkey;
-               prot_va = pi_mr->pi_iova;
-               prot = true;
-       }
-
-       if (!prot || (data_key == prot_key && data_va == prot_va &&
-                     data_len == prot_len)) {
-               /**
-                * Source domain doesn't contain signature information
-                * or data and protection are interleaved in memory.
-                * So need construct:
-                *                  ------------------
-                *                 |     data_klm     |
-                *                  ------------------
-                *                 |       BSF        |
-                *                  ------------------
-                **/
-               struct mlx5_klm *data_klm = *seg;
-
-               data_klm->bcount = cpu_to_be32(data_len);
-               data_klm->key = cpu_to_be32(data_key);
-               data_klm->va = cpu_to_be64(data_va);
-               wqe_size = ALIGN(sizeof(*data_klm), 64);
-       } else {
-               /**
-                * Source domain contains signature information
-                * So need construct a strided block format:
-                *               ---------------------------
-                *              |     stride_block_ctrl     |
-                *               ---------------------------
-                *              |          data_klm         |
-                *               ---------------------------
-                *              |          prot_klm         |
-                *               ---------------------------
-                *              |             BSF           |
-                *               ---------------------------
-                **/
-               struct mlx5_stride_block_ctrl_seg *sblock_ctrl;
-               struct mlx5_stride_block_entry *data_sentry;
-               struct mlx5_stride_block_entry *prot_sentry;
-               u16 block_size = sig_attrs->mem.sig.dif.pi_interval;
-               int prot_size;
-
-               sblock_ctrl = *seg;
-               data_sentry = (void *)sblock_ctrl + sizeof(*sblock_ctrl);
-               prot_sentry = (void *)data_sentry + sizeof(*data_sentry);
-
-               prot_size = prot_field_size(sig_attrs->mem.sig_type);
-               if (!prot_size) {
-                       pr_err("Bad block size given: %u\n", block_size);
-                       return -EINVAL;
-               }
-               sblock_ctrl->bcount_per_cycle = cpu_to_be32(block_size +
-                                                           prot_size);
-               sblock_ctrl->op = cpu_to_be32(MLX5_STRIDE_BLOCK_OP);
-               sblock_ctrl->repeat_count = cpu_to_be32(data_len / block_size);
-               sblock_ctrl->num_entries = cpu_to_be16(2);
-
-               data_sentry->bcount = cpu_to_be16(block_size);
-               data_sentry->key = cpu_to_be32(data_key);
-               data_sentry->va = cpu_to_be64(data_va);
-               data_sentry->stride = cpu_to_be16(block_size);
-
-               prot_sentry->bcount = cpu_to_be16(prot_size);
-               prot_sentry->key = cpu_to_be32(prot_key);
-               prot_sentry->va = cpu_to_be64(prot_va);
-               prot_sentry->stride = cpu_to_be16(prot_size);
-
-               wqe_size = ALIGN(sizeof(*sblock_ctrl) + sizeof(*data_sentry) +
-                                sizeof(*prot_sentry), 64);
-       }
-
-       *seg += wqe_size;
-       *size += wqe_size / 16;
-       handle_post_send_edge(&qp->sq, seg, *size, cur_edge);
-
-       bsf = *seg;
-       ret = mlx5_set_bsf(sig_mr, sig_attrs, bsf, data_len);
-       if (ret)
-               return -EINVAL;
-
-       *seg += sizeof(*bsf);
-       *size += sizeof(*bsf) / 16;
-       handle_post_send_edge(&qp->sq, seg, *size, cur_edge);
-
-       return 0;
-}
-
-static void set_sig_mkey_segment(struct mlx5_mkey_seg *seg,
-                                struct ib_mr *sig_mr, int access_flags,
-                                u32 size, u32 length, u32 pdn)
-{
-       u32 sig_key = sig_mr->rkey;
-       u8 sigerr = to_mmr(sig_mr)->sig->sigerr_count & 1;
-
-       memset(seg, 0, sizeof(*seg));
-
-       seg->flags = get_umr_flags(access_flags) | MLX5_MKC_ACCESS_MODE_KLMS;
-       seg->qpn_mkey7_0 = cpu_to_be32((sig_key & 0xff) | 0xffffff00);
-       seg->flags_pd = cpu_to_be32(MLX5_MKEY_REMOTE_INVAL | sigerr << 26 |
-                                   MLX5_MKEY_BSF_EN | pdn);
-       seg->len = cpu_to_be64(length);
-       seg->xlt_oct_size = cpu_to_be32(get_xlt_octo(size));
-       seg->bsfs_octo_size = cpu_to_be32(MLX5_MKEY_BSF_OCTO_SIZE);
-}
-
-static void set_sig_umr_segment(struct mlx5_wqe_umr_ctrl_seg *umr,
-                               u32 size)
-{
-       memset(umr, 0, sizeof(*umr));
-
-       umr->flags = MLX5_FLAGS_INLINE | MLX5_FLAGS_CHECK_FREE;
-       umr->xlt_octowords = cpu_to_be16(get_xlt_octo(size));
-       umr->bsf_octowords = cpu_to_be16(MLX5_MKEY_BSF_OCTO_SIZE);
-       umr->mkey_mask = sig_mkey_mask();
-}
-
-static int set_pi_umr_wr(const struct ib_send_wr *send_wr,
-                        struct mlx5_ib_qp *qp, void **seg, int *size,
-                        void **cur_edge)
-{
-       const struct ib_reg_wr *wr = reg_wr(send_wr);
-       struct mlx5_ib_mr *sig_mr = to_mmr(wr->mr);
-       struct mlx5_ib_mr *pi_mr = sig_mr->pi_mr;
-       struct ib_sig_attrs *sig_attrs = sig_mr->ibmr.sig_attrs;
-       u32 pdn = get_pd(qp)->pdn;
-       u32 xlt_size;
-       int region_len, ret;
-
-       if (unlikely(send_wr->num_sge != 0) ||
-           unlikely(wr->access & IB_ACCESS_REMOTE_ATOMIC) ||
-           unlikely(!sig_mr->sig) || unlikely(!qp->ibqp.integrity_en) ||
-           unlikely(!sig_mr->sig->sig_status_checked))
-               return -EINVAL;
-
-       /* length of the protected region, data + protection */
-       region_len = pi_mr->ibmr.length;
-
-       /**
-        * KLM octoword size - if protection was provided
-        * then we use strided block format (3 octowords),
-        * else we use single KLM (1 octoword)
-        **/
-       if (sig_attrs->mem.sig_type != IB_SIG_TYPE_NONE)
-               xlt_size = 0x30;
-       else
-               xlt_size = sizeof(struct mlx5_klm);
-
-       set_sig_umr_segment(*seg, xlt_size);
-       *seg += sizeof(struct mlx5_wqe_umr_ctrl_seg);
-       *size += sizeof(struct mlx5_wqe_umr_ctrl_seg) / 16;
-       handle_post_send_edge(&qp->sq, seg, *size, cur_edge);
-
-       set_sig_mkey_segment(*seg, wr->mr, wr->access, xlt_size, region_len,
-                            pdn);
-       *seg += sizeof(struct mlx5_mkey_seg);
-       *size += sizeof(struct mlx5_mkey_seg) / 16;
-       handle_post_send_edge(&qp->sq, seg, *size, cur_edge);
-
-       ret = set_sig_data_segment(send_wr, wr->mr, sig_attrs, qp, seg, size,
-                                  cur_edge);
-       if (ret)
-               return ret;
-
-       sig_mr->sig->sig_status_checked = false;
-       return 0;
-}
-
-static int set_psv_wr(struct ib_sig_domain *domain,
-                     u32 psv_idx, void **seg, int *size)
-{
-       struct mlx5_seg_set_psv *psv_seg = *seg;
-
-       memset(psv_seg, 0, sizeof(*psv_seg));
-       psv_seg->psv_num = cpu_to_be32(psv_idx);
-       switch (domain->sig_type) {
-       case IB_SIG_TYPE_NONE:
-               break;
-       case IB_SIG_TYPE_T10_DIF:
-               psv_seg->transient_sig = cpu_to_be32(domain->sig.dif.bg << 16 |
-                                                    domain->sig.dif.app_tag);
-               psv_seg->ref_tag = cpu_to_be32(domain->sig.dif.ref_tag);
-               break;
-       default:
-               pr_err("Bad signature type (%d) is given.\n",
-                      domain->sig_type);
-               return -EINVAL;
-       }
-
-       *seg += sizeof(*psv_seg);
-       *size += sizeof(*psv_seg) / 16;
-
-       return 0;
-}
-
-static int set_reg_wr(struct mlx5_ib_qp *qp,
-                     const struct ib_reg_wr *wr,
-                     void **seg, int *size, void **cur_edge,
-                     bool check_not_free)
-{
-       struct mlx5_ib_mr *mr = to_mmr(wr->mr);
-       struct mlx5_ib_pd *pd = to_mpd(qp->ibqp.pd);
-       struct mlx5_ib_dev *dev = to_mdev(pd->ibpd.device);
-       int mr_list_size = (mr->ndescs + mr->meta_ndescs) * mr->desc_size;
-       bool umr_inline = mr_list_size <= MLX5_IB_SQ_UMR_INLINE_THRESHOLD;
-       bool atomic = wr->access & IB_ACCESS_REMOTE_ATOMIC;
-       u8 flags = 0;
-
-       if (!mlx5_ib_can_use_umr(dev, atomic, wr->access)) {
-               mlx5_ib_warn(to_mdev(qp->ibqp.device),
-                            "Fast update of %s for MR is disabled\n",
-                            (MLX5_CAP_GEN(dev->mdev,
-                                          umr_modify_entity_size_disabled)) ?
-                                    "entity size" :
-                                    "atomic access");
-               return -EINVAL;
-       }
-
-       if (unlikely(wr->wr.send_flags & IB_SEND_INLINE)) {
-               mlx5_ib_warn(to_mdev(qp->ibqp.device),
-                            "Invalid IB_SEND_INLINE send flag\n");
-               return -EINVAL;
-       }
-
-       if (check_not_free)
-               flags |= MLX5_UMR_CHECK_NOT_FREE;
-       if (umr_inline)
-               flags |= MLX5_UMR_INLINE;
-
-       set_reg_umr_seg(*seg, mr, flags, atomic);
-       *seg += sizeof(struct mlx5_wqe_umr_ctrl_seg);
-       *size += sizeof(struct mlx5_wqe_umr_ctrl_seg) / 16;
-       handle_post_send_edge(&qp->sq, seg, *size, cur_edge);
-
-       set_reg_mkey_seg(*seg, mr, wr->key, wr->access);
-       *seg += sizeof(struct mlx5_mkey_seg);
-       *size += sizeof(struct mlx5_mkey_seg) / 16;
-       handle_post_send_edge(&qp->sq, seg, *size, cur_edge);
-
-       if (umr_inline) {
-               memcpy_send_wqe(&qp->sq, cur_edge, seg, size, mr->descs,
-                               mr_list_size);
-               *size = ALIGN(*size, MLX5_SEND_WQE_BB >> 4);
-       } else {
-               set_reg_data_seg(*seg, mr, pd);
-               *seg += sizeof(struct mlx5_wqe_data_seg);
-               *size += (sizeof(struct mlx5_wqe_data_seg) / 16);
-       }
-       return 0;
-}
-
-static void set_linv_wr(struct mlx5_ib_qp *qp, void **seg, int *size,
-                       void **cur_edge)
-{
-       set_linv_umr_seg(*seg);
-       *seg += sizeof(struct mlx5_wqe_umr_ctrl_seg);
-       *size += sizeof(struct mlx5_wqe_umr_ctrl_seg) / 16;
-       handle_post_send_edge(&qp->sq, seg, *size, cur_edge);
-       set_linv_mkey_seg(*seg);
-       *seg += sizeof(struct mlx5_mkey_seg);
-       *size += sizeof(struct mlx5_mkey_seg) / 16;
-       handle_post_send_edge(&qp->sq, seg, *size, cur_edge);
-}
-
-static void dump_wqe(struct mlx5_ib_qp *qp, u32 idx, int size_16)
-{
-       __be32 *p = NULL;
-       int i, j;
-
-       pr_debug("dump WQE index %u:\n", idx);
-       for (i = 0, j = 0; i < size_16 * 4; i += 4, j += 4) {
-               if ((i & 0xf) == 0) {
-                       p = mlx5_frag_buf_get_wqe(&qp->sq.fbc, idx);
-                       pr_debug("WQBB at %p:\n", (void *)p);
-                       j = 0;
-                       idx = (idx + 1) & (qp->sq.wqe_cnt - 1);
-               }
-               pr_debug("%08x %08x %08x %08x\n", be32_to_cpu(p[j]),
-                        be32_to_cpu(p[j + 1]), be32_to_cpu(p[j + 2]),
-                        be32_to_cpu(p[j + 3]));
-       }
-}
-
-static int __begin_wqe(struct mlx5_ib_qp *qp, void **seg,
-                      struct mlx5_wqe_ctrl_seg **ctrl,
-                      const struct ib_send_wr *wr, unsigned int *idx,
-                      int *size, void **cur_edge, int nreq,
-                      bool send_signaled, bool solicited)
-{
-       if (unlikely(mlx5_wq_overflow(&qp->sq, nreq, qp->ibqp.send_cq)))
-               return -ENOMEM;
-
-       *idx = qp->sq.cur_post & (qp->sq.wqe_cnt - 1);
-       *seg = mlx5_frag_buf_get_wqe(&qp->sq.fbc, *idx);
-       *ctrl = *seg;
-       *(uint32_t *)(*seg + 8) = 0;
-       (*ctrl)->imm = send_ieth(wr);
-       (*ctrl)->fm_ce_se = qp->sq_signal_bits |
-               (send_signaled ? MLX5_WQE_CTRL_CQ_UPDATE : 0) |
-               (solicited ? MLX5_WQE_CTRL_SOLICITED : 0);
-
-       *seg += sizeof(**ctrl);
-       *size = sizeof(**ctrl) / 16;
-       *cur_edge = qp->sq.cur_edge;
-
-       return 0;
-}
-
-static int begin_wqe(struct mlx5_ib_qp *qp, void **seg,
-                    struct mlx5_wqe_ctrl_seg **ctrl,
-                    const struct ib_send_wr *wr, unsigned *idx,
-                    int *size, void **cur_edge, int nreq)
-{
-       return __begin_wqe(qp, seg, ctrl, wr, idx, size, cur_edge, nreq,
-                          wr->send_flags & IB_SEND_SIGNALED,
-                          wr->send_flags & IB_SEND_SOLICITED);
-}
-
-static void finish_wqe(struct mlx5_ib_qp *qp,
-                      struct mlx5_wqe_ctrl_seg *ctrl,
-                      void *seg, u8 size, void *cur_edge,
-                      unsigned int idx, u64 wr_id, int nreq, u8 fence,
-                      u32 mlx5_opcode)
-{
-       u8 opmod = 0;
-
-       ctrl->opmod_idx_opcode = cpu_to_be32(((u32)(qp->sq.cur_post) << 8) |
-                                            mlx5_opcode | ((u32)opmod << 24));
-       ctrl->qpn_ds = cpu_to_be32(size | (qp->trans_qp.base.mqp.qpn << 8));
-       ctrl->fm_ce_se |= fence;
-       if (unlikely(qp->flags_en & MLX5_QP_FLAG_SIGNATURE))
-               ctrl->signature = wq_sig(ctrl);
-
-       qp->sq.wrid[idx] = wr_id;
-       qp->sq.w_list[idx].opcode = mlx5_opcode;
-       qp->sq.wqe_head[idx] = qp->sq.head + nreq;
-       qp->sq.cur_post += DIV_ROUND_UP(size * 16, MLX5_SEND_WQE_BB);
-       qp->sq.w_list[idx].next = qp->sq.cur_post;
-
-       /* We save the edge which was possibly updated during the WQE
-        * construction, into SQ's cache.
-        */
-       seg = PTR_ALIGN(seg, MLX5_SEND_WQE_BB);
-       qp->sq.cur_edge = (unlikely(seg == cur_edge)) ?
-                         get_sq_edge(&qp->sq, qp->sq.cur_post &
-                                     (qp->sq.wqe_cnt - 1)) :
-                         cur_edge;
-}
-
-static void handle_rdma_op(const struct ib_send_wr *wr, void **seg, int *size)
-{
-       set_raddr_seg(*seg, rdma_wr(wr)->remote_addr, rdma_wr(wr)->rkey);
-       *seg += sizeof(struct mlx5_wqe_raddr_seg);
-       *size += sizeof(struct mlx5_wqe_raddr_seg) / 16;
-}
-
-static void handle_local_inv(struct mlx5_ib_qp *qp, const struct ib_send_wr *wr,
-                            struct mlx5_wqe_ctrl_seg **ctrl, void **seg,
-                            int *size, void **cur_edge, unsigned int idx)
-{
-       qp->sq.wr_data[idx] = IB_WR_LOCAL_INV;
-       (*ctrl)->imm = cpu_to_be32(wr->ex.invalidate_rkey);
-       set_linv_wr(qp, seg, size, cur_edge);
-}
-
-static int handle_reg_mr(struct mlx5_ib_qp *qp, const struct ib_send_wr *wr,
-                        struct mlx5_wqe_ctrl_seg **ctrl, void **seg, int *size,
-                        void **cur_edge, unsigned int idx)
-{
-       qp->sq.wr_data[idx] = IB_WR_REG_MR;
-       (*ctrl)->imm = cpu_to_be32(reg_wr(wr)->key);
-       return set_reg_wr(qp, reg_wr(wr), seg, size, cur_edge, true);
-}
-
-static int handle_psv(struct mlx5_ib_dev *dev, struct mlx5_ib_qp *qp,
-                     const struct ib_send_wr *wr,
-                     struct mlx5_wqe_ctrl_seg **ctrl, void **seg, int *size,
-                     void **cur_edge, unsigned int *idx, int nreq,
-                     struct ib_sig_domain *domain, u32 psv_index,
-                     u8 next_fence)
-{
-       int err;
-
-       /*
-        * SET_PSV WQEs are not signaled and solicited on error.
-        */
-       err = __begin_wqe(qp, seg, ctrl, wr, idx, size, cur_edge, nreq,
-                         false, true);
-       if (unlikely(err)) {
-               mlx5_ib_warn(dev, "\n");
-               err = -ENOMEM;
-               goto out;
-       }
-       err = set_psv_wr(domain, psv_index, seg, size);
-       if (unlikely(err)) {
-               mlx5_ib_warn(dev, "\n");
-               goto out;
-       }
-       finish_wqe(qp, *ctrl, *seg, *size, *cur_edge, *idx, wr->wr_id, nreq,
-                  next_fence, MLX5_OPCODE_SET_PSV);
-
-out:
-       return err;
-}
-
-static int handle_reg_mr_integrity(struct mlx5_ib_dev *dev,
-               struct mlx5_ib_qp *qp, const struct ib_send_wr *wr,
-               struct mlx5_wqe_ctrl_seg **ctrl, void **seg, int *size,
-               void **cur_edge, unsigned int *idx, int nreq, u8 fence,
-               u8 next_fence)
-{
-       struct mlx5_ib_mr *mr;
-       struct mlx5_ib_mr *pi_mr;
-       struct mlx5_ib_mr pa_pi_mr;
-       struct ib_sig_attrs *sig_attrs;
-       struct ib_reg_wr reg_pi_wr;
-       int err;
-
-       qp->sq.wr_data[*idx] = IB_WR_REG_MR_INTEGRITY;
-
-       mr = to_mmr(reg_wr(wr)->mr);
-       pi_mr = mr->pi_mr;
-
-       if (pi_mr) {
-               memset(&reg_pi_wr, 0,
-                      sizeof(struct ib_reg_wr));
-
-               reg_pi_wr.mr = &pi_mr->ibmr;
-               reg_pi_wr.access = reg_wr(wr)->access;
-               reg_pi_wr.key = pi_mr->ibmr.rkey;
-
-               (*ctrl)->imm = cpu_to_be32(reg_pi_wr.key);
-               /* UMR for data + prot registration */
-               err = set_reg_wr(qp, &reg_pi_wr, seg, size, cur_edge, false);
-               if (unlikely(err))
-                       goto out;
-
-               finish_wqe(qp, *ctrl, *seg, *size, *cur_edge, *idx, wr->wr_id,
-                          nreq, fence, MLX5_OPCODE_UMR);
-
-               err = begin_wqe(qp, seg, ctrl, wr, idx, size, cur_edge, nreq);
-               if (unlikely(err)) {
-                       mlx5_ib_warn(dev, "\n");
-                       err = -ENOMEM;
-                       goto out;
-               }
-       } else {
-               memset(&pa_pi_mr, 0, sizeof(struct mlx5_ib_mr));
-               /* No UMR, use local_dma_lkey */
-               pa_pi_mr.ibmr.lkey = mr->ibmr.pd->local_dma_lkey;
-               pa_pi_mr.ndescs = mr->ndescs;
-               pa_pi_mr.data_length = mr->data_length;
-               pa_pi_mr.data_iova = mr->data_iova;
-               if (mr->meta_ndescs) {
-                       pa_pi_mr.meta_ndescs = mr->meta_ndescs;
-                       pa_pi_mr.meta_length = mr->meta_length;
-                       pa_pi_mr.pi_iova = mr->pi_iova;
-               }
-
-               pa_pi_mr.ibmr.length = mr->ibmr.length;
-               mr->pi_mr = &pa_pi_mr;
-       }
-       (*ctrl)->imm = cpu_to_be32(mr->ibmr.rkey);
-       /* UMR for sig MR */
-       err = set_pi_umr_wr(wr, qp, seg, size, cur_edge);
-       if (unlikely(err)) {
-               mlx5_ib_warn(dev, "\n");
-               goto out;
-       }
-       finish_wqe(qp, *ctrl, *seg, *size, *cur_edge, *idx, wr->wr_id, nreq,
-                  fence, MLX5_OPCODE_UMR);
-
-       sig_attrs = mr->ibmr.sig_attrs;
-       err = handle_psv(dev, qp, wr, ctrl, seg, size, cur_edge, idx, nreq,
-                        &sig_attrs->mem, mr->sig->psv_memory.psv_idx,
-                        next_fence);
-       if (unlikely(err))
-               goto out;
-
-       err = handle_psv(dev, qp, wr, ctrl, seg, size, cur_edge, idx, nreq,
-                        &sig_attrs->wire, mr->sig->psv_wire.psv_idx,
-                        next_fence);
-       if (unlikely(err))
-               goto out;
-
-       qp->next_fence = MLX5_FENCE_MODE_INITIATOR_SMALL;
-
-out:
-       return err;
-}
-
-static int handle_qpt_rc(struct mlx5_ib_dev *dev, struct mlx5_ib_qp *qp,
-                        const struct ib_send_wr *wr,
-                        struct mlx5_wqe_ctrl_seg **ctrl, void **seg, int *size,
-                        void **cur_edge, unsigned int *idx, int nreq, u8 fence,
-                        u8 next_fence, int *num_sge)
-{
-       int err = 0;
-
-       switch (wr->opcode) {
-       case IB_WR_RDMA_READ:
-       case IB_WR_RDMA_WRITE:
-       case IB_WR_RDMA_WRITE_WITH_IMM:
-               handle_rdma_op(wr, seg, size);
-               break;
-
-       case IB_WR_ATOMIC_CMP_AND_SWP:
-       case IB_WR_ATOMIC_FETCH_AND_ADD:
-       case IB_WR_MASKED_ATOMIC_CMP_AND_SWP:
-               mlx5_ib_warn(dev, "Atomic operations are not supported yet\n");
-               err = -EOPNOTSUPP;
-               goto out;
-
-       case IB_WR_LOCAL_INV:
-               handle_local_inv(qp, wr, ctrl, seg, size, cur_edge, *idx);
-               *num_sge = 0;
-               break;
-
-       case IB_WR_REG_MR:
-               err = handle_reg_mr(qp, wr, ctrl, seg, size, cur_edge, *idx);
-               if (unlikely(err))
-                       goto out;
-               *num_sge = 0;
-               break;
-
-       case IB_WR_REG_MR_INTEGRITY:
-               err = handle_reg_mr_integrity(dev, qp, wr, ctrl, seg, size,
-                                             cur_edge, idx, nreq, fence,
-                                             next_fence);
-               if (unlikely(err))
-                       goto out;
-               *num_sge = 0;
-               break;
-
-       default:
-               break;
-       }
-
-out:
-       return err;
-}
-
-static void handle_qpt_uc(const struct ib_send_wr *wr, void **seg, int *size)
-{
-       switch (wr->opcode) {
-       case IB_WR_RDMA_WRITE:
-       case IB_WR_RDMA_WRITE_WITH_IMM:
-               handle_rdma_op(wr, seg, size);
-               break;
-       default:
-               break;
-       }
-}
-
-static void handle_qpt_hw_gsi(struct mlx5_ib_qp *qp,
-                             const struct ib_send_wr *wr, void **seg,
-                             int *size, void **cur_edge)
-{
-       set_datagram_seg(*seg, wr);
-       *seg += sizeof(struct mlx5_wqe_datagram_seg);
-       *size += sizeof(struct mlx5_wqe_datagram_seg) / 16;
-       handle_post_send_edge(&qp->sq, seg, *size, cur_edge);
-}
-
-static void handle_qpt_ud(struct mlx5_ib_qp *qp, const struct ib_send_wr *wr,
-                         void **seg, int *size, void **cur_edge)
-{
-       set_datagram_seg(*seg, wr);
-       *seg += sizeof(struct mlx5_wqe_datagram_seg);
-       *size += sizeof(struct mlx5_wqe_datagram_seg) / 16;
-       handle_post_send_edge(&qp->sq, seg, *size, cur_edge);
-
-       /* handle qp that supports ud offload */
-       if (qp->flags & IB_QP_CREATE_IPOIB_UD_LSO) {
-               struct mlx5_wqe_eth_pad *pad;
-
-               pad = *seg;
-               memset(pad, 0, sizeof(struct mlx5_wqe_eth_pad));
-               *seg += sizeof(struct mlx5_wqe_eth_pad);
-               *size += sizeof(struct mlx5_wqe_eth_pad) / 16;
-               set_eth_seg(wr, qp, seg, size, cur_edge);
-               handle_post_send_edge(&qp->sq, seg, *size, cur_edge);
-       }
-}
-
-static int handle_qpt_reg_umr(struct mlx5_ib_dev *dev, struct mlx5_ib_qp *qp,
-                             const struct ib_send_wr *wr,
-                             struct mlx5_wqe_ctrl_seg **ctrl, void **seg,
-                             int *size, void **cur_edge, unsigned int idx)
-{
-       int err = 0;
-
-       if (unlikely(wr->opcode != MLX5_IB_WR_UMR)) {
-               err = -EINVAL;
-               mlx5_ib_warn(dev, "bad opcode %d\n", wr->opcode);
-               goto out;
-       }
-
-       qp->sq.wr_data[idx] = MLX5_IB_WR_UMR;
-       (*ctrl)->imm = cpu_to_be32(umr_wr(wr)->mkey);
-       err = set_reg_umr_segment(dev, *seg, wr,
-                                 !!(MLX5_CAP_GEN(dev->mdev, atomic)));
-       if (unlikely(err))
-               goto out;
-       *seg += sizeof(struct mlx5_wqe_umr_ctrl_seg);
-       *size += sizeof(struct mlx5_wqe_umr_ctrl_seg) / 16;
-       handle_post_send_edge(&qp->sq, seg, *size, cur_edge);
-       set_reg_mkey_segment(*seg, wr);
-       *seg += sizeof(struct mlx5_mkey_seg);
-       *size += sizeof(struct mlx5_mkey_seg) / 16;
-       handle_post_send_edge(&qp->sq, seg, *size, cur_edge);
-out:
-       return err;
-}
-
-static int _mlx5_ib_post_send(struct ib_qp *ibqp, const struct ib_send_wr *wr,
-                             const struct ib_send_wr **bad_wr, bool drain)
-{
-       struct mlx5_wqe_ctrl_seg *ctrl = NULL;  /* compiler warning */
-       struct mlx5_ib_dev *dev = to_mdev(ibqp->device);
-       struct mlx5_core_dev *mdev = dev->mdev;
-       struct mlx5_ib_qp *qp;
-       struct mlx5_wqe_xrc_seg *xrc;
-       struct mlx5_bf *bf;
-       void *cur_edge;
-       int uninitialized_var(size);
-       unsigned long flags;
-       unsigned idx;
-       int err = 0;
-       int num_sge;
-       void *seg;
-       int nreq;
-       int i;
-       u8 next_fence = 0;
-       u8 fence;
-
-       if (unlikely(mdev->state == MLX5_DEVICE_STATE_INTERNAL_ERROR &&
-                    !drain)) {
-               *bad_wr = wr;
-               return -EIO;
-       }
-
-       if (unlikely(ibqp->qp_type == IB_QPT_GSI))
-               return mlx5_ib_gsi_post_send(ibqp, wr, bad_wr);
-
-       qp = to_mqp(ibqp);
-       bf = &qp->bf;
-
-       spin_lock_irqsave(&qp->sq.lock, flags);
-
-       for (nreq = 0; wr; nreq++, wr = wr->next) {
-               if (unlikely(wr->opcode >= ARRAY_SIZE(mlx5_ib_opcode))) {
-                       mlx5_ib_warn(dev, "\n");
-                       err = -EINVAL;
-                       *bad_wr = wr;
-                       goto out;
-               }
-
-               num_sge = wr->num_sge;
-               if (unlikely(num_sge > qp->sq.max_gs)) {
-                       mlx5_ib_warn(dev, "\n");
-                       err = -EINVAL;
-                       *bad_wr = wr;
-                       goto out;
-               }
-
-               err = begin_wqe(qp, &seg, &ctrl, wr, &idx, &size, &cur_edge,
-                               nreq);
-               if (err) {
-                       mlx5_ib_warn(dev, "\n");
-                       err = -ENOMEM;
-                       *bad_wr = wr;
-                       goto out;
-               }
-
-               if (wr->opcode == IB_WR_REG_MR ||
-                   wr->opcode == IB_WR_REG_MR_INTEGRITY) {
-                       fence = dev->umr_fence;
-                       next_fence = MLX5_FENCE_MODE_INITIATOR_SMALL;
-               } else  {
-                       if (wr->send_flags & IB_SEND_FENCE) {
-                               if (qp->next_fence)
-                                       fence = MLX5_FENCE_MODE_SMALL_AND_FENCE;
-                               else
-                                       fence = MLX5_FENCE_MODE_FENCE;
-                       } else {
-                               fence = qp->next_fence;
-                       }
-               }
-
-               switch (ibqp->qp_type) {
-               case IB_QPT_XRC_INI:
-                       xrc = seg;
-                       seg += sizeof(*xrc);
-                       size += sizeof(*xrc) / 16;
-                       /* fall through */
-               case IB_QPT_RC:
-                       err = handle_qpt_rc(dev, qp, wr, &ctrl, &seg, &size,
-                                           &cur_edge, &idx, nreq, fence,
-                                           next_fence, &num_sge);
-                       if (unlikely(err)) {
-                               *bad_wr = wr;
-                               goto out;
-                       } else if (wr->opcode == IB_WR_REG_MR_INTEGRITY) {
-                               goto skip_psv;
-                       }
-                       break;
-
-               case IB_QPT_UC:
-                       handle_qpt_uc(wr, &seg, &size);
-                       break;
-               case IB_QPT_SMI:
-                       if (unlikely(!mdev->port_caps[qp->port - 1].has_smi)) {
-                               mlx5_ib_warn(dev, "Send SMP MADs is not allowed\n");
-                               err = -EPERM;
-                               *bad_wr = wr;
-                               goto out;
-                       }
-                       /* fall through */
-               case MLX5_IB_QPT_HW_GSI:
-                       handle_qpt_hw_gsi(qp, wr, &seg, &size, &cur_edge);
-                       break;
-               case IB_QPT_UD:
-                       handle_qpt_ud(qp, wr, &seg, &size, &cur_edge);
-                       break;
-               case MLX5_IB_QPT_REG_UMR:
-                       err = handle_qpt_reg_umr(dev, qp, wr, &ctrl, &seg,
-                                                      &size, &cur_edge, idx);
-                       if (unlikely(err))
-                               goto out;
-                       break;
-
-               default:
-                       break;
-               }
-
-               if (wr->send_flags & IB_SEND_INLINE && num_sge) {
-                       err = set_data_inl_seg(qp, wr, &seg, &size, &cur_edge);
-                       if (unlikely(err)) {
-                               mlx5_ib_warn(dev, "\n");
-                               *bad_wr = wr;
-                               goto out;
-                       }
-               } else {
-                       for (i = 0; i < num_sge; i++) {
-                               handle_post_send_edge(&qp->sq, &seg, size,
-                                                     &cur_edge);
-                               if (likely(wr->sg_list[i].length)) {
-                                       set_data_ptr_seg
-                                       ((struct mlx5_wqe_data_seg *)seg,
-                                        wr->sg_list + i);
-                                       size += sizeof(struct mlx5_wqe_data_seg) / 16;
-                                       seg += sizeof(struct mlx5_wqe_data_seg);
-                               }
-                       }
-               }
-
-               qp->next_fence = next_fence;
-               finish_wqe(qp, ctrl, seg, size, cur_edge, idx, wr->wr_id, nreq,
-                          fence, mlx5_ib_opcode[wr->opcode]);
-skip_psv:
-               if (0)
-                       dump_wqe(qp, idx, size);
-       }
-
-out:
-       if (likely(nreq)) {
-               qp->sq.head += nreq;
-
-               /* Make sure that descriptors are written before
-                * updating doorbell record and ringing the doorbell
-                */
-               wmb();
-
-               qp->db.db[MLX5_SND_DBR] = cpu_to_be32(qp->sq.cur_post);
-
-               /* Make sure doorbell record is visible to the HCA before
-                * we hit doorbell */
-               wmb();
-
-               mlx5_write64((__be32 *)ctrl, bf->bfreg->map + bf->offset);
-               /* Make sure doorbells don't leak out of SQ spinlock
-                * and reach the HCA out of order.
-                */
-               bf->offset ^= bf->buf_size;
-       }
-
-       spin_unlock_irqrestore(&qp->sq.lock, flags);
-
-       return err;
-}
-
-int mlx5_ib_post_send(struct ib_qp *ibqp, const struct ib_send_wr *wr,
-                     const struct ib_send_wr **bad_wr)
-{
-       return _mlx5_ib_post_send(ibqp, wr, bad_wr, false);
-}
-
-static void set_sig_seg(struct mlx5_rwqe_sig *sig, int size)
-{
-       sig->signature = calc_sig(sig, size);
-}
-
-static int _mlx5_ib_post_recv(struct ib_qp *ibqp, const struct ib_recv_wr *wr,
-                     const struct ib_recv_wr **bad_wr, bool drain)
-{
-       struct mlx5_ib_qp *qp = to_mqp(ibqp);
-       struct mlx5_wqe_data_seg *scat;
-       struct mlx5_rwqe_sig *sig;
-       struct mlx5_ib_dev *dev = to_mdev(ibqp->device);
-       struct mlx5_core_dev *mdev = dev->mdev;
-       unsigned long flags;
-       int err = 0;
-       int nreq;
-       int ind;
-       int i;
-
-       if (unlikely(mdev->state == MLX5_DEVICE_STATE_INTERNAL_ERROR &&
-                    !drain)) {
-               *bad_wr = wr;
-               return -EIO;
-       }
-
-       if (unlikely(ibqp->qp_type == IB_QPT_GSI))
-               return mlx5_ib_gsi_post_recv(ibqp, wr, bad_wr);
-
-       spin_lock_irqsave(&qp->rq.lock, flags);
-
-       ind = qp->rq.head & (qp->rq.wqe_cnt - 1);
-
-       for (nreq = 0; wr; nreq++, wr = wr->next) {
-               if (mlx5_wq_overflow(&qp->rq, nreq, qp->ibqp.recv_cq)) {
-                       err = -ENOMEM;
-                       *bad_wr = wr;
-                       goto out;
-               }
-
-               if (unlikely(wr->num_sge > qp->rq.max_gs)) {
-                       err = -EINVAL;
-                       *bad_wr = wr;
-                       goto out;
-               }
-
-               scat = mlx5_frag_buf_get_wqe(&qp->rq.fbc, ind);
-               if (qp->flags_en & MLX5_QP_FLAG_SIGNATURE)
-                       scat++;
-
-               for (i = 0; i < wr->num_sge; i++)
-                       set_data_ptr_seg(scat + i, wr->sg_list + i);
-
-               if (i < qp->rq.max_gs) {
-                       scat[i].byte_count = 0;
-                       scat[i].lkey       = cpu_to_be32(MLX5_INVALID_LKEY);
-                       scat[i].addr       = 0;
-               }
-
-               if (qp->flags_en & MLX5_QP_FLAG_SIGNATURE) {
-                       sig = (struct mlx5_rwqe_sig *)scat;
-                       set_sig_seg(sig, (qp->rq.max_gs + 1) << 2);
-               }
-
-               qp->rq.wrid[ind] = wr->wr_id;
-
-               ind = (ind + 1) & (qp->rq.wqe_cnt - 1);
-       }
-
-out:
-       if (likely(nreq)) {
-               qp->rq.head += nreq;
-
-               /* Make sure that descriptors are written before
-                * doorbell record.
-                */
-               wmb();
-
-               *qp->db.db = cpu_to_be32(qp->rq.head & 0xffff);
-       }
-
-       spin_unlock_irqrestore(&qp->rq.lock, flags);
-
-       return err;
-}
-
-int mlx5_ib_post_recv(struct ib_qp *ibqp, const struct ib_recv_wr *wr,
-                     const struct ib_recv_wr **bad_wr)
-{
-       return _mlx5_ib_post_recv(ibqp, wr, bad_wr, false);
-}
-
 static inline enum ib_qp_state to_ib_qp_state(enum mlx5_qp_state mlx5_state)
 {
        switch (mlx5_state) {
@@ -6808,7 +5266,7 @@ void mlx5_ib_drain_sq(struct ib_qp *qp)
        sdrain.cqe.done = mlx5_ib_drain_qp_done;
        init_completion(&sdrain.done);
 
-       ret = _mlx5_ib_post_send(qp, &swr.wr, &bad_swr, true);
+       ret = mlx5_ib_post_send_drain(qp, &swr.wr, &bad_swr);
        if (ret) {
                WARN_ONCE(ret, "failed to drain send queue: %d\n", ret);
                return;
@@ -6838,7 +5296,7 @@ void mlx5_ib_drain_rq(struct ib_qp *qp)
        rdrain.cqe.done = mlx5_ib_drain_qp_done;
        init_completion(&rdrain.done);
 
-       ret = _mlx5_ib_post_recv(qp, &rwr, &bad_rwr, true);
+       ret = mlx5_ib_post_recv_drain(qp, &rwr, &bad_rwr);
        if (ret) {
                WARN_ONCE(ret, "failed to drain recv queue: %d\n", ret);
                return;
diff --git a/drivers/infiniband/hw/mlx5/wr.c b/drivers/infiniband/hw/mlx5/wr.c
new file mode 100644 (file)
index 0000000..2c6df1c
--- /dev/null
@@ -0,0 +1,1504 @@
+// SPDX-License-Identifier: GPL-2.0 OR Linux-OpenIB
+/*
+ * Copyright (c) 2020, Mellanox Technologies inc. All rights reserved.
+ */
+
+#include <linux/gfp.h>
+#include <linux/mlx5/qp.h>
+#include <linux/mlx5/driver.h>
+#include "wr.h"
+
+static const u32 mlx5_ib_opcode[] = {
+       [IB_WR_SEND]                            = MLX5_OPCODE_SEND,
+       [IB_WR_LSO]                             = MLX5_OPCODE_LSO,
+       [IB_WR_SEND_WITH_IMM]                   = MLX5_OPCODE_SEND_IMM,
+       [IB_WR_RDMA_WRITE]                      = MLX5_OPCODE_RDMA_WRITE,
+       [IB_WR_RDMA_WRITE_WITH_IMM]             = MLX5_OPCODE_RDMA_WRITE_IMM,
+       [IB_WR_RDMA_READ]                       = MLX5_OPCODE_RDMA_READ,
+       [IB_WR_ATOMIC_CMP_AND_SWP]              = MLX5_OPCODE_ATOMIC_CS,
+       [IB_WR_ATOMIC_FETCH_AND_ADD]            = MLX5_OPCODE_ATOMIC_FA,
+       [IB_WR_SEND_WITH_INV]                   = MLX5_OPCODE_SEND_INVAL,
+       [IB_WR_LOCAL_INV]                       = MLX5_OPCODE_UMR,
+       [IB_WR_REG_MR]                          = MLX5_OPCODE_UMR,
+       [IB_WR_MASKED_ATOMIC_CMP_AND_SWP]       = MLX5_OPCODE_ATOMIC_MASKED_CS,
+       [IB_WR_MASKED_ATOMIC_FETCH_AND_ADD]     = MLX5_OPCODE_ATOMIC_MASKED_FA,
+       [MLX5_IB_WR_UMR]                        = MLX5_OPCODE_UMR,
+};
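
The table above translates IB work-request opcodes to hardware opcodes by direct array indexing, which is why the post-send loop below rejects any opcode at or beyond ARRAY_SIZE(mlx5_ib_opcode). A standalone sketch of the same pattern; the enum entries and opcode values here are placeholders, not the real IB_WR_*/MLX5_OPCODE_* encodings:

#include <stdio.h>

#define ARRAY_SIZE(a) (sizeof(a) / sizeof((a)[0]))

enum ib_wr_opcode { IB_WR_SEND, IB_WR_RDMA_WRITE, IB_WR_RDMA_READ };

static const unsigned int opcode_map[] = {
        [IB_WR_SEND]       = 0x0a, /* placeholder value */
        [IB_WR_RDMA_WRITE] = 0x08, /* placeholder value */
        [IB_WR_RDMA_READ]  = 0x10, /* placeholder value */
};

int main(void)
{
        enum ib_wr_opcode op = IB_WR_RDMA_READ;

        /* reject opcodes past the end of the table, as post_send does */
        if (op >= ARRAY_SIZE(opcode_map))
                return 1;
        printf("hw opcode: 0x%02x\n", opcode_map[op]);
        return 0;
}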
+
+/* handle_post_send_edge - Check if we have reached the SQ edge. If yes,
+ * update to the next nearby edge and get a new address translation for the
+ * current WQE position.
+ * @sq: SQ buffer.
+ * @seg: Current WQE position (16B aligned).
+ * @wqe_sz: Total current WQE size [16B].
+ * @cur_edge: Updated current edge.
+ */
+static inline void handle_post_send_edge(struct mlx5_ib_wq *sq, void **seg,
+                                        u32 wqe_sz, void **cur_edge)
+{
+       u32 idx;
+
+       if (likely(*seg != *cur_edge))
+               return;
+
+       idx = (sq->cur_post + (wqe_sz >> 2)) & (sq->wqe_cnt - 1);
+       *cur_edge = get_sq_edge(sq, idx);
+
+       *seg = mlx5_frag_buf_get_wqe(&sq->fbc, idx);
+}
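
The index arithmetic assumes the SQ is a power-of-two ring of 64B basic blocks: wqe_sz is carried in 16B units, so wqe_sz >> 2 converts it to basic blocks before the mask. A worked example with illustrative ring dimensions:

#include <stdio.h>

int main(void)
{
        unsigned int cur_post = 1022; /* free-running counter of 64B blocks */
        unsigned int wqe_cnt = 256;   /* SQ size in basic blocks, power of two */
        unsigned int wqe_sz16 = 12;   /* current WQE size in 16B units */

        /* wqe_sz16 >> 2 converts 16B units to 64B basic blocks */
        unsigned int idx = (cur_post + (wqe_sz16 >> 2)) & (wqe_cnt - 1);

        printf("next edge index: %u\n", idx); /* (1022 + 3) mod 256 = 1 */
        return 0;
}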
+
+/* memcpy_send_wqe - copy data from src to WQE and update the relevant WQ's
+ * pointers. At the end @seg is aligned to 16B regardless of the copied size.
+ * @sq: SQ buffer.
+ * @cur_edge: Updated current edge.
+ * @seg: Current WQE position (16B aligned).
+ * @wqe_sz: Total current WQE size [16B].
+ * @src: Pointer to copy from.
+ * @n: Number of bytes to copy.
+ */
+static inline void memcpy_send_wqe(struct mlx5_ib_wq *sq, void **cur_edge,
+                                  void **seg, u32 *wqe_sz, const void *src,
+                                  size_t n)
+{
+       while (likely(n)) {
+               size_t leftlen = *cur_edge - *seg;
+               size_t copysz = min_t(size_t, leftlen, n);
+               size_t stride;
+
+               memcpy(*seg, src, copysz);
+
+               n -= copysz;
+               src += copysz;
+               stride = !n ? ALIGN(copysz, 16) : copysz;
+               *seg += stride;
+               *wqe_sz += stride >> 4;
+               handle_post_send_edge(sq, seg, *wqe_sz, cur_edge);
+       }
+}
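
memcpy_send_wqe bounds each chunk by the distance to the current edge and rounds only the final stride up to 16B. A userspace sketch of the same chunking over a simulated two-fragment destination; the fragment size is illustrative and the edge handling is simplified to sequential fragments:

#include <stdio.h>
#include <string.h>

#define FRAG_SZ 32 /* illustrative fragment size */
#define ALIGN16(x) (((x) + 15) & ~15UL)

int main(void)
{
        unsigned char dst[2][FRAG_SZ];
        const char *src = "payload that crosses a fragment boundary";
        size_t n = strlen(src), pos = 0, frag = 0;

        while (n) {
                size_t left = FRAG_SZ - pos;            /* room until edge */
                size_t copy = n < left ? n : left;

                memcpy(&dst[frag][pos], src, copy);
                src += copy;
                n -= copy;
                pos += n ? copy : ALIGN16(copy);        /* 16B-align at end */
                if (pos == FRAG_SZ) {                   /* hit the edge */
                        frag++;
                        pos = 0;
                }
        }
        printf("final write position: fragment %zu, offset %zu\n", frag, pos);
        return 0;
}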
+
+static int mlx5_wq_overflow(struct mlx5_ib_wq *wq, int nreq,
+                           struct ib_cq *ib_cq)
+{
+       struct mlx5_ib_cq *cq;
+       unsigned int cur;
+
+       cur = wq->head - wq->tail;
+       if (likely(cur + nreq < wq->max_post))
+               return 0;
+
+       cq = to_mcq(ib_cq);
+       spin_lock(&cq->lock);
+       cur = wq->head - wq->tail;
+       spin_unlock(&cq->lock);
+
+       return cur + nreq >= wq->max_post;
+}
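
The overflow test relies on head and tail being free-running unsigned counters, so head - tail yields the occupancy even after u32 wraparound; the CQ lock only serves to re-read a stable tail before the final verdict. A minimal demonstration of the wraparound property:

#include <stdio.h>

int main(void)
{
        unsigned int head = 5;           /* wrapped past UINT_MAX */
        unsigned int tail = 0xfffffff0u; /* still below the wrap point */

        /* 5 - 0xfffffff0 == 21 in modular arithmetic */
        printf("in flight: %u\n", head - tail);
        return 0;
}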
+
+static __always_inline void set_raddr_seg(struct mlx5_wqe_raddr_seg *rseg,
+                                         u64 remote_addr, u32 rkey)
+{
+       rseg->raddr    = cpu_to_be64(remote_addr);
+       rseg->rkey     = cpu_to_be32(rkey);
+       rseg->reserved = 0;
+}
+
+static void set_eth_seg(const struct ib_send_wr *wr, struct mlx5_ib_qp *qp,
+                       void **seg, int *size, void **cur_edge)
+{
+       struct mlx5_wqe_eth_seg *eseg = *seg;
+
+       memset(eseg, 0, sizeof(struct mlx5_wqe_eth_seg));
+
+       if (wr->send_flags & IB_SEND_IP_CSUM)
+               eseg->cs_flags = MLX5_ETH_WQE_L3_CSUM |
+                                MLX5_ETH_WQE_L4_CSUM;
+
+       if (wr->opcode == IB_WR_LSO) {
+               struct ib_ud_wr *ud_wr = container_of(wr, struct ib_ud_wr, wr);
+               size_t left, copysz;
+               void *pdata = ud_wr->header;
+               size_t stride;
+
+               left = ud_wr->hlen;
+               eseg->mss = cpu_to_be16(ud_wr->mss);
+               eseg->inline_hdr.sz = cpu_to_be16(left);
+
+               /* memcpy_send_wqe should get a 16B-aligned address. Hence,
+                * we first copy up to the current edge and then, if needed,
+                * continue to memcpy_send_wqe.
+                */
+               copysz = min_t(u64, *cur_edge - (void *)eseg->inline_hdr.start,
+                              left);
+               memcpy(eseg->inline_hdr.start, pdata, copysz);
+               stride = ALIGN(sizeof(struct mlx5_wqe_eth_seg) -
+                              sizeof(eseg->inline_hdr.start) + copysz, 16);
+               *size += stride / 16;
+               *seg += stride;
+
+               if (copysz < left) {
+                       handle_post_send_edge(&qp->sq, seg, *size, cur_edge);
+                       left -= copysz;
+                       pdata += copysz;
+                       memcpy_send_wqe(&qp->sq, cur_edge, seg, size, pdata,
+                                       left);
+               }
+
+               return;
+       }
+
+       *seg += sizeof(struct mlx5_wqe_eth_seg);
+       *size += sizeof(struct mlx5_wqe_eth_seg) / 16;
+}
+
+static void set_datagram_seg(struct mlx5_wqe_datagram_seg *dseg,
+                            const struct ib_send_wr *wr)
+{
+       memcpy(&dseg->av, &to_mah(ud_wr(wr)->ah)->av, sizeof(struct mlx5_av));
+       dseg->av.dqp_dct =
+               cpu_to_be32(ud_wr(wr)->remote_qpn | MLX5_EXTENDED_UD_AV);
+       dseg->av.key.qkey.qkey = cpu_to_be32(ud_wr(wr)->remote_qkey);
+}
+
+static void set_data_ptr_seg(struct mlx5_wqe_data_seg *dseg, struct ib_sge *sg)
+{
+       dseg->byte_count = cpu_to_be32(sg->length);
+       dseg->lkey       = cpu_to_be32(sg->lkey);
+       dseg->addr       = cpu_to_be64(sg->addr);
+}
+
+static u64 get_xlt_octo(u64 bytes)
+{
+       return ALIGN(bytes, MLX5_IB_UMR_XLT_ALIGNMENT) /
+              MLX5_IB_UMR_OCTOWORD;
+}
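
get_xlt_octo rounds the byte count up to the XLT alignment and divides by the octoword size. A worked example, assuming the driver's customary constants of 64B alignment and 16B octowords:

#include <stdio.h>

#define XLT_ALIGNMENT 64 /* assumed MLX5_IB_UMR_XLT_ALIGNMENT */
#define OCTOWORD      16 /* assumed MLX5_IB_UMR_OCTOWORD */
#define ALIGN_UP(x, a) (((x) + (a) - 1) / (a) * (a))

int main(void)
{
        unsigned long long bytes = 200; /* e.g. 25 descriptors of 8B each */

        /* 200 -> 256 after alignment -> 16 octowords */
        printf("octowords: %llu\n", ALIGN_UP(bytes, XLT_ALIGNMENT) / OCTOWORD);
        return 0;
}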
+
+static __be64 frwr_mkey_mask(bool atomic)
+{
+       u64 result;
+
+       result = MLX5_MKEY_MASK_LEN             |
+               MLX5_MKEY_MASK_PAGE_SIZE        |
+               MLX5_MKEY_MASK_START_ADDR       |
+               MLX5_MKEY_MASK_EN_RINVAL        |
+               MLX5_MKEY_MASK_KEY              |
+               MLX5_MKEY_MASK_LR               |
+               MLX5_MKEY_MASK_LW               |
+               MLX5_MKEY_MASK_RR               |
+               MLX5_MKEY_MASK_RW               |
+               MLX5_MKEY_MASK_SMALL_FENCE      |
+               MLX5_MKEY_MASK_FREE;
+
+       if (atomic)
+               result |= MLX5_MKEY_MASK_A;
+
+       return cpu_to_be64(result);
+}
+
+static __be64 sig_mkey_mask(void)
+{
+       u64 result;
+
+       result = MLX5_MKEY_MASK_LEN             |
+               MLX5_MKEY_MASK_PAGE_SIZE        |
+               MLX5_MKEY_MASK_START_ADDR       |
+               MLX5_MKEY_MASK_EN_SIGERR        |
+               MLX5_MKEY_MASK_EN_RINVAL        |
+               MLX5_MKEY_MASK_KEY              |
+               MLX5_MKEY_MASK_LR               |
+               MLX5_MKEY_MASK_LW               |
+               MLX5_MKEY_MASK_RR               |
+               MLX5_MKEY_MASK_RW               |
+               MLX5_MKEY_MASK_SMALL_FENCE      |
+               MLX5_MKEY_MASK_FREE             |
+               MLX5_MKEY_MASK_BSF_EN;
+
+       return cpu_to_be64(result);
+}
+
+static void set_reg_umr_seg(struct mlx5_wqe_umr_ctrl_seg *umr,
+                           struct mlx5_ib_mr *mr, u8 flags, bool atomic)
+{
+       int size = (mr->ndescs + mr->meta_ndescs) * mr->desc_size;
+
+       memset(umr, 0, sizeof(*umr));
+
+       umr->flags = flags;
+       umr->xlt_octowords = cpu_to_be16(get_xlt_octo(size));
+       umr->mkey_mask = frwr_mkey_mask(atomic);
+}
+
+static void set_linv_umr_seg(struct mlx5_wqe_umr_ctrl_seg *umr)
+{
+       memset(umr, 0, sizeof(*umr));
+       umr->mkey_mask = cpu_to_be64(MLX5_MKEY_MASK_FREE);
+       umr->flags = MLX5_UMR_INLINE;
+}
+
+static __be64 get_umr_enable_mr_mask(void)
+{
+       u64 result;
+
+       result = MLX5_MKEY_MASK_KEY |
+                MLX5_MKEY_MASK_FREE;
+
+       return cpu_to_be64(result);
+}
+
+static __be64 get_umr_disable_mr_mask(void)
+{
+       u64 result;
+
+       result = MLX5_MKEY_MASK_FREE;
+
+       return cpu_to_be64(result);
+}
+
+static __be64 get_umr_update_translation_mask(void)
+{
+       u64 result;
+
+       result = MLX5_MKEY_MASK_LEN |
+                MLX5_MKEY_MASK_PAGE_SIZE |
+                MLX5_MKEY_MASK_START_ADDR;
+
+       return cpu_to_be64(result);
+}
+
+static __be64 get_umr_update_access_mask(int atomic)
+{
+       u64 result;
+
+       result = MLX5_MKEY_MASK_LR |
+                MLX5_MKEY_MASK_LW |
+                MLX5_MKEY_MASK_RR |
+                MLX5_MKEY_MASK_RW;
+
+       if (atomic)
+               result |= MLX5_MKEY_MASK_A;
+
+       return cpu_to_be64(result);
+}
+
+static __be64 get_umr_update_pd_mask(void)
+{
+       u64 result;
+
+       result = MLX5_MKEY_MASK_PD;
+
+       return cpu_to_be64(result);
+}
+
+static int umr_check_mkey_mask(struct mlx5_ib_dev *dev, u64 mask)
+{
+       if ((mask & MLX5_MKEY_MASK_PAGE_SIZE &&
+            MLX5_CAP_GEN(dev->mdev, umr_modify_entity_size_disabled)) ||
+           (mask & MLX5_MKEY_MASK_A &&
+            MLX5_CAP_GEN(dev->mdev, umr_modify_atomic_disabled)))
+               return -EPERM;
+       return 0;
+}
+
+static int set_reg_umr_segment(struct mlx5_ib_dev *dev,
+                              struct mlx5_wqe_umr_ctrl_seg *umr,
+                              const struct ib_send_wr *wr, int atomic)
+{
+       const struct mlx5_umr_wr *umrwr = umr_wr(wr);
+
+       memset(umr, 0, sizeof(*umr));
+
+       if (!umrwr->ignore_free_state) {
+               if (wr->send_flags & MLX5_IB_SEND_UMR_FAIL_IF_FREE)
+                        /* fail if free */
+                       umr->flags = MLX5_UMR_CHECK_FREE;
+               else
+                       /* fail if not free */
+                       umr->flags = MLX5_UMR_CHECK_NOT_FREE;
+       }
+
+       umr->xlt_octowords = cpu_to_be16(get_xlt_octo(umrwr->xlt_size));
+       if (wr->send_flags & MLX5_IB_SEND_UMR_UPDATE_XLT) {
+               u64 offset = get_xlt_octo(umrwr->offset);
+
+               umr->xlt_offset = cpu_to_be16(offset & 0xffff);
+               umr->xlt_offset_47_16 = cpu_to_be32(offset >> 16);
+               umr->flags |= MLX5_UMR_TRANSLATION_OFFSET_EN;
+       }
+       if (wr->send_flags & MLX5_IB_SEND_UMR_UPDATE_TRANSLATION)
+               umr->mkey_mask |= get_umr_update_translation_mask();
+       if (wr->send_flags & MLX5_IB_SEND_UMR_UPDATE_PD_ACCESS) {
+               umr->mkey_mask |= get_umr_update_access_mask(atomic);
+               umr->mkey_mask |= get_umr_update_pd_mask();
+       }
+       if (wr->send_flags & MLX5_IB_SEND_UMR_ENABLE_MR)
+               umr->mkey_mask |= get_umr_enable_mr_mask();
+       if (wr->send_flags & MLX5_IB_SEND_UMR_DISABLE_MR)
+               umr->mkey_mask |= get_umr_disable_mr_mask();
+
+       if (!wr->num_sge)
+               umr->flags |= MLX5_UMR_INLINE;
+
+       return umr_check_mkey_mask(dev, be64_to_cpu(umr->mkey_mask));
+}
+
+static u8 get_umr_flags(int acc)
+{
+       return (acc & IB_ACCESS_REMOTE_ATOMIC ? MLX5_PERM_ATOMIC       : 0) |
+              (acc & IB_ACCESS_REMOTE_WRITE  ? MLX5_PERM_REMOTE_WRITE : 0) |
+              (acc & IB_ACCESS_REMOTE_READ   ? MLX5_PERM_REMOTE_READ  : 0) |
+              (acc & IB_ACCESS_LOCAL_WRITE   ? MLX5_PERM_LOCAL_WRITE  : 0) |
+               MLX5_PERM_LOCAL_READ | MLX5_PERM_UMR_EN;
+}
+
+static void set_reg_mkey_seg(struct mlx5_mkey_seg *seg,
+                            struct mlx5_ib_mr *mr,
+                            u32 key, int access)
+{
+       int ndescs = ALIGN(mr->ndescs + mr->meta_ndescs, 8) >> 1;
+
+       memset(seg, 0, sizeof(*seg));
+
+       if (mr->access_mode == MLX5_MKC_ACCESS_MODE_MTT)
+               seg->log2_page_size = ilog2(mr->ibmr.page_size);
+       else if (mr->access_mode == MLX5_MKC_ACCESS_MODE_KLMS)
+               /* KLMs take twice the size of MTTs */
+               ndescs *= 2;
+
+       seg->flags = get_umr_flags(access) | mr->access_mode;
+       seg->qpn_mkey7_0 = cpu_to_be32((key & 0xff) | 0xffffff00);
+       seg->flags_pd = cpu_to_be32(MLX5_MKEY_REMOTE_INVAL);
+       seg->start_addr = cpu_to_be64(mr->ibmr.iova);
+       seg->len = cpu_to_be64(mr->ibmr.length);
+       seg->xlt_oct_size = cpu_to_be32(ndescs);
+}
+
+static void set_linv_mkey_seg(struct mlx5_mkey_seg *seg)
+{
+       memset(seg, 0, sizeof(*seg));
+       seg->status = MLX5_MKEY_STATUS_FREE;
+}
+
+static void set_reg_mkey_segment(struct mlx5_mkey_seg *seg,
+                                const struct ib_send_wr *wr)
+{
+       const struct mlx5_umr_wr *umrwr = umr_wr(wr);
+
+       memset(seg, 0, sizeof(*seg));
+       if (wr->send_flags & MLX5_IB_SEND_UMR_DISABLE_MR)
+               seg->status = MLX5_MKEY_STATUS_FREE;
+
+       seg->flags = convert_access(umrwr->access_flags);
+       if (umrwr->pd)
+               seg->flags_pd = cpu_to_be32(to_mpd(umrwr->pd)->pdn);
+       if (wr->send_flags & MLX5_IB_SEND_UMR_UPDATE_TRANSLATION &&
+           !umrwr->length)
+               seg->flags_pd |= cpu_to_be32(MLX5_MKEY_LEN64);
+
+       seg->start_addr = cpu_to_be64(umrwr->virt_addr);
+       seg->len = cpu_to_be64(umrwr->length);
+       seg->log2_page_size = umrwr->page_shift;
+       seg->qpn_mkey7_0 = cpu_to_be32(0xffffff00 |
+                                      mlx5_mkey_variant(umrwr->mkey));
+}
+
+static void set_reg_data_seg(struct mlx5_wqe_data_seg *dseg,
+                            struct mlx5_ib_mr *mr,
+                            struct mlx5_ib_pd *pd)
+{
+       int bcount = mr->desc_size * (mr->ndescs + mr->meta_ndescs);
+
+       dseg->addr = cpu_to_be64(mr->desc_map);
+       dseg->byte_count = cpu_to_be32(ALIGN(bcount, 64));
+       dseg->lkey = cpu_to_be32(pd->ibpd.local_dma_lkey);
+}
+
+static __be32 send_ieth(const struct ib_send_wr *wr)
+{
+       switch (wr->opcode) {
+       case IB_WR_SEND_WITH_IMM:
+       case IB_WR_RDMA_WRITE_WITH_IMM:
+               return wr->ex.imm_data;
+
+       case IB_WR_SEND_WITH_INV:
+               return cpu_to_be32(wr->ex.invalidate_rkey);
+
+       default:
+               return 0;
+       }
+}
+
+static u8 calc_sig(void *wqe, int size)
+{
+       u8 *p = wqe;
+       u8 res = 0;
+       int i;
+
+       for (i = 0; i < size; i++)
+               res ^= p[i];
+
+       return ~res;
+}
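
calc_sig is a bitwise-inverted XOR over the covered bytes, which gives it a convenient check property: XOR-folding the signature back into the data always yields 0xff. A quick standalone verification:

#include <stdio.h>

static unsigned char calc_sig(const unsigned char *p, int size)
{
        unsigned char res = 0;

        while (size--)
                res ^= *p++;
        return (unsigned char)~res;
}

int main(void)
{
        unsigned char wqe[16] = { 0xde, 0xad, 0xbe, 0xef, 1, 2, 3, 4 };
        unsigned char sig = calc_sig(wqe, sizeof(wqe));
        unsigned char check = sig;
        size_t i;

        for (i = 0; i < sizeof(wqe); i++)
                check ^= wqe[i];
        printf("sig=0x%02x check=0x%02x\n", sig, check); /* check == 0xff */
        return 0;
}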
+
+static u8 wq_sig(void *wqe)
+{
+       return calc_sig(wqe, (*((u8 *)wqe + 8) & 0x3f) << 4);
+}
+
+static int set_data_inl_seg(struct mlx5_ib_qp *qp, const struct ib_send_wr *wr,
+                           void **wqe, int *wqe_sz, void **cur_edge)
+{
+       struct mlx5_wqe_inline_seg *seg;
+       size_t offset;
+       int inl = 0;
+       int i;
+
+       seg = *wqe;
+       *wqe += sizeof(*seg);
+       offset = sizeof(*seg);
+
+       for (i = 0; i < wr->num_sge; i++) {
+               size_t len  = wr->sg_list[i].length;
+               void *addr = (void *)(unsigned long)(wr->sg_list[i].addr);
+
+               inl += len;
+
+               if (unlikely(inl > qp->max_inline_data))
+                       return -ENOMEM;
+
+               while (likely(len)) {
+                       size_t leftlen;
+                       size_t copysz;
+
+                       handle_post_send_edge(&qp->sq, wqe,
+                                             *wqe_sz + (offset >> 4),
+                                             cur_edge);
+
+                       leftlen = *cur_edge - *wqe;
+                       copysz = min_t(size_t, leftlen, len);
+
+                       memcpy(*wqe, addr, copysz);
+                       len -= copysz;
+                       addr += copysz;
+                       *wqe += copysz;
+                       offset += copysz;
+               }
+       }
+
+       seg->byte_count = cpu_to_be32(inl | MLX5_INLINE_SEG);
+
+       *wqe_sz +=  ALIGN(inl + sizeof(seg->byte_count), 16) / 16;
+
+       return 0;
+}
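
The inline segment prefixes the payload with a 4-byte byte_count whose high bit flags the segment as inline, and the WQE grows by the 16B-aligned total. A sketch of the accounting; the flag value is assumed from the usual MLX5_INLINE_SEG definition:

#include <stdio.h>

#define INLINE_SEG_FLAG 0x80000000u /* assumed MLX5_INLINE_SEG bit */

int main(void)
{
        unsigned int inl = 43; /* inline payload bytes */
        unsigned int byte_count = inl | INLINE_SEG_FLAG;
        unsigned int growth_16b = (inl + 4 + 15) / 16; /* +4 for the count */

        /* 43 + 4 = 47 -> 48 after alignment -> 3 units of 16B */
        printf("byte_count=0x%08x wqe growth=%u x16B\n", byte_count, growth_16b);
        return 0;
}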
+
+static u16 prot_field_size(enum ib_signature_type type)
+{
+       switch (type) {
+       case IB_SIG_TYPE_T10_DIF:
+               return MLX5_DIF_SIZE;
+       default:
+               return 0;
+       }
+}
+
+static u8 bs_selector(int block_size)
+{
+       switch (block_size) {
+       case 512:           return 0x1;
+       case 520:           return 0x2;
+       case 4096:          return 0x3;
+       case 4160:          return 0x4;
+       case 1073741824:    return 0x5;
+       default:            return 0;
+       }
+}
+
+static void mlx5_fill_inl_bsf(struct ib_sig_domain *domain,
+                             struct mlx5_bsf_inl *inl)
+{
+       /* Valid inline section and allow BSF refresh */
+       inl->vld_refresh = cpu_to_be16(MLX5_BSF_INL_VALID |
+                                      MLX5_BSF_REFRESH_DIF);
+       inl->dif_apptag = cpu_to_be16(domain->sig.dif.app_tag);
+       inl->dif_reftag = cpu_to_be32(domain->sig.dif.ref_tag);
+       /* repeating block */
+       inl->rp_inv_seed = MLX5_BSF_REPEAT_BLOCK;
+       inl->sig_type = domain->sig.dif.bg_type == IB_T10DIF_CRC ?
+                       MLX5_DIF_CRC : MLX5_DIF_IPCS;
+
+       if (domain->sig.dif.ref_remap)
+               inl->dif_inc_ref_guard_check |= MLX5_BSF_INC_REFTAG;
+
+       if (domain->sig.dif.app_escape) {
+               if (domain->sig.dif.ref_escape)
+                       inl->dif_inc_ref_guard_check |= MLX5_BSF_APPREF_ESCAPE;
+               else
+                       inl->dif_inc_ref_guard_check |= MLX5_BSF_APPTAG_ESCAPE;
+       }
+
+       inl->dif_app_bitmask_check =
+               cpu_to_be16(domain->sig.dif.apptag_check_mask);
+}
+
+static int mlx5_set_bsf(struct ib_mr *sig_mr,
+                       struct ib_sig_attrs *sig_attrs,
+                       struct mlx5_bsf *bsf, u32 data_size)
+{
+       struct mlx5_core_sig_ctx *msig = to_mmr(sig_mr)->sig;
+       struct mlx5_bsf_basic *basic = &bsf->basic;
+       struct ib_sig_domain *mem = &sig_attrs->mem;
+       struct ib_sig_domain *wire = &sig_attrs->wire;
+
+       memset(bsf, 0, sizeof(*bsf));
+
+       /* Basic + Extended + Inline */
+       basic->bsf_size_sbs = 1 << 7;
+       /* Input domain check byte mask */
+       basic->check_byte_mask = sig_attrs->check_mask;
+       basic->raw_data_size = cpu_to_be32(data_size);
+
+       /* Memory domain */
+       switch (sig_attrs->mem.sig_type) {
+       case IB_SIG_TYPE_NONE:
+               break;
+       case IB_SIG_TYPE_T10_DIF:
+               basic->mem.bs_selector = bs_selector(mem->sig.dif.pi_interval);
+               basic->m_bfs_psv = cpu_to_be32(msig->psv_memory.psv_idx);
+               mlx5_fill_inl_bsf(mem, &bsf->m_inl);
+               break;
+       default:
+               return -EINVAL;
+       }
+
+       /* Wire domain */
+       switch (sig_attrs->wire.sig_type) {
+       case IB_SIG_TYPE_NONE:
+               break;
+       case IB_SIG_TYPE_T10_DIF:
+               if (mem->sig.dif.pi_interval == wire->sig.dif.pi_interval &&
+                   mem->sig_type == wire->sig_type) {
+                       /* Same block structure */
+                       basic->bsf_size_sbs |= 1 << 4;
+                       if (mem->sig.dif.bg_type == wire->sig.dif.bg_type)
+                               basic->wire.copy_byte_mask |= MLX5_CPY_GRD_MASK;
+                       if (mem->sig.dif.app_tag == wire->sig.dif.app_tag)
+                               basic->wire.copy_byte_mask |= MLX5_CPY_APP_MASK;
+                       if (mem->sig.dif.ref_tag == wire->sig.dif.ref_tag)
+                               basic->wire.copy_byte_mask |= MLX5_CPY_REF_MASK;
+               } else
+                       basic->wire.bs_selector =
+                               bs_selector(wire->sig.dif.pi_interval);
+
+               basic->w_bfs_psv = cpu_to_be32(msig->psv_wire.psv_idx);
+               mlx5_fill_inl_bsf(wire, &bsf->w_inl);
+               break;
+       default:
+               return -EINVAL;
+       }
+
+       return 0;
+}
+
+static int set_sig_data_segment(const struct ib_send_wr *send_wr,
+                               struct ib_mr *sig_mr,
+                               struct ib_sig_attrs *sig_attrs,
+                               struct mlx5_ib_qp *qp, void **seg, int *size,
+                               void **cur_edge)
+{
+       struct mlx5_bsf *bsf;
+       u32 data_len;
+       u32 data_key;
+       u64 data_va;
+       u32 prot_len = 0;
+       u32 prot_key = 0;
+       u64 prot_va = 0;
+       bool prot = false;
+       int ret;
+       int wqe_size;
+       struct mlx5_ib_mr *mr = to_mmr(sig_mr);
+       struct mlx5_ib_mr *pi_mr = mr->pi_mr;
+
+       data_len = pi_mr->data_length;
+       data_key = pi_mr->ibmr.lkey;
+       data_va = pi_mr->data_iova;
+       if (pi_mr->meta_ndescs) {
+               prot_len = pi_mr->meta_length;
+               prot_key = pi_mr->ibmr.lkey;
+               prot_va = pi_mr->pi_iova;
+               prot = true;
+       }
+
+       if (!prot || (data_key == prot_key && data_va == prot_va &&
+                     data_len == prot_len)) {
+               /**
+                * The source domain doesn't contain signature information,
+                * or data and protection are interleaved in memory, so we
+                * need to construct:
+                *                  ------------------
+                *                 |     data_klm     |
+                *                  ------------------
+                *                 |       BSF        |
+                *                  ------------------
+                **/
+               struct mlx5_klm *data_klm = *seg;
+
+               data_klm->bcount = cpu_to_be32(data_len);
+               data_klm->key = cpu_to_be32(data_key);
+               data_klm->va = cpu_to_be64(data_va);
+               wqe_size = ALIGN(sizeof(*data_klm), 64);
+       } else {
+               /**
+                * The source domain contains signature information, so we
+                * need to construct a strided block format:
+                *               ---------------------------
+                *              |     stride_block_ctrl     |
+                *               ---------------------------
+                *              |          data_klm         |
+                *               ---------------------------
+                *              |          prot_klm         |
+                *               ---------------------------
+                *              |             BSF           |
+                *               ---------------------------
+                **/
+               struct mlx5_stride_block_ctrl_seg *sblock_ctrl;
+               struct mlx5_stride_block_entry *data_sentry;
+               struct mlx5_stride_block_entry *prot_sentry;
+               u16 block_size = sig_attrs->mem.sig.dif.pi_interval;
+               int prot_size;
+
+               sblock_ctrl = *seg;
+               data_sentry = (void *)sblock_ctrl + sizeof(*sblock_ctrl);
+               prot_sentry = (void *)data_sentry + sizeof(*data_sentry);
+
+               prot_size = prot_field_size(sig_attrs->mem.sig_type);
+               if (!prot_size) {
+                       pr_err("Bad block size given: %u\n", block_size);
+                       return -EINVAL;
+               }
+               sblock_ctrl->bcount_per_cycle = cpu_to_be32(block_size +
+                                                           prot_size);
+               sblock_ctrl->op = cpu_to_be32(MLX5_STRIDE_BLOCK_OP);
+               sblock_ctrl->repeat_count = cpu_to_be32(data_len / block_size);
+               sblock_ctrl->num_entries = cpu_to_be16(2);
+
+               data_sentry->bcount = cpu_to_be16(block_size);
+               data_sentry->key = cpu_to_be32(data_key);
+               data_sentry->va = cpu_to_be64(data_va);
+               data_sentry->stride = cpu_to_be16(block_size);
+
+               prot_sentry->bcount = cpu_to_be16(prot_size);
+               prot_sentry->key = cpu_to_be32(prot_key);
+               prot_sentry->va = cpu_to_be64(prot_va);
+               prot_sentry->stride = cpu_to_be16(prot_size);
+
+               wqe_size = ALIGN(sizeof(*sblock_ctrl) + sizeof(*data_sentry) +
+                                sizeof(*prot_sentry), 64);
+       }
+
+       *seg += wqe_size;
+       *size += wqe_size / 16;
+       handle_post_send_edge(&qp->sq, seg, *size, cur_edge);
+
+       bsf = *seg;
+       ret = mlx5_set_bsf(sig_mr, sig_attrs, bsf, data_len);
+       if (ret)
+               return -EINVAL;
+
+       *seg += sizeof(*bsf);
+       *size += sizeof(*bsf) / 16;
+       handle_post_send_edge(&qp->sq, seg, *size, cur_edge);
+
+       return 0;
+}
+
+static void set_sig_mkey_segment(struct mlx5_mkey_seg *seg,
+                                struct ib_mr *sig_mr, int access_flags,
+                                u32 size, u32 length, u32 pdn)
+{
+       u32 sig_key = sig_mr->rkey;
+       u8 sigerr = to_mmr(sig_mr)->sig->sigerr_count & 1;
+
+       memset(seg, 0, sizeof(*seg));
+
+       seg->flags = get_umr_flags(access_flags) | MLX5_MKC_ACCESS_MODE_KLMS;
+       seg->qpn_mkey7_0 = cpu_to_be32((sig_key & 0xff) | 0xffffff00);
+       seg->flags_pd = cpu_to_be32(MLX5_MKEY_REMOTE_INVAL | sigerr << 26 |
+                                   MLX5_MKEY_BSF_EN | pdn);
+       seg->len = cpu_to_be64(length);
+       seg->xlt_oct_size = cpu_to_be32(get_xlt_octo(size));
+       seg->bsfs_octo_size = cpu_to_be32(MLX5_MKEY_BSF_OCTO_SIZE);
+}
+
+static void set_sig_umr_segment(struct mlx5_wqe_umr_ctrl_seg *umr,
+                               u32 size)
+{
+       memset(umr, 0, sizeof(*umr));
+
+       umr->flags = MLX5_FLAGS_INLINE | MLX5_FLAGS_CHECK_FREE;
+       umr->xlt_octowords = cpu_to_be16(get_xlt_octo(size));
+       umr->bsf_octowords = cpu_to_be16(MLX5_MKEY_BSF_OCTO_SIZE);
+       umr->mkey_mask = sig_mkey_mask();
+}
+
+static int set_pi_umr_wr(const struct ib_send_wr *send_wr,
+                        struct mlx5_ib_qp *qp, void **seg, int *size,
+                        void **cur_edge)
+{
+       const struct ib_reg_wr *wr = reg_wr(send_wr);
+       struct mlx5_ib_mr *sig_mr = to_mmr(wr->mr);
+       struct mlx5_ib_mr *pi_mr = sig_mr->pi_mr;
+       struct ib_sig_attrs *sig_attrs = sig_mr->ibmr.sig_attrs;
+       u32 pdn = to_mpd(qp->ibqp.pd)->pdn;
+       u32 xlt_size;
+       int region_len, ret;
+
+       if (unlikely(send_wr->num_sge != 0) ||
+           unlikely(wr->access & IB_ACCESS_REMOTE_ATOMIC) ||
+           unlikely(!sig_mr->sig) || unlikely(!qp->ibqp.integrity_en) ||
+           unlikely(!sig_mr->sig->sig_status_checked))
+               return -EINVAL;
+
+       /* length of the protected region, data + protection */
+       region_len = pi_mr->ibmr.length;
+
+       /**
+        * KLM octoword size - if protection was provided
+        * then we use the strided block format (3 octowords),
+        * else we use a single KLM (1 octoword).
+        **/
+       if (sig_attrs->mem.sig_type != IB_SIG_TYPE_NONE)
+               xlt_size = 0x30;
+       else
+               xlt_size = sizeof(struct mlx5_klm);
+
+       set_sig_umr_segment(*seg, xlt_size);
+       *seg += sizeof(struct mlx5_wqe_umr_ctrl_seg);
+       *size += sizeof(struct mlx5_wqe_umr_ctrl_seg) / 16;
+       handle_post_send_edge(&qp->sq, seg, *size, cur_edge);
+
+       set_sig_mkey_segment(*seg, wr->mr, wr->access, xlt_size, region_len,
+                            pdn);
+       *seg += sizeof(struct mlx5_mkey_seg);
+       *size += sizeof(struct mlx5_mkey_seg) / 16;
+       handle_post_send_edge(&qp->sq, seg, *size, cur_edge);
+
+       ret = set_sig_data_segment(send_wr, wr->mr, sig_attrs, qp, seg, size,
+                                  cur_edge);
+       if (ret)
+               return ret;
+
+       sig_mr->sig->sig_status_checked = false;
+       return 0;
+}
+
+static int set_psv_wr(struct ib_sig_domain *domain,
+                     u32 psv_idx, void **seg, int *size)
+{
+       struct mlx5_seg_set_psv *psv_seg = *seg;
+
+       memset(psv_seg, 0, sizeof(*psv_seg));
+       psv_seg->psv_num = cpu_to_be32(psv_idx);
+       switch (domain->sig_type) {
+       case IB_SIG_TYPE_NONE:
+               break;
+       case IB_SIG_TYPE_T10_DIF:
+               psv_seg->transient_sig = cpu_to_be32(domain->sig.dif.bg << 16 |
+                                                    domain->sig.dif.app_tag);
+               psv_seg->ref_tag = cpu_to_be32(domain->sig.dif.ref_tag);
+               break;
+       default:
+               pr_err("Bad signature type (%d) is given.\n",
+                      domain->sig_type);
+               return -EINVAL;
+       }
+
+       *seg += sizeof(*psv_seg);
+       *size += sizeof(*psv_seg) / 16;
+
+       return 0;
+}
+
+static int set_reg_wr(struct mlx5_ib_qp *qp,
+                     const struct ib_reg_wr *wr,
+                     void **seg, int *size, void **cur_edge,
+                     bool check_not_free)
+{
+       struct mlx5_ib_mr *mr = to_mmr(wr->mr);
+       struct mlx5_ib_pd *pd = to_mpd(qp->ibqp.pd);
+       struct mlx5_ib_dev *dev = to_mdev(pd->ibpd.device);
+       int mr_list_size = (mr->ndescs + mr->meta_ndescs) * mr->desc_size;
+       bool umr_inline = mr_list_size <= MLX5_IB_SQ_UMR_INLINE_THRESHOLD;
+       bool atomic = wr->access & IB_ACCESS_REMOTE_ATOMIC;
+       u8 flags = 0;
+
+       if (!mlx5_ib_can_use_umr(dev, atomic, wr->access)) {
+               mlx5_ib_warn(to_mdev(qp->ibqp.device),
+                            "Fast update of %s for MR is disabled\n",
+                            (MLX5_CAP_GEN(dev->mdev,
+                                          umr_modify_entity_size_disabled)) ?
+                                    "entity size" :
+                                    "atomic access");
+               return -EINVAL;
+       }
+
+       if (unlikely(wr->wr.send_flags & IB_SEND_INLINE)) {
+               mlx5_ib_warn(to_mdev(qp->ibqp.device),
+                            "Invalid IB_SEND_INLINE send flag\n");
+               return -EINVAL;
+       }
+
+       if (check_not_free)
+               flags |= MLX5_UMR_CHECK_NOT_FREE;
+       if (umr_inline)
+               flags |= MLX5_UMR_INLINE;
+
+       set_reg_umr_seg(*seg, mr, flags, atomic);
+       *seg += sizeof(struct mlx5_wqe_umr_ctrl_seg);
+       *size += sizeof(struct mlx5_wqe_umr_ctrl_seg) / 16;
+       handle_post_send_edge(&qp->sq, seg, *size, cur_edge);
+
+       set_reg_mkey_seg(*seg, mr, wr->key, wr->access);
+       *seg += sizeof(struct mlx5_mkey_seg);
+       *size += sizeof(struct mlx5_mkey_seg) / 16;
+       handle_post_send_edge(&qp->sq, seg, *size, cur_edge);
+
+       if (umr_inline) {
+               memcpy_send_wqe(&qp->sq, cur_edge, seg, size, mr->descs,
+                               mr_list_size);
+               *size = ALIGN(*size, MLX5_SEND_WQE_BB >> 4);
+       } else {
+               set_reg_data_seg(*seg, mr, pd);
+               *seg += sizeof(struct mlx5_wqe_data_seg);
+               *size += (sizeof(struct mlx5_wqe_data_seg) / 16);
+       }
+       return 0;
+}
+
+static void set_linv_wr(struct mlx5_ib_qp *qp, void **seg, int *size,
+                       void **cur_edge)
+{
+       set_linv_umr_seg(*seg);
+       *seg += sizeof(struct mlx5_wqe_umr_ctrl_seg);
+       *size += sizeof(struct mlx5_wqe_umr_ctrl_seg) / 16;
+       handle_post_send_edge(&qp->sq, seg, *size, cur_edge);
+       set_linv_mkey_seg(*seg);
+       *seg += sizeof(struct mlx5_mkey_seg);
+       *size += sizeof(struct mlx5_mkey_seg) / 16;
+       handle_post_send_edge(&qp->sq, seg, *size, cur_edge);
+}
+
+static void dump_wqe(struct mlx5_ib_qp *qp, u32 idx, int size_16)
+{
+       __be32 *p = NULL;
+       int i, j;
+
+       pr_debug("dump WQE index %u:\n", idx);
+       for (i = 0, j = 0; i < size_16 * 4; i += 4, j += 4) {
+               if ((i & 0xf) == 0) {
+                       p = mlx5_frag_buf_get_wqe(&qp->sq.fbc, idx);
+                       pr_debug("WQBB at %p:\n", (void *)p);
+                       j = 0;
+                       idx = (idx + 1) & (qp->sq.wqe_cnt - 1);
+               }
+               pr_debug("%08x %08x %08x %08x\n", be32_to_cpu(p[j]),
+                        be32_to_cpu(p[j + 1]), be32_to_cpu(p[j + 2]),
+                        be32_to_cpu(p[j + 3]));
+       }
+}
+
+static int __begin_wqe(struct mlx5_ib_qp *qp, void **seg,
+                      struct mlx5_wqe_ctrl_seg **ctrl,
+                      const struct ib_send_wr *wr, unsigned int *idx,
+                      int *size, void **cur_edge, int nreq,
+                      bool send_signaled, bool solicited)
+{
+       if (unlikely(mlx5_wq_overflow(&qp->sq, nreq, qp->ibqp.send_cq)))
+               return -ENOMEM;
+
+       *idx = qp->sq.cur_post & (qp->sq.wqe_cnt - 1);
+       *seg = mlx5_frag_buf_get_wqe(&qp->sq.fbc, *idx);
+       *ctrl = *seg;
+       *(uint32_t *)(*seg + 8) = 0;
+       (*ctrl)->imm = send_ieth(wr);
+       (*ctrl)->fm_ce_se = qp->sq_signal_bits |
+               (send_signaled ? MLX5_WQE_CTRL_CQ_UPDATE : 0) |
+               (solicited ? MLX5_WQE_CTRL_SOLICITED : 0);
+
+       *seg += sizeof(**ctrl);
+       *size = sizeof(**ctrl) / 16;
+       *cur_edge = qp->sq.cur_edge;
+
+       return 0;
+}
+
+static int begin_wqe(struct mlx5_ib_qp *qp, void **seg,
+                    struct mlx5_wqe_ctrl_seg **ctrl,
+                    const struct ib_send_wr *wr, unsigned int *idx, int *size,
+                    void **cur_edge, int nreq)
+{
+       return __begin_wqe(qp, seg, ctrl, wr, idx, size, cur_edge, nreq,
+                          wr->send_flags & IB_SEND_SIGNALED,
+                          wr->send_flags & IB_SEND_SOLICITED);
+}
+
+static void finish_wqe(struct mlx5_ib_qp *qp,
+                      struct mlx5_wqe_ctrl_seg *ctrl,
+                      void *seg, u8 size, void *cur_edge,
+                      unsigned int idx, u64 wr_id, int nreq, u8 fence,
+                      u32 mlx5_opcode)
+{
+       u8 opmod = 0;
+
+       ctrl->opmod_idx_opcode = cpu_to_be32(((u32)(qp->sq.cur_post) << 8) |
+                                            mlx5_opcode | ((u32)opmod << 24));
+       ctrl->qpn_ds = cpu_to_be32(size | (qp->trans_qp.base.mqp.qpn << 8));
+       ctrl->fm_ce_se |= fence;
+       if (unlikely(qp->flags_en & MLX5_QP_FLAG_SIGNATURE))
+               ctrl->signature = wq_sig(ctrl);
+
+       qp->sq.wrid[idx] = wr_id;
+       qp->sq.w_list[idx].opcode = mlx5_opcode;
+       qp->sq.wqe_head[idx] = qp->sq.head + nreq;
+       qp->sq.cur_post += DIV_ROUND_UP(size * 16, MLX5_SEND_WQE_BB);
+       qp->sq.w_list[idx].next = qp->sq.cur_post;
+
+       /* We save the edge, which may have been updated during WQE
+        * construction, into the SQ's cache.
+        */
+       seg = PTR_ALIGN(seg, MLX5_SEND_WQE_BB);
+       qp->sq.cur_edge = (unlikely(seg == cur_edge)) ?
+                         get_sq_edge(&qp->sq, qp->sq.cur_post &
+                                     (qp->sq.wqe_cnt - 1)) :
+                         cur_edge;
+}
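
finish_wqe tracks the WQE size in 16B units but advances cur_post in 64B basic blocks (MLX5_SEND_WQE_BB), hence the DIV_ROUND_UP. A worked example of the conversion:

#include <stdio.h>

#define SEND_WQE_BB 64 /* basic block size in bytes */

int main(void)
{
        unsigned int size_16b = 7; /* WQE of 7 x 16B = 112 bytes */
        unsigned int bytes = size_16b * 16;
        unsigned int bbs = (bytes + SEND_WQE_BB - 1) / SEND_WQE_BB;

        printf("WQE spans %u basic block(s)\n", bbs); /* 112B -> 2 BBs */
        return 0;
}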
+
+static void handle_rdma_op(const struct ib_send_wr *wr, void **seg, int *size)
+{
+       set_raddr_seg(*seg, rdma_wr(wr)->remote_addr, rdma_wr(wr)->rkey);
+       *seg += sizeof(struct mlx5_wqe_raddr_seg);
+       *size += sizeof(struct mlx5_wqe_raddr_seg) / 16;
+}
+
+static void handle_local_inv(struct mlx5_ib_qp *qp, const struct ib_send_wr *wr,
+                            struct mlx5_wqe_ctrl_seg **ctrl, void **seg,
+                            int *size, void **cur_edge, unsigned int idx)
+{
+       qp->sq.wr_data[idx] = IB_WR_LOCAL_INV;
+       (*ctrl)->imm = cpu_to_be32(wr->ex.invalidate_rkey);
+       set_linv_wr(qp, seg, size, cur_edge);
+}
+
+static int handle_reg_mr(struct mlx5_ib_qp *qp, const struct ib_send_wr *wr,
+                        struct mlx5_wqe_ctrl_seg **ctrl, void **seg, int *size,
+                        void **cur_edge, unsigned int idx)
+{
+       qp->sq.wr_data[idx] = IB_WR_REG_MR;
+       (*ctrl)->imm = cpu_to_be32(reg_wr(wr)->key);
+       return set_reg_wr(qp, reg_wr(wr), seg, size, cur_edge, true);
+}
+
+static int handle_psv(struct mlx5_ib_dev *dev, struct mlx5_ib_qp *qp,
+                     const struct ib_send_wr *wr,
+                     struct mlx5_wqe_ctrl_seg **ctrl, void **seg, int *size,
+                     void **cur_edge, unsigned int *idx, int nreq,
+                     struct ib_sig_domain *domain, u32 psv_index,
+                     u8 next_fence)
+{
+       int err;
+
+       /*
+        * SET_PSV WQEs are not signaled and are solicited on error.
+        */
+       err = __begin_wqe(qp, seg, ctrl, wr, idx, size, cur_edge, nreq,
+                         false, true);
+       if (unlikely(err)) {
+               mlx5_ib_warn(dev, "\n");
+               err = -ENOMEM;
+               goto out;
+       }
+       err = set_psv_wr(domain, psv_index, seg, size);
+       if (unlikely(err)) {
+               mlx5_ib_warn(dev, "\n");
+               goto out;
+       }
+       finish_wqe(qp, *ctrl, *seg, *size, *cur_edge, *idx, wr->wr_id, nreq,
+                  next_fence, MLX5_OPCODE_SET_PSV);
+
+out:
+       return err;
+}
+
+static int handle_reg_mr_integrity(struct mlx5_ib_dev *dev,
+                                  struct mlx5_ib_qp *qp,
+                                  const struct ib_send_wr *wr,
+                                  struct mlx5_wqe_ctrl_seg **ctrl, void **seg,
+                                  int *size, void **cur_edge,
+                                  unsigned int *idx, int nreq, u8 fence,
+                                  u8 next_fence)
+{
+       struct mlx5_ib_mr *mr;
+       struct mlx5_ib_mr *pi_mr;
+       struct mlx5_ib_mr pa_pi_mr;
+       struct ib_sig_attrs *sig_attrs;
+       struct ib_reg_wr reg_pi_wr;
+       int err;
+
+       qp->sq.wr_data[*idx] = IB_WR_REG_MR_INTEGRITY;
+
+       mr = to_mmr(reg_wr(wr)->mr);
+       pi_mr = mr->pi_mr;
+
+       if (pi_mr) {
+               memset(&reg_pi_wr, 0,
+                      sizeof(struct ib_reg_wr));
+
+               reg_pi_wr.mr = &pi_mr->ibmr;
+               reg_pi_wr.access = reg_wr(wr)->access;
+               reg_pi_wr.key = pi_mr->ibmr.rkey;
+
+               (*ctrl)->imm = cpu_to_be32(reg_pi_wr.key);
+               /* UMR for data + prot registration */
+               err = set_reg_wr(qp, &reg_pi_wr, seg, size, cur_edge, false);
+               if (unlikely(err))
+                       goto out;
+
+               finish_wqe(qp, *ctrl, *seg, *size, *cur_edge, *idx, wr->wr_id,
+                          nreq, fence, MLX5_OPCODE_UMR);
+
+               err = begin_wqe(qp, seg, ctrl, wr, idx, size, cur_edge, nreq);
+               if (unlikely(err)) {
+                       mlx5_ib_warn(dev, "\n");
+                       err = -ENOMEM;
+                       goto out;
+               }
+       } else {
+               memset(&pa_pi_mr, 0, sizeof(struct mlx5_ib_mr));
+               /* No UMR, use local_dma_lkey */
+               pa_pi_mr.ibmr.lkey = mr->ibmr.pd->local_dma_lkey;
+               pa_pi_mr.ndescs = mr->ndescs;
+               pa_pi_mr.data_length = mr->data_length;
+               pa_pi_mr.data_iova = mr->data_iova;
+               if (mr->meta_ndescs) {
+                       pa_pi_mr.meta_ndescs = mr->meta_ndescs;
+                       pa_pi_mr.meta_length = mr->meta_length;
+                       pa_pi_mr.pi_iova = mr->pi_iova;
+               }
+
+               pa_pi_mr.ibmr.length = mr->ibmr.length;
+               mr->pi_mr = &pa_pi_mr;
+       }
+       (*ctrl)->imm = cpu_to_be32(mr->ibmr.rkey);
+       /* UMR for sig MR */
+       err = set_pi_umr_wr(wr, qp, seg, size, cur_edge);
+       if (unlikely(err)) {
+               mlx5_ib_warn(dev, "\n");
+               goto out;
+       }
+       finish_wqe(qp, *ctrl, *seg, *size, *cur_edge, *idx, wr->wr_id, nreq,
+                  fence, MLX5_OPCODE_UMR);
+
+       sig_attrs = mr->ibmr.sig_attrs;
+       err = handle_psv(dev, qp, wr, ctrl, seg, size, cur_edge, idx, nreq,
+                        &sig_attrs->mem, mr->sig->psv_memory.psv_idx,
+                        next_fence);
+       if (unlikely(err))
+               goto out;
+
+       err = handle_psv(dev, qp, wr, ctrl, seg, size, cur_edge, idx, nreq,
+                        &sig_attrs->wire, mr->sig->psv_wire.psv_idx,
+                        next_fence);
+       if (unlikely(err))
+               goto out;
+
+       qp->next_fence = MLX5_FENCE_MODE_INITIATOR_SMALL;
+
+out:
+       return err;
+}
+
+static int handle_qpt_rc(struct mlx5_ib_dev *dev, struct mlx5_ib_qp *qp,
+                        const struct ib_send_wr *wr,
+                        struct mlx5_wqe_ctrl_seg **ctrl, void **seg, int *size,
+                        void **cur_edge, unsigned int *idx, int nreq, u8 fence,
+                        u8 next_fence, int *num_sge)
+{
+       int err = 0;
+
+       switch (wr->opcode) {
+       case IB_WR_RDMA_READ:
+       case IB_WR_RDMA_WRITE:
+       case IB_WR_RDMA_WRITE_WITH_IMM:
+               handle_rdma_op(wr, seg, size);
+               break;
+
+       case IB_WR_ATOMIC_CMP_AND_SWP:
+       case IB_WR_ATOMIC_FETCH_AND_ADD:
+       case IB_WR_MASKED_ATOMIC_CMP_AND_SWP:
+               mlx5_ib_warn(dev, "Atomic operations are not supported yet\n");
+               err = -EOPNOTSUPP;
+               goto out;
+
+       case IB_WR_LOCAL_INV:
+               handle_local_inv(qp, wr, ctrl, seg, size, cur_edge, *idx);
+               *num_sge = 0;
+               break;
+
+       case IB_WR_REG_MR:
+               err = handle_reg_mr(qp, wr, ctrl, seg, size, cur_edge, *idx);
+               if (unlikely(err))
+                       goto out;
+               *num_sge = 0;
+               break;
+
+       case IB_WR_REG_MR_INTEGRITY:
+               err = handle_reg_mr_integrity(dev, qp, wr, ctrl, seg, size,
+                                             cur_edge, idx, nreq, fence,
+                                             next_fence);
+               if (unlikely(err))
+                       goto out;
+               *num_sge = 0;
+               break;
+
+       default:
+               break;
+       }
+
+out:
+       return err;
+}
+
+static void handle_qpt_uc(const struct ib_send_wr *wr, void **seg, int *size)
+{
+       switch (wr->opcode) {
+       case IB_WR_RDMA_WRITE:
+       case IB_WR_RDMA_WRITE_WITH_IMM:
+               handle_rdma_op(wr, seg, size);
+               break;
+       default:
+               break;
+       }
+}
+
+static void handle_qpt_hw_gsi(struct mlx5_ib_qp *qp,
+                             const struct ib_send_wr *wr, void **seg,
+                             int *size, void **cur_edge)
+{
+       set_datagram_seg(*seg, wr);
+       *seg += sizeof(struct mlx5_wqe_datagram_seg);
+       *size += sizeof(struct mlx5_wqe_datagram_seg) / 16;
+       handle_post_send_edge(&qp->sq, seg, *size, cur_edge);
+}
+
+static void handle_qpt_ud(struct mlx5_ib_qp *qp, const struct ib_send_wr *wr,
+                         void **seg, int *size, void **cur_edge)
+{
+       set_datagram_seg(*seg, wr);
+       *seg += sizeof(struct mlx5_wqe_datagram_seg);
+       *size += sizeof(struct mlx5_wqe_datagram_seg) / 16;
+       handle_post_send_edge(&qp->sq, seg, *size, cur_edge);
+
+       /* handle QPs that support UD LSO offload */
+       if (qp->flags & IB_QP_CREATE_IPOIB_UD_LSO) {
+               struct mlx5_wqe_eth_pad *pad;
+
+               pad = *seg;
+               memset(pad, 0, sizeof(struct mlx5_wqe_eth_pad));
+               *seg += sizeof(struct mlx5_wqe_eth_pad);
+               *size += sizeof(struct mlx5_wqe_eth_pad) / 16;
+               set_eth_seg(wr, qp, seg, size, cur_edge);
+               handle_post_send_edge(&qp->sq, seg, *size, cur_edge);
+       }
+}
+
+static int handle_qpt_reg_umr(struct mlx5_ib_dev *dev, struct mlx5_ib_qp *qp,
+                             const struct ib_send_wr *wr,
+                             struct mlx5_wqe_ctrl_seg **ctrl, void **seg,
+                             int *size, void **cur_edge, unsigned int idx)
+{
+       int err = 0;
+
+       if (unlikely(wr->opcode != MLX5_IB_WR_UMR)) {
+               err = -EINVAL;
+               mlx5_ib_warn(dev, "bad opcode %d\n", wr->opcode);
+               goto out;
+       }
+
+       qp->sq.wr_data[idx] = MLX5_IB_WR_UMR;
+       (*ctrl)->imm = cpu_to_be32(umr_wr(wr)->mkey);
+       err = set_reg_umr_segment(dev, *seg, wr,
+                                 !!(MLX5_CAP_GEN(dev->mdev, atomic)));
+       if (unlikely(err))
+               goto out;
+       *seg += sizeof(struct mlx5_wqe_umr_ctrl_seg);
+       *size += sizeof(struct mlx5_wqe_umr_ctrl_seg) / 16;
+       handle_post_send_edge(&qp->sq, seg, *size, cur_edge);
+       set_reg_mkey_segment(*seg, wr);
+       *seg += sizeof(struct mlx5_mkey_seg);
+       *size += sizeof(struct mlx5_mkey_seg) / 16;
+       handle_post_send_edge(&qp->sq, seg, *size, cur_edge);
+out:
+       return err;
+}
+
+int mlx5_ib_post_send(struct ib_qp *ibqp, const struct ib_send_wr *wr,
+                     const struct ib_send_wr **bad_wr, bool drain)
+{
+       struct mlx5_wqe_ctrl_seg *ctrl = NULL;  /* compiler warning */
+       struct mlx5_ib_dev *dev = to_mdev(ibqp->device);
+       struct mlx5_core_dev *mdev = dev->mdev;
+       struct mlx5_ib_qp *qp;
+       struct mlx5_wqe_xrc_seg *xrc;
+       struct mlx5_bf *bf;
+       void *cur_edge;
+       int uninitialized_var(size);
+       unsigned long flags;
+       unsigned int idx;
+       int err = 0;
+       int num_sge;
+       void *seg;
+       int nreq;
+       int i;
+       u8 next_fence = 0;
+       u8 fence;
+
+       if (unlikely(mdev->state == MLX5_DEVICE_STATE_INTERNAL_ERROR &&
+                    !drain)) {
+               *bad_wr = wr;
+               return -EIO;
+       }
+
+       if (unlikely(ibqp->qp_type == IB_QPT_GSI))
+               return mlx5_ib_gsi_post_send(ibqp, wr, bad_wr);
+
+       qp = to_mqp(ibqp);
+       bf = &qp->bf;
+
+       spin_lock_irqsave(&qp->sq.lock, flags);
+
+       for (nreq = 0; wr; nreq++, wr = wr->next) {
+               if (unlikely(wr->opcode >= ARRAY_SIZE(mlx5_ib_opcode))) {
+                       mlx5_ib_warn(dev, "\n");
+                       err = -EINVAL;
+                       *bad_wr = wr;
+                       goto out;
+               }
+
+               num_sge = wr->num_sge;
+               if (unlikely(num_sge > qp->sq.max_gs)) {
+                       mlx5_ib_warn(dev, "\n");
+                       err = -EINVAL;
+                       *bad_wr = wr;
+                       goto out;
+               }
+
+               err = begin_wqe(qp, &seg, &ctrl, wr, &idx, &size, &cur_edge,
+                               nreq);
+               if (err) {
+                       mlx5_ib_warn(dev, "\n");
+                       err = -ENOMEM;
+                       *bad_wr = wr;
+                       goto out;
+               }
+
+               if (wr->opcode == IB_WR_REG_MR ||
+                   wr->opcode == IB_WR_REG_MR_INTEGRITY) {
+                       fence = dev->umr_fence;
+                       next_fence = MLX5_FENCE_MODE_INITIATOR_SMALL;
+               } else  {
+                       if (wr->send_flags & IB_SEND_FENCE) {
+                               if (qp->next_fence)
+                                       fence = MLX5_FENCE_MODE_SMALL_AND_FENCE;
+                               else
+                                       fence = MLX5_FENCE_MODE_FENCE;
+                       } else {
+                               fence = qp->next_fence;
+                       }
+               }
+
+               switch (ibqp->qp_type) {
+               case IB_QPT_XRC_INI:
+                       xrc = seg;
+                       seg += sizeof(*xrc);
+                       size += sizeof(*xrc) / 16;
+                       fallthrough;
+               case IB_QPT_RC:
+                       err = handle_qpt_rc(dev, qp, wr, &ctrl, &seg, &size,
+                                           &cur_edge, &idx, nreq, fence,
+                                           next_fence, &num_sge);
+                       if (unlikely(err)) {
+                               *bad_wr = wr;
+                               goto out;
+                       } else if (wr->opcode == IB_WR_REG_MR_INTEGRITY) {
+                               goto skip_psv;
+                       }
+                       break;
+
+               case IB_QPT_UC:
+                       handle_qpt_uc(wr, &seg, &size);
+                       break;
+               case IB_QPT_SMI:
+                       if (unlikely(!mdev->port_caps[qp->port - 1].has_smi)) {
+                               mlx5_ib_warn(dev, "Send SMP MADs is not allowed\n");
+                               err = -EPERM;
+                               *bad_wr = wr;
+                               goto out;
+                       }
+                       fallthrough;
+               case MLX5_IB_QPT_HW_GSI:
+                       handle_qpt_hw_gsi(qp, wr, &seg, &size, &cur_edge);
+                       break;
+               case IB_QPT_UD:
+                       handle_qpt_ud(qp, wr, &seg, &size, &cur_edge);
+                       break;
+               case MLX5_IB_QPT_REG_UMR:
+                       err = handle_qpt_reg_umr(dev, qp, wr, &ctrl, &seg,
+                                                      &size, &cur_edge, idx);
+                       if (unlikely(err))
+                               goto out;
+                       break;
+
+               default:
+                       break;
+               }
+
+               if (wr->send_flags & IB_SEND_INLINE && num_sge) {
+                       err = set_data_inl_seg(qp, wr, &seg, &size, &cur_edge);
+                       if (unlikely(err)) {
+                               mlx5_ib_warn(dev, "\n");
+                               *bad_wr = wr;
+                               goto out;
+                       }
+               } else {
+                       for (i = 0; i < num_sge; i++) {
+                               handle_post_send_edge(&qp->sq, &seg, size,
+                                                     &cur_edge);
+                               if (unlikely(!wr->sg_list[i].length))
+                                       continue;
+
+                               set_data_ptr_seg(
+                                       (struct mlx5_wqe_data_seg *)seg,
+                                       wr->sg_list + i);
+                               size += sizeof(struct mlx5_wqe_data_seg) / 16;
+                               seg += sizeof(struct mlx5_wqe_data_seg);
+                       }
+               }
+
+               qp->next_fence = next_fence;
+               finish_wqe(qp, ctrl, seg, size, cur_edge, idx, wr->wr_id, nreq,
+                          fence, mlx5_ib_opcode[wr->opcode]);
+skip_psv:
+               if (0)
+                       dump_wqe(qp, idx, size);
+       }
+
+out:
+       if (likely(nreq)) {
+               qp->sq.head += nreq;
+
+               /* Make sure that descriptors are written before
+                * updating doorbell record and ringing the doorbell
+                */
+               wmb();
+
+               qp->db.db[MLX5_SND_DBR] = cpu_to_be32(qp->sq.cur_post);
+
+               /* Make sure doorbell record is visible to the HCA before
+                * we hit doorbell.
+                */
+               wmb();
+
+               mlx5_write64((__be32 *)ctrl, bf->bfreg->map + bf->offset);
+               /* Make sure doorbells don't leak out of SQ spinlock
+                * and reach the HCA out of order.
+                */
+               bf->offset ^= bf->buf_size;
+       }
+
+       spin_unlock_irqrestore(&qp->sq.lock, flags);
+
+       return err;
+}
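
The final bf->offset ^= bf->buf_size alternates writes between the two BlueFlame half-buffers so consecutive doorbells never target the same half. A tiny demonstration of the toggle, with an illustrative buffer size:

#include <stdio.h>

int main(void)
{
        unsigned int buf_size = 256; /* illustrative BF half-buffer size */
        unsigned int offset = 0;
        int i;

        for (i = 0; i < 4; i++) {
                printf("post %d writes at offset %u\n", i, offset);
                offset ^= buf_size; /* 0 -> 256 -> 0 -> 256 */
        }
        return 0;
}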
+
+static void set_sig_seg(struct mlx5_rwqe_sig *sig, int max_gs)
+{
+       sig->signature = calc_sig(sig, (max_gs + 1) << 2);
+}
+
+int mlx5_ib_post_recv(struct ib_qp *ibqp, const struct ib_recv_wr *wr,
+                     const struct ib_recv_wr **bad_wr, bool drain)
+{
+       struct mlx5_ib_qp *qp = to_mqp(ibqp);
+       struct mlx5_wqe_data_seg *scat;
+       struct mlx5_rwqe_sig *sig;
+       struct mlx5_ib_dev *dev = to_mdev(ibqp->device);
+       struct mlx5_core_dev *mdev = dev->mdev;
+       unsigned long flags;
+       int err = 0;
+       int nreq;
+       int ind;
+       int i;
+
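+       /* Only the drain flow may post WRs while the device is in an
+        * internal error state.
+        */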
+       if (unlikely(mdev->state == MLX5_DEVICE_STATE_INTERNAL_ERROR &&
+                    !drain)) {
+               *bad_wr = wr;
+               return -EIO;
+       }
+
+       if (unlikely(ibqp->qp_type == IB_QPT_GSI))
+               return mlx5_ib_gsi_post_recv(ibqp, wr, bad_wr);
+
+       spin_lock_irqsave(&qp->rq.lock, flags);
+
+       ind = qp->rq.head & (qp->rq.wqe_cnt - 1);
+
+       for (nreq = 0; wr; nreq++, wr = wr->next) {
+               if (mlx5_wq_overflow(&qp->rq, nreq, qp->ibqp.recv_cq)) {
+                       err = -ENOMEM;
+                       *bad_wr = wr;
+                       goto out;
+               }
+
+               if (unlikely(wr->num_sge > qp->rq.max_gs)) {
+                       err = -EINVAL;
+                       *bad_wr = wr;
+                       goto out;
+               }
+
+               scat = mlx5_frag_buf_get_wqe(&qp->rq.fbc, ind);
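+               /* With MLX5_QP_FLAG_SIGNATURE, the data segments start
+                * one 16-byte slot into the RWQE.
+                */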
+               if (qp->flags_en & MLX5_QP_FLAG_SIGNATURE)
+                       scat++;
+
+               for (i = 0; i < wr->num_sge; i++)
+                       set_data_ptr_seg(scat + i, wr->sg_list + i);
+
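+               /* Close a short scatter list with a zero-length entry
+                * carrying the invalid lkey.
+                */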
+               if (i < qp->rq.max_gs) {
+                       scat[i].byte_count = 0;
+                       scat[i].lkey       = cpu_to_be32(MLX5_INVALID_LKEY);
+                       scat[i].addr       = 0;
+               }
+
+               if (qp->flags_en & MLX5_QP_FLAG_SIGNATURE) {
+                       sig = (struct mlx5_rwqe_sig *)scat;
+                       set_sig_seg(sig, qp->rq.max_gs);
+               }
+
+               qp->rq.wrid[ind] = wr->wr_id;
+
+               ind = (ind + 1) & (qp->rq.wqe_cnt - 1);
+       }
+
+out:
+       if (likely(nreq)) {
+               qp->rq.head += nreq;
+
+               /* Make sure that descriptors are written before
+                * doorbell record.
+                */
+               wmb();
+
+               *qp->db.db = cpu_to_be32(qp->rq.head & 0xffff);
+       }
+
+       spin_unlock_irqrestore(&qp->rq.lock, flags);
+
+       return err;
+}
diff --git a/drivers/infiniband/hw/mlx5/wr.h b/drivers/infiniband/hw/mlx5/wr.h
new file mode 100644 (file)
index 0000000..4f00575
--- /dev/null
@@ -0,0 +1,76 @@
+/* SPDX-License-Identifier: GPL-2.0 OR Linux-OpenIB */
+/*
+ * Copyright (c) 2020, Mellanox Technologies inc. All rights reserved.
+ */
+
+#ifndef _MLX5_IB_WR_H
+#define _MLX5_IB_WR_H
+
+#include "mlx5_ib.h"
+
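+/* MRs with at most this many descriptors get their translation table
+ * inlined in the UMR WQE.
+ */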
+enum {
+       MLX5_IB_SQ_UMR_INLINE_THRESHOLD = 64,
+};
+
+struct mlx5_wqe_eth_pad {
+       u8 rsvd0[16];
+};
+
+/* get_sq_edge - Get the next nearby edge.
+ *
+ * An 'edge' is defined as the first address past the end of the
+ * fragment or the SQ. Accordingly, code that builds a WQE by
+ * repeatedly advancing a write pointer only has to check whether the
+ * pointer has reached an edge (see handle_post_send_edge() in wr.c
+ * for such a caller).
+ *
+ * @sq - SQ buffer.
+ * @idx - Stride index in the SQ buffer.
+ *
+ * Return:
+ *     The new edge.
+ */
+static inline void *get_sq_edge(struct mlx5_ib_wq *sq, u32 idx)
+{
+       void *fragment_end;
+
+       fragment_end = mlx5_frag_buf_get_wqe
+               (&sq->fbc,
+                mlx5_frag_buf_get_idx_last_contig_stride(&sq->fbc, idx));
+
+       return fragment_end + MLX5_SEND_WQE_BB;
+}
+
+int mlx5_ib_post_send(struct ib_qp *ibqp, const struct ib_send_wr *wr,
+                     const struct ib_send_wr **bad_wr, bool drain);
+int mlx5_ib_post_recv(struct ib_qp *ibqp, const struct ib_recv_wr *wr,
+                     const struct ib_recv_wr **bad_wr, bool drain);
+
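+/* The nodrain variants back the .post_send/.post_recv verbs; the drain
+ * variants are used by the SQ/RQ drain flow, which must still be able
+ * to post WRs when the device is in an internal error state.
+ */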
+static inline int mlx5_ib_post_send_nodrain(struct ib_qp *ibqp,
+                                           const struct ib_send_wr *wr,
+                                           const struct ib_send_wr **bad_wr)
+{
+       return mlx5_ib_post_send(ibqp, wr, bad_wr, false);
+}
+
+static inline int mlx5_ib_post_send_drain(struct ib_qp *ibqp,
+                                         const struct ib_send_wr *wr,
+                                         const struct ib_send_wr **bad_wr)
+{
+       return mlx5_ib_post_send(ibqp, wr, bad_wr, true);
+}
+
+static inline int mlx5_ib_post_recv_nodrain(struct ib_qp *ibqp,
+                                           const struct ib_recv_wr *wr,
+                                           const struct ib_recv_wr **bad_wr)
+{
+       return mlx5_ib_post_recv(ibqp, wr, bad_wr, false);
+}
+
+static inline int mlx5_ib_post_recv_drain(struct ib_qp *ibqp,
+                                         const struct ib_recv_wr *wr,
+                                         const struct ib_recv_wr **bad_wr)
+{
+       return mlx5_ib_post_recv(ibqp, wr, bad_wr, true);
+}
+#endif /* _MLX5_IB_WR_H */