RDMA/hns: Update the interfaces for MTT/CQE multi hop addressing in hip08
authorShaobo Xu <xushaobo2@huawei.com>
Wed, 30 Aug 2017 09:23:08 +0000 (17:23 +0800)
committerDoug Ledford <dledford@redhat.com>
Wed, 27 Sep 2017 12:34:56 +0000 (08:34 -0400)
The MTT(SQWQE/SGE/RQWQE) and CQE in hip08 can support multi hop
addressing. The address of MTT/CQE can be retrieved by the BT
(Base Address Table) with multi hop addressing.

This patch is to update the interfaces in HEM to support multi hop
addressing for the MTT/CQE.

Signed-off-by: Shaobo Xu <xushaobo2@huawei.com>
Signed-off-by: Lijun Ou <oulijun@huawei.com>
Signed-off-by: Wei Hu (Xavier) <xavier.huwei@huawei.com>
Signed-off-by: Doug Ledford <dledford@redhat.com>
drivers/infiniband/hw/hns/hns_roce_cq.c
drivers/infiniband/hw/hns/hns_roce_device.h
drivers/infiniband/hw/hns/hns_roce_hem.c
drivers/infiniband/hw/hns/hns_roce_hem.h
drivers/infiniband/hw/hns/hns_roce_hw_v1.c
drivers/infiniband/hw/hns/hns_roce_hw_v2.c
drivers/infiniband/hw/hns/hns_roce_hw_v2.h
drivers/infiniband/hw/hns/hns_roce_mr.c

index 5f512429f6347fe2bba2472c218c5bb539011d4a..362aeecc1a0865353f6d15ac8a20f712dd46f9bc 100644 (file)
@@ -85,17 +85,19 @@ static int hns_roce_cq_alloc(struct hns_roce_dev *hr_dev, int nent,
                             struct hns_roce_uar *hr_uar,
                             struct hns_roce_cq *hr_cq, int vector)
 {
-       struct hns_roce_cmd_mailbox *mailbox = NULL;
-       struct hns_roce_cq_table *cq_table = NULL;
+       struct hns_roce_cmd_mailbox *mailbox;
+       struct hns_roce_hem_table *mtt_table;
+       struct hns_roce_cq_table *cq_table;
        struct device *dev = hr_dev->dev;
        dma_addr_t dma_handle;
-       u64 *mtts = NULL;
-       int ret = 0;
+       u64 *mtts;
+       int ret;
 
        cq_table = &hr_dev->cq_table;
 
        /* Get the physical address of cq buf */
-       mtts = hns_roce_table_find(&hr_dev->mr_table.mtt_table,
+       mtt_table = &hr_dev->mr_table.mtt_table;
+       mtts = hns_roce_table_find(hr_dev, mtt_table,
                                   hr_mtt->first_seg, &dma_handle);
        if (!mtts) {
                dev_err(dev, "CQ alloc.Failed to find cq buf addr.\n");
index 4574a7bb8c7fd4735144d42f429d5fd6edbb7192..7dd8fbb2b9f206ccf1c1d38b28b582afc8f77618 100644 (file)
@@ -525,6 +525,12 @@ struct hns_roce_caps {
        u32             mpt_ba_pg_sz;
        u32             mpt_buf_pg_sz;
        u32             mpt_hop_num;
+       u32             mtt_ba_pg_sz;
+       u32             mtt_buf_pg_sz;
+       u32             mtt_hop_num;
+       u32             cqe_ba_pg_sz;
+       u32             cqe_buf_pg_sz;
+       u32             cqe_hop_num;
 };
 
 struct hns_roce_hw {
index 9bc8c6bd301d73d7baf9c709b822e7b6dc62a5ae..ac2d671ed2f9addf65531c9126e537afb560520c 100644 (file)
@@ -47,7 +47,9 @@ bool hns_roce_check_whether_mhop(struct hns_roce_dev *hr_dev, u32 type)
        if ((hr_dev->caps.qpc_hop_num && type == HEM_TYPE_QPC) ||
            (hr_dev->caps.mpt_hop_num && type == HEM_TYPE_MTPT) ||
            (hr_dev->caps.cqc_hop_num && type == HEM_TYPE_CQC) ||
-           (hr_dev->caps.srqc_hop_num && type == HEM_TYPE_SRQC))
+           (hr_dev->caps.srqc_hop_num && type == HEM_TYPE_SRQC) ||
+           (hr_dev->caps.cqe_hop_num && type == HEM_TYPE_CQE) ||
+           (hr_dev->caps.mtt_hop_num && type == HEM_TYPE_MTT))
                return true;
 
        return false;
@@ -132,6 +134,22 @@ int hns_roce_calc_hem_mhop(struct hns_roce_dev *hr_dev,
                mhop->ba_l0_num = hr_dev->caps.srqc_bt_num;
                mhop->hop_num = hr_dev->caps.srqc_hop_num;
                break;
+       case HEM_TYPE_MTT:
+               mhop->buf_chunk_size = 1 << (hr_dev->caps.mtt_buf_pg_sz
+                                            + PAGE_SHIFT);
+               mhop->bt_chunk_size = 1 << (hr_dev->caps.mtt_ba_pg_sz
+                                            + PAGE_SHIFT);
+               mhop->ba_l0_num = mhop->bt_chunk_size / 8;
+               mhop->hop_num = hr_dev->caps.mtt_hop_num;
+               break;
+       case HEM_TYPE_CQE:
+               mhop->buf_chunk_size = 1 << (hr_dev->caps.cqe_buf_pg_sz
+                                            + PAGE_SHIFT);
+               mhop->bt_chunk_size = 1 << (hr_dev->caps.cqe_ba_pg_sz
+                                            + PAGE_SHIFT);
+               mhop->ba_l0_num = mhop->bt_chunk_size / 8;
+               mhop->hop_num = hr_dev->caps.cqe_hop_num;
+               break;
        default:
                dev_err(dev, "Table %d not support multi-hop addressing!\n",
                         table->type);
@@ -141,10 +159,14 @@ int hns_roce_calc_hem_mhop(struct hns_roce_dev *hr_dev,
        if (!obj)
                return 0;
 
-       /* QPC/MTPT/CQC/SRQC alloc hem for buffer pages. */
+       /*
+        * QPC/MTPT/CQC/SRQC alloc hem for buffer pages.
+        * MTT/CQE alloc hem for bt pages.
+        */
        bt_num = hns_roce_get_bt_num(table->type, mhop->hop_num);
        chunk_ba_num = mhop->bt_chunk_size / 8;
-       chunk_size = mhop->buf_chunk_size;
+       chunk_size = table->type < HEM_TYPE_MTT ? mhop->buf_chunk_size :
+                             mhop->bt_chunk_size;
        table_idx = (*obj & (table->num_obj - 1)) /
                     (chunk_size / table->obj_size);
        switch (bt_num) {
@@ -448,8 +470,11 @@ int hns_roce_table_mhop_get(struct hns_roce_dev *hr_dev,
                }
        }
 
-       /* alloc buffer space chunk for QPC/MTPT/CQC/SRQC. */
-       size = buf_chunk_size;
+       /*
+        * alloc buffer space chunk for QPC/MTPT/CQC/SRQC.
+        * alloc bt space chunk for MTT/CQE.
+        */
+       size = table->type < HEM_TYPE_MTT ? buf_chunk_size : bt_chunk_size;
        table->hem[hem_idx] = hns_roce_alloc_hem(hr_dev,
                                                size >> PAGE_SHIFT,
                                                size,
@@ -480,6 +505,8 @@ int hns_roce_table_mhop_get(struct hns_roce_dev *hr_dev,
                        dev_err(dev, "set HEM base address to HW failed!\n");
                        goto err_alloc_hem_buf;
                }
+       } else if (hop_num == 2) {
+               *(table->bt_l0[bt_l0_idx] + mhop.l1_idx) = bt_ba;
        }
 
        ++table->hem[hem_idx]->refcount;
@@ -610,7 +637,10 @@ void hns_roce_table_mhop_put(struct hns_roce_dev *hr_dev,
                        dev_warn(dev, "Clear HEM base address failed.\n");
        }
 
-       /* free buffer space chunk for QPC/MTPT/CQC/SRQC. */
+       /*
+        * free buffer space chunk for QPC/MTPT/CQC/SRQC.
+        * free bt space chunk for MTT/CQE.
+        */
        hns_roce_free_hem(hr_dev, table->hem[hem_idx]);
        table->hem[hem_idx] = NULL;
 
@@ -686,23 +716,46 @@ void hns_roce_table_put(struct hns_roce_dev *hr_dev,
        mutex_unlock(&table->mutex);
 }
 
-void *hns_roce_table_find(struct hns_roce_hem_table *table, unsigned long obj,
-                         dma_addr_t *dma_handle)
+void *hns_roce_table_find(struct hns_roce_dev *hr_dev,
+                         struct hns_roce_hem_table *table,
+                         unsigned long obj, dma_addr_t *dma_handle)
 {
        struct hns_roce_hem_chunk *chunk;
-       unsigned long idx;
-       int i;
-       int offset, dma_offset;
+       struct hns_roce_hem_mhop mhop;
        struct hns_roce_hem *hem;
        struct page *page = NULL;
+       unsigned long mhop_obj = obj;
+       unsigned long idx;
+       int offset, dma_offset;
+       int i, j;
+       u32 hem_idx = 0;
 
        if (!table->lowmem)
                return NULL;
 
        mutex_lock(&table->mutex);
-       idx = (obj & (table->num_obj - 1)) * table->obj_size;
-       hem = table->hem[idx / HNS_ROCE_TABLE_CHUNK_SIZE];
-       dma_offset = offset = idx % HNS_ROCE_TABLE_CHUNK_SIZE;
+
+       if (!hns_roce_check_whether_mhop(hr_dev, table->type)) {
+               idx = (obj & (table->num_obj - 1)) * table->obj_size;
+               hem = table->hem[idx / HNS_ROCE_TABLE_CHUNK_SIZE];
+               dma_offset = offset = idx % HNS_ROCE_TABLE_CHUNK_SIZE;
+       } else {
+               hns_roce_calc_hem_mhop(hr_dev, table, &mhop_obj, &mhop);
+               /* mtt mhop */
+               i = mhop.l0_idx;
+               j = mhop.l1_idx;
+               if (mhop.hop_num == 2)
+                       hem_idx = i * (mhop.bt_chunk_size / 8) + j;
+               else if (mhop.hop_num == 1 ||
+                        mhop.hop_num == HNS_ROCE_HOP_NUM_0)
+                       hem_idx = i;
+
+               hem = table->hem[hem_idx];
+               dma_offset = offset = (obj & (table->num_obj - 1)) *
+                                      table->obj_size % mhop.bt_chunk_size;
+               if (mhop.hop_num == 2)
+                       dma_offset = offset = 0;
+       }
 
        if (!hem)
                goto out;
@@ -735,9 +788,15 @@ int hns_roce_table_get_range(struct hns_roce_dev *hr_dev,
                             struct hns_roce_hem_table *table,
                             unsigned long start, unsigned long end)
 {
+       struct hns_roce_hem_mhop mhop;
        unsigned long inc = HNS_ROCE_TABLE_CHUNK_SIZE / table->obj_size;
-       unsigned long i = 0;
-       int ret = 0;
+       unsigned long i;
+       int ret;
+
+       if (hns_roce_check_whether_mhop(hr_dev, table->type)) {
+               hns_roce_calc_hem_mhop(hr_dev, table, NULL, &mhop);
+               inc = mhop.bt_chunk_size / table->obj_size;
+       }
 
        /* Allocate MTT entry memory according to chunk(128K) */
        for (i = start; i <= end; i += inc) {
@@ -760,10 +819,17 @@ void hns_roce_table_put_range(struct hns_roce_dev *hr_dev,
                              struct hns_roce_hem_table *table,
                              unsigned long start, unsigned long end)
 {
+       struct hns_roce_hem_mhop mhop;
+       unsigned long inc = HNS_ROCE_TABLE_CHUNK_SIZE / table->obj_size;
        unsigned long i;
 
+       if (hns_roce_check_whether_mhop(hr_dev, table->type)) {
+               hns_roce_calc_hem_mhop(hr_dev, table, NULL, &mhop);
+               inc = mhop.bt_chunk_size / table->obj_size;
+       }
+
        for (i = start; i <= end;
-               i += HNS_ROCE_TABLE_CHUNK_SIZE / table->obj_size)
+               i += inc)
                hns_roce_table_put(hr_dev, table, i);
 }
 
@@ -787,7 +853,7 @@ int hns_roce_init_hem_table(struct hns_roce_dev *hr_dev,
                unsigned long buf_chunk_size;
                unsigned long bt_chunk_size;
                unsigned long bt_chunk_num;
-               unsigned long num_bt_l0;
+               unsigned long num_bt_l0 = 0;
                u32 hop_num;
 
                switch (type) {
@@ -823,6 +889,18 @@ int hns_roce_init_hem_table(struct hns_roce_dev *hr_dev,
                        num_bt_l0 = hr_dev->caps.srqc_bt_num;
                        hop_num = hr_dev->caps.srqc_hop_num;
                        break;
+               case HEM_TYPE_MTT:
+                       buf_chunk_size = 1 << (hr_dev->caps.mtt_ba_pg_sz
+                                       + PAGE_SHIFT);
+                       bt_chunk_size = buf_chunk_size;
+                       hop_num = hr_dev->caps.mtt_hop_num;
+                       break;
+               case HEM_TYPE_CQE:
+                       buf_chunk_size = 1 << (hr_dev->caps.cqe_ba_pg_sz
+                                       + PAGE_SHIFT);
+                       bt_chunk_size = buf_chunk_size;
+                       hop_num = hr_dev->caps.cqe_hop_num;
+                       break;
                default:
                        dev_err(dev,
                          "Table %d not support to init hem table here!\n",
@@ -832,6 +910,8 @@ int hns_roce_init_hem_table(struct hns_roce_dev *hr_dev,
                obj_per_chunk = buf_chunk_size / obj_size;
                num_hem = (nobj + obj_per_chunk - 1) / obj_per_chunk;
                bt_chunk_num = bt_chunk_size / 8;
+               if (table->type >= HEM_TYPE_MTT)
+                       num_bt_l0 = bt_chunk_num;
 
                table->hem = kcalloc(num_hem, sizeof(*table->hem),
                                         GFP_KERNEL);
@@ -910,7 +990,8 @@ void hns_roce_cleanup_mhop_hem_table(struct hns_roce_dev *hr_dev,
        u64 obj;
 
        hns_roce_calc_hem_mhop(hr_dev, table, NULL, &mhop);
-       buf_chunk_size = mhop.buf_chunk_size;
+       buf_chunk_size = table->type < HEM_TYPE_MTT ? mhop.buf_chunk_size :
+                                       mhop.bt_chunk_size;
 
        for (i = 0; i < table->num_hem; ++i) {
                obj = i * buf_chunk_size / table->obj_size;
index b064ef5fad0850381152b7174cb0eae5447f153f..1aa54b6d583e69628405855366d81a7364e862c6 100644 (file)
@@ -47,6 +47,7 @@ enum {
 
         /* UNMAP HEM */
        HEM_TYPE_MTT,
+       HEM_TYPE_CQE,
        HEM_TYPE_IRRL,
 };
 
@@ -58,10 +59,13 @@ enum {
        (type < HEM_TYPE_MTT && hop_num == 2)
 
 #define check_whether_bt_num_2(type, hop_num) \
-       (type < HEM_TYPE_MTT && hop_num == 1)
+       ((type < HEM_TYPE_MTT && hop_num == 1) || \
+       (type >= HEM_TYPE_MTT && hop_num == 2))
 
 #define check_whether_bt_num_1(type, hop_num) \
-       (type < HEM_TYPE_MTT && hop_num == HNS_ROCE_HOP_NUM_0)
+       ((type < HEM_TYPE_MTT && hop_num == HNS_ROCE_HOP_NUM_0) || \
+       (type >= HEM_TYPE_MTT && hop_num == 1) || \
+       (type >= HEM_TYPE_MTT && hop_num == HNS_ROCE_HOP_NUM_0))
 
 enum {
         HNS_ROCE_HEM_PAGE_SHIFT = 12,
@@ -101,7 +105,8 @@ int hns_roce_table_get(struct hns_roce_dev *hr_dev,
                       struct hns_roce_hem_table *table, unsigned long obj);
 void hns_roce_table_put(struct hns_roce_dev *hr_dev,
                        struct hns_roce_hem_table *table, unsigned long obj);
-void *hns_roce_table_find(struct hns_roce_hem_table *table, unsigned long obj,
+void *hns_roce_table_find(struct hns_roce_dev *hr_dev,
+                         struct hns_roce_hem_table *table, unsigned long obj,
                          dma_addr_t *dma_handle);
 int hns_roce_table_get_range(struct hns_roce_dev *hr_dev,
                             struct hns_roce_hem_table *table,
index 50dee130737eb63bb80e0fa2370d2a489a838ff4..0a634c58dfcb8b829d8644a918765f5b2fe13374 100644 (file)
@@ -2524,7 +2524,7 @@ static int hns_roce_v1_m_sqp(struct ib_qp *ibqp, const struct ib_qp_attr *attr,
                return -ENOMEM;
 
        /* Search QP buf's MTTs */
-       mtts = hns_roce_table_find(&hr_dev->mr_table.mtt_table,
+       mtts = hns_roce_table_find(hr_dev, &hr_dev->mr_table.mtt_table,
                                   hr_qp->mtt.first_seg, &dma_handle);
        if (!mtts) {
                dev_err(dev, "qp buf pa find failed\n");
@@ -2671,7 +2671,7 @@ static int hns_roce_v1_m_qp(struct ib_qp *ibqp, const struct ib_qp_attr *attr,
                return -ENOMEM;
 
        /* Search qp buf's mtts */
-       mtts = hns_roce_table_find(&hr_dev->mr_table.mtt_table,
+       mtts = hns_roce_table_find(hr_dev, &hr_dev->mr_table.mtt_table,
                                   hr_qp->mtt.first_seg, &dma_handle);
        if (mtts == NULL) {
                dev_err(dev, "qp buf pa find failed\n");
@@ -2679,8 +2679,8 @@ static int hns_roce_v1_m_qp(struct ib_qp *ibqp, const struct ib_qp_attr *attr,
        }
 
        /* Search IRRL's mtts */
-       mtts_2 = hns_roce_table_find(&hr_dev->qp_table.irrl_table, hr_qp->qpn,
-                                    &dma_handle_2);
+       mtts_2 = hns_roce_table_find(hr_dev, &hr_dev->qp_table.irrl_table,
+                                    hr_qp->qpn, &dma_handle_2);
        if (mtts_2 == NULL) {
                dev_err(dev, "qp irrl_table find failed\n");
                goto out;
index 77cf476d609618b37c9d3eebbd5a84db4a4efe62..c59d15ec6d5e6ae82db16db7c926f300958c0882 100644 (file)
@@ -613,6 +613,12 @@ static int hns_roce_v2_profile(struct hns_roce_dev *hr_dev)
        caps->mpt_ba_pg_sz      = 0;
        caps->mpt_buf_pg_sz     = 0;
        caps->mpt_hop_num       = HNS_ROCE_CONTEXT_HOP_NUM;
+       caps->mtt_ba_pg_sz      = 0;
+       caps->mtt_buf_pg_sz     = 0;
+       caps->mtt_hop_num       = HNS_ROCE_MTT_HOP_NUM;
+       caps->cqe_ba_pg_sz      = 0;
+       caps->cqe_buf_pg_sz     = 0;
+       caps->cqe_hop_num       = HNS_ROCE_CQE_HOP_NUM;
 
        caps->pkey_table_len[0] = 1;
        caps->gid_table_len[0] = 2;
index cc8c8d05d6992bc00459d0d4e7644c6b99233006..212d51135f9dc0ba1ce73c7a0befb1ded22c43ea 100644 (file)
@@ -74,6 +74,7 @@
 
 #define HNS_ROCE_CONTEXT_HOP_NUM               1
 #define HNS_ROCE_MTT_HOP_NUM                   1
+#define HNS_ROCE_CQE_HOP_NUM                   1
 
 #define HNS_ROCE_CMD_FLAG_IN_VALID_SHIFT       0
 #define HNS_ROCE_CMD_FLAG_OUT_VALID_SHIFT      1
index 923d2b40e9c566fedb097ba3d0f00f18f5ce319e..d8f7b41148d1843a2a1ecfd2e6c284b353e4dd1a 100644 (file)
@@ -348,10 +348,11 @@ static int hns_roce_write_mtt_chunk(struct hns_roce_dev *hr_dev,
                                    struct hns_roce_mtt *mtt, u32 start_index,
                                    u32 npages, u64 *page_list)
 {
-       u32 i = 0;
-       __le64 *mtts = NULL;
+       struct hns_roce_hem_table *table;
        dma_addr_t dma_handle;
+       __le64 *mtts;
        u32 s = start_index * sizeof(u64);
+       u32 i;
 
        /* All MTTs must fit in the same page */
        if (start_index / (PAGE_SIZE / sizeof(u64)) !=
@@ -361,15 +362,20 @@ static int hns_roce_write_mtt_chunk(struct hns_roce_dev *hr_dev,
        if (start_index & (HNS_ROCE_MTT_ENTRY_PER_SEG - 1))
                return -EINVAL;
 
-       mtts = hns_roce_table_find(&hr_dev->mr_table.mtt_table,
+       table = &hr_dev->mr_table.mtt_table;
+       mtts = hns_roce_table_find(hr_dev, table,
                                mtt->first_seg + s / hr_dev->caps.mtt_entry_sz,
                                &dma_handle);
        if (!mtts)
                return -ENOMEM;
 
        /* Save page addr, low 12 bits : 0 */
-       for (i = 0; i < npages; ++i)
-               mtts[i] = (cpu_to_le64(page_list[i])) >> PAGE_ADDR_SHIFT;
+       for (i = 0; i < npages; ++i) {
+               if (!hr_dev->caps.mtt_hop_num)
+                       mtts[i] = cpu_to_le64(page_list[i] >> PAGE_ADDR_SHIFT);
+               else
+                       mtts[i] = cpu_to_le64(page_list[i]);
+       }
 
        return 0;
 }