RDMA/hns: Support direct wqe of userspace
The current write wqe mechanism is to write to DDR first, and then notify the hardware through doorbell to read the data. Direct wqe is a mechanism to fill wqe directly into the hardware. In the case of light load, the wqe will be filled into pcie bar space of the hardware, this will reduce one memory access operation and therefore reduce the latency. SIMD instructions allows cpu to write the 512 bits at one time to device memory, thus it can be used for posting direct wqe. Add direct wqe enable switch and address mapping. Link: https://lore.kernel.org/r/20211207124901.42123-2-liangwenpeng@huawei.com Signed-off-by: Yixing Liu <liuyixing1@huawei.com> Signed-off-by: Wenpeng Liang <liangwenpeng@huawei.com> Signed-off-by: Jason Gunthorpe <jgg@nvidia.com>
This commit is contained in:
parent
b1a4da64bf
commit
0045e0d3f4
6 changed files with 94 additions and 12 deletions
|
|
@ -77,10 +77,12 @@ enum hns_roce_qp_cap_flags {
|
|||
HNS_ROCE_QP_CAP_RQ_RECORD_DB = 1 << 0,
|
||||
HNS_ROCE_QP_CAP_SQ_RECORD_DB = 1 << 1,
|
||||
HNS_ROCE_QP_CAP_OWNER_DB = 1 << 2,
|
||||
HNS_ROCE_QP_CAP_DIRECT_WQE = 1 << 5,
|
||||
};
|
||||
|
||||
struct hns_roce_ib_create_qp_resp {
|
||||
__aligned_u64 cap_flags;
|
||||
__aligned_u64 dwqe_mmap_key;
|
||||
};
|
||||
|
||||
struct hns_roce_ib_alloc_ucontext_resp {
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue