git: 9207f9d206a4 - main - bnxt_re: User library support for RoCE driver

From: Sumit Saxena <ssaxena_at_FreeBSD.org>
Date: Tue, 09 Jul 2024 11:10:43 UTC
The branch main has been updated by ssaxena:

URL: https://cgit.FreeBSD.org/src/commit/?id=9207f9d206a4017001f01ca27d3d25a26c268a95

commit 9207f9d206a4017001f01ca27d3d25a26c268a95
Author:     Chandrakanth patil <chandrakanth.patil@broadcom.com>
AuthorDate: 2024-07-05 07:53:46 +0000
Commit:     Sumit Saxena <ssaxena@FreeBSD.org>
CommitDate: 2024-07-09 11:08:36 +0000

    bnxt_re: User library support for RoCE driver
    
    This patch introduces userspace library support for the bnxt_re RoCE driver.
    The library can be linked with RDMA applications such as perftest and rping.
    The RoCE traffic has been tested with the rping and perftest utility.
    
    Reviewed by:            imp, kib, sumit.saxena@broadcom.com
    Approved by:            imp
    Differential revision:  https://reviews.freebsd.org/D45729
---
 contrib/ofed/libbnxtre/abi.h     |  542 ++++++++
 contrib/ofed/libbnxtre/db.c      |  566 +++++++++
 contrib/ofed/libbnxtre/list.h    |  122 ++
 contrib/ofed/libbnxtre/main.c    |  383 ++++++
 contrib/ofed/libbnxtre/main.h    |  538 ++++++++
 contrib/ofed/libbnxtre/memory.c  |   96 ++
 contrib/ofed/libbnxtre/memory.h  |  166 +++
 contrib/ofed/libbnxtre/verbs.c   | 2557 ++++++++++++++++++++++++++++++++++++++
 contrib/ofed/libbnxtre/verbs.h   |  184 +++
 contrib/ofed/libbnxtre/version.h |   45 +
 lib/ofed/libbnxtre/Makefile      |   14 +
 11 files changed, 5213 insertions(+)

diff --git a/contrib/ofed/libbnxtre/abi.h b/contrib/ofed/libbnxtre/abi.h
new file mode 100644
index 000000000000..390605edb40b
--- /dev/null
+++ b/contrib/ofed/libbnxtre/abi.h
@@ -0,0 +1,542 @@
+/*
+ * Copyright (c) 2024, Broadcom. All rights reserved.  The term
+ * Broadcom refers to Broadcom Limited and/or its subsidiaries.
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ *
+ * 1. Redistributions of source code must retain the above copyright
+ *    notice, this list of conditions and the following disclaimer.
+ * 2. Redistributions in binary form must reproduce the above copyright
+ *    notice, this list of conditions and the following disclaimer in
+ *    the documentation and/or other materials provided with the
+ *    distribution.
+ *
+ * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS''
+ * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO,
+ * THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
+ * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS
+ * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+ * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+ * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
+ * BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+ * WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
+ * OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
+ * IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+ */
+
+#ifndef __BNXT_RE_ABI_H__
+#define __BNXT_RE_ABI_H__
+
+#include <sys/types.h>
+#include <sys/mman.h>
+#include <sys/stat.h>
+
+#include <infiniband/kern-abi.h>
+
+#include <errno.h>
+#include <fcntl.h>
+#include <limits.h>
+#include <pthread.h>
+#include <stdio.h>
+#include <stdlib.h>
+#include <string.h>
+#include <unistd.h>
+
+#define __aligned_u64 __attribute__((aligned(8))) u64
+
+#define BNXT_RE_ABI_VERSION	6
+#define BNXT_RE_MAX_INLINE_SIZE		0x60
+#define BNXT_RE_MAX_INLINE_SIZE_VAR_WQE	0x1E0
+#define BNXT_RE_MAX_PUSH_SIZE_VAR_WQE	0xD0
+#define BNXT_RE_FULL_FLAG_DELTA	0x00
+
+enum bnxt_re_wr_opcode {
+	BNXT_RE_WR_OPCD_SEND		= 0x00,
+	BNXT_RE_WR_OPCD_SEND_IMM	= 0x01,
+	BNXT_RE_WR_OPCD_SEND_INVAL	= 0x02,
+	BNXT_RE_WR_OPCD_RDMA_WRITE	= 0x04,
+	BNXT_RE_WR_OPCD_RDMA_WRITE_IMM	= 0x05,
+	BNXT_RE_WR_OPCD_RDMA_READ	= 0x06,
+	BNXT_RE_WR_OPCD_ATOMIC_CS	= 0x08,
+	BNXT_RE_WR_OPCD_ATOMIC_FA	= 0x0B,
+	BNXT_RE_WR_OPCD_LOC_INVAL	= 0x0C,
+	BNXT_RE_WR_OPCD_BIND		= 0x0E,
+	BNXT_RE_WR_OPCD_RECV		= 0x80,
+	BNXT_RE_WR_OPCD_INVAL		= 0xFF
+};
+
+enum bnxt_re_wr_flags {
+	BNXT_RE_WR_FLAGS_INLINE		= 0x10,
+	BNXT_RE_WR_FLAGS_SE		= 0x08,
+	BNXT_RE_WR_FLAGS_UC_FENCE	= 0x04,
+	BNXT_RE_WR_FLAGS_RD_FENCE	= 0x02,
+	BNXT_RE_WR_FLAGS_SIGNALED	= 0x01
+};
+
+#define BNXT_RE_MEMW_TYPE_2		0x02
+#define BNXT_RE_MEMW_TYPE_1		0x00
+enum bnxt_re_wr_bind_acc {
+	BNXT_RE_WR_BIND_ACC_LWR		= 0x01,
+	BNXT_RE_WR_BIND_ACC_RRD		= 0x02,
+	BNXT_RE_WR_BIND_ACC_RWR		= 0x04,
+	BNXT_RE_WR_BIND_ACC_RAT		= 0x08,
+	BNXT_RE_WR_BIND_ACC_MWB		= 0x10,
+	BNXT_RE_WR_BIND_ACC_ZBVA	= 0x01,
+	BNXT_RE_WR_BIND_ACC_SHIFT	= 0x10
+};
+
+enum bnxt_re_wc_type {
+	BNXT_RE_WC_TYPE_SEND		= 0x00,
+	BNXT_RE_WC_TYPE_RECV_RC		= 0x01,
+	BNXT_RE_WC_TYPE_RECV_UD		= 0x02,
+	BNXT_RE_WC_TYPE_RECV_RAW	= 0x03,
+	BNXT_RE_WC_TYPE_TERM		= 0x0E,
+	BNXT_RE_WC_TYPE_COFF		= 0x0F
+};
+
+#define	BNXT_RE_WC_OPCD_RECV		0x80
+enum bnxt_re_req_wc_status {
+	BNXT_RE_REQ_ST_OK		= 0x00,
+	BNXT_RE_REQ_ST_BAD_RESP		= 0x01,
+	BNXT_RE_REQ_ST_LOC_LEN		= 0x02,
+	BNXT_RE_REQ_ST_LOC_QP_OP	= 0x03,
+	BNXT_RE_REQ_ST_PROT		= 0x04,
+	BNXT_RE_REQ_ST_MEM_OP		= 0x05,
+	BNXT_RE_REQ_ST_REM_INVAL	= 0x06,
+	BNXT_RE_REQ_ST_REM_ACC		= 0x07,
+	BNXT_RE_REQ_ST_REM_OP		= 0x08,
+	BNXT_RE_REQ_ST_RNR_NAK_XCED	= 0x09,
+	BNXT_RE_REQ_ST_TRNSP_XCED	= 0x0A,
+	BNXT_RE_REQ_ST_WR_FLUSH		= 0x0B
+};
+
+enum bnxt_re_rsp_wc_status {
+	BNXT_RE_RSP_ST_OK		= 0x00,
+	BNXT_RE_RSP_ST_LOC_ACC		= 0x01,
+	BNXT_RE_RSP_ST_LOC_LEN		= 0x02,
+	BNXT_RE_RSP_ST_LOC_PROT		= 0x03,
+	BNXT_RE_RSP_ST_LOC_QP_OP	= 0x04,
+	BNXT_RE_RSP_ST_MEM_OP		= 0x05,
+	BNXT_RE_RSP_ST_REM_INVAL	= 0x06,
+	BNXT_RE_RSP_ST_WR_FLUSH		= 0x07,
+	BNXT_RE_RSP_ST_HW_FLUSH		= 0x08
+};
+
+enum bnxt_re_hdr_offset {
+	BNXT_RE_HDR_WT_MASK		= 0xFF,
+	BNXT_RE_HDR_FLAGS_MASK		= 0xFF,
+	BNXT_RE_HDR_FLAGS_SHIFT		= 0x08,
+	BNXT_RE_HDR_WS_MASK		= 0xFF,
+	BNXT_RE_HDR_WS_SHIFT		= 0x10
+};
+
+enum bnxt_re_db_que_type {
+	BNXT_RE_QUE_TYPE_SQ		= 0x00,
+	BNXT_RE_QUE_TYPE_RQ		= 0x01,
+	BNXT_RE_QUE_TYPE_SRQ		= 0x02,
+	BNXT_RE_QUE_TYPE_SRQ_ARM	= 0x03,
+	BNXT_RE_QUE_TYPE_CQ		= 0x04,
+	BNXT_RE_QUE_TYPE_CQ_ARMSE	= 0x05,
+	BNXT_RE_QUE_TYPE_CQ_ARMALL	= 0x06,
+	BNXT_RE_QUE_TYPE_CQ_ARMENA	= 0x07,
+	BNXT_RE_QUE_TYPE_SRQ_ARMENA	= 0x08,
+	BNXT_RE_QUE_TYPE_CQ_CUT_ACK	= 0x09,
+	BNXT_RE_PUSH_TYPE_START		= 0x0C,
+	BNXT_RE_PUSH_TYPE_END		= 0x0D,
+	BNXT_RE_QUE_TYPE_NULL		= 0x0F
+};
+
+enum bnxt_re_db_mask {
+	BNXT_RE_DB_INDX_MASK		= 0xFFFFFFUL,
+	BNXT_RE_DB_PILO_MASK		= 0x0FFUL,
+	BNXT_RE_DB_PILO_SHIFT		= 0x18,
+	BNXT_RE_DB_QID_MASK		= 0xFFFFFUL,
+	BNXT_RE_DB_PIHI_MASK		= 0xF00UL,
+	BNXT_RE_DB_PIHI_SHIFT		= 0x0C, /* Because mask is 0xF00 */
+	BNXT_RE_DB_TYP_MASK		= 0x0FUL,
+	BNXT_RE_DB_TYP_SHIFT		= 0x1C,
+	BNXT_RE_DB_VALID_SHIFT		= 0x1A,
+	BNXT_RE_DB_EPOCH_SHIFT		= 0x18,
+	BNXT_RE_DB_TOGGLE_SHIFT		= 0x19,
+
+};
+
+enum bnxt_re_psns_mask {
+	BNXT_RE_PSNS_SPSN_MASK		= 0xFFFFFF,
+	BNXT_RE_PSNS_OPCD_MASK		= 0xFF,
+	BNXT_RE_PSNS_OPCD_SHIFT		= 0x18,
+	BNXT_RE_PSNS_NPSN_MASK		= 0xFFFFFF,
+	BNXT_RE_PSNS_FLAGS_MASK		= 0xFF,
+	BNXT_RE_PSNS_FLAGS_SHIFT	= 0x18
+};
+
+enum bnxt_re_msns_mask {
+	BNXT_RE_SQ_MSN_SEARCH_START_PSN_MASK	= 0xFFFFFFUL,
+	BNXT_RE_SQ_MSN_SEARCH_START_PSN_SHIFT	= 0,
+	BNXT_RE_SQ_MSN_SEARCH_NEXT_PSN_MASK	= 0xFFFFFF000000ULL,
+	BNXT_RE_SQ_MSN_SEARCH_NEXT_PSN_SHIFT	= 0x18,
+	BNXT_RE_SQ_MSN_SEARCH_START_IDX_MASK	= 0xFFFF000000000000ULL,
+	BNXT_RE_SQ_MSN_SEARCH_START_IDX_SHIFT	= 0x30
+};
+
+enum bnxt_re_bcqe_mask {
+	BNXT_RE_BCQE_PH_MASK		= 0x01,
+	BNXT_RE_BCQE_TYPE_MASK		= 0x0F,
+	BNXT_RE_BCQE_TYPE_SHIFT		= 0x01,
+	BNXT_RE_BCQE_STATUS_MASK	= 0xFF,
+	BNXT_RE_BCQE_STATUS_SHIFT	= 0x08,
+	BNXT_RE_BCQE_FLAGS_MASK		= 0xFFFFU,
+	BNXT_RE_BCQE_FLAGS_SHIFT	= 0x10,
+	BNXT_RE_BCQE_RWRID_MASK		= 0xFFFFFU,
+	BNXT_RE_BCQE_SRCQP_MASK		= 0xFF,
+	BNXT_RE_BCQE_SRCQP_SHIFT	= 0x18
+};
+
+enum bnxt_re_rc_flags_mask {
+	BNXT_RE_RC_FLAGS_SRQ_RQ_MASK	= 0x01,
+	BNXT_RE_RC_FLAGS_IMM_MASK	= 0x02,
+	BNXT_RE_RC_FLAGS_IMM_SHIFT	= 0x01,
+	BNXT_RE_RC_FLAGS_INV_MASK	= 0x04,
+	BNXT_RE_RC_FLAGS_INV_SHIFT	= 0x02,
+	BNXT_RE_RC_FLAGS_RDMA_MASK	= 0x08,
+	BNXT_RE_RC_FLAGS_RDMA_SHIFT	= 0x03
+};
+
+enum bnxt_re_ud_flags_mask {
+	BNXT_RE_UD_FLAGS_SRQ_RQ_MASK	= 0x01,
+	BNXT_RE_UD_FLAGS_SRQ_RQ_SFT	= 0x00,
+	BNXT_RE_UD_FLAGS_IMM_MASK	= 0x02,
+	BNXT_RE_UD_FLAGS_IMM_SFT	= 0x01,
+	BNXT_RE_UD_FLAGS_IP_VER_MASK	= 0x30,
+	BNXT_RE_UD_FLAGS_IP_VER_SFT	= 0x4,
+	BNXT_RE_UD_FLAGS_META_MASK	= 0x3C0,
+	BNXT_RE_UD_FLAGS_META_SFT	= 0x6,
+	BNXT_RE_UD_FLAGS_EXT_META_MASK	= 0xC00,
+	BNXT_RE_UD_FLAGS_EXT_META_SFT	= 0x10,
+};
+
+enum bnxt_re_ud_cqe_mask {
+	BNXT_RE_UD_CQE_MAC_MASK		= 0xFFFFFFFFFFFFULL,
+	BNXT_RE_UD_CQE_SRCQPLO_MASK	= 0xFFFF,
+	BNXT_RE_UD_CQE_SRCQPLO_SHIFT	= 0x30,
+	BNXT_RE_UD_CQE_LEN_MASK		= 0x3FFFU
+};
+
+enum bnxt_re_shpg_offt {
+	BNXT_RE_SHPG_BEG_RESV_OFFT	= 0x00,
+	BNXT_RE_SHPG_AVID_OFFT		= 0x10,
+	BNXT_RE_SHPG_AVID_SIZE		= 0x04,
+	BNXT_RE_SHPG_END_RESV_OFFT	= 0xFF0
+};
+
+enum bnxt_re_que_flags_mask {
+	BNXT_RE_FLAG_EPOCH_TAIL_SHIFT	= 0x0UL,
+	BNXT_RE_FLAG_EPOCH_HEAD_SHIFT	= 0x1UL,
+	BNXT_RE_FLAG_EPOCH_TAIL_MASK	= 0x1UL,
+	BNXT_RE_FLAG_EPOCH_HEAD_MASK	= 0x2UL,
+};
+
+enum bnxt_re_db_epoch_flag_shift {
+	BNXT_RE_DB_EPOCH_TAIL_SHIFT	= BNXT_RE_DB_EPOCH_SHIFT,
+	BNXT_RE_DB_EPOCH_HEAD_SHIFT	= (BNXT_RE_DB_EPOCH_SHIFT - 1)
+};
+
+enum bnxt_re_ppp_st_en_mask {
+	BNXT_RE_PPP_ENABLED_MASK	= 0x1UL,
+	BNXT_RE_PPP_STATE_MASK		= 0x2UL,
+};
+
+enum bnxt_re_ppp_st_shift {
+	BNXT_RE_PPP_ST_SHIFT		= 0x1UL
+};
+
+struct bnxt_re_db_hdr {
+	__u64 typ_qid_indx; /* typ: 4, qid:20, indx:24 */
+};
+
+#define BNXT_RE_CHIP_ID0_CHIP_NUM_SFT		0x00
+#define BNXT_RE_CHIP_ID0_CHIP_REV_SFT		0x10
+#define BNXT_RE_CHIP_ID0_CHIP_MET_SFT		0x18
+
+enum {
+	BNXT_RE_COMP_MASK_UCNTX_WC_DPI_ENABLED = 0x01,
+	BNXT_RE_COMP_MASK_UCNTX_POW2_DISABLED = 0x02,
+	BNXT_RE_COMP_MASK_UCNTX_RSVD_WQE_DISABLED = 0x04,
+	BNXT_RE_COMP_MASK_UCNTX_MQP_EX_SUPPORTED = 0x8,
+	BNXT_RE_COMP_MASK_UCNTX_DBR_PACING_ENABLED = 0x10,
+	BNXT_RE_COMP_MASK_UCNTX_DBR_RECOVERY_ENABLED = 0x20,
+	BNXT_RE_COMP_MASK_UCNTX_HW_RETX_ENABLED = 0x40
+};
+
+enum bnxt_re_req_to_drv {
+	BNXT_RE_COMP_MASK_REQ_UCNTX_POW2_SUPPORT = 0x01,
+	BNXT_RE_COMP_MASK_REQ_UCNTX_RSVD_WQE = 0x02
+};
+
+#define BNXT_RE_WQE_MODES_WQE_MODE_MASK		0x01
+/* bit wise modes can be extended here. */
+enum bnxt_re_modes {
+	BNXT_RE_WQE_MODE_STATIC =	0x00,
+	BNXT_RE_WQE_MODE_VARIABLE =	0x01
+	/* Other modes can be here */
+};
+
+struct bnxt_re_cntx_req {
+	struct ibv_get_context cmd;
+	__aligned_u64 comp_mask;
+};
+
+struct bnxt_re_cntx_resp {
+	struct ibv_get_context_resp resp;
+	__u32 dev_id;
+	__u32 max_qp; /* To allocate qp-table */
+	__u32 pg_size;
+	__u32 cqe_size;
+	__u32 max_cqd;
+	__u32 chip_id0;
+	__u32 chip_id1;
+	__u32 modes;
+	__aligned_u64 comp_mask;
+} __attribute__((packed));
+
+enum {
+	BNXT_RE_COMP_MASK_PD_HAS_WC_DPI = 0x01,
+	BNXT_RE_COMP_MASK_PD_HAS_DBR_BAR_ADDR = 0x02,
+};
+
+struct bnxt_re_pd_resp {
+	struct ibv_alloc_pd_resp resp;
+	__u32 pdid;
+	__u32 dpi;
+	__u64 dbr;
+	__u64 comp_mask;
+	__u32 wcdpi;
+	__u64 dbr_bar_map;
+} __attribute__((packed));
+
+struct bnxt_re_mr_resp {
+	struct ibv_reg_mr_resp resp;
+} __attribute__((packed));
+
+/* CQ */
+enum {
+	BNXT_RE_COMP_MASK_CQ_HAS_DB_INFO = 0x01,
+	BNXT_RE_COMP_MASK_CQ_HAS_WC_DPI = 0x02,
+	BNXT_RE_COMP_MASK_CQ_HAS_CQ_PAGE = 0x04
+};
+
+enum {
+	BNXT_RE_COMP_MASK_CQ_REQ_HAS_CAP_MASK = 0x1
+};
+
+enum {
+	BNXT_RE_COMP_MASK_CQ_REQ_CAP_DBR_RECOVERY = 0x1
+};
+
+struct bnxt_re_cq_req {
+	struct ibv_create_cq cmd;
+	__u64 cq_va;
+	__u64 cq_handle;
+	__aligned_u64 comp_mask;
+	__u16 cq_capab;
+} __attribute__((packed));
+
+struct bnxt_re_cq_resp {
+	struct ibv_create_cq_resp resp;
+	__u32 cqid;
+	__u32 tail;
+	__u32 phase;
+	__u32 rsvd;
+	__aligned_u64 comp_mask;
+	__u32 dpi;
+	__u64 dbr;
+	__u32 wcdpi;
+	__u64 cq_page;
+} __attribute__((packed));
+
+struct bnxt_re_resize_cq_req {
+	struct ibv_resize_cq cmd;
+	__u64   cq_va;
+} __attribute__((packed));
+
+struct bnxt_re_bcqe {
+	__u32 flg_st_typ_ph;
+	__u32 qphi_rwrid;
+} __attribute__((packed));
+
+struct bnxt_re_req_cqe {
+	__u64 qp_handle;
+	__u32 con_indx; /* 16 bits valid. */
+	__u32 rsvd1;
+	__u64 rsvd2;
+} __attribute__((packed));
+
+struct bnxt_re_rc_cqe {
+	__u32 length;
+	__u32 imm_key;
+	__u64 qp_handle;
+	__u64 mr_handle;
+} __attribute__((packed));
+
+struct bnxt_re_ud_cqe {
+	__u32 length; /* 14 bits */
+	__u32 immd;
+	__u64 qp_handle;
+	__u64 qplo_mac; /* 16:48*/
+} __attribute__((packed));
+
+struct bnxt_re_term_cqe {
+	__u64 qp_handle;
+	__u32 rq_sq_cidx;
+	__u32 rsvd;
+	__u64 rsvd1;
+} __attribute__((packed));
+
+struct bnxt_re_cutoff_cqe {
+	__u64 rsvd1;
+	__u64 rsvd2;
+	__u64 rsvd3;
+	__u8 cqe_type_toggle;
+	__u8 status;
+	__u16 rsvd4;
+	__u32 rsvd5;
+} __attribute__((packed));
+
+/* QP */
+struct bnxt_re_qp_req {
+	struct ibv_create_qp cmd;
+	__u64 qpsva;
+	__u64 qprva;
+	__u64 qp_handle;
+} __attribute__((packed));
+
+struct bnxt_re_qp_resp {
+	struct	ibv_create_qp_resp resp;
+	__u32 qpid;
+} __attribute__((packed));
+
+enum bnxt_re_modify_ex_mask {
+	BNXT_RE_MQP_PPP_REQ_EN_MASK	= 0x1UL,
+	BNXT_RE_MQP_PPP_REQ_EN		= 0x1UL,
+	BNXT_RE_MQP_PATH_MTU_MASK	= 0x2UL,
+	BNXT_RE_MQP_PPP_IDX_MASK	= 0x7UL,
+	BNXT_RE_MQP_PPP_STATE		= 0x10UL
+};
+
+/* Modify QP */
+struct bnxt_re_modify_ex_req {
+	struct	ibv_modify_qp_ex cmd;
+	__aligned_u64 comp_mask;
+	__u32	dpi;
+	__u32	rsvd;
+};
+
+struct bnxt_re_modify_ex_resp {
+	struct	ibv_modify_qp_resp_ex resp;
+	__aligned_u64 comp_mask;
+	__u32 ppp_st_idx;
+	__u32 path_mtu;
+};
+
+union lower_shdr {
+	__u64 qkey_len;
+	__u64 lkey_plkey;
+	__u64 rva;
+};
+
+struct bnxt_re_bsqe {
+	__u32 rsv_ws_fl_wt;
+	__u32 key_immd;
+	union lower_shdr lhdr;
+} __attribute__((packed));
+
+struct bnxt_re_psns_ext {
+	__u32 opc_spsn;
+	__u32 flg_npsn;
+	__u16 st_slot_idx;
+	__u16 rsvd0;
+	__u32 rsvd1;
+} __attribute__((packed));
+
+/* sq_msn_search (size:64b/8B) */
+struct bnxt_re_msns {
+	__u64  start_idx_next_psn_start_psn;
+} __attribute__((packed));
+
+struct bnxt_re_psns {
+	__u32 opc_spsn;
+	__u32 flg_npsn;
+} __attribute__((packed));
+
+struct bnxt_re_sge {
+	__u64 pa;
+	__u32 lkey;
+	__u32 length;
+} __attribute__((packed));
+
+struct bnxt_re_send {
+	__u32 dst_qp;
+	__u32 avid;
+	__u64 rsvd;
+} __attribute__((packed));
+
+struct bnxt_re_raw {
+	__u32 cfa_meta;
+	__u32 rsvd2;
+	__u64 rsvd3;
+} __attribute__((packed));
+
+struct bnxt_re_rdma {
+	__u64 rva;
+	__u32 rkey;
+	__u32 rsvd2;
+} __attribute__((packed));
+
+struct bnxt_re_atomic {
+	__u64 swp_dt;
+	__u64 cmp_dt;
+} __attribute__((packed));
+
+struct bnxt_re_inval {
+	__u64 rsvd[2];
+} __attribute__((packed));
+
+struct bnxt_re_bind {
+	__u64 va;
+	__u64 len; /* only 40 bits are valid */
+} __attribute__((packed));
+
+struct bnxt_re_brqe {
+	__u32 rsv_ws_fl_wt;
+	__u32 rsvd;
+	__u32 wrid;
+	__u32 rsvd1;
+} __attribute__((packed));
+
+struct bnxt_re_rqe {
+	__u64 rsvd[2];
+} __attribute__((packed));
+
+/* SRQ */
+struct bnxt_re_srq_req {
+	struct ibv_create_srq cmd;
+	__u64 srqva;
+	__u64 srq_handle;
+} __attribute__((packed));
+
+struct bnxt_re_srq_resp {
+	struct ibv_create_srq_resp resp;
+	__u32 srqid;
+} __attribute__((packed));
+
+struct bnxt_re_srqe {
+	__u64 rsvd[2];
+} __attribute__((packed));
+
+struct bnxt_re_push_wqe {
+	__u64 addr[32];
+} __attribute__((packed));;
+
+#endif
diff --git a/contrib/ofed/libbnxtre/db.c b/contrib/ofed/libbnxtre/db.c
new file mode 100644
index 000000000000..8751297c9218
--- /dev/null
+++ b/contrib/ofed/libbnxtre/db.c
@@ -0,0 +1,566 @@
+/*
+ * Copyright (c) 2024, Broadcom. All rights reserved.  The term
+ * Broadcom refers to Broadcom Limited and/or its subsidiaries.
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ *
+ * 1. Redistributions of source code must retain the above copyright
+ *    notice, this list of conditions and the following disclaimer.
+ * 2. Redistributions in binary form must reproduce the above copyright
+ *    notice, this list of conditions and the following disclaimer in
+ *    the documentation and/or other materials provided with the
+ *    distribution.
+ *
+ * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS''
+ * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO,
+ * THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
+ * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS
+ * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+ * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+ * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
+ * BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+ * WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
+ * OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
+ * IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+ *
+ * Description: Doorbell handling functions.
+ */
+
+#include <malloc.h>
+#include <unistd.h>
+
+#include "abi.h"
+#include "main.h"
+
+#define BNXT_RE_DB_FIFO_ROOM_MASK_P5	0x1FFF8000
+#define BNXT_RE_MAX_FIFO_DEPTH_P5	0x2c00
+
+#define BNXT_RE_DB_FIFO_ROOM_MASK_P7	0x3FFF8000
+#define BNXT_RE_MAX_FIFO_DEPTH_P7	0x8000
+
+#define BNXT_RE_DB_FIFO_ROOM_SHIFT      15
+#define BNXT_RE_DB_THRESHOLD		20
+
+#define BNXT_RE_DB_FIFO_ROOM_MASK(ctx)	\
+	(_is_chip_thor2((ctx)) ? \
+	 BNXT_RE_DB_FIFO_ROOM_MASK_P7 :\
+	 BNXT_RE_DB_FIFO_ROOM_MASK_P5)
+#define BNXT_RE_MAX_FIFO_DEPTH(ctx)	\
+	(_is_chip_thor2((ctx)) ? \
+	 BNXT_RE_MAX_FIFO_DEPTH_P7 :\
+	 BNXT_RE_MAX_FIFO_DEPTH_P5)
+
+static uint32_t xorshift32(struct xorshift32_state *state)
+{
+	/* Algorithm "xor" from p. 4 of Marsaglia, "Xorshift RNGs" */
+	uint32_t x = state->seed;
+
+	x ^= x << 13;
+	x ^= x >> 17;
+	x ^= x << 5;
+	return state->seed = x;
+}
+
+static uint16_t rnd(struct xorshift32_state *state, uint16_t range)
+{
+	/* range must be a power of 2 - 1 */
+	return (xorshift32(state) & range);
+}
+
+static int calculate_fifo_occupancy(struct bnxt_re_context *cntx)
+{
+	uint32_t *dbr_map = cntx->bar_map + 0x1a8;
+	uint32_t read_val, fifo_occup;
+
+	read_val = *dbr_map;
+	fifo_occup = BNXT_RE_MAX_FIFO_DEPTH(cntx->cctx) -
+		((read_val & BNXT_RE_DB_FIFO_ROOM_MASK(cntx->cctx)) >>
+		 BNXT_RE_DB_FIFO_ROOM_SHIFT);
+
+	return fifo_occup;
+}
+
+static inline uint32_t find_min(uint32_t x, uint32_t y)
+{
+	return (y > x ? x : y);
+}
+
+int bnxt_re_do_pacing(struct bnxt_re_context *cntx, struct xorshift32_state *state)
+{
+	/* First 4 bytes  of shared page (pacing_info) contains the DBR
+	 * pacing information. Second 4 bytes (pacing_th)  contains
+	 * the pacing threshold value to determine whether to
+	 * add delay or not
+	 */
+	struct bnxt_re_pacing_data *pacing_data =
+		(struct bnxt_re_pacing_data *)cntx->dbr_page;
+	uint32_t wait_time = 1;
+	uint32_t fifo_occup;
+
+	if (!pacing_data)
+		return 0;
+	/* If the device in error recovery state, return error to
+	 * not to ring new doorbells in this state.
+	 */
+	if (pacing_data->dev_err_state)
+		return -EFAULT;
+
+	if (rnd(state, BNXT_RE_MAX_DO_PACING) < pacing_data->do_pacing) {
+		while ((fifo_occup = calculate_fifo_occupancy(cntx))
+			>  pacing_data->pacing_th) {
+			struct bnxt_re_cq *cq;
+			uint32_t usec_wait;
+
+			if (pacing_data->alarm_th && fifo_occup > pacing_data->alarm_th) {
+				cq = container_of(cntx->dbr_cq, struct bnxt_re_cq, ibvcq);
+				bnxt_re_poll_kernel_cq(cq);
+			}
+			usec_wait = rnd(state, wait_time - 1);
+			if (usec_wait)
+				bnxt_re_sub_sec_busy_wait(usec_wait * 1000);
+			/* wait time capped at 128 us */
+			wait_time = find_min(wait_time * 2, 128);
+		}
+	}
+	return 0;
+}
+
+static inline void bnxt_re_ring_db(struct bnxt_re_dpi *dpi, __u64 key,
+				   uint64_t *db_key, uint8_t *lock)
+{
+	while (1) {
+		if (__sync_bool_compare_and_swap(lock, 0, 1)) {
+			*db_key = key;
+			bnxt_re_wm_barrier();
+			iowrite64(dpi->dbpage, key);
+			bnxt_re_wm_barrier();
+			*lock = 0;
+			break;
+		}
+	}
+}
+
+static inline void bnxt_re_init_push_hdr(struct bnxt_re_db_hdr *hdr,
+					 uint32_t indx, uint32_t qid,
+					 uint32_t typ, uint32_t pidx)
+{
+	__u64 key_lo, key_hi;
+
+	key_lo = (((pidx & BNXT_RE_DB_PILO_MASK) << BNXT_RE_DB_PILO_SHIFT) |
+		  (indx & BNXT_RE_DB_INDX_MASK));
+	key_hi = ((((pidx & BNXT_RE_DB_PIHI_MASK) << BNXT_RE_DB_PIHI_SHIFT) |
+		   (qid & BNXT_RE_DB_QID_MASK)) |
+		  ((typ & BNXT_RE_DB_TYP_MASK) << BNXT_RE_DB_TYP_SHIFT) |
+		  (0x1UL << BNXT_RE_DB_VALID_SHIFT));
+	hdr->typ_qid_indx = htole64((key_lo | (key_hi << 32)));
+}
+
+static inline void bnxt_re_init_db_hdr(struct bnxt_re_db_hdr *hdr,
+				       uint32_t indx, uint32_t toggle,
+				       uint32_t qid, uint32_t typ)
+{
+	__u64 key_lo, key_hi;
+
+	key_lo = htole32(indx | toggle);
+	key_hi = ((qid & BNXT_RE_DB_QID_MASK) |
+		  ((typ & BNXT_RE_DB_TYP_MASK) << BNXT_RE_DB_TYP_SHIFT) |
+		  (0x1UL << BNXT_RE_DB_VALID_SHIFT));
+	hdr->typ_qid_indx = htole64((key_lo | (key_hi << 32)));
+}
+
+static inline void __bnxt_re_ring_pend_db(__u64 *ucdb, __u64 key,
+					  struct  bnxt_re_qp *qp)
+{
+	struct bnxt_re_db_hdr hdr;
+
+	bnxt_re_init_db_hdr(&hdr,
+			    (*qp->jsqq->hwque->dbtail |
+			     ((qp->jsqq->hwque->flags &
+			       BNXT_RE_FLAG_EPOCH_TAIL_MASK) <<
+			    BNXT_RE_DB_EPOCH_TAIL_SHIFT)), 0,
+			    qp->qpid,
+			    BNXT_RE_QUE_TYPE_SQ);
+
+	while (1) {
+		if (__sync_bool_compare_and_swap(&qp->sq_dbr_lock, 0, 1)) {
+			qp->sq_shadow_db_key = hdr.typ_qid_indx;
+			bnxt_re_wm_barrier();
+			iowrite64(ucdb, key);
+			bnxt_re_wm_barrier();
+			qp->sq_dbr_lock = 0;
+			break;
+		}
+	}
+}
+
+void bnxt_re_ring_rq_db(struct bnxt_re_qp *qp)
+{
+	struct bnxt_re_db_hdr hdr;
+
+	if (bnxt_re_do_pacing(qp->cntx, &qp->rand))
+		return;
+	bnxt_re_init_db_hdr(&hdr,
+			    (*qp->jrqq->hwque->dbtail |
+			     ((qp->jrqq->hwque->flags &
+			       BNXT_RE_FLAG_EPOCH_TAIL_MASK) <<
+			      BNXT_RE_DB_EPOCH_TAIL_SHIFT)), 0,
+			    qp->qpid,
+			    BNXT_RE_QUE_TYPE_RQ);
+	bnxt_re_ring_db(qp->udpi, hdr.typ_qid_indx, &qp->rq_shadow_db_key,
+			&qp->rq_dbr_lock);
+}
+
+void bnxt_re_ring_sq_db(struct bnxt_re_qp *qp)
+{
+	struct bnxt_re_db_hdr hdr;
+
+	if (bnxt_re_do_pacing(qp->cntx, &qp->rand))
+		return;
+	bnxt_re_init_db_hdr(&hdr,
+			    (*qp->jsqq->hwque->dbtail |
+			     ((qp->jsqq->hwque->flags &
+			       BNXT_RE_FLAG_EPOCH_TAIL_MASK) <<
+			     BNXT_RE_DB_EPOCH_TAIL_SHIFT)), 0,
+			    qp->qpid,
+			    BNXT_RE_QUE_TYPE_SQ);
+	bnxt_re_ring_db(qp->udpi, hdr.typ_qid_indx, &qp->sq_shadow_db_key,
+			&qp->sq_dbr_lock);
+}
+
+void bnxt_re_ring_srq_db(struct bnxt_re_srq *srq)
+{
+	struct bnxt_re_db_hdr hdr;
+
+	if (bnxt_re_do_pacing(srq->uctx, &srq->rand))
+		return;
+	bnxt_re_init_db_hdr(&hdr,
+			    (srq->srqq->tail |
+			     ((srq->srqq->flags &
+			       BNXT_RE_FLAG_EPOCH_TAIL_MASK) <<
+			     BNXT_RE_DB_EPOCH_TAIL_SHIFT)), 0,
+			    srq->srqid, BNXT_RE_QUE_TYPE_SRQ);
+	bnxt_re_ring_db(srq->udpi, hdr.typ_qid_indx, &srq->shadow_db_key,
+			&srq->dbr_lock);
+}
+
+void bnxt_re_ring_srq_arm(struct bnxt_re_srq *srq)
+{
+	struct bnxt_re_db_hdr hdr;
+
+	if (bnxt_re_do_pacing(srq->uctx, &srq->rand))
+		return;
+	bnxt_re_init_db_hdr(&hdr, srq->cap.srq_limit, 0, srq->srqid,
+			    BNXT_RE_QUE_TYPE_SRQ_ARM);
+	bnxt_re_ring_db(srq->udpi, hdr.typ_qid_indx, &srq->shadow_db_key,
+			&srq->dbr_lock);
+}
+
+void bnxt_re_ring_cq_db(struct bnxt_re_cq *cq)
+{
+	struct bnxt_re_db_hdr hdr;
+
+	if (bnxt_re_do_pacing(cq->cntx, &cq->rand))
+		return;
+	bnxt_re_init_db_hdr(&hdr,
+			    (cq->cqq->head |
+			     ((cq->cqq->flags &
+			       BNXT_RE_FLAG_EPOCH_HEAD_MASK) <<
+			     BNXT_RE_DB_EPOCH_HEAD_SHIFT)), 0,
+			    cq->cqid,
+			    BNXT_RE_QUE_TYPE_CQ);
+	bnxt_re_ring_db(cq->udpi, hdr.typ_qid_indx, &cq->shadow_db_key,
+			&cq->dbr_lock);
+}
+
+void bnxt_re_ring_cq_arm_db(struct bnxt_re_cq *cq, uint8_t aflag)
+{
+	uint32_t *cq_page = cq->cq_page;
+	struct bnxt_re_db_hdr hdr;
+	uint32_t toggle = 0;
+
+	if (cq_page)
+		toggle = *cq_page;
+
+	if (bnxt_re_do_pacing(cq->cntx, &cq->rand))
+		return;
+	bnxt_re_init_db_hdr(&hdr,
+			    (cq->cqq->head |
+			     ((cq->cqq->flags &
+			       BNXT_RE_FLAG_EPOCH_HEAD_MASK) <<
+			     BNXT_RE_DB_EPOCH_HEAD_SHIFT)),
+			     toggle << BNXT_RE_DB_TOGGLE_SHIFT,
+			    cq->cqid, aflag);
+	bnxt_re_ring_db(cq->udpi, hdr.typ_qid_indx, &cq->shadow_db_key,
+			&cq->dbr_lock);
+}
+
+void bnxt_re_ring_pstart_db(struct bnxt_re_qp *qp,
+			    struct bnxt_re_push_buffer *pbuf)
+{
+	__u64 key;
+
+	if (bnxt_re_do_pacing(qp->cntx, &qp->rand))
+		return;
+	key = ((((pbuf->wcdpi & BNXT_RE_DB_PIHI_MASK) <<
+		  BNXT_RE_DB_PIHI_SHIFT) | (pbuf->qpid & BNXT_RE_DB_QID_MASK)) |
+	       ((BNXT_RE_PUSH_TYPE_START & BNXT_RE_DB_TYP_MASK) <<
+		 BNXT_RE_DB_TYP_SHIFT) | (0x1UL << BNXT_RE_DB_VALID_SHIFT));
+	key <<= 32;
+	key |= ((((__u32)pbuf->wcdpi & BNXT_RE_DB_PILO_MASK) <<
+		  BNXT_RE_DB_PILO_SHIFT) | (pbuf->st_idx &
+					    BNXT_RE_DB_INDX_MASK));
+	bnxt_re_wm_barrier();
+	iowrite64(pbuf->ucdb, key);
+}
+
+void bnxt_re_ring_pend_db(struct bnxt_re_qp *qp,
+			  struct bnxt_re_push_buffer *pbuf)
+{
+	__u64 key;
+
+	if (bnxt_re_do_pacing(qp->cntx, &qp->rand))
+		return;
+	key = ((((pbuf->wcdpi & BNXT_RE_DB_PIHI_MASK) <<
+		  BNXT_RE_DB_PIHI_SHIFT) | (pbuf->qpid & BNXT_RE_DB_QID_MASK)) |
+	       ((BNXT_RE_PUSH_TYPE_END & BNXT_RE_DB_TYP_MASK) <<
+		 BNXT_RE_DB_TYP_SHIFT) | (0x1UL << BNXT_RE_DB_VALID_SHIFT));
+	key <<= 32;
+	key |= ((((__u32)pbuf->wcdpi & BNXT_RE_DB_PILO_MASK) <<
+		  BNXT_RE_DB_PILO_SHIFT) | (pbuf->tail &
+					    BNXT_RE_DB_INDX_MASK));
+	__bnxt_re_ring_pend_db(pbuf->ucdb, key, qp);
+}
+
+void bnxt_re_fill_ppp(struct bnxt_re_push_buffer *pbuf,
+		      struct bnxt_re_qp *qp, uint8_t len, uint32_t idx)
+{
+	struct bnxt_re_db_ppp_hdr phdr = {};
+	__u64 *dst, *src;
+	__u8 plen;
+	int indx;
+
+	src = (__u64 *)&phdr;
+	plen = len + sizeof(phdr) + bnxt_re_get_sqe_hdr_sz();
+
+	bnxt_re_init_db_hdr(&phdr.db_hdr,
+			    (*qp->jsqq->hwque->dbtail |
+			     ((qp->jsqq->hwque->flags &
+			       BNXT_RE_FLAG_EPOCH_TAIL_MASK) <<
+			     BNXT_RE_DB_EPOCH_TAIL_SHIFT)), 0,
+			    qp->qpid,
+			    BNXT_RE_QUE_TYPE_SQ);
+
+	phdr.rsv_psz_pidx = ((pbuf->st_idx & BNXT_RE_DB_INDX_MASK) |
+			     (((plen % 8 ? (plen / 8) + 1 :
+				plen / 8) & BNXT_RE_PUSH_SIZE_MASK) <<
+			       BNXT_RE_PUSH_SIZE_SHIFT));
+
+	bnxt_re_wm_barrier();
+	for (indx = 0; indx < 2; indx++) {
+		dst = (__u64 *)(pbuf->pbuf + indx);
+		iowrite64(dst, *src);
+		src++;
+	}
+	bnxt_re_copy_data_to_pb(pbuf, 1, idx);
+	mmio_flush_writes();
+}
+
+void bnxt_re_fill_push_wcb(struct bnxt_re_qp *qp,
+			   struct bnxt_re_push_buffer *pbuf, uint32_t idx)
+{
+	bnxt_re_ring_pstart_db(qp, pbuf);
+	mmio_wc_start();
+	bnxt_re_copy_data_to_pb(pbuf, 0, idx);
+	/* Flush WQE write before push end db. */
+	mmio_flush_writes();
+	bnxt_re_ring_pend_db(qp, pbuf);
+}
+
+int bnxt_re_init_pbuf_list(struct bnxt_re_context *ucntx)
+{
+	struct bnxt_re_push_buffer *pbuf;
+	int indx, wqesz;
+	int size, offt;
+	__u64 wcpage;
+	__u64 dbpage;
+	void *base;
+
+	size = (sizeof(*ucntx->pbrec) +
+		16 * (sizeof(*ucntx->pbrec->pbuf) +
+		      sizeof(struct bnxt_re_push_wqe)));
+	ucntx->pbrec = calloc(1, size);
+	if (!ucntx->pbrec)
+		goto out;
+
+	offt = sizeof(*ucntx->pbrec);
+	base = ucntx->pbrec;
+	ucntx->pbrec->pbuf = (base + offt);
*** 4326 LINES SKIPPED ***