git: 9207f9d206a4 - main - bnxt_re: User library support for RoCE driver
- Go to: [ bottom of page ] [ top of archives ] [ this month ]
Date: Tue, 09 Jul 2024 11:10:43 UTC
The branch main has been updated by ssaxena:
URL: https://cgit.FreeBSD.org/src/commit/?id=9207f9d206a4017001f01ca27d3d25a26c268a95
commit 9207f9d206a4017001f01ca27d3d25a26c268a95
Author: Chandrakanth patil <chandrakanth.patil@broadcom.com>
AuthorDate: 2024-07-05 07:53:46 +0000
Commit: Sumit Saxena <ssaxena@FreeBSD.org>
CommitDate: 2024-07-09 11:08:36 +0000
bnxt_re: User library support for RoCE driver
This patch introduces userspace library support for the bnxt_re RoCE driver.
The library can be linked with RDMA applications such as perftest and rping.
The RoCE traffic has been tested with the rping and perftest utility.
Reviewed by: imp, kib, sumit.saxena@broadcom.com
Approved by: imp
Differential revision: https://reviews.freebsd.org/D45729
---
contrib/ofed/libbnxtre/abi.h | 542 ++++++++
contrib/ofed/libbnxtre/db.c | 566 +++++++++
contrib/ofed/libbnxtre/list.h | 122 ++
contrib/ofed/libbnxtre/main.c | 383 ++++++
contrib/ofed/libbnxtre/main.h | 538 ++++++++
contrib/ofed/libbnxtre/memory.c | 96 ++
contrib/ofed/libbnxtre/memory.h | 166 +++
contrib/ofed/libbnxtre/verbs.c | 2557 ++++++++++++++++++++++++++++++++++++++
contrib/ofed/libbnxtre/verbs.h | 184 +++
contrib/ofed/libbnxtre/version.h | 45 +
lib/ofed/libbnxtre/Makefile | 14 +
11 files changed, 5213 insertions(+)
diff --git a/contrib/ofed/libbnxtre/abi.h b/contrib/ofed/libbnxtre/abi.h
new file mode 100644
index 000000000000..390605edb40b
--- /dev/null
+++ b/contrib/ofed/libbnxtre/abi.h
@@ -0,0 +1,542 @@
+/*
+ * Copyright (c) 2024, Broadcom. All rights reserved. The term
+ * Broadcom refers to Broadcom Limited and/or its subsidiaries.
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ *
+ * 1. Redistributions of source code must retain the above copyright
+ * notice, this list of conditions and the following disclaimer.
+ * 2. Redistributions in binary form must reproduce the above copyright
+ * notice, this list of conditions and the following disclaimer in
+ * the documentation and/or other materials provided with the
+ * distribution.
+ *
+ * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS''
+ * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO,
+ * THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
+ * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS
+ * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+ * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+ * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
+ * BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+ * WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
+ * OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
+ * IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+ */
+
+#ifndef __BNXT_RE_ABI_H__
+#define __BNXT_RE_ABI_H__
+
+#include <sys/types.h>
+#include <sys/mman.h>
+#include <sys/stat.h>
+
+#include <infiniband/kern-abi.h>
+
+#include <errno.h>
+#include <fcntl.h>
+#include <limits.h>
+#include <pthread.h>
+#include <stdio.h>
+#include <stdlib.h>
+#include <string.h>
+#include <unistd.h>
+
+#define __aligned_u64 __attribute__((aligned(8))) u64
+
+#define BNXT_RE_ABI_VERSION 6
+#define BNXT_RE_MAX_INLINE_SIZE 0x60
+#define BNXT_RE_MAX_INLINE_SIZE_VAR_WQE 0x1E0
+#define BNXT_RE_MAX_PUSH_SIZE_VAR_WQE 0xD0
+#define BNXT_RE_FULL_FLAG_DELTA 0x00
+
+enum bnxt_re_wr_opcode {
+ BNXT_RE_WR_OPCD_SEND = 0x00,
+ BNXT_RE_WR_OPCD_SEND_IMM = 0x01,
+ BNXT_RE_WR_OPCD_SEND_INVAL = 0x02,
+ BNXT_RE_WR_OPCD_RDMA_WRITE = 0x04,
+ BNXT_RE_WR_OPCD_RDMA_WRITE_IMM = 0x05,
+ BNXT_RE_WR_OPCD_RDMA_READ = 0x06,
+ BNXT_RE_WR_OPCD_ATOMIC_CS = 0x08,
+ BNXT_RE_WR_OPCD_ATOMIC_FA = 0x0B,
+ BNXT_RE_WR_OPCD_LOC_INVAL = 0x0C,
+ BNXT_RE_WR_OPCD_BIND = 0x0E,
+ BNXT_RE_WR_OPCD_RECV = 0x80,
+ BNXT_RE_WR_OPCD_INVAL = 0xFF
+};
+
+enum bnxt_re_wr_flags {
+ BNXT_RE_WR_FLAGS_INLINE = 0x10,
+ BNXT_RE_WR_FLAGS_SE = 0x08,
+ BNXT_RE_WR_FLAGS_UC_FENCE = 0x04,
+ BNXT_RE_WR_FLAGS_RD_FENCE = 0x02,
+ BNXT_RE_WR_FLAGS_SIGNALED = 0x01
+};
+
+#define BNXT_RE_MEMW_TYPE_2 0x02
+#define BNXT_RE_MEMW_TYPE_1 0x00
+enum bnxt_re_wr_bind_acc {
+ BNXT_RE_WR_BIND_ACC_LWR = 0x01,
+ BNXT_RE_WR_BIND_ACC_RRD = 0x02,
+ BNXT_RE_WR_BIND_ACC_RWR = 0x04,
+ BNXT_RE_WR_BIND_ACC_RAT = 0x08,
+ BNXT_RE_WR_BIND_ACC_MWB = 0x10,
+ BNXT_RE_WR_BIND_ACC_ZBVA = 0x01,
+ BNXT_RE_WR_BIND_ACC_SHIFT = 0x10
+};
+
+enum bnxt_re_wc_type {
+ BNXT_RE_WC_TYPE_SEND = 0x00,
+ BNXT_RE_WC_TYPE_RECV_RC = 0x01,
+ BNXT_RE_WC_TYPE_RECV_UD = 0x02,
+ BNXT_RE_WC_TYPE_RECV_RAW = 0x03,
+ BNXT_RE_WC_TYPE_TERM = 0x0E,
+ BNXT_RE_WC_TYPE_COFF = 0x0F
+};
+
+#define BNXT_RE_WC_OPCD_RECV 0x80
+enum bnxt_re_req_wc_status {
+ BNXT_RE_REQ_ST_OK = 0x00,
+ BNXT_RE_REQ_ST_BAD_RESP = 0x01,
+ BNXT_RE_REQ_ST_LOC_LEN = 0x02,
+ BNXT_RE_REQ_ST_LOC_QP_OP = 0x03,
+ BNXT_RE_REQ_ST_PROT = 0x04,
+ BNXT_RE_REQ_ST_MEM_OP = 0x05,
+ BNXT_RE_REQ_ST_REM_INVAL = 0x06,
+ BNXT_RE_REQ_ST_REM_ACC = 0x07,
+ BNXT_RE_REQ_ST_REM_OP = 0x08,
+ BNXT_RE_REQ_ST_RNR_NAK_XCED = 0x09,
+ BNXT_RE_REQ_ST_TRNSP_XCED = 0x0A,
+ BNXT_RE_REQ_ST_WR_FLUSH = 0x0B
+};
+
+enum bnxt_re_rsp_wc_status {
+ BNXT_RE_RSP_ST_OK = 0x00,
+ BNXT_RE_RSP_ST_LOC_ACC = 0x01,
+ BNXT_RE_RSP_ST_LOC_LEN = 0x02,
+ BNXT_RE_RSP_ST_LOC_PROT = 0x03,
+ BNXT_RE_RSP_ST_LOC_QP_OP = 0x04,
+ BNXT_RE_RSP_ST_MEM_OP = 0x05,
+ BNXT_RE_RSP_ST_REM_INVAL = 0x06,
+ BNXT_RE_RSP_ST_WR_FLUSH = 0x07,
+ BNXT_RE_RSP_ST_HW_FLUSH = 0x08
+};
+
+enum bnxt_re_hdr_offset {
+ BNXT_RE_HDR_WT_MASK = 0xFF,
+ BNXT_RE_HDR_FLAGS_MASK = 0xFF,
+ BNXT_RE_HDR_FLAGS_SHIFT = 0x08,
+ BNXT_RE_HDR_WS_MASK = 0xFF,
+ BNXT_RE_HDR_WS_SHIFT = 0x10
+};
+
+enum bnxt_re_db_que_type {
+ BNXT_RE_QUE_TYPE_SQ = 0x00,
+ BNXT_RE_QUE_TYPE_RQ = 0x01,
+ BNXT_RE_QUE_TYPE_SRQ = 0x02,
+ BNXT_RE_QUE_TYPE_SRQ_ARM = 0x03,
+ BNXT_RE_QUE_TYPE_CQ = 0x04,
+ BNXT_RE_QUE_TYPE_CQ_ARMSE = 0x05,
+ BNXT_RE_QUE_TYPE_CQ_ARMALL = 0x06,
+ BNXT_RE_QUE_TYPE_CQ_ARMENA = 0x07,
+ BNXT_RE_QUE_TYPE_SRQ_ARMENA = 0x08,
+ BNXT_RE_QUE_TYPE_CQ_CUT_ACK = 0x09,
+ BNXT_RE_PUSH_TYPE_START = 0x0C,
+ BNXT_RE_PUSH_TYPE_END = 0x0D,
+ BNXT_RE_QUE_TYPE_NULL = 0x0F
+};
+
+enum bnxt_re_db_mask {
+ BNXT_RE_DB_INDX_MASK = 0xFFFFFFUL,
+ BNXT_RE_DB_PILO_MASK = 0x0FFUL,
+ BNXT_RE_DB_PILO_SHIFT = 0x18,
+ BNXT_RE_DB_QID_MASK = 0xFFFFFUL,
+ BNXT_RE_DB_PIHI_MASK = 0xF00UL,
+ BNXT_RE_DB_PIHI_SHIFT = 0x0C, /* Because mask is 0xF00 */
+ BNXT_RE_DB_TYP_MASK = 0x0FUL,
+ BNXT_RE_DB_TYP_SHIFT = 0x1C,
+ BNXT_RE_DB_VALID_SHIFT = 0x1A,
+ BNXT_RE_DB_EPOCH_SHIFT = 0x18,
+ BNXT_RE_DB_TOGGLE_SHIFT = 0x19,
+
+};
+
+enum bnxt_re_psns_mask {
+ BNXT_RE_PSNS_SPSN_MASK = 0xFFFFFF,
+ BNXT_RE_PSNS_OPCD_MASK = 0xFF,
+ BNXT_RE_PSNS_OPCD_SHIFT = 0x18,
+ BNXT_RE_PSNS_NPSN_MASK = 0xFFFFFF,
+ BNXT_RE_PSNS_FLAGS_MASK = 0xFF,
+ BNXT_RE_PSNS_FLAGS_SHIFT = 0x18
+};
+
+enum bnxt_re_msns_mask {
+ BNXT_RE_SQ_MSN_SEARCH_START_PSN_MASK = 0xFFFFFFUL,
+ BNXT_RE_SQ_MSN_SEARCH_START_PSN_SHIFT = 0,
+ BNXT_RE_SQ_MSN_SEARCH_NEXT_PSN_MASK = 0xFFFFFF000000ULL,
+ BNXT_RE_SQ_MSN_SEARCH_NEXT_PSN_SHIFT = 0x18,
+ BNXT_RE_SQ_MSN_SEARCH_START_IDX_MASK = 0xFFFF000000000000ULL,
+ BNXT_RE_SQ_MSN_SEARCH_START_IDX_SHIFT = 0x30
+};
+
+enum bnxt_re_bcqe_mask {
+ BNXT_RE_BCQE_PH_MASK = 0x01,
+ BNXT_RE_BCQE_TYPE_MASK = 0x0F,
+ BNXT_RE_BCQE_TYPE_SHIFT = 0x01,
+ BNXT_RE_BCQE_STATUS_MASK = 0xFF,
+ BNXT_RE_BCQE_STATUS_SHIFT = 0x08,
+ BNXT_RE_BCQE_FLAGS_MASK = 0xFFFFU,
+ BNXT_RE_BCQE_FLAGS_SHIFT = 0x10,
+ BNXT_RE_BCQE_RWRID_MASK = 0xFFFFFU,
+ BNXT_RE_BCQE_SRCQP_MASK = 0xFF,
+ BNXT_RE_BCQE_SRCQP_SHIFT = 0x18
+};
+
+enum bnxt_re_rc_flags_mask {
+ BNXT_RE_RC_FLAGS_SRQ_RQ_MASK = 0x01,
+ BNXT_RE_RC_FLAGS_IMM_MASK = 0x02,
+ BNXT_RE_RC_FLAGS_IMM_SHIFT = 0x01,
+ BNXT_RE_RC_FLAGS_INV_MASK = 0x04,
+ BNXT_RE_RC_FLAGS_INV_SHIFT = 0x02,
+ BNXT_RE_RC_FLAGS_RDMA_MASK = 0x08,
+ BNXT_RE_RC_FLAGS_RDMA_SHIFT = 0x03
+};
+
+enum bnxt_re_ud_flags_mask {
+ BNXT_RE_UD_FLAGS_SRQ_RQ_MASK = 0x01,
+ BNXT_RE_UD_FLAGS_SRQ_RQ_SFT = 0x00,
+ BNXT_RE_UD_FLAGS_IMM_MASK = 0x02,
+ BNXT_RE_UD_FLAGS_IMM_SFT = 0x01,
+ BNXT_RE_UD_FLAGS_IP_VER_MASK = 0x30,
+ BNXT_RE_UD_FLAGS_IP_VER_SFT = 0x4,
+ BNXT_RE_UD_FLAGS_META_MASK = 0x3C0,
+ BNXT_RE_UD_FLAGS_META_SFT = 0x6,
+ BNXT_RE_UD_FLAGS_EXT_META_MASK = 0xC00,
+ BNXT_RE_UD_FLAGS_EXT_META_SFT = 0x10,
+};
+
+enum bnxt_re_ud_cqe_mask {
+ BNXT_RE_UD_CQE_MAC_MASK = 0xFFFFFFFFFFFFULL,
+ BNXT_RE_UD_CQE_SRCQPLO_MASK = 0xFFFF,
+ BNXT_RE_UD_CQE_SRCQPLO_SHIFT = 0x30,
+ BNXT_RE_UD_CQE_LEN_MASK = 0x3FFFU
+};
+
+enum bnxt_re_shpg_offt {
+ BNXT_RE_SHPG_BEG_RESV_OFFT = 0x00,
+ BNXT_RE_SHPG_AVID_OFFT = 0x10,
+ BNXT_RE_SHPG_AVID_SIZE = 0x04,
+ BNXT_RE_SHPG_END_RESV_OFFT = 0xFF0
+};
+
+enum bnxt_re_que_flags_mask {
+ BNXT_RE_FLAG_EPOCH_TAIL_SHIFT = 0x0UL,
+ BNXT_RE_FLAG_EPOCH_HEAD_SHIFT = 0x1UL,
+ BNXT_RE_FLAG_EPOCH_TAIL_MASK = 0x1UL,
+ BNXT_RE_FLAG_EPOCH_HEAD_MASK = 0x2UL,
+};
+
+enum bnxt_re_db_epoch_flag_shift {
+ BNXT_RE_DB_EPOCH_TAIL_SHIFT = BNXT_RE_DB_EPOCH_SHIFT,
+ BNXT_RE_DB_EPOCH_HEAD_SHIFT = (BNXT_RE_DB_EPOCH_SHIFT - 1)
+};
+
+enum bnxt_re_ppp_st_en_mask {
+ BNXT_RE_PPP_ENABLED_MASK = 0x1UL,
+ BNXT_RE_PPP_STATE_MASK = 0x2UL,
+};
+
+enum bnxt_re_ppp_st_shift {
+ BNXT_RE_PPP_ST_SHIFT = 0x1UL
+};
+
+struct bnxt_re_db_hdr {
+ __u64 typ_qid_indx; /* typ: 4, qid:20, indx:24 */
+};
+
+#define BNXT_RE_CHIP_ID0_CHIP_NUM_SFT 0x00
+#define BNXT_RE_CHIP_ID0_CHIP_REV_SFT 0x10
+#define BNXT_RE_CHIP_ID0_CHIP_MET_SFT 0x18
+
+enum {
+ BNXT_RE_COMP_MASK_UCNTX_WC_DPI_ENABLED = 0x01,
+ BNXT_RE_COMP_MASK_UCNTX_POW2_DISABLED = 0x02,
+ BNXT_RE_COMP_MASK_UCNTX_RSVD_WQE_DISABLED = 0x04,
+ BNXT_RE_COMP_MASK_UCNTX_MQP_EX_SUPPORTED = 0x8,
+ BNXT_RE_COMP_MASK_UCNTX_DBR_PACING_ENABLED = 0x10,
+ BNXT_RE_COMP_MASK_UCNTX_DBR_RECOVERY_ENABLED = 0x20,
+ BNXT_RE_COMP_MASK_UCNTX_HW_RETX_ENABLED = 0x40
+};
+
+enum bnxt_re_req_to_drv {
+ BNXT_RE_COMP_MASK_REQ_UCNTX_POW2_SUPPORT = 0x01,
+ BNXT_RE_COMP_MASK_REQ_UCNTX_RSVD_WQE = 0x02
+};
+
+#define BNXT_RE_WQE_MODES_WQE_MODE_MASK 0x01
+/* bit wise modes can be extended here. */
+enum bnxt_re_modes {
+ BNXT_RE_WQE_MODE_STATIC = 0x00,
+ BNXT_RE_WQE_MODE_VARIABLE = 0x01
+ /* Other modes can be here */
+};
+
+struct bnxt_re_cntx_req {
+ struct ibv_get_context cmd;
+ __aligned_u64 comp_mask;
+};
+
+struct bnxt_re_cntx_resp {
+ struct ibv_get_context_resp resp;
+ __u32 dev_id;
+ __u32 max_qp; /* To allocate qp-table */
+ __u32 pg_size;
+ __u32 cqe_size;
+ __u32 max_cqd;
+ __u32 chip_id0;
+ __u32 chip_id1;
+ __u32 modes;
+ __aligned_u64 comp_mask;
+} __attribute__((packed));
+
+enum {
+ BNXT_RE_COMP_MASK_PD_HAS_WC_DPI = 0x01,
+ BNXT_RE_COMP_MASK_PD_HAS_DBR_BAR_ADDR = 0x02,
+};
+
+struct bnxt_re_pd_resp {
+ struct ibv_alloc_pd_resp resp;
+ __u32 pdid;
+ __u32 dpi;
+ __u64 dbr;
+ __u64 comp_mask;
+ __u32 wcdpi;
+ __u64 dbr_bar_map;
+} __attribute__((packed));
+
+struct bnxt_re_mr_resp {
+ struct ibv_reg_mr_resp resp;
+} __attribute__((packed));
+
+/* CQ */
+enum {
+ BNXT_RE_COMP_MASK_CQ_HAS_DB_INFO = 0x01,
+ BNXT_RE_COMP_MASK_CQ_HAS_WC_DPI = 0x02,
+ BNXT_RE_COMP_MASK_CQ_HAS_CQ_PAGE = 0x04
+};
+
+enum {
+ BNXT_RE_COMP_MASK_CQ_REQ_HAS_CAP_MASK = 0x1
+};
+
+enum {
+ BNXT_RE_COMP_MASK_CQ_REQ_CAP_DBR_RECOVERY = 0x1
+};
+
+struct bnxt_re_cq_req {
+ struct ibv_create_cq cmd;
+ __u64 cq_va;
+ __u64 cq_handle;
+ __aligned_u64 comp_mask;
+ __u16 cq_capab;
+} __attribute__((packed));
+
+struct bnxt_re_cq_resp {
+ struct ibv_create_cq_resp resp;
+ __u32 cqid;
+ __u32 tail;
+ __u32 phase;
+ __u32 rsvd;
+ __aligned_u64 comp_mask;
+ __u32 dpi;
+ __u64 dbr;
+ __u32 wcdpi;
+ __u64 cq_page;
+} __attribute__((packed));
+
+struct bnxt_re_resize_cq_req {
+ struct ibv_resize_cq cmd;
+ __u64 cq_va;
+} __attribute__((packed));
+
+struct bnxt_re_bcqe {
+ __u32 flg_st_typ_ph;
+ __u32 qphi_rwrid;
+} __attribute__((packed));
+
+struct bnxt_re_req_cqe {
+ __u64 qp_handle;
+ __u32 con_indx; /* 16 bits valid. */
+ __u32 rsvd1;
+ __u64 rsvd2;
+} __attribute__((packed));
+
+struct bnxt_re_rc_cqe {
+ __u32 length;
+ __u32 imm_key;
+ __u64 qp_handle;
+ __u64 mr_handle;
+} __attribute__((packed));
+
+struct bnxt_re_ud_cqe {
+ __u32 length; /* 14 bits */
+ __u32 immd;
+ __u64 qp_handle;
+ __u64 qplo_mac; /* 16:48*/
+} __attribute__((packed));
+
+struct bnxt_re_term_cqe {
+ __u64 qp_handle;
+ __u32 rq_sq_cidx;
+ __u32 rsvd;
+ __u64 rsvd1;
+} __attribute__((packed));
+
+struct bnxt_re_cutoff_cqe {
+ __u64 rsvd1;
+ __u64 rsvd2;
+ __u64 rsvd3;
+ __u8 cqe_type_toggle;
+ __u8 status;
+ __u16 rsvd4;
+ __u32 rsvd5;
+} __attribute__((packed));
+
+/* QP */
+struct bnxt_re_qp_req {
+ struct ibv_create_qp cmd;
+ __u64 qpsva;
+ __u64 qprva;
+ __u64 qp_handle;
+} __attribute__((packed));
+
+struct bnxt_re_qp_resp {
+ struct ibv_create_qp_resp resp;
+ __u32 qpid;
+} __attribute__((packed));
+
+enum bnxt_re_modify_ex_mask {
+ BNXT_RE_MQP_PPP_REQ_EN_MASK = 0x1UL,
+ BNXT_RE_MQP_PPP_REQ_EN = 0x1UL,
+ BNXT_RE_MQP_PATH_MTU_MASK = 0x2UL,
+ BNXT_RE_MQP_PPP_IDX_MASK = 0x7UL,
+ BNXT_RE_MQP_PPP_STATE = 0x10UL
+};
+
+/* Modify QP */
+struct bnxt_re_modify_ex_req {
+ struct ibv_modify_qp_ex cmd;
+ __aligned_u64 comp_mask;
+ __u32 dpi;
+ __u32 rsvd;
+};
+
+struct bnxt_re_modify_ex_resp {
+ struct ibv_modify_qp_resp_ex resp;
+ __aligned_u64 comp_mask;
+ __u32 ppp_st_idx;
+ __u32 path_mtu;
+};
+
+union lower_shdr {
+ __u64 qkey_len;
+ __u64 lkey_plkey;
+ __u64 rva;
+};
+
+struct bnxt_re_bsqe {
+ __u32 rsv_ws_fl_wt;
+ __u32 key_immd;
+ union lower_shdr lhdr;
+} __attribute__((packed));
+
+struct bnxt_re_psns_ext {
+ __u32 opc_spsn;
+ __u32 flg_npsn;
+ __u16 st_slot_idx;
+ __u16 rsvd0;
+ __u32 rsvd1;
+} __attribute__((packed));
+
+/* sq_msn_search (size:64b/8B) */
+struct bnxt_re_msns {
+ __u64 start_idx_next_psn_start_psn;
+} __attribute__((packed));
+
+struct bnxt_re_psns {
+ __u32 opc_spsn;
+ __u32 flg_npsn;
+} __attribute__((packed));
+
+struct bnxt_re_sge {
+ __u64 pa;
+ __u32 lkey;
+ __u32 length;
+} __attribute__((packed));
+
+struct bnxt_re_send {
+ __u32 dst_qp;
+ __u32 avid;
+ __u64 rsvd;
+} __attribute__((packed));
+
+struct bnxt_re_raw {
+ __u32 cfa_meta;
+ __u32 rsvd2;
+ __u64 rsvd3;
+} __attribute__((packed));
+
+struct bnxt_re_rdma {
+ __u64 rva;
+ __u32 rkey;
+ __u32 rsvd2;
+} __attribute__((packed));
+
+struct bnxt_re_atomic {
+ __u64 swp_dt;
+ __u64 cmp_dt;
+} __attribute__((packed));
+
+struct bnxt_re_inval {
+ __u64 rsvd[2];
+} __attribute__((packed));
+
+struct bnxt_re_bind {
+ __u64 va;
+ __u64 len; /* only 40 bits are valid */
+} __attribute__((packed));
+
+struct bnxt_re_brqe {
+ __u32 rsv_ws_fl_wt;
+ __u32 rsvd;
+ __u32 wrid;
+ __u32 rsvd1;
+} __attribute__((packed));
+
+struct bnxt_re_rqe {
+ __u64 rsvd[2];
+} __attribute__((packed));
+
+/* SRQ */
+struct bnxt_re_srq_req {
+ struct ibv_create_srq cmd;
+ __u64 srqva;
+ __u64 srq_handle;
+} __attribute__((packed));
+
+struct bnxt_re_srq_resp {
+ struct ibv_create_srq_resp resp;
+ __u32 srqid;
+} __attribute__((packed));
+
+struct bnxt_re_srqe {
+ __u64 rsvd[2];
+} __attribute__((packed));
+
+struct bnxt_re_push_wqe {
+ __u64 addr[32];
+} __attribute__((packed));;
+
+#endif
diff --git a/contrib/ofed/libbnxtre/db.c b/contrib/ofed/libbnxtre/db.c
new file mode 100644
index 000000000000..8751297c9218
--- /dev/null
+++ b/contrib/ofed/libbnxtre/db.c
@@ -0,0 +1,566 @@
+/*
+ * Copyright (c) 2024, Broadcom. All rights reserved. The term
+ * Broadcom refers to Broadcom Limited and/or its subsidiaries.
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ *
+ * 1. Redistributions of source code must retain the above copyright
+ * notice, this list of conditions and the following disclaimer.
+ * 2. Redistributions in binary form must reproduce the above copyright
+ * notice, this list of conditions and the following disclaimer in
+ * the documentation and/or other materials provided with the
+ * distribution.
+ *
+ * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS''
+ * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO,
+ * THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
+ * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS
+ * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+ * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+ * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
+ * BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+ * WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
+ * OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
+ * IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+ *
+ * Description: Doorbell handling functions.
+ */
+
+#include <malloc.h>
+#include <unistd.h>
+
+#include "abi.h"
+#include "main.h"
+
+#define BNXT_RE_DB_FIFO_ROOM_MASK_P5 0x1FFF8000
+#define BNXT_RE_MAX_FIFO_DEPTH_P5 0x2c00
+
+#define BNXT_RE_DB_FIFO_ROOM_MASK_P7 0x3FFF8000
+#define BNXT_RE_MAX_FIFO_DEPTH_P7 0x8000
+
+#define BNXT_RE_DB_FIFO_ROOM_SHIFT 15
+#define BNXT_RE_DB_THRESHOLD 20
+
+#define BNXT_RE_DB_FIFO_ROOM_MASK(ctx) \
+ (_is_chip_thor2((ctx)) ? \
+ BNXT_RE_DB_FIFO_ROOM_MASK_P7 :\
+ BNXT_RE_DB_FIFO_ROOM_MASK_P5)
+#define BNXT_RE_MAX_FIFO_DEPTH(ctx) \
+ (_is_chip_thor2((ctx)) ? \
+ BNXT_RE_MAX_FIFO_DEPTH_P7 :\
+ BNXT_RE_MAX_FIFO_DEPTH_P5)
+
+static uint32_t xorshift32(struct xorshift32_state *state)
+{
+ /* Algorithm "xor" from p. 4 of Marsaglia, "Xorshift RNGs" */
+ uint32_t x = state->seed;
+
+ x ^= x << 13;
+ x ^= x >> 17;
+ x ^= x << 5;
+ return state->seed = x;
+}
+
+static uint16_t rnd(struct xorshift32_state *state, uint16_t range)
+{
+ /* range must be a power of 2 - 1 */
+ return (xorshift32(state) & range);
+}
+
+static int calculate_fifo_occupancy(struct bnxt_re_context *cntx)
+{
+ uint32_t *dbr_map = cntx->bar_map + 0x1a8;
+ uint32_t read_val, fifo_occup;
+
+ read_val = *dbr_map;
+ fifo_occup = BNXT_RE_MAX_FIFO_DEPTH(cntx->cctx) -
+ ((read_val & BNXT_RE_DB_FIFO_ROOM_MASK(cntx->cctx)) >>
+ BNXT_RE_DB_FIFO_ROOM_SHIFT);
+
+ return fifo_occup;
+}
+
+static inline uint32_t find_min(uint32_t x, uint32_t y)
+{
+ return (y > x ? x : y);
+}
+
+int bnxt_re_do_pacing(struct bnxt_re_context *cntx, struct xorshift32_state *state)
+{
+ /* First 4 bytes of shared page (pacing_info) contains the DBR
+ * pacing information. Second 4 bytes (pacing_th) contains
+ * the pacing threshold value to determine whether to
+ * add delay or not
+ */
+ struct bnxt_re_pacing_data *pacing_data =
+ (struct bnxt_re_pacing_data *)cntx->dbr_page;
+ uint32_t wait_time = 1;
+ uint32_t fifo_occup;
+
+ if (!pacing_data)
+ return 0;
+ /* If the device in error recovery state, return error to
+ * not to ring new doorbells in this state.
+ */
+ if (pacing_data->dev_err_state)
+ return -EFAULT;
+
+ if (rnd(state, BNXT_RE_MAX_DO_PACING) < pacing_data->do_pacing) {
+ while ((fifo_occup = calculate_fifo_occupancy(cntx))
+ > pacing_data->pacing_th) {
+ struct bnxt_re_cq *cq;
+ uint32_t usec_wait;
+
+ if (pacing_data->alarm_th && fifo_occup > pacing_data->alarm_th) {
+ cq = container_of(cntx->dbr_cq, struct bnxt_re_cq, ibvcq);
+ bnxt_re_poll_kernel_cq(cq);
+ }
+ usec_wait = rnd(state, wait_time - 1);
+ if (usec_wait)
+ bnxt_re_sub_sec_busy_wait(usec_wait * 1000);
+ /* wait time capped at 128 us */
+ wait_time = find_min(wait_time * 2, 128);
+ }
+ }
+ return 0;
+}
+
+static inline void bnxt_re_ring_db(struct bnxt_re_dpi *dpi, __u64 key,
+ uint64_t *db_key, uint8_t *lock)
+{
+ while (1) {
+ if (__sync_bool_compare_and_swap(lock, 0, 1)) {
+ *db_key = key;
+ bnxt_re_wm_barrier();
+ iowrite64(dpi->dbpage, key);
+ bnxt_re_wm_barrier();
+ *lock = 0;
+ break;
+ }
+ }
+}
+
+static inline void bnxt_re_init_push_hdr(struct bnxt_re_db_hdr *hdr,
+ uint32_t indx, uint32_t qid,
+ uint32_t typ, uint32_t pidx)
+{
+ __u64 key_lo, key_hi;
+
+ key_lo = (((pidx & BNXT_RE_DB_PILO_MASK) << BNXT_RE_DB_PILO_SHIFT) |
+ (indx & BNXT_RE_DB_INDX_MASK));
+ key_hi = ((((pidx & BNXT_RE_DB_PIHI_MASK) << BNXT_RE_DB_PIHI_SHIFT) |
+ (qid & BNXT_RE_DB_QID_MASK)) |
+ ((typ & BNXT_RE_DB_TYP_MASK) << BNXT_RE_DB_TYP_SHIFT) |
+ (0x1UL << BNXT_RE_DB_VALID_SHIFT));
+ hdr->typ_qid_indx = htole64((key_lo | (key_hi << 32)));
+}
+
+static inline void bnxt_re_init_db_hdr(struct bnxt_re_db_hdr *hdr,
+ uint32_t indx, uint32_t toggle,
+ uint32_t qid, uint32_t typ)
+{
+ __u64 key_lo, key_hi;
+
+ key_lo = htole32(indx | toggle);
+ key_hi = ((qid & BNXT_RE_DB_QID_MASK) |
+ ((typ & BNXT_RE_DB_TYP_MASK) << BNXT_RE_DB_TYP_SHIFT) |
+ (0x1UL << BNXT_RE_DB_VALID_SHIFT));
+ hdr->typ_qid_indx = htole64((key_lo | (key_hi << 32)));
+}
+
+static inline void __bnxt_re_ring_pend_db(__u64 *ucdb, __u64 key,
+ struct bnxt_re_qp *qp)
+{
+ struct bnxt_re_db_hdr hdr;
+
+ bnxt_re_init_db_hdr(&hdr,
+ (*qp->jsqq->hwque->dbtail |
+ ((qp->jsqq->hwque->flags &
+ BNXT_RE_FLAG_EPOCH_TAIL_MASK) <<
+ BNXT_RE_DB_EPOCH_TAIL_SHIFT)), 0,
+ qp->qpid,
+ BNXT_RE_QUE_TYPE_SQ);
+
+ while (1) {
+ if (__sync_bool_compare_and_swap(&qp->sq_dbr_lock, 0, 1)) {
+ qp->sq_shadow_db_key = hdr.typ_qid_indx;
+ bnxt_re_wm_barrier();
+ iowrite64(ucdb, key);
+ bnxt_re_wm_barrier();
+ qp->sq_dbr_lock = 0;
+ break;
+ }
+ }
+}
+
+void bnxt_re_ring_rq_db(struct bnxt_re_qp *qp)
+{
+ struct bnxt_re_db_hdr hdr;
+
+ if (bnxt_re_do_pacing(qp->cntx, &qp->rand))
+ return;
+ bnxt_re_init_db_hdr(&hdr,
+ (*qp->jrqq->hwque->dbtail |
+ ((qp->jrqq->hwque->flags &
+ BNXT_RE_FLAG_EPOCH_TAIL_MASK) <<
+ BNXT_RE_DB_EPOCH_TAIL_SHIFT)), 0,
+ qp->qpid,
+ BNXT_RE_QUE_TYPE_RQ);
+ bnxt_re_ring_db(qp->udpi, hdr.typ_qid_indx, &qp->rq_shadow_db_key,
+ &qp->rq_dbr_lock);
+}
+
+void bnxt_re_ring_sq_db(struct bnxt_re_qp *qp)
+{
+ struct bnxt_re_db_hdr hdr;
+
+ if (bnxt_re_do_pacing(qp->cntx, &qp->rand))
+ return;
+ bnxt_re_init_db_hdr(&hdr,
+ (*qp->jsqq->hwque->dbtail |
+ ((qp->jsqq->hwque->flags &
+ BNXT_RE_FLAG_EPOCH_TAIL_MASK) <<
+ BNXT_RE_DB_EPOCH_TAIL_SHIFT)), 0,
+ qp->qpid,
+ BNXT_RE_QUE_TYPE_SQ);
+ bnxt_re_ring_db(qp->udpi, hdr.typ_qid_indx, &qp->sq_shadow_db_key,
+ &qp->sq_dbr_lock);
+}
+
+void bnxt_re_ring_srq_db(struct bnxt_re_srq *srq)
+{
+ struct bnxt_re_db_hdr hdr;
+
+ if (bnxt_re_do_pacing(srq->uctx, &srq->rand))
+ return;
+ bnxt_re_init_db_hdr(&hdr,
+ (srq->srqq->tail |
+ ((srq->srqq->flags &
+ BNXT_RE_FLAG_EPOCH_TAIL_MASK) <<
+ BNXT_RE_DB_EPOCH_TAIL_SHIFT)), 0,
+ srq->srqid, BNXT_RE_QUE_TYPE_SRQ);
+ bnxt_re_ring_db(srq->udpi, hdr.typ_qid_indx, &srq->shadow_db_key,
+ &srq->dbr_lock);
+}
+
+void bnxt_re_ring_srq_arm(struct bnxt_re_srq *srq)
+{
+ struct bnxt_re_db_hdr hdr;
+
+ if (bnxt_re_do_pacing(srq->uctx, &srq->rand))
+ return;
+ bnxt_re_init_db_hdr(&hdr, srq->cap.srq_limit, 0, srq->srqid,
+ BNXT_RE_QUE_TYPE_SRQ_ARM);
+ bnxt_re_ring_db(srq->udpi, hdr.typ_qid_indx, &srq->shadow_db_key,
+ &srq->dbr_lock);
+}
+
+void bnxt_re_ring_cq_db(struct bnxt_re_cq *cq)
+{
+ struct bnxt_re_db_hdr hdr;
+
+ if (bnxt_re_do_pacing(cq->cntx, &cq->rand))
+ return;
+ bnxt_re_init_db_hdr(&hdr,
+ (cq->cqq->head |
+ ((cq->cqq->flags &
+ BNXT_RE_FLAG_EPOCH_HEAD_MASK) <<
+ BNXT_RE_DB_EPOCH_HEAD_SHIFT)), 0,
+ cq->cqid,
+ BNXT_RE_QUE_TYPE_CQ);
+ bnxt_re_ring_db(cq->udpi, hdr.typ_qid_indx, &cq->shadow_db_key,
+ &cq->dbr_lock);
+}
+
+void bnxt_re_ring_cq_arm_db(struct bnxt_re_cq *cq, uint8_t aflag)
+{
+ uint32_t *cq_page = cq->cq_page;
+ struct bnxt_re_db_hdr hdr;
+ uint32_t toggle = 0;
+
+ if (cq_page)
+ toggle = *cq_page;
+
+ if (bnxt_re_do_pacing(cq->cntx, &cq->rand))
+ return;
+ bnxt_re_init_db_hdr(&hdr,
+ (cq->cqq->head |
+ ((cq->cqq->flags &
+ BNXT_RE_FLAG_EPOCH_HEAD_MASK) <<
+ BNXT_RE_DB_EPOCH_HEAD_SHIFT)),
+ toggle << BNXT_RE_DB_TOGGLE_SHIFT,
+ cq->cqid, aflag);
+ bnxt_re_ring_db(cq->udpi, hdr.typ_qid_indx, &cq->shadow_db_key,
+ &cq->dbr_lock);
+}
+
+void bnxt_re_ring_pstart_db(struct bnxt_re_qp *qp,
+ struct bnxt_re_push_buffer *pbuf)
+{
+ __u64 key;
+
+ if (bnxt_re_do_pacing(qp->cntx, &qp->rand))
+ return;
+ key = ((((pbuf->wcdpi & BNXT_RE_DB_PIHI_MASK) <<
+ BNXT_RE_DB_PIHI_SHIFT) | (pbuf->qpid & BNXT_RE_DB_QID_MASK)) |
+ ((BNXT_RE_PUSH_TYPE_START & BNXT_RE_DB_TYP_MASK) <<
+ BNXT_RE_DB_TYP_SHIFT) | (0x1UL << BNXT_RE_DB_VALID_SHIFT));
+ key <<= 32;
+ key |= ((((__u32)pbuf->wcdpi & BNXT_RE_DB_PILO_MASK) <<
+ BNXT_RE_DB_PILO_SHIFT) | (pbuf->st_idx &
+ BNXT_RE_DB_INDX_MASK));
+ bnxt_re_wm_barrier();
+ iowrite64(pbuf->ucdb, key);
+}
+
+void bnxt_re_ring_pend_db(struct bnxt_re_qp *qp,
+ struct bnxt_re_push_buffer *pbuf)
+{
+ __u64 key;
+
+ if (bnxt_re_do_pacing(qp->cntx, &qp->rand))
+ return;
+ key = ((((pbuf->wcdpi & BNXT_RE_DB_PIHI_MASK) <<
+ BNXT_RE_DB_PIHI_SHIFT) | (pbuf->qpid & BNXT_RE_DB_QID_MASK)) |
+ ((BNXT_RE_PUSH_TYPE_END & BNXT_RE_DB_TYP_MASK) <<
+ BNXT_RE_DB_TYP_SHIFT) | (0x1UL << BNXT_RE_DB_VALID_SHIFT));
+ key <<= 32;
+ key |= ((((__u32)pbuf->wcdpi & BNXT_RE_DB_PILO_MASK) <<
+ BNXT_RE_DB_PILO_SHIFT) | (pbuf->tail &
+ BNXT_RE_DB_INDX_MASK));
+ __bnxt_re_ring_pend_db(pbuf->ucdb, key, qp);
+}
+
+void bnxt_re_fill_ppp(struct bnxt_re_push_buffer *pbuf,
+ struct bnxt_re_qp *qp, uint8_t len, uint32_t idx)
+{
+ struct bnxt_re_db_ppp_hdr phdr = {};
+ __u64 *dst, *src;
+ __u8 plen;
+ int indx;
+
+ src = (__u64 *)&phdr;
+ plen = len + sizeof(phdr) + bnxt_re_get_sqe_hdr_sz();
+
+ bnxt_re_init_db_hdr(&phdr.db_hdr,
+ (*qp->jsqq->hwque->dbtail |
+ ((qp->jsqq->hwque->flags &
+ BNXT_RE_FLAG_EPOCH_TAIL_MASK) <<
+ BNXT_RE_DB_EPOCH_TAIL_SHIFT)), 0,
+ qp->qpid,
+ BNXT_RE_QUE_TYPE_SQ);
+
+ phdr.rsv_psz_pidx = ((pbuf->st_idx & BNXT_RE_DB_INDX_MASK) |
+ (((plen % 8 ? (plen / 8) + 1 :
+ plen / 8) & BNXT_RE_PUSH_SIZE_MASK) <<
+ BNXT_RE_PUSH_SIZE_SHIFT));
+
+ bnxt_re_wm_barrier();
+ for (indx = 0; indx < 2; indx++) {
+ dst = (__u64 *)(pbuf->pbuf + indx);
+ iowrite64(dst, *src);
+ src++;
+ }
+ bnxt_re_copy_data_to_pb(pbuf, 1, idx);
+ mmio_flush_writes();
+}
+
+void bnxt_re_fill_push_wcb(struct bnxt_re_qp *qp,
+ struct bnxt_re_push_buffer *pbuf, uint32_t idx)
+{
+ bnxt_re_ring_pstart_db(qp, pbuf);
+ mmio_wc_start();
+ bnxt_re_copy_data_to_pb(pbuf, 0, idx);
+ /* Flush WQE write before push end db. */
+ mmio_flush_writes();
+ bnxt_re_ring_pend_db(qp, pbuf);
+}
+
+int bnxt_re_init_pbuf_list(struct bnxt_re_context *ucntx)
+{
+ struct bnxt_re_push_buffer *pbuf;
+ int indx, wqesz;
+ int size, offt;
+ __u64 wcpage;
+ __u64 dbpage;
+ void *base;
+
+ size = (sizeof(*ucntx->pbrec) +
+ 16 * (sizeof(*ucntx->pbrec->pbuf) +
+ sizeof(struct bnxt_re_push_wqe)));
+ ucntx->pbrec = calloc(1, size);
+ if (!ucntx->pbrec)
+ goto out;
+
+ offt = sizeof(*ucntx->pbrec);
+ base = ucntx->pbrec;
+ ucntx->pbrec->pbuf = (base + offt);
*** 4326 LINES SKIPPED ***