13ec648c6SKrzysztof Kozlowski /* SPDX-License-Identifier: GPL-2.0 OR BSD-3-Clause */ 2a5319752SBernard Metzler 3a5319752SBernard Metzler /* Authors: Bernard Metzler <bmt@zurich.ibm.com> */ 4a5319752SBernard Metzler /* Copyright (c) 2008-2019, IBM Corporation */ 5a5319752SBernard Metzler 6a5319752SBernard Metzler #ifndef _SIW_H 7a5319752SBernard Metzler #define _SIW_H 8a5319752SBernard Metzler 9a5319752SBernard Metzler #include <rdma/ib_verbs.h> 1058fb0b56SBernard Metzler #include <rdma/restrack.h> 11a5319752SBernard Metzler #include <linux/socket.h> 12a5319752SBernard Metzler #include <linux/skbuff.h> 13a5319752SBernard Metzler #include <linux/crc32.h> 14a5319752SBernard Metzler #include <linux/crc32c.h> 15426370c8SEric Biggers #include <linux/unaligned.h> 16a5319752SBernard Metzler 17a5319752SBernard Metzler #include <rdma/siw-abi.h> 18a5319752SBernard Metzler #include "iwarp.h" 19a5319752SBernard Metzler 20a5319752SBernard Metzler #define SIW_VENDOR_ID 0x626d74 /* ascii 'bmt' for now */ 21a5319752SBernard Metzler #define SIW_VENDORT_PART_ID 0 22a5319752SBernard Metzler #define SIW_MAX_QP (1024 * 100) 23a5319752SBernard Metzler #define SIW_MAX_QP_WR (1024 * 32) 24a5319752SBernard Metzler #define SIW_MAX_ORD_QP 128 25a5319752SBernard Metzler #define SIW_MAX_IRD_QP 128 26a5319752SBernard Metzler #define SIW_MAX_SGE_PBL 256 /* max num sge's for PBL */ 27a5319752SBernard Metzler #define SIW_MAX_SGE_RD 1 /* iwarp limitation. we could relax */ 28a5319752SBernard Metzler #define SIW_MAX_CQ (1024 * 100) 29a5319752SBernard Metzler #define SIW_MAX_CQE (SIW_MAX_QP_WR * 100) 30a5319752SBernard Metzler #define SIW_MAX_MR (SIW_MAX_QP * 10) 31a5319752SBernard Metzler #define SIW_MAX_PD SIW_MAX_QP 32a5319752SBernard Metzler #define SIW_MAX_MW 0 /* to be set if MW's are supported */ 33a5319752SBernard Metzler #define SIW_MAX_SRQ SIW_MAX_QP 34a5319752SBernard Metzler #define SIW_MAX_SRQ_WR (SIW_MAX_QP_WR * 10) 35a5319752SBernard Metzler #define SIW_MAX_CONTEXT SIW_MAX_PD 36a5319752SBernard Metzler 37a5319752SBernard Metzler /* Min number of bytes for using zero copy transmit */ 38a5319752SBernard Metzler #define SENDPAGE_THRESH PAGE_SIZE 39a5319752SBernard Metzler 40a5319752SBernard Metzler /* Maximum number of frames which can be send in one SQ processing */ 41a5319752SBernard Metzler #define SQ_USER_MAXBURST 100 42a5319752SBernard Metzler 43a5319752SBernard Metzler /* Maximum number of consecutive IRQ elements which get served 44a5319752SBernard Metzler * if SQ has pending work. Prevents starving local SQ processing 45a5319752SBernard Metzler * by serving peer Read Requests. 46a5319752SBernard Metzler */ 47a5319752SBernard Metzler #define SIW_IRQ_MAXBURST_SQ_ACTIVE 4 48a5319752SBernard Metzler 4916b87037SBernard Metzler /* There is always only a port 1 per siw device */ 5016b87037SBernard Metzler #define SIW_PORT 1 5116b87037SBernard Metzler 52a5319752SBernard Metzler struct siw_dev_cap { 53a5319752SBernard Metzler int max_qp; 54a5319752SBernard Metzler int max_qp_wr; 55a5319752SBernard Metzler int max_ord; /* max. outbound read queue depth */ 56a5319752SBernard Metzler int max_ird; /* max. inbound read queue depth */ 57a5319752SBernard Metzler int max_sge; 58a5319752SBernard Metzler int max_sge_rd; 59a5319752SBernard Metzler int max_cq; 60a5319752SBernard Metzler int max_cqe; 61a5319752SBernard Metzler int max_mr; 62a5319752SBernard Metzler int max_pd; 63a5319752SBernard Metzler int max_mw; 64a5319752SBernard Metzler int max_srq; 65a5319752SBernard Metzler int max_srq_wr; 66a5319752SBernard Metzler int max_srq_sge; 67a5319752SBernard Metzler }; 68a5319752SBernard Metzler 69a5319752SBernard Metzler struct siw_pd { 70a5319752SBernard Metzler struct ib_pd base_pd; 71a5319752SBernard Metzler }; 72a5319752SBernard Metzler 73a5319752SBernard Metzler struct siw_device { 74a5319752SBernard Metzler struct ib_device base_dev; 75a5319752SBernard Metzler struct siw_dev_cap attrs; 76a5319752SBernard Metzler 77a5319752SBernard Metzler u32 vendor_part_id; 78a5319752SBernard Metzler int numa_node; 79bad5b6e3SChuck Lever char raw_gid[ETH_ALEN]; 80a5319752SBernard Metzler 81a5319752SBernard Metzler spinlock_t lock; 82a5319752SBernard Metzler 83a5319752SBernard Metzler struct xarray qp_xa; 84a5319752SBernard Metzler struct xarray mem_xa; 85a5319752SBernard Metzler 86a5319752SBernard Metzler struct list_head cep_list; 87a5319752SBernard Metzler struct list_head qp_list; 88a5319752SBernard Metzler 89a5319752SBernard Metzler /* active objects statistics to enforce limits */ 90a5319752SBernard Metzler atomic_t num_qp; 91a5319752SBernard Metzler atomic_t num_cq; 92a5319752SBernard Metzler atomic_t num_pd; 93a5319752SBernard Metzler atomic_t num_mr; 94a5319752SBernard Metzler atomic_t num_srq; 95a5319752SBernard Metzler atomic_t num_ctx; 96a5319752SBernard Metzler }; 97a5319752SBernard Metzler 98a5319752SBernard Metzler struct siw_ucontext { 99a5319752SBernard Metzler struct ib_ucontext base_ucontext; 100a5319752SBernard Metzler struct siw_device *sdev; 101a5319752SBernard Metzler }; 102a5319752SBernard Metzler 103a5319752SBernard Metzler /* 104a5319752SBernard Metzler * The RDMA core does not define LOCAL_READ access, which is always 105a5319752SBernard Metzler * enabled implictely. 106a5319752SBernard Metzler */ 107a5319752SBernard Metzler #define IWARP_ACCESS_MASK \ 108a5319752SBernard Metzler (IB_ACCESS_LOCAL_WRITE | IB_ACCESS_REMOTE_WRITE | \ 109a5319752SBernard Metzler IB_ACCESS_REMOTE_READ) 110a5319752SBernard Metzler 111a5319752SBernard Metzler /* 112a5319752SBernard Metzler * siw presentation of user memory registered as source 113a5319752SBernard Metzler * or target of RDMA operations. 114a5319752SBernard Metzler */ 115a5319752SBernard Metzler 116a5319752SBernard Metzler struct siw_page_chunk { 117a5319752SBernard Metzler struct page **plist; 118a5319752SBernard Metzler }; 119a5319752SBernard Metzler 120a5319752SBernard Metzler struct siw_umem { 121476b7c7eSBernard Metzler struct ib_umem *base_mem; 122a5319752SBernard Metzler struct siw_page_chunk *page_chunk; 123a5319752SBernard Metzler int num_pages; 124a5319752SBernard Metzler u64 fp_addr; /* First page base address */ 125a5319752SBernard Metzler }; 126a5319752SBernard Metzler 127a5319752SBernard Metzler struct siw_pble { 128c536277eSBernard Metzler dma_addr_t addr; /* Address of assigned buffer */ 129c536277eSBernard Metzler unsigned int size; /* Size of this entry */ 130c536277eSBernard Metzler unsigned long pbl_off; /* Total offset from start of PBL */ 131a5319752SBernard Metzler }; 132a5319752SBernard Metzler 133a5319752SBernard Metzler struct siw_pbl { 134a5319752SBernard Metzler unsigned int num_buf; 135a5319752SBernard Metzler unsigned int max_buf; 1360bc018b7SKees Cook struct siw_pble pbe[] __counted_by(max_buf); 137a5319752SBernard Metzler }; 138a5319752SBernard Metzler 139a5319752SBernard Metzler /* 140a5319752SBernard Metzler * Generic memory representation for registered siw memory. 141a5319752SBernard Metzler * Memory lookup always via higher 24 bit of STag (STag index). 142a5319752SBernard Metzler */ 143a5319752SBernard Metzler struct siw_mem { 144a5319752SBernard Metzler struct siw_device *sdev; 145a5319752SBernard Metzler struct kref ref; 146a5319752SBernard Metzler u64 va; /* VA of memory */ 147a5319752SBernard Metzler u64 len; /* length of the memory buffer in bytes */ 148a5319752SBernard Metzler u32 stag; /* iWarp memory access steering tag */ 149a5319752SBernard Metzler u8 stag_valid; /* VALID or INVALID */ 150a5319752SBernard Metzler u8 is_pbl; /* PBL or user space mem */ 151a5319752SBernard Metzler u8 is_mw; /* Memory Region or Memory Window */ 152a5319752SBernard Metzler enum ib_access_flags perms; /* local/remote READ & WRITE */ 153a5319752SBernard Metzler union { 154a5319752SBernard Metzler struct siw_umem *umem; 155a5319752SBernard Metzler struct siw_pbl *pbl; 156a5319752SBernard Metzler void *mem_obj; 157a5319752SBernard Metzler }; 158a5319752SBernard Metzler struct ib_pd *pd; 159a5319752SBernard Metzler }; 160a5319752SBernard Metzler 161a5319752SBernard Metzler struct siw_mr { 162a5319752SBernard Metzler struct ib_mr base_mr; 163a5319752SBernard Metzler struct siw_mem *mem; 164a5319752SBernard Metzler struct rcu_head rcu; 165a5319752SBernard Metzler }; 166a5319752SBernard Metzler 167a5319752SBernard Metzler /* 168a5319752SBernard Metzler * Error codes for local or remote 169a5319752SBernard Metzler * access to registered memory 170a5319752SBernard Metzler */ 171a5319752SBernard Metzler enum siw_access_state { 172a5319752SBernard Metzler E_ACCESS_OK, 173a5319752SBernard Metzler E_STAG_INVALID, 174a5319752SBernard Metzler E_BASE_BOUNDS, 175a5319752SBernard Metzler E_ACCESS_PERM, 176a5319752SBernard Metzler E_PD_MISMATCH 177a5319752SBernard Metzler }; 178a5319752SBernard Metzler 179a5319752SBernard Metzler enum siw_wr_state { 180a5319752SBernard Metzler SIW_WR_IDLE, 181a5319752SBernard Metzler SIW_WR_QUEUED, /* processing has not started yet */ 182a5319752SBernard Metzler SIW_WR_INPROGRESS /* initiated processing of the WR */ 183a5319752SBernard Metzler }; 184a5319752SBernard Metzler 185a5319752SBernard Metzler /* The WQE currently being processed (RX or TX) */ 186a5319752SBernard Metzler struct siw_wqe { 187a5319752SBernard Metzler /* Copy of applications SQE or RQE */ 188a5319752SBernard Metzler union { 189a5319752SBernard Metzler struct siw_sqe sqe; 190a5319752SBernard Metzler struct siw_rqe rqe; 191a5319752SBernard Metzler }; 192a5319752SBernard Metzler struct siw_mem *mem[SIW_MAX_SGE]; /* per sge's resolved mem */ 193a5319752SBernard Metzler enum siw_wr_state wr_status; 194a5319752SBernard Metzler enum siw_wc_status wc_status; 195a5319752SBernard Metzler u32 bytes; /* total bytes to process */ 196a5319752SBernard Metzler u32 processed; /* bytes processed */ 197a5319752SBernard Metzler }; 198a5319752SBernard Metzler 199a5319752SBernard Metzler struct siw_cq { 200a5319752SBernard Metzler struct ib_cq base_cq; 201a5319752SBernard Metzler spinlock_t lock; 2022c8ccb37SBernard Metzler struct siw_cq_ctrl *notify; 203a5319752SBernard Metzler struct siw_cqe *queue; 204a5319752SBernard Metzler u32 cq_put; 205a5319752SBernard Metzler u32 cq_get; 206a5319752SBernard Metzler u32 num_cqe; 20711f1a755SMichal Kalderon struct rdma_user_mmap_entry *cq_entry; /* mmap info for CQE array */ 208a5319752SBernard Metzler u32 id; /* For debugging only */ 209a5319752SBernard Metzler }; 210a5319752SBernard Metzler 211a5319752SBernard Metzler enum siw_qp_state { 212a5319752SBernard Metzler SIW_QP_STATE_IDLE, 213a5319752SBernard Metzler SIW_QP_STATE_RTR, 214a5319752SBernard Metzler SIW_QP_STATE_RTS, 215a5319752SBernard Metzler SIW_QP_STATE_CLOSING, 216a5319752SBernard Metzler SIW_QP_STATE_TERMINATE, 217a5319752SBernard Metzler SIW_QP_STATE_ERROR, 218a5319752SBernard Metzler SIW_QP_STATE_COUNT 219a5319752SBernard Metzler }; 220a5319752SBernard Metzler 221a5319752SBernard Metzler enum siw_qp_flags { 222a5319752SBernard Metzler SIW_RDMA_BIND_ENABLED = (1 << 0), 223a5319752SBernard Metzler SIW_RDMA_WRITE_ENABLED = (1 << 1), 224a5319752SBernard Metzler SIW_RDMA_READ_ENABLED = (1 << 2), 225a5319752SBernard Metzler SIW_SIGNAL_ALL_WR = (1 << 3), 226a5319752SBernard Metzler SIW_MPA_CRC = (1 << 4), 227a5319752SBernard Metzler SIW_QP_IN_DESTROY = (1 << 5) 228a5319752SBernard Metzler }; 229a5319752SBernard Metzler 230a5319752SBernard Metzler enum siw_qp_attr_mask { 231a5319752SBernard Metzler SIW_QP_ATTR_STATE = (1 << 0), 232a5319752SBernard Metzler SIW_QP_ATTR_ACCESS_FLAGS = (1 << 1), 233a5319752SBernard Metzler SIW_QP_ATTR_LLP_HANDLE = (1 << 2), 234a5319752SBernard Metzler SIW_QP_ATTR_ORD = (1 << 3), 235a5319752SBernard Metzler SIW_QP_ATTR_IRD = (1 << 4), 236a5319752SBernard Metzler SIW_QP_ATTR_SQ_SIZE = (1 << 5), 237a5319752SBernard Metzler SIW_QP_ATTR_RQ_SIZE = (1 << 6), 238a5319752SBernard Metzler SIW_QP_ATTR_MPA = (1 << 7) 239a5319752SBernard Metzler }; 240a5319752SBernard Metzler 241a5319752SBernard Metzler struct siw_srq { 242a5319752SBernard Metzler struct ib_srq base_srq; 243a5319752SBernard Metzler spinlock_t lock; 244a5319752SBernard Metzler u32 max_sge; 245a5319752SBernard Metzler u32 limit; /* low watermark for async event */ 246a5319752SBernard Metzler struct siw_rqe *recvq; 247a5319752SBernard Metzler u32 rq_put; 248a5319752SBernard Metzler u32 rq_get; 249a5319752SBernard Metzler u32 num_rqe; /* max # of wqe's allowed */ 25011f1a755SMichal Kalderon struct rdma_user_mmap_entry *srq_entry; /* mmap info for SRQ array */ 25158fb0b56SBernard Metzler bool armed:1; /* inform user if limit hit */ 25258fb0b56SBernard Metzler bool is_kernel_res:1; /* true if kernel client */ 253a5319752SBernard Metzler }; 254a5319752SBernard Metzler 255a5319752SBernard Metzler struct siw_qp_attrs { 256a5319752SBernard Metzler enum siw_qp_state state; 257a5319752SBernard Metzler u32 sq_size; 258a5319752SBernard Metzler u32 rq_size; 259a5319752SBernard Metzler u32 orq_size; 260a5319752SBernard Metzler u32 irq_size; 261a5319752SBernard Metzler u32 sq_max_sges; 262a5319752SBernard Metzler u32 rq_max_sges; 263a5319752SBernard Metzler enum siw_qp_flags flags; 264a5319752SBernard Metzler 265a5319752SBernard Metzler struct socket *sk; 266a5319752SBernard Metzler }; 267a5319752SBernard Metzler 268a5319752SBernard Metzler enum siw_tx_ctx { 269a5319752SBernard Metzler SIW_SEND_HDR, /* start or continue sending HDR */ 270a5319752SBernard Metzler SIW_SEND_DATA, /* start or continue sending DDP payload */ 271a5319752SBernard Metzler SIW_SEND_TRAILER, /* start or continue sending TRAILER */ 272a5319752SBernard Metzler SIW_SEND_SHORT_FPDU/* send whole FPDU hdr|data|trailer at once */ 273a5319752SBernard Metzler }; 274a5319752SBernard Metzler 275a5319752SBernard Metzler enum siw_rx_state { 276a5319752SBernard Metzler SIW_GET_HDR, /* await new hdr or within hdr */ 277a5319752SBernard Metzler SIW_GET_DATA_START, /* start of inbound DDP payload */ 278a5319752SBernard Metzler SIW_GET_DATA_MORE, /* continuation of (misaligned) DDP payload */ 279a5319752SBernard Metzler SIW_GET_TRAILER/* await new trailer or within trailer */ 280a5319752SBernard Metzler }; 281a5319752SBernard Metzler 282a5319752SBernard Metzler struct siw_rx_stream { 283a5319752SBernard Metzler struct sk_buff *skb; 284a5319752SBernard Metzler int skb_new; /* pending unread bytes in skb */ 285a5319752SBernard Metzler int skb_offset; /* offset in skb */ 286a5319752SBernard Metzler int skb_copied; /* processed bytes in skb */ 287a5319752SBernard Metzler 28851ac45a6SGuoqing Jiang enum siw_rx_state state; 28951ac45a6SGuoqing Jiang 290a5319752SBernard Metzler union iwarp_hdr hdr; 291a5319752SBernard Metzler struct mpa_trailer trailer; 292426370c8SEric Biggers u32 mpa_crc; 293426370c8SEric Biggers bool mpa_crc_enabled; 294a5319752SBernard Metzler 295a5319752SBernard Metzler /* 296a5319752SBernard Metzler * For each FPDU, main RX loop runs through 3 stages: 297a5319752SBernard Metzler * Receiving protocol headers, placing DDP payload and receiving 298a5319752SBernard Metzler * trailer information (CRC + possibly padding). 299a5319752SBernard Metzler * Next two variables keep state on receive status of the 300a5319752SBernard Metzler * current FPDU part (hdr, data, trailer). 301a5319752SBernard Metzler */ 302a5319752SBernard Metzler int fpdu_part_rcvd; /* bytes in pkt part copied */ 303a5319752SBernard Metzler int fpdu_part_rem; /* bytes in pkt part not seen */ 304a5319752SBernard Metzler 305a5319752SBernard Metzler /* 306a5319752SBernard Metzler * Next expected DDP MSN for each QN + 307a5319752SBernard Metzler * expected steering tag + 308a5319752SBernard Metzler * expected DDP tagget offset (all HBO) 309a5319752SBernard Metzler */ 310a5319752SBernard Metzler u32 ddp_msn[RDMAP_UNTAGGED_QN_COUNT]; 311a5319752SBernard Metzler u32 ddp_stag; 312a5319752SBernard Metzler u64 ddp_to; 313a5319752SBernard Metzler u32 inval_stag; /* Stag to be invalidated */ 314a5319752SBernard Metzler 315a5319752SBernard Metzler u8 rx_suspend : 1; 316a5319752SBernard Metzler u8 pad : 2; /* # of pad bytes expected */ 317a5319752SBernard Metzler u8 rdmap_op : 4; /* opcode of current frame */ 318a5319752SBernard Metzler }; 319a5319752SBernard Metzler 320a5319752SBernard Metzler struct siw_rx_fpdu { 321a5319752SBernard Metzler /* 322a5319752SBernard Metzler * Local destination memory of inbound RDMA operation. 323a5319752SBernard Metzler * Valid, according to wqe->wr_status 324a5319752SBernard Metzler */ 325a5319752SBernard Metzler struct siw_wqe wqe_active; 326a5319752SBernard Metzler 327a5319752SBernard Metzler unsigned int pbl_idx; /* Index into current PBL */ 328a5319752SBernard Metzler unsigned int sge_idx; /* current sge in rx */ 329a5319752SBernard Metzler unsigned int sge_off; /* already rcvd in curr. sge */ 330a5319752SBernard Metzler 331a5319752SBernard Metzler char first_ddp_seg; /* this is the first DDP seg */ 332a5319752SBernard Metzler char more_ddp_segs; /* more DDP segs expected */ 333a5319752SBernard Metzler u8 prev_rdmap_op : 4; /* opcode of prev frame */ 334a5319752SBernard Metzler }; 335a5319752SBernard Metzler 336a5319752SBernard Metzler /* 337a5319752SBernard Metzler * Shorthands for short packets w/o payload 338a5319752SBernard Metzler * to be transmitted more efficient. 339a5319752SBernard Metzler */ 340a5319752SBernard Metzler struct siw_send_pkt { 341a5319752SBernard Metzler struct iwarp_send send; 342a5319752SBernard Metzler __be32 crc; 343a5319752SBernard Metzler }; 344a5319752SBernard Metzler 345a5319752SBernard Metzler struct siw_write_pkt { 346a5319752SBernard Metzler struct iwarp_rdma_write write; 347a5319752SBernard Metzler __be32 crc; 348a5319752SBernard Metzler }; 349a5319752SBernard Metzler 350a5319752SBernard Metzler struct siw_rreq_pkt { 351a5319752SBernard Metzler struct iwarp_rdma_rreq rreq; 352a5319752SBernard Metzler __be32 crc; 353a5319752SBernard Metzler }; 354a5319752SBernard Metzler 355a5319752SBernard Metzler struct siw_rresp_pkt { 356a5319752SBernard Metzler struct iwarp_rdma_rresp rresp; 357a5319752SBernard Metzler __be32 crc; 358a5319752SBernard Metzler }; 359a5319752SBernard Metzler 360a5319752SBernard Metzler struct siw_iwarp_tx { 361a5319752SBernard Metzler union { 362a5319752SBernard Metzler union iwarp_hdr hdr; 363a5319752SBernard Metzler 364a5319752SBernard Metzler /* Generic part of FPDU header */ 365a5319752SBernard Metzler struct iwarp_ctrl ctrl; 366a5319752SBernard Metzler struct iwarp_ctrl_untagged c_untagged; 367a5319752SBernard Metzler struct iwarp_ctrl_tagged c_tagged; 368a5319752SBernard Metzler 369a5319752SBernard Metzler /* FPDU headers */ 370a5319752SBernard Metzler struct iwarp_rdma_write rwrite; 371a5319752SBernard Metzler struct iwarp_rdma_rreq rreq; 372a5319752SBernard Metzler struct iwarp_rdma_rresp rresp; 373a5319752SBernard Metzler struct iwarp_terminate terminate; 374a5319752SBernard Metzler struct iwarp_send send; 375a5319752SBernard Metzler struct iwarp_send_inv send_inv; 376a5319752SBernard Metzler 377a5319752SBernard Metzler /* complete short FPDUs */ 378a5319752SBernard Metzler struct siw_send_pkt send_pkt; 379a5319752SBernard Metzler struct siw_write_pkt write_pkt; 380a5319752SBernard Metzler struct siw_rreq_pkt rreq_pkt; 381a5319752SBernard Metzler struct siw_rresp_pkt rresp_pkt; 382a5319752SBernard Metzler } pkt; 383a5319752SBernard Metzler 384a5319752SBernard Metzler struct mpa_trailer trailer; 385a5319752SBernard Metzler /* DDP MSN for untagged messages */ 386a5319752SBernard Metzler u32 ddp_msn[RDMAP_UNTAGGED_QN_COUNT]; 387a5319752SBernard Metzler 388a5319752SBernard Metzler enum siw_tx_ctx state; 389a5319752SBernard Metzler u16 ctrl_len; /* ddp+rdmap hdr */ 390a5319752SBernard Metzler u16 ctrl_sent; 391a5319752SBernard Metzler int burst; 392a5319752SBernard Metzler int bytes_unsent; /* ddp payload bytes */ 393a5319752SBernard Metzler 394426370c8SEric Biggers u32 mpa_crc; 395426370c8SEric Biggers bool mpa_crc_enabled; 396a5319752SBernard Metzler 397a5319752SBernard Metzler u8 do_crc : 1; /* do crc for segment */ 398a5319752SBernard Metzler u8 use_sendpage : 1; /* send w/o copy */ 399a5319752SBernard Metzler u8 tx_suspend : 1; /* stop sending DDP segs. */ 400a5319752SBernard Metzler u8 pad : 2; /* # pad in current fpdu */ 401a5319752SBernard Metzler u8 orq_fence : 1; /* ORQ full or Send fenced */ 402a5319752SBernard Metzler u8 in_syscall : 1; /* TX out of user context */ 403a5319752SBernard Metzler u8 zcopy_tx : 1; /* Use TCP_SENDPAGE if possible */ 404a5319752SBernard Metzler u8 gso_seg_limit; /* Maximum segments for GSO, 0 = unbound */ 405a5319752SBernard Metzler 406a5319752SBernard Metzler u16 fpdu_len; /* len of FPDU to tx */ 407a5319752SBernard Metzler unsigned int tcp_seglen; /* remaining tcp seg space */ 408a5319752SBernard Metzler 409a5319752SBernard Metzler struct siw_wqe wqe_active; 410a5319752SBernard Metzler 411a5319752SBernard Metzler int pbl_idx; /* Index into current PBL */ 412a5319752SBernard Metzler int sge_idx; /* current sge in tx */ 413a5319752SBernard Metzler u32 sge_off; /* already sent in curr. sge */ 414a5319752SBernard Metzler }; 415a5319752SBernard Metzler 416a5319752SBernard Metzler struct siw_qp { 41758fb0b56SBernard Metzler struct ib_qp base_qp; 418a5319752SBernard Metzler struct siw_device *sdev; 41984de14baSGuoqing Jiang int tx_cpu; 420a5319752SBernard Metzler struct kref ref; 421a3c27880SBernard Metzler struct completion qp_free; 422a5319752SBernard Metzler struct list_head devq; 423a5319752SBernard Metzler struct siw_qp_attrs attrs; 424a5319752SBernard Metzler 425a5319752SBernard Metzler struct siw_cep *cep; 426a5319752SBernard Metzler struct rw_semaphore state_lock; 427a5319752SBernard Metzler 428a5319752SBernard Metzler struct ib_pd *pd; 429a5319752SBernard Metzler struct siw_cq *scq; 430a5319752SBernard Metzler struct siw_cq *rcq; 431a5319752SBernard Metzler struct siw_srq *srq; 432a5319752SBernard Metzler 433a5319752SBernard Metzler struct siw_iwarp_tx tx_ctx; /* Transmit context */ 434a5319752SBernard Metzler spinlock_t sq_lock; 435a5319752SBernard Metzler struct siw_sqe *sendq; /* send queue element array */ 436a5319752SBernard Metzler uint32_t sq_get; /* consumer index into sq array */ 437a5319752SBernard Metzler uint32_t sq_put; /* kernel prod. index into sq array */ 438a5319752SBernard Metzler struct llist_node tx_list; 439a5319752SBernard Metzler 440a5319752SBernard Metzler struct siw_sqe *orq; /* outbound read queue element array */ 441a5319752SBernard Metzler spinlock_t orq_lock; 442a5319752SBernard Metzler uint32_t orq_get; /* consumer index into orq array */ 443a5319752SBernard Metzler uint32_t orq_put; /* shared producer index for ORQ */ 444a5319752SBernard Metzler 445a5319752SBernard Metzler struct siw_rx_stream rx_stream; 446a5319752SBernard Metzler struct siw_rx_fpdu *rx_fpdu; 447a5319752SBernard Metzler struct siw_rx_fpdu rx_tagged; 448a5319752SBernard Metzler struct siw_rx_fpdu rx_untagged; 449a5319752SBernard Metzler spinlock_t rq_lock; 450a5319752SBernard Metzler struct siw_rqe *recvq; /* recv queue element array */ 451a5319752SBernard Metzler uint32_t rq_get; /* consumer index into rq array */ 452a5319752SBernard Metzler uint32_t rq_put; /* kernel prod. index into rq array */ 453a5319752SBernard Metzler 454a5319752SBernard Metzler struct siw_sqe *irq; /* inbound read queue element array */ 455a5319752SBernard Metzler uint32_t irq_get; /* consumer index into irq array */ 456a5319752SBernard Metzler uint32_t irq_put; /* producer index into irq array */ 457a5319752SBernard Metzler int irq_burst; 458a5319752SBernard Metzler 459a5319752SBernard Metzler struct { /* information to be carried in TERMINATE pkt, if valid */ 460a5319752SBernard Metzler u8 valid; 461a5319752SBernard Metzler u8 in_tx; 462a5319752SBernard Metzler u8 layer : 4, etype : 4; 463a5319752SBernard Metzler u8 ecode; 464a5319752SBernard Metzler } term_info; 46511f1a755SMichal Kalderon struct rdma_user_mmap_entry *sq_entry; /* mmap info for SQE array */ 46611f1a755SMichal Kalderon struct rdma_user_mmap_entry *rq_entry; /* mmap info for RQE array */ 467a5319752SBernard Metzler }; 468a5319752SBernard Metzler 469a5319752SBernard Metzler /* helper macros */ 470a5319752SBernard Metzler #define rx_qp(rx) container_of(rx, struct siw_qp, rx_stream) 471a5319752SBernard Metzler #define tx_qp(tx) container_of(tx, struct siw_qp, tx_ctx) 472a5319752SBernard Metzler #define tx_wqe(qp) (&(qp)->tx_ctx.wqe_active) 473a5319752SBernard Metzler #define rx_wqe(rctx) (&(rctx)->wqe_active) 474a5319752SBernard Metzler #define rx_mem(rctx) ((rctx)->wqe_active.mem[0]) 475a5319752SBernard Metzler #define tx_type(wqe) ((wqe)->sqe.opcode) 476a5319752SBernard Metzler #define rx_type(wqe) ((wqe)->rqe.opcode) 477a5319752SBernard Metzler #define tx_flags(wqe) ((wqe)->sqe.flags) 478a5319752SBernard Metzler 479a5319752SBernard Metzler struct iwarp_msg_info { 480a5319752SBernard Metzler int hdr_len; 481a5319752SBernard Metzler struct iwarp_ctrl ctrl; 482a5319752SBernard Metzler int (*rx_data)(struct siw_qp *qp); 483a5319752SBernard Metzler }; 484a5319752SBernard Metzler 48511f1a755SMichal Kalderon struct siw_user_mmap_entry { 48611f1a755SMichal Kalderon struct rdma_user_mmap_entry rdma_entry; 48711f1a755SMichal Kalderon void *address; 48811f1a755SMichal Kalderon }; 48911f1a755SMichal Kalderon 490a5319752SBernard Metzler /* Global siw parameters. Currently set in siw_main.c */ 491a5319752SBernard Metzler extern const bool zcopy_tx; 492a5319752SBernard Metzler extern const bool try_gso; 493a5319752SBernard Metzler extern const bool loopback_enabled; 494a5319752SBernard Metzler extern const bool mpa_crc_required; 495a5319752SBernard Metzler extern const bool mpa_crc_strict; 496a5319752SBernard Metzler extern const bool siw_tcp_nagle; 497a5319752SBernard Metzler extern u_char mpa_version; 498a5319752SBernard Metzler extern const bool peer_to_peer; 499a5319752SBernard Metzler extern struct task_struct *siw_tx_thread[]; 500a5319752SBernard Metzler 501a5319752SBernard Metzler extern struct iwarp_msg_info iwarp_pktinfo[RDMAP_TERMINATE + 1]; 502a5319752SBernard Metzler 503a5319752SBernard Metzler /* QP general functions */ 504a5319752SBernard Metzler int siw_qp_modify(struct siw_qp *qp, struct siw_qp_attrs *attr, 505a5319752SBernard Metzler enum siw_qp_attr_mask mask); 506a5319752SBernard Metzler int siw_qp_mpa_rts(struct siw_qp *qp, enum mpa_v2_ctrl ctrl); 507a5319752SBernard Metzler void siw_qp_llp_close(struct siw_qp *qp); 508a5319752SBernard Metzler void siw_qp_cm_drop(struct siw_qp *qp, int schedule); 509a5319752SBernard Metzler void siw_send_terminate(struct siw_qp *qp); 510a5319752SBernard Metzler 511a5319752SBernard Metzler void siw_qp_get_ref(struct ib_qp *qp); 512a5319752SBernard Metzler void siw_qp_put_ref(struct ib_qp *qp); 513a5319752SBernard Metzler int siw_qp_add(struct siw_device *sdev, struct siw_qp *qp); 514a5319752SBernard Metzler void siw_free_qp(struct kref *ref); 515a5319752SBernard Metzler 516a5319752SBernard Metzler void siw_init_terminate(struct siw_qp *qp, enum term_elayer layer, 517a5319752SBernard Metzler u8 etype, u8 ecode, int in_tx); 518a5319752SBernard Metzler enum ddp_ecode siw_tagged_error(enum siw_access_state state); 519a5319752SBernard Metzler enum rdmap_ecode siw_rdmap_error(enum siw_access_state state); 520a5319752SBernard Metzler 521a5319752SBernard Metzler void siw_read_to_orq(struct siw_sqe *rreq, struct siw_sqe *sqe); 522a5319752SBernard Metzler int siw_sqe_complete(struct siw_qp *qp, struct siw_sqe *sqe, u32 bytes, 523a5319752SBernard Metzler enum siw_wc_status status); 524a5319752SBernard Metzler int siw_rqe_complete(struct siw_qp *qp, struct siw_rqe *rqe, u32 bytes, 525a5319752SBernard Metzler u32 inval_stag, enum siw_wc_status status); 526a5319752SBernard Metzler void siw_qp_llp_data_ready(struct sock *sk); 527a5319752SBernard Metzler void siw_qp_llp_write_space(struct sock *sk); 528a5319752SBernard Metzler 529a5319752SBernard Metzler /* QP TX path functions */ 53091f36237SBernard Metzler int siw_create_tx_threads(void); 53191f36237SBernard Metzler void siw_stop_tx_threads(void); 532a5319752SBernard Metzler int siw_run_sq(void *arg); 533a5319752SBernard Metzler int siw_qp_sq_process(struct siw_qp *qp); 534a5319752SBernard Metzler int siw_sq_start(struct siw_qp *qp); 535a5319752SBernard Metzler int siw_activate_tx(struct siw_qp *qp); 536a5319752SBernard Metzler int siw_get_tx_cpu(struct siw_device *sdev); 537a5319752SBernard Metzler void siw_put_tx_cpu(int cpu); 538a5319752SBernard Metzler 539a5319752SBernard Metzler /* QP RX path functions */ 540a5319752SBernard Metzler int siw_proc_send(struct siw_qp *qp); 541a5319752SBernard Metzler int siw_proc_rreq(struct siw_qp *qp); 542a5319752SBernard Metzler int siw_proc_rresp(struct siw_qp *qp); 543a5319752SBernard Metzler int siw_proc_write(struct siw_qp *qp); 544a5319752SBernard Metzler int siw_proc_terminate(struct siw_qp *qp); 545a5319752SBernard Metzler 546a5319752SBernard Metzler int siw_tcp_rx_data(read_descriptor_t *rd_desc, struct sk_buff *skb, 547a5319752SBernard Metzler unsigned int off, size_t len); 548a5319752SBernard Metzler 549a5319752SBernard Metzler static inline void set_rx_fpdu_context(struct siw_qp *qp, u8 opcode) 550a5319752SBernard Metzler { 551a5319752SBernard Metzler if (opcode == RDMAP_RDMA_WRITE || opcode == RDMAP_RDMA_READ_RESP) 552a5319752SBernard Metzler qp->rx_fpdu = &qp->rx_tagged; 553a5319752SBernard Metzler else 554a5319752SBernard Metzler qp->rx_fpdu = &qp->rx_untagged; 555a5319752SBernard Metzler 556a5319752SBernard Metzler qp->rx_stream.rdmap_op = opcode; 557a5319752SBernard Metzler } 558a5319752SBernard Metzler 559a5319752SBernard Metzler static inline struct siw_ucontext *to_siw_ctx(struct ib_ucontext *base_ctx) 560a5319752SBernard Metzler { 561a5319752SBernard Metzler return container_of(base_ctx, struct siw_ucontext, base_ucontext); 562a5319752SBernard Metzler } 563a5319752SBernard Metzler 564a5319752SBernard Metzler static inline struct siw_qp *to_siw_qp(struct ib_qp *base_qp) 565a5319752SBernard Metzler { 56658fb0b56SBernard Metzler return container_of(base_qp, struct siw_qp, base_qp); 567a5319752SBernard Metzler } 568a5319752SBernard Metzler 569a5319752SBernard Metzler static inline struct siw_cq *to_siw_cq(struct ib_cq *base_cq) 570a5319752SBernard Metzler { 571a5319752SBernard Metzler return container_of(base_cq, struct siw_cq, base_cq); 572a5319752SBernard Metzler } 573a5319752SBernard Metzler 574a5319752SBernard Metzler static inline struct siw_srq *to_siw_srq(struct ib_srq *base_srq) 575a5319752SBernard Metzler { 576a5319752SBernard Metzler return container_of(base_srq, struct siw_srq, base_srq); 577a5319752SBernard Metzler } 578a5319752SBernard Metzler 579a5319752SBernard Metzler static inline struct siw_device *to_siw_dev(struct ib_device *base_dev) 580a5319752SBernard Metzler { 581a5319752SBernard Metzler return container_of(base_dev, struct siw_device, base_dev); 582a5319752SBernard Metzler } 583a5319752SBernard Metzler 584a5319752SBernard Metzler static inline struct siw_mr *to_siw_mr(struct ib_mr *base_mr) 585a5319752SBernard Metzler { 586a5319752SBernard Metzler return container_of(base_mr, struct siw_mr, base_mr); 587a5319752SBernard Metzler } 588a5319752SBernard Metzler 58911f1a755SMichal Kalderon static inline struct siw_user_mmap_entry * 59011f1a755SMichal Kalderon to_siw_mmap_entry(struct rdma_user_mmap_entry *rdma_mmap) 59111f1a755SMichal Kalderon { 59211f1a755SMichal Kalderon return container_of(rdma_mmap, struct siw_user_mmap_entry, rdma_entry); 59311f1a755SMichal Kalderon } 59411f1a755SMichal Kalderon 595a5319752SBernard Metzler static inline struct siw_qp *siw_qp_id2obj(struct siw_device *sdev, int id) 596a5319752SBernard Metzler { 597a5319752SBernard Metzler struct siw_qp *qp; 598a5319752SBernard Metzler 599a5319752SBernard Metzler rcu_read_lock(); 600a5319752SBernard Metzler qp = xa_load(&sdev->qp_xa, id); 601a5319752SBernard Metzler if (likely(qp && kref_get_unless_zero(&qp->ref))) { 602a5319752SBernard Metzler rcu_read_unlock(); 603a5319752SBernard Metzler return qp; 604a5319752SBernard Metzler } 605a5319752SBernard Metzler rcu_read_unlock(); 606a5319752SBernard Metzler return NULL; 607a5319752SBernard Metzler } 608a5319752SBernard Metzler 609a5319752SBernard Metzler static inline u32 qp_id(struct siw_qp *qp) 610a5319752SBernard Metzler { 61158fb0b56SBernard Metzler return qp->base_qp.qp_num; 612a5319752SBernard Metzler } 613a5319752SBernard Metzler 614a5319752SBernard Metzler static inline void siw_qp_get(struct siw_qp *qp) 615a5319752SBernard Metzler { 616a5319752SBernard Metzler kref_get(&qp->ref); 617a5319752SBernard Metzler } 618a5319752SBernard Metzler 619a5319752SBernard Metzler static inline void siw_qp_put(struct siw_qp *qp) 620a5319752SBernard Metzler { 621a5319752SBernard Metzler kref_put(&qp->ref, siw_free_qp); 622a5319752SBernard Metzler } 623a5319752SBernard Metzler 624a5319752SBernard Metzler static inline int siw_sq_empty(struct siw_qp *qp) 625a5319752SBernard Metzler { 626a5319752SBernard Metzler struct siw_sqe *sqe = &qp->sendq[qp->sq_get % qp->attrs.sq_size]; 627a5319752SBernard Metzler 628a5319752SBernard Metzler return READ_ONCE(sqe->flags) == 0; 629a5319752SBernard Metzler } 630a5319752SBernard Metzler 631a5319752SBernard Metzler static inline struct siw_sqe *sq_get_next(struct siw_qp *qp) 632a5319752SBernard Metzler { 633a5319752SBernard Metzler struct siw_sqe *sqe = &qp->sendq[qp->sq_get % qp->attrs.sq_size]; 634a5319752SBernard Metzler 635a5319752SBernard Metzler if (READ_ONCE(sqe->flags) & SIW_WQE_VALID) 636a5319752SBernard Metzler return sqe; 637a5319752SBernard Metzler 638a5319752SBernard Metzler return NULL; 639a5319752SBernard Metzler } 640a5319752SBernard Metzler 641a5319752SBernard Metzler static inline struct siw_sqe *orq_get_current(struct siw_qp *qp) 642a5319752SBernard Metzler { 643a5319752SBernard Metzler return &qp->orq[qp->orq_get % qp->attrs.orq_size]; 644a5319752SBernard Metzler } 645a5319752SBernard Metzler 646a5319752SBernard Metzler static inline struct siw_sqe *orq_get_free(struct siw_qp *qp) 647a5319752SBernard Metzler { 648b43a76f4SBernard Metzler struct siw_sqe *orq_e = &qp->orq[qp->orq_put % qp->attrs.orq_size]; 649a5319752SBernard Metzler 650661f3859SBernard Metzler if (READ_ONCE(orq_e->flags) == 0) 651a5319752SBernard Metzler return orq_e; 652a5319752SBernard Metzler 653a5319752SBernard Metzler return NULL; 654a5319752SBernard Metzler } 655a5319752SBernard Metzler 656a5319752SBernard Metzler static inline int siw_orq_empty(struct siw_qp *qp) 657a5319752SBernard Metzler { 658b7a2768aSGuoqing Jiang return orq_get_current(qp)->flags == 0 ? 1 : 0; 659a5319752SBernard Metzler } 660a5319752SBernard Metzler 661a5319752SBernard Metzler static inline struct siw_sqe *irq_alloc_free(struct siw_qp *qp) 662a5319752SBernard Metzler { 663a5319752SBernard Metzler struct siw_sqe *irq_e = &qp->irq[qp->irq_put % qp->attrs.irq_size]; 664a5319752SBernard Metzler 665a5319752SBernard Metzler if (READ_ONCE(irq_e->flags) == 0) { 666a5319752SBernard Metzler qp->irq_put++; 667a5319752SBernard Metzler return irq_e; 668a5319752SBernard Metzler } 669a5319752SBernard Metzler return NULL; 670a5319752SBernard Metzler } 671a5319752SBernard Metzler 672426370c8SEric Biggers static inline void siw_crc_init(u32 *crc) 673426370c8SEric Biggers { 674426370c8SEric Biggers *crc = ~0; 675426370c8SEric Biggers } 676426370c8SEric Biggers 677426370c8SEric Biggers static inline void siw_crc_update(u32 *crc, const void *data, size_t len) 678426370c8SEric Biggers { 679426370c8SEric Biggers *crc = crc32c(*crc, data, len); 680426370c8SEric Biggers } 681426370c8SEric Biggers 682426370c8SEric Biggers static inline void siw_crc_final(u32 *crc, u8 out[4]) 683426370c8SEric Biggers { 684426370c8SEric Biggers put_unaligned_le32(~*crc, out); 685426370c8SEric Biggers } 686426370c8SEric Biggers 687426370c8SEric Biggers static inline void siw_crc_oneshot(const void *data, size_t len, u8 out[4]) 688426370c8SEric Biggers { 689426370c8SEric Biggers u32 crc; 690426370c8SEric Biggers 691426370c8SEric Biggers siw_crc_init(&crc); 692426370c8SEric Biggers siw_crc_update(&crc, data, len); 693426370c8SEric Biggers return siw_crc_final(&crc, out); 694426370c8SEric Biggers } 695426370c8SEric Biggers 696a5319752SBernard Metzler static inline __wsum siw_csum_update(const void *buff, int len, __wsum sum) 697a5319752SBernard Metzler { 698a5319752SBernard Metzler return (__force __wsum)crc32c((__force __u32)sum, buff, len); 699a5319752SBernard Metzler } 700a5319752SBernard Metzler 701a5319752SBernard Metzler static inline __wsum siw_csum_combine(__wsum csum, __wsum csum2, int offset, 702a5319752SBernard Metzler int len) 703a5319752SBernard Metzler { 704c64e6570SEric Biggers return (__force __wsum)crc32c_combine((__force __u32)csum, 705a5319752SBernard Metzler (__force __u32)csum2, len); 706a5319752SBernard Metzler } 707a5319752SBernard Metzler 708a5319752SBernard Metzler static inline void siw_crc_skb(struct siw_rx_stream *srx, unsigned int len) 709a5319752SBernard Metzler { 710a5319752SBernard Metzler const struct skb_checksum_ops siw_cs_ops = { 711a5319752SBernard Metzler .update = siw_csum_update, 712a5319752SBernard Metzler .combine = siw_csum_combine, 713a5319752SBernard Metzler }; 714426370c8SEric Biggers __wsum crc = (__force __wsum)srx->mpa_crc; 715a5319752SBernard Metzler 716a5319752SBernard Metzler crc = __skb_checksum(srx->skb, srx->skb_offset, len, crc, 717a5319752SBernard Metzler &siw_cs_ops); 718426370c8SEric Biggers srx->mpa_crc = (__force u32)crc; 719a5319752SBernard Metzler } 720a5319752SBernard Metzler 721a5319752SBernard Metzler #define siw_dbg(ibdev, fmt, ...) \ 722a5319752SBernard Metzler ibdev_dbg(ibdev, "%s: " fmt, __func__, ##__VA_ARGS__) 723a5319752SBernard Metzler 724a5319752SBernard Metzler #define siw_dbg_qp(qp, fmt, ...) \ 725a5319752SBernard Metzler ibdev_dbg(&qp->sdev->base_dev, "QP[%u] %s: " fmt, qp_id(qp), __func__, \ 726a5319752SBernard Metzler ##__VA_ARGS__) 727a5319752SBernard Metzler 728a5319752SBernard Metzler #define siw_dbg_cq(cq, fmt, ...) \ 729a5319752SBernard Metzler ibdev_dbg(cq->base_cq.device, "CQ[%u] %s: " fmt, cq->id, __func__, \ 730a5319752SBernard Metzler ##__VA_ARGS__) 731a5319752SBernard Metzler 732a5319752SBernard Metzler #define siw_dbg_pd(pd, fmt, ...) \ 733a5319752SBernard Metzler ibdev_dbg(pd->device, "PD[%u] %s: " fmt, pd->res.id, __func__, \ 734a5319752SBernard Metzler ##__VA_ARGS__) 735a5319752SBernard Metzler 736a5319752SBernard Metzler #define siw_dbg_mem(mem, fmt, ...) \ 737a5319752SBernard Metzler ibdev_dbg(&mem->sdev->base_dev, \ 738a5319752SBernard Metzler "MEM[0x%08x] %s: " fmt, mem->stag, __func__, ##__VA_ARGS__) 739a5319752SBernard Metzler 740a5319752SBernard Metzler #define siw_dbg_cep(cep, fmt, ...) \ 741*9334003dSThomas Weißschuh ibdev_dbg(&cep->sdev->base_dev, "CEP[0x%p] %s: " fmt, \ 742a5319752SBernard Metzler cep, __func__, ##__VA_ARGS__) 743a5319752SBernard Metzler 744a5319752SBernard Metzler void siw_cq_flush(struct siw_cq *cq); 745a5319752SBernard Metzler void siw_sq_flush(struct siw_qp *qp); 746a5319752SBernard Metzler void siw_rq_flush(struct siw_qp *qp); 747a5319752SBernard Metzler int siw_reap_cqe(struct siw_cq *cq, struct ib_wc *wc); 748a5319752SBernard Metzler 749a5319752SBernard Metzler #endif 750