13ec648c6SKrzysztof Kozlowski /* SPDX-License-Identifier: GPL-2.0 OR BSD-3-Clause */
2a5319752SBernard Metzler
3a5319752SBernard Metzler /* Authors: Bernard Metzler <bmt@zurich.ibm.com> */
4a5319752SBernard Metzler /* Copyright (c) 2008-2019, IBM Corporation */
5a5319752SBernard Metzler
6a5319752SBernard Metzler #ifndef _SIW_H
7a5319752SBernard Metzler #define _SIW_H
8a5319752SBernard Metzler
9a5319752SBernard Metzler #include <rdma/ib_verbs.h>
1058fb0b56SBernard Metzler #include <rdma/restrack.h>
11a5319752SBernard Metzler #include <linux/socket.h>
12a5319752SBernard Metzler #include <linux/skbuff.h>
13a5319752SBernard Metzler #include <linux/crc32.h>
14a5319752SBernard Metzler #include <linux/crc32c.h>
15426370c8SEric Biggers #include <linux/unaligned.h>
16a5319752SBernard Metzler
17a5319752SBernard Metzler #include <rdma/siw-abi.h>
18a5319752SBernard Metzler #include "iwarp.h"
19a5319752SBernard Metzler
/*
 * Device identification and compile-time resource limits.
 * Several limits are derived from SIW_MAX_QP and SIW_MAX_QP_WR.
 */
#define SIW_VENDOR_ID 0x626d74 /* ascii 'bmt' for now */
/* NOTE(review): spelled "VENDORT"; name kept since users may reference it */
#define SIW_VENDORT_PART_ID 0
#define SIW_MAX_QP (1024 * 100)
#define SIW_MAX_QP_WR (1024 * 32)
#define SIW_MAX_ORD_QP 128
#define SIW_MAX_IRD_QP 128
#define SIW_MAX_SGE_PBL 256 /* max num sge's for PBL */
#define SIW_MAX_SGE_RD 1 /* iwarp limitation. we could relax */
#define SIW_MAX_CQ (1024 * 100)
#define SIW_MAX_CQE (SIW_MAX_QP_WR * 100)
#define SIW_MAX_MR (SIW_MAX_QP * 10)
#define SIW_MAX_PD SIW_MAX_QP
#define SIW_MAX_MW 0 /* to be set if MW's are supported */
#define SIW_MAX_SRQ SIW_MAX_QP
#define SIW_MAX_SRQ_WR (SIW_MAX_QP_WR * 10)
#define SIW_MAX_CONTEXT SIW_MAX_PD
36a5319752SBernard Metzler
/* Min number of bytes for using zero copy transmit */
#define SENDPAGE_THRESH PAGE_SIZE

/* Maximum number of frames which can be sent in one SQ processing */
#define SQ_USER_MAXBURST 100

/*
 * Maximum number of consecutive IRQ elements which get served
 * if SQ has pending work. Prevents starving local SQ processing
 * by serving peer Read Requests.
 */
#define SIW_IRQ_MAXBURST_SQ_ACTIVE 4

/* There is always only a port 1 per siw device */
#define SIW_PORT 1
5116b87037SBernard Metzler
/*
 * Capability limits of a siw device, one value per resource class.
 * Embedded in struct siw_device as 'attrs'.
 */
struct siw_dev_cap {
	int max_qp;
	int max_qp_wr;
	int max_ord; /* max. outbound read queue depth */
	int max_ird; /* max. inbound read queue depth */
	int max_sge;
	int max_sge_rd;
	int max_cq;
	int max_cqe;
	int max_mr;
	int max_pd;
	int max_mw;
	int max_srq;
	int max_srq_wr;
	int max_srq_sge;
};
68a5319752SBernard Metzler
69a5319752SBernard Metzler struct siw_pd {
70a5319752SBernard Metzler struct ib_pd base_pd;
71a5319752SBernard Metzler };
72a5319752SBernard Metzler
73a5319752SBernard Metzler struct siw_device {
74a5319752SBernard Metzler struct ib_device base_dev;
75a5319752SBernard Metzler struct siw_dev_cap attrs;
76a5319752SBernard Metzler
77a5319752SBernard Metzler u32 vendor_part_id;
78a5319752SBernard Metzler int numa_node;
79bad5b6e3SChuck Lever char raw_gid[ETH_ALEN];
80a5319752SBernard Metzler
81a5319752SBernard Metzler spinlock_t lock;
82a5319752SBernard Metzler
83a5319752SBernard Metzler struct xarray qp_xa;
84a5319752SBernard Metzler struct xarray mem_xa;
85a5319752SBernard Metzler
86a5319752SBernard Metzler struct list_head cep_list;
87a5319752SBernard Metzler struct list_head qp_list;
88a5319752SBernard Metzler
89a5319752SBernard Metzler /* active objects statistics to enforce limits */
90a5319752SBernard Metzler atomic_t num_qp;
91a5319752SBernard Metzler atomic_t num_cq;
92a5319752SBernard Metzler atomic_t num_pd;
93a5319752SBernard Metzler atomic_t num_mr;
94a5319752SBernard Metzler atomic_t num_srq;
95a5319752SBernard Metzler atomic_t num_ctx;
96a5319752SBernard Metzler };
97a5319752SBernard Metzler
98a5319752SBernard Metzler struct siw_ucontext {
99a5319752SBernard Metzler struct ib_ucontext base_ucontext;
100a5319752SBernard Metzler struct siw_device *sdev;
101a5319752SBernard Metzler };
102a5319752SBernard Metzler
/*
 * The RDMA core does not define LOCAL_READ access, which is always
 * enabled implicitly.
 */
#define IWARP_ACCESS_MASK \
	(IB_ACCESS_LOCAL_WRITE | IB_ACCESS_REMOTE_WRITE | \
	 IB_ACCESS_REMOTE_READ)
110a5319752SBernard Metzler
/*
 * siw presentation of user memory registered as source
 * or target of RDMA operations.
 */

/* One chunk of page pointers; struct siw_umem holds an array of these. */
struct siw_page_chunk {
	struct page **plist;
};
119a5319752SBernard Metzler
120a5319752SBernard Metzler struct siw_umem {
121476b7c7eSBernard Metzler struct ib_umem *base_mem;
122a5319752SBernard Metzler struct siw_page_chunk *page_chunk;
123a5319752SBernard Metzler int num_pages;
124a5319752SBernard Metzler u64 fp_addr; /* First page base address */
125a5319752SBernard Metzler };
126a5319752SBernard Metzler
127a5319752SBernard Metzler struct siw_pble {
128c536277eSBernard Metzler dma_addr_t addr; /* Address of assigned buffer */
129c536277eSBernard Metzler unsigned int size; /* Size of this entry */
130c536277eSBernard Metzler unsigned long pbl_off; /* Total offset from start of PBL */
131a5319752SBernard Metzler };
132a5319752SBernard Metzler
133a5319752SBernard Metzler struct siw_pbl {
134a5319752SBernard Metzler unsigned int num_buf;
135a5319752SBernard Metzler unsigned int max_buf;
1360bc018b7SKees Cook struct siw_pble pbe[] __counted_by(max_buf);
137a5319752SBernard Metzler };
138a5319752SBernard Metzler
139a5319752SBernard Metzler /*
140a5319752SBernard Metzler * Generic memory representation for registered siw memory.
141a5319752SBernard Metzler * Memory lookup always via higher 24 bit of STag (STag index).
142a5319752SBernard Metzler */
143a5319752SBernard Metzler struct siw_mem {
144a5319752SBernard Metzler struct siw_device *sdev;
145a5319752SBernard Metzler struct kref ref;
146a5319752SBernard Metzler u64 va; /* VA of memory */
147a5319752SBernard Metzler u64 len; /* length of the memory buffer in bytes */
148a5319752SBernard Metzler u32 stag; /* iWarp memory access steering tag */
149a5319752SBernard Metzler u8 stag_valid; /* VALID or INVALID */
150a5319752SBernard Metzler u8 is_pbl; /* PBL or user space mem */
151a5319752SBernard Metzler u8 is_mw; /* Memory Region or Memory Window */
152a5319752SBernard Metzler enum ib_access_flags perms; /* local/remote READ & WRITE */
153a5319752SBernard Metzler union {
154a5319752SBernard Metzler struct siw_umem *umem;
155a5319752SBernard Metzler struct siw_pbl *pbl;
156a5319752SBernard Metzler void *mem_obj;
157a5319752SBernard Metzler };
158a5319752SBernard Metzler struct ib_pd *pd;
159a5319752SBernard Metzler };
160a5319752SBernard Metzler
161a5319752SBernard Metzler struct siw_mr {
162a5319752SBernard Metzler struct ib_mr base_mr;
163a5319752SBernard Metzler struct siw_mem *mem;
164a5319752SBernard Metzler struct rcu_head rcu;
165a5319752SBernard Metzler };
166a5319752SBernard Metzler
/*
 * Error codes for local or remote
 * access to registered memory
 */
enum siw_access_state {
	E_ACCESS_OK,
	E_STAG_INVALID,
	E_BASE_BOUNDS,
	E_ACCESS_PERM,
	E_PD_MISMATCH
};
178a5319752SBernard Metzler
/* Processing state of a work request (see struct siw_wqe.wr_status). */
enum siw_wr_state {
	SIW_WR_IDLE,
	SIW_WR_QUEUED, /* processing has not started yet */
	SIW_WR_INPROGRESS /* initiated processing of the WR */
};
184a5319752SBernard Metzler
185a5319752SBernard Metzler /* The WQE currently being processed (RX or TX) */
186a5319752SBernard Metzler struct siw_wqe {
187a5319752SBernard Metzler /* Copy of applications SQE or RQE */
188a5319752SBernard Metzler union {
189a5319752SBernard Metzler struct siw_sqe sqe;
190a5319752SBernard Metzler struct siw_rqe rqe;
191a5319752SBernard Metzler };
192a5319752SBernard Metzler struct siw_mem *mem[SIW_MAX_SGE]; /* per sge's resolved mem */
193a5319752SBernard Metzler enum siw_wr_state wr_status;
194a5319752SBernard Metzler enum siw_wc_status wc_status;
195a5319752SBernard Metzler u32 bytes; /* total bytes to process */
196a5319752SBernard Metzler u32 processed; /* bytes processed */
197a5319752SBernard Metzler };
198a5319752SBernard Metzler
199a5319752SBernard Metzler struct siw_cq {
200a5319752SBernard Metzler struct ib_cq base_cq;
201a5319752SBernard Metzler spinlock_t lock;
2022c8ccb37SBernard Metzler struct siw_cq_ctrl *notify;
203a5319752SBernard Metzler struct siw_cqe *queue;
204a5319752SBernard Metzler u32 cq_put;
205a5319752SBernard Metzler u32 cq_get;
206a5319752SBernard Metzler u32 num_cqe;
20711f1a755SMichal Kalderon struct rdma_user_mmap_entry *cq_entry; /* mmap info for CQE array */
208a5319752SBernard Metzler u32 id; /* For debugging only */
209a5319752SBernard Metzler };
210a5319752SBernard Metzler
/* QP states; SIW_QP_STATE_COUNT is the number of states, not a state. */
enum siw_qp_state {
	SIW_QP_STATE_IDLE,
	SIW_QP_STATE_RTR,
	SIW_QP_STATE_RTS,
	SIW_QP_STATE_CLOSING,
	SIW_QP_STATE_TERMINATE,
	SIW_QP_STATE_ERROR,
	SIW_QP_STATE_COUNT
};
220a5319752SBernard Metzler
/* QP flag bits, stored in struct siw_qp_attrs.flags. */
enum siw_qp_flags {
	SIW_RDMA_BIND_ENABLED = (1 << 0),
	SIW_RDMA_WRITE_ENABLED = (1 << 1),
	SIW_RDMA_READ_ENABLED = (1 << 2),
	SIW_SIGNAL_ALL_WR = (1 << 3),
	SIW_MPA_CRC = (1 << 4),
	SIW_QP_IN_DESTROY = (1 << 5)
};
229a5319752SBernard Metzler
/* Attribute selector bits; passed as 'mask' to siw_qp_modify(). */
enum siw_qp_attr_mask {
	SIW_QP_ATTR_STATE = (1 << 0),
	SIW_QP_ATTR_ACCESS_FLAGS = (1 << 1),
	SIW_QP_ATTR_LLP_HANDLE = (1 << 2),
	SIW_QP_ATTR_ORD = (1 << 3),
	SIW_QP_ATTR_IRD = (1 << 4),
	SIW_QP_ATTR_SQ_SIZE = (1 << 5),
	SIW_QP_ATTR_RQ_SIZE = (1 << 6),
	SIW_QP_ATTR_MPA = (1 << 7)
};
240a5319752SBernard Metzler
241a5319752SBernard Metzler struct siw_srq {
242a5319752SBernard Metzler struct ib_srq base_srq;
243a5319752SBernard Metzler spinlock_t lock;
244a5319752SBernard Metzler u32 max_sge;
245a5319752SBernard Metzler u32 limit; /* low watermark for async event */
246a5319752SBernard Metzler struct siw_rqe *recvq;
247a5319752SBernard Metzler u32 rq_put;
248a5319752SBernard Metzler u32 rq_get;
249a5319752SBernard Metzler u32 num_rqe; /* max # of wqe's allowed */
25011f1a755SMichal Kalderon struct rdma_user_mmap_entry *srq_entry; /* mmap info for SRQ array */
25158fb0b56SBernard Metzler bool armed:1; /* inform user if limit hit */
25258fb0b56SBernard Metzler bool is_kernel_res:1; /* true if kernel client */
253a5319752SBernard Metzler };
254a5319752SBernard Metzler
255a5319752SBernard Metzler struct siw_qp_attrs {
256a5319752SBernard Metzler enum siw_qp_state state;
257a5319752SBernard Metzler u32 sq_size;
258a5319752SBernard Metzler u32 rq_size;
259a5319752SBernard Metzler u32 orq_size;
260a5319752SBernard Metzler u32 irq_size;
261a5319752SBernard Metzler u32 sq_max_sges;
262a5319752SBernard Metzler u32 rq_max_sges;
263a5319752SBernard Metzler enum siw_qp_flags flags;
264a5319752SBernard Metzler
265a5319752SBernard Metzler struct socket *sk;
266a5319752SBernard Metzler };
267a5319752SBernard Metzler
/* Transmit state, stored in struct siw_iwarp_tx.state. */
enum siw_tx_ctx {
	SIW_SEND_HDR, /* start or continue sending HDR */
	SIW_SEND_DATA, /* start or continue sending DDP payload */
	SIW_SEND_TRAILER, /* start or continue sending TRAILER */
	SIW_SEND_SHORT_FPDU /* send whole FPDU hdr|data|trailer at once */
};
274a5319752SBernard Metzler
/* Receive state, stored in struct siw_rx_stream.state. */
enum siw_rx_state {
	SIW_GET_HDR, /* await new hdr or within hdr */
	SIW_GET_DATA_START, /* start of inbound DDP payload */
	SIW_GET_DATA_MORE, /* continuation of (misaligned) DDP payload */
	SIW_GET_TRAILER /* await new trailer or within trailer */
};
281a5319752SBernard Metzler
282a5319752SBernard Metzler struct siw_rx_stream {
283a5319752SBernard Metzler struct sk_buff *skb;
284a5319752SBernard Metzler int skb_new; /* pending unread bytes in skb */
285a5319752SBernard Metzler int skb_offset; /* offset in skb */
286a5319752SBernard Metzler int skb_copied; /* processed bytes in skb */
287a5319752SBernard Metzler
28851ac45a6SGuoqing Jiang enum siw_rx_state state;
28951ac45a6SGuoqing Jiang
290a5319752SBernard Metzler union iwarp_hdr hdr;
291a5319752SBernard Metzler struct mpa_trailer trailer;
292426370c8SEric Biggers u32 mpa_crc;
293426370c8SEric Biggers bool mpa_crc_enabled;
294a5319752SBernard Metzler
295a5319752SBernard Metzler /*
296a5319752SBernard Metzler * For each FPDU, main RX loop runs through 3 stages:
297a5319752SBernard Metzler * Receiving protocol headers, placing DDP payload and receiving
298a5319752SBernard Metzler * trailer information (CRC + possibly padding).
299a5319752SBernard Metzler * Next two variables keep state on receive status of the
300a5319752SBernard Metzler * current FPDU part (hdr, data, trailer).
301a5319752SBernard Metzler */
302a5319752SBernard Metzler int fpdu_part_rcvd; /* bytes in pkt part copied */
303a5319752SBernard Metzler int fpdu_part_rem; /* bytes in pkt part not seen */
304a5319752SBernard Metzler
305a5319752SBernard Metzler /*
306a5319752SBernard Metzler * Next expected DDP MSN for each QN +
307a5319752SBernard Metzler * expected steering tag +
308a5319752SBernard Metzler * expected DDP tagget offset (all HBO)
309a5319752SBernard Metzler */
310a5319752SBernard Metzler u32 ddp_msn[RDMAP_UNTAGGED_QN_COUNT];
311a5319752SBernard Metzler u32 ddp_stag;
312a5319752SBernard Metzler u64 ddp_to;
313a5319752SBernard Metzler u32 inval_stag; /* Stag to be invalidated */
314a5319752SBernard Metzler
315a5319752SBernard Metzler u8 rx_suspend : 1;
316a5319752SBernard Metzler u8 pad : 2; /* # of pad bytes expected */
317a5319752SBernard Metzler u8 rdmap_op : 4; /* opcode of current frame */
318a5319752SBernard Metzler };
319a5319752SBernard Metzler
320a5319752SBernard Metzler struct siw_rx_fpdu {
321a5319752SBernard Metzler /*
322a5319752SBernard Metzler * Local destination memory of inbound RDMA operation.
323a5319752SBernard Metzler * Valid, according to wqe->wr_status
324a5319752SBernard Metzler */
325a5319752SBernard Metzler struct siw_wqe wqe_active;
326a5319752SBernard Metzler
327a5319752SBernard Metzler unsigned int pbl_idx; /* Index into current PBL */
328a5319752SBernard Metzler unsigned int sge_idx; /* current sge in rx */
329a5319752SBernard Metzler unsigned int sge_off; /* already rcvd in curr. sge */
330a5319752SBernard Metzler
331a5319752SBernard Metzler char first_ddp_seg; /* this is the first DDP seg */
332a5319752SBernard Metzler char more_ddp_segs; /* more DDP segs expected */
333a5319752SBernard Metzler u8 prev_rdmap_op : 4; /* opcode of prev frame */
334a5319752SBernard Metzler };
335a5319752SBernard Metzler
336a5319752SBernard Metzler /*
337a5319752SBernard Metzler * Shorthands for short packets w/o payload
338a5319752SBernard Metzler * to be transmitted more efficient.
339a5319752SBernard Metzler */
340a5319752SBernard Metzler struct siw_send_pkt {
341a5319752SBernard Metzler struct iwarp_send send;
342a5319752SBernard Metzler __be32 crc;
343a5319752SBernard Metzler };
344a5319752SBernard Metzler
345a5319752SBernard Metzler struct siw_write_pkt {
346a5319752SBernard Metzler struct iwarp_rdma_write write;
347a5319752SBernard Metzler __be32 crc;
348a5319752SBernard Metzler };
349a5319752SBernard Metzler
350a5319752SBernard Metzler struct siw_rreq_pkt {
351a5319752SBernard Metzler struct iwarp_rdma_rreq rreq;
352a5319752SBernard Metzler __be32 crc;
353a5319752SBernard Metzler };
354a5319752SBernard Metzler
355a5319752SBernard Metzler struct siw_rresp_pkt {
356a5319752SBernard Metzler struct iwarp_rdma_rresp rresp;
357a5319752SBernard Metzler __be32 crc;
358a5319752SBernard Metzler };
359a5319752SBernard Metzler
360a5319752SBernard Metzler struct siw_iwarp_tx {
361a5319752SBernard Metzler union {
362a5319752SBernard Metzler union iwarp_hdr hdr;
363a5319752SBernard Metzler
364a5319752SBernard Metzler /* Generic part of FPDU header */
365a5319752SBernard Metzler struct iwarp_ctrl ctrl;
366a5319752SBernard Metzler struct iwarp_ctrl_untagged c_untagged;
367a5319752SBernard Metzler struct iwarp_ctrl_tagged c_tagged;
368a5319752SBernard Metzler
369a5319752SBernard Metzler /* FPDU headers */
370a5319752SBernard Metzler struct iwarp_rdma_write rwrite;
371a5319752SBernard Metzler struct iwarp_rdma_rreq rreq;
372a5319752SBernard Metzler struct iwarp_rdma_rresp rresp;
373a5319752SBernard Metzler struct iwarp_terminate terminate;
374a5319752SBernard Metzler struct iwarp_send send;
375a5319752SBernard Metzler struct iwarp_send_inv send_inv;
376a5319752SBernard Metzler
377a5319752SBernard Metzler /* complete short FPDUs */
378a5319752SBernard Metzler struct siw_send_pkt send_pkt;
379a5319752SBernard Metzler struct siw_write_pkt write_pkt;
380a5319752SBernard Metzler struct siw_rreq_pkt rreq_pkt;
381a5319752SBernard Metzler struct siw_rresp_pkt rresp_pkt;
382a5319752SBernard Metzler } pkt;
383a5319752SBernard Metzler
384a5319752SBernard Metzler struct mpa_trailer trailer;
385a5319752SBernard Metzler /* DDP MSN for untagged messages */
386a5319752SBernard Metzler u32 ddp_msn[RDMAP_UNTAGGED_QN_COUNT];
387a5319752SBernard Metzler
388a5319752SBernard Metzler enum siw_tx_ctx state;
389a5319752SBernard Metzler u16 ctrl_len; /* ddp+rdmap hdr */
390a5319752SBernard Metzler u16 ctrl_sent;
391a5319752SBernard Metzler int burst;
392a5319752SBernard Metzler int bytes_unsent; /* ddp payload bytes */
393a5319752SBernard Metzler
394426370c8SEric Biggers u32 mpa_crc;
395426370c8SEric Biggers bool mpa_crc_enabled;
396a5319752SBernard Metzler
397a5319752SBernard Metzler u8 do_crc : 1; /* do crc for segment */
398a5319752SBernard Metzler u8 use_sendpage : 1; /* send w/o copy */
399a5319752SBernard Metzler u8 tx_suspend : 1; /* stop sending DDP segs. */
400a5319752SBernard Metzler u8 pad : 2; /* # pad in current fpdu */
401a5319752SBernard Metzler u8 orq_fence : 1; /* ORQ full or Send fenced */
402a5319752SBernard Metzler u8 in_syscall : 1; /* TX out of user context */
403a5319752SBernard Metzler u8 zcopy_tx : 1; /* Use TCP_SENDPAGE if possible */
404a5319752SBernard Metzler u8 gso_seg_limit; /* Maximum segments for GSO, 0 = unbound */
405a5319752SBernard Metzler
406a5319752SBernard Metzler u16 fpdu_len; /* len of FPDU to tx */
407a5319752SBernard Metzler unsigned int tcp_seglen; /* remaining tcp seg space */
408a5319752SBernard Metzler
409a5319752SBernard Metzler struct siw_wqe wqe_active;
410a5319752SBernard Metzler
411a5319752SBernard Metzler int pbl_idx; /* Index into current PBL */
412a5319752SBernard Metzler int sge_idx; /* current sge in tx */
413a5319752SBernard Metzler u32 sge_off; /* already sent in curr. sge */
414a5319752SBernard Metzler };
415a5319752SBernard Metzler
416a5319752SBernard Metzler struct siw_qp {
41758fb0b56SBernard Metzler struct ib_qp base_qp;
418a5319752SBernard Metzler struct siw_device *sdev;
41984de14baSGuoqing Jiang int tx_cpu;
420a5319752SBernard Metzler struct kref ref;
421a3c27880SBernard Metzler struct completion qp_free;
422a5319752SBernard Metzler struct list_head devq;
423a5319752SBernard Metzler struct siw_qp_attrs attrs;
424a5319752SBernard Metzler
425a5319752SBernard Metzler struct siw_cep *cep;
426a5319752SBernard Metzler struct rw_semaphore state_lock;
427a5319752SBernard Metzler
428a5319752SBernard Metzler struct ib_pd *pd;
429a5319752SBernard Metzler struct siw_cq *scq;
430a5319752SBernard Metzler struct siw_cq *rcq;
431a5319752SBernard Metzler struct siw_srq *srq;
432a5319752SBernard Metzler
433a5319752SBernard Metzler struct siw_iwarp_tx tx_ctx; /* Transmit context */
434a5319752SBernard Metzler spinlock_t sq_lock;
435a5319752SBernard Metzler struct siw_sqe *sendq; /* send queue element array */
436a5319752SBernard Metzler uint32_t sq_get; /* consumer index into sq array */
437a5319752SBernard Metzler uint32_t sq_put; /* kernel prod. index into sq array */
438a5319752SBernard Metzler struct llist_node tx_list;
439a5319752SBernard Metzler
440a5319752SBernard Metzler struct siw_sqe *orq; /* outbound read queue element array */
441a5319752SBernard Metzler spinlock_t orq_lock;
442a5319752SBernard Metzler uint32_t orq_get; /* consumer index into orq array */
443a5319752SBernard Metzler uint32_t orq_put; /* shared producer index for ORQ */
444a5319752SBernard Metzler
445a5319752SBernard Metzler struct siw_rx_stream rx_stream;
446a5319752SBernard Metzler struct siw_rx_fpdu *rx_fpdu;
447a5319752SBernard Metzler struct siw_rx_fpdu rx_tagged;
448a5319752SBernard Metzler struct siw_rx_fpdu rx_untagged;
449a5319752SBernard Metzler spinlock_t rq_lock;
450a5319752SBernard Metzler struct siw_rqe *recvq; /* recv queue element array */
451a5319752SBernard Metzler uint32_t rq_get; /* consumer index into rq array */
452a5319752SBernard Metzler uint32_t rq_put; /* kernel prod. index into rq array */
453a5319752SBernard Metzler
454a5319752SBernard Metzler struct siw_sqe *irq; /* inbound read queue element array */
455a5319752SBernard Metzler uint32_t irq_get; /* consumer index into irq array */
456a5319752SBernard Metzler uint32_t irq_put; /* producer index into irq array */
457a5319752SBernard Metzler int irq_burst;
458a5319752SBernard Metzler
459a5319752SBernard Metzler struct { /* information to be carried in TERMINATE pkt, if valid */
460a5319752SBernard Metzler u8 valid;
461a5319752SBernard Metzler u8 in_tx;
462a5319752SBernard Metzler u8 layer : 4, etype : 4;
463a5319752SBernard Metzler u8 ecode;
464a5319752SBernard Metzler } term_info;
46511f1a755SMichal Kalderon struct rdma_user_mmap_entry *sq_entry; /* mmap info for SQE array */
46611f1a755SMichal Kalderon struct rdma_user_mmap_entry *rq_entry; /* mmap info for RQE array */
467a5319752SBernard Metzler };
468a5319752SBernard Metzler
/*
 * helper macros
 *
 * rx_qp()/tx_qp() map an embedded rx_stream/tx_ctx pointer back to its
 * struct siw_qp; the others are accessors for the active WQE.
 */
#define rx_qp(rx) container_of(rx, struct siw_qp, rx_stream)
#define tx_qp(tx) container_of(tx, struct siw_qp, tx_ctx)
#define tx_wqe(qp) (&(qp)->tx_ctx.wqe_active)
#define rx_wqe(rctx) (&(rctx)->wqe_active)
#define rx_mem(rctx) ((rctx)->wqe_active.mem[0])
#define tx_type(wqe) ((wqe)->sqe.opcode)
#define rx_type(wqe) ((wqe)->rqe.opcode)
#define tx_flags(wqe) ((wqe)->sqe.flags)
478a5319752SBernard Metzler
479a5319752SBernard Metzler struct iwarp_msg_info {
480a5319752SBernard Metzler int hdr_len;
481a5319752SBernard Metzler struct iwarp_ctrl ctrl;
482a5319752SBernard Metzler int (*rx_data)(struct siw_qp *qp);
483a5319752SBernard Metzler };
484a5319752SBernard Metzler
48511f1a755SMichal Kalderon struct siw_user_mmap_entry {
48611f1a755SMichal Kalderon struct rdma_user_mmap_entry rdma_entry;
48711f1a755SMichal Kalderon void *address;
48811f1a755SMichal Kalderon };
48911f1a755SMichal Kalderon
490a5319752SBernard Metzler /* Global siw parameters. Currently set in siw_main.c */
491a5319752SBernard Metzler extern const bool zcopy_tx;
492a5319752SBernard Metzler extern const bool try_gso;
493a5319752SBernard Metzler extern const bool loopback_enabled;
494a5319752SBernard Metzler extern const bool mpa_crc_required;
495a5319752SBernard Metzler extern const bool mpa_crc_strict;
496a5319752SBernard Metzler extern const bool siw_tcp_nagle;
497a5319752SBernard Metzler extern u_char mpa_version;
498a5319752SBernard Metzler extern const bool peer_to_peer;
499a5319752SBernard Metzler extern struct task_struct *siw_tx_thread[];
500a5319752SBernard Metzler
501a5319752SBernard Metzler extern struct iwarp_msg_info iwarp_pktinfo[RDMAP_TERMINATE + 1];
502a5319752SBernard Metzler
503a5319752SBernard Metzler /* QP general functions */
504a5319752SBernard Metzler int siw_qp_modify(struct siw_qp *qp, struct siw_qp_attrs *attr,
505a5319752SBernard Metzler enum siw_qp_attr_mask mask);
506a5319752SBernard Metzler int siw_qp_mpa_rts(struct siw_qp *qp, enum mpa_v2_ctrl ctrl);
507a5319752SBernard Metzler void siw_qp_llp_close(struct siw_qp *qp);
508a5319752SBernard Metzler void siw_qp_cm_drop(struct siw_qp *qp, int schedule);
509a5319752SBernard Metzler void siw_send_terminate(struct siw_qp *qp);
510a5319752SBernard Metzler
511a5319752SBernard Metzler void siw_qp_get_ref(struct ib_qp *qp);
512a5319752SBernard Metzler void siw_qp_put_ref(struct ib_qp *qp);
513a5319752SBernard Metzler int siw_qp_add(struct siw_device *sdev, struct siw_qp *qp);
514a5319752SBernard Metzler void siw_free_qp(struct kref *ref);
515a5319752SBernard Metzler
516a5319752SBernard Metzler void siw_init_terminate(struct siw_qp *qp, enum term_elayer layer,
517a5319752SBernard Metzler u8 etype, u8 ecode, int in_tx);
518a5319752SBernard Metzler enum ddp_ecode siw_tagged_error(enum siw_access_state state);
519a5319752SBernard Metzler enum rdmap_ecode siw_rdmap_error(enum siw_access_state state);
520a5319752SBernard Metzler
521a5319752SBernard Metzler void siw_read_to_orq(struct siw_sqe *rreq, struct siw_sqe *sqe);
522a5319752SBernard Metzler int siw_sqe_complete(struct siw_qp *qp, struct siw_sqe *sqe, u32 bytes,
523a5319752SBernard Metzler enum siw_wc_status status);
524a5319752SBernard Metzler int siw_rqe_complete(struct siw_qp *qp, struct siw_rqe *rqe, u32 bytes,
525a5319752SBernard Metzler u32 inval_stag, enum siw_wc_status status);
526a5319752SBernard Metzler void siw_qp_llp_data_ready(struct sock *sk);
527a5319752SBernard Metzler void siw_qp_llp_write_space(struct sock *sk);
528a5319752SBernard Metzler
/* QP TX path functions */
int siw_create_tx_threads(void);
void siw_stop_tx_threads(void);
int siw_run_sq(void *arg);
int siw_qp_sq_process(struct siw_qp *qp);
int siw_sq_start(struct siw_qp *qp);
int siw_activate_tx(struct siw_qp *qp);
int siw_get_tx_cpu(struct siw_device *sdev);
void siw_put_tx_cpu(int cpu);
538a5319752SBernard Metzler
539a5319752SBernard Metzler /* QP RX path functions */
540a5319752SBernard Metzler int siw_proc_send(struct siw_qp *qp);
541a5319752SBernard Metzler int siw_proc_rreq(struct siw_qp *qp);
542a5319752SBernard Metzler int siw_proc_rresp(struct siw_qp *qp);
543a5319752SBernard Metzler int siw_proc_write(struct siw_qp *qp);
544a5319752SBernard Metzler int siw_proc_terminate(struct siw_qp *qp);
545a5319752SBernard Metzler
546a5319752SBernard Metzler int siw_tcp_rx_data(read_descriptor_t *rd_desc, struct sk_buff *skb,
547a5319752SBernard Metzler unsigned int off, size_t len);
548a5319752SBernard Metzler
/*
 * Select the receive FPDU context matching @opcode and record the
 * opcode in the rx stream. RDMA Write and RDMA Read Response use the
 * tagged context; every other opcode uses the untagged one.
 */
static inline void set_rx_fpdu_context(struct siw_qp *qp, u8 opcode)
{
	if (opcode == RDMAP_RDMA_WRITE || opcode == RDMAP_RDMA_READ_RESP)
		qp->rx_fpdu = &qp->rx_tagged;
	else
		qp->rx_fpdu = &qp->rx_untagged;

	qp->rx_stream.rdmap_op = opcode;
}
558a5319752SBernard Metzler
to_siw_ctx(struct ib_ucontext * base_ctx)559a5319752SBernard Metzler static inline struct siw_ucontext *to_siw_ctx(struct ib_ucontext *base_ctx)
560a5319752SBernard Metzler {
561a5319752SBernard Metzler return container_of(base_ctx, struct siw_ucontext, base_ucontext);
562a5319752SBernard Metzler }
563a5319752SBernard Metzler
to_siw_qp(struct ib_qp * base_qp)564a5319752SBernard Metzler static inline struct siw_qp *to_siw_qp(struct ib_qp *base_qp)
565a5319752SBernard Metzler {
56658fb0b56SBernard Metzler return container_of(base_qp, struct siw_qp, base_qp);
567a5319752SBernard Metzler }
568a5319752SBernard Metzler
to_siw_cq(struct ib_cq * base_cq)569a5319752SBernard Metzler static inline struct siw_cq *to_siw_cq(struct ib_cq *base_cq)
570a5319752SBernard Metzler {
571a5319752SBernard Metzler return container_of(base_cq, struct siw_cq, base_cq);
572a5319752SBernard Metzler }
573a5319752SBernard Metzler
to_siw_srq(struct ib_srq * base_srq)574a5319752SBernard Metzler static inline struct siw_srq *to_siw_srq(struct ib_srq *base_srq)
575a5319752SBernard Metzler {
576a5319752SBernard Metzler return container_of(base_srq, struct siw_srq, base_srq);
577a5319752SBernard Metzler }
578a5319752SBernard Metzler
to_siw_dev(struct ib_device * base_dev)579a5319752SBernard Metzler static inline struct siw_device *to_siw_dev(struct ib_device *base_dev)
580a5319752SBernard Metzler {
581a5319752SBernard Metzler return container_of(base_dev, struct siw_device, base_dev);
582a5319752SBernard Metzler }
583a5319752SBernard Metzler
to_siw_mr(struct ib_mr * base_mr)584a5319752SBernard Metzler static inline struct siw_mr *to_siw_mr(struct ib_mr *base_mr)
585a5319752SBernard Metzler {
586a5319752SBernard Metzler return container_of(base_mr, struct siw_mr, base_mr);
587a5319752SBernard Metzler }
588a5319752SBernard Metzler
58911f1a755SMichal Kalderon static inline struct siw_user_mmap_entry *
to_siw_mmap_entry(struct rdma_user_mmap_entry * rdma_mmap)59011f1a755SMichal Kalderon to_siw_mmap_entry(struct rdma_user_mmap_entry *rdma_mmap)
59111f1a755SMichal Kalderon {
59211f1a755SMichal Kalderon return container_of(rdma_mmap, struct siw_user_mmap_entry, rdma_entry);
59311f1a755SMichal Kalderon }
59411f1a755SMichal Kalderon
siw_qp_id2obj(struct siw_device * sdev,int id)595a5319752SBernard Metzler static inline struct siw_qp *siw_qp_id2obj(struct siw_device *sdev, int id)
596a5319752SBernard Metzler {
597a5319752SBernard Metzler struct siw_qp *qp;
598a5319752SBernard Metzler
599a5319752SBernard Metzler rcu_read_lock();
600a5319752SBernard Metzler qp = xa_load(&sdev->qp_xa, id);
601a5319752SBernard Metzler if (likely(qp && kref_get_unless_zero(&qp->ref))) {
602a5319752SBernard Metzler rcu_read_unlock();
603a5319752SBernard Metzler return qp;
604a5319752SBernard Metzler }
605a5319752SBernard Metzler rcu_read_unlock();
606a5319752SBernard Metzler return NULL;
607a5319752SBernard Metzler }
608a5319752SBernard Metzler
qp_id(struct siw_qp * qp)609a5319752SBernard Metzler static inline u32 qp_id(struct siw_qp *qp)
610a5319752SBernard Metzler {
61158fb0b56SBernard Metzler return qp->base_qp.qp_num;
612a5319752SBernard Metzler }
613a5319752SBernard Metzler
siw_qp_get(struct siw_qp * qp)614a5319752SBernard Metzler static inline void siw_qp_get(struct siw_qp *qp)
615a5319752SBernard Metzler {
616a5319752SBernard Metzler kref_get(&qp->ref);
617a5319752SBernard Metzler }
618a5319752SBernard Metzler
siw_qp_put(struct siw_qp * qp)619a5319752SBernard Metzler static inline void siw_qp_put(struct siw_qp *qp)
620a5319752SBernard Metzler {
621a5319752SBernard Metzler kref_put(&qp->ref, siw_free_qp);
622a5319752SBernard Metzler }
623a5319752SBernard Metzler
siw_sq_empty(struct siw_qp * qp)624a5319752SBernard Metzler static inline int siw_sq_empty(struct siw_qp *qp)
625a5319752SBernard Metzler {
626a5319752SBernard Metzler struct siw_sqe *sqe = &qp->sendq[qp->sq_get % qp->attrs.sq_size];
627a5319752SBernard Metzler
628a5319752SBernard Metzler return READ_ONCE(sqe->flags) == 0;
629a5319752SBernard Metzler }
630a5319752SBernard Metzler
sq_get_next(struct siw_qp * qp)631a5319752SBernard Metzler static inline struct siw_sqe *sq_get_next(struct siw_qp *qp)
632a5319752SBernard Metzler {
633a5319752SBernard Metzler struct siw_sqe *sqe = &qp->sendq[qp->sq_get % qp->attrs.sq_size];
634a5319752SBernard Metzler
635a5319752SBernard Metzler if (READ_ONCE(sqe->flags) & SIW_WQE_VALID)
636a5319752SBernard Metzler return sqe;
637a5319752SBernard Metzler
638a5319752SBernard Metzler return NULL;
639a5319752SBernard Metzler }
640a5319752SBernard Metzler
orq_get_current(struct siw_qp * qp)641a5319752SBernard Metzler static inline struct siw_sqe *orq_get_current(struct siw_qp *qp)
642a5319752SBernard Metzler {
643a5319752SBernard Metzler return &qp->orq[qp->orq_get % qp->attrs.orq_size];
644a5319752SBernard Metzler }
645a5319752SBernard Metzler
orq_get_free(struct siw_qp * qp)646a5319752SBernard Metzler static inline struct siw_sqe *orq_get_free(struct siw_qp *qp)
647a5319752SBernard Metzler {
648b43a76f4SBernard Metzler struct siw_sqe *orq_e = &qp->orq[qp->orq_put % qp->attrs.orq_size];
649a5319752SBernard Metzler
650661f3859SBernard Metzler if (READ_ONCE(orq_e->flags) == 0)
651a5319752SBernard Metzler return orq_e;
652a5319752SBernard Metzler
653a5319752SBernard Metzler return NULL;
654a5319752SBernard Metzler }
655a5319752SBernard Metzler
siw_orq_empty(struct siw_qp * qp)656a5319752SBernard Metzler static inline int siw_orq_empty(struct siw_qp *qp)
657a5319752SBernard Metzler {
658b7a2768aSGuoqing Jiang return orq_get_current(qp)->flags == 0 ? 1 : 0;
659a5319752SBernard Metzler }
660a5319752SBernard Metzler
irq_alloc_free(struct siw_qp * qp)661a5319752SBernard Metzler static inline struct siw_sqe *irq_alloc_free(struct siw_qp *qp)
662a5319752SBernard Metzler {
663a5319752SBernard Metzler struct siw_sqe *irq_e = &qp->irq[qp->irq_put % qp->attrs.irq_size];
664a5319752SBernard Metzler
665a5319752SBernard Metzler if (READ_ONCE(irq_e->flags) == 0) {
666a5319752SBernard Metzler qp->irq_put++;
667a5319752SBernard Metzler return irq_e;
668a5319752SBernard Metzler }
669a5319752SBernard Metzler return NULL;
670a5319752SBernard Metzler }
671a5319752SBernard Metzler
/* Set the running CRC state in @crc to all ones. */
static inline void siw_crc_init(u32 *crc)
{
	*crc = ~(u32)0;
}
676426370c8SEric Biggers
/* Fold @len bytes at @data into the running CRC state in @crc via crc32c(). */
static inline void siw_crc_update(u32 *crc, const void *data, size_t len)
{
	u32 state = *crc;

	*crc = crc32c(state, data, len);
}
681426370c8SEric Biggers
/*
 * Write the bitwise complement of the CRC state in @crc to @out as a
 * little-endian 32-bit value. @out may be unaligned; *@crc is not modified.
 */
static inline void siw_crc_final(u32 *crc, u8 out[4])
{
	u32 digest = ~*crc;

	put_unaligned_le32(digest, out);
}
686426370c8SEric Biggers
/*
 * Compute the CRC over @len bytes at @data in one call and store the
 * result in @out: siw_crc_init(), siw_crc_update(), then siw_crc_final()
 * on a local state word.
 */
static inline void siw_crc_oneshot(const void *data, size_t len, u8 out[4])
{
	u32 crc;

	siw_crc_init(&crc);
	siw_crc_update(&crc, data, len);
	/* No "return <expr>" here: ISO C forbids it in a void function. */
	siw_crc_final(&crc, out);
}
695426370c8SEric Biggers
siw_crc_skb(struct siw_rx_stream * srx,unsigned int len)696a5319752SBernard Metzler static inline void siw_crc_skb(struct siw_rx_stream *srx, unsigned int len)
697a5319752SBernard Metzler {
698*62673b7dSEric Biggers srx->mpa_crc = skb_crc32c(srx->skb, srx->skb_offset, len, srx->mpa_crc);
699a5319752SBernard Metzler }
700a5319752SBernard Metzler
/* Debug print via ibdev_dbg(), prefixed with the calling function's name. */
#define siw_dbg(ibdev, fmt, ...)                                               \
	ibdev_dbg((ibdev), "%s: " fmt, __func__, ##__VA_ARGS__)
703a5319752SBernard Metzler
/*
 * Debug print via ibdev_dbg() on the QP's siw device, prefixed with the
 * QP id (from qp_id()) and the calling function's name.
 * @qp is parenthesized before dereference so any pointer expression expands
 * correctly; note it is evaluated twice.
 */
#define siw_dbg_qp(qp, fmt, ...)                                               \
	ibdev_dbg(&(qp)->sdev->base_dev, "QP[%u] %s: " fmt, qp_id(qp),         \
		  __func__, ##__VA_ARGS__)
707a5319752SBernard Metzler
/*
 * Debug print via ibdev_dbg() on the CQ's base_cq.device, prefixed with
 * cq->id and the calling function's name.
 * @cq is parenthesized before dereference so any pointer expression expands
 * correctly; note it is evaluated twice.
 */
#define siw_dbg_cq(cq, fmt, ...)                                               \
	ibdev_dbg((cq)->base_cq.device, "CQ[%u] %s: " fmt, (cq)->id,           \
		  __func__, ##__VA_ARGS__)
711a5319752SBernard Metzler
/*
 * Debug print via ibdev_dbg() on pd->device, prefixed with pd->res.id and
 * the calling function's name.
 * @pd is parenthesized before dereference so any pointer expression expands
 * correctly; note it is evaluated twice.
 */
#define siw_dbg_pd(pd, fmt, ...)                                               \
	ibdev_dbg((pd)->device, "PD[%u] %s: " fmt, (pd)->res.id, __func__,     \
		  ##__VA_ARGS__)
715a5319752SBernard Metzler
/*
 * Debug print via ibdev_dbg() on the memory object's siw device, prefixed
 * with mem->stag (hex) and the calling function's name.
 * @mem is parenthesized before dereference so any pointer expression expands
 * correctly; note it is evaluated twice.
 */
#define siw_dbg_mem(mem, fmt, ...)                                             \
	ibdev_dbg(&(mem)->sdev->base_dev,                                      \
		  "MEM[0x%08x] %s: " fmt, (mem)->stag, __func__, ##__VA_ARGS__)
719a5319752SBernard Metzler
/*
 * Debug print via ibdev_dbg() on the CEP's siw device, prefixed with the
 * CEP pointer (printed with %p) and the calling function's name.
 * @cep is parenthesized before dereference so any pointer expression expands
 * correctly; note it is evaluated twice.
 */
#define siw_dbg_cep(cep, fmt, ...)                                             \
	ibdev_dbg(&(cep)->sdev->base_dev, "CEP[0x%p] %s: " fmt,                \
		  (cep), __func__, ##__VA_ARGS__)
723a5319752SBernard Metzler
/*
 * Queue flush and CQ reap entry points. Only the prototypes live here;
 * the implementations are not part of this header.
 */
void siw_cq_flush(struct siw_cq *cq);
void siw_sq_flush(struct siw_qp *qp);
void siw_rq_flush(struct siw_qp *qp);
int siw_reap_cqe(struct siw_cq *cq, struct ib_wc *wc);
728a5319752SBernard Metzler
729a5319752SBernard Metzler #endif
730