1 /*
2  * Copyright (c) 2016 Mellanox Technologies Ltd. All rights reserved.
3  * Copyright (c) 2015 System Fabric Works, Inc. All rights reserved.
4  *
5  * This software is available to you under a choice of one of two
6  * licenses.  You may choose to be licensed under the terms of the GNU
7  * General Public License (GPL) Version 2, available from the file
8  * COPYING in the main directory of this source tree, or the
9  * OpenIB.org BSD license below:
10  *
11  *	   Redistribution and use in source and binary forms, with or
12  *	   without modification, are permitted provided that the following
13  *	   conditions are met:
14  *
15  *	- Redistributions of source code must retain the above
16  *	  copyright notice, this list of conditions and the following
17  *	  disclaimer.
18  *
19  *	- Redistributions in binary form must reproduce the above
20  *	  copyright notice, this list of conditions and the following
21  *	  disclaimer in the documentation and/or other materials
22  *	  provided with the distribution.
23  *
24  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
25  * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
26  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
27  * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
28  * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
29  * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
30  * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
31  * SOFTWARE.
32  */
33 
34 #ifndef RXE_VERBS_H
35 #define RXE_VERBS_H
36 
37 #include <linux/interrupt.h>
38 #include <linux/workqueue.h>
39 #include <rdma/rdma_user_rxe.h>
40 #include "rxe_pool.h"
41 #include "rxe_task.h"
42 #include "rxe_hw_counters.h"
43 
/* Compare two 16-bit partition keys.
 *
 * Returns 1 when the low 15 bits of both keys are equal and non-zero and
 * at least one of the keys has bit 15 (0x8000) set; returns 0 otherwise.
 */
static inline int pkey_match(u16 key1, u16 key2)
{
	const u16 base1 = key1 & 0x7fff;
	const u16 base2 = key2 & 0x7fff;

	/* an all-zero low part never matches */
	if (base1 == 0)
		return 0;

	if (base1 != base2)
		return 0;

	/* bit 15 must be set in at least one of the two keys */
	return ((key1 | key2) & 0x8000) ? 1 : 0;
}
50 
/* Order two packet sequence numbers.
 *
 * Returns >0 if psn_a > psn_b
 *	    0 if psn_a == psn_b
 *	   <0 if psn_a < psn_b
 *
 * The unsigned difference is shifted left by 8 before being read as a
 * signed 32-bit value, so only its low 24 bits take part and bit 23 ends
 * up as the sign (presumably because PSNs are 24-bit values that wrap).
 */
static inline int psn_compare(u32 psn_a, u32 psn_b)
{
	u32 delta = psn_a - psn_b;

	return (s32)(delta << 8);
}
62 
/* rxe user context: a pool entry plus the embedded core ib_ucontext.
 * to_ruc() maps an ib_ucontext pointer back to this structure through
 * the ibuc member.
 */
63 struct rxe_ucontext {
64 	struct rxe_pool_entry	pelem;
65 	struct ib_ucontext	ibuc;
66 };
67 
/* rxe protection domain: a pool entry plus the embedded core ib_pd.
 * to_rpd() maps an ib_pd pointer back to this structure through the
 * ibpd member.
 */
68 struct rxe_pd {
69 	struct rxe_pool_entry	pelem;
70 	struct ib_pd		ibpd;
71 };
72 
/* rxe address handle. ibah is the embedded core object that to_rah()
 * maps back from. struct rxe_av is declared outside this header.
 * NOTE(review): pd is presumably the protection domain this handle was
 * created on -- confirm against the create path.
 */
73 struct rxe_ah {
74 	struct rxe_pool_entry	pelem;
75 	struct ib_ah		ibah;
76 	struct rxe_pd		*pd;
77 	struct rxe_av		av;
78 };
79 
/* One completion queue entry. The kernel (ib_wc) and user (ib_uverbs_wc)
 * representations share storage through the anonymous union.
 * NOTE(review): which member is valid presumably follows rxe_cq.is_user
 * -- confirm against the code that fills entries.
 */
80 struct rxe_cqe {
81 	union {
82 		struct ib_wc		ibwc;
83 		struct ib_uverbs_wc	uibwc;
84 	};
85 };
86 
/* rxe completion queue. ibcq is the embedded core object that to_rcq()
 * maps back from; queue points at the backing rxe_queue (declared
 * outside this header) and comp_task is a tasklet.
 * NOTE(review): cq_lock presumably serialises access to queue, and
 * is_user presumably marks a CQ created from user space -- confirm.
 */
87 struct rxe_cq {
88 	struct rxe_pool_entry	pelem;
89 	struct ib_cq		ibcq;
90 	struct rxe_queue	*queue;
91 	spinlock_t		cq_lock;
92 	u8			notify;
93 	bool			is_dying;
94 	int			is_user;
95 	struct tasklet_struct	comp_task;
96 };
97 
/* States of a work queue element. The enumerators take the implicit
 * values 0..4 in declaration order, so reordering them changes their
 * numeric values.
 */
98 enum wqe_state {
99 	wqe_state_posted,
100 	wqe_state_processing,
101 	wqe_state_pending,
102 	wqe_state_done,
103 	wqe_state_error,
104 };
105 
/* Send queue: size limits, the backing rxe_queue and the spinlock that
 * guards it. Embedded in struct rxe_qp as 'sq'.
 * NOTE(review): max_wr / max_sge / max_inline are presumably the limits
 * negotiated at QP creation -- confirm.
 */
106 struct rxe_sq {
107 	int			max_wr;
108 	int			max_sge;
109 	int			max_inline;
110 	spinlock_t		sq_lock; /* guard queue */
111 	struct rxe_queue	*queue;
112 };
113 
/* Receive queue: size limits and the backing rxe_queue, with separate
 * spinlocks for the producer and consumer sides. Embedded in both
 * struct rxe_qp and struct rxe_srq as 'rq'.
 */
114 struct rxe_rq {
115 	int			max_wr;
116 	int			max_sge;
117 	spinlock_t		producer_lock; /* guard queue producer */
118 	spinlock_t		consumer_lock; /* guard queue consumer */
119 	struct rxe_queue	*queue;
120 };
121 
/* rxe shared receive queue. ibsrq is the embedded core object that
 * to_rsrq() maps back from; rq is the receive queue itself.
 * NOTE(review): limit is presumably the SRQ limit-event threshold and
 * error a sticky error flag -- confirm against the users.
 */
122 struct rxe_srq {
123 	struct rxe_pool_entry	pelem;
124 	struct ib_srq		ibsrq;
125 	struct rxe_pd		*pd;
126 	struct rxe_rq		rq;
127 	u32			srq_num;
128 
129 	int			limit;
130 	int			error;
131 };
132 
/* Internal QP state, stored separately in rxe_req_info.state and
 * rxe_resp_info.state. DRAIN and DRAINED are marked as requester-only.
 * Enumerators take implicit values 0..5 in declaration order.
 */
133 enum rxe_qp_state {
134 	QP_STATE_RESET,
135 	QP_STATE_INIT,
136 	QP_STATE_READY,
137 	QP_STATE_DRAIN,		/* req only */
138 	QP_STATE_DRAINED,	/* req only */
139 	QP_STATE_ERROR
140 };
141 
/* Requester-side state, embedded in struct rxe_qp as 'req'. Holds the
 * requester's QP state, current PSN/opcode and an rxe_task.
 * NOTE(review): the wait_* / need_* ints look like boolean flags and
 * rd_atomic like a count of outstanding read/atomic credits -- confirm
 * against the requester code.
 */
142 struct rxe_req_info {
143 	enum rxe_qp_state	state;
144 	int			wqe_index;
145 	u32			psn;
146 	int			opcode;
147 	atomic_t		rd_atomic;
148 	int			wait_fence;
149 	int			need_rd_atomic;
150 	int			wait_psn;
151 	int			need_retry;
152 	int			noack_pkts;
153 	struct rxe_task		task;
154 };
155 
/* Completer-side state, embedded in struct rxe_qp as 'comp'. Holds the
 * current PSN/opcode, timeout and retry bookkeeping and an rxe_task.
 * NOTE(review): retry_cnt / rnr_retry are presumably remaining-retry
 * counters -- confirm against the completer code.
 */
156 struct rxe_comp_info {
157 	u32			psn;
158 	int			opcode;
159 	int			timeout;
160 	int			timeout_retry;
161 	u32			retry_cnt;
162 	u32			rnr_retry;
163 	struct rxe_task		task;
164 };
165 
/* State of a read/atomic responder resource (see resp_res.state).
 * Enumerators take implicit values 0..2 in declaration order.
 */
166 enum rdatm_res_state {
167 	rdatm_res_state_next,
168 	rdatm_res_state_new,
169 	rdatm_res_state_replay,
170 };
171 
/* One responder resource entry; rxe_resp_info.resources points at these.
 * Records a PSN range (first/last/cur) and a state, plus per-kind data
 * in an anonymous union: an skb for the 'atomic' arm, or memory region,
 * addresses, rkey and lengths for the 'read' arm.
 * NOTE(review): 'type' presumably selects which union arm is valid --
 * confirm against the responder code.
 */
172 struct resp_res {
173 	int			type;
174 	u32			first_psn;
175 	u32			last_psn;
176 	u32			cur_psn;
177 	enum rdatm_res_state	state;
178 
179 	union {
180 		struct {
181 			struct sk_buff	*skb;
182 		} atomic;
183 		struct {
184 			struct rxe_mem	*mr;
185 			u64		va_org;
186 			u32		rkey;
187 			u32		length;
188 			u64		va;
189 			u32		resid;
190 		} read;
191 	};
192 };
193 
/* Responder-side state, embedded in struct rxe_qp as 'resp'. Groups the
 * responder's QP state and PSN/MSN tracking, the current receive WQE,
 * RDMA read/atomic working values, an inline WQE buffer used for SRQs
 * and the responder resource list with its head/tail indices.
 */
194 struct rxe_resp_info {
195 	enum rxe_qp_state	state;
196 	u32			msn;
197 	u32			psn;
198 	int			opcode;
199 	int			drop_msg;
200 	int			goto_error;
201 	int			sent_psn_nak;
202 	enum ib_wc_status	status;
203 	u8			aeth_syndrome;
204 
205 	/* Receive only */
206 	struct rxe_recv_wqe	*wqe;
207 
208 	/* RDMA read / atomic only */
209 	u64			va;
210 	struct rxe_mem		*mr;
211 	u32			resid;
212 	u32			rkey;
213 	u64			atomic_orig;
214 
215 	/* SRQ only */
	/* sge[] directly follows wqe and provides RXE_MAX_SGE entries;
	 * NOTE(review): presumably backing storage for the scatter list
	 * at the tail of wqe -- confirm against struct rxe_recv_wqe.
	 */
216 	struct {
217 		struct rxe_recv_wqe	wqe;
218 		struct ib_sge		sge[RXE_MAX_SGE];
219 	} srq_wqe;
220 
221 	/* Responder resources. It's a circular list where the oldest
222 	 * resource is dropped first.
223 	 */
224 	struct resp_res		*resources;
225 	unsigned int		res_head;
226 	unsigned int		res_tail;
227 	struct resp_res		*res;
228 	struct rxe_task		task;
229 };
230 
/* rxe queue pair. ibqp is the embedded core object that to_rqp() maps
 * back from. Besides the send/receive queues and the associated PD, SRQ
 * and CQs, it embeds the requester (req), completer (comp) and responder
 * (resp) state, three skb queues, two timers and a deferred cleanup
 * work item.
 */
231 struct rxe_qp {
232 	struct rxe_pool_entry	pelem;
233 	struct ib_qp		ibqp;
234 	struct ib_qp_attr	attr;
235 	unsigned int		valid;
236 	unsigned int		mtu;
237 	int			is_user;
238 
239 	struct rxe_pd		*pd;
240 	struct rxe_srq		*srq;
241 	struct rxe_cq		*scq;
242 	struct rxe_cq		*rcq;
243 
244 	enum ib_sig_type	sq_sig_type;
245 
246 	struct rxe_sq		sq;
247 	struct rxe_rq		rq;
248 
249 	struct socket		*sk;
250 	u32			dst_cookie;
251 
252 	struct rxe_av		pri_av;
253 	struct rxe_av		alt_av;
254 
255 	/* list of mcast groups qp has joined (for cleanup) */
256 	struct list_head	grp_list;
257 	spinlock_t		grp_lock; /* guard grp_list */
258 
259 	struct sk_buff_head	req_pkts;
260 	struct sk_buff_head	resp_pkts;
261 	struct sk_buff_head	send_pkts;
262 
263 	struct rxe_req_info	req;
264 	struct rxe_comp_info	comp;
265 	struct rxe_resp_info	resp;
266 
267 	atomic_t		ssn;
268 	atomic_t		skb_out;
269 	int			need_req_skb;
270 
271 	/* Timer for retransmitting packets when ACKs have been lost. RC
272 	 * only. The requester sets it when it is not already
273 	 * started. The responder resets it whenever an ack is
274 	 * received.
275 	 */
276 	struct timer_list retrans_timer;
277 	u64 qp_timeout_jiffies;
278 
279 	/* Timer for handling RNR NAKS. */
280 	struct timer_list rnr_nak_timer;
281 
282 	spinlock_t		state_lock; /* guard requester and completer */
283 
284 	struct execute_work	cleanup_work;
285 };
286 
/* Lifecycle state of an rxe_mem object (see rxe_mem.state).
 * Enumerators take implicit values 0..3 in declaration order.
 */
287 enum rxe_mem_state {
288 	RXE_MEM_STATE_ZOMBIE,
289 	RXE_MEM_STATE_INVALID,
290 	RXE_MEM_STATE_FREE,
291 	RXE_MEM_STATE_VALID,
292 };
293 
/* Kind of memory object an rxe_mem represents (see rxe_mem.type).
 * Enumerators take implicit values 0..4 in declaration order.
 */
294 enum rxe_mem_type {
295 	RXE_MEM_TYPE_NONE,
296 	RXE_MEM_TYPE_DMA,
297 	RXE_MEM_TYPE_MR,
298 	RXE_MEM_TYPE_FMR,
299 	RXE_MEM_TYPE_MW,
300 };
301 
/* Number of struct rxe_phys_buf entries that fit in one page; used as
 * the array length of rxe_map.buf.
 */
302 #define RXE_BUF_PER_MAP		(PAGE_SIZE / sizeof(struct rxe_phys_buf))
303 
/* One buffer descriptor: a 64-bit address and a 64-bit size.
 * NOTE(review): whether addr is a kernel virtual, DMA or physical
 * address is not visible from this header -- confirm at the users.
 */
304 struct rxe_phys_buf {
305 	u64      addr;
306 	u64      size;
307 };
308 
/* A block of RXE_BUF_PER_MAP buffer descriptors. Since RXE_BUF_PER_MAP is
 * PAGE_SIZE / sizeof(struct rxe_phys_buf), the array is at most one page
 * in size.
 */
309 struct rxe_map {
310 	struct rxe_phys_buf	buf[RXE_BUF_PER_MAP];
311 };
312 
/* rxe memory object, used for both memory regions and memory windows:
 * the embedded core object is either an ib_mr or an ib_mw sharing the
 * same storage, and to_rmr() / to_rmw() map back from the respective
 * member. 'type' and 'state' use enum rxe_mem_type / rxe_mem_state.
 * NOTE(review): map is presumably an array of num_map pointers to
 * rxe_map blocks, indexed with the *_shift / *_mask fields -- confirm
 * against the lookup code.
 */
313 struct rxe_mem {
314 	struct rxe_pool_entry	pelem;
315 	union {
316 		struct ib_mr		ibmr;
317 		struct ib_mw		ibmw;
318 	};
319 
320 	struct rxe_pd		*pd;
321 	struct ib_umem		*umem;
322 
323 	u32			lkey;
324 	u32			rkey;
325 
326 	enum rxe_mem_state	state;
327 	enum rxe_mem_type	type;
328 	u64			va;
329 	u64			iova;
330 	size_t			length;
331 	u32			offset;
332 	int			access;
333 
334 	int			page_shift;
335 	int			page_mask;
336 	int			map_shift;
337 	int			map_mask;
338 
339 	u32			num_buf;
340 	u32			nbuf;
341 
342 	u32			max_buf;
343 	u32			num_map;
344 
345 	struct rxe_map		**map;
346 };
347 
/* Multicast group: identified by mgid, with a list head for attached
 * QPs, a count (num_qp), the qkey/pkey for the group and a back pointer
 * to the rxe device. mcg_lock guards the group.
 * NOTE(review): qp_list presumably links rxe_mc_elem.qp_list entries --
 * confirm against the attach/detach code.
 */
348 struct rxe_mc_grp {
349 	struct rxe_pool_entry	pelem;
350 	spinlock_t		mcg_lock; /* guard group */
351 	struct rxe_dev		*rxe;
352 	struct list_head	qp_list;
353 	union ib_gid		mgid;
354 	int			num_qp;
355 	u32			qkey;
356 	u16			pkey;
357 };
358 
/* Link object tying one QP to one multicast group: holds a pointer to
 * each plus two list nodes.
 * NOTE(review): qp_list is presumably the node on rxe_mc_grp.qp_list and
 * grp_list the node on rxe_qp.grp_list -- confirm against the
 * attach/detach code.
 */
359 struct rxe_mc_elem {
360 	struct rxe_pool_entry	pelem;
361 	struct list_head	qp_list;
362 	struct list_head	grp_list;
363 	struct rxe_qp		*qp;
364 	struct rxe_mc_grp	*grp;
365 };
366 
/* Per-port state, embedded in struct rxe_dev as 'port': core port
 * attributes, a pointer to the P_Key table, GUID and subnet prefix in
 * big-endian form, the lock guarding the port, and the indices of the
 * two special QPs.
 */
367 struct rxe_port {
368 	struct ib_port_attr	attr;
369 	u16			*pkey_tbl;
370 	__be64			port_guid;
371 	__be64			subnet_prefix;
372 	spinlock_t		port_lock; /* guard port */
373 	unsigned int		mtu_cap;
374 	/* special QPs */
375 	u32			qp_smi_index;
376 	u32			qp_gsi_index;
377 };
378 
/* Top-level rxe device. ib_dev is the embedded core device that
 * to_rdev() maps back from. Holds device attributes and limits, the
 * underlying net_device, one rxe_pool per object kind, pending-mmap
 * bookkeeping, the statistics counters bumped by rxe_counter_inc(), the
 * single port and a crypto shash handle.
 */
379 struct rxe_dev {
380 	struct ib_device	ib_dev;
381 	struct ib_device_attr	attr;
382 	int			max_ucontext;
383 	int			max_inline_data;
384 	struct kref		ref_cnt;
385 	struct mutex	usdev_lock;
386 
387 	struct net_device	*ndev;
388 
389 	int			xmit_errors;
390 
391 	struct rxe_pool		uc_pool;
392 	struct rxe_pool		pd_pool;
393 	struct rxe_pool		ah_pool;
394 	struct rxe_pool		srq_pool;
395 	struct rxe_pool		qp_pool;
396 	struct rxe_pool		cq_pool;
397 	struct rxe_pool		mr_pool;
398 	struct rxe_pool		mw_pool;
399 	struct rxe_pool		mc_grp_pool;
400 	struct rxe_pool		mc_elem_pool;
401 
402 	spinlock_t		pending_lock; /* guard pending_mmaps */
403 	struct list_head	pending_mmaps;
404 
405 	spinlock_t		mmap_offset_lock; /* guard mmap_offset */
406 	int			mmap_offset;
407 
	/* one plain u64 slot per enum rxe_counters value */
408 	u64			stats_counters[RXE_NUM_OF_COUNTERS];
409 
410 	struct rxe_port		port;
411 	struct list_head	list;
	/* NOTE(review): presumably the hash transform used for packet
	 * CRC computation -- confirm against the icrc code.
	 */
412 	struct crypto_shash	*tfm;
413 };
414 
rxe_counter_inc(struct rxe_dev * rxe,enum rxe_counters cnt)415 static inline void rxe_counter_inc(struct rxe_dev *rxe, enum rxe_counters cnt)
416 {
417 	rxe->stats_counters[cnt]++;
418 }
419 
to_rdev(struct ib_device * dev)420 static inline struct rxe_dev *to_rdev(struct ib_device *dev)
421 {
422 	return dev ? container_of(dev, struct rxe_dev, ib_dev) : NULL;
423 }
424 
to_ruc(struct ib_ucontext * uc)425 static inline struct rxe_ucontext *to_ruc(struct ib_ucontext *uc)
426 {
427 	return uc ? container_of(uc, struct rxe_ucontext, ibuc) : NULL;
428 }
429 
to_rpd(struct ib_pd * pd)430 static inline struct rxe_pd *to_rpd(struct ib_pd *pd)
431 {
432 	return pd ? container_of(pd, struct rxe_pd, ibpd) : NULL;
433 }
434 
to_rah(struct ib_ah * ah)435 static inline struct rxe_ah *to_rah(struct ib_ah *ah)
436 {
437 	return ah ? container_of(ah, struct rxe_ah, ibah) : NULL;
438 }
439 
to_rsrq(struct ib_srq * srq)440 static inline struct rxe_srq *to_rsrq(struct ib_srq *srq)
441 {
442 	return srq ? container_of(srq, struct rxe_srq, ibsrq) : NULL;
443 }
444 
to_rqp(struct ib_qp * qp)445 static inline struct rxe_qp *to_rqp(struct ib_qp *qp)
446 {
447 	return qp ? container_of(qp, struct rxe_qp, ibqp) : NULL;
448 }
449 
to_rcq(struct ib_cq * cq)450 static inline struct rxe_cq *to_rcq(struct ib_cq *cq)
451 {
452 	return cq ? container_of(cq, struct rxe_cq, ibcq) : NULL;
453 }
454 
to_rmr(struct ib_mr * mr)455 static inline struct rxe_mem *to_rmr(struct ib_mr *mr)
456 {
457 	return mr ? container_of(mr, struct rxe_mem, ibmr) : NULL;
458 }
459 
to_rmw(struct ib_mw * mw)460 static inline struct rxe_mem *to_rmw(struct ib_mw *mw)
461 {
462 	return mw ? container_of(mw, struct rxe_mem, ibmw) : NULL;
463 }
464 
/* Device registration entry points; the definitions live outside this
 * header. Both take the rxe device and return an int.
 * NOTE(review): presumably 0 on success and a negative errno on
 * failure, per kernel convention -- confirm against the definitions.
 */
465 int rxe_register_device(struct rxe_dev *rxe);
466 int rxe_unregister_device(struct rxe_dev *rxe);
467 
/* NOTE(review): given the rxe_pool_entry argument this is presumably the
 * pool cleanup callback for multicast objects -- confirm against the
 * pool type table.
 */
468 void rxe_mc_cleanup(struct rxe_pool_entry *arg);
469 
470 #endif /* RXE_VERBS_H */
471