1 /* SPDX-License-Identifier: GPL-2.0 OR Linux-OpenIB */
2 /* Copyright (c) 2019 Mellanox Technologies. */
3 
4 #ifndef __MLX5_EN_TXRX_H___
5 #define __MLX5_EN_TXRX_H___
6 
7 #include "en.h"
8 #include <linux/indirect_call_wrapper.h>
9 
10 #define MLX5E_TX_WQE_EMPTY_DS_COUNT (sizeof(struct mlx5e_tx_wqe) / MLX5_SEND_WQE_DS)
11 
12 /* The mult of MLX5_SEND_WQE_MAX_WQEBBS * MLX5_SEND_WQEBB_NUM_DS
13  * (16 * 4 == 64) does not fit in the 6-bit DS field of Ctrl Segment.
14  * We use a bound lower that MLX5_SEND_WQE_MAX_WQEBBS to let a
15  * full-session WQE be cache-aligned.
16  */
17 #if L1_CACHE_BYTES < 128
18 #define MLX5E_TX_MPW_MAX_WQEBBS (MLX5_SEND_WQE_MAX_WQEBBS - 1)
19 #else
20 #define MLX5E_TX_MPW_MAX_WQEBBS (MLX5_SEND_WQE_MAX_WQEBBS - 2)
21 #endif
22 
23 #define MLX5E_TX_MPW_MAX_NUM_DS (MLX5E_TX_MPW_MAX_WQEBBS * MLX5_SEND_WQEBB_NUM_DS)
24 
25 #define INL_HDR_START_SZ (sizeof(((struct mlx5_wqe_eth_seg *)NULL)->inline_hdr.start))
26 
27 enum mlx5e_icosq_wqe_type {
28 	MLX5E_ICOSQ_WQE_NOP,
29 	MLX5E_ICOSQ_WQE_UMR_RX,
30 #ifdef CONFIG_MLX5_EN_TLS
31 	MLX5E_ICOSQ_WQE_UMR_TLS,
32 	MLX5E_ICOSQ_WQE_SET_PSV_TLS,
33 	MLX5E_ICOSQ_WQE_GET_PSV_TLS,
34 #endif
35 };
36 
37 /* General */
mlx5e_skb_is_multicast(struct sk_buff * skb)38 static inline bool mlx5e_skb_is_multicast(struct sk_buff *skb)
39 {
40 	return skb->pkt_type == PACKET_MULTICAST || skb->pkt_type == PACKET_BROADCAST;
41 }
42 
43 void mlx5e_trigger_irq(struct mlx5e_icosq *sq);
44 void mlx5e_completion_event(struct mlx5_core_cq *mcq, struct mlx5_eqe *eqe);
45 void mlx5e_cq_error_event(struct mlx5_core_cq *mcq, enum mlx5_event event);
46 int mlx5e_napi_poll(struct napi_struct *napi, int budget);
47 int mlx5e_poll_ico_cq(struct mlx5e_cq *cq);
48 
49 /* RX */
50 void mlx5e_page_dma_unmap(struct mlx5e_rq *rq, struct mlx5e_dma_info *dma_info);
51 void mlx5e_page_release_dynamic(struct mlx5e_rq *rq,
52 				struct mlx5e_dma_info *dma_info,
53 				bool recycle);
54 INDIRECT_CALLABLE_DECLARE(bool mlx5e_post_rx_wqes(struct mlx5e_rq *rq));
55 INDIRECT_CALLABLE_DECLARE(bool mlx5e_post_rx_mpwqes(struct mlx5e_rq *rq));
56 int mlx5e_poll_rx_cq(struct mlx5e_cq *cq, int budget);
57 void mlx5e_free_rx_descs(struct mlx5e_rq *rq);
58 void mlx5e_free_rx_in_progress_descs(struct mlx5e_rq *rq);
59 
60 /* TX */
61 u16 mlx5e_select_queue(struct net_device *dev, struct sk_buff *skb,
62 		       struct net_device *sb_dev);
63 netdev_tx_t mlx5e_xmit(struct sk_buff *skb, struct net_device *dev);
64 bool mlx5e_poll_tx_cq(struct mlx5e_cq *cq, int napi_budget);
65 void mlx5e_free_txqsq_descs(struct mlx5e_txqsq *sq);
66 
67 static inline bool
mlx5e_wqc_has_room_for(struct mlx5_wq_cyc * wq,u16 cc,u16 pc,u16 n)68 mlx5e_wqc_has_room_for(struct mlx5_wq_cyc *wq, u16 cc, u16 pc, u16 n)
69 {
70 	return (mlx5_wq_cyc_ctr2ix(wq, cc - pc) >= n) || (cc == pc);
71 }
72 
mlx5e_fetch_wqe(struct mlx5_wq_cyc * wq,u16 pi,size_t wqe_size)73 static inline void *mlx5e_fetch_wqe(struct mlx5_wq_cyc *wq, u16 pi, size_t wqe_size)
74 {
75 	void *wqe;
76 
77 	wqe = mlx5_wq_cyc_get_wqe(wq, pi);
78 	memset(wqe, 0, wqe_size);
79 
80 	return wqe;
81 }
82 
83 #define MLX5E_TX_FETCH_WQE(sq, pi) \
84 	((struct mlx5e_tx_wqe *)mlx5e_fetch_wqe(&(sq)->wq, pi, sizeof(struct mlx5e_tx_wqe)))
85 
86 static inline struct mlx5e_tx_wqe *
mlx5e_post_nop(struct mlx5_wq_cyc * wq,u32 sqn,u16 * pc)87 mlx5e_post_nop(struct mlx5_wq_cyc *wq, u32 sqn, u16 *pc)
88 {
89 	u16                         pi   = mlx5_wq_cyc_ctr2ix(wq, *pc);
90 	struct mlx5e_tx_wqe        *wqe  = mlx5_wq_cyc_get_wqe(wq, pi);
91 	struct mlx5_wqe_ctrl_seg   *cseg = &wqe->ctrl;
92 
93 	memset(cseg, 0, sizeof(*cseg));
94 
95 	cseg->opmod_idx_opcode = cpu_to_be32((*pc << 8) | MLX5_OPCODE_NOP);
96 	cseg->qpn_ds           = cpu_to_be32((sqn << 8) | 0x01);
97 
98 	(*pc)++;
99 
100 	return wqe;
101 }
102 
103 static inline struct mlx5e_tx_wqe *
mlx5e_post_nop_fence(struct mlx5_wq_cyc * wq,u32 sqn,u16 * pc)104 mlx5e_post_nop_fence(struct mlx5_wq_cyc *wq, u32 sqn, u16 *pc)
105 {
106 	u16                         pi   = mlx5_wq_cyc_ctr2ix(wq, *pc);
107 	struct mlx5e_tx_wqe        *wqe  = mlx5_wq_cyc_get_wqe(wq, pi);
108 	struct mlx5_wqe_ctrl_seg   *cseg = &wqe->ctrl;
109 
110 	memset(cseg, 0, sizeof(*cseg));
111 
112 	cseg->opmod_idx_opcode = cpu_to_be32((*pc << 8) | MLX5_OPCODE_NOP);
113 	cseg->qpn_ds           = cpu_to_be32((sqn << 8) | 0x01);
114 	cseg->fm_ce_se         = MLX5_FENCE_MODE_INITIATOR_SMALL;
115 
116 	(*pc)++;
117 
118 	return wqe;
119 }
120 
121 struct mlx5e_tx_wqe_info {
122 	struct sk_buff *skb;
123 	u32 num_bytes;
124 	u8 num_wqebbs;
125 	u8 num_dma;
126 	u8 num_fifo_pkts;
127 #ifdef CONFIG_MLX5_EN_TLS
128 	struct page *resync_dump_frag_page;
129 #endif
130 };
131 
mlx5e_txqsq_get_next_pi(struct mlx5e_txqsq * sq,u16 size)132 static inline u16 mlx5e_txqsq_get_next_pi(struct mlx5e_txqsq *sq, u16 size)
133 {
134 	struct mlx5_wq_cyc *wq = &sq->wq;
135 	u16 pi, contig_wqebbs;
136 
137 	pi = mlx5_wq_cyc_ctr2ix(wq, sq->pc);
138 	contig_wqebbs = mlx5_wq_cyc_get_contig_wqebbs(wq, pi);
139 	if (unlikely(contig_wqebbs < size)) {
140 		struct mlx5e_tx_wqe_info *wi, *edge_wi;
141 
142 		wi = &sq->db.wqe_info[pi];
143 		edge_wi = wi + contig_wqebbs;
144 
145 		/* Fill SQ frag edge with NOPs to avoid WQE wrapping two pages. */
146 		for (; wi < edge_wi; wi++) {
147 			*wi = (struct mlx5e_tx_wqe_info) {
148 				.num_wqebbs = 1,
149 			};
150 			mlx5e_post_nop(wq, sq->sqn, &sq->pc);
151 		}
152 		sq->stats->nop += contig_wqebbs;
153 
154 		pi = mlx5_wq_cyc_ctr2ix(wq, sq->pc);
155 	}
156 
157 	return pi;
158 }
159 
160 struct mlx5e_icosq_wqe_info {
161 	u8 wqe_type;
162 	u8 num_wqebbs;
163 
164 	/* Auxiliary data for different wqe types. */
165 	union {
166 		struct {
167 			struct mlx5e_rq *rq;
168 		} umr;
169 #ifdef CONFIG_MLX5_EN_TLS
170 		struct {
171 			struct mlx5e_ktls_offload_context_rx *priv_rx;
172 		} tls_set_params;
173 		struct {
174 			struct mlx5e_ktls_rx_resync_buf *buf;
175 		} tls_get_params;
176 #endif
177 	};
178 };
179 
180 void mlx5e_free_icosq_descs(struct mlx5e_icosq *sq);
181 
mlx5e_icosq_get_next_pi(struct mlx5e_icosq * sq,u16 size)182 static inline u16 mlx5e_icosq_get_next_pi(struct mlx5e_icosq *sq, u16 size)
183 {
184 	struct mlx5_wq_cyc *wq = &sq->wq;
185 	u16 pi, contig_wqebbs;
186 
187 	pi = mlx5_wq_cyc_ctr2ix(wq, sq->pc);
188 	contig_wqebbs = mlx5_wq_cyc_get_contig_wqebbs(wq, pi);
189 	if (unlikely(contig_wqebbs < size)) {
190 		struct mlx5e_icosq_wqe_info *wi, *edge_wi;
191 
192 		wi = &sq->db.wqe_info[pi];
193 		edge_wi = wi + contig_wqebbs;
194 
195 		/* Fill SQ frag edge with NOPs to avoid WQE wrapping two pages. */
196 		for (; wi < edge_wi; wi++) {
197 			*wi = (struct mlx5e_icosq_wqe_info) {
198 				.wqe_type   = MLX5E_ICOSQ_WQE_NOP,
199 				.num_wqebbs = 1,
200 			};
201 			mlx5e_post_nop(wq, sq->sqn, &sq->pc);
202 		}
203 
204 		pi = mlx5_wq_cyc_ctr2ix(wq, sq->pc);
205 	}
206 
207 	return pi;
208 }
209 
210 static inline void
mlx5e_notify_hw(struct mlx5_wq_cyc * wq,u16 pc,void __iomem * uar_map,struct mlx5_wqe_ctrl_seg * ctrl)211 mlx5e_notify_hw(struct mlx5_wq_cyc *wq, u16 pc, void __iomem *uar_map,
212 		struct mlx5_wqe_ctrl_seg *ctrl)
213 {
214 	ctrl->fm_ce_se |= MLX5_WQE_CTRL_CQ_UPDATE;
215 	/* ensure wqe is visible to device before updating doorbell record */
216 	dma_wmb();
217 
218 	*wq->db = cpu_to_be32(pc);
219 
220 	/* ensure doorbell record is visible to device before ringing the
221 	 * doorbell
222 	 */
223 	wmb();
224 
225 	mlx5_write64((__be32 *)ctrl, uar_map);
226 }
227 
mlx5e_cq_arm(struct mlx5e_cq * cq)228 static inline void mlx5e_cq_arm(struct mlx5e_cq *cq)
229 {
230 	struct mlx5_core_cq *mcq;
231 
232 	mcq = &cq->mcq;
233 	mlx5_cq_arm(mcq, MLX5_CQ_DB_REQ_NOT, mcq->uar->map, cq->wq.cc);
234 }
235 
236 static inline struct mlx5e_sq_dma *
mlx5e_dma_get(struct mlx5e_txqsq * sq,u32 i)237 mlx5e_dma_get(struct mlx5e_txqsq *sq, u32 i)
238 {
239 	return &sq->db.dma_fifo[i & sq->dma_fifo_mask];
240 }
241 
242 static inline void
mlx5e_dma_push(struct mlx5e_txqsq * sq,dma_addr_t addr,u32 size,enum mlx5e_dma_map_type map_type)243 mlx5e_dma_push(struct mlx5e_txqsq *sq, dma_addr_t addr, u32 size,
244 	       enum mlx5e_dma_map_type map_type)
245 {
246 	struct mlx5e_sq_dma *dma = mlx5e_dma_get(sq, sq->dma_fifo_pc++);
247 
248 	dma->addr = addr;
249 	dma->size = size;
250 	dma->type = map_type;
251 }
252 
mlx5e_skb_fifo_get(struct mlx5e_txqsq * sq,u16 i)253 static inline struct sk_buff **mlx5e_skb_fifo_get(struct mlx5e_txqsq *sq, u16 i)
254 {
255 	return &sq->db.skb_fifo[i & sq->skb_fifo_mask];
256 }
257 
mlx5e_skb_fifo_push(struct mlx5e_txqsq * sq,struct sk_buff * skb)258 static inline void mlx5e_skb_fifo_push(struct mlx5e_txqsq *sq, struct sk_buff *skb)
259 {
260 	struct sk_buff **skb_item = mlx5e_skb_fifo_get(sq, sq->skb_fifo_pc++);
261 
262 	*skb_item = skb;
263 }
264 
mlx5e_skb_fifo_pop(struct mlx5e_txqsq * sq)265 static inline struct sk_buff *mlx5e_skb_fifo_pop(struct mlx5e_txqsq *sq)
266 {
267 	return *mlx5e_skb_fifo_get(sq, sq->skb_fifo_cc++);
268 }
269 
270 static inline void
mlx5e_tx_dma_unmap(struct device * pdev,struct mlx5e_sq_dma * dma)271 mlx5e_tx_dma_unmap(struct device *pdev, struct mlx5e_sq_dma *dma)
272 {
273 	switch (dma->type) {
274 	case MLX5E_DMA_MAP_SINGLE:
275 		dma_unmap_single(pdev, dma->addr, dma->size, DMA_TO_DEVICE);
276 		break;
277 	case MLX5E_DMA_MAP_PAGE:
278 		dma_unmap_page(pdev, dma->addr, dma->size, DMA_TO_DEVICE);
279 		break;
280 	default:
281 		WARN_ONCE(true, "mlx5e_tx_dma_unmap unknown DMA type!\n");
282 	}
283 }
284 
285 void mlx5e_sq_xmit_simple(struct mlx5e_txqsq *sq, struct sk_buff *skb, bool xmit_more);
286 void mlx5e_tx_mpwqe_ensure_complete(struct mlx5e_txqsq *sq);
287 
mlx5e_tx_mpwqe_is_full(struct mlx5e_tx_mpwqe * session)288 static inline bool mlx5e_tx_mpwqe_is_full(struct mlx5e_tx_mpwqe *session)
289 {
290 	return session->ds_count == MLX5E_TX_MPW_MAX_NUM_DS;
291 }
292 
mlx5e_rqwq_reset(struct mlx5e_rq * rq)293 static inline void mlx5e_rqwq_reset(struct mlx5e_rq *rq)
294 {
295 	if (rq->wq_type == MLX5_WQ_TYPE_LINKED_LIST_STRIDING_RQ) {
296 		mlx5_wq_ll_reset(&rq->mpwqe.wq);
297 		rq->mpwqe.actual_wq_head = 0;
298 	} else {
299 		mlx5_wq_cyc_reset(&rq->wqe.wq);
300 	}
301 }
302 
mlx5e_dump_error_cqe(struct mlx5e_cq * cq,u32 qn,struct mlx5_err_cqe * err_cqe)303 static inline void mlx5e_dump_error_cqe(struct mlx5e_cq *cq, u32 qn,
304 					struct mlx5_err_cqe *err_cqe)
305 {
306 	struct mlx5_cqwq *wq = &cq->wq;
307 	u32 ci;
308 
309 	ci = mlx5_cqwq_ctr2ix(wq, wq->cc - 1);
310 
311 	netdev_err(cq->channel->netdev,
312 		   "Error cqe on cqn 0x%x, ci 0x%x, qn 0x%x, opcode 0x%x, syndrome 0x%x, vendor syndrome 0x%x\n",
313 		   cq->mcq.cqn, ci, qn,
314 		   get_cqe_opcode((struct mlx5_cqe64 *)err_cqe),
315 		   err_cqe->syndrome, err_cqe->vendor_err_synd);
316 	mlx5_dump_err_cqe(cq->mdev, err_cqe);
317 }
318 
mlx5e_rqwq_get_size(struct mlx5e_rq * rq)319 static inline u32 mlx5e_rqwq_get_size(struct mlx5e_rq *rq)
320 {
321 	switch (rq->wq_type) {
322 	case MLX5_WQ_TYPE_LINKED_LIST_STRIDING_RQ:
323 		return mlx5_wq_ll_get_size(&rq->mpwqe.wq);
324 	default:
325 		return mlx5_wq_cyc_get_size(&rq->wqe.wq);
326 	}
327 }
328 
mlx5e_rqwq_get_cur_sz(struct mlx5e_rq * rq)329 static inline u32 mlx5e_rqwq_get_cur_sz(struct mlx5e_rq *rq)
330 {
331 	switch (rq->wq_type) {
332 	case MLX5_WQ_TYPE_LINKED_LIST_STRIDING_RQ:
333 		return rq->mpwqe.wq.cur_sz;
334 	default:
335 		return rq->wqe.wq.cur_sz;
336 	}
337 }
338 
mlx5e_rqwq_get_head(struct mlx5e_rq * rq)339 static inline u16 mlx5e_rqwq_get_head(struct mlx5e_rq *rq)
340 {
341 	switch (rq->wq_type) {
342 	case MLX5_WQ_TYPE_LINKED_LIST_STRIDING_RQ:
343 		return mlx5_wq_ll_get_head(&rq->mpwqe.wq);
344 	default:
345 		return mlx5_wq_cyc_get_head(&rq->wqe.wq);
346 	}
347 }
348 
mlx5e_rqwq_get_wqe_counter(struct mlx5e_rq * rq)349 static inline u16 mlx5e_rqwq_get_wqe_counter(struct mlx5e_rq *rq)
350 {
351 	switch (rq->wq_type) {
352 	case MLX5_WQ_TYPE_LINKED_LIST_STRIDING_RQ:
353 		return mlx5_wq_ll_get_counter(&rq->mpwqe.wq);
354 	default:
355 		return mlx5_wq_cyc_get_counter(&rq->wqe.wq);
356 	}
357 }
358 
359 /* SW parser related functions */
360 
361 struct mlx5e_swp_spec {
362 	__be16 l3_proto;
363 	u8 l4_proto;
364 	u8 is_tun;
365 	__be16 tun_l3_proto;
366 	u8 tun_l4_proto;
367 };
368 
369 static inline void
mlx5e_set_eseg_swp(struct sk_buff * skb,struct mlx5_wqe_eth_seg * eseg,struct mlx5e_swp_spec * swp_spec)370 mlx5e_set_eseg_swp(struct sk_buff *skb, struct mlx5_wqe_eth_seg *eseg,
371 		   struct mlx5e_swp_spec *swp_spec)
372 {
373 	/* SWP offsets are in 2-bytes words */
374 	eseg->swp_outer_l3_offset = skb_network_offset(skb) / 2;
375 	if (swp_spec->l3_proto == htons(ETH_P_IPV6))
376 		eseg->swp_flags |= MLX5_ETH_WQE_SWP_OUTER_L3_IPV6;
377 	if (swp_spec->l4_proto) {
378 		eseg->swp_outer_l4_offset = skb_transport_offset(skb) / 2;
379 		if (swp_spec->l4_proto == IPPROTO_UDP)
380 			eseg->swp_flags |= MLX5_ETH_WQE_SWP_OUTER_L4_UDP;
381 	}
382 
383 	if (swp_spec->is_tun) {
384 		eseg->swp_inner_l3_offset = skb_inner_network_offset(skb) / 2;
385 		if (swp_spec->tun_l3_proto == htons(ETH_P_IPV6))
386 			eseg->swp_flags |= MLX5_ETH_WQE_SWP_INNER_L3_IPV6;
387 	} else { /* typically for ipsec when xfrm mode != XFRM_MODE_TUNNEL */
388 		eseg->swp_inner_l3_offset = skb_network_offset(skb) / 2;
389 		if (swp_spec->l3_proto == htons(ETH_P_IPV6))
390 			eseg->swp_flags |= MLX5_ETH_WQE_SWP_INNER_L3_IPV6;
391 	}
392 	switch (swp_spec->tun_l4_proto) {
393 	case IPPROTO_UDP:
394 		eseg->swp_flags |= MLX5_ETH_WQE_SWP_INNER_L4_UDP;
395 		fallthrough;
396 	case IPPROTO_TCP:
397 		eseg->swp_inner_l4_offset = skb_inner_transport_offset(skb) / 2;
398 		break;
399 	}
400 }
401 
mlx5e_stop_room_for_wqe(u16 wqe_size)402 static inline u16 mlx5e_stop_room_for_wqe(u16 wqe_size)
403 {
404 	BUILD_BUG_ON(PAGE_SIZE / MLX5_SEND_WQE_BB < MLX5_SEND_WQE_MAX_WQEBBS);
405 
406 	/* A WQE must not cross the page boundary, hence two conditions:
407 	 * 1. Its size must not exceed the page size.
408 	 * 2. If the WQE size is X, and the space remaining in a page is less
409 	 *    than X, this space needs to be padded with NOPs. So, one WQE of
410 	 *    size X may require up to X-1 WQEBBs of padding, which makes the
411 	 *    stop room of X-1 + X.
412 	 * WQE size is also limited by the hardware limit.
413 	 */
414 
415 	if (__builtin_constant_p(wqe_size))
416 		BUILD_BUG_ON(wqe_size > MLX5_SEND_WQE_MAX_WQEBBS);
417 	else
418 		WARN_ON_ONCE(wqe_size > MLX5_SEND_WQE_MAX_WQEBBS);
419 
420 	return wqe_size * 2 - 1;
421 }
422 
423 #endif
424