// SPDX-License-Identifier: GPL-2.0
/* Copyright(c) 2017 - 2019 Pensando Systems, Inc */

#include <linux/ip.h>
#include <linux/ipv6.h>
#include <linux/if_vlan.h>
#include <net/ip6_checksum.h>

#include "ionic.h"
#include "ionic_lif.h"
#include "ionic_txrx.h"

static void ionic_rx_clean(struct ionic_queue *q,
			   struct ionic_desc_info *desc_info,
			   struct ionic_cq_info *cq_info,
			   void *cb_arg);

static bool ionic_rx_service(struct ionic_cq *cq, struct ionic_cq_info *cq_info);

static bool ionic_tx_service(struct ionic_cq *cq, struct ionic_cq_info *cq_info);

static inline void ionic_txq_post(struct ionic_queue *q, bool ring_dbell,
				  ionic_desc_cb cb_func, void *cb_arg)
{
	DEBUG_STATS_TXQ_POST(q, ring_dbell);

	ionic_q_post(q, ring_dbell, cb_func, cb_arg);
}

static inline void ionic_rxq_post(struct ionic_queue *q, bool ring_dbell,
				  ionic_desc_cb cb_func, void *cb_arg)
{
	ionic_q_post(q, ring_dbell, cb_func, cb_arg);

	DEBUG_STATS_RX_BUFF_CNT(q);
}

static inline struct netdev_queue *q_to_ndq(struct ionic_queue *q)
{
	return netdev_get_tx_queue(q->lif->netdev, q->index);
}

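/* Allocate an skb for the Rx path: a napi frags skb when the received
 * data will be attached as page fragments, or a small IP-aligned linear
 * skb when the data will be copied out of the DMA buffer (copybreak).
 */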
static struct sk_buff *ionic_rx_skb_alloc(struct ionic_queue *q,
					  unsigned int len, bool frags)
{
	struct ionic_lif *lif = q->lif;
	struct ionic_rx_stats *stats;
	struct net_device *netdev;
	struct sk_buff *skb;

	netdev = lif->netdev;
	stats = &q->lif->rxqstats[q->index];

	if (frags)
		skb = napi_get_frags(&q_to_qcq(q)->napi);
	else
		skb = netdev_alloc_skb_ip_align(netdev, len);

	if (unlikely(!skb)) {
		net_warn_ratelimited("%s: SKB alloc failed on %s!\n",
				     netdev->name, q->name);
		stats->alloc_err++;
		return NULL;
	}

	return skb;
}

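/* Build a fragment-based skb from the pages posted with this descriptor:
 * each page is DMA-unmapped and attached to the skb as a fragment, so
 * buffer ownership passes to the stack.  The completion length covers
 * all fragments; num_sg_elems counts the SG pages beyond pages[0].
 */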
static struct sk_buff *ionic_rx_frags(struct ionic_queue *q,
				      struct ionic_desc_info *desc_info,
				      struct ionic_cq_info *cq_info)
{
	struct ionic_rxq_comp *comp = cq_info->cq_desc;
	struct device *dev = q->lif->ionic->dev;
	struct ionic_page_info *page_info;
	struct sk_buff *skb;
	unsigned int i;
	u16 frag_len;
	u16 len;

	page_info = &desc_info->pages[0];
	len = le16_to_cpu(comp->len);

	prefetch(page_address(page_info->page) + NET_IP_ALIGN);

	skb = ionic_rx_skb_alloc(q, len, true);
	if (unlikely(!skb))
		return NULL;

	i = comp->num_sg_elems + 1;
	do {
		if (unlikely(!page_info->page)) {
			struct napi_struct *napi = &q_to_qcq(q)->napi;

			napi->skb = NULL;
			dev_kfree_skb(skb);
			return NULL;
		}

		frag_len = min(len, (u16)PAGE_SIZE);
		len -= frag_len;

		dma_unmap_page(dev, dma_unmap_addr(page_info, dma_addr),
			       PAGE_SIZE, DMA_FROM_DEVICE);
		skb_add_rx_frag(skb, skb_shinfo(skb)->nr_frags,
				page_info->page, 0, frag_len, PAGE_SIZE);
		page_info->page = NULL;
		page_info++;
		i--;
	} while (i > 0);

	return skb;
}

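/* Copybreak path for small packets: copy the data into a freshly
 * allocated linear skb so the original DMA page stays mapped and can be
 * recycled by ionic_rx_fill() on the next refill pass.
 */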
static struct sk_buff *ionic_rx_copybreak(struct ionic_queue *q,
					  struct ionic_desc_info *desc_info,
					  struct ionic_cq_info *cq_info)
{
	struct ionic_rxq_comp *comp = cq_info->cq_desc;
	struct device *dev = q->lif->ionic->dev;
	struct ionic_page_info *page_info;
	struct sk_buff *skb;
	u16 len;

	page_info = &desc_info->pages[0];
	len = le16_to_cpu(comp->len);

	skb = ionic_rx_skb_alloc(q, len, false);
	if (unlikely(!skb))
		return NULL;

	if (unlikely(!page_info->page)) {
		dev_kfree_skb(skb);
		return NULL;
	}

	dma_sync_single_for_cpu(dev, dma_unmap_addr(page_info, dma_addr),
				len, DMA_FROM_DEVICE);
	skb_copy_to_linear_data(skb, page_address(page_info->page), len);
	dma_sync_single_for_device(dev, dma_unmap_addr(page_info, dma_addr),
				   len, DMA_FROM_DEVICE);

	skb_put(skb, len);
	skb->protocol = eth_type_trans(skb, q->lif->netdev);

	return skb;
}

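/* Per-completion Rx processing: count the packet, build an skb via the
 * copybreak or frags path, then fill in RSS hash, checksum and VLAN
 * details from the completion descriptor before handing it to GRO.
 */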
static void ionic_rx_clean(struct ionic_queue *q,
			   struct ionic_desc_info *desc_info,
			   struct ionic_cq_info *cq_info,
			   void *cb_arg)
{
	struct ionic_rxq_comp *comp = cq_info->cq_desc;
	struct ionic_qcq *qcq = q_to_qcq(q);
	struct ionic_rx_stats *stats;
	struct net_device *netdev;
	struct sk_buff *skb;

	stats = q_to_rx_stats(q);
	netdev = q->lif->netdev;

	if (comp->status) {
		stats->dropped++;
		return;
	}

	stats->pkts++;
	stats->bytes += le16_to_cpu(comp->len);

	if (le16_to_cpu(comp->len) <= q->lif->rx_copybreak)
		skb = ionic_rx_copybreak(q, desc_info, cq_info);
	else
		skb = ionic_rx_frags(q, desc_info, cq_info);

	if (unlikely(!skb)) {
		stats->dropped++;
		return;
	}

	skb_record_rx_queue(skb, q->index);

	if (likely(netdev->features & NETIF_F_RXHASH)) {
		switch (comp->pkt_type_color & IONIC_RXQ_COMP_PKT_TYPE_MASK) {
		case IONIC_PKT_TYPE_IPV4:
		case IONIC_PKT_TYPE_IPV6:
			skb_set_hash(skb, le32_to_cpu(comp->rss_hash),
				     PKT_HASH_TYPE_L3);
			break;
		case IONIC_PKT_TYPE_IPV4_TCP:
		case IONIC_PKT_TYPE_IPV6_TCP:
		case IONIC_PKT_TYPE_IPV4_UDP:
		case IONIC_PKT_TYPE_IPV6_UDP:
			skb_set_hash(skb, le32_to_cpu(comp->rss_hash),
				     PKT_HASH_TYPE_L4);
			break;
		}
	}

	if (likely(netdev->features & NETIF_F_RXCSUM)) {
		if (comp->csum_flags & IONIC_RXQ_COMP_CSUM_F_CALC) {
			skb->ip_summed = CHECKSUM_COMPLETE;
			skb->csum = (__force __wsum)le16_to_cpu(comp->csum);
			stats->csum_complete++;
		}
	} else {
		stats->csum_none++;
	}

	if (unlikely((comp->csum_flags & IONIC_RXQ_COMP_CSUM_F_TCP_BAD) ||
		     (comp->csum_flags & IONIC_RXQ_COMP_CSUM_F_UDP_BAD) ||
		     (comp->csum_flags & IONIC_RXQ_COMP_CSUM_F_IP_BAD)))
		stats->csum_error++;

	if (likely(netdev->features & NETIF_F_HW_VLAN_CTAG_RX) &&
	    (comp->csum_flags & IONIC_RXQ_COMP_CSUM_F_VLAN)) {
		__vlan_hwaccel_put_tag(skb, htons(ETH_P_8021Q),
				       le16_to_cpu(comp->vlan_tci));
		stats->vlan_stripped++;
	}

	if (le16_to_cpu(comp->len) <= q->lif->rx_copybreak)
		napi_gro_receive(&qcq->napi, skb);
	else
		napi_gro_frags(&qcq->napi);
}

static bool ionic_rx_service(struct ionic_cq *cq, struct ionic_cq_info *cq_info)
{
	struct ionic_rxq_comp *comp = cq_info->cq_desc;
	struct ionic_queue *q = cq->bound_q;
	struct ionic_desc_info *desc_info;

	if (!color_match(comp->pkt_type_color, cq->done_color))
		return false;

	/* check for empty queue */
	if (q->tail_idx == q->head_idx)
		return false;

	if (q->tail_idx != le16_to_cpu(comp->comp_index))
		return false;

	desc_info = &q->info[q->tail_idx];
	q->tail_idx = (q->tail_idx + 1) & (q->num_descs - 1);

	/* clean the related q entry, only one per qc completion */
	ionic_rx_clean(q, desc_info, cq_info, desc_info->cb_arg);

	desc_info->cb = NULL;
	desc_info->cb_arg = NULL;

	return true;
}

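/* Allocate a full page for an Rx buffer and map it for device writes.
 * On a mapping failure the page is released and the slot left empty so
 * the caller can stop filling without leaking the page.
 */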
static int ionic_rx_page_alloc(struct ionic_queue *q,
			       struct ionic_page_info *page_info)
{
	struct ionic_lif *lif = q->lif;
	struct ionic_rx_stats *stats;
	struct net_device *netdev;
	struct device *dev;

	netdev = lif->netdev;
	dev = lif->ionic->dev;
	stats = q_to_rx_stats(q);

	if (unlikely(!page_info)) {
		net_err_ratelimited("%s: %s invalid page_info in alloc\n",
				    netdev->name, q->name);
		return -EINVAL;
	}

	page_info->page = dev_alloc_page();
	if (unlikely(!page_info->page)) {
		net_err_ratelimited("%s: %s page alloc failed\n",
				    netdev->name, q->name);
		stats->alloc_err++;
		return -ENOMEM;
	}

	page_info->dma_addr = dma_map_page(dev, page_info->page, 0, PAGE_SIZE,
					   DMA_FROM_DEVICE);
	if (unlikely(dma_mapping_error(dev, page_info->dma_addr))) {
		put_page(page_info->page);
		page_info->dma_addr = 0;
		page_info->page = NULL;
		net_err_ratelimited("%s: %s dma map failed\n",
				    netdev->name, q->name);
		stats->dma_map_err++;
		return -EIO;
	}

	return 0;
}

static void ionic_rx_page_free(struct ionic_queue *q,
			       struct ionic_page_info *page_info)
{
	struct ionic_lif *lif = q->lif;
	struct net_device *netdev;
	struct device *dev;

	netdev = lif->netdev;
	dev = lif->ionic->dev;

	if (unlikely(!page_info)) {
		net_err_ratelimited("%s: %s invalid page_info in free\n",
				    netdev->name, q->name);
		return;
	}

	if (unlikely(!page_info->page)) {
		net_err_ratelimited("%s: %s invalid page in free\n",
				    netdev->name, q->name);
		return;
	}

	dma_unmap_page(dev, page_info->dma_addr, PAGE_SIZE, DMA_FROM_DEVICE);

	put_page(page_info->page);
	page_info->dma_addr = 0;
	page_info->page = NULL;
}

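/* Refill empty Rx descriptors.  Each descriptor covers one MTU-sized
 * frame using one page per PAGE_SIZE chunk: pages[0] fills the main
 * descriptor and the remainder goes into SG elements.  Slots that still
 * hold a page are simply re-posted (recycled), and the doorbell is rung
 * once at the end for the whole batch.
 */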
void ionic_rx_fill(struct ionic_queue *q)
{
	struct net_device *netdev = q->lif->netdev;
	struct ionic_desc_info *desc_info;
	struct ionic_page_info *page_info;
	struct ionic_rxq_sg_desc *sg_desc;
	struct ionic_rxq_sg_elem *sg_elem;
	struct ionic_rxq_desc *desc;
	unsigned int remain_len;
	unsigned int seg_len;
	unsigned int nfrags;
	unsigned int i, j;
	unsigned int len;

	len = netdev->mtu + ETH_HLEN;
	nfrags = round_up(len, PAGE_SIZE) / PAGE_SIZE;

	for (i = ionic_q_space_avail(q); i; i--) {
		remain_len = len;
		desc_info = &q->info[q->head_idx];
		desc = desc_info->desc;
		sg_desc = desc_info->sg_desc;
		page_info = &desc_info->pages[0];

		if (page_info->page) { /* recycle the buffer */
			ionic_rxq_post(q, false, ionic_rx_clean, NULL);
			continue;
		}

		/* fill main descriptor - pages[0] */
		desc->opcode = (nfrags > 1) ? IONIC_RXQ_DESC_OPCODE_SG :
					      IONIC_RXQ_DESC_OPCODE_SIMPLE;
		desc_info->npages = nfrags;
		if (unlikely(ionic_rx_page_alloc(q, page_info))) {
			desc->addr = 0;
			desc->len = 0;
			return;
		}
		desc->addr = cpu_to_le64(page_info->dma_addr);
		seg_len = min_t(unsigned int, PAGE_SIZE, len);
		desc->len = cpu_to_le16(seg_len);
		remain_len -= seg_len;
		page_info++;

		/* fill sg descriptors - pages[1..n] */
		for (j = 0; j < nfrags - 1; j++) {
			if (page_info->page) /* recycle the sg buffer */
				continue;

			sg_elem = &sg_desc->elems[j];
			if (unlikely(ionic_rx_page_alloc(q, page_info))) {
				sg_elem->addr = 0;
				sg_elem->len = 0;
				return;
			}
			sg_elem->addr = cpu_to_le64(page_info->dma_addr);
			seg_len = min_t(unsigned int, PAGE_SIZE, remain_len);
			sg_elem->len = cpu_to_le16(seg_len);
			remain_len -= seg_len;
			page_info++;
		}

		ionic_rxq_post(q, false, ionic_rx_clean, NULL);
	}

	ionic_dbell_ring(q->lif->kern_dbpage, q->hw_type,
			 q->dbval | q->head_idx);
}

static void ionic_rx_fill_cb(void *arg)
{
	ionic_rx_fill(arg);
}

void ionic_rx_empty(struct ionic_queue *q)
{
	struct ionic_desc_info *desc_info;
	struct ionic_page_info *page_info;
	unsigned int i, j;

	for (i = 0; i < q->num_descs; i++) {
		desc_info = &q->info[i];
		for (j = 0; j < IONIC_RX_MAX_SG_ELEMS + 1; j++) {
			page_info = &desc_info->pages[j];
			if (page_info->page)
				ionic_rx_page_free(q, page_info);
		}

		desc_info->npages = 0;
		desc_info->cb = NULL;
		desc_info->cb_arg = NULL;
	}
}

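/* Apply the most recently computed dynamic interrupt moderation (DIM)
 * coalescing value to the queue's interrupt, then feed a new sample
 * (re-arm count plus queue packet/byte counters) to net_dim() so it can
 * pick the next coalescing level.
 */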
static void ionic_dim_update(struct ionic_qcq *qcq)
{
	struct dim_sample dim_sample;
	struct ionic_lif *lif;
	unsigned int qi;

	if (!qcq->intr.dim_coal_hw)
		return;

	lif = qcq->q.lif;
	qi = qcq->cq.bound_q->index;

	ionic_intr_coal_init(lif->ionic->idev.intr_ctrl,
			     lif->rxqcqs[qi]->intr.index,
			     qcq->intr.dim_coal_hw);

	dim_update_sample(qcq->cq.bound_intr->rearm_count,
			  lif->txqstats[qi].pkts,
			  lif->txqstats[qi].bytes,
			  &dim_sample);

	net_dim(&qcq->dim, dim_sample);
}

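/* NAPI poll for a Tx-only interrupt: service Tx completions up to the
 * budget; if the budget is not exhausted, complete NAPI and update DIM,
 * then return the interrupt credits, unmasking the interrupt once
 * polling is done.
 */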
int ionic_tx_napi(struct napi_struct *napi, int budget)
{
	struct ionic_qcq *qcq = napi_to_qcq(napi);
	struct ionic_cq *cq = napi_to_cq(napi);
	struct ionic_dev *idev;
	struct ionic_lif *lif;
	u32 work_done = 0;
	u32 flags = 0;

	lif = cq->bound_q->lif;
	idev = &lif->ionic->idev;

	work_done = ionic_cq_service(cq, budget,
				     ionic_tx_service, NULL, NULL);

	if (work_done < budget && napi_complete_done(napi, work_done)) {
		ionic_dim_update(qcq);
		flags |= IONIC_INTR_CRED_UNMASK;
		cq->bound_intr->rearm_count++;
	}

	if (work_done || flags) {
		flags |= IONIC_INTR_CRED_RESET_COALESCE;
		ionic_intr_credits(idev->intr_ctrl,
				   cq->bound_intr->index,
				   work_done, flags);
	}

	DEBUG_STATS_NAPI_POLL(qcq, work_done);

	return work_done;
}

int ionic_rx_napi(struct napi_struct *napi, int budget)
{
	struct ionic_qcq *qcq = napi_to_qcq(napi);
	struct ionic_cq *cq = napi_to_cq(napi);
	struct ionic_dev *idev;
	struct ionic_lif *lif;
	u32 work_done = 0;
	u32 flags = 0;

	lif = cq->bound_q->lif;
	idev = &lif->ionic->idev;

	work_done = ionic_cq_service(cq, budget,
				     ionic_rx_service, NULL, NULL);

	if (work_done)
		ionic_rx_fill(cq->bound_q);

	if (work_done < budget && napi_complete_done(napi, work_done)) {
		ionic_dim_update(qcq);
		flags |= IONIC_INTR_CRED_UNMASK;
		cq->bound_intr->rearm_count++;
	}

	if (work_done || flags) {
		flags |= IONIC_INTR_CRED_RESET_COALESCE;
		ionic_intr_credits(idev->intr_ctrl,
				   cq->bound_intr->index,
				   work_done, flags);
	}

	DEBUG_STATS_NAPI_POLL(qcq, work_done);

	return work_done;
}

int ionic_txrx_napi(struct napi_struct *napi, int budget)
{
	struct ionic_qcq *qcq = napi_to_qcq(napi);
	struct ionic_cq *rxcq = napi_to_cq(napi);
	unsigned int qi = rxcq->bound_q->index;
	struct ionic_dev *idev;
	struct ionic_lif *lif;
	struct ionic_cq *txcq;
	u32 rx_work_done = 0;
	u32 tx_work_done = 0;
	u32 flags = 0;

	lif = rxcq->bound_q->lif;
	idev = &lif->ionic->idev;
	txcq = &lif->txqcqs[qi]->cq;

	tx_work_done = ionic_cq_service(txcq, lif->tx_budget,
					ionic_tx_service, NULL, NULL);

	rx_work_done = ionic_cq_service(rxcq, budget,
					ionic_rx_service, NULL, NULL);
	if (rx_work_done)
		ionic_rx_fill_cb(rxcq->bound_q);

	if (rx_work_done < budget && napi_complete_done(napi, rx_work_done)) {
		ionic_dim_update(qcq);
		flags |= IONIC_INTR_CRED_UNMASK;
		rxcq->bound_intr->rearm_count++;
	}

	if (rx_work_done || flags) {
		flags |= IONIC_INTR_CRED_RESET_COALESCE;
		ionic_intr_credits(idev->intr_ctrl, rxcq->bound_intr->index,
				   tx_work_done + rx_work_done, flags);
	}

	DEBUG_STATS_NAPI_POLL(qcq, rx_work_done);
	DEBUG_STATS_NAPI_POLL(qcq, tx_work_done);

	return rx_work_done;
}

static dma_addr_t ionic_tx_map_single(struct ionic_queue *q,
				      void *data, size_t len)
{
	struct ionic_tx_stats *stats = q_to_tx_stats(q);
	struct device *dev = q->lif->ionic->dev;
	dma_addr_t dma_addr;

	dma_addr = dma_map_single(dev, data, len, DMA_TO_DEVICE);
	if (dma_mapping_error(dev, dma_addr)) {
		net_warn_ratelimited("%s: DMA single map failed on %s!\n",
				     q->lif->netdev->name, q->name);
		stats->dma_map_err++;
		return 0;
	}
	return dma_addr;
}

static dma_addr_t ionic_tx_map_frag(struct ionic_queue *q,
				    const skb_frag_t *frag,
				    size_t offset, size_t len)
{
	struct ionic_tx_stats *stats = q_to_tx_stats(q);
	struct device *dev = q->lif->ionic->dev;
	dma_addr_t dma_addr;

	dma_addr = skb_frag_dma_map(dev, frag, offset, len, DMA_TO_DEVICE);
	if (dma_mapping_error(dev, dma_addr)) {
		net_warn_ratelimited("%s: DMA frag map failed on %s!\n",
				     q->lif->netdev->name, q->name);
		stats->dma_map_err++;
	}
	return dma_addr;
}

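/* Completion cleanup for one Tx descriptor: undo the DMA mappings set up
 * at transmit time (a single mapping for the head, page mappings for the
 * SG elements and non-first TSO descriptors), wake the subqueue if it
 * was stopped waiting for space, and free the skb on the descriptor that
 * carried it.
 */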
static void ionic_tx_clean(struct ionic_queue *q,
			   struct ionic_desc_info *desc_info,
			   struct ionic_cq_info *cq_info,
			   void *cb_arg)
{
	struct ionic_txq_sg_desc *sg_desc = desc_info->sg_desc;
	struct ionic_txq_sg_elem *elem = sg_desc->elems;
	struct ionic_tx_stats *stats = q_to_tx_stats(q);
	struct ionic_txq_desc *desc = desc_info->desc;
	struct device *dev = q->lif->ionic->dev;
	u8 opcode, flags, nsge;
	u16 queue_index;
	unsigned int i;
	u64 addr;

	decode_txq_desc_cmd(le64_to_cpu(desc->cmd),
			    &opcode, &flags, &nsge, &addr);

	/* use unmap_single only if either this is not TSO,
	 * or this is first descriptor of a TSO
	 */
	if (opcode != IONIC_TXQ_DESC_OPCODE_TSO ||
	    flags & IONIC_TXQ_DESC_FLAG_TSO_SOT)
		dma_unmap_single(dev, (dma_addr_t)addr,
				 le16_to_cpu(desc->len), DMA_TO_DEVICE);
	else
		dma_unmap_page(dev, (dma_addr_t)addr,
			       le16_to_cpu(desc->len), DMA_TO_DEVICE);

	for (i = 0; i < nsge; i++, elem++)
		dma_unmap_page(dev, (dma_addr_t)le64_to_cpu(elem->addr),
			       le16_to_cpu(elem->len), DMA_TO_DEVICE);

	if (cb_arg) {
		struct sk_buff *skb = cb_arg;
		u32 len = skb->len;

		queue_index = skb_get_queue_mapping(skb);
		if (unlikely(__netif_subqueue_stopped(q->lif->netdev,
						      queue_index))) {
			netif_wake_subqueue(q->lif->netdev, queue_index);
			q->wake++;
		}
		dev_kfree_skb_any(skb);
		stats->clean++;
		netdev_tx_completed_queue(q_to_ndq(q), 1, len);
	}
}

static bool ionic_tx_service(struct ionic_cq *cq, struct ionic_cq_info *cq_info)
{
	struct ionic_txq_comp *comp = cq_info->cq_desc;
	struct ionic_queue *q = cq->bound_q;
	struct ionic_desc_info *desc_info;
	u16 index;

	if (!color_match(comp->color, cq->done_color))
		return false;

	/* clean the related q entries, there could be
	 * several q entries completed for each cq completion
	 */
	do {
		desc_info = &q->info[q->tail_idx];
		index = q->tail_idx;
		q->tail_idx = (q->tail_idx + 1) & (q->num_descs - 1);
		ionic_tx_clean(q, desc_info, cq_info, desc_info->cb_arg);
		desc_info->cb = NULL;
		desc_info->cb_arg = NULL;
	} while (index != le16_to_cpu(comp->comp_index));

	return true;
}

void ionic_tx_flush(struct ionic_cq *cq)
{
	struct ionic_dev *idev = &cq->lif->ionic->idev;
	u32 work_done;

	work_done = ionic_cq_service(cq, cq->num_descs,
				     ionic_tx_service, NULL, NULL);
	if (work_done)
		ionic_intr_credits(idev->intr_ctrl, cq->bound_intr->index,
				   work_done, IONIC_INTR_CRED_RESET_COALESCE);
}

void ionic_tx_empty(struct ionic_queue *q)
{
	struct ionic_desc_info *desc_info;

	/* walk the not completed tx entries, if any */
	while (q->head_idx != q->tail_idx) {
		desc_info = &q->info[q->tail_idx];
		q->tail_idx = (q->tail_idx + 1) & (q->num_descs - 1);
		ionic_tx_clean(q, desc_info, NULL, desc_info->cb_arg);
		desc_info->cb = NULL;
		desc_info->cb_arg = NULL;
	}
}

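/* For TSO the device expects the (inner-most) TCP checksum field to be
 * preloaded with the pseudo-header checksum computed with a zero length;
 * it then adds the per-segment length while building each segment.
 */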
static int ionic_tx_tcp_inner_pseudo_csum(struct sk_buff *skb)
{
	int err;

	err = skb_cow_head(skb, 0);
	if (err)
		return err;

	if (skb->protocol == cpu_to_be16(ETH_P_IP)) {
		inner_ip_hdr(skb)->check = 0;
		inner_tcp_hdr(skb)->check =
			~csum_tcpudp_magic(inner_ip_hdr(skb)->saddr,
					   inner_ip_hdr(skb)->daddr,
					   0, IPPROTO_TCP, 0);
	} else if (skb->protocol == cpu_to_be16(ETH_P_IPV6)) {
		inner_tcp_hdr(skb)->check =
			~csum_ipv6_magic(&inner_ipv6_hdr(skb)->saddr,
					 &inner_ipv6_hdr(skb)->daddr,
					 0, IPPROTO_TCP, 0);
	}

	return 0;
}

static int ionic_tx_tcp_pseudo_csum(struct sk_buff *skb)
{
	int err;

	err = skb_cow_head(skb, 0);
	if (err)
		return err;

	if (skb->protocol == cpu_to_be16(ETH_P_IP)) {
		ip_hdr(skb)->check = 0;
		tcp_hdr(skb)->check =
			~csum_tcpudp_magic(ip_hdr(skb)->saddr,
					   ip_hdr(skb)->daddr,
					   0, IPPROTO_TCP, 0);
	} else if (skb->protocol == cpu_to_be16(ETH_P_IPV6)) {
		tcp_v6_gso_csum_prep(skb);
	}

	return 0;
}

static void ionic_tx_tso_post(struct ionic_queue *q, struct ionic_txq_desc *desc,
			      struct sk_buff *skb,
			      dma_addr_t addr, u8 nsge, u16 len,
			      unsigned int hdrlen, unsigned int mss,
			      bool outer_csum,
			      u16 vlan_tci, bool has_vlan,
			      bool start, bool done)
{
	u8 flags = 0;
	u64 cmd;

	flags |= has_vlan ? IONIC_TXQ_DESC_FLAG_VLAN : 0;
	flags |= outer_csum ? IONIC_TXQ_DESC_FLAG_ENCAP : 0;
	flags |= start ? IONIC_TXQ_DESC_FLAG_TSO_SOT : 0;
	flags |= done ? IONIC_TXQ_DESC_FLAG_TSO_EOT : 0;

	cmd = encode_txq_desc_cmd(IONIC_TXQ_DESC_OPCODE_TSO, flags, nsge, addr);
	desc->cmd = cpu_to_le64(cmd);
	desc->len = cpu_to_le16(len);
	desc->vlan_tci = cpu_to_le16(vlan_tci);
	desc->hdr_len = cpu_to_le16(hdrlen);
	desc->mss = cpu_to_le16(mss);

	if (done) {
		skb_tx_timestamp(skb);
		netdev_tx_sent_queue(q_to_ndq(q), skb->len);
		ionic_txq_post(q, !netdev_xmit_more(), ionic_tx_clean, skb);
	} else {
		ionic_txq_post(q, false, ionic_tx_clean, NULL);
	}
}

static struct ionic_txq_desc *ionic_tx_tso_next(struct ionic_queue *q,
						struct ionic_txq_sg_elem **elem)
{
	struct ionic_txq_sg_desc *sg_desc = q->info[q->head_idx].txq_sg_desc;
	struct ionic_txq_desc *desc = q->info[q->head_idx].txq_desc;

	*elem = sg_desc->elems;
	return desc;
}

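/* TSO transmit: the skb is chopped into hdrlen + mss sized pieces, one
 * Tx descriptor per resulting segment, walking first the linear head and
 * then each page fragment.  Data that continues a segment across a
 * fragment boundary goes into SG elements of the same descriptor.  On a
 * mapping failure, everything posted so far for this skb is unwound and
 * the queue head index is restored.
 */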
static int ionic_tx_tso(struct ionic_queue *q, struct sk_buff *skb)
{
	struct ionic_tx_stats *stats = q_to_tx_stats(q);
	struct ionic_desc_info *rewind_desc_info;
	struct device *dev = q->lif->ionic->dev;
	struct ionic_txq_sg_elem *elem;
	struct ionic_txq_desc *desc;
	unsigned int frag_left = 0;
	unsigned int offset = 0;
	u16 abort = q->head_idx;
	unsigned int len_left;
	dma_addr_t desc_addr;
	unsigned int hdrlen;
	unsigned int nfrags;
	unsigned int seglen;
	u64 total_bytes = 0;
	u64 total_pkts = 0;
	u16 rewind = abort;
	unsigned int left;
	unsigned int len;
	unsigned int mss;
	skb_frag_t *frag;
	bool start, done;
	bool outer_csum;
	dma_addr_t addr;
	bool has_vlan;
	u16 desc_len;
	u8 desc_nsge;
	u16 vlan_tci;
	bool encap;
	int err;

	mss = skb_shinfo(skb)->gso_size;
	nfrags = skb_shinfo(skb)->nr_frags;
	len_left = skb->len - skb_headlen(skb);
	outer_csum = (skb_shinfo(skb)->gso_type & SKB_GSO_GRE_CSUM) ||
		     (skb_shinfo(skb)->gso_type & SKB_GSO_UDP_TUNNEL_CSUM);
	has_vlan = !!skb_vlan_tag_present(skb);
	vlan_tci = skb_vlan_tag_get(skb);
	encap = skb->encapsulation;

	/* Preload inner-most TCP csum field with IP pseudo hdr
	 * calculated with IP length set to zero. HW will later
	 * add in length to each TCP segment resulting from the TSO.
	 */

	if (encap)
		err = ionic_tx_tcp_inner_pseudo_csum(skb);
	else
		err = ionic_tx_tcp_pseudo_csum(skb);
	if (err)
		return err;

	if (encap)
		hdrlen = skb_inner_transport_header(skb) - skb->data +
			 inner_tcp_hdrlen(skb);
	else
		hdrlen = skb_transport_offset(skb) + tcp_hdrlen(skb);

	seglen = hdrlen + mss;
	left = skb_headlen(skb);

	desc = ionic_tx_tso_next(q, &elem);
	start = true;

	/* Chop skb->data up into desc segments */

	while (left > 0) {
		len = min(seglen, left);
		frag_left = seglen - len;
		desc_addr = ionic_tx_map_single(q, skb->data + offset, len);
		if (dma_mapping_error(dev, desc_addr))
			goto err_out_abort;
		desc_len = len;
		desc_nsge = 0;
		left -= len;
		offset += len;
		if (nfrags > 0 && frag_left > 0)
			continue;
		done = (nfrags == 0 && left == 0);
		ionic_tx_tso_post(q, desc, skb,
				  desc_addr, desc_nsge, desc_len,
				  hdrlen, mss,
				  outer_csum,
				  vlan_tci, has_vlan,
				  start, done);
		total_pkts++;
		total_bytes += start ? len : len + hdrlen;
		desc = ionic_tx_tso_next(q, &elem);
		start = false;
		seglen = mss;
	}

	/* Chop skb frags into desc segments */

	for (frag = skb_shinfo(skb)->frags; len_left; frag++) {
		offset = 0;
		left = skb_frag_size(frag);
		len_left -= left;
		nfrags--;
		stats->frags++;

		while (left > 0) {
			if (frag_left > 0) {
				len = min(frag_left, left);
				frag_left -= len;
				addr = ionic_tx_map_frag(q, frag, offset, len);
				if (dma_mapping_error(dev, addr))
					goto err_out_abort;
				elem->addr = cpu_to_le64(addr);
				elem->len = cpu_to_le16(len);
				elem++;
				desc_nsge++;
				left -= len;
				offset += len;
				if (nfrags > 0 && frag_left > 0)
					continue;
				done = (nfrags == 0 && left == 0);
				ionic_tx_tso_post(q, desc, skb, desc_addr,
						  desc_nsge, desc_len,
						  hdrlen, mss, outer_csum,
						  vlan_tci, has_vlan,
						  start, done);
				total_pkts++;
				total_bytes += start ? len : len + hdrlen;
				desc = ionic_tx_tso_next(q, &elem);
				start = false;
			} else {
				len = min(mss, left);
				frag_left = mss - len;
				desc_addr = ionic_tx_map_frag(q, frag,
							      offset, len);
				if (dma_mapping_error(dev, desc_addr))
					goto err_out_abort;
				desc_len = len;
				desc_nsge = 0;
				left -= len;
				offset += len;
				if (nfrags > 0 && frag_left > 0)
					continue;
				done = (nfrags == 0 && left == 0);
				ionic_tx_tso_post(q, desc, skb, desc_addr,
						  desc_nsge, desc_len,
						  hdrlen, mss, outer_csum,
						  vlan_tci, has_vlan,
						  start, done);
				total_pkts++;
				total_bytes += start ? len : len + hdrlen;
				desc = ionic_tx_tso_next(q, &elem);
				start = false;
			}
		}
	}

	stats->pkts += total_pkts;
	stats->bytes += total_bytes;
	stats->tso++;
	stats->tso_bytes += total_bytes;

	return 0;

err_out_abort:
	while (rewind != q->head_idx) {
		rewind_desc_info = &q->info[rewind];
		ionic_tx_clean(q, rewind_desc_info, NULL, NULL);
		rewind = (rewind + 1) & (q->num_descs - 1);
	}
	q->head_idx = abort;

	return -ENOMEM;
}

static int ionic_tx_calc_csum(struct ionic_queue *q, struct sk_buff *skb)
{
	struct ionic_txq_desc *desc = q->info[q->head_idx].txq_desc;
	struct ionic_tx_stats *stats = q_to_tx_stats(q);
	struct device *dev = q->lif->ionic->dev;
	dma_addr_t dma_addr;
	bool has_vlan;
	u8 flags = 0;
	bool encap;
	u64 cmd;

	has_vlan = !!skb_vlan_tag_present(skb);
	encap = skb->encapsulation;

	dma_addr = ionic_tx_map_single(q, skb->data, skb_headlen(skb));
	if (dma_mapping_error(dev, dma_addr))
		return -ENOMEM;

	flags |= has_vlan ? IONIC_TXQ_DESC_FLAG_VLAN : 0;
	flags |= encap ? IONIC_TXQ_DESC_FLAG_ENCAP : 0;

	cmd = encode_txq_desc_cmd(IONIC_TXQ_DESC_OPCODE_CSUM_PARTIAL,
				  flags, skb_shinfo(skb)->nr_frags, dma_addr);
	desc->cmd = cpu_to_le64(cmd);
	desc->len = cpu_to_le16(skb_headlen(skb));
	desc->csum_start = cpu_to_le16(skb_checksum_start_offset(skb));
	desc->csum_offset = cpu_to_le16(skb->csum_offset);
	if (has_vlan) {
		desc->vlan_tci = cpu_to_le16(skb_vlan_tag_get(skb));
		stats->vlan_inserted++;
	}

	if (skb->csum_not_inet)
		stats->crc32_csum++;
	else
		stats->csum++;

	return 0;
}

static int ionic_tx_calc_no_csum(struct ionic_queue *q, struct sk_buff *skb)
{
	struct ionic_txq_desc *desc = q->info[q->head_idx].txq_desc;
	struct ionic_tx_stats *stats = q_to_tx_stats(q);
	struct device *dev = q->lif->ionic->dev;
	dma_addr_t dma_addr;
	bool has_vlan;
	u8 flags = 0;
	bool encap;
	u64 cmd;

	has_vlan = !!skb_vlan_tag_present(skb);
	encap = skb->encapsulation;

	dma_addr = ionic_tx_map_single(q, skb->data, skb_headlen(skb));
	if (dma_mapping_error(dev, dma_addr))
		return -ENOMEM;

	flags |= has_vlan ? IONIC_TXQ_DESC_FLAG_VLAN : 0;
	flags |= encap ? IONIC_TXQ_DESC_FLAG_ENCAP : 0;

	cmd = encode_txq_desc_cmd(IONIC_TXQ_DESC_OPCODE_CSUM_NONE,
				  flags, skb_shinfo(skb)->nr_frags, dma_addr);
	desc->cmd = cpu_to_le64(cmd);
	desc->len = cpu_to_le16(skb_headlen(skb));
	if (has_vlan) {
		desc->vlan_tci = cpu_to_le16(skb_vlan_tag_get(skb));
		stats->vlan_inserted++;
	}

	stats->csum_none++;

	return 0;
}

static int ionic_tx_skb_frags(struct ionic_queue *q, struct sk_buff *skb)
{
	struct ionic_txq_sg_desc *sg_desc = q->info[q->head_idx].txq_sg_desc;
	unsigned int len_left = skb->len - skb_headlen(skb);
	struct ionic_txq_sg_elem *elem = sg_desc->elems;
	struct ionic_tx_stats *stats = q_to_tx_stats(q);
	struct device *dev = q->lif->ionic->dev;
	dma_addr_t dma_addr;
	skb_frag_t *frag;
	u16 len;

	for (frag = skb_shinfo(skb)->frags; len_left; frag++, elem++) {
		len = skb_frag_size(frag);
		elem->len = cpu_to_le16(len);
		dma_addr = ionic_tx_map_frag(q, frag, 0, len);
		if (dma_mapping_error(dev, dma_addr))
			return -ENOMEM;
		elem->addr = cpu_to_le64(dma_addr);
		len_left -= len;
		stats->frags++;
	}

	return 0;
}

static int ionic_tx(struct ionic_queue *q, struct sk_buff *skb)
{
	struct ionic_tx_stats *stats = q_to_tx_stats(q);
	int err;

	/* set up the initial descriptor */
	if (skb->ip_summed == CHECKSUM_PARTIAL)
		err = ionic_tx_calc_csum(q, skb);
	else
		err = ionic_tx_calc_no_csum(q, skb);
	if (err)
		return err;

	/* add frags */
	err = ionic_tx_skb_frags(q, skb);
	if (err)
		return err;

	skb_tx_timestamp(skb);
	stats->pkts++;
	stats->bytes += skb->len;

	netdev_tx_sent_queue(q_to_ndq(q), skb->len);
	ionic_txq_post(q, !netdev_xmit_more(), ionic_tx_clean, skb);

	return 0;
}

static int ionic_tx_descs_needed(struct ionic_queue *q, struct sk_buff *skb)
{
	int sg_elems = q->lif->qtype_info[IONIC_QTYPE_TXQ].max_sg_elems;
	struct ionic_tx_stats *stats = q_to_tx_stats(q);
	int err;

	/* If TSO, need roundup(skb->len/mss) descs */
	if (skb_is_gso(skb))
		return (skb->len / skb_shinfo(skb)->gso_size) + 1;

	/* If non-TSO, just need 1 desc and nr_frags sg elems */
	if (skb_shinfo(skb)->nr_frags <= sg_elems)
		return 1;

	/* Too many frags, so linearize */
	err = skb_linearize(skb);
	if (err)
		return err;

	stats->linearize++;

	/* Need 1 desc and zero sg elems */
	return 1;
}

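/* Stop the subqueue when there is no room for ndescs more descriptors.
 * A completion can race with the stop, so re-check for space after
 * stopping (the smp_rmb() orders the re-read of the queue indices) and
 * wake the queue again if room appeared.
 */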
static int ionic_maybe_stop_tx(struct ionic_queue *q, int ndescs)
{
	int stopped = 0;

	if (unlikely(!ionic_q_has_space(q, ndescs))) {
		netif_stop_subqueue(q->lif->netdev, q->index);
		q->stop++;
		stopped = 1;

		/* Might race with ionic_tx_clean, check again */
		smp_rmb();
		if (ionic_q_has_space(q, ndescs)) {
			netif_wake_subqueue(q->lif->netdev, q->index);
			stopped = 0;
		}
	}

	return stopped;
}

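/* ndo_start_xmit entry point: pick the Tx queue, make sure enough
 * descriptors are available (linearizing over-fragmented skbs), then take
 * the TSO or regular transmit path.  The queue is stopped a little early,
 * while a few descriptors remain, so the next packet always has room.
 */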
netdev_tx_t ionic_start_xmit(struct sk_buff *skb, struct net_device *netdev)
{
	u16 queue_index = skb_get_queue_mapping(skb);
	struct ionic_lif *lif = netdev_priv(netdev);
	struct ionic_queue *q;
	int ndescs;
	int err;

	if (unlikely(!test_bit(IONIC_LIF_F_UP, lif->state))) {
		dev_kfree_skb(skb);
		return NETDEV_TX_OK;
	}

	if (unlikely(queue_index >= lif->nxqs))
		queue_index = 0;
	q = &lif->txqcqs[queue_index]->q;

	ndescs = ionic_tx_descs_needed(q, skb);
	if (ndescs < 0)
		goto err_out_drop;

	if (unlikely(ionic_maybe_stop_tx(q, ndescs)))
		return NETDEV_TX_BUSY;

	if (skb_is_gso(skb))
		err = ionic_tx_tso(q, skb);
	else
		err = ionic_tx(q, skb);

	if (err)
		goto err_out_drop;

	/* Stop the queue if there aren't descriptors for the next packet.
	 * Since our SG lists per descriptor take care of most of the possible
	 * fragmentation, we don't need to have many descriptors available.
	 */
	ionic_maybe_stop_tx(q, 4);

	return NETDEV_TX_OK;

err_out_drop:
	q->stop++;
	q->drop++;
	dev_kfree_skb(skb);
	return NETDEV_TX_OK;
}