1 /*
2 * Huawei HiNIC PCI Express Linux driver
3 * Copyright(c) 2017 Huawei Technologies Co., Ltd
4 *
5 * This program is free software; you can redistribute it and/or modify it
6 * under the terms and conditions of the GNU General Public License,
7 * version 2, as published by the Free Software Foundation.
8 *
9 * This program is distributed in the hope it will be useful, but WITHOUT
10 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
11 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
12 * for more details.
13 *
14 */
15
16 #include <linux/kernel.h>
17 #include <linux/types.h>
18 #include <linux/pci.h>
19 #include <linux/device.h>
20 #include <linux/dma-mapping.h>
21 #include <linux/vmalloc.h>
22 #include <linux/errno.h>
23 #include <linux/sizes.h>
24 #include <linux/atomic.h>
25 #include <linux/skbuff.h>
26 #include <linux/io.h>
27 #include <asm/barrier.h>
28 #include <asm/byteorder.h>
29
30 #include "hinic_common.h"
31 #include "hinic_hw_if.h"
32 #include "hinic_hw_wqe.h"
33 #include "hinic_hw_wq.h"
34 #include "hinic_hw_qp_ctxt.h"
35 #include "hinic_hw_qp.h"
36 #include "hinic_hw_io.h"
37
/* Offset added to the doorbell base address to get the SQ doorbell base */
#define SQ_DB_OFF               SZ_2K

/* The number of cache line to prefetch Until threshold state */
#define WQ_PREFETCH_MAX         2
/* The number of cache line to prefetch After threshold state */
#define WQ_PREFETCH_MIN         1
/* Threshold state */
#define WQ_PREFETCH_THRESHOLD   256

/* sizes of the SQ/RQ ctxt */
#define Q_CTXT_SIZE             48
#define CTXT_RSVD               240

/*
 * Offset of a queue context: CTXT_RSVD per queue (SQs and RQs) comes first,
 * then the max_sqs SQ contexts, then the RQ contexts.
 */
#define SQ_CTXT_OFFSET(max_sqs, max_rqs, q_id)  \
		(((max_rqs) + (max_sqs)) * CTXT_RSVD + (q_id) * Q_CTXT_SIZE)

/* Every argument is parenthesized so expression arguments expand safely */
#define RQ_CTXT_OFFSET(max_sqs, max_rqs, q_id)  \
		(((max_rqs) + (max_sqs)) * CTXT_RSVD + \
		 ((max_sqs) + (q_id)) * Q_CTXT_SIZE)

/* Size conversions: bytes -> 16 byte units, bytes -> 8 byte units and back */
#define SIZE_16BYTES(size)              (ALIGN(size, 16) >> 4)
#define SIZE_8BYTES(size)               (ALIGN(size, 8) >> 3)
#define SECT_SIZE_FROM_8BYTES(size)     ((size) << 3)

/* The bits of the prod idx above the low 8 go into the doorbell value */
#define SQ_DB_PI_HI_SHIFT       8
#define SQ_DB_PI_HI(prod_idx)   ((prod_idx) >> SQ_DB_PI_HI_SHIFT)

/* The low 8 bits of the prod idx select the u64 slot of the doorbell */
#define SQ_DB_PI_LOW_MASK       0xFF
#define SQ_DB_PI_LOW(prod_idx)  ((prod_idx) & SQ_DB_PI_LOW_MASK)

#define SQ_DB_ADDR(sq, pi)      ((u64 *)((sq)->db_base) + SQ_DB_PI_LOW(pi))

/* Wrap an index by the mask of the queue's wq */
#define SQ_MASKED_IDX(sq, idx)  ((idx) & (sq)->wq->mask)
#define RQ_MASKED_IDX(rq, idx)  ((idx) & (rq)->wq->mask)

/* MSS value set in the queue_info of every SQ ctrl section */
#define TX_MAX_MSS_DEFAULT      0x3E00

/* Value for the DATA_FORMAT field of the SQ ctrl section */
enum sq_wqe_type {
	SQ_NORMAL_WQE = 0,
};

/* Value for the COMPLETE_FORMAT field of the RQ ctrl section */
enum rq_completion_fmt {
	RQ_COMPLETE_SGE = 1,
};
82
/**
 * hinic_qp_prepare_header - fill the header of a QP context block
 * @qp_ctxt_hdr: header to fill
 * @ctxt_type: type of the contexts that follow the header (SQ or RQ)
 * @num_queues: number of queues stored in the header
 * @max_queues: used as both the max SQs and the max RQs for the offset
 *
 * The address offset is stored in units of 16 bytes and the whole header
 * is converted in place by hinic_cpu_to_be32().
 **/
void hinic_qp_prepare_header(struct hinic_qp_ctxt_header *qp_ctxt_hdr,
			     enum hinic_qp_ctxt_type ctxt_type,
			     u16 num_queues, u16 max_queues)
{
	qp_ctxt_hdr->num_queues = num_queues;
	qp_ctxt_hdr->queue_type = ctxt_type;

	/* Offset of the first (q_id 0) context of the requested type */
	qp_ctxt_hdr->addr_offset = (ctxt_type == HINIC_QP_CTXT_TYPE_SQ) ?
			SQ_CTXT_OFFSET(max_queues, max_queues, 0) :
			RQ_CTXT_OFFSET(max_queues, max_queues, 0);

	qp_ctxt_hdr->addr_offset = SIZE_16BYTES(qp_ctxt_hdr->addr_offset);

	hinic_cpu_to_be32(qp_ctxt_hdr, sizeof(*qp_ctxt_hdr));
}
102
/**
 * hinic_sq_prepare_ctxt - fill the context of a Send Queue
 * @sq_ctxt: SQ context to fill
 * @sq: HW Send Queue the context is built from
 * @global_qid: queue id set in the GLOBAL_SQ_ID field of ceq_attr
 *
 * The context is built from the current wq indices and from the PFNs of
 * the first wq page and of the wq block, then converted in place by
 * hinic_cpu_to_be32().
 **/
void hinic_sq_prepare_ctxt(struct hinic_sq_ctxt *sq_ctxt,
			   struct hinic_sq *sq, u16 global_qid)
{
	struct hinic_wq *wq = sq->wq;
	u16 ci_start = atomic_read(&wq->cons_idx);
	u16 pi_start = atomic_read(&wq->prod_idx);
	u32 page_pfn_hi, page_pfn_lo, block_pfn_hi, block_pfn_lo;
	u64 first_page_addr, page_pfn, block_pfn;

	/* Read the first page paddr from the WQ page paddr ptrs */
	first_page_addr = be64_to_cpu(*wq->block_vaddr);

	page_pfn = HINIC_WQ_PAGE_PFN(first_page_addr);
	page_pfn_lo = lower_32_bits(page_pfn);
	page_pfn_hi = upper_32_bits(page_pfn);

	block_pfn = HINIC_WQ_BLOCK_PFN(wq->block_paddr);
	block_pfn_lo = lower_32_bits(block_pfn);
	block_pfn_hi = upper_32_bits(block_pfn);

	/* Queue identity and indices */
	sq_ctxt->ceq_attr =
		HINIC_SQ_CTXT_CEQ_ATTR_SET(global_qid, GLOBAL_SQ_ID) |
		HINIC_SQ_CTXT_CEQ_ATTR_SET(0, EN);

	sq_ctxt->ci_wrapped =
		HINIC_SQ_CTXT_CI_SET(ci_start, IDX) |
		HINIC_SQ_CTXT_CI_SET(1, WRAPPED);

	/* First wq page */
	sq_ctxt->wq_hi_pfn_pi =
		HINIC_SQ_CTXT_WQ_PAGE_SET(page_pfn_hi, HI_PFN) |
		HINIC_SQ_CTXT_WQ_PAGE_SET(pi_start, PI);
	sq_ctxt->wq_lo_pfn = page_pfn_lo;

	/* Prefetch attributes */
	sq_ctxt->pref_cache =
		HINIC_SQ_CTXT_PREF_SET(WQ_PREFETCH_MIN, CACHE_MIN) |
		HINIC_SQ_CTXT_PREF_SET(WQ_PREFETCH_MAX, CACHE_MAX) |
		HINIC_SQ_CTXT_PREF_SET(WQ_PREFETCH_THRESHOLD, CACHE_THRESHOLD);
	sq_ctxt->pref_wrapped = 1;
	sq_ctxt->pref_wq_hi_pfn_ci =
		HINIC_SQ_CTXT_PREF_SET(ci_start, CI) |
		HINIC_SQ_CTXT_PREF_SET(page_pfn_hi, WQ_HI_PFN);
	sq_ctxt->pref_wq_lo_pfn = page_pfn_lo;

	/* wq block */
	sq_ctxt->wq_block_hi_pfn =
		HINIC_SQ_CTXT_WQ_BLOCK_SET(block_pfn_hi, HI_PFN);
	sq_ctxt->wq_block_lo_pfn = block_pfn_lo;

	hinic_cpu_to_be32(sq_ctxt, sizeof(*sq_ctxt));
}
159
/**
 * hinic_rq_prepare_ctxt - fill the context of a Receive Queue
 * @rq_ctxt: RQ context to fill
 * @rq: HW Receive Queue the context is built from
 * @global_qid: global queue id (not used when building the RQ context)
 *
 * The context is built from the current wq indices, the msix entry and PI
 * dma address of the rq and the PFNs of the first wq page and of the wq
 * block, then converted in place by hinic_cpu_to_be32().
 **/
void hinic_rq_prepare_ctxt(struct hinic_rq_ctxt *rq_ctxt,
			   struct hinic_rq *rq, u16 global_qid)
{
	struct hinic_wq *wq = rq->wq;
	u16 ci_start = atomic_read(&wq->cons_idx);
	u16 pi_start = atomic_read(&wq->prod_idx);
	u32 page_pfn_hi, page_pfn_lo, block_pfn_hi, block_pfn_lo;
	u64 first_page_addr, page_pfn, block_pfn;

	/* Read the first page paddr from the WQ page paddr ptrs */
	first_page_addr = be64_to_cpu(*wq->block_vaddr);

	page_pfn = HINIC_WQ_PAGE_PFN(first_page_addr);
	page_pfn_lo = lower_32_bits(page_pfn);
	page_pfn_hi = upper_32_bits(page_pfn);

	block_pfn = HINIC_WQ_BLOCK_PFN(wq->block_paddr);
	block_pfn_lo = lower_32_bits(block_pfn);
	block_pfn_hi = upper_32_bits(block_pfn);

	/* Queue attributes and indices */
	rq_ctxt->ceq_attr =
		HINIC_RQ_CTXT_CEQ_ATTR_SET(0, EN) |
		HINIC_RQ_CTXT_CEQ_ATTR_SET(1, WRAPPED);

	rq_ctxt->pi_intr_attr =
		HINIC_RQ_CTXT_PI_SET(pi_start, IDX) |
		HINIC_RQ_CTXT_PI_SET(rq->msix_entry, INTR);

	/* First wq page */
	rq_ctxt->wq_hi_pfn_ci =
		HINIC_RQ_CTXT_WQ_PAGE_SET(page_pfn_hi, HI_PFN) |
		HINIC_RQ_CTXT_WQ_PAGE_SET(ci_start, CI);
	rq_ctxt->wq_lo_pfn = page_pfn_lo;

	/* Prefetch attributes */
	rq_ctxt->pref_cache =
		HINIC_RQ_CTXT_PREF_SET(WQ_PREFETCH_MIN, CACHE_MIN) |
		HINIC_RQ_CTXT_PREF_SET(WQ_PREFETCH_MAX, CACHE_MAX) |
		HINIC_RQ_CTXT_PREF_SET(WQ_PREFETCH_THRESHOLD, CACHE_THRESHOLD);
	rq_ctxt->pref_wrapped = 1;
	rq_ctxt->pref_wq_hi_pfn_ci =
		HINIC_RQ_CTXT_PREF_SET(page_pfn_hi, WQ_HI_PFN) |
		HINIC_RQ_CTXT_PREF_SET(ci_start, CI);
	rq_ctxt->pref_wq_lo_pfn = page_pfn_lo;

	/* dma address of the PI that hinic_rq_update() writes */
	rq_ctxt->pi_paddr_hi = upper_32_bits(rq->pi_dma_addr);
	rq_ctxt->pi_paddr_lo = lower_32_bits(rq->pi_dma_addr);

	/* wq block */
	rq_ctxt->wq_block_hi_pfn =
		HINIC_RQ_CTXT_WQ_BLOCK_SET(block_pfn_hi, HI_PFN);
	rq_ctxt->wq_block_lo_pfn = block_pfn_lo;

	hinic_cpu_to_be32(rq_ctxt, sizeof(*rq_ctxt));
}
218
219 /**
220 * alloc_sq_skb_arr - allocate sq array for saved skb
221 * @sq: HW Send Queue
222 *
223 * Return 0 - Success, negative - Failure
224 **/
alloc_sq_skb_arr(struct hinic_sq * sq)225 static int alloc_sq_skb_arr(struct hinic_sq *sq)
226 {
227 struct hinic_wq *wq = sq->wq;
228 size_t skb_arr_size;
229
230 skb_arr_size = wq->q_depth * sizeof(*sq->saved_skb);
231 sq->saved_skb = vzalloc(skb_arr_size);
232 if (!sq->saved_skb)
233 return -ENOMEM;
234
235 return 0;
236 }
237
238 /**
239 * free_sq_skb_arr - free sq array for saved skb
240 * @sq: HW Send Queue
241 **/
free_sq_skb_arr(struct hinic_sq * sq)242 static void free_sq_skb_arr(struct hinic_sq *sq)
243 {
244 vfree(sq->saved_skb);
245 }
246
247 /**
248 * alloc_rq_skb_arr - allocate rq array for saved skb
249 * @rq: HW Receive Queue
250 *
251 * Return 0 - Success, negative - Failure
252 **/
alloc_rq_skb_arr(struct hinic_rq * rq)253 static int alloc_rq_skb_arr(struct hinic_rq *rq)
254 {
255 struct hinic_wq *wq = rq->wq;
256 size_t skb_arr_size;
257
258 skb_arr_size = wq->q_depth * sizeof(*rq->saved_skb);
259 rq->saved_skb = vzalloc(skb_arr_size);
260 if (!rq->saved_skb)
261 return -ENOMEM;
262
263 return 0;
264 }
265
266 /**
267 * free_rq_skb_arr - free rq array for saved skb
268 * @rq: HW Receive Queue
269 **/
free_rq_skb_arr(struct hinic_rq * rq)270 static void free_rq_skb_arr(struct hinic_rq *rq)
271 {
272 vfree(rq->saved_skb);
273 }
274
275 /**
276 * hinic_init_sq - Initialize HW Send Queue
277 * @sq: HW Send Queue
278 * @hwif: HW Interface for accessing HW
279 * @wq: Work Queue for the data of the SQ
280 * @entry: msix entry for sq
281 * @ci_addr: address for reading the current HW consumer index
282 * @ci_dma_addr: dma address for reading the current HW consumer index
283 * @db_base: doorbell base address
284 *
285 * Return 0 - Success, negative - Failure
286 **/
hinic_init_sq(struct hinic_sq * sq,struct hinic_hwif * hwif,struct hinic_wq * wq,struct msix_entry * entry,void * ci_addr,dma_addr_t ci_dma_addr,void __iomem * db_base)287 int hinic_init_sq(struct hinic_sq *sq, struct hinic_hwif *hwif,
288 struct hinic_wq *wq, struct msix_entry *entry,
289 void *ci_addr, dma_addr_t ci_dma_addr,
290 void __iomem *db_base)
291 {
292 sq->hwif = hwif;
293
294 sq->wq = wq;
295
296 sq->irq = entry->vector;
297 sq->msix_entry = entry->entry;
298
299 sq->hw_ci_addr = ci_addr;
300 sq->hw_ci_dma_addr = ci_dma_addr;
301
302 sq->db_base = db_base + SQ_DB_OFF;
303
304 return alloc_sq_skb_arr(sq);
305 }
306
/**
 * hinic_clean_sq - release what hinic_init_sq() allocated
 * @sq: HW Send Queue
 *
 * Only the saved skb array is freed here.
 **/
void hinic_clean_sq(struct hinic_sq *sq)
{
	free_sq_skb_arr(sq);
}
315
316 /**
317 * alloc_rq_cqe - allocate rq completion queue elements
318 * @rq: HW Receive Queue
319 *
320 * Return 0 - Success, negative - Failure
321 **/
alloc_rq_cqe(struct hinic_rq * rq)322 static int alloc_rq_cqe(struct hinic_rq *rq)
323 {
324 struct hinic_hwif *hwif = rq->hwif;
325 struct pci_dev *pdev = hwif->pdev;
326 size_t cqe_dma_size, cqe_size;
327 struct hinic_wq *wq = rq->wq;
328 int j, i;
329
330 cqe_size = wq->q_depth * sizeof(*rq->cqe);
331 rq->cqe = vzalloc(cqe_size);
332 if (!rq->cqe)
333 return -ENOMEM;
334
335 cqe_dma_size = wq->q_depth * sizeof(*rq->cqe_dma);
336 rq->cqe_dma = vzalloc(cqe_dma_size);
337 if (!rq->cqe_dma)
338 goto err_cqe_dma_arr_alloc;
339
340 for (i = 0; i < wq->q_depth; i++) {
341 rq->cqe[i] = dma_zalloc_coherent(&pdev->dev,
342 sizeof(*rq->cqe[i]),
343 &rq->cqe_dma[i], GFP_KERNEL);
344 if (!rq->cqe[i])
345 goto err_cqe_alloc;
346 }
347
348 return 0;
349
350 err_cqe_alloc:
351 for (j = 0; j < i; j++)
352 dma_free_coherent(&pdev->dev, sizeof(*rq->cqe[j]), rq->cqe[j],
353 rq->cqe_dma[j]);
354
355 vfree(rq->cqe_dma);
356
357 err_cqe_dma_arr_alloc:
358 vfree(rq->cqe);
359 return -ENOMEM;
360 }
361
362 /**
363 * free_rq_cqe - free rq completion queue elements
364 * @rq: HW Receive Queue
365 **/
free_rq_cqe(struct hinic_rq * rq)366 static void free_rq_cqe(struct hinic_rq *rq)
367 {
368 struct hinic_hwif *hwif = rq->hwif;
369 struct pci_dev *pdev = hwif->pdev;
370 struct hinic_wq *wq = rq->wq;
371 int i;
372
373 for (i = 0; i < wq->q_depth; i++)
374 dma_free_coherent(&pdev->dev, sizeof(*rq->cqe[i]), rq->cqe[i],
375 rq->cqe_dma[i]);
376
377 vfree(rq->cqe_dma);
378 vfree(rq->cqe);
379 }
380
381 /**
382 * hinic_init_rq - Initialize HW Receive Queue
383 * @rq: HW Receive Queue
384 * @hwif: HW Interface for accessing HW
385 * @wq: Work Queue for the data of the RQ
386 * @entry: msix entry for rq
387 *
388 * Return 0 - Success, negative - Failure
389 **/
hinic_init_rq(struct hinic_rq * rq,struct hinic_hwif * hwif,struct hinic_wq * wq,struct msix_entry * entry)390 int hinic_init_rq(struct hinic_rq *rq, struct hinic_hwif *hwif,
391 struct hinic_wq *wq, struct msix_entry *entry)
392 {
393 struct pci_dev *pdev = hwif->pdev;
394 size_t pi_size;
395 int err;
396
397 rq->hwif = hwif;
398
399 rq->wq = wq;
400
401 rq->irq = entry->vector;
402 rq->msix_entry = entry->entry;
403
404 rq->buf_sz = HINIC_RX_BUF_SZ;
405
406 err = alloc_rq_skb_arr(rq);
407 if (err) {
408 dev_err(&pdev->dev, "Failed to allocate rq priv data\n");
409 return err;
410 }
411
412 err = alloc_rq_cqe(rq);
413 if (err) {
414 dev_err(&pdev->dev, "Failed to allocate rq cqe\n");
415 goto err_alloc_rq_cqe;
416 }
417
418 /* HW requirements: Must be at least 32 bit */
419 pi_size = ALIGN(sizeof(*rq->pi_virt_addr), sizeof(u32));
420 rq->pi_virt_addr = dma_zalloc_coherent(&pdev->dev, pi_size,
421 &rq->pi_dma_addr, GFP_KERNEL);
422 if (!rq->pi_virt_addr) {
423 dev_err(&pdev->dev, "Failed to allocate PI address\n");
424 err = -ENOMEM;
425 goto err_pi_virt;
426 }
427
428 return 0;
429
430 err_pi_virt:
431 free_rq_cqe(rq);
432
433 err_alloc_rq_cqe:
434 free_rq_skb_arr(rq);
435 return err;
436 }
437
438 /**
439 * hinic_clean_rq - Clean HW Receive Queue's Resources
440 * @rq: HW Receive Queue
441 **/
hinic_clean_rq(struct hinic_rq * rq)442 void hinic_clean_rq(struct hinic_rq *rq)
443 {
444 struct hinic_hwif *hwif = rq->hwif;
445 struct pci_dev *pdev = hwif->pdev;
446 size_t pi_size;
447
448 pi_size = ALIGN(sizeof(*rq->pi_virt_addr), sizeof(u32));
449 dma_free_coherent(&pdev->dev, pi_size, rq->pi_virt_addr,
450 rq->pi_dma_addr);
451
452 free_rq_cqe(rq);
453 free_rq_skb_arr(rq);
454 }
455
456 /**
457 * hinic_get_sq_free_wqebbs - return number of free wqebbs for use
458 * @sq: send queue
459 *
460 * Return number of free wqebbs
461 **/
hinic_get_sq_free_wqebbs(struct hinic_sq * sq)462 int hinic_get_sq_free_wqebbs(struct hinic_sq *sq)
463 {
464 struct hinic_wq *wq = sq->wq;
465
466 return atomic_read(&wq->delta) - 1;
467 }
468
469 /**
470 * hinic_get_rq_free_wqebbs - return number of free wqebbs for use
471 * @rq: recv queue
472 *
473 * Return number of free wqebbs
474 **/
hinic_get_rq_free_wqebbs(struct hinic_rq * rq)475 int hinic_get_rq_free_wqebbs(struct hinic_rq *rq)
476 {
477 struct hinic_wq *wq = rq->wq;
478
479 return atomic_read(&wq->delta) - 1;
480 }
481
/**
 * sq_prepare_ctrl - fill the ctrl section of a sq wqe
 * @ctrl: ctrl section to fill
 * @prod_idx: pi value (not used by this function)
 * @nr_descs: number of buffer descriptors in the wqe
 *
 * The section lengths are stored in units of 8 bytes.
 **/
static void sq_prepare_ctrl(struct hinic_sq_ctrl *ctrl, u16 prod_idx,
			    int nr_descs)
{
	u32 ctrl_len = SIZE_8BYTES(sizeof(struct hinic_sq_ctrl));
	u32 task_len = SIZE_8BYTES(sizeof(struct hinic_sq_task));
	u32 bufdesc_len = nr_descs * sizeof(struct hinic_sq_bufdesc);

	bufdesc_len = SIZE_8BYTES(bufdesc_len);

	ctrl->ctrl_info =
		HINIC_SQ_CTRL_SET(bufdesc_len, BUFDESC_SECT_LEN) |
		HINIC_SQ_CTRL_SET(task_len, TASKSECT_LEN) |
		HINIC_SQ_CTRL_SET(SQ_NORMAL_WQE, DATA_FORMAT) |
		HINIC_SQ_CTRL_SET(ctrl_len, LEN);

	ctrl->queue_info =
		HINIC_SQ_CTRL_SET(TX_MAX_MSS_DEFAULT, QUEUE_INFO_MSS);
}
500
sq_prepare_task(struct hinic_sq_task * task)501 static void sq_prepare_task(struct hinic_sq_task *task)
502 {
503 task->pkt_info0 =
504 HINIC_SQ_TASK_INFO0_SET(0, L2HDR_LEN) |
505 HINIC_SQ_TASK_INFO0_SET(HINIC_L4_OFF_DISABLE, L4_OFFLOAD) |
506 HINIC_SQ_TASK_INFO0_SET(HINIC_OUTER_L3TYPE_UNKNOWN,
507 INNER_L3TYPE) |
508 HINIC_SQ_TASK_INFO0_SET(HINIC_VLAN_OFF_DISABLE,
509 VLAN_OFFLOAD) |
510 HINIC_SQ_TASK_INFO0_SET(HINIC_PKT_NOT_PARSED, PARSE_FLAG);
511
512 task->pkt_info1 =
513 HINIC_SQ_TASK_INFO1_SET(HINIC_MEDIA_UNKNOWN, MEDIA_TYPE) |
514 HINIC_SQ_TASK_INFO1_SET(0, INNER_L4_LEN) |
515 HINIC_SQ_TASK_INFO1_SET(0, INNER_L3_LEN);
516
517 task->pkt_info2 =
518 HINIC_SQ_TASK_INFO2_SET(0, TUNNEL_L4_LEN) |
519 HINIC_SQ_TASK_INFO2_SET(0, OUTER_L3_LEN) |
520 HINIC_SQ_TASK_INFO2_SET(HINIC_TUNNEL_L4TYPE_UNKNOWN,
521 TUNNEL_L4TYPE) |
522 HINIC_SQ_TASK_INFO2_SET(HINIC_OUTER_L3TYPE_UNKNOWN,
523 OUTER_L3TYPE);
524
525 task->ufo_v6_identify = 0;
526
527 task->pkt_info4 = HINIC_SQ_TASK_INFO4_SET(HINIC_L2TYPE_ETH, L2TYPE);
528
529 task->zero_pad = 0;
530 }
531
532 /**
533 * hinic_sq_prepare_wqe - prepare wqe before insert to the queue
534 * @sq: send queue
535 * @prod_idx: pi value
536 * @sq_wqe: wqe to prepare
537 * @sges: sges for use by the wqe for send for buf addresses
538 * @nr_sges: number of sges
539 **/
hinic_sq_prepare_wqe(struct hinic_sq * sq,u16 prod_idx,struct hinic_sq_wqe * sq_wqe,struct hinic_sge * sges,int nr_sges)540 void hinic_sq_prepare_wqe(struct hinic_sq *sq, u16 prod_idx,
541 struct hinic_sq_wqe *sq_wqe, struct hinic_sge *sges,
542 int nr_sges)
543 {
544 int i;
545
546 sq_prepare_ctrl(&sq_wqe->ctrl, prod_idx, nr_sges);
547
548 sq_prepare_task(&sq_wqe->task);
549
550 for (i = 0; i < nr_sges; i++)
551 sq_wqe->buf_descs[i].sge = sges[i];
552 }
553
554 /**
555 * sq_prepare_db - prepare doorbell to write
556 * @sq: send queue
557 * @prod_idx: pi value for the doorbell
558 * @cos: cos of the doorbell
559 *
560 * Return db value
561 **/
sq_prepare_db(struct hinic_sq * sq,u16 prod_idx,unsigned int cos)562 static u32 sq_prepare_db(struct hinic_sq *sq, u16 prod_idx, unsigned int cos)
563 {
564 struct hinic_qp *qp = container_of(sq, struct hinic_qp, sq);
565 u8 hi_prod_idx = SQ_DB_PI_HI(SQ_MASKED_IDX(sq, prod_idx));
566
567 /* Data should be written to HW in Big Endian Format */
568 return cpu_to_be32(HINIC_SQ_DB_INFO_SET(hi_prod_idx, PI_HI) |
569 HINIC_SQ_DB_INFO_SET(HINIC_DB_SQ_TYPE, TYPE) |
570 HINIC_SQ_DB_INFO_SET(HINIC_DATA_PATH, PATH) |
571 HINIC_SQ_DB_INFO_SET(cos, COS) |
572 HINIC_SQ_DB_INFO_SET(qp->q_id, QID));
573 }
574
575 /**
576 * hinic_sq_write_db- write doorbell
577 * @sq: send queue
578 * @prod_idx: pi value for the doorbell
579 * @wqe_size: wqe size
580 * @cos: cos of the wqe
581 **/
hinic_sq_write_db(struct hinic_sq * sq,u16 prod_idx,unsigned int wqe_size,unsigned int cos)582 void hinic_sq_write_db(struct hinic_sq *sq, u16 prod_idx, unsigned int wqe_size,
583 unsigned int cos)
584 {
585 struct hinic_wq *wq = sq->wq;
586
587 /* increment prod_idx to the next */
588 prod_idx += ALIGN(wqe_size, wq->wqebb_size) / wq->wqebb_size;
589
590 wmb(); /* Write all before the doorbell */
591
592 writel(sq_prepare_db(sq, prod_idx, cos), SQ_DB_ADDR(sq, prod_idx));
593 }
594
595 /**
596 * hinic_sq_get_wqe - get wqe ptr in the current pi and update the pi
597 * @sq: sq to get wqe from
598 * @wqe_size: wqe size
599 * @prod_idx: returned pi
600 *
601 * Return wqe pointer
602 **/
hinic_sq_get_wqe(struct hinic_sq * sq,unsigned int wqe_size,u16 * prod_idx)603 struct hinic_sq_wqe *hinic_sq_get_wqe(struct hinic_sq *sq,
604 unsigned int wqe_size, u16 *prod_idx)
605 {
606 struct hinic_hw_wqe *hw_wqe = hinic_get_wqe(sq->wq, wqe_size,
607 prod_idx);
608
609 if (IS_ERR(hw_wqe))
610 return NULL;
611
612 return &hw_wqe->sq_wqe;
613 }
614
615 /**
616 * hinic_sq_write_wqe - write the wqe to the sq
617 * @sq: send queue
618 * @prod_idx: pi of the wqe
619 * @sq_wqe: the wqe to write
620 * @skb: skb to save
621 * @wqe_size: the size of the wqe
622 **/
hinic_sq_write_wqe(struct hinic_sq * sq,u16 prod_idx,struct hinic_sq_wqe * sq_wqe,struct sk_buff * skb,unsigned int wqe_size)623 void hinic_sq_write_wqe(struct hinic_sq *sq, u16 prod_idx,
624 struct hinic_sq_wqe *sq_wqe,
625 struct sk_buff *skb, unsigned int wqe_size)
626 {
627 struct hinic_hw_wqe *hw_wqe = (struct hinic_hw_wqe *)sq_wqe;
628
629 sq->saved_skb[prod_idx] = skb;
630
631 /* The data in the HW should be in Big Endian Format */
632 hinic_cpu_to_be32(sq_wqe, wqe_size);
633
634 hinic_write_wqe(sq->wq, hw_wqe, wqe_size);
635 }
636
637 /**
638 * hinic_sq_read_wqebb - read wqe ptr in the current ci and update the ci, the
639 * wqe only have one wqebb
640 * @sq: send queue
641 * @skb: return skb that was saved
642 * @wqe_size: the wqe size ptr
643 * @cons_idx: consumer index of the wqe
644 *
645 * Return wqe in ci position
646 **/
hinic_sq_read_wqebb(struct hinic_sq * sq,struct sk_buff ** skb,unsigned int * wqe_size,u16 * cons_idx)647 struct hinic_sq_wqe *hinic_sq_read_wqebb(struct hinic_sq *sq,
648 struct sk_buff **skb,
649 unsigned int *wqe_size, u16 *cons_idx)
650 {
651 struct hinic_hw_wqe *hw_wqe;
652 struct hinic_sq_wqe *sq_wqe;
653 struct hinic_sq_ctrl *ctrl;
654 unsigned int buf_sect_len;
655 u32 ctrl_info;
656
657 /* read the ctrl section for getting wqe size */
658 hw_wqe = hinic_read_wqe(sq->wq, sizeof(*ctrl), cons_idx);
659 if (IS_ERR(hw_wqe))
660 return NULL;
661
662 *skb = sq->saved_skb[*cons_idx];
663
664 sq_wqe = &hw_wqe->sq_wqe;
665 ctrl = &sq_wqe->ctrl;
666 ctrl_info = be32_to_cpu(ctrl->ctrl_info);
667 buf_sect_len = HINIC_SQ_CTRL_GET(ctrl_info, BUFDESC_SECT_LEN);
668
669 *wqe_size = sizeof(*ctrl) + sizeof(sq_wqe->task);
670 *wqe_size += SECT_SIZE_FROM_8BYTES(buf_sect_len);
671 *wqe_size = ALIGN(*wqe_size, sq->wq->wqebb_size);
672
673 return &hw_wqe->sq_wqe;
674 }
675
676 /**
677 * hinic_sq_read_wqe - read wqe ptr in the current ci and update the ci
678 * @sq: send queue
679 * @skb: return skb that was saved
680 * @wqe_size: the size of the wqe
681 * @cons_idx: consumer index of the wqe
682 *
683 * Return wqe in ci position
684 **/
hinic_sq_read_wqe(struct hinic_sq * sq,struct sk_buff ** skb,unsigned int wqe_size,u16 * cons_idx)685 struct hinic_sq_wqe *hinic_sq_read_wqe(struct hinic_sq *sq,
686 struct sk_buff **skb,
687 unsigned int wqe_size, u16 *cons_idx)
688 {
689 struct hinic_hw_wqe *hw_wqe;
690
691 hw_wqe = hinic_read_wqe(sq->wq, wqe_size, cons_idx);
692 *skb = sq->saved_skb[*cons_idx];
693
694 return &hw_wqe->sq_wqe;
695 }
696
697 /**
698 * hinic_sq_put_wqe - release the ci for new wqes
699 * @sq: send queue
700 * @wqe_size: the size of the wqe
701 **/
hinic_sq_put_wqe(struct hinic_sq * sq,unsigned int wqe_size)702 void hinic_sq_put_wqe(struct hinic_sq *sq, unsigned int wqe_size)
703 {
704 hinic_put_wqe(sq->wq, wqe_size);
705 }
706
707 /**
708 * hinic_sq_get_sges - get sges from the wqe
709 * @sq_wqe: wqe to get the sges from its buffer addresses
710 * @sges: returned sges
711 * @nr_sges: number sges to return
712 **/
hinic_sq_get_sges(struct hinic_sq_wqe * sq_wqe,struct hinic_sge * sges,int nr_sges)713 void hinic_sq_get_sges(struct hinic_sq_wqe *sq_wqe, struct hinic_sge *sges,
714 int nr_sges)
715 {
716 int i;
717
718 for (i = 0; i < nr_sges && i < HINIC_MAX_SQ_BUFDESCS; i++) {
719 sges[i] = sq_wqe->buf_descs[i].sge;
720 hinic_be32_to_cpu(&sges[i], sizeof(sges[i]));
721 }
722 }
723
724 /**
725 * hinic_rq_get_wqe - get wqe ptr in the current pi and update the pi
726 * @rq: rq to get wqe from
727 * @wqe_size: wqe size
728 * @prod_idx: returned pi
729 *
730 * Return wqe pointer
731 **/
hinic_rq_get_wqe(struct hinic_rq * rq,unsigned int wqe_size,u16 * prod_idx)732 struct hinic_rq_wqe *hinic_rq_get_wqe(struct hinic_rq *rq,
733 unsigned int wqe_size, u16 *prod_idx)
734 {
735 struct hinic_hw_wqe *hw_wqe = hinic_get_wqe(rq->wq, wqe_size,
736 prod_idx);
737
738 if (IS_ERR(hw_wqe))
739 return NULL;
740
741 return &hw_wqe->rq_wqe;
742 }
743
744 /**
745 * hinic_rq_write_wqe - write the wqe to the rq
746 * @rq: recv queue
747 * @prod_idx: pi of the wqe
748 * @rq_wqe: the wqe to write
749 * @skb: skb to save
750 **/
hinic_rq_write_wqe(struct hinic_rq * rq,u16 prod_idx,struct hinic_rq_wqe * rq_wqe,struct sk_buff * skb)751 void hinic_rq_write_wqe(struct hinic_rq *rq, u16 prod_idx,
752 struct hinic_rq_wqe *rq_wqe, struct sk_buff *skb)
753 {
754 struct hinic_hw_wqe *hw_wqe = (struct hinic_hw_wqe *)rq_wqe;
755
756 rq->saved_skb[prod_idx] = skb;
757
758 /* The data in the HW should be in Big Endian Format */
759 hinic_cpu_to_be32(rq_wqe, sizeof(*rq_wqe));
760
761 hinic_write_wqe(rq->wq, hw_wqe, sizeof(*rq_wqe));
762 }
763
764 /**
765 * hinic_rq_read_wqe - read wqe ptr in the current ci and update the ci
766 * @rq: recv queue
767 * @wqe_size: the size of the wqe
768 * @skb: return saved skb
769 * @cons_idx: consumer index of the wqe
770 *
771 * Return wqe in ci position
772 **/
hinic_rq_read_wqe(struct hinic_rq * rq,unsigned int wqe_size,struct sk_buff ** skb,u16 * cons_idx)773 struct hinic_rq_wqe *hinic_rq_read_wqe(struct hinic_rq *rq,
774 unsigned int wqe_size,
775 struct sk_buff **skb, u16 *cons_idx)
776 {
777 struct hinic_hw_wqe *hw_wqe;
778 struct hinic_rq_cqe *cqe;
779 int rx_done;
780 u32 status;
781
782 hw_wqe = hinic_read_wqe(rq->wq, wqe_size, cons_idx);
783 if (IS_ERR(hw_wqe))
784 return NULL;
785
786 cqe = rq->cqe[*cons_idx];
787
788 status = be32_to_cpu(cqe->status);
789
790 rx_done = HINIC_RQ_CQE_STATUS_GET(status, RXDONE);
791 if (!rx_done)
792 return NULL;
793
794 *skb = rq->saved_skb[*cons_idx];
795
796 return &hw_wqe->rq_wqe;
797 }
798
799 /**
800 * hinic_rq_read_next_wqe - increment ci and read the wqe in ci position
801 * @rq: recv queue
802 * @wqe_size: the size of the wqe
803 * @skb: return saved skb
804 * @cons_idx: consumer index in the wq
805 *
806 * Return wqe in incremented ci position
807 **/
hinic_rq_read_next_wqe(struct hinic_rq * rq,unsigned int wqe_size,struct sk_buff ** skb,u16 * cons_idx)808 struct hinic_rq_wqe *hinic_rq_read_next_wqe(struct hinic_rq *rq,
809 unsigned int wqe_size,
810 struct sk_buff **skb,
811 u16 *cons_idx)
812 {
813 struct hinic_wq *wq = rq->wq;
814 struct hinic_hw_wqe *hw_wqe;
815 unsigned int num_wqebbs;
816
817 wqe_size = ALIGN(wqe_size, wq->wqebb_size);
818 num_wqebbs = wqe_size / wq->wqebb_size;
819
820 *cons_idx = RQ_MASKED_IDX(rq, *cons_idx + num_wqebbs);
821
822 *skb = rq->saved_skb[*cons_idx];
823
824 hw_wqe = hinic_read_wqe_direct(wq, *cons_idx);
825
826 return &hw_wqe->rq_wqe;
827 }
828
829 /**
830 * hinic_put_wqe - release the ci for new wqes
831 * @rq: recv queue
832 * @cons_idx: consumer index of the wqe
833 * @wqe_size: the size of the wqe
834 **/
hinic_rq_put_wqe(struct hinic_rq * rq,u16 cons_idx,unsigned int wqe_size)835 void hinic_rq_put_wqe(struct hinic_rq *rq, u16 cons_idx,
836 unsigned int wqe_size)
837 {
838 struct hinic_rq_cqe *cqe = rq->cqe[cons_idx];
839 u32 status = be32_to_cpu(cqe->status);
840
841 status = HINIC_RQ_CQE_STATUS_CLEAR(status, RXDONE);
842
843 /* Rx WQE size is 1 WQEBB, no wq shadow*/
844 cqe->status = cpu_to_be32(status);
845
846 wmb(); /* clear done flag */
847
848 hinic_put_wqe(rq->wq, wqe_size);
849 }
850
851 /**
852 * hinic_rq_get_sge - get sge from the wqe
853 * @rq: recv queue
854 * @rq_wqe: wqe to get the sge from its buf address
855 * @cons_idx: consumer index
856 * @sge: returned sge
857 **/
hinic_rq_get_sge(struct hinic_rq * rq,struct hinic_rq_wqe * rq_wqe,u16 cons_idx,struct hinic_sge * sge)858 void hinic_rq_get_sge(struct hinic_rq *rq, struct hinic_rq_wqe *rq_wqe,
859 u16 cons_idx, struct hinic_sge *sge)
860 {
861 struct hinic_rq_cqe *cqe = rq->cqe[cons_idx];
862 u32 len = be32_to_cpu(cqe->len);
863
864 sge->hi_addr = be32_to_cpu(rq_wqe->buf_desc.hi_addr);
865 sge->lo_addr = be32_to_cpu(rq_wqe->buf_desc.lo_addr);
866 sge->len = HINIC_RQ_CQE_SGE_GET(len, LEN);
867 }
868
869 /**
870 * hinic_rq_prepare_wqe - prepare wqe before insert to the queue
871 * @rq: recv queue
872 * @prod_idx: pi value
873 * @rq_wqe: the wqe
874 * @sge: sge for use by the wqe for recv buf address
875 **/
hinic_rq_prepare_wqe(struct hinic_rq * rq,u16 prod_idx,struct hinic_rq_wqe * rq_wqe,struct hinic_sge * sge)876 void hinic_rq_prepare_wqe(struct hinic_rq *rq, u16 prod_idx,
877 struct hinic_rq_wqe *rq_wqe, struct hinic_sge *sge)
878 {
879 struct hinic_rq_cqe_sect *cqe_sect = &rq_wqe->cqe_sect;
880 struct hinic_rq_bufdesc *buf_desc = &rq_wqe->buf_desc;
881 struct hinic_rq_cqe *cqe = rq->cqe[prod_idx];
882 struct hinic_rq_ctrl *ctrl = &rq_wqe->ctrl;
883 dma_addr_t cqe_dma = rq->cqe_dma[prod_idx];
884
885 ctrl->ctrl_info =
886 HINIC_RQ_CTRL_SET(SIZE_8BYTES(sizeof(*ctrl)), LEN) |
887 HINIC_RQ_CTRL_SET(SIZE_8BYTES(sizeof(*cqe_sect)),
888 COMPLETE_LEN) |
889 HINIC_RQ_CTRL_SET(SIZE_8BYTES(sizeof(*buf_desc)),
890 BUFDESC_SECT_LEN) |
891 HINIC_RQ_CTRL_SET(RQ_COMPLETE_SGE, COMPLETE_FORMAT);
892
893 hinic_set_sge(&cqe_sect->sge, cqe_dma, sizeof(*cqe));
894
895 buf_desc->hi_addr = sge->hi_addr;
896 buf_desc->lo_addr = sge->lo_addr;
897 }
898
899 /**
900 * hinic_rq_update - update pi of the rq
901 * @rq: recv queue
902 * @prod_idx: pi value
903 **/
hinic_rq_update(struct hinic_rq * rq,u16 prod_idx)904 void hinic_rq_update(struct hinic_rq *rq, u16 prod_idx)
905 {
906 *rq->pi_virt_addr = cpu_to_be16(RQ_MASKED_IDX(rq, prod_idx + 1));
907 }
908