1 /*
2  * Copyright 2020 Broadcom
3  *
4  * SPDX-License-Identifier: Apache-2.0
5  */
6 
7 #define DT_DRV_COMPAT brcm_iproc_pax_dma_v1
8 
9 #include <zephyr/arch/cpu.h>
10 #include <zephyr/cache.h>
11 #include <errno.h>
12 #include <zephyr/init.h>
13 #include <zephyr/kernel.h>
14 #include <zephyr/linker/sections.h>
15 #include <soc.h>
16 #include <string.h>
17 #include <zephyr/toolchain.h>
18 #include <zephyr/types.h>
19 #include <zephyr/drivers/dma.h>
20 #include <zephyr/drivers/pcie/endpoint/pcie_ep.h>
21 #include "dma_iproc_pax_v1.h"
22 
23 #define LOG_LEVEL CONFIG_DMA_LOG_LEVEL
24 #include <zephyr/logging/log.h>
25 #include <zephyr/irq.h>
26 LOG_MODULE_REGISTER(dma_iproc_pax);
27 
28 /* Driver runtime data for PAX DMA and RM */
29 static struct dma_iproc_pax_data pax_dma_data;
30 
reset_pkt_id(struct dma_iproc_pax_ring_data * ring)31 static inline uint32_t reset_pkt_id(struct dma_iproc_pax_ring_data *ring)
32 {
33 	return ring->pkt_id = 0x0;
34 }
35 
36 /**
37  * @brief Opaque/packet id allocator, range 0 to 31
38  */
alloc_pkt_id(struct dma_iproc_pax_ring_data * ring)39 static inline uint32_t alloc_pkt_id(struct dma_iproc_pax_ring_data *ring)
40 {
41 	ring->pkt_id = (ring->pkt_id + 1) % 32;
42 	return ring->pkt_id;
43 }
44 
curr_pkt_id(struct dma_iproc_pax_ring_data * ring)45 static inline uint32_t curr_pkt_id(struct dma_iproc_pax_ring_data *ring)
46 {
47 	return ring->pkt_id;
48 }
49 
curr_toggle_val(struct dma_iproc_pax_ring_data * ring)50 static inline uint32_t curr_toggle_val(struct dma_iproc_pax_ring_data *ring)
51 {
52 	return ring->curr.toggle;
53 }
54 
55 /**
56  * @brief Populate header descriptor
57  */
rm_write_header_desc(void * desc,uint32_t toggle,uint32_t opq,uint32_t bdcount)58 static inline void rm_write_header_desc(void *desc, uint32_t toggle,
59 			     uint32_t opq, uint32_t bdcount)
60 {
61 	struct rm_header *r = (struct rm_header *)desc;
62 
63 	r->opq = opq;
64 	/* DMA descriptor count init value */
65 	r->bdcount = bdcount;
66 	r->prot = 0x0;
67 	/* No packet extension, start and end set to '1' */
68 	r->start = 1;
69 	r->end = 1;
70 	r->toggle = toggle;
71 	/* RM header type */
72 	r->type = PAX_DMA_TYPE_RM_HEADER;
73 }
74 
75 /**
76  * @brief Fill RM header descriptor for next transfer
77  *        with invalid toggle
78  */
rm_write_header_next_desc(void * desc,struct dma_iproc_pax_ring_data * r,uint32_t opq,uint32_t bdcount)79 static inline void rm_write_header_next_desc(void *desc,
80 					     struct dma_iproc_pax_ring_data *r,
81 					     uint32_t opq, uint32_t bdcount)
82 {
83 	/* Toggle bit is invalid until next payload configured */
84 	rm_write_header_desc(desc, (r->curr.toggle == 0) ? 1 : 0, opq, bdcount);
85 }
86 
rm_header_set_bd_count(void * desc,uint32_t bdcount)87 static inline void rm_header_set_bd_count(void *desc, uint32_t bdcount)
88 {
89 	struct rm_header *r = (struct rm_header *)desc;
90 
91 	/* DMA descriptor count */
92 	r->bdcount = bdcount;
93 }
94 
rm_header_set_toggle(void * desc,uint32_t toggle)95 static inline void rm_header_set_toggle(void *desc, uint32_t toggle)
96 {
97 	struct rm_header *r = (struct rm_header *)desc;
98 
99 	r->toggle = toggle;
100 }
101 
102 /**
103  * @brief Populate dma header descriptor
104  */
rm_write_dma_header_desc(void * desc,struct dma_iproc_pax_payload * pl)105 static inline void rm_write_dma_header_desc(void *desc,
106 					    struct dma_iproc_pax_payload *pl)
107 {
108 	struct dma_header_desc *hdr = (struct dma_header_desc *)desc;
109 
110 	hdr->length = pl->xfer_sz;
111 	hdr->opcode = pl->direction;
112 	/* DMA header type */
113 	hdr->type = PAX_DMA_TYPE_DMA_DESC;
114 }
115 
116 /**
117  * @brief Populate axi address descriptor
118  */
rm_write_axi_addr_desc(void * desc,struct dma_iproc_pax_payload * pl)119 static inline void rm_write_axi_addr_desc(void *desc,
120 					  struct dma_iproc_pax_payload *pl)
121 {
122 	struct axi_addr_desc *axi = (struct axi_addr_desc *)desc;
123 
124 	axi->axi_addr = pl->axi_addr;
125 	axi->type = PAX_DMA_TYPE_DMA_DESC;
126 
127 }
128 
129 /**
130  * @brief Populate pci address descriptor
131  */
rm_write_pci_addr_desc(void * desc,struct dma_iproc_pax_payload * pl)132 static inline void rm_write_pci_addr_desc(void *desc,
133 					  struct dma_iproc_pax_payload *pl)
134 {
135 	struct pci_addr_desc *pci = (struct pci_addr_desc *)desc;
136 
137 	pci->pcie_addr = pl->pci_addr >> PAX_DMA_PCI_ADDR_ALIGNMT_SHIFT;
138 	pci->type = PAX_DMA_TYPE_DMA_DESC;
139 }
140 
141 /**
142  * @brief Return's pointer to the descriptor memory to be written next,
143  *	  skip next pointer descriptor address.
144  */
next_desc_addr(struct dma_iproc_pax_ring_data * ring)145 static void *next_desc_addr(struct dma_iproc_pax_ring_data *ring)
146 {
147 	struct next_ptr_desc *nxt;
148 	uintptr_t curr;
149 
150 	curr = (uintptr_t)ring->curr.write_ptr + PAX_DMA_RM_DESC_BDWIDTH;
151 	/* if hit next table ptr, skip to next location, flip toggle */
152 	nxt = (struct next_ptr_desc *)curr;
153 	if (nxt->type == PAX_DMA_TYPE_NEXT_PTR) {
154 		LOG_DBG("hit next_ptr@0x%lx:T%d, next_table@0x%lx\n",
155 			curr, nxt->toggle, (uintptr_t)nxt->addr);
156 		uintptr_t last = (uintptr_t)ring->bd +
157 			     PAX_DMA_RM_DESC_RING_SIZE * PAX_DMA_NUM_BD_BUFFS;
158 		ring->curr.toggle = (ring->curr.toggle == 0) ? 1 : 0;
159 		/* move to next addr, wrap around if hits end */
160 		curr += PAX_DMA_RM_DESC_BDWIDTH;
161 		if (curr == last) {
162 			curr = (uintptr_t)ring->bd;
163 			LOG_DBG("hit end of desc:0x%lx, wrap to 0x%lx\n",
164 				last, curr);
165 		}
166 	}
167 	ring->curr.write_ptr = (void *)curr;
168 	return (void *)curr;
169 }
170 
171 /**
172  * @brief Populate next ptr descriptor
173  */
rm_write_next_table_desc(void * desc,void * next_ptr,uint32_t toggle)174 static void rm_write_next_table_desc(void *desc, void *next_ptr,
175 				     uint32_t toggle)
176 {
177 	struct next_ptr_desc *nxt = (struct next_ptr_desc *)desc;
178 
179 	nxt->addr = (uintptr_t)next_ptr;
180 	nxt->type = PAX_DMA_TYPE_NEXT_PTR;
181 	nxt->toggle = toggle;
182 }
183 
prepare_ring(struct dma_iproc_pax_ring_data * ring)184 static void prepare_ring(struct dma_iproc_pax_ring_data *ring)
185 {
186 	uintptr_t curr, next, last;
187 	uint32_t  toggle;
188 	int buff_count = PAX_DMA_NUM_BD_BUFFS;
189 
190 	/* zero out descriptor area */
191 	memset(ring->bd, 0x0, PAX_DMA_RM_DESC_RING_SIZE * PAX_DMA_NUM_BD_BUFFS);
192 	memset(ring->cmpl, 0x0, PAX_DMA_RM_CMPL_RING_SIZE);
193 
194 	/* opaque/packet id value */
195 	rm_write_header_desc(ring->bd, 0x0, reset_pkt_id(ring),
196 			     PAX_DMA_RM_DESC_BDCOUNT);
197 	/* start with first buffer, valid toggle is 0x1 */
198 	toggle = 0x1;
199 	curr = (uintptr_t)ring->bd;
200 	next = curr + PAX_DMA_RM_DESC_RING_SIZE;
201 	last = curr + PAX_DMA_RM_DESC_RING_SIZE * PAX_DMA_NUM_BD_BUFFS;
202 	do {
203 		/* Place next_table desc as last BD entry on each buffer */
204 		rm_write_next_table_desc(PAX_DMA_NEXT_TBL_ADDR((void *)curr),
205 					 (void *)next, toggle);
206 
207 		/* valid toggle flips for each buffer */
208 		toggle = toggle ? 0x0 : 0x1;
209 		curr += PAX_DMA_RM_DESC_RING_SIZE;
210 		next += PAX_DMA_RM_DESC_RING_SIZE;
211 		/* last entry, chain back to first buffer */
212 		if (next == last) {
213 			next = (uintptr_t)ring->bd;
214 		}
215 
216 	} while (--buff_count);
217 
218 	dma_mb();
219 
220 	/* start programming from first RM header */
221 	ring->curr.write_ptr = ring->bd;
222 	/* valid toggle starts with 1 after reset */
223 	ring->curr.toggle = 1;
224 	/* completion read offset */
225 	ring->curr.cmpl_rd_offs = 0;
226 
227 	/* init sync data for the ring */
228 	ring->curr.sync_data.signature = PAX_DMA_WRITE_SYNC_SIGNATURE;
229 	ring->curr.sync_data.ring = ring->idx;
230 	/* pkt id for active dma xfer */
231 	ring->curr.sync_data.opaque = 0x0;
232 	/* pkt count for active dma xfer */
233 	ring->curr.sync_data.total_pkts = 0x0;
234 }
235 
init_rm(struct dma_iproc_pax_data * pd)236 static int init_rm(struct dma_iproc_pax_data *pd)
237 {
238 	int ret = -ETIMEDOUT, timeout = 1000;
239 
240 	k_mutex_lock(&pd->dma_lock, K_FOREVER);
241 	/* Wait for Ring Manager ready */
242 	do {
243 		LOG_DBG("Waiting for RM HW init\n");
244 		if ((sys_read32(RM_COMM_REG(pd, RM_COMM_MAIN_HW_INIT_DONE)) &
245 		    RM_COMM_MAIN_HW_INIT_DONE_MASK)) {
246 			ret = 0;
247 			break;
248 		}
249 		k_sleep(K_MSEC(1));
250 	} while (--timeout);
251 	k_mutex_unlock(&pd->dma_lock);
252 
253 	if (!timeout) {
254 		LOG_WRN("RM HW Init timedout!\n");
255 	} else {
256 		LOG_INF("PAX DMA RM HW Init Done\n");
257 	}
258 
259 	return ret;
260 }
261 
rm_cfg_start(struct dma_iproc_pax_data * pd)262 static void rm_cfg_start(struct dma_iproc_pax_data *pd)
263 {
264 	uint32_t val;
265 
266 	k_mutex_lock(&pd->dma_lock, K_FOREVER);
267 
268 	/* set config done 0, enable toggle mode */
269 	val = sys_read32(RM_COMM_REG(pd, RM_COMM_CONTROL));
270 	val &= ~RM_COMM_CONTROL_CONFIG_DONE;
271 	sys_write32(val, RM_COMM_REG(pd, RM_COMM_CONTROL));
272 
273 	val &= ~(RM_COMM_CONTROL_MODE_MASK << RM_COMM_CONTROL_MODE_SHIFT);
274 	val |= (RM_COMM_CONTROL_MODE_TOGGLE << RM_COMM_CONTROL_MODE_SHIFT);
275 	sys_write32(val, RM_COMM_REG(pd, RM_COMM_CONTROL));
276 
277 	/* Disable MSI */
278 	sys_write32(RM_COMM_MSI_DISABLE_VAL,
279 		    RM_COMM_REG(pd, RM_COMM_MSI_DISABLE));
280 	/* Enable Line interrupt */
281 	val = sys_read32(RM_COMM_REG(pd, RM_COMM_CONTROL));
282 	val |= RM_COMM_CONTROL_LINE_INTR_EN;
283 	sys_write32(val, RM_COMM_REG(pd, RM_COMM_CONTROL));
284 
285 	/* Enable AE_TIMEOUT */
286 	sys_write32(RM_COMM_AE_TIMEOUT_VAL, RM_COMM_REG(pd,
287 							RM_COMM_AE_TIMEOUT));
288 	val = sys_read32(RM_COMM_REG(pd, RM_COMM_CONTROL));
289 	val |= RM_COMM_CONTROL_AE_TIMEOUT_EN;
290 	sys_write32(val, RM_COMM_REG(pd, RM_COMM_CONTROL));
291 
292 	/* AE (Acceleration Engine) grouping to group '0' */
293 	val = sys_read32(RM_COMM_REG(pd, RM_AE0_AE_CONTROL));
294 	val &= ~RM_AE_CTRL_AE_GROUP_MASK;
295 	sys_write32(val, RM_COMM_REG(pd, RM_AE0_AE_CONTROL));
296 	val |= RM_AE_CONTROL_ACTIVE;
297 	sys_write32(val, RM_COMM_REG(pd, RM_AE0_AE_CONTROL));
298 
299 	/* AXI read/write channel enable */
300 	val = sys_read32(RM_COMM_REG(pd, RM_COMM_AXI_CONTROL));
301 	val |= (RM_COMM_AXI_CONTROL_RD_CH_EN | RM_COMM_AXI_CONTROL_WR_CH_EN);
302 	sys_write32(val, RM_COMM_REG(pd, RM_COMM_AXI_CONTROL));
303 
304 	/* Tune RM control programming for 4 rings */
305 	sys_write32(RM_COMM_TIMER_CONTROL0_VAL,
306 		    RM_COMM_REG(pd, RM_COMM_TIMER_CONTROL_0));
307 	sys_write32(RM_COMM_TIMER_CONTROL1_VAL,
308 		    RM_COMM_REG(pd, RM_COMM_TIMER_CONTROL_1));
309 	sys_write32(RM_COMM_RM_BURST_LENGTH,
310 		    RM_COMM_REG(pd, RM_COMM_RM_BURST_LENGTH));
311 
312 	/* Set Sequence max count to the max supported value */
313 	val = sys_read32(RM_COMM_REG(pd, RM_COMM_MASK_SEQUENCE_MAX_COUNT));
314 	val = (val | RING_MASK_SEQ_MAX_COUNT_MASK);
315 	sys_write32(val, RM_COMM_REG(pd, RM_COMM_MASK_SEQUENCE_MAX_COUNT));
316 
317 	k_mutex_unlock(&pd->dma_lock);
318 }
319 
rm_ring_clear_stats(struct dma_iproc_pax_data * pd,enum ring_idx idx)320 static void rm_ring_clear_stats(struct dma_iproc_pax_data *pd,
321 				enum ring_idx idx)
322 {
323 	/* Read ring Tx, Rx, and Outstanding counts to clear */
324 	sys_read32(RM_RING_REG(pd, idx, RING_NUM_REQ_RECV_LS));
325 	sys_read32(RM_RING_REG(pd, idx, RING_NUM_REQ_RECV_MS));
326 	sys_read32(RM_RING_REG(pd, idx, RING_NUM_REQ_TRANS_LS));
327 	sys_read32(RM_RING_REG(pd, idx, RING_NUM_REQ_TRANS_MS));
328 	sys_read32(RM_RING_REG(pd, idx, RING_NUM_REQ_OUTSTAND));
329 }
330 
rm_cfg_finish(struct dma_iproc_pax_data * pd)331 static void rm_cfg_finish(struct dma_iproc_pax_data *pd)
332 {
333 	uint32_t val;
334 
335 	k_mutex_lock(&pd->dma_lock, K_FOREVER);
336 
337 	/* set Ring config done */
338 	val = sys_read32(RM_COMM_REG(pd, RM_COMM_CONTROL));
339 	val |= RM_COMM_CONTROL_CONFIG_DONE;
340 	sys_write32(val,  RM_COMM_REG(pd, RM_COMM_CONTROL));
341 
342 	k_mutex_unlock(&pd->dma_lock);
343 }
344 
345 /* Activate/Deactivate rings */
set_ring_active(struct dma_iproc_pax_data * pd,enum ring_idx idx,bool active)346 static inline void set_ring_active(struct dma_iproc_pax_data *pd,
347 				   enum ring_idx idx,
348 				   bool active)
349 {
350 	uint32_t val;
351 
352 	val = sys_read32(RM_RING_REG(pd, idx, RING_CONTROL));
353 	if (active) {
354 		val |= RING_CONTROL_ACTIVE;
355 	} else {
356 		val &= ~RING_CONTROL_ACTIVE;
357 	}
358 	sys_write32(val, RM_RING_REG(pd, idx, RING_CONTROL));
359 }
360 
init_ring(struct dma_iproc_pax_data * pd,enum ring_idx idx)361 static int init_ring(struct dma_iproc_pax_data *pd, enum ring_idx idx)
362 {
363 	uint32_t val;
364 	uintptr_t desc = (uintptr_t)pd->ring[idx].bd;
365 	uintptr_t cmpl = (uintptr_t)pd->ring[idx].cmpl;
366 	int timeout = 5000, ret = 0;
367 
368 	k_mutex_lock(&pd->dma_lock, K_FOREVER);
369 
370 	/*  Read cmpl write ptr incase previous dma stopped */
371 	sys_read32(RM_RING_REG(pd, idx, RING_CMPL_WRITE_PTR));
372 
373 	/* Inactivate ring */
374 	sys_write32(0x0, RM_RING_REG(pd, idx, RING_CONTROL));
375 
376 	/* Flush ring before loading new descriptor */
377 	sys_write32(RING_CONTROL_FLUSH, RM_RING_REG(pd, idx, RING_CONTROL));
378 	do {
379 		if (sys_read32(RM_RING_REG(pd, idx, RING_FLUSH_DONE)) &
380 		    RING_FLUSH_DONE_MASK) {
381 			break;
382 		}
383 		k_busy_wait(1);
384 	} while (--timeout);
385 
386 	if (!timeout) {
387 		LOG_WRN("Ring %d flush timedout!\n", idx);
388 		ret = -ETIMEDOUT;
389 		goto err;
390 	}
391 
392 	/* clear ring after flush */
393 	sys_write32(0x0, RM_RING_REG(pd, idx, RING_CONTROL));
394 
395 	/* ring group id set to '0' */
396 	val = sys_read32(RM_COMM_REG(pd, RM_COMM_CTRL_REG(idx)));
397 	val &= ~RING_COMM_CTRL_AE_GROUP_MASK;
398 	sys_write32(val, RM_COMM_REG(pd, RM_COMM_CTRL_REG(idx)));
399 
400 	/* DDR update control, set timeout value */
401 	val = RING_DDR_CONTROL_COUNT(RING_DDR_CONTROL_COUNT_VAL) |
402 	      RING_DDR_CONTROL_TIMER(RING_DDR_CONTROL_TIMER_VAL) |
403 	      RING_DDR_CONTROL_ENABLE;
404 
405 	sys_write32(val, RM_RING_REG(pd, idx, RING_CMPL_WR_PTR_DDR_CONTROL));
406 
407 	val = (uint32_t)((uintptr_t)desc >> PAX_DMA_RING_BD_ALIGN_ORDER);
408 	sys_write32(val, RM_RING_REG(pd, idx, RING_BD_START_ADDR));
409 	val = (uint32_t)((uintptr_t)cmpl >> PAX_DMA_RING_CMPL_ALIGN_ORDER);
410 	sys_write32(val, RM_RING_REG(pd, idx, RING_CMPL_START_ADDR));
411 	val = sys_read32(RM_RING_REG(pd, idx, RING_BD_READ_PTR));
412 
413 	/* keep ring inactive after init to avoid BD poll */
414 	set_ring_active(pd, idx, false);
415 	rm_ring_clear_stats(pd, idx);
416 err:
417 	k_mutex_unlock(&pd->dma_lock);
418 
419 	return ret;
420 }
421 
poll_on_write_sync(const struct device * dev,struct dma_iproc_pax_ring_data * ring)422 static int poll_on_write_sync(const struct device *dev,
423 			      struct dma_iproc_pax_ring_data *ring)
424 {
425 	const struct dma_iproc_pax_cfg *cfg = dev->config;
426 	struct dma_iproc_pax_write_sync_data sync_rd, *recv, *sent;
427 	uint64_t pci_addr;
428 	uint32_t *pci32, *axi32;
429 	uint32_t zero_init = 0, timeout = PAX_DMA_MAX_SYNC_WAIT;
430 	int ret;
431 
432 	recv = &sync_rd;
433 	sent = &(ring->curr.sync_data);
434 	/* form host pci sync address */
435 	pci32 = (uint32_t *)&pci_addr;
436 	pci32[0] = ring->sync_pci.addr_lo;
437 	pci32[1] = ring->sync_pci.addr_hi;
438 	axi32 = (uint32_t *)&sync_rd;
439 
440 	do {
441 		ret = pcie_ep_xfer_data_memcpy(cfg->pcie_dev, pci_addr,
442 					       (uintptr_t *)axi32, 4,
443 					       PCIE_OB_LOWMEM, HOST_TO_DEVICE);
444 
445 		if (memcmp((void *)recv, (void *)sent, 4) == 0) {
446 			/* clear the sync word */
447 			ret = pcie_ep_xfer_data_memcpy(cfg->pcie_dev, pci_addr,
448 						       (uintptr_t *)&zero_init,
449 						       4, PCIE_OB_LOWMEM,
450 						       DEVICE_TO_HOST);
451 			dma_mb();
452 			ret = 0;
453 			break;
454 		}
455 		k_busy_wait(1);
456 	} while (--timeout);
457 
458 	if (!timeout) {
459 		LOG_DBG("[ring %d]: not recvd write sync!\n", ring->idx);
460 		ret = -ETIMEDOUT;
461 	}
462 
463 	return ret;
464 }
465 
process_cmpl_event(const struct device * dev,enum ring_idx idx,uint32_t pl_len)466 static int process_cmpl_event(const struct device *dev,
467 			      enum ring_idx idx, uint32_t pl_len)
468 {
469 	struct dma_iproc_pax_data *pd = dev->data;
470 	uint32_t wr_offs, rd_offs, ret = DMA_STATUS_COMPLETE;
471 	struct dma_iproc_pax_ring_data *ring = &(pd->ring[idx]);
472 	struct cmpl_pkt *c;
473 	uint32_t is_outstanding;
474 
475 	/* cmpl read offset, unprocessed cmpl location */
476 	rd_offs = ring->curr.cmpl_rd_offs;
477 
478 	wr_offs = sys_read32(RM_RING_REG(pd, idx,
479 					 RING_CMPL_WRITE_PTR));
480 
481 	/* Update read ptr to "processed" */
482 	ring->curr.cmpl_rd_offs = wr_offs;
483 
484 	/*
485 	 * Ensure consistency of completion descriptor
486 	 * The completion desc is updated by RM via AXI stream
487 	 * CPU need to ensure the memory operations are completed
488 	 * before reading cmpl area, by a "dsb"
489 	 * If Dcache enabled, need to invalidate the cachelines to
490 	 * read updated cmpl desc. The cache API also issues dsb.
491 	 */
492 	dma_mb();
493 
494 	/* Decode cmpl pkt id to verify */
495 	c = (struct cmpl_pkt *)((uintptr_t)ring->cmpl +
496 	    PAX_DMA_CMPL_DESC_SIZE * PAX_DMA_CURR_CMPL_IDX(wr_offs));
497 
498 	LOG_DBG("RING%d WR_PTR:%d opq:%d, rm_status:%x dma_status:%x\n",
499 		idx, wr_offs, c->opq, c->rm_status, c->dma_status);
500 
501 	is_outstanding = sys_read32(RM_RING_REG(pd, idx,
502 						RING_NUM_REQ_OUTSTAND));
503 	if ((ring->curr.opq != c->opq) && (is_outstanding != 0)) {
504 		LOG_ERR("RING%d: pkt id should be %d, rcvd %d outst=%d\n",
505 			idx, ring->curr.opq, c->opq, is_outstanding);
506 		ret = -EIO;
507 	}
508 	/* check for completion AE timeout */
509 	if (c->rm_status == RM_COMPLETION_AE_TIMEOUT) {
510 		LOG_ERR("RING%d WR_PTR:%d rm_status:%x AE Timeout!\n",
511 			idx, wr_offs, c->rm_status);
512 		/* TBD: Issue full card reset to restore operations */
513 		LOG_ERR("Needs Card Reset to recover!\n");
514 		ret = -ETIMEDOUT;
515 	}
516 
517 	if (ring->dma_callback) {
518 		ring->dma_callback(dev, ring->callback_arg, idx, ret);
519 	}
520 
521 	return ret;
522 }
523 
524 #ifdef CONFIG_DMA_IPROC_PAX_POLL_MODE
peek_ring_cmpl(const struct device * dev,enum ring_idx idx,uint32_t pl_len)525 static int peek_ring_cmpl(const struct device *dev,
526 			  enum ring_idx idx, uint32_t pl_len)
527 {
528 	struct dma_iproc_pax_data *pd = dev->data;
529 	uint32_t wr_offs, rd_offs, timeout = PAX_DMA_MAX_POLL_WAIT;
530 	struct dma_iproc_pax_ring_data *ring = &(pd->ring[idx]);
531 
532 	/* cmpl read offset, unprocessed cmpl location */
533 	rd_offs = ring->curr.cmpl_rd_offs;
534 
535 	/* poll write_ptr until cmpl received for all buffers */
536 	do {
537 		wr_offs = sys_read32(RM_RING_REG(pd, idx,
538 						 RING_CMPL_WRITE_PTR));
539 		if (PAX_DMA_GET_CMPL_COUNT(wr_offs, rd_offs) >= pl_len) {
540 			break;
541 		}
542 		k_busy_wait(1);
543 	} while (--timeout);
544 
545 	if (timeout == 0) {
546 		LOG_ERR("RING%d timeout, rcvd %d, expected %d!\n",
547 			idx, PAX_DMA_GET_CMPL_COUNT(wr_offs, rd_offs), pl_len);
548 		/* More debug info on current dma instance */
549 		LOG_ERR("WR_PTR:%x RD_PTR%x\n", wr_offs, rd_offs);
550 		return  -ETIMEDOUT;
551 	}
552 
553 	return process_cmpl_event(dev, idx, pl_len);
554 }
555 #else
rm_isr(const struct device * dev)556 static void rm_isr(const struct device *dev)
557 {
558 	uint32_t status, err_stat, idx;
559 	struct dma_iproc_pax_data *pd = dev->data;
560 
561 	/* read and clear interrupt status */
562 	status = sys_read32(RM_COMM_REG(pd, RM_COMM_MSI_INTR_INTERRUPT_STATUS));
563 	sys_write32(status, RM_COMM_REG(pd,
564 					RM_COMM_MSI_INTERRUPT_STATUS_CLEAR));
565 
566 	/* read and clear DME/AE error interrupts */
567 	err_stat = sys_read32(RM_COMM_REG(pd,
568 					  RM_COMM_DME_INTERRUPT_STATUS_MASK));
569 	sys_write32(err_stat,
570 		    RM_COMM_REG(pd, RM_COMM_DME_INTERRUPT_STATUS_CLEAR));
571 	err_stat =
572 	sys_read32(RM_COMM_REG(pd,
573 			       RM_COMM_AE_INTERFACE_GROUP_0_INTERRUPT_MASK));
574 	sys_write32(err_stat,
575 		    RM_COMM_REG(pd,
576 				RM_COMM_AE_INTERFACE_GROUP_0_INTERRUPT_CLEAR));
577 
578 	/* alert waiting thread to process, for each completed ring */
579 	for (idx = PAX_DMA_RING0; idx < PAX_DMA_RINGS_MAX; idx++) {
580 		if (status & (0x1 << idx)) {
581 			k_sem_give(&pd->ring[idx].alert);
582 		}
583 	}
584 }
585 #endif
586 
dma_iproc_pax_init(const struct device * dev)587 static int dma_iproc_pax_init(const struct device *dev)
588 {
589 	const struct dma_iproc_pax_cfg *cfg = dev->config;
590 	struct dma_iproc_pax_data *pd = dev->data;
591 	int r;
592 	uintptr_t mem_aligned;
593 
594 	if (!device_is_ready(cfg->pcie_dev)) {
595 		LOG_ERR("PCIe device not ready");
596 		return -ENODEV;
597 	}
598 
599 	pd->dma_base = cfg->dma_base;
600 	pd->rm_comm_base = cfg->rm_comm_base;
601 	pd->used_rings = (cfg->use_rings < PAX_DMA_RINGS_MAX) ?
602 			 cfg->use_rings : PAX_DMA_RINGS_MAX;
603 
604 	LOG_DBG("dma base:0x%x, rm comm base:0x%x, needed rings %d\n",
605 		pd->dma_base, pd->rm_comm_base, pd->used_rings);
606 
607 	/* dma/rm access lock */
608 	k_mutex_init(&pd->dma_lock);
609 
610 	/* Ring Manager H/W init */
611 	if (init_rm(pd)) {
612 		return -ETIMEDOUT;
613 	}
614 
615 	/* common rm config */
616 	rm_cfg_start(pd);
617 
618 	/* individual ring config */
619 	for (r = 0; r < pd->used_rings; r++) {
620 		/* per-ring mutex lock */
621 		k_mutex_init(&pd->ring[r].lock);
622 		/* Init alerts */
623 		k_sem_init(&pd->ring[r].alert, 0, 1);
624 
625 		pd->ring[r].idx = r;
626 		pd->ring[r].ring_base = cfg->rm_base +
627 					PAX_DMA_RING_ADDR_OFFSET(r);
628 		LOG_DBG("RING%d,VERSION:0x%x\n", pd->ring[r].idx,
629 			sys_read32(RM_RING_REG(pd, r, RING_VER)));
630 
631 		/* Allocate for 2 BD buffers + cmpl buffer + payload struct */
632 		pd->ring[r].ring_mem = (void *)((uintptr_t)cfg->bd_memory_base +
633 						r *
634 						PAX_DMA_PER_RING_ALLOC_SIZE);
635 		if (!pd->ring[r].ring_mem) {
636 			LOG_ERR("RING%d failed to alloc desc memory!\n", r);
637 			return -ENOMEM;
638 		}
639 		/* Find 8K aligned address within allocated region */
640 		mem_aligned = ((uintptr_t)pd->ring[r].ring_mem +
641 			       PAX_DMA_RING_ALIGN - 1) &
642 			       ~(PAX_DMA_RING_ALIGN - 1);
643 
644 		pd->ring[r].cmpl = (void *)mem_aligned;
645 		pd->ring[r].bd = (void *)(mem_aligned +
646 					  PAX_DMA_RM_CMPL_RING_SIZE);
647 		pd->ring[r].payload = (void *)((uintptr_t)pd->ring[r].bd +
648 				      PAX_DMA_RM_DESC_RING_SIZE *
649 				      PAX_DMA_NUM_BD_BUFFS);
650 
651 		LOG_DBG("Ring%d,allocated Mem:0x%p Size %d\n",
652 			pd->ring[r].idx,
653 			pd->ring[r].ring_mem,
654 			PAX_DMA_PER_RING_ALLOC_SIZE);
655 		LOG_DBG("Ring%d,BD:0x%p, CMPL:0x%p, PL:0x%p\n",
656 			pd->ring[r].idx,
657 			pd->ring[r].bd,
658 			pd->ring[r].cmpl,
659 			pd->ring[r].payload);
660 
661 		/* Prepare ring desc table */
662 		prepare_ring(&(pd->ring[r]));
663 
664 		/* initialize ring */
665 		init_ring(pd, r);
666 	}
667 
668 	/* set ring config done */
669 	rm_cfg_finish(pd);
670 
671 #ifndef CONFIG_DMA_IPROC_PAX_POLL_MODE
672 	/* Register and enable RM interrupt */
673 	IRQ_CONNECT(DT_INST_IRQN(0),
674 		    DT_INST_IRQ(0, priority),
675 		    rm_isr,
676 		    DEVICE_DT_INST_GET(0),
677 		    0);
678 	irq_enable(DT_INST_IRQN(0));
679 #else
680 	LOG_INF("%s PAX DMA rings in poll mode!\n", dev->name);
681 #endif
682 	LOG_INF("%s RM setup %d rings\n", dev->name, pd->used_rings);
683 
684 	return 0;
685 }
686 
687 #ifdef CONFIG_DMA_IPROC_PAX_POLL_MODE
set_pkt_count(const struct device * dev,enum ring_idx idx,uint32_t pl_len)688 static void set_pkt_count(const struct device *dev,
689 			  enum ring_idx idx,
690 			  uint32_t pl_len)
691 {
692 	/* Nothing needs to be programmed here in poll mode */
693 }
694 
wait_for_pkt_completion(const struct device * dev,enum ring_idx idx,uint32_t pl_len)695 static int wait_for_pkt_completion(const struct device *dev,
696 				   enum ring_idx idx,
697 				   uint32_t pl_len)
698 {
699 	/* poll for completion */
700 	return peek_ring_cmpl(dev, idx, pl_len + 1);
701 }
702 #else
set_pkt_count(const struct device * dev,enum ring_idx idx,uint32_t pl_len)703 static void set_pkt_count(const struct device *dev,
704 			  enum ring_idx idx,
705 			  uint32_t pl_len)
706 {
707 	struct dma_iproc_pax_data *pd = dev->data;
708 	uint32_t val;
709 
710 	/* program packet count for interrupt assertion */
711 	val = sys_read32(RM_RING_REG(pd, idx,
712 				     RING_CMPL_WR_PTR_DDR_CONTROL));
713 	val &= ~RING_DDR_CONTROL_COUNT_MASK;
714 	val |= RING_DDR_CONTROL_COUNT(pl_len);
715 	sys_write32(val, RM_RING_REG(pd, idx,
716 				     RING_CMPL_WR_PTR_DDR_CONTROL));
717 }
718 
wait_for_pkt_completion(const struct device * dev,enum ring_idx idx,uint32_t pl_len)719 static int wait_for_pkt_completion(const struct device *dev,
720 				   enum ring_idx idx,
721 				   uint32_t pl_len)
722 {
723 	struct dma_iproc_pax_data *pd = dev->data;
724 	struct dma_iproc_pax_ring_data *ring;
725 
726 	ring = &(pd->ring[idx]);
727 
728 	/* wait for sg dma completion alert */
729 	if (k_sem_take(&ring->alert, K_MSEC(PAX_DMA_TIMEOUT)) != 0) {
730 		LOG_ERR("PAX DMA [ring %d] Timeout!\n", idx);
731 		return -ETIMEDOUT;
732 	}
733 
734 	return process_cmpl_event(dev, idx, pl_len);
735 }
736 #endif
737 
dma_iproc_pax_do_xfer(const struct device * dev,enum ring_idx idx,struct dma_iproc_pax_payload * pl,uint32_t pl_len)738 static int dma_iproc_pax_do_xfer(const struct device *dev,
739 				 enum ring_idx idx,
740 				 struct dma_iproc_pax_payload *pl,
741 				 uint32_t pl_len)
742 {
743 	struct dma_iproc_pax_data *pd = dev->data;
744 	const struct dma_iproc_pax_cfg *cfg = dev->config;
745 	int ret = 0, cnt;
746 	struct dma_iproc_pax_ring_data *ring;
747 	void *hdr;
748 	uint32_t toggle_bit;
749 	struct dma_iproc_pax_payload sync_pl;
750 	struct dma_iproc_pax_addr64 sync;
751 
752 	ring = &(pd->ring[idx]);
753 	pl = ring->payload;
754 
755 	/*
756 	 * Host sync buffer isn't ready at zephyr/driver init-time
757 	 * Read the host address location once at first DMA write
758 	 * on that ring.
759 	 */
760 	if ((ring->sync_pci.addr_lo == 0x0) &&
761 	    (ring->sync_pci.addr_hi == 0x0)) {
762 		/* populate sync data location */
763 		LOG_DBG("sync addr loc 0x%x\n", cfg->scr_addr_loc);
764 
765 		sync.addr_lo = sys_read32(cfg->scr_addr_loc
766 					  + 4);
767 		sync.addr_hi = sys_read32(cfg->scr_addr_loc);
768 		ring->sync_pci.addr_lo = sync.addr_lo + idx * 4;
769 		ring->sync_pci.addr_hi = sync.addr_hi;
770 		LOG_DBG("ring:%d,sync addr:0x%x.0x%x\n", idx,
771 			ring->sync_pci.addr_hi,
772 			ring->sync_pci.addr_lo);
773 	}
774 
775 	/* account extra sync packet */
776 	ring->curr.sync_data.opaque = ring->curr.opq;
777 	ring->curr.sync_data.total_pkts = pl_len;
778 	memcpy((void *)&ring->sync_loc,
779 	       (void *)&(ring->curr.sync_data), 4);
780 	sync_pl.pci_addr = ring->sync_pci.addr_lo |
781 			   (uint64_t)ring->sync_pci.addr_hi << 32;
782 	sync_pl.axi_addr = (uintptr_t)&ring->sync_loc;
783 
784 	sync_pl.xfer_sz = 4; /* 4-bytes */
785 	sync_pl.direction = CARD_TO_HOST;
786 
787 	/* Get descriptor write pointer for first header */
788 	hdr = (void *)ring->curr.write_ptr;
789 	/* current toggle bit */
790 	toggle_bit = ring->curr.toggle;
791 	/* current opq value for cmpl check */
792 	ring->curr.opq = curr_pkt_id(ring);
793 
794 	/* DMA desc count for first payload */
795 	rm_header_set_bd_count(hdr, PAX_DMA_RM_DESC_BDCOUNT);
796 
797 	/* Form dma descriptors for total sg payload */
798 	for (cnt = 0; cnt < pl_len; cnt++) {
799 		rm_write_dma_header_desc(next_desc_addr(ring), pl + cnt);
800 		rm_write_axi_addr_desc(next_desc_addr(ring), pl + cnt);
801 		rm_write_pci_addr_desc(next_desc_addr(ring), pl + cnt);
802 		/* Toggle may flip, program updated toggle value */
803 		rm_write_header_desc(next_desc_addr(ring),
804 				     curr_toggle_val(ring),
805 				     curr_pkt_id(ring),
806 				     PAX_DMA_RM_DESC_BDCOUNT);
807 	}
808 
809 	/* Append write sync payload descriptors */
810 	rm_write_dma_header_desc(next_desc_addr(ring), &sync_pl);
811 	rm_write_axi_addr_desc(next_desc_addr(ring), &sync_pl);
812 	rm_write_pci_addr_desc(next_desc_addr(ring), &sync_pl);
813 
814 	/* RM header for next transfer, RM wait on (invalid) toggle bit */
815 	rm_write_header_next_desc(next_desc_addr(ring), ring, alloc_pkt_id(ring),
816 		       PAX_DMA_RM_DESC_BDCOUNT);
817 
818 	set_pkt_count(dev, idx, pl_len + 1);
819 
820 	/* Ensure memory write before toggle flip */
821 	dma_mb();
822 
823 	/* set toggle to valid in first header */
824 	rm_header_set_toggle(hdr, toggle_bit);
825 	/* activate the ring */
826 	set_ring_active(pd, idx, true);
827 
828 	ret = wait_for_pkt_completion(dev, idx, pl_len + 1);
829 	if (ret) {
830 		goto err_ret;
831 	}
832 
833 	ret = poll_on_write_sync(dev, ring);
834 	k_mutex_lock(&ring->lock, K_FOREVER);
835 	ring->ring_active = 0;
836 	k_mutex_unlock(&ring->lock);
837 
838 err_ret:
839 	ring->ring_active = 0;
840 	/* deactivate the ring until next active transfer */
841 	set_ring_active(pd, idx, false);
842 
843 	return ret;
844 }
845 
dma_iproc_pax_configure(const struct device * dev,uint32_t channel,struct dma_config * cfg)846 static int dma_iproc_pax_configure(const struct device *dev, uint32_t channel,
847 				   struct dma_config *cfg)
848 {
849 	struct dma_iproc_pax_data *pd = dev->data;
850 	struct dma_iproc_pax_ring_data *ring;
851 	uint32_t xfer_sz;
852 	int ret = 0;
853 #ifdef CONFIG_DMA_IPROC_PAX_DEBUG
854 	uint32_t *pci_addr32;
855 	uint32_t *axi_addr32;
856 #endif
857 
858 	if (channel >= PAX_DMA_RINGS_MAX) {
859 		LOG_ERR("Invalid ring/channel %d\n", channel);
860 		return -EINVAL;
861 	}
862 
863 	ring = &(pd->ring[channel]);
864 	k_mutex_lock(&ring->lock, K_FOREVER);
865 
866 	if (cfg->block_count > 1) {
867 		/* Scatter/gather list handling is not supported */
868 		ret = -ENOTSUP;
869 		goto err;
870 	}
871 
872 	if (ring->ring_active) {
873 		ret = -EBUSY;
874 		goto err;
875 	}
876 
877 	ring->ring_active = 1;
878 
879 	if (cfg->channel_direction == MEMORY_TO_PERIPHERAL) {
880 #ifdef CONFIG_DMA_IPROC_PAX_DEBUG
881 		axi_addr32 = (uint32_t *)&cfg->head_block->source_address;
882 		pci_addr32 = (uint32_t *)&cfg->head_block->dest_address;
883 #endif
884 		ring->payload->direction = CARD_TO_HOST;
885 		ring->payload->pci_addr = cfg->head_block->dest_address;
886 		ring->payload->axi_addr = cfg->head_block->source_address;
887 	} else if (cfg->channel_direction == PERIPHERAL_TO_MEMORY) {
888 #ifdef CONFIG_DMA_IPROC_PAX_DEBUG
889 		axi_addr32 = (uint32_t *)&cfg->head_block->dest_address;
890 		pci_addr32 = (uint32_t *)&cfg->head_block->source_address;
891 #endif
892 		ring->payload->direction = HOST_TO_CARD;
893 		ring->payload->pci_addr = cfg->head_block->source_address;
894 		ring->payload->axi_addr = cfg->head_block->dest_address;
895 	} else {
896 		ring->ring_active = 0;
897 		ret = -ENOTSUP;
898 		goto err;
899 	}
900 
901 	xfer_sz = cfg->head_block->block_size;
902 
903 #ifdef CONFIG_DMA_IPROC_PAX_DEBUG
904 	if (xfer_sz > PAX_DMA_MAX_SIZE) {
905 		LOG_ERR("Unsupported size: %d\n", xfer_size);
906 		ring->ring_active = 0;
907 		ret = -EINVAL;
908 		goto err;
909 	}
910 
911 	if (xfer_sz % PAX_DMA_MIN_SIZE) {
912 		LOG_ERR("Unaligned size 0x%x\n", xfer_size);
913 		ring->ring_active = 0;
914 		ret = -EINVAL;
915 		goto err;
916 	}
917 
918 	if (pci_addr32[0] % PAX_DMA_ADDR_ALIGN) {
919 		LOG_ERR("Unaligned Host addr: 0x%x.0x%x\n",
920 			pci_addr32[1], pci_addr32[0]);
921 		ring->ring_active = 0;
922 		ret = -EINVAL;
923 		goto err;
924 	}
925 
926 	if (axi_addr32[0] % PAX_DMA_ADDR_ALIGN) {
927 		LOG_ERR("Unaligned Card addr: 0x%x.0x%x\n",
928 			axi_addr32[1], axi_addr32[0]);
929 		ring->ring_active = 0;
930 		ret = -EINVAL;
931 		goto err;
932 	}
933 #endif
934 	ring->payload->xfer_sz = xfer_sz;
935 
936 	ring->dma_callback = cfg->dma_callback;
937 	ring->callback_arg = cfg->user_data;
938 err:
939 	k_mutex_unlock(&ring->lock);
940 
941 	return ret;
942 }
943 
dma_iproc_pax_transfer_start(const struct device * dev,uint32_t channel)944 static int dma_iproc_pax_transfer_start(const struct device *dev,
945 					uint32_t channel)
946 {
947 	int ret = 0;
948 	struct dma_iproc_pax_data *pd = dev->data;
949 	struct dma_iproc_pax_ring_data *ring;
950 
951 	if (channel >= PAX_DMA_RINGS_MAX) {
952 		LOG_ERR("Invalid ring %d\n", channel);
953 		return -EINVAL;
954 	}
955 	ring = &(pd->ring[channel]);
956 	/* do dma transfer of single buffer */
957 	ret = dma_iproc_pax_do_xfer(dev, channel, ring->payload, 1);
958 
959 	return ret;
960 }
961 
dma_iproc_pax_transfer_stop(const struct device * dev,uint32_t channel)962 static int dma_iproc_pax_transfer_stop(const struct device *dev,
963 				       uint32_t channel)
964 {
965 	return 0;
966 }
967 
968 static DEVICE_API(dma, pax_dma_driver_api) = {
969 	.config = dma_iproc_pax_configure,
970 	.start = dma_iproc_pax_transfer_start,
971 	.stop = dma_iproc_pax_transfer_stop,
972 };
973 
974 static const struct dma_iproc_pax_cfg pax_dma_cfg = {
975 	.dma_base = DT_INST_REG_ADDR_BY_NAME(0, dme_regs),
976 	.rm_base = DT_INST_REG_ADDR_BY_NAME(0, rm_ring_regs),
977 	.rm_comm_base = DT_INST_REG_ADDR_BY_NAME(0, rm_comm_regs),
978 	.use_rings = DT_INST_PROP(0, dma_channels),
979 	.bd_memory_base = (void *)DT_INST_PROP_BY_IDX(0, bd_memory, 0),
980 	.scr_addr_loc = DT_INST_PROP(0, scr_addr_loc),
981 	.pcie_dev = DEVICE_DT_GET(DT_INST_PHANDLE(0, pcie_ep)),
982 };
983 
984 DEVICE_DT_INST_DEFINE(0,
985 		    &dma_iproc_pax_init,
986 		    NULL,
987 		    &pax_dma_data,
988 		    &pax_dma_cfg,
989 		    POST_KERNEL,
990 		    CONFIG_DMA_INIT_PRIORITY,
991 		    &pax_dma_driver_api);
992