1 // SPDX-License-Identifier: GPL-2.0
2 /*
3 * Copyright (C) 2014-2018 Etnaviv Project
4 */
5
6 #include "etnaviv_cmdbuf.h"
7 #include "etnaviv_gpu.h"
8 #include "etnaviv_gem.h"
9 #include "etnaviv_mmu.h"
10
11 #include "common.xml.h"
12 #include "state.xml.h"
13 #include "state_hi.xml.h"
14 #include "state_3d.xml.h"
15 #include "cmdstream.xml.h"
16
17 /*
18 * Command Buffer helper:
19 */
20
21
OUT(struct etnaviv_cmdbuf * buffer,u32 data)22 static inline void OUT(struct etnaviv_cmdbuf *buffer, u32 data)
23 {
24 u32 *vaddr = (u32 *)buffer->vaddr;
25
26 BUG_ON(buffer->user_size >= buffer->size);
27
28 vaddr[buffer->user_size / 4] = data;
29 buffer->user_size += 4;
30 }
31
CMD_LOAD_STATE(struct etnaviv_cmdbuf * buffer,u32 reg,u32 value)32 static inline void CMD_LOAD_STATE(struct etnaviv_cmdbuf *buffer,
33 u32 reg, u32 value)
34 {
35 u32 index = reg >> VIV_FE_LOAD_STATE_HEADER_OFFSET__SHR;
36
37 buffer->user_size = ALIGN(buffer->user_size, 8);
38
39 /* write a register via cmd stream */
40 OUT(buffer, VIV_FE_LOAD_STATE_HEADER_OP_LOAD_STATE |
41 VIV_FE_LOAD_STATE_HEADER_COUNT(1) |
42 VIV_FE_LOAD_STATE_HEADER_OFFSET(index));
43 OUT(buffer, value);
44 }
45
CMD_END(struct etnaviv_cmdbuf * buffer)46 static inline void CMD_END(struct etnaviv_cmdbuf *buffer)
47 {
48 buffer->user_size = ALIGN(buffer->user_size, 8);
49
50 OUT(buffer, VIV_FE_END_HEADER_OP_END);
51 }
52
CMD_WAIT(struct etnaviv_cmdbuf * buffer)53 static inline void CMD_WAIT(struct etnaviv_cmdbuf *buffer)
54 {
55 buffer->user_size = ALIGN(buffer->user_size, 8);
56
57 OUT(buffer, VIV_FE_WAIT_HEADER_OP_WAIT | 200);
58 }
59
CMD_LINK(struct etnaviv_cmdbuf * buffer,u16 prefetch,u32 address)60 static inline void CMD_LINK(struct etnaviv_cmdbuf *buffer,
61 u16 prefetch, u32 address)
62 {
63 buffer->user_size = ALIGN(buffer->user_size, 8);
64
65 OUT(buffer, VIV_FE_LINK_HEADER_OP_LINK |
66 VIV_FE_LINK_HEADER_PREFETCH(prefetch));
67 OUT(buffer, address);
68 }
69
CMD_STALL(struct etnaviv_cmdbuf * buffer,u32 from,u32 to)70 static inline void CMD_STALL(struct etnaviv_cmdbuf *buffer,
71 u32 from, u32 to)
72 {
73 buffer->user_size = ALIGN(buffer->user_size, 8);
74
75 OUT(buffer, VIV_FE_STALL_HEADER_OP_STALL);
76 OUT(buffer, VIV_FE_STALL_TOKEN_FROM(from) | VIV_FE_STALL_TOKEN_TO(to));
77 }
78
CMD_SEM(struct etnaviv_cmdbuf * buffer,u32 from,u32 to)79 static inline void CMD_SEM(struct etnaviv_cmdbuf *buffer, u32 from, u32 to)
80 {
81 CMD_LOAD_STATE(buffer, VIVS_GL_SEMAPHORE_TOKEN,
82 VIVS_GL_SEMAPHORE_TOKEN_FROM(from) |
83 VIVS_GL_SEMAPHORE_TOKEN_TO(to));
84 }
85
etnaviv_cmd_select_pipe(struct etnaviv_gpu * gpu,struct etnaviv_cmdbuf * buffer,u8 pipe)86 static void etnaviv_cmd_select_pipe(struct etnaviv_gpu *gpu,
87 struct etnaviv_cmdbuf *buffer, u8 pipe)
88 {
89 u32 flush = 0;
90
91 lockdep_assert_held(&gpu->lock);
92
93 /*
94 * This assumes that if we're switching to 2D, we're switching
95 * away from 3D, and vice versa. Hence, if we're switching to
96 * the 2D core, we need to flush the 3D depth and color caches,
97 * otherwise we need to flush the 2D pixel engine cache.
98 */
99 if (gpu->exec_state == ETNA_PIPE_2D)
100 flush = VIVS_GL_FLUSH_CACHE_PE2D;
101 else if (gpu->exec_state == ETNA_PIPE_3D)
102 flush = VIVS_GL_FLUSH_CACHE_DEPTH | VIVS_GL_FLUSH_CACHE_COLOR;
103
104 CMD_LOAD_STATE(buffer, VIVS_GL_FLUSH_CACHE, flush);
105 CMD_SEM(buffer, SYNC_RECIPIENT_FE, SYNC_RECIPIENT_PE);
106 CMD_STALL(buffer, SYNC_RECIPIENT_FE, SYNC_RECIPIENT_PE);
107
108 CMD_LOAD_STATE(buffer, VIVS_GL_PIPE_SELECT,
109 VIVS_GL_PIPE_SELECT_PIPE(pipe));
110 }
111
etnaviv_buffer_dump(struct etnaviv_gpu * gpu,struct etnaviv_cmdbuf * buf,u32 off,u32 len)112 static void etnaviv_buffer_dump(struct etnaviv_gpu *gpu,
113 struct etnaviv_cmdbuf *buf, u32 off, u32 len)
114 {
115 u32 size = buf->size;
116 u32 *ptr = buf->vaddr + off;
117
118 dev_info(gpu->dev, "virt %p phys 0x%08x free 0x%08x\n",
119 ptr, etnaviv_cmdbuf_get_va(buf) + off, size - len * 4 - off);
120
121 print_hex_dump(KERN_INFO, "cmd ", DUMP_PREFIX_OFFSET, 16, 4,
122 ptr, len * 4, 0);
123 }
124
125 /*
126 * Safely replace the WAIT of a waitlink with a new command and argument.
127 * The GPU may be executing this WAIT while we're modifying it, so we have
128 * to write it in a specific order to avoid the GPU branching to somewhere
129 * else. 'wl_offset' is the offset to the first byte of the WAIT command.
130 */
etnaviv_buffer_replace_wait(struct etnaviv_cmdbuf * buffer,unsigned int wl_offset,u32 cmd,u32 arg)131 static void etnaviv_buffer_replace_wait(struct etnaviv_cmdbuf *buffer,
132 unsigned int wl_offset, u32 cmd, u32 arg)
133 {
134 u32 *lw = buffer->vaddr + wl_offset;
135
136 lw[1] = arg;
137 mb();
138 lw[0] = cmd;
139 mb();
140 }
141
142 /*
143 * Ensure that there is space in the command buffer to contiguously write
144 * 'cmd_dwords' 64-bit words into the buffer, wrapping if necessary.
145 */
etnaviv_buffer_reserve(struct etnaviv_gpu * gpu,struct etnaviv_cmdbuf * buffer,unsigned int cmd_dwords)146 static u32 etnaviv_buffer_reserve(struct etnaviv_gpu *gpu,
147 struct etnaviv_cmdbuf *buffer, unsigned int cmd_dwords)
148 {
149 if (buffer->user_size + cmd_dwords * sizeof(u64) > buffer->size)
150 buffer->user_size = 0;
151
152 return etnaviv_cmdbuf_get_va(buffer) + buffer->user_size;
153 }
154
etnaviv_buffer_init(struct etnaviv_gpu * gpu)155 u16 etnaviv_buffer_init(struct etnaviv_gpu *gpu)
156 {
157 struct etnaviv_cmdbuf *buffer = &gpu->buffer;
158
159 lockdep_assert_held(&gpu->lock);
160
161 /* initialize buffer */
162 buffer->user_size = 0;
163
164 CMD_WAIT(buffer);
165 CMD_LINK(buffer, 2, etnaviv_cmdbuf_get_va(buffer) +
166 buffer->user_size - 4);
167
168 return buffer->user_size / 8;
169 }
170
etnaviv_buffer_config_mmuv2(struct etnaviv_gpu * gpu,u32 mtlb_addr,u32 safe_addr)171 u16 etnaviv_buffer_config_mmuv2(struct etnaviv_gpu *gpu, u32 mtlb_addr, u32 safe_addr)
172 {
173 struct etnaviv_cmdbuf *buffer = &gpu->buffer;
174
175 lockdep_assert_held(&gpu->lock);
176
177 buffer->user_size = 0;
178
179 if (gpu->identity.features & chipFeatures_PIPE_3D) {
180 CMD_LOAD_STATE(buffer, VIVS_GL_PIPE_SELECT,
181 VIVS_GL_PIPE_SELECT_PIPE(ETNA_PIPE_3D));
182 CMD_LOAD_STATE(buffer, VIVS_MMUv2_CONFIGURATION,
183 mtlb_addr | VIVS_MMUv2_CONFIGURATION_MODE_MODE4_K);
184 CMD_LOAD_STATE(buffer, VIVS_MMUv2_SAFE_ADDRESS, safe_addr);
185 CMD_SEM(buffer, SYNC_RECIPIENT_FE, SYNC_RECIPIENT_PE);
186 CMD_STALL(buffer, SYNC_RECIPIENT_FE, SYNC_RECIPIENT_PE);
187 }
188
189 if (gpu->identity.features & chipFeatures_PIPE_2D) {
190 CMD_LOAD_STATE(buffer, VIVS_GL_PIPE_SELECT,
191 VIVS_GL_PIPE_SELECT_PIPE(ETNA_PIPE_2D));
192 CMD_LOAD_STATE(buffer, VIVS_MMUv2_CONFIGURATION,
193 mtlb_addr | VIVS_MMUv2_CONFIGURATION_MODE_MODE4_K);
194 CMD_LOAD_STATE(buffer, VIVS_MMUv2_SAFE_ADDRESS, safe_addr);
195 CMD_SEM(buffer, SYNC_RECIPIENT_FE, SYNC_RECIPIENT_PE);
196 CMD_STALL(buffer, SYNC_RECIPIENT_FE, SYNC_RECIPIENT_PE);
197 }
198
199 CMD_END(buffer);
200
201 buffer->user_size = ALIGN(buffer->user_size, 8);
202
203 return buffer->user_size / 8;
204 }
205
etnaviv_buffer_config_pta(struct etnaviv_gpu * gpu)206 u16 etnaviv_buffer_config_pta(struct etnaviv_gpu *gpu)
207 {
208 struct etnaviv_cmdbuf *buffer = &gpu->buffer;
209
210 lockdep_assert_held(&gpu->lock);
211
212 buffer->user_size = 0;
213
214 CMD_LOAD_STATE(buffer, VIVS_MMUv2_PTA_CONFIG,
215 VIVS_MMUv2_PTA_CONFIG_INDEX(0));
216
217 CMD_END(buffer);
218
219 buffer->user_size = ALIGN(buffer->user_size, 8);
220
221 return buffer->user_size / 8;
222 }
223
etnaviv_buffer_end(struct etnaviv_gpu * gpu)224 void etnaviv_buffer_end(struct etnaviv_gpu *gpu)
225 {
226 struct etnaviv_cmdbuf *buffer = &gpu->buffer;
227 unsigned int waitlink_offset = buffer->user_size - 16;
228 u32 link_target, flush = 0;
229
230 lockdep_assert_held(&gpu->lock);
231
232 if (gpu->exec_state == ETNA_PIPE_2D)
233 flush = VIVS_GL_FLUSH_CACHE_PE2D;
234 else if (gpu->exec_state == ETNA_PIPE_3D)
235 flush = VIVS_GL_FLUSH_CACHE_DEPTH |
236 VIVS_GL_FLUSH_CACHE_COLOR |
237 VIVS_GL_FLUSH_CACHE_TEXTURE |
238 VIVS_GL_FLUSH_CACHE_TEXTUREVS |
239 VIVS_GL_FLUSH_CACHE_SHADER_L2;
240
241 if (flush) {
242 unsigned int dwords = 7;
243
244 link_target = etnaviv_buffer_reserve(gpu, buffer, dwords);
245
246 CMD_SEM(buffer, SYNC_RECIPIENT_FE, SYNC_RECIPIENT_PE);
247 CMD_STALL(buffer, SYNC_RECIPIENT_FE, SYNC_RECIPIENT_PE);
248 CMD_LOAD_STATE(buffer, VIVS_GL_FLUSH_CACHE, flush);
249 if (gpu->exec_state == ETNA_PIPE_3D)
250 CMD_LOAD_STATE(buffer, VIVS_TS_FLUSH_CACHE,
251 VIVS_TS_FLUSH_CACHE_FLUSH);
252 CMD_SEM(buffer, SYNC_RECIPIENT_FE, SYNC_RECIPIENT_PE);
253 CMD_STALL(buffer, SYNC_RECIPIENT_FE, SYNC_RECIPIENT_PE);
254 CMD_END(buffer);
255
256 etnaviv_buffer_replace_wait(buffer, waitlink_offset,
257 VIV_FE_LINK_HEADER_OP_LINK |
258 VIV_FE_LINK_HEADER_PREFETCH(dwords),
259 link_target);
260 } else {
261 /* Replace the last link-wait with an "END" command */
262 etnaviv_buffer_replace_wait(buffer, waitlink_offset,
263 VIV_FE_END_HEADER_OP_END, 0);
264 }
265 }
266
267 /* Append a 'sync point' to the ring buffer. */
etnaviv_sync_point_queue(struct etnaviv_gpu * gpu,unsigned int event)268 void etnaviv_sync_point_queue(struct etnaviv_gpu *gpu, unsigned int event)
269 {
270 struct etnaviv_cmdbuf *buffer = &gpu->buffer;
271 unsigned int waitlink_offset = buffer->user_size - 16;
272 u32 dwords, target;
273
274 lockdep_assert_held(&gpu->lock);
275
276 /*
277 * We need at most 3 dwords in the return target:
278 * 1 event + 1 end + 1 wait + 1 link.
279 */
280 dwords = 4;
281 target = etnaviv_buffer_reserve(gpu, buffer, dwords);
282
283 /* Signal sync point event */
284 CMD_LOAD_STATE(buffer, VIVS_GL_EVENT, VIVS_GL_EVENT_EVENT_ID(event) |
285 VIVS_GL_EVENT_FROM_PE);
286
287 /* Stop the FE to 'pause' the GPU */
288 CMD_END(buffer);
289
290 /* Append waitlink */
291 CMD_WAIT(buffer);
292 CMD_LINK(buffer, 2, etnaviv_cmdbuf_get_va(buffer) +
293 buffer->user_size - 4);
294
295 /*
296 * Kick off the 'sync point' command by replacing the previous
297 * WAIT with a link to the address in the ring buffer.
298 */
299 etnaviv_buffer_replace_wait(buffer, waitlink_offset,
300 VIV_FE_LINK_HEADER_OP_LINK |
301 VIV_FE_LINK_HEADER_PREFETCH(dwords),
302 target);
303 }
304
305 /* Append a command buffer to the ring buffer. */
etnaviv_buffer_queue(struct etnaviv_gpu * gpu,u32 exec_state,unsigned int event,struct etnaviv_cmdbuf * cmdbuf)306 void etnaviv_buffer_queue(struct etnaviv_gpu *gpu, u32 exec_state,
307 unsigned int event, struct etnaviv_cmdbuf *cmdbuf)
308 {
309 struct etnaviv_cmdbuf *buffer = &gpu->buffer;
310 unsigned int waitlink_offset = buffer->user_size - 16;
311 u32 return_target, return_dwords;
312 u32 link_target, link_dwords;
313 bool switch_context = gpu->exec_state != exec_state;
314
315 lockdep_assert_held(&gpu->lock);
316
317 if (drm_debug & DRM_UT_DRIVER)
318 etnaviv_buffer_dump(gpu, buffer, 0, 0x50);
319
320 link_target = etnaviv_cmdbuf_get_va(cmdbuf);
321 link_dwords = cmdbuf->size / 8;
322
323 /*
324 * If we need maintanence prior to submitting this buffer, we will
325 * need to append a mmu flush load state, followed by a new
326 * link to this buffer - a total of four additional words.
327 */
328 if (gpu->mmu->need_flush || switch_context) {
329 u32 target, extra_dwords;
330
331 /* link command */
332 extra_dwords = 1;
333
334 /* flush command */
335 if (gpu->mmu->need_flush) {
336 if (gpu->mmu->version == ETNAVIV_IOMMU_V1)
337 extra_dwords += 1;
338 else
339 extra_dwords += 3;
340 }
341
342 /* pipe switch commands */
343 if (switch_context)
344 extra_dwords += 4;
345
346 target = etnaviv_buffer_reserve(gpu, buffer, extra_dwords);
347
348 if (gpu->mmu->need_flush) {
349 /* Add the MMU flush */
350 if (gpu->mmu->version == ETNAVIV_IOMMU_V1) {
351 CMD_LOAD_STATE(buffer, VIVS_GL_FLUSH_MMU,
352 VIVS_GL_FLUSH_MMU_FLUSH_FEMMU |
353 VIVS_GL_FLUSH_MMU_FLUSH_UNK1 |
354 VIVS_GL_FLUSH_MMU_FLUSH_UNK2 |
355 VIVS_GL_FLUSH_MMU_FLUSH_PEMMU |
356 VIVS_GL_FLUSH_MMU_FLUSH_UNK4);
357 } else {
358 CMD_LOAD_STATE(buffer, VIVS_MMUv2_CONFIGURATION,
359 VIVS_MMUv2_CONFIGURATION_MODE_MASK |
360 VIVS_MMUv2_CONFIGURATION_ADDRESS_MASK |
361 VIVS_MMUv2_CONFIGURATION_FLUSH_FLUSH);
362 CMD_SEM(buffer, SYNC_RECIPIENT_FE,
363 SYNC_RECIPIENT_PE);
364 CMD_STALL(buffer, SYNC_RECIPIENT_FE,
365 SYNC_RECIPIENT_PE);
366 }
367
368 gpu->mmu->need_flush = false;
369 }
370
371 if (switch_context) {
372 etnaviv_cmd_select_pipe(gpu, buffer, exec_state);
373 gpu->exec_state = exec_state;
374 }
375
376 /* And the link to the submitted buffer */
377 CMD_LINK(buffer, link_dwords, link_target);
378
379 /* Update the link target to point to above instructions */
380 link_target = target;
381 link_dwords = extra_dwords;
382 }
383
384 /*
385 * Append a LINK to the submitted command buffer to return to
386 * the ring buffer. return_target is the ring target address.
387 * We need at most 7 dwords in the return target: 2 cache flush +
388 * 2 semaphore stall + 1 event + 1 wait + 1 link.
389 */
390 return_dwords = 7;
391 return_target = etnaviv_buffer_reserve(gpu, buffer, return_dwords);
392 CMD_LINK(cmdbuf, return_dwords, return_target);
393
394 /*
395 * Append a cache flush, stall, event, wait and link pointing back to
396 * the wait command to the ring buffer.
397 */
398 if (gpu->exec_state == ETNA_PIPE_2D) {
399 CMD_LOAD_STATE(buffer, VIVS_GL_FLUSH_CACHE,
400 VIVS_GL_FLUSH_CACHE_PE2D);
401 } else {
402 CMD_LOAD_STATE(buffer, VIVS_GL_FLUSH_CACHE,
403 VIVS_GL_FLUSH_CACHE_DEPTH |
404 VIVS_GL_FLUSH_CACHE_COLOR);
405 CMD_LOAD_STATE(buffer, VIVS_TS_FLUSH_CACHE,
406 VIVS_TS_FLUSH_CACHE_FLUSH);
407 }
408 CMD_SEM(buffer, SYNC_RECIPIENT_FE, SYNC_RECIPIENT_PE);
409 CMD_STALL(buffer, SYNC_RECIPIENT_FE, SYNC_RECIPIENT_PE);
410 CMD_LOAD_STATE(buffer, VIVS_GL_EVENT, VIVS_GL_EVENT_EVENT_ID(event) |
411 VIVS_GL_EVENT_FROM_PE);
412 CMD_WAIT(buffer);
413 CMD_LINK(buffer, 2, etnaviv_cmdbuf_get_va(buffer) +
414 buffer->user_size - 4);
415
416 if (drm_debug & DRM_UT_DRIVER)
417 pr_info("stream link to 0x%08x @ 0x%08x %p\n",
418 return_target, etnaviv_cmdbuf_get_va(cmdbuf),
419 cmdbuf->vaddr);
420
421 if (drm_debug & DRM_UT_DRIVER) {
422 print_hex_dump(KERN_INFO, "cmd ", DUMP_PREFIX_OFFSET, 16, 4,
423 cmdbuf->vaddr, cmdbuf->size, 0);
424
425 pr_info("link op: %p\n", buffer->vaddr + waitlink_offset);
426 pr_info("addr: 0x%08x\n", link_target);
427 pr_info("back: 0x%08x\n", return_target);
428 pr_info("event: %d\n", event);
429 }
430
431 /*
432 * Kick off the submitted command by replacing the previous
433 * WAIT with a link to the address in the ring buffer.
434 */
435 etnaviv_buffer_replace_wait(buffer, waitlink_offset,
436 VIV_FE_LINK_HEADER_OP_LINK |
437 VIV_FE_LINK_HEADER_PREFETCH(link_dwords),
438 link_target);
439
440 if (drm_debug & DRM_UT_DRIVER)
441 etnaviv_buffer_dump(gpu, buffer, 0, 0x50);
442
443 gpu->lastctx = cmdbuf->ctx;
444 }
445