1 /* r128_state.c -- State support for r128 -*- linux-c -*-
2  * Created: Thu Jan 27 02:53:43 2000 by gareth@valinux.com
3  */
4 /*
5  * Copyright 2000 VA Linux Systems, Inc., Sunnyvale, California.
6  * All Rights Reserved.
7  *
8  * Permission is hereby granted, free of charge, to any person obtaining a
9  * copy of this software and associated documentation files (the "Software"),
10  * to deal in the Software without restriction, including without limitation
11  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
12  * and/or sell copies of the Software, and to permit persons to whom the
13  * Software is furnished to do so, subject to the following conditions:
14  *
15  * The above copyright notice and this permission notice (including the next
16  * paragraph) shall be included in all copies or substantial portions of the
17  * Software.
18  *
19  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
20  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
21  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
22  * PRECISION INSIGHT AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
23  * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
24  * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
25  * DEALINGS IN THE SOFTWARE.
26  *
27  * Authors:
28  *    Gareth Hughes <gareth@valinux.com>
29  */
30 
31 #include <drm/drmP.h>
32 #include <drm/r128_drm.h>
33 #include "r128_drv.h"
34 
35 /* ================================================================
36  * CCE hardware state programming functions
37  */
38 
/*
 * Queue the auxiliary scissor setup for at most the first three entries
 * of @boxes.
 *
 * For every rectangle used, one type-0 packet starting at the matching
 * AUXn_SC_LEFT register is emitted carrying x1, x2 - 1, y1 and y2 - 1.
 * A final write to R128_AUX_SC_CNTL enables (in OR mode) exactly the
 * scissors that were programmed; with @count == 0 it writes zero.
 */
static void r128_emit_clip_rects(drm_r128_private_t *dev_priv,
				 struct drm_clip_rect *boxes, int count)
{
	static const struct {
		u32 first_reg;	/* register the packet starts at */
		u32 cntl_bits;	/* bits to set in AUX_SC_CNTL */
	} aux_sc[3] = {
		{ R128_AUX1_SC_LEFT, R128_AUX1_SC_EN | R128_AUX1_SC_MODE_OR },
		{ R128_AUX2_SC_LEFT, R128_AUX2_SC_EN | R128_AUX2_SC_MODE_OR },
		{ R128_AUX3_SC_LEFT, R128_AUX3_SC_EN | R128_AUX3_SC_MODE_OR },
	};
	int nrects = count < 3 ? count : 3;
	u32 aux_sc_cntl = 0x00000000;
	int n;
	RING_LOCALS;
	DRM_DEBUG("\n");

	/* Five dwords per rectangle plus two for the control register. */
	BEGIN_RING(nrects * 5 + 2);

	for (n = 0; n < nrects; n++) {
		OUT_RING(CCE_PACKET0(aux_sc[n].first_reg, 3));
		OUT_RING(boxes[n].x1);
		OUT_RING(boxes[n].x2 - 1);
		OUT_RING(boxes[n].y1);
		OUT_RING(boxes[n].y2 - 1);

		aux_sc_cntl |= aux_sc[n].cntl_bits;
	}

	OUT_RING(CCE_PACKET0(R128_AUX_SC_CNTL, 0));
	OUT_RING(aux_sc_cntl);

	ADVANCE_RING();
}
81 
/*
 * Queue a single register write: the SAREA context's scale_3d_cntl value
 * goes to R128_SCALE_3D_CNTL.
 */
static __inline__ void r128_emit_core(drm_r128_private_t *dev_priv)
{
	drm_r128_context_regs_t *regs = &dev_priv->sarea_priv->context_state;
	RING_LOCALS;
	DRM_DEBUG("\n");

	BEGIN_RING(2);
	OUT_RING(CCE_PACKET0(R128_SCALE_3D_CNTL, 0));
	OUT_RING(regs->scale_3d_cntl);
	ADVANCE_RING();
}
96 
/*
 * Queue the twelve context values held in the SAREA as one type-0 packet
 * that starts at R128_DST_PITCH_OFFSET_C.
 */
static __inline__ void r128_emit_context(drm_r128_private_t *dev_priv)
{
	drm_r128_context_regs_t *regs = &dev_priv->sarea_priv->context_state;
	RING_LOCALS;
	DRM_DEBUG("\n");

	/* One packet header followed by twelve payload dwords. */
	BEGIN_RING(13);

	OUT_RING(CCE_PACKET0(R128_DST_PITCH_OFFSET_C, 11));
	OUT_RING(regs->dst_pitch_offset_c);
	OUT_RING(regs->dp_gui_master_cntl_c);
	OUT_RING(regs->sc_top_left_c);
	OUT_RING(regs->sc_bottom_right_c);
	OUT_RING(regs->z_offset_c);
	OUT_RING(regs->z_pitch_c);
	OUT_RING(regs->z_sten_cntl_c);
	OUT_RING(regs->tex_cntl_c);
	OUT_RING(regs->misc_3d_state_cntl_reg);
	OUT_RING(regs->texture_clr_cmp_clr_c);
	OUT_RING(regs->texture_clr_cmp_msk_c);
	OUT_RING(regs->fog_color_c);

	ADVANCE_RING();
}
122 
/*
 * Queue the setup state: one type-1 packet addressing R128_SETUP_CNTL and
 * R128_PM4_VC_FPU_SETUP, carrying the two matching SAREA context values.
 */
static __inline__ void r128_emit_setup(drm_r128_private_t *dev_priv)
{
	drm_r128_context_regs_t *regs = &dev_priv->sarea_priv->context_state;
	RING_LOCALS;
	DRM_DEBUG("\n");

	BEGIN_RING(3);
	OUT_RING(CCE_PACKET1(R128_SETUP_CNTL, R128_PM4_VC_FPU_SETUP));
	OUT_RING(regs->setup_cntl);
	OUT_RING(regs->pm4_vc_fpu_setup);
	ADVANCE_RING();
}
138 
/*
 * Queue the mask state from the SAREA context: dp_write_mask in its own
 * packet, then sten_ref_mask_c and plane_3d_mask_c in a second packet
 * that starts at R128_STEN_REF_MASK_C.
 */
static __inline__ void r128_emit_masks(drm_r128_private_t *dev_priv)
{
	drm_r128_context_regs_t *regs = &dev_priv->sarea_priv->context_state;
	RING_LOCALS;
	DRM_DEBUG("\n");

	/* Two dwords for the first packet, three for the second. */
	BEGIN_RING(5);

	OUT_RING(CCE_PACKET0(R128_DP_WRITE_MASK, 0));
	OUT_RING(regs->dp_write_mask);

	OUT_RING(CCE_PACKET0(R128_STEN_REF_MASK_C, 1));
	OUT_RING(regs->sten_ref_mask_c);
	OUT_RING(regs->plane_3d_mask_c);

	ADVANCE_RING();
}
157 
/*
 * Queue a single register write: the SAREA context's window_xy_offset
 * value goes to R128_WINDOW_XY_OFFSET.
 */
static __inline__ void r128_emit_window(drm_r128_private_t *dev_priv)
{
	drm_r128_context_regs_t *regs = &dev_priv->sarea_priv->context_state;
	RING_LOCALS;
	DRM_DEBUG("\n");

	BEGIN_RING(2);
	OUT_RING(CCE_PACKET0(R128_WINDOW_XY_OFFSET, 0));
	OUT_RING(regs->window_xy_offset);
	ADVANCE_RING();
}
172 
/*
 * Queue the state of texture unit 0 (tex_state[0] in the SAREA).
 *
 * The first packet starts at R128_PRIM_TEX_CNTL_C and carries the unit's
 * control and combine words, the context's tex_size_pitch_c and one offset
 * per texture level.  The second packet starts at R128_CONSTANT_COLOR_C and
 * carries the context's constant colour and the unit's border colour.
 */
static __inline__ void r128_emit_tex0(drm_r128_private_t *dev_priv)
{
	drm_r128_sarea_t *sarea = dev_priv->sarea_priv;
	drm_r128_context_regs_t *regs = &sarea->context_state;
	drm_r128_texture_regs_t *unit = &sarea->tex_state[0];
	int level;
	RING_LOCALS;
	DRM_DEBUG("\n");

	/* (1 + 3 + levels) dwords for packet one, 3 for packet two. */
	BEGIN_RING(7 + R128_MAX_TEXTURE_LEVELS);

	OUT_RING(CCE_PACKET0(R128_PRIM_TEX_CNTL_C,
			     2 + R128_MAX_TEXTURE_LEVELS));
	OUT_RING(unit->tex_cntl);
	OUT_RING(unit->tex_combine_cntl);
	OUT_RING(regs->tex_size_pitch_c);
	for (level = 0; level < R128_MAX_TEXTURE_LEVELS; level++) {
		OUT_RING(unit->tex_offset[level]);
	}

	OUT_RING(CCE_PACKET0(R128_CONSTANT_COLOR_C, 1));
	OUT_RING(regs->constant_color_c);
	OUT_RING(unit->tex_border_color);

	ADVANCE_RING();
}
198 
/*
 * Queue the state of texture unit 1 (tex_state[1] in the SAREA).
 *
 * The first packet starts at R128_SEC_TEX_CNTL_C and carries the unit's
 * control and combine words plus one offset per texture level.  The second
 * packet writes the unit's border colour to
 * R128_SEC_TEXTURE_BORDER_COLOR_C.
 */
static __inline__ void r128_emit_tex1(drm_r128_private_t *dev_priv)
{
	drm_r128_texture_regs_t *unit = &dev_priv->sarea_priv->tex_state[1];
	int level;
	RING_LOCALS;
	DRM_DEBUG("\n");

	/* (1 + 2 + levels) dwords for packet one, 2 for packet two. */
	BEGIN_RING(5 + R128_MAX_TEXTURE_LEVELS);

	OUT_RING(CCE_PACKET0(R128_SEC_TEX_CNTL_C, 1 + R128_MAX_TEXTURE_LEVELS));
	OUT_RING(unit->tex_cntl);
	OUT_RING(unit->tex_combine_cntl);
	for (level = 0; level < R128_MAX_TEXTURE_LEVELS; level++) {
		OUT_RING(unit->tex_offset[level]);
	}

	OUT_RING(CCE_PACKET0(R128_SEC_TEXTURE_BORDER_COLOR_C, 0));
	OUT_RING(unit->tex_border_color);

	ADVANCE_RING();
}
220 
/*
 * Emit every state group whose upload bit is set in the SAREA dirty word.
 *
 * The dirty word is sampled once on entry and that snapshot decides which
 * groups are emitted; each handled bit is cleared from the SAREA copy right
 * after its group has been queued.  Afterwards R128_TEX_CACHE_FLUSH is
 * cleared from the context's tex_cntl_c and R128_REQUIRE_QUIESCENCE is
 * cleared from the dirty word.
 */
static void r128_emit_state(drm_r128_private_t *dev_priv)
{
	drm_r128_sarea_t *sarea = dev_priv->sarea_priv;
	unsigned int pending = sarea->dirty;

	DRM_DEBUG("dirty=0x%08x\n", pending);

	if (pending & R128_UPLOAD_CORE) {
		r128_emit_core(dev_priv);
		sarea->dirty &= ~R128_UPLOAD_CORE;
	}
	if (pending & R128_UPLOAD_CONTEXT) {
		r128_emit_context(dev_priv);
		sarea->dirty &= ~R128_UPLOAD_CONTEXT;
	}
	if (pending & R128_UPLOAD_SETUP) {
		r128_emit_setup(dev_priv);
		sarea->dirty &= ~R128_UPLOAD_SETUP;
	}
	if (pending & R128_UPLOAD_MASKS) {
		r128_emit_masks(dev_priv);
		sarea->dirty &= ~R128_UPLOAD_MASKS;
	}
	if (pending & R128_UPLOAD_WINDOW) {
		r128_emit_window(dev_priv);
		sarea->dirty &= ~R128_UPLOAD_WINDOW;
	}
	if (pending & R128_UPLOAD_TEX0) {
		r128_emit_tex0(dev_priv);
		sarea->dirty &= ~R128_UPLOAD_TEX0;
	}
	if (pending & R128_UPLOAD_TEX1) {
		r128_emit_tex1(dev_priv);
		sarea->dirty &= ~R128_UPLOAD_TEX1;
	}

	/* Turn off the texture cache flushing */
	sarea->context_state.tex_cntl_c &= ~R128_TEX_CACHE_FLUSH;

	sarea->dirty &= ~R128_REQUIRE_QUIESCENCE;
}
268 
269 #if R128_PERFORMANCE_BOXES
270 /* ================================================================
271  * Performance monitoring functions
272  */
273 
/*
 * Queue a solid-colour fill of the @w x @h rectangle at (@x, @y), using the
 * back buffer's offset and pitch as the destination.
 *
 * @r, @g and @b are packed according to dev_priv->fb_bpp: 5:6:5 for 16 bpp,
 * 8:8:8 for 24 bpp, and 8:8:8 with the top byte forced to 0xff for 32 bpp.
 * Any other depth makes the function return without queuing anything.
 */
static void r128_clear_box(drm_r128_private_t *dev_priv,
			   int x, int y, int w, int h, int r, int g, int b)
{
	u32 pitch, offset;
	u32 fb_bpp, color;
	RING_LOCALS;

	switch (dev_priv->fb_bpp) {
	case 16:
		fb_bpp = R128_GMC_DST_16BPP;
		color = (((r & 0xf8) << 8) |
			 ((g & 0xfc) << 3) | ((b & 0xf8) >> 3));
		break;
	case 24:
		fb_bpp = R128_GMC_DST_24BPP;
		color = ((r << 16) | (g << 8) | b);
		break;
	case 32:
		fb_bpp = R128_GMC_DST_32BPP;
		/*
		 * The top byte is built from an unsigned literal: shifting
		 * the signed constant 0xff left by 24 would move a one into
		 * the sign bit, which ISO C leaves undefined.  The resulting
		 * bit pattern is unchanged.
		 */
		color = ((0xffU << 24) | (r << 16) | (g << 8) | b);
		break;
	default:
		return;
	}

	offset = dev_priv->back_offset;
	pitch = dev_priv->back_pitch >> 3;

	BEGIN_RING(6);

	OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
	OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
		 R128_GMC_BRUSH_SOLID_COLOR |
		 fb_bpp |
		 R128_GMC_SRC_DATATYPE_COLOR |
		 R128_ROP3_P |
		 R128_GMC_CLR_CMP_CNTL_DIS | R128_GMC_AUX_CLIP_DIS);

	/* Destination pitch/offset word, then the fill colour. */
	OUT_RING((pitch << 21) | (offset >> 5));
	OUT_RING(color);

	/* Rectangle origin and size, each packed as (high << 16) | low. */
	OUT_RING((x << 16) | y);
	OUT_RING((w << 16) | h);

	ADVANCE_RING();
}
320 
/*
 * Trivial performance indicator: when idle_count is zero, paint an 8x8
 * green box at (64, 4); otherwise reset idle_count to zero and paint
 * nothing.
 */
static void r128_cce_performance_boxes(drm_r128_private_t *dev_priv)
{
	if (atomic_read(&dev_priv->idle_count) != 0) {
		atomic_set(&dev_priv->idle_count, 0);
		return;
	}

	r128_clear_box(dev_priv, 64, 4, 8, 8, 0, 255, 0);
}
328 
329 #endif
330 
331 /* ================================================================
332  * CCE command dispatch functions
333  */
334 
r128_print_dirty(const char * msg,unsigned int flags)335 static void r128_print_dirty(const char *msg, unsigned int flags)
336 {
337 	DRM_INFO("%s: (0x%x) %s%s%s%s%s%s%s%s%s\n",
338 		 msg,
339 		 flags,
340 		 (flags & R128_UPLOAD_CORE) ? "core, " : "",
341 		 (flags & R128_UPLOAD_CONTEXT) ? "context, " : "",
342 		 (flags & R128_UPLOAD_SETUP) ? "setup, " : "",
343 		 (flags & R128_UPLOAD_TEX0) ? "tex0, " : "",
344 		 (flags & R128_UPLOAD_TEX1) ? "tex1, " : "",
345 		 (flags & R128_UPLOAD_MASKS) ? "masks, " : "",
346 		 (flags & R128_UPLOAD_WINDOW) ? "window, " : "",
347 		 (flags & R128_UPLOAD_CLIPRECTS) ? "cliprects, " : "",
348 		 (flags & R128_REQUIRE_QUIESCENCE) ? "quiescence, " : "");
349 }
350 
/*
 * Queue solid fills that clear the buffers selected by clear->flags, once
 * for every cliprect currently listed in the SAREA.
 *
 * When page flipping is active and page 1 is current, the R128_FRONT and
 * R128_BACK selections are exchanged first.  For each cliprect:
 *  - if a colour buffer is selected, clear->color_mask is written to
 *    R128_DP_WRITE_MASK;
 *  - front and/or back are filled with clear->clear_color;
 *  - the depth buffer is filled with clear->clear_depth, with the write
 *    mask disabled for that fill.
 */
static void r128_cce_dispatch_clear(struct drm_device *dev,
				    drm_r128_clear_t *clear)
{
	drm_r128_private_t *dev_priv = dev->dev_private;
	drm_r128_sarea_t *sarea = dev_priv->sarea_priv;
	int nrects = sarea->nbox;
	struct drm_clip_rect *rects = sarea->boxes;
	unsigned int targets = clear->flags;
	/* GMC control bits common to every fill queued below. */
	const u32 fill_cntl = R128_GMC_DST_PITCH_OFFSET_CNTL |
			      R128_GMC_BRUSH_SOLID_COLOR |
			      R128_GMC_SRC_DATATYPE_COLOR |
			      R128_ROP3_P |
			      R128_GMC_CLR_CMP_CNTL_DIS |
			      R128_GMC_AUX_CLIP_DIS;
	int n;
	RING_LOCALS;
	DRM_DEBUG("\n");

	if (dev_priv->page_flipping && dev_priv->current_page == 1) {
		unsigned int requested = targets;

		/* Exchange the front and back selections. */
		targets &= ~(R128_FRONT | R128_BACK);
		if (requested & R128_FRONT)
			targets |= R128_BACK;
		if (requested & R128_BACK)
			targets |= R128_FRONT;
	}

	for (n = 0; n < nrects; n++) {
		struct drm_clip_rect *box = &rects[n];
		int x = box->x1;
		int y = box->y1;
		int w = box->x2 - x;
		int h = box->y2 - y;

		DRM_DEBUG("dispatch clear %d,%d-%d,%d flags 0x%x\n",
			  box->x1, box->y1, box->x2,
			  box->y2, targets);

		if (targets & (R128_FRONT | R128_BACK)) {
			BEGIN_RING(2);
			OUT_RING(CCE_PACKET0(R128_DP_WRITE_MASK, 0));
			OUT_RING(clear->color_mask);
			ADVANCE_RING();
		}

		if (targets & R128_FRONT) {
			BEGIN_RING(6);
			OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
			OUT_RING(fill_cntl | (dev_priv->color_fmt << 8));
			OUT_RING(dev_priv->front_pitch_offset_c);
			OUT_RING(clear->clear_color);
			OUT_RING((x << 16) | y);
			OUT_RING((w << 16) | h);
			ADVANCE_RING();
		}

		if (targets & R128_BACK) {
			BEGIN_RING(6);
			OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
			OUT_RING(fill_cntl | (dev_priv->color_fmt << 8));
			OUT_RING(dev_priv->back_pitch_offset_c);
			OUT_RING(clear->clear_color);
			OUT_RING((x << 16) | y);
			OUT_RING((w << 16) | h);
			ADVANCE_RING();
		}

		if (targets & R128_DEPTH) {
			BEGIN_RING(6);
			OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
			OUT_RING(fill_cntl | R128_GMC_WR_MSK_DIS |
				 (dev_priv->depth_fmt << 8));
			OUT_RING(dev_priv->depth_pitch_offset_c);
			OUT_RING(clear->clear_depth);
			OUT_RING((x << 16) | y);
			OUT_RING((w << 16) | h);
			ADVANCE_RING();
		}
	}
}
456 
r128_cce_dispatch_swap(struct drm_device * dev)457 static void r128_cce_dispatch_swap(struct drm_device *dev)
458 {
459 	drm_r128_private_t *dev_priv = dev->dev_private;
460 	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
461 	int nbox = sarea_priv->nbox;
462 	struct drm_clip_rect *pbox = sarea_priv->boxes;
463 	int i;
464 	RING_LOCALS;
465 	DRM_DEBUG("\n");
466 
467 #if R128_PERFORMANCE_BOXES
468 	/* Do some trivial performance monitoring...
469 	 */
470 	r128_cce_performance_boxes(dev_priv);
471 #endif
472 
473 	for (i = 0; i < nbox; i++) {
474 		int x = pbox[i].x1;
475 		int y = pbox[i].y1;
476 		int w = pbox[i].x2 - x;
477 		int h = pbox[i].y2 - y;
478 
479 		BEGIN_RING(7);
480 
481 		OUT_RING(CCE_PACKET3(R128_CNTL_BITBLT_MULTI, 5));
482 		OUT_RING(R128_GMC_SRC_PITCH_OFFSET_CNTL |
483 			 R128_GMC_DST_PITCH_OFFSET_CNTL |
484 			 R128_GMC_BRUSH_NONE |
485 			 (dev_priv->color_fmt << 8) |
486 			 R128_GMC_SRC_DATATYPE_COLOR |
487 			 R128_ROP3_S |
488 			 R128_DP_SRC_SOURCE_MEMORY |
489 			 R128_GMC_CLR_CMP_CNTL_DIS |
490 			 R128_GMC_AUX_CLIP_DIS | R128_GMC_WR_MSK_DIS);
491 
492 		/* Make this work even if front & back are flipped:
493 		 */
494 		if (dev_priv->current_page == 0) {
495 			OUT_RING(dev_priv->back_pitch_offset_c);
496 			OUT_RING(dev_priv->front_pitch_offset_c);
497 		} else {
498 			OUT_RING(dev_priv->front_pitch_offset_c);
499 			OUT_RING(dev_priv->back_pitch_offset_c);
500 		}
501 
502 		OUT_RING((x << 16) | y);
503 		OUT_RING((x << 16) | y);
504 		OUT_RING((w << 16) | h);
505 
506 		ADVANCE_RING();
507 	}
508 
509 	/* Increment the frame counter.  The client-side 3D driver must
510 	 * throttle the framerate by waiting for this value before
511 	 * performing the swapbuffer ioctl.
512 	 */
513 	dev_priv->sarea_priv->last_frame++;
514 
515 	BEGIN_RING(2);
516 
517 	OUT_RING(CCE_PACKET0(R128_LAST_FRAME_REG, 0));
518 	OUT_RING(dev_priv->sarea_priv->last_frame);
519 
520 	ADVANCE_RING();
521 }
522 
r128_cce_dispatch_flip(struct drm_device * dev)523 static void r128_cce_dispatch_flip(struct drm_device *dev)
524 {
525 	drm_r128_private_t *dev_priv = dev->dev_private;
526 	RING_LOCALS;
527 	DRM_DEBUG("page=%d pfCurrentPage=%d\n",
528 		  dev_priv->current_page, dev_priv->sarea_priv->pfCurrentPage);
529 
530 #if R128_PERFORMANCE_BOXES
531 	/* Do some trivial performance monitoring...
532 	 */
533 	r128_cce_performance_boxes(dev_priv);
534 #endif
535 
536 	BEGIN_RING(4);
537 
538 	R128_WAIT_UNTIL_PAGE_FLIPPED();
539 	OUT_RING(CCE_PACKET0(R128_CRTC_OFFSET, 0));
540 
541 	if (dev_priv->current_page == 0)
542 		OUT_RING(dev_priv->back_offset);
543 	else
544 		OUT_RING(dev_priv->front_offset);
545 
546 	ADVANCE_RING();
547 
548 	/* Increment the frame counter.  The client-side 3D driver must
549 	 * throttle the framerate by waiting for this value before
550 	 * performing the swapbuffer ioctl.
551 	 */
552 	dev_priv->sarea_priv->last_frame++;
553 	dev_priv->sarea_priv->pfCurrentPage = dev_priv->current_page =
554 	    1 - dev_priv->current_page;
555 
556 	BEGIN_RING(2);
557 
558 	OUT_RING(CCE_PACKET0(R128_LAST_FRAME_REG, 0));
559 	OUT_RING(dev_priv->sarea_priv->last_frame);
560 
561 	ADVANCE_RING();
562 }
563 
r128_cce_dispatch_vertex(struct drm_device * dev,struct drm_buf * buf)564 static void r128_cce_dispatch_vertex(struct drm_device *dev, struct drm_buf *buf)
565 {
566 	drm_r128_private_t *dev_priv = dev->dev_private;
567 	drm_r128_buf_priv_t *buf_priv = buf->dev_private;
568 	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
569 	int format = sarea_priv->vc_format;
570 	int offset = buf->bus_address;
571 	int size = buf->used;
572 	int prim = buf_priv->prim;
573 	int i = 0;
574 	RING_LOCALS;
575 	DRM_DEBUG("buf=%d nbox=%d\n", buf->idx, sarea_priv->nbox);
576 
577 	if (0)
578 		r128_print_dirty("dispatch_vertex", sarea_priv->dirty);
579 
580 	if (buf->used) {
581 		buf_priv->dispatched = 1;
582 
583 		if (sarea_priv->dirty & ~R128_UPLOAD_CLIPRECTS)
584 			r128_emit_state(dev_priv);
585 
586 		do {
587 			/* Emit the next set of up to three cliprects */
588 			if (i < sarea_priv->nbox) {
589 				r128_emit_clip_rects(dev_priv,
590 						     &sarea_priv->boxes[i],
591 						     sarea_priv->nbox - i);
592 			}
593 
594 			/* Emit the vertex buffer rendering commands */
595 			BEGIN_RING(5);
596 
597 			OUT_RING(CCE_PACKET3(R128_3D_RNDR_GEN_INDX_PRIM, 3));
598 			OUT_RING(offset);
599 			OUT_RING(size);
600 			OUT_RING(format);
601 			OUT_RING(prim | R128_CCE_VC_CNTL_PRIM_WALK_LIST |
602 				 (size << R128_CCE_VC_CNTL_NUM_SHIFT));
603 
604 			ADVANCE_RING();
605 
606 			i += 3;
607 		} while (i < sarea_priv->nbox);
608 	}
609 
610 	if (buf_priv->discard) {
611 		buf_priv->age = dev_priv->sarea_priv->last_dispatch;
612 
613 		/* Emit the vertex buffer age */
614 		BEGIN_RING(2);
615 
616 		OUT_RING(CCE_PACKET0(R128_LAST_DISPATCH_REG, 0));
617 		OUT_RING(buf_priv->age);
618 
619 		ADVANCE_RING();
620 
621 		buf->pending = 1;
622 		buf->used = 0;
623 		/* FIXME: Check dispatched field */
624 		buf_priv->dispatched = 0;
625 	}
626 
627 	dev_priv->sarea_priv->last_dispatch++;
628 
629 	sarea_priv->dirty &= ~R128_UPLOAD_CLIPRECTS;
630 	sarea_priv->nbox = 0;
631 }
632 
r128_cce_dispatch_indirect(struct drm_device * dev,struct drm_buf * buf,int start,int end)633 static void r128_cce_dispatch_indirect(struct drm_device *dev,
634 				       struct drm_buf *buf, int start, int end)
635 {
636 	drm_r128_private_t *dev_priv = dev->dev_private;
637 	drm_r128_buf_priv_t *buf_priv = buf->dev_private;
638 	RING_LOCALS;
639 	DRM_DEBUG("indirect: buf=%d s=0x%x e=0x%x\n", buf->idx, start, end);
640 
641 	if (start != end) {
642 		int offset = buf->bus_address + start;
643 		int dwords = (end - start + 3) / sizeof(u32);
644 
645 		/* Indirect buffer data must be an even number of
646 		 * dwords, so if we've been given an odd number we must
647 		 * pad the data with a Type-2 CCE packet.
648 		 */
649 		if (dwords & 1) {
650 			u32 *data = (u32 *)
651 			    ((char *)dev->agp_buffer_map->handle
652 			     + buf->offset + start);
653 			data[dwords++] = cpu_to_le32(R128_CCE_PACKET2);
654 		}
655 
656 		buf_priv->dispatched = 1;
657 
658 		/* Fire off the indirect buffer */
659 		BEGIN_RING(3);
660 
661 		OUT_RING(CCE_PACKET0(R128_PM4_IW_INDOFF, 1));
662 		OUT_RING(offset);
663 		OUT_RING(dwords);
664 
665 		ADVANCE_RING();
666 	}
667 
668 	if (buf_priv->discard) {
669 		buf_priv->age = dev_priv->sarea_priv->last_dispatch;
670 
671 		/* Emit the indirect buffer age */
672 		BEGIN_RING(2);
673 
674 		OUT_RING(CCE_PACKET0(R128_LAST_DISPATCH_REG, 0));
675 		OUT_RING(buf_priv->age);
676 
677 		ADVANCE_RING();
678 
679 		buf->pending = 1;
680 		buf->used = 0;
681 		/* FIXME: Check dispatched field */
682 		buf_priv->dispatched = 0;
683 	}
684 
685 	dev_priv->sarea_priv->last_dispatch++;
686 }
687 
r128_cce_dispatch_indices(struct drm_device * dev,struct drm_buf * buf,int start,int end,int count)688 static void r128_cce_dispatch_indices(struct drm_device *dev,
689 				      struct drm_buf *buf,
690 				      int start, int end, int count)
691 {
692 	drm_r128_private_t *dev_priv = dev->dev_private;
693 	drm_r128_buf_priv_t *buf_priv = buf->dev_private;
694 	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
695 	int format = sarea_priv->vc_format;
696 	int offset = dev->agp_buffer_map->offset - dev_priv->cce_buffers_offset;
697 	int prim = buf_priv->prim;
698 	u32 *data;
699 	int dwords;
700 	int i = 0;
701 	RING_LOCALS;
702 	DRM_DEBUG("indices: s=%d e=%d c=%d\n", start, end, count);
703 
704 	if (0)
705 		r128_print_dirty("dispatch_indices", sarea_priv->dirty);
706 
707 	if (start != end) {
708 		buf_priv->dispatched = 1;
709 
710 		if (sarea_priv->dirty & ~R128_UPLOAD_CLIPRECTS)
711 			r128_emit_state(dev_priv);
712 
713 		dwords = (end - start + 3) / sizeof(u32);
714 
715 		data = (u32 *) ((char *)dev->agp_buffer_map->handle
716 				+ buf->offset + start);
717 
718 		data[0] = cpu_to_le32(CCE_PACKET3(R128_3D_RNDR_GEN_INDX_PRIM,
719 						  dwords - 2));
720 
721 		data[1] = cpu_to_le32(offset);
722 		data[2] = cpu_to_le32(R128_MAX_VB_VERTS);
723 		data[3] = cpu_to_le32(format);
724 		data[4] = cpu_to_le32((prim | R128_CCE_VC_CNTL_PRIM_WALK_IND |
725 				       (count << 16)));
726 
727 		if (count & 0x1) {
728 #ifdef __LITTLE_ENDIAN
729 			data[dwords - 1] &= 0x0000ffff;
730 #else
731 			data[dwords - 1] &= 0xffff0000;
732 #endif
733 		}
734 
735 		do {
736 			/* Emit the next set of up to three cliprects */
737 			if (i < sarea_priv->nbox) {
738 				r128_emit_clip_rects(dev_priv,
739 						     &sarea_priv->boxes[i],
740 						     sarea_priv->nbox - i);
741 			}
742 
743 			r128_cce_dispatch_indirect(dev, buf, start, end);
744 
745 			i += 3;
746 		} while (i < sarea_priv->nbox);
747 	}
748 
749 	if (buf_priv->discard) {
750 		buf_priv->age = dev_priv->sarea_priv->last_dispatch;
751 
752 		/* Emit the vertex buffer age */
753 		BEGIN_RING(2);
754 
755 		OUT_RING(CCE_PACKET0(R128_LAST_DISPATCH_REG, 0));
756 		OUT_RING(buf_priv->age);
757 
758 		ADVANCE_RING();
759 
760 		buf->pending = 1;
761 		/* FIXME: Check dispatched field */
762 		buf_priv->dispatched = 0;
763 	}
764 
765 	dev_priv->sarea_priv->last_dispatch++;
766 
767 	sarea_priv->dirty &= ~R128_UPLOAD_CLIPRECTS;
768 	sarea_priv->nbox = 0;
769 }
770 
/*
 * Queue a host-data blit whose pixel data already sits in DMA buffer
 * blit->idx, behind room for an eight-dword packet header that is built
 * here.
 *
 * The pixel cache is flushed before and after the blit so that texture
 * data and rendered pixels do not get mixed up.
 *
 * Returns 0 on success, or -EINVAL when the format is unknown, the buffer
 * belongs to another file, the buffer is still pending, or the requested
 * width x height does not fit in the buffer.
 *
 * NOTE(review): blit->idx is used as an index into dma->buflist without a
 * range check here; presumably the ioctl entry point validates it --
 * confirm against the caller.
 */
static int r128_cce_dispatch_blit(struct drm_device *dev,
				  struct drm_file *file_priv,
				  drm_r128_blit_t *blit)
{
	drm_r128_private_t *dev_priv = dev->dev_private;
	struct drm_device_dma *dma = dev->dma;
	struct drm_buf *buf;
	drm_r128_buf_priv_t *buf_priv;
	/* data[0]..data[7] below form the packet header. */
	const unsigned int hdr_dwords = 8;
	u32 *data;
	u32 npixels, payload;
	int dword_shift, dwords;
	RING_LOCALS;
	DRM_DEBUG("\n");

	/* The compiler won't optimize away a division by a variable,
	 * even if the only legal values are powers of two.  Thus, we'll
	 * use a shift instead.
	 */
	switch (blit->format) {
	case R128_DATATYPE_ARGB8888:
		dword_shift = 0;
		break;
	case R128_DATATYPE_ARGB1555:
	case R128_DATATYPE_RGB565:
	case R128_DATATYPE_ARGB4444:
	case R128_DATATYPE_YVYU422:
	case R128_DATATYPE_VYUY422:
		dword_shift = 1;
		break;
	case R128_DATATYPE_CI8:
	case R128_DATATYPE_RGB8:
		dword_shift = 2;
		break;
	default:
		DRM_ERROR("invalid blit format %d\n", blit->format);
		return -EINVAL;
	}

	/* Flush the pixel cache, and mark the contents as Read Invalid.
	 * This ensures no pixel data gets mixed up with the texture
	 * data from the host data blit, otherwise part of the texture
	 * image may be corrupted.
	 */
	BEGIN_RING(2);

	OUT_RING(CCE_PACKET0(R128_PC_GUI_CTLSTAT, 0));
	OUT_RING(R128_PC_RI_GUI | R128_PC_FLUSH_GUI);

	ADVANCE_RING();

	/* Dispatch the indirect buffer.
	 */
	buf = dma->buflist[blit->idx];
	buf_priv = buf->dev_private;

	if (buf->file_priv != file_priv) {
		DRM_ERROR("process %d using buffer owned by %p\n",
			  DRM_CURRENTPID, buf->file_priv);
		return -EINVAL;
	}
	if (buf->pending) {
		DRM_ERROR("sending pending buffer %d\n", blit->idx);
		return -EINVAL;
	}

	/* The dimensions come from the caller.  Multiply them as unsigned
	 * so the product cannot overflow a signed int, and refuse any blit
	 * whose header plus payload would extend past the end of the DMA
	 * buffer: the dword count is handed to the engine, which would
	 * otherwise be told to read beyond the buffer.
	 */
	npixels = (u32)blit->width * (u32)blit->height;
	payload = npixels >> dword_shift;
	if (buf->total < (int)(hdr_dwords * sizeof(u32)) ||
	    payload > buf->total / sizeof(u32) - hdr_dwords) {
		DRM_ERROR("blit too large for buffer %d\n", blit->idx);
		return -EINVAL;
	}
	dwords = payload;

	buf_priv->discard = 1;

	data = (u32 *) ((char *)dev->agp_buffer_map->handle + buf->offset);

	data[0] = cpu_to_le32(CCE_PACKET3(R128_CNTL_HOSTDATA_BLT, dwords + 6));
	data[1] = cpu_to_le32((R128_GMC_DST_PITCH_OFFSET_CNTL |
			       R128_GMC_BRUSH_NONE |
			       (blit->format << 8) |
			       R128_GMC_SRC_DATATYPE_COLOR |
			       R128_ROP3_S |
			       R128_DP_SRC_SOURCE_HOST_DATA |
			       R128_GMC_CLR_CMP_CNTL_DIS |
			       R128_GMC_AUX_CLIP_DIS | R128_GMC_WR_MSK_DIS));

	data[2] = cpu_to_le32((blit->pitch << 21) | (blit->offset >> 5));
	data[3] = cpu_to_le32(0xffffffff);
	data[4] = cpu_to_le32(0xffffffff);
	data[5] = cpu_to_le32((blit->y << 16) | blit->x);
	data[6] = cpu_to_le32((blit->height << 16) | blit->width);
	data[7] = cpu_to_le32(dwords);

	buf->used = (dwords + hdr_dwords) * sizeof(u32);

	r128_cce_dispatch_indirect(dev, buf, 0, buf->used);

	/* Flush the pixel cache after the blit completes.  This ensures
	 * the texture data is written out to memory before rendering
	 * continues.
	 */
	BEGIN_RING(2);

	OUT_RING(CCE_PACKET0(R128_PC_GUI_CTLSTAT, 0));
	OUT_RING(R128_PC_FLUSH_GUI);

	ADVANCE_RING();

	return 0;
}
875 
876 /* ================================================================
877  * Tiled depth buffer management
878  *
879  * FIXME: These should all set the destination write mask for when we
880  * have hardware stencil support.
881  */
882 
/*
 * Write a horizontal run of depth->n depth values, starting at the single
 * (x, y) position read from user space, by queuing one 1x1 solid fill per
 * value.
 *
 * When depth->mask is set, positions whose mask byte is zero are skipped
 * (x still advances past them).
 *
 * Returns 0 on success, -EMSGSIZE when n is outside 1..4096, -EFAULT when
 * the start coordinates cannot be copied, or the error reported by
 * memdup_user() for the value or mask array.
 */
static int r128_cce_dispatch_write_span(struct drm_device *dev,
					drm_r128_depth_t *depth)
{
	drm_r128_private_t *dev_priv = dev->dev_private;
	u32 *values;
	u8 *mask = NULL;
	int count, x, y;
	int i;
	RING_LOCALS;
	DRM_DEBUG("\n");

	count = depth->n;
	if (count <= 0 || count > 4096)
		return -EMSGSIZE;

	if (copy_from_user(&x, depth->x, sizeof(x)))
		return -EFAULT;
	if (copy_from_user(&y, depth->y, sizeof(y)))
		return -EFAULT;

	values = memdup_user(depth->buffer, count * sizeof(u32));
	if (IS_ERR(values))
		return PTR_ERR(values);

	if (depth->mask) {
		mask = memdup_user(depth->mask, count);
		if (IS_ERR(mask)) {
			kfree(values);
			return PTR_ERR(mask);
		}
	}

	for (i = 0; i < count; i++, x++) {
		/* Without a mask every position is written. */
		if (mask && !mask[i])
			continue;

		BEGIN_RING(6);

		OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
		OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
			 R128_GMC_BRUSH_SOLID_COLOR |
			 (dev_priv->depth_fmt << 8) |
			 R128_GMC_SRC_DATATYPE_COLOR |
			 R128_ROP3_P |
			 R128_GMC_CLR_CMP_CNTL_DIS |
			 R128_GMC_WR_MSK_DIS);

		OUT_RING(dev_priv->depth_pitch_offset_c);
		OUT_RING(values[i]);

		OUT_RING((x << 16) | y);
		OUT_RING((1 << 16) | 1);

		ADVANCE_RING();
	}

	/* mask is NULL when none was supplied; kfree() accepts that. */
	kfree(mask);
	kfree(values);

	return 0;
}
967 
/*
 * Write depth->n individual depth values, each at its own (x[i], y[i])
 * position read from user space, by queuing one 1x1 solid fill per value.
 *
 * When depth->mask is set, entries whose mask byte is zero are skipped.
 *
 * Returns 0 on success, -EMSGSIZE when n is outside 1..4096, or the error
 * reported by memdup_user() for whichever user array failed to copy.
 */
static int r128_cce_dispatch_write_pixels(struct drm_device *dev,
					  drm_r128_depth_t *depth)
{
	drm_r128_private_t *dev_priv = dev->dev_private;
	int *x, *y;
	u32 *values;
	u8 *mask = NULL;
	int count, i, ret;
	RING_LOCALS;
	DRM_DEBUG("\n");

	count = depth->n;
	if (count <= 0 || count > 4096)
		return -EMSGSIZE;

	x = memdup_user(depth->x, count * sizeof(*x));
	if (IS_ERR(x))
		return PTR_ERR(x);

	y = memdup_user(depth->y, count * sizeof(*y));
	if (IS_ERR(y)) {
		ret = PTR_ERR(y);
		goto out_free_x;
	}

	values = memdup_user(depth->buffer, count * sizeof(u32));
	if (IS_ERR(values)) {
		ret = PTR_ERR(values);
		goto out_free_y;
	}

	if (depth->mask) {
		mask = memdup_user(depth->mask, count);
		if (IS_ERR(mask)) {
			ret = PTR_ERR(mask);
			goto out_free_values;
		}
	}

	for (i = 0; i < count; i++) {
		/* Without a mask every entry is written. */
		if (mask && !mask[i])
			continue;

		BEGIN_RING(6);

		OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
		OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
			 R128_GMC_BRUSH_SOLID_COLOR |
			 (dev_priv->depth_fmt << 8) |
			 R128_GMC_SRC_DATATYPE_COLOR |
			 R128_ROP3_P |
			 R128_GMC_CLR_CMP_CNTL_DIS |
			 R128_GMC_WR_MSK_DIS);

		OUT_RING(dev_priv->depth_pitch_offset_c);
		OUT_RING(values[i]);

		OUT_RING((x[i] << 16) | y[i]);
		OUT_RING((1 << 16) | 1);

		ADVANCE_RING();
	}

	/* mask is NULL when none was supplied; kfree() accepts that. */
	kfree(mask);
	ret = 0;

out_free_values:
	kfree(values);
out_free_y:
	kfree(y);
out_free_x:
	kfree(x);
	return ret;
}
1064 
/*
 * Queue a blit that copies a run of depth->n pixels, one row high, from
 * the depth buffer at the (x, y) position read from user space to
 * position (0, 0) of the span buffer.
 *
 * Returns 0 on success, -EMSGSIZE when n is outside 1..4096, or -EFAULT
 * when the start coordinates cannot be copied from user space.
 */
static int r128_cce_dispatch_read_span(struct drm_device *dev,
				       drm_r128_depth_t *depth)
{
	drm_r128_private_t *dev_priv = dev->dev_private;
	int npixels, src_x, src_y;
	RING_LOCALS;
	DRM_DEBUG("\n");

	npixels = depth->n;
	if (npixels <= 0 || npixels > 4096)
		return -EMSGSIZE;

	if (copy_from_user(&src_x, depth->x, sizeof(src_x)))
		return -EFAULT;
	if (copy_from_user(&src_y, depth->y, sizeof(src_y)))
		return -EFAULT;

	BEGIN_RING(7);

	OUT_RING(CCE_PACKET3(R128_CNTL_BITBLT_MULTI, 5));
	OUT_RING(R128_GMC_SRC_PITCH_OFFSET_CNTL |
		 R128_GMC_DST_PITCH_OFFSET_CNTL |
		 R128_GMC_BRUSH_NONE |
		 (dev_priv->depth_fmt << 8) |
		 R128_GMC_SRC_DATATYPE_COLOR |
		 R128_ROP3_S |
		 R128_DP_SRC_SOURCE_MEMORY |
		 R128_GMC_CLR_CMP_CNTL_DIS | R128_GMC_WR_MSK_DIS);

	/* Depth buffer word first, span buffer word second. */
	OUT_RING(dev_priv->depth_pitch_offset_c);
	OUT_RING(dev_priv->span_pitch_offset_c);

	/* Start position, (0, 0), then the npixels x 1 extent. */
	OUT_RING((src_x << 16) | src_y);
	OUT_RING((0 << 16) | 0);
	OUT_RING((npixels << 16) | 1);

	ADVANCE_RING();

	return 0;
}
1105 
/* Emit one 1x1 R128_CNTL_BITBLT_MULTI packet per requested pixel.
 *
 * depth->n is the number of pixels (1..4096, otherwise -EMSGSIZE); it is
 * then clamped to dev_priv->depth_pitch.  depth->x and depth->y are user
 * arrays holding one coordinate per pixel.  For pixel i the packet carries
 * (x[i] << 16) | y[i] followed by (i << 16) | 0.
 *
 * The coordinate arrays are duplicated with memdup_user(), matching the
 * write_pixels path, and released through a single unwind path.
 *
 * Returns 0 on success or a negative errno (-EMSGSIZE, or whatever
 * memdup_user() reports, i.e. -ENOMEM / -EFAULT).
 */
static int r128_cce_dispatch_read_pixels(struct drm_device *dev,
					 drm_r128_depth_t *depth)
{
	drm_r128_private_t *dev_priv = dev->dev_private;
	int count, *x, *y;
	int i, ret = 0;
	RING_LOCALS;
	DRM_DEBUG("\n");

	count = depth->n;
	if (count > 4096 || count <= 0)
		return -EMSGSIZE;

	if (count > dev_priv->depth_pitch)
		count = dev_priv->depth_pitch;

	/* count is at most 4096 here, so the size products cannot overflow. */
	x = memdup_user(depth->x, count * sizeof(*x));
	if (IS_ERR(x))
		return PTR_ERR(x);

	y = memdup_user(depth->y, count * sizeof(*y));
	if (IS_ERR(y)) {
		ret = PTR_ERR(y);
		goto out_free_x;
	}

	for (i = 0; i < count; i++) {
		BEGIN_RING(7);

		OUT_RING(CCE_PACKET3(R128_CNTL_BITBLT_MULTI, 5));
		OUT_RING(R128_GMC_SRC_PITCH_OFFSET_CNTL |
			 R128_GMC_DST_PITCH_OFFSET_CNTL |
			 R128_GMC_BRUSH_NONE |
			 (dev_priv->depth_fmt << 8) |
			 R128_GMC_SRC_DATATYPE_COLOR |
			 R128_ROP3_S |
			 R128_DP_SRC_SOURCE_MEMORY |
			 R128_GMC_CLR_CMP_CNTL_DIS | R128_GMC_WR_MSK_DIS);

		OUT_RING(dev_priv->depth_pitch_offset_c);
		OUT_RING(dev_priv->span_pitch_offset_c);

		OUT_RING((x[i] << 16) | y[i]);
		OUT_RING((i << 16) | 0);
		OUT_RING((1 << 16) | 1);

		ADVANCE_RING();
	}

	kfree(y);
out_free_x:
	kfree(x);

	return ret;
}
1171 
1172 /* ================================================================
1173  * Polygon stipple
1174  */
1175 
/* Queue a CCE_PACKET0 header for R128_BRUSH_DATA0 followed by the 32
 * dwords found in stipple[].
 */
static void r128_cce_dispatch_stipple(struct drm_device *dev, u32 *stipple)
{
	drm_r128_private_t *dev_priv = dev->dev_private;
	int word;
	RING_LOCALS;
	DRM_DEBUG("\n");

	/* One header dword plus 32 pattern dwords. */
	BEGIN_RING(33);

	OUT_RING(CCE_PACKET0(R128_BRUSH_DATA0, 31));

	word = 0;
	while (word < 32) {
		OUT_RING(stipple[word]);
		word++;
	}

	ADVANCE_RING();
}
1191 
1192 /* ================================================================
1193  * IOCTL functions
1194  */
1195 
r128_cce_clear(struct drm_device * dev,void * data,struct drm_file * file_priv)1196 static int r128_cce_clear(struct drm_device *dev, void *data, struct drm_file *file_priv)
1197 {
1198 	drm_r128_private_t *dev_priv = dev->dev_private;
1199 	drm_r128_sarea_t *sarea_priv;
1200 	drm_r128_clear_t *clear = data;
1201 	DRM_DEBUG("\n");
1202 
1203 	LOCK_TEST_WITH_RETURN(dev, file_priv);
1204 
1205 	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1206 
1207 	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1208 
1209 	sarea_priv = dev_priv->sarea_priv;
1210 
1211 	if (sarea_priv->nbox > R128_NR_SAREA_CLIPRECTS)
1212 		sarea_priv->nbox = R128_NR_SAREA_CLIPRECTS;
1213 
1214 	r128_cce_dispatch_clear(dev, clear);
1215 	COMMIT_RING();
1216 
1217 	/* Make sure we restore the 3D state next time.
1218 	 */
1219 	dev_priv->sarea_priv->dirty |= R128_UPLOAD_CONTEXT | R128_UPLOAD_MASKS;
1220 
1221 	return 0;
1222 }
1223 
r128_do_init_pageflip(struct drm_device * dev)1224 static int r128_do_init_pageflip(struct drm_device *dev)
1225 {
1226 	drm_r128_private_t *dev_priv = dev->dev_private;
1227 	DRM_DEBUG("\n");
1228 
1229 	dev_priv->crtc_offset = R128_READ(R128_CRTC_OFFSET);
1230 	dev_priv->crtc_offset_cntl = R128_READ(R128_CRTC_OFFSET_CNTL);
1231 
1232 	R128_WRITE(R128_CRTC_OFFSET, dev_priv->front_offset);
1233 	R128_WRITE(R128_CRTC_OFFSET_CNTL,
1234 		   dev_priv->crtc_offset_cntl | R128_CRTC_OFFSET_FLIP_CNTL);
1235 
1236 	dev_priv->page_flipping = 1;
1237 	dev_priv->current_page = 0;
1238 	dev_priv->sarea_priv->pfCurrentPage = dev_priv->current_page;
1239 
1240 	return 0;
1241 }
1242 
r128_do_cleanup_pageflip(struct drm_device * dev)1243 static int r128_do_cleanup_pageflip(struct drm_device *dev)
1244 {
1245 	drm_r128_private_t *dev_priv = dev->dev_private;
1246 	DRM_DEBUG("\n");
1247 
1248 	R128_WRITE(R128_CRTC_OFFSET, dev_priv->crtc_offset);
1249 	R128_WRITE(R128_CRTC_OFFSET_CNTL, dev_priv->crtc_offset_cntl);
1250 
1251 	if (dev_priv->current_page != 0) {
1252 		r128_cce_dispatch_flip(dev);
1253 		COMMIT_RING();
1254 	}
1255 
1256 	dev_priv->page_flipping = 0;
1257 	return 0;
1258 }
1259 
/* Swapping and flipping are different operations and need different ioctls.
 * They can and should be intermixed to support multiple 3D windows.
 */
1263 
r128_cce_flip(struct drm_device * dev,void * data,struct drm_file * file_priv)1264 static int r128_cce_flip(struct drm_device *dev, void *data, struct drm_file *file_priv)
1265 {
1266 	drm_r128_private_t *dev_priv = dev->dev_private;
1267 	DRM_DEBUG("\n");
1268 
1269 	LOCK_TEST_WITH_RETURN(dev, file_priv);
1270 
1271 	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1272 
1273 	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1274 
1275 	if (!dev_priv->page_flipping)
1276 		r128_do_init_pageflip(dev);
1277 
1278 	r128_cce_dispatch_flip(dev);
1279 
1280 	COMMIT_RING();
1281 	return 0;
1282 }
1283 
r128_cce_swap(struct drm_device * dev,void * data,struct drm_file * file_priv)1284 static int r128_cce_swap(struct drm_device *dev, void *data, struct drm_file *file_priv)
1285 {
1286 	drm_r128_private_t *dev_priv = dev->dev_private;
1287 	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
1288 	DRM_DEBUG("\n");
1289 
1290 	LOCK_TEST_WITH_RETURN(dev, file_priv);
1291 
1292 	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1293 
1294 	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1295 
1296 	if (sarea_priv->nbox > R128_NR_SAREA_CLIPRECTS)
1297 		sarea_priv->nbox = R128_NR_SAREA_CLIPRECTS;
1298 
1299 	r128_cce_dispatch_swap(dev);
1300 	dev_priv->sarea_priv->dirty |= (R128_UPLOAD_CONTEXT |
1301 					R128_UPLOAD_MASKS);
1302 
1303 	COMMIT_RING();
1304 	return 0;
1305 }
1306 
r128_cce_vertex(struct drm_device * dev,void * data,struct drm_file * file_priv)1307 static int r128_cce_vertex(struct drm_device *dev, void *data, struct drm_file *file_priv)
1308 {
1309 	drm_r128_private_t *dev_priv = dev->dev_private;
1310 	struct drm_device_dma *dma = dev->dma;
1311 	struct drm_buf *buf;
1312 	drm_r128_buf_priv_t *buf_priv;
1313 	drm_r128_vertex_t *vertex = data;
1314 
1315 	LOCK_TEST_WITH_RETURN(dev, file_priv);
1316 
1317 	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1318 
1319 	DRM_DEBUG("pid=%d index=%d count=%d discard=%d\n",
1320 		  DRM_CURRENTPID, vertex->idx, vertex->count, vertex->discard);
1321 
1322 	if (vertex->idx < 0 || vertex->idx >= dma->buf_count) {
1323 		DRM_ERROR("buffer index %d (of %d max)\n",
1324 			  vertex->idx, dma->buf_count - 1);
1325 		return -EINVAL;
1326 	}
1327 	if (vertex->prim < 0 ||
1328 	    vertex->prim > R128_CCE_VC_CNTL_PRIM_TYPE_TRI_TYPE2) {
1329 		DRM_ERROR("buffer prim %d\n", vertex->prim);
1330 		return -EINVAL;
1331 	}
1332 
1333 	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1334 	VB_AGE_TEST_WITH_RETURN(dev_priv);
1335 
1336 	buf = dma->buflist[vertex->idx];
1337 	buf_priv = buf->dev_private;
1338 
1339 	if (buf->file_priv != file_priv) {
1340 		DRM_ERROR("process %d using buffer owned by %p\n",
1341 			  DRM_CURRENTPID, buf->file_priv);
1342 		return -EINVAL;
1343 	}
1344 	if (buf->pending) {
1345 		DRM_ERROR("sending pending buffer %d\n", vertex->idx);
1346 		return -EINVAL;
1347 	}
1348 
1349 	buf->used = vertex->count;
1350 	buf_priv->prim = vertex->prim;
1351 	buf_priv->discard = vertex->discard;
1352 
1353 	r128_cce_dispatch_vertex(dev, buf);
1354 
1355 	COMMIT_RING();
1356 	return 0;
1357 }
1358 
r128_cce_indices(struct drm_device * dev,void * data,struct drm_file * file_priv)1359 static int r128_cce_indices(struct drm_device *dev, void *data, struct drm_file *file_priv)
1360 {
1361 	drm_r128_private_t *dev_priv = dev->dev_private;
1362 	struct drm_device_dma *dma = dev->dma;
1363 	struct drm_buf *buf;
1364 	drm_r128_buf_priv_t *buf_priv;
1365 	drm_r128_indices_t *elts = data;
1366 	int count;
1367 
1368 	LOCK_TEST_WITH_RETURN(dev, file_priv);
1369 
1370 	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1371 
1372 	DRM_DEBUG("pid=%d buf=%d s=%d e=%d d=%d\n", DRM_CURRENTPID,
1373 		  elts->idx, elts->start, elts->end, elts->discard);
1374 
1375 	if (elts->idx < 0 || elts->idx >= dma->buf_count) {
1376 		DRM_ERROR("buffer index %d (of %d max)\n",
1377 			  elts->idx, dma->buf_count - 1);
1378 		return -EINVAL;
1379 	}
1380 	if (elts->prim < 0 ||
1381 	    elts->prim > R128_CCE_VC_CNTL_PRIM_TYPE_TRI_TYPE2) {
1382 		DRM_ERROR("buffer prim %d\n", elts->prim);
1383 		return -EINVAL;
1384 	}
1385 
1386 	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1387 	VB_AGE_TEST_WITH_RETURN(dev_priv);
1388 
1389 	buf = dma->buflist[elts->idx];
1390 	buf_priv = buf->dev_private;
1391 
1392 	if (buf->file_priv != file_priv) {
1393 		DRM_ERROR("process %d using buffer owned by %p\n",
1394 			  DRM_CURRENTPID, buf->file_priv);
1395 		return -EINVAL;
1396 	}
1397 	if (buf->pending) {
1398 		DRM_ERROR("sending pending buffer %d\n", elts->idx);
1399 		return -EINVAL;
1400 	}
1401 
1402 	count = (elts->end - elts->start) / sizeof(u16);
1403 	elts->start -= R128_INDEX_PRIM_OFFSET;
1404 
1405 	if (elts->start & 0x7) {
1406 		DRM_ERROR("misaligned buffer 0x%x\n", elts->start);
1407 		return -EINVAL;
1408 	}
1409 	if (elts->start < buf->used) {
1410 		DRM_ERROR("no header 0x%x - 0x%x\n", elts->start, buf->used);
1411 		return -EINVAL;
1412 	}
1413 
1414 	buf->used = elts->end;
1415 	buf_priv->prim = elts->prim;
1416 	buf_priv->discard = elts->discard;
1417 
1418 	r128_cce_dispatch_indices(dev, buf, elts->start, elts->end, count);
1419 
1420 	COMMIT_RING();
1421 	return 0;
1422 }
1423 
r128_cce_blit(struct drm_device * dev,void * data,struct drm_file * file_priv)1424 static int r128_cce_blit(struct drm_device *dev, void *data, struct drm_file *file_priv)
1425 {
1426 	struct drm_device_dma *dma = dev->dma;
1427 	drm_r128_private_t *dev_priv = dev->dev_private;
1428 	drm_r128_blit_t *blit = data;
1429 	int ret;
1430 
1431 	LOCK_TEST_WITH_RETURN(dev, file_priv);
1432 
1433 	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1434 
1435 	DRM_DEBUG("pid=%d index=%d\n", DRM_CURRENTPID, blit->idx);
1436 
1437 	if (blit->idx < 0 || blit->idx >= dma->buf_count) {
1438 		DRM_ERROR("buffer index %d (of %d max)\n",
1439 			  blit->idx, dma->buf_count - 1);
1440 		return -EINVAL;
1441 	}
1442 
1443 	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1444 	VB_AGE_TEST_WITH_RETURN(dev_priv);
1445 
1446 	ret = r128_cce_dispatch_blit(dev, file_priv, blit);
1447 
1448 	COMMIT_RING();
1449 	return ret;
1450 }
1451 
r128_cce_depth(struct drm_device * dev,void * data,struct drm_file * file_priv)1452 int r128_cce_depth(struct drm_device *dev, void *data, struct drm_file *file_priv)
1453 {
1454 	drm_r128_private_t *dev_priv = dev->dev_private;
1455 	drm_r128_depth_t *depth = data;
1456 	int ret;
1457 
1458 	LOCK_TEST_WITH_RETURN(dev, file_priv);
1459 
1460 	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1461 
1462 	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1463 
1464 	ret = -EINVAL;
1465 	switch (depth->func) {
1466 	case R128_WRITE_SPAN:
1467 		ret = r128_cce_dispatch_write_span(dev, depth);
1468 		break;
1469 	case R128_WRITE_PIXELS:
1470 		ret = r128_cce_dispatch_write_pixels(dev, depth);
1471 		break;
1472 	case R128_READ_SPAN:
1473 		ret = r128_cce_dispatch_read_span(dev, depth);
1474 		break;
1475 	case R128_READ_PIXELS:
1476 		ret = r128_cce_dispatch_read_pixels(dev, depth);
1477 		break;
1478 	}
1479 
1480 	COMMIT_RING();
1481 	return ret;
1482 }
1483 
r128_cce_stipple(struct drm_device * dev,void * data,struct drm_file * file_priv)1484 int r128_cce_stipple(struct drm_device *dev, void *data, struct drm_file *file_priv)
1485 {
1486 	drm_r128_private_t *dev_priv = dev->dev_private;
1487 	drm_r128_stipple_t *stipple = data;
1488 	u32 mask[32];
1489 
1490 	LOCK_TEST_WITH_RETURN(dev, file_priv);
1491 
1492 	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1493 
1494 	if (copy_from_user(&mask, stipple->mask, 32 * sizeof(u32)))
1495 		return -EFAULT;
1496 
1497 	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1498 
1499 	r128_cce_dispatch_stipple(dev, mask);
1500 
1501 	COMMIT_RING();
1502 	return 0;
1503 }
1504 
r128_cce_indirect(struct drm_device * dev,void * data,struct drm_file * file_priv)1505 static int r128_cce_indirect(struct drm_device *dev, void *data, struct drm_file *file_priv)
1506 {
1507 	drm_r128_private_t *dev_priv = dev->dev_private;
1508 	struct drm_device_dma *dma = dev->dma;
1509 	struct drm_buf *buf;
1510 	drm_r128_buf_priv_t *buf_priv;
1511 	drm_r128_indirect_t *indirect = data;
1512 #if 0
1513 	RING_LOCALS;
1514 #endif
1515 
1516 	LOCK_TEST_WITH_RETURN(dev, file_priv);
1517 
1518 	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1519 
1520 	DRM_DEBUG("idx=%d s=%d e=%d d=%d\n",
1521 		  indirect->idx, indirect->start, indirect->end,
1522 		  indirect->discard);
1523 
1524 	if (indirect->idx < 0 || indirect->idx >= dma->buf_count) {
1525 		DRM_ERROR("buffer index %d (of %d max)\n",
1526 			  indirect->idx, dma->buf_count - 1);
1527 		return -EINVAL;
1528 	}
1529 
1530 	buf = dma->buflist[indirect->idx];
1531 	buf_priv = buf->dev_private;
1532 
1533 	if (buf->file_priv != file_priv) {
1534 		DRM_ERROR("process %d using buffer owned by %p\n",
1535 			  DRM_CURRENTPID, buf->file_priv);
1536 		return -EINVAL;
1537 	}
1538 	if (buf->pending) {
1539 		DRM_ERROR("sending pending buffer %d\n", indirect->idx);
1540 		return -EINVAL;
1541 	}
1542 
1543 	if (indirect->start < buf->used) {
1544 		DRM_ERROR("reusing indirect: start=0x%x actual=0x%x\n",
1545 			  indirect->start, buf->used);
1546 		return -EINVAL;
1547 	}
1548 
1549 	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1550 	VB_AGE_TEST_WITH_RETURN(dev_priv);
1551 
1552 	buf->used = indirect->end;
1553 	buf_priv->discard = indirect->discard;
1554 
1555 #if 0
1556 	/* Wait for the 3D stream to idle before the indirect buffer
1557 	 * containing 2D acceleration commands is processed.
1558 	 */
1559 	BEGIN_RING(2);
1560 	RADEON_WAIT_UNTIL_3D_IDLE();
1561 	ADVANCE_RING();
1562 #endif
1563 
1564 	/* Dispatch the indirect buffer full of commands from the
1565 	 * X server.  This is insecure and is thus only available to
1566 	 * privileged clients.
1567 	 */
1568 	r128_cce_dispatch_indirect(dev, buf, indirect->start, indirect->end);
1569 
1570 	COMMIT_RING();
1571 	return 0;
1572 }
1573 
r128_getparam(struct drm_device * dev,void * data,struct drm_file * file_priv)1574 int r128_getparam(struct drm_device *dev, void *data, struct drm_file *file_priv)
1575 {
1576 	drm_r128_private_t *dev_priv = dev->dev_private;
1577 	drm_r128_getparam_t *param = data;
1578 	int value;
1579 
1580 	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1581 
1582 	DRM_DEBUG("pid=%d\n", DRM_CURRENTPID);
1583 
1584 	switch (param->param) {
1585 	case R128_PARAM_IRQ_NR:
1586 		value = dev->pdev->irq;
1587 		break;
1588 	default:
1589 		return -EINVAL;
1590 	}
1591 
1592 	if (copy_to_user(param->value, &value, sizeof(int))) {
1593 		DRM_ERROR("copy_to_user\n");
1594 		return -EFAULT;
1595 	}
1596 
1597 	return 0;
1598 }
1599 
r128_driver_preclose(struct drm_device * dev,struct drm_file * file_priv)1600 void r128_driver_preclose(struct drm_device *dev, struct drm_file *file_priv)
1601 {
1602 	if (dev->dev_private) {
1603 		drm_r128_private_t *dev_priv = dev->dev_private;
1604 		if (dev_priv->page_flipping)
1605 			r128_do_cleanup_pageflip(dev);
1606 	}
1607 }
/* Lastclose hook: delegates to r128_do_cleanup_cce() for this device. */
void r128_driver_lastclose(struct drm_device *dev)
{
	r128_do_cleanup_cce(dev);
}
1612 
/* Driver ioctl table.  Each DRM_IOCTL_DEF_DRV() entry names an R128 ioctl,
 * the function that handles it and the access flags it is registered with.
 * Handlers that do not appear in this part of the file (r128_cce_init,
 * r128_cce_start, r128_cce_stop, r128_cce_reset, r128_cce_idle,
 * r128_engine_reset, r128_fullscreen) are defined elsewhere.
 *
 * NOTE(review): the entries carrying DRM_MASTER|DRM_ROOT_ONLY are presumably
 * the privileged ones (r128_cce_indirect describes itself as available only
 * to privileged clients) -- confirm against the DRM core flag definitions.
 */
const struct drm_ioctl_desc r128_ioctls[] = {
	DRM_IOCTL_DEF_DRV(R128_INIT, r128_cce_init, DRM_AUTH|DRM_MASTER|DRM_ROOT_ONLY),
	DRM_IOCTL_DEF_DRV(R128_CCE_START, r128_cce_start, DRM_AUTH|DRM_MASTER|DRM_ROOT_ONLY),
	DRM_IOCTL_DEF_DRV(R128_CCE_STOP, r128_cce_stop, DRM_AUTH|DRM_MASTER|DRM_ROOT_ONLY),
	DRM_IOCTL_DEF_DRV(R128_CCE_RESET, r128_cce_reset, DRM_AUTH|DRM_MASTER|DRM_ROOT_ONLY),
	DRM_IOCTL_DEF_DRV(R128_CCE_IDLE, r128_cce_idle, DRM_AUTH),
	DRM_IOCTL_DEF_DRV(R128_RESET, r128_engine_reset, DRM_AUTH),
	DRM_IOCTL_DEF_DRV(R128_FULLSCREEN, r128_fullscreen, DRM_AUTH),
	DRM_IOCTL_DEF_DRV(R128_SWAP, r128_cce_swap, DRM_AUTH),
	DRM_IOCTL_DEF_DRV(R128_FLIP, r128_cce_flip, DRM_AUTH),
	DRM_IOCTL_DEF_DRV(R128_CLEAR, r128_cce_clear, DRM_AUTH),
	DRM_IOCTL_DEF_DRV(R128_VERTEX, r128_cce_vertex, DRM_AUTH),
	DRM_IOCTL_DEF_DRV(R128_INDICES, r128_cce_indices, DRM_AUTH),
	DRM_IOCTL_DEF_DRV(R128_BLIT, r128_cce_blit, DRM_AUTH),
	DRM_IOCTL_DEF_DRV(R128_DEPTH, r128_cce_depth, DRM_AUTH),
	DRM_IOCTL_DEF_DRV(R128_STIPPLE, r128_cce_stipple, DRM_AUTH),
	DRM_IOCTL_DEF_DRV(R128_INDIRECT, r128_cce_indirect, DRM_AUTH|DRM_MASTER|DRM_ROOT_ONLY),
	DRM_IOCTL_DEF_DRV(R128_GETPARAM, r128_getparam, DRM_AUTH),
};
1632 
/* Number of entries in r128_ioctls[]. */
int r128_max_ioctl = ARRAY_SIZE(r128_ioctls);
1634