r128_state.c revision 1.1
1/* r128_state.c -- State support for r128 -*- linux-c -*-
2 * Created: Thu Jan 27 02:53:43 2000 by gareth@valinux.com
3 */
4/*
5 * Copyright 2000 VA Linux Systems, Inc., Sunnyvale, California.
6 * All Rights Reserved.
7 *
8 * Permission is hereby granted, free of charge, to any person obtaining a
9 * copy of this software and associated documentation files (the "Software"),
10 * to deal in the Software without restriction, including without limitation
11 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
12 * and/or sell copies of the Software, and to permit persons to whom the
13 * Software is furnished to do so, subject to the following conditions:
14 *
15 * The above copyright notice and this permission notice (including the next
16 * paragraph) shall be included in all copies or substantial portions of the
17 * Software.
18 *
19 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
20 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
21 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
22 * PRECISION INSIGHT AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
23 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
24 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
25 * DEALINGS IN THE SOFTWARE.
26 *
27 * Authors:
28 *    Gareth Hughes <gareth@valinux.com>
29 */
30
31#include <drm/drmP.h>
32#include <drm/r128_drm.h>
33#include "r128_drv.h"
34
35/* ================================================================
36 * CCE hardware state programming functions
37 */
38
39static void r128_emit_clip_rects(drm_r128_private_t *dev_priv,
40				 struct drm_clip_rect *boxes, int count)
41{
42	u32 aux_sc_cntl = 0x00000000;
43	RING_LOCALS;
44	DRM_DEBUG("\n");
45
46	BEGIN_RING((count < 3 ? count : 3) * 5 + 2);
47
48	if (count >= 1) {
49		OUT_RING(CCE_PACKET0(R128_AUX1_SC_LEFT, 3));
50		OUT_RING(boxes[0].x1);
51		OUT_RING(boxes[0].x2 - 1);
52		OUT_RING(boxes[0].y1);
53		OUT_RING(boxes[0].y2 - 1);
54
55		aux_sc_cntl |= (R128_AUX1_SC_EN | R128_AUX1_SC_MODE_OR);
56	}
57	if (count >= 2) {
58		OUT_RING(CCE_PACKET0(R128_AUX2_SC_LEFT, 3));
59		OUT_RING(boxes[1].x1);
60		OUT_RING(boxes[1].x2 - 1);
61		OUT_RING(boxes[1].y1);
62		OUT_RING(boxes[1].y2 - 1);
63
64		aux_sc_cntl |= (R128_AUX2_SC_EN | R128_AUX2_SC_MODE_OR);
65	}
66	if (count >= 3) {
67		OUT_RING(CCE_PACKET0(R128_AUX3_SC_LEFT, 3));
68		OUT_RING(boxes[2].x1);
69		OUT_RING(boxes[2].x2 - 1);
70		OUT_RING(boxes[2].y1);
71		OUT_RING(boxes[2].y2 - 1);
72
73		aux_sc_cntl |= (R128_AUX3_SC_EN | R128_AUX3_SC_MODE_OR);
74	}
75
76	OUT_RING(CCE_PACKET0(R128_AUX_SC_CNTL, 0));
77	OUT_RING(aux_sc_cntl);
78
79	ADVANCE_RING();
80}
81
82static __inline__ void r128_emit_core(drm_r128_private_t *dev_priv)
83{
84	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
85	drm_r128_context_regs_t *ctx = &sarea_priv->context_state;
86	RING_LOCALS;
87	DRM_DEBUG("\n");
88
89	BEGIN_RING(2);
90
91	OUT_RING(CCE_PACKET0(R128_SCALE_3D_CNTL, 0));
92	OUT_RING(ctx->scale_3d_cntl);
93
94	ADVANCE_RING();
95}
96
97static __inline__ void r128_emit_context(drm_r128_private_t *dev_priv)
98{
99	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
100	drm_r128_context_regs_t *ctx = &sarea_priv->context_state;
101	RING_LOCALS;
102	DRM_DEBUG("\n");
103
104	BEGIN_RING(13);
105
106	OUT_RING(CCE_PACKET0(R128_DST_PITCH_OFFSET_C, 11));
107	OUT_RING(ctx->dst_pitch_offset_c);
108	OUT_RING(ctx->dp_gui_master_cntl_c);
109	OUT_RING(ctx->sc_top_left_c);
110	OUT_RING(ctx->sc_bottom_right_c);
111	OUT_RING(ctx->z_offset_c);
112	OUT_RING(ctx->z_pitch_c);
113	OUT_RING(ctx->z_sten_cntl_c);
114	OUT_RING(ctx->tex_cntl_c);
115	OUT_RING(ctx->misc_3d_state_cntl_reg);
116	OUT_RING(ctx->texture_clr_cmp_clr_c);
117	OUT_RING(ctx->texture_clr_cmp_msk_c);
118	OUT_RING(ctx->fog_color_c);
119
120	ADVANCE_RING();
121}
122
123static __inline__ void r128_emit_setup(drm_r128_private_t *dev_priv)
124{
125	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
126	drm_r128_context_regs_t *ctx = &sarea_priv->context_state;
127	RING_LOCALS;
128	DRM_DEBUG("\n");
129
130	BEGIN_RING(3);
131
132	OUT_RING(CCE_PACKET1(R128_SETUP_CNTL, R128_PM4_VC_FPU_SETUP));
133	OUT_RING(ctx->setup_cntl);
134	OUT_RING(ctx->pm4_vc_fpu_setup);
135
136	ADVANCE_RING();
137}
138
139static __inline__ void r128_emit_masks(drm_r128_private_t *dev_priv)
140{
141	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
142	drm_r128_context_regs_t *ctx = &sarea_priv->context_state;
143	RING_LOCALS;
144	DRM_DEBUG("\n");
145
146	BEGIN_RING(5);
147
148	OUT_RING(CCE_PACKET0(R128_DP_WRITE_MASK, 0));
149	OUT_RING(ctx->dp_write_mask);
150
151	OUT_RING(CCE_PACKET0(R128_STEN_REF_MASK_C, 1));
152	OUT_RING(ctx->sten_ref_mask_c);
153	OUT_RING(ctx->plane_3d_mask_c);
154
155	ADVANCE_RING();
156}
157
158static __inline__ void r128_emit_window(drm_r128_private_t *dev_priv)
159{
160	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
161	drm_r128_context_regs_t *ctx = &sarea_priv->context_state;
162	RING_LOCALS;
163	DRM_DEBUG("\n");
164
165	BEGIN_RING(2);
166
167	OUT_RING(CCE_PACKET0(R128_WINDOW_XY_OFFSET, 0));
168	OUT_RING(ctx->window_xy_offset);
169
170	ADVANCE_RING();
171}
172
173static __inline__ void r128_emit_tex0(drm_r128_private_t *dev_priv)
174{
175	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
176	drm_r128_context_regs_t *ctx = &sarea_priv->context_state;
177	drm_r128_texture_regs_t *tex = &sarea_priv->tex_state[0];
178	int i;
179	RING_LOCALS;
180	DRM_DEBUG("\n");
181
182	BEGIN_RING(7 + R128_MAX_TEXTURE_LEVELS);
183
184	OUT_RING(CCE_PACKET0(R128_PRIM_TEX_CNTL_C,
185			     2 + R128_MAX_TEXTURE_LEVELS));
186	OUT_RING(tex->tex_cntl);
187	OUT_RING(tex->tex_combine_cntl);
188	OUT_RING(ctx->tex_size_pitch_c);
189	for (i = 0; i < R128_MAX_TEXTURE_LEVELS; i++)
190		OUT_RING(tex->tex_offset[i]);
191
192	OUT_RING(CCE_PACKET0(R128_CONSTANT_COLOR_C, 1));
193	OUT_RING(ctx->constant_color_c);
194	OUT_RING(tex->tex_border_color);
195
196	ADVANCE_RING();
197}
198
199static __inline__ void r128_emit_tex1(drm_r128_private_t *dev_priv)
200{
201	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
202	drm_r128_texture_regs_t *tex = &sarea_priv->tex_state[1];
203	int i;
204	RING_LOCALS;
205	DRM_DEBUG("\n");
206
207	BEGIN_RING(5 + R128_MAX_TEXTURE_LEVELS);
208
209	OUT_RING(CCE_PACKET0(R128_SEC_TEX_CNTL_C, 1 + R128_MAX_TEXTURE_LEVELS));
210	OUT_RING(tex->tex_cntl);
211	OUT_RING(tex->tex_combine_cntl);
212	for (i = 0; i < R128_MAX_TEXTURE_LEVELS; i++)
213		OUT_RING(tex->tex_offset[i]);
214
215	OUT_RING(CCE_PACKET0(R128_SEC_TEXTURE_BORDER_COLOR_C, 0));
216	OUT_RING(tex->tex_border_color);
217
218	ADVANCE_RING();
219}
220
221static void r128_emit_state(drm_r128_private_t *dev_priv)
222{
223	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
224	unsigned int dirty = sarea_priv->dirty;
225
226	DRM_DEBUG("dirty=0x%08x\n", dirty);
227
228	if (dirty & R128_UPLOAD_CORE) {
229		r128_emit_core(dev_priv);
230		sarea_priv->dirty &= ~R128_UPLOAD_CORE;
231	}
232
233	if (dirty & R128_UPLOAD_CONTEXT) {
234		r128_emit_context(dev_priv);
235		sarea_priv->dirty &= ~R128_UPLOAD_CONTEXT;
236	}
237
238	if (dirty & R128_UPLOAD_SETUP) {
239		r128_emit_setup(dev_priv);
240		sarea_priv->dirty &= ~R128_UPLOAD_SETUP;
241	}
242
243	if (dirty & R128_UPLOAD_MASKS) {
244		r128_emit_masks(dev_priv);
245		sarea_priv->dirty &= ~R128_UPLOAD_MASKS;
246	}
247
248	if (dirty & R128_UPLOAD_WINDOW) {
249		r128_emit_window(dev_priv);
250		sarea_priv->dirty &= ~R128_UPLOAD_WINDOW;
251	}
252
253	if (dirty & R128_UPLOAD_TEX0) {
254		r128_emit_tex0(dev_priv);
255		sarea_priv->dirty &= ~R128_UPLOAD_TEX0;
256	}
257
258	if (dirty & R128_UPLOAD_TEX1) {
259		r128_emit_tex1(dev_priv);
260		sarea_priv->dirty &= ~R128_UPLOAD_TEX1;
261	}
262
263	/* Turn off the texture cache flushing */
264	sarea_priv->context_state.tex_cntl_c &= ~R128_TEX_CACHE_FLUSH;
265
266	sarea_priv->dirty &= ~R128_REQUIRE_QUIESCENCE;
267}
268
269#if R128_PERFORMANCE_BOXES
270/* ================================================================
271 * Performance monitoring functions
272 */
273
274static void r128_clear_box(drm_r128_private_t *dev_priv,
275			   int x, int y, int w, int h, int r, int g, int b)
276{
277	u32 pitch, offset;
278	u32 fb_bpp, color;
279	RING_LOCALS;
280
281	switch (dev_priv->fb_bpp) {
282	case 16:
283		fb_bpp = R128_GMC_DST_16BPP;
284		color = (((r & 0xf8) << 8) |
285			 ((g & 0xfc) << 3) | ((b & 0xf8) >> 3));
286		break;
287	case 24:
288		fb_bpp = R128_GMC_DST_24BPP;
289		color = ((r << 16) | (g << 8) | b);
290		break;
291	case 32:
292		fb_bpp = R128_GMC_DST_32BPP;
293		color = (((0xff) << 24) | (r << 16) | (g << 8) | b);
294		break;
295	default:
296		return;
297	}
298
299	offset = dev_priv->back_offset;
300	pitch = dev_priv->back_pitch >> 3;
301
302	BEGIN_RING(6);
303
304	OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
305	OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
306		 R128_GMC_BRUSH_SOLID_COLOR |
307		 fb_bpp |
308		 R128_GMC_SRC_DATATYPE_COLOR |
309		 R128_ROP3_P |
310		 R128_GMC_CLR_CMP_CNTL_DIS | R128_GMC_AUX_CLIP_DIS);
311
312	OUT_RING((pitch << 21) | (offset >> 5));
313	OUT_RING(color);
314
315	OUT_RING((x << 16) | y);
316	OUT_RING((w << 16) | h);
317
318	ADVANCE_RING();
319}
320
321static void r128_cce_performance_boxes(drm_r128_private_t *dev_priv)
322{
323	if (atomic_read(&dev_priv->idle_count) == 0)
324		r128_clear_box(dev_priv, 64, 4, 8, 8, 0, 255, 0);
325	else
326		atomic_set(&dev_priv->idle_count, 0);
327}
328
329#endif
330
331/* ================================================================
332 * CCE command dispatch functions
333 */
334
335static void r128_print_dirty(const char *msg, unsigned int flags)
336{
337	DRM_INFO("%s: (0x%x) %s%s%s%s%s%s%s%s%s\n",
338		 msg,
339		 flags,
340		 (flags & R128_UPLOAD_CORE) ? "core, " : "",
341		 (flags & R128_UPLOAD_CONTEXT) ? "context, " : "",
342		 (flags & R128_UPLOAD_SETUP) ? "setup, " : "",
343		 (flags & R128_UPLOAD_TEX0) ? "tex0, " : "",
344		 (flags & R128_UPLOAD_TEX1) ? "tex1, " : "",
345		 (flags & R128_UPLOAD_MASKS) ? "masks, " : "",
346		 (flags & R128_UPLOAD_WINDOW) ? "window, " : "",
347		 (flags & R128_UPLOAD_CLIPRECTS) ? "cliprects, " : "",
348		 (flags & R128_REQUIRE_QUIESCENCE) ? "quiescence, " : "");
349}
350
351static void r128_cce_dispatch_clear(struct drm_device *dev,
352				    drm_r128_clear_t *clear)
353{
354	drm_r128_private_t *dev_priv = dev->dev_private;
355	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
356	int nbox = sarea_priv->nbox;
357	struct drm_clip_rect *pbox = sarea_priv->boxes;
358	unsigned int flags = clear->flags;
359	int i;
360	RING_LOCALS;
361	DRM_DEBUG("\n");
362
363	if (dev_priv->page_flipping && dev_priv->current_page == 1) {
364		unsigned int tmp = flags;
365
366		flags &= ~(R128_FRONT | R128_BACK);
367		if (tmp & R128_FRONT)
368			flags |= R128_BACK;
369		if (tmp & R128_BACK)
370			flags |= R128_FRONT;
371	}
372
373	for (i = 0; i < nbox; i++) {
374		int x = pbox[i].x1;
375		int y = pbox[i].y1;
376		int w = pbox[i].x2 - x;
377		int h = pbox[i].y2 - y;
378
379		DRM_DEBUG("dispatch clear %d,%d-%d,%d flags 0x%x\n",
380			  pbox[i].x1, pbox[i].y1, pbox[i].x2,
381			  pbox[i].y2, flags);
382
383		if (flags & (R128_FRONT | R128_BACK)) {
384			BEGIN_RING(2);
385
386			OUT_RING(CCE_PACKET0(R128_DP_WRITE_MASK, 0));
387			OUT_RING(clear->color_mask);
388
389			ADVANCE_RING();
390		}
391
392		if (flags & R128_FRONT) {
393			BEGIN_RING(6);
394
395			OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
396			OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
397				 R128_GMC_BRUSH_SOLID_COLOR |
398				 (dev_priv->color_fmt << 8) |
399				 R128_GMC_SRC_DATATYPE_COLOR |
400				 R128_ROP3_P |
401				 R128_GMC_CLR_CMP_CNTL_DIS |
402				 R128_GMC_AUX_CLIP_DIS);
403
404			OUT_RING(dev_priv->front_pitch_offset_c);
405			OUT_RING(clear->clear_color);
406
407			OUT_RING((x << 16) | y);
408			OUT_RING((w << 16) | h);
409
410			ADVANCE_RING();
411		}
412
413		if (flags & R128_BACK) {
414			BEGIN_RING(6);
415
416			OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
417			OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
418				 R128_GMC_BRUSH_SOLID_COLOR |
419				 (dev_priv->color_fmt << 8) |
420				 R128_GMC_SRC_DATATYPE_COLOR |
421				 R128_ROP3_P |
422				 R128_GMC_CLR_CMP_CNTL_DIS |
423				 R128_GMC_AUX_CLIP_DIS);
424
425			OUT_RING(dev_priv->back_pitch_offset_c);
426			OUT_RING(clear->clear_color);
427
428			OUT_RING((x << 16) | y);
429			OUT_RING((w << 16) | h);
430
431			ADVANCE_RING();
432		}
433
434		if (flags & R128_DEPTH) {
435			BEGIN_RING(6);
436
437			OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
438			OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
439				 R128_GMC_BRUSH_SOLID_COLOR |
440				 (dev_priv->depth_fmt << 8) |
441				 R128_GMC_SRC_DATATYPE_COLOR |
442				 R128_ROP3_P |
443				 R128_GMC_CLR_CMP_CNTL_DIS |
444				 R128_GMC_AUX_CLIP_DIS | R128_GMC_WR_MSK_DIS);
445
446			OUT_RING(dev_priv->depth_pitch_offset_c);
447			OUT_RING(clear->clear_depth);
448
449			OUT_RING((x << 16) | y);
450			OUT_RING((w << 16) | h);
451
452			ADVANCE_RING();
453		}
454	}
455}
456
457static void r128_cce_dispatch_swap(struct drm_device *dev)
458{
459	drm_r128_private_t *dev_priv = dev->dev_private;
460	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
461	int nbox = sarea_priv->nbox;
462	struct drm_clip_rect *pbox = sarea_priv->boxes;
463	int i;
464	RING_LOCALS;
465	DRM_DEBUG("\n");
466
467#if R128_PERFORMANCE_BOXES
468	/* Do some trivial performance monitoring...
469	 */
470	r128_cce_performance_boxes(dev_priv);
471#endif
472
473	for (i = 0; i < nbox; i++) {
474		int x = pbox[i].x1;
475		int y = pbox[i].y1;
476		int w = pbox[i].x2 - x;
477		int h = pbox[i].y2 - y;
478
479		BEGIN_RING(7);
480
481		OUT_RING(CCE_PACKET3(R128_CNTL_BITBLT_MULTI, 5));
482		OUT_RING(R128_GMC_SRC_PITCH_OFFSET_CNTL |
483			 R128_GMC_DST_PITCH_OFFSET_CNTL |
484			 R128_GMC_BRUSH_NONE |
485			 (dev_priv->color_fmt << 8) |
486			 R128_GMC_SRC_DATATYPE_COLOR |
487			 R128_ROP3_S |
488			 R128_DP_SRC_SOURCE_MEMORY |
489			 R128_GMC_CLR_CMP_CNTL_DIS |
490			 R128_GMC_AUX_CLIP_DIS | R128_GMC_WR_MSK_DIS);
491
492		/* Make this work even if front & back are flipped:
493		 */
494		if (dev_priv->current_page == 0) {
495			OUT_RING(dev_priv->back_pitch_offset_c);
496			OUT_RING(dev_priv->front_pitch_offset_c);
497		} else {
498			OUT_RING(dev_priv->front_pitch_offset_c);
499			OUT_RING(dev_priv->back_pitch_offset_c);
500		}
501
502		OUT_RING((x << 16) | y);
503		OUT_RING((x << 16) | y);
504		OUT_RING((w << 16) | h);
505
506		ADVANCE_RING();
507	}
508
509	/* Increment the frame counter.  The client-side 3D driver must
510	 * throttle the framerate by waiting for this value before
511	 * performing the swapbuffer ioctl.
512	 */
513	dev_priv->sarea_priv->last_frame++;
514
515	BEGIN_RING(2);
516
517	OUT_RING(CCE_PACKET0(R128_LAST_FRAME_REG, 0));
518	OUT_RING(dev_priv->sarea_priv->last_frame);
519
520	ADVANCE_RING();
521}
522
523static void r128_cce_dispatch_flip(struct drm_device *dev)
524{
525	drm_r128_private_t *dev_priv = dev->dev_private;
526	RING_LOCALS;
527	DRM_DEBUG("page=%d pfCurrentPage=%d\n",
528		  dev_priv->current_page, dev_priv->sarea_priv->pfCurrentPage);
529
530#if R128_PERFORMANCE_BOXES
531	/* Do some trivial performance monitoring...
532	 */
533	r128_cce_performance_boxes(dev_priv);
534#endif
535
536	BEGIN_RING(4);
537
538	R128_WAIT_UNTIL_PAGE_FLIPPED();
539	OUT_RING(CCE_PACKET0(R128_CRTC_OFFSET, 0));
540
541	if (dev_priv->current_page == 0)
542		OUT_RING(dev_priv->back_offset);
543	else
544		OUT_RING(dev_priv->front_offset);
545
546	ADVANCE_RING();
547
548	/* Increment the frame counter.  The client-side 3D driver must
549	 * throttle the framerate by waiting for this value before
550	 * performing the swapbuffer ioctl.
551	 */
552	dev_priv->sarea_priv->last_frame++;
553	dev_priv->sarea_priv->pfCurrentPage = dev_priv->current_page =
554	    1 - dev_priv->current_page;
555
556	BEGIN_RING(2);
557
558	OUT_RING(CCE_PACKET0(R128_LAST_FRAME_REG, 0));
559	OUT_RING(dev_priv->sarea_priv->last_frame);
560
561	ADVANCE_RING();
562}
563
564static void r128_cce_dispatch_vertex(struct drm_device *dev, struct drm_buf *buf)
565{
566	drm_r128_private_t *dev_priv = dev->dev_private;
567	drm_r128_buf_priv_t *buf_priv = buf->dev_private;
568	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
569	int format = sarea_priv->vc_format;
570	int offset = buf->bus_address;
571	int size = buf->used;
572	int prim = buf_priv->prim;
573	int i = 0;
574	RING_LOCALS;
575	DRM_DEBUG("buf=%d nbox=%d\n", buf->idx, sarea_priv->nbox);
576
577	if (0)
578		r128_print_dirty("dispatch_vertex", sarea_priv->dirty);
579
580	if (buf->used) {
581		buf_priv->dispatched = 1;
582
583		if (sarea_priv->dirty & ~R128_UPLOAD_CLIPRECTS)
584			r128_emit_state(dev_priv);
585
586		do {
587			/* Emit the next set of up to three cliprects */
588			if (i < sarea_priv->nbox) {
589				r128_emit_clip_rects(dev_priv,
590						     &sarea_priv->boxes[i],
591						     sarea_priv->nbox - i);
592			}
593
594			/* Emit the vertex buffer rendering commands */
595			BEGIN_RING(5);
596
597			OUT_RING(CCE_PACKET3(R128_3D_RNDR_GEN_INDX_PRIM, 3));
598			OUT_RING(offset);
599			OUT_RING(size);
600			OUT_RING(format);
601			OUT_RING(prim | R128_CCE_VC_CNTL_PRIM_WALK_LIST |
602				 (size << R128_CCE_VC_CNTL_NUM_SHIFT));
603
604			ADVANCE_RING();
605
606			i += 3;
607		} while (i < sarea_priv->nbox);
608	}
609
610	if (buf_priv->discard) {
611		buf_priv->age = dev_priv->sarea_priv->last_dispatch;
612
613		/* Emit the vertex buffer age */
614		BEGIN_RING(2);
615
616		OUT_RING(CCE_PACKET0(R128_LAST_DISPATCH_REG, 0));
617		OUT_RING(buf_priv->age);
618
619		ADVANCE_RING();
620
621		buf->pending = 1;
622		buf->used = 0;
623		/* FIXME: Check dispatched field */
624		buf_priv->dispatched = 0;
625	}
626
627	dev_priv->sarea_priv->last_dispatch++;
628
629	sarea_priv->dirty &= ~R128_UPLOAD_CLIPRECTS;
630	sarea_priv->nbox = 0;
631}
632
633static void r128_cce_dispatch_indirect(struct drm_device *dev,
634				       struct drm_buf *buf, int start, int end)
635{
636	drm_r128_private_t *dev_priv = dev->dev_private;
637	drm_r128_buf_priv_t *buf_priv = buf->dev_private;
638	RING_LOCALS;
639	DRM_DEBUG("indirect: buf=%d s=0x%x e=0x%x\n", buf->idx, start, end);
640
641	if (start != end) {
642		int offset = buf->bus_address + start;
643		int dwords = (end - start + 3) / sizeof(u32);
644
645		/* Indirect buffer data must be an even number of
646		 * dwords, so if we've been given an odd number we must
647		 * pad the data with a Type-2 CCE packet.
648		 */
649		if (dwords & 1) {
650			u32 *data = (u32 *)
651			    ((char *)dev->agp_buffer_map->handle
652			     + buf->offset + start);
653			data[dwords++] = cpu_to_le32(R128_CCE_PACKET2);
654		}
655
656		buf_priv->dispatched = 1;
657
658		/* Fire off the indirect buffer */
659		BEGIN_RING(3);
660
661		OUT_RING(CCE_PACKET0(R128_PM4_IW_INDOFF, 1));
662		OUT_RING(offset);
663		OUT_RING(dwords);
664
665		ADVANCE_RING();
666	}
667
668	if (buf_priv->discard) {
669		buf_priv->age = dev_priv->sarea_priv->last_dispatch;
670
671		/* Emit the indirect buffer age */
672		BEGIN_RING(2);
673
674		OUT_RING(CCE_PACKET0(R128_LAST_DISPATCH_REG, 0));
675		OUT_RING(buf_priv->age);
676
677		ADVANCE_RING();
678
679		buf->pending = 1;
680		buf->used = 0;
681		/* FIXME: Check dispatched field */
682		buf_priv->dispatched = 0;
683	}
684
685	dev_priv->sarea_priv->last_dispatch++;
686}
687
688static void r128_cce_dispatch_indices(struct drm_device *dev,
689				      struct drm_buf *buf,
690				      int start, int end, int count)
691{
692	drm_r128_private_t *dev_priv = dev->dev_private;
693	drm_r128_buf_priv_t *buf_priv = buf->dev_private;
694	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
695	int format = sarea_priv->vc_format;
696	int offset = dev->agp_buffer_map->offset - dev_priv->cce_buffers_offset;
697	int prim = buf_priv->prim;
698	u32 *data;
699	int dwords;
700	int i = 0;
701	RING_LOCALS;
702	DRM_DEBUG("indices: s=%d e=%d c=%d\n", start, end, count);
703
704	if (0)
705		r128_print_dirty("dispatch_indices", sarea_priv->dirty);
706
707	if (start != end) {
708		buf_priv->dispatched = 1;
709
710		if (sarea_priv->dirty & ~R128_UPLOAD_CLIPRECTS)
711			r128_emit_state(dev_priv);
712
713		dwords = (end - start + 3) / sizeof(u32);
714
715		data = (u32 *) ((char *)dev->agp_buffer_map->handle
716				+ buf->offset + start);
717
718		data[0] = cpu_to_le32(CCE_PACKET3(R128_3D_RNDR_GEN_INDX_PRIM,
719						  dwords - 2));
720
721		data[1] = cpu_to_le32(offset);
722		data[2] = cpu_to_le32(R128_MAX_VB_VERTS);
723		data[3] = cpu_to_le32(format);
724		data[4] = cpu_to_le32((prim | R128_CCE_VC_CNTL_PRIM_WALK_IND |
725				       (count << 16)));
726
727		if (count & 0x1) {
728#ifdef __LITTLE_ENDIAN
729			data[dwords - 1] &= 0x0000ffff;
730#else
731			data[dwords - 1] &= 0xffff0000;
732#endif
733		}
734
735		do {
736			/* Emit the next set of up to three cliprects */
737			if (i < sarea_priv->nbox) {
738				r128_emit_clip_rects(dev_priv,
739						     &sarea_priv->boxes[i],
740						     sarea_priv->nbox - i);
741			}
742
743			r128_cce_dispatch_indirect(dev, buf, start, end);
744
745			i += 3;
746		} while (i < sarea_priv->nbox);
747	}
748
749	if (buf_priv->discard) {
750		buf_priv->age = dev_priv->sarea_priv->last_dispatch;
751
752		/* Emit the vertex buffer age */
753		BEGIN_RING(2);
754
755		OUT_RING(CCE_PACKET0(R128_LAST_DISPATCH_REG, 0));
756		OUT_RING(buf_priv->age);
757
758		ADVANCE_RING();
759
760		buf->pending = 1;
761		/* FIXME: Check dispatched field */
762		buf_priv->dispatched = 0;
763	}
764
765	dev_priv->sarea_priv->last_dispatch++;
766
767	sarea_priv->dirty &= ~R128_UPLOAD_CLIPRECTS;
768	sarea_priv->nbox = 0;
769}
770
771static int r128_cce_dispatch_blit(struct drm_device *dev,
772				  struct drm_file *file_priv,
773				  drm_r128_blit_t *blit)
774{
775	drm_r128_private_t *dev_priv = dev->dev_private;
776	struct drm_device_dma *dma = dev->dma;
777	struct drm_buf *buf;
778	drm_r128_buf_priv_t *buf_priv;
779	u32 *data;
780	int dword_shift, dwords;
781	RING_LOCALS;
782	DRM_DEBUG("\n");
783
784	/* The compiler won't optimize away a division by a variable,
785	 * even if the only legal values are powers of two.  Thus, we'll
786	 * use a shift instead.
787	 */
788	switch (blit->format) {
789	case R128_DATATYPE_ARGB8888:
790		dword_shift = 0;
791		break;
792	case R128_DATATYPE_ARGB1555:
793	case R128_DATATYPE_RGB565:
794	case R128_DATATYPE_ARGB4444:
795	case R128_DATATYPE_YVYU422:
796	case R128_DATATYPE_VYUY422:
797		dword_shift = 1;
798		break;
799	case R128_DATATYPE_CI8:
800	case R128_DATATYPE_RGB8:
801		dword_shift = 2;
802		break;
803	default:
804		DRM_ERROR("invalid blit format %d\n", blit->format);
805		return -EINVAL;
806	}
807
808	/* Flush the pixel cache, and mark the contents as Read Invalid.
809	 * This ensures no pixel data gets mixed up with the texture
810	 * data from the host data blit, otherwise part of the texture
811	 * image may be corrupted.
812	 */
813	BEGIN_RING(2);
814
815	OUT_RING(CCE_PACKET0(R128_PC_GUI_CTLSTAT, 0));
816	OUT_RING(R128_PC_RI_GUI | R128_PC_FLUSH_GUI);
817
818	ADVANCE_RING();
819
820	/* Dispatch the indirect buffer.
821	 */
822	buf = dma->buflist[blit->idx];
823	buf_priv = buf->dev_private;
824
825	if (buf->file_priv != file_priv) {
826		DRM_ERROR("process %d using buffer owned by %p\n",
827			  DRM_CURRENTPID, buf->file_priv);
828		return -EINVAL;
829	}
830	if (buf->pending) {
831		DRM_ERROR("sending pending buffer %d\n", blit->idx);
832		return -EINVAL;
833	}
834
835	buf_priv->discard = 1;
836
837	dwords = (blit->width * blit->height) >> dword_shift;
838
839	data = (u32 *) ((char *)dev->agp_buffer_map->handle + buf->offset);
840
841	data[0] = cpu_to_le32(CCE_PACKET3(R128_CNTL_HOSTDATA_BLT, dwords + 6));
842	data[1] = cpu_to_le32((R128_GMC_DST_PITCH_OFFSET_CNTL |
843			       R128_GMC_BRUSH_NONE |
844			       (blit->format << 8) |
845			       R128_GMC_SRC_DATATYPE_COLOR |
846			       R128_ROP3_S |
847			       R128_DP_SRC_SOURCE_HOST_DATA |
848			       R128_GMC_CLR_CMP_CNTL_DIS |
849			       R128_GMC_AUX_CLIP_DIS | R128_GMC_WR_MSK_DIS));
850
851	data[2] = cpu_to_le32((blit->pitch << 21) | (blit->offset >> 5));
852	data[3] = cpu_to_le32(0xffffffff);
853	data[4] = cpu_to_le32(0xffffffff);
854	data[5] = cpu_to_le32((blit->y << 16) | blit->x);
855	data[6] = cpu_to_le32((blit->height << 16) | blit->width);
856	data[7] = cpu_to_le32(dwords);
857
858	buf->used = (dwords + 8) * sizeof(u32);
859
860	r128_cce_dispatch_indirect(dev, buf, 0, buf->used);
861
862	/* Flush the pixel cache after the blit completes.  This ensures
863	 * the texture data is written out to memory before rendering
864	 * continues.
865	 */
866	BEGIN_RING(2);
867
868	OUT_RING(CCE_PACKET0(R128_PC_GUI_CTLSTAT, 0));
869	OUT_RING(R128_PC_FLUSH_GUI);
870
871	ADVANCE_RING();
872
873	return 0;
874}
875
876/* ================================================================
877 * Tiled depth buffer management
878 *
879 * FIXME: These should all set the destination write mask for when we
880 * have hardware stencil support.
881 */
882
883static int r128_cce_dispatch_write_span(struct drm_device *dev,
884					drm_r128_depth_t *depth)
885{
886	drm_r128_private_t *dev_priv = dev->dev_private;
887	int count, x, y;
888	u32 *buffer;
889	u8 *mask;
890	int i, buffer_size, mask_size;
891	RING_LOCALS;
892	DRM_DEBUG("\n");
893
894	count = depth->n;
895	if (count > 4096 || count <= 0)
896		return -EMSGSIZE;
897
898	if (DRM_COPY_FROM_USER(&x, depth->x, sizeof(x)))
899		return -EFAULT;
900	if (DRM_COPY_FROM_USER(&y, depth->y, sizeof(y)))
901		return -EFAULT;
902
903	buffer_size = depth->n * sizeof(u32);
904	buffer = kmalloc(buffer_size, GFP_KERNEL);
905	if (buffer == NULL)
906		return -ENOMEM;
907	if (DRM_COPY_FROM_USER(buffer, depth->buffer, buffer_size)) {
908		kfree(buffer);
909		return -EFAULT;
910	}
911
912	mask_size = depth->n * sizeof(u8);
913	if (depth->mask) {
914		mask = kmalloc(mask_size, GFP_KERNEL);
915		if (mask == NULL) {
916			kfree(buffer);
917			return -ENOMEM;
918		}
919		if (DRM_COPY_FROM_USER(mask, depth->mask, mask_size)) {
920			kfree(buffer);
921			kfree(mask);
922			return -EFAULT;
923		}
924
925		for (i = 0; i < count; i++, x++) {
926			if (mask[i]) {
927				BEGIN_RING(6);
928
929				OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
930				OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
931					 R128_GMC_BRUSH_SOLID_COLOR |
932					 (dev_priv->depth_fmt << 8) |
933					 R128_GMC_SRC_DATATYPE_COLOR |
934					 R128_ROP3_P |
935					 R128_GMC_CLR_CMP_CNTL_DIS |
936					 R128_GMC_WR_MSK_DIS);
937
938				OUT_RING(dev_priv->depth_pitch_offset_c);
939				OUT_RING(buffer[i]);
940
941				OUT_RING((x << 16) | y);
942				OUT_RING((1 << 16) | 1);
943
944				ADVANCE_RING();
945			}
946		}
947
948		kfree(mask);
949	} else {
950		for (i = 0; i < count; i++, x++) {
951			BEGIN_RING(6);
952
953			OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
954			OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
955				 R128_GMC_BRUSH_SOLID_COLOR |
956				 (dev_priv->depth_fmt << 8) |
957				 R128_GMC_SRC_DATATYPE_COLOR |
958				 R128_ROP3_P |
959				 R128_GMC_CLR_CMP_CNTL_DIS |
960				 R128_GMC_WR_MSK_DIS);
961
962			OUT_RING(dev_priv->depth_pitch_offset_c);
963			OUT_RING(buffer[i]);
964
965			OUT_RING((x << 16) | y);
966			OUT_RING((1 << 16) | 1);
967
968			ADVANCE_RING();
969		}
970	}
971
972	kfree(buffer);
973
974	return 0;
975}
976
977static int r128_cce_dispatch_write_pixels(struct drm_device *dev,
978					  drm_r128_depth_t *depth)
979{
980	drm_r128_private_t *dev_priv = dev->dev_private;
981	int count, *x, *y;
982	u32 *buffer;
983	u8 *mask;
984	int i, xbuf_size, ybuf_size, buffer_size, mask_size;
985	RING_LOCALS;
986	DRM_DEBUG("\n");
987
988	count = depth->n;
989	if (count > 4096 || count <= 0)
990		return -EMSGSIZE;
991
992	xbuf_size = count * sizeof(*x);
993	ybuf_size = count * sizeof(*y);
994	x = kmalloc(xbuf_size, GFP_KERNEL);
995	if (x == NULL)
996		return -ENOMEM;
997	y = kmalloc(ybuf_size, GFP_KERNEL);
998	if (y == NULL) {
999		kfree(x);
1000		return -ENOMEM;
1001	}
1002	if (DRM_COPY_FROM_USER(x, depth->x, xbuf_size)) {
1003		kfree(x);
1004		kfree(y);
1005		return -EFAULT;
1006	}
1007	if (DRM_COPY_FROM_USER(y, depth->y, xbuf_size)) {
1008		kfree(x);
1009		kfree(y);
1010		return -EFAULT;
1011	}
1012
1013	buffer_size = depth->n * sizeof(u32);
1014	buffer = kmalloc(buffer_size, GFP_KERNEL);
1015	if (buffer == NULL) {
1016		kfree(x);
1017		kfree(y);
1018		return -ENOMEM;
1019	}
1020	if (DRM_COPY_FROM_USER(buffer, depth->buffer, buffer_size)) {
1021		kfree(x);
1022		kfree(y);
1023		kfree(buffer);
1024		return -EFAULT;
1025	}
1026
1027	if (depth->mask) {
1028		mask_size = depth->n * sizeof(u8);
1029		mask = kmalloc(mask_size, GFP_KERNEL);
1030		if (mask == NULL) {
1031			kfree(x);
1032			kfree(y);
1033			kfree(buffer);
1034			return -ENOMEM;
1035		}
1036		if (DRM_COPY_FROM_USER(mask, depth->mask, mask_size)) {
1037			kfree(x);
1038			kfree(y);
1039			kfree(buffer);
1040			kfree(mask);
1041			return -EFAULT;
1042		}
1043
1044		for (i = 0; i < count; i++) {
1045			if (mask[i]) {
1046				BEGIN_RING(6);
1047
1048				OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
1049				OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
1050					 R128_GMC_BRUSH_SOLID_COLOR |
1051					 (dev_priv->depth_fmt << 8) |
1052					 R128_GMC_SRC_DATATYPE_COLOR |
1053					 R128_ROP3_P |
1054					 R128_GMC_CLR_CMP_CNTL_DIS |
1055					 R128_GMC_WR_MSK_DIS);
1056
1057				OUT_RING(dev_priv->depth_pitch_offset_c);
1058				OUT_RING(buffer[i]);
1059
1060				OUT_RING((x[i] << 16) | y[i]);
1061				OUT_RING((1 << 16) | 1);
1062
1063				ADVANCE_RING();
1064			}
1065		}
1066
1067		kfree(mask);
1068	} else {
1069		for (i = 0; i < count; i++) {
1070			BEGIN_RING(6);
1071
1072			OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
1073			OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
1074				 R128_GMC_BRUSH_SOLID_COLOR |
1075				 (dev_priv->depth_fmt << 8) |
1076				 R128_GMC_SRC_DATATYPE_COLOR |
1077				 R128_ROP3_P |
1078				 R128_GMC_CLR_CMP_CNTL_DIS |
1079				 R128_GMC_WR_MSK_DIS);
1080
1081			OUT_RING(dev_priv->depth_pitch_offset_c);
1082			OUT_RING(buffer[i]);
1083
1084			OUT_RING((x[i] << 16) | y[i]);
1085			OUT_RING((1 << 16) | 1);
1086
1087			ADVANCE_RING();
1088		}
1089	}
1090
1091	kfree(x);
1092	kfree(y);
1093	kfree(buffer);
1094
1095	return 0;
1096}
1097
1098static int r128_cce_dispatch_read_span(struct drm_device *dev,
1099				       drm_r128_depth_t *depth)
1100{
1101	drm_r128_private_t *dev_priv = dev->dev_private;
1102	int count, x, y;
1103	RING_LOCALS;
1104	DRM_DEBUG("\n");
1105
1106	count = depth->n;
1107	if (count > 4096 || count <= 0)
1108		return -EMSGSIZE;
1109
1110	if (DRM_COPY_FROM_USER(&x, depth->x, sizeof(x)))
1111		return -EFAULT;
1112	if (DRM_COPY_FROM_USER(&y, depth->y, sizeof(y)))
1113		return -EFAULT;
1114
1115	BEGIN_RING(7);
1116
1117	OUT_RING(CCE_PACKET3(R128_CNTL_BITBLT_MULTI, 5));
1118	OUT_RING(R128_GMC_SRC_PITCH_OFFSET_CNTL |
1119		 R128_GMC_DST_PITCH_OFFSET_CNTL |
1120		 R128_GMC_BRUSH_NONE |
1121		 (dev_priv->depth_fmt << 8) |
1122		 R128_GMC_SRC_DATATYPE_COLOR |
1123		 R128_ROP3_S |
1124		 R128_DP_SRC_SOURCE_MEMORY |
1125		 R128_GMC_CLR_CMP_CNTL_DIS | R128_GMC_WR_MSK_DIS);
1126
1127	OUT_RING(dev_priv->depth_pitch_offset_c);
1128	OUT_RING(dev_priv->span_pitch_offset_c);
1129
1130	OUT_RING((x << 16) | y);
1131	OUT_RING((0 << 16) | 0);
1132	OUT_RING((count << 16) | 1);
1133
1134	ADVANCE_RING();
1135
1136	return 0;
1137}
1138
1139static int r128_cce_dispatch_read_pixels(struct drm_device *dev,
1140					 drm_r128_depth_t *depth)
1141{
1142	drm_r128_private_t *dev_priv = dev->dev_private;
1143	int count, *x, *y;
1144	int i, xbuf_size, ybuf_size;
1145	RING_LOCALS;
1146	DRM_DEBUG("\n");
1147
1148	count = depth->n;
1149	if (count > 4096 || count <= 0)
1150		return -EMSGSIZE;
1151
1152	if (count > dev_priv->depth_pitch)
1153		count = dev_priv->depth_pitch;
1154
1155	xbuf_size = count * sizeof(*x);
1156	ybuf_size = count * sizeof(*y);
1157	x = kmalloc(xbuf_size, GFP_KERNEL);
1158	if (x == NULL)
1159		return -ENOMEM;
1160	y = kmalloc(ybuf_size, GFP_KERNEL);
1161	if (y == NULL) {
1162		kfree(x);
1163		return -ENOMEM;
1164	}
1165	if (DRM_COPY_FROM_USER(x, depth->x, xbuf_size)) {
1166		kfree(x);
1167		kfree(y);
1168		return -EFAULT;
1169	}
1170	if (DRM_COPY_FROM_USER(y, depth->y, ybuf_size)) {
1171		kfree(x);
1172		kfree(y);
1173		return -EFAULT;
1174	}
1175
1176	for (i = 0; i < count; i++) {
1177		BEGIN_RING(7);
1178
1179		OUT_RING(CCE_PACKET3(R128_CNTL_BITBLT_MULTI, 5));
1180		OUT_RING(R128_GMC_SRC_PITCH_OFFSET_CNTL |
1181			 R128_GMC_DST_PITCH_OFFSET_CNTL |
1182			 R128_GMC_BRUSH_NONE |
1183			 (dev_priv->depth_fmt << 8) |
1184			 R128_GMC_SRC_DATATYPE_COLOR |
1185			 R128_ROP3_S |
1186			 R128_DP_SRC_SOURCE_MEMORY |
1187			 R128_GMC_CLR_CMP_CNTL_DIS | R128_GMC_WR_MSK_DIS);
1188
1189		OUT_RING(dev_priv->depth_pitch_offset_c);
1190		OUT_RING(dev_priv->span_pitch_offset_c);
1191
1192		OUT_RING((x[i] << 16) | y[i]);
1193		OUT_RING((i << 16) | 0);
1194		OUT_RING((1 << 16) | 1);
1195
1196		ADVANCE_RING();
1197	}
1198
1199	kfree(x);
1200	kfree(y);
1201
1202	return 0;
1203}
1204
1205/* ================================================================
1206 * Polygon stipple
1207 */
1208
1209static void r128_cce_dispatch_stipple(struct drm_device *dev, u32 *stipple)
1210{
1211	drm_r128_private_t *dev_priv = dev->dev_private;
1212	int i;
1213	RING_LOCALS;
1214	DRM_DEBUG("\n");
1215
1216	BEGIN_RING(33);
1217
1218	OUT_RING(CCE_PACKET0(R128_BRUSH_DATA0, 31));
1219	for (i = 0; i < 32; i++)
1220		OUT_RING(stipple[i]);
1221
1222	ADVANCE_RING();
1223}
1224
1225/* ================================================================
1226 * IOCTL functions
1227 */
1228
1229static int r128_cce_clear(struct drm_device *dev, void *data, struct drm_file *file_priv)
1230{
1231	drm_r128_private_t *dev_priv = dev->dev_private;
1232	drm_r128_sarea_t *sarea_priv;
1233	drm_r128_clear_t *clear = data;
1234	DRM_DEBUG("\n");
1235
1236	LOCK_TEST_WITH_RETURN(dev, file_priv);
1237
1238	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1239
1240	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1241
1242	sarea_priv = dev_priv->sarea_priv;
1243
1244	if (sarea_priv->nbox > R128_NR_SAREA_CLIPRECTS)
1245		sarea_priv->nbox = R128_NR_SAREA_CLIPRECTS;
1246
1247	r128_cce_dispatch_clear(dev, clear);
1248	COMMIT_RING();
1249
1250	/* Make sure we restore the 3D state next time.
1251	 */
1252	dev_priv->sarea_priv->dirty |= R128_UPLOAD_CONTEXT | R128_UPLOAD_MASKS;
1253
1254	return 0;
1255}
1256
1257static int r128_do_init_pageflip(struct drm_device *dev)
1258{
1259	drm_r128_private_t *dev_priv = dev->dev_private;
1260	DRM_DEBUG("\n");
1261
1262	dev_priv->crtc_offset = R128_READ(R128_CRTC_OFFSET);
1263	dev_priv->crtc_offset_cntl = R128_READ(R128_CRTC_OFFSET_CNTL);
1264
1265	R128_WRITE(R128_CRTC_OFFSET, dev_priv->front_offset);
1266	R128_WRITE(R128_CRTC_OFFSET_CNTL,
1267		   dev_priv->crtc_offset_cntl | R128_CRTC_OFFSET_FLIP_CNTL);
1268
1269	dev_priv->page_flipping = 1;
1270	dev_priv->current_page = 0;
1271	dev_priv->sarea_priv->pfCurrentPage = dev_priv->current_page;
1272
1273	return 0;
1274}
1275
1276static int r128_do_cleanup_pageflip(struct drm_device *dev)
1277{
1278	drm_r128_private_t *dev_priv = dev->dev_private;
1279	DRM_DEBUG("\n");
1280
1281	R128_WRITE(R128_CRTC_OFFSET, dev_priv->crtc_offset);
1282	R128_WRITE(R128_CRTC_OFFSET_CNTL, dev_priv->crtc_offset_cntl);
1283
1284	if (dev_priv->current_page != 0) {
1285		r128_cce_dispatch_flip(dev);
1286		COMMIT_RING();
1287	}
1288
1289	dev_priv->page_flipping = 0;
1290	return 0;
1291}
1292
1293/* Swapping and flipping are different operations, need different ioctls.
1294 * They can & should be intermixed to support multiple 3d windows.
1295 */
1296
1297static int r128_cce_flip(struct drm_device *dev, void *data, struct drm_file *file_priv)
1298{
1299	drm_r128_private_t *dev_priv = dev->dev_private;
1300	DRM_DEBUG("\n");
1301
1302	LOCK_TEST_WITH_RETURN(dev, file_priv);
1303
1304	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1305
1306	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1307
1308	if (!dev_priv->page_flipping)
1309		r128_do_init_pageflip(dev);
1310
1311	r128_cce_dispatch_flip(dev);
1312
1313	COMMIT_RING();
1314	return 0;
1315}
1316
1317static int r128_cce_swap(struct drm_device *dev, void *data, struct drm_file *file_priv)
1318{
1319	drm_r128_private_t *dev_priv = dev->dev_private;
1320	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
1321	DRM_DEBUG("\n");
1322
1323	LOCK_TEST_WITH_RETURN(dev, file_priv);
1324
1325	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1326
1327	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1328
1329	if (sarea_priv->nbox > R128_NR_SAREA_CLIPRECTS)
1330		sarea_priv->nbox = R128_NR_SAREA_CLIPRECTS;
1331
1332	r128_cce_dispatch_swap(dev);
1333	dev_priv->sarea_priv->dirty |= (R128_UPLOAD_CONTEXT |
1334					R128_UPLOAD_MASKS);
1335
1336	COMMIT_RING();
1337	return 0;
1338}
1339
1340static int r128_cce_vertex(struct drm_device *dev, void *data, struct drm_file *file_priv)
1341{
1342	drm_r128_private_t *dev_priv = dev->dev_private;
1343	struct drm_device_dma *dma = dev->dma;
1344	struct drm_buf *buf;
1345	drm_r128_buf_priv_t *buf_priv;
1346	drm_r128_vertex_t *vertex = data;
1347
1348	LOCK_TEST_WITH_RETURN(dev, file_priv);
1349
1350	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1351
1352	DRM_DEBUG("pid=%d index=%d count=%d discard=%d\n",
1353		  DRM_CURRENTPID, vertex->idx, vertex->count, vertex->discard);
1354
1355	if (vertex->idx < 0 || vertex->idx >= dma->buf_count) {
1356		DRM_ERROR("buffer index %d (of %d max)\n",
1357			  vertex->idx, dma->buf_count - 1);
1358		return -EINVAL;
1359	}
1360	if (vertex->prim < 0 ||
1361	    vertex->prim > R128_CCE_VC_CNTL_PRIM_TYPE_TRI_TYPE2) {
1362		DRM_ERROR("buffer prim %d\n", vertex->prim);
1363		return -EINVAL;
1364	}
1365
1366	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1367	VB_AGE_TEST_WITH_RETURN(dev_priv);
1368
1369	buf = dma->buflist[vertex->idx];
1370	buf_priv = buf->dev_private;
1371
1372	if (buf->file_priv != file_priv) {
1373		DRM_ERROR("process %d using buffer owned by %p\n",
1374			  DRM_CURRENTPID, buf->file_priv);
1375		return -EINVAL;
1376	}
1377	if (buf->pending) {
1378		DRM_ERROR("sending pending buffer %d\n", vertex->idx);
1379		return -EINVAL;
1380	}
1381
1382	buf->used = vertex->count;
1383	buf_priv->prim = vertex->prim;
1384	buf_priv->discard = vertex->discard;
1385
1386	r128_cce_dispatch_vertex(dev, buf);
1387
1388	COMMIT_RING();
1389	return 0;
1390}
1391
1392static int r128_cce_indices(struct drm_device *dev, void *data, struct drm_file *file_priv)
1393{
1394	drm_r128_private_t *dev_priv = dev->dev_private;
1395	struct drm_device_dma *dma = dev->dma;
1396	struct drm_buf *buf;
1397	drm_r128_buf_priv_t *buf_priv;
1398	drm_r128_indices_t *elts = data;
1399	int count;
1400
1401	LOCK_TEST_WITH_RETURN(dev, file_priv);
1402
1403	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1404
1405	DRM_DEBUG("pid=%d buf=%d s=%d e=%d d=%d\n", DRM_CURRENTPID,
1406		  elts->idx, elts->start, elts->end, elts->discard);
1407
1408	if (elts->idx < 0 || elts->idx >= dma->buf_count) {
1409		DRM_ERROR("buffer index %d (of %d max)\n",
1410			  elts->idx, dma->buf_count - 1);
1411		return -EINVAL;
1412	}
1413	if (elts->prim < 0 ||
1414	    elts->prim > R128_CCE_VC_CNTL_PRIM_TYPE_TRI_TYPE2) {
1415		DRM_ERROR("buffer prim %d\n", elts->prim);
1416		return -EINVAL;
1417	}
1418
1419	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1420	VB_AGE_TEST_WITH_RETURN(dev_priv);
1421
1422	buf = dma->buflist[elts->idx];
1423	buf_priv = buf->dev_private;
1424
1425	if (buf->file_priv != file_priv) {
1426		DRM_ERROR("process %d using buffer owned by %p\n",
1427			  DRM_CURRENTPID, buf->file_priv);
1428		return -EINVAL;
1429	}
1430	if (buf->pending) {
1431		DRM_ERROR("sending pending buffer %d\n", elts->idx);
1432		return -EINVAL;
1433	}
1434
1435	count = (elts->end - elts->start) / sizeof(u16);
1436	elts->start -= R128_INDEX_PRIM_OFFSET;
1437
1438	if (elts->start & 0x7) {
1439		DRM_ERROR("misaligned buffer 0x%x\n", elts->start);
1440		return -EINVAL;
1441	}
1442	if (elts->start < buf->used) {
1443		DRM_ERROR("no header 0x%x - 0x%x\n", elts->start, buf->used);
1444		return -EINVAL;
1445	}
1446
1447	buf->used = elts->end;
1448	buf_priv->prim = elts->prim;
1449	buf_priv->discard = elts->discard;
1450
1451	r128_cce_dispatch_indices(dev, buf, elts->start, elts->end, count);
1452
1453	COMMIT_RING();
1454	return 0;
1455}
1456
1457static int r128_cce_blit(struct drm_device *dev, void *data, struct drm_file *file_priv)
1458{
1459	struct drm_device_dma *dma = dev->dma;
1460	drm_r128_private_t *dev_priv = dev->dev_private;
1461	drm_r128_blit_t *blit = data;
1462	int ret;
1463
1464	LOCK_TEST_WITH_RETURN(dev, file_priv);
1465
1466	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1467
1468	DRM_DEBUG("pid=%d index=%d\n", DRM_CURRENTPID, blit->idx);
1469
1470	if (blit->idx < 0 || blit->idx >= dma->buf_count) {
1471		DRM_ERROR("buffer index %d (of %d max)\n",
1472			  blit->idx, dma->buf_count - 1);
1473		return -EINVAL;
1474	}
1475
1476	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1477	VB_AGE_TEST_WITH_RETURN(dev_priv);
1478
1479	ret = r128_cce_dispatch_blit(dev, file_priv, blit);
1480
1481	COMMIT_RING();
1482	return ret;
1483}
1484
1485static int r128_cce_depth(struct drm_device *dev, void *data, struct drm_file *file_priv)
1486{
1487	drm_r128_private_t *dev_priv = dev->dev_private;
1488	drm_r128_depth_t *depth = data;
1489	int ret;
1490
1491	LOCK_TEST_WITH_RETURN(dev, file_priv);
1492
1493	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1494
1495	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1496
1497	ret = -EINVAL;
1498	switch (depth->func) {
1499	case R128_WRITE_SPAN:
1500		ret = r128_cce_dispatch_write_span(dev, depth);
1501		break;
1502	case R128_WRITE_PIXELS:
1503		ret = r128_cce_dispatch_write_pixels(dev, depth);
1504		break;
1505	case R128_READ_SPAN:
1506		ret = r128_cce_dispatch_read_span(dev, depth);
1507		break;
1508	case R128_READ_PIXELS:
1509		ret = r128_cce_dispatch_read_pixels(dev, depth);
1510		break;
1511	}
1512
1513	COMMIT_RING();
1514	return ret;
1515}
1516
1517static int r128_cce_stipple(struct drm_device *dev, void *data, struct drm_file *file_priv)
1518{
1519	drm_r128_private_t *dev_priv = dev->dev_private;
1520	drm_r128_stipple_t *stipple = data;
1521	u32 mask[32];
1522
1523	LOCK_TEST_WITH_RETURN(dev, file_priv);
1524
1525	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1526
1527	if (DRM_COPY_FROM_USER(&mask, stipple->mask, 32 * sizeof(u32)))
1528		return -EFAULT;
1529
1530	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1531
1532	r128_cce_dispatch_stipple(dev, mask);
1533
1534	COMMIT_RING();
1535	return 0;
1536}
1537
1538static int r128_cce_indirect(struct drm_device *dev, void *data, struct drm_file *file_priv)
1539{
1540	drm_r128_private_t *dev_priv = dev->dev_private;
1541	struct drm_device_dma *dma = dev->dma;
1542	struct drm_buf *buf;
1543	drm_r128_buf_priv_t *buf_priv;
1544	drm_r128_indirect_t *indirect = data;
1545#if 0
1546	RING_LOCALS;
1547#endif
1548
1549	LOCK_TEST_WITH_RETURN(dev, file_priv);
1550
1551	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1552
1553	DRM_DEBUG("idx=%d s=%d e=%d d=%d\n",
1554		  indirect->idx, indirect->start, indirect->end,
1555		  indirect->discard);
1556
1557	if (indirect->idx < 0 || indirect->idx >= dma->buf_count) {
1558		DRM_ERROR("buffer index %d (of %d max)\n",
1559			  indirect->idx, dma->buf_count - 1);
1560		return -EINVAL;
1561	}
1562
1563	buf = dma->buflist[indirect->idx];
1564	buf_priv = buf->dev_private;
1565
1566	if (buf->file_priv != file_priv) {
1567		DRM_ERROR("process %d using buffer owned by %p\n",
1568			  DRM_CURRENTPID, buf->file_priv);
1569		return -EINVAL;
1570	}
1571	if (buf->pending) {
1572		DRM_ERROR("sending pending buffer %d\n", indirect->idx);
1573		return -EINVAL;
1574	}
1575
1576	if (indirect->start < buf->used) {
1577		DRM_ERROR("reusing indirect: start=0x%x actual=0x%x\n",
1578			  indirect->start, buf->used);
1579		return -EINVAL;
1580	}
1581
1582	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1583	VB_AGE_TEST_WITH_RETURN(dev_priv);
1584
1585	buf->used = indirect->end;
1586	buf_priv->discard = indirect->discard;
1587
1588#if 0
1589	/* Wait for the 3D stream to idle before the indirect buffer
1590	 * containing 2D acceleration commands is processed.
1591	 */
1592	BEGIN_RING(2);
1593	RADEON_WAIT_UNTIL_3D_IDLE();
1594	ADVANCE_RING();
1595#endif
1596
1597	/* Dispatch the indirect buffer full of commands from the
1598	 * X server.  This is insecure and is thus only available to
1599	 * privileged clients.
1600	 */
1601	r128_cce_dispatch_indirect(dev, buf, indirect->start, indirect->end);
1602
1603	COMMIT_RING();
1604	return 0;
1605}
1606
1607static int r128_getparam(struct drm_device *dev, void *data, struct drm_file *file_priv)
1608{
1609	drm_r128_private_t *dev_priv = dev->dev_private;
1610	drm_r128_getparam_t *param = data;
1611	int value;
1612
1613	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1614
1615	DRM_DEBUG("pid=%d\n", DRM_CURRENTPID);
1616
1617	switch (param->param) {
1618	case R128_PARAM_IRQ_NR:
1619		value = drm_dev_to_irq(dev);
1620		break;
1621	default:
1622		return -EINVAL;
1623	}
1624
1625	if (DRM_COPY_TO_USER(param->value, &value, sizeof(int))) {
1626		DRM_ERROR("copy_to_user\n");
1627		return -EFAULT;
1628	}
1629
1630	return 0;
1631}
1632
1633void r128_driver_preclose(struct drm_device *dev, struct drm_file *file_priv)
1634{
1635	if (dev->dev_private) {
1636		drm_r128_private_t *dev_priv = dev->dev_private;
1637		if (dev_priv->page_flipping)
1638			r128_do_cleanup_pageflip(dev);
1639	}
1640}
1641void r128_driver_lastclose(struct drm_device *dev)
1642{
1643	r128_do_cleanup_cce(dev);
1644}
1645
1646struct drm_ioctl_desc r128_ioctls[] = {
1647	DRM_IOCTL_DEF_DRV(R128_INIT, r128_cce_init, DRM_AUTH|DRM_MASTER|DRM_ROOT_ONLY),
1648	DRM_IOCTL_DEF_DRV(R128_CCE_START, r128_cce_start, DRM_AUTH|DRM_MASTER|DRM_ROOT_ONLY),
1649	DRM_IOCTL_DEF_DRV(R128_CCE_STOP, r128_cce_stop, DRM_AUTH|DRM_MASTER|DRM_ROOT_ONLY),
1650	DRM_IOCTL_DEF_DRV(R128_CCE_RESET, r128_cce_reset, DRM_AUTH|DRM_MASTER|DRM_ROOT_ONLY),
1651	DRM_IOCTL_DEF_DRV(R128_CCE_IDLE, r128_cce_idle, DRM_AUTH),
1652	DRM_IOCTL_DEF_DRV(R128_RESET, r128_engine_reset, DRM_AUTH),
1653	DRM_IOCTL_DEF_DRV(R128_FULLSCREEN, r128_fullscreen, DRM_AUTH),
1654	DRM_IOCTL_DEF_DRV(R128_SWAP, r128_cce_swap, DRM_AUTH),
1655	DRM_IOCTL_DEF_DRV(R128_FLIP, r128_cce_flip, DRM_AUTH),
1656	DRM_IOCTL_DEF_DRV(R128_CLEAR, r128_cce_clear, DRM_AUTH),
1657	DRM_IOCTL_DEF_DRV(R128_VERTEX, r128_cce_vertex, DRM_AUTH),
1658	DRM_IOCTL_DEF_DRV(R128_INDICES, r128_cce_indices, DRM_AUTH),
1659	DRM_IOCTL_DEF_DRV(R128_BLIT, r128_cce_blit, DRM_AUTH),
1660	DRM_IOCTL_DEF_DRV(R128_DEPTH, r128_cce_depth, DRM_AUTH),
1661	DRM_IOCTL_DEF_DRV(R128_STIPPLE, r128_cce_stipple, DRM_AUTH),
1662	DRM_IOCTL_DEF_DRV(R128_INDIRECT, r128_cce_indirect, DRM_AUTH|DRM_MASTER|DRM_ROOT_ONLY),
1663	DRM_IOCTL_DEF_DRV(R128_GETPARAM, r128_getparam, DRM_AUTH),
1664};
1665
1666int r128_max_ioctl = DRM_ARRAY_SIZE(r128_ioctls);
1667