1/* r128_state.c -- State support for r128 -*- linux-c -*-
2 * Created: Thu Jan 27 02:53:43 2000 by gareth@valinux.com
3 */
4/*
5 * Copyright 2000 VA Linux Systems, Inc., Sunnyvale, California.
6 * All Rights Reserved.
7 *
8 * Permission is hereby granted, free of charge, to any person obtaining a
9 * copy of this software and associated documentation files (the "Software"),
10 * to deal in the Software without restriction, including without limitation
11 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
12 * and/or sell copies of the Software, and to permit persons to whom the
13 * Software is furnished to do so, subject to the following conditions:
14 *
15 * The above copyright notice and this permission notice (including the next
16 * paragraph) shall be included in all copies or substantial portions of the
17 * Software.
18 *
19 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
20 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
21 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
22 * PRECISION INSIGHT AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
23 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
24 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
25 * DEALINGS IN THE SOFTWARE.
26 *
27 * Authors:
28 *    Gareth Hughes <gareth@valinux.com>
29 */
30
31#include <linux/pci.h>
32#include <linux/slab.h>
33#include <linux/uaccess.h>
34
35#include <drm/drm_device.h>
36#include <drm/drm_file.h>
37#include <drm/drm_print.h>
38#include <drm/r128_drm.h>
39
40#include "r128_drv.h"
41
42/* ================================================================
43 * CCE hardware state programming functions
44 */
45
46static void r128_emit_clip_rects(drm_r128_private_t *dev_priv,
47				 struct drm_clip_rect *boxes, int count)
48{
49	u32 aux_sc_cntl = 0x00000000;
50	RING_LOCALS;
51	DRM_DEBUG("\n");
52
53	BEGIN_RING((count < 3 ? count : 3) * 5 + 2);
54
55	if (count >= 1) {
56		OUT_RING(CCE_PACKET0(R128_AUX1_SC_LEFT, 3));
57		OUT_RING(boxes[0].x1);
58		OUT_RING(boxes[0].x2 - 1);
59		OUT_RING(boxes[0].y1);
60		OUT_RING(boxes[0].y2 - 1);
61
62		aux_sc_cntl |= (R128_AUX1_SC_EN | R128_AUX1_SC_MODE_OR);
63	}
64	if (count >= 2) {
65		OUT_RING(CCE_PACKET0(R128_AUX2_SC_LEFT, 3));
66		OUT_RING(boxes[1].x1);
67		OUT_RING(boxes[1].x2 - 1);
68		OUT_RING(boxes[1].y1);
69		OUT_RING(boxes[1].y2 - 1);
70
71		aux_sc_cntl |= (R128_AUX2_SC_EN | R128_AUX2_SC_MODE_OR);
72	}
73	if (count >= 3) {
74		OUT_RING(CCE_PACKET0(R128_AUX3_SC_LEFT, 3));
75		OUT_RING(boxes[2].x1);
76		OUT_RING(boxes[2].x2 - 1);
77		OUT_RING(boxes[2].y1);
78		OUT_RING(boxes[2].y2 - 1);
79
80		aux_sc_cntl |= (R128_AUX3_SC_EN | R128_AUX3_SC_MODE_OR);
81	}
82
83	OUT_RING(CCE_PACKET0(R128_AUX_SC_CNTL, 0));
84	OUT_RING(aux_sc_cntl);
85
86	ADVANCE_RING();
87}
88
89static __inline__ void r128_emit_core(drm_r128_private_t *dev_priv)
90{
91	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
92	drm_r128_context_regs_t *ctx = &sarea_priv->context_state;
93	RING_LOCALS;
94	DRM_DEBUG("\n");
95
96	BEGIN_RING(2);
97
98	OUT_RING(CCE_PACKET0(R128_SCALE_3D_CNTL, 0));
99	OUT_RING(ctx->scale_3d_cntl);
100
101	ADVANCE_RING();
102}
103
104static __inline__ void r128_emit_context(drm_r128_private_t *dev_priv)
105{
106	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
107	drm_r128_context_regs_t *ctx = &sarea_priv->context_state;
108	RING_LOCALS;
109	DRM_DEBUG("\n");
110
111	BEGIN_RING(13);
112
113	OUT_RING(CCE_PACKET0(R128_DST_PITCH_OFFSET_C, 11));
114	OUT_RING(ctx->dst_pitch_offset_c);
115	OUT_RING(ctx->dp_gui_master_cntl_c);
116	OUT_RING(ctx->sc_top_left_c);
117	OUT_RING(ctx->sc_bottom_right_c);
118	OUT_RING(ctx->z_offset_c);
119	OUT_RING(ctx->z_pitch_c);
120	OUT_RING(ctx->z_sten_cntl_c);
121	OUT_RING(ctx->tex_cntl_c);
122	OUT_RING(ctx->misc_3d_state_cntl_reg);
123	OUT_RING(ctx->texture_clr_cmp_clr_c);
124	OUT_RING(ctx->texture_clr_cmp_msk_c);
125	OUT_RING(ctx->fog_color_c);
126
127	ADVANCE_RING();
128}
129
130static __inline__ void r128_emit_setup(drm_r128_private_t *dev_priv)
131{
132	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
133	drm_r128_context_regs_t *ctx = &sarea_priv->context_state;
134	RING_LOCALS;
135	DRM_DEBUG("\n");
136
137	BEGIN_RING(3);
138
139	OUT_RING(CCE_PACKET1(R128_SETUP_CNTL, R128_PM4_VC_FPU_SETUP));
140	OUT_RING(ctx->setup_cntl);
141	OUT_RING(ctx->pm4_vc_fpu_setup);
142
143	ADVANCE_RING();
144}
145
146static __inline__ void r128_emit_masks(drm_r128_private_t *dev_priv)
147{
148	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
149	drm_r128_context_regs_t *ctx = &sarea_priv->context_state;
150	RING_LOCALS;
151	DRM_DEBUG("\n");
152
153	BEGIN_RING(5);
154
155	OUT_RING(CCE_PACKET0(R128_DP_WRITE_MASK, 0));
156	OUT_RING(ctx->dp_write_mask);
157
158	OUT_RING(CCE_PACKET0(R128_STEN_REF_MASK_C, 1));
159	OUT_RING(ctx->sten_ref_mask_c);
160	OUT_RING(ctx->plane_3d_mask_c);
161
162	ADVANCE_RING();
163}
164
165static __inline__ void r128_emit_window(drm_r128_private_t *dev_priv)
166{
167	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
168	drm_r128_context_regs_t *ctx = &sarea_priv->context_state;
169	RING_LOCALS;
170	DRM_DEBUG("\n");
171
172	BEGIN_RING(2);
173
174	OUT_RING(CCE_PACKET0(R128_WINDOW_XY_OFFSET, 0));
175	OUT_RING(ctx->window_xy_offset);
176
177	ADVANCE_RING();
178}
179
180static __inline__ void r128_emit_tex0(drm_r128_private_t *dev_priv)
181{
182	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
183	drm_r128_context_regs_t *ctx = &sarea_priv->context_state;
184	drm_r128_texture_regs_t *tex = &sarea_priv->tex_state[0];
185	int i;
186	RING_LOCALS;
187	DRM_DEBUG("\n");
188
189	BEGIN_RING(7 + R128_MAX_TEXTURE_LEVELS);
190
191	OUT_RING(CCE_PACKET0(R128_PRIM_TEX_CNTL_C,
192			     2 + R128_MAX_TEXTURE_LEVELS));
193	OUT_RING(tex->tex_cntl);
194	OUT_RING(tex->tex_combine_cntl);
195	OUT_RING(ctx->tex_size_pitch_c);
196	for (i = 0; i < R128_MAX_TEXTURE_LEVELS; i++)
197		OUT_RING(tex->tex_offset[i]);
198
199	OUT_RING(CCE_PACKET0(R128_CONSTANT_COLOR_C, 1));
200	OUT_RING(ctx->constant_color_c);
201	OUT_RING(tex->tex_border_color);
202
203	ADVANCE_RING();
204}
205
206static __inline__ void r128_emit_tex1(drm_r128_private_t *dev_priv)
207{
208	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
209	drm_r128_texture_regs_t *tex = &sarea_priv->tex_state[1];
210	int i;
211	RING_LOCALS;
212	DRM_DEBUG("\n");
213
214	BEGIN_RING(5 + R128_MAX_TEXTURE_LEVELS);
215
216	OUT_RING(CCE_PACKET0(R128_SEC_TEX_CNTL_C, 1 + R128_MAX_TEXTURE_LEVELS));
217	OUT_RING(tex->tex_cntl);
218	OUT_RING(tex->tex_combine_cntl);
219	for (i = 0; i < R128_MAX_TEXTURE_LEVELS; i++)
220		OUT_RING(tex->tex_offset[i]);
221
222	OUT_RING(CCE_PACKET0(R128_SEC_TEXTURE_BORDER_COLOR_C, 0));
223	OUT_RING(tex->tex_border_color);
224
225	ADVANCE_RING();
226}
227
228static void r128_emit_state(drm_r128_private_t *dev_priv)
229{
230	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
231	unsigned int dirty = sarea_priv->dirty;
232
233	DRM_DEBUG("dirty=0x%08x\n", dirty);
234
235	if (dirty & R128_UPLOAD_CORE) {
236		r128_emit_core(dev_priv);
237		sarea_priv->dirty &= ~R128_UPLOAD_CORE;
238	}
239
240	if (dirty & R128_UPLOAD_CONTEXT) {
241		r128_emit_context(dev_priv);
242		sarea_priv->dirty &= ~R128_UPLOAD_CONTEXT;
243	}
244
245	if (dirty & R128_UPLOAD_SETUP) {
246		r128_emit_setup(dev_priv);
247		sarea_priv->dirty &= ~R128_UPLOAD_SETUP;
248	}
249
250	if (dirty & R128_UPLOAD_MASKS) {
251		r128_emit_masks(dev_priv);
252		sarea_priv->dirty &= ~R128_UPLOAD_MASKS;
253	}
254
255	if (dirty & R128_UPLOAD_WINDOW) {
256		r128_emit_window(dev_priv);
257		sarea_priv->dirty &= ~R128_UPLOAD_WINDOW;
258	}
259
260	if (dirty & R128_UPLOAD_TEX0) {
261		r128_emit_tex0(dev_priv);
262		sarea_priv->dirty &= ~R128_UPLOAD_TEX0;
263	}
264
265	if (dirty & R128_UPLOAD_TEX1) {
266		r128_emit_tex1(dev_priv);
267		sarea_priv->dirty &= ~R128_UPLOAD_TEX1;
268	}
269
270	/* Turn off the texture cache flushing */
271	sarea_priv->context_state.tex_cntl_c &= ~R128_TEX_CACHE_FLUSH;
272
273	sarea_priv->dirty &= ~R128_REQUIRE_QUIESCENCE;
274}
275
276#if R128_PERFORMANCE_BOXES
277/* ================================================================
278 * Performance monitoring functions
279 */
280
281static void r128_clear_box(drm_r128_private_t *dev_priv,
282			   int x, int y, int w, int h, int r, int g, int b)
283{
284	u32 pitch, offset;
285	u32 fb_bpp, color;
286	RING_LOCALS;
287
288	switch (dev_priv->fb_bpp) {
289	case 16:
290		fb_bpp = R128_GMC_DST_16BPP;
291		color = (((r & 0xf8) << 8) |
292			 ((g & 0xfc) << 3) | ((b & 0xf8) >> 3));
293		break;
294	case 24:
295		fb_bpp = R128_GMC_DST_24BPP;
296		color = ((r << 16) | (g << 8) | b);
297		break;
298	case 32:
299		fb_bpp = R128_GMC_DST_32BPP;
300		color = (((0xff) << 24) | (r << 16) | (g << 8) | b);
301		break;
302	default:
303		return;
304	}
305
306	offset = dev_priv->back_offset;
307	pitch = dev_priv->back_pitch >> 3;
308
309	BEGIN_RING(6);
310
311	OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
312	OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
313		 R128_GMC_BRUSH_SOLID_COLOR |
314		 fb_bpp |
315		 R128_GMC_SRC_DATATYPE_COLOR |
316		 R128_ROP3_P |
317		 R128_GMC_CLR_CMP_CNTL_DIS | R128_GMC_AUX_CLIP_DIS);
318
319	OUT_RING((pitch << 21) | (offset >> 5));
320	OUT_RING(color);
321
322	OUT_RING((x << 16) | y);
323	OUT_RING((w << 16) | h);
324
325	ADVANCE_RING();
326}
327
328static void r128_cce_performance_boxes(drm_r128_private_t *dev_priv)
329{
330	if (atomic_read(&dev_priv->idle_count) == 0)
331		r128_clear_box(dev_priv, 64, 4, 8, 8, 0, 255, 0);
332	else
333		atomic_set(&dev_priv->idle_count, 0);
334}
335
336#endif
337
338/* ================================================================
339 * CCE command dispatch functions
340 */
341
342static void r128_print_dirty(const char *msg, unsigned int flags)
343{
344	DRM_INFO("%s: (0x%x) %s%s%s%s%s%s%s%s%s\n",
345		 msg,
346		 flags,
347		 (flags & R128_UPLOAD_CORE) ? "core, " : "",
348		 (flags & R128_UPLOAD_CONTEXT) ? "context, " : "",
349		 (flags & R128_UPLOAD_SETUP) ? "setup, " : "",
350		 (flags & R128_UPLOAD_TEX0) ? "tex0, " : "",
351		 (flags & R128_UPLOAD_TEX1) ? "tex1, " : "",
352		 (flags & R128_UPLOAD_MASKS) ? "masks, " : "",
353		 (flags & R128_UPLOAD_WINDOW) ? "window, " : "",
354		 (flags & R128_UPLOAD_CLIPRECTS) ? "cliprects, " : "",
355		 (flags & R128_REQUIRE_QUIESCENCE) ? "quiescence, " : "");
356}
357
358static void r128_cce_dispatch_clear(struct drm_device *dev,
359				    drm_r128_clear_t *clear)
360{
361	drm_r128_private_t *dev_priv = dev->dev_private;
362	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
363	int nbox = sarea_priv->nbox;
364	struct drm_clip_rect *pbox = sarea_priv->boxes;
365	unsigned int flags = clear->flags;
366	int i;
367	RING_LOCALS;
368	DRM_DEBUG("\n");
369
370	if (dev_priv->page_flipping && dev_priv->current_page == 1) {
371		unsigned int tmp = flags;
372
373		flags &= ~(R128_FRONT | R128_BACK);
374		if (tmp & R128_FRONT)
375			flags |= R128_BACK;
376		if (tmp & R128_BACK)
377			flags |= R128_FRONT;
378	}
379
380	for (i = 0; i < nbox; i++) {
381		int x = pbox[i].x1;
382		int y = pbox[i].y1;
383		int w = pbox[i].x2 - x;
384		int h = pbox[i].y2 - y;
385
386		DRM_DEBUG("dispatch clear %d,%d-%d,%d flags 0x%x\n",
387			  pbox[i].x1, pbox[i].y1, pbox[i].x2,
388			  pbox[i].y2, flags);
389
390		if (flags & (R128_FRONT | R128_BACK)) {
391			BEGIN_RING(2);
392
393			OUT_RING(CCE_PACKET0(R128_DP_WRITE_MASK, 0));
394			OUT_RING(clear->color_mask);
395
396			ADVANCE_RING();
397		}
398
399		if (flags & R128_FRONT) {
400			BEGIN_RING(6);
401
402			OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
403			OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
404				 R128_GMC_BRUSH_SOLID_COLOR |
405				 (dev_priv->color_fmt << 8) |
406				 R128_GMC_SRC_DATATYPE_COLOR |
407				 R128_ROP3_P |
408				 R128_GMC_CLR_CMP_CNTL_DIS |
409				 R128_GMC_AUX_CLIP_DIS);
410
411			OUT_RING(dev_priv->front_pitch_offset_c);
412			OUT_RING(clear->clear_color);
413
414			OUT_RING((x << 16) | y);
415			OUT_RING((w << 16) | h);
416
417			ADVANCE_RING();
418		}
419
420		if (flags & R128_BACK) {
421			BEGIN_RING(6);
422
423			OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
424			OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
425				 R128_GMC_BRUSH_SOLID_COLOR |
426				 (dev_priv->color_fmt << 8) |
427				 R128_GMC_SRC_DATATYPE_COLOR |
428				 R128_ROP3_P |
429				 R128_GMC_CLR_CMP_CNTL_DIS |
430				 R128_GMC_AUX_CLIP_DIS);
431
432			OUT_RING(dev_priv->back_pitch_offset_c);
433			OUT_RING(clear->clear_color);
434
435			OUT_RING((x << 16) | y);
436			OUT_RING((w << 16) | h);
437
438			ADVANCE_RING();
439		}
440
441		if (flags & R128_DEPTH) {
442			BEGIN_RING(6);
443
444			OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
445			OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
446				 R128_GMC_BRUSH_SOLID_COLOR |
447				 (dev_priv->depth_fmt << 8) |
448				 R128_GMC_SRC_DATATYPE_COLOR |
449				 R128_ROP3_P |
450				 R128_GMC_CLR_CMP_CNTL_DIS |
451				 R128_GMC_AUX_CLIP_DIS | R128_GMC_WR_MSK_DIS);
452
453			OUT_RING(dev_priv->depth_pitch_offset_c);
454			OUT_RING(clear->clear_depth);
455
456			OUT_RING((x << 16) | y);
457			OUT_RING((w << 16) | h);
458
459			ADVANCE_RING();
460		}
461	}
462}
463
464static void r128_cce_dispatch_swap(struct drm_device *dev)
465{
466	drm_r128_private_t *dev_priv = dev->dev_private;
467	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
468	int nbox = sarea_priv->nbox;
469	struct drm_clip_rect *pbox = sarea_priv->boxes;
470	int i;
471	RING_LOCALS;
472	DRM_DEBUG("\n");
473
474#if R128_PERFORMANCE_BOXES
475	/* Do some trivial performance monitoring...
476	 */
477	r128_cce_performance_boxes(dev_priv);
478#endif
479
480	for (i = 0; i < nbox; i++) {
481		int x = pbox[i].x1;
482		int y = pbox[i].y1;
483		int w = pbox[i].x2 - x;
484		int h = pbox[i].y2 - y;
485
486		BEGIN_RING(7);
487
488		OUT_RING(CCE_PACKET3(R128_CNTL_BITBLT_MULTI, 5));
489		OUT_RING(R128_GMC_SRC_PITCH_OFFSET_CNTL |
490			 R128_GMC_DST_PITCH_OFFSET_CNTL |
491			 R128_GMC_BRUSH_NONE |
492			 (dev_priv->color_fmt << 8) |
493			 R128_GMC_SRC_DATATYPE_COLOR |
494			 R128_ROP3_S |
495			 R128_DP_SRC_SOURCE_MEMORY |
496			 R128_GMC_CLR_CMP_CNTL_DIS |
497			 R128_GMC_AUX_CLIP_DIS | R128_GMC_WR_MSK_DIS);
498
499		/* Make this work even if front & back are flipped:
500		 */
501		if (dev_priv->current_page == 0) {
502			OUT_RING(dev_priv->back_pitch_offset_c);
503			OUT_RING(dev_priv->front_pitch_offset_c);
504		} else {
505			OUT_RING(dev_priv->front_pitch_offset_c);
506			OUT_RING(dev_priv->back_pitch_offset_c);
507		}
508
509		OUT_RING((x << 16) | y);
510		OUT_RING((x << 16) | y);
511		OUT_RING((w << 16) | h);
512
513		ADVANCE_RING();
514	}
515
516	/* Increment the frame counter.  The client-side 3D driver must
517	 * throttle the framerate by waiting for this value before
518	 * performing the swapbuffer ioctl.
519	 */
520	dev_priv->sarea_priv->last_frame++;
521
522	BEGIN_RING(2);
523
524	OUT_RING(CCE_PACKET0(R128_LAST_FRAME_REG, 0));
525	OUT_RING(dev_priv->sarea_priv->last_frame);
526
527	ADVANCE_RING();
528}
529
530static void r128_cce_dispatch_flip(struct drm_device *dev)
531{
532	drm_r128_private_t *dev_priv = dev->dev_private;
533	RING_LOCALS;
534	DRM_DEBUG("page=%d pfCurrentPage=%d\n",
535		  dev_priv->current_page, dev_priv->sarea_priv->pfCurrentPage);
536
537#if R128_PERFORMANCE_BOXES
538	/* Do some trivial performance monitoring...
539	 */
540	r128_cce_performance_boxes(dev_priv);
541#endif
542
543	BEGIN_RING(4);
544
545	R128_WAIT_UNTIL_PAGE_FLIPPED();
546	OUT_RING(CCE_PACKET0(R128_CRTC_OFFSET, 0));
547
548	if (dev_priv->current_page == 0)
549		OUT_RING(dev_priv->back_offset);
550	else
551		OUT_RING(dev_priv->front_offset);
552
553	ADVANCE_RING();
554
555	/* Increment the frame counter.  The client-side 3D driver must
556	 * throttle the framerate by waiting for this value before
557	 * performing the swapbuffer ioctl.
558	 */
559	dev_priv->sarea_priv->last_frame++;
560	dev_priv->sarea_priv->pfCurrentPage = dev_priv->current_page =
561	    1 - dev_priv->current_page;
562
563	BEGIN_RING(2);
564
565	OUT_RING(CCE_PACKET0(R128_LAST_FRAME_REG, 0));
566	OUT_RING(dev_priv->sarea_priv->last_frame);
567
568	ADVANCE_RING();
569}
570
571static void r128_cce_dispatch_vertex(struct drm_device *dev, struct drm_buf *buf)
572{
573	drm_r128_private_t *dev_priv = dev->dev_private;
574	drm_r128_buf_priv_t *buf_priv = buf->dev_private;
575	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
576	int format = sarea_priv->vc_format;
577	int offset = buf->bus_address;
578	int size = buf->used;
579	int prim = buf_priv->prim;
580	int i = 0;
581	RING_LOCALS;
582	DRM_DEBUG("buf=%d nbox=%d\n", buf->idx, sarea_priv->nbox);
583
584	if (0)
585		r128_print_dirty("dispatch_vertex", sarea_priv->dirty);
586
587	if (buf->used) {
588		buf_priv->dispatched = 1;
589
590		if (sarea_priv->dirty & ~R128_UPLOAD_CLIPRECTS)
591			r128_emit_state(dev_priv);
592
593		do {
594			/* Emit the next set of up to three cliprects */
595			if (i < sarea_priv->nbox) {
596				r128_emit_clip_rects(dev_priv,
597						     &sarea_priv->boxes[i],
598						     sarea_priv->nbox - i);
599			}
600
601			/* Emit the vertex buffer rendering commands */
602			BEGIN_RING(5);
603
604			OUT_RING(CCE_PACKET3(R128_3D_RNDR_GEN_INDX_PRIM, 3));
605			OUT_RING(offset);
606			OUT_RING(size);
607			OUT_RING(format);
608			OUT_RING(prim | R128_CCE_VC_CNTL_PRIM_WALK_LIST |
609				 (size << R128_CCE_VC_CNTL_NUM_SHIFT));
610
611			ADVANCE_RING();
612
613			i += 3;
614		} while (i < sarea_priv->nbox);
615	}
616
617	if (buf_priv->discard) {
618		buf_priv->age = dev_priv->sarea_priv->last_dispatch;
619
620		/* Emit the vertex buffer age */
621		BEGIN_RING(2);
622
623		OUT_RING(CCE_PACKET0(R128_LAST_DISPATCH_REG, 0));
624		OUT_RING(buf_priv->age);
625
626		ADVANCE_RING();
627
628		buf->pending = 1;
629		buf->used = 0;
630		/* FIXME: Check dispatched field */
631		buf_priv->dispatched = 0;
632	}
633
634	dev_priv->sarea_priv->last_dispatch++;
635
636	sarea_priv->dirty &= ~R128_UPLOAD_CLIPRECTS;
637	sarea_priv->nbox = 0;
638}
639
640static void r128_cce_dispatch_indirect(struct drm_device *dev,
641				       struct drm_buf *buf, int start, int end)
642{
643	drm_r128_private_t *dev_priv = dev->dev_private;
644	drm_r128_buf_priv_t *buf_priv = buf->dev_private;
645	RING_LOCALS;
646	DRM_DEBUG("indirect: buf=%d s=0x%x e=0x%x\n", buf->idx, start, end);
647
648	if (start != end) {
649		int offset = buf->bus_address + start;
650		int dwords = (end - start + 3) / sizeof(u32);
651
652		/* Indirect buffer data must be an even number of
653		 * dwords, so if we've been given an odd number we must
654		 * pad the data with a Type-2 CCE packet.
655		 */
656		if (dwords & 1) {
657			u32 *data = (u32 *)
658			    ((char *)dev->agp_buffer_map->handle
659			     + buf->offset + start);
660			data[dwords++] = cpu_to_le32(R128_CCE_PACKET2);
661		}
662
663		buf_priv->dispatched = 1;
664
665		/* Fire off the indirect buffer */
666		BEGIN_RING(3);
667
668		OUT_RING(CCE_PACKET0(R128_PM4_IW_INDOFF, 1));
669		OUT_RING(offset);
670		OUT_RING(dwords);
671
672		ADVANCE_RING();
673	}
674
675	if (buf_priv->discard) {
676		buf_priv->age = dev_priv->sarea_priv->last_dispatch;
677
678		/* Emit the indirect buffer age */
679		BEGIN_RING(2);
680
681		OUT_RING(CCE_PACKET0(R128_LAST_DISPATCH_REG, 0));
682		OUT_RING(buf_priv->age);
683
684		ADVANCE_RING();
685
686		buf->pending = 1;
687		buf->used = 0;
688		/* FIXME: Check dispatched field */
689		buf_priv->dispatched = 0;
690	}
691
692	dev_priv->sarea_priv->last_dispatch++;
693}
694
695static void r128_cce_dispatch_indices(struct drm_device *dev,
696				      struct drm_buf *buf,
697				      int start, int end, int count)
698{
699	drm_r128_private_t *dev_priv = dev->dev_private;
700	drm_r128_buf_priv_t *buf_priv = buf->dev_private;
701	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
702	int format = sarea_priv->vc_format;
703	int offset = dev->agp_buffer_map->offset - dev_priv->cce_buffers_offset;
704	int prim = buf_priv->prim;
705	u32 *data;
706	int dwords;
707	int i = 0;
708	RING_LOCALS;
709	DRM_DEBUG("indices: s=%d e=%d c=%d\n", start, end, count);
710
711	if (0)
712		r128_print_dirty("dispatch_indices", sarea_priv->dirty);
713
714	if (start != end) {
715		buf_priv->dispatched = 1;
716
717		if (sarea_priv->dirty & ~R128_UPLOAD_CLIPRECTS)
718			r128_emit_state(dev_priv);
719
720		dwords = (end - start + 3) / sizeof(u32);
721
722		data = (u32 *) ((char *)dev->agp_buffer_map->handle
723				+ buf->offset + start);
724
725		data[0] = cpu_to_le32(CCE_PACKET3(R128_3D_RNDR_GEN_INDX_PRIM,
726						  dwords - 2));
727
728		data[1] = cpu_to_le32(offset);
729		data[2] = cpu_to_le32(R128_MAX_VB_VERTS);
730		data[3] = cpu_to_le32(format);
731		data[4] = cpu_to_le32((prim | R128_CCE_VC_CNTL_PRIM_WALK_IND |
732				       (count << 16)));
733
734		if (count & 0x1) {
735#ifdef __LITTLE_ENDIAN
736			data[dwords - 1] &= 0x0000ffff;
737#else
738			data[dwords - 1] &= 0xffff0000;
739#endif
740		}
741
742		do {
743			/* Emit the next set of up to three cliprects */
744			if (i < sarea_priv->nbox) {
745				r128_emit_clip_rects(dev_priv,
746						     &sarea_priv->boxes[i],
747						     sarea_priv->nbox - i);
748			}
749
750			r128_cce_dispatch_indirect(dev, buf, start, end);
751
752			i += 3;
753		} while (i < sarea_priv->nbox);
754	}
755
756	if (buf_priv->discard) {
757		buf_priv->age = dev_priv->sarea_priv->last_dispatch;
758
759		/* Emit the vertex buffer age */
760		BEGIN_RING(2);
761
762		OUT_RING(CCE_PACKET0(R128_LAST_DISPATCH_REG, 0));
763		OUT_RING(buf_priv->age);
764
765		ADVANCE_RING();
766
767		buf->pending = 1;
768		/* FIXME: Check dispatched field */
769		buf_priv->dispatched = 0;
770	}
771
772	dev_priv->sarea_priv->last_dispatch++;
773
774	sarea_priv->dirty &= ~R128_UPLOAD_CLIPRECTS;
775	sarea_priv->nbox = 0;
776}
777
778static int r128_cce_dispatch_blit(struct drm_device *dev,
779				  struct drm_file *file_priv,
780				  drm_r128_blit_t *blit)
781{
782	drm_r128_private_t *dev_priv = dev->dev_private;
783	struct drm_device_dma *dma = dev->dma;
784	struct drm_buf *buf;
785	drm_r128_buf_priv_t *buf_priv;
786	u32 *data;
787	int dword_shift, dwords;
788	RING_LOCALS;
789	DRM_DEBUG("\n");
790
791	/* The compiler won't optimize away a division by a variable,
792	 * even if the only legal values are powers of two.  Thus, we'll
793	 * use a shift instead.
794	 */
795	switch (blit->format) {
796	case R128_DATATYPE_ARGB8888:
797		dword_shift = 0;
798		break;
799	case R128_DATATYPE_ARGB1555:
800	case R128_DATATYPE_RGB565:
801	case R128_DATATYPE_ARGB4444:
802	case R128_DATATYPE_YVYU422:
803	case R128_DATATYPE_VYUY422:
804		dword_shift = 1;
805		break;
806	case R128_DATATYPE_CI8:
807	case R128_DATATYPE_RGB8:
808		dword_shift = 2;
809		break;
810	default:
811		DRM_ERROR("invalid blit format %d\n", blit->format);
812		return -EINVAL;
813	}
814
815	/* Flush the pixel cache, and mark the contents as Read Invalid.
816	 * This ensures no pixel data gets mixed up with the texture
817	 * data from the host data blit, otherwise part of the texture
818	 * image may be corrupted.
819	 */
820	BEGIN_RING(2);
821
822	OUT_RING(CCE_PACKET0(R128_PC_GUI_CTLSTAT, 0));
823	OUT_RING(R128_PC_RI_GUI | R128_PC_FLUSH_GUI);
824
825	ADVANCE_RING();
826
827	/* Dispatch the indirect buffer.
828	 */
829	buf = dma->buflist[blit->idx];
830	buf_priv = buf->dev_private;
831
832	if (buf->file_priv != file_priv) {
833		DRM_ERROR("process %d using buffer owned by %p\n",
834			  task_pid_nr(current), buf->file_priv);
835		return -EINVAL;
836	}
837	if (buf->pending) {
838		DRM_ERROR("sending pending buffer %d\n", blit->idx);
839		return -EINVAL;
840	}
841
842	buf_priv->discard = 1;
843
844	dwords = (blit->width * blit->height) >> dword_shift;
845
846	data = (u32 *) ((char *)dev->agp_buffer_map->handle + buf->offset);
847
848	data[0] = cpu_to_le32(CCE_PACKET3(R128_CNTL_HOSTDATA_BLT, dwords + 6));
849	data[1] = cpu_to_le32((R128_GMC_DST_PITCH_OFFSET_CNTL |
850			       R128_GMC_BRUSH_NONE |
851			       (blit->format << 8) |
852			       R128_GMC_SRC_DATATYPE_COLOR |
853			       R128_ROP3_S |
854			       R128_DP_SRC_SOURCE_HOST_DATA |
855			       R128_GMC_CLR_CMP_CNTL_DIS |
856			       R128_GMC_AUX_CLIP_DIS | R128_GMC_WR_MSK_DIS));
857
858	data[2] = cpu_to_le32((blit->pitch << 21) | (blit->offset >> 5));
859	data[3] = cpu_to_le32(0xffffffff);
860	data[4] = cpu_to_le32(0xffffffff);
861	data[5] = cpu_to_le32((blit->y << 16) | blit->x);
862	data[6] = cpu_to_le32((blit->height << 16) | blit->width);
863	data[7] = cpu_to_le32(dwords);
864
865	buf->used = (dwords + 8) * sizeof(u32);
866
867	r128_cce_dispatch_indirect(dev, buf, 0, buf->used);
868
869	/* Flush the pixel cache after the blit completes.  This ensures
870	 * the texture data is written out to memory before rendering
871	 * continues.
872	 */
873	BEGIN_RING(2);
874
875	OUT_RING(CCE_PACKET0(R128_PC_GUI_CTLSTAT, 0));
876	OUT_RING(R128_PC_FLUSH_GUI);
877
878	ADVANCE_RING();
879
880	return 0;
881}
882
883/* ================================================================
884 * Tiled depth buffer management
885 *
886 * FIXME: These should all set the destination write mask for when we
887 * have hardware stencil support.
888 */
889
890static int r128_cce_dispatch_write_span(struct drm_device *dev,
891					drm_r128_depth_t *depth)
892{
893	drm_r128_private_t *dev_priv = dev->dev_private;
894	int count, x, y;
895	u32 *buffer;
896	u8 *mask;
897	int i, buffer_size, mask_size;
898	RING_LOCALS;
899	DRM_DEBUG("\n");
900
901	count = depth->n;
902	if (count > 4096 || count <= 0)
903		return -EMSGSIZE;
904
905	if (copy_from_user(&x, depth->x, sizeof(x)))
906		return -EFAULT;
907	if (copy_from_user(&y, depth->y, sizeof(y)))
908		return -EFAULT;
909
910	buffer_size = depth->n * sizeof(u32);
911	buffer = memdup_user(depth->buffer, buffer_size);
912	if (IS_ERR(buffer))
913		return PTR_ERR(buffer);
914
915	mask_size = depth->n;
916	if (depth->mask) {
917		mask = memdup_user(depth->mask, mask_size);
918		if (IS_ERR(mask)) {
919			kfree(buffer);
920			return PTR_ERR(mask);
921		}
922
923		for (i = 0; i < count; i++, x++) {
924			if (mask[i]) {
925				BEGIN_RING(6);
926
927				OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
928				OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
929					 R128_GMC_BRUSH_SOLID_COLOR |
930					 (dev_priv->depth_fmt << 8) |
931					 R128_GMC_SRC_DATATYPE_COLOR |
932					 R128_ROP3_P |
933					 R128_GMC_CLR_CMP_CNTL_DIS |
934					 R128_GMC_WR_MSK_DIS);
935
936				OUT_RING(dev_priv->depth_pitch_offset_c);
937				OUT_RING(buffer[i]);
938
939				OUT_RING((x << 16) | y);
940				OUT_RING((1 << 16) | 1);
941
942				ADVANCE_RING();
943			}
944		}
945
946		kfree(mask);
947	} else {
948		for (i = 0; i < count; i++, x++) {
949			BEGIN_RING(6);
950
951			OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
952			OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
953				 R128_GMC_BRUSH_SOLID_COLOR |
954				 (dev_priv->depth_fmt << 8) |
955				 R128_GMC_SRC_DATATYPE_COLOR |
956				 R128_ROP3_P |
957				 R128_GMC_CLR_CMP_CNTL_DIS |
958				 R128_GMC_WR_MSK_DIS);
959
960			OUT_RING(dev_priv->depth_pitch_offset_c);
961			OUT_RING(buffer[i]);
962
963			OUT_RING((x << 16) | y);
964			OUT_RING((1 << 16) | 1);
965
966			ADVANCE_RING();
967		}
968	}
969
970	kfree(buffer);
971
972	return 0;
973}
974
975static int r128_cce_dispatch_write_pixels(struct drm_device *dev,
976					  drm_r128_depth_t *depth)
977{
978	drm_r128_private_t *dev_priv = dev->dev_private;
979	int count, *x, *y;
980	u32 *buffer;
981	u8 *mask;
982	int i, xbuf_size, ybuf_size, buffer_size, mask_size;
983	RING_LOCALS;
984	DRM_DEBUG("\n");
985
986	count = depth->n;
987	if (count > 4096 || count <= 0)
988		return -EMSGSIZE;
989
990	xbuf_size = count * sizeof(*x);
991	ybuf_size = count * sizeof(*y);
992	x = memdup_user(depth->x, xbuf_size);
993	if (IS_ERR(x))
994		return PTR_ERR(x);
995	y = memdup_user(depth->y, ybuf_size);
996	if (IS_ERR(y)) {
997		kfree(x);
998		return PTR_ERR(y);
999	}
1000	buffer_size = depth->n * sizeof(u32);
1001	buffer = memdup_user(depth->buffer, buffer_size);
1002	if (IS_ERR(buffer)) {
1003		kfree(x);
1004		kfree(y);
1005		return PTR_ERR(buffer);
1006	}
1007
1008	if (depth->mask) {
1009		mask_size = depth->n;
1010		mask = memdup_user(depth->mask, mask_size);
1011		if (IS_ERR(mask)) {
1012			kfree(x);
1013			kfree(y);
1014			kfree(buffer);
1015			return PTR_ERR(mask);
1016		}
1017
1018		for (i = 0; i < count; i++) {
1019			if (mask[i]) {
1020				BEGIN_RING(6);
1021
1022				OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
1023				OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
1024					 R128_GMC_BRUSH_SOLID_COLOR |
1025					 (dev_priv->depth_fmt << 8) |
1026					 R128_GMC_SRC_DATATYPE_COLOR |
1027					 R128_ROP3_P |
1028					 R128_GMC_CLR_CMP_CNTL_DIS |
1029					 R128_GMC_WR_MSK_DIS);
1030
1031				OUT_RING(dev_priv->depth_pitch_offset_c);
1032				OUT_RING(buffer[i]);
1033
1034				OUT_RING((x[i] << 16) | y[i]);
1035				OUT_RING((1 << 16) | 1);
1036
1037				ADVANCE_RING();
1038			}
1039		}
1040
1041		kfree(mask);
1042	} else {
1043		for (i = 0; i < count; i++) {
1044			BEGIN_RING(6);
1045
1046			OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
1047			OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
1048				 R128_GMC_BRUSH_SOLID_COLOR |
1049				 (dev_priv->depth_fmt << 8) |
1050				 R128_GMC_SRC_DATATYPE_COLOR |
1051				 R128_ROP3_P |
1052				 R128_GMC_CLR_CMP_CNTL_DIS |
1053				 R128_GMC_WR_MSK_DIS);
1054
1055			OUT_RING(dev_priv->depth_pitch_offset_c);
1056			OUT_RING(buffer[i]);
1057
1058			OUT_RING((x[i] << 16) | y[i]);
1059			OUT_RING((1 << 16) | 1);
1060
1061			ADVANCE_RING();
1062		}
1063	}
1064
1065	kfree(x);
1066	kfree(y);
1067	kfree(buffer);
1068
1069	return 0;
1070}
1071
1072static int r128_cce_dispatch_read_span(struct drm_device *dev,
1073				       drm_r128_depth_t *depth)
1074{
1075	drm_r128_private_t *dev_priv = dev->dev_private;
1076	int count, x, y;
1077	RING_LOCALS;
1078	DRM_DEBUG("\n");
1079
1080	count = depth->n;
1081	if (count > 4096 || count <= 0)
1082		return -EMSGSIZE;
1083
1084	if (copy_from_user(&x, depth->x, sizeof(x)))
1085		return -EFAULT;
1086	if (copy_from_user(&y, depth->y, sizeof(y)))
1087		return -EFAULT;
1088
1089	BEGIN_RING(7);
1090
1091	OUT_RING(CCE_PACKET3(R128_CNTL_BITBLT_MULTI, 5));
1092	OUT_RING(R128_GMC_SRC_PITCH_OFFSET_CNTL |
1093		 R128_GMC_DST_PITCH_OFFSET_CNTL |
1094		 R128_GMC_BRUSH_NONE |
1095		 (dev_priv->depth_fmt << 8) |
1096		 R128_GMC_SRC_DATATYPE_COLOR |
1097		 R128_ROP3_S |
1098		 R128_DP_SRC_SOURCE_MEMORY |
1099		 R128_GMC_CLR_CMP_CNTL_DIS | R128_GMC_WR_MSK_DIS);
1100
1101	OUT_RING(dev_priv->depth_pitch_offset_c);
1102	OUT_RING(dev_priv->span_pitch_offset_c);
1103
1104	OUT_RING((x << 16) | y);
1105	OUT_RING((0 << 16) | 0);
1106	OUT_RING((count << 16) | 1);
1107
1108	ADVANCE_RING();
1109
1110	return 0;
1111}
1112
1113static int r128_cce_dispatch_read_pixels(struct drm_device *dev,
1114					 drm_r128_depth_t *depth)
1115{
1116	drm_r128_private_t *dev_priv = dev->dev_private;
1117	int count, *x, *y;
1118	int i, xbuf_size, ybuf_size;
1119	RING_LOCALS;
1120	DRM_DEBUG("\n");
1121
1122	count = depth->n;
1123	if (count > 4096 || count <= 0)
1124		return -EMSGSIZE;
1125
1126	if (count > dev_priv->depth_pitch)
1127		count = dev_priv->depth_pitch;
1128
1129	xbuf_size = count * sizeof(*x);
1130	ybuf_size = count * sizeof(*y);
1131	x = kmalloc(xbuf_size, GFP_KERNEL);
1132	if (x == NULL)
1133		return -ENOMEM;
1134	y = kmalloc(ybuf_size, GFP_KERNEL);
1135	if (y == NULL) {
1136		kfree(x);
1137		return -ENOMEM;
1138	}
1139	if (copy_from_user(x, depth->x, xbuf_size)) {
1140		kfree(x);
1141		kfree(y);
1142		return -EFAULT;
1143	}
1144	if (copy_from_user(y, depth->y, ybuf_size)) {
1145		kfree(x);
1146		kfree(y);
1147		return -EFAULT;
1148	}
1149
1150	for (i = 0; i < count; i++) {
1151		BEGIN_RING(7);
1152
1153		OUT_RING(CCE_PACKET3(R128_CNTL_BITBLT_MULTI, 5));
1154		OUT_RING(R128_GMC_SRC_PITCH_OFFSET_CNTL |
1155			 R128_GMC_DST_PITCH_OFFSET_CNTL |
1156			 R128_GMC_BRUSH_NONE |
1157			 (dev_priv->depth_fmt << 8) |
1158			 R128_GMC_SRC_DATATYPE_COLOR |
1159			 R128_ROP3_S |
1160			 R128_DP_SRC_SOURCE_MEMORY |
1161			 R128_GMC_CLR_CMP_CNTL_DIS | R128_GMC_WR_MSK_DIS);
1162
1163		OUT_RING(dev_priv->depth_pitch_offset_c);
1164		OUT_RING(dev_priv->span_pitch_offset_c);
1165
1166		OUT_RING((x[i] << 16) | y[i]);
1167		OUT_RING((i << 16) | 0);
1168		OUT_RING((1 << 16) | 1);
1169
1170		ADVANCE_RING();
1171	}
1172
1173	kfree(x);
1174	kfree(y);
1175
1176	return 0;
1177}
1178
1179/* ================================================================
1180 * Polygon stipple
1181 */
1182
1183static void r128_cce_dispatch_stipple(struct drm_device *dev, u32 *stipple)
1184{
1185	drm_r128_private_t *dev_priv = dev->dev_private;
1186	int i;
1187	RING_LOCALS;
1188	DRM_DEBUG("\n");
1189
1190	BEGIN_RING(33);
1191
1192	OUT_RING(CCE_PACKET0(R128_BRUSH_DATA0, 31));
1193	for (i = 0; i < 32; i++)
1194		OUT_RING(stipple[i]);
1195
1196	ADVANCE_RING();
1197}
1198
1199/* ================================================================
1200 * IOCTL functions
1201 */
1202
1203static int r128_cce_clear(struct drm_device *dev, void *data, struct drm_file *file_priv)
1204{
1205	drm_r128_private_t *dev_priv = dev->dev_private;
1206	drm_r128_sarea_t *sarea_priv;
1207	drm_r128_clear_t *clear = data;
1208	DRM_DEBUG("\n");
1209
1210	LOCK_TEST_WITH_RETURN(dev, file_priv);
1211
1212	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1213
1214	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1215
1216	sarea_priv = dev_priv->sarea_priv;
1217
1218	if (sarea_priv->nbox > R128_NR_SAREA_CLIPRECTS)
1219		sarea_priv->nbox = R128_NR_SAREA_CLIPRECTS;
1220
1221	r128_cce_dispatch_clear(dev, clear);
1222	COMMIT_RING();
1223
1224	/* Make sure we restore the 3D state next time.
1225	 */
1226	dev_priv->sarea_priv->dirty |= R128_UPLOAD_CONTEXT | R128_UPLOAD_MASKS;
1227
1228	return 0;
1229}
1230
1231static int r128_do_init_pageflip(struct drm_device *dev)
1232{
1233	drm_r128_private_t *dev_priv = dev->dev_private;
1234	DRM_DEBUG("\n");
1235
1236	dev_priv->crtc_offset = R128_READ(R128_CRTC_OFFSET);
1237	dev_priv->crtc_offset_cntl = R128_READ(R128_CRTC_OFFSET_CNTL);
1238
1239	R128_WRITE(R128_CRTC_OFFSET, dev_priv->front_offset);
1240	R128_WRITE(R128_CRTC_OFFSET_CNTL,
1241		   dev_priv->crtc_offset_cntl | R128_CRTC_OFFSET_FLIP_CNTL);
1242
1243	dev_priv->page_flipping = 1;
1244	dev_priv->current_page = 0;
1245	dev_priv->sarea_priv->pfCurrentPage = dev_priv->current_page;
1246
1247	return 0;
1248}
1249
1250static int r128_do_cleanup_pageflip(struct drm_device *dev)
1251{
1252	drm_r128_private_t *dev_priv = dev->dev_private;
1253	DRM_DEBUG("\n");
1254
1255	R128_WRITE(R128_CRTC_OFFSET, dev_priv->crtc_offset);
1256	R128_WRITE(R128_CRTC_OFFSET_CNTL, dev_priv->crtc_offset_cntl);
1257
1258	if (dev_priv->current_page != 0) {
1259		r128_cce_dispatch_flip(dev);
1260		COMMIT_RING();
1261	}
1262
1263	dev_priv->page_flipping = 0;
1264	return 0;
1265}
1266
1267/* Swapping and flipping are different operations, need different ioctls.
1268 * They can & should be intermixed to support multiple 3d windows.
1269 */
1270
1271static int r128_cce_flip(struct drm_device *dev, void *data, struct drm_file *file_priv)
1272{
1273	drm_r128_private_t *dev_priv = dev->dev_private;
1274	DRM_DEBUG("\n");
1275
1276	LOCK_TEST_WITH_RETURN(dev, file_priv);
1277
1278	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1279
1280	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1281
1282	if (!dev_priv->page_flipping)
1283		r128_do_init_pageflip(dev);
1284
1285	r128_cce_dispatch_flip(dev);
1286
1287	COMMIT_RING();
1288	return 0;
1289}
1290
1291static int r128_cce_swap(struct drm_device *dev, void *data, struct drm_file *file_priv)
1292{
1293	drm_r128_private_t *dev_priv = dev->dev_private;
1294	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
1295	DRM_DEBUG("\n");
1296
1297	LOCK_TEST_WITH_RETURN(dev, file_priv);
1298
1299	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1300
1301	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1302
1303	if (sarea_priv->nbox > R128_NR_SAREA_CLIPRECTS)
1304		sarea_priv->nbox = R128_NR_SAREA_CLIPRECTS;
1305
1306	r128_cce_dispatch_swap(dev);
1307	dev_priv->sarea_priv->dirty |= (R128_UPLOAD_CONTEXT |
1308					R128_UPLOAD_MASKS);
1309
1310	COMMIT_RING();
1311	return 0;
1312}
1313
1314static int r128_cce_vertex(struct drm_device *dev, void *data, struct drm_file *file_priv)
1315{
1316	drm_r128_private_t *dev_priv = dev->dev_private;
1317	struct drm_device_dma *dma = dev->dma;
1318	struct drm_buf *buf;
1319	drm_r128_buf_priv_t *buf_priv;
1320	drm_r128_vertex_t *vertex = data;
1321
1322	LOCK_TEST_WITH_RETURN(dev, file_priv);
1323
1324	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1325
1326	DRM_DEBUG("pid=%d index=%d count=%d discard=%d\n",
1327		  task_pid_nr(current), vertex->idx, vertex->count, vertex->discard);
1328
1329	if (vertex->idx < 0 || vertex->idx >= dma->buf_count) {
1330		DRM_ERROR("buffer index %d (of %d max)\n",
1331			  vertex->idx, dma->buf_count - 1);
1332		return -EINVAL;
1333	}
1334	if (vertex->prim < 0 ||
1335	    vertex->prim > R128_CCE_VC_CNTL_PRIM_TYPE_TRI_TYPE2) {
1336		DRM_ERROR("buffer prim %d\n", vertex->prim);
1337		return -EINVAL;
1338	}
1339
1340	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1341	VB_AGE_TEST_WITH_RETURN(dev_priv);
1342
1343	buf = dma->buflist[vertex->idx];
1344	buf_priv = buf->dev_private;
1345
1346	if (buf->file_priv != file_priv) {
1347		DRM_ERROR("process %d using buffer owned by %p\n",
1348			  task_pid_nr(current), buf->file_priv);
1349		return -EINVAL;
1350	}
1351	if (buf->pending) {
1352		DRM_ERROR("sending pending buffer %d\n", vertex->idx);
1353		return -EINVAL;
1354	}
1355
1356	buf->used = vertex->count;
1357	buf_priv->prim = vertex->prim;
1358	buf_priv->discard = vertex->discard;
1359
1360	r128_cce_dispatch_vertex(dev, buf);
1361
1362	COMMIT_RING();
1363	return 0;
1364}
1365
1366static int r128_cce_indices(struct drm_device *dev, void *data, struct drm_file *file_priv)
1367{
1368	drm_r128_private_t *dev_priv = dev->dev_private;
1369	struct drm_device_dma *dma = dev->dma;
1370	struct drm_buf *buf;
1371	drm_r128_buf_priv_t *buf_priv;
1372	drm_r128_indices_t *elts = data;
1373	int count;
1374
1375	LOCK_TEST_WITH_RETURN(dev, file_priv);
1376
1377	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1378
1379	DRM_DEBUG("pid=%d buf=%d s=%d e=%d d=%d\n", task_pid_nr(current),
1380		  elts->idx, elts->start, elts->end, elts->discard);
1381
1382	if (elts->idx < 0 || elts->idx >= dma->buf_count) {
1383		DRM_ERROR("buffer index %d (of %d max)\n",
1384			  elts->idx, dma->buf_count - 1);
1385		return -EINVAL;
1386	}
1387	if (elts->prim < 0 ||
1388	    elts->prim > R128_CCE_VC_CNTL_PRIM_TYPE_TRI_TYPE2) {
1389		DRM_ERROR("buffer prim %d\n", elts->prim);
1390		return -EINVAL;
1391	}
1392
1393	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1394	VB_AGE_TEST_WITH_RETURN(dev_priv);
1395
1396	buf = dma->buflist[elts->idx];
1397	buf_priv = buf->dev_private;
1398
1399	if (buf->file_priv != file_priv) {
1400		DRM_ERROR("process %d using buffer owned by %p\n",
1401			  task_pid_nr(current), buf->file_priv);
1402		return -EINVAL;
1403	}
1404	if (buf->pending) {
1405		DRM_ERROR("sending pending buffer %d\n", elts->idx);
1406		return -EINVAL;
1407	}
1408
1409	count = (elts->end - elts->start) / sizeof(u16);
1410	elts->start -= R128_INDEX_PRIM_OFFSET;
1411
1412	if (elts->start & 0x7) {
1413		DRM_ERROR("misaligned buffer 0x%x\n", elts->start);
1414		return -EINVAL;
1415	}
1416	if (elts->start < buf->used) {
1417		DRM_ERROR("no header 0x%x - 0x%x\n", elts->start, buf->used);
1418		return -EINVAL;
1419	}
1420
1421	buf->used = elts->end;
1422	buf_priv->prim = elts->prim;
1423	buf_priv->discard = elts->discard;
1424
1425	r128_cce_dispatch_indices(dev, buf, elts->start, elts->end, count);
1426
1427	COMMIT_RING();
1428	return 0;
1429}
1430
1431static int r128_cce_blit(struct drm_device *dev, void *data, struct drm_file *file_priv)
1432{
1433	struct drm_device_dma *dma = dev->dma;
1434	drm_r128_private_t *dev_priv = dev->dev_private;
1435	drm_r128_blit_t *blit = data;
1436	int ret;
1437
1438	LOCK_TEST_WITH_RETURN(dev, file_priv);
1439
1440	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1441
1442	DRM_DEBUG("pid=%d index=%d\n", task_pid_nr(current), blit->idx);
1443
1444	if (blit->idx < 0 || blit->idx >= dma->buf_count) {
1445		DRM_ERROR("buffer index %d (of %d max)\n",
1446			  blit->idx, dma->buf_count - 1);
1447		return -EINVAL;
1448	}
1449
1450	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1451	VB_AGE_TEST_WITH_RETURN(dev_priv);
1452
1453	ret = r128_cce_dispatch_blit(dev, file_priv, blit);
1454
1455	COMMIT_RING();
1456	return ret;
1457}
1458
1459int r128_cce_depth(struct drm_device *dev, void *data, struct drm_file *file_priv)
1460{
1461	drm_r128_private_t *dev_priv = dev->dev_private;
1462	drm_r128_depth_t *depth = data;
1463	int ret;
1464
1465	LOCK_TEST_WITH_RETURN(dev, file_priv);
1466
1467	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1468
1469	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1470
1471	ret = -EINVAL;
1472	switch (depth->func) {
1473	case R128_WRITE_SPAN:
1474		ret = r128_cce_dispatch_write_span(dev, depth);
1475		break;
1476	case R128_WRITE_PIXELS:
1477		ret = r128_cce_dispatch_write_pixels(dev, depth);
1478		break;
1479	case R128_READ_SPAN:
1480		ret = r128_cce_dispatch_read_span(dev, depth);
1481		break;
1482	case R128_READ_PIXELS:
1483		ret = r128_cce_dispatch_read_pixels(dev, depth);
1484		break;
1485	}
1486
1487	COMMIT_RING();
1488	return ret;
1489}
1490
1491int r128_cce_stipple(struct drm_device *dev, void *data, struct drm_file *file_priv)
1492{
1493	drm_r128_private_t *dev_priv = dev->dev_private;
1494	drm_r128_stipple_t *stipple = data;
1495	u32 mask[32];
1496
1497	LOCK_TEST_WITH_RETURN(dev, file_priv);
1498
1499	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1500
1501	if (copy_from_user(&mask, stipple->mask, 32 * sizeof(u32)))
1502		return -EFAULT;
1503
1504	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1505
1506	r128_cce_dispatch_stipple(dev, mask);
1507
1508	COMMIT_RING();
1509	return 0;
1510}
1511
1512static int r128_cce_indirect(struct drm_device *dev, void *data, struct drm_file *file_priv)
1513{
1514	drm_r128_private_t *dev_priv = dev->dev_private;
1515	struct drm_device_dma *dma = dev->dma;
1516	struct drm_buf *buf;
1517	drm_r128_buf_priv_t *buf_priv;
1518	drm_r128_indirect_t *indirect = data;
1519#if 0
1520	RING_LOCALS;
1521#endif
1522
1523	LOCK_TEST_WITH_RETURN(dev, file_priv);
1524
1525	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1526
1527	DRM_DEBUG("idx=%d s=%d e=%d d=%d\n",
1528		  indirect->idx, indirect->start, indirect->end,
1529		  indirect->discard);
1530
1531	if (indirect->idx < 0 || indirect->idx >= dma->buf_count) {
1532		DRM_ERROR("buffer index %d (of %d max)\n",
1533			  indirect->idx, dma->buf_count - 1);
1534		return -EINVAL;
1535	}
1536
1537	buf = dma->buflist[indirect->idx];
1538	buf_priv = buf->dev_private;
1539
1540	if (buf->file_priv != file_priv) {
1541		DRM_ERROR("process %d using buffer owned by %p\n",
1542			  task_pid_nr(current), buf->file_priv);
1543		return -EINVAL;
1544	}
1545	if (buf->pending) {
1546		DRM_ERROR("sending pending buffer %d\n", indirect->idx);
1547		return -EINVAL;
1548	}
1549
1550	if (indirect->start < buf->used) {
1551		DRM_ERROR("reusing indirect: start=0x%x actual=0x%x\n",
1552			  indirect->start, buf->used);
1553		return -EINVAL;
1554	}
1555
1556	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1557	VB_AGE_TEST_WITH_RETURN(dev_priv);
1558
1559	buf->used = indirect->end;
1560	buf_priv->discard = indirect->discard;
1561
1562#if 0
1563	/* Wait for the 3D stream to idle before the indirect buffer
1564	 * containing 2D acceleration commands is processed.
1565	 */
1566	BEGIN_RING(2);
1567	RADEON_WAIT_UNTIL_3D_IDLE();
1568	ADVANCE_RING();
1569#endif
1570
1571	/* Dispatch the indirect buffer full of commands from the
1572	 * X server.  This is insecure and is thus only available to
1573	 * privileged clients.
1574	 */
1575	r128_cce_dispatch_indirect(dev, buf, indirect->start, indirect->end);
1576
1577	COMMIT_RING();
1578	return 0;
1579}
1580
1581int r128_getparam(struct drm_device *dev, void *data, struct drm_file *file_priv)
1582{
1583	drm_r128_private_t *dev_priv = dev->dev_private;
1584	drm_r128_getparam_t *param = data;
1585	int value;
1586
1587	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1588
1589	DRM_DEBUG("pid=%d\n", task_pid_nr(current));
1590
1591	switch (param->param) {
1592	case R128_PARAM_IRQ_NR:
1593		value = dev->pdev->irq;
1594		break;
1595	default:
1596		return -EINVAL;
1597	}
1598
1599	if (copy_to_user(param->value, &value, sizeof(int))) {
1600		DRM_ERROR("copy_to_user\n");
1601		return -EFAULT;
1602	}
1603
1604	return 0;
1605}
1606
1607void r128_driver_preclose(struct drm_device *dev, struct drm_file *file_priv)
1608{
1609	if (dev->dev_private) {
1610		drm_r128_private_t *dev_priv = dev->dev_private;
1611		if (dev_priv->page_flipping)
1612			r128_do_cleanup_pageflip(dev);
1613	}
1614}
1615void r128_driver_lastclose(struct drm_device *dev)
1616{
1617	r128_do_cleanup_cce(dev);
1618}
1619
1620const struct drm_ioctl_desc r128_ioctls[] = {
1621	DRM_IOCTL_DEF_DRV(R128_INIT, r128_cce_init, DRM_AUTH|DRM_MASTER|DRM_ROOT_ONLY),
1622	DRM_IOCTL_DEF_DRV(R128_CCE_START, r128_cce_start, DRM_AUTH|DRM_MASTER|DRM_ROOT_ONLY),
1623	DRM_IOCTL_DEF_DRV(R128_CCE_STOP, r128_cce_stop, DRM_AUTH|DRM_MASTER|DRM_ROOT_ONLY),
1624	DRM_IOCTL_DEF_DRV(R128_CCE_RESET, r128_cce_reset, DRM_AUTH|DRM_MASTER|DRM_ROOT_ONLY),
1625	DRM_IOCTL_DEF_DRV(R128_CCE_IDLE, r128_cce_idle, DRM_AUTH),
1626	DRM_IOCTL_DEF_DRV(R128_RESET, r128_engine_reset, DRM_AUTH),
1627	DRM_IOCTL_DEF_DRV(R128_FULLSCREEN, r128_fullscreen, DRM_AUTH),
1628	DRM_IOCTL_DEF_DRV(R128_SWAP, r128_cce_swap, DRM_AUTH),
1629	DRM_IOCTL_DEF_DRV(R128_FLIP, r128_cce_flip, DRM_AUTH),
1630	DRM_IOCTL_DEF_DRV(R128_CLEAR, r128_cce_clear, DRM_AUTH),
1631	DRM_IOCTL_DEF_DRV(R128_VERTEX, r128_cce_vertex, DRM_AUTH),
1632	DRM_IOCTL_DEF_DRV(R128_INDICES, r128_cce_indices, DRM_AUTH),
1633	DRM_IOCTL_DEF_DRV(R128_BLIT, r128_cce_blit, DRM_AUTH),
1634	DRM_IOCTL_DEF_DRV(R128_DEPTH, r128_cce_depth, DRM_AUTH),
1635	DRM_IOCTL_DEF_DRV(R128_STIPPLE, r128_cce_stipple, DRM_AUTH),
1636	DRM_IOCTL_DEF_DRV(R128_INDIRECT, r128_cce_indirect, DRM_AUTH|DRM_MASTER|DRM_ROOT_ONLY),
1637	DRM_IOCTL_DEF_DRV(R128_GETPARAM, r128_getparam, DRM_AUTH),
1638};
1639
1640int r128_max_ioctl = ARRAY_SIZE(r128_ioctls);
1641