xref: /titanic_50/usr/src/uts/intel/io/drm/r300_cmdbuf.c (revision 0bdffa0f07e70f45f6810116ca9d547631a4c3f8)
1e57b9183Scg149915 /*
2e57b9183Scg149915  * Copyright 2008 Sun Microsystems, Inc.  All rights reserved.
3e57b9183Scg149915  * Use is subject to license terms.
4e57b9183Scg149915  */
5e57b9183Scg149915 /*
6e57b9183Scg149915  * r300_cmdbuf.c -- Command buffer emission for R300 -*- linux-c -*-
7e57b9183Scg149915  *
8e57b9183Scg149915  * Copyright (C) The Weather Channel, Inc.  2002.
9e57b9183Scg149915  * Copyright (C) 2004 Nicolai Haehnle.
10e57b9183Scg149915  * All Rights Reserved.
11e57b9183Scg149915  *
12e57b9183Scg149915  * The Weather Channel (TM) funded Tungsten Graphics to develop the
13e57b9183Scg149915  * initial release of the Radeon 8500 driver under the XFree86 license.
14e57b9183Scg149915  * This notice must be preserved.
15e57b9183Scg149915  *
16e57b9183Scg149915  * Permission is hereby granted, free of charge, to any person obtaining a
17e57b9183Scg149915  * copy of this software and associated documentation files (the "Software"),
18e57b9183Scg149915  * to deal in the Software without restriction, including without limitation
19e57b9183Scg149915  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
20e57b9183Scg149915  * and/or sell copies of the Software, and to permit persons to whom the
21e57b9183Scg149915  * Software is furnished to do so, subject to the following conditions:
22e57b9183Scg149915  *
23e57b9183Scg149915  * The above copyright notice and this permission notice (including the next
24e57b9183Scg149915  * paragraph) shall be included in all copies or substantial portions of the
25e57b9183Scg149915  * Software.
26e57b9183Scg149915  *
27e57b9183Scg149915  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
28e57b9183Scg149915  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
29e57b9183Scg149915  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
30e57b9183Scg149915  * PRECISION INSIGHT AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
31e57b9183Scg149915  * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
32e57b9183Scg149915  * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
33e57b9183Scg149915  * DEALINGS IN THE SOFTWARE.
34e57b9183Scg149915  *
35e57b9183Scg149915  * Authors:
36e57b9183Scg149915  *    Nicolai Haehnle <prefect_@gmx.net>
37e57b9183Scg149915  */
38e57b9183Scg149915 
39e57b9183Scg149915 #pragma ident	"%Z%%M%	%I%	%E% SMI"
40e57b9183Scg149915 
41e57b9183Scg149915 #include "drm.h"
42e57b9183Scg149915 #include "radeon_drm.h"
43e57b9183Scg149915 #include "drmP.h"
44e57b9183Scg149915 #include "radeon_drv.h"
45e57b9183Scg149915 #include "r300_reg.h"
46e57b9183Scg149915 
47e57b9183Scg149915 #define	R300_SIMULTANEOUS_CLIPRECTS		4
48e57b9183Scg149915 
49e57b9183Scg149915 /*
50e57b9183Scg149915  * Values for R300_RE_CLIPRECT_CNTL depending on the number of
51e57b9183Scg149915  * cliprects
52e57b9183Scg149915  */
53e57b9183Scg149915 static const int r300_cliprect_cntl[4] = {
54e57b9183Scg149915 	0xAAAA,
55e57b9183Scg149915 	0xEEEE,
56e57b9183Scg149915 	0xFEFE,
57e57b9183Scg149915 	0xFFFE
58e57b9183Scg149915 };
59e57b9183Scg149915 
60e57b9183Scg149915 /*
61e57b9183Scg149915  * Emit up to R300_SIMULTANEOUS_CLIPRECTS cliprects from the given command
62e57b9183Scg149915  * buffer, starting with index n.
63e57b9183Scg149915  */
r300_emit_cliprects(drm_radeon_private_t * dev_priv,drm_radeon_kcmd_buffer_t * cmdbuf,int n)64e57b9183Scg149915 static int r300_emit_cliprects(drm_radeon_private_t *dev_priv,
65e57b9183Scg149915     drm_radeon_kcmd_buffer_t *cmdbuf, int n)
66e57b9183Scg149915 {
67e57b9183Scg149915 	drm_clip_rect_t box;
68e57b9183Scg149915 	int nr;
69e57b9183Scg149915 	int i;
70e57b9183Scg149915 	RING_LOCALS;
71e57b9183Scg149915 
72e57b9183Scg149915 	nr = cmdbuf->nbox - n;
73e57b9183Scg149915 	if (nr > R300_SIMULTANEOUS_CLIPRECTS)
74e57b9183Scg149915 		nr = R300_SIMULTANEOUS_CLIPRECTS;
75e57b9183Scg149915 
76e57b9183Scg149915 	DRM_DEBUG("%i cliprects\n", nr);
77e57b9183Scg149915 
78e57b9183Scg149915 	if (nr) {
79e57b9183Scg149915 		BEGIN_RING(6 + nr * 2);
80e57b9183Scg149915 		OUT_RING(CP_PACKET0(R300_RE_CLIPRECT_TL_0, nr * 2 - 1));
81e57b9183Scg149915 
82e57b9183Scg149915 		for (i = 0; i < nr; ++i) {
83e57b9183Scg149915 			if (DRM_COPY_FROM_USER_UNCHECKED
84e57b9183Scg149915 			    (&box, &cmdbuf->boxes[n + i], sizeof (box))) {
85e57b9183Scg149915 				DRM_ERROR("copy cliprect faulted\n");
86e57b9183Scg149915 				return (EFAULT);
87e57b9183Scg149915 			}
88e57b9183Scg149915 
89e57b9183Scg149915 			box.x1 =
90e57b9183Scg149915 			    (box.x1 +
91e57b9183Scg149915 			    R300_CLIPRECT_OFFSET) & R300_CLIPRECT_MASK;
92e57b9183Scg149915 			box.y1 =
93e57b9183Scg149915 			    (box.y1 +
94e57b9183Scg149915 			    R300_CLIPRECT_OFFSET) & R300_CLIPRECT_MASK;
95e57b9183Scg149915 			box.x2 =
96e57b9183Scg149915 			    (box.x2 +
97e57b9183Scg149915 			    R300_CLIPRECT_OFFSET) & R300_CLIPRECT_MASK;
98e57b9183Scg149915 			box.y2 =
99e57b9183Scg149915 			    (box.y2 +
100e57b9183Scg149915 			    R300_CLIPRECT_OFFSET) & R300_CLIPRECT_MASK;
101e57b9183Scg149915 
102e57b9183Scg149915 			OUT_RING((box.x1 << R300_CLIPRECT_X_SHIFT) |
103e57b9183Scg149915 			    (box.y1 << R300_CLIPRECT_Y_SHIFT));
104e57b9183Scg149915 			OUT_RING((box.x2 << R300_CLIPRECT_X_SHIFT) |
105e57b9183Scg149915 			    (box.y2 << R300_CLIPRECT_Y_SHIFT));
106e57b9183Scg149915 		}
107e57b9183Scg149915 
108e57b9183Scg149915 		OUT_RING_REG(R300_RE_CLIPRECT_CNTL, r300_cliprect_cntl[nr - 1]);
109e57b9183Scg149915 
110e57b9183Scg149915 		/*
111e57b9183Scg149915 		 * TODO/SECURITY: Force scissors to a safe value, otherwise
112e57b9183Scg149915 		 * the client might be able to trample over memory.
113e57b9183Scg149915 		 * The impact should be very limited, but I'd rather be safe
114e57b9183Scg149915 		 * than sorry.
115e57b9183Scg149915 		 */
116e57b9183Scg149915 		OUT_RING(CP_PACKET0(R300_RE_SCISSORS_TL, 1));
117e57b9183Scg149915 		OUT_RING(0);
118e57b9183Scg149915 		OUT_RING(R300_SCISSORS_X_MASK | R300_SCISSORS_Y_MASK);
119e57b9183Scg149915 		ADVANCE_RING();
120e57b9183Scg149915 	} else {
121e57b9183Scg149915 		/*
122e57b9183Scg149915 		 * Why we allow zero cliprect rendering:
123e57b9183Scg149915 		 * There are some commands in a command buffer that must be
124e57b9183Scg149915 		 * submitted even when there are no cliprects, e.g. DMA buffer
125e57b9183Scg149915 		 * discard or state setting (though state setting could be
126e57b9183Scg149915 		 * avoided by simulating a loss of context).
127e57b9183Scg149915 		 *
128e57b9183Scg149915 		 * Now since the cmdbuf interface is so chaotic right now (and
129e57b9183Scg149915 		 * is bound to remain that way for a bit until things settle
130e57b9183Scg149915 		 * down), it is basically impossible to filter out the commands
131e57b9183Scg149915 		 * that are necessary and those that aren't.
132e57b9183Scg149915 		 *
133e57b9183Scg149915 		 * So I choose the safe way and don't do any filtering at all;
134e57b9183Scg149915 		 * instead, I simply set up the engine so that all rendering
135e57b9183Scg149915 		 * can't produce any fragments.
136e57b9183Scg149915 		 */
137e57b9183Scg149915 		BEGIN_RING(2);
138e57b9183Scg149915 		OUT_RING_REG(R300_RE_CLIPRECT_CNTL, 0);
139e57b9183Scg149915 		ADVANCE_RING();
140e57b9183Scg149915 	}
141e57b9183Scg149915 
142e57b9183Scg149915 	return (0);
143e57b9183Scg149915 }
144e57b9183Scg149915 
145e57b9183Scg149915 static u8 r300_reg_flags[0x10000 >> 2];
146e57b9183Scg149915 
147e57b9183Scg149915 void
r300_init_reg_flags(void)148e57b9183Scg149915 r300_init_reg_flags(void)
149e57b9183Scg149915 {
150e57b9183Scg149915 	int i;
151e57b9183Scg149915 	(void) memset(r300_reg_flags, 0, 0x10000 >> 2);
152e57b9183Scg149915 #define	ADD_RANGE_MARK(reg, count, mark) \
153e57b9183Scg149915 		for (i = ((reg) >> 2); i < ((reg) >> 2) + (count); i++)\
154e57b9183Scg149915 			r300_reg_flags[i] |= (mark);
155e57b9183Scg149915 
156e57b9183Scg149915 #define	MARK_SAFE		1
157e57b9183Scg149915 #define	MARK_CHECK_OFFSET	2
158e57b9183Scg149915 
159e57b9183Scg149915 #define	ADD_RANGE(reg, count)	ADD_RANGE_MARK(reg, count, MARK_SAFE)
160e57b9183Scg149915 
161e57b9183Scg149915 	/* these match cmducs() command in r300_driver/r300/r300_cmdbuf.c */
162e57b9183Scg149915 	ADD_RANGE(R300_SE_VPORT_XSCALE, 6);
163e57b9183Scg149915 	ADD_RANGE(0x2080, 1);
164e57b9183Scg149915 	ADD_RANGE(R300_SE_VTE_CNTL, 2);
165e57b9183Scg149915 	ADD_RANGE(0x2134, 2);
166e57b9183Scg149915 	ADD_RANGE(0x2140, 1);
167e57b9183Scg149915 	ADD_RANGE(R300_VAP_INPUT_CNTL_0, 2);
168e57b9183Scg149915 	ADD_RANGE(0x21DC, 1);
169e57b9183Scg149915 	ADD_RANGE(0x221C, 1);
170e57b9183Scg149915 	ADD_RANGE(0x2220, 4);
171e57b9183Scg149915 	ADD_RANGE(0x2288, 1);
172e57b9183Scg149915 	ADD_RANGE(R300_VAP_OUTPUT_VTX_FMT_0, 2);
173e57b9183Scg149915 	ADD_RANGE(R300_VAP_PVS_CNTL_1, 3);
174e57b9183Scg149915 	ADD_RANGE(R300_GB_ENABLE, 1);
175e57b9183Scg149915 	ADD_RANGE(R300_GB_MSPOS0, 5);
176e57b9183Scg149915 	ADD_RANGE(R300_TX_CNTL, 1);
177e57b9183Scg149915 	ADD_RANGE(R300_TX_ENABLE, 1);
178e57b9183Scg149915 	ADD_RANGE(0x4200, 4);
179e57b9183Scg149915 	ADD_RANGE(0x4214, 1);
180e57b9183Scg149915 	ADD_RANGE(R300_RE_POINTSIZE, 1);
181e57b9183Scg149915 	ADD_RANGE(0x4230, 3);
182e57b9183Scg149915 	ADD_RANGE(R300_RE_LINE_CNT, 1);
183e57b9183Scg149915 	ADD_RANGE(0x4238, 1);
184e57b9183Scg149915 	ADD_RANGE(0x4260, 3);
185e57b9183Scg149915 	ADD_RANGE(0x4274, 4);
186e57b9183Scg149915 	ADD_RANGE(0x4288, 5);
187e57b9183Scg149915 	ADD_RANGE(0x42A0, 1);
188e57b9183Scg149915 	ADD_RANGE(R300_RE_ZBIAS_T_FACTOR, 4);
189e57b9183Scg149915 	ADD_RANGE(0x42B4, 1);
190e57b9183Scg149915 	ADD_RANGE(R300_RE_CULL_CNTL, 1);
191e57b9183Scg149915 	ADD_RANGE(0x42C0, 2);
192e57b9183Scg149915 	ADD_RANGE(R300_RS_CNTL_0, 2);
193e57b9183Scg149915 	ADD_RANGE(R300_RS_INTERP_0, 8);
194e57b9183Scg149915 	ADD_RANGE(R300_RS_ROUTE_0, 8);
195e57b9183Scg149915 	ADD_RANGE(0x43A4, 2);
196e57b9183Scg149915 	ADD_RANGE(0x43E8, 1);
197e57b9183Scg149915 	ADD_RANGE(R300_PFS_CNTL_0, 3);
198e57b9183Scg149915 	ADD_RANGE(R300_PFS_NODE_0, 4);
199e57b9183Scg149915 	ADD_RANGE(R300_PFS_TEXI_0, 64);
200e57b9183Scg149915 	ADD_RANGE(0x46A4, 5);
201e57b9183Scg149915 	ADD_RANGE(R300_PFS_INSTR0_0, 64);
202e57b9183Scg149915 	ADD_RANGE(R300_PFS_INSTR1_0, 64);
203e57b9183Scg149915 	ADD_RANGE(R300_PFS_INSTR2_0, 64);
204e57b9183Scg149915 	ADD_RANGE(R300_PFS_INSTR3_0, 64);
205e57b9183Scg149915 	ADD_RANGE(0x4BC0, 1);
206e57b9183Scg149915 	ADD_RANGE(0x4BC8, 3);
207e57b9183Scg149915 	ADD_RANGE(R300_PP_ALPHA_TEST, 2);
208e57b9183Scg149915 	ADD_RANGE(0x4BD8, 1);
209e57b9183Scg149915 	ADD_RANGE(R300_PFS_PARAM_0_X, 64);
210e57b9183Scg149915 	ADD_RANGE(0x4E00, 1);
211e57b9183Scg149915 	ADD_RANGE(R300_RB3D_CBLEND, 2);
212e57b9183Scg149915 	ADD_RANGE(R300_RB3D_COLORMASK, 1);
213e57b9183Scg149915 	ADD_RANGE(0x4E10, 3);
214e57b9183Scg149915 	ADD_RANGE_MARK(R300_RB3D_COLOROFFSET0, 1, MARK_CHECK_OFFSET);
215e57b9183Scg149915 					/* check offset */
216e57b9183Scg149915 	ADD_RANGE(R300_RB3D_COLORPITCH0, 1);
217e57b9183Scg149915 	ADD_RANGE(0x4E50, 9);
218e57b9183Scg149915 	ADD_RANGE(0x4E88, 1);
219e57b9183Scg149915 	ADD_RANGE(0x4EA0, 2);
220e57b9183Scg149915 	ADD_RANGE(R300_RB3D_ZSTENCIL_CNTL_0, 3);
221e57b9183Scg149915 	ADD_RANGE(0x4F10, 4);
222e57b9183Scg149915 	ADD_RANGE_MARK(R300_RB3D_DEPTHOFFSET, 1, MARK_CHECK_OFFSET);
223e57b9183Scg149915 					/* check offset */
224e57b9183Scg149915 	ADD_RANGE(R300_RB3D_DEPTHPITCH, 1);
225e57b9183Scg149915 	ADD_RANGE(0x4F28, 1);
226e57b9183Scg149915 	ADD_RANGE(0x4F30, 2);
227e57b9183Scg149915 	ADD_RANGE(0x4F44, 1);
228e57b9183Scg149915 	ADD_RANGE(0x4F54, 1);
229e57b9183Scg149915 
230e57b9183Scg149915 	ADD_RANGE(R300_TX_FILTER_0, 16);
231e57b9183Scg149915 	ADD_RANGE(R300_TX_FILTER1_0, 16);
232e57b9183Scg149915 	ADD_RANGE(R300_TX_SIZE_0, 16);
233e57b9183Scg149915 	ADD_RANGE(R300_TX_FORMAT_0, 16);
234e57b9183Scg149915 	ADD_RANGE(R300_TX_PITCH_0, 16);
235e57b9183Scg149915 	/* Texture offset is dangerous and needs more checking */
236e57b9183Scg149915 	ADD_RANGE_MARK(R300_TX_OFFSET_0, 16, MARK_CHECK_OFFSET);
237e57b9183Scg149915 	ADD_RANGE(R300_TX_CHROMA_KEY_0, 16);
238e57b9183Scg149915 	ADD_RANGE(R300_TX_BORDER_COLOR_0, 16);
239e57b9183Scg149915 
240e57b9183Scg149915 	/* Sporadic registers used as primitives are emitted */
241e57b9183Scg149915 	ADD_RANGE(0x4f18, 1);
242e57b9183Scg149915 	ADD_RANGE(R300_RB3D_DSTCACHE_CTLSTAT, 1);
243e57b9183Scg149915 	ADD_RANGE(R300_VAP_INPUT_ROUTE_0_0, 8);
244e57b9183Scg149915 	ADD_RANGE(R300_VAP_INPUT_ROUTE_1_0, 8);
245e57b9183Scg149915 
246e57b9183Scg149915 }
247e57b9183Scg149915 
r300_check_range(unsigned reg,int count)248e57b9183Scg149915 static __inline__ int r300_check_range(unsigned reg, int count)
249e57b9183Scg149915 {
250e57b9183Scg149915 	int i;
251e57b9183Scg149915 	if (reg & ~0xffff)
252e57b9183Scg149915 		return (-1);
253e57b9183Scg149915 	for (i = (reg >> 2); i < (reg >> 2) + count; i++)
254e57b9183Scg149915 		if (r300_reg_flags[i] != MARK_SAFE)
255e57b9183Scg149915 			return (1);
256e57b9183Scg149915 	return (0);
257e57b9183Scg149915 }
258e57b9183Scg149915 
259e57b9183Scg149915 static inline int
r300_emit_carefully_checked_packet0(drm_radeon_private_t * dev_priv,drm_radeon_kcmd_buffer_t * cmdbuf,drm_r300_cmd_header_t header)260e57b9183Scg149915 r300_emit_carefully_checked_packet0(drm_radeon_private_t *dev_priv,
261e57b9183Scg149915     drm_radeon_kcmd_buffer_t *cmdbuf, drm_r300_cmd_header_t header)
262e57b9183Scg149915 {
263e57b9183Scg149915 	int reg;
264e57b9183Scg149915 	int sz;
265e57b9183Scg149915 	int i;
266e57b9183Scg149915 	int values[64];
267e57b9183Scg149915 	RING_LOCALS;
268e57b9183Scg149915 
269e57b9183Scg149915 	sz = header.packet0.count;
270e57b9183Scg149915 	reg = (header.packet0.reghi << 8) | header.packet0.reglo;
271e57b9183Scg149915 
272e57b9183Scg149915 	if ((sz > 64) || (sz < 0)) {
273e57b9183Scg149915 		DRM_ERROR("Cannot emit more than 64 values at a time "
274e57b9183Scg149915 		    "(reg=%04x sz=%d)\n", reg, sz);
275e57b9183Scg149915 		return (EINVAL);
276e57b9183Scg149915 	}
277e57b9183Scg149915 	for (i = 0; i < sz; i++) {
278e57b9183Scg149915 		values[i] = ((int *)(uintptr_t)cmdbuf->buf)[i];
279e57b9183Scg149915 		switch (r300_reg_flags[(reg >> 2) + i]) {
280e57b9183Scg149915 		case MARK_SAFE:
281e57b9183Scg149915 			break;
282e57b9183Scg149915 		case MARK_CHECK_OFFSET:
283*0bdffa0fShh224818 			if (!RADEON_CHECK_OFFSET(dev_priv, (u32) values[i])) {
284e57b9183Scg149915 				DRM_ERROR("Offset failed range check "
285e57b9183Scg149915 				    "(reg=%04x sz=%d)\n", reg, sz);
286e57b9183Scg149915 				return (EINVAL);
287e57b9183Scg149915 			}
288e57b9183Scg149915 			break;
289e57b9183Scg149915 		default:
290e57b9183Scg149915 			DRM_ERROR("Register %04x failed check as flag=%02x\n",
291e57b9183Scg149915 			    reg + i * 4, r300_reg_flags[(reg >> 2) + i]);
292e57b9183Scg149915 			return (EINVAL);
293e57b9183Scg149915 		}
294e57b9183Scg149915 	}
295e57b9183Scg149915 
296e57b9183Scg149915 	BEGIN_RING(1 + sz);
297e57b9183Scg149915 	OUT_RING(CP_PACKET0(reg, sz - 1));
298e57b9183Scg149915 	OUT_RING_TABLE(values, sz);
299e57b9183Scg149915 	ADVANCE_RING();
300e57b9183Scg149915 
301e57b9183Scg149915 	cmdbuf->buf += sz * 4;
302e57b9183Scg149915 	cmdbuf->bufsz -= sz * 4;
303e57b9183Scg149915 
304e57b9183Scg149915 	return (0);
305e57b9183Scg149915 }
306e57b9183Scg149915 
307e57b9183Scg149915 /*
308e57b9183Scg149915  * Emits a packet0 setting arbitrary registers.
309e57b9183Scg149915  * Called by r300_do_cp_cmdbuf.
310e57b9183Scg149915  *
311e57b9183Scg149915  * Note that checks are performed on contents and addresses of the registers
312e57b9183Scg149915  */
r300_emit_packet0(drm_radeon_private_t * dev_priv,drm_radeon_kcmd_buffer_t * cmdbuf,drm_r300_cmd_header_t header)313e57b9183Scg149915 static __inline__ int r300_emit_packet0(drm_radeon_private_t *dev_priv,
314e57b9183Scg149915 					drm_radeon_kcmd_buffer_t *cmdbuf,
315e57b9183Scg149915 					drm_r300_cmd_header_t header)
316e57b9183Scg149915 {
317e57b9183Scg149915 	int reg;
318e57b9183Scg149915 	int sz;
319e57b9183Scg149915 	RING_LOCALS;
320e57b9183Scg149915 
321e57b9183Scg149915 	sz = header.packet0.count;
322e57b9183Scg149915 	reg = (header.packet0.reghi << 8) | header.packet0.reglo;
323e57b9183Scg149915 
324e57b9183Scg149915 	if (!sz)
325e57b9183Scg149915 		return (0);
326e57b9183Scg149915 
327e57b9183Scg149915 	if (sz * 4 > cmdbuf->bufsz)
328e57b9183Scg149915 		return (EINVAL);
329e57b9183Scg149915 
330e57b9183Scg149915 	if (reg + sz * 4 >= 0x10000) {
331e57b9183Scg149915 		DRM_ERROR("No such registers in hardware reg=%04x sz=%d\n",
332e57b9183Scg149915 		    reg, sz);
333e57b9183Scg149915 		return (EINVAL);
334e57b9183Scg149915 	}
335e57b9183Scg149915 
336e57b9183Scg149915 	if (r300_check_range(reg, sz)) {
337e57b9183Scg149915 		/* go and check everything */
338e57b9183Scg149915 		return (r300_emit_carefully_checked_packet0(dev_priv,
339e57b9183Scg149915 		    cmdbuf, header));
340e57b9183Scg149915 	}
341e57b9183Scg149915 	/*
342e57b9183Scg149915 	 * the rest of the data is safe to emit, whatever the values
343e57b9183Scg149915 	 * the user passed
344e57b9183Scg149915 	 */
345e57b9183Scg149915 
346e57b9183Scg149915 	BEGIN_RING(1 + sz);
347e57b9183Scg149915 	OUT_RING(CP_PACKET0(reg, sz - 1));
348e57b9183Scg149915 	OUT_RING_TABLE(cmdbuf->buf, sz);
349e57b9183Scg149915 	ADVANCE_RING();
350e57b9183Scg149915 
351e57b9183Scg149915 	cmdbuf->buf += sz * 4;
352e57b9183Scg149915 	cmdbuf->bufsz -= sz * 4;
353e57b9183Scg149915 
354e57b9183Scg149915 	return (0);
355e57b9183Scg149915 }
356e57b9183Scg149915 
357e57b9183Scg149915 /*
358e57b9183Scg149915  * Uploads user-supplied vertex program instructions or parameters onto
359e57b9183Scg149915  * the graphics card.
360e57b9183Scg149915  * Called by r300_do_cp_cmdbuf.
361e57b9183Scg149915  */
r300_emit_vpu(drm_radeon_private_t * dev_priv,drm_radeon_kcmd_buffer_t * cmdbuf,drm_r300_cmd_header_t header)362e57b9183Scg149915 static inline int r300_emit_vpu(drm_radeon_private_t *dev_priv,
363e57b9183Scg149915     drm_radeon_kcmd_buffer_t *cmdbuf, drm_r300_cmd_header_t header)
364e57b9183Scg149915 {
365e57b9183Scg149915 	int sz;
366e57b9183Scg149915 	int addr;
367e57b9183Scg149915 	RING_LOCALS;
368e57b9183Scg149915 
369e57b9183Scg149915 	sz = header.vpu.count;
370e57b9183Scg149915 	addr = (header.vpu.adrhi << 8) | header.vpu.adrlo;
371e57b9183Scg149915 
372e57b9183Scg149915 	if (!sz)
373e57b9183Scg149915 		return (0);
374e57b9183Scg149915 	if (sz * 16 > cmdbuf->bufsz)
375e57b9183Scg149915 		return (EINVAL);
376e57b9183Scg149915 
377e57b9183Scg149915 	BEGIN_RING(5 + sz * 4);
378e57b9183Scg149915 	/* Wait for VAP to come to senses.. */
379e57b9183Scg149915 	/*
380e57b9183Scg149915 	 * there is no need to emit it multiple times, (only once before
381e57b9183Scg149915 	 * VAP is programmed, but this optimization is for later
382e57b9183Scg149915 	 */
383e57b9183Scg149915 	OUT_RING_REG(R300_VAP_PVS_WAITIDLE, 0);
384e57b9183Scg149915 	OUT_RING_REG(R300_VAP_PVS_UPLOAD_ADDRESS, addr);
385e57b9183Scg149915 	OUT_RING(CP_PACKET0_TABLE(R300_VAP_PVS_UPLOAD_DATA, sz * 4 - 1));
386e57b9183Scg149915 	OUT_RING_TABLE(cmdbuf->buf, sz * 4);
387e57b9183Scg149915 
388e57b9183Scg149915 	ADVANCE_RING();
389e57b9183Scg149915 
390e57b9183Scg149915 	cmdbuf->buf += sz * 16;
391e57b9183Scg149915 	cmdbuf->bufsz -= sz * 16;
392e57b9183Scg149915 
393e57b9183Scg149915 	return (0);
394e57b9183Scg149915 }
395e57b9183Scg149915 
396e57b9183Scg149915 /*
397e57b9183Scg149915  * Emit a clear packet from userspace.
398e57b9183Scg149915  * Called by r300_emit_packet3.
399e57b9183Scg149915  */
r300_emit_clear(drm_radeon_private_t * dev_priv,drm_radeon_kcmd_buffer_t * cmdbuf)400e57b9183Scg149915 static inline int r300_emit_clear(drm_radeon_private_t *dev_priv,
401e57b9183Scg149915     drm_radeon_kcmd_buffer_t *cmdbuf)
402e57b9183Scg149915 {
403e57b9183Scg149915 	RING_LOCALS;
404e57b9183Scg149915 
405e57b9183Scg149915 	if (8 * 4 > cmdbuf->bufsz)
406e57b9183Scg149915 		return (EINVAL);
407e57b9183Scg149915 
408e57b9183Scg149915 	BEGIN_RING(10);
409e57b9183Scg149915 	OUT_RING(CP_PACKET3(R200_3D_DRAW_IMMD_2, 8));
410e57b9183Scg149915 	OUT_RING(R300_PRIM_TYPE_POINT | R300_PRIM_WALK_RING |
411e57b9183Scg149915 	    (1 << R300_PRIM_NUM_VERTICES_SHIFT));
412e57b9183Scg149915 	OUT_RING_TABLE(cmdbuf->buf, 8);
413e57b9183Scg149915 	ADVANCE_RING();
414e57b9183Scg149915 
415e57b9183Scg149915 	cmdbuf->buf += 8 * 4;
416e57b9183Scg149915 	cmdbuf->bufsz -= 8 * 4;
417e57b9183Scg149915 
418e57b9183Scg149915 	return (0);
419e57b9183Scg149915 }
420e57b9183Scg149915 
r300_emit_3d_load_vbpntr(drm_radeon_private_t * dev_priv,drm_radeon_kcmd_buffer_t * cmdbuf,u32 header)421e57b9183Scg149915 static inline int r300_emit_3d_load_vbpntr(drm_radeon_private_t *dev_priv,
422e57b9183Scg149915     drm_radeon_kcmd_buffer_t *cmdbuf, u32 header)
423e57b9183Scg149915 {
424e57b9183Scg149915 	int count, i, k;
425e57b9183Scg149915 #define	MAX_ARRAY_PACKET		64
426e57b9183Scg149915 	u32 payload[MAX_ARRAY_PACKET];
427e57b9183Scg149915 	u32 narrays;
428e57b9183Scg149915 	RING_LOCALS;
429e57b9183Scg149915 
430e57b9183Scg149915 	count = (header >> 16) & 0x3fff;
431e57b9183Scg149915 
432e57b9183Scg149915 	if ((count + 1) > MAX_ARRAY_PACKET) {
433e57b9183Scg149915 		DRM_ERROR("Too large payload in 3D_LOAD_VBPNTR (count=%d)\n",
434e57b9183Scg149915 		    count);
435e57b9183Scg149915 		return (EINVAL);
436e57b9183Scg149915 	}
437e57b9183Scg149915 	(void) memset(payload, 0, MAX_ARRAY_PACKET * 4);
438e57b9183Scg149915 	(void) memcpy(payload, cmdbuf->buf + 4, (count + 1) * 4);
439e57b9183Scg149915 
440e57b9183Scg149915 	/* carefully check packet contents */
441e57b9183Scg149915 
442e57b9183Scg149915 	narrays = payload[0];
443e57b9183Scg149915 	k = 0;
444e57b9183Scg149915 	i = 1;
445e57b9183Scg149915 	while ((k < narrays) && (i < (count + 1))) {
446e57b9183Scg149915 		i++;		/* skip attribute field */
447*0bdffa0fShh224818 		if (!RADEON_CHECK_OFFSET(dev_priv, payload[i])) {
448e57b9183Scg149915 			DRM_ERROR("Offset failed range check (k=%d i=%d) "
449e57b9183Scg149915 			    "while processing 3D_LOAD_VBPNTR packet.\n",
450e57b9183Scg149915 			    k, i);
451e57b9183Scg149915 			return (EINVAL);
452e57b9183Scg149915 		}
453e57b9183Scg149915 		k++;
454e57b9183Scg149915 		i++;
455e57b9183Scg149915 		if (k == narrays)
456e57b9183Scg149915 			break;
457e57b9183Scg149915 		/* have one more to process, they come in pairs */
458*0bdffa0fShh224818 		if (!RADEON_CHECK_OFFSET(dev_priv, payload[i])) {
459e57b9183Scg149915 			DRM_ERROR("Offset failed range check (k=%d i=%d) "
460e57b9183Scg149915 			    "while processing 3D_LOAD_VBPNTR packet.\n",
461e57b9183Scg149915 			    k, i);
462e57b9183Scg149915 			return (EINVAL);
463e57b9183Scg149915 		}
464e57b9183Scg149915 		k++;
465e57b9183Scg149915 		i++;
466e57b9183Scg149915 	}
467e57b9183Scg149915 	/* do the counts match what we expect ? */
468e57b9183Scg149915 	if ((k != narrays) || (i != (count + 1))) {
469e57b9183Scg149915 		DRM_ERROR("Malformed 3D_LOAD_VBPNTR packet "
470e57b9183Scg149915 		    "(k=%d i=%d narrays=%d count+1=%d).\n",
471e57b9183Scg149915 		    k, i, narrays, count + 1);
472e57b9183Scg149915 		return (EINVAL);
473e57b9183Scg149915 	}
474e57b9183Scg149915 
475e57b9183Scg149915 	/* all clear, output packet */
476e57b9183Scg149915 
477e57b9183Scg149915 	BEGIN_RING(count + 2);
478e57b9183Scg149915 	OUT_RING(header);
479e57b9183Scg149915 	OUT_RING_TABLE(payload, count + 1);
480e57b9183Scg149915 	ADVANCE_RING();
481e57b9183Scg149915 
482e57b9183Scg149915 	cmdbuf->buf += (count + 2) * 4;
483e57b9183Scg149915 	cmdbuf->bufsz -= (count + 2) * 4;
484e57b9183Scg149915 
485e57b9183Scg149915 	return (0);
486e57b9183Scg149915 }
487e57b9183Scg149915 
r300_emit_bitblt_multi(drm_radeon_private_t * dev_priv,drm_radeon_kcmd_buffer_t * cmdbuf)488e57b9183Scg149915 static inline int r300_emit_bitblt_multi(drm_radeon_private_t *dev_priv,
489e57b9183Scg149915     drm_radeon_kcmd_buffer_t *cmdbuf)
490e57b9183Scg149915 {
491e57b9183Scg149915 	u32 *cmd = (u32 *)(uintptr_t)cmdbuf->buf;
492e57b9183Scg149915 	int count, ret;
493e57b9183Scg149915 	RING_LOCALS;
494e57b9183Scg149915 
495e57b9183Scg149915 	count = (cmd[0] >> 16) & 0x3fff;
496e57b9183Scg149915 
497e57b9183Scg149915 	if (cmd[0] & 0x8000) {
498e57b9183Scg149915 		u32 offset;
499e57b9183Scg149915 
500e57b9183Scg149915 		if (cmd[1] & (RADEON_GMC_SRC_PITCH_OFFSET_CNTL |
501e57b9183Scg149915 		    RADEON_GMC_DST_PITCH_OFFSET_CNTL)) {
502e57b9183Scg149915 			offset = cmd[2] << 10;
503*0bdffa0fShh224818 			ret = !RADEON_CHECK_OFFSET(dev_priv, offset);
504e57b9183Scg149915 			if (ret) {
505e57b9183Scg149915 				DRM_ERROR("Invalid bitblt first offset "
506e57b9183Scg149915 				    "is %08X\n", offset);
507e57b9183Scg149915 				return (EINVAL);
508e57b9183Scg149915 			}
509e57b9183Scg149915 		}
510e57b9183Scg149915 
511e57b9183Scg149915 		if ((cmd[1] & RADEON_GMC_SRC_PITCH_OFFSET_CNTL) &&
512e57b9183Scg149915 		    (cmd[1] & RADEON_GMC_DST_PITCH_OFFSET_CNTL)) {
513e57b9183Scg149915 			offset = cmd[3] << 10;
514*0bdffa0fShh224818 			ret = !RADEON_CHECK_OFFSET(dev_priv, offset);
515e57b9183Scg149915 			if (ret) {
516e57b9183Scg149915 				DRM_ERROR("Invalid bitblt second offset "
517e57b9183Scg149915 				    "is %08X\n", offset);
518e57b9183Scg149915 				return (EINVAL);
519e57b9183Scg149915 			}
520e57b9183Scg149915 
521e57b9183Scg149915 		}
522e57b9183Scg149915 	}
523e57b9183Scg149915 
524e57b9183Scg149915 	BEGIN_RING(count+2);
525e57b9183Scg149915 	OUT_RING(cmd[0]);
526e57b9183Scg149915 	OUT_RING_TABLE((cmdbuf->buf + 4), count + 1);
527e57b9183Scg149915 	ADVANCE_RING();
528e57b9183Scg149915 
529e57b9183Scg149915 	cmdbuf->buf += (count+2)*4;
530e57b9183Scg149915 	cmdbuf->bufsz -= (count+2)*4;
531e57b9183Scg149915 
532e57b9183Scg149915 	return (0);
533e57b9183Scg149915 }
534e57b9183Scg149915 
535e57b9183Scg149915 
r300_emit_indx_buffer(drm_radeon_private_t * dev_priv,drm_radeon_kcmd_buffer_t * cmdbuf)536e57b9183Scg149915 static inline int r300_emit_indx_buffer(drm_radeon_private_t *dev_priv,
537e57b9183Scg149915     drm_radeon_kcmd_buffer_t *cmdbuf)
538e57b9183Scg149915 {
539e57b9183Scg149915 	u32 *cmd = (u32 *)(uintptr_t)cmdbuf->buf;
540e57b9183Scg149915 	int count, ret;
541e57b9183Scg149915 	RING_LOCALS;
542e57b9183Scg149915 
543e57b9183Scg149915 	count = (cmd[0]>>16) & 0x3fff;
544e57b9183Scg149915 
545e57b9183Scg149915 	if ((cmd[1] & 0x8000ffff) != 0x80000810) {
546e57b9183Scg149915 		DRM_ERROR("Invalid indx_buffer reg address %08X\n", cmd[1]);
547e57b9183Scg149915 		return (EINVAL);
548e57b9183Scg149915 	}
549*0bdffa0fShh224818 	ret = !RADEON_CHECK_OFFSET(dev_priv, cmd[2]);
550e57b9183Scg149915 	if (ret) {
551e57b9183Scg149915 		DRM_ERROR("Invalid indx_buffer offset is %08X\n", cmd[2]);
552e57b9183Scg149915 		return (EINVAL);
553e57b9183Scg149915 	}
554e57b9183Scg149915 
555e57b9183Scg149915 	BEGIN_RING(count+2);
556e57b9183Scg149915 	OUT_RING(cmd[0]);
557e57b9183Scg149915 	OUT_RING_TABLE(cmdbuf->buf + 4, count + 1);
558e57b9183Scg149915 	ADVANCE_RING();
559e57b9183Scg149915 
560e57b9183Scg149915 	cmdbuf->buf += (count+2)*4;
561e57b9183Scg149915 	cmdbuf->bufsz -= (count+2)*4;
562e57b9183Scg149915 
563e57b9183Scg149915 	return (0);
564e57b9183Scg149915 }
565e57b9183Scg149915 
566e57b9183Scg149915 
r300_emit_raw_packet3(drm_radeon_private_t * dev_priv,drm_radeon_kcmd_buffer_t * cmdbuf)567e57b9183Scg149915 static __inline__ int r300_emit_raw_packet3(drm_radeon_private_t *dev_priv,
568e57b9183Scg149915 					    drm_radeon_kcmd_buffer_t *cmdbuf)
569e57b9183Scg149915 {
570e57b9183Scg149915 	u32 header;
571e57b9183Scg149915 	int count;
572e57b9183Scg149915 	RING_LOCALS;
573e57b9183Scg149915 
574e57b9183Scg149915 	if (4 > cmdbuf->bufsz)
575e57b9183Scg149915 		return (EINVAL);
576e57b9183Scg149915 
577e57b9183Scg149915 	/*
578e57b9183Scg149915 	 * Fixme !! This simply emits a packet without much checking.
579e57b9183Scg149915 	 * We need to be smarter.
580e57b9183Scg149915 	 */
581e57b9183Scg149915 
582e57b9183Scg149915 	/* obtain first word - actual packet3 header */
583e57b9183Scg149915 	header = *(u32 *)(uintptr_t)cmdbuf->buf;
584e57b9183Scg149915 
585e57b9183Scg149915 	/* Is it packet 3 ? */
586e57b9183Scg149915 	if ((header >> 30) != 0x3) {
587e57b9183Scg149915 		DRM_ERROR("Not a packet3 header (0x%08x)\n", header);
588e57b9183Scg149915 		return (EINVAL);
589e57b9183Scg149915 	}
590e57b9183Scg149915 
591e57b9183Scg149915 	count = (header >> 16) & 0x3fff;
592e57b9183Scg149915 
593e57b9183Scg149915 	/* Check again now that we know how much data to expect */
594e57b9183Scg149915 	if ((count + 2) * 4 > cmdbuf->bufsz) {
595e57b9183Scg149915 		DRM_ERROR("Expected packet3 of length %d but have only "
596e57b9183Scg149915 		    "%d bytes left\n", (count + 2) * 4, cmdbuf->bufsz);
597e57b9183Scg149915 		return (EINVAL);
598e57b9183Scg149915 	}
599e57b9183Scg149915 
600e57b9183Scg149915 	/* Is it a packet type we know about ? */
601e57b9183Scg149915 	switch (header & 0xff00) {
602e57b9183Scg149915 	case RADEON_3D_LOAD_VBPNTR:	/* load vertex array pointers */
603e57b9183Scg149915 		return (r300_emit_3d_load_vbpntr(dev_priv, cmdbuf, header));
604e57b9183Scg149915 
605e57b9183Scg149915 	case RADEON_CNTL_BITBLT_MULTI:
606e57b9183Scg149915 		return (r300_emit_bitblt_multi(dev_priv, cmdbuf));
607e57b9183Scg149915 
608e57b9183Scg149915 	case RADEON_CP_INDX_BUFFER:
609e57b9183Scg149915 			// DRAW_INDX_2 without INDX_BUFFER seems to lock
610e57b9183Scg149915 			// up the GPU
611e57b9183Scg149915 		return (r300_emit_indx_buffer(dev_priv, cmdbuf));
612e57b9183Scg149915 
613e57b9183Scg149915 	case RADEON_CP_3D_DRAW_IMMD_2:
614e57b9183Scg149915 			/* triggers drawing using in-packet vertex data */
615e57b9183Scg149915 	case RADEON_CP_3D_DRAW_VBUF_2:
616e57b9183Scg149915 			/* triggers drawing of vertex buffers setup elsewhere */
617e57b9183Scg149915 	case RADEON_CP_3D_DRAW_INDX_2:
618e57b9183Scg149915 			/* triggers drawing using indices to vertex buffer */
619e57b9183Scg149915 	case RADEON_WAIT_FOR_IDLE:
620e57b9183Scg149915 	case RADEON_CP_NOP:
621e57b9183Scg149915 		/* these packets are safe */
622e57b9183Scg149915 		break;
623e57b9183Scg149915 	default:
624e57b9183Scg149915 		DRM_ERROR("Unknown packet3 header (0x%08x)\n", header);
625e57b9183Scg149915 		return (EINVAL);
626e57b9183Scg149915 	}
627e57b9183Scg149915 
628e57b9183Scg149915 	BEGIN_RING(count + 2);
629e57b9183Scg149915 	OUT_RING(header);
630e57b9183Scg149915 	OUT_RING_TABLE((cmdbuf->buf + 4), count + 1);
631e57b9183Scg149915 	ADVANCE_RING();
632e57b9183Scg149915 
633e57b9183Scg149915 	cmdbuf->buf += (count + 2) * 4;
634e57b9183Scg149915 	cmdbuf->bufsz -= (count + 2) * 4;
635e57b9183Scg149915 
636e57b9183Scg149915 	return (0);
637e57b9183Scg149915 }
638e57b9183Scg149915 
639e57b9183Scg149915 /*
640e57b9183Scg149915  * Emit a rendering packet3 from userspace.
641e57b9183Scg149915  * Called by r300_do_cp_cmdbuf.
642e57b9183Scg149915  */
r300_emit_packet3(drm_radeon_private_t * dev_priv,drm_radeon_kcmd_buffer_t * cmdbuf,drm_r300_cmd_header_t header)643e57b9183Scg149915 static __inline__ int r300_emit_packet3(drm_radeon_private_t *dev_priv,
644e57b9183Scg149915     drm_radeon_kcmd_buffer_t *cmdbuf, drm_r300_cmd_header_t header)
645e57b9183Scg149915 {
646e57b9183Scg149915 	int n;
647e57b9183Scg149915 	int ret;
648e57b9183Scg149915 	char *orig_buf = cmdbuf->buf;
649e57b9183Scg149915 	int orig_bufsz = cmdbuf->bufsz;
650e57b9183Scg149915 
651e57b9183Scg149915 	/*
652e57b9183Scg149915 	 * This is a do-while-loop so that we run the interior at least once,
653e57b9183Scg149915 	 * even if cmdbuf->nbox is 0. Compare r300_emit_cliprects for rationale.
654e57b9183Scg149915 	 */
655e57b9183Scg149915 	n = 0;
656e57b9183Scg149915 	do {
657e57b9183Scg149915 		if (cmdbuf->nbox > R300_SIMULTANEOUS_CLIPRECTS) {
658e57b9183Scg149915 			ret = r300_emit_cliprects(dev_priv, cmdbuf, n);
659e57b9183Scg149915 			if (ret)
660e57b9183Scg149915 				return (ret);
661e57b9183Scg149915 
662e57b9183Scg149915 			cmdbuf->buf = orig_buf;
663e57b9183Scg149915 			cmdbuf->bufsz = orig_bufsz;
664e57b9183Scg149915 		}
665e57b9183Scg149915 
666e57b9183Scg149915 		switch (header.packet3.packet) {
667e57b9183Scg149915 		case R300_CMD_PACKET3_CLEAR:
668e57b9183Scg149915 			DRM_DEBUG("R300_CMD_PACKET3_CLEAR\n");
669e57b9183Scg149915 			ret = r300_emit_clear(dev_priv, cmdbuf);
670e57b9183Scg149915 			if (ret) {
671e57b9183Scg149915 				DRM_ERROR("r300_emit_clear failed\n");
672e57b9183Scg149915 				return (ret);
673e57b9183Scg149915 			}
674e57b9183Scg149915 			break;
675e57b9183Scg149915 
676e57b9183Scg149915 		case R300_CMD_PACKET3_RAW:
677e57b9183Scg149915 			DRM_DEBUG("R300_CMD_PACKET3_RAW\n");
678e57b9183Scg149915 			ret = r300_emit_raw_packet3(dev_priv, cmdbuf);
679e57b9183Scg149915 			if (ret) {
680e57b9183Scg149915 				DRM_ERROR("r300_emit_raw_packet3 failed\n");
681e57b9183Scg149915 				return (ret);
682e57b9183Scg149915 			}
683e57b9183Scg149915 			break;
684e57b9183Scg149915 
685e57b9183Scg149915 		default:
686e57b9183Scg149915 			DRM_ERROR("bad packet3 type %i at %p\n",
687e57b9183Scg149915 			    header.packet3.packet,
688e57b9183Scg149915 			    cmdbuf->buf - sizeof (header));
689e57b9183Scg149915 			return (EINVAL);
690e57b9183Scg149915 		}
691e57b9183Scg149915 
692e57b9183Scg149915 		n += R300_SIMULTANEOUS_CLIPRECTS;
693e57b9183Scg149915 	} while (n < cmdbuf->nbox);
694e57b9183Scg149915 
695e57b9183Scg149915 	return (0);
696e57b9183Scg149915 }
697e57b9183Scg149915 
698e57b9183Scg149915 /*
699e57b9183Scg149915  * Some of the R300 chips seem to be extremely touchy about the two registers
700e57b9183Scg149915  * that are configured in r300_pacify.
701e57b9183Scg149915  * Among the worst offenders seems to be the R300 ND (0x4E44): When userspace
702e57b9183Scg149915  * sends a command buffer that contains only state setting commands and a
703e57b9183Scg149915  * vertex program/parameter upload sequence, this will eventually lead to a
704e57b9183Scg149915  * lockup, unless the sequence is bracketed by calls to r300_pacify.
705e57b9183Scg149915  * So we should take great care to *always* call r300_pacify before
706e57b9183Scg149915  * *anything* 3D related, and again afterwards. This is what the
707e57b9183Scg149915  * call bracket in r300_do_cp_cmdbuf is for.
708e57b9183Scg149915  */
709e57b9183Scg149915 
710e57b9183Scg149915 /*
711e57b9183Scg149915  * Emit the sequence to pacify R300.
712e57b9183Scg149915  */
r300_pacify(drm_radeon_private_t * dev_priv)713e57b9183Scg149915 static __inline__ void r300_pacify(drm_radeon_private_t *dev_priv)
714e57b9183Scg149915 {
715e57b9183Scg149915 	RING_LOCALS;
716e57b9183Scg149915 
717e57b9183Scg149915 	BEGIN_RING(6);
718e57b9183Scg149915 	OUT_RING(CP_PACKET0(R300_RB3D_DSTCACHE_CTLSTAT, 0));
719e57b9183Scg149915 	OUT_RING(0xa);
720e57b9183Scg149915 	OUT_RING(CP_PACKET0(0x4f18, 0));
721e57b9183Scg149915 	OUT_RING(0x3);
722e57b9183Scg149915 	OUT_RING(CP_PACKET3(RADEON_CP_NOP, 0));
723e57b9183Scg149915 	OUT_RING(0x0);
724e57b9183Scg149915 	ADVANCE_RING();
725e57b9183Scg149915 }
726e57b9183Scg149915 
727e57b9183Scg149915 /*
728e57b9183Scg149915  * Called by r300_do_cp_cmdbuf to update the internal buffer age and state.
729e57b9183Scg149915  * The actual age emit is done by r300_do_cp_cmdbuf, which is why you must
730e57b9183Scg149915  * be careful about how this function is called.
731e57b9183Scg149915  */
r300_discard_buffer(drm_device_t * dev,drm_buf_t * buf)732e57b9183Scg149915 static void r300_discard_buffer(drm_device_t *dev, drm_buf_t *buf)
733e57b9183Scg149915 {
734e57b9183Scg149915 	drm_radeon_private_t *dev_priv = dev->dev_private;
735e57b9183Scg149915 	drm_radeon_buf_priv_t *buf_priv = buf->dev_private;
736e57b9183Scg149915 
737e57b9183Scg149915 	buf_priv->age = ++dev_priv->sarea_priv->last_dispatch;
738e57b9183Scg149915 	buf->pending = 1;
739e57b9183Scg149915 	buf->used = 0;
740e57b9183Scg149915 }
741e57b9183Scg149915 
r300_scratch(drm_radeon_private_t * dev_priv,drm_radeon_kcmd_buffer_t * cmdbuf,drm_r300_cmd_header_t header)742e57b9183Scg149915 static int r300_scratch(drm_radeon_private_t *dev_priv,
743e57b9183Scg149915 			drm_radeon_kcmd_buffer_t *cmdbuf,
744e57b9183Scg149915 			drm_r300_cmd_header_t header)
745e57b9183Scg149915 {
746e57b9183Scg149915 	u32 *ref_age_base;
747e57b9183Scg149915 	u32 i, buf_idx, h_pending;
748e57b9183Scg149915 	RING_LOCALS;
749e57b9183Scg149915 
750e57b9183Scg149915 	if (cmdbuf->bufsz < sizeof (uint64_t) +
751e57b9183Scg149915 	    header.scratch.n_bufs * sizeof (buf_idx)) {
752e57b9183Scg149915 		return (EINVAL);
753e57b9183Scg149915 	}
754e57b9183Scg149915 
755e57b9183Scg149915 	if (header.scratch.reg >= 5) {
756e57b9183Scg149915 		return (EINVAL);
757e57b9183Scg149915 	}
758e57b9183Scg149915 
759e57b9183Scg149915 	dev_priv->scratch_ages[header.scratch.reg] ++;
760e57b9183Scg149915 
761e57b9183Scg149915 	ref_age_base = (u32 *)(uintptr_t)*((uint64_t *)(uintptr_t)cmdbuf->buf);
762e57b9183Scg149915 
763e57b9183Scg149915 	cmdbuf->buf += sizeof (uint64_t);
764e57b9183Scg149915 	cmdbuf->bufsz -= sizeof (uint64_t);
765e57b9183Scg149915 
766e57b9183Scg149915 	for (i = 0; i < header.scratch.n_bufs; i++) {
767e57b9183Scg149915 		buf_idx = *(u32 *)(uintptr_t)cmdbuf->buf;
768e57b9183Scg149915 		buf_idx *= 2; /* 8 bytes per buf */
769e57b9183Scg149915 
770e57b9183Scg149915 		if (DRM_COPY_TO_USER(ref_age_base + buf_idx,
771e57b9183Scg149915 		    &dev_priv->scratch_ages[header.scratch.reg],
772e57b9183Scg149915 		    sizeof (u32))) {
773e57b9183Scg149915 			return (EINVAL);
774e57b9183Scg149915 		}
775e57b9183Scg149915 
776e57b9183Scg149915 		if (DRM_COPY_FROM_USER(&h_pending,
777e57b9183Scg149915 		    ref_age_base + buf_idx + 1, sizeof (u32))) {
778e57b9183Scg149915 			return (EINVAL);
779e57b9183Scg149915 		}
780e57b9183Scg149915 
781e57b9183Scg149915 		if (h_pending == 0) {
782e57b9183Scg149915 			return (EINVAL);
783e57b9183Scg149915 		}
784e57b9183Scg149915 
785e57b9183Scg149915 		h_pending--;
786e57b9183Scg149915 
787e57b9183Scg149915 		if (DRM_COPY_TO_USER(ref_age_base + buf_idx + 1,
788e57b9183Scg149915 		    &h_pending, sizeof (u32))) {
789e57b9183Scg149915 			return (EINVAL);
790e57b9183Scg149915 		}
791e57b9183Scg149915 
792e57b9183Scg149915 		cmdbuf->buf += sizeof (buf_idx);
793e57b9183Scg149915 		cmdbuf->bufsz -= sizeof (buf_idx);
794e57b9183Scg149915 	}
795e57b9183Scg149915 
796e57b9183Scg149915 	BEGIN_RING(2);
797e57b9183Scg149915 	OUT_RING(CP_PACKET0(RADEON_SCRATCH_REG0 + header.scratch.reg * 4, 0));
798e57b9183Scg149915 	OUT_RING(dev_priv->scratch_ages[header.scratch.reg]);
799e57b9183Scg149915 	ADVANCE_RING();
800e57b9183Scg149915 
801e57b9183Scg149915 	return (0);
802e57b9183Scg149915 }
803e57b9183Scg149915 
804e57b9183Scg149915 /*
805e57b9183Scg149915  * Parses and validates a user-supplied command buffer and emits appropriate
806e57b9183Scg149915  * commands on the DMA ring buffer.
807e57b9183Scg149915  * Called by the ioctl handler function radeon_cp_cmdbuf.
808e57b9183Scg149915  */
809e57b9183Scg149915 /*ARGSUSED*/
810e57b9183Scg149915 int
r300_do_cp_cmdbuf(drm_device_t * dev,drm_file_t * fpriv,drm_radeon_kcmd_buffer_t * cmdbuf)811e57b9183Scg149915 r300_do_cp_cmdbuf(drm_device_t *dev,
812e57b9183Scg149915     drm_file_t *fpriv, drm_radeon_kcmd_buffer_t *cmdbuf)
813e57b9183Scg149915 {
814e57b9183Scg149915 	drm_radeon_private_t *dev_priv = dev->dev_private;
815e57b9183Scg149915 	drm_device_dma_t *dma = dev->dma;
816e57b9183Scg149915 	drm_buf_t *buf = NULL;
817e57b9183Scg149915 	int emit_dispatch_age = 0;
818e57b9183Scg149915 	int ret = 0;
819e57b9183Scg149915 
820e57b9183Scg149915 	DRM_DEBUG("\n");
821e57b9183Scg149915 
822e57b9183Scg149915 	/*
823e57b9183Scg149915 	 * See the comment above r300_emit_begin3d for why this call
824e57b9183Scg149915 	 * must be here, and what the cleanup gotos are for.
825e57b9183Scg149915 	 */
826e57b9183Scg149915 	r300_pacify(dev_priv);
827e57b9183Scg149915 
828e57b9183Scg149915 	if (cmdbuf->nbox <= R300_SIMULTANEOUS_CLIPRECTS) {
829e57b9183Scg149915 		ret = r300_emit_cliprects(dev_priv, cmdbuf, 0);
830e57b9183Scg149915 		if (ret)
831e57b9183Scg149915 			goto cleanup;
832e57b9183Scg149915 	}
833e57b9183Scg149915 
834e57b9183Scg149915 	while (cmdbuf->bufsz >= sizeof (drm_r300_cmd_header_t)) {
835e57b9183Scg149915 		int idx;
836e57b9183Scg149915 		drm_r300_cmd_header_t header;
837e57b9183Scg149915 
838e57b9183Scg149915 		header.u = *(unsigned int *)(uintptr_t)cmdbuf->buf;
839e57b9183Scg149915 
840e57b9183Scg149915 		cmdbuf->buf += sizeof (header);
841e57b9183Scg149915 		cmdbuf->bufsz -= sizeof (header);
842e57b9183Scg149915 
843e57b9183Scg149915 		switch (header.header.cmd_type) {
844e57b9183Scg149915 		case R300_CMD_PACKET0:
845e57b9183Scg149915 			DRM_DEBUG("R300_CMD_PACKET0\n");
846e57b9183Scg149915 			ret = r300_emit_packet0(dev_priv, cmdbuf, header);
847e57b9183Scg149915 			if (ret) {
848e57b9183Scg149915 				DRM_ERROR("r300_emit_packet0 failed\n");
849e57b9183Scg149915 				goto cleanup;
850e57b9183Scg149915 			}
851e57b9183Scg149915 			break;
852e57b9183Scg149915 
853e57b9183Scg149915 		case R300_CMD_VPU:
854e57b9183Scg149915 			DRM_DEBUG("R300_CMD_VPU\n");
855e57b9183Scg149915 			ret = r300_emit_vpu(dev_priv, cmdbuf, header);
856e57b9183Scg149915 			if (ret) {
857e57b9183Scg149915 				DRM_ERROR("r300_emit_vpu failed\n");
858e57b9183Scg149915 				goto cleanup;
859e57b9183Scg149915 			}
860e57b9183Scg149915 			break;
861e57b9183Scg149915 
862e57b9183Scg149915 		case R300_CMD_PACKET3:
863e57b9183Scg149915 			DRM_DEBUG("R300_CMD_PACKET3\n");
864e57b9183Scg149915 			ret = r300_emit_packet3(dev_priv, cmdbuf, header);
865e57b9183Scg149915 			if (ret) {
866e57b9183Scg149915 				DRM_ERROR("r300_emit_packet3 failed\n");
867e57b9183Scg149915 				goto cleanup;
868e57b9183Scg149915 			}
869e57b9183Scg149915 			break;
870e57b9183Scg149915 
871e57b9183Scg149915 		case R300_CMD_END3D:
872e57b9183Scg149915 			DRM_DEBUG("R300_CMD_END3D\n");
873e57b9183Scg149915 			/*
874e57b9183Scg149915 			 * TODO:
875e57b9183Scg149915 			 * Ideally userspace driver should not need to issue
876e57b9183Scg149915 			 * this call, i.e. the drm driver should issue it
877e57b9183Scg149915 			 * automatically and prevent lockups. In practice, we
878e57b9183Scg149915 			 * do not understand why this call is needed and what
879e57b9183Scg149915 			 * it does (except for some vague guesses that it has
880e57b9183Scg149915 			 * to do with cache coherence) and so the user space
881e57b9183Scg149915 			 * driver does it.
882e57b9183Scg149915 			 *
883e57b9183Scg149915 			 * Once we are sure which uses prevent lockups the code
884e57b9183Scg149915 			 * could be moved into the kernel and the userspace
885e57b9183Scg149915 			 * driver will not need to use this command.
886e57b9183Scg149915 			 *
887e57b9183Scg149915 			 * Note that issuing this command does not hurt anything
888e57b9183Scg149915 			 * except, possibly, performance
889e57b9183Scg149915 			 */
890e57b9183Scg149915 			r300_pacify(dev_priv);
891e57b9183Scg149915 			break;
892e57b9183Scg149915 
893e57b9183Scg149915 		case R300_CMD_CP_DELAY:
894e57b9183Scg149915 			/* simple enough, we can do it here */
895e57b9183Scg149915 			DRM_DEBUG("R300_CMD_CP_DELAY\n");
896e57b9183Scg149915 			{
897e57b9183Scg149915 				int i;
898e57b9183Scg149915 				RING_LOCALS;
899e57b9183Scg149915 
900e57b9183Scg149915 				BEGIN_RING(header.delay.count);
901e57b9183Scg149915 				for (i = 0; i < header.delay.count; i++)
902e57b9183Scg149915 					OUT_RING(RADEON_CP_PACKET2);
903e57b9183Scg149915 				ADVANCE_RING();
904e57b9183Scg149915 			}
905e57b9183Scg149915 			break;
906e57b9183Scg149915 
907e57b9183Scg149915 		case R300_CMD_DMA_DISCARD:
908e57b9183Scg149915 			DRM_DEBUG("RADEON_CMD_DMA_DISCARD\n");
909e57b9183Scg149915 			idx = header.dma.buf_idx;
910e57b9183Scg149915 			if (idx < 0 || idx >= dma->buf_count) {
911e57b9183Scg149915 				DRM_ERROR("buffer index %d (of %d max)\n",
912e57b9183Scg149915 				    idx, dma->buf_count - 1);
913e57b9183Scg149915 				ret = EINVAL;
914e57b9183Scg149915 				goto cleanup;
915e57b9183Scg149915 			}
916e57b9183Scg149915 
917e57b9183Scg149915 			buf = dma->buflist[idx];
918e57b9183Scg149915 			if (buf->filp != fpriv || buf->pending) {
919e57b9183Scg149915 				DRM_ERROR("bad buffer %p %p %d\n",
920e57b9183Scg149915 				    buf->filp, fpriv, buf->pending);
921e57b9183Scg149915 				ret = EINVAL;
922e57b9183Scg149915 				goto cleanup;
923e57b9183Scg149915 			}
924e57b9183Scg149915 
925e57b9183Scg149915 			emit_dispatch_age = 1;
926e57b9183Scg149915 			r300_discard_buffer(dev, buf);
927e57b9183Scg149915 			break;
928e57b9183Scg149915 
929e57b9183Scg149915 		case R300_CMD_WAIT:
930e57b9183Scg149915 			/* simple enough, we can do it here */
931e57b9183Scg149915 			DRM_DEBUG("R300_CMD_WAIT\n");
932e57b9183Scg149915 			if (header.wait.flags == 0)
933e57b9183Scg149915 				break;	/* nothing to do */
934e57b9183Scg149915 
935e57b9183Scg149915 			{
936e57b9183Scg149915 				RING_LOCALS;
937e57b9183Scg149915 
938e57b9183Scg149915 				BEGIN_RING(2);
939e57b9183Scg149915 				OUT_RING(CP_PACKET0(RADEON_WAIT_UNTIL, 0));
940e57b9183Scg149915 				OUT_RING((header.wait.flags & 0xf) << 14);
941e57b9183Scg149915 				ADVANCE_RING();
942e57b9183Scg149915 			}
943e57b9183Scg149915 			break;
944e57b9183Scg149915 
945e57b9183Scg149915 		case R300_CMD_SCRATCH:
946e57b9183Scg149915 			DRM_DEBUG("R300_CMD_SCRATCH\n");
947e57b9183Scg149915 			ret = r300_scratch(dev_priv, cmdbuf, header);
948e57b9183Scg149915 			if (ret) {
949e57b9183Scg149915 				DRM_ERROR("r300_scratch failed\n");
950e57b9183Scg149915 				goto cleanup;
951e57b9183Scg149915 			}
952e57b9183Scg149915 			break;
953e57b9183Scg149915 
954e57b9183Scg149915 		default:
955e57b9183Scg149915 			DRM_ERROR("bad cmd_type %i at %p\n",
956e57b9183Scg149915 			    header.header.cmd_type,
957e57b9183Scg149915 			    cmdbuf->buf - sizeof (header));
958e57b9183Scg149915 			ret = EINVAL;
959e57b9183Scg149915 			goto cleanup;
960e57b9183Scg149915 		}
961e57b9183Scg149915 	}
962e57b9183Scg149915 
963e57b9183Scg149915 	DRM_DEBUG("END\n");
964e57b9183Scg149915 
965e57b9183Scg149915 cleanup:
966e57b9183Scg149915 	r300_pacify(dev_priv);
967e57b9183Scg149915 
968e57b9183Scg149915 	/*
969e57b9183Scg149915 	 * We emit the vertex buffer age here, outside the pacifier "brackets"
970e57b9183Scg149915 	 * for two reasons:
971e57b9183Scg149915 	 * (1) This may coalesce multiple age emissions into a single one and
972e57b9183Scg149915 	 * (2) more importantly, some chips lock up hard when scratch registers
973e57b9183Scg149915 	 * 		are written inside the pacifier bracket.
974e57b9183Scg149915 	 */
975e57b9183Scg149915 	if (emit_dispatch_age) {
976e57b9183Scg149915 		RING_LOCALS;
977e57b9183Scg149915 
978e57b9183Scg149915 		/* Emit the vertex buffer age */
979e57b9183Scg149915 		BEGIN_RING(2);
980e57b9183Scg149915 		RADEON_DISPATCH_AGE(dev_priv->sarea_priv->last_dispatch);
981e57b9183Scg149915 		ADVANCE_RING();
982e57b9183Scg149915 	}
983e57b9183Scg149915 
984e57b9183Scg149915 	COMMIT_RING();
985e57b9183Scg149915 
986e57b9183Scg149915 	return (ret);
987e57b9183Scg149915 }
988