Linux Audio

Check our new training course

Loading...
v3.1
   1/* r128_state.c -- State support for r128 -*- linux-c -*-
   2 * Created: Thu Jan 27 02:53:43 2000 by gareth@valinux.com
   3 */
   4/*
   5 * Copyright 2000 VA Linux Systems, Inc., Sunnyvale, California.
   6 * All Rights Reserved.
   7 *
   8 * Permission is hereby granted, free of charge, to any person obtaining a
   9 * copy of this software and associated documentation files (the "Software"),
  10 * to deal in the Software without restriction, including without limitation
  11 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  12 * and/or sell copies of the Software, and to permit persons to whom the
  13 * Software is furnished to do so, subject to the following conditions:
  14 *
  15 * The above copyright notice and this permission notice (including the next
  16 * paragraph) shall be included in all copies or substantial portions of the
  17 * Software.
  18 *
  19 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  20 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  21 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
  22 * PRECISION INSIGHT AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
  23 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
  24 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
  25 * DEALINGS IN THE SOFTWARE.
  26 *
  27 * Authors:
  28 *    Gareth Hughes <gareth@valinux.com>
  29 */
  30
  31#include "drmP.h"
  32#include "drm.h"
  33#include "r128_drm.h"
  34#include "r128_drv.h"
  35
  36/* ================================================================
  37 * CCE hardware state programming functions
  38 */
  39
  40static void r128_emit_clip_rects(drm_r128_private_t *dev_priv,
  41				 struct drm_clip_rect *boxes, int count)
  42{
  43	u32 aux_sc_cntl = 0x00000000;
  44	RING_LOCALS;
  45	DRM_DEBUG("\n");
  46
  47	BEGIN_RING((count < 3 ? count : 3) * 5 + 2);
  48
  49	if (count >= 1) {
  50		OUT_RING(CCE_PACKET0(R128_AUX1_SC_LEFT, 3));
  51		OUT_RING(boxes[0].x1);
  52		OUT_RING(boxes[0].x2 - 1);
  53		OUT_RING(boxes[0].y1);
  54		OUT_RING(boxes[0].y2 - 1);
  55
  56		aux_sc_cntl |= (R128_AUX1_SC_EN | R128_AUX1_SC_MODE_OR);
  57	}
  58	if (count >= 2) {
  59		OUT_RING(CCE_PACKET0(R128_AUX2_SC_LEFT, 3));
  60		OUT_RING(boxes[1].x1);
  61		OUT_RING(boxes[1].x2 - 1);
  62		OUT_RING(boxes[1].y1);
  63		OUT_RING(boxes[1].y2 - 1);
  64
  65		aux_sc_cntl |= (R128_AUX2_SC_EN | R128_AUX2_SC_MODE_OR);
  66	}
  67	if (count >= 3) {
  68		OUT_RING(CCE_PACKET0(R128_AUX3_SC_LEFT, 3));
  69		OUT_RING(boxes[2].x1);
  70		OUT_RING(boxes[2].x2 - 1);
  71		OUT_RING(boxes[2].y1);
  72		OUT_RING(boxes[2].y2 - 1);
  73
  74		aux_sc_cntl |= (R128_AUX3_SC_EN | R128_AUX3_SC_MODE_OR);
  75	}
  76
  77	OUT_RING(CCE_PACKET0(R128_AUX_SC_CNTL, 0));
  78	OUT_RING(aux_sc_cntl);
  79
  80	ADVANCE_RING();
  81}
  82
  83static __inline__ void r128_emit_core(drm_r128_private_t *dev_priv)
  84{
  85	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
  86	drm_r128_context_regs_t *ctx = &sarea_priv->context_state;
  87	RING_LOCALS;
  88	DRM_DEBUG("\n");
  89
  90	BEGIN_RING(2);
  91
  92	OUT_RING(CCE_PACKET0(R128_SCALE_3D_CNTL, 0));
  93	OUT_RING(ctx->scale_3d_cntl);
  94
  95	ADVANCE_RING();
  96}
  97
  98static __inline__ void r128_emit_context(drm_r128_private_t *dev_priv)
  99{
 100	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
 101	drm_r128_context_regs_t *ctx = &sarea_priv->context_state;
 102	RING_LOCALS;
 103	DRM_DEBUG("\n");
 104
 105	BEGIN_RING(13);
 106
 107	OUT_RING(CCE_PACKET0(R128_DST_PITCH_OFFSET_C, 11));
 108	OUT_RING(ctx->dst_pitch_offset_c);
 109	OUT_RING(ctx->dp_gui_master_cntl_c);
 110	OUT_RING(ctx->sc_top_left_c);
 111	OUT_RING(ctx->sc_bottom_right_c);
 112	OUT_RING(ctx->z_offset_c);
 113	OUT_RING(ctx->z_pitch_c);
 114	OUT_RING(ctx->z_sten_cntl_c);
 115	OUT_RING(ctx->tex_cntl_c);
 116	OUT_RING(ctx->misc_3d_state_cntl_reg);
 117	OUT_RING(ctx->texture_clr_cmp_clr_c);
 118	OUT_RING(ctx->texture_clr_cmp_msk_c);
 119	OUT_RING(ctx->fog_color_c);
 120
 121	ADVANCE_RING();
 122}
 123
 124static __inline__ void r128_emit_setup(drm_r128_private_t *dev_priv)
 125{
 126	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
 127	drm_r128_context_regs_t *ctx = &sarea_priv->context_state;
 128	RING_LOCALS;
 129	DRM_DEBUG("\n");
 130
 131	BEGIN_RING(3);
 132
 133	OUT_RING(CCE_PACKET1(R128_SETUP_CNTL, R128_PM4_VC_FPU_SETUP));
 134	OUT_RING(ctx->setup_cntl);
 135	OUT_RING(ctx->pm4_vc_fpu_setup);
 136
 137	ADVANCE_RING();
 138}
 139
 140static __inline__ void r128_emit_masks(drm_r128_private_t *dev_priv)
 141{
 142	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
 143	drm_r128_context_regs_t *ctx = &sarea_priv->context_state;
 144	RING_LOCALS;
 145	DRM_DEBUG("\n");
 146
 147	BEGIN_RING(5);
 148
 149	OUT_RING(CCE_PACKET0(R128_DP_WRITE_MASK, 0));
 150	OUT_RING(ctx->dp_write_mask);
 151
 152	OUT_RING(CCE_PACKET0(R128_STEN_REF_MASK_C, 1));
 153	OUT_RING(ctx->sten_ref_mask_c);
 154	OUT_RING(ctx->plane_3d_mask_c);
 155
 156	ADVANCE_RING();
 157}
 158
 159static __inline__ void r128_emit_window(drm_r128_private_t *dev_priv)
 160{
 161	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
 162	drm_r128_context_regs_t *ctx = &sarea_priv->context_state;
 163	RING_LOCALS;
 164	DRM_DEBUG("\n");
 165
 166	BEGIN_RING(2);
 167
 168	OUT_RING(CCE_PACKET0(R128_WINDOW_XY_OFFSET, 0));
 169	OUT_RING(ctx->window_xy_offset);
 170
 171	ADVANCE_RING();
 172}
 173
 174static __inline__ void r128_emit_tex0(drm_r128_private_t *dev_priv)
 175{
 176	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
 177	drm_r128_context_regs_t *ctx = &sarea_priv->context_state;
 178	drm_r128_texture_regs_t *tex = &sarea_priv->tex_state[0];
 179	int i;
 180	RING_LOCALS;
 181	DRM_DEBUG("\n");
 182
 183	BEGIN_RING(7 + R128_MAX_TEXTURE_LEVELS);
 184
 185	OUT_RING(CCE_PACKET0(R128_PRIM_TEX_CNTL_C,
 186			     2 + R128_MAX_TEXTURE_LEVELS));
 187	OUT_RING(tex->tex_cntl);
 188	OUT_RING(tex->tex_combine_cntl);
 189	OUT_RING(ctx->tex_size_pitch_c);
 190	for (i = 0; i < R128_MAX_TEXTURE_LEVELS; i++)
 191		OUT_RING(tex->tex_offset[i]);
 192
 193	OUT_RING(CCE_PACKET0(R128_CONSTANT_COLOR_C, 1));
 194	OUT_RING(ctx->constant_color_c);
 195	OUT_RING(tex->tex_border_color);
 196
 197	ADVANCE_RING();
 198}
 199
 200static __inline__ void r128_emit_tex1(drm_r128_private_t *dev_priv)
 201{
 202	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
 203	drm_r128_texture_regs_t *tex = &sarea_priv->tex_state[1];
 204	int i;
 205	RING_LOCALS;
 206	DRM_DEBUG("\n");
 207
 208	BEGIN_RING(5 + R128_MAX_TEXTURE_LEVELS);
 209
 210	OUT_RING(CCE_PACKET0(R128_SEC_TEX_CNTL_C, 1 + R128_MAX_TEXTURE_LEVELS));
 211	OUT_RING(tex->tex_cntl);
 212	OUT_RING(tex->tex_combine_cntl);
 213	for (i = 0; i < R128_MAX_TEXTURE_LEVELS; i++)
 214		OUT_RING(tex->tex_offset[i]);
 215
 216	OUT_RING(CCE_PACKET0(R128_SEC_TEXTURE_BORDER_COLOR_C, 0));
 217	OUT_RING(tex->tex_border_color);
 218
 219	ADVANCE_RING();
 220}
 221
 222static void r128_emit_state(drm_r128_private_t *dev_priv)
 223{
 224	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
 225	unsigned int dirty = sarea_priv->dirty;
 226
 227	DRM_DEBUG("dirty=0x%08x\n", dirty);
 228
 229	if (dirty & R128_UPLOAD_CORE) {
 230		r128_emit_core(dev_priv);
 231		sarea_priv->dirty &= ~R128_UPLOAD_CORE;
 232	}
 233
 234	if (dirty & R128_UPLOAD_CONTEXT) {
 235		r128_emit_context(dev_priv);
 236		sarea_priv->dirty &= ~R128_UPLOAD_CONTEXT;
 237	}
 238
 239	if (dirty & R128_UPLOAD_SETUP) {
 240		r128_emit_setup(dev_priv);
 241		sarea_priv->dirty &= ~R128_UPLOAD_SETUP;
 242	}
 243
 244	if (dirty & R128_UPLOAD_MASKS) {
 245		r128_emit_masks(dev_priv);
 246		sarea_priv->dirty &= ~R128_UPLOAD_MASKS;
 247	}
 248
 249	if (dirty & R128_UPLOAD_WINDOW) {
 250		r128_emit_window(dev_priv);
 251		sarea_priv->dirty &= ~R128_UPLOAD_WINDOW;
 252	}
 253
 254	if (dirty & R128_UPLOAD_TEX0) {
 255		r128_emit_tex0(dev_priv);
 256		sarea_priv->dirty &= ~R128_UPLOAD_TEX0;
 257	}
 258
 259	if (dirty & R128_UPLOAD_TEX1) {
 260		r128_emit_tex1(dev_priv);
 261		sarea_priv->dirty &= ~R128_UPLOAD_TEX1;
 262	}
 263
 264	/* Turn off the texture cache flushing */
 265	sarea_priv->context_state.tex_cntl_c &= ~R128_TEX_CACHE_FLUSH;
 266
 267	sarea_priv->dirty &= ~R128_REQUIRE_QUIESCENCE;
 268}
 269
 270#if R128_PERFORMANCE_BOXES
 271/* ================================================================
 272 * Performance monitoring functions
 273 */
 274
 275static void r128_clear_box(drm_r128_private_t *dev_priv,
 276			   int x, int y, int w, int h, int r, int g, int b)
 277{
 278	u32 pitch, offset;
 279	u32 fb_bpp, color;
 280	RING_LOCALS;
 281
 282	switch (dev_priv->fb_bpp) {
 283	case 16:
 284		fb_bpp = R128_GMC_DST_16BPP;
 285		color = (((r & 0xf8) << 8) |
 286			 ((g & 0xfc) << 3) | ((b & 0xf8) >> 3));
 287		break;
 288	case 24:
 289		fb_bpp = R128_GMC_DST_24BPP;
 290		color = ((r << 16) | (g << 8) | b);
 291		break;
 292	case 32:
 293		fb_bpp = R128_GMC_DST_32BPP;
 294		color = (((0xff) << 24) | (r << 16) | (g << 8) | b);
 295		break;
 296	default:
 297		return;
 298	}
 299
 300	offset = dev_priv->back_offset;
 301	pitch = dev_priv->back_pitch >> 3;
 302
 303	BEGIN_RING(6);
 304
 305	OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
 306	OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
 307		 R128_GMC_BRUSH_SOLID_COLOR |
 308		 fb_bpp |
 309		 R128_GMC_SRC_DATATYPE_COLOR |
 310		 R128_ROP3_P |
 311		 R128_GMC_CLR_CMP_CNTL_DIS | R128_GMC_AUX_CLIP_DIS);
 312
 313	OUT_RING((pitch << 21) | (offset >> 5));
 314	OUT_RING(color);
 315
 316	OUT_RING((x << 16) | y);
 317	OUT_RING((w << 16) | h);
 318
 319	ADVANCE_RING();
 320}
 321
 322static void r128_cce_performance_boxes(drm_r128_private_t *dev_priv)
 323{
 324	if (atomic_read(&dev_priv->idle_count) == 0)
 325		r128_clear_box(dev_priv, 64, 4, 8, 8, 0, 255, 0);
 326	else
 327		atomic_set(&dev_priv->idle_count, 0);
 328}
 329
 330#endif
 331
 332/* ================================================================
 333 * CCE command dispatch functions
 334 */
 335
 336static void r128_print_dirty(const char *msg, unsigned int flags)
 337{
 338	DRM_INFO("%s: (0x%x) %s%s%s%s%s%s%s%s%s\n",
 339		 msg,
 340		 flags,
 341		 (flags & R128_UPLOAD_CORE) ? "core, " : "",
 342		 (flags & R128_UPLOAD_CONTEXT) ? "context, " : "",
 343		 (flags & R128_UPLOAD_SETUP) ? "setup, " : "",
 344		 (flags & R128_UPLOAD_TEX0) ? "tex0, " : "",
 345		 (flags & R128_UPLOAD_TEX1) ? "tex1, " : "",
 346		 (flags & R128_UPLOAD_MASKS) ? "masks, " : "",
 347		 (flags & R128_UPLOAD_WINDOW) ? "window, " : "",
 348		 (flags & R128_UPLOAD_CLIPRECTS) ? "cliprects, " : "",
 349		 (flags & R128_REQUIRE_QUIESCENCE) ? "quiescence, " : "");
 350}
 351
 352static void r128_cce_dispatch_clear(struct drm_device *dev,
 353				    drm_r128_clear_t *clear)
 354{
 355	drm_r128_private_t *dev_priv = dev->dev_private;
 356	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
 357	int nbox = sarea_priv->nbox;
 358	struct drm_clip_rect *pbox = sarea_priv->boxes;
 359	unsigned int flags = clear->flags;
 360	int i;
 361	RING_LOCALS;
 362	DRM_DEBUG("\n");
 363
 364	if (dev_priv->page_flipping && dev_priv->current_page == 1) {
 365		unsigned int tmp = flags;
 366
 367		flags &= ~(R128_FRONT | R128_BACK);
 368		if (tmp & R128_FRONT)
 369			flags |= R128_BACK;
 370		if (tmp & R128_BACK)
 371			flags |= R128_FRONT;
 372	}
 373
 374	for (i = 0; i < nbox; i++) {
 375		int x = pbox[i].x1;
 376		int y = pbox[i].y1;
 377		int w = pbox[i].x2 - x;
 378		int h = pbox[i].y2 - y;
 379
 380		DRM_DEBUG("dispatch clear %d,%d-%d,%d flags 0x%x\n",
 381			  pbox[i].x1, pbox[i].y1, pbox[i].x2,
 382			  pbox[i].y2, flags);
 383
 384		if (flags & (R128_FRONT | R128_BACK)) {
 385			BEGIN_RING(2);
 386
 387			OUT_RING(CCE_PACKET0(R128_DP_WRITE_MASK, 0));
 388			OUT_RING(clear->color_mask);
 389
 390			ADVANCE_RING();
 391		}
 392
 393		if (flags & R128_FRONT) {
 394			BEGIN_RING(6);
 395
 396			OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
 397			OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
 398				 R128_GMC_BRUSH_SOLID_COLOR |
 399				 (dev_priv->color_fmt << 8) |
 400				 R128_GMC_SRC_DATATYPE_COLOR |
 401				 R128_ROP3_P |
 402				 R128_GMC_CLR_CMP_CNTL_DIS |
 403				 R128_GMC_AUX_CLIP_DIS);
 404
 405			OUT_RING(dev_priv->front_pitch_offset_c);
 406			OUT_RING(clear->clear_color);
 407
 408			OUT_RING((x << 16) | y);
 409			OUT_RING((w << 16) | h);
 410
 411			ADVANCE_RING();
 412		}
 413
 414		if (flags & R128_BACK) {
 415			BEGIN_RING(6);
 416
 417			OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
 418			OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
 419				 R128_GMC_BRUSH_SOLID_COLOR |
 420				 (dev_priv->color_fmt << 8) |
 421				 R128_GMC_SRC_DATATYPE_COLOR |
 422				 R128_ROP3_P |
 423				 R128_GMC_CLR_CMP_CNTL_DIS |
 424				 R128_GMC_AUX_CLIP_DIS);
 425
 426			OUT_RING(dev_priv->back_pitch_offset_c);
 427			OUT_RING(clear->clear_color);
 428
 429			OUT_RING((x << 16) | y);
 430			OUT_RING((w << 16) | h);
 431
 432			ADVANCE_RING();
 433		}
 434
 435		if (flags & R128_DEPTH) {
 436			BEGIN_RING(6);
 437
 438			OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
 439			OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
 440				 R128_GMC_BRUSH_SOLID_COLOR |
 441				 (dev_priv->depth_fmt << 8) |
 442				 R128_GMC_SRC_DATATYPE_COLOR |
 443				 R128_ROP3_P |
 444				 R128_GMC_CLR_CMP_CNTL_DIS |
 445				 R128_GMC_AUX_CLIP_DIS | R128_GMC_WR_MSK_DIS);
 446
 447			OUT_RING(dev_priv->depth_pitch_offset_c);
 448			OUT_RING(clear->clear_depth);
 449
 450			OUT_RING((x << 16) | y);
 451			OUT_RING((w << 16) | h);
 452
 453			ADVANCE_RING();
 454		}
 455	}
 456}
 457
 458static void r128_cce_dispatch_swap(struct drm_device *dev)
 459{
 460	drm_r128_private_t *dev_priv = dev->dev_private;
 461	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
 462	int nbox = sarea_priv->nbox;
 463	struct drm_clip_rect *pbox = sarea_priv->boxes;
 464	int i;
 465	RING_LOCALS;
 466	DRM_DEBUG("\n");
 467
 468#if R128_PERFORMANCE_BOXES
 469	/* Do some trivial performance monitoring...
 470	 */
 471	r128_cce_performance_boxes(dev_priv);
 472#endif
 473
 474	for (i = 0; i < nbox; i++) {
 475		int x = pbox[i].x1;
 476		int y = pbox[i].y1;
 477		int w = pbox[i].x2 - x;
 478		int h = pbox[i].y2 - y;
 479
 480		BEGIN_RING(7);
 481
 482		OUT_RING(CCE_PACKET3(R128_CNTL_BITBLT_MULTI, 5));
 483		OUT_RING(R128_GMC_SRC_PITCH_OFFSET_CNTL |
 484			 R128_GMC_DST_PITCH_OFFSET_CNTL |
 485			 R128_GMC_BRUSH_NONE |
 486			 (dev_priv->color_fmt << 8) |
 487			 R128_GMC_SRC_DATATYPE_COLOR |
 488			 R128_ROP3_S |
 489			 R128_DP_SRC_SOURCE_MEMORY |
 490			 R128_GMC_CLR_CMP_CNTL_DIS |
 491			 R128_GMC_AUX_CLIP_DIS | R128_GMC_WR_MSK_DIS);
 492
 493		/* Make this work even if front & back are flipped:
 494		 */
 495		if (dev_priv->current_page == 0) {
 496			OUT_RING(dev_priv->back_pitch_offset_c);
 497			OUT_RING(dev_priv->front_pitch_offset_c);
 498		} else {
 499			OUT_RING(dev_priv->front_pitch_offset_c);
 500			OUT_RING(dev_priv->back_pitch_offset_c);
 501		}
 502
 503		OUT_RING((x << 16) | y);
 504		OUT_RING((x << 16) | y);
 505		OUT_RING((w << 16) | h);
 506
 507		ADVANCE_RING();
 508	}
 509
 510	/* Increment the frame counter.  The client-side 3D driver must
 511	 * throttle the framerate by waiting for this value before
 512	 * performing the swapbuffer ioctl.
 513	 */
 514	dev_priv->sarea_priv->last_frame++;
 515
 516	BEGIN_RING(2);
 517
 518	OUT_RING(CCE_PACKET0(R128_LAST_FRAME_REG, 0));
 519	OUT_RING(dev_priv->sarea_priv->last_frame);
 520
 521	ADVANCE_RING();
 522}
 523
 524static void r128_cce_dispatch_flip(struct drm_device *dev)
 525{
 526	drm_r128_private_t *dev_priv = dev->dev_private;
 527	RING_LOCALS;
 528	DRM_DEBUG("page=%d pfCurrentPage=%d\n",
 529		  dev_priv->current_page, dev_priv->sarea_priv->pfCurrentPage);
 530
 531#if R128_PERFORMANCE_BOXES
 532	/* Do some trivial performance monitoring...
 533	 */
 534	r128_cce_performance_boxes(dev_priv);
 535#endif
 536
 537	BEGIN_RING(4);
 538
 539	R128_WAIT_UNTIL_PAGE_FLIPPED();
 540	OUT_RING(CCE_PACKET0(R128_CRTC_OFFSET, 0));
 541
 542	if (dev_priv->current_page == 0)
 543		OUT_RING(dev_priv->back_offset);
 544	else
 545		OUT_RING(dev_priv->front_offset);
 546
 547	ADVANCE_RING();
 548
 549	/* Increment the frame counter.  The client-side 3D driver must
 550	 * throttle the framerate by waiting for this value before
 551	 * performing the swapbuffer ioctl.
 552	 */
 553	dev_priv->sarea_priv->last_frame++;
 554	dev_priv->sarea_priv->pfCurrentPage = dev_priv->current_page =
 555	    1 - dev_priv->current_page;
 556
 557	BEGIN_RING(2);
 558
 559	OUT_RING(CCE_PACKET0(R128_LAST_FRAME_REG, 0));
 560	OUT_RING(dev_priv->sarea_priv->last_frame);
 561
 562	ADVANCE_RING();
 563}
 564
 565static void r128_cce_dispatch_vertex(struct drm_device *dev, struct drm_buf *buf)
 566{
 567	drm_r128_private_t *dev_priv = dev->dev_private;
 568	drm_r128_buf_priv_t *buf_priv = buf->dev_private;
 569	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
 570	int format = sarea_priv->vc_format;
 571	int offset = buf->bus_address;
 572	int size = buf->used;
 573	int prim = buf_priv->prim;
 574	int i = 0;
 575	RING_LOCALS;
 576	DRM_DEBUG("buf=%d nbox=%d\n", buf->idx, sarea_priv->nbox);
 577
 578	if (0)
 579		r128_print_dirty("dispatch_vertex", sarea_priv->dirty);
 580
 581	if (buf->used) {
 582		buf_priv->dispatched = 1;
 583
 584		if (sarea_priv->dirty & ~R128_UPLOAD_CLIPRECTS)
 585			r128_emit_state(dev_priv);
 586
 587		do {
 588			/* Emit the next set of up to three cliprects */
 589			if (i < sarea_priv->nbox) {
 590				r128_emit_clip_rects(dev_priv,
 591						     &sarea_priv->boxes[i],
 592						     sarea_priv->nbox - i);
 593			}
 594
 595			/* Emit the vertex buffer rendering commands */
 596			BEGIN_RING(5);
 597
 598			OUT_RING(CCE_PACKET3(R128_3D_RNDR_GEN_INDX_PRIM, 3));
 599			OUT_RING(offset);
 600			OUT_RING(size);
 601			OUT_RING(format);
 602			OUT_RING(prim | R128_CCE_VC_CNTL_PRIM_WALK_LIST |
 603				 (size << R128_CCE_VC_CNTL_NUM_SHIFT));
 604
 605			ADVANCE_RING();
 606
 607			i += 3;
 608		} while (i < sarea_priv->nbox);
 609	}
 610
 611	if (buf_priv->discard) {
 612		buf_priv->age = dev_priv->sarea_priv->last_dispatch;
 613
 614		/* Emit the vertex buffer age */
 615		BEGIN_RING(2);
 616
 617		OUT_RING(CCE_PACKET0(R128_LAST_DISPATCH_REG, 0));
 618		OUT_RING(buf_priv->age);
 619
 620		ADVANCE_RING();
 621
 622		buf->pending = 1;
 623		buf->used = 0;
 624		/* FIXME: Check dispatched field */
 625		buf_priv->dispatched = 0;
 626	}
 627
 628	dev_priv->sarea_priv->last_dispatch++;
 629
 630	sarea_priv->dirty &= ~R128_UPLOAD_CLIPRECTS;
 631	sarea_priv->nbox = 0;
 632}
 633
 634static void r128_cce_dispatch_indirect(struct drm_device *dev,
 635				       struct drm_buf *buf, int start, int end)
 636{
 637	drm_r128_private_t *dev_priv = dev->dev_private;
 638	drm_r128_buf_priv_t *buf_priv = buf->dev_private;
 639	RING_LOCALS;
 640	DRM_DEBUG("indirect: buf=%d s=0x%x e=0x%x\n", buf->idx, start, end);
 641
 642	if (start != end) {
 643		int offset = buf->bus_address + start;
 644		int dwords = (end - start + 3) / sizeof(u32);
 645
 646		/* Indirect buffer data must be an even number of
 647		 * dwords, so if we've been given an odd number we must
 648		 * pad the data with a Type-2 CCE packet.
 649		 */
 650		if (dwords & 1) {
 651			u32 *data = (u32 *)
 652			    ((char *)dev->agp_buffer_map->handle
 653			     + buf->offset + start);
 654			data[dwords++] = cpu_to_le32(R128_CCE_PACKET2);
 655		}
 656
 657		buf_priv->dispatched = 1;
 658
 659		/* Fire off the indirect buffer */
 660		BEGIN_RING(3);
 661
 662		OUT_RING(CCE_PACKET0(R128_PM4_IW_INDOFF, 1));
 663		OUT_RING(offset);
 664		OUT_RING(dwords);
 665
 666		ADVANCE_RING();
 667	}
 668
 669	if (buf_priv->discard) {
 670		buf_priv->age = dev_priv->sarea_priv->last_dispatch;
 671
 672		/* Emit the indirect buffer age */
 673		BEGIN_RING(2);
 674
 675		OUT_RING(CCE_PACKET0(R128_LAST_DISPATCH_REG, 0));
 676		OUT_RING(buf_priv->age);
 677
 678		ADVANCE_RING();
 679
 680		buf->pending = 1;
 681		buf->used = 0;
 682		/* FIXME: Check dispatched field */
 683		buf_priv->dispatched = 0;
 684	}
 685
 686	dev_priv->sarea_priv->last_dispatch++;
 687}
 688
 689static void r128_cce_dispatch_indices(struct drm_device *dev,
 690				      struct drm_buf *buf,
 691				      int start, int end, int count)
 692{
 693	drm_r128_private_t *dev_priv = dev->dev_private;
 694	drm_r128_buf_priv_t *buf_priv = buf->dev_private;
 695	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
 696	int format = sarea_priv->vc_format;
 697	int offset = dev->agp_buffer_map->offset - dev_priv->cce_buffers_offset;
 698	int prim = buf_priv->prim;
 699	u32 *data;
 700	int dwords;
 701	int i = 0;
 702	RING_LOCALS;
 703	DRM_DEBUG("indices: s=%d e=%d c=%d\n", start, end, count);
 704
 705	if (0)
 706		r128_print_dirty("dispatch_indices", sarea_priv->dirty);
 707
 708	if (start != end) {
 709		buf_priv->dispatched = 1;
 710
 711		if (sarea_priv->dirty & ~R128_UPLOAD_CLIPRECTS)
 712			r128_emit_state(dev_priv);
 713
 714		dwords = (end - start + 3) / sizeof(u32);
 715
 716		data = (u32 *) ((char *)dev->agp_buffer_map->handle
 717				+ buf->offset + start);
 718
 719		data[0] = cpu_to_le32(CCE_PACKET3(R128_3D_RNDR_GEN_INDX_PRIM,
 720						  dwords - 2));
 721
 722		data[1] = cpu_to_le32(offset);
 723		data[2] = cpu_to_le32(R128_MAX_VB_VERTS);
 724		data[3] = cpu_to_le32(format);
 725		data[4] = cpu_to_le32((prim | R128_CCE_VC_CNTL_PRIM_WALK_IND |
 726				       (count << 16)));
 727
 728		if (count & 0x1) {
 729#ifdef __LITTLE_ENDIAN
 730			data[dwords - 1] &= 0x0000ffff;
 731#else
 732			data[dwords - 1] &= 0xffff0000;
 733#endif
 734		}
 735
 736		do {
 737			/* Emit the next set of up to three cliprects */
 738			if (i < sarea_priv->nbox) {
 739				r128_emit_clip_rects(dev_priv,
 740						     &sarea_priv->boxes[i],
 741						     sarea_priv->nbox - i);
 742			}
 743
 744			r128_cce_dispatch_indirect(dev, buf, start, end);
 745
 746			i += 3;
 747		} while (i < sarea_priv->nbox);
 748	}
 749
 750	if (buf_priv->discard) {
 751		buf_priv->age = dev_priv->sarea_priv->last_dispatch;
 752
 753		/* Emit the vertex buffer age */
 754		BEGIN_RING(2);
 755
 756		OUT_RING(CCE_PACKET0(R128_LAST_DISPATCH_REG, 0));
 757		OUT_RING(buf_priv->age);
 758
 759		ADVANCE_RING();
 760
 761		buf->pending = 1;
 762		/* FIXME: Check dispatched field */
 763		buf_priv->dispatched = 0;
 764	}
 765
 766	dev_priv->sarea_priv->last_dispatch++;
 767
 768	sarea_priv->dirty &= ~R128_UPLOAD_CLIPRECTS;
 769	sarea_priv->nbox = 0;
 770}
 771
 772static int r128_cce_dispatch_blit(struct drm_device *dev,
 773				  struct drm_file *file_priv,
 774				  drm_r128_blit_t *blit)
 775{
 776	drm_r128_private_t *dev_priv = dev->dev_private;
 777	struct drm_device_dma *dma = dev->dma;
 778	struct drm_buf *buf;
 779	drm_r128_buf_priv_t *buf_priv;
 780	u32 *data;
 781	int dword_shift, dwords;
 782	RING_LOCALS;
 783	DRM_DEBUG("\n");
 784
 785	/* The compiler won't optimize away a division by a variable,
 786	 * even if the only legal values are powers of two.  Thus, we'll
 787	 * use a shift instead.
 788	 */
 789	switch (blit->format) {
 790	case R128_DATATYPE_ARGB8888:
 791		dword_shift = 0;
 792		break;
 793	case R128_DATATYPE_ARGB1555:
 794	case R128_DATATYPE_RGB565:
 795	case R128_DATATYPE_ARGB4444:
 796	case R128_DATATYPE_YVYU422:
 797	case R128_DATATYPE_VYUY422:
 798		dword_shift = 1;
 799		break;
 800	case R128_DATATYPE_CI8:
 801	case R128_DATATYPE_RGB8:
 802		dword_shift = 2;
 803		break;
 804	default:
 805		DRM_ERROR("invalid blit format %d\n", blit->format);
 806		return -EINVAL;
 807	}
 808
 809	/* Flush the pixel cache, and mark the contents as Read Invalid.
 810	 * This ensures no pixel data gets mixed up with the texture
 811	 * data from the host data blit, otherwise part of the texture
 812	 * image may be corrupted.
 813	 */
 814	BEGIN_RING(2);
 815
 816	OUT_RING(CCE_PACKET0(R128_PC_GUI_CTLSTAT, 0));
 817	OUT_RING(R128_PC_RI_GUI | R128_PC_FLUSH_GUI);
 818
 819	ADVANCE_RING();
 820
 821	/* Dispatch the indirect buffer.
 822	 */
 823	buf = dma->buflist[blit->idx];
 824	buf_priv = buf->dev_private;
 825
 826	if (buf->file_priv != file_priv) {
 827		DRM_ERROR("process %d using buffer owned by %p\n",
 828			  DRM_CURRENTPID, buf->file_priv);
 829		return -EINVAL;
 830	}
 831	if (buf->pending) {
 832		DRM_ERROR("sending pending buffer %d\n", blit->idx);
 833		return -EINVAL;
 834	}
 835
 836	buf_priv->discard = 1;
 837
 838	dwords = (blit->width * blit->height) >> dword_shift;
 839
 840	data = (u32 *) ((char *)dev->agp_buffer_map->handle + buf->offset);
 841
 842	data[0] = cpu_to_le32(CCE_PACKET3(R128_CNTL_HOSTDATA_BLT, dwords + 6));
 843	data[1] = cpu_to_le32((R128_GMC_DST_PITCH_OFFSET_CNTL |
 844			       R128_GMC_BRUSH_NONE |
 845			       (blit->format << 8) |
 846			       R128_GMC_SRC_DATATYPE_COLOR |
 847			       R128_ROP3_S |
 848			       R128_DP_SRC_SOURCE_HOST_DATA |
 849			       R128_GMC_CLR_CMP_CNTL_DIS |
 850			       R128_GMC_AUX_CLIP_DIS | R128_GMC_WR_MSK_DIS));
 851
 852	data[2] = cpu_to_le32((blit->pitch << 21) | (blit->offset >> 5));
 853	data[3] = cpu_to_le32(0xffffffff);
 854	data[4] = cpu_to_le32(0xffffffff);
 855	data[5] = cpu_to_le32((blit->y << 16) | blit->x);
 856	data[6] = cpu_to_le32((blit->height << 16) | blit->width);
 857	data[7] = cpu_to_le32(dwords);
 858
 859	buf->used = (dwords + 8) * sizeof(u32);
 860
 861	r128_cce_dispatch_indirect(dev, buf, 0, buf->used);
 862
 863	/* Flush the pixel cache after the blit completes.  This ensures
 864	 * the texture data is written out to memory before rendering
 865	 * continues.
 866	 */
 867	BEGIN_RING(2);
 868
 869	OUT_RING(CCE_PACKET0(R128_PC_GUI_CTLSTAT, 0));
 870	OUT_RING(R128_PC_FLUSH_GUI);
 871
 872	ADVANCE_RING();
 873
 874	return 0;
 875}
 876
 877/* ================================================================
 878 * Tiled depth buffer management
 879 *
 880 * FIXME: These should all set the destination write mask for when we
 881 * have hardware stencil support.
 882 */
 883
 884static int r128_cce_dispatch_write_span(struct drm_device *dev,
 885					drm_r128_depth_t *depth)
 886{
 887	drm_r128_private_t *dev_priv = dev->dev_private;
 888	int count, x, y;
 889	u32 *buffer;
 890	u8 *mask;
 891	int i, buffer_size, mask_size;
 892	RING_LOCALS;
 893	DRM_DEBUG("\n");
 894
 895	count = depth->n;
 896	if (count > 4096 || count <= 0)
 897		return -EMSGSIZE;
 898
 899	if (DRM_COPY_FROM_USER(&x, depth->x, sizeof(x)))
 900		return -EFAULT;
 901	if (DRM_COPY_FROM_USER(&y, depth->y, sizeof(y)))
 902		return -EFAULT;
 903
 904	buffer_size = depth->n * sizeof(u32);
 905	buffer = kmalloc(buffer_size, GFP_KERNEL);
 906	if (buffer == NULL)
 907		return -ENOMEM;
 908	if (DRM_COPY_FROM_USER(buffer, depth->buffer, buffer_size)) {
 909		kfree(buffer);
 910		return -EFAULT;
 911	}
 912
 913	mask_size = depth->n * sizeof(u8);
 914	if (depth->mask) {
 915		mask = kmalloc(mask_size, GFP_KERNEL);
 916		if (mask == NULL) {
 917			kfree(buffer);
 918			return -ENOMEM;
 919		}
 920		if (DRM_COPY_FROM_USER(mask, depth->mask, mask_size)) {
 921			kfree(buffer);
 922			kfree(mask);
 923			return -EFAULT;
 924		}
 925
 926		for (i = 0; i < count; i++, x++) {
 927			if (mask[i]) {
 928				BEGIN_RING(6);
 929
 930				OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
 931				OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
 932					 R128_GMC_BRUSH_SOLID_COLOR |
 933					 (dev_priv->depth_fmt << 8) |
 934					 R128_GMC_SRC_DATATYPE_COLOR |
 935					 R128_ROP3_P |
 936					 R128_GMC_CLR_CMP_CNTL_DIS |
 937					 R128_GMC_WR_MSK_DIS);
 938
 939				OUT_RING(dev_priv->depth_pitch_offset_c);
 940				OUT_RING(buffer[i]);
 941
 942				OUT_RING((x << 16) | y);
 943				OUT_RING((1 << 16) | 1);
 944
 945				ADVANCE_RING();
 946			}
 947		}
 948
 949		kfree(mask);
 950	} else {
 951		for (i = 0; i < count; i++, x++) {
 952			BEGIN_RING(6);
 953
 954			OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
 955			OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
 956				 R128_GMC_BRUSH_SOLID_COLOR |
 957				 (dev_priv->depth_fmt << 8) |
 958				 R128_GMC_SRC_DATATYPE_COLOR |
 959				 R128_ROP3_P |
 960				 R128_GMC_CLR_CMP_CNTL_DIS |
 961				 R128_GMC_WR_MSK_DIS);
 962
 963			OUT_RING(dev_priv->depth_pitch_offset_c);
 964			OUT_RING(buffer[i]);
 965
 966			OUT_RING((x << 16) | y);
 967			OUT_RING((1 << 16) | 1);
 968
 969			ADVANCE_RING();
 970		}
 971	}
 972
 973	kfree(buffer);
 974
 975	return 0;
 976}
 977
 978static int r128_cce_dispatch_write_pixels(struct drm_device *dev,
 979					  drm_r128_depth_t *depth)
 980{
 981	drm_r128_private_t *dev_priv = dev->dev_private;
 982	int count, *x, *y;
 983	u32 *buffer;
 984	u8 *mask;
 985	int i, xbuf_size, ybuf_size, buffer_size, mask_size;
 986	RING_LOCALS;
 987	DRM_DEBUG("\n");
 988
 989	count = depth->n;
 990	if (count > 4096 || count <= 0)
 991		return -EMSGSIZE;
 992
 993	xbuf_size = count * sizeof(*x);
 994	ybuf_size = count * sizeof(*y);
 995	x = kmalloc(xbuf_size, GFP_KERNEL);
 996	if (x == NULL)
 997		return -ENOMEM;
 998	y = kmalloc(ybuf_size, GFP_KERNEL);
 999	if (y == NULL) {
1000		kfree(x);
1001		return -ENOMEM;
1002	}
1003	if (DRM_COPY_FROM_USER(x, depth->x, xbuf_size)) {
1004		kfree(x);
1005		kfree(y);
1006		return -EFAULT;
1007	}
1008	if (DRM_COPY_FROM_USER(y, depth->y, xbuf_size)) {
1009		kfree(x);
1010		kfree(y);
1011		return -EFAULT;
1012	}
1013
1014	buffer_size = depth->n * sizeof(u32);
1015	buffer = kmalloc(buffer_size, GFP_KERNEL);
1016	if (buffer == NULL) {
1017		kfree(x);
1018		kfree(y);
1019		return -ENOMEM;
1020	}
1021	if (DRM_COPY_FROM_USER(buffer, depth->buffer, buffer_size)) {
1022		kfree(x);
1023		kfree(y);
1024		kfree(buffer);
1025		return -EFAULT;
1026	}
1027
1028	if (depth->mask) {
1029		mask_size = depth->n * sizeof(u8);
1030		mask = kmalloc(mask_size, GFP_KERNEL);
1031		if (mask == NULL) {
1032			kfree(x);
1033			kfree(y);
1034			kfree(buffer);
1035			return -ENOMEM;
1036		}
1037		if (DRM_COPY_FROM_USER(mask, depth->mask, mask_size)) {
1038			kfree(x);
1039			kfree(y);
1040			kfree(buffer);
1041			kfree(mask);
1042			return -EFAULT;
1043		}
1044
1045		for (i = 0; i < count; i++) {
1046			if (mask[i]) {
1047				BEGIN_RING(6);
1048
1049				OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
1050				OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
1051					 R128_GMC_BRUSH_SOLID_COLOR |
1052					 (dev_priv->depth_fmt << 8) |
1053					 R128_GMC_SRC_DATATYPE_COLOR |
1054					 R128_ROP3_P |
1055					 R128_GMC_CLR_CMP_CNTL_DIS |
1056					 R128_GMC_WR_MSK_DIS);
1057
1058				OUT_RING(dev_priv->depth_pitch_offset_c);
1059				OUT_RING(buffer[i]);
1060
1061				OUT_RING((x[i] << 16) | y[i]);
1062				OUT_RING((1 << 16) | 1);
1063
1064				ADVANCE_RING();
1065			}
1066		}
1067
1068		kfree(mask);
1069	} else {
1070		for (i = 0; i < count; i++) {
1071			BEGIN_RING(6);
1072
1073			OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
1074			OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
1075				 R128_GMC_BRUSH_SOLID_COLOR |
1076				 (dev_priv->depth_fmt << 8) |
1077				 R128_GMC_SRC_DATATYPE_COLOR |
1078				 R128_ROP3_P |
1079				 R128_GMC_CLR_CMP_CNTL_DIS |
1080				 R128_GMC_WR_MSK_DIS);
1081
1082			OUT_RING(dev_priv->depth_pitch_offset_c);
1083			OUT_RING(buffer[i]);
1084
1085			OUT_RING((x[i] << 16) | y[i]);
1086			OUT_RING((1 << 16) | 1);
1087
1088			ADVANCE_RING();
1089		}
1090	}
1091
1092	kfree(x);
1093	kfree(y);
1094	kfree(buffer);
1095
1096	return 0;
1097}
1098
1099static int r128_cce_dispatch_read_span(struct drm_device *dev,
1100				       drm_r128_depth_t *depth)
1101{
1102	drm_r128_private_t *dev_priv = dev->dev_private;
1103	int count, x, y;
1104	RING_LOCALS;
1105	DRM_DEBUG("\n");
1106
1107	count = depth->n;
1108	if (count > 4096 || count <= 0)
1109		return -EMSGSIZE;
1110
1111	if (DRM_COPY_FROM_USER(&x, depth->x, sizeof(x)))
1112		return -EFAULT;
1113	if (DRM_COPY_FROM_USER(&y, depth->y, sizeof(y)))
1114		return -EFAULT;
1115
1116	BEGIN_RING(7);
1117
1118	OUT_RING(CCE_PACKET3(R128_CNTL_BITBLT_MULTI, 5));
1119	OUT_RING(R128_GMC_SRC_PITCH_OFFSET_CNTL |
1120		 R128_GMC_DST_PITCH_OFFSET_CNTL |
1121		 R128_GMC_BRUSH_NONE |
1122		 (dev_priv->depth_fmt << 8) |
1123		 R128_GMC_SRC_DATATYPE_COLOR |
1124		 R128_ROP3_S |
1125		 R128_DP_SRC_SOURCE_MEMORY |
1126		 R128_GMC_CLR_CMP_CNTL_DIS | R128_GMC_WR_MSK_DIS);
1127
1128	OUT_RING(dev_priv->depth_pitch_offset_c);
1129	OUT_RING(dev_priv->span_pitch_offset_c);
1130
1131	OUT_RING((x << 16) | y);
1132	OUT_RING((0 << 16) | 0);
1133	OUT_RING((count << 16) | 1);
1134
1135	ADVANCE_RING();
1136
1137	return 0;
1138}
1139
1140static int r128_cce_dispatch_read_pixels(struct drm_device *dev,
1141					 drm_r128_depth_t *depth)
1142{
1143	drm_r128_private_t *dev_priv = dev->dev_private;
1144	int count, *x, *y;
1145	int i, xbuf_size, ybuf_size;
1146	RING_LOCALS;
1147	DRM_DEBUG("\n");
1148
1149	count = depth->n;
1150	if (count > 4096 || count <= 0)
1151		return -EMSGSIZE;
1152
1153	if (count > dev_priv->depth_pitch)
1154		count = dev_priv->depth_pitch;
1155
1156	xbuf_size = count * sizeof(*x);
1157	ybuf_size = count * sizeof(*y);
1158	x = kmalloc(xbuf_size, GFP_KERNEL);
1159	if (x == NULL)
1160		return -ENOMEM;
1161	y = kmalloc(ybuf_size, GFP_KERNEL);
1162	if (y == NULL) {
1163		kfree(x);
1164		return -ENOMEM;
1165	}
1166	if (DRM_COPY_FROM_USER(x, depth->x, xbuf_size)) {
1167		kfree(x);
1168		kfree(y);
1169		return -EFAULT;
1170	}
1171	if (DRM_COPY_FROM_USER(y, depth->y, ybuf_size)) {
1172		kfree(x);
1173		kfree(y);
1174		return -EFAULT;
1175	}
1176
1177	for (i = 0; i < count; i++) {
1178		BEGIN_RING(7);
1179
1180		OUT_RING(CCE_PACKET3(R128_CNTL_BITBLT_MULTI, 5));
1181		OUT_RING(R128_GMC_SRC_PITCH_OFFSET_CNTL |
1182			 R128_GMC_DST_PITCH_OFFSET_CNTL |
1183			 R128_GMC_BRUSH_NONE |
1184			 (dev_priv->depth_fmt << 8) |
1185			 R128_GMC_SRC_DATATYPE_COLOR |
1186			 R128_ROP3_S |
1187			 R128_DP_SRC_SOURCE_MEMORY |
1188			 R128_GMC_CLR_CMP_CNTL_DIS | R128_GMC_WR_MSK_DIS);
1189
1190		OUT_RING(dev_priv->depth_pitch_offset_c);
1191		OUT_RING(dev_priv->span_pitch_offset_c);
1192
1193		OUT_RING((x[i] << 16) | y[i]);
1194		OUT_RING((i << 16) | 0);
1195		OUT_RING((1 << 16) | 1);
1196
1197		ADVANCE_RING();
1198	}
1199
1200	kfree(x);
1201	kfree(y);
1202
1203	return 0;
1204}
1205
1206/* ================================================================
1207 * Polygon stipple
1208 */
1209
1210static void r128_cce_dispatch_stipple(struct drm_device *dev, u32 *stipple)
1211{
1212	drm_r128_private_t *dev_priv = dev->dev_private;
1213	int i;
1214	RING_LOCALS;
1215	DRM_DEBUG("\n");
1216
1217	BEGIN_RING(33);
1218
1219	OUT_RING(CCE_PACKET0(R128_BRUSH_DATA0, 31));
1220	for (i = 0; i < 32; i++)
1221		OUT_RING(stipple[i]);
1222
1223	ADVANCE_RING();
1224}
1225
1226/* ================================================================
1227 * IOCTL functions
1228 */
1229
1230static int r128_cce_clear(struct drm_device *dev, void *data, struct drm_file *file_priv)
1231{
1232	drm_r128_private_t *dev_priv = dev->dev_private;
1233	drm_r128_sarea_t *sarea_priv;
1234	drm_r128_clear_t *clear = data;
1235	DRM_DEBUG("\n");
1236
1237	LOCK_TEST_WITH_RETURN(dev, file_priv);
1238
1239	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1240
1241	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1242
1243	sarea_priv = dev_priv->sarea_priv;
1244
1245	if (sarea_priv->nbox > R128_NR_SAREA_CLIPRECTS)
1246		sarea_priv->nbox = R128_NR_SAREA_CLIPRECTS;
1247
1248	r128_cce_dispatch_clear(dev, clear);
1249	COMMIT_RING();
1250
1251	/* Make sure we restore the 3D state next time.
1252	 */
1253	dev_priv->sarea_priv->dirty |= R128_UPLOAD_CONTEXT | R128_UPLOAD_MASKS;
1254
1255	return 0;
1256}
1257
1258static int r128_do_init_pageflip(struct drm_device *dev)
1259{
1260	drm_r128_private_t *dev_priv = dev->dev_private;
1261	DRM_DEBUG("\n");
1262
1263	dev_priv->crtc_offset = R128_READ(R128_CRTC_OFFSET);
1264	dev_priv->crtc_offset_cntl = R128_READ(R128_CRTC_OFFSET_CNTL);
1265
1266	R128_WRITE(R128_CRTC_OFFSET, dev_priv->front_offset);
1267	R128_WRITE(R128_CRTC_OFFSET_CNTL,
1268		   dev_priv->crtc_offset_cntl | R128_CRTC_OFFSET_FLIP_CNTL);
1269
1270	dev_priv->page_flipping = 1;
1271	dev_priv->current_page = 0;
1272	dev_priv->sarea_priv->pfCurrentPage = dev_priv->current_page;
1273
1274	return 0;
1275}
1276
1277static int r128_do_cleanup_pageflip(struct drm_device *dev)
1278{
1279	drm_r128_private_t *dev_priv = dev->dev_private;
1280	DRM_DEBUG("\n");
1281
1282	R128_WRITE(R128_CRTC_OFFSET, dev_priv->crtc_offset);
1283	R128_WRITE(R128_CRTC_OFFSET_CNTL, dev_priv->crtc_offset_cntl);
1284
1285	if (dev_priv->current_page != 0) {
1286		r128_cce_dispatch_flip(dev);
1287		COMMIT_RING();
1288	}
1289
1290	dev_priv->page_flipping = 0;
1291	return 0;
1292}
1293
1294/* Swapping and flipping are different operations, need different ioctls.
1295 * They can & should be intermixed to support multiple 3d windows.
1296 */
1297
1298static int r128_cce_flip(struct drm_device *dev, void *data, struct drm_file *file_priv)
1299{
1300	drm_r128_private_t *dev_priv = dev->dev_private;
1301	DRM_DEBUG("\n");
1302
1303	LOCK_TEST_WITH_RETURN(dev, file_priv);
1304
1305	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1306
1307	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1308
1309	if (!dev_priv->page_flipping)
1310		r128_do_init_pageflip(dev);
1311
1312	r128_cce_dispatch_flip(dev);
1313
1314	COMMIT_RING();
1315	return 0;
1316}
1317
1318static int r128_cce_swap(struct drm_device *dev, void *data, struct drm_file *file_priv)
1319{
1320	drm_r128_private_t *dev_priv = dev->dev_private;
1321	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
1322	DRM_DEBUG("\n");
1323
1324	LOCK_TEST_WITH_RETURN(dev, file_priv);
1325
1326	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1327
1328	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1329
1330	if (sarea_priv->nbox > R128_NR_SAREA_CLIPRECTS)
1331		sarea_priv->nbox = R128_NR_SAREA_CLIPRECTS;
1332
1333	r128_cce_dispatch_swap(dev);
1334	dev_priv->sarea_priv->dirty |= (R128_UPLOAD_CONTEXT |
1335					R128_UPLOAD_MASKS);
1336
1337	COMMIT_RING();
1338	return 0;
1339}
1340
1341static int r128_cce_vertex(struct drm_device *dev, void *data, struct drm_file *file_priv)
1342{
1343	drm_r128_private_t *dev_priv = dev->dev_private;
1344	struct drm_device_dma *dma = dev->dma;
1345	struct drm_buf *buf;
1346	drm_r128_buf_priv_t *buf_priv;
1347	drm_r128_vertex_t *vertex = data;
1348
1349	LOCK_TEST_WITH_RETURN(dev, file_priv);
1350
1351	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1352
1353	DRM_DEBUG("pid=%d index=%d count=%d discard=%d\n",
1354		  DRM_CURRENTPID, vertex->idx, vertex->count, vertex->discard);
1355
1356	if (vertex->idx < 0 || vertex->idx >= dma->buf_count) {
1357		DRM_ERROR("buffer index %d (of %d max)\n",
1358			  vertex->idx, dma->buf_count - 1);
1359		return -EINVAL;
1360	}
1361	if (vertex->prim < 0 ||
1362	    vertex->prim > R128_CCE_VC_CNTL_PRIM_TYPE_TRI_TYPE2) {
1363		DRM_ERROR("buffer prim %d\n", vertex->prim);
1364		return -EINVAL;
1365	}
1366
1367	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1368	VB_AGE_TEST_WITH_RETURN(dev_priv);
1369
1370	buf = dma->buflist[vertex->idx];
1371	buf_priv = buf->dev_private;
1372
1373	if (buf->file_priv != file_priv) {
1374		DRM_ERROR("process %d using buffer owned by %p\n",
1375			  DRM_CURRENTPID, buf->file_priv);
1376		return -EINVAL;
1377	}
1378	if (buf->pending) {
1379		DRM_ERROR("sending pending buffer %d\n", vertex->idx);
1380		return -EINVAL;
1381	}
1382
1383	buf->used = vertex->count;
1384	buf_priv->prim = vertex->prim;
1385	buf_priv->discard = vertex->discard;
1386
1387	r128_cce_dispatch_vertex(dev, buf);
1388
1389	COMMIT_RING();
1390	return 0;
1391}
1392
1393static int r128_cce_indices(struct drm_device *dev, void *data, struct drm_file *file_priv)
1394{
1395	drm_r128_private_t *dev_priv = dev->dev_private;
1396	struct drm_device_dma *dma = dev->dma;
1397	struct drm_buf *buf;
1398	drm_r128_buf_priv_t *buf_priv;
1399	drm_r128_indices_t *elts = data;
1400	int count;
1401
1402	LOCK_TEST_WITH_RETURN(dev, file_priv);
1403
1404	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1405
1406	DRM_DEBUG("pid=%d buf=%d s=%d e=%d d=%d\n", DRM_CURRENTPID,
1407		  elts->idx, elts->start, elts->end, elts->discard);
1408
1409	if (elts->idx < 0 || elts->idx >= dma->buf_count) {
1410		DRM_ERROR("buffer index %d (of %d max)\n",
1411			  elts->idx, dma->buf_count - 1);
1412		return -EINVAL;
1413	}
1414	if (elts->prim < 0 ||
1415	    elts->prim > R128_CCE_VC_CNTL_PRIM_TYPE_TRI_TYPE2) {
1416		DRM_ERROR("buffer prim %d\n", elts->prim);
1417		return -EINVAL;
1418	}
1419
1420	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1421	VB_AGE_TEST_WITH_RETURN(dev_priv);
1422
1423	buf = dma->buflist[elts->idx];
1424	buf_priv = buf->dev_private;
1425
1426	if (buf->file_priv != file_priv) {
1427		DRM_ERROR("process %d using buffer owned by %p\n",
1428			  DRM_CURRENTPID, buf->file_priv);
1429		return -EINVAL;
1430	}
1431	if (buf->pending) {
1432		DRM_ERROR("sending pending buffer %d\n", elts->idx);
1433		return -EINVAL;
1434	}
1435
1436	count = (elts->end - elts->start) / sizeof(u16);
1437	elts->start -= R128_INDEX_PRIM_OFFSET;
1438
1439	if (elts->start & 0x7) {
1440		DRM_ERROR("misaligned buffer 0x%x\n", elts->start);
1441		return -EINVAL;
1442	}
1443	if (elts->start < buf->used) {
1444		DRM_ERROR("no header 0x%x - 0x%x\n", elts->start, buf->used);
1445		return -EINVAL;
1446	}
1447
1448	buf->used = elts->end;
1449	buf_priv->prim = elts->prim;
1450	buf_priv->discard = elts->discard;
1451
1452	r128_cce_dispatch_indices(dev, buf, elts->start, elts->end, count);
1453
1454	COMMIT_RING();
1455	return 0;
1456}
1457
1458static int r128_cce_blit(struct drm_device *dev, void *data, struct drm_file *file_priv)
1459{
1460	struct drm_device_dma *dma = dev->dma;
1461	drm_r128_private_t *dev_priv = dev->dev_private;
1462	drm_r128_blit_t *blit = data;
1463	int ret;
1464
1465	LOCK_TEST_WITH_RETURN(dev, file_priv);
1466
1467	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1468
1469	DRM_DEBUG("pid=%d index=%d\n", DRM_CURRENTPID, blit->idx);
1470
1471	if (blit->idx < 0 || blit->idx >= dma->buf_count) {
1472		DRM_ERROR("buffer index %d (of %d max)\n",
1473			  blit->idx, dma->buf_count - 1);
1474		return -EINVAL;
1475	}
1476
1477	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1478	VB_AGE_TEST_WITH_RETURN(dev_priv);
1479
1480	ret = r128_cce_dispatch_blit(dev, file_priv, blit);
1481
1482	COMMIT_RING();
1483	return ret;
1484}
1485
1486static int r128_cce_depth(struct drm_device *dev, void *data, struct drm_file *file_priv)
1487{
1488	drm_r128_private_t *dev_priv = dev->dev_private;
1489	drm_r128_depth_t *depth = data;
1490	int ret;
1491
1492	LOCK_TEST_WITH_RETURN(dev, file_priv);
1493
1494	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1495
1496	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1497
1498	ret = -EINVAL;
1499	switch (depth->func) {
1500	case R128_WRITE_SPAN:
1501		ret = r128_cce_dispatch_write_span(dev, depth);
1502		break;
1503	case R128_WRITE_PIXELS:
1504		ret = r128_cce_dispatch_write_pixels(dev, depth);
1505		break;
1506	case R128_READ_SPAN:
1507		ret = r128_cce_dispatch_read_span(dev, depth);
1508		break;
1509	case R128_READ_PIXELS:
1510		ret = r128_cce_dispatch_read_pixels(dev, depth);
1511		break;
1512	}
1513
1514	COMMIT_RING();
1515	return ret;
1516}
1517
1518static int r128_cce_stipple(struct drm_device *dev, void *data, struct drm_file *file_priv)
1519{
1520	drm_r128_private_t *dev_priv = dev->dev_private;
1521	drm_r128_stipple_t *stipple = data;
1522	u32 mask[32];
1523
1524	LOCK_TEST_WITH_RETURN(dev, file_priv);
1525
1526	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1527
1528	if (DRM_COPY_FROM_USER(&mask, stipple->mask, 32 * sizeof(u32)))
1529		return -EFAULT;
1530
1531	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1532
1533	r128_cce_dispatch_stipple(dev, mask);
1534
1535	COMMIT_RING();
1536	return 0;
1537}
1538
1539static int r128_cce_indirect(struct drm_device *dev, void *data, struct drm_file *file_priv)
1540{
1541	drm_r128_private_t *dev_priv = dev->dev_private;
1542	struct drm_device_dma *dma = dev->dma;
1543	struct drm_buf *buf;
1544	drm_r128_buf_priv_t *buf_priv;
1545	drm_r128_indirect_t *indirect = data;
1546#if 0
1547	RING_LOCALS;
1548#endif
1549
1550	LOCK_TEST_WITH_RETURN(dev, file_priv);
1551
1552	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1553
1554	DRM_DEBUG("idx=%d s=%d e=%d d=%d\n",
1555		  indirect->idx, indirect->start, indirect->end,
1556		  indirect->discard);
1557
1558	if (indirect->idx < 0 || indirect->idx >= dma->buf_count) {
1559		DRM_ERROR("buffer index %d (of %d max)\n",
1560			  indirect->idx, dma->buf_count - 1);
1561		return -EINVAL;
1562	}
1563
1564	buf = dma->buflist[indirect->idx];
1565	buf_priv = buf->dev_private;
1566
1567	if (buf->file_priv != file_priv) {
1568		DRM_ERROR("process %d using buffer owned by %p\n",
1569			  DRM_CURRENTPID, buf->file_priv);
1570		return -EINVAL;
1571	}
1572	if (buf->pending) {
1573		DRM_ERROR("sending pending buffer %d\n", indirect->idx);
1574		return -EINVAL;
1575	}
1576
1577	if (indirect->start < buf->used) {
1578		DRM_ERROR("reusing indirect: start=0x%x actual=0x%x\n",
1579			  indirect->start, buf->used);
1580		return -EINVAL;
1581	}
1582
1583	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1584	VB_AGE_TEST_WITH_RETURN(dev_priv);
1585
1586	buf->used = indirect->end;
1587	buf_priv->discard = indirect->discard;
1588
1589#if 0
1590	/* Wait for the 3D stream to idle before the indirect buffer
1591	 * containing 2D acceleration commands is processed.
1592	 */
1593	BEGIN_RING(2);
1594	RADEON_WAIT_UNTIL_3D_IDLE();
1595	ADVANCE_RING();
1596#endif
1597
1598	/* Dispatch the indirect buffer full of commands from the
1599	 * X server.  This is insecure and is thus only available to
1600	 * privileged clients.
1601	 */
1602	r128_cce_dispatch_indirect(dev, buf, indirect->start, indirect->end);
1603
1604	COMMIT_RING();
1605	return 0;
1606}
1607
1608static int r128_getparam(struct drm_device *dev, void *data, struct drm_file *file_priv)
1609{
1610	drm_r128_private_t *dev_priv = dev->dev_private;
1611	drm_r128_getparam_t *param = data;
1612	int value;
1613
1614	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1615
1616	DRM_DEBUG("pid=%d\n", DRM_CURRENTPID);
1617
1618	switch (param->param) {
1619	case R128_PARAM_IRQ_NR:
1620		value = drm_dev_to_irq(dev);
1621		break;
1622	default:
1623		return -EINVAL;
1624	}
1625
1626	if (DRM_COPY_TO_USER(param->value, &value, sizeof(int))) {
1627		DRM_ERROR("copy_to_user\n");
1628		return -EFAULT;
1629	}
1630
1631	return 0;
1632}
1633
1634void r128_driver_preclose(struct drm_device *dev, struct drm_file *file_priv)
1635{
1636	if (dev->dev_private) {
1637		drm_r128_private_t *dev_priv = dev->dev_private;
1638		if (dev_priv->page_flipping)
1639			r128_do_cleanup_pageflip(dev);
1640	}
1641}
1642void r128_driver_lastclose(struct drm_device *dev)
1643{
1644	r128_do_cleanup_cce(dev);
1645}
1646
1647struct drm_ioctl_desc r128_ioctls[] = {
1648	DRM_IOCTL_DEF_DRV(R128_INIT, r128_cce_init, DRM_AUTH|DRM_MASTER|DRM_ROOT_ONLY),
1649	DRM_IOCTL_DEF_DRV(R128_CCE_START, r128_cce_start, DRM_AUTH|DRM_MASTER|DRM_ROOT_ONLY),
1650	DRM_IOCTL_DEF_DRV(R128_CCE_STOP, r128_cce_stop, DRM_AUTH|DRM_MASTER|DRM_ROOT_ONLY),
1651	DRM_IOCTL_DEF_DRV(R128_CCE_RESET, r128_cce_reset, DRM_AUTH|DRM_MASTER|DRM_ROOT_ONLY),
1652	DRM_IOCTL_DEF_DRV(R128_CCE_IDLE, r128_cce_idle, DRM_AUTH),
1653	DRM_IOCTL_DEF_DRV(R128_RESET, r128_engine_reset, DRM_AUTH),
1654	DRM_IOCTL_DEF_DRV(R128_FULLSCREEN, r128_fullscreen, DRM_AUTH),
1655	DRM_IOCTL_DEF_DRV(R128_SWAP, r128_cce_swap, DRM_AUTH),
1656	DRM_IOCTL_DEF_DRV(R128_FLIP, r128_cce_flip, DRM_AUTH),
1657	DRM_IOCTL_DEF_DRV(R128_CLEAR, r128_cce_clear, DRM_AUTH),
1658	DRM_IOCTL_DEF_DRV(R128_VERTEX, r128_cce_vertex, DRM_AUTH),
1659	DRM_IOCTL_DEF_DRV(R128_INDICES, r128_cce_indices, DRM_AUTH),
1660	DRM_IOCTL_DEF_DRV(R128_BLIT, r128_cce_blit, DRM_AUTH),
1661	DRM_IOCTL_DEF_DRV(R128_DEPTH, r128_cce_depth, DRM_AUTH),
1662	DRM_IOCTL_DEF_DRV(R128_STIPPLE, r128_cce_stipple, DRM_AUTH),
1663	DRM_IOCTL_DEF_DRV(R128_INDIRECT, r128_cce_indirect, DRM_AUTH|DRM_MASTER|DRM_ROOT_ONLY),
1664	DRM_IOCTL_DEF_DRV(R128_GETPARAM, r128_getparam, DRM_AUTH),
1665};
1666
1667int r128_max_ioctl = DRM_ARRAY_SIZE(r128_ioctls);
v4.17
   1/* r128_state.c -- State support for r128 -*- linux-c -*-
   2 * Created: Thu Jan 27 02:53:43 2000 by gareth@valinux.com
   3 */
   4/*
   5 * Copyright 2000 VA Linux Systems, Inc., Sunnyvale, California.
   6 * All Rights Reserved.
   7 *
   8 * Permission is hereby granted, free of charge, to any person obtaining a
   9 * copy of this software and associated documentation files (the "Software"),
  10 * to deal in the Software without restriction, including without limitation
  11 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  12 * and/or sell copies of the Software, and to permit persons to whom the
  13 * Software is furnished to do so, subject to the following conditions:
  14 *
  15 * The above copyright notice and this permission notice (including the next
  16 * paragraph) shall be included in all copies or substantial portions of the
  17 * Software.
  18 *
  19 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  20 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  21 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
  22 * PRECISION INSIGHT AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
  23 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
  24 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
  25 * DEALINGS IN THE SOFTWARE.
  26 *
  27 * Authors:
  28 *    Gareth Hughes <gareth@valinux.com>
  29 */
  30
  31#include <drm/drmP.h>
  32#include <drm/r128_drm.h>
 
  33#include "r128_drv.h"
  34
  35/* ================================================================
  36 * CCE hardware state programming functions
  37 */
  38
  39static void r128_emit_clip_rects(drm_r128_private_t *dev_priv,
  40				 struct drm_clip_rect *boxes, int count)
  41{
  42	u32 aux_sc_cntl = 0x00000000;
  43	RING_LOCALS;
  44	DRM_DEBUG("\n");
  45
  46	BEGIN_RING((count < 3 ? count : 3) * 5 + 2);
  47
  48	if (count >= 1) {
  49		OUT_RING(CCE_PACKET0(R128_AUX1_SC_LEFT, 3));
  50		OUT_RING(boxes[0].x1);
  51		OUT_RING(boxes[0].x2 - 1);
  52		OUT_RING(boxes[0].y1);
  53		OUT_RING(boxes[0].y2 - 1);
  54
  55		aux_sc_cntl |= (R128_AUX1_SC_EN | R128_AUX1_SC_MODE_OR);
  56	}
  57	if (count >= 2) {
  58		OUT_RING(CCE_PACKET0(R128_AUX2_SC_LEFT, 3));
  59		OUT_RING(boxes[1].x1);
  60		OUT_RING(boxes[1].x2 - 1);
  61		OUT_RING(boxes[1].y1);
  62		OUT_RING(boxes[1].y2 - 1);
  63
  64		aux_sc_cntl |= (R128_AUX2_SC_EN | R128_AUX2_SC_MODE_OR);
  65	}
  66	if (count >= 3) {
  67		OUT_RING(CCE_PACKET0(R128_AUX3_SC_LEFT, 3));
  68		OUT_RING(boxes[2].x1);
  69		OUT_RING(boxes[2].x2 - 1);
  70		OUT_RING(boxes[2].y1);
  71		OUT_RING(boxes[2].y2 - 1);
  72
  73		aux_sc_cntl |= (R128_AUX3_SC_EN | R128_AUX3_SC_MODE_OR);
  74	}
  75
  76	OUT_RING(CCE_PACKET0(R128_AUX_SC_CNTL, 0));
  77	OUT_RING(aux_sc_cntl);
  78
  79	ADVANCE_RING();
  80}
  81
  82static __inline__ void r128_emit_core(drm_r128_private_t *dev_priv)
  83{
  84	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
  85	drm_r128_context_regs_t *ctx = &sarea_priv->context_state;
  86	RING_LOCALS;
  87	DRM_DEBUG("\n");
  88
  89	BEGIN_RING(2);
  90
  91	OUT_RING(CCE_PACKET0(R128_SCALE_3D_CNTL, 0));
  92	OUT_RING(ctx->scale_3d_cntl);
  93
  94	ADVANCE_RING();
  95}
  96
  97static __inline__ void r128_emit_context(drm_r128_private_t *dev_priv)
  98{
  99	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
 100	drm_r128_context_regs_t *ctx = &sarea_priv->context_state;
 101	RING_LOCALS;
 102	DRM_DEBUG("\n");
 103
 104	BEGIN_RING(13);
 105
 106	OUT_RING(CCE_PACKET0(R128_DST_PITCH_OFFSET_C, 11));
 107	OUT_RING(ctx->dst_pitch_offset_c);
 108	OUT_RING(ctx->dp_gui_master_cntl_c);
 109	OUT_RING(ctx->sc_top_left_c);
 110	OUT_RING(ctx->sc_bottom_right_c);
 111	OUT_RING(ctx->z_offset_c);
 112	OUT_RING(ctx->z_pitch_c);
 113	OUT_RING(ctx->z_sten_cntl_c);
 114	OUT_RING(ctx->tex_cntl_c);
 115	OUT_RING(ctx->misc_3d_state_cntl_reg);
 116	OUT_RING(ctx->texture_clr_cmp_clr_c);
 117	OUT_RING(ctx->texture_clr_cmp_msk_c);
 118	OUT_RING(ctx->fog_color_c);
 119
 120	ADVANCE_RING();
 121}
 122
 123static __inline__ void r128_emit_setup(drm_r128_private_t *dev_priv)
 124{
 125	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
 126	drm_r128_context_regs_t *ctx = &sarea_priv->context_state;
 127	RING_LOCALS;
 128	DRM_DEBUG("\n");
 129
 130	BEGIN_RING(3);
 131
 132	OUT_RING(CCE_PACKET1(R128_SETUP_CNTL, R128_PM4_VC_FPU_SETUP));
 133	OUT_RING(ctx->setup_cntl);
 134	OUT_RING(ctx->pm4_vc_fpu_setup);
 135
 136	ADVANCE_RING();
 137}
 138
 139static __inline__ void r128_emit_masks(drm_r128_private_t *dev_priv)
 140{
 141	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
 142	drm_r128_context_regs_t *ctx = &sarea_priv->context_state;
 143	RING_LOCALS;
 144	DRM_DEBUG("\n");
 145
 146	BEGIN_RING(5);
 147
 148	OUT_RING(CCE_PACKET0(R128_DP_WRITE_MASK, 0));
 149	OUT_RING(ctx->dp_write_mask);
 150
 151	OUT_RING(CCE_PACKET0(R128_STEN_REF_MASK_C, 1));
 152	OUT_RING(ctx->sten_ref_mask_c);
 153	OUT_RING(ctx->plane_3d_mask_c);
 154
 155	ADVANCE_RING();
 156}
 157
 158static __inline__ void r128_emit_window(drm_r128_private_t *dev_priv)
 159{
 160	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
 161	drm_r128_context_regs_t *ctx = &sarea_priv->context_state;
 162	RING_LOCALS;
 163	DRM_DEBUG("\n");
 164
 165	BEGIN_RING(2);
 166
 167	OUT_RING(CCE_PACKET0(R128_WINDOW_XY_OFFSET, 0));
 168	OUT_RING(ctx->window_xy_offset);
 169
 170	ADVANCE_RING();
 171}
 172
 173static __inline__ void r128_emit_tex0(drm_r128_private_t *dev_priv)
 174{
 175	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
 176	drm_r128_context_regs_t *ctx = &sarea_priv->context_state;
 177	drm_r128_texture_regs_t *tex = &sarea_priv->tex_state[0];
 178	int i;
 179	RING_LOCALS;
 180	DRM_DEBUG("\n");
 181
 182	BEGIN_RING(7 + R128_MAX_TEXTURE_LEVELS);
 183
 184	OUT_RING(CCE_PACKET0(R128_PRIM_TEX_CNTL_C,
 185			     2 + R128_MAX_TEXTURE_LEVELS));
 186	OUT_RING(tex->tex_cntl);
 187	OUT_RING(tex->tex_combine_cntl);
 188	OUT_RING(ctx->tex_size_pitch_c);
 189	for (i = 0; i < R128_MAX_TEXTURE_LEVELS; i++)
 190		OUT_RING(tex->tex_offset[i]);
 191
 192	OUT_RING(CCE_PACKET0(R128_CONSTANT_COLOR_C, 1));
 193	OUT_RING(ctx->constant_color_c);
 194	OUT_RING(tex->tex_border_color);
 195
 196	ADVANCE_RING();
 197}
 198
 199static __inline__ void r128_emit_tex1(drm_r128_private_t *dev_priv)
 200{
 201	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
 202	drm_r128_texture_regs_t *tex = &sarea_priv->tex_state[1];
 203	int i;
 204	RING_LOCALS;
 205	DRM_DEBUG("\n");
 206
 207	BEGIN_RING(5 + R128_MAX_TEXTURE_LEVELS);
 208
 209	OUT_RING(CCE_PACKET0(R128_SEC_TEX_CNTL_C, 1 + R128_MAX_TEXTURE_LEVELS));
 210	OUT_RING(tex->tex_cntl);
 211	OUT_RING(tex->tex_combine_cntl);
 212	for (i = 0; i < R128_MAX_TEXTURE_LEVELS; i++)
 213		OUT_RING(tex->tex_offset[i]);
 214
 215	OUT_RING(CCE_PACKET0(R128_SEC_TEXTURE_BORDER_COLOR_C, 0));
 216	OUT_RING(tex->tex_border_color);
 217
 218	ADVANCE_RING();
 219}
 220
 221static void r128_emit_state(drm_r128_private_t *dev_priv)
 222{
 223	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
 224	unsigned int dirty = sarea_priv->dirty;
 225
 226	DRM_DEBUG("dirty=0x%08x\n", dirty);
 227
 228	if (dirty & R128_UPLOAD_CORE) {
 229		r128_emit_core(dev_priv);
 230		sarea_priv->dirty &= ~R128_UPLOAD_CORE;
 231	}
 232
 233	if (dirty & R128_UPLOAD_CONTEXT) {
 234		r128_emit_context(dev_priv);
 235		sarea_priv->dirty &= ~R128_UPLOAD_CONTEXT;
 236	}
 237
 238	if (dirty & R128_UPLOAD_SETUP) {
 239		r128_emit_setup(dev_priv);
 240		sarea_priv->dirty &= ~R128_UPLOAD_SETUP;
 241	}
 242
 243	if (dirty & R128_UPLOAD_MASKS) {
 244		r128_emit_masks(dev_priv);
 245		sarea_priv->dirty &= ~R128_UPLOAD_MASKS;
 246	}
 247
 248	if (dirty & R128_UPLOAD_WINDOW) {
 249		r128_emit_window(dev_priv);
 250		sarea_priv->dirty &= ~R128_UPLOAD_WINDOW;
 251	}
 252
 253	if (dirty & R128_UPLOAD_TEX0) {
 254		r128_emit_tex0(dev_priv);
 255		sarea_priv->dirty &= ~R128_UPLOAD_TEX0;
 256	}
 257
 258	if (dirty & R128_UPLOAD_TEX1) {
 259		r128_emit_tex1(dev_priv);
 260		sarea_priv->dirty &= ~R128_UPLOAD_TEX1;
 261	}
 262
 263	/* Turn off the texture cache flushing */
 264	sarea_priv->context_state.tex_cntl_c &= ~R128_TEX_CACHE_FLUSH;
 265
 266	sarea_priv->dirty &= ~R128_REQUIRE_QUIESCENCE;
 267}
 268
 269#if R128_PERFORMANCE_BOXES
 270/* ================================================================
 271 * Performance monitoring functions
 272 */
 273
 274static void r128_clear_box(drm_r128_private_t *dev_priv,
 275			   int x, int y, int w, int h, int r, int g, int b)
 276{
 277	u32 pitch, offset;
 278	u32 fb_bpp, color;
 279	RING_LOCALS;
 280
 281	switch (dev_priv->fb_bpp) {
 282	case 16:
 283		fb_bpp = R128_GMC_DST_16BPP;
 284		color = (((r & 0xf8) << 8) |
 285			 ((g & 0xfc) << 3) | ((b & 0xf8) >> 3));
 286		break;
 287	case 24:
 288		fb_bpp = R128_GMC_DST_24BPP;
 289		color = ((r << 16) | (g << 8) | b);
 290		break;
 291	case 32:
 292		fb_bpp = R128_GMC_DST_32BPP;
 293		color = (((0xff) << 24) | (r << 16) | (g << 8) | b);
 294		break;
 295	default:
 296		return;
 297	}
 298
 299	offset = dev_priv->back_offset;
 300	pitch = dev_priv->back_pitch >> 3;
 301
 302	BEGIN_RING(6);
 303
 304	OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
 305	OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
 306		 R128_GMC_BRUSH_SOLID_COLOR |
 307		 fb_bpp |
 308		 R128_GMC_SRC_DATATYPE_COLOR |
 309		 R128_ROP3_P |
 310		 R128_GMC_CLR_CMP_CNTL_DIS | R128_GMC_AUX_CLIP_DIS);
 311
 312	OUT_RING((pitch << 21) | (offset >> 5));
 313	OUT_RING(color);
 314
 315	OUT_RING((x << 16) | y);
 316	OUT_RING((w << 16) | h);
 317
 318	ADVANCE_RING();
 319}
 320
 321static void r128_cce_performance_boxes(drm_r128_private_t *dev_priv)
 322{
 323	if (atomic_read(&dev_priv->idle_count) == 0)
 324		r128_clear_box(dev_priv, 64, 4, 8, 8, 0, 255, 0);
 325	else
 326		atomic_set(&dev_priv->idle_count, 0);
 327}
 328
 329#endif
 330
 331/* ================================================================
 332 * CCE command dispatch functions
 333 */
 334
 335static void r128_print_dirty(const char *msg, unsigned int flags)
 336{
 337	DRM_INFO("%s: (0x%x) %s%s%s%s%s%s%s%s%s\n",
 338		 msg,
 339		 flags,
 340		 (flags & R128_UPLOAD_CORE) ? "core, " : "",
 341		 (flags & R128_UPLOAD_CONTEXT) ? "context, " : "",
 342		 (flags & R128_UPLOAD_SETUP) ? "setup, " : "",
 343		 (flags & R128_UPLOAD_TEX0) ? "tex0, " : "",
 344		 (flags & R128_UPLOAD_TEX1) ? "tex1, " : "",
 345		 (flags & R128_UPLOAD_MASKS) ? "masks, " : "",
 346		 (flags & R128_UPLOAD_WINDOW) ? "window, " : "",
 347		 (flags & R128_UPLOAD_CLIPRECTS) ? "cliprects, " : "",
 348		 (flags & R128_REQUIRE_QUIESCENCE) ? "quiescence, " : "");
 349}
 350
 351static void r128_cce_dispatch_clear(struct drm_device *dev,
 352				    drm_r128_clear_t *clear)
 353{
 354	drm_r128_private_t *dev_priv = dev->dev_private;
 355	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
 356	int nbox = sarea_priv->nbox;
 357	struct drm_clip_rect *pbox = sarea_priv->boxes;
 358	unsigned int flags = clear->flags;
 359	int i;
 360	RING_LOCALS;
 361	DRM_DEBUG("\n");
 362
 363	if (dev_priv->page_flipping && dev_priv->current_page == 1) {
 364		unsigned int tmp = flags;
 365
 366		flags &= ~(R128_FRONT | R128_BACK);
 367		if (tmp & R128_FRONT)
 368			flags |= R128_BACK;
 369		if (tmp & R128_BACK)
 370			flags |= R128_FRONT;
 371	}
 372
 373	for (i = 0; i < nbox; i++) {
 374		int x = pbox[i].x1;
 375		int y = pbox[i].y1;
 376		int w = pbox[i].x2 - x;
 377		int h = pbox[i].y2 - y;
 378
 379		DRM_DEBUG("dispatch clear %d,%d-%d,%d flags 0x%x\n",
 380			  pbox[i].x1, pbox[i].y1, pbox[i].x2,
 381			  pbox[i].y2, flags);
 382
 383		if (flags & (R128_FRONT | R128_BACK)) {
 384			BEGIN_RING(2);
 385
 386			OUT_RING(CCE_PACKET0(R128_DP_WRITE_MASK, 0));
 387			OUT_RING(clear->color_mask);
 388
 389			ADVANCE_RING();
 390		}
 391
 392		if (flags & R128_FRONT) {
 393			BEGIN_RING(6);
 394
 395			OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
 396			OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
 397				 R128_GMC_BRUSH_SOLID_COLOR |
 398				 (dev_priv->color_fmt << 8) |
 399				 R128_GMC_SRC_DATATYPE_COLOR |
 400				 R128_ROP3_P |
 401				 R128_GMC_CLR_CMP_CNTL_DIS |
 402				 R128_GMC_AUX_CLIP_DIS);
 403
 404			OUT_RING(dev_priv->front_pitch_offset_c);
 405			OUT_RING(clear->clear_color);
 406
 407			OUT_RING((x << 16) | y);
 408			OUT_RING((w << 16) | h);
 409
 410			ADVANCE_RING();
 411		}
 412
 413		if (flags & R128_BACK) {
 414			BEGIN_RING(6);
 415
 416			OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
 417			OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
 418				 R128_GMC_BRUSH_SOLID_COLOR |
 419				 (dev_priv->color_fmt << 8) |
 420				 R128_GMC_SRC_DATATYPE_COLOR |
 421				 R128_ROP3_P |
 422				 R128_GMC_CLR_CMP_CNTL_DIS |
 423				 R128_GMC_AUX_CLIP_DIS);
 424
 425			OUT_RING(dev_priv->back_pitch_offset_c);
 426			OUT_RING(clear->clear_color);
 427
 428			OUT_RING((x << 16) | y);
 429			OUT_RING((w << 16) | h);
 430
 431			ADVANCE_RING();
 432		}
 433
 434		if (flags & R128_DEPTH) {
 435			BEGIN_RING(6);
 436
 437			OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
 438			OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
 439				 R128_GMC_BRUSH_SOLID_COLOR |
 440				 (dev_priv->depth_fmt << 8) |
 441				 R128_GMC_SRC_DATATYPE_COLOR |
 442				 R128_ROP3_P |
 443				 R128_GMC_CLR_CMP_CNTL_DIS |
 444				 R128_GMC_AUX_CLIP_DIS | R128_GMC_WR_MSK_DIS);
 445
 446			OUT_RING(dev_priv->depth_pitch_offset_c);
 447			OUT_RING(clear->clear_depth);
 448
 449			OUT_RING((x << 16) | y);
 450			OUT_RING((w << 16) | h);
 451
 452			ADVANCE_RING();
 453		}
 454	}
 455}
 456
 457static void r128_cce_dispatch_swap(struct drm_device *dev)
 458{
 459	drm_r128_private_t *dev_priv = dev->dev_private;
 460	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
 461	int nbox = sarea_priv->nbox;
 462	struct drm_clip_rect *pbox = sarea_priv->boxes;
 463	int i;
 464	RING_LOCALS;
 465	DRM_DEBUG("\n");
 466
 467#if R128_PERFORMANCE_BOXES
 468	/* Do some trivial performance monitoring...
 469	 */
 470	r128_cce_performance_boxes(dev_priv);
 471#endif
 472
 473	for (i = 0; i < nbox; i++) {
 474		int x = pbox[i].x1;
 475		int y = pbox[i].y1;
 476		int w = pbox[i].x2 - x;
 477		int h = pbox[i].y2 - y;
 478
 479		BEGIN_RING(7);
 480
 481		OUT_RING(CCE_PACKET3(R128_CNTL_BITBLT_MULTI, 5));
 482		OUT_RING(R128_GMC_SRC_PITCH_OFFSET_CNTL |
 483			 R128_GMC_DST_PITCH_OFFSET_CNTL |
 484			 R128_GMC_BRUSH_NONE |
 485			 (dev_priv->color_fmt << 8) |
 486			 R128_GMC_SRC_DATATYPE_COLOR |
 487			 R128_ROP3_S |
 488			 R128_DP_SRC_SOURCE_MEMORY |
 489			 R128_GMC_CLR_CMP_CNTL_DIS |
 490			 R128_GMC_AUX_CLIP_DIS | R128_GMC_WR_MSK_DIS);
 491
 492		/* Make this work even if front & back are flipped:
 493		 */
 494		if (dev_priv->current_page == 0) {
 495			OUT_RING(dev_priv->back_pitch_offset_c);
 496			OUT_RING(dev_priv->front_pitch_offset_c);
 497		} else {
 498			OUT_RING(dev_priv->front_pitch_offset_c);
 499			OUT_RING(dev_priv->back_pitch_offset_c);
 500		}
 501
 502		OUT_RING((x << 16) | y);
 503		OUT_RING((x << 16) | y);
 504		OUT_RING((w << 16) | h);
 505
 506		ADVANCE_RING();
 507	}
 508
 509	/* Increment the frame counter.  The client-side 3D driver must
 510	 * throttle the framerate by waiting for this value before
 511	 * performing the swapbuffer ioctl.
 512	 */
 513	dev_priv->sarea_priv->last_frame++;
 514
 515	BEGIN_RING(2);
 516
 517	OUT_RING(CCE_PACKET0(R128_LAST_FRAME_REG, 0));
 518	OUT_RING(dev_priv->sarea_priv->last_frame);
 519
 520	ADVANCE_RING();
 521}
 522
 523static void r128_cce_dispatch_flip(struct drm_device *dev)
 524{
 525	drm_r128_private_t *dev_priv = dev->dev_private;
 526	RING_LOCALS;
 527	DRM_DEBUG("page=%d pfCurrentPage=%d\n",
 528		  dev_priv->current_page, dev_priv->sarea_priv->pfCurrentPage);
 529
 530#if R128_PERFORMANCE_BOXES
 531	/* Do some trivial performance monitoring...
 532	 */
 533	r128_cce_performance_boxes(dev_priv);
 534#endif
 535
 536	BEGIN_RING(4);
 537
 538	R128_WAIT_UNTIL_PAGE_FLIPPED();
 539	OUT_RING(CCE_PACKET0(R128_CRTC_OFFSET, 0));
 540
 541	if (dev_priv->current_page == 0)
 542		OUT_RING(dev_priv->back_offset);
 543	else
 544		OUT_RING(dev_priv->front_offset);
 545
 546	ADVANCE_RING();
 547
 548	/* Increment the frame counter.  The client-side 3D driver must
 549	 * throttle the framerate by waiting for this value before
 550	 * performing the swapbuffer ioctl.
 551	 */
 552	dev_priv->sarea_priv->last_frame++;
 553	dev_priv->sarea_priv->pfCurrentPage = dev_priv->current_page =
 554	    1 - dev_priv->current_page;
 555
 556	BEGIN_RING(2);
 557
 558	OUT_RING(CCE_PACKET0(R128_LAST_FRAME_REG, 0));
 559	OUT_RING(dev_priv->sarea_priv->last_frame);
 560
 561	ADVANCE_RING();
 562}
 563
 564static void r128_cce_dispatch_vertex(struct drm_device *dev, struct drm_buf *buf)
 565{
 566	drm_r128_private_t *dev_priv = dev->dev_private;
 567	drm_r128_buf_priv_t *buf_priv = buf->dev_private;
 568	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
 569	int format = sarea_priv->vc_format;
 570	int offset = buf->bus_address;
 571	int size = buf->used;
 572	int prim = buf_priv->prim;
 573	int i = 0;
 574	RING_LOCALS;
 575	DRM_DEBUG("buf=%d nbox=%d\n", buf->idx, sarea_priv->nbox);
 576
 577	if (0)
 578		r128_print_dirty("dispatch_vertex", sarea_priv->dirty);
 579
 580	if (buf->used) {
 581		buf_priv->dispatched = 1;
 582
 583		if (sarea_priv->dirty & ~R128_UPLOAD_CLIPRECTS)
 584			r128_emit_state(dev_priv);
 585
 586		do {
 587			/* Emit the next set of up to three cliprects */
 588			if (i < sarea_priv->nbox) {
 589				r128_emit_clip_rects(dev_priv,
 590						     &sarea_priv->boxes[i],
 591						     sarea_priv->nbox - i);
 592			}
 593
 594			/* Emit the vertex buffer rendering commands */
 595			BEGIN_RING(5);
 596
 597			OUT_RING(CCE_PACKET3(R128_3D_RNDR_GEN_INDX_PRIM, 3));
 598			OUT_RING(offset);
 599			OUT_RING(size);
 600			OUT_RING(format);
 601			OUT_RING(prim | R128_CCE_VC_CNTL_PRIM_WALK_LIST |
 602				 (size << R128_CCE_VC_CNTL_NUM_SHIFT));
 603
 604			ADVANCE_RING();
 605
 606			i += 3;
 607		} while (i < sarea_priv->nbox);
 608	}
 609
 610	if (buf_priv->discard) {
 611		buf_priv->age = dev_priv->sarea_priv->last_dispatch;
 612
 613		/* Emit the vertex buffer age */
 614		BEGIN_RING(2);
 615
 616		OUT_RING(CCE_PACKET0(R128_LAST_DISPATCH_REG, 0));
 617		OUT_RING(buf_priv->age);
 618
 619		ADVANCE_RING();
 620
 621		buf->pending = 1;
 622		buf->used = 0;
 623		/* FIXME: Check dispatched field */
 624		buf_priv->dispatched = 0;
 625	}
 626
 627	dev_priv->sarea_priv->last_dispatch++;
 628
 629	sarea_priv->dirty &= ~R128_UPLOAD_CLIPRECTS;
 630	sarea_priv->nbox = 0;
 631}
 632
 633static void r128_cce_dispatch_indirect(struct drm_device *dev,
 634				       struct drm_buf *buf, int start, int end)
 635{
 636	drm_r128_private_t *dev_priv = dev->dev_private;
 637	drm_r128_buf_priv_t *buf_priv = buf->dev_private;
 638	RING_LOCALS;
 639	DRM_DEBUG("indirect: buf=%d s=0x%x e=0x%x\n", buf->idx, start, end);
 640
 641	if (start != end) {
 642		int offset = buf->bus_address + start;
 643		int dwords = (end - start + 3) / sizeof(u32);
 644
 645		/* Indirect buffer data must be an even number of
 646		 * dwords, so if we've been given an odd number we must
 647		 * pad the data with a Type-2 CCE packet.
 648		 */
 649		if (dwords & 1) {
 650			u32 *data = (u32 *)
 651			    ((char *)dev->agp_buffer_map->handle
 652			     + buf->offset + start);
 653			data[dwords++] = cpu_to_le32(R128_CCE_PACKET2);
 654		}
 655
 656		buf_priv->dispatched = 1;
 657
 658		/* Fire off the indirect buffer */
 659		BEGIN_RING(3);
 660
 661		OUT_RING(CCE_PACKET0(R128_PM4_IW_INDOFF, 1));
 662		OUT_RING(offset);
 663		OUT_RING(dwords);
 664
 665		ADVANCE_RING();
 666	}
 667
 668	if (buf_priv->discard) {
 669		buf_priv->age = dev_priv->sarea_priv->last_dispatch;
 670
 671		/* Emit the indirect buffer age */
 672		BEGIN_RING(2);
 673
 674		OUT_RING(CCE_PACKET0(R128_LAST_DISPATCH_REG, 0));
 675		OUT_RING(buf_priv->age);
 676
 677		ADVANCE_RING();
 678
 679		buf->pending = 1;
 680		buf->used = 0;
 681		/* FIXME: Check dispatched field */
 682		buf_priv->dispatched = 0;
 683	}
 684
 685	dev_priv->sarea_priv->last_dispatch++;
 686}
 687
 688static void r128_cce_dispatch_indices(struct drm_device *dev,
 689				      struct drm_buf *buf,
 690				      int start, int end, int count)
 691{
 692	drm_r128_private_t *dev_priv = dev->dev_private;
 693	drm_r128_buf_priv_t *buf_priv = buf->dev_private;
 694	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
 695	int format = sarea_priv->vc_format;
 696	int offset = dev->agp_buffer_map->offset - dev_priv->cce_buffers_offset;
 697	int prim = buf_priv->prim;
 698	u32 *data;
 699	int dwords;
 700	int i = 0;
 701	RING_LOCALS;
 702	DRM_DEBUG("indices: s=%d e=%d c=%d\n", start, end, count);
 703
 704	if (0)
 705		r128_print_dirty("dispatch_indices", sarea_priv->dirty);
 706
 707	if (start != end) {
 708		buf_priv->dispatched = 1;
 709
 710		if (sarea_priv->dirty & ~R128_UPLOAD_CLIPRECTS)
 711			r128_emit_state(dev_priv);
 712
 713		dwords = (end - start + 3) / sizeof(u32);
 714
 715		data = (u32 *) ((char *)dev->agp_buffer_map->handle
 716				+ buf->offset + start);
 717
 718		data[0] = cpu_to_le32(CCE_PACKET3(R128_3D_RNDR_GEN_INDX_PRIM,
 719						  dwords - 2));
 720
 721		data[1] = cpu_to_le32(offset);
 722		data[2] = cpu_to_le32(R128_MAX_VB_VERTS);
 723		data[3] = cpu_to_le32(format);
 724		data[4] = cpu_to_le32((prim | R128_CCE_VC_CNTL_PRIM_WALK_IND |
 725				       (count << 16)));
 726
 727		if (count & 0x1) {
 728#ifdef __LITTLE_ENDIAN
 729			data[dwords - 1] &= 0x0000ffff;
 730#else
 731			data[dwords - 1] &= 0xffff0000;
 732#endif
 733		}
 734
 735		do {
 736			/* Emit the next set of up to three cliprects */
 737			if (i < sarea_priv->nbox) {
 738				r128_emit_clip_rects(dev_priv,
 739						     &sarea_priv->boxes[i],
 740						     sarea_priv->nbox - i);
 741			}
 742
 743			r128_cce_dispatch_indirect(dev, buf, start, end);
 744
 745			i += 3;
 746		} while (i < sarea_priv->nbox);
 747	}
 748
 749	if (buf_priv->discard) {
 750		buf_priv->age = dev_priv->sarea_priv->last_dispatch;
 751
 752		/* Emit the vertex buffer age */
 753		BEGIN_RING(2);
 754
 755		OUT_RING(CCE_PACKET0(R128_LAST_DISPATCH_REG, 0));
 756		OUT_RING(buf_priv->age);
 757
 758		ADVANCE_RING();
 759
 760		buf->pending = 1;
 761		/* FIXME: Check dispatched field */
 762		buf_priv->dispatched = 0;
 763	}
 764
 765	dev_priv->sarea_priv->last_dispatch++;
 766
 767	sarea_priv->dirty &= ~R128_UPLOAD_CLIPRECTS;
 768	sarea_priv->nbox = 0;
 769}
 770
 771static int r128_cce_dispatch_blit(struct drm_device *dev,
 772				  struct drm_file *file_priv,
 773				  drm_r128_blit_t *blit)
 774{
 775	drm_r128_private_t *dev_priv = dev->dev_private;
 776	struct drm_device_dma *dma = dev->dma;
 777	struct drm_buf *buf;
 778	drm_r128_buf_priv_t *buf_priv;
 779	u32 *data;
 780	int dword_shift, dwords;
 781	RING_LOCALS;
 782	DRM_DEBUG("\n");
 783
 784	/* The compiler won't optimize away a division by a variable,
 785	 * even if the only legal values are powers of two.  Thus, we'll
 786	 * use a shift instead.
 787	 */
 788	switch (blit->format) {
 789	case R128_DATATYPE_ARGB8888:
 790		dword_shift = 0;
 791		break;
 792	case R128_DATATYPE_ARGB1555:
 793	case R128_DATATYPE_RGB565:
 794	case R128_DATATYPE_ARGB4444:
 795	case R128_DATATYPE_YVYU422:
 796	case R128_DATATYPE_VYUY422:
 797		dword_shift = 1;
 798		break;
 799	case R128_DATATYPE_CI8:
 800	case R128_DATATYPE_RGB8:
 801		dword_shift = 2;
 802		break;
 803	default:
 804		DRM_ERROR("invalid blit format %d\n", blit->format);
 805		return -EINVAL;
 806	}
 807
 808	/* Flush the pixel cache, and mark the contents as Read Invalid.
 809	 * This ensures no pixel data gets mixed up with the texture
 810	 * data from the host data blit, otherwise part of the texture
 811	 * image may be corrupted.
 812	 */
 813	BEGIN_RING(2);
 814
 815	OUT_RING(CCE_PACKET0(R128_PC_GUI_CTLSTAT, 0));
 816	OUT_RING(R128_PC_RI_GUI | R128_PC_FLUSH_GUI);
 817
 818	ADVANCE_RING();
 819
 820	/* Dispatch the indirect buffer.
 821	 */
 822	buf = dma->buflist[blit->idx];
 823	buf_priv = buf->dev_private;
 824
 825	if (buf->file_priv != file_priv) {
 826		DRM_ERROR("process %d using buffer owned by %p\n",
 827			  DRM_CURRENTPID, buf->file_priv);
 828		return -EINVAL;
 829	}
 830	if (buf->pending) {
 831		DRM_ERROR("sending pending buffer %d\n", blit->idx);
 832		return -EINVAL;
 833	}
 834
 835	buf_priv->discard = 1;
 836
 837	dwords = (blit->width * blit->height) >> dword_shift;
 838
 839	data = (u32 *) ((char *)dev->agp_buffer_map->handle + buf->offset);
 840
 841	data[0] = cpu_to_le32(CCE_PACKET3(R128_CNTL_HOSTDATA_BLT, dwords + 6));
 842	data[1] = cpu_to_le32((R128_GMC_DST_PITCH_OFFSET_CNTL |
 843			       R128_GMC_BRUSH_NONE |
 844			       (blit->format << 8) |
 845			       R128_GMC_SRC_DATATYPE_COLOR |
 846			       R128_ROP3_S |
 847			       R128_DP_SRC_SOURCE_HOST_DATA |
 848			       R128_GMC_CLR_CMP_CNTL_DIS |
 849			       R128_GMC_AUX_CLIP_DIS | R128_GMC_WR_MSK_DIS));
 850
 851	data[2] = cpu_to_le32((blit->pitch << 21) | (blit->offset >> 5));
 852	data[3] = cpu_to_le32(0xffffffff);
 853	data[4] = cpu_to_le32(0xffffffff);
 854	data[5] = cpu_to_le32((blit->y << 16) | blit->x);
 855	data[6] = cpu_to_le32((blit->height << 16) | blit->width);
 856	data[7] = cpu_to_le32(dwords);
 857
 858	buf->used = (dwords + 8) * sizeof(u32);
 859
 860	r128_cce_dispatch_indirect(dev, buf, 0, buf->used);
 861
 862	/* Flush the pixel cache after the blit completes.  This ensures
 863	 * the texture data is written out to memory before rendering
 864	 * continues.
 865	 */
 866	BEGIN_RING(2);
 867
 868	OUT_RING(CCE_PACKET0(R128_PC_GUI_CTLSTAT, 0));
 869	OUT_RING(R128_PC_FLUSH_GUI);
 870
 871	ADVANCE_RING();
 872
 873	return 0;
 874}
 875
 876/* ================================================================
 877 * Tiled depth buffer management
 878 *
 879 * FIXME: These should all set the destination write mask for when we
 880 * have hardware stencil support.
 881 */
 882
 883static int r128_cce_dispatch_write_span(struct drm_device *dev,
 884					drm_r128_depth_t *depth)
 885{
 886	drm_r128_private_t *dev_priv = dev->dev_private;
 887	int count, x, y;
 888	u32 *buffer;
 889	u8 *mask;
 890	int i, buffer_size, mask_size;
 891	RING_LOCALS;
 892	DRM_DEBUG("\n");
 893
 894	count = depth->n;
 895	if (count > 4096 || count <= 0)
 896		return -EMSGSIZE;
 897
 898	if (copy_from_user(&x, depth->x, sizeof(x)))
 899		return -EFAULT;
 900	if (copy_from_user(&y, depth->y, sizeof(y)))
 901		return -EFAULT;
 902
 903	buffer_size = depth->n * sizeof(u32);
 904	buffer = memdup_user(depth->buffer, buffer_size);
 905	if (IS_ERR(buffer))
 906		return PTR_ERR(buffer);
 
 
 
 
 907
 908	mask_size = depth->n;
 909	if (depth->mask) {
 910		mask = memdup_user(depth->mask, mask_size);
 911		if (IS_ERR(mask)) {
 
 
 
 
 912			kfree(buffer);
 913			return PTR_ERR(mask);
 
 914		}
 915
 916		for (i = 0; i < count; i++, x++) {
 917			if (mask[i]) {
 918				BEGIN_RING(6);
 919
 920				OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
 921				OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
 922					 R128_GMC_BRUSH_SOLID_COLOR |
 923					 (dev_priv->depth_fmt << 8) |
 924					 R128_GMC_SRC_DATATYPE_COLOR |
 925					 R128_ROP3_P |
 926					 R128_GMC_CLR_CMP_CNTL_DIS |
 927					 R128_GMC_WR_MSK_DIS);
 928
 929				OUT_RING(dev_priv->depth_pitch_offset_c);
 930				OUT_RING(buffer[i]);
 931
 932				OUT_RING((x << 16) | y);
 933				OUT_RING((1 << 16) | 1);
 934
 935				ADVANCE_RING();
 936			}
 937		}
 938
 939		kfree(mask);
 940	} else {
 941		for (i = 0; i < count; i++, x++) {
 942			BEGIN_RING(6);
 943
 944			OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
 945			OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
 946				 R128_GMC_BRUSH_SOLID_COLOR |
 947				 (dev_priv->depth_fmt << 8) |
 948				 R128_GMC_SRC_DATATYPE_COLOR |
 949				 R128_ROP3_P |
 950				 R128_GMC_CLR_CMP_CNTL_DIS |
 951				 R128_GMC_WR_MSK_DIS);
 952
 953			OUT_RING(dev_priv->depth_pitch_offset_c);
 954			OUT_RING(buffer[i]);
 955
 956			OUT_RING((x << 16) | y);
 957			OUT_RING((1 << 16) | 1);
 958
 959			ADVANCE_RING();
 960		}
 961	}
 962
 963	kfree(buffer);
 964
 965	return 0;
 966}
 967
 968static int r128_cce_dispatch_write_pixels(struct drm_device *dev,
 969					  drm_r128_depth_t *depth)
 970{
 971	drm_r128_private_t *dev_priv = dev->dev_private;
 972	int count, *x, *y;
 973	u32 *buffer;
 974	u8 *mask;
 975	int i, xbuf_size, ybuf_size, buffer_size, mask_size;
 976	RING_LOCALS;
 977	DRM_DEBUG("\n");
 978
 979	count = depth->n;
 980	if (count > 4096 || count <= 0)
 981		return -EMSGSIZE;
 982
 983	xbuf_size = count * sizeof(*x);
 984	ybuf_size = count * sizeof(*y);
 985	x = memdup_user(depth->x, xbuf_size);
 986	if (IS_ERR(x))
 987		return PTR_ERR(x);
 988	y = memdup_user(depth->y, ybuf_size);
 989	if (IS_ERR(y)) {
 990		kfree(x);
 991		return PTR_ERR(y);
 
 
 
 
 
 992	}
 
 
 
 
 
 
 993	buffer_size = depth->n * sizeof(u32);
 994	buffer = memdup_user(depth->buffer, buffer_size);
 995	if (IS_ERR(buffer)) {
 
 
 
 
 
 996		kfree(x);
 997		kfree(y);
 998		return PTR_ERR(buffer);
 
 999	}
1000
1001	if (depth->mask) {
1002		mask_size = depth->n;
1003		mask = memdup_user(depth->mask, mask_size);
1004		if (IS_ERR(mask)) {
 
 
 
 
 
 
1005			kfree(x);
1006			kfree(y);
1007			kfree(buffer);
1008			return PTR_ERR(mask);
 
1009		}
1010
1011		for (i = 0; i < count; i++) {
1012			if (mask[i]) {
1013				BEGIN_RING(6);
1014
1015				OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
1016				OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
1017					 R128_GMC_BRUSH_SOLID_COLOR |
1018					 (dev_priv->depth_fmt << 8) |
1019					 R128_GMC_SRC_DATATYPE_COLOR |
1020					 R128_ROP3_P |
1021					 R128_GMC_CLR_CMP_CNTL_DIS |
1022					 R128_GMC_WR_MSK_DIS);
1023
1024				OUT_RING(dev_priv->depth_pitch_offset_c);
1025				OUT_RING(buffer[i]);
1026
1027				OUT_RING((x[i] << 16) | y[i]);
1028				OUT_RING((1 << 16) | 1);
1029
1030				ADVANCE_RING();
1031			}
1032		}
1033
1034		kfree(mask);
1035	} else {
1036		for (i = 0; i < count; i++) {
1037			BEGIN_RING(6);
1038
1039			OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
1040			OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
1041				 R128_GMC_BRUSH_SOLID_COLOR |
1042				 (dev_priv->depth_fmt << 8) |
1043				 R128_GMC_SRC_DATATYPE_COLOR |
1044				 R128_ROP3_P |
1045				 R128_GMC_CLR_CMP_CNTL_DIS |
1046				 R128_GMC_WR_MSK_DIS);
1047
1048			OUT_RING(dev_priv->depth_pitch_offset_c);
1049			OUT_RING(buffer[i]);
1050
1051			OUT_RING((x[i] << 16) | y[i]);
1052			OUT_RING((1 << 16) | 1);
1053
1054			ADVANCE_RING();
1055		}
1056	}
1057
1058	kfree(x);
1059	kfree(y);
1060	kfree(buffer);
1061
1062	return 0;
1063}
1064
1065static int r128_cce_dispatch_read_span(struct drm_device *dev,
1066				       drm_r128_depth_t *depth)
1067{
1068	drm_r128_private_t *dev_priv = dev->dev_private;
1069	int count, x, y;
1070	RING_LOCALS;
1071	DRM_DEBUG("\n");
1072
1073	count = depth->n;
1074	if (count > 4096 || count <= 0)
1075		return -EMSGSIZE;
1076
1077	if (copy_from_user(&x, depth->x, sizeof(x)))
1078		return -EFAULT;
1079	if (copy_from_user(&y, depth->y, sizeof(y)))
1080		return -EFAULT;
1081
1082	BEGIN_RING(7);
1083
1084	OUT_RING(CCE_PACKET3(R128_CNTL_BITBLT_MULTI, 5));
1085	OUT_RING(R128_GMC_SRC_PITCH_OFFSET_CNTL |
1086		 R128_GMC_DST_PITCH_OFFSET_CNTL |
1087		 R128_GMC_BRUSH_NONE |
1088		 (dev_priv->depth_fmt << 8) |
1089		 R128_GMC_SRC_DATATYPE_COLOR |
1090		 R128_ROP3_S |
1091		 R128_DP_SRC_SOURCE_MEMORY |
1092		 R128_GMC_CLR_CMP_CNTL_DIS | R128_GMC_WR_MSK_DIS);
1093
1094	OUT_RING(dev_priv->depth_pitch_offset_c);
1095	OUT_RING(dev_priv->span_pitch_offset_c);
1096
1097	OUT_RING((x << 16) | y);
1098	OUT_RING((0 << 16) | 0);
1099	OUT_RING((count << 16) | 1);
1100
1101	ADVANCE_RING();
1102
1103	return 0;
1104}
1105
1106static int r128_cce_dispatch_read_pixels(struct drm_device *dev,
1107					 drm_r128_depth_t *depth)
1108{
1109	drm_r128_private_t *dev_priv = dev->dev_private;
1110	int count, *x, *y;
1111	int i, xbuf_size, ybuf_size;
1112	RING_LOCALS;
1113	DRM_DEBUG("\n");
1114
1115	count = depth->n;
1116	if (count > 4096 || count <= 0)
1117		return -EMSGSIZE;
1118
1119	if (count > dev_priv->depth_pitch)
1120		count = dev_priv->depth_pitch;
1121
1122	xbuf_size = count * sizeof(*x);
1123	ybuf_size = count * sizeof(*y);
1124	x = kmalloc(xbuf_size, GFP_KERNEL);
1125	if (x == NULL)
1126		return -ENOMEM;
1127	y = kmalloc(ybuf_size, GFP_KERNEL);
1128	if (y == NULL) {
1129		kfree(x);
1130		return -ENOMEM;
1131	}
1132	if (copy_from_user(x, depth->x, xbuf_size)) {
1133		kfree(x);
1134		kfree(y);
1135		return -EFAULT;
1136	}
1137	if (copy_from_user(y, depth->y, ybuf_size)) {
1138		kfree(x);
1139		kfree(y);
1140		return -EFAULT;
1141	}
1142
1143	for (i = 0; i < count; i++) {
1144		BEGIN_RING(7);
1145
1146		OUT_RING(CCE_PACKET3(R128_CNTL_BITBLT_MULTI, 5));
1147		OUT_RING(R128_GMC_SRC_PITCH_OFFSET_CNTL |
1148			 R128_GMC_DST_PITCH_OFFSET_CNTL |
1149			 R128_GMC_BRUSH_NONE |
1150			 (dev_priv->depth_fmt << 8) |
1151			 R128_GMC_SRC_DATATYPE_COLOR |
1152			 R128_ROP3_S |
1153			 R128_DP_SRC_SOURCE_MEMORY |
1154			 R128_GMC_CLR_CMP_CNTL_DIS | R128_GMC_WR_MSK_DIS);
1155
1156		OUT_RING(dev_priv->depth_pitch_offset_c);
1157		OUT_RING(dev_priv->span_pitch_offset_c);
1158
1159		OUT_RING((x[i] << 16) | y[i]);
1160		OUT_RING((i << 16) | 0);
1161		OUT_RING((1 << 16) | 1);
1162
1163		ADVANCE_RING();
1164	}
1165
1166	kfree(x);
1167	kfree(y);
1168
1169	return 0;
1170}
1171
1172/* ================================================================
1173 * Polygon stipple
1174 */
1175
1176static void r128_cce_dispatch_stipple(struct drm_device *dev, u32 *stipple)
1177{
1178	drm_r128_private_t *dev_priv = dev->dev_private;
1179	int i;
1180	RING_LOCALS;
1181	DRM_DEBUG("\n");
1182
1183	BEGIN_RING(33);
1184
1185	OUT_RING(CCE_PACKET0(R128_BRUSH_DATA0, 31));
1186	for (i = 0; i < 32; i++)
1187		OUT_RING(stipple[i]);
1188
1189	ADVANCE_RING();
1190}
1191
1192/* ================================================================
1193 * IOCTL functions
1194 */
1195
1196static int r128_cce_clear(struct drm_device *dev, void *data, struct drm_file *file_priv)
1197{
1198	drm_r128_private_t *dev_priv = dev->dev_private;
1199	drm_r128_sarea_t *sarea_priv;
1200	drm_r128_clear_t *clear = data;
1201	DRM_DEBUG("\n");
1202
1203	LOCK_TEST_WITH_RETURN(dev, file_priv);
1204
1205	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1206
1207	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1208
1209	sarea_priv = dev_priv->sarea_priv;
1210
1211	if (sarea_priv->nbox > R128_NR_SAREA_CLIPRECTS)
1212		sarea_priv->nbox = R128_NR_SAREA_CLIPRECTS;
1213
1214	r128_cce_dispatch_clear(dev, clear);
1215	COMMIT_RING();
1216
1217	/* Make sure we restore the 3D state next time.
1218	 */
1219	dev_priv->sarea_priv->dirty |= R128_UPLOAD_CONTEXT | R128_UPLOAD_MASKS;
1220
1221	return 0;
1222}
1223
1224static int r128_do_init_pageflip(struct drm_device *dev)
1225{
1226	drm_r128_private_t *dev_priv = dev->dev_private;
1227	DRM_DEBUG("\n");
1228
1229	dev_priv->crtc_offset = R128_READ(R128_CRTC_OFFSET);
1230	dev_priv->crtc_offset_cntl = R128_READ(R128_CRTC_OFFSET_CNTL);
1231
1232	R128_WRITE(R128_CRTC_OFFSET, dev_priv->front_offset);
1233	R128_WRITE(R128_CRTC_OFFSET_CNTL,
1234		   dev_priv->crtc_offset_cntl | R128_CRTC_OFFSET_FLIP_CNTL);
1235
1236	dev_priv->page_flipping = 1;
1237	dev_priv->current_page = 0;
1238	dev_priv->sarea_priv->pfCurrentPage = dev_priv->current_page;
1239
1240	return 0;
1241}
1242
1243static int r128_do_cleanup_pageflip(struct drm_device *dev)
1244{
1245	drm_r128_private_t *dev_priv = dev->dev_private;
1246	DRM_DEBUG("\n");
1247
1248	R128_WRITE(R128_CRTC_OFFSET, dev_priv->crtc_offset);
1249	R128_WRITE(R128_CRTC_OFFSET_CNTL, dev_priv->crtc_offset_cntl);
1250
1251	if (dev_priv->current_page != 0) {
1252		r128_cce_dispatch_flip(dev);
1253		COMMIT_RING();
1254	}
1255
1256	dev_priv->page_flipping = 0;
1257	return 0;
1258}
1259
1260/* Swapping and flipping are different operations, need different ioctls.
1261 * They can & should be intermixed to support multiple 3d windows.
1262 */
1263
1264static int r128_cce_flip(struct drm_device *dev, void *data, struct drm_file *file_priv)
1265{
1266	drm_r128_private_t *dev_priv = dev->dev_private;
1267	DRM_DEBUG("\n");
1268
1269	LOCK_TEST_WITH_RETURN(dev, file_priv);
1270
1271	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1272
1273	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1274
1275	if (!dev_priv->page_flipping)
1276		r128_do_init_pageflip(dev);
1277
1278	r128_cce_dispatch_flip(dev);
1279
1280	COMMIT_RING();
1281	return 0;
1282}
1283
1284static int r128_cce_swap(struct drm_device *dev, void *data, struct drm_file *file_priv)
1285{
1286	drm_r128_private_t *dev_priv = dev->dev_private;
1287	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
1288	DRM_DEBUG("\n");
1289
1290	LOCK_TEST_WITH_RETURN(dev, file_priv);
1291
1292	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1293
1294	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1295
1296	if (sarea_priv->nbox > R128_NR_SAREA_CLIPRECTS)
1297		sarea_priv->nbox = R128_NR_SAREA_CLIPRECTS;
1298
1299	r128_cce_dispatch_swap(dev);
1300	dev_priv->sarea_priv->dirty |= (R128_UPLOAD_CONTEXT |
1301					R128_UPLOAD_MASKS);
1302
1303	COMMIT_RING();
1304	return 0;
1305}
1306
1307static int r128_cce_vertex(struct drm_device *dev, void *data, struct drm_file *file_priv)
1308{
1309	drm_r128_private_t *dev_priv = dev->dev_private;
1310	struct drm_device_dma *dma = dev->dma;
1311	struct drm_buf *buf;
1312	drm_r128_buf_priv_t *buf_priv;
1313	drm_r128_vertex_t *vertex = data;
1314
1315	LOCK_TEST_WITH_RETURN(dev, file_priv);
1316
1317	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1318
1319	DRM_DEBUG("pid=%d index=%d count=%d discard=%d\n",
1320		  DRM_CURRENTPID, vertex->idx, vertex->count, vertex->discard);
1321
1322	if (vertex->idx < 0 || vertex->idx >= dma->buf_count) {
1323		DRM_ERROR("buffer index %d (of %d max)\n",
1324			  vertex->idx, dma->buf_count - 1);
1325		return -EINVAL;
1326	}
1327	if (vertex->prim < 0 ||
1328	    vertex->prim > R128_CCE_VC_CNTL_PRIM_TYPE_TRI_TYPE2) {
1329		DRM_ERROR("buffer prim %d\n", vertex->prim);
1330		return -EINVAL;
1331	}
1332
1333	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1334	VB_AGE_TEST_WITH_RETURN(dev_priv);
1335
1336	buf = dma->buflist[vertex->idx];
1337	buf_priv = buf->dev_private;
1338
1339	if (buf->file_priv != file_priv) {
1340		DRM_ERROR("process %d using buffer owned by %p\n",
1341			  DRM_CURRENTPID, buf->file_priv);
1342		return -EINVAL;
1343	}
1344	if (buf->pending) {
1345		DRM_ERROR("sending pending buffer %d\n", vertex->idx);
1346		return -EINVAL;
1347	}
1348
1349	buf->used = vertex->count;
1350	buf_priv->prim = vertex->prim;
1351	buf_priv->discard = vertex->discard;
1352
1353	r128_cce_dispatch_vertex(dev, buf);
1354
1355	COMMIT_RING();
1356	return 0;
1357}
1358
1359static int r128_cce_indices(struct drm_device *dev, void *data, struct drm_file *file_priv)
1360{
1361	drm_r128_private_t *dev_priv = dev->dev_private;
1362	struct drm_device_dma *dma = dev->dma;
1363	struct drm_buf *buf;
1364	drm_r128_buf_priv_t *buf_priv;
1365	drm_r128_indices_t *elts = data;
1366	int count;
1367
1368	LOCK_TEST_WITH_RETURN(dev, file_priv);
1369
1370	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1371
1372	DRM_DEBUG("pid=%d buf=%d s=%d e=%d d=%d\n", DRM_CURRENTPID,
1373		  elts->idx, elts->start, elts->end, elts->discard);
1374
1375	if (elts->idx < 0 || elts->idx >= dma->buf_count) {
1376		DRM_ERROR("buffer index %d (of %d max)\n",
1377			  elts->idx, dma->buf_count - 1);
1378		return -EINVAL;
1379	}
1380	if (elts->prim < 0 ||
1381	    elts->prim > R128_CCE_VC_CNTL_PRIM_TYPE_TRI_TYPE2) {
1382		DRM_ERROR("buffer prim %d\n", elts->prim);
1383		return -EINVAL;
1384	}
1385
1386	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1387	VB_AGE_TEST_WITH_RETURN(dev_priv);
1388
1389	buf = dma->buflist[elts->idx];
1390	buf_priv = buf->dev_private;
1391
1392	if (buf->file_priv != file_priv) {
1393		DRM_ERROR("process %d using buffer owned by %p\n",
1394			  DRM_CURRENTPID, buf->file_priv);
1395		return -EINVAL;
1396	}
1397	if (buf->pending) {
1398		DRM_ERROR("sending pending buffer %d\n", elts->idx);
1399		return -EINVAL;
1400	}
1401
1402	count = (elts->end - elts->start) / sizeof(u16);
1403	elts->start -= R128_INDEX_PRIM_OFFSET;
1404
1405	if (elts->start & 0x7) {
1406		DRM_ERROR("misaligned buffer 0x%x\n", elts->start);
1407		return -EINVAL;
1408	}
1409	if (elts->start < buf->used) {
1410		DRM_ERROR("no header 0x%x - 0x%x\n", elts->start, buf->used);
1411		return -EINVAL;
1412	}
1413
1414	buf->used = elts->end;
1415	buf_priv->prim = elts->prim;
1416	buf_priv->discard = elts->discard;
1417
1418	r128_cce_dispatch_indices(dev, buf, elts->start, elts->end, count);
1419
1420	COMMIT_RING();
1421	return 0;
1422}
1423
1424static int r128_cce_blit(struct drm_device *dev, void *data, struct drm_file *file_priv)
1425{
1426	struct drm_device_dma *dma = dev->dma;
1427	drm_r128_private_t *dev_priv = dev->dev_private;
1428	drm_r128_blit_t *blit = data;
1429	int ret;
1430
1431	LOCK_TEST_WITH_RETURN(dev, file_priv);
1432
1433	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1434
1435	DRM_DEBUG("pid=%d index=%d\n", DRM_CURRENTPID, blit->idx);
1436
1437	if (blit->idx < 0 || blit->idx >= dma->buf_count) {
1438		DRM_ERROR("buffer index %d (of %d max)\n",
1439			  blit->idx, dma->buf_count - 1);
1440		return -EINVAL;
1441	}
1442
1443	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1444	VB_AGE_TEST_WITH_RETURN(dev_priv);
1445
1446	ret = r128_cce_dispatch_blit(dev, file_priv, blit);
1447
1448	COMMIT_RING();
1449	return ret;
1450}
1451
1452int r128_cce_depth(struct drm_device *dev, void *data, struct drm_file *file_priv)
1453{
1454	drm_r128_private_t *dev_priv = dev->dev_private;
1455	drm_r128_depth_t *depth = data;
1456	int ret;
1457
1458	LOCK_TEST_WITH_RETURN(dev, file_priv);
1459
1460	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1461
1462	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1463
1464	ret = -EINVAL;
1465	switch (depth->func) {
1466	case R128_WRITE_SPAN:
1467		ret = r128_cce_dispatch_write_span(dev, depth);
1468		break;
1469	case R128_WRITE_PIXELS:
1470		ret = r128_cce_dispatch_write_pixels(dev, depth);
1471		break;
1472	case R128_READ_SPAN:
1473		ret = r128_cce_dispatch_read_span(dev, depth);
1474		break;
1475	case R128_READ_PIXELS:
1476		ret = r128_cce_dispatch_read_pixels(dev, depth);
1477		break;
1478	}
1479
1480	COMMIT_RING();
1481	return ret;
1482}
1483
1484int r128_cce_stipple(struct drm_device *dev, void *data, struct drm_file *file_priv)
1485{
1486	drm_r128_private_t *dev_priv = dev->dev_private;
1487	drm_r128_stipple_t *stipple = data;
1488	u32 mask[32];
1489
1490	LOCK_TEST_WITH_RETURN(dev, file_priv);
1491
1492	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1493
1494	if (copy_from_user(&mask, stipple->mask, 32 * sizeof(u32)))
1495		return -EFAULT;
1496
1497	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1498
1499	r128_cce_dispatch_stipple(dev, mask);
1500
1501	COMMIT_RING();
1502	return 0;
1503}
1504
1505static int r128_cce_indirect(struct drm_device *dev, void *data, struct drm_file *file_priv)
1506{
1507	drm_r128_private_t *dev_priv = dev->dev_private;
1508	struct drm_device_dma *dma = dev->dma;
1509	struct drm_buf *buf;
1510	drm_r128_buf_priv_t *buf_priv;
1511	drm_r128_indirect_t *indirect = data;
1512#if 0
1513	RING_LOCALS;
1514#endif
1515
1516	LOCK_TEST_WITH_RETURN(dev, file_priv);
1517
1518	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1519
1520	DRM_DEBUG("idx=%d s=%d e=%d d=%d\n",
1521		  indirect->idx, indirect->start, indirect->end,
1522		  indirect->discard);
1523
1524	if (indirect->idx < 0 || indirect->idx >= dma->buf_count) {
1525		DRM_ERROR("buffer index %d (of %d max)\n",
1526			  indirect->idx, dma->buf_count - 1);
1527		return -EINVAL;
1528	}
1529
1530	buf = dma->buflist[indirect->idx];
1531	buf_priv = buf->dev_private;
1532
1533	if (buf->file_priv != file_priv) {
1534		DRM_ERROR("process %d using buffer owned by %p\n",
1535			  DRM_CURRENTPID, buf->file_priv);
1536		return -EINVAL;
1537	}
1538	if (buf->pending) {
1539		DRM_ERROR("sending pending buffer %d\n", indirect->idx);
1540		return -EINVAL;
1541	}
1542
1543	if (indirect->start < buf->used) {
1544		DRM_ERROR("reusing indirect: start=0x%x actual=0x%x\n",
1545			  indirect->start, buf->used);
1546		return -EINVAL;
1547	}
1548
1549	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1550	VB_AGE_TEST_WITH_RETURN(dev_priv);
1551
1552	buf->used = indirect->end;
1553	buf_priv->discard = indirect->discard;
1554
1555#if 0
1556	/* Wait for the 3D stream to idle before the indirect buffer
1557	 * containing 2D acceleration commands is processed.
1558	 */
1559	BEGIN_RING(2);
1560	RADEON_WAIT_UNTIL_3D_IDLE();
1561	ADVANCE_RING();
1562#endif
1563
1564	/* Dispatch the indirect buffer full of commands from the
1565	 * X server.  This is insecure and is thus only available to
1566	 * privileged clients.
1567	 */
1568	r128_cce_dispatch_indirect(dev, buf, indirect->start, indirect->end);
1569
1570	COMMIT_RING();
1571	return 0;
1572}
1573
1574int r128_getparam(struct drm_device *dev, void *data, struct drm_file *file_priv)
1575{
1576	drm_r128_private_t *dev_priv = dev->dev_private;
1577	drm_r128_getparam_t *param = data;
1578	int value;
1579
1580	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1581
1582	DRM_DEBUG("pid=%d\n", DRM_CURRENTPID);
1583
1584	switch (param->param) {
1585	case R128_PARAM_IRQ_NR:
1586		value = dev->pdev->irq;
1587		break;
1588	default:
1589		return -EINVAL;
1590	}
1591
1592	if (copy_to_user(param->value, &value, sizeof(int))) {
1593		DRM_ERROR("copy_to_user\n");
1594		return -EFAULT;
1595	}
1596
1597	return 0;
1598}
1599
1600void r128_driver_preclose(struct drm_device *dev, struct drm_file *file_priv)
1601{
1602	if (dev->dev_private) {
1603		drm_r128_private_t *dev_priv = dev->dev_private;
1604		if (dev_priv->page_flipping)
1605			r128_do_cleanup_pageflip(dev);
1606	}
1607}
1608void r128_driver_lastclose(struct drm_device *dev)
1609{
1610	r128_do_cleanup_cce(dev);
1611}
1612
1613const struct drm_ioctl_desc r128_ioctls[] = {
1614	DRM_IOCTL_DEF_DRV(R128_INIT, r128_cce_init, DRM_AUTH|DRM_MASTER|DRM_ROOT_ONLY),
1615	DRM_IOCTL_DEF_DRV(R128_CCE_START, r128_cce_start, DRM_AUTH|DRM_MASTER|DRM_ROOT_ONLY),
1616	DRM_IOCTL_DEF_DRV(R128_CCE_STOP, r128_cce_stop, DRM_AUTH|DRM_MASTER|DRM_ROOT_ONLY),
1617	DRM_IOCTL_DEF_DRV(R128_CCE_RESET, r128_cce_reset, DRM_AUTH|DRM_MASTER|DRM_ROOT_ONLY),
1618	DRM_IOCTL_DEF_DRV(R128_CCE_IDLE, r128_cce_idle, DRM_AUTH),
1619	DRM_IOCTL_DEF_DRV(R128_RESET, r128_engine_reset, DRM_AUTH),
1620	DRM_IOCTL_DEF_DRV(R128_FULLSCREEN, r128_fullscreen, DRM_AUTH),
1621	DRM_IOCTL_DEF_DRV(R128_SWAP, r128_cce_swap, DRM_AUTH),
1622	DRM_IOCTL_DEF_DRV(R128_FLIP, r128_cce_flip, DRM_AUTH),
1623	DRM_IOCTL_DEF_DRV(R128_CLEAR, r128_cce_clear, DRM_AUTH),
1624	DRM_IOCTL_DEF_DRV(R128_VERTEX, r128_cce_vertex, DRM_AUTH),
1625	DRM_IOCTL_DEF_DRV(R128_INDICES, r128_cce_indices, DRM_AUTH),
1626	DRM_IOCTL_DEF_DRV(R128_BLIT, r128_cce_blit, DRM_AUTH),
1627	DRM_IOCTL_DEF_DRV(R128_DEPTH, r128_cce_depth, DRM_AUTH),
1628	DRM_IOCTL_DEF_DRV(R128_STIPPLE, r128_cce_stipple, DRM_AUTH),
1629	DRM_IOCTL_DEF_DRV(R128_INDIRECT, r128_cce_indirect, DRM_AUTH|DRM_MASTER|DRM_ROOT_ONLY),
1630	DRM_IOCTL_DEF_DRV(R128_GETPARAM, r128_getparam, DRM_AUTH),
1631};
1632
1633int r128_max_ioctl = ARRAY_SIZE(r128_ioctls);