Linux Audio

Check our new training course

Loading...
v4.6
   1/* r128_state.c -- State support for r128 -*- linux-c -*-
   2 * Created: Thu Jan 27 02:53:43 2000 by gareth@valinux.com
   3 */
   4/*
   5 * Copyright 2000 VA Linux Systems, Inc., Sunnyvale, California.
   6 * All Rights Reserved.
   7 *
   8 * Permission is hereby granted, free of charge, to any person obtaining a
   9 * copy of this software and associated documentation files (the "Software"),
  10 * to deal in the Software without restriction, including without limitation
  11 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  12 * and/or sell copies of the Software, and to permit persons to whom the
  13 * Software is furnished to do so, subject to the following conditions:
  14 *
  15 * The above copyright notice and this permission notice (including the next
  16 * paragraph) shall be included in all copies or substantial portions of the
  17 * Software.
  18 *
  19 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  20 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  21 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
  22 * PRECISION INSIGHT AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
  23 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
  24 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
  25 * DEALINGS IN THE SOFTWARE.
  26 *
  27 * Authors:
  28 *    Gareth Hughes <gareth@valinux.com>
  29 */
  30
  31#include <drm/drmP.h>
 
 
 
 
 
 
  32#include <drm/r128_drm.h>
 
  33#include "r128_drv.h"
  34
  35/* ================================================================
  36 * CCE hardware state programming functions
  37 */
  38
  39static void r128_emit_clip_rects(drm_r128_private_t *dev_priv,
  40				 struct drm_clip_rect *boxes, int count)
  41{
  42	u32 aux_sc_cntl = 0x00000000;
  43	RING_LOCALS;
  44	DRM_DEBUG("\n");
  45
  46	BEGIN_RING((count < 3 ? count : 3) * 5 + 2);
  47
  48	if (count >= 1) {
  49		OUT_RING(CCE_PACKET0(R128_AUX1_SC_LEFT, 3));
  50		OUT_RING(boxes[0].x1);
  51		OUT_RING(boxes[0].x2 - 1);
  52		OUT_RING(boxes[0].y1);
  53		OUT_RING(boxes[0].y2 - 1);
  54
  55		aux_sc_cntl |= (R128_AUX1_SC_EN | R128_AUX1_SC_MODE_OR);
  56	}
  57	if (count >= 2) {
  58		OUT_RING(CCE_PACKET0(R128_AUX2_SC_LEFT, 3));
  59		OUT_RING(boxes[1].x1);
  60		OUT_RING(boxes[1].x2 - 1);
  61		OUT_RING(boxes[1].y1);
  62		OUT_RING(boxes[1].y2 - 1);
  63
  64		aux_sc_cntl |= (R128_AUX2_SC_EN | R128_AUX2_SC_MODE_OR);
  65	}
  66	if (count >= 3) {
  67		OUT_RING(CCE_PACKET0(R128_AUX3_SC_LEFT, 3));
  68		OUT_RING(boxes[2].x1);
  69		OUT_RING(boxes[2].x2 - 1);
  70		OUT_RING(boxes[2].y1);
  71		OUT_RING(boxes[2].y2 - 1);
  72
  73		aux_sc_cntl |= (R128_AUX3_SC_EN | R128_AUX3_SC_MODE_OR);
  74	}
  75
  76	OUT_RING(CCE_PACKET0(R128_AUX_SC_CNTL, 0));
  77	OUT_RING(aux_sc_cntl);
  78
  79	ADVANCE_RING();
  80}
  81
  82static __inline__ void r128_emit_core(drm_r128_private_t *dev_priv)
  83{
  84	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
  85	drm_r128_context_regs_t *ctx = &sarea_priv->context_state;
  86	RING_LOCALS;
  87	DRM_DEBUG("\n");
  88
  89	BEGIN_RING(2);
  90
  91	OUT_RING(CCE_PACKET0(R128_SCALE_3D_CNTL, 0));
  92	OUT_RING(ctx->scale_3d_cntl);
  93
  94	ADVANCE_RING();
  95}
  96
  97static __inline__ void r128_emit_context(drm_r128_private_t *dev_priv)
  98{
  99	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
 100	drm_r128_context_regs_t *ctx = &sarea_priv->context_state;
 101	RING_LOCALS;
 102	DRM_DEBUG("\n");
 103
 104	BEGIN_RING(13);
 105
 106	OUT_RING(CCE_PACKET0(R128_DST_PITCH_OFFSET_C, 11));
 107	OUT_RING(ctx->dst_pitch_offset_c);
 108	OUT_RING(ctx->dp_gui_master_cntl_c);
 109	OUT_RING(ctx->sc_top_left_c);
 110	OUT_RING(ctx->sc_bottom_right_c);
 111	OUT_RING(ctx->z_offset_c);
 112	OUT_RING(ctx->z_pitch_c);
 113	OUT_RING(ctx->z_sten_cntl_c);
 114	OUT_RING(ctx->tex_cntl_c);
 115	OUT_RING(ctx->misc_3d_state_cntl_reg);
 116	OUT_RING(ctx->texture_clr_cmp_clr_c);
 117	OUT_RING(ctx->texture_clr_cmp_msk_c);
 118	OUT_RING(ctx->fog_color_c);
 119
 120	ADVANCE_RING();
 121}
 122
 123static __inline__ void r128_emit_setup(drm_r128_private_t *dev_priv)
 124{
 125	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
 126	drm_r128_context_regs_t *ctx = &sarea_priv->context_state;
 127	RING_LOCALS;
 128	DRM_DEBUG("\n");
 129
 130	BEGIN_RING(3);
 131
 132	OUT_RING(CCE_PACKET1(R128_SETUP_CNTL, R128_PM4_VC_FPU_SETUP));
 133	OUT_RING(ctx->setup_cntl);
 134	OUT_RING(ctx->pm4_vc_fpu_setup);
 135
 136	ADVANCE_RING();
 137}
 138
 139static __inline__ void r128_emit_masks(drm_r128_private_t *dev_priv)
 140{
 141	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
 142	drm_r128_context_regs_t *ctx = &sarea_priv->context_state;
 143	RING_LOCALS;
 144	DRM_DEBUG("\n");
 145
 146	BEGIN_RING(5);
 147
 148	OUT_RING(CCE_PACKET0(R128_DP_WRITE_MASK, 0));
 149	OUT_RING(ctx->dp_write_mask);
 150
 151	OUT_RING(CCE_PACKET0(R128_STEN_REF_MASK_C, 1));
 152	OUT_RING(ctx->sten_ref_mask_c);
 153	OUT_RING(ctx->plane_3d_mask_c);
 154
 155	ADVANCE_RING();
 156}
 157
 158static __inline__ void r128_emit_window(drm_r128_private_t *dev_priv)
 159{
 160	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
 161	drm_r128_context_regs_t *ctx = &sarea_priv->context_state;
 162	RING_LOCALS;
 163	DRM_DEBUG("\n");
 164
 165	BEGIN_RING(2);
 166
 167	OUT_RING(CCE_PACKET0(R128_WINDOW_XY_OFFSET, 0));
 168	OUT_RING(ctx->window_xy_offset);
 169
 170	ADVANCE_RING();
 171}
 172
 173static __inline__ void r128_emit_tex0(drm_r128_private_t *dev_priv)
 174{
 175	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
 176	drm_r128_context_regs_t *ctx = &sarea_priv->context_state;
 177	drm_r128_texture_regs_t *tex = &sarea_priv->tex_state[0];
 178	int i;
 179	RING_LOCALS;
 180	DRM_DEBUG("\n");
 181
 182	BEGIN_RING(7 + R128_MAX_TEXTURE_LEVELS);
 183
 184	OUT_RING(CCE_PACKET0(R128_PRIM_TEX_CNTL_C,
 185			     2 + R128_MAX_TEXTURE_LEVELS));
 186	OUT_RING(tex->tex_cntl);
 187	OUT_RING(tex->tex_combine_cntl);
 188	OUT_RING(ctx->tex_size_pitch_c);
 189	for (i = 0; i < R128_MAX_TEXTURE_LEVELS; i++)
 190		OUT_RING(tex->tex_offset[i]);
 191
 192	OUT_RING(CCE_PACKET0(R128_CONSTANT_COLOR_C, 1));
 193	OUT_RING(ctx->constant_color_c);
 194	OUT_RING(tex->tex_border_color);
 195
 196	ADVANCE_RING();
 197}
 198
 199static __inline__ void r128_emit_tex1(drm_r128_private_t *dev_priv)
 200{
 201	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
 202	drm_r128_texture_regs_t *tex = &sarea_priv->tex_state[1];
 203	int i;
 204	RING_LOCALS;
 205	DRM_DEBUG("\n");
 206
 207	BEGIN_RING(5 + R128_MAX_TEXTURE_LEVELS);
 208
 209	OUT_RING(CCE_PACKET0(R128_SEC_TEX_CNTL_C, 1 + R128_MAX_TEXTURE_LEVELS));
 210	OUT_RING(tex->tex_cntl);
 211	OUT_RING(tex->tex_combine_cntl);
 212	for (i = 0; i < R128_MAX_TEXTURE_LEVELS; i++)
 213		OUT_RING(tex->tex_offset[i]);
 214
 215	OUT_RING(CCE_PACKET0(R128_SEC_TEXTURE_BORDER_COLOR_C, 0));
 216	OUT_RING(tex->tex_border_color);
 217
 218	ADVANCE_RING();
 219}
 220
 221static void r128_emit_state(drm_r128_private_t *dev_priv)
 222{
 223	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
 224	unsigned int dirty = sarea_priv->dirty;
 225
 226	DRM_DEBUG("dirty=0x%08x\n", dirty);
 227
 228	if (dirty & R128_UPLOAD_CORE) {
 229		r128_emit_core(dev_priv);
 230		sarea_priv->dirty &= ~R128_UPLOAD_CORE;
 231	}
 232
 233	if (dirty & R128_UPLOAD_CONTEXT) {
 234		r128_emit_context(dev_priv);
 235		sarea_priv->dirty &= ~R128_UPLOAD_CONTEXT;
 236	}
 237
 238	if (dirty & R128_UPLOAD_SETUP) {
 239		r128_emit_setup(dev_priv);
 240		sarea_priv->dirty &= ~R128_UPLOAD_SETUP;
 241	}
 242
 243	if (dirty & R128_UPLOAD_MASKS) {
 244		r128_emit_masks(dev_priv);
 245		sarea_priv->dirty &= ~R128_UPLOAD_MASKS;
 246	}
 247
 248	if (dirty & R128_UPLOAD_WINDOW) {
 249		r128_emit_window(dev_priv);
 250		sarea_priv->dirty &= ~R128_UPLOAD_WINDOW;
 251	}
 252
 253	if (dirty & R128_UPLOAD_TEX0) {
 254		r128_emit_tex0(dev_priv);
 255		sarea_priv->dirty &= ~R128_UPLOAD_TEX0;
 256	}
 257
 258	if (dirty & R128_UPLOAD_TEX1) {
 259		r128_emit_tex1(dev_priv);
 260		sarea_priv->dirty &= ~R128_UPLOAD_TEX1;
 261	}
 262
 263	/* Turn off the texture cache flushing */
 264	sarea_priv->context_state.tex_cntl_c &= ~R128_TEX_CACHE_FLUSH;
 265
 266	sarea_priv->dirty &= ~R128_REQUIRE_QUIESCENCE;
 267}
 268
 269#if R128_PERFORMANCE_BOXES
 270/* ================================================================
 271 * Performance monitoring functions
 272 */
 273
 274static void r128_clear_box(drm_r128_private_t *dev_priv,
 275			   int x, int y, int w, int h, int r, int g, int b)
 276{
 277	u32 pitch, offset;
 278	u32 fb_bpp, color;
 279	RING_LOCALS;
 280
 281	switch (dev_priv->fb_bpp) {
 282	case 16:
 283		fb_bpp = R128_GMC_DST_16BPP;
 284		color = (((r & 0xf8) << 8) |
 285			 ((g & 0xfc) << 3) | ((b & 0xf8) >> 3));
 286		break;
 287	case 24:
 288		fb_bpp = R128_GMC_DST_24BPP;
 289		color = ((r << 16) | (g << 8) | b);
 290		break;
 291	case 32:
 292		fb_bpp = R128_GMC_DST_32BPP;
 293		color = (((0xff) << 24) | (r << 16) | (g << 8) | b);
 294		break;
 295	default:
 296		return;
 297	}
 298
 299	offset = dev_priv->back_offset;
 300	pitch = dev_priv->back_pitch >> 3;
 301
 302	BEGIN_RING(6);
 303
 304	OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
 305	OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
 306		 R128_GMC_BRUSH_SOLID_COLOR |
 307		 fb_bpp |
 308		 R128_GMC_SRC_DATATYPE_COLOR |
 309		 R128_ROP3_P |
 310		 R128_GMC_CLR_CMP_CNTL_DIS | R128_GMC_AUX_CLIP_DIS);
 311
 312	OUT_RING((pitch << 21) | (offset >> 5));
 313	OUT_RING(color);
 314
 315	OUT_RING((x << 16) | y);
 316	OUT_RING((w << 16) | h);
 317
 318	ADVANCE_RING();
 319}
 320
 321static void r128_cce_performance_boxes(drm_r128_private_t *dev_priv)
 322{
 323	if (atomic_read(&dev_priv->idle_count) == 0)
 324		r128_clear_box(dev_priv, 64, 4, 8, 8, 0, 255, 0);
 325	else
 326		atomic_set(&dev_priv->idle_count, 0);
 327}
 328
 329#endif
 330
 331/* ================================================================
 332 * CCE command dispatch functions
 333 */
 334
 335static void r128_print_dirty(const char *msg, unsigned int flags)
 336{
 337	DRM_INFO("%s: (0x%x) %s%s%s%s%s%s%s%s%s\n",
 338		 msg,
 339		 flags,
 340		 (flags & R128_UPLOAD_CORE) ? "core, " : "",
 341		 (flags & R128_UPLOAD_CONTEXT) ? "context, " : "",
 342		 (flags & R128_UPLOAD_SETUP) ? "setup, " : "",
 343		 (flags & R128_UPLOAD_TEX0) ? "tex0, " : "",
 344		 (flags & R128_UPLOAD_TEX1) ? "tex1, " : "",
 345		 (flags & R128_UPLOAD_MASKS) ? "masks, " : "",
 346		 (flags & R128_UPLOAD_WINDOW) ? "window, " : "",
 347		 (flags & R128_UPLOAD_CLIPRECTS) ? "cliprects, " : "",
 348		 (flags & R128_REQUIRE_QUIESCENCE) ? "quiescence, " : "");
 349}
 350
 351static void r128_cce_dispatch_clear(struct drm_device *dev,
 352				    drm_r128_clear_t *clear)
 353{
 354	drm_r128_private_t *dev_priv = dev->dev_private;
 355	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
 356	int nbox = sarea_priv->nbox;
 357	struct drm_clip_rect *pbox = sarea_priv->boxes;
 358	unsigned int flags = clear->flags;
 359	int i;
 360	RING_LOCALS;
 361	DRM_DEBUG("\n");
 362
 363	if (dev_priv->page_flipping && dev_priv->current_page == 1) {
 364		unsigned int tmp = flags;
 365
 366		flags &= ~(R128_FRONT | R128_BACK);
 367		if (tmp & R128_FRONT)
 368			flags |= R128_BACK;
 369		if (tmp & R128_BACK)
 370			flags |= R128_FRONT;
 371	}
 372
 373	for (i = 0; i < nbox; i++) {
 374		int x = pbox[i].x1;
 375		int y = pbox[i].y1;
 376		int w = pbox[i].x2 - x;
 377		int h = pbox[i].y2 - y;
 378
 379		DRM_DEBUG("dispatch clear %d,%d-%d,%d flags 0x%x\n",
 380			  pbox[i].x1, pbox[i].y1, pbox[i].x2,
 381			  pbox[i].y2, flags);
 382
 383		if (flags & (R128_FRONT | R128_BACK)) {
 384			BEGIN_RING(2);
 385
 386			OUT_RING(CCE_PACKET0(R128_DP_WRITE_MASK, 0));
 387			OUT_RING(clear->color_mask);
 388
 389			ADVANCE_RING();
 390		}
 391
 392		if (flags & R128_FRONT) {
 393			BEGIN_RING(6);
 394
 395			OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
 396			OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
 397				 R128_GMC_BRUSH_SOLID_COLOR |
 398				 (dev_priv->color_fmt << 8) |
 399				 R128_GMC_SRC_DATATYPE_COLOR |
 400				 R128_ROP3_P |
 401				 R128_GMC_CLR_CMP_CNTL_DIS |
 402				 R128_GMC_AUX_CLIP_DIS);
 403
 404			OUT_RING(dev_priv->front_pitch_offset_c);
 405			OUT_RING(clear->clear_color);
 406
 407			OUT_RING((x << 16) | y);
 408			OUT_RING((w << 16) | h);
 409
 410			ADVANCE_RING();
 411		}
 412
 413		if (flags & R128_BACK) {
 414			BEGIN_RING(6);
 415
 416			OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
 417			OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
 418				 R128_GMC_BRUSH_SOLID_COLOR |
 419				 (dev_priv->color_fmt << 8) |
 420				 R128_GMC_SRC_DATATYPE_COLOR |
 421				 R128_ROP3_P |
 422				 R128_GMC_CLR_CMP_CNTL_DIS |
 423				 R128_GMC_AUX_CLIP_DIS);
 424
 425			OUT_RING(dev_priv->back_pitch_offset_c);
 426			OUT_RING(clear->clear_color);
 427
 428			OUT_RING((x << 16) | y);
 429			OUT_RING((w << 16) | h);
 430
 431			ADVANCE_RING();
 432		}
 433
 434		if (flags & R128_DEPTH) {
 435			BEGIN_RING(6);
 436
 437			OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
 438			OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
 439				 R128_GMC_BRUSH_SOLID_COLOR |
 440				 (dev_priv->depth_fmt << 8) |
 441				 R128_GMC_SRC_DATATYPE_COLOR |
 442				 R128_ROP3_P |
 443				 R128_GMC_CLR_CMP_CNTL_DIS |
 444				 R128_GMC_AUX_CLIP_DIS | R128_GMC_WR_MSK_DIS);
 445
 446			OUT_RING(dev_priv->depth_pitch_offset_c);
 447			OUT_RING(clear->clear_depth);
 448
 449			OUT_RING((x << 16) | y);
 450			OUT_RING((w << 16) | h);
 451
 452			ADVANCE_RING();
 453		}
 454	}
 455}
 456
 457static void r128_cce_dispatch_swap(struct drm_device *dev)
 458{
 459	drm_r128_private_t *dev_priv = dev->dev_private;
 460	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
 461	int nbox = sarea_priv->nbox;
 462	struct drm_clip_rect *pbox = sarea_priv->boxes;
 463	int i;
 464	RING_LOCALS;
 465	DRM_DEBUG("\n");
 466
 467#if R128_PERFORMANCE_BOXES
 468	/* Do some trivial performance monitoring...
 469	 */
 470	r128_cce_performance_boxes(dev_priv);
 471#endif
 472
 473	for (i = 0; i < nbox; i++) {
 474		int x = pbox[i].x1;
 475		int y = pbox[i].y1;
 476		int w = pbox[i].x2 - x;
 477		int h = pbox[i].y2 - y;
 478
 479		BEGIN_RING(7);
 480
 481		OUT_RING(CCE_PACKET3(R128_CNTL_BITBLT_MULTI, 5));
 482		OUT_RING(R128_GMC_SRC_PITCH_OFFSET_CNTL |
 483			 R128_GMC_DST_PITCH_OFFSET_CNTL |
 484			 R128_GMC_BRUSH_NONE |
 485			 (dev_priv->color_fmt << 8) |
 486			 R128_GMC_SRC_DATATYPE_COLOR |
 487			 R128_ROP3_S |
 488			 R128_DP_SRC_SOURCE_MEMORY |
 489			 R128_GMC_CLR_CMP_CNTL_DIS |
 490			 R128_GMC_AUX_CLIP_DIS | R128_GMC_WR_MSK_DIS);
 491
 492		/* Make this work even if front & back are flipped:
 493		 */
 494		if (dev_priv->current_page == 0) {
 495			OUT_RING(dev_priv->back_pitch_offset_c);
 496			OUT_RING(dev_priv->front_pitch_offset_c);
 497		} else {
 498			OUT_RING(dev_priv->front_pitch_offset_c);
 499			OUT_RING(dev_priv->back_pitch_offset_c);
 500		}
 501
 502		OUT_RING((x << 16) | y);
 503		OUT_RING((x << 16) | y);
 504		OUT_RING((w << 16) | h);
 505
 506		ADVANCE_RING();
 507	}
 508
 509	/* Increment the frame counter.  The client-side 3D driver must
 510	 * throttle the framerate by waiting for this value before
 511	 * performing the swapbuffer ioctl.
 512	 */
 513	dev_priv->sarea_priv->last_frame++;
 514
 515	BEGIN_RING(2);
 516
 517	OUT_RING(CCE_PACKET0(R128_LAST_FRAME_REG, 0));
 518	OUT_RING(dev_priv->sarea_priv->last_frame);
 519
 520	ADVANCE_RING();
 521}
 522
 523static void r128_cce_dispatch_flip(struct drm_device *dev)
 524{
 525	drm_r128_private_t *dev_priv = dev->dev_private;
 526	RING_LOCALS;
 527	DRM_DEBUG("page=%d pfCurrentPage=%d\n",
 528		  dev_priv->current_page, dev_priv->sarea_priv->pfCurrentPage);
 529
 530#if R128_PERFORMANCE_BOXES
 531	/* Do some trivial performance monitoring...
 532	 */
 533	r128_cce_performance_boxes(dev_priv);
 534#endif
 535
 536	BEGIN_RING(4);
 537
 538	R128_WAIT_UNTIL_PAGE_FLIPPED();
 539	OUT_RING(CCE_PACKET0(R128_CRTC_OFFSET, 0));
 540
 541	if (dev_priv->current_page == 0)
 542		OUT_RING(dev_priv->back_offset);
 543	else
 544		OUT_RING(dev_priv->front_offset);
 545
 546	ADVANCE_RING();
 547
 548	/* Increment the frame counter.  The client-side 3D driver must
 549	 * throttle the framerate by waiting for this value before
 550	 * performing the swapbuffer ioctl.
 551	 */
 552	dev_priv->sarea_priv->last_frame++;
 553	dev_priv->sarea_priv->pfCurrentPage = dev_priv->current_page =
 554	    1 - dev_priv->current_page;
 555
 556	BEGIN_RING(2);
 557
 558	OUT_RING(CCE_PACKET0(R128_LAST_FRAME_REG, 0));
 559	OUT_RING(dev_priv->sarea_priv->last_frame);
 560
 561	ADVANCE_RING();
 562}
 563
 564static void r128_cce_dispatch_vertex(struct drm_device *dev, struct drm_buf *buf)
 565{
 566	drm_r128_private_t *dev_priv = dev->dev_private;
 567	drm_r128_buf_priv_t *buf_priv = buf->dev_private;
 568	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
 569	int format = sarea_priv->vc_format;
 570	int offset = buf->bus_address;
 571	int size = buf->used;
 572	int prim = buf_priv->prim;
 573	int i = 0;
 574	RING_LOCALS;
 575	DRM_DEBUG("buf=%d nbox=%d\n", buf->idx, sarea_priv->nbox);
 576
 577	if (0)
 578		r128_print_dirty("dispatch_vertex", sarea_priv->dirty);
 579
 580	if (buf->used) {
 581		buf_priv->dispatched = 1;
 582
 583		if (sarea_priv->dirty & ~R128_UPLOAD_CLIPRECTS)
 584			r128_emit_state(dev_priv);
 585
 586		do {
 587			/* Emit the next set of up to three cliprects */
 588			if (i < sarea_priv->nbox) {
 589				r128_emit_clip_rects(dev_priv,
 590						     &sarea_priv->boxes[i],
 591						     sarea_priv->nbox - i);
 592			}
 593
 594			/* Emit the vertex buffer rendering commands */
 595			BEGIN_RING(5);
 596
 597			OUT_RING(CCE_PACKET3(R128_3D_RNDR_GEN_INDX_PRIM, 3));
 598			OUT_RING(offset);
 599			OUT_RING(size);
 600			OUT_RING(format);
 601			OUT_RING(prim | R128_CCE_VC_CNTL_PRIM_WALK_LIST |
 602				 (size << R128_CCE_VC_CNTL_NUM_SHIFT));
 603
 604			ADVANCE_RING();
 605
 606			i += 3;
 607		} while (i < sarea_priv->nbox);
 608	}
 609
 610	if (buf_priv->discard) {
 611		buf_priv->age = dev_priv->sarea_priv->last_dispatch;
 612
 613		/* Emit the vertex buffer age */
 614		BEGIN_RING(2);
 615
 616		OUT_RING(CCE_PACKET0(R128_LAST_DISPATCH_REG, 0));
 617		OUT_RING(buf_priv->age);
 618
 619		ADVANCE_RING();
 620
 621		buf->pending = 1;
 622		buf->used = 0;
 623		/* FIXME: Check dispatched field */
 624		buf_priv->dispatched = 0;
 625	}
 626
 627	dev_priv->sarea_priv->last_dispatch++;
 628
 629	sarea_priv->dirty &= ~R128_UPLOAD_CLIPRECTS;
 630	sarea_priv->nbox = 0;
 631}
 632
 633static void r128_cce_dispatch_indirect(struct drm_device *dev,
 634				       struct drm_buf *buf, int start, int end)
 635{
 636	drm_r128_private_t *dev_priv = dev->dev_private;
 637	drm_r128_buf_priv_t *buf_priv = buf->dev_private;
 638	RING_LOCALS;
 639	DRM_DEBUG("indirect: buf=%d s=0x%x e=0x%x\n", buf->idx, start, end);
 640
 641	if (start != end) {
 642		int offset = buf->bus_address + start;
 643		int dwords = (end - start + 3) / sizeof(u32);
 644
 645		/* Indirect buffer data must be an even number of
 646		 * dwords, so if we've been given an odd number we must
 647		 * pad the data with a Type-2 CCE packet.
 648		 */
 649		if (dwords & 1) {
 650			u32 *data = (u32 *)
 651			    ((char *)dev->agp_buffer_map->handle
 652			     + buf->offset + start);
 653			data[dwords++] = cpu_to_le32(R128_CCE_PACKET2);
 654		}
 655
 656		buf_priv->dispatched = 1;
 657
 658		/* Fire off the indirect buffer */
 659		BEGIN_RING(3);
 660
 661		OUT_RING(CCE_PACKET0(R128_PM4_IW_INDOFF, 1));
 662		OUT_RING(offset);
 663		OUT_RING(dwords);
 664
 665		ADVANCE_RING();
 666	}
 667
 668	if (buf_priv->discard) {
 669		buf_priv->age = dev_priv->sarea_priv->last_dispatch;
 670
 671		/* Emit the indirect buffer age */
 672		BEGIN_RING(2);
 673
 674		OUT_RING(CCE_PACKET0(R128_LAST_DISPATCH_REG, 0));
 675		OUT_RING(buf_priv->age);
 676
 677		ADVANCE_RING();
 678
 679		buf->pending = 1;
 680		buf->used = 0;
 681		/* FIXME: Check dispatched field */
 682		buf_priv->dispatched = 0;
 683	}
 684
 685	dev_priv->sarea_priv->last_dispatch++;
 686}
 687
 688static void r128_cce_dispatch_indices(struct drm_device *dev,
 689				      struct drm_buf *buf,
 690				      int start, int end, int count)
 691{
 692	drm_r128_private_t *dev_priv = dev->dev_private;
 693	drm_r128_buf_priv_t *buf_priv = buf->dev_private;
 694	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
 695	int format = sarea_priv->vc_format;
 696	int offset = dev->agp_buffer_map->offset - dev_priv->cce_buffers_offset;
 697	int prim = buf_priv->prim;
 698	u32 *data;
 699	int dwords;
 700	int i = 0;
 701	RING_LOCALS;
 702	DRM_DEBUG("indices: s=%d e=%d c=%d\n", start, end, count);
 703
 704	if (0)
 705		r128_print_dirty("dispatch_indices", sarea_priv->dirty);
 706
 707	if (start != end) {
 708		buf_priv->dispatched = 1;
 709
 710		if (sarea_priv->dirty & ~R128_UPLOAD_CLIPRECTS)
 711			r128_emit_state(dev_priv);
 712
 713		dwords = (end - start + 3) / sizeof(u32);
 714
 715		data = (u32 *) ((char *)dev->agp_buffer_map->handle
 716				+ buf->offset + start);
 717
 718		data[0] = cpu_to_le32(CCE_PACKET3(R128_3D_RNDR_GEN_INDX_PRIM,
 719						  dwords - 2));
 720
 721		data[1] = cpu_to_le32(offset);
 722		data[2] = cpu_to_le32(R128_MAX_VB_VERTS);
 723		data[3] = cpu_to_le32(format);
 724		data[4] = cpu_to_le32((prim | R128_CCE_VC_CNTL_PRIM_WALK_IND |
 725				       (count << 16)));
 726
 727		if (count & 0x1) {
 728#ifdef __LITTLE_ENDIAN
 729			data[dwords - 1] &= 0x0000ffff;
 730#else
 731			data[dwords - 1] &= 0xffff0000;
 732#endif
 733		}
 734
 735		do {
 736			/* Emit the next set of up to three cliprects */
 737			if (i < sarea_priv->nbox) {
 738				r128_emit_clip_rects(dev_priv,
 739						     &sarea_priv->boxes[i],
 740						     sarea_priv->nbox - i);
 741			}
 742
 743			r128_cce_dispatch_indirect(dev, buf, start, end);
 744
 745			i += 3;
 746		} while (i < sarea_priv->nbox);
 747	}
 748
 749	if (buf_priv->discard) {
 750		buf_priv->age = dev_priv->sarea_priv->last_dispatch;
 751
 752		/* Emit the vertex buffer age */
 753		BEGIN_RING(2);
 754
 755		OUT_RING(CCE_PACKET0(R128_LAST_DISPATCH_REG, 0));
 756		OUT_RING(buf_priv->age);
 757
 758		ADVANCE_RING();
 759
 760		buf->pending = 1;
 761		/* FIXME: Check dispatched field */
 762		buf_priv->dispatched = 0;
 763	}
 764
 765	dev_priv->sarea_priv->last_dispatch++;
 766
 767	sarea_priv->dirty &= ~R128_UPLOAD_CLIPRECTS;
 768	sarea_priv->nbox = 0;
 769}
 770
 771static int r128_cce_dispatch_blit(struct drm_device *dev,
 772				  struct drm_file *file_priv,
 773				  drm_r128_blit_t *blit)
 774{
 775	drm_r128_private_t *dev_priv = dev->dev_private;
 776	struct drm_device_dma *dma = dev->dma;
 777	struct drm_buf *buf;
 778	drm_r128_buf_priv_t *buf_priv;
 779	u32 *data;
 780	int dword_shift, dwords;
 781	RING_LOCALS;
 782	DRM_DEBUG("\n");
 783
 784	/* The compiler won't optimize away a division by a variable,
 785	 * even if the only legal values are powers of two.  Thus, we'll
 786	 * use a shift instead.
 787	 */
 788	switch (blit->format) {
 789	case R128_DATATYPE_ARGB8888:
 790		dword_shift = 0;
 791		break;
 792	case R128_DATATYPE_ARGB1555:
 793	case R128_DATATYPE_RGB565:
 794	case R128_DATATYPE_ARGB4444:
 795	case R128_DATATYPE_YVYU422:
 796	case R128_DATATYPE_VYUY422:
 797		dword_shift = 1;
 798		break;
 799	case R128_DATATYPE_CI8:
 800	case R128_DATATYPE_RGB8:
 801		dword_shift = 2;
 802		break;
 803	default:
 804		DRM_ERROR("invalid blit format %d\n", blit->format);
 805		return -EINVAL;
 806	}
 807
 808	/* Flush the pixel cache, and mark the contents as Read Invalid.
 809	 * This ensures no pixel data gets mixed up with the texture
 810	 * data from the host data blit, otherwise part of the texture
 811	 * image may be corrupted.
 812	 */
 813	BEGIN_RING(2);
 814
 815	OUT_RING(CCE_PACKET0(R128_PC_GUI_CTLSTAT, 0));
 816	OUT_RING(R128_PC_RI_GUI | R128_PC_FLUSH_GUI);
 817
 818	ADVANCE_RING();
 819
 820	/* Dispatch the indirect buffer.
 821	 */
 822	buf = dma->buflist[blit->idx];
 823	buf_priv = buf->dev_private;
 824
 825	if (buf->file_priv != file_priv) {
 826		DRM_ERROR("process %d using buffer owned by %p\n",
 827			  DRM_CURRENTPID, buf->file_priv);
 828		return -EINVAL;
 829	}
 830	if (buf->pending) {
 831		DRM_ERROR("sending pending buffer %d\n", blit->idx);
 832		return -EINVAL;
 833	}
 834
 835	buf_priv->discard = 1;
 836
 837	dwords = (blit->width * blit->height) >> dword_shift;
 838
 839	data = (u32 *) ((char *)dev->agp_buffer_map->handle + buf->offset);
 840
 841	data[0] = cpu_to_le32(CCE_PACKET3(R128_CNTL_HOSTDATA_BLT, dwords + 6));
 842	data[1] = cpu_to_le32((R128_GMC_DST_PITCH_OFFSET_CNTL |
 843			       R128_GMC_BRUSH_NONE |
 844			       (blit->format << 8) |
 845			       R128_GMC_SRC_DATATYPE_COLOR |
 846			       R128_ROP3_S |
 847			       R128_DP_SRC_SOURCE_HOST_DATA |
 848			       R128_GMC_CLR_CMP_CNTL_DIS |
 849			       R128_GMC_AUX_CLIP_DIS | R128_GMC_WR_MSK_DIS));
 850
 851	data[2] = cpu_to_le32((blit->pitch << 21) | (blit->offset >> 5));
 852	data[3] = cpu_to_le32(0xffffffff);
 853	data[4] = cpu_to_le32(0xffffffff);
 854	data[5] = cpu_to_le32((blit->y << 16) | blit->x);
 855	data[6] = cpu_to_le32((blit->height << 16) | blit->width);
 856	data[7] = cpu_to_le32(dwords);
 857
 858	buf->used = (dwords + 8) * sizeof(u32);
 859
 860	r128_cce_dispatch_indirect(dev, buf, 0, buf->used);
 861
 862	/* Flush the pixel cache after the blit completes.  This ensures
 863	 * the texture data is written out to memory before rendering
 864	 * continues.
 865	 */
 866	BEGIN_RING(2);
 867
 868	OUT_RING(CCE_PACKET0(R128_PC_GUI_CTLSTAT, 0));
 869	OUT_RING(R128_PC_FLUSH_GUI);
 870
 871	ADVANCE_RING();
 872
 873	return 0;
 874}
 875
 876/* ================================================================
 877 * Tiled depth buffer management
 878 *
 879 * FIXME: These should all set the destination write mask for when we
 880 * have hardware stencil support.
 881 */
 882
 883static int r128_cce_dispatch_write_span(struct drm_device *dev,
 884					drm_r128_depth_t *depth)
 885{
 886	drm_r128_private_t *dev_priv = dev->dev_private;
 887	int count, x, y;
 888	u32 *buffer;
 889	u8 *mask;
 890	int i, buffer_size, mask_size;
 891	RING_LOCALS;
 892	DRM_DEBUG("\n");
 893
 894	count = depth->n;
 895	if (count > 4096 || count <= 0)
 896		return -EMSGSIZE;
 897
 898	if (copy_from_user(&x, depth->x, sizeof(x)))
 899		return -EFAULT;
 900	if (copy_from_user(&y, depth->y, sizeof(y)))
 901		return -EFAULT;
 902
 903	buffer_size = depth->n * sizeof(u32);
 904	buffer = memdup_user(depth->buffer, buffer_size);
 905	if (IS_ERR(buffer))
 906		return PTR_ERR(buffer);
 907
 908	mask_size = depth->n;
 909	if (depth->mask) {
 910		mask = memdup_user(depth->mask, mask_size);
 911		if (IS_ERR(mask)) {
 912			kfree(buffer);
 913			return PTR_ERR(mask);
 914		}
 915
 916		for (i = 0; i < count; i++, x++) {
 917			if (mask[i]) {
 918				BEGIN_RING(6);
 919
 920				OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
 921				OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
 922					 R128_GMC_BRUSH_SOLID_COLOR |
 923					 (dev_priv->depth_fmt << 8) |
 924					 R128_GMC_SRC_DATATYPE_COLOR |
 925					 R128_ROP3_P |
 926					 R128_GMC_CLR_CMP_CNTL_DIS |
 927					 R128_GMC_WR_MSK_DIS);
 928
 929				OUT_RING(dev_priv->depth_pitch_offset_c);
 930				OUT_RING(buffer[i]);
 931
 932				OUT_RING((x << 16) | y);
 933				OUT_RING((1 << 16) | 1);
 934
 935				ADVANCE_RING();
 936			}
 937		}
 938
 939		kfree(mask);
 940	} else {
 941		for (i = 0; i < count; i++, x++) {
 942			BEGIN_RING(6);
 943
 944			OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
 945			OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
 946				 R128_GMC_BRUSH_SOLID_COLOR |
 947				 (dev_priv->depth_fmt << 8) |
 948				 R128_GMC_SRC_DATATYPE_COLOR |
 949				 R128_ROP3_P |
 950				 R128_GMC_CLR_CMP_CNTL_DIS |
 951				 R128_GMC_WR_MSK_DIS);
 952
 953			OUT_RING(dev_priv->depth_pitch_offset_c);
 954			OUT_RING(buffer[i]);
 955
 956			OUT_RING((x << 16) | y);
 957			OUT_RING((1 << 16) | 1);
 958
 959			ADVANCE_RING();
 960		}
 961	}
 962
 963	kfree(buffer);
 964
 965	return 0;
 966}
 967
 968static int r128_cce_dispatch_write_pixels(struct drm_device *dev,
 969					  drm_r128_depth_t *depth)
 970{
 971	drm_r128_private_t *dev_priv = dev->dev_private;
 972	int count, *x, *y;
 973	u32 *buffer;
 974	u8 *mask;
 975	int i, xbuf_size, ybuf_size, buffer_size, mask_size;
 976	RING_LOCALS;
 977	DRM_DEBUG("\n");
 978
 979	count = depth->n;
 980	if (count > 4096 || count <= 0)
 981		return -EMSGSIZE;
 982
 983	xbuf_size = count * sizeof(*x);
 984	ybuf_size = count * sizeof(*y);
 985	x = kmalloc(xbuf_size, GFP_KERNEL);
 986	if (x == NULL)
 987		return -ENOMEM;
 988	y = kmalloc(ybuf_size, GFP_KERNEL);
 989	if (y == NULL) {
 990		kfree(x);
 991		return -ENOMEM;
 992	}
 993	if (copy_from_user(x, depth->x, xbuf_size)) {
 994		kfree(x);
 995		kfree(y);
 996		return -EFAULT;
 997	}
 998	if (copy_from_user(y, depth->y, xbuf_size)) {
 999		kfree(x);
1000		kfree(y);
1001		return -EFAULT;
1002	}
1003
1004	buffer_size = depth->n * sizeof(u32);
1005	buffer = memdup_user(depth->buffer, buffer_size);
1006	if (IS_ERR(buffer)) {
1007		kfree(x);
1008		kfree(y);
1009		return PTR_ERR(buffer);
1010	}
1011
1012	if (depth->mask) {
1013		mask_size = depth->n;
1014		mask = memdup_user(depth->mask, mask_size);
1015		if (IS_ERR(mask)) {
1016			kfree(x);
1017			kfree(y);
1018			kfree(buffer);
1019			return PTR_ERR(mask);
1020		}
1021
1022		for (i = 0; i < count; i++) {
1023			if (mask[i]) {
1024				BEGIN_RING(6);
1025
1026				OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
1027				OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
1028					 R128_GMC_BRUSH_SOLID_COLOR |
1029					 (dev_priv->depth_fmt << 8) |
1030					 R128_GMC_SRC_DATATYPE_COLOR |
1031					 R128_ROP3_P |
1032					 R128_GMC_CLR_CMP_CNTL_DIS |
1033					 R128_GMC_WR_MSK_DIS);
1034
1035				OUT_RING(dev_priv->depth_pitch_offset_c);
1036				OUT_RING(buffer[i]);
1037
1038				OUT_RING((x[i] << 16) | y[i]);
1039				OUT_RING((1 << 16) | 1);
1040
1041				ADVANCE_RING();
1042			}
1043		}
1044
1045		kfree(mask);
1046	} else {
1047		for (i = 0; i < count; i++) {
1048			BEGIN_RING(6);
1049
1050			OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
1051			OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
1052				 R128_GMC_BRUSH_SOLID_COLOR |
1053				 (dev_priv->depth_fmt << 8) |
1054				 R128_GMC_SRC_DATATYPE_COLOR |
1055				 R128_ROP3_P |
1056				 R128_GMC_CLR_CMP_CNTL_DIS |
1057				 R128_GMC_WR_MSK_DIS);
1058
1059			OUT_RING(dev_priv->depth_pitch_offset_c);
1060			OUT_RING(buffer[i]);
1061
1062			OUT_RING((x[i] << 16) | y[i]);
1063			OUT_RING((1 << 16) | 1);
1064
1065			ADVANCE_RING();
1066		}
1067	}
1068
1069	kfree(x);
1070	kfree(y);
1071	kfree(buffer);
1072
1073	return 0;
1074}
1075
1076static int r128_cce_dispatch_read_span(struct drm_device *dev,
1077				       drm_r128_depth_t *depth)
1078{
1079	drm_r128_private_t *dev_priv = dev->dev_private;
1080	int count, x, y;
1081	RING_LOCALS;
1082	DRM_DEBUG("\n");
1083
1084	count = depth->n;
1085	if (count > 4096 || count <= 0)
1086		return -EMSGSIZE;
1087
1088	if (copy_from_user(&x, depth->x, sizeof(x)))
1089		return -EFAULT;
1090	if (copy_from_user(&y, depth->y, sizeof(y)))
1091		return -EFAULT;
1092
1093	BEGIN_RING(7);
1094
1095	OUT_RING(CCE_PACKET3(R128_CNTL_BITBLT_MULTI, 5));
1096	OUT_RING(R128_GMC_SRC_PITCH_OFFSET_CNTL |
1097		 R128_GMC_DST_PITCH_OFFSET_CNTL |
1098		 R128_GMC_BRUSH_NONE |
1099		 (dev_priv->depth_fmt << 8) |
1100		 R128_GMC_SRC_DATATYPE_COLOR |
1101		 R128_ROP3_S |
1102		 R128_DP_SRC_SOURCE_MEMORY |
1103		 R128_GMC_CLR_CMP_CNTL_DIS | R128_GMC_WR_MSK_DIS);
1104
1105	OUT_RING(dev_priv->depth_pitch_offset_c);
1106	OUT_RING(dev_priv->span_pitch_offset_c);
1107
1108	OUT_RING((x << 16) | y);
1109	OUT_RING((0 << 16) | 0);
1110	OUT_RING((count << 16) | 1);
1111
1112	ADVANCE_RING();
1113
1114	return 0;
1115}
1116
1117static int r128_cce_dispatch_read_pixels(struct drm_device *dev,
1118					 drm_r128_depth_t *depth)
1119{
1120	drm_r128_private_t *dev_priv = dev->dev_private;
1121	int count, *x, *y;
1122	int i, xbuf_size, ybuf_size;
1123	RING_LOCALS;
1124	DRM_DEBUG("\n");
1125
1126	count = depth->n;
1127	if (count > 4096 || count <= 0)
1128		return -EMSGSIZE;
1129
1130	if (count > dev_priv->depth_pitch)
1131		count = dev_priv->depth_pitch;
1132
1133	xbuf_size = count * sizeof(*x);
1134	ybuf_size = count * sizeof(*y);
1135	x = kmalloc(xbuf_size, GFP_KERNEL);
1136	if (x == NULL)
1137		return -ENOMEM;
1138	y = kmalloc(ybuf_size, GFP_KERNEL);
1139	if (y == NULL) {
1140		kfree(x);
1141		return -ENOMEM;
1142	}
1143	if (copy_from_user(x, depth->x, xbuf_size)) {
1144		kfree(x);
1145		kfree(y);
1146		return -EFAULT;
1147	}
1148	if (copy_from_user(y, depth->y, ybuf_size)) {
1149		kfree(x);
1150		kfree(y);
1151		return -EFAULT;
1152	}
1153
1154	for (i = 0; i < count; i++) {
1155		BEGIN_RING(7);
1156
1157		OUT_RING(CCE_PACKET3(R128_CNTL_BITBLT_MULTI, 5));
1158		OUT_RING(R128_GMC_SRC_PITCH_OFFSET_CNTL |
1159			 R128_GMC_DST_PITCH_OFFSET_CNTL |
1160			 R128_GMC_BRUSH_NONE |
1161			 (dev_priv->depth_fmt << 8) |
1162			 R128_GMC_SRC_DATATYPE_COLOR |
1163			 R128_ROP3_S |
1164			 R128_DP_SRC_SOURCE_MEMORY |
1165			 R128_GMC_CLR_CMP_CNTL_DIS | R128_GMC_WR_MSK_DIS);
1166
1167		OUT_RING(dev_priv->depth_pitch_offset_c);
1168		OUT_RING(dev_priv->span_pitch_offset_c);
1169
1170		OUT_RING((x[i] << 16) | y[i]);
1171		OUT_RING((i << 16) | 0);
1172		OUT_RING((1 << 16) | 1);
1173
1174		ADVANCE_RING();
1175	}
1176
1177	kfree(x);
1178	kfree(y);
1179
1180	return 0;
1181}
1182
1183/* ================================================================
1184 * Polygon stipple
1185 */
1186
1187static void r128_cce_dispatch_stipple(struct drm_device *dev, u32 *stipple)
1188{
1189	drm_r128_private_t *dev_priv = dev->dev_private;
1190	int i;
1191	RING_LOCALS;
1192	DRM_DEBUG("\n");
1193
1194	BEGIN_RING(33);
1195
1196	OUT_RING(CCE_PACKET0(R128_BRUSH_DATA0, 31));
1197	for (i = 0; i < 32; i++)
1198		OUT_RING(stipple[i]);
1199
1200	ADVANCE_RING();
1201}
1202
1203/* ================================================================
1204 * IOCTL functions
1205 */
1206
1207static int r128_cce_clear(struct drm_device *dev, void *data, struct drm_file *file_priv)
1208{
1209	drm_r128_private_t *dev_priv = dev->dev_private;
1210	drm_r128_sarea_t *sarea_priv;
1211	drm_r128_clear_t *clear = data;
1212	DRM_DEBUG("\n");
1213
1214	LOCK_TEST_WITH_RETURN(dev, file_priv);
1215
1216	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1217
1218	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1219
1220	sarea_priv = dev_priv->sarea_priv;
1221
1222	if (sarea_priv->nbox > R128_NR_SAREA_CLIPRECTS)
1223		sarea_priv->nbox = R128_NR_SAREA_CLIPRECTS;
1224
1225	r128_cce_dispatch_clear(dev, clear);
1226	COMMIT_RING();
1227
1228	/* Make sure we restore the 3D state next time.
1229	 */
1230	dev_priv->sarea_priv->dirty |= R128_UPLOAD_CONTEXT | R128_UPLOAD_MASKS;
1231
1232	return 0;
1233}
1234
1235static int r128_do_init_pageflip(struct drm_device *dev)
1236{
1237	drm_r128_private_t *dev_priv = dev->dev_private;
1238	DRM_DEBUG("\n");
1239
1240	dev_priv->crtc_offset = R128_READ(R128_CRTC_OFFSET);
1241	dev_priv->crtc_offset_cntl = R128_READ(R128_CRTC_OFFSET_CNTL);
1242
1243	R128_WRITE(R128_CRTC_OFFSET, dev_priv->front_offset);
1244	R128_WRITE(R128_CRTC_OFFSET_CNTL,
1245		   dev_priv->crtc_offset_cntl | R128_CRTC_OFFSET_FLIP_CNTL);
1246
1247	dev_priv->page_flipping = 1;
1248	dev_priv->current_page = 0;
1249	dev_priv->sarea_priv->pfCurrentPage = dev_priv->current_page;
1250
1251	return 0;
1252}
1253
1254static int r128_do_cleanup_pageflip(struct drm_device *dev)
1255{
1256	drm_r128_private_t *dev_priv = dev->dev_private;
1257	DRM_DEBUG("\n");
1258
1259	R128_WRITE(R128_CRTC_OFFSET, dev_priv->crtc_offset);
1260	R128_WRITE(R128_CRTC_OFFSET_CNTL, dev_priv->crtc_offset_cntl);
1261
1262	if (dev_priv->current_page != 0) {
1263		r128_cce_dispatch_flip(dev);
1264		COMMIT_RING();
1265	}
1266
1267	dev_priv->page_flipping = 0;
1268	return 0;
1269}
1270
1271/* Swapping and flipping are different operations, need different ioctls.
1272 * They can & should be intermixed to support multiple 3d windows.
1273 */
1274
1275static int r128_cce_flip(struct drm_device *dev, void *data, struct drm_file *file_priv)
1276{
1277	drm_r128_private_t *dev_priv = dev->dev_private;
1278	DRM_DEBUG("\n");
1279
1280	LOCK_TEST_WITH_RETURN(dev, file_priv);
1281
1282	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1283
1284	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1285
1286	if (!dev_priv->page_flipping)
1287		r128_do_init_pageflip(dev);
1288
1289	r128_cce_dispatch_flip(dev);
1290
1291	COMMIT_RING();
1292	return 0;
1293}
1294
1295static int r128_cce_swap(struct drm_device *dev, void *data, struct drm_file *file_priv)
1296{
1297	drm_r128_private_t *dev_priv = dev->dev_private;
1298	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
1299	DRM_DEBUG("\n");
1300
1301	LOCK_TEST_WITH_RETURN(dev, file_priv);
1302
1303	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1304
1305	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1306
1307	if (sarea_priv->nbox > R128_NR_SAREA_CLIPRECTS)
1308		sarea_priv->nbox = R128_NR_SAREA_CLIPRECTS;
1309
1310	r128_cce_dispatch_swap(dev);
1311	dev_priv->sarea_priv->dirty |= (R128_UPLOAD_CONTEXT |
1312					R128_UPLOAD_MASKS);
1313
1314	COMMIT_RING();
1315	return 0;
1316}
1317
1318static int r128_cce_vertex(struct drm_device *dev, void *data, struct drm_file *file_priv)
1319{
1320	drm_r128_private_t *dev_priv = dev->dev_private;
1321	struct drm_device_dma *dma = dev->dma;
1322	struct drm_buf *buf;
1323	drm_r128_buf_priv_t *buf_priv;
1324	drm_r128_vertex_t *vertex = data;
1325
1326	LOCK_TEST_WITH_RETURN(dev, file_priv);
1327
1328	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1329
1330	DRM_DEBUG("pid=%d index=%d count=%d discard=%d\n",
1331		  DRM_CURRENTPID, vertex->idx, vertex->count, vertex->discard);
1332
1333	if (vertex->idx < 0 || vertex->idx >= dma->buf_count) {
1334		DRM_ERROR("buffer index %d (of %d max)\n",
1335			  vertex->idx, dma->buf_count - 1);
1336		return -EINVAL;
1337	}
1338	if (vertex->prim < 0 ||
1339	    vertex->prim > R128_CCE_VC_CNTL_PRIM_TYPE_TRI_TYPE2) {
1340		DRM_ERROR("buffer prim %d\n", vertex->prim);
1341		return -EINVAL;
1342	}
1343
1344	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1345	VB_AGE_TEST_WITH_RETURN(dev_priv);
1346
1347	buf = dma->buflist[vertex->idx];
1348	buf_priv = buf->dev_private;
1349
1350	if (buf->file_priv != file_priv) {
1351		DRM_ERROR("process %d using buffer owned by %p\n",
1352			  DRM_CURRENTPID, buf->file_priv);
1353		return -EINVAL;
1354	}
1355	if (buf->pending) {
1356		DRM_ERROR("sending pending buffer %d\n", vertex->idx);
1357		return -EINVAL;
1358	}
1359
1360	buf->used = vertex->count;
1361	buf_priv->prim = vertex->prim;
1362	buf_priv->discard = vertex->discard;
1363
1364	r128_cce_dispatch_vertex(dev, buf);
1365
1366	COMMIT_RING();
1367	return 0;
1368}
1369
1370static int r128_cce_indices(struct drm_device *dev, void *data, struct drm_file *file_priv)
1371{
1372	drm_r128_private_t *dev_priv = dev->dev_private;
1373	struct drm_device_dma *dma = dev->dma;
1374	struct drm_buf *buf;
1375	drm_r128_buf_priv_t *buf_priv;
1376	drm_r128_indices_t *elts = data;
1377	int count;
1378
1379	LOCK_TEST_WITH_RETURN(dev, file_priv);
1380
1381	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1382
1383	DRM_DEBUG("pid=%d buf=%d s=%d e=%d d=%d\n", DRM_CURRENTPID,
1384		  elts->idx, elts->start, elts->end, elts->discard);
1385
1386	if (elts->idx < 0 || elts->idx >= dma->buf_count) {
1387		DRM_ERROR("buffer index %d (of %d max)\n",
1388			  elts->idx, dma->buf_count - 1);
1389		return -EINVAL;
1390	}
1391	if (elts->prim < 0 ||
1392	    elts->prim > R128_CCE_VC_CNTL_PRIM_TYPE_TRI_TYPE2) {
1393		DRM_ERROR("buffer prim %d\n", elts->prim);
1394		return -EINVAL;
1395	}
1396
1397	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1398	VB_AGE_TEST_WITH_RETURN(dev_priv);
1399
1400	buf = dma->buflist[elts->idx];
1401	buf_priv = buf->dev_private;
1402
1403	if (buf->file_priv != file_priv) {
1404		DRM_ERROR("process %d using buffer owned by %p\n",
1405			  DRM_CURRENTPID, buf->file_priv);
1406		return -EINVAL;
1407	}
1408	if (buf->pending) {
1409		DRM_ERROR("sending pending buffer %d\n", elts->idx);
1410		return -EINVAL;
1411	}
1412
1413	count = (elts->end - elts->start) / sizeof(u16);
1414	elts->start -= R128_INDEX_PRIM_OFFSET;
1415
1416	if (elts->start & 0x7) {
1417		DRM_ERROR("misaligned buffer 0x%x\n", elts->start);
1418		return -EINVAL;
1419	}
1420	if (elts->start < buf->used) {
1421		DRM_ERROR("no header 0x%x - 0x%x\n", elts->start, buf->used);
1422		return -EINVAL;
1423	}
1424
1425	buf->used = elts->end;
1426	buf_priv->prim = elts->prim;
1427	buf_priv->discard = elts->discard;
1428
1429	r128_cce_dispatch_indices(dev, buf, elts->start, elts->end, count);
1430
1431	COMMIT_RING();
1432	return 0;
1433}
1434
1435static int r128_cce_blit(struct drm_device *dev, void *data, struct drm_file *file_priv)
1436{
1437	struct drm_device_dma *dma = dev->dma;
1438	drm_r128_private_t *dev_priv = dev->dev_private;
1439	drm_r128_blit_t *blit = data;
1440	int ret;
1441
1442	LOCK_TEST_WITH_RETURN(dev, file_priv);
1443
1444	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1445
1446	DRM_DEBUG("pid=%d index=%d\n", DRM_CURRENTPID, blit->idx);
1447
1448	if (blit->idx < 0 || blit->idx >= dma->buf_count) {
1449		DRM_ERROR("buffer index %d (of %d max)\n",
1450			  blit->idx, dma->buf_count - 1);
1451		return -EINVAL;
1452	}
1453
1454	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1455	VB_AGE_TEST_WITH_RETURN(dev_priv);
1456
1457	ret = r128_cce_dispatch_blit(dev, file_priv, blit);
1458
1459	COMMIT_RING();
1460	return ret;
1461}
1462
1463static int r128_cce_depth(struct drm_device *dev, void *data, struct drm_file *file_priv)
1464{
1465	drm_r128_private_t *dev_priv = dev->dev_private;
1466	drm_r128_depth_t *depth = data;
1467	int ret;
1468
1469	LOCK_TEST_WITH_RETURN(dev, file_priv);
1470
1471	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1472
1473	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1474
1475	ret = -EINVAL;
1476	switch (depth->func) {
1477	case R128_WRITE_SPAN:
1478		ret = r128_cce_dispatch_write_span(dev, depth);
1479		break;
1480	case R128_WRITE_PIXELS:
1481		ret = r128_cce_dispatch_write_pixels(dev, depth);
1482		break;
1483	case R128_READ_SPAN:
1484		ret = r128_cce_dispatch_read_span(dev, depth);
1485		break;
1486	case R128_READ_PIXELS:
1487		ret = r128_cce_dispatch_read_pixels(dev, depth);
1488		break;
1489	}
1490
1491	COMMIT_RING();
1492	return ret;
1493}
1494
1495static int r128_cce_stipple(struct drm_device *dev, void *data, struct drm_file *file_priv)
1496{
1497	drm_r128_private_t *dev_priv = dev->dev_private;
1498	drm_r128_stipple_t *stipple = data;
1499	u32 mask[32];
1500
1501	LOCK_TEST_WITH_RETURN(dev, file_priv);
1502
1503	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1504
1505	if (copy_from_user(&mask, stipple->mask, 32 * sizeof(u32)))
1506		return -EFAULT;
1507
1508	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1509
1510	r128_cce_dispatch_stipple(dev, mask);
1511
1512	COMMIT_RING();
1513	return 0;
1514}
1515
1516static int r128_cce_indirect(struct drm_device *dev, void *data, struct drm_file *file_priv)
1517{
1518	drm_r128_private_t *dev_priv = dev->dev_private;
1519	struct drm_device_dma *dma = dev->dma;
1520	struct drm_buf *buf;
1521	drm_r128_buf_priv_t *buf_priv;
1522	drm_r128_indirect_t *indirect = data;
1523#if 0
1524	RING_LOCALS;
1525#endif
1526
1527	LOCK_TEST_WITH_RETURN(dev, file_priv);
1528
1529	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1530
1531	DRM_DEBUG("idx=%d s=%d e=%d d=%d\n",
1532		  indirect->idx, indirect->start, indirect->end,
1533		  indirect->discard);
1534
1535	if (indirect->idx < 0 || indirect->idx >= dma->buf_count) {
1536		DRM_ERROR("buffer index %d (of %d max)\n",
1537			  indirect->idx, dma->buf_count - 1);
1538		return -EINVAL;
1539	}
1540
1541	buf = dma->buflist[indirect->idx];
1542	buf_priv = buf->dev_private;
1543
1544	if (buf->file_priv != file_priv) {
1545		DRM_ERROR("process %d using buffer owned by %p\n",
1546			  DRM_CURRENTPID, buf->file_priv);
1547		return -EINVAL;
1548	}
1549	if (buf->pending) {
1550		DRM_ERROR("sending pending buffer %d\n", indirect->idx);
1551		return -EINVAL;
1552	}
1553
1554	if (indirect->start < buf->used) {
1555		DRM_ERROR("reusing indirect: start=0x%x actual=0x%x\n",
1556			  indirect->start, buf->used);
1557		return -EINVAL;
1558	}
1559
1560	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1561	VB_AGE_TEST_WITH_RETURN(dev_priv);
1562
1563	buf->used = indirect->end;
1564	buf_priv->discard = indirect->discard;
1565
1566#if 0
1567	/* Wait for the 3D stream to idle before the indirect buffer
1568	 * containing 2D acceleration commands is processed.
1569	 */
1570	BEGIN_RING(2);
1571	RADEON_WAIT_UNTIL_3D_IDLE();
1572	ADVANCE_RING();
1573#endif
1574
1575	/* Dispatch the indirect buffer full of commands from the
1576	 * X server.  This is insecure and is thus only available to
1577	 * privileged clients.
1578	 */
1579	r128_cce_dispatch_indirect(dev, buf, indirect->start, indirect->end);
1580
1581	COMMIT_RING();
1582	return 0;
1583}
1584
1585static int r128_getparam(struct drm_device *dev, void *data, struct drm_file *file_priv)
1586{
1587	drm_r128_private_t *dev_priv = dev->dev_private;
1588	drm_r128_getparam_t *param = data;
1589	int value;
1590
1591	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1592
1593	DRM_DEBUG("pid=%d\n", DRM_CURRENTPID);
1594
1595	switch (param->param) {
1596	case R128_PARAM_IRQ_NR:
1597		value = dev->pdev->irq;
1598		break;
1599	default:
1600		return -EINVAL;
1601	}
1602
1603	if (copy_to_user(param->value, &value, sizeof(int))) {
1604		DRM_ERROR("copy_to_user\n");
1605		return -EFAULT;
1606	}
1607
1608	return 0;
1609}
1610
1611void r128_driver_preclose(struct drm_device *dev, struct drm_file *file_priv)
1612{
1613	if (dev->dev_private) {
1614		drm_r128_private_t *dev_priv = dev->dev_private;
1615		if (dev_priv->page_flipping)
1616			r128_do_cleanup_pageflip(dev);
1617	}
1618}
1619void r128_driver_lastclose(struct drm_device *dev)
1620{
1621	r128_do_cleanup_cce(dev);
1622}
1623
1624const struct drm_ioctl_desc r128_ioctls[] = {
1625	DRM_IOCTL_DEF_DRV(R128_INIT, r128_cce_init, DRM_AUTH|DRM_MASTER|DRM_ROOT_ONLY),
1626	DRM_IOCTL_DEF_DRV(R128_CCE_START, r128_cce_start, DRM_AUTH|DRM_MASTER|DRM_ROOT_ONLY),
1627	DRM_IOCTL_DEF_DRV(R128_CCE_STOP, r128_cce_stop, DRM_AUTH|DRM_MASTER|DRM_ROOT_ONLY),
1628	DRM_IOCTL_DEF_DRV(R128_CCE_RESET, r128_cce_reset, DRM_AUTH|DRM_MASTER|DRM_ROOT_ONLY),
1629	DRM_IOCTL_DEF_DRV(R128_CCE_IDLE, r128_cce_idle, DRM_AUTH),
1630	DRM_IOCTL_DEF_DRV(R128_RESET, r128_engine_reset, DRM_AUTH),
1631	DRM_IOCTL_DEF_DRV(R128_FULLSCREEN, r128_fullscreen, DRM_AUTH),
1632	DRM_IOCTL_DEF_DRV(R128_SWAP, r128_cce_swap, DRM_AUTH),
1633	DRM_IOCTL_DEF_DRV(R128_FLIP, r128_cce_flip, DRM_AUTH),
1634	DRM_IOCTL_DEF_DRV(R128_CLEAR, r128_cce_clear, DRM_AUTH),
1635	DRM_IOCTL_DEF_DRV(R128_VERTEX, r128_cce_vertex, DRM_AUTH),
1636	DRM_IOCTL_DEF_DRV(R128_INDICES, r128_cce_indices, DRM_AUTH),
1637	DRM_IOCTL_DEF_DRV(R128_BLIT, r128_cce_blit, DRM_AUTH),
1638	DRM_IOCTL_DEF_DRV(R128_DEPTH, r128_cce_depth, DRM_AUTH),
1639	DRM_IOCTL_DEF_DRV(R128_STIPPLE, r128_cce_stipple, DRM_AUTH),
1640	DRM_IOCTL_DEF_DRV(R128_INDIRECT, r128_cce_indirect, DRM_AUTH|DRM_MASTER|DRM_ROOT_ONLY),
1641	DRM_IOCTL_DEF_DRV(R128_GETPARAM, r128_getparam, DRM_AUTH),
1642};
1643
1644int r128_max_ioctl = ARRAY_SIZE(r128_ioctls);
v5.9
   1/* r128_state.c -- State support for r128 -*- linux-c -*-
   2 * Created: Thu Jan 27 02:53:43 2000 by gareth@valinux.com
   3 */
   4/*
   5 * Copyright 2000 VA Linux Systems, Inc., Sunnyvale, California.
   6 * All Rights Reserved.
   7 *
   8 * Permission is hereby granted, free of charge, to any person obtaining a
   9 * copy of this software and associated documentation files (the "Software"),
  10 * to deal in the Software without restriction, including without limitation
  11 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  12 * and/or sell copies of the Software, and to permit persons to whom the
  13 * Software is furnished to do so, subject to the following conditions:
  14 *
  15 * The above copyright notice and this permission notice (including the next
  16 * paragraph) shall be included in all copies or substantial portions of the
  17 * Software.
  18 *
  19 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  20 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  21 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
  22 * PRECISION INSIGHT AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
  23 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
  24 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
  25 * DEALINGS IN THE SOFTWARE.
  26 *
  27 * Authors:
  28 *    Gareth Hughes <gareth@valinux.com>
  29 */
  30
  31#include <linux/pci.h>
  32#include <linux/slab.h>
  33#include <linux/uaccess.h>
  34
  35#include <drm/drm_device.h>
  36#include <drm/drm_file.h>
  37#include <drm/drm_print.h>
  38#include <drm/r128_drm.h>
  39
  40#include "r128_drv.h"
  41
  42/* ================================================================
  43 * CCE hardware state programming functions
  44 */
  45
  46static void r128_emit_clip_rects(drm_r128_private_t *dev_priv,
  47				 struct drm_clip_rect *boxes, int count)
  48{
  49	u32 aux_sc_cntl = 0x00000000;
  50	RING_LOCALS;
  51	DRM_DEBUG("\n");
  52
  53	BEGIN_RING((count < 3 ? count : 3) * 5 + 2);
  54
  55	if (count >= 1) {
  56		OUT_RING(CCE_PACKET0(R128_AUX1_SC_LEFT, 3));
  57		OUT_RING(boxes[0].x1);
  58		OUT_RING(boxes[0].x2 - 1);
  59		OUT_RING(boxes[0].y1);
  60		OUT_RING(boxes[0].y2 - 1);
  61
  62		aux_sc_cntl |= (R128_AUX1_SC_EN | R128_AUX1_SC_MODE_OR);
  63	}
  64	if (count >= 2) {
  65		OUT_RING(CCE_PACKET0(R128_AUX2_SC_LEFT, 3));
  66		OUT_RING(boxes[1].x1);
  67		OUT_RING(boxes[1].x2 - 1);
  68		OUT_RING(boxes[1].y1);
  69		OUT_RING(boxes[1].y2 - 1);
  70
  71		aux_sc_cntl |= (R128_AUX2_SC_EN | R128_AUX2_SC_MODE_OR);
  72	}
  73	if (count >= 3) {
  74		OUT_RING(CCE_PACKET0(R128_AUX3_SC_LEFT, 3));
  75		OUT_RING(boxes[2].x1);
  76		OUT_RING(boxes[2].x2 - 1);
  77		OUT_RING(boxes[2].y1);
  78		OUT_RING(boxes[2].y2 - 1);
  79
  80		aux_sc_cntl |= (R128_AUX3_SC_EN | R128_AUX3_SC_MODE_OR);
  81	}
  82
  83	OUT_RING(CCE_PACKET0(R128_AUX_SC_CNTL, 0));
  84	OUT_RING(aux_sc_cntl);
  85
  86	ADVANCE_RING();
  87}
  88
  89static __inline__ void r128_emit_core(drm_r128_private_t *dev_priv)
  90{
  91	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
  92	drm_r128_context_regs_t *ctx = &sarea_priv->context_state;
  93	RING_LOCALS;
  94	DRM_DEBUG("\n");
  95
  96	BEGIN_RING(2);
  97
  98	OUT_RING(CCE_PACKET0(R128_SCALE_3D_CNTL, 0));
  99	OUT_RING(ctx->scale_3d_cntl);
 100
 101	ADVANCE_RING();
 102}
 103
 104static __inline__ void r128_emit_context(drm_r128_private_t *dev_priv)
 105{
 106	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
 107	drm_r128_context_regs_t *ctx = &sarea_priv->context_state;
 108	RING_LOCALS;
 109	DRM_DEBUG("\n");
 110
 111	BEGIN_RING(13);
 112
 113	OUT_RING(CCE_PACKET0(R128_DST_PITCH_OFFSET_C, 11));
 114	OUT_RING(ctx->dst_pitch_offset_c);
 115	OUT_RING(ctx->dp_gui_master_cntl_c);
 116	OUT_RING(ctx->sc_top_left_c);
 117	OUT_RING(ctx->sc_bottom_right_c);
 118	OUT_RING(ctx->z_offset_c);
 119	OUT_RING(ctx->z_pitch_c);
 120	OUT_RING(ctx->z_sten_cntl_c);
 121	OUT_RING(ctx->tex_cntl_c);
 122	OUT_RING(ctx->misc_3d_state_cntl_reg);
 123	OUT_RING(ctx->texture_clr_cmp_clr_c);
 124	OUT_RING(ctx->texture_clr_cmp_msk_c);
 125	OUT_RING(ctx->fog_color_c);
 126
 127	ADVANCE_RING();
 128}
 129
 130static __inline__ void r128_emit_setup(drm_r128_private_t *dev_priv)
 131{
 132	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
 133	drm_r128_context_regs_t *ctx = &sarea_priv->context_state;
 134	RING_LOCALS;
 135	DRM_DEBUG("\n");
 136
 137	BEGIN_RING(3);
 138
 139	OUT_RING(CCE_PACKET1(R128_SETUP_CNTL, R128_PM4_VC_FPU_SETUP));
 140	OUT_RING(ctx->setup_cntl);
 141	OUT_RING(ctx->pm4_vc_fpu_setup);
 142
 143	ADVANCE_RING();
 144}
 145
 146static __inline__ void r128_emit_masks(drm_r128_private_t *dev_priv)
 147{
 148	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
 149	drm_r128_context_regs_t *ctx = &sarea_priv->context_state;
 150	RING_LOCALS;
 151	DRM_DEBUG("\n");
 152
 153	BEGIN_RING(5);
 154
 155	OUT_RING(CCE_PACKET0(R128_DP_WRITE_MASK, 0));
 156	OUT_RING(ctx->dp_write_mask);
 157
 158	OUT_RING(CCE_PACKET0(R128_STEN_REF_MASK_C, 1));
 159	OUT_RING(ctx->sten_ref_mask_c);
 160	OUT_RING(ctx->plane_3d_mask_c);
 161
 162	ADVANCE_RING();
 163}
 164
 165static __inline__ void r128_emit_window(drm_r128_private_t *dev_priv)
 166{
 167	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
 168	drm_r128_context_regs_t *ctx = &sarea_priv->context_state;
 169	RING_LOCALS;
 170	DRM_DEBUG("\n");
 171
 172	BEGIN_RING(2);
 173
 174	OUT_RING(CCE_PACKET0(R128_WINDOW_XY_OFFSET, 0));
 175	OUT_RING(ctx->window_xy_offset);
 176
 177	ADVANCE_RING();
 178}
 179
 180static __inline__ void r128_emit_tex0(drm_r128_private_t *dev_priv)
 181{
 182	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
 183	drm_r128_context_regs_t *ctx = &sarea_priv->context_state;
 184	drm_r128_texture_regs_t *tex = &sarea_priv->tex_state[0];
 185	int i;
 186	RING_LOCALS;
 187	DRM_DEBUG("\n");
 188
 189	BEGIN_RING(7 + R128_MAX_TEXTURE_LEVELS);
 190
 191	OUT_RING(CCE_PACKET0(R128_PRIM_TEX_CNTL_C,
 192			     2 + R128_MAX_TEXTURE_LEVELS));
 193	OUT_RING(tex->tex_cntl);
 194	OUT_RING(tex->tex_combine_cntl);
 195	OUT_RING(ctx->tex_size_pitch_c);
 196	for (i = 0; i < R128_MAX_TEXTURE_LEVELS; i++)
 197		OUT_RING(tex->tex_offset[i]);
 198
 199	OUT_RING(CCE_PACKET0(R128_CONSTANT_COLOR_C, 1));
 200	OUT_RING(ctx->constant_color_c);
 201	OUT_RING(tex->tex_border_color);
 202
 203	ADVANCE_RING();
 204}
 205
 206static __inline__ void r128_emit_tex1(drm_r128_private_t *dev_priv)
 207{
 208	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
 209	drm_r128_texture_regs_t *tex = &sarea_priv->tex_state[1];
 210	int i;
 211	RING_LOCALS;
 212	DRM_DEBUG("\n");
 213
 214	BEGIN_RING(5 + R128_MAX_TEXTURE_LEVELS);
 215
 216	OUT_RING(CCE_PACKET0(R128_SEC_TEX_CNTL_C, 1 + R128_MAX_TEXTURE_LEVELS));
 217	OUT_RING(tex->tex_cntl);
 218	OUT_RING(tex->tex_combine_cntl);
 219	for (i = 0; i < R128_MAX_TEXTURE_LEVELS; i++)
 220		OUT_RING(tex->tex_offset[i]);
 221
 222	OUT_RING(CCE_PACKET0(R128_SEC_TEXTURE_BORDER_COLOR_C, 0));
 223	OUT_RING(tex->tex_border_color);
 224
 225	ADVANCE_RING();
 226}
 227
 228static void r128_emit_state(drm_r128_private_t *dev_priv)
 229{
 230	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
 231	unsigned int dirty = sarea_priv->dirty;
 232
 233	DRM_DEBUG("dirty=0x%08x\n", dirty);
 234
 235	if (dirty & R128_UPLOAD_CORE) {
 236		r128_emit_core(dev_priv);
 237		sarea_priv->dirty &= ~R128_UPLOAD_CORE;
 238	}
 239
 240	if (dirty & R128_UPLOAD_CONTEXT) {
 241		r128_emit_context(dev_priv);
 242		sarea_priv->dirty &= ~R128_UPLOAD_CONTEXT;
 243	}
 244
 245	if (dirty & R128_UPLOAD_SETUP) {
 246		r128_emit_setup(dev_priv);
 247		sarea_priv->dirty &= ~R128_UPLOAD_SETUP;
 248	}
 249
 250	if (dirty & R128_UPLOAD_MASKS) {
 251		r128_emit_masks(dev_priv);
 252		sarea_priv->dirty &= ~R128_UPLOAD_MASKS;
 253	}
 254
 255	if (dirty & R128_UPLOAD_WINDOW) {
 256		r128_emit_window(dev_priv);
 257		sarea_priv->dirty &= ~R128_UPLOAD_WINDOW;
 258	}
 259
 260	if (dirty & R128_UPLOAD_TEX0) {
 261		r128_emit_tex0(dev_priv);
 262		sarea_priv->dirty &= ~R128_UPLOAD_TEX0;
 263	}
 264
 265	if (dirty & R128_UPLOAD_TEX1) {
 266		r128_emit_tex1(dev_priv);
 267		sarea_priv->dirty &= ~R128_UPLOAD_TEX1;
 268	}
 269
 270	/* Turn off the texture cache flushing */
 271	sarea_priv->context_state.tex_cntl_c &= ~R128_TEX_CACHE_FLUSH;
 272
 273	sarea_priv->dirty &= ~R128_REQUIRE_QUIESCENCE;
 274}
 275
 276#if R128_PERFORMANCE_BOXES
 277/* ================================================================
 278 * Performance monitoring functions
 279 */
 280
 281static void r128_clear_box(drm_r128_private_t *dev_priv,
 282			   int x, int y, int w, int h, int r, int g, int b)
 283{
 284	u32 pitch, offset;
 285	u32 fb_bpp, color;
 286	RING_LOCALS;
 287
 288	switch (dev_priv->fb_bpp) {
 289	case 16:
 290		fb_bpp = R128_GMC_DST_16BPP;
 291		color = (((r & 0xf8) << 8) |
 292			 ((g & 0xfc) << 3) | ((b & 0xf8) >> 3));
 293		break;
 294	case 24:
 295		fb_bpp = R128_GMC_DST_24BPP;
 296		color = ((r << 16) | (g << 8) | b);
 297		break;
 298	case 32:
 299		fb_bpp = R128_GMC_DST_32BPP;
 300		color = (((0xff) << 24) | (r << 16) | (g << 8) | b);
 301		break;
 302	default:
 303		return;
 304	}
 305
 306	offset = dev_priv->back_offset;
 307	pitch = dev_priv->back_pitch >> 3;
 308
 309	BEGIN_RING(6);
 310
 311	OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
 312	OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
 313		 R128_GMC_BRUSH_SOLID_COLOR |
 314		 fb_bpp |
 315		 R128_GMC_SRC_DATATYPE_COLOR |
 316		 R128_ROP3_P |
 317		 R128_GMC_CLR_CMP_CNTL_DIS | R128_GMC_AUX_CLIP_DIS);
 318
 319	OUT_RING((pitch << 21) | (offset >> 5));
 320	OUT_RING(color);
 321
 322	OUT_RING((x << 16) | y);
 323	OUT_RING((w << 16) | h);
 324
 325	ADVANCE_RING();
 326}
 327
 328static void r128_cce_performance_boxes(drm_r128_private_t *dev_priv)
 329{
 330	if (atomic_read(&dev_priv->idle_count) == 0)
 331		r128_clear_box(dev_priv, 64, 4, 8, 8, 0, 255, 0);
 332	else
 333		atomic_set(&dev_priv->idle_count, 0);
 334}
 335
 336#endif
 337
 338/* ================================================================
 339 * CCE command dispatch functions
 340 */
 341
 342static void r128_print_dirty(const char *msg, unsigned int flags)
 343{
 344	DRM_INFO("%s: (0x%x) %s%s%s%s%s%s%s%s%s\n",
 345		 msg,
 346		 flags,
 347		 (flags & R128_UPLOAD_CORE) ? "core, " : "",
 348		 (flags & R128_UPLOAD_CONTEXT) ? "context, " : "",
 349		 (flags & R128_UPLOAD_SETUP) ? "setup, " : "",
 350		 (flags & R128_UPLOAD_TEX0) ? "tex0, " : "",
 351		 (flags & R128_UPLOAD_TEX1) ? "tex1, " : "",
 352		 (flags & R128_UPLOAD_MASKS) ? "masks, " : "",
 353		 (flags & R128_UPLOAD_WINDOW) ? "window, " : "",
 354		 (flags & R128_UPLOAD_CLIPRECTS) ? "cliprects, " : "",
 355		 (flags & R128_REQUIRE_QUIESCENCE) ? "quiescence, " : "");
 356}
 357
 358static void r128_cce_dispatch_clear(struct drm_device *dev,
 359				    drm_r128_clear_t *clear)
 360{
 361	drm_r128_private_t *dev_priv = dev->dev_private;
 362	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
 363	int nbox = sarea_priv->nbox;
 364	struct drm_clip_rect *pbox = sarea_priv->boxes;
 365	unsigned int flags = clear->flags;
 366	int i;
 367	RING_LOCALS;
 368	DRM_DEBUG("\n");
 369
 370	if (dev_priv->page_flipping && dev_priv->current_page == 1) {
 371		unsigned int tmp = flags;
 372
 373		flags &= ~(R128_FRONT | R128_BACK);
 374		if (tmp & R128_FRONT)
 375			flags |= R128_BACK;
 376		if (tmp & R128_BACK)
 377			flags |= R128_FRONT;
 378	}
 379
 380	for (i = 0; i < nbox; i++) {
 381		int x = pbox[i].x1;
 382		int y = pbox[i].y1;
 383		int w = pbox[i].x2 - x;
 384		int h = pbox[i].y2 - y;
 385
 386		DRM_DEBUG("dispatch clear %d,%d-%d,%d flags 0x%x\n",
 387			  pbox[i].x1, pbox[i].y1, pbox[i].x2,
 388			  pbox[i].y2, flags);
 389
 390		if (flags & (R128_FRONT | R128_BACK)) {
 391			BEGIN_RING(2);
 392
 393			OUT_RING(CCE_PACKET0(R128_DP_WRITE_MASK, 0));
 394			OUT_RING(clear->color_mask);
 395
 396			ADVANCE_RING();
 397		}
 398
 399		if (flags & R128_FRONT) {
 400			BEGIN_RING(6);
 401
 402			OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
 403			OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
 404				 R128_GMC_BRUSH_SOLID_COLOR |
 405				 (dev_priv->color_fmt << 8) |
 406				 R128_GMC_SRC_DATATYPE_COLOR |
 407				 R128_ROP3_P |
 408				 R128_GMC_CLR_CMP_CNTL_DIS |
 409				 R128_GMC_AUX_CLIP_DIS);
 410
 411			OUT_RING(dev_priv->front_pitch_offset_c);
 412			OUT_RING(clear->clear_color);
 413
 414			OUT_RING((x << 16) | y);
 415			OUT_RING((w << 16) | h);
 416
 417			ADVANCE_RING();
 418		}
 419
 420		if (flags & R128_BACK) {
 421			BEGIN_RING(6);
 422
 423			OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
 424			OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
 425				 R128_GMC_BRUSH_SOLID_COLOR |
 426				 (dev_priv->color_fmt << 8) |
 427				 R128_GMC_SRC_DATATYPE_COLOR |
 428				 R128_ROP3_P |
 429				 R128_GMC_CLR_CMP_CNTL_DIS |
 430				 R128_GMC_AUX_CLIP_DIS);
 431
 432			OUT_RING(dev_priv->back_pitch_offset_c);
 433			OUT_RING(clear->clear_color);
 434
 435			OUT_RING((x << 16) | y);
 436			OUT_RING((w << 16) | h);
 437
 438			ADVANCE_RING();
 439		}
 440
 441		if (flags & R128_DEPTH) {
 442			BEGIN_RING(6);
 443
 444			OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
 445			OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
 446				 R128_GMC_BRUSH_SOLID_COLOR |
 447				 (dev_priv->depth_fmt << 8) |
 448				 R128_GMC_SRC_DATATYPE_COLOR |
 449				 R128_ROP3_P |
 450				 R128_GMC_CLR_CMP_CNTL_DIS |
 451				 R128_GMC_AUX_CLIP_DIS | R128_GMC_WR_MSK_DIS);
 452
 453			OUT_RING(dev_priv->depth_pitch_offset_c);
 454			OUT_RING(clear->clear_depth);
 455
 456			OUT_RING((x << 16) | y);
 457			OUT_RING((w << 16) | h);
 458
 459			ADVANCE_RING();
 460		}
 461	}
 462}
 463
 464static void r128_cce_dispatch_swap(struct drm_device *dev)
 465{
 466	drm_r128_private_t *dev_priv = dev->dev_private;
 467	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
 468	int nbox = sarea_priv->nbox;
 469	struct drm_clip_rect *pbox = sarea_priv->boxes;
 470	int i;
 471	RING_LOCALS;
 472	DRM_DEBUG("\n");
 473
 474#if R128_PERFORMANCE_BOXES
 475	/* Do some trivial performance monitoring...
 476	 */
 477	r128_cce_performance_boxes(dev_priv);
 478#endif
 479
 480	for (i = 0; i < nbox; i++) {
 481		int x = pbox[i].x1;
 482		int y = pbox[i].y1;
 483		int w = pbox[i].x2 - x;
 484		int h = pbox[i].y2 - y;
 485
 486		BEGIN_RING(7);
 487
 488		OUT_RING(CCE_PACKET3(R128_CNTL_BITBLT_MULTI, 5));
 489		OUT_RING(R128_GMC_SRC_PITCH_OFFSET_CNTL |
 490			 R128_GMC_DST_PITCH_OFFSET_CNTL |
 491			 R128_GMC_BRUSH_NONE |
 492			 (dev_priv->color_fmt << 8) |
 493			 R128_GMC_SRC_DATATYPE_COLOR |
 494			 R128_ROP3_S |
 495			 R128_DP_SRC_SOURCE_MEMORY |
 496			 R128_GMC_CLR_CMP_CNTL_DIS |
 497			 R128_GMC_AUX_CLIP_DIS | R128_GMC_WR_MSK_DIS);
 498
 499		/* Make this work even if front & back are flipped:
 500		 */
 501		if (dev_priv->current_page == 0) {
 502			OUT_RING(dev_priv->back_pitch_offset_c);
 503			OUT_RING(dev_priv->front_pitch_offset_c);
 504		} else {
 505			OUT_RING(dev_priv->front_pitch_offset_c);
 506			OUT_RING(dev_priv->back_pitch_offset_c);
 507		}
 508
 509		OUT_RING((x << 16) | y);
 510		OUT_RING((x << 16) | y);
 511		OUT_RING((w << 16) | h);
 512
 513		ADVANCE_RING();
 514	}
 515
 516	/* Increment the frame counter.  The client-side 3D driver must
 517	 * throttle the framerate by waiting for this value before
 518	 * performing the swapbuffer ioctl.
 519	 */
 520	dev_priv->sarea_priv->last_frame++;
 521
 522	BEGIN_RING(2);
 523
 524	OUT_RING(CCE_PACKET0(R128_LAST_FRAME_REG, 0));
 525	OUT_RING(dev_priv->sarea_priv->last_frame);
 526
 527	ADVANCE_RING();
 528}
 529
 530static void r128_cce_dispatch_flip(struct drm_device *dev)
 531{
 532	drm_r128_private_t *dev_priv = dev->dev_private;
 533	RING_LOCALS;
 534	DRM_DEBUG("page=%d pfCurrentPage=%d\n",
 535		  dev_priv->current_page, dev_priv->sarea_priv->pfCurrentPage);
 536
 537#if R128_PERFORMANCE_BOXES
 538	/* Do some trivial performance monitoring...
 539	 */
 540	r128_cce_performance_boxes(dev_priv);
 541#endif
 542
 543	BEGIN_RING(4);
 544
 545	R128_WAIT_UNTIL_PAGE_FLIPPED();
 546	OUT_RING(CCE_PACKET0(R128_CRTC_OFFSET, 0));
 547
 548	if (dev_priv->current_page == 0)
 549		OUT_RING(dev_priv->back_offset);
 550	else
 551		OUT_RING(dev_priv->front_offset);
 552
 553	ADVANCE_RING();
 554
 555	/* Increment the frame counter.  The client-side 3D driver must
 556	 * throttle the framerate by waiting for this value before
 557	 * performing the swapbuffer ioctl.
 558	 */
 559	dev_priv->sarea_priv->last_frame++;
 560	dev_priv->sarea_priv->pfCurrentPage = dev_priv->current_page =
 561	    1 - dev_priv->current_page;
 562
 563	BEGIN_RING(2);
 564
 565	OUT_RING(CCE_PACKET0(R128_LAST_FRAME_REG, 0));
 566	OUT_RING(dev_priv->sarea_priv->last_frame);
 567
 568	ADVANCE_RING();
 569}
 570
 571static void r128_cce_dispatch_vertex(struct drm_device *dev, struct drm_buf *buf)
 572{
 573	drm_r128_private_t *dev_priv = dev->dev_private;
 574	drm_r128_buf_priv_t *buf_priv = buf->dev_private;
 575	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
 576	int format = sarea_priv->vc_format;
 577	int offset = buf->bus_address;
 578	int size = buf->used;
 579	int prim = buf_priv->prim;
 580	int i = 0;
 581	RING_LOCALS;
 582	DRM_DEBUG("buf=%d nbox=%d\n", buf->idx, sarea_priv->nbox);
 583
 584	if (0)
 585		r128_print_dirty("dispatch_vertex", sarea_priv->dirty);
 586
 587	if (buf->used) {
 588		buf_priv->dispatched = 1;
 589
 590		if (sarea_priv->dirty & ~R128_UPLOAD_CLIPRECTS)
 591			r128_emit_state(dev_priv);
 592
 593		do {
 594			/* Emit the next set of up to three cliprects */
 595			if (i < sarea_priv->nbox) {
 596				r128_emit_clip_rects(dev_priv,
 597						     &sarea_priv->boxes[i],
 598						     sarea_priv->nbox - i);
 599			}
 600
 601			/* Emit the vertex buffer rendering commands */
 602			BEGIN_RING(5);
 603
 604			OUT_RING(CCE_PACKET3(R128_3D_RNDR_GEN_INDX_PRIM, 3));
 605			OUT_RING(offset);
 606			OUT_RING(size);
 607			OUT_RING(format);
 608			OUT_RING(prim | R128_CCE_VC_CNTL_PRIM_WALK_LIST |
 609				 (size << R128_CCE_VC_CNTL_NUM_SHIFT));
 610
 611			ADVANCE_RING();
 612
 613			i += 3;
 614		} while (i < sarea_priv->nbox);
 615	}
 616
 617	if (buf_priv->discard) {
 618		buf_priv->age = dev_priv->sarea_priv->last_dispatch;
 619
 620		/* Emit the vertex buffer age */
 621		BEGIN_RING(2);
 622
 623		OUT_RING(CCE_PACKET0(R128_LAST_DISPATCH_REG, 0));
 624		OUT_RING(buf_priv->age);
 625
 626		ADVANCE_RING();
 627
 628		buf->pending = 1;
 629		buf->used = 0;
 630		/* FIXME: Check dispatched field */
 631		buf_priv->dispatched = 0;
 632	}
 633
 634	dev_priv->sarea_priv->last_dispatch++;
 635
 636	sarea_priv->dirty &= ~R128_UPLOAD_CLIPRECTS;
 637	sarea_priv->nbox = 0;
 638}
 639
 640static void r128_cce_dispatch_indirect(struct drm_device *dev,
 641				       struct drm_buf *buf, int start, int end)
 642{
 643	drm_r128_private_t *dev_priv = dev->dev_private;
 644	drm_r128_buf_priv_t *buf_priv = buf->dev_private;
 645	RING_LOCALS;
 646	DRM_DEBUG("indirect: buf=%d s=0x%x e=0x%x\n", buf->idx, start, end);
 647
 648	if (start != end) {
 649		int offset = buf->bus_address + start;
 650		int dwords = (end - start + 3) / sizeof(u32);
 651
 652		/* Indirect buffer data must be an even number of
 653		 * dwords, so if we've been given an odd number we must
 654		 * pad the data with a Type-2 CCE packet.
 655		 */
 656		if (dwords & 1) {
 657			u32 *data = (u32 *)
 658			    ((char *)dev->agp_buffer_map->handle
 659			     + buf->offset + start);
 660			data[dwords++] = cpu_to_le32(R128_CCE_PACKET2);
 661		}
 662
 663		buf_priv->dispatched = 1;
 664
 665		/* Fire off the indirect buffer */
 666		BEGIN_RING(3);
 667
 668		OUT_RING(CCE_PACKET0(R128_PM4_IW_INDOFF, 1));
 669		OUT_RING(offset);
 670		OUT_RING(dwords);
 671
 672		ADVANCE_RING();
 673	}
 674
 675	if (buf_priv->discard) {
 676		buf_priv->age = dev_priv->sarea_priv->last_dispatch;
 677
 678		/* Emit the indirect buffer age */
 679		BEGIN_RING(2);
 680
 681		OUT_RING(CCE_PACKET0(R128_LAST_DISPATCH_REG, 0));
 682		OUT_RING(buf_priv->age);
 683
 684		ADVANCE_RING();
 685
 686		buf->pending = 1;
 687		buf->used = 0;
 688		/* FIXME: Check dispatched field */
 689		buf_priv->dispatched = 0;
 690	}
 691
 692	dev_priv->sarea_priv->last_dispatch++;
 693}
 694
 695static void r128_cce_dispatch_indices(struct drm_device *dev,
 696				      struct drm_buf *buf,
 697				      int start, int end, int count)
 698{
 699	drm_r128_private_t *dev_priv = dev->dev_private;
 700	drm_r128_buf_priv_t *buf_priv = buf->dev_private;
 701	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
 702	int format = sarea_priv->vc_format;
 703	int offset = dev->agp_buffer_map->offset - dev_priv->cce_buffers_offset;
 704	int prim = buf_priv->prim;
 705	u32 *data;
 706	int dwords;
 707	int i = 0;
 708	RING_LOCALS;
 709	DRM_DEBUG("indices: s=%d e=%d c=%d\n", start, end, count);
 710
 711	if (0)
 712		r128_print_dirty("dispatch_indices", sarea_priv->dirty);
 713
 714	if (start != end) {
 715		buf_priv->dispatched = 1;
 716
 717		if (sarea_priv->dirty & ~R128_UPLOAD_CLIPRECTS)
 718			r128_emit_state(dev_priv);
 719
 720		dwords = (end - start + 3) / sizeof(u32);
 721
 722		data = (u32 *) ((char *)dev->agp_buffer_map->handle
 723				+ buf->offset + start);
 724
 725		data[0] = cpu_to_le32(CCE_PACKET3(R128_3D_RNDR_GEN_INDX_PRIM,
 726						  dwords - 2));
 727
 728		data[1] = cpu_to_le32(offset);
 729		data[2] = cpu_to_le32(R128_MAX_VB_VERTS);
 730		data[3] = cpu_to_le32(format);
 731		data[4] = cpu_to_le32((prim | R128_CCE_VC_CNTL_PRIM_WALK_IND |
 732				       (count << 16)));
 733
 734		if (count & 0x1) {
 735#ifdef __LITTLE_ENDIAN
 736			data[dwords - 1] &= 0x0000ffff;
 737#else
 738			data[dwords - 1] &= 0xffff0000;
 739#endif
 740		}
 741
 742		do {
 743			/* Emit the next set of up to three cliprects */
 744			if (i < sarea_priv->nbox) {
 745				r128_emit_clip_rects(dev_priv,
 746						     &sarea_priv->boxes[i],
 747						     sarea_priv->nbox - i);
 748			}
 749
 750			r128_cce_dispatch_indirect(dev, buf, start, end);
 751
 752			i += 3;
 753		} while (i < sarea_priv->nbox);
 754	}
 755
 756	if (buf_priv->discard) {
 757		buf_priv->age = dev_priv->sarea_priv->last_dispatch;
 758
 759		/* Emit the vertex buffer age */
 760		BEGIN_RING(2);
 761
 762		OUT_RING(CCE_PACKET0(R128_LAST_DISPATCH_REG, 0));
 763		OUT_RING(buf_priv->age);
 764
 765		ADVANCE_RING();
 766
 767		buf->pending = 1;
 768		/* FIXME: Check dispatched field */
 769		buf_priv->dispatched = 0;
 770	}
 771
 772	dev_priv->sarea_priv->last_dispatch++;
 773
 774	sarea_priv->dirty &= ~R128_UPLOAD_CLIPRECTS;
 775	sarea_priv->nbox = 0;
 776}
 777
 778static int r128_cce_dispatch_blit(struct drm_device *dev,
 779				  struct drm_file *file_priv,
 780				  drm_r128_blit_t *blit)
 781{
 782	drm_r128_private_t *dev_priv = dev->dev_private;
 783	struct drm_device_dma *dma = dev->dma;
 784	struct drm_buf *buf;
 785	drm_r128_buf_priv_t *buf_priv;
 786	u32 *data;
 787	int dword_shift, dwords;
 788	RING_LOCALS;
 789	DRM_DEBUG("\n");
 790
 791	/* The compiler won't optimize away a division by a variable,
 792	 * even if the only legal values are powers of two.  Thus, we'll
 793	 * use a shift instead.
 794	 */
 795	switch (blit->format) {
 796	case R128_DATATYPE_ARGB8888:
 797		dword_shift = 0;
 798		break;
 799	case R128_DATATYPE_ARGB1555:
 800	case R128_DATATYPE_RGB565:
 801	case R128_DATATYPE_ARGB4444:
 802	case R128_DATATYPE_YVYU422:
 803	case R128_DATATYPE_VYUY422:
 804		dword_shift = 1;
 805		break;
 806	case R128_DATATYPE_CI8:
 807	case R128_DATATYPE_RGB8:
 808		dword_shift = 2;
 809		break;
 810	default:
 811		DRM_ERROR("invalid blit format %d\n", blit->format);
 812		return -EINVAL;
 813	}
 814
 815	/* Flush the pixel cache, and mark the contents as Read Invalid.
 816	 * This ensures no pixel data gets mixed up with the texture
 817	 * data from the host data blit, otherwise part of the texture
 818	 * image may be corrupted.
 819	 */
 820	BEGIN_RING(2);
 821
 822	OUT_RING(CCE_PACKET0(R128_PC_GUI_CTLSTAT, 0));
 823	OUT_RING(R128_PC_RI_GUI | R128_PC_FLUSH_GUI);
 824
 825	ADVANCE_RING();
 826
 827	/* Dispatch the indirect buffer.
 828	 */
 829	buf = dma->buflist[blit->idx];
 830	buf_priv = buf->dev_private;
 831
 832	if (buf->file_priv != file_priv) {
 833		DRM_ERROR("process %d using buffer owned by %p\n",
 834			  task_pid_nr(current), buf->file_priv);
 835		return -EINVAL;
 836	}
 837	if (buf->pending) {
 838		DRM_ERROR("sending pending buffer %d\n", blit->idx);
 839		return -EINVAL;
 840	}
 841
 842	buf_priv->discard = 1;
 843
 844	dwords = (blit->width * blit->height) >> dword_shift;
 845
 846	data = (u32 *) ((char *)dev->agp_buffer_map->handle + buf->offset);
 847
 848	data[0] = cpu_to_le32(CCE_PACKET3(R128_CNTL_HOSTDATA_BLT, dwords + 6));
 849	data[1] = cpu_to_le32((R128_GMC_DST_PITCH_OFFSET_CNTL |
 850			       R128_GMC_BRUSH_NONE |
 851			       (blit->format << 8) |
 852			       R128_GMC_SRC_DATATYPE_COLOR |
 853			       R128_ROP3_S |
 854			       R128_DP_SRC_SOURCE_HOST_DATA |
 855			       R128_GMC_CLR_CMP_CNTL_DIS |
 856			       R128_GMC_AUX_CLIP_DIS | R128_GMC_WR_MSK_DIS));
 857
 858	data[2] = cpu_to_le32((blit->pitch << 21) | (blit->offset >> 5));
 859	data[3] = cpu_to_le32(0xffffffff);
 860	data[4] = cpu_to_le32(0xffffffff);
 861	data[5] = cpu_to_le32((blit->y << 16) | blit->x);
 862	data[6] = cpu_to_le32((blit->height << 16) | blit->width);
 863	data[7] = cpu_to_le32(dwords);
 864
 865	buf->used = (dwords + 8) * sizeof(u32);
 866
 867	r128_cce_dispatch_indirect(dev, buf, 0, buf->used);
 868
 869	/* Flush the pixel cache after the blit completes.  This ensures
 870	 * the texture data is written out to memory before rendering
 871	 * continues.
 872	 */
 873	BEGIN_RING(2);
 874
 875	OUT_RING(CCE_PACKET0(R128_PC_GUI_CTLSTAT, 0));
 876	OUT_RING(R128_PC_FLUSH_GUI);
 877
 878	ADVANCE_RING();
 879
 880	return 0;
 881}
 882
 883/* ================================================================
 884 * Tiled depth buffer management
 885 *
 886 * FIXME: These should all set the destination write mask for when we
 887 * have hardware stencil support.
 888 */
 889
 890static int r128_cce_dispatch_write_span(struct drm_device *dev,
 891					drm_r128_depth_t *depth)
 892{
 893	drm_r128_private_t *dev_priv = dev->dev_private;
 894	int count, x, y;
 895	u32 *buffer;
 896	u8 *mask;
 897	int i, buffer_size, mask_size;
 898	RING_LOCALS;
 899	DRM_DEBUG("\n");
 900
 901	count = depth->n;
 902	if (count > 4096 || count <= 0)
 903		return -EMSGSIZE;
 904
 905	if (copy_from_user(&x, depth->x, sizeof(x)))
 906		return -EFAULT;
 907	if (copy_from_user(&y, depth->y, sizeof(y)))
 908		return -EFAULT;
 909
 910	buffer_size = depth->n * sizeof(u32);
 911	buffer = memdup_user(depth->buffer, buffer_size);
 912	if (IS_ERR(buffer))
 913		return PTR_ERR(buffer);
 914
 915	mask_size = depth->n;
 916	if (depth->mask) {
 917		mask = memdup_user(depth->mask, mask_size);
 918		if (IS_ERR(mask)) {
 919			kfree(buffer);
 920			return PTR_ERR(mask);
 921		}
 922
 923		for (i = 0; i < count; i++, x++) {
 924			if (mask[i]) {
 925				BEGIN_RING(6);
 926
 927				OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
 928				OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
 929					 R128_GMC_BRUSH_SOLID_COLOR |
 930					 (dev_priv->depth_fmt << 8) |
 931					 R128_GMC_SRC_DATATYPE_COLOR |
 932					 R128_ROP3_P |
 933					 R128_GMC_CLR_CMP_CNTL_DIS |
 934					 R128_GMC_WR_MSK_DIS);
 935
 936				OUT_RING(dev_priv->depth_pitch_offset_c);
 937				OUT_RING(buffer[i]);
 938
 939				OUT_RING((x << 16) | y);
 940				OUT_RING((1 << 16) | 1);
 941
 942				ADVANCE_RING();
 943			}
 944		}
 945
 946		kfree(mask);
 947	} else {
 948		for (i = 0; i < count; i++, x++) {
 949			BEGIN_RING(6);
 950
 951			OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
 952			OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
 953				 R128_GMC_BRUSH_SOLID_COLOR |
 954				 (dev_priv->depth_fmt << 8) |
 955				 R128_GMC_SRC_DATATYPE_COLOR |
 956				 R128_ROP3_P |
 957				 R128_GMC_CLR_CMP_CNTL_DIS |
 958				 R128_GMC_WR_MSK_DIS);
 959
 960			OUT_RING(dev_priv->depth_pitch_offset_c);
 961			OUT_RING(buffer[i]);
 962
 963			OUT_RING((x << 16) | y);
 964			OUT_RING((1 << 16) | 1);
 965
 966			ADVANCE_RING();
 967		}
 968	}
 969
 970	kfree(buffer);
 971
 972	return 0;
 973}
 974
 975static int r128_cce_dispatch_write_pixels(struct drm_device *dev,
 976					  drm_r128_depth_t *depth)
 977{
 978	drm_r128_private_t *dev_priv = dev->dev_private;
 979	int count, *x, *y;
 980	u32 *buffer;
 981	u8 *mask;
 982	int i, xbuf_size, ybuf_size, buffer_size, mask_size;
 983	RING_LOCALS;
 984	DRM_DEBUG("\n");
 985
 986	count = depth->n;
 987	if (count > 4096 || count <= 0)
 988		return -EMSGSIZE;
 989
 990	xbuf_size = count * sizeof(*x);
 991	ybuf_size = count * sizeof(*y);
 992	x = memdup_user(depth->x, xbuf_size);
 993	if (IS_ERR(x))
 994		return PTR_ERR(x);
 995	y = memdup_user(depth->y, ybuf_size);
 996	if (IS_ERR(y)) {
 997		kfree(x);
 998		return PTR_ERR(y);
 999	}
 
 
 
 
 
 
 
 
 
 
 
1000	buffer_size = depth->n * sizeof(u32);
1001	buffer = memdup_user(depth->buffer, buffer_size);
1002	if (IS_ERR(buffer)) {
1003		kfree(x);
1004		kfree(y);
1005		return PTR_ERR(buffer);
1006	}
1007
1008	if (depth->mask) {
1009		mask_size = depth->n;
1010		mask = memdup_user(depth->mask, mask_size);
1011		if (IS_ERR(mask)) {
1012			kfree(x);
1013			kfree(y);
1014			kfree(buffer);
1015			return PTR_ERR(mask);
1016		}
1017
1018		for (i = 0; i < count; i++) {
1019			if (mask[i]) {
1020				BEGIN_RING(6);
1021
1022				OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
1023				OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
1024					 R128_GMC_BRUSH_SOLID_COLOR |
1025					 (dev_priv->depth_fmt << 8) |
1026					 R128_GMC_SRC_DATATYPE_COLOR |
1027					 R128_ROP3_P |
1028					 R128_GMC_CLR_CMP_CNTL_DIS |
1029					 R128_GMC_WR_MSK_DIS);
1030
1031				OUT_RING(dev_priv->depth_pitch_offset_c);
1032				OUT_RING(buffer[i]);
1033
1034				OUT_RING((x[i] << 16) | y[i]);
1035				OUT_RING((1 << 16) | 1);
1036
1037				ADVANCE_RING();
1038			}
1039		}
1040
1041		kfree(mask);
1042	} else {
1043		for (i = 0; i < count; i++) {
1044			BEGIN_RING(6);
1045
1046			OUT_RING(CCE_PACKET3(R128_CNTL_PAINT_MULTI, 4));
1047			OUT_RING(R128_GMC_DST_PITCH_OFFSET_CNTL |
1048				 R128_GMC_BRUSH_SOLID_COLOR |
1049				 (dev_priv->depth_fmt << 8) |
1050				 R128_GMC_SRC_DATATYPE_COLOR |
1051				 R128_ROP3_P |
1052				 R128_GMC_CLR_CMP_CNTL_DIS |
1053				 R128_GMC_WR_MSK_DIS);
1054
1055			OUT_RING(dev_priv->depth_pitch_offset_c);
1056			OUT_RING(buffer[i]);
1057
1058			OUT_RING((x[i] << 16) | y[i]);
1059			OUT_RING((1 << 16) | 1);
1060
1061			ADVANCE_RING();
1062		}
1063	}
1064
1065	kfree(x);
1066	kfree(y);
1067	kfree(buffer);
1068
1069	return 0;
1070}
1071
1072static int r128_cce_dispatch_read_span(struct drm_device *dev,
1073				       drm_r128_depth_t *depth)
1074{
1075	drm_r128_private_t *dev_priv = dev->dev_private;
1076	int count, x, y;
1077	RING_LOCALS;
1078	DRM_DEBUG("\n");
1079
1080	count = depth->n;
1081	if (count > 4096 || count <= 0)
1082		return -EMSGSIZE;
1083
1084	if (copy_from_user(&x, depth->x, sizeof(x)))
1085		return -EFAULT;
1086	if (copy_from_user(&y, depth->y, sizeof(y)))
1087		return -EFAULT;
1088
1089	BEGIN_RING(7);
1090
1091	OUT_RING(CCE_PACKET3(R128_CNTL_BITBLT_MULTI, 5));
1092	OUT_RING(R128_GMC_SRC_PITCH_OFFSET_CNTL |
1093		 R128_GMC_DST_PITCH_OFFSET_CNTL |
1094		 R128_GMC_BRUSH_NONE |
1095		 (dev_priv->depth_fmt << 8) |
1096		 R128_GMC_SRC_DATATYPE_COLOR |
1097		 R128_ROP3_S |
1098		 R128_DP_SRC_SOURCE_MEMORY |
1099		 R128_GMC_CLR_CMP_CNTL_DIS | R128_GMC_WR_MSK_DIS);
1100
1101	OUT_RING(dev_priv->depth_pitch_offset_c);
1102	OUT_RING(dev_priv->span_pitch_offset_c);
1103
1104	OUT_RING((x << 16) | y);
1105	OUT_RING((0 << 16) | 0);
1106	OUT_RING((count << 16) | 1);
1107
1108	ADVANCE_RING();
1109
1110	return 0;
1111}
1112
1113static int r128_cce_dispatch_read_pixels(struct drm_device *dev,
1114					 drm_r128_depth_t *depth)
1115{
1116	drm_r128_private_t *dev_priv = dev->dev_private;
1117	int count, *x, *y;
1118	int i, xbuf_size, ybuf_size;
1119	RING_LOCALS;
1120	DRM_DEBUG("\n");
1121
1122	count = depth->n;
1123	if (count > 4096 || count <= 0)
1124		return -EMSGSIZE;
1125
1126	if (count > dev_priv->depth_pitch)
1127		count = dev_priv->depth_pitch;
1128
1129	xbuf_size = count * sizeof(*x);
1130	ybuf_size = count * sizeof(*y);
1131	x = kmalloc(xbuf_size, GFP_KERNEL);
1132	if (x == NULL)
1133		return -ENOMEM;
1134	y = kmalloc(ybuf_size, GFP_KERNEL);
1135	if (y == NULL) {
1136		kfree(x);
1137		return -ENOMEM;
1138	}
1139	if (copy_from_user(x, depth->x, xbuf_size)) {
1140		kfree(x);
1141		kfree(y);
1142		return -EFAULT;
1143	}
1144	if (copy_from_user(y, depth->y, ybuf_size)) {
1145		kfree(x);
1146		kfree(y);
1147		return -EFAULT;
1148	}
1149
1150	for (i = 0; i < count; i++) {
1151		BEGIN_RING(7);
1152
1153		OUT_RING(CCE_PACKET3(R128_CNTL_BITBLT_MULTI, 5));
1154		OUT_RING(R128_GMC_SRC_PITCH_OFFSET_CNTL |
1155			 R128_GMC_DST_PITCH_OFFSET_CNTL |
1156			 R128_GMC_BRUSH_NONE |
1157			 (dev_priv->depth_fmt << 8) |
1158			 R128_GMC_SRC_DATATYPE_COLOR |
1159			 R128_ROP3_S |
1160			 R128_DP_SRC_SOURCE_MEMORY |
1161			 R128_GMC_CLR_CMP_CNTL_DIS | R128_GMC_WR_MSK_DIS);
1162
1163		OUT_RING(dev_priv->depth_pitch_offset_c);
1164		OUT_RING(dev_priv->span_pitch_offset_c);
1165
1166		OUT_RING((x[i] << 16) | y[i]);
1167		OUT_RING((i << 16) | 0);
1168		OUT_RING((1 << 16) | 1);
1169
1170		ADVANCE_RING();
1171	}
1172
1173	kfree(x);
1174	kfree(y);
1175
1176	return 0;
1177}
1178
1179/* ================================================================
1180 * Polygon stipple
1181 */
1182
1183static void r128_cce_dispatch_stipple(struct drm_device *dev, u32 *stipple)
1184{
1185	drm_r128_private_t *dev_priv = dev->dev_private;
1186	int i;
1187	RING_LOCALS;
1188	DRM_DEBUG("\n");
1189
1190	BEGIN_RING(33);
1191
1192	OUT_RING(CCE_PACKET0(R128_BRUSH_DATA0, 31));
1193	for (i = 0; i < 32; i++)
1194		OUT_RING(stipple[i]);
1195
1196	ADVANCE_RING();
1197}
1198
1199/* ================================================================
1200 * IOCTL functions
1201 */
1202
1203static int r128_cce_clear(struct drm_device *dev, void *data, struct drm_file *file_priv)
1204{
1205	drm_r128_private_t *dev_priv = dev->dev_private;
1206	drm_r128_sarea_t *sarea_priv;
1207	drm_r128_clear_t *clear = data;
1208	DRM_DEBUG("\n");
1209
1210	LOCK_TEST_WITH_RETURN(dev, file_priv);
1211
1212	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1213
1214	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1215
1216	sarea_priv = dev_priv->sarea_priv;
1217
1218	if (sarea_priv->nbox > R128_NR_SAREA_CLIPRECTS)
1219		sarea_priv->nbox = R128_NR_SAREA_CLIPRECTS;
1220
1221	r128_cce_dispatch_clear(dev, clear);
1222	COMMIT_RING();
1223
1224	/* Make sure we restore the 3D state next time.
1225	 */
1226	dev_priv->sarea_priv->dirty |= R128_UPLOAD_CONTEXT | R128_UPLOAD_MASKS;
1227
1228	return 0;
1229}
1230
1231static int r128_do_init_pageflip(struct drm_device *dev)
1232{
1233	drm_r128_private_t *dev_priv = dev->dev_private;
1234	DRM_DEBUG("\n");
1235
1236	dev_priv->crtc_offset = R128_READ(R128_CRTC_OFFSET);
1237	dev_priv->crtc_offset_cntl = R128_READ(R128_CRTC_OFFSET_CNTL);
1238
1239	R128_WRITE(R128_CRTC_OFFSET, dev_priv->front_offset);
1240	R128_WRITE(R128_CRTC_OFFSET_CNTL,
1241		   dev_priv->crtc_offset_cntl | R128_CRTC_OFFSET_FLIP_CNTL);
1242
1243	dev_priv->page_flipping = 1;
1244	dev_priv->current_page = 0;
1245	dev_priv->sarea_priv->pfCurrentPage = dev_priv->current_page;
1246
1247	return 0;
1248}
1249
1250static int r128_do_cleanup_pageflip(struct drm_device *dev)
1251{
1252	drm_r128_private_t *dev_priv = dev->dev_private;
1253	DRM_DEBUG("\n");
1254
1255	R128_WRITE(R128_CRTC_OFFSET, dev_priv->crtc_offset);
1256	R128_WRITE(R128_CRTC_OFFSET_CNTL, dev_priv->crtc_offset_cntl);
1257
1258	if (dev_priv->current_page != 0) {
1259		r128_cce_dispatch_flip(dev);
1260		COMMIT_RING();
1261	}
1262
1263	dev_priv->page_flipping = 0;
1264	return 0;
1265}
1266
1267/* Swapping and flipping are different operations, need different ioctls.
1268 * They can & should be intermixed to support multiple 3d windows.
1269 */
1270
1271static int r128_cce_flip(struct drm_device *dev, void *data, struct drm_file *file_priv)
1272{
1273	drm_r128_private_t *dev_priv = dev->dev_private;
1274	DRM_DEBUG("\n");
1275
1276	LOCK_TEST_WITH_RETURN(dev, file_priv);
1277
1278	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1279
1280	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1281
1282	if (!dev_priv->page_flipping)
1283		r128_do_init_pageflip(dev);
1284
1285	r128_cce_dispatch_flip(dev);
1286
1287	COMMIT_RING();
1288	return 0;
1289}
1290
1291static int r128_cce_swap(struct drm_device *dev, void *data, struct drm_file *file_priv)
1292{
1293	drm_r128_private_t *dev_priv = dev->dev_private;
1294	drm_r128_sarea_t *sarea_priv = dev_priv->sarea_priv;
1295	DRM_DEBUG("\n");
1296
1297	LOCK_TEST_WITH_RETURN(dev, file_priv);
1298
1299	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1300
1301	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1302
1303	if (sarea_priv->nbox > R128_NR_SAREA_CLIPRECTS)
1304		sarea_priv->nbox = R128_NR_SAREA_CLIPRECTS;
1305
1306	r128_cce_dispatch_swap(dev);
1307	dev_priv->sarea_priv->dirty |= (R128_UPLOAD_CONTEXT |
1308					R128_UPLOAD_MASKS);
1309
1310	COMMIT_RING();
1311	return 0;
1312}
1313
1314static int r128_cce_vertex(struct drm_device *dev, void *data, struct drm_file *file_priv)
1315{
1316	drm_r128_private_t *dev_priv = dev->dev_private;
1317	struct drm_device_dma *dma = dev->dma;
1318	struct drm_buf *buf;
1319	drm_r128_buf_priv_t *buf_priv;
1320	drm_r128_vertex_t *vertex = data;
1321
1322	LOCK_TEST_WITH_RETURN(dev, file_priv);
1323
1324	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1325
1326	DRM_DEBUG("pid=%d index=%d count=%d discard=%d\n",
1327		  task_pid_nr(current), vertex->idx, vertex->count, vertex->discard);
1328
1329	if (vertex->idx < 0 || vertex->idx >= dma->buf_count) {
1330		DRM_ERROR("buffer index %d (of %d max)\n",
1331			  vertex->idx, dma->buf_count - 1);
1332		return -EINVAL;
1333	}
1334	if (vertex->prim < 0 ||
1335	    vertex->prim > R128_CCE_VC_CNTL_PRIM_TYPE_TRI_TYPE2) {
1336		DRM_ERROR("buffer prim %d\n", vertex->prim);
1337		return -EINVAL;
1338	}
1339
1340	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1341	VB_AGE_TEST_WITH_RETURN(dev_priv);
1342
1343	buf = dma->buflist[vertex->idx];
1344	buf_priv = buf->dev_private;
1345
1346	if (buf->file_priv != file_priv) {
1347		DRM_ERROR("process %d using buffer owned by %p\n",
1348			  task_pid_nr(current), buf->file_priv);
1349		return -EINVAL;
1350	}
1351	if (buf->pending) {
1352		DRM_ERROR("sending pending buffer %d\n", vertex->idx);
1353		return -EINVAL;
1354	}
1355
1356	buf->used = vertex->count;
1357	buf_priv->prim = vertex->prim;
1358	buf_priv->discard = vertex->discard;
1359
1360	r128_cce_dispatch_vertex(dev, buf);
1361
1362	COMMIT_RING();
1363	return 0;
1364}
1365
1366static int r128_cce_indices(struct drm_device *dev, void *data, struct drm_file *file_priv)
1367{
1368	drm_r128_private_t *dev_priv = dev->dev_private;
1369	struct drm_device_dma *dma = dev->dma;
1370	struct drm_buf *buf;
1371	drm_r128_buf_priv_t *buf_priv;
1372	drm_r128_indices_t *elts = data;
1373	int count;
1374
1375	LOCK_TEST_WITH_RETURN(dev, file_priv);
1376
1377	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1378
1379	DRM_DEBUG("pid=%d buf=%d s=%d e=%d d=%d\n", task_pid_nr(current),
1380		  elts->idx, elts->start, elts->end, elts->discard);
1381
1382	if (elts->idx < 0 || elts->idx >= dma->buf_count) {
1383		DRM_ERROR("buffer index %d (of %d max)\n",
1384			  elts->idx, dma->buf_count - 1);
1385		return -EINVAL;
1386	}
1387	if (elts->prim < 0 ||
1388	    elts->prim > R128_CCE_VC_CNTL_PRIM_TYPE_TRI_TYPE2) {
1389		DRM_ERROR("buffer prim %d\n", elts->prim);
1390		return -EINVAL;
1391	}
1392
1393	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1394	VB_AGE_TEST_WITH_RETURN(dev_priv);
1395
1396	buf = dma->buflist[elts->idx];
1397	buf_priv = buf->dev_private;
1398
1399	if (buf->file_priv != file_priv) {
1400		DRM_ERROR("process %d using buffer owned by %p\n",
1401			  task_pid_nr(current), buf->file_priv);
1402		return -EINVAL;
1403	}
1404	if (buf->pending) {
1405		DRM_ERROR("sending pending buffer %d\n", elts->idx);
1406		return -EINVAL;
1407	}
1408
1409	count = (elts->end - elts->start) / sizeof(u16);
1410	elts->start -= R128_INDEX_PRIM_OFFSET;
1411
1412	if (elts->start & 0x7) {
1413		DRM_ERROR("misaligned buffer 0x%x\n", elts->start);
1414		return -EINVAL;
1415	}
1416	if (elts->start < buf->used) {
1417		DRM_ERROR("no header 0x%x - 0x%x\n", elts->start, buf->used);
1418		return -EINVAL;
1419	}
1420
1421	buf->used = elts->end;
1422	buf_priv->prim = elts->prim;
1423	buf_priv->discard = elts->discard;
1424
1425	r128_cce_dispatch_indices(dev, buf, elts->start, elts->end, count);
1426
1427	COMMIT_RING();
1428	return 0;
1429}
1430
1431static int r128_cce_blit(struct drm_device *dev, void *data, struct drm_file *file_priv)
1432{
1433	struct drm_device_dma *dma = dev->dma;
1434	drm_r128_private_t *dev_priv = dev->dev_private;
1435	drm_r128_blit_t *blit = data;
1436	int ret;
1437
1438	LOCK_TEST_WITH_RETURN(dev, file_priv);
1439
1440	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1441
1442	DRM_DEBUG("pid=%d index=%d\n", task_pid_nr(current), blit->idx);
1443
1444	if (blit->idx < 0 || blit->idx >= dma->buf_count) {
1445		DRM_ERROR("buffer index %d (of %d max)\n",
1446			  blit->idx, dma->buf_count - 1);
1447		return -EINVAL;
1448	}
1449
1450	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1451	VB_AGE_TEST_WITH_RETURN(dev_priv);
1452
1453	ret = r128_cce_dispatch_blit(dev, file_priv, blit);
1454
1455	COMMIT_RING();
1456	return ret;
1457}
1458
1459int r128_cce_depth(struct drm_device *dev, void *data, struct drm_file *file_priv)
1460{
1461	drm_r128_private_t *dev_priv = dev->dev_private;
1462	drm_r128_depth_t *depth = data;
1463	int ret;
1464
1465	LOCK_TEST_WITH_RETURN(dev, file_priv);
1466
1467	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1468
1469	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1470
1471	ret = -EINVAL;
1472	switch (depth->func) {
1473	case R128_WRITE_SPAN:
1474		ret = r128_cce_dispatch_write_span(dev, depth);
1475		break;
1476	case R128_WRITE_PIXELS:
1477		ret = r128_cce_dispatch_write_pixels(dev, depth);
1478		break;
1479	case R128_READ_SPAN:
1480		ret = r128_cce_dispatch_read_span(dev, depth);
1481		break;
1482	case R128_READ_PIXELS:
1483		ret = r128_cce_dispatch_read_pixels(dev, depth);
1484		break;
1485	}
1486
1487	COMMIT_RING();
1488	return ret;
1489}
1490
1491int r128_cce_stipple(struct drm_device *dev, void *data, struct drm_file *file_priv)
1492{
1493	drm_r128_private_t *dev_priv = dev->dev_private;
1494	drm_r128_stipple_t *stipple = data;
1495	u32 mask[32];
1496
1497	LOCK_TEST_WITH_RETURN(dev, file_priv);
1498
1499	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1500
1501	if (copy_from_user(&mask, stipple->mask, 32 * sizeof(u32)))
1502		return -EFAULT;
1503
1504	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1505
1506	r128_cce_dispatch_stipple(dev, mask);
1507
1508	COMMIT_RING();
1509	return 0;
1510}
1511
1512static int r128_cce_indirect(struct drm_device *dev, void *data, struct drm_file *file_priv)
1513{
1514	drm_r128_private_t *dev_priv = dev->dev_private;
1515	struct drm_device_dma *dma = dev->dma;
1516	struct drm_buf *buf;
1517	drm_r128_buf_priv_t *buf_priv;
1518	drm_r128_indirect_t *indirect = data;
1519#if 0
1520	RING_LOCALS;
1521#endif
1522
1523	LOCK_TEST_WITH_RETURN(dev, file_priv);
1524
1525	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1526
1527	DRM_DEBUG("idx=%d s=%d e=%d d=%d\n",
1528		  indirect->idx, indirect->start, indirect->end,
1529		  indirect->discard);
1530
1531	if (indirect->idx < 0 || indirect->idx >= dma->buf_count) {
1532		DRM_ERROR("buffer index %d (of %d max)\n",
1533			  indirect->idx, dma->buf_count - 1);
1534		return -EINVAL;
1535	}
1536
1537	buf = dma->buflist[indirect->idx];
1538	buf_priv = buf->dev_private;
1539
1540	if (buf->file_priv != file_priv) {
1541		DRM_ERROR("process %d using buffer owned by %p\n",
1542			  task_pid_nr(current), buf->file_priv);
1543		return -EINVAL;
1544	}
1545	if (buf->pending) {
1546		DRM_ERROR("sending pending buffer %d\n", indirect->idx);
1547		return -EINVAL;
1548	}
1549
1550	if (indirect->start < buf->used) {
1551		DRM_ERROR("reusing indirect: start=0x%x actual=0x%x\n",
1552			  indirect->start, buf->used);
1553		return -EINVAL;
1554	}
1555
1556	RING_SPACE_TEST_WITH_RETURN(dev_priv);
1557	VB_AGE_TEST_WITH_RETURN(dev_priv);
1558
1559	buf->used = indirect->end;
1560	buf_priv->discard = indirect->discard;
1561
1562#if 0
1563	/* Wait for the 3D stream to idle before the indirect buffer
1564	 * containing 2D acceleration commands is processed.
1565	 */
1566	BEGIN_RING(2);
1567	RADEON_WAIT_UNTIL_3D_IDLE();
1568	ADVANCE_RING();
1569#endif
1570
1571	/* Dispatch the indirect buffer full of commands from the
1572	 * X server.  This is insecure and is thus only available to
1573	 * privileged clients.
1574	 */
1575	r128_cce_dispatch_indirect(dev, buf, indirect->start, indirect->end);
1576
1577	COMMIT_RING();
1578	return 0;
1579}
1580
1581int r128_getparam(struct drm_device *dev, void *data, struct drm_file *file_priv)
1582{
1583	drm_r128_private_t *dev_priv = dev->dev_private;
1584	drm_r128_getparam_t *param = data;
1585	int value;
1586
1587	DEV_INIT_TEST_WITH_RETURN(dev_priv);
1588
1589	DRM_DEBUG("pid=%d\n", task_pid_nr(current));
1590
1591	switch (param->param) {
1592	case R128_PARAM_IRQ_NR:
1593		value = dev->pdev->irq;
1594		break;
1595	default:
1596		return -EINVAL;
1597	}
1598
1599	if (copy_to_user(param->value, &value, sizeof(int))) {
1600		DRM_ERROR("copy_to_user\n");
1601		return -EFAULT;
1602	}
1603
1604	return 0;
1605}
1606
1607void r128_driver_preclose(struct drm_device *dev, struct drm_file *file_priv)
1608{
1609	if (dev->dev_private) {
1610		drm_r128_private_t *dev_priv = dev->dev_private;
1611		if (dev_priv->page_flipping)
1612			r128_do_cleanup_pageflip(dev);
1613	}
1614}
1615void r128_driver_lastclose(struct drm_device *dev)
1616{
1617	r128_do_cleanup_cce(dev);
1618}
1619
1620const struct drm_ioctl_desc r128_ioctls[] = {
1621	DRM_IOCTL_DEF_DRV(R128_INIT, r128_cce_init, DRM_AUTH|DRM_MASTER|DRM_ROOT_ONLY),
1622	DRM_IOCTL_DEF_DRV(R128_CCE_START, r128_cce_start, DRM_AUTH|DRM_MASTER|DRM_ROOT_ONLY),
1623	DRM_IOCTL_DEF_DRV(R128_CCE_STOP, r128_cce_stop, DRM_AUTH|DRM_MASTER|DRM_ROOT_ONLY),
1624	DRM_IOCTL_DEF_DRV(R128_CCE_RESET, r128_cce_reset, DRM_AUTH|DRM_MASTER|DRM_ROOT_ONLY),
1625	DRM_IOCTL_DEF_DRV(R128_CCE_IDLE, r128_cce_idle, DRM_AUTH),
1626	DRM_IOCTL_DEF_DRV(R128_RESET, r128_engine_reset, DRM_AUTH),
1627	DRM_IOCTL_DEF_DRV(R128_FULLSCREEN, r128_fullscreen, DRM_AUTH),
1628	DRM_IOCTL_DEF_DRV(R128_SWAP, r128_cce_swap, DRM_AUTH),
1629	DRM_IOCTL_DEF_DRV(R128_FLIP, r128_cce_flip, DRM_AUTH),
1630	DRM_IOCTL_DEF_DRV(R128_CLEAR, r128_cce_clear, DRM_AUTH),
1631	DRM_IOCTL_DEF_DRV(R128_VERTEX, r128_cce_vertex, DRM_AUTH),
1632	DRM_IOCTL_DEF_DRV(R128_INDICES, r128_cce_indices, DRM_AUTH),
1633	DRM_IOCTL_DEF_DRV(R128_BLIT, r128_cce_blit, DRM_AUTH),
1634	DRM_IOCTL_DEF_DRV(R128_DEPTH, r128_cce_depth, DRM_AUTH),
1635	DRM_IOCTL_DEF_DRV(R128_STIPPLE, r128_cce_stipple, DRM_AUTH),
1636	DRM_IOCTL_DEF_DRV(R128_INDIRECT, r128_cce_indirect, DRM_AUTH|DRM_MASTER|DRM_ROOT_ONLY),
1637	DRM_IOCTL_DEF_DRV(R128_GETPARAM, r128_getparam, DRM_AUTH),
1638};
1639
1640int r128_max_ioctl = ARRAY_SIZE(r128_ioctls);