Linux Audio

Check our new training course

Loading...
v5.9
  1/* r128_cce.c -- ATI Rage 128 driver -*- linux-c -*-
  2 * Created: Wed Apr  5 19:24:19 2000 by kevin@precisioninsight.com
  3 */
  4/*
  5 * Copyright 2000 Precision Insight, Inc., Cedar Park, Texas.
  6 * Copyright 2000 VA Linux Systems, Inc., Sunnyvale, California.
  7 * All Rights Reserved.
  8 *
  9 * Permission is hereby granted, free of charge, to any person obtaining a
 10 * copy of this software and associated documentation files (the "Software"),
 11 * to deal in the Software without restriction, including without limitation
 12 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 13 * and/or sell copies of the Software, and to permit persons to whom the
 14 * Software is furnished to do so, subject to the following conditions:
 15 *
 16 * The above copyright notice and this permission notice (including the next
 17 * paragraph) shall be included in all copies or substantial portions of the
 18 * Software.
 19 *
 20 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 21 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 22 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 23 * PRECISION INSIGHT AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
 24 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 25 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
 26 * DEALINGS IN THE SOFTWARE.
 27 *
 28 * Authors:
 29 *    Gareth Hughes <gareth@valinux.com>
 30 */
 31
 32#include <linux/delay.h>
 33#include <linux/dma-mapping.h>
 34#include <linux/firmware.h>
 35#include <linux/module.h>
 36#include <linux/platform_device.h>
 37#include <linux/slab.h>
 38#include <linux/uaccess.h>
 39
 40#include <drm/drm_agpsupport.h>
 41#include <drm/drm_device.h>
 42#include <drm/drm_file.h>
 43#include <drm/drm_irq.h>
 44#include <drm/drm_print.h>
 45#include <drm/r128_drm.h>
 46
 47#include "r128_drv.h"
 48
 49#define R128_FIFO_DEBUG		0
 50
 51#define FIRMWARE_NAME		"r128/r128_cce.bin"
 52
 53MODULE_FIRMWARE(FIRMWARE_NAME);
 54
 55static int R128_READ_PLL(struct drm_device *dev, int addr)
 56{
 57	drm_r128_private_t *dev_priv = dev->dev_private;
 58
 59	R128_WRITE8(R128_CLOCK_CNTL_INDEX, addr & 0x1f);
 60	return R128_READ(R128_CLOCK_CNTL_DATA);
 61}
 62
 63#if R128_FIFO_DEBUG
 64static void r128_status(drm_r128_private_t *dev_priv)
 65{
 66	printk("GUI_STAT           = 0x%08x\n",
 67	       (unsigned int)R128_READ(R128_GUI_STAT));
 68	printk("PM4_STAT           = 0x%08x\n",
 69	       (unsigned int)R128_READ(R128_PM4_STAT));
 70	printk("PM4_BUFFER_DL_WPTR = 0x%08x\n",
 71	       (unsigned int)R128_READ(R128_PM4_BUFFER_DL_WPTR));
 72	printk("PM4_BUFFER_DL_RPTR = 0x%08x\n",
 73	       (unsigned int)R128_READ(R128_PM4_BUFFER_DL_RPTR));
 74	printk("PM4_MICRO_CNTL     = 0x%08x\n",
 75	       (unsigned int)R128_READ(R128_PM4_MICRO_CNTL));
 76	printk("PM4_BUFFER_CNTL    = 0x%08x\n",
 77	       (unsigned int)R128_READ(R128_PM4_BUFFER_CNTL));
 78}
 79#endif
 80
 81/* ================================================================
 82 * Engine, FIFO control
 83 */
 84
 85static int r128_do_pixcache_flush(drm_r128_private_t *dev_priv)
 86{
 87	u32 tmp;
 88	int i;
 89
 90	tmp = R128_READ(R128_PC_NGUI_CTLSTAT) | R128_PC_FLUSH_ALL;
 91	R128_WRITE(R128_PC_NGUI_CTLSTAT, tmp);
 92
 93	for (i = 0; i < dev_priv->usec_timeout; i++) {
 94		if (!(R128_READ(R128_PC_NGUI_CTLSTAT) & R128_PC_BUSY))
 95			return 0;
 96		udelay(1);
 97	}
 98
 99#if R128_FIFO_DEBUG
100	DRM_ERROR("failed!\n");
101#endif
102	return -EBUSY;
103}
104
105static int r128_do_wait_for_fifo(drm_r128_private_t *dev_priv, int entries)
106{
107	int i;
108
109	for (i = 0; i < dev_priv->usec_timeout; i++) {
110		int slots = R128_READ(R128_GUI_STAT) & R128_GUI_FIFOCNT_MASK;
111		if (slots >= entries)
112			return 0;
113		udelay(1);
114	}
115
116#if R128_FIFO_DEBUG
117	DRM_ERROR("failed!\n");
118#endif
119	return -EBUSY;
120}
121
122static int r128_do_wait_for_idle(drm_r128_private_t *dev_priv)
123{
124	int i, ret;
125
126	ret = r128_do_wait_for_fifo(dev_priv, 64);
127	if (ret)
128		return ret;
129
130	for (i = 0; i < dev_priv->usec_timeout; i++) {
131		if (!(R128_READ(R128_GUI_STAT) & R128_GUI_ACTIVE)) {
132			r128_do_pixcache_flush(dev_priv);
133			return 0;
134		}
135		udelay(1);
136	}
137
138#if R128_FIFO_DEBUG
139	DRM_ERROR("failed!\n");
140#endif
141	return -EBUSY;
142}
143
144/* ================================================================
145 * CCE control, initialization
146 */
147
148/* Load the microcode for the CCE */
149static int r128_cce_load_microcode(drm_r128_private_t *dev_priv)
150{
151	struct platform_device *pdev;
152	const struct firmware *fw;
153	const __be32 *fw_data;
154	int rc, i;
155
156	DRM_DEBUG("\n");
157
158	pdev = platform_device_register_simple("r128_cce", 0, NULL, 0);
159	if (IS_ERR(pdev)) {
160		pr_err("r128_cce: Failed to register firmware\n");
161		return PTR_ERR(pdev);
162	}
163	rc = request_firmware(&fw, FIRMWARE_NAME, &pdev->dev);
164	platform_device_unregister(pdev);
165	if (rc) {
166		pr_err("r128_cce: Failed to load firmware \"%s\"\n",
167		       FIRMWARE_NAME);
168		return rc;
169	}
170
171	if (fw->size != 256 * 8) {
172		pr_err("r128_cce: Bogus length %zu in firmware \"%s\"\n",
173		       fw->size, FIRMWARE_NAME);
174		rc = -EINVAL;
175		goto out_release;
176	}
177
178	r128_do_wait_for_idle(dev_priv);
179
180	fw_data = (const __be32 *)fw->data;
181	R128_WRITE(R128_PM4_MICROCODE_ADDR, 0);
182	for (i = 0; i < 256; i++) {
183		R128_WRITE(R128_PM4_MICROCODE_DATAH,
184			   be32_to_cpup(&fw_data[i * 2]));
185		R128_WRITE(R128_PM4_MICROCODE_DATAL,
186			   be32_to_cpup(&fw_data[i * 2 + 1]));
187	}
188
189out_release:
190	release_firmware(fw);
191	return rc;
192}
193
194/* Flush any pending commands to the CCE.  This should only be used just
195 * prior to a wait for idle, as it informs the engine that the command
196 * stream is ending.
197 */
198static void r128_do_cce_flush(drm_r128_private_t *dev_priv)
199{
200	u32 tmp;
201
202	tmp = R128_READ(R128_PM4_BUFFER_DL_WPTR) | R128_PM4_BUFFER_DL_DONE;
203	R128_WRITE(R128_PM4_BUFFER_DL_WPTR, tmp);
204}
205
206/* Wait for the CCE to go idle.
207 */
208int r128_do_cce_idle(drm_r128_private_t *dev_priv)
209{
210	int i;
211
212	for (i = 0; i < dev_priv->usec_timeout; i++) {
213		if (GET_RING_HEAD(dev_priv) == dev_priv->ring.tail) {
214			int pm4stat = R128_READ(R128_PM4_STAT);
215			if (((pm4stat & R128_PM4_FIFOCNT_MASK) >=
216			     dev_priv->cce_fifo_size) &&
217			    !(pm4stat & (R128_PM4_BUSY |
218					 R128_PM4_GUI_ACTIVE))) {
219				return r128_do_pixcache_flush(dev_priv);
220			}
221		}
222		udelay(1);
223	}
224
225#if R128_FIFO_DEBUG
226	DRM_ERROR("failed!\n");
227	r128_status(dev_priv);
228#endif
229	return -EBUSY;
230}
231
232/* Start the Concurrent Command Engine.
233 */
234static void r128_do_cce_start(drm_r128_private_t *dev_priv)
235{
236	r128_do_wait_for_idle(dev_priv);
237
238	R128_WRITE(R128_PM4_BUFFER_CNTL,
239		   dev_priv->cce_mode | dev_priv->ring.size_l2qw
240		   | R128_PM4_BUFFER_CNTL_NOUPDATE);
241	R128_READ(R128_PM4_BUFFER_ADDR);	/* as per the sample code */
242	R128_WRITE(R128_PM4_MICRO_CNTL, R128_PM4_MICRO_FREERUN);
243
244	dev_priv->cce_running = 1;
245}
246
247/* Reset the Concurrent Command Engine.  This will not flush any pending
248 * commands, so you must wait for the CCE command stream to complete
249 * before calling this routine.
250 */
251static void r128_do_cce_reset(drm_r128_private_t *dev_priv)
252{
253	R128_WRITE(R128_PM4_BUFFER_DL_WPTR, 0);
254	R128_WRITE(R128_PM4_BUFFER_DL_RPTR, 0);
255	dev_priv->ring.tail = 0;
256}
257
258/* Stop the Concurrent Command Engine.  This will not flush any pending
259 * commands, so you must flush the command stream and wait for the CCE
260 * to go idle before calling this routine.
261 */
262static void r128_do_cce_stop(drm_r128_private_t *dev_priv)
263{
264	R128_WRITE(R128_PM4_MICRO_CNTL, 0);
265	R128_WRITE(R128_PM4_BUFFER_CNTL,
266		   R128_PM4_NONPM4 | R128_PM4_BUFFER_CNTL_NOUPDATE);
267
268	dev_priv->cce_running = 0;
269}
270
271/* Reset the engine.  This will stop the CCE if it is running.
272 */
273static int r128_do_engine_reset(struct drm_device *dev)
274{
275	drm_r128_private_t *dev_priv = dev->dev_private;
276	u32 clock_cntl_index, mclk_cntl, gen_reset_cntl;
277
278	r128_do_pixcache_flush(dev_priv);
279
280	clock_cntl_index = R128_READ(R128_CLOCK_CNTL_INDEX);
281	mclk_cntl = R128_READ_PLL(dev, R128_MCLK_CNTL);
282
283	R128_WRITE_PLL(R128_MCLK_CNTL,
284		       mclk_cntl | R128_FORCE_GCP | R128_FORCE_PIPE3D_CP);
285
286	gen_reset_cntl = R128_READ(R128_GEN_RESET_CNTL);
287
288	/* Taken from the sample code - do not change */
289	R128_WRITE(R128_GEN_RESET_CNTL, gen_reset_cntl | R128_SOFT_RESET_GUI);
290	R128_READ(R128_GEN_RESET_CNTL);
291	R128_WRITE(R128_GEN_RESET_CNTL, gen_reset_cntl & ~R128_SOFT_RESET_GUI);
292	R128_READ(R128_GEN_RESET_CNTL);
293
294	R128_WRITE_PLL(R128_MCLK_CNTL, mclk_cntl);
295	R128_WRITE(R128_CLOCK_CNTL_INDEX, clock_cntl_index);
296	R128_WRITE(R128_GEN_RESET_CNTL, gen_reset_cntl);
297
298	/* Reset the CCE ring */
299	r128_do_cce_reset(dev_priv);
300
301	/* The CCE is no longer running after an engine reset */
302	dev_priv->cce_running = 0;
303
304	/* Reset any pending vertex, indirect buffers */
305	r128_freelist_reset(dev);
306
307	return 0;
308}
309
310static void r128_cce_init_ring_buffer(struct drm_device *dev,
311				      drm_r128_private_t *dev_priv)
312{
313	u32 ring_start;
314	u32 tmp;
315
316	DRM_DEBUG("\n");
317
318	/* The manual (p. 2) says this address is in "VM space".  This
319	 * means it's an offset from the start of AGP space.
320	 */
321#if IS_ENABLED(CONFIG_AGP)
322	if (!dev_priv->is_pci)
323		ring_start = dev_priv->cce_ring->offset - dev->agp->base;
324	else
325#endif
326		ring_start = dev_priv->cce_ring->offset -
327		    (unsigned long)dev->sg->virtual;
328
329	R128_WRITE(R128_PM4_BUFFER_OFFSET, ring_start | R128_AGP_OFFSET);
330
331	R128_WRITE(R128_PM4_BUFFER_DL_WPTR, 0);
332	R128_WRITE(R128_PM4_BUFFER_DL_RPTR, 0);
333
334	/* Set watermark control */
335	R128_WRITE(R128_PM4_BUFFER_WM_CNTL,
336		   ((R128_WATERMARK_L / 4) << R128_WMA_SHIFT)
337		   | ((R128_WATERMARK_M / 4) << R128_WMB_SHIFT)
338		   | ((R128_WATERMARK_N / 4) << R128_WMC_SHIFT)
339		   | ((R128_WATERMARK_K / 64) << R128_WB_WM_SHIFT));
340
341	/* Force read.  Why?  Because it's in the examples... */
342	R128_READ(R128_PM4_BUFFER_ADDR);
343
344	/* Turn on bus mastering */
345	tmp = R128_READ(R128_BUS_CNTL) & ~R128_BUS_MASTER_DIS;
346	R128_WRITE(R128_BUS_CNTL, tmp);
347}
348
349static int r128_do_init_cce(struct drm_device *dev, drm_r128_init_t *init)
350{
351	drm_r128_private_t *dev_priv;
352	int rc;
353
354	DRM_DEBUG("\n");
355
356	if (dev->dev_private) {
357		DRM_DEBUG("called when already initialized\n");
358		return -EINVAL;
359	}
360
361	dev_priv = kzalloc(sizeof(drm_r128_private_t), GFP_KERNEL);
362	if (dev_priv == NULL)
363		return -ENOMEM;
364
365	dev_priv->is_pci = init->is_pci;
366
367	if (dev_priv->is_pci && !dev->sg) {
368		DRM_ERROR("PCI GART memory not allocated!\n");
369		dev->dev_private = (void *)dev_priv;
370		r128_do_cleanup_cce(dev);
371		return -EINVAL;
372	}
373
374	dev_priv->usec_timeout = init->usec_timeout;
375	if (dev_priv->usec_timeout < 1 ||
376	    dev_priv->usec_timeout > R128_MAX_USEC_TIMEOUT) {
377		DRM_DEBUG("TIMEOUT problem!\n");
378		dev->dev_private = (void *)dev_priv;
379		r128_do_cleanup_cce(dev);
380		return -EINVAL;
381	}
382
383	dev_priv->cce_mode = init->cce_mode;
384
385	/* GH: Simple idle check.
386	 */
387	atomic_set(&dev_priv->idle_count, 0);
388
389	/* We don't support anything other than bus-mastering ring mode,
390	 * but the ring can be in either AGP or PCI space for the ring
391	 * read pointer.
392	 */
393	if ((init->cce_mode != R128_PM4_192BM) &&
394	    (init->cce_mode != R128_PM4_128BM_64INDBM) &&
395	    (init->cce_mode != R128_PM4_64BM_128INDBM) &&
396	    (init->cce_mode != R128_PM4_64BM_64VCBM_64INDBM)) {
397		DRM_DEBUG("Bad cce_mode!\n");
398		dev->dev_private = (void *)dev_priv;
399		r128_do_cleanup_cce(dev);
400		return -EINVAL;
401	}
402
403	switch (init->cce_mode) {
404	case R128_PM4_NONPM4:
405		dev_priv->cce_fifo_size = 0;
406		break;
407	case R128_PM4_192PIO:
408	case R128_PM4_192BM:
409		dev_priv->cce_fifo_size = 192;
410		break;
411	case R128_PM4_128PIO_64INDBM:
412	case R128_PM4_128BM_64INDBM:
413		dev_priv->cce_fifo_size = 128;
414		break;
415	case R128_PM4_64PIO_128INDBM:
416	case R128_PM4_64BM_128INDBM:
417	case R128_PM4_64PIO_64VCBM_64INDBM:
418	case R128_PM4_64BM_64VCBM_64INDBM:
419	case R128_PM4_64PIO_64VCPIO_64INDPIO:
420		dev_priv->cce_fifo_size = 64;
421		break;
422	}
423
424	switch (init->fb_bpp) {
425	case 16:
426		dev_priv->color_fmt = R128_DATATYPE_RGB565;
427		break;
428	case 32:
429	default:
430		dev_priv->color_fmt = R128_DATATYPE_ARGB8888;
431		break;
432	}
433	dev_priv->front_offset = init->front_offset;
434	dev_priv->front_pitch = init->front_pitch;
435	dev_priv->back_offset = init->back_offset;
436	dev_priv->back_pitch = init->back_pitch;
437
438	switch (init->depth_bpp) {
439	case 16:
440		dev_priv->depth_fmt = R128_DATATYPE_RGB565;
441		break;
442	case 24:
443	case 32:
444	default:
445		dev_priv->depth_fmt = R128_DATATYPE_ARGB8888;
446		break;
447	}
448	dev_priv->depth_offset = init->depth_offset;
449	dev_priv->depth_pitch = init->depth_pitch;
450	dev_priv->span_offset = init->span_offset;
451
452	dev_priv->front_pitch_offset_c = (((dev_priv->front_pitch / 8) << 21) |
453					  (dev_priv->front_offset >> 5));
454	dev_priv->back_pitch_offset_c = (((dev_priv->back_pitch / 8) << 21) |
455					 (dev_priv->back_offset >> 5));
456	dev_priv->depth_pitch_offset_c = (((dev_priv->depth_pitch / 8) << 21) |
457					  (dev_priv->depth_offset >> 5) |
458					  R128_DST_TILE);
459	dev_priv->span_pitch_offset_c = (((dev_priv->depth_pitch / 8) << 21) |
460					 (dev_priv->span_offset >> 5));
461
462	dev_priv->sarea = drm_legacy_getsarea(dev);
463	if (!dev_priv->sarea) {
464		DRM_ERROR("could not find sarea!\n");
465		dev->dev_private = (void *)dev_priv;
466		r128_do_cleanup_cce(dev);
467		return -EINVAL;
468	}
469
470	dev_priv->mmio = drm_legacy_findmap(dev, init->mmio_offset);
471	if (!dev_priv->mmio) {
472		DRM_ERROR("could not find mmio region!\n");
473		dev->dev_private = (void *)dev_priv;
474		r128_do_cleanup_cce(dev);
475		return -EINVAL;
476	}
477	dev_priv->cce_ring = drm_legacy_findmap(dev, init->ring_offset);
478	if (!dev_priv->cce_ring) {
479		DRM_ERROR("could not find cce ring region!\n");
480		dev->dev_private = (void *)dev_priv;
481		r128_do_cleanup_cce(dev);
482		return -EINVAL;
483	}
484	dev_priv->ring_rptr = drm_legacy_findmap(dev, init->ring_rptr_offset);
485	if (!dev_priv->ring_rptr) {
486		DRM_ERROR("could not find ring read pointer!\n");
487		dev->dev_private = (void *)dev_priv;
488		r128_do_cleanup_cce(dev);
489		return -EINVAL;
490	}
491	dev->agp_buffer_token = init->buffers_offset;
492	dev->agp_buffer_map = drm_legacy_findmap(dev, init->buffers_offset);
493	if (!dev->agp_buffer_map) {
494		DRM_ERROR("could not find dma buffer region!\n");
495		dev->dev_private = (void *)dev_priv;
496		r128_do_cleanup_cce(dev);
497		return -EINVAL;
498	}
499
500	if (!dev_priv->is_pci) {
501		dev_priv->agp_textures =
502		    drm_legacy_findmap(dev, init->agp_textures_offset);
503		if (!dev_priv->agp_textures) {
504			DRM_ERROR("could not find agp texture region!\n");
505			dev->dev_private = (void *)dev_priv;
506			r128_do_cleanup_cce(dev);
507			return -EINVAL;
508		}
509	}
510
511	dev_priv->sarea_priv =
512	    (drm_r128_sarea_t *) ((u8 *) dev_priv->sarea->handle +
513				  init->sarea_priv_offset);
514
515#if IS_ENABLED(CONFIG_AGP)
516	if (!dev_priv->is_pci) {
517		drm_legacy_ioremap_wc(dev_priv->cce_ring, dev);
518		drm_legacy_ioremap_wc(dev_priv->ring_rptr, dev);
519		drm_legacy_ioremap_wc(dev->agp_buffer_map, dev);
520		if (!dev_priv->cce_ring->handle ||
521		    !dev_priv->ring_rptr->handle ||
522		    !dev->agp_buffer_map->handle) {
523			DRM_ERROR("Could not ioremap agp regions!\n");
524			dev->dev_private = (void *)dev_priv;
525			r128_do_cleanup_cce(dev);
526			return -ENOMEM;
527		}
528	} else
529#endif
530	{
531		dev_priv->cce_ring->handle =
532			(void *)(unsigned long)dev_priv->cce_ring->offset;
533		dev_priv->ring_rptr->handle =
534			(void *)(unsigned long)dev_priv->ring_rptr->offset;
535		dev->agp_buffer_map->handle =
536			(void *)(unsigned long)dev->agp_buffer_map->offset;
537	}
538
539#if IS_ENABLED(CONFIG_AGP)
540	if (!dev_priv->is_pci)
541		dev_priv->cce_buffers_offset = dev->agp->base;
542	else
543#endif
544		dev_priv->cce_buffers_offset = (unsigned long)dev->sg->virtual;
545
546	dev_priv->ring.start = (u32 *) dev_priv->cce_ring->handle;
547	dev_priv->ring.end = ((u32 *) dev_priv->cce_ring->handle
548			      + init->ring_size / sizeof(u32));
549	dev_priv->ring.size = init->ring_size;
550	dev_priv->ring.size_l2qw = order_base_2(init->ring_size / 8);
551
552	dev_priv->ring.tail_mask = (dev_priv->ring.size / sizeof(u32)) - 1;
553
554	dev_priv->ring.high_mark = 128;
555
556	dev_priv->sarea_priv->last_frame = 0;
557	R128_WRITE(R128_LAST_FRAME_REG, dev_priv->sarea_priv->last_frame);
558
559	dev_priv->sarea_priv->last_dispatch = 0;
560	R128_WRITE(R128_LAST_DISPATCH_REG, dev_priv->sarea_priv->last_dispatch);
561
562#if IS_ENABLED(CONFIG_AGP)
563	if (dev_priv->is_pci) {
564#endif
565		dev_priv->gart_info.table_mask = DMA_BIT_MASK(32);
566		dev_priv->gart_info.gart_table_location = DRM_ATI_GART_MAIN;
567		dev_priv->gart_info.table_size = R128_PCIGART_TABLE_SIZE;
568		dev_priv->gart_info.addr = NULL;
569		dev_priv->gart_info.bus_addr = 0;
570		dev_priv->gart_info.gart_reg_if = DRM_ATI_GART_PCI;
571		rc = drm_ati_pcigart_init(dev, &dev_priv->gart_info);
572		if (rc) {
573			DRM_ERROR("failed to init PCI GART!\n");
574			dev->dev_private = (void *)dev_priv;
575			r128_do_cleanup_cce(dev);
576			return rc;
577		}
578		R128_WRITE(R128_PCI_GART_PAGE, dev_priv->gart_info.bus_addr);
579#if IS_ENABLED(CONFIG_AGP)
580	}
581#endif
582
583	r128_cce_init_ring_buffer(dev, dev_priv);
584	rc = r128_cce_load_microcode(dev_priv);
585
586	dev->dev_private = (void *)dev_priv;
587
588	r128_do_engine_reset(dev);
589
590	if (rc) {
591		DRM_ERROR("Failed to load firmware!\n");
592		r128_do_cleanup_cce(dev);
593	}
594
595	return rc;
596}
597
598int r128_do_cleanup_cce(struct drm_device *dev)
599{
600
601	/* Make sure interrupts are disabled here because the uninstall ioctl
602	 * may not have been called from userspace and after dev_private
603	 * is freed, it's too late.
604	 */
605	if (dev->irq_enabled)
606		drm_irq_uninstall(dev);
607
608	if (dev->dev_private) {
609		drm_r128_private_t *dev_priv = dev->dev_private;
610
611#if IS_ENABLED(CONFIG_AGP)
612		if (!dev_priv->is_pci) {
613			if (dev_priv->cce_ring != NULL)
614				drm_legacy_ioremapfree(dev_priv->cce_ring, dev);
615			if (dev_priv->ring_rptr != NULL)
616				drm_legacy_ioremapfree(dev_priv->ring_rptr, dev);
617			if (dev->agp_buffer_map != NULL) {
618				drm_legacy_ioremapfree(dev->agp_buffer_map, dev);
619				dev->agp_buffer_map = NULL;
620			}
621		} else
622#endif
623		{
624			if (dev_priv->gart_info.bus_addr)
625				if (!drm_ati_pcigart_cleanup(dev,
626							&dev_priv->gart_info))
627					DRM_ERROR
628					    ("failed to cleanup PCI GART!\n");
629		}
630
631		kfree(dev->dev_private);
632		dev->dev_private = NULL;
633	}
634
635	return 0;
636}
637
638int r128_cce_init(struct drm_device *dev, void *data, struct drm_file *file_priv)
639{
640	drm_r128_init_t *init = data;
641
642	DRM_DEBUG("\n");
643
644	LOCK_TEST_WITH_RETURN(dev, file_priv);
645
646	switch (init->func) {
647	case R128_INIT_CCE:
648		return r128_do_init_cce(dev, init);
649	case R128_CLEANUP_CCE:
650		return r128_do_cleanup_cce(dev);
651	}
652
653	return -EINVAL;
654}
655
656int r128_cce_start(struct drm_device *dev, void *data, struct drm_file *file_priv)
657{
658	drm_r128_private_t *dev_priv = dev->dev_private;
659	DRM_DEBUG("\n");
660
661	LOCK_TEST_WITH_RETURN(dev, file_priv);
662
663	DEV_INIT_TEST_WITH_RETURN(dev_priv);
664
665	if (dev_priv->cce_running || dev_priv->cce_mode == R128_PM4_NONPM4) {
666		DRM_DEBUG("while CCE running\n");
667		return 0;
668	}
669
670	r128_do_cce_start(dev_priv);
671
672	return 0;
673}
674
675/* Stop the CCE.  The engine must have been idled before calling this
676 * routine.
677 */
678int r128_cce_stop(struct drm_device *dev, void *data, struct drm_file *file_priv)
679{
680	drm_r128_private_t *dev_priv = dev->dev_private;
681	drm_r128_cce_stop_t *stop = data;
682	int ret;
683	DRM_DEBUG("\n");
684
685	LOCK_TEST_WITH_RETURN(dev, file_priv);
686
687	DEV_INIT_TEST_WITH_RETURN(dev_priv);
688
689	/* Flush any pending CCE commands.  This ensures any outstanding
690	 * commands are exectuted by the engine before we turn it off.
691	 */
692	if (stop->flush)
693		r128_do_cce_flush(dev_priv);
694
695	/* If we fail to make the engine go idle, we return an error
696	 * code so that the DRM ioctl wrapper can try again.
697	 */
698	if (stop->idle) {
699		ret = r128_do_cce_idle(dev_priv);
700		if (ret)
701			return ret;
702	}
703
704	/* Finally, we can turn off the CCE.  If the engine isn't idle,
705	 * we will get some dropped triangles as they won't be fully
706	 * rendered before the CCE is shut down.
707	 */
708	r128_do_cce_stop(dev_priv);
709
710	/* Reset the engine */
711	r128_do_engine_reset(dev);
712
713	return 0;
714}
715
716/* Just reset the CCE ring.  Called as part of an X Server engine reset.
717 */
718int r128_cce_reset(struct drm_device *dev, void *data, struct drm_file *file_priv)
719{
720	drm_r128_private_t *dev_priv = dev->dev_private;
721	DRM_DEBUG("\n");
722
723	LOCK_TEST_WITH_RETURN(dev, file_priv);
724
725	DEV_INIT_TEST_WITH_RETURN(dev_priv);
726
727	r128_do_cce_reset(dev_priv);
728
729	/* The CCE is no longer running after an engine reset */
730	dev_priv->cce_running = 0;
731
732	return 0;
733}
734
735int r128_cce_idle(struct drm_device *dev, void *data, struct drm_file *file_priv)
736{
737	drm_r128_private_t *dev_priv = dev->dev_private;
738	DRM_DEBUG("\n");
739
740	LOCK_TEST_WITH_RETURN(dev, file_priv);
741
742	DEV_INIT_TEST_WITH_RETURN(dev_priv);
743
744	if (dev_priv->cce_running)
745		r128_do_cce_flush(dev_priv);
746
747	return r128_do_cce_idle(dev_priv);
748}
749
750int r128_engine_reset(struct drm_device *dev, void *data, struct drm_file *file_priv)
751{
752	DRM_DEBUG("\n");
753
754	LOCK_TEST_WITH_RETURN(dev, file_priv);
755
756	DEV_INIT_TEST_WITH_RETURN(dev->dev_private);
757
758	return r128_do_engine_reset(dev);
759}
760
761int r128_fullscreen(struct drm_device *dev, void *data, struct drm_file *file_priv)
762{
763	return -EINVAL;
764}
765
766/* ================================================================
767 * Freelist management
768 */
769#define R128_BUFFER_USED	0xffffffff
770#define R128_BUFFER_FREE	0
771
772#if 0
773static int r128_freelist_init(struct drm_device *dev)
774{
775	struct drm_device_dma *dma = dev->dma;
776	drm_r128_private_t *dev_priv = dev->dev_private;
777	struct drm_buf *buf;
778	drm_r128_buf_priv_t *buf_priv;
779	drm_r128_freelist_t *entry;
780	int i;
781
782	dev_priv->head = kzalloc(sizeof(drm_r128_freelist_t), GFP_KERNEL);
783	if (dev_priv->head == NULL)
784		return -ENOMEM;
785
786	dev_priv->head->age = R128_BUFFER_USED;
787
788	for (i = 0; i < dma->buf_count; i++) {
789		buf = dma->buflist[i];
790		buf_priv = buf->dev_private;
791
792		entry = kmalloc(sizeof(drm_r128_freelist_t), GFP_KERNEL);
793		if (!entry)
794			return -ENOMEM;
795
796		entry->age = R128_BUFFER_FREE;
797		entry->buf = buf;
798		entry->prev = dev_priv->head;
799		entry->next = dev_priv->head->next;
800		if (!entry->next)
801			dev_priv->tail = entry;
802
803		buf_priv->discard = 0;
804		buf_priv->dispatched = 0;
805		buf_priv->list_entry = entry;
806
807		dev_priv->head->next = entry;
808
809		if (dev_priv->head->next)
810			dev_priv->head->next->prev = entry;
811	}
812
813	return 0;
814
815}
816#endif
817
818static struct drm_buf *r128_freelist_get(struct drm_device * dev)
819{
820	struct drm_device_dma *dma = dev->dma;
821	drm_r128_private_t *dev_priv = dev->dev_private;
822	drm_r128_buf_priv_t *buf_priv;
823	struct drm_buf *buf;
824	int i, t;
825
826	/* FIXME: Optimize -- use freelist code */
827
828	for (i = 0; i < dma->buf_count; i++) {
829		buf = dma->buflist[i];
830		buf_priv = buf->dev_private;
831		if (!buf->file_priv)
832			return buf;
833	}
834
835	for (t = 0; t < dev_priv->usec_timeout; t++) {
836		u32 done_age = R128_READ(R128_LAST_DISPATCH_REG);
837
838		for (i = 0; i < dma->buf_count; i++) {
839			buf = dma->buflist[i];
840			buf_priv = buf->dev_private;
841			if (buf->pending && buf_priv->age <= done_age) {
842				/* The buffer has been processed, so it
843				 * can now be used.
844				 */
845				buf->pending = 0;
846				return buf;
847			}
848		}
849		udelay(1);
850	}
851
852	DRM_DEBUG("returning NULL!\n");
853	return NULL;
854}
855
856void r128_freelist_reset(struct drm_device *dev)
857{
858	struct drm_device_dma *dma = dev->dma;
859	int i;
860
861	for (i = 0; i < dma->buf_count; i++) {
862		struct drm_buf *buf = dma->buflist[i];
863		drm_r128_buf_priv_t *buf_priv = buf->dev_private;
864		buf_priv->age = 0;
865	}
866}
867
868/* ================================================================
869 * CCE command submission
870 */
871
872int r128_wait_ring(drm_r128_private_t *dev_priv, int n)
873{
874	drm_r128_ring_buffer_t *ring = &dev_priv->ring;
875	int i;
876
877	for (i = 0; i < dev_priv->usec_timeout; i++) {
878		r128_update_ring_snapshot(dev_priv);
879		if (ring->space >= n)
880			return 0;
881		udelay(1);
882	}
883
884	/* FIXME: This is being ignored... */
885	DRM_ERROR("failed!\n");
886	return -EBUSY;
887}
888
889static int r128_cce_get_buffers(struct drm_device *dev,
890				struct drm_file *file_priv,
891				struct drm_dma *d)
892{
893	int i;
894	struct drm_buf *buf;
895
896	for (i = d->granted_count; i < d->request_count; i++) {
897		buf = r128_freelist_get(dev);
898		if (!buf)
899			return -EAGAIN;
900
901		buf->file_priv = file_priv;
902
903		if (copy_to_user(&d->request_indices[i], &buf->idx,
904				     sizeof(buf->idx)))
905			return -EFAULT;
906		if (copy_to_user(&d->request_sizes[i], &buf->total,
907				     sizeof(buf->total)))
908			return -EFAULT;
909
910		d->granted_count++;
911	}
912	return 0;
913}
914
915int r128_cce_buffers(struct drm_device *dev, void *data, struct drm_file *file_priv)
916{
917	struct drm_device_dma *dma = dev->dma;
918	int ret = 0;
919	struct drm_dma *d = data;
920
921	LOCK_TEST_WITH_RETURN(dev, file_priv);
922
923	/* Please don't send us buffers.
924	 */
925	if (d->send_count != 0) {
926		DRM_ERROR("Process %d trying to send %d buffers via drmDMA\n",
927			  task_pid_nr(current), d->send_count);
928		return -EINVAL;
929	}
930
931	/* We'll send you buffers.
932	 */
933	if (d->request_count < 0 || d->request_count > dma->buf_count) {
934		DRM_ERROR("Process %d trying to get %d buffers (of %d max)\n",
935			  task_pid_nr(current), d->request_count, dma->buf_count);
936		return -EINVAL;
937	}
938
939	d->granted_count = 0;
940
941	if (d->request_count)
942		ret = r128_cce_get_buffers(dev, file_priv, d);
943
944	return ret;
945}
v4.17
  1/* r128_cce.c -- ATI Rage 128 driver -*- linux-c -*-
  2 * Created: Wed Apr  5 19:24:19 2000 by kevin@precisioninsight.com
  3 */
  4/*
  5 * Copyright 2000 Precision Insight, Inc., Cedar Park, Texas.
  6 * Copyright 2000 VA Linux Systems, Inc., Sunnyvale, California.
  7 * All Rights Reserved.
  8 *
  9 * Permission is hereby granted, free of charge, to any person obtaining a
 10 * copy of this software and associated documentation files (the "Software"),
 11 * to deal in the Software without restriction, including without limitation
 12 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 13 * and/or sell copies of the Software, and to permit persons to whom the
 14 * Software is furnished to do so, subject to the following conditions:
 15 *
 16 * The above copyright notice and this permission notice (including the next
 17 * paragraph) shall be included in all copies or substantial portions of the
 18 * Software.
 19 *
 20 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 21 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 22 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 23 * PRECISION INSIGHT AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
 24 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 25 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
 26 * DEALINGS IN THE SOFTWARE.
 27 *
 28 * Authors:
 29 *    Gareth Hughes <gareth@valinux.com>
 30 */
 31
 
 
 32#include <linux/firmware.h>
 
 33#include <linux/platform_device.h>
 34#include <linux/slab.h>
 35#include <linux/module.h>
 36
 37#include <drm/drmP.h>
 
 
 
 
 38#include <drm/r128_drm.h>
 
 39#include "r128_drv.h"
 40
 41#define R128_FIFO_DEBUG		0
 42
 43#define FIRMWARE_NAME		"r128/r128_cce.bin"
 44
 45MODULE_FIRMWARE(FIRMWARE_NAME);
 46
 47static int R128_READ_PLL(struct drm_device *dev, int addr)
 48{
 49	drm_r128_private_t *dev_priv = dev->dev_private;
 50
 51	R128_WRITE8(R128_CLOCK_CNTL_INDEX, addr & 0x1f);
 52	return R128_READ(R128_CLOCK_CNTL_DATA);
 53}
 54
 55#if R128_FIFO_DEBUG
 56static void r128_status(drm_r128_private_t *dev_priv)
 57{
 58	printk("GUI_STAT           = 0x%08x\n",
 59	       (unsigned int)R128_READ(R128_GUI_STAT));
 60	printk("PM4_STAT           = 0x%08x\n",
 61	       (unsigned int)R128_READ(R128_PM4_STAT));
 62	printk("PM4_BUFFER_DL_WPTR = 0x%08x\n",
 63	       (unsigned int)R128_READ(R128_PM4_BUFFER_DL_WPTR));
 64	printk("PM4_BUFFER_DL_RPTR = 0x%08x\n",
 65	       (unsigned int)R128_READ(R128_PM4_BUFFER_DL_RPTR));
 66	printk("PM4_MICRO_CNTL     = 0x%08x\n",
 67	       (unsigned int)R128_READ(R128_PM4_MICRO_CNTL));
 68	printk("PM4_BUFFER_CNTL    = 0x%08x\n",
 69	       (unsigned int)R128_READ(R128_PM4_BUFFER_CNTL));
 70}
 71#endif
 72
 73/* ================================================================
 74 * Engine, FIFO control
 75 */
 76
 77static int r128_do_pixcache_flush(drm_r128_private_t *dev_priv)
 78{
 79	u32 tmp;
 80	int i;
 81
 82	tmp = R128_READ(R128_PC_NGUI_CTLSTAT) | R128_PC_FLUSH_ALL;
 83	R128_WRITE(R128_PC_NGUI_CTLSTAT, tmp);
 84
 85	for (i = 0; i < dev_priv->usec_timeout; i++) {
 86		if (!(R128_READ(R128_PC_NGUI_CTLSTAT) & R128_PC_BUSY))
 87			return 0;
 88		DRM_UDELAY(1);
 89	}
 90
 91#if R128_FIFO_DEBUG
 92	DRM_ERROR("failed!\n");
 93#endif
 94	return -EBUSY;
 95}
 96
 97static int r128_do_wait_for_fifo(drm_r128_private_t *dev_priv, int entries)
 98{
 99	int i;
100
101	for (i = 0; i < dev_priv->usec_timeout; i++) {
102		int slots = R128_READ(R128_GUI_STAT) & R128_GUI_FIFOCNT_MASK;
103		if (slots >= entries)
104			return 0;
105		DRM_UDELAY(1);
106	}
107
108#if R128_FIFO_DEBUG
109	DRM_ERROR("failed!\n");
110#endif
111	return -EBUSY;
112}
113
114static int r128_do_wait_for_idle(drm_r128_private_t *dev_priv)
115{
116	int i, ret;
117
118	ret = r128_do_wait_for_fifo(dev_priv, 64);
119	if (ret)
120		return ret;
121
122	for (i = 0; i < dev_priv->usec_timeout; i++) {
123		if (!(R128_READ(R128_GUI_STAT) & R128_GUI_ACTIVE)) {
124			r128_do_pixcache_flush(dev_priv);
125			return 0;
126		}
127		DRM_UDELAY(1);
128	}
129
130#if R128_FIFO_DEBUG
131	DRM_ERROR("failed!\n");
132#endif
133	return -EBUSY;
134}
135
136/* ================================================================
137 * CCE control, initialization
138 */
139
140/* Load the microcode for the CCE */
141static int r128_cce_load_microcode(drm_r128_private_t *dev_priv)
142{
143	struct platform_device *pdev;
144	const struct firmware *fw;
145	const __be32 *fw_data;
146	int rc, i;
147
148	DRM_DEBUG("\n");
149
150	pdev = platform_device_register_simple("r128_cce", 0, NULL, 0);
151	if (IS_ERR(pdev)) {
152		pr_err("r128_cce: Failed to register firmware\n");
153		return PTR_ERR(pdev);
154	}
155	rc = request_firmware(&fw, FIRMWARE_NAME, &pdev->dev);
156	platform_device_unregister(pdev);
157	if (rc) {
158		pr_err("r128_cce: Failed to load firmware \"%s\"\n",
159		       FIRMWARE_NAME);
160		return rc;
161	}
162
163	if (fw->size != 256 * 8) {
164		pr_err("r128_cce: Bogus length %zu in firmware \"%s\"\n",
165		       fw->size, FIRMWARE_NAME);
166		rc = -EINVAL;
167		goto out_release;
168	}
169
170	r128_do_wait_for_idle(dev_priv);
171
172	fw_data = (const __be32 *)fw->data;
173	R128_WRITE(R128_PM4_MICROCODE_ADDR, 0);
174	for (i = 0; i < 256; i++) {
175		R128_WRITE(R128_PM4_MICROCODE_DATAH,
176			   be32_to_cpup(&fw_data[i * 2]));
177		R128_WRITE(R128_PM4_MICROCODE_DATAL,
178			   be32_to_cpup(&fw_data[i * 2 + 1]));
179	}
180
181out_release:
182	release_firmware(fw);
183	return rc;
184}
185
186/* Flush any pending commands to the CCE.  This should only be used just
187 * prior to a wait for idle, as it informs the engine that the command
188 * stream is ending.
189 */
190static void r128_do_cce_flush(drm_r128_private_t *dev_priv)
191{
192	u32 tmp;
193
194	tmp = R128_READ(R128_PM4_BUFFER_DL_WPTR) | R128_PM4_BUFFER_DL_DONE;
195	R128_WRITE(R128_PM4_BUFFER_DL_WPTR, tmp);
196}
197
198/* Wait for the CCE to go idle.
199 */
200int r128_do_cce_idle(drm_r128_private_t *dev_priv)
201{
202	int i;
203
204	for (i = 0; i < dev_priv->usec_timeout; i++) {
205		if (GET_RING_HEAD(dev_priv) == dev_priv->ring.tail) {
206			int pm4stat = R128_READ(R128_PM4_STAT);
207			if (((pm4stat & R128_PM4_FIFOCNT_MASK) >=
208			     dev_priv->cce_fifo_size) &&
209			    !(pm4stat & (R128_PM4_BUSY |
210					 R128_PM4_GUI_ACTIVE))) {
211				return r128_do_pixcache_flush(dev_priv);
212			}
213		}
214		DRM_UDELAY(1);
215	}
216
217#if R128_FIFO_DEBUG
218	DRM_ERROR("failed!\n");
219	r128_status(dev_priv);
220#endif
221	return -EBUSY;
222}
223
224/* Start the Concurrent Command Engine.
225 */
226static void r128_do_cce_start(drm_r128_private_t *dev_priv)
227{
228	r128_do_wait_for_idle(dev_priv);
229
230	R128_WRITE(R128_PM4_BUFFER_CNTL,
231		   dev_priv->cce_mode | dev_priv->ring.size_l2qw
232		   | R128_PM4_BUFFER_CNTL_NOUPDATE);
233	R128_READ(R128_PM4_BUFFER_ADDR);	/* as per the sample code */
234	R128_WRITE(R128_PM4_MICRO_CNTL, R128_PM4_MICRO_FREERUN);
235
236	dev_priv->cce_running = 1;
237}
238
239/* Reset the Concurrent Command Engine.  This will not flush any pending
240 * commands, so you must wait for the CCE command stream to complete
241 * before calling this routine.
242 */
243static void r128_do_cce_reset(drm_r128_private_t *dev_priv)
244{
245	R128_WRITE(R128_PM4_BUFFER_DL_WPTR, 0);
246	R128_WRITE(R128_PM4_BUFFER_DL_RPTR, 0);
247	dev_priv->ring.tail = 0;
248}
249
250/* Stop the Concurrent Command Engine.  This will not flush any pending
251 * commands, so you must flush the command stream and wait for the CCE
252 * to go idle before calling this routine.
253 */
254static void r128_do_cce_stop(drm_r128_private_t *dev_priv)
255{
256	R128_WRITE(R128_PM4_MICRO_CNTL, 0);
257	R128_WRITE(R128_PM4_BUFFER_CNTL,
258		   R128_PM4_NONPM4 | R128_PM4_BUFFER_CNTL_NOUPDATE);
259
260	dev_priv->cce_running = 0;
261}
262
263/* Reset the engine.  This will stop the CCE if it is running.
264 */
265static int r128_do_engine_reset(struct drm_device *dev)
266{
267	drm_r128_private_t *dev_priv = dev->dev_private;
268	u32 clock_cntl_index, mclk_cntl, gen_reset_cntl;
269
270	r128_do_pixcache_flush(dev_priv);
271
272	clock_cntl_index = R128_READ(R128_CLOCK_CNTL_INDEX);
273	mclk_cntl = R128_READ_PLL(dev, R128_MCLK_CNTL);
274
275	R128_WRITE_PLL(R128_MCLK_CNTL,
276		       mclk_cntl | R128_FORCE_GCP | R128_FORCE_PIPE3D_CP);
277
278	gen_reset_cntl = R128_READ(R128_GEN_RESET_CNTL);
279
280	/* Taken from the sample code - do not change */
281	R128_WRITE(R128_GEN_RESET_CNTL, gen_reset_cntl | R128_SOFT_RESET_GUI);
282	R128_READ(R128_GEN_RESET_CNTL);
283	R128_WRITE(R128_GEN_RESET_CNTL, gen_reset_cntl & ~R128_SOFT_RESET_GUI);
284	R128_READ(R128_GEN_RESET_CNTL);
285
286	R128_WRITE_PLL(R128_MCLK_CNTL, mclk_cntl);
287	R128_WRITE(R128_CLOCK_CNTL_INDEX, clock_cntl_index);
288	R128_WRITE(R128_GEN_RESET_CNTL, gen_reset_cntl);
289
290	/* Reset the CCE ring */
291	r128_do_cce_reset(dev_priv);
292
293	/* The CCE is no longer running after an engine reset */
294	dev_priv->cce_running = 0;
295
296	/* Reset any pending vertex, indirect buffers */
297	r128_freelist_reset(dev);
298
299	return 0;
300}
301
302static void r128_cce_init_ring_buffer(struct drm_device *dev,
303				      drm_r128_private_t *dev_priv)
304{
305	u32 ring_start;
306	u32 tmp;
307
308	DRM_DEBUG("\n");
309
310	/* The manual (p. 2) says this address is in "VM space".  This
311	 * means it's an offset from the start of AGP space.
312	 */
313#if IS_ENABLED(CONFIG_AGP)
314	if (!dev_priv->is_pci)
315		ring_start = dev_priv->cce_ring->offset - dev->agp->base;
316	else
317#endif
318		ring_start = dev_priv->cce_ring->offset -
319		    (unsigned long)dev->sg->virtual;
320
321	R128_WRITE(R128_PM4_BUFFER_OFFSET, ring_start | R128_AGP_OFFSET);
322
323	R128_WRITE(R128_PM4_BUFFER_DL_WPTR, 0);
324	R128_WRITE(R128_PM4_BUFFER_DL_RPTR, 0);
325
326	/* Set watermark control */
327	R128_WRITE(R128_PM4_BUFFER_WM_CNTL,
328		   ((R128_WATERMARK_L / 4) << R128_WMA_SHIFT)
329		   | ((R128_WATERMARK_M / 4) << R128_WMB_SHIFT)
330		   | ((R128_WATERMARK_N / 4) << R128_WMC_SHIFT)
331		   | ((R128_WATERMARK_K / 64) << R128_WB_WM_SHIFT));
332
333	/* Force read.  Why?  Because it's in the examples... */
334	R128_READ(R128_PM4_BUFFER_ADDR);
335
336	/* Turn on bus mastering */
337	tmp = R128_READ(R128_BUS_CNTL) & ~R128_BUS_MASTER_DIS;
338	R128_WRITE(R128_BUS_CNTL, tmp);
339}
340
341static int r128_do_init_cce(struct drm_device *dev, drm_r128_init_t *init)
342{
343	drm_r128_private_t *dev_priv;
344	int rc;
345
346	DRM_DEBUG("\n");
347
348	if (dev->dev_private) {
349		DRM_DEBUG("called when already initialized\n");
350		return -EINVAL;
351	}
352
353	dev_priv = kzalloc(sizeof(drm_r128_private_t), GFP_KERNEL);
354	if (dev_priv == NULL)
355		return -ENOMEM;
356
357	dev_priv->is_pci = init->is_pci;
358
359	if (dev_priv->is_pci && !dev->sg) {
360		DRM_ERROR("PCI GART memory not allocated!\n");
361		dev->dev_private = (void *)dev_priv;
362		r128_do_cleanup_cce(dev);
363		return -EINVAL;
364	}
365
366	dev_priv->usec_timeout = init->usec_timeout;
367	if (dev_priv->usec_timeout < 1 ||
368	    dev_priv->usec_timeout > R128_MAX_USEC_TIMEOUT) {
369		DRM_DEBUG("TIMEOUT problem!\n");
370		dev->dev_private = (void *)dev_priv;
371		r128_do_cleanup_cce(dev);
372		return -EINVAL;
373	}
374
375	dev_priv->cce_mode = init->cce_mode;
376
377	/* GH: Simple idle check.
378	 */
379	atomic_set(&dev_priv->idle_count, 0);
380
381	/* We don't support anything other than bus-mastering ring mode,
382	 * but the ring can be in either AGP or PCI space for the ring
383	 * read pointer.
384	 */
385	if ((init->cce_mode != R128_PM4_192BM) &&
386	    (init->cce_mode != R128_PM4_128BM_64INDBM) &&
387	    (init->cce_mode != R128_PM4_64BM_128INDBM) &&
388	    (init->cce_mode != R128_PM4_64BM_64VCBM_64INDBM)) {
389		DRM_DEBUG("Bad cce_mode!\n");
390		dev->dev_private = (void *)dev_priv;
391		r128_do_cleanup_cce(dev);
392		return -EINVAL;
393	}
394
395	switch (init->cce_mode) {
396	case R128_PM4_NONPM4:
397		dev_priv->cce_fifo_size = 0;
398		break;
399	case R128_PM4_192PIO:
400	case R128_PM4_192BM:
401		dev_priv->cce_fifo_size = 192;
402		break;
403	case R128_PM4_128PIO_64INDBM:
404	case R128_PM4_128BM_64INDBM:
405		dev_priv->cce_fifo_size = 128;
406		break;
407	case R128_PM4_64PIO_128INDBM:
408	case R128_PM4_64BM_128INDBM:
409	case R128_PM4_64PIO_64VCBM_64INDBM:
410	case R128_PM4_64BM_64VCBM_64INDBM:
411	case R128_PM4_64PIO_64VCPIO_64INDPIO:
412		dev_priv->cce_fifo_size = 64;
413		break;
414	}
415
416	switch (init->fb_bpp) {
417	case 16:
418		dev_priv->color_fmt = R128_DATATYPE_RGB565;
419		break;
420	case 32:
421	default:
422		dev_priv->color_fmt = R128_DATATYPE_ARGB8888;
423		break;
424	}
425	dev_priv->front_offset = init->front_offset;
426	dev_priv->front_pitch = init->front_pitch;
427	dev_priv->back_offset = init->back_offset;
428	dev_priv->back_pitch = init->back_pitch;
429
430	switch (init->depth_bpp) {
431	case 16:
432		dev_priv->depth_fmt = R128_DATATYPE_RGB565;
433		break;
434	case 24:
435	case 32:
436	default:
437		dev_priv->depth_fmt = R128_DATATYPE_ARGB8888;
438		break;
439	}
440	dev_priv->depth_offset = init->depth_offset;
441	dev_priv->depth_pitch = init->depth_pitch;
442	dev_priv->span_offset = init->span_offset;
443
444	dev_priv->front_pitch_offset_c = (((dev_priv->front_pitch / 8) << 21) |
445					  (dev_priv->front_offset >> 5));
446	dev_priv->back_pitch_offset_c = (((dev_priv->back_pitch / 8) << 21) |
447					 (dev_priv->back_offset >> 5));
448	dev_priv->depth_pitch_offset_c = (((dev_priv->depth_pitch / 8) << 21) |
449					  (dev_priv->depth_offset >> 5) |
450					  R128_DST_TILE);
451	dev_priv->span_pitch_offset_c = (((dev_priv->depth_pitch / 8) << 21) |
452					 (dev_priv->span_offset >> 5));
453
454	dev_priv->sarea = drm_legacy_getsarea(dev);
455	if (!dev_priv->sarea) {
456		DRM_ERROR("could not find sarea!\n");
457		dev->dev_private = (void *)dev_priv;
458		r128_do_cleanup_cce(dev);
459		return -EINVAL;
460	}
461
462	dev_priv->mmio = drm_legacy_findmap(dev, init->mmio_offset);
463	if (!dev_priv->mmio) {
464		DRM_ERROR("could not find mmio region!\n");
465		dev->dev_private = (void *)dev_priv;
466		r128_do_cleanup_cce(dev);
467		return -EINVAL;
468	}
469	dev_priv->cce_ring = drm_legacy_findmap(dev, init->ring_offset);
470	if (!dev_priv->cce_ring) {
471		DRM_ERROR("could not find cce ring region!\n");
472		dev->dev_private = (void *)dev_priv;
473		r128_do_cleanup_cce(dev);
474		return -EINVAL;
475	}
476	dev_priv->ring_rptr = drm_legacy_findmap(dev, init->ring_rptr_offset);
477	if (!dev_priv->ring_rptr) {
478		DRM_ERROR("could not find ring read pointer!\n");
479		dev->dev_private = (void *)dev_priv;
480		r128_do_cleanup_cce(dev);
481		return -EINVAL;
482	}
483	dev->agp_buffer_token = init->buffers_offset;
484	dev->agp_buffer_map = drm_legacy_findmap(dev, init->buffers_offset);
485	if (!dev->agp_buffer_map) {
486		DRM_ERROR("could not find dma buffer region!\n");
487		dev->dev_private = (void *)dev_priv;
488		r128_do_cleanup_cce(dev);
489		return -EINVAL;
490	}
491
492	if (!dev_priv->is_pci) {
493		dev_priv->agp_textures =
494		    drm_legacy_findmap(dev, init->agp_textures_offset);
495		if (!dev_priv->agp_textures) {
496			DRM_ERROR("could not find agp texture region!\n");
497			dev->dev_private = (void *)dev_priv;
498			r128_do_cleanup_cce(dev);
499			return -EINVAL;
500		}
501	}
502
503	dev_priv->sarea_priv =
504	    (drm_r128_sarea_t *) ((u8 *) dev_priv->sarea->handle +
505				  init->sarea_priv_offset);
506
507#if IS_ENABLED(CONFIG_AGP)
508	if (!dev_priv->is_pci) {
509		drm_legacy_ioremap_wc(dev_priv->cce_ring, dev);
510		drm_legacy_ioremap_wc(dev_priv->ring_rptr, dev);
511		drm_legacy_ioremap_wc(dev->agp_buffer_map, dev);
512		if (!dev_priv->cce_ring->handle ||
513		    !dev_priv->ring_rptr->handle ||
514		    !dev->agp_buffer_map->handle) {
515			DRM_ERROR("Could not ioremap agp regions!\n");
516			dev->dev_private = (void *)dev_priv;
517			r128_do_cleanup_cce(dev);
518			return -ENOMEM;
519		}
520	} else
521#endif
522	{
523		dev_priv->cce_ring->handle =
524			(void *)(unsigned long)dev_priv->cce_ring->offset;
525		dev_priv->ring_rptr->handle =
526			(void *)(unsigned long)dev_priv->ring_rptr->offset;
527		dev->agp_buffer_map->handle =
528			(void *)(unsigned long)dev->agp_buffer_map->offset;
529	}
530
531#if IS_ENABLED(CONFIG_AGP)
532	if (!dev_priv->is_pci)
533		dev_priv->cce_buffers_offset = dev->agp->base;
534	else
535#endif
536		dev_priv->cce_buffers_offset = (unsigned long)dev->sg->virtual;
537
538	dev_priv->ring.start = (u32 *) dev_priv->cce_ring->handle;
539	dev_priv->ring.end = ((u32 *) dev_priv->cce_ring->handle
540			      + init->ring_size / sizeof(u32));
541	dev_priv->ring.size = init->ring_size;
542	dev_priv->ring.size_l2qw = order_base_2(init->ring_size / 8);
543
544	dev_priv->ring.tail_mask = (dev_priv->ring.size / sizeof(u32)) - 1;
545
546	dev_priv->ring.high_mark = 128;
547
548	dev_priv->sarea_priv->last_frame = 0;
549	R128_WRITE(R128_LAST_FRAME_REG, dev_priv->sarea_priv->last_frame);
550
551	dev_priv->sarea_priv->last_dispatch = 0;
552	R128_WRITE(R128_LAST_DISPATCH_REG, dev_priv->sarea_priv->last_dispatch);
553
554#if IS_ENABLED(CONFIG_AGP)
555	if (dev_priv->is_pci) {
556#endif
557		dev_priv->gart_info.table_mask = DMA_BIT_MASK(32);
558		dev_priv->gart_info.gart_table_location = DRM_ATI_GART_MAIN;
559		dev_priv->gart_info.table_size = R128_PCIGART_TABLE_SIZE;
560		dev_priv->gart_info.addr = NULL;
561		dev_priv->gart_info.bus_addr = 0;
562		dev_priv->gart_info.gart_reg_if = DRM_ATI_GART_PCI;
563		if (!drm_ati_pcigart_init(dev, &dev_priv->gart_info)) {
 
564			DRM_ERROR("failed to init PCI GART!\n");
565			dev->dev_private = (void *)dev_priv;
566			r128_do_cleanup_cce(dev);
567			return -ENOMEM;
568		}
569		R128_WRITE(R128_PCI_GART_PAGE, dev_priv->gart_info.bus_addr);
570#if IS_ENABLED(CONFIG_AGP)
571	}
572#endif
573
574	r128_cce_init_ring_buffer(dev, dev_priv);
575	rc = r128_cce_load_microcode(dev_priv);
576
577	dev->dev_private = (void *)dev_priv;
578
579	r128_do_engine_reset(dev);
580
581	if (rc) {
582		DRM_ERROR("Failed to load firmware!\n");
583		r128_do_cleanup_cce(dev);
584	}
585
586	return rc;
587}
588
589int r128_do_cleanup_cce(struct drm_device *dev)
590{
591
592	/* Make sure interrupts are disabled here because the uninstall ioctl
593	 * may not have been called from userspace and after dev_private
594	 * is freed, it's too late.
595	 */
596	if (dev->irq_enabled)
597		drm_irq_uninstall(dev);
598
599	if (dev->dev_private) {
600		drm_r128_private_t *dev_priv = dev->dev_private;
601
602#if IS_ENABLED(CONFIG_AGP)
603		if (!dev_priv->is_pci) {
604			if (dev_priv->cce_ring != NULL)
605				drm_legacy_ioremapfree(dev_priv->cce_ring, dev);
606			if (dev_priv->ring_rptr != NULL)
607				drm_legacy_ioremapfree(dev_priv->ring_rptr, dev);
608			if (dev->agp_buffer_map != NULL) {
609				drm_legacy_ioremapfree(dev->agp_buffer_map, dev);
610				dev->agp_buffer_map = NULL;
611			}
612		} else
613#endif
614		{
615			if (dev_priv->gart_info.bus_addr)
616				if (!drm_ati_pcigart_cleanup(dev,
617							&dev_priv->gart_info))
618					DRM_ERROR
619					    ("failed to cleanup PCI GART!\n");
620		}
621
622		kfree(dev->dev_private);
623		dev->dev_private = NULL;
624	}
625
626	return 0;
627}
628
629int r128_cce_init(struct drm_device *dev, void *data, struct drm_file *file_priv)
630{
631	drm_r128_init_t *init = data;
632
633	DRM_DEBUG("\n");
634
635	LOCK_TEST_WITH_RETURN(dev, file_priv);
636
637	switch (init->func) {
638	case R128_INIT_CCE:
639		return r128_do_init_cce(dev, init);
640	case R128_CLEANUP_CCE:
641		return r128_do_cleanup_cce(dev);
642	}
643
644	return -EINVAL;
645}
646
647int r128_cce_start(struct drm_device *dev, void *data, struct drm_file *file_priv)
648{
649	drm_r128_private_t *dev_priv = dev->dev_private;
650	DRM_DEBUG("\n");
651
652	LOCK_TEST_WITH_RETURN(dev, file_priv);
653
654	DEV_INIT_TEST_WITH_RETURN(dev_priv);
655
656	if (dev_priv->cce_running || dev_priv->cce_mode == R128_PM4_NONPM4) {
657		DRM_DEBUG("while CCE running\n");
658		return 0;
659	}
660
661	r128_do_cce_start(dev_priv);
662
663	return 0;
664}
665
666/* Stop the CCE.  The engine must have been idled before calling this
667 * routine.
668 */
669int r128_cce_stop(struct drm_device *dev, void *data, struct drm_file *file_priv)
670{
671	drm_r128_private_t *dev_priv = dev->dev_private;
672	drm_r128_cce_stop_t *stop = data;
673	int ret;
674	DRM_DEBUG("\n");
675
676	LOCK_TEST_WITH_RETURN(dev, file_priv);
677
678	DEV_INIT_TEST_WITH_RETURN(dev_priv);
679
680	/* Flush any pending CCE commands.  This ensures any outstanding
681	 * commands are exectuted by the engine before we turn it off.
682	 */
683	if (stop->flush)
684		r128_do_cce_flush(dev_priv);
685
686	/* If we fail to make the engine go idle, we return an error
687	 * code so that the DRM ioctl wrapper can try again.
688	 */
689	if (stop->idle) {
690		ret = r128_do_cce_idle(dev_priv);
691		if (ret)
692			return ret;
693	}
694
695	/* Finally, we can turn off the CCE.  If the engine isn't idle,
696	 * we will get some dropped triangles as they won't be fully
697	 * rendered before the CCE is shut down.
698	 */
699	r128_do_cce_stop(dev_priv);
700
701	/* Reset the engine */
702	r128_do_engine_reset(dev);
703
704	return 0;
705}
706
707/* Just reset the CCE ring.  Called as part of an X Server engine reset.
708 */
709int r128_cce_reset(struct drm_device *dev, void *data, struct drm_file *file_priv)
710{
711	drm_r128_private_t *dev_priv = dev->dev_private;
712	DRM_DEBUG("\n");
713
714	LOCK_TEST_WITH_RETURN(dev, file_priv);
715
716	DEV_INIT_TEST_WITH_RETURN(dev_priv);
717
718	r128_do_cce_reset(dev_priv);
719
720	/* The CCE is no longer running after an engine reset */
721	dev_priv->cce_running = 0;
722
723	return 0;
724}
725
726int r128_cce_idle(struct drm_device *dev, void *data, struct drm_file *file_priv)
727{
728	drm_r128_private_t *dev_priv = dev->dev_private;
729	DRM_DEBUG("\n");
730
731	LOCK_TEST_WITH_RETURN(dev, file_priv);
732
733	DEV_INIT_TEST_WITH_RETURN(dev_priv);
734
735	if (dev_priv->cce_running)
736		r128_do_cce_flush(dev_priv);
737
738	return r128_do_cce_idle(dev_priv);
739}
740
741int r128_engine_reset(struct drm_device *dev, void *data, struct drm_file *file_priv)
742{
743	DRM_DEBUG("\n");
744
745	LOCK_TEST_WITH_RETURN(dev, file_priv);
746
747	DEV_INIT_TEST_WITH_RETURN(dev->dev_private);
748
749	return r128_do_engine_reset(dev);
750}
751
752int r128_fullscreen(struct drm_device *dev, void *data, struct drm_file *file_priv)
753{
754	return -EINVAL;
755}
756
757/* ================================================================
758 * Freelist management
759 */
760#define R128_BUFFER_USED	0xffffffff
761#define R128_BUFFER_FREE	0
762
763#if 0
764static int r128_freelist_init(struct drm_device *dev)
765{
766	struct drm_device_dma *dma = dev->dma;
767	drm_r128_private_t *dev_priv = dev->dev_private;
768	struct drm_buf *buf;
769	drm_r128_buf_priv_t *buf_priv;
770	drm_r128_freelist_t *entry;
771	int i;
772
773	dev_priv->head = kzalloc(sizeof(drm_r128_freelist_t), GFP_KERNEL);
774	if (dev_priv->head == NULL)
775		return -ENOMEM;
776
777	dev_priv->head->age = R128_BUFFER_USED;
778
779	for (i = 0; i < dma->buf_count; i++) {
780		buf = dma->buflist[i];
781		buf_priv = buf->dev_private;
782
783		entry = kmalloc(sizeof(drm_r128_freelist_t), GFP_KERNEL);
784		if (!entry)
785			return -ENOMEM;
786
787		entry->age = R128_BUFFER_FREE;
788		entry->buf = buf;
789		entry->prev = dev_priv->head;
790		entry->next = dev_priv->head->next;
791		if (!entry->next)
792			dev_priv->tail = entry;
793
794		buf_priv->discard = 0;
795		buf_priv->dispatched = 0;
796		buf_priv->list_entry = entry;
797
798		dev_priv->head->next = entry;
799
800		if (dev_priv->head->next)
801			dev_priv->head->next->prev = entry;
802	}
803
804	return 0;
805
806}
807#endif
808
809static struct drm_buf *r128_freelist_get(struct drm_device * dev)
810{
811	struct drm_device_dma *dma = dev->dma;
812	drm_r128_private_t *dev_priv = dev->dev_private;
813	drm_r128_buf_priv_t *buf_priv;
814	struct drm_buf *buf;
815	int i, t;
816
817	/* FIXME: Optimize -- use freelist code */
818
819	for (i = 0; i < dma->buf_count; i++) {
820		buf = dma->buflist[i];
821		buf_priv = buf->dev_private;
822		if (!buf->file_priv)
823			return buf;
824	}
825
826	for (t = 0; t < dev_priv->usec_timeout; t++) {
827		u32 done_age = R128_READ(R128_LAST_DISPATCH_REG);
828
829		for (i = 0; i < dma->buf_count; i++) {
830			buf = dma->buflist[i];
831			buf_priv = buf->dev_private;
832			if (buf->pending && buf_priv->age <= done_age) {
833				/* The buffer has been processed, so it
834				 * can now be used.
835				 */
836				buf->pending = 0;
837				return buf;
838			}
839		}
840		DRM_UDELAY(1);
841	}
842
843	DRM_DEBUG("returning NULL!\n");
844	return NULL;
845}
846
847void r128_freelist_reset(struct drm_device *dev)
848{
849	struct drm_device_dma *dma = dev->dma;
850	int i;
851
852	for (i = 0; i < dma->buf_count; i++) {
853		struct drm_buf *buf = dma->buflist[i];
854		drm_r128_buf_priv_t *buf_priv = buf->dev_private;
855		buf_priv->age = 0;
856	}
857}
858
859/* ================================================================
860 * CCE command submission
861 */
862
863int r128_wait_ring(drm_r128_private_t *dev_priv, int n)
864{
865	drm_r128_ring_buffer_t *ring = &dev_priv->ring;
866	int i;
867
868	for (i = 0; i < dev_priv->usec_timeout; i++) {
869		r128_update_ring_snapshot(dev_priv);
870		if (ring->space >= n)
871			return 0;
872		DRM_UDELAY(1);
873	}
874
875	/* FIXME: This is being ignored... */
876	DRM_ERROR("failed!\n");
877	return -EBUSY;
878}
879
880static int r128_cce_get_buffers(struct drm_device *dev,
881				struct drm_file *file_priv,
882				struct drm_dma *d)
883{
884	int i;
885	struct drm_buf *buf;
886
887	for (i = d->granted_count; i < d->request_count; i++) {
888		buf = r128_freelist_get(dev);
889		if (!buf)
890			return -EAGAIN;
891
892		buf->file_priv = file_priv;
893
894		if (copy_to_user(&d->request_indices[i], &buf->idx,
895				     sizeof(buf->idx)))
896			return -EFAULT;
897		if (copy_to_user(&d->request_sizes[i], &buf->total,
898				     sizeof(buf->total)))
899			return -EFAULT;
900
901		d->granted_count++;
902	}
903	return 0;
904}
905
906int r128_cce_buffers(struct drm_device *dev, void *data, struct drm_file *file_priv)
907{
908	struct drm_device_dma *dma = dev->dma;
909	int ret = 0;
910	struct drm_dma *d = data;
911
912	LOCK_TEST_WITH_RETURN(dev, file_priv);
913
914	/* Please don't send us buffers.
915	 */
916	if (d->send_count != 0) {
917		DRM_ERROR("Process %d trying to send %d buffers via drmDMA\n",
918			  DRM_CURRENTPID, d->send_count);
919		return -EINVAL;
920	}
921
922	/* We'll send you buffers.
923	 */
924	if (d->request_count < 0 || d->request_count > dma->buf_count) {
925		DRM_ERROR("Process %d trying to get %d buffers (of %d max)\n",
926			  DRM_CURRENTPID, d->request_count, dma->buf_count);
927		return -EINVAL;
928	}
929
930	d->granted_count = 0;
931
932	if (d->request_count)
933		ret = r128_cce_get_buffers(dev, file_priv, d);
934
935	return ret;
936}