Linux Audio

Check our new training course

Loading...
v6.8
   1/*
   2 * Copyright 2014 Advanced Micro Devices, Inc.
   3 *
   4 * Permission is hereby granted, free of charge, to any person obtaining a
   5 * copy of this software and associated documentation files (the "Software"),
   6 * to deal in the Software without restriction, including without limitation
   7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
   8 * and/or sell copies of the Software, and to permit persons to whom the
   9 * Software is furnished to do so, subject to the following conditions:
  10 *
  11 * The above copyright notice and this permission notice shall be included in
  12 * all copies or substantial portions of the Software.
  13 *
  14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
  17 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
  18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
  19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
  20 * OTHER DEALINGS IN THE SOFTWARE.
  21 *
  22 * Authors: Christian König <christian.koenig@amd.com>
  23 */
  24
  25#include <linux/firmware.h>
  26
  27#include "amdgpu.h"
  28#include "amdgpu_uvd.h"
  29#include "vid.h"
  30#include "uvd/uvd_6_0_d.h"
  31#include "uvd/uvd_6_0_sh_mask.h"
  32#include "oss/oss_2_0_d.h"
  33#include "oss/oss_2_0_sh_mask.h"
  34#include "smu/smu_7_1_3_d.h"
  35#include "smu/smu_7_1_3_sh_mask.h"
  36#include "bif/bif_5_1_d.h"
  37#include "gmc/gmc_8_1_d.h"
  38#include "vi.h"
  39#include "ivsrcid/ivsrcid_vislands30.h"
  40
  41/* Polaris10/11/12 firmware version */
  42#define FW_1_130_16 ((1 << 24) | (130 << 16) | (16 << 8))
  43
  44static void uvd_v6_0_set_ring_funcs(struct amdgpu_device *adev);
  45static void uvd_v6_0_set_enc_ring_funcs(struct amdgpu_device *adev);
  46
  47static void uvd_v6_0_set_irq_funcs(struct amdgpu_device *adev);
  48static int uvd_v6_0_start(struct amdgpu_device *adev);
  49static void uvd_v6_0_stop(struct amdgpu_device *adev);
  50static void uvd_v6_0_set_sw_clock_gating(struct amdgpu_device *adev);
  51static int uvd_v6_0_set_clockgating_state(void *handle,
  52					  enum amd_clockgating_state state);
  53static void uvd_v6_0_enable_mgcg(struct amdgpu_device *adev,
  54				 bool enable);
  55
  56/**
  57* uvd_v6_0_enc_support - get encode support status
  58*
  59* @adev: amdgpu_device pointer
  60*
  61* Returns the current hardware encode support status
  62*/
  63static inline bool uvd_v6_0_enc_support(struct amdgpu_device *adev)
  64{
  65	return ((adev->asic_type >= CHIP_POLARIS10) &&
  66			(adev->asic_type <= CHIP_VEGAM) &&
  67			(!adev->uvd.fw_version || adev->uvd.fw_version >= FW_1_130_16));
  68}
  69
  70/**
  71 * uvd_v6_0_ring_get_rptr - get read pointer
  72 *
  73 * @ring: amdgpu_ring pointer
  74 *
  75 * Returns the current hardware read pointer
  76 */
  77static uint64_t uvd_v6_0_ring_get_rptr(struct amdgpu_ring *ring)
  78{
  79	struct amdgpu_device *adev = ring->adev;
  80
  81	return RREG32(mmUVD_RBC_RB_RPTR);
  82}
  83
  84/**
  85 * uvd_v6_0_enc_ring_get_rptr - get enc read pointer
  86 *
  87 * @ring: amdgpu_ring pointer
  88 *
  89 * Returns the current hardware enc read pointer
  90 */
  91static uint64_t uvd_v6_0_enc_ring_get_rptr(struct amdgpu_ring *ring)
  92{
  93	struct amdgpu_device *adev = ring->adev;
  94
  95	if (ring == &adev->uvd.inst->ring_enc[0])
  96		return RREG32(mmUVD_RB_RPTR);
  97	else
  98		return RREG32(mmUVD_RB_RPTR2);
  99}
 100/**
 101 * uvd_v6_0_ring_get_wptr - get write pointer
 102 *
 103 * @ring: amdgpu_ring pointer
 104 *
 105 * Returns the current hardware write pointer
 106 */
 107static uint64_t uvd_v6_0_ring_get_wptr(struct amdgpu_ring *ring)
 108{
 109	struct amdgpu_device *adev = ring->adev;
 110
 111	return RREG32(mmUVD_RBC_RB_WPTR);
 112}
 113
 114/**
 115 * uvd_v6_0_enc_ring_get_wptr - get enc write pointer
 116 *
 117 * @ring: amdgpu_ring pointer
 118 *
 119 * Returns the current hardware enc write pointer
 120 */
 121static uint64_t uvd_v6_0_enc_ring_get_wptr(struct amdgpu_ring *ring)
 122{
 123	struct amdgpu_device *adev = ring->adev;
 124
 125	if (ring == &adev->uvd.inst->ring_enc[0])
 126		return RREG32(mmUVD_RB_WPTR);
 127	else
 128		return RREG32(mmUVD_RB_WPTR2);
 129}
 130
 131/**
 132 * uvd_v6_0_ring_set_wptr - set write pointer
 133 *
 134 * @ring: amdgpu_ring pointer
 135 *
 136 * Commits the write pointer to the hardware
 137 */
 138static void uvd_v6_0_ring_set_wptr(struct amdgpu_ring *ring)
 139{
 140	struct amdgpu_device *adev = ring->adev;
 141
 142	WREG32(mmUVD_RBC_RB_WPTR, lower_32_bits(ring->wptr));
 143}
 144
 145/**
 146 * uvd_v6_0_enc_ring_set_wptr - set enc write pointer
 147 *
 148 * @ring: amdgpu_ring pointer
 149 *
 150 * Commits the enc write pointer to the hardware
 151 */
 152static void uvd_v6_0_enc_ring_set_wptr(struct amdgpu_ring *ring)
 153{
 154	struct amdgpu_device *adev = ring->adev;
 155
 156	if (ring == &adev->uvd.inst->ring_enc[0])
 157		WREG32(mmUVD_RB_WPTR,
 158			lower_32_bits(ring->wptr));
 159	else
 160		WREG32(mmUVD_RB_WPTR2,
 161			lower_32_bits(ring->wptr));
 162}
 163
 164/**
 165 * uvd_v6_0_enc_ring_test_ring - test if UVD ENC ring is working
 166 *
 167 * @ring: the engine to test on
 168 *
 169 */
 170static int uvd_v6_0_enc_ring_test_ring(struct amdgpu_ring *ring)
 171{
 172	struct amdgpu_device *adev = ring->adev;
 173	uint32_t rptr;
 174	unsigned i;
 175	int r;
 176
 177	r = amdgpu_ring_alloc(ring, 16);
 178	if (r)
 179		return r;
 180
 181	rptr = amdgpu_ring_get_rptr(ring);
 182
 183	amdgpu_ring_write(ring, HEVC_ENC_CMD_END);
 184	amdgpu_ring_commit(ring);
 185
 186	for (i = 0; i < adev->usec_timeout; i++) {
 187		if (amdgpu_ring_get_rptr(ring) != rptr)
 188			break;
 189		udelay(1);
 190	}
 191
 192	if (i >= adev->usec_timeout)
 193		r = -ETIMEDOUT;
 194
 195	return r;
 196}
 197
 198/**
 199 * uvd_v6_0_enc_get_create_msg - generate a UVD ENC create msg
 200 *
 201 * @ring: ring we should submit the msg to
 202 * @handle: session handle to use
 203 * @bo: amdgpu object for which we query the offset
 204 * @fence: optional fence to return
 205 *
 206 * Open up a stream for HW test
 207 */
 208static int uvd_v6_0_enc_get_create_msg(struct amdgpu_ring *ring, uint32_t handle,
 209				       struct amdgpu_bo *bo,
 210				       struct dma_fence **fence)
 211{
 212	const unsigned ib_size_dw = 16;
 213	struct amdgpu_job *job;
 214	struct amdgpu_ib *ib;
 215	struct dma_fence *f = NULL;
 216	uint64_t addr;
 217	int i, r;
 218
 219	r = amdgpu_job_alloc_with_ib(ring->adev, NULL, NULL, ib_size_dw * 4,
 220				     AMDGPU_IB_POOL_DIRECT, &job);
 221	if (r)
 222		return r;
 223
 224	ib = &job->ibs[0];
 225	addr = amdgpu_bo_gpu_offset(bo);
 226
 227	ib->length_dw = 0;
 228	ib->ptr[ib->length_dw++] = 0x00000018;
 229	ib->ptr[ib->length_dw++] = 0x00000001; /* session info */
 230	ib->ptr[ib->length_dw++] = handle;
 231	ib->ptr[ib->length_dw++] = 0x00010000;
 232	ib->ptr[ib->length_dw++] = upper_32_bits(addr);
 233	ib->ptr[ib->length_dw++] = addr;
 234
 235	ib->ptr[ib->length_dw++] = 0x00000014;
 236	ib->ptr[ib->length_dw++] = 0x00000002; /* task info */
 237	ib->ptr[ib->length_dw++] = 0x0000001c;
 238	ib->ptr[ib->length_dw++] = 0x00000001;
 239	ib->ptr[ib->length_dw++] = 0x00000000;
 240
 241	ib->ptr[ib->length_dw++] = 0x00000008;
 242	ib->ptr[ib->length_dw++] = 0x08000001; /* op initialize */
 243
 244	for (i = ib->length_dw; i < ib_size_dw; ++i)
 245		ib->ptr[i] = 0x0;
 246
 247	r = amdgpu_job_submit_direct(job, ring, &f);
 248	if (r)
 249		goto err;
 250
 251	if (fence)
 252		*fence = dma_fence_get(f);
 253	dma_fence_put(f);
 254	return 0;
 255
 256err:
 257	amdgpu_job_free(job);
 258	return r;
 259}
 260
 261/**
 262 * uvd_v6_0_enc_get_destroy_msg - generate a UVD ENC destroy msg
 263 *
 264 * @ring: ring we should submit the msg to
 265 * @handle: session handle to use
 266 * @bo: amdgpu object for which we query the offset
 267 * @fence: optional fence to return
 268 *
 269 * Close up a stream for HW test or if userspace failed to do so
 270 */
 271static int uvd_v6_0_enc_get_destroy_msg(struct amdgpu_ring *ring,
 272					uint32_t handle,
 273					struct amdgpu_bo *bo,
 274					struct dma_fence **fence)
 275{
 276	const unsigned ib_size_dw = 16;
 277	struct amdgpu_job *job;
 278	struct amdgpu_ib *ib;
 279	struct dma_fence *f = NULL;
 280	uint64_t addr;
 281	int i, r;
 282
 283	r = amdgpu_job_alloc_with_ib(ring->adev, NULL, NULL, ib_size_dw * 4,
 284				     AMDGPU_IB_POOL_DIRECT, &job);
 285	if (r)
 286		return r;
 287
 288	ib = &job->ibs[0];
 289	addr = amdgpu_bo_gpu_offset(bo);
 290
 291	ib->length_dw = 0;
 292	ib->ptr[ib->length_dw++] = 0x00000018;
 293	ib->ptr[ib->length_dw++] = 0x00000001; /* session info */
 294	ib->ptr[ib->length_dw++] = handle;
 295	ib->ptr[ib->length_dw++] = 0x00010000;
 296	ib->ptr[ib->length_dw++] = upper_32_bits(addr);
 297	ib->ptr[ib->length_dw++] = addr;
 298
 299	ib->ptr[ib->length_dw++] = 0x00000014;
 300	ib->ptr[ib->length_dw++] = 0x00000002; /* task info */
 301	ib->ptr[ib->length_dw++] = 0x0000001c;
 302	ib->ptr[ib->length_dw++] = 0x00000001;
 303	ib->ptr[ib->length_dw++] = 0x00000000;
 304
 305	ib->ptr[ib->length_dw++] = 0x00000008;
 306	ib->ptr[ib->length_dw++] = 0x08000002; /* op close session */
 307
 308	for (i = ib->length_dw; i < ib_size_dw; ++i)
 309		ib->ptr[i] = 0x0;
 310
 311	r = amdgpu_job_submit_direct(job, ring, &f);
 312	if (r)
 313		goto err;
 314
 315	if (fence)
 316		*fence = dma_fence_get(f);
 317	dma_fence_put(f);
 318	return 0;
 319
 320err:
 321	amdgpu_job_free(job);
 322	return r;
 323}
 324
 325/**
 326 * uvd_v6_0_enc_ring_test_ib - test if UVD ENC IBs are working
 327 *
 328 * @ring: the engine to test on
 329 * @timeout: timeout value in jiffies, or MAX_SCHEDULE_TIMEOUT
 330 *
 331 */
 332static int uvd_v6_0_enc_ring_test_ib(struct amdgpu_ring *ring, long timeout)
 333{
 334	struct dma_fence *fence = NULL;
 335	struct amdgpu_bo *bo = ring->adev->uvd.ib_bo;
 336	long r;
 337
 
 
 
 
 
 
 338	r = uvd_v6_0_enc_get_create_msg(ring, 1, bo, NULL);
 339	if (r)
 340		goto error;
 341
 342	r = uvd_v6_0_enc_get_destroy_msg(ring, 1, bo, &fence);
 343	if (r)
 344		goto error;
 345
 346	r = dma_fence_wait_timeout(fence, false, timeout);
 347	if (r == 0)
 348		r = -ETIMEDOUT;
 349	else if (r > 0)
 350		r = 0;
 351
 352error:
 353	dma_fence_put(fence);
 
 
 
 354	return r;
 355}
 356
 357static int uvd_v6_0_early_init(void *handle)
 358{
 359	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
 360	adev->uvd.num_uvd_inst = 1;
 361
 362	if (!(adev->flags & AMD_IS_APU) &&
 363	    (RREG32_SMC(ixCC_HARVEST_FUSES) & CC_HARVEST_FUSES__UVD_DISABLE_MASK))
 364		return -ENOENT;
 365
 366	uvd_v6_0_set_ring_funcs(adev);
 367
 368	if (uvd_v6_0_enc_support(adev)) {
 369		adev->uvd.num_enc_rings = 2;
 370		uvd_v6_0_set_enc_ring_funcs(adev);
 371	}
 372
 373	uvd_v6_0_set_irq_funcs(adev);
 374
 375	return 0;
 376}
 377
 378static int uvd_v6_0_sw_init(void *handle)
 379{
 380	struct amdgpu_ring *ring;
 381	int i, r;
 382	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
 383
 384	/* UVD TRAP */
 385	r = amdgpu_irq_add_id(adev, AMDGPU_IRQ_CLIENTID_LEGACY, VISLANDS30_IV_SRCID_UVD_SYSTEM_MESSAGE, &adev->uvd.inst->irq);
 386	if (r)
 387		return r;
 388
 389	/* UVD ENC TRAP */
 390	if (uvd_v6_0_enc_support(adev)) {
 391		for (i = 0; i < adev->uvd.num_enc_rings; ++i) {
 392			r = amdgpu_irq_add_id(adev, AMDGPU_IRQ_CLIENTID_LEGACY, i + VISLANDS30_IV_SRCID_UVD_ENC_GEN_PURP, &adev->uvd.inst->irq);
 393			if (r)
 394				return r;
 395		}
 396	}
 397
 398	r = amdgpu_uvd_sw_init(adev);
 399	if (r)
 400		return r;
 401
 402	if (!uvd_v6_0_enc_support(adev)) {
 403		for (i = 0; i < adev->uvd.num_enc_rings; ++i)
 404			adev->uvd.inst->ring_enc[i].funcs = NULL;
 405
 406		adev->uvd.inst->irq.num_types = 1;
 407		adev->uvd.num_enc_rings = 0;
 408
 409		DRM_INFO("UVD ENC is disabled\n");
 410	}
 411
 412	ring = &adev->uvd.inst->ring;
 413	sprintf(ring->name, "uvd");
 414	r = amdgpu_ring_init(adev, ring, 512, &adev->uvd.inst->irq, 0,
 415			     AMDGPU_RING_PRIO_DEFAULT, NULL);
 416	if (r)
 417		return r;
 418
 419	r = amdgpu_uvd_resume(adev);
 420	if (r)
 421		return r;
 422
 423	if (uvd_v6_0_enc_support(adev)) {
 424		for (i = 0; i < adev->uvd.num_enc_rings; ++i) {
 425			ring = &adev->uvd.inst->ring_enc[i];
 426			sprintf(ring->name, "uvd_enc%d", i);
 427			r = amdgpu_ring_init(adev, ring, 512,
 428					     &adev->uvd.inst->irq, 0,
 429					     AMDGPU_RING_PRIO_DEFAULT, NULL);
 430			if (r)
 431				return r;
 432		}
 433	}
 434
 
 
 435	return r;
 436}
 437
 438static int uvd_v6_0_sw_fini(void *handle)
 439{
 440	int i, r;
 441	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
 442
 443	r = amdgpu_uvd_suspend(adev);
 444	if (r)
 445		return r;
 446
 447	if (uvd_v6_0_enc_support(adev)) {
 448		for (i = 0; i < adev->uvd.num_enc_rings; ++i)
 449			amdgpu_ring_fini(&adev->uvd.inst->ring_enc[i]);
 450	}
 451
 452	return amdgpu_uvd_sw_fini(adev);
 453}
 454
 455/**
 456 * uvd_v6_0_hw_init - start and test UVD block
 457 *
 458 * @handle: handle used to pass amdgpu_device pointer
 459 *
 460 * Initialize the hardware, boot up the VCPU and do some testing
 461 */
 462static int uvd_v6_0_hw_init(void *handle)
 463{
 464	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
 465	struct amdgpu_ring *ring = &adev->uvd.inst->ring;
 466	uint32_t tmp;
 467	int i, r;
 468
 469	amdgpu_asic_set_uvd_clocks(adev, 10000, 10000);
 470	uvd_v6_0_set_clockgating_state(adev, AMD_CG_STATE_UNGATE);
 471	uvd_v6_0_enable_mgcg(adev, true);
 472
 473	r = amdgpu_ring_test_helper(ring);
 474	if (r)
 475		goto done;
 476
 477	r = amdgpu_ring_alloc(ring, 10);
 478	if (r) {
 479		DRM_ERROR("amdgpu: ring failed to lock UVD ring (%d).\n", r);
 480		goto done;
 481	}
 482
 483	tmp = PACKET0(mmUVD_SEMA_WAIT_FAULT_TIMEOUT_CNTL, 0);
 484	amdgpu_ring_write(ring, tmp);
 485	amdgpu_ring_write(ring, 0xFFFFF);
 486
 487	tmp = PACKET0(mmUVD_SEMA_WAIT_INCOMPLETE_TIMEOUT_CNTL, 0);
 488	amdgpu_ring_write(ring, tmp);
 489	amdgpu_ring_write(ring, 0xFFFFF);
 490
 491	tmp = PACKET0(mmUVD_SEMA_SIGNAL_INCOMPLETE_TIMEOUT_CNTL, 0);
 492	amdgpu_ring_write(ring, tmp);
 493	amdgpu_ring_write(ring, 0xFFFFF);
 494
 495	/* Clear timeout status bits */
 496	amdgpu_ring_write(ring, PACKET0(mmUVD_SEMA_TIMEOUT_STATUS, 0));
 497	amdgpu_ring_write(ring, 0x8);
 498
 499	amdgpu_ring_write(ring, PACKET0(mmUVD_SEMA_CNTL, 0));
 500	amdgpu_ring_write(ring, 3);
 501
 502	amdgpu_ring_commit(ring);
 503
 504	if (uvd_v6_0_enc_support(adev)) {
 505		for (i = 0; i < adev->uvd.num_enc_rings; ++i) {
 506			ring = &adev->uvd.inst->ring_enc[i];
 507			r = amdgpu_ring_test_helper(ring);
 508			if (r)
 509				goto done;
 510		}
 511	}
 512
 513done:
 514	if (!r) {
 515		if (uvd_v6_0_enc_support(adev))
 516			DRM_INFO("UVD and UVD ENC initialized successfully.\n");
 517		else
 518			DRM_INFO("UVD initialized successfully.\n");
 519	}
 520
 521	return r;
 522}
 523
 524/**
 525 * uvd_v6_0_hw_fini - stop the hardware block
 526 *
 527 * @handle: handle used to pass amdgpu_device pointer
 528 *
 529 * Stop the UVD block, mark ring as not ready any more
 530 */
 531static int uvd_v6_0_hw_fini(void *handle)
 532{
 533	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
 534
 535	cancel_delayed_work_sync(&adev->uvd.idle_work);
 536
 537	if (RREG32(mmUVD_STATUS) != 0)
 538		uvd_v6_0_stop(adev);
 539
 540	return 0;
 541}
 542
 543static int uvd_v6_0_prepare_suspend(void *handle)
 544{
 545	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
 546
 547	return amdgpu_uvd_prepare_suspend(adev);
 548}
 549
 550static int uvd_v6_0_suspend(void *handle)
 551{
 552	int r;
 553	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
 554
 555	/*
 556	 * Proper cleanups before halting the HW engine:
 557	 *   - cancel the delayed idle work
 558	 *   - enable powergating
 559	 *   - enable clockgating
 560	 *   - disable dpm
 561	 *
 562	 * TODO: to align with the VCN implementation, move the
 563	 * jobs for clockgating/powergating/dpm setting to
 564	 * ->set_powergating_state().
 565	 */
 566	cancel_delayed_work_sync(&adev->uvd.idle_work);
 567
 568	if (adev->pm.dpm_enabled) {
 569		amdgpu_dpm_enable_uvd(adev, false);
 570	} else {
 571		amdgpu_asic_set_uvd_clocks(adev, 0, 0);
 572		/* shutdown the UVD block */
 573		amdgpu_device_ip_set_powergating_state(adev, AMD_IP_BLOCK_TYPE_UVD,
 574						       AMD_PG_STATE_GATE);
 575		amdgpu_device_ip_set_clockgating_state(adev, AMD_IP_BLOCK_TYPE_UVD,
 576						       AMD_CG_STATE_GATE);
 577	}
 578
 579	r = uvd_v6_0_hw_fini(adev);
 580	if (r)
 581		return r;
 582
 583	return amdgpu_uvd_suspend(adev);
 584}
 585
 586static int uvd_v6_0_resume(void *handle)
 587{
 588	int r;
 589	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
 590
 591	r = amdgpu_uvd_resume(adev);
 592	if (r)
 593		return r;
 594
 595	return uvd_v6_0_hw_init(adev);
 596}
 597
 598/**
 599 * uvd_v6_0_mc_resume - memory controller programming
 600 *
 601 * @adev: amdgpu_device pointer
 602 *
 603 * Let the UVD memory controller know it's offsets
 604 */
 605static void uvd_v6_0_mc_resume(struct amdgpu_device *adev)
 606{
 607	uint64_t offset;
 608	uint32_t size;
 609
 610	/* program memory controller bits 0-27 */
 611	WREG32(mmUVD_LMI_VCPU_CACHE_64BIT_BAR_LOW,
 612			lower_32_bits(adev->uvd.inst->gpu_addr));
 613	WREG32(mmUVD_LMI_VCPU_CACHE_64BIT_BAR_HIGH,
 614			upper_32_bits(adev->uvd.inst->gpu_addr));
 615
 616	offset = AMDGPU_UVD_FIRMWARE_OFFSET;
 617	size = AMDGPU_UVD_FIRMWARE_SIZE(adev);
 618	WREG32(mmUVD_VCPU_CACHE_OFFSET0, offset >> 3);
 619	WREG32(mmUVD_VCPU_CACHE_SIZE0, size);
 620
 621	offset += size;
 622	size = AMDGPU_UVD_HEAP_SIZE;
 623	WREG32(mmUVD_VCPU_CACHE_OFFSET1, offset >> 3);
 624	WREG32(mmUVD_VCPU_CACHE_SIZE1, size);
 625
 626	offset += size;
 627	size = AMDGPU_UVD_STACK_SIZE +
 628	       (AMDGPU_UVD_SESSION_SIZE * adev->uvd.max_handles);
 629	WREG32(mmUVD_VCPU_CACHE_OFFSET2, offset >> 3);
 630	WREG32(mmUVD_VCPU_CACHE_SIZE2, size);
 631
 632	WREG32(mmUVD_UDEC_ADDR_CONFIG, adev->gfx.config.gb_addr_config);
 633	WREG32(mmUVD_UDEC_DB_ADDR_CONFIG, adev->gfx.config.gb_addr_config);
 634	WREG32(mmUVD_UDEC_DBW_ADDR_CONFIG, adev->gfx.config.gb_addr_config);
 635
 636	WREG32(mmUVD_GP_SCRATCH4, adev->uvd.max_handles);
 637}
 638
 639#if 0
 640static void cz_set_uvd_clock_gating_branches(struct amdgpu_device *adev,
 641		bool enable)
 642{
 643	u32 data, data1;
 644
 645	data = RREG32(mmUVD_CGC_GATE);
 646	data1 = RREG32(mmUVD_SUVD_CGC_GATE);
 647	if (enable) {
 648		data |= UVD_CGC_GATE__SYS_MASK |
 649				UVD_CGC_GATE__UDEC_MASK |
 650				UVD_CGC_GATE__MPEG2_MASK |
 651				UVD_CGC_GATE__RBC_MASK |
 652				UVD_CGC_GATE__LMI_MC_MASK |
 653				UVD_CGC_GATE__IDCT_MASK |
 654				UVD_CGC_GATE__MPRD_MASK |
 655				UVD_CGC_GATE__MPC_MASK |
 656				UVD_CGC_GATE__LBSI_MASK |
 657				UVD_CGC_GATE__LRBBM_MASK |
 658				UVD_CGC_GATE__UDEC_RE_MASK |
 659				UVD_CGC_GATE__UDEC_CM_MASK |
 660				UVD_CGC_GATE__UDEC_IT_MASK |
 661				UVD_CGC_GATE__UDEC_DB_MASK |
 662				UVD_CGC_GATE__UDEC_MP_MASK |
 663				UVD_CGC_GATE__WCB_MASK |
 664				UVD_CGC_GATE__VCPU_MASK |
 665				UVD_CGC_GATE__SCPU_MASK;
 666		data1 |= UVD_SUVD_CGC_GATE__SRE_MASK |
 667				UVD_SUVD_CGC_GATE__SIT_MASK |
 668				UVD_SUVD_CGC_GATE__SMP_MASK |
 669				UVD_SUVD_CGC_GATE__SCM_MASK |
 670				UVD_SUVD_CGC_GATE__SDB_MASK |
 671				UVD_SUVD_CGC_GATE__SRE_H264_MASK |
 672				UVD_SUVD_CGC_GATE__SRE_HEVC_MASK |
 673				UVD_SUVD_CGC_GATE__SIT_H264_MASK |
 674				UVD_SUVD_CGC_GATE__SIT_HEVC_MASK |
 675				UVD_SUVD_CGC_GATE__SCM_H264_MASK |
 676				UVD_SUVD_CGC_GATE__SCM_HEVC_MASK |
 677				UVD_SUVD_CGC_GATE__SDB_H264_MASK |
 678				UVD_SUVD_CGC_GATE__SDB_HEVC_MASK;
 679	} else {
 680		data &= ~(UVD_CGC_GATE__SYS_MASK |
 681				UVD_CGC_GATE__UDEC_MASK |
 682				UVD_CGC_GATE__MPEG2_MASK |
 683				UVD_CGC_GATE__RBC_MASK |
 684				UVD_CGC_GATE__LMI_MC_MASK |
 685				UVD_CGC_GATE__LMI_UMC_MASK |
 686				UVD_CGC_GATE__IDCT_MASK |
 687				UVD_CGC_GATE__MPRD_MASK |
 688				UVD_CGC_GATE__MPC_MASK |
 689				UVD_CGC_GATE__LBSI_MASK |
 690				UVD_CGC_GATE__LRBBM_MASK |
 691				UVD_CGC_GATE__UDEC_RE_MASK |
 692				UVD_CGC_GATE__UDEC_CM_MASK |
 693				UVD_CGC_GATE__UDEC_IT_MASK |
 694				UVD_CGC_GATE__UDEC_DB_MASK |
 695				UVD_CGC_GATE__UDEC_MP_MASK |
 696				UVD_CGC_GATE__WCB_MASK |
 697				UVD_CGC_GATE__VCPU_MASK |
 698				UVD_CGC_GATE__SCPU_MASK);
 699		data1 &= ~(UVD_SUVD_CGC_GATE__SRE_MASK |
 700				UVD_SUVD_CGC_GATE__SIT_MASK |
 701				UVD_SUVD_CGC_GATE__SMP_MASK |
 702				UVD_SUVD_CGC_GATE__SCM_MASK |
 703				UVD_SUVD_CGC_GATE__SDB_MASK |
 704				UVD_SUVD_CGC_GATE__SRE_H264_MASK |
 705				UVD_SUVD_CGC_GATE__SRE_HEVC_MASK |
 706				UVD_SUVD_CGC_GATE__SIT_H264_MASK |
 707				UVD_SUVD_CGC_GATE__SIT_HEVC_MASK |
 708				UVD_SUVD_CGC_GATE__SCM_H264_MASK |
 709				UVD_SUVD_CGC_GATE__SCM_HEVC_MASK |
 710				UVD_SUVD_CGC_GATE__SDB_H264_MASK |
 711				UVD_SUVD_CGC_GATE__SDB_HEVC_MASK);
 712	}
 713	WREG32(mmUVD_CGC_GATE, data);
 714	WREG32(mmUVD_SUVD_CGC_GATE, data1);
 715}
 716#endif
 717
 718/**
 719 * uvd_v6_0_start - start UVD block
 720 *
 721 * @adev: amdgpu_device pointer
 722 *
 723 * Setup and start the UVD block
 724 */
 725static int uvd_v6_0_start(struct amdgpu_device *adev)
 726{
 727	struct amdgpu_ring *ring = &adev->uvd.inst->ring;
 728	uint32_t rb_bufsz, tmp;
 729	uint32_t lmi_swap_cntl;
 730	uint32_t mp_swap_cntl;
 731	int i, j, r;
 732
 733	/* disable DPG */
 734	WREG32_P(mmUVD_POWER_STATUS, 0, ~UVD_POWER_STATUS__UVD_PG_MODE_MASK);
 735
 736	/* disable byte swapping */
 737	lmi_swap_cntl = 0;
 738	mp_swap_cntl = 0;
 739
 740	uvd_v6_0_mc_resume(adev);
 741
 742	/* disable interupt */
 743	WREG32_FIELD(UVD_MASTINT_EN, VCPU_EN, 0);
 744
 745	/* stall UMC and register bus before resetting VCPU */
 746	WREG32_FIELD(UVD_LMI_CTRL2, STALL_ARB_UMC, 1);
 747	mdelay(1);
 748
 749	/* put LMI, VCPU, RBC etc... into reset */
 750	WREG32(mmUVD_SOFT_RESET,
 751		UVD_SOFT_RESET__LMI_SOFT_RESET_MASK |
 752		UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK |
 753		UVD_SOFT_RESET__LBSI_SOFT_RESET_MASK |
 754		UVD_SOFT_RESET__RBC_SOFT_RESET_MASK |
 755		UVD_SOFT_RESET__CSM_SOFT_RESET_MASK |
 756		UVD_SOFT_RESET__CXW_SOFT_RESET_MASK |
 757		UVD_SOFT_RESET__TAP_SOFT_RESET_MASK |
 758		UVD_SOFT_RESET__LMI_UMC_SOFT_RESET_MASK);
 759	mdelay(5);
 760
 761	/* take UVD block out of reset */
 762	WREG32_FIELD(SRBM_SOFT_RESET, SOFT_RESET_UVD, 0);
 763	mdelay(5);
 764
 765	/* initialize UVD memory controller */
 766	WREG32(mmUVD_LMI_CTRL,
 767		(0x40 << UVD_LMI_CTRL__WRITE_CLEAN_TIMER__SHIFT) |
 768		UVD_LMI_CTRL__WRITE_CLEAN_TIMER_EN_MASK |
 769		UVD_LMI_CTRL__DATA_COHERENCY_EN_MASK |
 770		UVD_LMI_CTRL__VCPU_DATA_COHERENCY_EN_MASK |
 771		UVD_LMI_CTRL__REQ_MODE_MASK |
 772		UVD_LMI_CTRL__DISABLE_ON_FWV_FAIL_MASK);
 773
 774#ifdef __BIG_ENDIAN
 775	/* swap (8 in 32) RB and IB */
 776	lmi_swap_cntl = 0xa;
 777	mp_swap_cntl = 0;
 778#endif
 779	WREG32(mmUVD_LMI_SWAP_CNTL, lmi_swap_cntl);
 780	WREG32(mmUVD_MP_SWAP_CNTL, mp_swap_cntl);
 781
 782	WREG32(mmUVD_MPC_SET_MUXA0, 0x40c2040);
 783	WREG32(mmUVD_MPC_SET_MUXA1, 0x0);
 784	WREG32(mmUVD_MPC_SET_MUXB0, 0x40c2040);
 785	WREG32(mmUVD_MPC_SET_MUXB1, 0x0);
 786	WREG32(mmUVD_MPC_SET_ALU, 0);
 787	WREG32(mmUVD_MPC_SET_MUX, 0x88);
 788
 789	/* take all subblocks out of reset, except VCPU */
 790	WREG32(mmUVD_SOFT_RESET, UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
 791	mdelay(5);
 792
 793	/* enable VCPU clock */
 794	WREG32(mmUVD_VCPU_CNTL, UVD_VCPU_CNTL__CLK_EN_MASK);
 795
 796	/* enable UMC */
 797	WREG32_FIELD(UVD_LMI_CTRL2, STALL_ARB_UMC, 0);
 798
 799	/* boot up the VCPU */
 800	WREG32(mmUVD_SOFT_RESET, 0);
 801	mdelay(10);
 802
 803	for (i = 0; i < 10; ++i) {
 804		uint32_t status;
 805
 806		for (j = 0; j < 100; ++j) {
 807			status = RREG32(mmUVD_STATUS);
 808			if (status & 2)
 809				break;
 810			mdelay(10);
 811		}
 812		r = 0;
 813		if (status & 2)
 814			break;
 815
 816		DRM_ERROR("UVD not responding, trying to reset the VCPU!!!\n");
 817		WREG32_FIELD(UVD_SOFT_RESET, VCPU_SOFT_RESET, 1);
 818		mdelay(10);
 819		WREG32_FIELD(UVD_SOFT_RESET, VCPU_SOFT_RESET, 0);
 820		mdelay(10);
 821		r = -1;
 822	}
 823
 824	if (r) {
 825		DRM_ERROR("UVD not responding, giving up!!!\n");
 826		return r;
 827	}
 828	/* enable master interrupt */
 829	WREG32_P(mmUVD_MASTINT_EN,
 830		(UVD_MASTINT_EN__VCPU_EN_MASK|UVD_MASTINT_EN__SYS_EN_MASK),
 831		~(UVD_MASTINT_EN__VCPU_EN_MASK|UVD_MASTINT_EN__SYS_EN_MASK));
 832
 833	/* clear the bit 4 of UVD_STATUS */
 834	WREG32_P(mmUVD_STATUS, 0, ~(2 << UVD_STATUS__VCPU_REPORT__SHIFT));
 835
 836	/* force RBC into idle state */
 837	rb_bufsz = order_base_2(ring->ring_size);
 838	tmp = REG_SET_FIELD(0, UVD_RBC_RB_CNTL, RB_BUFSZ, rb_bufsz);
 839	tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_BLKSZ, 1);
 840	tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_NO_FETCH, 1);
 841	tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_WPTR_POLL_EN, 0);
 842	tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_NO_UPDATE, 1);
 843	tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_RPTR_WR_EN, 1);
 844	WREG32(mmUVD_RBC_RB_CNTL, tmp);
 845
 846	/* set the write pointer delay */
 847	WREG32(mmUVD_RBC_RB_WPTR_CNTL, 0);
 848
 849	/* set the wb address */
 850	WREG32(mmUVD_RBC_RB_RPTR_ADDR, (upper_32_bits(ring->gpu_addr) >> 2));
 851
 852	/* program the RB_BASE for ring buffer */
 853	WREG32(mmUVD_LMI_RBC_RB_64BIT_BAR_LOW,
 854			lower_32_bits(ring->gpu_addr));
 855	WREG32(mmUVD_LMI_RBC_RB_64BIT_BAR_HIGH,
 856			upper_32_bits(ring->gpu_addr));
 857
 858	/* Initialize the ring buffer's read and write pointers */
 859	WREG32(mmUVD_RBC_RB_RPTR, 0);
 860
 861	ring->wptr = RREG32(mmUVD_RBC_RB_RPTR);
 862	WREG32(mmUVD_RBC_RB_WPTR, lower_32_bits(ring->wptr));
 863
 864	WREG32_FIELD(UVD_RBC_RB_CNTL, RB_NO_FETCH, 0);
 865
 866	if (uvd_v6_0_enc_support(adev)) {
 867		ring = &adev->uvd.inst->ring_enc[0];
 868		WREG32(mmUVD_RB_RPTR, lower_32_bits(ring->wptr));
 869		WREG32(mmUVD_RB_WPTR, lower_32_bits(ring->wptr));
 870		WREG32(mmUVD_RB_BASE_LO, ring->gpu_addr);
 871		WREG32(mmUVD_RB_BASE_HI, upper_32_bits(ring->gpu_addr));
 872		WREG32(mmUVD_RB_SIZE, ring->ring_size / 4);
 873
 874		ring = &adev->uvd.inst->ring_enc[1];
 875		WREG32(mmUVD_RB_RPTR2, lower_32_bits(ring->wptr));
 876		WREG32(mmUVD_RB_WPTR2, lower_32_bits(ring->wptr));
 877		WREG32(mmUVD_RB_BASE_LO2, ring->gpu_addr);
 878		WREG32(mmUVD_RB_BASE_HI2, upper_32_bits(ring->gpu_addr));
 879		WREG32(mmUVD_RB_SIZE2, ring->ring_size / 4);
 880	}
 881
 882	return 0;
 883}
 884
 885/**
 886 * uvd_v6_0_stop - stop UVD block
 887 *
 888 * @adev: amdgpu_device pointer
 889 *
 890 * stop the UVD block
 891 */
 892static void uvd_v6_0_stop(struct amdgpu_device *adev)
 893{
 894	/* force RBC into idle state */
 895	WREG32(mmUVD_RBC_RB_CNTL, 0x11010101);
 896
 897	/* Stall UMC and register bus before resetting VCPU */
 898	WREG32_P(mmUVD_LMI_CTRL2, 1 << 8, ~(1 << 8));
 899	mdelay(1);
 900
 901	/* put VCPU into reset */
 902	WREG32(mmUVD_SOFT_RESET, UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
 903	mdelay(5);
 904
 905	/* disable VCPU clock */
 906	WREG32(mmUVD_VCPU_CNTL, 0x0);
 907
 908	/* Unstall UMC and register bus */
 909	WREG32_P(mmUVD_LMI_CTRL2, 0, ~(1 << 8));
 910
 911	WREG32(mmUVD_STATUS, 0);
 912}
 913
 914/**
 915 * uvd_v6_0_ring_emit_fence - emit an fence & trap command
 916 *
 917 * @ring: amdgpu_ring pointer
 918 * @addr: address
 919 * @seq: sequence number
 920 * @flags: fence related flags
 921 *
 922 * Write a fence and a trap command to the ring.
 923 */
 924static void uvd_v6_0_ring_emit_fence(struct amdgpu_ring *ring, u64 addr, u64 seq,
 925				     unsigned flags)
 926{
 927	WARN_ON(flags & AMDGPU_FENCE_FLAG_64BIT);
 928
 929	amdgpu_ring_write(ring, PACKET0(mmUVD_CONTEXT_ID, 0));
 930	amdgpu_ring_write(ring, seq);
 931	amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_DATA0, 0));
 932	amdgpu_ring_write(ring, addr & 0xffffffff);
 933	amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_DATA1, 0));
 934	amdgpu_ring_write(ring, upper_32_bits(addr) & 0xff);
 935	amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_CMD, 0));
 936	amdgpu_ring_write(ring, 0);
 937
 938	amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_DATA0, 0));
 939	amdgpu_ring_write(ring, 0);
 940	amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_DATA1, 0));
 941	amdgpu_ring_write(ring, 0);
 942	amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_CMD, 0));
 943	amdgpu_ring_write(ring, 2);
 944}
 945
 946/**
 947 * uvd_v6_0_enc_ring_emit_fence - emit an enc fence & trap command
 948 *
 949 * @ring: amdgpu_ring pointer
 950 * @addr: address
 951 * @seq: sequence number
 952 * @flags: fence related flags
 953 *
 954 * Write enc a fence and a trap command to the ring.
 955 */
 956static void uvd_v6_0_enc_ring_emit_fence(struct amdgpu_ring *ring, u64 addr,
 957			u64 seq, unsigned flags)
 958{
 959	WARN_ON(flags & AMDGPU_FENCE_FLAG_64BIT);
 960
 961	amdgpu_ring_write(ring, HEVC_ENC_CMD_FENCE);
 962	amdgpu_ring_write(ring, addr);
 963	amdgpu_ring_write(ring, upper_32_bits(addr));
 964	amdgpu_ring_write(ring, seq);
 965	amdgpu_ring_write(ring, HEVC_ENC_CMD_TRAP);
 966}
 967
 968/**
 969 * uvd_v6_0_ring_emit_hdp_flush - skip HDP flushing
 970 *
 971 * @ring: amdgpu_ring pointer
 972 */
 973static void uvd_v6_0_ring_emit_hdp_flush(struct amdgpu_ring *ring)
 974{
 975	/* The firmware doesn't seem to like touching registers at this point. */
 976}
 977
 978/**
 979 * uvd_v6_0_ring_test_ring - register write test
 980 *
 981 * @ring: amdgpu_ring pointer
 982 *
 983 * Test if we can successfully write to the context register
 984 */
 985static int uvd_v6_0_ring_test_ring(struct amdgpu_ring *ring)
 986{
 987	struct amdgpu_device *adev = ring->adev;
 988	uint32_t tmp = 0;
 989	unsigned i;
 990	int r;
 991
 992	WREG32(mmUVD_CONTEXT_ID, 0xCAFEDEAD);
 993	r = amdgpu_ring_alloc(ring, 3);
 994	if (r)
 995		return r;
 996
 997	amdgpu_ring_write(ring, PACKET0(mmUVD_CONTEXT_ID, 0));
 998	amdgpu_ring_write(ring, 0xDEADBEEF);
 999	amdgpu_ring_commit(ring);
1000	for (i = 0; i < adev->usec_timeout; i++) {
1001		tmp = RREG32(mmUVD_CONTEXT_ID);
1002		if (tmp == 0xDEADBEEF)
1003			break;
1004		udelay(1);
1005	}
1006
1007	if (i >= adev->usec_timeout)
1008		r = -ETIMEDOUT;
1009
1010	return r;
1011}
1012
1013/**
1014 * uvd_v6_0_ring_emit_ib - execute indirect buffer
1015 *
1016 * @ring: amdgpu_ring pointer
1017 * @job: job to retrieve vmid from
1018 * @ib: indirect buffer to execute
1019 * @flags: unused
1020 *
1021 * Write ring commands to execute the indirect buffer
1022 */
1023static void uvd_v6_0_ring_emit_ib(struct amdgpu_ring *ring,
1024				  struct amdgpu_job *job,
1025				  struct amdgpu_ib *ib,
1026				  uint32_t flags)
1027{
1028	unsigned vmid = AMDGPU_JOB_GET_VMID(job);
1029
1030	amdgpu_ring_write(ring, PACKET0(mmUVD_LMI_RBC_IB_VMID, 0));
1031	amdgpu_ring_write(ring, vmid);
1032
1033	amdgpu_ring_write(ring, PACKET0(mmUVD_LMI_RBC_IB_64BIT_BAR_LOW, 0));
1034	amdgpu_ring_write(ring, lower_32_bits(ib->gpu_addr));
1035	amdgpu_ring_write(ring, PACKET0(mmUVD_LMI_RBC_IB_64BIT_BAR_HIGH, 0));
1036	amdgpu_ring_write(ring, upper_32_bits(ib->gpu_addr));
1037	amdgpu_ring_write(ring, PACKET0(mmUVD_RBC_IB_SIZE, 0));
1038	amdgpu_ring_write(ring, ib->length_dw);
1039}
1040
1041/**
1042 * uvd_v6_0_enc_ring_emit_ib - enc execute indirect buffer
1043 *
1044 * @ring: amdgpu_ring pointer
1045 * @job: job to retrive vmid from
1046 * @ib: indirect buffer to execute
1047 * @flags: unused
1048 *
1049 * Write enc ring commands to execute the indirect buffer
1050 */
1051static void uvd_v6_0_enc_ring_emit_ib(struct amdgpu_ring *ring,
1052					struct amdgpu_job *job,
1053					struct amdgpu_ib *ib,
1054					uint32_t flags)
1055{
1056	unsigned vmid = AMDGPU_JOB_GET_VMID(job);
1057
1058	amdgpu_ring_write(ring, HEVC_ENC_CMD_IB_VM);
1059	amdgpu_ring_write(ring, vmid);
1060	amdgpu_ring_write(ring, lower_32_bits(ib->gpu_addr));
1061	amdgpu_ring_write(ring, upper_32_bits(ib->gpu_addr));
1062	amdgpu_ring_write(ring, ib->length_dw);
1063}
1064
1065static void uvd_v6_0_ring_emit_wreg(struct amdgpu_ring *ring,
1066				    uint32_t reg, uint32_t val)
1067{
1068	amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_DATA0, 0));
1069	amdgpu_ring_write(ring, reg << 2);
1070	amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_DATA1, 0));
1071	amdgpu_ring_write(ring, val);
1072	amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_CMD, 0));
1073	amdgpu_ring_write(ring, 0x8);
1074}
1075
1076static void uvd_v6_0_ring_emit_vm_flush(struct amdgpu_ring *ring,
1077					unsigned vmid, uint64_t pd_addr)
1078{
1079	amdgpu_gmc_emit_flush_gpu_tlb(ring, vmid, pd_addr);
1080
1081	amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_DATA0, 0));
1082	amdgpu_ring_write(ring, mmVM_INVALIDATE_REQUEST << 2);
1083	amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_DATA1, 0));
1084	amdgpu_ring_write(ring, 0);
1085	amdgpu_ring_write(ring, PACKET0(mmUVD_GP_SCRATCH8, 0));
1086	amdgpu_ring_write(ring, 1 << vmid); /* mask */
1087	amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_CMD, 0));
1088	amdgpu_ring_write(ring, 0xC);
1089}
1090
1091static void uvd_v6_0_ring_emit_pipeline_sync(struct amdgpu_ring *ring)
1092{
1093	uint32_t seq = ring->fence_drv.sync_seq;
1094	uint64_t addr = ring->fence_drv.gpu_addr;
1095
1096	amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_DATA0, 0));
1097	amdgpu_ring_write(ring, lower_32_bits(addr));
1098	amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_DATA1, 0));
1099	amdgpu_ring_write(ring, upper_32_bits(addr));
1100	amdgpu_ring_write(ring, PACKET0(mmUVD_GP_SCRATCH8, 0));
1101	amdgpu_ring_write(ring, 0xffffffff); /* mask */
1102	amdgpu_ring_write(ring, PACKET0(mmUVD_GP_SCRATCH9, 0));
1103	amdgpu_ring_write(ring, seq);
1104	amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_CMD, 0));
1105	amdgpu_ring_write(ring, 0xE);
1106}
1107
1108static void uvd_v6_0_ring_insert_nop(struct amdgpu_ring *ring, uint32_t count)
1109{
1110	int i;
1111
1112	WARN_ON(ring->wptr % 2 || count % 2);
1113
1114	for (i = 0; i < count / 2; i++) {
1115		amdgpu_ring_write(ring, PACKET0(mmUVD_NO_OP, 0));
1116		amdgpu_ring_write(ring, 0);
1117	}
1118}
1119
1120static void uvd_v6_0_enc_ring_emit_pipeline_sync(struct amdgpu_ring *ring)
1121{
1122	uint32_t seq = ring->fence_drv.sync_seq;
1123	uint64_t addr = ring->fence_drv.gpu_addr;
1124
1125	amdgpu_ring_write(ring, HEVC_ENC_CMD_WAIT_GE);
1126	amdgpu_ring_write(ring, lower_32_bits(addr));
1127	amdgpu_ring_write(ring, upper_32_bits(addr));
1128	amdgpu_ring_write(ring, seq);
1129}
1130
1131static void uvd_v6_0_enc_ring_insert_end(struct amdgpu_ring *ring)
1132{
1133	amdgpu_ring_write(ring, HEVC_ENC_CMD_END);
1134}
1135
1136static void uvd_v6_0_enc_ring_emit_vm_flush(struct amdgpu_ring *ring,
1137					    unsigned int vmid, uint64_t pd_addr)
1138{
1139	amdgpu_ring_write(ring, HEVC_ENC_CMD_UPDATE_PTB);
1140	amdgpu_ring_write(ring, vmid);
1141	amdgpu_ring_write(ring, pd_addr >> 12);
1142
1143	amdgpu_ring_write(ring, HEVC_ENC_CMD_FLUSH_TLB);
1144	amdgpu_ring_write(ring, vmid);
1145}
1146
1147static bool uvd_v6_0_is_idle(void *handle)
1148{
1149	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
1150
1151	return !(RREG32(mmSRBM_STATUS) & SRBM_STATUS__UVD_BUSY_MASK);
1152}
1153
1154static int uvd_v6_0_wait_for_idle(void *handle)
1155{
1156	unsigned i;
1157	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
1158
1159	for (i = 0; i < adev->usec_timeout; i++) {
1160		if (uvd_v6_0_is_idle(handle))
1161			return 0;
1162	}
1163	return -ETIMEDOUT;
1164}
1165
1166#define AMDGPU_UVD_STATUS_BUSY_MASK    0xfd
1167static bool uvd_v6_0_check_soft_reset(void *handle)
1168{
1169	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
1170	u32 srbm_soft_reset = 0;
1171	u32 tmp = RREG32(mmSRBM_STATUS);
1172
1173	if (REG_GET_FIELD(tmp, SRBM_STATUS, UVD_RQ_PENDING) ||
1174	    REG_GET_FIELD(tmp, SRBM_STATUS, UVD_BUSY) ||
1175	    (RREG32(mmUVD_STATUS) & AMDGPU_UVD_STATUS_BUSY_MASK))
1176		srbm_soft_reset = REG_SET_FIELD(srbm_soft_reset, SRBM_SOFT_RESET, SOFT_RESET_UVD, 1);
1177
1178	if (srbm_soft_reset) {
1179		adev->uvd.inst->srbm_soft_reset = srbm_soft_reset;
1180		return true;
1181	} else {
1182		adev->uvd.inst->srbm_soft_reset = 0;
1183		return false;
1184	}
1185}
1186
1187static int uvd_v6_0_pre_soft_reset(void *handle)
1188{
1189	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
1190
1191	if (!adev->uvd.inst->srbm_soft_reset)
1192		return 0;
1193
1194	uvd_v6_0_stop(adev);
1195	return 0;
1196}
1197
1198static int uvd_v6_0_soft_reset(void *handle)
1199{
1200	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
1201	u32 srbm_soft_reset;
1202
1203	if (!adev->uvd.inst->srbm_soft_reset)
1204		return 0;
1205	srbm_soft_reset = adev->uvd.inst->srbm_soft_reset;
1206
1207	if (srbm_soft_reset) {
1208		u32 tmp;
1209
1210		tmp = RREG32(mmSRBM_SOFT_RESET);
1211		tmp |= srbm_soft_reset;
1212		dev_info(adev->dev, "SRBM_SOFT_RESET=0x%08X\n", tmp);
1213		WREG32(mmSRBM_SOFT_RESET, tmp);
1214		tmp = RREG32(mmSRBM_SOFT_RESET);
1215
1216		udelay(50);
1217
1218		tmp &= ~srbm_soft_reset;
1219		WREG32(mmSRBM_SOFT_RESET, tmp);
1220		tmp = RREG32(mmSRBM_SOFT_RESET);
1221
1222		/* Wait a little for things to settle down */
1223		udelay(50);
1224	}
1225
1226	return 0;
1227}
1228
1229static int uvd_v6_0_post_soft_reset(void *handle)
1230{
1231	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
1232
1233	if (!adev->uvd.inst->srbm_soft_reset)
1234		return 0;
1235
1236	mdelay(5);
1237
1238	return uvd_v6_0_start(adev);
1239}
1240
1241static int uvd_v6_0_set_interrupt_state(struct amdgpu_device *adev,
1242					struct amdgpu_irq_src *source,
1243					unsigned type,
1244					enum amdgpu_interrupt_state state)
1245{
1246	// TODO
1247	return 0;
1248}
1249
1250static int uvd_v6_0_process_interrupt(struct amdgpu_device *adev,
1251				      struct amdgpu_irq_src *source,
1252				      struct amdgpu_iv_entry *entry)
1253{
1254	bool int_handled = true;
1255	DRM_DEBUG("IH: UVD TRAP\n");
1256
1257	switch (entry->src_id) {
1258	case 124:
1259		amdgpu_fence_process(&adev->uvd.inst->ring);
1260		break;
1261	case 119:
1262		if (likely(uvd_v6_0_enc_support(adev)))
1263			amdgpu_fence_process(&adev->uvd.inst->ring_enc[0]);
1264		else
1265			int_handled = false;
1266		break;
1267	case 120:
1268		if (likely(uvd_v6_0_enc_support(adev)))
1269			amdgpu_fence_process(&adev->uvd.inst->ring_enc[1]);
1270		else
1271			int_handled = false;
1272		break;
1273	}
1274
1275	if (!int_handled)
1276		DRM_ERROR("Unhandled interrupt: %d %d\n",
1277			  entry->src_id, entry->src_data[0]);
1278
1279	return 0;
1280}
1281
1282static void uvd_v6_0_enable_clock_gating(struct amdgpu_device *adev, bool enable)
1283{
1284	uint32_t data1, data3;
1285
1286	data1 = RREG32(mmUVD_SUVD_CGC_GATE);
1287	data3 = RREG32(mmUVD_CGC_GATE);
1288
1289	data1 |= UVD_SUVD_CGC_GATE__SRE_MASK |
1290		     UVD_SUVD_CGC_GATE__SIT_MASK |
1291		     UVD_SUVD_CGC_GATE__SMP_MASK |
1292		     UVD_SUVD_CGC_GATE__SCM_MASK |
1293		     UVD_SUVD_CGC_GATE__SDB_MASK |
1294		     UVD_SUVD_CGC_GATE__SRE_H264_MASK |
1295		     UVD_SUVD_CGC_GATE__SRE_HEVC_MASK |
1296		     UVD_SUVD_CGC_GATE__SIT_H264_MASK |
1297		     UVD_SUVD_CGC_GATE__SIT_HEVC_MASK |
1298		     UVD_SUVD_CGC_GATE__SCM_H264_MASK |
1299		     UVD_SUVD_CGC_GATE__SCM_HEVC_MASK |
1300		     UVD_SUVD_CGC_GATE__SDB_H264_MASK |
1301		     UVD_SUVD_CGC_GATE__SDB_HEVC_MASK;
1302
1303	if (enable) {
1304		data3 |= (UVD_CGC_GATE__SYS_MASK       |
1305			UVD_CGC_GATE__UDEC_MASK      |
1306			UVD_CGC_GATE__MPEG2_MASK     |
1307			UVD_CGC_GATE__RBC_MASK       |
1308			UVD_CGC_GATE__LMI_MC_MASK    |
1309			UVD_CGC_GATE__LMI_UMC_MASK   |
1310			UVD_CGC_GATE__IDCT_MASK      |
1311			UVD_CGC_GATE__MPRD_MASK      |
1312			UVD_CGC_GATE__MPC_MASK       |
1313			UVD_CGC_GATE__LBSI_MASK      |
1314			UVD_CGC_GATE__LRBBM_MASK     |
1315			UVD_CGC_GATE__UDEC_RE_MASK   |
1316			UVD_CGC_GATE__UDEC_CM_MASK   |
1317			UVD_CGC_GATE__UDEC_IT_MASK   |
1318			UVD_CGC_GATE__UDEC_DB_MASK   |
1319			UVD_CGC_GATE__UDEC_MP_MASK   |
1320			UVD_CGC_GATE__WCB_MASK       |
1321			UVD_CGC_GATE__JPEG_MASK      |
1322			UVD_CGC_GATE__SCPU_MASK      |
1323			UVD_CGC_GATE__JPEG2_MASK);
1324		/* only in pg enabled, we can gate clock to vcpu*/
1325		if (adev->pg_flags & AMD_PG_SUPPORT_UVD)
1326			data3 |= UVD_CGC_GATE__VCPU_MASK;
1327
1328		data3 &= ~UVD_CGC_GATE__REGS_MASK;
1329	} else {
1330		data3 = 0;
1331	}
1332
1333	WREG32(mmUVD_SUVD_CGC_GATE, data1);
1334	WREG32(mmUVD_CGC_GATE, data3);
1335}
1336
1337static void uvd_v6_0_set_sw_clock_gating(struct amdgpu_device *adev)
1338{
1339	uint32_t data, data2;
1340
1341	data = RREG32(mmUVD_CGC_CTRL);
1342	data2 = RREG32(mmUVD_SUVD_CGC_CTRL);
1343
1344
1345	data &= ~(UVD_CGC_CTRL__CLK_OFF_DELAY_MASK |
1346		  UVD_CGC_CTRL__CLK_GATE_DLY_TIMER_MASK);
1347
1348
1349	data |= UVD_CGC_CTRL__DYN_CLOCK_MODE_MASK |
1350		(1 << REG_FIELD_SHIFT(UVD_CGC_CTRL, CLK_GATE_DLY_TIMER)) |
1351		(4 << REG_FIELD_SHIFT(UVD_CGC_CTRL, CLK_OFF_DELAY));
1352
1353	data &= ~(UVD_CGC_CTRL__UDEC_RE_MODE_MASK |
1354			UVD_CGC_CTRL__UDEC_CM_MODE_MASK |
1355			UVD_CGC_CTRL__UDEC_IT_MODE_MASK |
1356			UVD_CGC_CTRL__UDEC_DB_MODE_MASK |
1357			UVD_CGC_CTRL__UDEC_MP_MODE_MASK |
1358			UVD_CGC_CTRL__SYS_MODE_MASK |
1359			UVD_CGC_CTRL__UDEC_MODE_MASK |
1360			UVD_CGC_CTRL__MPEG2_MODE_MASK |
1361			UVD_CGC_CTRL__REGS_MODE_MASK |
1362			UVD_CGC_CTRL__RBC_MODE_MASK |
1363			UVD_CGC_CTRL__LMI_MC_MODE_MASK |
1364			UVD_CGC_CTRL__LMI_UMC_MODE_MASK |
1365			UVD_CGC_CTRL__IDCT_MODE_MASK |
1366			UVD_CGC_CTRL__MPRD_MODE_MASK |
1367			UVD_CGC_CTRL__MPC_MODE_MASK |
1368			UVD_CGC_CTRL__LBSI_MODE_MASK |
1369			UVD_CGC_CTRL__LRBBM_MODE_MASK |
1370			UVD_CGC_CTRL__WCB_MODE_MASK |
1371			UVD_CGC_CTRL__VCPU_MODE_MASK |
1372			UVD_CGC_CTRL__JPEG_MODE_MASK |
1373			UVD_CGC_CTRL__SCPU_MODE_MASK |
1374			UVD_CGC_CTRL__JPEG2_MODE_MASK);
1375	data2 &= ~(UVD_SUVD_CGC_CTRL__SRE_MODE_MASK |
1376			UVD_SUVD_CGC_CTRL__SIT_MODE_MASK |
1377			UVD_SUVD_CGC_CTRL__SMP_MODE_MASK |
1378			UVD_SUVD_CGC_CTRL__SCM_MODE_MASK |
1379			UVD_SUVD_CGC_CTRL__SDB_MODE_MASK);
1380
1381	WREG32(mmUVD_CGC_CTRL, data);
1382	WREG32(mmUVD_SUVD_CGC_CTRL, data2);
1383}
1384
1385#if 0
1386static void uvd_v6_0_set_hw_clock_gating(struct amdgpu_device *adev)
1387{
1388	uint32_t data, data1, cgc_flags, suvd_flags;
1389
1390	data = RREG32(mmUVD_CGC_GATE);
1391	data1 = RREG32(mmUVD_SUVD_CGC_GATE);
1392
1393	cgc_flags = UVD_CGC_GATE__SYS_MASK |
1394		UVD_CGC_GATE__UDEC_MASK |
1395		UVD_CGC_GATE__MPEG2_MASK |
1396		UVD_CGC_GATE__RBC_MASK |
1397		UVD_CGC_GATE__LMI_MC_MASK |
1398		UVD_CGC_GATE__IDCT_MASK |
1399		UVD_CGC_GATE__MPRD_MASK |
1400		UVD_CGC_GATE__MPC_MASK |
1401		UVD_CGC_GATE__LBSI_MASK |
1402		UVD_CGC_GATE__LRBBM_MASK |
1403		UVD_CGC_GATE__UDEC_RE_MASK |
1404		UVD_CGC_GATE__UDEC_CM_MASK |
1405		UVD_CGC_GATE__UDEC_IT_MASK |
1406		UVD_CGC_GATE__UDEC_DB_MASK |
1407		UVD_CGC_GATE__UDEC_MP_MASK |
1408		UVD_CGC_GATE__WCB_MASK |
1409		UVD_CGC_GATE__VCPU_MASK |
1410		UVD_CGC_GATE__SCPU_MASK |
1411		UVD_CGC_GATE__JPEG_MASK |
1412		UVD_CGC_GATE__JPEG2_MASK;
1413
1414	suvd_flags = UVD_SUVD_CGC_GATE__SRE_MASK |
1415				UVD_SUVD_CGC_GATE__SIT_MASK |
1416				UVD_SUVD_CGC_GATE__SMP_MASK |
1417				UVD_SUVD_CGC_GATE__SCM_MASK |
1418				UVD_SUVD_CGC_GATE__SDB_MASK;
1419
1420	data |= cgc_flags;
1421	data1 |= suvd_flags;
1422
1423	WREG32(mmUVD_CGC_GATE, data);
1424	WREG32(mmUVD_SUVD_CGC_GATE, data1);
1425}
1426#endif
1427
1428static void uvd_v6_0_enable_mgcg(struct amdgpu_device *adev,
1429				 bool enable)
1430{
1431	u32 orig, data;
1432
1433	if (enable && (adev->cg_flags & AMD_CG_SUPPORT_UVD_MGCG)) {
1434		data = RREG32_UVD_CTX(ixUVD_CGC_MEM_CTRL);
1435		data |= 0xfff;
1436		WREG32_UVD_CTX(ixUVD_CGC_MEM_CTRL, data);
1437
1438		orig = data = RREG32(mmUVD_CGC_CTRL);
1439		data |= UVD_CGC_CTRL__DYN_CLOCK_MODE_MASK;
1440		if (orig != data)
1441			WREG32(mmUVD_CGC_CTRL, data);
1442	} else {
1443		data = RREG32_UVD_CTX(ixUVD_CGC_MEM_CTRL);
1444		data &= ~0xfff;
1445		WREG32_UVD_CTX(ixUVD_CGC_MEM_CTRL, data);
1446
1447		orig = data = RREG32(mmUVD_CGC_CTRL);
1448		data &= ~UVD_CGC_CTRL__DYN_CLOCK_MODE_MASK;
1449		if (orig != data)
1450			WREG32(mmUVD_CGC_CTRL, data);
1451	}
1452}
1453
1454static int uvd_v6_0_set_clockgating_state(void *handle,
1455					  enum amd_clockgating_state state)
1456{
1457	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
1458	bool enable = (state == AMD_CG_STATE_GATE);
1459
1460	if (enable) {
1461		/* wait for STATUS to clear */
1462		if (uvd_v6_0_wait_for_idle(handle))
1463			return -EBUSY;
1464		uvd_v6_0_enable_clock_gating(adev, true);
1465		/* enable HW gates because UVD is idle */
1466/*		uvd_v6_0_set_hw_clock_gating(adev); */
1467	} else {
1468		/* disable HW gating and enable Sw gating */
1469		uvd_v6_0_enable_clock_gating(adev, false);
1470	}
1471	uvd_v6_0_set_sw_clock_gating(adev);
1472	return 0;
1473}
1474
1475static int uvd_v6_0_set_powergating_state(void *handle,
1476					  enum amd_powergating_state state)
1477{
1478	/* This doesn't actually powergate the UVD block.
1479	 * That's done in the dpm code via the SMC.  This
1480	 * just re-inits the block as necessary.  The actual
1481	 * gating still happens in the dpm code.  We should
1482	 * revisit this when there is a cleaner line between
1483	 * the smc and the hw blocks
1484	 */
1485	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
1486	int ret = 0;
1487
1488	WREG32(mmUVD_POWER_STATUS, UVD_POWER_STATUS__UVD_PG_EN_MASK);
1489
1490	if (state == AMD_PG_STATE_GATE) {
1491		uvd_v6_0_stop(adev);
1492	} else {
1493		ret = uvd_v6_0_start(adev);
1494		if (ret)
1495			goto out;
1496	}
1497
1498out:
1499	return ret;
1500}
1501
1502static void uvd_v6_0_get_clockgating_state(void *handle, u64 *flags)
1503{
1504	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
1505	int data;
1506
1507	mutex_lock(&adev->pm.mutex);
1508
1509	if (adev->flags & AMD_IS_APU)
1510		data = RREG32_SMC(ixCURRENT_PG_STATUS_APU);
1511	else
1512		data = RREG32_SMC(ixCURRENT_PG_STATUS);
1513
1514	if (data & CURRENT_PG_STATUS__UVD_PG_STATUS_MASK) {
1515		DRM_INFO("Cannot get clockgating state when UVD is powergated.\n");
1516		goto out;
1517	}
1518
1519	/* AMD_CG_SUPPORT_UVD_MGCG */
1520	data = RREG32(mmUVD_CGC_CTRL);
1521	if (data & UVD_CGC_CTRL__DYN_CLOCK_MODE_MASK)
1522		*flags |= AMD_CG_SUPPORT_UVD_MGCG;
1523
1524out:
1525	mutex_unlock(&adev->pm.mutex);
1526}
1527
1528static const struct amd_ip_funcs uvd_v6_0_ip_funcs = {
1529	.name = "uvd_v6_0",
1530	.early_init = uvd_v6_0_early_init,
1531	.late_init = NULL,
1532	.sw_init = uvd_v6_0_sw_init,
1533	.sw_fini = uvd_v6_0_sw_fini,
1534	.hw_init = uvd_v6_0_hw_init,
1535	.hw_fini = uvd_v6_0_hw_fini,
1536	.prepare_suspend = uvd_v6_0_prepare_suspend,
1537	.suspend = uvd_v6_0_suspend,
1538	.resume = uvd_v6_0_resume,
1539	.is_idle = uvd_v6_0_is_idle,
1540	.wait_for_idle = uvd_v6_0_wait_for_idle,
1541	.check_soft_reset = uvd_v6_0_check_soft_reset,
1542	.pre_soft_reset = uvd_v6_0_pre_soft_reset,
1543	.soft_reset = uvd_v6_0_soft_reset,
1544	.post_soft_reset = uvd_v6_0_post_soft_reset,
1545	.set_clockgating_state = uvd_v6_0_set_clockgating_state,
1546	.set_powergating_state = uvd_v6_0_set_powergating_state,
1547	.get_clockgating_state = uvd_v6_0_get_clockgating_state,
1548};
1549
1550static const struct amdgpu_ring_funcs uvd_v6_0_ring_phys_funcs = {
1551	.type = AMDGPU_RING_TYPE_UVD,
1552	.align_mask = 0xf,
1553	.support_64bit_ptrs = false,
1554	.no_user_fence = true,
1555	.get_rptr = uvd_v6_0_ring_get_rptr,
1556	.get_wptr = uvd_v6_0_ring_get_wptr,
1557	.set_wptr = uvd_v6_0_ring_set_wptr,
1558	.parse_cs = amdgpu_uvd_ring_parse_cs,
1559	.emit_frame_size =
1560		6 + /* hdp invalidate */
1561		10 + /* uvd_v6_0_ring_emit_pipeline_sync */
1562		14, /* uvd_v6_0_ring_emit_fence x1 no user fence */
1563	.emit_ib_size = 8, /* uvd_v6_0_ring_emit_ib */
1564	.emit_ib = uvd_v6_0_ring_emit_ib,
1565	.emit_fence = uvd_v6_0_ring_emit_fence,
1566	.emit_hdp_flush = uvd_v6_0_ring_emit_hdp_flush,
1567	.test_ring = uvd_v6_0_ring_test_ring,
1568	.test_ib = amdgpu_uvd_ring_test_ib,
1569	.insert_nop = uvd_v6_0_ring_insert_nop,
1570	.pad_ib = amdgpu_ring_generic_pad_ib,
1571	.begin_use = amdgpu_uvd_ring_begin_use,
1572	.end_use = amdgpu_uvd_ring_end_use,
1573	.emit_wreg = uvd_v6_0_ring_emit_wreg,
1574};
1575
1576static const struct amdgpu_ring_funcs uvd_v6_0_ring_vm_funcs = {
1577	.type = AMDGPU_RING_TYPE_UVD,
1578	.align_mask = 0xf,
1579	.support_64bit_ptrs = false,
1580	.no_user_fence = true,
1581	.get_rptr = uvd_v6_0_ring_get_rptr,
1582	.get_wptr = uvd_v6_0_ring_get_wptr,
1583	.set_wptr = uvd_v6_0_ring_set_wptr,
1584	.emit_frame_size =
1585		6 + /* hdp invalidate */
1586		10 + /* uvd_v6_0_ring_emit_pipeline_sync */
1587		VI_FLUSH_GPU_TLB_NUM_WREG * 6 + 8 + /* uvd_v6_0_ring_emit_vm_flush */
1588		14 + 14, /* uvd_v6_0_ring_emit_fence x2 vm fence */
1589	.emit_ib_size = 8, /* uvd_v6_0_ring_emit_ib */
1590	.emit_ib = uvd_v6_0_ring_emit_ib,
1591	.emit_fence = uvd_v6_0_ring_emit_fence,
1592	.emit_vm_flush = uvd_v6_0_ring_emit_vm_flush,
1593	.emit_pipeline_sync = uvd_v6_0_ring_emit_pipeline_sync,
1594	.emit_hdp_flush = uvd_v6_0_ring_emit_hdp_flush,
1595	.test_ring = uvd_v6_0_ring_test_ring,
1596	.test_ib = amdgpu_uvd_ring_test_ib,
1597	.insert_nop = uvd_v6_0_ring_insert_nop,
1598	.pad_ib = amdgpu_ring_generic_pad_ib,
1599	.begin_use = amdgpu_uvd_ring_begin_use,
1600	.end_use = amdgpu_uvd_ring_end_use,
1601	.emit_wreg = uvd_v6_0_ring_emit_wreg,
1602};
1603
1604static const struct amdgpu_ring_funcs uvd_v6_0_enc_ring_vm_funcs = {
1605	.type = AMDGPU_RING_TYPE_UVD_ENC,
1606	.align_mask = 0x3f,
1607	.nop = HEVC_ENC_CMD_NO_OP,
1608	.support_64bit_ptrs = false,
1609	.no_user_fence = true,
1610	.get_rptr = uvd_v6_0_enc_ring_get_rptr,
1611	.get_wptr = uvd_v6_0_enc_ring_get_wptr,
1612	.set_wptr = uvd_v6_0_enc_ring_set_wptr,
1613	.emit_frame_size =
1614		4 + /* uvd_v6_0_enc_ring_emit_pipeline_sync */
1615		5 + /* uvd_v6_0_enc_ring_emit_vm_flush */
1616		5 + 5 + /* uvd_v6_0_enc_ring_emit_fence x2 vm fence */
1617		1, /* uvd_v6_0_enc_ring_insert_end */
1618	.emit_ib_size = 5, /* uvd_v6_0_enc_ring_emit_ib */
1619	.emit_ib = uvd_v6_0_enc_ring_emit_ib,
1620	.emit_fence = uvd_v6_0_enc_ring_emit_fence,
1621	.emit_vm_flush = uvd_v6_0_enc_ring_emit_vm_flush,
1622	.emit_pipeline_sync = uvd_v6_0_enc_ring_emit_pipeline_sync,
1623	.test_ring = uvd_v6_0_enc_ring_test_ring,
1624	.test_ib = uvd_v6_0_enc_ring_test_ib,
1625	.insert_nop = amdgpu_ring_insert_nop,
1626	.insert_end = uvd_v6_0_enc_ring_insert_end,
1627	.pad_ib = amdgpu_ring_generic_pad_ib,
1628	.begin_use = amdgpu_uvd_ring_begin_use,
1629	.end_use = amdgpu_uvd_ring_end_use,
1630};
1631
1632static void uvd_v6_0_set_ring_funcs(struct amdgpu_device *adev)
1633{
1634	if (adev->asic_type >= CHIP_POLARIS10) {
1635		adev->uvd.inst->ring.funcs = &uvd_v6_0_ring_vm_funcs;
1636		DRM_INFO("UVD is enabled in VM mode\n");
1637	} else {
1638		adev->uvd.inst->ring.funcs = &uvd_v6_0_ring_phys_funcs;
1639		DRM_INFO("UVD is enabled in physical mode\n");
1640	}
1641}
1642
1643static void uvd_v6_0_set_enc_ring_funcs(struct amdgpu_device *adev)
1644{
1645	int i;
1646
1647	for (i = 0; i < adev->uvd.num_enc_rings; ++i)
1648		adev->uvd.inst->ring_enc[i].funcs = &uvd_v6_0_enc_ring_vm_funcs;
1649
1650	DRM_INFO("UVD ENC is enabled in VM mode\n");
1651}
1652
1653static const struct amdgpu_irq_src_funcs uvd_v6_0_irq_funcs = {
1654	.set = uvd_v6_0_set_interrupt_state,
1655	.process = uvd_v6_0_process_interrupt,
1656};
1657
1658static void uvd_v6_0_set_irq_funcs(struct amdgpu_device *adev)
1659{
1660	if (uvd_v6_0_enc_support(adev))
1661		adev->uvd.inst->irq.num_types = adev->uvd.num_enc_rings + 1;
1662	else
1663		adev->uvd.inst->irq.num_types = 1;
1664
1665	adev->uvd.inst->irq.funcs = &uvd_v6_0_irq_funcs;
1666}
1667
1668const struct amdgpu_ip_block_version uvd_v6_0_ip_block =
1669{
1670		.type = AMD_IP_BLOCK_TYPE_UVD,
1671		.major = 6,
1672		.minor = 0,
1673		.rev = 0,
1674		.funcs = &uvd_v6_0_ip_funcs,
1675};
1676
1677const struct amdgpu_ip_block_version uvd_v6_2_ip_block =
1678{
1679		.type = AMD_IP_BLOCK_TYPE_UVD,
1680		.major = 6,
1681		.minor = 2,
1682		.rev = 0,
1683		.funcs = &uvd_v6_0_ip_funcs,
1684};
1685
1686const struct amdgpu_ip_block_version uvd_v6_3_ip_block =
1687{
1688		.type = AMD_IP_BLOCK_TYPE_UVD,
1689		.major = 6,
1690		.minor = 3,
1691		.rev = 0,
1692		.funcs = &uvd_v6_0_ip_funcs,
1693};
v5.14.15
   1/*
   2 * Copyright 2014 Advanced Micro Devices, Inc.
   3 *
   4 * Permission is hereby granted, free of charge, to any person obtaining a
   5 * copy of this software and associated documentation files (the "Software"),
   6 * to deal in the Software without restriction, including without limitation
   7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
   8 * and/or sell copies of the Software, and to permit persons to whom the
   9 * Software is furnished to do so, subject to the following conditions:
  10 *
  11 * The above copyright notice and this permission notice shall be included in
  12 * all copies or substantial portions of the Software.
  13 *
  14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
  17 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
  18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
  19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
  20 * OTHER DEALINGS IN THE SOFTWARE.
  21 *
  22 * Authors: Christian König <christian.koenig@amd.com>
  23 */
  24
  25#include <linux/firmware.h>
  26
  27#include "amdgpu.h"
  28#include "amdgpu_uvd.h"
  29#include "vid.h"
  30#include "uvd/uvd_6_0_d.h"
  31#include "uvd/uvd_6_0_sh_mask.h"
  32#include "oss/oss_2_0_d.h"
  33#include "oss/oss_2_0_sh_mask.h"
  34#include "smu/smu_7_1_3_d.h"
  35#include "smu/smu_7_1_3_sh_mask.h"
  36#include "bif/bif_5_1_d.h"
  37#include "gmc/gmc_8_1_d.h"
  38#include "vi.h"
  39#include "ivsrcid/ivsrcid_vislands30.h"
  40
  41/* Polaris10/11/12 firmware version */
  42#define FW_1_130_16 ((1 << 24) | (130 << 16) | (16 << 8))
  43
  44static void uvd_v6_0_set_ring_funcs(struct amdgpu_device *adev);
  45static void uvd_v6_0_set_enc_ring_funcs(struct amdgpu_device *adev);
  46
  47static void uvd_v6_0_set_irq_funcs(struct amdgpu_device *adev);
  48static int uvd_v6_0_start(struct amdgpu_device *adev);
  49static void uvd_v6_0_stop(struct amdgpu_device *adev);
  50static void uvd_v6_0_set_sw_clock_gating(struct amdgpu_device *adev);
  51static int uvd_v6_0_set_clockgating_state(void *handle,
  52					  enum amd_clockgating_state state);
  53static void uvd_v6_0_enable_mgcg(struct amdgpu_device *adev,
  54				 bool enable);
  55
  56/**
  57* uvd_v6_0_enc_support - get encode support status
  58*
  59* @adev: amdgpu_device pointer
  60*
  61* Returns the current hardware encode support status
  62*/
  63static inline bool uvd_v6_0_enc_support(struct amdgpu_device *adev)
  64{
  65	return ((adev->asic_type >= CHIP_POLARIS10) &&
  66			(adev->asic_type <= CHIP_VEGAM) &&
  67			(!adev->uvd.fw_version || adev->uvd.fw_version >= FW_1_130_16));
  68}
  69
  70/**
  71 * uvd_v6_0_ring_get_rptr - get read pointer
  72 *
  73 * @ring: amdgpu_ring pointer
  74 *
  75 * Returns the current hardware read pointer
  76 */
  77static uint64_t uvd_v6_0_ring_get_rptr(struct amdgpu_ring *ring)
  78{
  79	struct amdgpu_device *adev = ring->adev;
  80
  81	return RREG32(mmUVD_RBC_RB_RPTR);
  82}
  83
  84/**
  85 * uvd_v6_0_enc_ring_get_rptr - get enc read pointer
  86 *
  87 * @ring: amdgpu_ring pointer
  88 *
  89 * Returns the current hardware enc read pointer
  90 */
  91static uint64_t uvd_v6_0_enc_ring_get_rptr(struct amdgpu_ring *ring)
  92{
  93	struct amdgpu_device *adev = ring->adev;
  94
  95	if (ring == &adev->uvd.inst->ring_enc[0])
  96		return RREG32(mmUVD_RB_RPTR);
  97	else
  98		return RREG32(mmUVD_RB_RPTR2);
  99}
 100/**
 101 * uvd_v6_0_ring_get_wptr - get write pointer
 102 *
 103 * @ring: amdgpu_ring pointer
 104 *
 105 * Returns the current hardware write pointer
 106 */
 107static uint64_t uvd_v6_0_ring_get_wptr(struct amdgpu_ring *ring)
 108{
 109	struct amdgpu_device *adev = ring->adev;
 110
 111	return RREG32(mmUVD_RBC_RB_WPTR);
 112}
 113
 114/**
 115 * uvd_v6_0_enc_ring_get_wptr - get enc write pointer
 116 *
 117 * @ring: amdgpu_ring pointer
 118 *
 119 * Returns the current hardware enc write pointer
 120 */
 121static uint64_t uvd_v6_0_enc_ring_get_wptr(struct amdgpu_ring *ring)
 122{
 123	struct amdgpu_device *adev = ring->adev;
 124
 125	if (ring == &adev->uvd.inst->ring_enc[0])
 126		return RREG32(mmUVD_RB_WPTR);
 127	else
 128		return RREG32(mmUVD_RB_WPTR2);
 129}
 130
 131/**
 132 * uvd_v6_0_ring_set_wptr - set write pointer
 133 *
 134 * @ring: amdgpu_ring pointer
 135 *
 136 * Commits the write pointer to the hardware
 137 */
 138static void uvd_v6_0_ring_set_wptr(struct amdgpu_ring *ring)
 139{
 140	struct amdgpu_device *adev = ring->adev;
 141
 142	WREG32(mmUVD_RBC_RB_WPTR, lower_32_bits(ring->wptr));
 143}
 144
 145/**
 146 * uvd_v6_0_enc_ring_set_wptr - set enc write pointer
 147 *
 148 * @ring: amdgpu_ring pointer
 149 *
 150 * Commits the enc write pointer to the hardware
 151 */
 152static void uvd_v6_0_enc_ring_set_wptr(struct amdgpu_ring *ring)
 153{
 154	struct amdgpu_device *adev = ring->adev;
 155
 156	if (ring == &adev->uvd.inst->ring_enc[0])
 157		WREG32(mmUVD_RB_WPTR,
 158			lower_32_bits(ring->wptr));
 159	else
 160		WREG32(mmUVD_RB_WPTR2,
 161			lower_32_bits(ring->wptr));
 162}
 163
 164/**
 165 * uvd_v6_0_enc_ring_test_ring - test if UVD ENC ring is working
 166 *
 167 * @ring: the engine to test on
 168 *
 169 */
 170static int uvd_v6_0_enc_ring_test_ring(struct amdgpu_ring *ring)
 171{
 172	struct amdgpu_device *adev = ring->adev;
 173	uint32_t rptr;
 174	unsigned i;
 175	int r;
 176
 177	r = amdgpu_ring_alloc(ring, 16);
 178	if (r)
 179		return r;
 180
 181	rptr = amdgpu_ring_get_rptr(ring);
 182
 183	amdgpu_ring_write(ring, HEVC_ENC_CMD_END);
 184	amdgpu_ring_commit(ring);
 185
 186	for (i = 0; i < adev->usec_timeout; i++) {
 187		if (amdgpu_ring_get_rptr(ring) != rptr)
 188			break;
 189		udelay(1);
 190	}
 191
 192	if (i >= adev->usec_timeout)
 193		r = -ETIMEDOUT;
 194
 195	return r;
 196}
 197
 198/**
 199 * uvd_v6_0_enc_get_create_msg - generate a UVD ENC create msg
 200 *
 201 * @ring: ring we should submit the msg to
 202 * @handle: session handle to use
 203 * @bo: amdgpu object for which we query the offset
 204 * @fence: optional fence to return
 205 *
 206 * Open up a stream for HW test
 207 */
 208static int uvd_v6_0_enc_get_create_msg(struct amdgpu_ring *ring, uint32_t handle,
 209				       struct amdgpu_bo *bo,
 210				       struct dma_fence **fence)
 211{
 212	const unsigned ib_size_dw = 16;
 213	struct amdgpu_job *job;
 214	struct amdgpu_ib *ib;
 215	struct dma_fence *f = NULL;
 216	uint64_t addr;
 217	int i, r;
 218
 219	r = amdgpu_job_alloc_with_ib(ring->adev, ib_size_dw * 4,
 220					AMDGPU_IB_POOL_DIRECT, &job);
 221	if (r)
 222		return r;
 223
 224	ib = &job->ibs[0];
 225	addr = amdgpu_bo_gpu_offset(bo);
 226
 227	ib->length_dw = 0;
 228	ib->ptr[ib->length_dw++] = 0x00000018;
 229	ib->ptr[ib->length_dw++] = 0x00000001; /* session info */
 230	ib->ptr[ib->length_dw++] = handle;
 231	ib->ptr[ib->length_dw++] = 0x00010000;
 232	ib->ptr[ib->length_dw++] = upper_32_bits(addr);
 233	ib->ptr[ib->length_dw++] = addr;
 234
 235	ib->ptr[ib->length_dw++] = 0x00000014;
 236	ib->ptr[ib->length_dw++] = 0x00000002; /* task info */
 237	ib->ptr[ib->length_dw++] = 0x0000001c;
 238	ib->ptr[ib->length_dw++] = 0x00000001;
 239	ib->ptr[ib->length_dw++] = 0x00000000;
 240
 241	ib->ptr[ib->length_dw++] = 0x00000008;
 242	ib->ptr[ib->length_dw++] = 0x08000001; /* op initialize */
 243
 244	for (i = ib->length_dw; i < ib_size_dw; ++i)
 245		ib->ptr[i] = 0x0;
 246
 247	r = amdgpu_job_submit_direct(job, ring, &f);
 248	if (r)
 249		goto err;
 250
 251	if (fence)
 252		*fence = dma_fence_get(f);
 253	dma_fence_put(f);
 254	return 0;
 255
 256err:
 257	amdgpu_job_free(job);
 258	return r;
 259}
 260
 261/**
 262 * uvd_v6_0_enc_get_destroy_msg - generate a UVD ENC destroy msg
 263 *
 264 * @ring: ring we should submit the msg to
 265 * @handle: session handle to use
 266 * @bo: amdgpu object for which we query the offset
 267 * @fence: optional fence to return
 268 *
 269 * Close up a stream for HW test or if userspace failed to do so
 270 */
 271static int uvd_v6_0_enc_get_destroy_msg(struct amdgpu_ring *ring,
 272					uint32_t handle,
 273					struct amdgpu_bo *bo,
 274					struct dma_fence **fence)
 275{
 276	const unsigned ib_size_dw = 16;
 277	struct amdgpu_job *job;
 278	struct amdgpu_ib *ib;
 279	struct dma_fence *f = NULL;
 280	uint64_t addr;
 281	int i, r;
 282
 283	r = amdgpu_job_alloc_with_ib(ring->adev, ib_size_dw * 4,
 284					AMDGPU_IB_POOL_DIRECT, &job);
 285	if (r)
 286		return r;
 287
 288	ib = &job->ibs[0];
 289	addr = amdgpu_bo_gpu_offset(bo);
 290
 291	ib->length_dw = 0;
 292	ib->ptr[ib->length_dw++] = 0x00000018;
 293	ib->ptr[ib->length_dw++] = 0x00000001; /* session info */
 294	ib->ptr[ib->length_dw++] = handle;
 295	ib->ptr[ib->length_dw++] = 0x00010000;
 296	ib->ptr[ib->length_dw++] = upper_32_bits(addr);
 297	ib->ptr[ib->length_dw++] = addr;
 298
 299	ib->ptr[ib->length_dw++] = 0x00000014;
 300	ib->ptr[ib->length_dw++] = 0x00000002; /* task info */
 301	ib->ptr[ib->length_dw++] = 0x0000001c;
 302	ib->ptr[ib->length_dw++] = 0x00000001;
 303	ib->ptr[ib->length_dw++] = 0x00000000;
 304
 305	ib->ptr[ib->length_dw++] = 0x00000008;
 306	ib->ptr[ib->length_dw++] = 0x08000002; /* op close session */
 307
 308	for (i = ib->length_dw; i < ib_size_dw; ++i)
 309		ib->ptr[i] = 0x0;
 310
 311	r = amdgpu_job_submit_direct(job, ring, &f);
 312	if (r)
 313		goto err;
 314
 315	if (fence)
 316		*fence = dma_fence_get(f);
 317	dma_fence_put(f);
 318	return 0;
 319
 320err:
 321	amdgpu_job_free(job);
 322	return r;
 323}
 324
 325/**
 326 * uvd_v6_0_enc_ring_test_ib - test if UVD ENC IBs are working
 327 *
 328 * @ring: the engine to test on
 329 * @timeout: timeout value in jiffies, or MAX_SCHEDULE_TIMEOUT
 330 *
 331 */
 332static int uvd_v6_0_enc_ring_test_ib(struct amdgpu_ring *ring, long timeout)
 333{
 334	struct dma_fence *fence = NULL;
 335	struct amdgpu_bo *bo = NULL;
 336	long r;
 337
 338	r = amdgpu_bo_create_reserved(ring->adev, 128 * 1024, PAGE_SIZE,
 339				      AMDGPU_GEM_DOMAIN_VRAM,
 340				      &bo, NULL, NULL);
 341	if (r)
 342		return r;
 343
 344	r = uvd_v6_0_enc_get_create_msg(ring, 1, bo, NULL);
 345	if (r)
 346		goto error;
 347
 348	r = uvd_v6_0_enc_get_destroy_msg(ring, 1, bo, &fence);
 349	if (r)
 350		goto error;
 351
 352	r = dma_fence_wait_timeout(fence, false, timeout);
 353	if (r == 0)
 354		r = -ETIMEDOUT;
 355	else if (r > 0)
 356		r = 0;
 357
 358error:
 359	dma_fence_put(fence);
 360	amdgpu_bo_unpin(bo);
 361	amdgpu_bo_unreserve(bo);
 362	amdgpu_bo_unref(&bo);
 363	return r;
 364}
 365
 366static int uvd_v6_0_early_init(void *handle)
 367{
 368	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
 369	adev->uvd.num_uvd_inst = 1;
 370
 371	if (!(adev->flags & AMD_IS_APU) &&
 372	    (RREG32_SMC(ixCC_HARVEST_FUSES) & CC_HARVEST_FUSES__UVD_DISABLE_MASK))
 373		return -ENOENT;
 374
 375	uvd_v6_0_set_ring_funcs(adev);
 376
 377	if (uvd_v6_0_enc_support(adev)) {
 378		adev->uvd.num_enc_rings = 2;
 379		uvd_v6_0_set_enc_ring_funcs(adev);
 380	}
 381
 382	uvd_v6_0_set_irq_funcs(adev);
 383
 384	return 0;
 385}
 386
 387static int uvd_v6_0_sw_init(void *handle)
 388{
 389	struct amdgpu_ring *ring;
 390	int i, r;
 391	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
 392
 393	/* UVD TRAP */
 394	r = amdgpu_irq_add_id(adev, AMDGPU_IRQ_CLIENTID_LEGACY, VISLANDS30_IV_SRCID_UVD_SYSTEM_MESSAGE, &adev->uvd.inst->irq);
 395	if (r)
 396		return r;
 397
 398	/* UVD ENC TRAP */
 399	if (uvd_v6_0_enc_support(adev)) {
 400		for (i = 0; i < adev->uvd.num_enc_rings; ++i) {
 401			r = amdgpu_irq_add_id(adev, AMDGPU_IRQ_CLIENTID_LEGACY, i + VISLANDS30_IV_SRCID_UVD_ENC_GEN_PURP, &adev->uvd.inst->irq);
 402			if (r)
 403				return r;
 404		}
 405	}
 406
 407	r = amdgpu_uvd_sw_init(adev);
 408	if (r)
 409		return r;
 410
 411	if (!uvd_v6_0_enc_support(adev)) {
 412		for (i = 0; i < adev->uvd.num_enc_rings; ++i)
 413			adev->uvd.inst->ring_enc[i].funcs = NULL;
 414
 415		adev->uvd.inst->irq.num_types = 1;
 416		adev->uvd.num_enc_rings = 0;
 417
 418		DRM_INFO("UVD ENC is disabled\n");
 419	}
 420
 421	ring = &adev->uvd.inst->ring;
 422	sprintf(ring->name, "uvd");
 423	r = amdgpu_ring_init(adev, ring, 512, &adev->uvd.inst->irq, 0,
 424			     AMDGPU_RING_PRIO_DEFAULT, NULL);
 425	if (r)
 426		return r;
 427
 428	r = amdgpu_uvd_resume(adev);
 429	if (r)
 430		return r;
 431
 432	if (uvd_v6_0_enc_support(adev)) {
 433		for (i = 0; i < adev->uvd.num_enc_rings; ++i) {
 434			ring = &adev->uvd.inst->ring_enc[i];
 435			sprintf(ring->name, "uvd_enc%d", i);
 436			r = amdgpu_ring_init(adev, ring, 512,
 437					     &adev->uvd.inst->irq, 0,
 438					     AMDGPU_RING_PRIO_DEFAULT, NULL);
 439			if (r)
 440				return r;
 441		}
 442	}
 443
 444	r = amdgpu_uvd_entity_init(adev);
 445
 446	return r;
 447}
 448
 449static int uvd_v6_0_sw_fini(void *handle)
 450{
 451	int i, r;
 452	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
 453
 454	r = amdgpu_uvd_suspend(adev);
 455	if (r)
 456		return r;
 457
 458	if (uvd_v6_0_enc_support(adev)) {
 459		for (i = 0; i < adev->uvd.num_enc_rings; ++i)
 460			amdgpu_ring_fini(&adev->uvd.inst->ring_enc[i]);
 461	}
 462
 463	return amdgpu_uvd_sw_fini(adev);
 464}
 465
 466/**
 467 * uvd_v6_0_hw_init - start and test UVD block
 468 *
 469 * @handle: handle used to pass amdgpu_device pointer
 470 *
 471 * Initialize the hardware, boot up the VCPU and do some testing
 472 */
 473static int uvd_v6_0_hw_init(void *handle)
 474{
 475	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
 476	struct amdgpu_ring *ring = &adev->uvd.inst->ring;
 477	uint32_t tmp;
 478	int i, r;
 479
 480	amdgpu_asic_set_uvd_clocks(adev, 10000, 10000);
 481	uvd_v6_0_set_clockgating_state(adev, AMD_CG_STATE_UNGATE);
 482	uvd_v6_0_enable_mgcg(adev, true);
 483
 484	r = amdgpu_ring_test_helper(ring);
 485	if (r)
 486		goto done;
 487
 488	r = amdgpu_ring_alloc(ring, 10);
 489	if (r) {
 490		DRM_ERROR("amdgpu: ring failed to lock UVD ring (%d).\n", r);
 491		goto done;
 492	}
 493
 494	tmp = PACKET0(mmUVD_SEMA_WAIT_FAULT_TIMEOUT_CNTL, 0);
 495	amdgpu_ring_write(ring, tmp);
 496	amdgpu_ring_write(ring, 0xFFFFF);
 497
 498	tmp = PACKET0(mmUVD_SEMA_WAIT_INCOMPLETE_TIMEOUT_CNTL, 0);
 499	amdgpu_ring_write(ring, tmp);
 500	amdgpu_ring_write(ring, 0xFFFFF);
 501
 502	tmp = PACKET0(mmUVD_SEMA_SIGNAL_INCOMPLETE_TIMEOUT_CNTL, 0);
 503	amdgpu_ring_write(ring, tmp);
 504	amdgpu_ring_write(ring, 0xFFFFF);
 505
 506	/* Clear timeout status bits */
 507	amdgpu_ring_write(ring, PACKET0(mmUVD_SEMA_TIMEOUT_STATUS, 0));
 508	amdgpu_ring_write(ring, 0x8);
 509
 510	amdgpu_ring_write(ring, PACKET0(mmUVD_SEMA_CNTL, 0));
 511	amdgpu_ring_write(ring, 3);
 512
 513	amdgpu_ring_commit(ring);
 514
 515	if (uvd_v6_0_enc_support(adev)) {
 516		for (i = 0; i < adev->uvd.num_enc_rings; ++i) {
 517			ring = &adev->uvd.inst->ring_enc[i];
 518			r = amdgpu_ring_test_helper(ring);
 519			if (r)
 520				goto done;
 521		}
 522	}
 523
 524done:
 525	if (!r) {
 526		if (uvd_v6_0_enc_support(adev))
 527			DRM_INFO("UVD and UVD ENC initialized successfully.\n");
 528		else
 529			DRM_INFO("UVD initialized successfully.\n");
 530	}
 531
 532	return r;
 533}
 534
 535/**
 536 * uvd_v6_0_hw_fini - stop the hardware block
 537 *
 538 * @handle: handle used to pass amdgpu_device pointer
 539 *
 540 * Stop the UVD block, mark ring as not ready any more
 541 */
 542static int uvd_v6_0_hw_fini(void *handle)
 543{
 544	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
 545
 
 
 546	if (RREG32(mmUVD_STATUS) != 0)
 547		uvd_v6_0_stop(adev);
 548
 549	return 0;
 550}
 551
 
 
 
 
 
 
 
 552static int uvd_v6_0_suspend(void *handle)
 553{
 554	int r;
 555	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
 556
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 557	r = uvd_v6_0_hw_fini(adev);
 558	if (r)
 559		return r;
 560
 561	return amdgpu_uvd_suspend(adev);
 562}
 563
 564static int uvd_v6_0_resume(void *handle)
 565{
 566	int r;
 567	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
 568
 569	r = amdgpu_uvd_resume(adev);
 570	if (r)
 571		return r;
 572
 573	return uvd_v6_0_hw_init(adev);
 574}
 575
 576/**
 577 * uvd_v6_0_mc_resume - memory controller programming
 578 *
 579 * @adev: amdgpu_device pointer
 580 *
 581 * Let the UVD memory controller know it's offsets
 582 */
 583static void uvd_v6_0_mc_resume(struct amdgpu_device *adev)
 584{
 585	uint64_t offset;
 586	uint32_t size;
 587
 588	/* program memory controller bits 0-27 */
 589	WREG32(mmUVD_LMI_VCPU_CACHE_64BIT_BAR_LOW,
 590			lower_32_bits(adev->uvd.inst->gpu_addr));
 591	WREG32(mmUVD_LMI_VCPU_CACHE_64BIT_BAR_HIGH,
 592			upper_32_bits(adev->uvd.inst->gpu_addr));
 593
 594	offset = AMDGPU_UVD_FIRMWARE_OFFSET;
 595	size = AMDGPU_UVD_FIRMWARE_SIZE(adev);
 596	WREG32(mmUVD_VCPU_CACHE_OFFSET0, offset >> 3);
 597	WREG32(mmUVD_VCPU_CACHE_SIZE0, size);
 598
 599	offset += size;
 600	size = AMDGPU_UVD_HEAP_SIZE;
 601	WREG32(mmUVD_VCPU_CACHE_OFFSET1, offset >> 3);
 602	WREG32(mmUVD_VCPU_CACHE_SIZE1, size);
 603
 604	offset += size;
 605	size = AMDGPU_UVD_STACK_SIZE +
 606	       (AMDGPU_UVD_SESSION_SIZE * adev->uvd.max_handles);
 607	WREG32(mmUVD_VCPU_CACHE_OFFSET2, offset >> 3);
 608	WREG32(mmUVD_VCPU_CACHE_SIZE2, size);
 609
 610	WREG32(mmUVD_UDEC_ADDR_CONFIG, adev->gfx.config.gb_addr_config);
 611	WREG32(mmUVD_UDEC_DB_ADDR_CONFIG, adev->gfx.config.gb_addr_config);
 612	WREG32(mmUVD_UDEC_DBW_ADDR_CONFIG, adev->gfx.config.gb_addr_config);
 613
 614	WREG32(mmUVD_GP_SCRATCH4, adev->uvd.max_handles);
 615}
 616
 617#if 0
 618static void cz_set_uvd_clock_gating_branches(struct amdgpu_device *adev,
 619		bool enable)
 620{
 621	u32 data, data1;
 622
 623	data = RREG32(mmUVD_CGC_GATE);
 624	data1 = RREG32(mmUVD_SUVD_CGC_GATE);
 625	if (enable) {
 626		data |= UVD_CGC_GATE__SYS_MASK |
 627				UVD_CGC_GATE__UDEC_MASK |
 628				UVD_CGC_GATE__MPEG2_MASK |
 629				UVD_CGC_GATE__RBC_MASK |
 630				UVD_CGC_GATE__LMI_MC_MASK |
 631				UVD_CGC_GATE__IDCT_MASK |
 632				UVD_CGC_GATE__MPRD_MASK |
 633				UVD_CGC_GATE__MPC_MASK |
 634				UVD_CGC_GATE__LBSI_MASK |
 635				UVD_CGC_GATE__LRBBM_MASK |
 636				UVD_CGC_GATE__UDEC_RE_MASK |
 637				UVD_CGC_GATE__UDEC_CM_MASK |
 638				UVD_CGC_GATE__UDEC_IT_MASK |
 639				UVD_CGC_GATE__UDEC_DB_MASK |
 640				UVD_CGC_GATE__UDEC_MP_MASK |
 641				UVD_CGC_GATE__WCB_MASK |
 642				UVD_CGC_GATE__VCPU_MASK |
 643				UVD_CGC_GATE__SCPU_MASK;
 644		data1 |= UVD_SUVD_CGC_GATE__SRE_MASK |
 645				UVD_SUVD_CGC_GATE__SIT_MASK |
 646				UVD_SUVD_CGC_GATE__SMP_MASK |
 647				UVD_SUVD_CGC_GATE__SCM_MASK |
 648				UVD_SUVD_CGC_GATE__SDB_MASK |
 649				UVD_SUVD_CGC_GATE__SRE_H264_MASK |
 650				UVD_SUVD_CGC_GATE__SRE_HEVC_MASK |
 651				UVD_SUVD_CGC_GATE__SIT_H264_MASK |
 652				UVD_SUVD_CGC_GATE__SIT_HEVC_MASK |
 653				UVD_SUVD_CGC_GATE__SCM_H264_MASK |
 654				UVD_SUVD_CGC_GATE__SCM_HEVC_MASK |
 655				UVD_SUVD_CGC_GATE__SDB_H264_MASK |
 656				UVD_SUVD_CGC_GATE__SDB_HEVC_MASK;
 657	} else {
 658		data &= ~(UVD_CGC_GATE__SYS_MASK |
 659				UVD_CGC_GATE__UDEC_MASK |
 660				UVD_CGC_GATE__MPEG2_MASK |
 661				UVD_CGC_GATE__RBC_MASK |
 662				UVD_CGC_GATE__LMI_MC_MASK |
 663				UVD_CGC_GATE__LMI_UMC_MASK |
 664				UVD_CGC_GATE__IDCT_MASK |
 665				UVD_CGC_GATE__MPRD_MASK |
 666				UVD_CGC_GATE__MPC_MASK |
 667				UVD_CGC_GATE__LBSI_MASK |
 668				UVD_CGC_GATE__LRBBM_MASK |
 669				UVD_CGC_GATE__UDEC_RE_MASK |
 670				UVD_CGC_GATE__UDEC_CM_MASK |
 671				UVD_CGC_GATE__UDEC_IT_MASK |
 672				UVD_CGC_GATE__UDEC_DB_MASK |
 673				UVD_CGC_GATE__UDEC_MP_MASK |
 674				UVD_CGC_GATE__WCB_MASK |
 675				UVD_CGC_GATE__VCPU_MASK |
 676				UVD_CGC_GATE__SCPU_MASK);
 677		data1 &= ~(UVD_SUVD_CGC_GATE__SRE_MASK |
 678				UVD_SUVD_CGC_GATE__SIT_MASK |
 679				UVD_SUVD_CGC_GATE__SMP_MASK |
 680				UVD_SUVD_CGC_GATE__SCM_MASK |
 681				UVD_SUVD_CGC_GATE__SDB_MASK |
 682				UVD_SUVD_CGC_GATE__SRE_H264_MASK |
 683				UVD_SUVD_CGC_GATE__SRE_HEVC_MASK |
 684				UVD_SUVD_CGC_GATE__SIT_H264_MASK |
 685				UVD_SUVD_CGC_GATE__SIT_HEVC_MASK |
 686				UVD_SUVD_CGC_GATE__SCM_H264_MASK |
 687				UVD_SUVD_CGC_GATE__SCM_HEVC_MASK |
 688				UVD_SUVD_CGC_GATE__SDB_H264_MASK |
 689				UVD_SUVD_CGC_GATE__SDB_HEVC_MASK);
 690	}
 691	WREG32(mmUVD_CGC_GATE, data);
 692	WREG32(mmUVD_SUVD_CGC_GATE, data1);
 693}
 694#endif
 695
 696/**
 697 * uvd_v6_0_start - start UVD block
 698 *
 699 * @adev: amdgpu_device pointer
 700 *
 701 * Setup and start the UVD block
 702 */
 703static int uvd_v6_0_start(struct amdgpu_device *adev)
 704{
 705	struct amdgpu_ring *ring = &adev->uvd.inst->ring;
 706	uint32_t rb_bufsz, tmp;
 707	uint32_t lmi_swap_cntl;
 708	uint32_t mp_swap_cntl;
 709	int i, j, r;
 710
 711	/* disable DPG */
 712	WREG32_P(mmUVD_POWER_STATUS, 0, ~UVD_POWER_STATUS__UVD_PG_MODE_MASK);
 713
 714	/* disable byte swapping */
 715	lmi_swap_cntl = 0;
 716	mp_swap_cntl = 0;
 717
 718	uvd_v6_0_mc_resume(adev);
 719
 720	/* disable interupt */
 721	WREG32_FIELD(UVD_MASTINT_EN, VCPU_EN, 0);
 722
 723	/* stall UMC and register bus before resetting VCPU */
 724	WREG32_FIELD(UVD_LMI_CTRL2, STALL_ARB_UMC, 1);
 725	mdelay(1);
 726
 727	/* put LMI, VCPU, RBC etc... into reset */
 728	WREG32(mmUVD_SOFT_RESET,
 729		UVD_SOFT_RESET__LMI_SOFT_RESET_MASK |
 730		UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK |
 731		UVD_SOFT_RESET__LBSI_SOFT_RESET_MASK |
 732		UVD_SOFT_RESET__RBC_SOFT_RESET_MASK |
 733		UVD_SOFT_RESET__CSM_SOFT_RESET_MASK |
 734		UVD_SOFT_RESET__CXW_SOFT_RESET_MASK |
 735		UVD_SOFT_RESET__TAP_SOFT_RESET_MASK |
 736		UVD_SOFT_RESET__LMI_UMC_SOFT_RESET_MASK);
 737	mdelay(5);
 738
 739	/* take UVD block out of reset */
 740	WREG32_FIELD(SRBM_SOFT_RESET, SOFT_RESET_UVD, 0);
 741	mdelay(5);
 742
 743	/* initialize UVD memory controller */
 744	WREG32(mmUVD_LMI_CTRL,
 745		(0x40 << UVD_LMI_CTRL__WRITE_CLEAN_TIMER__SHIFT) |
 746		UVD_LMI_CTRL__WRITE_CLEAN_TIMER_EN_MASK |
 747		UVD_LMI_CTRL__DATA_COHERENCY_EN_MASK |
 748		UVD_LMI_CTRL__VCPU_DATA_COHERENCY_EN_MASK |
 749		UVD_LMI_CTRL__REQ_MODE_MASK |
 750		UVD_LMI_CTRL__DISABLE_ON_FWV_FAIL_MASK);
 751
 752#ifdef __BIG_ENDIAN
 753	/* swap (8 in 32) RB and IB */
 754	lmi_swap_cntl = 0xa;
 755	mp_swap_cntl = 0;
 756#endif
 757	WREG32(mmUVD_LMI_SWAP_CNTL, lmi_swap_cntl);
 758	WREG32(mmUVD_MP_SWAP_CNTL, mp_swap_cntl);
 759
 760	WREG32(mmUVD_MPC_SET_MUXA0, 0x40c2040);
 761	WREG32(mmUVD_MPC_SET_MUXA1, 0x0);
 762	WREG32(mmUVD_MPC_SET_MUXB0, 0x40c2040);
 763	WREG32(mmUVD_MPC_SET_MUXB1, 0x0);
 764	WREG32(mmUVD_MPC_SET_ALU, 0);
 765	WREG32(mmUVD_MPC_SET_MUX, 0x88);
 766
 767	/* take all subblocks out of reset, except VCPU */
 768	WREG32(mmUVD_SOFT_RESET, UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
 769	mdelay(5);
 770
 771	/* enable VCPU clock */
 772	WREG32(mmUVD_VCPU_CNTL, UVD_VCPU_CNTL__CLK_EN_MASK);
 773
 774	/* enable UMC */
 775	WREG32_FIELD(UVD_LMI_CTRL2, STALL_ARB_UMC, 0);
 776
 777	/* boot up the VCPU */
 778	WREG32(mmUVD_SOFT_RESET, 0);
 779	mdelay(10);
 780
 781	for (i = 0; i < 10; ++i) {
 782		uint32_t status;
 783
 784		for (j = 0; j < 100; ++j) {
 785			status = RREG32(mmUVD_STATUS);
 786			if (status & 2)
 787				break;
 788			mdelay(10);
 789		}
 790		r = 0;
 791		if (status & 2)
 792			break;
 793
 794		DRM_ERROR("UVD not responding, trying to reset the VCPU!!!\n");
 795		WREG32_FIELD(UVD_SOFT_RESET, VCPU_SOFT_RESET, 1);
 796		mdelay(10);
 797		WREG32_FIELD(UVD_SOFT_RESET, VCPU_SOFT_RESET, 0);
 798		mdelay(10);
 799		r = -1;
 800	}
 801
 802	if (r) {
 803		DRM_ERROR("UVD not responding, giving up!!!\n");
 804		return r;
 805	}
 806	/* enable master interrupt */
 807	WREG32_P(mmUVD_MASTINT_EN,
 808		(UVD_MASTINT_EN__VCPU_EN_MASK|UVD_MASTINT_EN__SYS_EN_MASK),
 809		~(UVD_MASTINT_EN__VCPU_EN_MASK|UVD_MASTINT_EN__SYS_EN_MASK));
 810
 811	/* clear the bit 4 of UVD_STATUS */
 812	WREG32_P(mmUVD_STATUS, 0, ~(2 << UVD_STATUS__VCPU_REPORT__SHIFT));
 813
 814	/* force RBC into idle state */
 815	rb_bufsz = order_base_2(ring->ring_size);
 816	tmp = REG_SET_FIELD(0, UVD_RBC_RB_CNTL, RB_BUFSZ, rb_bufsz);
 817	tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_BLKSZ, 1);
 818	tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_NO_FETCH, 1);
 819	tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_WPTR_POLL_EN, 0);
 820	tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_NO_UPDATE, 1);
 821	tmp = REG_SET_FIELD(tmp, UVD_RBC_RB_CNTL, RB_RPTR_WR_EN, 1);
 822	WREG32(mmUVD_RBC_RB_CNTL, tmp);
 823
 824	/* set the write pointer delay */
 825	WREG32(mmUVD_RBC_RB_WPTR_CNTL, 0);
 826
 827	/* set the wb address */
 828	WREG32(mmUVD_RBC_RB_RPTR_ADDR, (upper_32_bits(ring->gpu_addr) >> 2));
 829
 830	/* program the RB_BASE for ring buffer */
 831	WREG32(mmUVD_LMI_RBC_RB_64BIT_BAR_LOW,
 832			lower_32_bits(ring->gpu_addr));
 833	WREG32(mmUVD_LMI_RBC_RB_64BIT_BAR_HIGH,
 834			upper_32_bits(ring->gpu_addr));
 835
 836	/* Initialize the ring buffer's read and write pointers */
 837	WREG32(mmUVD_RBC_RB_RPTR, 0);
 838
 839	ring->wptr = RREG32(mmUVD_RBC_RB_RPTR);
 840	WREG32(mmUVD_RBC_RB_WPTR, lower_32_bits(ring->wptr));
 841
 842	WREG32_FIELD(UVD_RBC_RB_CNTL, RB_NO_FETCH, 0);
 843
 844	if (uvd_v6_0_enc_support(adev)) {
 845		ring = &adev->uvd.inst->ring_enc[0];
 846		WREG32(mmUVD_RB_RPTR, lower_32_bits(ring->wptr));
 847		WREG32(mmUVD_RB_WPTR, lower_32_bits(ring->wptr));
 848		WREG32(mmUVD_RB_BASE_LO, ring->gpu_addr);
 849		WREG32(mmUVD_RB_BASE_HI, upper_32_bits(ring->gpu_addr));
 850		WREG32(mmUVD_RB_SIZE, ring->ring_size / 4);
 851
 852		ring = &adev->uvd.inst->ring_enc[1];
 853		WREG32(mmUVD_RB_RPTR2, lower_32_bits(ring->wptr));
 854		WREG32(mmUVD_RB_WPTR2, lower_32_bits(ring->wptr));
 855		WREG32(mmUVD_RB_BASE_LO2, ring->gpu_addr);
 856		WREG32(mmUVD_RB_BASE_HI2, upper_32_bits(ring->gpu_addr));
 857		WREG32(mmUVD_RB_SIZE2, ring->ring_size / 4);
 858	}
 859
 860	return 0;
 861}
 862
 863/**
 864 * uvd_v6_0_stop - stop UVD block
 865 *
 866 * @adev: amdgpu_device pointer
 867 *
 868 * stop the UVD block
 869 */
 870static void uvd_v6_0_stop(struct amdgpu_device *adev)
 871{
 872	/* force RBC into idle state */
 873	WREG32(mmUVD_RBC_RB_CNTL, 0x11010101);
 874
 875	/* Stall UMC and register bus before resetting VCPU */
 876	WREG32_P(mmUVD_LMI_CTRL2, 1 << 8, ~(1 << 8));
 877	mdelay(1);
 878
 879	/* put VCPU into reset */
 880	WREG32(mmUVD_SOFT_RESET, UVD_SOFT_RESET__VCPU_SOFT_RESET_MASK);
 881	mdelay(5);
 882
 883	/* disable VCPU clock */
 884	WREG32(mmUVD_VCPU_CNTL, 0x0);
 885
 886	/* Unstall UMC and register bus */
 887	WREG32_P(mmUVD_LMI_CTRL2, 0, ~(1 << 8));
 888
 889	WREG32(mmUVD_STATUS, 0);
 890}
 891
 892/**
 893 * uvd_v6_0_ring_emit_fence - emit an fence & trap command
 894 *
 895 * @ring: amdgpu_ring pointer
 896 * @addr: address
 897 * @seq: sequence number
 898 * @flags: fence related flags
 899 *
 900 * Write a fence and a trap command to the ring.
 901 */
 902static void uvd_v6_0_ring_emit_fence(struct amdgpu_ring *ring, u64 addr, u64 seq,
 903				     unsigned flags)
 904{
 905	WARN_ON(flags & AMDGPU_FENCE_FLAG_64BIT);
 906
 907	amdgpu_ring_write(ring, PACKET0(mmUVD_CONTEXT_ID, 0));
 908	amdgpu_ring_write(ring, seq);
 909	amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_DATA0, 0));
 910	amdgpu_ring_write(ring, addr & 0xffffffff);
 911	amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_DATA1, 0));
 912	amdgpu_ring_write(ring, upper_32_bits(addr) & 0xff);
 913	amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_CMD, 0));
 914	amdgpu_ring_write(ring, 0);
 915
 916	amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_DATA0, 0));
 917	amdgpu_ring_write(ring, 0);
 918	amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_DATA1, 0));
 919	amdgpu_ring_write(ring, 0);
 920	amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_CMD, 0));
 921	amdgpu_ring_write(ring, 2);
 922}
 923
 924/**
 925 * uvd_v6_0_enc_ring_emit_fence - emit an enc fence & trap command
 926 *
 927 * @ring: amdgpu_ring pointer
 928 * @addr: address
 929 * @seq: sequence number
 930 * @flags: fence related flags
 931 *
 932 * Write enc a fence and a trap command to the ring.
 933 */
 934static void uvd_v6_0_enc_ring_emit_fence(struct amdgpu_ring *ring, u64 addr,
 935			u64 seq, unsigned flags)
 936{
 937	WARN_ON(flags & AMDGPU_FENCE_FLAG_64BIT);
 938
 939	amdgpu_ring_write(ring, HEVC_ENC_CMD_FENCE);
 940	amdgpu_ring_write(ring, addr);
 941	amdgpu_ring_write(ring, upper_32_bits(addr));
 942	amdgpu_ring_write(ring, seq);
 943	amdgpu_ring_write(ring, HEVC_ENC_CMD_TRAP);
 944}
 945
 946/**
 947 * uvd_v6_0_ring_emit_hdp_flush - skip HDP flushing
 948 *
 949 * @ring: amdgpu_ring pointer
 950 */
 951static void uvd_v6_0_ring_emit_hdp_flush(struct amdgpu_ring *ring)
 952{
 953	/* The firmware doesn't seem to like touching registers at this point. */
 954}
 955
 956/**
 957 * uvd_v6_0_ring_test_ring - register write test
 958 *
 959 * @ring: amdgpu_ring pointer
 960 *
 961 * Test if we can successfully write to the context register
 962 */
 963static int uvd_v6_0_ring_test_ring(struct amdgpu_ring *ring)
 964{
 965	struct amdgpu_device *adev = ring->adev;
 966	uint32_t tmp = 0;
 967	unsigned i;
 968	int r;
 969
 970	WREG32(mmUVD_CONTEXT_ID, 0xCAFEDEAD);
 971	r = amdgpu_ring_alloc(ring, 3);
 972	if (r)
 973		return r;
 974
 975	amdgpu_ring_write(ring, PACKET0(mmUVD_CONTEXT_ID, 0));
 976	amdgpu_ring_write(ring, 0xDEADBEEF);
 977	amdgpu_ring_commit(ring);
 978	for (i = 0; i < adev->usec_timeout; i++) {
 979		tmp = RREG32(mmUVD_CONTEXT_ID);
 980		if (tmp == 0xDEADBEEF)
 981			break;
 982		udelay(1);
 983	}
 984
 985	if (i >= adev->usec_timeout)
 986		r = -ETIMEDOUT;
 987
 988	return r;
 989}
 990
 991/**
 992 * uvd_v6_0_ring_emit_ib - execute indirect buffer
 993 *
 994 * @ring: amdgpu_ring pointer
 995 * @job: job to retrieve vmid from
 996 * @ib: indirect buffer to execute
 997 * @flags: unused
 998 *
 999 * Write ring commands to execute the indirect buffer
1000 */
1001static void uvd_v6_0_ring_emit_ib(struct amdgpu_ring *ring,
1002				  struct amdgpu_job *job,
1003				  struct amdgpu_ib *ib,
1004				  uint32_t flags)
1005{
1006	unsigned vmid = AMDGPU_JOB_GET_VMID(job);
1007
1008	amdgpu_ring_write(ring, PACKET0(mmUVD_LMI_RBC_IB_VMID, 0));
1009	amdgpu_ring_write(ring, vmid);
1010
1011	amdgpu_ring_write(ring, PACKET0(mmUVD_LMI_RBC_IB_64BIT_BAR_LOW, 0));
1012	amdgpu_ring_write(ring, lower_32_bits(ib->gpu_addr));
1013	amdgpu_ring_write(ring, PACKET0(mmUVD_LMI_RBC_IB_64BIT_BAR_HIGH, 0));
1014	amdgpu_ring_write(ring, upper_32_bits(ib->gpu_addr));
1015	amdgpu_ring_write(ring, PACKET0(mmUVD_RBC_IB_SIZE, 0));
1016	amdgpu_ring_write(ring, ib->length_dw);
1017}
1018
1019/**
1020 * uvd_v6_0_enc_ring_emit_ib - enc execute indirect buffer
1021 *
1022 * @ring: amdgpu_ring pointer
1023 * @job: job to retrive vmid from
1024 * @ib: indirect buffer to execute
1025 * @flags: unused
1026 *
1027 * Write enc ring commands to execute the indirect buffer
1028 */
1029static void uvd_v6_0_enc_ring_emit_ib(struct amdgpu_ring *ring,
1030					struct amdgpu_job *job,
1031					struct amdgpu_ib *ib,
1032					uint32_t flags)
1033{
1034	unsigned vmid = AMDGPU_JOB_GET_VMID(job);
1035
1036	amdgpu_ring_write(ring, HEVC_ENC_CMD_IB_VM);
1037	amdgpu_ring_write(ring, vmid);
1038	amdgpu_ring_write(ring, lower_32_bits(ib->gpu_addr));
1039	amdgpu_ring_write(ring, upper_32_bits(ib->gpu_addr));
1040	amdgpu_ring_write(ring, ib->length_dw);
1041}
1042
1043static void uvd_v6_0_ring_emit_wreg(struct amdgpu_ring *ring,
1044				    uint32_t reg, uint32_t val)
1045{
1046	amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_DATA0, 0));
1047	amdgpu_ring_write(ring, reg << 2);
1048	amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_DATA1, 0));
1049	amdgpu_ring_write(ring, val);
1050	amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_CMD, 0));
1051	amdgpu_ring_write(ring, 0x8);
1052}
1053
1054static void uvd_v6_0_ring_emit_vm_flush(struct amdgpu_ring *ring,
1055					unsigned vmid, uint64_t pd_addr)
1056{
1057	amdgpu_gmc_emit_flush_gpu_tlb(ring, vmid, pd_addr);
1058
1059	amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_DATA0, 0));
1060	amdgpu_ring_write(ring, mmVM_INVALIDATE_REQUEST << 2);
1061	amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_DATA1, 0));
1062	amdgpu_ring_write(ring, 0);
1063	amdgpu_ring_write(ring, PACKET0(mmUVD_GP_SCRATCH8, 0));
1064	amdgpu_ring_write(ring, 1 << vmid); /* mask */
1065	amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_CMD, 0));
1066	amdgpu_ring_write(ring, 0xC);
1067}
1068
1069static void uvd_v6_0_ring_emit_pipeline_sync(struct amdgpu_ring *ring)
1070{
1071	uint32_t seq = ring->fence_drv.sync_seq;
1072	uint64_t addr = ring->fence_drv.gpu_addr;
1073
1074	amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_DATA0, 0));
1075	amdgpu_ring_write(ring, lower_32_bits(addr));
1076	amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_DATA1, 0));
1077	amdgpu_ring_write(ring, upper_32_bits(addr));
1078	amdgpu_ring_write(ring, PACKET0(mmUVD_GP_SCRATCH8, 0));
1079	amdgpu_ring_write(ring, 0xffffffff); /* mask */
1080	amdgpu_ring_write(ring, PACKET0(mmUVD_GP_SCRATCH9, 0));
1081	amdgpu_ring_write(ring, seq);
1082	amdgpu_ring_write(ring, PACKET0(mmUVD_GPCOM_VCPU_CMD, 0));
1083	amdgpu_ring_write(ring, 0xE);
1084}
1085
1086static void uvd_v6_0_ring_insert_nop(struct amdgpu_ring *ring, uint32_t count)
1087{
1088	int i;
1089
1090	WARN_ON(ring->wptr % 2 || count % 2);
1091
1092	for (i = 0; i < count / 2; i++) {
1093		amdgpu_ring_write(ring, PACKET0(mmUVD_NO_OP, 0));
1094		amdgpu_ring_write(ring, 0);
1095	}
1096}
1097
1098static void uvd_v6_0_enc_ring_emit_pipeline_sync(struct amdgpu_ring *ring)
1099{
1100	uint32_t seq = ring->fence_drv.sync_seq;
1101	uint64_t addr = ring->fence_drv.gpu_addr;
1102
1103	amdgpu_ring_write(ring, HEVC_ENC_CMD_WAIT_GE);
1104	amdgpu_ring_write(ring, lower_32_bits(addr));
1105	amdgpu_ring_write(ring, upper_32_bits(addr));
1106	amdgpu_ring_write(ring, seq);
1107}
1108
1109static void uvd_v6_0_enc_ring_insert_end(struct amdgpu_ring *ring)
1110{
1111	amdgpu_ring_write(ring, HEVC_ENC_CMD_END);
1112}
1113
1114static void uvd_v6_0_enc_ring_emit_vm_flush(struct amdgpu_ring *ring,
1115					    unsigned int vmid, uint64_t pd_addr)
1116{
1117	amdgpu_ring_write(ring, HEVC_ENC_CMD_UPDATE_PTB);
1118	amdgpu_ring_write(ring, vmid);
1119	amdgpu_ring_write(ring, pd_addr >> 12);
1120
1121	amdgpu_ring_write(ring, HEVC_ENC_CMD_FLUSH_TLB);
1122	amdgpu_ring_write(ring, vmid);
1123}
1124
1125static bool uvd_v6_0_is_idle(void *handle)
1126{
1127	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
1128
1129	return !(RREG32(mmSRBM_STATUS) & SRBM_STATUS__UVD_BUSY_MASK);
1130}
1131
1132static int uvd_v6_0_wait_for_idle(void *handle)
1133{
1134	unsigned i;
1135	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
1136
1137	for (i = 0; i < adev->usec_timeout; i++) {
1138		if (uvd_v6_0_is_idle(handle))
1139			return 0;
1140	}
1141	return -ETIMEDOUT;
1142}
1143
1144#define AMDGPU_UVD_STATUS_BUSY_MASK    0xfd
1145static bool uvd_v6_0_check_soft_reset(void *handle)
1146{
1147	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
1148	u32 srbm_soft_reset = 0;
1149	u32 tmp = RREG32(mmSRBM_STATUS);
1150
1151	if (REG_GET_FIELD(tmp, SRBM_STATUS, UVD_RQ_PENDING) ||
1152	    REG_GET_FIELD(tmp, SRBM_STATUS, UVD_BUSY) ||
1153	    (RREG32(mmUVD_STATUS) & AMDGPU_UVD_STATUS_BUSY_MASK))
1154		srbm_soft_reset = REG_SET_FIELD(srbm_soft_reset, SRBM_SOFT_RESET, SOFT_RESET_UVD, 1);
1155
1156	if (srbm_soft_reset) {
1157		adev->uvd.inst->srbm_soft_reset = srbm_soft_reset;
1158		return true;
1159	} else {
1160		adev->uvd.inst->srbm_soft_reset = 0;
1161		return false;
1162	}
1163}
1164
1165static int uvd_v6_0_pre_soft_reset(void *handle)
1166{
1167	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
1168
1169	if (!adev->uvd.inst->srbm_soft_reset)
1170		return 0;
1171
1172	uvd_v6_0_stop(adev);
1173	return 0;
1174}
1175
1176static int uvd_v6_0_soft_reset(void *handle)
1177{
1178	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
1179	u32 srbm_soft_reset;
1180
1181	if (!adev->uvd.inst->srbm_soft_reset)
1182		return 0;
1183	srbm_soft_reset = adev->uvd.inst->srbm_soft_reset;
1184
1185	if (srbm_soft_reset) {
1186		u32 tmp;
1187
1188		tmp = RREG32(mmSRBM_SOFT_RESET);
1189		tmp |= srbm_soft_reset;
1190		dev_info(adev->dev, "SRBM_SOFT_RESET=0x%08X\n", tmp);
1191		WREG32(mmSRBM_SOFT_RESET, tmp);
1192		tmp = RREG32(mmSRBM_SOFT_RESET);
1193
1194		udelay(50);
1195
1196		tmp &= ~srbm_soft_reset;
1197		WREG32(mmSRBM_SOFT_RESET, tmp);
1198		tmp = RREG32(mmSRBM_SOFT_RESET);
1199
1200		/* Wait a little for things to settle down */
1201		udelay(50);
1202	}
1203
1204	return 0;
1205}
1206
1207static int uvd_v6_0_post_soft_reset(void *handle)
1208{
1209	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
1210
1211	if (!adev->uvd.inst->srbm_soft_reset)
1212		return 0;
1213
1214	mdelay(5);
1215
1216	return uvd_v6_0_start(adev);
1217}
1218
1219static int uvd_v6_0_set_interrupt_state(struct amdgpu_device *adev,
1220					struct amdgpu_irq_src *source,
1221					unsigned type,
1222					enum amdgpu_interrupt_state state)
1223{
1224	// TODO
1225	return 0;
1226}
1227
1228static int uvd_v6_0_process_interrupt(struct amdgpu_device *adev,
1229				      struct amdgpu_irq_src *source,
1230				      struct amdgpu_iv_entry *entry)
1231{
1232	bool int_handled = true;
1233	DRM_DEBUG("IH: UVD TRAP\n");
1234
1235	switch (entry->src_id) {
1236	case 124:
1237		amdgpu_fence_process(&adev->uvd.inst->ring);
1238		break;
1239	case 119:
1240		if (likely(uvd_v6_0_enc_support(adev)))
1241			amdgpu_fence_process(&adev->uvd.inst->ring_enc[0]);
1242		else
1243			int_handled = false;
1244		break;
1245	case 120:
1246		if (likely(uvd_v6_0_enc_support(adev)))
1247			amdgpu_fence_process(&adev->uvd.inst->ring_enc[1]);
1248		else
1249			int_handled = false;
1250		break;
1251	}
1252
1253	if (!int_handled)
1254		DRM_ERROR("Unhandled interrupt: %d %d\n",
1255			  entry->src_id, entry->src_data[0]);
1256
1257	return 0;
1258}
1259
1260static void uvd_v6_0_enable_clock_gating(struct amdgpu_device *adev, bool enable)
1261{
1262	uint32_t data1, data3;
1263
1264	data1 = RREG32(mmUVD_SUVD_CGC_GATE);
1265	data3 = RREG32(mmUVD_CGC_GATE);
1266
1267	data1 |= UVD_SUVD_CGC_GATE__SRE_MASK |
1268		     UVD_SUVD_CGC_GATE__SIT_MASK |
1269		     UVD_SUVD_CGC_GATE__SMP_MASK |
1270		     UVD_SUVD_CGC_GATE__SCM_MASK |
1271		     UVD_SUVD_CGC_GATE__SDB_MASK |
1272		     UVD_SUVD_CGC_GATE__SRE_H264_MASK |
1273		     UVD_SUVD_CGC_GATE__SRE_HEVC_MASK |
1274		     UVD_SUVD_CGC_GATE__SIT_H264_MASK |
1275		     UVD_SUVD_CGC_GATE__SIT_HEVC_MASK |
1276		     UVD_SUVD_CGC_GATE__SCM_H264_MASK |
1277		     UVD_SUVD_CGC_GATE__SCM_HEVC_MASK |
1278		     UVD_SUVD_CGC_GATE__SDB_H264_MASK |
1279		     UVD_SUVD_CGC_GATE__SDB_HEVC_MASK;
1280
1281	if (enable) {
1282		data3 |= (UVD_CGC_GATE__SYS_MASK       |
1283			UVD_CGC_GATE__UDEC_MASK      |
1284			UVD_CGC_GATE__MPEG2_MASK     |
1285			UVD_CGC_GATE__RBC_MASK       |
1286			UVD_CGC_GATE__LMI_MC_MASK    |
1287			UVD_CGC_GATE__LMI_UMC_MASK   |
1288			UVD_CGC_GATE__IDCT_MASK      |
1289			UVD_CGC_GATE__MPRD_MASK      |
1290			UVD_CGC_GATE__MPC_MASK       |
1291			UVD_CGC_GATE__LBSI_MASK      |
1292			UVD_CGC_GATE__LRBBM_MASK     |
1293			UVD_CGC_GATE__UDEC_RE_MASK   |
1294			UVD_CGC_GATE__UDEC_CM_MASK   |
1295			UVD_CGC_GATE__UDEC_IT_MASK   |
1296			UVD_CGC_GATE__UDEC_DB_MASK   |
1297			UVD_CGC_GATE__UDEC_MP_MASK   |
1298			UVD_CGC_GATE__WCB_MASK       |
1299			UVD_CGC_GATE__JPEG_MASK      |
1300			UVD_CGC_GATE__SCPU_MASK      |
1301			UVD_CGC_GATE__JPEG2_MASK);
1302		/* only in pg enabled, we can gate clock to vcpu*/
1303		if (adev->pg_flags & AMD_PG_SUPPORT_UVD)
1304			data3 |= UVD_CGC_GATE__VCPU_MASK;
1305
1306		data3 &= ~UVD_CGC_GATE__REGS_MASK;
1307	} else {
1308		data3 = 0;
1309	}
1310
1311	WREG32(mmUVD_SUVD_CGC_GATE, data1);
1312	WREG32(mmUVD_CGC_GATE, data3);
1313}
1314
1315static void uvd_v6_0_set_sw_clock_gating(struct amdgpu_device *adev)
1316{
1317	uint32_t data, data2;
1318
1319	data = RREG32(mmUVD_CGC_CTRL);
1320	data2 = RREG32(mmUVD_SUVD_CGC_CTRL);
1321
1322
1323	data &= ~(UVD_CGC_CTRL__CLK_OFF_DELAY_MASK |
1324		  UVD_CGC_CTRL__CLK_GATE_DLY_TIMER_MASK);
1325
1326
1327	data |= UVD_CGC_CTRL__DYN_CLOCK_MODE_MASK |
1328		(1 << REG_FIELD_SHIFT(UVD_CGC_CTRL, CLK_GATE_DLY_TIMER)) |
1329		(4 << REG_FIELD_SHIFT(UVD_CGC_CTRL, CLK_OFF_DELAY));
1330
1331	data &= ~(UVD_CGC_CTRL__UDEC_RE_MODE_MASK |
1332			UVD_CGC_CTRL__UDEC_CM_MODE_MASK |
1333			UVD_CGC_CTRL__UDEC_IT_MODE_MASK |
1334			UVD_CGC_CTRL__UDEC_DB_MODE_MASK |
1335			UVD_CGC_CTRL__UDEC_MP_MODE_MASK |
1336			UVD_CGC_CTRL__SYS_MODE_MASK |
1337			UVD_CGC_CTRL__UDEC_MODE_MASK |
1338			UVD_CGC_CTRL__MPEG2_MODE_MASK |
1339			UVD_CGC_CTRL__REGS_MODE_MASK |
1340			UVD_CGC_CTRL__RBC_MODE_MASK |
1341			UVD_CGC_CTRL__LMI_MC_MODE_MASK |
1342			UVD_CGC_CTRL__LMI_UMC_MODE_MASK |
1343			UVD_CGC_CTRL__IDCT_MODE_MASK |
1344			UVD_CGC_CTRL__MPRD_MODE_MASK |
1345			UVD_CGC_CTRL__MPC_MODE_MASK |
1346			UVD_CGC_CTRL__LBSI_MODE_MASK |
1347			UVD_CGC_CTRL__LRBBM_MODE_MASK |
1348			UVD_CGC_CTRL__WCB_MODE_MASK |
1349			UVD_CGC_CTRL__VCPU_MODE_MASK |
1350			UVD_CGC_CTRL__JPEG_MODE_MASK |
1351			UVD_CGC_CTRL__SCPU_MODE_MASK |
1352			UVD_CGC_CTRL__JPEG2_MODE_MASK);
1353	data2 &= ~(UVD_SUVD_CGC_CTRL__SRE_MODE_MASK |
1354			UVD_SUVD_CGC_CTRL__SIT_MODE_MASK |
1355			UVD_SUVD_CGC_CTRL__SMP_MODE_MASK |
1356			UVD_SUVD_CGC_CTRL__SCM_MODE_MASK |
1357			UVD_SUVD_CGC_CTRL__SDB_MODE_MASK);
1358
1359	WREG32(mmUVD_CGC_CTRL, data);
1360	WREG32(mmUVD_SUVD_CGC_CTRL, data2);
1361}
1362
1363#if 0
1364static void uvd_v6_0_set_hw_clock_gating(struct amdgpu_device *adev)
1365{
1366	uint32_t data, data1, cgc_flags, suvd_flags;
1367
1368	data = RREG32(mmUVD_CGC_GATE);
1369	data1 = RREG32(mmUVD_SUVD_CGC_GATE);
1370
1371	cgc_flags = UVD_CGC_GATE__SYS_MASK |
1372		UVD_CGC_GATE__UDEC_MASK |
1373		UVD_CGC_GATE__MPEG2_MASK |
1374		UVD_CGC_GATE__RBC_MASK |
1375		UVD_CGC_GATE__LMI_MC_MASK |
1376		UVD_CGC_GATE__IDCT_MASK |
1377		UVD_CGC_GATE__MPRD_MASK |
1378		UVD_CGC_GATE__MPC_MASK |
1379		UVD_CGC_GATE__LBSI_MASK |
1380		UVD_CGC_GATE__LRBBM_MASK |
1381		UVD_CGC_GATE__UDEC_RE_MASK |
1382		UVD_CGC_GATE__UDEC_CM_MASK |
1383		UVD_CGC_GATE__UDEC_IT_MASK |
1384		UVD_CGC_GATE__UDEC_DB_MASK |
1385		UVD_CGC_GATE__UDEC_MP_MASK |
1386		UVD_CGC_GATE__WCB_MASK |
1387		UVD_CGC_GATE__VCPU_MASK |
1388		UVD_CGC_GATE__SCPU_MASK |
1389		UVD_CGC_GATE__JPEG_MASK |
1390		UVD_CGC_GATE__JPEG2_MASK;
1391
1392	suvd_flags = UVD_SUVD_CGC_GATE__SRE_MASK |
1393				UVD_SUVD_CGC_GATE__SIT_MASK |
1394				UVD_SUVD_CGC_GATE__SMP_MASK |
1395				UVD_SUVD_CGC_GATE__SCM_MASK |
1396				UVD_SUVD_CGC_GATE__SDB_MASK;
1397
1398	data |= cgc_flags;
1399	data1 |= suvd_flags;
1400
1401	WREG32(mmUVD_CGC_GATE, data);
1402	WREG32(mmUVD_SUVD_CGC_GATE, data1);
1403}
1404#endif
1405
1406static void uvd_v6_0_enable_mgcg(struct amdgpu_device *adev,
1407				 bool enable)
1408{
1409	u32 orig, data;
1410
1411	if (enable && (adev->cg_flags & AMD_CG_SUPPORT_UVD_MGCG)) {
1412		data = RREG32_UVD_CTX(ixUVD_CGC_MEM_CTRL);
1413		data |= 0xfff;
1414		WREG32_UVD_CTX(ixUVD_CGC_MEM_CTRL, data);
1415
1416		orig = data = RREG32(mmUVD_CGC_CTRL);
1417		data |= UVD_CGC_CTRL__DYN_CLOCK_MODE_MASK;
1418		if (orig != data)
1419			WREG32(mmUVD_CGC_CTRL, data);
1420	} else {
1421		data = RREG32_UVD_CTX(ixUVD_CGC_MEM_CTRL);
1422		data &= ~0xfff;
1423		WREG32_UVD_CTX(ixUVD_CGC_MEM_CTRL, data);
1424
1425		orig = data = RREG32(mmUVD_CGC_CTRL);
1426		data &= ~UVD_CGC_CTRL__DYN_CLOCK_MODE_MASK;
1427		if (orig != data)
1428			WREG32(mmUVD_CGC_CTRL, data);
1429	}
1430}
1431
1432static int uvd_v6_0_set_clockgating_state(void *handle,
1433					  enum amd_clockgating_state state)
1434{
1435	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
1436	bool enable = (state == AMD_CG_STATE_GATE);
1437
1438	if (enable) {
1439		/* wait for STATUS to clear */
1440		if (uvd_v6_0_wait_for_idle(handle))
1441			return -EBUSY;
1442		uvd_v6_0_enable_clock_gating(adev, true);
1443		/* enable HW gates because UVD is idle */
1444/*		uvd_v6_0_set_hw_clock_gating(adev); */
1445	} else {
1446		/* disable HW gating and enable Sw gating */
1447		uvd_v6_0_enable_clock_gating(adev, false);
1448	}
1449	uvd_v6_0_set_sw_clock_gating(adev);
1450	return 0;
1451}
1452
1453static int uvd_v6_0_set_powergating_state(void *handle,
1454					  enum amd_powergating_state state)
1455{
1456	/* This doesn't actually powergate the UVD block.
1457	 * That's done in the dpm code via the SMC.  This
1458	 * just re-inits the block as necessary.  The actual
1459	 * gating still happens in the dpm code.  We should
1460	 * revisit this when there is a cleaner line between
1461	 * the smc and the hw blocks
1462	 */
1463	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
1464	int ret = 0;
1465
1466	WREG32(mmUVD_POWER_STATUS, UVD_POWER_STATUS__UVD_PG_EN_MASK);
1467
1468	if (state == AMD_PG_STATE_GATE) {
1469		uvd_v6_0_stop(adev);
1470	} else {
1471		ret = uvd_v6_0_start(adev);
1472		if (ret)
1473			goto out;
1474	}
1475
1476out:
1477	return ret;
1478}
1479
1480static void uvd_v6_0_get_clockgating_state(void *handle, u32 *flags)
1481{
1482	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
1483	int data;
1484
1485	mutex_lock(&adev->pm.mutex);
1486
1487	if (adev->flags & AMD_IS_APU)
1488		data = RREG32_SMC(ixCURRENT_PG_STATUS_APU);
1489	else
1490		data = RREG32_SMC(ixCURRENT_PG_STATUS);
1491
1492	if (data & CURRENT_PG_STATUS__UVD_PG_STATUS_MASK) {
1493		DRM_INFO("Cannot get clockgating state when UVD is powergated.\n");
1494		goto out;
1495	}
1496
1497	/* AMD_CG_SUPPORT_UVD_MGCG */
1498	data = RREG32(mmUVD_CGC_CTRL);
1499	if (data & UVD_CGC_CTRL__DYN_CLOCK_MODE_MASK)
1500		*flags |= AMD_CG_SUPPORT_UVD_MGCG;
1501
1502out:
1503	mutex_unlock(&adev->pm.mutex);
1504}
1505
1506static const struct amd_ip_funcs uvd_v6_0_ip_funcs = {
1507	.name = "uvd_v6_0",
1508	.early_init = uvd_v6_0_early_init,
1509	.late_init = NULL,
1510	.sw_init = uvd_v6_0_sw_init,
1511	.sw_fini = uvd_v6_0_sw_fini,
1512	.hw_init = uvd_v6_0_hw_init,
1513	.hw_fini = uvd_v6_0_hw_fini,
 
1514	.suspend = uvd_v6_0_suspend,
1515	.resume = uvd_v6_0_resume,
1516	.is_idle = uvd_v6_0_is_idle,
1517	.wait_for_idle = uvd_v6_0_wait_for_idle,
1518	.check_soft_reset = uvd_v6_0_check_soft_reset,
1519	.pre_soft_reset = uvd_v6_0_pre_soft_reset,
1520	.soft_reset = uvd_v6_0_soft_reset,
1521	.post_soft_reset = uvd_v6_0_post_soft_reset,
1522	.set_clockgating_state = uvd_v6_0_set_clockgating_state,
1523	.set_powergating_state = uvd_v6_0_set_powergating_state,
1524	.get_clockgating_state = uvd_v6_0_get_clockgating_state,
1525};
1526
1527static const struct amdgpu_ring_funcs uvd_v6_0_ring_phys_funcs = {
1528	.type = AMDGPU_RING_TYPE_UVD,
1529	.align_mask = 0xf,
1530	.support_64bit_ptrs = false,
1531	.no_user_fence = true,
1532	.get_rptr = uvd_v6_0_ring_get_rptr,
1533	.get_wptr = uvd_v6_0_ring_get_wptr,
1534	.set_wptr = uvd_v6_0_ring_set_wptr,
1535	.parse_cs = amdgpu_uvd_ring_parse_cs,
1536	.emit_frame_size =
1537		6 + /* hdp invalidate */
1538		10 + /* uvd_v6_0_ring_emit_pipeline_sync */
1539		14, /* uvd_v6_0_ring_emit_fence x1 no user fence */
1540	.emit_ib_size = 8, /* uvd_v6_0_ring_emit_ib */
1541	.emit_ib = uvd_v6_0_ring_emit_ib,
1542	.emit_fence = uvd_v6_0_ring_emit_fence,
1543	.emit_hdp_flush = uvd_v6_0_ring_emit_hdp_flush,
1544	.test_ring = uvd_v6_0_ring_test_ring,
1545	.test_ib = amdgpu_uvd_ring_test_ib,
1546	.insert_nop = uvd_v6_0_ring_insert_nop,
1547	.pad_ib = amdgpu_ring_generic_pad_ib,
1548	.begin_use = amdgpu_uvd_ring_begin_use,
1549	.end_use = amdgpu_uvd_ring_end_use,
1550	.emit_wreg = uvd_v6_0_ring_emit_wreg,
1551};
1552
1553static const struct amdgpu_ring_funcs uvd_v6_0_ring_vm_funcs = {
1554	.type = AMDGPU_RING_TYPE_UVD,
1555	.align_mask = 0xf,
1556	.support_64bit_ptrs = false,
1557	.no_user_fence = true,
1558	.get_rptr = uvd_v6_0_ring_get_rptr,
1559	.get_wptr = uvd_v6_0_ring_get_wptr,
1560	.set_wptr = uvd_v6_0_ring_set_wptr,
1561	.emit_frame_size =
1562		6 + /* hdp invalidate */
1563		10 + /* uvd_v6_0_ring_emit_pipeline_sync */
1564		VI_FLUSH_GPU_TLB_NUM_WREG * 6 + 8 + /* uvd_v6_0_ring_emit_vm_flush */
1565		14 + 14, /* uvd_v6_0_ring_emit_fence x2 vm fence */
1566	.emit_ib_size = 8, /* uvd_v6_0_ring_emit_ib */
1567	.emit_ib = uvd_v6_0_ring_emit_ib,
1568	.emit_fence = uvd_v6_0_ring_emit_fence,
1569	.emit_vm_flush = uvd_v6_0_ring_emit_vm_flush,
1570	.emit_pipeline_sync = uvd_v6_0_ring_emit_pipeline_sync,
1571	.emit_hdp_flush = uvd_v6_0_ring_emit_hdp_flush,
1572	.test_ring = uvd_v6_0_ring_test_ring,
1573	.test_ib = amdgpu_uvd_ring_test_ib,
1574	.insert_nop = uvd_v6_0_ring_insert_nop,
1575	.pad_ib = amdgpu_ring_generic_pad_ib,
1576	.begin_use = amdgpu_uvd_ring_begin_use,
1577	.end_use = amdgpu_uvd_ring_end_use,
1578	.emit_wreg = uvd_v6_0_ring_emit_wreg,
1579};
1580
1581static const struct amdgpu_ring_funcs uvd_v6_0_enc_ring_vm_funcs = {
1582	.type = AMDGPU_RING_TYPE_UVD_ENC,
1583	.align_mask = 0x3f,
1584	.nop = HEVC_ENC_CMD_NO_OP,
1585	.support_64bit_ptrs = false,
1586	.no_user_fence = true,
1587	.get_rptr = uvd_v6_0_enc_ring_get_rptr,
1588	.get_wptr = uvd_v6_0_enc_ring_get_wptr,
1589	.set_wptr = uvd_v6_0_enc_ring_set_wptr,
1590	.emit_frame_size =
1591		4 + /* uvd_v6_0_enc_ring_emit_pipeline_sync */
1592		5 + /* uvd_v6_0_enc_ring_emit_vm_flush */
1593		5 + 5 + /* uvd_v6_0_enc_ring_emit_fence x2 vm fence */
1594		1, /* uvd_v6_0_enc_ring_insert_end */
1595	.emit_ib_size = 5, /* uvd_v6_0_enc_ring_emit_ib */
1596	.emit_ib = uvd_v6_0_enc_ring_emit_ib,
1597	.emit_fence = uvd_v6_0_enc_ring_emit_fence,
1598	.emit_vm_flush = uvd_v6_0_enc_ring_emit_vm_flush,
1599	.emit_pipeline_sync = uvd_v6_0_enc_ring_emit_pipeline_sync,
1600	.test_ring = uvd_v6_0_enc_ring_test_ring,
1601	.test_ib = uvd_v6_0_enc_ring_test_ib,
1602	.insert_nop = amdgpu_ring_insert_nop,
1603	.insert_end = uvd_v6_0_enc_ring_insert_end,
1604	.pad_ib = amdgpu_ring_generic_pad_ib,
1605	.begin_use = amdgpu_uvd_ring_begin_use,
1606	.end_use = amdgpu_uvd_ring_end_use,
1607};
1608
1609static void uvd_v6_0_set_ring_funcs(struct amdgpu_device *adev)
1610{
1611	if (adev->asic_type >= CHIP_POLARIS10) {
1612		adev->uvd.inst->ring.funcs = &uvd_v6_0_ring_vm_funcs;
1613		DRM_INFO("UVD is enabled in VM mode\n");
1614	} else {
1615		adev->uvd.inst->ring.funcs = &uvd_v6_0_ring_phys_funcs;
1616		DRM_INFO("UVD is enabled in physical mode\n");
1617	}
1618}
1619
1620static void uvd_v6_0_set_enc_ring_funcs(struct amdgpu_device *adev)
1621{
1622	int i;
1623
1624	for (i = 0; i < adev->uvd.num_enc_rings; ++i)
1625		adev->uvd.inst->ring_enc[i].funcs = &uvd_v6_0_enc_ring_vm_funcs;
1626
1627	DRM_INFO("UVD ENC is enabled in VM mode\n");
1628}
1629
1630static const struct amdgpu_irq_src_funcs uvd_v6_0_irq_funcs = {
1631	.set = uvd_v6_0_set_interrupt_state,
1632	.process = uvd_v6_0_process_interrupt,
1633};
1634
1635static void uvd_v6_0_set_irq_funcs(struct amdgpu_device *adev)
1636{
1637	if (uvd_v6_0_enc_support(adev))
1638		adev->uvd.inst->irq.num_types = adev->uvd.num_enc_rings + 1;
1639	else
1640		adev->uvd.inst->irq.num_types = 1;
1641
1642	adev->uvd.inst->irq.funcs = &uvd_v6_0_irq_funcs;
1643}
1644
1645const struct amdgpu_ip_block_version uvd_v6_0_ip_block =
1646{
1647		.type = AMD_IP_BLOCK_TYPE_UVD,
1648		.major = 6,
1649		.minor = 0,
1650		.rev = 0,
1651		.funcs = &uvd_v6_0_ip_funcs,
1652};
1653
1654const struct amdgpu_ip_block_version uvd_v6_2_ip_block =
1655{
1656		.type = AMD_IP_BLOCK_TYPE_UVD,
1657		.major = 6,
1658		.minor = 2,
1659		.rev = 0,
1660		.funcs = &uvd_v6_0_ip_funcs,
1661};
1662
1663const struct amdgpu_ip_block_version uvd_v6_3_ip_block =
1664{
1665		.type = AMD_IP_BLOCK_TYPE_UVD,
1666		.major = 6,
1667		.minor = 3,
1668		.rev = 0,
1669		.funcs = &uvd_v6_0_ip_funcs,
1670};