Linux Audio

Check our new training course

Linux debugging, profiling, tracing and performance analysis training

Apr 14-17, 2025
Register
Loading...
Note: File does not exist in v4.6.
   1/*
   2 * Copyright 2016 Advanced Micro Devices, Inc.
   3 *
   4 * Permission is hereby granted, free of charge, to any person obtaining a
   5 * copy of this software and associated documentation files (the "Software"),
   6 * to deal in the Software without restriction, including without limitation
   7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
   8 * and/or sell copies of the Software, and to permit persons to whom the
   9 * Software is furnished to do so, subject to the following conditions:
  10 *
  11 * The above copyright notice and this permission notice shall be included in
  12 * all copies or substantial portions of the Software.
  13 *
  14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
  17 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
  18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
  19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
  20 * OTHER DEALINGS IN THE SOFTWARE.
  21 *
  22 */
  23
  24#include <linux/module.h>
  25
  26#ifdef CONFIG_X86
  27#include <asm/hypervisor.h>
  28#endif
  29
  30#include <drm/drm_drv.h>
  31#include <xen/xen.h>
  32
  33#include "amdgpu.h"
  34#include "amdgpu_ras.h"
  35#include "amdgpu_reset.h"
  36#include "amdgpu_dpm.h"
  37#include "vi.h"
  38#include "soc15.h"
  39#include "nv.h"
  40
  41#define POPULATE_UCODE_INFO(vf2pf_info, ucode, ver) \
  42	do { \
  43		vf2pf_info->ucode_info[ucode].id = ucode; \
  44		vf2pf_info->ucode_info[ucode].version = ver; \
  45	} while (0)
  46
  47bool amdgpu_virt_mmio_blocked(struct amdgpu_device *adev)
  48{
  49	/* By now all MMIO pages except mailbox are blocked */
  50	/* if blocking is enabled in hypervisor. Choose the */
  51	/* SCRATCH_REG0 to test. */
  52	return RREG32_NO_KIQ(0xc040) == 0xffffffff;
  53}
  54
  55void amdgpu_virt_init_setting(struct amdgpu_device *adev)
  56{
  57	struct drm_device *ddev = adev_to_drm(adev);
  58
  59	/* enable virtual display */
  60	if (adev->asic_type != CHIP_ALDEBARAN &&
  61	    adev->asic_type != CHIP_ARCTURUS &&
  62	    ((adev->pdev->class >> 8) != PCI_CLASS_ACCELERATOR_PROCESSING)) {
  63		if (adev->mode_info.num_crtc == 0)
  64			adev->mode_info.num_crtc = 1;
  65		adev->enable_virtual_display = true;
  66	}
  67	ddev->driver_features &= ~DRIVER_ATOMIC;
  68	adev->cg_flags = 0;
  69	adev->pg_flags = 0;
  70
  71	/* Reduce kcq number to 2 to reduce latency */
  72	if (amdgpu_num_kcq == -1)
  73		amdgpu_num_kcq = 2;
  74}
  75
  76/**
  77 * amdgpu_virt_request_full_gpu() - request full gpu access
  78 * @adev:	amdgpu device.
  79 * @init:	is driver init time.
  80 * When start to init/fini driver, first need to request full gpu access.
  81 * Return: Zero if request success, otherwise will return error.
  82 */
  83int amdgpu_virt_request_full_gpu(struct amdgpu_device *adev, bool init)
  84{
  85	struct amdgpu_virt *virt = &adev->virt;
  86	int r;
  87
  88	if (virt->ops && virt->ops->req_full_gpu) {
  89		r = virt->ops->req_full_gpu(adev, init);
  90		if (r) {
  91			adev->no_hw_access = true;
  92			return r;
  93		}
  94
  95		adev->virt.caps &= ~AMDGPU_SRIOV_CAPS_RUNTIME;
  96	}
  97
  98	return 0;
  99}
 100
 101/**
 102 * amdgpu_virt_release_full_gpu() - release full gpu access
 103 * @adev:	amdgpu device.
 104 * @init:	is driver init time.
 105 * When finishing driver init/fini, need to release full gpu access.
 106 * Return: Zero if release success, otherwise will returen error.
 107 */
 108int amdgpu_virt_release_full_gpu(struct amdgpu_device *adev, bool init)
 109{
 110	struct amdgpu_virt *virt = &adev->virt;
 111	int r;
 112
 113	if (virt->ops && virt->ops->rel_full_gpu) {
 114		r = virt->ops->rel_full_gpu(adev, init);
 115		if (r)
 116			return r;
 117
 118		adev->virt.caps |= AMDGPU_SRIOV_CAPS_RUNTIME;
 119	}
 120	return 0;
 121}
 122
 123/**
 124 * amdgpu_virt_reset_gpu() - reset gpu
 125 * @adev:	amdgpu device.
 126 * Send reset command to GPU hypervisor to reset GPU that VM is using
 127 * Return: Zero if reset success, otherwise will return error.
 128 */
 129int amdgpu_virt_reset_gpu(struct amdgpu_device *adev)
 130{
 131	struct amdgpu_virt *virt = &adev->virt;
 132	int r;
 133
 134	if (virt->ops && virt->ops->reset_gpu) {
 135		r = virt->ops->reset_gpu(adev);
 136		if (r)
 137			return r;
 138
 139		adev->virt.caps &= ~AMDGPU_SRIOV_CAPS_RUNTIME;
 140	}
 141
 142	return 0;
 143}
 144
 145void amdgpu_virt_request_init_data(struct amdgpu_device *adev)
 146{
 147	struct amdgpu_virt *virt = &adev->virt;
 148
 149	if (virt->ops && virt->ops->req_init_data)
 150		virt->ops->req_init_data(adev);
 151
 152	if (adev->virt.req_init_data_ver > 0)
 153		DRM_INFO("host supports REQ_INIT_DATA handshake\n");
 154	else
 155		DRM_WARN("host doesn't support REQ_INIT_DATA handshake\n");
 156}
 157
 158/**
 159 * amdgpu_virt_ready_to_reset() - send ready to reset to host
 160 * @adev:	amdgpu device.
 161 * Send ready to reset message to GPU hypervisor to signal we have stopped GPU
 162 * activity and is ready for host FLR
 163 */
 164void amdgpu_virt_ready_to_reset(struct amdgpu_device *adev)
 165{
 166	struct amdgpu_virt *virt = &adev->virt;
 167
 168	if (virt->ops && virt->ops->reset_gpu)
 169		virt->ops->ready_to_reset(adev);
 170}
 171
 172/**
 173 * amdgpu_virt_wait_reset() - wait for reset gpu completed
 174 * @adev:	amdgpu device.
 175 * Wait for GPU reset completed.
 176 * Return: Zero if reset success, otherwise will return error.
 177 */
 178int amdgpu_virt_wait_reset(struct amdgpu_device *adev)
 179{
 180	struct amdgpu_virt *virt = &adev->virt;
 181
 182	if (!virt->ops || !virt->ops->wait_reset)
 183		return -EINVAL;
 184
 185	return virt->ops->wait_reset(adev);
 186}
 187
 188/**
 189 * amdgpu_virt_alloc_mm_table() - alloc memory for mm table
 190 * @adev:	amdgpu device.
 191 * MM table is used by UVD and VCE for its initialization
 192 * Return: Zero if allocate success.
 193 */
 194int amdgpu_virt_alloc_mm_table(struct amdgpu_device *adev)
 195{
 196	int r;
 197
 198	if (!amdgpu_sriov_vf(adev) || adev->virt.mm_table.gpu_addr)
 199		return 0;
 200
 201	r = amdgpu_bo_create_kernel(adev, PAGE_SIZE, PAGE_SIZE,
 202				    AMDGPU_GEM_DOMAIN_VRAM |
 203				    AMDGPU_GEM_DOMAIN_GTT,
 204				    &adev->virt.mm_table.bo,
 205				    &adev->virt.mm_table.gpu_addr,
 206				    (void *)&adev->virt.mm_table.cpu_addr);
 207	if (r) {
 208		DRM_ERROR("failed to alloc mm table and error = %d.\n", r);
 209		return r;
 210	}
 211
 212	memset((void *)adev->virt.mm_table.cpu_addr, 0, PAGE_SIZE);
 213	DRM_INFO("MM table gpu addr = 0x%llx, cpu addr = %p.\n",
 214		 adev->virt.mm_table.gpu_addr,
 215		 adev->virt.mm_table.cpu_addr);
 216	return 0;
 217}
 218
 219/**
 220 * amdgpu_virt_free_mm_table() - free mm table memory
 221 * @adev:	amdgpu device.
 222 * Free MM table memory
 223 */
 224void amdgpu_virt_free_mm_table(struct amdgpu_device *adev)
 225{
 226	if (!amdgpu_sriov_vf(adev) || !adev->virt.mm_table.gpu_addr)
 227		return;
 228
 229	amdgpu_bo_free_kernel(&adev->virt.mm_table.bo,
 230			      &adev->virt.mm_table.gpu_addr,
 231			      (void *)&adev->virt.mm_table.cpu_addr);
 232	adev->virt.mm_table.gpu_addr = 0;
 233}
 234
 235/**
 236 * amdgpu_virt_rcvd_ras_interrupt() - receive ras interrupt
 237 * @adev:	amdgpu device.
 238 * Check whether host sent RAS error message
 239 * Return: true if found, otherwise false
 240 */
 241bool amdgpu_virt_rcvd_ras_interrupt(struct amdgpu_device *adev)
 242{
 243	struct amdgpu_virt *virt = &adev->virt;
 244
 245	if (!virt->ops || !virt->ops->rcvd_ras_intr)
 246		return false;
 247
 248	return virt->ops->rcvd_ras_intr(adev);
 249}
 250
 251
 252unsigned int amd_sriov_msg_checksum(void *obj,
 253				unsigned long obj_size,
 254				unsigned int key,
 255				unsigned int checksum)
 256{
 257	unsigned int ret = key;
 258	unsigned long i = 0;
 259	unsigned char *pos;
 260
 261	pos = (char *)obj;
 262	/* calculate checksum */
 263	for (i = 0; i < obj_size; ++i)
 264		ret += *(pos + i);
 265	/* minus the checksum itself */
 266	pos = (char *)&checksum;
 267	for (i = 0; i < sizeof(checksum); ++i)
 268		ret -= *(pos + i);
 269	return ret;
 270}
 271
 272static int amdgpu_virt_init_ras_err_handler_data(struct amdgpu_device *adev)
 273{
 274	struct amdgpu_virt *virt = &adev->virt;
 275	struct amdgpu_virt_ras_err_handler_data **data = &virt->virt_eh_data;
 276	/* GPU will be marked bad on host if bp count more then 10,
 277	 * so alloc 512 is enough.
 278	 */
 279	unsigned int align_space = 512;
 280	void *bps = NULL;
 281	struct amdgpu_bo **bps_bo = NULL;
 282
 283	*data = kmalloc(sizeof(struct amdgpu_virt_ras_err_handler_data), GFP_KERNEL);
 284	if (!*data)
 285		goto data_failure;
 286
 287	bps = kmalloc_array(align_space, sizeof(*(*data)->bps), GFP_KERNEL);
 288	if (!bps)
 289		goto bps_failure;
 290
 291	bps_bo = kmalloc_array(align_space, sizeof(*(*data)->bps_bo), GFP_KERNEL);
 292	if (!bps_bo)
 293		goto bps_bo_failure;
 294
 295	(*data)->bps = bps;
 296	(*data)->bps_bo = bps_bo;
 297	(*data)->count = 0;
 298	(*data)->last_reserved = 0;
 299
 300	virt->ras_init_done = true;
 301
 302	return 0;
 303
 304bps_bo_failure:
 305	kfree(bps);
 306bps_failure:
 307	kfree(*data);
 308data_failure:
 309	return -ENOMEM;
 310}
 311
 312static void amdgpu_virt_ras_release_bp(struct amdgpu_device *adev)
 313{
 314	struct amdgpu_virt *virt = &adev->virt;
 315	struct amdgpu_virt_ras_err_handler_data *data = virt->virt_eh_data;
 316	struct amdgpu_bo *bo;
 317	int i;
 318
 319	if (!data)
 320		return;
 321
 322	for (i = data->last_reserved - 1; i >= 0; i--) {
 323		bo = data->bps_bo[i];
 324		if (bo) {
 325			amdgpu_bo_free_kernel(&bo, NULL, NULL);
 326			data->bps_bo[i] = bo;
 327		}
 328		data->last_reserved = i;
 329	}
 330}
 331
 332void amdgpu_virt_release_ras_err_handler_data(struct amdgpu_device *adev)
 333{
 334	struct amdgpu_virt *virt = &adev->virt;
 335	struct amdgpu_virt_ras_err_handler_data *data = virt->virt_eh_data;
 336
 337	virt->ras_init_done = false;
 338
 339	if (!data)
 340		return;
 341
 342	amdgpu_virt_ras_release_bp(adev);
 343
 344	kfree(data->bps);
 345	kfree(data->bps_bo);
 346	kfree(data);
 347	virt->virt_eh_data = NULL;
 348}
 349
 350static void amdgpu_virt_ras_add_bps(struct amdgpu_device *adev,
 351		struct eeprom_table_record *bps, int pages)
 352{
 353	struct amdgpu_virt *virt = &adev->virt;
 354	struct amdgpu_virt_ras_err_handler_data *data = virt->virt_eh_data;
 355
 356	if (!data)
 357		return;
 358
 359	memcpy(&data->bps[data->count], bps, pages * sizeof(*data->bps));
 360	data->count += pages;
 361}
 362
 363static void amdgpu_virt_ras_reserve_bps(struct amdgpu_device *adev)
 364{
 365	struct amdgpu_virt *virt = &adev->virt;
 366	struct amdgpu_virt_ras_err_handler_data *data = virt->virt_eh_data;
 367	struct amdgpu_vram_mgr *mgr = &adev->mman.vram_mgr;
 368	struct ttm_resource_manager *man = &mgr->manager;
 369	struct amdgpu_bo *bo = NULL;
 370	uint64_t bp;
 371	int i;
 372
 373	if (!data)
 374		return;
 375
 376	for (i = data->last_reserved; i < data->count; i++) {
 377		bp = data->bps[i].retired_page;
 378
 379		/* There are two cases of reserve error should be ignored:
 380		 * 1) a ras bad page has been allocated (used by someone);
 381		 * 2) a ras bad page has been reserved (duplicate error injection
 382		 *    for one page);
 383		 */
 384		if  (ttm_resource_manager_used(man)) {
 385			amdgpu_vram_mgr_reserve_range(&adev->mman.vram_mgr,
 386				bp << AMDGPU_GPU_PAGE_SHIFT,
 387				AMDGPU_GPU_PAGE_SIZE);
 388			data->bps_bo[i] = NULL;
 389		} else {
 390			if (amdgpu_bo_create_kernel_at(adev, bp << AMDGPU_GPU_PAGE_SHIFT,
 391							AMDGPU_GPU_PAGE_SIZE,
 392							&bo, NULL))
 393				DRM_DEBUG("RAS WARN: reserve vram for retired page %llx fail\n", bp);
 394			data->bps_bo[i] = bo;
 395		}
 396		data->last_reserved = i + 1;
 397		bo = NULL;
 398	}
 399}
 400
 401static bool amdgpu_virt_ras_check_bad_page(struct amdgpu_device *adev,
 402		uint64_t retired_page)
 403{
 404	struct amdgpu_virt *virt = &adev->virt;
 405	struct amdgpu_virt_ras_err_handler_data *data = virt->virt_eh_data;
 406	int i;
 407
 408	if (!data)
 409		return true;
 410
 411	for (i = 0; i < data->count; i++)
 412		if (retired_page == data->bps[i].retired_page)
 413			return true;
 414
 415	return false;
 416}
 417
 418static void amdgpu_virt_add_bad_page(struct amdgpu_device *adev,
 419		uint64_t bp_block_offset, uint32_t bp_block_size)
 420{
 421	struct eeprom_table_record bp;
 422	uint64_t retired_page;
 423	uint32_t bp_idx, bp_cnt;
 424	void *vram_usage_va = NULL;
 425
 426	if (adev->mman.fw_vram_usage_va)
 427		vram_usage_va = adev->mman.fw_vram_usage_va;
 428	else
 429		vram_usage_va = adev->mman.drv_vram_usage_va;
 430
 431	memset(&bp, 0, sizeof(bp));
 432
 433	if (bp_block_size) {
 434		bp_cnt = bp_block_size / sizeof(uint64_t);
 435		for (bp_idx = 0; bp_idx < bp_cnt; bp_idx++) {
 436			retired_page = *(uint64_t *)(vram_usage_va +
 437					bp_block_offset + bp_idx * sizeof(uint64_t));
 438			bp.retired_page = retired_page;
 439
 440			if (amdgpu_virt_ras_check_bad_page(adev, retired_page))
 441				continue;
 442
 443			amdgpu_virt_ras_add_bps(adev, &bp, 1);
 444
 445			amdgpu_virt_ras_reserve_bps(adev);
 446		}
 447	}
 448}
 449
 450static int amdgpu_virt_read_pf2vf_data(struct amdgpu_device *adev)
 451{
 452	struct amd_sriov_msg_pf2vf_info_header *pf2vf_info = adev->virt.fw_reserve.p_pf2vf;
 453	uint32_t checksum;
 454	uint32_t checkval;
 455
 456	uint32_t i;
 457	uint32_t tmp;
 458
 459	if (adev->virt.fw_reserve.p_pf2vf == NULL)
 460		return -EINVAL;
 461
 462	if (pf2vf_info->size > 1024) {
 463		dev_err(adev->dev, "invalid pf2vf message size: 0x%x\n", pf2vf_info->size);
 464		return -EINVAL;
 465	}
 466
 467	switch (pf2vf_info->version) {
 468	case 1:
 469		checksum = ((struct amdgim_pf2vf_info_v1 *)pf2vf_info)->checksum;
 470		checkval = amd_sriov_msg_checksum(
 471			adev->virt.fw_reserve.p_pf2vf, pf2vf_info->size,
 472			adev->virt.fw_reserve.checksum_key, checksum);
 473		if (checksum != checkval) {
 474			dev_err(adev->dev,
 475				"invalid pf2vf message: header checksum=0x%x calculated checksum=0x%x\n",
 476				checksum, checkval);
 477			return -EINVAL;
 478		}
 479
 480		adev->virt.gim_feature =
 481			((struct amdgim_pf2vf_info_v1 *)pf2vf_info)->feature_flags;
 482		break;
 483	case 2:
 484		/* TODO: missing key, need to add it later */
 485		checksum = ((struct amd_sriov_msg_pf2vf_info *)pf2vf_info)->checksum;
 486		checkval = amd_sriov_msg_checksum(
 487			adev->virt.fw_reserve.p_pf2vf, pf2vf_info->size,
 488			0, checksum);
 489		if (checksum != checkval) {
 490			dev_err(adev->dev,
 491				"invalid pf2vf message: header checksum=0x%x calculated checksum=0x%x\n",
 492				checksum, checkval);
 493			return -EINVAL;
 494		}
 495
 496		adev->virt.vf2pf_update_interval_ms =
 497			((struct amd_sriov_msg_pf2vf_info *)pf2vf_info)->vf2pf_update_interval_ms;
 498		adev->virt.gim_feature =
 499			((struct amd_sriov_msg_pf2vf_info *)pf2vf_info)->feature_flags.all;
 500		adev->virt.reg_access =
 501			((struct amd_sriov_msg_pf2vf_info *)pf2vf_info)->reg_access_flags.all;
 502
 503		adev->virt.decode_max_dimension_pixels = 0;
 504		adev->virt.decode_max_frame_pixels = 0;
 505		adev->virt.encode_max_dimension_pixels = 0;
 506		adev->virt.encode_max_frame_pixels = 0;
 507		adev->virt.is_mm_bw_enabled = false;
 508		for (i = 0; i < AMD_SRIOV_MSG_RESERVE_VCN_INST; i++) {
 509			tmp = ((struct amd_sriov_msg_pf2vf_info *)pf2vf_info)->mm_bw_management[i].decode_max_dimension_pixels;
 510			adev->virt.decode_max_dimension_pixels = max(tmp, adev->virt.decode_max_dimension_pixels);
 511
 512			tmp = ((struct amd_sriov_msg_pf2vf_info *)pf2vf_info)->mm_bw_management[i].decode_max_frame_pixels;
 513			adev->virt.decode_max_frame_pixels = max(tmp, adev->virt.decode_max_frame_pixels);
 514
 515			tmp = ((struct amd_sriov_msg_pf2vf_info *)pf2vf_info)->mm_bw_management[i].encode_max_dimension_pixels;
 516			adev->virt.encode_max_dimension_pixels = max(tmp, adev->virt.encode_max_dimension_pixels);
 517
 518			tmp = ((struct amd_sriov_msg_pf2vf_info *)pf2vf_info)->mm_bw_management[i].encode_max_frame_pixels;
 519			adev->virt.encode_max_frame_pixels = max(tmp, adev->virt.encode_max_frame_pixels);
 520		}
 521		if ((adev->virt.decode_max_dimension_pixels > 0) || (adev->virt.encode_max_dimension_pixels > 0))
 522			adev->virt.is_mm_bw_enabled = true;
 523
 524		adev->unique_id =
 525			((struct amd_sriov_msg_pf2vf_info *)pf2vf_info)->uuid;
 526		adev->virt.ras_en_caps.all = ((struct amd_sriov_msg_pf2vf_info *)pf2vf_info)->ras_en_caps.all;
 527		adev->virt.ras_telemetry_en_caps.all =
 528			((struct amd_sriov_msg_pf2vf_info *)pf2vf_info)->ras_telemetry_en_caps.all;
 529		break;
 530	default:
 531		dev_err(adev->dev, "invalid pf2vf version: 0x%x\n", pf2vf_info->version);
 532		return -EINVAL;
 533	}
 534
 535	/* correct too large or too little interval value */
 536	if (adev->virt.vf2pf_update_interval_ms < 200 || adev->virt.vf2pf_update_interval_ms > 10000)
 537		adev->virt.vf2pf_update_interval_ms = 2000;
 538
 539	return 0;
 540}
 541
 542static void amdgpu_virt_populate_vf2pf_ucode_info(struct amdgpu_device *adev)
 543{
 544	struct amd_sriov_msg_vf2pf_info *vf2pf_info;
 545	vf2pf_info = (struct amd_sriov_msg_vf2pf_info *) adev->virt.fw_reserve.p_vf2pf;
 546
 547	if (adev->virt.fw_reserve.p_vf2pf == NULL)
 548		return;
 549
 550	POPULATE_UCODE_INFO(vf2pf_info, AMD_SRIOV_UCODE_ID_VCE,      adev->vce.fw_version);
 551	POPULATE_UCODE_INFO(vf2pf_info, AMD_SRIOV_UCODE_ID_UVD,      adev->uvd.fw_version);
 552	POPULATE_UCODE_INFO(vf2pf_info, AMD_SRIOV_UCODE_ID_MC,       adev->gmc.fw_version);
 553	POPULATE_UCODE_INFO(vf2pf_info, AMD_SRIOV_UCODE_ID_ME,       adev->gfx.me_fw_version);
 554	POPULATE_UCODE_INFO(vf2pf_info, AMD_SRIOV_UCODE_ID_PFP,      adev->gfx.pfp_fw_version);
 555	POPULATE_UCODE_INFO(vf2pf_info, AMD_SRIOV_UCODE_ID_CE,       adev->gfx.ce_fw_version);
 556	POPULATE_UCODE_INFO(vf2pf_info, AMD_SRIOV_UCODE_ID_RLC,      adev->gfx.rlc_fw_version);
 557	POPULATE_UCODE_INFO(vf2pf_info, AMD_SRIOV_UCODE_ID_RLC_SRLC, adev->gfx.rlc_srlc_fw_version);
 558	POPULATE_UCODE_INFO(vf2pf_info, AMD_SRIOV_UCODE_ID_RLC_SRLG, adev->gfx.rlc_srlg_fw_version);
 559	POPULATE_UCODE_INFO(vf2pf_info, AMD_SRIOV_UCODE_ID_RLC_SRLS, adev->gfx.rlc_srls_fw_version);
 560	POPULATE_UCODE_INFO(vf2pf_info, AMD_SRIOV_UCODE_ID_MEC,      adev->gfx.mec_fw_version);
 561	POPULATE_UCODE_INFO(vf2pf_info, AMD_SRIOV_UCODE_ID_MEC2,     adev->gfx.mec2_fw_version);
 562	POPULATE_UCODE_INFO(vf2pf_info, AMD_SRIOV_UCODE_ID_SOS,      adev->psp.sos.fw_version);
 563	POPULATE_UCODE_INFO(vf2pf_info, AMD_SRIOV_UCODE_ID_ASD,
 564			    adev->psp.asd_context.bin_desc.fw_version);
 565	POPULATE_UCODE_INFO(vf2pf_info, AMD_SRIOV_UCODE_ID_TA_RAS,
 566			    adev->psp.ras_context.context.bin_desc.fw_version);
 567	POPULATE_UCODE_INFO(vf2pf_info, AMD_SRIOV_UCODE_ID_TA_XGMI,
 568			    adev->psp.xgmi_context.context.bin_desc.fw_version);
 569	POPULATE_UCODE_INFO(vf2pf_info, AMD_SRIOV_UCODE_ID_SMC,      adev->pm.fw_version);
 570	POPULATE_UCODE_INFO(vf2pf_info, AMD_SRIOV_UCODE_ID_SDMA,     adev->sdma.instance[0].fw_version);
 571	POPULATE_UCODE_INFO(vf2pf_info, AMD_SRIOV_UCODE_ID_SDMA2,    adev->sdma.instance[1].fw_version);
 572	POPULATE_UCODE_INFO(vf2pf_info, AMD_SRIOV_UCODE_ID_VCN,      adev->vcn.fw_version);
 573	POPULATE_UCODE_INFO(vf2pf_info, AMD_SRIOV_UCODE_ID_DMCU,     adev->dm.dmcu_fw_version);
 574}
 575
 576static int amdgpu_virt_write_vf2pf_data(struct amdgpu_device *adev)
 577{
 578	struct amd_sriov_msg_vf2pf_info *vf2pf_info;
 579
 580	vf2pf_info = (struct amd_sriov_msg_vf2pf_info *) adev->virt.fw_reserve.p_vf2pf;
 581
 582	if (adev->virt.fw_reserve.p_vf2pf == NULL)
 583		return -EINVAL;
 584
 585	memset(vf2pf_info, 0, sizeof(struct amd_sriov_msg_vf2pf_info));
 586
 587	vf2pf_info->header.size = sizeof(struct amd_sriov_msg_vf2pf_info);
 588	vf2pf_info->header.version = AMD_SRIOV_MSG_FW_VRAM_VF2PF_VER;
 589
 590#ifdef MODULE
 591	if (THIS_MODULE->version != NULL)
 592		strcpy(vf2pf_info->driver_version, THIS_MODULE->version);
 593	else
 594#endif
 595		strcpy(vf2pf_info->driver_version, "N/A");
 596
 597	vf2pf_info->pf2vf_version_required = 0; // no requirement, guest understands all
 598	vf2pf_info->driver_cert = 0;
 599	vf2pf_info->os_info.all = 0;
 600
 601	vf2pf_info->fb_usage =
 602		ttm_resource_manager_usage(&adev->mman.vram_mgr.manager) >> 20;
 603	vf2pf_info->fb_vis_usage =
 604		amdgpu_vram_mgr_vis_usage(&adev->mman.vram_mgr) >> 20;
 605	vf2pf_info->fb_size = adev->gmc.real_vram_size >> 20;
 606	vf2pf_info->fb_vis_size = adev->gmc.visible_vram_size >> 20;
 607
 608	amdgpu_virt_populate_vf2pf_ucode_info(adev);
 609
 610	/* TODO: read dynamic info */
 611	vf2pf_info->gfx_usage = 0;
 612	vf2pf_info->compute_usage = 0;
 613	vf2pf_info->encode_usage = 0;
 614	vf2pf_info->decode_usage = 0;
 615
 616	vf2pf_info->dummy_page_addr = (uint64_t)adev->dummy_page_addr;
 617	vf2pf_info->mes_info_addr = (uint64_t)adev->mes.resource_1_gpu_addr;
 618
 619	if (adev->mes.resource_1) {
 620		vf2pf_info->mes_info_size = adev->mes.resource_1->tbo.base.size;
 621	}
 622	vf2pf_info->checksum =
 623		amd_sriov_msg_checksum(
 624		vf2pf_info, sizeof(*vf2pf_info), 0, 0);
 625
 626	return 0;
 627}
 628
 629static void amdgpu_virt_update_vf2pf_work_item(struct work_struct *work)
 630{
 631	struct amdgpu_device *adev = container_of(work, struct amdgpu_device, virt.vf2pf_work.work);
 632	int ret;
 633
 634	ret = amdgpu_virt_read_pf2vf_data(adev);
 635	if (ret) {
 636		adev->virt.vf2pf_update_retry_cnt++;
 637
 638		if ((amdgpu_virt_rcvd_ras_interrupt(adev) ||
 639			adev->virt.vf2pf_update_retry_cnt >= AMDGPU_VF2PF_UPDATE_MAX_RETRY_LIMIT) &&
 640			amdgpu_sriov_runtime(adev)) {
 641
 642			amdgpu_ras_set_fed(adev, true);
 643			if (amdgpu_reset_domain_schedule(adev->reset_domain,
 644							&adev->kfd.reset_work))
 645				return;
 646			else
 647				dev_err(adev->dev, "Failed to queue work! at %s", __func__);
 648		}
 649
 650		goto out;
 651	}
 652
 653	adev->virt.vf2pf_update_retry_cnt = 0;
 654	amdgpu_virt_write_vf2pf_data(adev);
 655
 656out:
 657	schedule_delayed_work(&(adev->virt.vf2pf_work), adev->virt.vf2pf_update_interval_ms);
 658}
 659
 660void amdgpu_virt_fini_data_exchange(struct amdgpu_device *adev)
 661{
 662	if (adev->virt.vf2pf_update_interval_ms != 0) {
 663		DRM_INFO("clean up the vf2pf work item\n");
 664		cancel_delayed_work_sync(&adev->virt.vf2pf_work);
 665		adev->virt.vf2pf_update_interval_ms = 0;
 666	}
 667}
 668
 669void amdgpu_virt_init_data_exchange(struct amdgpu_device *adev)
 670{
 671	adev->virt.fw_reserve.p_pf2vf = NULL;
 672	adev->virt.fw_reserve.p_vf2pf = NULL;
 673	adev->virt.vf2pf_update_interval_ms = 0;
 674	adev->virt.vf2pf_update_retry_cnt = 0;
 675
 676	if (adev->mman.fw_vram_usage_va && adev->mman.drv_vram_usage_va) {
 677		DRM_WARN("Currently fw_vram and drv_vram should not have values at the same time!");
 678	} else if (adev->mman.fw_vram_usage_va || adev->mman.drv_vram_usage_va) {
 679		/* go through this logic in ip_init and reset to init workqueue*/
 680		amdgpu_virt_exchange_data(adev);
 681
 682		INIT_DELAYED_WORK(&adev->virt.vf2pf_work, amdgpu_virt_update_vf2pf_work_item);
 683		schedule_delayed_work(&(adev->virt.vf2pf_work), msecs_to_jiffies(adev->virt.vf2pf_update_interval_ms));
 684	} else if (adev->bios != NULL) {
 685		/* got through this logic in early init stage to get necessary flags, e.g. rlcg_acc related*/
 686		adev->virt.fw_reserve.p_pf2vf =
 687			(struct amd_sriov_msg_pf2vf_info_header *)
 688			(adev->bios + (AMD_SRIOV_MSG_PF2VF_OFFSET_KB << 10));
 689
 690		amdgpu_virt_read_pf2vf_data(adev);
 691	}
 692}
 693
 694
 695void amdgpu_virt_exchange_data(struct amdgpu_device *adev)
 696{
 697	uint64_t bp_block_offset = 0;
 698	uint32_t bp_block_size = 0;
 699	struct amd_sriov_msg_pf2vf_info *pf2vf_v2 = NULL;
 700
 701	if (adev->mman.fw_vram_usage_va || adev->mman.drv_vram_usage_va) {
 702		if (adev->mman.fw_vram_usage_va) {
 703			adev->virt.fw_reserve.p_pf2vf =
 704				(struct amd_sriov_msg_pf2vf_info_header *)
 705				(adev->mman.fw_vram_usage_va + (AMD_SRIOV_MSG_PF2VF_OFFSET_KB << 10));
 706			adev->virt.fw_reserve.p_vf2pf =
 707				(struct amd_sriov_msg_vf2pf_info_header *)
 708				(adev->mman.fw_vram_usage_va + (AMD_SRIOV_MSG_VF2PF_OFFSET_KB << 10));
 709			adev->virt.fw_reserve.ras_telemetry =
 710				(adev->mman.fw_vram_usage_va + (AMD_SRIOV_MSG_RAS_TELEMETRY_OFFSET_KB << 10));
 711		} else if (adev->mman.drv_vram_usage_va) {
 712			adev->virt.fw_reserve.p_pf2vf =
 713				(struct amd_sriov_msg_pf2vf_info_header *)
 714				(adev->mman.drv_vram_usage_va + (AMD_SRIOV_MSG_PF2VF_OFFSET_KB << 10));
 715			adev->virt.fw_reserve.p_vf2pf =
 716				(struct amd_sriov_msg_vf2pf_info_header *)
 717				(adev->mman.drv_vram_usage_va + (AMD_SRIOV_MSG_VF2PF_OFFSET_KB << 10));
 718			adev->virt.fw_reserve.ras_telemetry =
 719				(adev->mman.drv_vram_usage_va + (AMD_SRIOV_MSG_RAS_TELEMETRY_OFFSET_KB << 10));
 720		}
 721
 722		amdgpu_virt_read_pf2vf_data(adev);
 723		amdgpu_virt_write_vf2pf_data(adev);
 724
 725		/* bad page handling for version 2 */
 726		if (adev->virt.fw_reserve.p_pf2vf->version == 2) {
 727			pf2vf_v2 = (struct amd_sriov_msg_pf2vf_info *)adev->virt.fw_reserve.p_pf2vf;
 728
 729			bp_block_offset = ((uint64_t)pf2vf_v2->bp_block_offset_low & 0xFFFFFFFF) |
 730				((((uint64_t)pf2vf_v2->bp_block_offset_high) << 32) & 0xFFFFFFFF00000000);
 731			bp_block_size = pf2vf_v2->bp_block_size;
 732
 733			if (bp_block_size && !adev->virt.ras_init_done)
 734				amdgpu_virt_init_ras_err_handler_data(adev);
 735
 736			if (adev->virt.ras_init_done)
 737				amdgpu_virt_add_bad_page(adev, bp_block_offset, bp_block_size);
 738		}
 739	}
 740}
 741
 742void amdgpu_detect_virtualization(struct amdgpu_device *adev)
 743{
 744	uint32_t reg;
 745
 746	switch (adev->asic_type) {
 747	case CHIP_TONGA:
 748	case CHIP_FIJI:
 749		reg = RREG32(mmBIF_IOV_FUNC_IDENTIFIER);
 750		break;
 751	case CHIP_VEGA10:
 752	case CHIP_VEGA20:
 753	case CHIP_NAVI10:
 754	case CHIP_NAVI12:
 755	case CHIP_SIENNA_CICHLID:
 756	case CHIP_ARCTURUS:
 757	case CHIP_ALDEBARAN:
 758	case CHIP_IP_DISCOVERY:
 759		reg = RREG32(mmRCC_IOV_FUNC_IDENTIFIER);
 760		break;
 761	default: /* other chip doesn't support SRIOV */
 762		reg = 0;
 763		break;
 764	}
 765
 766	if (reg & 1)
 767		adev->virt.caps |= AMDGPU_SRIOV_CAPS_IS_VF;
 768
 769	if (reg & 0x80000000)
 770		adev->virt.caps |= AMDGPU_SRIOV_CAPS_ENABLE_IOV;
 771
 772	if (!reg) {
 773		/* passthrough mode exclus sriov mod */
 774		if (is_virtual_machine() && !xen_initial_domain())
 775			adev->virt.caps |= AMDGPU_PASSTHROUGH_MODE;
 776	}
 777
 778	/* we have the ability to check now */
 779	if (amdgpu_sriov_vf(adev)) {
 780		switch (adev->asic_type) {
 781		case CHIP_TONGA:
 782		case CHIP_FIJI:
 783			vi_set_virt_ops(adev);
 784			break;
 785		case CHIP_VEGA10:
 786			soc15_set_virt_ops(adev);
 787#ifdef CONFIG_X86
 788			/* not send GPU_INIT_DATA with MS_HYPERV*/
 789			if (!hypervisor_is_type(X86_HYPER_MS_HYPERV))
 790#endif
 791				/* send a dummy GPU_INIT_DATA request to host on vega10 */
 792				amdgpu_virt_request_init_data(adev);
 793			break;
 794		case CHIP_VEGA20:
 795		case CHIP_ARCTURUS:
 796		case CHIP_ALDEBARAN:
 797			soc15_set_virt_ops(adev);
 798			break;
 799		case CHIP_NAVI10:
 800		case CHIP_NAVI12:
 801		case CHIP_SIENNA_CICHLID:
 802		case CHIP_IP_DISCOVERY:
 803			nv_set_virt_ops(adev);
 804			/* try send GPU_INIT_DATA request to host */
 805			amdgpu_virt_request_init_data(adev);
 806			break;
 807		default: /* other chip doesn't support SRIOV */
 808			DRM_ERROR("Unknown asic type: %d!\n", adev->asic_type);
 809			break;
 810		}
 811	}
 812}
 813
 814static bool amdgpu_virt_access_debugfs_is_mmio(struct amdgpu_device *adev)
 815{
 816	return amdgpu_sriov_is_debug(adev) ? true : false;
 817}
 818
 819static bool amdgpu_virt_access_debugfs_is_kiq(struct amdgpu_device *adev)
 820{
 821	return amdgpu_sriov_is_normal(adev) ? true : false;
 822}
 823
 824int amdgpu_virt_enable_access_debugfs(struct amdgpu_device *adev)
 825{
 826	if (!amdgpu_sriov_vf(adev) ||
 827	    amdgpu_virt_access_debugfs_is_kiq(adev))
 828		return 0;
 829
 830	if (amdgpu_virt_access_debugfs_is_mmio(adev))
 831		adev->virt.caps &= ~AMDGPU_SRIOV_CAPS_RUNTIME;
 832	else
 833		return -EPERM;
 834
 835	return 0;
 836}
 837
 838void amdgpu_virt_disable_access_debugfs(struct amdgpu_device *adev)
 839{
 840	if (amdgpu_sriov_vf(adev))
 841		adev->virt.caps |= AMDGPU_SRIOV_CAPS_RUNTIME;
 842}
 843
 844enum amdgpu_sriov_vf_mode amdgpu_virt_get_sriov_vf_mode(struct amdgpu_device *adev)
 845{
 846	enum amdgpu_sriov_vf_mode mode;
 847
 848	if (amdgpu_sriov_vf(adev)) {
 849		if (amdgpu_sriov_is_pp_one_vf(adev))
 850			mode = SRIOV_VF_MODE_ONE_VF;
 851		else
 852			mode = SRIOV_VF_MODE_MULTI_VF;
 853	} else {
 854		mode = SRIOV_VF_MODE_BARE_METAL;
 855	}
 856
 857	return mode;
 858}
 859
 860void amdgpu_virt_pre_reset(struct amdgpu_device *adev)
 861{
 862	/* stop the data exchange thread */
 863	amdgpu_virt_fini_data_exchange(adev);
 864	amdgpu_dpm_set_mp1_state(adev, PP_MP1_STATE_FLR);
 865}
 866
 867void amdgpu_virt_post_reset(struct amdgpu_device *adev)
 868{
 869	if (amdgpu_ip_version(adev, GC_HWIP, 0) == IP_VERSION(11, 0, 3)) {
 870		/* force set to GFXOFF state after reset,
 871		 * to avoid some invalid operation before GC enable
 872		 */
 873		adev->gfx.is_poweron = false;
 874	}
 875
 876	adev->mes.ring[0].sched.ready = false;
 877}
 878
 879bool amdgpu_virt_fw_load_skip_check(struct amdgpu_device *adev, uint32_t ucode_id)
 880{
 881	switch (amdgpu_ip_version(adev, MP0_HWIP, 0)) {
 882	case IP_VERSION(13, 0, 0):
 883		/* no vf autoload, white list */
 884		if (ucode_id == AMDGPU_UCODE_ID_VCN1 ||
 885		    ucode_id == AMDGPU_UCODE_ID_VCN)
 886			return false;
 887		else
 888			return true;
 889	case IP_VERSION(11, 0, 9):
 890	case IP_VERSION(11, 0, 7):
 891		/* black list for CHIP_NAVI12 and CHIP_SIENNA_CICHLID */
 892		if (ucode_id == AMDGPU_UCODE_ID_RLC_G
 893		    || ucode_id == AMDGPU_UCODE_ID_RLC_RESTORE_LIST_CNTL
 894		    || ucode_id == AMDGPU_UCODE_ID_RLC_RESTORE_LIST_GPM_MEM
 895		    || ucode_id == AMDGPU_UCODE_ID_RLC_RESTORE_LIST_SRM_MEM
 896		    || ucode_id == AMDGPU_UCODE_ID_SMC)
 897			return true;
 898		else
 899			return false;
 900	case IP_VERSION(13, 0, 10):
 901		/* white list */
 902		if (ucode_id == AMDGPU_UCODE_ID_CAP
 903		|| ucode_id == AMDGPU_UCODE_ID_CP_RS64_PFP
 904		|| ucode_id == AMDGPU_UCODE_ID_CP_RS64_ME
 905		|| ucode_id == AMDGPU_UCODE_ID_CP_RS64_MEC
 906		|| ucode_id == AMDGPU_UCODE_ID_CP_RS64_PFP_P0_STACK
 907		|| ucode_id == AMDGPU_UCODE_ID_CP_RS64_PFP_P1_STACK
 908		|| ucode_id == AMDGPU_UCODE_ID_CP_RS64_ME_P0_STACK
 909		|| ucode_id == AMDGPU_UCODE_ID_CP_RS64_ME_P1_STACK
 910		|| ucode_id == AMDGPU_UCODE_ID_CP_RS64_MEC_P0_STACK
 911		|| ucode_id == AMDGPU_UCODE_ID_CP_RS64_MEC_P1_STACK
 912		|| ucode_id == AMDGPU_UCODE_ID_CP_RS64_MEC_P2_STACK
 913		|| ucode_id == AMDGPU_UCODE_ID_CP_RS64_MEC_P3_STACK
 914		|| ucode_id == AMDGPU_UCODE_ID_CP_MES
 915		|| ucode_id == AMDGPU_UCODE_ID_CP_MES_DATA
 916		|| ucode_id == AMDGPU_UCODE_ID_CP_MES1
 917		|| ucode_id == AMDGPU_UCODE_ID_CP_MES1_DATA
 918		|| ucode_id == AMDGPU_UCODE_ID_VCN1
 919		|| ucode_id == AMDGPU_UCODE_ID_VCN)
 920			return false;
 921		else
 922			return true;
 923	default:
 924		/* lagacy black list */
 925		if (ucode_id == AMDGPU_UCODE_ID_SDMA0
 926		    || ucode_id == AMDGPU_UCODE_ID_SDMA1
 927		    || ucode_id == AMDGPU_UCODE_ID_SDMA2
 928		    || ucode_id == AMDGPU_UCODE_ID_SDMA3
 929		    || ucode_id == AMDGPU_UCODE_ID_SDMA4
 930		    || ucode_id == AMDGPU_UCODE_ID_SDMA5
 931		    || ucode_id == AMDGPU_UCODE_ID_SDMA6
 932		    || ucode_id == AMDGPU_UCODE_ID_SDMA7
 933		    || ucode_id == AMDGPU_UCODE_ID_RLC_G
 934		    || ucode_id == AMDGPU_UCODE_ID_RLC_RESTORE_LIST_CNTL
 935		    || ucode_id == AMDGPU_UCODE_ID_RLC_RESTORE_LIST_GPM_MEM
 936		    || ucode_id == AMDGPU_UCODE_ID_RLC_RESTORE_LIST_SRM_MEM
 937		    || ucode_id == AMDGPU_UCODE_ID_SMC)
 938			return true;
 939		else
 940			return false;
 941	}
 942}
 943
 944void amdgpu_virt_update_sriov_video_codec(struct amdgpu_device *adev,
 945			struct amdgpu_video_codec_info *encode, uint32_t encode_array_size,
 946			struct amdgpu_video_codec_info *decode, uint32_t decode_array_size)
 947{
 948	uint32_t i;
 949
 950	if (!adev->virt.is_mm_bw_enabled)
 951		return;
 952
 953	if (encode) {
 954		for (i = 0; i < encode_array_size; i++) {
 955			encode[i].max_width = adev->virt.encode_max_dimension_pixels;
 956			encode[i].max_pixels_per_frame = adev->virt.encode_max_frame_pixels;
 957			if (encode[i].max_width > 0)
 958				encode[i].max_height = encode[i].max_pixels_per_frame / encode[i].max_width;
 959			else
 960				encode[i].max_height = 0;
 961		}
 962	}
 963
 964	if (decode) {
 965		for (i = 0; i < decode_array_size; i++) {
 966			decode[i].max_width = adev->virt.decode_max_dimension_pixels;
 967			decode[i].max_pixels_per_frame = adev->virt.decode_max_frame_pixels;
 968			if (decode[i].max_width > 0)
 969				decode[i].max_height = decode[i].max_pixels_per_frame / decode[i].max_width;
 970			else
 971				decode[i].max_height = 0;
 972		}
 973	}
 974}
 975
 976bool amdgpu_virt_get_rlcg_reg_access_flag(struct amdgpu_device *adev,
 977						 u32 acc_flags, u32 hwip,
 978						 bool write, u32 *rlcg_flag)
 979{
 980	bool ret = false;
 981
 982	switch (hwip) {
 983	case GC_HWIP:
 984		if (amdgpu_sriov_reg_indirect_gc(adev)) {
 985			*rlcg_flag =
 986				write ? AMDGPU_RLCG_GC_WRITE : AMDGPU_RLCG_GC_READ;
 987			ret = true;
 988		/* only in new version, AMDGPU_REGS_NO_KIQ and
 989		 * AMDGPU_REGS_RLC are enabled simultaneously */
 990		} else if ((acc_flags & AMDGPU_REGS_RLC) &&
 991				!(acc_flags & AMDGPU_REGS_NO_KIQ) && write) {
 992			*rlcg_flag = AMDGPU_RLCG_GC_WRITE_LEGACY;
 993			ret = true;
 994		}
 995		break;
 996	case MMHUB_HWIP:
 997		if (amdgpu_sriov_reg_indirect_mmhub(adev) &&
 998		    (acc_flags & AMDGPU_REGS_RLC) && write) {
 999			*rlcg_flag = AMDGPU_RLCG_MMHUB_WRITE;
1000			ret = true;
1001		}
1002		break;
1003	default:
1004		break;
1005	}
1006	return ret;
1007}
1008
1009u32 amdgpu_virt_rlcg_reg_rw(struct amdgpu_device *adev, u32 offset, u32 v, u32 flag, u32 xcc_id)
1010{
1011	struct amdgpu_rlcg_reg_access_ctrl *reg_access_ctrl;
1012	uint32_t timeout = 50000;
1013	uint32_t i, tmp;
1014	uint32_t ret = 0;
1015	void *scratch_reg0;
1016	void *scratch_reg1;
1017	void *scratch_reg2;
1018	void *scratch_reg3;
1019	void *spare_int;
1020
1021	if (!adev->gfx.rlc.rlcg_reg_access_supported) {
1022		dev_err(adev->dev,
1023			"indirect registers access through rlcg is not available\n");
1024		return 0;
1025	}
1026
1027	if (adev->gfx.xcc_mask && (((1 << xcc_id) & adev->gfx.xcc_mask) == 0)) {
1028		dev_err(adev->dev, "invalid xcc\n");
1029		return 0;
1030	}
1031
1032	if (amdgpu_device_skip_hw_access(adev))
1033		return 0;
1034
1035	reg_access_ctrl = &adev->gfx.rlc.reg_access_ctrl[xcc_id];
1036	scratch_reg0 = (void __iomem *)adev->rmmio + 4 * reg_access_ctrl->scratch_reg0;
1037	scratch_reg1 = (void __iomem *)adev->rmmio + 4 * reg_access_ctrl->scratch_reg1;
1038	scratch_reg2 = (void __iomem *)adev->rmmio + 4 * reg_access_ctrl->scratch_reg2;
1039	scratch_reg3 = (void __iomem *)adev->rmmio + 4 * reg_access_ctrl->scratch_reg3;
1040
1041	mutex_lock(&adev->virt.rlcg_reg_lock);
1042
1043	if (reg_access_ctrl->spare_int)
1044		spare_int = (void __iomem *)adev->rmmio + 4 * reg_access_ctrl->spare_int;
1045
1046	if (offset == reg_access_ctrl->grbm_cntl) {
1047		/* if the target reg offset is grbm_cntl, write to scratch_reg2 */
1048		writel(v, scratch_reg2);
1049		if (flag == AMDGPU_RLCG_GC_WRITE_LEGACY)
1050			writel(v, ((void __iomem *)adev->rmmio) + (offset * 4));
1051	} else if (offset == reg_access_ctrl->grbm_idx) {
1052		/* if the target reg offset is grbm_idx, write to scratch_reg3 */
1053		writel(v, scratch_reg3);
1054		if (flag == AMDGPU_RLCG_GC_WRITE_LEGACY)
1055			writel(v, ((void __iomem *)adev->rmmio) + (offset * 4));
1056	} else {
1057		/*
1058		 * SCRATCH_REG0 	= read/write value
1059		 * SCRATCH_REG1[30:28]	= command
1060		 * SCRATCH_REG1[19:0]	= address in dword
1061		 * SCRATCH_REG1[27:24]	= Error reporting
1062		 */
1063		writel(v, scratch_reg0);
1064		writel((offset | flag), scratch_reg1);
1065		if (reg_access_ctrl->spare_int)
1066			writel(1, spare_int);
1067
1068		for (i = 0; i < timeout; i++) {
1069			tmp = readl(scratch_reg1);
1070			if (!(tmp & AMDGPU_RLCG_SCRATCH1_ADDRESS_MASK))
1071				break;
1072			udelay(10);
1073		}
1074
1075		tmp = readl(scratch_reg1);
1076		if (i >= timeout || (tmp & AMDGPU_RLCG_SCRATCH1_ERROR_MASK) != 0) {
1077			if (amdgpu_sriov_rlcg_error_report_enabled(adev)) {
1078				if (tmp & AMDGPU_RLCG_VFGATE_DISABLED) {
1079					dev_err(adev->dev,
1080						"vfgate is disabled, rlcg failed to program reg: 0x%05x\n", offset);
1081				} else if (tmp & AMDGPU_RLCG_WRONG_OPERATION_TYPE) {
1082					dev_err(adev->dev,
1083						"wrong operation type, rlcg failed to program reg: 0x%05x\n", offset);
1084				} else if (tmp & AMDGPU_RLCG_REG_NOT_IN_RANGE) {
1085					dev_err(adev->dev,
1086						"register is not in range, rlcg failed to program reg: 0x%05x\n", offset);
1087				} else {
1088					dev_err(adev->dev,
1089						"unknown error type, rlcg failed to program reg: 0x%05x\n", offset);
1090				}
1091			} else {
1092				dev_err(adev->dev,
1093					"timeout: rlcg faled to program reg: 0x%05x\n", offset);
1094			}
1095		}
1096	}
1097
1098	ret = readl(scratch_reg0);
1099
1100	mutex_unlock(&adev->virt.rlcg_reg_lock);
1101
1102	return ret;
1103}
1104
1105void amdgpu_sriov_wreg(struct amdgpu_device *adev,
1106		       u32 offset, u32 value,
1107		       u32 acc_flags, u32 hwip, u32 xcc_id)
1108{
1109	u32 rlcg_flag;
1110
1111	if (amdgpu_device_skip_hw_access(adev))
1112		return;
1113
1114	if (!amdgpu_sriov_runtime(adev) &&
1115		amdgpu_virt_get_rlcg_reg_access_flag(adev, acc_flags, hwip, true, &rlcg_flag)) {
1116		amdgpu_virt_rlcg_reg_rw(adev, offset, value, rlcg_flag, xcc_id);
1117		return;
1118	}
1119
1120	if (acc_flags & AMDGPU_REGS_NO_KIQ)
1121		WREG32_NO_KIQ(offset, value);
1122	else
1123		WREG32(offset, value);
1124}
1125
1126u32 amdgpu_sriov_rreg(struct amdgpu_device *adev,
1127		      u32 offset, u32 acc_flags, u32 hwip, u32 xcc_id)
1128{
1129	u32 rlcg_flag;
1130
1131	if (amdgpu_device_skip_hw_access(adev))
1132		return 0;
1133
1134	if (!amdgpu_sriov_runtime(adev) &&
1135		amdgpu_virt_get_rlcg_reg_access_flag(adev, acc_flags, hwip, false, &rlcg_flag))
1136		return amdgpu_virt_rlcg_reg_rw(adev, offset, 0, rlcg_flag, xcc_id);
1137
1138	if (acc_flags & AMDGPU_REGS_NO_KIQ)
1139		return RREG32_NO_KIQ(offset);
1140	else
1141		return RREG32(offset);
1142}
1143
1144bool amdgpu_sriov_xnack_support(struct amdgpu_device *adev)
1145{
1146	bool xnack_mode = true;
1147
1148	if (amdgpu_sriov_vf(adev) &&
1149	    amdgpu_ip_version(adev, GC_HWIP, 0) == IP_VERSION(9, 4, 2))
1150		xnack_mode = false;
1151
1152	return xnack_mode;
1153}
1154
1155bool amdgpu_virt_get_ras_capability(struct amdgpu_device *adev)
1156{
1157	struct amdgpu_ras *con = amdgpu_ras_get_context(adev);
1158
1159	if (!amdgpu_sriov_ras_caps_en(adev))
1160		return false;
1161
1162	if (adev->virt.ras_en_caps.bits.block_umc)
1163		adev->ras_hw_enabled |= BIT(AMDGPU_RAS_BLOCK__UMC);
1164	if (adev->virt.ras_en_caps.bits.block_sdma)
1165		adev->ras_hw_enabled |= BIT(AMDGPU_RAS_BLOCK__SDMA);
1166	if (adev->virt.ras_en_caps.bits.block_gfx)
1167		adev->ras_hw_enabled |= BIT(AMDGPU_RAS_BLOCK__GFX);
1168	if (adev->virt.ras_en_caps.bits.block_mmhub)
1169		adev->ras_hw_enabled |= BIT(AMDGPU_RAS_BLOCK__MMHUB);
1170	if (adev->virt.ras_en_caps.bits.block_athub)
1171		adev->ras_hw_enabled |= BIT(AMDGPU_RAS_BLOCK__ATHUB);
1172	if (adev->virt.ras_en_caps.bits.block_pcie_bif)
1173		adev->ras_hw_enabled |= BIT(AMDGPU_RAS_BLOCK__PCIE_BIF);
1174	if (adev->virt.ras_en_caps.bits.block_hdp)
1175		adev->ras_hw_enabled |= BIT(AMDGPU_RAS_BLOCK__HDP);
1176	if (adev->virt.ras_en_caps.bits.block_xgmi_wafl)
1177		adev->ras_hw_enabled |= BIT(AMDGPU_RAS_BLOCK__XGMI_WAFL);
1178	if (adev->virt.ras_en_caps.bits.block_df)
1179		adev->ras_hw_enabled |= BIT(AMDGPU_RAS_BLOCK__DF);
1180	if (adev->virt.ras_en_caps.bits.block_smn)
1181		adev->ras_hw_enabled |= BIT(AMDGPU_RAS_BLOCK__SMN);
1182	if (adev->virt.ras_en_caps.bits.block_sem)
1183		adev->ras_hw_enabled |= BIT(AMDGPU_RAS_BLOCK__SEM);
1184	if (adev->virt.ras_en_caps.bits.block_mp0)
1185		adev->ras_hw_enabled |= BIT(AMDGPU_RAS_BLOCK__MP0);
1186	if (adev->virt.ras_en_caps.bits.block_mp1)
1187		adev->ras_hw_enabled |= BIT(AMDGPU_RAS_BLOCK__MP1);
1188	if (adev->virt.ras_en_caps.bits.block_fuse)
1189		adev->ras_hw_enabled |= BIT(AMDGPU_RAS_BLOCK__FUSE);
1190	if (adev->virt.ras_en_caps.bits.block_mca)
1191		adev->ras_hw_enabled |= BIT(AMDGPU_RAS_BLOCK__MCA);
1192	if (adev->virt.ras_en_caps.bits.block_vcn)
1193		adev->ras_hw_enabled |= BIT(AMDGPU_RAS_BLOCK__VCN);
1194	if (adev->virt.ras_en_caps.bits.block_jpeg)
1195		adev->ras_hw_enabled |= BIT(AMDGPU_RAS_BLOCK__JPEG);
1196	if (adev->virt.ras_en_caps.bits.block_ih)
1197		adev->ras_hw_enabled |= BIT(AMDGPU_RAS_BLOCK__IH);
1198	if (adev->virt.ras_en_caps.bits.block_mpio)
1199		adev->ras_hw_enabled |= BIT(AMDGPU_RAS_BLOCK__MPIO);
1200
1201	if (adev->virt.ras_en_caps.bits.poison_propogation_mode)
1202		con->poison_supported = true; /* Poison is handled by host */
1203
1204	return true;
1205}
1206
1207static inline enum amd_sriov_ras_telemetry_gpu_block
1208amdgpu_ras_block_to_sriov(struct amdgpu_device *adev, enum amdgpu_ras_block block) {
1209	switch (block) {
1210	case AMDGPU_RAS_BLOCK__UMC:
1211		return RAS_TELEMETRY_GPU_BLOCK_UMC;
1212	case AMDGPU_RAS_BLOCK__SDMA:
1213		return RAS_TELEMETRY_GPU_BLOCK_SDMA;
1214	case AMDGPU_RAS_BLOCK__GFX:
1215		return RAS_TELEMETRY_GPU_BLOCK_GFX;
1216	case AMDGPU_RAS_BLOCK__MMHUB:
1217		return RAS_TELEMETRY_GPU_BLOCK_MMHUB;
1218	case AMDGPU_RAS_BLOCK__ATHUB:
1219		return RAS_TELEMETRY_GPU_BLOCK_ATHUB;
1220	case AMDGPU_RAS_BLOCK__PCIE_BIF:
1221		return RAS_TELEMETRY_GPU_BLOCK_PCIE_BIF;
1222	case AMDGPU_RAS_BLOCK__HDP:
1223		return RAS_TELEMETRY_GPU_BLOCK_HDP;
1224	case AMDGPU_RAS_BLOCK__XGMI_WAFL:
1225		return RAS_TELEMETRY_GPU_BLOCK_XGMI_WAFL;
1226	case AMDGPU_RAS_BLOCK__DF:
1227		return RAS_TELEMETRY_GPU_BLOCK_DF;
1228	case AMDGPU_RAS_BLOCK__SMN:
1229		return RAS_TELEMETRY_GPU_BLOCK_SMN;
1230	case AMDGPU_RAS_BLOCK__SEM:
1231		return RAS_TELEMETRY_GPU_BLOCK_SEM;
1232	case AMDGPU_RAS_BLOCK__MP0:
1233		return RAS_TELEMETRY_GPU_BLOCK_MP0;
1234	case AMDGPU_RAS_BLOCK__MP1:
1235		return RAS_TELEMETRY_GPU_BLOCK_MP1;
1236	case AMDGPU_RAS_BLOCK__FUSE:
1237		return RAS_TELEMETRY_GPU_BLOCK_FUSE;
1238	case AMDGPU_RAS_BLOCK__MCA:
1239		return RAS_TELEMETRY_GPU_BLOCK_MCA;
1240	case AMDGPU_RAS_BLOCK__VCN:
1241		return RAS_TELEMETRY_GPU_BLOCK_VCN;
1242	case AMDGPU_RAS_BLOCK__JPEG:
1243		return RAS_TELEMETRY_GPU_BLOCK_JPEG;
1244	case AMDGPU_RAS_BLOCK__IH:
1245		return RAS_TELEMETRY_GPU_BLOCK_IH;
1246	case AMDGPU_RAS_BLOCK__MPIO:
1247		return RAS_TELEMETRY_GPU_BLOCK_MPIO;
1248	default:
1249		dev_err(adev->dev, "Unsupported SRIOV RAS telemetry block 0x%x\n", block);
1250		return RAS_TELEMETRY_GPU_BLOCK_COUNT;
1251	}
1252}
1253
1254static int amdgpu_virt_cache_host_error_counts(struct amdgpu_device *adev,
1255					       struct amdsriov_ras_telemetry *host_telemetry)
1256{
1257	struct amd_sriov_ras_telemetry_error_count *tmp = NULL;
1258	uint32_t checksum, used_size;
1259
1260	checksum = host_telemetry->header.checksum;
1261	used_size = host_telemetry->header.used_size;
1262
1263	if (used_size > (AMD_SRIOV_RAS_TELEMETRY_SIZE_KB << 10))
1264		return 0;
1265
1266	tmp = kmalloc(used_size, GFP_KERNEL);
1267	if (!tmp)
1268		return -ENOMEM;
1269
1270	memcpy(tmp, &host_telemetry->body.error_count, used_size);
1271
1272	if (checksum != amd_sriov_msg_checksum(tmp, used_size, 0, 0))
1273		goto out;
1274
1275	memcpy(&adev->virt.count_cache, tmp,
1276	       min(used_size, sizeof(adev->virt.count_cache)));
1277out:
1278	kfree(tmp);
1279
1280	return 0;
1281}
1282
1283static int amdgpu_virt_req_ras_err_count_internal(struct amdgpu_device *adev, bool force_update)
1284{
1285	struct amdgpu_virt *virt = &adev->virt;
1286
1287	/* Host allows 15 ras telemetry requests per 60 seconds. Afterwhich, the Host
1288	 * will ignore incoming guest messages. Ratelimit the guest messages to
1289	 * prevent guest self DOS.
1290	 */
1291	if (__ratelimit(&adev->virt.ras_telemetry_rs) || force_update) {
1292		if (!virt->ops->req_ras_err_count(adev))
1293			amdgpu_virt_cache_host_error_counts(adev,
1294				adev->virt.fw_reserve.ras_telemetry);
1295	}
1296
1297	return 0;
1298}
1299
1300/* Bypass ACA interface and query ECC counts directly from host */
1301int amdgpu_virt_req_ras_err_count(struct amdgpu_device *adev, enum amdgpu_ras_block block,
1302				  struct ras_err_data *err_data)
1303{
1304	enum amd_sriov_ras_telemetry_gpu_block sriov_block;
1305
1306	sriov_block = amdgpu_ras_block_to_sriov(adev, block);
1307
1308	if (sriov_block >= RAS_TELEMETRY_GPU_BLOCK_COUNT ||
1309	    !amdgpu_sriov_ras_telemetry_block_en(adev, sriov_block))
1310		return -EOPNOTSUPP;
1311
1312	/* Host Access may be lost during reset, just return last cached data. */
1313	if (down_read_trylock(&adev->reset_domain->sem)) {
1314		amdgpu_virt_req_ras_err_count_internal(adev, false);
1315		up_read(&adev->reset_domain->sem);
1316	}
1317
1318	err_data->ue_count = adev->virt.count_cache.block[sriov_block].ue_count;
1319	err_data->ce_count = adev->virt.count_cache.block[sriov_block].ce_count;
1320	err_data->de_count = adev->virt.count_cache.block[sriov_block].de_count;
1321
1322	return 0;
1323}
1324
1325int amdgpu_virt_ras_telemetry_post_reset(struct amdgpu_device *adev)
1326{
1327	unsigned long ue_count, ce_count;
1328
1329	if (amdgpu_sriov_ras_telemetry_en(adev)) {
1330		amdgpu_virt_req_ras_err_count_internal(adev, true);
1331		amdgpu_ras_query_error_count(adev, &ce_count, &ue_count, NULL);
1332	}
1333
1334	return 0;
1335}