Linux Audio

Check our new training course

Loading...
v4.6
   1/*
   2 * Copyright 2008 Advanced Micro Devices, Inc.
   3 *
   4 * Permission is hereby granted, free of charge, to any person obtaining a
   5 * copy of this software and associated documentation files (the "Software"),
   6 * to deal in the Software without restriction, including without limitation
   7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
   8 * and/or sell copies of the Software, and to permit persons to whom the
   9 * Software is furnished to do so, subject to the following conditions:
  10 *
  11 * The above copyright notice and this permission notice shall be included in
  12 * all copies or substantial portions of the Software.
  13 *
  14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
  17 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
  18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
  19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
  20 * OTHER DEALINGS IN THE SOFTWARE.
  21 *
  22 * Author: Stanislaw Skowronek
  23 */
  24
  25#include <linux/module.h>
  26#include <linux/sched.h>
  27#include <linux/slab.h>
  28#include <asm/unaligned.h>
  29
 
 
  30#define ATOM_DEBUG
  31
  32#include "atom.h"
  33#include "atom-names.h"
  34#include "atom-bits.h"
  35#include "amdgpu.h"
  36
  37#define ATOM_COND_ABOVE		0
  38#define ATOM_COND_ABOVEOREQUAL	1
  39#define ATOM_COND_ALWAYS	2
  40#define ATOM_COND_BELOW		3
  41#define ATOM_COND_BELOWOREQUAL	4
  42#define ATOM_COND_EQUAL		5
  43#define ATOM_COND_NOTEQUAL	6
  44
  45#define ATOM_PORT_ATI	0
  46#define ATOM_PORT_PCI	1
  47#define ATOM_PORT_SYSIO	2
  48
  49#define ATOM_UNIT_MICROSEC	0
  50#define ATOM_UNIT_MILLISEC	1
  51
  52#define PLL_INDEX	2
  53#define PLL_DATA	3
  54
 
 
  55typedef struct {
  56	struct atom_context *ctx;
  57	uint32_t *ps, *ws;
  58	int ps_shift;
  59	uint16_t start;
  60	unsigned last_jump;
  61	unsigned long last_jump_jiffies;
  62	bool abort;
  63} atom_exec_context;
  64
  65int amdgpu_atom_debug = 0;
  66static int amdgpu_atom_execute_table_locked(struct atom_context *ctx, int index, uint32_t * params);
  67int amdgpu_atom_execute_table(struct atom_context *ctx, int index, uint32_t * params);
  68
  69static uint32_t atom_arg_mask[8] =
  70    { 0xFFFFFFFF, 0xFFFF, 0xFFFF00, 0xFFFF0000, 0xFF, 0xFF00, 0xFF0000,
  710xFF000000 };
  72static int atom_arg_shift[8] = { 0, 0, 8, 16, 0, 8, 16, 24 };
  73
  74static int atom_dst_to_src[8][4] = {
  75	/* translate destination alignment field to the source alignment encoding */
  76	{0, 0, 0, 0},
  77	{1, 2, 3, 0},
  78	{1, 2, 3, 0},
  79	{1, 2, 3, 0},
  80	{4, 5, 6, 7},
  81	{4, 5, 6, 7},
  82	{4, 5, 6, 7},
  83	{4, 5, 6, 7},
  84};
  85static int atom_def_dst[8] = { 0, 0, 1, 2, 0, 1, 2, 3 };
  86
  87static int debug_depth = 0;
  88#ifdef ATOM_DEBUG
  89static void debug_print_spaces(int n)
  90{
  91	while (n--)
  92		printk("   ");
  93}
  94
  95#define DEBUG(...) do if (amdgpu_atom_debug) { printk(KERN_DEBUG __VA_ARGS__); } while (0)
  96#define SDEBUG(...) do if (amdgpu_atom_debug) { printk(KERN_DEBUG); debug_print_spaces(debug_depth); printk(__VA_ARGS__); } while (0)
  97#else
  98#define DEBUG(...) do { } while (0)
  99#define SDEBUG(...) do { } while (0)
 100#endif
 101
 102static uint32_t atom_iio_execute(struct atom_context *ctx, int base,
 103				 uint32_t index, uint32_t data)
 104{
 105	uint32_t temp = 0xCDCDCDCD;
 106
 107	while (1)
 108		switch (CU8(base)) {
 109		case ATOM_IIO_NOP:
 110			base++;
 111			break;
 112		case ATOM_IIO_READ:
 113			temp = ctx->card->ioreg_read(ctx->card, CU16(base + 1));
 114			base += 3;
 115			break;
 116		case ATOM_IIO_WRITE:
 117			ctx->card->ioreg_write(ctx->card, CU16(base + 1), temp);
 118			base += 3;
 119			break;
 120		case ATOM_IIO_CLEAR:
 121			temp &=
 122			    ~((0xFFFFFFFF >> (32 - CU8(base + 1))) <<
 123			      CU8(base + 2));
 124			base += 3;
 125			break;
 126		case ATOM_IIO_SET:
 127			temp |=
 128			    (0xFFFFFFFF >> (32 - CU8(base + 1))) << CU8(base +
 129									2);
 130			base += 3;
 131			break;
 132		case ATOM_IIO_MOVE_INDEX:
 133			temp &=
 134			    ~((0xFFFFFFFF >> (32 - CU8(base + 1))) <<
 135			      CU8(base + 3));
 136			temp |=
 137			    ((index >> CU8(base + 2)) &
 138			     (0xFFFFFFFF >> (32 - CU8(base + 1)))) << CU8(base +
 139									  3);
 140			base += 4;
 141			break;
 142		case ATOM_IIO_MOVE_DATA:
 143			temp &=
 144			    ~((0xFFFFFFFF >> (32 - CU8(base + 1))) <<
 145			      CU8(base + 3));
 146			temp |=
 147			    ((data >> CU8(base + 2)) &
 148			     (0xFFFFFFFF >> (32 - CU8(base + 1)))) << CU8(base +
 149									  3);
 150			base += 4;
 151			break;
 152		case ATOM_IIO_MOVE_ATTR:
 153			temp &=
 154			    ~((0xFFFFFFFF >> (32 - CU8(base + 1))) <<
 155			      CU8(base + 3));
 156			temp |=
 157			    ((ctx->
 158			      io_attr >> CU8(base + 2)) & (0xFFFFFFFF >> (32 -
 159									  CU8
 160									  (base
 161									   +
 162									   1))))
 163			    << CU8(base + 3);
 164			base += 4;
 165			break;
 166		case ATOM_IIO_END:
 167			return temp;
 168		default:
 169			printk(KERN_INFO "Unknown IIO opcode.\n");
 170			return 0;
 171		}
 172}
 173
 174static uint32_t atom_get_src_int(atom_exec_context *ctx, uint8_t attr,
 175				 int *ptr, uint32_t *saved, int print)
 176{
 177	uint32_t idx, val = 0xCDCDCDCD, align, arg;
 178	struct atom_context *gctx = ctx->ctx;
 179	arg = attr & 7;
 180	align = (attr >> 3) & 7;
 181	switch (arg) {
 182	case ATOM_ARG_REG:
 183		idx = U16(*ptr);
 184		(*ptr) += 2;
 185		if (print)
 186			DEBUG("REG[0x%04X]", idx);
 187		idx += gctx->reg_block;
 188		switch (gctx->io_mode) {
 189		case ATOM_IO_MM:
 190			val = gctx->card->reg_read(gctx->card, idx);
 191			break;
 192		case ATOM_IO_PCI:
 193			printk(KERN_INFO
 194			       "PCI registers are not implemented.\n");
 195			return 0;
 196		case ATOM_IO_SYSIO:
 197			printk(KERN_INFO
 198			       "SYSIO registers are not implemented.\n");
 199			return 0;
 200		default:
 201			if (!(gctx->io_mode & 0x80)) {
 202				printk(KERN_INFO "Bad IO mode.\n");
 203				return 0;
 204			}
 205			if (!gctx->iio[gctx->io_mode & 0x7F]) {
 206				printk(KERN_INFO
 207				       "Undefined indirect IO read method %d.\n",
 208				       gctx->io_mode & 0x7F);
 209				return 0;
 210			}
 211			val =
 212			    atom_iio_execute(gctx,
 213					     gctx->iio[gctx->io_mode & 0x7F],
 214					     idx, 0);
 215		}
 216		break;
 217	case ATOM_ARG_PS:
 218		idx = U8(*ptr);
 219		(*ptr)++;
 220		/* get_unaligned_le32 avoids unaligned accesses from atombios
 221		 * tables, noticed on a DEC Alpha. */
 222		val = get_unaligned_le32((u32 *)&ctx->ps[idx]);
 223		if (print)
 224			DEBUG("PS[0x%02X,0x%04X]", idx, val);
 225		break;
 226	case ATOM_ARG_WS:
 227		idx = U8(*ptr);
 228		(*ptr)++;
 229		if (print)
 230			DEBUG("WS[0x%02X]", idx);
 231		switch (idx) {
 232		case ATOM_WS_QUOTIENT:
 233			val = gctx->divmul[0];
 234			break;
 235		case ATOM_WS_REMAINDER:
 236			val = gctx->divmul[1];
 237			break;
 238		case ATOM_WS_DATAPTR:
 239			val = gctx->data_block;
 240			break;
 241		case ATOM_WS_SHIFT:
 242			val = gctx->shift;
 243			break;
 244		case ATOM_WS_OR_MASK:
 245			val = 1 << gctx->shift;
 246			break;
 247		case ATOM_WS_AND_MASK:
 248			val = ~(1 << gctx->shift);
 249			break;
 250		case ATOM_WS_FB_WINDOW:
 251			val = gctx->fb_base;
 252			break;
 253		case ATOM_WS_ATTRIBUTES:
 254			val = gctx->io_attr;
 255			break;
 256		case ATOM_WS_REGPTR:
 257			val = gctx->reg_block;
 258			break;
 259		default:
 260			val = ctx->ws[idx];
 261		}
 262		break;
 263	case ATOM_ARG_ID:
 264		idx = U16(*ptr);
 265		(*ptr) += 2;
 266		if (print) {
 267			if (gctx->data_block)
 268				DEBUG("ID[0x%04X+%04X]", idx, gctx->data_block);
 269			else
 270				DEBUG("ID[0x%04X]", idx);
 271		}
 272		val = U32(idx + gctx->data_block);
 273		break;
 274	case ATOM_ARG_FB:
 275		idx = U8(*ptr);
 276		(*ptr)++;
 277		if ((gctx->fb_base + (idx * 4)) > gctx->scratch_size_bytes) {
 278			DRM_ERROR("ATOM: fb read beyond scratch region: %d vs. %d\n",
 279				  gctx->fb_base + (idx * 4), gctx->scratch_size_bytes);
 280			val = 0;
 281		} else
 282			val = gctx->scratch[(gctx->fb_base / 4) + idx];
 283		if (print)
 284			DEBUG("FB[0x%02X]", idx);
 285		break;
 286	case ATOM_ARG_IMM:
 287		switch (align) {
 288		case ATOM_SRC_DWORD:
 289			val = U32(*ptr);
 290			(*ptr) += 4;
 291			if (print)
 292				DEBUG("IMM 0x%08X\n", val);
 293			return val;
 294		case ATOM_SRC_WORD0:
 295		case ATOM_SRC_WORD8:
 296		case ATOM_SRC_WORD16:
 297			val = U16(*ptr);
 298			(*ptr) += 2;
 299			if (print)
 300				DEBUG("IMM 0x%04X\n", val);
 301			return val;
 302		case ATOM_SRC_BYTE0:
 303		case ATOM_SRC_BYTE8:
 304		case ATOM_SRC_BYTE16:
 305		case ATOM_SRC_BYTE24:
 306			val = U8(*ptr);
 307			(*ptr)++;
 308			if (print)
 309				DEBUG("IMM 0x%02X\n", val);
 310			return val;
 311		}
 312		return 0;
 313	case ATOM_ARG_PLL:
 314		idx = U8(*ptr);
 315		(*ptr)++;
 316		if (print)
 317			DEBUG("PLL[0x%02X]", idx);
 318		val = gctx->card->pll_read(gctx->card, idx);
 319		break;
 320	case ATOM_ARG_MC:
 321		idx = U8(*ptr);
 322		(*ptr)++;
 323		if (print)
 324			DEBUG("MC[0x%02X]", idx);
 325		val = gctx->card->mc_read(gctx->card, idx);
 326		break;
 327	}
 328	if (saved)
 329		*saved = val;
 330	val &= atom_arg_mask[align];
 331	val >>= atom_arg_shift[align];
 332	if (print)
 333		switch (align) {
 334		case ATOM_SRC_DWORD:
 335			DEBUG(".[31:0] -> 0x%08X\n", val);
 336			break;
 337		case ATOM_SRC_WORD0:
 338			DEBUG(".[15:0] -> 0x%04X\n", val);
 339			break;
 340		case ATOM_SRC_WORD8:
 341			DEBUG(".[23:8] -> 0x%04X\n", val);
 342			break;
 343		case ATOM_SRC_WORD16:
 344			DEBUG(".[31:16] -> 0x%04X\n", val);
 345			break;
 346		case ATOM_SRC_BYTE0:
 347			DEBUG(".[7:0] -> 0x%02X\n", val);
 348			break;
 349		case ATOM_SRC_BYTE8:
 350			DEBUG(".[15:8] -> 0x%02X\n", val);
 351			break;
 352		case ATOM_SRC_BYTE16:
 353			DEBUG(".[23:16] -> 0x%02X\n", val);
 354			break;
 355		case ATOM_SRC_BYTE24:
 356			DEBUG(".[31:24] -> 0x%02X\n", val);
 357			break;
 358		}
 359	return val;
 360}
 361
 362static void atom_skip_src_int(atom_exec_context *ctx, uint8_t attr, int *ptr)
 363{
 364	uint32_t align = (attr >> 3) & 7, arg = attr & 7;
 365	switch (arg) {
 366	case ATOM_ARG_REG:
 367	case ATOM_ARG_ID:
 368		(*ptr) += 2;
 369		break;
 370	case ATOM_ARG_PLL:
 371	case ATOM_ARG_MC:
 372	case ATOM_ARG_PS:
 373	case ATOM_ARG_WS:
 374	case ATOM_ARG_FB:
 375		(*ptr)++;
 376		break;
 377	case ATOM_ARG_IMM:
 378		switch (align) {
 379		case ATOM_SRC_DWORD:
 380			(*ptr) += 4;
 381			return;
 382		case ATOM_SRC_WORD0:
 383		case ATOM_SRC_WORD8:
 384		case ATOM_SRC_WORD16:
 385			(*ptr) += 2;
 386			return;
 387		case ATOM_SRC_BYTE0:
 388		case ATOM_SRC_BYTE8:
 389		case ATOM_SRC_BYTE16:
 390		case ATOM_SRC_BYTE24:
 391			(*ptr)++;
 392			return;
 393		}
 394		return;
 395	}
 396}
 397
 398static uint32_t atom_get_src(atom_exec_context *ctx, uint8_t attr, int *ptr)
 399{
 400	return atom_get_src_int(ctx, attr, ptr, NULL, 1);
 401}
 402
 403static uint32_t atom_get_src_direct(atom_exec_context *ctx, uint8_t align, int *ptr)
 404{
 405	uint32_t val = 0xCDCDCDCD;
 406
 407	switch (align) {
 408	case ATOM_SRC_DWORD:
 409		val = U32(*ptr);
 410		(*ptr) += 4;
 411		break;
 412	case ATOM_SRC_WORD0:
 413	case ATOM_SRC_WORD8:
 414	case ATOM_SRC_WORD16:
 415		val = U16(*ptr);
 416		(*ptr) += 2;
 417		break;
 418	case ATOM_SRC_BYTE0:
 419	case ATOM_SRC_BYTE8:
 420	case ATOM_SRC_BYTE16:
 421	case ATOM_SRC_BYTE24:
 422		val = U8(*ptr);
 423		(*ptr)++;
 424		break;
 425	}
 426	return val;
 427}
 428
 429static uint32_t atom_get_dst(atom_exec_context *ctx, int arg, uint8_t attr,
 430			     int *ptr, uint32_t *saved, int print)
 431{
 432	return atom_get_src_int(ctx,
 433				arg | atom_dst_to_src[(attr >> 3) &
 434						      7][(attr >> 6) & 3] << 3,
 435				ptr, saved, print);
 436}
 437
 438static void atom_skip_dst(atom_exec_context *ctx, int arg, uint8_t attr, int *ptr)
 439{
 440	atom_skip_src_int(ctx,
 441			  arg | atom_dst_to_src[(attr >> 3) & 7][(attr >> 6) &
 442								 3] << 3, ptr);
 443}
 444
 445static void atom_put_dst(atom_exec_context *ctx, int arg, uint8_t attr,
 446			 int *ptr, uint32_t val, uint32_t saved)
 447{
 448	uint32_t align =
 449	    atom_dst_to_src[(attr >> 3) & 7][(attr >> 6) & 3], old_val =
 450	    val, idx;
 451	struct atom_context *gctx = ctx->ctx;
 452	old_val &= atom_arg_mask[align] >> atom_arg_shift[align];
 453	val <<= atom_arg_shift[align];
 454	val &= atom_arg_mask[align];
 455	saved &= ~atom_arg_mask[align];
 456	val |= saved;
 457	switch (arg) {
 458	case ATOM_ARG_REG:
 459		idx = U16(*ptr);
 460		(*ptr) += 2;
 461		DEBUG("REG[0x%04X]", idx);
 462		idx += gctx->reg_block;
 463		switch (gctx->io_mode) {
 464		case ATOM_IO_MM:
 465			if (idx == 0)
 466				gctx->card->reg_write(gctx->card, idx,
 467						      val << 2);
 468			else
 469				gctx->card->reg_write(gctx->card, idx, val);
 470			break;
 471		case ATOM_IO_PCI:
 472			printk(KERN_INFO
 473			       "PCI registers are not implemented.\n");
 474			return;
 475		case ATOM_IO_SYSIO:
 476			printk(KERN_INFO
 477			       "SYSIO registers are not implemented.\n");
 478			return;
 479		default:
 480			if (!(gctx->io_mode & 0x80)) {
 481				printk(KERN_INFO "Bad IO mode.\n");
 482				return;
 483			}
 484			if (!gctx->iio[gctx->io_mode & 0xFF]) {
 485				printk(KERN_INFO
 486				       "Undefined indirect IO write method %d.\n",
 487				       gctx->io_mode & 0x7F);
 488				return;
 489			}
 490			atom_iio_execute(gctx, gctx->iio[gctx->io_mode & 0xFF],
 491					 idx, val);
 492		}
 493		break;
 494	case ATOM_ARG_PS:
 495		idx = U8(*ptr);
 496		(*ptr)++;
 497		DEBUG("PS[0x%02X]", idx);
 498		ctx->ps[idx] = cpu_to_le32(val);
 499		break;
 500	case ATOM_ARG_WS:
 501		idx = U8(*ptr);
 502		(*ptr)++;
 503		DEBUG("WS[0x%02X]", idx);
 504		switch (idx) {
 505		case ATOM_WS_QUOTIENT:
 506			gctx->divmul[0] = val;
 507			break;
 508		case ATOM_WS_REMAINDER:
 509			gctx->divmul[1] = val;
 510			break;
 511		case ATOM_WS_DATAPTR:
 512			gctx->data_block = val;
 513			break;
 514		case ATOM_WS_SHIFT:
 515			gctx->shift = val;
 516			break;
 517		case ATOM_WS_OR_MASK:
 518		case ATOM_WS_AND_MASK:
 519			break;
 520		case ATOM_WS_FB_WINDOW:
 521			gctx->fb_base = val;
 522			break;
 523		case ATOM_WS_ATTRIBUTES:
 524			gctx->io_attr = val;
 525			break;
 526		case ATOM_WS_REGPTR:
 527			gctx->reg_block = val;
 528			break;
 529		default:
 530			ctx->ws[idx] = val;
 531		}
 532		break;
 533	case ATOM_ARG_FB:
 534		idx = U8(*ptr);
 535		(*ptr)++;
 536		if ((gctx->fb_base + (idx * 4)) > gctx->scratch_size_bytes) {
 537			DRM_ERROR("ATOM: fb write beyond scratch region: %d vs. %d\n",
 538				  gctx->fb_base + (idx * 4), gctx->scratch_size_bytes);
 539		} else
 540			gctx->scratch[(gctx->fb_base / 4) + idx] = val;
 541		DEBUG("FB[0x%02X]", idx);
 542		break;
 543	case ATOM_ARG_PLL:
 544		idx = U8(*ptr);
 545		(*ptr)++;
 546		DEBUG("PLL[0x%02X]", idx);
 547		gctx->card->pll_write(gctx->card, idx, val);
 548		break;
 549	case ATOM_ARG_MC:
 550		idx = U8(*ptr);
 551		(*ptr)++;
 552		DEBUG("MC[0x%02X]", idx);
 553		gctx->card->mc_write(gctx->card, idx, val);
 554		return;
 555	}
 556	switch (align) {
 557	case ATOM_SRC_DWORD:
 558		DEBUG(".[31:0] <- 0x%08X\n", old_val);
 559		break;
 560	case ATOM_SRC_WORD0:
 561		DEBUG(".[15:0] <- 0x%04X\n", old_val);
 562		break;
 563	case ATOM_SRC_WORD8:
 564		DEBUG(".[23:8] <- 0x%04X\n", old_val);
 565		break;
 566	case ATOM_SRC_WORD16:
 567		DEBUG(".[31:16] <- 0x%04X\n", old_val);
 568		break;
 569	case ATOM_SRC_BYTE0:
 570		DEBUG(".[7:0] <- 0x%02X\n", old_val);
 571		break;
 572	case ATOM_SRC_BYTE8:
 573		DEBUG(".[15:8] <- 0x%02X\n", old_val);
 574		break;
 575	case ATOM_SRC_BYTE16:
 576		DEBUG(".[23:16] <- 0x%02X\n", old_val);
 577		break;
 578	case ATOM_SRC_BYTE24:
 579		DEBUG(".[31:24] <- 0x%02X\n", old_val);
 580		break;
 581	}
 582}
 583
 584static void atom_op_add(atom_exec_context *ctx, int *ptr, int arg)
 585{
 586	uint8_t attr = U8((*ptr)++);
 587	uint32_t dst, src, saved;
 588	int dptr = *ptr;
 589	SDEBUG("   dst: ");
 590	dst = atom_get_dst(ctx, arg, attr, ptr, &saved, 1);
 591	SDEBUG("   src: ");
 592	src = atom_get_src(ctx, attr, ptr);
 593	dst += src;
 594	SDEBUG("   dst: ");
 595	atom_put_dst(ctx, arg, attr, &dptr, dst, saved);
 596}
 597
 598static void atom_op_and(atom_exec_context *ctx, int *ptr, int arg)
 599{
 600	uint8_t attr = U8((*ptr)++);
 601	uint32_t dst, src, saved;
 602	int dptr = *ptr;
 603	SDEBUG("   dst: ");
 604	dst = atom_get_dst(ctx, arg, attr, ptr, &saved, 1);
 605	SDEBUG("   src: ");
 606	src = atom_get_src(ctx, attr, ptr);
 607	dst &= src;
 608	SDEBUG("   dst: ");
 609	atom_put_dst(ctx, arg, attr, &dptr, dst, saved);
 610}
 611
 612static void atom_op_beep(atom_exec_context *ctx, int *ptr, int arg)
 613{
 614	printk("ATOM BIOS beeped!\n");
 615}
 616
 617static void atom_op_calltable(atom_exec_context *ctx, int *ptr, int arg)
 618{
 619	int idx = U8((*ptr)++);
 620	int r = 0;
 621
 622	if (idx < ATOM_TABLE_NAMES_CNT)
 623		SDEBUG("   table: %d (%s)\n", idx, atom_table_names[idx]);
 624	else
 625		SDEBUG("   table: %d\n", idx);
 626	if (U16(ctx->ctx->cmd_table + 4 + 2 * idx))
 627		r = amdgpu_atom_execute_table_locked(ctx->ctx, idx, ctx->ps + ctx->ps_shift);
 628	if (r) {
 629		ctx->abort = true;
 630	}
 631}
 632
 633static void atom_op_clear(atom_exec_context *ctx, int *ptr, int arg)
 634{
 635	uint8_t attr = U8((*ptr)++);
 636	uint32_t saved;
 637	int dptr = *ptr;
 638	attr &= 0x38;
 639	attr |= atom_def_dst[attr >> 3] << 6;
 640	atom_get_dst(ctx, arg, attr, ptr, &saved, 0);
 641	SDEBUG("   dst: ");
 642	atom_put_dst(ctx, arg, attr, &dptr, 0, saved);
 643}
 644
 645static void atom_op_compare(atom_exec_context *ctx, int *ptr, int arg)
 646{
 647	uint8_t attr = U8((*ptr)++);
 648	uint32_t dst, src;
 649	SDEBUG("   src1: ");
 650	dst = atom_get_dst(ctx, arg, attr, ptr, NULL, 1);
 651	SDEBUG("   src2: ");
 652	src = atom_get_src(ctx, attr, ptr);
 653	ctx->ctx->cs_equal = (dst == src);
 654	ctx->ctx->cs_above = (dst > src);
 655	SDEBUG("   result: %s %s\n", ctx->ctx->cs_equal ? "EQ" : "NE",
 656	       ctx->ctx->cs_above ? "GT" : "LE");
 657}
 658
 659static void atom_op_delay(atom_exec_context *ctx, int *ptr, int arg)
 660{
 661	unsigned count = U8((*ptr)++);
 662	SDEBUG("   count: %d\n", count);
 663	if (arg == ATOM_UNIT_MICROSEC)
 664		udelay(count);
 665	else if (!drm_can_sleep())
 666		mdelay(count);
 667	else
 668		msleep(count);
 669}
 670
 671static void atom_op_div(atom_exec_context *ctx, int *ptr, int arg)
 672{
 673	uint8_t attr = U8((*ptr)++);
 674	uint32_t dst, src;
 675	SDEBUG("   src1: ");
 676	dst = atom_get_dst(ctx, arg, attr, ptr, NULL, 1);
 677	SDEBUG("   src2: ");
 678	src = atom_get_src(ctx, attr, ptr);
 679	if (src != 0) {
 680		ctx->ctx->divmul[0] = dst / src;
 681		ctx->ctx->divmul[1] = dst % src;
 682	} else {
 683		ctx->ctx->divmul[0] = 0;
 684		ctx->ctx->divmul[1] = 0;
 685	}
 686}
 687
 688static void atom_op_div32(atom_exec_context *ctx, int *ptr, int arg)
 689{
 690	uint64_t val64;
 691	uint8_t attr = U8((*ptr)++);
 692	uint32_t dst, src;
 693	SDEBUG("   src1: ");
 694	dst = atom_get_dst(ctx, arg, attr, ptr, NULL, 1);
 695	SDEBUG("   src2: ");
 696	src = atom_get_src(ctx, attr, ptr);
 697	if (src != 0) {
 698		val64 = dst;
 699		val64 |= ((uint64_t)ctx->ctx->divmul[1]) << 32;
 700		do_div(val64, src);
 701		ctx->ctx->divmul[0] = lower_32_bits(val64);
 702		ctx->ctx->divmul[1] = upper_32_bits(val64);
 703	} else {
 704		ctx->ctx->divmul[0] = 0;
 705		ctx->ctx->divmul[1] = 0;
 706	}
 707}
 708
 709static void atom_op_eot(atom_exec_context *ctx, int *ptr, int arg)
 710{
 711	/* functionally, a nop */
 712}
 713
 714static void atom_op_jump(atom_exec_context *ctx, int *ptr, int arg)
 715{
 716	int execute = 0, target = U16(*ptr);
 717	unsigned long cjiffies;
 718
 719	(*ptr) += 2;
 720	switch (arg) {
 721	case ATOM_COND_ABOVE:
 722		execute = ctx->ctx->cs_above;
 723		break;
 724	case ATOM_COND_ABOVEOREQUAL:
 725		execute = ctx->ctx->cs_above || ctx->ctx->cs_equal;
 726		break;
 727	case ATOM_COND_ALWAYS:
 728		execute = 1;
 729		break;
 730	case ATOM_COND_BELOW:
 731		execute = !(ctx->ctx->cs_above || ctx->ctx->cs_equal);
 732		break;
 733	case ATOM_COND_BELOWOREQUAL:
 734		execute = !ctx->ctx->cs_above;
 735		break;
 736	case ATOM_COND_EQUAL:
 737		execute = ctx->ctx->cs_equal;
 738		break;
 739	case ATOM_COND_NOTEQUAL:
 740		execute = !ctx->ctx->cs_equal;
 741		break;
 742	}
 743	if (arg != ATOM_COND_ALWAYS)
 744		SDEBUG("   taken: %s\n", execute ? "yes" : "no");
 745	SDEBUG("   target: 0x%04X\n", target);
 746	if (execute) {
 747		if (ctx->last_jump == (ctx->start + target)) {
 748			cjiffies = jiffies;
 749			if (time_after(cjiffies, ctx->last_jump_jiffies)) {
 750				cjiffies -= ctx->last_jump_jiffies;
 751				if ((jiffies_to_msecs(cjiffies) > 5000)) {
 752					DRM_ERROR("atombios stuck in loop for more than 5secs aborting\n");
 
 753					ctx->abort = true;
 754				}
 755			} else {
 756				/* jiffies wrap around we will just wait a little longer */
 757				ctx->last_jump_jiffies = jiffies;
 758			}
 759		} else {
 760			ctx->last_jump = ctx->start + target;
 761			ctx->last_jump_jiffies = jiffies;
 762		}
 763		*ptr = ctx->start + target;
 764	}
 765}
 766
 767static void atom_op_mask(atom_exec_context *ctx, int *ptr, int arg)
 768{
 769	uint8_t attr = U8((*ptr)++);
 770	uint32_t dst, mask, src, saved;
 771	int dptr = *ptr;
 772	SDEBUG("   dst: ");
 773	dst = atom_get_dst(ctx, arg, attr, ptr, &saved, 1);
 774	mask = atom_get_src_direct(ctx, ((attr >> 3) & 7), ptr);
 775	SDEBUG("   mask: 0x%08x", mask);
 776	SDEBUG("   src: ");
 777	src = atom_get_src(ctx, attr, ptr);
 778	dst &= mask;
 779	dst |= src;
 780	SDEBUG("   dst: ");
 781	atom_put_dst(ctx, arg, attr, &dptr, dst, saved);
 782}
 783
 784static void atom_op_move(atom_exec_context *ctx, int *ptr, int arg)
 785{
 786	uint8_t attr = U8((*ptr)++);
 787	uint32_t src, saved;
 788	int dptr = *ptr;
 789	if (((attr >> 3) & 7) != ATOM_SRC_DWORD)
 790		atom_get_dst(ctx, arg, attr, ptr, &saved, 0);
 791	else {
 792		atom_skip_dst(ctx, arg, attr, ptr);
 793		saved = 0xCDCDCDCD;
 794	}
 795	SDEBUG("   src: ");
 796	src = atom_get_src(ctx, attr, ptr);
 797	SDEBUG("   dst: ");
 798	atom_put_dst(ctx, arg, attr, &dptr, src, saved);
 799}
 800
 801static void atom_op_mul(atom_exec_context *ctx, int *ptr, int arg)
 802{
 803	uint8_t attr = U8((*ptr)++);
 804	uint32_t dst, src;
 805	SDEBUG("   src1: ");
 806	dst = atom_get_dst(ctx, arg, attr, ptr, NULL, 1);
 807	SDEBUG("   src2: ");
 808	src = atom_get_src(ctx, attr, ptr);
 809	ctx->ctx->divmul[0] = dst * src;
 810}
 811
 812static void atom_op_mul32(atom_exec_context *ctx, int *ptr, int arg)
 813{
 814	uint64_t val64;
 815	uint8_t attr = U8((*ptr)++);
 816	uint32_t dst, src;
 817	SDEBUG("   src1: ");
 818	dst = atom_get_dst(ctx, arg, attr, ptr, NULL, 1);
 819	SDEBUG("   src2: ");
 820	src = atom_get_src(ctx, attr, ptr);
 821	val64 = (uint64_t)dst * (uint64_t)src;
 822	ctx->ctx->divmul[0] = lower_32_bits(val64);
 823	ctx->ctx->divmul[1] = upper_32_bits(val64);
 824}
 825
 826static void atom_op_nop(atom_exec_context *ctx, int *ptr, int arg)
 827{
 828	/* nothing */
 829}
 830
 831static void atom_op_or(atom_exec_context *ctx, int *ptr, int arg)
 832{
 833	uint8_t attr = U8((*ptr)++);
 834	uint32_t dst, src, saved;
 835	int dptr = *ptr;
 836	SDEBUG("   dst: ");
 837	dst = atom_get_dst(ctx, arg, attr, ptr, &saved, 1);
 838	SDEBUG("   src: ");
 839	src = atom_get_src(ctx, attr, ptr);
 840	dst |= src;
 841	SDEBUG("   dst: ");
 842	atom_put_dst(ctx, arg, attr, &dptr, dst, saved);
 843}
 844
 845static void atom_op_postcard(atom_exec_context *ctx, int *ptr, int arg)
 846{
 847	uint8_t val = U8((*ptr)++);
 848	SDEBUG("POST card output: 0x%02X\n", val);
 849}
 850
 851static void atom_op_repeat(atom_exec_context *ctx, int *ptr, int arg)
 852{
 853	printk(KERN_INFO "unimplemented!\n");
 854}
 855
 856static void atom_op_restorereg(atom_exec_context *ctx, int *ptr, int arg)
 857{
 858	printk(KERN_INFO "unimplemented!\n");
 859}
 860
 861static void atom_op_savereg(atom_exec_context *ctx, int *ptr, int arg)
 862{
 863	printk(KERN_INFO "unimplemented!\n");
 864}
 865
 866static void atom_op_setdatablock(atom_exec_context *ctx, int *ptr, int arg)
 867{
 868	int idx = U8(*ptr);
 869	(*ptr)++;
 870	SDEBUG("   block: %d\n", idx);
 871	if (!idx)
 872		ctx->ctx->data_block = 0;
 873	else if (idx == 255)
 874		ctx->ctx->data_block = ctx->start;
 875	else
 876		ctx->ctx->data_block = U16(ctx->ctx->data_table + 4 + 2 * idx);
 877	SDEBUG("   base: 0x%04X\n", ctx->ctx->data_block);
 878}
 879
 880static void atom_op_setfbbase(atom_exec_context *ctx, int *ptr, int arg)
 881{
 882	uint8_t attr = U8((*ptr)++);
 883	SDEBUG("   fb_base: ");
 884	ctx->ctx->fb_base = atom_get_src(ctx, attr, ptr);
 885}
 886
 887static void atom_op_setport(atom_exec_context *ctx, int *ptr, int arg)
 888{
 889	int port;
 890	switch (arg) {
 891	case ATOM_PORT_ATI:
 892		port = U16(*ptr);
 893		if (port < ATOM_IO_NAMES_CNT)
 894			SDEBUG("   port: %d (%s)\n", port, atom_io_names[port]);
 895		else
 896			SDEBUG("   port: %d\n", port);
 897		if (!port)
 898			ctx->ctx->io_mode = ATOM_IO_MM;
 899		else
 900			ctx->ctx->io_mode = ATOM_IO_IIO | port;
 901		(*ptr) += 2;
 902		break;
 903	case ATOM_PORT_PCI:
 904		ctx->ctx->io_mode = ATOM_IO_PCI;
 905		(*ptr)++;
 906		break;
 907	case ATOM_PORT_SYSIO:
 908		ctx->ctx->io_mode = ATOM_IO_SYSIO;
 909		(*ptr)++;
 910		break;
 911	}
 912}
 913
 914static void atom_op_setregblock(atom_exec_context *ctx, int *ptr, int arg)
 915{
 916	ctx->ctx->reg_block = U16(*ptr);
 917	(*ptr) += 2;
 918	SDEBUG("   base: 0x%04X\n", ctx->ctx->reg_block);
 919}
 920
 921static void atom_op_shift_left(atom_exec_context *ctx, int *ptr, int arg)
 922{
 923	uint8_t attr = U8((*ptr)++), shift;
 924	uint32_t saved, dst;
 925	int dptr = *ptr;
 926	attr &= 0x38;
 927	attr |= atom_def_dst[attr >> 3] << 6;
 928	SDEBUG("   dst: ");
 929	dst = atom_get_dst(ctx, arg, attr, ptr, &saved, 1);
 930	shift = atom_get_src_direct(ctx, ATOM_SRC_BYTE0, ptr);
 931	SDEBUG("   shift: %d\n", shift);
 932	dst <<= shift;
 933	SDEBUG("   dst: ");
 934	atom_put_dst(ctx, arg, attr, &dptr, dst, saved);
 935}
 936
 937static void atom_op_shift_right(atom_exec_context *ctx, int *ptr, int arg)
 938{
 939	uint8_t attr = U8((*ptr)++), shift;
 940	uint32_t saved, dst;
 941	int dptr = *ptr;
 942	attr &= 0x38;
 943	attr |= atom_def_dst[attr >> 3] << 6;
 944	SDEBUG("   dst: ");
 945	dst = atom_get_dst(ctx, arg, attr, ptr, &saved, 1);
 946	shift = atom_get_src_direct(ctx, ATOM_SRC_BYTE0, ptr);
 947	SDEBUG("   shift: %d\n", shift);
 948	dst >>= shift;
 949	SDEBUG("   dst: ");
 950	atom_put_dst(ctx, arg, attr, &dptr, dst, saved);
 951}
 952
 953static void atom_op_shl(atom_exec_context *ctx, int *ptr, int arg)
 954{
 955	uint8_t attr = U8((*ptr)++), shift;
 956	uint32_t saved, dst;
 957	int dptr = *ptr;
 958	uint32_t dst_align = atom_dst_to_src[(attr >> 3) & 7][(attr >> 6) & 3];
 959	SDEBUG("   dst: ");
 960	dst = atom_get_dst(ctx, arg, attr, ptr, &saved, 1);
 961	/* op needs to full dst value */
 962	dst = saved;
 963	shift = atom_get_src(ctx, attr, ptr);
 964	SDEBUG("   shift: %d\n", shift);
 965	dst <<= shift;
 966	dst &= atom_arg_mask[dst_align];
 967	dst >>= atom_arg_shift[dst_align];
 968	SDEBUG("   dst: ");
 969	atom_put_dst(ctx, arg, attr, &dptr, dst, saved);
 970}
 971
 972static void atom_op_shr(atom_exec_context *ctx, int *ptr, int arg)
 973{
 974	uint8_t attr = U8((*ptr)++), shift;
 975	uint32_t saved, dst;
 976	int dptr = *ptr;
 977	uint32_t dst_align = atom_dst_to_src[(attr >> 3) & 7][(attr >> 6) & 3];
 978	SDEBUG("   dst: ");
 979	dst = atom_get_dst(ctx, arg, attr, ptr, &saved, 1);
 980	/* op needs to full dst value */
 981	dst = saved;
 982	shift = atom_get_src(ctx, attr, ptr);
 983	SDEBUG("   shift: %d\n", shift);
 984	dst >>= shift;
 985	dst &= atom_arg_mask[dst_align];
 986	dst >>= atom_arg_shift[dst_align];
 987	SDEBUG("   dst: ");
 988	atom_put_dst(ctx, arg, attr, &dptr, dst, saved);
 989}
 990
 991static void atom_op_sub(atom_exec_context *ctx, int *ptr, int arg)
 992{
 993	uint8_t attr = U8((*ptr)++);
 994	uint32_t dst, src, saved;
 995	int dptr = *ptr;
 996	SDEBUG("   dst: ");
 997	dst = atom_get_dst(ctx, arg, attr, ptr, &saved, 1);
 998	SDEBUG("   src: ");
 999	src = atom_get_src(ctx, attr, ptr);
1000	dst -= src;
1001	SDEBUG("   dst: ");
1002	atom_put_dst(ctx, arg, attr, &dptr, dst, saved);
1003}
1004
1005static void atom_op_switch(atom_exec_context *ctx, int *ptr, int arg)
1006{
1007	uint8_t attr = U8((*ptr)++);
1008	uint32_t src, val, target;
1009	SDEBUG("   switch: ");
1010	src = atom_get_src(ctx, attr, ptr);
1011	while (U16(*ptr) != ATOM_CASE_END)
1012		if (U8(*ptr) == ATOM_CASE_MAGIC) {
1013			(*ptr)++;
1014			SDEBUG("   case: ");
1015			val =
1016			    atom_get_src(ctx, (attr & 0x38) | ATOM_ARG_IMM,
1017					 ptr);
1018			target = U16(*ptr);
1019			if (val == src) {
1020				SDEBUG("   target: %04X\n", target);
1021				*ptr = ctx->start + target;
1022				return;
1023			}
1024			(*ptr) += 2;
1025		} else {
1026			printk(KERN_INFO "Bad case.\n");
1027			return;
1028		}
1029	(*ptr) += 2;
1030}
1031
1032static void atom_op_test(atom_exec_context *ctx, int *ptr, int arg)
1033{
1034	uint8_t attr = U8((*ptr)++);
1035	uint32_t dst, src;
1036	SDEBUG("   src1: ");
1037	dst = atom_get_dst(ctx, arg, attr, ptr, NULL, 1);
1038	SDEBUG("   src2: ");
1039	src = atom_get_src(ctx, attr, ptr);
1040	ctx->ctx->cs_equal = ((dst & src) == 0);
1041	SDEBUG("   result: %s\n", ctx->ctx->cs_equal ? "EQ" : "NE");
1042}
1043
1044static void atom_op_xor(atom_exec_context *ctx, int *ptr, int arg)
1045{
1046	uint8_t attr = U8((*ptr)++);
1047	uint32_t dst, src, saved;
1048	int dptr = *ptr;
1049	SDEBUG("   dst: ");
1050	dst = atom_get_dst(ctx, arg, attr, ptr, &saved, 1);
1051	SDEBUG("   src: ");
1052	src = atom_get_src(ctx, attr, ptr);
1053	dst ^= src;
1054	SDEBUG("   dst: ");
1055	atom_put_dst(ctx, arg, attr, &dptr, dst, saved);
1056}
1057
1058static void atom_op_debug(atom_exec_context *ctx, int *ptr, int arg)
1059{
1060	uint8_t val = U8((*ptr)++);
1061	SDEBUG("DEBUG output: 0x%02X\n", val);
1062}
1063
1064static void atom_op_processds(atom_exec_context *ctx, int *ptr, int arg)
1065{
1066	uint16_t val = U16(*ptr);
1067	(*ptr) += val + 2;
1068	SDEBUG("PROCESSDS output: 0x%02X\n", val);
1069}
1070
1071static struct {
1072	void (*func) (atom_exec_context *, int *, int);
1073	int arg;
1074} opcode_table[ATOM_OP_CNT] = {
1075	{
1076	NULL, 0}, {
1077	atom_op_move, ATOM_ARG_REG}, {
1078	atom_op_move, ATOM_ARG_PS}, {
1079	atom_op_move, ATOM_ARG_WS}, {
1080	atom_op_move, ATOM_ARG_FB}, {
1081	atom_op_move, ATOM_ARG_PLL}, {
1082	atom_op_move, ATOM_ARG_MC}, {
1083	atom_op_and, ATOM_ARG_REG}, {
1084	atom_op_and, ATOM_ARG_PS}, {
1085	atom_op_and, ATOM_ARG_WS}, {
1086	atom_op_and, ATOM_ARG_FB}, {
1087	atom_op_and, ATOM_ARG_PLL}, {
1088	atom_op_and, ATOM_ARG_MC}, {
1089	atom_op_or, ATOM_ARG_REG}, {
1090	atom_op_or, ATOM_ARG_PS}, {
1091	atom_op_or, ATOM_ARG_WS}, {
1092	atom_op_or, ATOM_ARG_FB}, {
1093	atom_op_or, ATOM_ARG_PLL}, {
1094	atom_op_or, ATOM_ARG_MC}, {
1095	atom_op_shift_left, ATOM_ARG_REG}, {
1096	atom_op_shift_left, ATOM_ARG_PS}, {
1097	atom_op_shift_left, ATOM_ARG_WS}, {
1098	atom_op_shift_left, ATOM_ARG_FB}, {
1099	atom_op_shift_left, ATOM_ARG_PLL}, {
1100	atom_op_shift_left, ATOM_ARG_MC}, {
1101	atom_op_shift_right, ATOM_ARG_REG}, {
1102	atom_op_shift_right, ATOM_ARG_PS}, {
1103	atom_op_shift_right, ATOM_ARG_WS}, {
1104	atom_op_shift_right, ATOM_ARG_FB}, {
1105	atom_op_shift_right, ATOM_ARG_PLL}, {
1106	atom_op_shift_right, ATOM_ARG_MC}, {
1107	atom_op_mul, ATOM_ARG_REG}, {
1108	atom_op_mul, ATOM_ARG_PS}, {
1109	atom_op_mul, ATOM_ARG_WS}, {
1110	atom_op_mul, ATOM_ARG_FB}, {
1111	atom_op_mul, ATOM_ARG_PLL}, {
1112	atom_op_mul, ATOM_ARG_MC}, {
1113	atom_op_div, ATOM_ARG_REG}, {
1114	atom_op_div, ATOM_ARG_PS}, {
1115	atom_op_div, ATOM_ARG_WS}, {
1116	atom_op_div, ATOM_ARG_FB}, {
1117	atom_op_div, ATOM_ARG_PLL}, {
1118	atom_op_div, ATOM_ARG_MC}, {
1119	atom_op_add, ATOM_ARG_REG}, {
1120	atom_op_add, ATOM_ARG_PS}, {
1121	atom_op_add, ATOM_ARG_WS}, {
1122	atom_op_add, ATOM_ARG_FB}, {
1123	atom_op_add, ATOM_ARG_PLL}, {
1124	atom_op_add, ATOM_ARG_MC}, {
1125	atom_op_sub, ATOM_ARG_REG}, {
1126	atom_op_sub, ATOM_ARG_PS}, {
1127	atom_op_sub, ATOM_ARG_WS}, {
1128	atom_op_sub, ATOM_ARG_FB}, {
1129	atom_op_sub, ATOM_ARG_PLL}, {
1130	atom_op_sub, ATOM_ARG_MC}, {
1131	atom_op_setport, ATOM_PORT_ATI}, {
1132	atom_op_setport, ATOM_PORT_PCI}, {
1133	atom_op_setport, ATOM_PORT_SYSIO}, {
1134	atom_op_setregblock, 0}, {
1135	atom_op_setfbbase, 0}, {
1136	atom_op_compare, ATOM_ARG_REG}, {
1137	atom_op_compare, ATOM_ARG_PS}, {
1138	atom_op_compare, ATOM_ARG_WS}, {
1139	atom_op_compare, ATOM_ARG_FB}, {
1140	atom_op_compare, ATOM_ARG_PLL}, {
1141	atom_op_compare, ATOM_ARG_MC}, {
1142	atom_op_switch, 0}, {
1143	atom_op_jump, ATOM_COND_ALWAYS}, {
1144	atom_op_jump, ATOM_COND_EQUAL}, {
1145	atom_op_jump, ATOM_COND_BELOW}, {
1146	atom_op_jump, ATOM_COND_ABOVE}, {
1147	atom_op_jump, ATOM_COND_BELOWOREQUAL}, {
1148	atom_op_jump, ATOM_COND_ABOVEOREQUAL}, {
1149	atom_op_jump, ATOM_COND_NOTEQUAL}, {
1150	atom_op_test, ATOM_ARG_REG}, {
1151	atom_op_test, ATOM_ARG_PS}, {
1152	atom_op_test, ATOM_ARG_WS}, {
1153	atom_op_test, ATOM_ARG_FB}, {
1154	atom_op_test, ATOM_ARG_PLL}, {
1155	atom_op_test, ATOM_ARG_MC}, {
1156	atom_op_delay, ATOM_UNIT_MILLISEC}, {
1157	atom_op_delay, ATOM_UNIT_MICROSEC}, {
1158	atom_op_calltable, 0}, {
1159	atom_op_repeat, 0}, {
1160	atom_op_clear, ATOM_ARG_REG}, {
1161	atom_op_clear, ATOM_ARG_PS}, {
1162	atom_op_clear, ATOM_ARG_WS}, {
1163	atom_op_clear, ATOM_ARG_FB}, {
1164	atom_op_clear, ATOM_ARG_PLL}, {
1165	atom_op_clear, ATOM_ARG_MC}, {
1166	atom_op_nop, 0}, {
1167	atom_op_eot, 0}, {
1168	atom_op_mask, ATOM_ARG_REG}, {
1169	atom_op_mask, ATOM_ARG_PS}, {
1170	atom_op_mask, ATOM_ARG_WS}, {
1171	atom_op_mask, ATOM_ARG_FB}, {
1172	atom_op_mask, ATOM_ARG_PLL}, {
1173	atom_op_mask, ATOM_ARG_MC}, {
1174	atom_op_postcard, 0}, {
1175	atom_op_beep, 0}, {
1176	atom_op_savereg, 0}, {
1177	atom_op_restorereg, 0}, {
1178	atom_op_setdatablock, 0}, {
1179	atom_op_xor, ATOM_ARG_REG}, {
1180	atom_op_xor, ATOM_ARG_PS}, {
1181	atom_op_xor, ATOM_ARG_WS}, {
1182	atom_op_xor, ATOM_ARG_FB}, {
1183	atom_op_xor, ATOM_ARG_PLL}, {
1184	atom_op_xor, ATOM_ARG_MC}, {
1185	atom_op_shl, ATOM_ARG_REG}, {
1186	atom_op_shl, ATOM_ARG_PS}, {
1187	atom_op_shl, ATOM_ARG_WS}, {
1188	atom_op_shl, ATOM_ARG_FB}, {
1189	atom_op_shl, ATOM_ARG_PLL}, {
1190	atom_op_shl, ATOM_ARG_MC}, {
1191	atom_op_shr, ATOM_ARG_REG}, {
1192	atom_op_shr, ATOM_ARG_PS}, {
1193	atom_op_shr, ATOM_ARG_WS}, {
1194	atom_op_shr, ATOM_ARG_FB}, {
1195	atom_op_shr, ATOM_ARG_PLL}, {
1196	atom_op_shr, ATOM_ARG_MC}, {
1197	atom_op_debug, 0}, {
1198	atom_op_processds, 0}, {
1199	atom_op_mul32, ATOM_ARG_PS}, {
1200	atom_op_mul32, ATOM_ARG_WS}, {
1201	atom_op_div32, ATOM_ARG_PS}, {
1202	atom_op_div32, ATOM_ARG_WS},
1203};
1204
1205static int amdgpu_atom_execute_table_locked(struct atom_context *ctx, int index, uint32_t * params)
1206{
1207	int base = CU16(ctx->cmd_table + 4 + 2 * index);
1208	int len, ws, ps, ptr;
1209	unsigned char op;
1210	atom_exec_context ectx;
1211	int ret = 0;
1212
1213	if (!base)
1214		return -EINVAL;
1215
1216	len = CU16(base + ATOM_CT_SIZE_PTR);
1217	ws = CU8(base + ATOM_CT_WS_PTR);
1218	ps = CU8(base + ATOM_CT_PS_PTR) & ATOM_CT_PS_MASK;
1219	ptr = base + ATOM_CT_CODE_PTR;
1220
1221	SDEBUG(">> execute %04X (len %d, WS %d, PS %d)\n", base, len, ws, ps);
1222
1223	ectx.ctx = ctx;
1224	ectx.ps_shift = ps / 4;
1225	ectx.start = base;
1226	ectx.ps = params;
1227	ectx.abort = false;
1228	ectx.last_jump = 0;
1229	if (ws)
1230		ectx.ws = kzalloc(4 * ws, GFP_KERNEL);
1231	else
1232		ectx.ws = NULL;
1233
1234	debug_depth++;
1235	while (1) {
1236		op = CU8(ptr++);
1237		if (op < ATOM_OP_NAMES_CNT)
1238			SDEBUG("%s @ 0x%04X\n", atom_op_names[op], ptr - 1);
1239		else
1240			SDEBUG("[%d] @ 0x%04X\n", op, ptr - 1);
1241		if (ectx.abort) {
1242			DRM_ERROR("atombios stuck executing %04X (len %d, WS %d, PS %d) @ 0x%04X\n",
1243				base, len, ws, ps, ptr - 1);
1244			ret = -EINVAL;
1245			goto free;
1246		}
1247
1248		if (op < ATOM_OP_CNT && op > 0)
1249			opcode_table[op].func(&ectx, &ptr,
1250					      opcode_table[op].arg);
1251		else
1252			break;
1253
1254		if (op == ATOM_OP_EOT)
1255			break;
1256	}
1257	debug_depth--;
1258	SDEBUG("<<\n");
1259
1260free:
1261	if (ws)
1262		kfree(ectx.ws);
1263	return ret;
1264}
1265
1266int amdgpu_atom_execute_table(struct atom_context *ctx, int index, uint32_t * params)
1267{
1268	int r;
1269
1270	mutex_lock(&ctx->mutex);
1271	/* reset data block */
1272	ctx->data_block = 0;
1273	/* reset reg block */
1274	ctx->reg_block = 0;
1275	/* reset fb window */
1276	ctx->fb_base = 0;
1277	/* reset io mode */
1278	ctx->io_mode = ATOM_IO_MM;
1279	/* reset divmul */
1280	ctx->divmul[0] = 0;
1281	ctx->divmul[1] = 0;
1282	r = amdgpu_atom_execute_table_locked(ctx, index, params);
1283	mutex_unlock(&ctx->mutex);
1284	return r;
1285}
1286
1287static int atom_iio_len[] = { 1, 2, 3, 3, 3, 3, 4, 4, 4, 3 };
1288
1289static void atom_index_iio(struct atom_context *ctx, int base)
1290{
1291	ctx->iio = kzalloc(2 * 256, GFP_KERNEL);
1292	if (!ctx->iio)
1293		return;
1294	while (CU8(base) == ATOM_IIO_START) {
1295		ctx->iio[CU8(base + 1)] = base + 2;
1296		base += 2;
1297		while (CU8(base) != ATOM_IIO_END)
1298			base += atom_iio_len[CU8(base)];
1299		base += 3;
1300	}
1301}
1302
1303struct atom_context *amdgpu_atom_parse(struct card_info *card, void *bios)
1304{
1305	int base;
1306	struct atom_context *ctx =
1307	    kzalloc(sizeof(struct atom_context), GFP_KERNEL);
1308	char *str;
1309	char name[512];
1310	int i;
1311
1312	if (!ctx)
1313		return NULL;
1314
1315	ctx->card = card;
1316	ctx->bios = bios;
1317
1318	if (CU16(0) != ATOM_BIOS_MAGIC) {
1319		printk(KERN_INFO "Invalid BIOS magic.\n");
1320		kfree(ctx);
1321		return NULL;
1322	}
1323	if (strncmp
1324	    (CSTR(ATOM_ATI_MAGIC_PTR), ATOM_ATI_MAGIC,
1325	     strlen(ATOM_ATI_MAGIC))) {
1326		printk(KERN_INFO "Invalid ATI magic.\n");
1327		kfree(ctx);
1328		return NULL;
1329	}
1330
1331	base = CU16(ATOM_ROM_TABLE_PTR);
1332	if (strncmp
1333	    (CSTR(base + ATOM_ROM_MAGIC_PTR), ATOM_ROM_MAGIC,
1334	     strlen(ATOM_ROM_MAGIC))) {
1335		printk(KERN_INFO "Invalid ATOM magic.\n");
1336		kfree(ctx);
1337		return NULL;
1338	}
1339
1340	ctx->cmd_table = CU16(base + ATOM_ROM_CMD_PTR);
1341	ctx->data_table = CU16(base + ATOM_ROM_DATA_PTR);
1342	atom_index_iio(ctx, CU16(ctx->data_table + ATOM_DATA_IIO_PTR) + 4);
1343	if (!ctx->iio) {
1344		amdgpu_atom_destroy(ctx);
1345		return NULL;
1346	}
1347
1348	str = CSTR(CU16(base + ATOM_ROM_MSG_PTR));
1349	while (*str && ((*str == '\n') || (*str == '\r')))
1350		str++;
1351	/* name string isn't always 0 terminated */
1352	for (i = 0; i < 511; i++) {
1353		name[i] = str[i];
1354		if (name[i] < '.' || name[i] > 'z') {
1355			name[i] = 0;
1356			break;
1357		}
1358	}
1359	printk(KERN_INFO "ATOM BIOS: %s\n", name);
1360
1361	return ctx;
1362}
1363
1364int amdgpu_atom_asic_init(struct atom_context *ctx)
1365{
1366	int hwi = CU16(ctx->data_table + ATOM_DATA_FWI_PTR);
1367	uint32_t ps[16];
1368	int ret;
1369
1370	memset(ps, 0, 64);
1371
1372	ps[0] = cpu_to_le32(CU32(hwi + ATOM_FWI_DEFSCLK_PTR));
1373	ps[1] = cpu_to_le32(CU32(hwi + ATOM_FWI_DEFMCLK_PTR));
1374	if (!ps[0] || !ps[1])
1375		return 1;
1376
1377	if (!CU16(ctx->cmd_table + 4 + 2 * ATOM_CMD_INIT))
1378		return 1;
1379	ret = amdgpu_atom_execute_table(ctx, ATOM_CMD_INIT, ps);
1380	if (ret)
1381		return ret;
1382
1383	memset(ps, 0, 64);
1384
1385	return ret;
1386}
1387
1388void amdgpu_atom_destroy(struct atom_context *ctx)
1389{
1390	kfree(ctx->iio);
1391	kfree(ctx);
1392}
1393
1394bool amdgpu_atom_parse_data_header(struct atom_context *ctx, int index,
1395			    uint16_t * size, uint8_t * frev, uint8_t * crev,
1396			    uint16_t * data_start)
1397{
1398	int offset = index * 2 + 4;
1399	int idx = CU16(ctx->data_table + offset);
1400	u16 *mdt = (u16 *)(ctx->bios + ctx->data_table + 4);
1401
1402	if (!mdt[index])
1403		return false;
1404
1405	if (size)
1406		*size = CU16(idx);
1407	if (frev)
1408		*frev = CU8(idx + 2);
1409	if (crev)
1410		*crev = CU8(idx + 3);
1411	*data_start = idx;
1412	return true;
1413}
1414
1415bool amdgpu_atom_parse_cmd_header(struct atom_context *ctx, int index, uint8_t * frev,
1416			   uint8_t * crev)
1417{
1418	int offset = index * 2 + 4;
1419	int idx = CU16(ctx->cmd_table + offset);
1420	u16 *mct = (u16 *)(ctx->bios + ctx->cmd_table + 4);
1421
1422	if (!mct[index])
1423		return false;
1424
1425	if (frev)
1426		*frev = CU8(idx + 2);
1427	if (crev)
1428		*crev = CU8(idx + 3);
1429	return true;
1430}
1431
1432int amdgpu_atom_allocate_fb_scratch(struct atom_context *ctx)
1433{
1434	int index = GetIndexIntoMasterTable(DATA, VRAM_UsageByFirmware);
1435	uint16_t data_offset;
1436	int usage_bytes = 0;
1437	struct _ATOM_VRAM_USAGE_BY_FIRMWARE *firmware_usage;
1438
1439	if (amdgpu_atom_parse_data_header(ctx, index, NULL, NULL, NULL, &data_offset)) {
1440		firmware_usage = (struct _ATOM_VRAM_USAGE_BY_FIRMWARE *)(ctx->bios + data_offset);
1441
1442		DRM_DEBUG("atom firmware requested %08x %dkb\n",
1443			  le32_to_cpu(firmware_usage->asFirmwareVramReserveInfo[0].ulStartAddrUsedByFirmware),
1444			  le16_to_cpu(firmware_usage->asFirmwareVramReserveInfo[0].usFirmwareUseInKb));
1445
1446		usage_bytes = le16_to_cpu(firmware_usage->asFirmwareVramReserveInfo[0].usFirmwareUseInKb) * 1024;
1447	}
1448	ctx->scratch_size_bytes = 0;
1449	if (usage_bytes == 0)
1450		usage_bytes = 20 * 1024;
1451	/* allocate some scratch memory */
1452	ctx->scratch = kzalloc(usage_bytes, GFP_KERNEL);
1453	if (!ctx->scratch)
1454		return -ENOMEM;
1455	ctx->scratch_size_bytes = usage_bytes;
1456	return 0;
1457}
v5.9
   1/*
   2 * Copyright 2008 Advanced Micro Devices, Inc.
   3 *
   4 * Permission is hereby granted, free of charge, to any person obtaining a
   5 * copy of this software and associated documentation files (the "Software"),
   6 * to deal in the Software without restriction, including without limitation
   7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
   8 * and/or sell copies of the Software, and to permit persons to whom the
   9 * Software is furnished to do so, subject to the following conditions:
  10 *
  11 * The above copyright notice and this permission notice shall be included in
  12 * all copies or substantial portions of the Software.
  13 *
  14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
  17 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
  18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
  19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
  20 * OTHER DEALINGS IN THE SOFTWARE.
  21 *
  22 * Author: Stanislaw Skowronek
  23 */
  24
  25#include <linux/module.h>
  26#include <linux/sched.h>
  27#include <linux/slab.h>
  28#include <asm/unaligned.h>
  29
  30#include <drm/drm_util.h>
  31
  32#define ATOM_DEBUG
  33
  34#include "atom.h"
  35#include "atom-names.h"
  36#include "atom-bits.h"
  37#include "amdgpu.h"
  38
  /* Jump conditions: passed as 'arg' to atom_op_jump(), which tests them against cs_above/cs_equal. */
  39#define ATOM_COND_ABOVE		0
  40#define ATOM_COND_ABOVEOREQUAL	1
  41#define ATOM_COND_ALWAYS	2
  42#define ATOM_COND_BELOW		3
  43#define ATOM_COND_BELOWOREQUAL	4
  44#define ATOM_COND_EQUAL		5
  45#define ATOM_COND_NOTEQUAL	6
  46
  /* Port selectors: paired with atom_op_setport() in the opcode table. */
  47#define ATOM_PORT_ATI	0
  48#define ATOM_PORT_PCI	1
  49#define ATOM_PORT_SYSIO	2
  50
  /* Delay units: atom_op_delay() uses udelay() for MICROSEC and a millisecond delay otherwise. */
  51#define ATOM_UNIT_MICROSEC	0
  52#define ATOM_UNIT_MILLISEC	1
  53
  /* NOTE(review): not referenced in the visible part of this file; presumably PLL index/data selectors -- confirm. */
  54#define PLL_INDEX	2
  55#define PLL_DATA	3
  56
  /* Seconds a script may keep jumping to the same target before atom_op_jump() aborts it. */
  57#define ATOM_CMD_TIMEOUT_SEC	20
  58
  /*
   * State of one running command table.  The opcode handlers receive a
   * pointer to this structure as their first argument.
   */
typedef struct {
	struct atom_context *ctx;		/* parser context the table belongs to */
	uint32_t *ps;				/* parameter space ("PS" operands) */
	uint32_t *ws;				/* workspace ("WS" operands) */
	int ps_shift;				/* offset into ps handed to called tables */
	uint16_t start;				/* base offset that jump targets are relative to */
	unsigned last_jump;			/* most recent jump destination */
	unsigned long last_jump_jiffies;	/* jiffies when last_jump was first taken */
	bool abort;				/* set by handlers to stop execution */
} atom_exec_context;
  68
  /* Non-zero enables the DEBUG()/SDEBUG() trace output of the interpreter. */
int amdgpu_atom_debug;

/* Declared early because atom_op_calltable() re-enters the executor. */
static int amdgpu_atom_execute_table_locked(struct atom_context *ctx,
					    int index, uint32_t * params);
int amdgpu_atom_execute_table(struct atom_context *ctx,
			      int index, uint32_t * params);
  72
  /*
   * Bit mask and right-shift for each of the eight operand alignments.
   * A value is first masked with atom_arg_mask[align] and then shifted
   * right by atom_arg_shift[align] (and the reverse when writing).
   */
static uint32_t atom_arg_mask[8] = {
	0xFFFFFFFF,	/* bits 31:0 */
	0xFFFF,		/* bits 15:0 */
	0xFFFF00,	/* bits 23:8 */
	0xFFFF0000,	/* bits 31:16 */
	0xFF,		/* bits 7:0 */
	0xFF00,		/* bits 15:8 */
	0xFF0000,	/* bits 23:16 */
	0xFF000000,	/* bits 31:24 */
};
static int atom_arg_shift[8] = {
	0,
	0,
	8,
	16,
	0,
	8,
	16,
	24,
};
  77
  /*
   * Translate the destination alignment field to the source alignment
   * encoding.  First index: bits 5:3 of the attribute byte; second index:
   * bits 7:6 of the attribute byte.
   */
static int atom_dst_to_src[8][4] = {
	[0] = { 0, 0, 0, 0 },
	[1] = { 1, 2, 3, 0 },
	[2] = { 1, 2, 3, 0 },
	[3] = { 1, 2, 3, 0 },
	[4] = { 4, 5, 6, 7 },
	[5] = { 4, 5, 6, 7 },
	[6] = { 4, 5, 6, 7 },
	[7] = { 4, 5, 6, 7 },
};

/*
 * Destination alignment selector (bits 7:6 of the attribute byte) that
 * atom_op_clear() substitutes, indexed by bits 5:3 of the attribute byte.
 */
static int atom_def_dst[8] = { 0, 0, 1, 2, 0, 1, 2, 3 };
  90
  /* Nesting depth of the table being executed; used to indent SDEBUG output. */
static int debug_depth;
#ifdef ATOM_DEBUG
/* Emit @n three-space indentation units. */
static void debug_print_spaces(int n)
{
	for (; n != 0; n--)
		printk("   ");
}

/* Both macros print only while amdgpu_atom_debug is non-zero. */
#define DEBUG(...)						\
	do if (amdgpu_atom_debug) {				\
		printk(KERN_DEBUG __VA_ARGS__);			\
	} while (0)
#define SDEBUG(...)						\
	do if (amdgpu_atom_debug) {				\
		printk(KERN_DEBUG);				\
		debug_print_spaces(debug_depth);		\
		printk(__VA_ARGS__);				\
	} while (0)
#else
#define DEBUG(...) do { } while (0)
#define SDEBUG(...) do { } while (0)
#endif
 105
 106static uint32_t atom_iio_execute(struct atom_context *ctx, int base,
 107				 uint32_t index, uint32_t data)
 108{
 109	uint32_t temp = 0xCDCDCDCD;
 110
 111	while (1)
 112		switch (CU8(base)) {
 113		case ATOM_IIO_NOP:
 114			base++;
 115			break;
 116		case ATOM_IIO_READ:
 117			temp = ctx->card->ioreg_read(ctx->card, CU16(base + 1));
 118			base += 3;
 119			break;
 120		case ATOM_IIO_WRITE:
 121			ctx->card->ioreg_write(ctx->card, CU16(base + 1), temp);
 122			base += 3;
 123			break;
 124		case ATOM_IIO_CLEAR:
 125			temp &=
 126			    ~((0xFFFFFFFF >> (32 - CU8(base + 1))) <<
 127			      CU8(base + 2));
 128			base += 3;
 129			break;
 130		case ATOM_IIO_SET:
 131			temp |=
 132			    (0xFFFFFFFF >> (32 - CU8(base + 1))) << CU8(base +
 133									2);
 134			base += 3;
 135			break;
 136		case ATOM_IIO_MOVE_INDEX:
 137			temp &=
 138			    ~((0xFFFFFFFF >> (32 - CU8(base + 1))) <<
 139			      CU8(base + 3));
 140			temp |=
 141			    ((index >> CU8(base + 2)) &
 142			     (0xFFFFFFFF >> (32 - CU8(base + 1)))) << CU8(base +
 143									  3);
 144			base += 4;
 145			break;
 146		case ATOM_IIO_MOVE_DATA:
 147			temp &=
 148			    ~((0xFFFFFFFF >> (32 - CU8(base + 1))) <<
 149			      CU8(base + 3));
 150			temp |=
 151			    ((data >> CU8(base + 2)) &
 152			     (0xFFFFFFFF >> (32 - CU8(base + 1)))) << CU8(base +
 153									  3);
 154			base += 4;
 155			break;
 156		case ATOM_IIO_MOVE_ATTR:
 157			temp &=
 158			    ~((0xFFFFFFFF >> (32 - CU8(base + 1))) <<
 159			      CU8(base + 3));
 160			temp |=
 161			    ((ctx->
 162			      io_attr >> CU8(base + 2)) & (0xFFFFFFFF >> (32 -
 163									  CU8
 164									  (base
 165									   +
 166									   1))))
 167			    << CU8(base + 3);
 168			base += 4;
 169			break;
 170		case ATOM_IIO_END:
 171			return temp;
 172		default:
 173			pr_info("Unknown IIO opcode\n");
 174			return 0;
 175		}
 176}
 177
 178static uint32_t atom_get_src_int(atom_exec_context *ctx, uint8_t attr,
 179				 int *ptr, uint32_t *saved, int print)
 180{
 181	uint32_t idx, val = 0xCDCDCDCD, align, arg;
 182	struct atom_context *gctx = ctx->ctx;
 183	arg = attr & 7;
 184	align = (attr >> 3) & 7;
 185	switch (arg) {
 186	case ATOM_ARG_REG:
 187		idx = U16(*ptr);
 188		(*ptr) += 2;
 189		if (print)
 190			DEBUG("REG[0x%04X]", idx);
 191		idx += gctx->reg_block;
 192		switch (gctx->io_mode) {
 193		case ATOM_IO_MM:
 194			val = gctx->card->reg_read(gctx->card, idx);
 195			break;
 196		case ATOM_IO_PCI:
 197			pr_info("PCI registers are not implemented\n");
 
 198			return 0;
 199		case ATOM_IO_SYSIO:
 200			pr_info("SYSIO registers are not implemented\n");
 
 201			return 0;
 202		default:
 203			if (!(gctx->io_mode & 0x80)) {
 204				pr_info("Bad IO mode\n");
 205				return 0;
 206			}
 207			if (!gctx->iio[gctx->io_mode & 0x7F]) {
 208				pr_info("Undefined indirect IO read method %d\n",
 209					gctx->io_mode & 0x7F);
 
 210				return 0;
 211			}
 212			val =
 213			    atom_iio_execute(gctx,
 214					     gctx->iio[gctx->io_mode & 0x7F],
 215					     idx, 0);
 216		}
 217		break;
 218	case ATOM_ARG_PS:
 219		idx = U8(*ptr);
 220		(*ptr)++;
 221		/* get_unaligned_le32 avoids unaligned accesses from atombios
 222		 * tables, noticed on a DEC Alpha. */
 223		val = get_unaligned_le32((u32 *)&ctx->ps[idx]);
 224		if (print)
 225			DEBUG("PS[0x%02X,0x%04X]", idx, val);
 226		break;
 227	case ATOM_ARG_WS:
 228		idx = U8(*ptr);
 229		(*ptr)++;
 230		if (print)
 231			DEBUG("WS[0x%02X]", idx);
 232		switch (idx) {
 233		case ATOM_WS_QUOTIENT:
 234			val = gctx->divmul[0];
 235			break;
 236		case ATOM_WS_REMAINDER:
 237			val = gctx->divmul[1];
 238			break;
 239		case ATOM_WS_DATAPTR:
 240			val = gctx->data_block;
 241			break;
 242		case ATOM_WS_SHIFT:
 243			val = gctx->shift;
 244			break;
 245		case ATOM_WS_OR_MASK:
 246			val = 1 << gctx->shift;
 247			break;
 248		case ATOM_WS_AND_MASK:
 249			val = ~(1 << gctx->shift);
 250			break;
 251		case ATOM_WS_FB_WINDOW:
 252			val = gctx->fb_base;
 253			break;
 254		case ATOM_WS_ATTRIBUTES:
 255			val = gctx->io_attr;
 256			break;
 257		case ATOM_WS_REGPTR:
 258			val = gctx->reg_block;
 259			break;
 260		default:
 261			val = ctx->ws[idx];
 262		}
 263		break;
 264	case ATOM_ARG_ID:
 265		idx = U16(*ptr);
 266		(*ptr) += 2;
 267		if (print) {
 268			if (gctx->data_block)
 269				DEBUG("ID[0x%04X+%04X]", idx, gctx->data_block);
 270			else
 271				DEBUG("ID[0x%04X]", idx);
 272		}
 273		val = U32(idx + gctx->data_block);
 274		break;
 275	case ATOM_ARG_FB:
 276		idx = U8(*ptr);
 277		(*ptr)++;
 278		if ((gctx->fb_base + (idx * 4)) > gctx->scratch_size_bytes) {
 279			DRM_ERROR("ATOM: fb read beyond scratch region: %d vs. %d\n",
 280				  gctx->fb_base + (idx * 4), gctx->scratch_size_bytes);
 281			val = 0;
 282		} else
 283			val = gctx->scratch[(gctx->fb_base / 4) + idx];
 284		if (print)
 285			DEBUG("FB[0x%02X]", idx);
 286		break;
 287	case ATOM_ARG_IMM:
 288		switch (align) {
 289		case ATOM_SRC_DWORD:
 290			val = U32(*ptr);
 291			(*ptr) += 4;
 292			if (print)
 293				DEBUG("IMM 0x%08X\n", val);
 294			return val;
 295		case ATOM_SRC_WORD0:
 296		case ATOM_SRC_WORD8:
 297		case ATOM_SRC_WORD16:
 298			val = U16(*ptr);
 299			(*ptr) += 2;
 300			if (print)
 301				DEBUG("IMM 0x%04X\n", val);
 302			return val;
 303		case ATOM_SRC_BYTE0:
 304		case ATOM_SRC_BYTE8:
 305		case ATOM_SRC_BYTE16:
 306		case ATOM_SRC_BYTE24:
 307			val = U8(*ptr);
 308			(*ptr)++;
 309			if (print)
 310				DEBUG("IMM 0x%02X\n", val);
 311			return val;
 312		}
 313		return 0;
 314	case ATOM_ARG_PLL:
 315		idx = U8(*ptr);
 316		(*ptr)++;
 317		if (print)
 318			DEBUG("PLL[0x%02X]", idx);
 319		val = gctx->card->pll_read(gctx->card, idx);
 320		break;
 321	case ATOM_ARG_MC:
 322		idx = U8(*ptr);
 323		(*ptr)++;
 324		if (print)
 325			DEBUG("MC[0x%02X]", idx);
 326		val = gctx->card->mc_read(gctx->card, idx);
 327		break;
 328	}
 329	if (saved)
 330		*saved = val;
 331	val &= atom_arg_mask[align];
 332	val >>= atom_arg_shift[align];
 333	if (print)
 334		switch (align) {
 335		case ATOM_SRC_DWORD:
 336			DEBUG(".[31:0] -> 0x%08X\n", val);
 337			break;
 338		case ATOM_SRC_WORD0:
 339			DEBUG(".[15:0] -> 0x%04X\n", val);
 340			break;
 341		case ATOM_SRC_WORD8:
 342			DEBUG(".[23:8] -> 0x%04X\n", val);
 343			break;
 344		case ATOM_SRC_WORD16:
 345			DEBUG(".[31:16] -> 0x%04X\n", val);
 346			break;
 347		case ATOM_SRC_BYTE0:
 348			DEBUG(".[7:0] -> 0x%02X\n", val);
 349			break;
 350		case ATOM_SRC_BYTE8:
 351			DEBUG(".[15:8] -> 0x%02X\n", val);
 352			break;
 353		case ATOM_SRC_BYTE16:
 354			DEBUG(".[23:16] -> 0x%02X\n", val);
 355			break;
 356		case ATOM_SRC_BYTE24:
 357			DEBUG(".[31:24] -> 0x%02X\n", val);
 358			break;
 359		}
 360	return val;
 361}
 362
 363static void atom_skip_src_int(atom_exec_context *ctx, uint8_t attr, int *ptr)
 364{
 365	uint32_t align = (attr >> 3) & 7, arg = attr & 7;
 366	switch (arg) {
 367	case ATOM_ARG_REG:
 368	case ATOM_ARG_ID:
 369		(*ptr) += 2;
 370		break;
 371	case ATOM_ARG_PLL:
 372	case ATOM_ARG_MC:
 373	case ATOM_ARG_PS:
 374	case ATOM_ARG_WS:
 375	case ATOM_ARG_FB:
 376		(*ptr)++;
 377		break;
 378	case ATOM_ARG_IMM:
 379		switch (align) {
 380		case ATOM_SRC_DWORD:
 381			(*ptr) += 4;
 382			return;
 383		case ATOM_SRC_WORD0:
 384		case ATOM_SRC_WORD8:
 385		case ATOM_SRC_WORD16:
 386			(*ptr) += 2;
 387			return;
 388		case ATOM_SRC_BYTE0:
 389		case ATOM_SRC_BYTE8:
 390		case ATOM_SRC_BYTE16:
 391		case ATOM_SRC_BYTE24:
 392			(*ptr)++;
 393			return;
 394		}
 395		return;
 396	}
 397}
 398
 399static uint32_t atom_get_src(atom_exec_context *ctx, uint8_t attr, int *ptr)
 400{
 401	return atom_get_src_int(ctx, attr, ptr, NULL, 1);
 402}
 403
 404static uint32_t atom_get_src_direct(atom_exec_context *ctx, uint8_t align, int *ptr)
 405{
 406	uint32_t val = 0xCDCDCDCD;
 407
 408	switch (align) {
 409	case ATOM_SRC_DWORD:
 410		val = U32(*ptr);
 411		(*ptr) += 4;
 412		break;
 413	case ATOM_SRC_WORD0:
 414	case ATOM_SRC_WORD8:
 415	case ATOM_SRC_WORD16:
 416		val = U16(*ptr);
 417		(*ptr) += 2;
 418		break;
 419	case ATOM_SRC_BYTE0:
 420	case ATOM_SRC_BYTE8:
 421	case ATOM_SRC_BYTE16:
 422	case ATOM_SRC_BYTE24:
 423		val = U8(*ptr);
 424		(*ptr)++;
 425		break;
 426	}
 427	return val;
 428}
 429
 430static uint32_t atom_get_dst(atom_exec_context *ctx, int arg, uint8_t attr,
 431			     int *ptr, uint32_t *saved, int print)
 432{
 433	return atom_get_src_int(ctx,
 434				arg | atom_dst_to_src[(attr >> 3) &
 435						      7][(attr >> 6) & 3] << 3,
 436				ptr, saved, print);
 437}
 438
 439static void atom_skip_dst(atom_exec_context *ctx, int arg, uint8_t attr, int *ptr)
 440{
 441	atom_skip_src_int(ctx,
 442			  arg | atom_dst_to_src[(attr >> 3) & 7][(attr >> 6) &
 443								 3] << 3, ptr);
 444}
 445
 446static void atom_put_dst(atom_exec_context *ctx, int arg, uint8_t attr,
 447			 int *ptr, uint32_t val, uint32_t saved)
 448{
 449	uint32_t align =
 450	    atom_dst_to_src[(attr >> 3) & 7][(attr >> 6) & 3], old_val =
 451	    val, idx;
 452	struct atom_context *gctx = ctx->ctx;
 453	old_val &= atom_arg_mask[align] >> atom_arg_shift[align];
 454	val <<= atom_arg_shift[align];
 455	val &= atom_arg_mask[align];
 456	saved &= ~atom_arg_mask[align];
 457	val |= saved;
 458	switch (arg) {
 459	case ATOM_ARG_REG:
 460		idx = U16(*ptr);
 461		(*ptr) += 2;
 462		DEBUG("REG[0x%04X]", idx);
 463		idx += gctx->reg_block;
 464		switch (gctx->io_mode) {
 465		case ATOM_IO_MM:
 466			if (idx == 0)
 467				gctx->card->reg_write(gctx->card, idx,
 468						      val << 2);
 469			else
 470				gctx->card->reg_write(gctx->card, idx, val);
 471			break;
 472		case ATOM_IO_PCI:
 473			pr_info("PCI registers are not implemented\n");
 
 474			return;
 475		case ATOM_IO_SYSIO:
 476			pr_info("SYSIO registers are not implemented\n");
 
 477			return;
 478		default:
 479			if (!(gctx->io_mode & 0x80)) {
 480				pr_info("Bad IO mode\n");
 481				return;
 482			}
 483			if (!gctx->iio[gctx->io_mode & 0xFF]) {
 484				pr_info("Undefined indirect IO write method %d\n",
 485					gctx->io_mode & 0x7F);
 
 486				return;
 487			}
 488			atom_iio_execute(gctx, gctx->iio[gctx->io_mode & 0xFF],
 489					 idx, val);
 490		}
 491		break;
 492	case ATOM_ARG_PS:
 493		idx = U8(*ptr);
 494		(*ptr)++;
 495		DEBUG("PS[0x%02X]", idx);
 496		ctx->ps[idx] = cpu_to_le32(val);
 497		break;
 498	case ATOM_ARG_WS:
 499		idx = U8(*ptr);
 500		(*ptr)++;
 501		DEBUG("WS[0x%02X]", idx);
 502		switch (idx) {
 503		case ATOM_WS_QUOTIENT:
 504			gctx->divmul[0] = val;
 505			break;
 506		case ATOM_WS_REMAINDER:
 507			gctx->divmul[1] = val;
 508			break;
 509		case ATOM_WS_DATAPTR:
 510			gctx->data_block = val;
 511			break;
 512		case ATOM_WS_SHIFT:
 513			gctx->shift = val;
 514			break;
 515		case ATOM_WS_OR_MASK:
 516		case ATOM_WS_AND_MASK:
 517			break;
 518		case ATOM_WS_FB_WINDOW:
 519			gctx->fb_base = val;
 520			break;
 521		case ATOM_WS_ATTRIBUTES:
 522			gctx->io_attr = val;
 523			break;
 524		case ATOM_WS_REGPTR:
 525			gctx->reg_block = val;
 526			break;
 527		default:
 528			ctx->ws[idx] = val;
 529		}
 530		break;
 531	case ATOM_ARG_FB:
 532		idx = U8(*ptr);
 533		(*ptr)++;
 534		if ((gctx->fb_base + (idx * 4)) > gctx->scratch_size_bytes) {
 535			DRM_ERROR("ATOM: fb write beyond scratch region: %d vs. %d\n",
 536				  gctx->fb_base + (idx * 4), gctx->scratch_size_bytes);
 537		} else
 538			gctx->scratch[(gctx->fb_base / 4) + idx] = val;
 539		DEBUG("FB[0x%02X]", idx);
 540		break;
 541	case ATOM_ARG_PLL:
 542		idx = U8(*ptr);
 543		(*ptr)++;
 544		DEBUG("PLL[0x%02X]", idx);
 545		gctx->card->pll_write(gctx->card, idx, val);
 546		break;
 547	case ATOM_ARG_MC:
 548		idx = U8(*ptr);
 549		(*ptr)++;
 550		DEBUG("MC[0x%02X]", idx);
 551		gctx->card->mc_write(gctx->card, idx, val);
 552		return;
 553	}
 554	switch (align) {
 555	case ATOM_SRC_DWORD:
 556		DEBUG(".[31:0] <- 0x%08X\n", old_val);
 557		break;
 558	case ATOM_SRC_WORD0:
 559		DEBUG(".[15:0] <- 0x%04X\n", old_val);
 560		break;
 561	case ATOM_SRC_WORD8:
 562		DEBUG(".[23:8] <- 0x%04X\n", old_val);
 563		break;
 564	case ATOM_SRC_WORD16:
 565		DEBUG(".[31:16] <- 0x%04X\n", old_val);
 566		break;
 567	case ATOM_SRC_BYTE0:
 568		DEBUG(".[7:0] <- 0x%02X\n", old_val);
 569		break;
 570	case ATOM_SRC_BYTE8:
 571		DEBUG(".[15:8] <- 0x%02X\n", old_val);
 572		break;
 573	case ATOM_SRC_BYTE16:
 574		DEBUG(".[23:16] <- 0x%02X\n", old_val);
 575		break;
 576	case ATOM_SRC_BYTE24:
 577		DEBUG(".[31:24] <- 0x%02X\n", old_val);
 578		break;
 579	}
 580}
 581
 582static void atom_op_add(atom_exec_context *ctx, int *ptr, int arg)
 583{
 584	uint8_t attr = U8((*ptr)++);
 585	uint32_t dst, src, saved;
 586	int dptr = *ptr;
 587	SDEBUG("   dst: ");
 588	dst = atom_get_dst(ctx, arg, attr, ptr, &saved, 1);
 589	SDEBUG("   src: ");
 590	src = atom_get_src(ctx, attr, ptr);
 591	dst += src;
 592	SDEBUG("   dst: ");
 593	atom_put_dst(ctx, arg, attr, &dptr, dst, saved);
 594}
 595
 596static void atom_op_and(atom_exec_context *ctx, int *ptr, int arg)
 597{
 598	uint8_t attr = U8((*ptr)++);
 599	uint32_t dst, src, saved;
 600	int dptr = *ptr;
 601	SDEBUG("   dst: ");
 602	dst = atom_get_dst(ctx, arg, attr, ptr, &saved, 1);
 603	SDEBUG("   src: ");
 604	src = atom_get_src(ctx, attr, ptr);
 605	dst &= src;
 606	SDEBUG("   dst: ");
 607	atom_put_dst(ctx, arg, attr, &dptr, dst, saved);
 608}
 609
 610static void atom_op_beep(atom_exec_context *ctx, int *ptr, int arg)
 611{
 612	printk("ATOM BIOS beeped!\n");
 613}
 614
 615static void atom_op_calltable(atom_exec_context *ctx, int *ptr, int arg)
 616{
 617	int idx = U8((*ptr)++);
 618	int r = 0;
 619
 620	if (idx < ATOM_TABLE_NAMES_CNT)
 621		SDEBUG("   table: %d (%s)\n", idx, atom_table_names[idx]);
 622	else
 623		SDEBUG("   table: %d\n", idx);
 624	if (U16(ctx->ctx->cmd_table + 4 + 2 * idx))
 625		r = amdgpu_atom_execute_table_locked(ctx->ctx, idx, ctx->ps + ctx->ps_shift);
 626	if (r) {
 627		ctx->abort = true;
 628	}
 629}
 630
 631static void atom_op_clear(atom_exec_context *ctx, int *ptr, int arg)
 632{
 633	uint8_t attr = U8((*ptr)++);
 634	uint32_t saved;
 635	int dptr = *ptr;
 636	attr &= 0x38;
 637	attr |= atom_def_dst[attr >> 3] << 6;
 638	atom_get_dst(ctx, arg, attr, ptr, &saved, 0);
 639	SDEBUG("   dst: ");
 640	atom_put_dst(ctx, arg, attr, &dptr, 0, saved);
 641}
 642
 643static void atom_op_compare(atom_exec_context *ctx, int *ptr, int arg)
 644{
 645	uint8_t attr = U8((*ptr)++);
 646	uint32_t dst, src;
 647	SDEBUG("   src1: ");
 648	dst = atom_get_dst(ctx, arg, attr, ptr, NULL, 1);
 649	SDEBUG("   src2: ");
 650	src = atom_get_src(ctx, attr, ptr);
 651	ctx->ctx->cs_equal = (dst == src);
 652	ctx->ctx->cs_above = (dst > src);
 653	SDEBUG("   result: %s %s\n", ctx->ctx->cs_equal ? "EQ" : "NE",
 654	       ctx->ctx->cs_above ? "GT" : "LE");
 655}
 656
 657static void atom_op_delay(atom_exec_context *ctx, int *ptr, int arg)
 658{
 659	unsigned count = U8((*ptr)++);
 660	SDEBUG("   count: %d\n", count);
 661	if (arg == ATOM_UNIT_MICROSEC)
 662		udelay(count);
 663	else if (!drm_can_sleep())
 664		mdelay(count);
 665	else
 666		msleep(count);
 667}
 668
 669static void atom_op_div(atom_exec_context *ctx, int *ptr, int arg)
 670{
 671	uint8_t attr = U8((*ptr)++);
 672	uint32_t dst, src;
 673	SDEBUG("   src1: ");
 674	dst = atom_get_dst(ctx, arg, attr, ptr, NULL, 1);
 675	SDEBUG("   src2: ");
 676	src = atom_get_src(ctx, attr, ptr);
 677	if (src != 0) {
 678		ctx->ctx->divmul[0] = dst / src;
 679		ctx->ctx->divmul[1] = dst % src;
 680	} else {
 681		ctx->ctx->divmul[0] = 0;
 682		ctx->ctx->divmul[1] = 0;
 683	}
 684}
 685
 686static void atom_op_div32(atom_exec_context *ctx, int *ptr, int arg)
 687{
 688	uint64_t val64;
 689	uint8_t attr = U8((*ptr)++);
 690	uint32_t dst, src;
 691	SDEBUG("   src1: ");
 692	dst = atom_get_dst(ctx, arg, attr, ptr, NULL, 1);
 693	SDEBUG("   src2: ");
 694	src = atom_get_src(ctx, attr, ptr);
 695	if (src != 0) {
 696		val64 = dst;
 697		val64 |= ((uint64_t)ctx->ctx->divmul[1]) << 32;
 698		do_div(val64, src);
 699		ctx->ctx->divmul[0] = lower_32_bits(val64);
 700		ctx->ctx->divmul[1] = upper_32_bits(val64);
 701	} else {
 702		ctx->ctx->divmul[0] = 0;
 703		ctx->ctx->divmul[1] = 0;
 704	}
 705}
 706
 707static void atom_op_eot(atom_exec_context *ctx, int *ptr, int arg)
 708{
 709	/* functionally, a nop */
 710}
 711
 712static void atom_op_jump(atom_exec_context *ctx, int *ptr, int arg)
 713{
 714	int execute = 0, target = U16(*ptr);
 715	unsigned long cjiffies;
 716
 717	(*ptr) += 2;
 718	switch (arg) {
 719	case ATOM_COND_ABOVE:
 720		execute = ctx->ctx->cs_above;
 721		break;
 722	case ATOM_COND_ABOVEOREQUAL:
 723		execute = ctx->ctx->cs_above || ctx->ctx->cs_equal;
 724		break;
 725	case ATOM_COND_ALWAYS:
 726		execute = 1;
 727		break;
 728	case ATOM_COND_BELOW:
 729		execute = !(ctx->ctx->cs_above || ctx->ctx->cs_equal);
 730		break;
 731	case ATOM_COND_BELOWOREQUAL:
 732		execute = !ctx->ctx->cs_above;
 733		break;
 734	case ATOM_COND_EQUAL:
 735		execute = ctx->ctx->cs_equal;
 736		break;
 737	case ATOM_COND_NOTEQUAL:
 738		execute = !ctx->ctx->cs_equal;
 739		break;
 740	}
 741	if (arg != ATOM_COND_ALWAYS)
 742		SDEBUG("   taken: %s\n", execute ? "yes" : "no");
 743	SDEBUG("   target: 0x%04X\n", target);
 744	if (execute) {
 745		if (ctx->last_jump == (ctx->start + target)) {
 746			cjiffies = jiffies;
 747			if (time_after(cjiffies, ctx->last_jump_jiffies)) {
 748				cjiffies -= ctx->last_jump_jiffies;
 749				if ((jiffies_to_msecs(cjiffies) > ATOM_CMD_TIMEOUT_SEC*1000)) {
 750					DRM_ERROR("atombios stuck in loop for more than %dsecs aborting\n",
 751						  ATOM_CMD_TIMEOUT_SEC);
 752					ctx->abort = true;
 753				}
 754			} else {
 755				/* jiffies wrap around we will just wait a little longer */
 756				ctx->last_jump_jiffies = jiffies;
 757			}
 758		} else {
 759			ctx->last_jump = ctx->start + target;
 760			ctx->last_jump_jiffies = jiffies;
 761		}
 762		*ptr = ctx->start + target;
 763	}
 764}
 765
 766static void atom_op_mask(atom_exec_context *ctx, int *ptr, int arg)
 767{
 768	uint8_t attr = U8((*ptr)++);
 769	uint32_t dst, mask, src, saved;
 770	int dptr = *ptr;
 771	SDEBUG("   dst: ");
 772	dst = atom_get_dst(ctx, arg, attr, ptr, &saved, 1);
 773	mask = atom_get_src_direct(ctx, ((attr >> 3) & 7), ptr);
 774	SDEBUG("   mask: 0x%08x", mask);
 775	SDEBUG("   src: ");
 776	src = atom_get_src(ctx, attr, ptr);
 777	dst &= mask;
 778	dst |= src;
 779	SDEBUG("   dst: ");
 780	atom_put_dst(ctx, arg, attr, &dptr, dst, saved);
 781}
 782
 783static void atom_op_move(atom_exec_context *ctx, int *ptr, int arg)
 784{
 785	uint8_t attr = U8((*ptr)++);
 786	uint32_t src, saved;
 787	int dptr = *ptr;
 788	if (((attr >> 3) & 7) != ATOM_SRC_DWORD)
 789		atom_get_dst(ctx, arg, attr, ptr, &saved, 0);
 790	else {
 791		atom_skip_dst(ctx, arg, attr, ptr);
 792		saved = 0xCDCDCDCD;
 793	}
 794	SDEBUG("   src: ");
 795	src = atom_get_src(ctx, attr, ptr);
 796	SDEBUG("   dst: ");
 797	atom_put_dst(ctx, arg, attr, &dptr, src, saved);
 798}
 799
 800static void atom_op_mul(atom_exec_context *ctx, int *ptr, int arg)
 801{
 802	uint8_t attr = U8((*ptr)++);
 803	uint32_t dst, src;
 804	SDEBUG("   src1: ");
 805	dst = atom_get_dst(ctx, arg, attr, ptr, NULL, 1);
 806	SDEBUG("   src2: ");
 807	src = atom_get_src(ctx, attr, ptr);
 808	ctx->ctx->divmul[0] = dst * src;
 809}
 810
 811static void atom_op_mul32(atom_exec_context *ctx, int *ptr, int arg)
 812{
 813	uint64_t val64;
 814	uint8_t attr = U8((*ptr)++);
 815	uint32_t dst, src;
 816	SDEBUG("   src1: ");
 817	dst = atom_get_dst(ctx, arg, attr, ptr, NULL, 1);
 818	SDEBUG("   src2: ");
 819	src = atom_get_src(ctx, attr, ptr);
 820	val64 = (uint64_t)dst * (uint64_t)src;
 821	ctx->ctx->divmul[0] = lower_32_bits(val64);
 822	ctx->ctx->divmul[1] = upper_32_bits(val64);
 823}
 824
 825static void atom_op_nop(atom_exec_context *ctx, int *ptr, int arg)
 826{
 827	/* nothing */
 828}
 829
 830static void atom_op_or(atom_exec_context *ctx, int *ptr, int arg)
 831{
 832	uint8_t attr = U8((*ptr)++);
 833	uint32_t dst, src, saved;
 834	int dptr = *ptr;
 835	SDEBUG("   dst: ");
 836	dst = atom_get_dst(ctx, arg, attr, ptr, &saved, 1);
 837	SDEBUG("   src: ");
 838	src = atom_get_src(ctx, attr, ptr);
 839	dst |= src;
 840	SDEBUG("   dst: ");
 841	atom_put_dst(ctx, arg, attr, &dptr, dst, saved);
 842}
 843
 844static void atom_op_postcard(atom_exec_context *ctx, int *ptr, int arg)
 845{
 846	uint8_t val = U8((*ptr)++);
 847	SDEBUG("POST card output: 0x%02X\n", val);
 848}
 849
 850static void atom_op_repeat(atom_exec_context *ctx, int *ptr, int arg)
 851{
 852	pr_info("unimplemented!\n");
 853}
 854
 855static void atom_op_restorereg(atom_exec_context *ctx, int *ptr, int arg)
 856{
 857	pr_info("unimplemented!\n");
 858}
 859
 860static void atom_op_savereg(atom_exec_context *ctx, int *ptr, int arg)
 861{
 862	pr_info("unimplemented!\n");
 863}
 864
 865static void atom_op_setdatablock(atom_exec_context *ctx, int *ptr, int arg)
 866{
 867	int idx = U8(*ptr);
 868	(*ptr)++;
 869	SDEBUG("   block: %d\n", idx);
 870	if (!idx)
 871		ctx->ctx->data_block = 0;
 872	else if (idx == 255)
 873		ctx->ctx->data_block = ctx->start;
 874	else
 875		ctx->ctx->data_block = U16(ctx->ctx->data_table + 4 + 2 * idx);
 876	SDEBUG("   base: 0x%04X\n", ctx->ctx->data_block);
 877}
 878
 879static void atom_op_setfbbase(atom_exec_context *ctx, int *ptr, int arg)
 880{
 881	uint8_t attr = U8((*ptr)++);
 882	SDEBUG("   fb_base: ");
 883	ctx->ctx->fb_base = atom_get_src(ctx, attr, ptr);
 884}
 885
 886static void atom_op_setport(atom_exec_context *ctx, int *ptr, int arg)
 887{
 888	int port;
 889	switch (arg) {
 890	case ATOM_PORT_ATI:
 891		port = U16(*ptr);
 892		if (port < ATOM_IO_NAMES_CNT)
 893			SDEBUG("   port: %d (%s)\n", port, atom_io_names[port]);
 894		else
 895			SDEBUG("   port: %d\n", port);
 896		if (!port)
 897			ctx->ctx->io_mode = ATOM_IO_MM;
 898		else
 899			ctx->ctx->io_mode = ATOM_IO_IIO | port;
 900		(*ptr) += 2;
 901		break;
 902	case ATOM_PORT_PCI:
 903		ctx->ctx->io_mode = ATOM_IO_PCI;
 904		(*ptr)++;
 905		break;
 906	case ATOM_PORT_SYSIO:
 907		ctx->ctx->io_mode = ATOM_IO_SYSIO;
 908		(*ptr)++;
 909		break;
 910	}
 911}
 912
 913static void atom_op_setregblock(atom_exec_context *ctx, int *ptr, int arg)
 914{
 915	ctx->ctx->reg_block = U16(*ptr);
 916	(*ptr) += 2;
 917	SDEBUG("   base: 0x%04X\n", ctx->ctx->reg_block);
 918}
 919
 920static void atom_op_shift_left(atom_exec_context *ctx, int *ptr, int arg)
 921{
 922	uint8_t attr = U8((*ptr)++), shift;
 923	uint32_t saved, dst;
 924	int dptr = *ptr;
 925	attr &= 0x38;
 926	attr |= atom_def_dst[attr >> 3] << 6;
 927	SDEBUG("   dst: ");
 928	dst = atom_get_dst(ctx, arg, attr, ptr, &saved, 1);
 929	shift = atom_get_src_direct(ctx, ATOM_SRC_BYTE0, ptr);
 930	SDEBUG("   shift: %d\n", shift);
 931	dst <<= shift;
 932	SDEBUG("   dst: ");
 933	atom_put_dst(ctx, arg, attr, &dptr, dst, saved);
 934}
 935
 936static void atom_op_shift_right(atom_exec_context *ctx, int *ptr, int arg)
 937{
 938	uint8_t attr = U8((*ptr)++), shift;
 939	uint32_t saved, dst;
 940	int dptr = *ptr;
 941	attr &= 0x38;
 942	attr |= atom_def_dst[attr >> 3] << 6;
 943	SDEBUG("   dst: ");
 944	dst = atom_get_dst(ctx, arg, attr, ptr, &saved, 1);
 945	shift = atom_get_src_direct(ctx, ATOM_SRC_BYTE0, ptr);
 946	SDEBUG("   shift: %d\n", shift);
 947	dst >>= shift;
 948	SDEBUG("   dst: ");
 949	atom_put_dst(ctx, arg, attr, &dptr, dst, saved);
 950}
 951
 952static void atom_op_shl(atom_exec_context *ctx, int *ptr, int arg)
 953{
 954	uint8_t attr = U8((*ptr)++), shift;
 955	uint32_t saved, dst;
 956	int dptr = *ptr;
 957	uint32_t dst_align = atom_dst_to_src[(attr >> 3) & 7][(attr >> 6) & 3];
 958	SDEBUG("   dst: ");
 959	dst = atom_get_dst(ctx, arg, attr, ptr, &saved, 1);
 960	/* op needs to full dst value */
 961	dst = saved;
 962	shift = atom_get_src(ctx, attr, ptr);
 963	SDEBUG("   shift: %d\n", shift);
 964	dst <<= shift;
 965	dst &= atom_arg_mask[dst_align];
 966	dst >>= atom_arg_shift[dst_align];
 967	SDEBUG("   dst: ");
 968	atom_put_dst(ctx, arg, attr, &dptr, dst, saved);
 969}
 970
 971static void atom_op_shr(atom_exec_context *ctx, int *ptr, int arg)
 972{
 973	uint8_t attr = U8((*ptr)++), shift;
 974	uint32_t saved, dst;
 975	int dptr = *ptr;
 976	uint32_t dst_align = atom_dst_to_src[(attr >> 3) & 7][(attr >> 6) & 3];
 977	SDEBUG("   dst: ");
 978	dst = atom_get_dst(ctx, arg, attr, ptr, &saved, 1);
 979	/* op needs to full dst value */
 980	dst = saved;
 981	shift = atom_get_src(ctx, attr, ptr);
 982	SDEBUG("   shift: %d\n", shift);
 983	dst >>= shift;
 984	dst &= atom_arg_mask[dst_align];
 985	dst >>= atom_arg_shift[dst_align];
 986	SDEBUG("   dst: ");
 987	atom_put_dst(ctx, arg, attr, &dptr, dst, saved);
 988}
 989
 990static void atom_op_sub(atom_exec_context *ctx, int *ptr, int arg)
 991{
 992	uint8_t attr = U8((*ptr)++);
 993	uint32_t dst, src, saved;
 994	int dptr = *ptr;
 995	SDEBUG("   dst: ");
 996	dst = atom_get_dst(ctx, arg, attr, ptr, &saved, 1);
 997	SDEBUG("   src: ");
 998	src = atom_get_src(ctx, attr, ptr);
 999	dst -= src;
1000	SDEBUG("   dst: ");
1001	atom_put_dst(ctx, arg, attr, &dptr, dst, saved);
1002}
1003
1004static void atom_op_switch(atom_exec_context *ctx, int *ptr, int arg)
1005{
1006	uint8_t attr = U8((*ptr)++);
1007	uint32_t src, val, target;
1008	SDEBUG("   switch: ");
1009	src = atom_get_src(ctx, attr, ptr);
1010	while (U16(*ptr) != ATOM_CASE_END)
1011		if (U8(*ptr) == ATOM_CASE_MAGIC) {
1012			(*ptr)++;
1013			SDEBUG("   case: ");
1014			val =
1015			    atom_get_src(ctx, (attr & 0x38) | ATOM_ARG_IMM,
1016					 ptr);
1017			target = U16(*ptr);
1018			if (val == src) {
1019				SDEBUG("   target: %04X\n", target);
1020				*ptr = ctx->start + target;
1021				return;
1022			}
1023			(*ptr) += 2;
1024		} else {
1025			pr_info("Bad case\n");
1026			return;
1027		}
1028	(*ptr) += 2;
1029}
1030
1031static void atom_op_test(atom_exec_context *ctx, int *ptr, int arg)
1032{
1033	uint8_t attr = U8((*ptr)++);
1034	uint32_t dst, src;
1035	SDEBUG("   src1: ");
1036	dst = atom_get_dst(ctx, arg, attr, ptr, NULL, 1);
1037	SDEBUG("   src2: ");
1038	src = atom_get_src(ctx, attr, ptr);
1039	ctx->ctx->cs_equal = ((dst & src) == 0);
1040	SDEBUG("   result: %s\n", ctx->ctx->cs_equal ? "EQ" : "NE");
1041}
1042
1043static void atom_op_xor(atom_exec_context *ctx, int *ptr, int arg)
1044{
1045	uint8_t attr = U8((*ptr)++);
1046	uint32_t dst, src, saved;
1047	int dptr = *ptr;
1048	SDEBUG("   dst: ");
1049	dst = atom_get_dst(ctx, arg, attr, ptr, &saved, 1);
1050	SDEBUG("   src: ");
1051	src = atom_get_src(ctx, attr, ptr);
1052	dst ^= src;
1053	SDEBUG("   dst: ");
1054	atom_put_dst(ctx, arg, attr, &dptr, dst, saved);
1055}
1056
1057static void atom_op_debug(atom_exec_context *ctx, int *ptr, int arg)
1058{
1059	uint8_t val = U8((*ptr)++);
1060	SDEBUG("DEBUG output: 0x%02X\n", val);
1061}
1062
1063static void atom_op_processds(atom_exec_context *ctx, int *ptr, int arg)
1064{
1065	uint16_t val = U16(*ptr);
1066	(*ptr) += val + 2;
1067	SDEBUG("PROCESSDS output: 0x%02X\n", val);
1068}
1069
1070static struct {
1071	void (*func) (atom_exec_context *, int *, int);
1072	int arg;
1073} opcode_table[ATOM_OP_CNT] = {
1074	{
1075	NULL, 0}, {
1076	atom_op_move, ATOM_ARG_REG}, {
1077	atom_op_move, ATOM_ARG_PS}, {
1078	atom_op_move, ATOM_ARG_WS}, {
1079	atom_op_move, ATOM_ARG_FB}, {
1080	atom_op_move, ATOM_ARG_PLL}, {
1081	atom_op_move, ATOM_ARG_MC}, {
1082	atom_op_and, ATOM_ARG_REG}, {
1083	atom_op_and, ATOM_ARG_PS}, {
1084	atom_op_and, ATOM_ARG_WS}, {
1085	atom_op_and, ATOM_ARG_FB}, {
1086	atom_op_and, ATOM_ARG_PLL}, {
1087	atom_op_and, ATOM_ARG_MC}, {
1088	atom_op_or, ATOM_ARG_REG}, {
1089	atom_op_or, ATOM_ARG_PS}, {
1090	atom_op_or, ATOM_ARG_WS}, {
1091	atom_op_or, ATOM_ARG_FB}, {
1092	atom_op_or, ATOM_ARG_PLL}, {
1093	atom_op_or, ATOM_ARG_MC}, {
1094	atom_op_shift_left, ATOM_ARG_REG}, {
1095	atom_op_shift_left, ATOM_ARG_PS}, {
1096	atom_op_shift_left, ATOM_ARG_WS}, {
1097	atom_op_shift_left, ATOM_ARG_FB}, {
1098	atom_op_shift_left, ATOM_ARG_PLL}, {
1099	atom_op_shift_left, ATOM_ARG_MC}, {
1100	atom_op_shift_right, ATOM_ARG_REG}, {
1101	atom_op_shift_right, ATOM_ARG_PS}, {
1102	atom_op_shift_right, ATOM_ARG_WS}, {
1103	atom_op_shift_right, ATOM_ARG_FB}, {
1104	atom_op_shift_right, ATOM_ARG_PLL}, {
1105	atom_op_shift_right, ATOM_ARG_MC}, {
1106	atom_op_mul, ATOM_ARG_REG}, {
1107	atom_op_mul, ATOM_ARG_PS}, {
1108	atom_op_mul, ATOM_ARG_WS}, {
1109	atom_op_mul, ATOM_ARG_FB}, {
1110	atom_op_mul, ATOM_ARG_PLL}, {
1111	atom_op_mul, ATOM_ARG_MC}, {
1112	atom_op_div, ATOM_ARG_REG}, {
1113	atom_op_div, ATOM_ARG_PS}, {
1114	atom_op_div, ATOM_ARG_WS}, {
1115	atom_op_div, ATOM_ARG_FB}, {
1116	atom_op_div, ATOM_ARG_PLL}, {
1117	atom_op_div, ATOM_ARG_MC}, {
1118	atom_op_add, ATOM_ARG_REG}, {
1119	atom_op_add, ATOM_ARG_PS}, {
1120	atom_op_add, ATOM_ARG_WS}, {
1121	atom_op_add, ATOM_ARG_FB}, {
1122	atom_op_add, ATOM_ARG_PLL}, {
1123	atom_op_add, ATOM_ARG_MC}, {
1124	atom_op_sub, ATOM_ARG_REG}, {
1125	atom_op_sub, ATOM_ARG_PS}, {
1126	atom_op_sub, ATOM_ARG_WS}, {
1127	atom_op_sub, ATOM_ARG_FB}, {
1128	atom_op_sub, ATOM_ARG_PLL}, {
1129	atom_op_sub, ATOM_ARG_MC}, {
1130	atom_op_setport, ATOM_PORT_ATI}, {
1131	atom_op_setport, ATOM_PORT_PCI}, {
1132	atom_op_setport, ATOM_PORT_SYSIO}, {
1133	atom_op_setregblock, 0}, {
1134	atom_op_setfbbase, 0}, {
1135	atom_op_compare, ATOM_ARG_REG}, {
1136	atom_op_compare, ATOM_ARG_PS}, {
1137	atom_op_compare, ATOM_ARG_WS}, {
1138	atom_op_compare, ATOM_ARG_FB}, {
1139	atom_op_compare, ATOM_ARG_PLL}, {
1140	atom_op_compare, ATOM_ARG_MC}, {
1141	atom_op_switch, 0}, {
1142	atom_op_jump, ATOM_COND_ALWAYS}, {
1143	atom_op_jump, ATOM_COND_EQUAL}, {
1144	atom_op_jump, ATOM_COND_BELOW}, {
1145	atom_op_jump, ATOM_COND_ABOVE}, {
1146	atom_op_jump, ATOM_COND_BELOWOREQUAL}, {
1147	atom_op_jump, ATOM_COND_ABOVEOREQUAL}, {
1148	atom_op_jump, ATOM_COND_NOTEQUAL}, {
1149	atom_op_test, ATOM_ARG_REG}, {
1150	atom_op_test, ATOM_ARG_PS}, {
1151	atom_op_test, ATOM_ARG_WS}, {
1152	atom_op_test, ATOM_ARG_FB}, {
1153	atom_op_test, ATOM_ARG_PLL}, {
1154	atom_op_test, ATOM_ARG_MC}, {
1155	atom_op_delay, ATOM_UNIT_MILLISEC}, {
1156	atom_op_delay, ATOM_UNIT_MICROSEC}, {
1157	atom_op_calltable, 0}, {
1158	atom_op_repeat, 0}, {
1159	atom_op_clear, ATOM_ARG_REG}, {
1160	atom_op_clear, ATOM_ARG_PS}, {
1161	atom_op_clear, ATOM_ARG_WS}, {
1162	atom_op_clear, ATOM_ARG_FB}, {
1163	atom_op_clear, ATOM_ARG_PLL}, {
1164	atom_op_clear, ATOM_ARG_MC}, {
1165	atom_op_nop, 0}, {
1166	atom_op_eot, 0}, {
1167	atom_op_mask, ATOM_ARG_REG}, {
1168	atom_op_mask, ATOM_ARG_PS}, {
1169	atom_op_mask, ATOM_ARG_WS}, {
1170	atom_op_mask, ATOM_ARG_FB}, {
1171	atom_op_mask, ATOM_ARG_PLL}, {
1172	atom_op_mask, ATOM_ARG_MC}, {
1173	atom_op_postcard, 0}, {
1174	atom_op_beep, 0}, {
1175	atom_op_savereg, 0}, {
1176	atom_op_restorereg, 0}, {
1177	atom_op_setdatablock, 0}, {
1178	atom_op_xor, ATOM_ARG_REG}, {
1179	atom_op_xor, ATOM_ARG_PS}, {
1180	atom_op_xor, ATOM_ARG_WS}, {
1181	atom_op_xor, ATOM_ARG_FB}, {
1182	atom_op_xor, ATOM_ARG_PLL}, {
1183	atom_op_xor, ATOM_ARG_MC}, {
1184	atom_op_shl, ATOM_ARG_REG}, {
1185	atom_op_shl, ATOM_ARG_PS}, {
1186	atom_op_shl, ATOM_ARG_WS}, {
1187	atom_op_shl, ATOM_ARG_FB}, {
1188	atom_op_shl, ATOM_ARG_PLL}, {
1189	atom_op_shl, ATOM_ARG_MC}, {
1190	atom_op_shr, ATOM_ARG_REG}, {
1191	atom_op_shr, ATOM_ARG_PS}, {
1192	atom_op_shr, ATOM_ARG_WS}, {
1193	atom_op_shr, ATOM_ARG_FB}, {
1194	atom_op_shr, ATOM_ARG_PLL}, {
1195	atom_op_shr, ATOM_ARG_MC}, {
1196	atom_op_debug, 0}, {
1197	atom_op_processds, 0}, {
1198	atom_op_mul32, ATOM_ARG_PS}, {
1199	atom_op_mul32, ATOM_ARG_WS}, {
1200	atom_op_div32, ATOM_ARG_PS}, {
1201	atom_op_div32, ATOM_ARG_WS},
1202};
1203
1204static int amdgpu_atom_execute_table_locked(struct atom_context *ctx, int index, uint32_t * params)
1205{
1206	int base = CU16(ctx->cmd_table + 4 + 2 * index);
1207	int len, ws, ps, ptr;
1208	unsigned char op;
1209	atom_exec_context ectx;
1210	int ret = 0;
1211
1212	if (!base)
1213		return -EINVAL;
1214
1215	len = CU16(base + ATOM_CT_SIZE_PTR);
1216	ws = CU8(base + ATOM_CT_WS_PTR);
1217	ps = CU8(base + ATOM_CT_PS_PTR) & ATOM_CT_PS_MASK;
1218	ptr = base + ATOM_CT_CODE_PTR;
1219
1220	SDEBUG(">> execute %04X (len %d, WS %d, PS %d)\n", base, len, ws, ps);
1221
1222	ectx.ctx = ctx;
1223	ectx.ps_shift = ps / 4;
1224	ectx.start = base;
1225	ectx.ps = params;
1226	ectx.abort = false;
1227	ectx.last_jump = 0;
1228	if (ws)
1229		ectx.ws = kcalloc(4, ws, GFP_KERNEL);
1230	else
1231		ectx.ws = NULL;
1232
1233	debug_depth++;
1234	while (1) {
1235		op = CU8(ptr++);
1236		if (op < ATOM_OP_NAMES_CNT)
1237			SDEBUG("%s @ 0x%04X\n", atom_op_names[op], ptr - 1);
1238		else
1239			SDEBUG("[%d] @ 0x%04X\n", op, ptr - 1);
1240		if (ectx.abort) {
1241			DRM_ERROR("atombios stuck executing %04X (len %d, WS %d, PS %d) @ 0x%04X\n",
1242				base, len, ws, ps, ptr - 1);
1243			ret = -EINVAL;
1244			goto free;
1245		}
1246
1247		if (op < ATOM_OP_CNT && op > 0)
1248			opcode_table[op].func(&ectx, &ptr,
1249					      opcode_table[op].arg);
1250		else
1251			break;
1252
1253		if (op == ATOM_OP_EOT)
1254			break;
1255	}
1256	debug_depth--;
1257	SDEBUG("<<\n");
1258
1259free:
1260	if (ws)
1261		kfree(ectx.ws);
1262	return ret;
1263}
1264
1265int amdgpu_atom_execute_table(struct atom_context *ctx, int index, uint32_t * params)
1266{
1267	int r;
1268
1269	mutex_lock(&ctx->mutex);
1270	/* reset data block */
1271	ctx->data_block = 0;
1272	/* reset reg block */
1273	ctx->reg_block = 0;
1274	/* reset fb window */
1275	ctx->fb_base = 0;
1276	/* reset io mode */
1277	ctx->io_mode = ATOM_IO_MM;
1278	/* reset divmul */
1279	ctx->divmul[0] = 0;
1280	ctx->divmul[1] = 0;
1281	r = amdgpu_atom_execute_table_locked(ctx, index, params);
1282	mutex_unlock(&ctx->mutex);
1283	return r;
1284}
1285
1286static int atom_iio_len[] = { 1, 2, 3, 3, 3, 3, 4, 4, 4, 3 };
1287
1288static void atom_index_iio(struct atom_context *ctx, int base)
1289{
1290	ctx->iio = kzalloc(2 * 256, GFP_KERNEL);
1291	if (!ctx->iio)
1292		return;
1293	while (CU8(base) == ATOM_IIO_START) {
1294		ctx->iio[CU8(base + 1)] = base + 2;
1295		base += 2;
1296		while (CU8(base) != ATOM_IIO_END)
1297			base += atom_iio_len[CU8(base)];
1298		base += 3;
1299	}
1300}
1301
1302struct atom_context *amdgpu_atom_parse(struct card_info *card, void *bios)
1303{
1304	int base;
1305	struct atom_context *ctx =
1306	    kzalloc(sizeof(struct atom_context), GFP_KERNEL);
1307	char *str;
1308	u16 idx;
 
1309
1310	if (!ctx)
1311		return NULL;
1312
1313	ctx->card = card;
1314	ctx->bios = bios;
1315
1316	if (CU16(0) != ATOM_BIOS_MAGIC) {
1317		pr_info("Invalid BIOS magic\n");
1318		kfree(ctx);
1319		return NULL;
1320	}
1321	if (strncmp
1322	    (CSTR(ATOM_ATI_MAGIC_PTR), ATOM_ATI_MAGIC,
1323	     strlen(ATOM_ATI_MAGIC))) {
1324		pr_info("Invalid ATI magic\n");
1325		kfree(ctx);
1326		return NULL;
1327	}
1328
1329	base = CU16(ATOM_ROM_TABLE_PTR);
1330	if (strncmp
1331	    (CSTR(base + ATOM_ROM_MAGIC_PTR), ATOM_ROM_MAGIC,
1332	     strlen(ATOM_ROM_MAGIC))) {
1333		pr_info("Invalid ATOM magic\n");
1334		kfree(ctx);
1335		return NULL;
1336	}
1337
1338	ctx->cmd_table = CU16(base + ATOM_ROM_CMD_PTR);
1339	ctx->data_table = CU16(base + ATOM_ROM_DATA_PTR);
1340	atom_index_iio(ctx, CU16(ctx->data_table + ATOM_DATA_IIO_PTR) + 4);
1341	if (!ctx->iio) {
1342		amdgpu_atom_destroy(ctx);
1343		return NULL;
1344	}
1345
1346	idx = CU16(ATOM_ROM_PART_NUMBER_PTR);
1347	if (idx == 0)
1348		idx = 0x80;
1349
1350	str = CSTR(idx);
1351	if (*str != '\0') {
1352		pr_info("ATOM BIOS: %s\n", str);
1353		strlcpy(ctx->vbios_version, str, sizeof(ctx->vbios_version));
 
 
1354	}
1355
1356
1357	return ctx;
1358}
1359
1360int amdgpu_atom_asic_init(struct atom_context *ctx)
1361{
1362	int hwi = CU16(ctx->data_table + ATOM_DATA_FWI_PTR);
1363	uint32_t ps[16];
1364	int ret;
1365
1366	memset(ps, 0, 64);
1367
1368	ps[0] = cpu_to_le32(CU32(hwi + ATOM_FWI_DEFSCLK_PTR));
1369	ps[1] = cpu_to_le32(CU32(hwi + ATOM_FWI_DEFMCLK_PTR));
1370	if (!ps[0] || !ps[1])
1371		return 1;
1372
1373	if (!CU16(ctx->cmd_table + 4 + 2 * ATOM_CMD_INIT))
1374		return 1;
1375	ret = amdgpu_atom_execute_table(ctx, ATOM_CMD_INIT, ps);
1376	if (ret)
1377		return ret;
1378
1379	memset(ps, 0, 64);
1380
1381	return ret;
1382}
1383
1384void amdgpu_atom_destroy(struct atom_context *ctx)
1385{
1386	kfree(ctx->iio);
1387	kfree(ctx);
1388}
1389
1390bool amdgpu_atom_parse_data_header(struct atom_context *ctx, int index,
1391			    uint16_t * size, uint8_t * frev, uint8_t * crev,
1392			    uint16_t * data_start)
1393{
1394	int offset = index * 2 + 4;
1395	int idx = CU16(ctx->data_table + offset);
1396	u16 *mdt = (u16 *)(ctx->bios + ctx->data_table + 4);
1397
1398	if (!mdt[index])
1399		return false;
1400
1401	if (size)
1402		*size = CU16(idx);
1403	if (frev)
1404		*frev = CU8(idx + 2);
1405	if (crev)
1406		*crev = CU8(idx + 3);
1407	*data_start = idx;
1408	return true;
1409}
1410
1411bool amdgpu_atom_parse_cmd_header(struct atom_context *ctx, int index, uint8_t * frev,
1412			   uint8_t * crev)
1413{
1414	int offset = index * 2 + 4;
1415	int idx = CU16(ctx->cmd_table + offset);
1416	u16 *mct = (u16 *)(ctx->bios + ctx->cmd_table + 4);
1417
1418	if (!mct[index])
1419		return false;
1420
1421	if (frev)
1422		*frev = CU8(idx + 2);
1423	if (crev)
1424		*crev = CU8(idx + 3);
1425	return true;
1426}
1427