Linux Audio

Check our new training course

Loading...
v6.8
   1// SPDX-License-Identifier: GPL-2.0-only
   2/*
   3 * Intel I/OAT DMA Linux driver
   4 * Copyright(c) 2004 - 2015 Intel Corporation.
 
 
 
 
 
 
 
 
 
 
 
 
 
   5 */
   6
   7#include <linux/init.h>
   8#include <linux/module.h>
   9#include <linux/slab.h>
  10#include <linux/pci.h>
  11#include <linux/interrupt.h>
  12#include <linux/dmaengine.h>
  13#include <linux/delay.h>
  14#include <linux/dma-mapping.h>
  15#include <linux/workqueue.h>
  16#include <linux/prefetch.h>
  17#include <linux/dca.h>
 
  18#include <linux/sizes.h>
  19#include "dma.h"
  20#include "registers.h"
  21#include "hw.h"
  22
  23#include "../dmaengine.h"
  24
/*
 * Module metadata: version string, license and author.
 * NOTE(review): the SPDX tag at the top of this file says GPL-2.0-only while
 * MODULE_LICENSE() below declares "Dual BSD/GPL" - confirm which is intended.
 */
  25MODULE_VERSION(IOAT_DMA_VERSION);
  26MODULE_LICENSE("Dual BSD/GPL");
  27MODULE_AUTHOR("Intel Corporation");
  28
  29static const struct pci_device_id ioat_pci_tbl[] = {
	/*
	 * PCI device IDs listed for this driver.  Every entry is built with
	 * PCI_VDEVICE(INTEL, ...), entries are grouped by the I/OAT hardware
	 * version named in the section comments, and the list ends with a
	 * zeroed terminator entry.  The table is published with
	 * MODULE_DEVICE_TABLE(pci, ...) right after its definition.
	 */
  30	/* I/OAT v3 platforms */
  31	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_TBG0) },
  32	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_TBG1) },
  33	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_TBG2) },
  34	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_TBG3) },
  35	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_TBG4) },
  36	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_TBG5) },
  37	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_TBG6) },
  38	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_TBG7) },
  39
  40	/* I/OAT v3.2 platforms */
  41	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_JSF0) },
  42	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_JSF1) },
  43	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_JSF2) },
  44	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_JSF3) },
  45	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_JSF4) },
  46	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_JSF5) },
  47	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_JSF6) },
  48	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_JSF7) },
  49	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_JSF8) },
  50	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_JSF9) },
  51
  52	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_SNB0) },
  53	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_SNB1) },
  54	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_SNB2) },
  55	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_SNB3) },
  56	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_SNB4) },
  57	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_SNB5) },
  58	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_SNB6) },
  59	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_SNB7) },
  60	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_SNB8) },
  61	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_SNB9) },
  62
  63	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_IVB0) },
  64	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_IVB1) },
  65	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_IVB2) },
  66	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_IVB3) },
  67	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_IVB4) },
  68	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_IVB5) },
  69	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_IVB6) },
  70	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_IVB7) },
  71	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_IVB8) },
  72	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_IVB9) },
  73
  74	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_HSW0) },
  75	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_HSW1) },
  76	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_HSW2) },
  77	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_HSW3) },
  78	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_HSW4) },
  79	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_HSW5) },
  80	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_HSW6) },
  81	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_HSW7) },
  82	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_HSW8) },
  83	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_HSW9) },
  84
  85	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_BDX0) },
  86	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_BDX1) },
  87	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_BDX2) },
  88	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_BDX3) },
  89	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_BDX4) },
  90	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_BDX5) },
  91	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_BDX6) },
  92	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_BDX7) },
  93	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_BDX8) },
  94	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_BDX9) },
  95
  96	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_SKX) },
  97
  98	/* I/OAT v3.3 platforms */
  99	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_BWD0) },
 100	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_BWD1) },
 101	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_BWD2) },
 102	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_BWD3) },
 103
 104	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_BDXDE0) },
 105	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_BDXDE1) },
 106	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_BDXDE2) },
 107	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_BDXDE3) },
 108
 109	/* I/OAT v3.4 platforms */
 110	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_ICX) },
 111
 112	{ 0, }
 113};
 114MODULE_DEVICE_TABLE(pci, ioat_pci_tbl);
 115
/*
 * Forward declarations, so these functions can be referenced ahead of their
 * definitions.  ioat_init_channel(), ioat_enumerate_channels(),
 * ioat3_dma_self_test() and ioat_intr_quirk() are defined further down in
 * this file.
 */
 116static int ioat_pci_probe(struct pci_dev *pdev, const struct pci_device_id *id);
 117static void ioat_remove(struct pci_dev *pdev);
 118static void
 119ioat_init_channel(struct ioatdma_device *ioat_dma,
 120		  struct ioatdma_chan *ioat_chan, int idx);
 121static void ioat_intr_quirk(struct ioatdma_device *ioat_dma);
 122static void ioat_enumerate_channels(struct ioatdma_device *ioat_dma);
 123static int ioat3_dma_self_test(struct ioatdma_device *ioat_dma);
 124
/* Module parameter (mode 0644): DCA service support switch, default 1. */
 125static int ioat_dca_enabled = 1;
 126module_param(ioat_dca_enabled, int, 0644);
 127MODULE_PARM_DESC(ioat_dca_enabled, "control support of dca service (default: 1)");
/*
 * Module parameter (mode 0644): descriptor push high-water mark, default 7.
 * Not static, so it has external linkage.
 */
 128int ioat_pending_level = 7;
 129module_param(ioat_pending_level, int, 0644);
 130MODULE_PARM_DESC(ioat_pending_level,
 131		 "high-water mark for pushing ioat descriptors (default: 7)");
/*
 * Module parameter (mode 0644): preferred interrupt style as a string.
 * ioat_dma_setup_interrupts() compares it against "msix", "msi" and "intx".
 */
 132static char ioat_interrupt_style[32] = "msix";
 133module_param_string(ioat_interrupt_style, ioat_interrupt_style,
 134		    sizeof(ioat_interrupt_style), 0644);
 135MODULE_PARM_DESC(ioat_interrupt_style,
 136		 "set ioat interrupt style: msix (default), msi, intx");
 137
/*
 * Slab cache handles with external linkage.
 * NOTE(review): they are neither created nor used in the part of the file
 * visible here - confirm where they are set up and torn down.
 */
 138struct kmem_cache *ioat_cache;
 139struct kmem_cache *ioat_sed_cache;
 140
 141static bool is_jf_ioat(struct pci_dev *pdev)
 142{
 143	switch (pdev->device) {
 144	case PCI_DEVICE_ID_INTEL_IOAT_JSF0:
 145	case PCI_DEVICE_ID_INTEL_IOAT_JSF1:
 146	case PCI_DEVICE_ID_INTEL_IOAT_JSF2:
 147	case PCI_DEVICE_ID_INTEL_IOAT_JSF3:
 148	case PCI_DEVICE_ID_INTEL_IOAT_JSF4:
 149	case PCI_DEVICE_ID_INTEL_IOAT_JSF5:
 150	case PCI_DEVICE_ID_INTEL_IOAT_JSF6:
 151	case PCI_DEVICE_ID_INTEL_IOAT_JSF7:
 152	case PCI_DEVICE_ID_INTEL_IOAT_JSF8:
 153	case PCI_DEVICE_ID_INTEL_IOAT_JSF9:
 154		return true;
 155	default:
 156		return false;
 157	}
 158}
 159
 160static bool is_snb_ioat(struct pci_dev *pdev)
 161{
 162	switch (pdev->device) {
 163	case PCI_DEVICE_ID_INTEL_IOAT_SNB0:
 164	case PCI_DEVICE_ID_INTEL_IOAT_SNB1:
 165	case PCI_DEVICE_ID_INTEL_IOAT_SNB2:
 166	case PCI_DEVICE_ID_INTEL_IOAT_SNB3:
 167	case PCI_DEVICE_ID_INTEL_IOAT_SNB4:
 168	case PCI_DEVICE_ID_INTEL_IOAT_SNB5:
 169	case PCI_DEVICE_ID_INTEL_IOAT_SNB6:
 170	case PCI_DEVICE_ID_INTEL_IOAT_SNB7:
 171	case PCI_DEVICE_ID_INTEL_IOAT_SNB8:
 172	case PCI_DEVICE_ID_INTEL_IOAT_SNB9:
 173		return true;
 174	default:
 175		return false;
 176	}
 177}
 178
 179static bool is_ivb_ioat(struct pci_dev *pdev)
 180{
 181	switch (pdev->device) {
 182	case PCI_DEVICE_ID_INTEL_IOAT_IVB0:
 183	case PCI_DEVICE_ID_INTEL_IOAT_IVB1:
 184	case PCI_DEVICE_ID_INTEL_IOAT_IVB2:
 185	case PCI_DEVICE_ID_INTEL_IOAT_IVB3:
 186	case PCI_DEVICE_ID_INTEL_IOAT_IVB4:
 187	case PCI_DEVICE_ID_INTEL_IOAT_IVB5:
 188	case PCI_DEVICE_ID_INTEL_IOAT_IVB6:
 189	case PCI_DEVICE_ID_INTEL_IOAT_IVB7:
 190	case PCI_DEVICE_ID_INTEL_IOAT_IVB8:
 191	case PCI_DEVICE_ID_INTEL_IOAT_IVB9:
 192		return true;
 193	default:
 194		return false;
 195	}
 196
 197}
 198
 199static bool is_hsw_ioat(struct pci_dev *pdev)
 200{
 201	switch (pdev->device) {
 202	case PCI_DEVICE_ID_INTEL_IOAT_HSW0:
 203	case PCI_DEVICE_ID_INTEL_IOAT_HSW1:
 204	case PCI_DEVICE_ID_INTEL_IOAT_HSW2:
 205	case PCI_DEVICE_ID_INTEL_IOAT_HSW3:
 206	case PCI_DEVICE_ID_INTEL_IOAT_HSW4:
 207	case PCI_DEVICE_ID_INTEL_IOAT_HSW5:
 208	case PCI_DEVICE_ID_INTEL_IOAT_HSW6:
 209	case PCI_DEVICE_ID_INTEL_IOAT_HSW7:
 210	case PCI_DEVICE_ID_INTEL_IOAT_HSW8:
 211	case PCI_DEVICE_ID_INTEL_IOAT_HSW9:
 212		return true;
 213	default:
 214		return false;
 215	}
 216
 217}
 218
 219static bool is_bdx_ioat(struct pci_dev *pdev)
 220{
 221	switch (pdev->device) {
 222	case PCI_DEVICE_ID_INTEL_IOAT_BDX0:
 223	case PCI_DEVICE_ID_INTEL_IOAT_BDX1:
 224	case PCI_DEVICE_ID_INTEL_IOAT_BDX2:
 225	case PCI_DEVICE_ID_INTEL_IOAT_BDX3:
 226	case PCI_DEVICE_ID_INTEL_IOAT_BDX4:
 227	case PCI_DEVICE_ID_INTEL_IOAT_BDX5:
 228	case PCI_DEVICE_ID_INTEL_IOAT_BDX6:
 229	case PCI_DEVICE_ID_INTEL_IOAT_BDX7:
 230	case PCI_DEVICE_ID_INTEL_IOAT_BDX8:
 231	case PCI_DEVICE_ID_INTEL_IOAT_BDX9:
 232		return true;
 233	default:
 234		return false;
 235	}
 236}
 237
 238static inline bool is_skx_ioat(struct pci_dev *pdev)
 239{
 240	return (pdev->device == PCI_DEVICE_ID_INTEL_IOAT_SKX) ? true : false;
 241}
 242
 243static bool is_xeon_cb32(struct pci_dev *pdev)
 244{
 245	return is_jf_ioat(pdev) || is_snb_ioat(pdev) || is_ivb_ioat(pdev) ||
 246		is_hsw_ioat(pdev) || is_bdx_ioat(pdev) || is_skx_ioat(pdev);
 247}
 248
 249bool is_bwd_ioat(struct pci_dev *pdev)
 250{
 251	switch (pdev->device) {
 252	case PCI_DEVICE_ID_INTEL_IOAT_BWD0:
 253	case PCI_DEVICE_ID_INTEL_IOAT_BWD1:
 254	case PCI_DEVICE_ID_INTEL_IOAT_BWD2:
 255	case PCI_DEVICE_ID_INTEL_IOAT_BWD3:
 256	/* even though not Atom, BDX-DE has same DMA silicon */
 257	case PCI_DEVICE_ID_INTEL_IOAT_BDXDE0:
 258	case PCI_DEVICE_ID_INTEL_IOAT_BDXDE1:
 259	case PCI_DEVICE_ID_INTEL_IOAT_BDXDE2:
 260	case PCI_DEVICE_ID_INTEL_IOAT_BDXDE3:
 261		return true;
 262	default:
 263		return false;
 264	}
 265}
 266
 267static bool is_bwd_noraid(struct pci_dev *pdev)
 268{
 269	switch (pdev->device) {
 270	case PCI_DEVICE_ID_INTEL_IOAT_BWD2:
 271	case PCI_DEVICE_ID_INTEL_IOAT_BWD3:
 272	case PCI_DEVICE_ID_INTEL_IOAT_BDXDE0:
 273	case PCI_DEVICE_ID_INTEL_IOAT_BDXDE1:
 274	case PCI_DEVICE_ID_INTEL_IOAT_BDXDE2:
 275	case PCI_DEVICE_ID_INTEL_IOAT_BDXDE3:
 276		return true;
 277	default:
 278		return false;
 279	}
 280
 281}
 282
 283/*
 * Number of bytes copied by the memcpy self-test, which performs an IOAT
 * transaction to verify that the hardware works.
 */
 286#define IOAT_TEST_SIZE 2000
 287
 288static void ioat_dma_test_callback(void *dma_async_param)
 289{
 290	struct completion *cmp = dma_async_param;
 291
 292	complete(cmp);
 293}
 294
 295/**
 296 * ioat_dma_self_test - Perform a IOAT transaction to verify the HW works.
 297 * @ioat_dma: dma device to be tested
 298 */
 299static int ioat_dma_self_test(struct ioatdma_device *ioat_dma)
 300{
 301	int i;
 302	u8 *src;
 303	u8 *dest;
 304	struct dma_device *dma = &ioat_dma->dma_dev;
 305	struct device *dev = &ioat_dma->pdev->dev;
 306	struct dma_chan *dma_chan;
 307	struct dma_async_tx_descriptor *tx;
 308	dma_addr_t dma_dest, dma_src;
 309	dma_cookie_t cookie;
 310	int err = 0;
 311	struct completion cmp;
 312	unsigned long tmo;
 313	unsigned long flags;
 314
 315	src = kzalloc(IOAT_TEST_SIZE, GFP_KERNEL);
 316	if (!src)
 317		return -ENOMEM;
 318	dest = kzalloc(IOAT_TEST_SIZE, GFP_KERNEL);
 319	if (!dest) {
 320		kfree(src);
 321		return -ENOMEM;
 322	}
 323
 324	/* Fill in src buffer */
 325	for (i = 0; i < IOAT_TEST_SIZE; i++)
 326		src[i] = (u8)i;
 327
 328	/* Start copy, using first DMA channel */
 329	dma_chan = container_of(dma->channels.next, struct dma_chan,
 330				device_node);
 331	if (dma->device_alloc_chan_resources(dma_chan) < 1) {
 332		dev_err(dev, "selftest cannot allocate chan resource\n");
 333		err = -ENODEV;
 334		goto out;
 335	}
 336
 337	dma_src = dma_map_single(dev, src, IOAT_TEST_SIZE, DMA_TO_DEVICE);
 338	if (dma_mapping_error(dev, dma_src)) {
 339		dev_err(dev, "mapping src buffer failed\n");
 340		err = -ENOMEM;
 341		goto free_resources;
 342	}
 343	dma_dest = dma_map_single(dev, dest, IOAT_TEST_SIZE, DMA_FROM_DEVICE);
 344	if (dma_mapping_error(dev, dma_dest)) {
 345		dev_err(dev, "mapping dest buffer failed\n");
 346		err = -ENOMEM;
 347		goto unmap_src;
 348	}
 349	flags = DMA_PREP_INTERRUPT;
 350	tx = ioat_dma->dma_dev.device_prep_dma_memcpy(dma_chan, dma_dest,
 351						      dma_src, IOAT_TEST_SIZE,
 352						      flags);
 353	if (!tx) {
 354		dev_err(dev, "Self-test prep failed, disabling\n");
 355		err = -ENODEV;
 356		goto unmap_dma;
 357	}
 358
 359	async_tx_ack(tx);
 360	init_completion(&cmp);
 361	tx->callback = ioat_dma_test_callback;
 362	tx->callback_param = &cmp;
 363	cookie = tx->tx_submit(tx);
 364	if (cookie < 0) {
 365		dev_err(dev, "Self-test setup failed, disabling\n");
 366		err = -ENODEV;
 367		goto unmap_dma;
 368	}
 369	dma->device_issue_pending(dma_chan);
 370
 371	tmo = wait_for_completion_timeout(&cmp, msecs_to_jiffies(3000));
 372
 373	if (tmo == 0 ||
 374	    dma->device_tx_status(dma_chan, cookie, NULL)
 375					!= DMA_COMPLETE) {
 376		dev_err(dev, "Self-test copy timed out, disabling\n");
 377		err = -ENODEV;
 378		goto unmap_dma;
 379	}
 380	if (memcmp(src, dest, IOAT_TEST_SIZE)) {
 381		dev_err(dev, "Self-test copy failed compare, disabling\n");
 382		err = -ENODEV;
 383		goto unmap_dma;
 384	}
 385
 386unmap_dma:
 387	dma_unmap_single(dev, dma_dest, IOAT_TEST_SIZE, DMA_FROM_DEVICE);
 388unmap_src:
 389	dma_unmap_single(dev, dma_src, IOAT_TEST_SIZE, DMA_TO_DEVICE);
 390free_resources:
 391	dma->device_free_chan_resources(dma_chan);
 392out:
 393	kfree(src);
 394	kfree(dest);
 395	return err;
 396}
 397
 398/**
 399 * ioat_dma_setup_interrupts - setup interrupt handler
 400 * @ioat_dma: ioat dma device
 401 */
 402int ioat_dma_setup_interrupts(struct ioatdma_device *ioat_dma)
 403{
 404	struct ioatdma_chan *ioat_chan;
 405	struct pci_dev *pdev = ioat_dma->pdev;
 406	struct device *dev = &pdev->dev;
 407	struct msix_entry *msix;
 408	int i, j, msixcnt;
 409	int err = -EINVAL;
 410	u8 intrctrl = 0;
 411
 412	if (!strcmp(ioat_interrupt_style, "msix"))
 413		goto msix;
 414	if (!strcmp(ioat_interrupt_style, "msi"))
 415		goto msi;
 416	if (!strcmp(ioat_interrupt_style, "intx"))
 417		goto intx;
 418	dev_err(dev, "invalid ioat_interrupt_style %s\n", ioat_interrupt_style);
 419	goto err_no_irq;
 420
 421msix:
 422	/* The number of MSI-X vectors should equal the number of channels */
 423	msixcnt = ioat_dma->chancnt;
 424	for (i = 0; i < msixcnt; i++)
 425		ioat_dma->msix_entries[i].entry = i;
 426
 427	err = pci_enable_msix_exact(pdev, ioat_dma->msix_entries, msixcnt);
 428	if (err)
 429		goto msi;
 430
 431	for (i = 0; i < msixcnt; i++) {
 432		msix = &ioat_dma->msix_entries[i];
 433		ioat_chan = ioat_chan_by_index(ioat_dma, i);
 434		err = devm_request_irq(dev, msix->vector,
 435				       ioat_dma_do_interrupt_msix, 0,
 436				       "ioat-msix", ioat_chan);
 437		if (err) {
 438			for (j = 0; j < i; j++) {
 439				msix = &ioat_dma->msix_entries[j];
 440				ioat_chan = ioat_chan_by_index(ioat_dma, j);
 441				devm_free_irq(dev, msix->vector, ioat_chan);
 442			}
 443			goto msi;
 444		}
 445	}
 446	intrctrl |= IOAT_INTRCTRL_MSIX_VECTOR_CONTROL;
 447	ioat_dma->irq_mode = IOAT_MSIX;
 448	goto done;
 449
 450msi:
 451	err = pci_enable_msi(pdev);
 452	if (err)
 453		goto intx;
 454
 455	err = devm_request_irq(dev, pdev->irq, ioat_dma_do_interrupt, 0,
 456			       "ioat-msi", ioat_dma);
 457	if (err) {
 458		pci_disable_msi(pdev);
 459		goto intx;
 460	}
 461	ioat_dma->irq_mode = IOAT_MSI;
 462	goto done;
 463
 464intx:
 465	err = devm_request_irq(dev, pdev->irq, ioat_dma_do_interrupt,
 466			       IRQF_SHARED, "ioat-intx", ioat_dma);
 467	if (err)
 468		goto err_no_irq;
 469
 470	ioat_dma->irq_mode = IOAT_INTX;
 471done:
 472	if (is_bwd_ioat(pdev))
 473		ioat_intr_quirk(ioat_dma);
 474	intrctrl |= IOAT_INTRCTRL_MASTER_INT_EN;
 475	writeb(intrctrl, ioat_dma->reg_base + IOAT_INTRCTRL_OFFSET);
 476	return 0;
 477
 478err_no_irq:
 479	/* Disable all interrupt generation */
 480	writeb(0, ioat_dma->reg_base + IOAT_INTRCTRL_OFFSET);
 481	ioat_dma->irq_mode = IOAT_NOIRQ;
 482	dev_err(dev, "no usable interrupts\n");
 483	return err;
 484}
 485
 486static void ioat_disable_interrupts(struct ioatdma_device *ioat_dma)
 487{
 488	/* Disable all interrupt generation */
 489	writeb(0, ioat_dma->reg_base + IOAT_INTRCTRL_OFFSET);
 490}
 491
 492static int ioat_probe(struct ioatdma_device *ioat_dma)
 493{
 494	int err = -ENODEV;
 495	struct dma_device *dma = &ioat_dma->dma_dev;
 496	struct pci_dev *pdev = ioat_dma->pdev;
 497	struct device *dev = &pdev->dev;
 498
 499	ioat_dma->completion_pool = dma_pool_create("completion_pool", dev,
 500						    sizeof(u64),
 501						    SMP_CACHE_BYTES,
 502						    SMP_CACHE_BYTES);
 503
 504	if (!ioat_dma->completion_pool) {
 505		err = -ENOMEM;
 506		goto err_out;
 507	}
 508
 509	ioat_enumerate_channels(ioat_dma);
 510
 511	dma_cap_set(DMA_MEMCPY, dma->cap_mask);
 512	dma->dev = &pdev->dev;
 513
 514	if (!ioat_dma->chancnt) {
 515		dev_err(dev, "channel enumeration error\n");
 516		goto err_setup_interrupts;
 517	}
 518
 519	err = ioat_dma_setup_interrupts(ioat_dma);
 520	if (err)
 521		goto err_setup_interrupts;
 522
 523	err = ioat3_dma_self_test(ioat_dma);
 524	if (err)
 525		goto err_self_test;
 526
 527	return 0;
 528
 529err_self_test:
 530	ioat_disable_interrupts(ioat_dma);
 531err_setup_interrupts:
 532	dma_pool_destroy(ioat_dma->completion_pool);
 533err_out:
 534	return err;
 535}
 536
 537static int ioat_register(struct ioatdma_device *ioat_dma)
 538{
 539	int err = dma_async_device_register(&ioat_dma->dma_dev);
 540
 541	if (err) {
 542		ioat_disable_interrupts(ioat_dma);
 543		dma_pool_destroy(ioat_dma->completion_pool);
 544	}
 545
 546	return err;
 547}
 548
 549static void ioat_dma_remove(struct ioatdma_device *ioat_dma)
 550{
 551	struct dma_device *dma = &ioat_dma->dma_dev;
 552
 553	ioat_disable_interrupts(ioat_dma);
 554
 555	ioat_kobject_del(ioat_dma);
 556
 557	dma_async_device_unregister(dma);
 
 
 
 
 558}
 559
 560/**
 561 * ioat_enumerate_channels - find and initialize the device's channels
 562 * @ioat_dma: the ioat dma device to be enumerated
 563 */
 564static void ioat_enumerate_channels(struct ioatdma_device *ioat_dma)
 565{
 566	struct ioatdma_chan *ioat_chan;
 567	struct device *dev = &ioat_dma->pdev->dev;
 568	struct dma_device *dma = &ioat_dma->dma_dev;
 569	u8 xfercap_log;
 570	int chancnt;
 571	int i;
 572
 573	INIT_LIST_HEAD(&dma->channels);
 574	chancnt = readb(ioat_dma->reg_base + IOAT_CHANCNT_OFFSET);
 575	chancnt &= 0x1f; /* bits [4:0] valid */
 576	if (chancnt > ARRAY_SIZE(ioat_dma->idx)) {
 577		dev_warn(dev, "(%d) exceeds max supported channels (%zu)\n",
 578			 chancnt, ARRAY_SIZE(ioat_dma->idx));
 579		chancnt = ARRAY_SIZE(ioat_dma->idx);
 580	}
 581	xfercap_log = readb(ioat_dma->reg_base + IOAT_XFERCAP_OFFSET);
 582	xfercap_log &= 0x1f; /* bits [4:0] valid */
 583	if (xfercap_log == 0)
 584		return;
 585	dev_dbg(dev, "%s: xfercap = %d\n", __func__, 1 << xfercap_log);
 586
 587	for (i = 0; i < chancnt; i++) {
 588		ioat_chan = kzalloc(sizeof(*ioat_chan), GFP_KERNEL);
 589		if (!ioat_chan)
 590			break;
 591
 592		ioat_init_channel(ioat_dma, ioat_chan, i);
 593		ioat_chan->xfercap_log = xfercap_log;
 594		spin_lock_init(&ioat_chan->prep_lock);
 595		if (ioat_reset_hw(ioat_chan)) {
 596			i = 0;
 597			break;
 598		}
 599	}
 600	ioat_dma->chancnt = i;
 
 601}
 602
 603/**
 604 * ioat_free_chan_resources - release all the descriptors
 605 * @c: the channel to be cleaned
 606 */
 607static void ioat_free_chan_resources(struct dma_chan *c)
 608{
 609	struct ioatdma_chan *ioat_chan = to_ioat_chan(c);
 610	struct ioatdma_device *ioat_dma = ioat_chan->ioat_dma;
 611	struct ioat_ring_ent *desc;
 612	const int total_descs = 1 << ioat_chan->alloc_order;
 613	int descs;
 614	int i;
 615
 616	/* Before freeing channel resources first check
 617	 * if they have been previously allocated for this channel.
 618	 */
 619	if (!ioat_chan->ring)
 620		return;
 621
 622	ioat_stop(ioat_chan);
 623
 624	if (!test_bit(IOAT_CHAN_DOWN, &ioat_chan->state)) {
 625		ioat_reset_hw(ioat_chan);
 626
 627		/* Put LTR to idle */
 628		if (ioat_dma->version >= IOAT_VER_3_4)
 629			writeb(IOAT_CHAN_LTR_SWSEL_IDLE,
 630			       ioat_chan->reg_base +
 631			       IOAT_CHAN_LTR_SWSEL_OFFSET);
 632	}
 633
 634	spin_lock_bh(&ioat_chan->cleanup_lock);
 635	spin_lock_bh(&ioat_chan->prep_lock);
 636	descs = ioat_ring_space(ioat_chan);
 637	dev_dbg(to_dev(ioat_chan), "freeing %d idle descriptors\n", descs);
 638	for (i = 0; i < descs; i++) {
 639		desc = ioat_get_ring_ent(ioat_chan, ioat_chan->head + i);
 640		ioat_free_ring_ent(desc, c);
 641	}
 642
 643	if (descs < total_descs)
 644		dev_err(to_dev(ioat_chan), "Freeing %d in use descriptors!\n",
 645			total_descs - descs);
 646
 647	for (i = 0; i < total_descs - descs; i++) {
 648		desc = ioat_get_ring_ent(ioat_chan, ioat_chan->tail + i);
 649		dump_desc_dbg(ioat_chan, desc);
 650		ioat_free_ring_ent(desc, c);
 651	}
 652
 653	for (i = 0; i < ioat_chan->desc_chunks; i++) {
 654		dma_free_coherent(to_dev(ioat_chan), IOAT_CHUNK_SIZE,
 655				  ioat_chan->descs[i].virt,
 656				  ioat_chan->descs[i].hw);
 657		ioat_chan->descs[i].virt = NULL;
 658		ioat_chan->descs[i].hw = 0;
 659	}
 660	ioat_chan->desc_chunks = 0;
 661
 662	kfree(ioat_chan->ring);
 663	ioat_chan->ring = NULL;
 664	ioat_chan->alloc_order = 0;
 665	dma_pool_free(ioat_dma->completion_pool, ioat_chan->completion,
 666		      ioat_chan->completion_dma);
 667	spin_unlock_bh(&ioat_chan->prep_lock);
 668	spin_unlock_bh(&ioat_chan->cleanup_lock);
 669
 670	ioat_chan->last_completion = 0;
 671	ioat_chan->completion_dma = 0;
 672	ioat_chan->dmacount = 0;
 673}
 674
 675/* ioat_alloc_chan_resources - allocate/initialize ioat descriptor ring
 676 * @chan: channel to be initialized
 677 */
 678static int ioat_alloc_chan_resources(struct dma_chan *c)
 679{
 680	struct ioatdma_chan *ioat_chan = to_ioat_chan(c);
 681	struct ioat_ring_ent **ring;
 682	u64 status;
 683	int order;
 684	int i = 0;
 685	u32 chanerr;
 686
 687	/* have we already been set up? */
 688	if (ioat_chan->ring)
 689		return 1 << ioat_chan->alloc_order;
 690
 691	/* Setup register to interrupt and write completion status on error */
 692	writew(IOAT_CHANCTRL_RUN, ioat_chan->reg_base + IOAT_CHANCTRL_OFFSET);
 693
 694	/* allocate a completion writeback area */
 695	/* doing 2 32bit writes to mmio since 1 64b write doesn't work */
 696	ioat_chan->completion =
 697		dma_pool_zalloc(ioat_chan->ioat_dma->completion_pool,
 698				GFP_NOWAIT, &ioat_chan->completion_dma);
 699	if (!ioat_chan->completion)
 700		return -ENOMEM;
 701
 702	writel(((u64)ioat_chan->completion_dma) & 0x00000000FFFFFFFF,
 703	       ioat_chan->reg_base + IOAT_CHANCMP_OFFSET_LOW);
 704	writel(((u64)ioat_chan->completion_dma) >> 32,
 705	       ioat_chan->reg_base + IOAT_CHANCMP_OFFSET_HIGH);
 706
 707	order = IOAT_MAX_ORDER;
 708	ring = ioat_alloc_ring(c, order, GFP_NOWAIT);
 709	if (!ring)
 710		return -ENOMEM;
 711
 712	spin_lock_bh(&ioat_chan->cleanup_lock);
 713	spin_lock_bh(&ioat_chan->prep_lock);
 714	ioat_chan->ring = ring;
 715	ioat_chan->head = 0;
 716	ioat_chan->issued = 0;
 717	ioat_chan->tail = 0;
 718	ioat_chan->alloc_order = order;
 719	set_bit(IOAT_RUN, &ioat_chan->state);
 720	spin_unlock_bh(&ioat_chan->prep_lock);
 721	spin_unlock_bh(&ioat_chan->cleanup_lock);
 722
 723	/* Setting up LTR values for 3.4 or later */
 724	if (ioat_chan->ioat_dma->version >= IOAT_VER_3_4) {
 725		u32 lat_val;
 726
 727		lat_val = IOAT_CHAN_LTR_ACTIVE_SNVAL |
 728			IOAT_CHAN_LTR_ACTIVE_SNLATSCALE |
 729			IOAT_CHAN_LTR_ACTIVE_SNREQMNT;
 730		writel(lat_val, ioat_chan->reg_base +
 731				IOAT_CHAN_LTR_ACTIVE_OFFSET);
 732
 733		lat_val = IOAT_CHAN_LTR_IDLE_SNVAL |
 734			  IOAT_CHAN_LTR_IDLE_SNLATSCALE |
 735			  IOAT_CHAN_LTR_IDLE_SNREQMNT;
 736		writel(lat_val, ioat_chan->reg_base +
 737				IOAT_CHAN_LTR_IDLE_OFFSET);
 738
 739		/* Select to active */
 740		writeb(IOAT_CHAN_LTR_SWSEL_ACTIVE,
 741		       ioat_chan->reg_base +
 742		       IOAT_CHAN_LTR_SWSEL_OFFSET);
 743	}
 744
 745	ioat_start_null_desc(ioat_chan);
 746
 747	/* check that we got off the ground */
 748	do {
 749		udelay(1);
 750		status = ioat_chansts(ioat_chan);
 751	} while (i++ < 20 && !is_ioat_active(status) && !is_ioat_idle(status));
 752
 753	if (is_ioat_active(status) || is_ioat_idle(status))
 754		return 1 << ioat_chan->alloc_order;
 755
 756	chanerr = readl(ioat_chan->reg_base + IOAT_CHANERR_OFFSET);
 757
 758	dev_WARN(to_dev(ioat_chan),
 759		 "failed to start channel chanerr: %#x\n", chanerr);
 760	ioat_free_chan_resources(c);
 761	return -EFAULT;
 762}
 763
 764/* common channel initialization */
 765static void
 766ioat_init_channel(struct ioatdma_device *ioat_dma,
 767		  struct ioatdma_chan *ioat_chan, int idx)
 768{
 769	struct dma_device *dma = &ioat_dma->dma_dev;
 
 
 770
 771	ioat_chan->ioat_dma = ioat_dma;
 772	ioat_chan->reg_base = ioat_dma->reg_base + (0x80 * (idx + 1));
 773	spin_lock_init(&ioat_chan->cleanup_lock);
 774	ioat_chan->dma_chan.device = dma;
 775	dma_cookie_init(&ioat_chan->dma_chan);
 776	list_add_tail(&ioat_chan->dma_chan.device_node, &dma->channels);
 777	ioat_dma->idx[idx] = ioat_chan;
 778	timer_setup(&ioat_chan->timer, ioat_timer_event, 0);
 779	tasklet_setup(&ioat_chan->cleanup_task, ioat_cleanup_event);
 780}
 781
 782#define IOAT_NUM_SRC_TEST 6 /* must be <= 8 */
 783static int ioat_xor_val_self_test(struct ioatdma_device *ioat_dma)
 784{
 785	int i, src_idx;
 786	struct page *dest;
 787	struct page *xor_srcs[IOAT_NUM_SRC_TEST];
 788	struct page *xor_val_srcs[IOAT_NUM_SRC_TEST + 1];
 789	dma_addr_t dma_srcs[IOAT_NUM_SRC_TEST + 1];
 790	dma_addr_t dest_dma;
 791	struct dma_async_tx_descriptor *tx;
 792	struct dma_chan *dma_chan;
 793	dma_cookie_t cookie;
 794	u8 cmp_byte = 0;
 795	u32 cmp_word;
 796	u32 xor_val_result;
 797	int err = 0;
 798	struct completion cmp;
 799	unsigned long tmo;
 800	struct device *dev = &ioat_dma->pdev->dev;
 801	struct dma_device *dma = &ioat_dma->dma_dev;
 802	u8 op = 0;
 803
 804	dev_dbg(dev, "%s\n", __func__);
 805
 806	if (!dma_has_cap(DMA_XOR, dma->cap_mask))
 807		return 0;
 808
 809	for (src_idx = 0; src_idx < IOAT_NUM_SRC_TEST; src_idx++) {
 810		xor_srcs[src_idx] = alloc_page(GFP_KERNEL);
 811		if (!xor_srcs[src_idx]) {
 812			while (src_idx--)
 813				__free_page(xor_srcs[src_idx]);
 814			return -ENOMEM;
 815		}
 816	}
 817
 818	dest = alloc_page(GFP_KERNEL);
 819	if (!dest) {
 820		while (src_idx--)
 821			__free_page(xor_srcs[src_idx]);
 822		return -ENOMEM;
 823	}
 824
 825	/* Fill in src buffers */
 826	for (src_idx = 0; src_idx < IOAT_NUM_SRC_TEST; src_idx++) {
 827		u8 *ptr = page_address(xor_srcs[src_idx]);
 828
 829		for (i = 0; i < PAGE_SIZE; i++)
 830			ptr[i] = (1 << src_idx);
 831	}
 832
 833	for (src_idx = 0; src_idx < IOAT_NUM_SRC_TEST; src_idx++)
 834		cmp_byte ^= (u8) (1 << src_idx);
 835
 836	cmp_word = (cmp_byte << 24) | (cmp_byte << 16) |
 837			(cmp_byte << 8) | cmp_byte;
 838
 839	memset(page_address(dest), 0, PAGE_SIZE);
 840
 841	dma_chan = container_of(dma->channels.next, struct dma_chan,
 842				device_node);
 843	if (dma->device_alloc_chan_resources(dma_chan) < 1) {
 844		err = -ENODEV;
 845		goto out;
 846	}
 847
 848	/* test xor */
 849	op = IOAT_OP_XOR;
 850
 851	dest_dma = dma_map_page(dev, dest, 0, PAGE_SIZE, DMA_FROM_DEVICE);
 852	if (dma_mapping_error(dev, dest_dma)) {
 853		err = -ENOMEM;
 854		goto free_resources;
 855	}
 856
 857	for (i = 0; i < IOAT_NUM_SRC_TEST; i++) {
 858		dma_srcs[i] = dma_map_page(dev, xor_srcs[i], 0, PAGE_SIZE,
 859					   DMA_TO_DEVICE);
 860		if (dma_mapping_error(dev, dma_srcs[i])) {
 861			err = -ENOMEM;
 862			goto dma_unmap;
 863		}
 864	}
 865	tx = dma->device_prep_dma_xor(dma_chan, dest_dma, dma_srcs,
 866				      IOAT_NUM_SRC_TEST, PAGE_SIZE,
 867				      DMA_PREP_INTERRUPT);
 868
 869	if (!tx) {
 870		dev_err(dev, "Self-test xor prep failed\n");
 871		err = -ENODEV;
 872		goto dma_unmap;
 873	}
 874
 875	async_tx_ack(tx);
 876	init_completion(&cmp);
 877	tx->callback = ioat_dma_test_callback;
 878	tx->callback_param = &cmp;
 879	cookie = tx->tx_submit(tx);
 880	if (cookie < 0) {
 881		dev_err(dev, "Self-test xor setup failed\n");
 882		err = -ENODEV;
 883		goto dma_unmap;
 884	}
 885	dma->device_issue_pending(dma_chan);
 886
 887	tmo = wait_for_completion_timeout(&cmp, msecs_to_jiffies(3000));
 888
 889	if (tmo == 0 ||
 890	    dma->device_tx_status(dma_chan, cookie, NULL) != DMA_COMPLETE) {
 891		dev_err(dev, "Self-test xor timed out\n");
 892		err = -ENODEV;
 893		goto dma_unmap;
 894	}
 895
 896	for (i = 0; i < IOAT_NUM_SRC_TEST; i++)
 897		dma_unmap_page(dev, dma_srcs[i], PAGE_SIZE, DMA_TO_DEVICE);
 898
 899	dma_sync_single_for_cpu(dev, dest_dma, PAGE_SIZE, DMA_FROM_DEVICE);
 900	for (i = 0; i < (PAGE_SIZE / sizeof(u32)); i++) {
 901		u32 *ptr = page_address(dest);
 902
 903		if (ptr[i] != cmp_word) {
 904			dev_err(dev, "Self-test xor failed compare\n");
 905			err = -ENODEV;
 906			goto free_resources;
 907		}
 908	}
 909	dma_sync_single_for_device(dev, dest_dma, PAGE_SIZE, DMA_FROM_DEVICE);
 910
 911	dma_unmap_page(dev, dest_dma, PAGE_SIZE, DMA_FROM_DEVICE);
 912
 913	/* skip validate if the capability is not present */
 914	if (!dma_has_cap(DMA_XOR_VAL, dma_chan->device->cap_mask))
 915		goto free_resources;
 916
 917	op = IOAT_OP_XOR_VAL;
 918
 919	/* validate the sources with the destintation page */
 920	for (i = 0; i < IOAT_NUM_SRC_TEST; i++)
 921		xor_val_srcs[i] = xor_srcs[i];
 922	xor_val_srcs[i] = dest;
 923
 924	xor_val_result = 1;
 925
 926	for (i = 0; i < IOAT_NUM_SRC_TEST + 1; i++) {
 927		dma_srcs[i] = dma_map_page(dev, xor_val_srcs[i], 0, PAGE_SIZE,
 928					   DMA_TO_DEVICE);
 929		if (dma_mapping_error(dev, dma_srcs[i])) {
 930			err = -ENOMEM;
 931			goto dma_unmap;
 932		}
 933	}
 934	tx = dma->device_prep_dma_xor_val(dma_chan, dma_srcs,
 935					  IOAT_NUM_SRC_TEST + 1, PAGE_SIZE,
 936					  &xor_val_result, DMA_PREP_INTERRUPT);
 937	if (!tx) {
 938		dev_err(dev, "Self-test zero prep failed\n");
 939		err = -ENODEV;
 940		goto dma_unmap;
 941	}
 942
 943	async_tx_ack(tx);
 944	init_completion(&cmp);
 945	tx->callback = ioat_dma_test_callback;
 946	tx->callback_param = &cmp;
 947	cookie = tx->tx_submit(tx);
 948	if (cookie < 0) {
 949		dev_err(dev, "Self-test zero setup failed\n");
 950		err = -ENODEV;
 951		goto dma_unmap;
 952	}
 953	dma->device_issue_pending(dma_chan);
 954
 955	tmo = wait_for_completion_timeout(&cmp, msecs_to_jiffies(3000));
 956
 957	if (tmo == 0 ||
 958	    dma->device_tx_status(dma_chan, cookie, NULL) != DMA_COMPLETE) {
 959		dev_err(dev, "Self-test validate timed out\n");
 960		err = -ENODEV;
 961		goto dma_unmap;
 962	}
 963
 964	for (i = 0; i < IOAT_NUM_SRC_TEST + 1; i++)
 965		dma_unmap_page(dev, dma_srcs[i], PAGE_SIZE, DMA_TO_DEVICE);
 966
 967	if (xor_val_result != 0) {
 968		dev_err(dev, "Self-test validate failed compare\n");
 969		err = -ENODEV;
 970		goto free_resources;
 971	}
 972
 973	memset(page_address(dest), 0, PAGE_SIZE);
 974
 975	/* test for non-zero parity sum */
 976	op = IOAT_OP_XOR_VAL;
 977
 978	xor_val_result = 0;
 979	for (i = 0; i < IOAT_NUM_SRC_TEST + 1; i++) {
 980		dma_srcs[i] = dma_map_page(dev, xor_val_srcs[i], 0, PAGE_SIZE,
 981					   DMA_TO_DEVICE);
 982		if (dma_mapping_error(dev, dma_srcs[i])) {
 983			err = -ENOMEM;
 984			goto dma_unmap;
 985		}
 986	}
 987	tx = dma->device_prep_dma_xor_val(dma_chan, dma_srcs,
 988					  IOAT_NUM_SRC_TEST + 1, PAGE_SIZE,
 989					  &xor_val_result, DMA_PREP_INTERRUPT);
 990	if (!tx) {
 991		dev_err(dev, "Self-test 2nd zero prep failed\n");
 992		err = -ENODEV;
 993		goto dma_unmap;
 994	}
 995
 996	async_tx_ack(tx);
 997	init_completion(&cmp);
 998	tx->callback = ioat_dma_test_callback;
 999	tx->callback_param = &cmp;
1000	cookie = tx->tx_submit(tx);
1001	if (cookie < 0) {
1002		dev_err(dev, "Self-test  2nd zero setup failed\n");
1003		err = -ENODEV;
1004		goto dma_unmap;
1005	}
1006	dma->device_issue_pending(dma_chan);
1007
1008	tmo = wait_for_completion_timeout(&cmp, msecs_to_jiffies(3000));
1009
1010	if (tmo == 0 ||
1011	    dma->device_tx_status(dma_chan, cookie, NULL) != DMA_COMPLETE) {
1012		dev_err(dev, "Self-test 2nd validate timed out\n");
1013		err = -ENODEV;
1014		goto dma_unmap;
1015	}
1016
1017	if (xor_val_result != SUM_CHECK_P_RESULT) {
1018		dev_err(dev, "Self-test validate failed compare\n");
1019		err = -ENODEV;
1020		goto dma_unmap;
1021	}
1022
1023	for (i = 0; i < IOAT_NUM_SRC_TEST + 1; i++)
1024		dma_unmap_page(dev, dma_srcs[i], PAGE_SIZE, DMA_TO_DEVICE);
1025
1026	goto free_resources;
1027dma_unmap:
1028	if (op == IOAT_OP_XOR) {
1029		while (--i >= 0)
1030			dma_unmap_page(dev, dma_srcs[i], PAGE_SIZE,
1031				       DMA_TO_DEVICE);
1032		dma_unmap_page(dev, dest_dma, PAGE_SIZE, DMA_FROM_DEVICE);
1033	} else if (op == IOAT_OP_XOR_VAL) {
1034		while (--i >= 0)
1035			dma_unmap_page(dev, dma_srcs[i], PAGE_SIZE,
1036				       DMA_TO_DEVICE);
1037	}
1038free_resources:
1039	dma->device_free_chan_resources(dma_chan);
1040out:
1041	src_idx = IOAT_NUM_SRC_TEST;
1042	while (src_idx--)
1043		__free_page(xor_srcs[src_idx]);
1044	__free_page(dest);
1045	return err;
1046}
1047
/*
 * Run the basic DMA self-test and, only when it passes, the XOR-validate
 * self-test. Returns 0 if both pass, otherwise the first non-zero result.
 */
static int ioat3_dma_self_test(struct ioatdma_device *ioat_dma)
{
	int err = ioat_dma_self_test(ioat_dma);

	return err ? err : ioat_xor_val_self_test(ioat_dma);
}
1060
1061static void ioat_intr_quirk(struct ioatdma_device *ioat_dma)
1062{
1063	struct dma_device *dma;
1064	struct dma_chan *c;
1065	struct ioatdma_chan *ioat_chan;
1066	u32 errmask;
1067
1068	dma = &ioat_dma->dma_dev;
1069
1070	/*
1071	 * if we have descriptor write back error status, we mask the
1072	 * error interrupts
1073	 */
1074	if (ioat_dma->cap & IOAT_CAP_DWBES) {
1075		list_for_each_entry(c, &dma->channels, device_node) {
1076			ioat_chan = to_ioat_chan(c);
1077			errmask = readl(ioat_chan->reg_base +
1078					IOAT_CHANERR_MASK_OFFSET);
1079			errmask |= IOAT_CHANERR_XOR_P_OR_CRC_ERR |
1080				   IOAT_CHANERR_XOR_Q_ERR;
1081			writel(errmask, ioat_chan->reg_base +
1082					IOAT_CHANERR_MASK_OFFSET);
1083		}
1084	}
1085}
1086
1087static int ioat3_dma_probe(struct ioatdma_device *ioat_dma, int dca)
1088{
1089	struct pci_dev *pdev = ioat_dma->pdev;
1090	int dca_en = system_has_dca_enabled(pdev);
1091	struct dma_device *dma;
1092	struct dma_chan *c;
1093	struct ioatdma_chan *ioat_chan;
1094	int err;
1095	u16 val16;
1096
1097	dma = &ioat_dma->dma_dev;
1098	dma->device_prep_dma_memcpy = ioat_dma_prep_memcpy_lock;
1099	dma->device_issue_pending = ioat_issue_pending;
1100	dma->device_alloc_chan_resources = ioat_alloc_chan_resources;
1101	dma->device_free_chan_resources = ioat_free_chan_resources;
1102
1103	dma_cap_set(DMA_INTERRUPT, dma->cap_mask);
1104	dma->device_prep_dma_interrupt = ioat_prep_interrupt_lock;
1105
1106	ioat_dma->cap = readl(ioat_dma->reg_base + IOAT_DMA_CAP_OFFSET);
1107
1108	if (is_xeon_cb32(pdev) || is_bwd_noraid(pdev))
1109		ioat_dma->cap &=
1110			~(IOAT_CAP_XOR | IOAT_CAP_PQ | IOAT_CAP_RAID16SS);
1111
1112	/* dca is incompatible with raid operations */
1113	if (dca_en && (ioat_dma->cap & (IOAT_CAP_XOR|IOAT_CAP_PQ)))
1114		ioat_dma->cap &= ~(IOAT_CAP_XOR|IOAT_CAP_PQ);
1115
1116	if (ioat_dma->cap & IOAT_CAP_XOR) {
1117		dma->max_xor = 8;
1118
1119		dma_cap_set(DMA_XOR, dma->cap_mask);
1120		dma->device_prep_dma_xor = ioat_prep_xor;
1121
1122		dma_cap_set(DMA_XOR_VAL, dma->cap_mask);
1123		dma->device_prep_dma_xor_val = ioat_prep_xor_val;
1124	}
1125
1126	if (ioat_dma->cap & IOAT_CAP_PQ) {
1127
1128		dma->device_prep_dma_pq = ioat_prep_pq;
1129		dma->device_prep_dma_pq_val = ioat_prep_pq_val;
1130		dma_cap_set(DMA_PQ, dma->cap_mask);
1131		dma_cap_set(DMA_PQ_VAL, dma->cap_mask);
1132
1133		if (ioat_dma->cap & IOAT_CAP_RAID16SS)
1134			dma_set_maxpq(dma, 16, 0);
1135		else
1136			dma_set_maxpq(dma, 8, 0);
1137
1138		if (!(ioat_dma->cap & IOAT_CAP_XOR)) {
1139			dma->device_prep_dma_xor = ioat_prep_pqxor;
1140			dma->device_prep_dma_xor_val = ioat_prep_pqxor_val;
1141			dma_cap_set(DMA_XOR, dma->cap_mask);
1142			dma_cap_set(DMA_XOR_VAL, dma->cap_mask);
1143
1144			if (ioat_dma->cap & IOAT_CAP_RAID16SS)
1145				dma->max_xor = 16;
1146			else
1147				dma->max_xor = 8;
1148		}
1149	}
1150
1151	dma->device_tx_status = ioat_tx_status;
1152
1153	/* starting with CB3.3 super extended descriptors are supported */
1154	if (ioat_dma->cap & IOAT_CAP_RAID16SS) {
1155		char pool_name[14];
1156		int i;
1157
1158		for (i = 0; i < MAX_SED_POOLS; i++) {
1159			snprintf(pool_name, 14, "ioat_hw%d_sed", i);
1160
1161			/* allocate SED DMA pool */
1162			ioat_dma->sed_hw_pool[i] = dmam_pool_create(pool_name,
1163					&pdev->dev,
1164					SED_SIZE * (i + 1), 64, 0);
1165			if (!ioat_dma->sed_hw_pool[i])
1166				return -ENOMEM;
1167
1168		}
1169	}
1170
1171	if (!(ioat_dma->cap & (IOAT_CAP_XOR | IOAT_CAP_PQ)))
1172		dma_cap_set(DMA_PRIVATE, dma->cap_mask);
1173
1174	err = ioat_probe(ioat_dma);
1175	if (err)
1176		return err;
1177
1178	list_for_each_entry(c, &dma->channels, device_node) {
1179		ioat_chan = to_ioat_chan(c);
1180		writel(IOAT_DMA_DCA_ANY_CPU,
1181		       ioat_chan->reg_base + IOAT_DCACTRL_OFFSET);
1182	}
1183
1184	err = ioat_register(ioat_dma);
1185	if (err)
1186		return err;
1187
1188	ioat_kobject_add(ioat_dma, &ioat_ktype);
1189
1190	if (dca)
1191		ioat_dma->dca = ioat_dca_init(pdev, ioat_dma->reg_base);
1192
1193	/* disable relaxed ordering */
1194	err = pcie_capability_read_word(pdev, PCI_EXP_DEVCTL, &val16);
1195	if (err)
1196		return pcibios_err_to_errno(err);
1197
1198	/* clear relaxed ordering enable */
1199	val16 &= ~PCI_EXP_DEVCTL_RELAX_EN;
1200	err = pcie_capability_write_word(pdev, PCI_EXP_DEVCTL, val16);
1201	if (err)
1202		return pcibios_err_to_errno(err);
1203
1204	if (ioat_dma->cap & IOAT_CAP_DPS)
1205		writeb(ioat_pending_level + 1,
1206		       ioat_dma->reg_base + IOAT_PREFETCH_LIMIT_OFFSET);
1207
1208	return 0;
1209}
1210
1211static void ioat_shutdown(struct pci_dev *pdev)
1212{
1213	struct ioatdma_device *ioat_dma = pci_get_drvdata(pdev);
1214	struct ioatdma_chan *ioat_chan;
1215	int i;
1216
1217	if (!ioat_dma)
1218		return;
1219
1220	for (i = 0; i < IOAT_MAX_CHANS; i++) {
1221		ioat_chan = ioat_dma->idx[i];
1222		if (!ioat_chan)
1223			continue;
1224
1225		spin_lock_bh(&ioat_chan->prep_lock);
1226		set_bit(IOAT_CHAN_DOWN, &ioat_chan->state);
1227		spin_unlock_bh(&ioat_chan->prep_lock);
1228		/*
1229		 * Synchronization rule for del_timer_sync():
1230		 *  - The caller must not hold locks which would prevent
1231		 *    completion of the timer's handler.
1232		 * So prep_lock cannot be held before calling it.
1233		 */
1234		del_timer_sync(&ioat_chan->timer);
1235
1236		/* this should quiesce then reset */
1237		ioat_reset_hw(ioat_chan);
1238	}
1239
1240	ioat_disable_interrupts(ioat_dma);
1241}
1242
1243static void ioat_resume(struct ioatdma_device *ioat_dma)
1244{
1245	struct ioatdma_chan *ioat_chan;
1246	u32 chanerr;
1247	int i;
1248
1249	for (i = 0; i < IOAT_MAX_CHANS; i++) {
1250		ioat_chan = ioat_dma->idx[i];
1251		if (!ioat_chan)
1252			continue;
1253
1254		spin_lock_bh(&ioat_chan->prep_lock);
1255		clear_bit(IOAT_CHAN_DOWN, &ioat_chan->state);
1256		spin_unlock_bh(&ioat_chan->prep_lock);
1257
1258		chanerr = readl(ioat_chan->reg_base + IOAT_CHANERR_OFFSET);
1259		writel(chanerr, ioat_chan->reg_base + IOAT_CHANERR_OFFSET);
1260
1261		/* no need to reset as shutdown already did that */
1262	}
1263}
1264
1265#define DRV_NAME "ioatdma"
1266
1267static pci_ers_result_t ioat_pcie_error_detected(struct pci_dev *pdev,
1268						 pci_channel_state_t error)
1269{
1270	dev_dbg(&pdev->dev, "%s: PCIe AER error %d\n", DRV_NAME, error);
1271
1272	/* quiesce and block I/O */
1273	ioat_shutdown(pdev);
1274
1275	return PCI_ERS_RESULT_NEED_RESET;
1276}
1277
1278static pci_ers_result_t ioat_pcie_error_slot_reset(struct pci_dev *pdev)
1279{
1280	pci_ers_result_t result = PCI_ERS_RESULT_RECOVERED;
 
1281
1282	dev_dbg(&pdev->dev, "%s post reset handling\n", DRV_NAME);
1283
1284	if (pci_enable_device_mem(pdev) < 0) {
1285		dev_err(&pdev->dev,
1286			"Failed to enable PCIe device after reset.\n");
1287		result = PCI_ERS_RESULT_DISCONNECT;
1288	} else {
1289		pci_set_master(pdev);
1290		pci_restore_state(pdev);
1291		pci_save_state(pdev);
1292		pci_wake_from_d3(pdev, false);
1293	}
1294
 
 
 
 
 
 
1295	return result;
1296}
1297
1298static void ioat_pcie_error_resume(struct pci_dev *pdev)
1299{
1300	struct ioatdma_device *ioat_dma = pci_get_drvdata(pdev);
1301
1302	dev_dbg(&pdev->dev, "%s: AER handling resuming\n", DRV_NAME);
1303
1304	/* initialize and bring everything back */
1305	ioat_resume(ioat_dma);
1306}
1307
1308static const struct pci_error_handlers ioat_err_handler = {
1309	.error_detected = ioat_pcie_error_detected,
1310	.slot_reset = ioat_pcie_error_slot_reset,
1311	.resume = ioat_pcie_error_resume,
1312};
1313
1314static struct pci_driver ioat_pci_driver = {
1315	.name		= DRV_NAME,
1316	.id_table	= ioat_pci_tbl,
1317	.probe		= ioat_pci_probe,
1318	.remove		= ioat_remove,
1319	.shutdown	= ioat_shutdown,
1320	.err_handler	= &ioat_err_handler,
1321};
1322
1323static void release_ioatdma(struct dma_device *device)
1324{
1325	struct ioatdma_device *d = to_ioatdma_device(device);
1326	int i;
1327
1328	for (i = 0; i < IOAT_MAX_CHANS; i++)
1329		kfree(d->idx[i]);
1330
1331	dma_pool_destroy(d->completion_pool);
1332	kfree(d);
1333}
1334
1335static struct ioatdma_device *
1336alloc_ioatdma(struct pci_dev *pdev, void __iomem *iobase)
1337{
1338	struct ioatdma_device *d = kzalloc(sizeof(*d), GFP_KERNEL);
 
1339
1340	if (!d)
1341		return NULL;
1342	d->pdev = pdev;
1343	d->reg_base = iobase;
1344	d->dma_dev.device_release = release_ioatdma;
1345	return d;
1346}
1347
1348static int ioat_pci_probe(struct pci_dev *pdev, const struct pci_device_id *id)
1349{
1350	void __iomem * const *iomap;
1351	struct device *dev = &pdev->dev;
1352	struct ioatdma_device *device;
1353	int err;
1354
1355	err = pcim_enable_device(pdev);
1356	if (err)
1357		return err;
1358
1359	err = pcim_iomap_regions(pdev, 1 << IOAT_MMIO_BAR, DRV_NAME);
1360	if (err)
1361		return err;
1362	iomap = pcim_iomap_table(pdev);
1363	if (!iomap)
1364		return -ENOMEM;
1365
1366	err = dma_set_mask_and_coherent(&pdev->dev, DMA_BIT_MASK(64));
 
 
 
 
 
 
 
 
1367	if (err)
1368		return err;
1369
1370	device = alloc_ioatdma(pdev, iomap[IOAT_MMIO_BAR]);
1371	if (!device)
1372		return -ENOMEM;
1373	pci_set_master(pdev);
1374	pci_set_drvdata(pdev, device);
1375
1376	device->version = readb(device->reg_base + IOAT_VER_OFFSET);
1377	if (device->version >= IOAT_VER_3_4)
1378		ioat_dca_enabled = 0;
1379	if (device->version >= IOAT_VER_3_0) {
1380		if (is_skx_ioat(pdev))
1381			device->version = IOAT_VER_3_2;
1382		err = ioat3_dma_probe(device, ioat_dca_enabled);
 
 
 
1383	} else
1384		return -ENODEV;
1385
1386	if (err) {
1387		dev_err(dev, "Intel(R) I/OAT DMA Engine init failed\n");
 
1388		return -ENODEV;
1389	}
1390
1391	return 0;
1392}
1393
1394static void ioat_remove(struct pci_dev *pdev)
1395{
1396	struct ioatdma_device *device = pci_get_drvdata(pdev);
1397
1398	if (!device)
1399		return;
1400
1401	ioat_shutdown(pdev);
1402
1403	dev_err(&pdev->dev, "Removing dma and dca services\n");
1404	if (device->dca) {
1405		unregister_dca_provider(device->dca, &pdev->dev);
1406		free_dca_provider(device->dca);
1407		device->dca = NULL;
1408	}
1409
 
1410	ioat_dma_remove(device);
1411}
1412
1413static int __init ioat_init_module(void)
1414{
1415	int err = -ENOMEM;
1416
1417	pr_info("%s: Intel(R) QuickData Technology Driver %s\n",
1418		DRV_NAME, IOAT_DMA_VERSION);
1419
1420	ioat_cache = kmem_cache_create("ioat", sizeof(struct ioat_ring_ent),
1421					0, SLAB_HWCACHE_ALIGN, NULL);
1422	if (!ioat_cache)
1423		return -ENOMEM;
1424
1425	ioat_sed_cache = KMEM_CACHE(ioat_sed_ent, 0);
1426	if (!ioat_sed_cache)
1427		goto err_ioat_cache;
1428
1429	err = pci_register_driver(&ioat_pci_driver);
1430	if (err)
1431		goto err_ioat3_cache;
1432
1433	return 0;
1434
1435 err_ioat3_cache:
1436	kmem_cache_destroy(ioat_sed_cache);
1437
1438 err_ioat_cache:
1439	kmem_cache_destroy(ioat_cache);
1440
1441	return err;
1442}
1443module_init(ioat_init_module);
1444
1445static void __exit ioat_exit_module(void)
1446{
1447	pci_unregister_driver(&ioat_pci_driver);
1448	kmem_cache_destroy(ioat_cache);
1449}
1450module_exit(ioat_exit_module);
v4.17
 
   1/*
   2 * Intel I/OAT DMA Linux driver
   3 * Copyright(c) 2004 - 2015 Intel Corporation.
   4 *
   5 * This program is free software; you can redistribute it and/or modify it
   6 * under the terms and conditions of the GNU General Public License,
   7 * version 2, as published by the Free Software Foundation.
   8 *
   9 * This program is distributed in the hope that it will be useful, but WITHOUT
  10 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  11 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
  12 * more details.
  13 *
  14 * The full GNU General Public License is included in this distribution in
  15 * the file called "COPYING".
  16 *
  17 */
  18
  19#include <linux/init.h>
  20#include <linux/module.h>
  21#include <linux/slab.h>
  22#include <linux/pci.h>
  23#include <linux/interrupt.h>
  24#include <linux/dmaengine.h>
  25#include <linux/delay.h>
  26#include <linux/dma-mapping.h>
  27#include <linux/workqueue.h>
  28#include <linux/prefetch.h>
  29#include <linux/dca.h>
  30#include <linux/aer.h>
  31#include <linux/sizes.h>
  32#include "dma.h"
  33#include "registers.h"
  34#include "hw.h"
  35
  36#include "../dmaengine.h"
  37
  38MODULE_VERSION(IOAT_DMA_VERSION);
  39MODULE_LICENSE("Dual BSD/GPL");
  40MODULE_AUTHOR("Intel Corporation");
  41
  42static const struct pci_device_id ioat_pci_tbl[] = {
  43	/* I/OAT v3 platforms */
  44	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_TBG0) },
  45	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_TBG1) },
  46	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_TBG2) },
  47	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_TBG3) },
  48	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_TBG4) },
  49	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_TBG5) },
  50	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_TBG6) },
  51	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_TBG7) },
  52
  53	/* I/OAT v3.2 platforms */
  54	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_JSF0) },
  55	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_JSF1) },
  56	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_JSF2) },
  57	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_JSF3) },
  58	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_JSF4) },
  59	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_JSF5) },
  60	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_JSF6) },
  61	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_JSF7) },
  62	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_JSF8) },
  63	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_JSF9) },
  64
  65	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_SNB0) },
  66	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_SNB1) },
  67	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_SNB2) },
  68	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_SNB3) },
  69	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_SNB4) },
  70	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_SNB5) },
  71	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_SNB6) },
  72	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_SNB7) },
  73	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_SNB8) },
  74	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_SNB9) },
  75
  76	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_IVB0) },
  77	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_IVB1) },
  78	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_IVB2) },
  79	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_IVB3) },
  80	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_IVB4) },
  81	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_IVB5) },
  82	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_IVB6) },
  83	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_IVB7) },
  84	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_IVB8) },
  85	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_IVB9) },
  86
  87	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_HSW0) },
  88	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_HSW1) },
  89	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_HSW2) },
  90	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_HSW3) },
  91	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_HSW4) },
  92	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_HSW5) },
  93	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_HSW6) },
  94	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_HSW7) },
  95	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_HSW8) },
  96	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_HSW9) },
  97
  98	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_BDX0) },
  99	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_BDX1) },
 100	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_BDX2) },
 101	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_BDX3) },
 102	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_BDX4) },
 103	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_BDX5) },
 104	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_BDX6) },
 105	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_BDX7) },
 106	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_BDX8) },
 107	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_BDX9) },
 108
 109	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_SKX) },
 110
 111	/* I/OAT v3.3 platforms */
 112	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_BWD0) },
 113	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_BWD1) },
 114	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_BWD2) },
 115	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_BWD3) },
 116
 117	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_BDXDE0) },
 118	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_BDXDE1) },
 119	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_BDXDE2) },
 120	{ PCI_VDEVICE(INTEL, PCI_DEVICE_ID_INTEL_IOAT_BDXDE3) },
 121
 
 
 
 122	{ 0, }
 123};
 124MODULE_DEVICE_TABLE(pci, ioat_pci_tbl);
 125
 126static int ioat_pci_probe(struct pci_dev *pdev, const struct pci_device_id *id);
 127static void ioat_remove(struct pci_dev *pdev);
 128static void
 129ioat_init_channel(struct ioatdma_device *ioat_dma,
 130		  struct ioatdma_chan *ioat_chan, int idx);
 131static void ioat_intr_quirk(struct ioatdma_device *ioat_dma);
 132static int ioat_enumerate_channels(struct ioatdma_device *ioat_dma);
 133static int ioat3_dma_self_test(struct ioatdma_device *ioat_dma);
 134
 135static int ioat_dca_enabled = 1;
 136module_param(ioat_dca_enabled, int, 0644);
 137MODULE_PARM_DESC(ioat_dca_enabled, "control support of dca service (default: 1)");
 138int ioat_pending_level = 4;
 139module_param(ioat_pending_level, int, 0644);
 140MODULE_PARM_DESC(ioat_pending_level,
 141		 "high-water mark for pushing ioat descriptors (default: 4)");
 142static char ioat_interrupt_style[32] = "msix";
 143module_param_string(ioat_interrupt_style, ioat_interrupt_style,
 144		    sizeof(ioat_interrupt_style), 0644);
 145MODULE_PARM_DESC(ioat_interrupt_style,
 146		 "set ioat interrupt style: msix (default), msi, intx");
 147
 148struct kmem_cache *ioat_cache;
 149struct kmem_cache *ioat_sed_cache;
 150
 151static bool is_jf_ioat(struct pci_dev *pdev)
 152{
 153	switch (pdev->device) {
 154	case PCI_DEVICE_ID_INTEL_IOAT_JSF0:
 155	case PCI_DEVICE_ID_INTEL_IOAT_JSF1:
 156	case PCI_DEVICE_ID_INTEL_IOAT_JSF2:
 157	case PCI_DEVICE_ID_INTEL_IOAT_JSF3:
 158	case PCI_DEVICE_ID_INTEL_IOAT_JSF4:
 159	case PCI_DEVICE_ID_INTEL_IOAT_JSF5:
 160	case PCI_DEVICE_ID_INTEL_IOAT_JSF6:
 161	case PCI_DEVICE_ID_INTEL_IOAT_JSF7:
 162	case PCI_DEVICE_ID_INTEL_IOAT_JSF8:
 163	case PCI_DEVICE_ID_INTEL_IOAT_JSF9:
 164		return true;
 165	default:
 166		return false;
 167	}
 168}
 169
 170static bool is_snb_ioat(struct pci_dev *pdev)
 171{
 172	switch (pdev->device) {
 173	case PCI_DEVICE_ID_INTEL_IOAT_SNB0:
 174	case PCI_DEVICE_ID_INTEL_IOAT_SNB1:
 175	case PCI_DEVICE_ID_INTEL_IOAT_SNB2:
 176	case PCI_DEVICE_ID_INTEL_IOAT_SNB3:
 177	case PCI_DEVICE_ID_INTEL_IOAT_SNB4:
 178	case PCI_DEVICE_ID_INTEL_IOAT_SNB5:
 179	case PCI_DEVICE_ID_INTEL_IOAT_SNB6:
 180	case PCI_DEVICE_ID_INTEL_IOAT_SNB7:
 181	case PCI_DEVICE_ID_INTEL_IOAT_SNB8:
 182	case PCI_DEVICE_ID_INTEL_IOAT_SNB9:
 183		return true;
 184	default:
 185		return false;
 186	}
 187}
 188
 189static bool is_ivb_ioat(struct pci_dev *pdev)
 190{
 191	switch (pdev->device) {
 192	case PCI_DEVICE_ID_INTEL_IOAT_IVB0:
 193	case PCI_DEVICE_ID_INTEL_IOAT_IVB1:
 194	case PCI_DEVICE_ID_INTEL_IOAT_IVB2:
 195	case PCI_DEVICE_ID_INTEL_IOAT_IVB3:
 196	case PCI_DEVICE_ID_INTEL_IOAT_IVB4:
 197	case PCI_DEVICE_ID_INTEL_IOAT_IVB5:
 198	case PCI_DEVICE_ID_INTEL_IOAT_IVB6:
 199	case PCI_DEVICE_ID_INTEL_IOAT_IVB7:
 200	case PCI_DEVICE_ID_INTEL_IOAT_IVB8:
 201	case PCI_DEVICE_ID_INTEL_IOAT_IVB9:
 202		return true;
 203	default:
 204		return false;
 205	}
 206
 207}
 208
 209static bool is_hsw_ioat(struct pci_dev *pdev)
 210{
 211	switch (pdev->device) {
 212	case PCI_DEVICE_ID_INTEL_IOAT_HSW0:
 213	case PCI_DEVICE_ID_INTEL_IOAT_HSW1:
 214	case PCI_DEVICE_ID_INTEL_IOAT_HSW2:
 215	case PCI_DEVICE_ID_INTEL_IOAT_HSW3:
 216	case PCI_DEVICE_ID_INTEL_IOAT_HSW4:
 217	case PCI_DEVICE_ID_INTEL_IOAT_HSW5:
 218	case PCI_DEVICE_ID_INTEL_IOAT_HSW6:
 219	case PCI_DEVICE_ID_INTEL_IOAT_HSW7:
 220	case PCI_DEVICE_ID_INTEL_IOAT_HSW8:
 221	case PCI_DEVICE_ID_INTEL_IOAT_HSW9:
 222		return true;
 223	default:
 224		return false;
 225	}
 226
 227}
 228
 229static bool is_bdx_ioat(struct pci_dev *pdev)
 230{
 231	switch (pdev->device) {
 232	case PCI_DEVICE_ID_INTEL_IOAT_BDX0:
 233	case PCI_DEVICE_ID_INTEL_IOAT_BDX1:
 234	case PCI_DEVICE_ID_INTEL_IOAT_BDX2:
 235	case PCI_DEVICE_ID_INTEL_IOAT_BDX3:
 236	case PCI_DEVICE_ID_INTEL_IOAT_BDX4:
 237	case PCI_DEVICE_ID_INTEL_IOAT_BDX5:
 238	case PCI_DEVICE_ID_INTEL_IOAT_BDX6:
 239	case PCI_DEVICE_ID_INTEL_IOAT_BDX7:
 240	case PCI_DEVICE_ID_INTEL_IOAT_BDX8:
 241	case PCI_DEVICE_ID_INTEL_IOAT_BDX9:
 242		return true;
 243	default:
 244		return false;
 245	}
 246}
 247
 248static inline bool is_skx_ioat(struct pci_dev *pdev)
 249{
 250	return (pdev->device == PCI_DEVICE_ID_INTEL_IOAT_SKX) ? true : false;
 251}
 252
 253static bool is_xeon_cb32(struct pci_dev *pdev)
 254{
 255	return is_jf_ioat(pdev) || is_snb_ioat(pdev) || is_ivb_ioat(pdev) ||
 256		is_hsw_ioat(pdev) || is_bdx_ioat(pdev) || is_skx_ioat(pdev);
 257}
 258
 259bool is_bwd_ioat(struct pci_dev *pdev)
 260{
 261	switch (pdev->device) {
 262	case PCI_DEVICE_ID_INTEL_IOAT_BWD0:
 263	case PCI_DEVICE_ID_INTEL_IOAT_BWD1:
 264	case PCI_DEVICE_ID_INTEL_IOAT_BWD2:
 265	case PCI_DEVICE_ID_INTEL_IOAT_BWD3:
 266	/* even though not Atom, BDX-DE has same DMA silicon */
 267	case PCI_DEVICE_ID_INTEL_IOAT_BDXDE0:
 268	case PCI_DEVICE_ID_INTEL_IOAT_BDXDE1:
 269	case PCI_DEVICE_ID_INTEL_IOAT_BDXDE2:
 270	case PCI_DEVICE_ID_INTEL_IOAT_BDXDE3:
 271		return true;
 272	default:
 273		return false;
 274	}
 275}
 276
 277static bool is_bwd_noraid(struct pci_dev *pdev)
 278{
 279	switch (pdev->device) {
 280	case PCI_DEVICE_ID_INTEL_IOAT_BWD2:
 281	case PCI_DEVICE_ID_INTEL_IOAT_BWD3:
 282	case PCI_DEVICE_ID_INTEL_IOAT_BDXDE0:
 283	case PCI_DEVICE_ID_INTEL_IOAT_BDXDE1:
 284	case PCI_DEVICE_ID_INTEL_IOAT_BDXDE2:
 285	case PCI_DEVICE_ID_INTEL_IOAT_BDXDE3:
 286		return true;
 287	default:
 288		return false;
 289	}
 290
 291}
 292
 293/*
 294 * Perform a IOAT transaction to verify the HW works.
 295 */
 296#define IOAT_TEST_SIZE 2000
 297
 298static void ioat_dma_test_callback(void *dma_async_param)
 299{
 300	struct completion *cmp = dma_async_param;
 301
 302	complete(cmp);
 303}
 304
 305/**
 306 * ioat_dma_self_test - Perform a IOAT transaction to verify the HW works.
 307 * @ioat_dma: dma device to be tested
 308 */
 309static int ioat_dma_self_test(struct ioatdma_device *ioat_dma)
 310{
 311	int i;
 312	u8 *src;
 313	u8 *dest;
 314	struct dma_device *dma = &ioat_dma->dma_dev;
 315	struct device *dev = &ioat_dma->pdev->dev;
 316	struct dma_chan *dma_chan;
 317	struct dma_async_tx_descriptor *tx;
 318	dma_addr_t dma_dest, dma_src;
 319	dma_cookie_t cookie;
 320	int err = 0;
 321	struct completion cmp;
 322	unsigned long tmo;
 323	unsigned long flags;
 324
 325	src = kzalloc(sizeof(u8) * IOAT_TEST_SIZE, GFP_KERNEL);
 326	if (!src)
 327		return -ENOMEM;
 328	dest = kzalloc(sizeof(u8) * IOAT_TEST_SIZE, GFP_KERNEL);
 329	if (!dest) {
 330		kfree(src);
 331		return -ENOMEM;
 332	}
 333
 334	/* Fill in src buffer */
 335	for (i = 0; i < IOAT_TEST_SIZE; i++)
 336		src[i] = (u8)i;
 337
 338	/* Start copy, using first DMA channel */
 339	dma_chan = container_of(dma->channels.next, struct dma_chan,
 340				device_node);
 341	if (dma->device_alloc_chan_resources(dma_chan) < 1) {
 342		dev_err(dev, "selftest cannot allocate chan resource\n");
 343		err = -ENODEV;
 344		goto out;
 345	}
 346
 347	dma_src = dma_map_single(dev, src, IOAT_TEST_SIZE, DMA_TO_DEVICE);
 348	if (dma_mapping_error(dev, dma_src)) {
 349		dev_err(dev, "mapping src buffer failed\n");
 350		err = -ENOMEM;
 351		goto free_resources;
 352	}
 353	dma_dest = dma_map_single(dev, dest, IOAT_TEST_SIZE, DMA_FROM_DEVICE);
 354	if (dma_mapping_error(dev, dma_dest)) {
 355		dev_err(dev, "mapping dest buffer failed\n");
 356		err = -ENOMEM;
 357		goto unmap_src;
 358	}
 359	flags = DMA_PREP_INTERRUPT;
 360	tx = ioat_dma->dma_dev.device_prep_dma_memcpy(dma_chan, dma_dest,
 361						      dma_src, IOAT_TEST_SIZE,
 362						      flags);
 363	if (!tx) {
 364		dev_err(dev, "Self-test prep failed, disabling\n");
 365		err = -ENODEV;
 366		goto unmap_dma;
 367	}
 368
 369	async_tx_ack(tx);
 370	init_completion(&cmp);
 371	tx->callback = ioat_dma_test_callback;
 372	tx->callback_param = &cmp;
 373	cookie = tx->tx_submit(tx);
 374	if (cookie < 0) {
 375		dev_err(dev, "Self-test setup failed, disabling\n");
 376		err = -ENODEV;
 377		goto unmap_dma;
 378	}
 379	dma->device_issue_pending(dma_chan);
 380
 381	tmo = wait_for_completion_timeout(&cmp, msecs_to_jiffies(3000));
 382
 383	if (tmo == 0 ||
 384	    dma->device_tx_status(dma_chan, cookie, NULL)
 385					!= DMA_COMPLETE) {
 386		dev_err(dev, "Self-test copy timed out, disabling\n");
 387		err = -ENODEV;
 388		goto unmap_dma;
 389	}
 390	if (memcmp(src, dest, IOAT_TEST_SIZE)) {
 391		dev_err(dev, "Self-test copy failed compare, disabling\n");
 392		err = -ENODEV;
 393		goto unmap_dma;
 394	}
 395
 396unmap_dma:
 397	dma_unmap_single(dev, dma_dest, IOAT_TEST_SIZE, DMA_FROM_DEVICE);
 398unmap_src:
 399	dma_unmap_single(dev, dma_src, IOAT_TEST_SIZE, DMA_TO_DEVICE);
 400free_resources:
 401	dma->device_free_chan_resources(dma_chan);
 402out:
 403	kfree(src);
 404	kfree(dest);
 405	return err;
 406}
 407
 408/**
 409 * ioat_dma_setup_interrupts - setup interrupt handler
 410 * @ioat_dma: ioat dma device
 411 */
 412int ioat_dma_setup_interrupts(struct ioatdma_device *ioat_dma)
 413{
 414	struct ioatdma_chan *ioat_chan;
 415	struct pci_dev *pdev = ioat_dma->pdev;
 416	struct device *dev = &pdev->dev;
 417	struct msix_entry *msix;
 418	int i, j, msixcnt;
 419	int err = -EINVAL;
 420	u8 intrctrl = 0;
 421
 422	if (!strcmp(ioat_interrupt_style, "msix"))
 423		goto msix;
 424	if (!strcmp(ioat_interrupt_style, "msi"))
 425		goto msi;
 426	if (!strcmp(ioat_interrupt_style, "intx"))
 427		goto intx;
 428	dev_err(dev, "invalid ioat_interrupt_style %s\n", ioat_interrupt_style);
 429	goto err_no_irq;
 430
 431msix:
 432	/* The number of MSI-X vectors should equal the number of channels */
 433	msixcnt = ioat_dma->dma_dev.chancnt;
 434	for (i = 0; i < msixcnt; i++)
 435		ioat_dma->msix_entries[i].entry = i;
 436
 437	err = pci_enable_msix_exact(pdev, ioat_dma->msix_entries, msixcnt);
 438	if (err)
 439		goto msi;
 440
 441	for (i = 0; i < msixcnt; i++) {
 442		msix = &ioat_dma->msix_entries[i];
 443		ioat_chan = ioat_chan_by_index(ioat_dma, i);
 444		err = devm_request_irq(dev, msix->vector,
 445				       ioat_dma_do_interrupt_msix, 0,
 446				       "ioat-msix", ioat_chan);
 447		if (err) {
 448			for (j = 0; j < i; j++) {
 449				msix = &ioat_dma->msix_entries[j];
 450				ioat_chan = ioat_chan_by_index(ioat_dma, j);
 451				devm_free_irq(dev, msix->vector, ioat_chan);
 452			}
 453			goto msi;
 454		}
 455	}
 456	intrctrl |= IOAT_INTRCTRL_MSIX_VECTOR_CONTROL;
 457	ioat_dma->irq_mode = IOAT_MSIX;
 458	goto done;
 459
 460msi:
 461	err = pci_enable_msi(pdev);
 462	if (err)
 463		goto intx;
 464
 465	err = devm_request_irq(dev, pdev->irq, ioat_dma_do_interrupt, 0,
 466			       "ioat-msi", ioat_dma);
 467	if (err) {
 468		pci_disable_msi(pdev);
 469		goto intx;
 470	}
 471	ioat_dma->irq_mode = IOAT_MSI;
 472	goto done;
 473
 474intx:
 475	err = devm_request_irq(dev, pdev->irq, ioat_dma_do_interrupt,
 476			       IRQF_SHARED, "ioat-intx", ioat_dma);
 477	if (err)
 478		goto err_no_irq;
 479
 480	ioat_dma->irq_mode = IOAT_INTX;
 481done:
 482	if (is_bwd_ioat(pdev))
 483		ioat_intr_quirk(ioat_dma);
 484	intrctrl |= IOAT_INTRCTRL_MASTER_INT_EN;
 485	writeb(intrctrl, ioat_dma->reg_base + IOAT_INTRCTRL_OFFSET);
 486	return 0;
 487
 488err_no_irq:
 489	/* Disable all interrupt generation */
 490	writeb(0, ioat_dma->reg_base + IOAT_INTRCTRL_OFFSET);
 491	ioat_dma->irq_mode = IOAT_NOIRQ;
 492	dev_err(dev, "no usable interrupts\n");
 493	return err;
 494}
 495
 496static void ioat_disable_interrupts(struct ioatdma_device *ioat_dma)
 497{
 498	/* Disable all interrupt generation */
 499	writeb(0, ioat_dma->reg_base + IOAT_INTRCTRL_OFFSET);
 500}
 501
 502static int ioat_probe(struct ioatdma_device *ioat_dma)
 503{
 504	int err = -ENODEV;
 505	struct dma_device *dma = &ioat_dma->dma_dev;
 506	struct pci_dev *pdev = ioat_dma->pdev;
 507	struct device *dev = &pdev->dev;
 508
 509	ioat_dma->completion_pool = dma_pool_create("completion_pool", dev,
 510						    sizeof(u64),
 511						    SMP_CACHE_BYTES,
 512						    SMP_CACHE_BYTES);
 513
 514	if (!ioat_dma->completion_pool) {
 515		err = -ENOMEM;
 516		goto err_out;
 517	}
 518
 519	ioat_enumerate_channels(ioat_dma);
 520
 521	dma_cap_set(DMA_MEMCPY, dma->cap_mask);
 522	dma->dev = &pdev->dev;
 523
 524	if (!dma->chancnt) {
 525		dev_err(dev, "channel enumeration error\n");
 526		goto err_setup_interrupts;
 527	}
 528
 529	err = ioat_dma_setup_interrupts(ioat_dma);
 530	if (err)
 531		goto err_setup_interrupts;
 532
 533	err = ioat3_dma_self_test(ioat_dma);
 534	if (err)
 535		goto err_self_test;
 536
 537	return 0;
 538
 539err_self_test:
 540	ioat_disable_interrupts(ioat_dma);
 541err_setup_interrupts:
 542	dma_pool_destroy(ioat_dma->completion_pool);
 543err_out:
 544	return err;
 545}
 546
 547static int ioat_register(struct ioatdma_device *ioat_dma)
 548{
 549	int err = dma_async_device_register(&ioat_dma->dma_dev);
 550
 551	if (err) {
 552		ioat_disable_interrupts(ioat_dma);
 553		dma_pool_destroy(ioat_dma->completion_pool);
 554	}
 555
 556	return err;
 557}
 558
 559static void ioat_dma_remove(struct ioatdma_device *ioat_dma)
 560{
 561	struct dma_device *dma = &ioat_dma->dma_dev;
 562
 563	ioat_disable_interrupts(ioat_dma);
 564
 565	ioat_kobject_del(ioat_dma);
 566
 567	dma_async_device_unregister(dma);
 568
 569	dma_pool_destroy(ioat_dma->completion_pool);
 570
 571	INIT_LIST_HEAD(&dma->channels);
 572}
 573
 574/**
 575 * ioat_enumerate_channels - find and initialize the device's channels
 576 * @ioat_dma: the ioat dma device to be enumerated
 577 */
 578static int ioat_enumerate_channels(struct ioatdma_device *ioat_dma)
 579{
 580	struct ioatdma_chan *ioat_chan;
 581	struct device *dev = &ioat_dma->pdev->dev;
 582	struct dma_device *dma = &ioat_dma->dma_dev;
 583	u8 xfercap_log;
 
 584	int i;
 585
 586	INIT_LIST_HEAD(&dma->channels);
 587	dma->chancnt = readb(ioat_dma->reg_base + IOAT_CHANCNT_OFFSET);
 588	dma->chancnt &= 0x1f; /* bits [4:0] valid */
 589	if (dma->chancnt > ARRAY_SIZE(ioat_dma->idx)) {
 590		dev_warn(dev, "(%d) exceeds max supported channels (%zu)\n",
 591			 dma->chancnt, ARRAY_SIZE(ioat_dma->idx));
 592		dma->chancnt = ARRAY_SIZE(ioat_dma->idx);
 593	}
 594	xfercap_log = readb(ioat_dma->reg_base + IOAT_XFERCAP_OFFSET);
 595	xfercap_log &= 0x1f; /* bits [4:0] valid */
 596	if (xfercap_log == 0)
 597		return 0;
 598	dev_dbg(dev, "%s: xfercap = %d\n", __func__, 1 << xfercap_log);
 599
 600	for (i = 0; i < dma->chancnt; i++) {
 601		ioat_chan = devm_kzalloc(dev, sizeof(*ioat_chan), GFP_KERNEL);
 602		if (!ioat_chan)
 603			break;
 604
 605		ioat_init_channel(ioat_dma, ioat_chan, i);
 606		ioat_chan->xfercap_log = xfercap_log;
 607		spin_lock_init(&ioat_chan->prep_lock);
 608		if (ioat_reset_hw(ioat_chan)) {
 609			i = 0;
 610			break;
 611		}
 612	}
 613	dma->chancnt = i;
 614	return i;
 615}
 616
 617/**
 618 * ioat_free_chan_resources - release all the descriptors
 619 * @chan: the channel to be cleaned
 620 */
 621static void ioat_free_chan_resources(struct dma_chan *c)
 622{
 623	struct ioatdma_chan *ioat_chan = to_ioat_chan(c);
 624	struct ioatdma_device *ioat_dma = ioat_chan->ioat_dma;
 625	struct ioat_ring_ent *desc;
 626	const int total_descs = 1 << ioat_chan->alloc_order;
 627	int descs;
 628	int i;
 629
 630	/* Before freeing channel resources first check
 631	 * if they have been previously allocated for this channel.
 632	 */
 633	if (!ioat_chan->ring)
 634		return;
 635
 636	ioat_stop(ioat_chan);
 637	ioat_reset_hw(ioat_chan);
 
 
 
 
 
 
 
 
 
 638
 639	spin_lock_bh(&ioat_chan->cleanup_lock);
 640	spin_lock_bh(&ioat_chan->prep_lock);
 641	descs = ioat_ring_space(ioat_chan);
 642	dev_dbg(to_dev(ioat_chan), "freeing %d idle descriptors\n", descs);
 643	for (i = 0; i < descs; i++) {
 644		desc = ioat_get_ring_ent(ioat_chan, ioat_chan->head + i);
 645		ioat_free_ring_ent(desc, c);
 646	}
 647
 648	if (descs < total_descs)
 649		dev_err(to_dev(ioat_chan), "Freeing %d in use descriptors!\n",
 650			total_descs - descs);
 651
 652	for (i = 0; i < total_descs - descs; i++) {
 653		desc = ioat_get_ring_ent(ioat_chan, ioat_chan->tail + i);
 654		dump_desc_dbg(ioat_chan, desc);
 655		ioat_free_ring_ent(desc, c);
 656	}
 657
 658	for (i = 0; i < ioat_chan->desc_chunks; i++) {
 659		dma_free_coherent(to_dev(ioat_chan), SZ_2M,
 660				  ioat_chan->descs[i].virt,
 661				  ioat_chan->descs[i].hw);
 662		ioat_chan->descs[i].virt = NULL;
 663		ioat_chan->descs[i].hw = 0;
 664	}
 665	ioat_chan->desc_chunks = 0;
 666
 667	kfree(ioat_chan->ring);
 668	ioat_chan->ring = NULL;
 669	ioat_chan->alloc_order = 0;
 670	dma_pool_free(ioat_dma->completion_pool, ioat_chan->completion,
 671		      ioat_chan->completion_dma);
 672	spin_unlock_bh(&ioat_chan->prep_lock);
 673	spin_unlock_bh(&ioat_chan->cleanup_lock);
 674
 675	ioat_chan->last_completion = 0;
 676	ioat_chan->completion_dma = 0;
 677	ioat_chan->dmacount = 0;
 678}
 679
 680/* ioat_alloc_chan_resources - allocate/initialize ioat descriptor ring
 681 * @chan: channel to be initialized
 682 */
 683static int ioat_alloc_chan_resources(struct dma_chan *c)
 684{
 685	struct ioatdma_chan *ioat_chan = to_ioat_chan(c);
 686	struct ioat_ring_ent **ring;
 687	u64 status;
 688	int order;
 689	int i = 0;
 690	u32 chanerr;
 691
 692	/* have we already been set up? */
 693	if (ioat_chan->ring)
 694		return 1 << ioat_chan->alloc_order;
 695
 696	/* Setup register to interrupt and write completion status on error */
 697	writew(IOAT_CHANCTRL_RUN, ioat_chan->reg_base + IOAT_CHANCTRL_OFFSET);
 698
 699	/* allocate a completion writeback area */
 700	/* doing 2 32bit writes to mmio since 1 64b write doesn't work */
 701	ioat_chan->completion =
 702		dma_pool_zalloc(ioat_chan->ioat_dma->completion_pool,
 703				GFP_NOWAIT, &ioat_chan->completion_dma);
 704	if (!ioat_chan->completion)
 705		return -ENOMEM;
 706
 707	writel(((u64)ioat_chan->completion_dma) & 0x00000000FFFFFFFF,
 708	       ioat_chan->reg_base + IOAT_CHANCMP_OFFSET_LOW);
 709	writel(((u64)ioat_chan->completion_dma) >> 32,
 710	       ioat_chan->reg_base + IOAT_CHANCMP_OFFSET_HIGH);
 711
 712	order = IOAT_MAX_ORDER;
 713	ring = ioat_alloc_ring(c, order, GFP_NOWAIT);
 714	if (!ring)
 715		return -ENOMEM;
 716
 717	spin_lock_bh(&ioat_chan->cleanup_lock);
 718	spin_lock_bh(&ioat_chan->prep_lock);
 719	ioat_chan->ring = ring;
 720	ioat_chan->head = 0;
 721	ioat_chan->issued = 0;
 722	ioat_chan->tail = 0;
 723	ioat_chan->alloc_order = order;
 724	set_bit(IOAT_RUN, &ioat_chan->state);
 725	spin_unlock_bh(&ioat_chan->prep_lock);
 726	spin_unlock_bh(&ioat_chan->cleanup_lock);
 727
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 728	ioat_start_null_desc(ioat_chan);
 729
 730	/* check that we got off the ground */
 731	do {
 732		udelay(1);
 733		status = ioat_chansts(ioat_chan);
 734	} while (i++ < 20 && !is_ioat_active(status) && !is_ioat_idle(status));
 735
 736	if (is_ioat_active(status) || is_ioat_idle(status))
 737		return 1 << ioat_chan->alloc_order;
 738
 739	chanerr = readl(ioat_chan->reg_base + IOAT_CHANERR_OFFSET);
 740
 741	dev_WARN(to_dev(ioat_chan),
 742		 "failed to start channel chanerr: %#x\n", chanerr);
 743	ioat_free_chan_resources(c);
 744	return -EFAULT;
 745}
 746
 747/* common channel initialization */
 748static void
 749ioat_init_channel(struct ioatdma_device *ioat_dma,
 750		  struct ioatdma_chan *ioat_chan, int idx)
 751{
 752	struct dma_device *dma = &ioat_dma->dma_dev;
 753	struct dma_chan *c = &ioat_chan->dma_chan;
 754	unsigned long data = (unsigned long) c;
 755
 756	ioat_chan->ioat_dma = ioat_dma;
 757	ioat_chan->reg_base = ioat_dma->reg_base + (0x80 * (idx + 1));
 758	spin_lock_init(&ioat_chan->cleanup_lock);
 759	ioat_chan->dma_chan.device = dma;
 760	dma_cookie_init(&ioat_chan->dma_chan);
 761	list_add_tail(&ioat_chan->dma_chan.device_node, &dma->channels);
 762	ioat_dma->idx[idx] = ioat_chan;
 763	timer_setup(&ioat_chan->timer, ioat_timer_event, 0);
 764	tasklet_init(&ioat_chan->cleanup_task, ioat_cleanup_event, data);
 765}
 766
 767#define IOAT_NUM_SRC_TEST 6 /* must be <= 8 */
 768static int ioat_xor_val_self_test(struct ioatdma_device *ioat_dma)
 769{
 770	int i, src_idx;
 771	struct page *dest;
 772	struct page *xor_srcs[IOAT_NUM_SRC_TEST];
 773	struct page *xor_val_srcs[IOAT_NUM_SRC_TEST + 1];
 774	dma_addr_t dma_srcs[IOAT_NUM_SRC_TEST + 1];
 775	dma_addr_t dest_dma;
 776	struct dma_async_tx_descriptor *tx;
 777	struct dma_chan *dma_chan;
 778	dma_cookie_t cookie;
 779	u8 cmp_byte = 0;
 780	u32 cmp_word;
 781	u32 xor_val_result;
 782	int err = 0;
 783	struct completion cmp;
 784	unsigned long tmo;
 785	struct device *dev = &ioat_dma->pdev->dev;
 786	struct dma_device *dma = &ioat_dma->dma_dev;
 787	u8 op = 0;
 788
 789	dev_dbg(dev, "%s\n", __func__);
 790
 791	if (!dma_has_cap(DMA_XOR, dma->cap_mask))
 792		return 0;
 793
 794	for (src_idx = 0; src_idx < IOAT_NUM_SRC_TEST; src_idx++) {
 795		xor_srcs[src_idx] = alloc_page(GFP_KERNEL);
 796		if (!xor_srcs[src_idx]) {
 797			while (src_idx--)
 798				__free_page(xor_srcs[src_idx]);
 799			return -ENOMEM;
 800		}
 801	}
 802
 803	dest = alloc_page(GFP_KERNEL);
 804	if (!dest) {
 805		while (src_idx--)
 806			__free_page(xor_srcs[src_idx]);
 807		return -ENOMEM;
 808	}
 809
 810	/* Fill in src buffers */
 811	for (src_idx = 0; src_idx < IOAT_NUM_SRC_TEST; src_idx++) {
 812		u8 *ptr = page_address(xor_srcs[src_idx]);
 813
 814		for (i = 0; i < PAGE_SIZE; i++)
 815			ptr[i] = (1 << src_idx);
 816	}
 817
 818	for (src_idx = 0; src_idx < IOAT_NUM_SRC_TEST; src_idx++)
 819		cmp_byte ^= (u8) (1 << src_idx);
 820
 821	cmp_word = (cmp_byte << 24) | (cmp_byte << 16) |
 822			(cmp_byte << 8) | cmp_byte;
 823
 824	memset(page_address(dest), 0, PAGE_SIZE);
 825
 826	dma_chan = container_of(dma->channels.next, struct dma_chan,
 827				device_node);
 828	if (dma->device_alloc_chan_resources(dma_chan) < 1) {
 829		err = -ENODEV;
 830		goto out;
 831	}
 832
 833	/* test xor */
 834	op = IOAT_OP_XOR;
 835
 836	dest_dma = dma_map_page(dev, dest, 0, PAGE_SIZE, DMA_FROM_DEVICE);
 837	if (dma_mapping_error(dev, dest_dma)) {
 838		err = -ENOMEM;
 839		goto free_resources;
 840	}
 841
 842	for (i = 0; i < IOAT_NUM_SRC_TEST; i++) {
 843		dma_srcs[i] = dma_map_page(dev, xor_srcs[i], 0, PAGE_SIZE,
 844					   DMA_TO_DEVICE);
 845		if (dma_mapping_error(dev, dma_srcs[i])) {
 846			err = -ENOMEM;
 847			goto dma_unmap;
 848		}
 849	}
 850	tx = dma->device_prep_dma_xor(dma_chan, dest_dma, dma_srcs,
 851				      IOAT_NUM_SRC_TEST, PAGE_SIZE,
 852				      DMA_PREP_INTERRUPT);
 853
 854	if (!tx) {
 855		dev_err(dev, "Self-test xor prep failed\n");
 856		err = -ENODEV;
 857		goto dma_unmap;
 858	}
 859
 860	async_tx_ack(tx);
 861	init_completion(&cmp);
 862	tx->callback = ioat_dma_test_callback;
 863	tx->callback_param = &cmp;
 864	cookie = tx->tx_submit(tx);
 865	if (cookie < 0) {
 866		dev_err(dev, "Self-test xor setup failed\n");
 867		err = -ENODEV;
 868		goto dma_unmap;
 869	}
 870	dma->device_issue_pending(dma_chan);
 871
 872	tmo = wait_for_completion_timeout(&cmp, msecs_to_jiffies(3000));
 873
 874	if (tmo == 0 ||
 875	    dma->device_tx_status(dma_chan, cookie, NULL) != DMA_COMPLETE) {
 876		dev_err(dev, "Self-test xor timed out\n");
 877		err = -ENODEV;
 878		goto dma_unmap;
 879	}
 880
 881	for (i = 0; i < IOAT_NUM_SRC_TEST; i++)
 882		dma_unmap_page(dev, dma_srcs[i], PAGE_SIZE, DMA_TO_DEVICE);
 883
 884	dma_sync_single_for_cpu(dev, dest_dma, PAGE_SIZE, DMA_FROM_DEVICE);
 885	for (i = 0; i < (PAGE_SIZE / sizeof(u32)); i++) {
 886		u32 *ptr = page_address(dest);
 887
 888		if (ptr[i] != cmp_word) {
 889			dev_err(dev, "Self-test xor failed compare\n");
 890			err = -ENODEV;
 891			goto free_resources;
 892		}
 893	}
 894	dma_sync_single_for_device(dev, dest_dma, PAGE_SIZE, DMA_FROM_DEVICE);
 895
 896	dma_unmap_page(dev, dest_dma, PAGE_SIZE, DMA_FROM_DEVICE);
 897
 898	/* skip validate if the capability is not present */
 899	if (!dma_has_cap(DMA_XOR_VAL, dma_chan->device->cap_mask))
 900		goto free_resources;
 901
 902	op = IOAT_OP_XOR_VAL;
 903
 904	/* validate the sources with the destintation page */
 905	for (i = 0; i < IOAT_NUM_SRC_TEST; i++)
 906		xor_val_srcs[i] = xor_srcs[i];
 907	xor_val_srcs[i] = dest;
 908
 909	xor_val_result = 1;
 910
 911	for (i = 0; i < IOAT_NUM_SRC_TEST + 1; i++) {
 912		dma_srcs[i] = dma_map_page(dev, xor_val_srcs[i], 0, PAGE_SIZE,
 913					   DMA_TO_DEVICE);
 914		if (dma_mapping_error(dev, dma_srcs[i])) {
 915			err = -ENOMEM;
 916			goto dma_unmap;
 917		}
 918	}
 919	tx = dma->device_prep_dma_xor_val(dma_chan, dma_srcs,
 920					  IOAT_NUM_SRC_TEST + 1, PAGE_SIZE,
 921					  &xor_val_result, DMA_PREP_INTERRUPT);
 922	if (!tx) {
 923		dev_err(dev, "Self-test zero prep failed\n");
 924		err = -ENODEV;
 925		goto dma_unmap;
 926	}
 927
 928	async_tx_ack(tx);
 929	init_completion(&cmp);
 930	tx->callback = ioat_dma_test_callback;
 931	tx->callback_param = &cmp;
 932	cookie = tx->tx_submit(tx);
 933	if (cookie < 0) {
 934		dev_err(dev, "Self-test zero setup failed\n");
 935		err = -ENODEV;
 936		goto dma_unmap;
 937	}
 938	dma->device_issue_pending(dma_chan);
 939
 940	tmo = wait_for_completion_timeout(&cmp, msecs_to_jiffies(3000));
 941
 942	if (tmo == 0 ||
 943	    dma->device_tx_status(dma_chan, cookie, NULL) != DMA_COMPLETE) {
 944		dev_err(dev, "Self-test validate timed out\n");
 945		err = -ENODEV;
 946		goto dma_unmap;
 947	}
 948
 949	for (i = 0; i < IOAT_NUM_SRC_TEST + 1; i++)
 950		dma_unmap_page(dev, dma_srcs[i], PAGE_SIZE, DMA_TO_DEVICE);
 951
 952	if (xor_val_result != 0) {
 953		dev_err(dev, "Self-test validate failed compare\n");
 954		err = -ENODEV;
 955		goto free_resources;
 956	}
 957
 958	memset(page_address(dest), 0, PAGE_SIZE);
 959
 960	/* test for non-zero parity sum */
 961	op = IOAT_OP_XOR_VAL;
 962
 963	xor_val_result = 0;
 964	for (i = 0; i < IOAT_NUM_SRC_TEST + 1; i++) {
 965		dma_srcs[i] = dma_map_page(dev, xor_val_srcs[i], 0, PAGE_SIZE,
 966					   DMA_TO_DEVICE);
 967		if (dma_mapping_error(dev, dma_srcs[i])) {
 968			err = -ENOMEM;
 969			goto dma_unmap;
 970		}
 971	}
 972	tx = dma->device_prep_dma_xor_val(dma_chan, dma_srcs,
 973					  IOAT_NUM_SRC_TEST + 1, PAGE_SIZE,
 974					  &xor_val_result, DMA_PREP_INTERRUPT);
 975	if (!tx) {
 976		dev_err(dev, "Self-test 2nd zero prep failed\n");
 977		err = -ENODEV;
 978		goto dma_unmap;
 979	}
 980
 981	async_tx_ack(tx);
 982	init_completion(&cmp);
 983	tx->callback = ioat_dma_test_callback;
 984	tx->callback_param = &cmp;
 985	cookie = tx->tx_submit(tx);
 986	if (cookie < 0) {
 987		dev_err(dev, "Self-test  2nd zero setup failed\n");
 988		err = -ENODEV;
 989		goto dma_unmap;
 990	}
 991	dma->device_issue_pending(dma_chan);
 992
 993	tmo = wait_for_completion_timeout(&cmp, msecs_to_jiffies(3000));
 994
 995	if (tmo == 0 ||
 996	    dma->device_tx_status(dma_chan, cookie, NULL) != DMA_COMPLETE) {
 997		dev_err(dev, "Self-test 2nd validate timed out\n");
 998		err = -ENODEV;
 999		goto dma_unmap;
1000	}
1001
1002	if (xor_val_result != SUM_CHECK_P_RESULT) {
1003		dev_err(dev, "Self-test validate failed compare\n");
1004		err = -ENODEV;
1005		goto dma_unmap;
1006	}
1007
1008	for (i = 0; i < IOAT_NUM_SRC_TEST + 1; i++)
1009		dma_unmap_page(dev, dma_srcs[i], PAGE_SIZE, DMA_TO_DEVICE);
1010
1011	goto free_resources;
1012dma_unmap:
1013	if (op == IOAT_OP_XOR) {
1014		while (--i >= 0)
1015			dma_unmap_page(dev, dma_srcs[i], PAGE_SIZE,
1016				       DMA_TO_DEVICE);
1017		dma_unmap_page(dev, dest_dma, PAGE_SIZE, DMA_FROM_DEVICE);
1018	} else if (op == IOAT_OP_XOR_VAL) {
1019		while (--i >= 0)
1020			dma_unmap_page(dev, dma_srcs[i], PAGE_SIZE,
1021				       DMA_TO_DEVICE);
1022	}
1023free_resources:
1024	dma->device_free_chan_resources(dma_chan);
1025out:
1026	src_idx = IOAT_NUM_SRC_TEST;
1027	while (src_idx--)
1028		__free_page(xor_srcs[src_idx]);
1029	__free_page(dest);
1030	return err;
1031}
1032
/*
 * ioat3_dma_self_test - run the generic self test, then the xor tests
 * @ioat_dma: device under test
 *
 * Returns the first non-zero result, or 0 when both tests pass.
 */
static int ioat3_dma_self_test(struct ioatdma_device *ioat_dma)
{
	int rc = ioat_dma_self_test(ioat_dma);

	/* the xor test only runs once the generic test has passed */
	return rc ? rc : ioat_xor_val_self_test(ioat_dma);
}
1045
1046static void ioat_intr_quirk(struct ioatdma_device *ioat_dma)
1047{
1048	struct dma_device *dma;
1049	struct dma_chan *c;
1050	struct ioatdma_chan *ioat_chan;
1051	u32 errmask;
1052
1053	dma = &ioat_dma->dma_dev;
1054
1055	/*
1056	 * if we have descriptor write back error status, we mask the
1057	 * error interrupts
1058	 */
1059	if (ioat_dma->cap & IOAT_CAP_DWBES) {
1060		list_for_each_entry(c, &dma->channels, device_node) {
1061			ioat_chan = to_ioat_chan(c);
1062			errmask = readl(ioat_chan->reg_base +
1063					IOAT_CHANERR_MASK_OFFSET);
1064			errmask |= IOAT_CHANERR_XOR_P_OR_CRC_ERR |
1065				   IOAT_CHANERR_XOR_Q_ERR;
1066			writel(errmask, ioat_chan->reg_base +
1067					IOAT_CHANERR_MASK_OFFSET);
1068		}
1069	}
1070}
1071
1072static int ioat3_dma_probe(struct ioatdma_device *ioat_dma, int dca)
1073{
1074	struct pci_dev *pdev = ioat_dma->pdev;
1075	int dca_en = system_has_dca_enabled(pdev);
1076	struct dma_device *dma;
1077	struct dma_chan *c;
1078	struct ioatdma_chan *ioat_chan;
1079	int err;
1080	u16 val16;
1081
1082	dma = &ioat_dma->dma_dev;
1083	dma->device_prep_dma_memcpy = ioat_dma_prep_memcpy_lock;
1084	dma->device_issue_pending = ioat_issue_pending;
1085	dma->device_alloc_chan_resources = ioat_alloc_chan_resources;
1086	dma->device_free_chan_resources = ioat_free_chan_resources;
1087
1088	dma_cap_set(DMA_INTERRUPT, dma->cap_mask);
1089	dma->device_prep_dma_interrupt = ioat_prep_interrupt_lock;
1090
1091	ioat_dma->cap = readl(ioat_dma->reg_base + IOAT_DMA_CAP_OFFSET);
1092
1093	if (is_xeon_cb32(pdev) || is_bwd_noraid(pdev))
1094		ioat_dma->cap &=
1095			~(IOAT_CAP_XOR | IOAT_CAP_PQ | IOAT_CAP_RAID16SS);
1096
1097	/* dca is incompatible with raid operations */
1098	if (dca_en && (ioat_dma->cap & (IOAT_CAP_XOR|IOAT_CAP_PQ)))
1099		ioat_dma->cap &= ~(IOAT_CAP_XOR|IOAT_CAP_PQ);
1100
1101	if (ioat_dma->cap & IOAT_CAP_XOR) {
1102		dma->max_xor = 8;
1103
1104		dma_cap_set(DMA_XOR, dma->cap_mask);
1105		dma->device_prep_dma_xor = ioat_prep_xor;
1106
1107		dma_cap_set(DMA_XOR_VAL, dma->cap_mask);
1108		dma->device_prep_dma_xor_val = ioat_prep_xor_val;
1109	}
1110
1111	if (ioat_dma->cap & IOAT_CAP_PQ) {
1112
1113		dma->device_prep_dma_pq = ioat_prep_pq;
1114		dma->device_prep_dma_pq_val = ioat_prep_pq_val;
1115		dma_cap_set(DMA_PQ, dma->cap_mask);
1116		dma_cap_set(DMA_PQ_VAL, dma->cap_mask);
1117
1118		if (ioat_dma->cap & IOAT_CAP_RAID16SS)
1119			dma_set_maxpq(dma, 16, 0);
1120		else
1121			dma_set_maxpq(dma, 8, 0);
1122
1123		if (!(ioat_dma->cap & IOAT_CAP_XOR)) {
1124			dma->device_prep_dma_xor = ioat_prep_pqxor;
1125			dma->device_prep_dma_xor_val = ioat_prep_pqxor_val;
1126			dma_cap_set(DMA_XOR, dma->cap_mask);
1127			dma_cap_set(DMA_XOR_VAL, dma->cap_mask);
1128
1129			if (ioat_dma->cap & IOAT_CAP_RAID16SS)
1130				dma->max_xor = 16;
1131			else
1132				dma->max_xor = 8;
1133		}
1134	}
1135
1136	dma->device_tx_status = ioat_tx_status;
1137
1138	/* starting with CB3.3 super extended descriptors are supported */
1139	if (ioat_dma->cap & IOAT_CAP_RAID16SS) {
1140		char pool_name[14];
1141		int i;
1142
1143		for (i = 0; i < MAX_SED_POOLS; i++) {
1144			snprintf(pool_name, 14, "ioat_hw%d_sed", i);
1145
1146			/* allocate SED DMA pool */
1147			ioat_dma->sed_hw_pool[i] = dmam_pool_create(pool_name,
1148					&pdev->dev,
1149					SED_SIZE * (i + 1), 64, 0);
1150			if (!ioat_dma->sed_hw_pool[i])
1151				return -ENOMEM;
1152
1153		}
1154	}
1155
1156	if (!(ioat_dma->cap & (IOAT_CAP_XOR | IOAT_CAP_PQ)))
1157		dma_cap_set(DMA_PRIVATE, dma->cap_mask);
1158
1159	err = ioat_probe(ioat_dma);
1160	if (err)
1161		return err;
1162
1163	list_for_each_entry(c, &dma->channels, device_node) {
1164		ioat_chan = to_ioat_chan(c);
1165		writel(IOAT_DMA_DCA_ANY_CPU,
1166		       ioat_chan->reg_base + IOAT_DCACTRL_OFFSET);
1167	}
1168
1169	err = ioat_register(ioat_dma);
1170	if (err)
1171		return err;
1172
1173	ioat_kobject_add(ioat_dma, &ioat_ktype);
1174
1175	if (dca)
1176		ioat_dma->dca = ioat_dca_init(pdev, ioat_dma->reg_base);
1177
1178	/* disable relaxed ordering */
1179	err = pcie_capability_read_word(pdev, IOAT_DEVCTRL_OFFSET, &val16);
1180	if (err)
1181		return err;
1182
1183	/* clear relaxed ordering enable */
1184	val16 &= ~IOAT_DEVCTRL_ROE;
1185	err = pcie_capability_write_word(pdev, IOAT_DEVCTRL_OFFSET, val16);
1186	if (err)
1187		return err;
 
 
 
 
1188
1189	return 0;
1190}
1191
1192static void ioat_shutdown(struct pci_dev *pdev)
1193{
1194	struct ioatdma_device *ioat_dma = pci_get_drvdata(pdev);
1195	struct ioatdma_chan *ioat_chan;
1196	int i;
1197
1198	if (!ioat_dma)
1199		return;
1200
1201	for (i = 0; i < IOAT_MAX_CHANS; i++) {
1202		ioat_chan = ioat_dma->idx[i];
1203		if (!ioat_chan)
1204			continue;
1205
1206		spin_lock_bh(&ioat_chan->prep_lock);
1207		set_bit(IOAT_CHAN_DOWN, &ioat_chan->state);
 
 
 
 
 
 
 
1208		del_timer_sync(&ioat_chan->timer);
1209		spin_unlock_bh(&ioat_chan->prep_lock);
1210		/* this should quiesce then reset */
1211		ioat_reset_hw(ioat_chan);
1212	}
1213
1214	ioat_disable_interrupts(ioat_dma);
1215}
1216
1217static void ioat_resume(struct ioatdma_device *ioat_dma)
1218{
1219	struct ioatdma_chan *ioat_chan;
1220	u32 chanerr;
1221	int i;
1222
1223	for (i = 0; i < IOAT_MAX_CHANS; i++) {
1224		ioat_chan = ioat_dma->idx[i];
1225		if (!ioat_chan)
1226			continue;
1227
1228		spin_lock_bh(&ioat_chan->prep_lock);
1229		clear_bit(IOAT_CHAN_DOWN, &ioat_chan->state);
1230		spin_unlock_bh(&ioat_chan->prep_lock);
1231
1232		chanerr = readl(ioat_chan->reg_base + IOAT_CHANERR_OFFSET);
1233		writel(chanerr, ioat_chan->reg_base + IOAT_CHANERR_OFFSET);
1234
1235		/* no need to reset as shutdown already did that */
1236	}
1237}
1238
1239#define DRV_NAME "ioatdma"
1240
1241static pci_ers_result_t ioat_pcie_error_detected(struct pci_dev *pdev,
1242						 enum pci_channel_state error)
1243{
1244	dev_dbg(&pdev->dev, "%s: PCIe AER error %d\n", DRV_NAME, error);
1245
1246	/* quiesce and block I/O */
1247	ioat_shutdown(pdev);
1248
1249	return PCI_ERS_RESULT_NEED_RESET;
1250}
1251
1252static pci_ers_result_t ioat_pcie_error_slot_reset(struct pci_dev *pdev)
1253{
1254	pci_ers_result_t result = PCI_ERS_RESULT_RECOVERED;
1255	int err;
1256
1257	dev_dbg(&pdev->dev, "%s post reset handling\n", DRV_NAME);
1258
1259	if (pci_enable_device_mem(pdev) < 0) {
1260		dev_err(&pdev->dev,
1261			"Failed to enable PCIe device after reset.\n");
1262		result = PCI_ERS_RESULT_DISCONNECT;
1263	} else {
1264		pci_set_master(pdev);
1265		pci_restore_state(pdev);
1266		pci_save_state(pdev);
1267		pci_wake_from_d3(pdev, false);
1268	}
1269
1270	err = pci_cleanup_aer_uncorrect_error_status(pdev);
1271	if (err) {
1272		dev_err(&pdev->dev,
1273			"AER uncorrect error status clear failed: %#x\n", err);
1274	}
1275
1276	return result;
1277}
1278
1279static void ioat_pcie_error_resume(struct pci_dev *pdev)
1280{
1281	struct ioatdma_device *ioat_dma = pci_get_drvdata(pdev);
1282
1283	dev_dbg(&pdev->dev, "%s: AER handling resuming\n", DRV_NAME);
1284
1285	/* initialize and bring everything back */
1286	ioat_resume(ioat_dma);
1287}
1288
1289static const struct pci_error_handlers ioat_err_handler = {
1290	.error_detected = ioat_pcie_error_detected,
1291	.slot_reset = ioat_pcie_error_slot_reset,
1292	.resume = ioat_pcie_error_resume,
1293};
1294
1295static struct pci_driver ioat_pci_driver = {
1296	.name		= DRV_NAME,
1297	.id_table	= ioat_pci_tbl,
1298	.probe		= ioat_pci_probe,
1299	.remove		= ioat_remove,
1300	.shutdown	= ioat_shutdown,
1301	.err_handler	= &ioat_err_handler,
1302};
1303
 
 
 
 
 
 
 
 
 
 
 
 
1304static struct ioatdma_device *
1305alloc_ioatdma(struct pci_dev *pdev, void __iomem *iobase)
1306{
1307	struct device *dev = &pdev->dev;
1308	struct ioatdma_device *d = devm_kzalloc(dev, sizeof(*d), GFP_KERNEL);
1309
1310	if (!d)
1311		return NULL;
1312	d->pdev = pdev;
1313	d->reg_base = iobase;
 
1314	return d;
1315}
1316
1317static int ioat_pci_probe(struct pci_dev *pdev, const struct pci_device_id *id)
1318{
1319	void __iomem * const *iomap;
1320	struct device *dev = &pdev->dev;
1321	struct ioatdma_device *device;
1322	int err;
1323
1324	err = pcim_enable_device(pdev);
1325	if (err)
1326		return err;
1327
1328	err = pcim_iomap_regions(pdev, 1 << IOAT_MMIO_BAR, DRV_NAME);
1329	if (err)
1330		return err;
1331	iomap = pcim_iomap_table(pdev);
1332	if (!iomap)
1333		return -ENOMEM;
1334
1335	err = pci_set_dma_mask(pdev, DMA_BIT_MASK(64));
1336	if (err)
1337		err = pci_set_dma_mask(pdev, DMA_BIT_MASK(32));
1338	if (err)
1339		return err;
1340
1341	err = pci_set_consistent_dma_mask(pdev, DMA_BIT_MASK(64));
1342	if (err)
1343		err = pci_set_consistent_dma_mask(pdev, DMA_BIT_MASK(32));
1344	if (err)
1345		return err;
1346
1347	device = alloc_ioatdma(pdev, iomap[IOAT_MMIO_BAR]);
1348	if (!device)
1349		return -ENOMEM;
1350	pci_set_master(pdev);
1351	pci_set_drvdata(pdev, device);
1352
1353	device->version = readb(device->reg_base + IOAT_VER_OFFSET);
 
 
1354	if (device->version >= IOAT_VER_3_0) {
1355		if (is_skx_ioat(pdev))
1356			device->version = IOAT_VER_3_2;
1357		err = ioat3_dma_probe(device, ioat_dca_enabled);
1358
1359		if (device->version >= IOAT_VER_3_3)
1360			pci_enable_pcie_error_reporting(pdev);
1361	} else
1362		return -ENODEV;
1363
1364	if (err) {
1365		dev_err(dev, "Intel(R) I/OAT DMA Engine init failed\n");
1366		pci_disable_pcie_error_reporting(pdev);
1367		return -ENODEV;
1368	}
1369
1370	return 0;
1371}
1372
1373static void ioat_remove(struct pci_dev *pdev)
1374{
1375	struct ioatdma_device *device = pci_get_drvdata(pdev);
1376
1377	if (!device)
1378		return;
1379
 
 
1380	dev_err(&pdev->dev, "Removing dma and dca services\n");
1381	if (device->dca) {
1382		unregister_dca_provider(device->dca, &pdev->dev);
1383		free_dca_provider(device->dca);
1384		device->dca = NULL;
1385	}
1386
1387	pci_disable_pcie_error_reporting(pdev);
1388	ioat_dma_remove(device);
1389}
1390
1391static int __init ioat_init_module(void)
1392{
1393	int err = -ENOMEM;
1394
1395	pr_info("%s: Intel(R) QuickData Technology Driver %s\n",
1396		DRV_NAME, IOAT_DMA_VERSION);
1397
1398	ioat_cache = kmem_cache_create("ioat", sizeof(struct ioat_ring_ent),
1399					0, SLAB_HWCACHE_ALIGN, NULL);
1400	if (!ioat_cache)
1401		return -ENOMEM;
1402
1403	ioat_sed_cache = KMEM_CACHE(ioat_sed_ent, 0);
1404	if (!ioat_sed_cache)
1405		goto err_ioat_cache;
1406
1407	err = pci_register_driver(&ioat_pci_driver);
1408	if (err)
1409		goto err_ioat3_cache;
1410
1411	return 0;
1412
1413 err_ioat3_cache:
1414	kmem_cache_destroy(ioat_sed_cache);
1415
1416 err_ioat_cache:
1417	kmem_cache_destroy(ioat_cache);
1418
1419	return err;
1420}
1421module_init(ioat_init_module);
1422
1423static void __exit ioat_exit_module(void)
1424{
1425	pci_unregister_driver(&ioat_pci_driver);
1426	kmem_cache_destroy(ioat_cache);
1427}
1428module_exit(ioat_exit_module);