Linux Audio

Check our new training course

Loading...
Note: File does not exist in v6.13.7.
   1/*******************************************************************************
   2
   3  Intel PRO/10GbE Linux driver
   4  Copyright(c) 1999 - 2008 Intel Corporation.
   5
   6  This program is free software; you can redistribute it and/or modify it
   7  under the terms and conditions of the GNU General Public License,
   8  version 2, as published by the Free Software Foundation.
   9
  10  This program is distributed in the hope it will be useful, but WITHOUT
  11  ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  12  FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
  13  more details.
  14
  15  You should have received a copy of the GNU General Public License along with
  16  this program; if not, write to the Free Software Foundation, Inc.,
  17  51 Franklin St - Fifth Floor, Boston, MA 02110-1301 USA.
  18
  19  The full GNU General Public License is included in this distribution in
  20  the file called "COPYING".
  21
  22  Contact Information:
  23  Linux NICS <linux.nics@intel.com>
  24  e1000-devel Mailing List <e1000-devel@lists.sourceforge.net>
  25  Intel Corporation, 5200 N.E. Elam Young Parkway, Hillsboro, OR 97124-6497
  26
  27*******************************************************************************/
  28
  29#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
  30
  31#include <linux/prefetch.h>
  32#include "ixgb.h"
  33
  34char ixgb_driver_name[] = "ixgb";
  35static char ixgb_driver_string[] = "Intel(R) PRO/10GbE Network Driver";
  36
  37#define DRIVERNAPI "-NAPI"
  38#define DRV_VERSION "1.0.135-k2" DRIVERNAPI
  39const char ixgb_driver_version[] = DRV_VERSION;
  40static const char ixgb_copyright[] = "Copyright (c) 1999-2008 Intel Corporation.";
  41
  42#define IXGB_CB_LENGTH 256
  43static unsigned int copybreak __read_mostly = IXGB_CB_LENGTH;
  44module_param(copybreak, uint, 0644);
  45MODULE_PARM_DESC(copybreak,
  46	"Maximum size of packet that is copied to a new buffer on receive");
  47
  48/* ixgb_pci_tbl - PCI Device ID Table
  49 *
  50 * Wildcard entries (PCI_ANY_ID) should come last
  51 * Last entry must be all 0s
  52 *
  53 * { Vendor ID, Device ID, SubVendor ID, SubDevice ID,
  54 *   Class, Class Mask, private data (not used) }
  55 */
  56static const struct pci_device_id ixgb_pci_tbl[] = {
  57	{PCI_VENDOR_ID_INTEL, IXGB_DEVICE_ID_82597EX,
  58	 PCI_ANY_ID, PCI_ANY_ID, 0, 0, 0},
  59	{PCI_VENDOR_ID_INTEL, IXGB_DEVICE_ID_82597EX_CX4,
  60	 PCI_ANY_ID, PCI_ANY_ID, 0, 0, 0},
  61	{PCI_VENDOR_ID_INTEL, IXGB_DEVICE_ID_82597EX_SR,
  62	 PCI_ANY_ID, PCI_ANY_ID, 0, 0, 0},
  63	{PCI_VENDOR_ID_INTEL, IXGB_DEVICE_ID_82597EX_LR,
  64	 PCI_ANY_ID, PCI_ANY_ID, 0, 0, 0},
  65
  66	/* required last entry */
  67	{0,}
  68};
  69
  70MODULE_DEVICE_TABLE(pci, ixgb_pci_tbl);
  71
  72/* Local Function Prototypes */
  73static int ixgb_init_module(void);
  74static void ixgb_exit_module(void);
  75static int ixgb_probe(struct pci_dev *pdev, const struct pci_device_id *ent);
  76static void ixgb_remove(struct pci_dev *pdev);
  77static int ixgb_sw_init(struct ixgb_adapter *adapter);
  78static int ixgb_open(struct net_device *netdev);
  79static int ixgb_close(struct net_device *netdev);
  80static void ixgb_configure_tx(struct ixgb_adapter *adapter);
  81static void ixgb_configure_rx(struct ixgb_adapter *adapter);
  82static void ixgb_setup_rctl(struct ixgb_adapter *adapter);
  83static void ixgb_clean_tx_ring(struct ixgb_adapter *adapter);
  84static void ixgb_clean_rx_ring(struct ixgb_adapter *adapter);
  85static void ixgb_set_multi(struct net_device *netdev);
  86static void ixgb_watchdog(struct timer_list *t);
  87static netdev_tx_t ixgb_xmit_frame(struct sk_buff *skb,
  88				   struct net_device *netdev);
  89static int ixgb_change_mtu(struct net_device *netdev, int new_mtu);
  90static int ixgb_set_mac(struct net_device *netdev, void *p);
  91static irqreturn_t ixgb_intr(int irq, void *data);
  92static bool ixgb_clean_tx_irq(struct ixgb_adapter *adapter);
  93
  94static int ixgb_clean(struct napi_struct *, int);
  95static bool ixgb_clean_rx_irq(struct ixgb_adapter *, int *, int);
  96static void ixgb_alloc_rx_buffers(struct ixgb_adapter *, int);
  97
  98static void ixgb_tx_timeout(struct net_device *dev);
  99static void ixgb_tx_timeout_task(struct work_struct *work);
 100
 101static void ixgb_vlan_strip_enable(struct ixgb_adapter *adapter);
 102static void ixgb_vlan_strip_disable(struct ixgb_adapter *adapter);
 103static int ixgb_vlan_rx_add_vid(struct net_device *netdev,
 104				__be16 proto, u16 vid);
 105static int ixgb_vlan_rx_kill_vid(struct net_device *netdev,
 106				 __be16 proto, u16 vid);
 107static void ixgb_restore_vlan(struct ixgb_adapter *adapter);
 108
 109#ifdef CONFIG_NET_POLL_CONTROLLER
 110/* for netdump / net console */
 111static void ixgb_netpoll(struct net_device *dev);
 112#endif
 113
 114static pci_ers_result_t ixgb_io_error_detected (struct pci_dev *pdev,
 115                             enum pci_channel_state state);
 116static pci_ers_result_t ixgb_io_slot_reset (struct pci_dev *pdev);
 117static void ixgb_io_resume (struct pci_dev *pdev);
 118
 119static const struct pci_error_handlers ixgb_err_handler = {
 120	.error_detected = ixgb_io_error_detected,
 121	.slot_reset = ixgb_io_slot_reset,
 122	.resume = ixgb_io_resume,
 123};
 124
 125static struct pci_driver ixgb_driver = {
 126	.name     = ixgb_driver_name,
 127	.id_table = ixgb_pci_tbl,
 128	.probe    = ixgb_probe,
 129	.remove   = ixgb_remove,
 130	.err_handler = &ixgb_err_handler
 131};
 132
 133MODULE_AUTHOR("Intel Corporation, <linux.nics@intel.com>");
 134MODULE_DESCRIPTION("Intel(R) PRO/10GbE Network Driver");
 135MODULE_LICENSE("GPL");
 136MODULE_VERSION(DRV_VERSION);
 137
 138#define DEFAULT_MSG_ENABLE (NETIF_MSG_DRV|NETIF_MSG_PROBE|NETIF_MSG_LINK)
 139static int debug = -1;
 140module_param(debug, int, 0);
 141MODULE_PARM_DESC(debug, "Debug level (0=none,...,16=all)");
 142
 143/**
 144 * ixgb_init_module - Driver Registration Routine
 145 *
 146 * ixgb_init_module is the first routine called when the driver is
 147 * loaded. All it does is register with the PCI subsystem.
 148 **/
 149
 150static int __init
 151ixgb_init_module(void)
 152{
 153	pr_info("%s - version %s\n", ixgb_driver_string, ixgb_driver_version);
 154	pr_info("%s\n", ixgb_copyright);
 155
 156	return pci_register_driver(&ixgb_driver);
 157}
 158
 159module_init(ixgb_init_module);
 160
 161/**
 162 * ixgb_exit_module - Driver Exit Cleanup Routine
 163 *
 164 * ixgb_exit_module is called just before the driver is removed
 165 * from memory.
 166 **/
 167
 168static void __exit
 169ixgb_exit_module(void)
 170{
 171	pci_unregister_driver(&ixgb_driver);
 172}
 173
 174module_exit(ixgb_exit_module);
 175
 176/**
 177 * ixgb_irq_disable - Mask off interrupt generation on the NIC
 178 * @adapter: board private structure
 179 **/
 180
 181static void
 182ixgb_irq_disable(struct ixgb_adapter *adapter)
 183{
 184	IXGB_WRITE_REG(&adapter->hw, IMC, ~0);
 185	IXGB_WRITE_FLUSH(&adapter->hw);
 186	synchronize_irq(adapter->pdev->irq);
 187}
 188
 189/**
 190 * ixgb_irq_enable - Enable default interrupt generation settings
 191 * @adapter: board private structure
 192 **/
 193
 194static void
 195ixgb_irq_enable(struct ixgb_adapter *adapter)
 196{
 197	u32 val = IXGB_INT_RXT0 | IXGB_INT_RXDMT0 |
 198		  IXGB_INT_TXDW | IXGB_INT_LSC;
 199	if (adapter->hw.subsystem_vendor_id == PCI_VENDOR_ID_SUN)
 200		val |= IXGB_INT_GPI0;
 201	IXGB_WRITE_REG(&adapter->hw, IMS, val);
 202	IXGB_WRITE_FLUSH(&adapter->hw);
 203}
 204
 205int
 206ixgb_up(struct ixgb_adapter *adapter)
 207{
 208	struct net_device *netdev = adapter->netdev;
 209	int err, irq_flags = IRQF_SHARED;
 210	int max_frame = netdev->mtu + ENET_HEADER_SIZE + ENET_FCS_LENGTH;
 211	struct ixgb_hw *hw = &adapter->hw;
 212
 213	/* hardware has been reset, we need to reload some things */
 214
 215	ixgb_rar_set(hw, netdev->dev_addr, 0);
 216	ixgb_set_multi(netdev);
 217
 218	ixgb_restore_vlan(adapter);
 219
 220	ixgb_configure_tx(adapter);
 221	ixgb_setup_rctl(adapter);
 222	ixgb_configure_rx(adapter);
 223	ixgb_alloc_rx_buffers(adapter, IXGB_DESC_UNUSED(&adapter->rx_ring));
 224
 225	/* disable interrupts and get the hardware into a known state */
 226	IXGB_WRITE_REG(&adapter->hw, IMC, 0xffffffff);
 227
 228	/* only enable MSI if bus is in PCI-X mode */
 229	if (IXGB_READ_REG(&adapter->hw, STATUS) & IXGB_STATUS_PCIX_MODE) {
 230		err = pci_enable_msi(adapter->pdev);
 231		if (!err) {
 232			adapter->have_msi = true;
 233			irq_flags = 0;
 234		}
 235		/* proceed to try to request regular interrupt */
 236	}
 237
 238	err = request_irq(adapter->pdev->irq, ixgb_intr, irq_flags,
 239	                  netdev->name, netdev);
 240	if (err) {
 241		if (adapter->have_msi)
 242			pci_disable_msi(adapter->pdev);
 243		netif_err(adapter, probe, adapter->netdev,
 244			  "Unable to allocate interrupt Error: %d\n", err);
 245		return err;
 246	}
 247
 248	if ((hw->max_frame_size != max_frame) ||
 249		(hw->max_frame_size !=
 250		(IXGB_READ_REG(hw, MFS) >> IXGB_MFS_SHIFT))) {
 251
 252		hw->max_frame_size = max_frame;
 253
 254		IXGB_WRITE_REG(hw, MFS, hw->max_frame_size << IXGB_MFS_SHIFT);
 255
 256		if (hw->max_frame_size >
 257		   IXGB_MAX_ENET_FRAME_SIZE_WITHOUT_FCS + ENET_FCS_LENGTH) {
 258			u32 ctrl0 = IXGB_READ_REG(hw, CTRL0);
 259
 260			if (!(ctrl0 & IXGB_CTRL0_JFE)) {
 261				ctrl0 |= IXGB_CTRL0_JFE;
 262				IXGB_WRITE_REG(hw, CTRL0, ctrl0);
 263			}
 264		}
 265	}
 266
 267	clear_bit(__IXGB_DOWN, &adapter->flags);
 268
 269	napi_enable(&adapter->napi);
 270	ixgb_irq_enable(adapter);
 271
 272	netif_wake_queue(netdev);
 273
 274	mod_timer(&adapter->watchdog_timer, jiffies);
 275
 276	return 0;
 277}
 278
 279void
 280ixgb_down(struct ixgb_adapter *adapter, bool kill_watchdog)
 281{
 282	struct net_device *netdev = adapter->netdev;
 283
 284	/* prevent the interrupt handler from restarting watchdog */
 285	set_bit(__IXGB_DOWN, &adapter->flags);
 286
 287	netif_carrier_off(netdev);
 288
 289	napi_disable(&adapter->napi);
 290	/* waiting for NAPI to complete can re-enable interrupts */
 291	ixgb_irq_disable(adapter);
 292	free_irq(adapter->pdev->irq, netdev);
 293
 294	if (adapter->have_msi)
 295		pci_disable_msi(adapter->pdev);
 296
 297	if (kill_watchdog)
 298		del_timer_sync(&adapter->watchdog_timer);
 299
 300	adapter->link_speed = 0;
 301	adapter->link_duplex = 0;
 302	netif_stop_queue(netdev);
 303
 304	ixgb_reset(adapter);
 305	ixgb_clean_tx_ring(adapter);
 306	ixgb_clean_rx_ring(adapter);
 307}
 308
 309void
 310ixgb_reset(struct ixgb_adapter *adapter)
 311{
 312	struct ixgb_hw *hw = &adapter->hw;
 313
 314	ixgb_adapter_stop(hw);
 315	if (!ixgb_init_hw(hw))
 316		netif_err(adapter, probe, adapter->netdev, "ixgb_init_hw failed\n");
 317
 318	/* restore frame size information */
 319	IXGB_WRITE_REG(hw, MFS, hw->max_frame_size << IXGB_MFS_SHIFT);
 320	if (hw->max_frame_size >
 321	    IXGB_MAX_ENET_FRAME_SIZE_WITHOUT_FCS + ENET_FCS_LENGTH) {
 322		u32 ctrl0 = IXGB_READ_REG(hw, CTRL0);
 323		if (!(ctrl0 & IXGB_CTRL0_JFE)) {
 324			ctrl0 |= IXGB_CTRL0_JFE;
 325			IXGB_WRITE_REG(hw, CTRL0, ctrl0);
 326		}
 327	}
 328}
 329
 330static netdev_features_t
 331ixgb_fix_features(struct net_device *netdev, netdev_features_t features)
 332{
 333	/*
 334	 * Tx VLAN insertion does not work per HW design when Rx stripping is
 335	 * disabled.
 336	 */
 337	if (!(features & NETIF_F_HW_VLAN_CTAG_RX))
 338		features &= ~NETIF_F_HW_VLAN_CTAG_TX;
 339
 340	return features;
 341}
 342
 343static int
 344ixgb_set_features(struct net_device *netdev, netdev_features_t features)
 345{
 346	struct ixgb_adapter *adapter = netdev_priv(netdev);
 347	netdev_features_t changed = features ^ netdev->features;
 348
 349	if (!(changed & (NETIF_F_RXCSUM|NETIF_F_HW_VLAN_CTAG_RX)))
 350		return 0;
 351
 352	adapter->rx_csum = !!(features & NETIF_F_RXCSUM);
 353
 354	if (netif_running(netdev)) {
 355		ixgb_down(adapter, true);
 356		ixgb_up(adapter);
 357		ixgb_set_speed_duplex(netdev);
 358	} else
 359		ixgb_reset(adapter);
 360
 361	return 0;
 362}
 363
 364
 365static const struct net_device_ops ixgb_netdev_ops = {
 366	.ndo_open 		= ixgb_open,
 367	.ndo_stop		= ixgb_close,
 368	.ndo_start_xmit		= ixgb_xmit_frame,
 369	.ndo_set_rx_mode	= ixgb_set_multi,
 370	.ndo_validate_addr	= eth_validate_addr,
 371	.ndo_set_mac_address	= ixgb_set_mac,
 372	.ndo_change_mtu		= ixgb_change_mtu,
 373	.ndo_tx_timeout		= ixgb_tx_timeout,
 374	.ndo_vlan_rx_add_vid	= ixgb_vlan_rx_add_vid,
 375	.ndo_vlan_rx_kill_vid	= ixgb_vlan_rx_kill_vid,
 376#ifdef CONFIG_NET_POLL_CONTROLLER
 377	.ndo_poll_controller	= ixgb_netpoll,
 378#endif
 379	.ndo_fix_features       = ixgb_fix_features,
 380	.ndo_set_features       = ixgb_set_features,
 381};
 382
 383/**
 384 * ixgb_probe - Device Initialization Routine
 385 * @pdev: PCI device information struct
 386 * @ent: entry in ixgb_pci_tbl
 387 *
 388 * Returns 0 on success, negative on failure
 389 *
 390 * ixgb_probe initializes an adapter identified by a pci_dev structure.
 391 * The OS initialization, configuring of the adapter private structure,
 392 * and a hardware reset occur.
 393 **/
 394
 395static int
 396ixgb_probe(struct pci_dev *pdev, const struct pci_device_id *ent)
 397{
 398	struct net_device *netdev = NULL;
 399	struct ixgb_adapter *adapter;
 400	static int cards_found = 0;
 401	int pci_using_dac;
 402	int i;
 403	int err;
 404
 405	err = pci_enable_device(pdev);
 406	if (err)
 407		return err;
 408
 409	pci_using_dac = 0;
 410	err = dma_set_mask_and_coherent(&pdev->dev, DMA_BIT_MASK(64));
 411	if (!err) {
 412		pci_using_dac = 1;
 413	} else {
 414		err = dma_set_mask_and_coherent(&pdev->dev, DMA_BIT_MASK(32));
 415		if (err) {
 416			pr_err("No usable DMA configuration, aborting\n");
 417			goto err_dma_mask;
 418		}
 419	}
 420
 421	err = pci_request_regions(pdev, ixgb_driver_name);
 422	if (err)
 423		goto err_request_regions;
 424
 425	pci_set_master(pdev);
 426
 427	netdev = alloc_etherdev(sizeof(struct ixgb_adapter));
 428	if (!netdev) {
 429		err = -ENOMEM;
 430		goto err_alloc_etherdev;
 431	}
 432
 433	SET_NETDEV_DEV(netdev, &pdev->dev);
 434
 435	pci_set_drvdata(pdev, netdev);
 436	adapter = netdev_priv(netdev);
 437	adapter->netdev = netdev;
 438	adapter->pdev = pdev;
 439	adapter->hw.back = adapter;
 440	adapter->msg_enable = netif_msg_init(debug, DEFAULT_MSG_ENABLE);
 441
 442	adapter->hw.hw_addr = pci_ioremap_bar(pdev, BAR_0);
 443	if (!adapter->hw.hw_addr) {
 444		err = -EIO;
 445		goto err_ioremap;
 446	}
 447
 448	for (i = BAR_1; i <= BAR_5; i++) {
 449		if (pci_resource_len(pdev, i) == 0)
 450			continue;
 451		if (pci_resource_flags(pdev, i) & IORESOURCE_IO) {
 452			adapter->hw.io_base = pci_resource_start(pdev, i);
 453			break;
 454		}
 455	}
 456
 457	netdev->netdev_ops = &ixgb_netdev_ops;
 458	ixgb_set_ethtool_ops(netdev);
 459	netdev->watchdog_timeo = 5 * HZ;
 460	netif_napi_add(netdev, &adapter->napi, ixgb_clean, 64);
 461
 462	strncpy(netdev->name, pci_name(pdev), sizeof(netdev->name) - 1);
 463
 464	adapter->bd_number = cards_found;
 465	adapter->link_speed = 0;
 466	adapter->link_duplex = 0;
 467
 468	/* setup the private structure */
 469
 470	err = ixgb_sw_init(adapter);
 471	if (err)
 472		goto err_sw_init;
 473
 474	netdev->hw_features = NETIF_F_SG |
 475			   NETIF_F_TSO |
 476			   NETIF_F_HW_CSUM |
 477			   NETIF_F_HW_VLAN_CTAG_TX |
 478			   NETIF_F_HW_VLAN_CTAG_RX;
 479	netdev->features = netdev->hw_features |
 480			   NETIF_F_HW_VLAN_CTAG_FILTER;
 481	netdev->hw_features |= NETIF_F_RXCSUM;
 482
 483	if (pci_using_dac) {
 484		netdev->features |= NETIF_F_HIGHDMA;
 485		netdev->vlan_features |= NETIF_F_HIGHDMA;
 486	}
 487
 488	/* MTU range: 68 - 16114 */
 489	netdev->min_mtu = ETH_MIN_MTU;
 490	netdev->max_mtu = IXGB_MAX_JUMBO_FRAME_SIZE - ETH_HLEN;
 491
 492	/* make sure the EEPROM is good */
 493
 494	if (!ixgb_validate_eeprom_checksum(&adapter->hw)) {
 495		netif_err(adapter, probe, adapter->netdev,
 496			  "The EEPROM Checksum Is Not Valid\n");
 497		err = -EIO;
 498		goto err_eeprom;
 499	}
 500
 501	ixgb_get_ee_mac_addr(&adapter->hw, netdev->dev_addr);
 502
 503	if (!is_valid_ether_addr(netdev->dev_addr)) {
 504		netif_err(adapter, probe, adapter->netdev, "Invalid MAC Address\n");
 505		err = -EIO;
 506		goto err_eeprom;
 507	}
 508
 509	adapter->part_num = ixgb_get_ee_pba_number(&adapter->hw);
 510
 511	timer_setup(&adapter->watchdog_timer, ixgb_watchdog, 0);
 512
 513	INIT_WORK(&adapter->tx_timeout_task, ixgb_tx_timeout_task);
 514
 515	strcpy(netdev->name, "eth%d");
 516	err = register_netdev(netdev);
 517	if (err)
 518		goto err_register;
 519
 520	/* carrier off reporting is important to ethtool even BEFORE open */
 521	netif_carrier_off(netdev);
 522
 523	netif_info(adapter, probe, adapter->netdev,
 524		   "Intel(R) PRO/10GbE Network Connection\n");
 525	ixgb_check_options(adapter);
 526	/* reset the hardware with the new settings */
 527
 528	ixgb_reset(adapter);
 529
 530	cards_found++;
 531	return 0;
 532
 533err_register:
 534err_sw_init:
 535err_eeprom:
 536	iounmap(adapter->hw.hw_addr);
 537err_ioremap:
 538	free_netdev(netdev);
 539err_alloc_etherdev:
 540	pci_release_regions(pdev);
 541err_request_regions:
 542err_dma_mask:
 543	pci_disable_device(pdev);
 544	return err;
 545}
 546
 547/**
 548 * ixgb_remove - Device Removal Routine
 549 * @pdev: PCI device information struct
 550 *
 551 * ixgb_remove is called by the PCI subsystem to alert the driver
 552 * that it should release a PCI device.  The could be caused by a
 553 * Hot-Plug event, or because the driver is going to be removed from
 554 * memory.
 555 **/
 556
 557static void
 558ixgb_remove(struct pci_dev *pdev)
 559{
 560	struct net_device *netdev = pci_get_drvdata(pdev);
 561	struct ixgb_adapter *adapter = netdev_priv(netdev);
 562
 563	cancel_work_sync(&adapter->tx_timeout_task);
 564
 565	unregister_netdev(netdev);
 566
 567	iounmap(adapter->hw.hw_addr);
 568	pci_release_regions(pdev);
 569
 570	free_netdev(netdev);
 571	pci_disable_device(pdev);
 572}
 573
 574/**
 575 * ixgb_sw_init - Initialize general software structures (struct ixgb_adapter)
 576 * @adapter: board private structure to initialize
 577 *
 578 * ixgb_sw_init initializes the Adapter private data structure.
 579 * Fields are initialized based on PCI device information and
 580 * OS network device settings (MTU size).
 581 **/
 582
 583static int
 584ixgb_sw_init(struct ixgb_adapter *adapter)
 585{
 586	struct ixgb_hw *hw = &adapter->hw;
 587	struct net_device *netdev = adapter->netdev;
 588	struct pci_dev *pdev = adapter->pdev;
 589
 590	/* PCI config space info */
 591
 592	hw->vendor_id = pdev->vendor;
 593	hw->device_id = pdev->device;
 594	hw->subsystem_vendor_id = pdev->subsystem_vendor;
 595	hw->subsystem_id = pdev->subsystem_device;
 596
 597	hw->max_frame_size = netdev->mtu + ENET_HEADER_SIZE + ENET_FCS_LENGTH;
 598	adapter->rx_buffer_len = hw->max_frame_size + 8; /* + 8 for errata */
 599
 600	if ((hw->device_id == IXGB_DEVICE_ID_82597EX) ||
 601	    (hw->device_id == IXGB_DEVICE_ID_82597EX_CX4) ||
 602	    (hw->device_id == IXGB_DEVICE_ID_82597EX_LR) ||
 603	    (hw->device_id == IXGB_DEVICE_ID_82597EX_SR))
 604		hw->mac_type = ixgb_82597;
 605	else {
 606		/* should never have loaded on this device */
 607		netif_err(adapter, probe, adapter->netdev, "unsupported device id\n");
 608	}
 609
 610	/* enable flow control to be programmed */
 611	hw->fc.send_xon = 1;
 612
 613	set_bit(__IXGB_DOWN, &adapter->flags);
 614	return 0;
 615}
 616
 617/**
 618 * ixgb_open - Called when a network interface is made active
 619 * @netdev: network interface device structure
 620 *
 621 * Returns 0 on success, negative value on failure
 622 *
 623 * The open entry point is called when a network interface is made
 624 * active by the system (IFF_UP).  At this point all resources needed
 625 * for transmit and receive operations are allocated, the interrupt
 626 * handler is registered with the OS, the watchdog timer is started,
 627 * and the stack is notified that the interface is ready.
 628 **/
 629
 630static int
 631ixgb_open(struct net_device *netdev)
 632{
 633	struct ixgb_adapter *adapter = netdev_priv(netdev);
 634	int err;
 635
 636	/* allocate transmit descriptors */
 637	err = ixgb_setup_tx_resources(adapter);
 638	if (err)
 639		goto err_setup_tx;
 640
 641	netif_carrier_off(netdev);
 642
 643	/* allocate receive descriptors */
 644
 645	err = ixgb_setup_rx_resources(adapter);
 646	if (err)
 647		goto err_setup_rx;
 648
 649	err = ixgb_up(adapter);
 650	if (err)
 651		goto err_up;
 652
 653	netif_start_queue(netdev);
 654
 655	return 0;
 656
 657err_up:
 658	ixgb_free_rx_resources(adapter);
 659err_setup_rx:
 660	ixgb_free_tx_resources(adapter);
 661err_setup_tx:
 662	ixgb_reset(adapter);
 663
 664	return err;
 665}
 666
 667/**
 668 * ixgb_close - Disables a network interface
 669 * @netdev: network interface device structure
 670 *
 671 * Returns 0, this is not allowed to fail
 672 *
 673 * The close entry point is called when an interface is de-activated
 674 * by the OS.  The hardware is still under the drivers control, but
 675 * needs to be disabled.  A global MAC reset is issued to stop the
 676 * hardware, and all transmit and receive resources are freed.
 677 **/
 678
 679static int
 680ixgb_close(struct net_device *netdev)
 681{
 682	struct ixgb_adapter *adapter = netdev_priv(netdev);
 683
 684	ixgb_down(adapter, true);
 685
 686	ixgb_free_tx_resources(adapter);
 687	ixgb_free_rx_resources(adapter);
 688
 689	return 0;
 690}
 691
 692/**
 693 * ixgb_setup_tx_resources - allocate Tx resources (Descriptors)
 694 * @adapter: board private structure
 695 *
 696 * Return 0 on success, negative on failure
 697 **/
 698
 699int
 700ixgb_setup_tx_resources(struct ixgb_adapter *adapter)
 701{
 702	struct ixgb_desc_ring *txdr = &adapter->tx_ring;
 703	struct pci_dev *pdev = adapter->pdev;
 704	int size;
 705
 706	size = sizeof(struct ixgb_buffer) * txdr->count;
 707	txdr->buffer_info = vzalloc(size);
 708	if (!txdr->buffer_info)
 709		return -ENOMEM;
 710
 711	/* round up to nearest 4K */
 712
 713	txdr->size = txdr->count * sizeof(struct ixgb_tx_desc);
 714	txdr->size = ALIGN(txdr->size, 4096);
 715
 716	txdr->desc = dma_zalloc_coherent(&pdev->dev, txdr->size, &txdr->dma,
 717					 GFP_KERNEL);
 718	if (!txdr->desc) {
 719		vfree(txdr->buffer_info);
 720		return -ENOMEM;
 721	}
 722
 723	txdr->next_to_use = 0;
 724	txdr->next_to_clean = 0;
 725
 726	return 0;
 727}
 728
 729/**
 730 * ixgb_configure_tx - Configure 82597 Transmit Unit after Reset.
 731 * @adapter: board private structure
 732 *
 733 * Configure the Tx unit of the MAC after a reset.
 734 **/
 735
 736static void
 737ixgb_configure_tx(struct ixgb_adapter *adapter)
 738{
 739	u64 tdba = adapter->tx_ring.dma;
 740	u32 tdlen = adapter->tx_ring.count * sizeof(struct ixgb_tx_desc);
 741	u32 tctl;
 742	struct ixgb_hw *hw = &adapter->hw;
 743
 744	/* Setup the Base and Length of the Tx Descriptor Ring
 745	 * tx_ring.dma can be either a 32 or 64 bit value
 746	 */
 747
 748	IXGB_WRITE_REG(hw, TDBAL, (tdba & 0x00000000ffffffffULL));
 749	IXGB_WRITE_REG(hw, TDBAH, (tdba >> 32));
 750
 751	IXGB_WRITE_REG(hw, TDLEN, tdlen);
 752
 753	/* Setup the HW Tx Head and Tail descriptor pointers */
 754
 755	IXGB_WRITE_REG(hw, TDH, 0);
 756	IXGB_WRITE_REG(hw, TDT, 0);
 757
 758	/* don't set up txdctl, it induces performance problems if configured
 759	 * incorrectly */
 760	/* Set the Tx Interrupt Delay register */
 761
 762	IXGB_WRITE_REG(hw, TIDV, adapter->tx_int_delay);
 763
 764	/* Program the Transmit Control Register */
 765
 766	tctl = IXGB_TCTL_TCE | IXGB_TCTL_TXEN | IXGB_TCTL_TPDE;
 767	IXGB_WRITE_REG(hw, TCTL, tctl);
 768
 769	/* Setup Transmit Descriptor Settings for this adapter */
 770	adapter->tx_cmd_type =
 771		IXGB_TX_DESC_TYPE |
 772		(adapter->tx_int_delay_enable ? IXGB_TX_DESC_CMD_IDE : 0);
 773}
 774
 775/**
 776 * ixgb_setup_rx_resources - allocate Rx resources (Descriptors)
 777 * @adapter: board private structure
 778 *
 779 * Returns 0 on success, negative on failure
 780 **/
 781
 782int
 783ixgb_setup_rx_resources(struct ixgb_adapter *adapter)
 784{
 785	struct ixgb_desc_ring *rxdr = &adapter->rx_ring;
 786	struct pci_dev *pdev = adapter->pdev;
 787	int size;
 788
 789	size = sizeof(struct ixgb_buffer) * rxdr->count;
 790	rxdr->buffer_info = vzalloc(size);
 791	if (!rxdr->buffer_info)
 792		return -ENOMEM;
 793
 794	/* Round up to nearest 4K */
 795
 796	rxdr->size = rxdr->count * sizeof(struct ixgb_rx_desc);
 797	rxdr->size = ALIGN(rxdr->size, 4096);
 798
 799	rxdr->desc = dma_alloc_coherent(&pdev->dev, rxdr->size, &rxdr->dma,
 800					GFP_KERNEL);
 801
 802	if (!rxdr->desc) {
 803		vfree(rxdr->buffer_info);
 804		return -ENOMEM;
 805	}
 806	memset(rxdr->desc, 0, rxdr->size);
 807
 808	rxdr->next_to_clean = 0;
 809	rxdr->next_to_use = 0;
 810
 811	return 0;
 812}
 813
 814/**
 815 * ixgb_setup_rctl - configure the receive control register
 816 * @adapter: Board private structure
 817 **/
 818
 819static void
 820ixgb_setup_rctl(struct ixgb_adapter *adapter)
 821{
 822	u32 rctl;
 823
 824	rctl = IXGB_READ_REG(&adapter->hw, RCTL);
 825
 826	rctl &= ~(3 << IXGB_RCTL_MO_SHIFT);
 827
 828	rctl |=
 829		IXGB_RCTL_BAM | IXGB_RCTL_RDMTS_1_2 |
 830		IXGB_RCTL_RXEN | IXGB_RCTL_CFF |
 831		(adapter->hw.mc_filter_type << IXGB_RCTL_MO_SHIFT);
 832
 833	rctl |= IXGB_RCTL_SECRC;
 834
 835	if (adapter->rx_buffer_len <= IXGB_RXBUFFER_2048)
 836		rctl |= IXGB_RCTL_BSIZE_2048;
 837	else if (adapter->rx_buffer_len <= IXGB_RXBUFFER_4096)
 838		rctl |= IXGB_RCTL_BSIZE_4096;
 839	else if (adapter->rx_buffer_len <= IXGB_RXBUFFER_8192)
 840		rctl |= IXGB_RCTL_BSIZE_8192;
 841	else if (adapter->rx_buffer_len <= IXGB_RXBUFFER_16384)
 842		rctl |= IXGB_RCTL_BSIZE_16384;
 843
 844	IXGB_WRITE_REG(&adapter->hw, RCTL, rctl);
 845}
 846
 847/**
 848 * ixgb_configure_rx - Configure 82597 Receive Unit after Reset.
 849 * @adapter: board private structure
 850 *
 851 * Configure the Rx unit of the MAC after a reset.
 852 **/
 853
 854static void
 855ixgb_configure_rx(struct ixgb_adapter *adapter)
 856{
 857	u64 rdba = adapter->rx_ring.dma;
 858	u32 rdlen = adapter->rx_ring.count * sizeof(struct ixgb_rx_desc);
 859	struct ixgb_hw *hw = &adapter->hw;
 860	u32 rctl;
 861	u32 rxcsum;
 862
 863	/* make sure receives are disabled while setting up the descriptors */
 864
 865	rctl = IXGB_READ_REG(hw, RCTL);
 866	IXGB_WRITE_REG(hw, RCTL, rctl & ~IXGB_RCTL_RXEN);
 867
 868	/* set the Receive Delay Timer Register */
 869
 870	IXGB_WRITE_REG(hw, RDTR, adapter->rx_int_delay);
 871
 872	/* Setup the Base and Length of the Rx Descriptor Ring */
 873
 874	IXGB_WRITE_REG(hw, RDBAL, (rdba & 0x00000000ffffffffULL));
 875	IXGB_WRITE_REG(hw, RDBAH, (rdba >> 32));
 876
 877	IXGB_WRITE_REG(hw, RDLEN, rdlen);
 878
 879	/* Setup the HW Rx Head and Tail Descriptor Pointers */
 880	IXGB_WRITE_REG(hw, RDH, 0);
 881	IXGB_WRITE_REG(hw, RDT, 0);
 882
 883	/* due to the hardware errata with RXDCTL, we are unable to use any of
 884	 * the performance enhancing features of it without causing other
 885	 * subtle bugs, some of the bugs could include receive length
 886	 * corruption at high data rates (WTHRESH > 0) and/or receive
 887	 * descriptor ring irregularites (particularly in hardware cache) */
 888	IXGB_WRITE_REG(hw, RXDCTL, 0);
 889
 890	/* Enable Receive Checksum Offload for TCP and UDP */
 891	if (adapter->rx_csum) {
 892		rxcsum = IXGB_READ_REG(hw, RXCSUM);
 893		rxcsum |= IXGB_RXCSUM_TUOFL;
 894		IXGB_WRITE_REG(hw, RXCSUM, rxcsum);
 895	}
 896
 897	/* Enable Receives */
 898
 899	IXGB_WRITE_REG(hw, RCTL, rctl);
 900}
 901
 902/**
 903 * ixgb_free_tx_resources - Free Tx Resources
 904 * @adapter: board private structure
 905 *
 906 * Free all transmit software resources
 907 **/
 908
 909void
 910ixgb_free_tx_resources(struct ixgb_adapter *adapter)
 911{
 912	struct pci_dev *pdev = adapter->pdev;
 913
 914	ixgb_clean_tx_ring(adapter);
 915
 916	vfree(adapter->tx_ring.buffer_info);
 917	adapter->tx_ring.buffer_info = NULL;
 918
 919	dma_free_coherent(&pdev->dev, adapter->tx_ring.size,
 920			  adapter->tx_ring.desc, adapter->tx_ring.dma);
 921
 922	adapter->tx_ring.desc = NULL;
 923}
 924
 925static void
 926ixgb_unmap_and_free_tx_resource(struct ixgb_adapter *adapter,
 927                                struct ixgb_buffer *buffer_info)
 928{
 929	if (buffer_info->dma) {
 930		if (buffer_info->mapped_as_page)
 931			dma_unmap_page(&adapter->pdev->dev, buffer_info->dma,
 932				       buffer_info->length, DMA_TO_DEVICE);
 933		else
 934			dma_unmap_single(&adapter->pdev->dev, buffer_info->dma,
 935					 buffer_info->length, DMA_TO_DEVICE);
 936		buffer_info->dma = 0;
 937	}
 938
 939	if (buffer_info->skb) {
 940		dev_kfree_skb_any(buffer_info->skb);
 941		buffer_info->skb = NULL;
 942	}
 943	buffer_info->time_stamp = 0;
 944	/* these fields must always be initialized in tx
 945	 * buffer_info->length = 0;
 946	 * buffer_info->next_to_watch = 0; */
 947}
 948
 949/**
 950 * ixgb_clean_tx_ring - Free Tx Buffers
 951 * @adapter: board private structure
 952 **/
 953
 954static void
 955ixgb_clean_tx_ring(struct ixgb_adapter *adapter)
 956{
 957	struct ixgb_desc_ring *tx_ring = &adapter->tx_ring;
 958	struct ixgb_buffer *buffer_info;
 959	unsigned long size;
 960	unsigned int i;
 961
 962	/* Free all the Tx ring sk_buffs */
 963
 964	for (i = 0; i < tx_ring->count; i++) {
 965		buffer_info = &tx_ring->buffer_info[i];
 966		ixgb_unmap_and_free_tx_resource(adapter, buffer_info);
 967	}
 968
 969	size = sizeof(struct ixgb_buffer) * tx_ring->count;
 970	memset(tx_ring->buffer_info, 0, size);
 971
 972	/* Zero out the descriptor ring */
 973
 974	memset(tx_ring->desc, 0, tx_ring->size);
 975
 976	tx_ring->next_to_use = 0;
 977	tx_ring->next_to_clean = 0;
 978
 979	IXGB_WRITE_REG(&adapter->hw, TDH, 0);
 980	IXGB_WRITE_REG(&adapter->hw, TDT, 0);
 981}
 982
 983/**
 984 * ixgb_free_rx_resources - Free Rx Resources
 985 * @adapter: board private structure
 986 *
 987 * Free all receive software resources
 988 **/
 989
 990void
 991ixgb_free_rx_resources(struct ixgb_adapter *adapter)
 992{
 993	struct ixgb_desc_ring *rx_ring = &adapter->rx_ring;
 994	struct pci_dev *pdev = adapter->pdev;
 995
 996	ixgb_clean_rx_ring(adapter);
 997
 998	vfree(rx_ring->buffer_info);
 999	rx_ring->buffer_info = NULL;
1000
1001	dma_free_coherent(&pdev->dev, rx_ring->size, rx_ring->desc,
1002			  rx_ring->dma);
1003
1004	rx_ring->desc = NULL;
1005}
1006
1007/**
1008 * ixgb_clean_rx_ring - Free Rx Buffers
1009 * @adapter: board private structure
1010 **/
1011
1012static void
1013ixgb_clean_rx_ring(struct ixgb_adapter *adapter)
1014{
1015	struct ixgb_desc_ring *rx_ring = &adapter->rx_ring;
1016	struct ixgb_buffer *buffer_info;
1017	struct pci_dev *pdev = adapter->pdev;
1018	unsigned long size;
1019	unsigned int i;
1020
1021	/* Free all the Rx ring sk_buffs */
1022
1023	for (i = 0; i < rx_ring->count; i++) {
1024		buffer_info = &rx_ring->buffer_info[i];
1025		if (buffer_info->dma) {
1026			dma_unmap_single(&pdev->dev,
1027					 buffer_info->dma,
1028					 buffer_info->length,
1029					 DMA_FROM_DEVICE);
1030			buffer_info->dma = 0;
1031			buffer_info->length = 0;
1032		}
1033
1034		if (buffer_info->skb) {
1035			dev_kfree_skb(buffer_info->skb);
1036			buffer_info->skb = NULL;
1037		}
1038	}
1039
1040	size = sizeof(struct ixgb_buffer) * rx_ring->count;
1041	memset(rx_ring->buffer_info, 0, size);
1042
1043	/* Zero out the descriptor ring */
1044
1045	memset(rx_ring->desc, 0, rx_ring->size);
1046
1047	rx_ring->next_to_clean = 0;
1048	rx_ring->next_to_use = 0;
1049
1050	IXGB_WRITE_REG(&adapter->hw, RDH, 0);
1051	IXGB_WRITE_REG(&adapter->hw, RDT, 0);
1052}
1053
1054/**
1055 * ixgb_set_mac - Change the Ethernet Address of the NIC
1056 * @netdev: network interface device structure
1057 * @p: pointer to an address structure
1058 *
1059 * Returns 0 on success, negative on failure
1060 **/
1061
1062static int
1063ixgb_set_mac(struct net_device *netdev, void *p)
1064{
1065	struct ixgb_adapter *adapter = netdev_priv(netdev);
1066	struct sockaddr *addr = p;
1067
1068	if (!is_valid_ether_addr(addr->sa_data))
1069		return -EADDRNOTAVAIL;
1070
1071	memcpy(netdev->dev_addr, addr->sa_data, netdev->addr_len);
1072
1073	ixgb_rar_set(&adapter->hw, addr->sa_data, 0);
1074
1075	return 0;
1076}
1077
1078/**
1079 * ixgb_set_multi - Multicast and Promiscuous mode set
1080 * @netdev: network interface device structure
1081 *
1082 * The set_multi entry point is called whenever the multicast address
1083 * list or the network interface flags are updated.  This routine is
1084 * responsible for configuring the hardware for proper multicast,
1085 * promiscuous mode, and all-multi behavior.
1086 **/
1087
1088static void
1089ixgb_set_multi(struct net_device *netdev)
1090{
1091	struct ixgb_adapter *adapter = netdev_priv(netdev);
1092	struct ixgb_hw *hw = &adapter->hw;
1093	struct netdev_hw_addr *ha;
1094	u32 rctl;
1095
1096	/* Check for Promiscuous and All Multicast modes */
1097
1098	rctl = IXGB_READ_REG(hw, RCTL);
1099
1100	if (netdev->flags & IFF_PROMISC) {
1101		rctl |= (IXGB_RCTL_UPE | IXGB_RCTL_MPE);
1102		/* disable VLAN filtering */
1103		rctl &= ~IXGB_RCTL_CFIEN;
1104		rctl &= ~IXGB_RCTL_VFE;
1105	} else {
1106		if (netdev->flags & IFF_ALLMULTI) {
1107			rctl |= IXGB_RCTL_MPE;
1108			rctl &= ~IXGB_RCTL_UPE;
1109		} else {
1110			rctl &= ~(IXGB_RCTL_UPE | IXGB_RCTL_MPE);
1111		}
1112		/* enable VLAN filtering */
1113		rctl |= IXGB_RCTL_VFE;
1114		rctl &= ~IXGB_RCTL_CFIEN;
1115	}
1116
1117	if (netdev_mc_count(netdev) > IXGB_MAX_NUM_MULTICAST_ADDRESSES) {
1118		rctl |= IXGB_RCTL_MPE;
1119		IXGB_WRITE_REG(hw, RCTL, rctl);
1120	} else {
1121		u8 *mta = kmalloc(IXGB_MAX_NUM_MULTICAST_ADDRESSES *
1122			      ETH_ALEN, GFP_ATOMIC);
1123		u8 *addr;
1124		if (!mta)
1125			goto alloc_failed;
1126
1127		IXGB_WRITE_REG(hw, RCTL, rctl);
1128
1129		addr = mta;
1130		netdev_for_each_mc_addr(ha, netdev) {
1131			memcpy(addr, ha->addr, ETH_ALEN);
1132			addr += ETH_ALEN;
1133		}
1134
1135		ixgb_mc_addr_list_update(hw, mta, netdev_mc_count(netdev), 0);
1136		kfree(mta);
1137	}
1138
1139alloc_failed:
1140	if (netdev->features & NETIF_F_HW_VLAN_CTAG_RX)
1141		ixgb_vlan_strip_enable(adapter);
1142	else
1143		ixgb_vlan_strip_disable(adapter);
1144
1145}
1146
1147/**
1148 * ixgb_watchdog - Timer Call-back
1149 * @data: pointer to netdev cast into an unsigned long
1150 **/
1151
1152static void
1153ixgb_watchdog(struct timer_list *t)
1154{
1155	struct ixgb_adapter *adapter = from_timer(adapter, t, watchdog_timer);
1156	struct net_device *netdev = adapter->netdev;
1157	struct ixgb_desc_ring *txdr = &adapter->tx_ring;
1158
1159	ixgb_check_for_link(&adapter->hw);
1160
1161	if (ixgb_check_for_bad_link(&adapter->hw)) {
1162		/* force the reset path */
1163		netif_stop_queue(netdev);
1164	}
1165
1166	if (adapter->hw.link_up) {
1167		if (!netif_carrier_ok(netdev)) {
1168			netdev_info(netdev,
1169				    "NIC Link is Up 10 Gbps Full Duplex, Flow Control: %s\n",
1170				    (adapter->hw.fc.type == ixgb_fc_full) ?
1171				    "RX/TX" :
1172				    (adapter->hw.fc.type == ixgb_fc_rx_pause) ?
1173				     "RX" :
1174				    (adapter->hw.fc.type == ixgb_fc_tx_pause) ?
1175				    "TX" : "None");
1176			adapter->link_speed = 10000;
1177			adapter->link_duplex = FULL_DUPLEX;
1178			netif_carrier_on(netdev);
1179		}
1180	} else {
1181		if (netif_carrier_ok(netdev)) {
1182			adapter->link_speed = 0;
1183			adapter->link_duplex = 0;
1184			netdev_info(netdev, "NIC Link is Down\n");
1185			netif_carrier_off(netdev);
1186		}
1187	}
1188
1189	ixgb_update_stats(adapter);
1190
1191	if (!netif_carrier_ok(netdev)) {
1192		if (IXGB_DESC_UNUSED(txdr) + 1 < txdr->count) {
1193			/* We've lost link, so the controller stops DMA,
1194			 * but we've got queued Tx work that's never going
1195			 * to get done, so reset controller to flush Tx.
1196			 * (Do the reset outside of interrupt context). */
1197			schedule_work(&adapter->tx_timeout_task);
1198			/* return immediately since reset is imminent */
1199			return;
1200		}
1201	}
1202
1203	/* Force detection of hung controller every watchdog period */
1204	adapter->detect_tx_hung = true;
1205
1206	/* generate an interrupt to force clean up of any stragglers */
1207	IXGB_WRITE_REG(&adapter->hw, ICS, IXGB_INT_TXDW);
1208
1209	/* Reset the timer */
1210	mod_timer(&adapter->watchdog_timer, jiffies + 2 * HZ);
1211}
1212
1213#define IXGB_TX_FLAGS_CSUM		0x00000001
1214#define IXGB_TX_FLAGS_VLAN		0x00000002
1215#define IXGB_TX_FLAGS_TSO		0x00000004
1216
1217static int
1218ixgb_tso(struct ixgb_adapter *adapter, struct sk_buff *skb)
1219{
1220	struct ixgb_context_desc *context_desc;
1221	unsigned int i;
1222	u8 ipcss, ipcso, tucss, tucso, hdr_len;
1223	u16 ipcse, tucse, mss;
1224
1225	if (likely(skb_is_gso(skb))) {
1226		struct ixgb_buffer *buffer_info;
1227		struct iphdr *iph;
1228		int err;
1229
1230		err = skb_cow_head(skb, 0);
1231		if (err < 0)
1232			return err;
1233
1234		hdr_len = skb_transport_offset(skb) + tcp_hdrlen(skb);
1235		mss = skb_shinfo(skb)->gso_size;
1236		iph = ip_hdr(skb);
1237		iph->tot_len = 0;
1238		iph->check = 0;
1239		tcp_hdr(skb)->check = ~csum_tcpudp_magic(iph->saddr,
1240							 iph->daddr, 0,
1241							 IPPROTO_TCP, 0);
1242		ipcss = skb_network_offset(skb);
1243		ipcso = (void *)&(iph->check) - (void *)skb->data;
1244		ipcse = skb_transport_offset(skb) - 1;
1245		tucss = skb_transport_offset(skb);
1246		tucso = (void *)&(tcp_hdr(skb)->check) - (void *)skb->data;
1247		tucse = 0;
1248
1249		i = adapter->tx_ring.next_to_use;
1250		context_desc = IXGB_CONTEXT_DESC(adapter->tx_ring, i);
1251		buffer_info = &adapter->tx_ring.buffer_info[i];
1252		WARN_ON(buffer_info->dma != 0);
1253
1254		context_desc->ipcss = ipcss;
1255		context_desc->ipcso = ipcso;
1256		context_desc->ipcse = cpu_to_le16(ipcse);
1257		context_desc->tucss = tucss;
1258		context_desc->tucso = tucso;
1259		context_desc->tucse = cpu_to_le16(tucse);
1260		context_desc->mss = cpu_to_le16(mss);
1261		context_desc->hdr_len = hdr_len;
1262		context_desc->status = 0;
1263		context_desc->cmd_type_len = cpu_to_le32(
1264						  IXGB_CONTEXT_DESC_TYPE
1265						| IXGB_CONTEXT_DESC_CMD_TSE
1266						| IXGB_CONTEXT_DESC_CMD_IP
1267						| IXGB_CONTEXT_DESC_CMD_TCP
1268						| IXGB_CONTEXT_DESC_CMD_IDE
1269						| (skb->len - (hdr_len)));
1270
1271
1272		if (++i == adapter->tx_ring.count) i = 0;
1273		adapter->tx_ring.next_to_use = i;
1274
1275		return 1;
1276	}
1277
1278	return 0;
1279}
1280
1281static bool
1282ixgb_tx_csum(struct ixgb_adapter *adapter, struct sk_buff *skb)
1283{
1284	struct ixgb_context_desc *context_desc;
1285	unsigned int i;
1286	u8 css, cso;
1287
1288	if (likely(skb->ip_summed == CHECKSUM_PARTIAL)) {
1289		struct ixgb_buffer *buffer_info;
1290		css = skb_checksum_start_offset(skb);
1291		cso = css + skb->csum_offset;
1292
1293		i = adapter->tx_ring.next_to_use;
1294		context_desc = IXGB_CONTEXT_DESC(adapter->tx_ring, i);
1295		buffer_info = &adapter->tx_ring.buffer_info[i];
1296		WARN_ON(buffer_info->dma != 0);
1297
1298		context_desc->tucss = css;
1299		context_desc->tucso = cso;
1300		context_desc->tucse = 0;
1301		/* zero out any previously existing data in one instruction */
1302		*(u32 *)&(context_desc->ipcss) = 0;
1303		context_desc->status = 0;
1304		context_desc->hdr_len = 0;
1305		context_desc->mss = 0;
1306		context_desc->cmd_type_len =
1307			cpu_to_le32(IXGB_CONTEXT_DESC_TYPE
1308				    | IXGB_TX_DESC_CMD_IDE);
1309
1310		if (++i == adapter->tx_ring.count) i = 0;
1311		adapter->tx_ring.next_to_use = i;
1312
1313		return true;
1314	}
1315
1316	return false;
1317}
1318
1319#define IXGB_MAX_TXD_PWR	14
1320#define IXGB_MAX_DATA_PER_TXD	(1<<IXGB_MAX_TXD_PWR)
1321
1322static int
1323ixgb_tx_map(struct ixgb_adapter *adapter, struct sk_buff *skb,
1324	    unsigned int first)
1325{
1326	struct ixgb_desc_ring *tx_ring = &adapter->tx_ring;
1327	struct pci_dev *pdev = adapter->pdev;
1328	struct ixgb_buffer *buffer_info;
1329	int len = skb_headlen(skb);
1330	unsigned int offset = 0, size, count = 0, i;
1331	unsigned int mss = skb_shinfo(skb)->gso_size;
1332	unsigned int nr_frags = skb_shinfo(skb)->nr_frags;
1333	unsigned int f;
1334
1335	i = tx_ring->next_to_use;
1336
1337	while (len) {
1338		buffer_info = &tx_ring->buffer_info[i];
1339		size = min(len, IXGB_MAX_DATA_PER_TXD);
1340		/* Workaround for premature desc write-backs
1341		 * in TSO mode.  Append 4-byte sentinel desc */
1342		if (unlikely(mss && !nr_frags && size == len && size > 8))
1343			size -= 4;
1344
1345		buffer_info->length = size;
1346		WARN_ON(buffer_info->dma != 0);
1347		buffer_info->time_stamp = jiffies;
1348		buffer_info->mapped_as_page = false;
1349		buffer_info->dma = dma_map_single(&pdev->dev,
1350						  skb->data + offset,
1351						  size, DMA_TO_DEVICE);
1352		if (dma_mapping_error(&pdev->dev, buffer_info->dma))
1353			goto dma_error;
1354		buffer_info->next_to_watch = 0;
1355
1356		len -= size;
1357		offset += size;
1358		count++;
1359		if (len) {
1360			i++;
1361			if (i == tx_ring->count)
1362				i = 0;
1363		}
1364	}
1365
1366	for (f = 0; f < nr_frags; f++) {
1367		const struct skb_frag_struct *frag;
1368
1369		frag = &skb_shinfo(skb)->frags[f];
1370		len = skb_frag_size(frag);
1371		offset = 0;
1372
1373		while (len) {
1374			i++;
1375			if (i == tx_ring->count)
1376				i = 0;
1377
1378			buffer_info = &tx_ring->buffer_info[i];
1379			size = min(len, IXGB_MAX_DATA_PER_TXD);
1380
1381			/* Workaround for premature desc write-backs
1382			 * in TSO mode.  Append 4-byte sentinel desc */
1383			if (unlikely(mss && (f == (nr_frags - 1))
1384				     && size == len && size > 8))
1385				size -= 4;
1386
1387			buffer_info->length = size;
1388			buffer_info->time_stamp = jiffies;
1389			buffer_info->mapped_as_page = true;
1390			buffer_info->dma =
1391				skb_frag_dma_map(&pdev->dev, frag, offset, size,
1392						 DMA_TO_DEVICE);
1393			if (dma_mapping_error(&pdev->dev, buffer_info->dma))
1394				goto dma_error;
1395			buffer_info->next_to_watch = 0;
1396
1397			len -= size;
1398			offset += size;
1399			count++;
1400		}
1401	}
1402	tx_ring->buffer_info[i].skb = skb;
1403	tx_ring->buffer_info[first].next_to_watch = i;
1404
1405	return count;
1406
1407dma_error:
1408	dev_err(&pdev->dev, "TX DMA map failed\n");
1409	buffer_info->dma = 0;
1410	if (count)
1411		count--;
1412
1413	while (count--) {
1414		if (i==0)
1415			i += tx_ring->count;
1416		i--;
1417		buffer_info = &tx_ring->buffer_info[i];
1418		ixgb_unmap_and_free_tx_resource(adapter, buffer_info);
1419	}
1420
1421	return 0;
1422}
1423
1424static void
1425ixgb_tx_queue(struct ixgb_adapter *adapter, int count, int vlan_id,int tx_flags)
1426{
1427	struct ixgb_desc_ring *tx_ring = &adapter->tx_ring;
1428	struct ixgb_tx_desc *tx_desc = NULL;
1429	struct ixgb_buffer *buffer_info;
1430	u32 cmd_type_len = adapter->tx_cmd_type;
1431	u8 status = 0;
1432	u8 popts = 0;
1433	unsigned int i;
1434
1435	if (tx_flags & IXGB_TX_FLAGS_TSO) {
1436		cmd_type_len |= IXGB_TX_DESC_CMD_TSE;
1437		popts |= (IXGB_TX_DESC_POPTS_IXSM | IXGB_TX_DESC_POPTS_TXSM);
1438	}
1439
1440	if (tx_flags & IXGB_TX_FLAGS_CSUM)
1441		popts |= IXGB_TX_DESC_POPTS_TXSM;
1442
1443	if (tx_flags & IXGB_TX_FLAGS_VLAN)
1444		cmd_type_len |= IXGB_TX_DESC_CMD_VLE;
1445
1446	i = tx_ring->next_to_use;
1447
1448	while (count--) {
1449		buffer_info = &tx_ring->buffer_info[i];
1450		tx_desc = IXGB_TX_DESC(*tx_ring, i);
1451		tx_desc->buff_addr = cpu_to_le64(buffer_info->dma);
1452		tx_desc->cmd_type_len =
1453			cpu_to_le32(cmd_type_len | buffer_info->length);
1454		tx_desc->status = status;
1455		tx_desc->popts = popts;
1456		tx_desc->vlan = cpu_to_le16(vlan_id);
1457
1458		if (++i == tx_ring->count) i = 0;
1459	}
1460
1461	tx_desc->cmd_type_len |=
1462		cpu_to_le32(IXGB_TX_DESC_CMD_EOP | IXGB_TX_DESC_CMD_RS);
1463
1464	/* Force memory writes to complete before letting h/w
1465	 * know there are new descriptors to fetch.  (Only
1466	 * applicable for weak-ordered memory model archs,
1467	 * such as IA-64). */
1468	wmb();
1469
1470	tx_ring->next_to_use = i;
1471	IXGB_WRITE_REG(&adapter->hw, TDT, i);
1472}
1473
1474static int __ixgb_maybe_stop_tx(struct net_device *netdev, int size)
1475{
1476	struct ixgb_adapter *adapter = netdev_priv(netdev);
1477	struct ixgb_desc_ring *tx_ring = &adapter->tx_ring;
1478
1479	netif_stop_queue(netdev);
1480	/* Herbert's original patch had:
1481	 *  smp_mb__after_netif_stop_queue();
1482	 * but since that doesn't exist yet, just open code it. */
1483	smp_mb();
1484
1485	/* We need to check again in a case another CPU has just
1486	 * made room available. */
1487	if (likely(IXGB_DESC_UNUSED(tx_ring) < size))
1488		return -EBUSY;
1489
1490	/* A reprieve! */
1491	netif_start_queue(netdev);
1492	++adapter->restart_queue;
1493	return 0;
1494}
1495
1496static int ixgb_maybe_stop_tx(struct net_device *netdev,
1497                              struct ixgb_desc_ring *tx_ring, int size)
1498{
1499	if (likely(IXGB_DESC_UNUSED(tx_ring) >= size))
1500		return 0;
1501	return __ixgb_maybe_stop_tx(netdev, size);
1502}
1503
1504
1505/* Tx Descriptors needed, worst case */
1506#define TXD_USE_COUNT(S) (((S) >> IXGB_MAX_TXD_PWR) + \
1507			 (((S) & (IXGB_MAX_DATA_PER_TXD - 1)) ? 1 : 0))
1508#define DESC_NEEDED TXD_USE_COUNT(IXGB_MAX_DATA_PER_TXD) /* skb->date */ + \
1509	MAX_SKB_FRAGS * TXD_USE_COUNT(PAGE_SIZE) + 1 /* for context */ \
1510	+ 1 /* one more needed for sentinel TSO workaround */
1511
1512static netdev_tx_t
1513ixgb_xmit_frame(struct sk_buff *skb, struct net_device *netdev)
1514{
1515	struct ixgb_adapter *adapter = netdev_priv(netdev);
1516	unsigned int first;
1517	unsigned int tx_flags = 0;
1518	int vlan_id = 0;
1519	int count = 0;
1520	int tso;
1521
1522	if (test_bit(__IXGB_DOWN, &adapter->flags)) {
1523		dev_kfree_skb_any(skb);
1524		return NETDEV_TX_OK;
1525	}
1526
1527	if (skb->len <= 0) {
1528		dev_kfree_skb_any(skb);
1529		return NETDEV_TX_OK;
1530	}
1531
1532	if (unlikely(ixgb_maybe_stop_tx(netdev, &adapter->tx_ring,
1533                     DESC_NEEDED)))
1534		return NETDEV_TX_BUSY;
1535
1536	if (skb_vlan_tag_present(skb)) {
1537		tx_flags |= IXGB_TX_FLAGS_VLAN;
1538		vlan_id = skb_vlan_tag_get(skb);
1539	}
1540
1541	first = adapter->tx_ring.next_to_use;
1542
1543	tso = ixgb_tso(adapter, skb);
1544	if (tso < 0) {
1545		dev_kfree_skb_any(skb);
1546		return NETDEV_TX_OK;
1547	}
1548
1549	if (likely(tso))
1550		tx_flags |= IXGB_TX_FLAGS_TSO;
1551	else if (ixgb_tx_csum(adapter, skb))
1552		tx_flags |= IXGB_TX_FLAGS_CSUM;
1553
1554	count = ixgb_tx_map(adapter, skb, first);
1555
1556	if (count) {
1557		ixgb_tx_queue(adapter, count, vlan_id, tx_flags);
1558		/* Make sure there is space in the ring for the next send. */
1559		ixgb_maybe_stop_tx(netdev, &adapter->tx_ring, DESC_NEEDED);
1560
1561	} else {
1562		dev_kfree_skb_any(skb);
1563		adapter->tx_ring.buffer_info[first].time_stamp = 0;
1564		adapter->tx_ring.next_to_use = first;
1565	}
1566
1567	return NETDEV_TX_OK;
1568}
1569
1570/**
1571 * ixgb_tx_timeout - Respond to a Tx Hang
1572 * @netdev: network interface device structure
1573 **/
1574
1575static void
1576ixgb_tx_timeout(struct net_device *netdev)
1577{
1578	struct ixgb_adapter *adapter = netdev_priv(netdev);
1579
1580	/* Do the reset outside of interrupt context */
1581	schedule_work(&adapter->tx_timeout_task);
1582}
1583
1584static void
1585ixgb_tx_timeout_task(struct work_struct *work)
1586{
1587	struct ixgb_adapter *adapter =
1588		container_of(work, struct ixgb_adapter, tx_timeout_task);
1589
1590	adapter->tx_timeout_count++;
1591	ixgb_down(adapter, true);
1592	ixgb_up(adapter);
1593}
1594
1595/**
1596 * ixgb_change_mtu - Change the Maximum Transfer Unit
1597 * @netdev: network interface device structure
1598 * @new_mtu: new value for maximum frame size
1599 *
1600 * Returns 0 on success, negative on failure
1601 **/
1602
1603static int
1604ixgb_change_mtu(struct net_device *netdev, int new_mtu)
1605{
1606	struct ixgb_adapter *adapter = netdev_priv(netdev);
1607	int max_frame = new_mtu + ENET_HEADER_SIZE + ENET_FCS_LENGTH;
1608
1609	if (netif_running(netdev))
1610		ixgb_down(adapter, true);
1611
1612	adapter->rx_buffer_len = max_frame + 8; /* + 8 for errata */
1613
1614	netdev->mtu = new_mtu;
1615
1616	if (netif_running(netdev))
1617		ixgb_up(adapter);
1618
1619	return 0;
1620}
1621
1622/**
1623 * ixgb_update_stats - Update the board statistics counters.
1624 * @adapter: board private structure
1625 **/
1626
1627void
1628ixgb_update_stats(struct ixgb_adapter *adapter)
1629{
1630	struct net_device *netdev = adapter->netdev;
1631	struct pci_dev *pdev = adapter->pdev;
1632
1633	/* Prevent stats update while adapter is being reset */
1634	if (pci_channel_offline(pdev))
1635		return;
1636
1637	if ((netdev->flags & IFF_PROMISC) || (netdev->flags & IFF_ALLMULTI) ||
1638	   (netdev_mc_count(netdev) > IXGB_MAX_NUM_MULTICAST_ADDRESSES)) {
1639		u64 multi = IXGB_READ_REG(&adapter->hw, MPRCL);
1640		u32 bcast_l = IXGB_READ_REG(&adapter->hw, BPRCL);
1641		u32 bcast_h = IXGB_READ_REG(&adapter->hw, BPRCH);
1642		u64 bcast = ((u64)bcast_h << 32) | bcast_l;
1643
1644		multi |= ((u64)IXGB_READ_REG(&adapter->hw, MPRCH) << 32);
1645		/* fix up multicast stats by removing broadcasts */
1646		if (multi >= bcast)
1647			multi -= bcast;
1648
1649		adapter->stats.mprcl += (multi & 0xFFFFFFFF);
1650		adapter->stats.mprch += (multi >> 32);
1651		adapter->stats.bprcl += bcast_l;
1652		adapter->stats.bprch += bcast_h;
1653	} else {
1654		adapter->stats.mprcl += IXGB_READ_REG(&adapter->hw, MPRCL);
1655		adapter->stats.mprch += IXGB_READ_REG(&adapter->hw, MPRCH);
1656		adapter->stats.bprcl += IXGB_READ_REG(&adapter->hw, BPRCL);
1657		adapter->stats.bprch += IXGB_READ_REG(&adapter->hw, BPRCH);
1658	}
1659	adapter->stats.tprl += IXGB_READ_REG(&adapter->hw, TPRL);
1660	adapter->stats.tprh += IXGB_READ_REG(&adapter->hw, TPRH);
1661	adapter->stats.gprcl += IXGB_READ_REG(&adapter->hw, GPRCL);
1662	adapter->stats.gprch += IXGB_READ_REG(&adapter->hw, GPRCH);
1663	adapter->stats.uprcl += IXGB_READ_REG(&adapter->hw, UPRCL);
1664	adapter->stats.uprch += IXGB_READ_REG(&adapter->hw, UPRCH);
1665	adapter->stats.vprcl += IXGB_READ_REG(&adapter->hw, VPRCL);
1666	adapter->stats.vprch += IXGB_READ_REG(&adapter->hw, VPRCH);
1667	adapter->stats.jprcl += IXGB_READ_REG(&adapter->hw, JPRCL);
1668	adapter->stats.jprch += IXGB_READ_REG(&adapter->hw, JPRCH);
1669	adapter->stats.gorcl += IXGB_READ_REG(&adapter->hw, GORCL);
1670	adapter->stats.gorch += IXGB_READ_REG(&adapter->hw, GORCH);
1671	adapter->stats.torl += IXGB_READ_REG(&adapter->hw, TORL);
1672	adapter->stats.torh += IXGB_READ_REG(&adapter->hw, TORH);
1673	adapter->stats.rnbc += IXGB_READ_REG(&adapter->hw, RNBC);
1674	adapter->stats.ruc += IXGB_READ_REG(&adapter->hw, RUC);
1675	adapter->stats.roc += IXGB_READ_REG(&adapter->hw, ROC);
1676	adapter->stats.rlec += IXGB_READ_REG(&adapter->hw, RLEC);
1677	adapter->stats.crcerrs += IXGB_READ_REG(&adapter->hw, CRCERRS);
1678	adapter->stats.icbc += IXGB_READ_REG(&adapter->hw, ICBC);
1679	adapter->stats.ecbc += IXGB_READ_REG(&adapter->hw, ECBC);
1680	adapter->stats.mpc += IXGB_READ_REG(&adapter->hw, MPC);
1681	adapter->stats.tptl += IXGB_READ_REG(&adapter->hw, TPTL);
1682	adapter->stats.tpth += IXGB_READ_REG(&adapter->hw, TPTH);
1683	adapter->stats.gptcl += IXGB_READ_REG(&adapter->hw, GPTCL);
1684	adapter->stats.gptch += IXGB_READ_REG(&adapter->hw, GPTCH);
1685	adapter->stats.bptcl += IXGB_READ_REG(&adapter->hw, BPTCL);
1686	adapter->stats.bptch += IXGB_READ_REG(&adapter->hw, BPTCH);
1687	adapter->stats.mptcl += IXGB_READ_REG(&adapter->hw, MPTCL);
1688	adapter->stats.mptch += IXGB_READ_REG(&adapter->hw, MPTCH);
1689	adapter->stats.uptcl += IXGB_READ_REG(&adapter->hw, UPTCL);
1690	adapter->stats.uptch += IXGB_READ_REG(&adapter->hw, UPTCH);
1691	adapter->stats.vptcl += IXGB_READ_REG(&adapter->hw, VPTCL);
1692	adapter->stats.vptch += IXGB_READ_REG(&adapter->hw, VPTCH);
1693	adapter->stats.jptcl += IXGB_READ_REG(&adapter->hw, JPTCL);
1694	adapter->stats.jptch += IXGB_READ_REG(&adapter->hw, JPTCH);
1695	adapter->stats.gotcl += IXGB_READ_REG(&adapter->hw, GOTCL);
1696	adapter->stats.gotch += IXGB_READ_REG(&adapter->hw, GOTCH);
1697	adapter->stats.totl += IXGB_READ_REG(&adapter->hw, TOTL);
1698	adapter->stats.toth += IXGB_READ_REG(&adapter->hw, TOTH);
1699	adapter->stats.dc += IXGB_READ_REG(&adapter->hw, DC);
1700	adapter->stats.plt64c += IXGB_READ_REG(&adapter->hw, PLT64C);
1701	adapter->stats.tsctc += IXGB_READ_REG(&adapter->hw, TSCTC);
1702	adapter->stats.tsctfc += IXGB_READ_REG(&adapter->hw, TSCTFC);
1703	adapter->stats.ibic += IXGB_READ_REG(&adapter->hw, IBIC);
1704	adapter->stats.rfc += IXGB_READ_REG(&adapter->hw, RFC);
1705	adapter->stats.lfc += IXGB_READ_REG(&adapter->hw, LFC);
1706	adapter->stats.pfrc += IXGB_READ_REG(&adapter->hw, PFRC);
1707	adapter->stats.pftc += IXGB_READ_REG(&adapter->hw, PFTC);
1708	adapter->stats.mcfrc += IXGB_READ_REG(&adapter->hw, MCFRC);
1709	adapter->stats.mcftc += IXGB_READ_REG(&adapter->hw, MCFTC);
1710	adapter->stats.xonrxc += IXGB_READ_REG(&adapter->hw, XONRXC);
1711	adapter->stats.xontxc += IXGB_READ_REG(&adapter->hw, XONTXC);
1712	adapter->stats.xoffrxc += IXGB_READ_REG(&adapter->hw, XOFFRXC);
1713	adapter->stats.xofftxc += IXGB_READ_REG(&adapter->hw, XOFFTXC);
1714	adapter->stats.rjc += IXGB_READ_REG(&adapter->hw, RJC);
1715
1716	/* Fill out the OS statistics structure */
1717
1718	netdev->stats.rx_packets = adapter->stats.gprcl;
1719	netdev->stats.tx_packets = adapter->stats.gptcl;
1720	netdev->stats.rx_bytes = adapter->stats.gorcl;
1721	netdev->stats.tx_bytes = adapter->stats.gotcl;
1722	netdev->stats.multicast = adapter->stats.mprcl;
1723	netdev->stats.collisions = 0;
1724
1725	/* ignore RLEC as it reports errors for padded (<64bytes) frames
1726	 * with a length in the type/len field */
1727	netdev->stats.rx_errors =
1728	    /* adapter->stats.rnbc + */ adapter->stats.crcerrs +
1729	    adapter->stats.ruc +
1730	    adapter->stats.roc /*+ adapter->stats.rlec */  +
1731	    adapter->stats.icbc +
1732	    adapter->stats.ecbc + adapter->stats.mpc;
1733
1734	/* see above
1735	 * netdev->stats.rx_length_errors = adapter->stats.rlec;
1736	 */
1737
1738	netdev->stats.rx_crc_errors = adapter->stats.crcerrs;
1739	netdev->stats.rx_fifo_errors = adapter->stats.mpc;
1740	netdev->stats.rx_missed_errors = adapter->stats.mpc;
1741	netdev->stats.rx_over_errors = adapter->stats.mpc;
1742
1743	netdev->stats.tx_errors = 0;
1744	netdev->stats.rx_frame_errors = 0;
1745	netdev->stats.tx_aborted_errors = 0;
1746	netdev->stats.tx_carrier_errors = 0;
1747	netdev->stats.tx_fifo_errors = 0;
1748	netdev->stats.tx_heartbeat_errors = 0;
1749	netdev->stats.tx_window_errors = 0;
1750}
1751
1752#define IXGB_MAX_INTR 10
1753/**
1754 * ixgb_intr - Interrupt Handler
1755 * @irq: interrupt number
1756 * @data: pointer to a network interface device structure
1757 **/
1758
1759static irqreturn_t
1760ixgb_intr(int irq, void *data)
1761{
1762	struct net_device *netdev = data;
1763	struct ixgb_adapter *adapter = netdev_priv(netdev);
1764	struct ixgb_hw *hw = &adapter->hw;
1765	u32 icr = IXGB_READ_REG(hw, ICR);
1766
1767	if (unlikely(!icr))
1768		return IRQ_NONE;  /* Not our interrupt */
1769
1770	if (unlikely(icr & (IXGB_INT_RXSEQ | IXGB_INT_LSC)))
1771		if (!test_bit(__IXGB_DOWN, &adapter->flags))
1772			mod_timer(&adapter->watchdog_timer, jiffies);
1773
1774	if (napi_schedule_prep(&adapter->napi)) {
1775
1776		/* Disable interrupts and register for poll. The flush
1777		  of the posted write is intentionally left out.
1778		*/
1779
1780		IXGB_WRITE_REG(&adapter->hw, IMC, ~0);
1781		__napi_schedule(&adapter->napi);
1782	}
1783	return IRQ_HANDLED;
1784}
1785
1786/**
1787 * ixgb_clean - NAPI Rx polling callback
1788 * @adapter: board private structure
1789 **/
1790
1791static int
1792ixgb_clean(struct napi_struct *napi, int budget)
1793{
1794	struct ixgb_adapter *adapter = container_of(napi, struct ixgb_adapter, napi);
1795	int work_done = 0;
1796
1797	ixgb_clean_tx_irq(adapter);
1798	ixgb_clean_rx_irq(adapter, &work_done, budget);
1799
1800	/* If budget not fully consumed, exit the polling mode */
1801	if (work_done < budget) {
1802		napi_complete_done(napi, work_done);
1803		if (!test_bit(__IXGB_DOWN, &adapter->flags))
1804			ixgb_irq_enable(adapter);
1805	}
1806
1807	return work_done;
1808}
1809
1810/**
1811 * ixgb_clean_tx_irq - Reclaim resources after transmit completes
1812 * @adapter: board private structure
1813 **/
1814
1815static bool
1816ixgb_clean_tx_irq(struct ixgb_adapter *adapter)
1817{
1818	struct ixgb_desc_ring *tx_ring = &adapter->tx_ring;
1819	struct net_device *netdev = adapter->netdev;
1820	struct ixgb_tx_desc *tx_desc, *eop_desc;
1821	struct ixgb_buffer *buffer_info;
1822	unsigned int i, eop;
1823	bool cleaned = false;
1824
1825	i = tx_ring->next_to_clean;
1826	eop = tx_ring->buffer_info[i].next_to_watch;
1827	eop_desc = IXGB_TX_DESC(*tx_ring, eop);
1828
1829	while (eop_desc->status & IXGB_TX_DESC_STATUS_DD) {
1830
1831		rmb(); /* read buffer_info after eop_desc */
1832		for (cleaned = false; !cleaned; ) {
1833			tx_desc = IXGB_TX_DESC(*tx_ring, i);
1834			buffer_info = &tx_ring->buffer_info[i];
1835
1836			if (tx_desc->popts &
1837			   (IXGB_TX_DESC_POPTS_TXSM |
1838			    IXGB_TX_DESC_POPTS_IXSM))
1839				adapter->hw_csum_tx_good++;
1840
1841			ixgb_unmap_and_free_tx_resource(adapter, buffer_info);
1842
1843			*(u32 *)&(tx_desc->status) = 0;
1844
1845			cleaned = (i == eop);
1846			if (++i == tx_ring->count) i = 0;
1847		}
1848
1849		eop = tx_ring->buffer_info[i].next_to_watch;
1850		eop_desc = IXGB_TX_DESC(*tx_ring, eop);
1851	}
1852
1853	tx_ring->next_to_clean = i;
1854
1855	if (unlikely(cleaned && netif_carrier_ok(netdev) &&
1856		     IXGB_DESC_UNUSED(tx_ring) >= DESC_NEEDED)) {
1857		/* Make sure that anybody stopping the queue after this
1858		 * sees the new next_to_clean. */
1859		smp_mb();
1860
1861		if (netif_queue_stopped(netdev) &&
1862		    !(test_bit(__IXGB_DOWN, &adapter->flags))) {
1863			netif_wake_queue(netdev);
1864			++adapter->restart_queue;
1865		}
1866	}
1867
1868	if (adapter->detect_tx_hung) {
1869		/* detect a transmit hang in hardware, this serializes the
1870		 * check with the clearing of time_stamp and movement of i */
1871		adapter->detect_tx_hung = false;
1872		if (tx_ring->buffer_info[eop].time_stamp &&
1873		   time_after(jiffies, tx_ring->buffer_info[eop].time_stamp + HZ)
1874		   && !(IXGB_READ_REG(&adapter->hw, STATUS) &
1875		        IXGB_STATUS_TXOFF)) {
1876			/* detected Tx unit hang */
1877			netif_err(adapter, drv, adapter->netdev,
1878				  "Detected Tx Unit Hang\n"
1879				  "  TDH                  <%x>\n"
1880				  "  TDT                  <%x>\n"
1881				  "  next_to_use          <%x>\n"
1882				  "  next_to_clean        <%x>\n"
1883				  "buffer_info[next_to_clean]\n"
1884				  "  time_stamp           <%lx>\n"
1885				  "  next_to_watch        <%x>\n"
1886				  "  jiffies              <%lx>\n"
1887				  "  next_to_watch.status <%x>\n",
1888				  IXGB_READ_REG(&adapter->hw, TDH),
1889				  IXGB_READ_REG(&adapter->hw, TDT),
1890				  tx_ring->next_to_use,
1891				  tx_ring->next_to_clean,
1892				  tx_ring->buffer_info[eop].time_stamp,
1893				  eop,
1894				  jiffies,
1895				  eop_desc->status);
1896			netif_stop_queue(netdev);
1897		}
1898	}
1899
1900	return cleaned;
1901}
1902
1903/**
1904 * ixgb_rx_checksum - Receive Checksum Offload for 82597.
1905 * @adapter: board private structure
1906 * @rx_desc: receive descriptor
1907 * @sk_buff: socket buffer with received data
1908 **/
1909
1910static void
1911ixgb_rx_checksum(struct ixgb_adapter *adapter,
1912                 struct ixgb_rx_desc *rx_desc,
1913                 struct sk_buff *skb)
1914{
1915	/* Ignore Checksum bit is set OR
1916	 * TCP Checksum has not been calculated
1917	 */
1918	if ((rx_desc->status & IXGB_RX_DESC_STATUS_IXSM) ||
1919	   (!(rx_desc->status & IXGB_RX_DESC_STATUS_TCPCS))) {
1920		skb_checksum_none_assert(skb);
1921		return;
1922	}
1923
1924	/* At this point we know the hardware did the TCP checksum */
1925	/* now look at the TCP checksum error bit */
1926	if (rx_desc->errors & IXGB_RX_DESC_ERRORS_TCPE) {
1927		/* let the stack verify checksum errors */
1928		skb_checksum_none_assert(skb);
1929		adapter->hw_csum_rx_error++;
1930	} else {
1931		/* TCP checksum is good */
1932		skb->ip_summed = CHECKSUM_UNNECESSARY;
1933		adapter->hw_csum_rx_good++;
1934	}
1935}
1936
1937/*
1938 * this should improve performance for small packets with large amounts
1939 * of reassembly being done in the stack
1940 */
1941static void ixgb_check_copybreak(struct napi_struct *napi,
1942				 struct ixgb_buffer *buffer_info,
1943				 u32 length, struct sk_buff **skb)
1944{
1945	struct sk_buff *new_skb;
1946
1947	if (length > copybreak)
1948		return;
1949
1950	new_skb = napi_alloc_skb(napi, length);
1951	if (!new_skb)
1952		return;
1953
1954	skb_copy_to_linear_data_offset(new_skb, -NET_IP_ALIGN,
1955				       (*skb)->data - NET_IP_ALIGN,
1956				       length + NET_IP_ALIGN);
1957	/* save the skb in buffer_info as good */
1958	buffer_info->skb = *skb;
1959	*skb = new_skb;
1960}
1961
1962/**
1963 * ixgb_clean_rx_irq - Send received data up the network stack,
1964 * @adapter: board private structure
1965 **/
1966
1967static bool
1968ixgb_clean_rx_irq(struct ixgb_adapter *adapter, int *work_done, int work_to_do)
1969{
1970	struct ixgb_desc_ring *rx_ring = &adapter->rx_ring;
1971	struct net_device *netdev = adapter->netdev;
1972	struct pci_dev *pdev = adapter->pdev;
1973	struct ixgb_rx_desc *rx_desc, *next_rxd;
1974	struct ixgb_buffer *buffer_info, *next_buffer, *next2_buffer;
1975	u32 length;
1976	unsigned int i, j;
1977	int cleaned_count = 0;
1978	bool cleaned = false;
1979
1980	i = rx_ring->next_to_clean;
1981	rx_desc = IXGB_RX_DESC(*rx_ring, i);
1982	buffer_info = &rx_ring->buffer_info[i];
1983
1984	while (rx_desc->status & IXGB_RX_DESC_STATUS_DD) {
1985		struct sk_buff *skb;
1986		u8 status;
1987
1988		if (*work_done >= work_to_do)
1989			break;
1990
1991		(*work_done)++;
1992		rmb();	/* read descriptor and rx_buffer_info after status DD */
1993		status = rx_desc->status;
1994		skb = buffer_info->skb;
1995		buffer_info->skb = NULL;
1996
1997		prefetch(skb->data - NET_IP_ALIGN);
1998
1999		if (++i == rx_ring->count)
2000			i = 0;
2001		next_rxd = IXGB_RX_DESC(*rx_ring, i);
2002		prefetch(next_rxd);
2003
2004		j = i + 1;
2005		if (j == rx_ring->count)
2006			j = 0;
2007		next2_buffer = &rx_ring->buffer_info[j];
2008		prefetch(next2_buffer);
2009
2010		next_buffer = &rx_ring->buffer_info[i];
2011
2012		cleaned = true;
2013		cleaned_count++;
2014
2015		dma_unmap_single(&pdev->dev,
2016				 buffer_info->dma,
2017				 buffer_info->length,
2018				 DMA_FROM_DEVICE);
2019		buffer_info->dma = 0;
2020
2021		length = le16_to_cpu(rx_desc->length);
2022		rx_desc->length = 0;
2023
2024		if (unlikely(!(status & IXGB_RX_DESC_STATUS_EOP))) {
2025
2026			/* All receives must fit into a single buffer */
2027
2028			pr_debug("Receive packet consumed multiple buffers length<%x>\n",
2029				 length);
2030
2031			dev_kfree_skb_irq(skb);
2032			goto rxdesc_done;
2033		}
2034
2035		if (unlikely(rx_desc->errors &
2036		    (IXGB_RX_DESC_ERRORS_CE | IXGB_RX_DESC_ERRORS_SE |
2037		     IXGB_RX_DESC_ERRORS_P | IXGB_RX_DESC_ERRORS_RXE))) {
2038			dev_kfree_skb_irq(skb);
2039			goto rxdesc_done;
2040		}
2041
2042		ixgb_check_copybreak(&adapter->napi, buffer_info, length, &skb);
2043
2044		/* Good Receive */
2045		skb_put(skb, length);
2046
2047		/* Receive Checksum Offload */
2048		ixgb_rx_checksum(adapter, rx_desc, skb);
2049
2050		skb->protocol = eth_type_trans(skb, netdev);
2051		if (status & IXGB_RX_DESC_STATUS_VP)
2052			__vlan_hwaccel_put_tag(skb, htons(ETH_P_8021Q),
2053				       le16_to_cpu(rx_desc->special));
2054
2055		netif_receive_skb(skb);
2056
2057rxdesc_done:
2058		/* clean up descriptor, might be written over by hw */
2059		rx_desc->status = 0;
2060
2061		/* return some buffers to hardware, one at a time is too slow */
2062		if (unlikely(cleaned_count >= IXGB_RX_BUFFER_WRITE)) {
2063			ixgb_alloc_rx_buffers(adapter, cleaned_count);
2064			cleaned_count = 0;
2065		}
2066
2067		/* use prefetched values */
2068		rx_desc = next_rxd;
2069		buffer_info = next_buffer;
2070	}
2071
2072	rx_ring->next_to_clean = i;
2073
2074	cleaned_count = IXGB_DESC_UNUSED(rx_ring);
2075	if (cleaned_count)
2076		ixgb_alloc_rx_buffers(adapter, cleaned_count);
2077
2078	return cleaned;
2079}
2080
2081/**
2082 * ixgb_alloc_rx_buffers - Replace used receive buffers
2083 * @adapter: address of board private structure
2084 **/
2085
2086static void
2087ixgb_alloc_rx_buffers(struct ixgb_adapter *adapter, int cleaned_count)
2088{
2089	struct ixgb_desc_ring *rx_ring = &adapter->rx_ring;
2090	struct net_device *netdev = adapter->netdev;
2091	struct pci_dev *pdev = adapter->pdev;
2092	struct ixgb_rx_desc *rx_desc;
2093	struct ixgb_buffer *buffer_info;
2094	struct sk_buff *skb;
2095	unsigned int i;
2096	long cleancount;
2097
2098	i = rx_ring->next_to_use;
2099	buffer_info = &rx_ring->buffer_info[i];
2100	cleancount = IXGB_DESC_UNUSED(rx_ring);
2101
2102
2103	/* leave three descriptors unused */
2104	while (--cleancount > 2 && cleaned_count--) {
2105		/* recycle! its good for you */
2106		skb = buffer_info->skb;
2107		if (skb) {
2108			skb_trim(skb, 0);
2109			goto map_skb;
2110		}
2111
2112		skb = netdev_alloc_skb_ip_align(netdev, adapter->rx_buffer_len);
2113		if (unlikely(!skb)) {
2114			/* Better luck next round */
2115			adapter->alloc_rx_buff_failed++;
2116			break;
2117		}
2118
2119		buffer_info->skb = skb;
2120		buffer_info->length = adapter->rx_buffer_len;
2121map_skb:
2122		buffer_info->dma = dma_map_single(&pdev->dev,
2123		                                  skb->data,
2124		                                  adapter->rx_buffer_len,
2125						  DMA_FROM_DEVICE);
2126		if (dma_mapping_error(&pdev->dev, buffer_info->dma)) {
2127			adapter->alloc_rx_buff_failed++;
2128			break;
2129		}
2130
2131		rx_desc = IXGB_RX_DESC(*rx_ring, i);
2132		rx_desc->buff_addr = cpu_to_le64(buffer_info->dma);
2133		/* guarantee DD bit not set now before h/w gets descriptor
2134		 * this is the rest of the workaround for h/w double
2135		 * writeback. */
2136		rx_desc->status = 0;
2137
2138
2139		if (++i == rx_ring->count)
2140			i = 0;
2141		buffer_info = &rx_ring->buffer_info[i];
2142	}
2143
2144	if (likely(rx_ring->next_to_use != i)) {
2145		rx_ring->next_to_use = i;
2146		if (unlikely(i-- == 0))
2147			i = (rx_ring->count - 1);
2148
2149		/* Force memory writes to complete before letting h/w
2150		 * know there are new descriptors to fetch.  (Only
2151		 * applicable for weak-ordered memory model archs, such
2152		 * as IA-64). */
2153		wmb();
2154		IXGB_WRITE_REG(&adapter->hw, RDT, i);
2155	}
2156}
2157
2158static void
2159ixgb_vlan_strip_enable(struct ixgb_adapter *adapter)
2160{
2161	u32 ctrl;
2162
2163	/* enable VLAN tag insert/strip */
2164	ctrl = IXGB_READ_REG(&adapter->hw, CTRL0);
2165	ctrl |= IXGB_CTRL0_VME;
2166	IXGB_WRITE_REG(&adapter->hw, CTRL0, ctrl);
2167}
2168
2169static void
2170ixgb_vlan_strip_disable(struct ixgb_adapter *adapter)
2171{
2172	u32 ctrl;
2173
2174	/* disable VLAN tag insert/strip */
2175	ctrl = IXGB_READ_REG(&adapter->hw, CTRL0);
2176	ctrl &= ~IXGB_CTRL0_VME;
2177	IXGB_WRITE_REG(&adapter->hw, CTRL0, ctrl);
2178}
2179
2180static int
2181ixgb_vlan_rx_add_vid(struct net_device *netdev, __be16 proto, u16 vid)
2182{
2183	struct ixgb_adapter *adapter = netdev_priv(netdev);
2184	u32 vfta, index;
2185
2186	/* add VID to filter table */
2187
2188	index = (vid >> 5) & 0x7F;
2189	vfta = IXGB_READ_REG_ARRAY(&adapter->hw, VFTA, index);
2190	vfta |= (1 << (vid & 0x1F));
2191	ixgb_write_vfta(&adapter->hw, index, vfta);
2192	set_bit(vid, adapter->active_vlans);
2193
2194	return 0;
2195}
2196
2197static int
2198ixgb_vlan_rx_kill_vid(struct net_device *netdev, __be16 proto, u16 vid)
2199{
2200	struct ixgb_adapter *adapter = netdev_priv(netdev);
2201	u32 vfta, index;
2202
2203	/* remove VID from filter table */
2204
2205	index = (vid >> 5) & 0x7F;
2206	vfta = IXGB_READ_REG_ARRAY(&adapter->hw, VFTA, index);
2207	vfta &= ~(1 << (vid & 0x1F));
2208	ixgb_write_vfta(&adapter->hw, index, vfta);
2209	clear_bit(vid, adapter->active_vlans);
2210
2211	return 0;
2212}
2213
2214static void
2215ixgb_restore_vlan(struct ixgb_adapter *adapter)
2216{
2217	u16 vid;
2218
2219	for_each_set_bit(vid, adapter->active_vlans, VLAN_N_VID)
2220		ixgb_vlan_rx_add_vid(adapter->netdev, htons(ETH_P_8021Q), vid);
2221}
2222
2223#ifdef CONFIG_NET_POLL_CONTROLLER
2224/*
2225 * Polling 'interrupt' - used by things like netconsole to send skbs
2226 * without having to re-enable interrupts. It's not called while
2227 * the interrupt routine is executing.
2228 */
2229
2230static void ixgb_netpoll(struct net_device *dev)
2231{
2232	struct ixgb_adapter *adapter = netdev_priv(dev);
2233
2234	disable_irq(adapter->pdev->irq);
2235	ixgb_intr(adapter->pdev->irq, dev);
2236	enable_irq(adapter->pdev->irq);
2237}
2238#endif
2239
2240/**
2241 * ixgb_io_error_detected - called when PCI error is detected
2242 * @pdev:    pointer to pci device with error
2243 * @state:   pci channel state after error
2244 *
2245 * This callback is called by the PCI subsystem whenever
2246 * a PCI bus error is detected.
2247 */
2248static pci_ers_result_t ixgb_io_error_detected(struct pci_dev *pdev,
2249                                               enum pci_channel_state state)
2250{
2251	struct net_device *netdev = pci_get_drvdata(pdev);
2252	struct ixgb_adapter *adapter = netdev_priv(netdev);
2253
2254	netif_device_detach(netdev);
2255
2256	if (state == pci_channel_io_perm_failure)
2257		return PCI_ERS_RESULT_DISCONNECT;
2258
2259	if (netif_running(netdev))
2260		ixgb_down(adapter, true);
2261
2262	pci_disable_device(pdev);
2263
2264	/* Request a slot reset. */
2265	return PCI_ERS_RESULT_NEED_RESET;
2266}
2267
2268/**
2269 * ixgb_io_slot_reset - called after the pci bus has been reset.
2270 * @pdev    pointer to pci device with error
2271 *
2272 * This callback is called after the PCI bus has been reset.
2273 * Basically, this tries to restart the card from scratch.
2274 * This is a shortened version of the device probe/discovery code,
2275 * it resembles the first-half of the ixgb_probe() routine.
2276 */
2277static pci_ers_result_t ixgb_io_slot_reset(struct pci_dev *pdev)
2278{
2279	struct net_device *netdev = pci_get_drvdata(pdev);
2280	struct ixgb_adapter *adapter = netdev_priv(netdev);
2281
2282	if (pci_enable_device(pdev)) {
2283		netif_err(adapter, probe, adapter->netdev,
2284			  "Cannot re-enable PCI device after reset\n");
2285		return PCI_ERS_RESULT_DISCONNECT;
2286	}
2287
2288	/* Perform card reset only on one instance of the card */
2289	if (0 != PCI_FUNC (pdev->devfn))
2290		return PCI_ERS_RESULT_RECOVERED;
2291
2292	pci_set_master(pdev);
2293
2294	netif_carrier_off(netdev);
2295	netif_stop_queue(netdev);
2296	ixgb_reset(adapter);
2297
2298	/* Make sure the EEPROM is good */
2299	if (!ixgb_validate_eeprom_checksum(&adapter->hw)) {
2300		netif_err(adapter, probe, adapter->netdev,
2301			  "After reset, the EEPROM checksum is not valid\n");
2302		return PCI_ERS_RESULT_DISCONNECT;
2303	}
2304	ixgb_get_ee_mac_addr(&adapter->hw, netdev->dev_addr);
2305	memcpy(netdev->perm_addr, netdev->dev_addr, netdev->addr_len);
2306
2307	if (!is_valid_ether_addr(netdev->perm_addr)) {
2308		netif_err(adapter, probe, adapter->netdev,
2309			  "After reset, invalid MAC address\n");
2310		return PCI_ERS_RESULT_DISCONNECT;
2311	}
2312
2313	return PCI_ERS_RESULT_RECOVERED;
2314}
2315
2316/**
2317 * ixgb_io_resume - called when its OK to resume normal operations
2318 * @pdev    pointer to pci device with error
2319 *
2320 * The error recovery driver tells us that its OK to resume
2321 * normal operation. Implementation resembles the second-half
2322 * of the ixgb_probe() routine.
2323 */
2324static void ixgb_io_resume(struct pci_dev *pdev)
2325{
2326	struct net_device *netdev = pci_get_drvdata(pdev);
2327	struct ixgb_adapter *adapter = netdev_priv(netdev);
2328
2329	pci_set_master(pdev);
2330
2331	if (netif_running(netdev)) {
2332		if (ixgb_up(adapter)) {
2333			pr_err("can't bring device back up after reset\n");
2334			return;
2335		}
2336	}
2337
2338	netif_device_attach(netdev);
2339	mod_timer(&adapter->watchdog_timer, jiffies);
2340}
2341
2342/* ixgb_main.c */