Linux Audio

Check our new training course

Loading...
Note: File does not exist in v6.13.7.
   1/*******************************************************************************
   2
   3  Intel PRO/10GbE Linux driver
   4  Copyright(c) 1999 - 2008 Intel Corporation.
   5
   6  This program is free software; you can redistribute it and/or modify it
   7  under the terms and conditions of the GNU General Public License,
   8  version 2, as published by the Free Software Foundation.
   9
  10  This program is distributed in the hope it will be useful, but WITHOUT
  11  ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  12  FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
  13  more details.
  14
  15  You should have received a copy of the GNU General Public License along with
  16  this program; if not, write to the Free Software Foundation, Inc.,
  17  51 Franklin St - Fifth Floor, Boston, MA 02110-1301 USA.
  18
  19  The full GNU General Public License is included in this distribution in
  20  the file called "COPYING".
  21
  22  Contact Information:
  23  Linux NICS <linux.nics@intel.com>
  24  e1000-devel Mailing List <e1000-devel@lists.sourceforge.net>
  25  Intel Corporation, 5200 N.E. Elam Young Parkway, Hillsboro, OR 97124-6497
  26
  27*******************************************************************************/
  28
  29#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
  30
  31#include <linux/prefetch.h>
  32#include "ixgb.h"
  33
  34char ixgb_driver_name[] = "ixgb";
  35static char ixgb_driver_string[] = "Intel(R) PRO/10GbE Network Driver";
  36
  37#define DRIVERNAPI "-NAPI"
  38#define DRV_VERSION "1.0.135-k2" DRIVERNAPI
  39const char ixgb_driver_version[] = DRV_VERSION;
  40static const char ixgb_copyright[] = "Copyright (c) 1999-2008 Intel Corporation.";
  41
  42#define IXGB_CB_LENGTH 256
  43static unsigned int copybreak __read_mostly = IXGB_CB_LENGTH;
  44module_param(copybreak, uint, 0644);
  45MODULE_PARM_DESC(copybreak,
  46	"Maximum size of packet that is copied to a new buffer on receive");
  47
  48/* ixgb_pci_tbl - PCI Device ID Table
  49 *
  50 * Wildcard entries (PCI_ANY_ID) should come last
  51 * Last entry must be all 0s
  52 *
  53 * { Vendor ID, Device ID, SubVendor ID, SubDevice ID,
  54 *   Class, Class Mask, private data (not used) }
  55 */
  56static DEFINE_PCI_DEVICE_TABLE(ixgb_pci_tbl) = {
  57	{PCI_VENDOR_ID_INTEL, IXGB_DEVICE_ID_82597EX,
  58	 PCI_ANY_ID, PCI_ANY_ID, 0, 0, 0},
  59	{PCI_VENDOR_ID_INTEL, IXGB_DEVICE_ID_82597EX_CX4,
  60	 PCI_ANY_ID, PCI_ANY_ID, 0, 0, 0},
  61	{PCI_VENDOR_ID_INTEL, IXGB_DEVICE_ID_82597EX_SR,
  62	 PCI_ANY_ID, PCI_ANY_ID, 0, 0, 0},
  63	{PCI_VENDOR_ID_INTEL, IXGB_DEVICE_ID_82597EX_LR,
  64	 PCI_ANY_ID, PCI_ANY_ID, 0, 0, 0},
  65
  66	/* required last entry */
  67	{0,}
  68};
  69
  70MODULE_DEVICE_TABLE(pci, ixgb_pci_tbl);
  71
  72/* Local Function Prototypes */
  73static int ixgb_init_module(void);
  74static void ixgb_exit_module(void);
  75static int ixgb_probe(struct pci_dev *pdev, const struct pci_device_id *ent);
  76static void ixgb_remove(struct pci_dev *pdev);
  77static int ixgb_sw_init(struct ixgb_adapter *adapter);
  78static int ixgb_open(struct net_device *netdev);
  79static int ixgb_close(struct net_device *netdev);
  80static void ixgb_configure_tx(struct ixgb_adapter *adapter);
  81static void ixgb_configure_rx(struct ixgb_adapter *adapter);
  82static void ixgb_setup_rctl(struct ixgb_adapter *adapter);
  83static void ixgb_clean_tx_ring(struct ixgb_adapter *adapter);
  84static void ixgb_clean_rx_ring(struct ixgb_adapter *adapter);
  85static void ixgb_set_multi(struct net_device *netdev);
  86static void ixgb_watchdog(unsigned long data);
  87static netdev_tx_t ixgb_xmit_frame(struct sk_buff *skb,
  88				   struct net_device *netdev);
  89static struct net_device_stats *ixgb_get_stats(struct net_device *netdev);
  90static int ixgb_change_mtu(struct net_device *netdev, int new_mtu);
  91static int ixgb_set_mac(struct net_device *netdev, void *p);
  92static irqreturn_t ixgb_intr(int irq, void *data);
  93static bool ixgb_clean_tx_irq(struct ixgb_adapter *adapter);
  94
  95static int ixgb_clean(struct napi_struct *, int);
  96static bool ixgb_clean_rx_irq(struct ixgb_adapter *, int *, int);
  97static void ixgb_alloc_rx_buffers(struct ixgb_adapter *, int);
  98
  99static void ixgb_tx_timeout(struct net_device *dev);
 100static void ixgb_tx_timeout_task(struct work_struct *work);
 101
 102static void ixgb_vlan_strip_enable(struct ixgb_adapter *adapter);
 103static void ixgb_vlan_strip_disable(struct ixgb_adapter *adapter);
 104static int ixgb_vlan_rx_add_vid(struct net_device *netdev,
 105				__be16 proto, u16 vid);
 106static int ixgb_vlan_rx_kill_vid(struct net_device *netdev,
 107				 __be16 proto, u16 vid);
 108static void ixgb_restore_vlan(struct ixgb_adapter *adapter);
 109
 110#ifdef CONFIG_NET_POLL_CONTROLLER
 111/* for netdump / net console */
 112static void ixgb_netpoll(struct net_device *dev);
 113#endif
 114
 115static pci_ers_result_t ixgb_io_error_detected (struct pci_dev *pdev,
 116                             enum pci_channel_state state);
 117static pci_ers_result_t ixgb_io_slot_reset (struct pci_dev *pdev);
 118static void ixgb_io_resume (struct pci_dev *pdev);
 119
 120static const struct pci_error_handlers ixgb_err_handler = {
 121	.error_detected = ixgb_io_error_detected,
 122	.slot_reset = ixgb_io_slot_reset,
 123	.resume = ixgb_io_resume,
 124};
 125
 126static struct pci_driver ixgb_driver = {
 127	.name     = ixgb_driver_name,
 128	.id_table = ixgb_pci_tbl,
 129	.probe    = ixgb_probe,
 130	.remove   = ixgb_remove,
 131	.err_handler = &ixgb_err_handler
 132};
 133
 134MODULE_AUTHOR("Intel Corporation, <linux.nics@intel.com>");
 135MODULE_DESCRIPTION("Intel(R) PRO/10GbE Network Driver");
 136MODULE_LICENSE("GPL");
 137MODULE_VERSION(DRV_VERSION);
 138
 139#define DEFAULT_MSG_ENABLE (NETIF_MSG_DRV|NETIF_MSG_PROBE|NETIF_MSG_LINK)
 140static int debug = -1;
 141module_param(debug, int, 0);
 142MODULE_PARM_DESC(debug, "Debug level (0=none,...,16=all)");
 143
 144/**
 145 * ixgb_init_module - Driver Registration Routine
 146 *
 147 * ixgb_init_module is the first routine called when the driver is
 148 * loaded. All it does is register with the PCI subsystem.
 149 **/
 150
 151static int __init
 152ixgb_init_module(void)
 153{
 154	pr_info("%s - version %s\n", ixgb_driver_string, ixgb_driver_version);
 155	pr_info("%s\n", ixgb_copyright);
 156
 157	return pci_register_driver(&ixgb_driver);
 158}
 159
 160module_init(ixgb_init_module);
 161
 162/**
 163 * ixgb_exit_module - Driver Exit Cleanup Routine
 164 *
 165 * ixgb_exit_module is called just before the driver is removed
 166 * from memory.
 167 **/
 168
 169static void __exit
 170ixgb_exit_module(void)
 171{
 172	pci_unregister_driver(&ixgb_driver);
 173}
 174
 175module_exit(ixgb_exit_module);
 176
 177/**
 178 * ixgb_irq_disable - Mask off interrupt generation on the NIC
 179 * @adapter: board private structure
 180 **/
 181
 182static void
 183ixgb_irq_disable(struct ixgb_adapter *adapter)
 184{
 185	IXGB_WRITE_REG(&adapter->hw, IMC, ~0);
 186	IXGB_WRITE_FLUSH(&adapter->hw);
 187	synchronize_irq(adapter->pdev->irq);
 188}
 189
 190/**
 191 * ixgb_irq_enable - Enable default interrupt generation settings
 192 * @adapter: board private structure
 193 **/
 194
 195static void
 196ixgb_irq_enable(struct ixgb_adapter *adapter)
 197{
 198	u32 val = IXGB_INT_RXT0 | IXGB_INT_RXDMT0 |
 199		  IXGB_INT_TXDW | IXGB_INT_LSC;
 200	if (adapter->hw.subsystem_vendor_id == PCI_VENDOR_ID_SUN)
 201		val |= IXGB_INT_GPI0;
 202	IXGB_WRITE_REG(&adapter->hw, IMS, val);
 203	IXGB_WRITE_FLUSH(&adapter->hw);
 204}
 205
 206int
 207ixgb_up(struct ixgb_adapter *adapter)
 208{
 209	struct net_device *netdev = adapter->netdev;
 210	int err, irq_flags = IRQF_SHARED;
 211	int max_frame = netdev->mtu + ENET_HEADER_SIZE + ENET_FCS_LENGTH;
 212	struct ixgb_hw *hw = &adapter->hw;
 213
 214	/* hardware has been reset, we need to reload some things */
 215
 216	ixgb_rar_set(hw, netdev->dev_addr, 0);
 217	ixgb_set_multi(netdev);
 218
 219	ixgb_restore_vlan(adapter);
 220
 221	ixgb_configure_tx(adapter);
 222	ixgb_setup_rctl(adapter);
 223	ixgb_configure_rx(adapter);
 224	ixgb_alloc_rx_buffers(adapter, IXGB_DESC_UNUSED(&adapter->rx_ring));
 225
 226	/* disable interrupts and get the hardware into a known state */
 227	IXGB_WRITE_REG(&adapter->hw, IMC, 0xffffffff);
 228
 229	/* only enable MSI if bus is in PCI-X mode */
 230	if (IXGB_READ_REG(&adapter->hw, STATUS) & IXGB_STATUS_PCIX_MODE) {
 231		err = pci_enable_msi(adapter->pdev);
 232		if (!err) {
 233			adapter->have_msi = true;
 234			irq_flags = 0;
 235		}
 236		/* proceed to try to request regular interrupt */
 237	}
 238
 239	err = request_irq(adapter->pdev->irq, ixgb_intr, irq_flags,
 240	                  netdev->name, netdev);
 241	if (err) {
 242		if (adapter->have_msi)
 243			pci_disable_msi(adapter->pdev);
 244		netif_err(adapter, probe, adapter->netdev,
 245			  "Unable to allocate interrupt Error: %d\n", err);
 246		return err;
 247	}
 248
 249	if ((hw->max_frame_size != max_frame) ||
 250		(hw->max_frame_size !=
 251		(IXGB_READ_REG(hw, MFS) >> IXGB_MFS_SHIFT))) {
 252
 253		hw->max_frame_size = max_frame;
 254
 255		IXGB_WRITE_REG(hw, MFS, hw->max_frame_size << IXGB_MFS_SHIFT);
 256
 257		if (hw->max_frame_size >
 258		   IXGB_MAX_ENET_FRAME_SIZE_WITHOUT_FCS + ENET_FCS_LENGTH) {
 259			u32 ctrl0 = IXGB_READ_REG(hw, CTRL0);
 260
 261			if (!(ctrl0 & IXGB_CTRL0_JFE)) {
 262				ctrl0 |= IXGB_CTRL0_JFE;
 263				IXGB_WRITE_REG(hw, CTRL0, ctrl0);
 264			}
 265		}
 266	}
 267
 268	clear_bit(__IXGB_DOWN, &adapter->flags);
 269
 270	napi_enable(&adapter->napi);
 271	ixgb_irq_enable(adapter);
 272
 273	netif_wake_queue(netdev);
 274
 275	mod_timer(&adapter->watchdog_timer, jiffies);
 276
 277	return 0;
 278}
 279
 280void
 281ixgb_down(struct ixgb_adapter *adapter, bool kill_watchdog)
 282{
 283	struct net_device *netdev = adapter->netdev;
 284
 285	/* prevent the interrupt handler from restarting watchdog */
 286	set_bit(__IXGB_DOWN, &adapter->flags);
 287
 288	napi_disable(&adapter->napi);
 289	/* waiting for NAPI to complete can re-enable interrupts */
 290	ixgb_irq_disable(adapter);
 291	free_irq(adapter->pdev->irq, netdev);
 292
 293	if (adapter->have_msi)
 294		pci_disable_msi(adapter->pdev);
 295
 296	if (kill_watchdog)
 297		del_timer_sync(&adapter->watchdog_timer);
 298
 299	adapter->link_speed = 0;
 300	adapter->link_duplex = 0;
 301	netif_carrier_off(netdev);
 302	netif_stop_queue(netdev);
 303
 304	ixgb_reset(adapter);
 305	ixgb_clean_tx_ring(adapter);
 306	ixgb_clean_rx_ring(adapter);
 307}
 308
 309void
 310ixgb_reset(struct ixgb_adapter *adapter)
 311{
 312	struct ixgb_hw *hw = &adapter->hw;
 313
 314	ixgb_adapter_stop(hw);
 315	if (!ixgb_init_hw(hw))
 316		netif_err(adapter, probe, adapter->netdev, "ixgb_init_hw failed\n");
 317
 318	/* restore frame size information */
 319	IXGB_WRITE_REG(hw, MFS, hw->max_frame_size << IXGB_MFS_SHIFT);
 320	if (hw->max_frame_size >
 321	    IXGB_MAX_ENET_FRAME_SIZE_WITHOUT_FCS + ENET_FCS_LENGTH) {
 322		u32 ctrl0 = IXGB_READ_REG(hw, CTRL0);
 323		if (!(ctrl0 & IXGB_CTRL0_JFE)) {
 324			ctrl0 |= IXGB_CTRL0_JFE;
 325			IXGB_WRITE_REG(hw, CTRL0, ctrl0);
 326		}
 327	}
 328}
 329
 330static netdev_features_t
 331ixgb_fix_features(struct net_device *netdev, netdev_features_t features)
 332{
 333	/*
 334	 * Tx VLAN insertion does not work per HW design when Rx stripping is
 335	 * disabled.
 336	 */
 337	if (!(features & NETIF_F_HW_VLAN_CTAG_RX))
 338		features &= ~NETIF_F_HW_VLAN_CTAG_TX;
 339
 340	return features;
 341}
 342
 343static int
 344ixgb_set_features(struct net_device *netdev, netdev_features_t features)
 345{
 346	struct ixgb_adapter *adapter = netdev_priv(netdev);
 347	netdev_features_t changed = features ^ netdev->features;
 348
 349	if (!(changed & (NETIF_F_RXCSUM|NETIF_F_HW_VLAN_CTAG_RX)))
 350		return 0;
 351
 352	adapter->rx_csum = !!(features & NETIF_F_RXCSUM);
 353
 354	if (netif_running(netdev)) {
 355		ixgb_down(adapter, true);
 356		ixgb_up(adapter);
 357		ixgb_set_speed_duplex(netdev);
 358	} else
 359		ixgb_reset(adapter);
 360
 361	return 0;
 362}
 363
 364
 365static const struct net_device_ops ixgb_netdev_ops = {
 366	.ndo_open 		= ixgb_open,
 367	.ndo_stop		= ixgb_close,
 368	.ndo_start_xmit		= ixgb_xmit_frame,
 369	.ndo_get_stats		= ixgb_get_stats,
 370	.ndo_set_rx_mode	= ixgb_set_multi,
 371	.ndo_validate_addr	= eth_validate_addr,
 372	.ndo_set_mac_address	= ixgb_set_mac,
 373	.ndo_change_mtu		= ixgb_change_mtu,
 374	.ndo_tx_timeout		= ixgb_tx_timeout,
 375	.ndo_vlan_rx_add_vid	= ixgb_vlan_rx_add_vid,
 376	.ndo_vlan_rx_kill_vid	= ixgb_vlan_rx_kill_vid,
 377#ifdef CONFIG_NET_POLL_CONTROLLER
 378	.ndo_poll_controller	= ixgb_netpoll,
 379#endif
 380	.ndo_fix_features       = ixgb_fix_features,
 381	.ndo_set_features       = ixgb_set_features,
 382};
 383
 384/**
 385 * ixgb_probe - Device Initialization Routine
 386 * @pdev: PCI device information struct
 387 * @ent: entry in ixgb_pci_tbl
 388 *
 389 * Returns 0 on success, negative on failure
 390 *
 391 * ixgb_probe initializes an adapter identified by a pci_dev structure.
 392 * The OS initialization, configuring of the adapter private structure,
 393 * and a hardware reset occur.
 394 **/
 395
 396static int
 397ixgb_probe(struct pci_dev *pdev, const struct pci_device_id *ent)
 398{
 399	struct net_device *netdev = NULL;
 400	struct ixgb_adapter *adapter;
 401	static int cards_found = 0;
 402	int pci_using_dac;
 403	int i;
 404	int err;
 405
 406	err = pci_enable_device(pdev);
 407	if (err)
 408		return err;
 409
 410	pci_using_dac = 0;
 411	err = dma_set_mask_and_coherent(&pdev->dev, DMA_BIT_MASK(64));
 412	if (!err) {
 413		pci_using_dac = 1;
 414	} else {
 415		err = dma_set_mask_and_coherent(&pdev->dev, DMA_BIT_MASK(32));
 416		if (err) {
 417			pr_err("No usable DMA configuration, aborting\n");
 418			goto err_dma_mask;
 419		}
 420	}
 421
 422	err = pci_request_regions(pdev, ixgb_driver_name);
 423	if (err)
 424		goto err_request_regions;
 425
 426	pci_set_master(pdev);
 427
 428	netdev = alloc_etherdev(sizeof(struct ixgb_adapter));
 429	if (!netdev) {
 430		err = -ENOMEM;
 431		goto err_alloc_etherdev;
 432	}
 433
 434	SET_NETDEV_DEV(netdev, &pdev->dev);
 435
 436	pci_set_drvdata(pdev, netdev);
 437	adapter = netdev_priv(netdev);
 438	adapter->netdev = netdev;
 439	adapter->pdev = pdev;
 440	adapter->hw.back = adapter;
 441	adapter->msg_enable = netif_msg_init(debug, DEFAULT_MSG_ENABLE);
 442
 443	adapter->hw.hw_addr = pci_ioremap_bar(pdev, BAR_0);
 444	if (!adapter->hw.hw_addr) {
 445		err = -EIO;
 446		goto err_ioremap;
 447	}
 448
 449	for (i = BAR_1; i <= BAR_5; i++) {
 450		if (pci_resource_len(pdev, i) == 0)
 451			continue;
 452		if (pci_resource_flags(pdev, i) & IORESOURCE_IO) {
 453			adapter->hw.io_base = pci_resource_start(pdev, i);
 454			break;
 455		}
 456	}
 457
 458	netdev->netdev_ops = &ixgb_netdev_ops;
 459	ixgb_set_ethtool_ops(netdev);
 460	netdev->watchdog_timeo = 5 * HZ;
 461	netif_napi_add(netdev, &adapter->napi, ixgb_clean, 64);
 462
 463	strncpy(netdev->name, pci_name(pdev), sizeof(netdev->name) - 1);
 464
 465	adapter->bd_number = cards_found;
 466	adapter->link_speed = 0;
 467	adapter->link_duplex = 0;
 468
 469	/* setup the private structure */
 470
 471	err = ixgb_sw_init(adapter);
 472	if (err)
 473		goto err_sw_init;
 474
 475	netdev->hw_features = NETIF_F_SG |
 476			   NETIF_F_TSO |
 477			   NETIF_F_HW_CSUM |
 478			   NETIF_F_HW_VLAN_CTAG_TX |
 479			   NETIF_F_HW_VLAN_CTAG_RX;
 480	netdev->features = netdev->hw_features |
 481			   NETIF_F_HW_VLAN_CTAG_FILTER;
 482	netdev->hw_features |= NETIF_F_RXCSUM;
 483
 484	if (pci_using_dac) {
 485		netdev->features |= NETIF_F_HIGHDMA;
 486		netdev->vlan_features |= NETIF_F_HIGHDMA;
 487	}
 488
 489	/* make sure the EEPROM is good */
 490
 491	if (!ixgb_validate_eeprom_checksum(&adapter->hw)) {
 492		netif_err(adapter, probe, adapter->netdev,
 493			  "The EEPROM Checksum Is Not Valid\n");
 494		err = -EIO;
 495		goto err_eeprom;
 496	}
 497
 498	ixgb_get_ee_mac_addr(&adapter->hw, netdev->dev_addr);
 499
 500	if (!is_valid_ether_addr(netdev->dev_addr)) {
 501		netif_err(adapter, probe, adapter->netdev, "Invalid MAC Address\n");
 502		err = -EIO;
 503		goto err_eeprom;
 504	}
 505
 506	adapter->part_num = ixgb_get_ee_pba_number(&adapter->hw);
 507
 508	init_timer(&adapter->watchdog_timer);
 509	adapter->watchdog_timer.function = ixgb_watchdog;
 510	adapter->watchdog_timer.data = (unsigned long)adapter;
 511
 512	INIT_WORK(&adapter->tx_timeout_task, ixgb_tx_timeout_task);
 513
 514	strcpy(netdev->name, "eth%d");
 515	err = register_netdev(netdev);
 516	if (err)
 517		goto err_register;
 518
 519	/* carrier off reporting is important to ethtool even BEFORE open */
 520	netif_carrier_off(netdev);
 521
 522	netif_info(adapter, probe, adapter->netdev,
 523		   "Intel(R) PRO/10GbE Network Connection\n");
 524	ixgb_check_options(adapter);
 525	/* reset the hardware with the new settings */
 526
 527	ixgb_reset(adapter);
 528
 529	cards_found++;
 530	return 0;
 531
 532err_register:
 533err_sw_init:
 534err_eeprom:
 535	iounmap(adapter->hw.hw_addr);
 536err_ioremap:
 537	free_netdev(netdev);
 538err_alloc_etherdev:
 539	pci_release_regions(pdev);
 540err_request_regions:
 541err_dma_mask:
 542	pci_disable_device(pdev);
 543	return err;
 544}
 545
 546/**
 547 * ixgb_remove - Device Removal Routine
 548 * @pdev: PCI device information struct
 549 *
 550 * ixgb_remove is called by the PCI subsystem to alert the driver
 551 * that it should release a PCI device.  The could be caused by a
 552 * Hot-Plug event, or because the driver is going to be removed from
 553 * memory.
 554 **/
 555
 556static void
 557ixgb_remove(struct pci_dev *pdev)
 558{
 559	struct net_device *netdev = pci_get_drvdata(pdev);
 560	struct ixgb_adapter *adapter = netdev_priv(netdev);
 561
 562	cancel_work_sync(&adapter->tx_timeout_task);
 563
 564	unregister_netdev(netdev);
 565
 566	iounmap(adapter->hw.hw_addr);
 567	pci_release_regions(pdev);
 568
 569	free_netdev(netdev);
 570	pci_disable_device(pdev);
 571}
 572
 573/**
 574 * ixgb_sw_init - Initialize general software structures (struct ixgb_adapter)
 575 * @adapter: board private structure to initialize
 576 *
 577 * ixgb_sw_init initializes the Adapter private data structure.
 578 * Fields are initialized based on PCI device information and
 579 * OS network device settings (MTU size).
 580 **/
 581
 582static int
 583ixgb_sw_init(struct ixgb_adapter *adapter)
 584{
 585	struct ixgb_hw *hw = &adapter->hw;
 586	struct net_device *netdev = adapter->netdev;
 587	struct pci_dev *pdev = adapter->pdev;
 588
 589	/* PCI config space info */
 590
 591	hw->vendor_id = pdev->vendor;
 592	hw->device_id = pdev->device;
 593	hw->subsystem_vendor_id = pdev->subsystem_vendor;
 594	hw->subsystem_id = pdev->subsystem_device;
 595
 596	hw->max_frame_size = netdev->mtu + ENET_HEADER_SIZE + ENET_FCS_LENGTH;
 597	adapter->rx_buffer_len = hw->max_frame_size + 8; /* + 8 for errata */
 598
 599	if ((hw->device_id == IXGB_DEVICE_ID_82597EX) ||
 600	    (hw->device_id == IXGB_DEVICE_ID_82597EX_CX4) ||
 601	    (hw->device_id == IXGB_DEVICE_ID_82597EX_LR) ||
 602	    (hw->device_id == IXGB_DEVICE_ID_82597EX_SR))
 603		hw->mac_type = ixgb_82597;
 604	else {
 605		/* should never have loaded on this device */
 606		netif_err(adapter, probe, adapter->netdev, "unsupported device id\n");
 607	}
 608
 609	/* enable flow control to be programmed */
 610	hw->fc.send_xon = 1;
 611
 612	set_bit(__IXGB_DOWN, &adapter->flags);
 613	return 0;
 614}
 615
 616/**
 617 * ixgb_open - Called when a network interface is made active
 618 * @netdev: network interface device structure
 619 *
 620 * Returns 0 on success, negative value on failure
 621 *
 622 * The open entry point is called when a network interface is made
 623 * active by the system (IFF_UP).  At this point all resources needed
 624 * for transmit and receive operations are allocated, the interrupt
 625 * handler is registered with the OS, the watchdog timer is started,
 626 * and the stack is notified that the interface is ready.
 627 **/
 628
 629static int
 630ixgb_open(struct net_device *netdev)
 631{
 632	struct ixgb_adapter *adapter = netdev_priv(netdev);
 633	int err;
 634
 635	/* allocate transmit descriptors */
 636	err = ixgb_setup_tx_resources(adapter);
 637	if (err)
 638		goto err_setup_tx;
 639
 640	netif_carrier_off(netdev);
 641
 642	/* allocate receive descriptors */
 643
 644	err = ixgb_setup_rx_resources(adapter);
 645	if (err)
 646		goto err_setup_rx;
 647
 648	err = ixgb_up(adapter);
 649	if (err)
 650		goto err_up;
 651
 652	netif_start_queue(netdev);
 653
 654	return 0;
 655
 656err_up:
 657	ixgb_free_rx_resources(adapter);
 658err_setup_rx:
 659	ixgb_free_tx_resources(adapter);
 660err_setup_tx:
 661	ixgb_reset(adapter);
 662
 663	return err;
 664}
 665
 666/**
 667 * ixgb_close - Disables a network interface
 668 * @netdev: network interface device structure
 669 *
 670 * Returns 0, this is not allowed to fail
 671 *
 672 * The close entry point is called when an interface is de-activated
 673 * by the OS.  The hardware is still under the drivers control, but
 674 * needs to be disabled.  A global MAC reset is issued to stop the
 675 * hardware, and all transmit and receive resources are freed.
 676 **/
 677
 678static int
 679ixgb_close(struct net_device *netdev)
 680{
 681	struct ixgb_adapter *adapter = netdev_priv(netdev);
 682
 683	ixgb_down(adapter, true);
 684
 685	ixgb_free_tx_resources(adapter);
 686	ixgb_free_rx_resources(adapter);
 687
 688	return 0;
 689}
 690
 691/**
 692 * ixgb_setup_tx_resources - allocate Tx resources (Descriptors)
 693 * @adapter: board private structure
 694 *
 695 * Return 0 on success, negative on failure
 696 **/
 697
 698int
 699ixgb_setup_tx_resources(struct ixgb_adapter *adapter)
 700{
 701	struct ixgb_desc_ring *txdr = &adapter->tx_ring;
 702	struct pci_dev *pdev = adapter->pdev;
 703	int size;
 704
 705	size = sizeof(struct ixgb_buffer) * txdr->count;
 706	txdr->buffer_info = vzalloc(size);
 707	if (!txdr->buffer_info)
 708		return -ENOMEM;
 709
 710	/* round up to nearest 4K */
 711
 712	txdr->size = txdr->count * sizeof(struct ixgb_tx_desc);
 713	txdr->size = ALIGN(txdr->size, 4096);
 714
 715	txdr->desc = dma_zalloc_coherent(&pdev->dev, txdr->size, &txdr->dma,
 716					 GFP_KERNEL);
 717	if (!txdr->desc) {
 718		vfree(txdr->buffer_info);
 719		return -ENOMEM;
 720	}
 721
 722	txdr->next_to_use = 0;
 723	txdr->next_to_clean = 0;
 724
 725	return 0;
 726}
 727
 728/**
 729 * ixgb_configure_tx - Configure 82597 Transmit Unit after Reset.
 730 * @adapter: board private structure
 731 *
 732 * Configure the Tx unit of the MAC after a reset.
 733 **/
 734
 735static void
 736ixgb_configure_tx(struct ixgb_adapter *adapter)
 737{
 738	u64 tdba = adapter->tx_ring.dma;
 739	u32 tdlen = adapter->tx_ring.count * sizeof(struct ixgb_tx_desc);
 740	u32 tctl;
 741	struct ixgb_hw *hw = &adapter->hw;
 742
 743	/* Setup the Base and Length of the Tx Descriptor Ring
 744	 * tx_ring.dma can be either a 32 or 64 bit value
 745	 */
 746
 747	IXGB_WRITE_REG(hw, TDBAL, (tdba & 0x00000000ffffffffULL));
 748	IXGB_WRITE_REG(hw, TDBAH, (tdba >> 32));
 749
 750	IXGB_WRITE_REG(hw, TDLEN, tdlen);
 751
 752	/* Setup the HW Tx Head and Tail descriptor pointers */
 753
 754	IXGB_WRITE_REG(hw, TDH, 0);
 755	IXGB_WRITE_REG(hw, TDT, 0);
 756
 757	/* don't set up txdctl, it induces performance problems if configured
 758	 * incorrectly */
 759	/* Set the Tx Interrupt Delay register */
 760
 761	IXGB_WRITE_REG(hw, TIDV, adapter->tx_int_delay);
 762
 763	/* Program the Transmit Control Register */
 764
 765	tctl = IXGB_TCTL_TCE | IXGB_TCTL_TXEN | IXGB_TCTL_TPDE;
 766	IXGB_WRITE_REG(hw, TCTL, tctl);
 767
 768	/* Setup Transmit Descriptor Settings for this adapter */
 769	adapter->tx_cmd_type =
 770		IXGB_TX_DESC_TYPE |
 771		(adapter->tx_int_delay_enable ? IXGB_TX_DESC_CMD_IDE : 0);
 772}
 773
 774/**
 775 * ixgb_setup_rx_resources - allocate Rx resources (Descriptors)
 776 * @adapter: board private structure
 777 *
 778 * Returns 0 on success, negative on failure
 779 **/
 780
 781int
 782ixgb_setup_rx_resources(struct ixgb_adapter *adapter)
 783{
 784	struct ixgb_desc_ring *rxdr = &adapter->rx_ring;
 785	struct pci_dev *pdev = adapter->pdev;
 786	int size;
 787
 788	size = sizeof(struct ixgb_buffer) * rxdr->count;
 789	rxdr->buffer_info = vzalloc(size);
 790	if (!rxdr->buffer_info)
 791		return -ENOMEM;
 792
 793	/* Round up to nearest 4K */
 794
 795	rxdr->size = rxdr->count * sizeof(struct ixgb_rx_desc);
 796	rxdr->size = ALIGN(rxdr->size, 4096);
 797
 798	rxdr->desc = dma_alloc_coherent(&pdev->dev, rxdr->size, &rxdr->dma,
 799					GFP_KERNEL);
 800
 801	if (!rxdr->desc) {
 802		vfree(rxdr->buffer_info);
 803		return -ENOMEM;
 804	}
 805	memset(rxdr->desc, 0, rxdr->size);
 806
 807	rxdr->next_to_clean = 0;
 808	rxdr->next_to_use = 0;
 809
 810	return 0;
 811}
 812
 813/**
 814 * ixgb_setup_rctl - configure the receive control register
 815 * @adapter: Board private structure
 816 **/
 817
 818static void
 819ixgb_setup_rctl(struct ixgb_adapter *adapter)
 820{
 821	u32 rctl;
 822
 823	rctl = IXGB_READ_REG(&adapter->hw, RCTL);
 824
 825	rctl &= ~(3 << IXGB_RCTL_MO_SHIFT);
 826
 827	rctl |=
 828		IXGB_RCTL_BAM | IXGB_RCTL_RDMTS_1_2 |
 829		IXGB_RCTL_RXEN | IXGB_RCTL_CFF |
 830		(adapter->hw.mc_filter_type << IXGB_RCTL_MO_SHIFT);
 831
 832	rctl |= IXGB_RCTL_SECRC;
 833
 834	if (adapter->rx_buffer_len <= IXGB_RXBUFFER_2048)
 835		rctl |= IXGB_RCTL_BSIZE_2048;
 836	else if (adapter->rx_buffer_len <= IXGB_RXBUFFER_4096)
 837		rctl |= IXGB_RCTL_BSIZE_4096;
 838	else if (adapter->rx_buffer_len <= IXGB_RXBUFFER_8192)
 839		rctl |= IXGB_RCTL_BSIZE_8192;
 840	else if (adapter->rx_buffer_len <= IXGB_RXBUFFER_16384)
 841		rctl |= IXGB_RCTL_BSIZE_16384;
 842
 843	IXGB_WRITE_REG(&adapter->hw, RCTL, rctl);
 844}
 845
 846/**
 847 * ixgb_configure_rx - Configure 82597 Receive Unit after Reset.
 848 * @adapter: board private structure
 849 *
 850 * Configure the Rx unit of the MAC after a reset.
 851 **/
 852
 853static void
 854ixgb_configure_rx(struct ixgb_adapter *adapter)
 855{
 856	u64 rdba = adapter->rx_ring.dma;
 857	u32 rdlen = adapter->rx_ring.count * sizeof(struct ixgb_rx_desc);
 858	struct ixgb_hw *hw = &adapter->hw;
 859	u32 rctl;
 860	u32 rxcsum;
 861
 862	/* make sure receives are disabled while setting up the descriptors */
 863
 864	rctl = IXGB_READ_REG(hw, RCTL);
 865	IXGB_WRITE_REG(hw, RCTL, rctl & ~IXGB_RCTL_RXEN);
 866
 867	/* set the Receive Delay Timer Register */
 868
 869	IXGB_WRITE_REG(hw, RDTR, adapter->rx_int_delay);
 870
 871	/* Setup the Base and Length of the Rx Descriptor Ring */
 872
 873	IXGB_WRITE_REG(hw, RDBAL, (rdba & 0x00000000ffffffffULL));
 874	IXGB_WRITE_REG(hw, RDBAH, (rdba >> 32));
 875
 876	IXGB_WRITE_REG(hw, RDLEN, rdlen);
 877
 878	/* Setup the HW Rx Head and Tail Descriptor Pointers */
 879	IXGB_WRITE_REG(hw, RDH, 0);
 880	IXGB_WRITE_REG(hw, RDT, 0);
 881
 882	/* due to the hardware errata with RXDCTL, we are unable to use any of
 883	 * the performance enhancing features of it without causing other
 884	 * subtle bugs, some of the bugs could include receive length
 885	 * corruption at high data rates (WTHRESH > 0) and/or receive
 886	 * descriptor ring irregularites (particularly in hardware cache) */
 887	IXGB_WRITE_REG(hw, RXDCTL, 0);
 888
 889	/* Enable Receive Checksum Offload for TCP and UDP */
 890	if (adapter->rx_csum) {
 891		rxcsum = IXGB_READ_REG(hw, RXCSUM);
 892		rxcsum |= IXGB_RXCSUM_TUOFL;
 893		IXGB_WRITE_REG(hw, RXCSUM, rxcsum);
 894	}
 895
 896	/* Enable Receives */
 897
 898	IXGB_WRITE_REG(hw, RCTL, rctl);
 899}
 900
 901/**
 902 * ixgb_free_tx_resources - Free Tx Resources
 903 * @adapter: board private structure
 904 *
 905 * Free all transmit software resources
 906 **/
 907
 908void
 909ixgb_free_tx_resources(struct ixgb_adapter *adapter)
 910{
 911	struct pci_dev *pdev = adapter->pdev;
 912
 913	ixgb_clean_tx_ring(adapter);
 914
 915	vfree(adapter->tx_ring.buffer_info);
 916	adapter->tx_ring.buffer_info = NULL;
 917
 918	dma_free_coherent(&pdev->dev, adapter->tx_ring.size,
 919			  adapter->tx_ring.desc, adapter->tx_ring.dma);
 920
 921	adapter->tx_ring.desc = NULL;
 922}
 923
 924static void
 925ixgb_unmap_and_free_tx_resource(struct ixgb_adapter *adapter,
 926                                struct ixgb_buffer *buffer_info)
 927{
 928	if (buffer_info->dma) {
 929		if (buffer_info->mapped_as_page)
 930			dma_unmap_page(&adapter->pdev->dev, buffer_info->dma,
 931				       buffer_info->length, DMA_TO_DEVICE);
 932		else
 933			dma_unmap_single(&adapter->pdev->dev, buffer_info->dma,
 934					 buffer_info->length, DMA_TO_DEVICE);
 935		buffer_info->dma = 0;
 936	}
 937
 938	if (buffer_info->skb) {
 939		dev_kfree_skb_any(buffer_info->skb);
 940		buffer_info->skb = NULL;
 941	}
 942	buffer_info->time_stamp = 0;
 943	/* these fields must always be initialized in tx
 944	 * buffer_info->length = 0;
 945	 * buffer_info->next_to_watch = 0; */
 946}
 947
 948/**
 949 * ixgb_clean_tx_ring - Free Tx Buffers
 950 * @adapter: board private structure
 951 **/
 952
 953static void
 954ixgb_clean_tx_ring(struct ixgb_adapter *adapter)
 955{
 956	struct ixgb_desc_ring *tx_ring = &adapter->tx_ring;
 957	struct ixgb_buffer *buffer_info;
 958	unsigned long size;
 959	unsigned int i;
 960
 961	/* Free all the Tx ring sk_buffs */
 962
 963	for (i = 0; i < tx_ring->count; i++) {
 964		buffer_info = &tx_ring->buffer_info[i];
 965		ixgb_unmap_and_free_tx_resource(adapter, buffer_info);
 966	}
 967
 968	size = sizeof(struct ixgb_buffer) * tx_ring->count;
 969	memset(tx_ring->buffer_info, 0, size);
 970
 971	/* Zero out the descriptor ring */
 972
 973	memset(tx_ring->desc, 0, tx_ring->size);
 974
 975	tx_ring->next_to_use = 0;
 976	tx_ring->next_to_clean = 0;
 977
 978	IXGB_WRITE_REG(&adapter->hw, TDH, 0);
 979	IXGB_WRITE_REG(&adapter->hw, TDT, 0);
 980}
 981
 982/**
 983 * ixgb_free_rx_resources - Free Rx Resources
 984 * @adapter: board private structure
 985 *
 986 * Free all receive software resources
 987 **/
 988
 989void
 990ixgb_free_rx_resources(struct ixgb_adapter *adapter)
 991{
 992	struct ixgb_desc_ring *rx_ring = &adapter->rx_ring;
 993	struct pci_dev *pdev = adapter->pdev;
 994
 995	ixgb_clean_rx_ring(adapter);
 996
 997	vfree(rx_ring->buffer_info);
 998	rx_ring->buffer_info = NULL;
 999
1000	dma_free_coherent(&pdev->dev, rx_ring->size, rx_ring->desc,
1001			  rx_ring->dma);
1002
1003	rx_ring->desc = NULL;
1004}
1005
1006/**
1007 * ixgb_clean_rx_ring - Free Rx Buffers
1008 * @adapter: board private structure
1009 **/
1010
1011static void
1012ixgb_clean_rx_ring(struct ixgb_adapter *adapter)
1013{
1014	struct ixgb_desc_ring *rx_ring = &adapter->rx_ring;
1015	struct ixgb_buffer *buffer_info;
1016	struct pci_dev *pdev = adapter->pdev;
1017	unsigned long size;
1018	unsigned int i;
1019
1020	/* Free all the Rx ring sk_buffs */
1021
1022	for (i = 0; i < rx_ring->count; i++) {
1023		buffer_info = &rx_ring->buffer_info[i];
1024		if (buffer_info->dma) {
1025			dma_unmap_single(&pdev->dev,
1026					 buffer_info->dma,
1027					 buffer_info->length,
1028					 DMA_FROM_DEVICE);
1029			buffer_info->dma = 0;
1030			buffer_info->length = 0;
1031		}
1032
1033		if (buffer_info->skb) {
1034			dev_kfree_skb(buffer_info->skb);
1035			buffer_info->skb = NULL;
1036		}
1037	}
1038
1039	size = sizeof(struct ixgb_buffer) * rx_ring->count;
1040	memset(rx_ring->buffer_info, 0, size);
1041
1042	/* Zero out the descriptor ring */
1043
1044	memset(rx_ring->desc, 0, rx_ring->size);
1045
1046	rx_ring->next_to_clean = 0;
1047	rx_ring->next_to_use = 0;
1048
1049	IXGB_WRITE_REG(&adapter->hw, RDH, 0);
1050	IXGB_WRITE_REG(&adapter->hw, RDT, 0);
1051}
1052
1053/**
1054 * ixgb_set_mac - Change the Ethernet Address of the NIC
1055 * @netdev: network interface device structure
1056 * @p: pointer to an address structure
1057 *
1058 * Returns 0 on success, negative on failure
1059 **/
1060
1061static int
1062ixgb_set_mac(struct net_device *netdev, void *p)
1063{
1064	struct ixgb_adapter *adapter = netdev_priv(netdev);
1065	struct sockaddr *addr = p;
1066
1067	if (!is_valid_ether_addr(addr->sa_data))
1068		return -EADDRNOTAVAIL;
1069
1070	memcpy(netdev->dev_addr, addr->sa_data, netdev->addr_len);
1071
1072	ixgb_rar_set(&adapter->hw, addr->sa_data, 0);
1073
1074	return 0;
1075}
1076
1077/**
1078 * ixgb_set_multi - Multicast and Promiscuous mode set
1079 * @netdev: network interface device structure
1080 *
1081 * The set_multi entry point is called whenever the multicast address
1082 * list or the network interface flags are updated.  This routine is
1083 * responsible for configuring the hardware for proper multicast,
1084 * promiscuous mode, and all-multi behavior.
1085 **/
1086
1087static void
1088ixgb_set_multi(struct net_device *netdev)
1089{
1090	struct ixgb_adapter *adapter = netdev_priv(netdev);
1091	struct ixgb_hw *hw = &adapter->hw;
1092	struct netdev_hw_addr *ha;
1093	u32 rctl;
1094
1095	/* Check for Promiscuous and All Multicast modes */
1096
1097	rctl = IXGB_READ_REG(hw, RCTL);
1098
1099	if (netdev->flags & IFF_PROMISC) {
1100		rctl |= (IXGB_RCTL_UPE | IXGB_RCTL_MPE);
1101		/* disable VLAN filtering */
1102		rctl &= ~IXGB_RCTL_CFIEN;
1103		rctl &= ~IXGB_RCTL_VFE;
1104	} else {
1105		if (netdev->flags & IFF_ALLMULTI) {
1106			rctl |= IXGB_RCTL_MPE;
1107			rctl &= ~IXGB_RCTL_UPE;
1108		} else {
1109			rctl &= ~(IXGB_RCTL_UPE | IXGB_RCTL_MPE);
1110		}
1111		/* enable VLAN filtering */
1112		rctl |= IXGB_RCTL_VFE;
1113		rctl &= ~IXGB_RCTL_CFIEN;
1114	}
1115
1116	if (netdev_mc_count(netdev) > IXGB_MAX_NUM_MULTICAST_ADDRESSES) {
1117		rctl |= IXGB_RCTL_MPE;
1118		IXGB_WRITE_REG(hw, RCTL, rctl);
1119	} else {
1120		u8 *mta = kmalloc(IXGB_MAX_NUM_MULTICAST_ADDRESSES *
1121			      ETH_ALEN, GFP_ATOMIC);
1122		u8 *addr;
1123		if (!mta)
1124			goto alloc_failed;
1125
1126		IXGB_WRITE_REG(hw, RCTL, rctl);
1127
1128		addr = mta;
1129		netdev_for_each_mc_addr(ha, netdev) {
1130			memcpy(addr, ha->addr, ETH_ALEN);
1131			addr += ETH_ALEN;
1132		}
1133
1134		ixgb_mc_addr_list_update(hw, mta, netdev_mc_count(netdev), 0);
1135		kfree(mta);
1136	}
1137
1138alloc_failed:
1139	if (netdev->features & NETIF_F_HW_VLAN_CTAG_RX)
1140		ixgb_vlan_strip_enable(adapter);
1141	else
1142		ixgb_vlan_strip_disable(adapter);
1143
1144}
1145
1146/**
1147 * ixgb_watchdog - Timer Call-back
1148 * @data: pointer to netdev cast into an unsigned long
1149 **/
1150
1151static void
1152ixgb_watchdog(unsigned long data)
1153{
1154	struct ixgb_adapter *adapter = (struct ixgb_adapter *)data;
1155	struct net_device *netdev = adapter->netdev;
1156	struct ixgb_desc_ring *txdr = &adapter->tx_ring;
1157
1158	ixgb_check_for_link(&adapter->hw);
1159
1160	if (ixgb_check_for_bad_link(&adapter->hw)) {
1161		/* force the reset path */
1162		netif_stop_queue(netdev);
1163	}
1164
1165	if (adapter->hw.link_up) {
1166		if (!netif_carrier_ok(netdev)) {
1167			netdev_info(netdev,
1168				    "NIC Link is Up 10 Gbps Full Duplex, Flow Control: %s\n",
1169				    (adapter->hw.fc.type == ixgb_fc_full) ?
1170				    "RX/TX" :
1171				    (adapter->hw.fc.type == ixgb_fc_rx_pause) ?
1172				     "RX" :
1173				    (adapter->hw.fc.type == ixgb_fc_tx_pause) ?
1174				    "TX" : "None");
1175			adapter->link_speed = 10000;
1176			adapter->link_duplex = FULL_DUPLEX;
1177			netif_carrier_on(netdev);
1178		}
1179	} else {
1180		if (netif_carrier_ok(netdev)) {
1181			adapter->link_speed = 0;
1182			adapter->link_duplex = 0;
1183			netdev_info(netdev, "NIC Link is Down\n");
1184			netif_carrier_off(netdev);
1185		}
1186	}
1187
1188	ixgb_update_stats(adapter);
1189
1190	if (!netif_carrier_ok(netdev)) {
1191		if (IXGB_DESC_UNUSED(txdr) + 1 < txdr->count) {
1192			/* We've lost link, so the controller stops DMA,
1193			 * but we've got queued Tx work that's never going
1194			 * to get done, so reset controller to flush Tx.
1195			 * (Do the reset outside of interrupt context). */
1196			schedule_work(&adapter->tx_timeout_task);
1197			/* return immediately since reset is imminent */
1198			return;
1199		}
1200	}
1201
1202	/* Force detection of hung controller every watchdog period */
1203	adapter->detect_tx_hung = true;
1204
1205	/* generate an interrupt to force clean up of any stragglers */
1206	IXGB_WRITE_REG(&adapter->hw, ICS, IXGB_INT_TXDW);
1207
1208	/* Reset the timer */
1209	mod_timer(&adapter->watchdog_timer, jiffies + 2 * HZ);
1210}
1211
1212#define IXGB_TX_FLAGS_CSUM		0x00000001
1213#define IXGB_TX_FLAGS_VLAN		0x00000002
1214#define IXGB_TX_FLAGS_TSO		0x00000004
1215
1216static int
1217ixgb_tso(struct ixgb_adapter *adapter, struct sk_buff *skb)
1218{
1219	struct ixgb_context_desc *context_desc;
1220	unsigned int i;
1221	u8 ipcss, ipcso, tucss, tucso, hdr_len;
1222	u16 ipcse, tucse, mss;
1223
1224	if (likely(skb_is_gso(skb))) {
1225		struct ixgb_buffer *buffer_info;
1226		struct iphdr *iph;
1227		int err;
1228
1229		err = skb_cow_head(skb, 0);
1230		if (err < 0)
1231			return err;
1232
1233		hdr_len = skb_transport_offset(skb) + tcp_hdrlen(skb);
1234		mss = skb_shinfo(skb)->gso_size;
1235		iph = ip_hdr(skb);
1236		iph->tot_len = 0;
1237		iph->check = 0;
1238		tcp_hdr(skb)->check = ~csum_tcpudp_magic(iph->saddr,
1239							 iph->daddr, 0,
1240							 IPPROTO_TCP, 0);
1241		ipcss = skb_network_offset(skb);
1242		ipcso = (void *)&(iph->check) - (void *)skb->data;
1243		ipcse = skb_transport_offset(skb) - 1;
1244		tucss = skb_transport_offset(skb);
1245		tucso = (void *)&(tcp_hdr(skb)->check) - (void *)skb->data;
1246		tucse = 0;
1247
1248		i = adapter->tx_ring.next_to_use;
1249		context_desc = IXGB_CONTEXT_DESC(adapter->tx_ring, i);
1250		buffer_info = &adapter->tx_ring.buffer_info[i];
1251		WARN_ON(buffer_info->dma != 0);
1252
1253		context_desc->ipcss = ipcss;
1254		context_desc->ipcso = ipcso;
1255		context_desc->ipcse = cpu_to_le16(ipcse);
1256		context_desc->tucss = tucss;
1257		context_desc->tucso = tucso;
1258		context_desc->tucse = cpu_to_le16(tucse);
1259		context_desc->mss = cpu_to_le16(mss);
1260		context_desc->hdr_len = hdr_len;
1261		context_desc->status = 0;
1262		context_desc->cmd_type_len = cpu_to_le32(
1263						  IXGB_CONTEXT_DESC_TYPE
1264						| IXGB_CONTEXT_DESC_CMD_TSE
1265						| IXGB_CONTEXT_DESC_CMD_IP
1266						| IXGB_CONTEXT_DESC_CMD_TCP
1267						| IXGB_CONTEXT_DESC_CMD_IDE
1268						| (skb->len - (hdr_len)));
1269
1270
1271		if (++i == adapter->tx_ring.count) i = 0;
1272		adapter->tx_ring.next_to_use = i;
1273
1274		return 1;
1275	}
1276
1277	return 0;
1278}
1279
1280static bool
1281ixgb_tx_csum(struct ixgb_adapter *adapter, struct sk_buff *skb)
1282{
1283	struct ixgb_context_desc *context_desc;
1284	unsigned int i;
1285	u8 css, cso;
1286
1287	if (likely(skb->ip_summed == CHECKSUM_PARTIAL)) {
1288		struct ixgb_buffer *buffer_info;
1289		css = skb_checksum_start_offset(skb);
1290		cso = css + skb->csum_offset;
1291
1292		i = adapter->tx_ring.next_to_use;
1293		context_desc = IXGB_CONTEXT_DESC(adapter->tx_ring, i);
1294		buffer_info = &adapter->tx_ring.buffer_info[i];
1295		WARN_ON(buffer_info->dma != 0);
1296
1297		context_desc->tucss = css;
1298		context_desc->tucso = cso;
1299		context_desc->tucse = 0;
1300		/* zero out any previously existing data in one instruction */
1301		*(u32 *)&(context_desc->ipcss) = 0;
1302		context_desc->status = 0;
1303		context_desc->hdr_len = 0;
1304		context_desc->mss = 0;
1305		context_desc->cmd_type_len =
1306			cpu_to_le32(IXGB_CONTEXT_DESC_TYPE
1307				    | IXGB_TX_DESC_CMD_IDE);
1308
1309		if (++i == adapter->tx_ring.count) i = 0;
1310		adapter->tx_ring.next_to_use = i;
1311
1312		return true;
1313	}
1314
1315	return false;
1316}
1317
1318#define IXGB_MAX_TXD_PWR	14
1319#define IXGB_MAX_DATA_PER_TXD	(1<<IXGB_MAX_TXD_PWR)
1320
1321static int
1322ixgb_tx_map(struct ixgb_adapter *adapter, struct sk_buff *skb,
1323	    unsigned int first)
1324{
1325	struct ixgb_desc_ring *tx_ring = &adapter->tx_ring;
1326	struct pci_dev *pdev = adapter->pdev;
1327	struct ixgb_buffer *buffer_info;
1328	int len = skb_headlen(skb);
1329	unsigned int offset = 0, size, count = 0, i;
1330	unsigned int mss = skb_shinfo(skb)->gso_size;
1331	unsigned int nr_frags = skb_shinfo(skb)->nr_frags;
1332	unsigned int f;
1333
1334	i = tx_ring->next_to_use;
1335
1336	while (len) {
1337		buffer_info = &tx_ring->buffer_info[i];
1338		size = min(len, IXGB_MAX_DATA_PER_TXD);
1339		/* Workaround for premature desc write-backs
1340		 * in TSO mode.  Append 4-byte sentinel desc */
1341		if (unlikely(mss && !nr_frags && size == len && size > 8))
1342			size -= 4;
1343
1344		buffer_info->length = size;
1345		WARN_ON(buffer_info->dma != 0);
1346		buffer_info->time_stamp = jiffies;
1347		buffer_info->mapped_as_page = false;
1348		buffer_info->dma = dma_map_single(&pdev->dev,
1349						  skb->data + offset,
1350						  size, DMA_TO_DEVICE);
1351		if (dma_mapping_error(&pdev->dev, buffer_info->dma))
1352			goto dma_error;
1353		buffer_info->next_to_watch = 0;
1354
1355		len -= size;
1356		offset += size;
1357		count++;
1358		if (len) {
1359			i++;
1360			if (i == tx_ring->count)
1361				i = 0;
1362		}
1363	}
1364
1365	for (f = 0; f < nr_frags; f++) {
1366		const struct skb_frag_struct *frag;
1367
1368		frag = &skb_shinfo(skb)->frags[f];
1369		len = skb_frag_size(frag);
1370		offset = 0;
1371
1372		while (len) {
1373			i++;
1374			if (i == tx_ring->count)
1375				i = 0;
1376
1377			buffer_info = &tx_ring->buffer_info[i];
1378			size = min(len, IXGB_MAX_DATA_PER_TXD);
1379
1380			/* Workaround for premature desc write-backs
1381			 * in TSO mode.  Append 4-byte sentinel desc */
1382			if (unlikely(mss && (f == (nr_frags - 1))
1383				     && size == len && size > 8))
1384				size -= 4;
1385
1386			buffer_info->length = size;
1387			buffer_info->time_stamp = jiffies;
1388			buffer_info->mapped_as_page = true;
1389			buffer_info->dma =
1390				skb_frag_dma_map(&pdev->dev, frag, offset, size,
1391						 DMA_TO_DEVICE);
1392			if (dma_mapping_error(&pdev->dev, buffer_info->dma))
1393				goto dma_error;
1394			buffer_info->next_to_watch = 0;
1395
1396			len -= size;
1397			offset += size;
1398			count++;
1399		}
1400	}
1401	tx_ring->buffer_info[i].skb = skb;
1402	tx_ring->buffer_info[first].next_to_watch = i;
1403
1404	return count;
1405
1406dma_error:
1407	dev_err(&pdev->dev, "TX DMA map failed\n");
1408	buffer_info->dma = 0;
1409	if (count)
1410		count--;
1411
1412	while (count--) {
1413		if (i==0)
1414			i += tx_ring->count;
1415		i--;
1416		buffer_info = &tx_ring->buffer_info[i];
1417		ixgb_unmap_and_free_tx_resource(adapter, buffer_info);
1418	}
1419
1420	return 0;
1421}
1422
1423static void
1424ixgb_tx_queue(struct ixgb_adapter *adapter, int count, int vlan_id,int tx_flags)
1425{
1426	struct ixgb_desc_ring *tx_ring = &adapter->tx_ring;
1427	struct ixgb_tx_desc *tx_desc = NULL;
1428	struct ixgb_buffer *buffer_info;
1429	u32 cmd_type_len = adapter->tx_cmd_type;
1430	u8 status = 0;
1431	u8 popts = 0;
1432	unsigned int i;
1433
1434	if (tx_flags & IXGB_TX_FLAGS_TSO) {
1435		cmd_type_len |= IXGB_TX_DESC_CMD_TSE;
1436		popts |= (IXGB_TX_DESC_POPTS_IXSM | IXGB_TX_DESC_POPTS_TXSM);
1437	}
1438
1439	if (tx_flags & IXGB_TX_FLAGS_CSUM)
1440		popts |= IXGB_TX_DESC_POPTS_TXSM;
1441
1442	if (tx_flags & IXGB_TX_FLAGS_VLAN)
1443		cmd_type_len |= IXGB_TX_DESC_CMD_VLE;
1444
1445	i = tx_ring->next_to_use;
1446
1447	while (count--) {
1448		buffer_info = &tx_ring->buffer_info[i];
1449		tx_desc = IXGB_TX_DESC(*tx_ring, i);
1450		tx_desc->buff_addr = cpu_to_le64(buffer_info->dma);
1451		tx_desc->cmd_type_len =
1452			cpu_to_le32(cmd_type_len | buffer_info->length);
1453		tx_desc->status = status;
1454		tx_desc->popts = popts;
1455		tx_desc->vlan = cpu_to_le16(vlan_id);
1456
1457		if (++i == tx_ring->count) i = 0;
1458	}
1459
1460	tx_desc->cmd_type_len |=
1461		cpu_to_le32(IXGB_TX_DESC_CMD_EOP | IXGB_TX_DESC_CMD_RS);
1462
1463	/* Force memory writes to complete before letting h/w
1464	 * know there are new descriptors to fetch.  (Only
1465	 * applicable for weak-ordered memory model archs,
1466	 * such as IA-64). */
1467	wmb();
1468
1469	tx_ring->next_to_use = i;
1470	IXGB_WRITE_REG(&adapter->hw, TDT, i);
1471}
1472
1473static int __ixgb_maybe_stop_tx(struct net_device *netdev, int size)
1474{
1475	struct ixgb_adapter *adapter = netdev_priv(netdev);
1476	struct ixgb_desc_ring *tx_ring = &adapter->tx_ring;
1477
1478	netif_stop_queue(netdev);
1479	/* Herbert's original patch had:
1480	 *  smp_mb__after_netif_stop_queue();
1481	 * but since that doesn't exist yet, just open code it. */
1482	smp_mb();
1483
1484	/* We need to check again in a case another CPU has just
1485	 * made room available. */
1486	if (likely(IXGB_DESC_UNUSED(tx_ring) < size))
1487		return -EBUSY;
1488
1489	/* A reprieve! */
1490	netif_start_queue(netdev);
1491	++adapter->restart_queue;
1492	return 0;
1493}
1494
1495static int ixgb_maybe_stop_tx(struct net_device *netdev,
1496                              struct ixgb_desc_ring *tx_ring, int size)
1497{
1498	if (likely(IXGB_DESC_UNUSED(tx_ring) >= size))
1499		return 0;
1500	return __ixgb_maybe_stop_tx(netdev, size);
1501}
1502
1503
1504/* Tx Descriptors needed, worst case */
1505#define TXD_USE_COUNT(S) (((S) >> IXGB_MAX_TXD_PWR) + \
1506			 (((S) & (IXGB_MAX_DATA_PER_TXD - 1)) ? 1 : 0))
1507#define DESC_NEEDED TXD_USE_COUNT(IXGB_MAX_DATA_PER_TXD) /* skb->date */ + \
1508	MAX_SKB_FRAGS * TXD_USE_COUNT(PAGE_SIZE) + 1 /* for context */ \
1509	+ 1 /* one more needed for sentinel TSO workaround */
1510
1511static netdev_tx_t
1512ixgb_xmit_frame(struct sk_buff *skb, struct net_device *netdev)
1513{
1514	struct ixgb_adapter *adapter = netdev_priv(netdev);
1515	unsigned int first;
1516	unsigned int tx_flags = 0;
1517	int vlan_id = 0;
1518	int count = 0;
1519	int tso;
1520
1521	if (test_bit(__IXGB_DOWN, &adapter->flags)) {
1522		dev_kfree_skb_any(skb);
1523		return NETDEV_TX_OK;
1524	}
1525
1526	if (skb->len <= 0) {
1527		dev_kfree_skb_any(skb);
1528		return NETDEV_TX_OK;
1529	}
1530
1531	if (unlikely(ixgb_maybe_stop_tx(netdev, &adapter->tx_ring,
1532                     DESC_NEEDED)))
1533		return NETDEV_TX_BUSY;
1534
1535	if (vlan_tx_tag_present(skb)) {
1536		tx_flags |= IXGB_TX_FLAGS_VLAN;
1537		vlan_id = vlan_tx_tag_get(skb);
1538	}
1539
1540	first = adapter->tx_ring.next_to_use;
1541
1542	tso = ixgb_tso(adapter, skb);
1543	if (tso < 0) {
1544		dev_kfree_skb_any(skb);
1545		return NETDEV_TX_OK;
1546	}
1547
1548	if (likely(tso))
1549		tx_flags |= IXGB_TX_FLAGS_TSO;
1550	else if (ixgb_tx_csum(adapter, skb))
1551		tx_flags |= IXGB_TX_FLAGS_CSUM;
1552
1553	count = ixgb_tx_map(adapter, skb, first);
1554
1555	if (count) {
1556		ixgb_tx_queue(adapter, count, vlan_id, tx_flags);
1557		/* Make sure there is space in the ring for the next send. */
1558		ixgb_maybe_stop_tx(netdev, &adapter->tx_ring, DESC_NEEDED);
1559
1560	} else {
1561		dev_kfree_skb_any(skb);
1562		adapter->tx_ring.buffer_info[first].time_stamp = 0;
1563		adapter->tx_ring.next_to_use = first;
1564	}
1565
1566	return NETDEV_TX_OK;
1567}
1568
1569/**
1570 * ixgb_tx_timeout - Respond to a Tx Hang
1571 * @netdev: network interface device structure
1572 **/
1573
1574static void
1575ixgb_tx_timeout(struct net_device *netdev)
1576{
1577	struct ixgb_adapter *adapter = netdev_priv(netdev);
1578
1579	/* Do the reset outside of interrupt context */
1580	schedule_work(&adapter->tx_timeout_task);
1581}
1582
1583static void
1584ixgb_tx_timeout_task(struct work_struct *work)
1585{
1586	struct ixgb_adapter *adapter =
1587		container_of(work, struct ixgb_adapter, tx_timeout_task);
1588
1589	adapter->tx_timeout_count++;
1590	ixgb_down(adapter, true);
1591	ixgb_up(adapter);
1592}
1593
1594/**
1595 * ixgb_get_stats - Get System Network Statistics
1596 * @netdev: network interface device structure
1597 *
1598 * Returns the address of the device statistics structure.
1599 * The statistics are actually updated from the timer callback.
1600 **/
1601
1602static struct net_device_stats *
1603ixgb_get_stats(struct net_device *netdev)
1604{
1605	return &netdev->stats;
1606}
1607
1608/**
1609 * ixgb_change_mtu - Change the Maximum Transfer Unit
1610 * @netdev: network interface device structure
1611 * @new_mtu: new value for maximum frame size
1612 *
1613 * Returns 0 on success, negative on failure
1614 **/
1615
1616static int
1617ixgb_change_mtu(struct net_device *netdev, int new_mtu)
1618{
1619	struct ixgb_adapter *adapter = netdev_priv(netdev);
1620	int max_frame = new_mtu + ENET_HEADER_SIZE + ENET_FCS_LENGTH;
1621	int old_max_frame = netdev->mtu + ENET_HEADER_SIZE + ENET_FCS_LENGTH;
1622
1623	/* MTU < 68 is an error for IPv4 traffic, just don't allow it */
1624	if ((new_mtu < 68) ||
1625	    (max_frame > IXGB_MAX_JUMBO_FRAME_SIZE + ENET_FCS_LENGTH)) {
1626		netif_err(adapter, probe, adapter->netdev,
1627			  "Invalid MTU setting %d\n", new_mtu);
1628		return -EINVAL;
1629	}
1630
1631	if (old_max_frame == max_frame)
1632		return 0;
1633
1634	if (netif_running(netdev))
1635		ixgb_down(adapter, true);
1636
1637	adapter->rx_buffer_len = max_frame + 8; /* + 8 for errata */
1638
1639	netdev->mtu = new_mtu;
1640
1641	if (netif_running(netdev))
1642		ixgb_up(adapter);
1643
1644	return 0;
1645}
1646
1647/**
1648 * ixgb_update_stats - Update the board statistics counters.
1649 * @adapter: board private structure
1650 **/
1651
1652void
1653ixgb_update_stats(struct ixgb_adapter *adapter)
1654{
1655	struct net_device *netdev = adapter->netdev;
1656	struct pci_dev *pdev = adapter->pdev;
1657
1658	/* Prevent stats update while adapter is being reset */
1659	if (pci_channel_offline(pdev))
1660		return;
1661
1662	if ((netdev->flags & IFF_PROMISC) || (netdev->flags & IFF_ALLMULTI) ||
1663	   (netdev_mc_count(netdev) > IXGB_MAX_NUM_MULTICAST_ADDRESSES)) {
1664		u64 multi = IXGB_READ_REG(&adapter->hw, MPRCL);
1665		u32 bcast_l = IXGB_READ_REG(&adapter->hw, BPRCL);
1666		u32 bcast_h = IXGB_READ_REG(&adapter->hw, BPRCH);
1667		u64 bcast = ((u64)bcast_h << 32) | bcast_l;
1668
1669		multi |= ((u64)IXGB_READ_REG(&adapter->hw, MPRCH) << 32);
1670		/* fix up multicast stats by removing broadcasts */
1671		if (multi >= bcast)
1672			multi -= bcast;
1673
1674		adapter->stats.mprcl += (multi & 0xFFFFFFFF);
1675		adapter->stats.mprch += (multi >> 32);
1676		adapter->stats.bprcl += bcast_l;
1677		adapter->stats.bprch += bcast_h;
1678	} else {
1679		adapter->stats.mprcl += IXGB_READ_REG(&adapter->hw, MPRCL);
1680		adapter->stats.mprch += IXGB_READ_REG(&adapter->hw, MPRCH);
1681		adapter->stats.bprcl += IXGB_READ_REG(&adapter->hw, BPRCL);
1682		adapter->stats.bprch += IXGB_READ_REG(&adapter->hw, BPRCH);
1683	}
1684	adapter->stats.tprl += IXGB_READ_REG(&adapter->hw, TPRL);
1685	adapter->stats.tprh += IXGB_READ_REG(&adapter->hw, TPRH);
1686	adapter->stats.gprcl += IXGB_READ_REG(&adapter->hw, GPRCL);
1687	adapter->stats.gprch += IXGB_READ_REG(&adapter->hw, GPRCH);
1688	adapter->stats.uprcl += IXGB_READ_REG(&adapter->hw, UPRCL);
1689	adapter->stats.uprch += IXGB_READ_REG(&adapter->hw, UPRCH);
1690	adapter->stats.vprcl += IXGB_READ_REG(&adapter->hw, VPRCL);
1691	adapter->stats.vprch += IXGB_READ_REG(&adapter->hw, VPRCH);
1692	adapter->stats.jprcl += IXGB_READ_REG(&adapter->hw, JPRCL);
1693	adapter->stats.jprch += IXGB_READ_REG(&adapter->hw, JPRCH);
1694	adapter->stats.gorcl += IXGB_READ_REG(&adapter->hw, GORCL);
1695	adapter->stats.gorch += IXGB_READ_REG(&adapter->hw, GORCH);
1696	adapter->stats.torl += IXGB_READ_REG(&adapter->hw, TORL);
1697	adapter->stats.torh += IXGB_READ_REG(&adapter->hw, TORH);
1698	adapter->stats.rnbc += IXGB_READ_REG(&adapter->hw, RNBC);
1699	adapter->stats.ruc += IXGB_READ_REG(&adapter->hw, RUC);
1700	adapter->stats.roc += IXGB_READ_REG(&adapter->hw, ROC);
1701	adapter->stats.rlec += IXGB_READ_REG(&adapter->hw, RLEC);
1702	adapter->stats.crcerrs += IXGB_READ_REG(&adapter->hw, CRCERRS);
1703	adapter->stats.icbc += IXGB_READ_REG(&adapter->hw, ICBC);
1704	adapter->stats.ecbc += IXGB_READ_REG(&adapter->hw, ECBC);
1705	adapter->stats.mpc += IXGB_READ_REG(&adapter->hw, MPC);
1706	adapter->stats.tptl += IXGB_READ_REG(&adapter->hw, TPTL);
1707	adapter->stats.tpth += IXGB_READ_REG(&adapter->hw, TPTH);
1708	adapter->stats.gptcl += IXGB_READ_REG(&adapter->hw, GPTCL);
1709	adapter->stats.gptch += IXGB_READ_REG(&adapter->hw, GPTCH);
1710	adapter->stats.bptcl += IXGB_READ_REG(&adapter->hw, BPTCL);
1711	adapter->stats.bptch += IXGB_READ_REG(&adapter->hw, BPTCH);
1712	adapter->stats.mptcl += IXGB_READ_REG(&adapter->hw, MPTCL);
1713	adapter->stats.mptch += IXGB_READ_REG(&adapter->hw, MPTCH);
1714	adapter->stats.uptcl += IXGB_READ_REG(&adapter->hw, UPTCL);
1715	adapter->stats.uptch += IXGB_READ_REG(&adapter->hw, UPTCH);
1716	adapter->stats.vptcl += IXGB_READ_REG(&adapter->hw, VPTCL);
1717	adapter->stats.vptch += IXGB_READ_REG(&adapter->hw, VPTCH);
1718	adapter->stats.jptcl += IXGB_READ_REG(&adapter->hw, JPTCL);
1719	adapter->stats.jptch += IXGB_READ_REG(&adapter->hw, JPTCH);
1720	adapter->stats.gotcl += IXGB_READ_REG(&adapter->hw, GOTCL);
1721	adapter->stats.gotch += IXGB_READ_REG(&adapter->hw, GOTCH);
1722	adapter->stats.totl += IXGB_READ_REG(&adapter->hw, TOTL);
1723	adapter->stats.toth += IXGB_READ_REG(&adapter->hw, TOTH);
1724	adapter->stats.dc += IXGB_READ_REG(&adapter->hw, DC);
1725	adapter->stats.plt64c += IXGB_READ_REG(&adapter->hw, PLT64C);
1726	adapter->stats.tsctc += IXGB_READ_REG(&adapter->hw, TSCTC);
1727	adapter->stats.tsctfc += IXGB_READ_REG(&adapter->hw, TSCTFC);
1728	adapter->stats.ibic += IXGB_READ_REG(&adapter->hw, IBIC);
1729	adapter->stats.rfc += IXGB_READ_REG(&adapter->hw, RFC);
1730	adapter->stats.lfc += IXGB_READ_REG(&adapter->hw, LFC);
1731	adapter->stats.pfrc += IXGB_READ_REG(&adapter->hw, PFRC);
1732	adapter->stats.pftc += IXGB_READ_REG(&adapter->hw, PFTC);
1733	adapter->stats.mcfrc += IXGB_READ_REG(&adapter->hw, MCFRC);
1734	adapter->stats.mcftc += IXGB_READ_REG(&adapter->hw, MCFTC);
1735	adapter->stats.xonrxc += IXGB_READ_REG(&adapter->hw, XONRXC);
1736	adapter->stats.xontxc += IXGB_READ_REG(&adapter->hw, XONTXC);
1737	adapter->stats.xoffrxc += IXGB_READ_REG(&adapter->hw, XOFFRXC);
1738	adapter->stats.xofftxc += IXGB_READ_REG(&adapter->hw, XOFFTXC);
1739	adapter->stats.rjc += IXGB_READ_REG(&adapter->hw, RJC);
1740
1741	/* Fill out the OS statistics structure */
1742
1743	netdev->stats.rx_packets = adapter->stats.gprcl;
1744	netdev->stats.tx_packets = adapter->stats.gptcl;
1745	netdev->stats.rx_bytes = adapter->stats.gorcl;
1746	netdev->stats.tx_bytes = adapter->stats.gotcl;
1747	netdev->stats.multicast = adapter->stats.mprcl;
1748	netdev->stats.collisions = 0;
1749
1750	/* ignore RLEC as it reports errors for padded (<64bytes) frames
1751	 * with a length in the type/len field */
1752	netdev->stats.rx_errors =
1753	    /* adapter->stats.rnbc + */ adapter->stats.crcerrs +
1754	    adapter->stats.ruc +
1755	    adapter->stats.roc /*+ adapter->stats.rlec */  +
1756	    adapter->stats.icbc +
1757	    adapter->stats.ecbc + adapter->stats.mpc;
1758
1759	/* see above
1760	 * netdev->stats.rx_length_errors = adapter->stats.rlec;
1761	 */
1762
1763	netdev->stats.rx_crc_errors = adapter->stats.crcerrs;
1764	netdev->stats.rx_fifo_errors = adapter->stats.mpc;
1765	netdev->stats.rx_missed_errors = adapter->stats.mpc;
1766	netdev->stats.rx_over_errors = adapter->stats.mpc;
1767
1768	netdev->stats.tx_errors = 0;
1769	netdev->stats.rx_frame_errors = 0;
1770	netdev->stats.tx_aborted_errors = 0;
1771	netdev->stats.tx_carrier_errors = 0;
1772	netdev->stats.tx_fifo_errors = 0;
1773	netdev->stats.tx_heartbeat_errors = 0;
1774	netdev->stats.tx_window_errors = 0;
1775}
1776
1777#define IXGB_MAX_INTR 10
1778/**
1779 * ixgb_intr - Interrupt Handler
1780 * @irq: interrupt number
1781 * @data: pointer to a network interface device structure
1782 **/
1783
1784static irqreturn_t
1785ixgb_intr(int irq, void *data)
1786{
1787	struct net_device *netdev = data;
1788	struct ixgb_adapter *adapter = netdev_priv(netdev);
1789	struct ixgb_hw *hw = &adapter->hw;
1790	u32 icr = IXGB_READ_REG(hw, ICR);
1791
1792	if (unlikely(!icr))
1793		return IRQ_NONE;  /* Not our interrupt */
1794
1795	if (unlikely(icr & (IXGB_INT_RXSEQ | IXGB_INT_LSC)))
1796		if (!test_bit(__IXGB_DOWN, &adapter->flags))
1797			mod_timer(&adapter->watchdog_timer, jiffies);
1798
1799	if (napi_schedule_prep(&adapter->napi)) {
1800
1801		/* Disable interrupts and register for poll. The flush
1802		  of the posted write is intentionally left out.
1803		*/
1804
1805		IXGB_WRITE_REG(&adapter->hw, IMC, ~0);
1806		__napi_schedule(&adapter->napi);
1807	}
1808	return IRQ_HANDLED;
1809}
1810
1811/**
1812 * ixgb_clean - NAPI Rx polling callback
1813 * @adapter: board private structure
1814 **/
1815
1816static int
1817ixgb_clean(struct napi_struct *napi, int budget)
1818{
1819	struct ixgb_adapter *adapter = container_of(napi, struct ixgb_adapter, napi);
1820	int work_done = 0;
1821
1822	ixgb_clean_tx_irq(adapter);
1823	ixgb_clean_rx_irq(adapter, &work_done, budget);
1824
1825	/* If budget not fully consumed, exit the polling mode */
1826	if (work_done < budget) {
1827		napi_complete(napi);
1828		if (!test_bit(__IXGB_DOWN, &adapter->flags))
1829			ixgb_irq_enable(adapter);
1830	}
1831
1832	return work_done;
1833}
1834
1835/**
1836 * ixgb_clean_tx_irq - Reclaim resources after transmit completes
1837 * @adapter: board private structure
1838 **/
1839
1840static bool
1841ixgb_clean_tx_irq(struct ixgb_adapter *adapter)
1842{
1843	struct ixgb_desc_ring *tx_ring = &adapter->tx_ring;
1844	struct net_device *netdev = adapter->netdev;
1845	struct ixgb_tx_desc *tx_desc, *eop_desc;
1846	struct ixgb_buffer *buffer_info;
1847	unsigned int i, eop;
1848	bool cleaned = false;
1849
1850	i = tx_ring->next_to_clean;
1851	eop = tx_ring->buffer_info[i].next_to_watch;
1852	eop_desc = IXGB_TX_DESC(*tx_ring, eop);
1853
1854	while (eop_desc->status & IXGB_TX_DESC_STATUS_DD) {
1855
1856		rmb(); /* read buffer_info after eop_desc */
1857		for (cleaned = false; !cleaned; ) {
1858			tx_desc = IXGB_TX_DESC(*tx_ring, i);
1859			buffer_info = &tx_ring->buffer_info[i];
1860
1861			if (tx_desc->popts &
1862			   (IXGB_TX_DESC_POPTS_TXSM |
1863			    IXGB_TX_DESC_POPTS_IXSM))
1864				adapter->hw_csum_tx_good++;
1865
1866			ixgb_unmap_and_free_tx_resource(adapter, buffer_info);
1867
1868			*(u32 *)&(tx_desc->status) = 0;
1869
1870			cleaned = (i == eop);
1871			if (++i == tx_ring->count) i = 0;
1872		}
1873
1874		eop = tx_ring->buffer_info[i].next_to_watch;
1875		eop_desc = IXGB_TX_DESC(*tx_ring, eop);
1876	}
1877
1878	tx_ring->next_to_clean = i;
1879
1880	if (unlikely(cleaned && netif_carrier_ok(netdev) &&
1881		     IXGB_DESC_UNUSED(tx_ring) >= DESC_NEEDED)) {
1882		/* Make sure that anybody stopping the queue after this
1883		 * sees the new next_to_clean. */
1884		smp_mb();
1885
1886		if (netif_queue_stopped(netdev) &&
1887		    !(test_bit(__IXGB_DOWN, &adapter->flags))) {
1888			netif_wake_queue(netdev);
1889			++adapter->restart_queue;
1890		}
1891	}
1892
1893	if (adapter->detect_tx_hung) {
1894		/* detect a transmit hang in hardware, this serializes the
1895		 * check with the clearing of time_stamp and movement of i */
1896		adapter->detect_tx_hung = false;
1897		if (tx_ring->buffer_info[eop].time_stamp &&
1898		   time_after(jiffies, tx_ring->buffer_info[eop].time_stamp + HZ)
1899		   && !(IXGB_READ_REG(&adapter->hw, STATUS) &
1900		        IXGB_STATUS_TXOFF)) {
1901			/* detected Tx unit hang */
1902			netif_err(adapter, drv, adapter->netdev,
1903				  "Detected Tx Unit Hang\n"
1904				  "  TDH                  <%x>\n"
1905				  "  TDT                  <%x>\n"
1906				  "  next_to_use          <%x>\n"
1907				  "  next_to_clean        <%x>\n"
1908				  "buffer_info[next_to_clean]\n"
1909				  "  time_stamp           <%lx>\n"
1910				  "  next_to_watch        <%x>\n"
1911				  "  jiffies              <%lx>\n"
1912				  "  next_to_watch.status <%x>\n",
1913				  IXGB_READ_REG(&adapter->hw, TDH),
1914				  IXGB_READ_REG(&adapter->hw, TDT),
1915				  tx_ring->next_to_use,
1916				  tx_ring->next_to_clean,
1917				  tx_ring->buffer_info[eop].time_stamp,
1918				  eop,
1919				  jiffies,
1920				  eop_desc->status);
1921			netif_stop_queue(netdev);
1922		}
1923	}
1924
1925	return cleaned;
1926}
1927
1928/**
1929 * ixgb_rx_checksum - Receive Checksum Offload for 82597.
1930 * @adapter: board private structure
1931 * @rx_desc: receive descriptor
1932 * @sk_buff: socket buffer with received data
1933 **/
1934
1935static void
1936ixgb_rx_checksum(struct ixgb_adapter *adapter,
1937                 struct ixgb_rx_desc *rx_desc,
1938                 struct sk_buff *skb)
1939{
1940	/* Ignore Checksum bit is set OR
1941	 * TCP Checksum has not been calculated
1942	 */
1943	if ((rx_desc->status & IXGB_RX_DESC_STATUS_IXSM) ||
1944	   (!(rx_desc->status & IXGB_RX_DESC_STATUS_TCPCS))) {
1945		skb_checksum_none_assert(skb);
1946		return;
1947	}
1948
1949	/* At this point we know the hardware did the TCP checksum */
1950	/* now look at the TCP checksum error bit */
1951	if (rx_desc->errors & IXGB_RX_DESC_ERRORS_TCPE) {
1952		/* let the stack verify checksum errors */
1953		skb_checksum_none_assert(skb);
1954		adapter->hw_csum_rx_error++;
1955	} else {
1956		/* TCP checksum is good */
1957		skb->ip_summed = CHECKSUM_UNNECESSARY;
1958		adapter->hw_csum_rx_good++;
1959	}
1960}
1961
1962/*
1963 * this should improve performance for small packets with large amounts
1964 * of reassembly being done in the stack
1965 */
1966static void ixgb_check_copybreak(struct net_device *netdev,
1967				 struct ixgb_buffer *buffer_info,
1968				 u32 length, struct sk_buff **skb)
1969{
1970	struct sk_buff *new_skb;
1971
1972	if (length > copybreak)
1973		return;
1974
1975	new_skb = netdev_alloc_skb_ip_align(netdev, length);
1976	if (!new_skb)
1977		return;
1978
1979	skb_copy_to_linear_data_offset(new_skb, -NET_IP_ALIGN,
1980				       (*skb)->data - NET_IP_ALIGN,
1981				       length + NET_IP_ALIGN);
1982	/* save the skb in buffer_info as good */
1983	buffer_info->skb = *skb;
1984	*skb = new_skb;
1985}
1986
1987/**
1988 * ixgb_clean_rx_irq - Send received data up the network stack,
1989 * @adapter: board private structure
1990 **/
1991
1992static bool
1993ixgb_clean_rx_irq(struct ixgb_adapter *adapter, int *work_done, int work_to_do)
1994{
1995	struct ixgb_desc_ring *rx_ring = &adapter->rx_ring;
1996	struct net_device *netdev = adapter->netdev;
1997	struct pci_dev *pdev = adapter->pdev;
1998	struct ixgb_rx_desc *rx_desc, *next_rxd;
1999	struct ixgb_buffer *buffer_info, *next_buffer, *next2_buffer;
2000	u32 length;
2001	unsigned int i, j;
2002	int cleaned_count = 0;
2003	bool cleaned = false;
2004
2005	i = rx_ring->next_to_clean;
2006	rx_desc = IXGB_RX_DESC(*rx_ring, i);
2007	buffer_info = &rx_ring->buffer_info[i];
2008
2009	while (rx_desc->status & IXGB_RX_DESC_STATUS_DD) {
2010		struct sk_buff *skb;
2011		u8 status;
2012
2013		if (*work_done >= work_to_do)
2014			break;
2015
2016		(*work_done)++;
2017		rmb();	/* read descriptor and rx_buffer_info after status DD */
2018		status = rx_desc->status;
2019		skb = buffer_info->skb;
2020		buffer_info->skb = NULL;
2021
2022		prefetch(skb->data - NET_IP_ALIGN);
2023
2024		if (++i == rx_ring->count)
2025			i = 0;
2026		next_rxd = IXGB_RX_DESC(*rx_ring, i);
2027		prefetch(next_rxd);
2028
2029		j = i + 1;
2030		if (j == rx_ring->count)
2031			j = 0;
2032		next2_buffer = &rx_ring->buffer_info[j];
2033		prefetch(next2_buffer);
2034
2035		next_buffer = &rx_ring->buffer_info[i];
2036
2037		cleaned = true;
2038		cleaned_count++;
2039
2040		dma_unmap_single(&pdev->dev,
2041				 buffer_info->dma,
2042				 buffer_info->length,
2043				 DMA_FROM_DEVICE);
2044		buffer_info->dma = 0;
2045
2046		length = le16_to_cpu(rx_desc->length);
2047		rx_desc->length = 0;
2048
2049		if (unlikely(!(status & IXGB_RX_DESC_STATUS_EOP))) {
2050
2051			/* All receives must fit into a single buffer */
2052
2053			pr_debug("Receive packet consumed multiple buffers length<%x>\n",
2054				 length);
2055
2056			dev_kfree_skb_irq(skb);
2057			goto rxdesc_done;
2058		}
2059
2060		if (unlikely(rx_desc->errors &
2061		    (IXGB_RX_DESC_ERRORS_CE | IXGB_RX_DESC_ERRORS_SE |
2062		     IXGB_RX_DESC_ERRORS_P | IXGB_RX_DESC_ERRORS_RXE))) {
2063			dev_kfree_skb_irq(skb);
2064			goto rxdesc_done;
2065		}
2066
2067		ixgb_check_copybreak(netdev, buffer_info, length, &skb);
2068
2069		/* Good Receive */
2070		skb_put(skb, length);
2071
2072		/* Receive Checksum Offload */
2073		ixgb_rx_checksum(adapter, rx_desc, skb);
2074
2075		skb->protocol = eth_type_trans(skb, netdev);
2076		if (status & IXGB_RX_DESC_STATUS_VP)
2077			__vlan_hwaccel_put_tag(skb, htons(ETH_P_8021Q),
2078				       le16_to_cpu(rx_desc->special));
2079
2080		netif_receive_skb(skb);
2081
2082rxdesc_done:
2083		/* clean up descriptor, might be written over by hw */
2084		rx_desc->status = 0;
2085
2086		/* return some buffers to hardware, one at a time is too slow */
2087		if (unlikely(cleaned_count >= IXGB_RX_BUFFER_WRITE)) {
2088			ixgb_alloc_rx_buffers(adapter, cleaned_count);
2089			cleaned_count = 0;
2090		}
2091
2092		/* use prefetched values */
2093		rx_desc = next_rxd;
2094		buffer_info = next_buffer;
2095	}
2096
2097	rx_ring->next_to_clean = i;
2098
2099	cleaned_count = IXGB_DESC_UNUSED(rx_ring);
2100	if (cleaned_count)
2101		ixgb_alloc_rx_buffers(adapter, cleaned_count);
2102
2103	return cleaned;
2104}
2105
2106/**
2107 * ixgb_alloc_rx_buffers - Replace used receive buffers
2108 * @adapter: address of board private structure
2109 **/
2110
2111static void
2112ixgb_alloc_rx_buffers(struct ixgb_adapter *adapter, int cleaned_count)
2113{
2114	struct ixgb_desc_ring *rx_ring = &adapter->rx_ring;
2115	struct net_device *netdev = adapter->netdev;
2116	struct pci_dev *pdev = adapter->pdev;
2117	struct ixgb_rx_desc *rx_desc;
2118	struct ixgb_buffer *buffer_info;
2119	struct sk_buff *skb;
2120	unsigned int i;
2121	long cleancount;
2122
2123	i = rx_ring->next_to_use;
2124	buffer_info = &rx_ring->buffer_info[i];
2125	cleancount = IXGB_DESC_UNUSED(rx_ring);
2126
2127
2128	/* leave three descriptors unused */
2129	while (--cleancount > 2 && cleaned_count--) {
2130		/* recycle! its good for you */
2131		skb = buffer_info->skb;
2132		if (skb) {
2133			skb_trim(skb, 0);
2134			goto map_skb;
2135		}
2136
2137		skb = netdev_alloc_skb_ip_align(netdev, adapter->rx_buffer_len);
2138		if (unlikely(!skb)) {
2139			/* Better luck next round */
2140			adapter->alloc_rx_buff_failed++;
2141			break;
2142		}
2143
2144		buffer_info->skb = skb;
2145		buffer_info->length = adapter->rx_buffer_len;
2146map_skb:
2147		buffer_info->dma = dma_map_single(&pdev->dev,
2148		                                  skb->data,
2149		                                  adapter->rx_buffer_len,
2150						  DMA_FROM_DEVICE);
2151		if (dma_mapping_error(&pdev->dev, buffer_info->dma)) {
2152			adapter->alloc_rx_buff_failed++;
2153			break;
2154		}
2155
2156		rx_desc = IXGB_RX_DESC(*rx_ring, i);
2157		rx_desc->buff_addr = cpu_to_le64(buffer_info->dma);
2158		/* guarantee DD bit not set now before h/w gets descriptor
2159		 * this is the rest of the workaround for h/w double
2160		 * writeback. */
2161		rx_desc->status = 0;
2162
2163
2164		if (++i == rx_ring->count)
2165			i = 0;
2166		buffer_info = &rx_ring->buffer_info[i];
2167	}
2168
2169	if (likely(rx_ring->next_to_use != i)) {
2170		rx_ring->next_to_use = i;
2171		if (unlikely(i-- == 0))
2172			i = (rx_ring->count - 1);
2173
2174		/* Force memory writes to complete before letting h/w
2175		 * know there are new descriptors to fetch.  (Only
2176		 * applicable for weak-ordered memory model archs, such
2177		 * as IA-64). */
2178		wmb();
2179		IXGB_WRITE_REG(&adapter->hw, RDT, i);
2180	}
2181}
2182
2183static void
2184ixgb_vlan_strip_enable(struct ixgb_adapter *adapter)
2185{
2186	u32 ctrl;
2187
2188	/* enable VLAN tag insert/strip */
2189	ctrl = IXGB_READ_REG(&adapter->hw, CTRL0);
2190	ctrl |= IXGB_CTRL0_VME;
2191	IXGB_WRITE_REG(&adapter->hw, CTRL0, ctrl);
2192}
2193
2194static void
2195ixgb_vlan_strip_disable(struct ixgb_adapter *adapter)
2196{
2197	u32 ctrl;
2198
2199	/* disable VLAN tag insert/strip */
2200	ctrl = IXGB_READ_REG(&adapter->hw, CTRL0);
2201	ctrl &= ~IXGB_CTRL0_VME;
2202	IXGB_WRITE_REG(&adapter->hw, CTRL0, ctrl);
2203}
2204
2205static int
2206ixgb_vlan_rx_add_vid(struct net_device *netdev, __be16 proto, u16 vid)
2207{
2208	struct ixgb_adapter *adapter = netdev_priv(netdev);
2209	u32 vfta, index;
2210
2211	/* add VID to filter table */
2212
2213	index = (vid >> 5) & 0x7F;
2214	vfta = IXGB_READ_REG_ARRAY(&adapter->hw, VFTA, index);
2215	vfta |= (1 << (vid & 0x1F));
2216	ixgb_write_vfta(&adapter->hw, index, vfta);
2217	set_bit(vid, adapter->active_vlans);
2218
2219	return 0;
2220}
2221
2222static int
2223ixgb_vlan_rx_kill_vid(struct net_device *netdev, __be16 proto, u16 vid)
2224{
2225	struct ixgb_adapter *adapter = netdev_priv(netdev);
2226	u32 vfta, index;
2227
2228	/* remove VID from filter table */
2229
2230	index = (vid >> 5) & 0x7F;
2231	vfta = IXGB_READ_REG_ARRAY(&adapter->hw, VFTA, index);
2232	vfta &= ~(1 << (vid & 0x1F));
2233	ixgb_write_vfta(&adapter->hw, index, vfta);
2234	clear_bit(vid, adapter->active_vlans);
2235
2236	return 0;
2237}
2238
2239static void
2240ixgb_restore_vlan(struct ixgb_adapter *adapter)
2241{
2242	u16 vid;
2243
2244	for_each_set_bit(vid, adapter->active_vlans, VLAN_N_VID)
2245		ixgb_vlan_rx_add_vid(adapter->netdev, htons(ETH_P_8021Q), vid);
2246}
2247
2248#ifdef CONFIG_NET_POLL_CONTROLLER
2249/*
2250 * Polling 'interrupt' - used by things like netconsole to send skbs
2251 * without having to re-enable interrupts. It's not called while
2252 * the interrupt routine is executing.
2253 */
2254
2255static void ixgb_netpoll(struct net_device *dev)
2256{
2257	struct ixgb_adapter *adapter = netdev_priv(dev);
2258
2259	disable_irq(adapter->pdev->irq);
2260	ixgb_intr(adapter->pdev->irq, dev);
2261	enable_irq(adapter->pdev->irq);
2262}
2263#endif
2264
2265/**
2266 * ixgb_io_error_detected - called when PCI error is detected
2267 * @pdev:    pointer to pci device with error
2268 * @state:   pci channel state after error
2269 *
2270 * This callback is called by the PCI subsystem whenever
2271 * a PCI bus error is detected.
2272 */
2273static pci_ers_result_t ixgb_io_error_detected(struct pci_dev *pdev,
2274                                               enum pci_channel_state state)
2275{
2276	struct net_device *netdev = pci_get_drvdata(pdev);
2277	struct ixgb_adapter *adapter = netdev_priv(netdev);
2278
2279	netif_device_detach(netdev);
2280
2281	if (state == pci_channel_io_perm_failure)
2282		return PCI_ERS_RESULT_DISCONNECT;
2283
2284	if (netif_running(netdev))
2285		ixgb_down(adapter, true);
2286
2287	pci_disable_device(pdev);
2288
2289	/* Request a slot reset. */
2290	return PCI_ERS_RESULT_NEED_RESET;
2291}
2292
2293/**
2294 * ixgb_io_slot_reset - called after the pci bus has been reset.
2295 * @pdev    pointer to pci device with error
2296 *
2297 * This callback is called after the PCI bus has been reset.
2298 * Basically, this tries to restart the card from scratch.
2299 * This is a shortened version of the device probe/discovery code,
2300 * it resembles the first-half of the ixgb_probe() routine.
2301 */
2302static pci_ers_result_t ixgb_io_slot_reset(struct pci_dev *pdev)
2303{
2304	struct net_device *netdev = pci_get_drvdata(pdev);
2305	struct ixgb_adapter *adapter = netdev_priv(netdev);
2306
2307	if (pci_enable_device(pdev)) {
2308		netif_err(adapter, probe, adapter->netdev,
2309			  "Cannot re-enable PCI device after reset\n");
2310		return PCI_ERS_RESULT_DISCONNECT;
2311	}
2312
2313	/* Perform card reset only on one instance of the card */
2314	if (0 != PCI_FUNC (pdev->devfn))
2315		return PCI_ERS_RESULT_RECOVERED;
2316
2317	pci_set_master(pdev);
2318
2319	netif_carrier_off(netdev);
2320	netif_stop_queue(netdev);
2321	ixgb_reset(adapter);
2322
2323	/* Make sure the EEPROM is good */
2324	if (!ixgb_validate_eeprom_checksum(&adapter->hw)) {
2325		netif_err(adapter, probe, adapter->netdev,
2326			  "After reset, the EEPROM checksum is not valid\n");
2327		return PCI_ERS_RESULT_DISCONNECT;
2328	}
2329	ixgb_get_ee_mac_addr(&adapter->hw, netdev->dev_addr);
2330	memcpy(netdev->perm_addr, netdev->dev_addr, netdev->addr_len);
2331
2332	if (!is_valid_ether_addr(netdev->perm_addr)) {
2333		netif_err(adapter, probe, adapter->netdev,
2334			  "After reset, invalid MAC address\n");
2335		return PCI_ERS_RESULT_DISCONNECT;
2336	}
2337
2338	return PCI_ERS_RESULT_RECOVERED;
2339}
2340
2341/**
2342 * ixgb_io_resume - called when its OK to resume normal operations
2343 * @pdev    pointer to pci device with error
2344 *
2345 * The error recovery driver tells us that its OK to resume
2346 * normal operation. Implementation resembles the second-half
2347 * of the ixgb_probe() routine.
2348 */
2349static void ixgb_io_resume(struct pci_dev *pdev)
2350{
2351	struct net_device *netdev = pci_get_drvdata(pdev);
2352	struct ixgb_adapter *adapter = netdev_priv(netdev);
2353
2354	pci_set_master(pdev);
2355
2356	if (netif_running(netdev)) {
2357		if (ixgb_up(adapter)) {
2358			pr_err("can't bring device back up after reset\n");
2359			return;
2360		}
2361	}
2362
2363	netif_device_attach(netdev);
2364	mod_timer(&adapter->watchdog_timer, jiffies);
2365}
2366
2367/* ixgb_main.c */