linux/drivers/net/ethernet/intel/ixgb/ixgb_main.c
<<
>>
Prefs
   1/*******************************************************************************
   2
   3  Intel PRO/10GbE Linux driver
   4  Copyright(c) 1999 - 2008 Intel Corporation.
   5
   6  This program is free software; you can redistribute it and/or modify it
   7  under the terms and conditions of the GNU General Public License,
   8  version 2, as published by the Free Software Foundation.
   9
  10  This program is distributed in the hope it will be useful, but WITHOUT
  11  ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  12  FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
  13  more details.
  14
  15  You should have received a copy of the GNU General Public License along with
  16  this program; if not, write to the Free Software Foundation, Inc.,
  17  51 Franklin St - Fifth Floor, Boston, MA 02110-1301 USA.
  18
  19  The full GNU General Public License is included in this distribution in
  20  the file called "COPYING".
  21
  22  Contact Information:
  23  Linux NICS <linux.nics@intel.com>
  24  e1000-devel Mailing List <e1000-devel@lists.sourceforge.net>
  25  Intel Corporation, 5200 N.E. Elam Young Parkway, Hillsboro, OR 97124-6497
  26
  27*******************************************************************************/
  28
  29#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
  30
  31#include <linux/prefetch.h>
  32#include "ixgb.h"
  33
  34char ixgb_driver_name[] = "ixgb";
  35static char ixgb_driver_string[] = "Intel(R) PRO/10GbE Network Driver";
  36
  37#define DRIVERNAPI "-NAPI"
  38#define DRV_VERSION "1.0.135-k2" DRIVERNAPI
  39const char ixgb_driver_version[] = DRV_VERSION;
  40static const char ixgb_copyright[] = "Copyright (c) 1999-2008 Intel Corporation.";
  41
  42#define IXGB_CB_LENGTH 256
  43static unsigned int copybreak __read_mostly = IXGB_CB_LENGTH;
  44module_param(copybreak, uint, 0644);
  45MODULE_PARM_DESC(copybreak,
  46        "Maximum size of packet that is copied to a new buffer on receive");
  47
  48/* ixgb_pci_tbl - PCI Device ID Table
  49 *
  50 * Wildcard entries (PCI_ANY_ID) should come last
  51 * Last entry must be all 0s
  52 *
  53 * { Vendor ID, Device ID, SubVendor ID, SubDevice ID,
  54 *   Class, Class Mask, private data (not used) }
  55 */
  56static const struct pci_device_id ixgb_pci_tbl[] = {
  57        {PCI_VENDOR_ID_INTEL, IXGB_DEVICE_ID_82597EX,
  58         PCI_ANY_ID, PCI_ANY_ID, 0, 0, 0},
  59        {PCI_VENDOR_ID_INTEL, IXGB_DEVICE_ID_82597EX_CX4,
  60         PCI_ANY_ID, PCI_ANY_ID, 0, 0, 0},
  61        {PCI_VENDOR_ID_INTEL, IXGB_DEVICE_ID_82597EX_SR,
  62         PCI_ANY_ID, PCI_ANY_ID, 0, 0, 0},
  63        {PCI_VENDOR_ID_INTEL, IXGB_DEVICE_ID_82597EX_LR,
  64         PCI_ANY_ID, PCI_ANY_ID, 0, 0, 0},
  65
  66        /* required last entry */
  67        {0,}
  68};
  69
  70MODULE_DEVICE_TABLE(pci, ixgb_pci_tbl);
  71
  72/* Local Function Prototypes */
  73static int ixgb_init_module(void);
  74static void ixgb_exit_module(void);
  75static int ixgb_probe(struct pci_dev *pdev, const struct pci_device_id *ent);
  76static void ixgb_remove(struct pci_dev *pdev);
  77static int ixgb_sw_init(struct ixgb_adapter *adapter);
  78static int ixgb_open(struct net_device *netdev);
  79static int ixgb_close(struct net_device *netdev);
  80static void ixgb_configure_tx(struct ixgb_adapter *adapter);
  81static void ixgb_configure_rx(struct ixgb_adapter *adapter);
  82static void ixgb_setup_rctl(struct ixgb_adapter *adapter);
  83static void ixgb_clean_tx_ring(struct ixgb_adapter *adapter);
  84static void ixgb_clean_rx_ring(struct ixgb_adapter *adapter);
  85static void ixgb_set_multi(struct net_device *netdev);
  86static void ixgb_watchdog(unsigned long data);
  87static netdev_tx_t ixgb_xmit_frame(struct sk_buff *skb,
  88                                   struct net_device *netdev);
  89static struct net_device_stats *ixgb_get_stats(struct net_device *netdev);
  90static int ixgb_change_mtu(struct net_device *netdev, int new_mtu);
  91static int ixgb_set_mac(struct net_device *netdev, void *p);
  92static irqreturn_t ixgb_intr(int irq, void *data);
  93static bool ixgb_clean_tx_irq(struct ixgb_adapter *adapter);
  94
  95static int ixgb_clean(struct napi_struct *, int);
  96static bool ixgb_clean_rx_irq(struct ixgb_adapter *, int *, int);
  97static void ixgb_alloc_rx_buffers(struct ixgb_adapter *, int);
  98
  99static void ixgb_tx_timeout(struct net_device *dev);
 100static void ixgb_tx_timeout_task(struct work_struct *work);
 101
 102static void ixgb_vlan_strip_enable(struct ixgb_adapter *adapter);
 103static void ixgb_vlan_strip_disable(struct ixgb_adapter *adapter);
 104static int ixgb_vlan_rx_add_vid(struct net_device *netdev,
 105                                __be16 proto, u16 vid);
 106static int ixgb_vlan_rx_kill_vid(struct net_device *netdev,
 107                                 __be16 proto, u16 vid);
 108static void ixgb_restore_vlan(struct ixgb_adapter *adapter);
 109
 110#ifdef CONFIG_NET_POLL_CONTROLLER
 111/* for netdump / net console */
 112static void ixgb_netpoll(struct net_device *dev);
 113#endif
 114
 115static pci_ers_result_t ixgb_io_error_detected (struct pci_dev *pdev,
 116                             enum pci_channel_state state);
 117static pci_ers_result_t ixgb_io_slot_reset (struct pci_dev *pdev);
 118static void ixgb_io_resume (struct pci_dev *pdev);
 119
 120static const struct pci_error_handlers ixgb_err_handler = {
 121        .error_detected = ixgb_io_error_detected,
 122        .slot_reset = ixgb_io_slot_reset,
 123        .resume = ixgb_io_resume,
 124};
 125
 126static struct pci_driver ixgb_driver = {
 127        .name     = ixgb_driver_name,
 128        .id_table = ixgb_pci_tbl,
 129        .probe    = ixgb_probe,
 130        .remove   = ixgb_remove,
 131        .err_handler = &ixgb_err_handler
 132};
 133
 134MODULE_AUTHOR("Intel Corporation, <linux.nics@intel.com>");
 135MODULE_DESCRIPTION("Intel(R) PRO/10GbE Network Driver");
 136MODULE_LICENSE("GPL");
 137MODULE_VERSION(DRV_VERSION);
 138
 139#define DEFAULT_MSG_ENABLE (NETIF_MSG_DRV|NETIF_MSG_PROBE|NETIF_MSG_LINK)
 140static int debug = -1;
 141module_param(debug, int, 0);
 142MODULE_PARM_DESC(debug, "Debug level (0=none,...,16=all)");
 143
 144/**
 145 * ixgb_init_module - Driver Registration Routine
 146 *
 147 * ixgb_init_module is the first routine called when the driver is
 148 * loaded. All it does is register with the PCI subsystem.
 149 **/
 150
 151static int __init
 152ixgb_init_module(void)
 153{
 154        pr_info("%s - version %s\n", ixgb_driver_string, ixgb_driver_version);
 155        pr_info("%s\n", ixgb_copyright);
 156
 157        return pci_register_driver(&ixgb_driver);
 158}
 159
 160module_init(ixgb_init_module);
 161
 162/**
 163 * ixgb_exit_module - Driver Exit Cleanup Routine
 164 *
 165 * ixgb_exit_module is called just before the driver is removed
 166 * from memory.
 167 **/
 168
 169static void __exit
 170ixgb_exit_module(void)
 171{
 172        pci_unregister_driver(&ixgb_driver);
 173}
 174
 175module_exit(ixgb_exit_module);
 176
 177/**
 178 * ixgb_irq_disable - Mask off interrupt generation on the NIC
 179 * @adapter: board private structure
 180 **/
 181
 182static void
 183ixgb_irq_disable(struct ixgb_adapter *adapter)
 184{
 185        IXGB_WRITE_REG(&adapter->hw, IMC, ~0);
 186        IXGB_WRITE_FLUSH(&adapter->hw);
 187        synchronize_irq(adapter->pdev->irq);
 188}
 189
 190/**
 191 * ixgb_irq_enable - Enable default interrupt generation settings
 192 * @adapter: board private structure
 193 **/
 194
 195static void
 196ixgb_irq_enable(struct ixgb_adapter *adapter)
 197{
 198        u32 val = IXGB_INT_RXT0 | IXGB_INT_RXDMT0 |
 199                  IXGB_INT_TXDW | IXGB_INT_LSC;
 200        if (adapter->hw.subsystem_vendor_id == PCI_VENDOR_ID_SUN)
 201                val |= IXGB_INT_GPI0;
 202        IXGB_WRITE_REG(&adapter->hw, IMS, val);
 203        IXGB_WRITE_FLUSH(&adapter->hw);
 204}
 205
 206int
 207ixgb_up(struct ixgb_adapter *adapter)
 208{
 209        struct net_device *netdev = adapter->netdev;
 210        int err, irq_flags = IRQF_SHARED;
 211        int max_frame = netdev->mtu + ENET_HEADER_SIZE + ENET_FCS_LENGTH;
 212        struct ixgb_hw *hw = &adapter->hw;
 213
 214        /* hardware has been reset, we need to reload some things */
 215
 216        ixgb_rar_set(hw, netdev->dev_addr, 0);
 217        ixgb_set_multi(netdev);
 218
 219        ixgb_restore_vlan(adapter);
 220
 221        ixgb_configure_tx(adapter);
 222        ixgb_setup_rctl(adapter);
 223        ixgb_configure_rx(adapter);
 224        ixgb_alloc_rx_buffers(adapter, IXGB_DESC_UNUSED(&adapter->rx_ring));
 225
 226        /* disable interrupts and get the hardware into a known state */
 227        IXGB_WRITE_REG(&adapter->hw, IMC, 0xffffffff);
 228
 229        /* only enable MSI if bus is in PCI-X mode */
 230        if (IXGB_READ_REG(&adapter->hw, STATUS) & IXGB_STATUS_PCIX_MODE) {
 231                err = pci_enable_msi(adapter->pdev);
 232                if (!err) {
 233                        adapter->have_msi = true;
 234                        irq_flags = 0;
 235                }
 236                /* proceed to try to request regular interrupt */
 237        }
 238
 239        err = request_irq(adapter->pdev->irq, ixgb_intr, irq_flags,
 240                          netdev->name, netdev);
 241        if (err) {
 242                if (adapter->have_msi)
 243                        pci_disable_msi(adapter->pdev);
 244                netif_err(adapter, probe, adapter->netdev,
 245                          "Unable to allocate interrupt Error: %d\n", err);
 246                return err;
 247        }
 248
 249        if ((hw->max_frame_size != max_frame) ||
 250                (hw->max_frame_size !=
 251                (IXGB_READ_REG(hw, MFS) >> IXGB_MFS_SHIFT))) {
 252
 253                hw->max_frame_size = max_frame;
 254
 255                IXGB_WRITE_REG(hw, MFS, hw->max_frame_size << IXGB_MFS_SHIFT);
 256
 257                if (hw->max_frame_size >
 258                   IXGB_MAX_ENET_FRAME_SIZE_WITHOUT_FCS + ENET_FCS_LENGTH) {
 259                        u32 ctrl0 = IXGB_READ_REG(hw, CTRL0);
 260
 261                        if (!(ctrl0 & IXGB_CTRL0_JFE)) {
 262                                ctrl0 |= IXGB_CTRL0_JFE;
 263                                IXGB_WRITE_REG(hw, CTRL0, ctrl0);
 264                        }
 265                }
 266        }
 267
 268        clear_bit(__IXGB_DOWN, &adapter->flags);
 269
 270        napi_enable(&adapter->napi);
 271        ixgb_irq_enable(adapter);
 272
 273        netif_wake_queue(netdev);
 274
 275        mod_timer(&adapter->watchdog_timer, jiffies);
 276
 277        return 0;
 278}
 279
 280void
 281ixgb_down(struct ixgb_adapter *adapter, bool kill_watchdog)
 282{
 283        struct net_device *netdev = adapter->netdev;
 284
 285        /* prevent the interrupt handler from restarting watchdog */
 286        set_bit(__IXGB_DOWN, &adapter->flags);
 287
 288        netif_carrier_off(netdev);
 289
 290        napi_disable(&adapter->napi);
 291        /* waiting for NAPI to complete can re-enable interrupts */
 292        ixgb_irq_disable(adapter);
 293        free_irq(adapter->pdev->irq, netdev);
 294
 295        if (adapter->have_msi)
 296                pci_disable_msi(adapter->pdev);
 297
 298        if (kill_watchdog)
 299                del_timer_sync(&adapter->watchdog_timer);
 300
 301        adapter->link_speed = 0;
 302        adapter->link_duplex = 0;
 303        netif_stop_queue(netdev);
 304
 305        ixgb_reset(adapter);
 306        ixgb_clean_tx_ring(adapter);
 307        ixgb_clean_rx_ring(adapter);
 308}
 309
 310void
 311ixgb_reset(struct ixgb_adapter *adapter)
 312{
 313        struct ixgb_hw *hw = &adapter->hw;
 314
 315        ixgb_adapter_stop(hw);
 316        if (!ixgb_init_hw(hw))
 317                netif_err(adapter, probe, adapter->netdev, "ixgb_init_hw failed\n");
 318
 319        /* restore frame size information */
 320        IXGB_WRITE_REG(hw, MFS, hw->max_frame_size << IXGB_MFS_SHIFT);
 321        if (hw->max_frame_size >
 322            IXGB_MAX_ENET_FRAME_SIZE_WITHOUT_FCS + ENET_FCS_LENGTH) {
 323                u32 ctrl0 = IXGB_READ_REG(hw, CTRL0);
 324                if (!(ctrl0 & IXGB_CTRL0_JFE)) {
 325                        ctrl0 |= IXGB_CTRL0_JFE;
 326                        IXGB_WRITE_REG(hw, CTRL0, ctrl0);
 327                }
 328        }
 329}
 330
 331static netdev_features_t
 332ixgb_fix_features(struct net_device *netdev, netdev_features_t features)
 333{
 334        /*
 335         * Tx VLAN insertion does not work per HW design when Rx stripping is
 336         * disabled.
 337         */
 338        if (!(features & NETIF_F_HW_VLAN_CTAG_RX))
 339                features &= ~NETIF_F_HW_VLAN_CTAG_TX;
 340
 341        return features;
 342}
 343
 344static int
 345ixgb_set_features(struct net_device *netdev, netdev_features_t features)
 346{
 347        struct ixgb_adapter *adapter = netdev_priv(netdev);
 348        netdev_features_t changed = features ^ netdev->features;
 349
 350        if (!(changed & (NETIF_F_RXCSUM|NETIF_F_HW_VLAN_CTAG_RX)))
 351                return 0;
 352
 353        adapter->rx_csum = !!(features & NETIF_F_RXCSUM);
 354
 355        if (netif_running(netdev)) {
 356                ixgb_down(adapter, true);
 357                ixgb_up(adapter);
 358                ixgb_set_speed_duplex(netdev);
 359        } else
 360                ixgb_reset(adapter);
 361
 362        return 0;
 363}
 364
 365
 366static const struct net_device_ops ixgb_netdev_ops = {
 367        .ndo_open               = ixgb_open,
 368        .ndo_stop               = ixgb_close,
 369        .ndo_start_xmit         = ixgb_xmit_frame,
 370        .ndo_get_stats          = ixgb_get_stats,
 371        .ndo_set_rx_mode        = ixgb_set_multi,
 372        .ndo_validate_addr      = eth_validate_addr,
 373        .ndo_set_mac_address    = ixgb_set_mac,
 374        .ndo_change_mtu         = ixgb_change_mtu,
 375        .ndo_tx_timeout         = ixgb_tx_timeout,
 376        .ndo_vlan_rx_add_vid    = ixgb_vlan_rx_add_vid,
 377        .ndo_vlan_rx_kill_vid   = ixgb_vlan_rx_kill_vid,
 378#ifdef CONFIG_NET_POLL_CONTROLLER
 379        .ndo_poll_controller    = ixgb_netpoll,
 380#endif
 381        .ndo_fix_features       = ixgb_fix_features,
 382        .ndo_set_features       = ixgb_set_features,
 383};
 384
 385/**
 386 * ixgb_probe - Device Initialization Routine
 387 * @pdev: PCI device information struct
 388 * @ent: entry in ixgb_pci_tbl
 389 *
 390 * Returns 0 on success, negative on failure
 391 *
 392 * ixgb_probe initializes an adapter identified by a pci_dev structure.
 393 * The OS initialization, configuring of the adapter private structure,
 394 * and a hardware reset occur.
 395 **/
 396
 397static int
 398ixgb_probe(struct pci_dev *pdev, const struct pci_device_id *ent)
 399{
 400        struct net_device *netdev = NULL;
 401        struct ixgb_adapter *adapter;
 402        static int cards_found = 0;
 403        int pci_using_dac;
 404        int i;
 405        int err;
 406
 407        err = pci_enable_device(pdev);
 408        if (err)
 409                return err;
 410
 411        pci_using_dac = 0;
 412        err = dma_set_mask_and_coherent(&pdev->dev, DMA_BIT_MASK(64));
 413        if (!err) {
 414                pci_using_dac = 1;
 415        } else {
 416                err = dma_set_mask_and_coherent(&pdev->dev, DMA_BIT_MASK(32));
 417                if (err) {
 418                        pr_err("No usable DMA configuration, aborting\n");
 419                        goto err_dma_mask;
 420                }
 421        }
 422
 423        err = pci_request_regions(pdev, ixgb_driver_name);
 424        if (err)
 425                goto err_request_regions;
 426
 427        pci_set_master(pdev);
 428
 429        netdev = alloc_etherdev(sizeof(struct ixgb_adapter));
 430        if (!netdev) {
 431                err = -ENOMEM;
 432                goto err_alloc_etherdev;
 433        }
 434
 435        SET_NETDEV_DEV(netdev, &pdev->dev);
 436
 437        pci_set_drvdata(pdev, netdev);
 438        adapter = netdev_priv(netdev);
 439        adapter->netdev = netdev;
 440        adapter->pdev = pdev;
 441        adapter->hw.back = adapter;
 442        adapter->msg_enable = netif_msg_init(debug, DEFAULT_MSG_ENABLE);
 443
 444        adapter->hw.hw_addr = pci_ioremap_bar(pdev, BAR_0);
 445        if (!adapter->hw.hw_addr) {
 446                err = -EIO;
 447                goto err_ioremap;
 448        }
 449
 450        for (i = BAR_1; i <= BAR_5; i++) {
 451                if (pci_resource_len(pdev, i) == 0)
 452                        continue;
 453                if (pci_resource_flags(pdev, i) & IORESOURCE_IO) {
 454                        adapter->hw.io_base = pci_resource_start(pdev, i);
 455                        break;
 456                }
 457        }
 458
 459        netdev->netdev_ops = &ixgb_netdev_ops;
 460        ixgb_set_ethtool_ops(netdev);
 461        netdev->watchdog_timeo = 5 * HZ;
 462        netif_napi_add(netdev, &adapter->napi, ixgb_clean, 64);
 463
 464        strncpy(netdev->name, pci_name(pdev), sizeof(netdev->name) - 1);
 465
 466        adapter->bd_number = cards_found;
 467        adapter->link_speed = 0;
 468        adapter->link_duplex = 0;
 469
 470        /* setup the private structure */
 471
 472        err = ixgb_sw_init(adapter);
 473        if (err)
 474                goto err_sw_init;
 475
 476        netdev->hw_features = NETIF_F_SG |
 477                           NETIF_F_TSO |
 478                           NETIF_F_HW_CSUM |
 479                           NETIF_F_HW_VLAN_CTAG_TX |
 480                           NETIF_F_HW_VLAN_CTAG_RX;
 481        netdev->features = netdev->hw_features |
 482                           NETIF_F_HW_VLAN_CTAG_FILTER;
 483        netdev->hw_features |= NETIF_F_RXCSUM;
 484
 485        if (pci_using_dac) {
 486                netdev->features |= NETIF_F_HIGHDMA;
 487                netdev->vlan_features |= NETIF_F_HIGHDMA;
 488        }
 489
 490        /* make sure the EEPROM is good */
 491
 492        if (!ixgb_validate_eeprom_checksum(&adapter->hw)) {
 493                netif_err(adapter, probe, adapter->netdev,
 494                          "The EEPROM Checksum Is Not Valid\n");
 495                err = -EIO;
 496                goto err_eeprom;
 497        }
 498
 499        ixgb_get_ee_mac_addr(&adapter->hw, netdev->dev_addr);
 500
 501        if (!is_valid_ether_addr(netdev->dev_addr)) {
 502                netif_err(adapter, probe, adapter->netdev, "Invalid MAC Address\n");
 503                err = -EIO;
 504                goto err_eeprom;
 505        }
 506
 507        adapter->part_num = ixgb_get_ee_pba_number(&adapter->hw);
 508
 509        init_timer(&adapter->watchdog_timer);
 510        adapter->watchdog_timer.function = ixgb_watchdog;
 511        adapter->watchdog_timer.data = (unsigned long)adapter;
 512
 513        INIT_WORK(&adapter->tx_timeout_task, ixgb_tx_timeout_task);
 514
 515        strcpy(netdev->name, "eth%d");
 516        err = register_netdev(netdev);
 517        if (err)
 518                goto err_register;
 519
 520        /* carrier off reporting is important to ethtool even BEFORE open */
 521        netif_carrier_off(netdev);
 522
 523        netif_info(adapter, probe, adapter->netdev,
 524                   "Intel(R) PRO/10GbE Network Connection\n");
 525        ixgb_check_options(adapter);
 526        /* reset the hardware with the new settings */
 527
 528        ixgb_reset(adapter);
 529
 530        cards_found++;
 531        return 0;
 532
 533err_register:
 534err_sw_init:
 535err_eeprom:
 536        iounmap(adapter->hw.hw_addr);
 537err_ioremap:
 538        free_netdev(netdev);
 539err_alloc_etherdev:
 540        pci_release_regions(pdev);
 541err_request_regions:
 542err_dma_mask:
 543        pci_disable_device(pdev);
 544        return err;
 545}
 546
 547/**
 548 * ixgb_remove - Device Removal Routine
 549 * @pdev: PCI device information struct
 550 *
 551 * ixgb_remove is called by the PCI subsystem to alert the driver
 552 * that it should release a PCI device.  The could be caused by a
 553 * Hot-Plug event, or because the driver is going to be removed from
 554 * memory.
 555 **/
 556
 557static void
 558ixgb_remove(struct pci_dev *pdev)
 559{
 560        struct net_device *netdev = pci_get_drvdata(pdev);
 561        struct ixgb_adapter *adapter = netdev_priv(netdev);
 562
 563        cancel_work_sync(&adapter->tx_timeout_task);
 564
 565        unregister_netdev(netdev);
 566
 567        iounmap(adapter->hw.hw_addr);
 568        pci_release_regions(pdev);
 569
 570        free_netdev(netdev);
 571        pci_disable_device(pdev);
 572}
 573
 574/**
 575 * ixgb_sw_init - Initialize general software structures (struct ixgb_adapter)
 576 * @adapter: board private structure to initialize
 577 *
 578 * ixgb_sw_init initializes the Adapter private data structure.
 579 * Fields are initialized based on PCI device information and
 580 * OS network device settings (MTU size).
 581 **/
 582
 583static int
 584ixgb_sw_init(struct ixgb_adapter *adapter)
 585{
 586        struct ixgb_hw *hw = &adapter->hw;
 587        struct net_device *netdev = adapter->netdev;
 588        struct pci_dev *pdev = adapter->pdev;
 589
 590        /* PCI config space info */
 591
 592        hw->vendor_id = pdev->vendor;
 593        hw->device_id = pdev->device;
 594        hw->subsystem_vendor_id = pdev->subsystem_vendor;
 595        hw->subsystem_id = pdev->subsystem_device;
 596
 597        hw->max_frame_size = netdev->mtu + ENET_HEADER_SIZE + ENET_FCS_LENGTH;
 598        adapter->rx_buffer_len = hw->max_frame_size + 8; /* + 8 for errata */
 599
 600        if ((hw->device_id == IXGB_DEVICE_ID_82597EX) ||
 601            (hw->device_id == IXGB_DEVICE_ID_82597EX_CX4) ||
 602            (hw->device_id == IXGB_DEVICE_ID_82597EX_LR) ||
 603            (hw->device_id == IXGB_DEVICE_ID_82597EX_SR))
 604                hw->mac_type = ixgb_82597;
 605        else {
 606                /* should never have loaded on this device */
 607                netif_err(adapter, probe, adapter->netdev, "unsupported device id\n");
 608        }
 609
 610        /* enable flow control to be programmed */
 611        hw->fc.send_xon = 1;
 612
 613        set_bit(__IXGB_DOWN, &adapter->flags);
 614        return 0;
 615}
 616
 617/**
 618 * ixgb_open - Called when a network interface is made active
 619 * @netdev: network interface device structure
 620 *
 621 * Returns 0 on success, negative value on failure
 622 *
 623 * The open entry point is called when a network interface is made
 624 * active by the system (IFF_UP).  At this point all resources needed
 625 * for transmit and receive operations are allocated, the interrupt
 626 * handler is registered with the OS, the watchdog timer is started,
 627 * and the stack is notified that the interface is ready.
 628 **/
 629
 630static int
 631ixgb_open(struct net_device *netdev)
 632{
 633        struct ixgb_adapter *adapter = netdev_priv(netdev);
 634        int err;
 635
 636        /* allocate transmit descriptors */
 637        err = ixgb_setup_tx_resources(adapter);
 638        if (err)
 639                goto err_setup_tx;
 640
 641        netif_carrier_off(netdev);
 642
 643        /* allocate receive descriptors */
 644
 645        err = ixgb_setup_rx_resources(adapter);
 646        if (err)
 647                goto err_setup_rx;
 648
 649        err = ixgb_up(adapter);
 650        if (err)
 651                goto err_up;
 652
 653        netif_start_queue(netdev);
 654
 655        return 0;
 656
 657err_up:
 658        ixgb_free_rx_resources(adapter);
 659err_setup_rx:
 660        ixgb_free_tx_resources(adapter);
 661err_setup_tx:
 662        ixgb_reset(adapter);
 663
 664        return err;
 665}
 666
 667/**
 668 * ixgb_close - Disables a network interface
 669 * @netdev: network interface device structure
 670 *
 671 * Returns 0, this is not allowed to fail
 672 *
 673 * The close entry point is called when an interface is de-activated
 674 * by the OS.  The hardware is still under the drivers control, but
 675 * needs to be disabled.  A global MAC reset is issued to stop the
 676 * hardware, and all transmit and receive resources are freed.
 677 **/
 678
 679static int
 680ixgb_close(struct net_device *netdev)
 681{
 682        struct ixgb_adapter *adapter = netdev_priv(netdev);
 683
 684        ixgb_down(adapter, true);
 685
 686        ixgb_free_tx_resources(adapter);
 687        ixgb_free_rx_resources(adapter);
 688
 689        return 0;
 690}
 691
 692/**
 693 * ixgb_setup_tx_resources - allocate Tx resources (Descriptors)
 694 * @adapter: board private structure
 695 *
 696 * Return 0 on success, negative on failure
 697 **/
 698
 699int
 700ixgb_setup_tx_resources(struct ixgb_adapter *adapter)
 701{
 702        struct ixgb_desc_ring *txdr = &adapter->tx_ring;
 703        struct pci_dev *pdev = adapter->pdev;
 704        int size;
 705
 706        size = sizeof(struct ixgb_buffer) * txdr->count;
 707        txdr->buffer_info = vzalloc(size);
 708        if (!txdr->buffer_info)
 709                return -ENOMEM;
 710
 711        /* round up to nearest 4K */
 712
 713        txdr->size = txdr->count * sizeof(struct ixgb_tx_desc);
 714        txdr->size = ALIGN(txdr->size, 4096);
 715
 716        txdr->desc = dma_zalloc_coherent(&pdev->dev, txdr->size, &txdr->dma,
 717                                         GFP_KERNEL);
 718        if (!txdr->desc) {
 719                vfree(txdr->buffer_info);
 720                return -ENOMEM;
 721        }
 722
 723        txdr->next_to_use = 0;
 724        txdr->next_to_clean = 0;
 725
 726        return 0;
 727}
 728
 729/**
 730 * ixgb_configure_tx - Configure 82597 Transmit Unit after Reset.
 731 * @adapter: board private structure
 732 *
 733 * Configure the Tx unit of the MAC after a reset.
 734 **/
 735
 736static void
 737ixgb_configure_tx(struct ixgb_adapter *adapter)
 738{
 739        u64 tdba = adapter->tx_ring.dma;
 740        u32 tdlen = adapter->tx_ring.count * sizeof(struct ixgb_tx_desc);
 741        u32 tctl;
 742        struct ixgb_hw *hw = &adapter->hw;
 743
 744        /* Setup the Base and Length of the Tx Descriptor Ring
 745         * tx_ring.dma can be either a 32 or 64 bit value
 746         */
 747
 748        IXGB_WRITE_REG(hw, TDBAL, (tdba & 0x00000000ffffffffULL));
 749        IXGB_WRITE_REG(hw, TDBAH, (tdba >> 32));
 750
 751        IXGB_WRITE_REG(hw, TDLEN, tdlen);
 752
 753        /* Setup the HW Tx Head and Tail descriptor pointers */
 754
 755        IXGB_WRITE_REG(hw, TDH, 0);
 756        IXGB_WRITE_REG(hw, TDT, 0);
 757
 758        /* don't set up txdctl, it induces performance problems if configured
 759         * incorrectly */
 760        /* Set the Tx Interrupt Delay register */
 761
 762        IXGB_WRITE_REG(hw, TIDV, adapter->tx_int_delay);
 763
 764        /* Program the Transmit Control Register */
 765
 766        tctl = IXGB_TCTL_TCE | IXGB_TCTL_TXEN | IXGB_TCTL_TPDE;
 767        IXGB_WRITE_REG(hw, TCTL, tctl);
 768
 769        /* Setup Transmit Descriptor Settings for this adapter */
 770        adapter->tx_cmd_type =
 771                IXGB_TX_DESC_TYPE |
 772                (adapter->tx_int_delay_enable ? IXGB_TX_DESC_CMD_IDE : 0);
 773}
 774
 775/**
 776 * ixgb_setup_rx_resources - allocate Rx resources (Descriptors)
 777 * @adapter: board private structure
 778 *
 779 * Returns 0 on success, negative on failure
 780 **/
 781
 782int
 783ixgb_setup_rx_resources(struct ixgb_adapter *adapter)
 784{
 785        struct ixgb_desc_ring *rxdr = &adapter->rx_ring;
 786        struct pci_dev *pdev = adapter->pdev;
 787        int size;
 788
 789        size = sizeof(struct ixgb_buffer) * rxdr->count;
 790        rxdr->buffer_info = vzalloc(size);
 791        if (!rxdr->buffer_info)
 792                return -ENOMEM;
 793
 794        /* Round up to nearest 4K */
 795
 796        rxdr->size = rxdr->count * sizeof(struct ixgb_rx_desc);
 797        rxdr->size = ALIGN(rxdr->size, 4096);
 798
 799        rxdr->desc = dma_alloc_coherent(&pdev->dev, rxdr->size, &rxdr->dma,
 800                                        GFP_KERNEL);
 801
 802        if (!rxdr->desc) {
 803                vfree(rxdr->buffer_info);
 804                return -ENOMEM;
 805        }
 806        memset(rxdr->desc, 0, rxdr->size);
 807
 808        rxdr->next_to_clean = 0;
 809        rxdr->next_to_use = 0;
 810
 811        return 0;
 812}
 813
 814/**
 815 * ixgb_setup_rctl - configure the receive control register
 816 * @adapter: Board private structure
 817 **/
 818
 819static void
 820ixgb_setup_rctl(struct ixgb_adapter *adapter)
 821{
 822        u32 rctl;
 823
 824        rctl = IXGB_READ_REG(&adapter->hw, RCTL);
 825
 826        rctl &= ~(3 << IXGB_RCTL_MO_SHIFT);
 827
 828        rctl |=
 829                IXGB_RCTL_BAM | IXGB_RCTL_RDMTS_1_2 |
 830                IXGB_RCTL_RXEN | IXGB_RCTL_CFF |
 831                (adapter->hw.mc_filter_type << IXGB_RCTL_MO_SHIFT);
 832
 833        rctl |= IXGB_RCTL_SECRC;
 834
 835        if (adapter->rx_buffer_len <= IXGB_RXBUFFER_2048)
 836                rctl |= IXGB_RCTL_BSIZE_2048;
 837        else if (adapter->rx_buffer_len <= IXGB_RXBUFFER_4096)
 838                rctl |= IXGB_RCTL_BSIZE_4096;
 839        else if (adapter->rx_buffer_len <= IXGB_RXBUFFER_8192)
 840                rctl |= IXGB_RCTL_BSIZE_8192;
 841        else if (adapter->rx_buffer_len <= IXGB_RXBUFFER_16384)
 842                rctl |= IXGB_RCTL_BSIZE_16384;
 843
 844        IXGB_WRITE_REG(&adapter->hw, RCTL, rctl);
 845}
 846
 847/**
 848 * ixgb_configure_rx - Configure 82597 Receive Unit after Reset.
 849 * @adapter: board private structure
 850 *
 851 * Configure the Rx unit of the MAC after a reset.
 852 **/
 853
 854static void
 855ixgb_configure_rx(struct ixgb_adapter *adapter)
 856{
 857        u64 rdba = adapter->rx_ring.dma;
 858        u32 rdlen = adapter->rx_ring.count * sizeof(struct ixgb_rx_desc);
 859        struct ixgb_hw *hw = &adapter->hw;
 860        u32 rctl;
 861        u32 rxcsum;
 862
 863        /* make sure receives are disabled while setting up the descriptors */
 864
 865        rctl = IXGB_READ_REG(hw, RCTL);
 866        IXGB_WRITE_REG(hw, RCTL, rctl & ~IXGB_RCTL_RXEN);
 867
 868        /* set the Receive Delay Timer Register */
 869
 870        IXGB_WRITE_REG(hw, RDTR, adapter->rx_int_delay);
 871
 872        /* Setup the Base and Length of the Rx Descriptor Ring */
 873
 874        IXGB_WRITE_REG(hw, RDBAL, (rdba & 0x00000000ffffffffULL));
 875        IXGB_WRITE_REG(hw, RDBAH, (rdba >> 32));
 876
 877        IXGB_WRITE_REG(hw, RDLEN, rdlen);
 878
 879        /* Setup the HW Rx Head and Tail Descriptor Pointers */
 880        IXGB_WRITE_REG(hw, RDH, 0);
 881        IXGB_WRITE_REG(hw, RDT, 0);
 882
 883        /* due to the hardware errata with RXDCTL, we are unable to use any of
 884         * the performance enhancing features of it without causing other
 885         * subtle bugs, some of the bugs could include receive length
 886         * corruption at high data rates (WTHRESH > 0) and/or receive
 887         * descriptor ring irregularites (particularly in hardware cache) */
 888        IXGB_WRITE_REG(hw, RXDCTL, 0);
 889
 890        /* Enable Receive Checksum Offload for TCP and UDP */
 891        if (adapter->rx_csum) {
 892                rxcsum = IXGB_READ_REG(hw, RXCSUM);
 893                rxcsum |= IXGB_RXCSUM_TUOFL;
 894                IXGB_WRITE_REG(hw, RXCSUM, rxcsum);
 895        }
 896
 897        /* Enable Receives */
 898
 899        IXGB_WRITE_REG(hw, RCTL, rctl);
 900}
 901
 902/**
 903 * ixgb_free_tx_resources - Free Tx Resources
 904 * @adapter: board private structure
 905 *
 906 * Free all transmit software resources
 907 **/
 908
 909void
 910ixgb_free_tx_resources(struct ixgb_adapter *adapter)
 911{
 912        struct pci_dev *pdev = adapter->pdev;
 913
 914        ixgb_clean_tx_ring(adapter);
 915
 916        vfree(adapter->tx_ring.buffer_info);
 917        adapter->tx_ring.buffer_info = NULL;
 918
 919        dma_free_coherent(&pdev->dev, adapter->tx_ring.size,
 920                          adapter->tx_ring.desc, adapter->tx_ring.dma);
 921
 922        adapter->tx_ring.desc = NULL;
 923}
 924
 925static void
 926ixgb_unmap_and_free_tx_resource(struct ixgb_adapter *adapter,
 927                                struct ixgb_buffer *buffer_info)
 928{
 929        if (buffer_info->dma) {
 930                if (buffer_info->mapped_as_page)
 931                        dma_unmap_page(&adapter->pdev->dev, buffer_info->dma,
 932                                       buffer_info->length, DMA_TO_DEVICE);
 933                else
 934                        dma_unmap_single(&adapter->pdev->dev, buffer_info->dma,
 935                                         buffer_info->length, DMA_TO_DEVICE);
 936                buffer_info->dma = 0;
 937        }
 938
 939        if (buffer_info->skb) {
 940                dev_kfree_skb_any(buffer_info->skb);
 941                buffer_info->skb = NULL;
 942        }
 943        buffer_info->time_stamp = 0;
 944        /* these fields must always be initialized in tx
 945         * buffer_info->length = 0;
 946         * buffer_info->next_to_watch = 0; */
 947}
 948
 949/**
 950 * ixgb_clean_tx_ring - Free Tx Buffers
 951 * @adapter: board private structure
 952 **/
 953
 954static void
 955ixgb_clean_tx_ring(struct ixgb_adapter *adapter)
 956{
 957        struct ixgb_desc_ring *tx_ring = &adapter->tx_ring;
 958        struct ixgb_buffer *buffer_info;
 959        unsigned long size;
 960        unsigned int i;
 961
 962        /* Free all the Tx ring sk_buffs */
 963
 964        for (i = 0; i < tx_ring->count; i++) {
 965                buffer_info = &tx_ring->buffer_info[i];
 966                ixgb_unmap_and_free_tx_resource(adapter, buffer_info);
 967        }
 968
 969        size = sizeof(struct ixgb_buffer) * tx_ring->count;
 970        memset(tx_ring->buffer_info, 0, size);
 971
 972        /* Zero out the descriptor ring */
 973
 974        memset(tx_ring->desc, 0, tx_ring->size);
 975
 976        tx_ring->next_to_use = 0;
 977        tx_ring->next_to_clean = 0;
 978
 979        IXGB_WRITE_REG(&adapter->hw, TDH, 0);
 980        IXGB_WRITE_REG(&adapter->hw, TDT, 0);
 981}
 982
 983/**
 984 * ixgb_free_rx_resources - Free Rx Resources
 985 * @adapter: board private structure
 986 *
 987 * Free all receive software resources
 988 **/
 989
 990void
 991ixgb_free_rx_resources(struct ixgb_adapter *adapter)
 992{
 993        struct ixgb_desc_ring *rx_ring = &adapter->rx_ring;
 994        struct pci_dev *pdev = adapter->pdev;
 995
 996        ixgb_clean_rx_ring(adapter);
 997
 998        vfree(rx_ring->buffer_info);
 999        rx_ring->buffer_info = NULL;
1000
1001        dma_free_coherent(&pdev->dev, rx_ring->size, rx_ring->desc,
1002                          rx_ring->dma);
1003
1004        rx_ring->desc = NULL;
1005}
1006
1007/**
1008 * ixgb_clean_rx_ring - Free Rx Buffers
1009 * @adapter: board private structure
1010 **/
1011
1012static void
1013ixgb_clean_rx_ring(struct ixgb_adapter *adapter)
1014{
1015        struct ixgb_desc_ring *rx_ring = &adapter->rx_ring;
1016        struct ixgb_buffer *buffer_info;
1017        struct pci_dev *pdev = adapter->pdev;
1018        unsigned long size;
1019        unsigned int i;
1020
1021        /* Free all the Rx ring sk_buffs */
1022
1023        for (i = 0; i < rx_ring->count; i++) {
1024                buffer_info = &rx_ring->buffer_info[i];
1025                if (buffer_info->dma) {
1026                        dma_unmap_single(&pdev->dev,
1027                                         buffer_info->dma,
1028                                         buffer_info->length,
1029                                         DMA_FROM_DEVICE);
1030                        buffer_info->dma = 0;
1031                        buffer_info->length = 0;
1032                }
1033
1034                if (buffer_info->skb) {
1035                        dev_kfree_skb(buffer_info->skb);
1036                        buffer_info->skb = NULL;
1037                }
1038        }
1039
1040        size = sizeof(struct ixgb_buffer) * rx_ring->count;
1041        memset(rx_ring->buffer_info, 0, size);
1042
1043        /* Zero out the descriptor ring */
1044
1045        memset(rx_ring->desc, 0, rx_ring->size);
1046
1047        rx_ring->next_to_clean = 0;
1048        rx_ring->next_to_use = 0;
1049
1050        IXGB_WRITE_REG(&adapter->hw, RDH, 0);
1051        IXGB_WRITE_REG(&adapter->hw, RDT, 0);
1052}
1053
1054/**
1055 * ixgb_set_mac - Change the Ethernet Address of the NIC
1056 * @netdev: network interface device structure
1057 * @p: pointer to an address structure
1058 *
1059 * Returns 0 on success, negative on failure
1060 **/
1061
1062static int
1063ixgb_set_mac(struct net_device *netdev, void *p)
1064{
1065        struct ixgb_adapter *adapter = netdev_priv(netdev);
1066        struct sockaddr *addr = p;
1067
1068        if (!is_valid_ether_addr(addr->sa_data))
1069                return -EADDRNOTAVAIL;
1070
1071        memcpy(netdev->dev_addr, addr->sa_data, netdev->addr_len);
1072
1073        ixgb_rar_set(&adapter->hw, addr->sa_data, 0);
1074
1075        return 0;
1076}
1077
1078/**
1079 * ixgb_set_multi - Multicast and Promiscuous mode set
1080 * @netdev: network interface device structure
1081 *
1082 * The set_multi entry point is called whenever the multicast address
1083 * list or the network interface flags are updated.  This routine is
1084 * responsible for configuring the hardware for proper multicast,
1085 * promiscuous mode, and all-multi behavior.
1086 **/
1087
1088static void
1089ixgb_set_multi(struct net_device *netdev)
1090{
1091        struct ixgb_adapter *adapter = netdev_priv(netdev);
1092        struct ixgb_hw *hw = &adapter->hw;
1093        struct netdev_hw_addr *ha;
1094        u32 rctl;
1095
1096        /* Check for Promiscuous and All Multicast modes */
1097
1098        rctl = IXGB_READ_REG(hw, RCTL);
1099
1100        if (netdev->flags & IFF_PROMISC) {
1101                rctl |= (IXGB_RCTL_UPE | IXGB_RCTL_MPE);
1102                /* disable VLAN filtering */
1103                rctl &= ~IXGB_RCTL_CFIEN;
1104                rctl &= ~IXGB_RCTL_VFE;
1105        } else {
1106                if (netdev->flags & IFF_ALLMULTI) {
1107                        rctl |= IXGB_RCTL_MPE;
1108                        rctl &= ~IXGB_RCTL_UPE;
1109                } else {
1110                        rctl &= ~(IXGB_RCTL_UPE | IXGB_RCTL_MPE);
1111                }
1112                /* enable VLAN filtering */
1113                rctl |= IXGB_RCTL_VFE;
1114                rctl &= ~IXGB_RCTL_CFIEN;
1115        }
1116
1117        if (netdev_mc_count(netdev) > IXGB_MAX_NUM_MULTICAST_ADDRESSES) {
1118                rctl |= IXGB_RCTL_MPE;
1119                IXGB_WRITE_REG(hw, RCTL, rctl);
1120        } else {
1121                u8 *mta = kmalloc(IXGB_MAX_NUM_MULTICAST_ADDRESSES *
1122                              ETH_ALEN, GFP_ATOMIC);
1123                u8 *addr;
1124                if (!mta)
1125                        goto alloc_failed;
1126
1127                IXGB_WRITE_REG(hw, RCTL, rctl);
1128
1129                addr = mta;
1130                netdev_for_each_mc_addr(ha, netdev) {
1131                        memcpy(addr, ha->addr, ETH_ALEN);
1132                        addr += ETH_ALEN;
1133                }
1134
1135                ixgb_mc_addr_list_update(hw, mta, netdev_mc_count(netdev), 0);
1136                kfree(mta);
1137        }
1138
1139alloc_failed:
1140        if (netdev->features & NETIF_F_HW_VLAN_CTAG_RX)
1141                ixgb_vlan_strip_enable(adapter);
1142        else
1143                ixgb_vlan_strip_disable(adapter);
1144
1145}
1146
1147/**
1148 * ixgb_watchdog - Timer Call-back
1149 * @data: pointer to netdev cast into an unsigned long
1150 **/
1151
1152static void
1153ixgb_watchdog(unsigned long data)
1154{
1155        struct ixgb_adapter *adapter = (struct ixgb_adapter *)data;
1156        struct net_device *netdev = adapter->netdev;
1157        struct ixgb_desc_ring *txdr = &adapter->tx_ring;
1158
1159        ixgb_check_for_link(&adapter->hw);
1160
1161        if (ixgb_check_for_bad_link(&adapter->hw)) {
1162                /* force the reset path */
1163                netif_stop_queue(netdev);
1164        }
1165
1166        if (adapter->hw.link_up) {
1167                if (!netif_carrier_ok(netdev)) {
1168                        netdev_info(netdev,
1169                                    "NIC Link is Up 10 Gbps Full Duplex, Flow Control: %s\n",
1170                                    (adapter->hw.fc.type == ixgb_fc_full) ?
1171                                    "RX/TX" :
1172                                    (adapter->hw.fc.type == ixgb_fc_rx_pause) ?
1173                                     "RX" :
1174                                    (adapter->hw.fc.type == ixgb_fc_tx_pause) ?
1175                                    "TX" : "None");
1176                        adapter->link_speed = 10000;
1177                        adapter->link_duplex = FULL_DUPLEX;
1178                        netif_carrier_on(netdev);
1179                }
1180        } else {
1181                if (netif_carrier_ok(netdev)) {
1182                        adapter->link_speed = 0;
1183                        adapter->link_duplex = 0;
1184                        netdev_info(netdev, "NIC Link is Down\n");
1185                        netif_carrier_off(netdev);
1186                }
1187        }
1188
1189        ixgb_update_stats(adapter);
1190
1191        if (!netif_carrier_ok(netdev)) {
1192                if (IXGB_DESC_UNUSED(txdr) + 1 < txdr->count) {
1193                        /* We've lost link, so the controller stops DMA,
1194                         * but we've got queued Tx work that's never going
1195                         * to get done, so reset controller to flush Tx.
1196                         * (Do the reset outside of interrupt context). */
1197                        schedule_work(&adapter->tx_timeout_task);
1198                        /* return immediately since reset is imminent */
1199                        return;
1200                }
1201        }
1202
1203        /* Force detection of hung controller every watchdog period */
1204        adapter->detect_tx_hung = true;
1205
1206        /* generate an interrupt to force clean up of any stragglers */
1207        IXGB_WRITE_REG(&adapter->hw, ICS, IXGB_INT_TXDW);
1208
1209        /* Reset the timer */
1210        mod_timer(&adapter->watchdog_timer, jiffies + 2 * HZ);
1211}
1212
1213#define IXGB_TX_FLAGS_CSUM              0x00000001
1214#define IXGB_TX_FLAGS_VLAN              0x00000002
1215#define IXGB_TX_FLAGS_TSO               0x00000004
1216
1217static int
1218ixgb_tso(struct ixgb_adapter *adapter, struct sk_buff *skb)
1219{
1220        struct ixgb_context_desc *context_desc;
1221        unsigned int i;
1222        u8 ipcss, ipcso, tucss, tucso, hdr_len;
1223        u16 ipcse, tucse, mss;
1224
1225        if (likely(skb_is_gso(skb))) {
1226                struct ixgb_buffer *buffer_info;
1227                struct iphdr *iph;
1228                int err;
1229
1230                err = skb_cow_head(skb, 0);
1231                if (err < 0)
1232                        return err;
1233
1234                hdr_len = skb_transport_offset(skb) + tcp_hdrlen(skb);
1235                mss = skb_shinfo(skb)->gso_size;
1236                iph = ip_hdr(skb);
1237                iph->tot_len = 0;
1238                iph->check = 0;
1239                tcp_hdr(skb)->check = ~csum_tcpudp_magic(iph->saddr,
1240                                                         iph->daddr, 0,
1241                                                         IPPROTO_TCP, 0);
1242                ipcss = skb_network_offset(skb);
1243                ipcso = (void *)&(iph->check) - (void *)skb->data;
1244                ipcse = skb_transport_offset(skb) - 1;
1245                tucss = skb_transport_offset(skb);
1246                tucso = (void *)&(tcp_hdr(skb)->check) - (void *)skb->data;
1247                tucse = 0;
1248
1249                i = adapter->tx_ring.next_to_use;
1250                context_desc = IXGB_CONTEXT_DESC(adapter->tx_ring, i);
1251                buffer_info = &adapter->tx_ring.buffer_info[i];
1252                WARN_ON(buffer_info->dma != 0);
1253
1254                context_desc->ipcss = ipcss;
1255                context_desc->ipcso = ipcso;
1256                context_desc->ipcse = cpu_to_le16(ipcse);
1257                context_desc->tucss = tucss;
1258                context_desc->tucso = tucso;
1259                context_desc->tucse = cpu_to_le16(tucse);
1260                context_desc->mss = cpu_to_le16(mss);
1261                context_desc->hdr_len = hdr_len;
1262                context_desc->status = 0;
1263                context_desc->cmd_type_len = cpu_to_le32(
1264                                                  IXGB_CONTEXT_DESC_TYPE
1265                                                | IXGB_CONTEXT_DESC_CMD_TSE
1266                                                | IXGB_CONTEXT_DESC_CMD_IP
1267                                                | IXGB_CONTEXT_DESC_CMD_TCP
1268                                                | IXGB_CONTEXT_DESC_CMD_IDE
1269                                                | (skb->len - (hdr_len)));
1270
1271
1272                if (++i == adapter->tx_ring.count) i = 0;
1273                adapter->tx_ring.next_to_use = i;
1274
1275                return 1;
1276        }
1277
1278        return 0;
1279}
1280
1281static bool
1282ixgb_tx_csum(struct ixgb_adapter *adapter, struct sk_buff *skb)
1283{
1284        struct ixgb_context_desc *context_desc;
1285        unsigned int i;
1286        u8 css, cso;
1287
1288        if (likely(skb->ip_summed == CHECKSUM_PARTIAL)) {
1289                struct ixgb_buffer *buffer_info;
1290                css = skb_checksum_start_offset(skb);
1291                cso = css + skb->csum_offset;
1292
1293                i = adapter->tx_ring.next_to_use;
1294                context_desc = IXGB_CONTEXT_DESC(adapter->tx_ring, i);
1295                buffer_info = &adapter->tx_ring.buffer_info[i];
1296                WARN_ON(buffer_info->dma != 0);
1297
1298                context_desc->tucss = css;
1299                context_desc->tucso = cso;
1300                context_desc->tucse = 0;
1301                /* zero out any previously existing data in one instruction */
1302                *(u32 *)&(context_desc->ipcss) = 0;
1303                context_desc->status = 0;
1304                context_desc->hdr_len = 0;
1305                context_desc->mss = 0;
1306                context_desc->cmd_type_len =
1307                        cpu_to_le32(IXGB_CONTEXT_DESC_TYPE
1308                                    | IXGB_TX_DESC_CMD_IDE);
1309
1310                if (++i == adapter->tx_ring.count) i = 0;
1311                adapter->tx_ring.next_to_use = i;
1312
1313                return true;
1314        }
1315
1316        return false;
1317}
1318
1319#define IXGB_MAX_TXD_PWR        14
1320#define IXGB_MAX_DATA_PER_TXD   (1<<IXGB_MAX_TXD_PWR)
1321
1322static int
1323ixgb_tx_map(struct ixgb_adapter *adapter, struct sk_buff *skb,
1324            unsigned int first)
1325{
1326        struct ixgb_desc_ring *tx_ring = &adapter->tx_ring;
1327        struct pci_dev *pdev = adapter->pdev;
1328        struct ixgb_buffer *buffer_info;
1329        int len = skb_headlen(skb);
1330        unsigned int offset = 0, size, count = 0, i;
1331        unsigned int mss = skb_shinfo(skb)->gso_size;
1332        unsigned int nr_frags = skb_shinfo(skb)->nr_frags;
1333        unsigned int f;
1334
1335        i = tx_ring->next_to_use;
1336
1337        while (len) {
1338                buffer_info = &tx_ring->buffer_info[i];
1339                size = min(len, IXGB_MAX_DATA_PER_TXD);
1340                /* Workaround for premature desc write-backs
1341                 * in TSO mode.  Append 4-byte sentinel desc */
1342                if (unlikely(mss && !nr_frags && size == len && size > 8))
1343                        size -= 4;
1344
1345                buffer_info->length = size;
1346                WARN_ON(buffer_info->dma != 0);
1347                buffer_info->time_stamp = jiffies;
1348                buffer_info->mapped_as_page = false;
1349                buffer_info->dma = dma_map_single(&pdev->dev,
1350                                                  skb->data + offset,
1351                                                  size, DMA_TO_DEVICE);
1352                if (dma_mapping_error(&pdev->dev, buffer_info->dma))
1353                        goto dma_error;
1354                buffer_info->next_to_watch = 0;
1355
1356                len -= size;
1357                offset += size;
1358                count++;
1359                if (len) {
1360                        i++;
1361                        if (i == tx_ring->count)
1362                                i = 0;
1363                }
1364        }
1365
1366        for (f = 0; f < nr_frags; f++) {
1367                const struct skb_frag_struct *frag;
1368
1369                frag = &skb_shinfo(skb)->frags[f];
1370                len = skb_frag_size(frag);
1371                offset = 0;
1372
1373                while (len) {
1374                        i++;
1375                        if (i == tx_ring->count)
1376                                i = 0;
1377
1378                        buffer_info = &tx_ring->buffer_info[i];
1379                        size = min(len, IXGB_MAX_DATA_PER_TXD);
1380
1381                        /* Workaround for premature desc write-backs
1382                         * in TSO mode.  Append 4-byte sentinel desc */
1383                        if (unlikely(mss && (f == (nr_frags - 1))
1384                                     && size == len && size > 8))
1385                                size -= 4;
1386
1387                        buffer_info->length = size;
1388                        buffer_info->time_stamp = jiffies;
1389                        buffer_info->mapped_as_page = true;
1390                        buffer_info->dma =
1391                                skb_frag_dma_map(&pdev->dev, frag, offset, size,
1392                                                 DMA_TO_DEVICE);
1393                        if (dma_mapping_error(&pdev->dev, buffer_info->dma))
1394                                goto dma_error;
1395                        buffer_info->next_to_watch = 0;
1396
1397                        len -= size;
1398                        offset += size;
1399                        count++;
1400                }
1401        }
1402        tx_ring->buffer_info[i].skb = skb;
1403        tx_ring->buffer_info[first].next_to_watch = i;
1404
1405        return count;
1406
1407dma_error:
1408        dev_err(&pdev->dev, "TX DMA map failed\n");
1409        buffer_info->dma = 0;
1410        if (count)
1411                count--;
1412
1413        while (count--) {
1414                if (i==0)
1415                        i += tx_ring->count;
1416                i--;
1417                buffer_info = &tx_ring->buffer_info[i];
1418                ixgb_unmap_and_free_tx_resource(adapter, buffer_info);
1419        }
1420
1421        return 0;
1422}
1423
1424static void
1425ixgb_tx_queue(struct ixgb_adapter *adapter, int count, int vlan_id,int tx_flags)
1426{
1427        struct ixgb_desc_ring *tx_ring = &adapter->tx_ring;
1428        struct ixgb_tx_desc *tx_desc = NULL;
1429        struct ixgb_buffer *buffer_info;
1430        u32 cmd_type_len = adapter->tx_cmd_type;
1431        u8 status = 0;
1432        u8 popts = 0;
1433        unsigned int i;
1434
1435        if (tx_flags & IXGB_TX_FLAGS_TSO) {
1436                cmd_type_len |= IXGB_TX_DESC_CMD_TSE;
1437                popts |= (IXGB_TX_DESC_POPTS_IXSM | IXGB_TX_DESC_POPTS_TXSM);
1438        }
1439
1440        if (tx_flags & IXGB_TX_FLAGS_CSUM)
1441                popts |= IXGB_TX_DESC_POPTS_TXSM;
1442
1443        if (tx_flags & IXGB_TX_FLAGS_VLAN)
1444                cmd_type_len |= IXGB_TX_DESC_CMD_VLE;
1445
1446        i = tx_ring->next_to_use;
1447
1448        while (count--) {
1449                buffer_info = &tx_ring->buffer_info[i];
1450                tx_desc = IXGB_TX_DESC(*tx_ring, i);
1451                tx_desc->buff_addr = cpu_to_le64(buffer_info->dma);
1452                tx_desc->cmd_type_len =
1453                        cpu_to_le32(cmd_type_len | buffer_info->length);
1454                tx_desc->status = status;
1455                tx_desc->popts = popts;
1456                tx_desc->vlan = cpu_to_le16(vlan_id);
1457
1458                if (++i == tx_ring->count) i = 0;
1459        }
1460
1461        tx_desc->cmd_type_len |=
1462                cpu_to_le32(IXGB_TX_DESC_CMD_EOP | IXGB_TX_DESC_CMD_RS);
1463
1464        /* Force memory writes to complete before letting h/w
1465         * know there are new descriptors to fetch.  (Only
1466         * applicable for weak-ordered memory model archs,
1467         * such as IA-64). */
1468        wmb();
1469
1470        tx_ring->next_to_use = i;
1471        IXGB_WRITE_REG(&adapter->hw, TDT, i);
1472}
1473
1474static int __ixgb_maybe_stop_tx(struct net_device *netdev, int size)
1475{
1476        struct ixgb_adapter *adapter = netdev_priv(netdev);
1477        struct ixgb_desc_ring *tx_ring = &adapter->tx_ring;
1478
1479        netif_stop_queue(netdev);
1480        /* Herbert's original patch had:
1481         *  smp_mb__after_netif_stop_queue();
1482         * but since that doesn't exist yet, just open code it. */
1483        smp_mb();
1484
1485        /* We need to check again in a case another CPU has just
1486         * made room available. */
1487        if (likely(IXGB_DESC_UNUSED(tx_ring) < size))
1488                return -EBUSY;
1489
1490        /* A reprieve! */
1491        netif_start_queue(netdev);
1492        ++adapter->restart_queue;
1493        return 0;
1494}
1495
1496static int ixgb_maybe_stop_tx(struct net_device *netdev,
1497                              struct ixgb_desc_ring *tx_ring, int size)
1498{
1499        if (likely(IXGB_DESC_UNUSED(tx_ring) >= size))
1500                return 0;
1501        return __ixgb_maybe_stop_tx(netdev, size);
1502}
1503
1504
1505/* Tx Descriptors needed, worst case */
1506#define TXD_USE_COUNT(S) (((S) >> IXGB_MAX_TXD_PWR) + \
1507                         (((S) & (IXGB_MAX_DATA_PER_TXD - 1)) ? 1 : 0))
1508#define DESC_NEEDED TXD_USE_COUNT(IXGB_MAX_DATA_PER_TXD) /* skb->date */ + \
1509        MAX_SKB_FRAGS * TXD_USE_COUNT(PAGE_SIZE) + 1 /* for context */ \
1510        + 1 /* one more needed for sentinel TSO workaround */
1511
1512static netdev_tx_t
1513ixgb_xmit_frame(struct sk_buff *skb, struct net_device *netdev)
1514{
1515        struct ixgb_adapter *adapter = netdev_priv(netdev);
1516        unsigned int first;
1517        unsigned int tx_flags = 0;
1518        int vlan_id = 0;
1519        int count = 0;
1520        int tso;
1521
1522        if (test_bit(__IXGB_DOWN, &adapter->flags)) {
1523                dev_kfree_skb_any(skb);
1524                return NETDEV_TX_OK;
1525        }
1526
1527        if (skb->len <= 0) {
1528                dev_kfree_skb_any(skb);
1529                return NETDEV_TX_OK;
1530        }
1531
1532        if (unlikely(ixgb_maybe_stop_tx(netdev, &adapter->tx_ring,
1533                     DESC_NEEDED)))
1534                return NETDEV_TX_BUSY;
1535
1536        if (skb_vlan_tag_present(skb)) {
1537                tx_flags |= IXGB_TX_FLAGS_VLAN;
1538                vlan_id = skb_vlan_tag_get(skb);
1539        }
1540
1541        first = adapter->tx_ring.next_to_use;
1542
1543        tso = ixgb_tso(adapter, skb);
1544        if (tso < 0) {
1545                dev_kfree_skb_any(skb);
1546                return NETDEV_TX_OK;
1547        }
1548
1549        if (likely(tso))
1550                tx_flags |= IXGB_TX_FLAGS_TSO;
1551        else if (ixgb_tx_csum(adapter, skb))
1552                tx_flags |= IXGB_TX_FLAGS_CSUM;
1553
1554        count = ixgb_tx_map(adapter, skb, first);
1555
1556        if (count) {
1557                ixgb_tx_queue(adapter, count, vlan_id, tx_flags);
1558                /* Make sure there is space in the ring for the next send. */
1559                ixgb_maybe_stop_tx(netdev, &adapter->tx_ring, DESC_NEEDED);
1560
1561        } else {
1562                dev_kfree_skb_any(skb);
1563                adapter->tx_ring.buffer_info[first].time_stamp = 0;
1564                adapter->tx_ring.next_to_use = first;
1565        }
1566
1567        return NETDEV_TX_OK;
1568}
1569
1570/**
1571 * ixgb_tx_timeout - Respond to a Tx Hang
1572 * @netdev: network interface device structure
1573 **/
1574
1575static void
1576ixgb_tx_timeout(struct net_device *netdev)
1577{
1578        struct ixgb_adapter *adapter = netdev_priv(netdev);
1579
1580        /* Do the reset outside of interrupt context */
1581        schedule_work(&adapter->tx_timeout_task);
1582}
1583
1584static void
1585ixgb_tx_timeout_task(struct work_struct *work)
1586{
1587        struct ixgb_adapter *adapter =
1588                container_of(work, struct ixgb_adapter, tx_timeout_task);
1589
1590        adapter->tx_timeout_count++;
1591        ixgb_down(adapter, true);
1592        ixgb_up(adapter);
1593}
1594
1595/**
1596 * ixgb_get_stats - Get System Network Statistics
1597 * @netdev: network interface device structure
1598 *
1599 * Returns the address of the device statistics structure.
1600 * The statistics are actually updated from the timer callback.
1601 **/
1602
1603static struct net_device_stats *
1604ixgb_get_stats(struct net_device *netdev)
1605{
1606        return &netdev->stats;
1607}
1608
1609/**
1610 * ixgb_change_mtu - Change the Maximum Transfer Unit
1611 * @netdev: network interface device structure
1612 * @new_mtu: new value for maximum frame size
1613 *
1614 * Returns 0 on success, negative on failure
1615 **/
1616
1617static int
1618ixgb_change_mtu(struct net_device *netdev, int new_mtu)
1619{
1620        struct ixgb_adapter *adapter = netdev_priv(netdev);
1621        int max_frame = new_mtu + ENET_HEADER_SIZE + ENET_FCS_LENGTH;
1622        int old_max_frame = netdev->mtu + ENET_HEADER_SIZE + ENET_FCS_LENGTH;
1623
1624        /* MTU < 68 is an error for IPv4 traffic, just don't allow it */
1625        if ((new_mtu < 68) ||
1626            (max_frame > IXGB_MAX_JUMBO_FRAME_SIZE + ENET_FCS_LENGTH)) {
1627                netif_err(adapter, probe, adapter->netdev,
1628                          "Invalid MTU setting %d\n", new_mtu);
1629                return -EINVAL;
1630        }
1631
1632        if (old_max_frame == max_frame)
1633                return 0;
1634
1635        if (netif_running(netdev))
1636                ixgb_down(adapter, true);
1637
1638        adapter->rx_buffer_len = max_frame + 8; /* + 8 for errata */
1639
1640        netdev->mtu = new_mtu;
1641
1642        if (netif_running(netdev))
1643                ixgb_up(adapter);
1644
1645        return 0;
1646}
1647
1648/**
1649 * ixgb_update_stats - Update the board statistics counters.
1650 * @adapter: board private structure
1651 **/
1652
1653void
1654ixgb_update_stats(struct ixgb_adapter *adapter)
1655{
1656        struct net_device *netdev = adapter->netdev;
1657        struct pci_dev *pdev = adapter->pdev;
1658
1659        /* Prevent stats update while adapter is being reset */
1660        if (pci_channel_offline(pdev))
1661                return;
1662
1663        if ((netdev->flags & IFF_PROMISC) || (netdev->flags & IFF_ALLMULTI) ||
1664           (netdev_mc_count(netdev) > IXGB_MAX_NUM_MULTICAST_ADDRESSES)) {
1665                u64 multi = IXGB_READ_REG(&adapter->hw, MPRCL);
1666                u32 bcast_l = IXGB_READ_REG(&adapter->hw, BPRCL);
1667                u32 bcast_h = IXGB_READ_REG(&adapter->hw, BPRCH);
1668                u64 bcast = ((u64)bcast_h << 32) | bcast_l;
1669
1670                multi |= ((u64)IXGB_READ_REG(&adapter->hw, MPRCH) << 32);
1671                /* fix up multicast stats by removing broadcasts */
1672                if (multi >= bcast)
1673                        multi -= bcast;
1674
1675                adapter->stats.mprcl += (multi & 0xFFFFFFFF);
1676                adapter->stats.mprch += (multi >> 32);
1677                adapter->stats.bprcl += bcast_l;
1678                adapter->stats.bprch += bcast_h;
1679        } else {
1680                adapter->stats.mprcl += IXGB_READ_REG(&adapter->hw, MPRCL);
1681                adapter->stats.mprch += IXGB_READ_REG(&adapter->hw, MPRCH);
1682                adapter->stats.bprcl += IXGB_READ_REG(&adapter->hw, BPRCL);
1683                adapter->stats.bprch += IXGB_READ_REG(&adapter->hw, BPRCH);
1684        }
1685        adapter->stats.tprl += IXGB_READ_REG(&adapter->hw, TPRL);
1686        adapter->stats.tprh += IXGB_READ_REG(&adapter->hw, TPRH);
1687        adapter->stats.gprcl += IXGB_READ_REG(&adapter->hw, GPRCL);
1688        adapter->stats.gprch += IXGB_READ_REG(&adapter->hw, GPRCH);
1689        adapter->stats.uprcl += IXGB_READ_REG(&adapter->hw, UPRCL);
1690        adapter->stats.uprch += IXGB_READ_REG(&adapter->hw, UPRCH);
1691        adapter->stats.vprcl += IXGB_READ_REG(&adapter->hw, VPRCL);
1692        adapter->stats.vprch += IXGB_READ_REG(&adapter->hw, VPRCH);
1693        adapter->stats.jprcl += IXGB_READ_REG(&adapter->hw, JPRCL);
1694        adapter->stats.jprch += IXGB_READ_REG(&adapter->hw, JPRCH);
1695        adapter->stats.gorcl += IXGB_READ_REG(&adapter->hw, GORCL);
1696        adapter->stats.gorch += IXGB_READ_REG(&adapter->hw, GORCH);
1697        adapter->stats.torl += IXGB_READ_REG(&adapter->hw, TORL);
1698        adapter->stats.torh += IXGB_READ_REG(&adapter->hw, TORH);
1699        adapter->stats.rnbc += IXGB_READ_REG(&adapter->hw, RNBC);
1700        adapter->stats.ruc += IXGB_READ_REG(&adapter->hw, RUC);
1701        adapter->stats.roc += IXGB_READ_REG(&adapter->hw, ROC);
1702        adapter->stats.rlec += IXGB_READ_REG(&adapter->hw, RLEC);
1703        adapter->stats.crcerrs += IXGB_READ_REG(&adapter->hw, CRCERRS);
1704        adapter->stats.icbc += IXGB_READ_REG(&adapter->hw, ICBC);
1705        adapter->stats.ecbc += IXGB_READ_REG(&adapter->hw, ECBC);
1706        adapter->stats.mpc += IXGB_READ_REG(&adapter->hw, MPC);
1707        adapter->stats.tptl += IXGB_READ_REG(&adapter->hw, TPTL);
1708        adapter->stats.tpth += IXGB_READ_REG(&adapter->hw, TPTH);
1709        adapter->stats.gptcl += IXGB_READ_REG(&adapter->hw, GPTCL);
1710        adapter->stats.gptch += IXGB_READ_REG(&adapter->hw, GPTCH);
1711        adapter->stats.bptcl += IXGB_READ_REG(&adapter->hw, BPTCL);
1712        adapter->stats.bptch += IXGB_READ_REG(&adapter->hw, BPTCH);
1713        adapter->stats.mptcl += IXGB_READ_REG(&adapter->hw, MPTCL);
1714        adapter->stats.mptch += IXGB_READ_REG(&adapter->hw, MPTCH);
1715        adapter->stats.uptcl += IXGB_READ_REG(&adapter->hw, UPTCL);
1716        adapter->stats.uptch += IXGB_READ_REG(&adapter->hw, UPTCH);
1717        adapter->stats.vptcl += IXGB_READ_REG(&adapter->hw, VPTCL);
1718        adapter->stats.vptch += IXGB_READ_REG(&adapter->hw, VPTCH);
1719        adapter->stats.jptcl += IXGB_READ_REG(&adapter->hw, JPTCL);
1720        adapter->stats.jptch += IXGB_READ_REG(&adapter->hw, JPTCH);
1721        adapter->stats.gotcl += IXGB_READ_REG(&adapter->hw, GOTCL);
1722        adapter->stats.gotch += IXGB_READ_REG(&adapter->hw, GOTCH);
1723        adapter->stats.totl += IXGB_READ_REG(&adapter->hw, TOTL);
1724        adapter->stats.toth += IXGB_READ_REG(&adapter->hw, TOTH);
1725        adapter->stats.dc += IXGB_READ_REG(&adapter->hw, DC);
1726        adapter->stats.plt64c += IXGB_READ_REG(&adapter->hw, PLT64C);
1727        adapter->stats.tsctc += IXGB_READ_REG(&adapter->hw, TSCTC);
1728        adapter->stats.tsctfc += IXGB_READ_REG(&adapter->hw, TSCTFC);
1729        adapter->stats.ibic += IXGB_READ_REG(&adapter->hw, IBIC);
1730        adapter->stats.rfc += IXGB_READ_REG(&adapter->hw, RFC);
1731        adapter->stats.lfc += IXGB_READ_REG(&adapter->hw, LFC);
1732        adapter->stats.pfrc += IXGB_READ_REG(&adapter->hw, PFRC);
1733        adapter->stats.pftc += IXGB_READ_REG(&adapter->hw, PFTC);
1734        adapter->stats.mcfrc += IXGB_READ_REG(&adapter->hw, MCFRC);
1735        adapter->stats.mcftc += IXGB_READ_REG(&adapter->hw, MCFTC);
1736        adapter->stats.xonrxc += IXGB_READ_REG(&adapter->hw, XONRXC);
1737        adapter->stats.xontxc += IXGB_READ_REG(&adapter->hw, XONTXC);
1738        adapter->stats.xoffrxc += IXGB_READ_REG(&adapter->hw, XOFFRXC);
1739        adapter->stats.xofftxc += IXGB_READ_REG(&adapter->hw, XOFFTXC);
1740        adapter->stats.rjc += IXGB_READ_REG(&adapter->hw, RJC);
1741
1742        /* Fill out the OS statistics structure */
1743
1744        netdev->stats.rx_packets = adapter->stats.gprcl;
1745        netdev->stats.tx_packets = adapter->stats.gptcl;
1746        netdev->stats.rx_bytes = adapter->stats.gorcl;
1747        netdev->stats.tx_bytes = adapter->stats.gotcl;
1748        netdev->stats.multicast = adapter->stats.mprcl;
1749        netdev->stats.collisions = 0;
1750
1751        /* ignore RLEC as it reports errors for padded (<64bytes) frames
1752         * with a length in the type/len field */
1753        netdev->stats.rx_errors =
1754            /* adapter->stats.rnbc + */ adapter->stats.crcerrs +
1755            adapter->stats.ruc +
1756            adapter->stats.roc /*+ adapter->stats.rlec */  +
1757            adapter->stats.icbc +
1758            adapter->stats.ecbc + adapter->stats.mpc;
1759
1760        /* see above
1761         * netdev->stats.rx_length_errors = adapter->stats.rlec;
1762         */
1763
1764        netdev->stats.rx_crc_errors = adapter->stats.crcerrs;
1765        netdev->stats.rx_fifo_errors = adapter->stats.mpc;
1766        netdev->stats.rx_missed_errors = adapter->stats.mpc;
1767        netdev->stats.rx_over_errors = adapter->stats.mpc;
1768
1769        netdev->stats.tx_errors = 0;
1770        netdev->stats.rx_frame_errors = 0;
1771        netdev->stats.tx_aborted_errors = 0;
1772        netdev->stats.tx_carrier_errors = 0;
1773        netdev->stats.tx_fifo_errors = 0;
1774        netdev->stats.tx_heartbeat_errors = 0;
1775        netdev->stats.tx_window_errors = 0;
1776}
1777
1778#define IXGB_MAX_INTR 10
1779/**
1780 * ixgb_intr - Interrupt Handler
1781 * @irq: interrupt number
1782 * @data: pointer to a network interface device structure
1783 **/
1784
1785static irqreturn_t
1786ixgb_intr(int irq, void *data)
1787{
1788        struct net_device *netdev = data;
1789        struct ixgb_adapter *adapter = netdev_priv(netdev);
1790        struct ixgb_hw *hw = &adapter->hw;
1791        u32 icr = IXGB_READ_REG(hw, ICR);
1792
1793        if (unlikely(!icr))
1794                return IRQ_NONE;  /* Not our interrupt */
1795
1796        if (unlikely(icr & (IXGB_INT_RXSEQ | IXGB_INT_LSC)))
1797                if (!test_bit(__IXGB_DOWN, &adapter->flags))
1798                        mod_timer(&adapter->watchdog_timer, jiffies);
1799
1800        if (napi_schedule_prep(&adapter->napi)) {
1801
1802                /* Disable interrupts and register for poll. The flush
1803                  of the posted write is intentionally left out.
1804                */
1805
1806                IXGB_WRITE_REG(&adapter->hw, IMC, ~0);
1807                __napi_schedule(&adapter->napi);
1808        }
1809        return IRQ_HANDLED;
1810}
1811
1812/**
1813 * ixgb_clean - NAPI Rx polling callback
1814 * @adapter: board private structure
1815 **/
1816
1817static int
1818ixgb_clean(struct napi_struct *napi, int budget)
1819{
1820        struct ixgb_adapter *adapter = container_of(napi, struct ixgb_adapter, napi);
1821        int work_done = 0;
1822
1823        ixgb_clean_tx_irq(adapter);
1824        ixgb_clean_rx_irq(adapter, &work_done, budget);
1825
1826        /* If budget not fully consumed, exit the polling mode */
1827        if (work_done < budget) {
1828                napi_complete(napi);
1829                if (!test_bit(__IXGB_DOWN, &adapter->flags))
1830                        ixgb_irq_enable(adapter);
1831        }
1832
1833        return work_done;
1834}
1835
1836/**
1837 * ixgb_clean_tx_irq - Reclaim resources after transmit completes
1838 * @adapter: board private structure
1839 **/
1840
1841static bool
1842ixgb_clean_tx_irq(struct ixgb_adapter *adapter)
1843{
1844        struct ixgb_desc_ring *tx_ring = &adapter->tx_ring;
1845        struct net_device *netdev = adapter->netdev;
1846        struct ixgb_tx_desc *tx_desc, *eop_desc;
1847        struct ixgb_buffer *buffer_info;
1848        unsigned int i, eop;
1849        bool cleaned = false;
1850
1851        i = tx_ring->next_to_clean;
1852        eop = tx_ring->buffer_info[i].next_to_watch;
1853        eop_desc = IXGB_TX_DESC(*tx_ring, eop);
1854
1855        while (eop_desc->status & IXGB_TX_DESC_STATUS_DD) {
1856
1857                rmb(); /* read buffer_info after eop_desc */
1858                for (cleaned = false; !cleaned; ) {
1859                        tx_desc = IXGB_TX_DESC(*tx_ring, i);
1860                        buffer_info = &tx_ring->buffer_info[i];
1861
1862                        if (tx_desc->popts &
1863                           (IXGB_TX_DESC_POPTS_TXSM |
1864                            IXGB_TX_DESC_POPTS_IXSM))
1865                                adapter->hw_csum_tx_good++;
1866
1867                        ixgb_unmap_and_free_tx_resource(adapter, buffer_info);
1868
1869                        *(u32 *)&(tx_desc->status) = 0;
1870
1871                        cleaned = (i == eop);
1872                        if (++i == tx_ring->count) i = 0;
1873                }
1874
1875                eop = tx_ring->buffer_info[i].next_to_watch;
1876                eop_desc = IXGB_TX_DESC(*tx_ring, eop);
1877        }
1878
1879        tx_ring->next_to_clean = i;
1880
1881        if (unlikely(cleaned && netif_carrier_ok(netdev) &&
1882                     IXGB_DESC_UNUSED(tx_ring) >= DESC_NEEDED)) {
1883                /* Make sure that anybody stopping the queue after this
1884                 * sees the new next_to_clean. */
1885                smp_mb();
1886
1887                if (netif_queue_stopped(netdev) &&
1888                    !(test_bit(__IXGB_DOWN, &adapter->flags))) {
1889                        netif_wake_queue(netdev);
1890                        ++adapter->restart_queue;
1891                }
1892        }
1893
1894        if (adapter->detect_tx_hung) {
1895                /* detect a transmit hang in hardware, this serializes the
1896                 * check with the clearing of time_stamp and movement of i */
1897                adapter->detect_tx_hung = false;
1898                if (tx_ring->buffer_info[eop].time_stamp &&
1899                   time_after(jiffies, tx_ring->buffer_info[eop].time_stamp + HZ)
1900                   && !(IXGB_READ_REG(&adapter->hw, STATUS) &
1901                        IXGB_STATUS_TXOFF)) {
1902                        /* detected Tx unit hang */
1903                        netif_err(adapter, drv, adapter->netdev,
1904                                  "Detected Tx Unit Hang\n"
1905                                  "  TDH                  <%x>\n"
1906                                  "  TDT                  <%x>\n"
1907                                  "  next_to_use          <%x>\n"
1908                                  "  next_to_clean        <%x>\n"
1909                                  "buffer_info[next_to_clean]\n"
1910                                  "  time_stamp           <%lx>\n"
1911                                  "  next_to_watch        <%x>\n"
1912                                  "  jiffies              <%lx>\n"
1913                                  "  next_to_watch.status <%x>\n",
1914                                  IXGB_READ_REG(&adapter->hw, TDH),
1915                                  IXGB_READ_REG(&adapter->hw, TDT),
1916                                  tx_ring->next_to_use,
1917                                  tx_ring->next_to_clean,
1918                                  tx_ring->buffer_info[eop].time_stamp,
1919                                  eop,
1920                                  jiffies,
1921                                  eop_desc->status);
1922                        netif_stop_queue(netdev);
1923                }
1924        }
1925
1926        return cleaned;
1927}
1928
1929/**
1930 * ixgb_rx_checksum - Receive Checksum Offload for 82597.
1931 * @adapter: board private structure
1932 * @rx_desc: receive descriptor
1933 * @sk_buff: socket buffer with received data
1934 **/
1935
1936static void
1937ixgb_rx_checksum(struct ixgb_adapter *adapter,
1938                 struct ixgb_rx_desc *rx_desc,
1939                 struct sk_buff *skb)
1940{
1941        /* Ignore Checksum bit is set OR
1942         * TCP Checksum has not been calculated
1943         */
1944        if ((rx_desc->status & IXGB_RX_DESC_STATUS_IXSM) ||
1945           (!(rx_desc->status & IXGB_RX_DESC_STATUS_TCPCS))) {
1946                skb_checksum_none_assert(skb);
1947                return;
1948        }
1949
1950        /* At this point we know the hardware did the TCP checksum */
1951        /* now look at the TCP checksum error bit */
1952        if (rx_desc->errors & IXGB_RX_DESC_ERRORS_TCPE) {
1953                /* let the stack verify checksum errors */
1954                skb_checksum_none_assert(skb);
1955                adapter->hw_csum_rx_error++;
1956        } else {
1957                /* TCP checksum is good */
1958                skb->ip_summed = CHECKSUM_UNNECESSARY;
1959                adapter->hw_csum_rx_good++;
1960        }
1961}
1962
1963/*
1964 * this should improve performance for small packets with large amounts
1965 * of reassembly being done in the stack
1966 */
1967static void ixgb_check_copybreak(struct napi_struct *napi,
1968                                 struct ixgb_buffer *buffer_info,
1969                                 u32 length, struct sk_buff **skb)
1970{
1971        struct sk_buff *new_skb;
1972
1973        if (length > copybreak)
1974                return;
1975
1976        new_skb = napi_alloc_skb(napi, length);
1977        if (!new_skb)
1978                return;
1979
1980        skb_copy_to_linear_data_offset(new_skb, -NET_IP_ALIGN,
1981                                       (*skb)->data - NET_IP_ALIGN,
1982                                       length + NET_IP_ALIGN);
1983        /* save the skb in buffer_info as good */
1984        buffer_info->skb = *skb;
1985        *skb = new_skb;
1986}
1987
1988/**
1989 * ixgb_clean_rx_irq - Send received data up the network stack,
1990 * @adapter: board private structure
1991 **/
1992
1993static bool
1994ixgb_clean_rx_irq(struct ixgb_adapter *adapter, int *work_done, int work_to_do)
1995{
1996        struct ixgb_desc_ring *rx_ring = &adapter->rx_ring;
1997        struct net_device *netdev = adapter->netdev;
1998        struct pci_dev *pdev = adapter->pdev;
1999        struct ixgb_rx_desc *rx_desc, *next_rxd;
2000        struct ixgb_buffer *buffer_info, *next_buffer, *next2_buffer;
2001        u32 length;
2002        unsigned int i, j;
2003        int cleaned_count = 0;
2004        bool cleaned = false;
2005
2006        i = rx_ring->next_to_clean;
2007        rx_desc = IXGB_RX_DESC(*rx_ring, i);
2008        buffer_info = &rx_ring->buffer_info[i];
2009
2010        while (rx_desc->status & IXGB_RX_DESC_STATUS_DD) {
2011                struct sk_buff *skb;
2012                u8 status;
2013
2014                if (*work_done >= work_to_do)
2015                        break;
2016
2017                (*work_done)++;
2018                rmb();  /* read descriptor and rx_buffer_info after status DD */
2019                status = rx_desc->status;
2020                skb = buffer_info->skb;
2021                buffer_info->skb = NULL;
2022
2023                prefetch(skb->data - NET_IP_ALIGN);
2024
2025                if (++i == rx_ring->count)
2026                        i = 0;
2027                next_rxd = IXGB_RX_DESC(*rx_ring, i);
2028                prefetch(next_rxd);
2029
2030                j = i + 1;
2031                if (j == rx_ring->count)
2032                        j = 0;
2033                next2_buffer = &rx_ring->buffer_info[j];
2034                prefetch(next2_buffer);
2035
2036                next_buffer = &rx_ring->buffer_info[i];
2037
2038                cleaned = true;
2039                cleaned_count++;
2040
2041                dma_unmap_single(&pdev->dev,
2042                                 buffer_info->dma,
2043                                 buffer_info->length,
2044                                 DMA_FROM_DEVICE);
2045                buffer_info->dma = 0;
2046
2047                length = le16_to_cpu(rx_desc->length);
2048                rx_desc->length = 0;
2049
2050                if (unlikely(!(status & IXGB_RX_DESC_STATUS_EOP))) {
2051
2052                        /* All receives must fit into a single buffer */
2053
2054                        pr_debug("Receive packet consumed multiple buffers length<%x>\n",
2055                                 length);
2056
2057                        dev_kfree_skb_irq(skb);
2058                        goto rxdesc_done;
2059                }
2060
2061                if (unlikely(rx_desc->errors &
2062                    (IXGB_RX_DESC_ERRORS_CE | IXGB_RX_DESC_ERRORS_SE |
2063                     IXGB_RX_DESC_ERRORS_P | IXGB_RX_DESC_ERRORS_RXE))) {
2064                        dev_kfree_skb_irq(skb);
2065                        goto rxdesc_done;
2066                }
2067
2068                ixgb_check_copybreak(&adapter->napi, buffer_info, length, &skb);
2069
2070                /* Good Receive */
2071                skb_put(skb, length);
2072
2073                /* Receive Checksum Offload */
2074                ixgb_rx_checksum(adapter, rx_desc, skb);
2075
2076                skb->protocol = eth_type_trans(skb, netdev);
2077                if (status & IXGB_RX_DESC_STATUS_VP)
2078                        __vlan_hwaccel_put_tag(skb, htons(ETH_P_8021Q),
2079                                       le16_to_cpu(rx_desc->special));
2080
2081                netif_receive_skb(skb);
2082
2083rxdesc_done:
2084                /* clean up descriptor, might be written over by hw */
2085                rx_desc->status = 0;
2086
2087                /* return some buffers to hardware, one at a time is too slow */
2088                if (unlikely(cleaned_count >= IXGB_RX_BUFFER_WRITE)) {
2089                        ixgb_alloc_rx_buffers(adapter, cleaned_count);
2090                        cleaned_count = 0;
2091                }
2092
2093                /* use prefetched values */
2094                rx_desc = next_rxd;
2095                buffer_info = next_buffer;
2096        }
2097
2098        rx_ring->next_to_clean = i;
2099
2100        cleaned_count = IXGB_DESC_UNUSED(rx_ring);
2101        if (cleaned_count)
2102                ixgb_alloc_rx_buffers(adapter, cleaned_count);
2103
2104        return cleaned;
2105}
2106
2107/**
2108 * ixgb_alloc_rx_buffers - Replace used receive buffers
2109 * @adapter: address of board private structure
2110 **/
2111
2112static void
2113ixgb_alloc_rx_buffers(struct ixgb_adapter *adapter, int cleaned_count)
2114{
2115        struct ixgb_desc_ring *rx_ring = &adapter->rx_ring;
2116        struct net_device *netdev = adapter->netdev;
2117        struct pci_dev *pdev = adapter->pdev;
2118        struct ixgb_rx_desc *rx_desc;
2119        struct ixgb_buffer *buffer_info;
2120        struct sk_buff *skb;
2121        unsigned int i;
2122        long cleancount;
2123
2124        i = rx_ring->next_to_use;
2125        buffer_info = &rx_ring->buffer_info[i];
2126        cleancount = IXGB_DESC_UNUSED(rx_ring);
2127
2128
2129        /* leave three descriptors unused */
2130        while (--cleancount > 2 && cleaned_count--) {
2131                /* recycle! its good for you */
2132                skb = buffer_info->skb;
2133                if (skb) {
2134                        skb_trim(skb, 0);
2135                        goto map_skb;
2136                }
2137
2138                skb = netdev_alloc_skb_ip_align(netdev, adapter->rx_buffer_len);
2139                if (unlikely(!skb)) {
2140                        /* Better luck next round */
2141                        adapter->alloc_rx_buff_failed++;
2142                        break;
2143                }
2144
2145                buffer_info->skb = skb;
2146                buffer_info->length = adapter->rx_buffer_len;
2147map_skb:
2148                buffer_info->dma = dma_map_single(&pdev->dev,
2149                                                  skb->data,
2150                                                  adapter->rx_buffer_len,
2151                                                  DMA_FROM_DEVICE);
2152                if (dma_mapping_error(&pdev->dev, buffer_info->dma)) {
2153                        adapter->alloc_rx_buff_failed++;
2154                        break;
2155                }
2156
2157                rx_desc = IXGB_RX_DESC(*rx_ring, i);
2158                rx_desc->buff_addr = cpu_to_le64(buffer_info->dma);
2159                /* guarantee DD bit not set now before h/w gets descriptor
2160                 * this is the rest of the workaround for h/w double
2161                 * writeback. */
2162                rx_desc->status = 0;
2163
2164
2165                if (++i == rx_ring->count)
2166                        i = 0;
2167                buffer_info = &rx_ring->buffer_info[i];
2168        }
2169
2170        if (likely(rx_ring->next_to_use != i)) {
2171                rx_ring->next_to_use = i;
2172                if (unlikely(i-- == 0))
2173                        i = (rx_ring->count - 1);
2174
2175                /* Force memory writes to complete before letting h/w
2176                 * know there are new descriptors to fetch.  (Only
2177                 * applicable for weak-ordered memory model archs, such
2178                 * as IA-64). */
2179                wmb();
2180                IXGB_WRITE_REG(&adapter->hw, RDT, i);
2181        }
2182}
2183
2184static void
2185ixgb_vlan_strip_enable(struct ixgb_adapter *adapter)
2186{
2187        u32 ctrl;
2188
2189        /* enable VLAN tag insert/strip */
2190        ctrl = IXGB_READ_REG(&adapter->hw, CTRL0);
2191        ctrl |= IXGB_CTRL0_VME;
2192        IXGB_WRITE_REG(&adapter->hw, CTRL0, ctrl);
2193}
2194
2195static void
2196ixgb_vlan_strip_disable(struct ixgb_adapter *adapter)
2197{
2198        u32 ctrl;
2199
2200        /* disable VLAN tag insert/strip */
2201        ctrl = IXGB_READ_REG(&adapter->hw, CTRL0);
2202        ctrl &= ~IXGB_CTRL0_VME;
2203        IXGB_WRITE_REG(&adapter->hw, CTRL0, ctrl);
2204}
2205
2206static int
2207ixgb_vlan_rx_add_vid(struct net_device *netdev, __be16 proto, u16 vid)
2208{
2209        struct ixgb_adapter *adapter = netdev_priv(netdev);
2210        u32 vfta, index;
2211
2212        /* add VID to filter table */
2213
2214        index = (vid >> 5) & 0x7F;
2215        vfta = IXGB_READ_REG_ARRAY(&adapter->hw, VFTA, index);
2216        vfta |= (1 << (vid & 0x1F));
2217        ixgb_write_vfta(&adapter->hw, index, vfta);
2218        set_bit(vid, adapter->active_vlans);
2219
2220        return 0;
2221}
2222
2223static int
2224ixgb_vlan_rx_kill_vid(struct net_device *netdev, __be16 proto, u16 vid)
2225{
2226        struct ixgb_adapter *adapter = netdev_priv(netdev);
2227        u32 vfta, index;
2228
2229        /* remove VID from filter table */
2230
2231        index = (vid >> 5) & 0x7F;
2232        vfta = IXGB_READ_REG_ARRAY(&adapter->hw, VFTA, index);
2233        vfta &= ~(1 << (vid & 0x1F));
2234        ixgb_write_vfta(&adapter->hw, index, vfta);
2235        clear_bit(vid, adapter->active_vlans);
2236
2237        return 0;
2238}
2239
2240static void
2241ixgb_restore_vlan(struct ixgb_adapter *adapter)
2242{
2243        u16 vid;
2244
2245        for_each_set_bit(vid, adapter->active_vlans, VLAN_N_VID)
2246                ixgb_vlan_rx_add_vid(adapter->netdev, htons(ETH_P_8021Q), vid);
2247}
2248
2249#ifdef CONFIG_NET_POLL_CONTROLLER
2250/*
2251 * Polling 'interrupt' - used by things like netconsole to send skbs
2252 * without having to re-enable interrupts. It's not called while
2253 * the interrupt routine is executing.
2254 */
2255
2256static void ixgb_netpoll(struct net_device *dev)
2257{
2258        struct ixgb_adapter *adapter = netdev_priv(dev);
2259
2260        disable_irq(adapter->pdev->irq);
2261        ixgb_intr(adapter->pdev->irq, dev);
2262        enable_irq(adapter->pdev->irq);
2263}
2264#endif
2265
2266/**
2267 * ixgb_io_error_detected - called when PCI error is detected
2268 * @pdev:    pointer to pci device with error
2269 * @state:   pci channel state after error
2270 *
2271 * This callback is called by the PCI subsystem whenever
2272 * a PCI bus error is detected.
2273 */
2274static pci_ers_result_t ixgb_io_error_detected(struct pci_dev *pdev,
2275                                               enum pci_channel_state state)
2276{
2277        struct net_device *netdev = pci_get_drvdata(pdev);
2278        struct ixgb_adapter *adapter = netdev_priv(netdev);
2279
2280        netif_device_detach(netdev);
2281
2282        if (state == pci_channel_io_perm_failure)
2283                return PCI_ERS_RESULT_DISCONNECT;
2284
2285        if (netif_running(netdev))
2286                ixgb_down(adapter, true);
2287
2288        pci_disable_device(pdev);
2289
2290        /* Request a slot reset. */
2291        return PCI_ERS_RESULT_NEED_RESET;
2292}
2293
2294/**
2295 * ixgb_io_slot_reset - called after the pci bus has been reset.
2296 * @pdev    pointer to pci device with error
2297 *
2298 * This callback is called after the PCI bus has been reset.
2299 * Basically, this tries to restart the card from scratch.
2300 * This is a shortened version of the device probe/discovery code,
2301 * it resembles the first-half of the ixgb_probe() routine.
2302 */
2303static pci_ers_result_t ixgb_io_slot_reset(struct pci_dev *pdev)
2304{
2305        struct net_device *netdev = pci_get_drvdata(pdev);
2306        struct ixgb_adapter *adapter = netdev_priv(netdev);
2307
2308        if (pci_enable_device(pdev)) {
2309                netif_err(adapter, probe, adapter->netdev,
2310                          "Cannot re-enable PCI device after reset\n");
2311                return PCI_ERS_RESULT_DISCONNECT;
2312        }
2313
2314        /* Perform card reset only on one instance of the card */
2315        if (0 != PCI_FUNC (pdev->devfn))
2316                return PCI_ERS_RESULT_RECOVERED;
2317
2318        pci_set_master(pdev);
2319
2320        netif_carrier_off(netdev);
2321        netif_stop_queue(netdev);
2322        ixgb_reset(adapter);
2323
2324        /* Make sure the EEPROM is good */
2325        if (!ixgb_validate_eeprom_checksum(&adapter->hw)) {
2326                netif_err(adapter, probe, adapter->netdev,
2327                          "After reset, the EEPROM checksum is not valid\n");
2328                return PCI_ERS_RESULT_DISCONNECT;
2329        }
2330        ixgb_get_ee_mac_addr(&adapter->hw, netdev->dev_addr);
2331        memcpy(netdev->perm_addr, netdev->dev_addr, netdev->addr_len);
2332
2333        if (!is_valid_ether_addr(netdev->perm_addr)) {
2334                netif_err(adapter, probe, adapter->netdev,
2335                          "After reset, invalid MAC address\n");
2336                return PCI_ERS_RESULT_DISCONNECT;
2337        }
2338
2339        return PCI_ERS_RESULT_RECOVERED;
2340}
2341
2342/**
2343 * ixgb_io_resume - called when its OK to resume normal operations
2344 * @pdev    pointer to pci device with error
2345 *
2346 * The error recovery driver tells us that its OK to resume
2347 * normal operation. Implementation resembles the second-half
2348 * of the ixgb_probe() routine.
2349 */
2350static void ixgb_io_resume(struct pci_dev *pdev)
2351{
2352        struct net_device *netdev = pci_get_drvdata(pdev);
2353        struct ixgb_adapter *adapter = netdev_priv(netdev);
2354
2355        pci_set_master(pdev);
2356
2357        if (netif_running(netdev)) {
2358                if (ixgb_up(adapter)) {
2359                        pr_err("can't bring device back up after reset\n");
2360                        return;
2361                }
2362        }
2363
2364        netif_device_attach(netdev);
2365        mod_timer(&adapter->watchdog_timer, jiffies);
2366}
2367
2368/* ixgb_main.c */
2369