ixgb: remove open-coded skb_cow_head
[linux.git] / drivers / net / ethernet / intel / ixgb / ixgb_main.c
1 /*******************************************************************************
2
3   Intel PRO/10GbE Linux driver
4   Copyright(c) 1999 - 2008 Intel Corporation.
5
6   This program is free software; you can redistribute it and/or modify it
7   under the terms and conditions of the GNU General Public License,
8   version 2, as published by the Free Software Foundation.
9
10   This program is distributed in the hope it will be useful, but WITHOUT
11   ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
12   FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
13   more details.
14
15   You should have received a copy of the GNU General Public License along with
16   this program; if not, write to the Free Software Foundation, Inc.,
17   51 Franklin St - Fifth Floor, Boston, MA 02110-1301 USA.
18
19   The full GNU General Public License is included in this distribution in
20   the file called "COPYING".
21
22   Contact Information:
23   Linux NICS <linux.nics@intel.com>
24   e1000-devel Mailing List <e1000-devel@lists.sourceforge.net>
25   Intel Corporation, 5200 N.E. Elam Young Parkway, Hillsboro, OR 97124-6497
26
27 *******************************************************************************/
28
29 #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
30
31 #include <linux/prefetch.h>
32 #include "ixgb.h"
33
34 char ixgb_driver_name[] = "ixgb";
35 static char ixgb_driver_string[] = "Intel(R) PRO/10GbE Network Driver";
36
37 #define DRIVERNAPI "-NAPI"
38 #define DRV_VERSION "1.0.135-k2" DRIVERNAPI
39 const char ixgb_driver_version[] = DRV_VERSION;
40 static const char ixgb_copyright[] = "Copyright (c) 1999-2008 Intel Corporation.";
41
42 #define IXGB_CB_LENGTH 256
43 static unsigned int copybreak __read_mostly = IXGB_CB_LENGTH;
44 module_param(copybreak, uint, 0644);
45 MODULE_PARM_DESC(copybreak,
46         "Maximum size of packet that is copied to a new buffer on receive");
47
48 /* ixgb_pci_tbl - PCI Device ID Table
49  *
50  * Wildcard entries (PCI_ANY_ID) should come last
51  * Last entry must be all 0s
52  *
53  * { Vendor ID, Device ID, SubVendor ID, SubDevice ID,
54  *   Class, Class Mask, private data (not used) }
55  */
56 static DEFINE_PCI_DEVICE_TABLE(ixgb_pci_tbl) = {
57         {PCI_VENDOR_ID_INTEL, IXGB_DEVICE_ID_82597EX,
58          PCI_ANY_ID, PCI_ANY_ID, 0, 0, 0},
59         {PCI_VENDOR_ID_INTEL, IXGB_DEVICE_ID_82597EX_CX4,
60          PCI_ANY_ID, PCI_ANY_ID, 0, 0, 0},
61         {PCI_VENDOR_ID_INTEL, IXGB_DEVICE_ID_82597EX_SR,
62          PCI_ANY_ID, PCI_ANY_ID, 0, 0, 0},
63         {PCI_VENDOR_ID_INTEL, IXGB_DEVICE_ID_82597EX_LR,
64          PCI_ANY_ID, PCI_ANY_ID, 0, 0, 0},
65
66         /* required last entry */
67         {0,}
68 };
69
70 MODULE_DEVICE_TABLE(pci, ixgb_pci_tbl);
71
72 /* Local Function Prototypes */
73 static int ixgb_init_module(void);
74 static void ixgb_exit_module(void);
75 static int ixgb_probe(struct pci_dev *pdev, const struct pci_device_id *ent);
76 static void ixgb_remove(struct pci_dev *pdev);
77 static int ixgb_sw_init(struct ixgb_adapter *adapter);
78 static int ixgb_open(struct net_device *netdev);
79 static int ixgb_close(struct net_device *netdev);
80 static void ixgb_configure_tx(struct ixgb_adapter *adapter);
81 static void ixgb_configure_rx(struct ixgb_adapter *adapter);
82 static void ixgb_setup_rctl(struct ixgb_adapter *adapter);
83 static void ixgb_clean_tx_ring(struct ixgb_adapter *adapter);
84 static void ixgb_clean_rx_ring(struct ixgb_adapter *adapter);
85 static void ixgb_set_multi(struct net_device *netdev);
86 static void ixgb_watchdog(unsigned long data);
87 static netdev_tx_t ixgb_xmit_frame(struct sk_buff *skb,
88                                    struct net_device *netdev);
89 static struct net_device_stats *ixgb_get_stats(struct net_device *netdev);
90 static int ixgb_change_mtu(struct net_device *netdev, int new_mtu);
91 static int ixgb_set_mac(struct net_device *netdev, void *p);
92 static irqreturn_t ixgb_intr(int irq, void *data);
93 static bool ixgb_clean_tx_irq(struct ixgb_adapter *adapter);
94
95 static int ixgb_clean(struct napi_struct *, int);
96 static bool ixgb_clean_rx_irq(struct ixgb_adapter *, int *, int);
97 static void ixgb_alloc_rx_buffers(struct ixgb_adapter *, int);
98
99 static void ixgb_tx_timeout(struct net_device *dev);
100 static void ixgb_tx_timeout_task(struct work_struct *work);
101
102 static void ixgb_vlan_strip_enable(struct ixgb_adapter *adapter);
103 static void ixgb_vlan_strip_disable(struct ixgb_adapter *adapter);
104 static int ixgb_vlan_rx_add_vid(struct net_device *netdev,
105                                 __be16 proto, u16 vid);
106 static int ixgb_vlan_rx_kill_vid(struct net_device *netdev,
107                                  __be16 proto, u16 vid);
108 static void ixgb_restore_vlan(struct ixgb_adapter *adapter);
109
110 #ifdef CONFIG_NET_POLL_CONTROLLER
111 /* for netdump / net console */
112 static void ixgb_netpoll(struct net_device *dev);
113 #endif
114
115 static pci_ers_result_t ixgb_io_error_detected (struct pci_dev *pdev,
116                              enum pci_channel_state state);
117 static pci_ers_result_t ixgb_io_slot_reset (struct pci_dev *pdev);
118 static void ixgb_io_resume (struct pci_dev *pdev);
119
120 static const struct pci_error_handlers ixgb_err_handler = {
121         .error_detected = ixgb_io_error_detected,
122         .slot_reset = ixgb_io_slot_reset,
123         .resume = ixgb_io_resume,
124 };
125
126 static struct pci_driver ixgb_driver = {
127         .name     = ixgb_driver_name,
128         .id_table = ixgb_pci_tbl,
129         .probe    = ixgb_probe,
130         .remove   = ixgb_remove,
131         .err_handler = &ixgb_err_handler
132 };
133
134 MODULE_AUTHOR("Intel Corporation, <linux.nics@intel.com>");
135 MODULE_DESCRIPTION("Intel(R) PRO/10GbE Network Driver");
136 MODULE_LICENSE("GPL");
137 MODULE_VERSION(DRV_VERSION);
138
139 #define DEFAULT_MSG_ENABLE (NETIF_MSG_DRV|NETIF_MSG_PROBE|NETIF_MSG_LINK)
140 static int debug = -1;
141 module_param(debug, int, 0);
142 MODULE_PARM_DESC(debug, "Debug level (0=none,...,16=all)");
143
144 /**
145  * ixgb_init_module - Driver Registration Routine
146  *
147  * ixgb_init_module is the first routine called when the driver is
148  * loaded. All it does is register with the PCI subsystem.
149  **/
150
151 static int __init
152 ixgb_init_module(void)
153 {
154         pr_info("%s - version %s\n", ixgb_driver_string, ixgb_driver_version);
155         pr_info("%s\n", ixgb_copyright);
156
157         return pci_register_driver(&ixgb_driver);
158 }
159
160 module_init(ixgb_init_module);
161
162 /**
163  * ixgb_exit_module - Driver Exit Cleanup Routine
164  *
165  * ixgb_exit_module is called just before the driver is removed
166  * from memory.
167  **/
168
169 static void __exit
170 ixgb_exit_module(void)
171 {
172         pci_unregister_driver(&ixgb_driver);
173 }
174
175 module_exit(ixgb_exit_module);
176
177 /**
178  * ixgb_irq_disable - Mask off interrupt generation on the NIC
179  * @adapter: board private structure
180  **/
181
182 static void
183 ixgb_irq_disable(struct ixgb_adapter *adapter)
184 {
185         IXGB_WRITE_REG(&adapter->hw, IMC, ~0);
186         IXGB_WRITE_FLUSH(&adapter->hw);
187         synchronize_irq(adapter->pdev->irq);
188 }
189
190 /**
191  * ixgb_irq_enable - Enable default interrupt generation settings
192  * @adapter: board private structure
193  **/
194
195 static void
196 ixgb_irq_enable(struct ixgb_adapter *adapter)
197 {
198         u32 val = IXGB_INT_RXT0 | IXGB_INT_RXDMT0 |
199                   IXGB_INT_TXDW | IXGB_INT_LSC;
200         if (adapter->hw.subsystem_vendor_id == PCI_VENDOR_ID_SUN)
201                 val |= IXGB_INT_GPI0;
202         IXGB_WRITE_REG(&adapter->hw, IMS, val);
203         IXGB_WRITE_FLUSH(&adapter->hw);
204 }
205
206 int
207 ixgb_up(struct ixgb_adapter *adapter)
208 {
209         struct net_device *netdev = adapter->netdev;
210         int err, irq_flags = IRQF_SHARED;
211         int max_frame = netdev->mtu + ENET_HEADER_SIZE + ENET_FCS_LENGTH;
212         struct ixgb_hw *hw = &adapter->hw;
213
214         /* hardware has been reset, we need to reload some things */
215
216         ixgb_rar_set(hw, netdev->dev_addr, 0);
217         ixgb_set_multi(netdev);
218
219         ixgb_restore_vlan(adapter);
220
221         ixgb_configure_tx(adapter);
222         ixgb_setup_rctl(adapter);
223         ixgb_configure_rx(adapter);
224         ixgb_alloc_rx_buffers(adapter, IXGB_DESC_UNUSED(&adapter->rx_ring));
225
226         /* disable interrupts and get the hardware into a known state */
227         IXGB_WRITE_REG(&adapter->hw, IMC, 0xffffffff);
228
229         /* only enable MSI if bus is in PCI-X mode */
230         if (IXGB_READ_REG(&adapter->hw, STATUS) & IXGB_STATUS_PCIX_MODE) {
231                 err = pci_enable_msi(adapter->pdev);
232                 if (!err) {
233                         adapter->have_msi = true;
234                         irq_flags = 0;
235                 }
236                 /* proceed to try to request regular interrupt */
237         }
238
239         err = request_irq(adapter->pdev->irq, ixgb_intr, irq_flags,
240                           netdev->name, netdev);
241         if (err) {
242                 if (adapter->have_msi)
243                         pci_disable_msi(adapter->pdev);
244                 netif_err(adapter, probe, adapter->netdev,
245                           "Unable to allocate interrupt Error: %d\n", err);
246                 return err;
247         }
248
249         if ((hw->max_frame_size != max_frame) ||
250                 (hw->max_frame_size !=
251                 (IXGB_READ_REG(hw, MFS) >> IXGB_MFS_SHIFT))) {
252
253                 hw->max_frame_size = max_frame;
254
255                 IXGB_WRITE_REG(hw, MFS, hw->max_frame_size << IXGB_MFS_SHIFT);
256
257                 if (hw->max_frame_size >
258                    IXGB_MAX_ENET_FRAME_SIZE_WITHOUT_FCS + ENET_FCS_LENGTH) {
259                         u32 ctrl0 = IXGB_READ_REG(hw, CTRL0);
260
261                         if (!(ctrl0 & IXGB_CTRL0_JFE)) {
262                                 ctrl0 |= IXGB_CTRL0_JFE;
263                                 IXGB_WRITE_REG(hw, CTRL0, ctrl0);
264                         }
265                 }
266         }
267
268         clear_bit(__IXGB_DOWN, &adapter->flags);
269
270         napi_enable(&adapter->napi);
271         ixgb_irq_enable(adapter);
272
273         netif_wake_queue(netdev);
274
275         mod_timer(&adapter->watchdog_timer, jiffies);
276
277         return 0;
278 }
279
280 void
281 ixgb_down(struct ixgb_adapter *adapter, bool kill_watchdog)
282 {
283         struct net_device *netdev = adapter->netdev;
284
285         /* prevent the interrupt handler from restarting watchdog */
286         set_bit(__IXGB_DOWN, &adapter->flags);
287
288         napi_disable(&adapter->napi);
289         /* waiting for NAPI to complete can re-enable interrupts */
290         ixgb_irq_disable(adapter);
291         free_irq(adapter->pdev->irq, netdev);
292
293         if (adapter->have_msi)
294                 pci_disable_msi(adapter->pdev);
295
296         if (kill_watchdog)
297                 del_timer_sync(&adapter->watchdog_timer);
298
299         adapter->link_speed = 0;
300         adapter->link_duplex = 0;
301         netif_carrier_off(netdev);
302         netif_stop_queue(netdev);
303
304         ixgb_reset(adapter);
305         ixgb_clean_tx_ring(adapter);
306         ixgb_clean_rx_ring(adapter);
307 }
308
309 void
310 ixgb_reset(struct ixgb_adapter *adapter)
311 {
312         struct ixgb_hw *hw = &adapter->hw;
313
314         ixgb_adapter_stop(hw);
315         if (!ixgb_init_hw(hw))
316                 netif_err(adapter, probe, adapter->netdev, "ixgb_init_hw failed\n");
317
318         /* restore frame size information */
319         IXGB_WRITE_REG(hw, MFS, hw->max_frame_size << IXGB_MFS_SHIFT);
320         if (hw->max_frame_size >
321             IXGB_MAX_ENET_FRAME_SIZE_WITHOUT_FCS + ENET_FCS_LENGTH) {
322                 u32 ctrl0 = IXGB_READ_REG(hw, CTRL0);
323                 if (!(ctrl0 & IXGB_CTRL0_JFE)) {
324                         ctrl0 |= IXGB_CTRL0_JFE;
325                         IXGB_WRITE_REG(hw, CTRL0, ctrl0);
326                 }
327         }
328 }
329
330 static netdev_features_t
331 ixgb_fix_features(struct net_device *netdev, netdev_features_t features)
332 {
333         /*
334          * Tx VLAN insertion does not work per HW design when Rx stripping is
335          * disabled.
336          */
337         if (!(features & NETIF_F_HW_VLAN_CTAG_RX))
338                 features &= ~NETIF_F_HW_VLAN_CTAG_TX;
339
340         return features;
341 }
342
343 static int
344 ixgb_set_features(struct net_device *netdev, netdev_features_t features)
345 {
346         struct ixgb_adapter *adapter = netdev_priv(netdev);
347         netdev_features_t changed = features ^ netdev->features;
348
349         if (!(changed & (NETIF_F_RXCSUM|NETIF_F_HW_VLAN_CTAG_RX)))
350                 return 0;
351
352         adapter->rx_csum = !!(features & NETIF_F_RXCSUM);
353
354         if (netif_running(netdev)) {
355                 ixgb_down(adapter, true);
356                 ixgb_up(adapter);
357                 ixgb_set_speed_duplex(netdev);
358         } else
359                 ixgb_reset(adapter);
360
361         return 0;
362 }
363
364
365 static const struct net_device_ops ixgb_netdev_ops = {
366         .ndo_open               = ixgb_open,
367         .ndo_stop               = ixgb_close,
368         .ndo_start_xmit         = ixgb_xmit_frame,
369         .ndo_get_stats          = ixgb_get_stats,
370         .ndo_set_rx_mode        = ixgb_set_multi,
371         .ndo_validate_addr      = eth_validate_addr,
372         .ndo_set_mac_address    = ixgb_set_mac,
373         .ndo_change_mtu         = ixgb_change_mtu,
374         .ndo_tx_timeout         = ixgb_tx_timeout,
375         .ndo_vlan_rx_add_vid    = ixgb_vlan_rx_add_vid,
376         .ndo_vlan_rx_kill_vid   = ixgb_vlan_rx_kill_vid,
377 #ifdef CONFIG_NET_POLL_CONTROLLER
378         .ndo_poll_controller    = ixgb_netpoll,
379 #endif
380         .ndo_fix_features       = ixgb_fix_features,
381         .ndo_set_features       = ixgb_set_features,
382 };
383
384 /**
385  * ixgb_probe - Device Initialization Routine
386  * @pdev: PCI device information struct
387  * @ent: entry in ixgb_pci_tbl
388  *
389  * Returns 0 on success, negative on failure
390  *
391  * ixgb_probe initializes an adapter identified by a pci_dev structure.
392  * The OS initialization, configuring of the adapter private structure,
393  * and a hardware reset occur.
394  **/
395
396 static int
397 ixgb_probe(struct pci_dev *pdev, const struct pci_device_id *ent)
398 {
399         struct net_device *netdev = NULL;
400         struct ixgb_adapter *adapter;
401         static int cards_found = 0;
402         int pci_using_dac;
403         int i;
404         int err;
405
406         err = pci_enable_device(pdev);
407         if (err)
408                 return err;
409
410         pci_using_dac = 0;
411         err = dma_set_mask_and_coherent(&pdev->dev, DMA_BIT_MASK(64));
412         if (!err) {
413                 pci_using_dac = 1;
414         } else {
415                 err = dma_set_mask_and_coherent(&pdev->dev, DMA_BIT_MASK(32));
416                 if (err) {
417                         pr_err("No usable DMA configuration, aborting\n");
418                         goto err_dma_mask;
419                 }
420         }
421
422         err = pci_request_regions(pdev, ixgb_driver_name);
423         if (err)
424                 goto err_request_regions;
425
426         pci_set_master(pdev);
427
428         netdev = alloc_etherdev(sizeof(struct ixgb_adapter));
429         if (!netdev) {
430                 err = -ENOMEM;
431                 goto err_alloc_etherdev;
432         }
433
434         SET_NETDEV_DEV(netdev, &pdev->dev);
435
436         pci_set_drvdata(pdev, netdev);
437         adapter = netdev_priv(netdev);
438         adapter->netdev = netdev;
439         adapter->pdev = pdev;
440         adapter->hw.back = adapter;
441         adapter->msg_enable = netif_msg_init(debug, DEFAULT_MSG_ENABLE);
442
443         adapter->hw.hw_addr = pci_ioremap_bar(pdev, BAR_0);
444         if (!adapter->hw.hw_addr) {
445                 err = -EIO;
446                 goto err_ioremap;
447         }
448
449         for (i = BAR_1; i <= BAR_5; i++) {
450                 if (pci_resource_len(pdev, i) == 0)
451                         continue;
452                 if (pci_resource_flags(pdev, i) & IORESOURCE_IO) {
453                         adapter->hw.io_base = pci_resource_start(pdev, i);
454                         break;
455                 }
456         }
457
458         netdev->netdev_ops = &ixgb_netdev_ops;
459         ixgb_set_ethtool_ops(netdev);
460         netdev->watchdog_timeo = 5 * HZ;
461         netif_napi_add(netdev, &adapter->napi, ixgb_clean, 64);
462
463         strncpy(netdev->name, pci_name(pdev), sizeof(netdev->name) - 1);
464
465         adapter->bd_number = cards_found;
466         adapter->link_speed = 0;
467         adapter->link_duplex = 0;
468
469         /* setup the private structure */
470
471         err = ixgb_sw_init(adapter);
472         if (err)
473                 goto err_sw_init;
474
475         netdev->hw_features = NETIF_F_SG |
476                            NETIF_F_TSO |
477                            NETIF_F_HW_CSUM |
478                            NETIF_F_HW_VLAN_CTAG_TX |
479                            NETIF_F_HW_VLAN_CTAG_RX;
480         netdev->features = netdev->hw_features |
481                            NETIF_F_HW_VLAN_CTAG_FILTER;
482         netdev->hw_features |= NETIF_F_RXCSUM;
483
484         if (pci_using_dac) {
485                 netdev->features |= NETIF_F_HIGHDMA;
486                 netdev->vlan_features |= NETIF_F_HIGHDMA;
487         }
488
489         /* make sure the EEPROM is good */
490
491         if (!ixgb_validate_eeprom_checksum(&adapter->hw)) {
492                 netif_err(adapter, probe, adapter->netdev,
493                           "The EEPROM Checksum Is Not Valid\n");
494                 err = -EIO;
495                 goto err_eeprom;
496         }
497
498         ixgb_get_ee_mac_addr(&adapter->hw, netdev->dev_addr);
499
500         if (!is_valid_ether_addr(netdev->dev_addr)) {
501                 netif_err(adapter, probe, adapter->netdev, "Invalid MAC Address\n");
502                 err = -EIO;
503                 goto err_eeprom;
504         }
505
506         adapter->part_num = ixgb_get_ee_pba_number(&adapter->hw);
507
508         init_timer(&adapter->watchdog_timer);
509         adapter->watchdog_timer.function = ixgb_watchdog;
510         adapter->watchdog_timer.data = (unsigned long)adapter;
511
512         INIT_WORK(&adapter->tx_timeout_task, ixgb_tx_timeout_task);
513
514         strcpy(netdev->name, "eth%d");
515         err = register_netdev(netdev);
516         if (err)
517                 goto err_register;
518
519         /* carrier off reporting is important to ethtool even BEFORE open */
520         netif_carrier_off(netdev);
521
522         netif_info(adapter, probe, adapter->netdev,
523                    "Intel(R) PRO/10GbE Network Connection\n");
524         ixgb_check_options(adapter);
525         /* reset the hardware with the new settings */
526
527         ixgb_reset(adapter);
528
529         cards_found++;
530         return 0;
531
532 err_register:
533 err_sw_init:
534 err_eeprom:
535         iounmap(adapter->hw.hw_addr);
536 err_ioremap:
537         free_netdev(netdev);
538 err_alloc_etherdev:
539         pci_release_regions(pdev);
540 err_request_regions:
541 err_dma_mask:
542         pci_disable_device(pdev);
543         return err;
544 }
545
546 /**
547  * ixgb_remove - Device Removal Routine
548  * @pdev: PCI device information struct
549  *
550  * ixgb_remove is called by the PCI subsystem to alert the driver
551  * that it should release a PCI device.  The could be caused by a
552  * Hot-Plug event, or because the driver is going to be removed from
553  * memory.
554  **/
555
556 static void
557 ixgb_remove(struct pci_dev *pdev)
558 {
559         struct net_device *netdev = pci_get_drvdata(pdev);
560         struct ixgb_adapter *adapter = netdev_priv(netdev);
561
562         cancel_work_sync(&adapter->tx_timeout_task);
563
564         unregister_netdev(netdev);
565
566         iounmap(adapter->hw.hw_addr);
567         pci_release_regions(pdev);
568
569         free_netdev(netdev);
570         pci_disable_device(pdev);
571 }
572
573 /**
574  * ixgb_sw_init - Initialize general software structures (struct ixgb_adapter)
575  * @adapter: board private structure to initialize
576  *
577  * ixgb_sw_init initializes the Adapter private data structure.
578  * Fields are initialized based on PCI device information and
579  * OS network device settings (MTU size).
580  **/
581
582 static int
583 ixgb_sw_init(struct ixgb_adapter *adapter)
584 {
585         struct ixgb_hw *hw = &adapter->hw;
586         struct net_device *netdev = adapter->netdev;
587         struct pci_dev *pdev = adapter->pdev;
588
589         /* PCI config space info */
590
591         hw->vendor_id = pdev->vendor;
592         hw->device_id = pdev->device;
593         hw->subsystem_vendor_id = pdev->subsystem_vendor;
594         hw->subsystem_id = pdev->subsystem_device;
595
596         hw->max_frame_size = netdev->mtu + ENET_HEADER_SIZE + ENET_FCS_LENGTH;
597         adapter->rx_buffer_len = hw->max_frame_size + 8; /* + 8 for errata */
598
599         if ((hw->device_id == IXGB_DEVICE_ID_82597EX) ||
600             (hw->device_id == IXGB_DEVICE_ID_82597EX_CX4) ||
601             (hw->device_id == IXGB_DEVICE_ID_82597EX_LR) ||
602             (hw->device_id == IXGB_DEVICE_ID_82597EX_SR))
603                 hw->mac_type = ixgb_82597;
604         else {
605                 /* should never have loaded on this device */
606                 netif_err(adapter, probe, adapter->netdev, "unsupported device id\n");
607         }
608
609         /* enable flow control to be programmed */
610         hw->fc.send_xon = 1;
611
612         set_bit(__IXGB_DOWN, &adapter->flags);
613         return 0;
614 }
615
616 /**
617  * ixgb_open - Called when a network interface is made active
618  * @netdev: network interface device structure
619  *
620  * Returns 0 on success, negative value on failure
621  *
622  * The open entry point is called when a network interface is made
623  * active by the system (IFF_UP).  At this point all resources needed
624  * for transmit and receive operations are allocated, the interrupt
625  * handler is registered with the OS, the watchdog timer is started,
626  * and the stack is notified that the interface is ready.
627  **/
628
629 static int
630 ixgb_open(struct net_device *netdev)
631 {
632         struct ixgb_adapter *adapter = netdev_priv(netdev);
633         int err;
634
635         /* allocate transmit descriptors */
636         err = ixgb_setup_tx_resources(adapter);
637         if (err)
638                 goto err_setup_tx;
639
640         netif_carrier_off(netdev);
641
642         /* allocate receive descriptors */
643
644         err = ixgb_setup_rx_resources(adapter);
645         if (err)
646                 goto err_setup_rx;
647
648         err = ixgb_up(adapter);
649         if (err)
650                 goto err_up;
651
652         netif_start_queue(netdev);
653
654         return 0;
655
656 err_up:
657         ixgb_free_rx_resources(adapter);
658 err_setup_rx:
659         ixgb_free_tx_resources(adapter);
660 err_setup_tx:
661         ixgb_reset(adapter);
662
663         return err;
664 }
665
666 /**
667  * ixgb_close - Disables a network interface
668  * @netdev: network interface device structure
669  *
670  * Returns 0, this is not allowed to fail
671  *
672  * The close entry point is called when an interface is de-activated
673  * by the OS.  The hardware is still under the drivers control, but
674  * needs to be disabled.  A global MAC reset is issued to stop the
675  * hardware, and all transmit and receive resources are freed.
676  **/
677
678 static int
679 ixgb_close(struct net_device *netdev)
680 {
681         struct ixgb_adapter *adapter = netdev_priv(netdev);
682
683         ixgb_down(adapter, true);
684
685         ixgb_free_tx_resources(adapter);
686         ixgb_free_rx_resources(adapter);
687
688         return 0;
689 }
690
691 /**
692  * ixgb_setup_tx_resources - allocate Tx resources (Descriptors)
693  * @adapter: board private structure
694  *
695  * Return 0 on success, negative on failure
696  **/
697
698 int
699 ixgb_setup_tx_resources(struct ixgb_adapter *adapter)
700 {
701         struct ixgb_desc_ring *txdr = &adapter->tx_ring;
702         struct pci_dev *pdev = adapter->pdev;
703         int size;
704
705         size = sizeof(struct ixgb_buffer) * txdr->count;
706         txdr->buffer_info = vzalloc(size);
707         if (!txdr->buffer_info)
708                 return -ENOMEM;
709
710         /* round up to nearest 4K */
711
712         txdr->size = txdr->count * sizeof(struct ixgb_tx_desc);
713         txdr->size = ALIGN(txdr->size, 4096);
714
715         txdr->desc = dma_zalloc_coherent(&pdev->dev, txdr->size, &txdr->dma,
716                                          GFP_KERNEL);
717         if (!txdr->desc) {
718                 vfree(txdr->buffer_info);
719                 return -ENOMEM;
720         }
721
722         txdr->next_to_use = 0;
723         txdr->next_to_clean = 0;
724
725         return 0;
726 }
727
728 /**
729  * ixgb_configure_tx - Configure 82597 Transmit Unit after Reset.
730  * @adapter: board private structure
731  *
732  * Configure the Tx unit of the MAC after a reset.
733  **/
734
735 static void
736 ixgb_configure_tx(struct ixgb_adapter *adapter)
737 {
738         u64 tdba = adapter->tx_ring.dma;
739         u32 tdlen = adapter->tx_ring.count * sizeof(struct ixgb_tx_desc);
740         u32 tctl;
741         struct ixgb_hw *hw = &adapter->hw;
742
743         /* Setup the Base and Length of the Tx Descriptor Ring
744          * tx_ring.dma can be either a 32 or 64 bit value
745          */
746
747         IXGB_WRITE_REG(hw, TDBAL, (tdba & 0x00000000ffffffffULL));
748         IXGB_WRITE_REG(hw, TDBAH, (tdba >> 32));
749
750         IXGB_WRITE_REG(hw, TDLEN, tdlen);
751
752         /* Setup the HW Tx Head and Tail descriptor pointers */
753
754         IXGB_WRITE_REG(hw, TDH, 0);
755         IXGB_WRITE_REG(hw, TDT, 0);
756
757         /* don't set up txdctl, it induces performance problems if configured
758          * incorrectly */
759         /* Set the Tx Interrupt Delay register */
760
761         IXGB_WRITE_REG(hw, TIDV, adapter->tx_int_delay);
762
763         /* Program the Transmit Control Register */
764
765         tctl = IXGB_TCTL_TCE | IXGB_TCTL_TXEN | IXGB_TCTL_TPDE;
766         IXGB_WRITE_REG(hw, TCTL, tctl);
767
768         /* Setup Transmit Descriptor Settings for this adapter */
769         adapter->tx_cmd_type =
770                 IXGB_TX_DESC_TYPE |
771                 (adapter->tx_int_delay_enable ? IXGB_TX_DESC_CMD_IDE : 0);
772 }
773
774 /**
775  * ixgb_setup_rx_resources - allocate Rx resources (Descriptors)
776  * @adapter: board private structure
777  *
778  * Returns 0 on success, negative on failure
779  **/
780
781 int
782 ixgb_setup_rx_resources(struct ixgb_adapter *adapter)
783 {
784         struct ixgb_desc_ring *rxdr = &adapter->rx_ring;
785         struct pci_dev *pdev = adapter->pdev;
786         int size;
787
788         size = sizeof(struct ixgb_buffer) * rxdr->count;
789         rxdr->buffer_info = vzalloc(size);
790         if (!rxdr->buffer_info)
791                 return -ENOMEM;
792
793         /* Round up to nearest 4K */
794
795         rxdr->size = rxdr->count * sizeof(struct ixgb_rx_desc);
796         rxdr->size = ALIGN(rxdr->size, 4096);
797
798         rxdr->desc = dma_alloc_coherent(&pdev->dev, rxdr->size, &rxdr->dma,
799                                         GFP_KERNEL);
800
801         if (!rxdr->desc) {
802                 vfree(rxdr->buffer_info);
803                 return -ENOMEM;
804         }
805         memset(rxdr->desc, 0, rxdr->size);
806
807         rxdr->next_to_clean = 0;
808         rxdr->next_to_use = 0;
809
810         return 0;
811 }
812
813 /**
814  * ixgb_setup_rctl - configure the receive control register
815  * @adapter: Board private structure
816  **/
817
818 static void
819 ixgb_setup_rctl(struct ixgb_adapter *adapter)
820 {
821         u32 rctl;
822
823         rctl = IXGB_READ_REG(&adapter->hw, RCTL);
824
825         rctl &= ~(3 << IXGB_RCTL_MO_SHIFT);
826
827         rctl |=
828                 IXGB_RCTL_BAM | IXGB_RCTL_RDMTS_1_2 |
829                 IXGB_RCTL_RXEN | IXGB_RCTL_CFF |
830                 (adapter->hw.mc_filter_type << IXGB_RCTL_MO_SHIFT);
831
832         rctl |= IXGB_RCTL_SECRC;
833
834         if (adapter->rx_buffer_len <= IXGB_RXBUFFER_2048)
835                 rctl |= IXGB_RCTL_BSIZE_2048;
836         else if (adapter->rx_buffer_len <= IXGB_RXBUFFER_4096)
837                 rctl |= IXGB_RCTL_BSIZE_4096;
838         else if (adapter->rx_buffer_len <= IXGB_RXBUFFER_8192)
839                 rctl |= IXGB_RCTL_BSIZE_8192;
840         else if (adapter->rx_buffer_len <= IXGB_RXBUFFER_16384)
841                 rctl |= IXGB_RCTL_BSIZE_16384;
842
843         IXGB_WRITE_REG(&adapter->hw, RCTL, rctl);
844 }
845
846 /**
847  * ixgb_configure_rx - Configure 82597 Receive Unit after Reset.
848  * @adapter: board private structure
849  *
850  * Configure the Rx unit of the MAC after a reset.
851  **/
852
853 static void
854 ixgb_configure_rx(struct ixgb_adapter *adapter)
855 {
856         u64 rdba = adapter->rx_ring.dma;
857         u32 rdlen = adapter->rx_ring.count * sizeof(struct ixgb_rx_desc);
858         struct ixgb_hw *hw = &adapter->hw;
859         u32 rctl;
860         u32 rxcsum;
861
862         /* make sure receives are disabled while setting up the descriptors */
863
864         rctl = IXGB_READ_REG(hw, RCTL);
865         IXGB_WRITE_REG(hw, RCTL, rctl & ~IXGB_RCTL_RXEN);
866
867         /* set the Receive Delay Timer Register */
868
869         IXGB_WRITE_REG(hw, RDTR, adapter->rx_int_delay);
870
871         /* Setup the Base and Length of the Rx Descriptor Ring */
872
873         IXGB_WRITE_REG(hw, RDBAL, (rdba & 0x00000000ffffffffULL));
874         IXGB_WRITE_REG(hw, RDBAH, (rdba >> 32));
875
876         IXGB_WRITE_REG(hw, RDLEN, rdlen);
877
878         /* Setup the HW Rx Head and Tail Descriptor Pointers */
879         IXGB_WRITE_REG(hw, RDH, 0);
880         IXGB_WRITE_REG(hw, RDT, 0);
881
882         /* due to the hardware errata with RXDCTL, we are unable to use any of
883          * the performance enhancing features of it without causing other
884          * subtle bugs, some of the bugs could include receive length
885          * corruption at high data rates (WTHRESH > 0) and/or receive
886          * descriptor ring irregularites (particularly in hardware cache) */
887         IXGB_WRITE_REG(hw, RXDCTL, 0);
888
889         /* Enable Receive Checksum Offload for TCP and UDP */
890         if (adapter->rx_csum) {
891                 rxcsum = IXGB_READ_REG(hw, RXCSUM);
892                 rxcsum |= IXGB_RXCSUM_TUOFL;
893                 IXGB_WRITE_REG(hw, RXCSUM, rxcsum);
894         }
895
896         /* Enable Receives */
897
898         IXGB_WRITE_REG(hw, RCTL, rctl);
899 }
900
901 /**
902  * ixgb_free_tx_resources - Free Tx Resources
903  * @adapter: board private structure
904  *
905  * Free all transmit software resources
906  **/
907
908 void
909 ixgb_free_tx_resources(struct ixgb_adapter *adapter)
910 {
911         struct pci_dev *pdev = adapter->pdev;
912
913         ixgb_clean_tx_ring(adapter);
914
915         vfree(adapter->tx_ring.buffer_info);
916         adapter->tx_ring.buffer_info = NULL;
917
918         dma_free_coherent(&pdev->dev, adapter->tx_ring.size,
919                           adapter->tx_ring.desc, adapter->tx_ring.dma);
920
921         adapter->tx_ring.desc = NULL;
922 }
923
924 static void
925 ixgb_unmap_and_free_tx_resource(struct ixgb_adapter *adapter,
926                                 struct ixgb_buffer *buffer_info)
927 {
928         if (buffer_info->dma) {
929                 if (buffer_info->mapped_as_page)
930                         dma_unmap_page(&adapter->pdev->dev, buffer_info->dma,
931                                        buffer_info->length, DMA_TO_DEVICE);
932                 else
933                         dma_unmap_single(&adapter->pdev->dev, buffer_info->dma,
934                                          buffer_info->length, DMA_TO_DEVICE);
935                 buffer_info->dma = 0;
936         }
937
938         if (buffer_info->skb) {
939                 dev_kfree_skb_any(buffer_info->skb);
940                 buffer_info->skb = NULL;
941         }
942         buffer_info->time_stamp = 0;
943         /* these fields must always be initialized in tx
944          * buffer_info->length = 0;
945          * buffer_info->next_to_watch = 0; */
946 }
947
948 /**
949  * ixgb_clean_tx_ring - Free Tx Buffers
950  * @adapter: board private structure
951  **/
952
953 static void
954 ixgb_clean_tx_ring(struct ixgb_adapter *adapter)
955 {
956         struct ixgb_desc_ring *tx_ring = &adapter->tx_ring;
957         struct ixgb_buffer *buffer_info;
958         unsigned long size;
959         unsigned int i;
960
961         /* Free all the Tx ring sk_buffs */
962
963         for (i = 0; i < tx_ring->count; i++) {
964                 buffer_info = &tx_ring->buffer_info[i];
965                 ixgb_unmap_and_free_tx_resource(adapter, buffer_info);
966         }
967
968         size = sizeof(struct ixgb_buffer) * tx_ring->count;
969         memset(tx_ring->buffer_info, 0, size);
970
971         /* Zero out the descriptor ring */
972
973         memset(tx_ring->desc, 0, tx_ring->size);
974
975         tx_ring->next_to_use = 0;
976         tx_ring->next_to_clean = 0;
977
978         IXGB_WRITE_REG(&adapter->hw, TDH, 0);
979         IXGB_WRITE_REG(&adapter->hw, TDT, 0);
980 }
981
982 /**
983  * ixgb_free_rx_resources - Free Rx Resources
984  * @adapter: board private structure
985  *
986  * Free all receive software resources
987  **/
988
989 void
990 ixgb_free_rx_resources(struct ixgb_adapter *adapter)
991 {
992         struct ixgb_desc_ring *rx_ring = &adapter->rx_ring;
993         struct pci_dev *pdev = adapter->pdev;
994
995         ixgb_clean_rx_ring(adapter);
996
997         vfree(rx_ring->buffer_info);
998         rx_ring->buffer_info = NULL;
999
1000         dma_free_coherent(&pdev->dev, rx_ring->size, rx_ring->desc,
1001                           rx_ring->dma);
1002
1003         rx_ring->desc = NULL;
1004 }
1005
1006 /**
1007  * ixgb_clean_rx_ring - Free Rx Buffers
1008  * @adapter: board private structure
1009  **/
1010
1011 static void
1012 ixgb_clean_rx_ring(struct ixgb_adapter *adapter)
1013 {
1014         struct ixgb_desc_ring *rx_ring = &adapter->rx_ring;
1015         struct ixgb_buffer *buffer_info;
1016         struct pci_dev *pdev = adapter->pdev;
1017         unsigned long size;
1018         unsigned int i;
1019
1020         /* Free all the Rx ring sk_buffs */
1021
1022         for (i = 0; i < rx_ring->count; i++) {
1023                 buffer_info = &rx_ring->buffer_info[i];
1024                 if (buffer_info->dma) {
1025                         dma_unmap_single(&pdev->dev,
1026                                          buffer_info->dma,
1027                                          buffer_info->length,
1028                                          DMA_FROM_DEVICE);
1029                         buffer_info->dma = 0;
1030                         buffer_info->length = 0;
1031                 }
1032
1033                 if (buffer_info->skb) {
1034                         dev_kfree_skb(buffer_info->skb);
1035                         buffer_info->skb = NULL;
1036                 }
1037         }
1038
1039         size = sizeof(struct ixgb_buffer) * rx_ring->count;
1040         memset(rx_ring->buffer_info, 0, size);
1041
1042         /* Zero out the descriptor ring */
1043
1044         memset(rx_ring->desc, 0, rx_ring->size);
1045
1046         rx_ring->next_to_clean = 0;
1047         rx_ring->next_to_use = 0;
1048
1049         IXGB_WRITE_REG(&adapter->hw, RDH, 0);
1050         IXGB_WRITE_REG(&adapter->hw, RDT, 0);
1051 }
1052
1053 /**
1054  * ixgb_set_mac - Change the Ethernet Address of the NIC
1055  * @netdev: network interface device structure
1056  * @p: pointer to an address structure
1057  *
1058  * Returns 0 on success, negative on failure
1059  **/
1060
1061 static int
1062 ixgb_set_mac(struct net_device *netdev, void *p)
1063 {
1064         struct ixgb_adapter *adapter = netdev_priv(netdev);
1065         struct sockaddr *addr = p;
1066
1067         if (!is_valid_ether_addr(addr->sa_data))
1068                 return -EADDRNOTAVAIL;
1069
1070         memcpy(netdev->dev_addr, addr->sa_data, netdev->addr_len);
1071
1072         ixgb_rar_set(&adapter->hw, addr->sa_data, 0);
1073
1074         return 0;
1075 }
1076
1077 /**
1078  * ixgb_set_multi - Multicast and Promiscuous mode set
1079  * @netdev: network interface device structure
1080  *
1081  * The set_multi entry point is called whenever the multicast address
1082  * list or the network interface flags are updated.  This routine is
1083  * responsible for configuring the hardware for proper multicast,
1084  * promiscuous mode, and all-multi behavior.
1085  **/
1086
1087 static void
1088 ixgb_set_multi(struct net_device *netdev)
1089 {
1090         struct ixgb_adapter *adapter = netdev_priv(netdev);
1091         struct ixgb_hw *hw = &adapter->hw;
1092         struct netdev_hw_addr *ha;
1093         u32 rctl;
1094
1095         /* Check for Promiscuous and All Multicast modes */
1096
1097         rctl = IXGB_READ_REG(hw, RCTL);
1098
1099         if (netdev->flags & IFF_PROMISC) {
1100                 rctl |= (IXGB_RCTL_UPE | IXGB_RCTL_MPE);
1101                 /* disable VLAN filtering */
1102                 rctl &= ~IXGB_RCTL_CFIEN;
1103                 rctl &= ~IXGB_RCTL_VFE;
1104         } else {
1105                 if (netdev->flags & IFF_ALLMULTI) {
1106                         rctl |= IXGB_RCTL_MPE;
1107                         rctl &= ~IXGB_RCTL_UPE;
1108                 } else {
1109                         rctl &= ~(IXGB_RCTL_UPE | IXGB_RCTL_MPE);
1110                 }
1111                 /* enable VLAN filtering */
1112                 rctl |= IXGB_RCTL_VFE;
1113                 rctl &= ~IXGB_RCTL_CFIEN;
1114         }
1115
1116         if (netdev_mc_count(netdev) > IXGB_MAX_NUM_MULTICAST_ADDRESSES) {
1117                 rctl |= IXGB_RCTL_MPE;
1118                 IXGB_WRITE_REG(hw, RCTL, rctl);
1119         } else {
1120                 u8 *mta = kmalloc(IXGB_MAX_NUM_MULTICAST_ADDRESSES *
1121                               ETH_ALEN, GFP_ATOMIC);
1122                 u8 *addr;
1123                 if (!mta)
1124                         goto alloc_failed;
1125
1126                 IXGB_WRITE_REG(hw, RCTL, rctl);
1127
1128                 addr = mta;
1129                 netdev_for_each_mc_addr(ha, netdev) {
1130                         memcpy(addr, ha->addr, ETH_ALEN);
1131                         addr += ETH_ALEN;
1132                 }
1133
1134                 ixgb_mc_addr_list_update(hw, mta, netdev_mc_count(netdev), 0);
1135                 kfree(mta);
1136         }
1137
1138 alloc_failed:
1139         if (netdev->features & NETIF_F_HW_VLAN_CTAG_RX)
1140                 ixgb_vlan_strip_enable(adapter);
1141         else
1142                 ixgb_vlan_strip_disable(adapter);
1143
1144 }
1145
1146 /**
1147  * ixgb_watchdog - Timer Call-back
1148  * @data: pointer to netdev cast into an unsigned long
1149  **/
1150
1151 static void
1152 ixgb_watchdog(unsigned long data)
1153 {
1154         struct ixgb_adapter *adapter = (struct ixgb_adapter *)data;
1155         struct net_device *netdev = adapter->netdev;
1156         struct ixgb_desc_ring *txdr = &adapter->tx_ring;
1157
1158         ixgb_check_for_link(&adapter->hw);
1159
1160         if (ixgb_check_for_bad_link(&adapter->hw)) {
1161                 /* force the reset path */
1162                 netif_stop_queue(netdev);
1163         }
1164
1165         if (adapter->hw.link_up) {
1166                 if (!netif_carrier_ok(netdev)) {
1167                         netdev_info(netdev,
1168                                     "NIC Link is Up 10 Gbps Full Duplex, Flow Control: %s\n",
1169                                     (adapter->hw.fc.type == ixgb_fc_full) ?
1170                                     "RX/TX" :
1171                                     (adapter->hw.fc.type == ixgb_fc_rx_pause) ?
1172                                      "RX" :
1173                                     (adapter->hw.fc.type == ixgb_fc_tx_pause) ?
1174                                     "TX" : "None");
1175                         adapter->link_speed = 10000;
1176                         adapter->link_duplex = FULL_DUPLEX;
1177                         netif_carrier_on(netdev);
1178                 }
1179         } else {
1180                 if (netif_carrier_ok(netdev)) {
1181                         adapter->link_speed = 0;
1182                         adapter->link_duplex = 0;
1183                         netdev_info(netdev, "NIC Link is Down\n");
1184                         netif_carrier_off(netdev);
1185                 }
1186         }
1187
1188         ixgb_update_stats(adapter);
1189
1190         if (!netif_carrier_ok(netdev)) {
1191                 if (IXGB_DESC_UNUSED(txdr) + 1 < txdr->count) {
1192                         /* We've lost link, so the controller stops DMA,
1193                          * but we've got queued Tx work that's never going
1194                          * to get done, so reset controller to flush Tx.
1195                          * (Do the reset outside of interrupt context). */
1196                         schedule_work(&adapter->tx_timeout_task);
1197                         /* return immediately since reset is imminent */
1198                         return;
1199                 }
1200         }
1201
1202         /* Force detection of hung controller every watchdog period */
1203         adapter->detect_tx_hung = true;
1204
1205         /* generate an interrupt to force clean up of any stragglers */
1206         IXGB_WRITE_REG(&adapter->hw, ICS, IXGB_INT_TXDW);
1207
1208         /* Reset the timer */
1209         mod_timer(&adapter->watchdog_timer, jiffies + 2 * HZ);
1210 }
1211
1212 #define IXGB_TX_FLAGS_CSUM              0x00000001
1213 #define IXGB_TX_FLAGS_VLAN              0x00000002
1214 #define IXGB_TX_FLAGS_TSO               0x00000004
1215
1216 static int
1217 ixgb_tso(struct ixgb_adapter *adapter, struct sk_buff *skb)
1218 {
1219         struct ixgb_context_desc *context_desc;
1220         unsigned int i;
1221         u8 ipcss, ipcso, tucss, tucso, hdr_len;
1222         u16 ipcse, tucse, mss;
1223
1224         if (likely(skb_is_gso(skb))) {
1225                 struct ixgb_buffer *buffer_info;
1226                 struct iphdr *iph;
1227                 int err;
1228
1229                 err = skb_cow_head(skb, 0);
1230                 if (err < 0)
1231                         return err;
1232
1233                 hdr_len = skb_transport_offset(skb) + tcp_hdrlen(skb);
1234                 mss = skb_shinfo(skb)->gso_size;
1235                 iph = ip_hdr(skb);
1236                 iph->tot_len = 0;
1237                 iph->check = 0;
1238                 tcp_hdr(skb)->check = ~csum_tcpudp_magic(iph->saddr,
1239                                                          iph->daddr, 0,
1240                                                          IPPROTO_TCP, 0);
1241                 ipcss = skb_network_offset(skb);
1242                 ipcso = (void *)&(iph->check) - (void *)skb->data;
1243                 ipcse = skb_transport_offset(skb) - 1;
1244                 tucss = skb_transport_offset(skb);
1245                 tucso = (void *)&(tcp_hdr(skb)->check) - (void *)skb->data;
1246                 tucse = 0;
1247
1248                 i = adapter->tx_ring.next_to_use;
1249                 context_desc = IXGB_CONTEXT_DESC(adapter->tx_ring, i);
1250                 buffer_info = &adapter->tx_ring.buffer_info[i];
1251                 WARN_ON(buffer_info->dma != 0);
1252
1253                 context_desc->ipcss = ipcss;
1254                 context_desc->ipcso = ipcso;
1255                 context_desc->ipcse = cpu_to_le16(ipcse);
1256                 context_desc->tucss = tucss;
1257                 context_desc->tucso = tucso;
1258                 context_desc->tucse = cpu_to_le16(tucse);
1259                 context_desc->mss = cpu_to_le16(mss);
1260                 context_desc->hdr_len = hdr_len;
1261                 context_desc->status = 0;
1262                 context_desc->cmd_type_len = cpu_to_le32(
1263                                                   IXGB_CONTEXT_DESC_TYPE
1264                                                 | IXGB_CONTEXT_DESC_CMD_TSE
1265                                                 | IXGB_CONTEXT_DESC_CMD_IP
1266                                                 | IXGB_CONTEXT_DESC_CMD_TCP
1267                                                 | IXGB_CONTEXT_DESC_CMD_IDE
1268                                                 | (skb->len - (hdr_len)));
1269
1270
1271                 if (++i == adapter->tx_ring.count) i = 0;
1272                 adapter->tx_ring.next_to_use = i;
1273
1274                 return 1;
1275         }
1276
1277         return 0;
1278 }
1279
1280 static bool
1281 ixgb_tx_csum(struct ixgb_adapter *adapter, struct sk_buff *skb)
1282 {
1283         struct ixgb_context_desc *context_desc;
1284         unsigned int i;
1285         u8 css, cso;
1286
1287         if (likely(skb->ip_summed == CHECKSUM_PARTIAL)) {
1288                 struct ixgb_buffer *buffer_info;
1289                 css = skb_checksum_start_offset(skb);
1290                 cso = css + skb->csum_offset;
1291
1292                 i = adapter->tx_ring.next_to_use;
1293                 context_desc = IXGB_CONTEXT_DESC(adapter->tx_ring, i);
1294                 buffer_info = &adapter->tx_ring.buffer_info[i];
1295                 WARN_ON(buffer_info->dma != 0);
1296
1297                 context_desc->tucss = css;
1298                 context_desc->tucso = cso;
1299                 context_desc->tucse = 0;
1300                 /* zero out any previously existing data in one instruction */
1301                 *(u32 *)&(context_desc->ipcss) = 0;
1302                 context_desc->status = 0;
1303                 context_desc->hdr_len = 0;
1304                 context_desc->mss = 0;
1305                 context_desc->cmd_type_len =
1306                         cpu_to_le32(IXGB_CONTEXT_DESC_TYPE
1307                                     | IXGB_TX_DESC_CMD_IDE);
1308
1309                 if (++i == adapter->tx_ring.count) i = 0;
1310                 adapter->tx_ring.next_to_use = i;
1311
1312                 return true;
1313         }
1314
1315         return false;
1316 }
1317
1318 #define IXGB_MAX_TXD_PWR        14
1319 #define IXGB_MAX_DATA_PER_TXD   (1<<IXGB_MAX_TXD_PWR)
1320
1321 static int
1322 ixgb_tx_map(struct ixgb_adapter *adapter, struct sk_buff *skb,
1323             unsigned int first)
1324 {
1325         struct ixgb_desc_ring *tx_ring = &adapter->tx_ring;
1326         struct pci_dev *pdev = adapter->pdev;
1327         struct ixgb_buffer *buffer_info;
1328         int len = skb_headlen(skb);
1329         unsigned int offset = 0, size, count = 0, i;
1330         unsigned int mss = skb_shinfo(skb)->gso_size;
1331         unsigned int nr_frags = skb_shinfo(skb)->nr_frags;
1332         unsigned int f;
1333
1334         i = tx_ring->next_to_use;
1335
1336         while (len) {
1337                 buffer_info = &tx_ring->buffer_info[i];
1338                 size = min(len, IXGB_MAX_DATA_PER_TXD);
1339                 /* Workaround for premature desc write-backs
1340                  * in TSO mode.  Append 4-byte sentinel desc */
1341                 if (unlikely(mss && !nr_frags && size == len && size > 8))
1342                         size -= 4;
1343
1344                 buffer_info->length = size;
1345                 WARN_ON(buffer_info->dma != 0);
1346                 buffer_info->time_stamp = jiffies;
1347                 buffer_info->mapped_as_page = false;
1348                 buffer_info->dma = dma_map_single(&pdev->dev,
1349                                                   skb->data + offset,
1350                                                   size, DMA_TO_DEVICE);
1351                 if (dma_mapping_error(&pdev->dev, buffer_info->dma))
1352                         goto dma_error;
1353                 buffer_info->next_to_watch = 0;
1354
1355                 len -= size;
1356                 offset += size;
1357                 count++;
1358                 if (len) {
1359                         i++;
1360                         if (i == tx_ring->count)
1361                                 i = 0;
1362                 }
1363         }
1364
1365         for (f = 0; f < nr_frags; f++) {
1366                 const struct skb_frag_struct *frag;
1367
1368                 frag = &skb_shinfo(skb)->frags[f];
1369                 len = skb_frag_size(frag);
1370                 offset = 0;
1371
1372                 while (len) {
1373                         i++;
1374                         if (i == tx_ring->count)
1375                                 i = 0;
1376
1377                         buffer_info = &tx_ring->buffer_info[i];
1378                         size = min(len, IXGB_MAX_DATA_PER_TXD);
1379
1380                         /* Workaround for premature desc write-backs
1381                          * in TSO mode.  Append 4-byte sentinel desc */
1382                         if (unlikely(mss && (f == (nr_frags - 1))
1383                                      && size == len && size > 8))
1384                                 size -= 4;
1385
1386                         buffer_info->length = size;
1387                         buffer_info->time_stamp = jiffies;
1388                         buffer_info->mapped_as_page = true;
1389                         buffer_info->dma =
1390                                 skb_frag_dma_map(&pdev->dev, frag, offset, size,
1391                                                  DMA_TO_DEVICE);
1392                         if (dma_mapping_error(&pdev->dev, buffer_info->dma))
1393                                 goto dma_error;
1394                         buffer_info->next_to_watch = 0;
1395
1396                         len -= size;
1397                         offset += size;
1398                         count++;
1399                 }
1400         }
1401         tx_ring->buffer_info[i].skb = skb;
1402         tx_ring->buffer_info[first].next_to_watch = i;
1403
1404         return count;
1405
1406 dma_error:
1407         dev_err(&pdev->dev, "TX DMA map failed\n");
1408         buffer_info->dma = 0;
1409         if (count)
1410                 count--;
1411
1412         while (count--) {
1413                 if (i==0)
1414                         i += tx_ring->count;
1415                 i--;
1416                 buffer_info = &tx_ring->buffer_info[i];
1417                 ixgb_unmap_and_free_tx_resource(adapter, buffer_info);
1418         }
1419
1420         return 0;
1421 }
1422
1423 static void
1424 ixgb_tx_queue(struct ixgb_adapter *adapter, int count, int vlan_id,int tx_flags)
1425 {
1426         struct ixgb_desc_ring *tx_ring = &adapter->tx_ring;
1427         struct ixgb_tx_desc *tx_desc = NULL;
1428         struct ixgb_buffer *buffer_info;
1429         u32 cmd_type_len = adapter->tx_cmd_type;
1430         u8 status = 0;
1431         u8 popts = 0;
1432         unsigned int i;
1433
1434         if (tx_flags & IXGB_TX_FLAGS_TSO) {
1435                 cmd_type_len |= IXGB_TX_DESC_CMD_TSE;
1436                 popts |= (IXGB_TX_DESC_POPTS_IXSM | IXGB_TX_DESC_POPTS_TXSM);
1437         }
1438
1439         if (tx_flags & IXGB_TX_FLAGS_CSUM)
1440                 popts |= IXGB_TX_DESC_POPTS_TXSM;
1441
1442         if (tx_flags & IXGB_TX_FLAGS_VLAN)
1443                 cmd_type_len |= IXGB_TX_DESC_CMD_VLE;
1444
1445         i = tx_ring->next_to_use;
1446
1447         while (count--) {
1448                 buffer_info = &tx_ring->buffer_info[i];
1449                 tx_desc = IXGB_TX_DESC(*tx_ring, i);
1450                 tx_desc->buff_addr = cpu_to_le64(buffer_info->dma);
1451                 tx_desc->cmd_type_len =
1452                         cpu_to_le32(cmd_type_len | buffer_info->length);
1453                 tx_desc->status = status;
1454                 tx_desc->popts = popts;
1455                 tx_desc->vlan = cpu_to_le16(vlan_id);
1456
1457                 if (++i == tx_ring->count) i = 0;
1458         }
1459
1460         tx_desc->cmd_type_len |=
1461                 cpu_to_le32(IXGB_TX_DESC_CMD_EOP | IXGB_TX_DESC_CMD_RS);
1462
1463         /* Force memory writes to complete before letting h/w
1464          * know there are new descriptors to fetch.  (Only
1465          * applicable for weak-ordered memory model archs,
1466          * such as IA-64). */
1467         wmb();
1468
1469         tx_ring->next_to_use = i;
1470         IXGB_WRITE_REG(&adapter->hw, TDT, i);
1471 }
1472
1473 static int __ixgb_maybe_stop_tx(struct net_device *netdev, int size)
1474 {
1475         struct ixgb_adapter *adapter = netdev_priv(netdev);
1476         struct ixgb_desc_ring *tx_ring = &adapter->tx_ring;
1477
1478         netif_stop_queue(netdev);
1479         /* Herbert's original patch had:
1480          *  smp_mb__after_netif_stop_queue();
1481          * but since that doesn't exist yet, just open code it. */
1482         smp_mb();
1483
1484         /* We need to check again in a case another CPU has just
1485          * made room available. */
1486         if (likely(IXGB_DESC_UNUSED(tx_ring) < size))
1487                 return -EBUSY;
1488
1489         /* A reprieve! */
1490         netif_start_queue(netdev);
1491         ++adapter->restart_queue;
1492         return 0;
1493 }
1494
1495 static int ixgb_maybe_stop_tx(struct net_device *netdev,
1496                               struct ixgb_desc_ring *tx_ring, int size)
1497 {
1498         if (likely(IXGB_DESC_UNUSED(tx_ring) >= size))
1499                 return 0;
1500         return __ixgb_maybe_stop_tx(netdev, size);
1501 }
1502
1503
1504 /* Tx Descriptors needed, worst case */
1505 #define TXD_USE_COUNT(S) (((S) >> IXGB_MAX_TXD_PWR) + \
1506                          (((S) & (IXGB_MAX_DATA_PER_TXD - 1)) ? 1 : 0))
1507 #define DESC_NEEDED TXD_USE_COUNT(IXGB_MAX_DATA_PER_TXD) /* skb->date */ + \
1508         MAX_SKB_FRAGS * TXD_USE_COUNT(PAGE_SIZE) + 1 /* for context */ \
1509         + 1 /* one more needed for sentinel TSO workaround */
1510
1511 static netdev_tx_t
1512 ixgb_xmit_frame(struct sk_buff *skb, struct net_device *netdev)
1513 {
1514         struct ixgb_adapter *adapter = netdev_priv(netdev);
1515         unsigned int first;
1516         unsigned int tx_flags = 0;
1517         int vlan_id = 0;
1518         int count = 0;
1519         int tso;
1520
1521         if (test_bit(__IXGB_DOWN, &adapter->flags)) {
1522                 dev_kfree_skb_any(skb);
1523                 return NETDEV_TX_OK;
1524         }
1525
1526         if (skb->len <= 0) {
1527                 dev_kfree_skb_any(skb);
1528                 return NETDEV_TX_OK;
1529         }
1530
1531         if (unlikely(ixgb_maybe_stop_tx(netdev, &adapter->tx_ring,
1532                      DESC_NEEDED)))
1533                 return NETDEV_TX_BUSY;
1534
1535         if (vlan_tx_tag_present(skb)) {
1536                 tx_flags |= IXGB_TX_FLAGS_VLAN;
1537                 vlan_id = vlan_tx_tag_get(skb);
1538         }
1539
1540         first = adapter->tx_ring.next_to_use;
1541
1542         tso = ixgb_tso(adapter, skb);
1543         if (tso < 0) {
1544                 dev_kfree_skb_any(skb);
1545                 return NETDEV_TX_OK;
1546         }
1547
1548         if (likely(tso))
1549                 tx_flags |= IXGB_TX_FLAGS_TSO;
1550         else if (ixgb_tx_csum(adapter, skb))
1551                 tx_flags |= IXGB_TX_FLAGS_CSUM;
1552
1553         count = ixgb_tx_map(adapter, skb, first);
1554
1555         if (count) {
1556                 ixgb_tx_queue(adapter, count, vlan_id, tx_flags);
1557                 /* Make sure there is space in the ring for the next send. */
1558                 ixgb_maybe_stop_tx(netdev, &adapter->tx_ring, DESC_NEEDED);
1559
1560         } else {
1561                 dev_kfree_skb_any(skb);
1562                 adapter->tx_ring.buffer_info[first].time_stamp = 0;
1563                 adapter->tx_ring.next_to_use = first;
1564         }
1565
1566         return NETDEV_TX_OK;
1567 }
1568
1569 /**
1570  * ixgb_tx_timeout - Respond to a Tx Hang
1571  * @netdev: network interface device structure
1572  **/
1573
1574 static void
1575 ixgb_tx_timeout(struct net_device *netdev)
1576 {
1577         struct ixgb_adapter *adapter = netdev_priv(netdev);
1578
1579         /* Do the reset outside of interrupt context */
1580         schedule_work(&adapter->tx_timeout_task);
1581 }
1582
1583 static void
1584 ixgb_tx_timeout_task(struct work_struct *work)
1585 {
1586         struct ixgb_adapter *adapter =
1587                 container_of(work, struct ixgb_adapter, tx_timeout_task);
1588
1589         adapter->tx_timeout_count++;
1590         ixgb_down(adapter, true);
1591         ixgb_up(adapter);
1592 }
1593
1594 /**
1595  * ixgb_get_stats - Get System Network Statistics
1596  * @netdev: network interface device structure
1597  *
1598  * Returns the address of the device statistics structure.
1599  * The statistics are actually updated from the timer callback.
1600  **/
1601
1602 static struct net_device_stats *
1603 ixgb_get_stats(struct net_device *netdev)
1604 {
1605         return &netdev->stats;
1606 }
1607
1608 /**
1609  * ixgb_change_mtu - Change the Maximum Transfer Unit
1610  * @netdev: network interface device structure
1611  * @new_mtu: new value for maximum frame size
1612  *
1613  * Returns 0 on success, negative on failure
1614  **/
1615
1616 static int
1617 ixgb_change_mtu(struct net_device *netdev, int new_mtu)
1618 {
1619         struct ixgb_adapter *adapter = netdev_priv(netdev);
1620         int max_frame = new_mtu + ENET_HEADER_SIZE + ENET_FCS_LENGTH;
1621         int old_max_frame = netdev->mtu + ENET_HEADER_SIZE + ENET_FCS_LENGTH;
1622
1623         /* MTU < 68 is an error for IPv4 traffic, just don't allow it */
1624         if ((new_mtu < 68) ||
1625             (max_frame > IXGB_MAX_JUMBO_FRAME_SIZE + ENET_FCS_LENGTH)) {
1626                 netif_err(adapter, probe, adapter->netdev,
1627                           "Invalid MTU setting %d\n", new_mtu);
1628                 return -EINVAL;
1629         }
1630
1631         if (old_max_frame == max_frame)
1632                 return 0;
1633
1634         if (netif_running(netdev))
1635                 ixgb_down(adapter, true);
1636
1637         adapter->rx_buffer_len = max_frame + 8; /* + 8 for errata */
1638
1639         netdev->mtu = new_mtu;
1640
1641         if (netif_running(netdev))
1642                 ixgb_up(adapter);
1643
1644         return 0;
1645 }
1646
1647 /**
1648  * ixgb_update_stats - Update the board statistics counters.
1649  * @adapter: board private structure
1650  **/
1651
1652 void
1653 ixgb_update_stats(struct ixgb_adapter *adapter)
1654 {
1655         struct net_device *netdev = adapter->netdev;
1656         struct pci_dev *pdev = adapter->pdev;
1657
1658         /* Prevent stats update while adapter is being reset */
1659         if (pci_channel_offline(pdev))
1660                 return;
1661
1662         if ((netdev->flags & IFF_PROMISC) || (netdev->flags & IFF_ALLMULTI) ||
1663            (netdev_mc_count(netdev) > IXGB_MAX_NUM_MULTICAST_ADDRESSES)) {
1664                 u64 multi = IXGB_READ_REG(&adapter->hw, MPRCL);
1665                 u32 bcast_l = IXGB_READ_REG(&adapter->hw, BPRCL);
1666                 u32 bcast_h = IXGB_READ_REG(&adapter->hw, BPRCH);
1667                 u64 bcast = ((u64)bcast_h << 32) | bcast_l;
1668
1669                 multi |= ((u64)IXGB_READ_REG(&adapter->hw, MPRCH) << 32);
1670                 /* fix up multicast stats by removing broadcasts */
1671                 if (multi >= bcast)
1672                         multi -= bcast;
1673
1674                 adapter->stats.mprcl += (multi & 0xFFFFFFFF);
1675                 adapter->stats.mprch += (multi >> 32);
1676                 adapter->stats.bprcl += bcast_l;
1677                 adapter->stats.bprch += bcast_h;
1678         } else {
1679                 adapter->stats.mprcl += IXGB_READ_REG(&adapter->hw, MPRCL);
1680                 adapter->stats.mprch += IXGB_READ_REG(&adapter->hw, MPRCH);
1681                 adapter->stats.bprcl += IXGB_READ_REG(&adapter->hw, BPRCL);
1682                 adapter->stats.bprch += IXGB_READ_REG(&adapter->hw, BPRCH);
1683         }
1684         adapter->stats.tprl += IXGB_READ_REG(&adapter->hw, TPRL);
1685         adapter->stats.tprh += IXGB_READ_REG(&adapter->hw, TPRH);
1686         adapter->stats.gprcl += IXGB_READ_REG(&adapter->hw, GPRCL);
1687         adapter->stats.gprch += IXGB_READ_REG(&adapter->hw, GPRCH);
1688         adapter->stats.uprcl += IXGB_READ_REG(&adapter->hw, UPRCL);
1689         adapter->stats.uprch += IXGB_READ_REG(&adapter->hw, UPRCH);
1690         adapter->stats.vprcl += IXGB_READ_REG(&adapter->hw, VPRCL);
1691         adapter->stats.vprch += IXGB_READ_REG(&adapter->hw, VPRCH);
1692         adapter->stats.jprcl += IXGB_READ_REG(&adapter->hw, JPRCL);
1693         adapter->stats.jprch += IXGB_READ_REG(&adapter->hw, JPRCH);
1694         adapter->stats.gorcl += IXGB_READ_REG(&adapter->hw, GORCL);
1695         adapter->stats.gorch += IXGB_READ_REG(&adapter->hw, GORCH);
1696         adapter->stats.torl += IXGB_READ_REG(&adapter->hw, TORL);
1697         adapter->stats.torh += IXGB_READ_REG(&adapter->hw, TORH);
1698         adapter->stats.rnbc += IXGB_READ_REG(&adapter->hw, RNBC);
1699         adapter->stats.ruc += IXGB_READ_REG(&adapter->hw, RUC);
1700         adapter->stats.roc += IXGB_READ_REG(&adapter->hw, ROC);
1701         adapter->stats.rlec += IXGB_READ_REG(&adapter->hw, RLEC);
1702         adapter->stats.crcerrs += IXGB_READ_REG(&adapter->hw, CRCERRS);
1703         adapter->stats.icbc += IXGB_READ_REG(&adapter->hw, ICBC);
1704         adapter->stats.ecbc += IXGB_READ_REG(&adapter->hw, ECBC);
1705         adapter->stats.mpc += IXGB_READ_REG(&adapter->hw, MPC);
1706         adapter->stats.tptl += IXGB_READ_REG(&adapter->hw, TPTL);
1707         adapter->stats.tpth += IXGB_READ_REG(&adapter->hw, TPTH);
1708         adapter->stats.gptcl += IXGB_READ_REG(&adapter->hw, GPTCL);
1709         adapter->stats.gptch += IXGB_READ_REG(&adapter->hw, GPTCH);
1710         adapter->stats.bptcl += IXGB_READ_REG(&adapter->hw, BPTCL);
1711         adapter->stats.bptch += IXGB_READ_REG(&adapter->hw, BPTCH);
1712         adapter->stats.mptcl += IXGB_READ_REG(&adapter->hw, MPTCL);
1713         adapter->stats.mptch += IXGB_READ_REG(&adapter->hw, MPTCH);
1714         adapter->stats.uptcl += IXGB_READ_REG(&adapter->hw, UPTCL);
1715         adapter->stats.uptch += IXGB_READ_REG(&adapter->hw, UPTCH);
1716         adapter->stats.vptcl += IXGB_READ_REG(&adapter->hw, VPTCL);
1717         adapter->stats.vptch += IXGB_READ_REG(&adapter->hw, VPTCH);
1718         adapter->stats.jptcl += IXGB_READ_REG(&adapter->hw, JPTCL);
1719         adapter->stats.jptch += IXGB_READ_REG(&adapter->hw, JPTCH);
1720         adapter->stats.gotcl += IXGB_READ_REG(&adapter->hw, GOTCL);
1721         adapter->stats.gotch += IXGB_READ_REG(&adapter->hw, GOTCH);
1722         adapter->stats.totl += IXGB_READ_REG(&adapter->hw, TOTL);
1723         adapter->stats.toth += IXGB_READ_REG(&adapter->hw, TOTH);
1724         adapter->stats.dc += IXGB_READ_REG(&adapter->hw, DC);
1725         adapter->stats.plt64c += IXGB_READ_REG(&adapter->hw, PLT64C);
1726         adapter->stats.tsctc += IXGB_READ_REG(&adapter->hw, TSCTC);
1727         adapter->stats.tsctfc += IXGB_READ_REG(&adapter->hw, TSCTFC);
1728         adapter->stats.ibic += IXGB_READ_REG(&adapter->hw, IBIC);
1729         adapter->stats.rfc += IXGB_READ_REG(&adapter->hw, RFC);
1730         adapter->stats.lfc += IXGB_READ_REG(&adapter->hw, LFC);
1731         adapter->stats.pfrc += IXGB_READ_REG(&adapter->hw, PFRC);
1732         adapter->stats.pftc += IXGB_READ_REG(&adapter->hw, PFTC);
1733         adapter->stats.mcfrc += IXGB_READ_REG(&adapter->hw, MCFRC);
1734         adapter->stats.mcftc += IXGB_READ_REG(&adapter->hw, MCFTC);
1735         adapter->stats.xonrxc += IXGB_READ_REG(&adapter->hw, XONRXC);
1736         adapter->stats.xontxc += IXGB_READ_REG(&adapter->hw, XONTXC);
1737         adapter->stats.xoffrxc += IXGB_READ_REG(&adapter->hw, XOFFRXC);
1738         adapter->stats.xofftxc += IXGB_READ_REG(&adapter->hw, XOFFTXC);
1739         adapter->stats.rjc += IXGB_READ_REG(&adapter->hw, RJC);
1740
1741         /* Fill out the OS statistics structure */
1742
1743         netdev->stats.rx_packets = adapter->stats.gprcl;
1744         netdev->stats.tx_packets = adapter->stats.gptcl;
1745         netdev->stats.rx_bytes = adapter->stats.gorcl;
1746         netdev->stats.tx_bytes = adapter->stats.gotcl;
1747         netdev->stats.multicast = adapter->stats.mprcl;
1748         netdev->stats.collisions = 0;
1749
1750         /* ignore RLEC as it reports errors for padded (<64bytes) frames
1751          * with a length in the type/len field */
1752         netdev->stats.rx_errors =
1753             /* adapter->stats.rnbc + */ adapter->stats.crcerrs +
1754             adapter->stats.ruc +
1755             adapter->stats.roc /*+ adapter->stats.rlec */  +
1756             adapter->stats.icbc +
1757             adapter->stats.ecbc + adapter->stats.mpc;
1758
1759         /* see above
1760          * netdev->stats.rx_length_errors = adapter->stats.rlec;
1761          */
1762
1763         netdev->stats.rx_crc_errors = adapter->stats.crcerrs;
1764         netdev->stats.rx_fifo_errors = adapter->stats.mpc;
1765         netdev->stats.rx_missed_errors = adapter->stats.mpc;
1766         netdev->stats.rx_over_errors = adapter->stats.mpc;
1767
1768         netdev->stats.tx_errors = 0;
1769         netdev->stats.rx_frame_errors = 0;
1770         netdev->stats.tx_aborted_errors = 0;
1771         netdev->stats.tx_carrier_errors = 0;
1772         netdev->stats.tx_fifo_errors = 0;
1773         netdev->stats.tx_heartbeat_errors = 0;
1774         netdev->stats.tx_window_errors = 0;
1775 }
1776
1777 #define IXGB_MAX_INTR 10
1778 /**
1779  * ixgb_intr - Interrupt Handler
1780  * @irq: interrupt number
1781  * @data: pointer to a network interface device structure
1782  **/
1783
1784 static irqreturn_t
1785 ixgb_intr(int irq, void *data)
1786 {
1787         struct net_device *netdev = data;
1788         struct ixgb_adapter *adapter = netdev_priv(netdev);
1789         struct ixgb_hw *hw = &adapter->hw;
1790         u32 icr = IXGB_READ_REG(hw, ICR);
1791
1792         if (unlikely(!icr))
1793                 return IRQ_NONE;  /* Not our interrupt */
1794
1795         if (unlikely(icr & (IXGB_INT_RXSEQ | IXGB_INT_LSC)))
1796                 if (!test_bit(__IXGB_DOWN, &adapter->flags))
1797                         mod_timer(&adapter->watchdog_timer, jiffies);
1798
1799         if (napi_schedule_prep(&adapter->napi)) {
1800
1801                 /* Disable interrupts and register for poll. The flush
1802                   of the posted write is intentionally left out.
1803                 */
1804
1805                 IXGB_WRITE_REG(&adapter->hw, IMC, ~0);
1806                 __napi_schedule(&adapter->napi);
1807         }
1808         return IRQ_HANDLED;
1809 }
1810
1811 /**
1812  * ixgb_clean - NAPI Rx polling callback
1813  * @adapter: board private structure
1814  **/
1815
1816 static int
1817 ixgb_clean(struct napi_struct *napi, int budget)
1818 {
1819         struct ixgb_adapter *adapter = container_of(napi, struct ixgb_adapter, napi);
1820         int work_done = 0;
1821
1822         ixgb_clean_tx_irq(adapter);
1823         ixgb_clean_rx_irq(adapter, &work_done, budget);
1824
1825         /* If budget not fully consumed, exit the polling mode */
1826         if (work_done < budget) {
1827                 napi_complete(napi);
1828                 if (!test_bit(__IXGB_DOWN, &adapter->flags))
1829                         ixgb_irq_enable(adapter);
1830         }
1831
1832         return work_done;
1833 }
1834
1835 /**
1836  * ixgb_clean_tx_irq - Reclaim resources after transmit completes
1837  * @adapter: board private structure
1838  **/
1839
1840 static bool
1841 ixgb_clean_tx_irq(struct ixgb_adapter *adapter)
1842 {
1843         struct ixgb_desc_ring *tx_ring = &adapter->tx_ring;
1844         struct net_device *netdev = adapter->netdev;
1845         struct ixgb_tx_desc *tx_desc, *eop_desc;
1846         struct ixgb_buffer *buffer_info;
1847         unsigned int i, eop;
1848         bool cleaned = false;
1849
1850         i = tx_ring->next_to_clean;
1851         eop = tx_ring->buffer_info[i].next_to_watch;
1852         eop_desc = IXGB_TX_DESC(*tx_ring, eop);
1853
1854         while (eop_desc->status & IXGB_TX_DESC_STATUS_DD) {
1855
1856                 rmb(); /* read buffer_info after eop_desc */
1857                 for (cleaned = false; !cleaned; ) {
1858                         tx_desc = IXGB_TX_DESC(*tx_ring, i);
1859                         buffer_info = &tx_ring->buffer_info[i];
1860
1861                         if (tx_desc->popts &
1862                            (IXGB_TX_DESC_POPTS_TXSM |
1863                             IXGB_TX_DESC_POPTS_IXSM))
1864                                 adapter->hw_csum_tx_good++;
1865
1866                         ixgb_unmap_and_free_tx_resource(adapter, buffer_info);
1867
1868                         *(u32 *)&(tx_desc->status) = 0;
1869
1870                         cleaned = (i == eop);
1871                         if (++i == tx_ring->count) i = 0;
1872                 }
1873
1874                 eop = tx_ring->buffer_info[i].next_to_watch;
1875                 eop_desc = IXGB_TX_DESC(*tx_ring, eop);
1876         }
1877
1878         tx_ring->next_to_clean = i;
1879
1880         if (unlikely(cleaned && netif_carrier_ok(netdev) &&
1881                      IXGB_DESC_UNUSED(tx_ring) >= DESC_NEEDED)) {
1882                 /* Make sure that anybody stopping the queue after this
1883                  * sees the new next_to_clean. */
1884                 smp_mb();
1885
1886                 if (netif_queue_stopped(netdev) &&
1887                     !(test_bit(__IXGB_DOWN, &adapter->flags))) {
1888                         netif_wake_queue(netdev);
1889                         ++adapter->restart_queue;
1890                 }
1891         }
1892
1893         if (adapter->detect_tx_hung) {
1894                 /* detect a transmit hang in hardware, this serializes the
1895                  * check with the clearing of time_stamp and movement of i */
1896                 adapter->detect_tx_hung = false;
1897                 if (tx_ring->buffer_info[eop].time_stamp &&
1898                    time_after(jiffies, tx_ring->buffer_info[eop].time_stamp + HZ)
1899                    && !(IXGB_READ_REG(&adapter->hw, STATUS) &
1900                         IXGB_STATUS_TXOFF)) {
1901                         /* detected Tx unit hang */
1902                         netif_err(adapter, drv, adapter->netdev,
1903                                   "Detected Tx Unit Hang\n"
1904                                   "  TDH                  <%x>\n"
1905                                   "  TDT                  <%x>\n"
1906                                   "  next_to_use          <%x>\n"
1907                                   "  next_to_clean        <%x>\n"
1908                                   "buffer_info[next_to_clean]\n"
1909                                   "  time_stamp           <%lx>\n"
1910                                   "  next_to_watch        <%x>\n"
1911                                   "  jiffies              <%lx>\n"
1912                                   "  next_to_watch.status <%x>\n",
1913                                   IXGB_READ_REG(&adapter->hw, TDH),
1914                                   IXGB_READ_REG(&adapter->hw, TDT),
1915                                   tx_ring->next_to_use,
1916                                   tx_ring->next_to_clean,
1917                                   tx_ring->buffer_info[eop].time_stamp,
1918                                   eop,
1919                                   jiffies,
1920                                   eop_desc->status);
1921                         netif_stop_queue(netdev);
1922                 }
1923         }
1924
1925         return cleaned;
1926 }
1927
1928 /**
1929  * ixgb_rx_checksum - Receive Checksum Offload for 82597.
1930  * @adapter: board private structure
1931  * @rx_desc: receive descriptor
1932  * @sk_buff: socket buffer with received data
1933  **/
1934
1935 static void
1936 ixgb_rx_checksum(struct ixgb_adapter *adapter,
1937                  struct ixgb_rx_desc *rx_desc,
1938                  struct sk_buff *skb)
1939 {
1940         /* Ignore Checksum bit is set OR
1941          * TCP Checksum has not been calculated
1942          */
1943         if ((rx_desc->status & IXGB_RX_DESC_STATUS_IXSM) ||
1944            (!(rx_desc->status & IXGB_RX_DESC_STATUS_TCPCS))) {
1945                 skb_checksum_none_assert(skb);
1946                 return;
1947         }
1948
1949         /* At this point we know the hardware did the TCP checksum */
1950         /* now look at the TCP checksum error bit */
1951         if (rx_desc->errors & IXGB_RX_DESC_ERRORS_TCPE) {
1952                 /* let the stack verify checksum errors */
1953                 skb_checksum_none_assert(skb);
1954                 adapter->hw_csum_rx_error++;
1955         } else {
1956                 /* TCP checksum is good */
1957                 skb->ip_summed = CHECKSUM_UNNECESSARY;
1958                 adapter->hw_csum_rx_good++;
1959         }
1960 }
1961
1962 /*
1963  * this should improve performance for small packets with large amounts
1964  * of reassembly being done in the stack
1965  */
1966 static void ixgb_check_copybreak(struct net_device *netdev,
1967                                  struct ixgb_buffer *buffer_info,
1968                                  u32 length, struct sk_buff **skb)
1969 {
1970         struct sk_buff *new_skb;
1971
1972         if (length > copybreak)
1973                 return;
1974
1975         new_skb = netdev_alloc_skb_ip_align(netdev, length);
1976         if (!new_skb)
1977                 return;
1978
1979         skb_copy_to_linear_data_offset(new_skb, -NET_IP_ALIGN,
1980                                        (*skb)->data - NET_IP_ALIGN,
1981                                        length + NET_IP_ALIGN);
1982         /* save the skb in buffer_info as good */
1983         buffer_info->skb = *skb;
1984         *skb = new_skb;
1985 }
1986
1987 /**
1988  * ixgb_clean_rx_irq - Send received data up the network stack,
1989  * @adapter: board private structure
1990  **/
1991
1992 static bool
1993 ixgb_clean_rx_irq(struct ixgb_adapter *adapter, int *work_done, int work_to_do)
1994 {
1995         struct ixgb_desc_ring *rx_ring = &adapter->rx_ring;
1996         struct net_device *netdev = adapter->netdev;
1997         struct pci_dev *pdev = adapter->pdev;
1998         struct ixgb_rx_desc *rx_desc, *next_rxd;
1999         struct ixgb_buffer *buffer_info, *next_buffer, *next2_buffer;
2000         u32 length;
2001         unsigned int i, j;
2002         int cleaned_count = 0;
2003         bool cleaned = false;
2004
2005         i = rx_ring->next_to_clean;
2006         rx_desc = IXGB_RX_DESC(*rx_ring, i);
2007         buffer_info = &rx_ring->buffer_info[i];
2008
2009         while (rx_desc->status & IXGB_RX_DESC_STATUS_DD) {
2010                 struct sk_buff *skb;
2011                 u8 status;
2012
2013                 if (*work_done >= work_to_do)
2014                         break;
2015
2016                 (*work_done)++;
2017                 rmb();  /* read descriptor and rx_buffer_info after status DD */
2018                 status = rx_desc->status;
2019                 skb = buffer_info->skb;
2020                 buffer_info->skb = NULL;
2021
2022                 prefetch(skb->data - NET_IP_ALIGN);
2023
2024                 if (++i == rx_ring->count)
2025                         i = 0;
2026                 next_rxd = IXGB_RX_DESC(*rx_ring, i);
2027                 prefetch(next_rxd);
2028
2029                 j = i + 1;
2030                 if (j == rx_ring->count)
2031                         j = 0;
2032                 next2_buffer = &rx_ring->buffer_info[j];
2033                 prefetch(next2_buffer);
2034
2035                 next_buffer = &rx_ring->buffer_info[i];
2036
2037                 cleaned = true;
2038                 cleaned_count++;
2039
2040                 dma_unmap_single(&pdev->dev,
2041                                  buffer_info->dma,
2042                                  buffer_info->length,
2043                                  DMA_FROM_DEVICE);
2044                 buffer_info->dma = 0;
2045
2046                 length = le16_to_cpu(rx_desc->length);
2047                 rx_desc->length = 0;
2048
2049                 if (unlikely(!(status & IXGB_RX_DESC_STATUS_EOP))) {
2050
2051                         /* All receives must fit into a single buffer */
2052
2053                         pr_debug("Receive packet consumed multiple buffers length<%x>\n",
2054                                  length);
2055
2056                         dev_kfree_skb_irq(skb);
2057                         goto rxdesc_done;
2058                 }
2059
2060                 if (unlikely(rx_desc->errors &
2061                     (IXGB_RX_DESC_ERRORS_CE | IXGB_RX_DESC_ERRORS_SE |
2062                      IXGB_RX_DESC_ERRORS_P | IXGB_RX_DESC_ERRORS_RXE))) {
2063                         dev_kfree_skb_irq(skb);
2064                         goto rxdesc_done;
2065                 }
2066
2067                 ixgb_check_copybreak(netdev, buffer_info, length, &skb);
2068
2069                 /* Good Receive */
2070                 skb_put(skb, length);
2071
2072                 /* Receive Checksum Offload */
2073                 ixgb_rx_checksum(adapter, rx_desc, skb);
2074
2075                 skb->protocol = eth_type_trans(skb, netdev);
2076                 if (status & IXGB_RX_DESC_STATUS_VP)
2077                         __vlan_hwaccel_put_tag(skb, htons(ETH_P_8021Q),
2078                                        le16_to_cpu(rx_desc->special));
2079
2080                 netif_receive_skb(skb);
2081
2082 rxdesc_done:
2083                 /* clean up descriptor, might be written over by hw */
2084                 rx_desc->status = 0;
2085
2086                 /* return some buffers to hardware, one at a time is too slow */
2087                 if (unlikely(cleaned_count >= IXGB_RX_BUFFER_WRITE)) {
2088                         ixgb_alloc_rx_buffers(adapter, cleaned_count);
2089                         cleaned_count = 0;
2090                 }
2091
2092                 /* use prefetched values */
2093                 rx_desc = next_rxd;
2094                 buffer_info = next_buffer;
2095         }
2096
2097         rx_ring->next_to_clean = i;
2098
2099         cleaned_count = IXGB_DESC_UNUSED(rx_ring);
2100         if (cleaned_count)
2101                 ixgb_alloc_rx_buffers(adapter, cleaned_count);
2102
2103         return cleaned;
2104 }
2105
2106 /**
2107  * ixgb_alloc_rx_buffers - Replace used receive buffers
2108  * @adapter: address of board private structure
2109  **/
2110
2111 static void
2112 ixgb_alloc_rx_buffers(struct ixgb_adapter *adapter, int cleaned_count)
2113 {
2114         struct ixgb_desc_ring *rx_ring = &adapter->rx_ring;
2115         struct net_device *netdev = adapter->netdev;
2116         struct pci_dev *pdev = adapter->pdev;
2117         struct ixgb_rx_desc *rx_desc;
2118         struct ixgb_buffer *buffer_info;
2119         struct sk_buff *skb;
2120         unsigned int i;
2121         long cleancount;
2122
2123         i = rx_ring->next_to_use;
2124         buffer_info = &rx_ring->buffer_info[i];
2125         cleancount = IXGB_DESC_UNUSED(rx_ring);
2126
2127
2128         /* leave three descriptors unused */
2129         while (--cleancount > 2 && cleaned_count--) {
2130                 /* recycle! its good for you */
2131                 skb = buffer_info->skb;
2132                 if (skb) {
2133                         skb_trim(skb, 0);
2134                         goto map_skb;
2135                 }
2136
2137                 skb = netdev_alloc_skb_ip_align(netdev, adapter->rx_buffer_len);
2138                 if (unlikely(!skb)) {
2139                         /* Better luck next round */
2140                         adapter->alloc_rx_buff_failed++;
2141                         break;
2142                 }
2143
2144                 buffer_info->skb = skb;
2145                 buffer_info->length = adapter->rx_buffer_len;
2146 map_skb:
2147                 buffer_info->dma = dma_map_single(&pdev->dev,
2148                                                   skb->data,
2149                                                   adapter->rx_buffer_len,
2150                                                   DMA_FROM_DEVICE);
2151                 if (dma_mapping_error(&pdev->dev, buffer_info->dma)) {
2152                         adapter->alloc_rx_buff_failed++;
2153                         break;
2154                 }
2155
2156                 rx_desc = IXGB_RX_DESC(*rx_ring, i);
2157                 rx_desc->buff_addr = cpu_to_le64(buffer_info->dma);
2158                 /* guarantee DD bit not set now before h/w gets descriptor
2159                  * this is the rest of the workaround for h/w double
2160                  * writeback. */
2161                 rx_desc->status = 0;
2162
2163
2164                 if (++i == rx_ring->count)
2165                         i = 0;
2166                 buffer_info = &rx_ring->buffer_info[i];
2167         }
2168
2169         if (likely(rx_ring->next_to_use != i)) {
2170                 rx_ring->next_to_use = i;
2171                 if (unlikely(i-- == 0))
2172                         i = (rx_ring->count - 1);
2173
2174                 /* Force memory writes to complete before letting h/w
2175                  * know there are new descriptors to fetch.  (Only
2176                  * applicable for weak-ordered memory model archs, such
2177                  * as IA-64). */
2178                 wmb();
2179                 IXGB_WRITE_REG(&adapter->hw, RDT, i);
2180         }
2181 }
2182
2183 static void
2184 ixgb_vlan_strip_enable(struct ixgb_adapter *adapter)
2185 {
2186         u32 ctrl;
2187
2188         /* enable VLAN tag insert/strip */
2189         ctrl = IXGB_READ_REG(&adapter->hw, CTRL0);
2190         ctrl |= IXGB_CTRL0_VME;
2191         IXGB_WRITE_REG(&adapter->hw, CTRL0, ctrl);
2192 }
2193
2194 static void
2195 ixgb_vlan_strip_disable(struct ixgb_adapter *adapter)
2196 {
2197         u32 ctrl;
2198
2199         /* disable VLAN tag insert/strip */
2200         ctrl = IXGB_READ_REG(&adapter->hw, CTRL0);
2201         ctrl &= ~IXGB_CTRL0_VME;
2202         IXGB_WRITE_REG(&adapter->hw, CTRL0, ctrl);
2203 }
2204
2205 static int
2206 ixgb_vlan_rx_add_vid(struct net_device *netdev, __be16 proto, u16 vid)
2207 {
2208         struct ixgb_adapter *adapter = netdev_priv(netdev);
2209         u32 vfta, index;
2210
2211         /* add VID to filter table */
2212
2213         index = (vid >> 5) & 0x7F;
2214         vfta = IXGB_READ_REG_ARRAY(&adapter->hw, VFTA, index);
2215         vfta |= (1 << (vid & 0x1F));
2216         ixgb_write_vfta(&adapter->hw, index, vfta);
2217         set_bit(vid, adapter->active_vlans);
2218
2219         return 0;
2220 }
2221
2222 static int
2223 ixgb_vlan_rx_kill_vid(struct net_device *netdev, __be16 proto, u16 vid)
2224 {
2225         struct ixgb_adapter *adapter = netdev_priv(netdev);
2226         u32 vfta, index;
2227
2228         /* remove VID from filter table */
2229
2230         index = (vid >> 5) & 0x7F;
2231         vfta = IXGB_READ_REG_ARRAY(&adapter->hw, VFTA, index);
2232         vfta &= ~(1 << (vid & 0x1F));
2233         ixgb_write_vfta(&adapter->hw, index, vfta);
2234         clear_bit(vid, adapter->active_vlans);
2235
2236         return 0;
2237 }
2238
2239 static void
2240 ixgb_restore_vlan(struct ixgb_adapter *adapter)
2241 {
2242         u16 vid;
2243
2244         for_each_set_bit(vid, adapter->active_vlans, VLAN_N_VID)
2245                 ixgb_vlan_rx_add_vid(adapter->netdev, htons(ETH_P_8021Q), vid);
2246 }
2247
2248 #ifdef CONFIG_NET_POLL_CONTROLLER
2249 /*
2250  * Polling 'interrupt' - used by things like netconsole to send skbs
2251  * without having to re-enable interrupts. It's not called while
2252  * the interrupt routine is executing.
2253  */
2254
2255 static void ixgb_netpoll(struct net_device *dev)
2256 {
2257         struct ixgb_adapter *adapter = netdev_priv(dev);
2258
2259         disable_irq(adapter->pdev->irq);
2260         ixgb_intr(adapter->pdev->irq, dev);
2261         enable_irq(adapter->pdev->irq);
2262 }
2263 #endif
2264
2265 /**
2266  * ixgb_io_error_detected - called when PCI error is detected
2267  * @pdev:    pointer to pci device with error
2268  * @state:   pci channel state after error
2269  *
2270  * This callback is called by the PCI subsystem whenever
2271  * a PCI bus error is detected.
2272  */
2273 static pci_ers_result_t ixgb_io_error_detected(struct pci_dev *pdev,
2274                                                enum pci_channel_state state)
2275 {
2276         struct net_device *netdev = pci_get_drvdata(pdev);
2277         struct ixgb_adapter *adapter = netdev_priv(netdev);
2278
2279         netif_device_detach(netdev);
2280
2281         if (state == pci_channel_io_perm_failure)
2282                 return PCI_ERS_RESULT_DISCONNECT;
2283
2284         if (netif_running(netdev))
2285                 ixgb_down(adapter, true);
2286
2287         pci_disable_device(pdev);
2288
2289         /* Request a slot reset. */
2290         return PCI_ERS_RESULT_NEED_RESET;
2291 }
2292
2293 /**
2294  * ixgb_io_slot_reset - called after the pci bus has been reset.
2295  * @pdev    pointer to pci device with error
2296  *
2297  * This callback is called after the PCI bus has been reset.
2298  * Basically, this tries to restart the card from scratch.
2299  * This is a shortened version of the device probe/discovery code,
2300  * it resembles the first-half of the ixgb_probe() routine.
2301  */
2302 static pci_ers_result_t ixgb_io_slot_reset(struct pci_dev *pdev)
2303 {
2304         struct net_device *netdev = pci_get_drvdata(pdev);
2305         struct ixgb_adapter *adapter = netdev_priv(netdev);
2306
2307         if (pci_enable_device(pdev)) {
2308                 netif_err(adapter, probe, adapter->netdev,
2309                           "Cannot re-enable PCI device after reset\n");
2310                 return PCI_ERS_RESULT_DISCONNECT;
2311         }
2312
2313         /* Perform card reset only on one instance of the card */
2314         if (0 != PCI_FUNC (pdev->devfn))
2315                 return PCI_ERS_RESULT_RECOVERED;
2316
2317         pci_set_master(pdev);
2318
2319         netif_carrier_off(netdev);
2320         netif_stop_queue(netdev);
2321         ixgb_reset(adapter);
2322
2323         /* Make sure the EEPROM is good */
2324         if (!ixgb_validate_eeprom_checksum(&adapter->hw)) {
2325                 netif_err(adapter, probe, adapter->netdev,
2326                           "After reset, the EEPROM checksum is not valid\n");
2327                 return PCI_ERS_RESULT_DISCONNECT;
2328         }
2329         ixgb_get_ee_mac_addr(&adapter->hw, netdev->dev_addr);
2330         memcpy(netdev->perm_addr, netdev->dev_addr, netdev->addr_len);
2331
2332         if (!is_valid_ether_addr(netdev->perm_addr)) {
2333                 netif_err(adapter, probe, adapter->netdev,
2334                           "After reset, invalid MAC address\n");
2335                 return PCI_ERS_RESULT_DISCONNECT;
2336         }
2337
2338         return PCI_ERS_RESULT_RECOVERED;
2339 }
2340
2341 /**
2342  * ixgb_io_resume - called when its OK to resume normal operations
2343  * @pdev    pointer to pci device with error
2344  *
2345  * The error recovery driver tells us that its OK to resume
2346  * normal operation. Implementation resembles the second-half
2347  * of the ixgb_probe() routine.
2348  */
2349 static void ixgb_io_resume(struct pci_dev *pdev)
2350 {
2351         struct net_device *netdev = pci_get_drvdata(pdev);
2352         struct ixgb_adapter *adapter = netdev_priv(netdev);
2353
2354         pci_set_master(pdev);
2355
2356         if (netif_running(netdev)) {
2357                 if (ixgb_up(adapter)) {
2358                         pr_err("can't bring device back up after reset\n");
2359                         return;
2360                 }
2361         }
2362
2363         netif_device_attach(netdev);
2364         mod_timer(&adapter->watchdog_timer, jiffies);
2365 }
2366
2367 /* ixgb_main.c */