err.no Git - linux-2.6/blob - drivers/net/ixgb/ixgb_main.c
ixgb: fix race on rx_buffer_len in mtu change
[linux-2.6] / drivers / net / ixgb / ixgb_main.c
1 /*******************************************************************************
2
3   Intel PRO/10GbE Linux driver
4   Copyright(c) 1999 - 2006 Intel Corporation.
5
6   This program is free software; you can redistribute it and/or modify it
7   under the terms and conditions of the GNU General Public License,
8   version 2, as published by the Free Software Foundation.
9
10   This program is distributed in the hope it will be useful, but WITHOUT
11   ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
12   FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
13   more details.
14
15   You should have received a copy of the GNU General Public License along with
16   this program; if not, write to the Free Software Foundation, Inc.,
17   51 Franklin St - Fifth Floor, Boston, MA 02110-1301 USA.
18
19   The full GNU General Public License is included in this distribution in
20   the file called "COPYING".
21
22   Contact Information:
23   Linux NICS <linux.nics@intel.com>
24   e1000-devel Mailing List <e1000-devel@lists.sourceforge.net>
25   Intel Corporation, 5200 N.E. Elam Young Parkway, Hillsboro, OR 97124-6497
26
27 *******************************************************************************/
28
29 #include "ixgb.h"
30
/* Short driver name; used below as the pci_driver name and as the owner
 * string passed to pci_request_regions() */
char ixgb_driver_name[] = "ixgb";
/* Human-readable description printed in the load banner */
static char ixgb_driver_string[] = "Intel(R) PRO/10GbE Network Driver";

/* DRIVERNAPI is pasted onto the version string: "-NAPI" when the driver is
 * built with CONFIG_IXGB_NAPI, empty otherwise */
#ifndef CONFIG_IXGB_NAPI
#define DRIVERNAPI
#else
#define DRIVERNAPI "-NAPI"
#endif
#define DRV_VERSION             "1.0.126-k4"DRIVERNAPI
/* Version string; also exported through MODULE_VERSION() */
const char ixgb_driver_version[] = DRV_VERSION;
static const char ixgb_copyright[] = "Copyright (c) 1999-2006 Intel Corporation.";
42
/* ixgb_pci_tbl - PCI Device ID Table
 *
 * Lists the four 82597EX device IDs this driver binds to.  Every entry
 * matches any subsystem vendor/device (PCI_ANY_ID) and sets no class
 * filter or private data.
 *
 * Wildcard entries (PCI_ANY_ID) should come last
 * Last entry must be all 0s
 *
 * { Vendor ID, Device ID, SubVendor ID, SubDevice ID,
 *   Class, Class Mask, private data (not used) }
 */
static struct pci_device_id ixgb_pci_tbl[] = {
        {INTEL_VENDOR_ID, IXGB_DEVICE_ID_82597EX,
         PCI_ANY_ID, PCI_ANY_ID, 0, 0, 0},
        {INTEL_VENDOR_ID, IXGB_DEVICE_ID_82597EX_CX4,
         PCI_ANY_ID, PCI_ANY_ID, 0, 0, 0},
        {INTEL_VENDOR_ID, IXGB_DEVICE_ID_82597EX_SR,
         PCI_ANY_ID, PCI_ANY_ID, 0, 0, 0},
        {INTEL_VENDOR_ID, IXGB_DEVICE_ID_82597EX_LR,
         PCI_ANY_ID, PCI_ANY_ID, 0, 0, 0},

        /* required last entry */
        {0,}
};

/* Publish the ID table in the module image */
MODULE_DEVICE_TABLE(pci, ixgb_pci_tbl);
66
/* Local Function Prototypes */

/* Non-static entry points.
 * NOTE(review): presumably also called from other ixgb source files
 * (e.g. ethtool support) - confirm against ixgb.h */
int ixgb_up(struct ixgb_adapter *adapter);
void ixgb_down(struct ixgb_adapter *adapter, bool kill_watchdog);
void ixgb_reset(struct ixgb_adapter *adapter);
int ixgb_setup_tx_resources(struct ixgb_adapter *adapter);
int ixgb_setup_rx_resources(struct ixgb_adapter *adapter);
void ixgb_free_tx_resources(struct ixgb_adapter *adapter);
void ixgb_free_rx_resources(struct ixgb_adapter *adapter);
void ixgb_update_stats(struct ixgb_adapter *adapter);

/* Module, PCI and net_device callbacks private to this file */
static int ixgb_init_module(void);
static void ixgb_exit_module(void);
static int ixgb_probe(struct pci_dev *pdev, const struct pci_device_id *ent);
static void __devexit ixgb_remove(struct pci_dev *pdev);
static int ixgb_sw_init(struct ixgb_adapter *adapter);
static int ixgb_open(struct net_device *netdev);
static int ixgb_close(struct net_device *netdev);
static void ixgb_configure_tx(struct ixgb_adapter *adapter);
static void ixgb_configure_rx(struct ixgb_adapter *adapter);
static void ixgb_setup_rctl(struct ixgb_adapter *adapter);
static void ixgb_clean_tx_ring(struct ixgb_adapter *adapter);
static void ixgb_clean_rx_ring(struct ixgb_adapter *adapter);
static void ixgb_set_multi(struct net_device *netdev);
static void ixgb_watchdog(unsigned long data);
static int ixgb_xmit_frame(struct sk_buff *skb, struct net_device *netdev);
static struct net_device_stats *ixgb_get_stats(struct net_device *netdev);
static int ixgb_change_mtu(struct net_device *netdev, int new_mtu);
static int ixgb_set_mac(struct net_device *netdev, void *p);
static irqreturn_t ixgb_intr(int irq, void *data);
static bool ixgb_clean_tx_irq(struct ixgb_adapter *adapter);

/* The Rx clean routine takes a work budget only in the NAPI build */
#ifdef CONFIG_IXGB_NAPI
static int ixgb_clean(struct napi_struct *napi, int budget);
static bool ixgb_clean_rx_irq(struct ixgb_adapter *adapter,
                              int *work_done, int work_to_do);
#else
static bool ixgb_clean_rx_irq(struct ixgb_adapter *adapter);
#endif
static void ixgb_alloc_rx_buffers(struct ixgb_adapter *adapter);
static void ixgb_tx_timeout(struct net_device *dev);
static void ixgb_tx_timeout_task(struct work_struct *work);
static void ixgb_vlan_rx_register(struct net_device *netdev,
                                  struct vlan_group *grp);
static void ixgb_vlan_rx_add_vid(struct net_device *netdev, u16 vid);
static void ixgb_vlan_rx_kill_vid(struct net_device *netdev, u16 vid);
static void ixgb_restore_vlan(struct ixgb_adapter *adapter);

#ifdef CONFIG_NET_POLL_CONTROLLER
/* for netdump / net console */
static void ixgb_netpoll(struct net_device *dev);
#endif

/* PCI error recovery callbacks, wired into ixgb_err_handler below */
static pci_ers_result_t ixgb_io_error_detected (struct pci_dev *pdev,
                             enum pci_channel_state state);
static pci_ers_result_t ixgb_io_slot_reset (struct pci_dev *pdev);
static void ixgb_io_resume (struct pci_dev *pdev);
124
/* PCI error recovery hooks handed to the PCI core through ixgb_driver */
static struct pci_error_handlers ixgb_err_handler = {
        .error_detected = ixgb_io_error_detected,
        .slot_reset = ixgb_io_slot_reset,
        .resume = ixgb_io_resume,
};

/* PCI driver description registered in ixgb_init_module() and
 * unregistered in ixgb_exit_module() */
static struct pci_driver ixgb_driver = {
        .name     = ixgb_driver_name,
        .id_table = ixgb_pci_tbl,
        .probe    = ixgb_probe,
        .remove   = __devexit_p(ixgb_remove),
        .err_handler = &ixgb_err_handler
};

MODULE_AUTHOR("Intel Corporation, <linux.nics@intel.com>");
MODULE_DESCRIPTION("Intel(R) PRO/10GbE Network Driver");
MODULE_LICENSE("GPL");
MODULE_VERSION(DRV_VERSION);

/* "debug" module parameter.  ixgb_probe() passes both the parameter and
 * DEFAULT_DEBUG_LEVEL_SHIFT to netif_msg_init() to build msg_enable. */
#define DEFAULT_DEBUG_LEVEL_SHIFT 3
static int debug = DEFAULT_DEBUG_LEVEL_SHIFT;
module_param(debug, int, 0);
MODULE_PARM_DESC(debug, "Debug level (0=none,...,16=all)");
148
149 /**
150  * ixgb_init_module - Driver Registration Routine
151  *
152  * ixgb_init_module is the first routine called when the driver is
153  * loaded. All it does is register with the PCI subsystem.
154  **/
155
156 static int __init
157 ixgb_init_module(void)
158 {
159         printk(KERN_INFO "%s - version %s\n",
160                ixgb_driver_string, ixgb_driver_version);
161
162         printk(KERN_INFO "%s\n", ixgb_copyright);
163
164         return pci_register_driver(&ixgb_driver);
165 }
166
167 module_init(ixgb_init_module);
168
169 /**
170  * ixgb_exit_module - Driver Exit Cleanup Routine
171  *
172  * ixgb_exit_module is called just before the driver is removed
173  * from memory.
174  **/
175
176 static void __exit
177 ixgb_exit_module(void)
178 {
179         pci_unregister_driver(&ixgb_driver);
180 }
181
182 module_exit(ixgb_exit_module);
183
184 /**
185  * ixgb_irq_disable - Mask off interrupt generation on the NIC
186  * @adapter: board private structure
187  **/
188
189 static void
190 ixgb_irq_disable(struct ixgb_adapter *adapter)
191 {
192         IXGB_WRITE_REG(&adapter->hw, IMC, ~0);
193         IXGB_WRITE_FLUSH(&adapter->hw);
194         synchronize_irq(adapter->pdev->irq);
195 }
196
197 /**
198  * ixgb_irq_enable - Enable default interrupt generation settings
199  * @adapter: board private structure
200  **/
201
202 static void
203 ixgb_irq_enable(struct ixgb_adapter *adapter)
204 {
205         u32 val = IXGB_INT_RXT0 | IXGB_INT_RXDMT0 |
206                   IXGB_INT_TXDW | IXGB_INT_LSC;
207         if (adapter->hw.subsystem_vendor_id == SUN_SUBVENDOR_ID)
208                 val |= IXGB_INT_GPI0;
209         IXGB_WRITE_REG(&adapter->hw, IMS, val);
210         IXGB_WRITE_FLUSH(&adapter->hw);
211 }
212
213 int
214 ixgb_up(struct ixgb_adapter *adapter)
215 {
216         struct net_device *netdev = adapter->netdev;
217         int err, irq_flags = IRQF_SHARED;
218         int max_frame = netdev->mtu + ENET_HEADER_SIZE + ENET_FCS_LENGTH;
219         struct ixgb_hw *hw = &adapter->hw;
220
221         /* hardware has been reset, we need to reload some things */
222
223         ixgb_rar_set(hw, netdev->dev_addr, 0);
224         ixgb_set_multi(netdev);
225
226         ixgb_restore_vlan(adapter);
227
228         ixgb_configure_tx(adapter);
229         ixgb_setup_rctl(adapter);
230         ixgb_configure_rx(adapter);
231         ixgb_alloc_rx_buffers(adapter);
232
233         /* disable interrupts and get the hardware into a known state */
234         IXGB_WRITE_REG(&adapter->hw, IMC, 0xffffffff);
235
236         /* only enable MSI if bus is in PCI-X mode */
237         if (IXGB_READ_REG(&adapter->hw, STATUS) & IXGB_STATUS_PCIX_MODE) {
238                 err = pci_enable_msi(adapter->pdev);
239                 if (!err) {
240                         adapter->have_msi = 1;
241                         irq_flags = 0;
242                 }
243                 /* proceed to try to request regular interrupt */
244         }
245
246         err = request_irq(adapter->pdev->irq, &ixgb_intr, irq_flags,
247                           netdev->name, netdev);
248         if (err) {
249                 if (adapter->have_msi)
250                         pci_disable_msi(adapter->pdev);
251                 DPRINTK(PROBE, ERR,
252                  "Unable to allocate interrupt Error: %d\n", err);
253                 return err;
254         }
255
256         if((hw->max_frame_size != max_frame) ||
257                 (hw->max_frame_size !=
258                 (IXGB_READ_REG(hw, MFS) >> IXGB_MFS_SHIFT))) {
259
260                 hw->max_frame_size = max_frame;
261
262                 IXGB_WRITE_REG(hw, MFS, hw->max_frame_size << IXGB_MFS_SHIFT);
263
264                 if(hw->max_frame_size >
265                    IXGB_MAX_ENET_FRAME_SIZE_WITHOUT_FCS + ENET_FCS_LENGTH) {
266                         u32 ctrl0 = IXGB_READ_REG(hw, CTRL0);
267
268                         if(!(ctrl0 & IXGB_CTRL0_JFE)) {
269                                 ctrl0 |= IXGB_CTRL0_JFE;
270                                 IXGB_WRITE_REG(hw, CTRL0, ctrl0);
271                         }
272                 }
273         }
274
275         clear_bit(__IXGB_DOWN, &adapter->flags);
276
277 #ifdef CONFIG_IXGB_NAPI
278         napi_enable(&adapter->napi);
279 #endif
280         ixgb_irq_enable(adapter);
281
282         mod_timer(&adapter->watchdog_timer, jiffies);
283
284         return 0;
285 }
286
287 void
288 ixgb_down(struct ixgb_adapter *adapter, bool kill_watchdog)
289 {
290         struct net_device *netdev = adapter->netdev;
291
292         /* prevent the interrupt handler from restarting watchdog */
293         set_bit(__IXGB_DOWN, &adapter->flags);
294
295 #ifdef CONFIG_IXGB_NAPI
296         napi_disable(&adapter->napi);
297 #endif
298         /* waiting for NAPI to complete can re-enable interrupts */
299         ixgb_irq_disable(adapter);
300         free_irq(adapter->pdev->irq, netdev);
301
302         if (adapter->have_msi)
303                 pci_disable_msi(adapter->pdev);
304
305         if(kill_watchdog)
306                 del_timer_sync(&adapter->watchdog_timer);
307
308         adapter->link_speed = 0;
309         adapter->link_duplex = 0;
310         netif_carrier_off(netdev);
311         netif_stop_queue(netdev);
312
313         ixgb_reset(adapter);
314         ixgb_clean_tx_ring(adapter);
315         ixgb_clean_rx_ring(adapter);
316 }
317
318 void
319 ixgb_reset(struct ixgb_adapter *adapter)
320 {
321         struct ixgb_hw *hw = &adapter->hw;
322
323         ixgb_adapter_stop(hw);
324         if (!ixgb_init_hw(hw))
325                 DPRINTK(PROBE, ERR, "ixgb_init_hw failed.\n");
326
327         /* restore frame size information */
328         IXGB_WRITE_REG(hw, MFS, hw->max_frame_size << IXGB_MFS_SHIFT);
329         if (hw->max_frame_size >
330             IXGB_MAX_ENET_FRAME_SIZE_WITHOUT_FCS + ENET_FCS_LENGTH) {
331                 u32 ctrl0 = IXGB_READ_REG(hw, CTRL0);
332                 if (!(ctrl0 & IXGB_CTRL0_JFE)) {
333                         ctrl0 |= IXGB_CTRL0_JFE;
334                         IXGB_WRITE_REG(hw, CTRL0, ctrl0);
335                 }
336         }
337 }
338
/**
 * ixgb_probe - Device Initialization Routine
 * @pdev: PCI device information struct
 * @ent: entry in ixgb_pci_tbl
 *
 * Returns 0 on success, negative on failure
 *
 * ixgb_probe initializes an adapter identified by a pci_dev structure.
 * The OS initialization, configuring of the adapter private structure,
 * and a hardware reset occur.
 *
 * On failure the labels at the end of the function release, in reverse
 * order, whatever had been acquired up to that point (register mapping,
 * net_device, PCI regions, PCI device enable).
 **/

static int __devinit
ixgb_probe(struct pci_dev *pdev,
                const struct pci_device_id *ent)
{
        struct net_device *netdev = NULL;
        struct ixgb_adapter *adapter;
        /* number of adapters probed successfully so far */
        static int cards_found = 0;
        int pci_using_dac;
        int i;
        int err;

        if((err = pci_enable_device(pdev)))
                return err;

        /* prefer 64-bit DMA; fall back to 32-bit if that is refused */
        if(!(err = pci_set_dma_mask(pdev, DMA_64BIT_MASK)) &&
           !(err = pci_set_consistent_dma_mask(pdev, DMA_64BIT_MASK))) {
                pci_using_dac = 1;
        } else {
                if((err = pci_set_dma_mask(pdev, DMA_32BIT_MASK)) ||
                   (err = pci_set_consistent_dma_mask(pdev, DMA_32BIT_MASK))) {
                        printk(KERN_ERR
                         "ixgb: No usable DMA configuration, aborting\n");
                        goto err_dma_mask;
                }
                pci_using_dac = 0;
        }

        if((err = pci_request_regions(pdev, ixgb_driver_name)))
                goto err_request_regions;

        pci_set_master(pdev);

        /* the adapter private structure lives in the netdev private area */
        netdev = alloc_etherdev(sizeof(struct ixgb_adapter));
        if(!netdev) {
                err = -ENOMEM;
                goto err_alloc_etherdev;
        }

        SET_NETDEV_DEV(netdev, &pdev->dev);

        pci_set_drvdata(pdev, netdev);
        adapter = netdev_priv(netdev);
        adapter->netdev = netdev;
        adapter->pdev = pdev;
        adapter->hw.back = adapter;
        adapter->msg_enable = netif_msg_init(debug, DEFAULT_DEBUG_LEVEL_SHIFT);

        /* map the register space found in BAR 0 */
        adapter->hw.hw_addr = ioremap(pci_resource_start(pdev, BAR_0),
                                      pci_resource_len(pdev, BAR_0));
        if (!adapter->hw.hw_addr) {
                err = -EIO;
                goto err_ioremap;
        }

        /* remember the first non-empty I/O port BAR, if there is one */
        for(i = BAR_1; i <= BAR_5; i++) {
                if(pci_resource_len(pdev, i) == 0)
                        continue;
                if(pci_resource_flags(pdev, i) & IORESOURCE_IO) {
                        adapter->hw.io_base = pci_resource_start(pdev, i);
                        break;
                }
        }

        /* hook up the net_device entry points */
        netdev->open = &ixgb_open;
        netdev->stop = &ixgb_close;
        netdev->hard_start_xmit = &ixgb_xmit_frame;
        netdev->get_stats = &ixgb_get_stats;
        netdev->set_multicast_list = &ixgb_set_multi;
        netdev->set_mac_address = &ixgb_set_mac;
        netdev->change_mtu = &ixgb_change_mtu;
        ixgb_set_ethtool_ops(netdev);
        netdev->tx_timeout = &ixgb_tx_timeout;
        netdev->watchdog_timeo = 5 * HZ;
#ifdef CONFIG_IXGB_NAPI
        netif_napi_add(netdev, &adapter->napi, ixgb_clean, 64);
#endif
        netdev->vlan_rx_register = ixgb_vlan_rx_register;
        netdev->vlan_rx_add_vid = ixgb_vlan_rx_add_vid;
        netdev->vlan_rx_kill_vid = ixgb_vlan_rx_kill_vid;
#ifdef CONFIG_NET_POLL_CONTROLLER
        netdev->poll_controller = ixgb_netpoll;
#endif

        /* temporary name (the PCI slot name) until "eth%d" is set just
         * before register_netdev() below */
        strncpy(netdev->name, pci_name(pdev), sizeof(netdev->name) - 1);

        adapter->bd_number = cards_found;
        adapter->link_speed = 0;
        adapter->link_duplex = 0;

        /* setup the private structure */

        if((err = ixgb_sw_init(adapter)))
                goto err_sw_init;

        netdev->features = NETIF_F_SG |
                           NETIF_F_HW_CSUM |
                           NETIF_F_HW_VLAN_TX |
                           NETIF_F_HW_VLAN_RX |
                           NETIF_F_HW_VLAN_FILTER;
        netdev->features |= NETIF_F_TSO;
#ifdef NETIF_F_LLTX
        netdev->features |= NETIF_F_LLTX;
#endif

        /* advertise high-memory DMA only when the 64-bit mask was accepted */
        if(pci_using_dac)
                netdev->features |= NETIF_F_HIGHDMA;

        /* make sure the EEPROM is good */

        if(!ixgb_validate_eeprom_checksum(&adapter->hw)) {
                DPRINTK(PROBE, ERR, "The EEPROM Checksum Is Not Valid\n");
                err = -EIO;
                goto err_eeprom;
        }

        /* the MAC address comes from the EEPROM and is kept as perm_addr */
        ixgb_get_ee_mac_addr(&adapter->hw, netdev->dev_addr);
        memcpy(netdev->perm_addr, netdev->dev_addr, netdev->addr_len);

        if(!is_valid_ether_addr(netdev->perm_addr)) {
                DPRINTK(PROBE, ERR, "Invalid MAC Address\n");
                err = -EIO;
                goto err_eeprom;
        }

        adapter->part_num = ixgb_get_ee_pba_number(&adapter->hw);

        /* watchdog timer; it is armed later, in ixgb_up() */
        init_timer(&adapter->watchdog_timer);
        adapter->watchdog_timer.function = &ixgb_watchdog;
        adapter->watchdog_timer.data = (unsigned long)adapter;

        INIT_WORK(&adapter->tx_timeout_task, ixgb_tx_timeout_task);

        strcpy(netdev->name, "eth%d");
        if((err = register_netdev(netdev)))
                goto err_register;

        /* we're going to reset, so assume we have no link for now */

        netif_carrier_off(netdev);
        netif_stop_queue(netdev);

        DPRINTK(PROBE, INFO, "Intel(R) PRO/10GbE Network Connection\n");
        ixgb_check_options(adapter);
        /* reset the hardware with the new settings */

        ixgb_reset(adapter);

        cards_found++;
        return 0;

        /* error unwind: each label releases what was acquired before it */
err_register:
err_sw_init:
err_eeprom:
        iounmap(adapter->hw.hw_addr);
err_ioremap:
        free_netdev(netdev);
err_alloc_etherdev:
        pci_release_regions(pdev);
err_request_regions:
err_dma_mask:
        pci_disable_device(pdev);
        return err;
}
514
515 /**
516  * ixgb_remove - Device Removal Routine
517  * @pdev: PCI device information struct
518  *
519  * ixgb_remove is called by the PCI subsystem to alert the driver
520  * that it should release a PCI device.  The could be caused by a
521  * Hot-Plug event, or because the driver is going to be removed from
522  * memory.
523  **/
524
525 static void __devexit
526 ixgb_remove(struct pci_dev *pdev)
527 {
528         struct net_device *netdev = pci_get_drvdata(pdev);
529         struct ixgb_adapter *adapter = netdev_priv(netdev);
530
531         unregister_netdev(netdev);
532
533         iounmap(adapter->hw.hw_addr);
534         pci_release_regions(pdev);
535
536         free_netdev(netdev);
537 }
538
539 /**
540  * ixgb_sw_init - Initialize general software structures (struct ixgb_adapter)
541  * @adapter: board private structure to initialize
542  *
543  * ixgb_sw_init initializes the Adapter private data structure.
544  * Fields are initialized based on PCI device information and
545  * OS network device settings (MTU size).
546  **/
547
548 static int __devinit
549 ixgb_sw_init(struct ixgb_adapter *adapter)
550 {
551         struct ixgb_hw *hw = &adapter->hw;
552         struct net_device *netdev = adapter->netdev;
553         struct pci_dev *pdev = adapter->pdev;
554
555         /* PCI config space info */
556
557         hw->vendor_id = pdev->vendor;
558         hw->device_id = pdev->device;
559         hw->subsystem_vendor_id = pdev->subsystem_vendor;
560         hw->subsystem_id = pdev->subsystem_device;
561
562         hw->max_frame_size = netdev->mtu + ENET_HEADER_SIZE + ENET_FCS_LENGTH;
563         adapter->rx_buffer_len = hw->max_frame_size + 8; /* + 8 for errata */
564
565         if((hw->device_id == IXGB_DEVICE_ID_82597EX)
566            || (hw->device_id == IXGB_DEVICE_ID_82597EX_CX4)
567            || (hw->device_id == IXGB_DEVICE_ID_82597EX_LR)
568            || (hw->device_id == IXGB_DEVICE_ID_82597EX_SR))
569                         hw->mac_type = ixgb_82597;
570         else {
571                 /* should never have loaded on this device */
572                 DPRINTK(PROBE, ERR, "unsupported device id\n");
573         }
574
575         /* enable flow control to be programmed */
576         hw->fc.send_xon = 1;
577
578         spin_lock_init(&adapter->tx_lock);
579
580         set_bit(__IXGB_DOWN, &adapter->flags);
581         return 0;
582 }
583
/**
 * ixgb_open - Called when a network interface is made active
 * @netdev: network interface device structure
 *
 * Returns 0 on success, negative value on failure
 *
 * Allocates the transmit and receive descriptor resources and then
 * brings the adapter up through ixgb_up().  If any step fails, the
 * resources allocated so far are released and the hardware is reset
 * before the error is returned.
 **/

static int
ixgb_open(struct net_device *netdev)
{
        struct ixgb_adapter *adapter = netdev_priv(netdev);
        int err;

        /* allocate transmit descriptors */
        err = ixgb_setup_tx_resources(adapter);
        if (err)
                goto err_setup_tx;

        /* allocate receive descriptors */
        err = ixgb_setup_rx_resources(adapter);
        if (err)
                goto err_setup_rx;

        err = ixgb_up(adapter);
        if (err)
                goto err_up;

        return 0;

err_up:
        ixgb_free_rx_resources(adapter);
err_setup_rx:
        ixgb_free_tx_resources(adapter);
err_setup_tx:
        ixgb_reset(adapter);

        return err;
}
627
628 /**
629  * ixgb_close - Disables a network interface
630  * @netdev: network interface device structure
631  *
632  * Returns 0, this is not allowed to fail
633  *
634  * The close entry point is called when an interface is de-activated
635  * by the OS.  The hardware is still under the drivers control, but
636  * needs to be disabled.  A global MAC reset is issued to stop the
637  * hardware, and all transmit and receive resources are freed.
638  **/
639
640 static int
641 ixgb_close(struct net_device *netdev)
642 {
643         struct ixgb_adapter *adapter = netdev_priv(netdev);
644
645         ixgb_down(adapter, true);
646
647         ixgb_free_tx_resources(adapter);
648         ixgb_free_rx_resources(adapter);
649
650         return 0;
651 }
652
653 /**
654  * ixgb_setup_tx_resources - allocate Tx resources (Descriptors)
655  * @adapter: board private structure
656  *
657  * Return 0 on success, negative on failure
658  **/
659
660 int
661 ixgb_setup_tx_resources(struct ixgb_adapter *adapter)
662 {
663         struct ixgb_desc_ring *txdr = &adapter->tx_ring;
664         struct pci_dev *pdev = adapter->pdev;
665         int size;
666
667         size = sizeof(struct ixgb_buffer) * txdr->count;
668         txdr->buffer_info = vmalloc(size);
669         if(!txdr->buffer_info) {
670                 DPRINTK(PROBE, ERR,
671                  "Unable to allocate transmit descriptor ring memory\n");
672                 return -ENOMEM;
673         }
674         memset(txdr->buffer_info, 0, size);
675
676         /* round up to nearest 4K */
677
678         txdr->size = txdr->count * sizeof(struct ixgb_tx_desc);
679         txdr->size = ALIGN(txdr->size, 4096);
680
681         txdr->desc = pci_alloc_consistent(pdev, txdr->size, &txdr->dma);
682         if(!txdr->desc) {
683                 vfree(txdr->buffer_info);
684                 DPRINTK(PROBE, ERR,
685                  "Unable to allocate transmit descriptor memory\n");
686                 return -ENOMEM;
687         }
688         memset(txdr->desc, 0, txdr->size);
689
690         txdr->next_to_use = 0;
691         txdr->next_to_clean = 0;
692
693         return 0;
694 }
695
696 /**
697  * ixgb_configure_tx - Configure 82597 Transmit Unit after Reset.
698  * @adapter: board private structure
699  *
700  * Configure the Tx unit of the MAC after a reset.
701  **/
702
703 static void
704 ixgb_configure_tx(struct ixgb_adapter *adapter)
705 {
706         u64 tdba = adapter->tx_ring.dma;
707         u32 tdlen = adapter->tx_ring.count * sizeof(struct ixgb_tx_desc);
708         u32 tctl;
709         struct ixgb_hw *hw = &adapter->hw;
710
711         /* Setup the Base and Length of the Tx Descriptor Ring 
712          * tx_ring.dma can be either a 32 or 64 bit value 
713          */
714
715         IXGB_WRITE_REG(hw, TDBAL, (tdba & 0x00000000ffffffffULL));
716         IXGB_WRITE_REG(hw, TDBAH, (tdba >> 32));
717
718         IXGB_WRITE_REG(hw, TDLEN, tdlen);
719
720         /* Setup the HW Tx Head and Tail descriptor pointers */
721
722         IXGB_WRITE_REG(hw, TDH, 0);
723         IXGB_WRITE_REG(hw, TDT, 0);
724
725         /* don't set up txdctl, it induces performance problems if configured
726          * incorrectly */
727         /* Set the Tx Interrupt Delay register */
728
729         IXGB_WRITE_REG(hw, TIDV, adapter->tx_int_delay);
730
731         /* Program the Transmit Control Register */
732
733         tctl = IXGB_TCTL_TCE | IXGB_TCTL_TXEN | IXGB_TCTL_TPDE;
734         IXGB_WRITE_REG(hw, TCTL, tctl);
735
736         /* Setup Transmit Descriptor Settings for this adapter */
737         adapter->tx_cmd_type =
738                 IXGB_TX_DESC_TYPE 
739                 | (adapter->tx_int_delay_enable ? IXGB_TX_DESC_CMD_IDE : 0);
740 }
741
742 /**
743  * ixgb_setup_rx_resources - allocate Rx resources (Descriptors)
744  * @adapter: board private structure
745  *
746  * Returns 0 on success, negative on failure
747  **/
748
749 int
750 ixgb_setup_rx_resources(struct ixgb_adapter *adapter)
751 {
752         struct ixgb_desc_ring *rxdr = &adapter->rx_ring;
753         struct pci_dev *pdev = adapter->pdev;
754         int size;
755
756         size = sizeof(struct ixgb_buffer) * rxdr->count;
757         rxdr->buffer_info = vmalloc(size);
758         if(!rxdr->buffer_info) {
759                 DPRINTK(PROBE, ERR,
760                  "Unable to allocate receive descriptor ring\n");
761                 return -ENOMEM;
762         }
763         memset(rxdr->buffer_info, 0, size);
764
765         /* Round up to nearest 4K */
766
767         rxdr->size = rxdr->count * sizeof(struct ixgb_rx_desc);
768         rxdr->size = ALIGN(rxdr->size, 4096);
769
770         rxdr->desc = pci_alloc_consistent(pdev, rxdr->size, &rxdr->dma);
771
772         if(!rxdr->desc) {
773                 vfree(rxdr->buffer_info);
774                 DPRINTK(PROBE, ERR,
775                  "Unable to allocate receive descriptors\n");
776                 return -ENOMEM;
777         }
778         memset(rxdr->desc, 0, rxdr->size);
779
780         rxdr->next_to_clean = 0;
781         rxdr->next_to_use = 0;
782
783         return 0;
784 }
785
786 /**
787  * ixgb_setup_rctl - configure the receive control register
788  * @adapter: Board private structure
789  **/
790
791 static void
792 ixgb_setup_rctl(struct ixgb_adapter *adapter)
793 {
794         u32 rctl;
795
796         rctl = IXGB_READ_REG(&adapter->hw, RCTL);
797
798         rctl &= ~(3 << IXGB_RCTL_MO_SHIFT);
799
800         rctl |=
801                 IXGB_RCTL_BAM | IXGB_RCTL_RDMTS_1_2 | 
802                 IXGB_RCTL_RXEN | IXGB_RCTL_CFF | 
803                 (adapter->hw.mc_filter_type << IXGB_RCTL_MO_SHIFT);
804
805         rctl |= IXGB_RCTL_SECRC;
806
807         if (adapter->rx_buffer_len <= IXGB_RXBUFFER_2048)
808                 rctl |= IXGB_RCTL_BSIZE_2048;
809         else if (adapter->rx_buffer_len <= IXGB_RXBUFFER_4096)
810                 rctl |= IXGB_RCTL_BSIZE_4096;
811         else if (adapter->rx_buffer_len <= IXGB_RXBUFFER_8192)
812                 rctl |= IXGB_RCTL_BSIZE_8192;
813         else if (adapter->rx_buffer_len <= IXGB_RXBUFFER_16384)
814                 rctl |= IXGB_RCTL_BSIZE_16384;
815
816         IXGB_WRITE_REG(&adapter->hw, RCTL, rctl);
817 }
818
819 /**
820  * ixgb_configure_rx - Configure 82597 Receive Unit after Reset.
821  * @adapter: board private structure
822  *
823  * Configure the Rx unit of the MAC after a reset.
824  **/
825
826 static void
827 ixgb_configure_rx(struct ixgb_adapter *adapter)
828 {
829         u64 rdba = adapter->rx_ring.dma;
830         u32 rdlen = adapter->rx_ring.count * sizeof(struct ixgb_rx_desc);
831         struct ixgb_hw *hw = &adapter->hw;
832         u32 rctl;
833         u32 rxcsum;
834
835         /* make sure receives are disabled while setting up the descriptors */
836
837         rctl = IXGB_READ_REG(hw, RCTL);
838         IXGB_WRITE_REG(hw, RCTL, rctl & ~IXGB_RCTL_RXEN);
839
840         /* set the Receive Delay Timer Register */
841
842         IXGB_WRITE_REG(hw, RDTR, adapter->rx_int_delay);
843
844         /* Setup the Base and Length of the Rx Descriptor Ring */
845
846         IXGB_WRITE_REG(hw, RDBAL, (rdba & 0x00000000ffffffffULL));
847         IXGB_WRITE_REG(hw, RDBAH, (rdba >> 32));
848
849         IXGB_WRITE_REG(hw, RDLEN, rdlen);
850
851         /* Setup the HW Rx Head and Tail Descriptor Pointers */
852         IXGB_WRITE_REG(hw, RDH, 0);
853         IXGB_WRITE_REG(hw, RDT, 0);
854
855         /* due to the hardware errata with RXDCTL, we are unable to use any of
856          * the performance enhancing features of it without causing other
857          * subtle bugs, some of the bugs could include receive length
858          * corruption at high data rates (WTHRESH > 0) and/or receive
859          * descriptor ring irregularites (particularly in hardware cache) */
860         IXGB_WRITE_REG(hw, RXDCTL, 0);
861
862         /* Enable Receive Checksum Offload for TCP and UDP */
863         if (adapter->rx_csum) {
864                 rxcsum = IXGB_READ_REG(hw, RXCSUM);
865                 rxcsum |= IXGB_RXCSUM_TUOFL;
866                 IXGB_WRITE_REG(hw, RXCSUM, rxcsum);
867         }
868
869         /* Enable Receives */
870
871         IXGB_WRITE_REG(hw, RCTL, rctl);
872 }
873
874 /**
875  * ixgb_free_tx_resources - Free Tx Resources
876  * @adapter: board private structure
877  *
878  * Free all transmit software resources
879  **/
880
881 void
882 ixgb_free_tx_resources(struct ixgb_adapter *adapter)
883 {
884         struct pci_dev *pdev = adapter->pdev;
885
886         ixgb_clean_tx_ring(adapter);
887
888         vfree(adapter->tx_ring.buffer_info);
889         adapter->tx_ring.buffer_info = NULL;
890
891         pci_free_consistent(pdev, adapter->tx_ring.size,
892                             adapter->tx_ring.desc, adapter->tx_ring.dma);
893
894         adapter->tx_ring.desc = NULL;
895 }
896
897 static void
898 ixgb_unmap_and_free_tx_resource(struct ixgb_adapter *adapter,
899                                         struct ixgb_buffer *buffer_info)
900 {
901         struct pci_dev *pdev = adapter->pdev;
902
903         if (buffer_info->dma)
904                 pci_unmap_page(pdev, buffer_info->dma, buffer_info->length,
905                                PCI_DMA_TODEVICE);
906
907         if (buffer_info->skb)
908                 dev_kfree_skb_any(buffer_info->skb);
909
910         buffer_info->skb = NULL;
911         buffer_info->dma = 0;
912         buffer_info->time_stamp = 0;
913         /* these fields must always be initialized in tx
914          * buffer_info->length = 0;
915          * buffer_info->next_to_watch = 0; */
916 }
917
918 /**
919  * ixgb_clean_tx_ring - Free Tx Buffers
920  * @adapter: board private structure
921  **/
922
923 static void
924 ixgb_clean_tx_ring(struct ixgb_adapter *adapter)
925 {
926         struct ixgb_desc_ring *tx_ring = &adapter->tx_ring;
927         struct ixgb_buffer *buffer_info;
928         unsigned long size;
929         unsigned int i;
930
931         /* Free all the Tx ring sk_buffs */
932
933         for(i = 0; i < tx_ring->count; i++) {
934                 buffer_info = &tx_ring->buffer_info[i];
935                 ixgb_unmap_and_free_tx_resource(adapter, buffer_info);
936         }
937
938         size = sizeof(struct ixgb_buffer) * tx_ring->count;
939         memset(tx_ring->buffer_info, 0, size);
940
941         /* Zero out the descriptor ring */
942
943         memset(tx_ring->desc, 0, tx_ring->size);
944
945         tx_ring->next_to_use = 0;
946         tx_ring->next_to_clean = 0;
947
948         IXGB_WRITE_REG(&adapter->hw, TDH, 0);
949         IXGB_WRITE_REG(&adapter->hw, TDT, 0);
950 }
951
952 /**
953  * ixgb_free_rx_resources - Free Rx Resources
954  * @adapter: board private structure
955  *
956  * Free all receive software resources
957  **/
958
959 void
960 ixgb_free_rx_resources(struct ixgb_adapter *adapter)
961 {
962         struct ixgb_desc_ring *rx_ring = &adapter->rx_ring;
963         struct pci_dev *pdev = adapter->pdev;
964
965         ixgb_clean_rx_ring(adapter);
966
967         vfree(rx_ring->buffer_info);
968         rx_ring->buffer_info = NULL;
969
970         pci_free_consistent(pdev, rx_ring->size, rx_ring->desc, rx_ring->dma);
971
972         rx_ring->desc = NULL;
973 }
974
975 /**
976  * ixgb_clean_rx_ring - Free Rx Buffers
977  * @adapter: board private structure
978  **/
979
980 static void
981 ixgb_clean_rx_ring(struct ixgb_adapter *adapter)
982 {
983         struct ixgb_desc_ring *rx_ring = &adapter->rx_ring;
984         struct ixgb_buffer *buffer_info;
985         struct pci_dev *pdev = adapter->pdev;
986         unsigned long size;
987         unsigned int i;
988
989         /* Free all the Rx ring sk_buffs */
990
991         for(i = 0; i < rx_ring->count; i++) {
992                 buffer_info = &rx_ring->buffer_info[i];
993                 if(buffer_info->skb) {
994
995                         pci_unmap_single(pdev,
996                                          buffer_info->dma,
997                                          buffer_info->length,
998                                          PCI_DMA_FROMDEVICE);
999
1000                         dev_kfree_skb(buffer_info->skb);
1001
1002                         buffer_info->skb = NULL;
1003                 }
1004         }
1005
1006         size = sizeof(struct ixgb_buffer) * rx_ring->count;
1007         memset(rx_ring->buffer_info, 0, size);
1008
1009         /* Zero out the descriptor ring */
1010
1011         memset(rx_ring->desc, 0, rx_ring->size);
1012
1013         rx_ring->next_to_clean = 0;
1014         rx_ring->next_to_use = 0;
1015
1016         IXGB_WRITE_REG(&adapter->hw, RDH, 0);
1017         IXGB_WRITE_REG(&adapter->hw, RDT, 0);
1018 }
1019
1020 /**
1021  * ixgb_set_mac - Change the Ethernet Address of the NIC
1022  * @netdev: network interface device structure
1023  * @p: pointer to an address structure
1024  *
1025  * Returns 0 on success, negative on failure
1026  **/
1027
1028 static int
1029 ixgb_set_mac(struct net_device *netdev, void *p)
1030 {
1031         struct ixgb_adapter *adapter = netdev_priv(netdev);
1032         struct sockaddr *addr = p;
1033
1034         if(!is_valid_ether_addr(addr->sa_data))
1035                 return -EADDRNOTAVAIL;
1036
1037         memcpy(netdev->dev_addr, addr->sa_data, netdev->addr_len);
1038
1039         ixgb_rar_set(&adapter->hw, addr->sa_data, 0);
1040
1041         return 0;
1042 }
1043
1044 /**
1045  * ixgb_set_multi - Multicast and Promiscuous mode set
1046  * @netdev: network interface device structure
1047  *
1048  * The set_multi entry point is called whenever the multicast address
1049  * list or the network interface flags are updated.  This routine is
1050  * responsible for configuring the hardware for proper multicast,
1051  * promiscuous mode, and all-multi behavior.
1052  **/
1053
1054 static void
1055 ixgb_set_multi(struct net_device *netdev)
1056 {
1057         struct ixgb_adapter *adapter = netdev_priv(netdev);
1058         struct ixgb_hw *hw = &adapter->hw;
1059         struct dev_mc_list *mc_ptr;
1060         u32 rctl;
1061         int i;
1062
1063         /* Check for Promiscuous and All Multicast modes */
1064
1065         rctl = IXGB_READ_REG(hw, RCTL);
1066
1067         if(netdev->flags & IFF_PROMISC) {
1068                 rctl |= (IXGB_RCTL_UPE | IXGB_RCTL_MPE);
1069         } else if(netdev->flags & IFF_ALLMULTI) {
1070                 rctl |= IXGB_RCTL_MPE;
1071                 rctl &= ~IXGB_RCTL_UPE;
1072         } else {
1073                 rctl &= ~(IXGB_RCTL_UPE | IXGB_RCTL_MPE);
1074         }
1075
1076         if(netdev->mc_count > IXGB_MAX_NUM_MULTICAST_ADDRESSES) {
1077                 rctl |= IXGB_RCTL_MPE;
1078                 IXGB_WRITE_REG(hw, RCTL, rctl);
1079         } else {
1080                 u8 mta[IXGB_MAX_NUM_MULTICAST_ADDRESSES *
1081                             IXGB_ETH_LENGTH_OF_ADDRESS];
1082
1083                 IXGB_WRITE_REG(hw, RCTL, rctl);
1084
1085                 for(i = 0, mc_ptr = netdev->mc_list; mc_ptr;
1086                         i++, mc_ptr = mc_ptr->next)
1087                         memcpy(&mta[i * IXGB_ETH_LENGTH_OF_ADDRESS],
1088                                    mc_ptr->dmi_addr, IXGB_ETH_LENGTH_OF_ADDRESS);
1089
1090                 ixgb_mc_addr_list_update(hw, mta, netdev->mc_count, 0);
1091         }
1092 }
1093
1094 /**
1095  * ixgb_watchdog - Timer Call-back
1096  * @data: pointer to netdev cast into an unsigned long
1097  **/
1098
1099 static void
1100 ixgb_watchdog(unsigned long data)
1101 {
1102         struct ixgb_adapter *adapter = (struct ixgb_adapter *)data;
1103         struct net_device *netdev = adapter->netdev;
1104         struct ixgb_desc_ring *txdr = &adapter->tx_ring;
1105
1106         ixgb_check_for_link(&adapter->hw);
1107
1108         if (ixgb_check_for_bad_link(&adapter->hw)) {
1109                 /* force the reset path */
1110                 netif_stop_queue(netdev);
1111         }
1112
1113         if(adapter->hw.link_up) {
1114                 if(!netif_carrier_ok(netdev)) {
1115                         DPRINTK(LINK, INFO,
1116                                 "NIC Link is Up 10000 Mbps Full Duplex\n");
1117                         adapter->link_speed = 10000;
1118                         adapter->link_duplex = FULL_DUPLEX;
1119                         netif_carrier_on(netdev);
1120                         netif_wake_queue(netdev);
1121                 }
1122         } else {
1123                 if(netif_carrier_ok(netdev)) {
1124                         adapter->link_speed = 0;
1125                         adapter->link_duplex = 0;
1126                         DPRINTK(LINK, INFO, "NIC Link is Down\n");
1127                         netif_carrier_off(netdev);
1128                         netif_stop_queue(netdev);
1129
1130                 }
1131         }
1132
1133         ixgb_update_stats(adapter);
1134
1135         if(!netif_carrier_ok(netdev)) {
1136                 if(IXGB_DESC_UNUSED(txdr) + 1 < txdr->count) {
1137                         /* We've lost link, so the controller stops DMA,
1138                          * but we've got queued Tx work that's never going
1139                          * to get done, so reset controller to flush Tx.
1140                          * (Do the reset outside of interrupt context). */
1141                         schedule_work(&adapter->tx_timeout_task);
1142                 }
1143         }
1144
1145         /* Force detection of hung controller every watchdog period */
1146         adapter->detect_tx_hung = true;
1147
1148         /* generate an interrupt to force clean up of any stragglers */
1149         IXGB_WRITE_REG(&adapter->hw, ICS, IXGB_INT_TXDW);
1150
1151         /* Reset the timer */
1152         mod_timer(&adapter->watchdog_timer, jiffies + 2 * HZ);
1153 }
1154
1155 #define IXGB_TX_FLAGS_CSUM              0x00000001
1156 #define IXGB_TX_FLAGS_VLAN              0x00000002
1157 #define IXGB_TX_FLAGS_TSO               0x00000004
1158
1159 static int
1160 ixgb_tso(struct ixgb_adapter *adapter, struct sk_buff *skb)
1161 {
1162         struct ixgb_context_desc *context_desc;
1163         unsigned int i;
1164         u8 ipcss, ipcso, tucss, tucso, hdr_len;
1165         u16 ipcse, tucse, mss;
1166         int err;
1167
1168         if (likely(skb_is_gso(skb))) {
1169                 struct ixgb_buffer *buffer_info;
1170                 struct iphdr *iph;
1171
1172                 if (skb_header_cloned(skb)) {
1173                         err = pskb_expand_head(skb, 0, 0, GFP_ATOMIC);
1174                         if (err)
1175                                 return err;
1176                 }
1177
1178                 hdr_len = skb_transport_offset(skb) + tcp_hdrlen(skb);
1179                 mss = skb_shinfo(skb)->gso_size;
1180                 iph = ip_hdr(skb);
1181                 iph->tot_len = 0;
1182                 iph->check = 0;
1183                 tcp_hdr(skb)->check = ~csum_tcpudp_magic(iph->saddr,
1184                                                          iph->daddr, 0,
1185                                                          IPPROTO_TCP, 0);
1186                 ipcss = skb_network_offset(skb);
1187                 ipcso = (void *)&(iph->check) - (void *)skb->data;
1188                 ipcse = skb_transport_offset(skb) - 1;
1189                 tucss = skb_transport_offset(skb);
1190                 tucso = (void *)&(tcp_hdr(skb)->check) - (void *)skb->data;
1191                 tucse = 0;
1192
1193                 i = adapter->tx_ring.next_to_use;
1194                 context_desc = IXGB_CONTEXT_DESC(adapter->tx_ring, i);
1195                 buffer_info = &adapter->tx_ring.buffer_info[i];
1196                 WARN_ON(buffer_info->dma != 0);
1197
1198                 context_desc->ipcss = ipcss;
1199                 context_desc->ipcso = ipcso;
1200                 context_desc->ipcse = cpu_to_le16(ipcse);
1201                 context_desc->tucss = tucss;
1202                 context_desc->tucso = tucso;
1203                 context_desc->tucse = cpu_to_le16(tucse);
1204                 context_desc->mss = cpu_to_le16(mss);
1205                 context_desc->hdr_len = hdr_len;
1206                 context_desc->status = 0;
1207                 context_desc->cmd_type_len = cpu_to_le32(
1208                                                   IXGB_CONTEXT_DESC_TYPE 
1209                                                 | IXGB_CONTEXT_DESC_CMD_TSE
1210                                                 | IXGB_CONTEXT_DESC_CMD_IP
1211                                                 | IXGB_CONTEXT_DESC_CMD_TCP
1212                                                 | IXGB_CONTEXT_DESC_CMD_IDE
1213                                                 | (skb->len - (hdr_len)));
1214
1215
1216                 if(++i == adapter->tx_ring.count) i = 0;
1217                 adapter->tx_ring.next_to_use = i;
1218
1219                 return 1;
1220         }
1221
1222         return 0;
1223 }
1224
1225 static bool
1226 ixgb_tx_csum(struct ixgb_adapter *adapter, struct sk_buff *skb)
1227 {
1228         struct ixgb_context_desc *context_desc;
1229         unsigned int i;
1230         u8 css, cso;
1231
1232         if(likely(skb->ip_summed == CHECKSUM_PARTIAL)) {
1233                 struct ixgb_buffer *buffer_info;
1234                 css = skb_transport_offset(skb);
1235                 cso = css + skb->csum_offset;
1236
1237                 i = adapter->tx_ring.next_to_use;
1238                 context_desc = IXGB_CONTEXT_DESC(adapter->tx_ring, i);
1239                 buffer_info = &adapter->tx_ring.buffer_info[i];
1240                 WARN_ON(buffer_info->dma != 0);
1241
1242                 context_desc->tucss = css;
1243                 context_desc->tucso = cso;
1244                 context_desc->tucse = 0;
1245                 /* zero out any previously existing data in one instruction */
1246                 *(u32 *)&(context_desc->ipcss) = 0;
1247                 context_desc->status = 0;
1248                 context_desc->hdr_len = 0;
1249                 context_desc->mss = 0;
1250                 context_desc->cmd_type_len =
1251                         cpu_to_le32(IXGB_CONTEXT_DESC_TYPE
1252                                     | IXGB_TX_DESC_CMD_IDE);
1253
1254                 if(++i == adapter->tx_ring.count) i = 0;
1255                 adapter->tx_ring.next_to_use = i;
1256
1257                 return true;
1258         }
1259
1260         return false;
1261 }
1262
1263 #define IXGB_MAX_TXD_PWR        14
1264 #define IXGB_MAX_DATA_PER_TXD   (1<<IXGB_MAX_TXD_PWR)
1265
1266 static int
1267 ixgb_tx_map(struct ixgb_adapter *adapter, struct sk_buff *skb,
1268             unsigned int first)
1269 {
1270         struct ixgb_desc_ring *tx_ring = &adapter->tx_ring;
1271         struct ixgb_buffer *buffer_info;
1272         int len = skb->len;
1273         unsigned int offset = 0, size, count = 0, i;
1274         unsigned int mss = skb_shinfo(skb)->gso_size;
1275
1276         unsigned int nr_frags = skb_shinfo(skb)->nr_frags;
1277         unsigned int f;
1278
1279         len -= skb->data_len;
1280
1281         i = tx_ring->next_to_use;
1282
1283         while(len) {
1284                 buffer_info = &tx_ring->buffer_info[i];
1285                 size = min(len, IXGB_MAX_DATA_PER_TXD);
1286                 /* Workaround for premature desc write-backs
1287                  * in TSO mode.  Append 4-byte sentinel desc */
1288                 if (unlikely(mss && !nr_frags && size == len && size > 8))
1289                         size -= 4;
1290
1291                 buffer_info->length = size;
1292                 WARN_ON(buffer_info->dma != 0);
1293                 buffer_info->time_stamp = jiffies;
1294                 buffer_info->dma =
1295                         pci_map_single(adapter->pdev,
1296                                 skb->data + offset,
1297                                 size,
1298                                 PCI_DMA_TODEVICE);
1299                 buffer_info->next_to_watch = 0;
1300
1301                 len -= size;
1302                 offset += size;
1303                 count++;
1304                 if(++i == tx_ring->count) i = 0;
1305         }
1306
1307         for(f = 0; f < nr_frags; f++) {
1308                 struct skb_frag_struct *frag;
1309
1310                 frag = &skb_shinfo(skb)->frags[f];
1311                 len = frag->size;
1312                 offset = 0;
1313
1314                 while(len) {
1315                         buffer_info = &tx_ring->buffer_info[i];
1316                         size = min(len, IXGB_MAX_DATA_PER_TXD);
1317
1318                         /* Workaround for premature desc write-backs
1319                          * in TSO mode.  Append 4-byte sentinel desc */
1320                         if (unlikely(mss && (f == (nr_frags - 1))
1321                                      && size == len && size > 8))
1322                                 size -= 4;
1323
1324                         buffer_info->length = size;
1325                         buffer_info->time_stamp = jiffies;
1326                         buffer_info->dma =
1327                                 pci_map_page(adapter->pdev,
1328                                         frag->page,
1329                                         frag->page_offset + offset,
1330                                         size,
1331                                         PCI_DMA_TODEVICE);
1332                         buffer_info->next_to_watch = 0;
1333
1334                         len -= size;
1335                         offset += size;
1336                         count++;
1337                         if(++i == tx_ring->count) i = 0;
1338                 }
1339         }
1340         i = (i == 0) ? tx_ring->count - 1 : i - 1;
1341         tx_ring->buffer_info[i].skb = skb;
1342         tx_ring->buffer_info[first].next_to_watch = i;
1343
1344         return count;
1345 }
1346
1347 static void
1348 ixgb_tx_queue(struct ixgb_adapter *adapter, int count, int vlan_id,int tx_flags)
1349 {
1350         struct ixgb_desc_ring *tx_ring = &adapter->tx_ring;
1351         struct ixgb_tx_desc *tx_desc = NULL;
1352         struct ixgb_buffer *buffer_info;
1353         u32 cmd_type_len = adapter->tx_cmd_type;
1354         u8 status = 0;
1355         u8 popts = 0;
1356         unsigned int i;
1357
1358         if(tx_flags & IXGB_TX_FLAGS_TSO) {
1359                 cmd_type_len |= IXGB_TX_DESC_CMD_TSE;
1360                 popts |= (IXGB_TX_DESC_POPTS_IXSM | IXGB_TX_DESC_POPTS_TXSM);
1361         }
1362
1363         if(tx_flags & IXGB_TX_FLAGS_CSUM)
1364                 popts |= IXGB_TX_DESC_POPTS_TXSM;
1365
1366         if(tx_flags & IXGB_TX_FLAGS_VLAN) {
1367                 cmd_type_len |= IXGB_TX_DESC_CMD_VLE;
1368         }
1369
1370         i = tx_ring->next_to_use;
1371
1372         while(count--) {
1373                 buffer_info = &tx_ring->buffer_info[i];
1374                 tx_desc = IXGB_TX_DESC(*tx_ring, i);
1375                 tx_desc->buff_addr = cpu_to_le64(buffer_info->dma);
1376                 tx_desc->cmd_type_len =
1377                         cpu_to_le32(cmd_type_len | buffer_info->length);
1378                 tx_desc->status = status;
1379                 tx_desc->popts = popts;
1380                 tx_desc->vlan = cpu_to_le16(vlan_id);
1381
1382                 if(++i == tx_ring->count) i = 0;
1383         }
1384
1385         tx_desc->cmd_type_len |= cpu_to_le32(IXGB_TX_DESC_CMD_EOP 
1386                                 | IXGB_TX_DESC_CMD_RS );
1387
1388         /* Force memory writes to complete before letting h/w
1389          * know there are new descriptors to fetch.  (Only
1390          * applicable for weak-ordered memory model archs,
1391          * such as IA-64). */
1392         wmb();
1393
1394         tx_ring->next_to_use = i;
1395         IXGB_WRITE_REG(&adapter->hw, TDT, i);
1396 }
1397
1398 static int __ixgb_maybe_stop_tx(struct net_device *netdev, int size)
1399 {
1400         struct ixgb_adapter *adapter = netdev_priv(netdev);
1401         struct ixgb_desc_ring *tx_ring = &adapter->tx_ring;
1402
1403         netif_stop_queue(netdev);
1404         /* Herbert's original patch had:
1405          *  smp_mb__after_netif_stop_queue();
1406          * but since that doesn't exist yet, just open code it. */
1407         smp_mb();
1408
1409         /* We need to check again in a case another CPU has just
1410          * made room available. */
1411         if (likely(IXGB_DESC_UNUSED(tx_ring) < size))
1412                 return -EBUSY;
1413
1414         /* A reprieve! */
1415         netif_start_queue(netdev);
1416         ++adapter->restart_queue;
1417         return 0;
1418 }
1419
/*
 * ixgb_maybe_stop_tx - stop the Tx queue if the ring is nearly full
 * @netdev: network interface device structure
 * @tx_ring: transmit descriptor ring to check
 * @size: number of free descriptors required
 *
 * Returns 0 when at least @size descriptors are unused; otherwise
 * returns whatever __ixgb_maybe_stop_tx() decides.
 */
static int ixgb_maybe_stop_tx(struct net_device *netdev,
			      struct ixgb_desc_ring *tx_ring, int size)
{
	if (unlikely(IXGB_DESC_UNUSED(tx_ring) < size))
		return __ixgb_maybe_stop_tx(netdev, size);

	return 0;
}
1427
1428
/* Tx Descriptors needed, worst case */
#define TXD_USE_COUNT(S) (((S) >> IXGB_MAX_TXD_PWR) + \
			 (((S) & (IXGB_MAX_DATA_PER_TXD - 1)) ? 1 : 0))
/* The whole expansion is parenthesized so that DESC_NEEDED acts as a
 * single value when it appears inside a larger expression. */
#define DESC_NEEDED (TXD_USE_COUNT(IXGB_MAX_DATA_PER_TXD) /* skb->data */ + \
	MAX_SKB_FRAGS * TXD_USE_COUNT(PAGE_SIZE) + 1 /* for context */ \
	+ 1 /* one more needed for sentinel TSO workaround */)
1435
1436 static int
1437 ixgb_xmit_frame(struct sk_buff *skb, struct net_device *netdev)
1438 {
1439         struct ixgb_adapter *adapter = netdev_priv(netdev);
1440         unsigned int first;
1441         unsigned int tx_flags = 0;
1442         unsigned long flags;
1443         int vlan_id = 0;
1444         int tso;
1445
1446         if (test_bit(__IXGB_DOWN, &adapter->flags)) {
1447                 dev_kfree_skb(skb);
1448                 return NETDEV_TX_OK;
1449         }
1450
1451         if(skb->len <= 0) {
1452                 dev_kfree_skb_any(skb);
1453                 return 0;
1454         }
1455
1456 #ifdef NETIF_F_LLTX
1457         if (!spin_trylock_irqsave(&adapter->tx_lock, flags)) {
1458                 /* Collision - tell upper layer to requeue */
1459                 local_irq_restore(flags);
1460                 return NETDEV_TX_LOCKED;
1461         }
1462 #else
1463         spin_lock_irqsave(&adapter->tx_lock, flags);
1464 #endif
1465
1466         if (unlikely(ixgb_maybe_stop_tx(netdev, &adapter->tx_ring,
1467                      DESC_NEEDED))) {
1468                 netif_stop_queue(netdev);
1469                 spin_unlock_irqrestore(&adapter->tx_lock, flags);
1470                 return NETDEV_TX_BUSY;
1471         }
1472
1473 #ifndef NETIF_F_LLTX
1474         spin_unlock_irqrestore(&adapter->tx_lock, flags);
1475 #endif
1476
1477         if(adapter->vlgrp && vlan_tx_tag_present(skb)) {
1478                 tx_flags |= IXGB_TX_FLAGS_VLAN;
1479                 vlan_id = vlan_tx_tag_get(skb);
1480         }
1481
1482         first = adapter->tx_ring.next_to_use;
1483         
1484         tso = ixgb_tso(adapter, skb);
1485         if (tso < 0) {
1486                 dev_kfree_skb_any(skb);
1487 #ifdef NETIF_F_LLTX
1488                 spin_unlock_irqrestore(&adapter->tx_lock, flags);
1489 #endif
1490                 return NETDEV_TX_OK;
1491         }
1492
1493         if (likely(tso))
1494                 tx_flags |= IXGB_TX_FLAGS_TSO;
1495         else if(ixgb_tx_csum(adapter, skb))
1496                 tx_flags |= IXGB_TX_FLAGS_CSUM;
1497
1498         ixgb_tx_queue(adapter, ixgb_tx_map(adapter, skb, first), vlan_id,
1499                         tx_flags);
1500
1501         netdev->trans_start = jiffies;
1502
1503 #ifdef NETIF_F_LLTX
1504         /* Make sure there is space in the ring for the next send. */
1505         ixgb_maybe_stop_tx(netdev, &adapter->tx_ring, DESC_NEEDED);
1506
1507         spin_unlock_irqrestore(&adapter->tx_lock, flags);
1508
1509 #endif
1510         return NETDEV_TX_OK;
1511 }
1512
1513 /**
1514  * ixgb_tx_timeout - Respond to a Tx Hang
1515  * @netdev: network interface device structure
1516  **/
1517
1518 static void
1519 ixgb_tx_timeout(struct net_device *netdev)
1520 {
1521         struct ixgb_adapter *adapter = netdev_priv(netdev);
1522
1523         /* Do the reset outside of interrupt context */
1524         schedule_work(&adapter->tx_timeout_task);
1525 }
1526
1527 static void
1528 ixgb_tx_timeout_task(struct work_struct *work)
1529 {
1530         struct ixgb_adapter *adapter =
1531                 container_of(work, struct ixgb_adapter, tx_timeout_task);
1532
1533         adapter->tx_timeout_count++;
1534         ixgb_down(adapter, true);
1535         ixgb_up(adapter);
1536 }
1537
1538 /**
1539  * ixgb_get_stats - Get System Network Statistics
1540  * @netdev: network interface device structure
1541  *
1542  * Returns the address of the device statistics structure.
1543  * The statistics are actually updated from the timer callback.
1544  **/
1545
1546 static struct net_device_stats *
1547 ixgb_get_stats(struct net_device *netdev)
1548 {
1549         struct ixgb_adapter *adapter = netdev_priv(netdev);
1550
1551         return &adapter->net_stats;
1552 }
1553
1554 /**
1555  * ixgb_change_mtu - Change the Maximum Transfer Unit
1556  * @netdev: network interface device structure
1557  * @new_mtu: new value for maximum frame size
1558  *
1559  * Returns 0 on success, negative on failure
1560  **/
1561
1562 static int
1563 ixgb_change_mtu(struct net_device *netdev, int new_mtu)
1564 {
1565         struct ixgb_adapter *adapter = netdev_priv(netdev);
1566         int max_frame = new_mtu + ENET_HEADER_SIZE + ENET_FCS_LENGTH;
1567         int old_max_frame = netdev->mtu + ENET_HEADER_SIZE + ENET_FCS_LENGTH;
1568
1569         /* MTU < 68 is an error for IPv4 traffic, just don't allow it */
1570         if ((new_mtu < 68) ||
1571             (max_frame > IXGB_MAX_JUMBO_FRAME_SIZE + ENET_FCS_LENGTH)) {
1572                 DPRINTK(PROBE, ERR, "Invalid MTU setting %d\n", new_mtu);
1573                 return -EINVAL;
1574         }
1575
1576         if (old_max_frame == max_frame)
1577                 return 0;
1578
1579         if (netif_running(netdev))
1580                 ixgb_down(adapter, true);
1581
1582         adapter->rx_buffer_len = max_frame + 8; /* + 8 for errata */
1583
1584         netdev->mtu = new_mtu;
1585
1586         if (netif_running(netdev))
1587                 ixgb_up(adapter);
1588
1589         return 0;
1590 }
1591
1592 /**
1593  * ixgb_update_stats - Update the board statistics counters.
1594  * @adapter: board private structure
1595  **/
1596
1597 void
1598 ixgb_update_stats(struct ixgb_adapter *adapter)
1599 {
1600         struct net_device *netdev = adapter->netdev;
1601         struct pci_dev *pdev = adapter->pdev;
1602
1603         /* Prevent stats update while adapter is being reset */
1604         if (pci_channel_offline(pdev))
1605                 return;
1606
1607         if((netdev->flags & IFF_PROMISC) || (netdev->flags & IFF_ALLMULTI) ||
1608            (netdev->mc_count > IXGB_MAX_NUM_MULTICAST_ADDRESSES)) {
1609                 u64 multi = IXGB_READ_REG(&adapter->hw, MPRCL);
1610                 u32 bcast_l = IXGB_READ_REG(&adapter->hw, BPRCL);
1611                 u32 bcast_h = IXGB_READ_REG(&adapter->hw, BPRCH);
1612                 u64 bcast = ((u64)bcast_h << 32) | bcast_l; 
1613
1614                 multi |= ((u64)IXGB_READ_REG(&adapter->hw, MPRCH) << 32);
1615                 /* fix up multicast stats by removing broadcasts */
1616                 if(multi >= bcast)
1617                         multi -= bcast;
1618                 
1619                 adapter->stats.mprcl += (multi & 0xFFFFFFFF);
1620                 adapter->stats.mprch += (multi >> 32);
1621                 adapter->stats.bprcl += bcast_l; 
1622                 adapter->stats.bprch += bcast_h;
1623         } else {
1624                 adapter->stats.mprcl += IXGB_READ_REG(&adapter->hw, MPRCL);
1625                 adapter->stats.mprch += IXGB_READ_REG(&adapter->hw, MPRCH);
1626                 adapter->stats.bprcl += IXGB_READ_REG(&adapter->hw, BPRCL);
1627                 adapter->stats.bprch += IXGB_READ_REG(&adapter->hw, BPRCH);
1628         }
1629         adapter->stats.tprl += IXGB_READ_REG(&adapter->hw, TPRL);
1630         adapter->stats.tprh += IXGB_READ_REG(&adapter->hw, TPRH);
1631         adapter->stats.gprcl += IXGB_READ_REG(&adapter->hw, GPRCL);
1632         adapter->stats.gprch += IXGB_READ_REG(&adapter->hw, GPRCH);
1633         adapter->stats.uprcl += IXGB_READ_REG(&adapter->hw, UPRCL);
1634         adapter->stats.uprch += IXGB_READ_REG(&adapter->hw, UPRCH);
1635         adapter->stats.vprcl += IXGB_READ_REG(&adapter->hw, VPRCL);
1636         adapter->stats.vprch += IXGB_READ_REG(&adapter->hw, VPRCH);
1637         adapter->stats.jprcl += IXGB_READ_REG(&adapter->hw, JPRCL);
1638         adapter->stats.jprch += IXGB_READ_REG(&adapter->hw, JPRCH);
1639         adapter->stats.gorcl += IXGB_READ_REG(&adapter->hw, GORCL);
1640         adapter->stats.gorch += IXGB_READ_REG(&adapter->hw, GORCH);
1641         adapter->stats.torl += IXGB_READ_REG(&adapter->hw, TORL);
1642         adapter->stats.torh += IXGB_READ_REG(&adapter->hw, TORH);
1643         adapter->stats.rnbc += IXGB_READ_REG(&adapter->hw, RNBC);
1644         adapter->stats.ruc += IXGB_READ_REG(&adapter->hw, RUC);
1645         adapter->stats.roc += IXGB_READ_REG(&adapter->hw, ROC);
1646         adapter->stats.rlec += IXGB_READ_REG(&adapter->hw, RLEC);
1647         adapter->stats.crcerrs += IXGB_READ_REG(&adapter->hw, CRCERRS);
1648         adapter->stats.icbc += IXGB_READ_REG(&adapter->hw, ICBC);
1649         adapter->stats.ecbc += IXGB_READ_REG(&adapter->hw, ECBC);
1650         adapter->stats.mpc += IXGB_READ_REG(&adapter->hw, MPC);
1651         adapter->stats.tptl += IXGB_READ_REG(&adapter->hw, TPTL);
1652         adapter->stats.tpth += IXGB_READ_REG(&adapter->hw, TPTH);
1653         adapter->stats.gptcl += IXGB_READ_REG(&adapter->hw, GPTCL);
1654         adapter->stats.gptch += IXGB_READ_REG(&adapter->hw, GPTCH);
1655         adapter->stats.bptcl += IXGB_READ_REG(&adapter->hw, BPTCL);
1656         adapter->stats.bptch += IXGB_READ_REG(&adapter->hw, BPTCH);
1657         adapter->stats.mptcl += IXGB_READ_REG(&adapter->hw, MPTCL);
1658         adapter->stats.mptch += IXGB_READ_REG(&adapter->hw, MPTCH);
1659         adapter->stats.uptcl += IXGB_READ_REG(&adapter->hw, UPTCL);
1660         adapter->stats.uptch += IXGB_READ_REG(&adapter->hw, UPTCH);
1661         adapter->stats.vptcl += IXGB_READ_REG(&adapter->hw, VPTCL);
1662         adapter->stats.vptch += IXGB_READ_REG(&adapter->hw, VPTCH);
1663         adapter->stats.jptcl += IXGB_READ_REG(&adapter->hw, JPTCL);
1664         adapter->stats.jptch += IXGB_READ_REG(&adapter->hw, JPTCH);
1665         adapter->stats.gotcl += IXGB_READ_REG(&adapter->hw, GOTCL);
1666         adapter->stats.gotch += IXGB_READ_REG(&adapter->hw, GOTCH);
1667         adapter->stats.totl += IXGB_READ_REG(&adapter->hw, TOTL);
1668         adapter->stats.toth += IXGB_READ_REG(&adapter->hw, TOTH);
1669         adapter->stats.dc += IXGB_READ_REG(&adapter->hw, DC);
1670         adapter->stats.plt64c += IXGB_READ_REG(&adapter->hw, PLT64C);
1671         adapter->stats.tsctc += IXGB_READ_REG(&adapter->hw, TSCTC);
1672         adapter->stats.tsctfc += IXGB_READ_REG(&adapter->hw, TSCTFC);
1673         adapter->stats.ibic += IXGB_READ_REG(&adapter->hw, IBIC);
1674         adapter->stats.rfc += IXGB_READ_REG(&adapter->hw, RFC);
1675         adapter->stats.lfc += IXGB_READ_REG(&adapter->hw, LFC);
1676         adapter->stats.pfrc += IXGB_READ_REG(&adapter->hw, PFRC);
1677         adapter->stats.pftc += IXGB_READ_REG(&adapter->hw, PFTC);
1678         adapter->stats.mcfrc += IXGB_READ_REG(&adapter->hw, MCFRC);
1679         adapter->stats.mcftc += IXGB_READ_REG(&adapter->hw, MCFTC);
1680         adapter->stats.xonrxc += IXGB_READ_REG(&adapter->hw, XONRXC);
1681         adapter->stats.xontxc += IXGB_READ_REG(&adapter->hw, XONTXC);
1682         adapter->stats.xoffrxc += IXGB_READ_REG(&adapter->hw, XOFFRXC);
1683         adapter->stats.xofftxc += IXGB_READ_REG(&adapter->hw, XOFFTXC);
1684         adapter->stats.rjc += IXGB_READ_REG(&adapter->hw, RJC);
1685
1686         /* Fill out the OS statistics structure */
1687
1688         adapter->net_stats.rx_packets = adapter->stats.gprcl;
1689         adapter->net_stats.tx_packets = adapter->stats.gptcl;
1690         adapter->net_stats.rx_bytes = adapter->stats.gorcl;
1691         adapter->net_stats.tx_bytes = adapter->stats.gotcl;
1692         adapter->net_stats.multicast = adapter->stats.mprcl;
1693         adapter->net_stats.collisions = 0;
1694
1695         /* ignore RLEC as it reports errors for padded (<64bytes) frames
1696          * with a length in the type/len field */
1697         adapter->net_stats.rx_errors =
1698             /* adapter->stats.rnbc + */ adapter->stats.crcerrs +
1699             adapter->stats.ruc +
1700             adapter->stats.roc /*+ adapter->stats.rlec */  +
1701             adapter->stats.icbc +
1702             adapter->stats.ecbc + adapter->stats.mpc;
1703
1704         /* see above
1705          * adapter->net_stats.rx_length_errors = adapter->stats.rlec;
1706          */
1707
1708         adapter->net_stats.rx_crc_errors = adapter->stats.crcerrs;
1709         adapter->net_stats.rx_fifo_errors = adapter->stats.mpc;
1710         adapter->net_stats.rx_missed_errors = adapter->stats.mpc;
1711         adapter->net_stats.rx_over_errors = adapter->stats.mpc;
1712
1713         adapter->net_stats.tx_errors = 0;
1714         adapter->net_stats.rx_frame_errors = 0;
1715         adapter->net_stats.tx_aborted_errors = 0;
1716         adapter->net_stats.tx_carrier_errors = 0;
1717         adapter->net_stats.tx_fifo_errors = 0;
1718         adapter->net_stats.tx_heartbeat_errors = 0;
1719         adapter->net_stats.tx_window_errors = 0;
1720 }
1721
1722 #define IXGB_MAX_INTR 10
1723 /**
1724  * ixgb_intr - Interrupt Handler
1725  * @irq: interrupt number
1726  * @data: pointer to a network interface device structure
1727  **/
1728
1729 static irqreturn_t
1730 ixgb_intr(int irq, void *data)
1731 {
1732         struct net_device *netdev = data;
1733         struct ixgb_adapter *adapter = netdev_priv(netdev);
1734         struct ixgb_hw *hw = &adapter->hw;
1735         u32 icr = IXGB_READ_REG(hw, ICR);
1736 #ifndef CONFIG_IXGB_NAPI
1737         unsigned int i;
1738 #endif
1739
1740         if(unlikely(!icr))
1741                 return IRQ_NONE;  /* Not our interrupt */
1742
1743         if (unlikely(icr & (IXGB_INT_RXSEQ | IXGB_INT_LSC)))
1744                 if (!test_bit(__IXGB_DOWN, &adapter->flags))
1745                         mod_timer(&adapter->watchdog_timer, jiffies);
1746
1747 #ifdef CONFIG_IXGB_NAPI
1748         if (netif_rx_schedule_prep(netdev, &adapter->napi)) {
1749
1750                 /* Disable interrupts and register for poll. The flush 
1751                   of the posted write is intentionally left out.
1752                 */
1753
1754                 IXGB_WRITE_REG(&adapter->hw, IMC, ~0);
1755                 __netif_rx_schedule(netdev, &adapter->napi);
1756         }
1757 #else
1758         /* yes, that is actually a & and it is meant to make sure that
1759          * every pass through this for loop checks both receive and
1760          * transmit queues for completed descriptors, intended to
1761          * avoid starvation issues and assist tx/rx fairness. */
1762         for(i = 0; i < IXGB_MAX_INTR; i++)
1763                 if(!ixgb_clean_rx_irq(adapter) &
1764                    !ixgb_clean_tx_irq(adapter))
1765                         break;
1766 #endif 
1767         return IRQ_HANDLED;
1768 }
1769
#ifdef CONFIG_IXGB_NAPI
/**
 * ixgb_clean - NAPI Rx polling callback
 * @napi: NAPI context embedded in the board private structure
 * @budget: upper bound on the receive work to do in this poll
 *
 * Cleans the transmit ring, then the receive ring (bounded by @budget).
 * Returns the amount of receive work done.
 **/

static int
ixgb_clean(struct napi_struct *napi, int budget)
{
	struct ixgb_adapter *adapter =
		container_of(napi, struct ixgb_adapter, napi);
	int work_done = 0;

	ixgb_clean_tx_irq(adapter);
	ixgb_clean_rx_irq(adapter, &work_done, budget);

	/* Budget fully consumed: stay in polling mode */
	if (work_done >= budget)
		return work_done;

	/* Otherwise leave polling mode and, unless the adapter is going
	 * down, turn interrupts back on. */
	netif_rx_complete(adapter->netdev, napi);
	if (!test_bit(__IXGB_DOWN, &adapter->flags))
		ixgb_irq_enable(adapter);

	return work_done;
}
#endif
1796
1797 /**
1798  * ixgb_clean_tx_irq - Reclaim resources after transmit completes
1799  * @adapter: board private structure
1800  **/
1801
1802 static bool
1803 ixgb_clean_tx_irq(struct ixgb_adapter *adapter)
1804 {
1805         struct ixgb_desc_ring *tx_ring = &adapter->tx_ring;
1806         struct net_device *netdev = adapter->netdev;
1807         struct ixgb_tx_desc *tx_desc, *eop_desc;
1808         struct ixgb_buffer *buffer_info;
1809         unsigned int i, eop;
1810         bool cleaned = false;
1811
1812         i = tx_ring->next_to_clean;
1813         eop = tx_ring->buffer_info[i].next_to_watch;
1814         eop_desc = IXGB_TX_DESC(*tx_ring, eop);
1815
1816         while(eop_desc->status & IXGB_TX_DESC_STATUS_DD) {
1817
1818                 for (cleaned = false; !cleaned; ) {
1819                         tx_desc = IXGB_TX_DESC(*tx_ring, i);
1820                         buffer_info = &tx_ring->buffer_info[i];
1821
1822                         if (tx_desc->popts
1823                             & (IXGB_TX_DESC_POPTS_TXSM |
1824                                IXGB_TX_DESC_POPTS_IXSM))
1825                                 adapter->hw_csum_tx_good++;
1826
1827                         ixgb_unmap_and_free_tx_resource(adapter, buffer_info);
1828
1829                         *(u32 *)&(tx_desc->status) = 0;
1830
1831                         cleaned = (i == eop);
1832                         if(++i == tx_ring->count) i = 0;
1833                 }
1834
1835                 eop = tx_ring->buffer_info[i].next_to_watch;
1836                 eop_desc = IXGB_TX_DESC(*tx_ring, eop);
1837         }
1838
1839         tx_ring->next_to_clean = i;
1840
1841         if (unlikely(cleaned && netif_carrier_ok(netdev) &&
1842                      IXGB_DESC_UNUSED(tx_ring) >= DESC_NEEDED)) {
1843                 /* Make sure that anybody stopping the queue after this
1844                  * sees the new next_to_clean. */
1845                 smp_mb();
1846
1847                 if (netif_queue_stopped(netdev) &&
1848                     !(test_bit(__IXGB_DOWN, &adapter->flags))) {
1849                         netif_wake_queue(netdev);
1850                         ++adapter->restart_queue;
1851                 }
1852         }
1853
1854         if(adapter->detect_tx_hung) {
1855                 /* detect a transmit hang in hardware, this serializes the
1856                  * check with the clearing of time_stamp and movement of i */
1857                 adapter->detect_tx_hung = false;
1858                 if (tx_ring->buffer_info[eop].dma &&
1859                    time_after(jiffies, tx_ring->buffer_info[eop].time_stamp + HZ)
1860                    && !(IXGB_READ_REG(&adapter->hw, STATUS) &
1861                         IXGB_STATUS_TXOFF)) {
1862                         /* detected Tx unit hang */
1863                         DPRINTK(DRV, ERR, "Detected Tx Unit Hang\n"
1864                                         "  TDH                  <%x>\n"
1865                                         "  TDT                  <%x>\n"
1866                                         "  next_to_use          <%x>\n"
1867                                         "  next_to_clean        <%x>\n"
1868                                         "buffer_info[next_to_clean]\n"
1869                                         "  time_stamp           <%lx>\n"
1870                                         "  next_to_watch        <%x>\n"
1871                                         "  jiffies              <%lx>\n"
1872                                         "  next_to_watch.status <%x>\n",
1873                                 IXGB_READ_REG(&adapter->hw, TDH),
1874                                 IXGB_READ_REG(&adapter->hw, TDT),
1875                                 tx_ring->next_to_use,
1876                                 tx_ring->next_to_clean,
1877                                 tx_ring->buffer_info[eop].time_stamp,
1878                                 eop,
1879                                 jiffies,
1880                                 eop_desc->status);
1881                         netif_stop_queue(netdev);
1882                 }
1883         }
1884
1885         return cleaned;
1886 }
1887
1888 /**
1889  * ixgb_rx_checksum - Receive Checksum Offload for 82597.
1890  * @adapter: board private structure
1891  * @rx_desc: receive descriptor
1892  * @sk_buff: socket buffer with received data
1893  **/
1894
1895 static void
1896 ixgb_rx_checksum(struct ixgb_adapter *adapter,
1897                  struct ixgb_rx_desc *rx_desc,
1898                  struct sk_buff *skb)
1899 {
1900         /* Ignore Checksum bit is set OR
1901          * TCP Checksum has not been calculated
1902          */
1903         if((rx_desc->status & IXGB_RX_DESC_STATUS_IXSM) ||
1904            (!(rx_desc->status & IXGB_RX_DESC_STATUS_TCPCS))) {
1905                 skb->ip_summed = CHECKSUM_NONE;
1906                 return;
1907         }
1908
1909         /* At this point we know the hardware did the TCP checksum */
1910         /* now look at the TCP checksum error bit */
1911         if(rx_desc->errors & IXGB_RX_DESC_ERRORS_TCPE) {
1912                 /* let the stack verify checksum errors */
1913                 skb->ip_summed = CHECKSUM_NONE;
1914                 adapter->hw_csum_rx_error++;
1915         } else {
1916                 /* TCP checksum is good */
1917                 skb->ip_summed = CHECKSUM_UNNECESSARY;
1918                 adapter->hw_csum_rx_good++;
1919         }
1920 }
1921
1922 /**
1923  * ixgb_clean_rx_irq - Send received data up the network stack,
1924  * @adapter: board private structure
1925  **/
1926
1927 static bool
1928 #ifdef CONFIG_IXGB_NAPI
1929 ixgb_clean_rx_irq(struct ixgb_adapter *adapter, int *work_done, int work_to_do)
1930 #else
1931 ixgb_clean_rx_irq(struct ixgb_adapter *adapter)
1932 #endif
1933 {
1934         struct ixgb_desc_ring *rx_ring = &adapter->rx_ring;
1935         struct net_device *netdev = adapter->netdev;
1936         struct pci_dev *pdev = adapter->pdev;
1937         struct ixgb_rx_desc *rx_desc, *next_rxd;
1938         struct ixgb_buffer *buffer_info, *next_buffer, *next2_buffer;
1939         u32 length;
1940         unsigned int i, j;
1941         bool cleaned = false;
1942
1943         i = rx_ring->next_to_clean;
1944         rx_desc = IXGB_RX_DESC(*rx_ring, i);
1945         buffer_info = &rx_ring->buffer_info[i];
1946
1947         while(rx_desc->status & IXGB_RX_DESC_STATUS_DD) {
1948                 struct sk_buff *skb, *next_skb;
1949                 u8 status;
1950
1951 #ifdef CONFIG_IXGB_NAPI
1952                 if(*work_done >= work_to_do)
1953                         break;
1954
1955                 (*work_done)++;
1956 #endif
1957                 status = rx_desc->status;
1958                 skb = buffer_info->skb;
1959                 buffer_info->skb = NULL;
1960
1961                 prefetch(skb->data);
1962
1963                 if(++i == rx_ring->count) i = 0;
1964                 next_rxd = IXGB_RX_DESC(*rx_ring, i);
1965                 prefetch(next_rxd);
1966
1967                 if((j = i + 1) == rx_ring->count) j = 0;
1968                 next2_buffer = &rx_ring->buffer_info[j];
1969                 prefetch(next2_buffer);
1970
1971                 next_buffer = &rx_ring->buffer_info[i];
1972                 next_skb = next_buffer->skb;
1973                 prefetch(next_skb);
1974
1975                 cleaned = true;
1976
1977                 pci_unmap_single(pdev,
1978                                  buffer_info->dma,
1979                                  buffer_info->length,
1980                                  PCI_DMA_FROMDEVICE);
1981
1982                 length = le16_to_cpu(rx_desc->length);
1983
1984                 if(unlikely(!(status & IXGB_RX_DESC_STATUS_EOP))) {
1985
1986                         /* All receives must fit into a single buffer */
1987
1988                         IXGB_DBG("Receive packet consumed multiple buffers "
1989                                          "length<%x>\n", length);
1990
1991                         dev_kfree_skb_irq(skb);
1992                         goto rxdesc_done;
1993                 }
1994
1995                 if (unlikely(rx_desc->errors
1996                              & (IXGB_RX_DESC_ERRORS_CE | IXGB_RX_DESC_ERRORS_SE
1997                                 | IXGB_RX_DESC_ERRORS_P |
1998                                 IXGB_RX_DESC_ERRORS_RXE))) {
1999
2000                         dev_kfree_skb_irq(skb);
2001                         goto rxdesc_done;
2002                 }
2003
2004                 /* code added for copybreak, this should improve
2005                  * performance for small packets with large amounts
2006                  * of reassembly being done in the stack */
2007 #define IXGB_CB_LENGTH 256
2008                 if (length < IXGB_CB_LENGTH) {
2009                         struct sk_buff *new_skb =
2010                             netdev_alloc_skb(netdev, length + NET_IP_ALIGN);
2011                         if (new_skb) {
2012                                 skb_reserve(new_skb, NET_IP_ALIGN);
2013                                 skb_copy_to_linear_data_offset(new_skb,
2014                                                                -NET_IP_ALIGN,
2015                                                                (skb->data -
2016                                                                 NET_IP_ALIGN),
2017                                                                (length +
2018                                                                 NET_IP_ALIGN));
2019                                 /* save the skb in buffer_info as good */
2020                                 buffer_info->skb = skb;
2021                                 skb = new_skb;
2022                         }
2023                 }
2024                 /* end copybreak code */
2025
2026                 /* Good Receive */
2027                 skb_put(skb, length);
2028
2029                 /* Receive Checksum Offload */
2030                 ixgb_rx_checksum(adapter, rx_desc, skb);
2031
2032                 skb->protocol = eth_type_trans(skb, netdev);
2033 #ifdef CONFIG_IXGB_NAPI
2034                 if(adapter->vlgrp && (status & IXGB_RX_DESC_STATUS_VP)) {
2035                         vlan_hwaccel_receive_skb(skb, adapter->vlgrp,
2036                                 le16_to_cpu(rx_desc->special));
2037                 } else {
2038                         netif_receive_skb(skb);
2039                 }
2040 #else /* CONFIG_IXGB_NAPI */
2041                 if(adapter->vlgrp && (status & IXGB_RX_DESC_STATUS_VP)) {
2042                         vlan_hwaccel_rx(skb, adapter->vlgrp,
2043                                 le16_to_cpu(rx_desc->special));
2044                 } else {
2045                         netif_rx(skb);
2046                 }
2047 #endif /* CONFIG_IXGB_NAPI */
2048                 netdev->last_rx = jiffies;
2049
2050 rxdesc_done:
2051                 /* clean up descriptor, might be written over by hw */
2052                 rx_desc->status = 0;
2053
2054                 /* use prefetched values */
2055                 rx_desc = next_rxd;
2056                 buffer_info = next_buffer;
2057         }
2058
2059         rx_ring->next_to_clean = i;
2060
2061         ixgb_alloc_rx_buffers(adapter);
2062
2063         return cleaned;
2064 }
2065
2066 /**
2067  * ixgb_alloc_rx_buffers - Replace used receive buffers
2068  * @adapter: address of board private structure
2069  **/
2070
2071 static void
2072 ixgb_alloc_rx_buffers(struct ixgb_adapter *adapter)
2073 {
2074         struct ixgb_desc_ring *rx_ring = &adapter->rx_ring;
2075         struct net_device *netdev = adapter->netdev;
2076         struct pci_dev *pdev = adapter->pdev;
2077         struct ixgb_rx_desc *rx_desc;
2078         struct ixgb_buffer *buffer_info;
2079         struct sk_buff *skb;
2080         unsigned int i;
2081         long cleancount;
2082
2083         i = rx_ring->next_to_use;
2084         buffer_info = &rx_ring->buffer_info[i];
2085         cleancount = IXGB_DESC_UNUSED(rx_ring);
2086
2087
2088         /* leave three descriptors unused */
2089         while(--cleancount > 2) {
2090                 /* recycle! its good for you */
2091                 skb = buffer_info->skb;
2092                 if (skb) {
2093                         skb_trim(skb, 0);
2094                         goto map_skb;
2095                 }
2096
2097                 skb = netdev_alloc_skb(netdev, adapter->rx_buffer_len
2098                                        + NET_IP_ALIGN);
2099                 if (unlikely(!skb)) {
2100                         /* Better luck next round */
2101                         adapter->alloc_rx_buff_failed++;
2102                         break;
2103                 }
2104
2105                 /* Make buffer alignment 2 beyond a 16 byte boundary
2106                  * this will result in a 16 byte aligned IP header after
2107                  * the 14 byte MAC header is removed
2108                  */
2109                 skb_reserve(skb, NET_IP_ALIGN);
2110
2111                 buffer_info->skb = skb;
2112                 buffer_info->length = adapter->rx_buffer_len;
2113 map_skb:
2114                 buffer_info->dma = pci_map_single(pdev,
2115                                                   skb->data,
2116                                                   adapter->rx_buffer_len,
2117                                                   PCI_DMA_FROMDEVICE);
2118
2119                 rx_desc = IXGB_RX_DESC(*rx_ring, i);
2120                 rx_desc->buff_addr = cpu_to_le64(buffer_info->dma);
2121                 /* guarantee DD bit not set now before h/w gets descriptor
2122                  * this is the rest of the workaround for h/w double 
2123                  * writeback. */
2124                 rx_desc->status = 0;
2125
2126
2127                 if(++i == rx_ring->count) i = 0;
2128                 buffer_info = &rx_ring->buffer_info[i];
2129         }
2130
2131         if (likely(rx_ring->next_to_use != i)) {
2132                 rx_ring->next_to_use = i;
2133                 if (unlikely(i-- == 0))
2134                         i = (rx_ring->count - 1);
2135
2136                 /* Force memory writes to complete before letting h/w
2137                  * know there are new descriptors to fetch.  (Only
2138                  * applicable for weak-ordered memory model archs, such
2139                  * as IA-64). */
2140                 wmb();
2141                 IXGB_WRITE_REG(&adapter->hw, RDT, i);
2142         }
2143 }
2144
2145 /**
2146  * ixgb_vlan_rx_register - enables or disables vlan tagging/stripping.
2147  * 
2148  * @param netdev network interface device structure
2149  * @param grp indicates to enable or disable tagging/stripping
2150  **/
2151 static void
2152 ixgb_vlan_rx_register(struct net_device *netdev, struct vlan_group *grp)
2153 {
2154         struct ixgb_adapter *adapter = netdev_priv(netdev);
2155         u32 ctrl, rctl;
2156
2157         ixgb_irq_disable(adapter);
2158         adapter->vlgrp = grp;
2159
2160         if(grp) {
2161                 /* enable VLAN tag insert/strip */
2162                 ctrl = IXGB_READ_REG(&adapter->hw, CTRL0);
2163                 ctrl |= IXGB_CTRL0_VME;
2164                 IXGB_WRITE_REG(&adapter->hw, CTRL0, ctrl);
2165
2166                 /* enable VLAN receive filtering */
2167
2168                 rctl = IXGB_READ_REG(&adapter->hw, RCTL);
2169                 rctl |= IXGB_RCTL_VFE;
2170                 rctl &= ~IXGB_RCTL_CFIEN;
2171                 IXGB_WRITE_REG(&adapter->hw, RCTL, rctl);
2172         } else {
2173                 /* disable VLAN tag insert/strip */
2174
2175                 ctrl = IXGB_READ_REG(&adapter->hw, CTRL0);
2176                 ctrl &= ~IXGB_CTRL0_VME;
2177                 IXGB_WRITE_REG(&adapter->hw, CTRL0, ctrl);
2178
2179                 /* disable VLAN filtering */
2180
2181                 rctl = IXGB_READ_REG(&adapter->hw, RCTL);
2182                 rctl &= ~IXGB_RCTL_VFE;
2183                 IXGB_WRITE_REG(&adapter->hw, RCTL, rctl);
2184         }
2185
2186         /* don't enable interrupts unless we are UP */
2187         if (adapter->netdev->flags & IFF_UP)
2188                 ixgb_irq_enable(adapter);
2189 }
2190
2191 static void
2192 ixgb_vlan_rx_add_vid(struct net_device *netdev, u16 vid)
2193 {
2194         struct ixgb_adapter *adapter = netdev_priv(netdev);
2195         u32 vfta, index;
2196
2197         /* add VID to filter table */
2198
2199         index = (vid >> 5) & 0x7F;
2200         vfta = IXGB_READ_REG_ARRAY(&adapter->hw, VFTA, index);
2201         vfta |= (1 << (vid & 0x1F));
2202         ixgb_write_vfta(&adapter->hw, index, vfta);
2203 }
2204
2205 static void
2206 ixgb_vlan_rx_kill_vid(struct net_device *netdev, u16 vid)
2207 {
2208         struct ixgb_adapter *adapter = netdev_priv(netdev);
2209         u32 vfta, index;
2210
2211         ixgb_irq_disable(adapter);
2212
2213         vlan_group_set_device(adapter->vlgrp, vid, NULL);
2214
2215         /* don't enable interrupts unless we are UP */
2216         if (adapter->netdev->flags & IFF_UP)
2217                 ixgb_irq_enable(adapter);
2218
2219         /* remove VID from filter table */
2220
2221         index = (vid >> 5) & 0x7F;
2222         vfta = IXGB_READ_REG_ARRAY(&adapter->hw, VFTA, index);
2223         vfta &= ~(1 << (vid & 0x1F));
2224         ixgb_write_vfta(&adapter->hw, index, vfta);
2225 }
2226
2227 static void
2228 ixgb_restore_vlan(struct ixgb_adapter *adapter)
2229 {
2230         ixgb_vlan_rx_register(adapter->netdev, adapter->vlgrp);
2231
2232         if(adapter->vlgrp) {
2233                 u16 vid;
2234                 for(vid = 0; vid < VLAN_GROUP_ARRAY_LEN; vid++) {
2235                         if(!vlan_group_get_device(adapter->vlgrp, vid))
2236                                 continue;
2237                         ixgb_vlan_rx_add_vid(adapter->netdev, vid);
2238                 }
2239         }
2240 }
2241
#ifdef CONFIG_NET_POLL_CONTROLLER
/*
 * Polling 'interrupt' - used by things like netconsole to send skbs
 * without having to re-enable interrupts. It's not called while
 * the interrupt routine is executing.
 *
 * The device's IRQ line is disabled around a direct call to the
 * interrupt handler.
 */

static void ixgb_netpoll(struct net_device *dev)
{
	struct ixgb_adapter *adapter = netdev_priv(dev);
	struct pci_dev *pdev = adapter->pdev;

	disable_irq(pdev->irq);
	ixgb_intr(pdev->irq, dev);
	enable_irq(pdev->irq);
}
#endif
2258
2259 /**
2260  * ixgb_io_error_detected() - called when PCI error is detected
2261  * @pdev    pointer to pci device with error
2262  * @state   pci channel state after error
2263  *
2264  * This callback is called by the PCI subsystem whenever
2265  * a PCI bus error is detected.
2266  */
2267 static pci_ers_result_t ixgb_io_error_detected (struct pci_dev *pdev,
2268                                      enum pci_channel_state state)
2269 {
2270         struct net_device *netdev = pci_get_drvdata(pdev);
2271         struct ixgb_adapter *adapter = netdev_priv(netdev);
2272
2273         if(netif_running(netdev))
2274                 ixgb_down(adapter, true);
2275
2276         pci_disable_device(pdev);
2277
2278         /* Request a slot reset. */
2279         return PCI_ERS_RESULT_NEED_RESET;
2280 }
2281
2282 /**
2283  * ixgb_io_slot_reset - called after the pci bus has been reset.
2284  * @pdev    pointer to pci device with error
2285  *
2286  * This callback is called after the PCI buss has been reset.
2287  * Basically, this tries to restart the card from scratch.
2288  * This is a shortened version of the device probe/discovery code,
2289  * it resembles the first-half of the ixgb_probe() routine.
2290  */
2291 static pci_ers_result_t ixgb_io_slot_reset (struct pci_dev *pdev)
2292 {
2293         struct net_device *netdev = pci_get_drvdata(pdev);
2294         struct ixgb_adapter *adapter = netdev_priv(netdev);
2295
2296         if(pci_enable_device(pdev)) {
2297                 DPRINTK(PROBE, ERR, "Cannot re-enable PCI device after reset.\n");
2298                 return PCI_ERS_RESULT_DISCONNECT;
2299         }
2300
2301         /* Perform card reset only on one instance of the card */
2302         if (0 != PCI_FUNC (pdev->devfn))
2303                 return PCI_ERS_RESULT_RECOVERED;
2304
2305         pci_set_master(pdev);
2306
2307         netif_carrier_off(netdev);
2308         netif_stop_queue(netdev);
2309         ixgb_reset(adapter);
2310
2311         /* Make sure the EEPROM is good */
2312         if(!ixgb_validate_eeprom_checksum(&adapter->hw)) {
2313                 DPRINTK(PROBE, ERR, "After reset, the EEPROM checksum is not valid.\n");
2314                 return PCI_ERS_RESULT_DISCONNECT;
2315         }
2316         ixgb_get_ee_mac_addr(&adapter->hw, netdev->dev_addr);
2317         memcpy(netdev->perm_addr, netdev->dev_addr, netdev->addr_len);
2318
2319         if(!is_valid_ether_addr(netdev->perm_addr)) {
2320                 DPRINTK(PROBE, ERR, "After reset, invalid MAC address.\n");
2321                 return PCI_ERS_RESULT_DISCONNECT;
2322         }
2323
2324         return PCI_ERS_RESULT_RECOVERED;
2325 }
2326
2327 /**
2328  * ixgb_io_resume - called when its OK to resume normal operations
2329  * @pdev    pointer to pci device with error
2330  *
2331  * The error recovery driver tells us that its OK to resume
2332  * normal operation. Implementation resembles the second-half
2333  * of the ixgb_probe() routine.
2334  */
2335 static void ixgb_io_resume (struct pci_dev *pdev)
2336 {
2337         struct net_device *netdev = pci_get_drvdata(pdev);
2338         struct ixgb_adapter *adapter = netdev_priv(netdev);
2339
2340         pci_set_master(pdev);
2341
2342         if(netif_running(netdev)) {
2343                 if(ixgb_up(adapter)) {
2344                         printk ("ixgb: can't bring device back up after reset\n");
2345                         return;
2346                 }
2347         }
2348
2349         netif_device_attach(netdev);
2350         mod_timer(&adapter->watchdog_timer, jiffies);
2351 }
2352
2353 /* ixgb_main.c */