Linux kernel mirror (for testing) git.kernel.org/pub/scm/linux/kernel/git/torvalds/linux.git
kernel os linux
1
fork

Configure Feed

Select the types of activity you want to include in your feed.

at v2.6.36-rc1 6522 lines 184 kB view raw
1/******************************************************************************* 2 3 Intel(R) Gigabit Ethernet Linux driver 4 Copyright(c) 2007-2009 Intel Corporation. 5 6 This program is free software; you can redistribute it and/or modify it 7 under the terms and conditions of the GNU General Public License, 8 version 2, as published by the Free Software Foundation. 9 10 This program is distributed in the hope it will be useful, but WITHOUT 11 ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or 12 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for 13 more details. 14 15 You should have received a copy of the GNU General Public License along with 16 this program; if not, write to the Free Software Foundation, Inc., 17 51 Franklin St - Fifth Floor, Boston, MA 02110-1301 USA. 18 19 The full GNU General Public License is included in this distribution in 20 the file called "COPYING". 21 22 Contact Information: 23 e1000-devel Mailing List <e1000-devel@lists.sourceforge.net> 24 Intel Corporation, 5200 N.E. Elam Young Parkway, Hillsboro, OR 97124-6497 25 26*******************************************************************************/ 27 28#include <linux/module.h> 29#include <linux/types.h> 30#include <linux/init.h> 31#include <linux/vmalloc.h> 32#include <linux/pagemap.h> 33#include <linux/netdevice.h> 34#include <linux/ipv6.h> 35#include <linux/slab.h> 36#include <net/checksum.h> 37#include <net/ip6_checksum.h> 38#include <linux/net_tstamp.h> 39#include <linux/mii.h> 40#include <linux/ethtool.h> 41#include <linux/if_vlan.h> 42#include <linux/pci.h> 43#include <linux/pci-aspm.h> 44#include <linux/delay.h> 45#include <linux/interrupt.h> 46#include <linux/if_ether.h> 47#include <linux/aer.h> 48#ifdef CONFIG_IGB_DCA 49#include <linux/dca.h> 50#endif 51#include "igb.h" 52 53#define DRV_VERSION "2.1.0-k2" 54char igb_driver_name[] = "igb"; 55char igb_driver_version[] = DRV_VERSION; 56static const char igb_driver_string[] = 57 "Intel(R) Gigabit Ethernet Network Driver"; 58static const char igb_copyright[] = "Copyright (c) 2007-2009 Intel Corporation."; 59 60static const struct e1000_info *igb_info_tbl[] = { 61 [board_82575] = &e1000_82575_info, 62}; 63 64static DEFINE_PCI_DEVICE_TABLE(igb_pci_tbl) = { 65 { PCI_VDEVICE(INTEL, E1000_DEV_ID_I350_COPPER), board_82575 }, 66 { PCI_VDEVICE(INTEL, E1000_DEV_ID_I350_FIBER), board_82575 }, 67 { PCI_VDEVICE(INTEL, E1000_DEV_ID_I350_SERDES), board_82575 }, 68 { PCI_VDEVICE(INTEL, E1000_DEV_ID_I350_SGMII), board_82575 }, 69 { PCI_VDEVICE(INTEL, E1000_DEV_ID_82580_COPPER), board_82575 }, 70 { PCI_VDEVICE(INTEL, E1000_DEV_ID_82580_FIBER), board_82575 }, 71 { PCI_VDEVICE(INTEL, E1000_DEV_ID_82580_SERDES), board_82575 }, 72 { PCI_VDEVICE(INTEL, E1000_DEV_ID_82580_SGMII), board_82575 }, 73 { PCI_VDEVICE(INTEL, E1000_DEV_ID_82580_COPPER_DUAL), board_82575 }, 74 { PCI_VDEVICE(INTEL, E1000_DEV_ID_82576), board_82575 }, 75 { PCI_VDEVICE(INTEL, E1000_DEV_ID_82576_NS), board_82575 }, 76 { PCI_VDEVICE(INTEL, E1000_DEV_ID_82576_NS_SERDES), board_82575 }, 77 { PCI_VDEVICE(INTEL, E1000_DEV_ID_82576_FIBER), board_82575 }, 78 { PCI_VDEVICE(INTEL, E1000_DEV_ID_82576_SERDES), board_82575 }, 79 { PCI_VDEVICE(INTEL, E1000_DEV_ID_82576_SERDES_QUAD), board_82575 }, 80 { PCI_VDEVICE(INTEL, E1000_DEV_ID_82576_QUAD_COPPER_ET2), board_82575 }, 81 { PCI_VDEVICE(INTEL, E1000_DEV_ID_82576_QUAD_COPPER), board_82575 }, 82 { PCI_VDEVICE(INTEL, E1000_DEV_ID_82575EB_COPPER), board_82575 }, 83 { PCI_VDEVICE(INTEL, E1000_DEV_ID_82575EB_FIBER_SERDES), board_82575 }, 84 { PCI_VDEVICE(INTEL, E1000_DEV_ID_82575GB_QUAD_COPPER), board_82575 }, 85 /* required last entry */ 86 {0, } 87}; 88 89MODULE_DEVICE_TABLE(pci, igb_pci_tbl); 90 91void igb_reset(struct igb_adapter *); 92static int igb_setup_all_tx_resources(struct igb_adapter *); 93static int igb_setup_all_rx_resources(struct igb_adapter *); 94static void igb_free_all_tx_resources(struct igb_adapter *); 95static void igb_free_all_rx_resources(struct igb_adapter *); 96static void igb_setup_mrqc(struct igb_adapter *); 97void igb_update_stats(struct igb_adapter *); 98static int igb_probe(struct pci_dev *, const struct pci_device_id *); 99static void __devexit igb_remove(struct pci_dev *pdev); 100static int igb_sw_init(struct igb_adapter *); 101static int igb_open(struct net_device *); 102static int igb_close(struct net_device *); 103static void igb_configure_tx(struct igb_adapter *); 104static void igb_configure_rx(struct igb_adapter *); 105static void igb_clean_all_tx_rings(struct igb_adapter *); 106static void igb_clean_all_rx_rings(struct igb_adapter *); 107static void igb_clean_tx_ring(struct igb_ring *); 108static void igb_clean_rx_ring(struct igb_ring *); 109static void igb_set_rx_mode(struct net_device *); 110static void igb_update_phy_info(unsigned long); 111static void igb_watchdog(unsigned long); 112static void igb_watchdog_task(struct work_struct *); 113static netdev_tx_t igb_xmit_frame_adv(struct sk_buff *skb, struct net_device *); 114static struct net_device_stats *igb_get_stats(struct net_device *); 115static int igb_change_mtu(struct net_device *, int); 116static int igb_set_mac(struct net_device *, void *); 117static void igb_set_uta(struct igb_adapter *adapter); 118static irqreturn_t igb_intr(int irq, void *); 119static irqreturn_t igb_intr_msi(int irq, void *); 120static irqreturn_t igb_msix_other(int irq, void *); 121static irqreturn_t igb_msix_ring(int irq, void *); 122#ifdef CONFIG_IGB_DCA 123static void igb_update_dca(struct igb_q_vector *); 124static void igb_setup_dca(struct igb_adapter *); 125#endif /* CONFIG_IGB_DCA */ 126static bool igb_clean_tx_irq(struct igb_q_vector *); 127static int igb_poll(struct napi_struct *, int); 128static bool igb_clean_rx_irq_adv(struct igb_q_vector *, int *, int); 129static int igb_ioctl(struct net_device *, struct ifreq *, int cmd); 130static void igb_tx_timeout(struct net_device *); 131static void igb_reset_task(struct work_struct *); 132static void igb_vlan_rx_register(struct net_device *, struct vlan_group *); 133static void igb_vlan_rx_add_vid(struct net_device *, u16); 134static void igb_vlan_rx_kill_vid(struct net_device *, u16); 135static void igb_restore_vlan(struct igb_adapter *); 136static void igb_rar_set_qsel(struct igb_adapter *, u8 *, u32 , u8); 137static void igb_ping_all_vfs(struct igb_adapter *); 138static void igb_msg_task(struct igb_adapter *); 139static void igb_vmm_control(struct igb_adapter *); 140static int igb_set_vf_mac(struct igb_adapter *, int, unsigned char *); 141static void igb_restore_vf_multicasts(struct igb_adapter *adapter); 142static int igb_ndo_set_vf_mac(struct net_device *netdev, int vf, u8 *mac); 143static int igb_ndo_set_vf_vlan(struct net_device *netdev, 144 int vf, u16 vlan, u8 qos); 145static int igb_ndo_set_vf_bw(struct net_device *netdev, int vf, int tx_rate); 146static int igb_ndo_get_vf_config(struct net_device *netdev, int vf, 147 struct ifla_vf_info *ivi); 148 149#ifdef CONFIG_PM 150static int igb_suspend(struct pci_dev *, pm_message_t); 151static int igb_resume(struct pci_dev *); 152#endif 153static void igb_shutdown(struct pci_dev *); 154#ifdef CONFIG_IGB_DCA 155static int igb_notify_dca(struct notifier_block *, unsigned long, void *); 156static struct notifier_block dca_notifier = { 157 .notifier_call = igb_notify_dca, 158 .next = NULL, 159 .priority = 0 160}; 161#endif 162#ifdef CONFIG_NET_POLL_CONTROLLER 163/* for netdump / net console */ 164static void igb_netpoll(struct net_device *); 165#endif 166#ifdef CONFIG_PCI_IOV 167static unsigned int max_vfs = 0; 168module_param(max_vfs, uint, 0); 169MODULE_PARM_DESC(max_vfs, "Maximum number of virtual functions to allocate " 170 "per physical function"); 171#endif /* CONFIG_PCI_IOV */ 172 173static pci_ers_result_t igb_io_error_detected(struct pci_dev *, 174 pci_channel_state_t); 175static pci_ers_result_t igb_io_slot_reset(struct pci_dev *); 176static void igb_io_resume(struct pci_dev *); 177 178static struct pci_error_handlers igb_err_handler = { 179 .error_detected = igb_io_error_detected, 180 .slot_reset = igb_io_slot_reset, 181 .resume = igb_io_resume, 182}; 183 184 185static struct pci_driver igb_driver = { 186 .name = igb_driver_name, 187 .id_table = igb_pci_tbl, 188 .probe = igb_probe, 189 .remove = __devexit_p(igb_remove), 190#ifdef CONFIG_PM 191 /* Power Managment Hooks */ 192 .suspend = igb_suspend, 193 .resume = igb_resume, 194#endif 195 .shutdown = igb_shutdown, 196 .err_handler = &igb_err_handler 197}; 198 199MODULE_AUTHOR("Intel Corporation, <e1000-devel@lists.sourceforge.net>"); 200MODULE_DESCRIPTION("Intel(R) Gigabit Ethernet Network Driver"); 201MODULE_LICENSE("GPL"); 202MODULE_VERSION(DRV_VERSION); 203 204struct igb_reg_info { 205 u32 ofs; 206 char *name; 207}; 208 209static const struct igb_reg_info igb_reg_info_tbl[] = { 210 211 /* General Registers */ 212 {E1000_CTRL, "CTRL"}, 213 {E1000_STATUS, "STATUS"}, 214 {E1000_CTRL_EXT, "CTRL_EXT"}, 215 216 /* Interrupt Registers */ 217 {E1000_ICR, "ICR"}, 218 219 /* RX Registers */ 220 {E1000_RCTL, "RCTL"}, 221 {E1000_RDLEN(0), "RDLEN"}, 222 {E1000_RDH(0), "RDH"}, 223 {E1000_RDT(0), "RDT"}, 224 {E1000_RXDCTL(0), "RXDCTL"}, 225 {E1000_RDBAL(0), "RDBAL"}, 226 {E1000_RDBAH(0), "RDBAH"}, 227 228 /* TX Registers */ 229 {E1000_TCTL, "TCTL"}, 230 {E1000_TDBAL(0), "TDBAL"}, 231 {E1000_TDBAH(0), "TDBAH"}, 232 {E1000_TDLEN(0), "TDLEN"}, 233 {E1000_TDH(0), "TDH"}, 234 {E1000_TDT(0), "TDT"}, 235 {E1000_TXDCTL(0), "TXDCTL"}, 236 {E1000_TDFH, "TDFH"}, 237 {E1000_TDFT, "TDFT"}, 238 {E1000_TDFHS, "TDFHS"}, 239 {E1000_TDFPC, "TDFPC"}, 240 241 /* List Terminator */ 242 {} 243}; 244 245/* 246 * igb_regdump - register printout routine 247 */ 248static void igb_regdump(struct e1000_hw *hw, struct igb_reg_info *reginfo) 249{ 250 int n = 0; 251 char rname[16]; 252 u32 regs[8]; 253 254 switch (reginfo->ofs) { 255 case E1000_RDLEN(0): 256 for (n = 0; n < 4; n++) 257 regs[n] = rd32(E1000_RDLEN(n)); 258 break; 259 case E1000_RDH(0): 260 for (n = 0; n < 4; n++) 261 regs[n] = rd32(E1000_RDH(n)); 262 break; 263 case E1000_RDT(0): 264 for (n = 0; n < 4; n++) 265 regs[n] = rd32(E1000_RDT(n)); 266 break; 267 case E1000_RXDCTL(0): 268 for (n = 0; n < 4; n++) 269 regs[n] = rd32(E1000_RXDCTL(n)); 270 break; 271 case E1000_RDBAL(0): 272 for (n = 0; n < 4; n++) 273 regs[n] = rd32(E1000_RDBAL(n)); 274 break; 275 case E1000_RDBAH(0): 276 for (n = 0; n < 4; n++) 277 regs[n] = rd32(E1000_RDBAH(n)); 278 break; 279 case E1000_TDBAL(0): 280 for (n = 0; n < 4; n++) 281 regs[n] = rd32(E1000_RDBAL(n)); 282 break; 283 case E1000_TDBAH(0): 284 for (n = 0; n < 4; n++) 285 regs[n] = rd32(E1000_TDBAH(n)); 286 break; 287 case E1000_TDLEN(0): 288 for (n = 0; n < 4; n++) 289 regs[n] = rd32(E1000_TDLEN(n)); 290 break; 291 case E1000_TDH(0): 292 for (n = 0; n < 4; n++) 293 regs[n] = rd32(E1000_TDH(n)); 294 break; 295 case E1000_TDT(0): 296 for (n = 0; n < 4; n++) 297 regs[n] = rd32(E1000_TDT(n)); 298 break; 299 case E1000_TXDCTL(0): 300 for (n = 0; n < 4; n++) 301 regs[n] = rd32(E1000_TXDCTL(n)); 302 break; 303 default: 304 printk(KERN_INFO "%-15s %08x\n", 305 reginfo->name, rd32(reginfo->ofs)); 306 return; 307 } 308 309 snprintf(rname, 16, "%s%s", reginfo->name, "[0-3]"); 310 printk(KERN_INFO "%-15s ", rname); 311 for (n = 0; n < 4; n++) 312 printk(KERN_CONT "%08x ", regs[n]); 313 printk(KERN_CONT "\n"); 314} 315 316/* 317 * igb_dump - Print registers, tx-rings and rx-rings 318 */ 319static void igb_dump(struct igb_adapter *adapter) 320{ 321 struct net_device *netdev = adapter->netdev; 322 struct e1000_hw *hw = &adapter->hw; 323 struct igb_reg_info *reginfo; 324 int n = 0; 325 struct igb_ring *tx_ring; 326 union e1000_adv_tx_desc *tx_desc; 327 struct my_u0 { u64 a; u64 b; } *u0; 328 struct igb_buffer *buffer_info; 329 struct igb_ring *rx_ring; 330 union e1000_adv_rx_desc *rx_desc; 331 u32 staterr; 332 int i = 0; 333 334 if (!netif_msg_hw(adapter)) 335 return; 336 337 /* Print netdevice Info */ 338 if (netdev) { 339 dev_info(&adapter->pdev->dev, "Net device Info\n"); 340 printk(KERN_INFO "Device Name state " 341 "trans_start last_rx\n"); 342 printk(KERN_INFO "%-15s %016lX %016lX %016lX\n", 343 netdev->name, 344 netdev->state, 345 netdev->trans_start, 346 netdev->last_rx); 347 } 348 349 /* Print Registers */ 350 dev_info(&adapter->pdev->dev, "Register Dump\n"); 351 printk(KERN_INFO " Register Name Value\n"); 352 for (reginfo = (struct igb_reg_info *)igb_reg_info_tbl; 353 reginfo->name; reginfo++) { 354 igb_regdump(hw, reginfo); 355 } 356 357 /* Print TX Ring Summary */ 358 if (!netdev || !netif_running(netdev)) 359 goto exit; 360 361 dev_info(&adapter->pdev->dev, "TX Rings Summary\n"); 362 printk(KERN_INFO "Queue [NTU] [NTC] [bi(ntc)->dma ]" 363 " leng ntw timestamp\n"); 364 for (n = 0; n < adapter->num_tx_queues; n++) { 365 tx_ring = adapter->tx_ring[n]; 366 buffer_info = &tx_ring->buffer_info[tx_ring->next_to_clean]; 367 printk(KERN_INFO " %5d %5X %5X %016llX %04X %3X %016llX\n", 368 n, tx_ring->next_to_use, tx_ring->next_to_clean, 369 (u64)buffer_info->dma, 370 buffer_info->length, 371 buffer_info->next_to_watch, 372 (u64)buffer_info->time_stamp); 373 } 374 375 /* Print TX Rings */ 376 if (!netif_msg_tx_done(adapter)) 377 goto rx_ring_summary; 378 379 dev_info(&adapter->pdev->dev, "TX Rings Dump\n"); 380 381 /* Transmit Descriptor Formats 382 * 383 * Advanced Transmit Descriptor 384 * +--------------------------------------------------------------+ 385 * 0 | Buffer Address [63:0] | 386 * +--------------------------------------------------------------+ 387 * 8 | PAYLEN | PORTS |CC|IDX | STA | DCMD |DTYP|MAC|RSV| DTALEN | 388 * +--------------------------------------------------------------+ 389 * 63 46 45 40 39 38 36 35 32 31 24 15 0 390 */ 391 392 for (n = 0; n < adapter->num_tx_queues; n++) { 393 tx_ring = adapter->tx_ring[n]; 394 printk(KERN_INFO "------------------------------------\n"); 395 printk(KERN_INFO "TX QUEUE INDEX = %d\n", tx_ring->queue_index); 396 printk(KERN_INFO "------------------------------------\n"); 397 printk(KERN_INFO "T [desc] [address 63:0 ] " 398 "[PlPOCIStDDM Ln] [bi->dma ] " 399 "leng ntw timestamp bi->skb\n"); 400 401 for (i = 0; tx_ring->desc && (i < tx_ring->count); i++) { 402 tx_desc = E1000_TX_DESC_ADV(*tx_ring, i); 403 buffer_info = &tx_ring->buffer_info[i]; 404 u0 = (struct my_u0 *)tx_desc; 405 printk(KERN_INFO "T [0x%03X] %016llX %016llX %016llX" 406 " %04X %3X %016llX %p", i, 407 le64_to_cpu(u0->a), 408 le64_to_cpu(u0->b), 409 (u64)buffer_info->dma, 410 buffer_info->length, 411 buffer_info->next_to_watch, 412 (u64)buffer_info->time_stamp, 413 buffer_info->skb); 414 if (i == tx_ring->next_to_use && 415 i == tx_ring->next_to_clean) 416 printk(KERN_CONT " NTC/U\n"); 417 else if (i == tx_ring->next_to_use) 418 printk(KERN_CONT " NTU\n"); 419 else if (i == tx_ring->next_to_clean) 420 printk(KERN_CONT " NTC\n"); 421 else 422 printk(KERN_CONT "\n"); 423 424 if (netif_msg_pktdata(adapter) && buffer_info->dma != 0) 425 print_hex_dump(KERN_INFO, "", 426 DUMP_PREFIX_ADDRESS, 427 16, 1, phys_to_virt(buffer_info->dma), 428 buffer_info->length, true); 429 } 430 } 431 432 /* Print RX Rings Summary */ 433rx_ring_summary: 434 dev_info(&adapter->pdev->dev, "RX Rings Summary\n"); 435 printk(KERN_INFO "Queue [NTU] [NTC]\n"); 436 for (n = 0; n < adapter->num_rx_queues; n++) { 437 rx_ring = adapter->rx_ring[n]; 438 printk(KERN_INFO " %5d %5X %5X\n", n, 439 rx_ring->next_to_use, rx_ring->next_to_clean); 440 } 441 442 /* Print RX Rings */ 443 if (!netif_msg_rx_status(adapter)) 444 goto exit; 445 446 dev_info(&adapter->pdev->dev, "RX Rings Dump\n"); 447 448 /* Advanced Receive Descriptor (Read) Format 449 * 63 1 0 450 * +-----------------------------------------------------+ 451 * 0 | Packet Buffer Address [63:1] |A0/NSE| 452 * +----------------------------------------------+------+ 453 * 8 | Header Buffer Address [63:1] | DD | 454 * +-----------------------------------------------------+ 455 * 456 * 457 * Advanced Receive Descriptor (Write-Back) Format 458 * 459 * 63 48 47 32 31 30 21 20 17 16 4 3 0 460 * +------------------------------------------------------+ 461 * 0 | Packet IP |SPH| HDR_LEN | RSV|Packet| RSS | 462 * | Checksum Ident | | | | Type | Type | 463 * +------------------------------------------------------+ 464 * 8 | VLAN Tag | Length | Extended Error | Extended Status | 465 * +------------------------------------------------------+ 466 * 63 48 47 32 31 20 19 0 467 */ 468 469 for (n = 0; n < adapter->num_rx_queues; n++) { 470 rx_ring = adapter->rx_ring[n]; 471 printk(KERN_INFO "------------------------------------\n"); 472 printk(KERN_INFO "RX QUEUE INDEX = %d\n", rx_ring->queue_index); 473 printk(KERN_INFO "------------------------------------\n"); 474 printk(KERN_INFO "R [desc] [ PktBuf A0] " 475 "[ HeadBuf DD] [bi->dma ] [bi->skb] " 476 "<-- Adv Rx Read format\n"); 477 printk(KERN_INFO "RWB[desc] [PcsmIpSHl PtRs] " 478 "[vl er S cks ln] ---------------- [bi->skb] " 479 "<-- Adv Rx Write-Back format\n"); 480 481 for (i = 0; i < rx_ring->count; i++) { 482 buffer_info = &rx_ring->buffer_info[i]; 483 rx_desc = E1000_RX_DESC_ADV(*rx_ring, i); 484 u0 = (struct my_u0 *)rx_desc; 485 staterr = le32_to_cpu(rx_desc->wb.upper.status_error); 486 if (staterr & E1000_RXD_STAT_DD) { 487 /* Descriptor Done */ 488 printk(KERN_INFO "RWB[0x%03X] %016llX " 489 "%016llX ---------------- %p", i, 490 le64_to_cpu(u0->a), 491 le64_to_cpu(u0->b), 492 buffer_info->skb); 493 } else { 494 printk(KERN_INFO "R [0x%03X] %016llX " 495 "%016llX %016llX %p", i, 496 le64_to_cpu(u0->a), 497 le64_to_cpu(u0->b), 498 (u64)buffer_info->dma, 499 buffer_info->skb); 500 501 if (netif_msg_pktdata(adapter)) { 502 print_hex_dump(KERN_INFO, "", 503 DUMP_PREFIX_ADDRESS, 504 16, 1, 505 phys_to_virt(buffer_info->dma), 506 rx_ring->rx_buffer_len, true); 507 if (rx_ring->rx_buffer_len 508 < IGB_RXBUFFER_1024) 509 print_hex_dump(KERN_INFO, "", 510 DUMP_PREFIX_ADDRESS, 511 16, 1, 512 phys_to_virt( 513 buffer_info->page_dma + 514 buffer_info->page_offset), 515 PAGE_SIZE/2, true); 516 } 517 } 518 519 if (i == rx_ring->next_to_use) 520 printk(KERN_CONT " NTU\n"); 521 else if (i == rx_ring->next_to_clean) 522 printk(KERN_CONT " NTC\n"); 523 else 524 printk(KERN_CONT "\n"); 525 526 } 527 } 528 529exit: 530 return; 531} 532 533 534/** 535 * igb_read_clock - read raw cycle counter (to be used by time counter) 536 */ 537static cycle_t igb_read_clock(const struct cyclecounter *tc) 538{ 539 struct igb_adapter *adapter = 540 container_of(tc, struct igb_adapter, cycles); 541 struct e1000_hw *hw = &adapter->hw; 542 u64 stamp = 0; 543 int shift = 0; 544 545 /* 546 * The timestamp latches on lowest register read. For the 82580 547 * the lowest register is SYSTIMR instead of SYSTIML. However we never 548 * adjusted TIMINCA so SYSTIMR will just read as all 0s so ignore it. 549 */ 550 if (hw->mac.type == e1000_82580) { 551 stamp = rd32(E1000_SYSTIMR) >> 8; 552 shift = IGB_82580_TSYNC_SHIFT; 553 } 554 555 stamp |= (u64)rd32(E1000_SYSTIML) << shift; 556 stamp |= (u64)rd32(E1000_SYSTIMH) << (shift + 32); 557 return stamp; 558} 559 560/** 561 * igb_get_hw_dev - return device 562 * used by hardware layer to print debugging information 563 **/ 564struct net_device *igb_get_hw_dev(struct e1000_hw *hw) 565{ 566 struct igb_adapter *adapter = hw->back; 567 return adapter->netdev; 568} 569 570/** 571 * igb_init_module - Driver Registration Routine 572 * 573 * igb_init_module is the first routine called when the driver is 574 * loaded. All it does is register with the PCI subsystem. 575 **/ 576static int __init igb_init_module(void) 577{ 578 int ret; 579 printk(KERN_INFO "%s - version %s\n", 580 igb_driver_string, igb_driver_version); 581 582 printk(KERN_INFO "%s\n", igb_copyright); 583 584#ifdef CONFIG_IGB_DCA 585 dca_register_notify(&dca_notifier); 586#endif 587 ret = pci_register_driver(&igb_driver); 588 return ret; 589} 590 591module_init(igb_init_module); 592 593/** 594 * igb_exit_module - Driver Exit Cleanup Routine 595 * 596 * igb_exit_module is called just before the driver is removed 597 * from memory. 598 **/ 599static void __exit igb_exit_module(void) 600{ 601#ifdef CONFIG_IGB_DCA 602 dca_unregister_notify(&dca_notifier); 603#endif 604 pci_unregister_driver(&igb_driver); 605} 606 607module_exit(igb_exit_module); 608 609#define Q_IDX_82576(i) (((i & 0x1) << 3) + (i >> 1)) 610/** 611 * igb_cache_ring_register - Descriptor ring to register mapping 612 * @adapter: board private structure to initialize 613 * 614 * Once we know the feature-set enabled for the device, we'll cache 615 * the register offset the descriptor ring is assigned to. 616 **/ 617static void igb_cache_ring_register(struct igb_adapter *adapter) 618{ 619 int i = 0, j = 0; 620 u32 rbase_offset = adapter->vfs_allocated_count; 621 622 switch (adapter->hw.mac.type) { 623 case e1000_82576: 624 /* The queues are allocated for virtualization such that VF 0 625 * is allocated queues 0 and 8, VF 1 queues 1 and 9, etc. 626 * In order to avoid collision we start at the first free queue 627 * and continue consuming queues in the same sequence 628 */ 629 if (adapter->vfs_allocated_count) { 630 for (; i < adapter->rss_queues; i++) 631 adapter->rx_ring[i]->reg_idx = rbase_offset + 632 Q_IDX_82576(i); 633 } 634 case e1000_82575: 635 case e1000_82580: 636 case e1000_i350: 637 default: 638 for (; i < adapter->num_rx_queues; i++) 639 adapter->rx_ring[i]->reg_idx = rbase_offset + i; 640 for (; j < adapter->num_tx_queues; j++) 641 adapter->tx_ring[j]->reg_idx = rbase_offset + j; 642 break; 643 } 644} 645 646static void igb_free_queues(struct igb_adapter *adapter) 647{ 648 int i; 649 650 for (i = 0; i < adapter->num_tx_queues; i++) { 651 kfree(adapter->tx_ring[i]); 652 adapter->tx_ring[i] = NULL; 653 } 654 for (i = 0; i < adapter->num_rx_queues; i++) { 655 kfree(adapter->rx_ring[i]); 656 adapter->rx_ring[i] = NULL; 657 } 658 adapter->num_rx_queues = 0; 659 adapter->num_tx_queues = 0; 660} 661 662/** 663 * igb_alloc_queues - Allocate memory for all rings 664 * @adapter: board private structure to initialize 665 * 666 * We allocate one ring per queue at run-time since we don't know the 667 * number of queues at compile-time. 668 **/ 669static int igb_alloc_queues(struct igb_adapter *adapter) 670{ 671 struct igb_ring *ring; 672 int i; 673 674 for (i = 0; i < adapter->num_tx_queues; i++) { 675 ring = kzalloc(sizeof(struct igb_ring), GFP_KERNEL); 676 if (!ring) 677 goto err; 678 ring->count = adapter->tx_ring_count; 679 ring->queue_index = i; 680 ring->dev = &adapter->pdev->dev; 681 ring->netdev = adapter->netdev; 682 /* For 82575, context index must be unique per ring. */ 683 if (adapter->hw.mac.type == e1000_82575) 684 ring->flags = IGB_RING_FLAG_TX_CTX_IDX; 685 adapter->tx_ring[i] = ring; 686 } 687 688 for (i = 0; i < adapter->num_rx_queues; i++) { 689 ring = kzalloc(sizeof(struct igb_ring), GFP_KERNEL); 690 if (!ring) 691 goto err; 692 ring->count = adapter->rx_ring_count; 693 ring->queue_index = i; 694 ring->dev = &adapter->pdev->dev; 695 ring->netdev = adapter->netdev; 696 ring->rx_buffer_len = MAXIMUM_ETHERNET_VLAN_SIZE; 697 ring->flags = IGB_RING_FLAG_RX_CSUM; /* enable rx checksum */ 698 /* set flag indicating ring supports SCTP checksum offload */ 699 if (adapter->hw.mac.type >= e1000_82576) 700 ring->flags |= IGB_RING_FLAG_RX_SCTP_CSUM; 701 adapter->rx_ring[i] = ring; 702 } 703 704 igb_cache_ring_register(adapter); 705 706 return 0; 707 708err: 709 igb_free_queues(adapter); 710 711 return -ENOMEM; 712} 713 714#define IGB_N0_QUEUE -1 715static void igb_assign_vector(struct igb_q_vector *q_vector, int msix_vector) 716{ 717 u32 msixbm = 0; 718 struct igb_adapter *adapter = q_vector->adapter; 719 struct e1000_hw *hw = &adapter->hw; 720 u32 ivar, index; 721 int rx_queue = IGB_N0_QUEUE; 722 int tx_queue = IGB_N0_QUEUE; 723 724 if (q_vector->rx_ring) 725 rx_queue = q_vector->rx_ring->reg_idx; 726 if (q_vector->tx_ring) 727 tx_queue = q_vector->tx_ring->reg_idx; 728 729 switch (hw->mac.type) { 730 case e1000_82575: 731 /* The 82575 assigns vectors using a bitmask, which matches the 732 bitmask for the EICR/EIMS/EIMC registers. To assign one 733 or more queues to a vector, we write the appropriate bits 734 into the MSIXBM register for that vector. */ 735 if (rx_queue > IGB_N0_QUEUE) 736 msixbm = E1000_EICR_RX_QUEUE0 << rx_queue; 737 if (tx_queue > IGB_N0_QUEUE) 738 msixbm |= E1000_EICR_TX_QUEUE0 << tx_queue; 739 if (!adapter->msix_entries && msix_vector == 0) 740 msixbm |= E1000_EIMS_OTHER; 741 array_wr32(E1000_MSIXBM(0), msix_vector, msixbm); 742 q_vector->eims_value = msixbm; 743 break; 744 case e1000_82576: 745 /* 82576 uses a table-based method for assigning vectors. 746 Each queue has a single entry in the table to which we write 747 a vector number along with a "valid" bit. Sadly, the layout 748 of the table is somewhat counterintuitive. */ 749 if (rx_queue > IGB_N0_QUEUE) { 750 index = (rx_queue & 0x7); 751 ivar = array_rd32(E1000_IVAR0, index); 752 if (rx_queue < 8) { 753 /* vector goes into low byte of register */ 754 ivar = ivar & 0xFFFFFF00; 755 ivar |= msix_vector | E1000_IVAR_VALID; 756 } else { 757 /* vector goes into third byte of register */ 758 ivar = ivar & 0xFF00FFFF; 759 ivar |= (msix_vector | E1000_IVAR_VALID) << 16; 760 } 761 array_wr32(E1000_IVAR0, index, ivar); 762 } 763 if (tx_queue > IGB_N0_QUEUE) { 764 index = (tx_queue & 0x7); 765 ivar = array_rd32(E1000_IVAR0, index); 766 if (tx_queue < 8) { 767 /* vector goes into second byte of register */ 768 ivar = ivar & 0xFFFF00FF; 769 ivar |= (msix_vector | E1000_IVAR_VALID) << 8; 770 } else { 771 /* vector goes into high byte of register */ 772 ivar = ivar & 0x00FFFFFF; 773 ivar |= (msix_vector | E1000_IVAR_VALID) << 24; 774 } 775 array_wr32(E1000_IVAR0, index, ivar); 776 } 777 q_vector->eims_value = 1 << msix_vector; 778 break; 779 case e1000_82580: 780 case e1000_i350: 781 /* 82580 uses the same table-based approach as 82576 but has fewer 782 entries as a result we carry over for queues greater than 4. */ 783 if (rx_queue > IGB_N0_QUEUE) { 784 index = (rx_queue >> 1); 785 ivar = array_rd32(E1000_IVAR0, index); 786 if (rx_queue & 0x1) { 787 /* vector goes into third byte of register */ 788 ivar = ivar & 0xFF00FFFF; 789 ivar |= (msix_vector | E1000_IVAR_VALID) << 16; 790 } else { 791 /* vector goes into low byte of register */ 792 ivar = ivar & 0xFFFFFF00; 793 ivar |= msix_vector | E1000_IVAR_VALID; 794 } 795 array_wr32(E1000_IVAR0, index, ivar); 796 } 797 if (tx_queue > IGB_N0_QUEUE) { 798 index = (tx_queue >> 1); 799 ivar = array_rd32(E1000_IVAR0, index); 800 if (tx_queue & 0x1) { 801 /* vector goes into high byte of register */ 802 ivar = ivar & 0x00FFFFFF; 803 ivar |= (msix_vector | E1000_IVAR_VALID) << 24; 804 } else { 805 /* vector goes into second byte of register */ 806 ivar = ivar & 0xFFFF00FF; 807 ivar |= (msix_vector | E1000_IVAR_VALID) << 8; 808 } 809 array_wr32(E1000_IVAR0, index, ivar); 810 } 811 q_vector->eims_value = 1 << msix_vector; 812 break; 813 default: 814 BUG(); 815 break; 816 } 817 818 /* add q_vector eims value to global eims_enable_mask */ 819 adapter->eims_enable_mask |= q_vector->eims_value; 820 821 /* configure q_vector to set itr on first interrupt */ 822 q_vector->set_itr = 1; 823} 824 825/** 826 * igb_configure_msix - Configure MSI-X hardware 827 * 828 * igb_configure_msix sets up the hardware to properly 829 * generate MSI-X interrupts. 830 **/ 831static void igb_configure_msix(struct igb_adapter *adapter) 832{ 833 u32 tmp; 834 int i, vector = 0; 835 struct e1000_hw *hw = &adapter->hw; 836 837 adapter->eims_enable_mask = 0; 838 839 /* set vector for other causes, i.e. link changes */ 840 switch (hw->mac.type) { 841 case e1000_82575: 842 tmp = rd32(E1000_CTRL_EXT); 843 /* enable MSI-X PBA support*/ 844 tmp |= E1000_CTRL_EXT_PBA_CLR; 845 846 /* Auto-Mask interrupts upon ICR read. */ 847 tmp |= E1000_CTRL_EXT_EIAME; 848 tmp |= E1000_CTRL_EXT_IRCA; 849 850 wr32(E1000_CTRL_EXT, tmp); 851 852 /* enable msix_other interrupt */ 853 array_wr32(E1000_MSIXBM(0), vector++, 854 E1000_EIMS_OTHER); 855 adapter->eims_other = E1000_EIMS_OTHER; 856 857 break; 858 859 case e1000_82576: 860 case e1000_82580: 861 case e1000_i350: 862 /* Turn on MSI-X capability first, or our settings 863 * won't stick. And it will take days to debug. */ 864 wr32(E1000_GPIE, E1000_GPIE_MSIX_MODE | 865 E1000_GPIE_PBA | E1000_GPIE_EIAME | 866 E1000_GPIE_NSICR); 867 868 /* enable msix_other interrupt */ 869 adapter->eims_other = 1 << vector; 870 tmp = (vector++ | E1000_IVAR_VALID) << 8; 871 872 wr32(E1000_IVAR_MISC, tmp); 873 break; 874 default: 875 /* do nothing, since nothing else supports MSI-X */ 876 break; 877 } /* switch (hw->mac.type) */ 878 879 adapter->eims_enable_mask |= adapter->eims_other; 880 881 for (i = 0; i < adapter->num_q_vectors; i++) 882 igb_assign_vector(adapter->q_vector[i], vector++); 883 884 wrfl(); 885} 886 887/** 888 * igb_request_msix - Initialize MSI-X interrupts 889 * 890 * igb_request_msix allocates MSI-X vectors and requests interrupts from the 891 * kernel. 892 **/ 893static int igb_request_msix(struct igb_adapter *adapter) 894{ 895 struct net_device *netdev = adapter->netdev; 896 struct e1000_hw *hw = &adapter->hw; 897 int i, err = 0, vector = 0; 898 899 err = request_irq(adapter->msix_entries[vector].vector, 900 igb_msix_other, 0, netdev->name, adapter); 901 if (err) 902 goto out; 903 vector++; 904 905 for (i = 0; i < adapter->num_q_vectors; i++) { 906 struct igb_q_vector *q_vector = adapter->q_vector[i]; 907 908 q_vector->itr_register = hw->hw_addr + E1000_EITR(vector); 909 910 if (q_vector->rx_ring && q_vector->tx_ring) 911 sprintf(q_vector->name, "%s-TxRx-%u", netdev->name, 912 q_vector->rx_ring->queue_index); 913 else if (q_vector->tx_ring) 914 sprintf(q_vector->name, "%s-tx-%u", netdev->name, 915 q_vector->tx_ring->queue_index); 916 else if (q_vector->rx_ring) 917 sprintf(q_vector->name, "%s-rx-%u", netdev->name, 918 q_vector->rx_ring->queue_index); 919 else 920 sprintf(q_vector->name, "%s-unused", netdev->name); 921 922 err = request_irq(adapter->msix_entries[vector].vector, 923 igb_msix_ring, 0, q_vector->name, 924 q_vector); 925 if (err) 926 goto out; 927 vector++; 928 } 929 930 igb_configure_msix(adapter); 931 return 0; 932out: 933 return err; 934} 935 936static void igb_reset_interrupt_capability(struct igb_adapter *adapter) 937{ 938 if (adapter->msix_entries) { 939 pci_disable_msix(adapter->pdev); 940 kfree(adapter->msix_entries); 941 adapter->msix_entries = NULL; 942 } else if (adapter->flags & IGB_FLAG_HAS_MSI) { 943 pci_disable_msi(adapter->pdev); 944 } 945} 946 947/** 948 * igb_free_q_vectors - Free memory allocated for interrupt vectors 949 * @adapter: board private structure to initialize 950 * 951 * This function frees the memory allocated to the q_vectors. In addition if 952 * NAPI is enabled it will delete any references to the NAPI struct prior 953 * to freeing the q_vector. 954 **/ 955static void igb_free_q_vectors(struct igb_adapter *adapter) 956{ 957 int v_idx; 958 959 for (v_idx = 0; v_idx < adapter->num_q_vectors; v_idx++) { 960 struct igb_q_vector *q_vector = adapter->q_vector[v_idx]; 961 adapter->q_vector[v_idx] = NULL; 962 if (!q_vector) 963 continue; 964 netif_napi_del(&q_vector->napi); 965 kfree(q_vector); 966 } 967 adapter->num_q_vectors = 0; 968} 969 970/** 971 * igb_clear_interrupt_scheme - reset the device to a state of no interrupts 972 * 973 * This function resets the device so that it has 0 rx queues, tx queues, and 974 * MSI-X interrupts allocated. 975 */ 976static void igb_clear_interrupt_scheme(struct igb_adapter *adapter) 977{ 978 igb_free_queues(adapter); 979 igb_free_q_vectors(adapter); 980 igb_reset_interrupt_capability(adapter); 981} 982 983/** 984 * igb_set_interrupt_capability - set MSI or MSI-X if supported 985 * 986 * Attempt to configure interrupts using the best available 987 * capabilities of the hardware and kernel. 988 **/ 989static void igb_set_interrupt_capability(struct igb_adapter *adapter) 990{ 991 int err; 992 int numvecs, i; 993 994 /* Number of supported queues. */ 995 adapter->num_rx_queues = adapter->rss_queues; 996 if (adapter->vfs_allocated_count) 997 adapter->num_tx_queues = 1; 998 else 999 adapter->num_tx_queues = adapter->rss_queues; 1000 1001 /* start with one vector for every rx queue */ 1002 numvecs = adapter->num_rx_queues; 1003 1004 /* if tx handler is separate add 1 for every tx queue */ 1005 if (!(adapter->flags & IGB_FLAG_QUEUE_PAIRS)) 1006 numvecs += adapter->num_tx_queues; 1007 1008 /* store the number of vectors reserved for queues */ 1009 adapter->num_q_vectors = numvecs; 1010 1011 /* add 1 vector for link status interrupts */ 1012 numvecs++; 1013 adapter->msix_entries = kcalloc(numvecs, sizeof(struct msix_entry), 1014 GFP_KERNEL); 1015 if (!adapter->msix_entries) 1016 goto msi_only; 1017 1018 for (i = 0; i < numvecs; i++) 1019 adapter->msix_entries[i].entry = i; 1020 1021 err = pci_enable_msix(adapter->pdev, 1022 adapter->msix_entries, 1023 numvecs); 1024 if (err == 0) 1025 goto out; 1026 1027 igb_reset_interrupt_capability(adapter); 1028 1029 /* If we can't do MSI-X, try MSI */ 1030msi_only: 1031#ifdef CONFIG_PCI_IOV 1032 /* disable SR-IOV for non MSI-X configurations */ 1033 if (adapter->vf_data) { 1034 struct e1000_hw *hw = &adapter->hw; 1035 /* disable iov and allow time for transactions to clear */ 1036 pci_disable_sriov(adapter->pdev); 1037 msleep(500); 1038 1039 kfree(adapter->vf_data); 1040 adapter->vf_data = NULL; 1041 wr32(E1000_IOVCTL, E1000_IOVCTL_REUSE_VFQ); 1042 msleep(100); 1043 dev_info(&adapter->pdev->dev, "IOV Disabled\n"); 1044 } 1045#endif 1046 adapter->vfs_allocated_count = 0; 1047 adapter->rss_queues = 1; 1048 adapter->flags |= IGB_FLAG_QUEUE_PAIRS; 1049 adapter->num_rx_queues = 1; 1050 adapter->num_tx_queues = 1; 1051 adapter->num_q_vectors = 1; 1052 if (!pci_enable_msi(adapter->pdev)) 1053 adapter->flags |= IGB_FLAG_HAS_MSI; 1054out: 1055 /* Notify the stack of the (possibly) reduced Tx Queue count. */ 1056 adapter->netdev->real_num_tx_queues = adapter->num_tx_queues; 1057} 1058 1059/** 1060 * igb_alloc_q_vectors - Allocate memory for interrupt vectors 1061 * @adapter: board private structure to initialize 1062 * 1063 * We allocate one q_vector per queue interrupt. If allocation fails we 1064 * return -ENOMEM. 1065 **/ 1066static int igb_alloc_q_vectors(struct igb_adapter *adapter) 1067{ 1068 struct igb_q_vector *q_vector; 1069 struct e1000_hw *hw = &adapter->hw; 1070 int v_idx; 1071 1072 for (v_idx = 0; v_idx < adapter->num_q_vectors; v_idx++) { 1073 q_vector = kzalloc(sizeof(struct igb_q_vector), GFP_KERNEL); 1074 if (!q_vector) 1075 goto err_out; 1076 q_vector->adapter = adapter; 1077 q_vector->itr_register = hw->hw_addr + E1000_EITR(0); 1078 q_vector->itr_val = IGB_START_ITR; 1079 netif_napi_add(adapter->netdev, &q_vector->napi, igb_poll, 64); 1080 adapter->q_vector[v_idx] = q_vector; 1081 } 1082 return 0; 1083 1084err_out: 1085 igb_free_q_vectors(adapter); 1086 return -ENOMEM; 1087} 1088 1089static void igb_map_rx_ring_to_vector(struct igb_adapter *adapter, 1090 int ring_idx, int v_idx) 1091{ 1092 struct igb_q_vector *q_vector = adapter->q_vector[v_idx]; 1093 1094 q_vector->rx_ring = adapter->rx_ring[ring_idx]; 1095 q_vector->rx_ring->q_vector = q_vector; 1096 q_vector->itr_val = adapter->rx_itr_setting; 1097 if (q_vector->itr_val && q_vector->itr_val <= 3) 1098 q_vector->itr_val = IGB_START_ITR; 1099} 1100 1101static void igb_map_tx_ring_to_vector(struct igb_adapter *adapter, 1102 int ring_idx, int v_idx) 1103{ 1104 struct igb_q_vector *q_vector = adapter->q_vector[v_idx]; 1105 1106 q_vector->tx_ring = adapter->tx_ring[ring_idx]; 1107 q_vector->tx_ring->q_vector = q_vector; 1108 q_vector->itr_val = adapter->tx_itr_setting; 1109 if (q_vector->itr_val && q_vector->itr_val <= 3) 1110 q_vector->itr_val = IGB_START_ITR; 1111} 1112 1113/** 1114 * igb_map_ring_to_vector - maps allocated queues to vectors 1115 * 1116 * This function maps the recently allocated queues to vectors. 1117 **/ 1118static int igb_map_ring_to_vector(struct igb_adapter *adapter) 1119{ 1120 int i; 1121 int v_idx = 0; 1122 1123 if ((adapter->num_q_vectors < adapter->num_rx_queues) || 1124 (adapter->num_q_vectors < adapter->num_tx_queues)) 1125 return -ENOMEM; 1126 1127 if (adapter->num_q_vectors >= 1128 (adapter->num_rx_queues + adapter->num_tx_queues)) { 1129 for (i = 0; i < adapter->num_rx_queues; i++) 1130 igb_map_rx_ring_to_vector(adapter, i, v_idx++); 1131 for (i = 0; i < adapter->num_tx_queues; i++) 1132 igb_map_tx_ring_to_vector(adapter, i, v_idx++); 1133 } else { 1134 for (i = 0; i < adapter->num_rx_queues; i++) { 1135 if (i < adapter->num_tx_queues) 1136 igb_map_tx_ring_to_vector(adapter, i, v_idx); 1137 igb_map_rx_ring_to_vector(adapter, i, v_idx++); 1138 } 1139 for (; i < adapter->num_tx_queues; i++) 1140 igb_map_tx_ring_to_vector(adapter, i, v_idx++); 1141 } 1142 return 0; 1143} 1144 1145/** 1146 * igb_init_interrupt_scheme - initialize interrupts, allocate queues/vectors 1147 * 1148 * This function initializes the interrupts and allocates all of the queues. 1149 **/ 1150static int igb_init_interrupt_scheme(struct igb_adapter *adapter) 1151{ 1152 struct pci_dev *pdev = adapter->pdev; 1153 int err; 1154 1155 igb_set_interrupt_capability(adapter); 1156 1157 err = igb_alloc_q_vectors(adapter); 1158 if (err) { 1159 dev_err(&pdev->dev, "Unable to allocate memory for vectors\n"); 1160 goto err_alloc_q_vectors; 1161 } 1162 1163 err = igb_alloc_queues(adapter); 1164 if (err) { 1165 dev_err(&pdev->dev, "Unable to allocate memory for queues\n"); 1166 goto err_alloc_queues; 1167 } 1168 1169 err = igb_map_ring_to_vector(adapter); 1170 if (err) { 1171 dev_err(&pdev->dev, "Invalid q_vector to ring mapping\n"); 1172 goto err_map_queues; 1173 } 1174 1175 1176 return 0; 1177err_map_queues: 1178 igb_free_queues(adapter); 1179err_alloc_queues: 1180 igb_free_q_vectors(adapter); 1181err_alloc_q_vectors: 1182 igb_reset_interrupt_capability(adapter); 1183 return err; 1184} 1185 1186/** 1187 * igb_request_irq - initialize interrupts 1188 * 1189 * Attempts to configure interrupts using the best available 1190 * capabilities of the hardware and kernel. 1191 **/ 1192static int igb_request_irq(struct igb_adapter *adapter) 1193{ 1194 struct net_device *netdev = adapter->netdev; 1195 struct pci_dev *pdev = adapter->pdev; 1196 int err = 0; 1197 1198 if (adapter->msix_entries) { 1199 err = igb_request_msix(adapter); 1200 if (!err) 1201 goto request_done; 1202 /* fall back to MSI */ 1203 igb_clear_interrupt_scheme(adapter); 1204 if (!pci_enable_msi(adapter->pdev)) 1205 adapter->flags |= IGB_FLAG_HAS_MSI; 1206 igb_free_all_tx_resources(adapter); 1207 igb_free_all_rx_resources(adapter); 1208 adapter->num_tx_queues = 1; 1209 adapter->num_rx_queues = 1; 1210 adapter->num_q_vectors = 1; 1211 err = igb_alloc_q_vectors(adapter); 1212 if (err) { 1213 dev_err(&pdev->dev, 1214 "Unable to allocate memory for vectors\n"); 1215 goto request_done; 1216 } 1217 err = igb_alloc_queues(adapter); 1218 if (err) { 1219 dev_err(&pdev->dev, 1220 "Unable to allocate memory for queues\n"); 1221 igb_free_q_vectors(adapter); 1222 goto request_done; 1223 } 1224 igb_setup_all_tx_resources(adapter); 1225 igb_setup_all_rx_resources(adapter); 1226 } else { 1227 igb_assign_vector(adapter->q_vector[0], 0); 1228 } 1229 1230 if (adapter->flags & IGB_FLAG_HAS_MSI) { 1231 err = request_irq(adapter->pdev->irq, igb_intr_msi, 0, 1232 netdev->name, adapter); 1233 if (!err) 1234 goto request_done; 1235 1236 /* fall back to legacy interrupts */ 1237 igb_reset_interrupt_capability(adapter); 1238 adapter->flags &= ~IGB_FLAG_HAS_MSI; 1239 } 1240 1241 err = request_irq(adapter->pdev->irq, igb_intr, IRQF_SHARED, 1242 netdev->name, adapter); 1243 1244 if (err) 1245 dev_err(&adapter->pdev->dev, "Error %d getting interrupt\n", 1246 err); 1247 1248request_done: 1249 return err; 1250} 1251 1252static void igb_free_irq(struct igb_adapter *adapter) 1253{ 1254 if (adapter->msix_entries) { 1255 int vector = 0, i; 1256 1257 free_irq(adapter->msix_entries[vector++].vector, adapter); 1258 1259 for (i = 0; i < adapter->num_q_vectors; i++) { 1260 struct igb_q_vector *q_vector = adapter->q_vector[i]; 1261 free_irq(adapter->msix_entries[vector++].vector, 1262 q_vector); 1263 } 1264 } else { 1265 free_irq(adapter->pdev->irq, adapter); 1266 } 1267} 1268 1269/** 1270 * igb_irq_disable - Mask off interrupt generation on the NIC 1271 * @adapter: board private structure 1272 **/ 1273static void igb_irq_disable(struct igb_adapter *adapter) 1274{ 1275 struct e1000_hw *hw = &adapter->hw; 1276 1277 /* 1278 * we need to be careful when disabling interrupts. The VFs are also 1279 * mapped into these registers and so clearing the bits can cause 1280 * issues on the VF drivers so we only need to clear what we set 1281 */ 1282 if (adapter->msix_entries) { 1283 u32 regval = rd32(E1000_EIAM); 1284 wr32(E1000_EIAM, regval & ~adapter->eims_enable_mask); 1285 wr32(E1000_EIMC, adapter->eims_enable_mask); 1286 regval = rd32(E1000_EIAC); 1287 wr32(E1000_EIAC, regval & ~adapter->eims_enable_mask); 1288 } 1289 1290 wr32(E1000_IAM, 0); 1291 wr32(E1000_IMC, ~0); 1292 wrfl(); 1293 if (adapter->msix_entries) { 1294 int i; 1295 for (i = 0; i < adapter->num_q_vectors; i++) 1296 synchronize_irq(adapter->msix_entries[i].vector); 1297 } else { 1298 synchronize_irq(adapter->pdev->irq); 1299 } 1300} 1301 1302/** 1303 * igb_irq_enable - Enable default interrupt generation settings 1304 * @adapter: board private structure 1305 **/ 1306static void igb_irq_enable(struct igb_adapter *adapter) 1307{ 1308 struct e1000_hw *hw = &adapter->hw; 1309 1310 if (adapter->msix_entries) { 1311 u32 ims = E1000_IMS_LSC | E1000_IMS_DOUTSYNC; 1312 u32 regval = rd32(E1000_EIAC); 1313 wr32(E1000_EIAC, regval | adapter->eims_enable_mask); 1314 regval = rd32(E1000_EIAM); 1315 wr32(E1000_EIAM, regval | adapter->eims_enable_mask); 1316 wr32(E1000_EIMS, adapter->eims_enable_mask); 1317 if (adapter->vfs_allocated_count) { 1318 wr32(E1000_MBVFIMR, 0xFF); 1319 ims |= E1000_IMS_VMMB; 1320 } 1321 if (adapter->hw.mac.type == e1000_82580) 1322 ims |= E1000_IMS_DRSTA; 1323 1324 wr32(E1000_IMS, ims); 1325 } else { 1326 wr32(E1000_IMS, IMS_ENABLE_MASK | 1327 E1000_IMS_DRSTA); 1328 wr32(E1000_IAM, IMS_ENABLE_MASK | 1329 E1000_IMS_DRSTA); 1330 } 1331} 1332 1333static void igb_update_mng_vlan(struct igb_adapter *adapter) 1334{ 1335 struct e1000_hw *hw = &adapter->hw; 1336 u16 vid = adapter->hw.mng_cookie.vlan_id; 1337 u16 old_vid = adapter->mng_vlan_id; 1338 1339 if (hw->mng_cookie.status & E1000_MNG_DHCP_COOKIE_STATUS_VLAN) { 1340 /* add VID to filter table */ 1341 igb_vfta_set(hw, vid, true); 1342 adapter->mng_vlan_id = vid; 1343 } else { 1344 adapter->mng_vlan_id = IGB_MNG_VLAN_NONE; 1345 } 1346 1347 if ((old_vid != (u16)IGB_MNG_VLAN_NONE) && 1348 (vid != old_vid) && 1349 !vlan_group_get_device(adapter->vlgrp, old_vid)) { 1350 /* remove VID from filter table */ 1351 igb_vfta_set(hw, old_vid, false); 1352 } 1353} 1354 1355/** 1356 * igb_release_hw_control - release control of the h/w to f/w 1357 * @adapter: address of board private structure 1358 * 1359 * igb_release_hw_control resets CTRL_EXT:DRV_LOAD bit. 1360 * For ASF and Pass Through versions of f/w this means that the 1361 * driver is no longer loaded. 1362 * 1363 **/ 1364static void igb_release_hw_control(struct igb_adapter *adapter) 1365{ 1366 struct e1000_hw *hw = &adapter->hw; 1367 u32 ctrl_ext; 1368 1369 /* Let firmware take over control of h/w */ 1370 ctrl_ext = rd32(E1000_CTRL_EXT); 1371 wr32(E1000_CTRL_EXT, 1372 ctrl_ext & ~E1000_CTRL_EXT_DRV_LOAD); 1373} 1374 1375/** 1376 * igb_get_hw_control - get control of the h/w from f/w 1377 * @adapter: address of board private structure 1378 * 1379 * igb_get_hw_control sets CTRL_EXT:DRV_LOAD bit. 1380 * For ASF and Pass Through versions of f/w this means that 1381 * the driver is loaded. 1382 * 1383 **/ 1384static void igb_get_hw_control(struct igb_adapter *adapter) 1385{ 1386 struct e1000_hw *hw = &adapter->hw; 1387 u32 ctrl_ext; 1388 1389 /* Let firmware know the driver has taken over */ 1390 ctrl_ext = rd32(E1000_CTRL_EXT); 1391 wr32(E1000_CTRL_EXT, 1392 ctrl_ext | E1000_CTRL_EXT_DRV_LOAD); 1393} 1394 1395/** 1396 * igb_configure - configure the hardware for RX and TX 1397 * @adapter: private board structure 1398 **/ 1399static void igb_configure(struct igb_adapter *adapter) 1400{ 1401 struct net_device *netdev = adapter->netdev; 1402 int i; 1403 1404 igb_get_hw_control(adapter); 1405 igb_set_rx_mode(netdev); 1406 1407 igb_restore_vlan(adapter); 1408 1409 igb_setup_tctl(adapter); 1410 igb_setup_mrqc(adapter); 1411 igb_setup_rctl(adapter); 1412 1413 igb_configure_tx(adapter); 1414 igb_configure_rx(adapter); 1415 1416 igb_rx_fifo_flush_82575(&adapter->hw); 1417 1418 /* call igb_desc_unused which always leaves 1419 * at least 1 descriptor unused to make sure 1420 * next_to_use != next_to_clean */ 1421 for (i = 0; i < adapter->num_rx_queues; i++) { 1422 struct igb_ring *ring = adapter->rx_ring[i]; 1423 igb_alloc_rx_buffers_adv(ring, igb_desc_unused(ring)); 1424 } 1425} 1426 1427/** 1428 * igb_power_up_link - Power up the phy/serdes link 1429 * @adapter: address of board private structure 1430 **/ 1431void igb_power_up_link(struct igb_adapter *adapter) 1432{ 1433 if (adapter->hw.phy.media_type == e1000_media_type_copper) 1434 igb_power_up_phy_copper(&adapter->hw); 1435 else 1436 igb_power_up_serdes_link_82575(&adapter->hw); 1437} 1438 1439/** 1440 * igb_power_down_link - Power down the phy/serdes link 1441 * @adapter: address of board private structure 1442 */ 1443static void igb_power_down_link(struct igb_adapter *adapter) 1444{ 1445 if (adapter->hw.phy.media_type == e1000_media_type_copper) 1446 igb_power_down_phy_copper_82575(&adapter->hw); 1447 else 1448 igb_shutdown_serdes_link_82575(&adapter->hw); 1449} 1450 1451/** 1452 * igb_up - Open the interface and prepare it to handle traffic 1453 * @adapter: board private structure 1454 **/ 1455int igb_up(struct igb_adapter *adapter) 1456{ 1457 struct e1000_hw *hw = &adapter->hw; 1458 int i; 1459 1460 /* hardware has been reset, we need to reload some things */ 1461 igb_configure(adapter); 1462 1463 clear_bit(__IGB_DOWN, &adapter->state); 1464 1465 for (i = 0; i < adapter->num_q_vectors; i++) { 1466 struct igb_q_vector *q_vector = adapter->q_vector[i]; 1467 napi_enable(&q_vector->napi); 1468 } 1469 if (adapter->msix_entries) 1470 igb_configure_msix(adapter); 1471 else 1472 igb_assign_vector(adapter->q_vector[0], 0); 1473 1474 /* Clear any pending interrupts. */ 1475 rd32(E1000_ICR); 1476 igb_irq_enable(adapter); 1477 1478 /* notify VFs that reset has been completed */ 1479 if (adapter->vfs_allocated_count) { 1480 u32 reg_data = rd32(E1000_CTRL_EXT); 1481 reg_data |= E1000_CTRL_EXT_PFRSTD; 1482 wr32(E1000_CTRL_EXT, reg_data); 1483 } 1484 1485 netif_tx_start_all_queues(adapter->netdev); 1486 1487 /* start the watchdog. */ 1488 hw->mac.get_link_status = 1; 1489 schedule_work(&adapter->watchdog_task); 1490 1491 return 0; 1492} 1493 1494void igb_down(struct igb_adapter *adapter) 1495{ 1496 struct net_device *netdev = adapter->netdev; 1497 struct e1000_hw *hw = &adapter->hw; 1498 u32 tctl, rctl; 1499 int i; 1500 1501 /* signal that we're down so the interrupt handler does not 1502 * reschedule our watchdog timer */ 1503 set_bit(__IGB_DOWN, &adapter->state); 1504 1505 /* disable receives in the hardware */ 1506 rctl = rd32(E1000_RCTL); 1507 wr32(E1000_RCTL, rctl & ~E1000_RCTL_EN); 1508 /* flush and sleep below */ 1509 1510 netif_tx_stop_all_queues(netdev); 1511 1512 /* disable transmits in the hardware */ 1513 tctl = rd32(E1000_TCTL); 1514 tctl &= ~E1000_TCTL_EN; 1515 wr32(E1000_TCTL, tctl); 1516 /* flush both disables and wait for them to finish */ 1517 wrfl(); 1518 msleep(10); 1519 1520 for (i = 0; i < adapter->num_q_vectors; i++) { 1521 struct igb_q_vector *q_vector = adapter->q_vector[i]; 1522 napi_disable(&q_vector->napi); 1523 } 1524 1525 igb_irq_disable(adapter); 1526 1527 del_timer_sync(&adapter->watchdog_timer); 1528 del_timer_sync(&adapter->phy_info_timer); 1529 1530 netif_carrier_off(netdev); 1531 1532 /* record the stats before reset*/ 1533 igb_update_stats(adapter); 1534 1535 adapter->link_speed = 0; 1536 adapter->link_duplex = 0; 1537 1538 if (!pci_channel_offline(adapter->pdev)) 1539 igb_reset(adapter); 1540 igb_clean_all_tx_rings(adapter); 1541 igb_clean_all_rx_rings(adapter); 1542#ifdef CONFIG_IGB_DCA 1543 1544 /* since we reset the hardware DCA settings were cleared */ 1545 igb_setup_dca(adapter); 1546#endif 1547} 1548 1549void igb_reinit_locked(struct igb_adapter *adapter) 1550{ 1551 WARN_ON(in_interrupt()); 1552 while (test_and_set_bit(__IGB_RESETTING, &adapter->state)) 1553 msleep(1); 1554 igb_down(adapter); 1555 igb_up(adapter); 1556 clear_bit(__IGB_RESETTING, &adapter->state); 1557} 1558 1559void igb_reset(struct igb_adapter *adapter) 1560{ 1561 struct pci_dev *pdev = adapter->pdev; 1562 struct e1000_hw *hw = &adapter->hw; 1563 struct e1000_mac_info *mac = &hw->mac; 1564 struct e1000_fc_info *fc = &hw->fc; 1565 u32 pba = 0, tx_space, min_tx_space, min_rx_space; 1566 u16 hwm; 1567 1568 /* Repartition Pba for greater than 9k mtu 1569 * To take effect CTRL.RST is required. 1570 */ 1571 switch (mac->type) { 1572 case e1000_i350: 1573 case e1000_82580: 1574 pba = rd32(E1000_RXPBS); 1575 pba = igb_rxpbs_adjust_82580(pba); 1576 break; 1577 case e1000_82576: 1578 pba = rd32(E1000_RXPBS); 1579 pba &= E1000_RXPBS_SIZE_MASK_82576; 1580 break; 1581 case e1000_82575: 1582 default: 1583 pba = E1000_PBA_34K; 1584 break; 1585 } 1586 1587 if ((adapter->max_frame_size > ETH_FRAME_LEN + ETH_FCS_LEN) && 1588 (mac->type < e1000_82576)) { 1589 /* adjust PBA for jumbo frames */ 1590 wr32(E1000_PBA, pba); 1591 1592 /* To maintain wire speed transmits, the Tx FIFO should be 1593 * large enough to accommodate two full transmit packets, 1594 * rounded up to the next 1KB and expressed in KB. Likewise, 1595 * the Rx FIFO should be large enough to accommodate at least 1596 * one full receive packet and is similarly rounded up and 1597 * expressed in KB. */ 1598 pba = rd32(E1000_PBA); 1599 /* upper 16 bits has Tx packet buffer allocation size in KB */ 1600 tx_space = pba >> 16; 1601 /* lower 16 bits has Rx packet buffer allocation size in KB */ 1602 pba &= 0xffff; 1603 /* the tx fifo also stores 16 bytes of information about the tx 1604 * but don't include ethernet FCS because hardware appends it */ 1605 min_tx_space = (adapter->max_frame_size + 1606 sizeof(union e1000_adv_tx_desc) - 1607 ETH_FCS_LEN) * 2; 1608 min_tx_space = ALIGN(min_tx_space, 1024); 1609 min_tx_space >>= 10; 1610 /* software strips receive CRC, so leave room for it */ 1611 min_rx_space = adapter->max_frame_size; 1612 min_rx_space = ALIGN(min_rx_space, 1024); 1613 min_rx_space >>= 10; 1614 1615 /* If current Tx allocation is less than the min Tx FIFO size, 1616 * and the min Tx FIFO size is less than the current Rx FIFO 1617 * allocation, take space away from current Rx allocation */ 1618 if (tx_space < min_tx_space && 1619 ((min_tx_space - tx_space) < pba)) { 1620 pba = pba - (min_tx_space - tx_space); 1621 1622 /* if short on rx space, rx wins and must trump tx 1623 * adjustment */ 1624 if (pba < min_rx_space) 1625 pba = min_rx_space; 1626 } 1627 wr32(E1000_PBA, pba); 1628 } 1629 1630 /* flow control settings */ 1631 /* The high water mark must be low enough to fit one full frame 1632 * (or the size used for early receive) above it in the Rx FIFO. 1633 * Set it to the lower of: 1634 * - 90% of the Rx FIFO size, or 1635 * - the full Rx FIFO size minus one full frame */ 1636 hwm = min(((pba << 10) * 9 / 10), 1637 ((pba << 10) - 2 * adapter->max_frame_size)); 1638 1639 fc->high_water = hwm & 0xFFF0; /* 16-byte granularity */ 1640 fc->low_water = fc->high_water - 16; 1641 fc->pause_time = 0xFFFF; 1642 fc->send_xon = 1; 1643 fc->current_mode = fc->requested_mode; 1644 1645 /* disable receive for all VFs and wait one second */ 1646 if (adapter->vfs_allocated_count) { 1647 int i; 1648 for (i = 0 ; i < adapter->vfs_allocated_count; i++) 1649 adapter->vf_data[i].flags = 0; 1650 1651 /* ping all the active vfs to let them know we are going down */ 1652 igb_ping_all_vfs(adapter); 1653 1654 /* disable transmits and receives */ 1655 wr32(E1000_VFRE, 0); 1656 wr32(E1000_VFTE, 0); 1657 } 1658 1659 /* Allow time for pending master requests to run */ 1660 hw->mac.ops.reset_hw(hw); 1661 wr32(E1000_WUC, 0); 1662 1663 if (hw->mac.ops.init_hw(hw)) 1664 dev_err(&pdev->dev, "Hardware Error\n"); 1665 1666 if (hw->mac.type == e1000_82580) { 1667 u32 reg = rd32(E1000_PCIEMISC); 1668 wr32(E1000_PCIEMISC, 1669 reg & ~E1000_PCIEMISC_LX_DECISION); 1670 } 1671 if (!netif_running(adapter->netdev)) 1672 igb_power_down_link(adapter); 1673 1674 igb_update_mng_vlan(adapter); 1675 1676 /* Enable h/w to recognize an 802.1Q VLAN Ethernet packet */ 1677 wr32(E1000_VET, ETHERNET_IEEE_VLAN_TYPE); 1678 1679 igb_get_phy_info(hw); 1680} 1681 1682static const struct net_device_ops igb_netdev_ops = { 1683 .ndo_open = igb_open, 1684 .ndo_stop = igb_close, 1685 .ndo_start_xmit = igb_xmit_frame_adv, 1686 .ndo_get_stats = igb_get_stats, 1687 .ndo_set_rx_mode = igb_set_rx_mode, 1688 .ndo_set_multicast_list = igb_set_rx_mode, 1689 .ndo_set_mac_address = igb_set_mac, 1690 .ndo_change_mtu = igb_change_mtu, 1691 .ndo_do_ioctl = igb_ioctl, 1692 .ndo_tx_timeout = igb_tx_timeout, 1693 .ndo_validate_addr = eth_validate_addr, 1694 .ndo_vlan_rx_register = igb_vlan_rx_register, 1695 .ndo_vlan_rx_add_vid = igb_vlan_rx_add_vid, 1696 .ndo_vlan_rx_kill_vid = igb_vlan_rx_kill_vid, 1697 .ndo_set_vf_mac = igb_ndo_set_vf_mac, 1698 .ndo_set_vf_vlan = igb_ndo_set_vf_vlan, 1699 .ndo_set_vf_tx_rate = igb_ndo_set_vf_bw, 1700 .ndo_get_vf_config = igb_ndo_get_vf_config, 1701#ifdef CONFIG_NET_POLL_CONTROLLER 1702 .ndo_poll_controller = igb_netpoll, 1703#endif 1704}; 1705 1706/** 1707 * igb_probe - Device Initialization Routine 1708 * @pdev: PCI device information struct 1709 * @ent: entry in igb_pci_tbl 1710 * 1711 * Returns 0 on success, negative on failure 1712 * 1713 * igb_probe initializes an adapter identified by a pci_dev structure. 1714 * The OS initialization, configuring of the adapter private structure, 1715 * and a hardware reset occur. 1716 **/ 1717static int __devinit igb_probe(struct pci_dev *pdev, 1718 const struct pci_device_id *ent) 1719{ 1720 struct net_device *netdev; 1721 struct igb_adapter *adapter; 1722 struct e1000_hw *hw; 1723 u16 eeprom_data = 0; 1724 static int global_quad_port_a; /* global quad port a indication */ 1725 const struct e1000_info *ei = igb_info_tbl[ent->driver_data]; 1726 unsigned long mmio_start, mmio_len; 1727 int err, pci_using_dac; 1728 u16 eeprom_apme_mask = IGB_EEPROM_APME; 1729 u32 part_num; 1730 1731 /* Catch broken hardware that put the wrong VF device ID in 1732 * the PCIe SR-IOV capability. 1733 */ 1734 if (pdev->is_virtfn) { 1735 WARN(1, KERN_ERR "%s (%hx:%hx) should not be a VF!\n", 1736 pci_name(pdev), pdev->vendor, pdev->device); 1737 return -EINVAL; 1738 } 1739 1740 err = pci_enable_device_mem(pdev); 1741 if (err) 1742 return err; 1743 1744 pci_using_dac = 0; 1745 err = dma_set_mask(&pdev->dev, DMA_BIT_MASK(64)); 1746 if (!err) { 1747 err = dma_set_coherent_mask(&pdev->dev, DMA_BIT_MASK(64)); 1748 if (!err) 1749 pci_using_dac = 1; 1750 } else { 1751 err = dma_set_mask(&pdev->dev, DMA_BIT_MASK(32)); 1752 if (err) { 1753 err = dma_set_coherent_mask(&pdev->dev, DMA_BIT_MASK(32)); 1754 if (err) { 1755 dev_err(&pdev->dev, "No usable DMA " 1756 "configuration, aborting\n"); 1757 goto err_dma; 1758 } 1759 } 1760 } 1761 1762 err = pci_request_selected_regions(pdev, pci_select_bars(pdev, 1763 IORESOURCE_MEM), 1764 igb_driver_name); 1765 if (err) 1766 goto err_pci_reg; 1767 1768 pci_enable_pcie_error_reporting(pdev); 1769 1770 pci_set_master(pdev); 1771 pci_save_state(pdev); 1772 1773 err = -ENOMEM; 1774 netdev = alloc_etherdev_mq(sizeof(struct igb_adapter), 1775 IGB_ABS_MAX_TX_QUEUES); 1776 if (!netdev) 1777 goto err_alloc_etherdev; 1778 1779 SET_NETDEV_DEV(netdev, &pdev->dev); 1780 1781 pci_set_drvdata(pdev, netdev); 1782 adapter = netdev_priv(netdev); 1783 adapter->netdev = netdev; 1784 adapter->pdev = pdev; 1785 hw = &adapter->hw; 1786 hw->back = adapter; 1787 adapter->msg_enable = NETIF_MSG_DRV | NETIF_MSG_PROBE; 1788 1789 mmio_start = pci_resource_start(pdev, 0); 1790 mmio_len = pci_resource_len(pdev, 0); 1791 1792 err = -EIO; 1793 hw->hw_addr = ioremap(mmio_start, mmio_len); 1794 if (!hw->hw_addr) 1795 goto err_ioremap; 1796 1797 netdev->netdev_ops = &igb_netdev_ops; 1798 igb_set_ethtool_ops(netdev); 1799 netdev->watchdog_timeo = 5 * HZ; 1800 1801 strncpy(netdev->name, pci_name(pdev), sizeof(netdev->name) - 1); 1802 1803 netdev->mem_start = mmio_start; 1804 netdev->mem_end = mmio_start + mmio_len; 1805 1806 /* PCI config space info */ 1807 hw->vendor_id = pdev->vendor; 1808 hw->device_id = pdev->device; 1809 hw->revision_id = pdev->revision; 1810 hw->subsystem_vendor_id = pdev->subsystem_vendor; 1811 hw->subsystem_device_id = pdev->subsystem_device; 1812 1813 /* Copy the default MAC, PHY and NVM function pointers */ 1814 memcpy(&hw->mac.ops, ei->mac_ops, sizeof(hw->mac.ops)); 1815 memcpy(&hw->phy.ops, ei->phy_ops, sizeof(hw->phy.ops)); 1816 memcpy(&hw->nvm.ops, ei->nvm_ops, sizeof(hw->nvm.ops)); 1817 /* Initialize skew-specific constants */ 1818 err = ei->get_invariants(hw); 1819 if (err) 1820 goto err_sw_init; 1821 1822 /* setup the private structure */ 1823 err = igb_sw_init(adapter); 1824 if (err) 1825 goto err_sw_init; 1826 1827 igb_get_bus_info_pcie(hw); 1828 1829 hw->phy.autoneg_wait_to_complete = false; 1830 1831 /* Copper options */ 1832 if (hw->phy.media_type == e1000_media_type_copper) { 1833 hw->phy.mdix = AUTO_ALL_MODES; 1834 hw->phy.disable_polarity_correction = false; 1835 hw->phy.ms_type = e1000_ms_hw_default; 1836 } 1837 1838 if (igb_check_reset_block(hw)) 1839 dev_info(&pdev->dev, 1840 "PHY reset is blocked due to SOL/IDER session.\n"); 1841 1842 netdev->features = NETIF_F_SG | 1843 NETIF_F_IP_CSUM | 1844 NETIF_F_HW_VLAN_TX | 1845 NETIF_F_HW_VLAN_RX | 1846 NETIF_F_HW_VLAN_FILTER; 1847 1848 netdev->features |= NETIF_F_IPV6_CSUM; 1849 netdev->features |= NETIF_F_TSO; 1850 netdev->features |= NETIF_F_TSO6; 1851 netdev->features |= NETIF_F_GRO; 1852 1853 netdev->vlan_features |= NETIF_F_TSO; 1854 netdev->vlan_features |= NETIF_F_TSO6; 1855 netdev->vlan_features |= NETIF_F_IP_CSUM; 1856 netdev->vlan_features |= NETIF_F_IPV6_CSUM; 1857 netdev->vlan_features |= NETIF_F_SG; 1858 1859 if (pci_using_dac) 1860 netdev->features |= NETIF_F_HIGHDMA; 1861 1862 if (hw->mac.type >= e1000_82576) 1863 netdev->features |= NETIF_F_SCTP_CSUM; 1864 1865 adapter->en_mng_pt = igb_enable_mng_pass_thru(hw); 1866 1867 /* before reading the NVM, reset the controller to put the device in a 1868 * known good starting state */ 1869 hw->mac.ops.reset_hw(hw); 1870 1871 /* make sure the NVM is good */ 1872 if (igb_validate_nvm_checksum(hw) < 0) { 1873 dev_err(&pdev->dev, "The NVM Checksum Is Not Valid\n"); 1874 err = -EIO; 1875 goto err_eeprom; 1876 } 1877 1878 /* copy the MAC address out of the NVM */ 1879 if (hw->mac.ops.read_mac_addr(hw)) 1880 dev_err(&pdev->dev, "NVM Read Error\n"); 1881 1882 memcpy(netdev->dev_addr, hw->mac.addr, netdev->addr_len); 1883 memcpy(netdev->perm_addr, hw->mac.addr, netdev->addr_len); 1884 1885 if (!is_valid_ether_addr(netdev->perm_addr)) { 1886 dev_err(&pdev->dev, "Invalid MAC Address\n"); 1887 err = -EIO; 1888 goto err_eeprom; 1889 } 1890 1891 setup_timer(&adapter->watchdog_timer, &igb_watchdog, 1892 (unsigned long) adapter); 1893 setup_timer(&adapter->phy_info_timer, &igb_update_phy_info, 1894 (unsigned long) adapter); 1895 1896 INIT_WORK(&adapter->reset_task, igb_reset_task); 1897 INIT_WORK(&adapter->watchdog_task, igb_watchdog_task); 1898 1899 /* Initialize link properties that are user-changeable */ 1900 adapter->fc_autoneg = true; 1901 hw->mac.autoneg = true; 1902 hw->phy.autoneg_advertised = 0x2f; 1903 1904 hw->fc.requested_mode = e1000_fc_default; 1905 hw->fc.current_mode = e1000_fc_default; 1906 1907 igb_validate_mdi_setting(hw); 1908 1909 /* Initial Wake on LAN setting If APM wake is enabled in the EEPROM, 1910 * enable the ACPI Magic Packet filter 1911 */ 1912 1913 if (hw->bus.func == 0) 1914 hw->nvm.ops.read(hw, NVM_INIT_CONTROL3_PORT_A, 1, &eeprom_data); 1915 else if (hw->mac.type == e1000_82580) 1916 hw->nvm.ops.read(hw, NVM_INIT_CONTROL3_PORT_A + 1917 NVM_82580_LAN_FUNC_OFFSET(hw->bus.func), 1, 1918 &eeprom_data); 1919 else if (hw->bus.func == 1) 1920 hw->nvm.ops.read(hw, NVM_INIT_CONTROL3_PORT_B, 1, &eeprom_data); 1921 1922 if (eeprom_data & eeprom_apme_mask) 1923 adapter->eeprom_wol |= E1000_WUFC_MAG; 1924 1925 /* now that we have the eeprom settings, apply the special cases where 1926 * the eeprom may be wrong or the board simply won't support wake on 1927 * lan on a particular port */ 1928 switch (pdev->device) { 1929 case E1000_DEV_ID_82575GB_QUAD_COPPER: 1930 adapter->eeprom_wol = 0; 1931 break; 1932 case E1000_DEV_ID_82575EB_FIBER_SERDES: 1933 case E1000_DEV_ID_82576_FIBER: 1934 case E1000_DEV_ID_82576_SERDES: 1935 /* Wake events only supported on port A for dual fiber 1936 * regardless of eeprom setting */ 1937 if (rd32(E1000_STATUS) & E1000_STATUS_FUNC_1) 1938 adapter->eeprom_wol = 0; 1939 break; 1940 case E1000_DEV_ID_82576_QUAD_COPPER: 1941 case E1000_DEV_ID_82576_QUAD_COPPER_ET2: 1942 /* if quad port adapter, disable WoL on all but port A */ 1943 if (global_quad_port_a != 0) 1944 adapter->eeprom_wol = 0; 1945 else 1946 adapter->flags |= IGB_FLAG_QUAD_PORT_A; 1947 /* Reset for multiple quad port adapters */ 1948 if (++global_quad_port_a == 4) 1949 global_quad_port_a = 0; 1950 break; 1951 } 1952 1953 /* initialize the wol settings based on the eeprom settings */ 1954 adapter->wol = adapter->eeprom_wol; 1955 device_set_wakeup_enable(&adapter->pdev->dev, adapter->wol); 1956 1957 /* reset the hardware with the new settings */ 1958 igb_reset(adapter); 1959 1960 /* let the f/w know that the h/w is now under the control of the 1961 * driver. */ 1962 igb_get_hw_control(adapter); 1963 1964 strcpy(netdev->name, "eth%d"); 1965 err = register_netdev(netdev); 1966 if (err) 1967 goto err_register; 1968 1969 /* carrier off reporting is important to ethtool even BEFORE open */ 1970 netif_carrier_off(netdev); 1971 1972#ifdef CONFIG_IGB_DCA 1973 if (dca_add_requester(&pdev->dev) == 0) { 1974 adapter->flags |= IGB_FLAG_DCA_ENABLED; 1975 dev_info(&pdev->dev, "DCA enabled\n"); 1976 igb_setup_dca(adapter); 1977 } 1978 1979#endif 1980 dev_info(&pdev->dev, "Intel(R) Gigabit Ethernet Network Connection\n"); 1981 /* print bus type/speed/width info */ 1982 dev_info(&pdev->dev, "%s: (PCIe:%s:%s) %pM\n", 1983 netdev->name, 1984 ((hw->bus.speed == e1000_bus_speed_2500) ? "2.5Gb/s" : 1985 (hw->bus.speed == e1000_bus_speed_5000) ? "5.0Gb/s" : 1986 "unknown"), 1987 ((hw->bus.width == e1000_bus_width_pcie_x4) ? "Width x4" : 1988 (hw->bus.width == e1000_bus_width_pcie_x2) ? "Width x2" : 1989 (hw->bus.width == e1000_bus_width_pcie_x1) ? "Width x1" : 1990 "unknown"), 1991 netdev->dev_addr); 1992 1993 igb_read_part_num(hw, &part_num); 1994 dev_info(&pdev->dev, "%s: PBA No: %06x-%03x\n", netdev->name, 1995 (part_num >> 8), (part_num & 0xff)); 1996 1997 dev_info(&pdev->dev, 1998 "Using %s interrupts. %d rx queue(s), %d tx queue(s)\n", 1999 adapter->msix_entries ? "MSI-X" : 2000 (adapter->flags & IGB_FLAG_HAS_MSI) ? "MSI" : "legacy", 2001 adapter->num_rx_queues, adapter->num_tx_queues); 2002 2003 return 0; 2004 2005err_register: 2006 igb_release_hw_control(adapter); 2007err_eeprom: 2008 if (!igb_check_reset_block(hw)) 2009 igb_reset_phy(hw); 2010 2011 if (hw->flash_address) 2012 iounmap(hw->flash_address); 2013err_sw_init: 2014 igb_clear_interrupt_scheme(adapter); 2015 iounmap(hw->hw_addr); 2016err_ioremap: 2017 free_netdev(netdev); 2018err_alloc_etherdev: 2019 pci_release_selected_regions(pdev, 2020 pci_select_bars(pdev, IORESOURCE_MEM)); 2021err_pci_reg: 2022err_dma: 2023 pci_disable_device(pdev); 2024 return err; 2025} 2026 2027/** 2028 * igb_remove - Device Removal Routine 2029 * @pdev: PCI device information struct 2030 * 2031 * igb_remove is called by the PCI subsystem to alert the driver 2032 * that it should release a PCI device. The could be caused by a 2033 * Hot-Plug event, or because the driver is going to be removed from 2034 * memory. 2035 **/ 2036static void __devexit igb_remove(struct pci_dev *pdev) 2037{ 2038 struct net_device *netdev = pci_get_drvdata(pdev); 2039 struct igb_adapter *adapter = netdev_priv(netdev); 2040 struct e1000_hw *hw = &adapter->hw; 2041 2042 /* flush_scheduled work may reschedule our watchdog task, so 2043 * explicitly disable watchdog tasks from being rescheduled */ 2044 set_bit(__IGB_DOWN, &adapter->state); 2045 del_timer_sync(&adapter->watchdog_timer); 2046 del_timer_sync(&adapter->phy_info_timer); 2047 2048 flush_scheduled_work(); 2049 2050#ifdef CONFIG_IGB_DCA 2051 if (adapter->flags & IGB_FLAG_DCA_ENABLED) { 2052 dev_info(&pdev->dev, "DCA disabled\n"); 2053 dca_remove_requester(&pdev->dev); 2054 adapter->flags &= ~IGB_FLAG_DCA_ENABLED; 2055 wr32(E1000_DCA_CTRL, E1000_DCA_CTRL_DCA_MODE_DISABLE); 2056 } 2057#endif 2058 2059 /* Release control of h/w to f/w. If f/w is AMT enabled, this 2060 * would have already happened in close and is redundant. */ 2061 igb_release_hw_control(adapter); 2062 2063 unregister_netdev(netdev); 2064 2065 igb_clear_interrupt_scheme(adapter); 2066 2067#ifdef CONFIG_PCI_IOV 2068 /* reclaim resources allocated to VFs */ 2069 if (adapter->vf_data) { 2070 /* disable iov and allow time for transactions to clear */ 2071 pci_disable_sriov(pdev); 2072 msleep(500); 2073 2074 kfree(adapter->vf_data); 2075 adapter->vf_data = NULL; 2076 wr32(E1000_IOVCTL, E1000_IOVCTL_REUSE_VFQ); 2077 msleep(100); 2078 dev_info(&pdev->dev, "IOV Disabled\n"); 2079 } 2080#endif 2081 2082 iounmap(hw->hw_addr); 2083 if (hw->flash_address) 2084 iounmap(hw->flash_address); 2085 pci_release_selected_regions(pdev, 2086 pci_select_bars(pdev, IORESOURCE_MEM)); 2087 2088 free_netdev(netdev); 2089 2090 pci_disable_pcie_error_reporting(pdev); 2091 2092 pci_disable_device(pdev); 2093} 2094 2095/** 2096 * igb_probe_vfs - Initialize vf data storage and add VFs to pci config space 2097 * @adapter: board private structure to initialize 2098 * 2099 * This function initializes the vf specific data storage and then attempts to 2100 * allocate the VFs. The reason for ordering it this way is because it is much 2101 * mor expensive time wise to disable SR-IOV than it is to allocate and free 2102 * the memory for the VFs. 2103 **/ 2104static void __devinit igb_probe_vfs(struct igb_adapter * adapter) 2105{ 2106#ifdef CONFIG_PCI_IOV 2107 struct pci_dev *pdev = adapter->pdev; 2108 2109 if (adapter->vfs_allocated_count) { 2110 adapter->vf_data = kcalloc(adapter->vfs_allocated_count, 2111 sizeof(struct vf_data_storage), 2112 GFP_KERNEL); 2113 /* if allocation failed then we do not support SR-IOV */ 2114 if (!adapter->vf_data) { 2115 adapter->vfs_allocated_count = 0; 2116 dev_err(&pdev->dev, "Unable to allocate memory for VF " 2117 "Data Storage\n"); 2118 } 2119 } 2120 2121 if (pci_enable_sriov(pdev, adapter->vfs_allocated_count)) { 2122 kfree(adapter->vf_data); 2123 adapter->vf_data = NULL; 2124#endif /* CONFIG_PCI_IOV */ 2125 adapter->vfs_allocated_count = 0; 2126#ifdef CONFIG_PCI_IOV 2127 } else { 2128 unsigned char mac_addr[ETH_ALEN]; 2129 int i; 2130 dev_info(&pdev->dev, "%d vfs allocated\n", 2131 adapter->vfs_allocated_count); 2132 for (i = 0; i < adapter->vfs_allocated_count; i++) { 2133 random_ether_addr(mac_addr); 2134 igb_set_vf_mac(adapter, i, mac_addr); 2135 } 2136 } 2137#endif /* CONFIG_PCI_IOV */ 2138} 2139 2140 2141/** 2142 * igb_init_hw_timer - Initialize hardware timer used with IEEE 1588 timestamp 2143 * @adapter: board private structure to initialize 2144 * 2145 * igb_init_hw_timer initializes the function pointer and values for the hw 2146 * timer found in hardware. 2147 **/ 2148static void igb_init_hw_timer(struct igb_adapter *adapter) 2149{ 2150 struct e1000_hw *hw = &adapter->hw; 2151 2152 switch (hw->mac.type) { 2153 case e1000_i350: 2154 case e1000_82580: 2155 memset(&adapter->cycles, 0, sizeof(adapter->cycles)); 2156 adapter->cycles.read = igb_read_clock; 2157 adapter->cycles.mask = CLOCKSOURCE_MASK(64); 2158 adapter->cycles.mult = 1; 2159 /* 2160 * The 82580 timesync updates the system timer every 8ns by 8ns 2161 * and the value cannot be shifted. Instead we need to shift 2162 * the registers to generate a 64bit timer value. As a result 2163 * SYSTIMR/L/H, TXSTMPL/H, RXSTMPL/H all have to be shifted by 2164 * 24 in order to generate a larger value for synchronization. 2165 */ 2166 adapter->cycles.shift = IGB_82580_TSYNC_SHIFT; 2167 /* disable system timer temporarily by setting bit 31 */ 2168 wr32(E1000_TSAUXC, 0x80000000); 2169 wrfl(); 2170 2171 /* Set registers so that rollover occurs soon to test this. */ 2172 wr32(E1000_SYSTIMR, 0x00000000); 2173 wr32(E1000_SYSTIML, 0x80000000); 2174 wr32(E1000_SYSTIMH, 0x000000FF); 2175 wrfl(); 2176 2177 /* enable system timer by clearing bit 31 */ 2178 wr32(E1000_TSAUXC, 0x0); 2179 wrfl(); 2180 2181 timecounter_init(&adapter->clock, 2182 &adapter->cycles, 2183 ktime_to_ns(ktime_get_real())); 2184 /* 2185 * Synchronize our NIC clock against system wall clock. NIC 2186 * time stamp reading requires ~3us per sample, each sample 2187 * was pretty stable even under load => only require 10 2188 * samples for each offset comparison. 2189 */ 2190 memset(&adapter->compare, 0, sizeof(adapter->compare)); 2191 adapter->compare.source = &adapter->clock; 2192 adapter->compare.target = ktime_get_real; 2193 adapter->compare.num_samples = 10; 2194 timecompare_update(&adapter->compare, 0); 2195 break; 2196 case e1000_82576: 2197 /* 2198 * Initialize hardware timer: we keep it running just in case 2199 * that some program needs it later on. 2200 */ 2201 memset(&adapter->cycles, 0, sizeof(adapter->cycles)); 2202 adapter->cycles.read = igb_read_clock; 2203 adapter->cycles.mask = CLOCKSOURCE_MASK(64); 2204 adapter->cycles.mult = 1; 2205 /** 2206 * Scale the NIC clock cycle by a large factor so that 2207 * relatively small clock corrections can be added or 2208 * substracted at each clock tick. The drawbacks of a large 2209 * factor are a) that the clock register overflows more quickly 2210 * (not such a big deal) and b) that the increment per tick has 2211 * to fit into 24 bits. As a result we need to use a shift of 2212 * 19 so we can fit a value of 16 into the TIMINCA register. 2213 */ 2214 adapter->cycles.shift = IGB_82576_TSYNC_SHIFT; 2215 wr32(E1000_TIMINCA, 2216 (1 << E1000_TIMINCA_16NS_SHIFT) | 2217 (16 << IGB_82576_TSYNC_SHIFT)); 2218 2219 /* Set registers so that rollover occurs soon to test this. */ 2220 wr32(E1000_SYSTIML, 0x00000000); 2221 wr32(E1000_SYSTIMH, 0xFF800000); 2222 wrfl(); 2223 2224 timecounter_init(&adapter->clock, 2225 &adapter->cycles, 2226 ktime_to_ns(ktime_get_real())); 2227 /* 2228 * Synchronize our NIC clock against system wall clock. NIC 2229 * time stamp reading requires ~3us per sample, each sample 2230 * was pretty stable even under load => only require 10 2231 * samples for each offset comparison. 2232 */ 2233 memset(&adapter->compare, 0, sizeof(adapter->compare)); 2234 adapter->compare.source = &adapter->clock; 2235 adapter->compare.target = ktime_get_real; 2236 adapter->compare.num_samples = 10; 2237 timecompare_update(&adapter->compare, 0); 2238 break; 2239 case e1000_82575: 2240 /* 82575 does not support timesync */ 2241 default: 2242 break; 2243 } 2244 2245} 2246 2247/** 2248 * igb_sw_init - Initialize general software structures (struct igb_adapter) 2249 * @adapter: board private structure to initialize 2250 * 2251 * igb_sw_init initializes the Adapter private data structure. 2252 * Fields are initialized based on PCI device information and 2253 * OS network device settings (MTU size). 2254 **/ 2255static int __devinit igb_sw_init(struct igb_adapter *adapter) 2256{ 2257 struct e1000_hw *hw = &adapter->hw; 2258 struct net_device *netdev = adapter->netdev; 2259 struct pci_dev *pdev = adapter->pdev; 2260 2261 pci_read_config_word(pdev, PCI_COMMAND, &hw->bus.pci_cmd_word); 2262 2263 adapter->tx_ring_count = IGB_DEFAULT_TXD; 2264 adapter->rx_ring_count = IGB_DEFAULT_RXD; 2265 adapter->rx_itr_setting = IGB_DEFAULT_ITR; 2266 adapter->tx_itr_setting = IGB_DEFAULT_ITR; 2267 2268 adapter->max_frame_size = netdev->mtu + ETH_HLEN + ETH_FCS_LEN; 2269 adapter->min_frame_size = ETH_ZLEN + ETH_FCS_LEN; 2270 2271#ifdef CONFIG_PCI_IOV 2272 if (hw->mac.type == e1000_82576) 2273 adapter->vfs_allocated_count = (max_vfs > 7) ? 7 : max_vfs; 2274 2275#endif /* CONFIG_PCI_IOV */ 2276 adapter->rss_queues = min_t(u32, IGB_MAX_RX_QUEUES, num_online_cpus()); 2277 2278 /* 2279 * if rss_queues > 4 or vfs are going to be allocated with rss_queues 2280 * then we should combine the queues into a queue pair in order to 2281 * conserve interrupts due to limited supply 2282 */ 2283 if ((adapter->rss_queues > 4) || 2284 ((adapter->rss_queues > 1) && (adapter->vfs_allocated_count > 6))) 2285 adapter->flags |= IGB_FLAG_QUEUE_PAIRS; 2286 2287 /* This call may decrease the number of queues */ 2288 if (igb_init_interrupt_scheme(adapter)) { 2289 dev_err(&pdev->dev, "Unable to allocate memory for queues\n"); 2290 return -ENOMEM; 2291 } 2292 2293 igb_init_hw_timer(adapter); 2294 igb_probe_vfs(adapter); 2295 2296 /* Explicitly disable IRQ since the NIC can be in any state. */ 2297 igb_irq_disable(adapter); 2298 2299 set_bit(__IGB_DOWN, &adapter->state); 2300 return 0; 2301} 2302 2303/** 2304 * igb_open - Called when a network interface is made active 2305 * @netdev: network interface device structure 2306 * 2307 * Returns 0 on success, negative value on failure 2308 * 2309 * The open entry point is called when a network interface is made 2310 * active by the system (IFF_UP). At this point all resources needed 2311 * for transmit and receive operations are allocated, the interrupt 2312 * handler is registered with the OS, the watchdog timer is started, 2313 * and the stack is notified that the interface is ready. 2314 **/ 2315static int igb_open(struct net_device *netdev) 2316{ 2317 struct igb_adapter *adapter = netdev_priv(netdev); 2318 struct e1000_hw *hw = &adapter->hw; 2319 int err; 2320 int i; 2321 2322 /* disallow open during test */ 2323 if (test_bit(__IGB_TESTING, &adapter->state)) 2324 return -EBUSY; 2325 2326 netif_carrier_off(netdev); 2327 2328 /* allocate transmit descriptors */ 2329 err = igb_setup_all_tx_resources(adapter); 2330 if (err) 2331 goto err_setup_tx; 2332 2333 /* allocate receive descriptors */ 2334 err = igb_setup_all_rx_resources(adapter); 2335 if (err) 2336 goto err_setup_rx; 2337 2338 igb_power_up_link(adapter); 2339 2340 /* before we allocate an interrupt, we must be ready to handle it. 2341 * Setting DEBUG_SHIRQ in the kernel makes it fire an interrupt 2342 * as soon as we call pci_request_irq, so we have to setup our 2343 * clean_rx handler before we do so. */ 2344 igb_configure(adapter); 2345 2346 err = igb_request_irq(adapter); 2347 if (err) 2348 goto err_req_irq; 2349 2350 /* From here on the code is the same as igb_up() */ 2351 clear_bit(__IGB_DOWN, &adapter->state); 2352 2353 for (i = 0; i < adapter->num_q_vectors; i++) { 2354 struct igb_q_vector *q_vector = adapter->q_vector[i]; 2355 napi_enable(&q_vector->napi); 2356 } 2357 2358 /* Clear any pending interrupts. */ 2359 rd32(E1000_ICR); 2360 2361 igb_irq_enable(adapter); 2362 2363 /* notify VFs that reset has been completed */ 2364 if (adapter->vfs_allocated_count) { 2365 u32 reg_data = rd32(E1000_CTRL_EXT); 2366 reg_data |= E1000_CTRL_EXT_PFRSTD; 2367 wr32(E1000_CTRL_EXT, reg_data); 2368 } 2369 2370 netif_tx_start_all_queues(netdev); 2371 2372 /* start the watchdog. */ 2373 hw->mac.get_link_status = 1; 2374 schedule_work(&adapter->watchdog_task); 2375 2376 return 0; 2377 2378err_req_irq: 2379 igb_release_hw_control(adapter); 2380 igb_power_down_link(adapter); 2381 igb_free_all_rx_resources(adapter); 2382err_setup_rx: 2383 igb_free_all_tx_resources(adapter); 2384err_setup_tx: 2385 igb_reset(adapter); 2386 2387 return err; 2388} 2389 2390/** 2391 * igb_close - Disables a network interface 2392 * @netdev: network interface device structure 2393 * 2394 * Returns 0, this is not allowed to fail 2395 * 2396 * The close entry point is called when an interface is de-activated 2397 * by the OS. The hardware is still under the driver's control, but 2398 * needs to be disabled. A global MAC reset is issued to stop the 2399 * hardware, and all transmit and receive resources are freed. 2400 **/ 2401static int igb_close(struct net_device *netdev) 2402{ 2403 struct igb_adapter *adapter = netdev_priv(netdev); 2404 2405 WARN_ON(test_bit(__IGB_RESETTING, &adapter->state)); 2406 igb_down(adapter); 2407 2408 igb_free_irq(adapter); 2409 2410 igb_free_all_tx_resources(adapter); 2411 igb_free_all_rx_resources(adapter); 2412 2413 return 0; 2414} 2415 2416/** 2417 * igb_setup_tx_resources - allocate Tx resources (Descriptors) 2418 * @tx_ring: tx descriptor ring (for a specific queue) to setup 2419 * 2420 * Return 0 on success, negative on failure 2421 **/ 2422int igb_setup_tx_resources(struct igb_ring *tx_ring) 2423{ 2424 struct device *dev = tx_ring->dev; 2425 int size; 2426 2427 size = sizeof(struct igb_buffer) * tx_ring->count; 2428 tx_ring->buffer_info = vmalloc(size); 2429 if (!tx_ring->buffer_info) 2430 goto err; 2431 memset(tx_ring->buffer_info, 0, size); 2432 2433 /* round up to nearest 4K */ 2434 tx_ring->size = tx_ring->count * sizeof(union e1000_adv_tx_desc); 2435 tx_ring->size = ALIGN(tx_ring->size, 4096); 2436 2437 tx_ring->desc = dma_alloc_coherent(dev, 2438 tx_ring->size, 2439 &tx_ring->dma, 2440 GFP_KERNEL); 2441 2442 if (!tx_ring->desc) 2443 goto err; 2444 2445 tx_ring->next_to_use = 0; 2446 tx_ring->next_to_clean = 0; 2447 return 0; 2448 2449err: 2450 vfree(tx_ring->buffer_info); 2451 dev_err(dev, 2452 "Unable to allocate memory for the transmit descriptor ring\n"); 2453 return -ENOMEM; 2454} 2455 2456/** 2457 * igb_setup_all_tx_resources - wrapper to allocate Tx resources 2458 * (Descriptors) for all queues 2459 * @adapter: board private structure 2460 * 2461 * Return 0 on success, negative on failure 2462 **/ 2463static int igb_setup_all_tx_resources(struct igb_adapter *adapter) 2464{ 2465 struct pci_dev *pdev = adapter->pdev; 2466 int i, err = 0; 2467 2468 for (i = 0; i < adapter->num_tx_queues; i++) { 2469 err = igb_setup_tx_resources(adapter->tx_ring[i]); 2470 if (err) { 2471 dev_err(&pdev->dev, 2472 "Allocation for Tx Queue %u failed\n", i); 2473 for (i--; i >= 0; i--) 2474 igb_free_tx_resources(adapter->tx_ring[i]); 2475 break; 2476 } 2477 } 2478 2479 for (i = 0; i < IGB_ABS_MAX_TX_QUEUES; i++) { 2480 int r_idx = i % adapter->num_tx_queues; 2481 adapter->multi_tx_table[i] = adapter->tx_ring[r_idx]; 2482 } 2483 return err; 2484} 2485 2486/** 2487 * igb_setup_tctl - configure the transmit control registers 2488 * @adapter: Board private structure 2489 **/ 2490void igb_setup_tctl(struct igb_adapter *adapter) 2491{ 2492 struct e1000_hw *hw = &adapter->hw; 2493 u32 tctl; 2494 2495 /* disable queue 0 which is enabled by default on 82575 and 82576 */ 2496 wr32(E1000_TXDCTL(0), 0); 2497 2498 /* Program the Transmit Control Register */ 2499 tctl = rd32(E1000_TCTL); 2500 tctl &= ~E1000_TCTL_CT; 2501 tctl |= E1000_TCTL_PSP | E1000_TCTL_RTLC | 2502 (E1000_COLLISION_THRESHOLD << E1000_CT_SHIFT); 2503 2504 igb_config_collision_dist(hw); 2505 2506 /* Enable transmits */ 2507 tctl |= E1000_TCTL_EN; 2508 2509 wr32(E1000_TCTL, tctl); 2510} 2511 2512/** 2513 * igb_configure_tx_ring - Configure transmit ring after Reset 2514 * @adapter: board private structure 2515 * @ring: tx ring to configure 2516 * 2517 * Configure a transmit ring after a reset. 2518 **/ 2519void igb_configure_tx_ring(struct igb_adapter *adapter, 2520 struct igb_ring *ring) 2521{ 2522 struct e1000_hw *hw = &adapter->hw; 2523 u32 txdctl; 2524 u64 tdba = ring->dma; 2525 int reg_idx = ring->reg_idx; 2526 2527 /* disable the queue */ 2528 txdctl = rd32(E1000_TXDCTL(reg_idx)); 2529 wr32(E1000_TXDCTL(reg_idx), 2530 txdctl & ~E1000_TXDCTL_QUEUE_ENABLE); 2531 wrfl(); 2532 mdelay(10); 2533 2534 wr32(E1000_TDLEN(reg_idx), 2535 ring->count * sizeof(union e1000_adv_tx_desc)); 2536 wr32(E1000_TDBAL(reg_idx), 2537 tdba & 0x00000000ffffffffULL); 2538 wr32(E1000_TDBAH(reg_idx), tdba >> 32); 2539 2540 ring->head = hw->hw_addr + E1000_TDH(reg_idx); 2541 ring->tail = hw->hw_addr + E1000_TDT(reg_idx); 2542 writel(0, ring->head); 2543 writel(0, ring->tail); 2544 2545 txdctl |= IGB_TX_PTHRESH; 2546 txdctl |= IGB_TX_HTHRESH << 8; 2547 txdctl |= IGB_TX_WTHRESH << 16; 2548 2549 txdctl |= E1000_TXDCTL_QUEUE_ENABLE; 2550 wr32(E1000_TXDCTL(reg_idx), txdctl); 2551} 2552 2553/** 2554 * igb_configure_tx - Configure transmit Unit after Reset 2555 * @adapter: board private structure 2556 * 2557 * Configure the Tx unit of the MAC after a reset. 2558 **/ 2559static void igb_configure_tx(struct igb_adapter *adapter) 2560{ 2561 int i; 2562 2563 for (i = 0; i < adapter->num_tx_queues; i++) 2564 igb_configure_tx_ring(adapter, adapter->tx_ring[i]); 2565} 2566 2567/** 2568 * igb_setup_rx_resources - allocate Rx resources (Descriptors) 2569 * @rx_ring: rx descriptor ring (for a specific queue) to setup 2570 * 2571 * Returns 0 on success, negative on failure 2572 **/ 2573int igb_setup_rx_resources(struct igb_ring *rx_ring) 2574{ 2575 struct device *dev = rx_ring->dev; 2576 int size, desc_len; 2577 2578 size = sizeof(struct igb_buffer) * rx_ring->count; 2579 rx_ring->buffer_info = vmalloc(size); 2580 if (!rx_ring->buffer_info) 2581 goto err; 2582 memset(rx_ring->buffer_info, 0, size); 2583 2584 desc_len = sizeof(union e1000_adv_rx_desc); 2585 2586 /* Round up to nearest 4K */ 2587 rx_ring->size = rx_ring->count * desc_len; 2588 rx_ring->size = ALIGN(rx_ring->size, 4096); 2589 2590 rx_ring->desc = dma_alloc_coherent(dev, 2591 rx_ring->size, 2592 &rx_ring->dma, 2593 GFP_KERNEL); 2594 2595 if (!rx_ring->desc) 2596 goto err; 2597 2598 rx_ring->next_to_clean = 0; 2599 rx_ring->next_to_use = 0; 2600 2601 return 0; 2602 2603err: 2604 vfree(rx_ring->buffer_info); 2605 rx_ring->buffer_info = NULL; 2606 dev_err(dev, "Unable to allocate memory for the receive descriptor" 2607 " ring\n"); 2608 return -ENOMEM; 2609} 2610 2611/** 2612 * igb_setup_all_rx_resources - wrapper to allocate Rx resources 2613 * (Descriptors) for all queues 2614 * @adapter: board private structure 2615 * 2616 * Return 0 on success, negative on failure 2617 **/ 2618static int igb_setup_all_rx_resources(struct igb_adapter *adapter) 2619{ 2620 struct pci_dev *pdev = adapter->pdev; 2621 int i, err = 0; 2622 2623 for (i = 0; i < adapter->num_rx_queues; i++) { 2624 err = igb_setup_rx_resources(adapter->rx_ring[i]); 2625 if (err) { 2626 dev_err(&pdev->dev, 2627 "Allocation for Rx Queue %u failed\n", i); 2628 for (i--; i >= 0; i--) 2629 igb_free_rx_resources(adapter->rx_ring[i]); 2630 break; 2631 } 2632 } 2633 2634 return err; 2635} 2636 2637/** 2638 * igb_setup_mrqc - configure the multiple receive queue control registers 2639 * @adapter: Board private structure 2640 **/ 2641static void igb_setup_mrqc(struct igb_adapter *adapter) 2642{ 2643 struct e1000_hw *hw = &adapter->hw; 2644 u32 mrqc, rxcsum; 2645 u32 j, num_rx_queues, shift = 0, shift2 = 0; 2646 union e1000_reta { 2647 u32 dword; 2648 u8 bytes[4]; 2649 } reta; 2650 static const u8 rsshash[40] = { 2651 0x6d, 0x5a, 0x56, 0xda, 0x25, 0x5b, 0x0e, 0xc2, 0x41, 0x67, 2652 0x25, 0x3d, 0x43, 0xa3, 0x8f, 0xb0, 0xd0, 0xca, 0x2b, 0xcb, 2653 0xae, 0x7b, 0x30, 0xb4, 0x77, 0xcb, 0x2d, 0xa3, 0x80, 0x30, 2654 0xf2, 0x0c, 0x6a, 0x42, 0xb7, 0x3b, 0xbe, 0xac, 0x01, 0xfa }; 2655 2656 /* Fill out hash function seeds */ 2657 for (j = 0; j < 10; j++) { 2658 u32 rsskey = rsshash[(j * 4)]; 2659 rsskey |= rsshash[(j * 4) + 1] << 8; 2660 rsskey |= rsshash[(j * 4) + 2] << 16; 2661 rsskey |= rsshash[(j * 4) + 3] << 24; 2662 array_wr32(E1000_RSSRK(0), j, rsskey); 2663 } 2664 2665 num_rx_queues = adapter->rss_queues; 2666 2667 if (adapter->vfs_allocated_count) { 2668 /* 82575 and 82576 supports 2 RSS queues for VMDq */ 2669 switch (hw->mac.type) { 2670 case e1000_i350: 2671 case e1000_82580: 2672 num_rx_queues = 1; 2673 shift = 0; 2674 break; 2675 case e1000_82576: 2676 shift = 3; 2677 num_rx_queues = 2; 2678 break; 2679 case e1000_82575: 2680 shift = 2; 2681 shift2 = 6; 2682 default: 2683 break; 2684 } 2685 } else { 2686 if (hw->mac.type == e1000_82575) 2687 shift = 6; 2688 } 2689 2690 for (j = 0; j < (32 * 4); j++) { 2691 reta.bytes[j & 3] = (j % num_rx_queues) << shift; 2692 if (shift2) 2693 reta.bytes[j & 3] |= num_rx_queues << shift2; 2694 if ((j & 3) == 3) 2695 wr32(E1000_RETA(j >> 2), reta.dword); 2696 } 2697 2698 /* 2699 * Disable raw packet checksumming so that RSS hash is placed in 2700 * descriptor on writeback. No need to enable TCP/UDP/IP checksum 2701 * offloads as they are enabled by default 2702 */ 2703 rxcsum = rd32(E1000_RXCSUM); 2704 rxcsum |= E1000_RXCSUM_PCSD; 2705 2706 if (adapter->hw.mac.type >= e1000_82576) 2707 /* Enable Receive Checksum Offload for SCTP */ 2708 rxcsum |= E1000_RXCSUM_CRCOFL; 2709 2710 /* Don't need to set TUOFL or IPOFL, they default to 1 */ 2711 wr32(E1000_RXCSUM, rxcsum); 2712 2713 /* If VMDq is enabled then we set the appropriate mode for that, else 2714 * we default to RSS so that an RSS hash is calculated per packet even 2715 * if we are only using one queue */ 2716 if (adapter->vfs_allocated_count) { 2717 if (hw->mac.type > e1000_82575) { 2718 /* Set the default pool for the PF's first queue */ 2719 u32 vtctl = rd32(E1000_VT_CTL); 2720 vtctl &= ~(E1000_VT_CTL_DEFAULT_POOL_MASK | 2721 E1000_VT_CTL_DISABLE_DEF_POOL); 2722 vtctl |= adapter->vfs_allocated_count << 2723 E1000_VT_CTL_DEFAULT_POOL_SHIFT; 2724 wr32(E1000_VT_CTL, vtctl); 2725 } 2726 if (adapter->rss_queues > 1) 2727 mrqc = E1000_MRQC_ENABLE_VMDQ_RSS_2Q; 2728 else 2729 mrqc = E1000_MRQC_ENABLE_VMDQ; 2730 } else { 2731 mrqc = E1000_MRQC_ENABLE_RSS_4Q; 2732 } 2733 igb_vmm_control(adapter); 2734 2735 /* 2736 * Generate RSS hash based on TCP port numbers and/or 2737 * IPv4/v6 src and dst addresses since UDP cannot be 2738 * hashed reliably due to IP fragmentation 2739 */ 2740 mrqc |= E1000_MRQC_RSS_FIELD_IPV4 | 2741 E1000_MRQC_RSS_FIELD_IPV4_TCP | 2742 E1000_MRQC_RSS_FIELD_IPV6 | 2743 E1000_MRQC_RSS_FIELD_IPV6_TCP | 2744 E1000_MRQC_RSS_FIELD_IPV6_TCP_EX; 2745 2746 wr32(E1000_MRQC, mrqc); 2747} 2748 2749/** 2750 * igb_setup_rctl - configure the receive control registers 2751 * @adapter: Board private structure 2752 **/ 2753void igb_setup_rctl(struct igb_adapter *adapter) 2754{ 2755 struct e1000_hw *hw = &adapter->hw; 2756 u32 rctl; 2757 2758 rctl = rd32(E1000_RCTL); 2759 2760 rctl &= ~(3 << E1000_RCTL_MO_SHIFT); 2761 rctl &= ~(E1000_RCTL_LBM_TCVR | E1000_RCTL_LBM_MAC); 2762 2763 rctl |= E1000_RCTL_EN | E1000_RCTL_BAM | E1000_RCTL_RDMTS_HALF | 2764 (hw->mac.mc_filter_type << E1000_RCTL_MO_SHIFT); 2765 2766 /* 2767 * enable stripping of CRC. It's unlikely this will break BMC 2768 * redirection as it did with e1000. Newer features require 2769 * that the HW strips the CRC. 2770 */ 2771 rctl |= E1000_RCTL_SECRC; 2772 2773 /* disable store bad packets and clear size bits. */ 2774 rctl &= ~(E1000_RCTL_SBP | E1000_RCTL_SZ_256); 2775 2776 /* enable LPE to prevent packets larger than max_frame_size */ 2777 rctl |= E1000_RCTL_LPE; 2778 2779 /* disable queue 0 to prevent tail write w/o re-config */ 2780 wr32(E1000_RXDCTL(0), 0); 2781 2782 /* Attention!!! For SR-IOV PF driver operations you must enable 2783 * queue drop for all VF and PF queues to prevent head of line blocking 2784 * if an un-trusted VF does not provide descriptors to hardware. 2785 */ 2786 if (adapter->vfs_allocated_count) { 2787 /* set all queue drop enable bits */ 2788 wr32(E1000_QDE, ALL_QUEUES); 2789 } 2790 2791 wr32(E1000_RCTL, rctl); 2792} 2793 2794static inline int igb_set_vf_rlpml(struct igb_adapter *adapter, int size, 2795 int vfn) 2796{ 2797 struct e1000_hw *hw = &adapter->hw; 2798 u32 vmolr; 2799 2800 /* if it isn't the PF check to see if VFs are enabled and 2801 * increase the size to support vlan tags */ 2802 if (vfn < adapter->vfs_allocated_count && 2803 adapter->vf_data[vfn].vlans_enabled) 2804 size += VLAN_TAG_SIZE; 2805 2806 vmolr = rd32(E1000_VMOLR(vfn)); 2807 vmolr &= ~E1000_VMOLR_RLPML_MASK; 2808 vmolr |= size | E1000_VMOLR_LPE; 2809 wr32(E1000_VMOLR(vfn), vmolr); 2810 2811 return 0; 2812} 2813 2814/** 2815 * igb_rlpml_set - set maximum receive packet size 2816 * @adapter: board private structure 2817 * 2818 * Configure maximum receivable packet size. 2819 **/ 2820static void igb_rlpml_set(struct igb_adapter *adapter) 2821{ 2822 u32 max_frame_size = adapter->max_frame_size; 2823 struct e1000_hw *hw = &adapter->hw; 2824 u16 pf_id = adapter->vfs_allocated_count; 2825 2826 if (adapter->vlgrp) 2827 max_frame_size += VLAN_TAG_SIZE; 2828 2829 /* if vfs are enabled we set RLPML to the largest possible request 2830 * size and set the VMOLR RLPML to the size we need */ 2831 if (pf_id) { 2832 igb_set_vf_rlpml(adapter, max_frame_size, pf_id); 2833 max_frame_size = MAX_JUMBO_FRAME_SIZE; 2834 } 2835 2836 wr32(E1000_RLPML, max_frame_size); 2837} 2838 2839static inline void igb_set_vmolr(struct igb_adapter *adapter, 2840 int vfn, bool aupe) 2841{ 2842 struct e1000_hw *hw = &adapter->hw; 2843 u32 vmolr; 2844 2845 /* 2846 * This register exists only on 82576 and newer so if we are older then 2847 * we should exit and do nothing 2848 */ 2849 if (hw->mac.type < e1000_82576) 2850 return; 2851 2852 vmolr = rd32(E1000_VMOLR(vfn)); 2853 vmolr |= E1000_VMOLR_STRVLAN; /* Strip vlan tags */ 2854 if (aupe) 2855 vmolr |= E1000_VMOLR_AUPE; /* Accept untagged packets */ 2856 else 2857 vmolr &= ~(E1000_VMOLR_AUPE); /* Tagged packets ONLY */ 2858 2859 /* clear all bits that might not be set */ 2860 vmolr &= ~(E1000_VMOLR_BAM | E1000_VMOLR_RSSE); 2861 2862 if (adapter->rss_queues > 1 && vfn == adapter->vfs_allocated_count) 2863 vmolr |= E1000_VMOLR_RSSE; /* enable RSS */ 2864 /* 2865 * for VMDq only allow the VFs and pool 0 to accept broadcast and 2866 * multicast packets 2867 */ 2868 if (vfn <= adapter->vfs_allocated_count) 2869 vmolr |= E1000_VMOLR_BAM; /* Accept broadcast */ 2870 2871 wr32(E1000_VMOLR(vfn), vmolr); 2872} 2873 2874/** 2875 * igb_configure_rx_ring - Configure a receive ring after Reset 2876 * @adapter: board private structure 2877 * @ring: receive ring to be configured 2878 * 2879 * Configure the Rx unit of the MAC after a reset. 2880 **/ 2881void igb_configure_rx_ring(struct igb_adapter *adapter, 2882 struct igb_ring *ring) 2883{ 2884 struct e1000_hw *hw = &adapter->hw; 2885 u64 rdba = ring->dma; 2886 int reg_idx = ring->reg_idx; 2887 u32 srrctl, rxdctl; 2888 2889 /* disable the queue */ 2890 rxdctl = rd32(E1000_RXDCTL(reg_idx)); 2891 wr32(E1000_RXDCTL(reg_idx), 2892 rxdctl & ~E1000_RXDCTL_QUEUE_ENABLE); 2893 2894 /* Set DMA base address registers */ 2895 wr32(E1000_RDBAL(reg_idx), 2896 rdba & 0x00000000ffffffffULL); 2897 wr32(E1000_RDBAH(reg_idx), rdba >> 32); 2898 wr32(E1000_RDLEN(reg_idx), 2899 ring->count * sizeof(union e1000_adv_rx_desc)); 2900 2901 /* initialize head and tail */ 2902 ring->head = hw->hw_addr + E1000_RDH(reg_idx); 2903 ring->tail = hw->hw_addr + E1000_RDT(reg_idx); 2904 writel(0, ring->head); 2905 writel(0, ring->tail); 2906 2907 /* set descriptor configuration */ 2908 if (ring->rx_buffer_len < IGB_RXBUFFER_1024) { 2909 srrctl = ALIGN(ring->rx_buffer_len, 64) << 2910 E1000_SRRCTL_BSIZEHDRSIZE_SHIFT; 2911#if (PAGE_SIZE / 2) > IGB_RXBUFFER_16384 2912 srrctl |= IGB_RXBUFFER_16384 >> 2913 E1000_SRRCTL_BSIZEPKT_SHIFT; 2914#else 2915 srrctl |= (PAGE_SIZE / 2) >> 2916 E1000_SRRCTL_BSIZEPKT_SHIFT; 2917#endif 2918 srrctl |= E1000_SRRCTL_DESCTYPE_HDR_SPLIT_ALWAYS; 2919 } else { 2920 srrctl = ALIGN(ring->rx_buffer_len, 1024) >> 2921 E1000_SRRCTL_BSIZEPKT_SHIFT; 2922 srrctl |= E1000_SRRCTL_DESCTYPE_ADV_ONEBUF; 2923 } 2924 if (hw->mac.type == e1000_82580) 2925 srrctl |= E1000_SRRCTL_TIMESTAMP; 2926 /* Only set Drop Enable if we are supporting multiple queues */ 2927 if (adapter->vfs_allocated_count || adapter->num_rx_queues > 1) 2928 srrctl |= E1000_SRRCTL_DROP_EN; 2929 2930 wr32(E1000_SRRCTL(reg_idx), srrctl); 2931 2932 /* set filtering for VMDQ pools */ 2933 igb_set_vmolr(adapter, reg_idx & 0x7, true); 2934 2935 /* enable receive descriptor fetching */ 2936 rxdctl = rd32(E1000_RXDCTL(reg_idx)); 2937 rxdctl |= E1000_RXDCTL_QUEUE_ENABLE; 2938 rxdctl &= 0xFFF00000; 2939 rxdctl |= IGB_RX_PTHRESH; 2940 rxdctl |= IGB_RX_HTHRESH << 8; 2941 rxdctl |= IGB_RX_WTHRESH << 16; 2942 wr32(E1000_RXDCTL(reg_idx), rxdctl); 2943} 2944 2945/** 2946 * igb_configure_rx - Configure receive Unit after Reset 2947 * @adapter: board private structure 2948 * 2949 * Configure the Rx unit of the MAC after a reset. 2950 **/ 2951static void igb_configure_rx(struct igb_adapter *adapter) 2952{ 2953 int i; 2954 2955 /* set UTA to appropriate mode */ 2956 igb_set_uta(adapter); 2957 2958 /* set the correct pool for the PF default MAC address in entry 0 */ 2959 igb_rar_set_qsel(adapter, adapter->hw.mac.addr, 0, 2960 adapter->vfs_allocated_count); 2961 2962 /* Setup the HW Rx Head and Tail Descriptor Pointers and 2963 * the Base and Length of the Rx Descriptor Ring */ 2964 for (i = 0; i < adapter->num_rx_queues; i++) 2965 igb_configure_rx_ring(adapter, adapter->rx_ring[i]); 2966} 2967 2968/** 2969 * igb_free_tx_resources - Free Tx Resources per Queue 2970 * @tx_ring: Tx descriptor ring for a specific queue 2971 * 2972 * Free all transmit software resources 2973 **/ 2974void igb_free_tx_resources(struct igb_ring *tx_ring) 2975{ 2976 igb_clean_tx_ring(tx_ring); 2977 2978 vfree(tx_ring->buffer_info); 2979 tx_ring->buffer_info = NULL; 2980 2981 /* if not set, then don't free */ 2982 if (!tx_ring->desc) 2983 return; 2984 2985 dma_free_coherent(tx_ring->dev, tx_ring->size, 2986 tx_ring->desc, tx_ring->dma); 2987 2988 tx_ring->desc = NULL; 2989} 2990 2991/** 2992 * igb_free_all_tx_resources - Free Tx Resources for All Queues 2993 * @adapter: board private structure 2994 * 2995 * Free all transmit software resources 2996 **/ 2997static void igb_free_all_tx_resources(struct igb_adapter *adapter) 2998{ 2999 int i; 3000 3001 for (i = 0; i < adapter->num_tx_queues; i++) 3002 igb_free_tx_resources(adapter->tx_ring[i]); 3003} 3004 3005void igb_unmap_and_free_tx_resource(struct igb_ring *tx_ring, 3006 struct igb_buffer *buffer_info) 3007{ 3008 if (buffer_info->dma) { 3009 if (buffer_info->mapped_as_page) 3010 dma_unmap_page(tx_ring->dev, 3011 buffer_info->dma, 3012 buffer_info->length, 3013 DMA_TO_DEVICE); 3014 else 3015 dma_unmap_single(tx_ring->dev, 3016 buffer_info->dma, 3017 buffer_info->length, 3018 DMA_TO_DEVICE); 3019 buffer_info->dma = 0; 3020 } 3021 if (buffer_info->skb) { 3022 dev_kfree_skb_any(buffer_info->skb); 3023 buffer_info->skb = NULL; 3024 } 3025 buffer_info->time_stamp = 0; 3026 buffer_info->length = 0; 3027 buffer_info->next_to_watch = 0; 3028 buffer_info->mapped_as_page = false; 3029} 3030 3031/** 3032 * igb_clean_tx_ring - Free Tx Buffers 3033 * @tx_ring: ring to be cleaned 3034 **/ 3035static void igb_clean_tx_ring(struct igb_ring *tx_ring) 3036{ 3037 struct igb_buffer *buffer_info; 3038 unsigned long size; 3039 unsigned int i; 3040 3041 if (!tx_ring->buffer_info) 3042 return; 3043 /* Free all the Tx ring sk_buffs */ 3044 3045 for (i = 0; i < tx_ring->count; i++) { 3046 buffer_info = &tx_ring->buffer_info[i]; 3047 igb_unmap_and_free_tx_resource(tx_ring, buffer_info); 3048 } 3049 3050 size = sizeof(struct igb_buffer) * tx_ring->count; 3051 memset(tx_ring->buffer_info, 0, size); 3052 3053 /* Zero out the descriptor ring */ 3054 memset(tx_ring->desc, 0, tx_ring->size); 3055 3056 tx_ring->next_to_use = 0; 3057 tx_ring->next_to_clean = 0; 3058} 3059 3060/** 3061 * igb_clean_all_tx_rings - Free Tx Buffers for all queues 3062 * @adapter: board private structure 3063 **/ 3064static void igb_clean_all_tx_rings(struct igb_adapter *adapter) 3065{ 3066 int i; 3067 3068 for (i = 0; i < adapter->num_tx_queues; i++) 3069 igb_clean_tx_ring(adapter->tx_ring[i]); 3070} 3071 3072/** 3073 * igb_free_rx_resources - Free Rx Resources 3074 * @rx_ring: ring to clean the resources from 3075 * 3076 * Free all receive software resources 3077 **/ 3078void igb_free_rx_resources(struct igb_ring *rx_ring) 3079{ 3080 igb_clean_rx_ring(rx_ring); 3081 3082 vfree(rx_ring->buffer_info); 3083 rx_ring->buffer_info = NULL; 3084 3085 /* if not set, then don't free */ 3086 if (!rx_ring->desc) 3087 return; 3088 3089 dma_free_coherent(rx_ring->dev, rx_ring->size, 3090 rx_ring->desc, rx_ring->dma); 3091 3092 rx_ring->desc = NULL; 3093} 3094 3095/** 3096 * igb_free_all_rx_resources - Free Rx Resources for All Queues 3097 * @adapter: board private structure 3098 * 3099 * Free all receive software resources 3100 **/ 3101static void igb_free_all_rx_resources(struct igb_adapter *adapter) 3102{ 3103 int i; 3104 3105 for (i = 0; i < adapter->num_rx_queues; i++) 3106 igb_free_rx_resources(adapter->rx_ring[i]); 3107} 3108 3109/** 3110 * igb_clean_rx_ring - Free Rx Buffers per Queue 3111 * @rx_ring: ring to free buffers from 3112 **/ 3113static void igb_clean_rx_ring(struct igb_ring *rx_ring) 3114{ 3115 struct igb_buffer *buffer_info; 3116 unsigned long size; 3117 unsigned int i; 3118 3119 if (!rx_ring->buffer_info) 3120 return; 3121 3122 /* Free all the Rx ring sk_buffs */ 3123 for (i = 0; i < rx_ring->count; i++) { 3124 buffer_info = &rx_ring->buffer_info[i]; 3125 if (buffer_info->dma) { 3126 dma_unmap_single(rx_ring->dev, 3127 buffer_info->dma, 3128 rx_ring->rx_buffer_len, 3129 DMA_FROM_DEVICE); 3130 buffer_info->dma = 0; 3131 } 3132 3133 if (buffer_info->skb) { 3134 dev_kfree_skb(buffer_info->skb); 3135 buffer_info->skb = NULL; 3136 } 3137 if (buffer_info->page_dma) { 3138 dma_unmap_page(rx_ring->dev, 3139 buffer_info->page_dma, 3140 PAGE_SIZE / 2, 3141 DMA_FROM_DEVICE); 3142 buffer_info->page_dma = 0; 3143 } 3144 if (buffer_info->page) { 3145 put_page(buffer_info->page); 3146 buffer_info->page = NULL; 3147 buffer_info->page_offset = 0; 3148 } 3149 } 3150 3151 size = sizeof(struct igb_buffer) * rx_ring->count; 3152 memset(rx_ring->buffer_info, 0, size); 3153 3154 /* Zero out the descriptor ring */ 3155 memset(rx_ring->desc, 0, rx_ring->size); 3156 3157 rx_ring->next_to_clean = 0; 3158 rx_ring->next_to_use = 0; 3159} 3160 3161/** 3162 * igb_clean_all_rx_rings - Free Rx Buffers for all queues 3163 * @adapter: board private structure 3164 **/ 3165static void igb_clean_all_rx_rings(struct igb_adapter *adapter) 3166{ 3167 int i; 3168 3169 for (i = 0; i < adapter->num_rx_queues; i++) 3170 igb_clean_rx_ring(adapter->rx_ring[i]); 3171} 3172 3173/** 3174 * igb_set_mac - Change the Ethernet Address of the NIC 3175 * @netdev: network interface device structure 3176 * @p: pointer to an address structure 3177 * 3178 * Returns 0 on success, negative on failure 3179 **/ 3180static int igb_set_mac(struct net_device *netdev, void *p) 3181{ 3182 struct igb_adapter *adapter = netdev_priv(netdev); 3183 struct e1000_hw *hw = &adapter->hw; 3184 struct sockaddr *addr = p; 3185 3186 if (!is_valid_ether_addr(addr->sa_data)) 3187 return -EADDRNOTAVAIL; 3188 3189 memcpy(netdev->dev_addr, addr->sa_data, netdev->addr_len); 3190 memcpy(hw->mac.addr, addr->sa_data, netdev->addr_len); 3191 3192 /* set the correct pool for the new PF MAC address in entry 0 */ 3193 igb_rar_set_qsel(adapter, hw->mac.addr, 0, 3194 adapter->vfs_allocated_count); 3195 3196 return 0; 3197} 3198 3199/** 3200 * igb_write_mc_addr_list - write multicast addresses to MTA 3201 * @netdev: network interface device structure 3202 * 3203 * Writes multicast address list to the MTA hash table. 3204 * Returns: -ENOMEM on failure 3205 * 0 on no addresses written 3206 * X on writing X addresses to MTA 3207 **/ 3208static int igb_write_mc_addr_list(struct net_device *netdev) 3209{ 3210 struct igb_adapter *adapter = netdev_priv(netdev); 3211 struct e1000_hw *hw = &adapter->hw; 3212 struct netdev_hw_addr *ha; 3213 u8 *mta_list; 3214 int i; 3215 3216 if (netdev_mc_empty(netdev)) { 3217 /* nothing to program, so clear mc list */ 3218 igb_update_mc_addr_list(hw, NULL, 0); 3219 igb_restore_vf_multicasts(adapter); 3220 return 0; 3221 } 3222 3223 mta_list = kzalloc(netdev_mc_count(netdev) * 6, GFP_ATOMIC); 3224 if (!mta_list) 3225 return -ENOMEM; 3226 3227 /* The shared function expects a packed array of only addresses. */ 3228 i = 0; 3229 netdev_for_each_mc_addr(ha, netdev) 3230 memcpy(mta_list + (i++ * ETH_ALEN), ha->addr, ETH_ALEN); 3231 3232 igb_update_mc_addr_list(hw, mta_list, i); 3233 kfree(mta_list); 3234 3235 return netdev_mc_count(netdev); 3236} 3237 3238/** 3239 * igb_write_uc_addr_list - write unicast addresses to RAR table 3240 * @netdev: network interface device structure 3241 * 3242 * Writes unicast address list to the RAR table. 3243 * Returns: -ENOMEM on failure/insufficient address space 3244 * 0 on no addresses written 3245 * X on writing X addresses to the RAR table 3246 **/ 3247static int igb_write_uc_addr_list(struct net_device *netdev) 3248{ 3249 struct igb_adapter *adapter = netdev_priv(netdev); 3250 struct e1000_hw *hw = &adapter->hw; 3251 unsigned int vfn = adapter->vfs_allocated_count; 3252 unsigned int rar_entries = hw->mac.rar_entry_count - (vfn + 1); 3253 int count = 0; 3254 3255 /* return ENOMEM indicating insufficient memory for addresses */ 3256 if (netdev_uc_count(netdev) > rar_entries) 3257 return -ENOMEM; 3258 3259 if (!netdev_uc_empty(netdev) && rar_entries) { 3260 struct netdev_hw_addr *ha; 3261 3262 netdev_for_each_uc_addr(ha, netdev) { 3263 if (!rar_entries) 3264 break; 3265 igb_rar_set_qsel(adapter, ha->addr, 3266 rar_entries--, 3267 vfn); 3268 count++; 3269 } 3270 } 3271 /* write the addresses in reverse order to avoid write combining */ 3272 for (; rar_entries > 0 ; rar_entries--) { 3273 wr32(E1000_RAH(rar_entries), 0); 3274 wr32(E1000_RAL(rar_entries), 0); 3275 } 3276 wrfl(); 3277 3278 return count; 3279} 3280 3281/** 3282 * igb_set_rx_mode - Secondary Unicast, Multicast and Promiscuous mode set 3283 * @netdev: network interface device structure 3284 * 3285 * The set_rx_mode entry point is called whenever the unicast or multicast 3286 * address lists or the network interface flags are updated. This routine is 3287 * responsible for configuring the hardware for proper unicast, multicast, 3288 * promiscuous mode, and all-multi behavior. 3289 **/ 3290static void igb_set_rx_mode(struct net_device *netdev) 3291{ 3292 struct igb_adapter *adapter = netdev_priv(netdev); 3293 struct e1000_hw *hw = &adapter->hw; 3294 unsigned int vfn = adapter->vfs_allocated_count; 3295 u32 rctl, vmolr = 0; 3296 int count; 3297 3298 /* Check for Promiscuous and All Multicast modes */ 3299 rctl = rd32(E1000_RCTL); 3300 3301 /* clear the effected bits */ 3302 rctl &= ~(E1000_RCTL_UPE | E1000_RCTL_MPE | E1000_RCTL_VFE); 3303 3304 if (netdev->flags & IFF_PROMISC) { 3305 rctl |= (E1000_RCTL_UPE | E1000_RCTL_MPE); 3306 vmolr |= (E1000_VMOLR_ROPE | E1000_VMOLR_MPME); 3307 } else { 3308 if (netdev->flags & IFF_ALLMULTI) { 3309 rctl |= E1000_RCTL_MPE; 3310 vmolr |= E1000_VMOLR_MPME; 3311 } else { 3312 /* 3313 * Write addresses to the MTA, if the attempt fails 3314 * then we should just turn on promiscous mode so 3315 * that we can at least receive multicast traffic 3316 */ 3317 count = igb_write_mc_addr_list(netdev); 3318 if (count < 0) { 3319 rctl |= E1000_RCTL_MPE; 3320 vmolr |= E1000_VMOLR_MPME; 3321 } else if (count) { 3322 vmolr |= E1000_VMOLR_ROMPE; 3323 } 3324 } 3325 /* 3326 * Write addresses to available RAR registers, if there is not 3327 * sufficient space to store all the addresses then enable 3328 * unicast promiscous mode 3329 */ 3330 count = igb_write_uc_addr_list(netdev); 3331 if (count < 0) { 3332 rctl |= E1000_RCTL_UPE; 3333 vmolr |= E1000_VMOLR_ROPE; 3334 } 3335 rctl |= E1000_RCTL_VFE; 3336 } 3337 wr32(E1000_RCTL, rctl); 3338 3339 /* 3340 * In order to support SR-IOV and eventually VMDq it is necessary to set 3341 * the VMOLR to enable the appropriate modes. Without this workaround 3342 * we will have issues with VLAN tag stripping not being done for frames 3343 * that are only arriving because we are the default pool 3344 */ 3345 if (hw->mac.type < e1000_82576) 3346 return; 3347 3348 vmolr |= rd32(E1000_VMOLR(vfn)) & 3349 ~(E1000_VMOLR_ROPE | E1000_VMOLR_MPME | E1000_VMOLR_ROMPE); 3350 wr32(E1000_VMOLR(vfn), vmolr); 3351 igb_restore_vf_multicasts(adapter); 3352} 3353 3354/* Need to wait a few seconds after link up to get diagnostic information from 3355 * the phy */ 3356static void igb_update_phy_info(unsigned long data) 3357{ 3358 struct igb_adapter *adapter = (struct igb_adapter *) data; 3359 igb_get_phy_info(&adapter->hw); 3360} 3361 3362/** 3363 * igb_has_link - check shared code for link and determine up/down 3364 * @adapter: pointer to driver private info 3365 **/ 3366bool igb_has_link(struct igb_adapter *adapter) 3367{ 3368 struct e1000_hw *hw = &adapter->hw; 3369 bool link_active = false; 3370 s32 ret_val = 0; 3371 3372 /* get_link_status is set on LSC (link status) interrupt or 3373 * rx sequence error interrupt. get_link_status will stay 3374 * false until the e1000_check_for_link establishes link 3375 * for copper adapters ONLY 3376 */ 3377 switch (hw->phy.media_type) { 3378 case e1000_media_type_copper: 3379 if (hw->mac.get_link_status) { 3380 ret_val = hw->mac.ops.check_for_link(hw); 3381 link_active = !hw->mac.get_link_status; 3382 } else { 3383 link_active = true; 3384 } 3385 break; 3386 case e1000_media_type_internal_serdes: 3387 ret_val = hw->mac.ops.check_for_link(hw); 3388 link_active = hw->mac.serdes_has_link; 3389 break; 3390 default: 3391 case e1000_media_type_unknown: 3392 break; 3393 } 3394 3395 return link_active; 3396} 3397 3398/** 3399 * igb_watchdog - Timer Call-back 3400 * @data: pointer to adapter cast into an unsigned long 3401 **/ 3402static void igb_watchdog(unsigned long data) 3403{ 3404 struct igb_adapter *adapter = (struct igb_adapter *)data; 3405 /* Do the rest outside of interrupt context */ 3406 schedule_work(&adapter->watchdog_task); 3407} 3408 3409static void igb_watchdog_task(struct work_struct *work) 3410{ 3411 struct igb_adapter *adapter = container_of(work, 3412 struct igb_adapter, 3413 watchdog_task); 3414 struct e1000_hw *hw = &adapter->hw; 3415 struct net_device *netdev = adapter->netdev; 3416 u32 link; 3417 int i; 3418 3419 link = igb_has_link(adapter); 3420 if (link) { 3421 if (!netif_carrier_ok(netdev)) { 3422 u32 ctrl; 3423 hw->mac.ops.get_speed_and_duplex(hw, 3424 &adapter->link_speed, 3425 &adapter->link_duplex); 3426 3427 ctrl = rd32(E1000_CTRL); 3428 /* Links status message must follow this format */ 3429 printk(KERN_INFO "igb: %s NIC Link is Up %d Mbps %s, " 3430 "Flow Control: %s\n", 3431 netdev->name, 3432 adapter->link_speed, 3433 adapter->link_duplex == FULL_DUPLEX ? 3434 "Full Duplex" : "Half Duplex", 3435 ((ctrl & E1000_CTRL_TFCE) && 3436 (ctrl & E1000_CTRL_RFCE)) ? "RX/TX" : 3437 ((ctrl & E1000_CTRL_RFCE) ? "RX" : 3438 ((ctrl & E1000_CTRL_TFCE) ? "TX" : "None"))); 3439 3440 /* adjust timeout factor according to speed/duplex */ 3441 adapter->tx_timeout_factor = 1; 3442 switch (adapter->link_speed) { 3443 case SPEED_10: 3444 adapter->tx_timeout_factor = 14; 3445 break; 3446 case SPEED_100: 3447 /* maybe add some timeout factor ? */ 3448 break; 3449 } 3450 3451 netif_carrier_on(netdev); 3452 3453 igb_ping_all_vfs(adapter); 3454 3455 /* link state has changed, schedule phy info update */ 3456 if (!test_bit(__IGB_DOWN, &adapter->state)) 3457 mod_timer(&adapter->phy_info_timer, 3458 round_jiffies(jiffies + 2 * HZ)); 3459 } 3460 } else { 3461 if (netif_carrier_ok(netdev)) { 3462 adapter->link_speed = 0; 3463 adapter->link_duplex = 0; 3464 /* Links status message must follow this format */ 3465 printk(KERN_INFO "igb: %s NIC Link is Down\n", 3466 netdev->name); 3467 netif_carrier_off(netdev); 3468 3469 igb_ping_all_vfs(adapter); 3470 3471 /* link state has changed, schedule phy info update */ 3472 if (!test_bit(__IGB_DOWN, &adapter->state)) 3473 mod_timer(&adapter->phy_info_timer, 3474 round_jiffies(jiffies + 2 * HZ)); 3475 } 3476 } 3477 3478 igb_update_stats(adapter); 3479 3480 for (i = 0; i < adapter->num_tx_queues; i++) { 3481 struct igb_ring *tx_ring = adapter->tx_ring[i]; 3482 if (!netif_carrier_ok(netdev)) { 3483 /* We've lost link, so the controller stops DMA, 3484 * but we've got queued Tx work that's never going 3485 * to get done, so reset controller to flush Tx. 3486 * (Do the reset outside of interrupt context). */ 3487 if (igb_desc_unused(tx_ring) + 1 < tx_ring->count) { 3488 adapter->tx_timeout_count++; 3489 schedule_work(&adapter->reset_task); 3490 /* return immediately since reset is imminent */ 3491 return; 3492 } 3493 } 3494 3495 /* Force detection of hung controller every watchdog period */ 3496 tx_ring->detect_tx_hung = true; 3497 } 3498 3499 /* Cause software interrupt to ensure rx ring is cleaned */ 3500 if (adapter->msix_entries) { 3501 u32 eics = 0; 3502 for (i = 0; i < adapter->num_q_vectors; i++) { 3503 struct igb_q_vector *q_vector = adapter->q_vector[i]; 3504 eics |= q_vector->eims_value; 3505 } 3506 wr32(E1000_EICS, eics); 3507 } else { 3508 wr32(E1000_ICS, E1000_ICS_RXDMT0); 3509 } 3510 3511 /* Reset the timer */ 3512 if (!test_bit(__IGB_DOWN, &adapter->state)) 3513 mod_timer(&adapter->watchdog_timer, 3514 round_jiffies(jiffies + 2 * HZ)); 3515} 3516 3517enum latency_range { 3518 lowest_latency = 0, 3519 low_latency = 1, 3520 bulk_latency = 2, 3521 latency_invalid = 255 3522}; 3523 3524/** 3525 * igb_update_ring_itr - update the dynamic ITR value based on packet size 3526 * 3527 * Stores a new ITR value based on strictly on packet size. This 3528 * algorithm is less sophisticated than that used in igb_update_itr, 3529 * due to the difficulty of synchronizing statistics across multiple 3530 * receive rings. The divisors and thresholds used by this fuction 3531 * were determined based on theoretical maximum wire speed and testing 3532 * data, in order to minimize response time while increasing bulk 3533 * throughput. 3534 * This functionality is controlled by the InterruptThrottleRate module 3535 * parameter (see igb_param.c) 3536 * NOTE: This function is called only when operating in a multiqueue 3537 * receive environment. 3538 * @q_vector: pointer to q_vector 3539 **/ 3540static void igb_update_ring_itr(struct igb_q_vector *q_vector) 3541{ 3542 int new_val = q_vector->itr_val; 3543 int avg_wire_size = 0; 3544 struct igb_adapter *adapter = q_vector->adapter; 3545 3546 /* For non-gigabit speeds, just fix the interrupt rate at 4000 3547 * ints/sec - ITR timer value of 120 ticks. 3548 */ 3549 if (adapter->link_speed != SPEED_1000) { 3550 new_val = 976; 3551 goto set_itr_val; 3552 } 3553 3554 if (q_vector->rx_ring && q_vector->rx_ring->total_packets) { 3555 struct igb_ring *ring = q_vector->rx_ring; 3556 avg_wire_size = ring->total_bytes / ring->total_packets; 3557 } 3558 3559 if (q_vector->tx_ring && q_vector->tx_ring->total_packets) { 3560 struct igb_ring *ring = q_vector->tx_ring; 3561 avg_wire_size = max_t(u32, avg_wire_size, 3562 (ring->total_bytes / 3563 ring->total_packets)); 3564 } 3565 3566 /* if avg_wire_size isn't set no work was done */ 3567 if (!avg_wire_size) 3568 goto clear_counts; 3569 3570 /* Add 24 bytes to size to account for CRC, preamble, and gap */ 3571 avg_wire_size += 24; 3572 3573 /* Don't starve jumbo frames */ 3574 avg_wire_size = min(avg_wire_size, 3000); 3575 3576 /* Give a little boost to mid-size frames */ 3577 if ((avg_wire_size > 300) && (avg_wire_size < 1200)) 3578 new_val = avg_wire_size / 3; 3579 else 3580 new_val = avg_wire_size / 2; 3581 3582 /* when in itr mode 3 do not exceed 20K ints/sec */ 3583 if (adapter->rx_itr_setting == 3 && new_val < 196) 3584 new_val = 196; 3585 3586set_itr_val: 3587 if (new_val != q_vector->itr_val) { 3588 q_vector->itr_val = new_val; 3589 q_vector->set_itr = 1; 3590 } 3591clear_counts: 3592 if (q_vector->rx_ring) { 3593 q_vector->rx_ring->total_bytes = 0; 3594 q_vector->rx_ring->total_packets = 0; 3595 } 3596 if (q_vector->tx_ring) { 3597 q_vector->tx_ring->total_bytes = 0; 3598 q_vector->tx_ring->total_packets = 0; 3599 } 3600} 3601 3602/** 3603 * igb_update_itr - update the dynamic ITR value based on statistics 3604 * Stores a new ITR value based on packets and byte 3605 * counts during the last interrupt. The advantage of per interrupt 3606 * computation is faster updates and more accurate ITR for the current 3607 * traffic pattern. Constants in this function were computed 3608 * based on theoretical maximum wire speed and thresholds were set based 3609 * on testing data as well as attempting to minimize response time 3610 * while increasing bulk throughput. 3611 * this functionality is controlled by the InterruptThrottleRate module 3612 * parameter (see igb_param.c) 3613 * NOTE: These calculations are only valid when operating in a single- 3614 * queue environment. 3615 * @adapter: pointer to adapter 3616 * @itr_setting: current q_vector->itr_val 3617 * @packets: the number of packets during this measurement interval 3618 * @bytes: the number of bytes during this measurement interval 3619 **/ 3620static unsigned int igb_update_itr(struct igb_adapter *adapter, u16 itr_setting, 3621 int packets, int bytes) 3622{ 3623 unsigned int retval = itr_setting; 3624 3625 if (packets == 0) 3626 goto update_itr_done; 3627 3628 switch (itr_setting) { 3629 case lowest_latency: 3630 /* handle TSO and jumbo frames */ 3631 if (bytes/packets > 8000) 3632 retval = bulk_latency; 3633 else if ((packets < 5) && (bytes > 512)) 3634 retval = low_latency; 3635 break; 3636 case low_latency: /* 50 usec aka 20000 ints/s */ 3637 if (bytes > 10000) { 3638 /* this if handles the TSO accounting */ 3639 if (bytes/packets > 8000) { 3640 retval = bulk_latency; 3641 } else if ((packets < 10) || ((bytes/packets) > 1200)) { 3642 retval = bulk_latency; 3643 } else if ((packets > 35)) { 3644 retval = lowest_latency; 3645 } 3646 } else if (bytes/packets > 2000) { 3647 retval = bulk_latency; 3648 } else if (packets <= 2 && bytes < 512) { 3649 retval = lowest_latency; 3650 } 3651 break; 3652 case bulk_latency: /* 250 usec aka 4000 ints/s */ 3653 if (bytes > 25000) { 3654 if (packets > 35) 3655 retval = low_latency; 3656 } else if (bytes < 1500) { 3657 retval = low_latency; 3658 } 3659 break; 3660 } 3661 3662update_itr_done: 3663 return retval; 3664} 3665 3666static void igb_set_itr(struct igb_adapter *adapter) 3667{ 3668 struct igb_q_vector *q_vector = adapter->q_vector[0]; 3669 u16 current_itr; 3670 u32 new_itr = q_vector->itr_val; 3671 3672 /* for non-gigabit speeds, just fix the interrupt rate at 4000 */ 3673 if (adapter->link_speed != SPEED_1000) { 3674 current_itr = 0; 3675 new_itr = 4000; 3676 goto set_itr_now; 3677 } 3678 3679 adapter->rx_itr = igb_update_itr(adapter, 3680 adapter->rx_itr, 3681 q_vector->rx_ring->total_packets, 3682 q_vector->rx_ring->total_bytes); 3683 3684 adapter->tx_itr = igb_update_itr(adapter, 3685 adapter->tx_itr, 3686 q_vector->tx_ring->total_packets, 3687 q_vector->tx_ring->total_bytes); 3688 current_itr = max(adapter->rx_itr, adapter->tx_itr); 3689 3690 /* conservative mode (itr 3) eliminates the lowest_latency setting */ 3691 if (adapter->rx_itr_setting == 3 && current_itr == lowest_latency) 3692 current_itr = low_latency; 3693 3694 switch (current_itr) { 3695 /* counts and packets in update_itr are dependent on these numbers */ 3696 case lowest_latency: 3697 new_itr = 56; /* aka 70,000 ints/sec */ 3698 break; 3699 case low_latency: 3700 new_itr = 196; /* aka 20,000 ints/sec */ 3701 break; 3702 case bulk_latency: 3703 new_itr = 980; /* aka 4,000 ints/sec */ 3704 break; 3705 default: 3706 break; 3707 } 3708 3709set_itr_now: 3710 q_vector->rx_ring->total_bytes = 0; 3711 q_vector->rx_ring->total_packets = 0; 3712 q_vector->tx_ring->total_bytes = 0; 3713 q_vector->tx_ring->total_packets = 0; 3714 3715 if (new_itr != q_vector->itr_val) { 3716 /* this attempts to bias the interrupt rate towards Bulk 3717 * by adding intermediate steps when interrupt rate is 3718 * increasing */ 3719 new_itr = new_itr > q_vector->itr_val ? 3720 max((new_itr * q_vector->itr_val) / 3721 (new_itr + (q_vector->itr_val >> 2)), 3722 new_itr) : 3723 new_itr; 3724 /* Don't write the value here; it resets the adapter's 3725 * internal timer, and causes us to delay far longer than 3726 * we should between interrupts. Instead, we write the ITR 3727 * value at the beginning of the next interrupt so the timing 3728 * ends up being correct. 3729 */ 3730 q_vector->itr_val = new_itr; 3731 q_vector->set_itr = 1; 3732 } 3733} 3734 3735#define IGB_TX_FLAGS_CSUM 0x00000001 3736#define IGB_TX_FLAGS_VLAN 0x00000002 3737#define IGB_TX_FLAGS_TSO 0x00000004 3738#define IGB_TX_FLAGS_IPV4 0x00000008 3739#define IGB_TX_FLAGS_TSTAMP 0x00000010 3740#define IGB_TX_FLAGS_VLAN_MASK 0xffff0000 3741#define IGB_TX_FLAGS_VLAN_SHIFT 16 3742 3743static inline int igb_tso_adv(struct igb_ring *tx_ring, 3744 struct sk_buff *skb, u32 tx_flags, u8 *hdr_len) 3745{ 3746 struct e1000_adv_tx_context_desc *context_desc; 3747 unsigned int i; 3748 int err; 3749 struct igb_buffer *buffer_info; 3750 u32 info = 0, tu_cmd = 0; 3751 u32 mss_l4len_idx; 3752 u8 l4len; 3753 3754 if (skb_header_cloned(skb)) { 3755 err = pskb_expand_head(skb, 0, 0, GFP_ATOMIC); 3756 if (err) 3757 return err; 3758 } 3759 3760 l4len = tcp_hdrlen(skb); 3761 *hdr_len += l4len; 3762 3763 if (skb->protocol == htons(ETH_P_IP)) { 3764 struct iphdr *iph = ip_hdr(skb); 3765 iph->tot_len = 0; 3766 iph->check = 0; 3767 tcp_hdr(skb)->check = ~csum_tcpudp_magic(iph->saddr, 3768 iph->daddr, 0, 3769 IPPROTO_TCP, 3770 0); 3771 } else if (skb_is_gso_v6(skb)) { 3772 ipv6_hdr(skb)->payload_len = 0; 3773 tcp_hdr(skb)->check = ~csum_ipv6_magic(&ipv6_hdr(skb)->saddr, 3774 &ipv6_hdr(skb)->daddr, 3775 0, IPPROTO_TCP, 0); 3776 } 3777 3778 i = tx_ring->next_to_use; 3779 3780 buffer_info = &tx_ring->buffer_info[i]; 3781 context_desc = E1000_TX_CTXTDESC_ADV(*tx_ring, i); 3782 /* VLAN MACLEN IPLEN */ 3783 if (tx_flags & IGB_TX_FLAGS_VLAN) 3784 info |= (tx_flags & IGB_TX_FLAGS_VLAN_MASK); 3785 info |= (skb_network_offset(skb) << E1000_ADVTXD_MACLEN_SHIFT); 3786 *hdr_len += skb_network_offset(skb); 3787 info |= skb_network_header_len(skb); 3788 *hdr_len += skb_network_header_len(skb); 3789 context_desc->vlan_macip_lens = cpu_to_le32(info); 3790 3791 /* ADV DTYP TUCMD MKRLOC/ISCSIHEDLEN */ 3792 tu_cmd |= (E1000_TXD_CMD_DEXT | E1000_ADVTXD_DTYP_CTXT); 3793 3794 if (skb->protocol == htons(ETH_P_IP)) 3795 tu_cmd |= E1000_ADVTXD_TUCMD_IPV4; 3796 tu_cmd |= E1000_ADVTXD_TUCMD_L4T_TCP; 3797 3798 context_desc->type_tucmd_mlhl = cpu_to_le32(tu_cmd); 3799 3800 /* MSS L4LEN IDX */ 3801 mss_l4len_idx = (skb_shinfo(skb)->gso_size << E1000_ADVTXD_MSS_SHIFT); 3802 mss_l4len_idx |= (l4len << E1000_ADVTXD_L4LEN_SHIFT); 3803 3804 /* For 82575, context index must be unique per ring. */ 3805 if (tx_ring->flags & IGB_RING_FLAG_TX_CTX_IDX) 3806 mss_l4len_idx |= tx_ring->reg_idx << 4; 3807 3808 context_desc->mss_l4len_idx = cpu_to_le32(mss_l4len_idx); 3809 context_desc->seqnum_seed = 0; 3810 3811 buffer_info->time_stamp = jiffies; 3812 buffer_info->next_to_watch = i; 3813 buffer_info->dma = 0; 3814 i++; 3815 if (i == tx_ring->count) 3816 i = 0; 3817 3818 tx_ring->next_to_use = i; 3819 3820 return true; 3821} 3822 3823static inline bool igb_tx_csum_adv(struct igb_ring *tx_ring, 3824 struct sk_buff *skb, u32 tx_flags) 3825{ 3826 struct e1000_adv_tx_context_desc *context_desc; 3827 struct device *dev = tx_ring->dev; 3828 struct igb_buffer *buffer_info; 3829 u32 info = 0, tu_cmd = 0; 3830 unsigned int i; 3831 3832 if ((skb->ip_summed == CHECKSUM_PARTIAL) || 3833 (tx_flags & IGB_TX_FLAGS_VLAN)) { 3834 i = tx_ring->next_to_use; 3835 buffer_info = &tx_ring->buffer_info[i]; 3836 context_desc = E1000_TX_CTXTDESC_ADV(*tx_ring, i); 3837 3838 if (tx_flags & IGB_TX_FLAGS_VLAN) 3839 info |= (tx_flags & IGB_TX_FLAGS_VLAN_MASK); 3840 3841 info |= (skb_network_offset(skb) << E1000_ADVTXD_MACLEN_SHIFT); 3842 if (skb->ip_summed == CHECKSUM_PARTIAL) 3843 info |= skb_network_header_len(skb); 3844 3845 context_desc->vlan_macip_lens = cpu_to_le32(info); 3846 3847 tu_cmd |= (E1000_TXD_CMD_DEXT | E1000_ADVTXD_DTYP_CTXT); 3848 3849 if (skb->ip_summed == CHECKSUM_PARTIAL) { 3850 __be16 protocol; 3851 3852 if (skb->protocol == cpu_to_be16(ETH_P_8021Q)) { 3853 const struct vlan_ethhdr *vhdr = 3854 (const struct vlan_ethhdr*)skb->data; 3855 3856 protocol = vhdr->h_vlan_encapsulated_proto; 3857 } else { 3858 protocol = skb->protocol; 3859 } 3860 3861 switch (protocol) { 3862 case cpu_to_be16(ETH_P_IP): 3863 tu_cmd |= E1000_ADVTXD_TUCMD_IPV4; 3864 if (ip_hdr(skb)->protocol == IPPROTO_TCP) 3865 tu_cmd |= E1000_ADVTXD_TUCMD_L4T_TCP; 3866 else if (ip_hdr(skb)->protocol == IPPROTO_SCTP) 3867 tu_cmd |= E1000_ADVTXD_TUCMD_L4T_SCTP; 3868 break; 3869 case cpu_to_be16(ETH_P_IPV6): 3870 /* XXX what about other V6 headers?? */ 3871 if (ipv6_hdr(skb)->nexthdr == IPPROTO_TCP) 3872 tu_cmd |= E1000_ADVTXD_TUCMD_L4T_TCP; 3873 else if (ipv6_hdr(skb)->nexthdr == IPPROTO_SCTP) 3874 tu_cmd |= E1000_ADVTXD_TUCMD_L4T_SCTP; 3875 break; 3876 default: 3877 if (unlikely(net_ratelimit())) 3878 dev_warn(dev, 3879 "partial checksum but proto=%x!\n", 3880 skb->protocol); 3881 break; 3882 } 3883 } 3884 3885 context_desc->type_tucmd_mlhl = cpu_to_le32(tu_cmd); 3886 context_desc->seqnum_seed = 0; 3887 if (tx_ring->flags & IGB_RING_FLAG_TX_CTX_IDX) 3888 context_desc->mss_l4len_idx = 3889 cpu_to_le32(tx_ring->reg_idx << 4); 3890 3891 buffer_info->time_stamp = jiffies; 3892 buffer_info->next_to_watch = i; 3893 buffer_info->dma = 0; 3894 3895 i++; 3896 if (i == tx_ring->count) 3897 i = 0; 3898 tx_ring->next_to_use = i; 3899 3900 return true; 3901 } 3902 return false; 3903} 3904 3905#define IGB_MAX_TXD_PWR 16 3906#define IGB_MAX_DATA_PER_TXD (1<<IGB_MAX_TXD_PWR) 3907 3908static inline int igb_tx_map_adv(struct igb_ring *tx_ring, struct sk_buff *skb, 3909 unsigned int first) 3910{ 3911 struct igb_buffer *buffer_info; 3912 struct device *dev = tx_ring->dev; 3913 unsigned int hlen = skb_headlen(skb); 3914 unsigned int count = 0, i; 3915 unsigned int f; 3916 u16 gso_segs = skb_shinfo(skb)->gso_segs ?: 1; 3917 3918 i = tx_ring->next_to_use; 3919 3920 buffer_info = &tx_ring->buffer_info[i]; 3921 BUG_ON(hlen >= IGB_MAX_DATA_PER_TXD); 3922 buffer_info->length = hlen; 3923 /* set time_stamp *before* dma to help avoid a possible race */ 3924 buffer_info->time_stamp = jiffies; 3925 buffer_info->next_to_watch = i; 3926 buffer_info->dma = dma_map_single(dev, skb->data, hlen, 3927 DMA_TO_DEVICE); 3928 if (dma_mapping_error(dev, buffer_info->dma)) 3929 goto dma_error; 3930 3931 for (f = 0; f < skb_shinfo(skb)->nr_frags; f++) { 3932 struct skb_frag_struct *frag = &skb_shinfo(skb)->frags[f]; 3933 unsigned int len = frag->size; 3934 3935 count++; 3936 i++; 3937 if (i == tx_ring->count) 3938 i = 0; 3939 3940 buffer_info = &tx_ring->buffer_info[i]; 3941 BUG_ON(len >= IGB_MAX_DATA_PER_TXD); 3942 buffer_info->length = len; 3943 buffer_info->time_stamp = jiffies; 3944 buffer_info->next_to_watch = i; 3945 buffer_info->mapped_as_page = true; 3946 buffer_info->dma = dma_map_page(dev, 3947 frag->page, 3948 frag->page_offset, 3949 len, 3950 DMA_TO_DEVICE); 3951 if (dma_mapping_error(dev, buffer_info->dma)) 3952 goto dma_error; 3953 3954 } 3955 3956 tx_ring->buffer_info[i].skb = skb; 3957 tx_ring->buffer_info[i].shtx = skb_shinfo(skb)->tx_flags; 3958 /* multiply data chunks by size of headers */ 3959 tx_ring->buffer_info[i].bytecount = ((gso_segs - 1) * hlen) + skb->len; 3960 tx_ring->buffer_info[i].gso_segs = gso_segs; 3961 tx_ring->buffer_info[first].next_to_watch = i; 3962 3963 return ++count; 3964 3965dma_error: 3966 dev_err(dev, "TX DMA map failed\n"); 3967 3968 /* clear timestamp and dma mappings for failed buffer_info mapping */ 3969 buffer_info->dma = 0; 3970 buffer_info->time_stamp = 0; 3971 buffer_info->length = 0; 3972 buffer_info->next_to_watch = 0; 3973 buffer_info->mapped_as_page = false; 3974 3975 /* clear timestamp and dma mappings for remaining portion of packet */ 3976 while (count--) { 3977 if (i == 0) 3978 i = tx_ring->count; 3979 i--; 3980 buffer_info = &tx_ring->buffer_info[i]; 3981 igb_unmap_and_free_tx_resource(tx_ring, buffer_info); 3982 } 3983 3984 return 0; 3985} 3986 3987static inline void igb_tx_queue_adv(struct igb_ring *tx_ring, 3988 u32 tx_flags, int count, u32 paylen, 3989 u8 hdr_len) 3990{ 3991 union e1000_adv_tx_desc *tx_desc; 3992 struct igb_buffer *buffer_info; 3993 u32 olinfo_status = 0, cmd_type_len; 3994 unsigned int i = tx_ring->next_to_use; 3995 3996 cmd_type_len = (E1000_ADVTXD_DTYP_DATA | E1000_ADVTXD_DCMD_IFCS | 3997 E1000_ADVTXD_DCMD_DEXT); 3998 3999 if (tx_flags & IGB_TX_FLAGS_VLAN) 4000 cmd_type_len |= E1000_ADVTXD_DCMD_VLE; 4001 4002 if (tx_flags & IGB_TX_FLAGS_TSTAMP) 4003 cmd_type_len |= E1000_ADVTXD_MAC_TSTAMP; 4004 4005 if (tx_flags & IGB_TX_FLAGS_TSO) { 4006 cmd_type_len |= E1000_ADVTXD_DCMD_TSE; 4007 4008 /* insert tcp checksum */ 4009 olinfo_status |= E1000_TXD_POPTS_TXSM << 8; 4010 4011 /* insert ip checksum */ 4012 if (tx_flags & IGB_TX_FLAGS_IPV4) 4013 olinfo_status |= E1000_TXD_POPTS_IXSM << 8; 4014 4015 } else if (tx_flags & IGB_TX_FLAGS_CSUM) { 4016 olinfo_status |= E1000_TXD_POPTS_TXSM << 8; 4017 } 4018 4019 if ((tx_ring->flags & IGB_RING_FLAG_TX_CTX_IDX) && 4020 (tx_flags & (IGB_TX_FLAGS_CSUM | 4021 IGB_TX_FLAGS_TSO | 4022 IGB_TX_FLAGS_VLAN))) 4023 olinfo_status |= tx_ring->reg_idx << 4; 4024 4025 olinfo_status |= ((paylen - hdr_len) << E1000_ADVTXD_PAYLEN_SHIFT); 4026 4027 do { 4028 buffer_info = &tx_ring->buffer_info[i]; 4029 tx_desc = E1000_TX_DESC_ADV(*tx_ring, i); 4030 tx_desc->read.buffer_addr = cpu_to_le64(buffer_info->dma); 4031 tx_desc->read.cmd_type_len = 4032 cpu_to_le32(cmd_type_len | buffer_info->length); 4033 tx_desc->read.olinfo_status = cpu_to_le32(olinfo_status); 4034 count--; 4035 i++; 4036 if (i == tx_ring->count) 4037 i = 0; 4038 } while (count > 0); 4039 4040 tx_desc->read.cmd_type_len |= cpu_to_le32(IGB_ADVTXD_DCMD); 4041 /* Force memory writes to complete before letting h/w 4042 * know there are new descriptors to fetch. (Only 4043 * applicable for weak-ordered memory model archs, 4044 * such as IA-64). */ 4045 wmb(); 4046 4047 tx_ring->next_to_use = i; 4048 writel(i, tx_ring->tail); 4049 /* we need this if more than one processor can write to our tail 4050 * at a time, it syncronizes IO on IA64/Altix systems */ 4051 mmiowb(); 4052} 4053 4054static int __igb_maybe_stop_tx(struct igb_ring *tx_ring, int size) 4055{ 4056 struct net_device *netdev = tx_ring->netdev; 4057 4058 netif_stop_subqueue(netdev, tx_ring->queue_index); 4059 4060 /* Herbert's original patch had: 4061 * smp_mb__after_netif_stop_queue(); 4062 * but since that doesn't exist yet, just open code it. */ 4063 smp_mb(); 4064 4065 /* We need to check again in a case another CPU has just 4066 * made room available. */ 4067 if (igb_desc_unused(tx_ring) < size) 4068 return -EBUSY; 4069 4070 /* A reprieve! */ 4071 netif_wake_subqueue(netdev, tx_ring->queue_index); 4072 tx_ring->tx_stats.restart_queue++; 4073 return 0; 4074} 4075 4076static inline int igb_maybe_stop_tx(struct igb_ring *tx_ring, int size) 4077{ 4078 if (igb_desc_unused(tx_ring) >= size) 4079 return 0; 4080 return __igb_maybe_stop_tx(tx_ring, size); 4081} 4082 4083netdev_tx_t igb_xmit_frame_ring_adv(struct sk_buff *skb, 4084 struct igb_ring *tx_ring) 4085{ 4086 struct igb_adapter *adapter = netdev_priv(tx_ring->netdev); 4087 int tso = 0, count; 4088 u32 tx_flags = 0; 4089 u16 first; 4090 u8 hdr_len = 0; 4091 union skb_shared_tx *shtx = skb_tx(skb); 4092 4093 /* need: 1 descriptor per page, 4094 * + 2 desc gap to keep tail from touching head, 4095 * + 1 desc for skb->data, 4096 * + 1 desc for context descriptor, 4097 * otherwise try next time */ 4098 if (igb_maybe_stop_tx(tx_ring, skb_shinfo(skb)->nr_frags + 4)) { 4099 /* this is a hard error */ 4100 return NETDEV_TX_BUSY; 4101 } 4102 4103 if (unlikely(shtx->hardware)) { 4104 shtx->in_progress = 1; 4105 tx_flags |= IGB_TX_FLAGS_TSTAMP; 4106 } 4107 4108 if (vlan_tx_tag_present(skb) && adapter->vlgrp) { 4109 tx_flags |= IGB_TX_FLAGS_VLAN; 4110 tx_flags |= (vlan_tx_tag_get(skb) << IGB_TX_FLAGS_VLAN_SHIFT); 4111 } 4112 4113 if (skb->protocol == htons(ETH_P_IP)) 4114 tx_flags |= IGB_TX_FLAGS_IPV4; 4115 4116 first = tx_ring->next_to_use; 4117 if (skb_is_gso(skb)) { 4118 tso = igb_tso_adv(tx_ring, skb, tx_flags, &hdr_len); 4119 4120 if (tso < 0) { 4121 dev_kfree_skb_any(skb); 4122 return NETDEV_TX_OK; 4123 } 4124 } 4125 4126 if (tso) 4127 tx_flags |= IGB_TX_FLAGS_TSO; 4128 else if (igb_tx_csum_adv(tx_ring, skb, tx_flags) && 4129 (skb->ip_summed == CHECKSUM_PARTIAL)) 4130 tx_flags |= IGB_TX_FLAGS_CSUM; 4131 4132 /* 4133 * count reflects descriptors mapped, if 0 or less then mapping error 4134 * has occured and we need to rewind the descriptor queue 4135 */ 4136 count = igb_tx_map_adv(tx_ring, skb, first); 4137 if (!count) { 4138 dev_kfree_skb_any(skb); 4139 tx_ring->buffer_info[first].time_stamp = 0; 4140 tx_ring->next_to_use = first; 4141 return NETDEV_TX_OK; 4142 } 4143 4144 igb_tx_queue_adv(tx_ring, tx_flags, count, skb->len, hdr_len); 4145 4146 /* Make sure there is space in the ring for the next send. */ 4147 igb_maybe_stop_tx(tx_ring, MAX_SKB_FRAGS + 4); 4148 4149 return NETDEV_TX_OK; 4150} 4151 4152static netdev_tx_t igb_xmit_frame_adv(struct sk_buff *skb, 4153 struct net_device *netdev) 4154{ 4155 struct igb_adapter *adapter = netdev_priv(netdev); 4156 struct igb_ring *tx_ring; 4157 int r_idx = 0; 4158 4159 if (test_bit(__IGB_DOWN, &adapter->state)) { 4160 dev_kfree_skb_any(skb); 4161 return NETDEV_TX_OK; 4162 } 4163 4164 if (skb->len <= 0) { 4165 dev_kfree_skb_any(skb); 4166 return NETDEV_TX_OK; 4167 } 4168 4169 r_idx = skb->queue_mapping & (IGB_ABS_MAX_TX_QUEUES - 1); 4170 tx_ring = adapter->multi_tx_table[r_idx]; 4171 4172 /* This goes back to the question of how to logically map a tx queue 4173 * to a flow. Right now, performance is impacted slightly negatively 4174 * if using multiple tx queues. If the stack breaks away from a 4175 * single qdisc implementation, we can look at this again. */ 4176 return igb_xmit_frame_ring_adv(skb, tx_ring); 4177} 4178 4179/** 4180 * igb_tx_timeout - Respond to a Tx Hang 4181 * @netdev: network interface device structure 4182 **/ 4183static void igb_tx_timeout(struct net_device *netdev) 4184{ 4185 struct igb_adapter *adapter = netdev_priv(netdev); 4186 struct e1000_hw *hw = &adapter->hw; 4187 4188 /* Do the reset outside of interrupt context */ 4189 adapter->tx_timeout_count++; 4190 4191 if (hw->mac.type == e1000_82580) 4192 hw->dev_spec._82575.global_device_reset = true; 4193 4194 schedule_work(&adapter->reset_task); 4195 wr32(E1000_EICS, 4196 (adapter->eims_enable_mask & ~adapter->eims_other)); 4197} 4198 4199static void igb_reset_task(struct work_struct *work) 4200{ 4201 struct igb_adapter *adapter; 4202 adapter = container_of(work, struct igb_adapter, reset_task); 4203 4204 igb_dump(adapter); 4205 netdev_err(adapter->netdev, "Reset adapter\n"); 4206 igb_reinit_locked(adapter); 4207} 4208 4209/** 4210 * igb_get_stats - Get System Network Statistics 4211 * @netdev: network interface device structure 4212 * 4213 * Returns the address of the device statistics structure. 4214 * The statistics are actually updated from the timer callback. 4215 **/ 4216static struct net_device_stats *igb_get_stats(struct net_device *netdev) 4217{ 4218 /* only return the current stats */ 4219 return &netdev->stats; 4220} 4221 4222/** 4223 * igb_change_mtu - Change the Maximum Transfer Unit 4224 * @netdev: network interface device structure 4225 * @new_mtu: new value for maximum frame size 4226 * 4227 * Returns 0 on success, negative on failure 4228 **/ 4229static int igb_change_mtu(struct net_device *netdev, int new_mtu) 4230{ 4231 struct igb_adapter *adapter = netdev_priv(netdev); 4232 struct pci_dev *pdev = adapter->pdev; 4233 int max_frame = new_mtu + ETH_HLEN + ETH_FCS_LEN; 4234 u32 rx_buffer_len, i; 4235 4236 if ((new_mtu < 68) || (max_frame > MAX_JUMBO_FRAME_SIZE)) { 4237 dev_err(&pdev->dev, "Invalid MTU setting\n"); 4238 return -EINVAL; 4239 } 4240 4241 if (max_frame > MAX_STD_JUMBO_FRAME_SIZE) { 4242 dev_err(&pdev->dev, "MTU > 9216 not supported.\n"); 4243 return -EINVAL; 4244 } 4245 4246 while (test_and_set_bit(__IGB_RESETTING, &adapter->state)) 4247 msleep(1); 4248 4249 /* igb_down has a dependency on max_frame_size */ 4250 adapter->max_frame_size = max_frame; 4251 4252 /* NOTE: netdev_alloc_skb reserves 16 bytes, and typically NET_IP_ALIGN 4253 * means we reserve 2 more, this pushes us to allocate from the next 4254 * larger slab size. 4255 * i.e. RXBUFFER_2048 --> size-4096 slab 4256 */ 4257 4258 if (adapter->hw.mac.type == e1000_82580) 4259 max_frame += IGB_TS_HDR_LEN; 4260 4261 if (max_frame <= IGB_RXBUFFER_1024) 4262 rx_buffer_len = IGB_RXBUFFER_1024; 4263 else if (max_frame <= MAXIMUM_ETHERNET_VLAN_SIZE) 4264 rx_buffer_len = MAXIMUM_ETHERNET_VLAN_SIZE; 4265 else 4266 rx_buffer_len = IGB_RXBUFFER_128; 4267 4268 if ((max_frame == ETH_FRAME_LEN + ETH_FCS_LEN + IGB_TS_HDR_LEN) || 4269 (max_frame == MAXIMUM_ETHERNET_VLAN_SIZE + IGB_TS_HDR_LEN)) 4270 rx_buffer_len = MAXIMUM_ETHERNET_VLAN_SIZE + IGB_TS_HDR_LEN; 4271 4272 if ((adapter->hw.mac.type == e1000_82580) && 4273 (rx_buffer_len == IGB_RXBUFFER_128)) 4274 rx_buffer_len += IGB_RXBUFFER_64; 4275 4276 if (netif_running(netdev)) 4277 igb_down(adapter); 4278 4279 dev_info(&pdev->dev, "changing MTU from %d to %d\n", 4280 netdev->mtu, new_mtu); 4281 netdev->mtu = new_mtu; 4282 4283 for (i = 0; i < adapter->num_rx_queues; i++) 4284 adapter->rx_ring[i]->rx_buffer_len = rx_buffer_len; 4285 4286 if (netif_running(netdev)) 4287 igb_up(adapter); 4288 else 4289 igb_reset(adapter); 4290 4291 clear_bit(__IGB_RESETTING, &adapter->state); 4292 4293 return 0; 4294} 4295 4296/** 4297 * igb_update_stats - Update the board statistics counters 4298 * @adapter: board private structure 4299 **/ 4300 4301void igb_update_stats(struct igb_adapter *adapter) 4302{ 4303 struct net_device_stats *net_stats = igb_get_stats(adapter->netdev); 4304 struct e1000_hw *hw = &adapter->hw; 4305 struct pci_dev *pdev = adapter->pdev; 4306 u32 reg, mpc; 4307 u16 phy_tmp; 4308 int i; 4309 u64 bytes, packets; 4310 4311#define PHY_IDLE_ERROR_COUNT_MASK 0x00FF 4312 4313 /* 4314 * Prevent stats update while adapter is being reset, or if the pci 4315 * connection is down. 4316 */ 4317 if (adapter->link_speed == 0) 4318 return; 4319 if (pci_channel_offline(pdev)) 4320 return; 4321 4322 bytes = 0; 4323 packets = 0; 4324 for (i = 0; i < adapter->num_rx_queues; i++) { 4325 u32 rqdpc_tmp = rd32(E1000_RQDPC(i)) & 0x0FFF; 4326 struct igb_ring *ring = adapter->rx_ring[i]; 4327 ring->rx_stats.drops += rqdpc_tmp; 4328 net_stats->rx_fifo_errors += rqdpc_tmp; 4329 bytes += ring->rx_stats.bytes; 4330 packets += ring->rx_stats.packets; 4331 } 4332 4333 net_stats->rx_bytes = bytes; 4334 net_stats->rx_packets = packets; 4335 4336 bytes = 0; 4337 packets = 0; 4338 for (i = 0; i < adapter->num_tx_queues; i++) { 4339 struct igb_ring *ring = adapter->tx_ring[i]; 4340 bytes += ring->tx_stats.bytes; 4341 packets += ring->tx_stats.packets; 4342 } 4343 net_stats->tx_bytes = bytes; 4344 net_stats->tx_packets = packets; 4345 4346 /* read stats registers */ 4347 adapter->stats.crcerrs += rd32(E1000_CRCERRS); 4348 adapter->stats.gprc += rd32(E1000_GPRC); 4349 adapter->stats.gorc += rd32(E1000_GORCL); 4350 rd32(E1000_GORCH); /* clear GORCL */ 4351 adapter->stats.bprc += rd32(E1000_BPRC); 4352 adapter->stats.mprc += rd32(E1000_MPRC); 4353 adapter->stats.roc += rd32(E1000_ROC); 4354 4355 adapter->stats.prc64 += rd32(E1000_PRC64); 4356 adapter->stats.prc127 += rd32(E1000_PRC127); 4357 adapter->stats.prc255 += rd32(E1000_PRC255); 4358 adapter->stats.prc511 += rd32(E1000_PRC511); 4359 adapter->stats.prc1023 += rd32(E1000_PRC1023); 4360 adapter->stats.prc1522 += rd32(E1000_PRC1522); 4361 adapter->stats.symerrs += rd32(E1000_SYMERRS); 4362 adapter->stats.sec += rd32(E1000_SEC); 4363 4364 mpc = rd32(E1000_MPC); 4365 adapter->stats.mpc += mpc; 4366 net_stats->rx_fifo_errors += mpc; 4367 adapter->stats.scc += rd32(E1000_SCC); 4368 adapter->stats.ecol += rd32(E1000_ECOL); 4369 adapter->stats.mcc += rd32(E1000_MCC); 4370 adapter->stats.latecol += rd32(E1000_LATECOL); 4371 adapter->stats.dc += rd32(E1000_DC); 4372 adapter->stats.rlec += rd32(E1000_RLEC); 4373 adapter->stats.xonrxc += rd32(E1000_XONRXC); 4374 adapter->stats.xontxc += rd32(E1000_XONTXC); 4375 adapter->stats.xoffrxc += rd32(E1000_XOFFRXC); 4376 adapter->stats.xofftxc += rd32(E1000_XOFFTXC); 4377 adapter->stats.fcruc += rd32(E1000_FCRUC); 4378 adapter->stats.gptc += rd32(E1000_GPTC); 4379 adapter->stats.gotc += rd32(E1000_GOTCL); 4380 rd32(E1000_GOTCH); /* clear GOTCL */ 4381 adapter->stats.rnbc += rd32(E1000_RNBC); 4382 adapter->stats.ruc += rd32(E1000_RUC); 4383 adapter->stats.rfc += rd32(E1000_RFC); 4384 adapter->stats.rjc += rd32(E1000_RJC); 4385 adapter->stats.tor += rd32(E1000_TORH); 4386 adapter->stats.tot += rd32(E1000_TOTH); 4387 adapter->stats.tpr += rd32(E1000_TPR); 4388 4389 adapter->stats.ptc64 += rd32(E1000_PTC64); 4390 adapter->stats.ptc127 += rd32(E1000_PTC127); 4391 adapter->stats.ptc255 += rd32(E1000_PTC255); 4392 adapter->stats.ptc511 += rd32(E1000_PTC511); 4393 adapter->stats.ptc1023 += rd32(E1000_PTC1023); 4394 adapter->stats.ptc1522 += rd32(E1000_PTC1522); 4395 4396 adapter->stats.mptc += rd32(E1000_MPTC); 4397 adapter->stats.bptc += rd32(E1000_BPTC); 4398 4399 adapter->stats.tpt += rd32(E1000_TPT); 4400 adapter->stats.colc += rd32(E1000_COLC); 4401 4402 adapter->stats.algnerrc += rd32(E1000_ALGNERRC); 4403 /* read internal phy specific stats */ 4404 reg = rd32(E1000_CTRL_EXT); 4405 if (!(reg & E1000_CTRL_EXT_LINK_MODE_MASK)) { 4406 adapter->stats.rxerrc += rd32(E1000_RXERRC); 4407 adapter->stats.tncrs += rd32(E1000_TNCRS); 4408 } 4409 4410 adapter->stats.tsctc += rd32(E1000_TSCTC); 4411 adapter->stats.tsctfc += rd32(E1000_TSCTFC); 4412 4413 adapter->stats.iac += rd32(E1000_IAC); 4414 adapter->stats.icrxoc += rd32(E1000_ICRXOC); 4415 adapter->stats.icrxptc += rd32(E1000_ICRXPTC); 4416 adapter->stats.icrxatc += rd32(E1000_ICRXATC); 4417 adapter->stats.ictxptc += rd32(E1000_ICTXPTC); 4418 adapter->stats.ictxatc += rd32(E1000_ICTXATC); 4419 adapter->stats.ictxqec += rd32(E1000_ICTXQEC); 4420 adapter->stats.ictxqmtc += rd32(E1000_ICTXQMTC); 4421 adapter->stats.icrxdmtc += rd32(E1000_ICRXDMTC); 4422 4423 /* Fill out the OS statistics structure */ 4424 net_stats->multicast = adapter->stats.mprc; 4425 net_stats->collisions = adapter->stats.colc; 4426 4427 /* Rx Errors */ 4428 4429 /* RLEC on some newer hardware can be incorrect so build 4430 * our own version based on RUC and ROC */ 4431 net_stats->rx_errors = adapter->stats.rxerrc + 4432 adapter->stats.crcerrs + adapter->stats.algnerrc + 4433 adapter->stats.ruc + adapter->stats.roc + 4434 adapter->stats.cexterr; 4435 net_stats->rx_length_errors = adapter->stats.ruc + 4436 adapter->stats.roc; 4437 net_stats->rx_crc_errors = adapter->stats.crcerrs; 4438 net_stats->rx_frame_errors = adapter->stats.algnerrc; 4439 net_stats->rx_missed_errors = adapter->stats.mpc; 4440 4441 /* Tx Errors */ 4442 net_stats->tx_errors = adapter->stats.ecol + 4443 adapter->stats.latecol; 4444 net_stats->tx_aborted_errors = adapter->stats.ecol; 4445 net_stats->tx_window_errors = adapter->stats.latecol; 4446 net_stats->tx_carrier_errors = adapter->stats.tncrs; 4447 4448 /* Tx Dropped needs to be maintained elsewhere */ 4449 4450 /* Phy Stats */ 4451 if (hw->phy.media_type == e1000_media_type_copper) { 4452 if ((adapter->link_speed == SPEED_1000) && 4453 (!igb_read_phy_reg(hw, PHY_1000T_STATUS, &phy_tmp))) { 4454 phy_tmp &= PHY_IDLE_ERROR_COUNT_MASK; 4455 adapter->phy_stats.idle_errors += phy_tmp; 4456 } 4457 } 4458 4459 /* Management Stats */ 4460 adapter->stats.mgptc += rd32(E1000_MGTPTC); 4461 adapter->stats.mgprc += rd32(E1000_MGTPRC); 4462 adapter->stats.mgpdc += rd32(E1000_MGTPDC); 4463} 4464 4465static irqreturn_t igb_msix_other(int irq, void *data) 4466{ 4467 struct igb_adapter *adapter = data; 4468 struct e1000_hw *hw = &adapter->hw; 4469 u32 icr = rd32(E1000_ICR); 4470 /* reading ICR causes bit 31 of EICR to be cleared */ 4471 4472 if (icr & E1000_ICR_DRSTA) 4473 schedule_work(&adapter->reset_task); 4474 4475 if (icr & E1000_ICR_DOUTSYNC) { 4476 /* HW is reporting DMA is out of sync */ 4477 adapter->stats.doosync++; 4478 } 4479 4480 /* Check for a mailbox event */ 4481 if (icr & E1000_ICR_VMMB) 4482 igb_msg_task(adapter); 4483 4484 if (icr & E1000_ICR_LSC) { 4485 hw->mac.get_link_status = 1; 4486 /* guard against interrupt when we're going down */ 4487 if (!test_bit(__IGB_DOWN, &adapter->state)) 4488 mod_timer(&adapter->watchdog_timer, jiffies + 1); 4489 } 4490 4491 if (adapter->vfs_allocated_count) 4492 wr32(E1000_IMS, E1000_IMS_LSC | 4493 E1000_IMS_VMMB | 4494 E1000_IMS_DOUTSYNC); 4495 else 4496 wr32(E1000_IMS, E1000_IMS_LSC | E1000_IMS_DOUTSYNC); 4497 wr32(E1000_EIMS, adapter->eims_other); 4498 4499 return IRQ_HANDLED; 4500} 4501 4502static void igb_write_itr(struct igb_q_vector *q_vector) 4503{ 4504 struct igb_adapter *adapter = q_vector->adapter; 4505 u32 itr_val = q_vector->itr_val & 0x7FFC; 4506 4507 if (!q_vector->set_itr) 4508 return; 4509 4510 if (!itr_val) 4511 itr_val = 0x4; 4512 4513 if (adapter->hw.mac.type == e1000_82575) 4514 itr_val |= itr_val << 16; 4515 else 4516 itr_val |= 0x8000000; 4517 4518 writel(itr_val, q_vector->itr_register); 4519 q_vector->set_itr = 0; 4520} 4521 4522static irqreturn_t igb_msix_ring(int irq, void *data) 4523{ 4524 struct igb_q_vector *q_vector = data; 4525 4526 /* Write the ITR value calculated from the previous interrupt. */ 4527 igb_write_itr(q_vector); 4528 4529 napi_schedule(&q_vector->napi); 4530 4531 return IRQ_HANDLED; 4532} 4533 4534#ifdef CONFIG_IGB_DCA 4535static void igb_update_dca(struct igb_q_vector *q_vector) 4536{ 4537 struct igb_adapter *adapter = q_vector->adapter; 4538 struct e1000_hw *hw = &adapter->hw; 4539 int cpu = get_cpu(); 4540 4541 if (q_vector->cpu == cpu) 4542 goto out_no_update; 4543 4544 if (q_vector->tx_ring) { 4545 int q = q_vector->tx_ring->reg_idx; 4546 u32 dca_txctrl = rd32(E1000_DCA_TXCTRL(q)); 4547 if (hw->mac.type == e1000_82575) { 4548 dca_txctrl &= ~E1000_DCA_TXCTRL_CPUID_MASK; 4549 dca_txctrl |= dca3_get_tag(&adapter->pdev->dev, cpu); 4550 } else { 4551 dca_txctrl &= ~E1000_DCA_TXCTRL_CPUID_MASK_82576; 4552 dca_txctrl |= dca3_get_tag(&adapter->pdev->dev, cpu) << 4553 E1000_DCA_TXCTRL_CPUID_SHIFT; 4554 } 4555 dca_txctrl |= E1000_DCA_TXCTRL_DESC_DCA_EN; 4556 wr32(E1000_DCA_TXCTRL(q), dca_txctrl); 4557 } 4558 if (q_vector->rx_ring) { 4559 int q = q_vector->rx_ring->reg_idx; 4560 u32 dca_rxctrl = rd32(E1000_DCA_RXCTRL(q)); 4561 if (hw->mac.type == e1000_82575) { 4562 dca_rxctrl &= ~E1000_DCA_RXCTRL_CPUID_MASK; 4563 dca_rxctrl |= dca3_get_tag(&adapter->pdev->dev, cpu); 4564 } else { 4565 dca_rxctrl &= ~E1000_DCA_RXCTRL_CPUID_MASK_82576; 4566 dca_rxctrl |= dca3_get_tag(&adapter->pdev->dev, cpu) << 4567 E1000_DCA_RXCTRL_CPUID_SHIFT; 4568 } 4569 dca_rxctrl |= E1000_DCA_RXCTRL_DESC_DCA_EN; 4570 dca_rxctrl |= E1000_DCA_RXCTRL_HEAD_DCA_EN; 4571 dca_rxctrl |= E1000_DCA_RXCTRL_DATA_DCA_EN; 4572 wr32(E1000_DCA_RXCTRL(q), dca_rxctrl); 4573 } 4574 q_vector->cpu = cpu; 4575out_no_update: 4576 put_cpu(); 4577} 4578 4579static void igb_setup_dca(struct igb_adapter *adapter) 4580{ 4581 struct e1000_hw *hw = &adapter->hw; 4582 int i; 4583 4584 if (!(adapter->flags & IGB_FLAG_DCA_ENABLED)) 4585 return; 4586 4587 /* Always use CB2 mode, difference is masked in the CB driver. */ 4588 wr32(E1000_DCA_CTRL, E1000_DCA_CTRL_DCA_MODE_CB2); 4589 4590 for (i = 0; i < adapter->num_q_vectors; i++) { 4591 adapter->q_vector[i]->cpu = -1; 4592 igb_update_dca(adapter->q_vector[i]); 4593 } 4594} 4595 4596static int __igb_notify_dca(struct device *dev, void *data) 4597{ 4598 struct net_device *netdev = dev_get_drvdata(dev); 4599 struct igb_adapter *adapter = netdev_priv(netdev); 4600 struct pci_dev *pdev = adapter->pdev; 4601 struct e1000_hw *hw = &adapter->hw; 4602 unsigned long event = *(unsigned long *)data; 4603 4604 switch (event) { 4605 case DCA_PROVIDER_ADD: 4606 /* if already enabled, don't do it again */ 4607 if (adapter->flags & IGB_FLAG_DCA_ENABLED) 4608 break; 4609 if (dca_add_requester(dev) == 0) { 4610 adapter->flags |= IGB_FLAG_DCA_ENABLED; 4611 dev_info(&pdev->dev, "DCA enabled\n"); 4612 igb_setup_dca(adapter); 4613 break; 4614 } 4615 /* Fall Through since DCA is disabled. */ 4616 case DCA_PROVIDER_REMOVE: 4617 if (adapter->flags & IGB_FLAG_DCA_ENABLED) { 4618 /* without this a class_device is left 4619 * hanging around in the sysfs model */ 4620 dca_remove_requester(dev); 4621 dev_info(&pdev->dev, "DCA disabled\n"); 4622 adapter->flags &= ~IGB_FLAG_DCA_ENABLED; 4623 wr32(E1000_DCA_CTRL, E1000_DCA_CTRL_DCA_MODE_DISABLE); 4624 } 4625 break; 4626 } 4627 4628 return 0; 4629} 4630 4631static int igb_notify_dca(struct notifier_block *nb, unsigned long event, 4632 void *p) 4633{ 4634 int ret_val; 4635 4636 ret_val = driver_for_each_device(&igb_driver.driver, NULL, &event, 4637 __igb_notify_dca); 4638 4639 return ret_val ? NOTIFY_BAD : NOTIFY_DONE; 4640} 4641#endif /* CONFIG_IGB_DCA */ 4642 4643static void igb_ping_all_vfs(struct igb_adapter *adapter) 4644{ 4645 struct e1000_hw *hw = &adapter->hw; 4646 u32 ping; 4647 int i; 4648 4649 for (i = 0 ; i < adapter->vfs_allocated_count; i++) { 4650 ping = E1000_PF_CONTROL_MSG; 4651 if (adapter->vf_data[i].flags & IGB_VF_FLAG_CTS) 4652 ping |= E1000_VT_MSGTYPE_CTS; 4653 igb_write_mbx(hw, &ping, 1, i); 4654 } 4655} 4656 4657static int igb_set_vf_promisc(struct igb_adapter *adapter, u32 *msgbuf, u32 vf) 4658{ 4659 struct e1000_hw *hw = &adapter->hw; 4660 u32 vmolr = rd32(E1000_VMOLR(vf)); 4661 struct vf_data_storage *vf_data = &adapter->vf_data[vf]; 4662 4663 vf_data->flags |= ~(IGB_VF_FLAG_UNI_PROMISC | 4664 IGB_VF_FLAG_MULTI_PROMISC); 4665 vmolr &= ~(E1000_VMOLR_ROPE | E1000_VMOLR_ROMPE | E1000_VMOLR_MPME); 4666 4667 if (*msgbuf & E1000_VF_SET_PROMISC_MULTICAST) { 4668 vmolr |= E1000_VMOLR_MPME; 4669 *msgbuf &= ~E1000_VF_SET_PROMISC_MULTICAST; 4670 } else { 4671 /* 4672 * if we have hashes and we are clearing a multicast promisc 4673 * flag we need to write the hashes to the MTA as this step 4674 * was previously skipped 4675 */ 4676 if (vf_data->num_vf_mc_hashes > 30) { 4677 vmolr |= E1000_VMOLR_MPME; 4678 } else if (vf_data->num_vf_mc_hashes) { 4679 int j; 4680 vmolr |= E1000_VMOLR_ROMPE; 4681 for (j = 0; j < vf_data->num_vf_mc_hashes; j++) 4682 igb_mta_set(hw, vf_data->vf_mc_hashes[j]); 4683 } 4684 } 4685 4686 wr32(E1000_VMOLR(vf), vmolr); 4687 4688 /* there are flags left unprocessed, likely not supported */ 4689 if (*msgbuf & E1000_VT_MSGINFO_MASK) 4690 return -EINVAL; 4691 4692 return 0; 4693 4694} 4695 4696static int igb_set_vf_multicasts(struct igb_adapter *adapter, 4697 u32 *msgbuf, u32 vf) 4698{ 4699 int n = (msgbuf[0] & E1000_VT_MSGINFO_MASK) >> E1000_VT_MSGINFO_SHIFT; 4700 u16 *hash_list = (u16 *)&msgbuf[1]; 4701 struct vf_data_storage *vf_data = &adapter->vf_data[vf]; 4702 int i; 4703 4704 /* salt away the number of multicast addresses assigned 4705 * to this VF for later use to restore when the PF multi cast 4706 * list changes 4707 */ 4708 vf_data->num_vf_mc_hashes = n; 4709 4710 /* only up to 30 hash values supported */ 4711 if (n > 30) 4712 n = 30; 4713 4714 /* store the hashes for later use */ 4715 for (i = 0; i < n; i++) 4716 vf_data->vf_mc_hashes[i] = hash_list[i]; 4717 4718 /* Flush and reset the mta with the new values */ 4719 igb_set_rx_mode(adapter->netdev); 4720 4721 return 0; 4722} 4723 4724static void igb_restore_vf_multicasts(struct igb_adapter *adapter) 4725{ 4726 struct e1000_hw *hw = &adapter->hw; 4727 struct vf_data_storage *vf_data; 4728 int i, j; 4729 4730 for (i = 0; i < adapter->vfs_allocated_count; i++) { 4731 u32 vmolr = rd32(E1000_VMOLR(i)); 4732 vmolr &= ~(E1000_VMOLR_ROMPE | E1000_VMOLR_MPME); 4733 4734 vf_data = &adapter->vf_data[i]; 4735 4736 if ((vf_data->num_vf_mc_hashes > 30) || 4737 (vf_data->flags & IGB_VF_FLAG_MULTI_PROMISC)) { 4738 vmolr |= E1000_VMOLR_MPME; 4739 } else if (vf_data->num_vf_mc_hashes) { 4740 vmolr |= E1000_VMOLR_ROMPE; 4741 for (j = 0; j < vf_data->num_vf_mc_hashes; j++) 4742 igb_mta_set(hw, vf_data->vf_mc_hashes[j]); 4743 } 4744 wr32(E1000_VMOLR(i), vmolr); 4745 } 4746} 4747 4748static void igb_clear_vf_vfta(struct igb_adapter *adapter, u32 vf) 4749{ 4750 struct e1000_hw *hw = &adapter->hw; 4751 u32 pool_mask, reg, vid; 4752 int i; 4753 4754 pool_mask = 1 << (E1000_VLVF_POOLSEL_SHIFT + vf); 4755 4756 /* Find the vlan filter for this id */ 4757 for (i = 0; i < E1000_VLVF_ARRAY_SIZE; i++) { 4758 reg = rd32(E1000_VLVF(i)); 4759 4760 /* remove the vf from the pool */ 4761 reg &= ~pool_mask; 4762 4763 /* if pool is empty then remove entry from vfta */ 4764 if (!(reg & E1000_VLVF_POOLSEL_MASK) && 4765 (reg & E1000_VLVF_VLANID_ENABLE)) { 4766 reg = 0; 4767 vid = reg & E1000_VLVF_VLANID_MASK; 4768 igb_vfta_set(hw, vid, false); 4769 } 4770 4771 wr32(E1000_VLVF(i), reg); 4772 } 4773 4774 adapter->vf_data[vf].vlans_enabled = 0; 4775} 4776 4777static s32 igb_vlvf_set(struct igb_adapter *adapter, u32 vid, bool add, u32 vf) 4778{ 4779 struct e1000_hw *hw = &adapter->hw; 4780 u32 reg, i; 4781 4782 /* The vlvf table only exists on 82576 hardware and newer */ 4783 if (hw->mac.type < e1000_82576) 4784 return -1; 4785 4786 /* we only need to do this if VMDq is enabled */ 4787 if (!adapter->vfs_allocated_count) 4788 return -1; 4789 4790 /* Find the vlan filter for this id */ 4791 for (i = 0; i < E1000_VLVF_ARRAY_SIZE; i++) { 4792 reg = rd32(E1000_VLVF(i)); 4793 if ((reg & E1000_VLVF_VLANID_ENABLE) && 4794 vid == (reg & E1000_VLVF_VLANID_MASK)) 4795 break; 4796 } 4797 4798 if (add) { 4799 if (i == E1000_VLVF_ARRAY_SIZE) { 4800 /* Did not find a matching VLAN ID entry that was 4801 * enabled. Search for a free filter entry, i.e. 4802 * one without the enable bit set 4803 */ 4804 for (i = 0; i < E1000_VLVF_ARRAY_SIZE; i++) { 4805 reg = rd32(E1000_VLVF(i)); 4806 if (!(reg & E1000_VLVF_VLANID_ENABLE)) 4807 break; 4808 } 4809 } 4810 if (i < E1000_VLVF_ARRAY_SIZE) { 4811 /* Found an enabled/available entry */ 4812 reg |= 1 << (E1000_VLVF_POOLSEL_SHIFT + vf); 4813 4814 /* if !enabled we need to set this up in vfta */ 4815 if (!(reg & E1000_VLVF_VLANID_ENABLE)) { 4816 /* add VID to filter table */ 4817 igb_vfta_set(hw, vid, true); 4818 reg |= E1000_VLVF_VLANID_ENABLE; 4819 } 4820 reg &= ~E1000_VLVF_VLANID_MASK; 4821 reg |= vid; 4822 wr32(E1000_VLVF(i), reg); 4823 4824 /* do not modify RLPML for PF devices */ 4825 if (vf >= adapter->vfs_allocated_count) 4826 return 0; 4827 4828 if (!adapter->vf_data[vf].vlans_enabled) { 4829 u32 size; 4830 reg = rd32(E1000_VMOLR(vf)); 4831 size = reg & E1000_VMOLR_RLPML_MASK; 4832 size += 4; 4833 reg &= ~E1000_VMOLR_RLPML_MASK; 4834 reg |= size; 4835 wr32(E1000_VMOLR(vf), reg); 4836 } 4837 4838 adapter->vf_data[vf].vlans_enabled++; 4839 return 0; 4840 } 4841 } else { 4842 if (i < E1000_VLVF_ARRAY_SIZE) { 4843 /* remove vf from the pool */ 4844 reg &= ~(1 << (E1000_VLVF_POOLSEL_SHIFT + vf)); 4845 /* if pool is empty then remove entry from vfta */ 4846 if (!(reg & E1000_VLVF_POOLSEL_MASK)) { 4847 reg = 0; 4848 igb_vfta_set(hw, vid, false); 4849 } 4850 wr32(E1000_VLVF(i), reg); 4851 4852 /* do not modify RLPML for PF devices */ 4853 if (vf >= adapter->vfs_allocated_count) 4854 return 0; 4855 4856 adapter->vf_data[vf].vlans_enabled--; 4857 if (!adapter->vf_data[vf].vlans_enabled) { 4858 u32 size; 4859 reg = rd32(E1000_VMOLR(vf)); 4860 size = reg & E1000_VMOLR_RLPML_MASK; 4861 size -= 4; 4862 reg &= ~E1000_VMOLR_RLPML_MASK; 4863 reg |= size; 4864 wr32(E1000_VMOLR(vf), reg); 4865 } 4866 } 4867 } 4868 return 0; 4869} 4870 4871static void igb_set_vmvir(struct igb_adapter *adapter, u32 vid, u32 vf) 4872{ 4873 struct e1000_hw *hw = &adapter->hw; 4874 4875 if (vid) 4876 wr32(E1000_VMVIR(vf), (vid | E1000_VMVIR_VLANA_DEFAULT)); 4877 else 4878 wr32(E1000_VMVIR(vf), 0); 4879} 4880 4881static int igb_ndo_set_vf_vlan(struct net_device *netdev, 4882 int vf, u16 vlan, u8 qos) 4883{ 4884 int err = 0; 4885 struct igb_adapter *adapter = netdev_priv(netdev); 4886 4887 if ((vf >= adapter->vfs_allocated_count) || (vlan > 4095) || (qos > 7)) 4888 return -EINVAL; 4889 if (vlan || qos) { 4890 err = igb_vlvf_set(adapter, vlan, !!vlan, vf); 4891 if (err) 4892 goto out; 4893 igb_set_vmvir(adapter, vlan | (qos << VLAN_PRIO_SHIFT), vf); 4894 igb_set_vmolr(adapter, vf, !vlan); 4895 adapter->vf_data[vf].pf_vlan = vlan; 4896 adapter->vf_data[vf].pf_qos = qos; 4897 dev_info(&adapter->pdev->dev, 4898 "Setting VLAN %d, QOS 0x%x on VF %d\n", vlan, qos, vf); 4899 if (test_bit(__IGB_DOWN, &adapter->state)) { 4900 dev_warn(&adapter->pdev->dev, 4901 "The VF VLAN has been set," 4902 " but the PF device is not up.\n"); 4903 dev_warn(&adapter->pdev->dev, 4904 "Bring the PF device up before" 4905 " attempting to use the VF device.\n"); 4906 } 4907 } else { 4908 igb_vlvf_set(adapter, adapter->vf_data[vf].pf_vlan, 4909 false, vf); 4910 igb_set_vmvir(adapter, vlan, vf); 4911 igb_set_vmolr(adapter, vf, true); 4912 adapter->vf_data[vf].pf_vlan = 0; 4913 adapter->vf_data[vf].pf_qos = 0; 4914 } 4915out: 4916 return err; 4917} 4918 4919static int igb_set_vf_vlan(struct igb_adapter *adapter, u32 *msgbuf, u32 vf) 4920{ 4921 int add = (msgbuf[0] & E1000_VT_MSGINFO_MASK) >> E1000_VT_MSGINFO_SHIFT; 4922 int vid = (msgbuf[1] & E1000_VLVF_VLANID_MASK); 4923 4924 return igb_vlvf_set(adapter, vid, add, vf); 4925} 4926 4927static inline void igb_vf_reset(struct igb_adapter *adapter, u32 vf) 4928{ 4929 /* clear flags */ 4930 adapter->vf_data[vf].flags &= ~(IGB_VF_FLAG_PF_SET_MAC); 4931 adapter->vf_data[vf].last_nack = jiffies; 4932 4933 /* reset offloads to defaults */ 4934 igb_set_vmolr(adapter, vf, true); 4935 4936 /* reset vlans for device */ 4937 igb_clear_vf_vfta(adapter, vf); 4938 if (adapter->vf_data[vf].pf_vlan) 4939 igb_ndo_set_vf_vlan(adapter->netdev, vf, 4940 adapter->vf_data[vf].pf_vlan, 4941 adapter->vf_data[vf].pf_qos); 4942 else 4943 igb_clear_vf_vfta(adapter, vf); 4944 4945 /* reset multicast table array for vf */ 4946 adapter->vf_data[vf].num_vf_mc_hashes = 0; 4947 4948 /* Flush and reset the mta with the new values */ 4949 igb_set_rx_mode(adapter->netdev); 4950} 4951 4952static void igb_vf_reset_event(struct igb_adapter *adapter, u32 vf) 4953{ 4954 unsigned char *vf_mac = adapter->vf_data[vf].vf_mac_addresses; 4955 4956 /* generate a new mac address as we were hotplug removed/added */ 4957 if (!(adapter->vf_data[vf].flags & IGB_VF_FLAG_PF_SET_MAC)) 4958 random_ether_addr(vf_mac); 4959 4960 /* process remaining reset events */ 4961 igb_vf_reset(adapter, vf); 4962} 4963 4964static void igb_vf_reset_msg(struct igb_adapter *adapter, u32 vf) 4965{ 4966 struct e1000_hw *hw = &adapter->hw; 4967 unsigned char *vf_mac = adapter->vf_data[vf].vf_mac_addresses; 4968 int rar_entry = hw->mac.rar_entry_count - (vf + 1); 4969 u32 reg, msgbuf[3]; 4970 u8 *addr = (u8 *)(&msgbuf[1]); 4971 4972 /* process all the same items cleared in a function level reset */ 4973 igb_vf_reset(adapter, vf); 4974 4975 /* set vf mac address */ 4976 igb_rar_set_qsel(adapter, vf_mac, rar_entry, vf); 4977 4978 /* enable transmit and receive for vf */ 4979 reg = rd32(E1000_VFTE); 4980 wr32(E1000_VFTE, reg | (1 << vf)); 4981 reg = rd32(E1000_VFRE); 4982 wr32(E1000_VFRE, reg | (1 << vf)); 4983 4984 adapter->vf_data[vf].flags = IGB_VF_FLAG_CTS; 4985 4986 /* reply to reset with ack and vf mac address */ 4987 msgbuf[0] = E1000_VF_RESET | E1000_VT_MSGTYPE_ACK; 4988 memcpy(addr, vf_mac, 6); 4989 igb_write_mbx(hw, msgbuf, 3, vf); 4990} 4991 4992static int igb_set_vf_mac_addr(struct igb_adapter *adapter, u32 *msg, int vf) 4993{ 4994 /* 4995 * The VF MAC Address is stored in a packed array of bytes 4996 * starting at the second 32 bit word of the msg array 4997 */ 4998 unsigned char *addr = (char *)&msg[1]; 4999 int err = -1; 5000 5001 if (is_valid_ether_addr(addr)) 5002 err = igb_set_vf_mac(adapter, vf, addr); 5003 5004 return err; 5005} 5006 5007static void igb_rcv_ack_from_vf(struct igb_adapter *adapter, u32 vf) 5008{ 5009 struct e1000_hw *hw = &adapter->hw; 5010 struct vf_data_storage *vf_data = &adapter->vf_data[vf]; 5011 u32 msg = E1000_VT_MSGTYPE_NACK; 5012 5013 /* if device isn't clear to send it shouldn't be reading either */ 5014 if (!(vf_data->flags & IGB_VF_FLAG_CTS) && 5015 time_after(jiffies, vf_data->last_nack + (2 * HZ))) { 5016 igb_write_mbx(hw, &msg, 1, vf); 5017 vf_data->last_nack = jiffies; 5018 } 5019} 5020 5021static void igb_rcv_msg_from_vf(struct igb_adapter *adapter, u32 vf) 5022{ 5023 struct pci_dev *pdev = adapter->pdev; 5024 u32 msgbuf[E1000_VFMAILBOX_SIZE]; 5025 struct e1000_hw *hw = &adapter->hw; 5026 struct vf_data_storage *vf_data = &adapter->vf_data[vf]; 5027 s32 retval; 5028 5029 retval = igb_read_mbx(hw, msgbuf, E1000_VFMAILBOX_SIZE, vf); 5030 5031 if (retval) { 5032 /* if receive failed revoke VF CTS stats and restart init */ 5033 dev_err(&pdev->dev, "Error receiving message from VF\n"); 5034 vf_data->flags &= ~IGB_VF_FLAG_CTS; 5035 if (!time_after(jiffies, vf_data->last_nack + (2 * HZ))) 5036 return; 5037 goto out; 5038 } 5039 5040 /* this is a message we already processed, do nothing */ 5041 if (msgbuf[0] & (E1000_VT_MSGTYPE_ACK | E1000_VT_MSGTYPE_NACK)) 5042 return; 5043 5044 /* 5045 * until the vf completes a reset it should not be 5046 * allowed to start any configuration. 5047 */ 5048 5049 if (msgbuf[0] == E1000_VF_RESET) { 5050 igb_vf_reset_msg(adapter, vf); 5051 return; 5052 } 5053 5054 if (!(vf_data->flags & IGB_VF_FLAG_CTS)) { 5055 if (!time_after(jiffies, vf_data->last_nack + (2 * HZ))) 5056 return; 5057 retval = -1; 5058 goto out; 5059 } 5060 5061 switch ((msgbuf[0] & 0xFFFF)) { 5062 case E1000_VF_SET_MAC_ADDR: 5063 retval = igb_set_vf_mac_addr(adapter, msgbuf, vf); 5064 break; 5065 case E1000_VF_SET_PROMISC: 5066 retval = igb_set_vf_promisc(adapter, msgbuf, vf); 5067 break; 5068 case E1000_VF_SET_MULTICAST: 5069 retval = igb_set_vf_multicasts(adapter, msgbuf, vf); 5070 break; 5071 case E1000_VF_SET_LPE: 5072 retval = igb_set_vf_rlpml(adapter, msgbuf[1], vf); 5073 break; 5074 case E1000_VF_SET_VLAN: 5075 if (adapter->vf_data[vf].pf_vlan) 5076 retval = -1; 5077 else 5078 retval = igb_set_vf_vlan(adapter, msgbuf, vf); 5079 break; 5080 default: 5081 dev_err(&pdev->dev, "Unhandled Msg %08x\n", msgbuf[0]); 5082 retval = -1; 5083 break; 5084 } 5085 5086 msgbuf[0] |= E1000_VT_MSGTYPE_CTS; 5087out: 5088 /* notify the VF of the results of what it sent us */ 5089 if (retval) 5090 msgbuf[0] |= E1000_VT_MSGTYPE_NACK; 5091 else 5092 msgbuf[0] |= E1000_VT_MSGTYPE_ACK; 5093 5094 igb_write_mbx(hw, msgbuf, 1, vf); 5095} 5096 5097static void igb_msg_task(struct igb_adapter *adapter) 5098{ 5099 struct e1000_hw *hw = &adapter->hw; 5100 u32 vf; 5101 5102 for (vf = 0; vf < adapter->vfs_allocated_count; vf++) { 5103 /* process any reset requests */ 5104 if (!igb_check_for_rst(hw, vf)) 5105 igb_vf_reset_event(adapter, vf); 5106 5107 /* process any messages pending */ 5108 if (!igb_check_for_msg(hw, vf)) 5109 igb_rcv_msg_from_vf(adapter, vf); 5110 5111 /* process any acks */ 5112 if (!igb_check_for_ack(hw, vf)) 5113 igb_rcv_ack_from_vf(adapter, vf); 5114 } 5115} 5116 5117/** 5118 * igb_set_uta - Set unicast filter table address 5119 * @adapter: board private structure 5120 * 5121 * The unicast table address is a register array of 32-bit registers. 5122 * The table is meant to be used in a way similar to how the MTA is used 5123 * however due to certain limitations in the hardware it is necessary to 5124 * set all the hash bits to 1 and use the VMOLR ROPE bit as a promiscous 5125 * enable bit to allow vlan tag stripping when promiscous mode is enabled 5126 **/ 5127static void igb_set_uta(struct igb_adapter *adapter) 5128{ 5129 struct e1000_hw *hw = &adapter->hw; 5130 int i; 5131 5132 /* The UTA table only exists on 82576 hardware and newer */ 5133 if (hw->mac.type < e1000_82576) 5134 return; 5135 5136 /* we only need to do this if VMDq is enabled */ 5137 if (!adapter->vfs_allocated_count) 5138 return; 5139 5140 for (i = 0; i < hw->mac.uta_reg_count; i++) 5141 array_wr32(E1000_UTA, i, ~0); 5142} 5143 5144/** 5145 * igb_intr_msi - Interrupt Handler 5146 * @irq: interrupt number 5147 * @data: pointer to a network interface device structure 5148 **/ 5149static irqreturn_t igb_intr_msi(int irq, void *data) 5150{ 5151 struct igb_adapter *adapter = data; 5152 struct igb_q_vector *q_vector = adapter->q_vector[0]; 5153 struct e1000_hw *hw = &adapter->hw; 5154 /* read ICR disables interrupts using IAM */ 5155 u32 icr = rd32(E1000_ICR); 5156 5157 igb_write_itr(q_vector); 5158 5159 if (icr & E1000_ICR_DRSTA) 5160 schedule_work(&adapter->reset_task); 5161 5162 if (icr & E1000_ICR_DOUTSYNC) { 5163 /* HW is reporting DMA is out of sync */ 5164 adapter->stats.doosync++; 5165 } 5166 5167 if (icr & (E1000_ICR_RXSEQ | E1000_ICR_LSC)) { 5168 hw->mac.get_link_status = 1; 5169 if (!test_bit(__IGB_DOWN, &adapter->state)) 5170 mod_timer(&adapter->watchdog_timer, jiffies + 1); 5171 } 5172 5173 napi_schedule(&q_vector->napi); 5174 5175 return IRQ_HANDLED; 5176} 5177 5178/** 5179 * igb_intr - Legacy Interrupt Handler 5180 * @irq: interrupt number 5181 * @data: pointer to a network interface device structure 5182 **/ 5183static irqreturn_t igb_intr(int irq, void *data) 5184{ 5185 struct igb_adapter *adapter = data; 5186 struct igb_q_vector *q_vector = adapter->q_vector[0]; 5187 struct e1000_hw *hw = &adapter->hw; 5188 /* Interrupt Auto-Mask...upon reading ICR, interrupts are masked. No 5189 * need for the IMC write */ 5190 u32 icr = rd32(E1000_ICR); 5191 if (!icr) 5192 return IRQ_NONE; /* Not our interrupt */ 5193 5194 igb_write_itr(q_vector); 5195 5196 /* IMS will not auto-mask if INT_ASSERTED is not set, and if it is 5197 * not set, then the adapter didn't send an interrupt */ 5198 if (!(icr & E1000_ICR_INT_ASSERTED)) 5199 return IRQ_NONE; 5200 5201 if (icr & E1000_ICR_DRSTA) 5202 schedule_work(&adapter->reset_task); 5203 5204 if (icr & E1000_ICR_DOUTSYNC) { 5205 /* HW is reporting DMA is out of sync */ 5206 adapter->stats.doosync++; 5207 } 5208 5209 if (icr & (E1000_ICR_RXSEQ | E1000_ICR_LSC)) { 5210 hw->mac.get_link_status = 1; 5211 /* guard against interrupt when we're going down */ 5212 if (!test_bit(__IGB_DOWN, &adapter->state)) 5213 mod_timer(&adapter->watchdog_timer, jiffies + 1); 5214 } 5215 5216 napi_schedule(&q_vector->napi); 5217 5218 return IRQ_HANDLED; 5219} 5220 5221static inline void igb_ring_irq_enable(struct igb_q_vector *q_vector) 5222{ 5223 struct igb_adapter *adapter = q_vector->adapter; 5224 struct e1000_hw *hw = &adapter->hw; 5225 5226 if ((q_vector->rx_ring && (adapter->rx_itr_setting & 3)) || 5227 (!q_vector->rx_ring && (adapter->tx_itr_setting & 3))) { 5228 if (!adapter->msix_entries) 5229 igb_set_itr(adapter); 5230 else 5231 igb_update_ring_itr(q_vector); 5232 } 5233 5234 if (!test_bit(__IGB_DOWN, &adapter->state)) { 5235 if (adapter->msix_entries) 5236 wr32(E1000_EIMS, q_vector->eims_value); 5237 else 5238 igb_irq_enable(adapter); 5239 } 5240} 5241 5242/** 5243 * igb_poll - NAPI Rx polling callback 5244 * @napi: napi polling structure 5245 * @budget: count of how many packets we should handle 5246 **/ 5247static int igb_poll(struct napi_struct *napi, int budget) 5248{ 5249 struct igb_q_vector *q_vector = container_of(napi, 5250 struct igb_q_vector, 5251 napi); 5252 int tx_clean_complete = 1, work_done = 0; 5253 5254#ifdef CONFIG_IGB_DCA 5255 if (q_vector->adapter->flags & IGB_FLAG_DCA_ENABLED) 5256 igb_update_dca(q_vector); 5257#endif 5258 if (q_vector->tx_ring) 5259 tx_clean_complete = igb_clean_tx_irq(q_vector); 5260 5261 if (q_vector->rx_ring) 5262 igb_clean_rx_irq_adv(q_vector, &work_done, budget); 5263 5264 if (!tx_clean_complete) 5265 work_done = budget; 5266 5267 /* If not enough Rx work done, exit the polling mode */ 5268 if (work_done < budget) { 5269 napi_complete(napi); 5270 igb_ring_irq_enable(q_vector); 5271 } 5272 5273 return work_done; 5274} 5275 5276/** 5277 * igb_systim_to_hwtstamp - convert system time value to hw timestamp 5278 * @adapter: board private structure 5279 * @shhwtstamps: timestamp structure to update 5280 * @regval: unsigned 64bit system time value. 5281 * 5282 * We need to convert the system time value stored in the RX/TXSTMP registers 5283 * into a hwtstamp which can be used by the upper level timestamping functions 5284 */ 5285static void igb_systim_to_hwtstamp(struct igb_adapter *adapter, 5286 struct skb_shared_hwtstamps *shhwtstamps, 5287 u64 regval) 5288{ 5289 u64 ns; 5290 5291 /* 5292 * The 82580 starts with 1ns at bit 0 in RX/TXSTMPL, shift this up to 5293 * 24 to match clock shift we setup earlier. 5294 */ 5295 if (adapter->hw.mac.type == e1000_82580) 5296 regval <<= IGB_82580_TSYNC_SHIFT; 5297 5298 ns = timecounter_cyc2time(&adapter->clock, regval); 5299 timecompare_update(&adapter->compare, ns); 5300 memset(shhwtstamps, 0, sizeof(struct skb_shared_hwtstamps)); 5301 shhwtstamps->hwtstamp = ns_to_ktime(ns); 5302 shhwtstamps->syststamp = timecompare_transform(&adapter->compare, ns); 5303} 5304 5305/** 5306 * igb_tx_hwtstamp - utility function which checks for TX time stamp 5307 * @q_vector: pointer to q_vector containing needed info 5308 * @buffer: pointer to igb_buffer structure 5309 * 5310 * If we were asked to do hardware stamping and such a time stamp is 5311 * available, then it must have been for this skb here because we only 5312 * allow only one such packet into the queue. 5313 */ 5314static void igb_tx_hwtstamp(struct igb_q_vector *q_vector, struct igb_buffer *buffer_info) 5315{ 5316 struct igb_adapter *adapter = q_vector->adapter; 5317 struct e1000_hw *hw = &adapter->hw; 5318 struct skb_shared_hwtstamps shhwtstamps; 5319 u64 regval; 5320 5321 /* if skb does not support hw timestamp or TX stamp not valid exit */ 5322 if (likely(!buffer_info->shtx.hardware) || 5323 !(rd32(E1000_TSYNCTXCTL) & E1000_TSYNCTXCTL_VALID)) 5324 return; 5325 5326 regval = rd32(E1000_TXSTMPL); 5327 regval |= (u64)rd32(E1000_TXSTMPH) << 32; 5328 5329 igb_systim_to_hwtstamp(adapter, &shhwtstamps, regval); 5330 skb_tstamp_tx(buffer_info->skb, &shhwtstamps); 5331} 5332 5333/** 5334 * igb_clean_tx_irq - Reclaim resources after transmit completes 5335 * @q_vector: pointer to q_vector containing needed info 5336 * returns true if ring is completely cleaned 5337 **/ 5338static bool igb_clean_tx_irq(struct igb_q_vector *q_vector) 5339{ 5340 struct igb_adapter *adapter = q_vector->adapter; 5341 struct igb_ring *tx_ring = q_vector->tx_ring; 5342 struct net_device *netdev = tx_ring->netdev; 5343 struct e1000_hw *hw = &adapter->hw; 5344 struct igb_buffer *buffer_info; 5345 union e1000_adv_tx_desc *tx_desc, *eop_desc; 5346 unsigned int total_bytes = 0, total_packets = 0; 5347 unsigned int i, eop, count = 0; 5348 bool cleaned = false; 5349 5350 i = tx_ring->next_to_clean; 5351 eop = tx_ring->buffer_info[i].next_to_watch; 5352 eop_desc = E1000_TX_DESC_ADV(*tx_ring, eop); 5353 5354 while ((eop_desc->wb.status & cpu_to_le32(E1000_TXD_STAT_DD)) && 5355 (count < tx_ring->count)) { 5356 rmb(); /* read buffer_info after eop_desc status */ 5357 for (cleaned = false; !cleaned; count++) { 5358 tx_desc = E1000_TX_DESC_ADV(*tx_ring, i); 5359 buffer_info = &tx_ring->buffer_info[i]; 5360 cleaned = (i == eop); 5361 5362 if (buffer_info->skb) { 5363 total_bytes += buffer_info->bytecount; 5364 /* gso_segs is currently only valid for tcp */ 5365 total_packets += buffer_info->gso_segs; 5366 igb_tx_hwtstamp(q_vector, buffer_info); 5367 } 5368 5369 igb_unmap_and_free_tx_resource(tx_ring, buffer_info); 5370 tx_desc->wb.status = 0; 5371 5372 i++; 5373 if (i == tx_ring->count) 5374 i = 0; 5375 } 5376 eop = tx_ring->buffer_info[i].next_to_watch; 5377 eop_desc = E1000_TX_DESC_ADV(*tx_ring, eop); 5378 } 5379 5380 tx_ring->next_to_clean = i; 5381 5382 if (unlikely(count && 5383 netif_carrier_ok(netdev) && 5384 igb_desc_unused(tx_ring) >= IGB_TX_QUEUE_WAKE)) { 5385 /* Make sure that anybody stopping the queue after this 5386 * sees the new next_to_clean. 5387 */ 5388 smp_mb(); 5389 if (__netif_subqueue_stopped(netdev, tx_ring->queue_index) && 5390 !(test_bit(__IGB_DOWN, &adapter->state))) { 5391 netif_wake_subqueue(netdev, tx_ring->queue_index); 5392 tx_ring->tx_stats.restart_queue++; 5393 } 5394 } 5395 5396 if (tx_ring->detect_tx_hung) { 5397 /* Detect a transmit hang in hardware, this serializes the 5398 * check with the clearing of time_stamp and movement of i */ 5399 tx_ring->detect_tx_hung = false; 5400 if (tx_ring->buffer_info[i].time_stamp && 5401 time_after(jiffies, tx_ring->buffer_info[i].time_stamp + 5402 (adapter->tx_timeout_factor * HZ)) && 5403 !(rd32(E1000_STATUS) & E1000_STATUS_TXOFF)) { 5404 5405 /* detected Tx unit hang */ 5406 dev_err(tx_ring->dev, 5407 "Detected Tx Unit Hang\n" 5408 " Tx Queue <%d>\n" 5409 " TDH <%x>\n" 5410 " TDT <%x>\n" 5411 " next_to_use <%x>\n" 5412 " next_to_clean <%x>\n" 5413 "buffer_info[next_to_clean]\n" 5414 " time_stamp <%lx>\n" 5415 " next_to_watch <%x>\n" 5416 " jiffies <%lx>\n" 5417 " desc.status <%x>\n", 5418 tx_ring->queue_index, 5419 readl(tx_ring->head), 5420 readl(tx_ring->tail), 5421 tx_ring->next_to_use, 5422 tx_ring->next_to_clean, 5423 tx_ring->buffer_info[eop].time_stamp, 5424 eop, 5425 jiffies, 5426 eop_desc->wb.status); 5427 netif_stop_subqueue(netdev, tx_ring->queue_index); 5428 } 5429 } 5430 tx_ring->total_bytes += total_bytes; 5431 tx_ring->total_packets += total_packets; 5432 tx_ring->tx_stats.bytes += total_bytes; 5433 tx_ring->tx_stats.packets += total_packets; 5434 return (count < tx_ring->count); 5435} 5436 5437/** 5438 * igb_receive_skb - helper function to handle rx indications 5439 * @q_vector: structure containing interrupt and ring information 5440 * @skb: packet to send up 5441 * @vlan_tag: vlan tag for packet 5442 **/ 5443static void igb_receive_skb(struct igb_q_vector *q_vector, 5444 struct sk_buff *skb, 5445 u16 vlan_tag) 5446{ 5447 struct igb_adapter *adapter = q_vector->adapter; 5448 5449 if (vlan_tag && adapter->vlgrp) 5450 vlan_gro_receive(&q_vector->napi, adapter->vlgrp, 5451 vlan_tag, skb); 5452 else 5453 napi_gro_receive(&q_vector->napi, skb); 5454} 5455 5456static inline void igb_rx_checksum_adv(struct igb_ring *ring, 5457 u32 status_err, struct sk_buff *skb) 5458{ 5459 skb->ip_summed = CHECKSUM_NONE; 5460 5461 /* Ignore Checksum bit is set or checksum is disabled through ethtool */ 5462 if (!(ring->flags & IGB_RING_FLAG_RX_CSUM) || 5463 (status_err & E1000_RXD_STAT_IXSM)) 5464 return; 5465 5466 /* TCP/UDP checksum error bit is set */ 5467 if (status_err & 5468 (E1000_RXDEXT_STATERR_TCPE | E1000_RXDEXT_STATERR_IPE)) { 5469 /* 5470 * work around errata with sctp packets where the TCPE aka 5471 * L4E bit is set incorrectly on 64 byte (60 byte w/o crc) 5472 * packets, (aka let the stack check the crc32c) 5473 */ 5474 if ((skb->len == 60) && 5475 (ring->flags & IGB_RING_FLAG_RX_SCTP_CSUM)) 5476 ring->rx_stats.csum_err++; 5477 5478 /* let the stack verify checksum errors */ 5479 return; 5480 } 5481 /* It must be a TCP or UDP packet with a valid checksum */ 5482 if (status_err & (E1000_RXD_STAT_TCPCS | E1000_RXD_STAT_UDPCS)) 5483 skb->ip_summed = CHECKSUM_UNNECESSARY; 5484 5485 dev_dbg(ring->dev, "cksum success: bits %08X\n", status_err); 5486} 5487 5488static void igb_rx_hwtstamp(struct igb_q_vector *q_vector, u32 staterr, 5489 struct sk_buff *skb) 5490{ 5491 struct igb_adapter *adapter = q_vector->adapter; 5492 struct e1000_hw *hw = &adapter->hw; 5493 u64 regval; 5494 5495 /* 5496 * If this bit is set, then the RX registers contain the time stamp. No 5497 * other packet will be time stamped until we read these registers, so 5498 * read the registers to make them available again. Because only one 5499 * packet can be time stamped at a time, we know that the register 5500 * values must belong to this one here and therefore we don't need to 5501 * compare any of the additional attributes stored for it. 5502 * 5503 * If nothing went wrong, then it should have a skb_shared_tx that we 5504 * can turn into a skb_shared_hwtstamps. 5505 */ 5506 if (staterr & E1000_RXDADV_STAT_TSIP) { 5507 u32 *stamp = (u32 *)skb->data; 5508 regval = le32_to_cpu(*(stamp + 2)); 5509 regval |= (u64)le32_to_cpu(*(stamp + 3)) << 32; 5510 skb_pull(skb, IGB_TS_HDR_LEN); 5511 } else { 5512 if(!(rd32(E1000_TSYNCRXCTL) & E1000_TSYNCRXCTL_VALID)) 5513 return; 5514 5515 regval = rd32(E1000_RXSTMPL); 5516 regval |= (u64)rd32(E1000_RXSTMPH) << 32; 5517 } 5518 5519 igb_systim_to_hwtstamp(adapter, skb_hwtstamps(skb), regval); 5520} 5521static inline u16 igb_get_hlen(struct igb_ring *rx_ring, 5522 union e1000_adv_rx_desc *rx_desc) 5523{ 5524 /* HW will not DMA in data larger than the given buffer, even if it 5525 * parses the (NFS, of course) header to be larger. In that case, it 5526 * fills the header buffer and spills the rest into the page. 5527 */ 5528 u16 hlen = (le16_to_cpu(rx_desc->wb.lower.lo_dword.hdr_info) & 5529 E1000_RXDADV_HDRBUFLEN_MASK) >> E1000_RXDADV_HDRBUFLEN_SHIFT; 5530 if (hlen > rx_ring->rx_buffer_len) 5531 hlen = rx_ring->rx_buffer_len; 5532 return hlen; 5533} 5534 5535static bool igb_clean_rx_irq_adv(struct igb_q_vector *q_vector, 5536 int *work_done, int budget) 5537{ 5538 struct igb_ring *rx_ring = q_vector->rx_ring; 5539 struct net_device *netdev = rx_ring->netdev; 5540 struct device *dev = rx_ring->dev; 5541 union e1000_adv_rx_desc *rx_desc , *next_rxd; 5542 struct igb_buffer *buffer_info , *next_buffer; 5543 struct sk_buff *skb; 5544 bool cleaned = false; 5545 int cleaned_count = 0; 5546 int current_node = numa_node_id(); 5547 unsigned int total_bytes = 0, total_packets = 0; 5548 unsigned int i; 5549 u32 staterr; 5550 u16 length; 5551 u16 vlan_tag; 5552 5553 i = rx_ring->next_to_clean; 5554 buffer_info = &rx_ring->buffer_info[i]; 5555 rx_desc = E1000_RX_DESC_ADV(*rx_ring, i); 5556 staterr = le32_to_cpu(rx_desc->wb.upper.status_error); 5557 5558 while (staterr & E1000_RXD_STAT_DD) { 5559 if (*work_done >= budget) 5560 break; 5561 (*work_done)++; 5562 rmb(); /* read descriptor and rx_buffer_info after status DD */ 5563 5564 skb = buffer_info->skb; 5565 prefetch(skb->data - NET_IP_ALIGN); 5566 buffer_info->skb = NULL; 5567 5568 i++; 5569 if (i == rx_ring->count) 5570 i = 0; 5571 5572 next_rxd = E1000_RX_DESC_ADV(*rx_ring, i); 5573 prefetch(next_rxd); 5574 next_buffer = &rx_ring->buffer_info[i]; 5575 5576 length = le16_to_cpu(rx_desc->wb.upper.length); 5577 cleaned = true; 5578 cleaned_count++; 5579 5580 if (buffer_info->dma) { 5581 dma_unmap_single(dev, buffer_info->dma, 5582 rx_ring->rx_buffer_len, 5583 DMA_FROM_DEVICE); 5584 buffer_info->dma = 0; 5585 if (rx_ring->rx_buffer_len >= IGB_RXBUFFER_1024) { 5586 skb_put(skb, length); 5587 goto send_up; 5588 } 5589 skb_put(skb, igb_get_hlen(rx_ring, rx_desc)); 5590 } 5591 5592 if (length) { 5593 dma_unmap_page(dev, buffer_info->page_dma, 5594 PAGE_SIZE / 2, DMA_FROM_DEVICE); 5595 buffer_info->page_dma = 0; 5596 5597 skb_fill_page_desc(skb, skb_shinfo(skb)->nr_frags, 5598 buffer_info->page, 5599 buffer_info->page_offset, 5600 length); 5601 5602 if ((page_count(buffer_info->page) != 1) || 5603 (page_to_nid(buffer_info->page) != current_node)) 5604 buffer_info->page = NULL; 5605 else 5606 get_page(buffer_info->page); 5607 5608 skb->len += length; 5609 skb->data_len += length; 5610 skb->truesize += length; 5611 } 5612 5613 if (!(staterr & E1000_RXD_STAT_EOP)) { 5614 buffer_info->skb = next_buffer->skb; 5615 buffer_info->dma = next_buffer->dma; 5616 next_buffer->skb = skb; 5617 next_buffer->dma = 0; 5618 goto next_desc; 5619 } 5620send_up: 5621 if (staterr & E1000_RXDEXT_ERR_FRAME_ERR_MASK) { 5622 dev_kfree_skb_irq(skb); 5623 goto next_desc; 5624 } 5625 5626 if (staterr & (E1000_RXDADV_STAT_TSIP | E1000_RXDADV_STAT_TS)) 5627 igb_rx_hwtstamp(q_vector, staterr, skb); 5628 total_bytes += skb->len; 5629 total_packets++; 5630 5631 igb_rx_checksum_adv(rx_ring, staterr, skb); 5632 5633 skb->protocol = eth_type_trans(skb, netdev); 5634 skb_record_rx_queue(skb, rx_ring->queue_index); 5635 5636 vlan_tag = ((staterr & E1000_RXD_STAT_VP) ? 5637 le16_to_cpu(rx_desc->wb.upper.vlan) : 0); 5638 5639 igb_receive_skb(q_vector, skb, vlan_tag); 5640 5641next_desc: 5642 rx_desc->wb.upper.status_error = 0; 5643 5644 /* return some buffers to hardware, one at a time is too slow */ 5645 if (cleaned_count >= IGB_RX_BUFFER_WRITE) { 5646 igb_alloc_rx_buffers_adv(rx_ring, cleaned_count); 5647 cleaned_count = 0; 5648 } 5649 5650 /* use prefetched values */ 5651 rx_desc = next_rxd; 5652 buffer_info = next_buffer; 5653 staterr = le32_to_cpu(rx_desc->wb.upper.status_error); 5654 } 5655 5656 rx_ring->next_to_clean = i; 5657 cleaned_count = igb_desc_unused(rx_ring); 5658 5659 if (cleaned_count) 5660 igb_alloc_rx_buffers_adv(rx_ring, cleaned_count); 5661 5662 rx_ring->total_packets += total_packets; 5663 rx_ring->total_bytes += total_bytes; 5664 rx_ring->rx_stats.packets += total_packets; 5665 rx_ring->rx_stats.bytes += total_bytes; 5666 return cleaned; 5667} 5668 5669/** 5670 * igb_alloc_rx_buffers_adv - Replace used receive buffers; packet split 5671 * @adapter: address of board private structure 5672 **/ 5673void igb_alloc_rx_buffers_adv(struct igb_ring *rx_ring, int cleaned_count) 5674{ 5675 struct net_device *netdev = rx_ring->netdev; 5676 union e1000_adv_rx_desc *rx_desc; 5677 struct igb_buffer *buffer_info; 5678 struct sk_buff *skb; 5679 unsigned int i; 5680 int bufsz; 5681 5682 i = rx_ring->next_to_use; 5683 buffer_info = &rx_ring->buffer_info[i]; 5684 5685 bufsz = rx_ring->rx_buffer_len; 5686 5687 while (cleaned_count--) { 5688 rx_desc = E1000_RX_DESC_ADV(*rx_ring, i); 5689 5690 if ((bufsz < IGB_RXBUFFER_1024) && !buffer_info->page_dma) { 5691 if (!buffer_info->page) { 5692 buffer_info->page = netdev_alloc_page(netdev); 5693 if (!buffer_info->page) { 5694 rx_ring->rx_stats.alloc_failed++; 5695 goto no_buffers; 5696 } 5697 buffer_info->page_offset = 0; 5698 } else { 5699 buffer_info->page_offset ^= PAGE_SIZE / 2; 5700 } 5701 buffer_info->page_dma = 5702 dma_map_page(rx_ring->dev, buffer_info->page, 5703 buffer_info->page_offset, 5704 PAGE_SIZE / 2, 5705 DMA_FROM_DEVICE); 5706 if (dma_mapping_error(rx_ring->dev, 5707 buffer_info->page_dma)) { 5708 buffer_info->page_dma = 0; 5709 rx_ring->rx_stats.alloc_failed++; 5710 goto no_buffers; 5711 } 5712 } 5713 5714 skb = buffer_info->skb; 5715 if (!skb) { 5716 skb = netdev_alloc_skb_ip_align(netdev, bufsz); 5717 if (!skb) { 5718 rx_ring->rx_stats.alloc_failed++; 5719 goto no_buffers; 5720 } 5721 5722 buffer_info->skb = skb; 5723 } 5724 if (!buffer_info->dma) { 5725 buffer_info->dma = dma_map_single(rx_ring->dev, 5726 skb->data, 5727 bufsz, 5728 DMA_FROM_DEVICE); 5729 if (dma_mapping_error(rx_ring->dev, 5730 buffer_info->dma)) { 5731 buffer_info->dma = 0; 5732 rx_ring->rx_stats.alloc_failed++; 5733 goto no_buffers; 5734 } 5735 } 5736 /* Refresh the desc even if buffer_addrs didn't change because 5737 * each write-back erases this info. */ 5738 if (bufsz < IGB_RXBUFFER_1024) { 5739 rx_desc->read.pkt_addr = 5740 cpu_to_le64(buffer_info->page_dma); 5741 rx_desc->read.hdr_addr = cpu_to_le64(buffer_info->dma); 5742 } else { 5743 rx_desc->read.pkt_addr = cpu_to_le64(buffer_info->dma); 5744 rx_desc->read.hdr_addr = 0; 5745 } 5746 5747 i++; 5748 if (i == rx_ring->count) 5749 i = 0; 5750 buffer_info = &rx_ring->buffer_info[i]; 5751 } 5752 5753no_buffers: 5754 if (rx_ring->next_to_use != i) { 5755 rx_ring->next_to_use = i; 5756 if (i == 0) 5757 i = (rx_ring->count - 1); 5758 else 5759 i--; 5760 5761 /* Force memory writes to complete before letting h/w 5762 * know there are new descriptors to fetch. (Only 5763 * applicable for weak-ordered memory model archs, 5764 * such as IA-64). */ 5765 wmb(); 5766 writel(i, rx_ring->tail); 5767 } 5768} 5769 5770/** 5771 * igb_mii_ioctl - 5772 * @netdev: 5773 * @ifreq: 5774 * @cmd: 5775 **/ 5776static int igb_mii_ioctl(struct net_device *netdev, struct ifreq *ifr, int cmd) 5777{ 5778 struct igb_adapter *adapter = netdev_priv(netdev); 5779 struct mii_ioctl_data *data = if_mii(ifr); 5780 5781 if (adapter->hw.phy.media_type != e1000_media_type_copper) 5782 return -EOPNOTSUPP; 5783 5784 switch (cmd) { 5785 case SIOCGMIIPHY: 5786 data->phy_id = adapter->hw.phy.addr; 5787 break; 5788 case SIOCGMIIREG: 5789 if (igb_read_phy_reg(&adapter->hw, data->reg_num & 0x1F, 5790 &data->val_out)) 5791 return -EIO; 5792 break; 5793 case SIOCSMIIREG: 5794 default: 5795 return -EOPNOTSUPP; 5796 } 5797 return 0; 5798} 5799 5800/** 5801 * igb_hwtstamp_ioctl - control hardware time stamping 5802 * @netdev: 5803 * @ifreq: 5804 * @cmd: 5805 * 5806 * Outgoing time stamping can be enabled and disabled. Play nice and 5807 * disable it when requested, although it shouldn't case any overhead 5808 * when no packet needs it. At most one packet in the queue may be 5809 * marked for time stamping, otherwise it would be impossible to tell 5810 * for sure to which packet the hardware time stamp belongs. 5811 * 5812 * Incoming time stamping has to be configured via the hardware 5813 * filters. Not all combinations are supported, in particular event 5814 * type has to be specified. Matching the kind of event packet is 5815 * not supported, with the exception of "all V2 events regardless of 5816 * level 2 or 4". 5817 * 5818 **/ 5819static int igb_hwtstamp_ioctl(struct net_device *netdev, 5820 struct ifreq *ifr, int cmd) 5821{ 5822 struct igb_adapter *adapter = netdev_priv(netdev); 5823 struct e1000_hw *hw = &adapter->hw; 5824 struct hwtstamp_config config; 5825 u32 tsync_tx_ctl = E1000_TSYNCTXCTL_ENABLED; 5826 u32 tsync_rx_ctl = E1000_TSYNCRXCTL_ENABLED; 5827 u32 tsync_rx_cfg = 0; 5828 bool is_l4 = false; 5829 bool is_l2 = false; 5830 u32 regval; 5831 5832 if (copy_from_user(&config, ifr->ifr_data, sizeof(config))) 5833 return -EFAULT; 5834 5835 /* reserved for future extensions */ 5836 if (config.flags) 5837 return -EINVAL; 5838 5839 switch (config.tx_type) { 5840 case HWTSTAMP_TX_OFF: 5841 tsync_tx_ctl = 0; 5842 case HWTSTAMP_TX_ON: 5843 break; 5844 default: 5845 return -ERANGE; 5846 } 5847 5848 switch (config.rx_filter) { 5849 case HWTSTAMP_FILTER_NONE: 5850 tsync_rx_ctl = 0; 5851 break; 5852 case HWTSTAMP_FILTER_PTP_V1_L4_EVENT: 5853 case HWTSTAMP_FILTER_PTP_V2_L4_EVENT: 5854 case HWTSTAMP_FILTER_PTP_V2_L2_EVENT: 5855 case HWTSTAMP_FILTER_ALL: 5856 /* 5857 * register TSYNCRXCFG must be set, therefore it is not 5858 * possible to time stamp both Sync and Delay_Req messages 5859 * => fall back to time stamping all packets 5860 */ 5861 tsync_rx_ctl |= E1000_TSYNCRXCTL_TYPE_ALL; 5862 config.rx_filter = HWTSTAMP_FILTER_ALL; 5863 break; 5864 case HWTSTAMP_FILTER_PTP_V1_L4_SYNC: 5865 tsync_rx_ctl |= E1000_TSYNCRXCTL_TYPE_L4_V1; 5866 tsync_rx_cfg = E1000_TSYNCRXCFG_PTP_V1_SYNC_MESSAGE; 5867 is_l4 = true; 5868 break; 5869 case HWTSTAMP_FILTER_PTP_V1_L4_DELAY_REQ: 5870 tsync_rx_ctl |= E1000_TSYNCRXCTL_TYPE_L4_V1; 5871 tsync_rx_cfg = E1000_TSYNCRXCFG_PTP_V1_DELAY_REQ_MESSAGE; 5872 is_l4 = true; 5873 break; 5874 case HWTSTAMP_FILTER_PTP_V2_L2_SYNC: 5875 case HWTSTAMP_FILTER_PTP_V2_L4_SYNC: 5876 tsync_rx_ctl |= E1000_TSYNCRXCTL_TYPE_L2_L4_V2; 5877 tsync_rx_cfg = E1000_TSYNCRXCFG_PTP_V2_SYNC_MESSAGE; 5878 is_l2 = true; 5879 is_l4 = true; 5880 config.rx_filter = HWTSTAMP_FILTER_SOME; 5881 break; 5882 case HWTSTAMP_FILTER_PTP_V2_L2_DELAY_REQ: 5883 case HWTSTAMP_FILTER_PTP_V2_L4_DELAY_REQ: 5884 tsync_rx_ctl |= E1000_TSYNCRXCTL_TYPE_L2_L4_V2; 5885 tsync_rx_cfg = E1000_TSYNCRXCFG_PTP_V2_DELAY_REQ_MESSAGE; 5886 is_l2 = true; 5887 is_l4 = true; 5888 config.rx_filter = HWTSTAMP_FILTER_SOME; 5889 break; 5890 case HWTSTAMP_FILTER_PTP_V2_EVENT: 5891 case HWTSTAMP_FILTER_PTP_V2_SYNC: 5892 case HWTSTAMP_FILTER_PTP_V2_DELAY_REQ: 5893 tsync_rx_ctl |= E1000_TSYNCRXCTL_TYPE_EVENT_V2; 5894 config.rx_filter = HWTSTAMP_FILTER_PTP_V2_EVENT; 5895 is_l2 = true; 5896 break; 5897 default: 5898 return -ERANGE; 5899 } 5900 5901 if (hw->mac.type == e1000_82575) { 5902 if (tsync_rx_ctl | tsync_tx_ctl) 5903 return -EINVAL; 5904 return 0; 5905 } 5906 5907 /* 5908 * Per-packet timestamping only works if all packets are 5909 * timestamped, so enable timestamping in all packets as 5910 * long as one rx filter was configured. 5911 */ 5912 if ((hw->mac.type == e1000_82580) && tsync_rx_ctl) { 5913 tsync_rx_ctl = E1000_TSYNCRXCTL_ENABLED; 5914 tsync_rx_ctl |= E1000_TSYNCRXCTL_TYPE_ALL; 5915 } 5916 5917 /* enable/disable TX */ 5918 regval = rd32(E1000_TSYNCTXCTL); 5919 regval &= ~E1000_TSYNCTXCTL_ENABLED; 5920 regval |= tsync_tx_ctl; 5921 wr32(E1000_TSYNCTXCTL, regval); 5922 5923 /* enable/disable RX */ 5924 regval = rd32(E1000_TSYNCRXCTL); 5925 regval &= ~(E1000_TSYNCRXCTL_ENABLED | E1000_TSYNCRXCTL_TYPE_MASK); 5926 regval |= tsync_rx_ctl; 5927 wr32(E1000_TSYNCRXCTL, regval); 5928 5929 /* define which PTP packets are time stamped */ 5930 wr32(E1000_TSYNCRXCFG, tsync_rx_cfg); 5931 5932 /* define ethertype filter for timestamped packets */ 5933 if (is_l2) 5934 wr32(E1000_ETQF(3), 5935 (E1000_ETQF_FILTER_ENABLE | /* enable filter */ 5936 E1000_ETQF_1588 | /* enable timestamping */ 5937 ETH_P_1588)); /* 1588 eth protocol type */ 5938 else 5939 wr32(E1000_ETQF(3), 0); 5940 5941#define PTP_PORT 319 5942 /* L4 Queue Filter[3]: filter by destination port and protocol */ 5943 if (is_l4) { 5944 u32 ftqf = (IPPROTO_UDP /* UDP */ 5945 | E1000_FTQF_VF_BP /* VF not compared */ 5946 | E1000_FTQF_1588_TIME_STAMP /* Enable Timestamping */ 5947 | E1000_FTQF_MASK); /* mask all inputs */ 5948 ftqf &= ~E1000_FTQF_MASK_PROTO_BP; /* enable protocol check */ 5949 5950 wr32(E1000_IMIR(3), htons(PTP_PORT)); 5951 wr32(E1000_IMIREXT(3), 5952 (E1000_IMIREXT_SIZE_BP | E1000_IMIREXT_CTRL_BP)); 5953 if (hw->mac.type == e1000_82576) { 5954 /* enable source port check */ 5955 wr32(E1000_SPQF(3), htons(PTP_PORT)); 5956 ftqf &= ~E1000_FTQF_MASK_SOURCE_PORT_BP; 5957 } 5958 wr32(E1000_FTQF(3), ftqf); 5959 } else { 5960 wr32(E1000_FTQF(3), E1000_FTQF_MASK); 5961 } 5962 wrfl(); 5963 5964 adapter->hwtstamp_config = config; 5965 5966 /* clear TX/RX time stamp registers, just to be sure */ 5967 regval = rd32(E1000_TXSTMPH); 5968 regval = rd32(E1000_RXSTMPH); 5969 5970 return copy_to_user(ifr->ifr_data, &config, sizeof(config)) ? 5971 -EFAULT : 0; 5972} 5973 5974/** 5975 * igb_ioctl - 5976 * @netdev: 5977 * @ifreq: 5978 * @cmd: 5979 **/ 5980static int igb_ioctl(struct net_device *netdev, struct ifreq *ifr, int cmd) 5981{ 5982 switch (cmd) { 5983 case SIOCGMIIPHY: 5984 case SIOCGMIIREG: 5985 case SIOCSMIIREG: 5986 return igb_mii_ioctl(netdev, ifr, cmd); 5987 case SIOCSHWTSTAMP: 5988 return igb_hwtstamp_ioctl(netdev, ifr, cmd); 5989 default: 5990 return -EOPNOTSUPP; 5991 } 5992} 5993 5994s32 igb_read_pcie_cap_reg(struct e1000_hw *hw, u32 reg, u16 *value) 5995{ 5996 struct igb_adapter *adapter = hw->back; 5997 u16 cap_offset; 5998 5999 cap_offset = pci_find_capability(adapter->pdev, PCI_CAP_ID_EXP); 6000 if (!cap_offset) 6001 return -E1000_ERR_CONFIG; 6002 6003 pci_read_config_word(adapter->pdev, cap_offset + reg, value); 6004 6005 return 0; 6006} 6007 6008s32 igb_write_pcie_cap_reg(struct e1000_hw *hw, u32 reg, u16 *value) 6009{ 6010 struct igb_adapter *adapter = hw->back; 6011 u16 cap_offset; 6012 6013 cap_offset = pci_find_capability(adapter->pdev, PCI_CAP_ID_EXP); 6014 if (!cap_offset) 6015 return -E1000_ERR_CONFIG; 6016 6017 pci_write_config_word(adapter->pdev, cap_offset + reg, *value); 6018 6019 return 0; 6020} 6021 6022static void igb_vlan_rx_register(struct net_device *netdev, 6023 struct vlan_group *grp) 6024{ 6025 struct igb_adapter *adapter = netdev_priv(netdev); 6026 struct e1000_hw *hw = &adapter->hw; 6027 u32 ctrl, rctl; 6028 6029 igb_irq_disable(adapter); 6030 adapter->vlgrp = grp; 6031 6032 if (grp) { 6033 /* enable VLAN tag insert/strip */ 6034 ctrl = rd32(E1000_CTRL); 6035 ctrl |= E1000_CTRL_VME; 6036 wr32(E1000_CTRL, ctrl); 6037 6038 /* Disable CFI check */ 6039 rctl = rd32(E1000_RCTL); 6040 rctl &= ~E1000_RCTL_CFIEN; 6041 wr32(E1000_RCTL, rctl); 6042 } else { 6043 /* disable VLAN tag insert/strip */ 6044 ctrl = rd32(E1000_CTRL); 6045 ctrl &= ~E1000_CTRL_VME; 6046 wr32(E1000_CTRL, ctrl); 6047 } 6048 6049 igb_rlpml_set(adapter); 6050 6051 if (!test_bit(__IGB_DOWN, &adapter->state)) 6052 igb_irq_enable(adapter); 6053} 6054 6055static void igb_vlan_rx_add_vid(struct net_device *netdev, u16 vid) 6056{ 6057 struct igb_adapter *adapter = netdev_priv(netdev); 6058 struct e1000_hw *hw = &adapter->hw; 6059 int pf_id = adapter->vfs_allocated_count; 6060 6061 /* attempt to add filter to vlvf array */ 6062 igb_vlvf_set(adapter, vid, true, pf_id); 6063 6064 /* add the filter since PF can receive vlans w/o entry in vlvf */ 6065 igb_vfta_set(hw, vid, true); 6066} 6067 6068static void igb_vlan_rx_kill_vid(struct net_device *netdev, u16 vid) 6069{ 6070 struct igb_adapter *adapter = netdev_priv(netdev); 6071 struct e1000_hw *hw = &adapter->hw; 6072 int pf_id = adapter->vfs_allocated_count; 6073 s32 err; 6074 6075 igb_irq_disable(adapter); 6076 vlan_group_set_device(adapter->vlgrp, vid, NULL); 6077 6078 if (!test_bit(__IGB_DOWN, &adapter->state)) 6079 igb_irq_enable(adapter); 6080 6081 /* remove vlan from VLVF table array */ 6082 err = igb_vlvf_set(adapter, vid, false, pf_id); 6083 6084 /* if vid was not present in VLVF just remove it from table */ 6085 if (err) 6086 igb_vfta_set(hw, vid, false); 6087} 6088 6089static void igb_restore_vlan(struct igb_adapter *adapter) 6090{ 6091 igb_vlan_rx_register(adapter->netdev, adapter->vlgrp); 6092 6093 if (adapter->vlgrp) { 6094 u16 vid; 6095 for (vid = 0; vid < VLAN_GROUP_ARRAY_LEN; vid++) { 6096 if (!vlan_group_get_device(adapter->vlgrp, vid)) 6097 continue; 6098 igb_vlan_rx_add_vid(adapter->netdev, vid); 6099 } 6100 } 6101} 6102 6103int igb_set_spd_dplx(struct igb_adapter *adapter, u16 spddplx) 6104{ 6105 struct pci_dev *pdev = adapter->pdev; 6106 struct e1000_mac_info *mac = &adapter->hw.mac; 6107 6108 mac->autoneg = 0; 6109 6110 switch (spddplx) { 6111 case SPEED_10 + DUPLEX_HALF: 6112 mac->forced_speed_duplex = ADVERTISE_10_HALF; 6113 break; 6114 case SPEED_10 + DUPLEX_FULL: 6115 mac->forced_speed_duplex = ADVERTISE_10_FULL; 6116 break; 6117 case SPEED_100 + DUPLEX_HALF: 6118 mac->forced_speed_duplex = ADVERTISE_100_HALF; 6119 break; 6120 case SPEED_100 + DUPLEX_FULL: 6121 mac->forced_speed_duplex = ADVERTISE_100_FULL; 6122 break; 6123 case SPEED_1000 + DUPLEX_FULL: 6124 mac->autoneg = 1; 6125 adapter->hw.phy.autoneg_advertised = ADVERTISE_1000_FULL; 6126 break; 6127 case SPEED_1000 + DUPLEX_HALF: /* not supported */ 6128 default: 6129 dev_err(&pdev->dev, "Unsupported Speed/Duplex configuration\n"); 6130 return -EINVAL; 6131 } 6132 return 0; 6133} 6134 6135static int __igb_shutdown(struct pci_dev *pdev, bool *enable_wake) 6136{ 6137 struct net_device *netdev = pci_get_drvdata(pdev); 6138 struct igb_adapter *adapter = netdev_priv(netdev); 6139 struct e1000_hw *hw = &adapter->hw; 6140 u32 ctrl, rctl, status; 6141 u32 wufc = adapter->wol; 6142#ifdef CONFIG_PM 6143 int retval = 0; 6144#endif 6145 6146 netif_device_detach(netdev); 6147 6148 if (netif_running(netdev)) 6149 igb_close(netdev); 6150 6151 igb_clear_interrupt_scheme(adapter); 6152 6153#ifdef CONFIG_PM 6154 retval = pci_save_state(pdev); 6155 if (retval) 6156 return retval; 6157#endif 6158 6159 status = rd32(E1000_STATUS); 6160 if (status & E1000_STATUS_LU) 6161 wufc &= ~E1000_WUFC_LNKC; 6162 6163 if (wufc) { 6164 igb_setup_rctl(adapter); 6165 igb_set_rx_mode(netdev); 6166 6167 /* turn on all-multi mode if wake on multicast is enabled */ 6168 if (wufc & E1000_WUFC_MC) { 6169 rctl = rd32(E1000_RCTL); 6170 rctl |= E1000_RCTL_MPE; 6171 wr32(E1000_RCTL, rctl); 6172 } 6173 6174 ctrl = rd32(E1000_CTRL); 6175 /* advertise wake from D3Cold */ 6176 #define E1000_CTRL_ADVD3WUC 0x00100000 6177 /* phy power management enable */ 6178 #define E1000_CTRL_EN_PHY_PWR_MGMT 0x00200000 6179 ctrl |= E1000_CTRL_ADVD3WUC; 6180 wr32(E1000_CTRL, ctrl); 6181 6182 /* Allow time for pending master requests to run */ 6183 igb_disable_pcie_master(hw); 6184 6185 wr32(E1000_WUC, E1000_WUC_PME_EN); 6186 wr32(E1000_WUFC, wufc); 6187 } else { 6188 wr32(E1000_WUC, 0); 6189 wr32(E1000_WUFC, 0); 6190 } 6191 6192 *enable_wake = wufc || adapter->en_mng_pt; 6193 if (!*enable_wake) 6194 igb_power_down_link(adapter); 6195 else 6196 igb_power_up_link(adapter); 6197 6198 /* Release control of h/w to f/w. If f/w is AMT enabled, this 6199 * would have already happened in close and is redundant. */ 6200 igb_release_hw_control(adapter); 6201 6202 pci_disable_device(pdev); 6203 6204 return 0; 6205} 6206 6207#ifdef CONFIG_PM 6208static int igb_suspend(struct pci_dev *pdev, pm_message_t state) 6209{ 6210 int retval; 6211 bool wake; 6212 6213 retval = __igb_shutdown(pdev, &wake); 6214 if (retval) 6215 return retval; 6216 6217 if (wake) { 6218 pci_prepare_to_sleep(pdev); 6219 } else { 6220 pci_wake_from_d3(pdev, false); 6221 pci_set_power_state(pdev, PCI_D3hot); 6222 } 6223 6224 return 0; 6225} 6226 6227static int igb_resume(struct pci_dev *pdev) 6228{ 6229 struct net_device *netdev = pci_get_drvdata(pdev); 6230 struct igb_adapter *adapter = netdev_priv(netdev); 6231 struct e1000_hw *hw = &adapter->hw; 6232 u32 err; 6233 6234 pci_set_power_state(pdev, PCI_D0); 6235 pci_restore_state(pdev); 6236 pci_save_state(pdev); 6237 6238 err = pci_enable_device_mem(pdev); 6239 if (err) { 6240 dev_err(&pdev->dev, 6241 "igb: Cannot enable PCI device from suspend\n"); 6242 return err; 6243 } 6244 pci_set_master(pdev); 6245 6246 pci_enable_wake(pdev, PCI_D3hot, 0); 6247 pci_enable_wake(pdev, PCI_D3cold, 0); 6248 6249 if (igb_init_interrupt_scheme(adapter)) { 6250 dev_err(&pdev->dev, "Unable to allocate memory for queues\n"); 6251 return -ENOMEM; 6252 } 6253 6254 igb_reset(adapter); 6255 6256 /* let the f/w know that the h/w is now under the control of the 6257 * driver. */ 6258 igb_get_hw_control(adapter); 6259 6260 wr32(E1000_WUS, ~0); 6261 6262 if (netif_running(netdev)) { 6263 err = igb_open(netdev); 6264 if (err) 6265 return err; 6266 } 6267 6268 netif_device_attach(netdev); 6269 6270 return 0; 6271} 6272#endif 6273 6274static void igb_shutdown(struct pci_dev *pdev) 6275{ 6276 bool wake; 6277 6278 __igb_shutdown(pdev, &wake); 6279 6280 if (system_state == SYSTEM_POWER_OFF) { 6281 pci_wake_from_d3(pdev, wake); 6282 pci_set_power_state(pdev, PCI_D3hot); 6283 } 6284} 6285 6286#ifdef CONFIG_NET_POLL_CONTROLLER 6287/* 6288 * Polling 'interrupt' - used by things like netconsole to send skbs 6289 * without having to re-enable interrupts. It's not called while 6290 * the interrupt routine is executing. 6291 */ 6292static void igb_netpoll(struct net_device *netdev) 6293{ 6294 struct igb_adapter *adapter = netdev_priv(netdev); 6295 struct e1000_hw *hw = &adapter->hw; 6296 int i; 6297 6298 if (!adapter->msix_entries) { 6299 struct igb_q_vector *q_vector = adapter->q_vector[0]; 6300 igb_irq_disable(adapter); 6301 napi_schedule(&q_vector->napi); 6302 return; 6303 } 6304 6305 for (i = 0; i < adapter->num_q_vectors; i++) { 6306 struct igb_q_vector *q_vector = adapter->q_vector[i]; 6307 wr32(E1000_EIMC, q_vector->eims_value); 6308 napi_schedule(&q_vector->napi); 6309 } 6310} 6311#endif /* CONFIG_NET_POLL_CONTROLLER */ 6312 6313/** 6314 * igb_io_error_detected - called when PCI error is detected 6315 * @pdev: Pointer to PCI device 6316 * @state: The current pci connection state 6317 * 6318 * This function is called after a PCI bus error affecting 6319 * this device has been detected. 6320 */ 6321static pci_ers_result_t igb_io_error_detected(struct pci_dev *pdev, 6322 pci_channel_state_t state) 6323{ 6324 struct net_device *netdev = pci_get_drvdata(pdev); 6325 struct igb_adapter *adapter = netdev_priv(netdev); 6326 6327 netif_device_detach(netdev); 6328 6329 if (state == pci_channel_io_perm_failure) 6330 return PCI_ERS_RESULT_DISCONNECT; 6331 6332 if (netif_running(netdev)) 6333 igb_down(adapter); 6334 pci_disable_device(pdev); 6335 6336 /* Request a slot slot reset. */ 6337 return PCI_ERS_RESULT_NEED_RESET; 6338} 6339 6340/** 6341 * igb_io_slot_reset - called after the pci bus has been reset. 6342 * @pdev: Pointer to PCI device 6343 * 6344 * Restart the card from scratch, as if from a cold-boot. Implementation 6345 * resembles the first-half of the igb_resume routine. 6346 */ 6347static pci_ers_result_t igb_io_slot_reset(struct pci_dev *pdev) 6348{ 6349 struct net_device *netdev = pci_get_drvdata(pdev); 6350 struct igb_adapter *adapter = netdev_priv(netdev); 6351 struct e1000_hw *hw = &adapter->hw; 6352 pci_ers_result_t result; 6353 int err; 6354 6355 if (pci_enable_device_mem(pdev)) { 6356 dev_err(&pdev->dev, 6357 "Cannot re-enable PCI device after reset.\n"); 6358 result = PCI_ERS_RESULT_DISCONNECT; 6359 } else { 6360 pci_set_master(pdev); 6361 pci_restore_state(pdev); 6362 pci_save_state(pdev); 6363 6364 pci_enable_wake(pdev, PCI_D3hot, 0); 6365 pci_enable_wake(pdev, PCI_D3cold, 0); 6366 6367 igb_reset(adapter); 6368 wr32(E1000_WUS, ~0); 6369 result = PCI_ERS_RESULT_RECOVERED; 6370 } 6371 6372 err = pci_cleanup_aer_uncorrect_error_status(pdev); 6373 if (err) { 6374 dev_err(&pdev->dev, "pci_cleanup_aer_uncorrect_error_status " 6375 "failed 0x%0x\n", err); 6376 /* non-fatal, continue */ 6377 } 6378 6379 return result; 6380} 6381 6382/** 6383 * igb_io_resume - called when traffic can start flowing again. 6384 * @pdev: Pointer to PCI device 6385 * 6386 * This callback is called when the error recovery driver tells us that 6387 * its OK to resume normal operation. Implementation resembles the 6388 * second-half of the igb_resume routine. 6389 */ 6390static void igb_io_resume(struct pci_dev *pdev) 6391{ 6392 struct net_device *netdev = pci_get_drvdata(pdev); 6393 struct igb_adapter *adapter = netdev_priv(netdev); 6394 6395 if (netif_running(netdev)) { 6396 if (igb_up(adapter)) { 6397 dev_err(&pdev->dev, "igb_up failed after reset\n"); 6398 return; 6399 } 6400 } 6401 6402 netif_device_attach(netdev); 6403 6404 /* let the f/w know that the h/w is now under the control of the 6405 * driver. */ 6406 igb_get_hw_control(adapter); 6407} 6408 6409static void igb_rar_set_qsel(struct igb_adapter *adapter, u8 *addr, u32 index, 6410 u8 qsel) 6411{ 6412 u32 rar_low, rar_high; 6413 struct e1000_hw *hw = &adapter->hw; 6414 6415 /* HW expects these in little endian so we reverse the byte order 6416 * from network order (big endian) to little endian 6417 */ 6418 rar_low = ((u32) addr[0] | ((u32) addr[1] << 8) | 6419 ((u32) addr[2] << 16) | ((u32) addr[3] << 24)); 6420 rar_high = ((u32) addr[4] | ((u32) addr[5] << 8)); 6421 6422 /* Indicate to hardware the Address is Valid. */ 6423 rar_high |= E1000_RAH_AV; 6424 6425 if (hw->mac.type == e1000_82575) 6426 rar_high |= E1000_RAH_POOL_1 * qsel; 6427 else 6428 rar_high |= E1000_RAH_POOL_1 << qsel; 6429 6430 wr32(E1000_RAL(index), rar_low); 6431 wrfl(); 6432 wr32(E1000_RAH(index), rar_high); 6433 wrfl(); 6434} 6435 6436static int igb_set_vf_mac(struct igb_adapter *adapter, 6437 int vf, unsigned char *mac_addr) 6438{ 6439 struct e1000_hw *hw = &adapter->hw; 6440 /* VF MAC addresses start at end of receive addresses and moves 6441 * torwards the first, as a result a collision should not be possible */ 6442 int rar_entry = hw->mac.rar_entry_count - (vf + 1); 6443 6444 memcpy(adapter->vf_data[vf].vf_mac_addresses, mac_addr, ETH_ALEN); 6445 6446 igb_rar_set_qsel(adapter, mac_addr, rar_entry, vf); 6447 6448 return 0; 6449} 6450 6451static int igb_ndo_set_vf_mac(struct net_device *netdev, int vf, u8 *mac) 6452{ 6453 struct igb_adapter *adapter = netdev_priv(netdev); 6454 if (!is_valid_ether_addr(mac) || (vf >= adapter->vfs_allocated_count)) 6455 return -EINVAL; 6456 adapter->vf_data[vf].flags |= IGB_VF_FLAG_PF_SET_MAC; 6457 dev_info(&adapter->pdev->dev, "setting MAC %pM on VF %d\n", mac, vf); 6458 dev_info(&adapter->pdev->dev, "Reload the VF driver to make this" 6459 " change effective."); 6460 if (test_bit(__IGB_DOWN, &adapter->state)) { 6461 dev_warn(&adapter->pdev->dev, "The VF MAC address has been set," 6462 " but the PF device is not up.\n"); 6463 dev_warn(&adapter->pdev->dev, "Bring the PF device up before" 6464 " attempting to use the VF device.\n"); 6465 } 6466 return igb_set_vf_mac(adapter, vf, mac); 6467} 6468 6469static int igb_ndo_set_vf_bw(struct net_device *netdev, int vf, int tx_rate) 6470{ 6471 return -EOPNOTSUPP; 6472} 6473 6474static int igb_ndo_get_vf_config(struct net_device *netdev, 6475 int vf, struct ifla_vf_info *ivi) 6476{ 6477 struct igb_adapter *adapter = netdev_priv(netdev); 6478 if (vf >= adapter->vfs_allocated_count) 6479 return -EINVAL; 6480 ivi->vf = vf; 6481 memcpy(&ivi->mac, adapter->vf_data[vf].vf_mac_addresses, ETH_ALEN); 6482 ivi->tx_rate = 0; 6483 ivi->vlan = adapter->vf_data[vf].pf_vlan; 6484 ivi->qos = adapter->vf_data[vf].pf_qos; 6485 return 0; 6486} 6487 6488static void igb_vmm_control(struct igb_adapter *adapter) 6489{ 6490 struct e1000_hw *hw = &adapter->hw; 6491 u32 reg; 6492 6493 switch (hw->mac.type) { 6494 case e1000_82575: 6495 default: 6496 /* replication is not supported for 82575 */ 6497 return; 6498 case e1000_82576: 6499 /* notify HW that the MAC is adding vlan tags */ 6500 reg = rd32(E1000_DTXCTL); 6501 reg |= E1000_DTXCTL_VLAN_ADDED; 6502 wr32(E1000_DTXCTL, reg); 6503 case e1000_82580: 6504 /* enable replication vlan tag stripping */ 6505 reg = rd32(E1000_RPLOLR); 6506 reg |= E1000_RPLOLR_STRVLAN; 6507 wr32(E1000_RPLOLR, reg); 6508 case e1000_i350: 6509 /* none of the above registers are supported by i350 */ 6510 break; 6511 } 6512 6513 if (adapter->vfs_allocated_count) { 6514 igb_vmdq_set_loopback_pf(hw, true); 6515 igb_vmdq_set_replication_pf(hw, true); 6516 } else { 6517 igb_vmdq_set_loopback_pf(hw, false); 6518 igb_vmdq_set_replication_pf(hw, false); 6519 } 6520} 6521 6522/* igb_main.c */