/*******************************************************************************

  Intel PRO/1000 Linux driver
  Copyright(c) 1999 - 2006 Intel Corporation.

  This program is free software; you can redistribute it and/or modify it
  under the terms and conditions of the GNU General Public License,
  version 2, as published by the Free Software Foundation.

  This program is distributed in the hope it will be useful, but WITHOUT
  ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
  more details.

  You should have received a copy of the GNU General Public License along with
  this program; if not, write to the Free Software Foundation, Inc.,
  51 Franklin St - Fifth Floor, Boston, MA 02110-1301 USA.

  The full GNU General Public License is included in this distribution in
  the file called "COPYING".

  Contact Information:
  Linux NICS <linux.nics@intel.com>
  e1000-devel Mailing List <e1000-devel@lists.sourceforge.net>
  Intel Corporation, 5200 N.E. Elam Young Parkway, Hillsboro, OR 97124-6497

*******************************************************************************/

#include "e1000.h"
A
Andrew Morton 已提交
30
#include <net/ip6_checksum.h>
31
#include <linux/io.h>
32
#include <linux/prefetch.h>
J
Jiri Pirko 已提交
33 34
#include <linux/bitops.h>
#include <linux/if_vlan.h>
35

L
Linus Torvalds 已提交
36
#define DRV_VERSION "7.3.21-k8-NAPI"

/* Name handed to the PCI core through e1000_driver.name */
char e1000_driver_name[] = "e1000";

/* Version string, also exported through MODULE_VERSION() */
const char e1000_driver_version[] = DRV_VERSION;

/* Banner strings printed once when the module is loaded */
static char e1000_driver_string[] = "Intel(R) PRO/1000 Network Driver";
static const char e1000_copyright[] =
	"Copyright (c) 1999-2006 Intel Corporation.";
L
Linus Torvalds 已提交
41 42 43 44 45 46 47 48

/* e1000_pci_tbl - PCI Device ID Table
 *
 * Last entry must be all 0s
 *
 * Macro expands to...
 *   {PCI_DEVICE(PCI_VENDOR_ID_INTEL, device_id)}
 */
49
static const struct pci_device_id e1000_pci_tbl[] = {
L
Linus Torvalds 已提交
50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68
	INTEL_E1000_ETHERNET_DEVICE(0x1000),
	INTEL_E1000_ETHERNET_DEVICE(0x1001),
	INTEL_E1000_ETHERNET_DEVICE(0x1004),
	INTEL_E1000_ETHERNET_DEVICE(0x1008),
	INTEL_E1000_ETHERNET_DEVICE(0x1009),
	INTEL_E1000_ETHERNET_DEVICE(0x100C),
	INTEL_E1000_ETHERNET_DEVICE(0x100D),
	INTEL_E1000_ETHERNET_DEVICE(0x100E),
	INTEL_E1000_ETHERNET_DEVICE(0x100F),
	INTEL_E1000_ETHERNET_DEVICE(0x1010),
	INTEL_E1000_ETHERNET_DEVICE(0x1011),
	INTEL_E1000_ETHERNET_DEVICE(0x1012),
	INTEL_E1000_ETHERNET_DEVICE(0x1013),
	INTEL_E1000_ETHERNET_DEVICE(0x1014),
	INTEL_E1000_ETHERNET_DEVICE(0x1015),
	INTEL_E1000_ETHERNET_DEVICE(0x1016),
	INTEL_E1000_ETHERNET_DEVICE(0x1017),
	INTEL_E1000_ETHERNET_DEVICE(0x1018),
	INTEL_E1000_ETHERNET_DEVICE(0x1019),
69
	INTEL_E1000_ETHERNET_DEVICE(0x101A),
L
Linus Torvalds 已提交
70 71 72 73 74 75 76 77 78 79 80 81 82 83
	INTEL_E1000_ETHERNET_DEVICE(0x101D),
	INTEL_E1000_ETHERNET_DEVICE(0x101E),
	INTEL_E1000_ETHERNET_DEVICE(0x1026),
	INTEL_E1000_ETHERNET_DEVICE(0x1027),
	INTEL_E1000_ETHERNET_DEVICE(0x1028),
	INTEL_E1000_ETHERNET_DEVICE(0x1075),
	INTEL_E1000_ETHERNET_DEVICE(0x1076),
	INTEL_E1000_ETHERNET_DEVICE(0x1077),
	INTEL_E1000_ETHERNET_DEVICE(0x1078),
	INTEL_E1000_ETHERNET_DEVICE(0x1079),
	INTEL_E1000_ETHERNET_DEVICE(0x107A),
	INTEL_E1000_ETHERNET_DEVICE(0x107B),
	INTEL_E1000_ETHERNET_DEVICE(0x107C),
	INTEL_E1000_ETHERNET_DEVICE(0x108A),
84 85
	INTEL_E1000_ETHERNET_DEVICE(0x1099),
	INTEL_E1000_ETHERNET_DEVICE(0x10B5),
86
	INTEL_E1000_ETHERNET_DEVICE(0x2E6E),
L
Linus Torvalds 已提交
87 88 89 90 91 92
	/* required last entry */
	{0,}
};

MODULE_DEVICE_TABLE(pci, e1000_pci_tbl);

93 94 95 96 97 98 99 100
int e1000_up(struct e1000_adapter *adapter);
void e1000_down(struct e1000_adapter *adapter);
void e1000_reinit_locked(struct e1000_adapter *adapter);
void e1000_reset(struct e1000_adapter *adapter);
int e1000_setup_all_tx_resources(struct e1000_adapter *adapter);
int e1000_setup_all_rx_resources(struct e1000_adapter *adapter);
void e1000_free_all_tx_resources(struct e1000_adapter *adapter);
void e1000_free_all_rx_resources(struct e1000_adapter *adapter);
101
static int e1000_setup_tx_resources(struct e1000_adapter *adapter,
102
                             struct e1000_tx_ring *txdr);
103
static int e1000_setup_rx_resources(struct e1000_adapter *adapter,
104
                             struct e1000_rx_ring *rxdr);
105
static void e1000_free_tx_resources(struct e1000_adapter *adapter,
106
                             struct e1000_tx_ring *tx_ring);
107
static void e1000_free_rx_resources(struct e1000_adapter *adapter,
108 109
                             struct e1000_rx_ring *rx_ring);
void e1000_update_stats(struct e1000_adapter *adapter);
L
Linus Torvalds 已提交
110 111 112 113

static int e1000_init_module(void);
static void e1000_exit_module(void);
static int e1000_probe(struct pci_dev *pdev, const struct pci_device_id *ent);
114
static void e1000_remove(struct pci_dev *pdev);
115
static int e1000_alloc_queues(struct e1000_adapter *adapter);
L
Linus Torvalds 已提交
116 117 118 119 120 121
static int e1000_sw_init(struct e1000_adapter *adapter);
static int e1000_open(struct net_device *netdev);
static int e1000_close(struct net_device *netdev);
static void e1000_configure_tx(struct e1000_adapter *adapter);
static void e1000_configure_rx(struct e1000_adapter *adapter);
static void e1000_setup_rctl(struct e1000_adapter *adapter);
122 123 124 125 126 127
static void e1000_clean_all_tx_rings(struct e1000_adapter *adapter);
static void e1000_clean_all_rx_rings(struct e1000_adapter *adapter);
static void e1000_clean_tx_ring(struct e1000_adapter *adapter,
                                struct e1000_tx_ring *tx_ring);
static void e1000_clean_rx_ring(struct e1000_adapter *adapter,
                                struct e1000_rx_ring *rx_ring);
128
static void e1000_set_rx_mode(struct net_device *netdev);
J
Jesse Brandeburg 已提交
129
static void e1000_update_phy_info_task(struct work_struct *work);
130
static void e1000_watchdog(struct work_struct *work);
J
Jesse Brandeburg 已提交
131
static void e1000_82547_tx_fifo_stall_task(struct work_struct *work);
132 133
static netdev_tx_t e1000_xmit_frame(struct sk_buff *skb,
				    struct net_device *netdev);
L
Linus Torvalds 已提交
134 135 136
static struct net_device_stats * e1000_get_stats(struct net_device *netdev);
static int e1000_change_mtu(struct net_device *netdev, int new_mtu);
static int e1000_set_mac(struct net_device *netdev, void *p);
137
static irqreturn_t e1000_intr(int irq, void *data);
J
Joe Perches 已提交
138 139
static bool e1000_clean_tx_irq(struct e1000_adapter *adapter,
			       struct e1000_tx_ring *tx_ring);
140
static int e1000_clean(struct napi_struct *napi, int budget);
J
Joe Perches 已提交
141 142 143
static bool e1000_clean_rx_irq(struct e1000_adapter *adapter,
			       struct e1000_rx_ring *rx_ring,
			       int *work_done, int work_to_do);
144 145 146
static bool e1000_clean_jumbo_rx_irq(struct e1000_adapter *adapter,
				     struct e1000_rx_ring *rx_ring,
				     int *work_done, int work_to_do);
147
static void e1000_alloc_rx_buffers(struct e1000_adapter *adapter,
148
				   struct e1000_rx_ring *rx_ring,
149
				   int cleaned_count);
150 151 152
static void e1000_alloc_jumbo_rx_buffers(struct e1000_adapter *adapter,
					 struct e1000_rx_ring *rx_ring,
					 int cleaned_count);
L
Linus Torvalds 已提交
153 154 155 156 157 158
static int e1000_ioctl(struct net_device *netdev, struct ifreq *ifr, int cmd);
static int e1000_mii_ioctl(struct net_device *netdev, struct ifreq *ifr,
			   int cmd);
static void e1000_enter_82542_rst(struct e1000_adapter *adapter);
static void e1000_leave_82542_rst(struct e1000_adapter *adapter);
static void e1000_tx_timeout(struct net_device *dev);
159
static void e1000_reset_task(struct work_struct *work);
L
Linus Torvalds 已提交
160
static void e1000_smartspeed(struct e1000_adapter *adapter);
161 162
static int e1000_82547_fifo_workaround(struct e1000_adapter *adapter,
                                       struct sk_buff *skb);
L
Linus Torvalds 已提交
163

J
Jiri Pirko 已提交
164
static bool e1000_vlan_used(struct e1000_adapter *adapter);
165 166
static void e1000_vlan_mode(struct net_device *netdev,
			    netdev_features_t features);
167 168
static void e1000_vlan_filter_on_off(struct e1000_adapter *adapter,
				     bool filter_on);
169 170 171 172
static int e1000_vlan_rx_add_vid(struct net_device *netdev,
				 __be16 proto, u16 vid);
static int e1000_vlan_rx_kill_vid(struct net_device *netdev,
				  __be16 proto, u16 vid);
L
Linus Torvalds 已提交
173 174
static void e1000_restore_vlan(struct e1000_adapter *adapter);

A
Auke Kok 已提交
175
#ifdef CONFIG_PM
176
static int e1000_suspend(struct pci_dev *pdev, pm_message_t state);
L
Linus Torvalds 已提交
177 178
static int e1000_resume(struct pci_dev *pdev);
#endif
179
static void e1000_shutdown(struct pci_dev *pdev);
L
Linus Torvalds 已提交
180 181 182 183 184 185

#ifdef CONFIG_NET_POLL_CONTROLLER
/* for netdump / net console */
static void e1000_netpoll (struct net_device *netdev);
#endif

186 187 188 189 190 191
/* copybreak: module parameter (mode 0644) giving the maximum size of a
 * received packet that is copied into a new buffer.  e1000_init_module()
 * reports a value of 0 as "copybreak disabled".
 */
#define COPYBREAK_DEFAULT 256
static unsigned int copybreak __read_mostly = COPYBREAK_DEFAULT;
module_param(copybreak, uint, 0644);
MODULE_PARM_DESC(copybreak,
	"Maximum size of packet that is copied to a new buffer on receive");

A
Auke Kok 已提交
192 193 194 195 196
static pci_ers_result_t e1000_io_error_detected(struct pci_dev *pdev,
                     pci_channel_state_t state);
static pci_ers_result_t e1000_io_slot_reset(struct pci_dev *pdev);
static void e1000_io_resume(struct pci_dev *pdev);

197
static const struct pci_error_handlers e1000_err_handler = {
A
Auke Kok 已提交
198 199 200 201
	.error_detected = e1000_io_error_detected,
	.slot_reset = e1000_io_slot_reset,
	.resume = e1000_io_resume,
};
202

L
Linus Torvalds 已提交
203 204 205 206
static struct pci_driver e1000_driver = {
	.name     = e1000_driver_name,
	.id_table = e1000_pci_tbl,
	.probe    = e1000_probe,
207
	.remove   = e1000_remove,
208
#ifdef CONFIG_PM
L
Lucas De Marchi 已提交
209
	/* Power Management Hooks */
L
Linus Torvalds 已提交
210
	.suspend  = e1000_suspend,
211
	.resume   = e1000_resume,
L
Linus Torvalds 已提交
212
#endif
A
Auke Kok 已提交
213 214
	.shutdown = e1000_shutdown,
	.err_handler = &e1000_err_handler
L
Linus Torvalds 已提交
215 216 217 218 219 220 221
};

/* Module metadata; the version string is shared with e1000_driver_version */
MODULE_AUTHOR("Intel Corporation, <linux.nics@intel.com>");
MODULE_DESCRIPTION("Intel(R) PRO/1000 Network Driver");
MODULE_LICENSE("GPL");
MODULE_VERSION(DRV_VERSION);

222 223
#define DEFAULT_MSG_ENABLE (NETIF_MSG_DRV|NETIF_MSG_PROBE|NETIF_MSG_LINK)
static int debug = -1;
L
Linus Torvalds 已提交
224 225 226
module_param(debug, int, 0);
MODULE_PARM_DESC(debug, "Debug level (0=none,...,16=all)");

227 228 229 230 231 232 233 234 235 236 237
/**
 * e1000_get_hw_dev - look up the net_device that owns a hw struct
 * @hw: hardware structure whose ->back pointer refers to the adapter
 *
 * Used by the hardware layer to print debugging information.
 **/
struct net_device *e1000_get_hw_dev(struct e1000_hw *hw)
{
	struct e1000_adapter *owner = hw->back;

	return owner->netdev;
}

L
Linus Torvalds 已提交
238 239 240 241 242 243
/**
 * e1000_init_module - Driver Registration Routine
 *
 * e1000_init_module is the first routine called when the driver is
 * loaded. All it does is register with the PCI subsystem.
 **/
244
static int __init e1000_init_module(void)
L
Linus Torvalds 已提交
245 246
{
	int ret;
247
	pr_info("%s - version %s\n", e1000_driver_string, e1000_driver_version);
L
Linus Torvalds 已提交
248

249
	pr_info("%s\n", e1000_copyright);
L
Linus Torvalds 已提交
250

251
	ret = pci_register_driver(&e1000_driver);
252 253
	if (copybreak != COPYBREAK_DEFAULT) {
		if (copybreak == 0)
254
			pr_info("copybreak disabled\n");
255
		else
256 257
			pr_info("copybreak enabled for "
				   "packets <= %u bytes\n", copybreak);
258
	}
L
Linus Torvalds 已提交
259 260 261 262 263 264 265 266 267 268 269
	return ret;
}

module_init(e1000_init_module);

/**
 * e1000_exit_module - Driver Exit Cleanup Routine
 *
 * e1000_exit_module is called just before the driver is removed
 * from memory.
 **/
270
static void __exit e1000_exit_module(void)
L
Linus Torvalds 已提交
271 272 273 274 275 276
{
	pci_unregister_driver(&e1000_driver);
}

module_exit(e1000_exit_module);

277 278 279
static int e1000_request_irq(struct e1000_adapter *adapter)
{
	struct net_device *netdev = adapter->netdev;
A
Al Viro 已提交
280
	irq_handler_t handler = e1000_intr;
281 282
	int irq_flags = IRQF_SHARED;
	int err;
283

284 285 286
	err = request_irq(adapter->pdev->irq, handler, irq_flags, netdev->name,
	                  netdev);
	if (err) {
287
		e_err(probe, "Unable to allocate interrupt Error: %d\n", err);
288
	}
289 290 291 292 293 294 295 296 297 298 299

	return err;
}

/**
 * e1000_free_irq - release the adapter's interrupt line
 * @adapter: board private structure
 *
 * The net_device is passed as cookie, matching e1000_request_irq().
 **/
static void e1000_free_irq(struct e1000_adapter *adapter)
{
	free_irq(adapter->pdev->irq, adapter->netdev);
}

L
Linus Torvalds 已提交
300 301 302 303
/**
 * e1000_irq_disable - Mask off interrupt generation on the NIC
 * @adapter: board private structure
 **/
304
static void e1000_irq_disable(struct e1000_adapter *adapter)
L
Linus Torvalds 已提交
305
{
J
Joe Perches 已提交
306 307 308 309
	struct e1000_hw *hw = &adapter->hw;

	ew32(IMC, ~0);
	E1000_WRITE_FLUSH();
L
Linus Torvalds 已提交
310 311 312 313 314 315 316
	synchronize_irq(adapter->pdev->irq);
}

/**
 * e1000_irq_enable - Enable default interrupt generation settings
 * @adapter: board private structure
 **/
317
static void e1000_irq_enable(struct e1000_adapter *adapter)
L
Linus Torvalds 已提交
318
{
J
Joe Perches 已提交
319 320 321 322
	struct e1000_hw *hw = &adapter->hw;

	ew32(IMS, IMS_ENABLE_MASK);
	E1000_WRITE_FLUSH();
L
Linus Torvalds 已提交
323
}
324

325
static void e1000_update_mng_vlan(struct e1000_adapter *adapter)
326
{
J
Joe Perches 已提交
327
	struct e1000_hw *hw = &adapter->hw;
328
	struct net_device *netdev = adapter->netdev;
J
Joe Perches 已提交
329
	u16 vid = hw->mng_cookie.vlan_id;
330
	u16 old_vid = adapter->mng_vlan_id;
J
Jesse Brandeburg 已提交
331

J
Jiri Pirko 已提交
332 333 334 335 336 337
	if (!e1000_vlan_used(adapter))
		return;

	if (!test_bit(vid, adapter->active_vlans)) {
		if (hw->mng_cookie.status &
		    E1000_MNG_DHCP_COOKIE_STATUS_VLAN_SUPPORT) {
338
			e1000_vlan_rx_add_vid(netdev, htons(ETH_P_8021Q), vid);
339
			adapter->mng_vlan_id = vid;
J
Jiri Pirko 已提交
340 341 342 343 344 345
		} else {
			adapter->mng_vlan_id = E1000_MNG_VLAN_NONE;
		}
		if ((old_vid != (u16)E1000_MNG_VLAN_NONE) &&
		    (vid != old_vid) &&
		    !test_bit(old_vid, adapter->active_vlans))
346 347
			e1000_vlan_rx_kill_vid(netdev, htons(ETH_P_8021Q),
					       old_vid);
J
Jiri Pirko 已提交
348 349
	} else {
		adapter->mng_vlan_id = vid;
350 351
	}
}
352

353
static void e1000_init_manageability(struct e1000_adapter *adapter)
354
{
J
Joe Perches 已提交
355 356
	struct e1000_hw *hw = &adapter->hw;

357
	if (adapter->en_mng_pt) {
J
Joe Perches 已提交
358
		u32 manc = er32(MANC);
359 360 361 362

		/* disable hardware interception of ARP */
		manc &= ~(E1000_MANC_ARP_EN);

J
Joe Perches 已提交
363
		ew32(MANC, manc);
364 365 366
	}
}

367
static void e1000_release_manageability(struct e1000_adapter *adapter)
368
{
J
Joe Perches 已提交
369 370
	struct e1000_hw *hw = &adapter->hw;

371
	if (adapter->en_mng_pt) {
J
Joe Perches 已提交
372
		u32 manc = er32(MANC);
373 374 375 376

		/* re-enable hardware interception of ARP */
		manc |= E1000_MANC_ARP_EN;

J
Joe Perches 已提交
377
		ew32(MANC, manc);
378 379 380
	}
}

381 382 383 384 385
/**
 * e1000_configure - configure the hardware for RX and TX
 * @adapter = private board structure
 **/
static void e1000_configure(struct e1000_adapter *adapter)
L
Linus Torvalds 已提交
386 387
{
	struct net_device *netdev = adapter->netdev;
388
	int i;
L
Linus Torvalds 已提交
389

390
	e1000_set_rx_mode(netdev);
L
Linus Torvalds 已提交
391 392

	e1000_restore_vlan(adapter);
393
	e1000_init_manageability(adapter);
L
Linus Torvalds 已提交
394 395 396 397

	e1000_configure_tx(adapter);
	e1000_setup_rctl(adapter);
	e1000_configure_rx(adapter);
398 399
	/* call E1000_DESC_UNUSED which always leaves
	 * at least 1 descriptor unused to make sure
400 401
	 * next_to_use != next_to_clean
	 */
402
	for (i = 0; i < adapter->num_rx_queues; i++) {
403
		struct e1000_rx_ring *ring = &adapter->rx_ring[i];
404
		adapter->alloc_rx_buf(adapter, ring,
405
				      E1000_DESC_UNUSED(ring));
406
	}
407 408 409 410
}

int e1000_up(struct e1000_adapter *adapter)
{
J
Joe Perches 已提交
411 412
	struct e1000_hw *hw = &adapter->hw;

413 414 415 416
	/* hardware has been reset, we need to reload some things */
	e1000_configure(adapter);

	clear_bit(__E1000_DOWN, &adapter->flags);
417

418
	napi_enable(&adapter->napi);
419

420 421
	e1000_irq_enable(adapter);

422 423
	netif_wake_queue(adapter->netdev);

424
	/* fire a link change interrupt to start the watchdog */
J
Joe Perches 已提交
425
	ew32(ICS, E1000_ICS_LSC);
L
Linus Torvalds 已提交
426 427 428
	return 0;
}

429 430 431 432 433 434 435 436
/**
 * e1000_power_up_phy - restore link in case the phy was powered down
 * @adapter: address of board private structure
 *
 * The phy may be powered down to save power and turn off link when the
 * driver is unloaded and wake on lan is not enabled (among others)
 * *** this routine MUST be followed by a call to e1000_reset ***
 **/
437
void e1000_power_up_phy(struct e1000_adapter *adapter)
438
{
J
Joe Perches 已提交
439
	struct e1000_hw *hw = &adapter->hw;
440
	u16 mii_reg = 0;
441 442

	/* Just clear the power down bit to wake the phy back up */
J
Joe Perches 已提交
443
	if (hw->media_type == e1000_media_type_copper) {
444
		/* according to the manual, the phy will retain its
445 446
		 * settings across a power-down/up cycle
		 */
J
Joe Perches 已提交
447
		e1000_read_phy_reg(hw, PHY_CTRL, &mii_reg);
448
		mii_reg &= ~MII_CR_POWER_DOWN;
J
Joe Perches 已提交
449
		e1000_write_phy_reg(hw, PHY_CTRL, mii_reg);
450 451 452 453 454
	}
}

static void e1000_power_down_phy(struct e1000_adapter *adapter)
{
J
Joe Perches 已提交
455 456
	struct e1000_hw *hw = &adapter->hw;

457
	/* Power down the PHY so no link is implied when interface is down *
J
Joe Perches 已提交
458
	 * The PHY cannot be powered down if any of the following is true *
459 460
	 * (a) WoL is enabled
	 * (b) AMT is active
461 462
	 * (c) SoL/IDER session is active
	 */
J
Joe Perches 已提交
463 464
	if (!adapter->wol && hw->mac_type >= e1000_82540 &&
	   hw->media_type == e1000_media_type_copper) {
465
		u16 mii_reg = 0;
466

J
Joe Perches 已提交
467
		switch (hw->mac_type) {
468 469 470 471
		case e1000_82540:
		case e1000_82545:
		case e1000_82545_rev_3:
		case e1000_82546:
472
		case e1000_ce4100:
473 474 475 476 477
		case e1000_82546_rev_3:
		case e1000_82541:
		case e1000_82541_rev_2:
		case e1000_82547:
		case e1000_82547_rev_2:
J
Joe Perches 已提交
478
			if (er32(MANC) & E1000_MANC_SMBUS_EN)
479 480 481 482 483
				goto out;
			break;
		default:
			goto out;
		}
J
Joe Perches 已提交
484
		e1000_read_phy_reg(hw, PHY_CTRL, &mii_reg);
485
		mii_reg |= MII_CR_POWER_DOWN;
J
Joe Perches 已提交
486
		e1000_write_phy_reg(hw, PHY_CTRL, mii_reg);
J
Jesse Brandeburg 已提交
487
		msleep(1);
488
	}
489 490
out:
	return;
491 492
}

493 494 495
static void e1000_down_and_stop(struct e1000_adapter *adapter)
{
	set_bit(__E1000_DOWN, &adapter->flags);
496

497
	cancel_delayed_work_sync(&adapter->watchdog_task);
498 499 500 501 502 503 504

	/*
	 * Since the watchdog task can reschedule other tasks, we should cancel
	 * it first, otherwise we can run into the situation when a work is
	 * still running after the adapter has been turned down.
	 */

505 506
	cancel_delayed_work_sync(&adapter->phy_info_task);
	cancel_delayed_work_sync(&adapter->fifo_stall_task);
507 508 509 510

	/* Only kill reset task if adapter is not resetting */
	if (!test_bit(__E1000_RESETTING, &adapter->flags))
		cancel_work_sync(&adapter->reset_task);
511 512
}

513
void e1000_down(struct e1000_adapter *adapter)
L
Linus Torvalds 已提交
514
{
515
	struct e1000_hw *hw = &adapter->hw;
L
Linus Torvalds 已提交
516
	struct net_device *netdev = adapter->netdev;
517
	u32 rctl, tctl;
L
Linus Torvalds 已提交
518

A
Auke Kok 已提交
519

520 521 522 523 524
	/* disable receives in the hardware */
	rctl = er32(RCTL);
	ew32(RCTL, rctl & ~E1000_RCTL_EN);
	/* flush and sleep below */

J
Jesse Brandeburg 已提交
525
	netif_tx_disable(netdev);
526 527 528 529 530 531 532 533 534

	/* disable transmits in the hardware */
	tctl = er32(TCTL);
	tctl &= ~E1000_TCTL_EN;
	ew32(TCTL, tctl);
	/* flush both disables and wait for them to finish */
	E1000_WRITE_FLUSH();
	msleep(10);

535
	napi_disable(&adapter->napi);
536

L
Linus Torvalds 已提交
537
	e1000_irq_disable(adapter);
538

539
	/* Setting DOWN must be after irq_disable to prevent
A
Anupam Chanda 已提交
540
	 * a screaming interrupt.  Setting DOWN also prevents
541
	 * tasks from rescheduling.
A
Anupam Chanda 已提交
542
	 */
543
	e1000_down_and_stop(adapter);
L
Linus Torvalds 已提交
544 545 546 547 548 549

	adapter->link_speed = 0;
	adapter->link_duplex = 0;
	netif_carrier_off(netdev);

	e1000_reset(adapter);
550 551
	e1000_clean_all_tx_rings(adapter);
	e1000_clean_all_rx_rings(adapter);
L
Linus Torvalds 已提交
552 553
}

554
void e1000_reinit_locked(struct e1000_adapter *adapter)
555 556 557 558 559 560 561
{
	WARN_ON(in_interrupt());
	while (test_and_set_bit(__E1000_RESETTING, &adapter->flags))
		msleep(1);
	e1000_down(adapter);
	e1000_up(adapter);
	clear_bit(__E1000_RESETTING, &adapter->flags);
L
Linus Torvalds 已提交
562 563
}

564
void e1000_reset(struct e1000_adapter *adapter)
L
Linus Torvalds 已提交
565
{
J
Joe Perches 已提交
566
	struct e1000_hw *hw = &adapter->hw;
567
	u32 pba = 0, tx_space, min_tx_space, min_rx_space;
J
Joe Perches 已提交
568
	bool legacy_pba_adjust = false;
569
	u16 hwm;
L
Linus Torvalds 已提交
570 571 572 573 574

	/* Repartition Pba for greater than 9k mtu
	 * To take effect CTRL.RST is required.
	 */

J
Joe Perches 已提交
575
	switch (hw->mac_type) {
576 577 578 579 580 581 582
	case e1000_82542_rev2_0:
	case e1000_82542_rev2_1:
	case e1000_82543:
	case e1000_82544:
	case e1000_82540:
	case e1000_82541:
	case e1000_82541_rev_2:
J
Joe Perches 已提交
583
		legacy_pba_adjust = true;
584 585 586 587 588
		pba = E1000_PBA_48K;
		break;
	case e1000_82545:
	case e1000_82545_rev_3:
	case e1000_82546:
589
	case e1000_ce4100:
590 591 592
	case e1000_82546_rev_3:
		pba = E1000_PBA_48K;
		break;
593
	case e1000_82547:
594
	case e1000_82547_rev_2:
J
Joe Perches 已提交
595
		legacy_pba_adjust = true;
596 597
		pba = E1000_PBA_30K;
		break;
598 599
	case e1000_undefined:
	case e1000_num_macs:
600 601 602
		break;
	}

J
Joe Perches 已提交
603
	if (legacy_pba_adjust) {
604
		if (hw->max_frame_size > E1000_RXBUFFER_8192)
605
			pba -= 8; /* allocate more FIFO for Tx */
606

J
Joe Perches 已提交
607
		if (hw->mac_type == e1000_82547) {
608 609 610 611 612 613
			adapter->tx_fifo_head = 0;
			adapter->tx_head_addr = pba << E1000_TX_HEAD_ADDR_SHIFT;
			adapter->tx_fifo_size =
				(E1000_PBA_40K - pba) << E1000_PBA_BYTES_SHIFT;
			atomic_set(&adapter->tx_fifo_stall, 0);
		}
614
	} else if (hw->max_frame_size >  ETH_FRAME_LEN + ETH_FCS_LEN) {
615
		/* adjust PBA for jumbo frames */
J
Joe Perches 已提交
616
		ew32(PBA, pba);
617 618

		/* To maintain wire speed transmits, the Tx FIFO should be
619
		 * large enough to accommodate two full transmit packets,
620
		 * rounded up to the next 1KB and expressed in KB.  Likewise,
621
		 * the Rx FIFO should be large enough to accommodate at least
622
		 * one full receive packet and is similarly rounded up and
623 624
		 * expressed in KB.
		 */
J
Joe Perches 已提交
625
		pba = er32(PBA);
626 627 628 629
		/* upper 16 bits has Tx packet buffer allocation size in KB */
		tx_space = pba >> 16;
		/* lower 16 bits has Rx packet buffer allocation size in KB */
		pba &= 0xffff;
630
		/* the Tx fifo also stores 16 bytes of information about the Tx
631 632 633 634 635
		 * but don't include ethernet FCS because hardware appends it
		 */
		min_tx_space = (hw->max_frame_size +
		                sizeof(struct e1000_tx_desc) -
		                ETH_FCS_LEN) * 2;
636
		min_tx_space = ALIGN(min_tx_space, 1024);
637
		min_tx_space >>= 10;
638 639
		/* software strips receive CRC, so leave room for it */
		min_rx_space = hw->max_frame_size;
640
		min_rx_space = ALIGN(min_rx_space, 1024);
641 642 643 644
		min_rx_space >>= 10;

		/* If current Tx allocation is less than the min Tx FIFO size,
		 * and the min Tx FIFO size is less than the current Rx FIFO
645 646
		 * allocation, take space away from current Rx allocation
		 */
647 648 649 650 651
		if (tx_space < min_tx_space &&
		    ((min_tx_space - tx_space) < pba)) {
			pba = pba - (min_tx_space - tx_space);

			/* PCI/PCIx hardware has PBA alignment constraints */
J
Joe Perches 已提交
652
			switch (hw->mac_type) {
653 654 655 656 657 658 659
			case e1000_82545 ... e1000_82546_rev_3:
				pba &= ~(E1000_PBA_8K - 1);
				break;
			default:
				break;
			}

660 661 662
			/* if short on Rx space, Rx wins and must trump Tx
			 * adjustment or use Early Receive if available
			 */
663 664
			if (pba < min_rx_space)
				pba = min_rx_space;
665
		}
L
Linus Torvalds 已提交
666
	}
667

J
Joe Perches 已提交
668
	ew32(PBA, pba);
L
Linus Torvalds 已提交
669

670
	/* flow control settings:
671 672 673 674 675 676 677 678 679 680 681 682 683
	 * The high water mark must be low enough to fit one full frame
	 * (or the size used for early receive) above it in the Rx FIFO.
	 * Set it to the lower of:
	 * - 90% of the Rx FIFO size, and
	 * - the full Rx FIFO size minus the early receive size (for parts
	 *   with ERT support assuming ERT set to E1000_ERT_2048), or
	 * - the full Rx FIFO size minus one full frame
	 */
	hwm = min(((pba << 10) * 9 / 10),
		  ((pba << 10) - hw->max_frame_size));

	hw->fc_high_water = hwm & 0xFFF8;	/* 8-byte granularity */
	hw->fc_low_water = hw->fc_high_water - 8;
684
	hw->fc_pause_time = E1000_FC_PAUSE_TIME;
J
Joe Perches 已提交
685 686
	hw->fc_send_xon = 1;
	hw->fc = hw->original_fc;
L
Linus Torvalds 已提交
687

688
	/* Allow time for pending master requests to run */
J
Joe Perches 已提交
689 690 691
	e1000_reset_hw(hw);
	if (hw->mac_type >= e1000_82544)
		ew32(WUC, 0);
692

J
Joe Perches 已提交
693
	if (e1000_init_hw(hw))
694
		e_dev_err("Hardware Error\n");
695
	e1000_update_mng_vlan(adapter);
696 697

	/* if (adapter->hwflags & HWFLAGS_PHY_PWR_BIT) { */
J
Joe Perches 已提交
698 699 700 701
	if (hw->mac_type >= e1000_82544 &&
	    hw->autoneg == 1 &&
	    hw->autoneg_advertised == ADVERTISE_1000_FULL) {
		u32 ctrl = er32(CTRL);
702 703
		/* clear phy power management bit if we are in gig only mode,
		 * which if enabled will attempt negotiation to 100Mb, which
704 705
		 * can cause a loss of link at power off or driver unload
		 */
706
		ctrl &= ~E1000_CTRL_SWDPIN3;
J
Joe Perches 已提交
707
		ew32(CTRL, ctrl);
708 709
	}

L
Linus Torvalds 已提交
710
	/* Enable h/w to recognize an 802.1Q VLAN Ethernet packet */
J
Joe Perches 已提交
711
	ew32(VET, ETHERNET_IEEE_VLAN_TYPE);
L
Linus Torvalds 已提交
712

J
Joe Perches 已提交
713 714
	e1000_reset_adaptive(hw);
	e1000_phy_get_info(hw, &adapter->phy_info);
A
Auke Kok 已提交
715

716
	e1000_release_manageability(adapter);
L
Linus Torvalds 已提交
717 718
}

719
/* Dump the eeprom for users having checksum issues */
720
static void e1000_dump_eeprom(struct e1000_adapter *adapter)
721 722 723 724 725 726 727 728 729 730 731 732
{
	struct net_device *netdev = adapter->netdev;
	struct ethtool_eeprom eeprom;
	const struct ethtool_ops *ops = netdev->ethtool_ops;
	u8 *data;
	int i;
	u16 csum_old, csum_new = 0;

	eeprom.len = ops->get_eeprom_len(netdev);
	eeprom.offset = 0;

	data = kmalloc(eeprom.len, GFP_KERNEL);
733
	if (!data)
734 735 736 737 738 739 740 741 742 743
		return;

	ops->get_eeprom(netdev, &eeprom, data);

	csum_old = (data[EEPROM_CHECKSUM_REG * 2]) +
		   (data[EEPROM_CHECKSUM_REG * 2 + 1] << 8);
	for (i = 0; i < EEPROM_CHECKSUM_REG * 2; i += 2)
		csum_new += data[i] + (data[i + 1] << 8);
	csum_new = EEPROM_SUM - csum_new;

744 745 746
	pr_err("/*********************/\n");
	pr_err("Current EEPROM Checksum : 0x%04x\n", csum_old);
	pr_err("Calculated              : 0x%04x\n", csum_new);
747

748 749
	pr_err("Offset    Values\n");
	pr_err("========  ======\n");
750 751
	print_hex_dump(KERN_ERR, "", DUMP_PREFIX_OFFSET, 16, 1, data, 128, 0);

752 753 754 755 756 757 758 759 760 761 762
	pr_err("Include this output when contacting your support provider.\n");
	pr_err("This is not a software error! Something bad happened to\n");
	pr_err("your hardware or EEPROM image. Ignoring this problem could\n");
	pr_err("result in further problems, possibly loss of data,\n");
	pr_err("corruption or system hangs!\n");
	pr_err("The MAC Address will be reset to 00:00:00:00:00:00,\n");
	pr_err("which is invalid and requires you to set the proper MAC\n");
	pr_err("address manually before continuing to enable this network\n");
	pr_err("device. Please inspect the EEPROM dump and report the\n");
	pr_err("issue to your hardware vendor or Intel Customer Support.\n");
	pr_err("/*********************/\n");
763 764 765 766

	kfree(data);
}

T
Taku Izumi 已提交
767 768 769 770 771 772 773 774 775 776 777 778 779 780 781 782 783 784 785 786 787 788 789 790 791 792 793 794 795 796 797 798 799 800 801 802
/**
 * e1000_is_need_ioport - determine if an adapter needs ioport resources or not
 * @pdev: PCI device information struct
 *
 * Decided purely from the PCI device ID.
 *
 * Return true if an adapter needs ioport resources
 **/
static int e1000_is_need_ioport(struct pci_dev *pdev)
{
	int needs_io = false;

	switch (pdev->device) {
	case E1000_DEV_ID_82540EM:
	case E1000_DEV_ID_82540EM_LOM:
	case E1000_DEV_ID_82540EP:
	case E1000_DEV_ID_82540EP_LOM:
	case E1000_DEV_ID_82540EP_LP:
	case E1000_DEV_ID_82541EI:
	case E1000_DEV_ID_82541EI_MOBILE:
	case E1000_DEV_ID_82541ER:
	case E1000_DEV_ID_82541ER_LOM:
	case E1000_DEV_ID_82541GI:
	case E1000_DEV_ID_82541GI_LF:
	case E1000_DEV_ID_82541GI_MOBILE:
	case E1000_DEV_ID_82544EI_COPPER:
	case E1000_DEV_ID_82544EI_FIBER:
	case E1000_DEV_ID_82544GC_COPPER:
	case E1000_DEV_ID_82544GC_LOM:
	case E1000_DEV_ID_82545EM_COPPER:
	case E1000_DEV_ID_82545EM_FIBER:
	case E1000_DEV_ID_82546EB_COPPER:
	case E1000_DEV_ID_82546EB_FIBER:
	case E1000_DEV_ID_82546EB_QUAD_COPPER:
		needs_io = true;
		break;
	default:
		break;
	}

	return needs_io;
}

803 804
/**
 * e1000_fix_features - keep the Tx VLAN accel flag in step with Rx
 * @netdev: network interface device structure
 * @features: requested feature set
 *
 * Since there is no support for separate Rx/Tx vlan accel
 * enable/disable make sure Tx flag is always in same state as Rx.
 *
 * Returns the adjusted feature set.
 **/
static netdev_features_t e1000_fix_features(struct net_device *netdev,
	netdev_features_t features)
{
	if (!(features & NETIF_F_HW_VLAN_CTAG_RX))
		return features & ~NETIF_F_HW_VLAN_CTAG_TX;

	return features | NETIF_F_HW_VLAN_CTAG_TX;
}

817 818
/**
 * e1000_set_features - apply a changed feature set
 * @netdev: network interface device structure
 * @features: new feature set
 *
 * Updates the VLAN mode when the Rx VLAN accel flag changed.  When
 * RXCSUM or RXALL changed, stores the new features and Rx checksum
 * setting and re-initializes a running interface, or resets the
 * hardware when the interface is down.
 *
 * Always returns 0.
 **/
static int e1000_set_features(struct net_device *netdev,
	netdev_features_t features)
{
	struct e1000_adapter *adapter = netdev_priv(netdev);
	const netdev_features_t delta = netdev->features ^ features;

	if (delta & NETIF_F_HW_VLAN_CTAG_RX)
		e1000_vlan_mode(netdev, features);

	if (delta & (NETIF_F_RXCSUM | NETIF_F_RXALL)) {
		netdev->features = features;
		adapter->rx_csum = !!(features & NETIF_F_RXCSUM);

		if (netif_running(netdev))
			e1000_reinit_locked(adapter);
		else
			e1000_reset(adapter);
	}

	return 0;
}

840 841 842
static const struct net_device_ops e1000_netdev_ops = {
	.ndo_open		= e1000_open,
	.ndo_stop		= e1000_close,
843
	.ndo_start_xmit		= e1000_xmit_frame,
844 845 846
	.ndo_get_stats		= e1000_get_stats,
	.ndo_set_rx_mode	= e1000_set_rx_mode,
	.ndo_set_mac_address	= e1000_set_mac,
J
Jiri Pirko 已提交
847
	.ndo_tx_timeout		= e1000_tx_timeout,
848 849 850 851 852 853 854 855
	.ndo_change_mtu		= e1000_change_mtu,
	.ndo_do_ioctl		= e1000_ioctl,
	.ndo_validate_addr	= eth_validate_addr,
	.ndo_vlan_rx_add_vid	= e1000_vlan_rx_add_vid,
	.ndo_vlan_rx_kill_vid	= e1000_vlan_rx_kill_vid,
#ifdef CONFIG_NET_POLL_CONTROLLER
	.ndo_poll_controller	= e1000_netpoll,
#endif
J
Jiri Pirko 已提交
856 857
	.ndo_fix_features	= e1000_fix_features,
	.ndo_set_features	= e1000_set_features,
858 859
};

860 861 862 863 864 865 866 867 868 869 870 871 872 873 874 875 876 877 878 879 880 881 882 883 884 885 886 887 888 889 890 891 892 893 894 895 896 897 898 899 900 901 902 903 904 905 906 907 908 909 910 911 912 913 914 915 916 917 918 919 920 921 922 923
/**
 * e1000_init_hw_struct - initialize members of hw struct
 * @adapter: board private struct
 * @hw: structure used by e1000_hw.c
 *
 * Fills in the e1000_hw struct from PCI device information and the
 * current netdev MTU so that it can be used very early at init (just
 * after struct allocation).  Identifies the MAC, the media type and the
 * bus, then applies the default link options.
 *
 * Returns 0 on success, -EIO if the MAC type cannot be determined.
 */
static int e1000_init_hw_struct(struct e1000_adapter *adapter,
				struct e1000_hw *hw)
{
	struct pci_dev *pdev = adapter->pdev;

	/* PCI config space info */
	hw->vendor_id = pdev->vendor;
	hw->device_id = pdev->device;
	hw->subsystem_vendor_id = pdev->subsystem_vendor;
	hw->subsystem_id = pdev->subsystem_device;
	hw->revision_id = pdev->revision;

	pci_read_config_word(pdev, PCI_COMMAND, &hw->pci_cmd_word);

	/* frame size limits derived from the current MTU */
	hw->max_frame_size = adapter->netdev->mtu +
			     ENET_HEADER_SIZE + ETHERNET_FCS_SIZE;
	hw->min_frame_size = MINIMUM_ETHERNET_FRAME_SIZE;

	/* identify the MAC */
	if (e1000_set_mac_type(hw)) {
		e_err(probe, "Unknown MAC Type\n");
		return -EIO;
	}

	/* only the 82541/82547 family gets the PHY init script flag */
	switch (hw->mac_type) {
	case e1000_82541:
	case e1000_82547:
	case e1000_82541_rev_2:
	case e1000_82547_rev_2:
		hw->phy_init_script = 1;
		break;
	default:
		break;
	}

	e1000_set_media_type(hw);
	e1000_get_bus_info(hw);

	hw->wait_autoneg_complete = false;
	hw->tbi_compatibility_en = true;
	hw->adaptive_ifs = true;

	/* the remaining options only apply to copper media */
	if (hw->media_type != e1000_media_type_copper)
		return 0;

	hw->mdix = AUTO_ALL_MODES;
	hw->disable_polarity_correction = false;
	hw->master_slave = E1000_MASTER_SLAVE;

	return 0;
}

L
Linus Torvalds 已提交
924 925 926 927 928 929 930 931 932 933 934
/**
 * e1000_probe - Device Initialization Routine
 * @pdev: PCI device information struct
 * @ent: entry in e1000_pci_tbl
 *
 * Returns 0 on success, negative on failure
 *
 * e1000_probe initializes an adapter identified by a pci_dev structure.
 * The OS initialization, configuring of the adapter private structure,
 * and a hardware reset occur.
 **/
935
static int e1000_probe(struct pci_dev *pdev, const struct pci_device_id *ent)
L
Linus Torvalds 已提交
936 937 938
{
	struct net_device *netdev;
	struct e1000_adapter *adapter;
J
Joe Perches 已提交
939
	struct e1000_hw *hw;
940

L
Linus Torvalds 已提交
941
	static int cards_found = 0;
942
	static int global_quad_port_a = 0; /* global ksp3 port a indication */
943
	int i, err, pci_using_dac;
944
	u16 eeprom_data = 0;
945
	u16 tmp = 0;
946
	u16 eeprom_apme_mask = E1000_EEPROM_APME;
T
Taku Izumi 已提交
947
	int bars, need_ioport;
948

T
Taku Izumi 已提交
949 950 951 952 953 954 955
	/* do not allocate ioport bars when not needed */
	need_ioport = e1000_is_need_ioport(pdev);
	if (need_ioport) {
		bars = pci_select_bars(pdev, IORESOURCE_MEM | IORESOURCE_IO);
		err = pci_enable_device(pdev);
	} else {
		bars = pci_select_bars(pdev, IORESOURCE_MEM);
956
		err = pci_enable_device_mem(pdev);
T
Taku Izumi 已提交
957
	}
958
	if (err)
L
Linus Torvalds 已提交
959 960
		return err;

T
Taku Izumi 已提交
961
	err = pci_request_selected_regions(pdev, bars, e1000_driver_name);
962
	if (err)
963
		goto err_pci_reg;
L
Linus Torvalds 已提交
964 965

	pci_set_master(pdev);
966 967 968
	err = pci_save_state(pdev);
	if (err)
		goto err_alloc_etherdev;
L
Linus Torvalds 已提交
969

970
	err = -ENOMEM;
L
Linus Torvalds 已提交
971
	netdev = alloc_etherdev(sizeof(struct e1000_adapter));
972
	if (!netdev)
L
Linus Torvalds 已提交
973 974 975 976 977
		goto err_alloc_etherdev;

	SET_NETDEV_DEV(netdev, &pdev->dev);

	pci_set_drvdata(pdev, netdev);
978
	adapter = netdev_priv(netdev);
L
Linus Torvalds 已提交
979 980
	adapter->netdev = netdev;
	adapter->pdev = pdev;
981
	adapter->msg_enable = netif_msg_init(debug, DEFAULT_MSG_ENABLE);
T
Taku Izumi 已提交
982 983
	adapter->bars = bars;
	adapter->need_ioport = need_ioport;
L
Linus Torvalds 已提交
984

J
Joe Perches 已提交
985 986 987
	hw = &adapter->hw;
	hw->back = adapter;

988
	err = -EIO;
989
	hw->hw_addr = pci_ioremap_bar(pdev, BAR_0);
J
Joe Perches 已提交
990
	if (!hw->hw_addr)
L
Linus Torvalds 已提交
991 992
		goto err_ioremap;

T
Taku Izumi 已提交
993 994 995 996 997 998 999 1000
	if (adapter->need_ioport) {
		for (i = BAR_1; i <= BAR_5; i++) {
			if (pci_resource_len(pdev, i) == 0)
				continue;
			if (pci_resource_flags(pdev, i) & IORESOURCE_IO) {
				hw->io_base = pci_resource_start(pdev, i);
				break;
			}
L
Linus Torvalds 已提交
1001 1002 1003
		}
	}

1004 1005 1006 1007 1008
	/* make ready for any if (hw->...) below */
	err = e1000_init_hw_struct(adapter, hw);
	if (err)
		goto err_sw_init;

1009
	/* there is a workaround being applied below that limits
1010 1011 1012 1013 1014
	 * 64-bit DMA addresses to 64-bit hardware.  There are some
	 * 32-bit adapters that Tx hang when given 64-bit DMA addresses
	 */
	pci_using_dac = 0;
	if ((hw->bus_type == e1000_bus_type_pcix) &&
1015
	    !dma_set_mask_and_coherent(&pdev->dev, DMA_BIT_MASK(64))) {
1016 1017
		pci_using_dac = 1;
	} else {
1018
		err = dma_set_mask_and_coherent(&pdev->dev, DMA_BIT_MASK(32));
1019 1020 1021 1022
		if (err) {
			pr_err("No usable DMA config, aborting\n");
			goto err_dma;
		}
1023 1024
	}

1025
	netdev->netdev_ops = &e1000_netdev_ops;
L
Linus Torvalds 已提交
1026 1027
	e1000_set_ethtool_ops(netdev);
	netdev->watchdog_timeo = 5 * HZ;
1028
	netif_napi_add(netdev, &adapter->napi, e1000_clean, 64);
1029

1030
	strncpy(netdev->name, pci_name(pdev), sizeof(netdev->name) - 1);
L
Linus Torvalds 已提交
1031 1032 1033 1034 1035

	adapter->bd_number = cards_found;

	/* setup the private structure */

1036 1037
	err = e1000_sw_init(adapter);
	if (err)
L
Linus Torvalds 已提交
1038 1039
		goto err_sw_init;

1040
	err = -EIO;
1041
	if (hw->mac_type == e1000_ce4100) {
1042 1043
		hw->ce4100_gbe_mdio_base_virt =
					ioremap(pci_resource_start(pdev, BAR_1),
1044 1045
		                                pci_resource_len(pdev, BAR_1));

1046
		if (!hw->ce4100_gbe_mdio_base_virt)
1047 1048
			goto err_mdio_ioremap;
	}
1049

J
Joe Perches 已提交
1050
	if (hw->mac_type >= e1000_82543) {
1051
		netdev->hw_features = NETIF_F_SG |
J
Jiri Pirko 已提交
1052
				   NETIF_F_HW_CSUM |
1053 1054 1055
				   NETIF_F_HW_VLAN_CTAG_RX;
		netdev->features = NETIF_F_HW_VLAN_CTAG_TX |
				   NETIF_F_HW_VLAN_CTAG_FILTER;
L
Linus Torvalds 已提交
1056 1057
	}

J
Joe Perches 已提交
1058 1059
	if ((hw->mac_type >= e1000_82544) &&
	   (hw->mac_type != e1000_82547))
1060 1061
		netdev->hw_features |= NETIF_F_TSO;

1062 1063
	netdev->priv_flags |= IFF_SUPP_NOFCS;

1064
	netdev->features |= netdev->hw_features;
1065 1066 1067
	netdev->hw_features |= (NETIF_F_RXCSUM |
				NETIF_F_RXALL |
				NETIF_F_RXFCS);
1068

1069
	if (pci_using_dac) {
L
Linus Torvalds 已提交
1070
		netdev->features |= NETIF_F_HIGHDMA;
1071 1072
		netdev->vlan_features |= NETIF_F_HIGHDMA;
	}
L
Linus Torvalds 已提交
1073

1074 1075 1076
	netdev->vlan_features |= (NETIF_F_TSO |
				  NETIF_F_HW_CSUM |
				  NETIF_F_SG);
1077

1078 1079 1080 1081
	/* Do not set IFF_UNICAST_FLT for VMWare's 82545EM */
	if (hw->device_id != E1000_DEV_ID_82545EM_COPPER ||
	    hw->subsystem_vendor_id != PCI_VENDOR_ID_VMWARE)
		netdev->priv_flags |= IFF_UNICAST_FLT;
1082

J
Joe Perches 已提交
1083
	adapter->en_mng_pt = e1000_enable_mng_pass_thru(hw);
1084

1085
	/* initialize eeprom parameters */
J
Joe Perches 已提交
1086
	if (e1000_init_eeprom_params(hw)) {
1087
		e_err(probe, "EEPROM initialization failed\n");
1088
		goto err_eeprom;
1089 1090
	}

J
Jesse Brandeburg 已提交
1091
	/* before reading the EEPROM, reset the controller to
1092 1093
	 * put the device in a known good starting state
	 */
J
Jesse Brandeburg 已提交
1094

J
Joe Perches 已提交
1095
	e1000_reset_hw(hw);
L
Linus Torvalds 已提交
1096 1097

	/* make sure the EEPROM is good */
J
Joe Perches 已提交
1098
	if (e1000_validate_eeprom_checksum(hw) < 0) {
1099
		e_err(probe, "The EEPROM Checksum Is Not Valid\n");
1100
		e1000_dump_eeprom(adapter);
1101
		/* set MAC address to all zeroes to invalidate and temporary
1102 1103 1104 1105 1106 1107
		 * disable this device for the user. This blocks regular
		 * traffic while still permitting ethtool ioctls from reaching
		 * the hardware as well as allowing the user to run the
		 * interface after manually setting a hw addr using
		 * `ip set address`
		 */
J
Joe Perches 已提交
1108
		memset(hw->mac_addr, 0, netdev->addr_len);
1109 1110
	} else {
		/* copy the MAC address out of the EEPROM */
J
Joe Perches 已提交
1111
		if (e1000_read_mac_addr(hw))
1112
			e_err(probe, "EEPROM Read Error\n");
L
Linus Torvalds 已提交
1113
	}
1114
	/* don't block initalization here due to bad MAC address */
J
Joe Perches 已提交
1115
	memcpy(netdev->dev_addr, hw->mac_addr, netdev->addr_len);
L
Linus Torvalds 已提交
1116

1117
	if (!is_valid_ether_addr(netdev->dev_addr))
1118
		e_err(probe, "Invalid MAC Address\n");
L
Linus Torvalds 已提交
1119 1120


1121 1122 1123 1124
	INIT_DELAYED_WORK(&adapter->watchdog_task, e1000_watchdog);
	INIT_DELAYED_WORK(&adapter->fifo_stall_task,
			  e1000_82547_tx_fifo_stall_task);
	INIT_DELAYED_WORK(&adapter->phy_info_task, e1000_update_phy_info_task);
1125
	INIT_WORK(&adapter->reset_task, e1000_reset_task);
L
Linus Torvalds 已提交
1126 1127 1128 1129 1130 1131 1132 1133

	e1000_check_options(adapter);

	/* Initial Wake on LAN setting
	 * If APM wake is enabled in the EEPROM,
	 * enable the ACPI Magic Packet filter
	 */

J
Joe Perches 已提交
1134
	switch (hw->mac_type) {
L
Linus Torvalds 已提交
1135 1136 1137 1138 1139
	case e1000_82542_rev2_0:
	case e1000_82542_rev2_1:
	case e1000_82543:
		break;
	case e1000_82544:
J
Joe Perches 已提交
1140
		e1000_read_eeprom(hw,
L
Linus Torvalds 已提交
1141 1142 1143 1144 1145
			EEPROM_INIT_CONTROL2_REG, 1, &eeprom_data);
		eeprom_apme_mask = E1000_EEPROM_82544_APM;
		break;
	case e1000_82546:
	case e1000_82546_rev_3:
J
Joe Perches 已提交
1146 1147
		if (er32(STATUS) & E1000_STATUS_FUNC_1){
			e1000_read_eeprom(hw,
L
Linus Torvalds 已提交
1148 1149 1150 1151 1152
				EEPROM_INIT_CONTROL3_PORT_B, 1, &eeprom_data);
			break;
		}
		/* Fall Through */
	default:
J
Joe Perches 已提交
1153
		e1000_read_eeprom(hw,
L
Linus Torvalds 已提交
1154 1155 1156
			EEPROM_INIT_CONTROL3_PORT_A, 1, &eeprom_data);
		break;
	}
J
Jesse Brandeburg 已提交
1157
	if (eeprom_data & eeprom_apme_mask)
1158 1159 1160 1161
		adapter->eeprom_wol |= E1000_WUFC_MAG;

	/* now that we have the eeprom settings, apply the special cases
	 * where the eeprom may be wrong or the board simply won't support
1162 1163
	 * wake on lan on a particular port
	 */
1164 1165 1166 1167 1168 1169 1170
	switch (pdev->device) {
	case E1000_DEV_ID_82546GB_PCIE:
		adapter->eeprom_wol = 0;
		break;
	case E1000_DEV_ID_82546EB_FIBER:
	case E1000_DEV_ID_82546GB_FIBER:
		/* Wake events only supported on port A for dual fiber
1171 1172
		 * regardless of eeprom setting
		 */
J
Joe Perches 已提交
1173
		if (er32(STATUS) & E1000_STATUS_FUNC_1)
1174 1175 1176 1177 1178 1179 1180
			adapter->eeprom_wol = 0;
		break;
	case E1000_DEV_ID_82546GB_QUAD_COPPER_KSP3:
		/* if quad port adapter, disable WoL on all but port A */
		if (global_quad_port_a != 0)
			adapter->eeprom_wol = 0;
		else
1181
			adapter->quad_port_a = true;
1182 1183 1184 1185 1186 1187 1188 1189
		/* Reset for multiple quad port adapters */
		if (++global_quad_port_a == 4)
			global_quad_port_a = 0;
		break;
	}

	/* initialize the wol settings based on the eeprom settings */
	adapter->wol = adapter->eeprom_wol;
1190
	device_set_wakeup_enable(&adapter->pdev->dev, adapter->wol);
L
Linus Torvalds 已提交
1191

1192 1193 1194 1195 1196 1197 1198 1199 1200 1201 1202 1203 1204 1205
	/* Auto detect PHY address */
	if (hw->mac_type == e1000_ce4100) {
		for (i = 0; i < 32; i++) {
			hw->phy_addr = i;
			e1000_read_phy_reg(hw, PHY_ID2, &tmp);
			if (tmp == 0 || tmp == 0xFF) {
				if (i == 31)
					goto err_eeprom;
				continue;
			} else
				break;
		}
	}

1206 1207 1208 1209 1210 1211 1212 1213
	/* reset the hardware with the new settings */
	e1000_reset(adapter);

	strcpy(netdev->name, "eth%d");
	err = register_netdev(netdev);
	if (err)
		goto err_register;

1214
	e1000_vlan_filter_on_off(adapter, false);
J
Jiri Pirko 已提交
1215

1216
	/* print bus type/speed/width info */
1217
	e_info(probe, "(PCI%s:%dMHz:%d-bit) %pM\n",
J
Joe Perches 已提交
1218 1219 1220 1221 1222 1223 1224
	       ((hw->bus_type == e1000_bus_type_pcix) ? "-X" : ""),
	       ((hw->bus_speed == e1000_bus_speed_133) ? 133 :
		(hw->bus_speed == e1000_bus_speed_120) ? 120 :
		(hw->bus_speed == e1000_bus_speed_100) ? 100 :
		(hw->bus_speed == e1000_bus_speed_66) ? 66 : 33),
	       ((hw->bus_width == e1000_bus_width_64) ? 64 : 32),
	       netdev->dev_addr);
A
Auke Kok 已提交
1225

1226 1227 1228
	/* carrier off reporting is important to ethtool even BEFORE open */
	netif_carrier_off(netdev);

1229
	e_info(probe, "Intel(R) PRO/1000 Network Connection\n");
L
Linus Torvalds 已提交
1230 1231 1232 1233 1234

	cards_found++;
	return 0;

err_register:
1235
err_eeprom:
1236
	e1000_phy_hw_reset(hw);
1237

J
Joe Perches 已提交
1238 1239
	if (hw->flash_address)
		iounmap(hw->flash_address);
1240 1241
	kfree(adapter->tx_ring);
	kfree(adapter->rx_ring);
1242
err_dma:
L
Linus Torvalds 已提交
1243
err_sw_init:
1244
err_mdio_ioremap:
1245
	iounmap(hw->ce4100_gbe_mdio_base_virt);
J
Joe Perches 已提交
1246
	iounmap(hw->hw_addr);
L
Linus Torvalds 已提交
1247 1248 1249
err_ioremap:
	free_netdev(netdev);
err_alloc_etherdev:
T
Taku Izumi 已提交
1250
	pci_release_selected_regions(pdev, bars);
1251 1252
err_pci_reg:
	pci_disable_device(pdev);
L
Linus Torvalds 已提交
1253 1254 1255 1256 1257 1258 1259 1260 1261 1262 1263 1264
	return err;
}

/**
 * e1000_remove - Device Removal Routine
 * @pdev: PCI device information struct
 *
 * e1000_remove is called by the PCI subsystem to alert the driver
 * that it should release a PCI device.  The could be caused by a
 * Hot-Plug event, or because the driver is going to be removed from
 * memory.
 **/
1265
static void e1000_remove(struct pci_dev *pdev)
L
Linus Torvalds 已提交
1266 1267
{
	struct net_device *netdev = pci_get_drvdata(pdev);
1268
	struct e1000_adapter *adapter = netdev_priv(netdev);
J
Joe Perches 已提交
1269
	struct e1000_hw *hw = &adapter->hw;
L
Linus Torvalds 已提交
1270

1271
	e1000_down_and_stop(adapter);
1272
	e1000_release_manageability(adapter);
L
Linus Torvalds 已提交
1273

1274 1275
	unregister_netdev(netdev);

1276
	e1000_phy_hw_reset(hw);
L
Linus Torvalds 已提交
1277

1278 1279 1280
	kfree(adapter->tx_ring);
	kfree(adapter->rx_ring);

1281
	if (hw->mac_type == e1000_ce4100)
1282
		iounmap(hw->ce4100_gbe_mdio_base_virt);
J
Joe Perches 已提交
1283 1284 1285
	iounmap(hw->hw_addr);
	if (hw->flash_address)
		iounmap(hw->flash_address);
T
Taku Izumi 已提交
1286
	pci_release_selected_regions(pdev, adapter->bars);
L
Linus Torvalds 已提交
1287 1288 1289 1290 1291 1292 1293 1294 1295 1296 1297

	free_netdev(netdev);

	pci_disable_device(pdev);
}

/**
 * e1000_sw_init - Initialize general software structures (struct e1000_adapter)
 * @adapter: board private structure to initialize
 *
 * e1000_sw_init initializes the Adapter private data structure.
1298
 * e1000_init_hw_struct MUST be called before this function
L
Linus Torvalds 已提交
1299
 **/
1300
static int e1000_sw_init(struct e1000_adapter *adapter)
L
Linus Torvalds 已提交
1301
{
1302
	adapter->rx_buffer_len = MAXIMUM_ETHERNET_VLAN_SIZE;
L
Linus Torvalds 已提交
1303

1304 1305
	adapter->num_tx_queues = 1;
	adapter->num_rx_queues = 1;
1306 1307

	if (e1000_alloc_queues(adapter)) {
1308
		e_err(probe, "Unable to allocate memory for queues\n");
1309 1310 1311
		return -ENOMEM;
	}

1312 1313 1314
	/* Explicitly disable IRQ since the NIC can be in any state. */
	e1000_irq_disable(adapter);

L
Linus Torvalds 已提交
1315 1316
	spin_lock_init(&adapter->stats_lock);

A
Auke Kok 已提交
1317 1318
	set_bit(__E1000_DOWN, &adapter->flags);

L
Linus Torvalds 已提交
1319 1320 1321
	return 0;
}

1322 1323 1324 1325 1326
/**
 * e1000_alloc_queues - Allocate memory for all rings
 * @adapter: board private structure to initialize
 *
 * We allocate one ring per queue at run-time since we don't know the
1327
 * number of queues at compile-time.
1328
 **/
1329
static int e1000_alloc_queues(struct e1000_adapter *adapter)
1330
{
Y
Yan Burman 已提交
1331 1332
	adapter->tx_ring = kcalloc(adapter->num_tx_queues,
	                           sizeof(struct e1000_tx_ring), GFP_KERNEL);
1333 1334 1335
	if (!adapter->tx_ring)
		return -ENOMEM;

Y
Yan Burman 已提交
1336 1337
	adapter->rx_ring = kcalloc(adapter->num_rx_queues,
	                           sizeof(struct e1000_rx_ring), GFP_KERNEL);
1338 1339 1340 1341 1342 1343 1344 1345
	if (!adapter->rx_ring) {
		kfree(adapter->tx_ring);
		return -ENOMEM;
	}

	return E1000_SUCCESS;
}

L
Linus Torvalds 已提交
1346 1347 1348 1349 1350 1351 1352 1353 1354
/**
 * e1000_open - Called when a network interface is made active
 * @netdev: network interface device structure
 *
 * Returns 0 on success, negative value on failure
 *
 * The open entry point is called when a network interface is made
 * active by the system (IFF_UP).  At this point all resources needed
 * for transmit and receive operations are allocated, the interrupt
1355
 * handler is registered with the OS, the watchdog task is started,
L
Linus Torvalds 已提交
1356 1357
 * and the stack is notified that the interface is ready.
 **/
1358
static int e1000_open(struct net_device *netdev)
L
Linus Torvalds 已提交
1359
{
1360
	struct e1000_adapter *adapter = netdev_priv(netdev);
J
Joe Perches 已提交
1361
	struct e1000_hw *hw = &adapter->hw;
L
Linus Torvalds 已提交
1362 1363
	int err;

1364
	/* disallow open during test */
A
Auke Kok 已提交
1365
	if (test_bit(__E1000_TESTING, &adapter->flags))
1366 1367
		return -EBUSY;

1368 1369
	netif_carrier_off(netdev);

L
Linus Torvalds 已提交
1370
	/* allocate transmit descriptors */
1371 1372
	err = e1000_setup_all_tx_resources(adapter);
	if (err)
L
Linus Torvalds 已提交
1373 1374 1375
		goto err_setup_tx;

	/* allocate receive descriptors */
1376
	err = e1000_setup_all_rx_resources(adapter);
1377
	if (err)
1378
		goto err_setup_rx;
1379

1380 1381
	e1000_power_up_phy(adapter);

1382
	adapter->mng_vlan_id = E1000_MNG_VLAN_NONE;
J
Joe Perches 已提交
1383
	if ((hw->mng_cookie.status &
1384 1385 1386
			  E1000_MNG_DHCP_COOKIE_STATUS_VLAN_SUPPORT)) {
		e1000_update_mng_vlan(adapter);
	}
L
Linus Torvalds 已提交
1387

1388 1389 1390
	/* before we allocate an interrupt, we must be ready to handle it.
	 * Setting DEBUG_SHIRQ in the kernel makes it fire an interrupt
	 * as soon as we call pci_request_irq, so we have to setup our
1391 1392
	 * clean_rx handler before we do so.
	 */
1393 1394 1395 1396 1397 1398 1399 1400 1401
	e1000_configure(adapter);

	err = e1000_request_irq(adapter);
	if (err)
		goto err_req_irq;

	/* From here on the code is the same as e1000_up() */
	clear_bit(__E1000_DOWN, &adapter->flags);

1402
	napi_enable(&adapter->napi);
1403

1404 1405
	e1000_irq_enable(adapter);

B
Ben Hutchings 已提交
1406 1407
	netif_start_queue(netdev);

1408
	/* fire a link status change interrupt to start the watchdog */
J
Joe Perches 已提交
1409
	ew32(ICS, E1000_ICS_LSC);
1410

L
Linus Torvalds 已提交
1411 1412
	return E1000_SUCCESS;

1413
err_req_irq:
1414
	e1000_power_down_phy(adapter);
1415
	e1000_free_all_rx_resources(adapter);
L
Linus Torvalds 已提交
1416
err_setup_rx:
1417
	e1000_free_all_tx_resources(adapter);
L
Linus Torvalds 已提交
1418 1419 1420 1421 1422 1423 1424 1425 1426 1427 1428 1429 1430 1431 1432 1433 1434
err_setup_tx:
	e1000_reset(adapter);

	return err;
}

/**
 * e1000_close - Disables a network interface
 * @netdev: network interface device structure
 *
 * Returns 0, this is not allowed to fail
 *
 * The close entry point is called when an interface is de-activated
 * by the OS.  The hardware is still under the drivers control, but
 * needs to be disabled.  A global MAC reset is issued to stop the
 * hardware, and all transmit and receive resources are freed.
 **/
1435
static int e1000_close(struct net_device *netdev)
L
Linus Torvalds 已提交
1436
{
1437
	struct e1000_adapter *adapter = netdev_priv(netdev);
J
Joe Perches 已提交
1438
	struct e1000_hw *hw = &adapter->hw;
1439 1440 1441 1442
	int count = E1000_CHECK_RESET_COUNT;

	while (test_bit(__E1000_RESETTING, &adapter->flags) && count--)
		usleep_range(10000, 20000);
L
Linus Torvalds 已提交
1443

1444
	WARN_ON(test_bit(__E1000_RESETTING, &adapter->flags));
L
Linus Torvalds 已提交
1445
	e1000_down(adapter);
1446
	e1000_power_down_phy(adapter);
1447
	e1000_free_irq(adapter);
L
Linus Torvalds 已提交
1448

1449 1450
	e1000_free_all_tx_resources(adapter);
	e1000_free_all_rx_resources(adapter);
L
Linus Torvalds 已提交
1451

1452
	/* kill manageability vlan ID if supported, but not if a vlan with
1453 1454
	 * the same ID is registered on the host OS (let 8021q kill it)
	 */
J
Joe Perches 已提交
1455
	if ((hw->mng_cookie.status &
1456 1457
	     E1000_MNG_DHCP_COOKIE_STATUS_VLAN_SUPPORT) &&
	    !test_bit(adapter->mng_vlan_id, adapter->active_vlans)) {
1458 1459
		e1000_vlan_rx_kill_vid(netdev, htons(ETH_P_8021Q),
				       adapter->mng_vlan_id);
1460
	}
1461

L
Linus Torvalds 已提交
1462 1463 1464 1465 1466 1467
	return 0;
}

/**
 * e1000_check_64k_bound - check that memory doesn't cross 64kB boundary
 * @adapter: address of board private structure
1468 1469
 * @start: address of beginning of memory
 * @len: length of memory
L
Linus Torvalds 已提交
1470
 **/
1471 1472
static bool e1000_check_64k_bound(struct e1000_adapter *adapter, void *start,
				  unsigned long len)
L
Linus Torvalds 已提交
1473
{
J
Joe Perches 已提交
1474
	struct e1000_hw *hw = &adapter->hw;
1475
	unsigned long begin = (unsigned long)start;
L
Linus Torvalds 已提交
1476 1477
	unsigned long end = begin + len;

1478
	/* First rev 82545 and 82546 need to not allow any memory
1479 1480
	 * write location to cross 64k boundary due to errata 23
	 */
J
Joe Perches 已提交
1481
	if (hw->mac_type == e1000_82545 ||
1482
	    hw->mac_type == e1000_ce4100 ||
J
Joe Perches 已提交
1483
	    hw->mac_type == e1000_82546) {
J
Joe Perches 已提交
1484
		return ((begin ^ (end - 1)) >> 16) != 0 ? false : true;
L
Linus Torvalds 已提交
1485 1486
	}

J
Joe Perches 已提交
1487
	return true;
L
Linus Torvalds 已提交
1488 1489 1490 1491 1492
}

/**
 * e1000_setup_tx_resources - allocate Tx resources (Descriptors)
 * @adapter: board private structure
1493
 * @txdr:    tx descriptor ring (for a specific queue) to setup
L
Linus Torvalds 已提交
1494 1495 1496
 *
 * Return 0 on success, negative on failure
 **/
1497 1498
static int e1000_setup_tx_resources(struct e1000_adapter *adapter,
				    struct e1000_tx_ring *txdr)
L
Linus Torvalds 已提交
1499 1500 1501 1502
{
	struct pci_dev *pdev = adapter->pdev;
	int size;

1503
	size = sizeof(struct e1000_tx_buffer) * txdr->count;
E
Eric Dumazet 已提交
1504
	txdr->buffer_info = vzalloc(size);
1505
	if (!txdr->buffer_info)
L
Linus Torvalds 已提交
1506 1507 1508 1509 1510
		return -ENOMEM;

	/* round up to nearest 4K */

	txdr->size = txdr->count * sizeof(struct e1000_tx_desc);
1511
	txdr->size = ALIGN(txdr->size, 4096);
L
Linus Torvalds 已提交
1512

1513 1514
	txdr->desc = dma_alloc_coherent(&pdev->dev, txdr->size, &txdr->dma,
					GFP_KERNEL);
J
Jesse Brandeburg 已提交
1515
	if (!txdr->desc) {
L
Linus Torvalds 已提交
1516 1517 1518 1519 1520
setup_tx_desc_die:
		vfree(txdr->buffer_info);
		return -ENOMEM;
	}

1521
	/* Fix for errata 23, can't cross 64kB boundary */
L
Linus Torvalds 已提交
1522 1523 1524
	if (!e1000_check_64k_bound(adapter, txdr->desc, txdr->size)) {
		void *olddesc = txdr->desc;
		dma_addr_t olddma = txdr->dma;
1525
		e_err(tx_err, "txdr align check failed: %u bytes at %p\n",
1526
		      txdr->size, txdr->desc);
1527
		/* Try again, without freeing the previous */
1528 1529
		txdr->desc = dma_alloc_coherent(&pdev->dev, txdr->size,
						&txdr->dma, GFP_KERNEL);
1530
		/* Failed allocation, critical failure */
J
Jesse Brandeburg 已提交
1531
		if (!txdr->desc) {
1532 1533
			dma_free_coherent(&pdev->dev, txdr->size, olddesc,
					  olddma);
L
Linus Torvalds 已提交
1534 1535 1536 1537 1538
			goto setup_tx_desc_die;
		}

		if (!e1000_check_64k_bound(adapter, txdr->desc, txdr->size)) {
			/* give up */
1539 1540 1541 1542
			dma_free_coherent(&pdev->dev, txdr->size, txdr->desc,
					  txdr->dma);
			dma_free_coherent(&pdev->dev, txdr->size, olddesc,
					  olddma);
1543
			e_err(probe, "Unable to allocate aligned memory "
1544
			      "for the transmit descriptor ring\n");
L
Linus Torvalds 已提交
1545 1546 1547
			vfree(txdr->buffer_info);
			return -ENOMEM;
		} else {
1548
			/* Free old allocation, new allocation was successful */
1549 1550
			dma_free_coherent(&pdev->dev, txdr->size, olddesc,
					  olddma);
L
Linus Torvalds 已提交
1551 1552 1553 1554 1555 1556 1557 1558 1559 1560
		}
	}
	memset(txdr->desc, 0, txdr->size);

	txdr->next_to_use = 0;
	txdr->next_to_clean = 0;

	return 0;
}

1561 1562 1563 1564 1565 1566 1567
/**
 * e1000_setup_all_tx_resources - wrapper to allocate Tx resources
 * 				  (Descriptors) for all queues
 * @adapter: board private structure
 *
 * Return 0 on success, negative on failure
 **/
1568
int e1000_setup_all_tx_resources(struct e1000_adapter *adapter)
1569 1570 1571
{
	int i, err = 0;

1572
	for (i = 0; i < adapter->num_tx_queues; i++) {
1573 1574
		err = e1000_setup_tx_resources(adapter, &adapter->tx_ring[i]);
		if (err) {
1575
			e_err(probe, "Allocation for Tx Queue %u failed\n", i);
1576 1577 1578
			for (i-- ; i >= 0; i--)
				e1000_free_tx_resources(adapter,
							&adapter->tx_ring[i]);
1579 1580 1581 1582 1583 1584 1585
			break;
		}
	}

	return err;
}

L
Linus Torvalds 已提交
1586 1587 1588 1589 1590 1591
/**
 * e1000_configure_tx - Configure 8254x Transmit Unit after Reset
 * @adapter: board private structure
 *
 * Configure the Tx unit of the MAC after a reset.
 **/
1592
static void e1000_configure_tx(struct e1000_adapter *adapter)
L
Linus Torvalds 已提交
1593
{
1594
	u64 tdba;
1595
	struct e1000_hw *hw = &adapter->hw;
1596
	u32 tdlen, tctl, tipg;
1597
	u32 ipgr1, ipgr2;
L
Linus Torvalds 已提交
1598 1599 1600

	/* Setup the HW Tx Head and Tail descriptor pointers */

1601
	switch (adapter->num_tx_queues) {
1602 1603
	case 1:
	default:
1604 1605 1606
		tdba = adapter->tx_ring[0].dma;
		tdlen = adapter->tx_ring[0].count *
			sizeof(struct e1000_tx_desc);
J
Joe Perches 已提交
1607 1608 1609 1610 1611
		ew32(TDLEN, tdlen);
		ew32(TDBAH, (tdba >> 32));
		ew32(TDBAL, (tdba & 0x00000000ffffffffULL));
		ew32(TDT, 0);
		ew32(TDH, 0);
1612 1613 1614 1615
		adapter->tx_ring[0].tdh = ((hw->mac_type >= e1000_82543) ?
					   E1000_TDH : E1000_82542_TDH);
		adapter->tx_ring[0].tdt = ((hw->mac_type >= e1000_82543) ?
					   E1000_TDT : E1000_82542_TDT);
1616 1617
		break;
	}
L
Linus Torvalds 已提交
1618 1619

	/* Set the default values for the Tx Inter Packet Gap timer */
1620
	if ((hw->media_type == e1000_media_type_fiber ||
1621
	     hw->media_type == e1000_media_type_internal_serdes))
1622 1623 1624 1625
		tipg = DEFAULT_82543_TIPG_IPGT_FIBER;
	else
		tipg = DEFAULT_82543_TIPG_IPGT_COPPER;

1626
	switch (hw->mac_type) {
L
Linus Torvalds 已提交
1627 1628 1629
	case e1000_82542_rev2_0:
	case e1000_82542_rev2_1:
		tipg = DEFAULT_82542_TIPG_IPGT;
1630 1631
		ipgr1 = DEFAULT_82542_TIPG_IPGR1;
		ipgr2 = DEFAULT_82542_TIPG_IPGR2;
L
Linus Torvalds 已提交
1632 1633
		break;
	default:
1634 1635 1636
		ipgr1 = DEFAULT_82543_TIPG_IPGR1;
		ipgr2 = DEFAULT_82543_TIPG_IPGR2;
		break;
L
Linus Torvalds 已提交
1637
	}
1638 1639
	tipg |= ipgr1 << E1000_TIPG_IPGR1_SHIFT;
	tipg |= ipgr2 << E1000_TIPG_IPGR2_SHIFT;
J
Joe Perches 已提交
1640
	ew32(TIPG, tipg);
L
Linus Torvalds 已提交
1641 1642 1643

	/* Set the Tx Interrupt Delay register */

J
Joe Perches 已提交
1644
	ew32(TIDV, adapter->tx_int_delay);
1645
	if (hw->mac_type >= e1000_82540)
J
Joe Perches 已提交
1646
		ew32(TADV, adapter->tx_abs_int_delay);
L
Linus Torvalds 已提交
1647 1648 1649

	/* Program the Transmit Control Register */

J
Joe Perches 已提交
1650
	tctl = er32(TCTL);
L
Linus Torvalds 已提交
1651
	tctl &= ~E1000_TCTL_CT;
1652
	tctl |= E1000_TCTL_PSP | E1000_TCTL_RTLC |
L
Linus Torvalds 已提交
1653 1654
		(E1000_COLLISION_THRESHOLD << E1000_CT_SHIFT);

1655
	e1000_config_collision_dist(hw);
L
Linus Torvalds 已提交
1656 1657

	/* Setup Transmit Descriptor Settings for eop descriptor */
1658 1659 1660 1661 1662
	adapter->txd_cmd = E1000_TXD_CMD_EOP | E1000_TXD_CMD_IFCS;

	/* only set IDE if we are delaying interrupts using the timers */
	if (adapter->tx_int_delay)
		adapter->txd_cmd |= E1000_TXD_CMD_IDE;
L
Linus Torvalds 已提交
1663

1664
	if (hw->mac_type < e1000_82543)
L
Linus Torvalds 已提交
1665 1666 1667 1668 1669
		adapter->txd_cmd |= E1000_TXD_CMD_RPS;
	else
		adapter->txd_cmd |= E1000_TXD_CMD_RS;

	/* Cache if we're 82544 running in PCI-X because we'll
1670 1671
	 * need this to apply a workaround later in the send path.
	 */
1672 1673
	if (hw->mac_type == e1000_82544 &&
	    hw->bus_type == e1000_bus_type_pcix)
1674
		adapter->pcix_82544 = true;
1675

J
Joe Perches 已提交
1676
	ew32(TCTL, tctl);
1677

L
Linus Torvalds 已提交
1678 1679 1680 1681 1682
}

/**
 * e1000_setup_rx_resources - allocate Rx resources (Descriptors)
 * @adapter: board private structure
1683
 * @rxdr:    rx descriptor ring (for a specific queue) to setup
L
Linus Torvalds 已提交
1684 1685 1686
 *
 * Returns 0 on success, negative on failure
 **/
1687 1688
static int e1000_setup_rx_resources(struct e1000_adapter *adapter,
				    struct e1000_rx_ring *rxdr)
L
Linus Torvalds 已提交
1689 1690
{
	struct pci_dev *pdev = adapter->pdev;
1691
	int size, desc_len;
L
Linus Torvalds 已提交
1692

1693
	size = sizeof(struct e1000_rx_buffer) * rxdr->count;
E
Eric Dumazet 已提交
1694
	rxdr->buffer_info = vzalloc(size);
1695
	if (!rxdr->buffer_info)
L
Linus Torvalds 已提交
1696 1697
		return -ENOMEM;

1698
	desc_len = sizeof(struct e1000_rx_desc);
1699

L
Linus Torvalds 已提交
1700 1701
	/* Round up to nearest 4K */

1702
	rxdr->size = rxdr->count * desc_len;
1703
	rxdr->size = ALIGN(rxdr->size, 4096);
L
Linus Torvalds 已提交
1704

1705 1706
	rxdr->desc = dma_alloc_coherent(&pdev->dev, rxdr->size, &rxdr->dma,
					GFP_KERNEL);
1707
	if (!rxdr->desc) {
L
Linus Torvalds 已提交
1708 1709 1710 1711 1712
setup_rx_desc_die:
		vfree(rxdr->buffer_info);
		return -ENOMEM;
	}

1713
	/* Fix for errata 23, can't cross 64kB boundary */
L
Linus Torvalds 已提交
1714 1715 1716
	if (!e1000_check_64k_bound(adapter, rxdr->desc, rxdr->size)) {
		void *olddesc = rxdr->desc;
		dma_addr_t olddma = rxdr->dma;
1717
		e_err(rx_err, "rxdr align check failed: %u bytes at %p\n",
1718
		      rxdr->size, rxdr->desc);
1719
		/* Try again, without freeing the previous */
1720 1721
		rxdr->desc = dma_alloc_coherent(&pdev->dev, rxdr->size,
						&rxdr->dma, GFP_KERNEL);
1722
		/* Failed allocation, critical failure */
1723
		if (!rxdr->desc) {
1724 1725
			dma_free_coherent(&pdev->dev, rxdr->size, olddesc,
					  olddma);
L
Linus Torvalds 已提交
1726 1727 1728 1729 1730
			goto setup_rx_desc_die;
		}

		if (!e1000_check_64k_bound(adapter, rxdr->desc, rxdr->size)) {
			/* give up */
1731 1732 1733 1734
			dma_free_coherent(&pdev->dev, rxdr->size, rxdr->desc,
					  rxdr->dma);
			dma_free_coherent(&pdev->dev, rxdr->size, olddesc,
					  olddma);
1735 1736
			e_err(probe, "Unable to allocate aligned memory for "
			      "the Rx descriptor ring\n");
1737
			goto setup_rx_desc_die;
L
Linus Torvalds 已提交
1738
		} else {
1739
			/* Free old allocation, new allocation was successful */
1740 1741
			dma_free_coherent(&pdev->dev, rxdr->size, olddesc,
					  olddma);
L
Linus Torvalds 已提交
1742 1743 1744 1745 1746 1747
		}
	}
	memset(rxdr->desc, 0, rxdr->size);

	rxdr->next_to_clean = 0;
	rxdr->next_to_use = 0;
1748
	rxdr->rx_skb_top = NULL;
L
Linus Torvalds 已提交
1749 1750 1751 1752

	return 0;
}

1753 1754 1755 1756 1757 1758 1759
/**
 * e1000_setup_all_rx_resources - wrapper to allocate Rx resources
 * 				  (Descriptors) for all queues
 * @adapter: board private structure
 *
 * Return 0 on success, negative on failure
 **/
1760
int e1000_setup_all_rx_resources(struct e1000_adapter *adapter)
1761 1762 1763
{
	int i, err = 0;

1764
	for (i = 0; i < adapter->num_rx_queues; i++) {
1765 1766
		err = e1000_setup_rx_resources(adapter, &adapter->rx_ring[i]);
		if (err) {
1767
			e_err(probe, "Allocation for Rx Queue %u failed\n", i);
1768 1769 1770
			for (i-- ; i >= 0; i--)
				e1000_free_rx_resources(adapter,
							&adapter->rx_ring[i]);
1771 1772 1773 1774 1775 1776 1777
			break;
		}
	}

	return err;
}

L
Linus Torvalds 已提交
1778
/**
1779
 * e1000_setup_rctl - configure the receive control registers
L
Linus Torvalds 已提交
1780 1781
 * @adapter: Board private structure
 **/
1782
static void e1000_setup_rctl(struct e1000_adapter *adapter)
L
Linus Torvalds 已提交
1783
{
J
Joe Perches 已提交
1784
	struct e1000_hw *hw = &adapter->hw;
1785
	u32 rctl;
L
Linus Torvalds 已提交
1786

J
Joe Perches 已提交
1787
	rctl = er32(RCTL);
L
Linus Torvalds 已提交
1788 1789 1790

	rctl &= ~(3 << E1000_RCTL_MO_SHIFT);

1791 1792
	rctl |= E1000_RCTL_BAM | E1000_RCTL_LBM_NO |
		E1000_RCTL_RDMTS_HALF |
J
Joe Perches 已提交
1793
		(hw->mc_filter_type << E1000_RCTL_MO_SHIFT);
L
Linus Torvalds 已提交
1794

J
Joe Perches 已提交
1795
	if (hw->tbi_compatibility_on == 1)
L
Linus Torvalds 已提交
1796 1797 1798 1799
		rctl |= E1000_RCTL_SBP;
	else
		rctl &= ~E1000_RCTL_SBP;

1800 1801 1802 1803 1804
	if (adapter->netdev->mtu <= ETH_DATA_LEN)
		rctl &= ~E1000_RCTL_LPE;
	else
		rctl |= E1000_RCTL_LPE;

L
Linus Torvalds 已提交
1805
	/* Setup buffer sizes */
1806 1807 1808
	rctl &= ~E1000_RCTL_SZ_4096;
	rctl |= E1000_RCTL_BSEX;
	switch (adapter->rx_buffer_len) {
1809 1810 1811 1812 1813 1814 1815 1816 1817 1818 1819 1820 1821 1822
		case E1000_RXBUFFER_2048:
		default:
			rctl |= E1000_RCTL_SZ_2048;
			rctl &= ~E1000_RCTL_BSEX;
			break;
		case E1000_RXBUFFER_4096:
			rctl |= E1000_RCTL_SZ_4096;
			break;
		case E1000_RXBUFFER_8192:
			rctl |= E1000_RCTL_SZ_8192;
			break;
		case E1000_RXBUFFER_16384:
			rctl |= E1000_RCTL_SZ_16384;
			break;
1823 1824
	}

B
Ben Greear 已提交
1825 1826 1827
	/* This is useful for sniffing bad packets. */
	if (adapter->netdev->features & NETIF_F_RXALL) {
		/* UPE and MPE will be handled by normal PROMISC logic
1828 1829
		 * in e1000e_set_rx_mode
		 */
B
Ben Greear 已提交
1830 1831 1832 1833 1834 1835 1836 1837 1838 1839 1840 1841
		rctl |= (E1000_RCTL_SBP | /* Receive bad packets */
			 E1000_RCTL_BAM | /* RX All Bcast Pkts */
			 E1000_RCTL_PMCF); /* RX All MAC Ctrl Pkts */

		rctl &= ~(E1000_RCTL_VFE | /* Disable VLAN filter */
			  E1000_RCTL_DPF | /* Allow filtered pause */
			  E1000_RCTL_CFIEN); /* Dis VLAN CFIEN Filter */
		/* Do not mess with E1000_CTRL_VME, it affects transmit as well,
		 * and that breaks VLANs.
		 */
	}

J
Joe Perches 已提交
1842
	ew32(RCTL, rctl);
L
Linus Torvalds 已提交
1843 1844 1845 1846 1847 1848 1849 1850
}

/**
 * e1000_configure_rx - Configure 8254x Receive Unit after Reset
 * @adapter: board private structure
 *
 * Configure the Rx unit of the MAC after a reset.
 **/
1851
static void e1000_configure_rx(struct e1000_adapter *adapter)
L
Linus Torvalds 已提交
1852
{
1853
	u64 rdba;
1854
	struct e1000_hw *hw = &adapter->hw;
1855
	u32 rdlen, rctl, rxcsum;
1856

1857 1858 1859 1860 1861 1862 1863 1864 1865 1866 1867
	if (adapter->netdev->mtu > ETH_DATA_LEN) {
		rdlen = adapter->rx_ring[0].count *
		        sizeof(struct e1000_rx_desc);
		adapter->clean_rx = e1000_clean_jumbo_rx_irq;
		adapter->alloc_rx_buf = e1000_alloc_jumbo_rx_buffers;
	} else {
		rdlen = adapter->rx_ring[0].count *
		        sizeof(struct e1000_rx_desc);
		adapter->clean_rx = e1000_clean_rx_irq;
		adapter->alloc_rx_buf = e1000_alloc_rx_buffers;
	}
L
Linus Torvalds 已提交
1868 1869

	/* disable receives while setting up the descriptors */
J
Joe Perches 已提交
1870 1871
	rctl = er32(RCTL);
	ew32(RCTL, rctl & ~E1000_RCTL_EN);
L
Linus Torvalds 已提交
1872 1873

	/* set the Receive Delay Timer Register */
J
Joe Perches 已提交
1874
	ew32(RDTR, adapter->rx_int_delay);
L
Linus Torvalds 已提交
1875

1876
	if (hw->mac_type >= e1000_82540) {
J
Joe Perches 已提交
1877
		ew32(RADV, adapter->rx_abs_int_delay);
J
Jesse Brandeburg 已提交
1878
		if (adapter->itr_setting != 0)
J
Joe Perches 已提交
1879
			ew32(ITR, 1000000000 / (adapter->itr * 256));
L
Linus Torvalds 已提交
1880 1881
	}

1882
	/* Setup the HW Rx Head and Tail Descriptor Pointers and
1883 1884
	 * the Base and Length of the Rx Descriptor Ring
	 */
1885
	switch (adapter->num_rx_queues) {
1886 1887
	case 1:
	default:
1888
		rdba = adapter->rx_ring[0].dma;
J
Joe Perches 已提交
1889 1890 1891 1892 1893
		ew32(RDLEN, rdlen);
		ew32(RDBAH, (rdba >> 32));
		ew32(RDBAL, (rdba & 0x00000000ffffffffULL));
		ew32(RDT, 0);
		ew32(RDH, 0);
1894 1895 1896 1897
		adapter->rx_ring[0].rdh = ((hw->mac_type >= e1000_82543) ?
					   E1000_RDH : E1000_82542_RDH);
		adapter->rx_ring[0].rdt = ((hw->mac_type >= e1000_82543) ?
					   E1000_RDT : E1000_82542_RDT);
1898
		break;
1899 1900
	}

L
Linus Torvalds 已提交
1901
	/* Enable 82543 Receive Checksum Offload for TCP and UDP */
1902
	if (hw->mac_type >= e1000_82543) {
J
Joe Perches 已提交
1903
		rxcsum = er32(RXCSUM);
1904
		if (adapter->rx_csum)
1905
			rxcsum |= E1000_RXCSUM_TUOFL;
1906
		else
1907
			/* don't need to clear IPPCSE as it defaults to 0 */
1908
			rxcsum &= ~E1000_RXCSUM_TUOFL;
J
Joe Perches 已提交
1909
		ew32(RXCSUM, rxcsum);
L
Linus Torvalds 已提交
1910 1911 1912
	}

	/* Enable Receives */
1913
	ew32(RCTL, rctl | E1000_RCTL_EN);
L
Linus Torvalds 已提交
1914 1915 1916
}

/**
1917
 * e1000_free_tx_resources - Free Tx Resources per Queue
L
Linus Torvalds 已提交
1918
 * @adapter: board private structure
1919
 * @tx_ring: Tx descriptor ring for a specific queue
L
Linus Torvalds 已提交
1920 1921 1922
 *
 * Free all transmit software resources
 **/
1923 1924
static void e1000_free_tx_resources(struct e1000_adapter *adapter,
				    struct e1000_tx_ring *tx_ring)
L
Linus Torvalds 已提交
1925 1926 1927
{
	struct pci_dev *pdev = adapter->pdev;

1928
	e1000_clean_tx_ring(adapter, tx_ring);
L
Linus Torvalds 已提交
1929

1930 1931
	vfree(tx_ring->buffer_info);
	tx_ring->buffer_info = NULL;
L
Linus Torvalds 已提交
1932

1933 1934
	dma_free_coherent(&pdev->dev, tx_ring->size, tx_ring->desc,
			  tx_ring->dma);
L
Linus Torvalds 已提交
1935

1936 1937 1938 1939 1940 1941 1942 1943 1944
	tx_ring->desc = NULL;
}

/**
 * e1000_free_all_tx_resources - Free Tx Resources for All Queues
 * @adapter: board private structure
 *
 * Free all transmit software resources
 **/
1945
void e1000_free_all_tx_resources(struct e1000_adapter *adapter)
1946 1947 1948
{
	int i;

1949
	for (i = 0; i < adapter->num_tx_queues; i++)
1950
		e1000_free_tx_resources(adapter, &adapter->tx_ring[i]);
L
Linus Torvalds 已提交
1951 1952
}

1953 1954 1955
static void
e1000_unmap_and_free_tx_resource(struct e1000_adapter *adapter,
				 struct e1000_tx_buffer *buffer_info)
L
Linus Torvalds 已提交
1956
{
1957 1958
	if (buffer_info->dma) {
		if (buffer_info->mapped_as_page)
1959 1960
			dma_unmap_page(&adapter->pdev->dev, buffer_info->dma,
				       buffer_info->length, DMA_TO_DEVICE);
1961
		else
1962
			dma_unmap_single(&adapter->pdev->dev, buffer_info->dma,
1963
					 buffer_info->length,
1964
					 DMA_TO_DEVICE);
1965 1966
		buffer_info->dma = 0;
	}
1967
	if (buffer_info->skb) {
L
Linus Torvalds 已提交
1968
		dev_kfree_skb_any(buffer_info->skb);
1969 1970
		buffer_info->skb = NULL;
	}
1971
	buffer_info->time_stamp = 0;
1972
	/* buffer_info must be completely set up in the transmit path */
L
Linus Torvalds 已提交
1973 1974 1975 1976 1977
}

/**
 * e1000_clean_tx_ring - Free Tx Buffers
 * @adapter: board private structure
1978
 * @tx_ring: ring to be cleaned
L
Linus Torvalds 已提交
1979
 **/
1980 1981
static void e1000_clean_tx_ring(struct e1000_adapter *adapter,
				struct e1000_tx_ring *tx_ring)
L
Linus Torvalds 已提交
1982
{
J
Joe Perches 已提交
1983
	struct e1000_hw *hw = &adapter->hw;
1984
	struct e1000_tx_buffer *buffer_info;
L
Linus Torvalds 已提交
1985 1986 1987 1988 1989
	unsigned long size;
	unsigned int i;

	/* Free all the Tx ring sk_buffs */

J
Jesse Brandeburg 已提交
1990
	for (i = 0; i < tx_ring->count; i++) {
L
Linus Torvalds 已提交
1991 1992 1993 1994
		buffer_info = &tx_ring->buffer_info[i];
		e1000_unmap_and_free_tx_resource(adapter, buffer_info);
	}

1995
	netdev_reset_queue(adapter->netdev);
1996
	size = sizeof(struct e1000_tx_buffer) * tx_ring->count;
L
Linus Torvalds 已提交
1997 1998 1999 2000 2001 2002 2003 2004
	memset(tx_ring->buffer_info, 0, size);

	/* Zero out the descriptor ring */

	memset(tx_ring->desc, 0, tx_ring->size);

	tx_ring->next_to_use = 0;
	tx_ring->next_to_clean = 0;
2005
	tx_ring->last_tx_tso = false;
L
Linus Torvalds 已提交
2006

J
Joe Perches 已提交
2007 2008
	writel(0, hw->hw_addr + tx_ring->tdh);
	writel(0, hw->hw_addr + tx_ring->tdt);
2009 2010 2011 2012 2013 2014
}

/**
 * e1000_clean_all_tx_rings - Free Tx Buffers for all queues
 * @adapter: board private structure
 **/
2015
static void e1000_clean_all_tx_rings(struct e1000_adapter *adapter)
2016 2017 2018
{
	int i;

2019
	for (i = 0; i < adapter->num_tx_queues; i++)
2020
		e1000_clean_tx_ring(adapter, &adapter->tx_ring[i]);
L
Linus Torvalds 已提交
2021 2022 2023 2024 2025
}

/**
 * e1000_free_rx_resources - Free Rx Resources
 * @adapter: board private structure
2026
 * @rx_ring: ring to clean the resources from
L
Linus Torvalds 已提交
2027 2028 2029
 *
 * Free all receive software resources
 **/
2030 2031
static void e1000_free_rx_resources(struct e1000_adapter *adapter,
				    struct e1000_rx_ring *rx_ring)
L
Linus Torvalds 已提交
2032 2033 2034
{
	struct pci_dev *pdev = adapter->pdev;

2035
	e1000_clean_rx_ring(adapter, rx_ring);
L
Linus Torvalds 已提交
2036 2037 2038 2039

	vfree(rx_ring->buffer_info);
	rx_ring->buffer_info = NULL;

2040 2041
	dma_free_coherent(&pdev->dev, rx_ring->size, rx_ring->desc,
			  rx_ring->dma);
L
Linus Torvalds 已提交
2042 2043 2044 2045 2046

	rx_ring->desc = NULL;
}

/**
2047
 * e1000_free_all_rx_resources - Free Rx Resources for All Queues
L
Linus Torvalds 已提交
2048
 * @adapter: board private structure
2049 2050 2051
 *
 * Free all receive software resources
 **/
2052
void e1000_free_all_rx_resources(struct e1000_adapter *adapter)
2053 2054 2055
{
	int i;

2056
	for (i = 0; i < adapter->num_rx_queues; i++)
2057 2058 2059
		e1000_free_rx_resources(adapter, &adapter->rx_ring[i]);
}

F
Florian Westphal 已提交
2060 2061 2062 2063 2064 2065 2066 2067 2068 2069 2070 2071 2072 2073 2074 2075 2076 2077 2078 2079 2080 2081
/* Bytes skipped at the start of each Rx fragment before the packet data */
#define E1000_HEADROOM (NET_SKB_PAD + NET_IP_ALIGN)

/* Size of one Rx fragment: the aligned headroom plus receive buffer,
 * followed by an aligned struct skb_shared_info.
 */
static unsigned int e1000_frag_len(const struct e1000_adapter *a)
{
	unsigned int data_len = SKB_DATA_ALIGN(a->rx_buffer_len +
					       E1000_HEADROOM);
	unsigned int shinfo_len = SKB_DATA_ALIGN(sizeof(struct skb_shared_info));

	return data_len + shinfo_len;
}

static void *e1000_alloc_frag(const struct e1000_adapter *a)
{
	unsigned int len = e1000_frag_len(a);
	u8 *data = netdev_alloc_frag(len);

	if (likely(data))
		data += E1000_HEADROOM;
	return data;
}

/* Drop one reference on the head page that backs @data */
static void e1000_free_frag(const void *data)
{
	struct page *head = virt_to_head_page(data);

	put_page(head);
}

2082 2083 2084 2085
/**
 * e1000_clean_rx_ring - Free Rx Buffers per Queue
 * @adapter: board private structure
 * @rx_ring: ring to free buffers from
L
Linus Torvalds 已提交
2086
 **/
2087 2088
static void e1000_clean_rx_ring(struct e1000_adapter *adapter,
				struct e1000_rx_ring *rx_ring)
L
Linus Torvalds 已提交
2089
{
J
Joe Perches 已提交
2090
	struct e1000_hw *hw = &adapter->hw;
2091
	struct e1000_rx_buffer *buffer_info;
L
Linus Torvalds 已提交
2092 2093
	struct pci_dev *pdev = adapter->pdev;
	unsigned long size;
2094
	unsigned int i;
L
Linus Torvalds 已提交
2095

F
Florian Westphal 已提交
2096
	/* Free all the Rx netfrags */
J
Jesse Brandeburg 已提交
2097
	for (i = 0; i < rx_ring->count; i++) {
L
Linus Torvalds 已提交
2098
		buffer_info = &rx_ring->buffer_info[i];
F
Florian Westphal 已提交
2099 2100 2101 2102 2103 2104 2105 2106 2107 2108 2109 2110 2111 2112 2113 2114 2115 2116
		if (adapter->clean_rx == e1000_clean_rx_irq) {
			if (buffer_info->dma)
				dma_unmap_single(&pdev->dev, buffer_info->dma,
						 adapter->rx_buffer_len,
						 DMA_FROM_DEVICE);
			if (buffer_info->rxbuf.data) {
				e1000_free_frag(buffer_info->rxbuf.data);
				buffer_info->rxbuf.data = NULL;
			}
		} else if (adapter->clean_rx == e1000_clean_jumbo_rx_irq) {
			if (buffer_info->dma)
				dma_unmap_page(&pdev->dev, buffer_info->dma,
					       adapter->rx_buffer_len,
					       DMA_FROM_DEVICE);
			if (buffer_info->rxbuf.page) {
				put_page(buffer_info->rxbuf.page);
				buffer_info->rxbuf.page = NULL;
			}
J
Jesse Brandeburg 已提交
2117
		}
L
Linus Torvalds 已提交
2118

J
Jesse Brandeburg 已提交
2119
		buffer_info->dma = 0;
L
Linus Torvalds 已提交
2120 2121
	}

2122
	/* there also may be some cached data from a chained receive */
2123 2124
	napi_free_frags(&adapter->napi);
	rx_ring->rx_skb_top = NULL;
2125

2126
	size = sizeof(struct e1000_rx_buffer) * rx_ring->count;
L
Linus Torvalds 已提交
2127 2128 2129 2130 2131 2132 2133 2134
	memset(rx_ring->buffer_info, 0, size);

	/* Zero out the descriptor ring */
	memset(rx_ring->desc, 0, rx_ring->size);

	rx_ring->next_to_clean = 0;
	rx_ring->next_to_use = 0;

J
Joe Perches 已提交
2135 2136
	writel(0, hw->hw_addr + rx_ring->rdh);
	writel(0, hw->hw_addr + rx_ring->rdt);
2137 2138 2139 2140 2141 2142
}

/**
 * e1000_clean_all_rx_rings - Free Rx Buffers for all queues
 * @adapter: board private structure
 **/
2143
static void e1000_clean_all_rx_rings(struct e1000_adapter *adapter)
2144 2145 2146
{
	int i;

2147
	for (i = 0; i < adapter->num_rx_queues; i++)
2148
		e1000_clean_rx_ring(adapter, &adapter->rx_ring[i]);
L
Linus Torvalds 已提交
2149 2150 2151 2152 2153
}

/* The 82542 2.0 (revision 2) needs to have the receive unit in reset
 * and memory write and invalidate disabled for certain operations
 */
2154
static void e1000_enter_82542_rst(struct e1000_adapter *adapter)
L
Linus Torvalds 已提交
2155
{
J
Joe Perches 已提交
2156
	struct e1000_hw *hw = &adapter->hw;
L
Linus Torvalds 已提交
2157
	struct net_device *netdev = adapter->netdev;
2158
	u32 rctl;
L
Linus Torvalds 已提交
2159

J
Joe Perches 已提交
2160
	e1000_pci_clear_mwi(hw);
L
Linus Torvalds 已提交
2161

J
Joe Perches 已提交
2162
	rctl = er32(RCTL);
L
Linus Torvalds 已提交
2163
	rctl |= E1000_RCTL_RST;
J
Joe Perches 已提交
2164 2165
	ew32(RCTL, rctl);
	E1000_WRITE_FLUSH();
L
Linus Torvalds 已提交
2166 2167
	mdelay(5);

J
Jesse Brandeburg 已提交
2168
	if (netif_running(netdev))
2169
		e1000_clean_all_rx_rings(adapter);
L
Linus Torvalds 已提交
2170 2171
}

2172
static void e1000_leave_82542_rst(struct e1000_adapter *adapter)
L
Linus Torvalds 已提交
2173
{
J
Joe Perches 已提交
2174
	struct e1000_hw *hw = &adapter->hw;
L
Linus Torvalds 已提交
2175
	struct net_device *netdev = adapter->netdev;
2176
	u32 rctl;
L
Linus Torvalds 已提交
2177

J
Joe Perches 已提交
2178
	rctl = er32(RCTL);
L
Linus Torvalds 已提交
2179
	rctl &= ~E1000_RCTL_RST;
J
Joe Perches 已提交
2180 2181
	ew32(RCTL, rctl);
	E1000_WRITE_FLUSH();
L
Linus Torvalds 已提交
2182 2183
	mdelay(5);

J
Joe Perches 已提交
2184 2185
	if (hw->pci_cmd_word & PCI_COMMAND_INVALIDATE)
		e1000_pci_set_mwi(hw);
L
Linus Torvalds 已提交
2186

J
Jesse Brandeburg 已提交
2187
	if (netif_running(netdev)) {
2188 2189
		/* No need to loop, because 82542 supports only 1 queue */
		struct e1000_rx_ring *ring = &adapter->rx_ring[0];
2190
		e1000_configure_rx(adapter);
2191
		adapter->alloc_rx_buf(adapter, ring, E1000_DESC_UNUSED(ring));
L
Linus Torvalds 已提交
2192 2193 2194 2195 2196 2197 2198 2199 2200 2201
	}
}

/**
 * e1000_set_mac - Change the Ethernet Address of the NIC
 * @netdev: network interface device structure
 * @p: pointer to an address structure
 *
 * Returns 0 on success, negative on failure
 **/
2202
static int e1000_set_mac(struct net_device *netdev, void *p)
L
Linus Torvalds 已提交
2203
{
2204
	struct e1000_adapter *adapter = netdev_priv(netdev);
J
Joe Perches 已提交
2205
	struct e1000_hw *hw = &adapter->hw;
L
Linus Torvalds 已提交
2206 2207
	struct sockaddr *addr = p;

J
Jesse Brandeburg 已提交
2208
	if (!is_valid_ether_addr(addr->sa_data))
L
Linus Torvalds 已提交
2209 2210 2211 2212
		return -EADDRNOTAVAIL;

	/* 82542 2.0 needs to be in reset to write receive address registers */

J
Joe Perches 已提交
2213
	if (hw->mac_type == e1000_82542_rev2_0)
L
Linus Torvalds 已提交
2214 2215 2216
		e1000_enter_82542_rst(adapter);

	memcpy(netdev->dev_addr, addr->sa_data, netdev->addr_len);
J
Joe Perches 已提交
2217
	memcpy(hw->mac_addr, addr->sa_data, netdev->addr_len);
L
Linus Torvalds 已提交
2218

J
Joe Perches 已提交
2219
	e1000_rar_set(hw, hw->mac_addr, 0);
L
Linus Torvalds 已提交
2220

J
Joe Perches 已提交
2221
	if (hw->mac_type == e1000_82542_rev2_0)
L
Linus Torvalds 已提交
2222 2223 2224 2225 2226 2227
		e1000_leave_82542_rst(adapter);

	return 0;
}

/**
2228
 * e1000_set_rx_mode - Secondary Unicast, Multicast and Promiscuous mode set
L
Linus Torvalds 已提交
2229 2230
 * @netdev: network interface device structure
 *
2231 2232 2233
 * The set_rx_mode entry point is called whenever the unicast or multicast
 * address lists or the network interface flags are updated. This routine is
 * responsible for configuring the hardware for proper unicast, multicast,
L
Linus Torvalds 已提交
2234 2235
 * promiscuous mode, and all-multi behavior.
 **/
2236
static void e1000_set_rx_mode(struct net_device *netdev)
L
Linus Torvalds 已提交
2237
{
2238
	struct e1000_adapter *adapter = netdev_priv(netdev);
L
Linus Torvalds 已提交
2239
	struct e1000_hw *hw = &adapter->hw;
J
Jiri Pirko 已提交
2240 2241
	struct netdev_hw_addr *ha;
	bool use_uc = false;
2242 2243
	u32 rctl;
	u32 hash_value;
2244
	int i, rar_entries = E1000_RAR_ENTRIES;
2245
	int mta_reg_count = E1000_NUM_MTA_REGISTERS;
2246 2247
	u32 *mcarray = kcalloc(mta_reg_count, sizeof(u32), GFP_ATOMIC);

2248
	if (!mcarray)
2249
		return;
2250

2251 2252
	/* Check for Promiscuous and All Multicast modes */

J
Joe Perches 已提交
2253
	rctl = er32(RCTL);
L
Linus Torvalds 已提交
2254

J
Jesse Brandeburg 已提交
2255
	if (netdev->flags & IFF_PROMISC) {
L
Linus Torvalds 已提交
2256
		rctl |= (E1000_RCTL_UPE | E1000_RCTL_MPE);
2257
		rctl &= ~E1000_RCTL_VFE;
L
Linus Torvalds 已提交
2258
	} else {
2259
		if (netdev->flags & IFF_ALLMULTI)
2260
			rctl |= E1000_RCTL_MPE;
2261
		else
2262
			rctl &= ~E1000_RCTL_MPE;
2263
		/* Enable VLAN filter if there is a VLAN */
J
Jiri Pirko 已提交
2264
		if (e1000_vlan_used(adapter))
2265
			rctl |= E1000_RCTL_VFE;
2266 2267
	}

2268
	if (netdev_uc_count(netdev) > rar_entries - 1) {
2269 2270 2271
		rctl |= E1000_RCTL_UPE;
	} else if (!(netdev->flags & IFF_PROMISC)) {
		rctl &= ~E1000_RCTL_UPE;
J
Jiri Pirko 已提交
2272
		use_uc = true;
L
Linus Torvalds 已提交
2273 2274
	}

J
Joe Perches 已提交
2275
	ew32(RCTL, rctl);
L
Linus Torvalds 已提交
2276 2277 2278

	/* 82542 2.0 needs to be in reset to write receive address registers */

J
Jesse Brandeburg 已提交
2279
	if (hw->mac_type == e1000_82542_rev2_0)
L
Linus Torvalds 已提交
2280 2281
		e1000_enter_82542_rst(adapter);

2282 2283 2284 2285
	/* load the first 14 addresses into the exact filters 1-14. Unicast
	 * addresses take precedence to avoid disabling unicast filtering
	 * when possible.
	 *
2286
	 * RAR 0 is used for the station MAC address
L
Linus Torvalds 已提交
2287 2288
	 * if there are not 14 addresses, go ahead and clear the filters
	 */
J
Jiri Pirko 已提交
2289 2290
	i = 1;
	if (use_uc)
2291
		netdev_for_each_uc_addr(ha, netdev) {
J
Jiri Pirko 已提交
2292 2293 2294 2295 2296
			if (i == rar_entries)
				break;
			e1000_rar_set(hw, ha->addr, i++);
		}

2297
	netdev_for_each_mc_addr(ha, netdev) {
2298 2299 2300
		if (i == rar_entries) {
			/* load any remaining addresses into the hash table */
			u32 hash_reg, hash_bit, mta;
2301
			hash_value = e1000_hash_mc_addr(hw, ha->addr);
2302 2303 2304 2305
			hash_reg = (hash_value >> 5) & 0x7F;
			hash_bit = hash_value & 0x1F;
			mta = (1 << hash_bit);
			mcarray[hash_reg] |= mta;
2306
		} else {
2307
			e1000_rar_set(hw, ha->addr, i++);
L
Linus Torvalds 已提交
2308 2309 2310
		}
	}

2311 2312 2313 2314 2315
	for (; i < rar_entries; i++) {
		E1000_WRITE_REG_ARRAY(hw, RA, i << 1, 0);
		E1000_WRITE_FLUSH();
		E1000_WRITE_REG_ARRAY(hw, RA, (i << 1) + 1, 0);
		E1000_WRITE_FLUSH();
L
Linus Torvalds 已提交
2316 2317
	}

2318
	/* write the hash table completely, write from bottom to avoid
2319 2320
	 * both stupid write combining chipsets, and flushing each write
	 */
2321
	for (i = mta_reg_count - 1; i >= 0 ; i--) {
2322
		/* If we are on an 82544 has an errata where writing odd
2323 2324 2325 2326 2327 2328 2329 2330
		 * offsets overwrites the previous even offset, but writing
		 * backwards over the range solves the issue by always
		 * writing the odd offset first
		 */
		E1000_WRITE_REG_ARRAY(hw, MTA, i, mcarray[i]);
	}
	E1000_WRITE_FLUSH();

J
Jesse Brandeburg 已提交
2331
	if (hw->mac_type == e1000_82542_rev2_0)
L
Linus Torvalds 已提交
2332
		e1000_leave_82542_rst(adapter);
2333 2334

	kfree(mcarray);
L
Linus Torvalds 已提交
2335 2336
}

2337 2338 2339 2340 2341 2342 2343
/**
 * e1000_update_phy_info_task - get phy info
 * @work: work struct contained inside adapter struct
 *
 * Need to wait a few seconds after link up to get diagnostic information from
 * the phy
 */
J
Jesse Brandeburg 已提交
2344 2345 2346
static void e1000_update_phy_info_task(struct work_struct *work)
{
	struct e1000_adapter *adapter = container_of(work,
2347 2348
						     struct e1000_adapter,
						     phy_info_task.work);
2349

2350
	e1000_phy_get_info(&adapter->hw, &adapter->phy_info);
L
Linus Torvalds 已提交
2351 2352
}

J
Jesse Brandeburg 已提交
2353 2354 2355 2356 2357 2358 2359
/**
 * e1000_82547_tx_fifo_stall_task - task to complete work
 * @work: work struct contained inside adapter struct
 **/
static void e1000_82547_tx_fifo_stall_task(struct work_struct *work)
{
	struct e1000_adapter *adapter = container_of(work,
2360 2361
						     struct e1000_adapter,
						     fifo_stall_task.work);
J
Joe Perches 已提交
2362
	struct e1000_hw *hw = &adapter->hw;
L
Linus Torvalds 已提交
2363
	struct net_device *netdev = adapter->netdev;
2364
	u32 tctl;
L
Linus Torvalds 已提交
2365

J
Jesse Brandeburg 已提交
2366
	if (atomic_read(&adapter->tx_fifo_stall)) {
J
Joe Perches 已提交
2367 2368 2369 2370 2371 2372 2373 2374 2375 2376 2377
		if ((er32(TDT) == er32(TDH)) &&
		   (er32(TDFT) == er32(TDFH)) &&
		   (er32(TDFTS) == er32(TDFHS))) {
			tctl = er32(TCTL);
			ew32(TCTL, tctl & ~E1000_TCTL_EN);
			ew32(TDFT, adapter->tx_head_addr);
			ew32(TDFH, adapter->tx_head_addr);
			ew32(TDFTS, adapter->tx_head_addr);
			ew32(TDFHS, adapter->tx_head_addr);
			ew32(TCTL, tctl);
			E1000_WRITE_FLUSH();
L
Linus Torvalds 已提交
2378 2379 2380 2381

			adapter->tx_fifo_head = 0;
			atomic_set(&adapter->tx_fifo_stall, 0);
			netif_wake_queue(netdev);
2382
		} else if (!test_bit(__E1000_DOWN, &adapter->flags)) {
2383
			schedule_delayed_work(&adapter->fifo_stall_task, 1);
L
Linus Torvalds 已提交
2384 2385 2386 2387
		}
	}
}

2388
bool e1000_has_link(struct e1000_adapter *adapter)
2389 2390 2391 2392
{
	struct e1000_hw *hw = &adapter->hw;
	bool link_active = false;

2393 2394 2395 2396 2397
	/* get_link_status is set on LSC (link status) interrupt or rx
	 * sequence error interrupt (except on intel ce4100).
	 * get_link_status will stay false until the
	 * e1000_check_for_link establishes link for copper adapters
	 * ONLY
2398 2399 2400
	 */
	switch (hw->media_type) {
	case e1000_media_type_copper:
2401 2402
		if (hw->mac_type == e1000_ce4100)
			hw->get_link_status = 1;
2403
		if (hw->get_link_status) {
2404
			e1000_check_for_link(hw);
2405 2406 2407 2408 2409 2410
			link_active = !hw->get_link_status;
		} else {
			link_active = true;
		}
		break;
	case e1000_media_type_fiber:
2411
		e1000_check_for_link(hw);
2412 2413 2414
		link_active = !!(er32(STATUS) & E1000_STATUS_LU);
		break;
	case e1000_media_type_internal_serdes:
2415
		e1000_check_for_link(hw);
2416 2417 2418 2419 2420 2421 2422 2423 2424
		link_active = hw->serdes_has_link;
		break;
	default:
		break;
	}

	return link_active;
}

L
Linus Torvalds 已提交
2425
/**
2426 2427
 * e1000_watchdog - work function
 * @work: work struct contained inside adapter struct
L
Linus Torvalds 已提交
2428
 **/
2429
static void e1000_watchdog(struct work_struct *work)
L
Linus Torvalds 已提交
2430
{
2431 2432 2433
	struct e1000_adapter *adapter = container_of(work,
						     struct e1000_adapter,
						     watchdog_task.work);
J
Joe Perches 已提交
2434
	struct e1000_hw *hw = &adapter->hw;
L
Linus Torvalds 已提交
2435
	struct net_device *netdev = adapter->netdev;
J
Jeff Kirsher 已提交
2436
	struct e1000_tx_ring *txdr = adapter->tx_ring;
2437
	u32 link, tctl;
2438

2439 2440 2441
	link = e1000_has_link(adapter);
	if ((netif_carrier_ok(netdev)) && link)
		goto link_up;
L
Linus Torvalds 已提交
2442

J
Jesse Brandeburg 已提交
2443 2444
	if (link) {
		if (!netif_carrier_ok(netdev)) {
2445
			u32 ctrl;
J
Joe Perches 已提交
2446
			bool txb2b = true;
2447
			/* update snapshot of PHY registers on LSC */
J
Joe Perches 已提交
2448
			e1000_get_speed_and_duplex(hw,
2449 2450
						   &adapter->link_speed,
						   &adapter->link_duplex);
L
Linus Torvalds 已提交
2451

J
Joe Perches 已提交
2452
			ctrl = er32(CTRL);
2453 2454 2455 2456 2457 2458 2459 2460 2461 2462
			pr_info("%s NIC Link is Up %d Mbps %s, "
				"Flow Control: %s\n",
				netdev->name,
				adapter->link_speed,
				adapter->link_duplex == FULL_DUPLEX ?
				"Full Duplex" : "Half Duplex",
				((ctrl & E1000_CTRL_TFCE) && (ctrl &
				E1000_CTRL_RFCE)) ? "RX/TX" : ((ctrl &
				E1000_CTRL_RFCE) ? "RX" : ((ctrl &
				E1000_CTRL_TFCE) ? "TX" : "None")));
L
Linus Torvalds 已提交
2463

2464
			/* adjust timeout factor according to speed/duplex */
2465
			adapter->tx_timeout_factor = 1;
2466 2467
			switch (adapter->link_speed) {
			case SPEED_10:
J
Joe Perches 已提交
2468
				txb2b = false;
2469
				adapter->tx_timeout_factor = 16;
2470 2471
				break;
			case SPEED_100:
J
Joe Perches 已提交
2472
				txb2b = false;
2473 2474 2475 2476
				/* maybe add some timeout factor ? */
				break;
			}

2477
			/* enable transmits in the hardware */
J
Joe Perches 已提交
2478
			tctl = er32(TCTL);
2479
			tctl |= E1000_TCTL_EN;
J
Joe Perches 已提交
2480
			ew32(TCTL, tctl);
2481

L
Linus Torvalds 已提交
2482
			netif_carrier_on(netdev);
2483
			if (!test_bit(__E1000_DOWN, &adapter->flags))
2484 2485
				schedule_delayed_work(&adapter->phy_info_task,
						      2 * HZ);
L
Linus Torvalds 已提交
2486 2487 2488
			adapter->smartspeed = 0;
		}
	} else {
J
Jesse Brandeburg 已提交
2489
		if (netif_carrier_ok(netdev)) {
L
Linus Torvalds 已提交
2490 2491
			adapter->link_speed = 0;
			adapter->link_duplex = 0;
2492 2493
			pr_info("%s NIC Link is Down\n",
				netdev->name);
L
Linus Torvalds 已提交
2494
			netif_carrier_off(netdev);
2495 2496

			if (!test_bit(__E1000_DOWN, &adapter->flags))
2497 2498
				schedule_delayed_work(&adapter->phy_info_task,
						      2 * HZ);
L
Linus Torvalds 已提交
2499 2500 2501 2502 2503
		}

		e1000_smartspeed(adapter);
	}

2504
link_up:
L
Linus Torvalds 已提交
2505 2506
	e1000_update_stats(adapter);

J
Joe Perches 已提交
2507
	hw->tx_packet_delta = adapter->stats.tpt - adapter->tpt_old;
L
Linus Torvalds 已提交
2508
	adapter->tpt_old = adapter->stats.tpt;
J
Joe Perches 已提交
2509
	hw->collision_delta = adapter->stats.colc - adapter->colc_old;
L
Linus Torvalds 已提交
2510 2511 2512 2513 2514 2515 2516
	adapter->colc_old = adapter->stats.colc;

	adapter->gorcl = adapter->stats.gorcl - adapter->gorcl_old;
	adapter->gorcl_old = adapter->stats.gorcl;
	adapter->gotcl = adapter->stats.gotcl - adapter->gotcl_old;
	adapter->gotcl_old = adapter->stats.gotcl;

J
Joe Perches 已提交
2517
	e1000_update_adaptive(hw);
L
Linus Torvalds 已提交
2518

2519
	if (!netif_carrier_ok(netdev)) {
2520
		if (E1000_DESC_UNUSED(txdr) + 1 < txdr->count) {
L
Linus Torvalds 已提交
2521 2522 2523
			/* We've lost link, so the controller stops DMA,
			 * but we've got queued Tx work that's never going
			 * to get done, so reset controller to flush Tx.
2524 2525
			 * (Do the reset outside of interrupt context).
			 */
2526 2527
			adapter->tx_timeout_count++;
			schedule_work(&adapter->reset_task);
2528
			/* exit immediately since reset is imminent */
2529
			return;
L
Linus Torvalds 已提交
2530 2531 2532
		}
	}

2533 2534
	/* Simple mode for Interrupt Throttle Rate (ITR) */
	if (hw->mac_type >= e1000_82540 && adapter->itr_setting == 4) {
2535
		/* Symmetric Tx/Rx gets a reduced ITR=2000;
2536 2537 2538 2539 2540 2541 2542 2543 2544 2545 2546 2547
		 * Total asymmetrical Tx or Rx gets ITR=8000;
		 * everyone else is between 2000-8000.
		 */
		u32 goc = (adapter->gotcl + adapter->gorcl) / 10000;
		u32 dif = (adapter->gotcl > adapter->gorcl ?
			    adapter->gotcl - adapter->gorcl :
			    adapter->gorcl - adapter->gotcl) / 10000;
		u32 itr = goc > 0 ? (dif * 6000 / goc + 2000) : 8000;

		ew32(ITR, 1000000000 / (itr * 256));
	}

L
Linus Torvalds 已提交
2548
	/* Cause software interrupt to ensure rx ring is cleaned */
J
Joe Perches 已提交
2549
	ew32(ICS, E1000_ICS_RXDMT0);
L
Linus Torvalds 已提交
2550

2551
	/* Force detection of hung controller every watchdog period */
J
Joe Perches 已提交
2552
	adapter->detect_tx_hung = true;
L
Linus Torvalds 已提交
2553

2554
	/* Reschedule the task */
2555
	if (!test_bit(__E1000_DOWN, &adapter->flags))
2556
		schedule_delayed_work(&adapter->watchdog_task, 2 * HZ);
L
Linus Torvalds 已提交
2557 2558
}

J
Jesse Brandeburg 已提交
2559 2560 2561 2562 2563 2564 2565 2566 2567
/* Latency classes used as the itr_setting / return value of the dynamic
 * ITR code.
 */
enum latency_range {
	lowest_latency,		/* 0 */
	low_latency,		/* 1 */
	bulk_latency,		/* 2 */
	latency_invalid = 255
};

/**
 * e1000_update_itr - update the dynamic ITR value based on statistics
2568 2569 2570 2571 2572
 * @adapter: pointer to adapter
 * @itr_setting: current adapter->itr
 * @packets: the number of packets during this measurement interval
 * @bytes: the number of bytes during this measurement interval
 *
J
Jesse Brandeburg 已提交
2573 2574 2575 2576 2577 2578 2579 2580 2581 2582 2583
 *      Stores a new ITR value based on packets and byte
 *      counts during the last interrupt.  The advantage of per interrupt
 *      computation is faster updates and more accurate ITR for the current
 *      traffic pattern.  Constants in this function were computed
 *      based on theoretical maximum wire speed and thresholds were set based
 *      on testing data as well as attempting to minimize response time
 *      while increasing bulk throughput.
 *      this functionality is controlled by the InterruptThrottleRate module
 *      parameter (see e1000_param.c)
 **/
static unsigned int e1000_update_itr(struct e1000_adapter *adapter,
2584
				     u16 itr_setting, int packets, int bytes)
J
Jesse Brandeburg 已提交
2585 2586 2587 2588 2589 2590 2591 2592 2593 2594 2595 2596
{
	unsigned int retval = itr_setting;
	struct e1000_hw *hw = &adapter->hw;

	if (unlikely(hw->mac_type < e1000_82540))
		goto update_itr_done;

	if (packets == 0)
		goto update_itr_done;

	switch (itr_setting) {
	case lowest_latency:
2597 2598 2599 2600
		/* jumbo frames get bulk treatment*/
		if (bytes/packets > 8000)
			retval = bulk_latency;
		else if ((packets < 5) && (bytes > 512))
J
Jesse Brandeburg 已提交
2601 2602 2603 2604
			retval = low_latency;
		break;
	case low_latency:  /* 50 usec aka 20000 ints/s */
		if (bytes > 10000) {
2605 2606 2607 2608
			/* jumbo frames need bulk latency setting */
			if (bytes/packets > 8000)
				retval = bulk_latency;
			else if ((packets < 10) || ((bytes/packets) > 1200))
J
Jesse Brandeburg 已提交
2609 2610 2611
				retval = bulk_latency;
			else if ((packets > 35))
				retval = lowest_latency;
2612 2613 2614
		} else if (bytes/packets > 2000)
			retval = bulk_latency;
		else if (packets <= 2 && bytes < 512)
J
Jesse Brandeburg 已提交
2615 2616 2617 2618 2619 2620
			retval = lowest_latency;
		break;
	case bulk_latency: /* 250 usec aka 4000 ints/s */
		if (bytes > 25000) {
			if (packets > 35)
				retval = low_latency;
2621 2622
		} else if (bytes < 6000) {
			retval = low_latency;
J
Jesse Brandeburg 已提交
2623 2624 2625 2626 2627 2628 2629 2630 2631 2632 2633
		}
		break;
	}

update_itr_done:
	return retval;
}

static void e1000_set_itr(struct e1000_adapter *adapter)
{
	struct e1000_hw *hw = &adapter->hw;
2634 2635
	u16 current_itr;
	u32 new_itr = adapter->itr;
J
Jesse Brandeburg 已提交
2636 2637 2638 2639 2640 2641 2642 2643 2644 2645 2646

	if (unlikely(hw->mac_type < e1000_82540))
		return;

	/* for non-gigabit speeds, just fix the interrupt rate at 4000 */
	if (unlikely(adapter->link_speed != SPEED_1000)) {
		current_itr = 0;
		new_itr = 4000;
		goto set_itr_now;
	}

2647 2648 2649
	adapter->tx_itr = e1000_update_itr(adapter, adapter->tx_itr,
					   adapter->total_tx_packets,
					   adapter->total_tx_bytes);
2650 2651 2652 2653
	/* conservative mode (itr 3) eliminates the lowest_latency setting */
	if (adapter->itr_setting == 3 && adapter->tx_itr == lowest_latency)
		adapter->tx_itr = low_latency;

2654 2655 2656
	adapter->rx_itr = e1000_update_itr(adapter, adapter->rx_itr,
					   adapter->total_rx_packets,
					   adapter->total_rx_bytes);
2657 2658 2659
	/* conservative mode (itr 3) eliminates the lowest_latency setting */
	if (adapter->itr_setting == 3 && adapter->rx_itr == lowest_latency)
		adapter->rx_itr = low_latency;
J
Jesse Brandeburg 已提交
2660 2661 2662 2663 2664 2665 2666 2667 2668 2669 2670 2671 2672 2673 2674 2675 2676 2677 2678 2679 2680 2681

	current_itr = max(adapter->rx_itr, adapter->tx_itr);

	switch (current_itr) {
	/* counts and packets in update_itr are dependent on these numbers */
	case lowest_latency:
		new_itr = 70000;
		break;
	case low_latency:
		new_itr = 20000; /* aka hwitr = ~200 */
		break;
	case bulk_latency:
		new_itr = 4000;
		break;
	default:
		break;
	}

set_itr_now:
	if (new_itr != adapter->itr) {
		/* this attempts to bias the interrupt rate towards Bulk
		 * by adding intermediate steps when interrupt rate is
2682 2683
		 * increasing
		 */
J
Jesse Brandeburg 已提交
2684
		new_itr = new_itr > adapter->itr ?
2685 2686
			  min(adapter->itr + (new_itr >> 2), new_itr) :
			  new_itr;
J
Jesse Brandeburg 已提交
2687
		adapter->itr = new_itr;
J
Joe Perches 已提交
2688
		ew32(ITR, 1000000000 / (new_itr * 256));
J
Jesse Brandeburg 已提交
2689 2690 2691
	}
}

L
Linus Torvalds 已提交
2692 2693 2694
#define E1000_TX_FLAGS_CSUM		0x00000001
#define E1000_TX_FLAGS_VLAN		0x00000002
#define E1000_TX_FLAGS_TSO		0x00000004
2695
#define E1000_TX_FLAGS_IPV4		0x00000008
2696
#define E1000_TX_FLAGS_NO_FCS		0x00000010
L
Linus Torvalds 已提交
2697 2698 2699
#define E1000_TX_FLAGS_VLAN_MASK	0xffff0000
#define E1000_TX_FLAGS_VLAN_SHIFT	16

2700
static int e1000_tso(struct e1000_adapter *adapter,
2701 2702
		     struct e1000_tx_ring *tx_ring, struct sk_buff *skb,
		     __be16 protocol)
L
Linus Torvalds 已提交
2703 2704
{
	struct e1000_context_desc *context_desc;
2705
	struct e1000_tx_buffer *buffer_info;
L
Linus Torvalds 已提交
2706
	unsigned int i;
2707 2708 2709
	u32 cmd_length = 0;
	u16 ipcse = 0, tucse, mss;
	u8 ipcss, ipcso, tucss, tucso, hdr_len;
L
Linus Torvalds 已提交
2710

H
Herbert Xu 已提交
2711
	if (skb_is_gso(skb)) {
2712 2713 2714 2715 2716
		int err;

		err = skb_cow_head(skb, 0);
		if (err < 0)
			return err;
L
Linus Torvalds 已提交
2717

2718
		hdr_len = skb_transport_offset(skb) + tcp_hdrlen(skb);
2719
		mss = skb_shinfo(skb)->gso_size;
2720
		if (protocol == htons(ETH_P_IP)) {
2721 2722 2723
			struct iphdr *iph = ip_hdr(skb);
			iph->tot_len = 0;
			iph->check = 0;
2724 2725 2726 2727
			tcp_hdr(skb)->check = ~csum_tcpudp_magic(iph->saddr,
								 iph->daddr, 0,
								 IPPROTO_TCP,
								 0);
2728
			cmd_length = E1000_TXD_CMD_IP;
2729
			ipcse = skb_transport_offset(skb) - 1;
2730
		} else if (skb_is_gso_v6(skb)) {
2731
			ipv6_hdr(skb)->payload_len = 0;
2732
			tcp_hdr(skb)->check =
2733 2734 2735
				~csum_ipv6_magic(&ipv6_hdr(skb)->saddr,
						 &ipv6_hdr(skb)->daddr,
						 0, IPPROTO_TCP, 0);
2736 2737
			ipcse = 0;
		}
2738
		ipcss = skb_network_offset(skb);
2739
		ipcso = (void *)&(ip_hdr(skb)->check) - (void *)skb->data;
2740
		tucss = skb_transport_offset(skb);
2741
		tucso = (void *)&(tcp_hdr(skb)->check) - (void *)skb->data;
L
Linus Torvalds 已提交
2742 2743 2744
		tucse = 0;

		cmd_length |= (E1000_TXD_CMD_DEXT | E1000_TXD_CMD_TSE |
2745
			       E1000_TXD_CMD_TCP | (skb->len - (hdr_len)));
L
Linus Torvalds 已提交
2746

2747 2748
		i = tx_ring->next_to_use;
		context_desc = E1000_CONTEXT_DESC(*tx_ring, i);
J
Jeff Kirsher 已提交
2749
		buffer_info = &tx_ring->buffer_info[i];
L
Linus Torvalds 已提交
2750 2751 2752 2753 2754 2755 2756 2757 2758 2759 2760

		context_desc->lower_setup.ip_fields.ipcss  = ipcss;
		context_desc->lower_setup.ip_fields.ipcso  = ipcso;
		context_desc->lower_setup.ip_fields.ipcse  = cpu_to_le16(ipcse);
		context_desc->upper_setup.tcp_fields.tucss = tucss;
		context_desc->upper_setup.tcp_fields.tucso = tucso;
		context_desc->upper_setup.tcp_fields.tucse = cpu_to_le16(tucse);
		context_desc->tcp_seg_setup.fields.mss     = cpu_to_le16(mss);
		context_desc->tcp_seg_setup.fields.hdr_len = hdr_len;
		context_desc->cmd_and_length = cpu_to_le32(cmd_length);

J
Jeff Kirsher 已提交
2761
		buffer_info->time_stamp = jiffies;
2762
		buffer_info->next_to_watch = i;
J
Jeff Kirsher 已提交
2763

2764 2765
		if (++i == tx_ring->count) i = 0;
		tx_ring->next_to_use = i;
L
Linus Torvalds 已提交
2766

J
Joe Perches 已提交
2767
		return true;
L
Linus Torvalds 已提交
2768
	}
J
Joe Perches 已提交
2769
	return false;
L
Linus Torvalds 已提交
2770 2771
}

2772
static bool e1000_tx_csum(struct e1000_adapter *adapter,
2773 2774
			  struct e1000_tx_ring *tx_ring, struct sk_buff *skb,
			  __be16 protocol)
L
Linus Torvalds 已提交
2775 2776
{
	struct e1000_context_desc *context_desc;
2777
	struct e1000_tx_buffer *buffer_info;
L
Linus Torvalds 已提交
2778
	unsigned int i;
2779
	u8 css;
2780
	u32 cmd_len = E1000_TXD_CMD_DEXT;
L
Linus Torvalds 已提交
2781

2782 2783
	if (skb->ip_summed != CHECKSUM_PARTIAL)
		return false;
L
Linus Torvalds 已提交
2784

2785
	switch (protocol) {
2786
	case cpu_to_be16(ETH_P_IP):
2787 2788 2789
		if (ip_hdr(skb)->protocol == IPPROTO_TCP)
			cmd_len |= E1000_TXD_CMD_TCP;
		break;
2790
	case cpu_to_be16(ETH_P_IPV6):
2791 2792 2793 2794 2795 2796
		/* XXX not handling all IPV6 headers */
		if (ipv6_hdr(skb)->nexthdr == IPPROTO_TCP)
			cmd_len |= E1000_TXD_CMD_TCP;
		break;
	default:
		if (unlikely(net_ratelimit()))
2797 2798
			e_warn(drv, "checksum_partial proto=%x!\n",
			       skb->protocol);
2799 2800
		break;
	}
L
Linus Torvalds 已提交
2801

2802
	css = skb_checksum_start_offset(skb);
L
Linus Torvalds 已提交
2803

2804 2805 2806
	i = tx_ring->next_to_use;
	buffer_info = &tx_ring->buffer_info[i];
	context_desc = E1000_CONTEXT_DESC(*tx_ring, i);
J
Jeff Kirsher 已提交
2807

2808 2809 2810 2811 2812 2813 2814
	context_desc->lower_setup.ip_config = 0;
	context_desc->upper_setup.tcp_fields.tucss = css;
	context_desc->upper_setup.tcp_fields.tucso =
		css + skb->csum_offset;
	context_desc->upper_setup.tcp_fields.tucse = 0;
	context_desc->tcp_seg_setup.data = 0;
	context_desc->cmd_and_length = cpu_to_le32(cmd_len);
L
Linus Torvalds 已提交
2815

2816 2817
	buffer_info->time_stamp = jiffies;
	buffer_info->next_to_watch = i;
L
Linus Torvalds 已提交
2818

2819 2820 2821 2822
	if (unlikely(++i == tx_ring->count)) i = 0;
	tx_ring->next_to_use = i;

	return true;
L
Linus Torvalds 已提交
2823 2824 2825 2826 2827
}

#define E1000_MAX_TXD_PWR	12
#define E1000_MAX_DATA_PER_TXD	(1<<E1000_MAX_TXD_PWR)

2828 2829 2830 2831 2832
static int e1000_tx_map(struct e1000_adapter *adapter,
			struct e1000_tx_ring *tx_ring,
			struct sk_buff *skb, unsigned int first,
			unsigned int max_per_txd, unsigned int nr_frags,
			unsigned int mss)
L
Linus Torvalds 已提交
2833
{
J
Joe Perches 已提交
2834
	struct e1000_hw *hw = &adapter->hw;
2835
	struct pci_dev *pdev = adapter->pdev;
2836
	struct e1000_tx_buffer *buffer_info;
J
Jesse Brandeburg 已提交
2837
	unsigned int len = skb_headlen(skb);
2838
	unsigned int offset = 0, size, count = 0, i;
2839
	unsigned int f, bytecount, segs;
L
Linus Torvalds 已提交
2840 2841 2842

	i = tx_ring->next_to_use;

J
Jesse Brandeburg 已提交
2843
	while (len) {
2844
		buffer_info = &tx_ring->buffer_info[i];
L
Linus Torvalds 已提交
2845
		size = min(len, max_per_txd);
J
Jeff Kirsher 已提交
2846 2847 2848
		/* Workaround for Controller erratum --
		 * descriptor for non-tso packet in a linear SKB that follows a
		 * tso gets written back prematurely before the data is fully
2849 2850
		 * DMA'd to the controller
		 */
J
Jeff Kirsher 已提交
2851
		if (!skb->data_len && tx_ring->last_tx_tso &&
H
Herbert Xu 已提交
2852
		    !skb_is_gso(skb)) {
2853
			tx_ring->last_tx_tso = false;
J
Jeff Kirsher 已提交
2854 2855 2856
			size -= 4;
		}

L
Linus Torvalds 已提交
2857
		/* Workaround for premature desc write-backs
2858 2859
		 * in TSO mode.  Append 4-byte sentinel desc
		 */
J
Jesse Brandeburg 已提交
2860
		if (unlikely(mss && !nr_frags && size == len && size > 8))
L
Linus Torvalds 已提交
2861
			size -= 4;
2862 2863 2864 2865 2866
		/* work-around for errata 10 and it applies
		 * to all controllers in PCI-X mode
		 * The fix is to make sure that the first descriptor of a
		 * packet is smaller than 2048 - 16 - 16 (or 2016) bytes
		 */
J
Joe Perches 已提交
2867
		if (unlikely((hw->bus_type == e1000_bus_type_pcix) &&
2868 2869
		                (size > 2015) && count == 0))
		        size = 2015;
J
Jesse Brandeburg 已提交
2870

L
Linus Torvalds 已提交
2871
		/* Workaround for potential 82544 hang in PCI-X.  Avoid
2872 2873
		 * terminating buffers within evenly-aligned dwords.
		 */
J
Jesse Brandeburg 已提交
2874
		if (unlikely(adapter->pcix_82544 &&
L
Linus Torvalds 已提交
2875 2876 2877 2878 2879
		   !((unsigned long)(skb->data + offset + size - 1) & 4) &&
		   size > 4))
			size -= 4;

		buffer_info->length = size;
2880
		/* set time_stamp *before* dma to help avoid a possible race */
L
Linus Torvalds 已提交
2881
		buffer_info->time_stamp = jiffies;
2882
		buffer_info->mapped_as_page = false;
2883 2884
		buffer_info->dma = dma_map_single(&pdev->dev,
						  skb->data + offset,
2885
						  size, DMA_TO_DEVICE);
2886
		if (dma_mapping_error(&pdev->dev, buffer_info->dma))
2887
			goto dma_error;
2888
		buffer_info->next_to_watch = i;
L
Linus Torvalds 已提交
2889 2890 2891 2892

		len -= size;
		offset += size;
		count++;
2893 2894 2895 2896 2897
		if (len) {
			i++;
			if (unlikely(i == tx_ring->count))
				i = 0;
		}
L
Linus Torvalds 已提交
2898 2899
	}

J
Jesse Brandeburg 已提交
2900
	for (f = 0; f < nr_frags; f++) {
E
Eric Dumazet 已提交
2901
		const struct skb_frag_struct *frag;
L
Linus Torvalds 已提交
2902 2903

		frag = &skb_shinfo(skb)->frags[f];
E
Eric Dumazet 已提交
2904
		len = skb_frag_size(frag);
2905
		offset = 0;
L
Linus Torvalds 已提交
2906

J
Jesse Brandeburg 已提交
2907
		while (len) {
2908
			unsigned long bufend;
2909 2910 2911 2912
			i++;
			if (unlikely(i == tx_ring->count))
				i = 0;

L
Linus Torvalds 已提交
2913 2914 2915
			buffer_info = &tx_ring->buffer_info[i];
			size = min(len, max_per_txd);
			/* Workaround for premature desc write-backs
2916 2917 2918 2919
			 * in TSO mode.  Append 4-byte sentinel desc
			 */
			if (unlikely(mss && f == (nr_frags-1) &&
			    size == len && size > 8))
L
Linus Torvalds 已提交
2920 2921 2922
				size -= 4;
			/* Workaround for potential 82544 hang in PCI-X.
			 * Avoid terminating buffers within evenly-aligned
2923 2924
			 * dwords.
			 */
2925 2926 2927
			bufend = (unsigned long)
				page_to_phys(skb_frag_page(frag));
			bufend += offset + size - 1;
J
Jesse Brandeburg 已提交
2928
			if (unlikely(adapter->pcix_82544 &&
2929 2930
				     !(bufend & 4) &&
				     size > 4))
L
Linus Torvalds 已提交
2931 2932 2933 2934
				size -= 4;

			buffer_info->length = size;
			buffer_info->time_stamp = jiffies;
2935
			buffer_info->mapped_as_page = true;
2936 2937
			buffer_info->dma = skb_frag_dma_map(&pdev->dev, frag,
						offset, size, DMA_TO_DEVICE);
2938
			if (dma_mapping_error(&pdev->dev, buffer_info->dma))
2939
				goto dma_error;
2940
			buffer_info->next_to_watch = i;
L
Linus Torvalds 已提交
2941 2942 2943 2944 2945 2946 2947

			len -= size;
			offset += size;
			count++;
		}
	}

2948 2949 2950 2951
	segs = skb_shinfo(skb)->gso_segs ?: 1;
	/* multiply data chunks by size of headers */
	bytecount = ((segs - 1) * skb_headlen(skb)) + skb->len;

L
Linus Torvalds 已提交
2952
	tx_ring->buffer_info[i].skb = skb;
2953 2954
	tx_ring->buffer_info[i].segs = segs;
	tx_ring->buffer_info[i].bytecount = bytecount;
L
Linus Torvalds 已提交
2955 2956 2957
	tx_ring->buffer_info[first].next_to_watch = i;

	return count;
2958 2959 2960 2961

dma_error:
	dev_err(&pdev->dev, "TX DMA map failed\n");
	buffer_info->dma = 0;
2962
	if (count)
2963
		count--;
2964 2965 2966

	while (count--) {
		if (i==0)
2967
			i += tx_ring->count;
2968
		i--;
2969 2970 2971 2972 2973
		buffer_info = &tx_ring->buffer_info[i];
		e1000_unmap_and_free_tx_resource(adapter, buffer_info);
	}

	return 0;
L
Linus Torvalds 已提交
2974 2975
}

2976 2977 2978
static void e1000_tx_queue(struct e1000_adapter *adapter,
			   struct e1000_tx_ring *tx_ring, int tx_flags,
			   int count)
L
Linus Torvalds 已提交
2979 2980
{
	struct e1000_tx_desc *tx_desc = NULL;
2981
	struct e1000_tx_buffer *buffer_info;
2982
	u32 txd_upper = 0, txd_lower = E1000_TXD_CMD_IFCS;
L
Linus Torvalds 已提交
2983 2984
	unsigned int i;

J
Jesse Brandeburg 已提交
2985
	if (likely(tx_flags & E1000_TX_FLAGS_TSO)) {
L
Linus Torvalds 已提交
2986
		txd_lower |= E1000_TXD_CMD_DEXT | E1000_TXD_DTYP_D |
2987
			     E1000_TXD_CMD_TSE;
2988 2989
		txd_upper |= E1000_TXD_POPTS_TXSM << 8;

J
Jesse Brandeburg 已提交
2990
		if (likely(tx_flags & E1000_TX_FLAGS_IPV4))
2991
			txd_upper |= E1000_TXD_POPTS_IXSM << 8;
L
Linus Torvalds 已提交
2992 2993
	}

J
Jesse Brandeburg 已提交
2994
	if (likely(tx_flags & E1000_TX_FLAGS_CSUM)) {
L
Linus Torvalds 已提交
2995 2996 2997 2998
		txd_lower |= E1000_TXD_CMD_DEXT | E1000_TXD_DTYP_D;
		txd_upper |= E1000_TXD_POPTS_TXSM << 8;
	}

J
Jesse Brandeburg 已提交
2999
	if (unlikely(tx_flags & E1000_TX_FLAGS_VLAN)) {
L
Linus Torvalds 已提交
3000 3001 3002 3003
		txd_lower |= E1000_TXD_CMD_VLE;
		txd_upper |= (tx_flags & E1000_TX_FLAGS_VLAN_MASK);
	}

3004 3005 3006
	if (unlikely(tx_flags & E1000_TX_FLAGS_NO_FCS))
		txd_lower &= ~(E1000_TXD_CMD_IFCS);

L
Linus Torvalds 已提交
3007 3008
	i = tx_ring->next_to_use;

J
Jesse Brandeburg 已提交
3009
	while (count--) {
L
Linus Torvalds 已提交
3010 3011 3012 3013 3014 3015
		buffer_info = &tx_ring->buffer_info[i];
		tx_desc = E1000_TX_DESC(*tx_ring, i);
		tx_desc->buffer_addr = cpu_to_le64(buffer_info->dma);
		tx_desc->lower.data =
			cpu_to_le32(txd_lower | buffer_info->length);
		tx_desc->upper.data = cpu_to_le32(txd_upper);
J
Jesse Brandeburg 已提交
3016
		if (unlikely(++i == tx_ring->count)) i = 0;
L
Linus Torvalds 已提交
3017 3018 3019 3020
	}

	tx_desc->lower.data |= cpu_to_le32(adapter->txd_cmd);

3021 3022 3023 3024
	/* txd_cmd re-enables FCS, so we'll re-disable it here as desired. */
	if (unlikely(tx_flags & E1000_TX_FLAGS_NO_FCS))
		tx_desc->lower.data &= ~(cpu_to_le32(E1000_TXD_CMD_IFCS));

L
Linus Torvalds 已提交
3025 3026 3027
	/* Force memory writes to complete before letting h/w
	 * know there are new descriptors to fetch.  (Only
	 * applicable for weak-ordered memory model archs,
3028 3029
	 * such as IA-64).
	 */
L
Linus Torvalds 已提交
3030 3031 3032 3033 3034
	wmb();

	tx_ring->next_to_use = i;
}

3035
/* 82547 workaround to avoid controller hang in half-duplex environment.
L
Linus Torvalds 已提交
3036 3037 3038 3039 3040
 * The workaround is to avoid queuing a large packet that would span
 * the internal Tx FIFO ring boundary by notifying the stack to resend
 * the packet at a later time.  This gives the Tx FIFO an opportunity to
 * flush all packets.  When that occurs, we reset the Tx FIFO pointers
 * to the beginning of the Tx FIFO.
3041
 */
L
Linus Torvalds 已提交
3042 3043 3044 3045

#define E1000_FIFO_HDR			0x10
#define E1000_82547_PAD_LEN		0x3E0

3046 3047
static int e1000_82547_fifo_workaround(struct e1000_adapter *adapter,
				       struct sk_buff *skb)
L
Linus Torvalds 已提交
3048
{
3049 3050
	u32 fifo_space = adapter->tx_fifo_size - adapter->tx_fifo_head;
	u32 skb_fifo_len = skb->len + E1000_FIFO_HDR;
L
Linus Torvalds 已提交
3051

3052
	skb_fifo_len = ALIGN(skb_fifo_len, E1000_FIFO_HDR);
L
Linus Torvalds 已提交
3053

J
Jesse Brandeburg 已提交
3054
	if (adapter->link_duplex != HALF_DUPLEX)
L
Linus Torvalds 已提交
3055 3056
		goto no_fifo_stall_required;

J
Jesse Brandeburg 已提交
3057
	if (atomic_read(&adapter->tx_fifo_stall))
L
Linus Torvalds 已提交
3058 3059
		return 1;

J
Jesse Brandeburg 已提交
3060
	if (skb_fifo_len >= (E1000_82547_PAD_LEN + fifo_space)) {
L
Linus Torvalds 已提交
3061 3062 3063 3064 3065 3066
		atomic_set(&adapter->tx_fifo_stall, 1);
		return 1;
	}

no_fifo_stall_required:
	adapter->tx_fifo_head += skb_fifo_len;
J
Jesse Brandeburg 已提交
3067
	if (adapter->tx_fifo_head >= adapter->tx_fifo_size)
L
Linus Torvalds 已提交
3068 3069 3070 3071
		adapter->tx_fifo_head -= adapter->tx_fifo_size;
	return 0;
}

3072 3073 3074 3075 3076 3077 3078 3079
static int __e1000_maybe_stop_tx(struct net_device *netdev, int size)
{
	struct e1000_adapter *adapter = netdev_priv(netdev);
	struct e1000_tx_ring *tx_ring = adapter->tx_ring;

	netif_stop_queue(netdev);
	/* Herbert's original patch had:
	 *  smp_mb__after_netif_stop_queue();
3080 3081
	 * but since that doesn't exist yet, just open code it.
	 */
3082 3083 3084
	smp_mb();

	/* We need to check again in a case another CPU has just
3085 3086
	 * made room available.
	 */
3087 3088 3089 3090 3091
	if (likely(E1000_DESC_UNUSED(tx_ring) < size))
		return -EBUSY;

	/* A reprieve! */
	netif_start_queue(netdev);
3092
	++adapter->restart_queue;
3093 3094 3095 3096
	return 0;
}

/* Returns 0 when @tx_ring has at least @size unused descriptors; otherwise
 * defers to __e1000_maybe_stop_tx() and returns its result.
 */
static int e1000_maybe_stop_tx(struct net_device *netdev,
			       struct e1000_tx_ring *tx_ring, int size)
{
	if (unlikely(E1000_DESC_UNUSED(tx_ring) < size))
		return __e1000_maybe_stop_tx(netdev, size);

	return 0;
}

L
Linus Torvalds 已提交
3104
#define TXD_USE_COUNT(S, X) (((S) >> (X)) + 1 )
3105 3106
static netdev_tx_t e1000_xmit_frame(struct sk_buff *skb,
				    struct net_device *netdev)
L
Linus Torvalds 已提交
3107
{
3108
	struct e1000_adapter *adapter = netdev_priv(netdev);
J
Joe Perches 已提交
3109
	struct e1000_hw *hw = &adapter->hw;
3110
	struct e1000_tx_ring *tx_ring;
L
Linus Torvalds 已提交
3111 3112 3113
	unsigned int first, max_per_txd = E1000_MAX_DATA_PER_TXD;
	unsigned int max_txd_pwr = E1000_MAX_TXD_PWR;
	unsigned int tx_flags = 0;
E
Eric Dumazet 已提交
3114
	unsigned int len = skb_headlen(skb);
3115 3116
	unsigned int nr_frags;
	unsigned int mss;
L
Linus Torvalds 已提交
3117
	int count = 0;
3118
	int tso;
L
Linus Torvalds 已提交
3119
	unsigned int f;
3120
	__be16 protocol = vlan_get_protocol(skb);
L
Linus Torvalds 已提交
3121

3122
	/* This goes back to the question of how to logically map a Tx queue
3123
	 * to a flow.  Right now, performance is impacted slightly negatively
3124 3125 3126
	 * if using multiple Tx queues.  If the stack breaks away from a
	 * single qdisc implementation, we can look at this again.
	 */
3127
	tx_ring = adapter->tx_ring;
3128

3129 3130 3131 3132
	/* On PCI/PCI-X HW, if packet size is less than ETH_ZLEN,
	 * packets may get corrupted during padding by HW.
	 * To WA this issue, pad all small packets manually.
	 */
3133 3134
	if (eth_skb_pad(skb))
		return NETDEV_TX_OK;
3135

3136
	mss = skb_shinfo(skb)->gso_size;
3137
	/* The controller does a simple calculation to
L
Linus Torvalds 已提交
3138 3139 3140 3141
	 * make sure there is enough room in the FIFO before
	 * initiating the DMA for each buffer.  The calc is:
	 * 4 = ceil(buffer len/mss).  To make sure we don't
	 * overrun the FIFO, adjust the max buffer len if mss
3142 3143
	 * drops.
	 */
J
Jesse Brandeburg 已提交
3144
	if (mss) {
3145
		u8 hdr_len;
L
Linus Torvalds 已提交
3146 3147
		max_per_txd = min(mss << 2, max_per_txd);
		max_txd_pwr = fls(max_per_txd) - 1;
J
Jeff Kirsher 已提交
3148

3149
		hdr_len = skb_transport_offset(skb) + tcp_hdrlen(skb);
3150
		if (skb->data_len && hdr_len == len) {
J
Joe Perches 已提交
3151
			switch (hw->mac_type) {
3152
				unsigned int pull_size;
3153 3154 3155 3156 3157 3158
			case e1000_82544:
				/* Make sure we have room to chop off 4 bytes,
				 * and that the end alignment will work out to
				 * this hardware's requirements
				 * NOTE: this is a TSO only workaround
				 * if end byte alignment not correct move us
3159 3160 3161 3162
				 * into the next dword
				 */
				if ((unsigned long)(skb_tail_pointer(skb) - 1)
				    & 4)
3163 3164
					break;
				/* fall through */
3165 3166
				pull_size = min((unsigned int)4, skb->data_len);
				if (!__pskb_pull_tail(skb, pull_size)) {
3167 3168
					e_err(drv, "__pskb_pull_tail "
					      "failed.\n");
3169
					dev_kfree_skb_any(skb);
J
Jeff Garzik 已提交
3170
					return NETDEV_TX_OK;
3171
				}
E
Eric Dumazet 已提交
3172
				len = skb_headlen(skb);
3173 3174 3175 3176
				break;
			default:
				/* do nothing */
				break;
3177
			}
J
Jeff Kirsher 已提交
3178
		}
L
Linus Torvalds 已提交
3179 3180
	}

J
Jeff Kirsher 已提交
3181
	/* reserve a descriptor for the offload context */
3182
	if ((mss) || (skb->ip_summed == CHECKSUM_PARTIAL))
L
Linus Torvalds 已提交
3183
		count++;
3184
	count++;
J
Jeff Kirsher 已提交
3185 3186

	/* Controller Erratum workaround */
H
Herbert Xu 已提交
3187
	if (!skb->data_len && tx_ring->last_tx_tso && !skb_is_gso(skb))
J
Jeff Kirsher 已提交
3188 3189
		count++;

L
Linus Torvalds 已提交
3190 3191
	count += TXD_USE_COUNT(len, max_txd_pwr);

J
Jesse Brandeburg 已提交
3192
	if (adapter->pcix_82544)
L
Linus Torvalds 已提交
3193 3194
		count++;

J
Jesse Brandeburg 已提交
3195
	/* work-around for errata 10 and it applies to all controllers
3196 3197
	 * in PCI-X mode, so add one more descriptor to the count
	 */
J
Joe Perches 已提交
3198
	if (unlikely((hw->bus_type == e1000_bus_type_pcix) &&
3199 3200 3201
			(len > 2015)))
		count++;

L
Linus Torvalds 已提交
3202
	nr_frags = skb_shinfo(skb)->nr_frags;
J
Jesse Brandeburg 已提交
3203
	for (f = 0; f < nr_frags; f++)
E
Eric Dumazet 已提交
3204
		count += TXD_USE_COUNT(skb_frag_size(&skb_shinfo(skb)->frags[f]),
L
Linus Torvalds 已提交
3205
				       max_txd_pwr);
J
Jesse Brandeburg 已提交
3206
	if (adapter->pcix_82544)
L
Linus Torvalds 已提交
3207 3208 3209
		count += nr_frags;

	/* need: count + 2 desc gap to keep tail from touching
3210 3211
	 * head, otherwise try next time
	 */
3212
	if (unlikely(e1000_maybe_stop_tx(netdev, tx_ring, count + 2)))
L
Linus Torvalds 已提交
3213 3214
		return NETDEV_TX_BUSY;

3215 3216 3217 3218 3219 3220
	if (unlikely((hw->mac_type == e1000_82547) &&
		     (e1000_82547_fifo_workaround(adapter, skb)))) {
		netif_stop_queue(netdev);
		if (!test_bit(__E1000_DOWN, &adapter->flags))
			schedule_delayed_work(&adapter->fifo_stall_task, 1);
		return NETDEV_TX_BUSY;
L
Linus Torvalds 已提交
3221 3222
	}

3223
	if (skb_vlan_tag_present(skb)) {
L
Linus Torvalds 已提交
3224
		tx_flags |= E1000_TX_FLAGS_VLAN;
3225 3226
		tx_flags |= (skb_vlan_tag_get(skb) <<
			     E1000_TX_FLAGS_VLAN_SHIFT);
L
Linus Torvalds 已提交
3227 3228
	}

3229
	first = tx_ring->next_to_use;
J
Jesse Brandeburg 已提交
3230

3231
	tso = e1000_tso(adapter, tx_ring, skb, protocol);
L
Linus Torvalds 已提交
3232 3233 3234 3235 3236
	if (tso < 0) {
		dev_kfree_skb_any(skb);
		return NETDEV_TX_OK;
	}

J
Jeff Kirsher 已提交
3237
	if (likely(tso)) {
3238
		if (likely(hw->mac_type != e1000_82544))
3239
			tx_ring->last_tx_tso = true;
L
Linus Torvalds 已提交
3240
		tx_flags |= E1000_TX_FLAGS_TSO;
3241
	} else if (likely(e1000_tx_csum(adapter, tx_ring, skb, protocol)))
L
Linus Torvalds 已提交
3242 3243
		tx_flags |= E1000_TX_FLAGS_CSUM;

3244
	if (protocol == htons(ETH_P_IP))
3245 3246
		tx_flags |= E1000_TX_FLAGS_IPV4;

3247 3248 3249
	if (unlikely(skb->no_fcs))
		tx_flags |= E1000_TX_FLAGS_NO_FCS;

3250
	count = e1000_tx_map(adapter, tx_ring, skb, first, max_per_txd,
3251
			     nr_frags, mss);
L
Linus Torvalds 已提交
3252

3253
	if (count) {
3254
		netdev_sent_queue(netdev, skb->len);
3255 3256
		skb_tx_timestamp(skb);

3257 3258 3259
		e1000_tx_queue(adapter, tx_ring, tx_flags, count);
		/* Make sure there is space in the ring for the next send. */
		e1000_maybe_stop_tx(netdev, tx_ring, MAX_SKB_FRAGS + 2);
L
Linus Torvalds 已提交
3260

3261 3262 3263 3264 3265 3266 3267 3268 3269
		if (!skb->xmit_more ||
		    netif_xmit_stopped(netdev_get_tx_queue(netdev, 0))) {
			writel(tx_ring->next_to_use, hw->hw_addr + tx_ring->tdt);
			/* we need this if more than one processor can write to
			 * our tail at a time, it synchronizes IO on IA64/Altix
			 * systems
			 */
			mmiowb();
		}
3270 3271 3272 3273 3274
	} else {
		dev_kfree_skb_any(skb);
		tx_ring->buffer_info[first].time_stamp = 0;
		tx_ring->next_to_use = first;
	}
L
Linus Torvalds 已提交
3275 3276 3277 3278

	return NETDEV_TX_OK;
}

T
Tushar Dave 已提交
3279 3280 3281 3282 3283 3284 3285 3286
#define NUM_REGS 38 /* 1 based count */
static void e1000_regdump(struct e1000_adapter *adapter)
{
	struct e1000_hw *hw = &adapter->hw;
	u32 regs[NUM_REGS];
	u32 *regs_buff = regs;
	int i = 0;

3287 3288 3289 3290 3291 3292 3293 3294 3295 3296
	static const char * const reg_name[] = {
		"CTRL",  "STATUS",
		"RCTL", "RDLEN", "RDH", "RDT", "RDTR",
		"TCTL", "TDBAL", "TDBAH", "TDLEN", "TDH", "TDT",
		"TIDV", "TXDCTL", "TADV", "TARC0",
		"TDBAL1", "TDBAH1", "TDLEN1", "TDH1", "TDT1",
		"TXDCTL1", "TARC1",
		"CTRL_EXT", "ERT", "RDBAL", "RDBAH",
		"TDFH", "TDFT", "TDFHS", "TDFTS", "TDFPC",
		"RDFH", "RDFT", "RDFHS", "RDFTS", "RDFPC"
T
Tushar Dave 已提交
3297 3298 3299 3300 3301 3302 3303 3304 3305 3306 3307 3308 3309 3310 3311 3312 3313 3314 3315 3316 3317 3318 3319 3320 3321 3322 3323 3324 3325 3326 3327 3328 3329 3330 3331 3332 3333 3334 3335 3336 3337 3338 3339 3340 3341
	};

	regs_buff[0]  = er32(CTRL);
	regs_buff[1]  = er32(STATUS);

	regs_buff[2]  = er32(RCTL);
	regs_buff[3]  = er32(RDLEN);
	regs_buff[4]  = er32(RDH);
	regs_buff[5]  = er32(RDT);
	regs_buff[6]  = er32(RDTR);

	regs_buff[7]  = er32(TCTL);
	regs_buff[8]  = er32(TDBAL);
	regs_buff[9]  = er32(TDBAH);
	regs_buff[10] = er32(TDLEN);
	regs_buff[11] = er32(TDH);
	regs_buff[12] = er32(TDT);
	regs_buff[13] = er32(TIDV);
	regs_buff[14] = er32(TXDCTL);
	regs_buff[15] = er32(TADV);
	regs_buff[16] = er32(TARC0);

	regs_buff[17] = er32(TDBAL1);
	regs_buff[18] = er32(TDBAH1);
	regs_buff[19] = er32(TDLEN1);
	regs_buff[20] = er32(TDH1);
	regs_buff[21] = er32(TDT1);
	regs_buff[22] = er32(TXDCTL1);
	regs_buff[23] = er32(TARC1);
	regs_buff[24] = er32(CTRL_EXT);
	regs_buff[25] = er32(ERT);
	regs_buff[26] = er32(RDBAL0);
	regs_buff[27] = er32(RDBAH0);
	regs_buff[28] = er32(TDFH);
	regs_buff[29] = er32(TDFT);
	regs_buff[30] = er32(TDFHS);
	regs_buff[31] = er32(TDFTS);
	regs_buff[32] = er32(TDFPC);
	regs_buff[33] = er32(RDFH);
	regs_buff[34] = er32(RDFT);
	regs_buff[35] = er32(RDFHS);
	regs_buff[36] = er32(RDFTS);
	regs_buff[37] = er32(RDFPC);

	pr_info("Register dump\n");
3342 3343
	for (i = 0; i < NUM_REGS; i++)
		pr_info("%-15s  %08x\n", reg_name[i], regs_buff[i]);
T
Tushar Dave 已提交
3344 3345 3346 3347 3348 3349 3350 3351 3352 3353 3354 3355 3356 3357 3358 3359 3360 3361
}

/*
 * e1000_dump: Print registers, tx ring and rx ring
 */
static void e1000_dump(struct e1000_adapter *adapter)
{
	/* this code doesn't handle multiple rings */
	struct e1000_tx_ring *tx_ring = adapter->tx_ring;
	struct e1000_rx_ring *rx_ring = adapter->rx_ring;
	int i;

	if (!netif_msg_hw(adapter))
		return;

	/* Print Registers */
	e1000_regdump(adapter);

3362
	/* transmit dump */
T
Tushar Dave 已提交
3363 3364 3365 3366 3367 3368 3369 3370 3371 3372 3373 3374 3375 3376 3377 3378 3379 3380 3381 3382 3383 3384 3385 3386 3387 3388 3389 3390 3391
	pr_info("TX Desc ring0 dump\n");

	/* Transmit Descriptor Formats - DEXT[29] is 0 (Legacy) or 1 (Extended)
	 *
	 * Legacy Transmit Descriptor
	 *   +--------------------------------------------------------------+
	 * 0 |         Buffer Address [63:0] (Reserved on Write Back)       |
	 *   +--------------------------------------------------------------+
	 * 8 | Special  |    CSS     | Status |  CMD    |  CSO   |  Length  |
	 *   +--------------------------------------------------------------+
	 *   63       48 47        36 35    32 31     24 23    16 15        0
	 *
	 * Extended Context Descriptor (DTYP=0x0) for TSO or checksum offload
	 *   63      48 47    40 39       32 31             16 15    8 7      0
	 *   +----------------------------------------------------------------+
	 * 0 |  TUCSE  | TUCS0  |   TUCSS   |     IPCSE       | IPCS0 | IPCSS |
	 *   +----------------------------------------------------------------+
	 * 8 |   MSS   | HDRLEN | RSV | STA | TUCMD | DTYP |      PAYLEN      |
	 *   +----------------------------------------------------------------+
	 *   63      48 47    40 39 36 35 32 31   24 23  20 19                0
	 *
	 * Extended Data Descriptor (DTYP=0x1)
	 *   +----------------------------------------------------------------+
	 * 0 |                     Buffer Address [63:0]                      |
	 *   +----------------------------------------------------------------+
	 * 8 | VLAN tag |  POPTS  | Rsvd | Status | Command | DTYP |  DTALEN  |
	 *   +----------------------------------------------------------------+
	 *   63       48 47     40 39  36 35    32 31     24 23  20 19        0
	 */
3392 3393
	pr_info("Tc[desc]     [Ce CoCsIpceCoS] [MssHlRSCm0Plen] [bi->dma       ] leng  ntw timestmp         bi->skb\n");
	pr_info("Td[desc]     [address 63:0  ] [VlaPoRSCm1Dlen] [bi->dma       ] leng  ntw timestmp         bi->skb\n");
T
Tushar Dave 已提交
3394 3395 3396 3397 3398 3399

	if (!netif_msg_tx_done(adapter))
		goto rx_ring_summary;

	for (i = 0; tx_ring->desc && (i < tx_ring->count); i++) {
		struct e1000_tx_desc *tx_desc = E1000_TX_DESC(*tx_ring, i);
3400
		struct e1000_tx_buffer *buffer_info = &tx_ring->buffer_info[i];
3401
		struct my_u { __le64 a; __le64 b; };
T
Tushar Dave 已提交
3402
		struct my_u *u = (struct my_u *)tx_desc;
3403 3404
		const char *type;

T
Tushar Dave 已提交
3405
		if (i == tx_ring->next_to_use && i == tx_ring->next_to_clean)
3406
			type = "NTC/U";
T
Tushar Dave 已提交
3407
		else if (i == tx_ring->next_to_use)
3408
			type = "NTU";
T
Tushar Dave 已提交
3409
		else if (i == tx_ring->next_to_clean)
3410
			type = "NTC";
T
Tushar Dave 已提交
3411
		else
3412
			type = "";
T
Tushar Dave 已提交
3413

3414 3415 3416 3417 3418 3419
		pr_info("T%c[0x%03X]    %016llX %016llX %016llX %04X  %3X %016llX %p %s\n",
			((le64_to_cpu(u->b) & (1<<20)) ? 'd' : 'c'), i,
			le64_to_cpu(u->a), le64_to_cpu(u->b),
			(u64)buffer_info->dma, buffer_info->length,
			buffer_info->next_to_watch,
			(u64)buffer_info->time_stamp, buffer_info->skb, type);
T
Tushar Dave 已提交
3420 3421 3422
	}

rx_ring_summary:
3423
	/* receive dump */
T
Tushar Dave 已提交
3424 3425 3426 3427 3428 3429 3430 3431 3432 3433 3434
	pr_info("\nRX Desc ring dump\n");

	/* Legacy Receive Descriptor Format
	 *
	 * +-----------------------------------------------------+
	 * |                Buffer Address [63:0]                |
	 * +-----------------------------------------------------+
	 * | VLAN Tag | Errors | Status 0 | Packet csum | Length |
	 * +-----------------------------------------------------+
	 * 63       48 47    40 39      32 31         16 15      0
	 */
3435
	pr_info("R[desc]      [address 63:0  ] [vl er S cks ln] [bi->dma       ] [bi->skb]\n");
T
Tushar Dave 已提交
3436 3437 3438 3439 3440 3441

	if (!netif_msg_rx_status(adapter))
		goto exit;

	for (i = 0; rx_ring->desc && (i < rx_ring->count); i++) {
		struct e1000_rx_desc *rx_desc = E1000_RX_DESC(*rx_ring, i);
3442
		struct e1000_rx_buffer *buffer_info = &rx_ring->buffer_info[i];
3443
		struct my_u { __le64 a; __le64 b; };
T
Tushar Dave 已提交
3444
		struct my_u *u = (struct my_u *)rx_desc;
3445 3446
		const char *type;

T
Tushar Dave 已提交
3447
		if (i == rx_ring->next_to_use)
3448
			type = "NTU";
T
Tushar Dave 已提交
3449
		else if (i == rx_ring->next_to_clean)
3450
			type = "NTC";
T
Tushar Dave 已提交
3451
		else
3452
			type = "";
T
Tushar Dave 已提交
3453

3454 3455
		pr_info("R[0x%03X]     %016llX %016llX %016llX %p %s\n",
			i, le64_to_cpu(u->a), le64_to_cpu(u->b),
F
Florian Westphal 已提交
3456
			(u64)buffer_info->dma, buffer_info->rxbuf.data, type);
T
Tushar Dave 已提交
3457 3458 3459 3460
	} /* for */

	/* dump the descriptor caches */
	/* rx */
3461
	pr_info("Rx descriptor cache in 64bit format\n");
T
Tushar Dave 已提交
3462
	for (i = 0x6000; i <= 0x63FF ; i += 0x10) {
3463 3464 3465 3466 3467 3468
		pr_info("R%04X: %08X|%08X %08X|%08X\n",
			i,
			readl(adapter->hw.hw_addr + i+4),
			readl(adapter->hw.hw_addr + i),
			readl(adapter->hw.hw_addr + i+12),
			readl(adapter->hw.hw_addr + i+8));
T
Tushar Dave 已提交
3469 3470
	}
	/* tx */
3471
	pr_info("Tx descriptor cache in 64bit format\n");
T
Tushar Dave 已提交
3472
	for (i = 0x7000; i <= 0x73FF ; i += 0x10) {
3473 3474 3475 3476 3477 3478
		pr_info("T%04X: %08X|%08X %08X|%08X\n",
			i,
			readl(adapter->hw.hw_addr + i+4),
			readl(adapter->hw.hw_addr + i),
			readl(adapter->hw.hw_addr + i+12),
			readl(adapter->hw.hw_addr + i+8));
T
Tushar Dave 已提交
3479 3480 3481 3482 3483
	}
exit:
	return;
}

L
Linus Torvalds 已提交
3484 3485 3486 3487
/**
 * e1000_tx_timeout - Respond to a Tx Hang
 * @netdev: network interface device structure
 **/
3488
static void e1000_tx_timeout(struct net_device *netdev)
L
Linus Torvalds 已提交
3489
{
3490
	struct e1000_adapter *adapter = netdev_priv(netdev);
L
Linus Torvalds 已提交
3491 3492

	/* Do the reset outside of interrupt context */
3493 3494
	adapter->tx_timeout_count++;
	schedule_work(&adapter->reset_task);
L
Linus Torvalds 已提交
3495 3496
}

3497
static void e1000_reset_task(struct work_struct *work)
L
Linus Torvalds 已提交
3498
{
3499 3500
	struct e1000_adapter *adapter =
		container_of(work, struct e1000_adapter, reset_task);
L
Linus Torvalds 已提交
3501

T
Tushar Dave 已提交
3502
	e_err(drv, "Reset adapter\n");
3503
	e1000_reinit_locked(adapter);
L
Linus Torvalds 已提交
3504 3505 3506 3507 3508 3509 3510
}

/**
 * e1000_get_stats - Get System Network Statistics
 * @netdev: network interface device structure
 *
 * Returns the address of the device statistics structure.
3511
 * The statistics are actually updated from the watchdog.
L
Linus Torvalds 已提交
3512
 **/
3513
static struct net_device_stats *e1000_get_stats(struct net_device *netdev)
L
Linus Torvalds 已提交
3514
{
J
Jeff Kirsher 已提交
3515
	/* only return the current stats */
3516
	return &netdev->stats;
L
Linus Torvalds 已提交
3517 3518 3519 3520 3521 3522 3523 3524 3525
}

/**
 * e1000_change_mtu - Change the Maximum Transfer Unit
 * @netdev: network interface device structure
 * @new_mtu: new value for maximum frame size
 *
 * Returns 0 on success, negative on failure
 **/
3526
static int e1000_change_mtu(struct net_device *netdev, int new_mtu)
L
Linus Torvalds 已提交
3527
{
3528
	struct e1000_adapter *adapter = netdev_priv(netdev);
J
Joe Perches 已提交
3529
	struct e1000_hw *hw = &adapter->hw;
L
Linus Torvalds 已提交
3530 3531
	int max_frame = new_mtu + ENET_HEADER_SIZE + ETHERNET_FCS_SIZE;

J
Jesse Brandeburg 已提交
3532 3533
	if ((max_frame < MINIMUM_ETHERNET_FRAME_SIZE) ||
	    (max_frame > MAX_JUMBO_FRAME_SIZE)) {
3534
		e_err(probe, "Invalid MTU setting\n");
L
Linus Torvalds 已提交
3535
		return -EINVAL;
3536
	}
L
Linus Torvalds 已提交
3537

3538
	/* Adapter-specific max frame size limits. */
J
Joe Perches 已提交
3539
	switch (hw->mac_type) {
3540
	case e1000_undefined ... e1000_82542_rev2_1:
3541
		if (max_frame > (ETH_FRAME_LEN + ETH_FCS_LEN)) {
3542
			e_err(probe, "Jumbo Frames not supported.\n");
3543 3544
			return -EINVAL;
		}
3545 3546 3547 3548
		break;
	default:
		/* Capable of supporting up to MAX_JUMBO_FRAME_SIZE limit. */
		break;
L
Linus Torvalds 已提交
3549 3550
	}

3551 3552 3553 3554 3555 3556 3557
	while (test_and_set_bit(__E1000_RESETTING, &adapter->flags))
		msleep(1);
	/* e1000_down has a dependency on max_frame_size */
	hw->max_frame_size = max_frame;
	if (netif_running(netdev))
		e1000_down(adapter);

3558
	/* NOTE: netdev_alloc_skb reserves 16 bytes, and typically NET_IP_ALIGN
3559
	 * means we reserve 2 more, this pushes us to allocate from the next
3560 3561
	 * larger slab size.
	 * i.e. RXBUFFER_2048 --> size-4096 slab
3562 3563 3564
	 * however with the new *_jumbo_rx* routines, jumbo receives will use
	 * fragmented skbs
	 */
3565

3566
	if (max_frame <= E1000_RXBUFFER_2048)
3567
		adapter->rx_buffer_len = E1000_RXBUFFER_2048;
3568 3569
	else
#if (PAGE_SIZE >= E1000_RXBUFFER_16384)
3570
		adapter->rx_buffer_len = E1000_RXBUFFER_16384;
3571 3572 3573
#elif (PAGE_SIZE >= E1000_RXBUFFER_4096)
		adapter->rx_buffer_len = PAGE_SIZE;
#endif
3574 3575

	/* adjust allocation if LPE protects us, and we aren't using SBP */
J
Joe Perches 已提交
3576
	if (!hw->tbi_compatibility_on &&
3577
	    ((max_frame == (ETH_FRAME_LEN + ETH_FCS_LEN)) ||
3578 3579
	     (max_frame == MAXIMUM_ETHERNET_VLAN_SIZE)))
		adapter->rx_buffer_len = MAXIMUM_ETHERNET_VLAN_SIZE;
3580

3581 3582
	pr_info("%s changing MTU from %d to %d\n",
		netdev->name, netdev->mtu, new_mtu);
3583 3584
	netdev->mtu = new_mtu;

3585
	if (netif_running(netdev))
3586 3587 3588 3589 3590
		e1000_up(adapter);
	else
		e1000_reset(adapter);

	clear_bit(__E1000_RESETTING, &adapter->flags);
L
Linus Torvalds 已提交
3591 3592 3593 3594 3595 3596 3597 3598

	return 0;
}

/**
 * e1000_update_stats - Update the board statistics counters
 * @adapter: board private structure
 **/
3599
void e1000_update_stats(struct e1000_adapter *adapter)
L
Linus Torvalds 已提交
3600
{
3601
	struct net_device *netdev = adapter->netdev;
L
Linus Torvalds 已提交
3602
	struct e1000_hw *hw = &adapter->hw;
3603
	struct pci_dev *pdev = adapter->pdev;
L
Linus Torvalds 已提交
3604
	unsigned long flags;
3605
	u16 phy_tmp;
L
Linus Torvalds 已提交
3606 3607 3608

#define PHY_IDLE_ERROR_COUNT_MASK 0x00FF

3609
	/* Prevent stats update while adapter is being reset, or if the pci
3610 3611
	 * connection is down.
	 */
A
Auke Kok 已提交
3612
	if (adapter->link_speed == 0)
3613
		return;
3614
	if (pci_channel_offline(pdev))
A
Auke Kok 已提交
3615 3616
		return;

L
Linus Torvalds 已提交
3617 3618
	spin_lock_irqsave(&adapter->stats_lock, flags);

3619
	/* these counters are modified from e1000_tbi_adjust_stats,
L
Linus Torvalds 已提交
3620 3621 3622 3623
	 * called from the interrupt context, so they must only
	 * be written while holding adapter->stats_lock
	 */

J
Joe Perches 已提交
3624 3625 3626 3627 3628 3629 3630 3631
	adapter->stats.crcerrs += er32(CRCERRS);
	adapter->stats.gprc += er32(GPRC);
	adapter->stats.gorcl += er32(GORCL);
	adapter->stats.gorch += er32(GORCH);
	adapter->stats.bprc += er32(BPRC);
	adapter->stats.mprc += er32(MPRC);
	adapter->stats.roc += er32(ROC);

3632 3633 3634 3635 3636 3637
	adapter->stats.prc64 += er32(PRC64);
	adapter->stats.prc127 += er32(PRC127);
	adapter->stats.prc255 += er32(PRC255);
	adapter->stats.prc511 += er32(PRC511);
	adapter->stats.prc1023 += er32(PRC1023);
	adapter->stats.prc1522 += er32(PRC1522);
J
Joe Perches 已提交
3638 3639 3640 3641 3642 3643 3644 3645 3646 3647 3648 3649 3650 3651 3652 3653 3654 3655 3656 3657 3658 3659 3660 3661 3662 3663 3664 3665

	adapter->stats.symerrs += er32(SYMERRS);
	adapter->stats.mpc += er32(MPC);
	adapter->stats.scc += er32(SCC);
	adapter->stats.ecol += er32(ECOL);
	adapter->stats.mcc += er32(MCC);
	adapter->stats.latecol += er32(LATECOL);
	adapter->stats.dc += er32(DC);
	adapter->stats.sec += er32(SEC);
	adapter->stats.rlec += er32(RLEC);
	adapter->stats.xonrxc += er32(XONRXC);
	adapter->stats.xontxc += er32(XONTXC);
	adapter->stats.xoffrxc += er32(XOFFRXC);
	adapter->stats.xofftxc += er32(XOFFTXC);
	adapter->stats.fcruc += er32(FCRUC);
	adapter->stats.gptc += er32(GPTC);
	adapter->stats.gotcl += er32(GOTCL);
	adapter->stats.gotch += er32(GOTCH);
	adapter->stats.rnbc += er32(RNBC);
	adapter->stats.ruc += er32(RUC);
	adapter->stats.rfc += er32(RFC);
	adapter->stats.rjc += er32(RJC);
	adapter->stats.torl += er32(TORL);
	adapter->stats.torh += er32(TORH);
	adapter->stats.totl += er32(TOTL);
	adapter->stats.toth += er32(TOTH);
	adapter->stats.tpr += er32(TPR);

3666 3667 3668 3669 3670 3671
	adapter->stats.ptc64 += er32(PTC64);
	adapter->stats.ptc127 += er32(PTC127);
	adapter->stats.ptc255 += er32(PTC255);
	adapter->stats.ptc511 += er32(PTC511);
	adapter->stats.ptc1023 += er32(PTC1023);
	adapter->stats.ptc1522 += er32(PTC1522);
J
Joe Perches 已提交
3672 3673 3674

	adapter->stats.mptc += er32(MPTC);
	adapter->stats.bptc += er32(BPTC);
L
Linus Torvalds 已提交
3675 3676 3677

	/* used for adaptive IFS */

J
Joe Perches 已提交
3678
	hw->tx_packet_delta = er32(TPT);
L
Linus Torvalds 已提交
3679
	adapter->stats.tpt += hw->tx_packet_delta;
J
Joe Perches 已提交
3680
	hw->collision_delta = er32(COLC);
L
Linus Torvalds 已提交
3681 3682
	adapter->stats.colc += hw->collision_delta;

J
Jesse Brandeburg 已提交
3683
	if (hw->mac_type >= e1000_82543) {
J
Joe Perches 已提交
3684 3685 3686 3687 3688 3689
		adapter->stats.algnerrc += er32(ALGNERRC);
		adapter->stats.rxerrc += er32(RXERRC);
		adapter->stats.tncrs += er32(TNCRS);
		adapter->stats.cexterr += er32(CEXTERR);
		adapter->stats.tsctc += er32(TSCTC);
		adapter->stats.tsctfc += er32(TSCTFC);
L
Linus Torvalds 已提交
3690 3691 3692
	}

	/* Fill out the OS statistics structure */
3693 3694
	netdev->stats.multicast = adapter->stats.mprc;
	netdev->stats.collisions = adapter->stats.colc;
L
Linus Torvalds 已提交
3695 3696 3697

	/* Rx Errors */

3698
	/* RLEC on some newer hardware can be incorrect so build
3699 3700
	 * our own version based on RUC and ROC
	 */
3701
	netdev->stats.rx_errors = adapter->stats.rxerrc +
L
Linus Torvalds 已提交
3702
		adapter->stats.crcerrs + adapter->stats.algnerrc +
3703 3704
		adapter->stats.ruc + adapter->stats.roc +
		adapter->stats.cexterr;
3705
	adapter->stats.rlerrc = adapter->stats.ruc + adapter->stats.roc;
3706 3707 3708 3709
	netdev->stats.rx_length_errors = adapter->stats.rlerrc;
	netdev->stats.rx_crc_errors = adapter->stats.crcerrs;
	netdev->stats.rx_frame_errors = adapter->stats.algnerrc;
	netdev->stats.rx_missed_errors = adapter->stats.mpc;
L
Linus Torvalds 已提交
3710 3711

	/* Tx Errors */
3712
	adapter->stats.txerrc = adapter->stats.ecol + adapter->stats.latecol;
3713 3714 3715 3716
	netdev->stats.tx_errors = adapter->stats.txerrc;
	netdev->stats.tx_aborted_errors = adapter->stats.ecol;
	netdev->stats.tx_window_errors = adapter->stats.latecol;
	netdev->stats.tx_carrier_errors = adapter->stats.tncrs;
J
Joe Perches 已提交
3717
	if (hw->bad_tx_carr_stats_fd &&
3718
	    adapter->link_duplex == FULL_DUPLEX) {
3719
		netdev->stats.tx_carrier_errors = 0;
3720 3721
		adapter->stats.tncrs = 0;
	}
L
Linus Torvalds 已提交
3722 3723 3724 3725

	/* Tx Dropped needs to be maintained elsewhere */

	/* Phy Stats */
J
Jesse Brandeburg 已提交
3726 3727
	if (hw->media_type == e1000_media_type_copper) {
		if ((adapter->link_speed == SPEED_1000) &&
L
Linus Torvalds 已提交
3728 3729 3730 3731 3732
		   (!e1000_read_phy_reg(hw, PHY_1000T_STATUS, &phy_tmp))) {
			phy_tmp &= PHY_IDLE_ERROR_COUNT_MASK;
			adapter->phy_stats.idle_errors += phy_tmp;
		}

J
Jesse Brandeburg 已提交
3733
		if ((hw->mac_type <= e1000_82546) &&
L
Linus Torvalds 已提交
3734 3735 3736 3737 3738
		   (hw->phy_type == e1000_phy_m88) &&
		   !e1000_read_phy_reg(hw, M88E1000_RX_ERR_CNTR, &phy_tmp))
			adapter->phy_stats.receive_errors += phy_tmp;
	}

3739
	/* Management Stats */
J
Joe Perches 已提交
3740 3741 3742 3743
	if (hw->has_smbus) {
		adapter->stats.mgptc += er32(MGTPTC);
		adapter->stats.mgprc += er32(MGTPRC);
		adapter->stats.mgpdc += er32(MGTPDC);
3744 3745
	}

L
Linus Torvalds 已提交
3746 3747
	spin_unlock_irqrestore(&adapter->stats_lock, flags);
}
3748

L
Linus Torvalds 已提交
3749 3750 3751 3752 3753
/**
 * e1000_intr - Interrupt Handler
 * @irq: interrupt number
 * @data: pointer to a network interface device structure
 **/
3754
static irqreturn_t e1000_intr(int irq, void *data)
L
Linus Torvalds 已提交
3755 3756
{
	struct net_device *netdev = data;
3757
	struct e1000_adapter *adapter = netdev_priv(netdev);
L
Linus Torvalds 已提交
3758
	struct e1000_hw *hw = &adapter->hw;
3759
	u32 icr = er32(ICR);
3760

J
Jesse Brandeburg 已提交
3761
	if (unlikely((!icr)))
J
Jesse Brandeburg 已提交
3762 3763
		return IRQ_NONE;  /* Not our interrupt */

3764
	/* we might have caused the interrupt, but the above
J
Jesse Brandeburg 已提交
3765 3766 3767 3768 3769 3770
	 * read cleared it, and just in case the driver is
	 * down there is nothing to do so return handled
	 */
	if (unlikely(test_bit(__E1000_DOWN, &adapter->flags)))
		return IRQ_HANDLED;

J
Jesse Brandeburg 已提交
3771
	if (unlikely(icr & (E1000_ICR_RXSEQ | E1000_ICR_LSC))) {
L
Linus Torvalds 已提交
3772
		hw->get_link_status = 1;
A
Auke Kok 已提交
3773 3774
		/* guard against interrupt when we're going down */
		if (!test_bit(__E1000_DOWN, &adapter->flags))
3775
			schedule_delayed_work(&adapter->watchdog_task, 1);
L
Linus Torvalds 已提交
3776 3777
	}

3778 3779 3780 3781
	/* disable interrupts, without the synchronize_irq bit */
	ew32(IMC, ~0);
	E1000_WRITE_FLUSH();

3782
	if (likely(napi_schedule_prep(&adapter->napi))) {
J
Jesse Brandeburg 已提交
3783 3784 3785 3786
		adapter->total_tx_bytes = 0;
		adapter->total_tx_packets = 0;
		adapter->total_rx_bytes = 0;
		adapter->total_rx_packets = 0;
3787
		__napi_schedule(&adapter->napi);
3788
	} else {
3789
		/* this really should not happen! if it does it is basically a
3790 3791
		 * bug, but not a hard error, so enable ints and continue
		 */
3792 3793 3794
		if (!test_bit(__E1000_DOWN, &adapter->flags))
			e1000_irq_enable(adapter);
	}
L
Linus Torvalds 已提交
3795 3796 3797 3798 3799 3800 3801 3802

	return IRQ_HANDLED;
}

/**
 * e1000_clean - NAPI Rx polling callback
 * @adapter: board private structure
 **/
3803
static int e1000_clean(struct napi_struct *napi, int budget)
L
Linus Torvalds 已提交
3804
{
3805 3806
	struct e1000_adapter *adapter = container_of(napi, struct e1000_adapter,
						     napi);
3807
	int tx_clean_complete = 0, work_done = 0;
3808

3809
	tx_clean_complete = e1000_clean_tx_irq(adapter, &adapter->tx_ring[0]);
3810

3811
	adapter->clean_rx(adapter, &adapter->rx_ring[0], &work_done, budget);
3812

3813
	if (!tx_clean_complete)
3814 3815
		work_done = budget;

3816 3817
	/* If budget not fully consumed, exit the polling mode */
	if (work_done < budget) {
J
Jesse Brandeburg 已提交
3818 3819
		if (likely(adapter->itr_setting & 3))
			e1000_set_itr(adapter);
3820
		napi_complete(napi);
3821 3822
		if (!test_bit(__E1000_DOWN, &adapter->flags))
			e1000_irq_enable(adapter);
L
Linus Torvalds 已提交
3823 3824
	}

3825
	return work_done;
L
Linus Torvalds 已提交
3826 3827 3828 3829 3830 3831
}

/**
 * e1000_clean_tx_irq - Reclaim resources after transmit completes
 * @adapter: board private structure
 **/
3832 3833
static bool e1000_clean_tx_irq(struct e1000_adapter *adapter,
			       struct e1000_tx_ring *tx_ring)
L
Linus Torvalds 已提交
3834
{
J
Joe Perches 已提交
3835
	struct e1000_hw *hw = &adapter->hw;
L
Linus Torvalds 已提交
3836 3837
	struct net_device *netdev = adapter->netdev;
	struct e1000_tx_desc *tx_desc, *eop_desc;
3838
	struct e1000_tx_buffer *buffer_info;
L
Linus Torvalds 已提交
3839
	unsigned int i, eop;
3840
	unsigned int count = 0;
J
Jesse Brandeburg 已提交
3841
	unsigned int total_tx_bytes=0, total_tx_packets=0;
3842
	unsigned int bytes_compl = 0, pkts_compl = 0;
L
Linus Torvalds 已提交
3843 3844 3845 3846 3847

	i = tx_ring->next_to_clean;
	eop = tx_ring->buffer_info[i].next_to_watch;
	eop_desc = E1000_TX_DESC(*tx_ring, eop);

3848 3849
	while ((eop_desc->upper.data & cpu_to_le32(E1000_TXD_STAT_DD)) &&
	       (count < tx_ring->count)) {
3850
		bool cleaned = false;
3851
		rmb();	/* read buffer_info after eop_desc */
3852
		for ( ; !cleaned; count++) {
L
Linus Torvalds 已提交
3853 3854 3855 3856
			tx_desc = E1000_TX_DESC(*tx_ring, i);
			buffer_info = &tx_ring->buffer_info[i];
			cleaned = (i == eop);

J
Jesse Brandeburg 已提交
3857
			if (cleaned) {
3858 3859
				total_tx_packets += buffer_info->segs;
				total_tx_bytes += buffer_info->bytecount;
3860 3861 3862 3863 3864
				if (buffer_info->skb) {
					bytes_compl += buffer_info->skb->len;
					pkts_compl++;
				}

J
Jesse Brandeburg 已提交
3865
			}
J
Jeff Kirsher 已提交
3866
			e1000_unmap_and_free_tx_resource(adapter, buffer_info);
3867
			tx_desc->upper.data = 0;
L
Linus Torvalds 已提交
3868

J
Jesse Brandeburg 已提交
3869
			if (unlikely(++i == tx_ring->count)) i = 0;
L
Linus Torvalds 已提交
3870
		}
3871

L
Linus Torvalds 已提交
3872 3873 3874 3875 3876 3877
		eop = tx_ring->buffer_info[i].next_to_watch;
		eop_desc = E1000_TX_DESC(*tx_ring, eop);
	}

	tx_ring->next_to_clean = i;

3878 3879
	netdev_completed_queue(netdev, pkts_compl, bytes_compl);

3880
#define TX_WAKE_THRESHOLD 32
3881
	if (unlikely(count && netif_carrier_ok(netdev) &&
3882 3883 3884 3885 3886
		     E1000_DESC_UNUSED(tx_ring) >= TX_WAKE_THRESHOLD)) {
		/* Make sure that anybody stopping the queue after this
		 * sees the new next_to_clean.
		 */
		smp_mb();
3887 3888 3889

		if (netif_queue_stopped(netdev) &&
		    !(test_bit(__E1000_DOWN, &adapter->flags))) {
3890
			netif_wake_queue(netdev);
3891 3892
			++adapter->restart_queue;
		}
3893
	}
3894

3895
	if (adapter->detect_tx_hung) {
3896
		/* Detect a transmit hang in hardware, this serializes the
3897 3898
		 * check with the clearing of time_stamp and movement of i
		 */
J
Joe Perches 已提交
3899
		adapter->detect_tx_hung = false;
3900 3901
		if (tx_ring->buffer_info[eop].time_stamp &&
		    time_after(jiffies, tx_ring->buffer_info[eop].time_stamp +
3902
			       (adapter->tx_timeout_factor * HZ)) &&
3903
		    !(er32(STATUS) & E1000_STATUS_TXOFF)) {
3904 3905

			/* detected Tx unit hang */
3906
			e_err(drv, "Detected Tx Unit Hang\n"
3907 3908 3909 3910 3911 3912 3913 3914 3915 3916
			      "  Tx Queue             <%lu>\n"
			      "  TDH                  <%x>\n"
			      "  TDT                  <%x>\n"
			      "  next_to_use          <%x>\n"
			      "  next_to_clean        <%x>\n"
			      "buffer_info[next_to_clean]\n"
			      "  time_stamp           <%lx>\n"
			      "  next_to_watch        <%x>\n"
			      "  jiffies              <%lx>\n"
			      "  next_to_watch.status <%x>\n",
3917
				(unsigned long)(tx_ring - adapter->tx_ring),
J
Joe Perches 已提交
3918 3919
				readl(hw->hw_addr + tx_ring->tdh),
				readl(hw->hw_addr + tx_ring->tdt),
3920
				tx_ring->next_to_use,
3921
				tx_ring->next_to_clean,
3922
				tx_ring->buffer_info[eop].time_stamp,
3923 3924 3925
				eop,
				jiffies,
				eop_desc->upper.fields.status);
T
Tushar Dave 已提交
3926
			e1000_dump(adapter);
L
Linus Torvalds 已提交
3927
			netif_stop_queue(netdev);
3928
		}
L
Linus Torvalds 已提交
3929
	}
J
Jesse Brandeburg 已提交
3930 3931
	adapter->total_tx_bytes += total_tx_bytes;
	adapter->total_tx_packets += total_tx_packets;
3932 3933
	netdev->stats.tx_bytes += total_tx_bytes;
	netdev->stats.tx_packets += total_tx_packets;
3934
	return count < tx_ring->count;
L
Linus Torvalds 已提交
3935 3936 3937 3938
}

/**
 * e1000_rx_checksum - Receive Checksum Offload for 82543
3939 3940 3941 3942
 * @adapter:     board private structure
 * @status_err:  receive descriptor status and error fields
 * @csum:        receive descriptor csum field
 * @sk_buff:     socket buffer with received data
L
Linus Torvalds 已提交
3943
 **/
3944 3945
static void e1000_rx_checksum(struct e1000_adapter *adapter, u32 status_err,
			      u32 csum, struct sk_buff *skb)
L
Linus Torvalds 已提交
3946
{
J
Joe Perches 已提交
3947
	struct e1000_hw *hw = &adapter->hw;
3948 3949
	u16 status = (u16)status_err;
	u8 errors = (u8)(status_err >> 24);
3950 3951

	skb_checksum_none_assert(skb);
3952

L
Linus Torvalds 已提交
3953
	/* 82543 or newer only */
J
Joe Perches 已提交
3954
	if (unlikely(hw->mac_type < e1000_82543)) return;
L
Linus Torvalds 已提交
3955
	/* Ignore Checksum bit is set */
J
Jesse Brandeburg 已提交
3956
	if (unlikely(status & E1000_RXD_STAT_IXSM)) return;
3957
	/* TCP/UDP checksum error bit is set */
J
Jesse Brandeburg 已提交
3958
	if (unlikely(errors & E1000_RXD_ERR_TCPE)) {
L
Linus Torvalds 已提交
3959 3960
		/* let the stack verify checksum errors */
		adapter->hw_csum_err++;
3961 3962 3963
		return;
	}
	/* TCP/UDP Checksum has not been calculated */
3964 3965 3966
	if (!(status & E1000_RXD_STAT_TCPCS))
		return;

3967 3968
	/* It must be a TCP or UDP packet with a valid checksum */
	if (likely(status & E1000_RXD_STAT_TCPCS)) {
L
Linus Torvalds 已提交
3969 3970 3971
		/* TCP checksum is good */
		skb->ip_summed = CHECKSUM_UNNECESSARY;
	}
3972
	adapter->hw_csum_good++;
L
Linus Torvalds 已提交
3973 3974
}

3975
/**
F
Florian Westphal 已提交
3976
 * e1000_consume_page - helper function for jumbo Rx path
3977
 **/
3978
static void e1000_consume_page(struct e1000_rx_buffer *bi, struct sk_buff *skb,
3979
			       u16 length)
3980
{
F
Florian Westphal 已提交
3981
	bi->rxbuf.page = NULL;
3982 3983
	skb->len += length;
	skb->data_len += length;
3984
	skb->truesize += PAGE_SIZE;
3985 3986 3987 3988 3989 3990 3991 3992 3993 3994 3995 3996
}

/**
 * e1000_receive_skb - helper function to handle rx indications
 * @adapter: board private structure
 * @status: descriptor status field as written by hardware
 * @vlan: descriptor vlan field as written by hardware (no le/be conversion)
 * @skb: pointer to sk_buff to be indicated to stack
 *
 * Sets the skb protocol, attaches the 802.1Q tag when the descriptor status
 * has the VP bit set, and passes the skb to GRO.
 */
static void e1000_receive_skb(struct e1000_adapter *adapter, u8 status,
			      __le16 vlan, struct sk_buff *skb)
{
	u16 vid;

	skb->protocol = eth_type_trans(skb, adapter->netdev);

	if (!(status & E1000_RXD_STAT_VP))
		goto deliver;

	/* hardware stripped a VLAN tag: hand its id to the stack */
	vid = le16_to_cpu(vlan) & E1000_RXD_SPC_VLAN_MASK;
	__vlan_hwaccel_put_tag(skb, htons(ETH_P_8021Q), vid);

deliver:
	napi_gro_receive(&adapter->napi, skb);
}

4007 4008 4009 4010 4011 4012 4013 4014 4015 4016 4017 4018 4019 4020 4021 4022 4023 4024 4025 4026 4027 4028 4029 4030 4031 4032 4033 4034 4035 4036 4037 4038 4039 4040 4041 4042 4043 4044 4045 4046 4047 4048 4049 4050 4051 4052 4053 4054 4055 4056 4057 4058 4059 4060 4061 4062 4063 4064 4065 4066 4067 4068 4069 4070 4071 4072 4073 4074 4075 4076 4077 4078 4079 4080 4081 4082 4083
/**
 * e1000_tbi_adjust_stats
 * @hw: Struct containing variables accessed by shared code
 * @stats: statistics counters to correct
 * @frame_len: The length of the frame in question
 * @mac_addr: The Ethernet destination address of the frame in question
 *
 * Adjusts the statistic counters when a frame is accepted by TBI_ACCEPT
 */
static void e1000_tbi_adjust_stats(struct e1000_hw *hw,
				   struct e1000_hw_stats *stats,
				   u32 frame_len, const u8 *mac_addr)
{
	bool gorcl_high_bit_was_set;

	/* The frame is one byte shorter than what was reported. */
	frame_len--;

	/* The hardware counted this packet as a CRC error and not as a good
	 * packet; undo the former and record the latter.
	 */
	stats->crcerrs--;
	stats->gprc++;

	/* Adjust the Good Octets received counters.  Gorcl holds the low
	 * 32 bits; when its top bit was one before the addition and is zero
	 * afterwards, the carry was lost and must be added to Gorch.
	 */
	gorcl_high_bit_was_set = (stats->gorcl & 0x80000000) != 0;
	stats->gorcl += frame_len;
	if (gorcl_high_bit_was_set && !(stats->gorcl & 0x80000000))
		stats->gorch++;

	/* Broadcast must be tested first: a broadcast address also passes
	 * the multicast test.
	 */
	if (is_broadcast_ether_addr(mac_addr))
		stats->bprc++;
	else if (is_multicast_ether_addr(mac_addr))
		stats->mprc++;

	/* The hardware has overcounted the number of oversize frames. */
	if (frame_len == hw->max_frame_size && stats->roc > 0)
		stats->roc--;

	/* Adjust the bin counters when the extra byte put the frame in the
	 * wrong bin. Remember that the frame_len was adjusted above.
	 */
	switch (frame_len) {
	case 64:
		stats->prc64++;
		stats->prc127--;
		break;
	case 127:
		stats->prc127++;
		stats->prc255--;
		break;
	case 255:
		stats->prc255++;
		stats->prc511--;
		break;
	case 511:
		stats->prc511++;
		stats->prc1023--;
		break;
	case 1023:
		stats->prc1023++;
		stats->prc1522--;
		break;
	case 1522:
		stats->prc1522++;
		break;
	default:
		break;
	}
}

4084 4085 4086 4087 4088 4089 4090 4091 4092 4093 4094 4095 4096 4097 4098 4099 4100 4101 4102 4103
/* Decide whether a frame that the hardware flagged with an error should
 * still be accepted under the TBI_ACCEPT rule, which is evaluated on the
 * descriptor status/errors, the frame length and the frame's last byte.
 *
 * @adapter: board private structure
 * @status:  descriptor status field
 * @errors:  descriptor errors field
 * @length:  number of valid bytes at @data
 * @data:    start of the received frame
 *
 * When the frame is accepted the statistics are corrected under
 * adapter->stats_lock and true is returned; otherwise false.
 */
static bool e1000_tbi_should_accept(struct e1000_adapter *adapter,
				    u8 status, u8 errors,
				    u32 length, const u8 *data)
{
	struct e1000_hw *hw = &adapter->hw;
	unsigned long irq_flags;
	u8 last_byte;

	/* An empty frame has no last byte to inspect; reading data[-1]
	 * would touch memory in front of the buffer.
	 */
	if (unlikely(!length))
		return false;

	last_byte = data[length - 1];
	if (!TBI_ACCEPT(hw, status, errors, length, last_byte))
		return false;

	spin_lock_irqsave(&adapter->stats_lock, irq_flags);
	e1000_tbi_adjust_stats(hw, &adapter->stats, length, data);
	spin_unlock_irqrestore(&adapter->stats_lock, irq_flags);

	return true;
}

4104 4105 4106
static struct sk_buff *e1000_alloc_rx_skb(struct e1000_adapter *adapter,
					  unsigned int bufsz)
{
4107
	struct sk_buff *skb = napi_alloc_skb(&adapter->napi, bufsz);
4108 4109 4110 4111 4112 4113

	if (unlikely(!skb))
		adapter->alloc_rx_buff_failed++;
	return skb;
}

4114 4115 4116 4117 4118 4119 4120 4121 4122 4123 4124 4125 4126 4127 4128 4129 4130
/**
 * e1000_clean_jumbo_rx_irq - Send received data up the network stack; legacy
 * @adapter: board private structure
 * @rx_ring: ring to clean
 * @work_done: amount of napi work completed this call
 * @work_to_do: max amount of work allowed for this call to do
 *
 * the return value indicates whether actual cleaning was done, there
 * is no guarantee that everything was cleaned
 */
static bool e1000_clean_jumbo_rx_irq(struct e1000_adapter *adapter,
				     struct e1000_rx_ring *rx_ring,
				     int *work_done, int work_to_do)
{
	struct net_device *netdev = adapter->netdev;
	struct pci_dev *pdev = adapter->pdev;
	struct e1000_rx_desc *rx_desc, *next_rxd;
4131
	struct e1000_rx_buffer *buffer_info, *next_buffer;
4132 4133 4134 4135 4136 4137 4138 4139 4140 4141 4142 4143 4144 4145 4146 4147 4148
	u32 length;
	unsigned int i;
	int cleaned_count = 0;
	bool cleaned = false;
	unsigned int total_rx_bytes=0, total_rx_packets=0;

	i = rx_ring->next_to_clean;
	rx_desc = E1000_RX_DESC(*rx_ring, i);
	buffer_info = &rx_ring->buffer_info[i];

	while (rx_desc->status & E1000_RXD_STAT_DD) {
		struct sk_buff *skb;
		u8 status;

		if (*work_done >= work_to_do)
			break;
		(*work_done)++;
4149
		rmb(); /* read descriptor and rx_buffer_info after status DD */
4150 4151 4152 4153 4154 4155 4156 4157 4158 4159 4160

		status = rx_desc->status;

		if (++i == rx_ring->count) i = 0;
		next_rxd = E1000_RX_DESC(*rx_ring, i);
		prefetch(next_rxd);

		next_buffer = &rx_ring->buffer_info[i];

		cleaned = true;
		cleaned_count++;
4161
		dma_unmap_page(&pdev->dev, buffer_info->dma,
4162
			       adapter->rx_buffer_len, DMA_FROM_DEVICE);
4163 4164 4165 4166 4167 4168 4169
		buffer_info->dma = 0;

		length = le16_to_cpu(rx_desc->length);

		/* errors is only valid for DD + EOP descriptors */
		if (unlikely((status & E1000_RXD_STAT_EOP) &&
		    (rx_desc->errors & E1000_RXD_ERR_FRAME_ERR_MASK))) {
F
Florian Westphal 已提交
4170
			u8 *mapped = page_address(buffer_info->rxbuf.page);
4171 4172 4173 4174

			if (e1000_tbi_should_accept(adapter, status,
						    rx_desc->errors,
						    length, mapped)) {
4175
				length--;
4176 4177
			} else if (netdev->features & NETIF_F_RXALL) {
				goto process_skb;
4178 4179
			} else {
				/* an error means any chain goes out the window
4180 4181
				 * too
				 */
4182 4183 4184 4185 4186 4187 4188 4189
				if (rx_ring->rx_skb_top)
					dev_kfree_skb(rx_ring->rx_skb_top);
				rx_ring->rx_skb_top = NULL;
				goto next_desc;
			}
		}

#define rxtop rx_ring->rx_skb_top
B
Ben Greear 已提交
4190
process_skb:
4191 4192 4193 4194
		if (!(status & E1000_RXD_STAT_EOP)) {
			/* this descriptor is only the beginning (or middle) */
			if (!rxtop) {
				/* this is the beginning of a chain */
4195
				rxtop = napi_get_frags(&adapter->napi);
F
Florian Westphal 已提交
4196 4197 4198 4199 4200
				if (!rxtop)
					break;

				skb_fill_page_desc(rxtop, 0,
						   buffer_info->rxbuf.page,
4201
						   0, length);
4202 4203 4204 4205
			} else {
				/* this is the middle of a chain */
				skb_fill_page_desc(rxtop,
				    skb_shinfo(rxtop)->nr_frags,
F
Florian Westphal 已提交
4206
				    buffer_info->rxbuf.page, 0, length);
4207 4208 4209 4210 4211 4212 4213 4214
			}
			e1000_consume_page(buffer_info, rxtop, length);
			goto next_desc;
		} else {
			if (rxtop) {
				/* end of the chain */
				skb_fill_page_desc(rxtop,
				    skb_shinfo(rxtop)->nr_frags,
F
Florian Westphal 已提交
4215
				    buffer_info->rxbuf.page, 0, length);
4216 4217 4218 4219
				skb = rxtop;
				rxtop = NULL;
				e1000_consume_page(buffer_info, skb, length);
			} else {
F
Florian Westphal 已提交
4220
				struct page *p;
4221
				/* no chain, got EOP, this buf is the packet
4222 4223
				 * copybreak to save the put_page/alloc_page
				 */
F
Florian Westphal 已提交
4224
				p = buffer_info->rxbuf.page;
4225
				if (length <= copybreak) {
4226
					u8 *vaddr;
F
Florian Westphal 已提交
4227

4228 4229 4230 4231 4232 4233 4234
					if (likely(!(netdev->features & NETIF_F_RXFCS)))
						length -= 4;
					skb = e1000_alloc_rx_skb(adapter,
								 length);
					if (!skb)
						break;

F
Florian Westphal 已提交
4235
					vaddr = kmap_atomic(p);
4236 4237
					memcpy(skb_tail_pointer(skb), vaddr,
					       length);
4238
					kunmap_atomic(vaddr);
4239
					/* re-use the page, so don't erase
F
Florian Westphal 已提交
4240
					 * buffer_info->rxbuf.page
4241
					 */
4242
					skb_put(skb, length);
4243 4244 4245 4246 4247 4248 4249 4250 4251 4252
					e1000_rx_checksum(adapter,
							  status | rx_desc->errors << 24,
							  le16_to_cpu(rx_desc->csum), skb);

					total_rx_bytes += skb->len;
					total_rx_packets++;

					e1000_receive_skb(adapter, status,
							  rx_desc->special, skb);
					goto next_desc;
4253
				} else {
4254 4255 4256 4257 4258
					skb = napi_get_frags(&adapter->napi);
					if (!skb) {
						adapter->alloc_rx_buff_failed++;
						break;
					}
F
Florian Westphal 已提交
4259
					skb_fill_page_desc(skb, 0, p, 0,
4260
							   length);
4261
					e1000_consume_page(buffer_info, skb,
4262
							   length);
4263 4264 4265 4266 4267 4268
				}
			}
		}

		/* Receive Checksum Offload XXX recompute due to CRC strip? */
		e1000_rx_checksum(adapter,
4269 4270 4271
				  (u32)(status) |
				  ((u32)(rx_desc->errors) << 24),
				  le16_to_cpu(rx_desc->csum), skb);
4272

B
Ben Greear 已提交
4273 4274 4275
		total_rx_bytes += (skb->len - 4); /* don't count FCS */
		if (likely(!(netdev->features & NETIF_F_RXFCS)))
			pskb_trim(skb, skb->len - 4);
4276 4277
		total_rx_packets++;

4278 4279 4280 4281 4282
		if (status & E1000_RXD_STAT_VP) {
			__le16 vlan = rx_desc->special;
			u16 vid = le16_to_cpu(vlan) & E1000_RXD_SPC_VLAN_MASK;

			__vlan_hwaccel_put_tag(skb, htons(ETH_P_8021Q), vid);
4283 4284
		}

4285
		napi_gro_frags(&adapter->napi);
4286 4287 4288 4289 4290 4291 4292 4293 4294 4295 4296 4297 4298 4299 4300 4301 4302 4303 4304 4305 4306 4307

next_desc:
		rx_desc->status = 0;

		/* return some buffers to hardware, one at a time is too slow */
		if (unlikely(cleaned_count >= E1000_RX_BUFFER_WRITE)) {
			adapter->alloc_rx_buf(adapter, rx_ring, cleaned_count);
			cleaned_count = 0;
		}

		/* use prefetched values */
		rx_desc = next_rxd;
		buffer_info = next_buffer;
	}
	rx_ring->next_to_clean = i;

	cleaned_count = E1000_DESC_UNUSED(rx_ring);
	if (cleaned_count)
		adapter->alloc_rx_buf(adapter, rx_ring, cleaned_count);

	adapter->total_rx_packets += total_rx_packets;
	adapter->total_rx_bytes += total_rx_bytes;
4308 4309
	netdev->stats.rx_bytes += total_rx_bytes;
	netdev->stats.rx_packets += total_rx_packets;
4310 4311 4312
	return cleaned;
}

4313
/* this should improve performance for small packets with large amounts
4314 4315
 * of reassembly being done in the stack
 */
4316
static struct sk_buff *e1000_copybreak(struct e1000_adapter *adapter,
4317
				       struct e1000_rx_buffer *buffer_info,
4318
				       u32 length, const void *data)
4319
{
4320
	struct sk_buff *skb;
4321 4322

	if (length > copybreak)
4323
		return NULL;
4324

4325 4326 4327 4328 4329 4330 4331 4332
	skb = e1000_alloc_rx_skb(adapter, length);
	if (!skb)
		return NULL;

	dma_sync_single_for_cpu(&adapter->pdev->dev, buffer_info->dma,
				length, DMA_FROM_DEVICE);

	memcpy(skb_put(skb, length), data, length);
4333

4334
	return skb;
4335 4336
}

L
Linus Torvalds 已提交
4337
/**
4338
 * e1000_clean_rx_irq - Send received data up the network stack; legacy
L
Linus Torvalds 已提交
4339
 * @adapter: board private structure
4340 4341 4342 4343
 * @rx_ring: ring to clean
 * @work_done: amount of napi work completed this call
 * @work_to_do: max amount of work allowed for this call to do
 */
4344 4345 4346
static bool e1000_clean_rx_irq(struct e1000_adapter *adapter,
			       struct e1000_rx_ring *rx_ring,
			       int *work_done, int work_to_do)
L
Linus Torvalds 已提交
4347 4348 4349
{
	struct net_device *netdev = adapter->netdev;
	struct pci_dev *pdev = adapter->pdev;
4350
	struct e1000_rx_desc *rx_desc, *next_rxd;
4351
	struct e1000_rx_buffer *buffer_info, *next_buffer;
4352
	u32 length;
L
Linus Torvalds 已提交
4353
	unsigned int i;
4354
	int cleaned_count = 0;
J
Joe Perches 已提交
4355
	bool cleaned = false;
J
Jesse Brandeburg 已提交
4356
	unsigned int total_rx_bytes=0, total_rx_packets=0;
L
Linus Torvalds 已提交
4357 4358 4359

	i = rx_ring->next_to_clean;
	rx_desc = E1000_RX_DESC(*rx_ring, i);
4360
	buffer_info = &rx_ring->buffer_info[i];
L
Linus Torvalds 已提交
4361

4362
	while (rx_desc->status & E1000_RXD_STAT_DD) {
4363
		struct sk_buff *skb;
F
Florian Westphal 已提交
4364
		u8 *data;
4365
		u8 status;
4366

J
Jesse Brandeburg 已提交
4367
		if (*work_done >= work_to_do)
L
Linus Torvalds 已提交
4368 4369
			break;
		(*work_done)++;
4370
		rmb(); /* read descriptor and rx_buffer_info after status DD */
4371

4372
		status = rx_desc->status;
4373
		length = le16_to_cpu(rx_desc->length);
4374

F
Florian Westphal 已提交
4375 4376 4377
		data = buffer_info->rxbuf.data;
		prefetch(data);
		skb = e1000_copybreak(adapter, buffer_info, length, data);
4378
		if (!skb) {
F
Florian Westphal 已提交
4379 4380 4381 4382 4383 4384 4385 4386 4387
			unsigned int frag_len = e1000_frag_len(adapter);

			skb = build_skb(data - E1000_HEADROOM, frag_len);
			if (!skb) {
				adapter->alloc_rx_buff_failed++;
				break;
			}

			skb_reserve(skb, E1000_HEADROOM);
4388
			dma_unmap_single(&pdev->dev, buffer_info->dma,
4389 4390
					 adapter->rx_buffer_len,
					 DMA_FROM_DEVICE);
4391
			buffer_info->dma = 0;
F
Florian Westphal 已提交
4392
			buffer_info->rxbuf.data = NULL;
4393
		}
4394

4395 4396
		if (++i == rx_ring->count) i = 0;
		next_rxd = E1000_RX_DESC(*rx_ring, i);
4397 4398
		prefetch(next_rxd);

4399 4400
		next_buffer = &rx_ring->buffer_info[i];

J
Joe Perches 已提交
4401
		cleaned = true;
4402
		cleaned_count++;
L
Linus Torvalds 已提交
4403

4404
		/* !EOP means multiple descriptors were used to store a single
4405 4406 4407 4408 4409 4410 4411 4412 4413
		 * packet, if thats the case we need to toss it.  In fact, we
		 * to toss every packet with the EOP bit clear and the next
		 * frame that _does_ have the EOP bit set, as it is by
		 * definition only a frame fragment
		 */
		if (unlikely(!(status & E1000_RXD_STAT_EOP)))
			adapter->discarding = true;

		if (adapter->discarding) {
4414
			/* All receives must fit into a single buffer */
4415
			netdev_dbg(netdev, "Receive packet consumed multiple buffers\n");
4416
			dev_kfree_skb(skb);
4417 4418
			if (status & E1000_RXD_STAT_EOP)
				adapter->discarding = false;
L
Linus Torvalds 已提交
4419 4420 4421
			goto next_desc;
		}

J
Jesse Brandeburg 已提交
4422
		if (unlikely(rx_desc->errors & E1000_RXD_ERR_FRAME_ERR_MASK)) {
4423 4424
			if (e1000_tbi_should_accept(adapter, status,
						    rx_desc->errors,
F
Florian Westphal 已提交
4425
						    length, data)) {
L
Linus Torvalds 已提交
4426
				length--;
4427 4428
			} else if (netdev->features & NETIF_F_RXALL) {
				goto process_skb;
L
Linus Torvalds 已提交
4429
			} else {
4430
				dev_kfree_skb(skb);
L
Linus Torvalds 已提交
4431 4432
				goto next_desc;
			}
A
Auke Kok 已提交
4433
		}
L
Linus Torvalds 已提交
4434

B
Ben Greear 已提交
4435
process_skb:
B
Ben Greear 已提交
4436
		total_rx_bytes += (length - 4); /* don't count FCS */
J
Jesse Brandeburg 已提交
4437 4438
		total_rx_packets++;

B
Ben Greear 已提交
4439 4440 4441 4442 4443 4444
		if (likely(!(netdev->features & NETIF_F_RXFCS)))
			/* adjust length to remove Ethernet CRC, this must be
			 * done after the TBI_ACCEPT workaround above
			 */
			length -= 4;

F
Florian Westphal 已提交
4445
		if (buffer_info->rxbuf.data == NULL)
4446 4447 4448
			skb_put(skb, length);
		else /* copybreak skb */
			skb_trim(skb, length);
L
Linus Torvalds 已提交
4449 4450

		/* Receive Checksum Offload */
4451
		e1000_rx_checksum(adapter,
4452 4453
				  (u32)(status) |
				  ((u32)(rx_desc->errors) << 24),
D
David S. Miller 已提交
4454
				  le16_to_cpu(rx_desc->csum), skb);
J
Jesse Brandeburg 已提交
4455

4456
		e1000_receive_skb(adapter, status, rx_desc->special, skb);
4457

L
Linus Torvalds 已提交
4458 4459 4460
next_desc:
		rx_desc->status = 0;

4461 4462 4463 4464 4465 4466
		/* return some buffers to hardware, one at a time is too slow */
		if (unlikely(cleaned_count >= E1000_RX_BUFFER_WRITE)) {
			adapter->alloc_rx_buf(adapter, rx_ring, cleaned_count);
			cleaned_count = 0;
		}

4467
		/* use prefetched values */
4468 4469
		rx_desc = next_rxd;
		buffer_info = next_buffer;
L
Linus Torvalds 已提交
4470 4471
	}
	rx_ring->next_to_clean = i;
4472 4473 4474 4475

	cleaned_count = E1000_DESC_UNUSED(rx_ring);
	if (cleaned_count)
		adapter->alloc_rx_buf(adapter, rx_ring, cleaned_count);
4476

J
Jesse Brandeburg 已提交
4477 4478
	adapter->total_rx_packets += total_rx_packets;
	adapter->total_rx_bytes += total_rx_bytes;
4479 4480
	netdev->stats.rx_bytes += total_rx_bytes;
	netdev->stats.rx_packets += total_rx_packets;
4481 4482 4483
	return cleaned;
}

4484 4485 4486 4487 4488 4489 4490 4491
/**
 * e1000_alloc_jumbo_rx_buffers - Replace used jumbo receive buffers
 * @adapter: address of board private structure
 * @rx_ring: pointer to receive ring structure
 * @cleaned_count: number of buffers to allocate this pass
 **/
static void
e1000_alloc_jumbo_rx_buffers(struct e1000_adapter *adapter,
4492
			     struct e1000_rx_ring *rx_ring, int cleaned_count)
4493 4494 4495
{
	struct pci_dev *pdev = adapter->pdev;
	struct e1000_rx_desc *rx_desc;
4496
	struct e1000_rx_buffer *buffer_info;
4497 4498 4499 4500 4501 4502 4503
	unsigned int i;

	i = rx_ring->next_to_use;
	buffer_info = &rx_ring->buffer_info[i];

	while (cleaned_count--) {
		/* allocate a new page if necessary */
F
Florian Westphal 已提交
4504 4505 4506
		if (!buffer_info->rxbuf.page) {
			buffer_info->rxbuf.page = alloc_page(GFP_ATOMIC);
			if (unlikely(!buffer_info->rxbuf.page)) {
4507 4508 4509 4510 4511
				adapter->alloc_rx_buff_failed++;
				break;
			}
		}

4512
		if (!buffer_info->dma) {
4513
			buffer_info->dma = dma_map_page(&pdev->dev,
F
Florian Westphal 已提交
4514 4515
							buffer_info->rxbuf.page, 0,
							adapter->rx_buffer_len,
4516 4517
							DMA_FROM_DEVICE);
			if (dma_mapping_error(&pdev->dev, buffer_info->dma)) {
F
Florian Westphal 已提交
4518 4519
				put_page(buffer_info->rxbuf.page);
				buffer_info->rxbuf.page = NULL;
4520 4521
				buffer_info->dma = 0;
				adapter->alloc_rx_buff_failed++;
F
Florian Westphal 已提交
4522
				break;
4523 4524
			}
		}
4525 4526 4527 4528 4529 4530 4531 4532 4533 4534 4535 4536 4537 4538 4539 4540 4541

		rx_desc = E1000_RX_DESC(*rx_ring, i);
		rx_desc->buffer_addr = cpu_to_le64(buffer_info->dma);

		if (unlikely(++i == rx_ring->count))
			i = 0;
		buffer_info = &rx_ring->buffer_info[i];
	}

	if (likely(rx_ring->next_to_use != i)) {
		rx_ring->next_to_use = i;
		if (unlikely(i-- == 0))
			i = (rx_ring->count - 1);

		/* Force memory writes to complete before letting h/w
		 * know there are new descriptors to fetch.  (Only
		 * applicable for weak-ordered memory model archs,
4542 4543
		 * such as IA-64).
		 */
4544 4545 4546 4547 4548
		wmb();
		writel(i, adapter->hw.hw_addr + rx_ring->rdt);
	}
}

L
Linus Torvalds 已提交
4549
/**
4550
 * e1000_alloc_rx_buffers - Replace used receive buffers; legacy & extended
L
Linus Torvalds 已提交
4551 4552
 * @adapter: address of board private structure
 **/
4553 4554 4555
static void e1000_alloc_rx_buffers(struct e1000_adapter *adapter,
				   struct e1000_rx_ring *rx_ring,
				   int cleaned_count)
L
Linus Torvalds 已提交
4556
{
J
Joe Perches 已提交
4557
	struct e1000_hw *hw = &adapter->hw;
L
Linus Torvalds 已提交
4558 4559
	struct pci_dev *pdev = adapter->pdev;
	struct e1000_rx_desc *rx_desc;
4560
	struct e1000_rx_buffer *buffer_info;
4561
	unsigned int i;
4562
	unsigned int bufsz = adapter->rx_buffer_len;
L
Linus Torvalds 已提交
4563 4564 4565 4566

	i = rx_ring->next_to_use;
	buffer_info = &rx_ring->buffer_info[i];

4567
	while (cleaned_count--) {
F
Florian Westphal 已提交
4568 4569 4570
		void *data;

		if (buffer_info->rxbuf.data)
4571
			goto skip;
4572

F
Florian Westphal 已提交
4573 4574
		data = e1000_alloc_frag(adapter);
		if (!data) {
L
Linus Torvalds 已提交
4575
			/* Better luck next round */
4576
			adapter->alloc_rx_buff_failed++;
L
Linus Torvalds 已提交
4577 4578 4579
			break;
		}

4580
		/* Fix for errata 23, can't cross 64kB boundary */
F
Florian Westphal 已提交
4581 4582
		if (!e1000_check_64k_bound(adapter, data, bufsz)) {
			void *olddata = data;
4583
			e_err(rx_err, "skb align check failed: %u bytes at "
F
Florian Westphal 已提交
4584
			      "%p\n", bufsz, data);
4585
			/* Try again, without freeing the previous */
F
Florian Westphal 已提交
4586
			data = e1000_alloc_frag(adapter);
4587
			/* Failed allocation, critical failure */
F
Florian Westphal 已提交
4588 4589
			if (!data) {
				e1000_free_frag(olddata);
4590
				adapter->alloc_rx_buff_failed++;
L
Linus Torvalds 已提交
4591 4592
				break;
			}
4593

F
Florian Westphal 已提交
4594
			if (!e1000_check_64k_bound(adapter, data, bufsz)) {
L
Linus Torvalds 已提交
4595
				/* give up */
F
Florian Westphal 已提交
4596 4597
				e1000_free_frag(data);
				e1000_free_frag(olddata);
4598
				adapter->alloc_rx_buff_failed++;
F
Florian Westphal 已提交
4599
				break;
L
Linus Torvalds 已提交
4600
			}
4601 4602

			/* Use new allocation */
F
Florian Westphal 已提交
4603
			e1000_free_frag(olddata);
L
Linus Torvalds 已提交
4604
		}
4605
		buffer_info->dma = dma_map_single(&pdev->dev,
F
Florian Westphal 已提交
4606
						  data,
4607
						  adapter->rx_buffer_len,
4608 4609
						  DMA_FROM_DEVICE);
		if (dma_mapping_error(&pdev->dev, buffer_info->dma)) {
F
Florian Westphal 已提交
4610
			e1000_free_frag(data);
4611 4612
			buffer_info->dma = 0;
			adapter->alloc_rx_buff_failed++;
F
Florian Westphal 已提交
4613
			break;
4614
		}
L
Linus Torvalds 已提交
4615

4616
		/* XXX if it was allocated cleanly it will never map to a
4617 4618 4619
		 * boundary crossing
		 */

4620 4621 4622 4623
		/* Fix for errata 23, can't cross 64kB boundary */
		if (!e1000_check_64k_bound(adapter,
					(void *)(unsigned long)buffer_info->dma,
					adapter->rx_buffer_len)) {
4624 4625
			e_err(rx_err, "dma align check failed: %u bytes at "
			      "%p\n", adapter->rx_buffer_len,
4626
			      (void *)(unsigned long)buffer_info->dma);
L
Linus Torvalds 已提交
4627

4628
			dma_unmap_single(&pdev->dev, buffer_info->dma,
L
Linus Torvalds 已提交
4629
					 adapter->rx_buffer_len,
4630
					 DMA_FROM_DEVICE);
F
Florian Westphal 已提交
4631 4632 4633

			e1000_free_frag(data);
			buffer_info->rxbuf.data = NULL;
J
Jesse Brandeburg 已提交
4634
			buffer_info->dma = 0;
L
Linus Torvalds 已提交
4635

4636
			adapter->alloc_rx_buff_failed++;
F
Florian Westphal 已提交
4637
			break;
L
Linus Torvalds 已提交
4638
		}
F
Florian Westphal 已提交
4639 4640
		buffer_info->rxbuf.data = data;
 skip:
L
Linus Torvalds 已提交
4641 4642 4643
		rx_desc = E1000_RX_DESC(*rx_ring, i);
		rx_desc->buffer_addr = cpu_to_le64(buffer_info->dma);

J
Jesse Brandeburg 已提交
4644 4645
		if (unlikely(++i == rx_ring->count))
			i = 0;
L
Linus Torvalds 已提交
4646 4647 4648
		buffer_info = &rx_ring->buffer_info[i];
	}

4649 4650 4651 4652 4653 4654 4655 4656
	if (likely(rx_ring->next_to_use != i)) {
		rx_ring->next_to_use = i;
		if (unlikely(i-- == 0))
			i = (rx_ring->count - 1);

		/* Force memory writes to complete before letting h/w
		 * know there are new descriptors to fetch.  (Only
		 * applicable for weak-ordered memory model archs,
4657 4658
		 * such as IA-64).
		 */
4659
		wmb();
J
Joe Perches 已提交
4660
		writel(i, hw->hw_addr + rx_ring->rdt);
4661
	}
L
Linus Torvalds 已提交
4662 4663 4664 4665 4666 4667
}

/**
 * e1000_smartspeed - Workaround for SmartSpeed on 82541 and 82547 controllers.
 * @adapter:
 **/
4668
static void e1000_smartspeed(struct e1000_adapter *adapter)
L
Linus Torvalds 已提交
4669
{
J
Joe Perches 已提交
4670
	struct e1000_hw *hw = &adapter->hw;
4671 4672
	u16 phy_status;
	u16 phy_ctrl;
L
Linus Torvalds 已提交
4673

J
Joe Perches 已提交
4674 4675
	if ((hw->phy_type != e1000_phy_igp) || !hw->autoneg ||
	   !(hw->autoneg_advertised & ADVERTISE_1000_FULL))
L
Linus Torvalds 已提交
4676 4677
		return;

J
Jesse Brandeburg 已提交
4678
	if (adapter->smartspeed == 0) {
L
Linus Torvalds 已提交
4679
		/* If Master/Slave config fault is asserted twice,
4680 4681
		 * we assume back-to-back
		 */
J
Joe Perches 已提交
4682
		e1000_read_phy_reg(hw, PHY_1000T_STATUS, &phy_status);
J
Jesse Brandeburg 已提交
4683
		if (!(phy_status & SR_1000T_MS_CONFIG_FAULT)) return;
J
Joe Perches 已提交
4684
		e1000_read_phy_reg(hw, PHY_1000T_STATUS, &phy_status);
J
Jesse Brandeburg 已提交
4685
		if (!(phy_status & SR_1000T_MS_CONFIG_FAULT)) return;
J
Joe Perches 已提交
4686
		e1000_read_phy_reg(hw, PHY_1000T_CTRL, &phy_ctrl);
J
Jesse Brandeburg 已提交
4687
		if (phy_ctrl & CR_1000T_MS_ENABLE) {
L
Linus Torvalds 已提交
4688
			phy_ctrl &= ~CR_1000T_MS_ENABLE;
J
Joe Perches 已提交
4689
			e1000_write_phy_reg(hw, PHY_1000T_CTRL,
L
Linus Torvalds 已提交
4690 4691
					    phy_ctrl);
			adapter->smartspeed++;
J
Joe Perches 已提交
4692 4693
			if (!e1000_phy_setup_autoneg(hw) &&
			   !e1000_read_phy_reg(hw, PHY_CTRL,
4694
					       &phy_ctrl)) {
L
Linus Torvalds 已提交
4695 4696
				phy_ctrl |= (MII_CR_AUTO_NEG_EN |
					     MII_CR_RESTART_AUTO_NEG);
J
Joe Perches 已提交
4697
				e1000_write_phy_reg(hw, PHY_CTRL,
L
Linus Torvalds 已提交
4698 4699 4700 4701
						    phy_ctrl);
			}
		}
		return;
J
Jesse Brandeburg 已提交
4702
	} else if (adapter->smartspeed == E1000_SMARTSPEED_DOWNSHIFT) {
L
Linus Torvalds 已提交
4703
		/* If still no link, perhaps using 2/3 pair cable */
J
Joe Perches 已提交
4704
		e1000_read_phy_reg(hw, PHY_1000T_CTRL, &phy_ctrl);
L
Linus Torvalds 已提交
4705
		phy_ctrl |= CR_1000T_MS_ENABLE;
J
Joe Perches 已提交
4706 4707 4708
		e1000_write_phy_reg(hw, PHY_1000T_CTRL, phy_ctrl);
		if (!e1000_phy_setup_autoneg(hw) &&
		   !e1000_read_phy_reg(hw, PHY_CTRL, &phy_ctrl)) {
L
Linus Torvalds 已提交
4709 4710
			phy_ctrl |= (MII_CR_AUTO_NEG_EN |
				     MII_CR_RESTART_AUTO_NEG);
J
Joe Perches 已提交
4711
			e1000_write_phy_reg(hw, PHY_CTRL, phy_ctrl);
L
Linus Torvalds 已提交
4712 4713 4714
		}
	}
	/* Restart process after E1000_SMARTSPEED_MAX iterations */
J
Jesse Brandeburg 已提交
4715
	if (adapter->smartspeed++ == E1000_SMARTSPEED_MAX)
L
Linus Torvalds 已提交
4716 4717 4718 4719 4720 4721 4722 4723 4724
		adapter->smartspeed = 0;
}

/**
 * e1000_ioctl -
 * @netdev:
 * @ifreq:
 * @cmd:
 **/
4725
static int e1000_ioctl(struct net_device *netdev, struct ifreq *ifr, int cmd)
L
Linus Torvalds 已提交
4726 4727 4728 4729 4730 4731 4732 4733 4734 4735 4736 4737 4738 4739 4740 4741 4742
{
	switch (cmd) {
	case SIOCGMIIPHY:
	case SIOCGMIIREG:
	case SIOCSMIIREG:
		return e1000_mii_ioctl(netdev, ifr, cmd);
	default:
		return -EOPNOTSUPP;
	}
}

/**
 * e1000_mii_ioctl -
 * @netdev:
 * @ifreq:
 * @cmd:
 **/
4743 4744
static int e1000_mii_ioctl(struct net_device *netdev, struct ifreq *ifr,
			   int cmd)
L
Linus Torvalds 已提交
4745
{
4746
	struct e1000_adapter *adapter = netdev_priv(netdev);
J
Joe Perches 已提交
4747
	struct e1000_hw *hw = &adapter->hw;
L
Linus Torvalds 已提交
4748 4749
	struct mii_ioctl_data *data = if_mii(ifr);
	int retval;
4750
	u16 mii_reg;
4751
	unsigned long flags;
L
Linus Torvalds 已提交
4752

J
Joe Perches 已提交
4753
	if (hw->media_type != e1000_media_type_copper)
L
Linus Torvalds 已提交
4754 4755 4756 4757
		return -EOPNOTSUPP;

	switch (cmd) {
	case SIOCGMIIPHY:
J
Joe Perches 已提交
4758
		data->phy_id = hw->phy_addr;
L
Linus Torvalds 已提交
4759 4760
		break;
	case SIOCGMIIREG:
4761
		spin_lock_irqsave(&adapter->stats_lock, flags);
J
Joe Perches 已提交
4762
		if (e1000_read_phy_reg(hw, data->reg_num & 0x1F,
4763 4764
				   &data->val_out)) {
			spin_unlock_irqrestore(&adapter->stats_lock, flags);
L
Linus Torvalds 已提交
4765
			return -EIO;
4766 4767
		}
		spin_unlock_irqrestore(&adapter->stats_lock, flags);
L
Linus Torvalds 已提交
4768 4769
		break;
	case SIOCSMIIREG:
J
Jesse Brandeburg 已提交
4770
		if (data->reg_num & ~(0x1F))
L
Linus Torvalds 已提交
4771 4772
			return -EFAULT;
		mii_reg = data->val_in;
4773
		spin_lock_irqsave(&adapter->stats_lock, flags);
J
Joe Perches 已提交
4774
		if (e1000_write_phy_reg(hw, data->reg_num,
4775 4776
					mii_reg)) {
			spin_unlock_irqrestore(&adapter->stats_lock, flags);
L
Linus Torvalds 已提交
4777
			return -EIO;
4778
		}
4779
		spin_unlock_irqrestore(&adapter->stats_lock, flags);
J
Joe Perches 已提交
4780
		if (hw->media_type == e1000_media_type_copper) {
L
Linus Torvalds 已提交
4781 4782
			switch (data->reg_num) {
			case PHY_CTRL:
J
Jesse Brandeburg 已提交
4783
				if (mii_reg & MII_CR_POWER_DOWN)
L
Linus Torvalds 已提交
4784
					break;
J
Jesse Brandeburg 已提交
4785
				if (mii_reg & MII_CR_AUTO_NEG_EN) {
J
Joe Perches 已提交
4786 4787
					hw->autoneg = 1;
					hw->autoneg_advertised = 0x2F;
L
Linus Torvalds 已提交
4788
				} else {
4789
					u32 speed;
L
Linus Torvalds 已提交
4790
					if (mii_reg & 0x40)
4791
						speed = SPEED_1000;
L
Linus Torvalds 已提交
4792
					else if (mii_reg & 0x2000)
4793
						speed = SPEED_100;
L
Linus Torvalds 已提交
4794
					else
4795 4796 4797 4798 4799 4800
						speed = SPEED_10;
					retval = e1000_set_spd_dplx(
						adapter, speed,
						((mii_reg & 0x100)
						 ? DUPLEX_FULL :
						 DUPLEX_HALF));
4801
					if (retval)
L
Linus Torvalds 已提交
4802 4803
						return retval;
				}
4804 4805 4806
				if (netif_running(adapter->netdev))
					e1000_reinit_locked(adapter);
				else
L
Linus Torvalds 已提交
4807 4808 4809 4810
					e1000_reset(adapter);
				break;
			case M88E1000_PHY_SPEC_CTRL:
			case M88E1000_EXT_PHY_SPEC_CTRL:
J
Joe Perches 已提交
4811
				if (e1000_phy_reset(hw))
L
Linus Torvalds 已提交
4812 4813 4814 4815 4816 4817
					return -EIO;
				break;
			}
		} else {
			switch (data->reg_num) {
			case PHY_CTRL:
J
Jesse Brandeburg 已提交
4818
				if (mii_reg & MII_CR_POWER_DOWN)
L
Linus Torvalds 已提交
4819
					break;
4820 4821 4822
				if (netif_running(adapter->netdev))
					e1000_reinit_locked(adapter);
				else
L
Linus Torvalds 已提交
4823 4824 4825 4826 4827 4828 4829 4830 4831 4832 4833
					e1000_reset(adapter);
				break;
			}
		}
		break;
	default:
		return -EOPNOTSUPP;
	}
	return E1000_SUCCESS;
}

4834
void e1000_pci_set_mwi(struct e1000_hw *hw)
L
Linus Torvalds 已提交
4835 4836
{
	struct e1000_adapter *adapter = hw->back;
4837
	int ret_val = pci_set_mwi(adapter->pdev);
L
Linus Torvalds 已提交
4838

J
Jesse Brandeburg 已提交
4839
	if (ret_val)
4840
		e_err(probe, "Error in setting MWI\n");
L
Linus Torvalds 已提交
4841 4842
}

4843
void e1000_pci_clear_mwi(struct e1000_hw *hw)
L
Linus Torvalds 已提交
4844 4845 4846 4847 4848 4849
{
	struct e1000_adapter *adapter = hw->back;

	pci_clear_mwi(adapter->pdev);
}

4850
int e1000_pcix_get_mmrbc(struct e1000_hw *hw)
4851 4852 4853 4854 4855
{
	struct e1000_adapter *adapter = hw->back;
	return pcix_get_mmrbc(adapter->pdev);
}

4856
void e1000_pcix_set_mmrbc(struct e1000_hw *hw, int mmrbc)
4857 4858 4859 4860 4861
{
	struct e1000_adapter *adapter = hw->back;
	pcix_set_mmrbc(adapter->pdev, mmrbc);
}

4862
/* Write the 32-bit @value to I/O port @port.  @hw is not used by this
 * function.
 */
void e1000_io_write(struct e1000_hw *hw, unsigned long port, u32 value)
{
	outl(value, port);
}

J
Jiri Pirko 已提交
4867 4868 4869 4870 4871 4872 4873 4874 4875
static bool e1000_vlan_used(struct e1000_adapter *adapter)
{
	u16 vid;

	for_each_set_bit(vid, adapter->active_vlans, VLAN_N_VID)
		return true;
	return false;
}

4876 4877 4878 4879 4880 4881 4882
/* Make the VME bit in CTRL follow NETIF_F_HW_VLAN_CTAG_RX in @features:
 * set enables VLAN tag insert/strip, clear disables it.  Interrupt
 * masking is not touched here.
 */
static void __e1000_vlan_mode(struct e1000_adapter *adapter,
			      netdev_features_t features)
{
	struct e1000_hw *hw = &adapter->hw;
	u32 ctrl = er32(CTRL);

	/* start from "disabled" and turn it on only when requested */
	ctrl &= ~E1000_CTRL_VME;
	if (features & NETIF_F_HW_VLAN_CTAG_RX)
		ctrl |= E1000_CTRL_VME;

	ew32(CTRL, ctrl);
}
J
Jiri Pirko 已提交
4892 4893
/* Switch VLAN receive filtering on or off in RCTL.
 *
 * The VME setting is first refreshed from the netdev's current features.
 * When turning filtering on, CFIEN is cleared and VFE is set unless the
 * interface is promiscuous, then the management VLAN is updated.  When
 * turning it off, VFE is cleared.  Interrupts are masked around the
 * register updates unless the adapter is flagged as down.
 */
static void e1000_vlan_filter_on_off(struct e1000_adapter *adapter,
				     bool filter_on)
{
	struct e1000_hw *hw = &adapter->hw;
	u32 rctl;

	if (!test_bit(__E1000_DOWN, &adapter->flags))
		e1000_irq_disable(adapter);

	__e1000_vlan_mode(adapter, adapter->netdev->features);

	rctl = er32(RCTL);
	if (filter_on) {
		/* enable VLAN receive filtering */
		rctl &= ~E1000_RCTL_CFIEN;
		if (!(adapter->netdev->flags & IFF_PROMISC))
			rctl |= E1000_RCTL_VFE;
	} else {
		/* disable VLAN receive filtering */
		rctl &= ~E1000_RCTL_VFE;
	}
	ew32(RCTL, rctl);

	if (filter_on)
		e1000_update_mng_vlan(adapter);

	if (!test_bit(__E1000_DOWN, &adapter->flags))
		e1000_irq_enable(adapter);
}

4921
static void e1000_vlan_mode(struct net_device *netdev,
4922
			    netdev_features_t features)
J
Jiri Pirko 已提交
4923 4924 4925 4926 4927 4928
{
	struct e1000_adapter *adapter = netdev_priv(netdev);

	if (!test_bit(__E1000_DOWN, &adapter->flags))
		e1000_irq_disable(adapter);

4929
	__e1000_vlan_mode(adapter, features);
L
Linus Torvalds 已提交
4930

J
Jesse Brandeburg 已提交
4931 4932
	if (!test_bit(__E1000_DOWN, &adapter->flags))
		e1000_irq_enable(adapter);
L
Linus Torvalds 已提交
4933 4934
}

4935 4936
/* Add @vid to the hardware VLAN filter table and to active_vlans.
 *
 * Nothing is done when the management cookie reports VLAN support and
 * @vid is the management VLAN id.  Filtering is switched on first when no
 * VLAN was active before.  @proto is not used.
 *
 * Always returns 0.
 */
static int e1000_vlan_rx_add_vid(struct net_device *netdev,
				 __be16 proto, u16 vid)
{
	struct e1000_adapter *adapter = netdev_priv(netdev);
	struct e1000_hw *hw = &adapter->hw;
	u32 vfta, index;

	if ((hw->mng_cookie.status &
	     E1000_MNG_DHCP_COOKIE_STATUS_VLAN_SUPPORT) &&
	    (vid == adapter->mng_vlan_id))
		return 0;

	if (!e1000_vlan_used(adapter))
		e1000_vlan_filter_on_off(adapter, true);

	/* add VID to filter table: bits 5 and up of the VID select the
	 * 32-bit VFTA word, the low five bits select the bit inside it
	 */
	index = (vid >> 5) & 0x7F;
	vfta = E1000_READ_REG_ARRAY(hw, VFTA, index);
	/* unsigned constant: shifting a signed 1 by 31 is undefined in C */
	vfta |= (1U << (vid & 0x1F));
	e1000_write_vfta(hw, index, vfta);

	set_bit(vid, adapter->active_vlans);

	return 0;
}

4961 4962
/* Remove @vid from the hardware VLAN filter table and from active_vlans,
 * and switch filtering off when no VLAN remains.  @proto is not used.
 *
 * Always returns 0.
 */
static int e1000_vlan_rx_kill_vid(struct net_device *netdev,
				  __be16 proto, u16 vid)
{
	struct e1000_adapter *adapter = netdev_priv(netdev);
	struct e1000_hw *hw = &adapter->hw;
	u32 vfta, index;

	/* NOTE(review): nothing runs between this disable/enable pair; it
	 * is kept as-is because both calls touch the hardware -- confirm
	 * whether it can be dropped.
	 */
	if (!test_bit(__E1000_DOWN, &adapter->flags))
		e1000_irq_disable(adapter);
	if (!test_bit(__E1000_DOWN, &adapter->flags))
		e1000_irq_enable(adapter);

	/* remove VID from filter table: bits 5 and up of the VID select
	 * the 32-bit VFTA word, the low five bits select the bit inside it
	 */
	index = (vid >> 5) & 0x7F;
	vfta = E1000_READ_REG_ARRAY(hw, VFTA, index);
	/* unsigned constant: shifting a signed 1 by 31 is undefined in C */
	vfta &= ~(1U << (vid & 0x1F));
	e1000_write_vfta(hw, index, vfta);

	clear_bit(vid, adapter->active_vlans);

	if (!e1000_vlan_used(adapter))
		e1000_vlan_filter_on_off(adapter, false);

	return 0;
}

4987
static void e1000_restore_vlan(struct e1000_adapter *adapter)
L
Linus Torvalds 已提交
4988
{
J
Jiri Pirko 已提交
4989
	u16 vid;
L
Linus Torvalds 已提交
4990

J
Jiri Pirko 已提交
4991 4992 4993 4994 4995
	if (!e1000_vlan_used(adapter))
		return;

	e1000_vlan_filter_on_off(adapter, true);
	for_each_set_bit(vid, adapter->active_vlans, VLAN_N_VID)
4996
		e1000_vlan_rx_add_vid(adapter->netdev, htons(ETH_P_8021Q), vid);
L
Linus Torvalds 已提交
4997 4998
}

4999
/**
 * e1000_set_spd_dplx - select a forced speed/duplex configuration
 * @adapter: board private structure
 * @spd: requested speed (SPEED_10, SPEED_100 or SPEED_1000)
 * @dplx: requested duplex (DUPLEX_HALF or DUPLEX_FULL)
 *
 * Autoneg is cleared on entry, before validation, so it stays cleared
 * when the request is rejected.  The 10 and 100 Mbps combinations set
 * hw->forced_speed_duplex.  1000/Full re-enables autoneg advertising only
 * 1000 Full.  1000/Half is not supported.  On fiber media only 1000/Full
 * is accepted.  On success hw->mdix is reset to AUTO_ALL_MODES.
 *
 * Return: 0 on success, -EINVAL for an unsupported combination.
 */
int e1000_set_spd_dplx(struct e1000_adapter *adapter, u32 spd, u8 dplx)
{
	struct e1000_hw *hw = &adapter->hw;

	hw->autoneg = 0;

	/* Make sure dplx is at most 1 bit and lsb of speed is not set
	 * for the switch() below to work
	 */
	if ((spd & 1) || (dplx & ~1))
		goto err_inval;

	/* Fiber NICs only allow 1000 Mbps Full duplex: reject the request
	 * when either the speed or the duplex differs from that.
	 */
	if ((hw->media_type == e1000_media_type_fiber) &&
	    (spd != SPEED_1000 || dplx != DUPLEX_FULL))
		goto err_inval;

	switch (spd + dplx) {
	case SPEED_10 + DUPLEX_HALF:
		hw->forced_speed_duplex = e1000_10_half;
		break;
	case SPEED_10 + DUPLEX_FULL:
		hw->forced_speed_duplex = e1000_10_full;
		break;
	case SPEED_100 + DUPLEX_HALF:
		hw->forced_speed_duplex = e1000_100_half;
		break;
	case SPEED_100 + DUPLEX_FULL:
		hw->forced_speed_duplex = e1000_100_full;
		break;
	case SPEED_1000 + DUPLEX_FULL:
		hw->autoneg = 1;
		hw->autoneg_advertised = ADVERTISE_1000_FULL;
		break;
	case SPEED_1000 + DUPLEX_HALF: /* not supported */
	default:
		goto err_inval;
	}

	/* clear MDI, MDI(-X) override is only allowed when autoneg enabled */
	hw->mdix = AUTO_ALL_MODES;

	return 0;

err_inval:
	e_err(probe, "Unsupported Speed/Duplex configuration\n");
	return -EINVAL;
}

5049
/* Common shutdown path: quiesce the interface, program the wake-up
 * registers and disable the PCI device.
 *
 * @pdev: PCI device being shut down
 * @enable_wake: set to true when wake-up filters remain armed or
 *               adapter->en_mng_pt is set, false otherwise
 *
 * Returns 0 on success.  With CONFIG_PM, a pci_save_state() error is
 * returned immediately and *@enable_wake is left unwritten in that case.
 */
static int __e1000_shutdown(struct pci_dev *pdev, bool *enable_wake)
{
	struct net_device *netdev = pci_get_drvdata(pdev);
	struct e1000_adapter *adapter = netdev_priv(netdev);
	struct e1000_hw *hw = &adapter->hw;
	u32 wufc = adapter->wol;
	u32 ctrl, ctrl_ext, rctl, status;
#ifdef CONFIG_PM
	int retval = 0;
#endif

	netif_device_detach(netdev);

	if (netif_running(netdev)) {
		int count = E1000_CHECK_RESET_COUNT;

		/* give a reset in progress a bounded time to finish */
		while (test_bit(__E1000_RESETTING, &adapter->flags) && count--)
			usleep_range(10000, 20000);

		WARN_ON(test_bit(__E1000_RESETTING, &adapter->flags));
		e1000_down(adapter);
	}

#ifdef CONFIG_PM
	retval = pci_save_state(pdev);
	if (retval)
		return retval;
#endif

	/* with link already up, the link-change wake filter is dropped */
	status = er32(STATUS);
	if (status & E1000_STATUS_LU)
		wufc &= ~E1000_WUFC_LNKC;

	if (!wufc) {
		ew32(WUC, 0);
		ew32(WUFC, 0);
	} else {
		e1000_setup_rctl(adapter);
		e1000_set_rx_mode(netdev);

		rctl = er32(RCTL);

		/* turn on all-multi mode if wake on multicast is enabled */
		if (wufc & E1000_WUFC_MC)
			rctl |= E1000_RCTL_MPE;

		/* enable receives in the hardware */
		ew32(RCTL, rctl | E1000_RCTL_EN);

		if (hw->mac_type >= e1000_82540) {
			ctrl = er32(CTRL);
			/* advertise wake from D3Cold */
			#define E1000_CTRL_ADVD3WUC 0x00100000
			/* phy power management enable */
			#define E1000_CTRL_EN_PHY_PWR_MGMT 0x00200000
			ctrl |= E1000_CTRL_ADVD3WUC |
				E1000_CTRL_EN_PHY_PWR_MGMT;
			ew32(CTRL, ctrl);
		}

		if (hw->media_type == e1000_media_type_fiber ||
		    hw->media_type == e1000_media_type_internal_serdes) {
			/* keep the laser running in D3 */
			ctrl_ext = er32(CTRL_EXT);
			ctrl_ext |= E1000_CTRL_EXT_SDP7_DATA;
			ew32(CTRL_EXT, ctrl_ext);
		}

		ew32(WUC, E1000_WUC_PME_EN);
		ew32(WUFC, wufc);
	}

	e1000_release_manageability(adapter);

	/* make sure adapter isn't asleep if manageability is enabled */
	*enable_wake = wufc || adapter->en_mng_pt;

	if (netif_running(netdev))
		e1000_free_irq(adapter);

	pci_disable_device(pdev);

	return 0;
}

5137
#ifdef CONFIG_PM
5138 5139 5140 5141 5142 5143 5144 5145 5146 5147 5148 5149 5150 5151 5152 5153 5154 5155 5156
/* Suspend callback: run the common shutdown path, then either prepare
 * the device to sleep with wake-up armed, or disable wake from D3 and
 * put it into D3hot.  @state is not used.
 *
 * Returns 0 on success or the error from __e1000_shutdown().
 */
static int e1000_suspend(struct pci_dev *pdev, pm_message_t state)
{
	bool wake;
	int retval = __e1000_shutdown(pdev, &wake);

	if (retval)
		return retval;

	if (!wake) {
		pci_wake_from_d3(pdev, false);
		pci_set_power_state(pdev, PCI_D3hot);
		return 0;
	}

	pci_prepare_to_sleep(pdev);
	return 0;
}

5157
static int e1000_resume(struct pci_dev *pdev)
L
Linus Torvalds 已提交
5158 5159
{
	struct net_device *netdev = pci_get_drvdata(pdev);
5160
	struct e1000_adapter *adapter = netdev_priv(netdev);
J
Joe Perches 已提交
5161
	struct e1000_hw *hw = &adapter->hw;
5162
	u32 err;
L
Linus Torvalds 已提交
5163

5164
	pci_set_power_state(pdev, PCI_D0);
5165
	pci_restore_state(pdev);
5166
	pci_save_state(pdev);
T
Taku Izumi 已提交
5167 5168 5169 5170 5171

	if (adapter->need_ioport)
		err = pci_enable_device(pdev);
	else
		err = pci_enable_device_mem(pdev);
5172
	if (err) {
5173
		pr_err("Cannot enable PCI device from suspend\n");
5174 5175
		return err;
	}
5176
	pci_set_master(pdev);
L
Linus Torvalds 已提交
5177

5178 5179
	pci_enable_wake(pdev, PCI_D3hot, 0);
	pci_enable_wake(pdev, PCI_D3cold, 0);
L
Linus Torvalds 已提交
5180

5181 5182 5183 5184 5185
	if (netif_running(netdev)) {
		err = e1000_request_irq(adapter);
		if (err)
			return err;
	}
5186 5187

	e1000_power_up_phy(adapter);
L
Linus Torvalds 已提交
5188
	e1000_reset(adapter);
J
Joe Perches 已提交
5189
	ew32(WUS, ~0);
L
Linus Torvalds 已提交
5190

5191 5192
	e1000_init_manageability(adapter);

J
Jesse Brandeburg 已提交
5193
	if (netif_running(netdev))
L
Linus Torvalds 已提交
5194 5195 5196 5197 5198 5199 5200
		e1000_up(adapter);

	netif_device_attach(netdev);

	return 0;
}
#endif
5201 5202 5203

static void e1000_shutdown(struct pci_dev *pdev)
{
5204 5205 5206 5207 5208 5209 5210 5211
	bool wake;

	__e1000_shutdown(pdev, &wake);

	if (system_state == SYSTEM_POWER_OFF) {
		pci_wake_from_d3(pdev, wake);
		pci_set_power_state(pdev, PCI_D3hot);
	}
5212 5213
}

L
Linus Torvalds 已提交
5214
#ifdef CONFIG_NET_POLL_CONTROLLER
5215
/* Polling 'interrupt' - used by things like netconsole to send skbs
L
Linus Torvalds 已提交
5216 5217 5218
 * without having to re-enable interrupts. It's not called while
 * the interrupt routine is executing.
 */
5219
static void e1000_netpoll(struct net_device *netdev)
L
Linus Torvalds 已提交
5220
{
5221
	struct e1000_adapter *adapter = netdev_priv(netdev);
5222

L
Linus Torvalds 已提交
5223
	disable_irq(adapter->pdev->irq);
5224
	e1000_intr(adapter->pdev->irq, netdev);
L
Linus Torvalds 已提交
5225 5226 5227 5228
	enable_irq(adapter->pdev->irq);
}
#endif

A
Auke Kok 已提交
5229 5230 5231
/**
 * e1000_io_error_detected - called when PCI error is detected
 * @pdev: Pointer to PCI device
5232
 * @state: The current pci connection state
A
Auke Kok 已提交
5233 5234 5235 5236
 *
 * This function is called after a PCI bus error affecting
 * this device has been detected.
 */
5237 5238
static pci_ers_result_t e1000_io_error_detected(struct pci_dev *pdev,
						pci_channel_state_t state)
A
Auke Kok 已提交
5239 5240
{
	struct net_device *netdev = pci_get_drvdata(pdev);
5241
	struct e1000_adapter *adapter = netdev_priv(netdev);
A
Auke Kok 已提交
5242 5243 5244

	netif_device_detach(netdev);

5245 5246 5247
	if (state == pci_channel_io_perm_failure)
		return PCI_ERS_RESULT_DISCONNECT;

A
Auke Kok 已提交
5248 5249
	if (netif_running(netdev))
		e1000_down(adapter);
5250
	pci_disable_device(pdev);
A
Auke Kok 已提交
5251 5252 5253 5254 5255 5256 5257 5258 5259 5260 5261 5262 5263 5264 5265

	/* Request a slot slot reset. */
	return PCI_ERS_RESULT_NEED_RESET;
}

/**
 * e1000_io_slot_reset - called after the pci bus has been reset.
 * @pdev: Pointer to PCI device
 *
 * Restart the card from scratch, as if from a cold-boot. Implementation
 * resembles the first-half of the e1000_resume routine.
 */
static pci_ers_result_t e1000_io_slot_reset(struct pci_dev *pdev)
{
	struct net_device *netdev = pci_get_drvdata(pdev);
5266
	struct e1000_adapter *adapter = netdev_priv(netdev);
J
Joe Perches 已提交
5267
	struct e1000_hw *hw = &adapter->hw;
T
Taku Izumi 已提交
5268
	int err;
A
Auke Kok 已提交
5269

T
Taku Izumi 已提交
5270 5271 5272 5273 5274
	if (adapter->need_ioport)
		err = pci_enable_device(pdev);
	else
		err = pci_enable_device_mem(pdev);
	if (err) {
5275
		pr_err("Cannot re-enable PCI device after reset.\n");
A
Auke Kok 已提交
5276 5277 5278 5279
		return PCI_ERS_RESULT_DISCONNECT;
	}
	pci_set_master(pdev);

5280 5281
	pci_enable_wake(pdev, PCI_D3hot, 0);
	pci_enable_wake(pdev, PCI_D3cold, 0);
A
Auke Kok 已提交
5282 5283

	e1000_reset(adapter);
J
Joe Perches 已提交
5284
	ew32(WUS, ~0);
A
Auke Kok 已提交
5285 5286 5287 5288 5289 5290 5291 5292 5293 5294 5295 5296 5297 5298 5299

	return PCI_ERS_RESULT_RECOVERED;
}

/**
 * e1000_io_resume - called when traffic can start flowing again.
 * @pdev: Pointer to PCI device
 *
 * This callback is called when the error recovery driver tells us that
 * it's OK to resume normal operation. Implementation resembles the
 * second-half of the e1000_resume routine.
 */
static void e1000_io_resume(struct pci_dev *pdev)
{
	struct net_device *netdev = pci_get_drvdata(pdev);
	struct e1000_adapter *adapter = netdev_priv(netdev);

	e1000_init_manageability(adapter);

	/* e1000_up() is only attempted for a running interface; if it fails
	 * the net device is left detached.
	 */
	if (netif_running(netdev) && e1000_up(adapter)) {
		pr_info("can't bring device back up after reset\n");
		return;
	}

	netif_device_attach(netdev);
}

L
Linus Torvalds 已提交
5314
/* e1000_main.c */