be_main.c 132.1 KB
Newer Older
S
Sathya Perla 已提交
1
/*
V
Vasundhara Volam 已提交
2
 * Copyright (C) 2005 - 2014 Emulex
S
Sathya Perla 已提交
3 4 5 6 7 8 9 10
 * All rights reserved.
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License version 2
 * as published by the Free Software Foundation.  The full GNU General
 * Public License is included in this distribution in the file called COPYING.
 *
 * Contact Information:
11
 * linux-drivers@emulex.com
S
Sathya Perla 已提交
12
 *
13 14 15
 * Emulex
 * 3333 Susan Street
 * Costa Mesa, CA 92626
S
Sathya Perla 已提交
16 17
 */

18
#include <linux/prefetch.h>
19
#include <linux/module.h>
S
Sathya Perla 已提交
20
#include "be.h"
21
#include "be_cmds.h"
22
#include <asm/div64.h>
S
Sathya Perla 已提交
23
#include <linux/aer.h>
24
#include <linux/if_bridge.h>
25
#include <net/busy_poll.h>
26
#include <net/vxlan.h>
S
Sathya Perla 已提交
27 28 29 30

MODULE_VERSION(DRV_VER);
MODULE_DEVICE_TABLE(pci, be_dev_ids);
MODULE_DESCRIPTION(DRV_DESC " " DRV_VER);
31
MODULE_AUTHOR("Emulex Corporation");
S
Sathya Perla 已提交
32 33
MODULE_LICENSE("GPL");

34 35 36
/* Module parameter "num_vfs" (defaults to 0 as a zero-initialised static).
 * S_IRUGO grants read-only permission (user/group/other) on the parameter.
 */
static unsigned int num_vfs;
module_param(num_vfs, uint, S_IRUGO);
MODULE_PARM_DESC(num_vfs, "Number of PCI VFs to initialize");
S
Sathya Perla 已提交
37

38 39 40 41
/* Module parameter "rx_frag_size": size of one RX fragment buffer, 2048 by
 * default. S_IRUGO grants read-only permission (user/group/other).
 */
static ushort rx_frag_size = 2048;
module_param(rx_frag_size, ushort, S_IRUGO);
MODULE_PARM_DESC(rx_frag_size, "Size of a fragment that holds rcvd data.");

S
Sathya Perla 已提交
42
static DEFINE_PCI_DEVICE_TABLE(be_dev_ids) = {
43
	{ PCI_DEVICE(BE_VENDOR_ID, BE_DEVICE_ID1) },
44
	{ PCI_DEVICE(BE_VENDOR_ID, BE_DEVICE_ID2) },
45 46
	{ PCI_DEVICE(BE_VENDOR_ID, OC_DEVICE_ID1) },
	{ PCI_DEVICE(BE_VENDOR_ID, OC_DEVICE_ID2) },
47
	{ PCI_DEVICE(EMULEX_VENDOR_ID, OC_DEVICE_ID3)},
48
	{ PCI_DEVICE(EMULEX_VENDOR_ID, OC_DEVICE_ID4)},
49
	{ PCI_DEVICE(EMULEX_VENDOR_ID, OC_DEVICE_ID5)},
50
	{ PCI_DEVICE(EMULEX_VENDOR_ID, OC_DEVICE_ID6)},
S
Sathya Perla 已提交
51 52 53
	{ 0 }
};
MODULE_DEVICE_TABLE(pci, be_dev_ids);
54
/* UE Status Low CSR: one name per table entry (32 entries).
 * NOTE(review): presumably entry N names bit N of the register - confirm
 * against the code that indexes this table.
 */
static const char * const ue_status_low_desc[] = {
	"CEV", "CTX", "DBUF", "ERX",				/*  0 -  3 */
	"Host", "MPU", "NDMA", "PTC ",				/*  4 -  7 */
	"RDMA ", "RXF ", "RXIPS ", "RXULP0 ",			/*  8 - 11 */
	"RXULP1 ", "RXULP2 ", "TIM ", "TPOST ",			/* 12 - 15 */
	"TPRE ", "TXIPS ", "TXULP0 ", "TXULP1 ",		/* 16 - 19 */
	"UC ", "WDMA ", "TXULP2 ", "HOST1 ",			/* 20 - 23 */
	"P0_OB_LINK ", "P1_OB_LINK ", "HOST_GPIO ", "MBOX ",	/* 24 - 27 */
	"AXGMAC0", "AXGMAC1", "JTAG", "MPU_INTPEND"		/* 28 - 31 */
};
/* UE Status High CSR: one name per table entry (32 entries); the last eight
 * entries carry no specific name.
 * NOTE(review): presumably entry N names bit N of the register - confirm
 * against the code that indexes this table.
 */
static const char * const ue_status_hi_desc[] = {
	"LPCMEMHOST", "MGMT_MAC", "PCS0ONLINE", "MPU_IRAM",	/*  0 -  3 */
	"PCS1ONLINE", "PCTL0", "PCTL1", "PMEM",			/*  4 -  7 */
	"RR", "TXPB", "RXPP", "XAUI",				/*  8 - 11 */
	"TXP", "ARM", "IPC", "HOST2",				/* 12 - 15 */
	"HOST3", "HOST4", "HOST5", "HOST6",			/* 16 - 19 */
	"HOST7", "HOST8", "HOST9", "NETC",			/* 20 - 23 */
	"Unknown", "Unknown", "Unknown", "Unknown",		/* 24 - 27 */
	"Unknown", "Unknown", "Unknown", "Unknown"		/* 28 - 31 */
};
S
Sathya Perla 已提交
124

125

S
Sathya Perla 已提交
126 127 128
static void be_queue_free(struct be_adapter *adapter, struct be_queue_info *q)
{
	struct be_dma_mem *mem = &q->dma_mem;
129
	if (mem->va) {
I
Ivan Vecera 已提交
130 131
		dma_free_coherent(&adapter->pdev->dev, mem->size, mem->va,
				  mem->dma);
132 133
		mem->va = NULL;
	}
S
Sathya Perla 已提交
134 135 136
}

/* Reset queue descriptor @q and allocate DMA-coherent memory for @len entries
 * of @entry_size bytes each.
 *
 * Returns 0 on success, -ENOMEM if the DMA allocation fails.
 */
static int be_queue_alloc(struct be_adapter *adapter, struct be_queue_info *q,
			  u16 len, u16 entry_size)
{
	struct be_dma_mem *ring = &q->dma_mem;

	/* Wipes the whole descriptor, including the embedded dma_mem */
	memset(q, 0, sizeof(*q));
	q->entry_size = entry_size;
	q->len = len;

	ring->size = len * entry_size;
	ring->va = dma_zalloc_coherent(&adapter->pdev->dev, ring->size,
				       &ring->dma, GFP_KERNEL);

	return ring->va ? 0 : -ENOMEM;
}

152
/* Enable or disable host interrupts through the HOSTINTR bit of the
 * MEMBAR control register in PCI config space. The register is written only
 * when the requested state differs from the current one.
 */
static void be_reg_intr_set(struct be_adapter *adapter, bool enable)
{
	u32 ctrl;
	bool is_on;

	pci_read_config_dword(adapter->pdev, PCICFG_MEMBAR_CTRL_INT_CTRL_OFFSET,
			      &ctrl);
	is_on = !!(ctrl & MEMBAR_CTRL_INT_CTRL_HOSTINTR_MASK);

	/* Already in the requested state: nothing to write */
	if (is_on == enable)
		return;

	if (enable)
		ctrl |= MEMBAR_CTRL_INT_CTRL_HOSTINTR_MASK;
	else
		ctrl &= ~MEMBAR_CTRL_INT_CTRL_HOSTINTR_MASK;

	pci_write_config_dword(adapter->pdev,
			       PCICFG_MEMBAR_CTRL_INT_CTRL_OFFSET, ctrl);
}

171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186
/* Enable or disable adapter interrupts. The FW command is tried first; if it
 * reports an error the PCI config register is programmed directly instead.
 * Does nothing on Lancer chips or while adapter->eeh_error is set.
 */
static void be_intr_set(struct be_adapter *adapter, bool enable)
{
	/* On lancer interrupts can't be controlled via this register */
	if (lancer_chip(adapter) || adapter->eeh_error)
		return;

	if (be_cmd_intr_set(adapter, enable))
		be_reg_intr_set(adapter, enable);
}

187
/* Ring the RX queue doorbell: tell the adapter that @posted new buffers were
 * posted on RX ring @qid.
 */
static void be_rxq_notify(struct be_adapter *adapter, u16 qid, u16 posted)
{
	u32 db_val = (qid & DB_RQ_RING_ID_MASK) |
		     (posted << DB_RQ_NUM_POSTED_SHIFT);

	/* Write barrier ahead of the doorbell write */
	wmb();
	iowrite32(db_val, adapter->db + DB_RQ_OFFSET);
}

V
Vasundhara Volam 已提交
197 198
/* Ring the TX doorbell of @txo: tell the adapter that @posted WRBs were
 * queued on its TX ring. @posted is masked to the width of the doorbell
 * field.
 */
static void be_txq_notify(struct be_adapter *adapter, struct be_tx_obj *txo,
			  u16 posted)
{
	u32 db_val = (txo->q.id & DB_TXULP_RING_ID_MASK) |
		     ((posted & DB_TXULP_NUM_POSTED_MASK) <<
		      DB_TXULP_NUM_POSTED_SHIFT);

	/* Write barrier ahead of the doorbell write */
	wmb();
	iowrite32(db_val, adapter->db + txo->db_offset);
}

208
/* Ring the event-queue doorbell for EQ @qid.
 * @arm:        set the re-arm bit
 * @clear_int:  set the clear-interrupt bit
 * @num_popped: number of entries consumed, reported to the adapter
 *
 * No doorbell is written while adapter->eeh_error is set.
 */
static void be_eq_notify(struct be_adapter *adapter, u16 qid,
			 bool arm, bool clear_int, u16 num_popped)
{
	u32 db_val;

	if (adapter->eeh_error)
		return;

	/* Ring id is split into a base field and an extension field */
	db_val = qid & DB_EQ_RING_ID_MASK;
	db_val |= (qid & DB_EQ_RING_ID_EXT_MASK) <<
		  DB_EQ_RING_ID_EXT_MASK_SHIFT;

	db_val |= 1 << DB_EQ_EVNT_SHIFT;
	db_val |= num_popped << DB_EQ_NUM_POPPED_SHIFT;
	if (arm)
		db_val |= 1 << DB_EQ_REARM_SHIFT;
	if (clear_int)
		db_val |= 1 << DB_EQ_CLR_SHIFT;

	iowrite32(db_val, adapter->db + DB_EQ_OFFSET);
}

227
/* Ring the completion-queue doorbell for CQ @qid.
 * @arm:        set the re-arm bit
 * @num_popped: number of entries consumed, reported to the adapter
 *
 * No doorbell is written while adapter->eeh_error is set.
 */
void be_cq_notify(struct be_adapter *adapter, u16 qid, bool arm, u16 num_popped)
{
	u32 db_val;

	if (adapter->eeh_error)
		return;

	/* Ring id is split into a base field and an extension field */
	db_val = qid & DB_CQ_RING_ID_MASK;
	db_val |= (qid & DB_CQ_RING_ID_EXT_MASK) <<
		  DB_CQ_RING_ID_EXT_MASK_SHIFT;

	db_val |= num_popped << DB_CQ_NUM_POPPED_SHIFT;
	if (arm)
		db_val |= 1 << DB_CQ_REARM_SHIFT;

	iowrite32(db_val, adapter->db + DB_CQ_OFFSET);
}

static int be_mac_addr_set(struct net_device *netdev, void *p)
{
	struct be_adapter *adapter = netdev_priv(netdev);
246
	struct device *dev = &adapter->pdev->dev;
S
Sathya Perla 已提交
247
	struct sockaddr *addr = p;
248 249 250
	int status;
	u8 mac[ETH_ALEN];
	u32 old_pmac_id = adapter->pmac_id[0], curr_pmac_id = 0;
S
Sathya Perla 已提交
251

252 253 254
	if (!is_valid_ether_addr(addr->sa_data))
		return -EADDRNOTAVAIL;

255 256 257 258 259 260
	/* Proceed further only if, User provided MAC is different
	 * from active MAC
	 */
	if (ether_addr_equal(addr->sa_data, netdev->dev_addr))
		return 0;

261 262 263 264 265
	/* The PMAC_ADD cmd may fail if the VF doesn't have FILTMGMT
	 * privilege or if PF did not provision the new MAC address.
	 * On BE3, this cmd will always fail if the VF doesn't have the
	 * FILTMGMT privilege. This failure is OK, only if the PF programmed
	 * the MAC for the VF.
266
	 */
267 268 269 270 271 272 273 274 275 276 277
	status = be_cmd_pmac_add(adapter, (u8 *)addr->sa_data,
				 adapter->if_handle, &adapter->pmac_id[0], 0);
	if (!status) {
		curr_pmac_id = adapter->pmac_id[0];

		/* Delete the old programmed MAC. This call may fail if the
		 * old MAC was already deleted by the PF driver.
		 */
		if (adapter->pmac_id[0] != old_pmac_id)
			be_cmd_pmac_del(adapter, adapter->if_handle,
					old_pmac_id, 0);
278 279
	}

280 281
	/* Decide if the new MAC is successfully activated only after
	 * querying the FW
282
	 */
283 284
	status = be_cmd_get_active_mac(adapter, curr_pmac_id, mac,
				       adapter->if_handle, true, 0);
285
	if (status)
286
		goto err;
S
Sathya Perla 已提交
287

288 289 290
	/* The MAC change did not happen, either due to lack of privilege
	 * or PF didn't pre-provision.
	 */
291
	if (!ether_addr_equal(addr->sa_data, mac)) {
292 293 294 295
		status = -EPERM;
		goto err;
	}

296
	memcpy(netdev->dev_addr, addr->sa_data, netdev->addr_len);
297
	dev_info(dev, "MAC address changed to %pM\n", mac);
298 299
	return 0;
err:
300
	dev_warn(dev, "MAC address change to %pM failed\n", addr->sa_data);
S
Sathya Perla 已提交
301 302 303
	return status;
}

304 305 306 307 308 309 310
/* BE2 supports only v0 cmd */
static void *hw_stats_from_cmd(struct be_adapter *adapter)
{
	if (BE2_chip(adapter)) {
		struct be_cmd_resp_get_stats_v0 *cmd = adapter->stats_cmd.va;

		return &cmd->hw_stats;
311
	} else if (BE3_chip(adapter)) {
312 313
		struct be_cmd_resp_get_stats_v1 *cmd = adapter->stats_cmd.va;

314 315 316 317
		return &cmd->hw_stats;
	} else {
		struct be_cmd_resp_get_stats_v2 *cmd = adapter->stats_cmd.va;

318 319 320 321 322 323 324 325 326 327 328
		return &cmd->hw_stats;
	}
}

/* BE2 supports only v0 cmd */
static void *be_erx_stats_from_cmd(struct be_adapter *adapter)
{
	if (BE2_chip(adapter)) {
		struct be_hw_stats_v0 *hw_stats = hw_stats_from_cmd(adapter);

		return &hw_stats->erx;
329
	} else if (BE3_chip(adapter)) {
330 331
		struct be_hw_stats_v1 *hw_stats = hw_stats_from_cmd(adapter);

332 333 334 335
		return &hw_stats->erx;
	} else {
		struct be_hw_stats_v2 *hw_stats = hw_stats_from_cmd(adapter);

336 337 338 339 340
		return &hw_stats->erx;
	}
}

static void populate_be_v0_stats(struct be_adapter *adapter)
341
{
342 343 344
	struct be_hw_stats_v0 *hw_stats = hw_stats_from_cmd(adapter);
	struct be_pmem_stats *pmem_sts = &hw_stats->pmem;
	struct be_rxf_stats_v0 *rxf_stats = &hw_stats->rxf;
345
	struct be_port_rxf_stats_v0 *port_stats =
346 347
					&rxf_stats->port[adapter->port_num];
	struct be_drv_stats *drvs = &adapter->drv_stats;
348

349
	be_dws_le_to_cpu(hw_stats, sizeof(*hw_stats));
350 351 352 353 354 355 356 357 358 359 360 361 362 363
	drvs->rx_pause_frames = port_stats->rx_pause_frames;
	drvs->rx_crc_errors = port_stats->rx_crc_errors;
	drvs->rx_control_frames = port_stats->rx_control_frames;
	drvs->rx_in_range_errors = port_stats->rx_in_range_errors;
	drvs->rx_frame_too_long = port_stats->rx_frame_too_long;
	drvs->rx_dropped_runt = port_stats->rx_dropped_runt;
	drvs->rx_ip_checksum_errs = port_stats->rx_ip_checksum_errs;
	drvs->rx_tcp_checksum_errs = port_stats->rx_tcp_checksum_errs;
	drvs->rx_udp_checksum_errs = port_stats->rx_udp_checksum_errs;
	drvs->rxpp_fifo_overflow_drop = port_stats->rx_fifo_overflow;
	drvs->rx_dropped_tcp_length = port_stats->rx_dropped_tcp_length;
	drvs->rx_dropped_too_small = port_stats->rx_dropped_too_small;
	drvs->rx_dropped_too_short = port_stats->rx_dropped_too_short;
	drvs->rx_out_range_errors = port_stats->rx_out_range_errors;
364
	drvs->rx_input_fifo_overflow_drop = port_stats->rx_input_fifo_overflow;
365 366
	drvs->rx_dropped_header_too_small =
		port_stats->rx_dropped_header_too_small;
367 368 369
	drvs->rx_address_filtered =
					port_stats->rx_address_filtered +
					port_stats->rx_vlan_filtered;
370 371 372 373 374 375 376
	drvs->rx_alignment_symbol_errors =
		port_stats->rx_alignment_symbol_errors;

	drvs->tx_pauseframes = port_stats->tx_pauseframes;
	drvs->tx_controlframes = port_stats->tx_controlframes;

	if (adapter->port_num)
377
		drvs->jabber_events = rxf_stats->port1_jabber_events;
378
	else
379
		drvs->jabber_events = rxf_stats->port0_jabber_events;
380 381 382 383
	drvs->rx_drops_no_pbuf = rxf_stats->rx_drops_no_pbuf;
	drvs->rx_drops_no_erx_descr = rxf_stats->rx_drops_no_erx_descr;
	drvs->forwarded_packets = rxf_stats->forwarded_packets;
	drvs->rx_drops_mtu = rxf_stats->rx_drops_mtu;
384 385
	drvs->rx_drops_no_tpre_descr = rxf_stats->rx_drops_no_tpre_descr;
	drvs->rx_drops_too_many_frags = rxf_stats->rx_drops_too_many_frags;
386 387 388
	adapter->drv_stats.eth_red_drops = pmem_sts->eth_red_drops;
}

389
static void populate_be_v1_stats(struct be_adapter *adapter)
390
{
391 392 393
	struct be_hw_stats_v1 *hw_stats = hw_stats_from_cmd(adapter);
	struct be_pmem_stats *pmem_sts = &hw_stats->pmem;
	struct be_rxf_stats_v1 *rxf_stats = &hw_stats->rxf;
394
	struct be_port_rxf_stats_v1 *port_stats =
395 396
					&rxf_stats->port[adapter->port_num];
	struct be_drv_stats *drvs = &adapter->drv_stats;
397

398
	be_dws_le_to_cpu(hw_stats, sizeof(*hw_stats));
399 400
	drvs->pmem_fifo_overflow_drop = port_stats->pmem_fifo_overflow_drop;
	drvs->rx_priority_pause_frames = port_stats->rx_priority_pause_frames;
401 402 403 404 405 406 407 408 409 410 411 412 413 414 415 416 417
	drvs->rx_pause_frames = port_stats->rx_pause_frames;
	drvs->rx_crc_errors = port_stats->rx_crc_errors;
	drvs->rx_control_frames = port_stats->rx_control_frames;
	drvs->rx_in_range_errors = port_stats->rx_in_range_errors;
	drvs->rx_frame_too_long = port_stats->rx_frame_too_long;
	drvs->rx_dropped_runt = port_stats->rx_dropped_runt;
	drvs->rx_ip_checksum_errs = port_stats->rx_ip_checksum_errs;
	drvs->rx_tcp_checksum_errs = port_stats->rx_tcp_checksum_errs;
	drvs->rx_udp_checksum_errs = port_stats->rx_udp_checksum_errs;
	drvs->rx_dropped_tcp_length = port_stats->rx_dropped_tcp_length;
	drvs->rx_dropped_too_small = port_stats->rx_dropped_too_small;
	drvs->rx_dropped_too_short = port_stats->rx_dropped_too_short;
	drvs->rx_out_range_errors = port_stats->rx_out_range_errors;
	drvs->rx_dropped_header_too_small =
		port_stats->rx_dropped_header_too_small;
	drvs->rx_input_fifo_overflow_drop =
		port_stats->rx_input_fifo_overflow_drop;
418
	drvs->rx_address_filtered = port_stats->rx_address_filtered;
419 420
	drvs->rx_alignment_symbol_errors =
		port_stats->rx_alignment_symbol_errors;
421
	drvs->rxpp_fifo_overflow_drop = port_stats->rxpp_fifo_overflow_drop;
422 423
	drvs->tx_pauseframes = port_stats->tx_pauseframes;
	drvs->tx_controlframes = port_stats->tx_controlframes;
424
	drvs->tx_priority_pauseframes = port_stats->tx_priority_pauseframes;
425 426 427 428 429
	drvs->jabber_events = port_stats->jabber_events;
	drvs->rx_drops_no_pbuf = rxf_stats->rx_drops_no_pbuf;
	drvs->rx_drops_no_erx_descr = rxf_stats->rx_drops_no_erx_descr;
	drvs->forwarded_packets = rxf_stats->forwarded_packets;
	drvs->rx_drops_mtu = rxf_stats->rx_drops_mtu;
430 431
	drvs->rx_drops_no_tpre_descr = rxf_stats->rx_drops_no_tpre_descr;
	drvs->rx_drops_too_many_frags = rxf_stats->rx_drops_too_many_frags;
432 433 434
	adapter->drv_stats.eth_red_drops = pmem_sts->eth_red_drops;
}

435 436 437 438 439 440 441 442 443 444 445 446 447 448 449 450 451 452 453 454 455 456 457 458 459 460 461 462 463 464 465 466 467 468 469 470 471 472 473 474 475 476 477 478
/* Copy the v2-layout HW statistics of this adapter's port into
 * adapter->drv_stats. The HW stats buffer is converted from little-endian to
 * CPU byte order in place before it is read. RoCE counters are copied only
 * when be_roce_supported() reports RoCE support.
 */
static void populate_be_v2_stats(struct be_adapter *adapter)
{
	struct be_hw_stats_v2 *hw = hw_stats_from_cmd(adapter);
	struct be_drv_stats *drvs = &adapter->drv_stats;
	struct be_pmem_stats *pmem = &hw->pmem;
	struct be_rxf_stats_v2 *rxf = &hw->rxf;
	struct be_port_rxf_stats_v2 *port = &rxf->port[adapter->port_num];

	be_dws_le_to_cpu(hw, sizeof(*hw));

	/* per-port counters */
	drvs->pmem_fifo_overflow_drop = port->pmem_fifo_overflow_drop;
	drvs->rx_priority_pause_frames = port->rx_priority_pause_frames;
	drvs->rx_pause_frames = port->rx_pause_frames;
	drvs->rx_crc_errors = port->rx_crc_errors;
	drvs->rx_control_frames = port->rx_control_frames;
	drvs->rx_in_range_errors = port->rx_in_range_errors;
	drvs->rx_frame_too_long = port->rx_frame_too_long;
	drvs->rx_dropped_runt = port->rx_dropped_runt;
	drvs->rx_ip_checksum_errs = port->rx_ip_checksum_errs;
	drvs->rx_tcp_checksum_errs = port->rx_tcp_checksum_errs;
	drvs->rx_udp_checksum_errs = port->rx_udp_checksum_errs;
	drvs->rx_dropped_tcp_length = port->rx_dropped_tcp_length;
	drvs->rx_dropped_too_small = port->rx_dropped_too_small;
	drvs->rx_dropped_too_short = port->rx_dropped_too_short;
	drvs->rx_out_range_errors = port->rx_out_range_errors;
	drvs->rx_dropped_header_too_small = port->rx_dropped_header_too_small;
	drvs->rx_input_fifo_overflow_drop = port->rx_input_fifo_overflow_drop;
	drvs->rx_address_filtered = port->rx_address_filtered;
	drvs->rx_alignment_symbol_errors = port->rx_alignment_symbol_errors;
	drvs->rxpp_fifo_overflow_drop = port->rxpp_fifo_overflow_drop;
	drvs->tx_pauseframes = port->tx_pauseframes;
	drvs->tx_controlframes = port->tx_controlframes;
	drvs->tx_priority_pauseframes = port->tx_priority_pauseframes;
	drvs->jabber_events = port->jabber_events;

	/* counters kept at the rxf level */
	drvs->rx_drops_no_pbuf = rxf->rx_drops_no_pbuf;
	drvs->rx_drops_no_erx_descr = rxf->rx_drops_no_erx_descr;
	drvs->forwarded_packets = rxf->forwarded_packets;
	drvs->rx_drops_mtu = rxf->rx_drops_mtu;
	drvs->rx_drops_no_tpre_descr = rxf->rx_drops_no_tpre_descr;
	drvs->rx_drops_too_many_frags = rxf->rx_drops_too_many_frags;

	drvs->eth_red_drops = pmem->eth_red_drops;

	if (!be_roce_supported(adapter))
		return;

	drvs->rx_roce_bytes_lsd = port->roce_bytes_received_lsd;
	drvs->rx_roce_bytes_msd = port->roce_bytes_received_msd;
	drvs->rx_roce_frames = port->roce_frames_received;
	drvs->roce_drops_crc = port->roce_drops_crc;
	drvs->roce_drops_payload_len = port->roce_drops_payload_len;
}

S
Selvin Xavier 已提交
489 490
static void populate_lancer_stats(struct be_adapter *adapter)
{
491

S
Selvin Xavier 已提交
492
	struct be_drv_stats *drvs = &adapter->drv_stats;
493
	struct lancer_pport_stats *pport_stats = pport_stats_from_cmd(adapter);
494 495 496 497 498

	be_dws_le_to_cpu(pport_stats, sizeof(*pport_stats));
	drvs->rx_pause_frames = pport_stats->rx_pause_frames_lo;
	drvs->rx_crc_errors = pport_stats->rx_crc_errors_lo;
	drvs->rx_control_frames = pport_stats->rx_control_frames_lo;
S
Selvin Xavier 已提交
499
	drvs->rx_in_range_errors = pport_stats->rx_in_range_errors;
500
	drvs->rx_frame_too_long = pport_stats->rx_frames_too_long_lo;
S
Selvin Xavier 已提交
501 502 503 504 505 506 507 508 509 510 511 512
	drvs->rx_dropped_runt = pport_stats->rx_dropped_runt;
	drvs->rx_ip_checksum_errs = pport_stats->rx_ip_checksum_errors;
	drvs->rx_tcp_checksum_errs = pport_stats->rx_tcp_checksum_errors;
	drvs->rx_udp_checksum_errs = pport_stats->rx_udp_checksum_errors;
	drvs->rx_dropped_tcp_length =
				pport_stats->rx_dropped_invalid_tcp_length;
	drvs->rx_dropped_too_small = pport_stats->rx_dropped_too_small;
	drvs->rx_dropped_too_short = pport_stats->rx_dropped_too_short;
	drvs->rx_out_range_errors = pport_stats->rx_out_of_range_errors;
	drvs->rx_dropped_header_too_small =
				pport_stats->rx_dropped_header_too_small;
	drvs->rx_input_fifo_overflow_drop = pport_stats->rx_fifo_overflow;
513 514 515
	drvs->rx_address_filtered =
					pport_stats->rx_address_filtered +
					pport_stats->rx_vlan_filtered;
516
	drvs->rx_alignment_symbol_errors = pport_stats->rx_symbol_errors_lo;
S
Selvin Xavier 已提交
517
	drvs->rxpp_fifo_overflow_drop = pport_stats->rx_fifo_overflow;
518 519
	drvs->tx_pauseframes = pport_stats->tx_pause_frames_lo;
	drvs->tx_controlframes = pport_stats->tx_control_frames_lo;
S
Selvin Xavier 已提交
520
	drvs->jabber_events = pport_stats->rx_jabbers;
521 522
	drvs->forwarded_packets = pport_stats->num_forwards_lo;
	drvs->rx_drops_mtu = pport_stats->rx_drops_mtu_lo;
S
Selvin Xavier 已提交
523
	drvs->rx_drops_too_many_frags =
524
				pport_stats->rx_drops_too_many_frags_lo;
S
Selvin Xavier 已提交
525
}
526

527 528 529 530 531 532 533 534 535 536 537 538
/* Fold a new reading @val of a 16-bit counter into the 32-bit accumulator
 * @acc.
 *
 * The low 16 bits of *acc hold the previous reading and the high 16 bits
 * count wrap-arounds. A reading smaller than the previous one is taken to
 * mean the counter wrapped once, so 65536 is added.
 *
 * The lo()/hi() helper macros parenthesise their argument so they stay
 * correct for any expression passed to them.
 */
static void accumulate_16bit_val(u32 *acc, u16 val)
{
#define lo(x)			((x) & 0xFFFF)
#define hi(x)			((x) & 0xFFFF0000)
	bool wrapped = val < lo(*acc);
	u32 newacc = hi(*acc) + val;

	if (wrapped)
		newacc += 65536;
	/* NOTE(review): ACCESS_ONCE presumably keeps the update a single
	 * store for concurrent readers - confirm.
	 */
	ACCESS_ONCE(*acc) = newacc;
}

J
Jingoo Han 已提交
539
/* Record the ERX "drops, no fragments" counter @erx_stat for RX object @rxo.
 * On BEx chips the value is folded into a 32-bit accumulator; on other chips
 * it is stored as-is.
 */
static void populate_erx_stats(struct be_adapter *adapter,
			       struct be_rx_obj *rxo, u32 erx_stat)
{
	if (BEx_chip(adapter)) {
		/* below erx HW counter can actually wrap around after
		 * 65535. Driver accumulates a 32-bit value
		 */
		accumulate_16bit_val(&rx_stats(rxo)->rx_drops_no_frags,
				     (u16)erx_stat);
	} else {
		rx_stats(rxo)->rx_drops_no_frags = erx_stat;
	}
}

552 553
void be_parse_stats(struct be_adapter *adapter)
{
554
	struct be_erx_stats_v2 *erx = be_erx_stats_from_cmd(adapter);
555 556
	struct be_rx_obj *rxo;
	int i;
557
	u32 erx_stat;
558

559 560
	if (lancer_chip(adapter)) {
		populate_lancer_stats(adapter);
S
Selvin Xavier 已提交
561
	} else {
562 563
		if (BE2_chip(adapter))
			populate_be_v0_stats(adapter);
564 565
		else if (BE3_chip(adapter))
			/* for BE3 */
566
			populate_be_v1_stats(adapter);
567 568
		else
			populate_be_v2_stats(adapter);
569

570
		/* erx_v2 is longer than v0, v1. use v2 for v0, v1 access */
571
		for_all_rx_queues(adapter, rxo, i) {
572 573
			erx_stat = erx->rx_drops_no_fragments[rxo->q.id];
			populate_erx_stats(adapter, rxo, erx_stat);
574
		}
575
	}
576 577
}

578
static struct rtnl_link_stats64 *be_get_stats64(struct net_device *netdev,
579
						struct rtnl_link_stats64 *stats)
S
Sathya Perla 已提交
580
{
581
	struct be_adapter *adapter = netdev_priv(netdev);
582
	struct be_drv_stats *drvs = &adapter->drv_stats;
583
	struct be_rx_obj *rxo;
584
	struct be_tx_obj *txo;
585 586
	u64 pkts, bytes;
	unsigned int start;
587
	int i;
S
Sathya Perla 已提交
588

589
	for_all_rx_queues(adapter, rxo, i) {
590 591
		const struct be_rx_stats *rx_stats = rx_stats(rxo);
		do {
592
			start = u64_stats_fetch_begin_irq(&rx_stats->sync);
593 594
			pkts = rx_stats(rxo)->rx_pkts;
			bytes = rx_stats(rxo)->rx_bytes;
595
		} while (u64_stats_fetch_retry_irq(&rx_stats->sync, start));
596 597 598 599 600
		stats->rx_packets += pkts;
		stats->rx_bytes += bytes;
		stats->multicast += rx_stats(rxo)->rx_mcast_pkts;
		stats->rx_dropped += rx_stats(rxo)->rx_drops_no_skbs +
					rx_stats(rxo)->rx_drops_no_frags;
601 602
	}

603
	for_all_tx_queues(adapter, txo, i) {
604 605
		const struct be_tx_stats *tx_stats = tx_stats(txo);
		do {
606
			start = u64_stats_fetch_begin_irq(&tx_stats->sync);
607 608
			pkts = tx_stats(txo)->tx_pkts;
			bytes = tx_stats(txo)->tx_bytes;
609
		} while (u64_stats_fetch_retry_irq(&tx_stats->sync, start));
610 611
		stats->tx_packets += pkts;
		stats->tx_bytes += bytes;
612
	}
S
Sathya Perla 已提交
613 614

	/* bad pkts received */
615
	stats->rx_errors = drvs->rx_crc_errors +
616 617 618 619 620 621 622 623
		drvs->rx_alignment_symbol_errors +
		drvs->rx_in_range_errors +
		drvs->rx_out_range_errors +
		drvs->rx_frame_too_long +
		drvs->rx_dropped_too_small +
		drvs->rx_dropped_too_short +
		drvs->rx_dropped_header_too_small +
		drvs->rx_dropped_tcp_length +
624
		drvs->rx_dropped_runt;
625

S
Sathya Perla 已提交
626
	/* detailed rx errors */
627
	stats->rx_length_errors = drvs->rx_in_range_errors +
628 629
		drvs->rx_out_range_errors +
		drvs->rx_frame_too_long;
630

631
	stats->rx_crc_errors = drvs->rx_crc_errors;
S
Sathya Perla 已提交
632 633

	/* frame alignment errors */
634
	stats->rx_frame_errors = drvs->rx_alignment_symbol_errors;
635

S
Sathya Perla 已提交
636 637
	/* receiver fifo overrun */
	/* drops_no_pbuf is no per i/f, it's per BE card */
638
	stats->rx_fifo_errors = drvs->rxpp_fifo_overflow_drop +
639 640
				drvs->rx_input_fifo_overflow_drop +
				drvs->rx_drops_no_pbuf;
641
	return stats;
S
Sathya Perla 已提交
642 643
}

644
/* Propagate the link state to the net device's carrier state: carrier on for
 * a non-zero @link_status, off otherwise. On the first call the carrier is
 * turned off once and BE_FLAGS_LINK_STATUS_INIT is recorded in
 * adapter->flags.
 */
void be_link_status_update(struct be_adapter *adapter, u8 link_status)
{
	struct net_device *netdev = adapter->netdev;
	bool first_update = !(adapter->flags & BE_FLAGS_LINK_STATUS_INIT);

	if (first_update) {
		netif_carrier_off(netdev);
		adapter->flags |= BE_FLAGS_LINK_STATUS_INIT;
	}

	if (!link_status) {
		netif_carrier_off(netdev);
		return;
	}

	netif_carrier_on(netdev);
}

659
/* Account one transmit request in the TX stats of @txo.
 * @wrb_cnt:  number of WRBs used by the request
 * @copied:   number of bytes queued
 * @gso_segs: GSO segment count; 0 is counted as a single packet
 * @stopped:  true if the request caused a TX stop, counted in tx_stops
 */
static void be_tx_stats_update(struct be_tx_obj *txo,
			       u32 wrb_cnt, u32 copied, u32 gso_segs,
			       bool stopped)
{
	struct be_tx_stats *txs = tx_stats(txo);
	u32 npkts = gso_segs ? gso_segs : 1;

	u64_stats_update_begin(&txs->sync);
	txs->tx_reqs++;
	txs->tx_wrbs += wrb_cnt;
	txs->tx_bytes += copied;
	txs->tx_pkts += npkts;
	if (stopped)
		txs->tx_stops++;
	u64_stats_update_end(&txs->sync);
}

/* Determine number of WRB entries needed to xmit data in an skb */
676
static u32 wrb_cnt_for_skb(struct be_adapter *adapter, struct sk_buff *skb,
677
			   bool *dummy)
S
Sathya Perla 已提交
678
{
679 680 681 682
	int cnt = (skb->len > skb->data_len);

	cnt += skb_shinfo(skb)->nr_frags;

S
Sathya Perla 已提交
683 684
	/* to account for hdr wrb */
	cnt++;
685 686 687
	if (lancer_chip(adapter) || !(cnt & 1)) {
		*dummy = false;
	} else {
S
Sathya Perla 已提交
688 689 690
		/* add a dummy to make it an even num */
		cnt++;
		*dummy = true;
691
	}
S
Sathya Perla 已提交
692 693 694 695 696 697 698 699 700
	BUG_ON(cnt > BE_MAX_TX_FRAG_COUNT);
	return cnt;
}

/* Fill a fragment WRB with DMA address @addr (split into high and low 32-bit
 * halves) and length @len (masked with ETH_WRB_FRAG_LEN_MASK).
 */
static inline void wrb_fill(struct be_eth_wrb *wrb, u64 addr, int len)
{
	wrb->frag_pa_lo = (u32)addr;
	wrb->frag_pa_hi = upper_32_bits(addr);
	wrb->frag_len = len & ETH_WRB_FRAG_LEN_MASK;
	wrb->rsvd0 = 0;
}

704
static inline u16 be_get_tx_vlan_tag(struct be_adapter *adapter,
705
				     struct sk_buff *skb)
706 707 708 709 710 711 712 713 714 715 716 717 718 719
{
	u8 vlan_prio;
	u16 vlan_tag;

	vlan_tag = vlan_tx_tag_get(skb);
	vlan_prio = (vlan_tag & VLAN_PRIO_MASK) >> VLAN_PRIO_SHIFT;
	/* If vlan priority provided by OS is NOT in available bmap */
	if (!(adapter->vlan_prio_bmap & (1 << vlan_prio)))
		vlan_tag = (vlan_tag & ~VLAN_PRIO_MASK) |
				adapter->recommended_prio;

	return vlan_tag;
}

720 721 722 723 724 725 726 727 728 729 730 731 732
/* Used only for IP tunnel packets.
 * Return the protocol field of the inner IPv4 header, or the nexthdr field
 * of the inner IPv6 header when the inner IP version is not 4.
 */
static u16 skb_inner_ip_proto(struct sk_buff *skb)
{
	if (inner_ip_hdr(skb)->version == 4)
		return inner_ip_hdr(skb)->protocol;

	return inner_ipv6_hdr(skb)->nexthdr;
}

/* Return the protocol field of the IPv4 header, or the nexthdr field of the
 * IPv6 header when the IP version is not 4.
 */
static u16 skb_ip_proto(struct sk_buff *skb)
{
	if (ip_hdr(skb)->version == 4)
		return ip_hdr(skb)->protocol;

	return ipv6_hdr(skb)->nexthdr;
}

733
/* Build the header WRB @hdr for transmitting @skb.
 * @wrb_cnt:      number of WRBs in the request, written to num_wrb
 * @len:          total payload length, written to len
 * @skip_hw_vlan: when true the "complete" bit is left clear (see below)
 *
 * Sets the LSO bits for GSO skbs, or the checksum-offload bits for
 * CHECKSUM_PARTIAL skbs, and the VLAN bits when the skb carries a tag.
 */
static void wrb_fill_hdr(struct be_adapter *adapter, struct be_eth_hdr_wrb *hdr,
			 struct sk_buff *skb, u32 wrb_cnt, u32 len,
			 bool skip_hw_vlan)
{
	u16 l4_proto, tag;

	memset(hdr, 0, sizeof(*hdr));

	AMAP_SET_BITS(struct amap_eth_hdr_wrb, crc, hdr, 1);

	if (skb_is_gso(skb)) {
		AMAP_SET_BITS(struct amap_eth_hdr_wrb, lso, hdr, 1);
		AMAP_SET_BITS(struct amap_eth_hdr_wrb, lso_mss,
			      hdr, skb_shinfo(skb)->gso_size);
		if (skb_is_gso_v6(skb) && !lancer_chip(adapter))
			AMAP_SET_BITS(struct amap_eth_hdr_wrb, lso6, hdr, 1);
	} else if (skb->ip_summed == CHECKSUM_PARTIAL) {
		/* Encapsulated pkts: checksum the inner L4 header and also
		 * request IP checksum offload
		 */
		if (skb->encapsulation) {
			AMAP_SET_BITS(struct amap_eth_hdr_wrb, ipcs, hdr, 1);
			l4_proto = skb_inner_ip_proto(skb);
		} else {
			l4_proto = skb_ip_proto(skb);
		}

		switch (l4_proto) {
		case IPPROTO_TCP:
			AMAP_SET_BITS(struct amap_eth_hdr_wrb, tcpcs, hdr, 1);
			break;
		case IPPROTO_UDP:
			AMAP_SET_BITS(struct amap_eth_hdr_wrb, udpcs, hdr, 1);
			break;
		default:
			break;
		}
	}

	if (vlan_tx_tag_present(skb)) {
		AMAP_SET_BITS(struct amap_eth_hdr_wrb, vlan, hdr, 1);
		tag = be_get_tx_vlan_tag(adapter, skb);
		AMAP_SET_BITS(struct amap_eth_hdr_wrb, vlan_tag, hdr, tag);
	}

	/* To skip HW VLAN tagging: evt = 1, compl = 0 */
	AMAP_SET_BITS(struct amap_eth_hdr_wrb, complete, hdr, !skip_hw_vlan);
	AMAP_SET_BITS(struct amap_eth_hdr_wrb, event, hdr, 1);
	AMAP_SET_BITS(struct amap_eth_hdr_wrb, num_wrb, hdr, wrb_cnt);
	AMAP_SET_BITS(struct amap_eth_hdr_wrb, len, hdr, len);
}

I
Ivan Vecera 已提交
775
static void unmap_tx_frag(struct device *dev, struct be_eth_wrb *wrb,
776
			  bool unmap_single)
777 778 779 780 781 782
{
	dma_addr_t dma;

	be_dws_le_to_cpu(wrb, sizeof(*wrb));

	dma = (u64)wrb->frag_pa_hi << 32 | (u64)wrb->frag_pa_lo;
783
	if (wrb->frag_len) {
784
		if (unmap_single)
I
Ivan Vecera 已提交
785 786
			dma_unmap_single(dev, dma, wrb->frag_len,
					 DMA_TO_DEVICE);
787
		else
I
Ivan Vecera 已提交
788
			dma_unmap_page(dev, dma, wrb->frag_len, DMA_TO_DEVICE);
789 790
	}
}
S
Sathya Perla 已提交
791

792
/* DMA-map @skb and queue its WRBs on @txq: one header WRB, one WRB for the
 * linear data (if any), one per page fragment and, when @dummy_wrb is set,
 * one zero-length WRB.
 *
 * Returns the number of bytes mapped. On a DMA mapping error every fragment
 * mapped so far is unmapped again and 0 is returned.
 */
static int make_tx_wrbs(struct be_adapter *adapter, struct be_queue_info *txq,
			struct sk_buff *skb, u32 wrb_cnt, bool dummy_wrb,
			bool skip_hw_vlan)
{
	struct device *dev = &adapter->pdev->dev;
	struct be_eth_hdr_wrb *hdr_wrb;
	struct be_eth_wrb *wrb;
	bool head_mapped = false;
	dma_addr_t busaddr;
	u16 first_frag;
	int total = 0;
	int i;

	/* Reserve the header slot; it is filled last, once the total
	 * length is known
	 */
	hdr_wrb = queue_head_node(txq);
	queue_head_inc(txq);
	first_frag = txq->head;

	/* linear part of the skb */
	if (skb->len > skb->data_len) {
		int linear_len = skb_headlen(skb);

		busaddr = dma_map_single(dev, skb->data, linear_len,
					 DMA_TO_DEVICE);
		if (dma_mapping_error(dev, busaddr))
			goto dma_err;
		head_mapped = true;
		wrb = queue_head_node(txq);
		wrb_fill(wrb, busaddr, linear_len);
		be_dws_cpu_to_le(wrb, sizeof(*wrb));
		queue_head_inc(txq);
		total += linear_len;
	}

	/* page fragments */
	for (i = 0; i < skb_shinfo(skb)->nr_frags; i++) {
		const struct skb_frag_struct *frag = &skb_shinfo(skb)->frags[i];
		unsigned int frag_len = skb_frag_size(frag);

		busaddr = skb_frag_dma_map(dev, frag, 0, frag_len,
					   DMA_TO_DEVICE);
		if (dma_mapping_error(dev, busaddr))
			goto dma_err;
		wrb = queue_head_node(txq);
		wrb_fill(wrb, busaddr, frag_len);
		be_dws_cpu_to_le(wrb, sizeof(*wrb));
		queue_head_inc(txq);
		total += frag_len;
	}

	if (dummy_wrb) {
		wrb = queue_head_node(txq);
		wrb_fill(wrb, 0, 0);
		be_dws_cpu_to_le(wrb, sizeof(*wrb));
		queue_head_inc(txq);
	}

	wrb_fill_hdr(adapter, hdr_wrb, skb, wrb_cnt, total, skip_hw_vlan);
	be_dws_cpu_to_le(hdr_wrb, sizeof(*hdr_wrb));

	return total;

dma_err:
	/* Walk the WRBs filled so far, starting right after the header.
	 * Only the first one can be a dma_map_single() mapping.
	 */
	txq->head = first_frag;
	while (total) {
		wrb = queue_head_node(txq);
		unmap_tx_frag(dev, wrb, head_mapped);
		head_mapped = false;
		total -= wrb->frag_len;
		queue_head_inc(txq);
	}
	return 0;
}

858
/* Insert the VLAN tag(s) for this packet into the packet data itself.
 *
 * The inner tag is the skb's own TX tag when one is present; otherwise, when
 * the QnQ async event has been received and a pvid is configured, the pvid is
 * used. When adapter->qnq_vid is set it is inserted as an additional outer
 * tag. *skip_hw_vlan (if the pointer is non-NULL) is set to true in the pvid
 * and qnq_vid cases.
 *
 * Returns the (possibly reallocated) skb, or NULL if skb_share_check() or
 * __vlan_put_tag() returned NULL.
 */
static struct sk_buff *be_insert_vlan_in_pkt(struct be_adapter *adapter,
					     struct sk_buff *skb,
					     bool *skip_hw_vlan)
{
	u16 tag = 0;

	skb = skb_share_check(skb, GFP_ATOMIC);
	if (unlikely(!skb))
		return NULL;

	if (vlan_tx_tag_present(skb))
		tag = be_get_tx_vlan_tag(adapter, skb);

	if (qnq_async_evt_rcvd(adapter) && adapter->pvid) {
		if (tag == 0)
			tag = adapter->pvid;
		/* f/w workaround: setting skip_hw_vlan informs the F/W to
		 * skip VLAN insertion
		 */
		if (skip_hw_vlan)
			*skip_hw_vlan = true;
	}

	if (tag != 0) {
		skb = __vlan_put_tag(skb, htons(ETH_P_8021Q), tag);
		if (unlikely(!skb))
			return NULL;
		/* the tag now lives in the packet data */
		skb->vlan_tci = 0;
	}

	/* No outer VLAN configured: done */
	if (!adapter->qnq_vid)
		return skb;

	/* Insert the outer VLAN */
	tag = adapter->qnq_vid;
	skb = __vlan_put_tag(skb, htons(ETH_P_8021Q), tag);
	if (unlikely(!skb))
		return NULL;
	if (skip_hw_vlan)
		*skip_hw_vlan = true;

	return skb;
}

901 902 903 904 905 906 907 908 909 910 911 912 913 914 915 916 917 918 919 920 921 922 923 924 925 926 927
/* Returns true for an IPv6 packet whose next header is neither TCP nor UDP
 * and whose 2nd byte following the IPv6 header (the hdrlen field of the
 * first extension header) is 0xff. The headers are read directly from
 * skb->data.
 */
static bool be_ipv6_exthdr_check(struct sk_buff *skb)
{
	struct ethhdr *eh = (struct ethhdr *)skb->data;
	struct ipv6_opt_hdr *ehdr;
	struct ipv6hdr *ip6h;

	if (eh->h_proto != htons(ETH_P_IPV6))
		return false;

	ip6h = (struct ipv6hdr *)(skb->data + ETH_HLEN);
	if (ip6h->nexthdr == NEXTHDR_TCP || ip6h->nexthdr == NEXTHDR_UDP)
		return false;

	/* offending pkt: 2nd byte following IPv6 hdr is 0xff */
	ehdr = (struct ipv6_opt_hdr *)(skb->data + ETH_HLEN +
				       sizeof(struct ipv6hdr));
	return ehdr->hdrlen == 0xff;
}

/* Non-zero when the skb carries a TX VLAN tag or the adapter has a pvid or
 * a qnq_vid configured.
 */
static int be_vlan_tag_tx_chk(struct be_adapter *adapter, struct sk_buff *skb)
{
	if (vlan_tx_tag_present(skb))
		return 1;

	return adapter->pvid || adapter->qnq_vid;
}

928
/* Non-zero when the adapter is a BE3 chip and the skb matches
 * be_ipv6_exthdr_check().
 */
static int be_ipv6_tx_stall_chk(struct be_adapter *adapter, struct sk_buff *skb)
{
	if (!BE3_chip(adapter))
		return 0;

	return be_ipv6_exthdr_check(skb);
}

933 934 935
/* Apply the BEx/Lancer transmit workarounds to an skb.
 *
 * Returns the skb to transmit (it may have been replaced), or NULL when the
 * packet must not be sent. On a NULL return the caller no longer owns an
 * skb: it was either freed here or be_insert_vlan_in_pkt() returned NULL.
 * *skip_hw_vlan is set to true when HW VLAN tagging has to be skipped.
 */
static struct sk_buff *be_lancer_xmit_workarounds(struct be_adapter *adapter,
						  struct sk_buff *skb,
						  bool *skip_hw_vlan)
{
	struct vlan_ethhdr *veh = (struct vlan_ethhdr *)skb->data;
	unsigned int eth_hdr_len = ETH_HLEN;
	struct iphdr *ip;

	if (ntohs(skb->protocol) == ETH_P_8021Q)
		eth_hdr_len = VLAN_ETH_HLEN;

	/* For padded packets, BE HW modifies tot_len field in IP header
	 * incorrectly when VLAN tag is inserted by HW.
	 * For padded packets, Lancer computes incorrect checksum.
	 * So trim such packets to the length given by the IP header.
	 */
	if (skb->len <= 60 &&
	    (lancer_chip(adapter) || vlan_tx_tag_present(skb)) &&
	    is_ipv4_pkt(skb)) {
		ip = (struct iphdr *)ip_hdr(skb);
		pskb_trim(skb, eth_hdr_len + ntohs(ip->tot_len));
	}

	/* If vlan tag is already inlined in the packet, skip HW VLAN
	 * tagging in pvid-tagging mode
	 */
	if (be_pvid_tagging_enabled(adapter) &&
	    veh->h_vlan_proto == htons(ETH_P_8021Q))
		*skip_hw_vlan = true;

	/* HW has a bug wherein it will calculate CSUM for VLAN
	 * pkts even though it is disabled.
	 * Manually insert VLAN in pkt.
	 */
	if (skb->ip_summed != CHECKSUM_PARTIAL && vlan_tx_tag_present(skb)) {
		skb = be_insert_vlan_in_pkt(adapter, skb, skip_hw_vlan);
		if (unlikely(!skb))
			return NULL;
	}

	if (!be_ipv6_tx_stall_chk(adapter, skb))
		return skb;

	/* HW may lockup when VLAN HW tagging is requested on
	 * certain ipv6 packets. Drop such pkts if the HW workaround to
	 * skip HW tagging is not enabled by FW.
	 */
	if (unlikely((adapter->pvid || adapter->qnq_vid) &&
		     !qnq_async_evt_rcvd(adapter))) {
		dev_kfree_skb_any(skb);
		return NULL;
	}

	/* Manual VLAN tag insertion to prevent:
	 * ASIC lockup when the ASIC inserts VLAN tag into
	 * certain ipv6 packets. Insert VLAN tags in driver,
	 * and set event, completion, vlan bits accordingly
	 * in the Tx WRB.
	 */
	if (be_vlan_tag_tx_chk(adapter, skb)) {
		skb = be_insert_vlan_in_pkt(adapter, skb, skip_hw_vlan);
		if (unlikely(!skb))
			return NULL;
	}

	return skb;
}

1001 1002 1003 1004 1005 1006 1007 1008 1009 1010 1011 1012 1013 1014 1015 1016 1017 1018 1019 1020 1021 1022 1023
/* Apply all chip-specific transmit workarounds to an skb.
 *
 * Returns the skb to transmit (it may have been replaced), or NULL when the
 * packet cannot be sent; in that case the skb has already been consumed by
 * skb_padto() or by be_lancer_xmit_workarounds().
 */
static struct sk_buff *be_xmit_workarounds(struct be_adapter *adapter,
					   struct sk_buff *skb,
					   bool *skip_hw_vlan)
{
	/* Lancer, SH-R ASICs have a bug wherein Packets that are 32 bytes or
	 * less may cause a transmit stall on that port. So the work-around is
	 * to pad short packets (<= 32 bytes) to a 36-byte length.
	 */
	if (unlikely(!BEx_chip(adapter) && skb->len <= 32)) {
		/* skb_padto() frees the skb on failure */
		if (skb_padto(skb, 36))
			return NULL;
		/* skb_padto() only zero-fills the padding area; extend the
		 * skb with __skb_put() so that skb->len and skb->tail are
		 * advanced together instead of patching skb->len alone.
		 */
		__skb_put(skb, 36 - skb->len);
	}

	if (BEx_chip(adapter) || lancer_chip(adapter)) {
		skb = be_lancer_xmit_workarounds(adapter, skb, skip_hw_vlan);
		if (!skb)
			return NULL;
	}

	return skb;
}

1024 1025 1026 1027 1028 1029 1030 1031 1032 1033 1034
static netdev_tx_t be_xmit(struct sk_buff *skb, struct net_device *netdev)
{
	struct be_adapter *adapter = netdev_priv(netdev);
	struct be_tx_obj *txo = &adapter->tx_obj[skb_get_queue_mapping(skb)];
	struct be_queue_info *txq = &txo->q;
	bool dummy_wrb, stopped = false;
	u32 wrb_cnt = 0, copied = 0;
	bool skip_hw_vlan = false;
	u32 start = txq->head;

	skb = be_xmit_workarounds(adapter, skb, &skip_hw_vlan);
1035 1036
	if (!skb) {
		tx_stats(txo)->tx_drv_drops++;
1037
		return NETDEV_TX_OK;
1038
	}
1039

1040
	wrb_cnt = wrb_cnt_for_skb(adapter, skb, &dummy_wrb);
S
Sathya Perla 已提交
1041

1042 1043
	copied = make_tx_wrbs(adapter, txq, skb, wrb_cnt, dummy_wrb,
			      skip_hw_vlan);
1044
	if (copied) {
E
Eric Dumazet 已提交
1045 1046
		int gso_segs = skb_shinfo(skb)->gso_segs;

1047
		/* record the sent skb in the sent_skb table */
1048 1049
		BUG_ON(txo->sent_skb_list[start]);
		txo->sent_skb_list[start] = skb;
1050 1051 1052 1053 1054

		/* Ensure txq has space for the next skb; Else stop the queue
		 * *BEFORE* ringing the tx doorbell, so that we serialze the
		 * tx compls of the current transmit which'll wake up the queue
		 */
1055
		atomic_add(wrb_cnt, &txq->used);
1056 1057
		if ((BE_MAX_TX_FRAG_COUNT + atomic_read(&txq->used)) >=
								txq->len) {
1058
			netif_stop_subqueue(netdev, skb_get_queue_mapping(skb));
1059 1060
			stopped = true;
		}
S
Sathya Perla 已提交
1061

V
Vasundhara Volam 已提交
1062
		be_txq_notify(adapter, txo, wrb_cnt);
S
Sathya Perla 已提交
1063

E
Eric Dumazet 已提交
1064
		be_tx_stats_update(txo, wrb_cnt, copied, gso_segs, stopped);
1065 1066
	} else {
		txq->head = start;
1067
		tx_stats(txo)->tx_drv_drops++;
1068
		dev_kfree_skb_any(skb);
S
Sathya Perla 已提交
1069 1070 1071 1072 1073 1074 1075 1076
	}
	return NETDEV_TX_OK;
}

static int be_change_mtu(struct net_device *netdev, int new_mtu)
{
	struct be_adapter *adapter = netdev_priv(netdev);
	if (new_mtu < BE_MIN_MTU ||
1077
	    new_mtu > (BE_MAX_JUMBO_FRAME_SIZE - (ETH_HLEN + ETH_FCS_LEN))) {
S
Sathya Perla 已提交
1078
		dev_info(&adapter->pdev->dev,
1079 1080 1081
			 "MTU must be between %d and %d bytes\n",
			 BE_MIN_MTU,
			 (BE_MAX_JUMBO_FRAME_SIZE - (ETH_HLEN + ETH_FCS_LEN)));
S
Sathya Perla 已提交
1082 1083 1084
		return -EINVAL;
	}
	dev_info(&adapter->pdev->dev, "MTU changed from %d to %d bytes\n",
1085
		 netdev->mtu, new_mtu);
S
Sathya Perla 已提交
1086 1087 1088 1089 1090
	netdev->mtu = new_mtu;
	return 0;
}

/*
1091 1092
 * A max of 64 (BE_NUM_VLANS_SUPPORTED) vlans can be configured in BE.
 * If the user configures more, place BE in vlan promiscuous mode.
S
Sathya Perla 已提交
1093
 */
S
Sathya Perla 已提交
1094
static int be_vid_config(struct be_adapter *adapter)
S
Sathya Perla 已提交
1095
{
S
Sathya Perla 已提交
1096
	u16 vids[BE_NUM_VLANS_SUPPORTED];
1097
	u16 num = 0, i = 0;
1098
	int status = 0;
1099

1100 1101 1102 1103
	/* No need to further configure vids if in promiscuous mode */
	if (adapter->promiscuous)
		return 0;

1104
	if (adapter->vlans_added > be_max_vlans(adapter))
1105 1106 1107
		goto set_vlan_promisc;

	/* Construct VLAN Table to give to HW */
1108 1109
	for_each_set_bit(i, adapter->vids, VLAN_N_VID)
		vids[num++] = cpu_to_le16(i);
1110

1111
	status = be_cmd_vlan_config(adapter, adapter->if_handle, vids, num);
1112
	if (status) {
1113
		/* Set to VLAN promisc mode as setting VLAN filter failed */
1114 1115
		if (addl_status(status) ==
				MCC_ADDL_STATUS_INSUFFICIENT_RESOURCES)
1116 1117 1118 1119 1120 1121 1122 1123 1124 1125 1126 1127 1128 1129
			goto set_vlan_promisc;
		dev_err(&adapter->pdev->dev,
			"Setting HW VLAN filtering failed.\n");
	} else {
		if (adapter->flags & BE_FLAGS_VLAN_PROMISC) {
			/* hw VLAN filtering re-enabled. */
			status = be_cmd_rx_filter(adapter,
						  BE_FLAGS_VLAN_PROMISC, OFF);
			if (!status) {
				dev_info(&adapter->pdev->dev,
					 "Disabling VLAN Promiscuous mode.\n");
				adapter->flags &= ~BE_FLAGS_VLAN_PROMISC;
			}
		}
S
Sathya Perla 已提交
1130
	}
1131

1132
	return status;
1133 1134

set_vlan_promisc:
1135 1136
	if (adapter->flags & BE_FLAGS_VLAN_PROMISC)
		return 0;
1137 1138 1139 1140 1141 1142 1143 1144

	status = be_cmd_rx_filter(adapter, BE_FLAGS_VLAN_PROMISC, ON);
	if (!status) {
		dev_info(&adapter->pdev->dev, "Enable VLAN Promiscuous mode\n");
		adapter->flags |= BE_FLAGS_VLAN_PROMISC;
	} else
		dev_err(&adapter->pdev->dev,
			"Failed to enable VLAN Promiscuous mode.\n");
1145
	return status;
S
Sathya Perla 已提交
1146 1147
}

1148
/* Add a VID to the adapter's VLAN set and reprogram the VLAN filter.
 *
 * A VID that is already present is a no-op. If be_vid_config() fails the
 * VID is removed again and the failure status is returned.
 */
static int be_vlan_add_vid(struct net_device *netdev, __be16 proto, u16 vid)
{
	struct be_adapter *adapter = netdev_priv(netdev);
	int status;

	/* Packets with VID 0 are always received by Lancer by default */
	if (lancer_chip(adapter) && vid == 0)
		return 0;

	if (test_bit(vid, adapter->vids))
		return 0;

	set_bit(vid, adapter->vids);
	adapter->vlans_added++;

	status = be_vid_config(adapter);
	if (!status)
		return 0;

	/* Configuration failed: undo the bookkeeping done above */
	adapter->vlans_added--;
	clear_bit(vid, adapter->vids);

	return status;
}

1172
/* Remove a VID from the adapter's VLAN set and reprogram the VLAN filter.
 *
 * Returns 0 when there is nothing to do, otherwise the result of
 * be_vid_config().
 */
static int be_vlan_rem_vid(struct net_device *netdev, __be16 proto, u16 vid)
{
	struct be_adapter *adapter = netdev_priv(netdev);

	/* Packets with VID 0 are always received by Lancer by default */
	if (lancer_chip(adapter) && vid == 0)
		return 0;

	/* Ignore VIDs that are not currently set, mirroring the duplicate
	 * check in be_vlan_add_vid(); otherwise vlans_added would be
	 * decremented for a VID that was never counted.
	 */
	if (!test_bit(vid, adapter->vids))
		return 0;

	clear_bit(vid, adapter->vids);
	adapter->vlans_added--;

	return be_vid_config(adapter);
}

1186 1187 1188
static void be_clear_promisc(struct be_adapter *adapter)
{
	adapter->promiscuous = false;
1189
	adapter->flags &= ~(BE_FLAGS_VLAN_PROMISC | BE_FLAGS_MCAST_PROMISC);
1190 1191 1192 1193

	be_cmd_rx_filter(adapter, IFF_PROMISC, OFF);
}

1194
static void be_set_rx_mode(struct net_device *netdev)
S
Sathya Perla 已提交
1195 1196
{
	struct be_adapter *adapter = netdev_priv(netdev);
1197
	int status;
S
Sathya Perla 已提交
1198

1199
	if (netdev->flags & IFF_PROMISC) {
1200
		be_cmd_rx_filter(adapter, IFF_PROMISC, ON);
1201 1202
		adapter->promiscuous = true;
		goto done;
S
Sathya Perla 已提交
1203 1204
	}

L
Lucas De Marchi 已提交
1205
	/* BE was previously in promiscuous mode; disable it */
1206
	if (adapter->promiscuous) {
1207
		be_clear_promisc(adapter);
1208
		if (adapter->vlans_added)
S
Sathya Perla 已提交
1209
			be_vid_config(adapter);
S
Sathya Perla 已提交
1210 1211
	}

1212
	/* Enable multicast promisc if num configured exceeds what we support */
1213
	if (netdev->flags & IFF_ALLMULTI ||
1214 1215
	    netdev_mc_count(netdev) > be_max_mc(adapter))
		goto set_mcast_promisc;
S
Sathya Perla 已提交
1216

1217 1218 1219 1220 1221 1222 1223 1224 1225
	if (netdev_uc_count(netdev) != adapter->uc_macs) {
		struct netdev_hw_addr *ha;
		int i = 1; /* First slot is claimed by the Primary MAC */

		for (; adapter->uc_macs > 0; adapter->uc_macs--, i++) {
			be_cmd_pmac_del(adapter, adapter->if_handle,
					adapter->pmac_id[i], 0);
		}

1226
		if (netdev_uc_count(netdev) > be_max_uc(adapter)) {
1227 1228 1229 1230 1231 1232 1233 1234 1235 1236 1237 1238 1239
			be_cmd_rx_filter(adapter, IFF_PROMISC, ON);
			adapter->promiscuous = true;
			goto done;
		}

		netdev_for_each_uc_addr(ha, adapter->netdev) {
			adapter->uc_macs++; /* First slot is for Primary MAC */
			be_cmd_pmac_add(adapter, (u8 *)ha->addr,
					adapter->if_handle,
					&adapter->pmac_id[adapter->uc_macs], 0);
		}
	}

1240
	status = be_cmd_rx_filter(adapter, IFF_MULTICAST, ON);
1241 1242 1243 1244
	if (!status) {
		if (adapter->flags & BE_FLAGS_MCAST_PROMISC)
			adapter->flags &= ~BE_FLAGS_MCAST_PROMISC;
		goto done;
1245
	}
1246 1247 1248 1249 1250 1251 1252 1253 1254 1255 1256

set_mcast_promisc:
	if (adapter->flags & BE_FLAGS_MCAST_PROMISC)
		return;

	/* Set to MCAST promisc mode if setting MULTICAST address fails
	 * or if num configured exceeds what we support
	 */
	status = be_cmd_rx_filter(adapter, IFF_ALLMULTI, ON);
	if (!status)
		adapter->flags |= BE_FLAGS_MCAST_PROMISC;
1257 1258
done:
	return;
S
Sathya Perla 已提交
1259 1260
}

1261 1262 1263
/* Set the MAC address of VF number vf.
 *
 * Returns -EPERM when SR-IOV is not enabled, -EINVAL for an invalid MAC or
 * VF index, otherwise the status of the firmware command. The address is
 * cached in the VF config only on success.
 */
static int be_set_vf_mac(struct net_device *netdev, int vf, u8 *mac)
{
	struct be_adapter *adapter = netdev_priv(netdev);
	struct be_vf_cfg *vf_cfg = &adapter->vf_cfg[vf];
	int status;

	if (!sriov_enabled(adapter))
		return -EPERM;

	if (!is_valid_ether_addr(mac) || vf >= adapter->num_vfs)
		return -EINVAL;

	if (!BEx_chip(adapter)) {
		status = be_cmd_set_mac(adapter, mac, vf_cfg->if_handle,
					vf + 1);
	} else {
		/* On BEx chips the old pmac is deleted and a new one added */
		be_cmd_pmac_del(adapter, vf_cfg->if_handle, vf_cfg->pmac_id,
				vf + 1);

		status = be_cmd_pmac_add(adapter, mac, vf_cfg->if_handle,
					 &vf_cfg->pmac_id, vf + 1);
	}

	if (status) {
		dev_err(&adapter->pdev->dev, "MAC %pM set on VF %d Failed\n",
			mac, vf);
		return status;
	}

	memcpy(vf_cfg->mac_addr, mac, ETH_ALEN);
	return status;
}

1293
static int be_get_vf_config(struct net_device *netdev, int vf,
1294
			    struct ifla_vf_info *vi)
1295 1296
{
	struct be_adapter *adapter = netdev_priv(netdev);
1297
	struct be_vf_cfg *vf_cfg = &adapter->vf_cfg[vf];
1298

1299
	if (!sriov_enabled(adapter))
1300 1301
		return -EPERM;

1302
	if (vf >= adapter->num_vfs)
1303 1304 1305
		return -EINVAL;

	vi->vf = vf;
1306 1307
	vi->max_tx_rate = vf_cfg->tx_rate;
	vi->min_tx_rate = 0;
1308 1309
	vi->vlan = vf_cfg->vlan_tag & VLAN_VID_MASK;
	vi->qos = vf_cfg->vlan_tag >> VLAN_PRIO_SHIFT;
1310
	memcpy(&vi->mac, vf_cfg->mac_addr, ETH_ALEN);
1311
	vi->linkstate = adapter->vf_cfg[vf].plink_tracking;
1312 1313 1314 1315

	return 0;
}

1316
/* Configure (or, when both vlan and qos are 0, reset) the VLAN tag of VF
 * number vf.
 *
 * Returns -EPERM when SR-IOV is not enabled, -EINVAL for out-of-range
 * arguments, otherwise the status of the firmware command. The tag is cached
 * in the VF config only on success.
 */
static int be_set_vf_vlan(struct net_device *netdev, int vf, u16 vlan, u8 qos)
{
	struct be_adapter *adapter = netdev_priv(netdev);
	struct be_vf_cfg *vf_cfg = &adapter->vf_cfg[vf];
	int status = 0;

	if (!sriov_enabled(adapter))
		return -EPERM;

	if (vf >= adapter->num_vfs || vlan > 4095 || qos > 7)
		return -EINVAL;

	if (!vlan && !qos) {
		/* Reset Transparent Vlan Tagging. */
		status = be_cmd_set_hsw_config(adapter, BE_RESET_VLAN_TAG_ID,
					       vf + 1, vf_cfg->if_handle, 0);
	} else {
		/* Fold the priority into the tag; skip the command when the
		 * resulting tag is already the cached one.
		 */
		vlan |= qos << VLAN_PRIO_SHIFT;
		if (vf_cfg->vlan_tag != vlan)
			status = be_cmd_set_hsw_config(adapter, vlan, vf + 1,
						       vf_cfg->if_handle, 0);
	}

	if (status) {
		dev_info(&adapter->pdev->dev,
			 "VLAN %d config on VF %d failed\n", vlan, vf);
		return status;
	}

	vf_cfg->vlan_tag = vlan;
	return status;
}

1347 1348
static int be_set_vf_tx_rate(struct net_device *netdev, int vf,
			     int min_tx_rate, int max_tx_rate)
1349 1350
{
	struct be_adapter *adapter = netdev_priv(netdev);
1351 1352 1353 1354
	struct device *dev = &adapter->pdev->dev;
	int percent_rate, status = 0;
	u16 link_speed = 0;
	u8 link_status;
1355

1356
	if (!sriov_enabled(adapter))
1357 1358
		return -EPERM;

1359
	if (vf >= adapter->num_vfs)
1360 1361
		return -EINVAL;

1362 1363 1364
	if (min_tx_rate)
		return -EINVAL;

1365 1366 1367 1368 1369 1370 1371 1372 1373 1374
	if (!max_tx_rate)
		goto config_qos;

	status = be_cmd_link_status_query(adapter, &link_speed,
					  &link_status, 0);
	if (status)
		goto err;

	if (!link_status) {
		dev_err(dev, "TX-rate setting not allowed when link is down\n");
1375
		status = -ENETDOWN;
1376 1377 1378 1379 1380 1381 1382 1383 1384 1385 1386 1387 1388 1389 1390 1391 1392
		goto err;
	}

	if (max_tx_rate < 100 || max_tx_rate > link_speed) {
		dev_err(dev, "TX-rate must be between 100 and %d Mbps\n",
			link_speed);
		status = -EINVAL;
		goto err;
	}

	/* On Skyhawk the QOS setting must be done only as a % value */
	percent_rate = link_speed / 100;
	if (skyhawk_chip(adapter) && (max_tx_rate % percent_rate)) {
		dev_err(dev, "TX-rate must be a multiple of %d Mbps\n",
			percent_rate);
		status = -EINVAL;
		goto err;
1393
	}
1394

1395 1396
config_qos:
	status = be_cmd_config_qos(adapter, max_tx_rate, link_speed, vf + 1);
1397
	if (status)
1398 1399 1400 1401 1402 1403 1404 1405
		goto err;

	adapter->vf_cfg[vf].tx_rate = max_tx_rate;
	return 0;

err:
	dev_err(dev, "TX-rate setting of %dMbps on VF%d failed\n",
		max_tx_rate, vf);
1406 1407
	return status;
}
1408 1409 1410 1411 1412 1413 1414 1415 1416 1417 1418 1419 1420 1421 1422 1423 1424 1425
/* Set the logical link state of VF number vf and, on success, cache it in
 * the VF config's plink_tracking field.
 *
 * Returns -EPERM when SR-IOV is not enabled, -EINVAL for an out-of-range VF
 * index, otherwise the status of the firmware command.
 */
static int be_set_vf_link_state(struct net_device *netdev, int vf,
				int link_state)
{
	struct be_adapter *adapter = netdev_priv(netdev);
	int status;

	if (!sriov_enabled(adapter))
		return -EPERM;

	if (vf >= adapter->num_vfs)
		return -EINVAL;

	status = be_cmd_set_logical_link_config(adapter, link_state, vf+1);
	if (status)
		return status;

	adapter->vf_cfg[vf].plink_tracking = link_state;
	return status;
}
1426

1427 1428
/* Record the current rx/tx packet counters and timestamp in the AIC object
 * as the baseline for the next rate computation.
 */
static void be_aic_update(struct be_aic_obj *aic, u64 rx_pkts, u64 tx_pkts,
			  ulong now)
{
	aic->jiffies = now;
	aic->rx_pkts_prev = rx_pkts;
	aic->tx_reqs_prev = tx_pkts;
}
1434

1435 1436 1437 1438 1439 1440 1441 1442 1443 1444 1445
static void be_eqd_update(struct be_adapter *adapter)
{
	struct be_set_eqd set_eqd[MAX_EVT_QS];
	int eqd, i, num = 0, start;
	struct be_aic_obj *aic;
	struct be_eq_obj *eqo;
	struct be_rx_obj *rxo;
	struct be_tx_obj *txo;
	u64 rx_pkts, tx_pkts;
	ulong now;
	u32 pps, delta;
S
Sathya Perla 已提交
1446

1447 1448 1449 1450 1451 1452 1453 1454
	for_all_evt_queues(adapter, eqo, i) {
		aic = &adapter->aic_obj[eqo->idx];
		if (!aic->enable) {
			if (aic->jiffies)
				aic->jiffies = 0;
			eqd = aic->et_eqd;
			goto modify_eqd;
		}
S
Sathya Perla 已提交
1455

1456 1457
		rxo = &adapter->rx_obj[eqo->idx];
		do {
1458
			start = u64_stats_fetch_begin_irq(&rxo->stats.sync);
1459
			rx_pkts = rxo->stats.rx_pkts;
1460
		} while (u64_stats_fetch_retry_irq(&rxo->stats.sync, start));
S
Sathya Perla 已提交
1461

1462 1463
		txo = &adapter->tx_obj[eqo->idx];
		do {
1464
			start = u64_stats_fetch_begin_irq(&txo->stats.sync);
1465
			tx_pkts = txo->stats.tx_reqs;
1466
		} while (u64_stats_fetch_retry_irq(&txo->stats.sync, start));
S
Sathya Perla 已提交
1467 1468


1469 1470 1471 1472 1473 1474 1475 1476 1477 1478 1479 1480 1481
		/* Skip, if wrapped around or first calculation */
		now = jiffies;
		if (!aic->jiffies || time_before(now, aic->jiffies) ||
		    rx_pkts < aic->rx_pkts_prev ||
		    tx_pkts < aic->tx_reqs_prev) {
			be_aic_update(aic, rx_pkts, tx_pkts, now);
			continue;
		}

		delta = jiffies_to_msecs(now - aic->jiffies);
		pps = (((u32)(rx_pkts - aic->rx_pkts_prev) * 1000) / delta) +
			(((u32)(tx_pkts - aic->tx_reqs_prev) * 1000) / delta);
		eqd = (pps / 15000) << 2;
S
Sathya Perla 已提交
1482

1483 1484 1485 1486 1487 1488
		if (eqd < 8)
			eqd = 0;
		eqd = min_t(u32, eqd, aic->max_eqd);
		eqd = max_t(u32, eqd, aic->min_eqd);

		be_aic_update(aic, rx_pkts, tx_pkts, now);
S
Sathya Perla 已提交
1489
modify_eqd:
1490 1491 1492 1493 1494 1495
		if (eqd != aic->prev_eqd) {
			set_eqd[num].delay_multiplier = (eqd * 65)/100;
			set_eqd[num].eq_id = eqo->q.id;
			aic->prev_eqd = eqd;
			num++;
		}
1496
	}
1497 1498 1499

	if (num)
		be_cmd_modify_eqd(adapter, set_eqd, num);
S
Sathya Perla 已提交
1500 1501
}

1502
static void be_rx_stats_update(struct be_rx_obj *rxo,
1503
			       struct be_rx_compl_info *rxcp)
1504
{
1505
	struct be_rx_stats *stats = rx_stats(rxo);
1506

1507
	u64_stats_update_begin(&stats->sync);
1508
	stats->rx_compl++;
1509
	stats->rx_bytes += rxcp->pkt_size;
1510
	stats->rx_pkts++;
1511
	if (rxcp->pkt_type == BE_MULTICAST_PACKET)
1512
		stats->rx_mcast_pkts++;
1513
	if (rxcp->err)
1514
		stats->rx_compl_err++;
1515
	u64_stats_update_end(&stats->sync);
1516 1517
}

1518
static inline bool csum_passed(struct be_rx_compl_info *rxcp)
1519
{
1520
	/* L4 checksum is not reliable for non TCP/UDP packets.
1521 1522
	 * Also ignore ipcksm for ipv6 pkts
	 */
1523
	return (rxcp->tcpf || rxcp->udpf) && rxcp->l4_csum &&
1524
		(rxcp->ip_csum || rxcp->ipv6) && !rxcp->err;
1525 1526
}

1527
static struct be_rx_page_info *get_rx_page_info(struct be_rx_obj *rxo)
S
Sathya Perla 已提交
1528
{
S
Sathya Perla 已提交
1529
	struct be_adapter *adapter = rxo->adapter;
S
Sathya Perla 已提交
1530
	struct be_rx_page_info *rx_page_info;
1531
	struct be_queue_info *rxq = &rxo->q;
1532
	u16 frag_idx = rxq->tail;
S
Sathya Perla 已提交
1533

1534
	rx_page_info = &rxo->page_info_tbl[frag_idx];
S
Sathya Perla 已提交
1535 1536
	BUG_ON(!rx_page_info->page);

1537
	if (rx_page_info->last_frag) {
I
Ivan Vecera 已提交
1538 1539 1540
		dma_unmap_page(&adapter->pdev->dev,
			       dma_unmap_addr(rx_page_info, bus),
			       adapter->big_page_size, DMA_FROM_DEVICE);
1541 1542 1543 1544 1545
		rx_page_info->last_frag = false;
	} else {
		dma_sync_single_for_cpu(&adapter->pdev->dev,
					dma_unmap_addr(rx_page_info, bus),
					rx_frag_size, DMA_FROM_DEVICE);
A
Ajit Khaparde 已提交
1546
	}
S
Sathya Perla 已提交
1547

1548
	queue_tail_inc(rxq);
S
Sathya Perla 已提交
1549 1550 1551 1552 1553
	atomic_dec(&rxq->used);
	return rx_page_info;
}

/* Throwaway the data in the Rx completion */
S
Sathya Perla 已提交
1554 1555
static void be_rx_compl_discard(struct be_rx_obj *rxo,
				struct be_rx_compl_info *rxcp)
S
Sathya Perla 已提交
1556 1557
{
	struct be_rx_page_info *page_info;
1558
	u16 i, num_rcvd = rxcp->num_rcvd;
S
Sathya Perla 已提交
1559

1560
	for (i = 0; i < num_rcvd; i++) {
1561
		page_info = get_rx_page_info(rxo);
1562 1563
		put_page(page_info->page);
		memset(page_info, 0, sizeof(*page_info));
S
Sathya Perla 已提交
1564 1565 1566 1567 1568 1569 1570
	}
}

/*
 * skb_fill_rx_data forms a complete skb for an ether frame
 * indicated by rxcp.
 */
S
Sathya Perla 已提交
1571 1572
static void skb_fill_rx_data(struct be_rx_obj *rxo, struct sk_buff *skb,
			     struct be_rx_compl_info *rxcp)
S
Sathya Perla 已提交
1573 1574
{
	struct be_rx_page_info *page_info;
1575 1576
	u16 i, j;
	u16 hdr_len, curr_frag_len, remaining;
S
Sathya Perla 已提交
1577 1578
	u8 *start;

1579
	page_info = get_rx_page_info(rxo);
S
Sathya Perla 已提交
1580 1581 1582 1583
	start = page_address(page_info->page) + page_info->page_offset;
	prefetch(start);

	/* Copy data in the first descriptor of this completion */
1584
	curr_frag_len = min(rxcp->pkt_size, rx_frag_size);
S
Sathya Perla 已提交
1585 1586 1587

	skb->len = curr_frag_len;
	if (curr_frag_len <= BE_HDR_LEN) { /* tiny packet */
1588
		memcpy(skb->data, start, curr_frag_len);
S
Sathya Perla 已提交
1589 1590 1591 1592 1593
		/* Complete packet has now been moved to data */
		put_page(page_info->page);
		skb->data_len = 0;
		skb->tail += curr_frag_len;
	} else {
1594 1595
		hdr_len = ETH_HLEN;
		memcpy(skb->data, start, hdr_len);
S
Sathya Perla 已提交
1596
		skb_shinfo(skb)->nr_frags = 1;
1597
		skb_frag_set_page(skb, 0, page_info->page);
S
Sathya Perla 已提交
1598 1599
		skb_shinfo(skb)->frags[0].page_offset =
					page_info->page_offset + hdr_len;
1600 1601
		skb_frag_size_set(&skb_shinfo(skb)->frags[0],
				  curr_frag_len - hdr_len);
S
Sathya Perla 已提交
1602
		skb->data_len = curr_frag_len - hdr_len;
E
Eric Dumazet 已提交
1603
		skb->truesize += rx_frag_size;
S
Sathya Perla 已提交
1604 1605
		skb->tail += hdr_len;
	}
A
Ajit Khaparde 已提交
1606
	page_info->page = NULL;
S
Sathya Perla 已提交
1607

1608 1609 1610
	if (rxcp->pkt_size <= rx_frag_size) {
		BUG_ON(rxcp->num_rcvd != 1);
		return;
S
Sathya Perla 已提交
1611 1612 1613
	}

	/* More frags present for this completion */
1614 1615
	remaining = rxcp->pkt_size - curr_frag_len;
	for (i = 1, j = 0; i < rxcp->num_rcvd; i++) {
1616
		page_info = get_rx_page_info(rxo);
1617
		curr_frag_len = min(remaining, rx_frag_size);
S
Sathya Perla 已提交
1618

1619 1620 1621 1622
		/* Coalesce all frags from the same physical page in one slot */
		if (page_info->page_offset == 0) {
			/* Fresh page */
			j++;
1623
			skb_frag_set_page(skb, j, page_info->page);
1624 1625
			skb_shinfo(skb)->frags[j].page_offset =
							page_info->page_offset;
E
Eric Dumazet 已提交
1626
			skb_frag_size_set(&skb_shinfo(skb)->frags[j], 0);
1627 1628 1629 1630 1631
			skb_shinfo(skb)->nr_frags++;
		} else {
			put_page(page_info->page);
		}

E
Eric Dumazet 已提交
1632
		skb_frag_size_add(&skb_shinfo(skb)->frags[j], curr_frag_len);
S
Sathya Perla 已提交
1633 1634
		skb->len += curr_frag_len;
		skb->data_len += curr_frag_len;
E
Eric Dumazet 已提交
1635
		skb->truesize += rx_frag_size;
1636
		remaining -= curr_frag_len;
A
Ajit Khaparde 已提交
1637
		page_info->page = NULL;
S
Sathya Perla 已提交
1638
	}
1639
	BUG_ON(j > MAX_SKB_FRAGS);
S
Sathya Perla 已提交
1640 1641
}

1642
/* Process the RX completion indicated by rxcp when GRO is disabled */
1643
static void be_rx_compl_process(struct be_rx_obj *rxo, struct napi_struct *napi,
S
Sathya Perla 已提交
1644
				struct be_rx_compl_info *rxcp)
S
Sathya Perla 已提交
1645
{
S
Sathya Perla 已提交
1646
	struct be_adapter *adapter = rxo->adapter;
1647
	struct net_device *netdev = adapter->netdev;
S
Sathya Perla 已提交
1648
	struct sk_buff *skb;
1649

1650
	skb = netdev_alloc_skb_ip_align(netdev, BE_RX_SKB_ALLOC_SIZE);
1651
	if (unlikely(!skb)) {
1652
		rx_stats(rxo)->rx_drops_no_skbs++;
S
Sathya Perla 已提交
1653
		be_rx_compl_discard(rxo, rxcp);
S
Sathya Perla 已提交
1654 1655 1656
		return;
	}

S
Sathya Perla 已提交
1657
	skb_fill_rx_data(rxo, skb, rxcp);
S
Sathya Perla 已提交
1658

1659
	if (likely((netdev->features & NETIF_F_RXCSUM) && csum_passed(rxcp)))
1660
		skb->ip_summed = CHECKSUM_UNNECESSARY;
S
Somnath Kotur 已提交
1661 1662
	else
		skb_checksum_none_assert(skb);
S
Sathya Perla 已提交
1663

1664
	skb->protocol = eth_type_trans(skb, netdev);
1665
	skb_record_rx_queue(skb, rxo - &adapter->rx_obj[0]);
S
Sathya Perla 已提交
1666
	if (netdev->features & NETIF_F_RXHASH)
T
Tom Herbert 已提交
1667
		skb_set_hash(skb, rxcp->rss_hash, PKT_HASH_TYPE_L3);
1668 1669

	skb->encapsulation = rxcp->tunneled;
1670
	skb_mark_napi_id(skb, napi);
S
Sathya Perla 已提交
1671

1672
	if (rxcp->vlanf)
1673
		__vlan_hwaccel_put_tag(skb, htons(ETH_P_8021Q), rxcp->vlan_tag);
A
Ajit Khaparde 已提交
1674 1675

	netif_receive_skb(skb);
S
Sathya Perla 已提交
1676 1677
}

1678
/* Process the RX completion indicated by rxcp when GRO is enabled */
J
Jingoo Han 已提交
1679 1680 1681
static void be_rx_compl_process_gro(struct be_rx_obj *rxo,
				    struct napi_struct *napi,
				    struct be_rx_compl_info *rxcp)
S
Sathya Perla 已提交
1682
{
S
Sathya Perla 已提交
1683
	struct be_adapter *adapter = rxo->adapter;
S
Sathya Perla 已提交
1684
	struct be_rx_page_info *page_info;
1685
	struct sk_buff *skb = NULL;
1686 1687
	u16 remaining, curr_frag_len;
	u16 i, j;
1688

S
Sathya Perla 已提交
1689
	skb = napi_get_frags(napi);
1690
	if (!skb) {
S
Sathya Perla 已提交
1691
		be_rx_compl_discard(rxo, rxcp);
1692 1693 1694
		return;
	}

1695 1696
	remaining = rxcp->pkt_size;
	for (i = 0, j = -1; i < rxcp->num_rcvd; i++) {
1697
		page_info = get_rx_page_info(rxo);
S
Sathya Perla 已提交
1698 1699 1700

		curr_frag_len = min(remaining, rx_frag_size);

1701 1702 1703 1704
		/* Coalesce all frags from the same physical page in one slot */
		if (i == 0 || page_info->page_offset == 0) {
			/* First frag or Fresh page */
			j++;
1705
			skb_frag_set_page(skb, j, page_info->page);
1706 1707
			skb_shinfo(skb)->frags[j].page_offset =
							page_info->page_offset;
E
Eric Dumazet 已提交
1708
			skb_frag_size_set(&skb_shinfo(skb)->frags[j], 0);
1709 1710 1711
		} else {
			put_page(page_info->page);
		}
E
Eric Dumazet 已提交
1712
		skb_frag_size_add(&skb_shinfo(skb)->frags[j], curr_frag_len);
E
Eric Dumazet 已提交
1713
		skb->truesize += rx_frag_size;
1714
		remaining -= curr_frag_len;
S
Sathya Perla 已提交
1715 1716
		memset(page_info, 0, sizeof(*page_info));
	}
1717
	BUG_ON(j > MAX_SKB_FRAGS);
S
Sathya Perla 已提交
1718

1719
	skb_shinfo(skb)->nr_frags = j + 1;
1720 1721
	skb->len = rxcp->pkt_size;
	skb->data_len = rxcp->pkt_size;
1722
	skb->ip_summed = CHECKSUM_UNNECESSARY;
1723
	skb_record_rx_queue(skb, rxo - &adapter->rx_obj[0]);
A
Ajit Khaparde 已提交
1724
	if (adapter->netdev->features & NETIF_F_RXHASH)
T
Tom Herbert 已提交
1725
		skb_set_hash(skb, rxcp->rss_hash, PKT_HASH_TYPE_L3);
1726 1727

	skb->encapsulation = rxcp->tunneled;
1728
	skb_mark_napi_id(skb, napi);
1729

1730
	if (rxcp->vlanf)
1731
		__vlan_hwaccel_put_tag(skb, htons(ETH_P_8021Q), rxcp->vlan_tag);
A
Ajit Khaparde 已提交
1732

S
Sathya Perla 已提交
1733
	napi_gro_frags(napi);
1734 1735
}

S
Sathya Perla 已提交
1736 1737
static void be_parse_rx_compl_v1(struct be_eth_rx_compl *compl,
				 struct be_rx_compl_info *rxcp)
1738 1739 1740 1741 1742 1743
{
	rxcp->pkt_size =
		AMAP_GET_BITS(struct amap_eth_rx_compl_v1, pktsize, compl);
	rxcp->vlanf = AMAP_GET_BITS(struct amap_eth_rx_compl_v1, vtp, compl);
	rxcp->err = AMAP_GET_BITS(struct amap_eth_rx_compl_v1, err, compl);
	rxcp->tcpf = AMAP_GET_BITS(struct amap_eth_rx_compl_v1, tcpf, compl);
1744
	rxcp->udpf = AMAP_GET_BITS(struct amap_eth_rx_compl_v1, udpf, compl);
1745 1746 1747 1748 1749 1750 1751 1752 1753 1754
	rxcp->ip_csum =
		AMAP_GET_BITS(struct amap_eth_rx_compl_v1, ipcksm, compl);
	rxcp->l4_csum =
		AMAP_GET_BITS(struct amap_eth_rx_compl_v1, l4_cksm, compl);
	rxcp->ipv6 =
		AMAP_GET_BITS(struct amap_eth_rx_compl_v1, ip_version, compl);
	rxcp->num_rcvd =
		AMAP_GET_BITS(struct amap_eth_rx_compl_v1, numfrags, compl);
	rxcp->pkt_type =
		AMAP_GET_BITS(struct amap_eth_rx_compl_v1, cast_enc, compl);
A
Ajit Khaparde 已提交
1755
	rxcp->rss_hash =
1756
		AMAP_GET_BITS(struct amap_eth_rx_compl_v1, rsshash, compl);
1757
	if (rxcp->vlanf) {
1758
		rxcp->qnq = AMAP_GET_BITS(struct amap_eth_rx_compl_v1, qnq,
1759
					  compl);
1760 1761
		rxcp->vlan_tag = AMAP_GET_BITS(struct amap_eth_rx_compl_v1,
					       vlan_tag, compl);
1762
	}
1763
	rxcp->port = AMAP_GET_BITS(struct amap_eth_rx_compl_v1, port, compl);
1764 1765
	rxcp->tunneled =
		AMAP_GET_BITS(struct amap_eth_rx_compl_v1, tunneled, compl);
1766 1767
}

S
Sathya Perla 已提交
1768 1769
static void be_parse_rx_compl_v0(struct be_eth_rx_compl *compl,
				 struct be_rx_compl_info *rxcp)
1770 1771 1772 1773 1774 1775
{
	rxcp->pkt_size =
		AMAP_GET_BITS(struct amap_eth_rx_compl_v0, pktsize, compl);
	rxcp->vlanf = AMAP_GET_BITS(struct amap_eth_rx_compl_v0, vtp, compl);
	rxcp->err = AMAP_GET_BITS(struct amap_eth_rx_compl_v0, err, compl);
	rxcp->tcpf = AMAP_GET_BITS(struct amap_eth_rx_compl_v0, tcpf, compl);
1776
	rxcp->udpf = AMAP_GET_BITS(struct amap_eth_rx_compl_v0, udpf, compl);
1777 1778 1779 1780 1781 1782 1783 1784 1785 1786
	rxcp->ip_csum =
		AMAP_GET_BITS(struct amap_eth_rx_compl_v0, ipcksm, compl);
	rxcp->l4_csum =
		AMAP_GET_BITS(struct amap_eth_rx_compl_v0, l4_cksm, compl);
	rxcp->ipv6 =
		AMAP_GET_BITS(struct amap_eth_rx_compl_v0, ip_version, compl);
	rxcp->num_rcvd =
		AMAP_GET_BITS(struct amap_eth_rx_compl_v0, numfrags, compl);
	rxcp->pkt_type =
		AMAP_GET_BITS(struct amap_eth_rx_compl_v0, cast_enc, compl);
A
Ajit Khaparde 已提交
1787
	rxcp->rss_hash =
1788
		AMAP_GET_BITS(struct amap_eth_rx_compl_v0, rsshash, compl);
1789
	if (rxcp->vlanf) {
1790
		rxcp->qnq = AMAP_GET_BITS(struct amap_eth_rx_compl_v0, qnq,
1791
					  compl);
1792 1793
		rxcp->vlan_tag = AMAP_GET_BITS(struct amap_eth_rx_compl_v0,
					       vlan_tag, compl);
1794
	}
1795
	rxcp->port = AMAP_GET_BITS(struct amap_eth_rx_compl_v0, port, compl);
1796 1797
	rxcp->ip_frag = AMAP_GET_BITS(struct amap_eth_rx_compl_v0,
				      ip_frag, compl);
1798 1799 1800 1801 1802 1803 1804
}

static struct be_rx_compl_info *be_rx_compl_get(struct be_rx_obj *rxo)
{
	struct be_eth_rx_compl *compl = queue_tail_node(&rxo->cq);
	struct be_rx_compl_info *rxcp = &rxo->rxcp;
	struct be_adapter *adapter = rxo->adapter;
S
Sathya Perla 已提交
1805

1806 1807 1808 1809
	/* For checking the valid bit it is Ok to use either definition as the
	 * valid bit is at the same position in both v0 and v1 Rx compl */
	if (compl->dw[offsetof(struct amap_eth_rx_compl_v1, valid) / 32] == 0)
		return NULL;
S
Sathya Perla 已提交
1810

1811 1812
	rmb();
	be_dws_le_to_cpu(compl, sizeof(*compl));
S
Sathya Perla 已提交
1813

1814
	if (adapter->be3_native)
S
Sathya Perla 已提交
1815
		be_parse_rx_compl_v1(compl, rxcp);
1816
	else
S
Sathya Perla 已提交
1817
		be_parse_rx_compl_v0(compl, rxcp);
S
Sathya Perla 已提交
1818

1819 1820 1821
	if (rxcp->ip_frag)
		rxcp->l4_csum = 0;

1822
	if (rxcp->vlanf) {
1823 1824 1825 1826 1827
		/* In QNQ modes, if qnq bit is not set, then the packet was
		 * tagged only with the transparent outer vlan-tag and must
		 * not be treated as a vlan packet by host
		 */
		if (be_is_qnq_mode(adapter) && !rxcp->qnq)
1828
			rxcp->vlanf = 0;
S
Sathya Perla 已提交
1829

1830
		if (!lancer_chip(adapter))
1831
			rxcp->vlan_tag = swab16(rxcp->vlan_tag);
S
Sathya Perla 已提交
1832

1833
		if (adapter->pvid == (rxcp->vlan_tag & VLAN_VID_MASK) &&
1834
		    !test_bit(rxcp->vlan_tag, adapter->vids))
1835 1836
			rxcp->vlanf = 0;
	}
1837 1838 1839

	/* As the compl has been parsed, reset it; we wont touch it again */
	compl->dw[offsetof(struct amap_eth_rx_compl_v1, valid) / 32] = 0;
S
Sathya Perla 已提交
1840

1841
	queue_tail_inc(&rxo->cq);
S
Sathya Perla 已提交
1842 1843 1844
	return rxcp;
}

1845
/* Allocate enough pages to hold @size bytes; allocations of more than one
 * page are requested as a compound page (__GFP_COMP).
 */
static inline struct page *be_alloc_pages(u32 size, gfp_t gfp)
{
	u32 order = get_order(size);

	return alloc_pages(order > 0 ? gfp | __GFP_COMP : gfp, order);
}

/*
 * Allocate a page, split it to fragments of size rx_frag_size and post as
 * receive buffers to BE
 */
1858
static void be_post_rx_frags(struct be_rx_obj *rxo, gfp_t gfp)
S
Sathya Perla 已提交
1859
{
1860
	struct be_adapter *adapter = rxo->adapter;
1861
	struct be_rx_page_info *page_info = NULL, *prev_page_info = NULL;
1862
	struct be_queue_info *rxq = &rxo->q;
S
Sathya Perla 已提交
1863
	struct page *pagep = NULL;
1864
	struct device *dev = &adapter->pdev->dev;
S
Sathya Perla 已提交
1865 1866 1867 1868
	struct be_eth_rx_d *rxd;
	u64 page_dmaaddr = 0, frag_dmaaddr;
	u32 posted, page_offset = 0;

1869
	page_info = &rxo->page_info_tbl[rxq->head];
S
Sathya Perla 已提交
1870 1871
	for (posted = 0; posted < MAX_RX_POST && !page_info->page; posted++) {
		if (!pagep) {
1872
			pagep = be_alloc_pages(adapter->big_page_size, gfp);
S
Sathya Perla 已提交
1873
			if (unlikely(!pagep)) {
1874
				rx_stats(rxo)->rx_post_fail++;
S
Sathya Perla 已提交
1875 1876
				break;
			}
1877 1878
			page_dmaaddr = dma_map_page(dev, pagep, 0,
						    adapter->big_page_size,
I
Ivan Vecera 已提交
1879
						    DMA_FROM_DEVICE);
1880 1881 1882 1883 1884 1885
			if (dma_mapping_error(dev, page_dmaaddr)) {
				put_page(pagep);
				pagep = NULL;
				rx_stats(rxo)->rx_post_fail++;
				break;
			}
1886
			page_offset = 0;
S
Sathya Perla 已提交
1887 1888
		} else {
			get_page(pagep);
1889
			page_offset += rx_frag_size;
S
Sathya Perla 已提交
1890
		}
1891
		page_info->page_offset = page_offset;
S
Sathya Perla 已提交
1892 1893 1894
		page_info->page = pagep;

		rxd = queue_head_node(rxq);
1895
		frag_dmaaddr = page_dmaaddr + page_info->page_offset;
S
Sathya Perla 已提交
1896 1897 1898 1899 1900 1901 1902
		rxd->fragpa_lo = cpu_to_le32(frag_dmaaddr & 0xFFFFFFFF);
		rxd->fragpa_hi = cpu_to_le32(upper_32_bits(frag_dmaaddr));

		/* Any space left in the current big page for another frag? */
		if ((page_offset + rx_frag_size + rx_frag_size) >
					adapter->big_page_size) {
			pagep = NULL;
1903 1904 1905 1906
			page_info->last_frag = true;
			dma_unmap_addr_set(page_info, bus, page_dmaaddr);
		} else {
			dma_unmap_addr_set(page_info, bus, frag_dmaaddr);
S
Sathya Perla 已提交
1907
		}
1908 1909 1910

		prev_page_info = page_info;
		queue_head_inc(rxq);
S
Sathya Perla 已提交
1911
		page_info = &rxo->page_info_tbl[rxq->head];
S
Sathya Perla 已提交
1912
	}
1913 1914 1915 1916 1917 1918 1919 1920

	/* Mark the last frag of a page when we break out of the above loop
	 * with no more slots available in the RXQ
	 */
	if (pagep) {
		prev_page_info->last_frag = true;
		dma_unmap_addr_set(prev_page_info, bus, page_dmaaddr);
	}
S
Sathya Perla 已提交
1921 1922 1923

	if (posted) {
		atomic_add(posted, &rxq->used);
1924 1925
		if (rxo->rx_post_starved)
			rxo->rx_post_starved = false;
1926
		be_rxq_notify(adapter, rxq->id, posted);
1927 1928
	} else if (atomic_read(&rxq->used) == 0) {
		/* Let be_worker replenish when memory is available */
1929
		rxo->rx_post_starved = true;
S
Sathya Perla 已提交
1930 1931 1932
	}
}

1933
static struct be_eth_tx_compl *be_tx_compl_get(struct be_queue_info *tx_cq)
S
Sathya Perla 已提交
1934 1935 1936 1937 1938 1939
{
	struct be_eth_tx_compl *txcp = queue_tail_node(tx_cq);

	if (txcp->dw[offsetof(struct amap_eth_tx_compl, valid) / 32] == 0)
		return NULL;

1940
	rmb();
S
Sathya Perla 已提交
1941 1942 1943 1944 1945 1946 1947 1948
	be_dws_le_to_cpu(txcp, sizeof(*txcp));

	txcp->dw[offsetof(struct amap_eth_tx_compl, valid) / 32] = 0;

	queue_tail_inc(tx_cq);
	return txcp;
}

1949
/* Reclaim the skb whose header wrb sits at the TXQ tail: unmap every wrb up
 * to and including @last_index, free the skb and return the number of wrbs
 * consumed (header wrb included).
 */
static u16 be_tx_compl_process(struct be_adapter *adapter,
			       struct be_tx_obj *txo, u16 last_index)
{
	struct be_queue_info *txq = &txo->q;
	struct sk_buff **sent_skbs = txo->sent_skb_list;
	struct sk_buff *skb = sent_skbs[txq->tail];
	struct be_eth_wrb *wrb;
	bool first_frag = true;
	u16 idx, wrb_cnt = 1; /* account for hdr wrb */

	BUG_ON(!skb);
	sent_skbs[txq->tail] = NULL;

	/* skip header wrb */
	queue_tail_inc(txq);

	for (;;) {
		idx = txq->tail;
		wrb = queue_tail_node(txq);
		/* Only the first wrb is flagged as the skb header mapping,
		 * and only when the skb has a linear part
		 */
		unmap_tx_frag(&adapter->pdev->dev, wrb,
			      (first_frag && skb_headlen(skb)));
		first_frag = false;

		wrb_cnt++;
		queue_tail_inc(txq);
		if (idx == last_index)
			break;
	}

	dev_kfree_skb_any(skb);
	return wrb_cnt;
}

S
Sathya Perla 已提交
1981 1982
/* Return the number of events in the event queue */
static inline int events_get(struct be_eq_obj *eqo)
1983
{
S
Sathya Perla 已提交
1984 1985
	struct be_eq_entry *eqe;
	int num = 0;
1986

S
Sathya Perla 已提交
1987 1988 1989 1990
	do {
		eqe = queue_tail_node(&eqo->q);
		if (eqe->evt == 0)
			break;
1991

S
Sathya Perla 已提交
1992 1993 1994 1995 1996 1997 1998
		rmb();
		eqe->evt = 0;
		num++;
		queue_tail_inc(&eqo->q);
	} while (true);

	return num;
1999 2000
}

S
Sathya Perla 已提交
2001 2002
/* Leaves the EQ is disarmed state */
static void be_eq_clean(struct be_eq_obj *eqo)
2003
{
S
Sathya Perla 已提交
2004
	int num = events_get(eqo);
2005

S
Sathya Perla 已提交
2006
	be_eq_notify(eqo->adapter, eqo->q.id, false, true, num);
2007 2008
}

S
Sathya Perla 已提交
2009
static void be_rx_cq_clean(struct be_rx_obj *rxo)
S
Sathya Perla 已提交
2010 2011
{
	struct be_rx_page_info *page_info;
2012 2013
	struct be_queue_info *rxq = &rxo->q;
	struct be_queue_info *rx_cq = &rxo->cq;
2014
	struct be_rx_compl_info *rxcp;
2015 2016
	struct be_adapter *adapter = rxo->adapter;
	int flush_wait = 0;
S
Sathya Perla 已提交
2017

2018 2019 2020 2021 2022 2023 2024 2025 2026 2027 2028 2029 2030 2031 2032 2033 2034 2035 2036 2037 2038
	/* Consume pending rx completions.
	 * Wait for the flush completion (identified by zero num_rcvd)
	 * to arrive. Notify CQ even when there are no more CQ entries
	 * for HW to flush partially coalesced CQ entries.
	 * In Lancer, there is no need to wait for flush compl.
	 */
	for (;;) {
		rxcp = be_rx_compl_get(rxo);
		if (rxcp == NULL) {
			if (lancer_chip(adapter))
				break;

			if (flush_wait++ > 10 || be_hw_error(adapter)) {
				dev_warn(&adapter->pdev->dev,
					 "did not receive flush compl\n");
				break;
			}
			be_cq_notify(adapter, rx_cq->id, true, 0);
			mdelay(1);
		} else {
			be_rx_compl_discard(rxo, rxcp);
2039
			be_cq_notify(adapter, rx_cq->id, false, 1);
2040 2041 2042
			if (rxcp->num_rcvd == 0)
				break;
		}
S
Sathya Perla 已提交
2043 2044
	}

2045 2046 2047 2048
	/* After cleanup, leave the CQ in unarmed state */
	be_cq_notify(adapter, rx_cq->id, false, 0);

	/* Then free posted rx buffers that were not used */
2049 2050
	while (atomic_read(&rxq->used) > 0) {
		page_info = get_rx_page_info(rxo);
S
Sathya Perla 已提交
2051 2052 2053 2054
		put_page(page_info->page);
		memset(page_info, 0, sizeof(*page_info));
	}
	BUG_ON(atomic_read(&rxq->used));
2055
	rxq->tail = rxq->head = 0;
S
Sathya Perla 已提交
2056 2057
}

S
Sathya Perla 已提交
2058
static void be_tx_compl_clean(struct be_adapter *adapter)
S
Sathya Perla 已提交
2059
{
S
Sathya Perla 已提交
2060 2061
	struct be_tx_obj *txo;
	struct be_queue_info *txq;
2062
	struct be_eth_tx_compl *txcp;
2063
	u16 end_idx, cmpl = 0, timeo = 0, num_wrbs = 0;
2064 2065
	struct sk_buff *sent_skb;
	bool dummy_wrb;
S
Sathya Perla 已提交
2066
	int i, pending_txqs;
2067

2068
	/* Stop polling for compls when HW has been silent for 10ms */
2069
	do {
S
Sathya Perla 已提交
2070 2071 2072
		pending_txqs = adapter->num_tx_qs;

		for_all_tx_queues(adapter, txo, i) {
2073 2074
			cmpl = 0;
			num_wrbs = 0;
S
Sathya Perla 已提交
2075 2076 2077 2078 2079 2080 2081 2082 2083 2084 2085 2086
			txq = &txo->q;
			while ((txcp = be_tx_compl_get(&txo->cq))) {
				end_idx =
					AMAP_GET_BITS(struct amap_eth_tx_compl,
						      wrb_index, txcp);
				num_wrbs += be_tx_compl_process(adapter, txo,
								end_idx);
				cmpl++;
			}
			if (cmpl) {
				be_cq_notify(adapter, txo->cq.id, false, cmpl);
				atomic_sub(num_wrbs, &txq->used);
2087
				timeo = 0;
S
Sathya Perla 已提交
2088 2089 2090
			}
			if (atomic_read(&txq->used) == 0)
				pending_txqs--;
2091 2092
		}

2093
		if (pending_txqs == 0 || ++timeo > 10 || be_hw_error(adapter))
2094 2095 2096 2097 2098
			break;

		mdelay(1);
	} while (true);

S
Sathya Perla 已提交
2099 2100 2101 2102 2103 2104 2105 2106 2107 2108 2109 2110 2111 2112 2113 2114
	for_all_tx_queues(adapter, txo, i) {
		txq = &txo->q;
		if (atomic_read(&txq->used))
			dev_err(&adapter->pdev->dev, "%d pending tx-compls\n",
				atomic_read(&txq->used));

		/* free posted tx for which compls will never arrive */
		while (atomic_read(&txq->used)) {
			sent_skb = txo->sent_skb_list[txq->tail];
			end_idx = txq->tail;
			num_wrbs = wrb_cnt_for_skb(adapter, sent_skb,
						   &dummy_wrb);
			index_adv(&end_idx, num_wrbs - 1, txq->len);
			num_wrbs = be_tx_compl_process(adapter, txo, end_idx);
			atomic_sub(num_wrbs, &txq->used);
		}
2115
	}
S
Sathya Perla 已提交
2116 2117
}

S
Sathya Perla 已提交
2118 2119 2120 2121 2122 2123
/* Tear down every event queue: for queues that were created, clean the EQ,
 * destroy it in HW and remove its NAPI context; the queue memory is freed
 * in all cases.
 */
static void be_evt_queues_destroy(struct be_adapter *adapter)
{
	struct be_eq_obj *eqo;
	int i;

	for_all_evt_queues(adapter, eqo, i) {
		struct be_queue_info *eq = &eqo->q;

		if (eq->created) {
			be_eq_clean(eqo);
			be_cmd_q_destroy(adapter, eq, QTYPE_EQ);
			napi_hash_del(&eqo->napi);
			netif_napi_del(&eqo->napi);
		}
		be_queue_free(adapter, eq);
	}
}

static int be_evt_queues_create(struct be_adapter *adapter)
{
	struct be_queue_info *eq;
	struct be_eq_obj *eqo;
2138
	struct be_aic_obj *aic;
S
Sathya Perla 已提交
2139 2140
	int i, rc;

2141 2142
	adapter->num_evt_qs = min_t(u16, num_irqs(adapter),
				    adapter->cfg_num_qs);
S
Sathya Perla 已提交
2143 2144

	for_all_evt_queues(adapter, eqo, i) {
2145 2146
		netif_napi_add(adapter->netdev, &eqo->napi, be_poll,
			       BE_NAPI_WEIGHT);
2147
		napi_hash_add(&eqo->napi);
2148
		aic = &adapter->aic_obj[i];
S
Sathya Perla 已提交
2149 2150 2151
		eqo->adapter = adapter;
		eqo->tx_budget = BE_TX_BUDGET;
		eqo->idx = i;
2152 2153
		aic->max_eqd = BE_MAX_EQD;
		aic->enable = true;
S
Sathya Perla 已提交
2154 2155 2156

		eq = &eqo->q;
		rc = be_queue_alloc(adapter, eq, EVNT_Q_LEN,
2157
				    sizeof(struct be_eq_entry));
S
Sathya Perla 已提交
2158 2159 2160
		if (rc)
			return rc;

S
Sathya Perla 已提交
2161
		rc = be_cmd_eq_create(adapter, eqo);
S
Sathya Perla 已提交
2162 2163 2164
		if (rc)
			return rc;
	}
2165
	return 0;
S
Sathya Perla 已提交
2166 2167
}

2168 2169 2170 2171
static void be_mcc_queues_destroy(struct be_adapter *adapter)
{
	struct be_queue_info *q;

2172
	q = &adapter->mcc_obj.q;
2173
	if (q->created)
2174
		be_cmd_q_destroy(adapter, q, QTYPE_MCCQ);
2175 2176
	be_queue_free(adapter, q);

2177
	q = &adapter->mcc_obj.cq;
2178
	if (q->created)
2179
		be_cmd_q_destroy(adapter, q, QTYPE_CQ);
2180 2181 2182 2183 2184 2185 2186 2187
	be_queue_free(adapter, q);
}

/* Must be called only after TX qs are created as MCC shares TX EQ */
static int be_mcc_queues_create(struct be_adapter *adapter)
{
	struct be_queue_info *q, *cq;

2188
	cq = &adapter->mcc_obj.cq;
2189
	if (be_queue_alloc(adapter, cq, MCC_CQ_LEN,
2190
			   sizeof(struct be_mcc_compl)))
2191 2192
		goto err;

S
Sathya Perla 已提交
2193 2194
	/* Use the default EQ for MCC completions */
	if (be_cmd_cq_create(adapter, cq, &mcc_eqo(adapter)->q, true, 0))
2195 2196
		goto mcc_cq_free;

2197
	q = &adapter->mcc_obj.q;
2198 2199 2200
	if (be_queue_alloc(adapter, q, MCC_Q_LEN, sizeof(struct be_mcc_wrb)))
		goto mcc_cq_destroy;

2201
	if (be_cmd_mccq_create(adapter, q, cq))
2202 2203 2204 2205 2206 2207 2208
		goto mcc_q_free;

	return 0;

mcc_q_free:
	be_queue_free(adapter, q);
mcc_cq_destroy:
2209
	be_cmd_q_destroy(adapter, cq, QTYPE_CQ);
2210 2211 2212 2213 2214 2215
mcc_cq_free:
	be_queue_free(adapter, cq);
err:
	return -1;
}

S
Sathya Perla 已提交
2216 2217 2218
static void be_tx_queues_destroy(struct be_adapter *adapter)
{
	struct be_queue_info *q;
2219 2220
	struct be_tx_obj *txo;
	u8 i;
S
Sathya Perla 已提交
2221

2222 2223 2224 2225 2226
	for_all_tx_queues(adapter, txo, i) {
		q = &txo->q;
		if (q->created)
			be_cmd_q_destroy(adapter, q, QTYPE_TXQ);
		be_queue_free(adapter, q);
S
Sathya Perla 已提交
2227

2228 2229 2230 2231 2232
		q = &txo->cq;
		if (q->created)
			be_cmd_q_destroy(adapter, q, QTYPE_CQ);
		be_queue_free(adapter, q);
	}
S
Sathya Perla 已提交
2233 2234
}

2235
static int be_tx_qs_create(struct be_adapter *adapter)
S
Sathya Perla 已提交
2236
{
S
Sathya Perla 已提交
2237
	struct be_queue_info *cq, *eq;
2238
	struct be_tx_obj *txo;
2239
	int status, i;
S
Sathya Perla 已提交
2240

2241
	adapter->num_tx_qs = min(adapter->num_evt_qs, be_max_txqs(adapter));
2242

S
Sathya Perla 已提交
2243 2244 2245 2246 2247 2248
	for_all_tx_queues(adapter, txo, i) {
		cq = &txo->cq;
		status = be_queue_alloc(adapter, cq, TX_CQ_LEN,
					sizeof(struct be_eth_tx_compl));
		if (status)
			return status;
2249

2250 2251 2252
		u64_stats_init(&txo->stats.sync);
		u64_stats_init(&txo->stats.sync_compl);

S
Sathya Perla 已提交
2253 2254 2255 2256 2257 2258 2259
		/* If num_evt_qs is less than num_tx_qs, then more than
		 * one txq share an eq
		 */
		eq = &adapter->eq_obj[i % adapter->num_evt_qs].q;
		status = be_cmd_cq_create(adapter, cq, eq, false, 3);
		if (status)
			return status;
S
Sathya Perla 已提交
2260

S
Sathya Perla 已提交
2261 2262 2263 2264
		status = be_queue_alloc(adapter, &txo->q, TX_Q_LEN,
					sizeof(struct be_eth_wrb));
		if (status)
			return status;
S
Sathya Perla 已提交
2265

V
Vasundhara Volam 已提交
2266
		status = be_cmd_txq_create(adapter, txo);
S
Sathya Perla 已提交
2267 2268
		if (status)
			return status;
2269
	}
S
Sathya Perla 已提交
2270

S
Sathya Perla 已提交
2271 2272
	dev_info(&adapter->pdev->dev, "created %d TX queue(s)\n",
		 adapter->num_tx_qs);
S
Sathya Perla 已提交
2273
	return 0;
S
Sathya Perla 已提交
2274 2275
}

S
Sathya Perla 已提交
2276
static void be_rx_cqs_destroy(struct be_adapter *adapter)
S
Sathya Perla 已提交
2277 2278
{
	struct be_queue_info *q;
2279 2280 2281 2282 2283 2284 2285 2286
	struct be_rx_obj *rxo;
	int i;

	for_all_rx_queues(adapter, rxo, i) {
		q = &rxo->cq;
		if (q->created)
			be_cmd_q_destroy(adapter, q, QTYPE_CQ);
		be_queue_free(adapter, q);
2287 2288 2289
	}
}

S
Sathya Perla 已提交
2290
static int be_rx_cqs_create(struct be_adapter *adapter)
S
Sathya Perla 已提交
2291
{
S
Sathya Perla 已提交
2292
	struct be_queue_info *eq, *cq;
2293 2294
	struct be_rx_obj *rxo;
	int rc, i;
S
Sathya Perla 已提交
2295

2296 2297 2298 2299 2300
	/* We can create as many RSS rings as there are EQs. */
	adapter->num_rx_qs = adapter->num_evt_qs;

	/* We'll use RSS only if atleast 2 RSS rings are supported.
	 * When RSS is used, we'll need a default RXQ for non-IP traffic.
S
Sathya Perla 已提交
2301
	 */
2302 2303 2304
	if (adapter->num_rx_qs > 1)
		adapter->num_rx_qs++;

S
Sathya Perla 已提交
2305
	adapter->big_page_size = (1 << get_order(rx_frag_size)) * PAGE_SIZE;
2306 2307 2308 2309
	for_all_rx_queues(adapter, rxo, i) {
		rxo->adapter = adapter;
		cq = &rxo->cq;
		rc = be_queue_alloc(adapter, cq, RX_CQ_LEN,
2310
				    sizeof(struct be_eth_rx_compl));
2311
		if (rc)
S
Sathya Perla 已提交
2312
			return rc;
2313

2314
		u64_stats_init(&rxo->stats.sync);
S
Sathya Perla 已提交
2315 2316
		eq = &adapter->eq_obj[i % adapter->num_evt_qs].q;
		rc = be_cmd_cq_create(adapter, cq, eq, false, 3);
2317
		if (rc)
S
Sathya Perla 已提交
2318
			return rc;
2319
	}
S
Sathya Perla 已提交
2320

S
Sathya Perla 已提交
2321 2322 2323
	dev_info(&adapter->pdev->dev,
		 "created %d RSS queue(s) and 1 default RX queue\n",
		 adapter->num_rx_qs - 1);
S
Sathya Perla 已提交
2324
	return 0;
2325 2326
}

S
Sathya Perla 已提交
2327 2328
static irqreturn_t be_intx(int irq, void *dev)
{
2329 2330 2331
	struct be_eq_obj *eqo = dev;
	struct be_adapter *adapter = eqo->adapter;
	int num_evts = 0;
S
Sathya Perla 已提交
2332

2333 2334 2335 2336 2337 2338 2339
	/* IRQ is not expected when NAPI is scheduled as the EQ
	 * will not be armed.
	 * But, this can happen on Lancer INTx where it takes
	 * a while to de-assert INTx or in BE2 where occasionaly
	 * an interrupt may be raised even when EQ is unarmed.
	 * If NAPI is already scheduled, then counting & notifying
	 * events will orphan them.
2340
	 */
2341
	if (napi_schedule_prep(&eqo->napi)) {
2342
		num_evts = events_get(eqo);
2343 2344 2345 2346 2347
		__napi_schedule(&eqo->napi);
		if (num_evts)
			eqo->spurious_intr = 0;
	}
	be_eq_notify(adapter, eqo->q.id, false, true, num_evts);
2348

2349 2350 2351
	/* Return IRQ_HANDLED only for the the first spurious intr
	 * after a valid intr to stop the kernel from branding
	 * this irq as a bad one!
2352
	 */
2353 2354 2355 2356
	if (num_evts || eqo->spurious_intr++ == 0)
		return IRQ_HANDLED;
	else
		return IRQ_NONE;
S
Sathya Perla 已提交
2357 2358
}

S
Sathya Perla 已提交
2359
static irqreturn_t be_msix(int irq, void *dev)
S
Sathya Perla 已提交
2360
{
S
Sathya Perla 已提交
2361
	struct be_eq_obj *eqo = dev;
S
Sathya Perla 已提交
2362

2363 2364
	be_eq_notify(eqo->adapter, eqo->q.id, false, true, 0);
	napi_schedule(&eqo->napi);
S
Sathya Perla 已提交
2365 2366 2367
	return IRQ_HANDLED;
}

2368
static inline bool do_gro(struct be_rx_compl_info *rxcp)
S
Sathya Perla 已提交
2369
{
2370
	return (rxcp->tcpf && !rxcp->err && rxcp->l4_csum) ? true : false;
S
Sathya Perla 已提交
2371 2372
}

S
Sathya Perla 已提交
2373
static int be_process_rx(struct be_rx_obj *rxo, struct napi_struct *napi,
2374
			 int budget, int polling)
S
Sathya Perla 已提交
2375
{
2376 2377
	struct be_adapter *adapter = rxo->adapter;
	struct be_queue_info *rx_cq = &rxo->cq;
2378
	struct be_rx_compl_info *rxcp;
S
Sathya Perla 已提交
2379 2380 2381
	u32 work_done;

	for (work_done = 0; work_done < budget; work_done++) {
2382
		rxcp = be_rx_compl_get(rxo);
S
Sathya Perla 已提交
2383 2384 2385
		if (!rxcp)
			break;

2386 2387 2388 2389 2390 2391
		/* Is it a flush compl that has no data */
		if (unlikely(rxcp->num_rcvd == 0))
			goto loop_continue;

		/* Discard compl with partial DMA Lancer B0 */
		if (unlikely(!rxcp->pkt_size)) {
S
Sathya Perla 已提交
2392
			be_rx_compl_discard(rxo, rxcp);
2393 2394 2395 2396 2397 2398 2399
			goto loop_continue;
		}

		/* On BE drop pkts that arrive due to imperfect filtering in
		 * promiscuous mode on some skews
		 */
		if (unlikely(rxcp->port != adapter->port_num &&
2400
			     !lancer_chip(adapter))) {
S
Sathya Perla 已提交
2401
			be_rx_compl_discard(rxo, rxcp);
2402
			goto loop_continue;
2403
		}
2404

2405 2406
		/* Don't do gro when we're busy_polling */
		if (do_gro(rxcp) && polling != BUSY_POLLING)
S
Sathya Perla 已提交
2407
			be_rx_compl_process_gro(rxo, napi, rxcp);
2408
		else
2409 2410
			be_rx_compl_process(rxo, napi, rxcp);

2411
loop_continue:
2412
		be_rx_stats_update(rxo, rxcp);
S
Sathya Perla 已提交
2413 2414
	}

S
Sathya Perla 已提交
2415 2416
	if (work_done) {
		be_cq_notify(adapter, rx_cq->id, true, work_done);
2417

2418 2419 2420 2421 2422
		/* When an rx-obj gets into post_starved state, just
		 * let be_worker do the posting.
		 */
		if (atomic_read(&rxo->q.used) < RX_FRAGS_REFILL_WM &&
		    !rxo->rx_post_starved)
S
Sathya Perla 已提交
2423
			be_post_rx_frags(rxo, GFP_ATOMIC);
S
Sathya Perla 已提交
2424
	}
S
Sathya Perla 已提交
2425

S
Sathya Perla 已提交
2426 2427 2428
	return work_done;
}

S
Sathya Perla 已提交
2429 2430
static bool be_process_tx(struct be_adapter *adapter, struct be_tx_obj *txo,
			  int budget, int idx)
S
Sathya Perla 已提交
2431 2432
{
	struct be_eth_tx_compl *txcp;
S
Sathya Perla 已提交
2433
	int num_wrbs = 0, work_done;
2434

S
Sathya Perla 已提交
2435 2436 2437 2438 2439
	for (work_done = 0; work_done < budget; work_done++) {
		txcp = be_tx_compl_get(&txo->cq);
		if (!txcp)
			break;
		num_wrbs += be_tx_compl_process(adapter, txo,
2440 2441 2442
						AMAP_GET_BITS(struct
							      amap_eth_tx_compl,
							      wrb_index, txcp));
S
Sathya Perla 已提交
2443
	}
S
Sathya Perla 已提交
2444

S
Sathya Perla 已提交
2445 2446 2447
	if (work_done) {
		be_cq_notify(adapter, txo->cq.id, true, work_done);
		atomic_sub(num_wrbs, &txo->q.used);
2448

S
Sathya Perla 已提交
2449 2450 2451
		/* As Tx wrbs have been freed up, wake up netdev queue
		 * if it was stopped due to lack of tx wrbs.  */
		if (__netif_subqueue_stopped(adapter->netdev, idx) &&
2452
		    atomic_read(&txo->q.used) < txo->q.len / 2) {
S
Sathya Perla 已提交
2453
			netif_wake_subqueue(adapter->netdev, idx);
2454
		}
S
Sathya Perla 已提交
2455 2456 2457 2458

		u64_stats_update_begin(&tx_stats(txo)->sync_compl);
		tx_stats(txo)->tx_compl += work_done;
		u64_stats_update_end(&tx_stats(txo)->sync_compl);
S
Sathya Perla 已提交
2459
	}
S
Sathya Perla 已提交
2460 2461
	return (work_done < budget); /* Done */
}
S
Sathya Perla 已提交
2462

2463
int be_poll(struct napi_struct *napi, int budget)
S
Sathya Perla 已提交
2464 2465 2466
{
	struct be_eq_obj *eqo = container_of(napi, struct be_eq_obj, napi);
	struct be_adapter *adapter = eqo->adapter;
2467
	int max_work = 0, work, i, num_evts;
2468
	struct be_rx_obj *rxo;
S
Sathya Perla 已提交
2469
	bool tx_done;
S
Sathya Perla 已提交
2470

2471 2472
	num_evts = events_get(eqo);

S
Sathya Perla 已提交
2473 2474 2475 2476 2477 2478
	/* Process all TXQs serviced by this EQ */
	for (i = eqo->idx; i < adapter->num_tx_qs; i += adapter->num_evt_qs) {
		tx_done = be_process_tx(adapter, &adapter->tx_obj[i],
					eqo->tx_budget, i);
		if (!tx_done)
			max_work = budget;
S
Sathya Perla 已提交
2479 2480
	}

2481 2482 2483 2484 2485 2486 2487 2488 2489 2490 2491 2492
	if (be_lock_napi(eqo)) {
		/* This loop will iterate twice for EQ0 in which
		 * completions of the last RXQ (default one) are also processed
		 * For other EQs the loop iterates only once
		 */
		for_all_rx_queues_on_eq(adapter, eqo, rxo, i) {
			work = be_process_rx(rxo, napi, budget, NAPI_POLLING);
			max_work = max(work, max_work);
		}
		be_unlock_napi(eqo);
	} else {
		max_work = budget;
S
Sathya Perla 已提交
2493
	}
S
Sathya Perla 已提交
2494

S
Sathya Perla 已提交
2495 2496
	if (is_mcc_eqo(eqo))
		be_process_mcc(adapter);
2497

S
Sathya Perla 已提交
2498 2499
	if (max_work < budget) {
		napi_complete(napi);
2500
		be_eq_notify(adapter, eqo->q.id, true, false, num_evts);
S
Sathya Perla 已提交
2501 2502
	} else {
		/* As we'll continue in polling mode, count and clear events */
2503
		be_eq_notify(adapter, eqo->q.id, false, false, num_evts);
2504
	}
S
Sathya Perla 已提交
2505
	return max_work;
S
Sathya Perla 已提交
2506 2507
}

2508 2509 2510 2511 2512 2513 2514 2515 2516 2517 2518 2519 2520 2521 2522 2523 2524 2525 2526 2527 2528 2529
#ifdef CONFIG_NET_RX_BUSY_POLL
/* Busy-poll handler: processes up to 4 RX completions on the first RX queue
 * of this EQ that has any, and returns that count. Returns LL_FLUSH_BUSY
 * when the busy-poll lock cannot be taken.
 */
static int be_busy_poll(struct napi_struct *napi)
{
	struct be_eq_obj *eqo = container_of(napi, struct be_eq_obj, napi);
	struct be_adapter *adapter = eqo->adapter;
	struct be_rx_obj *rxo;
	int i, rx_done = 0;

	if (!be_lock_busy_poll(eqo))
		return LL_FLUSH_BUSY;

	for_all_rx_queues_on_eq(adapter, eqo, rxo, i) {
		rx_done = be_process_rx(rxo, napi, 4, BUSY_POLLING);
		if (rx_done != 0)
			break;
	}

	be_unlock_busy_poll(eqo);
	return rx_done;
}
#endif

2530
void be_detect_error(struct be_adapter *adapter)
2531
{
2532 2533
	u32 ue_lo = 0, ue_hi = 0, ue_lo_mask = 0, ue_hi_mask = 0;
	u32 sliport_status = 0, sliport_err1 = 0, sliport_err2 = 0;
2534
	u32 i;
2535 2536 2537
	bool error_detected = false;
	struct device *dev = &adapter->pdev->dev;
	struct net_device *netdev = adapter->netdev;
2538

2539
	if (be_hw_error(adapter))
2540 2541
		return;

2542 2543 2544 2545
	if (lancer_chip(adapter)) {
		sliport_status = ioread32(adapter->db + SLIPORT_STATUS_OFFSET);
		if (sliport_status & SLIPORT_STATUS_ERR_MASK) {
			sliport_err1 = ioread32(adapter->db +
2546
						SLIPORT_ERROR1_OFFSET);
2547
			sliport_err2 = ioread32(adapter->db +
2548
						SLIPORT_ERROR2_OFFSET);
2549 2550 2551 2552 2553 2554 2555 2556 2557 2558 2559 2560 2561 2562 2563
			adapter->hw_error = true;
			/* Do not log error messages if its a FW reset */
			if (sliport_err1 == SLIPORT_ERROR_FW_RESET1 &&
			    sliport_err2 == SLIPORT_ERROR_FW_RESET2) {
				dev_info(dev, "Firmware update in progress\n");
			} else {
				error_detected = true;
				dev_err(dev, "Error detected in the card\n");
				dev_err(dev, "ERR: sliport status 0x%x\n",
					sliport_status);
				dev_err(dev, "ERR: sliport error1 0x%x\n",
					sliport_err1);
				dev_err(dev, "ERR: sliport error2 0x%x\n",
					sliport_err2);
			}
2564 2565 2566
		}
	} else {
		pci_read_config_dword(adapter->pdev,
2567
				      PCICFG_UE_STATUS_LOW, &ue_lo);
2568
		pci_read_config_dword(adapter->pdev,
2569
				      PCICFG_UE_STATUS_HIGH, &ue_hi);
2570
		pci_read_config_dword(adapter->pdev,
2571
				      PCICFG_UE_STATUS_LOW_MASK, &ue_lo_mask);
2572
		pci_read_config_dword(adapter->pdev,
2573
				      PCICFG_UE_STATUS_HI_MASK, &ue_hi_mask);
2574

2575 2576
		ue_lo = (ue_lo & ~ue_lo_mask);
		ue_hi = (ue_hi & ~ue_hi_mask);
2577

2578 2579 2580 2581
		/* On certain platforms BE hardware can indicate spurious UEs.
		 * Allow HW to stop working completely in case of a real UE.
		 * Hence not setting the hw_error for UE detection.
		 */
2582

2583 2584 2585 2586 2587 2588 2589 2590 2591 2592 2593 2594 2595 2596 2597 2598 2599
		if (ue_lo || ue_hi) {
			error_detected = true;
			dev_err(dev,
				"Unrecoverable Error detected in the adapter");
			dev_err(dev, "Please reboot server to recover");
			if (skyhawk_chip(adapter))
				adapter->hw_error = true;
			for (i = 0; ue_lo; ue_lo >>= 1, i++) {
				if (ue_lo & 1)
					dev_err(dev, "UE: %s bit set\n",
						ue_status_low_desc[i]);
			}
			for (i = 0; ue_hi; ue_hi >>= 1, i++) {
				if (ue_hi & 1)
					dev_err(dev, "UE: %s bit set\n",
						ue_status_hi_desc[i]);
			}
2600 2601
		}
	}
2602 2603
	if (error_detected)
		netif_carrier_off(netdev);
2604 2605
}

2606 2607
static void be_msix_disable(struct be_adapter *adapter)
{
2608
	if (msix_enabled(adapter)) {
2609
		pci_disable_msix(adapter->pdev);
2610
		adapter->num_msix_vec = 0;
2611
		adapter->num_msix_roce_vec = 0;
2612 2613 2614
	}
}

2615
static int be_msix_enable(struct be_adapter *adapter)
S
Sathya Perla 已提交
2616
{
2617
	int i, num_vec;
S
Sathya Perla 已提交
2618
	struct device *dev = &adapter->pdev->dev;
S
Sathya Perla 已提交
2619

2620 2621 2622 2623 2624 2625 2626 2627 2628
	/* If RoCE is supported, program the max number of NIC vectors that
	 * may be configured via set-channels, along with vectors needed for
	 * RoCe. Else, just program the number we'll use initially.
	 */
	if (be_roce_supported(adapter))
		num_vec = min_t(int, 2 * be_max_eqs(adapter),
				2 * num_online_cpus());
	else
		num_vec = adapter->cfg_num_qs;
2629

2630
	for (i = 0; i < num_vec; i++)
S
Sathya Perla 已提交
2631 2632
		adapter->msix_entries[i].entry = i;

2633 2634 2635 2636
	num_vec = pci_enable_msix_range(adapter->pdev, adapter->msix_entries,
					MIN_MSIX_VECTORS, num_vec);
	if (num_vec < 0)
		goto fail;
2637 2638 2639 2640 2641 2642 2643 2644 2645 2646 2647

	if (be_roce_supported(adapter) && num_vec > MIN_MSIX_VECTORS) {
		adapter->num_msix_roce_vec = num_vec / 2;
		dev_info(dev, "enabled %d MSI-x vector(s) for RoCE\n",
			 adapter->num_msix_roce_vec);
	}

	adapter->num_msix_vec = num_vec - adapter->num_msix_roce_vec;

	dev_info(dev, "enabled %d MSI-x vector(s) for NIC\n",
		 adapter->num_msix_vec);
2648
	return 0;
2649 2650 2651 2652 2653 2654 2655 2656

fail:
	dev_warn(dev, "MSIx enable failed\n");

	/* INTx is not supported in VFs, so fail probe if enable_msix fails */
	if (!be_physfn(adapter))
		return num_vec;
	return 0;
S
Sathya Perla 已提交
2657 2658
}

2659
static inline int be_msix_vec_get(struct be_adapter *adapter,
2660
				  struct be_eq_obj *eqo)
2661
{
S
Sathya Perla 已提交
2662
	return adapter->msix_entries[eqo->msix_idx].vector;
2663
}
S
Sathya Perla 已提交
2664

2665 2666
static int be_msix_register(struct be_adapter *adapter)
{
S
Sathya Perla 已提交
2667 2668 2669
	struct net_device *netdev = adapter->netdev;
	struct be_eq_obj *eqo;
	int status, i, vec;
S
Sathya Perla 已提交
2670

S
Sathya Perla 已提交
2671 2672 2673 2674
	for_all_evt_queues(adapter, eqo, i) {
		sprintf(eqo->desc, "%s-q%d", netdev->name, i);
		vec = be_msix_vec_get(adapter, eqo);
		status = request_irq(vec, be_msix, 0, eqo->desc, eqo);
2675 2676 2677
		if (status)
			goto err_msix;
	}
2678

S
Sathya Perla 已提交
2679
	return 0;
2680
err_msix:
S
Sathya Perla 已提交
2681 2682 2683
	for (i--, eqo = &adapter->eq_obj[i]; i >= 0; i--, eqo--)
		free_irq(be_msix_vec_get(adapter, eqo), eqo);
	dev_warn(&adapter->pdev->dev, "MSIX Request IRQ failed - err %d\n",
2684
		 status);
2685
	be_msix_disable(adapter);
S
Sathya Perla 已提交
2686 2687 2688 2689 2690 2691 2692 2693
	return status;
}

/*
 * Register the adapter's interrupt handler(s).
 *
 * MSI-x is tried first when it is enabled.  If that fails on a physical
 * function the code falls back to a single shared INTx line serviced
 * through the first EQ; on other functions the MSI-x error is returned.
 * adapter->isr_registered is set once a handler is in place.
 */
static int be_irq_register(struct be_adapter *adapter)
{
	struct net_device *netdev = adapter->netdev;
	int rc;

	if (msix_enabled(adapter)) {
		rc = be_msix_register(adapter);
		if (!rc) {
			adapter->isr_registered = true;
			return 0;
		}

		/* INTx is not supported for VF */
		if (!be_physfn(adapter))
			return rc;
	}

	/* INTx: only the first EQ is used */
	netdev->irq = adapter->pdev->irq;
	rc = request_irq(netdev->irq, be_intx, IRQF_SHARED, netdev->name,
			 &adapter->eq_obj[0]);
	if (rc) {
		dev_err(&adapter->pdev->dev,
			"INTx request IRQ failed - err %d\n", rc);
		return rc;
	}

	adapter->isr_registered = true;
	return 0;
}

static void be_irq_unregister(struct be_adapter *adapter)
{
	struct net_device *netdev = adapter->netdev;
S
Sathya Perla 已提交
2720
	struct be_eq_obj *eqo;
2721
	int i;
S
Sathya Perla 已提交
2722 2723 2724 2725 2726

	if (!adapter->isr_registered)
		return;

	/* INTx */
2727
	if (!msix_enabled(adapter)) {
2728
		free_irq(netdev->irq, &adapter->eq_obj[0]);
S
Sathya Perla 已提交
2729 2730 2731 2732
		goto done;
	}

	/* MSIx */
S
Sathya Perla 已提交
2733 2734
	for_all_evt_queues(adapter, eqo, i)
		free_irq(be_msix_vec_get(adapter, eqo), eqo);
2735

S
Sathya Perla 已提交
2736 2737 2738 2739
done:
	adapter->isr_registered = false;
}

S
Sathya Perla 已提交
2740
static void be_rx_qs_destroy(struct be_adapter *adapter)
2741 2742 2743 2744 2745 2746 2747 2748 2749
{
	struct be_queue_info *q;
	struct be_rx_obj *rxo;
	int i;

	for_all_rx_queues(adapter, rxo, i) {
		q = &rxo->q;
		if (q->created) {
			be_cmd_rxq_destroy(adapter, q);
S
Sathya Perla 已提交
2750
			be_rx_cq_clean(rxo);
2751
		}
S
Sathya Perla 已提交
2752
		be_queue_free(adapter, q);
2753 2754 2755
	}
}

2756 2757 2758
static int be_close(struct net_device *netdev)
{
	struct be_adapter *adapter = netdev_priv(netdev);
S
Sathya Perla 已提交
2759 2760
	struct be_eq_obj *eqo;
	int i;
2761

2762 2763 2764 2765 2766 2767
	/* This protection is needed as be_close() may be called even when the
	 * adapter is in cleared state (after eeh perm failure)
	 */
	if (!(adapter->flags & BE_FLAGS_SETUP_DONE))
		return 0;

2768 2769
	be_roce_dev_close(adapter);

2770 2771
	if (adapter->flags & BE_FLAGS_NAPI_ENABLED) {
		for_all_evt_queues(adapter, eqo, i) {
2772
			napi_disable(&eqo->napi);
2773 2774
			be_disable_busy_poll(eqo);
		}
2775
		adapter->flags &= ~BE_FLAGS_NAPI_ENABLED;
2776
	}
2777 2778 2779 2780 2781 2782

	be_async_mcc_disable(adapter);

	/* Wait for all pending tx completions to arrive so that
	 * all tx skbs are freed.
	 */
S
Sathya Perla 已提交
2783
	netif_tx_disable(netdev);
2784
	be_tx_compl_clean(adapter);
2785 2786 2787

	be_rx_qs_destroy(adapter);

2788 2789 2790 2791 2792
	for (i = 1; i < (adapter->uc_macs + 1); i++)
		be_cmd_pmac_del(adapter, adapter->if_handle,
				adapter->pmac_id[i], 0);
	adapter->uc_macs = 0;

2793
	for_all_evt_queues(adapter, eqo, i) {
S
Sathya Perla 已提交
2794 2795 2796 2797 2798
		if (msix_enabled(adapter))
			synchronize_irq(be_msix_vec_get(adapter, eqo));
		else
			synchronize_irq(netdev->irq);
		be_eq_clean(eqo);
2799 2800
	}

2801 2802
	be_irq_unregister(adapter);

2803 2804 2805
	return 0;
}

S
Sathya Perla 已提交
2806
static int be_rx_qs_create(struct be_adapter *adapter)
2807 2808
{
	struct be_rx_obj *rxo;
2809
	int rc, i, j;
2810 2811
	u8 rss_hkey[RSS_HASH_KEY_LEN];
	struct rss_info *rss = &adapter->rss_info;
2812 2813

	for_all_rx_queues(adapter, rxo, i) {
S
Sathya Perla 已提交
2814 2815 2816 2817 2818 2819 2820 2821 2822 2823 2824 2825 2826 2827
		rc = be_queue_alloc(adapter, &rxo->q, RX_Q_LEN,
				    sizeof(struct be_eth_rx_d));
		if (rc)
			return rc;
	}

	/* The FW would like the default RXQ to be created first */
	rxo = default_rxo(adapter);
	rc = be_cmd_rxq_create(adapter, &rxo->q, rxo->cq.id, rx_frag_size,
			       adapter->if_handle, false, &rxo->rss_id);
	if (rc)
		return rc;

	for_all_rss_queues(adapter, rxo, i) {
2828
		rc = be_cmd_rxq_create(adapter, &rxo->q, rxo->cq.id,
S
Sathya Perla 已提交
2829 2830
				       rx_frag_size, adapter->if_handle,
				       true, &rxo->rss_id);
2831 2832 2833 2834 2835
		if (rc)
			return rc;
	}

	if (be_multi_rxq(adapter)) {
2836 2837
		for (j = 0; j < RSS_INDIR_TABLE_LEN;
			j += adapter->num_rx_qs - 1) {
2838
			for_all_rss_queues(adapter, rxo, i) {
2839
				if ((j + i) >= RSS_INDIR_TABLE_LEN)
2840
					break;
2841 2842
				rss->rsstable[j + i] = rxo->rss_id;
				rss->rss_queue[j + i] = i;
2843 2844
			}
		}
2845 2846
		rss->rss_flags = RSS_ENABLE_TCP_IPV4 | RSS_ENABLE_IPV4 |
			RSS_ENABLE_TCP_IPV6 | RSS_ENABLE_IPV6;
2847 2848

		if (!BEx_chip(adapter))
2849 2850
			rss->rss_flags |= RSS_ENABLE_UDP_IPV4 |
				RSS_ENABLE_UDP_IPV6;
2851 2852
	} else {
		/* Disable RSS, if only default RX Q is created */
2853
		rss->rss_flags = RSS_ENABLE_NONE;
2854
	}
2855

2856
	get_random_bytes(rss_hkey, RSS_HASH_KEY_LEN);
2857
	rc = be_cmd_rss_config(adapter, rss->rsstable, rss->rss_flags,
2858
			       128, rss_hkey);
2859
	if (rc) {
2860
		rss->rss_flags = RSS_ENABLE_NONE;
2861
		return rc;
2862 2863
	}

2864 2865
	memcpy(rss->rss_hkey, rss_hkey, RSS_HASH_KEY_LEN);

2866
	/* First time posting */
S
Sathya Perla 已提交
2867
	for_all_rx_queues(adapter, rxo, i)
2868
		be_post_rx_frags(rxo, GFP_KERNEL);
2869 2870 2871
	return 0;
}

S
Sathya Perla 已提交
2872 2873 2874
static int be_open(struct net_device *netdev)
{
	struct be_adapter *adapter = netdev_priv(netdev);
S
Sathya Perla 已提交
2875
	struct be_eq_obj *eqo;
2876
	struct be_rx_obj *rxo;
S
Sathya Perla 已提交
2877
	struct be_tx_obj *txo;
2878
	u8 link_status;
2879
	int status, i;
2880

S
Sathya Perla 已提交
2881
	status = be_rx_qs_create(adapter);
2882 2883 2884
	if (status)
		goto err;

2885 2886 2887
	status = be_irq_register(adapter);
	if (status)
		goto err;
2888

S
Sathya Perla 已提交
2889
	for_all_rx_queues(adapter, rxo, i)
2890
		be_cq_notify(adapter, rxo->cq.id, true, 0);
2891

S
Sathya Perla 已提交
2892 2893 2894
	for_all_tx_queues(adapter, txo, i)
		be_cq_notify(adapter, txo->cq.id, true, 0);

2895 2896
	be_async_mcc_enable(adapter);

S
Sathya Perla 已提交
2897 2898
	for_all_evt_queues(adapter, eqo, i) {
		napi_enable(&eqo->napi);
2899
		be_enable_busy_poll(eqo);
2900
		be_eq_notify(adapter, eqo->q.id, true, true, 0);
S
Sathya Perla 已提交
2901
	}
2902
	adapter->flags |= BE_FLAGS_NAPI_ENABLED;
S
Sathya Perla 已提交
2903

2904
	status = be_cmd_link_status_query(adapter, NULL, &link_status, 0);
2905 2906 2907
	if (!status)
		be_link_status_update(adapter, link_status);

S
Sathya Perla 已提交
2908
	netif_tx_start_all_queues(netdev);
2909
	be_roce_dev_open(adapter);
2910

2911
#ifdef CONFIG_BE2NET_VXLAN
2912 2913
	if (skyhawk_chip(adapter))
		vxlan_get_rx_port(netdev);
2914 2915
#endif

2916 2917 2918 2919
	return 0;
err:
	be_close(adapter->netdev);
	return -EIO;
2920 2921
}

2922 2923 2924 2925 2926 2927 2928 2929 2930
/*
 * Enable or disable magic-packet Wake-on-LAN.
 *
 * A DMA buffer is allocated for the FW command and freed again before
 * returning.  When enabling, the PM control register is written first and
 * the netdev's current MAC is programmed; when disabling, an all-zero MAC
 * is programmed.  PCI wake from D3hot/D3cold is switched accordingly.
 *
 * Returns -ENOMEM if the buffer cannot be allocated, the config-space write
 * error if that fails, otherwise the status of the FW command.
 */
static int be_setup_wol(struct be_adapter *adapter, bool enable)
{
	struct device *dev = &adapter->pdev->dev;
	u8 zero_mac[ETH_ALEN] = {0};
	struct be_dma_mem cmd;
	int status;

	cmd.size = sizeof(struct be_cmd_req_acpi_wol_magic_config);
	cmd.va = dma_zalloc_coherent(dev, cmd.size, &cmd.dma, GFP_KERNEL);
	if (!cmd.va)
		return -ENOMEM;

	if (!enable) {
		status = be_cmd_enable_magic_wol(adapter, zero_mac, &cmd);
		pci_enable_wake(adapter->pdev, PCI_D3hot, 0);
		pci_enable_wake(adapter->pdev, PCI_D3cold, 0);
		goto free_cmd;
	}

	status = pci_write_config_dword(adapter->pdev,
					PCICFG_PM_CONTROL_OFFSET,
					PCICFG_PM_CONTROL_MASK);
	if (status) {
		dev_err(dev, "Could not enable Wake-on-lan\n");
		goto free_cmd;
	}

	status = be_cmd_enable_magic_wol(adapter, adapter->netdev->dev_addr,
					 &cmd);
	pci_enable_wake(adapter->pdev, PCI_D3hot, 1);
	pci_enable_wake(adapter->pdev, PCI_D3cold, 1);

free_cmd:
	dma_free_coherent(dev, cmd.size, cmd.va, cmd.dma);
	return status;
}

2962 2963 2964 2965 2966 2967
/*
 * Generate a seed MAC address from the PF MAC Address using jhash.
 * MAC Address for VFs are assigned incrementally starting from the seed.
 * These addresses are programmed in the ASIC by the PF and the VF driver
 * queries for the MAC address during its probe.
 */
2968
static int be_vf_eth_addr_config(struct be_adapter *adapter)
2969
{
2970
	u32 vf;
2971
	int status = 0;
2972
	u8 mac[ETH_ALEN];
2973
	struct be_vf_cfg *vf_cfg;
2974 2975 2976

	be_vf_eth_addr_generate(adapter, mac);

2977
	for_all_vfs(adapter, vf_cfg, vf) {
2978
		if (BEx_chip(adapter))
2979
			status = be_cmd_pmac_add(adapter, mac,
2980 2981
						 vf_cfg->if_handle,
						 &vf_cfg->pmac_id, vf + 1);
2982 2983 2984
		else
			status = be_cmd_set_mac(adapter, mac, vf_cfg->if_handle,
						vf + 1);
2985

2986 2987
		if (status)
			dev_err(&adapter->pdev->dev,
2988 2989
				"Mac address assignment failed for VF %d\n",
				vf);
2990
		else
2991
			memcpy(vf_cfg->mac_addr, mac, ETH_ALEN);
2992 2993 2994 2995 2996 2997

		mac[5] += 1;
	}
	return status;
}

2998 2999 3000 3001 3002 3003 3004
/*
 * Read the currently active MAC address of every VF from the FW and cache
 * it in the VF's config entry.  Stops at, and returns, the first error.
 */
static int be_vfs_mac_query(struct be_adapter *adapter)
{
	struct be_vf_cfg *vf_cfg;
	u8 active_mac[ETH_ALEN];
	int vf, rc;

	for_all_vfs(adapter, vf_cfg, vf) {
		rc = be_cmd_get_active_mac(adapter, vf_cfg->pmac_id,
					   active_mac, vf_cfg->if_handle,
					   false, vf+1);
		if (rc)
			return rc;

		/* The cached address is only replaced after a successful query */
		memcpy(vf_cfg->mac_addr, active_mac, ETH_ALEN);
	}

	return 0;
}

3015
static void be_vf_clear(struct be_adapter *adapter)
3016
{
3017
	struct be_vf_cfg *vf_cfg;
3018 3019
	u32 vf;

3020
	if (pci_vfs_assigned(adapter->pdev)) {
3021 3022
		dev_warn(&adapter->pdev->dev,
			 "VFs are assigned to VMs: not disabling VFs\n");
3023 3024 3025
		goto done;
	}

3026 3027
	pci_disable_sriov(adapter->pdev);

3028
	for_all_vfs(adapter, vf_cfg, vf) {
3029
		if (BEx_chip(adapter))
3030 3031
			be_cmd_pmac_del(adapter, vf_cfg->if_handle,
					vf_cfg->pmac_id, vf + 1);
3032 3033 3034
		else
			be_cmd_set_mac(adapter, NULL, vf_cfg->if_handle,
				       vf + 1);
3035

3036 3037
		be_cmd_if_destroy(adapter, vf_cfg->if_handle, vf + 1);
	}
3038 3039 3040
done:
	kfree(adapter->vf_cfg);
	adapter->num_vfs = 0;
3041 3042
}

3043 3044 3045 3046 3047 3048 3049 3050
/*
 * Destroy the adapter's queues by calling, in this order, the destroy
 * routines for the MCC queues, the RX completion queues, the TX queues and
 * the event queues.
 */
static void be_clear_queues(struct be_adapter *adapter)
{
	be_mcc_queues_destroy(adapter);
	be_rx_cqs_destroy(adapter);
	be_tx_queues_destroy(adapter);
	be_evt_queues_destroy(adapter);
}

3051
static void be_cancel_worker(struct be_adapter *adapter)
3052
{
3053 3054 3055 3056
	if (adapter->flags & BE_FLAGS_WORKER_SCHEDULED) {
		cancel_delayed_work_sync(&adapter->work);
		adapter->flags &= ~BE_FLAGS_WORKER_SCHEDULED;
	}
3057 3058
}

3059
static void be_mac_clear(struct be_adapter *adapter)
3060 3061 3062
{
	int i;

3063 3064 3065 3066 3067 3068 3069 3070 3071 3072 3073
	if (adapter->pmac_id) {
		for (i = 0; i < (adapter->uc_macs + 1); i++)
			be_cmd_pmac_del(adapter, adapter->if_handle,
					adapter->pmac_id[i], 0);
		adapter->uc_macs = 0;

		kfree(adapter->pmac_id);
		adapter->pmac_id = NULL;
	}
}

3074
#ifdef CONFIG_BE2NET_VXLAN
3075 3076 3077 3078 3079 3080 3081 3082 3083 3084 3085 3086
/*
 * Turn VXLAN offloads off.
 *
 * If the offloads flag is set, the interface is converted back with
 * OP_CONVERT_TUNNEL_TO_NORMAL; if a VXLAN port is recorded, the port is
 * set to 0 in the FW.  The flag and the recorded port are then cleared
 * unconditionally.  Return values of the FW commands are not checked.
 */
static void be_disable_vxlan_offloads(struct be_adapter *adapter)
{
	if (adapter->flags & BE_FLAGS_VXLAN_OFFLOADS)
		be_cmd_manage_iface(adapter, adapter->if_handle,
				    OP_CONVERT_TUNNEL_TO_NORMAL);

	if (adapter->vxlan_port)
		be_cmd_set_vxlan_port(adapter, 0);

	adapter->flags &= ~BE_FLAGS_VXLAN_OFFLOADS;
	adapter->vxlan_port = 0;
}
3087
#endif
3088

3089 3090
static int be_clear(struct be_adapter *adapter)
{
3091
	be_cancel_worker(adapter);
3092

3093
	if (sriov_enabled(adapter))
3094 3095
		be_vf_clear(adapter);

3096 3097 3098 3099 3100 3101 3102
	/* Re-configure FW to distribute resources evenly across max-supported
	 * number of VFs, only when VFs are not already enabled.
	 */
	if (be_physfn(adapter) && !pci_vfs_assigned(adapter->pdev))
		be_cmd_set_sriov_config(adapter, adapter->pool_res,
					pci_sriov_get_totalvfs(adapter->pdev));

3103
#ifdef CONFIG_BE2NET_VXLAN
3104
	be_disable_vxlan_offloads(adapter);
3105
#endif
3106
	/* delete the primary mac along with the uc-mac list */
3107
	be_mac_clear(adapter);
3108

3109
	be_cmd_if_destroy(adapter, adapter->if_handle,  0);
3110

3111
	be_clear_queues(adapter);
3112

S
Sathya Perla 已提交
3113
	be_msix_disable(adapter);
3114
	adapter->flags &= ~BE_FLAGS_SETUP_DONE;
3115 3116 3117
	return 0;
}

3118
static int be_vfs_if_create(struct be_adapter *adapter)
3119
{
3120
	struct be_resources res = {0};
3121 3122
	struct be_vf_cfg *vf_cfg;
	u32 cap_flags, en_flags, vf;
3123
	int status = 0;
3124

3125 3126
	cap_flags = BE_IF_FLAGS_UNTAGGED | BE_IF_FLAGS_BROADCAST |
		    BE_IF_FLAGS_MULTICAST;
3127

3128
	for_all_vfs(adapter, vf_cfg, vf) {
3129 3130 3131 3132 3133 3134
		if (!BE3_chip(adapter)) {
			status = be_cmd_get_profile_config(adapter, &res,
							   vf + 1);
			if (!status)
				cap_flags = res.if_cap_flags;
		}
3135 3136 3137

		/* If a FW profile exists, then cap_flags are updated */
		en_flags = cap_flags & (BE_IF_FLAGS_UNTAGGED |
3138 3139 3140 3141 3142
					BE_IF_FLAGS_BROADCAST |
					BE_IF_FLAGS_MULTICAST);
		status =
		    be_cmd_if_create(adapter, cap_flags, en_flags,
				     &vf_cfg->if_handle, vf + 1);
3143 3144 3145 3146 3147
		if (status)
			goto err;
	}
err:
	return status;
3148 3149
}

3150
static int be_vf_setup_init(struct be_adapter *adapter)
3151
{
3152
	struct be_vf_cfg *vf_cfg;
3153 3154
	int vf;

3155 3156 3157 3158 3159
	adapter->vf_cfg = kcalloc(adapter->num_vfs, sizeof(*vf_cfg),
				  GFP_KERNEL);
	if (!adapter->vf_cfg)
		return -ENOMEM;

3160 3161 3162
	for_all_vfs(adapter, vf_cfg, vf) {
		vf_cfg->if_handle = -1;
		vf_cfg->pmac_id = -1;
3163
	}
3164
	return 0;
3165 3166
}

3167 3168
static int be_vf_setup(struct be_adapter *adapter)
{
3169
	struct device *dev = &adapter->pdev->dev;
3170
	struct be_vf_cfg *vf_cfg;
3171
	int status, old_vfs, vf;
3172
	u32 privileges;
3173

3174
	old_vfs = pci_num_vf(adapter->pdev);
3175 3176 3177 3178

	status = be_vf_setup_init(adapter);
	if (status)
		goto err;
3179

3180 3181 3182 3183 3184 3185
	if (old_vfs) {
		for_all_vfs(adapter, vf_cfg, vf) {
			status = be_cmd_get_if_id(adapter, vf_cfg, vf);
			if (status)
				goto err;
		}
3186

3187 3188 3189 3190
		status = be_vfs_mac_query(adapter);
		if (status)
			goto err;
	} else {
3191 3192 3193 3194
		status = be_vfs_if_create(adapter);
		if (status)
			goto err;

3195 3196 3197 3198
		status = be_vf_eth_addr_config(adapter);
		if (status)
			goto err;
	}
3199

3200
	for_all_vfs(adapter, vf_cfg, vf) {
3201 3202 3203 3204 3205 3206 3207 3208 3209 3210 3211 3212
		/* Allow VFs to programs MAC/VLAN filters */
		status = be_cmd_get_fn_privileges(adapter, &privileges, vf + 1);
		if (!status && !(privileges & BE_PRIV_FILTMGMT)) {
			status = be_cmd_set_fn_privileges(adapter,
							  privileges |
							  BE_PRIV_FILTMGMT,
							  vf + 1);
			if (!status)
				dev_info(dev, "VF%d has FILTMGMT privilege\n",
					 vf);
		}

3213 3214 3215
		/* Allow full available bandwidth */
		if (!old_vfs)
			be_cmd_config_qos(adapter, 0, 0, vf + 1);
3216

3217
		if (!old_vfs) {
3218
			be_cmd_enable_vf(adapter, vf + 1);
3219 3220 3221 3222
			be_cmd_set_logical_link_config(adapter,
						       IFLA_VF_LINK_STATE_AUTO,
						       vf+1);
		}
3223
	}
3224 3225 3226 3227 3228 3229 3230 3231 3232

	if (!old_vfs) {
		status = pci_enable_sriov(adapter->pdev, adapter->num_vfs);
		if (status) {
			dev_err(dev, "SRIOV enable failed\n");
			adapter->num_vfs = 0;
			goto err;
		}
	}
3233 3234
	return 0;
err:
3235 3236
	dev_err(dev, "VF setup failed\n");
	be_vf_clear(adapter);
3237 3238 3239
	return status;
}

3240 3241 3242 3243
/* Converting function_mode bits on BE3 to SH mc_type enums.
 * VNIC+QNQ together take precedence, then QNQ alone, VNIC alone and UMC;
 * MC_NONE is returned when none of these bits is set.
 */
static u8 be_convert_mc_type(u32 function_mode)
{
	const bool vnic = (function_mode & VNIC_MODE) != 0;
	const bool qnq = (function_mode & QNQ_MODE) != 0;

	if (qnq)
		return vnic ? vNIC1 : FLEX10;

	if (vnic)
		return vNIC2;

	if (function_mode & UMC_ENABLED)
		return UMC;

	return MC_NONE;
}

3256 3257 3258 3259
/* On BE2/BE3 FW does not suggest the supported limits */
static void BEx_get_resources(struct be_adapter *adapter,
			      struct be_resources *res)
{
3260
	bool use_sriov = adapter->num_vfs ? 1 : 0;
3261 3262 3263 3264 3265 3266

	if (be_physfn(adapter))
		res->max_uc_mac = BE_UC_PMAC_COUNT;
	else
		res->max_uc_mac = BE_VF_UC_PMAC_COUNT;

3267 3268 3269 3270 3271 3272 3273 3274 3275 3276 3277 3278 3279 3280
	adapter->mc_type = be_convert_mc_type(adapter->function_mode);

	if (be_is_mc(adapter)) {
		/* Assuming that there are 4 channels per port,
		 * when multi-channel is enabled
		 */
		if (be_is_qnq_mode(adapter))
			res->max_vlans = BE_NUM_VLANS_SUPPORTED/8;
		else
			/* In a non-qnq multichannel mode, the pvid
			 * takes up one vlan entry
			 */
			res->max_vlans = (BE_NUM_VLANS_SUPPORTED / 4) - 1;
	} else {
3281
		res->max_vlans = BE_NUM_VLANS_SUPPORTED;
3282 3283
	}

3284 3285
	res->max_mcast_mac = BE_MAX_MC;

3286 3287 3288 3289 3290 3291 3292
	/* 1) For BE3 1Gb ports, FW does not support multiple TXQs
	 * 2) Create multiple TX rings on a BE3-R multi-channel interface
	 *    *only* if it is RSS-capable.
	 */
	if (BE2_chip(adapter) || use_sriov ||  (adapter->port_num > 1) ||
	    !be_physfn(adapter) || (be_is_mc(adapter) &&
	    !(adapter->function_caps & BE_FUNCTION_CAPS_RSS)))
3293 3294 3295 3296 3297 3298 3299 3300 3301 3302
		res->max_tx_qs = 1;
	else
		res->max_tx_qs = BE3_MAX_TX_QS;

	if ((adapter->function_caps & BE_FUNCTION_CAPS_RSS) &&
	    !use_sriov && be_physfn(adapter))
		res->max_rss_qs = (adapter->be3_native) ?
					   BE3_MAX_RSS_QS : BE2_MAX_RSS_QS;
	res->max_rx_qs = res->max_rss_qs + 1;

3303
	if (be_physfn(adapter))
3304
		res->max_evt_qs = (res->max_vfs > 0) ?
3305 3306 3307
					BE3_SRIOV_MAX_EVT_QS : BE3_MAX_EVT_QS;
	else
		res->max_evt_qs = 1;
3308 3309 3310 3311 3312 3313

	res->if_cap_flags = BE_IF_CAP_FLAGS_WANT;
	if (!(adapter->function_caps & BE_FUNCTION_CAPS_RSS))
		res->if_cap_flags &= ~BE_IF_FLAGS_RSS;
}

3314 3315 3316
static void be_setup_init(struct be_adapter *adapter)
{
	adapter->vlan_prio_bmap = 0xff;
A
Ajit Khaparde 已提交
3317
	adapter->phy.link_speed = -1;
3318 3319 3320
	adapter->if_handle = -1;
	adapter->be3_native = false;
	adapter->promiscuous = false;
3321 3322 3323 3324
	if (be_physfn(adapter))
		adapter->cmd_privileges = MAX_PRIVILEGES;
	else
		adapter->cmd_privileges = MIN_PRIVILEGES;
3325 3326
}

3327 3328 3329 3330 3331 3332 3333 3334 3335 3336 3337 3338 3339 3340 3341 3342 3343 3344 3345 3346 3347 3348 3349 3350 3351 3352 3353 3354 3355 3356 3357 3358 3359 3360 3361 3362 3363 3364 3365 3366 3367 3368 3369 3370 3371 3372 3373 3374
static int be_get_sriov_config(struct be_adapter *adapter)
{
	struct device *dev = &adapter->pdev->dev;
	struct be_resources res = {0};
	int status, max_vfs, old_vfs;

	status = be_cmd_get_profile_config(adapter, &res, 0);
	if (status)
		return status;

	adapter->pool_res = res;

	/* Some old versions of BE3 FW don't report max_vfs value */
	if (BE3_chip(adapter) && !res.max_vfs) {
		max_vfs = pci_sriov_get_totalvfs(adapter->pdev);
		res.max_vfs = max_vfs > 0 ? min(MAX_VFS, max_vfs) : 0;
	}

	adapter->pool_res.max_vfs = res.max_vfs;
	pci_sriov_set_totalvfs(adapter->pdev, be_max_vfs(adapter));

	if (!be_max_vfs(adapter)) {
		if (num_vfs)
			dev_warn(dev, "device doesn't support SRIOV\n");
		adapter->num_vfs = 0;
		return 0;
	}

	/* validate num_vfs module param */
	old_vfs = pci_num_vf(adapter->pdev);
	if (old_vfs) {
		dev_info(dev, "%d VFs are already enabled\n", old_vfs);
		if (old_vfs != num_vfs)
			dev_warn(dev, "Ignoring num_vfs=%d setting\n", num_vfs);
		adapter->num_vfs = old_vfs;
	} else {
		if (num_vfs > be_max_vfs(adapter)) {
			dev_info(dev, "Resources unavailable to init %d VFs\n",
				 num_vfs);
			dev_info(dev, "Limiting to %d VFs\n",
				 be_max_vfs(adapter));
		}
		adapter->num_vfs = min_t(u16, num_vfs, be_max_vfs(adapter));
	}

	return 0;
}

3375
static int be_get_resources(struct be_adapter *adapter)
3376
{
3377 3378 3379
	struct device *dev = &adapter->pdev->dev;
	struct be_resources res = {0};
	int status;
3380

3381 3382 3383
	if (BEx_chip(adapter)) {
		BEx_get_resources(adapter, &res);
		adapter->res = res;
3384 3385
	}

3386 3387 3388 3389 3390 3391 3392 3393
	/* For Lancer, SH etc read per-function resource limits from FW.
	 * GET_FUNC_CONFIG returns per function guaranteed limits.
	 * GET_PROFILE_CONFIG returns PCI-E related limits PF-pool limits
	 */
	if (!BEx_chip(adapter)) {
		status = be_cmd_get_func_config(adapter, &res);
		if (status)
			return status;
3394

3395 3396 3397 3398
		/* If RoCE may be enabled stash away half the EQs for RoCE */
		if (be_roce_supported(adapter))
			res.max_evt_qs /= 2;
		adapter->res = res;
3399

3400 3401 3402 3403 3404 3405 3406
		dev_info(dev, "Max: txqs %d, rxqs %d, rss %d, eqs %d, vfs %d\n",
			 be_max_txqs(adapter), be_max_rxqs(adapter),
			 be_max_rss(adapter), be_max_eqs(adapter),
			 be_max_vfs(adapter));
		dev_info(dev, "Max: uc-macs %d, mc-macs %d, vlans %d\n",
			 be_max_uc(adapter), be_max_mc(adapter),
			 be_max_vlans(adapter));
3407
	}
3408

3409
	return 0;
3410 3411
}

3412 3413
static int be_get_config(struct be_adapter *adapter)
{
3414
	u16 profile_id;
3415
	int status;
3416

3417 3418
	status = be_cmd_query_fw_cfg(adapter, &adapter->port_num,
				     &adapter->function_mode,
3419 3420
				     &adapter->function_caps,
				     &adapter->asic_rev);
3421
	if (status)
3422
		return status;
3423

3424 3425 3426 3427 3428
	 if (be_physfn(adapter)) {
		status = be_cmd_get_active_profile(adapter, &profile_id);
		if (!status)
			dev_info(&adapter->pdev->dev,
				 "Using profile 0x%x\n", profile_id);
3429 3430 3431 3432 3433 3434 3435 3436 3437 3438 3439 3440 3441 3442 3443 3444 3445 3446 3447 3448

		status = be_get_sriov_config(adapter);
		if (status)
			return status;

		/* When the HW is in SRIOV capable configuration, the PF-pool
		 * resources are equally distributed across the max-number of
		 * VFs. The user may request only a subset of the max-vfs to be
		 * enabled. Based on num_vfs, redistribute the resources across
		 * num_vfs so that each VF will have access to more number of
		 * resources. This facility is not available in BE3 FW.
		 * Also, this is done by FW in Lancer chip.
		 */
		if (!pci_num_vf(adapter->pdev)) {
			status = be_cmd_set_sriov_config(adapter,
							 adapter->pool_res,
							 adapter->num_vfs);
			if (status)
				return status;
		}
3449 3450
	}

3451 3452 3453
	status = be_get_resources(adapter);
	if (status)
		return status;
3454

3455 3456
	adapter->pmac_id = kcalloc(be_max_uc(adapter),
				   sizeof(*adapter->pmac_id), GFP_KERNEL);
3457 3458
	if (!adapter->pmac_id)
		return -ENOMEM;
3459

3460 3461 3462 3463
	/* Sanitize cfg_num_qs based on HW and platform limits */
	adapter->cfg_num_qs = min(adapter->cfg_num_qs, be_max_qs(adapter));

	return 0;
3464 3465
}

3466 3467 3468 3469 3470 3471 3472 3473 3474 3475 3476 3477 3478 3479 3480 3481 3482
static int be_mac_setup(struct be_adapter *adapter)
{
	u8 mac[ETH_ALEN];
	int status;

	if (is_zero_ether_addr(adapter->netdev->dev_addr)) {
		status = be_cmd_get_perm_mac(adapter, mac);
		if (status)
			return status;

		memcpy(adapter->netdev->dev_addr, mac, ETH_ALEN);
		memcpy(adapter->netdev->perm_addr, mac, ETH_ALEN);
	} else {
		/* Maybe the HW was reset; dev_addr must be re-programmed */
		memcpy(mac, adapter->netdev->dev_addr, ETH_ALEN);
	}

3483 3484 3485 3486
	/* For BE3-R VFs, the PF programs the initial MAC address */
	if (!(BEx_chip(adapter) && be_virtfn(adapter)))
		be_cmd_pmac_add(adapter, mac, adapter->if_handle,
				&adapter->pmac_id[0], 0);
3487 3488 3489
	return 0;
}

3490 3491 3492 3493 3494 3495
/*
 * Queue the adapter's delayed work to run in 1000 ms and record that it is
 * scheduled, so that be_cancel_worker() knows there is something to cancel.
 */
static void be_schedule_worker(struct be_adapter *adapter)
{
	schedule_delayed_work(&adapter->work, msecs_to_jiffies(1000));
	adapter->flags |= BE_FLAGS_WORKER_SCHEDULED;
}

3496
static int be_setup_queues(struct be_adapter *adapter)
3497
{
3498
	struct net_device *netdev = adapter->netdev;
S
Sathya Perla 已提交
3499
	int status;
3500

3501
	status = be_evt_queues_create(adapter);
3502 3503
	if (status)
		goto err;
3504

3505
	status = be_tx_qs_create(adapter);
3506 3507
	if (status)
		goto err;
S
Sathya Perla 已提交
3508

3509
	status = be_rx_cqs_create(adapter);
S
Sathya Perla 已提交
3510
	if (status)
3511
		goto err;
S
Sathya Perla 已提交
3512

3513
	status = be_mcc_queues_create(adapter);
S
Sathya Perla 已提交
3514 3515 3516
	if (status)
		goto err;

3517 3518 3519 3520 3521 3522 3523 3524
	status = netif_set_real_num_rx_queues(netdev, adapter->num_rx_qs);
	if (status)
		goto err;

	status = netif_set_real_num_tx_queues(netdev, adapter->num_tx_qs);
	if (status)
		goto err;

3525 3526 3527 3528 3529 3530
	return 0;
err:
	dev_err(&adapter->pdev->dev, "queue_setup failed\n");
	return status;
}

3531 3532 3533 3534 3535 3536 3537 3538 3539 3540 3541 3542 3543 3544 3545 3546 3547 3548 3549 3550 3551 3552 3553 3554 3555 3556 3557 3558 3559 3560 3561 3562 3563 3564 3565 3566
/*
 * Destroy and re-create all queues.
 *
 * A running interface is closed first and re-opened at the end.  MSI-x is
 * disabled and re-enabled along the way unless vectors are shared with
 * RoCE.  Returns 0 on success or the error of the failing step.
 */
int be_update_queues(struct be_adapter *adapter)
{
	struct net_device *netdev = adapter->netdev;
	int status;

	if (netif_running(netdev))
		be_close(netdev);

	be_cancel_worker(adapter);

	/* If any vectors have been shared with RoCE we cannot re-program
	 * the MSIx table.
	 */
	if (adapter->num_msix_roce_vec == 0)
		be_msix_disable(adapter);

	be_clear_queues(adapter);

	if (!msix_enabled(adapter)) {
		status = be_msix_enable(adapter);
		if (status)
			return status;
	}

	status = be_setup_queues(adapter);
	if (status)
		return status;

	be_schedule_worker(adapter);

	/* Only an interface that is marked running is opened again */
	return netif_running(netdev) ? be_open(netdev) : 0;
}

3567 3568 3569 3570 3571 3572 3573 3574 3575 3576 3577 3578
static int be_setup(struct be_adapter *adapter)
{
	struct device *dev = &adapter->pdev->dev;
	u32 tx_fc, rx_fc, en_flags;
	int status;

	be_setup_init(adapter);

	if (!lancer_chip(adapter))
		be_cmd_req_native_mode(adapter);

	status = be_get_config(adapter);
S
Sathya Perla 已提交
3579
	if (status)
3580
		goto err;
S
Sathya Perla 已提交
3581

3582
	status = be_msix_enable(adapter);
S
Sathya Perla 已提交
3583
	if (status)
3584
		goto err;
S
Sathya Perla 已提交
3585

3586
	en_flags = BE_IF_FLAGS_UNTAGGED | BE_IF_FLAGS_BROADCAST |
3587
		   BE_IF_FLAGS_MULTICAST | BE_IF_FLAGS_PASS_L3L4_ERRORS;
3588
	if (adapter->function_caps & BE_FUNCTION_CAPS_RSS)
3589
		en_flags |= BE_IF_FLAGS_RSS;
3590 3591
	en_flags = en_flags & be_if_cap_flags(adapter);
	status = be_cmd_if_create(adapter, be_if_cap_flags(adapter), en_flags,
3592
				  &adapter->if_handle, 0);
3593
	if (status)
3594
		goto err;
S
Sathya Perla 已提交
3595

3596 3597
	/* Updating real_num_tx/rx_queues() requires rtnl_lock() */
	rtnl_lock();
3598
	status = be_setup_queues(adapter);
3599
	rtnl_unlock();
3600
	if (status)
3601 3602
		goto err;

3603 3604 3605
	be_cmd_get_fn_privileges(adapter, &adapter->cmd_privileges, 0);

	status = be_mac_setup(adapter);
S
Sathya Perla 已提交
3606 3607 3608
	if (status)
		goto err;

S
Somnath Kotur 已提交
3609
	be_cmd_get_fw_ver(adapter, adapter->fw_ver, adapter->fw_on_flash);
3610

3611 3612 3613 3614 3615 3616
	if (BE2_chip(adapter) && fw_major_num(adapter->fw_ver) < 4) {
		dev_err(dev, "Firmware on card is old(%s), IRQs may not work.",
			adapter->fw_ver);
		dev_err(dev, "Please upgrade firmware to version >= 4.0\n");
	}

3617
	if (adapter->vlans_added)
S
Sathya Perla 已提交
3618
		be_vid_config(adapter);
3619

3620
	be_set_rx_mode(adapter->netdev);
3621

S
Suresh Reddy 已提交
3622 3623
	be_cmd_get_acpi_wol_cap(adapter);

3624
	be_cmd_get_flow_control(adapter, &tx_fc, &rx_fc);
3625

3626 3627
	if (rx_fc != adapter->rx_fc || tx_fc != adapter->tx_fc)
		be_cmd_set_flow_control(adapter, adapter->tx_fc,
3628
					adapter->rx_fc);
3629

3630 3631 3632 3633
	if (be_physfn(adapter))
		be_cmd_set_logical_link_config(adapter,
					       IFLA_VF_LINK_STATE_AUTO, 0);

3634 3635
	if (adapter->num_vfs)
		be_vf_setup(adapter);
3636

3637 3638
	status = be_cmd_get_phy_info(adapter);
	if (!status && be_pause_supported(adapter))
A
Ajit Khaparde 已提交
3639 3640
		adapter->phy.fc_autoneg = 1;

3641
	be_schedule_worker(adapter);
3642
	adapter->flags |= BE_FLAGS_SETUP_DONE;
3643
	return 0;
3644 3645 3646 3647
err:
	be_clear(adapter);
	return status;
}
S
Sathya Perla 已提交
3648

I
Ivan Vecera 已提交
3649 3650 3651 3652
#ifdef CONFIG_NET_POLL_CONTROLLER
static void be_netpoll(struct net_device *netdev)
{
	struct be_adapter *adapter = netdev_priv(netdev);
S
Sathya Perla 已提交
3653
	struct be_eq_obj *eqo;
I
Ivan Vecera 已提交
3654 3655
	int i;

3656 3657 3658 3659
	for_all_evt_queues(adapter, eqo, i) {
		be_eq_notify(eqo->adapter, eqo->q.id, false, true, 0);
		napi_schedule(&eqo->napi);
	}
S
Sathya Perla 已提交
3660 3661

	return;
I
Ivan Vecera 已提交
3662 3663 3664
}
#endif

3665
/* 32-byte marker, stored as two 16-byte halves, that get_fsec_info() searches
 * for in a firmware image to locate the flash section info.  The second half
 * fills its 16 bytes exactly, so it carries no NUL terminator.
 */
static char flash_cookie[2][16] = {"*** SE FLAS", "H DIRECTORY *** "};
3666

3667 3668
static bool phy_flashing_required(struct be_adapter *adapter)
{
A
Ajit Khaparde 已提交
3669 3670
	return (adapter->phy.phy_type == TN_8022 &&
		adapter->phy.interface_type == PHY_TYPE_BASET_10GB);
3671 3672
}

3673 3674 3675 3676 3677 3678
/*
 * Check whether the flash section info lists a component of the given
 * image type.  On BE2 the section info is read through the g2 layout.
 * Returns true if any of the MAX_FLASH_COMP entries matches.
 */
static bool is_comp_in_ufi(struct be_adapter *adapter,
			   struct flash_section_info *fsec, int type)
{
	struct flash_section_info_g2 *fsec_g2;
	int idx, img_type;

	fsec_g2 = BE2_chip(adapter) ?
			(struct flash_section_info_g2 *)fsec : NULL;

	for (idx = 0; idx < MAX_FLASH_COMP; idx++) {
		/* Entry types are stored little-endian in the image */
		img_type = fsec_g2 ?
				le32_to_cpu(fsec_g2->fsec_entry[idx].type) :
				le32_to_cpu(fsec->fsec_entry[idx].type);

		if (img_type == type)
			return true;
	}

	return false;
}

J
Jingoo Han 已提交
3695
static struct flash_section_info *get_fsec_info(struct be_adapter *adapter,
3696 3697
						int header_size,
						const struct firmware *fw)
3698 3699 3700 3701 3702 3703 3704 3705 3706 3707 3708 3709 3710 3711
{
	struct flash_section_info *fsec = NULL;
	const u8 *p = fw->data;

	p += header_size;
	while (p < (fw->data + fw->size)) {
		fsec = (struct flash_section_info *)p;
		if (!memcmp(flash_cookie, fsec->cookie, sizeof(flash_cookie)))
			return fsec;
		p += 32;
	}
	return NULL;
}

3712 3713 3714 3715 3716 3717 3718 3719 3720 3721 3722 3723 3724 3725 3726 3727 3728 3729 3730 3731 3732 3733 3734
/*
 * Compare the CRC the adapter reports for an already flashed region with
 * the CRC found in the last 4 bytes of the corresponding image in the file
 * buffer @p.
 *
 * *crc_match is written only when the FW query succeeds.  Returns 0 in that
 * case, otherwise the error of the query.
 */
static int be_check_flash_crc(struct be_adapter *adapter, const u8 *p,
			      u32 img_offset, u32 img_size, int hdr_size,
			      u16 img_optype, bool *crc_match)
{
	u8 flashed_crc[4];
	u32 crc_offset;
	int status;

	status = be_cmd_get_flash_crc(adapter, flashed_crc, img_optype,
				      img_size - 4);
	if (status)
		return status;

	crc_offset = hdr_size + img_offset + img_size - 4;

	/* Skip flashing, if crc of flashed region matches */
	*crc_match = !memcmp(flashed_crc, p + crc_offset, 4);

	return 0;
}

3735
static int be_flash(struct be_adapter *adapter, const u8 *img,
3736
		    struct be_dma_mem *flash_cmd, int optype, int img_size)
3737 3738
{
	struct be_cmd_write_flashrom *req = flash_cmd->va;
3739 3740
	u32 total_bytes, flash_op, num_bytes;
	int status;
3741 3742 3743 3744 3745 3746 3747 3748 3749 3750 3751 3752 3753 3754 3755 3756 3757 3758 3759

	total_bytes = img_size;
	while (total_bytes) {
		num_bytes = min_t(u32, 32*1024, total_bytes);

		total_bytes -= num_bytes;

		if (!total_bytes) {
			if (optype == OPTYPE_PHY_FW)
				flash_op = FLASHROM_OPER_PHY_FLASH;
			else
				flash_op = FLASHROM_OPER_FLASH;
		} else {
			if (optype == OPTYPE_PHY_FW)
				flash_op = FLASHROM_OPER_PHY_SAVE;
			else
				flash_op = FLASHROM_OPER_SAVE;
		}

3760
		memcpy(req->data_buf, img, num_bytes);
3761 3762
		img += num_bytes;
		status = be_cmd_write_flashrom(adapter, flash_cmd, optype,
3763
					       flash_op, num_bytes);
3764
		if (base_status(status) == MCC_STATUS_ILLEGAL_REQUEST &&
3765 3766 3767
		    optype == OPTYPE_PHY_FW)
			break;
		else if (status)
3768 3769 3770 3771 3772
			return status;
	}
	return 0;
}

3773
/* For BE2, BE3 and BE3-R */
3774
static int be_flash_BEx(struct be_adapter *adapter,
3775 3776
			const struct firmware *fw,
			struct be_dma_mem *flash_cmd, int num_of_images)
3777
{
3778
	int img_hdrs_size = (num_of_images * sizeof(struct image_hdr));
3779
	struct device *dev = &adapter->pdev->dev;
3780
	struct flash_section_info *fsec = NULL;
3781 3782 3783 3784
	int status, i, filehdr_size, num_comp;
	const struct flash_comp *pflashcomp;
	bool crc_match;
	const u8 *p;
3785 3786 3787 3788 3789 3790 3791 3792 3793 3794 3795 3796 3797 3798 3799 3800 3801 3802 3803 3804 3805 3806

	struct flash_comp gen3_flash_types[] = {
		{ FLASH_iSCSI_PRIMARY_IMAGE_START_g3, OPTYPE_ISCSI_ACTIVE,
			FLASH_IMAGE_MAX_SIZE_g3, IMAGE_FIRMWARE_iSCSI},
		{ FLASH_REDBOOT_START_g3, OPTYPE_REDBOOT,
			FLASH_REDBOOT_IMAGE_MAX_SIZE_g3, IMAGE_BOOT_CODE},
		{ FLASH_iSCSI_BIOS_START_g3, OPTYPE_BIOS,
			FLASH_BIOS_IMAGE_MAX_SIZE_g3, IMAGE_OPTION_ROM_ISCSI},
		{ FLASH_PXE_BIOS_START_g3, OPTYPE_PXE_BIOS,
			FLASH_BIOS_IMAGE_MAX_SIZE_g3, IMAGE_OPTION_ROM_PXE},
		{ FLASH_FCoE_BIOS_START_g3, OPTYPE_FCOE_BIOS,
			FLASH_BIOS_IMAGE_MAX_SIZE_g3, IMAGE_OPTION_ROM_FCoE},
		{ FLASH_iSCSI_BACKUP_IMAGE_START_g3, OPTYPE_ISCSI_BACKUP,
			FLASH_IMAGE_MAX_SIZE_g3, IMAGE_FIRMWARE_BACKUP_iSCSI},
		{ FLASH_FCoE_PRIMARY_IMAGE_START_g3, OPTYPE_FCOE_FW_ACTIVE,
			FLASH_IMAGE_MAX_SIZE_g3, IMAGE_FIRMWARE_FCoE},
		{ FLASH_FCoE_BACKUP_IMAGE_START_g3, OPTYPE_FCOE_FW_BACKUP,
			FLASH_IMAGE_MAX_SIZE_g3, IMAGE_FIRMWARE_BACKUP_FCoE},
		{ FLASH_NCSI_START_g3, OPTYPE_NCSI_FW,
			FLASH_NCSI_IMAGE_MAX_SIZE_g3, IMAGE_NCSI},
		{ FLASH_PHY_FW_START_g3, OPTYPE_PHY_FW,
			FLASH_PHY_FW_IMAGE_MAX_SIZE_g3, IMAGE_FIRMWARE_PHY}
3807
	};
3808 3809 3810 3811 3812 3813 3814 3815 3816 3817 3818 3819 3820 3821 3822 3823 3824 3825

	struct flash_comp gen2_flash_types[] = {
		{ FLASH_iSCSI_PRIMARY_IMAGE_START_g2, OPTYPE_ISCSI_ACTIVE,
			FLASH_IMAGE_MAX_SIZE_g2, IMAGE_FIRMWARE_iSCSI},
		{ FLASH_REDBOOT_START_g2, OPTYPE_REDBOOT,
			FLASH_REDBOOT_IMAGE_MAX_SIZE_g2, IMAGE_BOOT_CODE},
		{ FLASH_iSCSI_BIOS_START_g2, OPTYPE_BIOS,
			FLASH_BIOS_IMAGE_MAX_SIZE_g2, IMAGE_OPTION_ROM_ISCSI},
		{ FLASH_PXE_BIOS_START_g2, OPTYPE_PXE_BIOS,
			FLASH_BIOS_IMAGE_MAX_SIZE_g2, IMAGE_OPTION_ROM_PXE},
		{ FLASH_FCoE_BIOS_START_g2, OPTYPE_FCOE_BIOS,
			FLASH_BIOS_IMAGE_MAX_SIZE_g2, IMAGE_OPTION_ROM_FCoE},
		{ FLASH_iSCSI_BACKUP_IMAGE_START_g2, OPTYPE_ISCSI_BACKUP,
			FLASH_IMAGE_MAX_SIZE_g2, IMAGE_FIRMWARE_BACKUP_iSCSI},
		{ FLASH_FCoE_PRIMARY_IMAGE_START_g2, OPTYPE_FCOE_FW_ACTIVE,
			FLASH_IMAGE_MAX_SIZE_g2, IMAGE_FIRMWARE_FCoE},
		{ FLASH_FCoE_BACKUP_IMAGE_START_g2, OPTYPE_FCOE_FW_BACKUP,
			 FLASH_IMAGE_MAX_SIZE_g2, IMAGE_FIRMWARE_BACKUP_FCoE}
3826 3827
	};

3828
	if (BE3_chip(adapter)) {
3829 3830
		pflashcomp = gen3_flash_types;
		filehdr_size = sizeof(struct flash_file_hdr_g3);
J
Joe Perches 已提交
3831
		num_comp = ARRAY_SIZE(gen3_flash_types);
3832 3833 3834
	} else {
		pflashcomp = gen2_flash_types;
		filehdr_size = sizeof(struct flash_file_hdr_g2);
J
Joe Perches 已提交
3835
		num_comp = ARRAY_SIZE(gen2_flash_types);
3836
	}
3837

3838 3839 3840
	/* Get flash section info*/
	fsec = get_fsec_info(adapter, filehdr_size + img_hdrs_size, fw);
	if (!fsec) {
3841
		dev_err(dev, "Invalid Cookie. FW image may be corrupted\n");
3842 3843
		return -1;
	}
3844
	for (i = 0; i < num_comp; i++) {
3845
		if (!is_comp_in_ufi(adapter, fsec, pflashcomp[i].img_type))
3846
			continue;
3847 3848 3849 3850 3851

		if ((pflashcomp[i].optype == OPTYPE_NCSI_FW) &&
		    memcmp(adapter->fw_ver, "3.102.148.0", 11) < 0)
			continue;

3852 3853
		if (pflashcomp[i].optype == OPTYPE_PHY_FW  &&
		    !phy_flashing_required(adapter))
3854
				continue;
3855

3856
		if (pflashcomp[i].optype == OPTYPE_REDBOOT) {
3857 3858 3859 3860 3861 3862 3863 3864 3865 3866 3867 3868 3869 3870
			status = be_check_flash_crc(adapter, fw->data,
						    pflashcomp[i].offset,
						    pflashcomp[i].size,
						    filehdr_size +
						    img_hdrs_size,
						    OPTYPE_REDBOOT, &crc_match);
			if (status) {
				dev_err(dev,
					"Could not get CRC for 0x%x region\n",
					pflashcomp[i].optype);
				continue;
			}

			if (crc_match)
3871 3872
				continue;
		}
3873

3874 3875
		p = fw->data + filehdr_size + pflashcomp[i].offset +
			img_hdrs_size;
3876 3877
		if (p + pflashcomp[i].size > fw->data + fw->size)
			return -1;
3878 3879

		status = be_flash(adapter, p, flash_cmd, pflashcomp[i].optype,
3880
				  pflashcomp[i].size);
3881
		if (status) {
3882
			dev_err(dev, "Flashing section type 0x%x failed\n",
3883 3884
				pflashcomp[i].img_type);
			return status;
3885 3886 3887 3888 3889
		}
	}
	return 0;
}

3890 3891 3892 3893 3894 3895 3896 3897 3898 3899 3900 3901 3902 3903 3904 3905 3906 3907 3908 3909 3910 3911 3912 3913 3914 3915 3916 3917 3918 3919 3920 3921 3922 3923 3924 3925 3926 3927 3928 3929 3930 3931 3932 3933 3934 3935 3936 3937 3938 3939 3940 3941
/* Return the flash op-type for a section directory entry.
 *
 * An op-type stored in the entry is used as is. When the entry carries
 * 0xFFFF instead, the op-type is derived from the entry's image type;
 * 0xFFFF is returned for image types that have no mapping.
 */
static u16 be_get_img_optype(struct flash_section_entry fsec_entry)
{
	u16 optype = le16_to_cpu(fsec_entry.optype);
	u32 type = le32_to_cpu(fsec_entry.type);

	if (optype != 0xFFFF)
		return optype;

	switch (type) {
	case IMAGE_FIRMWARE_iSCSI:
		return OPTYPE_ISCSI_ACTIVE;
	case IMAGE_BOOT_CODE:
		return OPTYPE_REDBOOT;
	case IMAGE_OPTION_ROM_ISCSI:
		return OPTYPE_BIOS;
	case IMAGE_OPTION_ROM_PXE:
		return OPTYPE_PXE_BIOS;
	case IMAGE_OPTION_ROM_FCoE:
		return OPTYPE_FCOE_BIOS;
	case IMAGE_FIRMWARE_BACKUP_iSCSI:
		return OPTYPE_ISCSI_BACKUP;
	case IMAGE_NCSI:
		return OPTYPE_NCSI_FW;
	case IMAGE_FLASHISM_JUMPVECTOR:
		return OPTYPE_FLASHISM_JUMPVECTOR;
	case IMAGE_FIRMWARE_PHY:
		return OPTYPE_SH_PHY_FW;
	case IMAGE_REDBOOT_DIR:
		return OPTYPE_REDBOOT_DIR;
	case IMAGE_REDBOOT_CONFIG:
		return OPTYPE_REDBOOT_CONFIG;
	case IMAGE_UFI_DIR:
		return OPTYPE_UFI_DIR;
	default:
		/* unknown image type: still 0xFFFF */
		return optype;
	}
}

3942
static int be_flash_skyhawk(struct be_adapter *adapter,
3943 3944
			    const struct firmware *fw,
			    struct be_dma_mem *flash_cmd, int num_of_images)
3945
{
3946
	int img_hdrs_size = num_of_images * sizeof(struct image_hdr);
3947
	struct device *dev = &adapter->pdev->dev;
3948
	struct flash_section_info *fsec = NULL;
3949 3950 3951 3952 3953
	u32 img_offset, img_size, img_type;
	int status, i, filehdr_size;
	bool crc_match, old_fw_img;
	u16 img_optype;
	const u8 *p;
3954 3955 3956 3957

	filehdr_size = sizeof(struct flash_file_hdr_g3);
	fsec = get_fsec_info(adapter, filehdr_size + img_hdrs_size, fw);
	if (!fsec) {
3958
		dev_err(dev, "Invalid Cookie. FW image may be corrupted\n");
3959
		return -EINVAL;
3960 3961 3962 3963 3964
	}

	for (i = 0; i < le32_to_cpu(fsec->fsec_hdr.num_images); i++) {
		img_offset = le32_to_cpu(fsec->fsec_entry[i].offset);
		img_size   = le32_to_cpu(fsec->fsec_entry[i].pad_size);
3965 3966 3967
		img_type   = le32_to_cpu(fsec->fsec_entry[i].type);
		img_optype = be_get_img_optype(fsec->fsec_entry[i]);
		old_fw_img = fsec->fsec_entry[i].optype == 0xFFFF;
3968

3969
		if (img_optype == 0xFFFF)
3970
			continue;
3971 3972 3973 3974 3975 3976 3977 3978 3979 3980 3981 3982 3983 3984 3985 3986
		/* Don't bother verifying CRC if an old FW image is being
		 * flashed
		 */
		if (old_fw_img)
			goto flash;

		status = be_check_flash_crc(adapter, fw->data, img_offset,
					    img_size, filehdr_size +
					    img_hdrs_size, img_optype,
					    &crc_match);
		/* The current FW image on the card does not recognize the new
		 * FLASH op_type. The FW download is partially complete.
		 * Reboot the server now to enable FW image to recognize the
		 * new FLASH op_type. To complete the remaining process,
		 * download the same FW again after the reboot.
		 */
3987 3988
		if (base_status(status) == MCC_STATUS_ILLEGAL_REQUEST ||
		    base_status(status) == MCC_STATUS_ILLEGAL_FIELD) {
3989 3990 3991 3992 3993 3994 3995
			dev_err(dev, "Flash incomplete. Reset the server\n");
			dev_err(dev, "Download FW image again after reset\n");
			return -EAGAIN;
		} else if (status) {
			dev_err(dev, "Could not get CRC for 0x%x region\n",
				img_optype);
			return -EFAULT;
3996 3997
		}

3998 3999
		if (crc_match)
			continue;
4000

4001 4002
flash:
		p = fw->data + filehdr_size + img_offset + img_hdrs_size;
4003 4004 4005 4006
		if (p + img_size > fw->data + fw->size)
			return -1;

		status = be_flash(adapter, p, flash_cmd, img_optype, img_size);
4007 4008 4009
		/* For old FW images ignore ILLEGAL_FIELD error or errors on
		 * UFI_DIR region
		 */
4010 4011 4012 4013
		if (old_fw_img &&
		    (base_status(status) == MCC_STATUS_ILLEGAL_FIELD ||
		     (img_optype == OPTYPE_UFI_DIR &&
		      base_status(status) == MCC_STATUS_FAILED))) {
4014 4015 4016 4017 4018
			continue;
		} else if (status) {
			dev_err(dev, "Flashing section type 0x%x failed\n",
				img_type);
			return -EFAULT;
4019 4020 4021
		}
	}
	return 0;
4022 4023
}

4024
static int lancer_fw_download(struct be_adapter *adapter,
4025
			      const struct firmware *fw)
4026
{
4027 4028
#define LANCER_FW_DOWNLOAD_CHUNK      (32 * 1024)
#define LANCER_FW_DOWNLOAD_LOCATION   "/prg"
4029
	struct be_dma_mem flash_cmd;
4030 4031 4032 4033 4034 4035 4036 4037
	const u8 *data_ptr = NULL;
	u8 *dest_image_ptr = NULL;
	size_t image_size = 0;
	u32 chunk_size = 0;
	u32 data_written = 0;
	u32 offset = 0;
	int status = 0;
	u8 add_status = 0;
4038
	u8 change_status;
4039

4040
	if (!IS_ALIGNED(fw->size, sizeof(u32))) {
4041
		dev_err(&adapter->pdev->dev,
4042 4043 4044 4045
			"FW Image not properly aligned. "
			"Length must be 4 byte aligned.\n");
		status = -EINVAL;
		goto lancer_fw_exit;
4046 4047
	}

4048 4049 4050
	flash_cmd.size = sizeof(struct lancer_cmd_req_write_object)
				+ LANCER_FW_DOWNLOAD_CHUNK;
	flash_cmd.va = dma_alloc_coherent(&adapter->pdev->dev, flash_cmd.size,
4051
					  &flash_cmd.dma, GFP_KERNEL);
4052 4053 4054 4055
	if (!flash_cmd.va) {
		status = -ENOMEM;
		goto lancer_fw_exit;
	}
4056

4057 4058 4059 4060 4061 4062 4063 4064 4065 4066 4067 4068
	dest_image_ptr = flash_cmd.va +
				sizeof(struct lancer_cmd_req_write_object);
	image_size = fw->size;
	data_ptr = fw->data;

	while (image_size) {
		chunk_size = min_t(u32, image_size, LANCER_FW_DOWNLOAD_CHUNK);

		/* Copy the image chunk content. */
		memcpy(dest_image_ptr, data_ptr, chunk_size);

		status = lancer_cmd_write_object(adapter, &flash_cmd,
4069 4070 4071 4072
						 chunk_size, offset,
						 LANCER_FW_DOWNLOAD_LOCATION,
						 &data_written, &change_status,
						 &add_status);
4073 4074 4075 4076 4077 4078 4079 4080 4081 4082 4083
		if (status)
			break;

		offset += data_written;
		data_ptr += data_written;
		image_size -= data_written;
	}

	if (!status) {
		/* Commit the FW written */
		status = lancer_cmd_write_object(adapter, &flash_cmd,
4084 4085 4086 4087
						 0, offset,
						 LANCER_FW_DOWNLOAD_LOCATION,
						 &data_written, &change_status,
						 &add_status);
4088 4089 4090
	}

	dma_free_coherent(&adapter->pdev->dev, flash_cmd.size, flash_cmd.va,
4091
			  flash_cmd.dma);
4092 4093 4094 4095 4096 4097 4098 4099
	if (status) {
		dev_err(&adapter->pdev->dev,
			"Firmware load error. "
			"Status code: 0x%x Additional Status: 0x%x\n",
			status, add_status);
		goto lancer_fw_exit;
	}

4100
	if (change_status == LANCER_FW_RESET_NEEDED) {
4101 4102
		dev_info(&adapter->pdev->dev,
			 "Resetting adapter to activate new FW\n");
4103 4104
		status = lancer_physdev_ctrl(adapter,
					     PHYSDEV_CONTROL_FW_RESET_MASK);
4105 4106 4107 4108 4109 4110 4111
		if (status) {
			dev_err(&adapter->pdev->dev,
				"Adapter busy for FW reset.\n"
				"New FW will not be active.\n");
			goto lancer_fw_exit;
		}
	} else if (change_status != LANCER_NO_RESET_NEEDED) {
4112 4113
		dev_err(&adapter->pdev->dev,
			"System reboot required for new FW to be active\n");
4114 4115
	}

4116 4117 4118 4119 4120
	dev_info(&adapter->pdev->dev, "Firmware flashed successfully\n");
lancer_fw_exit:
	return status;
}

4121 4122
#define UFI_TYPE2		2
#define UFI_TYPE3		3
4123
#define UFI_TYPE3R		10
4124 4125
#define UFI_TYPE4		4
static int be_get_ufi_type(struct be_adapter *adapter,
4126
			   struct flash_file_hdr_g3 *fhdr)
4127 4128 4129 4130
{
	if (fhdr == NULL)
		goto be_get_ufi_exit;

4131 4132
	if (skyhawk_chip(adapter) && fhdr->build[0] == '4')
		return UFI_TYPE4;
4133 4134 4135 4136 4137 4138
	else if (BE3_chip(adapter) && fhdr->build[0] == '3') {
		if (fhdr->asic_type_rev == 0x10)
			return UFI_TYPE3R;
		else
			return UFI_TYPE3;
	} else if (BE2_chip(adapter) && fhdr->build[0] == '2')
4139
		return UFI_TYPE2;
4140 4141 4142 4143 4144 4145 4146

be_get_ufi_exit:
	dev_err(&adapter->pdev->dev,
		"UFI and Interface are not compatible for flashing\n");
	return -1;
}

4147 4148 4149 4150 4151 4152
static int be_fw_download(struct be_adapter *adapter, const struct firmware* fw)
{
	struct flash_file_hdr_g3 *fhdr3;
	struct image_hdr *img_hdr_ptr = NULL;
	struct be_dma_mem flash_cmd;
	const u8 *p;
4153
	int status = 0, i = 0, num_imgs = 0, ufi_type = 0;
4154

4155
	flash_cmd.size = sizeof(struct be_cmd_write_flashrom);
I
Ivan Vecera 已提交
4156 4157
	flash_cmd.va = dma_alloc_coherent(&adapter->pdev->dev, flash_cmd.size,
					  &flash_cmd.dma, GFP_KERNEL);
4158 4159
	if (!flash_cmd.va) {
		status = -ENOMEM;
4160
		goto be_fw_exit;
4161 4162
	}

4163
	p = fw->data;
4164
	fhdr3 = (struct flash_file_hdr_g3 *)p;
4165

4166
	ufi_type = be_get_ufi_type(adapter, fhdr3);
4167 4168 4169 4170 4171 4172 4173

	num_imgs = le32_to_cpu(fhdr3->num_imgs);
	for (i = 0; i < num_imgs; i++) {
		img_hdr_ptr = (struct image_hdr *)(fw->data +
				(sizeof(struct flash_file_hdr_g3) +
				 i * sizeof(struct image_hdr)));
		if (le32_to_cpu(img_hdr_ptr->imageid) == 1) {
4174 4175
			switch (ufi_type) {
			case UFI_TYPE4:
4176
				status = be_flash_skyhawk(adapter, fw,
4177
							  &flash_cmd, num_imgs);
4178 4179
				break;
			case UFI_TYPE3R:
4180 4181
				status = be_flash_BEx(adapter, fw, &flash_cmd,
						      num_imgs);
4182 4183 4184 4185 4186 4187 4188 4189
				break;
			case UFI_TYPE3:
				/* Do not flash this ufi on BE3-R cards */
				if (adapter->asic_rev < 0x10)
					status = be_flash_BEx(adapter, fw,
							      &flash_cmd,
							      num_imgs);
				else {
4190
					status = -EINVAL;
4191 4192 4193 4194
					dev_err(&adapter->pdev->dev,
						"Can't load BE3 UFI on BE3R\n");
				}
			}
4195
		}
4196 4197
	}

4198 4199
	if (ufi_type == UFI_TYPE2)
		status = be_flash_BEx(adapter, fw, &flash_cmd, 0);
4200
	else if (ufi_type == -1)
4201
		status = -EINVAL;
4202

I
Ivan Vecera 已提交
4203 4204
	dma_free_coherent(&adapter->pdev->dev, flash_cmd.size, flash_cmd.va,
			  flash_cmd.dma);
4205 4206
	if (status) {
		dev_err(&adapter->pdev->dev, "Firmware load error\n");
4207
		goto be_fw_exit;
4208 4209
	}

4210
	dev_info(&adapter->pdev->dev, "Firmware flashed successfully\n");
4211

4212 4213 4214 4215 4216 4217 4218 4219 4220 4221 4222 4223
be_fw_exit:
	return status;
}

/* Load the firmware file named @fw_file and flash it onto the adapter.
 *
 * Flashing is refused with -ENETDOWN while the interface is down. After a
 * successful flash the cached FW version strings are refreshed.
 *
 * Returns 0 on success, the request_firmware() error, or the status of the
 * chip-specific download routine.
 */
int be_load_fw(struct be_adapter *adapter, u8 *fw_file)
{
	/* NULL so that release_firmware() below is a no-op when
	 * request_firmware() fails without having set the pointer
	 */
	const struct firmware *fw = NULL;
	int status;

	if (!netif_running(adapter->netdev)) {
		dev_err(&adapter->pdev->dev,
			"Firmware load not allowed (interface is down)\n");
		return -ENETDOWN;
	}

	status = request_firmware(&fw, fw_file, &adapter->pdev->dev);
	if (status)
		goto fw_exit;

	dev_info(&adapter->pdev->dev, "Flashing firmware file %s\n", fw_file);

	if (lancer_chip(adapter))
		status = lancer_fw_download(adapter, fw);
	else
		status = be_fw_download(adapter, fw);

	if (!status)
		be_cmd_get_fw_ver(adapter, adapter->fw_ver,
				  adapter->fw_on_flash);

fw_exit:
	release_firmware(fw);
	return status;
}

4247
static int be_ndo_bridge_setlink(struct net_device *dev, struct nlmsghdr *nlh)
4248 4249 4250 4251 4252 4253 4254 4255 4256 4257 4258 4259 4260 4261 4262 4263 4264 4265 4266 4267 4268 4269 4270 4271 4272 4273 4274 4275 4276 4277 4278 4279 4280 4281 4282 4283 4284 4285 4286 4287 4288
{
	struct be_adapter *adapter = netdev_priv(dev);
	struct nlattr *attr, *br_spec;
	int rem;
	int status = 0;
	u16 mode = 0;

	if (!sriov_enabled(adapter))
		return -EOPNOTSUPP;

	br_spec = nlmsg_find_attr(nlh, sizeof(struct ifinfomsg), IFLA_AF_SPEC);

	nla_for_each_nested(attr, br_spec, rem) {
		if (nla_type(attr) != IFLA_BRIDGE_MODE)
			continue;

		mode = nla_get_u16(attr);
		if (mode != BRIDGE_MODE_VEPA && mode != BRIDGE_MODE_VEB)
			return -EINVAL;

		status = be_cmd_set_hsw_config(adapter, 0, 0,
					       adapter->if_handle,
					       mode == BRIDGE_MODE_VEPA ?
					       PORT_FWD_TYPE_VEPA :
					       PORT_FWD_TYPE_VEB);
		if (status)
			goto err;

		dev_info(&adapter->pdev->dev, "enabled switch mode: %s\n",
			 mode == BRIDGE_MODE_VEPA ? "VEPA" : "VEB");

		return status;
	}
err:
	dev_err(&adapter->pdev->dev, "Failed to set switch mode %s\n",
		mode == BRIDGE_MODE_VEPA ? "VEPA" : "VEB");

	return status;
}

/* ndo_bridge_getlink handler: report the current switch forwarding mode.
 *
 * Returns 0 without reporting anything when SR-IOV is disabled or the mode
 * cannot be queried; otherwise the result of ndo_dflt_bridge_getlink().
 */
static int be_ndo_bridge_getlink(struct sk_buff *skb, u32 pid, u32 seq,
				 struct net_device *dev, u32 filter_mask)
{
	struct be_adapter *adapter = netdev_priv(dev);
	u8 fwd_type;
	int rc;

	if (!sriov_enabled(adapter))
		return 0;

	if (!(BEx_chip(adapter) || lancer_chip(adapter))) {
		rc = be_cmd_get_hsw_config(adapter, NULL, 0,
					   adapter->if_handle, &fwd_type);
		if (rc)
			return 0;
	} else {
		/* BE and Lancer chips support VEB mode only */
		fwd_type = PORT_FWD_TYPE_VEB;
	}

	if (fwd_type == PORT_FWD_TYPE_VEPA)
		return ndo_dflt_bridge_getlink(skb, pid, seq, dev,
					       BRIDGE_MODE_VEPA);

	return ndo_dflt_bridge_getlink(skb, pid, seq, dev, BRIDGE_MODE_VEB);
}

4313
#ifdef CONFIG_BE2NET_VXLAN
4314 4315 4316 4317 4318 4319 4320 4321 4322 4323 4324 4325 4326 4327 4328 4329 4330 4331 4332 4333 4334 4335 4336 4337 4338 4339 4340 4341 4342 4343 4344 4345 4346 4347 4348 4349 4350 4351 4352 4353 4354 4355 4356 4357 4358 4359 4360 4361 4362 4363 4364 4365 4366 4367 4368 4369 4370 4371
/* ndo_add_vxlan_port handler: enable VxLAN offloads for UDP port @port.
 * Does nothing on Lancer and BEx chips. Only one port can be offloaded at a
 * time; if either setup command fails, VxLAN offloads are disabled.
 */
static void be_add_vxlan_port(struct net_device *netdev, sa_family_t sa_family,
			      __be16 port)
{
	struct be_adapter *adapter = netdev_priv(netdev);
	struct device *dev = &adapter->pdev->dev;

	if (lancer_chip(adapter) || BEx_chip(adapter))
		return;

	if (adapter->flags & BE_FLAGS_VXLAN_OFFLOADS) {
		dev_warn(dev, "Cannot add UDP port %d for VxLAN offloads\n",
			 be16_to_cpu(port));
		dev_info(dev,
			 "Only one UDP port supported for VxLAN offloads\n");
		return;
	}

	if (be_cmd_manage_iface(adapter, adapter->if_handle,
				OP_CONVERT_NORMAL_TO_TUNNEL)) {
		dev_warn(dev, "Failed to convert normal interface to tunnel\n");
		be_disable_vxlan_offloads(adapter);
		return;
	}

	if (be_cmd_set_vxlan_port(adapter, port)) {
		dev_warn(dev, "Failed to add VxLAN port\n");
		be_disable_vxlan_offloads(adapter);
		return;
	}

	adapter->flags |= BE_FLAGS_VXLAN_OFFLOADS;
	adapter->vxlan_port = port;

	dev_info(dev, "Enabled VxLAN offloads for UDP port %d\n",
		 be16_to_cpu(port));
}

/* ndo_del_vxlan_port handler: disable VxLAN offloads when @port is the port
 * currently recorded in adapter->vxlan_port. Does nothing on Lancer and BEx
 * chips.
 */
static void be_del_vxlan_port(struct net_device *netdev, sa_family_t sa_family,
			      __be16 port)
{
	struct be_adapter *adapter = netdev_priv(netdev);
	bool unsupported = lancer_chip(adapter) || BEx_chip(adapter);

	if (unsupported || adapter->vxlan_port != port)
		return;

	be_disable_vxlan_offloads(adapter);

	dev_info(&adapter->pdev->dev,
		 "Disabled VxLAN offloads for UDP port %d\n",
		 be16_to_cpu(port));
}
4372
#endif
4373

4374
static const struct net_device_ops be_netdev_ops = {
S
Sathya Perla 已提交
4375 4376 4377
	.ndo_open		= be_open,
	.ndo_stop		= be_close,
	.ndo_start_xmit		= be_xmit,
4378
	.ndo_set_rx_mode	= be_set_rx_mode,
S
Sathya Perla 已提交
4379 4380
	.ndo_set_mac_address	= be_mac_addr_set,
	.ndo_change_mtu		= be_change_mtu,
4381
	.ndo_get_stats64	= be_get_stats64,
S
Sathya Perla 已提交
4382 4383 4384
	.ndo_validate_addr	= eth_validate_addr,
	.ndo_vlan_rx_add_vid	= be_vlan_add_vid,
	.ndo_vlan_rx_kill_vid	= be_vlan_rem_vid,
4385
	.ndo_set_vf_mac		= be_set_vf_mac,
4386
	.ndo_set_vf_vlan	= be_set_vf_vlan,
4387
	.ndo_set_vf_rate	= be_set_vf_tx_rate,
I
Ivan Vecera 已提交
4388
	.ndo_get_vf_config	= be_get_vf_config,
4389
	.ndo_set_vf_link_state  = be_set_vf_link_state,
I
Ivan Vecera 已提交
4390 4391 4392
#ifdef CONFIG_NET_POLL_CONTROLLER
	.ndo_poll_controller	= be_netpoll,
#endif
4393 4394
	.ndo_bridge_setlink	= be_ndo_bridge_setlink,
	.ndo_bridge_getlink	= be_ndo_bridge_getlink,
4395
#ifdef CONFIG_NET_RX_BUSY_POLL
4396
	.ndo_busy_poll		= be_busy_poll,
4397
#endif
4398
#ifdef CONFIG_BE2NET_VXLAN
4399 4400
	.ndo_add_vxlan_port	= be_add_vxlan_port,
	.ndo_del_vxlan_port	= be_del_vxlan_port,
4401
#endif
S
Sathya Perla 已提交
4402 4403 4404 4405 4406 4407
};

static void be_netdev_init(struct net_device *netdev)
{
	struct be_adapter *adapter = netdev_priv(netdev);

4408 4409 4410 4411 4412 4413
	if (skyhawk_chip(adapter)) {
		netdev->hw_enc_features |= NETIF_F_IP_CSUM | NETIF_F_IPV6_CSUM |
					   NETIF_F_TSO | NETIF_F_TSO6 |
					   NETIF_F_GSO_UDP_TUNNEL;
		netdev->hw_features |= NETIF_F_GSO_UDP_TUNNEL;
	}
4414
	netdev->hw_features |= NETIF_F_SG | NETIF_F_TSO | NETIF_F_TSO6 |
4415
		NETIF_F_IP_CSUM | NETIF_F_IPV6_CSUM | NETIF_F_RXCSUM |
4416
		NETIF_F_HW_VLAN_CTAG_TX;
4417 4418
	if (be_multi_rxq(adapter))
		netdev->hw_features |= NETIF_F_RXHASH;
4419 4420

	netdev->features |= netdev->hw_features |
4421
		NETIF_F_HW_VLAN_CTAG_RX | NETIF_F_HW_VLAN_CTAG_FILTER;
A
Ajit Khaparde 已提交
4422

4423
	netdev->vlan_features |= NETIF_F_SG | NETIF_F_TSO | NETIF_F_TSO6 |
4424
		NETIF_F_IP_CSUM | NETIF_F_IPV6_CSUM;
4425

4426 4427
	netdev->priv_flags |= IFF_UNICAST_FLT;

S
Sathya Perla 已提交
4428 4429
	netdev->flags |= IFF_MULTICAST;

4430
	netif_set_gso_max_size(netdev, 65535 - ETH_HLEN);
4431

S
Sathya Perla 已提交
4432
	netdev->netdev_ops = &be_netdev_ops;
S
Sathya Perla 已提交
4433

4434
	netdev->ethtool_ops = &be_ethtool_ops;
S
Sathya Perla 已提交
4435 4436 4437 4438
}

static void be_unmap_pci_bars(struct be_adapter *adapter)
{
4439 4440
	if (adapter->csr)
		pci_iounmap(adapter->pdev, adapter->csr);
4441
	if (adapter->db)
S
Sathya Perla 已提交
4442
		pci_iounmap(adapter->pdev, adapter->db);
4443 4444
}

S
Sathya Perla 已提交
4445 4446 4447 4448 4449 4450 4451 4452 4453
/* Index of the PCI BAR holding the doorbells: BAR 0 on Lancer chips and on
 * functions that are not physical functions, BAR 4 otherwise.
 */
static int db_bar(struct be_adapter *adapter)
{
	return (lancer_chip(adapter) || !be_physfn(adapter)) ? 0 : 4;
}

static int be_roce_map_pci_bars(struct be_adapter *adapter)
4454
{
S
Sathya Perla 已提交
4455
	if (skyhawk_chip(adapter)) {
S
Sathya Perla 已提交
4456 4457 4458 4459 4460 4461
		adapter->roce_db.size = 4096;
		adapter->roce_db.io_addr = pci_resource_start(adapter->pdev,
							      db_bar(adapter));
		adapter->roce_db.total_size = pci_resource_len(adapter->pdev,
							       db_bar(adapter));
	}
4462
	return 0;
S
Sathya Perla 已提交
4463 4464 4465 4466 4467
}

static int be_map_pci_bars(struct be_adapter *adapter)
{
	u8 __iomem *addr;
4468

4469 4470 4471 4472 4473 4474
	if (BEx_chip(adapter) && be_physfn(adapter)) {
		adapter->csr = pci_iomap(adapter->pdev, 2, 0);
		if (adapter->csr == NULL)
			return -ENOMEM;
	}

S
Sathya Perla 已提交
4475
	addr = pci_iomap(adapter->pdev, db_bar(adapter), 0);
S
Sathya Perla 已提交
4476 4477
	if (addr == NULL)
		goto pci_map_err;
4478
	adapter->db = addr;
S
Sathya Perla 已提交
4479 4480

	be_roce_map_pci_bars(adapter);
S
Sathya Perla 已提交
4481
	return 0;
S
Sathya Perla 已提交
4482

S
Sathya Perla 已提交
4483 4484 4485 4486 4487 4488 4489
pci_map_err:
	be_unmap_pci_bars(adapter);
	return -ENOMEM;
}

static void be_ctrl_cleanup(struct be_adapter *adapter)
{
4490
	struct be_dma_mem *mem = &adapter->mbox_mem_alloced;
S
Sathya Perla 已提交
4491 4492 4493 4494

	be_unmap_pci_bars(adapter);

	if (mem->va)
I
Ivan Vecera 已提交
4495 4496
		dma_free_coherent(&adapter->pdev->dev, mem->size, mem->va,
				  mem->dma);
4497

4498
	mem = &adapter->rx_filter;
4499
	if (mem->va)
I
Ivan Vecera 已提交
4500 4501
		dma_free_coherent(&adapter->pdev->dev, mem->size, mem->va,
				  mem->dma);
S
Sathya Perla 已提交
4502 4503 4504 4505
}

static int be_ctrl_init(struct be_adapter *adapter)
{
4506 4507
	struct be_dma_mem *mbox_mem_alloc = &adapter->mbox_mem_alloced;
	struct be_dma_mem *mbox_mem_align = &adapter->mbox_mem;
4508
	struct be_dma_mem *rx_filter = &adapter->rx_filter;
S
Sathya Perla 已提交
4509
	u32 sli_intf;
S
Sathya Perla 已提交
4510 4511
	int status;

S
Sathya Perla 已提交
4512 4513 4514 4515 4516
	pci_read_config_dword(adapter->pdev, SLI_INTF_REG_OFFSET, &sli_intf);
	adapter->sli_family = (sli_intf & SLI_INTF_FAMILY_MASK) >>
				 SLI_INTF_FAMILY_SHIFT;
	adapter->virtfn = (sli_intf & SLI_INTF_FT_MASK) ? 1 : 0;

S
Sathya Perla 已提交
4517 4518
	status = be_map_pci_bars(adapter);
	if (status)
4519
		goto done;
S
Sathya Perla 已提交
4520 4521

	mbox_mem_alloc->size = sizeof(struct be_mcc_mailbox) + 16;
I
Ivan Vecera 已提交
4522 4523 4524 4525
	mbox_mem_alloc->va = dma_alloc_coherent(&adapter->pdev->dev,
						mbox_mem_alloc->size,
						&mbox_mem_alloc->dma,
						GFP_KERNEL);
S
Sathya Perla 已提交
4526
	if (!mbox_mem_alloc->va) {
4527 4528
		status = -ENOMEM;
		goto unmap_pci_bars;
S
Sathya Perla 已提交
4529 4530 4531 4532 4533
	}
	mbox_mem_align->size = sizeof(struct be_mcc_mailbox);
	mbox_mem_align->va = PTR_ALIGN(mbox_mem_alloc->va, 16);
	mbox_mem_align->dma = PTR_ALIGN(mbox_mem_alloc->dma, 16);
	memset(mbox_mem_align->va, 0, sizeof(struct be_mcc_mailbox));
4534

4535
	rx_filter->size = sizeof(struct be_cmd_req_rx_filter);
4536 4537 4538
	rx_filter->va = dma_zalloc_coherent(&adapter->pdev->dev,
					    rx_filter->size, &rx_filter->dma,
					    GFP_KERNEL);
4539
	if (rx_filter->va == NULL) {
4540 4541 4542
		status = -ENOMEM;
		goto free_mbox;
	}
4543

4544
	mutex_init(&adapter->mbox_lock);
4545 4546
	spin_lock_init(&adapter->mcc_lock);
	spin_lock_init(&adapter->mcc_cq_lock);
4547

4548
	init_completion(&adapter->et_cmd_compl);
4549
	pci_save_state(adapter->pdev);
S
Sathya Perla 已提交
4550
	return 0;
4551 4552

free_mbox:
I
Ivan Vecera 已提交
4553 4554
	dma_free_coherent(&adapter->pdev->dev, mbox_mem_alloc->size,
			  mbox_mem_alloc->va, mbox_mem_alloc->dma);
4555 4556 4557 4558 4559 4560

unmap_pci_bars:
	be_unmap_pci_bars(adapter);

done:
	return status;
S
Sathya Perla 已提交
4561 4562 4563 4564
}

static void be_stats_cleanup(struct be_adapter *adapter)
{
4565
	struct be_dma_mem *cmd = &adapter->stats_cmd;
S
Sathya Perla 已提交
4566 4567

	if (cmd->va)
I
Ivan Vecera 已提交
4568 4569
		dma_free_coherent(&adapter->pdev->dev, cmd->size,
				  cmd->va, cmd->dma);
S
Sathya Perla 已提交
4570 4571 4572 4573
}

static int be_stats_init(struct be_adapter *adapter)
{
4574
	struct be_dma_mem *cmd = &adapter->stats_cmd;
S
Sathya Perla 已提交
4575

4576 4577 4578
	if (lancer_chip(adapter))
		cmd->size = sizeof(struct lancer_cmd_req_pport_stats);
	else if (BE2_chip(adapter))
4579
		cmd->size = sizeof(struct be_cmd_req_get_stats_v0);
4580
	else if (BE3_chip(adapter))
4581
		cmd->size = sizeof(struct be_cmd_req_get_stats_v1);
4582 4583 4584
	else
		/* ALL non-BE ASICs */
		cmd->size = sizeof(struct be_cmd_req_get_stats_v2);
4585

4586 4587
	cmd->va = dma_zalloc_coherent(&adapter->pdev->dev, cmd->size, &cmd->dma,
				      GFP_KERNEL);
S
Sathya Perla 已提交
4588
	if (cmd->va == NULL)
4589
		return -ENOMEM;
S
Sathya Perla 已提交
4590 4591 4592
	return 0;
}

B
Bill Pemberton 已提交
4593
static void be_remove(struct pci_dev *pdev)
S
Sathya Perla 已提交
4594 4595
{
	struct be_adapter *adapter = pci_get_drvdata(pdev);
4596

S
Sathya Perla 已提交
4597 4598 4599
	if (!adapter)
		return;

4600
	be_roce_dev_remove(adapter);
4601
	be_intr_set(adapter, false);
4602

4603 4604
	cancel_delayed_work_sync(&adapter->func_recovery_work);

S
Sathya Perla 已提交
4605 4606
	unregister_netdev(adapter->netdev);

4607 4608
	be_clear(adapter);

4609 4610 4611
	/* tell fw we're done with firing cmds */
	be_cmd_fw_clean(adapter);

S
Sathya Perla 已提交
4612 4613 4614 4615
	be_stats_cleanup(adapter);

	be_ctrl_cleanup(adapter);

S
Sathya Perla 已提交
4616 4617
	pci_disable_pcie_error_reporting(pdev);

S
Sathya Perla 已提交
4618 4619 4620 4621 4622 4623
	pci_release_regions(pdev);
	pci_disable_device(pdev);

	free_netdev(adapter->netdev);
}

4624
static int be_get_initial_config(struct be_adapter *adapter)
S
Sathya Perla 已提交
4625
{
4626
	int status, level;
S
Sathya Perla 已提交
4627

4628 4629 4630 4631
	status = be_cmd_get_cntl_attributes(adapter);
	if (status)
		return status;

4632 4633 4634
	/* Must be a power of 2 or else MODULO will BUG_ON */
	adapter->be_get_temp_freq = 64;

4635 4636 4637 4638 4639
	if (BEx_chip(adapter)) {
		level = be_cmd_get_fw_log_level(adapter);
		adapter->msg_enable =
			level <= FW_LOG_LEVEL_DEFAULT ? NETIF_MSG_HW : 0;
	}
4640

4641
	adapter->cfg_num_qs = netif_get_num_default_rss_queues();
4642
	return 0;
S
Sathya Perla 已提交
4643 4644
}

4645
static int lancer_recover_func(struct be_adapter *adapter)
4646
{
4647
	struct device *dev = &adapter->pdev->dev;
4648 4649
	int status;

4650 4651 4652
	status = lancer_test_and_set_rdy_state(adapter);
	if (status)
		goto err;
4653

4654 4655
	if (netif_running(adapter->netdev))
		be_close(adapter->netdev);
4656

4657 4658
	be_clear(adapter);

4659
	be_clear_all_error(adapter);
4660 4661 4662 4663

	status = be_setup(adapter);
	if (status)
		goto err;
4664

4665 4666
	if (netif_running(adapter->netdev)) {
		status = be_open(adapter->netdev);
4667 4668
		if (status)
			goto err;
4669
	}
4670

4671
	dev_err(dev, "Adapter recovery successful\n");
4672 4673
	return 0;
err:
4674 4675 4676
	if (status == -EAGAIN)
		dev_err(dev, "Waiting for resource provisioning\n");
	else
4677
		dev_err(dev, "Adapter recovery failed\n");
4678

4679 4680 4681 4682 4683 4684 4685
	return status;
}

static void be_func_recovery_task(struct work_struct *work)
{
	struct be_adapter *adapter =
		container_of(work, struct be_adapter,  func_recovery_work.work);
4686
	int status = 0;
4687

4688
	be_detect_error(adapter);
4689

4690
	if (adapter->hw_error && lancer_chip(adapter)) {
4691

4692 4693 4694
		rtnl_lock();
		netif_device_detach(adapter->netdev);
		rtnl_unlock();
4695

4696 4697 4698
		status = lancer_recover_func(adapter);
		if (!status)
			netif_device_attach(adapter->netdev);
4699
	}
4700

4701 4702 4703 4704 4705 4706
	/* In Lancer, for all errors other than provisioning error (-EAGAIN),
	 * no need to attempt further recovery.
	 */
	if (!status || status == -EAGAIN)
		schedule_delayed_work(&adapter->func_recovery_work,
				      msecs_to_jiffies(1000));
4707 4708 4709 4710 4711 4712 4713 4714 4715 4716 4717 4718
}

static void be_worker(struct work_struct *work)
{
	struct be_adapter *adapter =
		container_of(work, struct be_adapter, work.work);
	struct be_rx_obj *rxo;
	int i;

	/* when interrupts are not yet enabled, just reap any pending
	* mcc completions */
	if (!netif_running(adapter->netdev)) {
4719
		local_bh_disable();
S
Sathya Perla 已提交
4720
		be_process_mcc(adapter);
4721
		local_bh_enable();
4722 4723 4724 4725 4726 4727 4728 4729 4730 4731 4732
		goto reschedule;
	}

	if (!adapter->stats_cmd_sent) {
		if (lancer_chip(adapter))
			lancer_cmd_get_pport_stats(adapter,
						&adapter->stats_cmd);
		else
			be_cmd_get_stats(adapter, &adapter->stats_cmd);
	}

4733 4734
	if (be_physfn(adapter) &&
	    MODULO(adapter->work_counter, adapter->be_get_temp_freq) == 0)
4735 4736
		be_cmd_get_die_temperature(adapter);

4737
	for_all_rx_queues(adapter, rxo, i) {
4738 4739 4740 4741
		/* Replenish RX-queues starved due to memory
		 * allocation failures.
		 */
		if (rxo->rx_post_starved)
4742 4743 4744
			be_post_rx_frags(rxo, GFP_KERNEL);
	}

4745
	be_eqd_update(adapter);
S
Sathya Perla 已提交
4746

4747 4748 4749 4750 4751
reschedule:
	adapter->work_counter++;
	schedule_delayed_work(&adapter->work, msecs_to_jiffies(1000));
}

4752
/* If any VFs are already enabled don't FLR the PF */
4753 4754
static bool be_reset_required(struct be_adapter *adapter)
{
4755
	return pci_num_vf(adapter->pdev) ? false : true;
4756 4757
}

S
Sathya Perla 已提交
4758 4759
/* Map adapter->mc_type to a printable name.
 * Returns an empty string for any type not listed here.
 */
static char *mc_name(struct be_adapter *adapter)
{
	switch (adapter->mc_type) {
	case UMC:
		return "UMC";
	case FLEX10:
		return "FLEX10";
	case vNIC1:
		return "vNIC-1";
	case nPAR:
		return "nPAR";
	case UFP:
		return "UFP";
	case vNIC2:
		return "vNIC-2";
	default:
		return "";
	}
}

/* Printable function type: "PF" for a physical function, else "VF". */
static inline char *func_name(struct be_adapter *adapter)
{
	if (be_physfn(adapter))
		return "PF";

	return "VF";
}

4793
static int be_probe(struct pci_dev *pdev, const struct pci_device_id *pdev_id)
S
Sathya Perla 已提交
4794 4795 4796 4797
{
	int status = 0;
	struct be_adapter *adapter;
	struct net_device *netdev;
4798
	char port_name;
S
Sathya Perla 已提交
4799 4800 4801 4802 4803 4804 4805 4806 4807 4808

	status = pci_enable_device(pdev);
	if (status)
		goto do_none;

	status = pci_request_regions(pdev, DRV_NAME);
	if (status)
		goto disable_dev;
	pci_set_master(pdev);

4809
	netdev = alloc_etherdev_mqs(sizeof(*adapter), MAX_TX_QS, MAX_RX_QS);
S
Sathya Perla 已提交
4810 4811 4812 4813 4814 4815 4816 4817
	if (netdev == NULL) {
		status = -ENOMEM;
		goto rel_reg;
	}
	adapter = netdev_priv(netdev);
	adapter->pdev = pdev;
	pci_set_drvdata(pdev, adapter);
	adapter->netdev = netdev;
4818
	SET_NETDEV_DEV(netdev, &pdev->dev);
S
Sathya Perla 已提交
4819

4820
	status = dma_set_mask_and_coherent(&pdev->dev, DMA_BIT_MASK(64));
S
Sathya Perla 已提交
4821 4822 4823
	if (!status) {
		netdev->features |= NETIF_F_HIGHDMA;
	} else {
4824
		status = dma_set_mask_and_coherent(&pdev->dev, DMA_BIT_MASK(32));
S
Sathya Perla 已提交
4825 4826 4827 4828 4829 4830
		if (status) {
			dev_err(&pdev->dev, "Could not set PCI DMA Mask\n");
			goto free_netdev;
		}
	}

4831 4832 4833 4834 4835
	if (be_physfn(adapter)) {
		status = pci_enable_pcie_error_reporting(pdev);
		if (!status)
			dev_info(&pdev->dev, "PCIe error reporting enabled\n");
	}
S
Sathya Perla 已提交
4836

S
Sathya Perla 已提交
4837 4838
	status = be_ctrl_init(adapter);
	if (status)
4839
		goto free_netdev;
S
Sathya Perla 已提交
4840

4841
	/* sync up with fw's ready state */
4842
	if (be_physfn(adapter)) {
4843
		status = be_fw_wait_ready(adapter);
4844 4845 4846
		if (status)
			goto ctrl_clean;
	}
S
Sathya Perla 已提交
4847

4848 4849 4850 4851
	if (be_reset_required(adapter)) {
		status = be_cmd_reset_function(adapter);
		if (status)
			goto ctrl_clean;
4852

4853 4854 4855
		/* Wait for interrupts to quiesce after an FLR */
		msleep(100);
	}
4856 4857 4858

	/* Allow interrupts for other ULPs running on NIC function */
	be_intr_set(adapter, true);
S
Sathya Perla 已提交
4859

4860 4861 4862 4863 4864
	/* tell fw we're ready to fire cmds */
	status = be_cmd_fw_init(adapter);
	if (status)
		goto ctrl_clean;

4865 4866 4867 4868
	status = be_stats_init(adapter);
	if (status)
		goto ctrl_clean;

4869
	status = be_get_initial_config(adapter);
S
Sathya Perla 已提交
4870 4871 4872 4873
	if (status)
		goto stats_clean;

	INIT_DELAYED_WORK(&adapter->work, be_worker);
4874
	INIT_DELAYED_WORK(&adapter->func_recovery_work, be_func_recovery_task);
4875
	adapter->rx_fc = adapter->tx_fc = true;
S
Sathya Perla 已提交
4876

4877 4878
	status = be_setup(adapter);
	if (status)
4879
		goto stats_clean;
4880

4881
	be_netdev_init(netdev);
S
Sathya Perla 已提交
4882 4883
	status = register_netdev(netdev);
	if (status != 0)
4884
		goto unsetup;
S
Sathya Perla 已提交
4885

4886 4887
	be_roce_dev_add(adapter);

4888 4889
	schedule_delayed_work(&adapter->func_recovery_work,
			      msecs_to_jiffies(1000));
4890 4891 4892

	be_cmd_query_port_name(adapter, &port_name);

S
Sathya Perla 已提交
4893 4894
	dev_info(&pdev->dev, "%s: %s %s port %c\n", nic_name(pdev),
		 func_name(adapter), mc_name(adapter), port_name);
4895

S
Sathya Perla 已提交
4896 4897
	return 0;

4898 4899
unsetup:
	be_clear(adapter);
S
Sathya Perla 已提交
4900 4901 4902 4903
stats_clean:
	be_stats_cleanup(adapter);
ctrl_clean:
	be_ctrl_cleanup(adapter);
4904
free_netdev:
4905
	free_netdev(netdev);
S
Sathya Perla 已提交
4906 4907 4908 4909 4910
rel_reg:
	pci_release_regions(pdev);
disable_dev:
	pci_disable_device(pdev);
do_none:
4911
	dev_err(&pdev->dev, "%s initialization failed\n", nic_name(pdev));
S
Sathya Perla 已提交
4912 4913 4914 4915 4916 4917 4918 4919
	return status;
}

/* Legacy PCI suspend callback.
 *
 * Calls be_setup_wol(adapter, true) when wol_en is set, disables
 * interrupts, stops the recovery work, detaches and closes the
 * interface, releases adapter resources and finally puts the PCI
 * device into the power state chosen for @state. Always returns 0.
 */
static int be_suspend(struct pci_dev *pdev, pm_message_t state)
{
	struct be_adapter *adapter = pci_get_drvdata(pdev);
	struct net_device *netdev = adapter->netdev;

	if (adapter->wol_en)
		be_setup_wol(adapter, true);

	be_intr_set(adapter, false);
	cancel_delayed_work_sync(&adapter->func_recovery_work);

	netif_device_detach(netdev);
	if (netif_running(netdev)) {
		/* be_close() is called under rtnl here */
		rtnl_lock();
		be_close(netdev);
		rtnl_unlock();
	}
	be_clear(adapter);

	pci_save_state(pdev);
	pci_disable_device(pdev);
	pci_set_power_state(pdev, pci_choose_state(pdev, state));

	return 0;
}

static int be_resume(struct pci_dev *pdev)
{
	int status = 0;
	struct be_adapter *adapter = pci_get_drvdata(pdev);
	struct net_device *netdev =  adapter->netdev;

	netif_device_detach(netdev);

	status = pci_enable_device(pdev);
	if (status)
		return status;

4952
	pci_set_power_state(pdev, PCI_D0);
S
Sathya Perla 已提交
4953 4954
	pci_restore_state(pdev);

4955 4956 4957 4958
	status = be_fw_wait_ready(adapter);
	if (status)
		return status;

4959
	be_intr_set(adapter, true);
4960 4961 4962 4963 4964
	/* tell fw we're ready to fire cmds */
	status = be_cmd_fw_init(adapter);
	if (status)
		return status;

4965
	be_setup(adapter);
S
Sathya Perla 已提交
4966 4967 4968 4969 4970
	if (netif_running(netdev)) {
		rtnl_lock();
		be_open(netdev);
		rtnl_unlock();
	}
4971 4972 4973

	schedule_delayed_work(&adapter->func_recovery_work,
			      msecs_to_jiffies(1000));
S
Sathya Perla 已提交
4974
	netif_device_attach(netdev);
4975

S
Suresh Reddy 已提交
4976
	if (adapter->wol_en)
4977
		be_setup_wol(adapter, false);
4978

S
Sathya Perla 已提交
4979 4980 4981
	return 0;
}

4982 4983 4984 4985 4986 4987 4988
/*
 * An FLR will stop BE from DMAing any data.
 */
static void be_shutdown(struct pci_dev *pdev)
{
	struct be_adapter *adapter = pci_get_drvdata(pdev);

4989 4990
	if (!adapter)
		return;
4991

4992
	cancel_delayed_work_sync(&adapter->work);
4993
	cancel_delayed_work_sync(&adapter->func_recovery_work);
4994

4995
	netif_device_detach(adapter->netdev);
4996

4997 4998
	be_cmd_reset_function(adapter);

4999 5000 5001
	pci_disable_device(pdev);
}

5002
static pci_ers_result_t be_eeh_err_detected(struct pci_dev *pdev,
5003
					    pci_channel_state_t state)
5004 5005 5006 5007 5008 5009
{
	struct be_adapter *adapter = pci_get_drvdata(pdev);
	struct net_device *netdev =  adapter->netdev;

	dev_err(&adapter->pdev->dev, "EEH error detected\n");

5010 5011
	if (!adapter->eeh_error) {
		adapter->eeh_error = true;
5012

5013
		cancel_delayed_work_sync(&adapter->func_recovery_work);
5014 5015

		rtnl_lock();
5016 5017 5018
		netif_device_detach(netdev);
		if (netif_running(netdev))
			be_close(netdev);
5019
		rtnl_unlock();
5020 5021

		be_clear(adapter);
5022 5023 5024 5025 5026 5027 5028
	}

	if (state == pci_channel_io_perm_failure)
		return PCI_ERS_RESULT_DISCONNECT;

	pci_disable_device(pdev);

5029 5030
	/* The error could cause the FW to trigger a flash debug dump.
	 * Resetting the card while flash dump is in progress
5031 5032 5033
	 * can cause it not to recover; wait for it to finish.
	 * Wait only for first function as it is needed only once per
	 * adapter.
5034
	 */
5035 5036 5037
	if (pdev->devfn == 0)
		ssleep(30);

5038 5039 5040 5041 5042 5043 5044 5045 5046 5047 5048 5049 5050 5051 5052
	return PCI_ERS_RESULT_NEED_RESET;
}

static pci_ers_result_t be_eeh_reset(struct pci_dev *pdev)
{
	struct be_adapter *adapter = pci_get_drvdata(pdev);
	int status;

	dev_info(&adapter->pdev->dev, "EEH reset\n");

	status = pci_enable_device(pdev);
	if (status)
		return PCI_ERS_RESULT_DISCONNECT;

	pci_set_master(pdev);
5053
	pci_set_power_state(pdev, PCI_D0);
5054 5055 5056
	pci_restore_state(pdev);

	/* Check if card is ok and fw is ready */
5057 5058
	dev_info(&adapter->pdev->dev,
		 "Waiting for FW to be ready after EEH reset\n");
5059
	status = be_fw_wait_ready(adapter);
5060 5061 5062
	if (status)
		return PCI_ERS_RESULT_DISCONNECT;

S
Sathya Perla 已提交
5063
	pci_cleanup_aer_uncorrect_error_status(pdev);
5064
	be_clear_all_error(adapter);
5065 5066 5067 5068 5069 5070 5071 5072 5073 5074 5075 5076 5077
	return PCI_ERS_RESULT_RECOVERED;
}

static void be_eeh_resume(struct pci_dev *pdev)
{
	int status = 0;
	struct be_adapter *adapter = pci_get_drvdata(pdev);
	struct net_device *netdev =  adapter->netdev;

	dev_info(&adapter->pdev->dev, "EEH resume\n");

	pci_save_state(pdev);

5078
	status = be_cmd_reset_function(adapter);
5079 5080 5081
	if (status)
		goto err;

5082 5083 5084 5085 5086 5087
	/* On some BE3 FW versions, after a HW reset,
	 * interrupts will remain disabled for each function.
	 * So, explicitly enable interrupts
	 */
	be_intr_set(adapter, true);

5088 5089
	/* tell fw we're ready to fire cmds */
	status = be_cmd_fw_init(adapter);
5090 5091 5092
	if (status)
		goto err;

5093 5094 5095 5096 5097 5098 5099 5100 5101
	status = be_setup(adapter);
	if (status)
		goto err;

	if (netif_running(netdev)) {
		status = be_open(netdev);
		if (status)
			goto err;
	}
5102 5103 5104

	schedule_delayed_work(&adapter->func_recovery_work,
			      msecs_to_jiffies(1000));
5105 5106 5107 5108 5109 5110
	netif_device_attach(netdev);
	return;
err:
	dev_err(&adapter->pdev->dev, "EEH resume failed\n");
}

5111
static const struct pci_error_handlers be_eeh_handlers = {
5112 5113 5114 5115 5116
	.error_detected = be_eeh_err_detected,
	.slot_reset = be_eeh_reset,
	.resume = be_eeh_resume,
};

S
Sathya Perla 已提交
5117 5118 5119 5120 5121 5122
static struct pci_driver be_driver = {
	.name = DRV_NAME,
	.id_table = be_dev_ids,
	.probe = be_probe,
	.remove = be_remove,
	.suspend = be_suspend,
5123
	.resume = be_resume,
5124
	.shutdown = be_shutdown,
5125
	.err_handler = &be_eeh_handlers
S
Sathya Perla 已提交
5126 5127 5128 5129
};

/* Module entry point: validate the rx_frag_size parameter (falling back
 * to 2048 with a warning if it is not one of the supported sizes) and
 * register the PCI driver. Returns the result of pci_register_driver().
 */
static int __init be_init_module(void)
{
	switch (rx_frag_size) {
	case 2048:
	case 4096:
	case 8192:
		break;
	default:
		printk(KERN_WARNING DRV_NAME
			" : Module param rx_frag_size must be 2048/4096/8192."
			" Using 2048\n");
		rx_frag_size = 2048;
		break;
	}

	return pci_register_driver(&be_driver);
}
module_init(be_init_module);

/* Module exit point: unregister the PCI driver. */
static void __exit be_exit_module(void)
{
	pci_unregister_driver(&be_driver);
}
module_exit(be_exit_module);