be_main.c 132.2 KB
Newer Older
S
Sathya Perla 已提交
1
/*
 * Copyright (C) 2005 - 2014 Emulex
 * All rights reserved.
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License version 2
 * as published by the Free Software Foundation.  The full GNU General
 * Public License is included in this distribution in the file called COPYING.
 *
 * Contact Information:
 * linux-drivers@emulex.com
 *
 * Emulex
 * 3333 Susan Street
 * Costa Mesa, CA 92626
 */

18
#include <linux/prefetch.h>
19
#include <linux/module.h>
S
Sathya Perla 已提交
20
#include "be.h"
21
#include "be_cmds.h"
22
#include <asm/div64.h>
S
Sathya Perla 已提交
23
#include <linux/aer.h>
24
#include <linux/if_bridge.h>
25
#include <net/busy_poll.h>
26
#include <net/vxlan.h>
S
Sathya Perla 已提交
27 28 29 30

MODULE_VERSION(DRV_VER);
MODULE_DEVICE_TABLE(pci, be_dev_ids);
MODULE_DESCRIPTION(DRV_DESC " " DRV_VER);
31
MODULE_AUTHOR("Emulex Corporation");
S
Sathya Perla 已提交
32 33
MODULE_LICENSE("GPL");

34 35 36
/* Module parameter: number of PCI VFs to initialize.
 * Registered with S_IRUGO permissions (readable, not writable).
 */
static unsigned int num_vfs;
module_param(num_vfs, uint, S_IRUGO);
MODULE_PARM_DESC(num_vfs, "Number of PCI VFs to initialize");
S
Sathya Perla 已提交
37

38 39 40 41
/* Module parameter: size of a fragment that holds received data
 * (defaults to 2048). Registered with S_IRUGO permissions (readable, not
 * writable).
 */
static ushort rx_frag_size = 2048;
module_param(rx_frag_size, ushort, S_IRUGO);
MODULE_PARM_DESC(rx_frag_size, "Size of a fragment that holds rcvd data.");

S
Sathya Perla 已提交
42
static DEFINE_PCI_DEVICE_TABLE(be_dev_ids) = {
43
	{ PCI_DEVICE(BE_VENDOR_ID, BE_DEVICE_ID1) },
44
	{ PCI_DEVICE(BE_VENDOR_ID, BE_DEVICE_ID2) },
45 46
	{ PCI_DEVICE(BE_VENDOR_ID, OC_DEVICE_ID1) },
	{ PCI_DEVICE(BE_VENDOR_ID, OC_DEVICE_ID2) },
47
	{ PCI_DEVICE(EMULEX_VENDOR_ID, OC_DEVICE_ID3)},
48
	{ PCI_DEVICE(EMULEX_VENDOR_ID, OC_DEVICE_ID4)},
49
	{ PCI_DEVICE(EMULEX_VENDOR_ID, OC_DEVICE_ID5)},
50
	{ PCI_DEVICE(EMULEX_VENDOR_ID, OC_DEVICE_ID6)},
S
Sathya Perla 已提交
51 52 53
	{ 0 }
};
MODULE_DEVICE_TABLE(pci, be_dev_ids);
54
/* UE Status Low CSR: names of the 32 error sources.
 * NOTE(review): presumably indexed by bit position in the CSR - confirm
 * against the code that reports unrecoverable errors.
 */
static const char * const ue_status_low_desc[] = {
	/*  0 -  3 */ "CEV", "CTX", "DBUF", "ERX",
	/*  4 -  7 */ "Host", "MPU", "NDMA", "PTC ",
	/*  8 - 11 */ "RDMA ", "RXF ", "RXIPS ", "RXULP0 ",
	/* 12 - 15 */ "RXULP1 ", "RXULP2 ", "TIM ", "TPOST ",
	/* 16 - 19 */ "TPRE ", "TXIPS ", "TXULP0 ", "TXULP1 ",
	/* 20 - 23 */ "UC ", "WDMA ", "TXULP2 ", "HOST1 ",
	/* 24 - 27 */ "P0_OB_LINK ", "P1_OB_LINK ", "HOST_GPIO ", "MBOX ",
	/* 28 - 31 */ "ERX2 ", "SPARE ", "JTAG ", "MPU_INTPEND "
};
/* UE Status High CSR: names of the 32 error sources.
 * NOTE(review): presumably indexed by bit position in the CSR - confirm
 * against the code that reports unrecoverable errors.
 */
static const char * const ue_status_hi_desc[] = {
	/*  0 -  3 */ "LPCMEMHOST", "MGMT_MAC", "PCS0ONLINE", "MPU_IRAM",
	/*  4 -  7 */ "PCS1ONLINE", "PCTL0", "PCTL1", "PMEM",
	/*  8 - 11 */ "RR", "TXPB", "RXPP", "XAUI",
	/* 12 - 15 */ "TXP", "ARM", "IPC", "HOST2",
	/* 16 - 19 */ "HOST3", "HOST4", "HOST5", "HOST6",
	/* 20 - 23 */ "HOST7", "ECRC", "Poison TLP", "NETC",
	/* 24 - 27 */ "PERIPH", "LLTXULP", "D2P", "RCON",
	/* 28 - 31 */ "LDMA", "LLTXP", "LLTXPB", "Unknown"
};
S
Sathya Perla 已提交
124

125

S
Sathya Perla 已提交
126 127 128
static void be_queue_free(struct be_adapter *adapter, struct be_queue_info *q)
{
	struct be_dma_mem *mem = &q->dma_mem;
129
	if (mem->va) {
I
Ivan Vecera 已提交
130 131
		dma_free_coherent(&adapter->pdev->dev, mem->size, mem->va,
				  mem->dma);
132 133
		mem->va = NULL;
	}
S
Sathya Perla 已提交
134 135 136
}

/* Reset queue descriptor @q and allocate zeroed DMA-coherent memory for
 * @len entries of @entry_size bytes each.
 *
 * Returns 0 on success or -ENOMEM if the allocation fails.
 */
static int be_queue_alloc(struct be_adapter *adapter, struct be_queue_info *q,
			  u16 len, u16 entry_size)
{
	struct be_dma_mem *dmem = &q->dma_mem;

	/* wipe any stale state (dmem lives inside *q) before filling it in */
	memset(q, 0, sizeof(*q));
	q->entry_size = entry_size;
	q->len = len;

	dmem->size = len * entry_size;
	dmem->va = dma_zalloc_coherent(&adapter->pdev->dev, dmem->size,
				       &dmem->dma, GFP_KERNEL);

	return dmem->va ? 0 : -ENOMEM;
}

152
/* Set or clear the HOSTINTR bit in the MEMBAR interrupt-control PCI config
 * register. The register is written only when its current state differs
 * from the requested one.
 */
static void be_reg_intr_set(struct be_adapter *adapter, bool enable)
{
	bool intr_on;
	u32 ctrl;

	pci_read_config_dword(adapter->pdev, PCICFG_MEMBAR_CTRL_INT_CTRL_OFFSET,
			      &ctrl);
	intr_on = !!(ctrl & MEMBAR_CTRL_INT_CTRL_HOSTINTR_MASK);

	/* already in the requested state: nothing to write */
	if (intr_on == enable)
		return;

	if (enable)
		ctrl |= MEMBAR_CTRL_INT_CTRL_HOSTINTR_MASK;
	else
		ctrl &= ~MEMBAR_CTRL_INT_CTRL_HOSTINTR_MASK;

	pci_write_config_dword(adapter->pdev,
			       PCICFG_MEMBAR_CTRL_INT_CTRL_OFFSET, ctrl);
}

171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186
/* Enable or disable adapter interrupts.
 * The FW command is tried first; if it fails, the PCI config register is
 * programmed directly. Nothing is done on Lancer chips or while an EEH
 * error is pending.
 */
static void be_intr_set(struct be_adapter *adapter, bool enable)
{
	/* On lancer interrupts can't be controlled via this register */
	if (lancer_chip(adapter) || adapter->eeh_error)
		return;

	if (be_cmd_intr_set(adapter, enable))
		be_reg_intr_set(adapter, enable);
}

187
/* Ring the RX queue doorbell: report @posted newly posted buffers on RX
 * ring @qid.
 */
static void be_rxq_notify(struct be_adapter *adapter, u16 qid, u16 posted)
{
	u32 db = (qid & DB_RQ_RING_ID_MASK) |
		 (posted << DB_RQ_NUM_POSTED_SHIFT);

	/* write barrier ahead of the doorbell write */
	wmb();
	iowrite32(db, adapter->db + DB_RQ_OFFSET);
}

V
Vasundhara Volam 已提交
197 198
/* Ring the TX queue doorbell of @txo: report @posted newly posted WRBs
 * (masked with DB_TXULP_NUM_POSTED_MASK).
 */
static void be_txq_notify(struct be_adapter *adapter, struct be_tx_obj *txo,
			  u16 posted)
{
	u32 db = (txo->q.id & DB_TXULP_RING_ID_MASK) |
		 ((posted & DB_TXULP_NUM_POSTED_MASK) <<
		  DB_TXULP_NUM_POSTED_SHIFT);

	/* write barrier ahead of the doorbell write */
	wmb();
	iowrite32(db, adapter->db + txo->db_offset);
}

208
/* Ring the event queue doorbell for EQ @qid.
 * @arm:        set the re-arm bit
 * @clear_int:  set the clear-interrupt bit
 * @num_popped: number of entries consumed
 *
 * The event bit is always set. Nothing is written while an EEH error is
 * pending.
 */
static void be_eq_notify(struct be_adapter *adapter, u16 qid,
			 bool arm, bool clear_int, u16 num_popped)
{
	u32 db;

	if (adapter->eeh_error)
		return;

	/* ring id is split into a base field and an extension field */
	db = qid & DB_EQ_RING_ID_MASK;
	db |= ((qid & DB_EQ_RING_ID_EXT_MASK) << DB_EQ_RING_ID_EXT_MASK_SHIFT);

	if (arm)
		db |= 1 << DB_EQ_REARM_SHIFT;
	if (clear_int)
		db |= 1 << DB_EQ_CLR_SHIFT;
	db |= 1 << DB_EQ_EVNT_SHIFT;
	db |= num_popped << DB_EQ_NUM_POPPED_SHIFT;

	iowrite32(db, adapter->db + DB_EQ_OFFSET);
}

227
/* Ring the completion queue doorbell for CQ @qid.
 * @arm:        set the re-arm bit
 * @num_popped: number of entries consumed
 *
 * Nothing is written while an EEH error is pending.
 */
void be_cq_notify(struct be_adapter *adapter, u16 qid, bool arm, u16 num_popped)
{
	u32 db;

	if (adapter->eeh_error)
		return;

	/* ring id is split into a base field and an extension field */
	db = qid & DB_CQ_RING_ID_MASK;
	db |= ((qid & DB_CQ_RING_ID_EXT_MASK) <<
			DB_CQ_RING_ID_EXT_MASK_SHIFT);

	if (arm)
		db |= 1 << DB_CQ_REARM_SHIFT;
	db |= num_popped << DB_CQ_NUM_POPPED_SHIFT;

	iowrite32(db, adapter->db + DB_CQ_OFFSET);
}

static int be_mac_addr_set(struct net_device *netdev, void *p)
{
	struct be_adapter *adapter = netdev_priv(netdev);
246
	struct device *dev = &adapter->pdev->dev;
S
Sathya Perla 已提交
247
	struct sockaddr *addr = p;
248 249 250
	int status;
	u8 mac[ETH_ALEN];
	u32 old_pmac_id = adapter->pmac_id[0], curr_pmac_id = 0;
S
Sathya Perla 已提交
251

252 253 254
	if (!is_valid_ether_addr(addr->sa_data))
		return -EADDRNOTAVAIL;

255 256 257 258 259 260
	/* Proceed further only if, User provided MAC is different
	 * from active MAC
	 */
	if (ether_addr_equal(addr->sa_data, netdev->dev_addr))
		return 0;

261 262 263 264 265
	/* The PMAC_ADD cmd may fail if the VF doesn't have FILTMGMT
	 * privilege or if PF did not provision the new MAC address.
	 * On BE3, this cmd will always fail if the VF doesn't have the
	 * FILTMGMT privilege. This failure is OK, only if the PF programmed
	 * the MAC for the VF.
266
	 */
267 268 269 270 271 272 273 274 275 276 277
	status = be_cmd_pmac_add(adapter, (u8 *)addr->sa_data,
				 adapter->if_handle, &adapter->pmac_id[0], 0);
	if (!status) {
		curr_pmac_id = adapter->pmac_id[0];

		/* Delete the old programmed MAC. This call may fail if the
		 * old MAC was already deleted by the PF driver.
		 */
		if (adapter->pmac_id[0] != old_pmac_id)
			be_cmd_pmac_del(adapter, adapter->if_handle,
					old_pmac_id, 0);
278 279
	}

280 281
	/* Decide if the new MAC is successfully activated only after
	 * querying the FW
282
	 */
283 284
	status = be_cmd_get_active_mac(adapter, curr_pmac_id, mac,
				       adapter->if_handle, true, 0);
285
	if (status)
286
		goto err;
S
Sathya Perla 已提交
287

288 289 290
	/* The MAC change did not happen, either due to lack of privilege
	 * or PF didn't pre-provision.
	 */
291
	if (!ether_addr_equal(addr->sa_data, mac)) {
292 293 294 295
		status = -EPERM;
		goto err;
	}

296
	memcpy(netdev->dev_addr, addr->sa_data, netdev->addr_len);
297
	dev_info(dev, "MAC address changed to %pM\n", mac);
298 299
	return 0;
err:
300
	dev_warn(dev, "MAC address change to %pM failed\n", addr->sa_data);
S
Sathya Perla 已提交
301 302 303
	return status;
}

304 305 306 307 308 309 310
/* BE2 supports only v0 cmd */
static void *hw_stats_from_cmd(struct be_adapter *adapter)
{
	if (BE2_chip(adapter)) {
		struct be_cmd_resp_get_stats_v0 *cmd = adapter->stats_cmd.va;

		return &cmd->hw_stats;
311
	} else if (BE3_chip(adapter)) {
312 313
		struct be_cmd_resp_get_stats_v1 *cmd = adapter->stats_cmd.va;

314 315 316 317
		return &cmd->hw_stats;
	} else {
		struct be_cmd_resp_get_stats_v2 *cmd = adapter->stats_cmd.va;

318 319 320 321 322 323 324 325 326 327 328
		return &cmd->hw_stats;
	}
}

/* BE2 supports only v0 cmd */
static void *be_erx_stats_from_cmd(struct be_adapter *adapter)
{
	if (BE2_chip(adapter)) {
		struct be_hw_stats_v0 *hw_stats = hw_stats_from_cmd(adapter);

		return &hw_stats->erx;
329
	} else if (BE3_chip(adapter)) {
330 331
		struct be_hw_stats_v1 *hw_stats = hw_stats_from_cmd(adapter);

332 333 334 335
		return &hw_stats->erx;
	} else {
		struct be_hw_stats_v2 *hw_stats = hw_stats_from_cmd(adapter);

336 337 338 339 340
		return &hw_stats->erx;
	}
}

static void populate_be_v0_stats(struct be_adapter *adapter)
341
{
342 343 344
	struct be_hw_stats_v0 *hw_stats = hw_stats_from_cmd(adapter);
	struct be_pmem_stats *pmem_sts = &hw_stats->pmem;
	struct be_rxf_stats_v0 *rxf_stats = &hw_stats->rxf;
345
	struct be_port_rxf_stats_v0 *port_stats =
346 347
					&rxf_stats->port[adapter->port_num];
	struct be_drv_stats *drvs = &adapter->drv_stats;
348

349
	be_dws_le_to_cpu(hw_stats, sizeof(*hw_stats));
350 351 352 353 354 355 356 357 358 359 360 361 362 363
	drvs->rx_pause_frames = port_stats->rx_pause_frames;
	drvs->rx_crc_errors = port_stats->rx_crc_errors;
	drvs->rx_control_frames = port_stats->rx_control_frames;
	drvs->rx_in_range_errors = port_stats->rx_in_range_errors;
	drvs->rx_frame_too_long = port_stats->rx_frame_too_long;
	drvs->rx_dropped_runt = port_stats->rx_dropped_runt;
	drvs->rx_ip_checksum_errs = port_stats->rx_ip_checksum_errs;
	drvs->rx_tcp_checksum_errs = port_stats->rx_tcp_checksum_errs;
	drvs->rx_udp_checksum_errs = port_stats->rx_udp_checksum_errs;
	drvs->rxpp_fifo_overflow_drop = port_stats->rx_fifo_overflow;
	drvs->rx_dropped_tcp_length = port_stats->rx_dropped_tcp_length;
	drvs->rx_dropped_too_small = port_stats->rx_dropped_too_small;
	drvs->rx_dropped_too_short = port_stats->rx_dropped_too_short;
	drvs->rx_out_range_errors = port_stats->rx_out_range_errors;
364
	drvs->rx_input_fifo_overflow_drop = port_stats->rx_input_fifo_overflow;
365 366
	drvs->rx_dropped_header_too_small =
		port_stats->rx_dropped_header_too_small;
367 368 369
	drvs->rx_address_filtered =
					port_stats->rx_address_filtered +
					port_stats->rx_vlan_filtered;
370 371 372 373 374 375 376
	drvs->rx_alignment_symbol_errors =
		port_stats->rx_alignment_symbol_errors;

	drvs->tx_pauseframes = port_stats->tx_pauseframes;
	drvs->tx_controlframes = port_stats->tx_controlframes;

	if (adapter->port_num)
377
		drvs->jabber_events = rxf_stats->port1_jabber_events;
378
	else
379
		drvs->jabber_events = rxf_stats->port0_jabber_events;
380 381 382 383
	drvs->rx_drops_no_pbuf = rxf_stats->rx_drops_no_pbuf;
	drvs->rx_drops_no_erx_descr = rxf_stats->rx_drops_no_erx_descr;
	drvs->forwarded_packets = rxf_stats->forwarded_packets;
	drvs->rx_drops_mtu = rxf_stats->rx_drops_mtu;
384 385
	drvs->rx_drops_no_tpre_descr = rxf_stats->rx_drops_no_tpre_descr;
	drvs->rx_drops_too_many_frags = rxf_stats->rx_drops_too_many_frags;
386 387 388
	adapter->drv_stats.eth_red_drops = pmem_sts->eth_red_drops;
}

389
static void populate_be_v1_stats(struct be_adapter *adapter)
390
{
391 392 393
	struct be_hw_stats_v1 *hw_stats = hw_stats_from_cmd(adapter);
	struct be_pmem_stats *pmem_sts = &hw_stats->pmem;
	struct be_rxf_stats_v1 *rxf_stats = &hw_stats->rxf;
394
	struct be_port_rxf_stats_v1 *port_stats =
395 396
					&rxf_stats->port[adapter->port_num];
	struct be_drv_stats *drvs = &adapter->drv_stats;
397

398
	be_dws_le_to_cpu(hw_stats, sizeof(*hw_stats));
399 400
	drvs->pmem_fifo_overflow_drop = port_stats->pmem_fifo_overflow_drop;
	drvs->rx_priority_pause_frames = port_stats->rx_priority_pause_frames;
401 402 403 404 405 406 407 408 409 410 411 412 413 414 415 416 417
	drvs->rx_pause_frames = port_stats->rx_pause_frames;
	drvs->rx_crc_errors = port_stats->rx_crc_errors;
	drvs->rx_control_frames = port_stats->rx_control_frames;
	drvs->rx_in_range_errors = port_stats->rx_in_range_errors;
	drvs->rx_frame_too_long = port_stats->rx_frame_too_long;
	drvs->rx_dropped_runt = port_stats->rx_dropped_runt;
	drvs->rx_ip_checksum_errs = port_stats->rx_ip_checksum_errs;
	drvs->rx_tcp_checksum_errs = port_stats->rx_tcp_checksum_errs;
	drvs->rx_udp_checksum_errs = port_stats->rx_udp_checksum_errs;
	drvs->rx_dropped_tcp_length = port_stats->rx_dropped_tcp_length;
	drvs->rx_dropped_too_small = port_stats->rx_dropped_too_small;
	drvs->rx_dropped_too_short = port_stats->rx_dropped_too_short;
	drvs->rx_out_range_errors = port_stats->rx_out_range_errors;
	drvs->rx_dropped_header_too_small =
		port_stats->rx_dropped_header_too_small;
	drvs->rx_input_fifo_overflow_drop =
		port_stats->rx_input_fifo_overflow_drop;
418
	drvs->rx_address_filtered = port_stats->rx_address_filtered;
419 420
	drvs->rx_alignment_symbol_errors =
		port_stats->rx_alignment_symbol_errors;
421
	drvs->rxpp_fifo_overflow_drop = port_stats->rxpp_fifo_overflow_drop;
422 423
	drvs->tx_pauseframes = port_stats->tx_pauseframes;
	drvs->tx_controlframes = port_stats->tx_controlframes;
424
	drvs->tx_priority_pauseframes = port_stats->tx_priority_pauseframes;
425 426 427 428 429
	drvs->jabber_events = port_stats->jabber_events;
	drvs->rx_drops_no_pbuf = rxf_stats->rx_drops_no_pbuf;
	drvs->rx_drops_no_erx_descr = rxf_stats->rx_drops_no_erx_descr;
	drvs->forwarded_packets = rxf_stats->forwarded_packets;
	drvs->rx_drops_mtu = rxf_stats->rx_drops_mtu;
430 431
	drvs->rx_drops_no_tpre_descr = rxf_stats->rx_drops_no_tpre_descr;
	drvs->rx_drops_too_many_frags = rxf_stats->rx_drops_too_many_frags;
432 433 434
	adapter->drv_stats.eth_red_drops = pmem_sts->eth_red_drops;
}

435 436 437 438 439 440 441 442 443 444 445 446 447 448 449 450 451 452 453 454 455 456 457 458 459 460 461 462 463 464 465 466 467 468 469 470 471 472 473 474 475 476 477 478
/* Copy the v2-layout HW statistics of this adapter's port into
 * adapter->drv_stats. The stats buffer is passed through
 * be_dws_le_to_cpu() before any counter is read. RoCE counters are copied
 * only when be_roce_supported() says so.
 */
static void populate_be_v2_stats(struct be_adapter *adapter)
{
	struct be_hw_stats_v2 *hw = hw_stats_from_cmd(adapter);
	struct be_rxf_stats_v2 *rxf = &hw->rxf;
	struct be_port_rxf_stats_v2 *port = &rxf->port[adapter->port_num];
	struct be_pmem_stats *pmem = &hw->pmem;
	struct be_drv_stats *drv = &adapter->drv_stats;

	be_dws_le_to_cpu(hw, sizeof(*hw));

	/* per-port RX counters */
	drv->rx_pause_frames = port->rx_pause_frames;
	drv->rx_priority_pause_frames = port->rx_priority_pause_frames;
	drv->rx_crc_errors = port->rx_crc_errors;
	drv->rx_control_frames = port->rx_control_frames;
	drv->rx_in_range_errors = port->rx_in_range_errors;
	drv->rx_out_range_errors = port->rx_out_range_errors;
	drv->rx_frame_too_long = port->rx_frame_too_long;
	drv->rx_dropped_runt = port->rx_dropped_runt;
	drv->rx_ip_checksum_errs = port->rx_ip_checksum_errs;
	drv->rx_tcp_checksum_errs = port->rx_tcp_checksum_errs;
	drv->rx_udp_checksum_errs = port->rx_udp_checksum_errs;
	drv->rx_dropped_tcp_length = port->rx_dropped_tcp_length;
	drv->rx_dropped_too_small = port->rx_dropped_too_small;
	drv->rx_dropped_too_short = port->rx_dropped_too_short;
	drv->rx_dropped_header_too_small = port->rx_dropped_header_too_small;
	drv->rx_alignment_symbol_errors = port->rx_alignment_symbol_errors;
	drv->rx_address_filtered = port->rx_address_filtered;
	drv->pmem_fifo_overflow_drop = port->pmem_fifo_overflow_drop;
	drv->rxpp_fifo_overflow_drop = port->rxpp_fifo_overflow_drop;
	drv->rx_input_fifo_overflow_drop = port->rx_input_fifo_overflow_drop;
	drv->jabber_events = port->jabber_events;

	/* per-port TX counters */
	drv->tx_pauseframes = port->tx_pauseframes;
	drv->tx_controlframes = port->tx_controlframes;
	drv->tx_priority_pauseframes = port->tx_priority_pauseframes;

	/* counters kept outside the per-port block */
	drv->rx_drops_no_pbuf = rxf->rx_drops_no_pbuf;
	drv->rx_drops_no_erx_descr = rxf->rx_drops_no_erx_descr;
	drv->rx_drops_no_tpre_descr = rxf->rx_drops_no_tpre_descr;
	drv->rx_drops_too_many_frags = rxf->rx_drops_too_many_frags;
	drv->rx_drops_mtu = rxf->rx_drops_mtu;
	drv->forwarded_packets = rxf->forwarded_packets;
	drv->eth_red_drops = pmem->eth_red_drops;

	if (!be_roce_supported(adapter))
		return;

	/* RoCE counters */
	drv->rx_roce_bytes_lsd = port->roce_bytes_received_lsd;
	drv->rx_roce_bytes_msd = port->roce_bytes_received_msd;
	drv->rx_roce_frames = port->roce_frames_received;
	drv->roce_drops_crc = port->roce_drops_crc;
	drv->roce_drops_payload_len = port->roce_drops_payload_len;
}

S
Selvin Xavier 已提交
489 490
static void populate_lancer_stats(struct be_adapter *adapter)
{
491

S
Selvin Xavier 已提交
492
	struct be_drv_stats *drvs = &adapter->drv_stats;
493
	struct lancer_pport_stats *pport_stats = pport_stats_from_cmd(adapter);
494 495 496 497 498

	be_dws_le_to_cpu(pport_stats, sizeof(*pport_stats));
	drvs->rx_pause_frames = pport_stats->rx_pause_frames_lo;
	drvs->rx_crc_errors = pport_stats->rx_crc_errors_lo;
	drvs->rx_control_frames = pport_stats->rx_control_frames_lo;
S
Selvin Xavier 已提交
499
	drvs->rx_in_range_errors = pport_stats->rx_in_range_errors;
500
	drvs->rx_frame_too_long = pport_stats->rx_frames_too_long_lo;
S
Selvin Xavier 已提交
501 502 503 504 505 506 507 508 509 510 511 512
	drvs->rx_dropped_runt = pport_stats->rx_dropped_runt;
	drvs->rx_ip_checksum_errs = pport_stats->rx_ip_checksum_errors;
	drvs->rx_tcp_checksum_errs = pport_stats->rx_tcp_checksum_errors;
	drvs->rx_udp_checksum_errs = pport_stats->rx_udp_checksum_errors;
	drvs->rx_dropped_tcp_length =
				pport_stats->rx_dropped_invalid_tcp_length;
	drvs->rx_dropped_too_small = pport_stats->rx_dropped_too_small;
	drvs->rx_dropped_too_short = pport_stats->rx_dropped_too_short;
	drvs->rx_out_range_errors = pport_stats->rx_out_of_range_errors;
	drvs->rx_dropped_header_too_small =
				pport_stats->rx_dropped_header_too_small;
	drvs->rx_input_fifo_overflow_drop = pport_stats->rx_fifo_overflow;
513 514 515
	drvs->rx_address_filtered =
					pport_stats->rx_address_filtered +
					pport_stats->rx_vlan_filtered;
516
	drvs->rx_alignment_symbol_errors = pport_stats->rx_symbol_errors_lo;
S
Selvin Xavier 已提交
517
	drvs->rxpp_fifo_overflow_drop = pport_stats->rx_fifo_overflow;
518 519
	drvs->tx_pauseframes = pport_stats->tx_pause_frames_lo;
	drvs->tx_controlframes = pport_stats->tx_control_frames_lo;
S
Selvin Xavier 已提交
520
	drvs->jabber_events = pport_stats->rx_jabbers;
521 522
	drvs->forwarded_packets = pport_stats->num_forwards_lo;
	drvs->rx_drops_mtu = pport_stats->rx_drops_mtu_lo;
S
Selvin Xavier 已提交
523
	drvs->rx_drops_too_many_frags =
524
				pport_stats->rx_drops_too_many_frags_lo;
S
Selvin Xavier 已提交
525
}
526

527 528 529 530 531 532 533 534 535 536 537 538
/* Fold a new sample @val of a 16-bit counter into the 32-bit accumulator
 * @acc.
 *
 * The low 16 bits of *acc hold the previous sample and the high 16 bits
 * count wrap-arounds. A sample smaller than the previous one is treated as
 * a wrap, so 65536 is added on top of the new sample.
 * The result is stored with a single ACCESS_ONCE() write.
 */
static void accumulate_16bit_val(u32 *acc, u16 val)
{
/* macro arguments are parenthesized so any expression can be passed safely */
#define lo(x)			((x) & 0xFFFF)
#define hi(x)			((x) & 0xFFFF0000)
	bool wrapped = val < lo(*acc);
	u32 newacc = hi(*acc) + val;

	if (wrapped)
		newacc += 65536;
	ACCESS_ONCE(*acc) = newacc;
}

J
Jingoo Han 已提交
539
/* Record the "RX drops, no fragments" ERX counter @erx_stat for @rxo.
 * On BEx chips the sample is truncated to 16 bits and accumulated; on all
 * other chips the value is stored as is.
 */
static void populate_erx_stats(struct be_adapter *adapter,
			       struct be_rx_obj *rxo, u32 erx_stat)
{
	if (BEx_chip(adapter)) {
		/* below erx HW counter can actually wrap around after
		 * 65535. Driver accumulates a 32-bit value
		 */
		accumulate_16bit_val(&rx_stats(rxo)->rx_drops_no_frags,
				     (u16)erx_stat);
		return;
	}

	rx_stats(rxo)->rx_drops_no_frags = erx_stat;
}

552 553
void be_parse_stats(struct be_adapter *adapter)
{
554
	struct be_erx_stats_v2 *erx = be_erx_stats_from_cmd(adapter);
555 556
	struct be_rx_obj *rxo;
	int i;
557
	u32 erx_stat;
558

559 560
	if (lancer_chip(adapter)) {
		populate_lancer_stats(adapter);
S
Selvin Xavier 已提交
561
	} else {
562 563
		if (BE2_chip(adapter))
			populate_be_v0_stats(adapter);
564 565
		else if (BE3_chip(adapter))
			/* for BE3 */
566
			populate_be_v1_stats(adapter);
567 568
		else
			populate_be_v2_stats(adapter);
569

570
		/* erx_v2 is longer than v0, v1. use v2 for v0, v1 access */
571
		for_all_rx_queues(adapter, rxo, i) {
572 573
			erx_stat = erx->rx_drops_no_fragments[rxo->q.id];
			populate_erx_stats(adapter, rxo, erx_stat);
574
		}
575
	}
576 577
}

578
static struct rtnl_link_stats64 *be_get_stats64(struct net_device *netdev,
579
						struct rtnl_link_stats64 *stats)
S
Sathya Perla 已提交
580
{
581
	struct be_adapter *adapter = netdev_priv(netdev);
582
	struct be_drv_stats *drvs = &adapter->drv_stats;
583
	struct be_rx_obj *rxo;
584
	struct be_tx_obj *txo;
585 586
	u64 pkts, bytes;
	unsigned int start;
587
	int i;
S
Sathya Perla 已提交
588

589
	for_all_rx_queues(adapter, rxo, i) {
590 591
		const struct be_rx_stats *rx_stats = rx_stats(rxo);
		do {
592
			start = u64_stats_fetch_begin_irq(&rx_stats->sync);
593 594
			pkts = rx_stats(rxo)->rx_pkts;
			bytes = rx_stats(rxo)->rx_bytes;
595
		} while (u64_stats_fetch_retry_irq(&rx_stats->sync, start));
596 597 598 599 600
		stats->rx_packets += pkts;
		stats->rx_bytes += bytes;
		stats->multicast += rx_stats(rxo)->rx_mcast_pkts;
		stats->rx_dropped += rx_stats(rxo)->rx_drops_no_skbs +
					rx_stats(rxo)->rx_drops_no_frags;
601 602
	}

603
	for_all_tx_queues(adapter, txo, i) {
604 605
		const struct be_tx_stats *tx_stats = tx_stats(txo);
		do {
606
			start = u64_stats_fetch_begin_irq(&tx_stats->sync);
607 608
			pkts = tx_stats(txo)->tx_pkts;
			bytes = tx_stats(txo)->tx_bytes;
609
		} while (u64_stats_fetch_retry_irq(&tx_stats->sync, start));
610 611
		stats->tx_packets += pkts;
		stats->tx_bytes += bytes;
612
	}
S
Sathya Perla 已提交
613 614

	/* bad pkts received */
615
	stats->rx_errors = drvs->rx_crc_errors +
616 617 618 619 620 621 622 623
		drvs->rx_alignment_symbol_errors +
		drvs->rx_in_range_errors +
		drvs->rx_out_range_errors +
		drvs->rx_frame_too_long +
		drvs->rx_dropped_too_small +
		drvs->rx_dropped_too_short +
		drvs->rx_dropped_header_too_small +
		drvs->rx_dropped_tcp_length +
624
		drvs->rx_dropped_runt;
625

S
Sathya Perla 已提交
626
	/* detailed rx errors */
627
	stats->rx_length_errors = drvs->rx_in_range_errors +
628 629
		drvs->rx_out_range_errors +
		drvs->rx_frame_too_long;
630

631
	stats->rx_crc_errors = drvs->rx_crc_errors;
S
Sathya Perla 已提交
632 633

	/* frame alignment errors */
634
	stats->rx_frame_errors = drvs->rx_alignment_symbol_errors;
635

S
Sathya Perla 已提交
636 637
	/* receiver fifo overrun */
	/* drops_no_pbuf is no per i/f, it's per BE card */
638
	stats->rx_fifo_errors = drvs->rxpp_fifo_overflow_drop +
639 640
				drvs->rx_input_fifo_overflow_drop +
				drvs->rx_drops_no_pbuf;
641
	return stats;
S
Sathya Perla 已提交
642 643
}

644
/* Propagate the link state to the net device's carrier state.
 * The first call also forces the carrier off once and marks the link status
 * as initialized in adapter->flags.
 */
void be_link_status_update(struct be_adapter *adapter, u8 link_status)
{
	struct net_device *ndev = adapter->netdev;
	bool first_update = !(adapter->flags & BE_FLAGS_LINK_STATUS_INIT);

	if (first_update) {
		netif_carrier_off(ndev);
		adapter->flags |= BE_FLAGS_LINK_STATUS_INIT;
	}

	if (!link_status)
		netif_carrier_off(ndev);
	else
		netif_carrier_on(ndev);
}

659
/* Account one transmit request in the TX queue statistics.
 * @wrb_cnt:  WRBs used by the request
 * @copied:   bytes queued for transmission
 * @gso_segs: GSO segment count; 0 is counted as a single packet
 * @stopped:  true if the queue was stopped by this request
 */
static void be_tx_stats_update(struct be_tx_obj *txo,
			       u32 wrb_cnt, u32 copied, u32 gso_segs,
			       bool stopped)
{
	struct be_tx_stats *txs = tx_stats(txo);
	u32 npkts = gso_segs;

	if (!npkts)
		npkts = 1;

	u64_stats_update_begin(&txs->sync);
	txs->tx_reqs++;
	txs->tx_wrbs += wrb_cnt;
	txs->tx_bytes += copied;
	txs->tx_pkts += npkts;
	if (stopped)
		txs->tx_stops++;
	u64_stats_update_end(&txs->sync);
}

/* Determine number of WRB entries needed to xmit data in an skb */
676
static u32 wrb_cnt_for_skb(struct be_adapter *adapter, struct sk_buff *skb,
677
			   bool *dummy)
S
Sathya Perla 已提交
678
{
679 680 681 682
	int cnt = (skb->len > skb->data_len);

	cnt += skb_shinfo(skb)->nr_frags;

S
Sathya Perla 已提交
683 684
	/* to account for hdr wrb */
	cnt++;
685 686 687
	if (lancer_chip(adapter) || !(cnt & 1)) {
		*dummy = false;
	} else {
S
Sathya Perla 已提交
688 689 690
		/* add a dummy to make it an even num */
		cnt++;
		*dummy = true;
691
	}
S
Sathya Perla 已提交
692 693 694 695 696 697 698 699 700
	BUG_ON(cnt > BE_MAX_TX_FRAG_COUNT);
	return cnt;
}

/* Fill a fragment WRB with the DMA address and length of one buffer.
 * The address is split into its upper and lower 32 bits and the length is
 * masked with ETH_WRB_FRAG_LEN_MASK.
 */
static inline void wrb_fill(struct be_eth_wrb *wrb, u64 addr, int len)
{
	wrb->rsvd0 = 0;
	wrb->frag_len = len & ETH_WRB_FRAG_LEN_MASK;
	wrb->frag_pa_lo = lower_32_bits(addr);
	wrb->frag_pa_hi = upper_32_bits(addr);
}

704
static inline u16 be_get_tx_vlan_tag(struct be_adapter *adapter,
705
				     struct sk_buff *skb)
706 707 708 709 710 711 712 713 714 715 716 717 718 719
{
	u8 vlan_prio;
	u16 vlan_tag;

	vlan_tag = vlan_tx_tag_get(skb);
	vlan_prio = (vlan_tag & VLAN_PRIO_MASK) >> VLAN_PRIO_SHIFT;
	/* If vlan priority provided by OS is NOT in available bmap */
	if (!(adapter->vlan_prio_bmap & (1 << vlan_prio)))
		vlan_tag = (vlan_tag & ~VLAN_PRIO_MASK) |
				adapter->recommended_prio;

	return vlan_tag;
}

720 721 722 723 724 725 726 727 728 729 730 731 732
/* Used only for IP tunnel packets.
 * Returns the protocol field of the inner IPv4 header when its version is 4,
 * otherwise the nexthdr field of the inner IPv6 header.
 */
static u16 skb_inner_ip_proto(struct sk_buff *skb)
{
	if (inner_ip_hdr(skb)->version == 4)
		return inner_ip_hdr(skb)->protocol;

	return inner_ipv6_hdr(skb)->nexthdr;
}

/* Returns the protocol field of the IPv4 header when its version is 4,
 * otherwise the nexthdr field of the IPv6 header.
 */
static u16 skb_ip_proto(struct sk_buff *skb)
{
	if (ip_hdr(skb)->version == 4)
		return ip_hdr(skb)->protocol;

	return ipv6_hdr(skb)->nexthdr;
}

733
/* Build the header WRB of a transmit request.
 * @hdr:          header WRB to fill (zeroed first)
 * @skb:          packet being sent; drives the LSO/checksum/VLAN bits
 * @wrb_cnt:      total number of WRBs of the request
 * @len:          total number of payload bytes
 * @skip_hw_vlan: clear the "complete" bit so that HW VLAN tagging is skipped
 */
static void wrb_fill_hdr(struct be_adapter *adapter, struct be_eth_hdr_wrb *hdr,
			 struct sk_buff *skb, u32 wrb_cnt, u32 len,
			 bool skip_hw_vlan)
{
	memset(hdr, 0, sizeof(*hdr));

	AMAP_SET_BITS(struct amap_eth_hdr_wrb, crc, hdr, 1);

	if (skb_is_gso(skb)) {
		/* segmentation offload */
		AMAP_SET_BITS(struct amap_eth_hdr_wrb, lso, hdr, 1);
		AMAP_SET_BITS(struct amap_eth_hdr_wrb, lso_mss,
			      hdr, skb_shinfo(skb)->gso_size);
		if (skb_is_gso_v6(skb) && !lancer_chip(adapter))
			AMAP_SET_BITS(struct amap_eth_hdr_wrb, lso6, hdr, 1);
	} else if (skb->ip_summed == CHECKSUM_PARTIAL) {
		/* checksum offload; for tunnels the inner L4 proto decides */
		u16 l4_proto;

		if (skb->encapsulation) {
			AMAP_SET_BITS(struct amap_eth_hdr_wrb, ipcs, hdr, 1);
			l4_proto = skb_inner_ip_proto(skb);
		} else {
			l4_proto = skb_ip_proto(skb);
		}

		switch (l4_proto) {
		case IPPROTO_TCP:
			AMAP_SET_BITS(struct amap_eth_hdr_wrb, tcpcs, hdr, 1);
			break;
		case IPPROTO_UDP:
			AMAP_SET_BITS(struct amap_eth_hdr_wrb, udpcs, hdr, 1);
			break;
		default:
			break;
		}
	}

	if (vlan_tx_tag_present(skb)) {
		u16 tag = be_get_tx_vlan_tag(adapter, skb);

		AMAP_SET_BITS(struct amap_eth_hdr_wrb, vlan, hdr, 1);
		AMAP_SET_BITS(struct amap_eth_hdr_wrb, vlan_tag, hdr, tag);
	}

	/* To skip HW VLAN tagging: evt = 1, compl = 0 */
	AMAP_SET_BITS(struct amap_eth_hdr_wrb, complete, hdr, !skip_hw_vlan);
	AMAP_SET_BITS(struct amap_eth_hdr_wrb, event, hdr, 1);
	AMAP_SET_BITS(struct amap_eth_hdr_wrb, num_wrb, hdr, wrb_cnt);
	AMAP_SET_BITS(struct amap_eth_hdr_wrb, len, hdr, len);
}

I
Ivan Vecera 已提交
775
static void unmap_tx_frag(struct device *dev, struct be_eth_wrb *wrb,
776
			  bool unmap_single)
777 778 779 780 781 782
{
	dma_addr_t dma;

	be_dws_le_to_cpu(wrb, sizeof(*wrb));

	dma = (u64)wrb->frag_pa_hi << 32 | (u64)wrb->frag_pa_lo;
783
	if (wrb->frag_len) {
784
		if (unmap_single)
I
Ivan Vecera 已提交
785 786
			dma_unmap_single(dev, dma, wrb->frag_len,
					 DMA_TO_DEVICE);
787
		else
I
Ivan Vecera 已提交
788
			dma_unmap_page(dev, dma, wrb->frag_len, DMA_TO_DEVICE);
789 790
	}
}
S
Sathya Perla 已提交
791

792
/* DMA-map @skb and write its WRBs into @txq: a header WRB, one WRB for the
 * linear data (if any), one per page fragment and, if @dummy_wrb is set, a
 * zero-length padding WRB.
 *
 * Returns the number of bytes mapped. On a DMA mapping error every mapping
 * done so far is undone and 0 is returned; in that case txq->head is left
 * past the WRBs that were walked during the unwind.
 */
static int make_tx_wrbs(struct be_adapter *adapter, struct be_queue_info *txq,
			struct sk_buff *skb, u32 wrb_cnt, bool dummy_wrb,
			bool skip_hw_vlan)
{
	struct device *dev = &adapter->pdev->dev;
	struct be_eth_hdr_wrb *hdr;
	struct be_eth_wrb *wrb;
	bool map_single = false;
	dma_addr_t busaddr;
	int i, copied = 0;
	u16 map_head;

	/* reserve the header WRB; it is filled in last, once the total
	 * length is known
	 */
	hdr = queue_head_node(txq);
	queue_head_inc(txq);
	map_head = txq->head;

	/* linear part of the skb */
	if (skb->len > skb->data_len) {
		int headlen = skb_headlen(skb);

		busaddr = dma_map_single(dev, skb->data, headlen,
					 DMA_TO_DEVICE);
		if (dma_mapping_error(dev, busaddr))
			goto dma_err;
		map_single = true;

		wrb = queue_head_node(txq);
		wrb_fill(wrb, busaddr, headlen);
		be_dws_cpu_to_le(wrb, sizeof(*wrb));
		queue_head_inc(txq);
		copied += headlen;
	}

	/* page fragments */
	for (i = 0; i < skb_shinfo(skb)->nr_frags; i++) {
		const struct skb_frag_struct *frag = &skb_shinfo(skb)->frags[i];

		busaddr = skb_frag_dma_map(dev, frag, 0,
					   skb_frag_size(frag), DMA_TO_DEVICE);
		if (dma_mapping_error(dev, busaddr))
			goto dma_err;

		wrb = queue_head_node(txq);
		wrb_fill(wrb, busaddr, skb_frag_size(frag));
		be_dws_cpu_to_le(wrb, sizeof(*wrb));
		queue_head_inc(txq);
		copied += skb_frag_size(frag);
	}

	/* zero-length padding WRB */
	if (dummy_wrb) {
		wrb = queue_head_node(txq);
		wrb_fill(wrb, 0, 0);
		be_dws_cpu_to_le(wrb, sizeof(*wrb));
		queue_head_inc(txq);
	}

	wrb_fill_hdr(adapter, hdr, skb, wrb_cnt, copied, skip_hw_vlan);
	be_dws_cpu_to_le(hdr, sizeof(*hdr));

	return copied;

dma_err:
	/* walk the WRBs written so far, starting right after the header, and
	 * unmap them; only the first one can be a dma_map_single() mapping
	 */
	txq->head = map_head;
	while (copied) {
		wrb = queue_head_node(txq);
		unmap_tx_frag(dev, wrb, map_single);
		map_single = false;
		copied -= wrb->frag_len;
		queue_head_inc(txq);
	}
	return 0;
}

858
/* Insert the VLAN tag(s) into the packet data in the driver instead of
 * leaving it to the HW.
 * Returns the (possibly different) skb, or NULL when skb_share_check() or
 * __vlan_put_tag() did not hand back an skb.
 * @skip_hw_vlan may be NULL; when it is not, it is set to true whenever the
 * pvid/QnQ handling below requires HW VLAN insertion to be skipped.
 */
static struct sk_buff *be_insert_vlan_in_pkt(struct be_adapter *adapter,
					     struct sk_buff *skb,
					     bool *skip_hw_vlan)
{
	u16 inner_tag = 0;

	skb = skb_share_check(skb, GFP_ATOMIC);
	if (unlikely(!skb))
		return NULL;

	/* Tag requested by the stack, if any */
	if (vlan_tx_tag_present(skb))
		inner_tag = be_get_tx_vlan_tag(adapter, skb);

	if (qnq_async_evt_rcvd(adapter) && adapter->pvid) {
		/* Untagged pkts get the port's pvid */
		if (!inner_tag)
			inner_tag = adapter->pvid;
		/* f/w workaround: skip_hw_vlan = 1 tells the F/W to skip
		 * VLAN insertion
		 */
		if (skip_hw_vlan)
			*skip_hw_vlan = true;
	}

	if (inner_tag) {
		skb = __vlan_put_tag(skb, htons(ETH_P_8021Q), inner_tag);
		if (unlikely(!skb))
			return NULL;
		/* The tag now lives in the pkt data, not in the skb metadata */
		skb->vlan_tci = 0;
	}

	/* No outer (QnQ) VLAN configured: nothing more to insert */
	if (!adapter->qnq_vid)
		return skb;

	skb = __vlan_put_tag(skb, htons(ETH_P_8021Q), adapter->qnq_vid);
	if (unlikely(!skb))
		return NULL;
	if (skip_hw_vlan)
		*skip_hw_vlan = true;

	return skb;
}

901 902 903 904 905 906 907 908 909 910 911 912 913 914 915 916 917 918 919 920 921 922 923 924 925 926 927
/* Returns true for an IPv6 frame whose next-header is neither TCP nor UDP
 * and whose 2nd byte following the IPv6 header (the hdrlen field of what is
 * read as an ipv6_opt_hdr) is 0xff.
 * The headers are read directly from skb->data at fixed offsets.
 */
static bool be_ipv6_exthdr_check(struct sk_buff *skb)
{
	struct ethhdr *eh = (struct ethhdr *)skb->data;
	struct ipv6_opt_hdr *opt;
	struct ipv6hdr *ip6h;

	if (eh->h_proto != htons(ETH_P_IPV6))
		return false;

	ip6h = (struct ipv6hdr *)(skb->data + ETH_HLEN);
	if (ip6h->nexthdr == NEXTHDR_TCP || ip6h->nexthdr == NEXTHDR_UDP)
		return false;

	/* offending pkt: 2nd byte following IPv6 hdr is 0xff */
	opt = (struct ipv6_opt_hdr *)(skb->data + ETH_HLEN +
				      sizeof(struct ipv6hdr));
	return opt->hdrlen == 0xff;
}

/* Non-zero when the pkt carries a VLAN tag in its skb metadata, or when the
 * adapter has a pvid or a QnQ vid configured.
 */
static int be_vlan_tag_tx_chk(struct be_adapter *adapter, struct sk_buff *skb)
{
	if (vlan_tx_tag_present(skb))
		return 1;
	if (adapter->pvid)
		return 1;
	return adapter->qnq_vid ? 1 : 0;
}

928
/* Non-zero only on BE3 chips, and only for pkts flagged by
 * be_ipv6_exthdr_check().
 */
static int be_ipv6_tx_stall_chk(struct be_adapter *adapter, struct sk_buff *skb)
{
	if (!BE3_chip(adapter))
		return 0;

	return be_ipv6_exthdr_check(skb) ? 1 : 0;
}

933 934 935
/* Apply the TX workarounds needed before a pkt is handed to the HW.
 * Returns the skb to transmit (it may differ from the one passed in), or
 * NULL when the pkt must not be sent; on the ipv6 drop path below the skb
 * is freed here.
 * *skip_hw_vlan is set when HW VLAN tagging must be skipped for this pkt.
 */
static struct sk_buff *be_lancer_xmit_workarounds(struct be_adapter *adapter,
						  struct sk_buff *skb,
						  bool *skip_hw_vlan)
{
	struct vlan_ethhdr *veh = (struct vlan_ethhdr *)skb->data;
	unsigned int l2_hdr_len = ETH_HLEN;

	if (ntohs(skb->protocol) == ETH_P_8021Q)
		l2_hdr_len = VLAN_ETH_HLEN;

	/* For padded packets, BE HW modifies the tot_len field in the IP
	 * header incorrectly when the VLAN tag is inserted by HW.
	 * For padded packets, Lancer computes an incorrect checksum.
	 * So trim short ipv4 pkts back to the length given in the IP header.
	 */
	if (skb->len <= 60 &&
	    (lancer_chip(adapter) || vlan_tx_tag_present(skb)) &&
	    is_ipv4_pkt(skb)) {
		struct iphdr *iph = (struct iphdr *)ip_hdr(skb);

		pskb_trim(skb, l2_hdr_len + ntohs(iph->tot_len));
	}

	/* If the vlan tag is already inlined in the packet, skip HW VLAN
	 * tagging in pvid-tagging mode
	 */
	if (be_pvid_tagging_enabled(adapter) &&
	    veh->h_vlan_proto == htons(ETH_P_8021Q))
		*skip_hw_vlan = true;

	/* HW has a bug wherein it will calculate CSUM for VLAN
	 * pkts even though it is disabled.
	 * Manually insert VLAN in pkt.
	 */
	if (skb->ip_summed != CHECKSUM_PARTIAL && vlan_tx_tag_present(skb)) {
		skb = be_insert_vlan_in_pkt(adapter, skb, skip_hw_vlan);
		if (unlikely(!skb))
			return NULL;
	}

	/* HW may lockup when VLAN HW tagging is requested on
	 * certain ipv6 packets. Drop such pkts if the HW workaround to
	 * skip HW tagging is not enabled by FW.
	 */
	if (unlikely(be_ipv6_tx_stall_chk(adapter, skb) &&
		     (adapter->pvid || adapter->qnq_vid) &&
		     !qnq_async_evt_rcvd(adapter))) {
		dev_kfree_skb_any(skb);
		return NULL;
	}

	/* Manual VLAN tag insertion to prevent:
	 * ASIC lockup when the ASIC inserts VLAN tag into
	 * certain ipv6 packets. Insert VLAN tags in driver,
	 * and set event, completion, vlan bits accordingly
	 * in the Tx WRB.
	 */
	if (be_ipv6_tx_stall_chk(adapter, skb) &&
	    be_vlan_tag_tx_chk(adapter, skb)) {
		skb = be_insert_vlan_in_pkt(adapter, skb, skip_hw_vlan);
		if (unlikely(!skb))
			return NULL;
	}

	return skb;
}

1001 1002 1003 1004 1005 1006 1007 1008 1009 1010 1011 1012 1013 1014 1015 1016 1017 1018 1019 1020 1021 1022 1023
/* Chip-specific fix-ups applied to every pkt before it is queued for TX.
 * Returns the skb to send, or NULL if padding failed or the chip-specific
 * workarounds decided the pkt cannot be sent.
 */
static struct sk_buff *be_xmit_workarounds(struct be_adapter *adapter,
					   struct sk_buff *skb,
					   bool *skip_hw_vlan)
{
	/* Lancer, SH-R ASICs have a bug wherein Packets that are 32 bytes or
	 * less may cause a transmit stall on that port. So the work-around is
	 * to pad short packets (<= 32 bytes) to a 36-byte length.
	 */
	if (unlikely(!BEx_chip(adapter) && skb->len <= 32)) {
		if (skb_padto(skb, 36))
			return NULL;
		skb->len = 36;
	}

	/* The remaining workarounds only apply to BEx and Lancer chips */
	if (!BEx_chip(adapter) && !lancer_chip(adapter))
		return skb;

	return be_lancer_xmit_workarounds(adapter, skb, skip_hw_vlan);
}

1024 1025 1026 1027 1028 1029 1030 1031 1032 1033 1034
static netdev_tx_t be_xmit(struct sk_buff *skb, struct net_device *netdev)
{
	struct be_adapter *adapter = netdev_priv(netdev);
	struct be_tx_obj *txo = &adapter->tx_obj[skb_get_queue_mapping(skb)];
	struct be_queue_info *txq = &txo->q;
	bool dummy_wrb, stopped = false;
	u32 wrb_cnt = 0, copied = 0;
	bool skip_hw_vlan = false;
	u32 start = txq->head;

	skb = be_xmit_workarounds(adapter, skb, &skip_hw_vlan);
1035 1036
	if (!skb) {
		tx_stats(txo)->tx_drv_drops++;
1037
		return NETDEV_TX_OK;
1038
	}
1039

1040
	wrb_cnt = wrb_cnt_for_skb(adapter, skb, &dummy_wrb);
S
Sathya Perla 已提交
1041

1042 1043
	copied = make_tx_wrbs(adapter, txq, skb, wrb_cnt, dummy_wrb,
			      skip_hw_vlan);
1044
	if (copied) {
E
Eric Dumazet 已提交
1045 1046
		int gso_segs = skb_shinfo(skb)->gso_segs;

1047
		/* record the sent skb in the sent_skb table */
1048 1049
		BUG_ON(txo->sent_skb_list[start]);
		txo->sent_skb_list[start] = skb;
1050 1051 1052 1053 1054

		/* Ensure txq has space for the next skb; Else stop the queue
		 * *BEFORE* ringing the tx doorbell, so that we serialze the
		 * tx compls of the current transmit which'll wake up the queue
		 */
1055
		atomic_add(wrb_cnt, &txq->used);
1056 1057
		if ((BE_MAX_TX_FRAG_COUNT + atomic_read(&txq->used)) >=
								txq->len) {
1058
			netif_stop_subqueue(netdev, skb_get_queue_mapping(skb));
1059 1060
			stopped = true;
		}
S
Sathya Perla 已提交
1061

V
Vasundhara Volam 已提交
1062
		be_txq_notify(adapter, txo, wrb_cnt);
S
Sathya Perla 已提交
1063

E
Eric Dumazet 已提交
1064
		be_tx_stats_update(txo, wrb_cnt, copied, gso_segs, stopped);
1065 1066
	} else {
		txq->head = start;
1067
		tx_stats(txo)->tx_drv_drops++;
1068
		dev_kfree_skb_any(skb);
S
Sathya Perla 已提交
1069 1070 1071 1072 1073 1074 1075 1076
	}
	return NETDEV_TX_OK;
}

static int be_change_mtu(struct net_device *netdev, int new_mtu)
{
	struct be_adapter *adapter = netdev_priv(netdev);
	if (new_mtu < BE_MIN_MTU ||
1077
	    new_mtu > (BE_MAX_JUMBO_FRAME_SIZE - (ETH_HLEN + ETH_FCS_LEN))) {
S
Sathya Perla 已提交
1078
		dev_info(&adapter->pdev->dev,
1079 1080 1081
			 "MTU must be between %d and %d bytes\n",
			 BE_MIN_MTU,
			 (BE_MAX_JUMBO_FRAME_SIZE - (ETH_HLEN + ETH_FCS_LEN)));
S
Sathya Perla 已提交
1082 1083 1084
		return -EINVAL;
	}
	dev_info(&adapter->pdev->dev, "MTU changed from %d to %d bytes\n",
1085
		 netdev->mtu, new_mtu);
S
Sathya Perla 已提交
1086 1087 1088 1089 1090
	netdev->mtu = new_mtu;
	return 0;
}

/*
1091 1092
 * A max of 64 (BE_NUM_VLANS_SUPPORTED) vlans can be configured in BE.
 * If the user configures more, place BE in vlan promiscuous mode.
S
Sathya Perla 已提交
1093
 */
S
Sathya Perla 已提交
1094
static int be_vid_config(struct be_adapter *adapter)
S
Sathya Perla 已提交
1095
{
S
Sathya Perla 已提交
1096
	u16 vids[BE_NUM_VLANS_SUPPORTED];
1097
	u16 num = 0, i = 0;
1098
	int status = 0;
1099

1100 1101 1102 1103
	/* No need to further configure vids if in promiscuous mode */
	if (adapter->promiscuous)
		return 0;

1104
	if (adapter->vlans_added > be_max_vlans(adapter))
1105 1106 1107
		goto set_vlan_promisc;

	/* Construct VLAN Table to give to HW */
1108 1109
	for_each_set_bit(i, adapter->vids, VLAN_N_VID)
		vids[num++] = cpu_to_le16(i);
1110

1111
	status = be_cmd_vlan_config(adapter, adapter->if_handle, vids, num);
1112
	if (status) {
1113
		/* Set to VLAN promisc mode as setting VLAN filter failed */
1114 1115
		if (addl_status(status) ==
				MCC_ADDL_STATUS_INSUFFICIENT_RESOURCES)
1116 1117 1118 1119 1120 1121 1122 1123 1124 1125 1126 1127 1128 1129
			goto set_vlan_promisc;
		dev_err(&adapter->pdev->dev,
			"Setting HW VLAN filtering failed.\n");
	} else {
		if (adapter->flags & BE_FLAGS_VLAN_PROMISC) {
			/* hw VLAN filtering re-enabled. */
			status = be_cmd_rx_filter(adapter,
						  BE_FLAGS_VLAN_PROMISC, OFF);
			if (!status) {
				dev_info(&adapter->pdev->dev,
					 "Disabling VLAN Promiscuous mode.\n");
				adapter->flags &= ~BE_FLAGS_VLAN_PROMISC;
			}
		}
S
Sathya Perla 已提交
1130
	}
1131

1132
	return status;
1133 1134

set_vlan_promisc:
1135 1136
	if (adapter->flags & BE_FLAGS_VLAN_PROMISC)
		return 0;
1137 1138 1139 1140 1141 1142 1143 1144

	status = be_cmd_rx_filter(adapter, BE_FLAGS_VLAN_PROMISC, ON);
	if (!status) {
		dev_info(&adapter->pdev->dev, "Enable VLAN Promiscuous mode\n");
		adapter->flags |= BE_FLAGS_VLAN_PROMISC;
	} else
		dev_err(&adapter->pdev->dev,
			"Failed to enable VLAN Promiscuous mode.\n");
1145
	return status;
S
Sathya Perla 已提交
1146 1147
}

1148
/* Record @vid in the adapter's VLAN bitmap and re-program the VLAN filter.
 * If be_vid_config() fails, the bitmap and the vlans_added count are rolled
 * back and the failing status is returned.
 */
static int be_vlan_add_vid(struct net_device *netdev, __be16 proto, u16 vid)
{
	struct be_adapter *adapter = netdev_priv(netdev);
	int status;

	/* Packets with VID 0 are always received by Lancer by default */
	if (lancer_chip(adapter) && vid == 0)
		return 0;

	/* Already recorded: nothing to do */
	if (test_bit(vid, adapter->vids))
		return 0;

	set_bit(vid, adapter->vids);
	adapter->vlans_added++;

	status = be_vid_config(adapter);
	if (!status)
		return 0;

	/* Undo the bookkeeping done above */
	adapter->vlans_added--;
	clear_bit(vid, adapter->vids);
	return status;
}

1172
/* Remove @vid from the adapter's VLAN bitmap and re-program the VLAN filter.
 * Returns 0 when there is nothing to do, otherwise the result of
 * be_vid_config().
 */
static int be_vlan_rem_vid(struct net_device *netdev, __be16 proto, u16 vid)
{
	struct be_adapter *adapter = netdev_priv(netdev);

	/* Packets with VID 0 are always received by Lancer by default */
	if (lancer_chip(adapter) && vid == 0)
		return 0;

	/* Only account for VIDs that are actually recorded. be_vlan_add_vid()
	 * clears the bit and decrements vlans_added itself when its
	 * be_vid_config() call fails, so decrementing again for such a VID
	 * (or for one that was never added) would corrupt the counter that
	 * be_vid_config() compares against be_max_vlans().
	 */
	if (!test_bit(vid, adapter->vids))
		return 0;

	clear_bit(vid, adapter->vids);
	adapter->vlans_added--;

	return be_vid_config(adapter);
}

1186 1187 1188
static void be_clear_promisc(struct be_adapter *adapter)
{
	adapter->promiscuous = false;
1189
	adapter->flags &= ~(BE_FLAGS_VLAN_PROMISC | BE_FLAGS_MCAST_PROMISC);
1190 1191 1192 1193

	be_cmd_rx_filter(adapter, IFF_PROMISC, OFF);
}

1194
static void be_set_rx_mode(struct net_device *netdev)
S
Sathya Perla 已提交
1195 1196
{
	struct be_adapter *adapter = netdev_priv(netdev);
1197
	int status;
S
Sathya Perla 已提交
1198

1199
	if (netdev->flags & IFF_PROMISC) {
1200
		be_cmd_rx_filter(adapter, IFF_PROMISC, ON);
1201 1202
		adapter->promiscuous = true;
		goto done;
S
Sathya Perla 已提交
1203 1204
	}

L
Lucas De Marchi 已提交
1205
	/* BE was previously in promiscuous mode; disable it */
1206
	if (adapter->promiscuous) {
1207
		be_clear_promisc(adapter);
1208
		if (adapter->vlans_added)
S
Sathya Perla 已提交
1209
			be_vid_config(adapter);
S
Sathya Perla 已提交
1210 1211
	}

1212
	/* Enable multicast promisc if num configured exceeds what we support */
1213
	if (netdev->flags & IFF_ALLMULTI ||
1214 1215
	    netdev_mc_count(netdev) > be_max_mc(adapter))
		goto set_mcast_promisc;
S
Sathya Perla 已提交
1216

1217 1218 1219 1220 1221 1222 1223 1224 1225
	if (netdev_uc_count(netdev) != adapter->uc_macs) {
		struct netdev_hw_addr *ha;
		int i = 1; /* First slot is claimed by the Primary MAC */

		for (; adapter->uc_macs > 0; adapter->uc_macs--, i++) {
			be_cmd_pmac_del(adapter, adapter->if_handle,
					adapter->pmac_id[i], 0);
		}

1226
		if (netdev_uc_count(netdev) > be_max_uc(adapter)) {
1227 1228 1229 1230 1231 1232 1233 1234 1235 1236 1237 1238 1239
			be_cmd_rx_filter(adapter, IFF_PROMISC, ON);
			adapter->promiscuous = true;
			goto done;
		}

		netdev_for_each_uc_addr(ha, adapter->netdev) {
			adapter->uc_macs++; /* First slot is for Primary MAC */
			be_cmd_pmac_add(adapter, (u8 *)ha->addr,
					adapter->if_handle,
					&adapter->pmac_id[adapter->uc_macs], 0);
		}
	}

1240
	status = be_cmd_rx_filter(adapter, IFF_MULTICAST, ON);
1241 1242 1243 1244
	if (!status) {
		if (adapter->flags & BE_FLAGS_MCAST_PROMISC)
			adapter->flags &= ~BE_FLAGS_MCAST_PROMISC;
		goto done;
1245
	}
1246 1247 1248 1249 1250 1251 1252 1253 1254 1255 1256

set_mcast_promisc:
	if (adapter->flags & BE_FLAGS_MCAST_PROMISC)
		return;

	/* Set to MCAST promisc mode if setting MULTICAST address fails
	 * or if num configured exceeds what we support
	 */
	status = be_cmd_rx_filter(adapter, IFF_ALLMULTI, ON);
	if (!status)
		adapter->flags |= BE_FLAGS_MCAST_PROMISC;
1257 1258
done:
	return;
S
Sathya Perla 已提交
1259 1260
}

1261 1262 1263
/* Program @mac as the MAC address of VF @vf.
 * Returns -EPERM when SR-IOV is not enabled, -EINVAL for an invalid MAC or
 * VF index, the be_cmd_status() translation of a failing FW command, or 0
 * on success (in which case the MAC is also cached in the VF's config).
 */
static int be_set_vf_mac(struct net_device *netdev, int vf, u8 *mac)
{
	struct be_adapter *adapter = netdev_priv(netdev);
	struct be_vf_cfg *vf_cfg = &adapter->vf_cfg[vf];
	int status;

	if (!sriov_enabled(adapter))
		return -EPERM;

	if (!is_valid_ether_addr(mac) || vf >= adapter->num_vfs)
		return -EINVAL;

	if (BEx_chip(adapter)) {
		/* On BEx the old pmac entry is deleted before adding the new */
		be_cmd_pmac_del(adapter, vf_cfg->if_handle, vf_cfg->pmac_id,
				vf + 1);

		status = be_cmd_pmac_add(adapter, mac, vf_cfg->if_handle,
					 &vf_cfg->pmac_id, vf + 1);
	} else {
		status = be_cmd_set_mac(adapter, mac, vf_cfg->if_handle,
					vf + 1);
	}

	if (status) {
		/* Terminate the message with a newline like every other log
		 * message in this file, so it is emitted as a complete line.
		 */
		dev_err(&adapter->pdev->dev,
			"MAC %pM set on VF %d Failed: %#x\n",
			mac, vf, status);
		return be_cmd_status(status);
	}

	ether_addr_copy(vf_cfg->mac_addr, mac);

	return 0;
}

1295
static int be_get_vf_config(struct net_device *netdev, int vf,
1296
			    struct ifla_vf_info *vi)
1297 1298
{
	struct be_adapter *adapter = netdev_priv(netdev);
1299
	struct be_vf_cfg *vf_cfg = &adapter->vf_cfg[vf];
1300

1301
	if (!sriov_enabled(adapter))
1302 1303
		return -EPERM;

1304
	if (vf >= adapter->num_vfs)
1305 1306 1307
		return -EINVAL;

	vi->vf = vf;
1308 1309
	vi->max_tx_rate = vf_cfg->tx_rate;
	vi->min_tx_rate = 0;
1310 1311
	vi->vlan = vf_cfg->vlan_tag & VLAN_VID_MASK;
	vi->qos = vf_cfg->vlan_tag >> VLAN_PRIO_SHIFT;
1312
	memcpy(&vi->mac, vf_cfg->mac_addr, ETH_ALEN);
1313
	vi->linkstate = adapter->vf_cfg[vf].plink_tracking;
1314 1315 1316 1317

	return 0;
}

1318
/* Configure (or, when both @vlan and @qos are 0, reset) the VLAN tag of
 * VF @vf. On success the combined vlan/qos value is cached in the VF's
 * config. Returns -EPERM without SR-IOV, -EINVAL for out-of-range
 * arguments, or the be_cmd_status() translation of a failing FW command.
 */
static int be_set_vf_vlan(struct net_device *netdev, int vf, u16 vlan, u8 qos)
{
	struct be_adapter *adapter = netdev_priv(netdev);
	struct be_vf_cfg *cfg = &adapter->vf_cfg[vf];
	int status = 0;

	if (!sriov_enabled(adapter))
		return -EPERM;

	if (vf >= adapter->num_vfs || vlan > 4095 || qos > 7)
		return -EINVAL;

	if (!vlan && !qos) {
		/* Reset Transparent Vlan Tagging. */
		status = be_cmd_set_hsw_config(adapter, BE_RESET_VLAN_TAG_ID,
					       vf + 1, cfg->if_handle, 0);
	} else {
		/* Fold the priority into the tag; skip the FW command when
		 * the resulting value is what is already cached.
		 */
		vlan |= qos << VLAN_PRIO_SHIFT;
		if (cfg->vlan_tag != vlan)
			status = be_cmd_set_hsw_config(adapter, vlan, vf + 1,
						       cfg->if_handle, 0);
	}

	if (status) {
		dev_err(&adapter->pdev->dev,
			"VLAN %d config on VF %d failed : %#x\n", vlan,
			vf, status);
		return be_cmd_status(status);
	}

	cfg->vlan_tag = vlan;

	return 0;
}

1353 1354
static int be_set_vf_tx_rate(struct net_device *netdev, int vf,
			     int min_tx_rate, int max_tx_rate)
1355 1356
{
	struct be_adapter *adapter = netdev_priv(netdev);
1357 1358 1359 1360
	struct device *dev = &adapter->pdev->dev;
	int percent_rate, status = 0;
	u16 link_speed = 0;
	u8 link_status;
1361

1362
	if (!sriov_enabled(adapter))
1363 1364
		return -EPERM;

1365
	if (vf >= adapter->num_vfs)
1366 1367
		return -EINVAL;

1368 1369 1370
	if (min_tx_rate)
		return -EINVAL;

1371 1372 1373 1374 1375 1376 1377 1378 1379 1380
	if (!max_tx_rate)
		goto config_qos;

	status = be_cmd_link_status_query(adapter, &link_speed,
					  &link_status, 0);
	if (status)
		goto err;

	if (!link_status) {
		dev_err(dev, "TX-rate setting not allowed when link is down\n");
1381
		status = -ENETDOWN;
1382 1383 1384 1385 1386 1387 1388 1389 1390 1391 1392 1393 1394 1395 1396 1397 1398
		goto err;
	}

	if (max_tx_rate < 100 || max_tx_rate > link_speed) {
		dev_err(dev, "TX-rate must be between 100 and %d Mbps\n",
			link_speed);
		status = -EINVAL;
		goto err;
	}

	/* On Skyhawk the QOS setting must be done only as a % value */
	percent_rate = link_speed / 100;
	if (skyhawk_chip(adapter) && (max_tx_rate % percent_rate)) {
		dev_err(dev, "TX-rate must be a multiple of %d Mbps\n",
			percent_rate);
		status = -EINVAL;
		goto err;
1399
	}
1400

1401 1402
config_qos:
	status = be_cmd_config_qos(adapter, max_tx_rate, link_speed, vf + 1);
1403
	if (status)
1404 1405 1406 1407 1408 1409 1410 1411
		goto err;

	adapter->vf_cfg[vf].tx_rate = max_tx_rate;
	return 0;

err:
	dev_err(dev, "TX-rate setting of %dMbps on VF%d failed\n",
		max_tx_rate, vf);
1412
	return be_cmd_status(status);
1413
}
1414 1415 1416 1417 1418 1419 1420 1421 1422 1423 1424 1425 1426
/* Set the logical link state of VF @vf and, on success, cache it in the
 * VF's plink_tracking field.
 * Returns -EPERM without SR-IOV, -EINVAL for a bad VF index, or the
 * be_cmd_status() translation of a failing FW command.
 */
static int be_set_vf_link_state(struct net_device *netdev, int vf,
				int link_state)
{
	struct be_adapter *adapter = netdev_priv(netdev);
	int status;

	if (!sriov_enabled(adapter))
		return -EPERM;

	if (vf >= adapter->num_vfs)
		return -EINVAL;

	status = be_cmd_set_logical_link_config(adapter, link_state, vf+1);
	if (!status) {
		adapter->vf_cfg[vf].plink_tracking = link_state;
		return 0;
	}

	dev_err(&adapter->pdev->dev,
		"Link state change on VF %d failed: %#x\n", vf, status);
	return be_cmd_status(status);
}
1437

1438 1439
/* Store the packet counters and timestamp of the current sample in @aic,
 * as the baseline for the next rate calculation.
 */
static void be_aic_update(struct be_aic_obj *aic, u64 rx_pkts, u64 tx_pkts,
			  ulong now)
{
	aic->jiffies = now;
	aic->tx_reqs_prev = tx_pkts;
	aic->rx_pkts_prev = rx_pkts;
}
1445

1446 1447 1448 1449 1450 1451 1452 1453 1454 1455 1456
static void be_eqd_update(struct be_adapter *adapter)
{
	struct be_set_eqd set_eqd[MAX_EVT_QS];
	int eqd, i, num = 0, start;
	struct be_aic_obj *aic;
	struct be_eq_obj *eqo;
	struct be_rx_obj *rxo;
	struct be_tx_obj *txo;
	u64 rx_pkts, tx_pkts;
	ulong now;
	u32 pps, delta;
S
Sathya Perla 已提交
1457

1458 1459 1460 1461 1462 1463 1464 1465
	for_all_evt_queues(adapter, eqo, i) {
		aic = &adapter->aic_obj[eqo->idx];
		if (!aic->enable) {
			if (aic->jiffies)
				aic->jiffies = 0;
			eqd = aic->et_eqd;
			goto modify_eqd;
		}
S
Sathya Perla 已提交
1466

1467 1468
		rxo = &adapter->rx_obj[eqo->idx];
		do {
1469
			start = u64_stats_fetch_begin_irq(&rxo->stats.sync);
1470
			rx_pkts = rxo->stats.rx_pkts;
1471
		} while (u64_stats_fetch_retry_irq(&rxo->stats.sync, start));
S
Sathya Perla 已提交
1472

1473 1474
		txo = &adapter->tx_obj[eqo->idx];
		do {
1475
			start = u64_stats_fetch_begin_irq(&txo->stats.sync);
1476
			tx_pkts = txo->stats.tx_reqs;
1477
		} while (u64_stats_fetch_retry_irq(&txo->stats.sync, start));
S
Sathya Perla 已提交
1478 1479


1480 1481 1482 1483 1484 1485 1486 1487 1488 1489 1490 1491 1492
		/* Skip, if wrapped around or first calculation */
		now = jiffies;
		if (!aic->jiffies || time_before(now, aic->jiffies) ||
		    rx_pkts < aic->rx_pkts_prev ||
		    tx_pkts < aic->tx_reqs_prev) {
			be_aic_update(aic, rx_pkts, tx_pkts, now);
			continue;
		}

		delta = jiffies_to_msecs(now - aic->jiffies);
		pps = (((u32)(rx_pkts - aic->rx_pkts_prev) * 1000) / delta) +
			(((u32)(tx_pkts - aic->tx_reqs_prev) * 1000) / delta);
		eqd = (pps / 15000) << 2;
S
Sathya Perla 已提交
1493

1494 1495 1496 1497 1498 1499
		if (eqd < 8)
			eqd = 0;
		eqd = min_t(u32, eqd, aic->max_eqd);
		eqd = max_t(u32, eqd, aic->min_eqd);

		be_aic_update(aic, rx_pkts, tx_pkts, now);
S
Sathya Perla 已提交
1500
modify_eqd:
1501 1502 1503 1504 1505 1506
		if (eqd != aic->prev_eqd) {
			set_eqd[num].delay_multiplier = (eqd * 65)/100;
			set_eqd[num].eq_id = eqo->q.id;
			aic->prev_eqd = eqd;
			num++;
		}
1507
	}
1508 1509 1510

	if (num)
		be_cmd_modify_eqd(adapter, set_eqd, num);
S
Sathya Perla 已提交
1511 1512
}

1513
static void be_rx_stats_update(struct be_rx_obj *rxo,
1514
			       struct be_rx_compl_info *rxcp)
1515
{
1516
	struct be_rx_stats *stats = rx_stats(rxo);
1517

1518
	u64_stats_update_begin(&stats->sync);
1519
	stats->rx_compl++;
1520
	stats->rx_bytes += rxcp->pkt_size;
1521
	stats->rx_pkts++;
1522
	if (rxcp->pkt_type == BE_MULTICAST_PACKET)
1523
		stats->rx_mcast_pkts++;
1524
	if (rxcp->err)
1525
		stats->rx_compl_err++;
1526
	u64_stats_update_end(&stats->sync);
1527 1528
}

1529
static inline bool csum_passed(struct be_rx_compl_info *rxcp)
1530
{
1531
	/* L4 checksum is not reliable for non TCP/UDP packets.
1532 1533
	 * Also ignore ipcksm for ipv6 pkts
	 */
1534
	return (rxcp->tcpf || rxcp->udpf) && rxcp->l4_csum &&
1535
		(rxcp->ip_csum || rxcp->ipv6) && !rxcp->err;
1536 1537
}

1538
static struct be_rx_page_info *get_rx_page_info(struct be_rx_obj *rxo)
S
Sathya Perla 已提交
1539
{
S
Sathya Perla 已提交
1540
	struct be_adapter *adapter = rxo->adapter;
S
Sathya Perla 已提交
1541
	struct be_rx_page_info *rx_page_info;
1542
	struct be_queue_info *rxq = &rxo->q;
1543
	u16 frag_idx = rxq->tail;
S
Sathya Perla 已提交
1544

1545
	rx_page_info = &rxo->page_info_tbl[frag_idx];
S
Sathya Perla 已提交
1546 1547
	BUG_ON(!rx_page_info->page);

1548
	if (rx_page_info->last_frag) {
I
Ivan Vecera 已提交
1549 1550 1551
		dma_unmap_page(&adapter->pdev->dev,
			       dma_unmap_addr(rx_page_info, bus),
			       adapter->big_page_size, DMA_FROM_DEVICE);
1552 1553 1554 1555 1556
		rx_page_info->last_frag = false;
	} else {
		dma_sync_single_for_cpu(&adapter->pdev->dev,
					dma_unmap_addr(rx_page_info, bus),
					rx_frag_size, DMA_FROM_DEVICE);
A
Ajit Khaparde 已提交
1557
	}
S
Sathya Perla 已提交
1558

1559
	queue_tail_inc(rxq);
S
Sathya Perla 已提交
1560 1561 1562 1563 1564
	atomic_dec(&rxq->used);
	return rx_page_info;
}

/* Throwaway the data in the Rx completion */
S
Sathya Perla 已提交
1565 1566
static void be_rx_compl_discard(struct be_rx_obj *rxo,
				struct be_rx_compl_info *rxcp)
S
Sathya Perla 已提交
1567 1568
{
	struct be_rx_page_info *page_info;
1569
	u16 i, num_rcvd = rxcp->num_rcvd;
S
Sathya Perla 已提交
1570

1571
	for (i = 0; i < num_rcvd; i++) {
1572
		page_info = get_rx_page_info(rxo);
1573 1574
		put_page(page_info->page);
		memset(page_info, 0, sizeof(*page_info));
S
Sathya Perla 已提交
1575 1576 1577 1578 1579 1580 1581
	}
}

/*
 * skb_fill_rx_data forms a complete skb for an ether frame
 * indicated by rxcp.
 */
S
Sathya Perla 已提交
1582 1583
static void skb_fill_rx_data(struct be_rx_obj *rxo, struct sk_buff *skb,
			     struct be_rx_compl_info *rxcp)
S
Sathya Perla 已提交
1584 1585
{
	struct be_rx_page_info *page_info;
1586 1587
	u16 i, j;
	u16 hdr_len, curr_frag_len, remaining;
S
Sathya Perla 已提交
1588 1589
	u8 *start;

1590
	page_info = get_rx_page_info(rxo);
S
Sathya Perla 已提交
1591 1592 1593 1594
	start = page_address(page_info->page) + page_info->page_offset;
	prefetch(start);

	/* Copy data in the first descriptor of this completion */
1595
	curr_frag_len = min(rxcp->pkt_size, rx_frag_size);
S
Sathya Perla 已提交
1596 1597 1598

	skb->len = curr_frag_len;
	if (curr_frag_len <= BE_HDR_LEN) { /* tiny packet */
1599
		memcpy(skb->data, start, curr_frag_len);
S
Sathya Perla 已提交
1600 1601 1602 1603 1604
		/* Complete packet has now been moved to data */
		put_page(page_info->page);
		skb->data_len = 0;
		skb->tail += curr_frag_len;
	} else {
1605 1606
		hdr_len = ETH_HLEN;
		memcpy(skb->data, start, hdr_len);
S
Sathya Perla 已提交
1607
		skb_shinfo(skb)->nr_frags = 1;
1608
		skb_frag_set_page(skb, 0, page_info->page);
S
Sathya Perla 已提交
1609 1610
		skb_shinfo(skb)->frags[0].page_offset =
					page_info->page_offset + hdr_len;
1611 1612
		skb_frag_size_set(&skb_shinfo(skb)->frags[0],
				  curr_frag_len - hdr_len);
S
Sathya Perla 已提交
1613
		skb->data_len = curr_frag_len - hdr_len;
E
Eric Dumazet 已提交
1614
		skb->truesize += rx_frag_size;
S
Sathya Perla 已提交
1615 1616
		skb->tail += hdr_len;
	}
A
Ajit Khaparde 已提交
1617
	page_info->page = NULL;
S
Sathya Perla 已提交
1618

1619 1620 1621
	if (rxcp->pkt_size <= rx_frag_size) {
		BUG_ON(rxcp->num_rcvd != 1);
		return;
S
Sathya Perla 已提交
1622 1623 1624
	}

	/* More frags present for this completion */
1625 1626
	remaining = rxcp->pkt_size - curr_frag_len;
	for (i = 1, j = 0; i < rxcp->num_rcvd; i++) {
1627
		page_info = get_rx_page_info(rxo);
1628
		curr_frag_len = min(remaining, rx_frag_size);
S
Sathya Perla 已提交
1629

1630 1631 1632 1633
		/* Coalesce all frags from the same physical page in one slot */
		if (page_info->page_offset == 0) {
			/* Fresh page */
			j++;
1634
			skb_frag_set_page(skb, j, page_info->page);
1635 1636
			skb_shinfo(skb)->frags[j].page_offset =
							page_info->page_offset;
E
Eric Dumazet 已提交
1637
			skb_frag_size_set(&skb_shinfo(skb)->frags[j], 0);
1638 1639 1640 1641 1642
			skb_shinfo(skb)->nr_frags++;
		} else {
			put_page(page_info->page);
		}

E
Eric Dumazet 已提交
1643
		skb_frag_size_add(&skb_shinfo(skb)->frags[j], curr_frag_len);
S
Sathya Perla 已提交
1644 1645
		skb->len += curr_frag_len;
		skb->data_len += curr_frag_len;
E
Eric Dumazet 已提交
1646
		skb->truesize += rx_frag_size;
1647
		remaining -= curr_frag_len;
A
Ajit Khaparde 已提交
1648
		page_info->page = NULL;
S
Sathya Perla 已提交
1649
	}
1650
	BUG_ON(j > MAX_SKB_FRAGS);
S
Sathya Perla 已提交
1651 1652
}

1653
/* Process the RX completion indicated by rxcp when GRO is disabled */
1654
static void be_rx_compl_process(struct be_rx_obj *rxo, struct napi_struct *napi,
S
Sathya Perla 已提交
1655
				struct be_rx_compl_info *rxcp)
S
Sathya Perla 已提交
1656
{
S
Sathya Perla 已提交
1657
	struct be_adapter *adapter = rxo->adapter;
1658
	struct net_device *netdev = adapter->netdev;
S
Sathya Perla 已提交
1659
	struct sk_buff *skb;
1660

1661
	skb = netdev_alloc_skb_ip_align(netdev, BE_RX_SKB_ALLOC_SIZE);
1662
	if (unlikely(!skb)) {
1663
		rx_stats(rxo)->rx_drops_no_skbs++;
S
Sathya Perla 已提交
1664
		be_rx_compl_discard(rxo, rxcp);
S
Sathya Perla 已提交
1665 1666 1667
		return;
	}

S
Sathya Perla 已提交
1668
	skb_fill_rx_data(rxo, skb, rxcp);
S
Sathya Perla 已提交
1669

1670
	if (likely((netdev->features & NETIF_F_RXCSUM) && csum_passed(rxcp)))
1671
		skb->ip_summed = CHECKSUM_UNNECESSARY;
S
Somnath Kotur 已提交
1672 1673
	else
		skb_checksum_none_assert(skb);
S
Sathya Perla 已提交
1674

1675
	skb->protocol = eth_type_trans(skb, netdev);
1676
	skb_record_rx_queue(skb, rxo - &adapter->rx_obj[0]);
S
Sathya Perla 已提交
1677
	if (netdev->features & NETIF_F_RXHASH)
T
Tom Herbert 已提交
1678
		skb_set_hash(skb, rxcp->rss_hash, PKT_HASH_TYPE_L3);
1679 1680

	skb->encapsulation = rxcp->tunneled;
1681
	skb_mark_napi_id(skb, napi);
S
Sathya Perla 已提交
1682

1683
	if (rxcp->vlanf)
1684
		__vlan_hwaccel_put_tag(skb, htons(ETH_P_8021Q), rxcp->vlan_tag);
A
Ajit Khaparde 已提交
1685 1686

	netif_receive_skb(skb);
S
Sathya Perla 已提交
1687 1688
}

1689
/* Process the RX completion indicated by rxcp when GRO is enabled */
J
Jingoo Han 已提交
1690 1691 1692
static void be_rx_compl_process_gro(struct be_rx_obj *rxo,
				    struct napi_struct *napi,
				    struct be_rx_compl_info *rxcp)
S
Sathya Perla 已提交
1693
{
S
Sathya Perla 已提交
1694
	struct be_adapter *adapter = rxo->adapter;
S
Sathya Perla 已提交
1695
	struct be_rx_page_info *page_info;
1696
	struct sk_buff *skb = NULL;
1697 1698
	u16 remaining, curr_frag_len;
	u16 i, j;
1699

S
Sathya Perla 已提交
1700
	skb = napi_get_frags(napi);
1701
	if (!skb) {
S
Sathya Perla 已提交
1702
		be_rx_compl_discard(rxo, rxcp);
1703 1704 1705
		return;
	}

1706 1707
	remaining = rxcp->pkt_size;
	for (i = 0, j = -1; i < rxcp->num_rcvd; i++) {
1708
		page_info = get_rx_page_info(rxo);
S
Sathya Perla 已提交
1709 1710 1711

		curr_frag_len = min(remaining, rx_frag_size);

1712 1713 1714 1715
		/* Coalesce all frags from the same physical page in one slot */
		if (i == 0 || page_info->page_offset == 0) {
			/* First frag or Fresh page */
			j++;
1716
			skb_frag_set_page(skb, j, page_info->page);
1717 1718
			skb_shinfo(skb)->frags[j].page_offset =
							page_info->page_offset;
E
Eric Dumazet 已提交
1719
			skb_frag_size_set(&skb_shinfo(skb)->frags[j], 0);
1720 1721 1722
		} else {
			put_page(page_info->page);
		}
E
Eric Dumazet 已提交
1723
		skb_frag_size_add(&skb_shinfo(skb)->frags[j], curr_frag_len);
E
Eric Dumazet 已提交
1724
		skb->truesize += rx_frag_size;
1725
		remaining -= curr_frag_len;
S
Sathya Perla 已提交
1726 1727
		memset(page_info, 0, sizeof(*page_info));
	}
1728
	BUG_ON(j > MAX_SKB_FRAGS);
S
Sathya Perla 已提交
1729

1730
	skb_shinfo(skb)->nr_frags = j + 1;
1731 1732
	skb->len = rxcp->pkt_size;
	skb->data_len = rxcp->pkt_size;
1733
	skb->ip_summed = CHECKSUM_UNNECESSARY;
1734
	skb_record_rx_queue(skb, rxo - &adapter->rx_obj[0]);
A
Ajit Khaparde 已提交
1735
	if (adapter->netdev->features & NETIF_F_RXHASH)
T
Tom Herbert 已提交
1736
		skb_set_hash(skb, rxcp->rss_hash, PKT_HASH_TYPE_L3);
1737 1738

	skb->encapsulation = rxcp->tunneled;
1739
	skb_mark_napi_id(skb, napi);
1740

1741
	if (rxcp->vlanf)
1742
		__vlan_hwaccel_put_tag(skb, htons(ETH_P_8021Q), rxcp->vlan_tag);
A
Ajit Khaparde 已提交
1743

S
Sathya Perla 已提交
1744
	napi_gro_frags(napi);
1745 1746
}

S
Sathya Perla 已提交
1747 1748
static void be_parse_rx_compl_v1(struct be_eth_rx_compl *compl,
				 struct be_rx_compl_info *rxcp)
1749 1750 1751 1752 1753 1754
{
	rxcp->pkt_size =
		AMAP_GET_BITS(struct amap_eth_rx_compl_v1, pktsize, compl);
	rxcp->vlanf = AMAP_GET_BITS(struct amap_eth_rx_compl_v1, vtp, compl);
	rxcp->err = AMAP_GET_BITS(struct amap_eth_rx_compl_v1, err, compl);
	rxcp->tcpf = AMAP_GET_BITS(struct amap_eth_rx_compl_v1, tcpf, compl);
1755
	rxcp->udpf = AMAP_GET_BITS(struct amap_eth_rx_compl_v1, udpf, compl);
1756 1757 1758 1759 1760 1761 1762 1763 1764 1765
	rxcp->ip_csum =
		AMAP_GET_BITS(struct amap_eth_rx_compl_v1, ipcksm, compl);
	rxcp->l4_csum =
		AMAP_GET_BITS(struct amap_eth_rx_compl_v1, l4_cksm, compl);
	rxcp->ipv6 =
		AMAP_GET_BITS(struct amap_eth_rx_compl_v1, ip_version, compl);
	rxcp->num_rcvd =
		AMAP_GET_BITS(struct amap_eth_rx_compl_v1, numfrags, compl);
	rxcp->pkt_type =
		AMAP_GET_BITS(struct amap_eth_rx_compl_v1, cast_enc, compl);
A
Ajit Khaparde 已提交
1766
	rxcp->rss_hash =
1767
		AMAP_GET_BITS(struct amap_eth_rx_compl_v1, rsshash, compl);
1768
	if (rxcp->vlanf) {
1769
		rxcp->qnq = AMAP_GET_BITS(struct amap_eth_rx_compl_v1, qnq,
1770
					  compl);
1771 1772
		rxcp->vlan_tag = AMAP_GET_BITS(struct amap_eth_rx_compl_v1,
					       vlan_tag, compl);
1773
	}
1774
	rxcp->port = AMAP_GET_BITS(struct amap_eth_rx_compl_v1, port, compl);
1775 1776
	rxcp->tunneled =
		AMAP_GET_BITS(struct amap_eth_rx_compl_v1, tunneled, compl);
1777 1778
}

S
Sathya Perla 已提交
1779 1780
static void be_parse_rx_compl_v0(struct be_eth_rx_compl *compl,
				 struct be_rx_compl_info *rxcp)
1781 1782 1783 1784 1785 1786
{
	rxcp->pkt_size =
		AMAP_GET_BITS(struct amap_eth_rx_compl_v0, pktsize, compl);
	rxcp->vlanf = AMAP_GET_BITS(struct amap_eth_rx_compl_v0, vtp, compl);
	rxcp->err = AMAP_GET_BITS(struct amap_eth_rx_compl_v0, err, compl);
	rxcp->tcpf = AMAP_GET_BITS(struct amap_eth_rx_compl_v0, tcpf, compl);
1787
	rxcp->udpf = AMAP_GET_BITS(struct amap_eth_rx_compl_v0, udpf, compl);
1788 1789 1790 1791 1792 1793 1794 1795 1796 1797
	rxcp->ip_csum =
		AMAP_GET_BITS(struct amap_eth_rx_compl_v0, ipcksm, compl);
	rxcp->l4_csum =
		AMAP_GET_BITS(struct amap_eth_rx_compl_v0, l4_cksm, compl);
	rxcp->ipv6 =
		AMAP_GET_BITS(struct amap_eth_rx_compl_v0, ip_version, compl);
	rxcp->num_rcvd =
		AMAP_GET_BITS(struct amap_eth_rx_compl_v0, numfrags, compl);
	rxcp->pkt_type =
		AMAP_GET_BITS(struct amap_eth_rx_compl_v0, cast_enc, compl);
A
Ajit Khaparde 已提交
1798
	rxcp->rss_hash =
1799
		AMAP_GET_BITS(struct amap_eth_rx_compl_v0, rsshash, compl);
1800
	if (rxcp->vlanf) {
1801
		rxcp->qnq = AMAP_GET_BITS(struct amap_eth_rx_compl_v0, qnq,
1802
					  compl);
1803 1804
		rxcp->vlan_tag = AMAP_GET_BITS(struct amap_eth_rx_compl_v0,
					       vlan_tag, compl);
1805
	}
1806
	rxcp->port = AMAP_GET_BITS(struct amap_eth_rx_compl_v0, port, compl);
1807 1808
	rxcp->ip_frag = AMAP_GET_BITS(struct amap_eth_rx_compl_v0,
				      ip_frag, compl);
1809 1810 1811 1812 1813 1814 1815
}

static struct be_rx_compl_info *be_rx_compl_get(struct be_rx_obj *rxo)
{
	struct be_eth_rx_compl *compl = queue_tail_node(&rxo->cq);
	struct be_rx_compl_info *rxcp = &rxo->rxcp;
	struct be_adapter *adapter = rxo->adapter;
S
Sathya Perla 已提交
1816

1817 1818 1819 1820
	/* For checking the valid bit it is Ok to use either definition as the
	 * valid bit is at the same position in both v0 and v1 Rx compl */
	if (compl->dw[offsetof(struct amap_eth_rx_compl_v1, valid) / 32] == 0)
		return NULL;
S
Sathya Perla 已提交
1821

1822 1823
	rmb();
	be_dws_le_to_cpu(compl, sizeof(*compl));
S
Sathya Perla 已提交
1824

1825
	if (adapter->be3_native)
S
Sathya Perla 已提交
1826
		be_parse_rx_compl_v1(compl, rxcp);
1827
	else
S
Sathya Perla 已提交
1828
		be_parse_rx_compl_v0(compl, rxcp);
S
Sathya Perla 已提交
1829

1830 1831 1832
	if (rxcp->ip_frag)
		rxcp->l4_csum = 0;

1833
	if (rxcp->vlanf) {
1834 1835 1836 1837 1838
		/* In QNQ modes, if qnq bit is not set, then the packet was
		 * tagged only with the transparent outer vlan-tag and must
		 * not be treated as a vlan packet by host
		 */
		if (be_is_qnq_mode(adapter) && !rxcp->qnq)
1839
			rxcp->vlanf = 0;
S
Sathya Perla 已提交
1840

1841
		if (!lancer_chip(adapter))
1842
			rxcp->vlan_tag = swab16(rxcp->vlan_tag);
S
Sathya Perla 已提交
1843

1844
		if (adapter->pvid == (rxcp->vlan_tag & VLAN_VID_MASK) &&
1845
		    !test_bit(rxcp->vlan_tag, adapter->vids))
1846 1847
			rxcp->vlanf = 0;
	}
1848 1849 1850

	/* As the compl has been parsed, reset it; we wont touch it again */
	compl->dw[offsetof(struct amap_eth_rx_compl_v1, valid) / 32] = 0;
S
Sathya Perla 已提交
1851

1852
	queue_tail_inc(&rxo->cq);
S
Sathya Perla 已提交
1853 1854 1855
	return rxcp;
}

1856
/* Allocate enough contiguous pages to hold @size bytes.
 *
 * The allocation order is derived from @size with get_order(); for
 * multi-page allocations __GFP_COMP is added to @gfp. Returns whatever
 * alloc_pages() returns, so callers must check for NULL.
 */
static inline struct page *be_alloc_pages(u32 size, gfp_t gfp)
{
	u32 order = get_order(size);

	if (order > 0)
		gfp |= __GFP_COMP;
	return alloc_pages(gfp, order);
}

/*
 * Allocate a page, split it to fragments of size rx_frag_size and post as
 * receive buffers to BE
 */
1869
static void be_post_rx_frags(struct be_rx_obj *rxo, gfp_t gfp)
S
Sathya Perla 已提交
1870
{
1871
	struct be_adapter *adapter = rxo->adapter;
1872
	struct be_rx_page_info *page_info = NULL, *prev_page_info = NULL;
1873
	struct be_queue_info *rxq = &rxo->q;
S
Sathya Perla 已提交
1874
	struct page *pagep = NULL;
1875
	struct device *dev = &adapter->pdev->dev;
S
Sathya Perla 已提交
1876 1877 1878 1879
	struct be_eth_rx_d *rxd;
	u64 page_dmaaddr = 0, frag_dmaaddr;
	u32 posted, page_offset = 0;

1880
	page_info = &rxo->page_info_tbl[rxq->head];
S
Sathya Perla 已提交
1881 1882
	for (posted = 0; posted < MAX_RX_POST && !page_info->page; posted++) {
		if (!pagep) {
1883
			pagep = be_alloc_pages(adapter->big_page_size, gfp);
S
Sathya Perla 已提交
1884
			if (unlikely(!pagep)) {
1885
				rx_stats(rxo)->rx_post_fail++;
S
Sathya Perla 已提交
1886 1887
				break;
			}
1888 1889
			page_dmaaddr = dma_map_page(dev, pagep, 0,
						    adapter->big_page_size,
I
Ivan Vecera 已提交
1890
						    DMA_FROM_DEVICE);
1891 1892 1893 1894 1895 1896
			if (dma_mapping_error(dev, page_dmaaddr)) {
				put_page(pagep);
				pagep = NULL;
				rx_stats(rxo)->rx_post_fail++;
				break;
			}
1897
			page_offset = 0;
S
Sathya Perla 已提交
1898 1899
		} else {
			get_page(pagep);
1900
			page_offset += rx_frag_size;
S
Sathya Perla 已提交
1901
		}
1902
		page_info->page_offset = page_offset;
S
Sathya Perla 已提交
1903 1904 1905
		page_info->page = pagep;

		rxd = queue_head_node(rxq);
1906
		frag_dmaaddr = page_dmaaddr + page_info->page_offset;
S
Sathya Perla 已提交
1907 1908 1909 1910 1911 1912 1913
		rxd->fragpa_lo = cpu_to_le32(frag_dmaaddr & 0xFFFFFFFF);
		rxd->fragpa_hi = cpu_to_le32(upper_32_bits(frag_dmaaddr));

		/* Any space left in the current big page for another frag? */
		if ((page_offset + rx_frag_size + rx_frag_size) >
					adapter->big_page_size) {
			pagep = NULL;
1914 1915 1916 1917
			page_info->last_frag = true;
			dma_unmap_addr_set(page_info, bus, page_dmaaddr);
		} else {
			dma_unmap_addr_set(page_info, bus, frag_dmaaddr);
S
Sathya Perla 已提交
1918
		}
1919 1920 1921

		prev_page_info = page_info;
		queue_head_inc(rxq);
S
Sathya Perla 已提交
1922
		page_info = &rxo->page_info_tbl[rxq->head];
S
Sathya Perla 已提交
1923
	}
1924 1925 1926 1927 1928 1929 1930 1931

	/* Mark the last frag of a page when we break out of the above loop
	 * with no more slots available in the RXQ
	 */
	if (pagep) {
		prev_page_info->last_frag = true;
		dma_unmap_addr_set(prev_page_info, bus, page_dmaaddr);
	}
S
Sathya Perla 已提交
1932 1933 1934

	if (posted) {
		atomic_add(posted, &rxq->used);
1935 1936
		if (rxo->rx_post_starved)
			rxo->rx_post_starved = false;
1937
		be_rxq_notify(adapter, rxq->id, posted);
1938 1939
	} else if (atomic_read(&rxq->used) == 0) {
		/* Let be_worker replenish when memory is available */
1940
		rxo->rx_post_starved = true;
S
Sathya Perla 已提交
1941 1942 1943
	}
}

1944
static struct be_eth_tx_compl *be_tx_compl_get(struct be_queue_info *tx_cq)
S
Sathya Perla 已提交
1945 1946 1947 1948 1949 1950
{
	struct be_eth_tx_compl *txcp = queue_tail_node(tx_cq);

	if (txcp->dw[offsetof(struct amap_eth_tx_compl, valid) / 32] == 0)
		return NULL;

1951
	rmb();
S
Sathya Perla 已提交
1952 1953 1954 1955 1956 1957 1958 1959
	be_dws_le_to_cpu(txcp, sizeof(*txcp));

	txcp->dw[offsetof(struct amap_eth_tx_compl, valid) / 32] = 0;

	queue_tail_inc(tx_cq);
	return txcp;
}

1960
/* Reclaim the WRBs of one transmitted skb.
 *
 * Starting at the TXQ tail, the header wrb is skipped and every following
 * wrb up to and including @last_index is unmapped; the skb recorded at
 * the original tail slot is then freed.
 *
 * Returns the number of wrbs consumed, header wrb included. The caller is
 * responsible for subtracting that count from txq->used.
 */
static u16 be_tx_compl_process(struct be_adapter *adapter,
			       struct be_tx_obj *txo, u16 last_index)
{
	struct be_queue_info *txq = &txo->q;
	struct be_eth_wrb *wrb;
	struct sk_buff **sent_skbs = txo->sent_skb_list;
	struct sk_buff *sent_skb;
	u16 cur_index, num_wrbs = 1; /* account for hdr wrb */
	bool unmap_skb_hdr = true;

	sent_skb = sent_skbs[txq->tail];
	BUG_ON(!sent_skb);
	sent_skbs[txq->tail] = NULL;

	/* skip header wrb */
	queue_tail_inc(txq);

	do {
		cur_index = txq->tail;
		wrb = queue_tail_node(txq);
		/* Only the first data wrb can describe the skb's linear part */
		unmap_tx_frag(&adapter->pdev->dev, wrb,
			      (unmap_skb_hdr && skb_headlen(sent_skb)));
		unmap_skb_hdr = false;

		num_wrbs++;
		queue_tail_inc(txq);
	} while (cur_index != last_index);

	dev_kfree_skb_any(sent_skb);
	return num_wrbs;
}

S
Sathya Perla 已提交
1992 1993
/* Return the number of events in the event queue */
static inline int events_get(struct be_eq_obj *eqo)
1994
{
S
Sathya Perla 已提交
1995 1996
	struct be_eq_entry *eqe;
	int num = 0;
1997

S
Sathya Perla 已提交
1998 1999 2000 2001
	do {
		eqe = queue_tail_node(&eqo->q);
		if (eqe->evt == 0)
			break;
2002

S
Sathya Perla 已提交
2003 2004 2005 2006 2007 2008 2009
		rmb();
		eqe->evt = 0;
		num++;
		queue_tail_inc(&eqo->q);
	} while (true);

	return num;
2010 2011
}

S
Sathya Perla 已提交
2012 2013
/* Leaves the EQ is disarmed state */
static void be_eq_clean(struct be_eq_obj *eqo)
2014
{
S
Sathya Perla 已提交
2015
	int num = events_get(eqo);
2016

S
Sathya Perla 已提交
2017
	be_eq_notify(eqo->adapter, eqo->q.id, false, true, num);
2018 2019
}

S
Sathya Perla 已提交
2020
static void be_rx_cq_clean(struct be_rx_obj *rxo)
S
Sathya Perla 已提交
2021 2022
{
	struct be_rx_page_info *page_info;
2023 2024
	struct be_queue_info *rxq = &rxo->q;
	struct be_queue_info *rx_cq = &rxo->cq;
2025
	struct be_rx_compl_info *rxcp;
2026 2027
	struct be_adapter *adapter = rxo->adapter;
	int flush_wait = 0;
S
Sathya Perla 已提交
2028

2029 2030 2031 2032 2033 2034 2035 2036
	/* Consume pending rx completions.
	 * Wait for the flush completion (identified by zero num_rcvd)
	 * to arrive. Notify CQ even when there are no more CQ entries
	 * for HW to flush partially coalesced CQ entries.
	 * In Lancer, there is no need to wait for flush compl.
	 */
	for (;;) {
		rxcp = be_rx_compl_get(rxo);
K
Kalesh AP 已提交
2037
		if (!rxcp) {
2038 2039 2040 2041 2042 2043 2044 2045 2046 2047 2048 2049
			if (lancer_chip(adapter))
				break;

			if (flush_wait++ > 10 || be_hw_error(adapter)) {
				dev_warn(&adapter->pdev->dev,
					 "did not receive flush compl\n");
				break;
			}
			be_cq_notify(adapter, rx_cq->id, true, 0);
			mdelay(1);
		} else {
			be_rx_compl_discard(rxo, rxcp);
2050
			be_cq_notify(adapter, rx_cq->id, false, 1);
2051 2052 2053
			if (rxcp->num_rcvd == 0)
				break;
		}
S
Sathya Perla 已提交
2054 2055
	}

2056 2057 2058 2059
	/* After cleanup, leave the CQ in unarmed state */
	be_cq_notify(adapter, rx_cq->id, false, 0);

	/* Then free posted rx buffers that were not used */
2060 2061
	while (atomic_read(&rxq->used) > 0) {
		page_info = get_rx_page_info(rxo);
S
Sathya Perla 已提交
2062 2063 2064 2065
		put_page(page_info->page);
		memset(page_info, 0, sizeof(*page_info));
	}
	BUG_ON(atomic_read(&rxq->used));
2066
	rxq->tail = rxq->head = 0;
S
Sathya Perla 已提交
2067 2068
}

S
Sathya Perla 已提交
2069
static void be_tx_compl_clean(struct be_adapter *adapter)
S
Sathya Perla 已提交
2070
{
S
Sathya Perla 已提交
2071 2072
	struct be_tx_obj *txo;
	struct be_queue_info *txq;
2073
	struct be_eth_tx_compl *txcp;
2074
	u16 end_idx, cmpl = 0, timeo = 0, num_wrbs = 0;
2075 2076
	struct sk_buff *sent_skb;
	bool dummy_wrb;
S
Sathya Perla 已提交
2077
	int i, pending_txqs;
2078

2079
	/* Stop polling for compls when HW has been silent for 10ms */
2080
	do {
S
Sathya Perla 已提交
2081 2082 2083
		pending_txqs = adapter->num_tx_qs;

		for_all_tx_queues(adapter, txo, i) {
2084 2085
			cmpl = 0;
			num_wrbs = 0;
S
Sathya Perla 已提交
2086 2087 2088 2089 2090 2091 2092 2093 2094 2095 2096 2097
			txq = &txo->q;
			while ((txcp = be_tx_compl_get(&txo->cq))) {
				end_idx =
					AMAP_GET_BITS(struct amap_eth_tx_compl,
						      wrb_index, txcp);
				num_wrbs += be_tx_compl_process(adapter, txo,
								end_idx);
				cmpl++;
			}
			if (cmpl) {
				be_cq_notify(adapter, txo->cq.id, false, cmpl);
				atomic_sub(num_wrbs, &txq->used);
2098
				timeo = 0;
S
Sathya Perla 已提交
2099 2100 2101
			}
			if (atomic_read(&txq->used) == 0)
				pending_txqs--;
2102 2103
		}

2104
		if (pending_txqs == 0 || ++timeo > 10 || be_hw_error(adapter))
2105 2106 2107 2108 2109
			break;

		mdelay(1);
	} while (true);

S
Sathya Perla 已提交
2110 2111 2112 2113 2114 2115 2116 2117 2118 2119 2120 2121 2122 2123 2124 2125
	for_all_tx_queues(adapter, txo, i) {
		txq = &txo->q;
		if (atomic_read(&txq->used))
			dev_err(&adapter->pdev->dev, "%d pending tx-compls\n",
				atomic_read(&txq->used));

		/* free posted tx for which compls will never arrive */
		while (atomic_read(&txq->used)) {
			sent_skb = txo->sent_skb_list[txq->tail];
			end_idx = txq->tail;
			num_wrbs = wrb_cnt_for_skb(adapter, sent_skb,
						   &dummy_wrb);
			index_adv(&end_idx, num_wrbs - 1, txq->len);
			num_wrbs = be_tx_compl_process(adapter, txo, end_idx);
			atomic_sub(num_wrbs, &txq->used);
		}
2126
	}
S
Sathya Perla 已提交
2127 2128
}

S
Sathya Perla 已提交
2129 2130 2131 2132 2133 2134
/* Tear down every event queue of @adapter.
 *
 * For queues that were created in hardware, pending events are cleaned,
 * the EQ is destroyed and its NAPI context is unregistered. The queue
 * memory is freed for every EQ regardless of its created state.
 */
static void be_evt_queues_destroy(struct be_adapter *adapter)
{
	struct be_eq_obj *eqo;
	int i;

	for_all_evt_queues(adapter, eqo, i) {
		if (eqo->q.created) {
			be_eq_clean(eqo);
			be_cmd_q_destroy(adapter, &eqo->q, QTYPE_EQ);
			napi_hash_del(&eqo->napi);
			netif_napi_del(&eqo->napi);
		}
		be_queue_free(adapter, &eqo->q);
	}
}

static int be_evt_queues_create(struct be_adapter *adapter)
{
	struct be_queue_info *eq;
	struct be_eq_obj *eqo;
2149
	struct be_aic_obj *aic;
S
Sathya Perla 已提交
2150 2151
	int i, rc;

2152 2153
	adapter->num_evt_qs = min_t(u16, num_irqs(adapter),
				    adapter->cfg_num_qs);
S
Sathya Perla 已提交
2154 2155

	for_all_evt_queues(adapter, eqo, i) {
2156 2157
		netif_napi_add(adapter->netdev, &eqo->napi, be_poll,
			       BE_NAPI_WEIGHT);
2158
		napi_hash_add(&eqo->napi);
2159
		aic = &adapter->aic_obj[i];
S
Sathya Perla 已提交
2160 2161 2162
		eqo->adapter = adapter;
		eqo->tx_budget = BE_TX_BUDGET;
		eqo->idx = i;
2163 2164
		aic->max_eqd = BE_MAX_EQD;
		aic->enable = true;
S
Sathya Perla 已提交
2165 2166 2167

		eq = &eqo->q;
		rc = be_queue_alloc(adapter, eq, EVNT_Q_LEN,
2168
				    sizeof(struct be_eq_entry));
S
Sathya Perla 已提交
2169 2170 2171
		if (rc)
			return rc;

S
Sathya Perla 已提交
2172
		rc = be_cmd_eq_create(adapter, eqo);
S
Sathya Perla 已提交
2173 2174 2175
		if (rc)
			return rc;
	}
2176
	return 0;
S
Sathya Perla 已提交
2177 2178
}

2179 2180 2181 2182
static void be_mcc_queues_destroy(struct be_adapter *adapter)
{
	struct be_queue_info *q;

2183
	q = &adapter->mcc_obj.q;
2184
	if (q->created)
2185
		be_cmd_q_destroy(adapter, q, QTYPE_MCCQ);
2186 2187
	be_queue_free(adapter, q);

2188
	q = &adapter->mcc_obj.cq;
2189
	if (q->created)
2190
		be_cmd_q_destroy(adapter, q, QTYPE_CQ);
2191 2192 2193 2194 2195 2196 2197 2198
	be_queue_free(adapter, q);
}

/* Must be called only after TX qs are created as MCC shares TX EQ */
static int be_mcc_queues_create(struct be_adapter *adapter)
{
	struct be_queue_info *q, *cq;

2199
	cq = &adapter->mcc_obj.cq;
2200
	if (be_queue_alloc(adapter, cq, MCC_CQ_LEN,
2201
			   sizeof(struct be_mcc_compl)))
2202 2203
		goto err;

S
Sathya Perla 已提交
2204 2205
	/* Use the default EQ for MCC completions */
	if (be_cmd_cq_create(adapter, cq, &mcc_eqo(adapter)->q, true, 0))
2206 2207
		goto mcc_cq_free;

2208
	q = &adapter->mcc_obj.q;
2209 2210 2211
	if (be_queue_alloc(adapter, q, MCC_Q_LEN, sizeof(struct be_mcc_wrb)))
		goto mcc_cq_destroy;

2212
	if (be_cmd_mccq_create(adapter, q, cq))
2213 2214 2215 2216 2217 2218 2219
		goto mcc_q_free;

	return 0;

mcc_q_free:
	be_queue_free(adapter, q);
mcc_cq_destroy:
2220
	be_cmd_q_destroy(adapter, cq, QTYPE_CQ);
2221 2222 2223 2224 2225 2226
mcc_cq_free:
	be_queue_free(adapter, cq);
err:
	return -1;
}

S
Sathya Perla 已提交
2227 2228 2229
static void be_tx_queues_destroy(struct be_adapter *adapter)
{
	struct be_queue_info *q;
2230 2231
	struct be_tx_obj *txo;
	u8 i;
S
Sathya Perla 已提交
2232

2233 2234 2235 2236 2237
	for_all_tx_queues(adapter, txo, i) {
		q = &txo->q;
		if (q->created)
			be_cmd_q_destroy(adapter, q, QTYPE_TXQ);
		be_queue_free(adapter, q);
S
Sathya Perla 已提交
2238

2239 2240 2241 2242 2243
		q = &txo->cq;
		if (q->created)
			be_cmd_q_destroy(adapter, q, QTYPE_CQ);
		be_queue_free(adapter, q);
	}
S
Sathya Perla 已提交
2244 2245
}

2246
static int be_tx_qs_create(struct be_adapter *adapter)
S
Sathya Perla 已提交
2247
{
S
Sathya Perla 已提交
2248
	struct be_queue_info *cq, *eq;
2249
	struct be_tx_obj *txo;
2250
	int status, i;
S
Sathya Perla 已提交
2251

2252
	adapter->num_tx_qs = min(adapter->num_evt_qs, be_max_txqs(adapter));
2253

S
Sathya Perla 已提交
2254 2255 2256 2257 2258 2259
	for_all_tx_queues(adapter, txo, i) {
		cq = &txo->cq;
		status = be_queue_alloc(adapter, cq, TX_CQ_LEN,
					sizeof(struct be_eth_tx_compl));
		if (status)
			return status;
2260

2261 2262 2263
		u64_stats_init(&txo->stats.sync);
		u64_stats_init(&txo->stats.sync_compl);

S
Sathya Perla 已提交
2264 2265 2266 2267 2268 2269 2270
		/* If num_evt_qs is less than num_tx_qs, then more than
		 * one txq share an eq
		 */
		eq = &adapter->eq_obj[i % adapter->num_evt_qs].q;
		status = be_cmd_cq_create(adapter, cq, eq, false, 3);
		if (status)
			return status;
S
Sathya Perla 已提交
2271

S
Sathya Perla 已提交
2272 2273 2274 2275
		status = be_queue_alloc(adapter, &txo->q, TX_Q_LEN,
					sizeof(struct be_eth_wrb));
		if (status)
			return status;
S
Sathya Perla 已提交
2276

V
Vasundhara Volam 已提交
2277
		status = be_cmd_txq_create(adapter, txo);
S
Sathya Perla 已提交
2278 2279
		if (status)
			return status;
2280
	}
S
Sathya Perla 已提交
2281

S
Sathya Perla 已提交
2282 2283
	dev_info(&adapter->pdev->dev, "created %d TX queue(s)\n",
		 adapter->num_tx_qs);
S
Sathya Perla 已提交
2284
	return 0;
S
Sathya Perla 已提交
2285 2286
}

S
Sathya Perla 已提交
2287
static void be_rx_cqs_destroy(struct be_adapter *adapter)
S
Sathya Perla 已提交
2288 2289
{
	struct be_queue_info *q;
2290 2291 2292 2293 2294 2295 2296 2297
	struct be_rx_obj *rxo;
	int i;

	for_all_rx_queues(adapter, rxo, i) {
		q = &rxo->cq;
		if (q->created)
			be_cmd_q_destroy(adapter, q, QTYPE_CQ);
		be_queue_free(adapter, q);
2298 2299 2300
	}
}

S
Sathya Perla 已提交
2301
static int be_rx_cqs_create(struct be_adapter *adapter)
S
Sathya Perla 已提交
2302
{
S
Sathya Perla 已提交
2303
	struct be_queue_info *eq, *cq;
2304 2305
	struct be_rx_obj *rxo;
	int rc, i;
S
Sathya Perla 已提交
2306

2307 2308 2309 2310 2311
	/* We can create as many RSS rings as there are EQs. */
	adapter->num_rx_qs = adapter->num_evt_qs;

	/* We'll use RSS only if atleast 2 RSS rings are supported.
	 * When RSS is used, we'll need a default RXQ for non-IP traffic.
S
Sathya Perla 已提交
2312
	 */
2313 2314 2315
	if (adapter->num_rx_qs > 1)
		adapter->num_rx_qs++;

S
Sathya Perla 已提交
2316
	adapter->big_page_size = (1 << get_order(rx_frag_size)) * PAGE_SIZE;
2317 2318 2319 2320
	for_all_rx_queues(adapter, rxo, i) {
		rxo->adapter = adapter;
		cq = &rxo->cq;
		rc = be_queue_alloc(adapter, cq, RX_CQ_LEN,
2321
				    sizeof(struct be_eth_rx_compl));
2322
		if (rc)
S
Sathya Perla 已提交
2323
			return rc;
2324

2325
		u64_stats_init(&rxo->stats.sync);
S
Sathya Perla 已提交
2326 2327
		eq = &adapter->eq_obj[i % adapter->num_evt_qs].q;
		rc = be_cmd_cq_create(adapter, cq, eq, false, 3);
2328
		if (rc)
S
Sathya Perla 已提交
2329
			return rc;
2330
	}
S
Sathya Perla 已提交
2331

S
Sathya Perla 已提交
2332 2333 2334
	dev_info(&adapter->pdev->dev,
		 "created %d RSS queue(s) and 1 default RX queue\n",
		 adapter->num_rx_qs - 1);
S
Sathya Perla 已提交
2335
	return 0;
2336 2337
}

S
Sathya Perla 已提交
2338 2339
static irqreturn_t be_intx(int irq, void *dev)
{
2340 2341 2342
	struct be_eq_obj *eqo = dev;
	struct be_adapter *adapter = eqo->adapter;
	int num_evts = 0;
S
Sathya Perla 已提交
2343

2344 2345 2346 2347 2348 2349 2350
	/* IRQ is not expected when NAPI is scheduled as the EQ
	 * will not be armed.
	 * But, this can happen on Lancer INTx where it takes
	 * a while to de-assert INTx or in BE2 where occasionaly
	 * an interrupt may be raised even when EQ is unarmed.
	 * If NAPI is already scheduled, then counting & notifying
	 * events will orphan them.
2351
	 */
2352
	if (napi_schedule_prep(&eqo->napi)) {
2353
		num_evts = events_get(eqo);
2354 2355 2356 2357 2358
		__napi_schedule(&eqo->napi);
		if (num_evts)
			eqo->spurious_intr = 0;
	}
	be_eq_notify(adapter, eqo->q.id, false, true, num_evts);
2359

2360 2361 2362
	/* Return IRQ_HANDLED only for the the first spurious intr
	 * after a valid intr to stop the kernel from branding
	 * this irq as a bad one!
2363
	 */
2364 2365 2366 2367
	if (num_evts || eqo->spurious_intr++ == 0)
		return IRQ_HANDLED;
	else
		return IRQ_NONE;
S
Sathya Perla 已提交
2368 2369
}

S
Sathya Perla 已提交
2370
static irqreturn_t be_msix(int irq, void *dev)
S
Sathya Perla 已提交
2371
{
S
Sathya Perla 已提交
2372
	struct be_eq_obj *eqo = dev;
S
Sathya Perla 已提交
2373

2374 2375
	be_eq_notify(eqo->adapter, eqo->q.id, false, true, 0);
	napi_schedule(&eqo->napi);
S
Sathya Perla 已提交
2376 2377 2378
	return IRQ_HANDLED;
}

2379
static inline bool do_gro(struct be_rx_compl_info *rxcp)
S
Sathya Perla 已提交
2380
{
2381
	return (rxcp->tcpf && !rxcp->err && rxcp->l4_csum) ? true : false;
S
Sathya Perla 已提交
2382 2383
}

S
Sathya Perla 已提交
2384
static int be_process_rx(struct be_rx_obj *rxo, struct napi_struct *napi,
2385
			 int budget, int polling)
S
Sathya Perla 已提交
2386
{
2387 2388
	struct be_adapter *adapter = rxo->adapter;
	struct be_queue_info *rx_cq = &rxo->cq;
2389
	struct be_rx_compl_info *rxcp;
S
Sathya Perla 已提交
2390 2391 2392
	u32 work_done;

	for (work_done = 0; work_done < budget; work_done++) {
2393
		rxcp = be_rx_compl_get(rxo);
S
Sathya Perla 已提交
2394 2395 2396
		if (!rxcp)
			break;

2397 2398 2399 2400 2401 2402
		/* Is it a flush compl that has no data */
		if (unlikely(rxcp->num_rcvd == 0))
			goto loop_continue;

		/* Discard compl with partial DMA Lancer B0 */
		if (unlikely(!rxcp->pkt_size)) {
S
Sathya Perla 已提交
2403
			be_rx_compl_discard(rxo, rxcp);
2404 2405 2406 2407 2408 2409 2410
			goto loop_continue;
		}

		/* On BE drop pkts that arrive due to imperfect filtering in
		 * promiscuous mode on some skews
		 */
		if (unlikely(rxcp->port != adapter->port_num &&
2411
			     !lancer_chip(adapter))) {
S
Sathya Perla 已提交
2412
			be_rx_compl_discard(rxo, rxcp);
2413
			goto loop_continue;
2414
		}
2415

2416 2417
		/* Don't do gro when we're busy_polling */
		if (do_gro(rxcp) && polling != BUSY_POLLING)
S
Sathya Perla 已提交
2418
			be_rx_compl_process_gro(rxo, napi, rxcp);
2419
		else
2420 2421
			be_rx_compl_process(rxo, napi, rxcp);

2422
loop_continue:
2423
		be_rx_stats_update(rxo, rxcp);
S
Sathya Perla 已提交
2424 2425
	}

S
Sathya Perla 已提交
2426 2427
	if (work_done) {
		be_cq_notify(adapter, rx_cq->id, true, work_done);
2428

2429 2430 2431 2432 2433
		/* When an rx-obj gets into post_starved state, just
		 * let be_worker do the posting.
		 */
		if (atomic_read(&rxo->q.used) < RX_FRAGS_REFILL_WM &&
		    !rxo->rx_post_starved)
S
Sathya Perla 已提交
2434
			be_post_rx_frags(rxo, GFP_ATOMIC);
S
Sathya Perla 已提交
2435
	}
S
Sathya Perla 已提交
2436

S
Sathya Perla 已提交
2437 2438 2439
	return work_done;
}

S
Sathya Perla 已提交
2440 2441
static bool be_process_tx(struct be_adapter *adapter, struct be_tx_obj *txo,
			  int budget, int idx)
S
Sathya Perla 已提交
2442 2443
{
	struct be_eth_tx_compl *txcp;
S
Sathya Perla 已提交
2444
	int num_wrbs = 0, work_done;
2445

S
Sathya Perla 已提交
2446 2447 2448 2449 2450
	for (work_done = 0; work_done < budget; work_done++) {
		txcp = be_tx_compl_get(&txo->cq);
		if (!txcp)
			break;
		num_wrbs += be_tx_compl_process(adapter, txo,
2451 2452 2453
						AMAP_GET_BITS(struct
							      amap_eth_tx_compl,
							      wrb_index, txcp));
S
Sathya Perla 已提交
2454
	}
S
Sathya Perla 已提交
2455

S
Sathya Perla 已提交
2456 2457 2458
	if (work_done) {
		be_cq_notify(adapter, txo->cq.id, true, work_done);
		atomic_sub(num_wrbs, &txo->q.used);
2459

S
Sathya Perla 已提交
2460 2461 2462
		/* As Tx wrbs have been freed up, wake up netdev queue
		 * if it was stopped due to lack of tx wrbs.  */
		if (__netif_subqueue_stopped(adapter->netdev, idx) &&
2463
		    atomic_read(&txo->q.used) < txo->q.len / 2) {
S
Sathya Perla 已提交
2464
			netif_wake_subqueue(adapter->netdev, idx);
2465
		}
S
Sathya Perla 已提交
2466 2467 2468 2469

		u64_stats_update_begin(&tx_stats(txo)->sync_compl);
		tx_stats(txo)->tx_compl += work_done;
		u64_stats_update_end(&tx_stats(txo)->sync_compl);
S
Sathya Perla 已提交
2470
	}
S
Sathya Perla 已提交
2471 2472
	return (work_done < budget); /* Done */
}
S
Sathya Perla 已提交
2473

2474
int be_poll(struct napi_struct *napi, int budget)
S
Sathya Perla 已提交
2475 2476 2477
{
	struct be_eq_obj *eqo = container_of(napi, struct be_eq_obj, napi);
	struct be_adapter *adapter = eqo->adapter;
2478
	int max_work = 0, work, i, num_evts;
2479
	struct be_rx_obj *rxo;
S
Sathya Perla 已提交
2480
	bool tx_done;
S
Sathya Perla 已提交
2481

2482 2483
	num_evts = events_get(eqo);

S
Sathya Perla 已提交
2484 2485 2486 2487 2488 2489
	/* Process all TXQs serviced by this EQ */
	for (i = eqo->idx; i < adapter->num_tx_qs; i += adapter->num_evt_qs) {
		tx_done = be_process_tx(adapter, &adapter->tx_obj[i],
					eqo->tx_budget, i);
		if (!tx_done)
			max_work = budget;
S
Sathya Perla 已提交
2490 2491
	}

2492 2493 2494 2495 2496 2497 2498 2499 2500 2501 2502 2503
	if (be_lock_napi(eqo)) {
		/* This loop will iterate twice for EQ0 in which
		 * completions of the last RXQ (default one) are also processed
		 * For other EQs the loop iterates only once
		 */
		for_all_rx_queues_on_eq(adapter, eqo, rxo, i) {
			work = be_process_rx(rxo, napi, budget, NAPI_POLLING);
			max_work = max(work, max_work);
		}
		be_unlock_napi(eqo);
	} else {
		max_work = budget;
S
Sathya Perla 已提交
2504
	}
S
Sathya Perla 已提交
2505

S
Sathya Perla 已提交
2506 2507
	if (is_mcc_eqo(eqo))
		be_process_mcc(adapter);
2508

S
Sathya Perla 已提交
2509 2510
	if (max_work < budget) {
		napi_complete(napi);
2511
		be_eq_notify(adapter, eqo->q.id, true, false, num_evts);
S
Sathya Perla 已提交
2512 2513
	} else {
		/* As we'll continue in polling mode, count and clear events */
2514
		be_eq_notify(adapter, eqo->q.id, false, false, num_evts);
2515
	}
S
Sathya Perla 已提交
2516
	return max_work;
S
Sathya Perla 已提交
2517 2518
}

2519 2520 2521 2522 2523 2524 2525 2526 2527 2528 2529 2530 2531 2532 2533 2534 2535 2536 2537 2538 2539 2540
#ifdef CONFIG_NET_RX_BUSY_POLL
/* Busy-poll entry point for one event queue.
 *
 * Returns LL_FLUSH_BUSY when the busy-poll lock cannot be taken. Otherwise
 * the RX queues on this EQ are polled in turn with a budget of 4, stopping
 * at the first queue that yields packets; the value returned is the result
 * of the last queue polled.
 */
static int be_busy_poll(struct napi_struct *napi)
{
	struct be_eq_obj *eqo = container_of(napi, struct be_eq_obj, napi);
	struct be_adapter *adapter = eqo->adapter;
	struct be_rx_obj *rxo;
	int i, work = 0;

	if (!be_lock_busy_poll(eqo))
		return LL_FLUSH_BUSY;

	for_all_rx_queues_on_eq(adapter, eqo, rxo, i) {
		work = be_process_rx(rxo, napi, 4, BUSY_POLLING);
		if (work)
			break;
	}

	be_unlock_busy_poll(eqo);
	return work;
}
#endif

2541
void be_detect_error(struct be_adapter *adapter)
2542
{
2543 2544
	u32 ue_lo = 0, ue_hi = 0, ue_lo_mask = 0, ue_hi_mask = 0;
	u32 sliport_status = 0, sliport_err1 = 0, sliport_err2 = 0;
2545
	u32 i;
2546 2547 2548
	bool error_detected = false;
	struct device *dev = &adapter->pdev->dev;
	struct net_device *netdev = adapter->netdev;
2549

2550
	if (be_hw_error(adapter))
2551 2552
		return;

2553 2554 2555 2556
	if (lancer_chip(adapter)) {
		sliport_status = ioread32(adapter->db + SLIPORT_STATUS_OFFSET);
		if (sliport_status & SLIPORT_STATUS_ERR_MASK) {
			sliport_err1 = ioread32(adapter->db +
2557
						SLIPORT_ERROR1_OFFSET);
2558
			sliport_err2 = ioread32(adapter->db +
2559
						SLIPORT_ERROR2_OFFSET);
2560 2561 2562 2563 2564 2565 2566 2567 2568 2569 2570 2571 2572 2573 2574
			adapter->hw_error = true;
			/* Do not log error messages if its a FW reset */
			if (sliport_err1 == SLIPORT_ERROR_FW_RESET1 &&
			    sliport_err2 == SLIPORT_ERROR_FW_RESET2) {
				dev_info(dev, "Firmware update in progress\n");
			} else {
				error_detected = true;
				dev_err(dev, "Error detected in the card\n");
				dev_err(dev, "ERR: sliport status 0x%x\n",
					sliport_status);
				dev_err(dev, "ERR: sliport error1 0x%x\n",
					sliport_err1);
				dev_err(dev, "ERR: sliport error2 0x%x\n",
					sliport_err2);
			}
2575 2576 2577
		}
	} else {
		pci_read_config_dword(adapter->pdev,
2578
				      PCICFG_UE_STATUS_LOW, &ue_lo);
2579
		pci_read_config_dword(adapter->pdev,
2580
				      PCICFG_UE_STATUS_HIGH, &ue_hi);
2581
		pci_read_config_dword(adapter->pdev,
2582
				      PCICFG_UE_STATUS_LOW_MASK, &ue_lo_mask);
2583
		pci_read_config_dword(adapter->pdev,
2584
				      PCICFG_UE_STATUS_HI_MASK, &ue_hi_mask);
2585

2586 2587
		ue_lo = (ue_lo & ~ue_lo_mask);
		ue_hi = (ue_hi & ~ue_hi_mask);
2588

2589 2590 2591 2592
		/* On certain platforms BE hardware can indicate spurious UEs.
		 * Allow HW to stop working completely in case of a real UE.
		 * Hence not setting the hw_error for UE detection.
		 */
2593

2594 2595 2596 2597 2598 2599 2600 2601 2602 2603 2604 2605 2606 2607 2608 2609 2610
		if (ue_lo || ue_hi) {
			error_detected = true;
			dev_err(dev,
				"Unrecoverable Error detected in the adapter");
			dev_err(dev, "Please reboot server to recover");
			if (skyhawk_chip(adapter))
				adapter->hw_error = true;
			for (i = 0; ue_lo; ue_lo >>= 1, i++) {
				if (ue_lo & 1)
					dev_err(dev, "UE: %s bit set\n",
						ue_status_low_desc[i]);
			}
			for (i = 0; ue_hi; ue_hi >>= 1, i++) {
				if (ue_hi & 1)
					dev_err(dev, "UE: %s bit set\n",
						ue_status_hi_desc[i]);
			}
2611 2612
		}
	}
2613 2614
	if (error_detected)
		netif_carrier_off(netdev);
2615 2616
}

2617 2618
static void be_msix_disable(struct be_adapter *adapter)
{
2619
	if (msix_enabled(adapter)) {
2620
		pci_disable_msix(adapter->pdev);
2621
		adapter->num_msix_vec = 0;
2622
		adapter->num_msix_roce_vec = 0;
2623 2624 2625
	}
}

2626
static int be_msix_enable(struct be_adapter *adapter)
S
Sathya Perla 已提交
2627
{
2628
	int i, num_vec;
S
Sathya Perla 已提交
2629
	struct device *dev = &adapter->pdev->dev;
S
Sathya Perla 已提交
2630

2631 2632 2633 2634 2635 2636 2637 2638 2639
	/* If RoCE is supported, program the max number of NIC vectors that
	 * may be configured via set-channels, along with vectors needed for
	 * RoCe. Else, just program the number we'll use initially.
	 */
	if (be_roce_supported(adapter))
		num_vec = min_t(int, 2 * be_max_eqs(adapter),
				2 * num_online_cpus());
	else
		num_vec = adapter->cfg_num_qs;
2640

2641
	for (i = 0; i < num_vec; i++)
S
Sathya Perla 已提交
2642 2643
		adapter->msix_entries[i].entry = i;

2644 2645 2646 2647
	num_vec = pci_enable_msix_range(adapter->pdev, adapter->msix_entries,
					MIN_MSIX_VECTORS, num_vec);
	if (num_vec < 0)
		goto fail;
2648 2649 2650 2651 2652 2653 2654 2655 2656 2657 2658

	if (be_roce_supported(adapter) && num_vec > MIN_MSIX_VECTORS) {
		adapter->num_msix_roce_vec = num_vec / 2;
		dev_info(dev, "enabled %d MSI-x vector(s) for RoCE\n",
			 adapter->num_msix_roce_vec);
	}

	adapter->num_msix_vec = num_vec - adapter->num_msix_roce_vec;

	dev_info(dev, "enabled %d MSI-x vector(s) for NIC\n",
		 adapter->num_msix_vec);
2659
	return 0;
2660 2661 2662 2663 2664 2665 2666 2667

fail:
	dev_warn(dev, "MSIx enable failed\n");

	/* INTx is not supported in VFs, so fail probe if enable_msix fails */
	if (!be_physfn(adapter))
		return num_vec;
	return 0;
S
Sathya Perla 已提交
2668 2669
}

2670
static inline int be_msix_vec_get(struct be_adapter *adapter,
2671
				  struct be_eq_obj *eqo)
2672
{
S
Sathya Perla 已提交
2673
	return adapter->msix_entries[eqo->msix_idx].vector;
2674
}
S
Sathya Perla 已提交
2675

2676 2677
static int be_msix_register(struct be_adapter *adapter)
{
S
Sathya Perla 已提交
2678 2679 2680
	struct net_device *netdev = adapter->netdev;
	struct be_eq_obj *eqo;
	int status, i, vec;
S
Sathya Perla 已提交
2681

S
Sathya Perla 已提交
2682 2683 2684 2685
	for_all_evt_queues(adapter, eqo, i) {
		sprintf(eqo->desc, "%s-q%d", netdev->name, i);
		vec = be_msix_vec_get(adapter, eqo);
		status = request_irq(vec, be_msix, 0, eqo->desc, eqo);
2686 2687 2688
		if (status)
			goto err_msix;
	}
2689

S
Sathya Perla 已提交
2690
	return 0;
2691
err_msix:
S
Sathya Perla 已提交
2692 2693 2694
	for (i--, eqo = &adapter->eq_obj[i]; i >= 0; i--, eqo--)
		free_irq(be_msix_vec_get(adapter, eqo), eqo);
	dev_warn(&adapter->pdev->dev, "MSIX Request IRQ failed - err %d\n",
2695
		 status);
2696
	be_msix_disable(adapter);
S
Sathya Perla 已提交
2697 2698 2699 2700 2701 2702 2703 2704
	return status;
}

/* Register the adapter's interrupt handler(s).
 *
 * When MSI-x is enabled, be_msix_register() is tried first. If it fails on a
 * VF its status is returned; on a PF the code falls through to INTx.
 * For INTx the PCI device's irq is requested as a shared line with the first
 * event queue as the handler cookie.
 *
 * Sets adapter->isr_registered and returns 0 on success, otherwise returns the
 * status of the failing registration.
 */
static int be_irq_register(struct be_adapter *adapter)
{
	struct net_device *netdev = adapter->netdev;
	int status;

	if (msix_enabled(adapter)) {
		status = be_msix_register(adapter);
		if (status == 0)
			goto done;
		/* INTx is not supported for VF */
		if (!be_physfn(adapter))
			return status;
	}

	/* INTx: only the first EQ is used */
	netdev->irq = adapter->pdev->irq;
	status = request_irq(netdev->irq, be_intx, IRQF_SHARED, netdev->name,
			     &adapter->eq_obj[0]);
	if (status) {
		dev_err(&adapter->pdev->dev,
			"INTx request IRQ failed - err %d\n", status);
		return status;
	}
done:
	adapter->isr_registered = true;
	return 0;
}

static void be_irq_unregister(struct be_adapter *adapter)
{
	struct net_device *netdev = adapter->netdev;
S
Sathya Perla 已提交
2731
	struct be_eq_obj *eqo;
2732
	int i;
S
Sathya Perla 已提交
2733 2734 2735 2736 2737

	if (!adapter->isr_registered)
		return;

	/* INTx */
2738
	if (!msix_enabled(adapter)) {
2739
		free_irq(netdev->irq, &adapter->eq_obj[0]);
S
Sathya Perla 已提交
2740 2741 2742 2743
		goto done;
	}

	/* MSIx */
S
Sathya Perla 已提交
2744 2745
	for_all_evt_queues(adapter, eqo, i)
		free_irq(be_msix_vec_get(adapter, eqo), eqo);
2746

S
Sathya Perla 已提交
2747 2748 2749 2750
done:
	adapter->isr_registered = false;
}

S
Sathya Perla 已提交
2751
static void be_rx_qs_destroy(struct be_adapter *adapter)
2752 2753 2754 2755 2756 2757 2758 2759 2760
{
	struct be_queue_info *q;
	struct be_rx_obj *rxo;
	int i;

	for_all_rx_queues(adapter, rxo, i) {
		q = &rxo->q;
		if (q->created) {
			be_cmd_rxq_destroy(adapter, q);
S
Sathya Perla 已提交
2761
			be_rx_cq_clean(rxo);
2762
		}
S
Sathya Perla 已提交
2763
		be_queue_free(adapter, q);
2764 2765 2766
	}
}

2767 2768 2769
static int be_close(struct net_device *netdev)
{
	struct be_adapter *adapter = netdev_priv(netdev);
S
Sathya Perla 已提交
2770 2771
	struct be_eq_obj *eqo;
	int i;
2772

2773 2774 2775 2776 2777 2778
	/* This protection is needed as be_close() may be called even when the
	 * adapter is in cleared state (after eeh perm failure)
	 */
	if (!(adapter->flags & BE_FLAGS_SETUP_DONE))
		return 0;

2779 2780
	be_roce_dev_close(adapter);

2781 2782
	if (adapter->flags & BE_FLAGS_NAPI_ENABLED) {
		for_all_evt_queues(adapter, eqo, i) {
2783
			napi_disable(&eqo->napi);
2784 2785
			be_disable_busy_poll(eqo);
		}
2786
		adapter->flags &= ~BE_FLAGS_NAPI_ENABLED;
2787
	}
2788 2789 2790 2791 2792 2793

	be_async_mcc_disable(adapter);

	/* Wait for all pending tx completions to arrive so that
	 * all tx skbs are freed.
	 */
S
Sathya Perla 已提交
2794
	netif_tx_disable(netdev);
2795
	be_tx_compl_clean(adapter);
2796 2797 2798

	be_rx_qs_destroy(adapter);

2799 2800 2801 2802 2803
	for (i = 1; i < (adapter->uc_macs + 1); i++)
		be_cmd_pmac_del(adapter, adapter->if_handle,
				adapter->pmac_id[i], 0);
	adapter->uc_macs = 0;

2804
	for_all_evt_queues(adapter, eqo, i) {
S
Sathya Perla 已提交
2805 2806 2807 2808 2809
		if (msix_enabled(adapter))
			synchronize_irq(be_msix_vec_get(adapter, eqo));
		else
			synchronize_irq(netdev->irq);
		be_eq_clean(eqo);
2810 2811
	}

2812 2813
	be_irq_unregister(adapter);

2814 2815 2816
	return 0;
}

S
Sathya Perla 已提交
2817
static int be_rx_qs_create(struct be_adapter *adapter)
2818 2819
{
	struct be_rx_obj *rxo;
2820
	int rc, i, j;
2821 2822
	u8 rss_hkey[RSS_HASH_KEY_LEN];
	struct rss_info *rss = &adapter->rss_info;
2823 2824

	for_all_rx_queues(adapter, rxo, i) {
S
Sathya Perla 已提交
2825 2826 2827 2828 2829 2830 2831 2832 2833 2834 2835 2836 2837 2838
		rc = be_queue_alloc(adapter, &rxo->q, RX_Q_LEN,
				    sizeof(struct be_eth_rx_d));
		if (rc)
			return rc;
	}

	/* The FW would like the default RXQ to be created first */
	rxo = default_rxo(adapter);
	rc = be_cmd_rxq_create(adapter, &rxo->q, rxo->cq.id, rx_frag_size,
			       adapter->if_handle, false, &rxo->rss_id);
	if (rc)
		return rc;

	for_all_rss_queues(adapter, rxo, i) {
2839
		rc = be_cmd_rxq_create(adapter, &rxo->q, rxo->cq.id,
S
Sathya Perla 已提交
2840 2841
				       rx_frag_size, adapter->if_handle,
				       true, &rxo->rss_id);
2842 2843 2844 2845 2846
		if (rc)
			return rc;
	}

	if (be_multi_rxq(adapter)) {
2847 2848
		for (j = 0; j < RSS_INDIR_TABLE_LEN;
			j += adapter->num_rx_qs - 1) {
2849
			for_all_rss_queues(adapter, rxo, i) {
2850
				if ((j + i) >= RSS_INDIR_TABLE_LEN)
2851
					break;
2852 2853
				rss->rsstable[j + i] = rxo->rss_id;
				rss->rss_queue[j + i] = i;
2854 2855
			}
		}
2856 2857
		rss->rss_flags = RSS_ENABLE_TCP_IPV4 | RSS_ENABLE_IPV4 |
			RSS_ENABLE_TCP_IPV6 | RSS_ENABLE_IPV6;
2858 2859

		if (!BEx_chip(adapter))
2860 2861
			rss->rss_flags |= RSS_ENABLE_UDP_IPV4 |
				RSS_ENABLE_UDP_IPV6;
2862 2863
	} else {
		/* Disable RSS, if only default RX Q is created */
2864
		rss->rss_flags = RSS_ENABLE_NONE;
2865
	}
2866

2867
	get_random_bytes(rss_hkey, RSS_HASH_KEY_LEN);
2868
	rc = be_cmd_rss_config(adapter, rss->rsstable, rss->rss_flags,
2869
			       128, rss_hkey);
2870
	if (rc) {
2871
		rss->rss_flags = RSS_ENABLE_NONE;
2872
		return rc;
2873 2874
	}

2875 2876
	memcpy(rss->rss_hkey, rss_hkey, RSS_HASH_KEY_LEN);

2877
	/* First time posting */
S
Sathya Perla 已提交
2878
	for_all_rx_queues(adapter, rxo, i)
2879
		be_post_rx_frags(rxo, GFP_KERNEL);
2880 2881 2882
	return 0;
}

S
Sathya Perla 已提交
2883 2884 2885
static int be_open(struct net_device *netdev)
{
	struct be_adapter *adapter = netdev_priv(netdev);
S
Sathya Perla 已提交
2886
	struct be_eq_obj *eqo;
2887
	struct be_rx_obj *rxo;
S
Sathya Perla 已提交
2888
	struct be_tx_obj *txo;
2889
	u8 link_status;
2890
	int status, i;
2891

S
Sathya Perla 已提交
2892
	status = be_rx_qs_create(adapter);
2893 2894 2895
	if (status)
		goto err;

2896 2897 2898
	status = be_irq_register(adapter);
	if (status)
		goto err;
2899

S
Sathya Perla 已提交
2900
	for_all_rx_queues(adapter, rxo, i)
2901
		be_cq_notify(adapter, rxo->cq.id, true, 0);
2902

S
Sathya Perla 已提交
2903 2904 2905
	for_all_tx_queues(adapter, txo, i)
		be_cq_notify(adapter, txo->cq.id, true, 0);

2906 2907
	be_async_mcc_enable(adapter);

S
Sathya Perla 已提交
2908 2909
	for_all_evt_queues(adapter, eqo, i) {
		napi_enable(&eqo->napi);
2910
		be_enable_busy_poll(eqo);
2911
		be_eq_notify(adapter, eqo->q.id, true, true, 0);
S
Sathya Perla 已提交
2912
	}
2913
	adapter->flags |= BE_FLAGS_NAPI_ENABLED;
S
Sathya Perla 已提交
2914

2915
	status = be_cmd_link_status_query(adapter, NULL, &link_status, 0);
2916 2917 2918
	if (!status)
		be_link_status_update(adapter, link_status);

S
Sathya Perla 已提交
2919
	netif_tx_start_all_queues(netdev);
2920
	be_roce_dev_open(adapter);
2921

2922
#ifdef CONFIG_BE2NET_VXLAN
2923 2924
	if (skyhawk_chip(adapter))
		vxlan_get_rx_port(netdev);
2925 2926
#endif

2927 2928 2929 2930
	return 0;
err:
	be_close(adapter->netdev);
	return -EIO;
2931 2932
}

2933 2934 2935 2936 2937 2938 2939 2940 2941
/* Enable or disable magic-packet Wake-on-LAN.
 *
 * @enable: true programs the PM control register, arms magic WoL with the
 *	    netdev's current MAC and enables PCI wake from D3hot/D3cold;
 *	    false programs an all-zero MAC and disables PCI wake.
 *
 * A DMA buffer for the FW command is allocated for the duration of the call.
 * Returns -ENOMEM if that allocation fails, the pci_write_config_dword()
 * status if it fails, otherwise the be_cmd_enable_magic_wol() status.
 */
static int be_setup_wol(struct be_adapter *adapter, bool enable)
{
	struct be_dma_mem cmd;
	int status = 0;
	u8 mac[ETH_ALEN];

	memset(mac, 0, ETH_ALEN);

	cmd.size = sizeof(struct be_cmd_req_acpi_wol_magic_config);
	cmd.va = dma_zalloc_coherent(&adapter->pdev->dev, cmd.size, &cmd.dma,
				     GFP_KERNEL);
	if (!cmd.va)
		return -ENOMEM;

	if (enable) {
		status = pci_write_config_dword(adapter->pdev,
						PCICFG_PM_CONTROL_OFFSET,
						PCICFG_PM_CONTROL_MASK);
		if (status) {
			dev_err(&adapter->pdev->dev,
				"Could not enable Wake-on-lan\n");
			goto out;
		}
		status = be_cmd_enable_magic_wol(adapter,
						 adapter->netdev->dev_addr,
						 &cmd);
		pci_enable_wake(adapter->pdev, PCI_D3hot, 1);
		pci_enable_wake(adapter->pdev, PCI_D3cold, 1);
	} else {
		status = be_cmd_enable_magic_wol(adapter, mac, &cmd);
		pci_enable_wake(adapter->pdev, PCI_D3hot, 0);
		pci_enable_wake(adapter->pdev, PCI_D3cold, 0);
	}

out:
	/* Single release point for the command buffer on every path */
	dma_free_coherent(&adapter->pdev->dev, cmd.size, cmd.va, cmd.dma);
	return status;
}

2973 2974 2975 2976 2977 2978
/*
 * Generate a seed MAC address from the PF MAC Address using jhash.
 * MAC Address for VFs are assigned incrementally starting from the seed.
 * These addresses are programmed in the ASIC by the PF and the VF driver
 * queries for the MAC address during its probe.
 */
2979
static int be_vf_eth_addr_config(struct be_adapter *adapter)
2980
{
2981
	u32 vf;
2982
	int status = 0;
2983
	u8 mac[ETH_ALEN];
2984
	struct be_vf_cfg *vf_cfg;
2985 2986 2987

	be_vf_eth_addr_generate(adapter, mac);

2988
	for_all_vfs(adapter, vf_cfg, vf) {
2989
		if (BEx_chip(adapter))
2990
			status = be_cmd_pmac_add(adapter, mac,
2991 2992
						 vf_cfg->if_handle,
						 &vf_cfg->pmac_id, vf + 1);
2993 2994 2995
		else
			status = be_cmd_set_mac(adapter, mac, vf_cfg->if_handle,
						vf + 1);
2996

2997 2998
		if (status)
			dev_err(&adapter->pdev->dev,
2999 3000
				"Mac address assignment failed for VF %d\n",
				vf);
3001
		else
3002
			memcpy(vf_cfg->mac_addr, mac, ETH_ALEN);
3003 3004 3005 3006 3007 3008

		mac[5] += 1;
	}
	return status;
}

3009 3010 3011 3012 3013 3014 3015
/* Read the active MAC of every VF with be_cmd_get_active_mac() and cache it
 * in vf_cfg->mac_addr. Stops at, and returns the status of, the first VF for
 * which the query fails; returns 0 when all queries succeed.
 */
static int be_vfs_mac_query(struct be_adapter *adapter)
{
	int status, vf;
	u8 mac[ETH_ALEN];
	struct be_vf_cfg *vf_cfg;

	for_all_vfs(adapter, vf_cfg, vf) {
		status = be_cmd_get_active_mac(adapter, vf_cfg->pmac_id,
					       mac, vf_cfg->if_handle,
					       false, vf+1);
		if (status)
			return status;
		memcpy(vf_cfg->mac_addr, mac, ETH_ALEN);
	}
	return 0;
}

3026
static void be_vf_clear(struct be_adapter *adapter)
3027
{
3028
	struct be_vf_cfg *vf_cfg;
3029 3030
	u32 vf;

3031
	if (pci_vfs_assigned(adapter->pdev)) {
3032 3033
		dev_warn(&adapter->pdev->dev,
			 "VFs are assigned to VMs: not disabling VFs\n");
3034 3035 3036
		goto done;
	}

3037 3038
	pci_disable_sriov(adapter->pdev);

3039
	for_all_vfs(adapter, vf_cfg, vf) {
3040
		if (BEx_chip(adapter))
3041 3042
			be_cmd_pmac_del(adapter, vf_cfg->if_handle,
					vf_cfg->pmac_id, vf + 1);
3043 3044 3045
		else
			be_cmd_set_mac(adapter, NULL, vf_cfg->if_handle,
				       vf + 1);
3046

3047 3048
		be_cmd_if_destroy(adapter, vf_cfg->if_handle, vf + 1);
	}
3049 3050 3051
done:
	kfree(adapter->vf_cfg);
	adapter->num_vfs = 0;
3052
	adapter->flags &= ~BE_FLAGS_SRIOV_ENABLED;
3053 3054
}

3055 3056 3057 3058 3059 3060 3061 3062
/* Destroy the adapter's queues: MCC queues first, then the RX completion
 * queues, the TX queues and finally the event queues.
 */
static void be_clear_queues(struct be_adapter *adapter)
{
	be_mcc_queues_destroy(adapter);
	be_rx_cqs_destroy(adapter);
	be_tx_queues_destroy(adapter);
	be_evt_queues_destroy(adapter);
}

3063
static void be_cancel_worker(struct be_adapter *adapter)
3064
{
3065 3066 3067 3068
	if (adapter->flags & BE_FLAGS_WORKER_SCHEDULED) {
		cancel_delayed_work_sync(&adapter->work);
		adapter->flags &= ~BE_FLAGS_WORKER_SCHEDULED;
	}
3069 3070
}

3071
static void be_mac_clear(struct be_adapter *adapter)
3072 3073 3074
{
	int i;

3075 3076 3077 3078 3079 3080 3081 3082 3083 3084 3085
	if (adapter->pmac_id) {
		for (i = 0; i < (adapter->uc_macs + 1); i++)
			be_cmd_pmac_del(adapter, adapter->if_handle,
					adapter->pmac_id[i], 0);
		adapter->uc_macs = 0;

		kfree(adapter->pmac_id);
		adapter->pmac_id = NULL;
	}
}

3086
#ifdef CONFIG_BE2NET_VXLAN
/* Turn VxLAN offloads off: convert the interface back from tunnel to normal
 * mode if offloads were enabled, reset the VxLAN port in FW to 0 if one was
 * set, and clear the corresponding adapter state.
 */
static void be_disable_vxlan_offloads(struct be_adapter *adapter)
{
	if (adapter->flags & BE_FLAGS_VXLAN_OFFLOADS)
		be_cmd_manage_iface(adapter, adapter->if_handle,
				    OP_CONVERT_TUNNEL_TO_NORMAL);

	if (adapter->vxlan_port)
		be_cmd_set_vxlan_port(adapter, 0);

	adapter->flags &= ~BE_FLAGS_VXLAN_OFFLOADS;
	adapter->vxlan_port = 0;
}
#endif
3100

3101 3102
static int be_clear(struct be_adapter *adapter)
{
3103
	be_cancel_worker(adapter);
3104

3105
	if (sriov_enabled(adapter))
3106 3107
		be_vf_clear(adapter);

3108 3109 3110 3111 3112 3113 3114
	/* Re-configure FW to distribute resources evenly across max-supported
	 * number of VFs, only when VFs are not already enabled.
	 */
	if (be_physfn(adapter) && !pci_vfs_assigned(adapter->pdev))
		be_cmd_set_sriov_config(adapter, adapter->pool_res,
					pci_sriov_get_totalvfs(adapter->pdev));

3115
#ifdef CONFIG_BE2NET_VXLAN
3116
	be_disable_vxlan_offloads(adapter);
3117
#endif
3118
	/* delete the primary mac along with the uc-mac list */
3119
	be_mac_clear(adapter);
3120

3121
	be_cmd_if_destroy(adapter, adapter->if_handle,  0);
3122

3123
	be_clear_queues(adapter);
3124

S
Sathya Perla 已提交
3125
	be_msix_disable(adapter);
3126
	adapter->flags &= ~BE_FLAGS_SETUP_DONE;
3127 3128 3129
	return 0;
}

3130
static int be_vfs_if_create(struct be_adapter *adapter)
3131
{
3132
	struct be_resources res = {0};
3133 3134
	struct be_vf_cfg *vf_cfg;
	u32 cap_flags, en_flags, vf;
3135
	int status = 0;
3136

3137 3138
	cap_flags = BE_IF_FLAGS_UNTAGGED | BE_IF_FLAGS_BROADCAST |
		    BE_IF_FLAGS_MULTICAST;
3139

3140
	for_all_vfs(adapter, vf_cfg, vf) {
3141 3142 3143 3144 3145 3146
		if (!BE3_chip(adapter)) {
			status = be_cmd_get_profile_config(adapter, &res,
							   vf + 1);
			if (!status)
				cap_flags = res.if_cap_flags;
		}
3147 3148 3149

		/* If a FW profile exists, then cap_flags are updated */
		en_flags = cap_flags & (BE_IF_FLAGS_UNTAGGED |
3150 3151 3152 3153 3154
					BE_IF_FLAGS_BROADCAST |
					BE_IF_FLAGS_MULTICAST);
		status =
		    be_cmd_if_create(adapter, cap_flags, en_flags,
				     &vf_cfg->if_handle, vf + 1);
3155 3156 3157 3158 3159
		if (status)
			goto err;
	}
err:
	return status;
3160 3161
}

3162
static int be_vf_setup_init(struct be_adapter *adapter)
3163
{
3164
	struct be_vf_cfg *vf_cfg;
3165 3166
	int vf;

3167 3168 3169 3170 3171
	adapter->vf_cfg = kcalloc(adapter->num_vfs, sizeof(*vf_cfg),
				  GFP_KERNEL);
	if (!adapter->vf_cfg)
		return -ENOMEM;

3172 3173 3174
	for_all_vfs(adapter, vf_cfg, vf) {
		vf_cfg->if_handle = -1;
		vf_cfg->pmac_id = -1;
3175
	}
3176
	return 0;
3177 3178
}

3179 3180
static int be_vf_setup(struct be_adapter *adapter)
{
3181
	struct device *dev = &adapter->pdev->dev;
3182
	struct be_vf_cfg *vf_cfg;
3183
	int status, old_vfs, vf;
3184
	u32 privileges;
3185

3186
	old_vfs = pci_num_vf(adapter->pdev);
3187 3188 3189 3190

	status = be_vf_setup_init(adapter);
	if (status)
		goto err;
3191

3192 3193 3194 3195 3196 3197
	if (old_vfs) {
		for_all_vfs(adapter, vf_cfg, vf) {
			status = be_cmd_get_if_id(adapter, vf_cfg, vf);
			if (status)
				goto err;
		}
3198

3199 3200 3201 3202
		status = be_vfs_mac_query(adapter);
		if (status)
			goto err;
	} else {
3203 3204 3205 3206
		status = be_vfs_if_create(adapter);
		if (status)
			goto err;

3207 3208 3209 3210
		status = be_vf_eth_addr_config(adapter);
		if (status)
			goto err;
	}
3211

3212
	for_all_vfs(adapter, vf_cfg, vf) {
3213 3214 3215 3216 3217 3218 3219 3220 3221 3222 3223 3224
		/* Allow VFs to programs MAC/VLAN filters */
		status = be_cmd_get_fn_privileges(adapter, &privileges, vf + 1);
		if (!status && !(privileges & BE_PRIV_FILTMGMT)) {
			status = be_cmd_set_fn_privileges(adapter,
							  privileges |
							  BE_PRIV_FILTMGMT,
							  vf + 1);
			if (!status)
				dev_info(dev, "VF%d has FILTMGMT privilege\n",
					 vf);
		}

3225 3226 3227
		/* Allow full available bandwidth */
		if (!old_vfs)
			be_cmd_config_qos(adapter, 0, 0, vf + 1);
3228

3229
		if (!old_vfs) {
3230
			be_cmd_enable_vf(adapter, vf + 1);
3231 3232 3233 3234
			be_cmd_set_logical_link_config(adapter,
						       IFLA_VF_LINK_STATE_AUTO,
						       vf+1);
		}
3235
	}
3236 3237 3238 3239 3240 3241 3242 3243 3244

	if (!old_vfs) {
		status = pci_enable_sriov(adapter->pdev, adapter->num_vfs);
		if (status) {
			dev_err(dev, "SRIOV enable failed\n");
			adapter->num_vfs = 0;
			goto err;
		}
	}
3245 3246

	adapter->flags |= BE_FLAGS_SRIOV_ENABLED;
3247 3248
	return 0;
err:
3249 3250
	dev_err(dev, "VF setup failed\n");
	be_vf_clear(adapter);
3251 3252 3253
	return status;
}

3254 3255 3256 3257
/* Converting function_mode bits on BE3 to SH mc_type enums.
 *
 * Checked in priority order: VNIC+QNQ -> vNIC1, QNQ -> FLEX10,
 * VNIC -> vNIC2, UMC_ENABLED -> UMC, none of these -> MC_NONE.
 */
static u8 be_convert_mc_type(u32 function_mode)
{
	if (function_mode & VNIC_MODE && function_mode & QNQ_MODE)
		return vNIC1;
	else if (function_mode & QNQ_MODE)
		return FLEX10;
	else if (function_mode & VNIC_MODE)
		return vNIC2;
	else if (function_mode & UMC_ENABLED)
		return UMC;
	else
		return MC_NONE;
}

3270 3271 3272 3273
/* On BE2/BE3 FW does not suggest the supported limits */
static void BEx_get_resources(struct be_adapter *adapter,
			      struct be_resources *res)
{
3274
	bool use_sriov = adapter->num_vfs ? 1 : 0;
3275 3276 3277 3278 3279 3280

	if (be_physfn(adapter))
		res->max_uc_mac = BE_UC_PMAC_COUNT;
	else
		res->max_uc_mac = BE_VF_UC_PMAC_COUNT;

3281 3282 3283 3284 3285 3286 3287 3288 3289 3290 3291 3292 3293 3294
	adapter->mc_type = be_convert_mc_type(adapter->function_mode);

	if (be_is_mc(adapter)) {
		/* Assuming that there are 4 channels per port,
		 * when multi-channel is enabled
		 */
		if (be_is_qnq_mode(adapter))
			res->max_vlans = BE_NUM_VLANS_SUPPORTED/8;
		else
			/* In a non-qnq multichannel mode, the pvid
			 * takes up one vlan entry
			 */
			res->max_vlans = (BE_NUM_VLANS_SUPPORTED / 4) - 1;
	} else {
3295
		res->max_vlans = BE_NUM_VLANS_SUPPORTED;
3296 3297
	}

3298 3299
	res->max_mcast_mac = BE_MAX_MC;

3300 3301 3302 3303 3304 3305 3306
	/* 1) For BE3 1Gb ports, FW does not support multiple TXQs
	 * 2) Create multiple TX rings on a BE3-R multi-channel interface
	 *    *only* if it is RSS-capable.
	 */
	if (BE2_chip(adapter) || use_sriov ||  (adapter->port_num > 1) ||
	    !be_physfn(adapter) || (be_is_mc(adapter) &&
	    !(adapter->function_caps & BE_FUNCTION_CAPS_RSS)))
3307 3308 3309 3310 3311 3312 3313 3314 3315 3316
		res->max_tx_qs = 1;
	else
		res->max_tx_qs = BE3_MAX_TX_QS;

	if ((adapter->function_caps & BE_FUNCTION_CAPS_RSS) &&
	    !use_sriov && be_physfn(adapter))
		res->max_rss_qs = (adapter->be3_native) ?
					   BE3_MAX_RSS_QS : BE2_MAX_RSS_QS;
	res->max_rx_qs = res->max_rss_qs + 1;

3317
	if (be_physfn(adapter))
3318
		res->max_evt_qs = (be_max_vfs(adapter) > 0) ?
3319 3320 3321
					BE3_SRIOV_MAX_EVT_QS : BE3_MAX_EVT_QS;
	else
		res->max_evt_qs = 1;
3322 3323 3324 3325 3326 3327

	res->if_cap_flags = BE_IF_CAP_FLAGS_WANT;
	if (!(adapter->function_caps & BE_FUNCTION_CAPS_RSS))
		res->if_cap_flags &= ~BE_IF_FLAGS_RSS;
}

3328 3329 3330
static void be_setup_init(struct be_adapter *adapter)
{
	adapter->vlan_prio_bmap = 0xff;
A
Ajit Khaparde 已提交
3331
	adapter->phy.link_speed = -1;
3332 3333 3334
	adapter->if_handle = -1;
	adapter->be3_native = false;
	adapter->promiscuous = false;
3335 3336 3337 3338
	if (be_physfn(adapter))
		adapter->cmd_privileges = MAX_PRIVILEGES;
	else
		adapter->cmd_privileges = MIN_PRIVILEGES;
3339 3340
}

3341 3342 3343 3344 3345 3346 3347 3348 3349 3350 3351 3352 3353 3354 3355 3356 3357 3358 3359 3360 3361 3362 3363 3364 3365 3366 3367 3368 3369 3370 3371 3372 3373 3374 3375 3376 3377 3378 3379 3380 3381 3382 3383 3384 3385 3386 3387 3388
static int be_get_sriov_config(struct be_adapter *adapter)
{
	struct device *dev = &adapter->pdev->dev;
	struct be_resources res = {0};
	int status, max_vfs, old_vfs;

	status = be_cmd_get_profile_config(adapter, &res, 0);
	if (status)
		return status;

	adapter->pool_res = res;

	/* Some old versions of BE3 FW don't report max_vfs value */
	if (BE3_chip(adapter) && !res.max_vfs) {
		max_vfs = pci_sriov_get_totalvfs(adapter->pdev);
		res.max_vfs = max_vfs > 0 ? min(MAX_VFS, max_vfs) : 0;
	}

	adapter->pool_res.max_vfs = res.max_vfs;
	pci_sriov_set_totalvfs(adapter->pdev, be_max_vfs(adapter));

	if (!be_max_vfs(adapter)) {
		if (num_vfs)
			dev_warn(dev, "device doesn't support SRIOV\n");
		adapter->num_vfs = 0;
		return 0;
	}

	/* validate num_vfs module param */
	old_vfs = pci_num_vf(adapter->pdev);
	if (old_vfs) {
		dev_info(dev, "%d VFs are already enabled\n", old_vfs);
		if (old_vfs != num_vfs)
			dev_warn(dev, "Ignoring num_vfs=%d setting\n", num_vfs);
		adapter->num_vfs = old_vfs;
	} else {
		if (num_vfs > be_max_vfs(adapter)) {
			dev_info(dev, "Resources unavailable to init %d VFs\n",
				 num_vfs);
			dev_info(dev, "Limiting to %d VFs\n",
				 be_max_vfs(adapter));
		}
		adapter->num_vfs = min_t(u16, num_vfs, be_max_vfs(adapter));
	}

	return 0;
}

3389
static int be_get_resources(struct be_adapter *adapter)
3390
{
3391 3392 3393
	struct device *dev = &adapter->pdev->dev;
	struct be_resources res = {0};
	int status;
3394

3395 3396 3397
	if (BEx_chip(adapter)) {
		BEx_get_resources(adapter, &res);
		adapter->res = res;
3398 3399
	}

3400 3401 3402 3403 3404 3405 3406 3407
	/* For Lancer, SH etc read per-function resource limits from FW.
	 * GET_FUNC_CONFIG returns per function guaranteed limits.
	 * GET_PROFILE_CONFIG returns PCI-E related limits PF-pool limits
	 */
	if (!BEx_chip(adapter)) {
		status = be_cmd_get_func_config(adapter, &res);
		if (status)
			return status;
3408

3409 3410 3411 3412
		/* If RoCE may be enabled stash away half the EQs for RoCE */
		if (be_roce_supported(adapter))
			res.max_evt_qs /= 2;
		adapter->res = res;
3413

3414 3415 3416 3417 3418 3419 3420
		dev_info(dev, "Max: txqs %d, rxqs %d, rss %d, eqs %d, vfs %d\n",
			 be_max_txqs(adapter), be_max_rxqs(adapter),
			 be_max_rss(adapter), be_max_eqs(adapter),
			 be_max_vfs(adapter));
		dev_info(dev, "Max: uc-macs %d, mc-macs %d, vlans %d\n",
			 be_max_uc(adapter), be_max_mc(adapter),
			 be_max_vlans(adapter));
3421
	}
3422

3423
	return 0;
3424 3425
}

3426 3427
static int be_get_config(struct be_adapter *adapter)
{
3428
	u16 profile_id;
3429
	int status;
3430

3431
	status = be_cmd_query_fw_cfg(adapter);
3432
	if (status)
3433
		return status;
3434

3435 3436 3437 3438 3439
	 if (be_physfn(adapter)) {
		status = be_cmd_get_active_profile(adapter, &profile_id);
		if (!status)
			dev_info(&adapter->pdev->dev,
				 "Using profile 0x%x\n", profile_id);
3440
	}
3441

3442
	if (!BE2_chip(adapter) && be_physfn(adapter)) {
3443 3444 3445 3446 3447 3448 3449 3450 3451 3452 3453 3454 3455 3456 3457 3458 3459 3460 3461
		status = be_get_sriov_config(adapter);
		if (status)
			return status;

		/* When the HW is in SRIOV capable configuration, the PF-pool
		 * resources are equally distributed across the max-number of
		 * VFs. The user may request only a subset of the max-vfs to be
		 * enabled. Based on num_vfs, redistribute the resources across
		 * num_vfs so that each VF will have access to more number of
		 * resources. This facility is not available in BE3 FW.
		 * Also, this is done by FW in Lancer chip.
		 */
		if (!pci_num_vf(adapter->pdev)) {
			status = be_cmd_set_sriov_config(adapter,
							 adapter->pool_res,
							 adapter->num_vfs);
			if (status)
				return status;
		}
3462 3463
	}

3464 3465 3466
	status = be_get_resources(adapter);
	if (status)
		return status;
3467

3468 3469
	adapter->pmac_id = kcalloc(be_max_uc(adapter),
				   sizeof(*adapter->pmac_id), GFP_KERNEL);
3470 3471
	if (!adapter->pmac_id)
		return -ENOMEM;
3472

3473 3474 3475 3476
	/* Sanitize cfg_num_qs based on HW and platform limits */
	adapter->cfg_num_qs = min(adapter->cfg_num_qs, be_max_qs(adapter));

	return 0;
3477 3478
}

3479 3480 3481 3482 3483 3484 3485 3486 3487 3488 3489 3490 3491 3492 3493 3494 3495
/* Establish the interface's primary MAC address.
 *
 * If the netdev has no address yet, the permanent MAC is read from FW and
 * copied to both dev_addr and perm_addr; otherwise the existing dev_addr is
 * reused. The address is then programmed as pmac_id[0], except on BEx VFs.
 *
 * Returns 0, or the status of be_cmd_get_perm_mac() if it fails. The status
 * of be_cmd_pmac_add() is not checked.
 */
static int be_mac_setup(struct be_adapter *adapter)
{
	u8 mac[ETH_ALEN];
	int status;

	if (is_zero_ether_addr(adapter->netdev->dev_addr)) {
		status = be_cmd_get_perm_mac(adapter, mac);
		if (status)
			return status;

		memcpy(adapter->netdev->dev_addr, mac, ETH_ALEN);
		memcpy(adapter->netdev->perm_addr, mac, ETH_ALEN);
	} else {
		/* Maybe the HW was reset; dev_addr must be re-programmed */
		memcpy(mac, adapter->netdev->dev_addr, ETH_ALEN);
	}

	/* For BE3-R VFs, the PF programs the initial MAC address */
	if (!(BEx_chip(adapter) && be_virtfn(adapter)))
		be_cmd_pmac_add(adapter, mac, adapter->if_handle,
				&adapter->pmac_id[0], 0);
	return 0;
}

3503 3504 3505 3506 3507 3508
/* Schedule the adapter's delayed work to run in one second and record that
 * in BE_FLAGS_WORKER_SCHEDULED so be_cancel_worker() knows to cancel it.
 */
static void be_schedule_worker(struct be_adapter *adapter)
{
	schedule_delayed_work(&adapter->work, msecs_to_jiffies(1000));
	adapter->flags |= BE_FLAGS_WORKER_SCHEDULED;
}

3509
static int be_setup_queues(struct be_adapter *adapter)
3510
{
3511
	struct net_device *netdev = adapter->netdev;
S
Sathya Perla 已提交
3512
	int status;
3513

3514
	status = be_evt_queues_create(adapter);
3515 3516
	if (status)
		goto err;
3517

3518
	status = be_tx_qs_create(adapter);
3519 3520
	if (status)
		goto err;
S
Sathya Perla 已提交
3521

3522
	status = be_rx_cqs_create(adapter);
S
Sathya Perla 已提交
3523
	if (status)
3524
		goto err;
S
Sathya Perla 已提交
3525

3526
	status = be_mcc_queues_create(adapter);
S
Sathya Perla 已提交
3527 3528 3529
	if (status)
		goto err;

3530 3531 3532 3533 3534 3535 3536 3537
	status = netif_set_real_num_rx_queues(netdev, adapter->num_rx_qs);
	if (status)
		goto err;

	status = netif_set_real_num_tx_queues(netdev, adapter->num_tx_qs);
	if (status)
		goto err;

3538 3539 3540 3541 3542 3543
	return 0;
err:
	dev_err(&adapter->pdev->dev, "queue_setup failed\n");
	return status;
}

3544 3545 3546 3547 3548 3549 3550 3551 3552 3553 3554 3555 3556 3557 3558 3559 3560 3561 3562 3563 3564 3565 3566 3567 3568 3569 3570 3571 3572 3573 3574 3575 3576 3577 3578 3579
/* Destroy and re-create all of the adapter's queues.
 *
 * A running interface is closed first and re-opened at the end. MSI-x is
 * disabled and re-enabled along the way unless some vectors are shared with
 * RoCE. The worker is cancelled for the duration and rescheduled once the
 * queues exist again.
 *
 * Returns 0 on success, or the status of the failing step (MSI-x enable,
 * queue setup or be_open()).
 */
int be_update_queues(struct be_adapter *adapter)
{
	struct net_device *ndev = adapter->netdev;
	int rc;

	if (netif_running(ndev))
		be_close(ndev);

	be_cancel_worker(adapter);

	/* The MSIx table cannot be re-programmed while any of its vectors
	 * are shared with RoCE, so it is only torn down when none are.
	 */
	if (adapter->num_msix_roce_vec == 0)
		be_msix_disable(adapter);

	be_clear_queues(adapter);

	if (!msix_enabled(adapter)) {
		rc = be_msix_enable(adapter);
		if (rc)
			return rc;
	}

	rc = be_setup_queues(adapter);
	if (rc)
		return rc;

	be_schedule_worker(adapter);

	if (!netif_running(ndev))
		return 0;

	return be_open(ndev);
}

3580 3581 3582 3583 3584 3585 3586 3587 3588 3589 3590 3591
static int be_setup(struct be_adapter *adapter)
{
	struct device *dev = &adapter->pdev->dev;
	u32 tx_fc, rx_fc, en_flags;
	int status;

	be_setup_init(adapter);

	if (!lancer_chip(adapter))
		be_cmd_req_native_mode(adapter);

	status = be_get_config(adapter);
S
Sathya Perla 已提交
3592
	if (status)
3593
		goto err;
S
Sathya Perla 已提交
3594

3595
	status = be_msix_enable(adapter);
S
Sathya Perla 已提交
3596
	if (status)
3597
		goto err;
S
Sathya Perla 已提交
3598

3599
	en_flags = BE_IF_FLAGS_UNTAGGED | BE_IF_FLAGS_BROADCAST |
3600
		   BE_IF_FLAGS_MULTICAST | BE_IF_FLAGS_PASS_L3L4_ERRORS;
3601
	if (adapter->function_caps & BE_FUNCTION_CAPS_RSS)
3602
		en_flags |= BE_IF_FLAGS_RSS;
3603 3604
	en_flags = en_flags & be_if_cap_flags(adapter);
	status = be_cmd_if_create(adapter, be_if_cap_flags(adapter), en_flags,
3605
				  &adapter->if_handle, 0);
3606
	if (status)
3607
		goto err;
S
Sathya Perla 已提交
3608

3609 3610
	/* Updating real_num_tx/rx_queues() requires rtnl_lock() */
	rtnl_lock();
3611
	status = be_setup_queues(adapter);
3612
	rtnl_unlock();
3613
	if (status)
3614 3615
		goto err;

3616 3617 3618
	be_cmd_get_fn_privileges(adapter, &adapter->cmd_privileges, 0);

	status = be_mac_setup(adapter);
S
Sathya Perla 已提交
3619 3620 3621
	if (status)
		goto err;

3622
	be_cmd_get_fw_ver(adapter);
3623

3624 3625 3626 3627 3628 3629
	if (BE2_chip(adapter) && fw_major_num(adapter->fw_ver) < 4) {
		dev_err(dev, "Firmware on card is old(%s), IRQs may not work.",
			adapter->fw_ver);
		dev_err(dev, "Please upgrade firmware to version >= 4.0\n");
	}

3630
	if (adapter->vlans_added)
S
Sathya Perla 已提交
3631
		be_vid_config(adapter);
3632

3633
	be_set_rx_mode(adapter->netdev);
3634

S
Suresh Reddy 已提交
3635 3636
	be_cmd_get_acpi_wol_cap(adapter);

3637
	be_cmd_get_flow_control(adapter, &tx_fc, &rx_fc);
3638

3639 3640
	if (rx_fc != adapter->rx_fc || tx_fc != adapter->tx_fc)
		be_cmd_set_flow_control(adapter, adapter->tx_fc,
3641
					adapter->rx_fc);
3642

3643 3644 3645 3646
	if (be_physfn(adapter))
		be_cmd_set_logical_link_config(adapter,
					       IFLA_VF_LINK_STATE_AUTO, 0);

3647 3648
	if (adapter->num_vfs)
		be_vf_setup(adapter);
3649

3650 3651
	status = be_cmd_get_phy_info(adapter);
	if (!status && be_pause_supported(adapter))
A
Ajit Khaparde 已提交
3652 3653
		adapter->phy.fc_autoneg = 1;

3654
	be_schedule_worker(adapter);
3655
	adapter->flags |= BE_FLAGS_SETUP_DONE;
3656
	return 0;
3657 3658 3659 3660
err:
	be_clear(adapter);
	return status;
}
S
Sathya Perla 已提交
3661

I
Ivan Vecera 已提交
3662 3663 3664 3665
#ifdef CONFIG_NET_POLL_CONTROLLER
/* Netpoll hook: for every event queue, notify the EQ and schedule its NAPI
 * context so pending events get processed by polling.
 * NOTE(review): the third be_eq_notify() argument is false here but true in
 * be_open(); presumably it is the "arm" flag - confirm against be_eq_notify().
 */
static void be_netpoll(struct net_device *netdev)
{
	struct be_adapter *adapter = netdev_priv(netdev);
	struct be_eq_obj *eqo;
	int i;

	for_all_evt_queues(adapter, eqo, i) {
		be_eq_notify(eqo->adapter, eqo->q.id, false, true, 0);
		napi_schedule(&eqo->napi);
	}
}
#endif

3678
/* 32-byte marker that get_fsec_info() searches for in a firmware file.
 * The first 16-byte row is "*** SE FLAS" followed by NUL padding; the second
 * row fills all 16 bytes and therefore carries no terminating NUL.
 */
static char flash_cookie[2][16] = {"*** SE FLAS", "H DIRECTORY *** "};
3679

3680 3681
static bool phy_flashing_required(struct be_adapter *adapter)
{
A
Ajit Khaparde 已提交
3682 3683
	return (adapter->phy.phy_type == TN_8022 &&
		adapter->phy.interface_type == PHY_TYPE_BASET_10GB);
3684 3685
}

3686 3687 3688 3689 3690 3691
/* Return true if the flash section info @fsec has an entry whose image type
 * equals @type. On BE2 chips @fsec is interpreted with the g2 layout
 * (struct flash_section_info_g2). Entry types are stored little-endian.
 */
static bool is_comp_in_ufi(struct be_adapter *adapter,
			   struct flash_section_info *fsec, int type)
{
	int i = 0, img_type = 0;
	struct flash_section_info_g2 *fsec_g2 = NULL;

	if (BE2_chip(adapter))
		fsec_g2 = (struct flash_section_info_g2 *)fsec;

	for (i = 0; i < MAX_FLASH_COMP; i++) {
		if (fsec_g2)
			img_type = le32_to_cpu(fsec_g2->fsec_entry[i].type);
		else
			img_type = le32_to_cpu(fsec->fsec_entry[i].type);

		if (img_type == type)
			return true;
	}
	return false;
}

J
Jingoo Han 已提交
3708
static struct flash_section_info *get_fsec_info(struct be_adapter *adapter,
3709 3710
						int header_size,
						const struct firmware *fw)
3711 3712 3713 3714 3715 3716 3717 3718 3719 3720 3721 3722 3723 3724
{
	struct flash_section_info *fsec = NULL;
	const u8 *p = fw->data;

	p += header_size;
	while (p < (fw->data + fw->size)) {
		fsec = (struct flash_section_info *)p;
		if (!memcmp(flash_cookie, fsec->cookie, sizeof(flash_cookie)))
			return fsec;
		p += 32;
	}
	return NULL;
}

3725 3726 3727 3728 3729 3730 3731 3732 3733 3734 3735 3736 3737 3738 3739 3740 3741 3742 3743 3744 3745 3746 3747
/* Compare the CRC of a flashed region with the CRC carried by the image.
 *
 * The 4-byte CRC of the region is read with be_cmd_get_flash_crc() and
 * compared with the last 4 bytes of the image, found in @p at
 * @hdr_size + @img_offset + @img_size - 4.
 *
 * *@crc_match is set to true when both are equal, false otherwise; it is left
 * untouched when the FW command fails. Returns 0 or the FW command status.
 */
static int be_check_flash_crc(struct be_adapter *adapter, const u8 *p,
			      u32 img_offset, u32 img_size, int hdr_size,
			      u16 img_optype, bool *crc_match)
{
	u8 flashed_crc[4];
	u32 file_crc_off;
	int rc;

	rc = be_cmd_get_flash_crc(adapter, flashed_crc, img_optype,
				  img_size - 4);
	if (rc)
		return rc;

	file_crc_off = hdr_size + img_offset + img_size - 4;

	/* Skip flashing, if crc of flashed region matches */
	*crc_match = (memcmp(flashed_crc, p + file_crc_off, 4) == 0);

	return 0;
}

3748
static int be_flash(struct be_adapter *adapter, const u8 *img,
3749
		    struct be_dma_mem *flash_cmd, int optype, int img_size)
3750 3751
{
	struct be_cmd_write_flashrom *req = flash_cmd->va;
3752 3753
	u32 total_bytes, flash_op, num_bytes;
	int status;
3754 3755 3756 3757 3758 3759 3760 3761 3762 3763 3764 3765 3766 3767 3768 3769 3770 3771 3772

	total_bytes = img_size;
	while (total_bytes) {
		num_bytes = min_t(u32, 32*1024, total_bytes);

		total_bytes -= num_bytes;

		if (!total_bytes) {
			if (optype == OPTYPE_PHY_FW)
				flash_op = FLASHROM_OPER_PHY_FLASH;
			else
				flash_op = FLASHROM_OPER_FLASH;
		} else {
			if (optype == OPTYPE_PHY_FW)
				flash_op = FLASHROM_OPER_PHY_SAVE;
			else
				flash_op = FLASHROM_OPER_SAVE;
		}

3773
		memcpy(req->data_buf, img, num_bytes);
3774 3775
		img += num_bytes;
		status = be_cmd_write_flashrom(adapter, flash_cmd, optype,
3776
					       flash_op, num_bytes);
3777
		if (base_status(status) == MCC_STATUS_ILLEGAL_REQUEST &&
3778 3779 3780
		    optype == OPTYPE_PHY_FW)
			break;
		else if (status)
3781 3782 3783 3784 3785
			return status;
	}
	return 0;
}

3786
/* For BE2, BE3 and BE3-R */
3787
static int be_flash_BEx(struct be_adapter *adapter,
3788 3789
			const struct firmware *fw,
			struct be_dma_mem *flash_cmd, int num_of_images)
3790
{
3791
	int img_hdrs_size = (num_of_images * sizeof(struct image_hdr));
3792
	struct device *dev = &adapter->pdev->dev;
3793
	struct flash_section_info *fsec = NULL;
3794 3795 3796 3797
	int status, i, filehdr_size, num_comp;
	const struct flash_comp *pflashcomp;
	bool crc_match;
	const u8 *p;
3798 3799 3800 3801 3802 3803 3804 3805 3806 3807 3808 3809 3810 3811 3812 3813 3814 3815 3816 3817 3818 3819

	struct flash_comp gen3_flash_types[] = {
		{ FLASH_iSCSI_PRIMARY_IMAGE_START_g3, OPTYPE_ISCSI_ACTIVE,
			FLASH_IMAGE_MAX_SIZE_g3, IMAGE_FIRMWARE_iSCSI},
		{ FLASH_REDBOOT_START_g3, OPTYPE_REDBOOT,
			FLASH_REDBOOT_IMAGE_MAX_SIZE_g3, IMAGE_BOOT_CODE},
		{ FLASH_iSCSI_BIOS_START_g3, OPTYPE_BIOS,
			FLASH_BIOS_IMAGE_MAX_SIZE_g3, IMAGE_OPTION_ROM_ISCSI},
		{ FLASH_PXE_BIOS_START_g3, OPTYPE_PXE_BIOS,
			FLASH_BIOS_IMAGE_MAX_SIZE_g3, IMAGE_OPTION_ROM_PXE},
		{ FLASH_FCoE_BIOS_START_g3, OPTYPE_FCOE_BIOS,
			FLASH_BIOS_IMAGE_MAX_SIZE_g3, IMAGE_OPTION_ROM_FCoE},
		{ FLASH_iSCSI_BACKUP_IMAGE_START_g3, OPTYPE_ISCSI_BACKUP,
			FLASH_IMAGE_MAX_SIZE_g3, IMAGE_FIRMWARE_BACKUP_iSCSI},
		{ FLASH_FCoE_PRIMARY_IMAGE_START_g3, OPTYPE_FCOE_FW_ACTIVE,
			FLASH_IMAGE_MAX_SIZE_g3, IMAGE_FIRMWARE_FCoE},
		{ FLASH_FCoE_BACKUP_IMAGE_START_g3, OPTYPE_FCOE_FW_BACKUP,
			FLASH_IMAGE_MAX_SIZE_g3, IMAGE_FIRMWARE_BACKUP_FCoE},
		{ FLASH_NCSI_START_g3, OPTYPE_NCSI_FW,
			FLASH_NCSI_IMAGE_MAX_SIZE_g3, IMAGE_NCSI},
		{ FLASH_PHY_FW_START_g3, OPTYPE_PHY_FW,
			FLASH_PHY_FW_IMAGE_MAX_SIZE_g3, IMAGE_FIRMWARE_PHY}
3820
	};
3821 3822 3823 3824 3825 3826 3827 3828 3829 3830 3831 3832 3833 3834 3835 3836 3837 3838

	struct flash_comp gen2_flash_types[] = {
		{ FLASH_iSCSI_PRIMARY_IMAGE_START_g2, OPTYPE_ISCSI_ACTIVE,
			FLASH_IMAGE_MAX_SIZE_g2, IMAGE_FIRMWARE_iSCSI},
		{ FLASH_REDBOOT_START_g2, OPTYPE_REDBOOT,
			FLASH_REDBOOT_IMAGE_MAX_SIZE_g2, IMAGE_BOOT_CODE},
		{ FLASH_iSCSI_BIOS_START_g2, OPTYPE_BIOS,
			FLASH_BIOS_IMAGE_MAX_SIZE_g2, IMAGE_OPTION_ROM_ISCSI},
		{ FLASH_PXE_BIOS_START_g2, OPTYPE_PXE_BIOS,
			FLASH_BIOS_IMAGE_MAX_SIZE_g2, IMAGE_OPTION_ROM_PXE},
		{ FLASH_FCoE_BIOS_START_g2, OPTYPE_FCOE_BIOS,
			FLASH_BIOS_IMAGE_MAX_SIZE_g2, IMAGE_OPTION_ROM_FCoE},
		{ FLASH_iSCSI_BACKUP_IMAGE_START_g2, OPTYPE_ISCSI_BACKUP,
			FLASH_IMAGE_MAX_SIZE_g2, IMAGE_FIRMWARE_BACKUP_iSCSI},
		{ FLASH_FCoE_PRIMARY_IMAGE_START_g2, OPTYPE_FCOE_FW_ACTIVE,
			FLASH_IMAGE_MAX_SIZE_g2, IMAGE_FIRMWARE_FCoE},
		{ FLASH_FCoE_BACKUP_IMAGE_START_g2, OPTYPE_FCOE_FW_BACKUP,
			 FLASH_IMAGE_MAX_SIZE_g2, IMAGE_FIRMWARE_BACKUP_FCoE}
3839 3840
	};

3841
	if (BE3_chip(adapter)) {
3842 3843
		pflashcomp = gen3_flash_types;
		filehdr_size = sizeof(struct flash_file_hdr_g3);
J
Joe Perches 已提交
3844
		num_comp = ARRAY_SIZE(gen3_flash_types);
3845 3846 3847
	} else {
		pflashcomp = gen2_flash_types;
		filehdr_size = sizeof(struct flash_file_hdr_g2);
J
Joe Perches 已提交
3848
		num_comp = ARRAY_SIZE(gen2_flash_types);
3849
	}
3850

3851 3852 3853
	/* Get flash section info*/
	fsec = get_fsec_info(adapter, filehdr_size + img_hdrs_size, fw);
	if (!fsec) {
3854
		dev_err(dev, "Invalid Cookie. FW image may be corrupted\n");
3855 3856
		return -1;
	}
3857
	for (i = 0; i < num_comp; i++) {
3858
		if (!is_comp_in_ufi(adapter, fsec, pflashcomp[i].img_type))
3859
			continue;
3860 3861 3862 3863 3864

		if ((pflashcomp[i].optype == OPTYPE_NCSI_FW) &&
		    memcmp(adapter->fw_ver, "3.102.148.0", 11) < 0)
			continue;

3865 3866
		if (pflashcomp[i].optype == OPTYPE_PHY_FW  &&
		    !phy_flashing_required(adapter))
3867
				continue;
3868

3869
		if (pflashcomp[i].optype == OPTYPE_REDBOOT) {
3870 3871 3872 3873 3874 3875 3876 3877 3878 3879 3880 3881 3882 3883
			status = be_check_flash_crc(adapter, fw->data,
						    pflashcomp[i].offset,
						    pflashcomp[i].size,
						    filehdr_size +
						    img_hdrs_size,
						    OPTYPE_REDBOOT, &crc_match);
			if (status) {
				dev_err(dev,
					"Could not get CRC for 0x%x region\n",
					pflashcomp[i].optype);
				continue;
			}

			if (crc_match)
3884 3885
				continue;
		}
3886

3887 3888
		p = fw->data + filehdr_size + pflashcomp[i].offset +
			img_hdrs_size;
3889 3890
		if (p + pflashcomp[i].size > fw->data + fw->size)
			return -1;
3891 3892

		status = be_flash(adapter, p, flash_cmd, pflashcomp[i].optype,
3893
				  pflashcomp[i].size);
3894
		if (status) {
3895
			dev_err(dev, "Flashing section type 0x%x failed\n",
3896 3897
				pflashcomp[i].img_type);
			return status;
3898 3899 3900 3901 3902
		}
	}
	return 0;
}

3903 3904 3905 3906 3907 3908 3909 3910 3911 3912 3913 3914 3915 3916 3917 3918 3919 3920 3921 3922 3923 3924 3925 3926 3927 3928 3929 3930 3931 3932 3933 3934 3935 3936 3937 3938 3939 3940 3941 3942 3943 3944 3945 3946 3947 3948 3949 3950 3951 3952 3953 3954
/* Return the flash op-type for a flash section entry.
 *
 * When the entry carries an explicit op-type (anything other than 0xFFFF)
 * that value is returned as is. Otherwise the op-type is derived from the
 * entry's image type; image types with no mapping yield 0xFFFF.
 */
static u16 be_get_img_optype(struct flash_section_entry fsec_entry)
{
	u16 optype = le16_to_cpu(fsec_entry.optype);

	if (optype != 0xFFFF)
		return optype;

	switch (le32_to_cpu(fsec_entry.type)) {
	case IMAGE_FIRMWARE_iSCSI:
		return OPTYPE_ISCSI_ACTIVE;
	case IMAGE_BOOT_CODE:
		return OPTYPE_REDBOOT;
	case IMAGE_OPTION_ROM_ISCSI:
		return OPTYPE_BIOS;
	case IMAGE_OPTION_ROM_PXE:
		return OPTYPE_PXE_BIOS;
	case IMAGE_OPTION_ROM_FCoE:
		return OPTYPE_FCOE_BIOS;
	case IMAGE_FIRMWARE_BACKUP_iSCSI:
		return OPTYPE_ISCSI_BACKUP;
	case IMAGE_NCSI:
		return OPTYPE_NCSI_FW;
	case IMAGE_FLASHISM_JUMPVECTOR:
		return OPTYPE_FLASHISM_JUMPVECTOR;
	case IMAGE_FIRMWARE_PHY:
		return OPTYPE_SH_PHY_FW;
	case IMAGE_REDBOOT_DIR:
		return OPTYPE_REDBOOT_DIR;
	case IMAGE_REDBOOT_CONFIG:
		return OPTYPE_REDBOOT_CONFIG;
	case IMAGE_UFI_DIR:
		return OPTYPE_UFI_DIR;
	default:
		/* Unknown image type: still 0xFFFF at this point */
		return optype;
	}
}

3955
static int be_flash_skyhawk(struct be_adapter *adapter,
3956 3957
			    const struct firmware *fw,
			    struct be_dma_mem *flash_cmd, int num_of_images)
3958
{
3959
	int img_hdrs_size = num_of_images * sizeof(struct image_hdr);
3960
	struct device *dev = &adapter->pdev->dev;
3961
	struct flash_section_info *fsec = NULL;
3962 3963 3964 3965 3966
	u32 img_offset, img_size, img_type;
	int status, i, filehdr_size;
	bool crc_match, old_fw_img;
	u16 img_optype;
	const u8 *p;
3967 3968 3969 3970

	filehdr_size = sizeof(struct flash_file_hdr_g3);
	fsec = get_fsec_info(adapter, filehdr_size + img_hdrs_size, fw);
	if (!fsec) {
3971
		dev_err(dev, "Invalid Cookie. FW image may be corrupted\n");
3972
		return -EINVAL;
3973 3974 3975 3976 3977
	}

	for (i = 0; i < le32_to_cpu(fsec->fsec_hdr.num_images); i++) {
		img_offset = le32_to_cpu(fsec->fsec_entry[i].offset);
		img_size   = le32_to_cpu(fsec->fsec_entry[i].pad_size);
3978 3979 3980
		img_type   = le32_to_cpu(fsec->fsec_entry[i].type);
		img_optype = be_get_img_optype(fsec->fsec_entry[i]);
		old_fw_img = fsec->fsec_entry[i].optype == 0xFFFF;
3981

3982
		if (img_optype == 0xFFFF)
3983
			continue;
3984 3985 3986 3987 3988 3989 3990 3991 3992 3993 3994 3995 3996 3997 3998 3999
		/* Don't bother verifying CRC if an old FW image is being
		 * flashed
		 */
		if (old_fw_img)
			goto flash;

		status = be_check_flash_crc(adapter, fw->data, img_offset,
					    img_size, filehdr_size +
					    img_hdrs_size, img_optype,
					    &crc_match);
		/* The current FW image on the card does not recognize the new
		 * FLASH op_type. The FW download is partially complete.
		 * Reboot the server now to enable FW image to recognize the
		 * new FLASH op_type. To complete the remaining process,
		 * download the same FW again after the reboot.
		 */
4000 4001
		if (base_status(status) == MCC_STATUS_ILLEGAL_REQUEST ||
		    base_status(status) == MCC_STATUS_ILLEGAL_FIELD) {
4002 4003 4004 4005 4006 4007 4008
			dev_err(dev, "Flash incomplete. Reset the server\n");
			dev_err(dev, "Download FW image again after reset\n");
			return -EAGAIN;
		} else if (status) {
			dev_err(dev, "Could not get CRC for 0x%x region\n",
				img_optype);
			return -EFAULT;
4009 4010
		}

4011 4012
		if (crc_match)
			continue;
4013

4014 4015
flash:
		p = fw->data + filehdr_size + img_offset + img_hdrs_size;
4016 4017 4018 4019
		if (p + img_size > fw->data + fw->size)
			return -1;

		status = be_flash(adapter, p, flash_cmd, img_optype, img_size);
4020 4021 4022
		/* For old FW images ignore ILLEGAL_FIELD error or errors on
		 * UFI_DIR region
		 */
4023 4024 4025 4026
		if (old_fw_img &&
		    (base_status(status) == MCC_STATUS_ILLEGAL_FIELD ||
		     (img_optype == OPTYPE_UFI_DIR &&
		      base_status(status) == MCC_STATUS_FAILED))) {
4027 4028 4029 4030 4031
			continue;
		} else if (status) {
			dev_err(dev, "Flashing section type 0x%x failed\n",
				img_type);
			return -EFAULT;
4032 4033 4034
		}
	}
	return 0;
4035 4036
}

4037
static int lancer_fw_download(struct be_adapter *adapter,
4038
			      const struct firmware *fw)
4039
{
4040 4041
#define LANCER_FW_DOWNLOAD_CHUNK      (32 * 1024)
#define LANCER_FW_DOWNLOAD_LOCATION   "/prg"
4042
	struct be_dma_mem flash_cmd;
4043 4044 4045 4046 4047 4048 4049 4050
	const u8 *data_ptr = NULL;
	u8 *dest_image_ptr = NULL;
	size_t image_size = 0;
	u32 chunk_size = 0;
	u32 data_written = 0;
	u32 offset = 0;
	int status = 0;
	u8 add_status = 0;
4051
	u8 change_status;
4052

4053
	if (!IS_ALIGNED(fw->size, sizeof(u32))) {
4054
		dev_err(&adapter->pdev->dev,
4055 4056 4057 4058
			"FW Image not properly aligned. "
			"Length must be 4 byte aligned.\n");
		status = -EINVAL;
		goto lancer_fw_exit;
4059 4060
	}

4061 4062 4063
	flash_cmd.size = sizeof(struct lancer_cmd_req_write_object)
				+ LANCER_FW_DOWNLOAD_CHUNK;
	flash_cmd.va = dma_alloc_coherent(&adapter->pdev->dev, flash_cmd.size,
4064
					  &flash_cmd.dma, GFP_KERNEL);
4065 4066 4067 4068
	if (!flash_cmd.va) {
		status = -ENOMEM;
		goto lancer_fw_exit;
	}
4069

4070 4071 4072 4073 4074 4075 4076 4077 4078 4079 4080 4081
	dest_image_ptr = flash_cmd.va +
				sizeof(struct lancer_cmd_req_write_object);
	image_size = fw->size;
	data_ptr = fw->data;

	while (image_size) {
		chunk_size = min_t(u32, image_size, LANCER_FW_DOWNLOAD_CHUNK);

		/* Copy the image chunk content. */
		memcpy(dest_image_ptr, data_ptr, chunk_size);

		status = lancer_cmd_write_object(adapter, &flash_cmd,
4082 4083 4084 4085
						 chunk_size, offset,
						 LANCER_FW_DOWNLOAD_LOCATION,
						 &data_written, &change_status,
						 &add_status);
4086 4087 4088 4089 4090 4091 4092 4093 4094 4095 4096
		if (status)
			break;

		offset += data_written;
		data_ptr += data_written;
		image_size -= data_written;
	}

	if (!status) {
		/* Commit the FW written */
		status = lancer_cmd_write_object(adapter, &flash_cmd,
4097 4098 4099 4100
						 0, offset,
						 LANCER_FW_DOWNLOAD_LOCATION,
						 &data_written, &change_status,
						 &add_status);
4101 4102 4103
	}

	dma_free_coherent(&adapter->pdev->dev, flash_cmd.size, flash_cmd.va,
4104
			  flash_cmd.dma);
4105 4106 4107 4108 4109 4110 4111 4112
	if (status) {
		dev_err(&adapter->pdev->dev,
			"Firmware load error. "
			"Status code: 0x%x Additional Status: 0x%x\n",
			status, add_status);
		goto lancer_fw_exit;
	}

4113
	if (change_status == LANCER_FW_RESET_NEEDED) {
4114 4115
		dev_info(&adapter->pdev->dev,
			 "Resetting adapter to activate new FW\n");
4116 4117
		status = lancer_physdev_ctrl(adapter,
					     PHYSDEV_CONTROL_FW_RESET_MASK);
4118 4119 4120 4121 4122 4123 4124
		if (status) {
			dev_err(&adapter->pdev->dev,
				"Adapter busy for FW reset.\n"
				"New FW will not be active.\n");
			goto lancer_fw_exit;
		}
	} else if (change_status != LANCER_NO_RESET_NEEDED) {
4125 4126
		dev_err(&adapter->pdev->dev,
			"System reboot required for new FW to be active\n");
4127 4128
	}

4129 4130 4131 4132 4133
	dev_info(&adapter->pdev->dev, "Firmware flashed successfully\n");
lancer_fw_exit:
	return status;
}

4134 4135
#define UFI_TYPE2		2
#define UFI_TYPE3		3
4136
#define UFI_TYPE3R		10
4137 4138
#define UFI_TYPE4		4
static int be_get_ufi_type(struct be_adapter *adapter,
4139
			   struct flash_file_hdr_g3 *fhdr)
4140
{
K
Kalesh AP 已提交
4141
	if (!fhdr)
4142 4143
		goto be_get_ufi_exit;

4144 4145
	if (skyhawk_chip(adapter) && fhdr->build[0] == '4')
		return UFI_TYPE4;
4146 4147 4148 4149 4150 4151
	else if (BE3_chip(adapter) && fhdr->build[0] == '3') {
		if (fhdr->asic_type_rev == 0x10)
			return UFI_TYPE3R;
		else
			return UFI_TYPE3;
	} else if (BE2_chip(adapter) && fhdr->build[0] == '2')
4152
		return UFI_TYPE2;
4153 4154 4155 4156 4157 4158 4159

be_get_ufi_exit:
	dev_err(&adapter->pdev->dev,
		"UFI and Interface are not compatible for flashing\n");
	return -1;
}

4160 4161 4162 4163 4164 4165
static int be_fw_download(struct be_adapter *adapter, const struct firmware* fw)
{
	struct flash_file_hdr_g3 *fhdr3;
	struct image_hdr *img_hdr_ptr = NULL;
	struct be_dma_mem flash_cmd;
	const u8 *p;
4166
	int status = 0, i = 0, num_imgs = 0, ufi_type = 0;
4167

4168
	flash_cmd.size = sizeof(struct be_cmd_write_flashrom);
I
Ivan Vecera 已提交
4169 4170
	flash_cmd.va = dma_alloc_coherent(&adapter->pdev->dev, flash_cmd.size,
					  &flash_cmd.dma, GFP_KERNEL);
4171 4172
	if (!flash_cmd.va) {
		status = -ENOMEM;
4173
		goto be_fw_exit;
4174 4175
	}

4176
	p = fw->data;
4177
	fhdr3 = (struct flash_file_hdr_g3 *)p;
4178

4179
	ufi_type = be_get_ufi_type(adapter, fhdr3);
4180 4181 4182 4183 4184 4185 4186

	num_imgs = le32_to_cpu(fhdr3->num_imgs);
	for (i = 0; i < num_imgs; i++) {
		img_hdr_ptr = (struct image_hdr *)(fw->data +
				(sizeof(struct flash_file_hdr_g3) +
				 i * sizeof(struct image_hdr)));
		if (le32_to_cpu(img_hdr_ptr->imageid) == 1) {
4187 4188
			switch (ufi_type) {
			case UFI_TYPE4:
4189
				status = be_flash_skyhawk(adapter, fw,
4190
							  &flash_cmd, num_imgs);
4191 4192
				break;
			case UFI_TYPE3R:
4193 4194
				status = be_flash_BEx(adapter, fw, &flash_cmd,
						      num_imgs);
4195 4196 4197 4198 4199 4200 4201 4202
				break;
			case UFI_TYPE3:
				/* Do not flash this ufi on BE3-R cards */
				if (adapter->asic_rev < 0x10)
					status = be_flash_BEx(adapter, fw,
							      &flash_cmd,
							      num_imgs);
				else {
4203
					status = -EINVAL;
4204 4205 4206 4207
					dev_err(&adapter->pdev->dev,
						"Can't load BE3 UFI on BE3R\n");
				}
			}
4208
		}
4209 4210
	}

4211 4212
	if (ufi_type == UFI_TYPE2)
		status = be_flash_BEx(adapter, fw, &flash_cmd, 0);
4213
	else if (ufi_type == -1)
4214
		status = -EINVAL;
4215

I
Ivan Vecera 已提交
4216 4217
	dma_free_coherent(&adapter->pdev->dev, flash_cmd.size, flash_cmd.va,
			  flash_cmd.dma);
4218 4219
	if (status) {
		dev_err(&adapter->pdev->dev, "Firmware load error\n");
4220
		goto be_fw_exit;
4221 4222
	}

4223
	dev_info(&adapter->pdev->dev, "Firmware flashed successfully\n");
4224

4225 4226 4227 4228 4229 4230 4231 4232 4233 4234 4235 4236
be_fw_exit:
	return status;
}

/* Load the firmware file @fw_file and flash it onto the adapter.
 *
 * Flashing is refused with -ENETDOWN while the interface is down. Lancer
 * chips go through lancer_fw_download(), all others through
 * be_fw_download(). After a successful flash the FW version is re-read with
 * be_cmd_get_fw_ver().
 *
 * Returns 0 on success, otherwise the request_firmware() or download status.
 */
int be_load_fw(struct be_adapter *adapter, u8 *fw_file)
{
	struct device *dev = &adapter->pdev->dev;
	const struct firmware *fw;
	int status;

	if (!netif_running(adapter->netdev)) {
		dev_err(dev,
			"Firmware load not allowed (interface is down)\n");
		return -ENETDOWN;
	}

	status = request_firmware(&fw, fw_file, dev);
	if (!status) {
		dev_info(dev, "Flashing firmware file %s\n", fw_file);

		status = lancer_chip(adapter) ?
				lancer_fw_download(adapter, fw) :
				be_fw_download(adapter, fw);

		if (!status)
			be_cmd_get_fw_ver(adapter);
	}

	release_firmware(fw);
	return status;
}

4259
static int be_ndo_bridge_setlink(struct net_device *dev, struct nlmsghdr *nlh)
4260 4261 4262 4263 4264 4265 4266 4267 4268 4269 4270 4271 4272 4273 4274 4275 4276 4277 4278 4279 4280 4281 4282 4283 4284 4285 4286 4287 4288 4289 4290 4291 4292 4293 4294 4295 4296 4297 4298 4299 4300
{
	struct be_adapter *adapter = netdev_priv(dev);
	struct nlattr *attr, *br_spec;
	int rem;
	int status = 0;
	u16 mode = 0;

	if (!sriov_enabled(adapter))
		return -EOPNOTSUPP;

	br_spec = nlmsg_find_attr(nlh, sizeof(struct ifinfomsg), IFLA_AF_SPEC);

	nla_for_each_nested(attr, br_spec, rem) {
		if (nla_type(attr) != IFLA_BRIDGE_MODE)
			continue;

		mode = nla_get_u16(attr);
		if (mode != BRIDGE_MODE_VEPA && mode != BRIDGE_MODE_VEB)
			return -EINVAL;

		status = be_cmd_set_hsw_config(adapter, 0, 0,
					       adapter->if_handle,
					       mode == BRIDGE_MODE_VEPA ?
					       PORT_FWD_TYPE_VEPA :
					       PORT_FWD_TYPE_VEB);
		if (status)
			goto err;

		dev_info(&adapter->pdev->dev, "enabled switch mode: %s\n",
			 mode == BRIDGE_MODE_VEPA ? "VEPA" : "VEB");

		return status;
	}
err:
	dev_err(&adapter->pdev->dev, "Failed to set switch mode %s\n",
		mode == BRIDGE_MODE_VEPA ? "VEPA" : "VEB");

	return status;
}

/* ndo_bridge_getlink handler: report the embedded switch forwarding mode.
 *
 * Returns 0 without reporting anything when SR-IOV is disabled or the mode
 * query fails; otherwise returns the ndo_dflt_bridge_getlink() result.
 */
static int be_ndo_bridge_getlink(struct sk_buff *skb, u32 pid, u32 seq,
				 struct net_device *dev, u32 filter_mask)
{
	struct be_adapter *adapter = netdev_priv(dev);
	u8 hsw_mode;

	if (!sriov_enabled(adapter))
		return 0;

	if (!BEx_chip(adapter) && !lancer_chip(adapter)) {
		/* Other chips: ask the FW for the current mode */
		if (be_cmd_get_hsw_config(adapter, NULL, 0,
					  adapter->if_handle, &hsw_mode))
			return 0;
	} else {
		/* BE and Lancer chips support VEB mode only */
		hsw_mode = PORT_FWD_TYPE_VEB;
	}

	if (hsw_mode == PORT_FWD_TYPE_VEPA)
		return ndo_dflt_bridge_getlink(skb, pid, seq, dev,
					       BRIDGE_MODE_VEPA);

	return ndo_dflt_bridge_getlink(skb, pid, seq, dev, BRIDGE_MODE_VEB);
}

4325
#ifdef CONFIG_BE2NET_VXLAN
4326 4327 4328 4329 4330 4331 4332 4333 4334 4335 4336 4337 4338 4339 4340 4341 4342 4343 4344 4345 4346 4347 4348 4349 4350 4351 4352 4353 4354 4355 4356 4357 4358 4359 4360 4361 4362 4363 4364 4365 4366 4367 4368 4369 4370 4371 4372 4373 4374 4375 4376 4377 4378 4379 4380 4381 4382 4383
/* ndo_add_vxlan_port handler: enable VxLAN offloads for UDP port @port.
 *
 * Does nothing on Lancer and BEx chips. Only one port can be offloaded; a
 * request made while offloads are already enabled is rejected with a
 * warning. If either FW command fails, be_disable_vxlan_offloads() is
 * called to undo the setup.
 */
static void be_add_vxlan_port(struct net_device *netdev, sa_family_t sa_family,
			      __be16 port)
{
	struct be_adapter *adapter = netdev_priv(netdev);
	struct device *dev = &adapter->pdev->dev;

	if (lancer_chip(adapter) || BEx_chip(adapter))
		return;

	if (adapter->flags & BE_FLAGS_VXLAN_OFFLOADS) {
		dev_warn(dev, "Cannot add UDP port %d for VxLAN offloads\n",
			 be16_to_cpu(port));
		dev_info(dev,
			 "Only one UDP port supported for VxLAN offloads\n");
		return;
	}

	if (be_cmd_manage_iface(adapter, adapter->if_handle,
				OP_CONVERT_NORMAL_TO_TUNNEL)) {
		dev_warn(dev, "Failed to convert normal interface to tunnel\n");
		be_disable_vxlan_offloads(adapter);
		return;
	}

	if (be_cmd_set_vxlan_port(adapter, port)) {
		dev_warn(dev, "Failed to add VxLAN port\n");
		be_disable_vxlan_offloads(adapter);
		return;
	}

	adapter->flags |= BE_FLAGS_VXLAN_OFFLOADS;
	adapter->vxlan_port = port;

	dev_info(dev, "Enabled VxLAN offloads for UDP port %d\n",
		 be16_to_cpu(port));
}

/* ndo_del_vxlan_port handler: disable VxLAN offloads for UDP port @port.
 *
 * Ignored on Lancer and BEx chips, and when @port is not the port recorded
 * in adapter->vxlan_port.
 */
static void be_del_vxlan_port(struct net_device *netdev, sa_family_t sa_family,
			      __be16 port)
{
	struct be_adapter *adapter = netdev_priv(netdev);

	if (lancer_chip(adapter) || BEx_chip(adapter) ||
	    adapter->vxlan_port != port)
		return;

	be_disable_vxlan_offloads(adapter);

	dev_info(&adapter->pdev->dev,
		 "Disabled VxLAN offloads for UDP port %d\n",
		 be16_to_cpu(port));
}
4384
#endif
4385

4386
static const struct net_device_ops be_netdev_ops = {
S
Sathya Perla 已提交
4387 4388 4389
	.ndo_open		= be_open,
	.ndo_stop		= be_close,
	.ndo_start_xmit		= be_xmit,
4390
	.ndo_set_rx_mode	= be_set_rx_mode,
S
Sathya Perla 已提交
4391 4392
	.ndo_set_mac_address	= be_mac_addr_set,
	.ndo_change_mtu		= be_change_mtu,
4393
	.ndo_get_stats64	= be_get_stats64,
S
Sathya Perla 已提交
4394 4395 4396
	.ndo_validate_addr	= eth_validate_addr,
	.ndo_vlan_rx_add_vid	= be_vlan_add_vid,
	.ndo_vlan_rx_kill_vid	= be_vlan_rem_vid,
4397
	.ndo_set_vf_mac		= be_set_vf_mac,
4398
	.ndo_set_vf_vlan	= be_set_vf_vlan,
4399
	.ndo_set_vf_rate	= be_set_vf_tx_rate,
I
Ivan Vecera 已提交
4400
	.ndo_get_vf_config	= be_get_vf_config,
4401
	.ndo_set_vf_link_state  = be_set_vf_link_state,
I
Ivan Vecera 已提交
4402 4403 4404
#ifdef CONFIG_NET_POLL_CONTROLLER
	.ndo_poll_controller	= be_netpoll,
#endif
4405 4406
	.ndo_bridge_setlink	= be_ndo_bridge_setlink,
	.ndo_bridge_getlink	= be_ndo_bridge_getlink,
4407
#ifdef CONFIG_NET_RX_BUSY_POLL
4408
	.ndo_busy_poll		= be_busy_poll,
4409
#endif
4410
#ifdef CONFIG_BE2NET_VXLAN
4411 4412
	.ndo_add_vxlan_port	= be_add_vxlan_port,
	.ndo_del_vxlan_port	= be_del_vxlan_port,
4413
#endif
S
Sathya Perla 已提交
4414 4415 4416 4417 4418 4419
};

static void be_netdev_init(struct net_device *netdev)
{
	struct be_adapter *adapter = netdev_priv(netdev);

4420 4421 4422 4423 4424 4425
	if (skyhawk_chip(adapter)) {
		netdev->hw_enc_features |= NETIF_F_IP_CSUM | NETIF_F_IPV6_CSUM |
					   NETIF_F_TSO | NETIF_F_TSO6 |
					   NETIF_F_GSO_UDP_TUNNEL;
		netdev->hw_features |= NETIF_F_GSO_UDP_TUNNEL;
	}
4426
	netdev->hw_features |= NETIF_F_SG | NETIF_F_TSO | NETIF_F_TSO6 |
4427
		NETIF_F_IP_CSUM | NETIF_F_IPV6_CSUM | NETIF_F_RXCSUM |
4428
		NETIF_F_HW_VLAN_CTAG_TX;
4429 4430
	if (be_multi_rxq(adapter))
		netdev->hw_features |= NETIF_F_RXHASH;
4431 4432

	netdev->features |= netdev->hw_features |
4433
		NETIF_F_HW_VLAN_CTAG_RX | NETIF_F_HW_VLAN_CTAG_FILTER;
A
Ajit Khaparde 已提交
4434

4435
	netdev->vlan_features |= NETIF_F_SG | NETIF_F_TSO | NETIF_F_TSO6 |
4436
		NETIF_F_IP_CSUM | NETIF_F_IPV6_CSUM;
4437

4438 4439
	netdev->priv_flags |= IFF_UNICAST_FLT;

S
Sathya Perla 已提交
4440 4441
	netdev->flags |= IFF_MULTICAST;

4442
	netif_set_gso_max_size(netdev, 65535 - ETH_HLEN);
4443

S
Sathya Perla 已提交
4444
	netdev->netdev_ops = &be_netdev_ops;
S
Sathya Perla 已提交
4445

4446
	netdev->ethtool_ops = &be_ethtool_ops;
S
Sathya Perla 已提交
4447 4448 4449 4450
}

static void be_unmap_pci_bars(struct be_adapter *adapter)
{
4451 4452
	if (adapter->csr)
		pci_iounmap(adapter->pdev, adapter->csr);
4453
	if (adapter->db)
S
Sathya Perla 已提交
4454
		pci_iounmap(adapter->pdev, adapter->db);
4455 4456
}

S
Sathya Perla 已提交
4457 4458 4459 4460 4461 4462 4463 4464 4465
/* Doorbell BAR number: 0 on Lancer chips and on VFs, 4 otherwise. */
static int db_bar(struct be_adapter *adapter)
{
	return (lancer_chip(adapter) || !be_physfn(adapter)) ? 0 : 4;
}

static int be_roce_map_pci_bars(struct be_adapter *adapter)
4466
{
S
Sathya Perla 已提交
4467
	if (skyhawk_chip(adapter)) {
S
Sathya Perla 已提交
4468 4469 4470 4471 4472 4473
		adapter->roce_db.size = 4096;
		adapter->roce_db.io_addr = pci_resource_start(adapter->pdev,
							      db_bar(adapter));
		adapter->roce_db.total_size = pci_resource_len(adapter->pdev,
							       db_bar(adapter));
	}
4474
	return 0;
S
Sathya Perla 已提交
4475 4476 4477 4478 4479
}

static int be_map_pci_bars(struct be_adapter *adapter)
{
	u8 __iomem *addr;
4480

4481 4482
	if (BEx_chip(adapter) && be_physfn(adapter)) {
		adapter->csr = pci_iomap(adapter->pdev, 2, 0);
K
Kalesh AP 已提交
4483
		if (!adapter->csr)
4484 4485 4486
			return -ENOMEM;
	}

S
Sathya Perla 已提交
4487
	addr = pci_iomap(adapter->pdev, db_bar(adapter), 0);
K
Kalesh AP 已提交
4488
	if (!addr)
S
Sathya Perla 已提交
4489
		goto pci_map_err;
4490
	adapter->db = addr;
S
Sathya Perla 已提交
4491 4492

	be_roce_map_pci_bars(adapter);
S
Sathya Perla 已提交
4493
	return 0;
S
Sathya Perla 已提交
4494

S
Sathya Perla 已提交
4495 4496 4497 4498 4499 4500 4501
pci_map_err:
	be_unmap_pci_bars(adapter);
	return -ENOMEM;
}

static void be_ctrl_cleanup(struct be_adapter *adapter)
{
4502
	struct be_dma_mem *mem = &adapter->mbox_mem_alloced;
S
Sathya Perla 已提交
4503 4504 4505 4506

	be_unmap_pci_bars(adapter);

	if (mem->va)
I
Ivan Vecera 已提交
4507 4508
		dma_free_coherent(&adapter->pdev->dev, mem->size, mem->va,
				  mem->dma);
4509

4510
	mem = &adapter->rx_filter;
4511
	if (mem->va)
I
Ivan Vecera 已提交
4512 4513
		dma_free_coherent(&adapter->pdev->dev, mem->size, mem->va,
				  mem->dma);
S
Sathya Perla 已提交
4514 4515 4516 4517
}

static int be_ctrl_init(struct be_adapter *adapter)
{
4518 4519
	struct be_dma_mem *mbox_mem_alloc = &adapter->mbox_mem_alloced;
	struct be_dma_mem *mbox_mem_align = &adapter->mbox_mem;
4520
	struct be_dma_mem *rx_filter = &adapter->rx_filter;
S
Sathya Perla 已提交
4521
	u32 sli_intf;
S
Sathya Perla 已提交
4522 4523
	int status;

S
Sathya Perla 已提交
4524 4525 4526 4527 4528
	pci_read_config_dword(adapter->pdev, SLI_INTF_REG_OFFSET, &sli_intf);
	adapter->sli_family = (sli_intf & SLI_INTF_FAMILY_MASK) >>
				 SLI_INTF_FAMILY_SHIFT;
	adapter->virtfn = (sli_intf & SLI_INTF_FT_MASK) ? 1 : 0;

S
Sathya Perla 已提交
4529 4530
	status = be_map_pci_bars(adapter);
	if (status)
4531
		goto done;
S
Sathya Perla 已提交
4532 4533

	mbox_mem_alloc->size = sizeof(struct be_mcc_mailbox) + 16;
I
Ivan Vecera 已提交
4534 4535 4536 4537
	mbox_mem_alloc->va = dma_alloc_coherent(&adapter->pdev->dev,
						mbox_mem_alloc->size,
						&mbox_mem_alloc->dma,
						GFP_KERNEL);
S
Sathya Perla 已提交
4538
	if (!mbox_mem_alloc->va) {
4539 4540
		status = -ENOMEM;
		goto unmap_pci_bars;
S
Sathya Perla 已提交
4541 4542 4543 4544 4545
	}
	mbox_mem_align->size = sizeof(struct be_mcc_mailbox);
	mbox_mem_align->va = PTR_ALIGN(mbox_mem_alloc->va, 16);
	mbox_mem_align->dma = PTR_ALIGN(mbox_mem_alloc->dma, 16);
	memset(mbox_mem_align->va, 0, sizeof(struct be_mcc_mailbox));
4546

4547
	rx_filter->size = sizeof(struct be_cmd_req_rx_filter);
4548 4549 4550
	rx_filter->va = dma_zalloc_coherent(&adapter->pdev->dev,
					    rx_filter->size, &rx_filter->dma,
					    GFP_KERNEL);
K
Kalesh AP 已提交
4551
	if (!rx_filter->va) {
4552 4553 4554
		status = -ENOMEM;
		goto free_mbox;
	}
4555

4556
	mutex_init(&adapter->mbox_lock);
4557 4558
	spin_lock_init(&adapter->mcc_lock);
	spin_lock_init(&adapter->mcc_cq_lock);
4559

4560
	init_completion(&adapter->et_cmd_compl);
4561
	pci_save_state(adapter->pdev);
S
Sathya Perla 已提交
4562
	return 0;
4563 4564

free_mbox:
I
Ivan Vecera 已提交
4565 4566
	dma_free_coherent(&adapter->pdev->dev, mbox_mem_alloc->size,
			  mbox_mem_alloc->va, mbox_mem_alloc->dma);
4567 4568 4569 4570 4571 4572

unmap_pci_bars:
	be_unmap_pci_bars(adapter);

done:
	return status;
S
Sathya Perla 已提交
4573 4574 4575 4576
}

static void be_stats_cleanup(struct be_adapter *adapter)
{
4577
	struct be_dma_mem *cmd = &adapter->stats_cmd;
S
Sathya Perla 已提交
4578 4579

	if (cmd->va)
I
Ivan Vecera 已提交
4580 4581
		dma_free_coherent(&adapter->pdev->dev, cmd->size,
				  cmd->va, cmd->dma);
S
Sathya Perla 已提交
4582 4583 4584 4585
}

static int be_stats_init(struct be_adapter *adapter)
{
4586
	struct be_dma_mem *cmd = &adapter->stats_cmd;
S
Sathya Perla 已提交
4587

4588 4589 4590
	if (lancer_chip(adapter))
		cmd->size = sizeof(struct lancer_cmd_req_pport_stats);
	else if (BE2_chip(adapter))
4591
		cmd->size = sizeof(struct be_cmd_req_get_stats_v0);
4592
	else if (BE3_chip(adapter))
4593
		cmd->size = sizeof(struct be_cmd_req_get_stats_v1);
4594 4595 4596
	else
		/* ALL non-BE ASICs */
		cmd->size = sizeof(struct be_cmd_req_get_stats_v2);
4597

4598 4599
	cmd->va = dma_zalloc_coherent(&adapter->pdev->dev, cmd->size, &cmd->dma,
				      GFP_KERNEL);
K
Kalesh AP 已提交
4600
	if (!cmd->va)
4601
		return -ENOMEM;
S
Sathya Perla 已提交
4602 4603 4604
	return 0;
}

B
Bill Pemberton 已提交
4605
static void be_remove(struct pci_dev *pdev)
S
Sathya Perla 已提交
4606 4607
{
	struct be_adapter *adapter = pci_get_drvdata(pdev);
4608

S
Sathya Perla 已提交
4609 4610 4611
	if (!adapter)
		return;

4612
	be_roce_dev_remove(adapter);
4613
	be_intr_set(adapter, false);
4614

4615 4616
	cancel_delayed_work_sync(&adapter->func_recovery_work);

S
Sathya Perla 已提交
4617 4618
	unregister_netdev(adapter->netdev);

4619 4620
	be_clear(adapter);

4621 4622 4623
	/* tell fw we're done with firing cmds */
	be_cmd_fw_clean(adapter);

S
Sathya Perla 已提交
4624 4625 4626 4627
	be_stats_cleanup(adapter);

	be_ctrl_cleanup(adapter);

S
Sathya Perla 已提交
4628 4629
	pci_disable_pcie_error_reporting(pdev);

S
Sathya Perla 已提交
4630 4631 4632 4633 4634 4635
	pci_release_regions(pdev);
	pci_disable_device(pdev);

	free_netdev(adapter->netdev);
}

4636
static int be_get_initial_config(struct be_adapter *adapter)
S
Sathya Perla 已提交
4637
{
4638
	int status, level;
S
Sathya Perla 已提交
4639

4640 4641 4642 4643
	status = be_cmd_get_cntl_attributes(adapter);
	if (status)
		return status;

4644 4645 4646
	/* Must be a power of 2 or else MODULO will BUG_ON */
	adapter->be_get_temp_freq = 64;

4647 4648 4649 4650 4651
	if (BEx_chip(adapter)) {
		level = be_cmd_get_fw_log_level(adapter);
		adapter->msg_enable =
			level <= FW_LOG_LEVEL_DEFAULT ? NETIF_MSG_HW : 0;
	}
4652

4653
	adapter->cfg_num_qs = netif_get_num_default_rss_queues();
4654
	return 0;
S
Sathya Perla 已提交
4655 4656
}

4657
static int lancer_recover_func(struct be_adapter *adapter)
4658
{
4659
	struct device *dev = &adapter->pdev->dev;
4660 4661
	int status;

4662 4663 4664
	status = lancer_test_and_set_rdy_state(adapter);
	if (status)
		goto err;
4665

4666 4667
	if (netif_running(adapter->netdev))
		be_close(adapter->netdev);
4668

4669 4670
	be_clear(adapter);

4671
	be_clear_all_error(adapter);
4672 4673 4674 4675

	status = be_setup(adapter);
	if (status)
		goto err;
4676

4677 4678
	if (netif_running(adapter->netdev)) {
		status = be_open(adapter->netdev);
4679 4680
		if (status)
			goto err;
4681
	}
4682

4683
	dev_err(dev, "Adapter recovery successful\n");
4684 4685
	return 0;
err:
4686 4687 4688
	if (status == -EAGAIN)
		dev_err(dev, "Waiting for resource provisioning\n");
	else
4689
		dev_err(dev, "Adapter recovery failed\n");
4690

4691 4692 4693 4694 4695 4696 4697
	return status;
}

static void be_func_recovery_task(struct work_struct *work)
{
	struct be_adapter *adapter =
		container_of(work, struct be_adapter,  func_recovery_work.work);
4698
	int status = 0;
4699

4700
	be_detect_error(adapter);
4701

4702
	if (adapter->hw_error && lancer_chip(adapter)) {
4703

4704 4705 4706
		rtnl_lock();
		netif_device_detach(adapter->netdev);
		rtnl_unlock();
4707

4708 4709 4710
		status = lancer_recover_func(adapter);
		if (!status)
			netif_device_attach(adapter->netdev);
4711
	}
4712

4713 4714 4715 4716 4717 4718
	/* In Lancer, for all errors other than provisioning error (-EAGAIN),
	 * no need to attempt further recovery.
	 */
	if (!status || status == -EAGAIN)
		schedule_delayed_work(&adapter->func_recovery_work,
				      msecs_to_jiffies(1000));
4719 4720 4721 4722 4723 4724 4725 4726 4727 4728 4729 4730
}

static void be_worker(struct work_struct *work)
{
	struct be_adapter *adapter =
		container_of(work, struct be_adapter, work.work);
	struct be_rx_obj *rxo;
	int i;

	/* when interrupts are not yet enabled, just reap any pending
	* mcc completions */
	if (!netif_running(adapter->netdev)) {
4731
		local_bh_disable();
S
Sathya Perla 已提交
4732
		be_process_mcc(adapter);
4733
		local_bh_enable();
4734 4735 4736 4737 4738 4739 4740 4741 4742 4743 4744
		goto reschedule;
	}

	if (!adapter->stats_cmd_sent) {
		if (lancer_chip(adapter))
			lancer_cmd_get_pport_stats(adapter,
						&adapter->stats_cmd);
		else
			be_cmd_get_stats(adapter, &adapter->stats_cmd);
	}

4745 4746
	if (be_physfn(adapter) &&
	    MODULO(adapter->work_counter, adapter->be_get_temp_freq) == 0)
4747 4748
		be_cmd_get_die_temperature(adapter);

4749
	for_all_rx_queues(adapter, rxo, i) {
4750 4751 4752 4753
		/* Replenish RX-queues starved due to memory
		 * allocation failures.
		 */
		if (rxo->rx_post_starved)
4754 4755 4756
			be_post_rx_frags(rxo, GFP_KERNEL);
	}

4757
	be_eqd_update(adapter);
S
Sathya Perla 已提交
4758

4759 4760 4761 4762 4763
reschedule:
	adapter->work_counter++;
	schedule_delayed_work(&adapter->work, msecs_to_jiffies(1000));
}

4764
/* If any VFs are already enabled don't FLR the PF */
4765 4766
static bool be_reset_required(struct be_adapter *adapter)
{
4767
	return pci_num_vf(adapter->pdev) ? false : true;
4768 4769
}

S
Sathya Perla 已提交
4770 4771
/* Map the adapter's multi-channel type to a printable name.
 * Returns an empty string for any type not listed below.
 */
static char *mc_name(struct be_adapter *adapter)
{
	switch (adapter->mc_type) {
	case UMC:
		return "UMC";
	case FLEX10:
		return "FLEX10";
	case vNIC1:
		return "vNIC-1";
	case nPAR:
		return "nPAR";
	case UFP:
		return "UFP";
	case vNIC2:
		return "vNIC-2";
	default:
		return "";
	}
}

/* Printable PCI function kind: "PF" for a physical function, else "VF". */
static inline char *func_name(struct be_adapter *adapter)
{
	if (be_physfn(adapter))
		return "PF";

	return "VF";
}

4805
static int be_probe(struct pci_dev *pdev, const struct pci_device_id *pdev_id)
S
Sathya Perla 已提交
4806 4807 4808 4809
{
	int status = 0;
	struct be_adapter *adapter;
	struct net_device *netdev;
4810
	char port_name;
S
Sathya Perla 已提交
4811 4812 4813 4814 4815 4816 4817 4818 4819 4820

	status = pci_enable_device(pdev);
	if (status)
		goto do_none;

	status = pci_request_regions(pdev, DRV_NAME);
	if (status)
		goto disable_dev;
	pci_set_master(pdev);

4821
	netdev = alloc_etherdev_mqs(sizeof(*adapter), MAX_TX_QS, MAX_RX_QS);
K
Kalesh AP 已提交
4822
	if (!netdev) {
S
Sathya Perla 已提交
4823 4824 4825 4826 4827 4828 4829
		status = -ENOMEM;
		goto rel_reg;
	}
	adapter = netdev_priv(netdev);
	adapter->pdev = pdev;
	pci_set_drvdata(pdev, adapter);
	adapter->netdev = netdev;
4830
	SET_NETDEV_DEV(netdev, &pdev->dev);
S
Sathya Perla 已提交
4831

4832
	status = dma_set_mask_and_coherent(&pdev->dev, DMA_BIT_MASK(64));
S
Sathya Perla 已提交
4833 4834 4835
	if (!status) {
		netdev->features |= NETIF_F_HIGHDMA;
	} else {
4836
		status = dma_set_mask_and_coherent(&pdev->dev, DMA_BIT_MASK(32));
S
Sathya Perla 已提交
4837 4838 4839 4840 4841 4842
		if (status) {
			dev_err(&pdev->dev, "Could not set PCI DMA Mask\n");
			goto free_netdev;
		}
	}

4843 4844 4845 4846 4847
	if (be_physfn(adapter)) {
		status = pci_enable_pcie_error_reporting(pdev);
		if (!status)
			dev_info(&pdev->dev, "PCIe error reporting enabled\n");
	}
S
Sathya Perla 已提交
4848

S
Sathya Perla 已提交
4849 4850
	status = be_ctrl_init(adapter);
	if (status)
4851
		goto free_netdev;
S
Sathya Perla 已提交
4852

4853
	/* sync up with fw's ready state */
4854
	if (be_physfn(adapter)) {
4855
		status = be_fw_wait_ready(adapter);
4856 4857 4858
		if (status)
			goto ctrl_clean;
	}
S
Sathya Perla 已提交
4859

4860 4861 4862 4863
	if (be_reset_required(adapter)) {
		status = be_cmd_reset_function(adapter);
		if (status)
			goto ctrl_clean;
4864

4865 4866 4867
		/* Wait for interrupts to quiesce after an FLR */
		msleep(100);
	}
4868 4869 4870

	/* Allow interrupts for other ULPs running on NIC function */
	be_intr_set(adapter, true);
S
Sathya Perla 已提交
4871

4872 4873 4874 4875 4876
	/* tell fw we're ready to fire cmds */
	status = be_cmd_fw_init(adapter);
	if (status)
		goto ctrl_clean;

4877 4878 4879 4880
	status = be_stats_init(adapter);
	if (status)
		goto ctrl_clean;

4881
	status = be_get_initial_config(adapter);
S
Sathya Perla 已提交
4882 4883 4884 4885
	if (status)
		goto stats_clean;

	INIT_DELAYED_WORK(&adapter->work, be_worker);
4886
	INIT_DELAYED_WORK(&adapter->func_recovery_work, be_func_recovery_task);
4887
	adapter->rx_fc = adapter->tx_fc = true;
S
Sathya Perla 已提交
4888

4889 4890
	status = be_setup(adapter);
	if (status)
4891
		goto stats_clean;
4892

4893
	be_netdev_init(netdev);
S
Sathya Perla 已提交
4894 4895
	status = register_netdev(netdev);
	if (status != 0)
4896
		goto unsetup;
S
Sathya Perla 已提交
4897

4898 4899
	be_roce_dev_add(adapter);

4900 4901
	schedule_delayed_work(&adapter->func_recovery_work,
			      msecs_to_jiffies(1000));
4902 4903 4904

	be_cmd_query_port_name(adapter, &port_name);

S
Sathya Perla 已提交
4905 4906
	dev_info(&pdev->dev, "%s: %s %s port %c\n", nic_name(pdev),
		 func_name(adapter), mc_name(adapter), port_name);
4907

S
Sathya Perla 已提交
4908 4909
	return 0;

4910 4911
unsetup:
	be_clear(adapter);
S
Sathya Perla 已提交
4912 4913 4914 4915
stats_clean:
	be_stats_cleanup(adapter);
ctrl_clean:
	be_ctrl_cleanup(adapter);
4916
free_netdev:
4917
	free_netdev(netdev);
S
Sathya Perla 已提交
4918 4919 4920 4921 4922
rel_reg:
	pci_release_regions(pdev);
disable_dev:
	pci_disable_device(pdev);
do_none:
4923
	dev_err(&pdev->dev, "%s initialization failed\n", nic_name(pdev));
S
Sathya Perla 已提交
4924 4925 4926 4927 4928 4929 4930 4931
	return status;
}

/* Legacy PCI suspend callback.
 *
 * Arms wake-on-LAN if enabled, disables interrupts, stops the recovery
 * work, closes and clears the adapter, then saves PCI state and puts the
 * device into the power state chosen for @state. Always returns 0.
 */
static int be_suspend(struct pci_dev *pdev, pm_message_t state)
{
	struct be_adapter *adapter = pci_get_drvdata(pdev);
	struct net_device *ndev = adapter->netdev;

	if (adapter->wol_en)
		be_setup_wol(adapter, true);

	be_intr_set(adapter, false);
	cancel_delayed_work_sync(&adapter->func_recovery_work);

	netif_device_detach(ndev);
	if (netif_running(ndev)) {
		rtnl_lock();
		be_close(ndev);
		rtnl_unlock();
	}
	be_clear(adapter);

	pci_save_state(pdev);
	pci_disable_device(pdev);
	pci_set_power_state(pdev, pci_choose_state(pdev, state));

	return 0;
}

static int be_resume(struct pci_dev *pdev)
{
	int status = 0;
	struct be_adapter *adapter = pci_get_drvdata(pdev);
	struct net_device *netdev =  adapter->netdev;

	netif_device_detach(netdev);

	status = pci_enable_device(pdev);
	if (status)
		return status;

4964
	pci_set_power_state(pdev, PCI_D0);
S
Sathya Perla 已提交
4965 4966
	pci_restore_state(pdev);

4967 4968 4969 4970
	status = be_fw_wait_ready(adapter);
	if (status)
		return status;

4971
	be_intr_set(adapter, true);
4972 4973 4974 4975 4976
	/* tell fw we're ready to fire cmds */
	status = be_cmd_fw_init(adapter);
	if (status)
		return status;

4977
	be_setup(adapter);
S
Sathya Perla 已提交
4978 4979 4980 4981 4982
	if (netif_running(netdev)) {
		rtnl_lock();
		be_open(netdev);
		rtnl_unlock();
	}
4983 4984 4985

	schedule_delayed_work(&adapter->func_recovery_work,
			      msecs_to_jiffies(1000));
S
Sathya Perla 已提交
4986
	netif_device_attach(netdev);
4987

S
Suresh Reddy 已提交
4988
	if (adapter->wol_en)
4989
		be_setup_wol(adapter, false);
4990

S
Sathya Perla 已提交
4991 4992 4993
	return 0;
}

4994 4995 4996 4997 4998 4999 5000
/*
 * An FLR will stop BE from DMAing any data.
 */
static void be_shutdown(struct pci_dev *pdev)
{
	struct be_adapter *adapter = pci_get_drvdata(pdev);

5001 5002
	if (!adapter)
		return;
5003

5004
	cancel_delayed_work_sync(&adapter->work);
5005
	cancel_delayed_work_sync(&adapter->func_recovery_work);
5006

5007
	netif_device_detach(adapter->netdev);
5008

5009 5010
	be_cmd_reset_function(adapter);

5011 5012 5013
	pci_disable_device(pdev);
}

5014
static pci_ers_result_t be_eeh_err_detected(struct pci_dev *pdev,
5015
					    pci_channel_state_t state)
5016 5017 5018 5019 5020 5021
{
	struct be_adapter *adapter = pci_get_drvdata(pdev);
	struct net_device *netdev =  adapter->netdev;

	dev_err(&adapter->pdev->dev, "EEH error detected\n");

5022 5023
	if (!adapter->eeh_error) {
		adapter->eeh_error = true;
5024

5025
		cancel_delayed_work_sync(&adapter->func_recovery_work);
5026 5027

		rtnl_lock();
5028 5029 5030
		netif_device_detach(netdev);
		if (netif_running(netdev))
			be_close(netdev);
5031
		rtnl_unlock();
5032 5033

		be_clear(adapter);
5034 5035 5036 5037 5038 5039 5040
	}

	if (state == pci_channel_io_perm_failure)
		return PCI_ERS_RESULT_DISCONNECT;

	pci_disable_device(pdev);

5041 5042
	/* The error could cause the FW to trigger a flash debug dump.
	 * Resetting the card while flash dump is in progress
5043 5044 5045
	 * can cause it not to recover; wait for it to finish.
	 * Wait only for first function as it is needed only once per
	 * adapter.
5046
	 */
5047 5048 5049
	if (pdev->devfn == 0)
		ssleep(30);

5050 5051 5052 5053 5054 5055 5056 5057 5058 5059 5060 5061 5062 5063 5064
	return PCI_ERS_RESULT_NEED_RESET;
}

static pci_ers_result_t be_eeh_reset(struct pci_dev *pdev)
{
	struct be_adapter *adapter = pci_get_drvdata(pdev);
	int status;

	dev_info(&adapter->pdev->dev, "EEH reset\n");

	status = pci_enable_device(pdev);
	if (status)
		return PCI_ERS_RESULT_DISCONNECT;

	pci_set_master(pdev);
5065
	pci_set_power_state(pdev, PCI_D0);
5066 5067 5068
	pci_restore_state(pdev);

	/* Check if card is ok and fw is ready */
5069 5070
	dev_info(&adapter->pdev->dev,
		 "Waiting for FW to be ready after EEH reset\n");
5071
	status = be_fw_wait_ready(adapter);
5072 5073 5074
	if (status)
		return PCI_ERS_RESULT_DISCONNECT;

S
Sathya Perla 已提交
5075
	pci_cleanup_aer_uncorrect_error_status(pdev);
5076
	be_clear_all_error(adapter);
5077 5078 5079 5080 5081 5082 5083 5084 5085 5086 5087 5088 5089
	return PCI_ERS_RESULT_RECOVERED;
}

static void be_eeh_resume(struct pci_dev *pdev)
{
	int status = 0;
	struct be_adapter *adapter = pci_get_drvdata(pdev);
	struct net_device *netdev =  adapter->netdev;

	dev_info(&adapter->pdev->dev, "EEH resume\n");

	pci_save_state(pdev);

5090
	status = be_cmd_reset_function(adapter);
5091 5092 5093
	if (status)
		goto err;

5094 5095 5096 5097 5098 5099
	/* On some BE3 FW versions, after a HW reset,
	 * interrupts will remain disabled for each function.
	 * So, explicitly enable interrupts
	 */
	be_intr_set(adapter, true);

5100 5101
	/* tell fw we're ready to fire cmds */
	status = be_cmd_fw_init(adapter);
5102 5103 5104
	if (status)
		goto err;

5105 5106 5107 5108 5109 5110 5111 5112 5113
	status = be_setup(adapter);
	if (status)
		goto err;

	if (netif_running(netdev)) {
		status = be_open(netdev);
		if (status)
			goto err;
	}
5114 5115 5116

	schedule_delayed_work(&adapter->func_recovery_work,
			      msecs_to_jiffies(1000));
5117 5118 5119 5120 5121 5122
	netif_device_attach(netdev);
	return;
err:
	dev_err(&adapter->pdev->dev, "EEH resume failed\n");
}

5123
static const struct pci_error_handlers be_eeh_handlers = {
5124 5125 5126 5127 5128
	.error_detected = be_eeh_err_detected,
	.slot_reset = be_eeh_reset,
	.resume = be_eeh_resume,
};

S
Sathya Perla 已提交
5129 5130 5131 5132 5133 5134
static struct pci_driver be_driver = {
	.name = DRV_NAME,
	.id_table = be_dev_ids,
	.probe = be_probe,
	.remove = be_remove,
	.suspend = be_suspend,
5135
	.resume = be_resume,
5136
	.shutdown = be_shutdown,
5137
	.err_handler = &be_eeh_handlers
S
Sathya Perla 已提交
5138 5139 5140 5141
};

/* Module entry point: sanitises the rx_frag_size module parameter (only
 * 2048, 4096 and 8192 are accepted; anything else falls back to 2048 with
 * a warning) and registers the PCI driver.
 */
static int __init be_init_module(void)
{
	switch (rx_frag_size) {
	case 2048:
	case 4096:
	case 8192:
		break;
	default:
		printk(KERN_WARNING DRV_NAME
			" : Module param rx_frag_size must be 2048/4096/8192."
			" Using 2048\n");
		rx_frag_size = 2048;
		break;
	}

	return pci_register_driver(&be_driver);
}
module_init(be_init_module);

/* Module exit point: unregisters the PCI driver registered at init. */
static void __exit be_exit_module(void)
{
	pci_unregister_driver(&be_driver);
}
module_exit(be_exit_module);