be_main.c 154.5 KB
Newer Older
S
Sathya Perla 已提交
1
/*
2
 * Copyright (C) 2005 - 2015 Emulex
S
Sathya Perla 已提交
3 4 5 6 7 8 9 10
 * All rights reserved.
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License version 2
 * as published by the Free Software Foundation.  The full GNU General
 * Public License is included in this distribution in the file called COPYING.
 *
 * Contact Information:
11
 * linux-drivers@emulex.com
S
Sathya Perla 已提交
12
 *
13 14 15
 * Emulex
 * 3333 Susan Street
 * Costa Mesa, CA 92626
S
Sathya Perla 已提交
16 17
 */

18
#include <linux/prefetch.h>
19
#include <linux/module.h>
S
Sathya Perla 已提交
20
#include "be.h"
21
#include "be_cmds.h"
22
#include <asm/div64.h>
S
Sathya Perla 已提交
23
#include <linux/aer.h>
24
#include <linux/if_bridge.h>
25
#include <net/busy_poll.h>
26
#include <net/vxlan.h>
S
Sathya Perla 已提交
27 28 29

MODULE_VERSION(DRV_VER);
MODULE_DESCRIPTION(DRV_DESC " " DRV_VER);
30
MODULE_AUTHOR("Emulex Corporation");
S
Sathya Perla 已提交
31 32
MODULE_LICENSE("GPL");

33 34 35
/* num_vfs module param is obsolete.
 * Use sysfs method to enable/disable VFs.
 */
36 37 38
static unsigned int num_vfs;
module_param(num_vfs, uint, S_IRUGO);
MODULE_PARM_DESC(num_vfs, "Number of PCI VFs to initialize");
S
Sathya Perla 已提交
39

40 41 42 43
static ushort rx_frag_size = 2048;
module_param(rx_frag_size, ushort, S_IRUGO);
MODULE_PARM_DESC(rx_frag_size, "Size of a fragment that holds rcvd data.");

44
static const struct pci_device_id be_dev_ids[] = {
45
	{ PCI_DEVICE(BE_VENDOR_ID, BE_DEVICE_ID1) },
46
	{ PCI_DEVICE(BE_VENDOR_ID, BE_DEVICE_ID2) },
47 48
	{ PCI_DEVICE(BE_VENDOR_ID, OC_DEVICE_ID1) },
	{ PCI_DEVICE(BE_VENDOR_ID, OC_DEVICE_ID2) },
49
	{ PCI_DEVICE(EMULEX_VENDOR_ID, OC_DEVICE_ID3)},
50
	{ PCI_DEVICE(EMULEX_VENDOR_ID, OC_DEVICE_ID4)},
51
	{ PCI_DEVICE(EMULEX_VENDOR_ID, OC_DEVICE_ID5)},
52
	{ PCI_DEVICE(EMULEX_VENDOR_ID, OC_DEVICE_ID6)},
S
Sathya Perla 已提交
53 54 55
	{ 0 }
};
MODULE_DEVICE_TABLE(pci, be_dev_ids);
56
/* UE Status Low CSR
 * Names for the 32 entries of the low status word.
 * NOTE(review): presumably indexed by bit position in the register; confirm
 * against the code that consumes this table. Some names carry a trailing
 * space; they are kept as-is because they are runtime strings.
 */
static const char * const ue_status_low_desc[] = {
	"CEV",
	"CTX",
	"DBUF",
	"ERX",
	"Host",
	"MPU",
	"NDMA",
	"PTC ",
	"RDMA ",
	"RXF ",
	"RXIPS ",
	"RXULP0 ",
	"RXULP1 ",
	"RXULP2 ",
	"TIM ",
	"TPOST ",
	"TPRE ",
	"TXIPS ",
	"TXULP0 ",
	"TXULP1 ",
	"UC ",
	"WDMA ",
	"TXULP2 ",
	"HOST1 ",
	"P0_OB_LINK ",
	"P1_OB_LINK ",
	"HOST_GPIO ",
	"MBOX ",
	"ERX2 ",
	"SPARE ",
	"JTAG ",
	"MPU_INTPEND "
};
91

92
/* UE Status High CSR
 * Names for the 32 entries of the high status word.
 * NOTE(review): presumably indexed by bit position in the register; confirm
 * against the code that consumes this table.
 */
static const char * const ue_status_hi_desc[] = {
	"LPCMEMHOST",
	"MGMT_MAC",
	"PCS0ONLINE",
	"MPU_IRAM",
	"PCS1ONLINE",
	"PCTL0",
	"PCTL1",
	"PMEM",
	"RR",
	"TXPB",
	"RXPP",
	"XAUI",
	"TXP",
	"ARM",
	"IPC",
	"HOST2",
	"HOST3",
	"HOST4",
	"HOST5",
	"HOST6",
	"HOST7",
	"ECRC",
	"Poison TLP",
	"NETC",
	"PERIPH",
	"LLTXULP",
	"D2P",
	"RCON",
	"LDMA",
	"LLTXP",
	"LLTXPB",
	"Unknown"
};
S
Sathya Perla 已提交
127 128 129 130

static void be_queue_free(struct be_adapter *adapter, struct be_queue_info *q)
{
	struct be_dma_mem *mem = &q->dma_mem;
131

132
	if (mem->va) {
I
Ivan Vecera 已提交
133 134
		dma_free_coherent(&adapter->pdev->dev, mem->size, mem->va,
				  mem->dma);
135 136
		mem->va = NULL;
	}
S
Sathya Perla 已提交
137 138 139
}

/* Initialise queue @q and allocate zeroed DMA-coherent memory for it.
 * @len:        number of entries in the queue
 * @entry_size: size of one entry in bytes
 *
 * @q is cleared first, so any previous contents are discarded.
 * Returns 0 on success or -ENOMEM if the allocation fails.
 */
static int be_queue_alloc(struct be_adapter *adapter, struct be_queue_info *q,
			  u16 len, u16 entry_size)
{
	struct be_dma_mem *mem = &q->dma_mem;

	memset(q, 0, sizeof(*q));
	q->len = len;
	q->entry_size = entry_size;
	/* Multiply as u32: two u16 operands would otherwise be promoted to
	 * (signed) int, which can overflow for large values.
	 */
	mem->size = (u32)len * entry_size;
	mem->va = dma_zalloc_coherent(&adapter->pdev->dev, mem->size, &mem->dma,
				      GFP_KERNEL);
	if (!mem->va)
		return -ENOMEM;
	return 0;
}

155
/* Set or clear the HOSTINTR bit in the PCI config-space MEMBAR interrupt
 * control register. The register is written back only when the requested
 * state differs from the state just read.
 */
static void be_reg_intr_set(struct be_adapter *adapter, bool enable)
{
	u32 reg, enabled;

	pci_read_config_dword(adapter->pdev, PCICFG_MEMBAR_CTRL_INT_CTRL_OFFSET,
			      &reg);
	enabled = reg & MEMBAR_CTRL_INT_CTRL_HOSTINTR_MASK;

	if (!enabled && enable)
		reg |= MEMBAR_CTRL_INT_CTRL_HOSTINTR_MASK;
	else if (enabled && !enable)
		reg &= ~MEMBAR_CTRL_INT_CTRL_HOSTINTR_MASK;
	else
		return;	/* already in the requested state */

	pci_write_config_dword(adapter->pdev,
			       PCICFG_MEMBAR_CTRL_INT_CTRL_OFFSET, reg);
}

174 175 176 177 178 179 180 181
/* Enable or disable interrupts for the adapter.
 * Does nothing on Lancer chips or while an EEH error is flagged. Otherwise
 * be_cmd_intr_set() is tried first; if it fails, the config-space register
 * is programmed directly through be_reg_intr_set().
 */
static void be_intr_set(struct be_adapter *adapter, bool enable)
{
	int status = 0;

	/* On lancer interrupts can't be controlled via this register */
	if (lancer_chip(adapter))
		return;

	if (be_check_error(adapter, BE_ERROR_EEH))
		return;

	status = be_cmd_intr_set(adapter, enable);
	if (status)
		be_reg_intr_set(adapter, enable);
}

190
/* Ring the RX queue doorbell: tell the HW that @posted buffers were posted
 * on RX ring @qid. Skipped while a HW error is flagged.
 */
static void be_rxq_notify(struct be_adapter *adapter, u16 qid, u16 posted)
{
	u32 val = 0;

	if (be_check_error(adapter, BE_ERROR_HW))
		return;

	val |= qid & DB_RQ_RING_ID_MASK;
	/* Shift as u32: a u16 operand is promoted to (signed) int, and
	 * shifting a set bit into the sign bit is undefined.
	 */
	val |= (u32)posted << DB_RQ_NUM_POSTED_SHIFT;

	/* order earlier memory writes before the doorbell write */
	wmb();
	iowrite32(val, adapter->db + DB_RQ_OFFSET);
}

V
Vasundhara Volam 已提交
204 205
/* Ring the TX queue doorbell of @txo: tell the HW that @posted WRBs were
 * posted. The doorbell is written at txo->db_offset. Skipped while a HW
 * error is flagged.
 */
static void be_txq_notify(struct be_adapter *adapter, struct be_tx_obj *txo,
			  u16 posted)
{
	u32 val = 0;

	if (be_check_error(adapter, BE_ERROR_HW))
		return;

	val |= txo->q.id & DB_TXULP_RING_ID_MASK;
	val |= (posted & DB_TXULP_NUM_POSTED_MASK) << DB_TXULP_NUM_POSTED_SHIFT;

	/* order earlier memory writes before the doorbell write */
	wmb();
	iowrite32(val, adapter->db + txo->db_offset);
}

219
/* Ring the event queue doorbell for EQ @qid.
 * @arm:               set the re-arm bit
 * @clear_int:         set the clear-interrupt bit
 * @num_popped:        number of entries consumed, reported to the HW
 * @eq_delay_mult_enc: value placed in the R2I delay field
 *
 * The event bit is always set. Nothing is written while a HW error is
 * flagged.
 */
static void be_eq_notify(struct be_adapter *adapter, u16 qid,
			 bool arm, bool clear_int, u16 num_popped,
			 u32 eq_delay_mult_enc)
{
	u32 val = 0;

	val |= qid & DB_EQ_RING_ID_MASK;
	val |= ((qid & DB_EQ_RING_ID_EXT_MASK) << DB_EQ_RING_ID_EXT_MASK_SHIFT);

	if (be_check_error(adapter, BE_ERROR_HW))
		return;

	if (arm)
		val |= 1 << DB_EQ_REARM_SHIFT;
	if (clear_int)
		val |= 1 << DB_EQ_CLR_SHIFT;
	val |= 1 << DB_EQ_EVNT_SHIFT;
	/* shift as u32 so the promoted u16 cannot overflow a signed int */
	val |= (u32)num_popped << DB_EQ_NUM_POPPED_SHIFT;
	val |= eq_delay_mult_enc << DB_EQ_R2I_DLY_SHIFT;
	iowrite32(val, adapter->db + DB_EQ_OFFSET);
}

241
/* Ring the completion queue doorbell for CQ @qid.
 * @arm:        set the re-arm bit
 * @num_popped: number of entries consumed, reported to the HW
 *
 * Nothing is written while a HW error is flagged.
 */
void be_cq_notify(struct be_adapter *adapter, u16 qid, bool arm, u16 num_popped)
{
	u32 val = 0;

	val |= qid & DB_CQ_RING_ID_MASK;
	val |= ((qid & DB_CQ_RING_ID_EXT_MASK) <<
			DB_CQ_RING_ID_EXT_MASK_SHIFT);

	if (be_check_error(adapter, BE_ERROR_HW))
		return;

	if (arm)
		val |= 1 << DB_CQ_REARM_SHIFT;
	/* shift as u32 so the promoted u16 cannot overflow a signed int */
	val |= (u32)num_popped << DB_CQ_NUM_POPPED_SHIFT;
	iowrite32(val, adapter->db + DB_CQ_OFFSET);
}

static int be_mac_addr_set(struct net_device *netdev, void *p)
{
	struct be_adapter *adapter = netdev_priv(netdev);
261
	struct device *dev = &adapter->pdev->dev;
S
Sathya Perla 已提交
262
	struct sockaddr *addr = p;
263 264 265
	int status;
	u8 mac[ETH_ALEN];
	u32 old_pmac_id = adapter->pmac_id[0], curr_pmac_id = 0;
S
Sathya Perla 已提交
266

267 268 269
	if (!is_valid_ether_addr(addr->sa_data))
		return -EADDRNOTAVAIL;

270 271 272 273 274 275
	/* Proceed further only if, User provided MAC is different
	 * from active MAC
	 */
	if (ether_addr_equal(addr->sa_data, netdev->dev_addr))
		return 0;

276 277 278 279 280
	/* The PMAC_ADD cmd may fail if the VF doesn't have FILTMGMT
	 * privilege or if PF did not provision the new MAC address.
	 * On BE3, this cmd will always fail if the VF doesn't have the
	 * FILTMGMT privilege. This failure is OK, only if the PF programmed
	 * the MAC for the VF.
281
	 */
282 283 284 285 286 287 288 289 290 291 292
	status = be_cmd_pmac_add(adapter, (u8 *)addr->sa_data,
				 adapter->if_handle, &adapter->pmac_id[0], 0);
	if (!status) {
		curr_pmac_id = adapter->pmac_id[0];

		/* Delete the old programmed MAC. This call may fail if the
		 * old MAC was already deleted by the PF driver.
		 */
		if (adapter->pmac_id[0] != old_pmac_id)
			be_cmd_pmac_del(adapter, adapter->if_handle,
					old_pmac_id, 0);
293 294
	}

295 296
	/* Decide if the new MAC is successfully activated only after
	 * querying the FW
297
	 */
298 299
	status = be_cmd_get_active_mac(adapter, curr_pmac_id, mac,
				       adapter->if_handle, true, 0);
300
	if (status)
301
		goto err;
S
Sathya Perla 已提交
302

303 304 305
	/* The MAC change did not happen, either due to lack of privilege
	 * or PF didn't pre-provision.
	 */
306
	if (!ether_addr_equal(addr->sa_data, mac)) {
307 308 309 310
		status = -EPERM;
		goto err;
	}

311
	memcpy(netdev->dev_addr, addr->sa_data, netdev->addr_len);
312
	dev_info(dev, "MAC address changed to %pM\n", mac);
313 314
	return 0;
err:
315
	dev_warn(dev, "MAC address change to %pM failed\n", addr->sa_data);
S
Sathya Perla 已提交
316 317 318
	return status;
}

319 320 321 322 323 324 325
/* BE2 supports only v0 cmd */
static void *hw_stats_from_cmd(struct be_adapter *adapter)
{
	if (BE2_chip(adapter)) {
		struct be_cmd_resp_get_stats_v0 *cmd = adapter->stats_cmd.va;

		return &cmd->hw_stats;
326
	} else if (BE3_chip(adapter)) {
327 328
		struct be_cmd_resp_get_stats_v1 *cmd = adapter->stats_cmd.va;

329 330 331 332
		return &cmd->hw_stats;
	} else {
		struct be_cmd_resp_get_stats_v2 *cmd = adapter->stats_cmd.va;

333 334 335 336 337 338 339 340 341 342 343
		return &cmd->hw_stats;
	}
}

/* BE2 supports only v0 cmd */
static void *be_erx_stats_from_cmd(struct be_adapter *adapter)
{
	if (BE2_chip(adapter)) {
		struct be_hw_stats_v0 *hw_stats = hw_stats_from_cmd(adapter);

		return &hw_stats->erx;
344
	} else if (BE3_chip(adapter)) {
345 346
		struct be_hw_stats_v1 *hw_stats = hw_stats_from_cmd(adapter);

347 348 349 350
		return &hw_stats->erx;
	} else {
		struct be_hw_stats_v2 *hw_stats = hw_stats_from_cmd(adapter);

351 352 353 354 355
		return &hw_stats->erx;
	}
}

static void populate_be_v0_stats(struct be_adapter *adapter)
356
{
357 358 359
	struct be_hw_stats_v0 *hw_stats = hw_stats_from_cmd(adapter);
	struct be_pmem_stats *pmem_sts = &hw_stats->pmem;
	struct be_rxf_stats_v0 *rxf_stats = &hw_stats->rxf;
360
	struct be_port_rxf_stats_v0 *port_stats =
361 362
					&rxf_stats->port[adapter->port_num];
	struct be_drv_stats *drvs = &adapter->drv_stats;
363

364
	be_dws_le_to_cpu(hw_stats, sizeof(*hw_stats));
365 366 367 368 369 370 371 372 373 374 375 376 377 378
	drvs->rx_pause_frames = port_stats->rx_pause_frames;
	drvs->rx_crc_errors = port_stats->rx_crc_errors;
	drvs->rx_control_frames = port_stats->rx_control_frames;
	drvs->rx_in_range_errors = port_stats->rx_in_range_errors;
	drvs->rx_frame_too_long = port_stats->rx_frame_too_long;
	drvs->rx_dropped_runt = port_stats->rx_dropped_runt;
	drvs->rx_ip_checksum_errs = port_stats->rx_ip_checksum_errs;
	drvs->rx_tcp_checksum_errs = port_stats->rx_tcp_checksum_errs;
	drvs->rx_udp_checksum_errs = port_stats->rx_udp_checksum_errs;
	drvs->rxpp_fifo_overflow_drop = port_stats->rx_fifo_overflow;
	drvs->rx_dropped_tcp_length = port_stats->rx_dropped_tcp_length;
	drvs->rx_dropped_too_small = port_stats->rx_dropped_too_small;
	drvs->rx_dropped_too_short = port_stats->rx_dropped_too_short;
	drvs->rx_out_range_errors = port_stats->rx_out_range_errors;
379
	drvs->rx_input_fifo_overflow_drop = port_stats->rx_input_fifo_overflow;
380 381
	drvs->rx_dropped_header_too_small =
		port_stats->rx_dropped_header_too_small;
382 383 384
	drvs->rx_address_filtered =
					port_stats->rx_address_filtered +
					port_stats->rx_vlan_filtered;
385 386 387 388 389 390 391
	drvs->rx_alignment_symbol_errors =
		port_stats->rx_alignment_symbol_errors;

	drvs->tx_pauseframes = port_stats->tx_pauseframes;
	drvs->tx_controlframes = port_stats->tx_controlframes;

	if (adapter->port_num)
392
		drvs->jabber_events = rxf_stats->port1_jabber_events;
393
	else
394
		drvs->jabber_events = rxf_stats->port0_jabber_events;
395 396 397 398
	drvs->rx_drops_no_pbuf = rxf_stats->rx_drops_no_pbuf;
	drvs->rx_drops_no_erx_descr = rxf_stats->rx_drops_no_erx_descr;
	drvs->forwarded_packets = rxf_stats->forwarded_packets;
	drvs->rx_drops_mtu = rxf_stats->rx_drops_mtu;
399 400
	drvs->rx_drops_no_tpre_descr = rxf_stats->rx_drops_no_tpre_descr;
	drvs->rx_drops_too_many_frags = rxf_stats->rx_drops_too_many_frags;
401 402 403
	adapter->drv_stats.eth_red_drops = pmem_sts->eth_red_drops;
}

404
static void populate_be_v1_stats(struct be_adapter *adapter)
405
{
406 407 408
	struct be_hw_stats_v1 *hw_stats = hw_stats_from_cmd(adapter);
	struct be_pmem_stats *pmem_sts = &hw_stats->pmem;
	struct be_rxf_stats_v1 *rxf_stats = &hw_stats->rxf;
409
	struct be_port_rxf_stats_v1 *port_stats =
410 411
					&rxf_stats->port[adapter->port_num];
	struct be_drv_stats *drvs = &adapter->drv_stats;
412

413
	be_dws_le_to_cpu(hw_stats, sizeof(*hw_stats));
414 415
	drvs->pmem_fifo_overflow_drop = port_stats->pmem_fifo_overflow_drop;
	drvs->rx_priority_pause_frames = port_stats->rx_priority_pause_frames;
416 417 418 419 420 421 422 423 424 425 426 427 428 429 430 431 432
	drvs->rx_pause_frames = port_stats->rx_pause_frames;
	drvs->rx_crc_errors = port_stats->rx_crc_errors;
	drvs->rx_control_frames = port_stats->rx_control_frames;
	drvs->rx_in_range_errors = port_stats->rx_in_range_errors;
	drvs->rx_frame_too_long = port_stats->rx_frame_too_long;
	drvs->rx_dropped_runt = port_stats->rx_dropped_runt;
	drvs->rx_ip_checksum_errs = port_stats->rx_ip_checksum_errs;
	drvs->rx_tcp_checksum_errs = port_stats->rx_tcp_checksum_errs;
	drvs->rx_udp_checksum_errs = port_stats->rx_udp_checksum_errs;
	drvs->rx_dropped_tcp_length = port_stats->rx_dropped_tcp_length;
	drvs->rx_dropped_too_small = port_stats->rx_dropped_too_small;
	drvs->rx_dropped_too_short = port_stats->rx_dropped_too_short;
	drvs->rx_out_range_errors = port_stats->rx_out_range_errors;
	drvs->rx_dropped_header_too_small =
		port_stats->rx_dropped_header_too_small;
	drvs->rx_input_fifo_overflow_drop =
		port_stats->rx_input_fifo_overflow_drop;
433
	drvs->rx_address_filtered = port_stats->rx_address_filtered;
434 435
	drvs->rx_alignment_symbol_errors =
		port_stats->rx_alignment_symbol_errors;
436
	drvs->rxpp_fifo_overflow_drop = port_stats->rxpp_fifo_overflow_drop;
437 438
	drvs->tx_pauseframes = port_stats->tx_pauseframes;
	drvs->tx_controlframes = port_stats->tx_controlframes;
439
	drvs->tx_priority_pauseframes = port_stats->tx_priority_pauseframes;
440 441 442 443 444
	drvs->jabber_events = port_stats->jabber_events;
	drvs->rx_drops_no_pbuf = rxf_stats->rx_drops_no_pbuf;
	drvs->rx_drops_no_erx_descr = rxf_stats->rx_drops_no_erx_descr;
	drvs->forwarded_packets = rxf_stats->forwarded_packets;
	drvs->rx_drops_mtu = rxf_stats->rx_drops_mtu;
445 446
	drvs->rx_drops_no_tpre_descr = rxf_stats->rx_drops_no_tpre_descr;
	drvs->rx_drops_too_many_frags = rxf_stats->rx_drops_too_many_frags;
447 448 449
	adapter->drv_stats.eth_red_drops = pmem_sts->eth_red_drops;
}

450 451 452 453 454 455 456 457 458 459 460 461 462 463 464 465 466 467 468 469 470 471 472 473 474 475 476 477 478 479 480 481 482 483 484 485 486 487 488 489 490 491 492 493
/* Copy counters from the v2 stats response into adapter->drv_stats.
 * The response is passed through be_dws_le_to_cpu() before it is read.
 * Per-port counters come from the entry selected by adapter->port_num.
 * The RoCE counters are copied only when be_roce_supported() is true.
 */
static void populate_be_v2_stats(struct be_adapter *adapter)
{
	struct be_hw_stats_v2 *hw_stats = hw_stats_from_cmd(adapter);
	struct be_pmem_stats *pmem_sts = &hw_stats->pmem;
	struct be_rxf_stats_v2 *rxf_stats = &hw_stats->rxf;
	struct be_port_rxf_stats_v2 *port_stats =
					&rxf_stats->port[adapter->port_num];
	struct be_drv_stats *drvs = &adapter->drv_stats;

	be_dws_le_to_cpu(hw_stats, sizeof(*hw_stats));
	drvs->pmem_fifo_overflow_drop = port_stats->pmem_fifo_overflow_drop;
	drvs->rx_priority_pause_frames = port_stats->rx_priority_pause_frames;
	drvs->rx_pause_frames = port_stats->rx_pause_frames;
	drvs->rx_crc_errors = port_stats->rx_crc_errors;
	drvs->rx_control_frames = port_stats->rx_control_frames;
	drvs->rx_in_range_errors = port_stats->rx_in_range_errors;
	drvs->rx_frame_too_long = port_stats->rx_frame_too_long;
	drvs->rx_dropped_runt = port_stats->rx_dropped_runt;
	drvs->rx_ip_checksum_errs = port_stats->rx_ip_checksum_errs;
	drvs->rx_tcp_checksum_errs = port_stats->rx_tcp_checksum_errs;
	drvs->rx_udp_checksum_errs = port_stats->rx_udp_checksum_errs;
	drvs->rx_dropped_tcp_length = port_stats->rx_dropped_tcp_length;
	drvs->rx_dropped_too_small = port_stats->rx_dropped_too_small;
	drvs->rx_dropped_too_short = port_stats->rx_dropped_too_short;
	drvs->rx_out_range_errors = port_stats->rx_out_range_errors;
	drvs->rx_dropped_header_too_small =
		port_stats->rx_dropped_header_too_small;
	drvs->rx_input_fifo_overflow_drop =
		port_stats->rx_input_fifo_overflow_drop;
	drvs->rx_address_filtered = port_stats->rx_address_filtered;
	drvs->rx_alignment_symbol_errors =
		port_stats->rx_alignment_symbol_errors;
	drvs->rxpp_fifo_overflow_drop = port_stats->rxpp_fifo_overflow_drop;
	drvs->tx_pauseframes = port_stats->tx_pauseframes;
	drvs->tx_controlframes = port_stats->tx_controlframes;
	drvs->tx_priority_pauseframes = port_stats->tx_priority_pauseframes;
	drvs->jabber_events = port_stats->jabber_events;
	drvs->rx_drops_no_pbuf = rxf_stats->rx_drops_no_pbuf;
	drvs->rx_drops_no_erx_descr = rxf_stats->rx_drops_no_erx_descr;
	drvs->forwarded_packets = rxf_stats->forwarded_packets;
	drvs->rx_drops_mtu = rxf_stats->rx_drops_mtu;
	drvs->rx_drops_no_tpre_descr = rxf_stats->rx_drops_no_tpre_descr;
	drvs->rx_drops_too_many_frags = rxf_stats->rx_drops_too_many_frags;
	adapter->drv_stats.eth_red_drops = pmem_sts->eth_red_drops;
	if (be_roce_supported(adapter)) {
		drvs->rx_roce_bytes_lsd = port_stats->roce_bytes_received_lsd;
		drvs->rx_roce_bytes_msd = port_stats->roce_bytes_received_msd;
		drvs->rx_roce_frames = port_stats->roce_frames_received;
		drvs->roce_drops_crc = port_stats->roce_drops_crc;
		drvs->roce_drops_payload_len =
			port_stats->roce_drops_payload_len;
	}
}

S
Selvin Xavier 已提交
504 505 506
static void populate_lancer_stats(struct be_adapter *adapter)
{
	struct be_drv_stats *drvs = &adapter->drv_stats;
507
	struct lancer_pport_stats *pport_stats = pport_stats_from_cmd(adapter);
508 509 510 511 512

	be_dws_le_to_cpu(pport_stats, sizeof(*pport_stats));
	drvs->rx_pause_frames = pport_stats->rx_pause_frames_lo;
	drvs->rx_crc_errors = pport_stats->rx_crc_errors_lo;
	drvs->rx_control_frames = pport_stats->rx_control_frames_lo;
S
Selvin Xavier 已提交
513
	drvs->rx_in_range_errors = pport_stats->rx_in_range_errors;
514
	drvs->rx_frame_too_long = pport_stats->rx_frames_too_long_lo;
S
Selvin Xavier 已提交
515 516 517 518 519 520 521 522 523 524 525 526
	drvs->rx_dropped_runt = pport_stats->rx_dropped_runt;
	drvs->rx_ip_checksum_errs = pport_stats->rx_ip_checksum_errors;
	drvs->rx_tcp_checksum_errs = pport_stats->rx_tcp_checksum_errors;
	drvs->rx_udp_checksum_errs = pport_stats->rx_udp_checksum_errors;
	drvs->rx_dropped_tcp_length =
				pport_stats->rx_dropped_invalid_tcp_length;
	drvs->rx_dropped_too_small = pport_stats->rx_dropped_too_small;
	drvs->rx_dropped_too_short = pport_stats->rx_dropped_too_short;
	drvs->rx_out_range_errors = pport_stats->rx_out_of_range_errors;
	drvs->rx_dropped_header_too_small =
				pport_stats->rx_dropped_header_too_small;
	drvs->rx_input_fifo_overflow_drop = pport_stats->rx_fifo_overflow;
527 528 529
	drvs->rx_address_filtered =
					pport_stats->rx_address_filtered +
					pport_stats->rx_vlan_filtered;
530
	drvs->rx_alignment_symbol_errors = pport_stats->rx_symbol_errors_lo;
S
Selvin Xavier 已提交
531
	drvs->rxpp_fifo_overflow_drop = pport_stats->rx_fifo_overflow;
532 533
	drvs->tx_pauseframes = pport_stats->tx_pause_frames_lo;
	drvs->tx_controlframes = pport_stats->tx_control_frames_lo;
S
Selvin Xavier 已提交
534
	drvs->jabber_events = pport_stats->rx_jabbers;
535 536
	drvs->forwarded_packets = pport_stats->num_forwards_lo;
	drvs->rx_drops_mtu = pport_stats->rx_drops_mtu_lo;
S
Selvin Xavier 已提交
537
	drvs->rx_drops_too_many_frags =
538
				pport_stats->rx_drops_too_many_frags_lo;
S
Selvin Xavier 已提交
539
}
540

541 542 543 544 545 546 547 548 549 550 551 552
/* Fold a 16-bit counter reading @val into the 32-bit accumulator @acc.
 * The low 16 bits of *acc hold the previous reading and the high 16 bits
 * count wrap-arounds: if @val is smaller than the previous reading, one wrap
 * is assumed and 65536 is added. The result is stored with a single
 * ACCESS_ONCE() write.
 */
static void accumulate_16bit_val(u32 *acc, u16 val)
{
/* arguments are parenthesized so any expression can be passed safely */
#define lo(x)			((x) & 0xFFFF)
#define hi(x)			((x) & 0xFFFF0000)
	bool wrapped = val < lo(*acc);
	u32 newacc = hi(*acc) + val;

	if (wrapped)
		newacc += 65536;
	ACCESS_ONCE(*acc) = newacc;
}

J
Jingoo Han 已提交
553
/* Record the erx "drops, no fragments" reading @erx_stat for @rxo.
 * On non-BEx chips the value is stored as-is; on BEx chips it is treated as
 * a 16-bit counter and accumulated into the 32-bit driver counter.
 */
static void populate_erx_stats(struct be_adapter *adapter,
			       struct be_rx_obj *rxo, u32 erx_stat)
{
	if (!BEx_chip(adapter))
		rx_stats(rxo)->rx_drops_no_frags = erx_stat;
	else
		/* below erx HW counter can actually wrap around after
		 * 65535. Driver accumulates a 32-bit value
		 */
		accumulate_16bit_val(&rx_stats(rxo)->rx_drops_no_frags,
				     (u16)erx_stat);
}

566 567
void be_parse_stats(struct be_adapter *adapter)
{
568
	struct be_erx_stats_v2 *erx = be_erx_stats_from_cmd(adapter);
569 570
	struct be_rx_obj *rxo;
	int i;
571
	u32 erx_stat;
572

573 574
	if (lancer_chip(adapter)) {
		populate_lancer_stats(adapter);
S
Selvin Xavier 已提交
575
	} else {
576 577
		if (BE2_chip(adapter))
			populate_be_v0_stats(adapter);
578 579
		else if (BE3_chip(adapter))
			/* for BE3 */
580
			populate_be_v1_stats(adapter);
581 582
		else
			populate_be_v2_stats(adapter);
583

584
		/* erx_v2 is longer than v0, v1. use v2 for v0, v1 access */
585
		for_all_rx_queues(adapter, rxo, i) {
586 587
			erx_stat = erx->rx_drops_no_fragments[rxo->q.id];
			populate_erx_stats(adapter, rxo, erx_stat);
588
		}
589
	}
590 591
}

592
static struct rtnl_link_stats64 *be_get_stats64(struct net_device *netdev,
593
						struct rtnl_link_stats64 *stats)
S
Sathya Perla 已提交
594
{
595
	struct be_adapter *adapter = netdev_priv(netdev);
596
	struct be_drv_stats *drvs = &adapter->drv_stats;
597
	struct be_rx_obj *rxo;
598
	struct be_tx_obj *txo;
599 600
	u64 pkts, bytes;
	unsigned int start;
601
	int i;
S
Sathya Perla 已提交
602

603
	for_all_rx_queues(adapter, rxo, i) {
604
		const struct be_rx_stats *rx_stats = rx_stats(rxo);
605

606
		do {
607
			start = u64_stats_fetch_begin_irq(&rx_stats->sync);
608 609
			pkts = rx_stats(rxo)->rx_pkts;
			bytes = rx_stats(rxo)->rx_bytes;
610
		} while (u64_stats_fetch_retry_irq(&rx_stats->sync, start));
611 612 613 614 615
		stats->rx_packets += pkts;
		stats->rx_bytes += bytes;
		stats->multicast += rx_stats(rxo)->rx_mcast_pkts;
		stats->rx_dropped += rx_stats(rxo)->rx_drops_no_skbs +
					rx_stats(rxo)->rx_drops_no_frags;
616 617
	}

618
	for_all_tx_queues(adapter, txo, i) {
619
		const struct be_tx_stats *tx_stats = tx_stats(txo);
620

621
		do {
622
			start = u64_stats_fetch_begin_irq(&tx_stats->sync);
623 624
			pkts = tx_stats(txo)->tx_pkts;
			bytes = tx_stats(txo)->tx_bytes;
625
		} while (u64_stats_fetch_retry_irq(&tx_stats->sync, start));
626 627
		stats->tx_packets += pkts;
		stats->tx_bytes += bytes;
628
	}
S
Sathya Perla 已提交
629 630

	/* bad pkts received */
631
	stats->rx_errors = drvs->rx_crc_errors +
632 633 634 635 636 637 638 639
		drvs->rx_alignment_symbol_errors +
		drvs->rx_in_range_errors +
		drvs->rx_out_range_errors +
		drvs->rx_frame_too_long +
		drvs->rx_dropped_too_small +
		drvs->rx_dropped_too_short +
		drvs->rx_dropped_header_too_small +
		drvs->rx_dropped_tcp_length +
640
		drvs->rx_dropped_runt;
641

S
Sathya Perla 已提交
642
	/* detailed rx errors */
643
	stats->rx_length_errors = drvs->rx_in_range_errors +
644 645
		drvs->rx_out_range_errors +
		drvs->rx_frame_too_long;
646

647
	stats->rx_crc_errors = drvs->rx_crc_errors;
S
Sathya Perla 已提交
648 649

	/* frame alignment errors */
650
	stats->rx_frame_errors = drvs->rx_alignment_symbol_errors;
651

S
Sathya Perla 已提交
652 653
	/* receiver fifo overrun */
	/* drops_no_pbuf is no per i/f, it's per BE card */
654
	stats->rx_fifo_errors = drvs->rxpp_fifo_overflow_drop +
655 656
				drvs->rx_input_fifo_overflow_drop +
				drvs->rx_drops_no_pbuf;
657
	return stats;
S
Sathya Perla 已提交
658 659
}

660
/* Propagate @link_status (non-zero means up) to the netdev carrier state and
 * log it. On the first call the carrier is first forced off and
 * BE_FLAGS_LINK_STATUS_INIT is set.
 */
void be_link_status_update(struct be_adapter *adapter, u8 link_status)
{
	struct net_device *netdev = adapter->netdev;

	if (!(adapter->flags & BE_FLAGS_LINK_STATUS_INIT)) {
		netif_carrier_off(netdev);
		adapter->flags |= BE_FLAGS_LINK_STATUS_INIT;
	}

	if (link_status)
		netif_carrier_on(netdev);
	else
		netif_carrier_off(netdev);

	netdev_info(netdev, "Link is %s\n", link_status ? "Up" : "Down");
}

677
static void be_tx_stats_update(struct be_tx_obj *txo, struct sk_buff *skb)
S
Sathya Perla 已提交
678
{
679 680
	struct be_tx_stats *stats = tx_stats(txo);

681
	u64_stats_update_begin(&stats->sync);
682
	stats->tx_reqs++;
683 684
	stats->tx_bytes += skb->len;
	stats->tx_pkts += (skb_shinfo(skb)->gso_segs ? : 1);
685
	u64_stats_update_end(&stats->sync);
S
Sathya Perla 已提交
686 687
}

688 689
/* Returns number of WRBs needed for the skb */
static u32 skb_wrb_cnt(struct sk_buff *skb)
S
Sathya Perla 已提交
690
{
691 692
	/* +1 for the header wrb */
	return 1 + (skb_headlen(skb) ? 1 : 0) + skb_shinfo(skb)->nr_frags;
S
Sathya Perla 已提交
693 694 695 696
}

/* Fill a fragment WRB with the DMA address @addr and length @len.
 * All fields are stored little-endian; @len is masked with
 * ETH_WRB_FRAG_LEN_MASK.
 */
static inline void wrb_fill(struct be_eth_wrb *wrb, u64 addr, int len)
{
	wrb->frag_pa_hi = cpu_to_le32(upper_32_bits(addr));
	wrb->frag_pa_lo = cpu_to_le32(lower_32_bits(addr));
	wrb->frag_len = cpu_to_le32(len & ETH_WRB_FRAG_LEN_MASK);
	wrb->rsvd0 = 0;
}

/* A dummy wrb is just all zeros. Using a separate routine for dummy-wrb
 * to avoid the swap and shift/mask operations in wrb_fill().
 */
static inline void wrb_fill_dummy(struct be_eth_wrb *wrb)
{
	wrb->frag_pa_hi = 0;
	wrb->frag_pa_lo = 0;
	wrb->frag_len = 0;
	wrb->rsvd0 = 0;
}

714
static inline u16 be_get_tx_vlan_tag(struct be_adapter *adapter,
715
				     struct sk_buff *skb)
716 717 718 719
{
	u8 vlan_prio;
	u16 vlan_tag;

720
	vlan_tag = skb_vlan_tag_get(skb);
721 722 723 724 725 726 727 728 729
	vlan_prio = (vlan_tag & VLAN_PRIO_MASK) >> VLAN_PRIO_SHIFT;
	/* If vlan priority provided by OS is NOT in available bmap */
	if (!(adapter->vlan_prio_bmap & (1 << vlan_prio)))
		vlan_tag = (vlan_tag & ~VLAN_PRIO_MASK) |
				adapter->recommended_prio;

	return vlan_tag;
}

730 731 732 733 734 735 736 737 738 739 740 741 742
/* Used only for IP tunnel packets: returns the L4 protocol of the inner
 * header (IPv4 protocol field, or IPv6 nexthdr when the version is not 4).
 */
static u16 skb_inner_ip_proto(struct sk_buff *skb)
{
	if (inner_ip_hdr(skb)->version == 4)
		return inner_ip_hdr(skb)->protocol;

	return inner_ipv6_hdr(skb)->nexthdr;
}

/* Returns the L4 protocol of the outer IP header (IPv4 protocol field, or
 * IPv6 nexthdr when the version is not 4).
 */
static u16 skb_ip_proto(struct sk_buff *skb)
{
	if (ip_hdr(skb)->version == 4)
		return ip_hdr(skb)->protocol;

	return ipv6_hdr(skb)->nexthdr;
}

743 744 745 746 747 748 749 750 751 752 753 754 755 756 757
/* True when fewer than BE_MAX_TX_FRAG_COUNT + 1 entries remain unused in
 * the TX queue of @txo.
 */
static inline bool be_is_txq_full(struct be_tx_obj *txo)
{
	int in_use = atomic_read(&txo->q.used);

	return in_use + BE_MAX_TX_FRAG_COUNT >= txo->q.len;
}

/* True when less than half of the TX queue of @txo is in use */
static inline bool be_can_txq_wake(struct be_tx_obj *txo)
{
	int in_use = atomic_read(&txo->q.used);

	return in_use < txo->q.len / 2;
}

/* True when the queue holds more used entries than txo->pend_wrb_cnt */
static inline bool be_is_tx_compl_pending(struct be_tx_obj *txo)
{
	int in_use = atomic_read(&txo->q.used);

	return in_use > txo->pend_wrb_cnt;
}

758 759 760
static void be_get_wrb_params_from_skb(struct be_adapter *adapter,
				       struct sk_buff *skb,
				       struct be_wrb_params *wrb_params)
S
Sathya Perla 已提交
761
{
762
	u16 proto;
S
Sathya Perla 已提交
763

A
Ajit Khaparde 已提交
764
	if (skb_is_gso(skb)) {
765 766
		BE_WRB_F_SET(wrb_params->features, LSO, 1);
		wrb_params->lso_mss = skb_shinfo(skb)->gso_size;
767
		if (skb_is_gso_v6(skb) && !lancer_chip(adapter))
768
			BE_WRB_F_SET(wrb_params->features, LSO6, 1);
S
Sathya Perla 已提交
769
	} else if (skb->ip_summed == CHECKSUM_PARTIAL) {
770
		if (skb->encapsulation) {
771
			BE_WRB_F_SET(wrb_params->features, IPCS, 1);
772 773 774 775 776
			proto = skb_inner_ip_proto(skb);
		} else {
			proto = skb_ip_proto(skb);
		}
		if (proto == IPPROTO_TCP)
777
			BE_WRB_F_SET(wrb_params->features, TCPCS, 1);
778
		else if (proto == IPPROTO_UDP)
779
			BE_WRB_F_SET(wrb_params->features, UDPCS, 1);
S
Sathya Perla 已提交
780 781
	}

782
	if (skb_vlan_tag_present(skb)) {
783 784
		BE_WRB_F_SET(wrb_params->features, VLAN, 1);
		wrb_params->vlan_tag = be_get_tx_vlan_tag(adapter, skb);
S
Sathya Perla 已提交
785 786
	}

787 788
	BE_WRB_F_SET(wrb_params->features, CRC, 1);
}
789

790 791 792 793 794 795 796 797 798 799 800 801 802 803 804 805 806 807 808 809 810 811 812 813
static void wrb_fill_hdr(struct be_adapter *adapter,
			 struct be_eth_hdr_wrb *hdr,
			 struct be_wrb_params *wrb_params,
			 struct sk_buff *skb)
{
	memset(hdr, 0, sizeof(*hdr));

	SET_TX_WRB_HDR_BITS(crc, hdr,
			    BE_WRB_F_GET(wrb_params->features, CRC));
	SET_TX_WRB_HDR_BITS(ipcs, hdr,
			    BE_WRB_F_GET(wrb_params->features, IPCS));
	SET_TX_WRB_HDR_BITS(tcpcs, hdr,
			    BE_WRB_F_GET(wrb_params->features, TCPCS));
	SET_TX_WRB_HDR_BITS(udpcs, hdr,
			    BE_WRB_F_GET(wrb_params->features, UDPCS));

	SET_TX_WRB_HDR_BITS(lso, hdr,
			    BE_WRB_F_GET(wrb_params->features, LSO));
	SET_TX_WRB_HDR_BITS(lso6, hdr,
			    BE_WRB_F_GET(wrb_params->features, LSO6));
	SET_TX_WRB_HDR_BITS(lso_mss, hdr, wrb_params->lso_mss);

	/* Hack to skip HW VLAN tagging needs evt = 1, compl = 0. When this
	 * hack is not needed, the evt bit is set while ringing DB.
814
	 */
815 816 817 818 819 820 821 822
	SET_TX_WRB_HDR_BITS(event, hdr,
			    BE_WRB_F_GET(wrb_params->features, VLAN_SKIP_HW));
	SET_TX_WRB_HDR_BITS(vlan, hdr,
			    BE_WRB_F_GET(wrb_params->features, VLAN));
	SET_TX_WRB_HDR_BITS(vlan_tag, hdr, wrb_params->vlan_tag);

	SET_TX_WRB_HDR_BITS(num_wrb, hdr, skb_wrb_cnt(skb));
	SET_TX_WRB_HDR_BITS(len, hdr, skb->len);
V
Venkata Duvvuru 已提交
823 824
	SET_TX_WRB_HDR_BITS(mgmt, hdr,
			    BE_WRB_F_GET(wrb_params->features, OS2BMC));
S
Sathya Perla 已提交
825 826
}

I
Ivan Vecera 已提交
827
static void unmap_tx_frag(struct device *dev, struct be_eth_wrb *wrb,
828
			  bool unmap_single)
829 830
{
	dma_addr_t dma;
831
	u32 frag_len = le32_to_cpu(wrb->frag_len);
832 833


834 835 836
	dma = (u64)le32_to_cpu(wrb->frag_pa_hi) << 32 |
		(u64)le32_to_cpu(wrb->frag_pa_lo);
	if (frag_len) {
837
		if (unmap_single)
838
			dma_unmap_single(dev, dma, frag_len, DMA_TO_DEVICE);
839
		else
840
			dma_unmap_page(dev, dma, frag_len, DMA_TO_DEVICE);
841 842
	}
}
S
Sathya Perla 已提交
843

844 845 846 847 848 849 850 851 852 853 854 855 856 857 858 859 860 861 862 863 864 865 866 867 868 869 870 871 872 873 874 875 876 877 878 879 880 881 882 883 884 885 886 887 888 889 890 891 892 893 894 895 896 897 898 899 900 901 902 903 904 905 906 907 908 909 910 911 912 913 914 915 916 917
/* Grab a WRB header for xmit */
static u16 be_tx_get_wrb_hdr(struct be_tx_obj *txo)
{
	u16 head = txo->q.head;

	queue_head_inc(&txo->q);
	return head;
}

/* Set up the WRB header for xmit: fill the header WRB at index @head,
 * remember @skb in that slot and account its WRBs as used and pending.
 */
static void be_tx_setup_wrb_hdr(struct be_adapter *adapter,
				struct be_tx_obj *txo,
				struct be_wrb_params *wrb_params,
				struct sk_buff *skb, u16 head)
{
	u32 wrb_cnt = skb_wrb_cnt(skb);
	struct be_queue_info *q = &txo->q;
	struct be_eth_hdr_wrb *hdr_wrb = queue_index_node(q, head);

	wrb_fill_hdr(adapter, hdr_wrb, wrb_params, skb);
	be_dws_cpu_to_le(hdr_wrb, sizeof(*hdr_wrb));

	/* the slot for this header must not already hold an skb */
	BUG_ON(txo->sent_skb_list[head]);
	txo->sent_skb_list[head] = skb;
	txo->last_req_hdr = head;

	atomic_add(wrb_cnt, &q->used);
	txo->last_req_wrb_cnt = wrb_cnt;
	txo->pend_wrb_cnt += wrb_cnt;
}

/* Setup a WRB fragment (buffer descriptor) for xmit: fill the WRB at the
 * queue head with @busaddr/@len and advance the head.
 */
static void be_tx_setup_wrb_frag(struct be_tx_obj *txo, dma_addr_t busaddr,
				 int len)
{
	struct be_queue_info *q = &txo->q;
	struct be_eth_wrb *frag_wrb = queue_head_node(q);

	wrb_fill(frag_wrb, busaddr, len);
	queue_head_inc(q);
}

/* Undo a partially completed be_xmit_enqueue(): unmap every fragment WRB
 * that was set up for the current packet (@copied bytes in total) and put
 * the producer index back to @head. Invoked to handle tx setup errors.
 */
static void be_xmit_restore(struct be_adapter *adapter,
			    struct be_tx_obj *txo, u16 head, bool map_single,
			    u32 copied)
{
	struct device *dev = &adapter->pdev->dev;
	struct be_queue_info *txq = &txo->q;
	struct be_eth_wrb *frag_wrb;

	/* Rewind to the header WRB, then step over it: the hdr is not mapped */
	txq->head = head;
	queue_head_inc(txq);

	for (; copied; queue_head_inc(txq)) {
		frag_wrb = queue_head_node(txq);
		unmap_tx_frag(dev, frag_wrb, map_single);
		/* only the first fragment is unmapped as a "single" mapping */
		map_single = false;
		copied -= le32_to_cpu(frag_wrb->frag_len);
	}

	txq->head = head;
}

/* Enqueue the given packet for transmit. This routine allocates WRBs for the
 * packet, dma maps the packet buffers and sets up the WRBs. Returns the number
 * of WRBs used up by the packet.
 */
918
static u32 be_xmit_enqueue(struct be_adapter *adapter, struct be_tx_obj *txo,
919 920
			   struct sk_buff *skb,
			   struct be_wrb_params *wrb_params)
S
Sathya Perla 已提交
921
{
922
	u32 i, copied = 0, wrb_cnt = skb_wrb_cnt(skb);
I
Ivan Vecera 已提交
923
	struct device *dev = &adapter->pdev->dev;
924
	struct be_queue_info *txq = &txo->q;
925
	bool map_single = false;
926
	u16 head = txq->head;
927 928
	dma_addr_t busaddr;
	int len;
S
Sathya Perla 已提交
929

930
	head = be_tx_get_wrb_hdr(txo);
S
Sathya Perla 已提交
931

932
	if (skb->len > skb->data_len) {
933
		len = skb_headlen(skb);
934

I
Ivan Vecera 已提交
935 936
		busaddr = dma_map_single(dev, skb->data, len, DMA_TO_DEVICE);
		if (dma_mapping_error(dev, busaddr))
937 938
			goto dma_err;
		map_single = true;
939
		be_tx_setup_wrb_frag(txo, busaddr, len);
940 941
		copied += len;
	}
S
Sathya Perla 已提交
942

943
	for (i = 0; i < skb_shinfo(skb)->nr_frags; i++) {
944
		const struct skb_frag_struct *frag = &skb_shinfo(skb)->frags[i];
945
		len = skb_frag_size(frag);
946

947
		busaddr = skb_frag_dma_map(dev, frag, 0, len, DMA_TO_DEVICE);
I
Ivan Vecera 已提交
948
		if (dma_mapping_error(dev, busaddr))
949
			goto dma_err;
950 951
		be_tx_setup_wrb_frag(txo, busaddr, len);
		copied += len;
S
Sathya Perla 已提交
952 953
	}

954
	be_tx_setup_wrb_hdr(adapter, txo, wrb_params, skb, head);
S
Sathya Perla 已提交
955

956 957
	be_tx_stats_update(txo, skb);
	return wrb_cnt;
S
Sathya Perla 已提交
958

959
dma_err:
960 961
	adapter->drv_stats.dma_map_errors++;
	be_xmit_restore(adapter, txo, head, map_single, copied);
962
	return 0;
S
Sathya Perla 已提交
963 964
}

965 966 967 968 969
/* Non-zero when BE_FLAGS_QNQ_ASYNC_EVT_RCVD is set in the adapter flags */
static inline int qnq_async_evt_rcvd(struct be_adapter *adapter)
{
	int evt_rcvd = adapter->flags & BE_FLAGS_QNQ_ASYNC_EVT_RCVD;

	return evt_rcvd;
}

970
static struct sk_buff *be_insert_vlan_in_pkt(struct be_adapter *adapter,
971
					     struct sk_buff *skb,
972 973
					     struct be_wrb_params
					     *wrb_params)
974 975 976 977 978 979 980
{
	u16 vlan_tag = 0;

	skb = skb_share_check(skb, GFP_ATOMIC);
	if (unlikely(!skb))
		return skb;

981
	if (skb_vlan_tag_present(skb))
982
		vlan_tag = be_get_tx_vlan_tag(adapter, skb);
983 984 985 986 987 988 989

	if (qnq_async_evt_rcvd(adapter) && adapter->pvid) {
		if (!vlan_tag)
			vlan_tag = adapter->pvid;
		/* f/w workaround to set skip_hw_vlan = 1, informs the F/W to
		 * skip VLAN insertion
		 */
990
		BE_WRB_F_SET(wrb_params->features, VLAN_SKIP_HW, 1);
991
	}
992 993

	if (vlan_tag) {
994 995
		skb = vlan_insert_tag_set_proto(skb, htons(ETH_P_8021Q),
						vlan_tag);
996 997 998 999 1000 1001 1002 1003
		if (unlikely(!skb))
			return skb;
		skb->vlan_tci = 0;
	}

	/* Insert the outer VLAN, if any */
	if (adapter->qnq_vid) {
		vlan_tag = adapter->qnq_vid;
1004 1005
		skb = vlan_insert_tag_set_proto(skb, htons(ETH_P_8021Q),
						vlan_tag);
1006 1007
		if (unlikely(!skb))
			return skb;
1008
		BE_WRB_F_SET(wrb_params->features, VLAN_SKIP_HW, 1);
1009 1010
	}

1011 1012 1013
	return skb;
}

1014 1015 1016 1017 1018 1019 1020 1021 1022 1023 1024 1025
static bool be_ipv6_exthdr_check(struct sk_buff *skb)
{
	struct ethhdr *eh = (struct ethhdr *)skb->data;
	u16 offset = ETH_HLEN;

	if (eh->h_proto == htons(ETH_P_IPV6)) {
		struct ipv6hdr *ip6h = (struct ipv6hdr *)(skb->data + offset);

		offset += sizeof(struct ipv6hdr);
		if (ip6h->nexthdr != NEXTHDR_TCP &&
		    ip6h->nexthdr != NEXTHDR_UDP) {
			struct ipv6_opt_hdr *ehdr =
K
Kalesh AP 已提交
1026
				(struct ipv6_opt_hdr *)(skb->data + offset);
1027 1028 1029 1030 1031 1032 1033 1034 1035 1036 1037

			/* offending pkt: 2nd byte following IPv6 hdr is 0xff */
			if (ehdr->hdrlen == 0xff)
				return true;
		}
	}
	return false;
}

static int be_vlan_tag_tx_chk(struct be_adapter *adapter, struct sk_buff *skb)
{
1038
	return skb_vlan_tag_present(skb) || adapter->pvid || adapter->qnq_vid;
1039 1040
}

1041
/* Returns 1 only on a BE3 chip for a packet flagged by
 * be_ipv6_exthdr_check(); 0 otherwise.
 */
static int be_ipv6_tx_stall_chk(struct be_adapter *adapter, struct sk_buff *skb)
{
	if (!BE3_chip(adapter))
		return 0;

	return be_ipv6_exthdr_check(skb) ? 1 : 0;
}

1046 1047
static struct sk_buff *be_lancer_xmit_workarounds(struct be_adapter *adapter,
						  struct sk_buff *skb,
1048 1049
						  struct be_wrb_params
						  *wrb_params)
S
Sathya Perla 已提交
1050
{
1051
	struct vlan_ethhdr *veh = (struct vlan_ethhdr *)skb->data;
1052 1053
	unsigned int eth_hdr_len;
	struct iphdr *ip;
1054

1055 1056
	/* For padded packets, BE HW modifies tot_len field in IP header
	 * incorrecly when VLAN tag is inserted by HW.
1057
	 * For padded packets, Lancer computes incorrect checksum.
1058
	 */
1059 1060
	eth_hdr_len = ntohs(skb->protocol) == ETH_P_8021Q ?
						VLAN_ETH_HLEN : ETH_HLEN;
1061
	if (skb->len <= 60 &&
1062
	    (lancer_chip(adapter) || skb_vlan_tag_present(skb)) &&
1063
	    is_ipv4_pkt(skb)) {
1064 1065 1066
		ip = (struct iphdr *)ip_hdr(skb);
		pskb_trim(skb, eth_hdr_len + ntohs(ip->tot_len));
	}
1067

1068
	/* If vlan tag is already inlined in the packet, skip HW VLAN
1069
	 * tagging in pvid-tagging mode
1070
	 */
1071
	if (be_pvid_tagging_enabled(adapter) &&
1072
	    veh->h_vlan_proto == htons(ETH_P_8021Q))
1073
		BE_WRB_F_SET(wrb_params->features, VLAN_SKIP_HW, 1);
1074

1075 1076 1077 1078 1079
	/* HW has a bug wherein it will calculate CSUM for VLAN
	 * pkts even though it is disabled.
	 * Manually insert VLAN in pkt.
	 */
	if (skb->ip_summed != CHECKSUM_PARTIAL &&
1080
	    skb_vlan_tag_present(skb)) {
1081
		skb = be_insert_vlan_in_pkt(adapter, skb, wrb_params);
1082
		if (unlikely(!skb))
1083
			goto err;
1084 1085 1086 1087 1088 1089 1090
	}

	/* HW may lockup when VLAN HW tagging is requested on
	 * certain ipv6 packets. Drop such pkts if the HW workaround to
	 * skip HW tagging is not enabled by FW.
	 */
	if (unlikely(be_ipv6_tx_stall_chk(adapter, skb) &&
K
Kalesh AP 已提交
1091 1092
		     (adapter->pvid || adapter->qnq_vid) &&
		     !qnq_async_evt_rcvd(adapter)))
1093 1094 1095 1096 1097 1098 1099 1100 1101 1102
		goto tx_drop;

	/* Manual VLAN tag insertion to prevent:
	 * ASIC lockup when the ASIC inserts VLAN tag into
	 * certain ipv6 packets. Insert VLAN tags in driver,
	 * and set event, completion, vlan bits accordingly
	 * in the Tx WRB.
	 */
	if (be_ipv6_tx_stall_chk(adapter, skb) &&
	    be_vlan_tag_tx_chk(adapter, skb)) {
1103
		skb = be_insert_vlan_in_pkt(adapter, skb, wrb_params);
1104
		if (unlikely(!skb))
1105
			goto err;
1106 1107
	}

1108 1109 1110
	return skb;
tx_drop:
	dev_kfree_skb_any(skb);
1111
err:
1112 1113 1114
	return NULL;
}

1115 1116
static struct sk_buff *be_xmit_workarounds(struct be_adapter *adapter,
					   struct sk_buff *skb,
1117
					   struct be_wrb_params *wrb_params)
1118 1119 1120 1121 1122 1123
{
	/* Lancer, SH-R ASICs have a bug wherein Packets that are 32 bytes or
	 * less may cause a transmit stall on that port. So the work-around is
	 * to pad short packets (<= 32 bytes) to a 36-byte length.
	 */
	if (unlikely(!BEx_chip(adapter) && skb->len <= 32)) {
1124
		if (skb_put_padto(skb, 36))
1125 1126 1127 1128
			return NULL;
	}

	if (BEx_chip(adapter) || lancer_chip(adapter)) {
1129
		skb = be_lancer_xmit_workarounds(adapter, skb, wrb_params);
1130 1131 1132 1133 1134 1135 1136
		if (!skb)
			return NULL;
	}

	return skb;
}

1137 1138 1139 1140 1141 1142 1143 1144 1145 1146 1147
static void be_xmit_flush(struct be_adapter *adapter, struct be_tx_obj *txo)
{
	struct be_queue_info *txq = &txo->q;
	struct be_eth_hdr_wrb *hdr = queue_index_node(txq, txo->last_req_hdr);

	/* Mark the last request eventable if it hasn't been marked already */
	if (!(hdr->dw[2] & cpu_to_le32(TX_HDR_WRB_EVT)))
		hdr->dw[2] |= cpu_to_le32(TX_HDR_WRB_EVT | TX_HDR_WRB_COMPL);

	/* compose a dummy wrb if there are odd set of wrbs to notify */
	if (!lancer_chip(adapter) && (txo->pend_wrb_cnt & 1)) {
1148
		wrb_fill_dummy(queue_head_node(txq));
1149 1150 1151 1152 1153 1154 1155 1156 1157 1158 1159 1160
		queue_head_inc(txq);
		atomic_inc(&txq->used);
		txo->pend_wrb_cnt++;
		hdr->dw[2] &= ~cpu_to_le32(TX_HDR_WRB_NUM_MASK <<
					   TX_HDR_WRB_NUM_SHIFT);
		hdr->dw[2] |= cpu_to_le32((txo->last_req_wrb_cnt + 1) <<
					  TX_HDR_WRB_NUM_SHIFT);
	}
	be_txq_notify(adapter, txo, txo->pend_wrb_cnt);
	txo->pend_wrb_cnt = 0;
}

V
Venkata Duvvuru 已提交
1161 1162 1163 1164 1165 1166 1167 1168 1169 1170 1171 1172 1173 1174 1175 1176 1177 1178 1179 1180 1181 1182 1183 1184 1185 1186 1187 1188 1189 1190 1191 1192 1193 1194 1195 1196 1197 1198 1199 1200 1201 1202 1203 1204 1205 1206 1207 1208 1209 1210 1211 1212 1213 1214 1215 1216 1217 1218 1219 1220 1221 1222 1223 1224 1225 1226 1227 1228 1229 1230 1231 1232 1233 1234 1235 1236 1237 1238 1239 1240 1241 1242 1243 1244 1245 1246 1247 1248 1249 1250 1251 1252 1253 1254 1255 1256 1257 1258 1259 1260 1261 1262 1263 1264 1265 1266 1267 1268 1269 1270 1271 1272 1273 1274 1275 1276 1277 1278 1279 1280 1281 1282 1283 1284
/* OS2BMC related */

/* UDP destination ports (host byte order) matched against the BMC filters */
#define DHCP_CLIENT_PORT	68
#define DHCP_SERVER_PORT	67
#define NET_BIOS_PORT1		137
#define NET_BIOS_PORT2		138
#define DHCPV6_RAS_PORT		547

/* Macro arguments are parenthesised so that expressions such as (*skb) or
 * &obj can be passed safely.
 */
#define is_mc_allowed_on_bmc(adapter, eh)	\
	(!is_multicast_filt_enabled(adapter) &&	\
	 is_multicast_ether_addr((eh)->h_dest) &&	\
	 !is_broadcast_ether_addr((eh)->h_dest))

#define is_bc_allowed_on_bmc(adapter, eh)	\
	(!is_broadcast_filt_enabled(adapter) &&	\
	 is_broadcast_ether_addr((eh)->h_dest))

#define is_arp_allowed_on_bmc(adapter, skb)	\
	(is_arp(skb) && is_arp_filt_enabled(adapter))

/* ether_addr_equal() replaces the obsolete !compare_ether_addr() form */
#define is_broadcast_packet(eh, adapter)	\
		(is_multicast_ether_addr((eh)->h_dest) && \
		ether_addr_equal((eh)->h_dest, (adapter)->netdev->broadcast))

#define is_arp(skb)	((skb)->protocol == htons(ETH_P_ARP))

/* Each helper below tests one bit of the adapter's bmc_filt_mask */
#define is_arp_filt_enabled(adapter)	\
		((adapter)->bmc_filt_mask & (BMC_FILT_BROADCAST_ARP))

#define is_dhcp_client_filt_enabled(adapter)	\
		((adapter)->bmc_filt_mask & BMC_FILT_BROADCAST_DHCP_CLIENT)

#define is_dhcp_srvr_filt_enabled(adapter)	\
		((adapter)->bmc_filt_mask & BMC_FILT_BROADCAST_DHCP_SERVER)

#define is_nbios_filt_enabled(adapter)	\
		((adapter)->bmc_filt_mask & BMC_FILT_BROADCAST_NET_BIOS)

#define is_ipv6_na_filt_enabled(adapter)	\
		((adapter)->bmc_filt_mask &	\
			BMC_FILT_MULTICAST_IPV6_NEIGH_ADVER)

#define is_ipv6_ra_filt_enabled(adapter)	\
		((adapter)->bmc_filt_mask & BMC_FILT_MULTICAST_IPV6_RA)

#define is_ipv6_ras_filt_enabled(adapter)	\
		((adapter)->bmc_filt_mask & BMC_FILT_MULTICAST_IPV6_RAS)

#define is_broadcast_filt_enabled(adapter)	\
		((adapter)->bmc_filt_mask & BMC_FILT_BROADCAST)

#define is_multicast_filt_enabled(adapter)	\
		((adapter)->bmc_filt_mask & BMC_FILT_MULTICAST)

static bool be_send_pkt_to_bmc(struct be_adapter *adapter,
			       struct sk_buff **skb)
{
	struct ethhdr *eh = (struct ethhdr *)(*skb)->data;
	bool os2bmc = false;

	if (!be_is_os2bmc_enabled(adapter))
		goto done;

	if (!is_multicast_ether_addr(eh->h_dest))
		goto done;

	if (is_mc_allowed_on_bmc(adapter, eh) ||
	    is_bc_allowed_on_bmc(adapter, eh) ||
	    is_arp_allowed_on_bmc(adapter, (*skb))) {
		os2bmc = true;
		goto done;
	}

	if ((*skb)->protocol == htons(ETH_P_IPV6)) {
		struct ipv6hdr *hdr = ipv6_hdr((*skb));
		u8 nexthdr = hdr->nexthdr;

		if (nexthdr == IPPROTO_ICMPV6) {
			struct icmp6hdr *icmp6 = icmp6_hdr((*skb));

			switch (icmp6->icmp6_type) {
			case NDISC_ROUTER_ADVERTISEMENT:
				os2bmc = is_ipv6_ra_filt_enabled(adapter);
				goto done;
			case NDISC_NEIGHBOUR_ADVERTISEMENT:
				os2bmc = is_ipv6_na_filt_enabled(adapter);
				goto done;
			default:
				break;
			}
		}
	}

	if (is_udp_pkt((*skb))) {
		struct udphdr *udp = udp_hdr((*skb));

		switch (udp->dest) {
		case DHCP_CLIENT_PORT:
			os2bmc = is_dhcp_client_filt_enabled(adapter);
			goto done;
		case DHCP_SERVER_PORT:
			os2bmc = is_dhcp_srvr_filt_enabled(adapter);
			goto done;
		case NET_BIOS_PORT1:
		case NET_BIOS_PORT2:
			os2bmc = is_nbios_filt_enabled(adapter);
			goto done;
		case DHCPV6_RAS_PORT:
			os2bmc = is_ipv6_ras_filt_enabled(adapter);
			goto done;
		default:
			break;
		}
	}
done:
	/* For packets over a vlan, which are destined
	 * to BMC, asic expects the vlan to be inline in the packet.
	 */
	if (os2bmc)
		*skb = be_insert_vlan_in_pkt(adapter, *skb, NULL);

	return os2bmc;
}

1285 1286 1287
static netdev_tx_t be_xmit(struct sk_buff *skb, struct net_device *netdev)
{
	struct be_adapter *adapter = netdev_priv(netdev);
1288 1289
	u16 q_idx = skb_get_queue_mapping(skb);
	struct be_tx_obj *txo = &adapter->tx_obj[q_idx];
1290 1291
	struct be_wrb_params wrb_params = { 0 };
	bool flush = !skb->xmit_more;
1292
	u16 wrb_cnt;
1293

1294
	skb = be_xmit_workarounds(adapter, skb, &wrb_params);
1295 1296
	if (unlikely(!skb))
		goto drop;
S
Sathya Perla 已提交
1297

1298 1299 1300
	be_get_wrb_params_from_skb(adapter, skb, &wrb_params);

	wrb_cnt = be_xmit_enqueue(adapter, txo, skb, &wrb_params);
1301 1302 1303 1304
	if (unlikely(!wrb_cnt)) {
		dev_kfree_skb_any(skb);
		goto drop;
	}
E
Eric Dumazet 已提交
1305

V
Venkata Duvvuru 已提交
1306 1307 1308 1309 1310 1311 1312 1313 1314 1315 1316 1317
	/* if os2bmc is enabled and if the pkt is destined to bmc,
	 * enqueue the pkt a 2nd time with mgmt bit set.
	 */
	if (be_send_pkt_to_bmc(adapter, &skb)) {
		BE_WRB_F_SET(wrb_params.features, OS2BMC, 1);
		wrb_cnt = be_xmit_enqueue(adapter, txo, skb, &wrb_params);
		if (unlikely(!wrb_cnt))
			goto drop;
		else
			skb_get(skb);
	}

1318
	if (be_is_txq_full(txo)) {
1319 1320 1321
		netif_stop_subqueue(netdev, q_idx);
		tx_stats(txo)->tx_stops++;
	}
1322

1323 1324
	if (flush || __netif_subqueue_stopped(netdev, q_idx))
		be_xmit_flush(adapter, txo);
S
Sathya Perla 已提交
1325

1326 1327 1328 1329 1330 1331
	return NETDEV_TX_OK;
drop:
	tx_stats(txo)->tx_drv_drops++;
	/* Flush the already enqueued tx requests */
	if (flush && txo->pend_wrb_cnt)
		be_xmit_flush(adapter, txo);
S
Sathya Perla 已提交
1332 1333 1334 1335 1336 1337 1338

	return NETDEV_TX_OK;
}

static int be_change_mtu(struct net_device *netdev, int new_mtu)
{
	struct be_adapter *adapter = netdev_priv(netdev);
K
Kalesh AP 已提交
1339 1340 1341 1342 1343
	struct device *dev = &adapter->pdev->dev;

	if (new_mtu < BE_MIN_MTU || new_mtu > BE_MAX_MTU) {
		dev_info(dev, "MTU must be between %d and %d bytes\n",
			 BE_MIN_MTU, BE_MAX_MTU);
S
Sathya Perla 已提交
1344 1345
		return -EINVAL;
	}
K
Kalesh AP 已提交
1346 1347

	dev_info(dev, "MTU changed from %d to %d bytes\n",
1348
		 netdev->mtu, new_mtu);
S
Sathya Perla 已提交
1349 1350 1351 1352
	netdev->mtu = new_mtu;
	return 0;
}

1353 1354 1355 1356 1357 1358 1359 1360 1361 1362 1363 1364 1365 1366 1367 1368 1369 1370 1371 1372 1373 1374 1375 1376 1377 1378 1379 1380 1381 1382 1383 1384 1385 1386 1387 1388 1389
static inline bool be_in_all_promisc(struct be_adapter *adapter)
{
	return (adapter->if_flags & BE_IF_FLAGS_ALL_PROMISCUOUS) ==
			BE_IF_FLAGS_ALL_PROMISCUOUS;
}

/* Turn on VLAN promiscuous mode unless if_flags shows it is already on.
 * Returns 0 on success or the status of the rx-filter command.
 */
static int be_set_vlan_promisc(struct be_adapter *adapter)
{
	struct device *dev = &adapter->pdev->dev;
	int status;

	if (adapter->if_flags & BE_IF_FLAGS_VLAN_PROMISCUOUS)
		return 0;

	status = be_cmd_rx_filter(adapter, BE_IF_FLAGS_VLAN_PROMISCUOUS, ON);
	if (status) {
		dev_err(dev, "Failed to enable VLAN promiscuous mode\n");
		return status;
	}

	dev_info(dev, "Enabled VLAN promiscuous mode\n");
	adapter->if_flags |= BE_IF_FLAGS_VLAN_PROMISCUOUS;

	return status;
}

/* Turn off VLAN promiscuous mode; the if_flags bit is cleared only when the
 * rx-filter command succeeds. Returns the command status.
 */
static int be_clear_vlan_promisc(struct be_adapter *adapter)
{
	struct device *dev = &adapter->pdev->dev;
	int status;

	status = be_cmd_rx_filter(adapter, BE_IF_FLAGS_VLAN_PROMISCUOUS, OFF);
	if (status)
		return status;

	dev_info(dev, "Disabling VLAN promiscuous mode\n");
	adapter->if_flags &= ~BE_IF_FLAGS_VLAN_PROMISCUOUS;

	return status;
}

S
Sathya Perla 已提交
1390
/*
1391 1392
 * A max of 64 (BE_NUM_VLANS_SUPPORTED) vlans can be configured in BE.
 * If the user configures more, place BE in vlan promiscuous mode.
S
Sathya Perla 已提交
1393
 */
S
Sathya Perla 已提交
1394
static int be_vid_config(struct be_adapter *adapter)
S
Sathya Perla 已提交
1395
{
V
Vasundhara Volam 已提交
1396
	struct device *dev = &adapter->pdev->dev;
S
Sathya Perla 已提交
1397
	u16 vids[BE_NUM_VLANS_SUPPORTED];
1398
	u16 num = 0, i = 0;
1399
	int status = 0;
1400

1401
	/* No need to further configure vids if in promiscuous mode */
1402
	if (be_in_all_promisc(adapter))
1403 1404
		return 0;

1405
	if (adapter->vlans_added > be_max_vlans(adapter))
1406
		return be_set_vlan_promisc(adapter);
1407 1408

	/* Construct VLAN Table to give to HW */
1409 1410
	for_each_set_bit(i, adapter->vids, VLAN_N_VID)
		vids[num++] = cpu_to_le16(i);
1411

1412
	status = be_cmd_vlan_config(adapter, adapter->if_handle, vids, num, 0);
1413
	if (status) {
1414
		dev_err(dev, "Setting HW VLAN filtering failed\n");
1415
		/* Set to VLAN promisc mode as setting VLAN filter failed */
1416 1417
		if (addl_status(status) == MCC_ADDL_STATUS_INSUFFICIENT_VLANS ||
		    addl_status(status) ==
1418
				MCC_ADDL_STATUS_INSUFFICIENT_RESOURCES)
1419 1420 1421
			return be_set_vlan_promisc(adapter);
	} else if (adapter->if_flags & BE_IF_FLAGS_VLAN_PROMISCUOUS) {
		status = be_clear_vlan_promisc(adapter);
S
Sathya Perla 已提交
1422
	}
1423
	return status;
S
Sathya Perla 已提交
1424 1425
}

1426
/* Register @vid in adapter->vids and reprogram the HW VLAN configuration.
 * The bookkeeping is rolled back if be_vid_config() fails. Returns 0 on
 * success (or when nothing needed to be done), else the be_vid_config()
 * status.
 */
static int be_vlan_add_vid(struct net_device *netdev, __be16 proto, u16 vid)
{
	struct be_adapter *adapter = netdev_priv(netdev);
	int status;

	/* Packets with VID 0 are always received by Lancer by default */
	if (lancer_chip(adapter) && vid == 0)
		return 0;

	/* already registered */
	if (test_bit(vid, adapter->vids))
		return 0;

	set_bit(vid, adapter->vids);
	adapter->vlans_added++;

	status = be_vid_config(adapter);
	if (!status)
		return 0;

	/* undo the bookkeeping done above */
	adapter->vlans_added--;
	clear_bit(vid, adapter->vids);

	return status;
}

1450
/* Unregister @vid from adapter->vids and reprogram the HW VLAN
 * configuration. Returns 0 when there is nothing to remove, otherwise the
 * be_vid_config() status.
 */
static int be_vlan_rem_vid(struct net_device *netdev, __be16 proto, u16 vid)
{
	struct be_adapter *adapter = netdev_priv(netdev);

	/* Packets with VID 0 are always received by Lancer by default */
	if (lancer_chip(adapter) && vid == 0)
		return 0;

	/* Only VIDs that be_vlan_add_vid() registered are counted in
	 * vlans_added; removing any other VID must not decrement it.
	 */
	if (!test_bit(vid, adapter->vids))
		return 0;

	clear_bit(vid, adapter->vids);
	adapter->vlans_added--;

	return be_vid_config(adapter);
}

1464
static void be_clear_all_promisc(struct be_adapter *adapter)
1465
{
1466
	be_cmd_rx_filter(adapter, BE_IF_FLAGS_ALL_PROMISCUOUS, OFF);
1467
	adapter->if_flags &= ~BE_IF_FLAGS_ALL_PROMISCUOUS;
1468 1469
}

1470 1471 1472 1473 1474 1475 1476
/* Issue the rx-filter command turning all-promiscuous mode ON and set the
 * matching if_flags bits; the command status is not checked.
 */
static void be_set_all_promisc(struct be_adapter *adapter)
{
	be_cmd_rx_filter(adapter, BE_IF_FLAGS_ALL_PROMISCUOUS, ON);
	adapter->if_flags = adapter->if_flags | BE_IF_FLAGS_ALL_PROMISCUOUS;
}

static void be_set_mc_promisc(struct be_adapter *adapter)
S
Sathya Perla 已提交
1477
{
1478
	int status;
S
Sathya Perla 已提交
1479

1480 1481
	if (adapter->if_flags & BE_IF_FLAGS_MCAST_PROMISCUOUS)
		return;
S
Sathya Perla 已提交
1482

1483 1484 1485 1486 1487 1488 1489 1490 1491 1492 1493 1494 1495 1496 1497 1498 1499 1500 1501 1502 1503 1504 1505 1506 1507 1508 1509 1510
	status = be_cmd_rx_filter(adapter, BE_IF_FLAGS_MCAST_PROMISCUOUS, ON);
	if (!status)
		adapter->if_flags |= BE_IF_FLAGS_MCAST_PROMISCUOUS;
}

/* Issue the BE_IF_FLAGS_MULTICAST rx-filter command. On success the
 * multicast-promiscuous flag is cleared; on failure fall back to multicast
 * promiscuous mode.
 */
static void be_set_mc_list(struct be_adapter *adapter)
{
	if (be_cmd_rx_filter(adapter, BE_IF_FLAGS_MULTICAST, ON)) {
		be_set_mc_promisc(adapter);
		return;
	}

	adapter->if_flags &= ~BE_IF_FLAGS_MCAST_PROMISCUOUS;
}

static void be_set_uc_list(struct be_adapter *adapter)
{
	struct netdev_hw_addr *ha;
	int i = 1; /* First slot is claimed by the Primary MAC */

	for (; adapter->uc_macs > 0; adapter->uc_macs--, i++)
		be_cmd_pmac_del(adapter, adapter->if_handle,
				adapter->pmac_id[i], 0);

	if (netdev_uc_count(adapter->netdev) > be_max_uc(adapter)) {
		be_set_all_promisc(adapter);
		return;
S
Sathya Perla 已提交
1511 1512
	}

1513 1514 1515 1516 1517 1518
	netdev_for_each_uc_addr(ha, adapter->netdev) {
		adapter->uc_macs++; /* First slot is for Primary MAC */
		be_cmd_pmac_add(adapter, (u8 *)ha->addr, adapter->if_handle,
				&adapter->pmac_id[adapter->uc_macs], 0);
	}
}
S
Sathya Perla 已提交
1519

1520 1521 1522
/* Delete the pmac entries in slots 1..uc_macs (slot 0 is left untouched)
 * and reset the uc_macs count.
 */
static void be_clear_uc_list(struct be_adapter *adapter)
{
	int slot = 1;

	while (slot < (adapter->uc_macs + 1)) {
		be_cmd_pmac_del(adapter, adapter->if_handle,
				adapter->pmac_id[slot], 0);
		slot++;
	}

	adapter->uc_macs = 0;
}
1529

1530 1531 1532
static void be_set_rx_mode(struct net_device *netdev)
{
	struct be_adapter *adapter = netdev_priv(netdev);
1533

1534 1535 1536
	if (netdev->flags & IFF_PROMISC) {
		be_set_all_promisc(adapter);
		return;
1537 1538
	}

1539 1540 1541 1542 1543
	/* Interface was previously in promiscuous mode; disable it */
	if (be_in_all_promisc(adapter)) {
		be_clear_all_promisc(adapter);
		if (adapter->vlans_added)
			be_vid_config(adapter);
1544
	}
1545

1546 1547 1548 1549
	/* Enable multicast promisc if num configured exceeds what we support */
	if (netdev->flags & IFF_ALLMULTI ||
	    netdev_mc_count(netdev) > be_max_mc(adapter)) {
		be_set_mc_promisc(adapter);
1550
		return;
1551
	}
1552

1553 1554 1555 1556
	if (netdev_uc_count(netdev) != adapter->uc_macs)
		be_set_uc_list(adapter);

	be_set_mc_list(adapter);
S
Sathya Perla 已提交
1557 1558
}

1559 1560 1561
/* Program @mac as the MAC address of VF @vf.
 *
 * Returns -EPERM when SR-IOV is not enabled, -EINVAL for an invalid MAC or
 * VF index, 0 when @mac is already the active MAC or the change succeeded,
 * or the be_cmd_status() translation of the FW command status.
 */
static int be_set_vf_mac(struct net_device *netdev, int vf, u8 *mac)
{
	struct be_adapter *adapter = netdev_priv(netdev);
	struct be_vf_cfg *vf_cfg;
	int status;

	if (!sriov_enabled(adapter))
		return -EPERM;

	if (!is_valid_ether_addr(mac) || vf >= adapter->num_vfs)
		return -EINVAL;

	/* index the VF table only after @vf has been validated */
	vf_cfg = &adapter->vf_cfg[vf];

	/* Proceed further only if user provided MAC is different
	 * from active MAC
	 */
	if (ether_addr_equal(mac, vf_cfg->mac_addr))
		return 0;

	if (BEx_chip(adapter)) {
		be_cmd_pmac_del(adapter, vf_cfg->if_handle, vf_cfg->pmac_id,
				vf + 1);

		status = be_cmd_pmac_add(adapter, mac, vf_cfg->if_handle,
					 &vf_cfg->pmac_id, vf + 1);
	} else {
		status = be_cmd_set_mac(adapter, mac, vf_cfg->if_handle,
					vf + 1);
	}

	if (status) {
		dev_err(&adapter->pdev->dev,
			"MAC %pM set on VF %d Failed: %#x\n",
			mac, vf, status);
		return be_cmd_status(status);
	}

	ether_addr_copy(vf_cfg->mac_addr, mac);

	return 0;
}

1599
static int be_get_vf_config(struct net_device *netdev, int vf,
1600
			    struct ifla_vf_info *vi)
1601 1602
{
	struct be_adapter *adapter = netdev_priv(netdev);
1603
	struct be_vf_cfg *vf_cfg = &adapter->vf_cfg[vf];
1604

1605
	if (!sriov_enabled(adapter))
1606 1607
		return -EPERM;

1608
	if (vf >= adapter->num_vfs)
1609 1610 1611
		return -EINVAL;

	vi->vf = vf;
1612 1613
	vi->max_tx_rate = vf_cfg->tx_rate;
	vi->min_tx_rate = 0;
1614 1615
	vi->vlan = vf_cfg->vlan_tag & VLAN_VID_MASK;
	vi->qos = vf_cfg->vlan_tag >> VLAN_PRIO_SHIFT;
1616
	memcpy(&vi->mac, vf_cfg->mac_addr, ETH_ALEN);
1617
	vi->linkstate = adapter->vf_cfg[vf].plink_tracking;
1618
	vi->spoofchk = adapter->vf_cfg[vf].spoofchk;
1619 1620 1621 1622

	return 0;
}

1623 1624 1625 1626 1627 1628 1629 1630
/* Enable Transparent VLAN Tagging with tag @vlan on VF @vf.
 *
 * Returns the status of the hsw-config command if it fails, 0 otherwise.
 * The follow-up steps (clearing guest VLAN filters, revoking FILTMGMT) do
 * not affect the return value.
 */
static int be_set_vf_tvt(struct be_adapter *adapter, int vf, u16 vlan)
{
	struct be_vf_cfg *vf_cfg = &adapter->vf_cfg[vf];
	u16 vids[BE_NUM_VLANS_SUPPORTED];
	int vf_if_id = vf_cfg->if_handle;
	int status;

	/* Enable Transparent VLAN Tagging */
	status = be_cmd_set_hsw_config(adapter, vlan, vf + 1, vf_if_id, 0, 0);
	if (status)
		return status;

	/* Clear pre-programmed VLAN filters on VF if any, if TVT is enabled */
	vids[0] = 0;
	status = be_cmd_vlan_config(adapter, vf_if_id, vids, 1, vf + 1);
	if (!status)
		dev_info(&adapter->pdev->dev,
			 "Cleared guest VLANs on VF%d\n", vf);

	/* After TVT is enabled, disallow VFs to program VLAN filters */
	if (vf_cfg->privileges & BE_PRIV_FILTMGMT) {
		status = be_cmd_set_fn_privileges(adapter, vf_cfg->privileges &
						  ~BE_PRIV_FILTMGMT, vf + 1);
		/* cache the new privileges only if the FW accepted them */
		if (!status)
			vf_cfg->privileges &= ~BE_PRIV_FILTMGMT;
	}
	return 0;
}

/* Disable Transparent VLAN Tagging on VF @vf.
 *
 * Returns the status of the hsw-config command if it fails, 0 otherwise.
 * A failure to restore the FILTMGMT privilege does not affect the return
 * value.
 */
static int be_clear_vf_tvt(struct be_adapter *adapter, int vf)
{
	struct be_vf_cfg *vf_cfg = &adapter->vf_cfg[vf];
	struct device *dev = &adapter->pdev->dev;
	int status;

	/* Reset Transparent VLAN Tagging. */
	status = be_cmd_set_hsw_config(adapter, BE_RESET_VLAN_TAG_ID, vf + 1,
				       vf_cfg->if_handle, 0, 0);
	if (status)
		return status;

	/* Allow VFs to program VLAN filtering */
	if (!(vf_cfg->privileges & BE_PRIV_FILTMGMT)) {
		status = be_cmd_set_fn_privileges(adapter, vf_cfg->privileges |
						  BE_PRIV_FILTMGMT, vf + 1);
		/* cache the new privileges only if the FW accepted them */
		if (!status) {
			vf_cfg->privileges |= BE_PRIV_FILTMGMT;
			dev_info(dev, "VF%d: FILTMGMT priv enabled\n", vf);
		}
	}

	dev_info(dev,
		 "Disable/re-enable i/f in VM to clear Transparent VLAN tag\n");
	return 0;
}

1679
/* Configure (or, when both @vlan and @qos are 0, clear) transparent VLAN
 * tagging for VF @vf. Returns -EPERM when SR-IOV is not enabled, -EINVAL
 * for out-of-range arguments, 0 on success, or the be_cmd_status()
 * translation of a failed command.
 */
static int be_set_vf_vlan(struct net_device *netdev, int vf, u16 vlan, u8 qos)
{
	struct be_adapter *adapter = netdev_priv(netdev);
	struct be_vf_cfg *cfg;
	int status;

	if (!sriov_enabled(adapter))
		return -EPERM;

	if (vf >= adapter->num_vfs || vlan > 4095 || qos > 7)
		return -EINVAL;

	cfg = &adapter->vf_cfg[vf];

	/* Fold the priority into the tag; the result is zero only when both
	 * vlan and qos are zero, which is the "clear" request.
	 */
	vlan |= qos << VLAN_PRIO_SHIFT;
	if (vlan)
		status = be_set_vf_tvt(adapter, vf, vlan);
	else
		status = be_clear_vf_tvt(adapter, vf);

	if (status) {
		dev_err(&adapter->pdev->dev,
			"VLAN %d config on VF %d failed : %#x\n", vlan, vf,
			status);
		return be_cmd_status(status);
	}

	cfg->vlan_tag = vlan;
	return 0;
}

1709 1710
static int be_set_vf_tx_rate(struct net_device *netdev, int vf,
			     int min_tx_rate, int max_tx_rate)
1711 1712
{
	struct be_adapter *adapter = netdev_priv(netdev);
1713 1714 1715 1716
	struct device *dev = &adapter->pdev->dev;
	int percent_rate, status = 0;
	u16 link_speed = 0;
	u8 link_status;
1717

1718
	if (!sriov_enabled(adapter))
1719 1720
		return -EPERM;

1721
	if (vf >= adapter->num_vfs)
1722 1723
		return -EINVAL;

1724 1725 1726
	if (min_tx_rate)
		return -EINVAL;

1727 1728 1729 1730 1731 1732 1733 1734 1735 1736
	if (!max_tx_rate)
		goto config_qos;

	status = be_cmd_link_status_query(adapter, &link_speed,
					  &link_status, 0);
	if (status)
		goto err;

	if (!link_status) {
		dev_err(dev, "TX-rate setting not allowed when link is down\n");
1737
		status = -ENETDOWN;
1738 1739 1740 1741 1742 1743 1744 1745 1746 1747 1748 1749 1750 1751 1752 1753 1754
		goto err;
	}

	if (max_tx_rate < 100 || max_tx_rate > link_speed) {
		dev_err(dev, "TX-rate must be between 100 and %d Mbps\n",
			link_speed);
		status = -EINVAL;
		goto err;
	}

	/* On Skyhawk the QOS setting must be done only as a % value */
	percent_rate = link_speed / 100;
	if (skyhawk_chip(adapter) && (max_tx_rate % percent_rate)) {
		dev_err(dev, "TX-rate must be a multiple of %d Mbps\n",
			percent_rate);
		status = -EINVAL;
		goto err;
1755
	}
1756

1757 1758
config_qos:
	status = be_cmd_config_qos(adapter, max_tx_rate, link_speed, vf + 1);
1759
	if (status)
1760 1761 1762 1763 1764 1765 1766 1767
		goto err;

	adapter->vf_cfg[vf].tx_rate = max_tx_rate;
	return 0;

err:
	dev_err(dev, "TX-rate setting of %dMbps on VF%d failed\n",
		max_tx_rate, vf);
1768
	return be_cmd_status(status);
1769
}
1770

1771 1772 1773 1774 1775 1776 1777 1778 1779 1780 1781 1782 1783
/* Set the logical link state of VF @vf and cache it in plink_tracking.
 * Returns -EPERM when SR-IOV is not enabled, -EINVAL for a bad VF index,
 * 0 on success, or the be_cmd_status() translation of a failed command.
 */
static int be_set_vf_link_state(struct net_device *netdev, int vf,
				int link_state)
{
	struct be_adapter *adapter = netdev_priv(netdev);
	int status;

	if (!sriov_enabled(adapter))
		return -EPERM;

	if (vf >= adapter->num_vfs)
		return -EINVAL;

	status = be_cmd_set_logical_link_config(adapter, link_state, vf + 1);
	if (!status) {
		adapter->vf_cfg[vf].plink_tracking = link_state;
		return 0;
	}

	dev_err(&adapter->pdev->dev,
		"Link state change on VF %d failed: %#x\n", vf, status);
	return be_cmd_status(status);
}
1794

1795 1796 1797 1798 1799 1800 1801 1802 1803 1804 1805 1806 1807 1808 1809 1810 1811 1812 1813 1814 1815 1816 1817 1818 1819 1820 1821 1822 1823 1824 1825 1826 1827
/* Enable or disable MAC spoof checking on VF @vf.
 * Returns -EPERM when SR-IOV is not enabled, -EINVAL for a bad VF index,
 * -EOPNOTSUPP on BEx chips, 0 when nothing changes or on success, or the
 * be_cmd_status() translation of a failed command.
 */
static int be_set_vf_spoofchk(struct net_device *netdev, int vf, bool enable)
{
	struct be_adapter *adapter = netdev_priv(netdev);
	struct be_vf_cfg *cfg;
	u8 spoofchk;
	int status;

	if (!sriov_enabled(adapter))
		return -EPERM;

	if (vf >= adapter->num_vfs)
		return -EINVAL;

	if (BEx_chip(adapter))
		return -EOPNOTSUPP;

	cfg = &adapter->vf_cfg[vf];
	if (enable == cfg->spoofchk)
		return 0;

	if (enable)
		spoofchk = ENABLE_MAC_SPOOFCHK;
	else
		spoofchk = DISABLE_MAC_SPOOFCHK;

	status = be_cmd_set_hsw_config(adapter, 0, vf + 1, cfg->if_handle,
				       0, spoofchk);
	if (status) {
		dev_err(&adapter->pdev->dev,
			"Spoofchk change on VF %d failed: %#x\n", vf, status);
		return be_cmd_status(status);
	}

	cfg->spoofchk = enable;
	return 0;
}

1828 1829
/* Store the packet counters and timestamp that the next rate computation
 * will be measured against.
 */
static void be_aic_update(struct be_aic_obj *aic, u64 rx_pkts, u64 tx_pkts,
			  ulong now)
{
	aic->jiffies = now;
	aic->rx_pkts_prev = rx_pkts;
	aic->tx_reqs_prev = tx_pkts;
}
1835

1836
static int be_get_new_eqd(struct be_eq_obj *eqo)
1837
{
1838 1839
	struct be_adapter *adapter = eqo->adapter;
	int eqd, start;
1840 1841 1842
	struct be_aic_obj *aic;
	struct be_rx_obj *rxo;
	struct be_tx_obj *txo;
1843
	u64 rx_pkts = 0, tx_pkts = 0;
1844 1845
	ulong now;
	u32 pps, delta;
1846
	int i;
S
Sathya Perla 已提交
1847

1848 1849 1850 1851 1852 1853 1854
	aic = &adapter->aic_obj[eqo->idx];
	if (!aic->enable) {
		if (aic->jiffies)
			aic->jiffies = 0;
		eqd = aic->et_eqd;
		return eqd;
	}
S
Sathya Perla 已提交
1855

1856
	for_all_rx_queues_on_eq(adapter, eqo, rxo, i) {
1857
		do {
1858
			start = u64_stats_fetch_begin_irq(&rxo->stats.sync);
1859
			rx_pkts += rxo->stats.rx_pkts;
1860
		} while (u64_stats_fetch_retry_irq(&rxo->stats.sync, start));
1861
	}
S
Sathya Perla 已提交
1862

1863
	for_all_tx_queues_on_eq(adapter, eqo, txo, i) {
1864
		do {
1865
			start = u64_stats_fetch_begin_irq(&txo->stats.sync);
1866
			tx_pkts += txo->stats.tx_reqs;
1867
		} while (u64_stats_fetch_retry_irq(&txo->stats.sync, start));
1868
	}
S
Sathya Perla 已提交
1869

1870 1871 1872 1873 1874 1875 1876 1877
	/* Skip, if wrapped around or first calculation */
	now = jiffies;
	if (!aic->jiffies || time_before(now, aic->jiffies) ||
	    rx_pkts < aic->rx_pkts_prev ||
	    tx_pkts < aic->tx_reqs_prev) {
		be_aic_update(aic, rx_pkts, tx_pkts, now);
		return aic->prev_eqd;
	}
1878

1879 1880 1881
	delta = jiffies_to_msecs(now - aic->jiffies);
	if (delta == 0)
		return aic->prev_eqd;
S
Sathya Perla 已提交
1882

1883 1884 1885
	pps = (((u32)(rx_pkts - aic->rx_pkts_prev) * 1000) / delta) +
		(((u32)(tx_pkts - aic->tx_reqs_prev) * 1000) / delta);
	eqd = (pps / 15000) << 2;
1886

1887 1888 1889 1890 1891 1892 1893 1894 1895 1896 1897 1898 1899 1900 1901 1902 1903 1904 1905 1906 1907 1908 1909 1910 1911 1912 1913 1914 1915 1916 1917 1918 1919 1920 1921 1922 1923 1924 1925 1926 1927 1928 1929 1930 1931 1932 1933 1934 1935 1936 1937 1938 1939
	if (eqd < 8)
		eqd = 0;
	eqd = min_t(u32, eqd, aic->max_eqd);
	eqd = max_t(u32, eqd, aic->min_eqd);

	be_aic_update(aic, rx_pkts, tx_pkts, now);

	return eqd;
}

/* For Skyhawk-R only.
 * Map the event-queue delay of @eqo onto one of the R2I_DLY_ENC_* values
 * and remember the delay in aic->prev_eqd. Returns 0 when adaptive
 * coalescing is disabled.
 */
static u32 be_get_eq_delay_mult_enc(struct be_eq_obj *eqo)
{
	struct be_adapter *adapter = eqo->adapter;
	struct be_aic_obj *aic = &adapter->aic_obj[eqo->idx];
	ulong now = jiffies;
	u32 mult_enc;
	int eqd;

	if (!aic->enable)
		return 0;

	/* reuse the previous delay when less than 1 ms has elapsed */
	if (time_before_eq(now, aic->jiffies) ||
	    jiffies_to_msecs(now - aic->jiffies) < 1)
		eqd = aic->prev_eqd;
	else
		eqd = be_get_new_eqd(eqo);

	if (eqd <= 20)
		mult_enc = R2I_DLY_ENC_0;
	else if (eqd <= 60)
		mult_enc = R2I_DLY_ENC_3;
	else if (eqd <= 100)
		mult_enc = R2I_DLY_ENC_2;
	else
		mult_enc = R2I_DLY_ENC_1;

	aic->prev_eqd = eqd;

	return mult_enc;
}

/* Recompute the delay of every event queue and hand the entries whose
 * delay changed (or all of them when @force_update is set) to
 * be_cmd_modify_eqd() in one call.
 */
void be_eqd_update(struct be_adapter *adapter, bool force_update)
{
	struct be_set_eqd set_eqd[MAX_EVT_QS];
	struct be_set_eqd *entry;
	struct be_aic_obj *aic;
	struct be_eq_obj *eqo;
	int new_eqd, pending = 0;
	int i;

	for_all_evt_queues(adapter, eqo, i) {
		aic = &adapter->aic_obj[eqo->idx];
		new_eqd = be_get_new_eqd(eqo);

		if (force_update || new_eqd != aic->prev_eqd) {
			entry = &set_eqd[pending];
			entry->eq_id = eqo->q.id;
			entry->delay_multiplier = (new_eqd * 65) / 100;
			aic->prev_eqd = new_eqd;
			pending++;
		}
	}

	/* Nothing to send if no EQ needs a new delay */
	if (pending != 0)
		be_cmd_modify_eqd(adapter, set_eqd, pending);
}

1951
static void be_rx_stats_update(struct be_rx_obj *rxo,
1952
			       struct be_rx_compl_info *rxcp)
1953
{
1954
	struct be_rx_stats *stats = rx_stats(rxo);
1955

1956
	u64_stats_update_begin(&stats->sync);
1957
	stats->rx_compl++;
1958
	stats->rx_bytes += rxcp->pkt_size;
1959
	stats->rx_pkts++;
1960
	if (rxcp->pkt_type == BE_MULTICAST_PACKET)
1961
		stats->rx_mcast_pkts++;
1962
	if (rxcp->err)
1963
		stats->rx_compl_err++;
1964
	u64_stats_update_end(&stats->sync);
1965 1966
}

1967
static inline bool csum_passed(struct be_rx_compl_info *rxcp)
1968
{
1969
	/* L4 checksum is not reliable for non TCP/UDP packets.
1970 1971
	 * Also ignore ipcksm for ipv6 pkts
	 */
1972
	return (rxcp->tcpf || rxcp->udpf) && rxcp->l4_csum &&
1973
		(rxcp->ip_csum || rxcp->ipv6) && !rxcp->err;
1974 1975
}

1976
static struct be_rx_page_info *get_rx_page_info(struct be_rx_obj *rxo)
S
Sathya Perla 已提交
1977
{
S
Sathya Perla 已提交
1978
	struct be_adapter *adapter = rxo->adapter;
S
Sathya Perla 已提交
1979
	struct be_rx_page_info *rx_page_info;
1980
	struct be_queue_info *rxq = &rxo->q;
1981
	u16 frag_idx = rxq->tail;
S
Sathya Perla 已提交
1982

1983
	rx_page_info = &rxo->page_info_tbl[frag_idx];
S
Sathya Perla 已提交
1984 1985
	BUG_ON(!rx_page_info->page);

1986
	if (rx_page_info->last_frag) {
I
Ivan Vecera 已提交
1987 1988 1989
		dma_unmap_page(&adapter->pdev->dev,
			       dma_unmap_addr(rx_page_info, bus),
			       adapter->big_page_size, DMA_FROM_DEVICE);
1990 1991 1992 1993 1994
		rx_page_info->last_frag = false;
	} else {
		dma_sync_single_for_cpu(&adapter->pdev->dev,
					dma_unmap_addr(rx_page_info, bus),
					rx_frag_size, DMA_FROM_DEVICE);
A
Ajit Khaparde 已提交
1995
	}
S
Sathya Perla 已提交
1996

1997
	queue_tail_inc(rxq);
S
Sathya Perla 已提交
1998 1999 2000 2001 2002
	atomic_dec(&rxq->used);
	return rx_page_info;
}

/* Throwaway the data in the Rx completion */
S
Sathya Perla 已提交
2003 2004
static void be_rx_compl_discard(struct be_rx_obj *rxo,
				struct be_rx_compl_info *rxcp)
S
Sathya Perla 已提交
2005 2006
{
	struct be_rx_page_info *page_info;
2007
	u16 i, num_rcvd = rxcp->num_rcvd;
S
Sathya Perla 已提交
2008

2009
	for (i = 0; i < num_rcvd; i++) {
2010
		page_info = get_rx_page_info(rxo);
2011 2012
		put_page(page_info->page);
		memset(page_info, 0, sizeof(*page_info));
S
Sathya Perla 已提交
2013 2014 2015 2016 2017 2018 2019
	}
}

/*
 * skb_fill_rx_data forms a complete skb for an ether frame
 * indicated by rxcp.
 */
S
Sathya Perla 已提交
2020 2021
static void skb_fill_rx_data(struct be_rx_obj *rxo, struct sk_buff *skb,
			     struct be_rx_compl_info *rxcp)
S
Sathya Perla 已提交
2022 2023
{
	struct be_rx_page_info *page_info;
2024 2025
	u16 i, j;
	u16 hdr_len, curr_frag_len, remaining;
S
Sathya Perla 已提交
2026 2027
	u8 *start;

2028
	page_info = get_rx_page_info(rxo);
S
Sathya Perla 已提交
2029 2030 2031 2032
	start = page_address(page_info->page) + page_info->page_offset;
	prefetch(start);

	/* Copy data in the first descriptor of this completion */
2033
	curr_frag_len = min(rxcp->pkt_size, rx_frag_size);
S
Sathya Perla 已提交
2034 2035 2036

	skb->len = curr_frag_len;
	if (curr_frag_len <= BE_HDR_LEN) { /* tiny packet */
2037
		memcpy(skb->data, start, curr_frag_len);
S
Sathya Perla 已提交
2038 2039 2040 2041 2042
		/* Complete packet has now been moved to data */
		put_page(page_info->page);
		skb->data_len = 0;
		skb->tail += curr_frag_len;
	} else {
2043 2044
		hdr_len = ETH_HLEN;
		memcpy(skb->data, start, hdr_len);
S
Sathya Perla 已提交
2045
		skb_shinfo(skb)->nr_frags = 1;
2046
		skb_frag_set_page(skb, 0, page_info->page);
S
Sathya Perla 已提交
2047 2048
		skb_shinfo(skb)->frags[0].page_offset =
					page_info->page_offset + hdr_len;
2049 2050
		skb_frag_size_set(&skb_shinfo(skb)->frags[0],
				  curr_frag_len - hdr_len);
S
Sathya Perla 已提交
2051
		skb->data_len = curr_frag_len - hdr_len;
E
Eric Dumazet 已提交
2052
		skb->truesize += rx_frag_size;
S
Sathya Perla 已提交
2053 2054
		skb->tail += hdr_len;
	}
A
Ajit Khaparde 已提交
2055
	page_info->page = NULL;
S
Sathya Perla 已提交
2056

2057 2058 2059
	if (rxcp->pkt_size <= rx_frag_size) {
		BUG_ON(rxcp->num_rcvd != 1);
		return;
S
Sathya Perla 已提交
2060 2061 2062
	}

	/* More frags present for this completion */
2063 2064
	remaining = rxcp->pkt_size - curr_frag_len;
	for (i = 1, j = 0; i < rxcp->num_rcvd; i++) {
2065
		page_info = get_rx_page_info(rxo);
2066
		curr_frag_len = min(remaining, rx_frag_size);
S
Sathya Perla 已提交
2067

2068 2069 2070 2071
		/* Coalesce all frags from the same physical page in one slot */
		if (page_info->page_offset == 0) {
			/* Fresh page */
			j++;
2072
			skb_frag_set_page(skb, j, page_info->page);
2073 2074
			skb_shinfo(skb)->frags[j].page_offset =
							page_info->page_offset;
E
Eric Dumazet 已提交
2075
			skb_frag_size_set(&skb_shinfo(skb)->frags[j], 0);
2076 2077 2078 2079 2080
			skb_shinfo(skb)->nr_frags++;
		} else {
			put_page(page_info->page);
		}

E
Eric Dumazet 已提交
2081
		skb_frag_size_add(&skb_shinfo(skb)->frags[j], curr_frag_len);
S
Sathya Perla 已提交
2082 2083
		skb->len += curr_frag_len;
		skb->data_len += curr_frag_len;
E
Eric Dumazet 已提交
2084
		skb->truesize += rx_frag_size;
2085
		remaining -= curr_frag_len;
A
Ajit Khaparde 已提交
2086
		page_info->page = NULL;
S
Sathya Perla 已提交
2087
	}
2088
	BUG_ON(j > MAX_SKB_FRAGS);
S
Sathya Perla 已提交
2089 2090
}

2091
/* Process the RX completion indicated by rxcp when GRO is disabled */
2092
static void be_rx_compl_process(struct be_rx_obj *rxo, struct napi_struct *napi,
S
Sathya Perla 已提交
2093
				struct be_rx_compl_info *rxcp)
S
Sathya Perla 已提交
2094
{
S
Sathya Perla 已提交
2095
	struct be_adapter *adapter = rxo->adapter;
2096
	struct net_device *netdev = adapter->netdev;
S
Sathya Perla 已提交
2097
	struct sk_buff *skb;
2098

2099
	skb = netdev_alloc_skb_ip_align(netdev, BE_RX_SKB_ALLOC_SIZE);
2100
	if (unlikely(!skb)) {
2101
		rx_stats(rxo)->rx_drops_no_skbs++;
S
Sathya Perla 已提交
2102
		be_rx_compl_discard(rxo, rxcp);
S
Sathya Perla 已提交
2103 2104 2105
		return;
	}

S
Sathya Perla 已提交
2106
	skb_fill_rx_data(rxo, skb, rxcp);
S
Sathya Perla 已提交
2107

2108
	if (likely((netdev->features & NETIF_F_RXCSUM) && csum_passed(rxcp)))
2109
		skb->ip_summed = CHECKSUM_UNNECESSARY;
S
Somnath Kotur 已提交
2110 2111
	else
		skb_checksum_none_assert(skb);
S
Sathya Perla 已提交
2112

2113
	skb->protocol = eth_type_trans(skb, netdev);
2114
	skb_record_rx_queue(skb, rxo - &adapter->rx_obj[0]);
S
Sathya Perla 已提交
2115
	if (netdev->features & NETIF_F_RXHASH)
T
Tom Herbert 已提交
2116
		skb_set_hash(skb, rxcp->rss_hash, PKT_HASH_TYPE_L3);
2117

2118
	skb->csum_level = rxcp->tunneled;
2119
	skb_mark_napi_id(skb, napi);
S
Sathya Perla 已提交
2120

2121
	if (rxcp->vlanf)
2122
		__vlan_hwaccel_put_tag(skb, htons(ETH_P_8021Q), rxcp->vlan_tag);
A
Ajit Khaparde 已提交
2123 2124

	netif_receive_skb(skb);
S
Sathya Perla 已提交
2125 2126
}

2127
/* Process the RX completion indicated by rxcp when GRO is enabled */
J
Jingoo Han 已提交
2128 2129 2130
static void be_rx_compl_process_gro(struct be_rx_obj *rxo,
				    struct napi_struct *napi,
				    struct be_rx_compl_info *rxcp)
S
Sathya Perla 已提交
2131
{
S
Sathya Perla 已提交
2132
	struct be_adapter *adapter = rxo->adapter;
S
Sathya Perla 已提交
2133
	struct be_rx_page_info *page_info;
2134
	struct sk_buff *skb = NULL;
2135 2136
	u16 remaining, curr_frag_len;
	u16 i, j;
2137

S
Sathya Perla 已提交
2138
	skb = napi_get_frags(napi);
2139
	if (!skb) {
S
Sathya Perla 已提交
2140
		be_rx_compl_discard(rxo, rxcp);
2141 2142 2143
		return;
	}

2144 2145
	remaining = rxcp->pkt_size;
	for (i = 0, j = -1; i < rxcp->num_rcvd; i++) {
2146
		page_info = get_rx_page_info(rxo);
S
Sathya Perla 已提交
2147 2148 2149

		curr_frag_len = min(remaining, rx_frag_size);

2150 2151 2152 2153
		/* Coalesce all frags from the same physical page in one slot */
		if (i == 0 || page_info->page_offset == 0) {
			/* First frag or Fresh page */
			j++;
2154
			skb_frag_set_page(skb, j, page_info->page);
2155 2156
			skb_shinfo(skb)->frags[j].page_offset =
							page_info->page_offset;
E
Eric Dumazet 已提交
2157
			skb_frag_size_set(&skb_shinfo(skb)->frags[j], 0);
2158 2159 2160
		} else {
			put_page(page_info->page);
		}
E
Eric Dumazet 已提交
2161
		skb_frag_size_add(&skb_shinfo(skb)->frags[j], curr_frag_len);
E
Eric Dumazet 已提交
2162
		skb->truesize += rx_frag_size;
2163
		remaining -= curr_frag_len;
S
Sathya Perla 已提交
2164 2165
		memset(page_info, 0, sizeof(*page_info));
	}
2166
	BUG_ON(j > MAX_SKB_FRAGS);
S
Sathya Perla 已提交
2167

2168
	skb_shinfo(skb)->nr_frags = j + 1;
2169 2170
	skb->len = rxcp->pkt_size;
	skb->data_len = rxcp->pkt_size;
2171
	skb->ip_summed = CHECKSUM_UNNECESSARY;
2172
	skb_record_rx_queue(skb, rxo - &adapter->rx_obj[0]);
A
Ajit Khaparde 已提交
2173
	if (adapter->netdev->features & NETIF_F_RXHASH)
T
Tom Herbert 已提交
2174
		skb_set_hash(skb, rxcp->rss_hash, PKT_HASH_TYPE_L3);
2175

2176
	skb->csum_level = rxcp->tunneled;
2177
	skb_mark_napi_id(skb, napi);
2178

2179
	if (rxcp->vlanf)
2180
		__vlan_hwaccel_put_tag(skb, htons(ETH_P_8021Q), rxcp->vlan_tag);
A
Ajit Khaparde 已提交
2181

S
Sathya Perla 已提交
2182
	napi_gro_frags(napi);
2183 2184
}

S
Sathya Perla 已提交
2185 2186
static void be_parse_rx_compl_v1(struct be_eth_rx_compl *compl,
				 struct be_rx_compl_info *rxcp)
2187
{
2188 2189 2190 2191 2192 2193 2194 2195 2196 2197 2198
	rxcp->pkt_size = GET_RX_COMPL_V1_BITS(pktsize, compl);
	rxcp->vlanf = GET_RX_COMPL_V1_BITS(vtp, compl);
	rxcp->err = GET_RX_COMPL_V1_BITS(err, compl);
	rxcp->tcpf = GET_RX_COMPL_V1_BITS(tcpf, compl);
	rxcp->udpf = GET_RX_COMPL_V1_BITS(udpf, compl);
	rxcp->ip_csum = GET_RX_COMPL_V1_BITS(ipcksm, compl);
	rxcp->l4_csum = GET_RX_COMPL_V1_BITS(l4_cksm, compl);
	rxcp->ipv6 = GET_RX_COMPL_V1_BITS(ip_version, compl);
	rxcp->num_rcvd = GET_RX_COMPL_V1_BITS(numfrags, compl);
	rxcp->pkt_type = GET_RX_COMPL_V1_BITS(cast_enc, compl);
	rxcp->rss_hash = GET_RX_COMPL_V1_BITS(rsshash, compl);
2199
	if (rxcp->vlanf) {
2200 2201
		rxcp->qnq = GET_RX_COMPL_V1_BITS(qnq, compl);
		rxcp->vlan_tag = GET_RX_COMPL_V1_BITS(vlan_tag, compl);
2202
	}
2203
	rxcp->port = GET_RX_COMPL_V1_BITS(port, compl);
2204
	rxcp->tunneled =
2205
		GET_RX_COMPL_V1_BITS(tunneled, compl);
2206 2207
}

S
Sathya Perla 已提交
2208 2209
static void be_parse_rx_compl_v0(struct be_eth_rx_compl *compl,
				 struct be_rx_compl_info *rxcp)
2210
{
2211 2212 2213 2214 2215 2216 2217 2218 2219 2220 2221
	rxcp->pkt_size = GET_RX_COMPL_V0_BITS(pktsize, compl);
	rxcp->vlanf = GET_RX_COMPL_V0_BITS(vtp, compl);
	rxcp->err = GET_RX_COMPL_V0_BITS(err, compl);
	rxcp->tcpf = GET_RX_COMPL_V0_BITS(tcpf, compl);
	rxcp->udpf = GET_RX_COMPL_V0_BITS(udpf, compl);
	rxcp->ip_csum = GET_RX_COMPL_V0_BITS(ipcksm, compl);
	rxcp->l4_csum = GET_RX_COMPL_V0_BITS(l4_cksm, compl);
	rxcp->ipv6 = GET_RX_COMPL_V0_BITS(ip_version, compl);
	rxcp->num_rcvd = GET_RX_COMPL_V0_BITS(numfrags, compl);
	rxcp->pkt_type = GET_RX_COMPL_V0_BITS(cast_enc, compl);
	rxcp->rss_hash = GET_RX_COMPL_V0_BITS(rsshash, compl);
2222
	if (rxcp->vlanf) {
2223 2224
		rxcp->qnq = GET_RX_COMPL_V0_BITS(qnq, compl);
		rxcp->vlan_tag = GET_RX_COMPL_V0_BITS(vlan_tag, compl);
2225
	}
2226 2227
	rxcp->port = GET_RX_COMPL_V0_BITS(port, compl);
	rxcp->ip_frag = GET_RX_COMPL_V0_BITS(ip_frag, compl);
2228 2229 2230 2231 2232 2233 2234
}

static struct be_rx_compl_info *be_rx_compl_get(struct be_rx_obj *rxo)
{
	struct be_eth_rx_compl *compl = queue_tail_node(&rxo->cq);
	struct be_rx_compl_info *rxcp = &rxo->rxcp;
	struct be_adapter *adapter = rxo->adapter;
S
Sathya Perla 已提交
2235

2236 2237 2238 2239
	/* For checking the valid bit it is Ok to use either definition as the
	 * valid bit is at the same position in both v0 and v1 Rx compl */
	if (compl->dw[offsetof(struct amap_eth_rx_compl_v1, valid) / 32] == 0)
		return NULL;
S
Sathya Perla 已提交
2240

2241 2242
	rmb();
	be_dws_le_to_cpu(compl, sizeof(*compl));
S
Sathya Perla 已提交
2243

2244
	if (adapter->be3_native)
S
Sathya Perla 已提交
2245
		be_parse_rx_compl_v1(compl, rxcp);
2246
	else
S
Sathya Perla 已提交
2247
		be_parse_rx_compl_v0(compl, rxcp);
S
Sathya Perla 已提交
2248

2249 2250 2251
	if (rxcp->ip_frag)
		rxcp->l4_csum = 0;

2252
	if (rxcp->vlanf) {
2253 2254 2255 2256 2257
		/* In QNQ modes, if qnq bit is not set, then the packet was
		 * tagged only with the transparent outer vlan-tag and must
		 * not be treated as a vlan packet by host
		 */
		if (be_is_qnq_mode(adapter) && !rxcp->qnq)
2258
			rxcp->vlanf = 0;
S
Sathya Perla 已提交
2259

2260
		if (!lancer_chip(adapter))
2261
			rxcp->vlan_tag = swab16(rxcp->vlan_tag);
S
Sathya Perla 已提交
2262

2263
		if (adapter->pvid == (rxcp->vlan_tag & VLAN_VID_MASK) &&
2264
		    !test_bit(rxcp->vlan_tag, adapter->vids))
2265 2266
			rxcp->vlanf = 0;
	}
2267 2268 2269

	/* As the compl has been parsed, reset it; we wont touch it again */
	compl->dw[offsetof(struct amap_eth_rx_compl_v1, valid) / 32] = 0;
S
Sathya Perla 已提交
2270

2271
	queue_tail_inc(&rxo->cq);
S
Sathya Perla 已提交
2272 2273 2274
	return rxcp;
}

2275
/* Allocate enough pages to hold @size bytes. __GFP_COMP is added to
 * @gfp when the allocation order is greater than zero.
 * Returns the result of alloc_pages().
 */
static inline struct page *be_alloc_pages(u32 size, gfp_t gfp)
{
	u32 order = get_order(size);
	gfp_t flags = (order > 0) ? (gfp | __GFP_COMP) : gfp;

	return alloc_pages(flags, order);
}

/*
 * Allocate a page, split it to fragments of size rx_frag_size and post as
 * receive buffers to BE
 */
2288
static void be_post_rx_frags(struct be_rx_obj *rxo, gfp_t gfp, u32 frags_needed)
S
Sathya Perla 已提交
2289
{
2290
	struct be_adapter *adapter = rxo->adapter;
2291
	struct be_rx_page_info *page_info = NULL, *prev_page_info = NULL;
2292
	struct be_queue_info *rxq = &rxo->q;
S
Sathya Perla 已提交
2293
	struct page *pagep = NULL;
2294
	struct device *dev = &adapter->pdev->dev;
S
Sathya Perla 已提交
2295 2296
	struct be_eth_rx_d *rxd;
	u64 page_dmaaddr = 0, frag_dmaaddr;
2297
	u32 posted, page_offset = 0, notify = 0;
S
Sathya Perla 已提交
2298

2299
	page_info = &rxo->page_info_tbl[rxq->head];
2300
	for (posted = 0; posted < frags_needed && !page_info->page; posted++) {
S
Sathya Perla 已提交
2301
		if (!pagep) {
2302
			pagep = be_alloc_pages(adapter->big_page_size, gfp);
S
Sathya Perla 已提交
2303
			if (unlikely(!pagep)) {
2304
				rx_stats(rxo)->rx_post_fail++;
S
Sathya Perla 已提交
2305 2306
				break;
			}
2307 2308
			page_dmaaddr = dma_map_page(dev, pagep, 0,
						    adapter->big_page_size,
I
Ivan Vecera 已提交
2309
						    DMA_FROM_DEVICE);
2310 2311 2312
			if (dma_mapping_error(dev, page_dmaaddr)) {
				put_page(pagep);
				pagep = NULL;
2313
				adapter->drv_stats.dma_map_errors++;
2314 2315
				break;
			}
2316
			page_offset = 0;
S
Sathya Perla 已提交
2317 2318
		} else {
			get_page(pagep);
2319
			page_offset += rx_frag_size;
S
Sathya Perla 已提交
2320
		}
2321
		page_info->page_offset = page_offset;
S
Sathya Perla 已提交
2322 2323 2324
		page_info->page = pagep;

		rxd = queue_head_node(rxq);
2325
		frag_dmaaddr = page_dmaaddr + page_info->page_offset;
S
Sathya Perla 已提交
2326 2327 2328 2329 2330 2331 2332
		rxd->fragpa_lo = cpu_to_le32(frag_dmaaddr & 0xFFFFFFFF);
		rxd->fragpa_hi = cpu_to_le32(upper_32_bits(frag_dmaaddr));

		/* Any space left in the current big page for another frag? */
		if ((page_offset + rx_frag_size + rx_frag_size) >
					adapter->big_page_size) {
			pagep = NULL;
2333 2334 2335 2336
			page_info->last_frag = true;
			dma_unmap_addr_set(page_info, bus, page_dmaaddr);
		} else {
			dma_unmap_addr_set(page_info, bus, frag_dmaaddr);
S
Sathya Perla 已提交
2337
		}
2338 2339 2340

		prev_page_info = page_info;
		queue_head_inc(rxq);
S
Sathya Perla 已提交
2341
		page_info = &rxo->page_info_tbl[rxq->head];
S
Sathya Perla 已提交
2342
	}
2343 2344 2345 2346 2347 2348 2349 2350

	/* Mark the last frag of a page when we break out of the above loop
	 * with no more slots available in the RXQ
	 */
	if (pagep) {
		prev_page_info->last_frag = true;
		dma_unmap_addr_set(prev_page_info, bus, page_dmaaddr);
	}
S
Sathya Perla 已提交
2351 2352 2353

	if (posted) {
		atomic_add(posted, &rxq->used);
2354 2355
		if (rxo->rx_post_starved)
			rxo->rx_post_starved = false;
2356
		do {
2357
			notify = min(MAX_NUM_POST_ERX_DB, posted);
2358 2359 2360
			be_rxq_notify(adapter, rxq->id, notify);
			posted -= notify;
		} while (posted);
2361 2362
	} else if (atomic_read(&rxq->used) == 0) {
		/* Let be_worker replenish when memory is available */
2363
		rxo->rx_post_starved = true;
S
Sathya Perla 已提交
2364 2365 2366
	}
}

2367
static struct be_tx_compl_info *be_tx_compl_get(struct be_tx_obj *txo)
S
Sathya Perla 已提交
2368
{
2369 2370 2371
	struct be_queue_info *tx_cq = &txo->cq;
	struct be_tx_compl_info *txcp = &txo->txcp;
	struct be_eth_tx_compl *compl = queue_tail_node(tx_cq);
S
Sathya Perla 已提交
2372

2373
	if (compl->dw[offsetof(struct amap_eth_tx_compl, valid) / 32] == 0)
S
Sathya Perla 已提交
2374 2375
		return NULL;

2376
	/* Ensure load ordering of valid bit dword and other dwords below */
2377
	rmb();
2378
	be_dws_le_to_cpu(compl, sizeof(*compl));
S
Sathya Perla 已提交
2379

2380 2381
	txcp->status = GET_TX_COMPL_BITS(status, compl);
	txcp->end_index = GET_TX_COMPL_BITS(wrb_index, compl);
S
Sathya Perla 已提交
2382

2383
	compl->dw[offsetof(struct amap_eth_tx_compl, valid) / 32] = 0;
S
Sathya Perla 已提交
2384 2385 2386 2387
	queue_tail_inc(tx_cq);
	return txcp;
}

2388
/* Reap the Tx wrbs from the tail of the TXQ of @txo up to and including
 * @last_index: unmap every fragment and free the skbs of the requests
 * found on the way.
 * Returns the number of wrbs consumed (header wrbs included).
 */
static u16 be_tx_compl_process(struct be_adapter *adapter,
			       struct be_tx_obj *txo, u16 last_index)
{
	struct sk_buff **skb_tbl = txo->sent_skb_list;
	struct be_queue_info *txq = &txo->q;
	struct sk_buff *cur_skb = NULL;
	struct be_eth_wrb *wrb;
	bool hdr_pending = false;
	u16 reaped = 0;
	u16 idx;

	for (;;) {
		/* An skb recorded at the tail starts a new request */
		if (skb_tbl[txq->tail]) {
			/* Free skb from prev req */
			if (cur_skb)
				dev_consume_skb_any(cur_skb);
			cur_skb = skb_tbl[txq->tail];
			skb_tbl[txq->tail] = NULL;
			queue_tail_inc(txq);  /* skip hdr wrb */
			reaped++;
			hdr_pending = true;
		}

		wrb = queue_tail_node(txq);
		idx = txq->tail;
		/* Only the first wrb after the hdr wrb may be flagged as
		 * mapping the skb header, and only if the skb has one
		 */
		unmap_tx_frag(&adapter->pdev->dev, wrb,
			      (hdr_pending && skb_headlen(cur_skb)));
		hdr_pending = false;
		queue_tail_inc(txq);
		reaped++;

		if (idx == last_index)
			break;
	}
	dev_consume_skb_any(cur_skb);

	return reaped;
}

S
Sathya Perla 已提交
2422 2423
/* Return the number of events in the event queue */
static inline int events_get(struct be_eq_obj *eqo)
2424
{
S
Sathya Perla 已提交
2425 2426
	struct be_eq_entry *eqe;
	int num = 0;
2427

S
Sathya Perla 已提交
2428 2429 2430 2431
	do {
		eqe = queue_tail_node(&eqo->q);
		if (eqe->evt == 0)
			break;
2432

S
Sathya Perla 已提交
2433 2434 2435 2436 2437 2438 2439
		rmb();
		eqe->evt = 0;
		num++;
		queue_tail_inc(&eqo->q);
	} while (true);

	return num;
2440 2441
}

S
Sathya Perla 已提交
2442 2443
/* Leaves the EQ is disarmed state */
static void be_eq_clean(struct be_eq_obj *eqo)
2444
{
S
Sathya Perla 已提交
2445
	int num = events_get(eqo);
2446

2447
	be_eq_notify(eqo->adapter, eqo->q.id, false, true, num, 0);
2448 2449
}

S
Sathya Perla 已提交
2450
static void be_rx_cq_clean(struct be_rx_obj *rxo)
S
Sathya Perla 已提交
2451 2452
{
	struct be_rx_page_info *page_info;
2453 2454
	struct be_queue_info *rxq = &rxo->q;
	struct be_queue_info *rx_cq = &rxo->cq;
2455
	struct be_rx_compl_info *rxcp;
2456 2457
	struct be_adapter *adapter = rxo->adapter;
	int flush_wait = 0;
S
Sathya Perla 已提交
2458

2459 2460 2461 2462 2463 2464 2465 2466
	/* Consume pending rx completions.
	 * Wait for the flush completion (identified by zero num_rcvd)
	 * to arrive. Notify CQ even when there are no more CQ entries
	 * for HW to flush partially coalesced CQ entries.
	 * In Lancer, there is no need to wait for flush compl.
	 */
	for (;;) {
		rxcp = be_rx_compl_get(rxo);
K
Kalesh AP 已提交
2467
		if (!rxcp) {
2468 2469 2470
			if (lancer_chip(adapter))
				break;

2471 2472 2473
			if (flush_wait++ > 50 ||
			    be_check_error(adapter,
					   BE_ERROR_HW)) {
2474 2475 2476 2477 2478 2479 2480 2481
				dev_warn(&adapter->pdev->dev,
					 "did not receive flush compl\n");
				break;
			}
			be_cq_notify(adapter, rx_cq->id, true, 0);
			mdelay(1);
		} else {
			be_rx_compl_discard(rxo, rxcp);
2482
			be_cq_notify(adapter, rx_cq->id, false, 1);
2483 2484 2485
			if (rxcp->num_rcvd == 0)
				break;
		}
S
Sathya Perla 已提交
2486 2487
	}

2488 2489 2490 2491
	/* After cleanup, leave the CQ in unarmed state */
	be_cq_notify(adapter, rx_cq->id, false, 0);

	/* Then free posted rx buffers that were not used */
2492 2493
	while (atomic_read(&rxq->used) > 0) {
		page_info = get_rx_page_info(rxo);
S
Sathya Perla 已提交
2494 2495 2496 2497
		put_page(page_info->page);
		memset(page_info, 0, sizeof(*page_info));
	}
	BUG_ON(atomic_read(&rxq->used));
2498 2499
	rxq->tail = 0;
	rxq->head = 0;
S
Sathya Perla 已提交
2500 2501
}

S
Sathya Perla 已提交
2502
static void be_tx_compl_clean(struct be_adapter *adapter)
S
Sathya Perla 已提交
2503
{
2504 2505
	u16 end_idx, notified_idx, cmpl = 0, timeo = 0, num_wrbs = 0;
	struct device *dev = &adapter->pdev->dev;
2506
	struct be_tx_compl_info *txcp;
S
Sathya Perla 已提交
2507
	struct be_queue_info *txq;
2508
	struct be_tx_obj *txo;
S
Sathya Perla 已提交
2509
	int i, pending_txqs;
2510

2511
	/* Stop polling for compls when HW has been silent for 10ms */
2512
	do {
S
Sathya Perla 已提交
2513 2514 2515
		pending_txqs = adapter->num_tx_qs;

		for_all_tx_queues(adapter, txo, i) {
2516 2517
			cmpl = 0;
			num_wrbs = 0;
S
Sathya Perla 已提交
2518
			txq = &txo->q;
2519 2520 2521 2522
			while ((txcp = be_tx_compl_get(txo))) {
				num_wrbs +=
					be_tx_compl_process(adapter, txo,
							    txcp->end_index);
S
Sathya Perla 已提交
2523 2524 2525 2526 2527
				cmpl++;
			}
			if (cmpl) {
				be_cq_notify(adapter, txo->cq.id, false, cmpl);
				atomic_sub(num_wrbs, &txq->used);
2528
				timeo = 0;
S
Sathya Perla 已提交
2529
			}
2530
			if (!be_is_tx_compl_pending(txo))
S
Sathya Perla 已提交
2531
				pending_txqs--;
2532 2533
		}

2534 2535
		if (pending_txqs == 0 || ++timeo > 10 ||
		    be_check_error(adapter, BE_ERROR_HW))
2536 2537 2538 2539 2540
			break;

		mdelay(1);
	} while (true);

2541
	/* Free enqueued TX that was never notified to HW */
S
Sathya Perla 已提交
2542 2543 2544
	for_all_tx_queues(adapter, txo, i) {
		txq = &txo->q;

2545 2546 2547 2548
		if (atomic_read(&txq->used)) {
			dev_info(dev, "txq%d: cleaning %d pending tx-wrbs\n",
				 i, atomic_read(&txq->used));
			notified_idx = txq->tail;
S
Sathya Perla 已提交
2549
			end_idx = txq->tail;
2550 2551 2552 2553 2554
			index_adv(&end_idx, atomic_read(&txq->used) - 1,
				  txq->len);
			/* Use the tx-compl process logic to handle requests
			 * that were not sent to the HW.
			 */
S
Sathya Perla 已提交
2555 2556
			num_wrbs = be_tx_compl_process(adapter, txo, end_idx);
			atomic_sub(num_wrbs, &txq->used);
2557 2558 2559 2560 2561 2562 2563
			BUG_ON(atomic_read(&txq->used));
			txo->pend_wrb_cnt = 0;
			/* Since hw was never notified of these requests,
			 * reset TXQ indices
			 */
			txq->head = notified_idx;
			txq->tail = notified_idx;
S
Sathya Perla 已提交
2564
		}
2565
	}
S
Sathya Perla 已提交
2566 2567
}

S
Sathya Perla 已提交
2568 2569 2570 2571 2572 2573
/* Tear down all event queues of @adapter. An EQ that was created is
 * cleaned, destroyed and has its napi context removed; the affinity mask
 * and the queue memory are freed for every EQ.
 */
static void be_evt_queues_destroy(struct be_adapter *adapter)
{
	struct be_queue_info *eq;
	struct be_eq_obj *eqo;
	int i;

	for_all_evt_queues(adapter, eqo, i) {
		eq = &eqo->q;

		if (eq->created) {
			be_eq_clean(eqo);
			be_cmd_q_destroy(adapter, eq, QTYPE_EQ);
			napi_hash_del(&eqo->napi);
			netif_napi_del(&eqo->napi);
		}

		free_cpumask_var(eqo->affinity_mask);
		be_queue_free(adapter, eq);
	}
}

static int be_evt_queues_create(struct be_adapter *adapter)
{
	struct be_queue_info *eq;
	struct be_eq_obj *eqo;
2589
	struct be_aic_obj *aic;
S
Sathya Perla 已提交
2590 2591
	int i, rc;

2592 2593
	adapter->num_evt_qs = min_t(u16, num_irqs(adapter),
				    adapter->cfg_num_qs);
S
Sathya Perla 已提交
2594 2595

	for_all_evt_queues(adapter, eqo, i) {
2596
		int numa_node = dev_to_node(&adapter->pdev->dev);
2597 2598
		if (!zalloc_cpumask_var(&eqo->affinity_mask, GFP_KERNEL))
			return -ENOMEM;
2599 2600
		cpumask_set_cpu(cpumask_local_spread(i, numa_node),
				eqo->affinity_mask);
2601 2602
		netif_napi_add(adapter->netdev, &eqo->napi, be_poll,
			       BE_NAPI_WEIGHT);
2603
		napi_hash_add(&eqo->napi);
2604
		aic = &adapter->aic_obj[i];
S
Sathya Perla 已提交
2605 2606
		eqo->adapter = adapter;
		eqo->idx = i;
2607 2608
		aic->max_eqd = BE_MAX_EQD;
		aic->enable = true;
S
Sathya Perla 已提交
2609 2610 2611

		eq = &eqo->q;
		rc = be_queue_alloc(adapter, eq, EVNT_Q_LEN,
2612
				    sizeof(struct be_eq_entry));
S
Sathya Perla 已提交
2613 2614 2615
		if (rc)
			return rc;

S
Sathya Perla 已提交
2616
		rc = be_cmd_eq_create(adapter, eqo);
S
Sathya Perla 已提交
2617 2618 2619
		if (rc)
			return rc;
	}
2620
	return 0;
S
Sathya Perla 已提交
2621 2622
}

2623 2624 2625 2626
static void be_mcc_queues_destroy(struct be_adapter *adapter)
{
	struct be_queue_info *q;

2627
	q = &adapter->mcc_obj.q;
2628
	if (q->created)
2629
		be_cmd_q_destroy(adapter, q, QTYPE_MCCQ);
2630 2631
	be_queue_free(adapter, q);

2632
	q = &adapter->mcc_obj.cq;
2633
	if (q->created)
2634
		be_cmd_q_destroy(adapter, q, QTYPE_CQ);
2635 2636 2637 2638 2639 2640 2641 2642
	be_queue_free(adapter, q);
}

/* Must be called only after TX qs are created as MCC shares TX EQ */
static int be_mcc_queues_create(struct be_adapter *adapter)
{
	struct be_queue_info *q, *cq;

2643
	cq = &adapter->mcc_obj.cq;
2644
	if (be_queue_alloc(adapter, cq, MCC_CQ_LEN,
2645
			   sizeof(struct be_mcc_compl)))
2646 2647
		goto err;

S
Sathya Perla 已提交
2648 2649
	/* Use the default EQ for MCC completions */
	if (be_cmd_cq_create(adapter, cq, &mcc_eqo(adapter)->q, true, 0))
2650 2651
		goto mcc_cq_free;

2652
	q = &adapter->mcc_obj.q;
2653 2654 2655
	if (be_queue_alloc(adapter, q, MCC_Q_LEN, sizeof(struct be_mcc_wrb)))
		goto mcc_cq_destroy;

2656
	if (be_cmd_mccq_create(adapter, q, cq))
2657 2658 2659 2660 2661 2662 2663
		goto mcc_q_free;

	return 0;

mcc_q_free:
	be_queue_free(adapter, q);
mcc_cq_destroy:
2664
	be_cmd_q_destroy(adapter, cq, QTYPE_CQ);
2665 2666 2667 2668 2669 2670
mcc_cq_free:
	be_queue_free(adapter, cq);
err:
	return -1;
}

S
Sathya Perla 已提交
2671 2672 2673
static void be_tx_queues_destroy(struct be_adapter *adapter)
{
	struct be_queue_info *q;
2674 2675
	struct be_tx_obj *txo;
	u8 i;
S
Sathya Perla 已提交
2676

2677 2678 2679 2680 2681
	for_all_tx_queues(adapter, txo, i) {
		q = &txo->q;
		if (q->created)
			be_cmd_q_destroy(adapter, q, QTYPE_TXQ);
		be_queue_free(adapter, q);
S
Sathya Perla 已提交
2682

2683 2684 2685 2686 2687
		q = &txo->cq;
		if (q->created)
			be_cmd_q_destroy(adapter, q, QTYPE_CQ);
		be_queue_free(adapter, q);
	}
S
Sathya Perla 已提交
2688 2689
}

2690
static int be_tx_qs_create(struct be_adapter *adapter)
S
Sathya Perla 已提交
2691
{
S
Sathya Perla 已提交
2692
	struct be_queue_info *cq;
2693
	struct be_tx_obj *txo;
S
Sathya Perla 已提交
2694
	struct be_eq_obj *eqo;
2695
	int status, i;
S
Sathya Perla 已提交
2696

2697
	adapter->num_tx_qs = min(adapter->num_evt_qs, be_max_txqs(adapter));
2698

S
Sathya Perla 已提交
2699 2700 2701 2702 2703 2704
	for_all_tx_queues(adapter, txo, i) {
		cq = &txo->cq;
		status = be_queue_alloc(adapter, cq, TX_CQ_LEN,
					sizeof(struct be_eth_tx_compl));
		if (status)
			return status;
2705

2706 2707 2708
		u64_stats_init(&txo->stats.sync);
		u64_stats_init(&txo->stats.sync_compl);

S
Sathya Perla 已提交
2709 2710 2711
		/* If num_evt_qs is less than num_tx_qs, then more than
		 * one txq share an eq
		 */
S
Sathya Perla 已提交
2712 2713
		eqo = &adapter->eq_obj[i % adapter->num_evt_qs];
		status = be_cmd_cq_create(adapter, cq, &eqo->q, false, 3);
S
Sathya Perla 已提交
2714 2715
		if (status)
			return status;
S
Sathya Perla 已提交
2716

S
Sathya Perla 已提交
2717 2718 2719 2720
		status = be_queue_alloc(adapter, &txo->q, TX_Q_LEN,
					sizeof(struct be_eth_wrb));
		if (status)
			return status;
S
Sathya Perla 已提交
2721

V
Vasundhara Volam 已提交
2722
		status = be_cmd_txq_create(adapter, txo);
S
Sathya Perla 已提交
2723 2724
		if (status)
			return status;
S
Sathya Perla 已提交
2725 2726 2727

		netif_set_xps_queue(adapter->netdev, eqo->affinity_mask,
				    eqo->idx);
2728
	}
S
Sathya Perla 已提交
2729

S
Sathya Perla 已提交
2730 2731
	dev_info(&adapter->pdev->dev, "created %d TX queue(s)\n",
		 adapter->num_tx_qs);
S
Sathya Perla 已提交
2732
	return 0;
S
Sathya Perla 已提交
2733 2734
}

S
Sathya Perla 已提交
2735
static void be_rx_cqs_destroy(struct be_adapter *adapter)
S
Sathya Perla 已提交
2736 2737
{
	struct be_queue_info *q;
2738 2739 2740 2741 2742 2743 2744 2745
	struct be_rx_obj *rxo;
	int i;

	for_all_rx_queues(adapter, rxo, i) {
		q = &rxo->cq;
		if (q->created)
			be_cmd_q_destroy(adapter, q, QTYPE_CQ);
		be_queue_free(adapter, q);
2746 2747 2748
	}
}

S
Sathya Perla 已提交
2749
static int be_rx_cqs_create(struct be_adapter *adapter)
S
Sathya Perla 已提交
2750
{
S
Sathya Perla 已提交
2751
	struct be_queue_info *eq, *cq;
2752 2753
	struct be_rx_obj *rxo;
	int rc, i;
S
Sathya Perla 已提交
2754

2755
	/* We can create as many RSS rings as there are EQs. */
2756
	adapter->num_rss_qs = adapter->num_evt_qs;
2757

2758 2759 2760 2761 2762 2763 2764 2765
	/* We'll use RSS only if atleast 2 RSS rings are supported. */
	if (adapter->num_rss_qs <= 1)
		adapter->num_rss_qs = 0;

	adapter->num_rx_qs = adapter->num_rss_qs + adapter->need_def_rxq;

	/* When the interface is not capable of RSS rings (and there is no
	 * need to create a default RXQ) we'll still need one RXQ
S
Sathya Perla 已提交
2766
	 */
2767 2768
	if (adapter->num_rx_qs == 0)
		adapter->num_rx_qs = 1;
2769

S
Sathya Perla 已提交
2770
	adapter->big_page_size = (1 << get_order(rx_frag_size)) * PAGE_SIZE;
2771 2772 2773 2774
	for_all_rx_queues(adapter, rxo, i) {
		rxo->adapter = adapter;
		cq = &rxo->cq;
		rc = be_queue_alloc(adapter, cq, RX_CQ_LEN,
2775
				    sizeof(struct be_eth_rx_compl));
2776
		if (rc)
S
Sathya Perla 已提交
2777
			return rc;
2778

2779
		u64_stats_init(&rxo->stats.sync);
S
Sathya Perla 已提交
2780 2781
		eq = &adapter->eq_obj[i % adapter->num_evt_qs].q;
		rc = be_cmd_cq_create(adapter, cq, eq, false, 3);
2782
		if (rc)
S
Sathya Perla 已提交
2783
			return rc;
2784
	}
S
Sathya Perla 已提交
2785

S
Sathya Perla 已提交
2786
	dev_info(&adapter->pdev->dev,
2787
		 "created %d RX queue(s)\n", adapter->num_rx_qs);
S
Sathya Perla 已提交
2788
	return 0;
2789 2790
}

S
Sathya Perla 已提交
2791 2792
static irqreturn_t be_intx(int irq, void *dev)
{
2793 2794 2795
	struct be_eq_obj *eqo = dev;
	struct be_adapter *adapter = eqo->adapter;
	int num_evts = 0;
S
Sathya Perla 已提交
2796

2797 2798 2799 2800 2801 2802 2803
	/* IRQ is not expected when NAPI is scheduled as the EQ
	 * will not be armed.
	 * But, this can happen on Lancer INTx where it takes
	 * a while to de-assert INTx or in BE2 where occasionaly
	 * an interrupt may be raised even when EQ is unarmed.
	 * If NAPI is already scheduled, then counting & notifying
	 * events will orphan them.
2804
	 */
2805
	if (napi_schedule_prep(&eqo->napi)) {
2806
		num_evts = events_get(eqo);
2807 2808 2809 2810
		__napi_schedule(&eqo->napi);
		if (num_evts)
			eqo->spurious_intr = 0;
	}
2811
	be_eq_notify(adapter, eqo->q.id, false, true, num_evts, 0);
2812

2813 2814 2815
	/* Return IRQ_HANDLED only for the the first spurious intr
	 * after a valid intr to stop the kernel from branding
	 * this irq as a bad one!
2816
	 */
2817 2818 2819 2820
	if (num_evts || eqo->spurious_intr++ == 0)
		return IRQ_HANDLED;
	else
		return IRQ_NONE;
S
Sathya Perla 已提交
2821 2822
}

S
Sathya Perla 已提交
2823
static irqreturn_t be_msix(int irq, void *dev)
S
Sathya Perla 已提交
2824
{
S
Sathya Perla 已提交
2825
	struct be_eq_obj *eqo = dev;
S
Sathya Perla 已提交
2826

2827
	be_eq_notify(eqo->adapter, eqo->q.id, false, true, 0, 0);
2828
	napi_schedule(&eqo->napi);
S
Sathya Perla 已提交
2829 2830 2831
	return IRQ_HANDLED;
}

2832
static inline bool do_gro(struct be_rx_compl_info *rxcp)
S
Sathya Perla 已提交
2833
{
2834
	return (rxcp->tcpf && !rxcp->err && rxcp->l4_csum) ? true : false;
S
Sathya Perla 已提交
2835 2836
}

S
Sathya Perla 已提交
2837
static int be_process_rx(struct be_rx_obj *rxo, struct napi_struct *napi,
2838
			 int budget, int polling)
S
Sathya Perla 已提交
2839
{
2840 2841
	struct be_adapter *adapter = rxo->adapter;
	struct be_queue_info *rx_cq = &rxo->cq;
2842
	struct be_rx_compl_info *rxcp;
S
Sathya Perla 已提交
2843
	u32 work_done;
2844
	u32 frags_consumed = 0;
S
Sathya Perla 已提交
2845 2846

	for (work_done = 0; work_done < budget; work_done++) {
2847
		rxcp = be_rx_compl_get(rxo);
S
Sathya Perla 已提交
2848 2849 2850
		if (!rxcp)
			break;

2851 2852 2853 2854 2855 2856
		/* Is it a flush compl that has no data */
		if (unlikely(rxcp->num_rcvd == 0))
			goto loop_continue;

		/* Discard compl with partial DMA Lancer B0 */
		if (unlikely(!rxcp->pkt_size)) {
S
Sathya Perla 已提交
2857
			be_rx_compl_discard(rxo, rxcp);
2858 2859 2860 2861 2862 2863 2864
			goto loop_continue;
		}

		/* On BE drop pkts that arrive due to imperfect filtering in
		 * promiscuous mode on some skews
		 */
		if (unlikely(rxcp->port != adapter->port_num &&
2865
			     !lancer_chip(adapter))) {
S
Sathya Perla 已提交
2866
			be_rx_compl_discard(rxo, rxcp);
2867
			goto loop_continue;
2868
		}
2869

2870 2871
		/* Don't do gro when we're busy_polling */
		if (do_gro(rxcp) && polling != BUSY_POLLING)
S
Sathya Perla 已提交
2872
			be_rx_compl_process_gro(rxo, napi, rxcp);
2873
		else
2874 2875
			be_rx_compl_process(rxo, napi, rxcp);

2876
loop_continue:
2877
		frags_consumed += rxcp->num_rcvd;
2878
		be_rx_stats_update(rxo, rxcp);
S
Sathya Perla 已提交
2879 2880
	}

S
Sathya Perla 已提交
2881 2882
	if (work_done) {
		be_cq_notify(adapter, rx_cq->id, true, work_done);
2883

2884 2885 2886 2887 2888
		/* When an rx-obj gets into post_starved state, just
		 * let be_worker do the posting.
		 */
		if (atomic_read(&rxo->q.used) < RX_FRAGS_REFILL_WM &&
		    !rxo->rx_post_starved)
2889 2890 2891
			be_post_rx_frags(rxo, GFP_ATOMIC,
					 max_t(u32, MAX_RX_POST,
					       frags_consumed));
S
Sathya Perla 已提交
2892
	}
S
Sathya Perla 已提交
2893

S
Sathya Perla 已提交
2894 2895 2896
	return work_done;
}

2897
/* Bump the TX error counter of @txo that corresponds to the completion
 * @status. Status values other than the three tested here are ignored.
 */
static inline void be_update_tx_err(struct be_tx_obj *txo, u8 status)
{
	if (status == BE_TX_COMP_HDR_PARSE_ERR)
		tx_stats(txo)->tx_hdr_parse_err++;
	else if (status == BE_TX_COMP_NDMA_ERR)
		tx_stats(txo)->tx_dma_err++;
	else if (status == BE_TX_COMP_ACL_ERR)
		tx_stats(txo)->tx_spoof_check_err++;
}

2912
/* Lancer variant of the TX error accounting: bump the counter of @txo that
 * matches the completion @status. Unlisted status values are ignored.
 */
static inline void lancer_update_tx_err(struct be_tx_obj *txo, u8 status)
{
	if (status == LANCER_TX_COMP_LSO_ERR)
		tx_stats(txo)->tx_tso_err++;
	else if (status == LANCER_TX_COMP_HSW_DROP_MAC_ERR ||
		 status == LANCER_TX_COMP_HSW_DROP_VLAN_ERR)
		tx_stats(txo)->tx_spoof_check_err++;
	else if (status == LANCER_TX_COMP_QINQ_ERR)
		tx_stats(txo)->tx_qinq_err++;
	else if (status == LANCER_TX_COMP_PARITY_ERR)
		tx_stats(txo)->tx_internal_parity_err++;
	else if (status == LANCER_TX_COMP_DMA_ERR)
		tx_stats(txo)->tx_dma_err++;
}

S
Sathya Perla 已提交
2934 2935
static void be_process_tx(struct be_adapter *adapter, struct be_tx_obj *txo,
			  int idx)
S
Sathya Perla 已提交
2936
{
S
Sathya Perla 已提交
2937
	int num_wrbs = 0, work_done = 0;
2938
	struct be_tx_compl_info *txcp;
S
Sathya Perla 已提交
2939

2940 2941
	while ((txcp = be_tx_compl_get(txo))) {
		num_wrbs += be_tx_compl_process(adapter, txo, txcp->end_index);
S
Sathya Perla 已提交
2942
		work_done++;
2943

2944
		if (txcp->status) {
2945
			if (lancer_chip(adapter))
2946
				lancer_update_tx_err(txo, txcp->status);
2947
			else
2948
				be_update_tx_err(txo, txcp->status);
2949
		}
S
Sathya Perla 已提交
2950
	}
S
Sathya Perla 已提交
2951

S
Sathya Perla 已提交
2952 2953 2954
	if (work_done) {
		be_cq_notify(adapter, txo->cq.id, true, work_done);
		atomic_sub(num_wrbs, &txo->q.used);
2955

S
Sathya Perla 已提交
2956 2957 2958
		/* As Tx wrbs have been freed up, wake up netdev queue
		 * if it was stopped due to lack of tx wrbs.  */
		if (__netif_subqueue_stopped(adapter->netdev, idx) &&
2959
		    be_can_txq_wake(txo)) {
S
Sathya Perla 已提交
2960
			netif_wake_subqueue(adapter->netdev, idx);
2961
		}
S
Sathya Perla 已提交
2962 2963 2964 2965

		u64_stats_update_begin(&tx_stats(txo)->sync_compl);
		tx_stats(txo)->tx_compl += work_done;
		u64_stats_update_end(&tx_stats(txo)->sync_compl);
S
Sathya Perla 已提交
2966
	}
S
Sathya Perla 已提交
2967
}
S
Sathya Perla 已提交
2968

2969 2970 2971 2972 2973 2974 2975 2976 2977 2978 2979 2980 2981 2982 2983 2984 2985 2986 2987 2988 2989 2990 2991 2992 2993 2994 2995 2996 2997 2998 2999 3000 3001 3002 3003 3004 3005 3006 3007 3008 3009 3010 3011 3012 3013 3014 3015 3016 3017 3018 3019 3020 3021 3022 3023 3024 3025 3026 3027 3028 3029 3030 3031 3032 3033 3034 3035 3036 3037 3038 3039 3040 3041 3042 3043 3044 3045 3046 3047 3048 3049 3050 3051 3052 3053 3054 3055 3056 3057 3058 3059 3060 3061 3062 3063 3064 3065 3066 3067 3068
/* Helpers that arbitrate ownership of an EQ object between the NAPI poll
 * path and the busy-poll path. eqo->state is always read and written under
 * eqo->lock. When CONFIG_NET_RX_BUSY_POLL is not set, the stubs further
 * below make NAPI always win and busy-poll always lose.
 */
#ifdef CONFIG_NET_RX_BUSY_POLL
/* Try to claim the EQ for NAPI processing.
 * Returns true and sets the state to BE_EQ_NAPI if the EQ was free.
 * If any BE_EQ_LOCKED bit is set, records BE_EQ_NAPI_YIELD and returns
 * false. Uses the plain spin_lock(), so the caller must already run with
 * BH disabled.
 */
static inline bool be_lock_napi(struct be_eq_obj *eqo)
{
	bool status = true;

	spin_lock(&eqo->lock); /* BH is already disabled */
	if (eqo->state & BE_EQ_LOCKED) {
		/* NAPI finding the EQ already held by NAPI is unexpected */
		WARN_ON(eqo->state & BE_EQ_NAPI);
		eqo->state |= BE_EQ_NAPI_YIELD;
		status = false;
	} else {
		eqo->state = BE_EQ_NAPI;
	}
	spin_unlock(&eqo->lock);
	return status;
}

/* Release the EQ after NAPI processing: state goes back to BE_EQ_IDLE.
 * Warns if a busy-poll or NAPI-yield bit is set at release time.
 */
static inline void be_unlock_napi(struct be_eq_obj *eqo)
{
	spin_lock(&eqo->lock); /* BH is already disabled */

	WARN_ON(eqo->state & (BE_EQ_POLL | BE_EQ_NAPI_YIELD));
	eqo->state = BE_EQ_IDLE;

	spin_unlock(&eqo->lock);
}

/* Try to claim the EQ for busy-polling.
 * Returns true and sets BE_EQ_POLL if the EQ was free. If any
 * BE_EQ_LOCKED bit is set, records BE_EQ_POLL_YIELD and returns false.
 * Takes the lock with BH disabled (spin_lock_bh).
 */
static inline bool be_lock_busy_poll(struct be_eq_obj *eqo)
{
	bool status = true;

	spin_lock_bh(&eqo->lock);
	if (eqo->state & BE_EQ_LOCKED) {
		eqo->state |= BE_EQ_POLL_YIELD;
		status = false;
	} else {
		eqo->state |= BE_EQ_POLL;
	}
	spin_unlock_bh(&eqo->lock);
	return status;
}

/* Release the EQ after busy-polling: state goes back to BE_EQ_IDLE.
 * Warns if the NAPI bit is set at release time.
 */
static inline void be_unlock_busy_poll(struct be_eq_obj *eqo)
{
	spin_lock_bh(&eqo->lock);

	WARN_ON(eqo->state & (BE_EQ_NAPI));
	eqo->state = BE_EQ_IDLE;

	spin_unlock_bh(&eqo->lock);
}

/* (Re)initialise the lock and put the EQ into the idle state. */
static inline void be_enable_busy_poll(struct be_eq_obj *eqo)
{
	spin_lock_init(&eqo->lock);
	eqo->state = BE_EQ_IDLE;
}

/* Block busy-polling on this EQ by taking the NAPI lock and never
 * releasing it here. Retries every millisecond, with BH disabled, until
 * the lock is obtained.
 */
static inline void be_disable_busy_poll(struct be_eq_obj *eqo)
{
	local_bh_disable();

	/* It's enough to just acquire napi lock on the eqo to stop
	 * be_busy_poll() from processing any queues.
	 */
	while (!be_lock_napi(eqo))
		mdelay(1);

	local_bh_enable();
}

#else /* CONFIG_NET_RX_BUSY_POLL */

/* Without busy-poll support NAPI always owns the EQ. */
static inline bool be_lock_napi(struct be_eq_obj *eqo)
{
	return true;
}

/* Nothing to release without busy-poll support. */
static inline void be_unlock_napi(struct be_eq_obj *eqo)
{
}

/* Without busy-poll support the busy-poll lock can never be taken. */
static inline bool be_lock_busy_poll(struct be_eq_obj *eqo)
{
	return false;
}

/* Nothing to release without busy-poll support. */
static inline void be_unlock_busy_poll(struct be_eq_obj *eqo)
{
}

/* No lock/state to initialise without busy-poll support. */
static inline void be_enable_busy_poll(struct be_eq_obj *eqo)
{
}

/* Nothing to disable without busy-poll support. */
static inline void be_disable_busy_poll(struct be_eq_obj *eqo)
{
}
#endif /* CONFIG_NET_RX_BUSY_POLL */

3069
int be_poll(struct napi_struct *napi, int budget)
S
Sathya Perla 已提交
3070 3071 3072
{
	struct be_eq_obj *eqo = container_of(napi, struct be_eq_obj, napi);
	struct be_adapter *adapter = eqo->adapter;
3073
	int max_work = 0, work, i, num_evts;
3074
	struct be_rx_obj *rxo;
3075
	struct be_tx_obj *txo;
3076
	u32 mult_enc = 0;
S
Sathya Perla 已提交
3077

3078 3079
	num_evts = events_get(eqo);

3080 3081
	for_all_tx_queues_on_eq(adapter, eqo, txo, i)
		be_process_tx(adapter, txo, i);
S
Sathya Perla 已提交
3082

3083 3084 3085 3086 3087 3088 3089 3090 3091 3092 3093 3094
	if (be_lock_napi(eqo)) {
		/* This loop will iterate twice for EQ0 in which
		 * completions of the last RXQ (default one) are also processed
		 * For other EQs the loop iterates only once
		 */
		for_all_rx_queues_on_eq(adapter, eqo, rxo, i) {
			work = be_process_rx(rxo, napi, budget, NAPI_POLLING);
			max_work = max(work, max_work);
		}
		be_unlock_napi(eqo);
	} else {
		max_work = budget;
S
Sathya Perla 已提交
3095
	}
S
Sathya Perla 已提交
3096

S
Sathya Perla 已提交
3097 3098
	if (is_mcc_eqo(eqo))
		be_process_mcc(adapter);
3099

S
Sathya Perla 已提交
3100 3101
	if (max_work < budget) {
		napi_complete(napi);
3102 3103 3104 3105 3106 3107 3108 3109 3110

		/* Skyhawk EQ_DB has a provision to set the rearm to interrupt
		 * delay via a delay multiplier encoding value
		 */
		if (skyhawk_chip(adapter))
			mult_enc = be_get_eq_delay_mult_enc(eqo);

		be_eq_notify(adapter, eqo->q.id, true, false, num_evts,
			     mult_enc);
S
Sathya Perla 已提交
3111 3112
	} else {
		/* As we'll continue in polling mode, count and clear events */
3113
		be_eq_notify(adapter, eqo->q.id, false, false, num_evts, 0);
3114
	}
S
Sathya Perla 已提交
3115
	return max_work;
S
Sathya Perla 已提交
3116 3117
}

3118 3119 3120 3121 3122 3123 3124 3125 3126 3127 3128 3129 3130 3131 3132 3133 3134 3135 3136 3137 3138 3139
#ifdef CONFIG_NET_RX_BUSY_POLL
/* Busy-poll entry point for an EQ object.
 *
 * Returns LL_FLUSH_BUSY if the busy-poll lock on the EQ cannot be taken.
 * Otherwise polls the RX queues on this EQ, with a budget of 4 each,
 * stopping at the first queue that yields work, and returns the amount
 * of work done by the last queue polled.
 */
static int be_busy_poll(struct napi_struct *napi)
{
	struct be_eq_obj *eqo = container_of(napi, struct be_eq_obj, napi);
	struct be_adapter *adapter = eqo->adapter;
	struct be_rx_obj *rxo;
	int rx_done = 0;
	int i;

	if (!be_lock_busy_poll(eqo))
		return LL_FLUSH_BUSY;

	for_all_rx_queues_on_eq(adapter, eqo, rxo, i) {
		rx_done = be_process_rx(rxo, napi, 4, BUSY_POLLING);
		if (rx_done != 0)
			break;
	}

	be_unlock_busy_poll(eqo);
	return rx_done;
}
#endif

3140
void be_detect_error(struct be_adapter *adapter)
3141
{
3142 3143
	u32 ue_lo = 0, ue_hi = 0, ue_lo_mask = 0, ue_hi_mask = 0;
	u32 sliport_status = 0, sliport_err1 = 0, sliport_err2 = 0;
3144
	u32 i;
3145
	struct device *dev = &adapter->pdev->dev;
3146

3147
	if (be_check_error(adapter, BE_ERROR_HW))
3148 3149
		return;

3150 3151 3152
	if (lancer_chip(adapter)) {
		sliport_status = ioread32(adapter->db + SLIPORT_STATUS_OFFSET);
		if (sliport_status & SLIPORT_STATUS_ERR_MASK) {
3153
			be_set_error(adapter, BE_ERROR_UE);
3154
			sliport_err1 = ioread32(adapter->db +
3155
						SLIPORT_ERROR1_OFFSET);
3156
			sliport_err2 = ioread32(adapter->db +
3157
						SLIPORT_ERROR2_OFFSET);
3158 3159 3160 3161 3162 3163 3164 3165 3166 3167 3168 3169 3170
			/* Do not log error messages if its a FW reset */
			if (sliport_err1 == SLIPORT_ERROR_FW_RESET1 &&
			    sliport_err2 == SLIPORT_ERROR_FW_RESET2) {
				dev_info(dev, "Firmware update in progress\n");
			} else {
				dev_err(dev, "Error detected in the card\n");
				dev_err(dev, "ERR: sliport status 0x%x\n",
					sliport_status);
				dev_err(dev, "ERR: sliport error1 0x%x\n",
					sliport_err1);
				dev_err(dev, "ERR: sliport error2 0x%x\n",
					sliport_err2);
			}
3171 3172
		}
	} else {
3173 3174 3175 3176 3177 3178
		ue_lo = ioread32(adapter->pcicfg + PCICFG_UE_STATUS_LOW);
		ue_hi = ioread32(adapter->pcicfg + PCICFG_UE_STATUS_HIGH);
		ue_lo_mask = ioread32(adapter->pcicfg +
				      PCICFG_UE_STATUS_LOW_MASK);
		ue_hi_mask = ioread32(adapter->pcicfg +
				      PCICFG_UE_STATUS_HI_MASK);
3179

3180 3181
		ue_lo = (ue_lo & ~ue_lo_mask);
		ue_hi = (ue_hi & ~ue_hi_mask);
3182

3183 3184 3185 3186
		/* On certain platforms BE hardware can indicate spurious UEs.
		 * Allow HW to stop working completely in case of a real UE.
		 * Hence not setting the hw_error for UE detection.
		 */
3187

3188 3189 3190 3191 3192
		if (ue_lo || ue_hi) {
			dev_err(dev,
				"Unrecoverable Error detected in the adapter");
			dev_err(dev, "Please reboot server to recover");
			if (skyhawk_chip(adapter))
3193 3194
				be_set_error(adapter, BE_ERROR_UE);

3195 3196 3197 3198 3199 3200 3201 3202 3203 3204
			for (i = 0; ue_lo; ue_lo >>= 1, i++) {
				if (ue_lo & 1)
					dev_err(dev, "UE: %s bit set\n",
						ue_status_low_desc[i]);
			}
			for (i = 0; ue_hi; ue_hi >>= 1, i++) {
				if (ue_hi & 1)
					dev_err(dev, "UE: %s bit set\n",
						ue_status_hi_desc[i]);
			}
3205 3206 3207 3208
		}
	}
}

3209 3210
static void be_msix_disable(struct be_adapter *adapter)
{
3211
	if (msix_enabled(adapter)) {
3212
		pci_disable_msix(adapter->pdev);
3213
		adapter->num_msix_vec = 0;
3214
		adapter->num_msix_roce_vec = 0;
3215 3216 3217
	}
}

3218
static int be_msix_enable(struct be_adapter *adapter)
S
Sathya Perla 已提交
3219
{
3220
	int i, num_vec;
S
Sathya Perla 已提交
3221
	struct device *dev = &adapter->pdev->dev;
S
Sathya Perla 已提交
3222

3223 3224 3225 3226 3227 3228 3229 3230 3231
	/* If RoCE is supported, program the max number of NIC vectors that
	 * may be configured via set-channels, along with vectors needed for
	 * RoCe. Else, just program the number we'll use initially.
	 */
	if (be_roce_supported(adapter))
		num_vec = min_t(int, 2 * be_max_eqs(adapter),
				2 * num_online_cpus());
	else
		num_vec = adapter->cfg_num_qs;
3232

3233
	for (i = 0; i < num_vec; i++)
S
Sathya Perla 已提交
3234 3235
		adapter->msix_entries[i].entry = i;

3236 3237 3238 3239
	num_vec = pci_enable_msix_range(adapter->pdev, adapter->msix_entries,
					MIN_MSIX_VECTORS, num_vec);
	if (num_vec < 0)
		goto fail;
3240 3241 3242 3243 3244 3245 3246 3247 3248 3249 3250

	if (be_roce_supported(adapter) && num_vec > MIN_MSIX_VECTORS) {
		adapter->num_msix_roce_vec = num_vec / 2;
		dev_info(dev, "enabled %d MSI-x vector(s) for RoCE\n",
			 adapter->num_msix_roce_vec);
	}

	adapter->num_msix_vec = num_vec - adapter->num_msix_roce_vec;

	dev_info(dev, "enabled %d MSI-x vector(s) for NIC\n",
		 adapter->num_msix_vec);
3251
	return 0;
3252 3253 3254 3255 3256

fail:
	dev_warn(dev, "MSIx enable failed\n");

	/* INTx is not supported in VFs, so fail probe if enable_msix fails */
3257
	if (be_virtfn(adapter))
3258 3259
		return num_vec;
	return 0;
S
Sathya Perla 已提交
3260 3261
}

3262
static inline int be_msix_vec_get(struct be_adapter *adapter,
3263
				  struct be_eq_obj *eqo)
3264
{
S
Sathya Perla 已提交
3265
	return adapter->msix_entries[eqo->msix_idx].vector;
3266
}
S
Sathya Perla 已提交
3267

3268 3269
static int be_msix_register(struct be_adapter *adapter)
{
S
Sathya Perla 已提交
3270 3271 3272
	struct net_device *netdev = adapter->netdev;
	struct be_eq_obj *eqo;
	int status, i, vec;
S
Sathya Perla 已提交
3273

S
Sathya Perla 已提交
3274 3275 3276 3277
	for_all_evt_queues(adapter, eqo, i) {
		sprintf(eqo->desc, "%s-q%d", netdev->name, i);
		vec = be_msix_vec_get(adapter, eqo);
		status = request_irq(vec, be_msix, 0, eqo->desc, eqo);
3278 3279
		if (status)
			goto err_msix;
3280 3281

		irq_set_affinity_hint(vec, eqo->affinity_mask);
3282
	}
3283

S
Sathya Perla 已提交
3284
	return 0;
3285
err_msix:
S
Sathya Perla 已提交
3286 3287 3288
	for (i--, eqo = &adapter->eq_obj[i]; i >= 0; i--, eqo--)
		free_irq(be_msix_vec_get(adapter, eqo), eqo);
	dev_warn(&adapter->pdev->dev, "MSIX Request IRQ failed - err %d\n",
3289
		 status);
3290
	be_msix_disable(adapter);
S
Sathya Perla 已提交
3291 3292 3293 3294 3295 3296 3297 3298
	return status;
}

/* Register the interrupt handler(s) of the adapter.
 *
 * MSI-X is tried first when enabled. If that fails, a VF returns the
 * error, while other functions fall back to a shared INTx handler on the
 * first EQ. Sets adapter->isr_registered on success.
 */
static int be_irq_register(struct be_adapter *adapter)
{
	struct net_device *netdev = adapter->netdev;
	int status;

	if (msix_enabled(adapter)) {
		status = be_msix_register(adapter);
		if (!status) {
			adapter->isr_registered = true;
			return 0;
		}

		/* INTx is not supported for VF */
		if (be_virtfn(adapter))
			return status;
	}

	/* INTx: only the first EQ is used */
	netdev->irq = adapter->pdev->irq;
	status = request_irq(netdev->irq, be_intx, IRQF_SHARED, netdev->name,
			     &adapter->eq_obj[0]);
	if (status) {
		dev_err(&adapter->pdev->dev,
			"INTx request IRQ failed - err %d\n", status);
		return status;
	}

	adapter->isr_registered = true;
	return 0;
}

static void be_irq_unregister(struct be_adapter *adapter)
{
	struct net_device *netdev = adapter->netdev;
S
Sathya Perla 已提交
3325
	struct be_eq_obj *eqo;
3326
	int i, vec;
S
Sathya Perla 已提交
3327 3328 3329 3330 3331

	if (!adapter->isr_registered)
		return;

	/* INTx */
3332
	if (!msix_enabled(adapter)) {
3333
		free_irq(netdev->irq, &adapter->eq_obj[0]);
S
Sathya Perla 已提交
3334 3335 3336 3337
		goto done;
	}

	/* MSIx */
3338 3339 3340 3341 3342
	for_all_evt_queues(adapter, eqo, i) {
		vec = be_msix_vec_get(adapter, eqo);
		irq_set_affinity_hint(vec, NULL);
		free_irq(vec, eqo);
	}
3343

S
Sathya Perla 已提交
3344 3345 3346 3347
done:
	adapter->isr_registered = false;
}

S
Sathya Perla 已提交
3348
static void be_rx_qs_destroy(struct be_adapter *adapter)
3349 3350 3351 3352 3353 3354 3355 3356 3357
{
	struct be_queue_info *q;
	struct be_rx_obj *rxo;
	int i;

	for_all_rx_queues(adapter, rxo, i) {
		q = &rxo->q;
		if (q->created) {
			be_cmd_rxq_destroy(adapter, q);
S
Sathya Perla 已提交
3358
			be_rx_cq_clean(rxo);
3359
		}
S
Sathya Perla 已提交
3360
		be_queue_free(adapter, q);
3361 3362 3363
	}
}

3364 3365 3366
static int be_close(struct net_device *netdev)
{
	struct be_adapter *adapter = netdev_priv(netdev);
S
Sathya Perla 已提交
3367 3368
	struct be_eq_obj *eqo;
	int i;
3369

3370 3371 3372 3373 3374 3375
	/* This protection is needed as be_close() may be called even when the
	 * adapter is in cleared state (after eeh perm failure)
	 */
	if (!(adapter->flags & BE_FLAGS_SETUP_DONE))
		return 0;

3376 3377
	be_roce_dev_close(adapter);

3378 3379
	if (adapter->flags & BE_FLAGS_NAPI_ENABLED) {
		for_all_evt_queues(adapter, eqo, i) {
3380
			napi_disable(&eqo->napi);
3381 3382
			be_disable_busy_poll(eqo);
		}
3383
		adapter->flags &= ~BE_FLAGS_NAPI_ENABLED;
3384
	}
3385 3386 3387 3388 3389 3390

	be_async_mcc_disable(adapter);

	/* Wait for all pending tx completions to arrive so that
	 * all tx skbs are freed.
	 */
S
Sathya Perla 已提交
3391
	netif_tx_disable(netdev);
3392
	be_tx_compl_clean(adapter);
3393 3394

	be_rx_qs_destroy(adapter);
3395
	be_clear_uc_list(adapter);
3396

3397
	for_all_evt_queues(adapter, eqo, i) {
S
Sathya Perla 已提交
3398 3399 3400 3401 3402
		if (msix_enabled(adapter))
			synchronize_irq(be_msix_vec_get(adapter, eqo));
		else
			synchronize_irq(netdev->irq);
		be_eq_clean(eqo);
3403 3404
	}

3405 3406
	be_irq_unregister(adapter);

3407 3408 3409
	return 0;
}

S
Sathya Perla 已提交
3410
static int be_rx_qs_create(struct be_adapter *adapter)
3411
{
3412 3413
	struct rss_info *rss = &adapter->rss_info;
	u8 rss_key[RSS_HASH_KEY_LEN];
3414
	struct be_rx_obj *rxo;
3415
	int rc, i, j;
3416 3417

	for_all_rx_queues(adapter, rxo, i) {
S
Sathya Perla 已提交
3418 3419 3420 3421 3422 3423
		rc = be_queue_alloc(adapter, &rxo->q, RX_Q_LEN,
				    sizeof(struct be_eth_rx_d));
		if (rc)
			return rc;
	}

3424 3425 3426 3427 3428 3429 3430 3431
	if (adapter->need_def_rxq || !adapter->num_rss_qs) {
		rxo = default_rxo(adapter);
		rc = be_cmd_rxq_create(adapter, &rxo->q, rxo->cq.id,
				       rx_frag_size, adapter->if_handle,
				       false, &rxo->rss_id);
		if (rc)
			return rc;
	}
S
Sathya Perla 已提交
3432 3433

	for_all_rss_queues(adapter, rxo, i) {
3434
		rc = be_cmd_rxq_create(adapter, &rxo->q, rxo->cq.id,
S
Sathya Perla 已提交
3435 3436
				       rx_frag_size, adapter->if_handle,
				       true, &rxo->rss_id);
3437 3438 3439 3440 3441
		if (rc)
			return rc;
	}

	if (be_multi_rxq(adapter)) {
3442
		for (j = 0; j < RSS_INDIR_TABLE_LEN; j += adapter->num_rss_qs) {
3443
			for_all_rss_queues(adapter, rxo, i) {
3444
				if ((j + i) >= RSS_INDIR_TABLE_LEN)
3445
					break;
3446 3447
				rss->rsstable[j + i] = rxo->rss_id;
				rss->rss_queue[j + i] = i;
3448 3449
			}
		}
3450 3451
		rss->rss_flags = RSS_ENABLE_TCP_IPV4 | RSS_ENABLE_IPV4 |
			RSS_ENABLE_TCP_IPV6 | RSS_ENABLE_IPV6;
3452 3453

		if (!BEx_chip(adapter))
3454 3455
			rss->rss_flags |= RSS_ENABLE_UDP_IPV4 |
				RSS_ENABLE_UDP_IPV6;
3456 3457
	} else {
		/* Disable RSS, if only default RX Q is created */
3458
		rss->rss_flags = RSS_ENABLE_NONE;
3459
	}
3460

3461
	netdev_rss_key_fill(rss_key, RSS_HASH_KEY_LEN);
3462
	rc = be_cmd_rss_config(adapter, rss->rsstable, rss->rss_flags,
3463
			       128, rss_key);
3464
	if (rc) {
3465
		rss->rss_flags = RSS_ENABLE_NONE;
3466
		return rc;
3467 3468
	}

3469
	memcpy(rss->rss_hkey, rss_key, RSS_HASH_KEY_LEN);
3470

3471 3472 3473
	/* Post 1 less than RXQ-len to avoid head being equal to tail,
	 * which is a queue empty condition
	 */
S
Sathya Perla 已提交
3474
	for_all_rx_queues(adapter, rxo, i)
3475 3476
		be_post_rx_frags(rxo, GFP_KERNEL, RX_Q_LEN - 1);

3477 3478 3479
	return 0;
}

S
Sathya Perla 已提交
3480 3481 3482
static int be_open(struct net_device *netdev)
{
	struct be_adapter *adapter = netdev_priv(netdev);
S
Sathya Perla 已提交
3483
	struct be_eq_obj *eqo;
3484
	struct be_rx_obj *rxo;
S
Sathya Perla 已提交
3485
	struct be_tx_obj *txo;
3486
	u8 link_status;
3487
	int status, i;
3488

S
Sathya Perla 已提交
3489
	status = be_rx_qs_create(adapter);
3490 3491 3492
	if (status)
		goto err;

3493 3494 3495
	status = be_irq_register(adapter);
	if (status)
		goto err;
3496

S
Sathya Perla 已提交
3497
	for_all_rx_queues(adapter, rxo, i)
3498
		be_cq_notify(adapter, rxo->cq.id, true, 0);
3499

S
Sathya Perla 已提交
3500 3501 3502
	for_all_tx_queues(adapter, txo, i)
		be_cq_notify(adapter, txo->cq.id, true, 0);

3503 3504
	be_async_mcc_enable(adapter);

S
Sathya Perla 已提交
3505 3506
	for_all_evt_queues(adapter, eqo, i) {
		napi_enable(&eqo->napi);
3507
		be_enable_busy_poll(eqo);
3508
		be_eq_notify(adapter, eqo->q.id, true, true, 0, 0);
S
Sathya Perla 已提交
3509
	}
3510
	adapter->flags |= BE_FLAGS_NAPI_ENABLED;
S
Sathya Perla 已提交
3511

3512
	status = be_cmd_link_status_query(adapter, NULL, &link_status, 0);
3513 3514 3515
	if (!status)
		be_link_status_update(adapter, link_status);

S
Sathya Perla 已提交
3516
	netif_tx_start_all_queues(netdev);
3517
	be_roce_dev_open(adapter);
3518

3519
#ifdef CONFIG_BE2NET_VXLAN
3520 3521
	if (skyhawk_chip(adapter))
		vxlan_get_rx_port(netdev);
3522 3523
#endif

3524 3525 3526 3527
	return 0;
err:
	be_close(adapter->netdev);
	return -EIO;
3528 3529
}

3530 3531
/* Enable or disable magic-packet Wake-on-LAN.
 *
 * When enabling, the PM control register is written and the interface's
 * own MAC address is passed to be_cmd_enable_magic_wol(). When disabling,
 * an all-zero MAC is passed instead. PCI wake from D3hot/D3cold is then
 * switched to match @enable.
 *
 * Returns 0 on success, -ENOMEM if the DMA command buffer cannot be
 * allocated, or the status of the failing config write / firmware
 * command.
 */
static int be_setup_wol(struct be_adapter *adapter, bool enable)
{
	struct device *dev = &adapter->pdev->dev;
	struct be_dma_mem cmd;
	u8 mac[ETH_ALEN];
	int status;

	/* All-zero MAC is what gets programmed when WoL is disabled */
	eth_zero_addr(mac);

	cmd.size = sizeof(struct be_cmd_req_acpi_wol_magic_config);
	cmd.va = dma_zalloc_coherent(dev, cmd.size, &cmd.dma, GFP_KERNEL);
	if (!cmd.va)
		return -ENOMEM;

	if (enable) {
		status = pci_write_config_dword(adapter->pdev,
						PCICFG_PM_CONTROL_OFFSET,
						PCICFG_PM_CONTROL_MASK);
		if (status) {
			dev_err(dev, "Could not enable Wake-on-lan\n");
			goto err;
		}

		/* A magic packet is matched against the interface's MAC,
		 * so the real address must be programmed when enabling.
		 */
		ether_addr_copy(mac, adapter->netdev->dev_addr);
	}

	status = be_cmd_enable_magic_wol(adapter, mac, &cmd);
	pci_enable_wake(adapter->pdev, PCI_D3hot, enable);
	pci_enable_wake(adapter->pdev, PCI_D3cold, enable);
err:
	dma_free_coherent(dev, cmd.size, cmd.va, cmd.dma);
	return status;
}

3564 3565 3566 3567 3568 3569 3570 3571 3572 3573 3574 3575 3576
/* Build a seed MAC in @mac: the first three bytes are copied from the
 * netdev's current address and the last three come from the low 24 bits
 * of a jhash of that address.
 */
static void be_vf_eth_addr_generate(struct be_adapter *adapter, u8 *mac)
{
	const u8 *pf_mac = adapter->netdev->dev_addr;
	u32 hash = jhash(pf_mac, ETH_ALEN, 0);

	/* Use the OUI from the current MAC address */
	memcpy(mac, pf_mac, 3);

	mac[3] = (u8)(hash >> 16);
	mac[4] = (u8)(hash >> 8);
	mac[5] = (u8)hash;
}

3577 3578 3579 3580 3581 3582
/*
 * Generate a seed MAC address from the PF MAC Address using jhash.
 * MAC Address for VFs are assigned incrementally starting from the seed.
 * These addresses are programmed in the ASIC by the PF and the VF driver
 * queries for the MAC address during its probe.
 */
3583
static int be_vf_eth_addr_config(struct be_adapter *adapter)
3584
{
3585
	u32 vf;
3586
	int status = 0;
3587
	u8 mac[ETH_ALEN];
3588
	struct be_vf_cfg *vf_cfg;
3589 3590 3591

	be_vf_eth_addr_generate(adapter, mac);

3592
	for_all_vfs(adapter, vf_cfg, vf) {
3593
		if (BEx_chip(adapter))
3594
			status = be_cmd_pmac_add(adapter, mac,
3595 3596
						 vf_cfg->if_handle,
						 &vf_cfg->pmac_id, vf + 1);
3597 3598 3599
		else
			status = be_cmd_set_mac(adapter, mac, vf_cfg->if_handle,
						vf + 1);
3600

3601 3602
		if (status)
			dev_err(&adapter->pdev->dev,
3603 3604
				"Mac address assignment failed for VF %d\n",
				vf);
3605
		else
3606
			memcpy(vf_cfg->mac_addr, mac, ETH_ALEN);
3607 3608 3609 3610 3611 3612

		mac[5] += 1;
	}
	return status;
}

3613 3614 3615 3616 3617 3618 3619
/* Query the active MAC address of every VF and cache it in its vf_cfg.
 * Stops at, and returns, the first error; returns 0 otherwise.
 */
static int be_vfs_mac_query(struct be_adapter *adapter)
{
	struct be_vf_cfg *vf_cfg;
	u8 active_mac[ETH_ALEN];
	int rc, vf;

	for_all_vfs(adapter, vf_cfg, vf) {
		rc = be_cmd_get_active_mac(adapter, vf_cfg->pmac_id,
					   active_mac, vf_cfg->if_handle,
					   false, vf + 1);
		if (rc)
			return rc;

		/* Cache the address only after a successful query */
		memcpy(vf_cfg->mac_addr, active_mac, ETH_ALEN);
	}
	return 0;
}

3630
static void be_vf_clear(struct be_adapter *adapter)
3631
{
3632
	struct be_vf_cfg *vf_cfg;
3633 3634
	u32 vf;

3635
	if (pci_vfs_assigned(adapter->pdev)) {
3636 3637
		dev_warn(&adapter->pdev->dev,
			 "VFs are assigned to VMs: not disabling VFs\n");
3638 3639 3640
		goto done;
	}

3641 3642
	pci_disable_sriov(adapter->pdev);

3643
	for_all_vfs(adapter, vf_cfg, vf) {
3644
		if (BEx_chip(adapter))
3645 3646
			be_cmd_pmac_del(adapter, vf_cfg->if_handle,
					vf_cfg->pmac_id, vf + 1);
3647 3648 3649
		else
			be_cmd_set_mac(adapter, NULL, vf_cfg->if_handle,
				       vf + 1);
3650

3651 3652
		be_cmd_if_destroy(adapter, vf_cfg->if_handle, vf + 1);
	}
3653 3654 3655
done:
	kfree(adapter->vf_cfg);
	adapter->num_vfs = 0;
3656
	adapter->flags &= ~BE_FLAGS_SRIOV_ENABLED;
3657 3658
}

3659 3660 3661 3662 3663 3664 3665 3666
/* Destroy the adapter's queues in this order: MCC queues, RX completion
 * queues, TX queues and finally the event queues.
 */
static void be_clear_queues(struct be_adapter *adapter)
{
	be_mcc_queues_destroy(adapter);
	be_rx_cqs_destroy(adapter);
	be_tx_queues_destroy(adapter);
	be_evt_queues_destroy(adapter);
}

3667
static void be_cancel_worker(struct be_adapter *adapter)
3668
{
3669 3670 3671 3672
	if (adapter->flags & BE_FLAGS_WORKER_SCHEDULED) {
		cancel_delayed_work_sync(&adapter->work);
		adapter->flags &= ~BE_FLAGS_WORKER_SCHEDULED;
	}
3673 3674
}

3675 3676 3677 3678 3679 3680 3681 3682
/* Cancel the error-detection delayed work, waiting for it to finish, and
 * clear BE_FLAGS_ERR_DETECTION_SCHEDULED. Does nothing if the flag is not
 * set.
 */
static void be_cancel_err_detection(struct be_adapter *adapter)
{
	if (!(adapter->flags & BE_FLAGS_ERR_DETECTION_SCHEDULED))
		return;

	cancel_delayed_work_sync(&adapter->be_err_detection_work);
	adapter->flags &= ~BE_FLAGS_ERR_DETECTION_SCHEDULED;
}

3683
static void be_mac_clear(struct be_adapter *adapter)
3684
{
3685
	if (adapter->pmac_id) {
3686 3687
		be_cmd_pmac_del(adapter, adapter->if_handle,
				adapter->pmac_id[0], 0);
3688 3689 3690 3691 3692
		kfree(adapter->pmac_id);
		adapter->pmac_id = NULL;
	}
}

3693
#ifdef CONFIG_BE2NET_VXLAN
3694 3695
static void be_disable_vxlan_offloads(struct be_adapter *adapter)
{
3696 3697
	struct net_device *netdev = adapter->netdev;

3698 3699 3700 3701 3702 3703 3704 3705 3706
	if (adapter->flags & BE_FLAGS_VXLAN_OFFLOADS)
		be_cmd_manage_iface(adapter, adapter->if_handle,
				    OP_CONVERT_TUNNEL_TO_NORMAL);

	if (adapter->vxlan_port)
		be_cmd_set_vxlan_port(adapter, 0);

	adapter->flags &= ~BE_FLAGS_VXLAN_OFFLOADS;
	adapter->vxlan_port = 0;
3707 3708 3709

	netdev->hw_enc_features = 0;
	netdev->hw_features &= ~(NETIF_F_GSO_UDP_TUNNEL);
3710
	netdev->features &= ~(NETIF_F_GSO_UDP_TUNNEL);
3711
}
3712
#endif
3713

3714 3715 3716 3717 3718 3719 3720 3721 3722 3723 3724 3725 3726 3727 3728 3729 3730 3731 3732 3733 3734 3735 3736 3737 3738 3739 3740 3741
/* Compute the number of queues to give each VF when @num_vfs VFs are
 * requested.
 *
 * Returns 1 when no VFs are requested, in multi-channel configuration, or
 * when @num_vfs reaches MAX_RSS_IFACES. Otherwise the RSS queues of the
 * pool are divided among the VFs, after reserving 8 for the PF when the
 * request is more than 8 below the maximum number of VFs.
 */
static u16 be_calculate_vf_qs(struct be_adapter *adapter, u16 num_vfs)
{
	struct be_resources res = adapter->pool_res;
	u16 num_vf_qs;

	/* Queue resources are not distributed in multi-channel
	 * configuration, nor when no VFs are requested.
	 */
	if (!num_vfs || be_is_mc(adapter))
		return 1;

	/* Skyhawk-R chip supports only MAX_RSS_IFACES RSS capable
	 * interfaces per port. Provide RSS on VFs, only if number
	 * of VFs requested is less than MAX_RSS_IFACES limit.
	 */
	if (num_vfs >= MAX_RSS_IFACES)
		return 1;

	/* If number of VFs requested is 8 less than max supported,
	 * assign 8 queue pairs to the PF and divide the remaining
	 * resources evenly among the VFs
	 */
	if (num_vfs < (be_max_vfs(adapter) - 8))
		num_vf_qs = (res.max_rss_qs - 8) / num_vfs;
	else
		num_vf_qs = res.max_rss_qs / num_vfs;

	return num_vf_qs;
}

3742 3743
static int be_clear(struct be_adapter *adapter)
{
3744 3745 3746
	struct pci_dev *pdev = adapter->pdev;
	u16 num_vf_qs;

3747
	be_cancel_worker(adapter);
3748

3749
	if (sriov_enabled(adapter))
3750 3751
		be_vf_clear(adapter);

3752 3753 3754
	/* Re-configure FW to distribute resources evenly across max-supported
	 * number of VFs, only when VFs are not already enabled.
	 */
3755 3756
	if (skyhawk_chip(adapter) && be_physfn(adapter) &&
	    !pci_vfs_assigned(pdev)) {
3757 3758
		num_vf_qs = be_calculate_vf_qs(adapter,
					       pci_sriov_get_totalvfs(pdev));
3759
		be_cmd_set_sriov_config(adapter, adapter->pool_res,
3760 3761 3762
					pci_sriov_get_totalvfs(pdev),
					num_vf_qs);
	}
3763

3764
#ifdef CONFIG_BE2NET_VXLAN
3765
	be_disable_vxlan_offloads(adapter);
3766
#endif
3767
	/* delete the primary mac along with the uc-mac list */
3768
	be_mac_clear(adapter);
3769

3770
	be_cmd_if_destroy(adapter, adapter->if_handle,  0);
3771

3772
	be_clear_queues(adapter);
3773

S
Sathya Perla 已提交
3774
	be_msix_disable(adapter);
3775
	adapter->flags &= ~BE_FLAGS_SETUP_DONE;
3776 3777 3778
	return 0;
}

3779 3780 3781 3782 3783 3784 3785
/* Create an interface for function @vf with capability flags @cap_flags.
 * The flags enabled are the subset of the driver's default set that
 * @cap_flags allows. The handle is returned through @if_handle.
 * Returns the status of be_cmd_if_create().
 */
static int be_if_create(struct be_adapter *adapter, u32 *if_handle,
			u32 cap_flags, u32 vf)
{
	u32 en_flags = cap_flags &
		       (BE_IF_FLAGS_UNTAGGED | BE_IF_FLAGS_BROADCAST |
			BE_IF_FLAGS_MULTICAST | BE_IF_FLAGS_PASS_L3L4_ERRORS |
			BE_IF_FLAGS_RSS | BE_IF_FLAGS_DEFQ_RSS);

	return be_cmd_if_create(adapter, cap_flags, en_flags, if_handle, vf);
}

3793
static int be_vfs_if_create(struct be_adapter *adapter)
3794
{
3795
	struct be_resources res = {0};
3796
	struct be_vf_cfg *vf_cfg;
3797 3798
	u32 cap_flags, vf;
	int status;
3799

3800
	/* If a FW profile exists, then cap_flags are updated */
3801
	cap_flags = BE_IF_FLAGS_UNTAGGED | BE_IF_FLAGS_BROADCAST |
3802
		    BE_IF_FLAGS_MULTICAST | BE_IF_FLAGS_PASS_L3L4_ERRORS;
3803

3804
	for_all_vfs(adapter, vf_cfg, vf) {
3805 3806
		if (!BE3_chip(adapter)) {
			status = be_cmd_get_profile_config(adapter, &res,
3807
							   RESOURCE_LIMITS,
3808
							   vf + 1);
3809
			if (!status) {
3810
				cap_flags = res.if_cap_flags;
3811 3812 3813 3814 3815
				/* Prevent VFs from enabling VLAN promiscuous
				 * mode
				 */
				cap_flags &= ~BE_IF_FLAGS_VLAN_PROMISCUOUS;
			}
3816
		}
3817

3818 3819
		status = be_if_create(adapter, &vf_cfg->if_handle,
				      cap_flags, vf + 1);
3820
		if (status)
3821
			return status;
3822
	}
3823 3824

	return 0;
3825 3826
}

3827
static int be_vf_setup_init(struct be_adapter *adapter)
3828
{
3829
	struct be_vf_cfg *vf_cfg;
3830 3831
	int vf;

3832 3833 3834 3835 3836
	adapter->vf_cfg = kcalloc(adapter->num_vfs, sizeof(*vf_cfg),
				  GFP_KERNEL);
	if (!adapter->vf_cfg)
		return -ENOMEM;

3837 3838 3839
	for_all_vfs(adapter, vf_cfg, vf) {
		vf_cfg->if_handle = -1;
		vf_cfg->pmac_id = -1;
3840
	}
3841
	return 0;
3842 3843
}

3844 3845
static int be_vf_setup(struct be_adapter *adapter)
{
3846
	struct device *dev = &adapter->pdev->dev;
3847
	struct be_vf_cfg *vf_cfg;
3848
	int status, old_vfs, vf;
3849
	bool spoofchk;
3850

3851
	old_vfs = pci_num_vf(adapter->pdev);
3852 3853 3854 3855

	status = be_vf_setup_init(adapter);
	if (status)
		goto err;
3856

3857 3858 3859 3860 3861 3862
	if (old_vfs) {
		for_all_vfs(adapter, vf_cfg, vf) {
			status = be_cmd_get_if_id(adapter, vf_cfg, vf);
			if (status)
				goto err;
		}
3863

3864 3865 3866 3867
		status = be_vfs_mac_query(adapter);
		if (status)
			goto err;
	} else {
3868 3869 3870 3871
		status = be_vfs_if_create(adapter);
		if (status)
			goto err;

3872 3873 3874 3875
		status = be_vf_eth_addr_config(adapter);
		if (status)
			goto err;
	}
3876

3877
	for_all_vfs(adapter, vf_cfg, vf) {
3878
		/* Allow VFs to programs MAC/VLAN filters */
3879 3880 3881
		status = be_cmd_get_fn_privileges(adapter, &vf_cfg->privileges,
						  vf + 1);
		if (!status && !(vf_cfg->privileges & BE_PRIV_FILTMGMT)) {
3882
			status = be_cmd_set_fn_privileges(adapter,
3883
							  vf_cfg->privileges |
3884 3885
							  BE_PRIV_FILTMGMT,
							  vf + 1);
3886 3887
			if (!status) {
				vf_cfg->privileges |= BE_PRIV_FILTMGMT;
3888 3889
				dev_info(dev, "VF%d has FILTMGMT privilege\n",
					 vf);
3890
			}
3891 3892
		}

3893 3894 3895
		/* Allow full available bandwidth */
		if (!old_vfs)
			be_cmd_config_qos(adapter, 0, 0, vf + 1);
3896

3897 3898 3899 3900 3901 3902
		status = be_cmd_get_hsw_config(adapter, NULL, vf + 1,
					       vf_cfg->if_handle, NULL,
					       &spoofchk);
		if (!status)
			vf_cfg->spoofchk = spoofchk;

3903
		if (!old_vfs) {
3904
			be_cmd_enable_vf(adapter, vf + 1);
3905 3906 3907 3908
			be_cmd_set_logical_link_config(adapter,
						       IFLA_VF_LINK_STATE_AUTO,
						       vf+1);
		}
3909
	}
3910 3911 3912 3913 3914 3915 3916 3917 3918

	if (!old_vfs) {
		status = pci_enable_sriov(adapter->pdev, adapter->num_vfs);
		if (status) {
			dev_err(dev, "SRIOV enable failed\n");
			adapter->num_vfs = 0;
			goto err;
		}
	}
3919 3920

	adapter->flags |= BE_FLAGS_SRIOV_ENABLED;
3921 3922
	return 0;
err:
3923 3924
	dev_err(dev, "VF setup failed\n");
	be_vf_clear(adapter);
3925 3926 3927
	return status;
}

3928 3929 3930 3931
/* Convert the BE3 function_mode bits into the SH mc_type enum.
 * QNQ together with VNIC maps to vNIC1, QNQ alone to FLEX10, VNIC alone to
 * vNIC2, UMC_ENABLED to UMC; anything else is MC_NONE.
 */
static u8 be_convert_mc_type(u32 function_mode)
{
	const bool vnic = function_mode & VNIC_MODE;
	const bool qnq = function_mode & QNQ_MODE;

	if (qnq)
		return vnic ? vNIC1 : FLEX10;

	if (vnic)
		return vNIC2;

	if (function_mode & UMC_ENABLED)
		return UMC;

	return MC_NONE;
}

3944 3945 3946 3947
/* On BE2/BE3 FW does not suggest the supported limits */
static void BEx_get_resources(struct be_adapter *adapter,
			      struct be_resources *res)
{
3948
	bool use_sriov = adapter->num_vfs ? 1 : 0;
3949 3950 3951 3952 3953 3954

	if (be_physfn(adapter))
		res->max_uc_mac = BE_UC_PMAC_COUNT;
	else
		res->max_uc_mac = BE_VF_UC_PMAC_COUNT;

3955 3956 3957 3958 3959 3960 3961 3962 3963 3964 3965 3966 3967 3968
	adapter->mc_type = be_convert_mc_type(adapter->function_mode);

	if (be_is_mc(adapter)) {
		/* Assuming that there are 4 channels per port,
		 * when multi-channel is enabled
		 */
		if (be_is_qnq_mode(adapter))
			res->max_vlans = BE_NUM_VLANS_SUPPORTED/8;
		else
			/* In a non-qnq multichannel mode, the pvid
			 * takes up one vlan entry
			 */
			res->max_vlans = (BE_NUM_VLANS_SUPPORTED / 4) - 1;
	} else {
3969
		res->max_vlans = BE_NUM_VLANS_SUPPORTED;
3970 3971
	}

3972 3973
	res->max_mcast_mac = BE_MAX_MC;

3974 3975 3976 3977 3978
	/* 1) For BE3 1Gb ports, FW does not support multiple TXQs
	 * 2) Create multiple TX rings on a BE3-R multi-channel interface
	 *    *only* if it is RSS-capable.
	 */
	if (BE2_chip(adapter) || use_sriov ||  (adapter->port_num > 1) ||
3979 3980 3981
	    be_virtfn(adapter) ||
	    (be_is_mc(adapter) &&
	     !(adapter->function_caps & BE_FUNCTION_CAPS_RSS))) {
3982
		res->max_tx_qs = 1;
3983 3984 3985 3986 3987 3988
	} else if (adapter->function_caps & BE_FUNCTION_CAPS_SUPER_NIC) {
		struct be_resources super_nic_res = {0};

		/* On a SuperNIC profile, the driver needs to use the
		 * GET_PROFILE_CONFIG cmd to query the per-function TXQ limits
		 */
3989 3990
		be_cmd_get_profile_config(adapter, &super_nic_res,
					  RESOURCE_LIMITS, 0);
3991 3992 3993
		/* Some old versions of BE3 FW don't report max_tx_qs value */
		res->max_tx_qs = super_nic_res.max_tx_qs ? : BE3_MAX_TX_QS;
	} else {
3994
		res->max_tx_qs = BE3_MAX_TX_QS;
3995
	}
3996 3997 3998 3999 4000 4001 4002

	if ((adapter->function_caps & BE_FUNCTION_CAPS_RSS) &&
	    !use_sriov && be_physfn(adapter))
		res->max_rss_qs = (adapter->be3_native) ?
					   BE3_MAX_RSS_QS : BE2_MAX_RSS_QS;
	res->max_rx_qs = res->max_rss_qs + 1;

4003
	if (be_physfn(adapter))
4004
		res->max_evt_qs = (be_max_vfs(adapter) > 0) ?
4005 4006 4007
					BE3_SRIOV_MAX_EVT_QS : BE3_MAX_EVT_QS;
	else
		res->max_evt_qs = 1;
4008 4009

	res->if_cap_flags = BE_IF_CAP_FLAGS_WANT;
4010
	res->if_cap_flags &= ~BE_IF_FLAGS_DEFQ_RSS;
4011 4012 4013 4014
	if (!(adapter->function_caps & BE_FUNCTION_CAPS_RSS))
		res->if_cap_flags &= ~BE_IF_FLAGS_RSS;
}

4015 4016 4017
static void be_setup_init(struct be_adapter *adapter)
{
	adapter->vlan_prio_bmap = 0xff;
A
Ajit Khaparde 已提交
4018
	adapter->phy.link_speed = -1;
4019 4020
	adapter->if_handle = -1;
	adapter->be3_native = false;
4021
	adapter->if_flags = 0;
4022 4023 4024 4025
	if (be_physfn(adapter))
		adapter->cmd_privileges = MAX_PRIVILEGES;
	else
		adapter->cmd_privileges = MIN_PRIVILEGES;
4026 4027
}

4028 4029 4030
static int be_get_sriov_config(struct be_adapter *adapter)
{
	struct be_resources res = {0};
4031
	int max_vfs, old_vfs;
4032

4033
	be_cmd_get_profile_config(adapter, &res, RESOURCE_LIMITS, 0);
4034

4035
	/* Some old versions of BE3 FW don't report max_vfs value */
4036 4037 4038 4039 4040
	if (BE3_chip(adapter) && !res.max_vfs) {
		max_vfs = pci_sriov_get_totalvfs(adapter->pdev);
		res.max_vfs = max_vfs > 0 ? min(MAX_VFS, max_vfs) : 0;
	}

4041
	adapter->pool_res = res;
4042

4043 4044 4045 4046
	/* If during previous unload of the driver, the VFs were not disabled,
	 * then we cannot rely on the PF POOL limits for the TotalVFs value.
	 * Instead use the TotalVFs value stored in the pci-dev struct.
	 */
4047 4048
	old_vfs = pci_num_vf(adapter->pdev);
	if (old_vfs) {
4049 4050 4051 4052 4053
		dev_info(&adapter->pdev->dev, "%d VFs are already enabled\n",
			 old_vfs);

		adapter->pool_res.max_vfs =
			pci_sriov_get_totalvfs(adapter->pdev);
4054 4055 4056 4057 4058 4059
		adapter->num_vfs = old_vfs;
	}

	return 0;
}

4060 4061 4062 4063 4064 4065 4066 4067 4068 4069 4070 4071 4072 4073 4074 4075 4076 4077 4078 4079 4080 4081 4082 4083 4084 4085
static void be_alloc_sriov_res(struct be_adapter *adapter)
{
	int old_vfs = pci_num_vf(adapter->pdev);
	u16 num_vf_qs;
	int status;

	be_get_sriov_config(adapter);

	if (!old_vfs)
		pci_sriov_set_totalvfs(adapter->pdev, be_max_vfs(adapter));

	/* When the HW is in SRIOV capable configuration, the PF-pool
	 * resources are given to PF during driver load, if there are no
	 * old VFs. This facility is not available in BE3 FW.
	 * Also, this is done by FW in Lancer chip.
	 */
	if (skyhawk_chip(adapter) && be_max_vfs(adapter) && !old_vfs) {
		num_vf_qs = be_calculate_vf_qs(adapter, 0);
		status = be_cmd_set_sriov_config(adapter, adapter->pool_res, 0,
						 num_vf_qs);
		if (status)
			dev_err(&adapter->pdev->dev,
				"Failed to optimize SRIOV resources\n");
	}
}

4086
static int be_get_resources(struct be_adapter *adapter)
4087
{
4088 4089 4090
	struct device *dev = &adapter->pdev->dev;
	struct be_resources res = {0};
	int status;
4091

4092 4093 4094
	if (BEx_chip(adapter)) {
		BEx_get_resources(adapter, &res);
		adapter->res = res;
4095 4096
	}

4097 4098 4099 4100 4101 4102 4103 4104
	/* For Lancer, SH etc read per-function resource limits from FW.
	 * GET_FUNC_CONFIG returns per function guaranteed limits.
	 * GET_PROFILE_CONFIG returns PCI-E related limits PF-pool limits
	 */
	if (!BEx_chip(adapter)) {
		status = be_cmd_get_func_config(adapter, &res);
		if (status)
			return status;
4105

4106 4107 4108 4109 4110
		/* If a deafault RXQ must be created, we'll use up one RSSQ*/
		if (res.max_rss_qs && res.max_rss_qs == res.max_rx_qs &&
		    !(res.if_cap_flags & BE_IF_FLAGS_DEFQ_RSS))
			res.max_rss_qs -= 1;

4111 4112 4113 4114
		/* If RoCE may be enabled stash away half the EQs for RoCE */
		if (be_roce_supported(adapter))
			res.max_evt_qs /= 2;
		adapter->res = res;
4115
	}
4116

4117 4118 4119 4120 4121 4122
	/* If FW supports RSS default queue, then skip creating non-RSS
	 * queue for non-IP traffic.
	 */
	adapter->need_def_rxq = (be_if_cap_flags(adapter) &
				 BE_IF_FLAGS_DEFQ_RSS) ? 0 : 1;

S
Sathya Perla 已提交
4123 4124 4125 4126 4127 4128 4129 4130
	dev_info(dev, "Max: txqs %d, rxqs %d, rss %d, eqs %d, vfs %d\n",
		 be_max_txqs(adapter), be_max_rxqs(adapter),
		 be_max_rss(adapter), be_max_eqs(adapter),
		 be_max_vfs(adapter));
	dev_info(dev, "Max: uc-macs %d, mc-macs %d, vlans %d\n",
		 be_max_uc(adapter), be_max_mc(adapter),
		 be_max_vlans(adapter));

4131 4132 4133
	/* Sanitize cfg_num_qs based on HW and platform limits */
	adapter->cfg_num_qs = min_t(u16, netif_get_num_default_rss_queues(),
				    be_max_qs(adapter));
4134
	return 0;
4135 4136
}

4137 4138
static int be_get_config(struct be_adapter *adapter)
{
4139
	int status, level;
4140
	u16 profile_id;
4141 4142 4143 4144

	status = be_cmd_get_cntl_attributes(adapter);
	if (status)
		return status;
4145

4146
	status = be_cmd_query_fw_cfg(adapter);
4147
	if (status)
4148
		return status;
4149

4150 4151 4152 4153 4154 4155 4156 4157
	if (BEx_chip(adapter)) {
		level = be_cmd_get_fw_log_level(adapter);
		adapter->msg_enable =
			level <= FW_LOG_LEVEL_DEFAULT ? NETIF_MSG_HW : 0;
	}

	be_cmd_get_acpi_wol_cap(adapter);

4158 4159 4160
	be_cmd_query_port_name(adapter);

	if (be_physfn(adapter)) {
4161 4162 4163 4164
		status = be_cmd_get_active_profile(adapter, &profile_id);
		if (!status)
			dev_info(&adapter->pdev->dev,
				 "Using profile 0x%x\n", profile_id);
4165
	}
4166

4167 4168 4169
	status = be_get_resources(adapter);
	if (status)
		return status;
4170

4171 4172
	adapter->pmac_id = kcalloc(be_max_uc(adapter),
				   sizeof(*adapter->pmac_id), GFP_KERNEL);
4173 4174
	if (!adapter->pmac_id)
		return -ENOMEM;
4175

4176
	return 0;
4177 4178
}

4179 4180 4181 4182 4183 4184 4185 4186 4187 4188 4189 4190 4191 4192 4193 4194 4195
static int be_mac_setup(struct be_adapter *adapter)
{
	u8 mac[ETH_ALEN];
	int status;

	if (is_zero_ether_addr(adapter->netdev->dev_addr)) {
		status = be_cmd_get_perm_mac(adapter, mac);
		if (status)
			return status;

		memcpy(adapter->netdev->dev_addr, mac, ETH_ALEN);
		memcpy(adapter->netdev->perm_addr, mac, ETH_ALEN);
	} else {
		/* Maybe the HW was reset; dev_addr must be re-programmed */
		memcpy(mac, adapter->netdev->dev_addr, ETH_ALEN);
	}

4196 4197 4198 4199
	/* For BE3-R VFs, the PF programs the initial MAC address */
	if (!(BEx_chip(adapter) && be_virtfn(adapter)))
		be_cmd_pmac_add(adapter, mac, adapter->if_handle,
				&adapter->pmac_id[0], 0);
4200 4201 4202
	return 0;
}

4203 4204 4205 4206 4207 4208
/* Queue adapter->work to run after 1000 ms and record in adapter->flags that
 * the worker has been scheduled.
 */
static void be_schedule_worker(struct be_adapter *adapter)
{
	const unsigned long delay = msecs_to_jiffies(1000);

	schedule_delayed_work(&adapter->work, delay);
	adapter->flags |= BE_FLAGS_WORKER_SCHEDULED;
}

4209 4210 4211 4212 4213 4214 4215
/* Queue adapter->be_err_detection_work to run after 1000 ms and record in
 * adapter->flags that error detection has been scheduled.
 */
static void be_schedule_err_detection(struct be_adapter *adapter)
{
	const unsigned long delay = msecs_to_jiffies(1000);

	schedule_delayed_work(&adapter->be_err_detection_work, delay);
	adapter->flags |= BE_FLAGS_ERR_DETECTION_SCHEDULED;
}

4216
static int be_setup_queues(struct be_adapter *adapter)
4217
{
4218
	struct net_device *netdev = adapter->netdev;
S
Sathya Perla 已提交
4219
	int status;
4220

4221
	status = be_evt_queues_create(adapter);
4222 4223
	if (status)
		goto err;
4224

4225
	status = be_tx_qs_create(adapter);
4226 4227
	if (status)
		goto err;
S
Sathya Perla 已提交
4228

4229
	status = be_rx_cqs_create(adapter);
S
Sathya Perla 已提交
4230
	if (status)
4231
		goto err;
S
Sathya Perla 已提交
4232

4233
	status = be_mcc_queues_create(adapter);
S
Sathya Perla 已提交
4234 4235 4236
	if (status)
		goto err;

4237 4238 4239 4240 4241 4242 4243 4244
	status = netif_set_real_num_rx_queues(netdev, adapter->num_rx_qs);
	if (status)
		goto err;

	status = netif_set_real_num_tx_queues(netdev, adapter->num_tx_qs);
	if (status)
		goto err;

4245 4246 4247 4248 4249 4250
	return 0;
err:
	dev_err(&adapter->pdev->dev, "queue_setup failed\n");
	return status;
}

4251 4252 4253 4254 4255 4256 4257 4258 4259 4260 4261 4262 4263 4264 4265 4266 4267 4268 4269 4270 4271 4272 4273 4274 4275 4276 4277 4278 4279 4280 4281 4282 4283 4284 4285 4286
/* Tear down and re-create the adapter's queues.
 * A running netdev is closed first and re-opened at the end; the worker is
 * cancelled and re-scheduled around the rebuild. Returns 0 on success or the
 * status of the first step that fails.
 */
int be_update_queues(struct be_adapter *adapter)
{
	struct net_device *netdev = adapter->netdev;
	int status;

	if (netif_running(netdev))
		be_close(netdev);

	be_cancel_worker(adapter);

	/* If any vectors have been shared with RoCE we cannot re-program
	 * the MSIx table.
	 */
	if (!adapter->num_msix_roce_vec)
		be_msix_disable(adapter);

	be_clear_queues(adapter);

	/* Re-enable MSI-x only if it is not (or no longer) enabled */
	status = msix_enabled(adapter) ? 0 : be_msix_enable(adapter);
	if (!status)
		status = be_setup_queues(adapter);
	if (status)
		return status;

	be_schedule_worker(adapter);

	return netif_running(netdev) ? be_open(netdev) : 0;
}

4287 4288 4289 4290 4291 4292 4293 4294 4295 4296 4297
/* Parse the leading decimal number of a FW version string ("<major>.…").
 * Returns that number, or 0 when the string does not start with one.
 */
static inline int fw_major_num(const char *fw_ver)
{
	int major = 0;

	return sscanf(fw_ver, "%d.", &major) == 1 ? major : 0;
}

4298 4299 4300 4301 4302 4303 4304 4305 4306 4307 4308 4309 4310 4311 4312 4313 4314 4315 4316 4317 4318 4319 4320 4321
/* A function reset (FLR) of the PF is wanted only while no VFs are enabled
 * on the PCI device.
 */
static bool be_reset_required(struct be_adapter *adapter)
{
	return !pci_num_vf(adapter->pdev);
}

/* Wait for the FW to be ready and perform the required initialization */
static int be_func_init(struct be_adapter *adapter)
{
	int status;

	status = be_fw_wait_ready(adapter);
	if (status)
		return status;

	if (be_reset_required(adapter)) {
		status = be_cmd_reset_function(adapter);
		if (status)
			return status;

		/* Wait for interrupts to quiesce after an FLR */
		msleep(100);

		/* We can clear all errors when function reset succeeds */
4322
		be_clear_error(adapter, BE_CLEAR_ALL);
4323 4324 4325 4326 4327 4328 4329 4330 4331 4332 4333 4334 4335
	}

	/* Tell FW we're ready to fire cmds */
	status = be_cmd_fw_init(adapter);
	if (status)
		return status;

	/* Allow interrupts for other ULPs running on NIC function */
	be_intr_set(adapter, true);

	return 0;
}

4336 4337 4338 4339 4340
/* Bring the adapter from "FW ready" to fully configured: function init,
 * resource discovery, MSI-x, interface and queue creation, MAC/VLAN/RX-mode
 * programming, flow control, optional VF setup and worker scheduling.
 *
 * Returns 0 on success. A be_func_init() failure is returned directly; any
 * later mandatory step that fails undoes the setup through be_clear() and
 * returns that step's status. Calls whose result is not checked below are
 * best-effort and do not fail the setup.
 */
static int be_setup(struct be_adapter *adapter)
{
	struct device *dev = &adapter->pdev->dev;
	int status;

	status = be_func_init(adapter);
	if (status)
		return status;

	be_setup_init(adapter);

	if (!lancer_chip(adapter))
		be_cmd_req_native_mode(adapter);

	if (!BE2_chip(adapter) && be_physfn(adapter))
		be_alloc_sriov_res(adapter);

	status = be_get_config(adapter);
	if (status)
		goto err;

	status = be_msix_enable(adapter);
	if (status)
		goto err;

	status = be_if_create(adapter, &adapter->if_handle,
			      be_if_cap_flags(adapter), 0);
	if (status)
		goto err;

	/* Updating real_num_tx/rx_queues() requires rtnl_lock() */
	rtnl_lock();
	status = be_setup_queues(adapter);
	rtnl_unlock();
	if (status)
		goto err;

	be_cmd_get_fn_privileges(adapter, &adapter->cmd_privileges, 0);

	status = be_mac_setup(adapter);
	if (status)
		goto err;

	be_cmd_get_fw_ver(adapter);
	dev_info(dev, "FW version is %s\n", adapter->fw_ver);

	if (BE2_chip(adapter) && fw_major_num(adapter->fw_ver) < 4) {
		/* Each message is newline-terminated so the two lines are
		 * emitted as separate log records.
		 */
		dev_err(dev, "Firmware on card is old(%s), IRQs may not work\n",
			adapter->fw_ver);
		dev_err(dev, "Please upgrade firmware to version >= 4.0\n");
	}

	if (adapter->vlans_added)
		be_vid_config(adapter);

	be_set_rx_mode(adapter->netdev);

	/* If the requested flow-control setting is rejected, read back what
	 * the HW is actually using so the log line below is accurate.
	 */
	status = be_cmd_set_flow_control(adapter, adapter->tx_fc,
					 adapter->rx_fc);
	if (status)
		be_cmd_get_flow_control(adapter, &adapter->tx_fc,
					&adapter->rx_fc);

	dev_info(dev, "HW Flow control - TX:%d RX:%d\n",
		 adapter->tx_fc, adapter->rx_fc);

	if (be_physfn(adapter))
		be_cmd_set_logical_link_config(adapter,
					       IFLA_VF_LINK_STATE_AUTO, 0);

	if (adapter->num_vfs)
		be_vf_setup(adapter);

	status = be_cmd_get_phy_info(adapter);
	if (!status && be_pause_supported(adapter))
		adapter->phy.fc_autoneg = 1;

	be_schedule_worker(adapter);
	adapter->flags |= BE_FLAGS_SETUP_DONE;
	return 0;
err:
	be_clear(adapter);
	return status;
}
S
Sathya Perla 已提交
4420

I
Ivan Vecera 已提交
4421 4422 4423 4424
#ifdef CONFIG_NET_POLL_CONTROLLER
/* Netpoll hook: for every event queue of the adapter, notify the EQ through
 * be_eq_notify() and schedule the queue's NAPI context.
 */
static void be_netpoll(struct net_device *netdev)
{
	struct be_adapter *adapter = netdev_priv(netdev);
	struct be_eq_obj *eq;
	int idx;

	for_all_evt_queues(adapter, eq, idx) {
		be_eq_notify(eq->adapter, eq->q.id, false, true, 0, 0);
		napi_schedule(&eq->napi);
	}
}
#endif

4435
/* Marker that get_fsec_info() searches for in a FW image to locate the flash
 * section info. It is compared as sizeof(flash_cookie) (2 x 16 = 32) raw
 * bytes against fsec->cookie, so the zero padding that follows the 11
 * characters of the first string is part of the pattern.
 */
static char flash_cookie[2][16] = {"*** SE FLAS", "H DIRECTORY *** "};
4436

4437 4438
static bool phy_flashing_required(struct be_adapter *adapter)
{
4439
	return (adapter->phy.phy_type == PHY_TYPE_TN_8022 &&
A
Ajit Khaparde 已提交
4440
		adapter->phy.interface_type == PHY_TYPE_BASET_10GB);
4441 4442
}

4443 4444 4445 4446 4447 4448
/* Report whether the flash section info @fsec lists an entry whose image
 * type equals @type. On BE2 chips @fsec is read through the
 * flash_section_info_g2 layout. All MAX_FLASH_COMP entries are examined.
 */
static bool is_comp_in_ufi(struct be_adapter *adapter,
			   struct flash_section_info *fsec, int type)
{
	struct flash_section_info_g2 *g2 = NULL;
	int entry, found_type;

	if (BE2_chip(adapter))
		g2 = (struct flash_section_info_g2 *)fsec;

	for (entry = 0; entry < MAX_FLASH_COMP; entry++) {
		found_type = g2 ? le32_to_cpu(g2->fsec_entry[entry].type) :
				  le32_to_cpu(fsec->fsec_entry[entry].type);
		if (found_type == type)
			return true;
	}

	return false;
}

J
Jingoo Han 已提交
4465
static struct flash_section_info *get_fsec_info(struct be_adapter *adapter,
4466 4467
						int header_size,
						const struct firmware *fw)
4468 4469 4470 4471 4472 4473 4474 4475 4476 4477 4478 4479 4480 4481
{
	struct flash_section_info *fsec = NULL;
	const u8 *p = fw->data;

	p += header_size;
	while (p < (fw->data + fw->size)) {
		fsec = (struct flash_section_info *)p;
		if (!memcmp(flash_cookie, fsec->cookie, sizeof(flash_cookie)))
			return fsec;
		p += 32;
	}
	return NULL;
}

4482 4483 4484 4485 4486 4487 4488 4489
/* Compare the CRC the adapter reports for a flash region with the one stored
 * in the FW file.
 * be_cmd_get_flash_crc() is asked for the CRC of @img_size - 4 bytes at
 * @img_offset; it is compared with the 4 bytes that end the image inside @p
 * (at @hdr_size + @img_offset + @img_size - 4). *@crc_match receives the
 * result. Returns 0, or the command status on failure (in which case
 * *@crc_match is not written).
 */
static int be_check_flash_crc(struct be_adapter *adapter, const u8 *p,
			      u32 img_offset, u32 img_size, int hdr_size,
			      u16 img_optype, bool *crc_match)
{
	const u32 file_crc_at = hdr_size + img_offset + img_size - 4;
	u8 flashed_crc[4];
	int status;

	status = be_cmd_get_flash_crc(adapter, flashed_crc, img_optype,
				      img_offset, img_size - 4);
	if (status)
		return status;

	/* A match lets the caller skip flashing this region */
	*crc_match = !memcmp(flashed_crc, p + file_crc_at, 4);

	return 0;
}

4506
/* Write @img_size bytes of @img to flash in chunks of at most 32KB.
 * Every chunk but the last is sent with a SAVE operation and the last one
 * with a FLASH operation (the PHY variants are used for OPTYPE_PHY_FW).
 * Chunk i is written at @img_offset plus the number of bytes already sent.
 *
 * Returns 0 on success, and also when a PHY FW write is answered with
 * MCC_STATUS_ILLEGAL_REQUEST (the remaining chunks are then skipped);
 * otherwise the status of the failing write.
 */
static int be_flash(struct be_adapter *adapter, const u8 *img,
		    struct be_dma_mem *flash_cmd, int optype, int img_size,
		    u32 img_offset)
{
	struct be_cmd_write_flashrom *req = flash_cmd->va;
	const bool phy_fw = optype == OPTYPE_PHY_FW;
	u32 flash_op, chunk, left, sent = 0;
	int status;

	for (left = img_size; left; left -= chunk, sent += chunk) {
		chunk = min_t(u32, 32 * 1024, left);

		if (left == chunk)	/* final chunk: commit */
			flash_op = phy_fw ? FLASHROM_OPER_PHY_FLASH :
					    FLASHROM_OPER_FLASH;
		else
			flash_op = phy_fw ? FLASHROM_OPER_PHY_SAVE :
					    FLASHROM_OPER_SAVE;

		memcpy(req->data_buf, img, chunk);
		img += chunk;

		status = be_cmd_write_flashrom(adapter, flash_cmd, optype,
					       flash_op, img_offset + sent,
					       chunk);
		if (phy_fw &&
		    base_status(status) == MCC_STATUS_ILLEGAL_REQUEST)
			break;
		if (status)
			return status;
	}

	return 0;
}

4547
/* For BE2, BE3 and BE3-R */
4548
static int be_flash_BEx(struct be_adapter *adapter,
4549 4550
			const struct firmware *fw,
			struct be_dma_mem *flash_cmd, int num_of_images)
4551
{
4552
	int img_hdrs_size = (num_of_images * sizeof(struct image_hdr));
4553
	struct device *dev = &adapter->pdev->dev;
4554
	struct flash_section_info *fsec = NULL;
4555 4556 4557 4558
	int status, i, filehdr_size, num_comp;
	const struct flash_comp *pflashcomp;
	bool crc_match;
	const u8 *p;
4559 4560 4561 4562 4563 4564 4565 4566 4567 4568 4569 4570 4571 4572 4573 4574 4575 4576 4577 4578 4579 4580

	struct flash_comp gen3_flash_types[] = {
		{ FLASH_iSCSI_PRIMARY_IMAGE_START_g3, OPTYPE_ISCSI_ACTIVE,
			FLASH_IMAGE_MAX_SIZE_g3, IMAGE_FIRMWARE_iSCSI},
		{ FLASH_REDBOOT_START_g3, OPTYPE_REDBOOT,
			FLASH_REDBOOT_IMAGE_MAX_SIZE_g3, IMAGE_BOOT_CODE},
		{ FLASH_iSCSI_BIOS_START_g3, OPTYPE_BIOS,
			FLASH_BIOS_IMAGE_MAX_SIZE_g3, IMAGE_OPTION_ROM_ISCSI},
		{ FLASH_PXE_BIOS_START_g3, OPTYPE_PXE_BIOS,
			FLASH_BIOS_IMAGE_MAX_SIZE_g3, IMAGE_OPTION_ROM_PXE},
		{ FLASH_FCoE_BIOS_START_g3, OPTYPE_FCOE_BIOS,
			FLASH_BIOS_IMAGE_MAX_SIZE_g3, IMAGE_OPTION_ROM_FCoE},
		{ FLASH_iSCSI_BACKUP_IMAGE_START_g3, OPTYPE_ISCSI_BACKUP,
			FLASH_IMAGE_MAX_SIZE_g3, IMAGE_FIRMWARE_BACKUP_iSCSI},
		{ FLASH_FCoE_PRIMARY_IMAGE_START_g3, OPTYPE_FCOE_FW_ACTIVE,
			FLASH_IMAGE_MAX_SIZE_g3, IMAGE_FIRMWARE_FCoE},
		{ FLASH_FCoE_BACKUP_IMAGE_START_g3, OPTYPE_FCOE_FW_BACKUP,
			FLASH_IMAGE_MAX_SIZE_g3, IMAGE_FIRMWARE_BACKUP_FCoE},
		{ FLASH_NCSI_START_g3, OPTYPE_NCSI_FW,
			FLASH_NCSI_IMAGE_MAX_SIZE_g3, IMAGE_NCSI},
		{ FLASH_PHY_FW_START_g3, OPTYPE_PHY_FW,
			FLASH_PHY_FW_IMAGE_MAX_SIZE_g3, IMAGE_FIRMWARE_PHY}
4581
	};
4582 4583 4584 4585 4586 4587 4588 4589 4590 4591 4592 4593 4594 4595 4596 4597 4598 4599

	struct flash_comp gen2_flash_types[] = {
		{ FLASH_iSCSI_PRIMARY_IMAGE_START_g2, OPTYPE_ISCSI_ACTIVE,
			FLASH_IMAGE_MAX_SIZE_g2, IMAGE_FIRMWARE_iSCSI},
		{ FLASH_REDBOOT_START_g2, OPTYPE_REDBOOT,
			FLASH_REDBOOT_IMAGE_MAX_SIZE_g2, IMAGE_BOOT_CODE},
		{ FLASH_iSCSI_BIOS_START_g2, OPTYPE_BIOS,
			FLASH_BIOS_IMAGE_MAX_SIZE_g2, IMAGE_OPTION_ROM_ISCSI},
		{ FLASH_PXE_BIOS_START_g2, OPTYPE_PXE_BIOS,
			FLASH_BIOS_IMAGE_MAX_SIZE_g2, IMAGE_OPTION_ROM_PXE},
		{ FLASH_FCoE_BIOS_START_g2, OPTYPE_FCOE_BIOS,
			FLASH_BIOS_IMAGE_MAX_SIZE_g2, IMAGE_OPTION_ROM_FCoE},
		{ FLASH_iSCSI_BACKUP_IMAGE_START_g2, OPTYPE_ISCSI_BACKUP,
			FLASH_IMAGE_MAX_SIZE_g2, IMAGE_FIRMWARE_BACKUP_iSCSI},
		{ FLASH_FCoE_PRIMARY_IMAGE_START_g2, OPTYPE_FCOE_FW_ACTIVE,
			FLASH_IMAGE_MAX_SIZE_g2, IMAGE_FIRMWARE_FCoE},
		{ FLASH_FCoE_BACKUP_IMAGE_START_g2, OPTYPE_FCOE_FW_BACKUP,
			 FLASH_IMAGE_MAX_SIZE_g2, IMAGE_FIRMWARE_BACKUP_FCoE}
4600 4601
	};

4602
	if (BE3_chip(adapter)) {
4603 4604
		pflashcomp = gen3_flash_types;
		filehdr_size = sizeof(struct flash_file_hdr_g3);
J
Joe Perches 已提交
4605
		num_comp = ARRAY_SIZE(gen3_flash_types);
4606 4607 4608
	} else {
		pflashcomp = gen2_flash_types;
		filehdr_size = sizeof(struct flash_file_hdr_g2);
J
Joe Perches 已提交
4609
		num_comp = ARRAY_SIZE(gen2_flash_types);
4610
		img_hdrs_size = 0;
4611
	}
4612

4613 4614 4615
	/* Get flash section info*/
	fsec = get_fsec_info(adapter, filehdr_size + img_hdrs_size, fw);
	if (!fsec) {
4616
		dev_err(dev, "Invalid Cookie. FW image may be corrupted\n");
4617 4618
		return -1;
	}
4619
	for (i = 0; i < num_comp; i++) {
4620
		if (!is_comp_in_ufi(adapter, fsec, pflashcomp[i].img_type))
4621
			continue;
4622 4623 4624 4625 4626

		if ((pflashcomp[i].optype == OPTYPE_NCSI_FW) &&
		    memcmp(adapter->fw_ver, "3.102.148.0", 11) < 0)
			continue;

4627 4628
		if (pflashcomp[i].optype == OPTYPE_PHY_FW  &&
		    !phy_flashing_required(adapter))
4629
				continue;
4630

4631
		if (pflashcomp[i].optype == OPTYPE_REDBOOT) {
4632 4633 4634 4635 4636 4637 4638 4639 4640 4641 4642 4643 4644 4645
			status = be_check_flash_crc(adapter, fw->data,
						    pflashcomp[i].offset,
						    pflashcomp[i].size,
						    filehdr_size +
						    img_hdrs_size,
						    OPTYPE_REDBOOT, &crc_match);
			if (status) {
				dev_err(dev,
					"Could not get CRC for 0x%x region\n",
					pflashcomp[i].optype);
				continue;
			}

			if (crc_match)
4646 4647
				continue;
		}
4648

4649 4650
		p = fw->data + filehdr_size + pflashcomp[i].offset +
			img_hdrs_size;
4651 4652
		if (p + pflashcomp[i].size > fw->data + fw->size)
			return -1;
4653 4654

		status = be_flash(adapter, p, flash_cmd, pflashcomp[i].optype,
4655
				  pflashcomp[i].size, 0);
4656
		if (status) {
4657
			dev_err(dev, "Flashing section type 0x%x failed\n",
4658 4659
				pflashcomp[i].img_type);
			return status;
4660 4661 4662 4663 4664
		}
	}
	return 0;
}

4665 4666 4667 4668 4669 4670 4671 4672 4673 4674 4675 4676 4677 4678 4679 4680 4681 4682 4683 4684 4685 4686 4687 4688 4689 4690 4691 4692 4693 4694 4695 4696 4697 4698 4699 4700 4701 4702 4703 4704 4705 4706 4707 4708 4709 4710 4711 4712 4713 4714 4715 4716
/* Return the flash op type for a flash section entry.
 * An entry that carries an explicit op type (anything but 0xFFFF) uses it
 * as-is; otherwise the op type is derived from the entry's image type.
 * 0xFFFF is returned when the image type is not one of the known ones.
 */
static u16 be_get_img_optype(struct flash_section_entry fsec_entry)
{
	u16 optype = le16_to_cpu(fsec_entry.optype);

	if (optype != 0xFFFF)
		return optype;

	switch (le32_to_cpu(fsec_entry.type)) {
	case IMAGE_FIRMWARE_iSCSI:
		return OPTYPE_ISCSI_ACTIVE;
	case IMAGE_BOOT_CODE:
		return OPTYPE_REDBOOT;
	case IMAGE_OPTION_ROM_ISCSI:
		return OPTYPE_BIOS;
	case IMAGE_OPTION_ROM_PXE:
		return OPTYPE_PXE_BIOS;
	case IMAGE_OPTION_ROM_FCoE:
		return OPTYPE_FCOE_BIOS;
	case IMAGE_FIRMWARE_BACKUP_iSCSI:
		return OPTYPE_ISCSI_BACKUP;
	case IMAGE_NCSI:
		return OPTYPE_NCSI_FW;
	case IMAGE_FLASHISM_JUMPVECTOR:
		return OPTYPE_FLASHISM_JUMPVECTOR;
	case IMAGE_FIRMWARE_PHY:
		return OPTYPE_SH_PHY_FW;
	case IMAGE_REDBOOT_DIR:
		return OPTYPE_REDBOOT_DIR;
	case IMAGE_REDBOOT_CONFIG:
		return OPTYPE_REDBOOT_CONFIG;
	case IMAGE_UFI_DIR:
		return OPTYPE_UFI_DIR;
	default:
		/* Unknown image type: still 0xFFFF */
		return optype;
	}
}

4717
static int be_flash_skyhawk(struct be_adapter *adapter,
4718 4719
			    const struct firmware *fw,
			    struct be_dma_mem *flash_cmd, int num_of_images)
4720
{
4721
	int img_hdrs_size = num_of_images * sizeof(struct image_hdr);
4722
	bool crc_match, old_fw_img, flash_offset_support = true;
4723
	struct device *dev = &adapter->pdev->dev;
4724
	struct flash_section_info *fsec = NULL;
4725
	u32 img_offset, img_size, img_type;
4726
	u16 img_optype, flash_optype;
4727 4728
	int status, i, filehdr_size;
	const u8 *p;
4729 4730 4731 4732

	filehdr_size = sizeof(struct flash_file_hdr_g3);
	fsec = get_fsec_info(adapter, filehdr_size + img_hdrs_size, fw);
	if (!fsec) {
4733
		dev_err(dev, "Invalid Cookie. FW image may be corrupted\n");
4734
		return -EINVAL;
4735 4736
	}

4737
retry_flash:
4738 4739 4740
	for (i = 0; i < le32_to_cpu(fsec->fsec_hdr.num_images); i++) {
		img_offset = le32_to_cpu(fsec->fsec_entry[i].offset);
		img_size   = le32_to_cpu(fsec->fsec_entry[i].pad_size);
4741 4742 4743
		img_type   = le32_to_cpu(fsec->fsec_entry[i].type);
		img_optype = be_get_img_optype(fsec->fsec_entry[i]);
		old_fw_img = fsec->fsec_entry[i].optype == 0xFFFF;
4744

4745
		if (img_optype == 0xFFFF)
4746
			continue;
4747 4748 4749 4750 4751 4752

		if (flash_offset_support)
			flash_optype = OPTYPE_OFFSET_SPECIFIED;
		else
			flash_optype = img_optype;

4753 4754 4755 4756 4757 4758 4759 4760
		/* Don't bother verifying CRC if an old FW image is being
		 * flashed
		 */
		if (old_fw_img)
			goto flash;

		status = be_check_flash_crc(adapter, fw->data, img_offset,
					    img_size, filehdr_size +
4761
					    img_hdrs_size, flash_optype,
4762
					    &crc_match);
4763 4764
		if (base_status(status) == MCC_STATUS_ILLEGAL_REQUEST ||
		    base_status(status) == MCC_STATUS_ILLEGAL_FIELD) {
4765 4766 4767 4768 4769 4770 4771 4772 4773 4774 4775 4776 4777 4778 4779 4780
			/* The current FW image on the card does not support
			 * OFFSET based flashing. Retry using older mechanism
			 * of OPTYPE based flashing
			 */
			if (flash_optype == OPTYPE_OFFSET_SPECIFIED) {
				flash_offset_support = false;
				goto retry_flash;
			}

			/* The current FW image on the card does not recognize
			 * the new FLASH op_type. The FW download is partially
			 * complete. Reboot the server now to enable FW image
			 * to recognize the new FLASH op_type. To complete the
			 * remaining process, download the same FW again after
			 * the reboot.
			 */
4781 4782 4783 4784 4785 4786 4787
			dev_err(dev, "Flash incomplete. Reset the server\n");
			dev_err(dev, "Download FW image again after reset\n");
			return -EAGAIN;
		} else if (status) {
			dev_err(dev, "Could not get CRC for 0x%x region\n",
				img_optype);
			return -EFAULT;
4788 4789
		}

4790 4791
		if (crc_match)
			continue;
4792

4793 4794
flash:
		p = fw->data + filehdr_size + img_offset + img_hdrs_size;
4795 4796 4797
		if (p + img_size > fw->data + fw->size)
			return -1;

4798 4799 4800 4801 4802 4803 4804 4805 4806 4807 4808 4809 4810
		status = be_flash(adapter, p, flash_cmd, flash_optype, img_size,
				  img_offset);

		/* The current FW image on the card does not support OFFSET
		 * based flashing. Retry using older mechanism of OPTYPE based
		 * flashing
		 */
		if (base_status(status) == MCC_STATUS_ILLEGAL_FIELD &&
		    flash_optype == OPTYPE_OFFSET_SPECIFIED) {
			flash_offset_support = false;
			goto retry_flash;
		}

4811 4812 4813
		/* For old FW images ignore ILLEGAL_FIELD error or errors on
		 * UFI_DIR region
		 */
4814 4815 4816 4817
		if (old_fw_img &&
		    (base_status(status) == MCC_STATUS_ILLEGAL_FIELD ||
		     (img_optype == OPTYPE_UFI_DIR &&
		      base_status(status) == MCC_STATUS_FAILED))) {
4818 4819 4820 4821 4822
			continue;
		} else if (status) {
			dev_err(dev, "Flashing section type 0x%x failed\n",
				img_type);
			return -EFAULT;
4823 4824 4825
		}
	}
	return 0;
4826 4827
}

4828
static int lancer_fw_download(struct be_adapter *adapter,
4829
			      const struct firmware *fw)
4830
{
4831 4832
#define LANCER_FW_DOWNLOAD_CHUNK      (32 * 1024)
#define LANCER_FW_DOWNLOAD_LOCATION   "/prg"
4833
	struct device *dev = &adapter->pdev->dev;
4834
	struct be_dma_mem flash_cmd;
4835 4836 4837 4838 4839 4840 4841 4842
	const u8 *data_ptr = NULL;
	u8 *dest_image_ptr = NULL;
	size_t image_size = 0;
	u32 chunk_size = 0;
	u32 data_written = 0;
	u32 offset = 0;
	int status = 0;
	u8 add_status = 0;
4843
	u8 change_status;
4844

4845
	if (!IS_ALIGNED(fw->size, sizeof(u32))) {
4846
		dev_err(dev, "FW image size should be multiple of 4\n");
K
Kalesh AP 已提交
4847
		return -EINVAL;
4848 4849
	}

4850 4851
	flash_cmd.size = sizeof(struct lancer_cmd_req_write_object)
				+ LANCER_FW_DOWNLOAD_CHUNK;
4852 4853
	flash_cmd.va = dma_zalloc_coherent(dev, flash_cmd.size,
					   &flash_cmd.dma, GFP_KERNEL);
K
Kalesh AP 已提交
4854 4855
	if (!flash_cmd.va)
		return -ENOMEM;
4856

4857 4858 4859 4860 4861 4862 4863 4864 4865 4866 4867 4868
	dest_image_ptr = flash_cmd.va +
				sizeof(struct lancer_cmd_req_write_object);
	image_size = fw->size;
	data_ptr = fw->data;

	while (image_size) {
		chunk_size = min_t(u32, image_size, LANCER_FW_DOWNLOAD_CHUNK);

		/* Copy the image chunk content. */
		memcpy(dest_image_ptr, data_ptr, chunk_size);

		status = lancer_cmd_write_object(adapter, &flash_cmd,
4869 4870 4871 4872
						 chunk_size, offset,
						 LANCER_FW_DOWNLOAD_LOCATION,
						 &data_written, &change_status,
						 &add_status);
4873 4874 4875 4876 4877 4878 4879 4880 4881 4882 4883
		if (status)
			break;

		offset += data_written;
		data_ptr += data_written;
		image_size -= data_written;
	}

	if (!status) {
		/* Commit the FW written */
		status = lancer_cmd_write_object(adapter, &flash_cmd,
4884 4885 4886 4887
						 0, offset,
						 LANCER_FW_DOWNLOAD_LOCATION,
						 &data_written, &change_status,
						 &add_status);
4888 4889
	}

4890
	dma_free_coherent(dev, flash_cmd.size, flash_cmd.va, flash_cmd.dma);
4891
	if (status) {
4892
		dev_err(dev, "Firmware load error\n");
K
Kalesh AP 已提交
4893
		return be_cmd_status(status);
4894 4895
	}

4896 4897
	dev_info(dev, "Firmware flashed successfully\n");

4898
	if (change_status == LANCER_FW_RESET_NEEDED) {
4899
		dev_info(dev, "Resetting adapter to activate new FW\n");
4900 4901
		status = lancer_physdev_ctrl(adapter,
					     PHYSDEV_CONTROL_FW_RESET_MASK);
4902
		if (status) {
4903 4904
			dev_err(dev, "Adapter busy, could not reset FW\n");
			dev_err(dev, "Reboot server to activate new FW\n");
4905 4906
		}
	} else if (change_status != LANCER_NO_RESET_NEEDED) {
4907
		dev_info(dev, "Reboot server to activate new FW\n");
4908
	}
K
Kalesh AP 已提交
4909 4910

	return 0;
4911 4912
}

4913 4914 4915 4916 4917
/* Check if the flash image file is compatible with the adapter that
 * is being flashed.
 */
static bool be_check_ufi_compatibility(struct be_adapter *adapter,
				       struct flash_file_hdr_g3 *fhdr)
4918
{
4919 4920 4921 4922
	if (!fhdr) {
		dev_err(&adapter->pdev->dev, "Invalid FW UFI file");
		return -1;
	}
4923

4924 4925 4926 4927 4928
	/* First letter of the build version is used to identify
	 * which chip this image file is meant for.
	 */
	switch (fhdr->build[0]) {
	case BLD_STR_UFI_TYPE_SH:
4929 4930 4931
		if (!skyhawk_chip(adapter))
			return false;
		break;
4932
	case BLD_STR_UFI_TYPE_BE3:
4933 4934 4935
		if (!BE3_chip(adapter))
			return false;
		break;
4936
	case BLD_STR_UFI_TYPE_BE2:
4937 4938 4939
		if (!BE2_chip(adapter))
			return false;
		break;
4940 4941 4942
	default:
		return false;
	}
4943 4944

	return (fhdr->asic_type_rev >= adapter->asic_rev);
4945 4946
}

4947 4948
static int be_fw_download(struct be_adapter *adapter, const struct firmware* fw)
{
4949
	struct device *dev = &adapter->pdev->dev;
4950
	struct flash_file_hdr_g3 *fhdr3;
4951 4952
	struct image_hdr *img_hdr_ptr;
	int status = 0, i, num_imgs;
4953
	struct be_dma_mem flash_cmd;
4954

4955 4956 4957 4958
	fhdr3 = (struct flash_file_hdr_g3 *)fw->data;
	if (!be_check_ufi_compatibility(adapter, fhdr3)) {
		dev_err(dev, "Flash image is not compatible with adapter\n");
		return -EINVAL;
4959 4960
	}

4961
	flash_cmd.size = sizeof(struct be_cmd_write_flashrom);
4962 4963
	flash_cmd.va = dma_zalloc_coherent(dev, flash_cmd.size, &flash_cmd.dma,
					   GFP_KERNEL);
4964 4965
	if (!flash_cmd.va)
		return -ENOMEM;
4966 4967 4968 4969 4970 4971

	num_imgs = le32_to_cpu(fhdr3->num_imgs);
	for (i = 0; i < num_imgs; i++) {
		img_hdr_ptr = (struct image_hdr *)(fw->data +
				(sizeof(struct flash_file_hdr_g3) +
				 i * sizeof(struct image_hdr)));
4972 4973 4974
		if (!BE2_chip(adapter) &&
		    le32_to_cpu(img_hdr_ptr->imageid) != 1)
			continue;
4975

4976 4977 4978 4979 4980 4981
		if (skyhawk_chip(adapter))
			status = be_flash_skyhawk(adapter, fw, &flash_cmd,
						  num_imgs);
		else
			status = be_flash_BEx(adapter, fw, &flash_cmd,
					      num_imgs);
4982 4983
	}

4984 4985 4986
	dma_free_coherent(dev, flash_cmd.size, flash_cmd.va, flash_cmd.dma);
	if (!status)
		dev_info(dev, "Firmware flashed successfully\n");
4987

4988 4989 4990 4991 4992 4993 4994 4995 4996 4997 4998
	return status;
}

/* Load the named firmware file and flash it onto the adapter.
 *
 * Flashing is refused with -ENETDOWN while the interface is down. On a
 * successful flash the FW version is re-read via be_cmd_get_fw_ver().
 * Returns 0 on success or the error from request_firmware() or the
 * chip-specific download routine.
 */
int be_load_fw(struct be_adapter *adapter, u8 *fw_file)
{
	struct device *dev = &adapter->pdev->dev;
	const struct firmware *fw;
	int status;

	if (!netif_running(adapter->netdev)) {
		dev_err(dev, "Firmware load not allowed (interface is down)\n");
		return -ENETDOWN;
	}

	status = request_firmware(&fw, fw_file, dev);
	if (!status) {
		dev_info(dev, "Flashing firmware file %s\n", fw_file);

		/* Lancer uses its own download protocol */
		status = lancer_chip(adapter) ?
			 lancer_fw_download(adapter, fw) :
			 be_fw_download(adapter, fw);

		if (!status)
			be_cmd_get_fw_ver(adapter);
	}

	release_firmware(fw);
	return status;
}

5021 5022
/* ndo_bridge_setlink handler: program the requested switch mode (VEB or
 * VEPA) taken from the IFLA_BRIDGE_MODE attribute nested in IFLA_AF_SPEC.
 *
 * Returns -EOPNOTSUPP when SR-IOV is not enabled, -EINVAL for a missing
 * IFLA_AF_SPEC or a malformed/unsupported mode, otherwise the status of
 * be_cmd_set_hsw_config().
 */
static int be_ndo_bridge_setlink(struct net_device *dev, struct nlmsghdr *nlh,
				 u16 flags)
{
	struct be_adapter *adapter = netdev_priv(dev);
	struct nlattr *af_spec, *cur;
	u16 mode = 0;
	int status = 0;
	int remaining;

	if (!sriov_enabled(adapter))
		return -EOPNOTSUPP;

	af_spec = nlmsg_find_attr(nlh, sizeof(struct ifinfomsg), IFLA_AF_SPEC);
	if (!af_spec)
		return -EINVAL;

	nla_for_each_nested(cur, af_spec, remaining) {
		if (nla_type(cur) != IFLA_BRIDGE_MODE)
			continue;

		if (nla_len(cur) < sizeof(mode))
			return -EINVAL;

		mode = nla_get_u16(cur);
		if (mode != BRIDGE_MODE_VEPA && mode != BRIDGE_MODE_VEB)
			return -EINVAL;

		status = be_cmd_set_hsw_config(adapter, 0, 0,
					       adapter->if_handle,
					       mode == BRIDGE_MODE_VEPA ?
					       PORT_FWD_TYPE_VEPA :
					       PORT_FWD_TYPE_VEB, 0);
		if (status)
			break;

		dev_info(&adapter->pdev->dev, "enabled switch mode: %s\n",
			 mode == BRIDGE_MODE_VEPA ? "VEPA" : "VEB");

		return status;
	}

	/* Reached when the command failed, and also when no
	 * IFLA_BRIDGE_MODE attribute was present in the request.
	 */
	dev_err(&adapter->pdev->dev, "Failed to set switch mode %s\n",
		mode == BRIDGE_MODE_VEPA ? "VEPA" : "VEB");

	return status;
}

/* ndo_bridge_getlink handler: report the current switch mode (VEB or VEPA)
 * through ndo_dflt_bridge_getlink().
 *
 * Returns 0 without reporting anything when SR-IOV is not enabled or when
 * the mode query fails.
 */
static int be_ndo_bridge_getlink(struct sk_buff *skb, u32 pid, u32 seq,
				 struct net_device *dev, u32 filter_mask,
				 int nlflags)
{
	struct be_adapter *adapter = netdev_priv(dev);
	u8 hsw_mode;
	int status = 0;

	if (!sriov_enabled(adapter))
		return 0;

	if (!BEx_chip(adapter) && !lancer_chip(adapter)) {
		/* Other chips are asked for their configured mode */
		status = be_cmd_get_hsw_config(adapter, NULL, 0,
					       adapter->if_handle, &hsw_mode,
					       NULL);
		if (status)
			return 0;
	} else {
		/* BE and Lancer chips support VEB mode only */
		hsw_mode = PORT_FWD_TYPE_VEB;
	}

	return ndo_dflt_bridge_getlink(skb, pid, seq, dev,
				       hsw_mode == PORT_FWD_TYPE_VEPA ?
				       BRIDGE_MODE_VEPA : BRIDGE_MODE_VEB,
				       0, 0, nlflags, filter_mask, NULL);
}

5096
#ifdef CONFIG_BE2NET_VXLAN
5097 5098 5099 5100 5101 5102
/* VxLAN offload Notes:
 *
 * The stack defines tunnel offload flags (hw_enc_features) for IP and doesn't
 * distinguish various types of transports (VxLAN, GRE, NVGRE ..). So, offload
 * is expected to work across all types of IP tunnels once exported. Skyhawk
 * supports offloads for either VxLAN or NVGRE, exclusively. So we export VxLAN
 * offloads in hw_enc_features only when a VxLAN port is added. If other (non
 * VxLAN) tunnels are configured while VxLAN offloads are enabled, offloads for
 * those other tunnels are unexported on the fly through ndo_features_check().
 *
 * Skyhawk supports VxLAN offloads only for one UDP dport. So, if the stack
 * adds more than one port, disable offloads and don't re-enable them again
 * until after all the tunnels are removed.
 */
5111 5112 5113 5114 5115 5116 5117 5118 5119 5120 5121 5122 5123
/* ndo_add_vxlan_port handler.
 *
 * Enables VxLAN offloads for the first UDP port added. If offloads are
 * already enabled when another port is added, or if either FW command
 * fails, offloads are disabled via be_disable_vxlan_offloads(). Nothing is
 * done on Lancer and BEx chips.
 */
static void be_add_vxlan_port(struct net_device *netdev, sa_family_t sa_family,
			      __be16 port)
{
	struct be_adapter *adapter = netdev_priv(netdev);
	struct device *dev = &adapter->pdev->dev;

	if (BEx_chip(adapter) || lancer_chip(adapter))
		return;

	if (adapter->flags & BE_FLAGS_VXLAN_OFFLOADS) {
		dev_info(dev,
			 "Only one UDP port supported for VxLAN offloads\n");
		dev_info(dev, "Disabling VxLAN offloads\n");
		adapter->vxlan_port_count++;
		goto disable_offloads;
	}

	/* Only count the port if one has already been seen */
	if (adapter->vxlan_port_count++ >= 1)
		return;

	if (be_cmd_manage_iface(adapter, adapter->if_handle,
				OP_CONVERT_NORMAL_TO_TUNNEL)) {
		dev_warn(dev, "Failed to convert normal interface to tunnel\n");
		goto disable_offloads;
	}

	if (be_cmd_set_vxlan_port(adapter, port)) {
		dev_warn(dev, "Failed to add VxLAN port\n");
		goto disable_offloads;
	}

	adapter->flags |= BE_FLAGS_VXLAN_OFFLOADS;
	adapter->vxlan_port = port;

	/* Export the tunnel offloads now that a VxLAN port is programmed */
	netdev->hw_enc_features |= NETIF_F_IP_CSUM | NETIF_F_IPV6_CSUM |
				   NETIF_F_TSO | NETIF_F_TSO6 |
				   NETIF_F_GSO_UDP_TUNNEL;
	netdev->hw_features |= NETIF_F_GSO_UDP_TUNNEL;
	netdev->features |= NETIF_F_GSO_UDP_TUNNEL;

	dev_info(dev, "Enabled VxLAN offloads for UDP port %d\n",
		 be16_to_cpu(port));
	return;

disable_offloads:
	be_disable_vxlan_offloads(adapter);
}

/* ndo_del_vxlan_port handler.
 *
 * Disables VxLAN offloads when the port being removed is the one recorded in
 * adapter->vxlan_port; the port count is decremented in either case.
 * Nothing is done on Lancer and BEx chips.
 */
static void be_del_vxlan_port(struct net_device *netdev, sa_family_t sa_family,
			      __be16 port)
{
	struct be_adapter *adapter = netdev_priv(netdev);

	if (BEx_chip(adapter) || lancer_chip(adapter))
		return;

	if (adapter->vxlan_port == port) {
		be_disable_vxlan_offloads(adapter);

		dev_info(&adapter->pdev->dev,
			 "Disabled VxLAN offloads for UDP port %d\n",
			 be16_to_cpu(port));
	}

	adapter->vxlan_port_count--;
}
J
Joe Stringer 已提交
5179

5180 5181 5182
/* ndo_features_check handler.
 *
 * Offload features for normal (non tunnel) packets are returned unchanged.
 * For encapsulated packets, while VxLAN offloads are enabled, checksum and
 * GSO features are stripped unless the packet looks like VxLAN, so that other
 * tunneled traffic such as GRE keeps working.
 */
static netdev_features_t be_features_check(struct sk_buff *skb,
					   struct net_device *dev,
					   netdev_features_t features)
{
	struct be_adapter *adapter = netdev_priv(dev);
	__be16 proto;
	u8 l4_hdr = 0;

	if (!skb->encapsulation ||
	    !(adapter->flags & BE_FLAGS_VXLAN_OFFLOADS))
		return features;

	/* Find the L4 protocol of the outer header; anything other than
	 * IPv4/IPv6 is left untouched.
	 */
	proto = vlan_get_protocol(skb);
	if (proto == htons(ETH_P_IP))
		l4_hdr = ip_hdr(skb)->protocol;
	else if (proto == htons(ETH_P_IPV6))
		l4_hdr = ipv6_hdr(skb)->nexthdr;
	else
		return features;

	/* VxLAN: UDP outer transport carrying an Ethernet frame, with the
	 * inner MAC header exactly one UDP + VxLAN header past the
	 * transport header.
	 */
	if (l4_hdr == IPPROTO_UDP &&
	    skb->inner_protocol_type == ENCAP_TYPE_ETHER &&
	    skb->inner_protocol == htons(ETH_P_TEB) &&
	    skb_inner_mac_header(skb) - skb_transport_header(skb) ==
	    sizeof(struct udphdr) + sizeof(struct vxlanhdr))
		return features;

	return features & ~(NETIF_F_ALL_CSUM | NETIF_F_GSO_MASK);
}
5220
#endif
5221

5222
static const struct net_device_ops be_netdev_ops = {
S
Sathya Perla 已提交
5223 5224 5225
	.ndo_open		= be_open,
	.ndo_stop		= be_close,
	.ndo_start_xmit		= be_xmit,
5226
	.ndo_set_rx_mode	= be_set_rx_mode,
S
Sathya Perla 已提交
5227 5228
	.ndo_set_mac_address	= be_mac_addr_set,
	.ndo_change_mtu		= be_change_mtu,
5229
	.ndo_get_stats64	= be_get_stats64,
S
Sathya Perla 已提交
5230 5231 5232
	.ndo_validate_addr	= eth_validate_addr,
	.ndo_vlan_rx_add_vid	= be_vlan_add_vid,
	.ndo_vlan_rx_kill_vid	= be_vlan_rem_vid,
5233
	.ndo_set_vf_mac		= be_set_vf_mac,
5234
	.ndo_set_vf_vlan	= be_set_vf_vlan,
5235
	.ndo_set_vf_rate	= be_set_vf_tx_rate,
I
Ivan Vecera 已提交
5236
	.ndo_get_vf_config	= be_get_vf_config,
5237
	.ndo_set_vf_link_state  = be_set_vf_link_state,
5238
	.ndo_set_vf_spoofchk    = be_set_vf_spoofchk,
I
Ivan Vecera 已提交
5239 5240 5241
#ifdef CONFIG_NET_POLL_CONTROLLER
	.ndo_poll_controller	= be_netpoll,
#endif
5242 5243
	.ndo_bridge_setlink	= be_ndo_bridge_setlink,
	.ndo_bridge_getlink	= be_ndo_bridge_getlink,
5244
#ifdef CONFIG_NET_RX_BUSY_POLL
5245
	.ndo_busy_poll		= be_busy_poll,
5246
#endif
5247
#ifdef CONFIG_BE2NET_VXLAN
5248 5249
	.ndo_add_vxlan_port	= be_add_vxlan_port,
	.ndo_del_vxlan_port	= be_del_vxlan_port,
5250
	.ndo_features_check	= be_features_check,
5251
#endif
S
Sathya Perla 已提交
5252 5253 5254 5255 5256 5257
};

static void be_netdev_init(struct net_device *netdev)
{
	struct be_adapter *adapter = netdev_priv(netdev);

5258
	netdev->hw_features |= NETIF_F_SG | NETIF_F_TSO | NETIF_F_TSO6 |
5259
		NETIF_F_IP_CSUM | NETIF_F_IPV6_CSUM | NETIF_F_RXCSUM |
5260
		NETIF_F_HW_VLAN_CTAG_TX;
5261 5262
	if (be_multi_rxq(adapter))
		netdev->hw_features |= NETIF_F_RXHASH;
5263 5264

	netdev->features |= netdev->hw_features |
5265
		NETIF_F_HW_VLAN_CTAG_RX | NETIF_F_HW_VLAN_CTAG_FILTER;
A
Ajit Khaparde 已提交
5266

5267
	netdev->vlan_features |= NETIF_F_SG | NETIF_F_TSO | NETIF_F_TSO6 |
5268
		NETIF_F_IP_CSUM | NETIF_F_IPV6_CSUM;
5269

5270 5271
	netdev->priv_flags |= IFF_UNICAST_FLT;

S
Sathya Perla 已提交
5272 5273
	netdev->flags |= IFF_MULTICAST;

5274
	netif_set_gso_max_size(netdev, 65535 - ETH_HLEN);
5275

S
Sathya Perla 已提交
5276
	netdev->netdev_ops = &be_netdev_ops;
S
Sathya Perla 已提交
5277

5278
	netdev->ethtool_ops = &be_ethtool_ops;
S
Sathya Perla 已提交
5279 5280
}

5281 5282 5283 5284 5285 5286 5287 5288 5289 5290 5291 5292 5293
/* Detach the netdev, close it if it is running (both under the RTNL lock),
 * then tear the adapter down with be_clear().
 */
static void be_cleanup(struct be_adapter *adapter)
{
	struct net_device *ndev = adapter->netdev;

	rtnl_lock();

	netif_device_detach(ndev);
	if (netif_running(ndev))
		be_close(ndev);

	rtnl_unlock();

	be_clear(adapter);
}

5294
static int be_resume(struct be_adapter *adapter)
5295
{
5296
	struct net_device *netdev = adapter->netdev;
5297 5298 5299 5300
	int status;

	status = be_setup(adapter);
	if (status)
5301
		return status;
5302

5303 5304
	if (netif_running(netdev)) {
		status = be_open(netdev);
5305
		if (status)
5306
			return status;
5307 5308
	}

5309 5310
	netif_device_attach(netdev);

5311 5312 5313 5314 5315 5316 5317 5318 5319 5320 5321 5322
	return 0;
}

/* Try to recover the adapter through be_resume() and log the outcome.
 * Returns 0 on success or the be_resume() error.
 */
static int be_err_recover(struct be_adapter *adapter)
{
	struct device *dev = &adapter->pdev->dev;
	int status = be_resume(adapter);

	if (!status) {
		dev_info(dev, "Adapter recovery successful\n");
		return 0;
	}

	/* The message differs for PFs and VFs */
	if (be_physfn(adapter))
		dev_err(dev, "Adapter recovery failed\n");
	else
		dev_err(dev, "Re-trying adapter recovery\n");

	return status;
}

5334
static void be_err_detection_task(struct work_struct *work)
5335 5336
{
	struct be_adapter *adapter =
5337 5338
				container_of(work, struct be_adapter,
					     be_err_detection_work.work);
5339 5340 5341 5342
	int status = 0;

	be_detect_error(adapter);

5343
	if (be_check_error(adapter, BE_ERROR_HW)) {
5344
		be_cleanup(adapter);
5345 5346 5347 5348

		/* As of now error recovery support is in Lancer only */
		if (lancer_chip(adapter))
			status = be_err_recover(adapter);
5349 5350
	}

5351 5352
	/* Always attempt recovery on VFs */
	if (!status || be_virtfn(adapter))
5353
		be_schedule_err_detection(adapter);
5354 5355 5356 5357 5358 5359 5360 5361 5362 5363 5364 5365 5366 5367 5368 5369 5370 5371 5372 5373 5374 5375 5376 5377 5378 5379 5380 5381 5382 5383 5384 5385 5386 5387 5388 5389 5390 5391 5392 5393 5394 5395 5396 5397 5398 5399 5400 5401 5402 5403 5404 5405 5406
}

/* Query the SFP info and, if the query succeeds, log the unqualified module
 * details; the BE_FLAGS_EVT_INCOMPATIBLE_SFP flag is cleared in either case.
 */
static void be_log_sfp_info(struct be_adapter *adapter)
{
	if (!be_cmd_query_sfp_info(adapter))
		dev_err(&adapter->pdev->dev,
			"Unqualified SFP+ detected on %c from %s part no: %s",
			adapter->port_name, adapter->phy.vendor_name,
			adapter->phy.vendor_pn);

	adapter->flags &= ~BE_FLAGS_EVT_INCOMPATIBLE_SFP;
}

static void be_worker(struct work_struct *work)
{
	struct be_adapter *adapter =
		container_of(work, struct be_adapter, work.work);
	struct be_rx_obj *rxo;
	int i;

	/* when interrupts are not yet enabled, just reap any pending
	 * mcc completions
	 */
	if (!netif_running(adapter->netdev)) {
		local_bh_disable();
		be_process_mcc(adapter);
		local_bh_enable();
		goto reschedule;
	}

	if (!adapter->stats_cmd_sent) {
		if (lancer_chip(adapter))
			lancer_cmd_get_pport_stats(adapter,
						   &adapter->stats_cmd);
		else
			be_cmd_get_stats(adapter, &adapter->stats_cmd);
	}

	if (be_physfn(adapter) &&
	    MODULO(adapter->work_counter, adapter->be_get_temp_freq) == 0)
		be_cmd_get_die_temperature(adapter);

	for_all_rx_queues(adapter, rxo, i) {
		/* Replenish RX-queues starved due to memory
		 * allocation failures.
		 */
		if (rxo->rx_post_starved)
			be_post_rx_frags(rxo, GFP_KERNEL, MAX_RX_POST);
	}

5407 5408 5409
	/* EQ-delay update for Skyhawk is done while notifying EQ */
	if (!skyhawk_chip(adapter))
		be_eqd_update(adapter, false);
5410 5411 5412 5413 5414 5415 5416 5417 5418

	if (adapter->flags & BE_FLAGS_EVT_INCOMPATIBLE_SFP)
		be_log_sfp_info(adapter);

reschedule:
	adapter->work_counter++;
	schedule_delayed_work(&adapter->work, msecs_to_jiffies(1000));
}

S
Sathya Perla 已提交
5419 5420
static void be_unmap_pci_bars(struct be_adapter *adapter)
{
5421 5422
	if (adapter->csr)
		pci_iounmap(adapter->pdev, adapter->csr);
5423
	if (adapter->db)
S
Sathya Perla 已提交
5424
		pci_iounmap(adapter->pdev, adapter->db);
5425 5426
}

S
Sathya Perla 已提交
5427 5428
/* BAR number holding the doorbell registers: 0 on Lancer chips and on VFs,
 * 4 otherwise.
 */
static int db_bar(struct be_adapter *adapter)
{
	return (lancer_chip(adapter) || be_virtfn(adapter)) ? 0 : 4;
}

static int be_roce_map_pci_bars(struct be_adapter *adapter)
5436
{
S
Sathya Perla 已提交
5437
	if (skyhawk_chip(adapter)) {
S
Sathya Perla 已提交
5438 5439 5440 5441 5442 5443
		adapter->roce_db.size = 4096;
		adapter->roce_db.io_addr = pci_resource_start(adapter->pdev,
							      db_bar(adapter));
		adapter->roce_db.total_size = pci_resource_len(adapter->pdev,
							       db_bar(adapter));
	}
5444
	return 0;
S
Sathya Perla 已提交
5445 5446 5447 5448
}

static int be_map_pci_bars(struct be_adapter *adapter)
{
5449
	struct pci_dev *pdev = adapter->pdev;
S
Sathya Perla 已提交
5450
	u8 __iomem *addr;
5451 5452 5453 5454 5455 5456
	u32 sli_intf;

	pci_read_config_dword(adapter->pdev, SLI_INTF_REG_OFFSET, &sli_intf);
	adapter->sli_family = (sli_intf & SLI_INTF_FAMILY_MASK) >>
				SLI_INTF_FAMILY_SHIFT;
	adapter->virtfn = (sli_intf & SLI_INTF_FT_MASK) ? 1 : 0;
5457

5458
	if (BEx_chip(adapter) && be_physfn(adapter)) {
5459
		adapter->csr = pci_iomap(pdev, 2, 0);
K
Kalesh AP 已提交
5460
		if (!adapter->csr)
5461 5462 5463
			return -ENOMEM;
	}

5464
	addr = pci_iomap(pdev, db_bar(adapter), 0);
K
Kalesh AP 已提交
5465
	if (!addr)
S
Sathya Perla 已提交
5466
		goto pci_map_err;
5467
	adapter->db = addr;
S
Sathya Perla 已提交
5468

5469 5470 5471 5472 5473 5474 5475 5476 5477 5478 5479 5480
	if (skyhawk_chip(adapter) || BEx_chip(adapter)) {
		if (be_physfn(adapter)) {
			/* PCICFG is the 2nd BAR in BE2 */
			addr = pci_iomap(pdev, BE2_chip(adapter) ? 1 : 0, 0);
			if (!addr)
				goto pci_map_err;
			adapter->pcicfg = addr;
		} else {
			adapter->pcicfg = adapter->db + SRIOV_VF_PCICFG_OFFSET;
		}
	}

S
Sathya Perla 已提交
5481
	be_roce_map_pci_bars(adapter);
S
Sathya Perla 已提交
5482
	return 0;
S
Sathya Perla 已提交
5483

S
Sathya Perla 已提交
5484
pci_map_err:
5485
	dev_err(&pdev->dev, "Error in mapping PCI BARs\n");
S
Sathya Perla 已提交
5486 5487 5488 5489
	be_unmap_pci_bars(adapter);
	return -ENOMEM;
}

5490
static void be_drv_cleanup(struct be_adapter *adapter)
S
Sathya Perla 已提交
5491
{
5492
	struct be_dma_mem *mem = &adapter->mbox_mem_alloced;
5493
	struct device *dev = &adapter->pdev->dev;
S
Sathya Perla 已提交
5494 5495

	if (mem->va)
5496
		dma_free_coherent(dev, mem->size, mem->va, mem->dma);
5497

5498
	mem = &adapter->rx_filter;
5499
	if (mem->va)
5500 5501 5502 5503 5504
		dma_free_coherent(dev, mem->size, mem->va, mem->dma);

	mem = &adapter->stats_cmd;
	if (mem->va)
		dma_free_coherent(dev, mem->size, mem->va, mem->dma);
S
Sathya Perla 已提交
5505 5506
}

5507 5508
/* Allocate and initialize various fields in be_adapter struct */
static int be_drv_init(struct be_adapter *adapter)
S
Sathya Perla 已提交
5509
{
5510 5511
	struct be_dma_mem *mbox_mem_alloc = &adapter->mbox_mem_alloced;
	struct be_dma_mem *mbox_mem_align = &adapter->mbox_mem;
5512
	struct be_dma_mem *rx_filter = &adapter->rx_filter;
5513 5514 5515
	struct be_dma_mem *stats_cmd = &adapter->stats_cmd;
	struct device *dev = &adapter->pdev->dev;
	int status = 0;
S
Sathya Perla 已提交
5516 5517

	mbox_mem_alloc->size = sizeof(struct be_mcc_mailbox) + 16;
5518 5519 5520
	mbox_mem_alloc->va = dma_zalloc_coherent(dev, mbox_mem_alloc->size,
						 &mbox_mem_alloc->dma,
						 GFP_KERNEL);
5521 5522 5523
	if (!mbox_mem_alloc->va)
		return -ENOMEM;

S
Sathya Perla 已提交
5524 5525 5526
	mbox_mem_align->size = sizeof(struct be_mcc_mailbox);
	mbox_mem_align->va = PTR_ALIGN(mbox_mem_alloc->va, 16);
	mbox_mem_align->dma = PTR_ALIGN(mbox_mem_alloc->dma, 16);
5527

5528
	rx_filter->size = sizeof(struct be_cmd_req_rx_filter);
5529 5530
	rx_filter->va = dma_zalloc_coherent(dev, rx_filter->size,
					    &rx_filter->dma, GFP_KERNEL);
K
Kalesh AP 已提交
5531
	if (!rx_filter->va) {
5532 5533 5534
		status = -ENOMEM;
		goto free_mbox;
	}
5535

5536 5537 5538 5539 5540 5541 5542 5543 5544 5545 5546 5547 5548 5549 5550
	if (lancer_chip(adapter))
		stats_cmd->size = sizeof(struct lancer_cmd_req_pport_stats);
	else if (BE2_chip(adapter))
		stats_cmd->size = sizeof(struct be_cmd_req_get_stats_v0);
	else if (BE3_chip(adapter))
		stats_cmd->size = sizeof(struct be_cmd_req_get_stats_v1);
	else
		stats_cmd->size = sizeof(struct be_cmd_req_get_stats_v2);
	stats_cmd->va = dma_zalloc_coherent(dev, stats_cmd->size,
					    &stats_cmd->dma, GFP_KERNEL);
	if (!stats_cmd->va) {
		status = -ENOMEM;
		goto free_rx_filter;
	}

5551
	mutex_init(&adapter->mbox_lock);
5552 5553
	spin_lock_init(&adapter->mcc_lock);
	spin_lock_init(&adapter->mcc_cq_lock);
5554
	init_completion(&adapter->et_cmd_compl);
5555

5556
	pci_save_state(adapter->pdev);
S
Sathya Perla 已提交
5557

5558
	INIT_DELAYED_WORK(&adapter->work, be_worker);
5559 5560
	INIT_DELAYED_WORK(&adapter->be_err_detection_work,
			  be_err_detection_task);
S
Sathya Perla 已提交
5561

5562 5563
	adapter->rx_fc = true;
	adapter->tx_fc = true;
S
Sathya Perla 已提交
5564

5565 5566
	/* Must be a power of 2 or else MODULO will BUG_ON */
	adapter->be_get_temp_freq = 64;
5567

S
Sathya Perla 已提交
5568
	return 0;
5569 5570 5571 5572 5573 5574 5575

free_rx_filter:
	dma_free_coherent(dev, rx_filter->size, rx_filter->va, rx_filter->dma);
free_mbox:
	dma_free_coherent(dev, mbox_mem_alloc->size, mbox_mem_alloc->va,
			  mbox_mem_alloc->dma);
	return status;
S
Sathya Perla 已提交
5576 5577
}

B
Bill Pemberton 已提交
5578
static void be_remove(struct pci_dev *pdev)
S
Sathya Perla 已提交
5579 5580
{
	struct be_adapter *adapter = pci_get_drvdata(pdev);
5581

S
Sathya Perla 已提交
5582 5583 5584
	if (!adapter)
		return;

5585
	be_roce_dev_remove(adapter);
5586
	be_intr_set(adapter, false);
5587

5588
	be_cancel_err_detection(adapter);
5589

S
Sathya Perla 已提交
5590 5591
	unregister_netdev(adapter->netdev);

5592 5593
	be_clear(adapter);

5594 5595 5596
	/* tell fw we're done with firing cmds */
	be_cmd_fw_clean(adapter);

5597 5598
	be_unmap_pci_bars(adapter);
	be_drv_cleanup(adapter);
S
Sathya Perla 已提交
5599

S
Sathya Perla 已提交
5600 5601
	pci_disable_pcie_error_reporting(pdev);

S
Sathya Perla 已提交
5602 5603 5604 5605 5606 5607
	pci_release_regions(pdev);
	pci_disable_device(pdev);

	free_netdev(adapter->netdev);
}

5608 5609 5610
static ssize_t be_hwmon_show_temp(struct device *dev,
				  struct device_attribute *dev_attr,
				  char *buf)
5611 5612 5613 5614 5615 5616 5617 5618 5619 5620 5621 5622 5623 5624 5625 5626 5627 5628 5629 5630 5631
{
	struct be_adapter *adapter = dev_get_drvdata(dev);

	/* Unit: millidegree Celsius */
	if (adapter->hwmon_info.be_on_die_temp == BE_INVALID_DIE_TEMP)
		return -EIO;
	else
		return sprintf(buf, "%u\n",
			       adapter->hwmon_info.be_on_die_temp * 1000);
}

/* Read-only (S_IRUGO, no store handler) temp1_input attribute whose value is
 * produced by be_hwmon_show_temp().
 */
static SENSOR_DEVICE_ATTR(temp1_input, S_IRUGO,
			  be_hwmon_show_temp, NULL, 1);

/* NULL-terminated list of the hwmon attributes exposed by the driver */
static struct attribute *be_hwmon_attrs[] = {
	&sensor_dev_attr_temp1_input.dev_attr.attr,
	NULL
};

/* Provides be_hwmon_groups, which be_probe() passes to the hwmon core */
ATTRIBUTE_GROUPS(be_hwmon);

S
Sathya Perla 已提交
5632 5633
/* Printable name for the adapter's mc_type; an empty string is returned for
 * any value not listed.
 */
static char *mc_name(struct be_adapter *adapter)
{
	switch (adapter->mc_type) {
	case UMC:
		return "UMC";
	case FLEX10:
		return "FLEX10";
	case vNIC1:
		return "vNIC-1";
	case nPAR:
		return "nPAR";
	case UFP:
		return "UFP";
	case vNIC2:
		return "vNIC-2";
	default:
		return "";
	}
}

/* "PF" for a physical function, "VF" otherwise */
static inline char *func_name(struct be_adapter *adapter)
{
	if (be_physfn(adapter))
		return "PF";

	return "VF";
}

5667 5668 5669 5670 5671 5672 5673 5674 5675 5676 5677 5678 5679 5680 5681 5682 5683 5684 5685 5686
/* Product name string for the PCI device id; BE_NAME is used for any id not
 * listed.
 */
static inline char *nic_name(struct pci_dev *pdev)
{
	char *name = BE_NAME;

	switch (pdev->device) {
	case OC_DEVICE_ID1:
		name = OC_NAME;
		break;
	case OC_DEVICE_ID2:
		name = OC_NAME_BE;
		break;
	case OC_DEVICE_ID3:
	case OC_DEVICE_ID4:
		name = OC_NAME_LANCER;
		break;
	case BE_DEVICE_ID2:
		name = BE3_NAME;
		break;
	case OC_DEVICE_ID5:
	case OC_DEVICE_ID6:
		name = OC_NAME_SH;
		break;
	default:
		break;
	}

	return name;
}

5687
static int be_probe(struct pci_dev *pdev, const struct pci_device_id *pdev_id)
S
Sathya Perla 已提交
5688 5689 5690
{
	struct be_adapter *adapter;
	struct net_device *netdev;
5691
	int status = 0;
S
Sathya Perla 已提交
5692

S
Sathya Perla 已提交
5693 5694
	dev_info(&pdev->dev, "%s version is %s\n", DRV_NAME, DRV_VER);

S
Sathya Perla 已提交
5695 5696 5697 5698 5699 5700 5701 5702 5703
	status = pci_enable_device(pdev);
	if (status)
		goto do_none;

	status = pci_request_regions(pdev, DRV_NAME);
	if (status)
		goto disable_dev;
	pci_set_master(pdev);

5704
	netdev = alloc_etherdev_mqs(sizeof(*adapter), MAX_TX_QS, MAX_RX_QS);
K
Kalesh AP 已提交
5705
	if (!netdev) {
S
Sathya Perla 已提交
5706 5707 5708 5709 5710 5711 5712
		status = -ENOMEM;
		goto rel_reg;
	}
	adapter = netdev_priv(netdev);
	adapter->pdev = pdev;
	pci_set_drvdata(pdev, adapter);
	adapter->netdev = netdev;
5713
	SET_NETDEV_DEV(netdev, &pdev->dev);
S
Sathya Perla 已提交
5714

5715
	status = dma_set_mask_and_coherent(&pdev->dev, DMA_BIT_MASK(64));
S
Sathya Perla 已提交
5716 5717 5718
	if (!status) {
		netdev->features |= NETIF_F_HIGHDMA;
	} else {
5719
		status = dma_set_mask_and_coherent(&pdev->dev, DMA_BIT_MASK(32));
S
Sathya Perla 已提交
5720 5721 5722 5723 5724 5725
		if (status) {
			dev_err(&pdev->dev, "Could not set PCI DMA Mask\n");
			goto free_netdev;
		}
	}

5726 5727 5728
	status = pci_enable_pcie_error_reporting(pdev);
	if (!status)
		dev_info(&pdev->dev, "PCIe error reporting enabled\n");
S
Sathya Perla 已提交
5729

5730
	status = be_map_pci_bars(adapter);
S
Sathya Perla 已提交
5731
	if (status)
5732
		goto free_netdev;
S
Sathya Perla 已提交
5733

5734 5735 5736 5737
	status = be_drv_init(adapter);
	if (status)
		goto unmap_bars;

5738 5739
	status = be_setup(adapter);
	if (status)
5740
		goto drv_cleanup;
5741

5742
	be_netdev_init(netdev);
S
Sathya Perla 已提交
5743 5744
	status = register_netdev(netdev);
	if (status != 0)
5745
		goto unsetup;
S
Sathya Perla 已提交
5746

5747 5748
	be_roce_dev_add(adapter);

5749
	be_schedule_err_detection(adapter);
5750

5751
	/* On Die temperature not supported for VF. */
5752
	if (be_physfn(adapter) && IS_ENABLED(CONFIG_BE2NET_HWMON)) {
5753 5754 5755 5756 5757 5758 5759 5760
		adapter->hwmon_info.hwmon_dev =
			devm_hwmon_device_register_with_groups(&pdev->dev,
							       DRV_NAME,
							       adapter,
							       be_hwmon_groups);
		adapter->hwmon_info.be_on_die_temp = BE_INVALID_DIE_TEMP;
	}

S
Sathya Perla 已提交
5761
	dev_info(&pdev->dev, "%s: %s %s port %c\n", nic_name(pdev),
5762
		 func_name(adapter), mc_name(adapter), adapter->port_name);
5763

S
Sathya Perla 已提交
5764 5765
	return 0;

5766 5767
unsetup:
	be_clear(adapter);
5768 5769 5770 5771
drv_cleanup:
	be_drv_cleanup(adapter);
unmap_bars:
	be_unmap_pci_bars(adapter);
5772
free_netdev:
5773
	free_netdev(netdev);
S
Sathya Perla 已提交
5774 5775 5776 5777 5778
rel_reg:
	pci_release_regions(pdev);
disable_dev:
	pci_disable_device(pdev);
do_none:
5779
	dev_err(&pdev->dev, "%s initialization failed\n", nic_name(pdev));
S
Sathya Perla 已提交
5780 5781 5782 5783 5784 5785 5786
	return status;
}

/* PCI suspend callback: arm wake-on-LAN if enabled, quiesce and tear down
 * the adapter, then save PCI state and put the device into the low-power
 * state chosen for @state. Always returns 0.
 */
static int be_suspend(struct pci_dev *pdev, pm_message_t state)
{
	struct be_adapter *adapter = pci_get_drvdata(pdev);

	if (adapter->wol_en)
		be_setup_wol(adapter, true);

	be_intr_set(adapter, false);
	be_cancel_err_detection(adapter);

	be_cleanup(adapter);

	pci_save_state(pdev);
	pci_disable_device(pdev);
	pci_set_power_state(pdev, pci_choose_state(pdev, state));

	return 0;
}

5801
static int be_pci_resume(struct pci_dev *pdev)
S
Sathya Perla 已提交
5802 5803
{
	struct be_adapter *adapter = pci_get_drvdata(pdev);
5804
	int status = 0;
S
Sathya Perla 已提交
5805 5806 5807 5808 5809

	status = pci_enable_device(pdev);
	if (status)
		return status;

5810
	pci_set_power_state(pdev, PCI_D0);
S
Sathya Perla 已提交
5811 5812
	pci_restore_state(pdev);

5813
	status = be_resume(adapter);
5814 5815 5816
	if (status)
		return status;

5817 5818
	be_schedule_err_detection(adapter);

S
Suresh Reddy 已提交
5819
	if (adapter->wol_en)
5820
		be_setup_wol(adapter, false);
5821

S
Sathya Perla 已提交
5822 5823 5824
	return 0;
}

5825 5826 5827 5828 5829 5830 5831
/*
 * An FLR will stop BE from DMAing any data.
 */
static void be_shutdown(struct pci_dev *pdev)
{
	struct be_adapter *adapter = pci_get_drvdata(pdev);

5832 5833
	if (!adapter)
		return;
5834

5835
	be_roce_dev_shutdown(adapter);
5836
	cancel_delayed_work_sync(&adapter->work);
5837
	be_cancel_err_detection(adapter);
5838

5839
	netif_device_detach(adapter->netdev);
5840

5841 5842
	be_cmd_reset_function(adapter);

5843 5844 5845
	pci_disable_device(pdev);
}

5846
static pci_ers_result_t be_eeh_err_detected(struct pci_dev *pdev,
5847
					    pci_channel_state_t state)
5848 5849 5850 5851 5852
{
	struct be_adapter *adapter = pci_get_drvdata(pdev);

	dev_err(&adapter->pdev->dev, "EEH error detected\n");

5853 5854
	if (!be_check_error(adapter, BE_ERROR_EEH)) {
		be_set_error(adapter, BE_ERROR_EEH);
5855

5856
		be_cancel_err_detection(adapter);
5857

5858
		be_cleanup(adapter);
5859 5860 5861 5862 5863 5864 5865
	}

	if (state == pci_channel_io_perm_failure)
		return PCI_ERS_RESULT_DISCONNECT;

	pci_disable_device(pdev);

5866 5867
	/* The error could cause the FW to trigger a flash debug dump.
	 * Resetting the card while flash dump is in progress
5868 5869 5870
	 * can cause it not to recover; wait for it to finish.
	 * Wait only for first function as it is needed only once per
	 * adapter.
5871
	 */
5872 5873 5874
	if (pdev->devfn == 0)
		ssleep(30);

5875 5876 5877 5878 5879 5880 5881 5882 5883 5884 5885 5886 5887 5888 5889
	return PCI_ERS_RESULT_NEED_RESET;
}

static pci_ers_result_t be_eeh_reset(struct pci_dev *pdev)
{
	struct be_adapter *adapter = pci_get_drvdata(pdev);
	int status;

	dev_info(&adapter->pdev->dev, "EEH reset\n");

	status = pci_enable_device(pdev);
	if (status)
		return PCI_ERS_RESULT_DISCONNECT;

	pci_set_master(pdev);
5890
	pci_set_power_state(pdev, PCI_D0);
5891 5892 5893
	pci_restore_state(pdev);

	/* Check if card is ok and fw is ready */
5894 5895
	dev_info(&adapter->pdev->dev,
		 "Waiting for FW to be ready after EEH reset\n");
5896
	status = be_fw_wait_ready(adapter);
5897 5898 5899
	if (status)
		return PCI_ERS_RESULT_DISCONNECT;

S
Sathya Perla 已提交
5900
	pci_cleanup_aer_uncorrect_error_status(pdev);
5901
	be_clear_error(adapter, BE_CLEAR_ALL);
5902 5903 5904 5905 5906 5907 5908 5909 5910 5911 5912 5913
	return PCI_ERS_RESULT_RECOVERED;
}

/* PCI error handler: .resume callback.
 *
 * Saves the current PCI state and calls be_resume(). Error detection is
 * scheduled again only if be_resume() succeeds; a failure is logged.
 */
static void be_eeh_resume(struct pci_dev *pdev)
{
	struct be_adapter *adapter = pci_get_drvdata(pdev);
	struct device *dev = &adapter->pdev->dev;

	dev_info(dev, "EEH resume\n");

	pci_save_state(pdev);

	if (be_resume(adapter)) {
		dev_err(dev, "EEH resume failed\n");
		return;
	}

	be_schedule_err_detection(adapter);
}

5924 5925 5926 5927 5928 5929 5930 5931 5932 5933 5934 5935 5936 5937 5938 5939 5940 5941 5942 5943 5944 5945 5946 5947 5948 5949 5950 5951 5952 5953 5954 5955 5956 5957 5958 5959 5960 5961 5962 5963 5964 5965 5966 5967 5968 5969 5970 5971 5972 5973 5974 5975 5976 5977
/* PCI .sriov_configure hook.
 *
 * @num_vfs == 0 asks for VFs to be cleared; any other value asks for that
 * many VFs to be set up.
 *
 * Returns -EBUSY when VFs are to be disabled while still assigned, the
 * be_cmd_status() translation of a be_get_resources()/be_update_queues()
 * failure, adapter->num_vfs on success, and 0 if be_vf_setup() fails.
 */
static int be_pci_sriov_configure(struct pci_dev *pdev, int num_vfs)
{
	struct be_adapter *adapter = pci_get_drvdata(pdev);
	int status;

	if (!num_vfs)
		be_vf_clear(adapter);

	adapter->num_vfs = num_vfs;

	if (!adapter->num_vfs && pci_vfs_assigned(pdev)) {
		dev_warn(&pdev->dev,
			 "Cannot disable VFs while they are assigned\n");
		return -EBUSY;
	}

	/* In an SR-IOV capable configuration the PF-pool resources are
	 * split equally across the maximum number of VFs, but the user may
	 * enable only a subset of them. Redistribute the pool across the
	 * requested num_vfs so that each VF gets a larger share.
	 * BE3 FW does not offer this facility, and on Lancer chips the FW
	 * does it by itself.
	 */
	if (skyhawk_chip(adapter) && !pci_num_vf(pdev)) {
		u16 num_vf_qs = be_calculate_vf_qs(adapter, adapter->num_vfs);

		/* A failure here is only logged; configuration continues */
		status = be_cmd_set_sriov_config(adapter, adapter->pool_res,
						 adapter->num_vfs, num_vf_qs);
		if (status)
			dev_err(&pdev->dev,
				"Failed to optimize SR-IOV resources\n");
	}

	status = be_get_resources(adapter);
	if (status)
		return be_cmd_status(status);

	/* Updating real_num_tx/rx_queues() requires rtnl_lock() */
	rtnl_lock();
	status = be_update_queues(adapter);
	rtnl_unlock();
	if (status)
		return be_cmd_status(status);

	/* A failed VF setup is reported as "0 VFs enabled" */
	if (adapter->num_vfs && be_vf_setup(adapter))
		return 0;

	return adapter->num_vfs;
}

5978
static const struct pci_error_handlers be_eeh_handlers = {
5979 5980 5981 5982 5983
	.error_detected = be_eeh_err_detected,
	.slot_reset = be_eeh_reset,
	.resume = be_eeh_resume,
};

S
Sathya Perla 已提交
5984 5985 5986 5987 5988 5989
static struct pci_driver be_driver = {
	.name = DRV_NAME,
	.id_table = be_dev_ids,
	.probe = be_probe,
	.remove = be_remove,
	.suspend = be_suspend,
5990
	.resume = be_pci_resume,
5991
	.shutdown = be_shutdown,
5992
	.sriov_configure = be_pci_sriov_configure,
5993
	.err_handler = &be_eeh_handlers
S
Sathya Perla 已提交
5994 5995 5996 5997
};

/* Module entry point: validate the module parameters and register the PCI
 * driver.
 *
 * rx_frag_size is reset to 2048 (with a warning) unless it is one of
 * 2048, 4096 or 8192. A non-zero num_vfs only produces an informational
 * message pointing at the sysfs method.
 *
 * Returns the result of pci_register_driver().
 */
static int __init be_init_module(void)
{
	if (rx_frag_size != 8192 && rx_frag_size != 4096 &&
	    rx_frag_size != 2048) {
		pr_warn(DRV_NAME " : Module param rx_frag_size must be 2048/4096/8192. Using 2048\n");
		rx_frag_size = 2048;
	}

	if (num_vfs > 0) {
		/* Each message is a separate log record; terminate both */
		pr_info(DRV_NAME " : Module param num_vfs is obsolete.\n");
		pr_info(DRV_NAME " : Use sysfs method to enable VFs\n");
	}

	return pci_register_driver(&be_driver);
}
module_init(be_init_module);

/* Module exit point: unregister the PCI driver registered at init time */
static void __exit be_exit_module(void)
{
	pci_unregister_driver(&be_driver);
}
module_exit(be_exit_module);