1 /* bnx2x_cmn.c: Broadcom Everest network driver.
2  *
3  * Copyright (c) 2007-2013 Broadcom Corporation
4  *
5  * This program is free software; you can redistribute it and/or modify
6  * it under the terms of the GNU General Public License as published by
7  * the Free Software Foundation.
8  *
9  * Maintained by: Eilon Greenstein <eilong@broadcom.com>
10  * Written by: Eliezer Tamir
11  * Based on code from Michael Chan's bnx2 driver
12  * UDP CSUM errata workaround by Arik Gendelman
13  * Slowpath and fastpath rework by Vladislav Zolotarov
14  * Statistics and Link management by Yitchak Gertner
15  *
16  */
17 
18 #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
19 
20 #include <linux/etherdevice.h>
21 #include <linux/if_vlan.h>
22 #include <linux/interrupt.h>
23 #include <linux/ip.h>
24 #include <net/tcp.h>
25 #include <net/ipv6.h>
26 #include <net/ip6_checksum.h>
27 #include <net/busy_poll.h>
28 #include <linux/prefetch.h>
29 #include "bnx2x_cmn.h"
30 #include "bnx2x_init.h"
31 #include "bnx2x_sp.h"
32 
33 /**
34  * bnx2x_move_fp - move content of the fastpath structure.
35  *
36  * @bp:		driver handle
37  * @from:	source FP index
38  * @to:		destination FP index
39  *
40  * Makes sure the contents of bp->fp[to].napi are kept
41  * intact. This is done by first copying the napi struct from
42  * the target to the source, and then memcpy'ing the entire
43  * source onto the target. Txdata pointers and related
44  * content are updated as well.
45  */
46 static inline void bnx2x_move_fp(struct bnx2x *bp, int from, int to)
47 {
48 	struct bnx2x_fastpath *from_fp = &bp->fp[from];
49 	struct bnx2x_fastpath *to_fp = &bp->fp[to];
50 	struct bnx2x_sp_objs *from_sp_objs = &bp->sp_objs[from];
51 	struct bnx2x_sp_objs *to_sp_objs = &bp->sp_objs[to];
52 	struct bnx2x_fp_stats *from_fp_stats = &bp->fp_stats[from];
53 	struct bnx2x_fp_stats *to_fp_stats = &bp->fp_stats[to];
54 	int old_max_eth_txqs, new_max_eth_txqs;
55 	int old_txdata_index = 0, new_txdata_index = 0;
56 	struct bnx2x_agg_info *old_tpa_info = to_fp->tpa_info;
57 
58 	/* Copy the NAPI object as it has already been initialized */
59 	from_fp->napi = to_fp->napi;
60 
61 	/* Move bnx2x_fastpath contents */
62 	memcpy(to_fp, from_fp, sizeof(*to_fp));
63 	to_fp->index = to;
64 
65 	/* Retain the tpa_info of the original `to' version as we don't want
66 	 * 2 FPs to contain the same tpa_info pointer.
67 	 */
68 	to_fp->tpa_info = old_tpa_info;
69 
70 	/* move sp_objs contents as well, as their indices match fp ones */
71 	memcpy(to_sp_objs, from_sp_objs, sizeof(*to_sp_objs));
72 
73 	/* move fp_stats contents as well, as their indices match fp ones */
74 	memcpy(to_fp_stats, from_fp_stats, sizeof(*to_fp_stats));
75 
76 	/* Update txdata pointers in fp and move txdata content accordingly:
77 	 * Each fp consumes 'max_cos' txdata structures, so the index should be
78 	 * decremented by max_cos x delta.
79 	 */
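	/* A purely illustrative example (assuming 'from' is the FCoE index,
	 * i.e. from == BNX2X_NUM_ETH_QUEUES(bp)): moving the FCoE fastpath
	 * from slot 8 to slot 6 with max_cos = 3 gives
	 * old_txdata_index = 8 * 3 + FCOE_TXQ_IDX_OFFSET and
	 * new_txdata_index = 6 * 3 + FCOE_TXQ_IDX_OFFSET, i.e. the entry
	 * moves down by max_cos * delta = 6 slots as described above.
	 */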
80 
81 	old_max_eth_txqs = BNX2X_NUM_ETH_QUEUES(bp) * (bp)->max_cos;
82 	new_max_eth_txqs = (BNX2X_NUM_ETH_QUEUES(bp) - from + to) *
83 				(bp)->max_cos;
84 	if (from == FCOE_IDX(bp)) {
85 		old_txdata_index = old_max_eth_txqs + FCOE_TXQ_IDX_OFFSET;
86 		new_txdata_index = new_max_eth_txqs + FCOE_TXQ_IDX_OFFSET;
87 	}
88 
89 	memcpy(&bp->bnx2x_txq[new_txdata_index],
90 	       &bp->bnx2x_txq[old_txdata_index],
91 	       sizeof(struct bnx2x_fp_txdata));
92 	to_fp->txdata_ptr[0] = &bp->bnx2x_txq[new_txdata_index];
93 }
94 
95 /**
96  * bnx2x_fill_fw_str - Fill buffer with FW version string.
97  *
98  * @bp:        driver handle
99  * @buf:       character buffer to fill with the fw name
100  * @buf_len:   length of the above buffer
101  *
102  */
103 void bnx2x_fill_fw_str(struct bnx2x *bp, char *buf, size_t buf_len)
104 {
105 	if (IS_PF(bp)) {
106 		u8 phy_fw_ver[PHY_FW_VER_LEN];
107 
108 		phy_fw_ver[0] = '\0';
109 		bnx2x_get_ext_phy_fw_version(&bp->link_params,
110 					     phy_fw_ver, PHY_FW_VER_LEN);
111 		strlcpy(buf, bp->fw_ver, buf_len);
112 		snprintf(buf + strlen(bp->fw_ver), buf_len - strlen(bp->fw_ver),
113 			 "bc %d.%d.%d%s%s",
114 			 (bp->common.bc_ver & 0xff0000) >> 16,
115 			 (bp->common.bc_ver & 0xff00) >> 8,
116 			 (bp->common.bc_ver & 0xff),
117 			 ((phy_fw_ver[0] != '\0') ? " phy " : ""), phy_fw_ver);
118 	} else {
119 		bnx2x_vf_fill_fw_str(bp, buf, buf_len);
120 	}
121 }
122 
123 /**
124  * bnx2x_shrink_eth_fp - guarantees fastpath structures stay intact
125  *
126  * @bp:	driver handle
127  * @delta:	number of eth queues which were not allocated
128  */
129 static void bnx2x_shrink_eth_fp(struct bnx2x *bp, int delta)
130 {
131 	int i, cos, old_eth_num = BNX2X_NUM_ETH_QUEUES(bp);
132 
133 	/* Queue pointer cannot be re-set on an fp basis, as moving the pointer
134 	 * backward along the array could cause memory to be overwritten
135 	 */
136 	for (cos = 1; cos < bp->max_cos; cos++) {
137 		for (i = 0; i < old_eth_num - delta; i++) {
138 			struct bnx2x_fastpath *fp = &bp->fp[i];
139 			int new_idx = cos * (old_eth_num - delta) + i;
140 
141 			memcpy(&bp->bnx2x_txq[new_idx], fp->txdata_ptr[cos],
142 			       sizeof(struct bnx2x_fp_txdata));
143 			fp->txdata_ptr[cos] = &bp->bnx2x_txq[new_idx];
144 		}
145 	}
146 }
147 
148 int load_count[2][3] = { {0} }; /* per-path: 0-common, 1-port0, 2-port1 */
149 
150 /* free skb in the packet ring at pos idx
151  * return idx of last bd freed
152  */
153 static u16 bnx2x_free_tx_pkt(struct bnx2x *bp, struct bnx2x_fp_txdata *txdata,
154 			     u16 idx, unsigned int *pkts_compl,
155 			     unsigned int *bytes_compl)
156 {
157 	struct sw_tx_bd *tx_buf = &txdata->tx_buf_ring[idx];
158 	struct eth_tx_start_bd *tx_start_bd;
159 	struct eth_tx_bd *tx_data_bd;
160 	struct sk_buff *skb = tx_buf->skb;
161 	u16 bd_idx = TX_BD(tx_buf->first_bd), new_cons;
162 	int nbd;
163 
164 	/* prefetch skb end pointer to speed up dev_kfree_skb() */
165 	prefetch(&skb->end);
166 
167 	DP(NETIF_MSG_TX_DONE, "fp[%d]: pkt_idx %d  buff @(%p)->skb %p\n",
168 	   txdata->txq_index, idx, tx_buf, skb);
169 
170 	/* unmap first bd */
171 	tx_start_bd = &txdata->tx_desc_ring[bd_idx].start_bd;
172 	dma_unmap_single(&bp->pdev->dev, BD_UNMAP_ADDR(tx_start_bd),
173 			 BD_UNMAP_LEN(tx_start_bd), DMA_TO_DEVICE);
174 
175 	nbd = le16_to_cpu(tx_start_bd->nbd) - 1;
176 #ifdef BNX2X_STOP_ON_ERROR
177 	if ((nbd - 1) > (MAX_SKB_FRAGS + 2)) {
178 		BNX2X_ERR("BAD nbd!\n");
179 		bnx2x_panic();
180 	}
181 #endif
182 	new_cons = nbd + tx_buf->first_bd;
183 
184 	/* Get the next bd */
185 	bd_idx = TX_BD(NEXT_TX_IDX(bd_idx));
186 
187 	/* Skip a parse bd... */
188 	--nbd;
189 	bd_idx = TX_BD(NEXT_TX_IDX(bd_idx));
190 
191 	/* ...and the TSO split header bd since they have no mapping */
192 	if (tx_buf->flags & BNX2X_TSO_SPLIT_BD) {
193 		--nbd;
194 		bd_idx = TX_BD(NEXT_TX_IDX(bd_idx));
195 	}
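	/* At this point nbd counts only the frag (data) BDs that still need
	 * to be unmapped in the loop below; the start BD was unmapped above,
	 * and the parse BD and the optional TSO split header BD carry no
	 * DMA mapping.
	 */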
196 
197 	/* now free frags */
198 	while (nbd > 0) {
199 
200 		tx_data_bd = &txdata->tx_desc_ring[bd_idx].reg_bd;
201 		dma_unmap_page(&bp->pdev->dev, BD_UNMAP_ADDR(tx_data_bd),
202 			       BD_UNMAP_LEN(tx_data_bd), DMA_TO_DEVICE);
203 		if (--nbd)
204 			bd_idx = TX_BD(NEXT_TX_IDX(bd_idx));
205 	}
206 
207 	/* release skb */
208 	WARN_ON(!skb);
209 	if (likely(skb)) {
210 		(*pkts_compl)++;
211 		(*bytes_compl) += skb->len;
212 	}
213 
214 	dev_kfree_skb_any(skb);
215 	tx_buf->first_bd = 0;
216 	tx_buf->skb = NULL;
217 
218 	return new_cons;
219 }
220 
221 int bnx2x_tx_int(struct bnx2x *bp, struct bnx2x_fp_txdata *txdata)
222 {
223 	struct netdev_queue *txq;
224 	u16 hw_cons, sw_cons, bd_cons = txdata->tx_bd_cons;
225 	unsigned int pkts_compl = 0, bytes_compl = 0;
226 
227 #ifdef BNX2X_STOP_ON_ERROR
228 	if (unlikely(bp->panic))
229 		return -1;
230 #endif
231 
232 	txq = netdev_get_tx_queue(bp->dev, txdata->txq_index);
233 	hw_cons = le16_to_cpu(*txdata->tx_cons_sb);
234 	sw_cons = txdata->tx_pkt_cons;
235 
236 	while (sw_cons != hw_cons) {
237 		u16 pkt_cons;
238 
239 		pkt_cons = TX_BD(sw_cons);
240 
241 		DP(NETIF_MSG_TX_DONE,
242 		   "queue[%d]: hw_cons %u  sw_cons %u  pkt_cons %u\n",
243 		   txdata->txq_index, hw_cons, sw_cons, pkt_cons);
244 
245 		bd_cons = bnx2x_free_tx_pkt(bp, txdata, pkt_cons,
246 					    &pkts_compl, &bytes_compl);
247 
248 		sw_cons++;
249 	}
250 
251 	netdev_tx_completed_queue(txq, pkts_compl, bytes_compl);
252 
253 	txdata->tx_pkt_cons = sw_cons;
254 	txdata->tx_bd_cons = bd_cons;
255 
256 	/* Need to make the tx_bd_cons update visible to start_xmit()
257 	 * before checking for netif_tx_queue_stopped().  Without the
258 	 * memory barrier, there is a small possibility that
259 	 * start_xmit() will miss it and cause the queue to be stopped
260 	 * forever.
261 	 * On the other hand we need an rmb() here to ensure the proper
262 	 * ordering of bit testing in the following
263 	 * netif_tx_queue_stopped(txq) call.
264 	 */
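	/* This barrier is assumed to pair with the smp_mb() taken on the
	 * bnx2x_start_xmit() side after the queue is stopped and before
	 * tx_bd_cons is re-checked there.
	 */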
265 	smp_mb();
266 
267 	if (unlikely(netif_tx_queue_stopped(txq))) {
268 		/* Taking tx_lock() is needed to prevent re-enabling the queue
269 		 * while it's empty. This could happen if rx_action() gets
270 		 * suspended in bnx2x_tx_int() after the condition before
271 		 * netif_tx_wake_queue(), while tx_action (bnx2x_start_xmit()):
272 		 *
273 		 * stops the queue->sees fresh tx_bd_cons->releases the queue->
274 		 * sends some packets consuming the whole queue again->
275 		 * stops the queue
276 		 */
277 
278 		__netif_tx_lock(txq, smp_processor_id());
279 
280 		if ((netif_tx_queue_stopped(txq)) &&
281 		    (bp->state == BNX2X_STATE_OPEN) &&
282 		    (bnx2x_tx_avail(bp, txdata) >= MAX_DESC_PER_TX_PKT))
283 			netif_tx_wake_queue(txq);
284 
285 		__netif_tx_unlock(txq);
286 	}
287 	return 0;
288 }
289 
290 static inline void bnx2x_update_last_max_sge(struct bnx2x_fastpath *fp,
291 					     u16 idx)
292 {
293 	u16 last_max = fp->last_max_sge;
294 
295 	if (SUB_S16(idx, last_max) > 0)
296 		fp->last_max_sge = idx;
297 }
298 
299 static inline void bnx2x_update_sge_prod(struct bnx2x_fastpath *fp,
300 					 u16 sge_len,
301 					 struct eth_end_agg_rx_cqe *cqe)
302 {
303 	struct bnx2x *bp = fp->bp;
304 	u16 last_max, last_elem, first_elem;
305 	u16 delta = 0;
306 	u16 i;
307 
308 	if (!sge_len)
309 		return;
310 
311 	/* First mark all used pages */
312 	for (i = 0; i < sge_len; i++)
313 		BIT_VEC64_CLEAR_BIT(fp->sge_mask,
314 			RX_SGE(le16_to_cpu(cqe->sgl_or_raw_data.sgl[i])));
315 
316 	DP(NETIF_MSG_RX_STATUS, "fp_cqe->sgl[%d] = %d\n",
317 	   sge_len - 1, le16_to_cpu(cqe->sgl_or_raw_data.sgl[sge_len - 1]));
318 
319 	/* Here we assume that the last SGE index is the biggest */
320 	prefetch((void *)(fp->sge_mask));
321 	bnx2x_update_last_max_sge(fp,
322 		le16_to_cpu(cqe->sgl_or_raw_data.sgl[sge_len - 1]));
323 
324 	last_max = RX_SGE(fp->last_max_sge);
325 	last_elem = last_max >> BIT_VEC64_ELEM_SHIFT;
326 	first_elem = RX_SGE(fp->rx_sge_prod) >> BIT_VEC64_ELEM_SHIFT;
327 
328 	/* If ring is not full */
329 	if (last_elem + 1 != first_elem)
330 		last_elem++;
331 
332 	/* Now update the prod */
333 	for (i = first_elem; i != last_elem; i = NEXT_SGE_MASK_ELEM(i)) {
334 		if (likely(fp->sge_mask[i]))
335 			break;
336 
337 		fp->sge_mask[i] = BIT_VEC64_ELEM_ONE_MASK;
338 		delta += BIT_VEC64_ELEM_SZ;
339 	}
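	/* In other words: delta counts how many whole 64-entry mask elements
	 * have been fully consumed (mask == 0). Those elements are re-armed
	 * to all ones and the SGE producer is advanced past them below; the
	 * walk stops at the first element that still has outstanding entries.
	 */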
340 
341 	if (delta > 0) {
342 		fp->rx_sge_prod += delta;
343 		/* clear page-end entries */
344 		bnx2x_clear_sge_mask_next_elems(fp);
345 	}
346 
347 	DP(NETIF_MSG_RX_STATUS,
348 	   "fp->last_max_sge = %d  fp->rx_sge_prod = %d\n",
349 	   fp->last_max_sge, fp->rx_sge_prod);
350 }
351 
352 /* Get Toeplitz hash value in the skb using the value from the
353  * CQE (calculated by HW).
354  */
355 static u32 bnx2x_get_rxhash(const struct bnx2x *bp,
356 			    const struct eth_fast_path_rx_cqe *cqe,
357 			    bool *l4_rxhash)
358 {
359 	/* Get Toeplitz hash from CQE */
360 	if ((bp->dev->features & NETIF_F_RXHASH) &&
361 	    (cqe->status_flags & ETH_FAST_PATH_RX_CQE_RSS_HASH_FLG)) {
362 		enum eth_rss_hash_type htype;
363 
364 		htype = cqe->status_flags & ETH_FAST_PATH_RX_CQE_RSS_HASH_TYPE;
365 		*l4_rxhash = (htype == TCP_IPV4_HASH_TYPE) ||
366 			     (htype == TCP_IPV6_HASH_TYPE);
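		/* Only the TCP hash types are flagged as L4 hashes; any other
		 * hash type is still reported to the stack, just without the
		 * l4_rxhash indication.
		 */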
367 		return le32_to_cpu(cqe->rss_hash_result);
368 	}
369 	*l4_rxhash = false;
370 	return 0;
371 }
372 
373 static void bnx2x_tpa_start(struct bnx2x_fastpath *fp, u16 queue,
374 			    u16 cons, u16 prod,
375 			    struct eth_fast_path_rx_cqe *cqe)
376 {
377 	struct bnx2x *bp = fp->bp;
378 	struct sw_rx_bd *cons_rx_buf = &fp->rx_buf_ring[cons];
379 	struct sw_rx_bd *prod_rx_buf = &fp->rx_buf_ring[prod];
380 	struct eth_rx_bd *prod_bd = &fp->rx_desc_ring[prod];
381 	dma_addr_t mapping;
382 	struct bnx2x_agg_info *tpa_info = &fp->tpa_info[queue];
383 	struct sw_rx_bd *first_buf = &tpa_info->first_buf;
384 
385 	/* print error if current state != stop */
386 	if (tpa_info->tpa_state != BNX2X_TPA_STOP)
387 		BNX2X_ERR("start of bin not in stop [%d]\n", queue);
388 
389 	/* Try to map an empty data buffer from the aggregation info  */
390 	mapping = dma_map_single(&bp->pdev->dev,
391 				 first_buf->data + NET_SKB_PAD,
392 				 fp->rx_buf_size, DMA_FROM_DEVICE);
393 	/*
394 	 *  ...if it fails - move the skb from the consumer to the producer
395 	 *  and set the current aggregation state as ERROR to drop it
396 	 *  when TPA_STOP arrives.
397 	 */
398 
399 	if (unlikely(dma_mapping_error(&bp->pdev->dev, mapping))) {
400 		/* Move the BD from the consumer to the producer */
401 		bnx2x_reuse_rx_data(fp, cons, prod);
402 		tpa_info->tpa_state = BNX2X_TPA_ERROR;
403 		return;
404 	}
405 
406 	/* move empty data from pool to prod */
407 	prod_rx_buf->data = first_buf->data;
408 	dma_unmap_addr_set(prod_rx_buf, mapping, mapping);
409 	/* point prod_bd to new data */
410 	prod_bd->addr_hi = cpu_to_le32(U64_HI(mapping));
411 	prod_bd->addr_lo = cpu_to_le32(U64_LO(mapping));
412 
413 	/* move partial skb from cons to pool (don't unmap yet) */
414 	*first_buf = *cons_rx_buf;
415 
416 	/* mark bin state as START */
417 	tpa_info->parsing_flags =
418 		le16_to_cpu(cqe->pars_flags.flags);
419 	tpa_info->vlan_tag = le16_to_cpu(cqe->vlan_tag);
420 	tpa_info->tpa_state = BNX2X_TPA_START;
421 	tpa_info->len_on_bd = le16_to_cpu(cqe->len_on_bd);
422 	tpa_info->placement_offset = cqe->placement_offset;
423 	tpa_info->rxhash = bnx2x_get_rxhash(bp, cqe, &tpa_info->l4_rxhash);
424 	if (fp->mode == TPA_MODE_GRO) {
425 		u16 gro_size = le16_to_cpu(cqe->pkt_len_or_gro_seg_len);
426 		tpa_info->full_page = SGE_PAGES / gro_size * gro_size;
427 		tpa_info->gro_size = gro_size;
428 	}
429 
430 #ifdef BNX2X_STOP_ON_ERROR
431 	fp->tpa_queue_used |= (1 << queue);
432 #ifdef _ASM_GENERIC_INT_L64_H
433 	DP(NETIF_MSG_RX_STATUS, "fp->tpa_queue_used = 0x%lx\n",
434 #else
435 	DP(NETIF_MSG_RX_STATUS, "fp->tpa_queue_used = 0x%llx\n",
436 #endif
437 	   fp->tpa_queue_used);
438 #endif
439 }
440 
441 /* Timestamp option length allowed for TPA aggregation:
442  *
443  *		nop nop kind length echo val
444  */
445 #define TPA_TSTAMP_OPT_LEN	12
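/* A sketch of where the 12 bytes come from: 2 x NOP (1 byte each) for
 * alignment, kind (1) + length (1) and the two 4-byte timestamp values
 * (TSval/TSecr): 2 + 1 + 1 + 4 + 4 = 12.
 */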
446 /**
447  * bnx2x_set_gro_params - compute GRO values
448  *
449  * @skb:		packet skb
450  * @parsing_flags:	parsing flags from the START CQE
451  * @len_on_bd:		total length of the first packet for the
452  *			aggregation.
453  * @pkt_len:		length of all segments
454  * @num_of_coalesced_segs: number of segments coalesced by the FW
455  *
456  * Approximates the MSS for this aggregation using the first packet of it,
457  * and computes the number of aggregated segments and the gso_type.
458  */
459 static void bnx2x_set_gro_params(struct sk_buff *skb, u16 parsing_flags,
460 				 u16 len_on_bd, unsigned int pkt_len,
461 				 u16 num_of_coalesced_segs)
462 {
463 	/* TPA aggregation won't have either IP options or TCP options
464 	 * other than timestamp or IPv6 extension headers.
465 	 */
466 	u16 hdrs_len = ETH_HLEN + sizeof(struct tcphdr);
467 
468 	if (GET_FLAG(parsing_flags, PARSING_FLAGS_OVER_ETHERNET_PROTOCOL) ==
469 	    PRS_FLAG_OVERETH_IPV6) {
470 		hdrs_len += sizeof(struct ipv6hdr);
471 		skb_shinfo(skb)->gso_type = SKB_GSO_TCPV6;
472 	} else {
473 		hdrs_len += sizeof(struct iphdr);
474 		skb_shinfo(skb)->gso_type = SKB_GSO_TCPV4;
475 	}
476 
477 	/* Check if there was a TCP timestamp; if there is, it will
478 	 * always be 12 bytes long: nop nop kind length echo val.
479 	 *
480 	 * Otherwise FW would close the aggregation.
481 	 */
482 	if (parsing_flags & PARSING_FLAGS_TIME_STAMP_EXIST_FLAG)
483 		hdrs_len += TPA_TSTAMP_OPT_LEN;
484 
485 	skb_shinfo(skb)->gso_size = len_on_bd - hdrs_len;
486 
487 	/* tcp_gro_complete() will copy NAPI_GRO_CB(skb)->count
488 	 * to skb_shinfo(skb)->gso_segs
489 	 */
490 	NAPI_GRO_CB(skb)->count = num_of_coalesced_segs;
491 }
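/* A rough example of the arithmetic above (illustrative numbers only): an
 * IPv4 aggregation carrying a TCP timestamp gives
 * hdrs_len = 14 (ETH) + 20 (IP) + 20 (TCP) + 12 (timestamp) = 66, so a
 * len_on_bd of 1514 results in gso_size = 1448.
 */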
492 
493 static int bnx2x_alloc_rx_sge(struct bnx2x *bp, struct bnx2x_fastpath *fp,
494 			      u16 index, gfp_t gfp_mask)
495 {
496 	struct page *page = alloc_pages(gfp_mask, PAGES_PER_SGE_SHIFT);
497 	struct sw_rx_page *sw_buf = &fp->rx_page_ring[index];
498 	struct eth_rx_sge *sge = &fp->rx_sge_ring[index];
499 	dma_addr_t mapping;
500 
501 	if (unlikely(page == NULL)) {
502 		BNX2X_ERR("Can't alloc sge\n");
503 		return -ENOMEM;
504 	}
505 
506 	mapping = dma_map_page(&bp->pdev->dev, page, 0,
507 			       SGE_PAGES, DMA_FROM_DEVICE);
508 	if (unlikely(dma_mapping_error(&bp->pdev->dev, mapping))) {
509 		__free_pages(page, PAGES_PER_SGE_SHIFT);
510 		BNX2X_ERR("Can't map sge\n");
511 		return -ENOMEM;
512 	}
513 
514 	sw_buf->page = page;
515 	dma_unmap_addr_set(sw_buf, mapping, mapping);
516 
517 	sge->addr_hi = cpu_to_le32(U64_HI(mapping));
518 	sge->addr_lo = cpu_to_le32(U64_LO(mapping));
519 
520 	return 0;
521 }
522 
523 static int bnx2x_fill_frag_skb(struct bnx2x *bp, struct bnx2x_fastpath *fp,
524 			       struct bnx2x_agg_info *tpa_info,
525 			       u16 pages,
526 			       struct sk_buff *skb,
527 			       struct eth_end_agg_rx_cqe *cqe,
528 			       u16 cqe_idx)
529 {
530 	struct sw_rx_page *rx_pg, old_rx_pg;
531 	u32 i, frag_len, frag_size;
532 	int err, j, frag_id = 0;
533 	u16 len_on_bd = tpa_info->len_on_bd;
534 	u16 full_page = 0, gro_size = 0;
535 
536 	frag_size = le16_to_cpu(cqe->pkt_len) - len_on_bd;
537 
538 	if (fp->mode == TPA_MODE_GRO) {
539 		gro_size = tpa_info->gro_size;
540 		full_page = tpa_info->full_page;
541 	}
542 
543 	/* This is needed in order to enable forwarding support */
544 	if (frag_size)
545 		bnx2x_set_gro_params(skb, tpa_info->parsing_flags, len_on_bd,
546 				     le16_to_cpu(cqe->pkt_len),
547 				     le16_to_cpu(cqe->num_of_coalesced_segs));
548 
549 #ifdef BNX2X_STOP_ON_ERROR
550 	if (pages > min_t(u32, 8, MAX_SKB_FRAGS) * SGE_PAGES) {
551 		BNX2X_ERR("SGL length is too long: %d. CQE index is %d\n",
552 			  pages, cqe_idx);
553 		BNX2X_ERR("cqe->pkt_len = %d\n", cqe->pkt_len);
554 		bnx2x_panic();
555 		return -EINVAL;
556 	}
557 #endif
558 
559 	/* Run through the SGL and compose the fragmented skb */
560 	for (i = 0, j = 0; i < pages; i += PAGES_PER_SGE, j++) {
561 		u16 sge_idx = RX_SGE(le16_to_cpu(cqe->sgl_or_raw_data.sgl[j]));
562 
563 		/* FW gives the indices of the SGE as if the ring is an array
564 		   (meaning that "next" element will consume 2 indices) */
565 		if (fp->mode == TPA_MODE_GRO)
566 			frag_len = min_t(u32, frag_size, (u32)full_page);
567 		else /* LRO */
568 			frag_len = min_t(u32, frag_size, (u32)SGE_PAGES);
569 
570 		rx_pg = &fp->rx_page_ring[sge_idx];
571 		old_rx_pg = *rx_pg;
572 
573 		/* If we fail to allocate a substitute page, we simply stop
574 		   where we are and drop the whole packet */
575 		err = bnx2x_alloc_rx_sge(bp, fp, sge_idx, GFP_ATOMIC);
576 		if (unlikely(err)) {
577 			bnx2x_fp_qstats(bp, fp)->rx_skb_alloc_failed++;
578 			return err;
579 		}
580 
581 		/* Unmap the page as we're going to pass it to the stack */
582 		dma_unmap_page(&bp->pdev->dev,
583 			       dma_unmap_addr(&old_rx_pg, mapping),
584 			       SGE_PAGES, DMA_FROM_DEVICE);
585 		/* Add one frag and update the appropriate fields in the skb */
586 		if (fp->mode == TPA_MODE_LRO)
587 			skb_fill_page_desc(skb, j, old_rx_pg.page, 0, frag_len);
588 		else { /* GRO */
589 			int rem;
590 			int offset = 0;
591 			for (rem = frag_len; rem > 0; rem -= gro_size) {
592 				int len = rem > gro_size ? gro_size : rem;
593 				skb_fill_page_desc(skb, frag_id++,
594 						   old_rx_pg.page, offset, len);
595 				if (offset)
596 					get_page(old_rx_pg.page);
597 				offset += len;
598 			}
599 		}
600 
601 		skb->data_len += frag_len;
602 		skb->truesize += SGE_PAGES;
603 		skb->len += frag_len;
604 
605 		frag_size -= frag_len;
606 	}
607 
608 	return 0;
609 }
610 
611 static void bnx2x_frag_free(const struct bnx2x_fastpath *fp, void *data)
612 {
613 	if (fp->rx_frag_size)
614 		put_page(virt_to_head_page(data));
615 	else
616 		kfree(data);
617 }
618 
619 static void *bnx2x_frag_alloc(const struct bnx2x_fastpath *fp, gfp_t gfp_mask)
620 {
621 	if (fp->rx_frag_size) {
622 		/* GFP_KERNEL allocations are used only during initialization */
623 		if (unlikely(gfp_mask & __GFP_WAIT))
624 			return (void *)__get_free_page(gfp_mask);
625 
626 		return netdev_alloc_frag(fp->rx_frag_size);
627 	}
628 
629 	return kmalloc(fp->rx_buf_size + NET_SKB_PAD, gfp_mask);
630 }
631 
632 #ifdef CONFIG_INET
633 static void bnx2x_gro_ip_csum(struct bnx2x *bp, struct sk_buff *skb)
634 {
635 	const struct iphdr *iph = ip_hdr(skb);
636 	struct tcphdr *th;
637 
638 	skb_set_transport_header(skb, sizeof(struct iphdr));
639 	th = tcp_hdr(skb);
640 
641 	th->check = ~tcp_v4_check(skb->len - skb_transport_offset(skb),
642 				  iph->saddr, iph->daddr, 0);
643 }
644 
645 static void bnx2x_gro_ipv6_csum(struct bnx2x *bp, struct sk_buff *skb)
646 {
647 	struct ipv6hdr *iph = ipv6_hdr(skb);
648 	struct tcphdr *th;
649 
650 	skb_set_transport_header(skb, sizeof(struct ipv6hdr));
651 	th = tcp_hdr(skb);
652 
653 	th->check = ~tcp_v6_check(skb->len - skb_transport_offset(skb),
654 				  &iph->saddr, &iph->daddr, 0);
655 }
656 
657 static void bnx2x_gro_csum(struct bnx2x *bp, struct sk_buff *skb,
658 			    void (*gro_func)(struct bnx2x*, struct sk_buff*))
659 {
660 	skb_set_network_header(skb, 0);
661 	gro_func(bp, skb);
662 	tcp_gro_complete(skb);
663 }
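/* The two helpers above seed th->check with the pseudo-header checksum of
 * the aggregated packet; our reading is that tcp_gro_complete() (which sets
 * CHECKSUM_PARTIAL) and any later GSO resegmentation expect the checksum
 * field in exactly that state.
 */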
664 #endif
665 
666 static void bnx2x_gro_receive(struct bnx2x *bp, struct bnx2x_fastpath *fp,
667 			       struct sk_buff *skb)
668 {
669 #ifdef CONFIG_INET
670 	if (skb_shinfo(skb)->gso_size) {
671 		switch (be16_to_cpu(skb->protocol)) {
672 		case ETH_P_IP:
673 			bnx2x_gro_csum(bp, skb, bnx2x_gro_ip_csum);
674 			break;
675 		case ETH_P_IPV6:
676 			bnx2x_gro_csum(bp, skb, bnx2x_gro_ipv6_csum);
677 			break;
678 		default:
679 			BNX2X_ERR("Error: FW GRO supports only IPv4/IPv6, not 0x%04x\n",
680 				  be16_to_cpu(skb->protocol));
681 		}
682 	}
683 #endif
684 	skb_record_rx_queue(skb, fp->rx_queue);
685 	napi_gro_receive(&fp->napi, skb);
686 }
687 
688 static void bnx2x_tpa_stop(struct bnx2x *bp, struct bnx2x_fastpath *fp,
689 			   struct bnx2x_agg_info *tpa_info,
690 			   u16 pages,
691 			   struct eth_end_agg_rx_cqe *cqe,
692 			   u16 cqe_idx)
693 {
694 	struct sw_rx_bd *rx_buf = &tpa_info->first_buf;
695 	u8 pad = tpa_info->placement_offset;
696 	u16 len = tpa_info->len_on_bd;
697 	struct sk_buff *skb = NULL;
698 	u8 *new_data, *data = rx_buf->data;
699 	u8 old_tpa_state = tpa_info->tpa_state;
700 
701 	tpa_info->tpa_state = BNX2X_TPA_STOP;
702 
703 	/* If there was an error during the handling of the TPA_START -
704 	 * drop this aggregation.
705 	 */
706 	if (old_tpa_state == BNX2X_TPA_ERROR)
707 		goto drop;
708 
709 	/* Try to allocate the new data */
710 	new_data = bnx2x_frag_alloc(fp, GFP_ATOMIC);
711 	/* Unmap the data buffer in the pool anyway, as we are going to change
712 	   the pool entry status to BNX2X_TPA_STOP even if the new allocation
713 	   fails. */
714 	dma_unmap_single(&bp->pdev->dev, dma_unmap_addr(rx_buf, mapping),
715 			 fp->rx_buf_size, DMA_FROM_DEVICE);
716 	if (likely(new_data))
717 		skb = build_skb(data, fp->rx_frag_size);
718 
719 	if (likely(skb)) {
720 #ifdef BNX2X_STOP_ON_ERROR
721 		if (pad + len > fp->rx_buf_size) {
722 			BNX2X_ERR("skb_put is about to fail...  pad %d  len %d  rx_buf_size %d\n",
723 				  pad, len, fp->rx_buf_size);
724 			bnx2x_panic();
725 			return;
726 		}
727 #endif
728 
729 		skb_reserve(skb, pad + NET_SKB_PAD);
730 		skb_put(skb, len);
731 		skb->rxhash = tpa_info->rxhash;
732 		skb->l4_rxhash = tpa_info->l4_rxhash;
733 
734 		skb->protocol = eth_type_trans(skb, bp->dev);
735 		skb->ip_summed = CHECKSUM_UNNECESSARY;
736 
737 		if (!bnx2x_fill_frag_skb(bp, fp, tpa_info, pages,
738 					 skb, cqe, cqe_idx)) {
739 			if (tpa_info->parsing_flags & PARSING_FLAGS_VLAN)
740 				__vlan_hwaccel_put_tag(skb, htons(ETH_P_8021Q), tpa_info->vlan_tag);
741 			bnx2x_gro_receive(bp, fp, skb);
742 		} else {
743 			DP(NETIF_MSG_RX_STATUS,
744 			   "Failed to allocate new pages - dropping packet!\n");
745 			dev_kfree_skb_any(skb);
746 		}
747 
748 		/* put new data in bin */
749 		rx_buf->data = new_data;
750 
751 		return;
752 	}
753 	bnx2x_frag_free(fp, new_data);
754 drop:
755 	/* drop the packet and keep the buffer in the bin */
756 	DP(NETIF_MSG_RX_STATUS,
757 	   "Failed to allocate or map a new skb - dropping packet!\n");
758 	bnx2x_fp_stats(bp, fp)->eth_q_stats.rx_skb_alloc_failed++;
759 }
760 
761 static int bnx2x_alloc_rx_data(struct bnx2x *bp, struct bnx2x_fastpath *fp,
762 			       u16 index, gfp_t gfp_mask)
763 {
764 	u8 *data;
765 	struct sw_rx_bd *rx_buf = &fp->rx_buf_ring[index];
766 	struct eth_rx_bd *rx_bd = &fp->rx_desc_ring[index];
767 	dma_addr_t mapping;
768 
769 	data = bnx2x_frag_alloc(fp, gfp_mask);
770 	if (unlikely(data == NULL))
771 		return -ENOMEM;
772 
773 	mapping = dma_map_single(&bp->pdev->dev, data + NET_SKB_PAD,
774 				 fp->rx_buf_size,
775 				 DMA_FROM_DEVICE);
776 	if (unlikely(dma_mapping_error(&bp->pdev->dev, mapping))) {
777 		bnx2x_frag_free(fp, data);
778 		BNX2X_ERR("Can't map rx data\n");
779 		return -ENOMEM;
780 	}
781 
782 	rx_buf->data = data;
783 	dma_unmap_addr_set(rx_buf, mapping, mapping);
784 
785 	rx_bd->addr_hi = cpu_to_le32(U64_HI(mapping));
786 	rx_bd->addr_lo = cpu_to_le32(U64_LO(mapping));
787 
788 	return 0;
789 }
790 
791 static
792 void bnx2x_csum_validate(struct sk_buff *skb, union eth_rx_cqe *cqe,
793 				 struct bnx2x_fastpath *fp,
794 				 struct bnx2x_eth_q_stats *qstats)
795 {
796 	/* Do nothing if no L4 csum validation was done.
797 	 * We do not check whether IP csum was validated. For IPv4 we assume
798 	 * that if the card got as far as validating the L4 csum, it also
799 	 * validated the IP csum. IPv6 has no IP csum.
800 	 */
801 	if (cqe->fast_path_cqe.status_flags &
802 	    ETH_FAST_PATH_RX_CQE_L4_XSUM_NO_VALIDATION_FLG)
803 		return;
804 
805 	/* If L4 validation was done, check if an error was found. */
806 
807 	if (cqe->fast_path_cqe.type_error_flags &
808 	    (ETH_FAST_PATH_RX_CQE_IP_BAD_XSUM_FLG |
809 	     ETH_FAST_PATH_RX_CQE_L4_BAD_XSUM_FLG))
810 		qstats->hw_csum_err++;
811 	else
812 		skb->ip_summed = CHECKSUM_UNNECESSARY;
813 }
814 
815 int bnx2x_rx_int(struct bnx2x_fastpath *fp, int budget)
816 {
817 	struct bnx2x *bp = fp->bp;
818 	u16 bd_cons, bd_prod, bd_prod_fw, comp_ring_cons;
819 	u16 sw_comp_cons, sw_comp_prod;
820 	int rx_pkt = 0;
821 	union eth_rx_cqe *cqe;
822 	struct eth_fast_path_rx_cqe *cqe_fp;
823 
824 #ifdef BNX2X_STOP_ON_ERROR
825 	if (unlikely(bp->panic))
826 		return 0;
827 #endif
828 
829 	bd_cons = fp->rx_bd_cons;
830 	bd_prod = fp->rx_bd_prod;
831 	bd_prod_fw = bd_prod;
832 	sw_comp_cons = fp->rx_comp_cons;
833 	sw_comp_prod = fp->rx_comp_prod;
834 
835 	comp_ring_cons = RCQ_BD(sw_comp_cons);
836 	cqe = &fp->rx_comp_ring[comp_ring_cons];
837 	cqe_fp = &cqe->fast_path_cqe;
838 
839 	DP(NETIF_MSG_RX_STATUS,
840 	   "queue[%d]: sw_comp_cons %u\n", fp->index, sw_comp_cons);
841 
842 	while (BNX2X_IS_CQE_COMPLETED(cqe_fp)) {
843 		struct sw_rx_bd *rx_buf = NULL;
844 		struct sk_buff *skb;
845 		u8 cqe_fp_flags;
846 		enum eth_rx_cqe_type cqe_fp_type;
847 		u16 len, pad, queue;
848 		u8 *data;
849 		bool l4_rxhash;
850 
851 #ifdef BNX2X_STOP_ON_ERROR
852 		if (unlikely(bp->panic))
853 			return 0;
854 #endif
855 
856 		bd_prod = RX_BD(bd_prod);
857 		bd_cons = RX_BD(bd_cons);
858 
859 		cqe_fp_flags = cqe_fp->type_error_flags;
860 		cqe_fp_type = cqe_fp_flags & ETH_FAST_PATH_RX_CQE_TYPE;
861 
862 		DP(NETIF_MSG_RX_STATUS,
863 		   "CQE type %x  err %x  status %x  queue %x  vlan %x  len %u\n",
864 		   CQE_TYPE(cqe_fp_flags),
865 		   cqe_fp_flags, cqe_fp->status_flags,
866 		   le32_to_cpu(cqe_fp->rss_hash_result),
867 		   le16_to_cpu(cqe_fp->vlan_tag),
868 		   le16_to_cpu(cqe_fp->pkt_len_or_gro_seg_len));
869 
870 		/* is this a slowpath msg? */
871 		if (unlikely(CQE_TYPE_SLOW(cqe_fp_type))) {
872 			bnx2x_sp_event(fp, cqe);
873 			goto next_cqe;
874 		}
875 
876 		rx_buf = &fp->rx_buf_ring[bd_cons];
877 		data = rx_buf->data;
878 
879 		if (!CQE_TYPE_FAST(cqe_fp_type)) {
880 			struct bnx2x_agg_info *tpa_info;
881 			u16 frag_size, pages;
882 #ifdef BNX2X_STOP_ON_ERROR
883 			/* sanity check */
884 			if (fp->disable_tpa &&
885 			    (CQE_TYPE_START(cqe_fp_type) ||
886 			     CQE_TYPE_STOP(cqe_fp_type)))
887 				BNX2X_ERR("START/STOP packet while disable_tpa type %x\n",
888 					  CQE_TYPE(cqe_fp_type));
889 #endif
890 
891 			if (CQE_TYPE_START(cqe_fp_type)) {
892 				u16 queue = cqe_fp->queue_index;
893 				DP(NETIF_MSG_RX_STATUS,
894 				   "calling tpa_start on queue %d\n",
895 				   queue);
896 
897 				bnx2x_tpa_start(fp, queue,
898 						bd_cons, bd_prod,
899 						cqe_fp);
900 
901 				goto next_rx;
902 			}
903 			queue = cqe->end_agg_cqe.queue_index;
904 			tpa_info = &fp->tpa_info[queue];
905 			DP(NETIF_MSG_RX_STATUS,
906 			   "calling tpa_stop on queue %d\n",
907 			   queue);
908 
909 			frag_size = le16_to_cpu(cqe->end_agg_cqe.pkt_len) -
910 				    tpa_info->len_on_bd;
911 
912 			if (fp->mode == TPA_MODE_GRO)
913 				pages = (frag_size + tpa_info->full_page - 1) /
914 					 tpa_info->full_page;
915 			else
916 				pages = SGE_PAGE_ALIGN(frag_size) >>
917 					SGE_PAGE_SHIFT;
918 
919 			bnx2x_tpa_stop(bp, fp, tpa_info, pages,
920 				       &cqe->end_agg_cqe, comp_ring_cons);
921 #ifdef BNX2X_STOP_ON_ERROR
922 			if (bp->panic)
923 				return 0;
924 #endif
925 
926 			bnx2x_update_sge_prod(fp, pages, &cqe->end_agg_cqe);
927 			goto next_cqe;
928 		}
929 		/* non TPA */
930 		len = le16_to_cpu(cqe_fp->pkt_len_or_gro_seg_len);
931 		pad = cqe_fp->placement_offset;
932 		dma_sync_single_for_cpu(&bp->pdev->dev,
933 					dma_unmap_addr(rx_buf, mapping),
934 					pad + RX_COPY_THRESH,
935 					DMA_FROM_DEVICE);
936 		pad += NET_SKB_PAD;
937 		prefetch(data + pad); /* speedup eth_type_trans() */
938 		/* is this an error packet? */
939 		if (unlikely(cqe_fp_flags & ETH_RX_ERROR_FALGS)) {
940 			DP(NETIF_MSG_RX_ERR | NETIF_MSG_RX_STATUS,
941 			   "ERROR  flags %x  rx packet %u\n",
942 			   cqe_fp_flags, sw_comp_cons);
943 			bnx2x_fp_qstats(bp, fp)->rx_err_discard_pkt++;
944 			goto reuse_rx;
945 		}
946 
947 		/* Since we don't have a jumbo ring,
948 		 * copy small packets if mtu > 1500
949 		 */
950 		if ((bp->dev->mtu > ETH_MAX_PACKET_SIZE) &&
951 		    (len <= RX_COPY_THRESH)) {
952 			skb = netdev_alloc_skb_ip_align(bp->dev, len);
953 			if (skb == NULL) {
954 				DP(NETIF_MSG_RX_ERR | NETIF_MSG_RX_STATUS,
955 				   "ERROR  packet dropped because of alloc failure\n");
956 				bnx2x_fp_qstats(bp, fp)->rx_skb_alloc_failed++;
957 				goto reuse_rx;
958 			}
959 			memcpy(skb->data, data + pad, len);
960 			bnx2x_reuse_rx_data(fp, bd_cons, bd_prod);
961 		} else {
962 			if (likely(bnx2x_alloc_rx_data(bp, fp, bd_prod,
963 						       GFP_ATOMIC) == 0)) {
964 				dma_unmap_single(&bp->pdev->dev,
965 						 dma_unmap_addr(rx_buf, mapping),
966 						 fp->rx_buf_size,
967 						 DMA_FROM_DEVICE);
968 				skb = build_skb(data, fp->rx_frag_size);
969 				if (unlikely(!skb)) {
970 					bnx2x_frag_free(fp, data);
971 					bnx2x_fp_qstats(bp, fp)->
972 							rx_skb_alloc_failed++;
973 					goto next_rx;
974 				}
975 				skb_reserve(skb, pad);
976 			} else {
977 				DP(NETIF_MSG_RX_ERR | NETIF_MSG_RX_STATUS,
978 				   "ERROR  packet dropped because of alloc failure\n");
979 				bnx2x_fp_qstats(bp, fp)->rx_skb_alloc_failed++;
980 reuse_rx:
981 				bnx2x_reuse_rx_data(fp, bd_cons, bd_prod);
982 				goto next_rx;
983 			}
984 		}
985 
986 		skb_put(skb, len);
987 		skb->protocol = eth_type_trans(skb, bp->dev);
988 
989 		/* Set Toeplitz hash for a non-LRO skb */
990 		skb->rxhash = bnx2x_get_rxhash(bp, cqe_fp, &l4_rxhash);
991 		skb->l4_rxhash = l4_rxhash;
992 
993 		skb_checksum_none_assert(skb);
994 
995 		if (bp->dev->features & NETIF_F_RXCSUM)
996 			bnx2x_csum_validate(skb, cqe, fp,
997 					    bnx2x_fp_qstats(bp, fp));
998 
999 		skb_record_rx_queue(skb, fp->rx_queue);
1000 
1001 		if (le16_to_cpu(cqe_fp->pars_flags.flags) &
1002 		    PARSING_FLAGS_VLAN)
1003 			__vlan_hwaccel_put_tag(skb, htons(ETH_P_8021Q),
1004 					       le16_to_cpu(cqe_fp->vlan_tag));
1005 
1006 		skb_mark_napi_id(skb, &fp->napi);
1007 
1008 		if (bnx2x_fp_ll_polling(fp))
1009 			netif_receive_skb(skb);
1010 		else
1011 			napi_gro_receive(&fp->napi, skb);
1012 next_rx:
1013 		rx_buf->data = NULL;
1014 
1015 		bd_cons = NEXT_RX_IDX(bd_cons);
1016 		bd_prod = NEXT_RX_IDX(bd_prod);
1017 		bd_prod_fw = NEXT_RX_IDX(bd_prod_fw);
1018 		rx_pkt++;
1019 next_cqe:
1020 		sw_comp_prod = NEXT_RCQ_IDX(sw_comp_prod);
1021 		sw_comp_cons = NEXT_RCQ_IDX(sw_comp_cons);
1022 
1023 		/* mark CQE as free */
1024 		BNX2X_SEED_CQE(cqe_fp);
1025 
1026 		if (rx_pkt == budget)
1027 			break;
1028 
1029 		comp_ring_cons = RCQ_BD(sw_comp_cons);
1030 		cqe = &fp->rx_comp_ring[comp_ring_cons];
1031 		cqe_fp = &cqe->fast_path_cqe;
1032 	} /* while */
1033 
1034 	fp->rx_bd_cons = bd_cons;
1035 	fp->rx_bd_prod = bd_prod_fw;
1036 	fp->rx_comp_cons = sw_comp_cons;
1037 	fp->rx_comp_prod = sw_comp_prod;
1038 
1039 	/* Update producers */
1040 	bnx2x_update_rx_prod(bp, fp, bd_prod_fw, sw_comp_prod,
1041 			     fp->rx_sge_prod);
1042 
1043 	fp->rx_pkt += rx_pkt;
1044 	fp->rx_calls++;
1045 
1046 	return rx_pkt;
1047 }
1048 
1049 static irqreturn_t bnx2x_msix_fp_int(int irq, void *fp_cookie)
1050 {
1051 	struct bnx2x_fastpath *fp = fp_cookie;
1052 	struct bnx2x *bp = fp->bp;
1053 	u8 cos;
1054 
1055 	DP(NETIF_MSG_INTR,
1056 	   "got an MSI-X interrupt on IDX:SB [fp %d fw_sd %d igusb %d]\n",
1057 	   fp->index, fp->fw_sb_id, fp->igu_sb_id);
1058 
1059 	bnx2x_ack_sb(bp, fp->igu_sb_id, USTORM_ID, 0, IGU_INT_DISABLE, 0);
1060 
1061 #ifdef BNX2X_STOP_ON_ERROR
1062 	if (unlikely(bp->panic))
1063 		return IRQ_HANDLED;
1064 #endif
1065 
1066 	/* Handle Rx and Tx according to MSI-X vector */
1067 	for_each_cos_in_tx_queue(fp, cos)
1068 		prefetch(fp->txdata_ptr[cos]->tx_cons_sb);
1069 
1070 	prefetch(&fp->sb_running_index[SM_RX_ID]);
1071 	napi_schedule(&bnx2x_fp(bp, fp->index, napi));
1072 
1073 	return IRQ_HANDLED;
1074 }
1075 
1076 /* HW Lock for shared dual port PHYs */
1077 void bnx2x_acquire_phy_lock(struct bnx2x *bp)
1078 {
1079 	mutex_lock(&bp->port.phy_mutex);
1080 
1081 	bnx2x_acquire_hw_lock(bp, HW_LOCK_RESOURCE_MDIO);
1082 }
1083 
1084 void bnx2x_release_phy_lock(struct bnx2x *bp)
1085 {
1086 	bnx2x_release_hw_lock(bp, HW_LOCK_RESOURCE_MDIO);
1087 
1088 	mutex_unlock(&bp->port.phy_mutex);
1089 }
1090 
1091 /* Calculates the MF speed according to the current line speed and MF configuration */
1092 u16 bnx2x_get_mf_speed(struct bnx2x *bp)
1093 {
1094 	u16 line_speed = bp->link_vars.line_speed;
1095 	if (IS_MF(bp)) {
1096 		u16 maxCfg = bnx2x_extract_max_cfg(bp,
1097 						   bp->mf_config[BP_VN(bp)]);
1098 
1099 		/* Calculate the current MAX line speed limit for the MF
1100 		 * devices
1101 		 */
1102 		if (IS_MF_SI(bp))
1103 			line_speed = (line_speed * maxCfg) / 100;
1104 		else { /* SD mode */
1105 			u16 vn_max_rate = maxCfg * 100;
1106 
1107 			if (vn_max_rate < line_speed)
1108 				line_speed = vn_max_rate;
1109 		}
1110 	}
1111 
1112 	return line_speed;
1113 }
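/* Illustrative numbers only: with a 10000 Mbps physical link and
 * maxCfg = 50, SI mode reports 10000 * 50 / 100 = 5000 Mbps, while SD mode
 * caps the speed at vn_max_rate = 50 * 100 = 5000 Mbps as well.
 */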
1114 
1115 /**
1116  * bnx2x_fill_report_data - fill link report data to report
1117  *
1118  * @bp:		driver handle
1119  * @data:	link state to update
1120  *
1121  * It uses non-atomic bit operations because it is called under the mutex.
1122  */
1123 static void bnx2x_fill_report_data(struct bnx2x *bp,
1124 				   struct bnx2x_link_report_data *data)
1125 {
1126 	u16 line_speed = bnx2x_get_mf_speed(bp);
1127 
1128 	memset(data, 0, sizeof(*data));
1129 
1130 	/* Fill the report data: effective line speed */
1131 	data->line_speed = line_speed;
1132 
1133 	/* Link is down */
1134 	if (!bp->link_vars.link_up || (bp->flags & MF_FUNC_DIS))
1135 		__set_bit(BNX2X_LINK_REPORT_LINK_DOWN,
1136 			  &data->link_report_flags);
1137 
1138 	/* Full DUPLEX */
1139 	if (bp->link_vars.duplex == DUPLEX_FULL)
1140 		__set_bit(BNX2X_LINK_REPORT_FD, &data->link_report_flags);
1141 
1142 	/* Rx Flow Control is ON */
1143 	if (bp->link_vars.flow_ctrl & BNX2X_FLOW_CTRL_RX)
1144 		__set_bit(BNX2X_LINK_REPORT_RX_FC_ON, &data->link_report_flags);
1145 
1146 	/* Tx Flow Control is ON */
1147 	if (bp->link_vars.flow_ctrl & BNX2X_FLOW_CTRL_TX)
1148 		__set_bit(BNX2X_LINK_REPORT_TX_FC_ON, &data->link_report_flags);
1149 }
1150 
1151 /**
1152  * bnx2x_link_report - report link status to OS.
1153  *
1154  * @bp:		driver handle
1155  *
1156  * Calls the __bnx2x_link_report() under the same locking scheme
1157  * as a link/PHY state managing code to ensure a consistent link
1158  * reporting.
1159  */
1160 
1161 void bnx2x_link_report(struct bnx2x *bp)
1162 {
1163 	bnx2x_acquire_phy_lock(bp);
1164 	__bnx2x_link_report(bp);
1165 	bnx2x_release_phy_lock(bp);
1166 }
1167 
1168 /**
1169  * __bnx2x_link_report - report link status to OS.
1170  *
1171  * @bp:		driver handle
1172  *
1173  * Non-atomic implementation.
1174  * Should be called under the phy_lock.
1175  */
1176 void __bnx2x_link_report(struct bnx2x *bp)
1177 {
1178 	struct bnx2x_link_report_data cur_data;
1179 
1180 	/* reread mf_cfg */
1181 	if (IS_PF(bp) && !CHIP_IS_E1(bp))
1182 		bnx2x_read_mf_cfg(bp);
1183 
1184 	/* Read the current link report info */
1185 	bnx2x_fill_report_data(bp, &cur_data);
1186 
1187 	/* Don't report link down or exactly the same link status twice */
1188 	if (!memcmp(&cur_data, &bp->last_reported_link, sizeof(cur_data)) ||
1189 	    (test_bit(BNX2X_LINK_REPORT_LINK_DOWN,
1190 		      &bp->last_reported_link.link_report_flags) &&
1191 	     test_bit(BNX2X_LINK_REPORT_LINK_DOWN,
1192 		      &cur_data.link_report_flags)))
1193 		return;
1194 
1195 	bp->link_cnt++;
1196 
1197 	/* We are going to report new link parameters now -
1198 	 * remember the current data for the next time.
1199 	 */
1200 	memcpy(&bp->last_reported_link, &cur_data, sizeof(cur_data));
1201 
1202 	if (test_bit(BNX2X_LINK_REPORT_LINK_DOWN,
1203 		     &cur_data.link_report_flags)) {
1204 		netif_carrier_off(bp->dev);
1205 		netdev_err(bp->dev, "NIC Link is Down\n");
1206 		return;
1207 	} else {
1208 		const char *duplex;
1209 		const char *flow;
1210 
1211 		netif_carrier_on(bp->dev);
1212 
1213 		if (test_and_clear_bit(BNX2X_LINK_REPORT_FD,
1214 				       &cur_data.link_report_flags))
1215 			duplex = "full";
1216 		else
1217 			duplex = "half";
1218 
1219 		/* Handle the FC at the end so that only these flags can
1220 		 * possibly be set. This way we may easily check whether any
1221 		 * FC is enabled at all.
1222 		 */
1223 		if (cur_data.link_report_flags) {
1224 			if (test_bit(BNX2X_LINK_REPORT_RX_FC_ON,
1225 				     &cur_data.link_report_flags)) {
1226 				if (test_bit(BNX2X_LINK_REPORT_TX_FC_ON,
1227 				     &cur_data.link_report_flags))
1228 					flow = "ON - receive & transmit";
1229 				else
1230 					flow = "ON - receive";
1231 			} else {
1232 				flow = "ON - transmit";
1233 			}
1234 		} else {
1235 			flow = "none";
1236 		}
1237 		netdev_info(bp->dev, "NIC Link is Up, %d Mbps %s duplex, Flow control: %s\n",
1238 			    cur_data.line_speed, duplex, flow);
1239 	}
1240 }
1241 
1242 static void bnx2x_set_next_page_sgl(struct bnx2x_fastpath *fp)
1243 {
1244 	int i;
1245 
1246 	for (i = 1; i <= NUM_RX_SGE_PAGES; i++) {
1247 		struct eth_rx_sge *sge;
1248 
1249 		sge = &fp->rx_sge_ring[RX_SGE_CNT * i - 2];
1250 		sge->addr_hi =
1251 			cpu_to_le32(U64_HI(fp->rx_sge_mapping +
1252 			BCM_PAGE_SIZE*(i % NUM_RX_SGE_PAGES)));
1253 
1254 		sge->addr_lo =
1255 			cpu_to_le32(U64_LO(fp->rx_sge_mapping +
1256 			BCM_PAGE_SIZE*(i % NUM_RX_SGE_PAGES)));
1257 	}
1258 }
1259 
1260 static void bnx2x_free_tpa_pool(struct bnx2x *bp,
1261 				struct bnx2x_fastpath *fp, int last)
1262 {
1263 	int i;
1264 
1265 	for (i = 0; i < last; i++) {
1266 		struct bnx2x_agg_info *tpa_info = &fp->tpa_info[i];
1267 		struct sw_rx_bd *first_buf = &tpa_info->first_buf;
1268 		u8 *data = first_buf->data;
1269 
1270 		if (data == NULL) {
1271 			DP(NETIF_MSG_IFDOWN, "tpa bin %d empty on free\n", i);
1272 			continue;
1273 		}
1274 		if (tpa_info->tpa_state == BNX2X_TPA_START)
1275 			dma_unmap_single(&bp->pdev->dev,
1276 					 dma_unmap_addr(first_buf, mapping),
1277 					 fp->rx_buf_size, DMA_FROM_DEVICE);
1278 		bnx2x_frag_free(fp, data);
1279 		first_buf->data = NULL;
1280 	}
1281 }
1282 
1283 void bnx2x_init_rx_rings_cnic(struct bnx2x *bp)
1284 {
1285 	int j;
1286 
1287 	for_each_rx_queue_cnic(bp, j) {
1288 		struct bnx2x_fastpath *fp = &bp->fp[j];
1289 
1290 		fp->rx_bd_cons = 0;
1291 
1292 		/* Activate BD ring */
1293 		/* Warning!
1294 		 * this will generate an interrupt (to the TSTORM);
1295 		 * it must only be done after the chip is initialized
1296 		 */
1297 		bnx2x_update_rx_prod(bp, fp, fp->rx_bd_prod, fp->rx_comp_prod,
1298 				     fp->rx_sge_prod);
1299 	}
1300 }
1301 
1302 void bnx2x_init_rx_rings(struct bnx2x *bp)
1303 {
1304 	int func = BP_FUNC(bp);
1305 	u16 ring_prod;
1306 	int i, j;
1307 
1308 	/* Allocate TPA resources */
1309 	for_each_eth_queue(bp, j) {
1310 		struct bnx2x_fastpath *fp = &bp->fp[j];
1311 
1312 		DP(NETIF_MSG_IFUP,
1313 		   "mtu %d  rx_buf_size %d\n", bp->dev->mtu, fp->rx_buf_size);
1314 
1315 		if (!fp->disable_tpa) {
1316 			/* Fill the per-aggregation pool */
1317 			for (i = 0; i < MAX_AGG_QS(bp); i++) {
1318 				struct bnx2x_agg_info *tpa_info =
1319 					&fp->tpa_info[i];
1320 				struct sw_rx_bd *first_buf =
1321 					&tpa_info->first_buf;
1322 
1323 				first_buf->data =
1324 					bnx2x_frag_alloc(fp, GFP_KERNEL);
1325 				if (!first_buf->data) {
1326 					BNX2X_ERR("Failed to allocate TPA skb pool for queue[%d] - disabling TPA on this queue!\n",
1327 						  j);
1328 					bnx2x_free_tpa_pool(bp, fp, i);
1329 					fp->disable_tpa = 1;
1330 					break;
1331 				}
1332 				dma_unmap_addr_set(first_buf, mapping, 0);
1333 				tpa_info->tpa_state = BNX2X_TPA_STOP;
1334 			}
1335 
1336 			/* "next page" elements initialization */
1337 			bnx2x_set_next_page_sgl(fp);
1338 
1339 			/* set SGEs bit mask */
1340 			bnx2x_init_sge_ring_bit_mask(fp);
1341 
1342 			/* Allocate SGEs and initialize the ring elements */
1343 			for (i = 0, ring_prod = 0;
1344 			     i < MAX_RX_SGE_CNT*NUM_RX_SGE_PAGES; i++) {
1345 
1346 				if (bnx2x_alloc_rx_sge(bp, fp, ring_prod,
1347 						       GFP_KERNEL) < 0) {
1348 					BNX2X_ERR("was only able to allocate %d rx sges\n",
1349 						  i);
1350 					BNX2X_ERR("disabling TPA for queue[%d]\n",
1351 						  j);
1352 					/* Cleanup already allocated elements */
1353 					bnx2x_free_rx_sge_range(bp, fp,
1354 								ring_prod);
1355 					bnx2x_free_tpa_pool(bp, fp,
1356 							    MAX_AGG_QS(bp));
1357 					fp->disable_tpa = 1;
1358 					ring_prod = 0;
1359 					break;
1360 				}
1361 				ring_prod = NEXT_SGE_IDX(ring_prod);
1362 			}
1363 
1364 			fp->rx_sge_prod = ring_prod;
1365 		}
1366 	}
1367 
1368 	for_each_eth_queue(bp, j) {
1369 		struct bnx2x_fastpath *fp = &bp->fp[j];
1370 
1371 		fp->rx_bd_cons = 0;
1372 
1373 		/* Activate BD ring */
1374 		/* Warning!
1375 		 * this will generate an interrupt (to the TSTORM);
1376 		 * it must only be done after the chip is initialized
1377 		 */
1378 		bnx2x_update_rx_prod(bp, fp, fp->rx_bd_prod, fp->rx_comp_prod,
1379 				     fp->rx_sge_prod);
1380 
1381 		if (j != 0)
1382 			continue;
1383 
1384 		if (CHIP_IS_E1(bp)) {
1385 			REG_WR(bp, BAR_USTRORM_INTMEM +
1386 			       USTORM_MEM_WORKAROUND_ADDRESS_OFFSET(func),
1387 			       U64_LO(fp->rx_comp_mapping));
1388 			REG_WR(bp, BAR_USTRORM_INTMEM +
1389 			       USTORM_MEM_WORKAROUND_ADDRESS_OFFSET(func) + 4,
1390 			       U64_HI(fp->rx_comp_mapping));
1391 		}
1392 	}
1393 }
1394 
1395 static void bnx2x_free_tx_skbs_queue(struct bnx2x_fastpath *fp)
1396 {
1397 	u8 cos;
1398 	struct bnx2x *bp = fp->bp;
1399 
1400 	for_each_cos_in_tx_queue(fp, cos) {
1401 		struct bnx2x_fp_txdata *txdata = fp->txdata_ptr[cos];
1402 		unsigned pkts_compl = 0, bytes_compl = 0;
1403 
1404 		u16 sw_prod = txdata->tx_pkt_prod;
1405 		u16 sw_cons = txdata->tx_pkt_cons;
1406 
1407 		while (sw_cons != sw_prod) {
1408 			bnx2x_free_tx_pkt(bp, txdata, TX_BD(sw_cons),
1409 					  &pkts_compl, &bytes_compl);
1410 			sw_cons++;
1411 		}
1412 
1413 		netdev_tx_reset_queue(
1414 			netdev_get_tx_queue(bp->dev,
1415 					    txdata->txq_index));
1416 	}
1417 }
1418 
1419 static void bnx2x_free_tx_skbs_cnic(struct bnx2x *bp)
1420 {
1421 	int i;
1422 
1423 	for_each_tx_queue_cnic(bp, i) {
1424 		bnx2x_free_tx_skbs_queue(&bp->fp[i]);
1425 	}
1426 }
1427 
1428 static void bnx2x_free_tx_skbs(struct bnx2x *bp)
1429 {
1430 	int i;
1431 
1432 	for_each_eth_queue(bp, i) {
1433 		bnx2x_free_tx_skbs_queue(&bp->fp[i]);
1434 	}
1435 }
1436 
1437 static void bnx2x_free_rx_bds(struct bnx2x_fastpath *fp)
1438 {
1439 	struct bnx2x *bp = fp->bp;
1440 	int i;
1441 
1442 	/* ring wasn't allocated */
1443 	if (fp->rx_buf_ring == NULL)
1444 		return;
1445 
1446 	for (i = 0; i < NUM_RX_BD; i++) {
1447 		struct sw_rx_bd *rx_buf = &fp->rx_buf_ring[i];
1448 		u8 *data = rx_buf->data;
1449 
1450 		if (data == NULL)
1451 			continue;
1452 		dma_unmap_single(&bp->pdev->dev,
1453 				 dma_unmap_addr(rx_buf, mapping),
1454 				 fp->rx_buf_size, DMA_FROM_DEVICE);
1455 
1456 		rx_buf->data = NULL;
1457 		bnx2x_frag_free(fp, data);
1458 	}
1459 }
1460 
1461 static void bnx2x_free_rx_skbs_cnic(struct bnx2x *bp)
1462 {
1463 	int j;
1464 
1465 	for_each_rx_queue_cnic(bp, j) {
1466 		bnx2x_free_rx_bds(&bp->fp[j]);
1467 	}
1468 }
1469 
1470 static void bnx2x_free_rx_skbs(struct bnx2x *bp)
1471 {
1472 	int j;
1473 
1474 	for_each_eth_queue(bp, j) {
1475 		struct bnx2x_fastpath *fp = &bp->fp[j];
1476 
1477 		bnx2x_free_rx_bds(fp);
1478 
1479 		if (!fp->disable_tpa)
1480 			bnx2x_free_tpa_pool(bp, fp, MAX_AGG_QS(bp));
1481 	}
1482 }
1483 
1484 void bnx2x_free_skbs_cnic(struct bnx2x *bp)
1485 {
1486 	bnx2x_free_tx_skbs_cnic(bp);
1487 	bnx2x_free_rx_skbs_cnic(bp);
1488 }
1489 
1490 void bnx2x_free_skbs(struct bnx2x *bp)
1491 {
1492 	bnx2x_free_tx_skbs(bp);
1493 	bnx2x_free_rx_skbs(bp);
1494 }
1495 
1496 void bnx2x_update_max_mf_config(struct bnx2x *bp, u32 value)
1497 {
1498 	/* load old values */
1499 	u32 mf_cfg = bp->mf_config[BP_VN(bp)];
1500 
1501 	if (value != bnx2x_extract_max_cfg(bp, mf_cfg)) {
1502 		/* leave all but MAX value */
1503 		mf_cfg &= ~FUNC_MF_CFG_MAX_BW_MASK;
1504 
1505 		/* set new MAX value */
1506 		mf_cfg |= (value << FUNC_MF_CFG_MAX_BW_SHIFT)
1507 				& FUNC_MF_CFG_MAX_BW_MASK;
1508 
1509 		bnx2x_fw_command(bp, DRV_MSG_CODE_SET_MF_BW, mf_cfg);
1510 	}
1511 }
1512 
1513 /**
1514  * bnx2x_free_msix_irqs - free previously requested MSI-X IRQ vectors
1515  *
1516  * @bp:		driver handle
1517  * @nvecs:	number of vectors to be released
1518  */
1519 static void bnx2x_free_msix_irqs(struct bnx2x *bp, int nvecs)
1520 {
1521 	int i, offset = 0;
1522 
1523 	if (nvecs == offset)
1524 		return;
1525 
1526 	/* VFs don't have a default SB */
1527 	if (IS_PF(bp)) {
1528 		free_irq(bp->msix_table[offset].vector, bp->dev);
1529 		DP(NETIF_MSG_IFDOWN, "released sp irq (%d)\n",
1530 		   bp->msix_table[offset].vector);
1531 		offset++;
1532 	}
1533 
1534 	if (CNIC_SUPPORT(bp)) {
1535 		if (nvecs == offset)
1536 			return;
1537 		offset++;
1538 	}
1539 
1540 	for_each_eth_queue(bp, i) {
1541 		if (nvecs == offset)
1542 			return;
1543 		DP(NETIF_MSG_IFDOWN, "about to release fp #%d->%d irq\n",
1544 		   i, bp->msix_table[offset].vector);
1545 
1546 		free_irq(bp->msix_table[offset++].vector, &bp->fp[i]);
1547 	}
1548 }
1549 
1550 void bnx2x_free_irq(struct bnx2x *bp)
1551 {
1552 	if (bp->flags & USING_MSIX_FLAG &&
1553 	    !(bp->flags & USING_SINGLE_MSIX_FLAG)) {
1554 		int nvecs = BNX2X_NUM_ETH_QUEUES(bp) + CNIC_SUPPORT(bp);
1555 
1556 		/* vfs don't have a default status block */
1557 		if (IS_PF(bp))
1558 			nvecs++;
1559 
1560 		bnx2x_free_msix_irqs(bp, nvecs);
1561 	} else {
1562 		free_irq(bp->dev->irq, bp->dev);
1563 	}
1564 }
1565 
1566 int bnx2x_enable_msix(struct bnx2x *bp)
1567 {
1568 	int msix_vec = 0, i, rc;
1569 
1570 	/* VFs don't have a default status block */
1571 	if (IS_PF(bp)) {
1572 		bp->msix_table[msix_vec].entry = msix_vec;
1573 		BNX2X_DEV_INFO("msix_table[0].entry = %d (slowpath)\n",
1574 			       bp->msix_table[0].entry);
1575 		msix_vec++;
1576 	}
1577 
1578 	/* Cnic requires an msix vector for itself */
1579 	if (CNIC_SUPPORT(bp)) {
1580 		bp->msix_table[msix_vec].entry = msix_vec;
1581 		BNX2X_DEV_INFO("msix_table[%d].entry = %d (CNIC)\n",
1582 			       msix_vec, bp->msix_table[msix_vec].entry);
1583 		msix_vec++;
1584 	}
1585 
1586 	/* We need separate vectors for ETH queues only (not FCoE) */
1587 	for_each_eth_queue(bp, i) {
1588 		bp->msix_table[msix_vec].entry = msix_vec;
1589 		BNX2X_DEV_INFO("msix_table[%d].entry = %d (fastpath #%u)\n",
1590 			       msix_vec, msix_vec, i);
1591 		msix_vec++;
1592 	}
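	/* The resulting vector layout is thus:
	 * [slowpath (PF only)] [CNIC (if supported)] [one vector per ETH queue]
	 */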
1593 
1594 	DP(BNX2X_MSG_SP, "about to request enable msix with %d vectors\n",
1595 	   msix_vec);
1596 
1597 	rc = pci_enable_msix(bp->pdev, &bp->msix_table[0], msix_vec);
1598 
1599 	/*
1600 	 * reconfigure number of tx/rx queues according to available
1601 	 * MSI-X vectors
1602 	 */
1603 	if (rc >= BNX2X_MIN_MSIX_VEC_CNT(bp)) {
1604 		/* how many fewer vectors do we have? */
1605 		int diff = msix_vec - rc;
1606 
1607 		BNX2X_DEV_INFO("Trying to use less MSI-X vectors: %d\n", rc);
1608 
1609 		rc = pci_enable_msix(bp->pdev, &bp->msix_table[0], rc);
1610 
1611 		if (rc) {
1612 			BNX2X_DEV_INFO("MSI-X is not attainable rc %d\n", rc);
1613 			goto no_msix;
1614 		}
1615 		/*
1616 		 * decrease number of queues by number of unallocated entries
1617 		 */
1618 		bp->num_ethernet_queues -= diff;
1619 		bp->num_queues = bp->num_ethernet_queues + bp->num_cnic_queues;
1620 
1621 		BNX2X_DEV_INFO("New queue configuration set: %d\n",
1622 			       bp->num_queues);
1623 	} else if (rc > 0) {
1624 		/* Get by with single vector */
1625 		rc = pci_enable_msix(bp->pdev, &bp->msix_table[0], 1);
1626 		if (rc) {
1627 			BNX2X_DEV_INFO("Single MSI-X is not attainable rc %d\n",
1628 				       rc);
1629 			goto no_msix;
1630 		}
1631 
1632 		BNX2X_DEV_INFO("Using single MSI-X vector\n");
1633 		bp->flags |= USING_SINGLE_MSIX_FLAG;
1634 
1635 		BNX2X_DEV_INFO("set number of queues to 1\n");
1636 		bp->num_ethernet_queues = 1;
1637 		bp->num_queues = bp->num_ethernet_queues + bp->num_cnic_queues;
1638 	} else if (rc < 0) {
1639 		BNX2X_DEV_INFO("MSI-X is not attainable  rc %d\n", rc);
1640 		goto no_msix;
1641 	}
1642 
1643 	bp->flags |= USING_MSIX_FLAG;
1644 
1645 	return 0;
1646 
1647 no_msix:
1648 	/* fall back to INTx if there is not enough memory */
1649 	if (rc == -ENOMEM)
1650 		bp->flags |= DISABLE_MSI_FLAG;
1651 
1652 	return rc;
1653 }
1654 
1655 static int bnx2x_req_msix_irqs(struct bnx2x *bp)
1656 {
1657 	int i, rc, offset = 0;
1658 
1659 	/* no default status block for vf */
1660 	if (IS_PF(bp)) {
1661 		rc = request_irq(bp->msix_table[offset++].vector,
1662 				 bnx2x_msix_sp_int, 0,
1663 				 bp->dev->name, bp->dev);
1664 		if (rc) {
1665 			BNX2X_ERR("request sp irq failed\n");
1666 			return -EBUSY;
1667 		}
1668 	}
1669 
1670 	if (CNIC_SUPPORT(bp))
1671 		offset++;
1672 
1673 	for_each_eth_queue(bp, i) {
1674 		struct bnx2x_fastpath *fp = &bp->fp[i];
1675 		snprintf(fp->name, sizeof(fp->name), "%s-fp-%d",
1676 			 bp->dev->name, i);
1677 
1678 		rc = request_irq(bp->msix_table[offset].vector,
1679 				 bnx2x_msix_fp_int, 0, fp->name, fp);
1680 		if (rc) {
1681 			BNX2X_ERR("request fp #%d irq (%d) failed  rc %d\n", i,
1682 			      bp->msix_table[offset].vector, rc);
1683 			bnx2x_free_msix_irqs(bp, offset);
1684 			return -EBUSY;
1685 		}
1686 
1687 		offset++;
1688 	}
1689 
1690 	i = BNX2X_NUM_ETH_QUEUES(bp);
1691 	if (IS_PF(bp)) {
1692 		offset = 1 + CNIC_SUPPORT(bp);
1693 		netdev_info(bp->dev,
1694 			    "using MSI-X  IRQs: sp %d  fp[%d] %d ... fp[%d] %d\n",
1695 			    bp->msix_table[0].vector,
1696 			    0, bp->msix_table[offset].vector,
1697 			    i - 1, bp->msix_table[offset + i - 1].vector);
1698 	} else {
1699 		offset = CNIC_SUPPORT(bp);
1700 		netdev_info(bp->dev,
1701 			    "using MSI-X  IRQs: fp[%d] %d ... fp[%d] %d\n",
1702 			    0, bp->msix_table[offset].vector,
1703 			    i - 1, bp->msix_table[offset + i - 1].vector);
1704 	}
1705 	return 0;
1706 }
1707 
1708 int bnx2x_enable_msi(struct bnx2x *bp)
1709 {
1710 	int rc;
1711 
1712 	rc = pci_enable_msi(bp->pdev);
1713 	if (rc) {
1714 		BNX2X_DEV_INFO("MSI is not attainable\n");
1715 		return -1;
1716 	}
1717 	bp->flags |= USING_MSI_FLAG;
1718 
1719 	return 0;
1720 }
1721 
1722 static int bnx2x_req_irq(struct bnx2x *bp)
1723 {
1724 	unsigned long flags;
1725 	unsigned int irq;
1726 
1727 	if (bp->flags & (USING_MSI_FLAG | USING_MSIX_FLAG))
1728 		flags = 0;
1729 	else
1730 		flags = IRQF_SHARED;
1731 
1732 	if (bp->flags & USING_MSIX_FLAG)
1733 		irq = bp->msix_table[0].vector;
1734 	else
1735 		irq = bp->pdev->irq;
1736 
1737 	return request_irq(irq, bnx2x_interrupt, flags, bp->dev->name, bp->dev);
1738 }
1739 
1740 static int bnx2x_setup_irqs(struct bnx2x *bp)
1741 {
1742 	int rc = 0;
1743 	if (bp->flags & USING_MSIX_FLAG &&
1744 	    !(bp->flags & USING_SINGLE_MSIX_FLAG)) {
1745 		rc = bnx2x_req_msix_irqs(bp);
1746 		if (rc)
1747 			return rc;
1748 	} else {
1749 		rc = bnx2x_req_irq(bp);
1750 		if (rc) {
1751 			BNX2X_ERR("IRQ request failed  rc %d, aborting\n", rc);
1752 			return rc;
1753 		}
1754 		if (bp->flags & USING_MSI_FLAG) {
1755 			bp->dev->irq = bp->pdev->irq;
1756 			netdev_info(bp->dev, "using MSI IRQ %d\n",
1757 				    bp->dev->irq);
1758 		}
1759 		if (bp->flags & USING_MSIX_FLAG) {
1760 			bp->dev->irq = bp->msix_table[0].vector;
1761 			netdev_info(bp->dev, "using MSIX IRQ %d\n",
1762 				    bp->dev->irq);
1763 		}
1764 	}
1765 
1766 	return 0;
1767 }
1768 
1769 static void bnx2x_napi_enable_cnic(struct bnx2x *bp)
1770 {
1771 	int i;
1772 
1773 	for_each_rx_queue_cnic(bp, i) {
1774 		bnx2x_fp_init_lock(&bp->fp[i]);
1775 		napi_enable(&bnx2x_fp(bp, i, napi));
1776 	}
1777 }
1778 
1779 static void bnx2x_napi_enable(struct bnx2x *bp)
1780 {
1781 	int i;
1782 
1783 	for_each_eth_queue(bp, i) {
1784 		bnx2x_fp_init_lock(&bp->fp[i]);
1785 		napi_enable(&bnx2x_fp(bp, i, napi));
1786 	}
1787 }
1788 
1789 static void bnx2x_napi_disable_cnic(struct bnx2x *bp)
1790 {
1791 	int i;
1792 
1793 	local_bh_disable();
1794 	for_each_rx_queue_cnic(bp, i) {
1795 		napi_disable(&bnx2x_fp(bp, i, napi));
1796 		while (!bnx2x_fp_lock_napi(&bp->fp[i]))
1797 			mdelay(1);
1798 	}
1799 	local_bh_enable();
1800 }
1801 
1802 static void bnx2x_napi_disable(struct bnx2x *bp)
1803 {
1804 	int i;
1805 
1806 	local_bh_disable();
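	/* Besides napi_disable(), wait for any busy-poll user of each queue
	 * to release the per-fastpath lock; only once bnx2x_fp_lock_napi()
	 * succeeds can we assume nobody else is polling that ring (our
	 * reading of the busy-poll locking scheme).
	 */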
1807 	for_each_eth_queue(bp, i) {
1808 		napi_disable(&bnx2x_fp(bp, i, napi));
1809 		while (!bnx2x_fp_lock_napi(&bp->fp[i]))
1810 			mdelay(1);
1811 	}
1812 	local_bh_enable();
1813 }
1814 
1815 void bnx2x_netif_start(struct bnx2x *bp)
1816 {
1817 	if (netif_running(bp->dev)) {
1818 		bnx2x_napi_enable(bp);
1819 		if (CNIC_LOADED(bp))
1820 			bnx2x_napi_enable_cnic(bp);
1821 		bnx2x_int_enable(bp);
1822 		if (bp->state == BNX2X_STATE_OPEN)
1823 			netif_tx_wake_all_queues(bp->dev);
1824 	}
1825 }
1826 
1827 void bnx2x_netif_stop(struct bnx2x *bp, int disable_hw)
1828 {
1829 	bnx2x_int_disable_sync(bp, disable_hw);
1830 	bnx2x_napi_disable(bp);
1831 	if (CNIC_LOADED(bp))
1832 		bnx2x_napi_disable_cnic(bp);
1833 }
1834 
1835 u16 bnx2x_select_queue(struct net_device *dev, struct sk_buff *skb)
1836 {
1837 	struct bnx2x *bp = netdev_priv(dev);
1838 
1839 	if (CNIC_LOADED(bp) && !NO_FCOE(bp)) {
1840 		struct ethhdr *hdr = (struct ethhdr *)skb->data;
1841 		u16 ether_type = ntohs(hdr->h_proto);
1842 
1843 		/* Skip VLAN tag if present */
1844 		if (ether_type == ETH_P_8021Q) {
1845 			struct vlan_ethhdr *vhdr =
1846 				(struct vlan_ethhdr *)skb->data;
1847 
1848 			ether_type = ntohs(vhdr->h_vlan_encapsulated_proto);
1849 		}
1850 
1851 		/* If ethertype is FCoE or FIP - use FCoE ring */
1852 		if ((ether_type == ETH_P_FCOE) || (ether_type == ETH_P_FIP))
1853 			return bnx2x_fcoe_tx(bp, txq_index);
1854 	}
1855 
1856 	/* select a non-FCoE queue */
1857 	return __netdev_pick_tx(dev, skb) % BNX2X_NUM_ETH_QUEUES(bp);
1858 }
1859 
1860 void bnx2x_set_num_queues(struct bnx2x *bp)
1861 {
1862 	/* RSS queues */
1863 	bp->num_ethernet_queues = bnx2x_calc_num_queues(bp);
1864 
1865 	/* override in STORAGE SD modes */
1866 	if (IS_MF_STORAGE_SD(bp) || IS_MF_FCOE_AFEX(bp))
1867 		bp->num_ethernet_queues = 1;
1868 
1869 	/* Add special queues */
1870 	bp->num_cnic_queues = CNIC_SUPPORT(bp); /* For FCOE */
1871 	bp->num_queues = bp->num_ethernet_queues + bp->num_cnic_queues;
1872 
1873 	BNX2X_DEV_INFO("set number of queues to %d\n", bp->num_queues);
1874 }
1875 
1876 /**
1877  * bnx2x_set_real_num_queues - configure netdev->real_num_[tx,rx]_queues
1878  *
1879  * @bp:		Driver handle
1880  *
1881  * We currently support at most 16 Tx queues for each CoS, thus we will
1882  * allocate a multiple of 16 for ETH L2 rings according to the value of the
1883  * bp->max_cos.
1884  *
1885  * If there is an FCoE L2 queue the appropriate Tx queue will have the next
1886  * index after all ETH L2 indices.
1887  *
1888  * If the actual number of Tx queues (for each CoS) is less than 16 then there
1889  * will be holes at the end of each group of 16 ETH L2 indices (0..15,
1890  * 16..31,...) with indices that are not coupled with any real Tx queue.
1891  *
1892  * The proper configuration of skb->queue_mapping is handled by
1893  * bnx2x_select_queue() and __skb_tx_hash().
1894  *
1895  * bnx2x_setup_tc() takes care of the proper TC mappings so that __skb_tx_hash()
1896  * will return a proper Tx index if TC is enabled (netdev->num_tc > 0).
1897  */
1898 static int bnx2x_set_real_num_queues(struct bnx2x *bp, int include_cnic)
1899 {
1900 	int rc, tx, rx;
1901 
1902 	tx = BNX2X_NUM_ETH_QUEUES(bp) * bp->max_cos;
1903 	rx = BNX2X_NUM_ETH_QUEUES(bp);
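	/* For example (hypothetical numbers): with 8 ETH queues and
	 * max_cos == 3 this requests 24 Tx and 8 Rx queues; the FCoE L2
	 * queue accounted for below adds one more of each.
	 */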
1904 
1905 	/* account for fcoe queue */
1906 	if (include_cnic && !NO_FCOE(bp)) {
1907 		rx++;
1908 		tx++;
1909 	}
1910 
1911 	rc = netif_set_real_num_tx_queues(bp->dev, tx);
1912 	if (rc) {
1913 		BNX2X_ERR("Failed to set real number of Tx queues: %d\n", rc);
1914 		return rc;
1915 	}
1916 	rc = netif_set_real_num_rx_queues(bp->dev, rx);
1917 	if (rc) {
1918 		BNX2X_ERR("Failed to set real number of Rx queues: %d\n", rc);
1919 		return rc;
1920 	}
1921 
1922 	DP(NETIF_MSG_IFUP, "Setting real num queues to (tx, rx) (%d, %d)\n",
1923 			  tx, rx);
1924 
1925 	return rc;
1926 }
1927 
1928 static void bnx2x_set_rx_buf_size(struct bnx2x *bp)
1929 {
1930 	int i;
1931 
1932 	for_each_queue(bp, i) {
1933 		struct bnx2x_fastpath *fp = &bp->fp[i];
1934 		u32 mtu;
1935 
1936 		/* Always use a mini-jumbo MTU for the FCoE L2 ring */
1937 		if (IS_FCOE_IDX(i))
1938 			/*
1939 			 * Although no IP frames are expected to arrive on
1940 			 * this ring, we still want to add
1941 			 * IP_HEADER_ALIGNMENT_PADDING to prevent a buffer
1942 			 * overrun attack.
1943 			 */
1944 			mtu = BNX2X_FCOE_MINI_JUMBO_MTU;
1945 		else
1946 			mtu = bp->dev->mtu;
1947 		fp->rx_buf_size = BNX2X_FW_RX_ALIGN_START +
1948 				  IP_HEADER_ALIGNMENT_PADDING +
1949 				  ETH_OVREHEAD +
1950 				  mtu +
1951 				  BNX2X_FW_RX_ALIGN_END;
1952 		/* Note: rx_buf_size doesn't take into account NET_SKB_PAD */
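		/* When the buffer plus NET_SKB_PAD fits in a single page the
		 * Rx path can use the page-frag allocator (rx_frag_size != 0);
		 * otherwise it falls back to kmalloc'ed buffers.
		 */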
1953 		if (fp->rx_buf_size + NET_SKB_PAD <= PAGE_SIZE)
1954 			fp->rx_frag_size = fp->rx_buf_size + NET_SKB_PAD;
1955 		else
1956 			fp->rx_frag_size = 0;
1957 	}
1958 }
1959 
1960 static int bnx2x_init_rss(struct bnx2x *bp)
1961 {
1962 	int i;
1963 	u8 num_eth_queues = BNX2X_NUM_ETH_QUEUES(bp);
1964 
1965 	/* Prepare the initial contents for the indirection table if RSS is
1966 	 * enabled
1967 	 */
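	/* ethtool_rxfh_indir_default(i, n) is simply i % n, so by default
	 * Rx flows are spread round-robin across the client IDs of the ETH
	 * queues.
	 */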
1968 	for (i = 0; i < sizeof(bp->rss_conf_obj.ind_table); i++)
1969 		bp->rss_conf_obj.ind_table[i] =
1970 			bp->fp->cl_id +
1971 			ethtool_rxfh_indir_default(i, num_eth_queues);
1972 
1973 	/*
1974 	 * For 57710 and 57711 SEARCHER configuration (rss_keys) is
1975 	 * per-port, so if explicit configuration is needed, do it only
1976 	 * for a PMF.
1977 	 *
1978 	 * For 57712 and newer on the other hand it's a per-function
1979 	 * configuration.
1980 	 */
1981 	return bnx2x_config_rss_eth(bp, bp->port.pmf || !CHIP_IS_E1x(bp));
1982 }
1983 
1984 int bnx2x_rss(struct bnx2x *bp, struct bnx2x_rss_config_obj *rss_obj,
1985 	      bool config_hash, bool enable)
1986 {
1987 	struct bnx2x_config_rss_params params = {NULL};
1988 
1989 	/* Although RSS is meaningless when there is a single HW queue we
1990 	 * still need it enabled in order to have HW Rx hash generated.
1991 	 *
1992 	 * if (!is_eth_multi(bp))
1993 	 *      bp->multi_mode = ETH_RSS_MODE_DISABLED;
1994 	 */
1995 
1996 	params.rss_obj = rss_obj;
1997 
1998 	__set_bit(RAMROD_COMP_WAIT, &params.ramrod_flags);
1999 
2000 	if (enable) {
2001 		__set_bit(BNX2X_RSS_MODE_REGULAR, &params.rss_flags);
2002 
2003 		/* RSS configuration */
2004 		__set_bit(BNX2X_RSS_IPV4, &params.rss_flags);
2005 		__set_bit(BNX2X_RSS_IPV4_TCP, &params.rss_flags);
2006 		__set_bit(BNX2X_RSS_IPV6, &params.rss_flags);
2007 		__set_bit(BNX2X_RSS_IPV6_TCP, &params.rss_flags);
2008 		if (rss_obj->udp_rss_v4)
2009 			__set_bit(BNX2X_RSS_IPV4_UDP, &params.rss_flags);
2010 		if (rss_obj->udp_rss_v6)
2011 			__set_bit(BNX2X_RSS_IPV6_UDP, &params.rss_flags);
2012 	} else {
2013 		__set_bit(BNX2X_RSS_MODE_DISABLED, &params.rss_flags);
2014 	}
2015 
2016 	/* Hash bits */
2017 	params.rss_result_mask = MULTI_MASK;
2018 
2019 	memcpy(params.ind_table, rss_obj->ind_table, sizeof(params.ind_table));
2020 
2021 	if (config_hash) {
2022 		/* RSS keys */
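		/* T_ETH_RSS_KEY is the key length in 32-bit words, hence the
		 * '* 4' to get the length in bytes.
		 */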
2023 		prandom_bytes(params.rss_key, T_ETH_RSS_KEY * 4);
2024 		__set_bit(BNX2X_RSS_SET_SRCH, &params.rss_flags);
2025 	}
2026 
2027 	if (IS_PF(bp))
2028 		return bnx2x_config_rss(bp, &params);
2029 	else
2030 		return bnx2x_vfpf_config_rss(bp, &params);
2031 }
2032 
2033 static int bnx2x_init_hw(struct bnx2x *bp, u32 load_code)
2034 {
2035 	struct bnx2x_func_state_params func_params = {NULL};
2036 
2037 	/* Prepare parameters for function state transitions */
2038 	__set_bit(RAMROD_COMP_WAIT, &func_params.ramrod_flags);
2039 
2040 	func_params.f_obj = &bp->func_obj;
2041 	func_params.cmd = BNX2X_F_CMD_HW_INIT;
2042 
2043 	func_params.params.hw_init.load_phase = load_code;
2044 
2045 	return bnx2x_func_state_change(bp, &func_params);
2046 }
2047 
2048 /*
2049  * Cleans the objects that have internal lists without sending
2050  * ramrods. Should be run when interrupts are disabled.
2051  */
2052 void bnx2x_squeeze_objects(struct bnx2x *bp)
2053 {
2054 	int rc;
2055 	unsigned long ramrod_flags = 0, vlan_mac_flags = 0;
2056 	struct bnx2x_mcast_ramrod_params rparam = {NULL};
2057 	struct bnx2x_vlan_mac_obj *mac_obj = &bp->sp_objs->mac_obj;
2058 
2059 	/***************** Cleanup MACs' object first *************************/
2060 
2061 	/* Wait for completion of the requested commands */
2062 	__set_bit(RAMROD_COMP_WAIT, &ramrod_flags);
2063 	/* Perform a dry cleanup */
2064 	__set_bit(RAMROD_DRV_CLR_ONLY, &ramrod_flags);
2065 
2066 	/* Clean ETH primary MAC */
2067 	__set_bit(BNX2X_ETH_MAC, &vlan_mac_flags);
2068 	rc = mac_obj->delete_all(bp, &bp->sp_objs->mac_obj, &vlan_mac_flags,
2069 				 &ramrod_flags);
2070 	if (rc != 0)
2071 		BNX2X_ERR("Failed to clean ETH MACs: %d\n", rc);
2072 
2073 	/* Cleanup UC list */
2074 	vlan_mac_flags = 0;
2075 	__set_bit(BNX2X_UC_LIST_MAC, &vlan_mac_flags);
2076 	rc = mac_obj->delete_all(bp, mac_obj, &vlan_mac_flags,
2077 				 &ramrod_flags);
2078 	if (rc != 0)
2079 		BNX2X_ERR("Failed to clean UC list MACs: %d\n", rc);
2080 
2081 	/***************** Now clean mcast object *****************************/
2082 	rparam.mcast_obj = &bp->mcast_obj;
2083 	__set_bit(RAMROD_DRV_CLR_ONLY, &rparam.ramrod_flags);
2084 
2085 	/* Add a DEL command... - Since we're doing a driver cleanup only,
2086 	 * we take a lock surrounding both the initial send and the CONTs,
2087 	 * as we don't want a true completion to disrupt us in the middle.
2088 	 */
2089 	netif_addr_lock_bh(bp->dev);
2090 	rc = bnx2x_config_mcast(bp, &rparam, BNX2X_MCAST_CMD_DEL);
2091 	if (rc < 0)
2092 		BNX2X_ERR("Failed to add a new DEL command to a multi-cast object: %d\n",
2093 			  rc);
2094 
2095 	/* ...and wait until all pending commands are cleared */
2096 	rc = bnx2x_config_mcast(bp, &rparam, BNX2X_MCAST_CMD_CONT);
2097 	while (rc != 0) {
2098 		if (rc < 0) {
2099 			BNX2X_ERR("Failed to clean multi-cast object: %d\n",
2100 				  rc);
2101 			netif_addr_unlock_bh(bp->dev);
2102 			return;
2103 		}
2104 
2105 		rc = bnx2x_config_mcast(bp, &rparam, BNX2X_MCAST_CMD_CONT);
2106 	}
2107 	netif_addr_unlock_bh(bp->dev);
2108 }
2109 
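/* Error-exit helpers for the load flows below: without BNX2X_STOP_ON_ERROR
 * they record the failure (error state / cnic not loaded) and jump to the
 * supplied cleanup label; with it they flag a panic and return immediately
 * so the failing state can be inspected.
 */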
2110 #ifndef BNX2X_STOP_ON_ERROR
2111 #define LOAD_ERROR_EXIT(bp, label) \
2112 	do { \
2113 		(bp)->state = BNX2X_STATE_ERROR; \
2114 		goto label; \
2115 	} while (0)
2116 
2117 #define LOAD_ERROR_EXIT_CNIC(bp, label) \
2118 	do { \
2119 		bp->cnic_loaded = false; \
2120 		goto label; \
2121 	} while (0)
2122 #else /*BNX2X_STOP_ON_ERROR*/
2123 #define LOAD_ERROR_EXIT(bp, label) \
2124 	do { \
2125 		(bp)->state = BNX2X_STATE_ERROR; \
2126 		(bp)->panic = 1; \
2127 		return -EBUSY; \
2128 	} while (0)
2129 #define LOAD_ERROR_EXIT_CNIC(bp, label) \
2130 	do { \
2131 		bp->cnic_loaded = false; \
2132 		(bp)->panic = 1; \
2133 		return -EBUSY; \
2134 	} while (0)
2135 #endif /*BNX2X_STOP_ON_ERROR*/
2136 
2137 static void bnx2x_free_fw_stats_mem(struct bnx2x *bp)
2138 {
2139 	BNX2X_PCI_FREE(bp->fw_stats, bp->fw_stats_mapping,
2140 		       bp->fw_stats_data_sz + bp->fw_stats_req_sz);
2141 	return;
2142 }
2143 
2144 static int bnx2x_alloc_fw_stats_mem(struct bnx2x *bp)
2145 {
2146 	int num_groups, vf_headroom = 0;
2147 	int is_fcoe_stats = NO_FCOE(bp) ? 0 : 1;
2148 
2149 	/* number of queues for statistics is number of eth queues + FCoE */
2150 	u8 num_queue_stats = BNX2X_NUM_ETH_QUEUES(bp) + is_fcoe_stats;
2151 
2152 	/* Total number of FW statistics requests =
2153 	 * 1 for port stats + 1 for PF stats + potential 2 for FCoE (fcoe proper
2154 	 * and fcoe l2 queue) stats + num of queues (which includes another 1
2155 	 * for fcoe l2 queue if applicable)
2156 	 */
2157 	bp->fw_stats_num = 2 + is_fcoe_stats + num_queue_stats;
2158 
2159 	/* vf stats appear in the request list, but their data is allocated by
2160 	 * the VFs themselves. We don't include them in the bp->fw_stats_num as
2161 	 * it is used to determine where to place the vf stats queries in the
2162 	 * request struct
2163 	 */
2164 	if (IS_SRIOV(bp))
2165 		vf_headroom = bnx2x_vf_headroom(bp);
2166 
2167 	/* Request is built from stats_query_header and an array of
2168 	 * stats_query_cmd_group each of which contains
2169 	 * STATS_QUERY_CMD_COUNT rules. The real number of requests is
2170 	 * configured in the stats_query_header.
2171 	 */
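	/* Example (hypothetical numbers): if STATS_QUERY_CMD_COUNT were 16,
	 * then 10 total requests would need one command group and 20 would
	 * need two - i.e. the ceiling division computed below.
	 */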
2172 	num_groups =
2173 		(((bp->fw_stats_num + vf_headroom) / STATS_QUERY_CMD_COUNT) +
2174 		 (((bp->fw_stats_num + vf_headroom) % STATS_QUERY_CMD_COUNT) ?
2175 		 1 : 0));
2176 
2177 	DP(BNX2X_MSG_SP, "stats fw_stats_num %d, vf headroom %d, num_groups %d\n",
2178 	   bp->fw_stats_num, vf_headroom, num_groups);
2179 	bp->fw_stats_req_sz = sizeof(struct stats_query_header) +
2180 		num_groups * sizeof(struct stats_query_cmd_group);
2181 
2182 	/* Data for statistics requests + stats_counter
2183 	 * stats_counter holds per-STORM counters that are incremented
2184 	 * when STORM has finished with the current request.
2185 	 * Memory for FCoE offloaded statistics is counted anyway,
2186 	 * even if they will not be sent.
2187 	 * VF stats are not accounted for here as the data of VF stats is stored
2188 	 * in memory allocated by the VF, not here.
2189 	 */
2190 	bp->fw_stats_data_sz = sizeof(struct per_port_stats) +
2191 		sizeof(struct per_pf_stats) +
2192 		sizeof(struct fcoe_statistics_params) +
2193 		sizeof(struct per_queue_stats) * num_queue_stats +
2194 		sizeof(struct stats_counter);
2195 
2196 	BNX2X_PCI_ALLOC(bp->fw_stats, &bp->fw_stats_mapping,
2197 			bp->fw_stats_data_sz + bp->fw_stats_req_sz);
2198 
2199 	/* Set shortcuts */
2200 	bp->fw_stats_req = (struct bnx2x_fw_stats_req *)bp->fw_stats;
2201 	bp->fw_stats_req_mapping = bp->fw_stats_mapping;
2202 	bp->fw_stats_data = (struct bnx2x_fw_stats_data *)
2203 		((u8 *)bp->fw_stats + bp->fw_stats_req_sz);
2204 	bp->fw_stats_data_mapping = bp->fw_stats_mapping +
2205 		bp->fw_stats_req_sz;
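	/* Resulting layout of the single DMA-coherent block:
	 *
	 *   fw_stats_mapping
	 *   |<--- fw_stats_req_sz --->|<--- fw_stats_data_sz --->|
	 *   [ statistics request     ][ statistics data          ]
	 */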
2206 
2207 	DP(BNX2X_MSG_SP, "statistics request base address set to %x %x\n",
2208 	   U64_HI(bp->fw_stats_req_mapping),
2209 	   U64_LO(bp->fw_stats_req_mapping));
2210 	DP(BNX2X_MSG_SP, "statistics data base address set to %x %x\n",
2211 	   U64_HI(bp->fw_stats_data_mapping),
2212 	   U64_LO(bp->fw_stats_data_mapping));
2213 	return 0;
2214 
2215 alloc_mem_err:
2216 	bnx2x_free_fw_stats_mem(bp);
2217 	BNX2X_ERR("Can't allocate FW stats memory\n");
2218 	return -ENOMEM;
2219 }
2220 
2221 /* send load request to mcp and analyze response */
2222 static int bnx2x_nic_load_request(struct bnx2x *bp, u32 *load_code)
2223 {
2224 	u32 param;
2225 
2226 	/* init fw_seq */
2227 	bp->fw_seq =
2228 		(SHMEM_RD(bp, func_mb[BP_FW_MB_IDX(bp)].drv_mb_header) &
2229 		 DRV_MSG_SEQ_NUMBER_MASK);
2230 	BNX2X_DEV_INFO("fw_seq 0x%08x\n", bp->fw_seq);
2231 
2232 	/* Get current FW pulse sequence */
2233 	bp->fw_drv_pulse_wr_seq =
2234 		(SHMEM_RD(bp, func_mb[BP_FW_MB_IDX(bp)].drv_pulse_mb) &
2235 		 DRV_PULSE_SEQ_MASK);
2236 	BNX2X_DEV_INFO("drv_pulse 0x%x\n", bp->fw_drv_pulse_wr_seq);
2237 
2238 	param = DRV_MSG_CODE_LOAD_REQ_WITH_LFA;
2239 
2240 	if (IS_MF_SD(bp) && bnx2x_port_after_undi(bp))
2241 		param |= DRV_MSG_CODE_LOAD_REQ_FORCE_LFA;
2242 
2243 	/* load request */
2244 	(*load_code) = bnx2x_fw_command(bp, DRV_MSG_CODE_LOAD_REQ, param);
2245 
2246 	/* if mcp fails to respond we must abort */
2247 	if (!(*load_code)) {
2248 		BNX2X_ERR("MCP response failure, aborting\n");
2249 		return -EBUSY;
2250 	}
2251 
2252 	/* If mcp refused (e.g. other port is in diagnostic mode) we
2253 	 * must abort
2254 	 */
2255 	if ((*load_code) == FW_MSG_CODE_DRV_LOAD_REFUSED) {
2256 		BNX2X_ERR("MCP refused load request, aborting\n");
2257 		return -EBUSY;
2258 	}
2259 	return 0;
2260 }
2261 
2262 /* Check whether another PF has already loaded FW to the chip. In
2263  * virtualized environments a PF from another VM may have already
2264  * initialized the device, including loading the FW.
2265  */
2266 int bnx2x_nic_load_analyze_req(struct bnx2x *bp, u32 load_code)
2267 {
2268 	/* is another pf loaded on this engine? */
2269 	if (load_code != FW_MSG_CODE_DRV_LOAD_COMMON_CHIP &&
2270 	    load_code != FW_MSG_CODE_DRV_LOAD_COMMON) {
2271 		/* build my FW version dword */
2272 		u32 my_fw = (BCM_5710_FW_MAJOR_VERSION) +
2273 			(BCM_5710_FW_MINOR_VERSION << 8) +
2274 			(BCM_5710_FW_REVISION_VERSION << 16) +
2275 			(BCM_5710_FW_ENGINEERING_VERSION << 24);
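		/* Byte layout of the version dword: major | minor << 8 |
		 * revision << 16 | engineering << 24; it must match the
		 * dword read back from the chip below.
		 */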
2276 
2277 		/* read loaded FW from chip */
2278 		u32 loaded_fw = REG_RD(bp, XSEM_REG_PRAM);
2279 
2280 		DP(BNX2X_MSG_SP, "loaded fw %x, my fw %x\n",
2281 		   loaded_fw, my_fw);
2282 
2283 		/* abort nic load if version mismatch */
2284 		if (my_fw != loaded_fw) {
2285 			BNX2X_ERR("bnx2x with FW %x was already loaded which mismatches my %x FW. Aborting\n",
2286 				  loaded_fw, my_fw);
2287 			return -EBUSY;
2288 		}
2289 	}
2290 	return 0;
2291 }
2292 
2293 /* returns the "mcp load_code" according to global load_count array */
2294 static int bnx2x_nic_load_no_mcp(struct bnx2x *bp, int port)
2295 {
2296 	int path = BP_PATH(bp);
2297 
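	/* load_count[path][0] counts all functions on this path and
	 * load_count[path][1 + port] counts the functions per port: the
	 * first function up gets LOAD_COMMON, the first on its port gets
	 * LOAD_PORT and every other function gets LOAD_FUNCTION.
	 */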
2298 	DP(NETIF_MSG_IFUP, "NO MCP - load counts[%d]      %d, %d, %d\n",
2299 	   path, load_count[path][0], load_count[path][1],
2300 	   load_count[path][2]);
2301 	load_count[path][0]++;
2302 	load_count[path][1 + port]++;
2303 	DP(NETIF_MSG_IFUP, "NO MCP - new load counts[%d]  %d, %d, %d\n",
2304 	   path, load_count[path][0], load_count[path][1],
2305 	   load_count[path][2]);
2306 	if (load_count[path][0] == 1)
2307 		return FW_MSG_CODE_DRV_LOAD_COMMON;
2308 	else if (load_count[path][1 + port] == 1)
2309 		return FW_MSG_CODE_DRV_LOAD_PORT;
2310 	else
2311 		return FW_MSG_CODE_DRV_LOAD_FUNCTION;
2312 }
2313 
2314 /* mark PMF if applicable */
2315 static void bnx2x_nic_load_pmf(struct bnx2x *bp, u32 load_code)
2316 {
2317 	if ((load_code == FW_MSG_CODE_DRV_LOAD_COMMON) ||
2318 	    (load_code == FW_MSG_CODE_DRV_LOAD_COMMON_CHIP) ||
2319 	    (load_code == FW_MSG_CODE_DRV_LOAD_PORT)) {
2320 		bp->port.pmf = 1;
2321 		/* We need the barrier to ensure the ordering between the
2322 		 * writing to bp->port.pmf here and reading it from the
2323 		 * bnx2x_periodic_task().
2324 		 */
2325 		smp_mb();
2326 	} else {
2327 		bp->port.pmf = 0;
2328 	}
2329 
2330 	DP(NETIF_MSG_LINK, "pmf %d\n", bp->port.pmf);
2331 }
2332 
2333 static void bnx2x_nic_load_afex_dcc(struct bnx2x *bp, int load_code)
2334 {
2335 	if (((load_code == FW_MSG_CODE_DRV_LOAD_COMMON) ||
2336 	     (load_code == FW_MSG_CODE_DRV_LOAD_COMMON_CHIP)) &&
2337 	    (bp->common.shmem2_base)) {
2338 		if (SHMEM2_HAS(bp, dcc_support))
2339 			SHMEM2_WR(bp, dcc_support,
2340 				  (SHMEM_DCC_SUPPORT_DISABLE_ENABLE_PF_TLV |
2341 				   SHMEM_DCC_SUPPORT_BANDWIDTH_ALLOCATION_TLV));
2342 		if (SHMEM2_HAS(bp, afex_driver_support))
2343 			SHMEM2_WR(bp, afex_driver_support,
2344 				  SHMEM_AFEX_SUPPORTED_VERSION_ONE);
2345 	}
2346 
2347 	/* Set AFEX default VLAN tag to an invalid value */
2348 	bp->afex_def_vlan_tag = -1;
2349 }
2350 
2351 /**
2352  * bnx2x_bz_fp - zero content of the fastpath structure.
2353  *
2354  * @bp:		driver handle
2355  * @index:	fastpath index to be zeroed
2356  *
2357  * Makes sure the contents of the bp->fp[index].napi is kept
2358  * intact.
2359  */
2360 static void bnx2x_bz_fp(struct bnx2x *bp, int index)
2361 {
2362 	struct bnx2x_fastpath *fp = &bp->fp[index];
2363 	int cos;
2364 	struct napi_struct orig_napi = fp->napi;
2365 	struct bnx2x_agg_info *orig_tpa_info = fp->tpa_info;
2366 
2367 	/* bzero bnx2x_fastpath contents */
2368 	if (fp->tpa_info)
2369 		memset(fp->tpa_info, 0, ETH_MAX_AGGREGATION_QUEUES_E1H_E2 *
2370 		       sizeof(struct bnx2x_agg_info));
2371 	memset(fp, 0, sizeof(*fp));
2372 
2373 	/* Restore the NAPI object as it has been already initialized */
2374 	fp->napi = orig_napi;
2375 	fp->tpa_info = orig_tpa_info;
2376 	fp->bp = bp;
2377 	fp->index = index;
2378 	if (IS_ETH_FP(fp))
2379 		fp->max_cos = bp->max_cos;
2380 	else
2381 		/* Special queues support only one CoS */
2382 		fp->max_cos = 1;
2383 
2384 	/* Init txdata pointers */
2385 	if (IS_FCOE_FP(fp))
2386 		fp->txdata_ptr[0] = &bp->bnx2x_txq[FCOE_TXQ_IDX(bp)];
2387 	if (IS_ETH_FP(fp))
2388 		for_each_cos_in_tx_queue(fp, cos)
2389 			fp->txdata_ptr[cos] = &bp->bnx2x_txq[cos *
2390 				BNX2X_NUM_ETH_QUEUES(bp) + index];
2391 
2392 	/* set the tpa flag for each queue. The tpa flag determines the queue
2393 	 * minimal size so it must be set prior to queue memory allocation
2394 	 */
2395 	fp->disable_tpa = !(bp->flags & TPA_ENABLE_FLAG ||
2396 				  (bp->flags & GRO_ENABLE_FLAG &&
2397 				   bnx2x_mtu_allows_gro(bp->dev->mtu)));
2398 	if (bp->flags & TPA_ENABLE_FLAG)
2399 		fp->mode = TPA_MODE_LRO;
2400 	else if (bp->flags & GRO_ENABLE_FLAG)
2401 		fp->mode = TPA_MODE_GRO;
2402 
2403 	/* We don't want TPA on an FCoE L2 ring */
2404 	if (IS_FCOE_FP(fp))
2405 		fp->disable_tpa = 1;
2406 }
2407 
2408 int bnx2x_load_cnic(struct bnx2x *bp)
2409 {
2410 	int i, rc, port = BP_PORT(bp);
2411 
2412 	DP(NETIF_MSG_IFUP, "Starting CNIC-related load\n");
2413 
2414 	mutex_init(&bp->cnic_mutex);
2415 
2416 	if (IS_PF(bp)) {
2417 		rc = bnx2x_alloc_mem_cnic(bp);
2418 		if (rc) {
2419 			BNX2X_ERR("Unable to allocate bp memory for cnic\n");
2420 			LOAD_ERROR_EXIT_CNIC(bp, load_error_cnic0);
2421 		}
2422 	}
2423 
2424 	rc = bnx2x_alloc_fp_mem_cnic(bp);
2425 	if (rc) {
2426 		BNX2X_ERR("Unable to allocate memory for cnic fps\n");
2427 		LOAD_ERROR_EXIT_CNIC(bp, load_error_cnic0);
2428 	}
2429 
2430 	/* Update the number of queues with the cnic queues */
2431 	rc = bnx2x_set_real_num_queues(bp, 1);
2432 	if (rc) {
2433 		BNX2X_ERR("Unable to set real_num_queues including cnic\n");
2434 		LOAD_ERROR_EXIT_CNIC(bp, load_error_cnic0);
2435 	}
2436 
2437 	/* Add all CNIC NAPI objects */
2438 	bnx2x_add_all_napi_cnic(bp);
2439 	DP(NETIF_MSG_IFUP, "cnic napi added\n");
2440 	bnx2x_napi_enable_cnic(bp);
2441 
2442 	rc = bnx2x_init_hw_func_cnic(bp);
2443 	if (rc)
2444 		LOAD_ERROR_EXIT_CNIC(bp, load_error_cnic1);
2445 
2446 	bnx2x_nic_init_cnic(bp);
2447 
2448 	if (IS_PF(bp)) {
2449 		/* Enable Timer scan */
2450 		REG_WR(bp, TM_REG_EN_LINEAR0_TIMER + port*4, 1);
2451 
2452 		/* setup cnic queues */
2453 		for_each_cnic_queue(bp, i) {
2454 			rc = bnx2x_setup_queue(bp, &bp->fp[i], 0);
2455 			if (rc) {
2456 				BNX2X_ERR("Queue setup failed\n");
2457 				LOAD_ERROR_EXIT(bp, load_error_cnic2);
2458 			}
2459 		}
2460 	}
2461 
2462 	/* Initialize Rx filter. */
2463 	bnx2x_set_rx_mode_inner(bp);
2464 
2465 	/* re-read iscsi info */
2466 	bnx2x_get_iscsi_info(bp);
2467 	bnx2x_setup_cnic_irq_info(bp);
2468 	bnx2x_setup_cnic_info(bp);
2469 	bp->cnic_loaded = true;
2470 	if (bp->state == BNX2X_STATE_OPEN)
2471 		bnx2x_cnic_notify(bp, CNIC_CTL_START_CMD);
2472 
2473 	DP(NETIF_MSG_IFUP, "Ending successfully CNIC-related load\n");
2474 
2475 	return 0;
2476 
2477 #ifndef BNX2X_STOP_ON_ERROR
2478 load_error_cnic2:
2479 	/* Disable Timer scan */
2480 	REG_WR(bp, TM_REG_EN_LINEAR0_TIMER + port*4, 0);
2481 
2482 load_error_cnic1:
2483 	bnx2x_napi_disable_cnic(bp);
2484 	/* Update the number of queues without the cnic queues */
2485 	if (bnx2x_set_real_num_queues(bp, 0))
2486 		BNX2X_ERR("Unable to set real_num_queues not including cnic\n");
2487 load_error_cnic0:
2488 	BNX2X_ERR("CNIC-related load failed\n");
2489 	bnx2x_free_fp_mem_cnic(bp);
2490 	bnx2x_free_mem_cnic(bp);
2491 	return rc;
2492 #endif /* ! BNX2X_STOP_ON_ERROR */
2493 }
2494 
2495 /* must be called with rtnl_lock */
2496 int bnx2x_nic_load(struct bnx2x *bp, int load_mode)
2497 {
2498 	int port = BP_PORT(bp);
2499 	int i, rc = 0, load_code = 0;
2500 
2501 	DP(NETIF_MSG_IFUP, "Starting NIC load\n");
2502 	DP(NETIF_MSG_IFUP,
2503 	   "CNIC is %s\n", CNIC_ENABLED(bp) ? "enabled" : "disabled");
2504 
2505 #ifdef BNX2X_STOP_ON_ERROR
2506 	if (unlikely(bp->panic)) {
2507 		BNX2X_ERR("Can't load NIC when there is panic\n");
2508 		return -EPERM;
2509 	}
2510 #endif
2511 
2512 	bp->state = BNX2X_STATE_OPENING_WAIT4_LOAD;
2513 
2514 	/* zero the structure w/o any lock, before SP handler is initialized */
2515 	memset(&bp->last_reported_link, 0, sizeof(bp->last_reported_link));
2516 	__set_bit(BNX2X_LINK_REPORT_LINK_DOWN,
2517 		&bp->last_reported_link.link_report_flags);
2518 
2519 	if (IS_PF(bp))
2520 		/* must be called before memory allocation and HW init */
2521 		bnx2x_ilt_set_info(bp);
2522 
2523 	/*
2524 	 * Zero the fastpath structures, preserving invariants such as the napi
2525 	 * struct (allocated only once), the fp index, max_cos and the bp pointer.
2526 	 * Also set fp->disable_tpa and txdata_ptr.
2527 	 */
2528 	DP(NETIF_MSG_IFUP, "num queues: %d\n", bp->num_queues);
2529 	for_each_queue(bp, i)
2530 		bnx2x_bz_fp(bp, i);
2531 	memset(bp->bnx2x_txq, 0, (BNX2X_MAX_RSS_COUNT(bp) * BNX2X_MULTI_TX_COS +
2532 				  bp->num_cnic_queues) *
2533 				  sizeof(struct bnx2x_fp_txdata));
2534 
2535 	bp->fcoe_init = false;
2536 
2537 	/* Set the receive queues buffer size */
2538 	bnx2x_set_rx_buf_size(bp);
2539 
2540 	if (IS_PF(bp)) {
2541 		rc = bnx2x_alloc_mem(bp);
2542 		if (rc) {
2543 			BNX2X_ERR("Unable to allocate bp memory\n");
2544 			return rc;
2545 		}
2546 	}
2547 
2548 	/* Needs to be done after alloc mem, since it's self-adjusting to the
2549 	 * amount of memory available for RSS queues.
2550 	 */
2551 	rc = bnx2x_alloc_fp_mem(bp);
2552 	if (rc) {
2553 		BNX2X_ERR("Unable to allocate memory for fps\n");
2554 		LOAD_ERROR_EXIT(bp, load_error0);
2555 	}
2556 
2557 	/* Allocate memory for FW statistics */
2558 	if (bnx2x_alloc_fw_stats_mem(bp))
2559 		LOAD_ERROR_EXIT(bp, load_error0);
2560 
2561 	/* request pf to initialize status blocks */
2562 	if (IS_VF(bp)) {
2563 		rc = bnx2x_vfpf_init(bp);
2564 		if (rc)
2565 			LOAD_ERROR_EXIT(bp, load_error0);
2566 	}
2567 
2568 	/* Since bnx2x_alloc_mem() may possibly update
2569 	 * bp->num_queues, bnx2x_set_real_num_queues() should always
2570 	 * come after it. At this stage cnic queues are not counted.
2571 	 */
2572 	rc = bnx2x_set_real_num_queues(bp, 0);
2573 	if (rc) {
2574 		BNX2X_ERR("Unable to set real_num_queues\n");
2575 		LOAD_ERROR_EXIT(bp, load_error0);
2576 	}
2577 
2578 	/* Configure multi-CoS mappings in the kernel.
2579 	 * This configuration may be overridden by a multi-class queue
2580 	 * discipline or by a DCBX negotiation result.
2581 	 */
2582 	bnx2x_setup_tc(bp->dev, bp->max_cos);
2583 
2584 	/* Add all NAPI objects */
2585 	bnx2x_add_all_napi(bp);
2586 	DP(NETIF_MSG_IFUP, "napi added\n");
2587 	bnx2x_napi_enable(bp);
2588 
2589 	if (IS_PF(bp)) {
2590 		/* set pf load just before approaching the MCP */
2591 		bnx2x_set_pf_load(bp);
2592 
2593 		/* if mcp exists send load request and analyze response */
2594 		if (!BP_NOMCP(bp)) {
2595 			/* attempt to load pf */
2596 			rc = bnx2x_nic_load_request(bp, &load_code);
2597 			if (rc)
2598 				LOAD_ERROR_EXIT(bp, load_error1);
2599 
2600 			/* what did mcp say? */
2601 			rc = bnx2x_nic_load_analyze_req(bp, load_code);
2602 			if (rc) {
2603 				bnx2x_fw_command(bp, DRV_MSG_CODE_LOAD_DONE, 0);
2604 				LOAD_ERROR_EXIT(bp, load_error2);
2605 			}
2606 		} else {
2607 			load_code = bnx2x_nic_load_no_mcp(bp, port);
2608 		}
2609 
2610 		/* mark pmf if applicable */
2611 		bnx2x_nic_load_pmf(bp, load_code);
2612 
2613 		/* Init Function state controlling object */
2614 		bnx2x__init_func_obj(bp);
2615 
2616 		/* Initialize HW */
2617 		rc = bnx2x_init_hw(bp, load_code);
2618 		if (rc) {
2619 			BNX2X_ERR("HW init failed, aborting\n");
2620 			bnx2x_fw_command(bp, DRV_MSG_CODE_LOAD_DONE, 0);
2621 			LOAD_ERROR_EXIT(bp, load_error2);
2622 		}
2623 	}
2624 
2625 	bnx2x_pre_irq_nic_init(bp);
2626 
2627 	/* Connect to IRQs */
2628 	rc = bnx2x_setup_irqs(bp);
2629 	if (rc) {
2630 		BNX2X_ERR("setup irqs failed\n");
2631 		if (IS_PF(bp))
2632 			bnx2x_fw_command(bp, DRV_MSG_CODE_LOAD_DONE, 0);
2633 		LOAD_ERROR_EXIT(bp, load_error2);
2634 	}
2635 
2636 	/* Init per-function objects */
2637 	if (IS_PF(bp)) {
2638 		/* Setup NIC internals and enable interrupts */
2639 		bnx2x_post_irq_nic_init(bp, load_code);
2640 
2641 		bnx2x_init_bp_objs(bp);
2642 		bnx2x_iov_nic_init(bp);
2643 
2644 		/* Set AFEX default VLAN tag to an invalid value */
2645 		bp->afex_def_vlan_tag = -1;
2646 		bnx2x_nic_load_afex_dcc(bp, load_code);
2647 		bp->state = BNX2X_STATE_OPENING_WAIT4_PORT;
2648 		rc = bnx2x_func_start(bp);
2649 		if (rc) {
2650 			BNX2X_ERR("Function start failed!\n");
2651 			bnx2x_fw_command(bp, DRV_MSG_CODE_LOAD_DONE, 0);
2652 
2653 			LOAD_ERROR_EXIT(bp, load_error3);
2654 		}
2655 
2656 		/* Send LOAD_DONE command to MCP */
2657 		if (!BP_NOMCP(bp)) {
2658 			load_code = bnx2x_fw_command(bp,
2659 						     DRV_MSG_CODE_LOAD_DONE, 0);
2660 			if (!load_code) {
2661 				BNX2X_ERR("MCP response failure, aborting\n");
2662 				rc = -EBUSY;
2663 				LOAD_ERROR_EXIT(bp, load_error3);
2664 			}
2665 		}
2666 
2667 		/* initialize FW coalescing state machines in RAM */
2668 		bnx2x_update_coalesce(bp);
2669 	}
2670 
2671 	/* setup the leading queue */
2672 	rc = bnx2x_setup_leading(bp);
2673 	if (rc) {
2674 		BNX2X_ERR("Setup leading failed!\n");
2675 		LOAD_ERROR_EXIT(bp, load_error3);
2676 	}
2677 
2678 	/* set up the rest of the queues */
2679 	for_each_nondefault_eth_queue(bp, i) {
2680 		if (IS_PF(bp))
2681 			rc = bnx2x_setup_queue(bp, &bp->fp[i], false);
2682 		else /* VF */
2683 			rc = bnx2x_vfpf_setup_q(bp, &bp->fp[i], false);
2684 		if (rc) {
2685 			BNX2X_ERR("Queue %d setup failed\n", i);
2686 			LOAD_ERROR_EXIT(bp, load_error3);
2687 		}
2688 	}
2689 
2690 	/* setup rss */
2691 	rc = bnx2x_init_rss(bp);
2692 	if (rc) {
2693 		BNX2X_ERR("PF RSS init failed\n");
2694 		LOAD_ERROR_EXIT(bp, load_error3);
2695 	}
2696 
2697 	/* Now that the clients are configured we are ready to work */
2698 	bp->state = BNX2X_STATE_OPEN;
2699 
2700 	/* Configure a ucast MAC */
2701 	if (IS_PF(bp))
2702 		rc = bnx2x_set_eth_mac(bp, true);
2703 	else /* vf */
2704 		rc = bnx2x_vfpf_config_mac(bp, bp->dev->dev_addr, bp->fp->index,
2705 					   true);
2706 	if (rc) {
2707 		BNX2X_ERR("Setting Ethernet MAC failed\n");
2708 		LOAD_ERROR_EXIT(bp, load_error3);
2709 	}
2710 
2711 	if (IS_PF(bp) && bp->pending_max) {
2712 		bnx2x_update_max_mf_config(bp, bp->pending_max);
2713 		bp->pending_max = 0;
2714 	}
2715 
2716 	if (bp->port.pmf) {
2717 		rc = bnx2x_initial_phy_init(bp, load_mode);
2718 		if (rc)
2719 			LOAD_ERROR_EXIT(bp, load_error3);
2720 	}
2721 	bp->link_params.feature_config_flags &= ~FEATURE_CONFIG_BOOT_FROM_SAN;
2722 
2723 	/* Start fast path */
2724 
2725 	/* Initialize Rx filter. */
2726 	bnx2x_set_rx_mode_inner(bp);
2727 
2728 	/* Start the Tx */
2729 	switch (load_mode) {
2730 	case LOAD_NORMAL:
2731 		/* Tx queues only need to be re-enabled */
2732 		netif_tx_wake_all_queues(bp->dev);
2733 		break;
2734 
2735 	case LOAD_OPEN:
2736 		netif_tx_start_all_queues(bp->dev);
2737 		smp_mb__after_clear_bit();
2738 		break;
2739 
2740 	case LOAD_DIAG:
2741 	case LOAD_LOOPBACK_EXT:
2742 		bp->state = BNX2X_STATE_DIAG;
2743 		break;
2744 
2745 	default:
2746 		break;
2747 	}
2748 
2749 	if (bp->port.pmf)
2750 		bnx2x_update_drv_flags(bp, 1 << DRV_FLAGS_PORT_MASK, 0);
2751 	else
2752 		bnx2x__link_status_update(bp);
2753 
2754 	/* start the timer */
2755 	mod_timer(&bp->timer, jiffies + bp->current_interval);
2756 
2757 	if (CNIC_ENABLED(bp))
2758 		bnx2x_load_cnic(bp);
2759 
2760 	if (IS_PF(bp) && SHMEM2_HAS(bp, drv_capabilities_flag)) {
2761 		/* mark that the driver is loaded in shmem2 */
2762 		u32 val;
2763 		val = SHMEM2_RD(bp, drv_capabilities_flag[BP_FW_MB_IDX(bp)]);
2764 		SHMEM2_WR(bp, drv_capabilities_flag[BP_FW_MB_IDX(bp)],
2765 			  val | DRV_FLAGS_CAPABILITIES_LOADED_SUPPORTED |
2766 			  DRV_FLAGS_CAPABILITIES_LOADED_L2);
2767 	}
2768 
2769 	/* Wait for all pending SP commands to complete */
2770 	if (IS_PF(bp) && !bnx2x_wait_sp_comp(bp, ~0x0UL)) {
2771 		BNX2X_ERR("Timeout waiting for SP elements to complete\n");
2772 		bnx2x_nic_unload(bp, UNLOAD_CLOSE, false);
2773 		return -EBUSY;
2774 	}
2775 
2776 	/* If PMF - send ADMIN DCBX msg to MFW to initiate DCBX FSM */
2777 	if (bp->port.pmf && (bp->state != BNX2X_STATE_DIAG))
2778 		bnx2x_dcbx_init(bp, false);
2779 
2780 	DP(NETIF_MSG_IFUP, "Ending successfully NIC load\n");
2781 
2782 	return 0;
2783 
2784 #ifndef BNX2X_STOP_ON_ERROR
2785 load_error3:
2786 	if (IS_PF(bp)) {
2787 		bnx2x_int_disable_sync(bp, 1);
2788 
2789 		/* Clean queueable objects */
2790 		bnx2x_squeeze_objects(bp);
2791 	}
2792 
2793 	/* Free SKBs, SGEs, TPA pool and driver internals */
2794 	bnx2x_free_skbs(bp);
2795 	for_each_rx_queue(bp, i)
2796 		bnx2x_free_rx_sge_range(bp, bp->fp + i, NUM_RX_SGE);
2797 
2798 	/* Release IRQs */
2799 	bnx2x_free_irq(bp);
2800 load_error2:
2801 	if (IS_PF(bp) && !BP_NOMCP(bp)) {
2802 		bnx2x_fw_command(bp, DRV_MSG_CODE_UNLOAD_REQ_WOL_MCP, 0);
2803 		bnx2x_fw_command(bp, DRV_MSG_CODE_UNLOAD_DONE, 0);
2804 	}
2805 
2806 	bp->port.pmf = 0;
2807 load_error1:
2808 	bnx2x_napi_disable(bp);
2809 	bnx2x_del_all_napi(bp);
2810 
2811 	/* clear pf_load status, as it was already set */
2812 	if (IS_PF(bp))
2813 		bnx2x_clear_pf_load(bp);
2814 load_error0:
2815 	bnx2x_free_fw_stats_mem(bp);
2816 	bnx2x_free_fp_mem(bp);
2817 	bnx2x_free_mem(bp);
2818 
2819 	return rc;
2820 #endif /* ! BNX2X_STOP_ON_ERROR */
2821 }
2822 
2823 int bnx2x_drain_tx_queues(struct bnx2x *bp)
2824 {
2825 	u8 rc = 0, cos, i;
2826 
2827 	/* Wait until tx fastpath tasks complete */
2828 	for_each_tx_queue(bp, i) {
2829 		struct bnx2x_fastpath *fp = &bp->fp[i];
2830 
2831 		for_each_cos_in_tx_queue(fp, cos)
2832 			rc = bnx2x_clean_tx_queue(bp, fp->txdata_ptr[cos]);
2833 		if (rc)
2834 			return rc;
2835 	}
2836 	return 0;
2837 }
2838 
2839 /* must be called with rtnl_lock */
2840 int bnx2x_nic_unload(struct bnx2x *bp, int unload_mode, bool keep_link)
2841 {
2842 	int i;
2843 	bool global = false;
2844 
2845 	DP(NETIF_MSG_IFUP, "Starting NIC unload\n");
2846 
2847 	/* mark that the driver is unloaded in shmem2 */
2848 	if (IS_PF(bp) && SHMEM2_HAS(bp, drv_capabilities_flag)) {
2849 		u32 val;
2850 		val = SHMEM2_RD(bp, drv_capabilities_flag[BP_FW_MB_IDX(bp)]);
2851 		SHMEM2_WR(bp, drv_capabilities_flag[BP_FW_MB_IDX(bp)],
2852 			  val & ~DRV_FLAGS_CAPABILITIES_LOADED_L2);
2853 	}
2854 
2855 	if (IS_PF(bp) && bp->recovery_state != BNX2X_RECOVERY_DONE &&
2856 	    (bp->state == BNX2X_STATE_CLOSED ||
2857 	     bp->state == BNX2X_STATE_ERROR)) {
2858 		/* We can get here if the driver has been unloaded
2859 		 * during parity error recovery and is either waiting for a
2860 		 * leader to complete or for other functions to unload and
2861 		 * then ifdown has been issued. In this case we want to
2862 		 * unload and let other functions complete a recovery
2863 		 * process.
2864 		 */
2865 		bp->recovery_state = BNX2X_RECOVERY_DONE;
2866 		bp->is_leader = 0;
2867 		bnx2x_release_leader_lock(bp);
2868 		smp_mb();
2869 
2870 		DP(NETIF_MSG_IFDOWN, "Releasing a leadership...\n");
2871 		BNX2X_ERR("Can't unload in closed or error state\n");
2872 		return -EINVAL;
2873 	}
2874 
2875 	/* Nothing to do during unload if the previous bnx2x_nic_load()
2876 	 * did not complete successfully - all resources are released.
2877 	 *
2878 	 * We can get here only after an unsuccessful ndo_* callback, during
2879 	 * which the dev->IFF_UP flag is still on.
2880 	 */
2881 	if (bp->state == BNX2X_STATE_CLOSED || bp->state == BNX2X_STATE_ERROR)
2882 		return 0;
2883 
2884 	/* It's important to set bp->state to a value different from
2885 	 * BNX2X_STATE_OPEN and only then stop the Tx. Otherwise bnx2x_tx_int()
2886 	 * may restart the Tx from the NAPI context (see bnx2x_tx_int()).
2887 	 */
2888 	bp->state = BNX2X_STATE_CLOSING_WAIT4_HALT;
2889 	smp_mb();
2890 
2891 	/* indicate to VFs that the PF is going down */
2892 	bnx2x_iov_channel_down(bp);
2893 
2894 	if (CNIC_LOADED(bp))
2895 		bnx2x_cnic_notify(bp, CNIC_CTL_STOP_CMD);
2896 
2897 	/* Stop Tx */
2898 	bnx2x_tx_disable(bp);
2899 	netdev_reset_tc(bp->dev);
2900 
2901 	bp->rx_mode = BNX2X_RX_MODE_NONE;
2902 
2903 	del_timer_sync(&bp->timer);
2904 
2905 	if (IS_PF(bp)) {
2906 		/* Set ALWAYS_ALIVE bit in shmem */
2907 		bp->fw_drv_pulse_wr_seq |= DRV_PULSE_ALWAYS_ALIVE;
2908 		bnx2x_drv_pulse(bp);
2909 		bnx2x_stats_handle(bp, STATS_EVENT_STOP);
2910 		bnx2x_save_statistics(bp);
2911 	}
2912 
2913 	/* wait till consumers catch up with producers in all queues */
2914 	bnx2x_drain_tx_queues(bp);
2915 
2916 	/* If VF, indicate to the PF that this function is going down (the PF
2917 	 * will delete the sp elements and clear the initializations).
2918 	 */
2919 	if (IS_VF(bp))
2920 		bnx2x_vfpf_close_vf(bp);
2921 	else if (unload_mode != UNLOAD_RECOVERY)
2922 		/* if this is a normal/close unload, need to clean up the chip */
2923 		bnx2x_chip_cleanup(bp, unload_mode, keep_link);
2924 	else {
2925 		/* Send the UNLOAD_REQUEST to the MCP */
2926 		bnx2x_send_unload_req(bp, unload_mode);
2927 
2928 		/* Prevent transactions to the host from the functions on the
2929 		 * engine that doesn't reset global blocks in case of a global
2930 		 * attention, once global blocks are reset and gates are opened
2931 		 * (the engine whose leader will perform the recovery
2932 		 * last).
2933 		 */
2934 		if (!CHIP_IS_E1x(bp))
2935 			bnx2x_pf_disable(bp);
2936 
2937 		/* Disable HW interrupts, NAPI */
2938 		bnx2x_netif_stop(bp, 1);
2939 		/* Delete all NAPI objects */
2940 		bnx2x_del_all_napi(bp);
2941 		if (CNIC_LOADED(bp))
2942 			bnx2x_del_all_napi_cnic(bp);
2943 		/* Release IRQs */
2944 		bnx2x_free_irq(bp);
2945 
2946 		/* Report UNLOAD_DONE to MCP */
2947 		bnx2x_send_unload_done(bp, false);
2948 	}
2949 
2950 	/*
2951 	 * At this stage no more interrupts will arrive so we may safely clean
2952 	 * the queueable objects here in case they failed to get cleaned so far.
2953 	 */
2954 	if (IS_PF(bp))
2955 		bnx2x_squeeze_objects(bp);
2956 
2957 	/* There should be no more pending SP commands at this stage */
2958 	bp->sp_state = 0;
2959 
2960 	bp->port.pmf = 0;
2961 
2962 	/* clear pending work in rtnl task */
2963 	bp->sp_rtnl_state = 0;
2964 	smp_mb();
2965 
2966 	/* Free SKBs, SGEs, TPA pool and driver internals */
2967 	bnx2x_free_skbs(bp);
2968 	if (CNIC_LOADED(bp))
2969 		bnx2x_free_skbs_cnic(bp);
2970 	for_each_rx_queue(bp, i)
2971 		bnx2x_free_rx_sge_range(bp, bp->fp + i, NUM_RX_SGE);
2972 
2973 	bnx2x_free_fp_mem(bp);
2974 	if (CNIC_LOADED(bp))
2975 		bnx2x_free_fp_mem_cnic(bp);
2976 
2977 	if (IS_PF(bp)) {
2978 		if (CNIC_LOADED(bp))
2979 			bnx2x_free_mem_cnic(bp);
2980 	}
2981 	bnx2x_free_mem(bp);
2982 
2983 	bp->state = BNX2X_STATE_CLOSED;
2984 	bp->cnic_loaded = false;
2985 
2986 	/* Check if there are pending parity attentions. If there are - set
2987 	 * RECOVERY_IN_PROGRESS.
2988 	 */
2989 	if (IS_PF(bp) && bnx2x_chk_parity_attn(bp, &global, false)) {
2990 		bnx2x_set_reset_in_progress(bp);
2991 
2992 		/* Set RESET_IS_GLOBAL if needed */
2993 		if (global)
2994 			bnx2x_set_reset_global(bp);
2995 	}
2996 
2997 	/* The last driver must disable the "close the gate" functionality if
2998 	 * there is no parity attention or "process kill" pending.
2999 	 */
3000 	if (IS_PF(bp) &&
3001 	    !bnx2x_clear_pf_load(bp) &&
3002 	    bnx2x_reset_is_done(bp, BP_PATH(bp)))
3003 		bnx2x_disable_close_the_gate(bp);
3004 
3005 	DP(NETIF_MSG_IFUP, "Ending NIC unload\n");
3006 
3007 	return 0;
3008 }
3009 
3010 int bnx2x_set_power_state(struct bnx2x *bp, pci_power_t state)
3011 {
3012 	u16 pmcsr;
3013 
3014 	/* If there is no power capability, silently succeed */
3015 	if (!bp->pdev->pm_cap) {
3016 		BNX2X_DEV_INFO("No power capability. Breaking.\n");
3017 		return 0;
3018 	}
3019 
3020 	pci_read_config_word(bp->pdev, bp->pdev->pm_cap + PCI_PM_CTRL, &pmcsr);
3021 
3022 	switch (state) {
3023 	case PCI_D0:
3024 		pci_write_config_word(bp->pdev, bp->pdev->pm_cap + PCI_PM_CTRL,
3025 				      ((pmcsr & ~PCI_PM_CTRL_STATE_MASK) |
3026 				       PCI_PM_CTRL_PME_STATUS));
3027 
3028 		if (pmcsr & PCI_PM_CTRL_STATE_MASK)
3029 			/* delay required during transition out of D3hot */
3030 			msleep(20);
3031 		break;
3032 
3033 	case PCI_D3hot:
3034 		/* If there are other clients above, don't
3035 		 * shut down the power */
3036 		if (atomic_read(&bp->pdev->enable_cnt) != 1)
3037 			return 0;
3038 		/* Don't shut down the power for emulation and FPGA */
3039 		if (CHIP_REV_IS_SLOW(bp))
3040 			return 0;
3041 
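		/* PowerState field value 3 in the PM control/status
		 * register selects D3hot.
		 */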
3042 		pmcsr &= ~PCI_PM_CTRL_STATE_MASK;
3043 		pmcsr |= 3;
3044 
3045 		if (bp->wol)
3046 			pmcsr |= PCI_PM_CTRL_PME_ENABLE;
3047 
3048 		pci_write_config_word(bp->pdev, bp->pdev->pm_cap + PCI_PM_CTRL,
3049 				      pmcsr);
3050 
3051 		/* No more memory access after this point until
3052 		 * device is brought back to D0.
3053 		 */
3054 		break;
3055 
3056 	default:
3057 		dev_err(&bp->pdev->dev, "Can't support state = %d\n", state);
3058 		return -EINVAL;
3059 	}
3060 	return 0;
3061 }
3062 
3063 /*
3064  * net_device service functions
3065  */
3066 int bnx2x_poll(struct napi_struct *napi, int budget)
3067 {
3068 	int work_done = 0;
3069 	u8 cos;
3070 	struct bnx2x_fastpath *fp = container_of(napi, struct bnx2x_fastpath,
3071 						 napi);
3072 	struct bnx2x *bp = fp->bp;
3073 
3074 	while (1) {
3075 #ifdef BNX2X_STOP_ON_ERROR
3076 		if (unlikely(bp->panic)) {
3077 			napi_complete(napi);
3078 			return 0;
3079 		}
3080 #endif
3081 		if (!bnx2x_fp_lock_napi(fp))
3082 			return work_done;
3083 
3084 		for_each_cos_in_tx_queue(fp, cos)
3085 			if (bnx2x_tx_queue_has_work(fp->txdata_ptr[cos]))
3086 				bnx2x_tx_int(bp, fp->txdata_ptr[cos]);
3087 
3088 		if (bnx2x_has_rx_work(fp)) {
3089 			work_done += bnx2x_rx_int(fp, budget - work_done);
3090 
3091 			/* must not complete if we consumed full budget */
3092 			if (work_done >= budget) {
3093 				bnx2x_fp_unlock_napi(fp);
3094 				break;
3095 			}
3096 		}
3097 
3098 		/* Fall out from the NAPI loop if needed */
3099 		if (!bnx2x_fp_unlock_napi(fp) &&
3100 		    !(bnx2x_has_rx_work(fp) || bnx2x_has_tx_work(fp))) {
3101 
3102 			/* No need to update SB for FCoE L2 ring as long as
3103 			 * it's connected to the default SB and the SB
3104 			 * has been updated when NAPI was scheduled.
3105 			 */
3106 			if (IS_FCOE_FP(fp)) {
3107 				napi_complete(napi);
3108 				break;
3109 			}
3110 			bnx2x_update_fpsb_idx(fp);
3111 			/* bnx2x_has_rx_work() reads the status block,
3112 			 * thus we need to ensure that status block indices
3113 			 * have been actually read (bnx2x_update_fpsb_idx)
3114 			 * prior to this check (bnx2x_has_rx_work) so that
3115 			 * we won't write the "newer" value of the status block
3116 			 * to IGU (if there was a DMA right after
3117 			 * bnx2x_has_rx_work and if there is no rmb, the memory
3118 			 * reading (bnx2x_update_fpsb_idx) may be postponed
3119 			 * to right before bnx2x_ack_sb). In this case there
3120 			 * will never be another interrupt until there is
3121 			 * another update of the status block, while there
3122 			 * is still unhandled work.
3123 			 */
3124 			rmb();
3125 
3126 			if (!(bnx2x_has_rx_work(fp) || bnx2x_has_tx_work(fp))) {
3127 				napi_complete(napi);
3128 				/* Re-enable interrupts */
3129 				DP(NETIF_MSG_RX_STATUS,
3130 				   "Update index to %d\n", fp->fp_hc_idx);
3131 				bnx2x_ack_sb(bp, fp->igu_sb_id, USTORM_ID,
3132 					     le16_to_cpu(fp->fp_hc_idx),
3133 					     IGU_INT_ENABLE, 1);
3134 				break;
3135 			}
3136 		}
3137 	}
3138 
3139 	return work_done;
3140 }
3141 
3142 #ifdef CONFIG_NET_RX_BUSY_POLL
3143 /* must be called with local_bh_disable()d */
3144 int bnx2x_low_latency_recv(struct napi_struct *napi)
3145 {
3146 	struct bnx2x_fastpath *fp = container_of(napi, struct bnx2x_fastpath,
3147 						 napi);
3148 	struct bnx2x *bp = fp->bp;
3149 	int found = 0;
3150 
3151 	if ((bp->state == BNX2X_STATE_CLOSED) ||
3152 	    (bp->state == BNX2X_STATE_ERROR) ||
3153 	    (bp->flags & (TPA_ENABLE_FLAG | GRO_ENABLE_FLAG)))
3154 		return LL_FLUSH_FAILED;
3155 
3156 	if (!bnx2x_fp_lock_poll(fp))
3157 		return LL_FLUSH_BUSY;
3158 
3159 	if (bnx2x_has_rx_work(fp))
3160 		found = bnx2x_rx_int(fp, 4);
3161 
3162 	bnx2x_fp_unlock_poll(fp);
3163 
3164 	return found;
3165 }
3166 #endif
3167 
3168 /* We split the first BD into a headers BD and a data BD
3169  * to ease the pain of our fellow microcode engineers;
3170  * we use one mapping for both BDs.
3171  */
3172 static u16 bnx2x_tx_split(struct bnx2x *bp,
3173 			  struct bnx2x_fp_txdata *txdata,
3174 			  struct sw_tx_bd *tx_buf,
3175 			  struct eth_tx_start_bd **tx_bd, u16 hlen,
3176 			  u16 bd_prod)
3177 {
3178 	struct eth_tx_start_bd *h_tx_bd = *tx_bd;
3179 	struct eth_tx_bd *d_tx_bd;
3180 	dma_addr_t mapping;
3181 	int old_len = le16_to_cpu(h_tx_bd->nbytes);
3182 
3183 	/* first fix first BD */
3184 	h_tx_bd->nbytes = cpu_to_le16(hlen);
3185 
3186 	DP(NETIF_MSG_TX_QUEUED,	"TSO split header size is %d (%x:%x)\n",
3187 	   h_tx_bd->nbytes, h_tx_bd->addr_hi, h_tx_bd->addr_lo);
3188 
3189 	/* now get a new data BD
3190 	 * (after the pbd) and fill it */
3191 	bd_prod = TX_BD(NEXT_TX_IDX(bd_prod));
3192 	d_tx_bd = &txdata->tx_desc_ring[bd_prod].reg_bd;
3193 
3194 	mapping = HILO_U64(le32_to_cpu(h_tx_bd->addr_hi),
3195 			   le32_to_cpu(h_tx_bd->addr_lo)) + hlen;
3196 
3197 	d_tx_bd->addr_hi = cpu_to_le32(U64_HI(mapping));
3198 	d_tx_bd->addr_lo = cpu_to_le32(U64_LO(mapping));
3199 	d_tx_bd->nbytes = cpu_to_le16(old_len - hlen);
3200 
3201 	/* this marks the BD as one that has no individual mapping */
3202 	tx_buf->flags |= BNX2X_TSO_SPLIT_BD;
3203 
3204 	DP(NETIF_MSG_TX_QUEUED,
3205 	   "TSO split data size is %d (%x:%x)\n",
3206 	   d_tx_bd->nbytes, d_tx_bd->addr_hi, d_tx_bd->addr_lo);
3207 
3208 	/* update tx_bd */
3209 	*tx_bd = (struct eth_tx_start_bd *)d_tx_bd;
3210 
3211 	return bd_prod;
3212 }
3213 
3214 #define bswab32(b32) ((__force __le32) swab32((__force __u32) (b32)))
3215 #define bswab16(b16) ((__force __le16) swab16((__force __u16) (b16)))
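/* Adjust a checksum by the partial sum of 'fix' bytes adjacent to t_header:
 * a positive fix folds out the bytes just before t_header, a negative fix
 * folds in the bytes starting at t_header. Used to work around the HW
 * checksum quirk noted in bnx2x_set_pbd_csum().
 */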
3216 static __le16 bnx2x_csum_fix(unsigned char *t_header, u16 csum, s8 fix)
3217 {
3218 	__sum16 tsum = (__force __sum16) csum;
3219 
3220 	if (fix > 0)
3221 		tsum = ~csum_fold(csum_sub((__force __wsum) csum,
3222 				  csum_partial(t_header - fix, fix, 0)));
3223 
3224 	else if (fix < 0)
3225 		tsum = ~csum_fold(csum_add((__force __wsum) csum,
3226 				  csum_partial(t_header, -fix, 0)));
3227 
3228 	return bswab16(tsum);
3229 }
3230 
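/* Classify an skb for the Tx path: returns XMIT_PLAIN when no offload is
 * requested, otherwise a bitmask of XMIT_* flags describing the required
 * checksum offload (IPv4/IPv6, TCP vs. UDP, inner headers for encapsulated
 * packets) and the GSO type.
 */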
3231 static u32 bnx2x_xmit_type(struct bnx2x *bp, struct sk_buff *skb)
3232 {
3233 	u32 rc;
3234 	__u8 prot = 0;
3235 	__be16 protocol;
3236 
3237 	if (skb->ip_summed != CHECKSUM_PARTIAL)
3238 		return XMIT_PLAIN;
3239 
3240 	protocol = vlan_get_protocol(skb);
3241 	if (protocol == htons(ETH_P_IPV6)) {
3242 		rc = XMIT_CSUM_V6;
3243 		prot = ipv6_hdr(skb)->nexthdr;
3244 	} else {
3245 		rc = XMIT_CSUM_V4;
3246 		prot = ip_hdr(skb)->protocol;
3247 	}
3248 
3249 	if (!CHIP_IS_E1x(bp) && skb->encapsulation) {
3250 		if (inner_ip_hdr(skb)->version == 6) {
3251 			rc |= XMIT_CSUM_ENC_V6;
3252 			if (inner_ipv6_hdr(skb)->nexthdr == IPPROTO_TCP)
3253 				rc |= XMIT_CSUM_TCP;
3254 		} else {
3255 			rc |= XMIT_CSUM_ENC_V4;
3256 			if (inner_ip_hdr(skb)->protocol == IPPROTO_TCP)
3257 				rc |= XMIT_CSUM_TCP;
3258 		}
3259 	}
3260 	if (prot == IPPROTO_TCP)
3261 		rc |= XMIT_CSUM_TCP;
3262 
3263 	if (skb_is_gso(skb)) {
3264 		if (skb_is_gso_v6(skb)) {
3265 			rc |= (XMIT_GSO_V6 | XMIT_CSUM_TCP);
3266 			if (rc & XMIT_CSUM_ENC)
3267 				rc |= XMIT_GSO_ENC_V6;
3268 		} else {
3269 			rc |= (XMIT_GSO_V4 | XMIT_CSUM_TCP);
3270 			if (rc & XMIT_CSUM_ENC)
3271 				rc |= XMIT_GSO_ENC_V4;
3272 		}
3273 	}
3274 
3275 	return rc;
3276 }
3277 
3278 #if (MAX_SKB_FRAGS >= MAX_FETCH_BD - 3)
3279 /* Check if the packet requires linearization (packet is too fragmented).
3280  * No need to check fragmentation if page size > 8K (there will be no
3281  * violation of FW restrictions). */
3282 static int bnx2x_pkt_req_lin(struct bnx2x *bp, struct sk_buff *skb,
3283 			     u32 xmit_type)
3284 {
3285 	int to_copy = 0;
3286 	int hlen = 0;
3287 	int first_bd_sz = 0;
3288 
3289 	/* 3 = 1 (for linear data BD) + 2 (for PBD and last BD) */
3290 	if (skb_shinfo(skb)->nr_frags >= (MAX_FETCH_BD - 3)) {
3291 
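		/* The windowed check below verifies that every wnd_size
		 * consecutive BDs (linear part plus frags) carry at least one
		 * full MSS of payload; if any window falls short, the packet
		 * has to be linearized.
		 */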
3292 		if (xmit_type & XMIT_GSO) {
3293 			unsigned short lso_mss = skb_shinfo(skb)->gso_size;
3294 			/* Check if LSO packet needs to be copied:
3295 			   3 = 1 (for headers BD) + 2 (for PBD and last BD) */
3296 			int wnd_size = MAX_FETCH_BD - 3;
3297 			/* Number of windows to check */
3298 			int num_wnds = skb_shinfo(skb)->nr_frags - wnd_size;
3299 			int wnd_idx = 0;
3300 			int frag_idx = 0;
3301 			u32 wnd_sum = 0;
3302 
3303 			/* Headers length */
3304 			hlen = (int)(skb_transport_header(skb) - skb->data) +
3305 				tcp_hdrlen(skb);
3306 
3307 			/* Amount of data (w/o headers) on linear part of SKB */
3308 			first_bd_sz = skb_headlen(skb) - hlen;
3309 
3310 			wnd_sum  = first_bd_sz;
3311 
3312 			/* Calculate the first sum - it's special */
3313 			for (frag_idx = 0; frag_idx < wnd_size - 1; frag_idx++)
3314 				wnd_sum +=
3315 					skb_frag_size(&skb_shinfo(skb)->frags[frag_idx]);
3316 
3317 			/* If there was data on the linear part - check it */
3318 			if (first_bd_sz > 0) {
3319 				if (unlikely(wnd_sum < lso_mss)) {
3320 					to_copy = 1;
3321 					goto exit_lbl;
3322 				}
3323 
3324 				wnd_sum -= first_bd_sz;
3325 			}
3326 
3327 			/* Others are easier: run through the frag list and
3328 			   check all windows */
3329 			for (wnd_idx = 0; wnd_idx <= num_wnds; wnd_idx++) {
3330 				wnd_sum +=
3331 			  skb_frag_size(&skb_shinfo(skb)->frags[wnd_idx + wnd_size - 1]);
3332 
3333 				if (unlikely(wnd_sum < lso_mss)) {
3334 					to_copy = 1;
3335 					break;
3336 				}
3337 				wnd_sum -=
3338 					skb_frag_size(&skb_shinfo(skb)->frags[wnd_idx]);
3339 			}
3340 		} else {
3341 			/* in the non-LSO case a too-fragmented packet should
3342 			 * always be linearized */
3343 			to_copy = 1;
3344 		}
3345 	}
3346 
3347 exit_lbl:
3348 	if (unlikely(to_copy))
3349 		DP(NETIF_MSG_TX_QUEUED,
3350 		   "Linearization IS REQUIRED for %s packet. num_frags %d  hlen %d  first_bd_sz %d\n",
3351 		   (xmit_type & XMIT_GSO) ? "LSO" : "non-LSO",
3352 		   skb_shinfo(skb)->nr_frags, hlen, first_bd_sz);
3353 
3354 	return to_copy;
3355 }
3356 #endif
3357 
3358 static void bnx2x_set_pbd_gso_e2(struct sk_buff *skb, u32 *parsing_data,
3359 				 u32 xmit_type)
3360 {
3361 	struct ipv6hdr *ipv6;
3362 
3363 	*parsing_data |= (skb_shinfo(skb)->gso_size <<
3364 			      ETH_TX_PARSE_BD_E2_LSO_MSS_SHIFT) &
3365 			      ETH_TX_PARSE_BD_E2_LSO_MSS;
3366 
3367 	if (xmit_type & XMIT_GSO_ENC_V6)
3368 		ipv6 = inner_ipv6_hdr(skb);
3369 	else if (xmit_type & XMIT_GSO_V6)
3370 		ipv6 = ipv6_hdr(skb);
3371 	else
3372 		ipv6 = NULL;
3373 
3374 	if (ipv6 && ipv6->nexthdr == NEXTHDR_IPV6)
3375 		*parsing_data |= ETH_TX_PARSE_BD_E2_IPV6_WITH_EXT_HDR;
3376 }
3377 
3378 /**
3379  * bnx2x_set_pbd_gso - update PBD in GSO case.
3380  *
3381  * @skb:	packet skb
3382  * @pbd:	parse BD
3383  * @xmit_type:	xmit flags
3384  */
3385 static void bnx2x_set_pbd_gso(struct sk_buff *skb,
3386 			      struct eth_tx_parse_bd_e1x *pbd,
3387 			      struct eth_tx_start_bd *tx_start_bd,
3388 			      u32 xmit_type)
3389 {
3390 	pbd->lso_mss = cpu_to_le16(skb_shinfo(skb)->gso_size);
3391 	pbd->tcp_send_seq = bswab32(tcp_hdr(skb)->seq);
3392 	pbd->tcp_flags = pbd_tcp_flags(tcp_hdr(skb));
3393 
3394 	if (xmit_type & XMIT_GSO_V4) {
3395 		pbd->ip_id = bswab16(ip_hdr(skb)->id);
3396 		pbd->tcp_pseudo_csum =
3397 			bswab16(~csum_tcpudp_magic(ip_hdr(skb)->saddr,
3398 						   ip_hdr(skb)->daddr,
3399 						   0, IPPROTO_TCP, 0));
3400 
3401 		/* GSO on 57710/57711 needs FW to calculate IP checksum */
3402 		tx_start_bd->bd_flags.as_bitfield |= ETH_TX_BD_FLAGS_IP_CSUM;
3403 	} else {
3404 		pbd->tcp_pseudo_csum =
3405 			bswab16(~csum_ipv6_magic(&ipv6_hdr(skb)->saddr,
3406 						 &ipv6_hdr(skb)->daddr,
3407 						 0, IPPROTO_TCP, 0));
3408 	}
3409 
3410 	pbd->global_data |=
3411 		cpu_to_le16(ETH_TX_PARSE_BD_E1X_PSEUDO_CS_WITHOUT_LEN);
3412 }
3413 
3414 /**
3415  * bnx2x_set_pbd_csum_enc - update PBD with checksum and return header length
3416  *
3417  * @bp:			driver handle
3418  * @skb:		packet skb
3419  * @parsing_data:	data to be updated
3420  * @xmit_type:		xmit flags
3421  *
3422  * 57712/578xx related, when skb has encapsulation
3423  */
3424 static u8 bnx2x_set_pbd_csum_enc(struct bnx2x *bp, struct sk_buff *skb,
3425 				 u32 *parsing_data, u32 xmit_type)
3426 {
3427 	*parsing_data |=
3428 		((((u8 *)skb_inner_transport_header(skb) - skb->data) >> 1) <<
3429 		ETH_TX_PARSE_BD_E2_L4_HDR_START_OFFSET_W_SHIFT) &
3430 		ETH_TX_PARSE_BD_E2_L4_HDR_START_OFFSET_W;
3431 
3432 	if (xmit_type & XMIT_CSUM_TCP) {
3433 		*parsing_data |= ((inner_tcp_hdrlen(skb) / 4) <<
3434 			ETH_TX_PARSE_BD_E2_TCP_HDR_LENGTH_DW_SHIFT) &
3435 			ETH_TX_PARSE_BD_E2_TCP_HDR_LENGTH_DW;
3436 
3437 		return skb_inner_transport_header(skb) +
3438 			inner_tcp_hdrlen(skb) - skb->data;
3439 	}
3440 
3441 	/* We support checksum offload for TCP and UDP only.
3442 	 * No need to pass the UDP header length - it's a constant.
3443 	 */
3444 	return skb_inner_transport_header(skb) +
3445 		sizeof(struct udphdr) - skb->data;
3446 }
3447 
3448 /**
3449  * bnx2x_set_pbd_csum_e2 - update PBD with checksum and return header length
3450  *
3451  * @bp:			driver handle
3452  * @skb:		packet skb
3453  * @parsing_data:	data to be updated
3454  * @xmit_type:		xmit flags
3455  *
3456  * 57712/578xx related
3457  */
3458 static u8 bnx2x_set_pbd_csum_e2(struct bnx2x *bp, struct sk_buff *skb,
3459 				u32 *parsing_data, u32 xmit_type)
3460 {
3461 	*parsing_data |=
3462 		((((u8 *)skb_transport_header(skb) - skb->data) >> 1) <<
3463 		ETH_TX_PARSE_BD_E2_L4_HDR_START_OFFSET_W_SHIFT) &
3464 		ETH_TX_PARSE_BD_E2_L4_HDR_START_OFFSET_W;
3465 
3466 	if (xmit_type & XMIT_CSUM_TCP) {
3467 		*parsing_data |= ((tcp_hdrlen(skb) / 4) <<
3468 			ETH_TX_PARSE_BD_E2_TCP_HDR_LENGTH_DW_SHIFT) &
3469 			ETH_TX_PARSE_BD_E2_TCP_HDR_LENGTH_DW;
3470 
3471 		return skb_transport_header(skb) + tcp_hdrlen(skb) - skb->data;
3472 	}
3473 	/* We support checksum offload for TCP and UDP only.
3474 	 * No need to pass the UDP header length - it's a constant.
3475 	 */
3476 	return skb_transport_header(skb) + sizeof(struct udphdr) - skb->data;
3477 }
3478 
3479 /* set FW indication according to inner or outer protocols if tunneled */
3480 static void bnx2x_set_sbd_csum(struct bnx2x *bp, struct sk_buff *skb,
3481 			       struct eth_tx_start_bd *tx_start_bd,
3482 			       u32 xmit_type)
3483 {
3484 	tx_start_bd->bd_flags.as_bitfield |= ETH_TX_BD_FLAGS_L4_CSUM;
3485 
3486 	if (xmit_type & (XMIT_CSUM_ENC_V6 | XMIT_CSUM_V6))
3487 		tx_start_bd->bd_flags.as_bitfield |= ETH_TX_BD_FLAGS_IPV6;
3488 
3489 	if (!(xmit_type & XMIT_CSUM_TCP))
3490 		tx_start_bd->bd_flags.as_bitfield |= ETH_TX_BD_FLAGS_IS_UDP;
3491 }
3492 
3493 /**
3494  * bnx2x_set_pbd_csum - update PBD with checksum and return header length
3495  *
3496  * @bp:		driver handle
3497  * @skb:	packet skb
3498  * @pbd:	parse BD to be updated
3499  * @xmit_type:	xmit flags
3500  */
3501 static u8 bnx2x_set_pbd_csum(struct bnx2x *bp, struct sk_buff *skb,
3502 			     struct eth_tx_parse_bd_e1x *pbd,
3503 			     u32 xmit_type)
3504 {
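	/* Header lengths handed to the FW are counted in 16-bit words, hence
	 * the '>> 1' conversions below; the value returned to the caller is
	 * converted back to bytes.
	 */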
3505 	u8 hlen = (skb_network_header(skb) - skb->data) >> 1;
3506 
3507 	/* for now NS flag is not used in Linux */
3508 	pbd->global_data =
3509 		cpu_to_le16(hlen |
3510 			    ((skb->protocol == cpu_to_be16(ETH_P_8021Q)) <<
3511 			     ETH_TX_PARSE_BD_E1X_LLC_SNAP_EN_SHIFT));
3512 
3513 	pbd->ip_hlen_w = (skb_transport_header(skb) -
3514 			skb_network_header(skb)) >> 1;
3515 
3516 	hlen += pbd->ip_hlen_w;
3517 
3518 	/* We support checksum offload for TCP and UDP only */
3519 	if (xmit_type & XMIT_CSUM_TCP)
3520 		hlen += tcp_hdrlen(skb) / 2;
3521 	else
3522 		hlen += sizeof(struct udphdr) / 2;
3523 
3524 	pbd->total_hlen_w = cpu_to_le16(hlen);
3525 	hlen = hlen*2;
3526 
3527 	if (xmit_type & XMIT_CSUM_TCP) {
3528 		pbd->tcp_pseudo_csum = bswab16(tcp_hdr(skb)->check);
3529 
3530 	} else {
3531 		s8 fix = SKB_CS_OFF(skb); /* signed! */
3532 
3533 		DP(NETIF_MSG_TX_QUEUED,
3534 		   "hlen %d  fix %d  csum before fix %x\n",
3535 		   le16_to_cpu(pbd->total_hlen_w), fix, SKB_CS(skb));
3536 
3537 		/* HW bug: fixup the CSUM */
3538 		pbd->tcp_pseudo_csum =
3539 			bnx2x_csum_fix(skb_transport_header(skb),
3540 				       SKB_CS(skb), fix);
3541 
3542 		DP(NETIF_MSG_TX_QUEUED, "csum after fix %x\n",
3543 		   pbd->tcp_pseudo_csum);
3544 	}
3545 
3546 	return hlen;
3547 }
3548 
3549 static void bnx2x_update_pbds_gso_enc(struct sk_buff *skb,
3550 				      struct eth_tx_parse_bd_e2 *pbd_e2,
3551 				      struct eth_tx_parse_2nd_bd *pbd2,
3552 				      u16 *global_data,
3553 				      u32 xmit_type)
3554 {
3555 	u16 hlen_w = 0;
3556 	u8 outerip_off, outerip_len = 0;
3557 
3558 	/* from outer IP to transport */
3559 	hlen_w = (skb_inner_transport_header(skb) -
3560 		  skb_network_header(skb)) >> 1;
3561 
3562 	/* transport len */
3563 	hlen_w += inner_tcp_hdrlen(skb) >> 1;
3564 
3565 	pbd2->fw_ip_hdr_to_payload_w = hlen_w;
3566 
3567 	/* outer IP header info */
3568 	if (xmit_type & XMIT_CSUM_V4) {
3569 		struct iphdr *iph = ip_hdr(skb);
3570 		u32 csum = (__force u32)(~iph->check) -
3571 			   (__force u32)iph->tot_len -
3572 			   (__force u32)iph->frag_off;
3573 
3574 		pbd2->fw_ip_csum_wo_len_flags_frag =
3575 			bswab16(csum_fold((__force __wsum)csum));
3576 	} else {
3577 		pbd2->fw_ip_hdr_to_payload_w =
3578 			hlen_w - ((sizeof(struct ipv6hdr)) >> 1);
3579 	}
3580 
3581 	pbd2->tcp_send_seq = bswab32(inner_tcp_hdr(skb)->seq);
3582 
3583 	pbd2->tcp_flags = pbd_tcp_flags(inner_tcp_hdr(skb));
3584 
3585 	if (xmit_type & XMIT_GSO_V4) {
3586 		pbd2->hw_ip_id = bswab16(inner_ip_hdr(skb)->id);
3587 
3588 		pbd_e2->data.tunnel_data.pseudo_csum =
3589 			bswab16(~csum_tcpudp_magic(
3590 					inner_ip_hdr(skb)->saddr,
3591 					inner_ip_hdr(skb)->daddr,
3592 					0, IPPROTO_TCP, 0));
3593 
3594 		outerip_len = ip_hdr(skb)->ihl << 1;
3595 	} else {
3596 		pbd_e2->data.tunnel_data.pseudo_csum =
3597 			bswab16(~csum_ipv6_magic(
3598 					&inner_ipv6_hdr(skb)->saddr,
3599 					&inner_ipv6_hdr(skb)->daddr,
3600 					0, IPPROTO_TCP, 0));
3601 	}
3602 
3603 	outerip_off = (skb_network_header(skb) - skb->data) >> 1;
3604 
3605 	*global_data |=
3606 		outerip_off |
3607 		(!!(xmit_type & XMIT_CSUM_V6) <<
3608 			ETH_TX_PARSE_2ND_BD_IP_HDR_TYPE_OUTER_SHIFT) |
3609 		(outerip_len <<
3610 			ETH_TX_PARSE_2ND_BD_IP_HDR_LEN_OUTER_W_SHIFT) |
3611 		((skb->protocol == cpu_to_be16(ETH_P_8021Q)) <<
3612 			ETH_TX_PARSE_2ND_BD_LLC_SNAP_EN_SHIFT);
3613 
3614 	if (ip_hdr(skb)->protocol == IPPROTO_UDP) {
3615 		SET_FLAG(*global_data, ETH_TX_PARSE_2ND_BD_TUNNEL_UDP_EXIST, 1);
3616 		pbd2->tunnel_udp_hdr_start_w = skb_transport_offset(skb) >> 1;
3617 	}
3618 }
3619 
3620 /* called with netif_tx_lock
3621  * bnx2x_tx_int() runs without netif_tx_lock unless it needs to call
3622  * netif_wake_queue()
3623  */
3624 netdev_tx_t bnx2x_start_xmit(struct sk_buff *skb, struct net_device *dev)
3625 {
3626 	struct bnx2x *bp = netdev_priv(dev);
3627 
3628 	struct netdev_queue *txq;
3629 	struct bnx2x_fp_txdata *txdata;
3630 	struct sw_tx_bd *tx_buf;
3631 	struct eth_tx_start_bd *tx_start_bd, *first_bd;
3632 	struct eth_tx_bd *tx_data_bd, *total_pkt_bd = NULL;
3633 	struct eth_tx_parse_bd_e1x *pbd_e1x = NULL;
3634 	struct eth_tx_parse_bd_e2 *pbd_e2 = NULL;
3635 	struct eth_tx_parse_2nd_bd *pbd2 = NULL;
3636 	u32 pbd_e2_parsing_data = 0;
3637 	u16 pkt_prod, bd_prod;
3638 	int nbd, txq_index;
3639 	dma_addr_t mapping;
3640 	u32 xmit_type = bnx2x_xmit_type(bp, skb);
3641 	int i;
3642 	u8 hlen = 0;
3643 	__le16 pkt_size = 0;
3644 	struct ethhdr *eth;
3645 	u8 mac_type = UNICAST_ADDRESS;
3646 
3647 #ifdef BNX2X_STOP_ON_ERROR
3648 	if (unlikely(bp->panic))
3649 		return NETDEV_TX_BUSY;
3650 #endif
3651 
3652 	txq_index = skb_get_queue_mapping(skb);
3653 	txq = netdev_get_tx_queue(dev, txq_index);
3654 
3655 	BUG_ON(txq_index >= MAX_ETH_TXQ_IDX(bp) + (CNIC_LOADED(bp) ? 1 : 0));
3656 
3657 	txdata = &bp->bnx2x_txq[txq_index];
3658 
3659 	/* enable this debug print to view the transmission queue being used
3660 	DP(NETIF_MSG_TX_QUEUED, "indices: txq %d, fp %d, txdata %d\n",
3661 	   txq_index, fp_index, txdata_index); */
3662 
3663 	/* enable this debug print to view the transmission details
3664 	DP(NETIF_MSG_TX_QUEUED,
3665 	   "transmitting packet cid %d fp index %d txdata_index %d tx_data ptr %p fp pointer %p\n",
3666 	   txdata->cid, fp_index, txdata_index, txdata, fp); */
3667 
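	/* Make sure there is enough room in the ring for a worst-case packet:
	 * all fragments plus the start/parse BDs plus the "next page" BDs the
	 * BD chain may need.
	 */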
3668 	if (unlikely(bnx2x_tx_avail(bp, txdata) <
3669 			skb_shinfo(skb)->nr_frags +
3670 			BDS_PER_TX_PKT +
3671 			NEXT_CNT_PER_TX_PKT(MAX_BDS_PER_TX_PKT))) {
3672 		/* Handle special storage cases separately */
3673 		if (txdata->tx_ring_size == 0) {
3674 			struct bnx2x_eth_q_stats *q_stats =
3675 				bnx2x_fp_qstats(bp, txdata->parent_fp);
3676 			q_stats->driver_filtered_tx_pkt++;
3677 			dev_kfree_skb(skb);
3678 			return NETDEV_TX_OK;
3679 		}
3680 		bnx2x_fp_qstats(bp, txdata->parent_fp)->driver_xoff++;
3681 		netif_tx_stop_queue(txq);
3682 		BNX2X_ERR("BUG! Tx ring full when queue awake!\n");
3683 
3684 		return NETDEV_TX_BUSY;
3685 	}
3686 
3687 	DP(NETIF_MSG_TX_QUEUED,
3688 	   "queue[%d]: SKB: summed %x  protocol %x protocol(%x,%x) gso type %x  xmit_type %x len %d\n",
3689 	   txq_index, skb->ip_summed, skb->protocol, ipv6_hdr(skb)->nexthdr,
3690 	   ip_hdr(skb)->protocol, skb_shinfo(skb)->gso_type, xmit_type,
3691 	   skb->len);
3692 
3693 	eth = (struct ethhdr *)skb->data;
3694 
	/* set flag according to packet type (UNICAST_ADDRESS is default) */
3696 	if (unlikely(is_multicast_ether_addr(eth->h_dest))) {
3697 		if (is_broadcast_ether_addr(eth->h_dest))
3698 			mac_type = BROADCAST_ADDRESS;
3699 		else
3700 			mac_type = MULTICAST_ADDRESS;
3701 	}
3702 
3703 #if (MAX_SKB_FRAGS >= MAX_FETCH_BD - BDS_PER_TX_PKT)
	/* First, check if we need to linearize the skb (due to FW
	 * restrictions). No need to check fragmentation if page size > 8K
	 * (there will be no violation of FW restrictions).
	 */
3707 	if (bnx2x_pkt_req_lin(bp, skb, xmit_type)) {
3708 		/* Statistics of linearization */
3709 		bp->lin_cnt++;
3710 		if (skb_linearize(skb) != 0) {
3711 			DP(NETIF_MSG_TX_QUEUED,
3712 			   "SKB linearization failed - silently dropping this SKB\n");
3713 			dev_kfree_skb_any(skb);
3714 			return NETDEV_TX_OK;
3715 		}
3716 	}
3717 #endif
3718 	/* Map skb linear data for DMA */
3719 	mapping = dma_map_single(&bp->pdev->dev, skb->data,
3720 				 skb_headlen(skb), DMA_TO_DEVICE);
3721 	if (unlikely(dma_mapping_error(&bp->pdev->dev, mapping))) {
3722 		DP(NETIF_MSG_TX_QUEUED,
3723 		   "SKB mapping failed - silently dropping this SKB\n");
3724 		dev_kfree_skb_any(skb);
3725 		return NETDEV_TX_OK;
3726 	}
	/* Please read carefully. First we use one BD which we mark as start,
	 * then we have a parsing info BD (used for TSO or checksum offload),
	 * and only then we have the rest of the TSO BDs.
	 * (Don't forget to mark the last one as last, and to unmap only
	 * AFTER you write to the BD ...)
	 * And above all, all PBD sizes are in words - NOT DWORDS!
	 */
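	/* Illustrative BD chain for a single TSO packet:
	 *   start BD (headers) -> parse BD(s) -> remaining linear data BD
	 *   (if the header/data split below is needed) -> fragment BDs,
	 *   with the last BD marked as last.
	 */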
3735 
3736 	/* get current pkt produced now - advance it just before sending packet
3737 	 * since mapping of pages may fail and cause packet to be dropped
3738 	 */
3739 	pkt_prod = txdata->tx_pkt_prod;
3740 	bd_prod = TX_BD(txdata->tx_bd_prod);
3741 
3742 	/* get a tx_buf and first BD
3743 	 * tx_start_bd may be changed during SPLIT,
3744 	 * but first_bd will always stay first
3745 	 */
3746 	tx_buf = &txdata->tx_buf_ring[TX_BD(pkt_prod)];
3747 	tx_start_bd = &txdata->tx_desc_ring[bd_prod].start_bd;
3748 	first_bd = tx_start_bd;
3749 
3750 	tx_start_bd->bd_flags.as_bitfield = ETH_TX_BD_FLAGS_START_BD;
3751 
3752 	/* header nbd: indirectly zero other flags! */
3753 	tx_start_bd->general_data = 1 << ETH_TX_START_BD_HDR_NBDS_SHIFT;
3754 
3755 	/* remember the first BD of the packet */
3756 	tx_buf->first_bd = txdata->tx_bd_prod;
3757 	tx_buf->skb = skb;
3758 	tx_buf->flags = 0;
3759 
3760 	DP(NETIF_MSG_TX_QUEUED,
3761 	   "sending pkt %u @%p  next_idx %u  bd %u @%p\n",
3762 	   pkt_prod, tx_buf, txdata->tx_pkt_prod, bd_prod, tx_start_bd);
3763 
3764 	if (vlan_tx_tag_present(skb)) {
3765 		tx_start_bd->vlan_or_ethertype =
3766 		    cpu_to_le16(vlan_tx_tag_get(skb));
3767 		tx_start_bd->bd_flags.as_bitfield |=
3768 		    (X_ETH_OUTBAND_VLAN << ETH_TX_BD_FLAGS_VLAN_MODE_SHIFT);
3769 	} else {
3770 		/* when transmitting in a vf, start bd must hold the ethertype
3771 		 * for fw to enforce it
3772 		 */
3773 		if (IS_VF(bp))
3774 			tx_start_bd->vlan_or_ethertype =
3775 				cpu_to_le16(ntohs(eth->h_proto));
3776 		else
3777 			/* used by FW for packet accounting */
3778 			tx_start_bd->vlan_or_ethertype = cpu_to_le16(pkt_prod);
3779 	}
3780 
3781 	nbd = 2; /* start_bd + pbd + frags (updated when pages are mapped) */
3782 
3783 	/* turn on parsing and get a BD */
3784 	bd_prod = TX_BD(NEXT_TX_IDX(bd_prod));
3785 
3786 	if (xmit_type & XMIT_CSUM)
3787 		bnx2x_set_sbd_csum(bp, skb, tx_start_bd, xmit_type);
3788 
3789 	if (!CHIP_IS_E1x(bp)) {
3790 		pbd_e2 = &txdata->tx_desc_ring[bd_prod].parse_bd_e2;
3791 		memset(pbd_e2, 0, sizeof(struct eth_tx_parse_bd_e2));
3792 
3793 		if (xmit_type & XMIT_CSUM_ENC) {
3794 			u16 global_data = 0;
3795 
3796 			/* Set PBD in enc checksum offload case */
3797 			hlen = bnx2x_set_pbd_csum_enc(bp, skb,
3798 						      &pbd_e2_parsing_data,
3799 						      xmit_type);
3800 
3801 			/* turn on 2nd parsing and get a BD */
3802 			bd_prod = TX_BD(NEXT_TX_IDX(bd_prod));
3803 
3804 			pbd2 = &txdata->tx_desc_ring[bd_prod].parse_2nd_bd;
3805 
3806 			memset(pbd2, 0, sizeof(*pbd2));
3807 
3808 			pbd_e2->data.tunnel_data.ip_hdr_start_inner_w =
3809 				(skb_inner_network_header(skb) -
3810 				 skb->data) >> 1;
3811 
3812 			if (xmit_type & XMIT_GSO_ENC)
3813 				bnx2x_update_pbds_gso_enc(skb, pbd_e2, pbd2,
3814 							  &global_data,
3815 							  xmit_type);
3816 
3817 			pbd2->global_data = cpu_to_le16(global_data);
3818 
			/* indicate an additional parse BD in the start BD */
3820 			SET_FLAG(tx_start_bd->general_data,
3821 				 ETH_TX_START_BD_PARSE_NBDS, 1);
3822 			/* set encapsulation flag in start BD */
3823 			SET_FLAG(tx_start_bd->general_data,
3824 				 ETH_TX_START_BD_TUNNEL_EXIST, 1);
3825 			nbd++;
3826 		} else if (xmit_type & XMIT_CSUM) {
3827 			/* Set PBD in checksum offload case w/o encapsulation */
3828 			hlen = bnx2x_set_pbd_csum_e2(bp, skb,
3829 						     &pbd_e2_parsing_data,
3830 						     xmit_type);
3831 		}
3832 
		/* Add the MACs to the parsing BD if this is a VF */
3834 		if (IS_VF(bp)) {
3835 			/* override GRE parameters in BD */
3836 			bnx2x_set_fw_mac_addr(&pbd_e2->data.mac_addr.src_hi,
3837 					      &pbd_e2->data.mac_addr.src_mid,
3838 					      &pbd_e2->data.mac_addr.src_lo,
3839 					      eth->h_source);
3840 
3841 			bnx2x_set_fw_mac_addr(&pbd_e2->data.mac_addr.dst_hi,
3842 					      &pbd_e2->data.mac_addr.dst_mid,
3843 					      &pbd_e2->data.mac_addr.dst_lo,
3844 					      eth->h_dest);
3845 		}
3846 
3847 		SET_FLAG(pbd_e2_parsing_data,
3848 			 ETH_TX_PARSE_BD_E2_ETH_ADDR_TYPE, mac_type);
3849 	} else {
3850 		u16 global_data = 0;
3851 		pbd_e1x = &txdata->tx_desc_ring[bd_prod].parse_bd_e1x;
3852 		memset(pbd_e1x, 0, sizeof(struct eth_tx_parse_bd_e1x));
3853 		/* Set PBD in checksum offload case */
3854 		if (xmit_type & XMIT_CSUM)
3855 			hlen = bnx2x_set_pbd_csum(bp, skb, pbd_e1x, xmit_type);
3856 
3857 		SET_FLAG(global_data,
3858 			 ETH_TX_PARSE_BD_E1X_ETH_ADDR_TYPE, mac_type);
3859 		pbd_e1x->global_data |= cpu_to_le16(global_data);
3860 	}
3861 
3862 	/* Setup the data pointer of the first BD of the packet */
3863 	tx_start_bd->addr_hi = cpu_to_le32(U64_HI(mapping));
3864 	tx_start_bd->addr_lo = cpu_to_le32(U64_LO(mapping));
3865 	tx_start_bd->nbytes = cpu_to_le16(skb_headlen(skb));
3866 	pkt_size = tx_start_bd->nbytes;
3867 
3868 	DP(NETIF_MSG_TX_QUEUED,
3869 	   "first bd @%p  addr (%x:%x)  nbytes %d  flags %x  vlan %x\n",
3870 	   tx_start_bd, tx_start_bd->addr_hi, tx_start_bd->addr_lo,
3871 	   le16_to_cpu(tx_start_bd->nbytes),
3872 	   tx_start_bd->bd_flags.as_bitfield,
3873 	   le16_to_cpu(tx_start_bd->vlan_or_ethertype));
3874 
3875 	if (xmit_type & XMIT_GSO) {
3876 
3877 		DP(NETIF_MSG_TX_QUEUED,
3878 		   "TSO packet len %d  hlen %d  total len %d  tso size %d\n",
3879 		   skb->len, hlen, skb_headlen(skb),
3880 		   skb_shinfo(skb)->gso_size);
3881 
3882 		tx_start_bd->bd_flags.as_bitfield |= ETH_TX_BD_FLAGS_SW_LSO;
3883 
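		/* If the linear data holds more than just the headers, split
		 * it so that the first BD carries only the headers and a
		 * separate BD carries the remaining linear data.
		 */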
3884 		if (unlikely(skb_headlen(skb) > hlen)) {
3885 			nbd++;
3886 			bd_prod = bnx2x_tx_split(bp, txdata, tx_buf,
3887 						 &tx_start_bd, hlen,
3888 						 bd_prod);
3889 		}
3890 		if (!CHIP_IS_E1x(bp))
3891 			bnx2x_set_pbd_gso_e2(skb, &pbd_e2_parsing_data,
3892 					     xmit_type);
3893 		else
3894 			bnx2x_set_pbd_gso(skb, pbd_e1x, first_bd, xmit_type);
3895 	}
3896 
3897 	/* Set the PBD's parsing_data field if not zero
3898 	 * (for the chips newer than 57711).
3899 	 */
3900 	if (pbd_e2_parsing_data)
3901 		pbd_e2->parsing_data = cpu_to_le32(pbd_e2_parsing_data);
3902 
3903 	tx_data_bd = (struct eth_tx_bd *)tx_start_bd;
3904 
3905 	/* Handle fragmented skb */
3906 	for (i = 0; i < skb_shinfo(skb)->nr_frags; i++) {
3907 		skb_frag_t *frag = &skb_shinfo(skb)->frags[i];
3908 
3909 		mapping = skb_frag_dma_map(&bp->pdev->dev, frag, 0,
3910 					   skb_frag_size(frag), DMA_TO_DEVICE);
3911 		if (unlikely(dma_mapping_error(&bp->pdev->dev, mapping))) {
3912 			unsigned int pkts_compl = 0, bytes_compl = 0;
3913 
3914 			DP(NETIF_MSG_TX_QUEUED,
3915 			   "Unable to map page - dropping packet...\n");
3916 
			/* we need to unmap all buffers already mapped
			 * for this SKB;
			 * first_bd->nbd needs to be properly updated
			 * before calling bnx2x_free_tx_pkt
			 */
3922 			first_bd->nbd = cpu_to_le16(nbd);
3923 			bnx2x_free_tx_pkt(bp, txdata,
3924 					  TX_BD(txdata->tx_pkt_prod),
3925 					  &pkts_compl, &bytes_compl);
3926 			return NETDEV_TX_OK;
3927 		}
3928 
3929 		bd_prod = TX_BD(NEXT_TX_IDX(bd_prod));
3930 		tx_data_bd = &txdata->tx_desc_ring[bd_prod].reg_bd;
3931 		if (total_pkt_bd == NULL)
3932 			total_pkt_bd = &txdata->tx_desc_ring[bd_prod].reg_bd;
3933 
3934 		tx_data_bd->addr_hi = cpu_to_le32(U64_HI(mapping));
3935 		tx_data_bd->addr_lo = cpu_to_le32(U64_LO(mapping));
3936 		tx_data_bd->nbytes = cpu_to_le16(skb_frag_size(frag));
3937 		le16_add_cpu(&pkt_size, skb_frag_size(frag));
3938 		nbd++;
3939 
3940 		DP(NETIF_MSG_TX_QUEUED,
3941 		   "frag %d  bd @%p  addr (%x:%x)  nbytes %d\n",
3942 		   i, tx_data_bd, tx_data_bd->addr_hi, tx_data_bd->addr_lo,
3943 		   le16_to_cpu(tx_data_bd->nbytes));
3944 	}
3945 
3946 	DP(NETIF_MSG_TX_QUEUED, "last bd @%p\n", tx_data_bd);
3947 
3948 	/* update with actual num BDs */
3949 	first_bd->nbd = cpu_to_le16(nbd);
3950 
3951 	bd_prod = TX_BD(NEXT_TX_IDX(bd_prod));
3952 
3953 	/* now send a tx doorbell, counting the next BD
3954 	 * if the packet contains or ends with it
3955 	 */
3956 	if (TX_BD_POFF(bd_prod) < nbd)
3957 		nbd++;
3958 
	/* total_pkt_bytes should be set on the first data BD if
	 * it's not an LSO packet and there is more than one
	 * data BD. In this case pkt_size is limited by an MTU value.
	 * However, we prefer to set it for an LSO packet (while we don't
	 * have to) in order to save some CPU cycles in the non-LSO
	 * case, where we care much more about them.
	 */
3966 	if (total_pkt_bd != NULL)
3967 		total_pkt_bd->total_pkt_bytes = pkt_size;
3968 
3969 	if (pbd_e1x)
3970 		DP(NETIF_MSG_TX_QUEUED,
3971 		   "PBD (E1X) @%p  ip_data %x  ip_hlen %u  ip_id %u  lso_mss %u  tcp_flags %x  xsum %x  seq %u  hlen %u\n",
3972 		   pbd_e1x, pbd_e1x->global_data, pbd_e1x->ip_hlen_w,
3973 		   pbd_e1x->ip_id, pbd_e1x->lso_mss, pbd_e1x->tcp_flags,
3974 		   pbd_e1x->tcp_pseudo_csum, pbd_e1x->tcp_send_seq,
3975 		    le16_to_cpu(pbd_e1x->total_hlen_w));
3976 	if (pbd_e2)
3977 		DP(NETIF_MSG_TX_QUEUED,
3978 		   "PBD (E2) @%p  dst %x %x %x src %x %x %x parsing_data %x\n",
3979 		   pbd_e2,
3980 		   pbd_e2->data.mac_addr.dst_hi,
3981 		   pbd_e2->data.mac_addr.dst_mid,
3982 		   pbd_e2->data.mac_addr.dst_lo,
3983 		   pbd_e2->data.mac_addr.src_hi,
3984 		   pbd_e2->data.mac_addr.src_mid,
3985 		   pbd_e2->data.mac_addr.src_lo,
3986 		   pbd_e2->parsing_data);
3987 	DP(NETIF_MSG_TX_QUEUED, "doorbell: nbd %d  bd %u\n", nbd, bd_prod);
3988 
3989 	netdev_tx_sent_queue(txq, skb->len);
3990 
3991 	skb_tx_timestamp(skb);
3992 
3993 	txdata->tx_pkt_prod++;
	/* Make sure that the BD data is updated before updating the producer
	 * since FW might read the BD right after the producer is updated.
	 * This is only applicable for weak-ordered memory model archs such
	 * as IA-64. The following barrier is also mandatory since FW assumes
	 * packets must have BDs.
	 */
4001 	wmb();
4002 
4003 	txdata->tx_db.data.prod += nbd;
4004 	barrier();
4005 
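	/* Write the whole doorbell data, including the updated producer, to
	 * the chip.
	 */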
4006 	DOORBELL(bp, txdata->cid, txdata->tx_db.raw);
4007 
4008 	mmiowb();
4009 
4010 	txdata->tx_bd_prod += nbd;
4011 
4012 	if (unlikely(bnx2x_tx_avail(bp, txdata) < MAX_DESC_PER_TX_PKT)) {
4013 		netif_tx_stop_queue(txq);
4014 
		/* paired memory barrier is in bnx2x_tx_int(), we have to keep
		 * ordering of set_bit() in netif_tx_stop_queue() and read of
		 * txdata->tx_bd_cons
		 */
4018 		smp_mb();
4019 
4020 		bnx2x_fp_qstats(bp, txdata->parent_fp)->driver_xoff++;
4021 		if (bnx2x_tx_avail(bp, txdata) >= MAX_DESC_PER_TX_PKT)
4022 			netif_tx_wake_queue(txq);
4023 	}
4024 	txdata->tx_pkt++;
4025 
4026 	return NETDEV_TX_OK;
4027 }
4028 
/**
 * bnx2x_setup_tc - routine to configure net_device for multi tc
 *
 * @dev: net device to configure
 * @num_tc: number of traffic classes to enable
 *
 * Callback connected to the ndo_setup_tc function pointer.
 */
4037 int bnx2x_setup_tc(struct net_device *dev, u8 num_tc)
4038 {
4039 	int cos, prio, count, offset;
4040 	struct bnx2x *bp = netdev_priv(dev);
4041 
4042 	/* setup tc must be called under rtnl lock */
4043 	ASSERT_RTNL();
4044 
4045 	/* no traffic classes requested. Aborting */
4046 	if (!num_tc) {
4047 		netdev_reset_tc(dev);
4048 		return 0;
4049 	}
4050 
4051 	/* requested to support too many traffic classes */
4052 	if (num_tc > bp->max_cos) {
4053 		BNX2X_ERR("support for too many traffic classes requested: %d. Max supported is %d\n",
4054 			  num_tc, bp->max_cos);
4055 		return -EINVAL;
4056 	}
4057 
4058 	/* declare amount of supported traffic classes */
4059 	if (netdev_set_num_tc(dev, num_tc)) {
4060 		BNX2X_ERR("failed to declare %d traffic classes\n", num_tc);
4061 		return -EINVAL;
4062 	}
4063 
4064 	/* configure priority to traffic class mapping */
4065 	for (prio = 0; prio < BNX2X_MAX_PRIORITY; prio++) {
4066 		netdev_set_prio_tc_map(dev, prio, bp->prio_to_cos[prio]);
4067 		DP(BNX2X_MSG_SP | NETIF_MSG_IFUP,
4068 		   "mapping priority %d to tc %d\n",
4069 		   prio, bp->prio_to_cos[prio]);
4070 	}
4071 
	/* Use this configuration to differentiate tc0 from other COSes
	   This can be used for ets or pfc, and save the effort of setting
	   up a multi-class queue disc or negotiating DCBX with a switch
	netdev_set_prio_tc_map(dev, 0, 0);
	DP(BNX2X_MSG_SP, "mapping priority %d to tc %d\n", 0, 0);
	for (prio = 1; prio < 16; prio++) {
		netdev_set_prio_tc_map(dev, prio, 1);
		DP(BNX2X_MSG_SP, "mapping priority %d to tc %d\n", prio, 1);
	} */
4081 
4082 	/* configure traffic class to transmission queue mapping */
4083 	for (cos = 0; cos < bp->max_cos; cos++) {
4084 		count = BNX2X_NUM_ETH_QUEUES(bp);
4085 		offset = cos * BNX2X_NUM_NON_CNIC_QUEUES(bp);
4086 		netdev_set_tc_queue(dev, cos, count, offset);
4087 		DP(BNX2X_MSG_SP | NETIF_MSG_IFUP,
4088 		   "mapping tc %d to offset %d count %d\n",
4089 		   cos, offset, count);
4090 	}
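	/* For example, with 4 ETH queues and max_cos 3 (and no CNIC L2
	 * queues, so BNX2X_NUM_NON_CNIC_QUEUES == BNX2X_NUM_ETH_QUEUES),
	 * the loop above maps tc0 to txq 0-3, tc1 to txq 4-7 and tc2 to
	 * txq 8-11.
	 */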
4091 
4092 	return 0;
4093 }
4094 
4095 /* called with rtnl_lock */
4096 int bnx2x_change_mac_addr(struct net_device *dev, void *p)
4097 {
4098 	struct sockaddr *addr = p;
4099 	struct bnx2x *bp = netdev_priv(dev);
4100 	int rc = 0;
4101 
4102 	if (!bnx2x_is_valid_ether_addr(bp, addr->sa_data)) {
4103 		BNX2X_ERR("Requested MAC address is not valid\n");
4104 		return -EINVAL;
4105 	}
4106 
4107 	if ((IS_MF_STORAGE_SD(bp) || IS_MF_FCOE_AFEX(bp)) &&
4108 	    !is_zero_ether_addr(addr->sa_data)) {
4109 		BNX2X_ERR("Can't configure non-zero address on iSCSI or FCoE functions in MF-SD mode\n");
4110 		return -EINVAL;
4111 	}
4112 
4113 	if (netif_running(dev))  {
4114 		rc = bnx2x_set_eth_mac(bp, false);
4115 		if (rc)
4116 			return rc;
4117 	}
4118 
4119 	memcpy(dev->dev_addr, addr->sa_data, dev->addr_len);
4120 
4121 	if (netif_running(dev))
4122 		rc = bnx2x_set_eth_mac(bp, true);
4123 
4124 	return rc;
4125 }
4126 
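/* Release the status block and the Rx/Tx ring memory of fastpath 'fp_index'
 * (the FCoE queue only clears its status block reference).
 */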
4127 static void bnx2x_free_fp_mem_at(struct bnx2x *bp, int fp_index)
4128 {
4129 	union host_hc_status_block *sb = &bnx2x_fp(bp, fp_index, status_blk);
4130 	struct bnx2x_fastpath *fp = &bp->fp[fp_index];
4131 	u8 cos;
4132 
4133 	/* Common */
4134 
4135 	if (IS_FCOE_IDX(fp_index)) {
4136 		memset(sb, 0, sizeof(union host_hc_status_block));
4137 		fp->status_blk_mapping = 0;
4138 	} else {
4139 		/* status blocks */
4140 		if (!CHIP_IS_E1x(bp))
4141 			BNX2X_PCI_FREE(sb->e2_sb,
4142 				       bnx2x_fp(bp, fp_index,
4143 						status_blk_mapping),
4144 				       sizeof(struct host_hc_status_block_e2));
4145 		else
4146 			BNX2X_PCI_FREE(sb->e1x_sb,
4147 				       bnx2x_fp(bp, fp_index,
4148 						status_blk_mapping),
4149 				       sizeof(struct host_hc_status_block_e1x));
4150 	}
4151 
4152 	/* Rx */
4153 	if (!skip_rx_queue(bp, fp_index)) {
4154 		bnx2x_free_rx_bds(fp);
4155 
4156 		/* fastpath rx rings: rx_buf rx_desc rx_comp */
4157 		BNX2X_FREE(bnx2x_fp(bp, fp_index, rx_buf_ring));
4158 		BNX2X_PCI_FREE(bnx2x_fp(bp, fp_index, rx_desc_ring),
4159 			       bnx2x_fp(bp, fp_index, rx_desc_mapping),
4160 			       sizeof(struct eth_rx_bd) * NUM_RX_BD);
4161 
4162 		BNX2X_PCI_FREE(bnx2x_fp(bp, fp_index, rx_comp_ring),
4163 			       bnx2x_fp(bp, fp_index, rx_comp_mapping),
4164 			       sizeof(struct eth_fast_path_rx_cqe) *
4165 			       NUM_RCQ_BD);
4166 
4167 		/* SGE ring */
4168 		BNX2X_FREE(bnx2x_fp(bp, fp_index, rx_page_ring));
4169 		BNX2X_PCI_FREE(bnx2x_fp(bp, fp_index, rx_sge_ring),
4170 			       bnx2x_fp(bp, fp_index, rx_sge_mapping),
4171 			       BCM_PAGE_SIZE * NUM_RX_SGE_PAGES);
4172 	}
4173 
4174 	/* Tx */
4175 	if (!skip_tx_queue(bp, fp_index)) {
4176 		/* fastpath tx rings: tx_buf tx_desc */
4177 		for_each_cos_in_tx_queue(fp, cos) {
4178 			struct bnx2x_fp_txdata *txdata = fp->txdata_ptr[cos];
4179 
4180 			DP(NETIF_MSG_IFDOWN,
4181 			   "freeing tx memory of fp %d cos %d cid %d\n",
4182 			   fp_index, cos, txdata->cid);
4183 
4184 			BNX2X_FREE(txdata->tx_buf_ring);
4185 			BNX2X_PCI_FREE(txdata->tx_desc_ring,
4186 				txdata->tx_desc_mapping,
4187 				sizeof(union eth_tx_bd_types) * NUM_TX_BD);
4188 		}
4189 	}
4190 	/* end of fastpath */
4191 }
4192 
4193 void bnx2x_free_fp_mem_cnic(struct bnx2x *bp)
4194 {
4195 	int i;
4196 	for_each_cnic_queue(bp, i)
4197 		bnx2x_free_fp_mem_at(bp, i);
4198 }
4199 
4200 void bnx2x_free_fp_mem(struct bnx2x *bp)
4201 {
4202 	int i;
4203 	for_each_eth_queue(bp, i)
4204 		bnx2x_free_fp_mem_at(bp, i);
4205 }
4206 
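/* Cache pointers to the status block's index_values and running_index
 * arrays in the fastpath (the E2 and E1x status block layouts differ).
 */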
4207 static void set_sb_shortcuts(struct bnx2x *bp, int index)
4208 {
4209 	union host_hc_status_block status_blk = bnx2x_fp(bp, index, status_blk);
4210 	if (!CHIP_IS_E1x(bp)) {
4211 		bnx2x_fp(bp, index, sb_index_values) =
4212 			(__le16 *)status_blk.e2_sb->sb.index_values;
4213 		bnx2x_fp(bp, index, sb_running_index) =
4214 			(__le16 *)status_blk.e2_sb->sb.running_index;
4215 	} else {
4216 		bnx2x_fp(bp, index, sb_index_values) =
4217 			(__le16 *)status_blk.e1x_sb->sb.index_values;
4218 		bnx2x_fp(bp, index, sb_running_index) =
4219 			(__le16 *)status_blk.e1x_sb->sb.running_index;
4220 	}
4221 }
4222 
4223 /* Returns the number of actually allocated BDs */
4224 static int bnx2x_alloc_rx_bds(struct bnx2x_fastpath *fp,
4225 			      int rx_ring_size)
4226 {
4227 	struct bnx2x *bp = fp->bp;
4228 	u16 ring_prod, cqe_ring_prod;
4229 	int i, failure_cnt = 0;
4230 
4231 	fp->rx_comp_cons = 0;
4232 	cqe_ring_prod = ring_prod = 0;
4233 
	/* This routine is called only during fw init so
	 * fp->eth_q_stats.rx_skb_alloc_failed = 0
	 */
4237 	for (i = 0; i < rx_ring_size; i++) {
4238 		if (bnx2x_alloc_rx_data(bp, fp, ring_prod, GFP_KERNEL) < 0) {
4239 			failure_cnt++;
4240 			continue;
4241 		}
4242 		ring_prod = NEXT_RX_IDX(ring_prod);
4243 		cqe_ring_prod = NEXT_RCQ_IDX(cqe_ring_prod);
4244 		WARN_ON(ring_prod <= (i - failure_cnt));
4245 	}
4246 
4247 	if (failure_cnt)
4248 		BNX2X_ERR("was only able to allocate %d rx skbs on queue[%d]\n",
4249 			  i - failure_cnt, fp->index);
4250 
4251 	fp->rx_bd_prod = ring_prod;
4252 	/* Limit the CQE producer by the CQE ring size */
4253 	fp->rx_comp_prod = min_t(u16, NUM_RCQ_RINGS*RCQ_DESC_CNT,
4254 			       cqe_ring_prod);
4255 	fp->rx_pkt = fp->rx_calls = 0;
4256 
4257 	bnx2x_fp_stats(bp, fp)->eth_q_stats.rx_skb_alloc_failed += failure_cnt;
4258 
4259 	return i - failure_cnt;
4260 }
4261 
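/* Chain the RCQ pages: the last CQE of each page points to the beginning of
 * the next page, and the last page wraps back to the first one.
 */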
4262 static void bnx2x_set_next_page_rx_cq(struct bnx2x_fastpath *fp)
4263 {
4264 	int i;
4265 
4266 	for (i = 1; i <= NUM_RCQ_RINGS; i++) {
4267 		struct eth_rx_cqe_next_page *nextpg;
4268 
4269 		nextpg = (struct eth_rx_cqe_next_page *)
4270 			&fp->rx_comp_ring[RCQ_DESC_CNT * i - 1];
4271 		nextpg->addr_hi =
4272 			cpu_to_le32(U64_HI(fp->rx_comp_mapping +
4273 				   BCM_PAGE_SIZE*(i % NUM_RCQ_RINGS)));
4274 		nextpg->addr_lo =
4275 			cpu_to_le32(U64_LO(fp->rx_comp_mapping +
4276 				   BCM_PAGE_SIZE*(i % NUM_RCQ_RINGS)));
4277 	}
4278 }
4279 
4280 static int bnx2x_alloc_fp_mem_at(struct bnx2x *bp, int index)
4281 {
4282 	union host_hc_status_block *sb;
4283 	struct bnx2x_fastpath *fp = &bp->fp[index];
4284 	int ring_size = 0;
4285 	u8 cos;
4286 	int rx_ring_size = 0;
4287 
4288 	if (!bp->rx_ring_size &&
4289 	    (IS_MF_STORAGE_SD(bp) || IS_MF_FCOE_AFEX(bp))) {
4290 		rx_ring_size = MIN_RX_SIZE_NONTPA;
4291 		bp->rx_ring_size = rx_ring_size;
4292 	} else if (!bp->rx_ring_size) {
4293 		rx_ring_size = MAX_RX_AVAIL/BNX2X_NUM_RX_QUEUES(bp);
4294 
4295 		if (CHIP_IS_E3(bp)) {
4296 			u32 cfg = SHMEM_RD(bp,
4297 					   dev_info.port_hw_config[BP_PORT(bp)].
4298 					   default_cfg);
4299 
4300 			/* Decrease ring size for 1G functions */
4301 			if ((cfg & PORT_HW_CFG_NET_SERDES_IF_MASK) ==
4302 			    PORT_HW_CFG_NET_SERDES_IF_SGMII)
4303 				rx_ring_size /= 10;
4304 		}
4305 
4306 		/* allocate at least number of buffers required by FW */
4307 		rx_ring_size = max_t(int, bp->disable_tpa ? MIN_RX_SIZE_NONTPA :
4308 				     MIN_RX_SIZE_TPA, rx_ring_size);
4309 
4310 		bp->rx_ring_size = rx_ring_size;
4311 	} else /* if rx_ring_size specified - use it */
4312 		rx_ring_size = bp->rx_ring_size;
4313 
4314 	DP(BNX2X_MSG_SP, "calculated rx_ring_size %d\n", rx_ring_size);
4315 
4316 	/* Common */
4317 	sb = &bnx2x_fp(bp, index, status_blk);
4318 
4319 	if (!IS_FCOE_IDX(index)) {
4320 		/* status blocks */
4321 		if (!CHIP_IS_E1x(bp))
4322 			BNX2X_PCI_ALLOC(sb->e2_sb,
4323 				&bnx2x_fp(bp, index, status_blk_mapping),
4324 				sizeof(struct host_hc_status_block_e2));
4325 		else
4326 			BNX2X_PCI_ALLOC(sb->e1x_sb,
4327 				&bnx2x_fp(bp, index, status_blk_mapping),
4328 			    sizeof(struct host_hc_status_block_e1x));
4329 	}
4330 
4331 	/* FCoE Queue uses Default SB and doesn't ACK the SB, thus no need to
4332 	 * set shortcuts for it.
4333 	 */
4334 	if (!IS_FCOE_IDX(index))
4335 		set_sb_shortcuts(bp, index);
4336 
4337 	/* Tx */
4338 	if (!skip_tx_queue(bp, index)) {
4339 		/* fastpath tx rings: tx_buf tx_desc */
4340 		for_each_cos_in_tx_queue(fp, cos) {
4341 			struct bnx2x_fp_txdata *txdata = fp->txdata_ptr[cos];
4342 
4343 			DP(NETIF_MSG_IFUP,
4344 			   "allocating tx memory of fp %d cos %d\n",
4345 			   index, cos);
4346 
4347 			BNX2X_ALLOC(txdata->tx_buf_ring,
4348 				sizeof(struct sw_tx_bd) * NUM_TX_BD);
4349 			BNX2X_PCI_ALLOC(txdata->tx_desc_ring,
4350 				&txdata->tx_desc_mapping,
4351 				sizeof(union eth_tx_bd_types) * NUM_TX_BD);
4352 		}
4353 	}
4354 
4355 	/* Rx */
4356 	if (!skip_rx_queue(bp, index)) {
4357 		/* fastpath rx rings: rx_buf rx_desc rx_comp */
4358 		BNX2X_ALLOC(bnx2x_fp(bp, index, rx_buf_ring),
4359 				sizeof(struct sw_rx_bd) * NUM_RX_BD);
4360 		BNX2X_PCI_ALLOC(bnx2x_fp(bp, index, rx_desc_ring),
4361 				&bnx2x_fp(bp, index, rx_desc_mapping),
4362 				sizeof(struct eth_rx_bd) * NUM_RX_BD);
4363 
4364 		/* Seed all CQEs by 1s */
4365 		BNX2X_PCI_FALLOC(bnx2x_fp(bp, index, rx_comp_ring),
4366 				 &bnx2x_fp(bp, index, rx_comp_mapping),
4367 				 sizeof(struct eth_fast_path_rx_cqe) *
4368 				 NUM_RCQ_BD);
4369 
4370 		/* SGE ring */
4371 		BNX2X_ALLOC(bnx2x_fp(bp, index, rx_page_ring),
4372 				sizeof(struct sw_rx_page) * NUM_RX_SGE);
4373 		BNX2X_PCI_ALLOC(bnx2x_fp(bp, index, rx_sge_ring),
4374 				&bnx2x_fp(bp, index, rx_sge_mapping),
4375 				BCM_PAGE_SIZE * NUM_RX_SGE_PAGES);
4376 		/* RX BD ring */
4377 		bnx2x_set_next_page_rx_bd(fp);
4378 
4379 		/* CQ ring */
4380 		bnx2x_set_next_page_rx_cq(fp);
4381 
4382 		/* BDs */
4383 		ring_size = bnx2x_alloc_rx_bds(fp, rx_ring_size);
4384 		if (ring_size < rx_ring_size)
4385 			goto alloc_mem_err;
4386 	}
4387 
4388 	return 0;
4389 
4390 /* handles low memory cases */
4391 alloc_mem_err:
4392 	BNX2X_ERR("Unable to allocate full memory for queue %d (size %d)\n",
4393 						index, ring_size);
	/* FW will drop all packets if the queue is not big enough.
	 * In these cases we disable the queue.
	 * Min size is different for OOO, TPA and non-TPA queues.
	 */
	if (ring_size < (fp->disable_tpa ?
				MIN_RX_SIZE_NONTPA : MIN_RX_SIZE_TPA)) {
		/* release memory allocated for this queue */
		bnx2x_free_fp_mem_at(bp, index);
		return -ENOMEM;
	}
4404 	return 0;
4405 }
4406 
4407 int bnx2x_alloc_fp_mem_cnic(struct bnx2x *bp)
4408 {
4409 	if (!NO_FCOE(bp))
4410 		/* FCoE */
4411 		if (bnx2x_alloc_fp_mem_at(bp, FCOE_IDX(bp)))
			/* we will fail the load process instead of marking
			 * NO_FCOE_FLAG
			 */
4415 			return -ENOMEM;
4416 
4417 	return 0;
4418 }
4419 
4420 int bnx2x_alloc_fp_mem(struct bnx2x *bp)
4421 {
4422 	int i;
4423 
4424 	/* 1. Allocate FP for leading - fatal if error
4425 	 * 2. Allocate RSS - fix number of queues if error
4426 	 */
4427 
4428 	/* leading */
4429 	if (bnx2x_alloc_fp_mem_at(bp, 0))
4430 		return -ENOMEM;
4431 
4432 	/* RSS */
4433 	for_each_nondefault_eth_queue(bp, i)
4434 		if (bnx2x_alloc_fp_mem_at(bp, i))
4435 			break;
4436 
4437 	/* handle memory failures */
4438 	if (i != BNX2X_NUM_ETH_QUEUES(bp)) {
4439 		int delta = BNX2X_NUM_ETH_QUEUES(bp) - i;
4440 
4441 		WARN_ON(delta < 0);
4442 		bnx2x_shrink_eth_fp(bp, delta);
4443 		if (CNIC_SUPPORT(bp))
			/* move non-eth FPs next to the last eth FP;
			 * must be done in this order:
			 * FCOE_IDX < FWD_IDX < OOO_IDX
			 */

			/* move the FCoE fp even if NO_FCOE_FLAG is on */
4450 			bnx2x_move_fp(bp, FCOE_IDX(bp), FCOE_IDX(bp) - delta);
4451 		bp->num_ethernet_queues -= delta;
4452 		bp->num_queues = bp->num_ethernet_queues +
4453 				 bp->num_cnic_queues;
4454 		BNX2X_ERR("Adjusted num of queues from %d to %d\n",
4455 			  bp->num_queues + delta, bp->num_queues);
4456 	}
4457 
4458 	return 0;
4459 }
4460 
4461 void bnx2x_free_mem_bp(struct bnx2x *bp)
4462 {
4463 	int i;
4464 
4465 	for (i = 0; i < bp->fp_array_size; i++)
4466 		kfree(bp->fp[i].tpa_info);
4467 	kfree(bp->fp);
4468 	kfree(bp->sp_objs);
4469 	kfree(bp->fp_stats);
4470 	kfree(bp->bnx2x_txq);
4471 	kfree(bp->msix_table);
4472 	kfree(bp->ilt);
4473 }
4474 
4475 int bnx2x_alloc_mem_bp(struct bnx2x *bp)
4476 {
4477 	struct bnx2x_fastpath *fp;
4478 	struct msix_entry *tbl;
4479 	struct bnx2x_ilt *ilt;
4480 	int msix_table_size = 0;
4481 	int fp_array_size, txq_array_size;
4482 	int i;
4483 
	/* The biggest MSI-X table we might need is the maximum number of fast
	 * path IGU SBs plus the default SB (for PF only).
	 */
4488 	msix_table_size = bp->igu_sb_cnt;
4489 	if (IS_PF(bp))
4490 		msix_table_size++;
4491 	BNX2X_DEV_INFO("msix_table_size %d\n", msix_table_size);
4492 
4493 	/* fp array: RSS plus CNIC related L2 queues */
4494 	fp_array_size = BNX2X_MAX_RSS_COUNT(bp) + CNIC_SUPPORT(bp);
4495 	bp->fp_array_size = fp_array_size;
4496 	BNX2X_DEV_INFO("fp_array_size %d\n", bp->fp_array_size);
4497 
4498 	fp = kcalloc(bp->fp_array_size, sizeof(*fp), GFP_KERNEL);
4499 	if (!fp)
4500 		goto alloc_err;
4501 	for (i = 0; i < bp->fp_array_size; i++) {
4502 		fp[i].tpa_info =
4503 			kcalloc(ETH_MAX_AGGREGATION_QUEUES_E1H_E2,
4504 				sizeof(struct bnx2x_agg_info), GFP_KERNEL);
4505 		if (!(fp[i].tpa_info))
4506 			goto alloc_err;
4507 	}
4508 
4509 	bp->fp = fp;
4510 
4511 	/* allocate sp objs */
4512 	bp->sp_objs = kcalloc(bp->fp_array_size, sizeof(struct bnx2x_sp_objs),
4513 			      GFP_KERNEL);
4514 	if (!bp->sp_objs)
4515 		goto alloc_err;
4516 
4517 	/* allocate fp_stats */
4518 	bp->fp_stats = kcalloc(bp->fp_array_size, sizeof(struct bnx2x_fp_stats),
4519 			       GFP_KERNEL);
4520 	if (!bp->fp_stats)
4521 		goto alloc_err;
4522 
4523 	/* Allocate memory for the transmission queues array */
4524 	txq_array_size =
4525 		BNX2X_MAX_RSS_COUNT(bp) * BNX2X_MULTI_TX_COS + CNIC_SUPPORT(bp);
	BNX2X_DEV_INFO("txq_array_size %d\n", txq_array_size);
4527 
4528 	bp->bnx2x_txq = kcalloc(txq_array_size, sizeof(struct bnx2x_fp_txdata),
4529 				GFP_KERNEL);
4530 	if (!bp->bnx2x_txq)
4531 		goto alloc_err;
4532 
4533 	/* msix table */
4534 	tbl = kcalloc(msix_table_size, sizeof(*tbl), GFP_KERNEL);
4535 	if (!tbl)
4536 		goto alloc_err;
4537 	bp->msix_table = tbl;
4538 
4539 	/* ilt */
4540 	ilt = kzalloc(sizeof(*ilt), GFP_KERNEL);
4541 	if (!ilt)
4542 		goto alloc_err;
4543 	bp->ilt = ilt;
4544 
4545 	return 0;
4546 alloc_err:
4547 	bnx2x_free_mem_bp(bp);
4548 	return -ENOMEM;
4549 }
4550 
4551 int bnx2x_reload_if_running(struct net_device *dev)
4552 {
4553 	struct bnx2x *bp = netdev_priv(dev);
4554 
4555 	if (unlikely(!netif_running(dev)))
4556 		return 0;
4557 
4558 	bnx2x_nic_unload(bp, UNLOAD_NORMAL, true);
4559 	return bnx2x_nic_load(bp, LOAD_NORMAL);
4560 }
4561 
4562 int bnx2x_get_cur_phy_idx(struct bnx2x *bp)
4563 {
	u32 sel_phy_idx = 0;

	if (bp->link_params.num_phys <= 1)
4566 		return INT_PHY;
4567 
4568 	if (bp->link_vars.link_up) {
4569 		sel_phy_idx = EXT_PHY1;
4570 		/* In case link is SERDES, check if the EXT_PHY2 is the one */
4571 		if ((bp->link_vars.link_status & LINK_STATUS_SERDES_LINK) &&
4572 		    (bp->link_params.phy[EXT_PHY2].supported & SUPPORTED_FIBRE))
4573 			sel_phy_idx = EXT_PHY2;
4574 	} else {
4575 
4576 		switch (bnx2x_phy_selection(&bp->link_params)) {
4577 		case PORT_HW_CFG_PHY_SELECTION_HARDWARE_DEFAULT:
4578 		case PORT_HW_CFG_PHY_SELECTION_FIRST_PHY:
4579 		case PORT_HW_CFG_PHY_SELECTION_FIRST_PHY_PRIORITY:
4580 		       sel_phy_idx = EXT_PHY1;
4581 		       break;
4582 		case PORT_HW_CFG_PHY_SELECTION_SECOND_PHY:
4583 		case PORT_HW_CFG_PHY_SELECTION_SECOND_PHY_PRIORITY:
4584 		       sel_phy_idx = EXT_PHY2;
4585 		       break;
4586 		}
4587 	}
4588 
4589 	return sel_phy_idx;
4590 }

int bnx2x_get_link_cfg_idx(struct bnx2x *bp)
4592 {
4593 	u32 sel_phy_idx = bnx2x_get_cur_phy_idx(bp);
4594 	/*
4595 	 * The selected activated PHY is always after swapping (in case PHY
4596 	 * swapping is enabled). So when swapping is enabled, we need to reverse
4597 	 * the configuration
4598 	 */
4599 
4600 	if (bp->link_params.multi_phy_config &
4601 	    PORT_HW_CFG_PHY_SWAPPED_ENABLED) {
4602 		if (sel_phy_idx == EXT_PHY1)
4603 			sel_phy_idx = EXT_PHY2;
4604 		else if (sel_phy_idx == EXT_PHY2)
4605 			sel_phy_idx = EXT_PHY1;
4606 	}
4607 	return LINK_CONFIG_IDX(sel_phy_idx);
4608 }
4609 
4610 #ifdef NETDEV_FCOE_WWNN
4611 int bnx2x_fcoe_get_wwn(struct net_device *dev, u64 *wwn, int type)
4612 {
4613 	struct bnx2x *bp = netdev_priv(dev);
4614 	struct cnic_eth_dev *cp = &bp->cnic_eth_dev;
4615 
4616 	switch (type) {
4617 	case NETDEV_FCOE_WWNN:
4618 		*wwn = HILO_U64(cp->fcoe_wwn_node_name_hi,
4619 				cp->fcoe_wwn_node_name_lo);
4620 		break;
4621 	case NETDEV_FCOE_WWPN:
4622 		*wwn = HILO_U64(cp->fcoe_wwn_port_name_hi,
4623 				cp->fcoe_wwn_port_name_lo);
4624 		break;
4625 	default:
4626 		BNX2X_ERR("Wrong WWN type requested - %d\n", type);
4627 		return -EINVAL;
4628 	}
4629 
4630 	return 0;
4631 }
4632 #endif
4633 
4634 /* called with rtnl_lock */
4635 int bnx2x_change_mtu(struct net_device *dev, int new_mtu)
4636 {
4637 	struct bnx2x *bp = netdev_priv(dev);
4638 
4639 	if (bp->recovery_state != BNX2X_RECOVERY_DONE) {
4640 		BNX2X_ERR("Can't perform change MTU during parity recovery\n");
4641 		return -EAGAIN;
4642 	}
4643 
4644 	if ((new_mtu > ETH_MAX_JUMBO_PACKET_SIZE) ||
4645 	    ((new_mtu + ETH_HLEN) < ETH_MIN_PACKET_SIZE)) {
4646 		BNX2X_ERR("Can't support requested MTU size\n");
4647 		return -EINVAL;
4648 	}
4649 
4650 	/* This does not race with packet allocation
4651 	 * because the actual alloc size is
4652 	 * only updated as part of load
4653 	 */
4654 	dev->mtu = new_mtu;
4655 
4656 	return bnx2x_reload_if_running(dev);
4657 }
4658 
4659 netdev_features_t bnx2x_fix_features(struct net_device *dev,
4660 				     netdev_features_t features)
4661 {
4662 	struct bnx2x *bp = netdev_priv(dev);
4663 
4664 	/* TPA requires Rx CSUM offloading */
4665 	if (!(features & NETIF_F_RXCSUM) || bp->disable_tpa) {
4666 		features &= ~NETIF_F_LRO;
4667 		features &= ~NETIF_F_GRO;
4668 	}
4669 
4670 	return features;
4671 }
4672 
4673 int bnx2x_set_features(struct net_device *dev, netdev_features_t features)
4674 {
4675 	struct bnx2x *bp = netdev_priv(dev);
4676 	u32 flags = bp->flags;
4677 	u32 changes;
4678 	bool bnx2x_reload = false;
4679 
4680 	if (features & NETIF_F_LRO)
4681 		flags |= TPA_ENABLE_FLAG;
4682 	else
4683 		flags &= ~TPA_ENABLE_FLAG;
4684 
4685 	if (features & NETIF_F_GRO)
4686 		flags |= GRO_ENABLE_FLAG;
4687 	else
4688 		flags &= ~GRO_ENABLE_FLAG;
4689 
4690 	if (features & NETIF_F_LOOPBACK) {
4691 		if (bp->link_params.loopback_mode != LOOPBACK_BMAC) {
4692 			bp->link_params.loopback_mode = LOOPBACK_BMAC;
4693 			bnx2x_reload = true;
4694 		}
4695 	} else {
4696 		if (bp->link_params.loopback_mode != LOOPBACK_NONE) {
4697 			bp->link_params.loopback_mode = LOOPBACK_NONE;
4698 			bnx2x_reload = true;
4699 		}
4700 	}
4701 
4702 	changes = flags ^ bp->flags;
4703 
4704 	/* if GRO is changed while LRO is enabled, don't force a reload */
4705 	if ((changes & GRO_ENABLE_FLAG) && (flags & TPA_ENABLE_FLAG))
4706 		changes &= ~GRO_ENABLE_FLAG;
4707 
4708 	if (changes)
4709 		bnx2x_reload = true;
4710 
4711 	bp->flags = flags;
4712 
4713 	if (bnx2x_reload) {
4714 		if (bp->recovery_state == BNX2X_RECOVERY_DONE)
4715 			return bnx2x_reload_if_running(dev);
4716 		/* else: bnx2x_nic_load() will be called at end of recovery */
4717 	}
4718 
4719 	return 0;
4720 }
4721 
4722 void bnx2x_tx_timeout(struct net_device *dev)
4723 {
4724 	struct bnx2x *bp = netdev_priv(dev);
4725 
4726 #ifdef BNX2X_STOP_ON_ERROR
4727 	if (!bp->panic)
4728 		bnx2x_panic();
4729 #endif
4730 
4731 	smp_mb__before_clear_bit();
4732 	set_bit(BNX2X_SP_RTNL_TX_TIMEOUT, &bp->sp_rtnl_state);
4733 	smp_mb__after_clear_bit();
4734 
	/* This allows the netif to be shut down gracefully before resetting */
4736 	schedule_delayed_work(&bp->sp_rtnl_task, 0);
4737 }
4738 
4739 int bnx2x_suspend(struct pci_dev *pdev, pm_message_t state)
4740 {
4741 	struct net_device *dev = pci_get_drvdata(pdev);
4742 	struct bnx2x *bp;
4743 
4744 	if (!dev) {
4745 		dev_err(&pdev->dev, "BAD net device from bnx2x_init_one\n");
4746 		return -ENODEV;
4747 	}
4748 	bp = netdev_priv(dev);
4749 
4750 	rtnl_lock();
4751 
4752 	pci_save_state(pdev);
4753 
4754 	if (!netif_running(dev)) {
4755 		rtnl_unlock();
4756 		return 0;
4757 	}
4758 
4759 	netif_device_detach(dev);
4760 
4761 	bnx2x_nic_unload(bp, UNLOAD_CLOSE, false);
4762 
4763 	bnx2x_set_power_state(bp, pci_choose_state(pdev, state));
4764 
4765 	rtnl_unlock();
4766 
4767 	return 0;
4768 }
4769 
4770 int bnx2x_resume(struct pci_dev *pdev)
4771 {
4772 	struct net_device *dev = pci_get_drvdata(pdev);
4773 	struct bnx2x *bp;
4774 	int rc;
4775 
4776 	if (!dev) {
4777 		dev_err(&pdev->dev, "BAD net device from bnx2x_init_one\n");
4778 		return -ENODEV;
4779 	}
4780 	bp = netdev_priv(dev);
4781 
4782 	if (bp->recovery_state != BNX2X_RECOVERY_DONE) {
4783 		BNX2X_ERR("Handling parity error recovery. Try again later\n");
4784 		return -EAGAIN;
4785 	}
4786 
4787 	rtnl_lock();
4788 
4789 	pci_restore_state(pdev);
4790 
4791 	if (!netif_running(dev)) {
4792 		rtnl_unlock();
4793 		return 0;
4794 	}
4795 
4796 	bnx2x_set_power_state(bp, PCI_D0);
4797 	netif_device_attach(dev);
4798 
4799 	rc = bnx2x_nic_load(bp, LOAD_OPEN);
4800 
4801 	rtnl_unlock();
4802 
4803 	return rc;
4804 }
4805 
4806 void bnx2x_set_ctx_validation(struct bnx2x *bp, struct eth_context *cxt,
4807 			      u32 cid)
4808 {
4809 	if (!cxt) {
4810 		BNX2X_ERR("bad context pointer %p\n", cxt);
4811 		return;
4812 	}
4813 
4814 	/* ustorm cxt validation */
4815 	cxt->ustorm_ag_context.cdu_usage =
4816 		CDU_RSRVD_VALUE_TYPE_A(HW_CID(bp, cid),
4817 			CDU_REGION_NUMBER_UCM_AG, ETH_CONNECTION_TYPE);
4818 	/* xcontext validation */
4819 	cxt->xstorm_ag_context.cdu_reserved =
4820 		CDU_RSRVD_VALUE_TYPE_A(HW_CID(bp, cid),
4821 			CDU_REGION_NUMBER_XCM_AG, ETH_CONNECTION_TYPE);
4822 }
4823 
4824 static void storm_memset_hc_timeout(struct bnx2x *bp, u8 port,
4825 				    u8 fw_sb_id, u8 sb_index,
4826 				    u8 ticks)
4827 {
4828 	u32 addr = BAR_CSTRORM_INTMEM +
4829 		   CSTORM_STATUS_BLOCK_DATA_TIMEOUT_OFFSET(fw_sb_id, sb_index);
4830 	REG_WR8(bp, addr, ticks);
4831 	DP(NETIF_MSG_IFUP,
4832 	   "port %x fw_sb_id %d sb_index %d ticks %d\n",
4833 	   port, fw_sb_id, sb_index, ticks);
4834 }
4835 
4836 static void storm_memset_hc_disable(struct bnx2x *bp, u8 port,
4837 				    u16 fw_sb_id, u8 sb_index,
4838 				    u8 disable)
4839 {
4840 	u32 enable_flag = disable ? 0 : (1 << HC_INDEX_DATA_HC_ENABLED_SHIFT);
4841 	u32 addr = BAR_CSTRORM_INTMEM +
4842 		   CSTORM_STATUS_BLOCK_DATA_FLAGS_OFFSET(fw_sb_id, sb_index);
4843 	u8 flags = REG_RD8(bp, addr);
4844 	/* clear and set */
4845 	flags &= ~HC_INDEX_DATA_HC_ENABLED;
4846 	flags |= enable_flag;
4847 	REG_WR8(bp, addr, flags);
4848 	DP(NETIF_MSG_IFUP,
4849 	   "port %x fw_sb_id %d sb_index %d disable %d\n",
4850 	   port, fw_sb_id, sb_index, disable);
4851 }
4852 
4853 void bnx2x_update_coalesce_sb_index(struct bnx2x *bp, u8 fw_sb_id,
4854 				    u8 sb_index, u8 disable, u16 usec)
4855 {
4856 	int port = BP_PORT(bp);
4857 	u8 ticks = usec / BNX2X_BTR;
4858 
4859 	storm_memset_hc_timeout(bp, port, fw_sb_id, sb_index, ticks);
4860 
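	/* a zero coalescing interval (usec == 0) also disables this index */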
4861 	disable = disable ? 1 : (usec ? 0 : 1);
4862 	storm_memset_hc_disable(bp, port, fw_sb_id, sb_index, disable);
4863 }
4864