drivers/net/ethernet/broadcom/bnx2x/bnx2x_cmn.c
1 /* bnx2x_cmn.c: Broadcom Everest network driver.
2  *
3  * Copyright (c) 2007-2013 Broadcom Corporation
4  *
5  * This program is free software; you can redistribute it and/or modify
6  * it under the terms of the GNU General Public License as published by
7  * the Free Software Foundation.
8  *
9  * Maintained by: Ariel Elior <ariel.elior@qlogic.com>
10  * Written by: Eliezer Tamir
11  * Based on code from Michael Chan's bnx2 driver
12  * UDP CSUM errata workaround by Arik Gendelman
13  * Slowpath and fastpath rework by Vladislav Zolotarov
14  * Statistics and Link management by Yitchak Gertner
15  *
16  */
17
18 #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
19
20 #include <linux/etherdevice.h>
21 #include <linux/if_vlan.h>
22 #include <linux/interrupt.h>
23 #include <linux/ip.h>
24 #include <net/tcp.h>
25 #include <net/ipv6.h>
26 #include <net/ip6_checksum.h>
27 #include <net/busy_poll.h>
28 #include <linux/prefetch.h>
29 #include "bnx2x_cmn.h"
30 #include "bnx2x_init.h"
31 #include "bnx2x_sp.h"
32
33 static void bnx2x_free_fp_mem_cnic(struct bnx2x *bp);
34 static int bnx2x_alloc_fp_mem_cnic(struct bnx2x *bp);
35 static int bnx2x_alloc_fp_mem(struct bnx2x *bp);
36 static int bnx2x_poll(struct napi_struct *napi, int budget);
37
38 static void bnx2x_add_all_napi_cnic(struct bnx2x *bp)
39 {
40         int i;
41
42         /* Add NAPI objects */
43         for_each_rx_queue_cnic(bp, i) {
44                 netif_napi_add(bp->dev, &bnx2x_fp(bp, i, napi),
45                                bnx2x_poll, NAPI_POLL_WEIGHT);
46                 napi_hash_add(&bnx2x_fp(bp, i, napi));
47         }
48 }
49
50 static void bnx2x_add_all_napi(struct bnx2x *bp)
51 {
52         int i;
53
54         /* Add NAPI objects */
55         for_each_eth_queue(bp, i) {
56                 netif_napi_add(bp->dev, &bnx2x_fp(bp, i, napi),
57                                bnx2x_poll, NAPI_POLL_WEIGHT);
58                 napi_hash_add(&bnx2x_fp(bp, i, napi));
59         }
60 }
61
62 static int bnx2x_calc_num_queues(struct bnx2x *bp)
63 {
64         int nq = bnx2x_num_queues ? : netif_get_num_default_rss_queues();
65
66         /* Reduce memory usage in kdump environment by using only one queue */
67         if (reset_devices)
68                 nq = 1;
69
70         nq = clamp(nq, 1, BNX2X_MAX_QUEUES(bp));
71         return nq;
72 }
73
74 /**
75  * bnx2x_move_fp - move content of the fastpath structure.
76  *
77  * @bp:         driver handle
78  * @from:       source FP index
79  * @to:         destination FP index
80  *
81  * Makes sure the contents of bp->fp[to].napi are kept
82  * intact. This is done by first copying the napi struct from
83  * the target to the source, and then memcpying the entire
84  * source onto the target. Txdata pointers and related
85  * content are updated as well.
86  */
87 static inline void bnx2x_move_fp(struct bnx2x *bp, int from, int to)
88 {
89         struct bnx2x_fastpath *from_fp = &bp->fp[from];
90         struct bnx2x_fastpath *to_fp = &bp->fp[to];
91         struct bnx2x_sp_objs *from_sp_objs = &bp->sp_objs[from];
92         struct bnx2x_sp_objs *to_sp_objs = &bp->sp_objs[to];
93         struct bnx2x_fp_stats *from_fp_stats = &bp->fp_stats[from];
94         struct bnx2x_fp_stats *to_fp_stats = &bp->fp_stats[to];
95         int old_max_eth_txqs, new_max_eth_txqs;
96         int old_txdata_index = 0, new_txdata_index = 0;
97         struct bnx2x_agg_info *old_tpa_info = to_fp->tpa_info;
98
99         /* Copy the NAPI object as it has been already initialized */
100         from_fp->napi = to_fp->napi;
101
102         /* Move bnx2x_fastpath contents */
103         memcpy(to_fp, from_fp, sizeof(*to_fp));
104         to_fp->index = to;
105
106         /* Retain the tpa_info of the original `to' version as we don't want
107          * 2 FPs to contain the same tpa_info pointer.
108          */
109         to_fp->tpa_info = old_tpa_info;
110
111         /* move sp_objs contents as well, as their indices match fp ones */
112         memcpy(to_sp_objs, from_sp_objs, sizeof(*to_sp_objs));
113
114         /* move fp_stats contents as well, as their indices match fp ones */
115         memcpy(to_fp_stats, from_fp_stats, sizeof(*to_fp_stats));
116
117         /* Update txdata pointers in fp and move txdata content accordingly:
118          * Each fp consumes 'max_cos' txdata structures, so the index should be
119          * decremented by max_cos x delta.
120          */
121
122         old_max_eth_txqs = BNX2X_NUM_ETH_QUEUES(bp) * (bp)->max_cos;
123         new_max_eth_txqs = (BNX2X_NUM_ETH_QUEUES(bp) - from + to) *
124                                 (bp)->max_cos;
125         if (from == FCOE_IDX(bp)) {
126                 old_txdata_index = old_max_eth_txqs + FCOE_TXQ_IDX_OFFSET;
127                 new_txdata_index = new_max_eth_txqs + FCOE_TXQ_IDX_OFFSET;
128         }
129
130         memcpy(&bp->bnx2x_txq[new_txdata_index],
131                &bp->bnx2x_txq[old_txdata_index],
132                sizeof(struct bnx2x_fp_txdata));
133         to_fp->txdata_ptr[0] = &bp->bnx2x_txq[new_txdata_index];
134 }
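/* Illustrative sketch (hypothetical types, not part of the driver): the
 * "preserve one already-initialized field across a struct move" pattern
 * that bnx2x_move_fp() applies to the NAPI object, reduced to its core.
 */
#if 0	/* sketch only, never compiled */
struct demo_fp {
	int index;
	void *napi;		/* stands in for struct napi_struct */
	char other_state[64];
};

static void demo_move_fp(struct demo_fp *fp, int from, int to)
{
	/* keep the destination's live NAPI context... */
	fp[from].napi = fp[to].napi;
	/* ...then move everything else in one memcpy */
	memcpy(&fp[to], &fp[from], sizeof(fp[to]));
	fp[to].index = to;
}
#endif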
135
136 /**
137  * bnx2x_fill_fw_str - Fill buffer with FW version string.
138  *
139  * @bp:        driver handle
140  * @buf:       character buffer to fill with the fw name
141  * @buf_len:   length of the above buffer
142  *
143  */
144 void bnx2x_fill_fw_str(struct bnx2x *bp, char *buf, size_t buf_len)
145 {
146         if (IS_PF(bp)) {
147                 u8 phy_fw_ver[PHY_FW_VER_LEN];
148
149                 phy_fw_ver[0] = '\0';
150                 bnx2x_get_ext_phy_fw_version(&bp->link_params,
151                                              phy_fw_ver, PHY_FW_VER_LEN);
152                 strlcpy(buf, bp->fw_ver, buf_len);
153                 snprintf(buf + strlen(bp->fw_ver), 32 - strlen(bp->fw_ver),
154                          "bc %d.%d.%d%s%s",
155                          (bp->common.bc_ver & 0xff0000) >> 16,
156                          (bp->common.bc_ver & 0xff00) >> 8,
157                          (bp->common.bc_ver & 0xff),
158                          ((phy_fw_ver[0] != '\0') ? " phy " : ""), phy_fw_ver);
159         } else {
160                 bnx2x_vf_fill_fw_str(bp, buf, buf_len);
161         }
162 }
163
164 /**
165  * bnx2x_shrink_eth_fp - guarantees fastpath structures stay intact
166  *
167  * @bp: driver handle
168  * @delta:      number of eth queues which were not allocated
169  */
170 static void bnx2x_shrink_eth_fp(struct bnx2x *bp, int delta)
171 {
172         int i, cos, old_eth_num = BNX2X_NUM_ETH_QUEUES(bp);
173
174         /* Queue pointers cannot be re-set on a per-fp basis, as moving a pointer
175          * backward along the array could cause memory to be overwritten
176          */
177         for (cos = 1; cos < bp->max_cos; cos++) {
178                 for (i = 0; i < old_eth_num - delta; i++) {
179                         struct bnx2x_fastpath *fp = &bp->fp[i];
180                         int new_idx = cos * (old_eth_num - delta) + i;
181
182                         memcpy(&bp->bnx2x_txq[new_idx], fp->txdata_ptr[cos],
183                                sizeof(struct bnx2x_fp_txdata));
184                         fp->txdata_ptr[cos] = &bp->bnx2x_txq[new_idx];
185                 }
186         }
187 }
188
189 int bnx2x_load_count[2][3] = { {0} }; /* per-path: 0-common, 1-port0, 2-port1 */
190
191 /* free skb in the packet ring at pos idx
192  * return idx of last bd freed
193  */
194 static u16 bnx2x_free_tx_pkt(struct bnx2x *bp, struct bnx2x_fp_txdata *txdata,
195                              u16 idx, unsigned int *pkts_compl,
196                              unsigned int *bytes_compl)
197 {
198         struct sw_tx_bd *tx_buf = &txdata->tx_buf_ring[idx];
199         struct eth_tx_start_bd *tx_start_bd;
200         struct eth_tx_bd *tx_data_bd;
201         struct sk_buff *skb = tx_buf->skb;
202         u16 bd_idx = TX_BD(tx_buf->first_bd), new_cons;
203         int nbd;
204         u16 split_bd_len = 0;
205
206         /* prefetch skb end pointer to speedup dev_kfree_skb() */
207         prefetch(&skb->end);
208
209         DP(NETIF_MSG_TX_DONE, "fp[%d]: pkt_idx %d  buff @(%p)->skb %p\n",
210            txdata->txq_index, idx, tx_buf, skb);
211
212         tx_start_bd = &txdata->tx_desc_ring[bd_idx].start_bd;
213
214         nbd = le16_to_cpu(tx_start_bd->nbd) - 1;
215 #ifdef BNX2X_STOP_ON_ERROR
216         if ((nbd - 1) > (MAX_SKB_FRAGS + 2)) {
217                 BNX2X_ERR("BAD nbd!\n");
218                 bnx2x_panic();
219         }
220 #endif
221         new_cons = nbd + tx_buf->first_bd;
222
223         /* Get the next bd */
224         bd_idx = TX_BD(NEXT_TX_IDX(bd_idx));
225
226         /* Skip a parse bd... */
227         --nbd;
228         bd_idx = TX_BD(NEXT_TX_IDX(bd_idx));
229
230         if (tx_buf->flags & BNX2X_HAS_SECOND_PBD) {
231                 /* Skip second parse bd... */
232                 --nbd;
233                 bd_idx = TX_BD(NEXT_TX_IDX(bd_idx));
234         }
235
236         /* TSO headers+data bds share a common mapping. See bnx2x_tx_split() */
237         if (tx_buf->flags & BNX2X_TSO_SPLIT_BD) {
238                 tx_data_bd = &txdata->tx_desc_ring[bd_idx].reg_bd;
239                 split_bd_len = BD_UNMAP_LEN(tx_data_bd);
240                 --nbd;
241                 bd_idx = TX_BD(NEXT_TX_IDX(bd_idx));
242         }
243
244         /* unmap first bd */
245         dma_unmap_single(&bp->pdev->dev, BD_UNMAP_ADDR(tx_start_bd),
246                          BD_UNMAP_LEN(tx_start_bd) + split_bd_len,
247                          DMA_TO_DEVICE);
248
249         /* now free frags */
250         while (nbd > 0) {
251
252                 tx_data_bd = &txdata->tx_desc_ring[bd_idx].reg_bd;
253                 dma_unmap_page(&bp->pdev->dev, BD_UNMAP_ADDR(tx_data_bd),
254                                BD_UNMAP_LEN(tx_data_bd), DMA_TO_DEVICE);
255                 if (--nbd)
256                         bd_idx = TX_BD(NEXT_TX_IDX(bd_idx));
257         }
258
259         /* release skb */
260         WARN_ON(!skb);
261         if (likely(skb)) {
262                 (*pkts_compl)++;
263                 (*bytes_compl) += skb->len;
264         }
265
266         dev_kfree_skb_any(skb);
267         tx_buf->first_bd = 0;
268         tx_buf->skb = NULL;
269
270         return new_cons;
271 }
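/* Rough shape of the BD chain freed above for a typical TSO packet, as
 * implied by the walk in bnx2x_free_tx_pkt() (exact layout depends on
 * the firmware interface):
 *
 *   start BD -> parse BD [-> 2nd parse BD] [-> TSO split header BD]
 *            -> frag BD -> ... -> frag BD
 *
 * The start BD and the optional TSO split BD share one DMA mapping and
 * are unmapped together; parse BDs carry no mapping and are merely
 * skipped; each remaining frag BD is unmapped individually.
 */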
272
273 int bnx2x_tx_int(struct bnx2x *bp, struct bnx2x_fp_txdata *txdata)
274 {
275         struct netdev_queue *txq;
276         u16 hw_cons, sw_cons, bd_cons = txdata->tx_bd_cons;
277         unsigned int pkts_compl = 0, bytes_compl = 0;
278
279 #ifdef BNX2X_STOP_ON_ERROR
280         if (unlikely(bp->panic))
281                 return -1;
282 #endif
283
284         txq = netdev_get_tx_queue(bp->dev, txdata->txq_index);
285         hw_cons = le16_to_cpu(*txdata->tx_cons_sb);
286         sw_cons = txdata->tx_pkt_cons;
287
288         while (sw_cons != hw_cons) {
289                 u16 pkt_cons;
290
291                 pkt_cons = TX_BD(sw_cons);
292
293                 DP(NETIF_MSG_TX_DONE,
294                    "queue[%d]: hw_cons %u  sw_cons %u  pkt_cons %u\n",
295                    txdata->txq_index, hw_cons, sw_cons, pkt_cons);
296
297                 bd_cons = bnx2x_free_tx_pkt(bp, txdata, pkt_cons,
298                                             &pkts_compl, &bytes_compl);
299
300                 sw_cons++;
301         }
302
303         netdev_tx_completed_queue(txq, pkts_compl, bytes_compl);
304
305         txdata->tx_pkt_cons = sw_cons;
306         txdata->tx_bd_cons = bd_cons;
307
308         /* Need to make the tx_bd_cons update visible to start_xmit()
309          * before checking for netif_tx_queue_stopped().  Without the
310          * memory barrier, there is a small possibility that
311          * start_xmit() will miss it and cause the queue to be stopped
312          * forever.
313          * On the other hand we need an rmb() here to ensure the proper
314          * ordering of bit testing in the following
315          * netif_tx_queue_stopped(txq) call.
316          */
317         smp_mb();
318
319         if (unlikely(netif_tx_queue_stopped(txq))) {
320                 /* Taking tx_lock() is needed to prevent re-enabling the queue
321                  * while it's empty. This could happen if rx_action() gets
322                  * suspended in bnx2x_tx_int() after the condition before
323                  * netif_tx_wake_queue(), while tx_action (bnx2x_start_xmit()):
324                  *
325                  * stops the queue->sees fresh tx_bd_cons->releases the queue->
326                  * sends some packets consuming the whole queue again->
327                  * stops the queue
328                  */
329
330                 __netif_tx_lock(txq, smp_processor_id());
331
332                 if ((netif_tx_queue_stopped(txq)) &&
333                     (bp->state == BNX2X_STATE_OPEN) &&
334                     (bnx2x_tx_avail(bp, txdata) >= MAX_DESC_PER_TX_PKT))
335                         netif_tx_wake_queue(txq);
336
337                 __netif_tx_unlock(txq);
338         }
339         return 0;
340 }
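/* The smp_mb() in bnx2x_tx_int() above is one half of the usual netdev
 * stop/wake pairing.  A simplified sketch of the pattern (not the exact
 * driver code):
 *
 *   xmit path                          completion path
 *   --------------------------         --------------------------
 *   post descriptors                   advance tx_bd_cons
 *   if (ring almost full)              smp_mb();
 *           netif_tx_stop_queue();     if (netif_tx_queue_stopped() &&
 *   smp_mb();                              enough ring space)
 *   if (ring space freed up)                   netif_tx_wake_queue();
 *           netif_tx_wake_queue();
 *
 * Each side re-checks the other side's state after its barrier, so a
 * queue stopped just before the completion ran cannot stay stopped
 * forever.
 */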
341
342 static inline void bnx2x_update_last_max_sge(struct bnx2x_fastpath *fp,
343                                              u16 idx)
344 {
345         u16 last_max = fp->last_max_sge;
346
347         if (SUB_S16(idx, last_max) > 0)
348                 fp->last_max_sge = idx;
349 }
350
351 static inline void bnx2x_update_sge_prod(struct bnx2x_fastpath *fp,
352                                          u16 sge_len,
353                                          struct eth_end_agg_rx_cqe *cqe)
354 {
355         struct bnx2x *bp = fp->bp;
356         u16 last_max, last_elem, first_elem;
357         u16 delta = 0;
358         u16 i;
359
360         if (!sge_len)
361                 return;
362
363         /* First mark all used pages */
364         for (i = 0; i < sge_len; i++)
365                 BIT_VEC64_CLEAR_BIT(fp->sge_mask,
366                         RX_SGE(le16_to_cpu(cqe->sgl_or_raw_data.sgl[i])));
367
368         DP(NETIF_MSG_RX_STATUS, "fp_cqe->sgl[%d] = %d\n",
369            sge_len - 1, le16_to_cpu(cqe->sgl_or_raw_data.sgl[sge_len - 1]));
370
371         /* Here we assume that the last SGE index is the biggest */
372         prefetch((void *)(fp->sge_mask));
373         bnx2x_update_last_max_sge(fp,
374                 le16_to_cpu(cqe->sgl_or_raw_data.sgl[sge_len - 1]));
375
376         last_max = RX_SGE(fp->last_max_sge);
377         last_elem = last_max >> BIT_VEC64_ELEM_SHIFT;
378         first_elem = RX_SGE(fp->rx_sge_prod) >> BIT_VEC64_ELEM_SHIFT;
379
380         /* If ring is not full */
381         if (last_elem + 1 != first_elem)
382                 last_elem++;
383
384         /* Now update the prod */
385         for (i = first_elem; i != last_elem; i = NEXT_SGE_MASK_ELEM(i)) {
386                 if (likely(fp->sge_mask[i]))
387                         break;
388
389                 fp->sge_mask[i] = BIT_VEC64_ELEM_ONE_MASK;
390                 delta += BIT_VEC64_ELEM_SZ;
391         }
392
393         if (delta > 0) {
394                 fp->rx_sge_prod += delta;
395                 /* clear page-end entries */
396                 bnx2x_clear_sge_mask_next_elems(fp);
397         }
398
399         DP(NETIF_MSG_RX_STATUS,
400            "fp->last_max_sge = %d  fp->rx_sge_prod = %d\n",
401            fp->last_max_sge, fp->rx_sge_prod);
402 }
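/* Worked example for the reclaim loop above, assuming
 * BIT_VEC64_ELEM_SZ == 64: SGE mask bits are cleared as the firmware
 * consumes pages, and once every bit of a 64-entry mask element is
 * cleared the element is refilled with ones and rx_sge_prod advances by
 * 64.  If the two elements starting at first_elem are fully cleared and
 * the third still has bits set, delta becomes 128 and the producer jumps
 * ahead by two full mask elements in a single call.
 */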
403
404 /* Get Toeplitz hash value in the skb using the value from the
405  * CQE (calculated by HW).
406  */
407 static u32 bnx2x_get_rxhash(const struct bnx2x *bp,
408                             const struct eth_fast_path_rx_cqe *cqe,
409                             enum pkt_hash_types *rxhash_type)
410 {
411         /* Get Toeplitz hash from CQE */
412         if ((bp->dev->features & NETIF_F_RXHASH) &&
413             (cqe->status_flags & ETH_FAST_PATH_RX_CQE_RSS_HASH_FLG)) {
414                 enum eth_rss_hash_type htype;
415
416                 htype = cqe->status_flags & ETH_FAST_PATH_RX_CQE_RSS_HASH_TYPE;
417                 *rxhash_type = ((htype == TCP_IPV4_HASH_TYPE) ||
418                                 (htype == TCP_IPV6_HASH_TYPE)) ?
419                                PKT_HASH_TYPE_L4 : PKT_HASH_TYPE_L3;
420
421                 return le32_to_cpu(cqe->rss_hash_result);
422         }
423         *rxhash_type = PKT_HASH_TYPE_NONE;
424         return 0;
425 }
426
427 static void bnx2x_tpa_start(struct bnx2x_fastpath *fp, u16 queue,
428                             u16 cons, u16 prod,
429                             struct eth_fast_path_rx_cqe *cqe)
430 {
431         struct bnx2x *bp = fp->bp;
432         struct sw_rx_bd *cons_rx_buf = &fp->rx_buf_ring[cons];
433         struct sw_rx_bd *prod_rx_buf = &fp->rx_buf_ring[prod];
434         struct eth_rx_bd *prod_bd = &fp->rx_desc_ring[prod];
435         dma_addr_t mapping;
436         struct bnx2x_agg_info *tpa_info = &fp->tpa_info[queue];
437         struct sw_rx_bd *first_buf = &tpa_info->first_buf;
438
439         /* print error if current state != stop */
440         if (tpa_info->tpa_state != BNX2X_TPA_STOP)
441                 BNX2X_ERR("start of bin not in stop [%d]\n", queue);
442
443         /* Try to map an empty data buffer from the aggregation info  */
444         mapping = dma_map_single(&bp->pdev->dev,
445                                  first_buf->data + NET_SKB_PAD,
446                                  fp->rx_buf_size, DMA_FROM_DEVICE);
447         /*
448          *  ...if it fails - move the skb from the consumer to the producer
449          *  and set the current aggregation state as ERROR to drop it
450          *  when TPA_STOP arrives.
451          */
452
453         if (unlikely(dma_mapping_error(&bp->pdev->dev, mapping))) {
454                 /* Move the BD from the consumer to the producer */
455                 bnx2x_reuse_rx_data(fp, cons, prod);
456                 tpa_info->tpa_state = BNX2X_TPA_ERROR;
457                 return;
458         }
459
460         /* move empty data from pool to prod */
461         prod_rx_buf->data = first_buf->data;
462         dma_unmap_addr_set(prod_rx_buf, mapping, mapping);
463         /* point prod_bd to new data */
464         prod_bd->addr_hi = cpu_to_le32(U64_HI(mapping));
465         prod_bd->addr_lo = cpu_to_le32(U64_LO(mapping));
466
467         /* move partial skb from cons to pool (don't unmap yet) */
468         *first_buf = *cons_rx_buf;
469
470         /* mark bin state as START */
471         tpa_info->parsing_flags =
472                 le16_to_cpu(cqe->pars_flags.flags);
473         tpa_info->vlan_tag = le16_to_cpu(cqe->vlan_tag);
474         tpa_info->tpa_state = BNX2X_TPA_START;
475         tpa_info->len_on_bd = le16_to_cpu(cqe->len_on_bd);
476         tpa_info->placement_offset = cqe->placement_offset;
477         tpa_info->rxhash = bnx2x_get_rxhash(bp, cqe, &tpa_info->rxhash_type);
478         if (fp->mode == TPA_MODE_GRO) {
479                 u16 gro_size = le16_to_cpu(cqe->pkt_len_or_gro_seg_len);
480                 tpa_info->full_page = SGE_PAGES / gro_size * gro_size;
481                 tpa_info->gro_size = gro_size;
482         }
483
484 #ifdef BNX2X_STOP_ON_ERROR
485         fp->tpa_queue_used |= (1 << queue);
486 #ifdef _ASM_GENERIC_INT_L64_H
487         DP(NETIF_MSG_RX_STATUS, "fp->tpa_queue_used = 0x%lx\n",
488 #else
489         DP(NETIF_MSG_RX_STATUS, "fp->tpa_queue_used = 0x%llx\n",
490 #endif
491            fp->tpa_queue_used);
492 #endif
493 }
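/* Per-queue TPA state transitions implied by the code above and by
 * bnx2x_tpa_stop() below (simplified):
 *
 *   BNX2X_TPA_STOP  --(TPA_START CQE)---------------------> BNX2X_TPA_START
 *   BNX2X_TPA_START --(TPA_STOP CQE)----------------------> BNX2X_TPA_STOP
 *   BNX2X_TPA_STOP  --(DMA mapping failure on start)------> BNX2X_TPA_ERROR
 *   BNX2X_TPA_ERROR --(TPA_STOP CQE, aggregation dropped)-> BNX2X_TPA_STOP
 *
 * A TPA_START on a bin that is not in BNX2X_TPA_STOP only logs an error.
 */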
494
495 /* Timestamp option length allowed for TPA aggregation:
496  *
497  *              nop nop kind length echo val
498  */
499 #define TPA_TSTAMP_OPT_LEN      12
500 /**
501  * bnx2x_set_gro_params - compute GRO values
502  *
503  * @skb:                packet skb
504  * @parsing_flags:      parsing flags from the START CQE
505  * @len_on_bd:          total length of the first packet for the
506  *                      aggregation.
507  * @pkt_len:            length of all segments
508  *
509  * Computes an approximate MSS for this aggregation from its first
510  * packet, and sets the number of aggregated segments and the
511  * gso_type accordingly.
512  */
513 static void bnx2x_set_gro_params(struct sk_buff *skb, u16 parsing_flags,
514                                  u16 len_on_bd, unsigned int pkt_len,
515                                  u16 num_of_coalesced_segs)
516 {
517         /* TPA aggregation won't have either IP options or TCP options
518          * other than timestamp or IPv6 extension headers.
519          */
520         u16 hdrs_len = ETH_HLEN + sizeof(struct tcphdr);
521
522         if (GET_FLAG(parsing_flags, PARSING_FLAGS_OVER_ETHERNET_PROTOCOL) ==
523             PRS_FLAG_OVERETH_IPV6) {
524                 hdrs_len += sizeof(struct ipv6hdr);
525                 skb_shinfo(skb)->gso_type = SKB_GSO_TCPV6;
526         } else {
527                 hdrs_len += sizeof(struct iphdr);
528                 skb_shinfo(skb)->gso_type = SKB_GSO_TCPV4;
529         }
530
531         /* Check if there was a TCP timestamp; if there was, it will
532          * always be 12 bytes long: nop nop kind length echo val.
533          *
534          * Otherwise FW would close the aggregation.
535          */
536         if (parsing_flags & PARSING_FLAGS_TIME_STAMP_EXIST_FLAG)
537                 hdrs_len += TPA_TSTAMP_OPT_LEN;
538
539         skb_shinfo(skb)->gso_size = len_on_bd - hdrs_len;
540
541         /* tcp_gro_complete() will copy NAPI_GRO_CB(skb)->count
542          * to skb_shinfo(skb)->gso_segs
543          */
544         NAPI_GRO_CB(skb)->count = num_of_coalesced_segs;
545 }
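/* Worked example for the gso_size computation above, assuming a plain
 * IPv4/TCP aggregation: hdrs_len = ETH_HLEN (14) + sizeof(struct iphdr)
 * (20) + sizeof(struct tcphdr) (20) = 54, so a first packet with
 * len_on_bd = 1514 yields gso_size = 1514 - 54 = 1460, the usual MSS for
 * a 1500-byte MTU.  With a TCP timestamp the extra 12 bytes bring
 * hdrs_len to 66 and gso_size to 1448.
 */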
546
547 static int bnx2x_alloc_rx_sge(struct bnx2x *bp, struct bnx2x_fastpath *fp,
548                               u16 index, gfp_t gfp_mask)
549 {
550         struct page *page = alloc_pages(gfp_mask, PAGES_PER_SGE_SHIFT);
551         struct sw_rx_page *sw_buf = &fp->rx_page_ring[index];
552         struct eth_rx_sge *sge = &fp->rx_sge_ring[index];
553         dma_addr_t mapping;
554
555         if (unlikely(page == NULL)) {
556                 BNX2X_ERR("Can't alloc sge\n");
557                 return -ENOMEM;
558         }
559
560         mapping = dma_map_page(&bp->pdev->dev, page, 0,
561                                SGE_PAGES, DMA_FROM_DEVICE);
562         if (unlikely(dma_mapping_error(&bp->pdev->dev, mapping))) {
563                 __free_pages(page, PAGES_PER_SGE_SHIFT);
564                 BNX2X_ERR("Can't map sge\n");
565                 return -ENOMEM;
566         }
567
568         sw_buf->page = page;
569         dma_unmap_addr_set(sw_buf, mapping, mapping);
570
571         sge->addr_hi = cpu_to_le32(U64_HI(mapping));
572         sge->addr_lo = cpu_to_le32(U64_LO(mapping));
573
574         return 0;
575 }
576
577 static int bnx2x_fill_frag_skb(struct bnx2x *bp, struct bnx2x_fastpath *fp,
578                                struct bnx2x_agg_info *tpa_info,
579                                u16 pages,
580                                struct sk_buff *skb,
581                                struct eth_end_agg_rx_cqe *cqe,
582                                u16 cqe_idx)
583 {
584         struct sw_rx_page *rx_pg, old_rx_pg;
585         u32 i, frag_len, frag_size;
586         int err, j, frag_id = 0;
587         u16 len_on_bd = tpa_info->len_on_bd;
588         u16 full_page = 0, gro_size = 0;
589
590         frag_size = le16_to_cpu(cqe->pkt_len) - len_on_bd;
591
592         if (fp->mode == TPA_MODE_GRO) {
593                 gro_size = tpa_info->gro_size;
594                 full_page = tpa_info->full_page;
595         }
596
597         /* This is needed in order to enable forwarding support */
598         if (frag_size)
599                 bnx2x_set_gro_params(skb, tpa_info->parsing_flags, len_on_bd,
600                                      le16_to_cpu(cqe->pkt_len),
601                                      le16_to_cpu(cqe->num_of_coalesced_segs));
602
603 #ifdef BNX2X_STOP_ON_ERROR
604         if (pages > min_t(u32, 8, MAX_SKB_FRAGS) * SGE_PAGES) {
605                 BNX2X_ERR("SGL length is too long: %d. CQE index is %d\n",
606                           pages, cqe_idx);
607                 BNX2X_ERR("cqe->pkt_len = %d\n", cqe->pkt_len);
608                 bnx2x_panic();
609                 return -EINVAL;
610         }
611 #endif
612
613         /* Run through the SGL and compose the fragmented skb */
614         for (i = 0, j = 0; i < pages; i += PAGES_PER_SGE, j++) {
615                 u16 sge_idx = RX_SGE(le16_to_cpu(cqe->sgl_or_raw_data.sgl[j]));
616
617                 /* FW gives the indices of the SGE as if the ring is an array
618                    (meaning that "next" element will consume 2 indices) */
619                 if (fp->mode == TPA_MODE_GRO)
620                         frag_len = min_t(u32, frag_size, (u32)full_page);
621                 else /* LRO */
622                         frag_len = min_t(u32, frag_size, (u32)SGE_PAGES);
623
624                 rx_pg = &fp->rx_page_ring[sge_idx];
625                 old_rx_pg = *rx_pg;
626
627                 /* If we fail to allocate a substitute page, we simply stop
628                    where we are and drop the whole packet */
629                 err = bnx2x_alloc_rx_sge(bp, fp, sge_idx, GFP_ATOMIC);
630                 if (unlikely(err)) {
631                         bnx2x_fp_qstats(bp, fp)->rx_skb_alloc_failed++;
632                         return err;
633                 }
634
635                 /* Unmap the page as we're going to pass it to the stack */
636                 dma_unmap_page(&bp->pdev->dev,
637                                dma_unmap_addr(&old_rx_pg, mapping),
638                                SGE_PAGES, DMA_FROM_DEVICE);
639                 /* Add one frag and update the appropriate fields in the skb */
640                 if (fp->mode == TPA_MODE_LRO)
641                         skb_fill_page_desc(skb, j, old_rx_pg.page, 0, frag_len);
642                 else { /* GRO */
643                         int rem;
644                         int offset = 0;
645                         for (rem = frag_len; rem > 0; rem -= gro_size) {
646                                 int len = rem > gro_size ? gro_size : rem;
647                                 skb_fill_page_desc(skb, frag_id++,
648                                                    old_rx_pg.page, offset, len);
649                                 if (offset)
650                                         get_page(old_rx_pg.page);
651                                 offset += len;
652                         }
653                 }
654
655                 skb->data_len += frag_len;
656                 skb->truesize += SGE_PAGES;
657                 skb->len += frag_len;
658
659                 frag_size -= frag_len;
660         }
661
662         return 0;
663 }
664
665 static void bnx2x_frag_free(const struct bnx2x_fastpath *fp, void *data)
666 {
667         if (fp->rx_frag_size)
668                 put_page(virt_to_head_page(data));
669         else
670                 kfree(data);
671 }
672
673 static void *bnx2x_frag_alloc(const struct bnx2x_fastpath *fp, gfp_t gfp_mask)
674 {
675         if (fp->rx_frag_size) {
676                 /* GFP_KERNEL allocations are used only during initialization */
677                 if (unlikely(gfp_mask & __GFP_WAIT))
678                         return (void *)__get_free_page(gfp_mask);
679
680                 return netdev_alloc_frag(fp->rx_frag_size);
681         }
682
683         return kmalloc(fp->rx_buf_size + NET_SKB_PAD, gfp_mask);
684 }
685
686 #ifdef CONFIG_INET
687 static void bnx2x_gro_ip_csum(struct bnx2x *bp, struct sk_buff *skb)
688 {
689         const struct iphdr *iph = ip_hdr(skb);
690         struct tcphdr *th;
691
692         skb_set_transport_header(skb, sizeof(struct iphdr));
693         th = tcp_hdr(skb);
694
695         th->check = ~tcp_v4_check(skb->len - skb_transport_offset(skb),
696                                   iph->saddr, iph->daddr, 0);
697 }
698
699 static void bnx2x_gro_ipv6_csum(struct bnx2x *bp, struct sk_buff *skb)
700 {
701         struct ipv6hdr *iph = ipv6_hdr(skb);
702         struct tcphdr *th;
703
704         skb_set_transport_header(skb, sizeof(struct ipv6hdr));
705         th = tcp_hdr(skb);
706
707         th->check = ~tcp_v6_check(skb->len - skb_transport_offset(skb),
708                                   &iph->saddr, &iph->daddr, 0);
709 }
710
711 static void bnx2x_gro_csum(struct bnx2x *bp, struct sk_buff *skb,
712                             void (*gro_func)(struct bnx2x*, struct sk_buff*))
713 {
714         skb_set_network_header(skb, 0);
715         gro_func(bp, skb);
716         tcp_gro_complete(skb);
717 }
718 #endif
719
720 static void bnx2x_gro_receive(struct bnx2x *bp, struct bnx2x_fastpath *fp,
721                                struct sk_buff *skb)
722 {
723 #ifdef CONFIG_INET
724         if (skb_shinfo(skb)->gso_size) {
725                 switch (be16_to_cpu(skb->protocol)) {
726                 case ETH_P_IP:
727                         bnx2x_gro_csum(bp, skb, bnx2x_gro_ip_csum);
728                         break;
729                 case ETH_P_IPV6:
730                         bnx2x_gro_csum(bp, skb, bnx2x_gro_ipv6_csum);
731                         break;
732                 default:
733                         BNX2X_ERR("Error: FW GRO supports only IPv4/IPv6, not 0x%04x\n",
734                                   be16_to_cpu(skb->protocol));
735                 }
736         }
737 #endif
738         skb_record_rx_queue(skb, fp->rx_queue);
739         napi_gro_receive(&fp->napi, skb);
740 }
741
742 static void bnx2x_tpa_stop(struct bnx2x *bp, struct bnx2x_fastpath *fp,
743                            struct bnx2x_agg_info *tpa_info,
744                            u16 pages,
745                            struct eth_end_agg_rx_cqe *cqe,
746                            u16 cqe_idx)
747 {
748         struct sw_rx_bd *rx_buf = &tpa_info->first_buf;
749         u8 pad = tpa_info->placement_offset;
750         u16 len = tpa_info->len_on_bd;
751         struct sk_buff *skb = NULL;
752         u8 *new_data, *data = rx_buf->data;
753         u8 old_tpa_state = tpa_info->tpa_state;
754
755         tpa_info->tpa_state = BNX2X_TPA_STOP;
756
757         /* If there was an error during the handling of the TPA_START -
758          * drop this aggregation.
759          */
760         if (old_tpa_state == BNX2X_TPA_ERROR)
761                 goto drop;
762
763         /* Try to allocate the new data */
764         new_data = bnx2x_frag_alloc(fp, GFP_ATOMIC);
765         /* Unmap skb in the pool anyway, as we are going to change
766            pool entry status to BNX2X_TPA_STOP even if new skb allocation
767            fails. */
768         dma_unmap_single(&bp->pdev->dev, dma_unmap_addr(rx_buf, mapping),
769                          fp->rx_buf_size, DMA_FROM_DEVICE);
770         if (likely(new_data))
771                 skb = build_skb(data, fp->rx_frag_size);
772
773         if (likely(skb)) {
774 #ifdef BNX2X_STOP_ON_ERROR
775                 if (pad + len > fp->rx_buf_size) {
776                         BNX2X_ERR("skb_put is about to fail...  pad %d  len %d  rx_buf_size %d\n",
777                                   pad, len, fp->rx_buf_size);
778                         bnx2x_panic();
779                         return;
780                 }
781 #endif
782
783                 skb_reserve(skb, pad + NET_SKB_PAD);
784                 skb_put(skb, len);
785                 skb_set_hash(skb, tpa_info->rxhash, tpa_info->rxhash_type);
786
787                 skb->protocol = eth_type_trans(skb, bp->dev);
788                 skb->ip_summed = CHECKSUM_UNNECESSARY;
789
790                 if (!bnx2x_fill_frag_skb(bp, fp, tpa_info, pages,
791                                          skb, cqe, cqe_idx)) {
792                         if (tpa_info->parsing_flags & PARSING_FLAGS_VLAN)
793                                 __vlan_hwaccel_put_tag(skb, htons(ETH_P_8021Q), tpa_info->vlan_tag);
794                         bnx2x_gro_receive(bp, fp, skb);
795                 } else {
796                         DP(NETIF_MSG_RX_STATUS,
797                            "Failed to allocate new pages - dropping packet!\n");
798                         dev_kfree_skb_any(skb);
799                 }
800
801                 /* put new data in bin */
802                 rx_buf->data = new_data;
803
804                 return;
805         }
806         if (new_data)
807                 bnx2x_frag_free(fp, new_data);
808 drop:
809         /* drop the packet and keep the buffer in the bin */
810         DP(NETIF_MSG_RX_STATUS,
811            "Failed to allocate or map a new skb - dropping packet!\n");
812         bnx2x_fp_stats(bp, fp)->eth_q_stats.rx_skb_alloc_failed++;
813 }
814
815 static int bnx2x_alloc_rx_data(struct bnx2x *bp, struct bnx2x_fastpath *fp,
816                                u16 index, gfp_t gfp_mask)
817 {
818         u8 *data;
819         struct sw_rx_bd *rx_buf = &fp->rx_buf_ring[index];
820         struct eth_rx_bd *rx_bd = &fp->rx_desc_ring[index];
821         dma_addr_t mapping;
822
823         data = bnx2x_frag_alloc(fp, gfp_mask);
824         if (unlikely(data == NULL))
825                 return -ENOMEM;
826
827         mapping = dma_map_single(&bp->pdev->dev, data + NET_SKB_PAD,
828                                  fp->rx_buf_size,
829                                  DMA_FROM_DEVICE);
830         if (unlikely(dma_mapping_error(&bp->pdev->dev, mapping))) {
831                 bnx2x_frag_free(fp, data);
832                 BNX2X_ERR("Can't map rx data\n");
833                 return -ENOMEM;
834         }
835
836         rx_buf->data = data;
837         dma_unmap_addr_set(rx_buf, mapping, mapping);
838
839         rx_bd->addr_hi = cpu_to_le32(U64_HI(mapping));
840         rx_bd->addr_lo = cpu_to_le32(U64_LO(mapping));
841
842         return 0;
843 }
844
845 static
846 void bnx2x_csum_validate(struct sk_buff *skb, union eth_rx_cqe *cqe,
847                                  struct bnx2x_fastpath *fp,
848                                  struct bnx2x_eth_q_stats *qstats)
849 {
850         /* Do nothing if no L4 csum validation was done.
851          * We do not check whether IP csum was validated. For IPv4 we assume
852          * that if the card got as far as validating the L4 csum, it also
853          * validated the IP csum. IPv6 has no IP csum.
854          */
855         if (cqe->fast_path_cqe.status_flags &
856             ETH_FAST_PATH_RX_CQE_L4_XSUM_NO_VALIDATION_FLG)
857                 return;
858
859         /* If L4 validation was done, check if an error was found. */
860
861         if (cqe->fast_path_cqe.type_error_flags &
862             (ETH_FAST_PATH_RX_CQE_IP_BAD_XSUM_FLG |
863              ETH_FAST_PATH_RX_CQE_L4_BAD_XSUM_FLG))
864                 qstats->hw_csum_err++;
865         else
866                 skb->ip_summed = CHECKSUM_UNNECESSARY;
867 }
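/* Effective decision table of bnx2x_csum_validate(), restated
 * (skb->ip_summed starts out as CHECKSUM_NONE):
 *
 *   L4 csum not validated by HW           -> leave CHECKSUM_NONE
 *   validated, IP or L4 csum error flag   -> count hw_csum_err, CHECKSUM_NONE
 *   validated, no error flags             -> CHECKSUM_UNNECESSARY
 */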
868
869 static int bnx2x_rx_int(struct bnx2x_fastpath *fp, int budget)
870 {
871         struct bnx2x *bp = fp->bp;
872         u16 bd_cons, bd_prod, bd_prod_fw, comp_ring_cons;
873         u16 sw_comp_cons, sw_comp_prod;
874         int rx_pkt = 0;
875         union eth_rx_cqe *cqe;
876         struct eth_fast_path_rx_cqe *cqe_fp;
877
878 #ifdef BNX2X_STOP_ON_ERROR
879         if (unlikely(bp->panic))
880                 return 0;
881 #endif
882         if (budget <= 0)
883                 return rx_pkt;
884
885         bd_cons = fp->rx_bd_cons;
886         bd_prod = fp->rx_bd_prod;
887         bd_prod_fw = bd_prod;
888         sw_comp_cons = fp->rx_comp_cons;
889         sw_comp_prod = fp->rx_comp_prod;
890
891         comp_ring_cons = RCQ_BD(sw_comp_cons);
892         cqe = &fp->rx_comp_ring[comp_ring_cons];
893         cqe_fp = &cqe->fast_path_cqe;
894
895         DP(NETIF_MSG_RX_STATUS,
896            "queue[%d]: sw_comp_cons %u\n", fp->index, sw_comp_cons);
897
898         while (BNX2X_IS_CQE_COMPLETED(cqe_fp)) {
899                 struct sw_rx_bd *rx_buf = NULL;
900                 struct sk_buff *skb;
901                 u8 cqe_fp_flags;
902                 enum eth_rx_cqe_type cqe_fp_type;
903                 u16 len, pad, queue;
904                 u8 *data;
905                 u32 rxhash;
906                 enum pkt_hash_types rxhash_type;
907
908 #ifdef BNX2X_STOP_ON_ERROR
909                 if (unlikely(bp->panic))
910                         return 0;
911 #endif
912
913                 bd_prod = RX_BD(bd_prod);
914                 bd_cons = RX_BD(bd_cons);
915
916                 /* A rmb() is required to ensure that the CQE is not read
917                  * before it is written by the adapter DMA.  PCI ordering
918                  * rules will make sure the other fields are written before
919                  * the marker at the end of struct eth_fast_path_rx_cqe
920                  * but without rmb() a weakly ordered processor can process
921                  * stale data.  Without the barrier TPA state-machine might
922                  * enter inconsistent state and kernel stack might be
923                  * provided with incorrect packet description - these lead
924                  * provided with an incorrect packet description - these lead
925                  * to various kernel crashes.
926                 rmb();
927
928                 cqe_fp_flags = cqe_fp->type_error_flags;
929                 cqe_fp_type = cqe_fp_flags & ETH_FAST_PATH_RX_CQE_TYPE;
930
931                 DP(NETIF_MSG_RX_STATUS,
932                    "CQE type %x  err %x  status %x  queue %x  vlan %x  len %u\n",
933                    CQE_TYPE(cqe_fp_flags),
934                    cqe_fp_flags, cqe_fp->status_flags,
935                    le32_to_cpu(cqe_fp->rss_hash_result),
936                    le16_to_cpu(cqe_fp->vlan_tag),
937                    le16_to_cpu(cqe_fp->pkt_len_or_gro_seg_len));
938
939                 /* is this a slowpath msg? */
940                 if (unlikely(CQE_TYPE_SLOW(cqe_fp_type))) {
941                         bnx2x_sp_event(fp, cqe);
942                         goto next_cqe;
943                 }
944
945                 rx_buf = &fp->rx_buf_ring[bd_cons];
946                 data = rx_buf->data;
947
948                 if (!CQE_TYPE_FAST(cqe_fp_type)) {
949                         struct bnx2x_agg_info *tpa_info;
950                         u16 frag_size, pages;
951 #ifdef BNX2X_STOP_ON_ERROR
952                         /* sanity check */
953                         if (fp->disable_tpa &&
954                             (CQE_TYPE_START(cqe_fp_type) ||
955                              CQE_TYPE_STOP(cqe_fp_type)))
956                                 BNX2X_ERR("START/STOP packet while disable_tpa type %x\n",
957                                           CQE_TYPE(cqe_fp_type));
958 #endif
959
960                         if (CQE_TYPE_START(cqe_fp_type)) {
961                                 u16 queue = cqe_fp->queue_index;
962                                 DP(NETIF_MSG_RX_STATUS,
963                                    "calling tpa_start on queue %d\n",
964                                    queue);
965
966                                 bnx2x_tpa_start(fp, queue,
967                                                 bd_cons, bd_prod,
968                                                 cqe_fp);
969
970                                 goto next_rx;
971                         }
972                         queue = cqe->end_agg_cqe.queue_index;
973                         tpa_info = &fp->tpa_info[queue];
974                         DP(NETIF_MSG_RX_STATUS,
975                            "calling tpa_stop on queue %d\n",
976                            queue);
977
978                         frag_size = le16_to_cpu(cqe->end_agg_cqe.pkt_len) -
979                                     tpa_info->len_on_bd;
980
981                         if (fp->mode == TPA_MODE_GRO)
982                                 pages = (frag_size + tpa_info->full_page - 1) /
983                                          tpa_info->full_page;
984                         else
985                                 pages = SGE_PAGE_ALIGN(frag_size) >>
986                                         SGE_PAGE_SHIFT;
987
988                         bnx2x_tpa_stop(bp, fp, tpa_info, pages,
989                                        &cqe->end_agg_cqe, comp_ring_cons);
990 #ifdef BNX2X_STOP_ON_ERROR
991                         if (bp->panic)
992                                 return 0;
993 #endif
994
995                         bnx2x_update_sge_prod(fp, pages, &cqe->end_agg_cqe);
996                         goto next_cqe;
997                 }
998                 /* non TPA */
999                 len = le16_to_cpu(cqe_fp->pkt_len_or_gro_seg_len);
1000                 pad = cqe_fp->placement_offset;
1001                 dma_sync_single_for_cpu(&bp->pdev->dev,
1002                                         dma_unmap_addr(rx_buf, mapping),
1003                                         pad + RX_COPY_THRESH,
1004                                         DMA_FROM_DEVICE);
1005                 pad += NET_SKB_PAD;
1006                 prefetch(data + pad); /* speedup eth_type_trans() */
1007                 /* is this an error packet? */
1008                 if (unlikely(cqe_fp_flags & ETH_RX_ERROR_FALGS)) {
1009                         DP(NETIF_MSG_RX_ERR | NETIF_MSG_RX_STATUS,
1010                            "ERROR  flags %x  rx packet %u\n",
1011                            cqe_fp_flags, sw_comp_cons);
1012                         bnx2x_fp_qstats(bp, fp)->rx_err_discard_pkt++;
1013                         goto reuse_rx;
1014                 }
1015
1016                 /* Since we don't have a jumbo ring
1017                  * copy small packets if mtu > 1500
1018                  */
1019                 if ((bp->dev->mtu > ETH_MAX_PACKET_SIZE) &&
1020                     (len <= RX_COPY_THRESH)) {
1021                         skb = netdev_alloc_skb_ip_align(bp->dev, len);
1022                         if (skb == NULL) {
1023                                 DP(NETIF_MSG_RX_ERR | NETIF_MSG_RX_STATUS,
1024                                    "ERROR  packet dropped because of alloc failure\n");
1025                                 bnx2x_fp_qstats(bp, fp)->rx_skb_alloc_failed++;
1026                                 goto reuse_rx;
1027                         }
1028                         memcpy(skb->data, data + pad, len);
1029                         bnx2x_reuse_rx_data(fp, bd_cons, bd_prod);
1030                 } else {
1031                         if (likely(bnx2x_alloc_rx_data(bp, fp, bd_prod,
1032                                                        GFP_ATOMIC) == 0)) {
1033                                 dma_unmap_single(&bp->pdev->dev,
1034                                                  dma_unmap_addr(rx_buf, mapping),
1035                                                  fp->rx_buf_size,
1036                                                  DMA_FROM_DEVICE);
1037                                 skb = build_skb(data, fp->rx_frag_size);
1038                                 if (unlikely(!skb)) {
1039                                         bnx2x_frag_free(fp, data);
1040                                         bnx2x_fp_qstats(bp, fp)->
1041                                                         rx_skb_alloc_failed++;
1042                                         goto next_rx;
1043                                 }
1044                                 skb_reserve(skb, pad);
1045                         } else {
1046                                 DP(NETIF_MSG_RX_ERR | NETIF_MSG_RX_STATUS,
1047                                    "ERROR  packet dropped because of alloc failure\n");
1048                                 bnx2x_fp_qstats(bp, fp)->rx_skb_alloc_failed++;
1049 reuse_rx:
1050                                 bnx2x_reuse_rx_data(fp, bd_cons, bd_prod);
1051                                 goto next_rx;
1052                         }
1053                 }
1054
1055                 skb_put(skb, len);
1056                 skb->protocol = eth_type_trans(skb, bp->dev);
1057
1058                 /* Set Toeplitz hash for a non-LRO skb */
1059                 rxhash = bnx2x_get_rxhash(bp, cqe_fp, &rxhash_type);
1060                 skb_set_hash(skb, rxhash, rxhash_type);
1061
1062                 skb_checksum_none_assert(skb);
1063
1064                 if (bp->dev->features & NETIF_F_RXCSUM)
1065                         bnx2x_csum_validate(skb, cqe, fp,
1066                                             bnx2x_fp_qstats(bp, fp));
1067
1068                 skb_record_rx_queue(skb, fp->rx_queue);
1069
1070                 if (le16_to_cpu(cqe_fp->pars_flags.flags) &
1071                     PARSING_FLAGS_VLAN)
1072                         __vlan_hwaccel_put_tag(skb, htons(ETH_P_8021Q),
1073                                                le16_to_cpu(cqe_fp->vlan_tag));
1074
1075                 skb_mark_napi_id(skb, &fp->napi);
1076
1077                 if (bnx2x_fp_ll_polling(fp))
1078                         netif_receive_skb(skb);
1079                 else
1080                         napi_gro_receive(&fp->napi, skb);
1081 next_rx:
1082                 rx_buf->data = NULL;
1083
1084                 bd_cons = NEXT_RX_IDX(bd_cons);
1085                 bd_prod = NEXT_RX_IDX(bd_prod);
1086                 bd_prod_fw = NEXT_RX_IDX(bd_prod_fw);
1087                 rx_pkt++;
1088 next_cqe:
1089                 sw_comp_prod = NEXT_RCQ_IDX(sw_comp_prod);
1090                 sw_comp_cons = NEXT_RCQ_IDX(sw_comp_cons);
1091
1092                 /* mark CQE as free */
1093                 BNX2X_SEED_CQE(cqe_fp);
1094
1095                 if (rx_pkt == budget)
1096                         break;
1097
1098                 comp_ring_cons = RCQ_BD(sw_comp_cons);
1099                 cqe = &fp->rx_comp_ring[comp_ring_cons];
1100                 cqe_fp = &cqe->fast_path_cqe;
1101         } /* while */
1102
1103         fp->rx_bd_cons = bd_cons;
1104         fp->rx_bd_prod = bd_prod_fw;
1105         fp->rx_comp_cons = sw_comp_cons;
1106         fp->rx_comp_prod = sw_comp_prod;
1107
1108         /* Update producers */
1109         bnx2x_update_rx_prod(bp, fp, bd_prod_fw, sw_comp_prod,
1110                              fp->rx_sge_prod);
1111
1112         fp->rx_pkt += rx_pkt;
1113         fp->rx_calls++;
1114
1115         return rx_pkt;
1116 }
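/* The rmb() inside the loop above follows the common completion-marker
 * pattern: the adapter DMA-writes the CQE payload first and the marker
 * tested by BNX2X_IS_CQE_COMPLETED() last, so the CPU must order its
 * reads the same way - test the marker, rmb(), then read the rest of
 * the CQE - or a weakly ordered CPU may observe stale payload fields
 * next to a fresh marker.
 */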
1117
1118 static irqreturn_t bnx2x_msix_fp_int(int irq, void *fp_cookie)
1119 {
1120         struct bnx2x_fastpath *fp = fp_cookie;
1121         struct bnx2x *bp = fp->bp;
1122         u8 cos;
1123
1124         DP(NETIF_MSG_INTR,
1125            "got an MSI-X interrupt on IDX:SB [fp %d fw_sd %d igusb %d]\n",
1126            fp->index, fp->fw_sb_id, fp->igu_sb_id);
1127
1128         bnx2x_ack_sb(bp, fp->igu_sb_id, USTORM_ID, 0, IGU_INT_DISABLE, 0);
1129
1130 #ifdef BNX2X_STOP_ON_ERROR
1131         if (unlikely(bp->panic))
1132                 return IRQ_HANDLED;
1133 #endif
1134
1135         /* Handle Rx and Tx according to MSI-X vector */
1136         for_each_cos_in_tx_queue(fp, cos)
1137                 prefetch(fp->txdata_ptr[cos]->tx_cons_sb);
1138
1139         prefetch(&fp->sb_running_index[SM_RX_ID]);
1140         napi_schedule(&bnx2x_fp(bp, fp->index, napi));
1141
1142         return IRQ_HANDLED;
1143 }
1144
1145 /* HW Lock for shared dual port PHYs */
1146 void bnx2x_acquire_phy_lock(struct bnx2x *bp)
1147 {
1148         mutex_lock(&bp->port.phy_mutex);
1149
1150         bnx2x_acquire_hw_lock(bp, HW_LOCK_RESOURCE_MDIO);
1151 }
1152
1153 void bnx2x_release_phy_lock(struct bnx2x *bp)
1154 {
1155         bnx2x_release_hw_lock(bp, HW_LOCK_RESOURCE_MDIO);
1156
1157         mutex_unlock(&bp->port.phy_mutex);
1158 }
1159
1160 /* calculates MF speed according to current linespeed and MF configuration */
1161 u16 bnx2x_get_mf_speed(struct bnx2x *bp)
1162 {
1163         u16 line_speed = bp->link_vars.line_speed;
1164         if (IS_MF(bp)) {
1165                 u16 maxCfg = bnx2x_extract_max_cfg(bp,
1166                                                    bp->mf_config[BP_VN(bp)]);
1167
1168                 /* Calculate the current MAX line speed limit for the MF
1169                  * devices
1170                  */
1171                 if (IS_MF_SI(bp))
1172                         line_speed = (line_speed * maxCfg) / 100;
1173                 else { /* SD mode */
1174                         u16 vn_max_rate = maxCfg * 100;
1175
1176                         if (vn_max_rate < line_speed)
1177                                 line_speed = vn_max_rate;
1178                 }
1179         }
1180
1181         return line_speed;
1182 }
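/* Worked example for bnx2x_get_mf_speed(), assuming a 10000 Mbps link
 * and maxCfg = 25: in SI mode the limit is a percentage, so the
 * reported speed is 10000 * 25 / 100 = 2500 Mbps; in SD mode maxCfg is
 * in 100 Mbps units, so vn_max_rate = 2500 Mbps and the result is
 * min(2500, 10000) = 2500 Mbps as well.
 */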
1183
1184 /**
1185  * bnx2x_fill_report_data - fill link report data to report
1186  *
1187  * @bp:         driver handle
1188  * @data:       link state to update
1189  *
1190  * It uses non-atomic bit operations because it is called under the mutex.
1191  */
1192 static void bnx2x_fill_report_data(struct bnx2x *bp,
1193                                    struct bnx2x_link_report_data *data)
1194 {
1195         memset(data, 0, sizeof(*data));
1196
1197         if (IS_PF(bp)) {
1198                 /* Fill the report data: effective line speed */
1199                 data->line_speed = bnx2x_get_mf_speed(bp);
1200
1201                 /* Link is down */
1202                 if (!bp->link_vars.link_up || (bp->flags & MF_FUNC_DIS))
1203                         __set_bit(BNX2X_LINK_REPORT_LINK_DOWN,
1204                                   &data->link_report_flags);
1205
1206                 if (!BNX2X_NUM_ETH_QUEUES(bp))
1207                         __set_bit(BNX2X_LINK_REPORT_LINK_DOWN,
1208                                   &data->link_report_flags);
1209
1210                 /* Full DUPLEX */
1211                 if (bp->link_vars.duplex == DUPLEX_FULL)
1212                         __set_bit(BNX2X_LINK_REPORT_FD,
1213                                   &data->link_report_flags);
1214
1215                 /* Rx Flow Control is ON */
1216                 if (bp->link_vars.flow_ctrl & BNX2X_FLOW_CTRL_RX)
1217                         __set_bit(BNX2X_LINK_REPORT_RX_FC_ON,
1218                                   &data->link_report_flags);
1219
1220                 /* Tx Flow Control is ON */
1221                 if (bp->link_vars.flow_ctrl & BNX2X_FLOW_CTRL_TX)
1222                         __set_bit(BNX2X_LINK_REPORT_TX_FC_ON,
1223                                   &data->link_report_flags);
1224         } else { /* VF */
1225                 *data = bp->vf_link_vars;
1226         }
1227 }
1228
1229 /**
1230  * bnx2x_link_report - report link status to OS.
1231  *
1232  * @bp:         driver handle
1233  *
1234  * Calls __bnx2x_link_report() under the same locking scheme
1235  * as the link/PHY state managing code to ensure consistent
1236  * link reporting.
1237  */
1238
1239 void bnx2x_link_report(struct bnx2x *bp)
1240 {
1241         bnx2x_acquire_phy_lock(bp);
1242         __bnx2x_link_report(bp);
1243         bnx2x_release_phy_lock(bp);
1244 }
1245
1246 /**
1247  * __bnx2x_link_report - report link status to OS.
1248  *
1249  * @bp:         driver handle
1250  *
1251  * Non-atomic implementation.
1252  * Should be called under the phy_lock.
1253  */
1254 void __bnx2x_link_report(struct bnx2x *bp)
1255 {
1256         struct bnx2x_link_report_data cur_data;
1257
1258         /* reread mf_cfg */
1259         if (IS_PF(bp) && !CHIP_IS_E1(bp))
1260                 bnx2x_read_mf_cfg(bp);
1261
1262         /* Read the current link report info */
1263         bnx2x_fill_report_data(bp, &cur_data);
1264
1265         /* Don't report link down or exactly the same link status twice */
1266         if (!memcmp(&cur_data, &bp->last_reported_link, sizeof(cur_data)) ||
1267             (test_bit(BNX2X_LINK_REPORT_LINK_DOWN,
1268                       &bp->last_reported_link.link_report_flags) &&
1269              test_bit(BNX2X_LINK_REPORT_LINK_DOWN,
1270                       &cur_data.link_report_flags)))
1271                 return;
1272
1273         bp->link_cnt++;
1274
1275         /* We are going to report new link parameters now -
1276          * remember the current data for the next time.
1277          */
1278         memcpy(&bp->last_reported_link, &cur_data, sizeof(cur_data));
1279
1280         /* propagate status to VFs */
1281         if (IS_PF(bp))
1282                 bnx2x_iov_link_update(bp);
1283
1284         if (test_bit(BNX2X_LINK_REPORT_LINK_DOWN,
1285                      &cur_data.link_report_flags)) {
1286                 netif_carrier_off(bp->dev);
1287                 netdev_err(bp->dev, "NIC Link is Down\n");
1288                 return;
1289         } else {
1290                 const char *duplex;
1291                 const char *flow;
1292
1293                 netif_carrier_on(bp->dev);
1294
1295                 if (test_and_clear_bit(BNX2X_LINK_REPORT_FD,
1296                                        &cur_data.link_report_flags))
1297                         duplex = "full";
1298                 else
1299                         duplex = "half";
1300
1301                 /* Handle the FC at the end so that only the FC flags can
1302                  * still be set. This way we can easily check whether any FC
1303                  * is enabled.
1304                  */
1305                 if (cur_data.link_report_flags) {
1306                         if (test_bit(BNX2X_LINK_REPORT_RX_FC_ON,
1307                                      &cur_data.link_report_flags)) {
1308                                 if (test_bit(BNX2X_LINK_REPORT_TX_FC_ON,
1309                                      &cur_data.link_report_flags))
1310                                         flow = "ON - receive & transmit";
1311                                 else
1312                                         flow = "ON - receive";
1313                         } else {
1314                                 flow = "ON - transmit";
1315                         }
1316                 } else {
1317                         flow = "none";
1318                 }
1319                 netdev_info(bp->dev, "NIC Link is Up, %d Mbps %s duplex, Flow control: %s\n",
1320                             cur_data.line_speed, duplex, flow);
1321         }
1322 }
1323
1324 static void bnx2x_set_next_page_sgl(struct bnx2x_fastpath *fp)
1325 {
1326         int i;
1327
1328         for (i = 1; i <= NUM_RX_SGE_PAGES; i++) {
1329                 struct eth_rx_sge *sge;
1330
1331                 sge = &fp->rx_sge_ring[RX_SGE_CNT * i - 2];
1332                 sge->addr_hi =
1333                         cpu_to_le32(U64_HI(fp->rx_sge_mapping +
1334                         BCM_PAGE_SIZE*(i % NUM_RX_SGE_PAGES)));
1335
1336                 sge->addr_lo =
1337                         cpu_to_le32(U64_LO(fp->rx_sge_mapping +
1338                         BCM_PAGE_SIZE*(i % NUM_RX_SGE_PAGES)));
1339         }
1340 }
1341
1342 static void bnx2x_free_tpa_pool(struct bnx2x *bp,
1343                                 struct bnx2x_fastpath *fp, int last)
1344 {
1345         int i;
1346
1347         for (i = 0; i < last; i++) {
1348                 struct bnx2x_agg_info *tpa_info = &fp->tpa_info[i];
1349                 struct sw_rx_bd *first_buf = &tpa_info->first_buf;
1350                 u8 *data = first_buf->data;
1351
1352                 if (data == NULL) {
1353                         DP(NETIF_MSG_IFDOWN, "tpa bin %d empty on free\n", i);
1354                         continue;
1355                 }
1356                 if (tpa_info->tpa_state == BNX2X_TPA_START)
1357                         dma_unmap_single(&bp->pdev->dev,
1358                                          dma_unmap_addr(first_buf, mapping),
1359                                          fp->rx_buf_size, DMA_FROM_DEVICE);
1360                 bnx2x_frag_free(fp, data);
1361                 first_buf->data = NULL;
1362         }
1363 }
1364
1365 void bnx2x_init_rx_rings_cnic(struct bnx2x *bp)
1366 {
1367         int j;
1368
1369         for_each_rx_queue_cnic(bp, j) {
1370                 struct bnx2x_fastpath *fp = &bp->fp[j];
1371
1372                 fp->rx_bd_cons = 0;
1373
1374                 /* Activate BD ring */
1375                 /* Warning!
1376                  * this will generate an interrupt (to the TSTORM)
1377                  * must only be done after chip is initialized
1378                  */
1379                 bnx2x_update_rx_prod(bp, fp, fp->rx_bd_prod, fp->rx_comp_prod,
1380                                      fp->rx_sge_prod);
1381         }
1382 }
1383
1384 void bnx2x_init_rx_rings(struct bnx2x *bp)
1385 {
1386         int func = BP_FUNC(bp);
1387         u16 ring_prod;
1388         int i, j;
1389
1390         /* Allocate TPA resources */
1391         for_each_eth_queue(bp, j) {
1392                 struct bnx2x_fastpath *fp = &bp->fp[j];
1393
1394                 DP(NETIF_MSG_IFUP,
1395                    "mtu %d  rx_buf_size %d\n", bp->dev->mtu, fp->rx_buf_size);
1396
1397                 if (!fp->disable_tpa) {
1398                         /* Fill the per-aggregation pool */
1399                         for (i = 0; i < MAX_AGG_QS(bp); i++) {
1400                                 struct bnx2x_agg_info *tpa_info =
1401                                         &fp->tpa_info[i];
1402                                 struct sw_rx_bd *first_buf =
1403                                         &tpa_info->first_buf;
1404
1405                                 first_buf->data =
1406                                         bnx2x_frag_alloc(fp, GFP_KERNEL);
1407                                 if (!first_buf->data) {
1408                                         BNX2X_ERR("Failed to allocate TPA skb pool for queue[%d] - disabling TPA on this queue!\n",
1409                                                   j);
1410                                         bnx2x_free_tpa_pool(bp, fp, i);
1411                                         fp->disable_tpa = 1;
1412                                         break;
1413                                 }
1414                                 dma_unmap_addr_set(first_buf, mapping, 0);
1415                                 tpa_info->tpa_state = BNX2X_TPA_STOP;
1416                         }
1417
1418                         /* "next page" elements initialization */
1419                         bnx2x_set_next_page_sgl(fp);
1420
1421                         /* set SGEs bit mask */
1422                         bnx2x_init_sge_ring_bit_mask(fp);
1423
1424                         /* Allocate SGEs and initialize the ring elements */
1425                         for (i = 0, ring_prod = 0;
1426                              i < MAX_RX_SGE_CNT*NUM_RX_SGE_PAGES; i++) {
1427
1428                                 if (bnx2x_alloc_rx_sge(bp, fp, ring_prod,
1429                                                        GFP_KERNEL) < 0) {
1430                                         BNX2X_ERR("was only able to allocate %d rx sges\n",
1431                                                   i);
1432                                         BNX2X_ERR("disabling TPA for queue[%d]\n",
1433                                                   j);
1434                                         /* Cleanup already allocated elements */
1435                                         bnx2x_free_rx_sge_range(bp, fp,
1436                                                                 ring_prod);
1437                                         bnx2x_free_tpa_pool(bp, fp,
1438                                                             MAX_AGG_QS(bp));
1439                                         fp->disable_tpa = 1;
1440                                         ring_prod = 0;
1441                                         break;
1442                                 }
1443                                 ring_prod = NEXT_SGE_IDX(ring_prod);
1444                         }
1445
1446                         fp->rx_sge_prod = ring_prod;
1447                 }
1448         }
1449
1450         for_each_eth_queue(bp, j) {
1451                 struct bnx2x_fastpath *fp = &bp->fp[j];
1452
1453                 fp->rx_bd_cons = 0;
1454
1455                 /* Activate BD ring */
1456                 /* Warning!
1457                  * this will generate an interrupt (to the TSTORM);
1458                  * it must only be done after the chip is initialized
1459                  */
1460                 bnx2x_update_rx_prod(bp, fp, fp->rx_bd_prod, fp->rx_comp_prod,
1461                                      fp->rx_sge_prod);
1462
1463                 if (j != 0)
1464                         continue;
1465
1466                 if (CHIP_IS_E1(bp)) {
1467                         REG_WR(bp, BAR_USTRORM_INTMEM +
1468                                USTORM_MEM_WORKAROUND_ADDRESS_OFFSET(func),
1469                                U64_LO(fp->rx_comp_mapping));
1470                         REG_WR(bp, BAR_USTRORM_INTMEM +
1471                                USTORM_MEM_WORKAROUND_ADDRESS_OFFSET(func) + 4,
1472                                U64_HI(fp->rx_comp_mapping));
1473                 }
1474         }
1475 }
1476
1477 static void bnx2x_free_tx_skbs_queue(struct bnx2x_fastpath *fp)
1478 {
1479         u8 cos;
1480         struct bnx2x *bp = fp->bp;
1481
1482         for_each_cos_in_tx_queue(fp, cos) {
1483                 struct bnx2x_fp_txdata *txdata = fp->txdata_ptr[cos];
1484                 unsigned pkts_compl = 0, bytes_compl = 0;
1485
1486                 u16 sw_prod = txdata->tx_pkt_prod;
1487                 u16 sw_cons = txdata->tx_pkt_cons;
1488
1489                 while (sw_cons != sw_prod) {
1490                         bnx2x_free_tx_pkt(bp, txdata, TX_BD(sw_cons),
1491                                           &pkts_compl, &bytes_compl);
1492                         sw_cons++;
1493                 }
1494
1495                 netdev_tx_reset_queue(
1496                         netdev_get_tx_queue(bp->dev,
1497                                             txdata->txq_index));
1498         }
1499 }
1500
1501 static void bnx2x_free_tx_skbs_cnic(struct bnx2x *bp)
1502 {
1503         int i;
1504
1505         for_each_tx_queue_cnic(bp, i) {
1506                 bnx2x_free_tx_skbs_queue(&bp->fp[i]);
1507         }
1508 }
1509
1510 static void bnx2x_free_tx_skbs(struct bnx2x *bp)
1511 {
1512         int i;
1513
1514         for_each_eth_queue(bp, i) {
1515                 bnx2x_free_tx_skbs_queue(&bp->fp[i]);
1516         }
1517 }
1518
1519 static void bnx2x_free_rx_bds(struct bnx2x_fastpath *fp)
1520 {
1521         struct bnx2x *bp = fp->bp;
1522         int i;
1523
1524         /* ring wasn't allocated */
1525         if (fp->rx_buf_ring == NULL)
1526                 return;
1527
1528         for (i = 0; i < NUM_RX_BD; i++) {
1529                 struct sw_rx_bd *rx_buf = &fp->rx_buf_ring[i];
1530                 u8 *data = rx_buf->data;
1531
1532                 if (data == NULL)
1533                         continue;
1534                 dma_unmap_single(&bp->pdev->dev,
1535                                  dma_unmap_addr(rx_buf, mapping),
1536                                  fp->rx_buf_size, DMA_FROM_DEVICE);
1537
1538                 rx_buf->data = NULL;
1539                 bnx2x_frag_free(fp, data);
1540         }
1541 }
1542
1543 static void bnx2x_free_rx_skbs_cnic(struct bnx2x *bp)
1544 {
1545         int j;
1546
1547         for_each_rx_queue_cnic(bp, j) {
1548                 bnx2x_free_rx_bds(&bp->fp[j]);
1549         }
1550 }
1551
1552 static void bnx2x_free_rx_skbs(struct bnx2x *bp)
1553 {
1554         int j;
1555
1556         for_each_eth_queue(bp, j) {
1557                 struct bnx2x_fastpath *fp = &bp->fp[j];
1558
1559                 bnx2x_free_rx_bds(fp);
1560
1561                 if (!fp->disable_tpa)
1562                         bnx2x_free_tpa_pool(bp, fp, MAX_AGG_QS(bp));
1563         }
1564 }
1565
1566 static void bnx2x_free_skbs_cnic(struct bnx2x *bp)
1567 {
1568         bnx2x_free_tx_skbs_cnic(bp);
1569         bnx2x_free_rx_skbs_cnic(bp);
1570 }
1571
1572 void bnx2x_free_skbs(struct bnx2x *bp)
1573 {
1574         bnx2x_free_tx_skbs(bp);
1575         bnx2x_free_rx_skbs(bp);
1576 }
1577
1578 void bnx2x_update_max_mf_config(struct bnx2x *bp, u32 value)
1579 {
1580         /* load old values */
1581         u32 mf_cfg = bp->mf_config[BP_VN(bp)];
1582
1583         if (value != bnx2x_extract_max_cfg(bp, mf_cfg)) {
1584                 /* leave all but MAX value */
1585                 mf_cfg &= ~FUNC_MF_CFG_MAX_BW_MASK;
1586
1587                 /* set new MAX value */
1588                 mf_cfg |= (value << FUNC_MF_CFG_MAX_BW_SHIFT)
1589                                 & FUNC_MF_CFG_MAX_BW_MASK;
1590
1591                 bnx2x_fw_command(bp, DRV_MSG_CODE_SET_MF_BW, mf_cfg);
1592         }
1593 }
1594
1595 /**
1596  * bnx2x_free_msix_irqs - free previously requested MSI-X IRQ vectors
1597  *
1598  * @bp:         driver handle
1599  * @nvecs:      number of vectors to be released
1600  */
1601 static void bnx2x_free_msix_irqs(struct bnx2x *bp, int nvecs)
1602 {
1603         int i, offset = 0;
1604
1605         if (nvecs == offset)
1606                 return;
1607
1608         /* VFs don't have a default SB */
1609         if (IS_PF(bp)) {
1610                 free_irq(bp->msix_table[offset].vector, bp->dev);
1611                 DP(NETIF_MSG_IFDOWN, "released sp irq (%d)\n",
1612                    bp->msix_table[offset].vector);
1613                 offset++;
1614         }
1615
1616         if (CNIC_SUPPORT(bp)) {
1617                 if (nvecs == offset)
1618                         return;
1619                 offset++;
1620         }
1621
1622         for_each_eth_queue(bp, i) {
1623                 if (nvecs == offset)
1624                         return;
1625                 DP(NETIF_MSG_IFDOWN, "about to release fp #%d->%d irq\n",
1626                    i, bp->msix_table[offset].vector);
1627
1628                 free_irq(bp->msix_table[offset++].vector, &bp->fp[i]);
1629         }
1630 }
1631
1632 void bnx2x_free_irq(struct bnx2x *bp)
1633 {
1634         if (bp->flags & USING_MSIX_FLAG &&
1635             !(bp->flags & USING_SINGLE_MSIX_FLAG)) {
1636                 int nvecs = BNX2X_NUM_ETH_QUEUES(bp) + CNIC_SUPPORT(bp);
1637
1638                 /* vfs don't have a default status block */
1639                 if (IS_PF(bp))
1640                         nvecs++;
1641
1642                 bnx2x_free_msix_irqs(bp, nvecs);
1643         } else {
1644                 free_irq(bp->dev->irq, bp->dev);
1645         }
1646 }
1647
1648 int bnx2x_enable_msix(struct bnx2x *bp)
1649 {
1650         int msix_vec = 0, i, rc;
1651
1652         /* VFs don't have a default status block */
1653         if (IS_PF(bp)) {
1654                 bp->msix_table[msix_vec].entry = msix_vec;
1655                 BNX2X_DEV_INFO("msix_table[0].entry = %d (slowpath)\n",
1656                                bp->msix_table[0].entry);
1657                 msix_vec++;
1658         }
1659
1660         /* CNIC requires an MSI-X vector for itself */
1661         if (CNIC_SUPPORT(bp)) {
1662                 bp->msix_table[msix_vec].entry = msix_vec;
1663                 BNX2X_DEV_INFO("msix_table[%d].entry = %d (CNIC)\n",
1664                                msix_vec, bp->msix_table[msix_vec].entry);
1665                 msix_vec++;
1666         }
1667
1668         /* We need separate vectors for ETH queues only (not FCoE) */
1669         for_each_eth_queue(bp, i) {
1670                 bp->msix_table[msix_vec].entry = msix_vec;
1671                 BNX2X_DEV_INFO("msix_table[%d].entry = %d (fastpath #%u)\n",
1672                                msix_vec, msix_vec, i);
1673                 msix_vec++;
1674         }
1675
1676         DP(BNX2X_MSG_SP, "about to request enable msix with %d vectors\n",
1677            msix_vec);
1678
1679         rc = pci_enable_msix_range(bp->pdev, &bp->msix_table[0],
1680                                    BNX2X_MIN_MSIX_VEC_CNT(bp), msix_vec);
1681         /*
1682          * reconfigure number of tx/rx queues according to available
1683          * MSI-X vectors
1684          */
1685         if (rc == -ENOSPC) {
1686                 /* Get by with single vector */
1687                 rc = pci_enable_msix_range(bp->pdev, &bp->msix_table[0], 1, 1);
1688                 if (rc < 0) {
1689                         BNX2X_DEV_INFO("Single MSI-X is not attainable rc %d\n",
1690                                        rc);
1691                         goto no_msix;
1692                 }
1693
1694                 BNX2X_DEV_INFO("Using single MSI-X vector\n");
1695                 bp->flags |= USING_SINGLE_MSIX_FLAG;
1696
1697                 BNX2X_DEV_INFO("set number of queues to 1\n");
1698                 bp->num_ethernet_queues = 1;
1699                 bp->num_queues = bp->num_ethernet_queues + bp->num_cnic_queues;
1700         } else if (rc < 0) {
1701                 BNX2X_DEV_INFO("MSI-X is not attainable rc %d\n", rc);
1702                 goto no_msix;
1703         } else if (rc < msix_vec) {
1704                 /* how many fewer vectors will we have? */
1705                 int diff = msix_vec - rc;
1706
1707                 BNX2X_DEV_INFO("Trying to use less MSI-X vectors: %d\n", rc);
1708
1709                 /*
1710                  * decrease number of queues by number of unallocated entries
1711                  */
1712                 bp->num_ethernet_queues -= diff;
1713                 bp->num_queues = bp->num_ethernet_queues + bp->num_cnic_queues;
1714
1715                 BNX2X_DEV_INFO("New queue configuration set: %d\n",
1716                                bp->num_queues);
1717         }
1718
1719         bp->flags |= USING_MSIX_FLAG;
1720
1721         return 0;
1722
1723 no_msix:
1724         /* fall back to INTx if not enough memory */
1725         if (rc == -ENOMEM)
1726                 bp->flags |= DISABLE_MSI_FLAG;
1727
1728         return rc;
1729 }
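
/* Worked example for the vector accounting above (illustrative figures, not
 * taken from the original source): a PF with CNIC support and 8 ETH queues
 * requests 1 (slowpath) + 1 (CNIC) + 8 (fastpath) = 10 vectors.  If
 * pci_enable_msix_range() grants only 6, diff = 4 and num_ethernet_queues
 * drops from 8 to 4; if it returns -ENOSPC, the driver retries with a single
 * vector and runs one ETH queue; any other failure takes the no_msix path and
 * the caller is expected to fall back to MSI or INTx.
 */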
1730
1731 static int bnx2x_req_msix_irqs(struct bnx2x *bp)
1732 {
1733         int i, rc, offset = 0;
1734
1735         /* no default status block for vf */
1736         if (IS_PF(bp)) {
1737                 rc = request_irq(bp->msix_table[offset++].vector,
1738                                  bnx2x_msix_sp_int, 0,
1739                                  bp->dev->name, bp->dev);
1740                 if (rc) {
1741                         BNX2X_ERR("request sp irq failed\n");
1742                         return -EBUSY;
1743                 }
1744         }
1745
1746         if (CNIC_SUPPORT(bp))
1747                 offset++;
1748
1749         for_each_eth_queue(bp, i) {
1750                 struct bnx2x_fastpath *fp = &bp->fp[i];
1751                 snprintf(fp->name, sizeof(fp->name), "%s-fp-%d",
1752                          bp->dev->name, i);
1753
1754                 rc = request_irq(bp->msix_table[offset].vector,
1755                                  bnx2x_msix_fp_int, 0, fp->name, fp);
1756                 if (rc) {
1757                         BNX2X_ERR("request fp #%d irq (%d) failed  rc %d\n", i,
1758                               bp->msix_table[offset].vector, rc);
1759                         bnx2x_free_msix_irqs(bp, offset);
1760                         return -EBUSY;
1761                 }
1762
1763                 offset++;
1764         }
1765
1766         i = BNX2X_NUM_ETH_QUEUES(bp);
1767         if (IS_PF(bp)) {
1768                 offset = 1 + CNIC_SUPPORT(bp);
1769                 netdev_info(bp->dev,
1770                             "using MSI-X  IRQs: sp %d  fp[%d] %d ... fp[%d] %d\n",
1771                             bp->msix_table[0].vector,
1772                             0, bp->msix_table[offset].vector,
1773                             i - 1, bp->msix_table[offset + i - 1].vector);
1774         } else {
1775                 offset = CNIC_SUPPORT(bp);
1776                 netdev_info(bp->dev,
1777                             "using MSI-X  IRQs: fp[%d] %d ... fp[%d] %d\n",
1778                             0, bp->msix_table[offset].vector,
1779                             i - 1, bp->msix_table[offset + i - 1].vector);
1780         }
1781         return 0;
1782 }
1783
1784 int bnx2x_enable_msi(struct bnx2x *bp)
1785 {
1786         int rc;
1787
1788         rc = pci_enable_msi(bp->pdev);
1789         if (rc) {
1790                 BNX2X_DEV_INFO("MSI is not attainable\n");
1791                 return -1;
1792         }
1793         bp->flags |= USING_MSI_FLAG;
1794
1795         return 0;
1796 }
1797
1798 static int bnx2x_req_irq(struct bnx2x *bp)
1799 {
1800         unsigned long flags;
1801         unsigned int irq;
1802
1803         if (bp->flags & (USING_MSI_FLAG | USING_MSIX_FLAG))
1804                 flags = 0;
1805         else
1806                 flags = IRQF_SHARED;
1807
1808         if (bp->flags & USING_MSIX_FLAG)
1809                 irq = bp->msix_table[0].vector;
1810         else
1811                 irq = bp->pdev->irq;
1812
1813         return request_irq(irq, bnx2x_interrupt, flags, bp->dev->name, bp->dev);
1814 }
1815
1816 static int bnx2x_setup_irqs(struct bnx2x *bp)
1817 {
1818         int rc = 0;
1819         if (bp->flags & USING_MSIX_FLAG &&
1820             !(bp->flags & USING_SINGLE_MSIX_FLAG)) {
1821                 rc = bnx2x_req_msix_irqs(bp);
1822                 if (rc)
1823                         return rc;
1824         } else {
1825                 rc = bnx2x_req_irq(bp);
1826                 if (rc) {
1827                         BNX2X_ERR("IRQ request failed  rc %d, aborting\n", rc);
1828                         return rc;
1829                 }
1830                 if (bp->flags & USING_MSI_FLAG) {
1831                         bp->dev->irq = bp->pdev->irq;
1832                         netdev_info(bp->dev, "using MSI IRQ %d\n",
1833                                     bp->dev->irq);
1834                 }
1835                 if (bp->flags & USING_MSIX_FLAG) {
1836                         bp->dev->irq = bp->msix_table[0].vector;
1837                         netdev_info(bp->dev, "using MSIX IRQ %d\n",
1838                                     bp->dev->irq);
1839                 }
1840         }
1841
1842         return 0;
1843 }
1844
1845 static void bnx2x_napi_enable_cnic(struct bnx2x *bp)
1846 {
1847         int i;
1848
1849         for_each_rx_queue_cnic(bp, i) {
1850                 bnx2x_fp_init_lock(&bp->fp[i]);
1851                 napi_enable(&bnx2x_fp(bp, i, napi));
1852         }
1853 }
1854
1855 static void bnx2x_napi_enable(struct bnx2x *bp)
1856 {
1857         int i;
1858
1859         for_each_eth_queue(bp, i) {
1860                 bnx2x_fp_init_lock(&bp->fp[i]);
1861                 napi_enable(&bnx2x_fp(bp, i, napi));
1862         }
1863 }
1864
1865 static void bnx2x_napi_disable_cnic(struct bnx2x *bp)
1866 {
1867         int i;
1868
1869         for_each_rx_queue_cnic(bp, i) {
1870                 napi_disable(&bnx2x_fp(bp, i, napi));
1871                 while (!bnx2x_fp_ll_disable(&bp->fp[i]))
1872                         usleep_range(1000, 2000);
1873         }
1874 }
1875
1876 static void bnx2x_napi_disable(struct bnx2x *bp)
1877 {
1878         int i;
1879
1880         for_each_eth_queue(bp, i) {
1881                 napi_disable(&bnx2x_fp(bp, i, napi));
1882                 while (!bnx2x_fp_ll_disable(&bp->fp[i]))
1883                         usleep_range(1000, 2000);
1884         }
1885 }
1886
1887 void bnx2x_netif_start(struct bnx2x *bp)
1888 {
1889         if (netif_running(bp->dev)) {
1890                 bnx2x_napi_enable(bp);
1891                 if (CNIC_LOADED(bp))
1892                         bnx2x_napi_enable_cnic(bp);
1893                 bnx2x_int_enable(bp);
1894                 if (bp->state == BNX2X_STATE_OPEN)
1895                         netif_tx_wake_all_queues(bp->dev);
1896         }
1897 }
1898
1899 void bnx2x_netif_stop(struct bnx2x *bp, int disable_hw)
1900 {
1901         bnx2x_int_disable_sync(bp, disable_hw);
1902         bnx2x_napi_disable(bp);
1903         if (CNIC_LOADED(bp))
1904                 bnx2x_napi_disable_cnic(bp);
1905 }
1906
1907 u16 bnx2x_select_queue(struct net_device *dev, struct sk_buff *skb,
1908                        void *accel_priv, select_queue_fallback_t fallback)
1909 {
1910         struct bnx2x *bp = netdev_priv(dev);
1911
1912         if (CNIC_LOADED(bp) && !NO_FCOE(bp)) {
1913                 struct ethhdr *hdr = (struct ethhdr *)skb->data;
1914                 u16 ether_type = ntohs(hdr->h_proto);
1915
1916                 /* Skip VLAN tag if present */
1917                 if (ether_type == ETH_P_8021Q) {
1918                         struct vlan_ethhdr *vhdr =
1919                                 (struct vlan_ethhdr *)skb->data;
1920
1921                         ether_type = ntohs(vhdr->h_vlan_encapsulated_proto);
1922                 }
1923
1924                 /* If ethertype is FCoE or FIP - use FCoE ring */
1925                 if ((ether_type == ETH_P_FCOE) || (ether_type == ETH_P_FIP))
1926                         return bnx2x_fcoe_tx(bp, txq_index);
1927         }
1928
1929         /* select a non-FCoE queue */
1930         return fallback(dev, skb) % BNX2X_NUM_ETH_QUEUES(bp);
1931 }
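
/* Illustrative example for the selection above (hypothetical traffic, not
 * from the original source): with CNIC loaded and FCoE enabled, an outgoing
 * FIP or FCoE frame, VLAN tagged or not, is steered to the dedicated FCoE
 * Tx ring via bnx2x_fcoe_tx(); any other frame falls through to
 * fallback(dev, skb) and is hashed across the BNX2X_NUM_ETH_QUEUES() rings.
 */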
1932
1933 void bnx2x_set_num_queues(struct bnx2x *bp)
1934 {
1935         /* RSS queues */
1936         bp->num_ethernet_queues = bnx2x_calc_num_queues(bp);
1937
1938         /* override in STORAGE SD modes */
1939         if (IS_MF_STORAGE_SD(bp) || IS_MF_FCOE_AFEX(bp))
1940                 bp->num_ethernet_queues = 1;
1941
1942         /* Add special queues */
1943         bp->num_cnic_queues = CNIC_SUPPORT(bp); /* For FCOE */
1944         bp->num_queues = bp->num_ethernet_queues + bp->num_cnic_queues;
1945
1946         BNX2X_DEV_INFO("set number of queues to %d\n", bp->num_queues);
1947 }
1948
1949 /**
1950  * bnx2x_set_real_num_queues - configure netdev->real_num_[tx,rx]_queues
1951  *
1952  * @bp:         Driver handle
1953  *
1954  * We currently support at most 16 Tx queues for each CoS, thus we will
1955  * allocate a multiple of 16 for ETH L2 rings according to the value of
1956  * bp->max_cos.
1957  *
1958  * If there is an FCoE L2 queue the appropriate Tx queue will have the next
1959  * index after all ETH L2 indices.
1960  *
1961  * If the actual number of Tx queues (for each CoS) is less than 16, then there
1962  * will be holes at the end of each group of 16 ETH L2 indices (0..15,
1963  * 16..31, ...) with indices that are not coupled to any real Tx queue.
1964  *
1965  * The proper configuration of skb->queue_mapping is handled by
1966  * bnx2x_select_queue() and __skb_tx_hash().
1967  *
1968  * bnx2x_setup_tc() takes care of the proper TC mappings so that __skb_tx_hash()
1969  * will return a proper Tx index if TC is enabled (netdev->num_tc > 0).
1970  */
1971 static int bnx2x_set_real_num_queues(struct bnx2x *bp, int include_cnic)
1972 {
1973         int rc, tx, rx;
1974
1975         tx = BNX2X_NUM_ETH_QUEUES(bp) * bp->max_cos;
1976         rx = BNX2X_NUM_ETH_QUEUES(bp);
1977
1978         /* account for fcoe queue */
1979         if (include_cnic && !NO_FCOE(bp)) {
1980                 rx++;
1981                 tx++;
1982         }
1983
1984         rc = netif_set_real_num_tx_queues(bp->dev, tx);
1985         if (rc) {
1986                 BNX2X_ERR("Failed to set real number of Tx queues: %d\n", rc);
1987                 return rc;
1988         }
1989         rc = netif_set_real_num_rx_queues(bp->dev, rx);
1990         if (rc) {
1991                 BNX2X_ERR("Failed to set real number of Rx queues: %d\n", rc);
1992                 return rc;
1993         }
1994
1995         DP(NETIF_MSG_IFUP, "Setting real num queues to (tx, rx) (%d, %d)\n",
1996                           tx, rx);
1997
1998         return rc;
1999 }
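
/* Worked example (illustrative numbers, not from the original source): with
 * 4 ETH queues and bp->max_cos = 3, tx = 4 * 3 = 12 and rx = 4; including the
 * FCoE L2 queue adds one to each, so (tx, rx) = (13, 5) is what gets reported
 * to the stack through netif_set_real_num_tx_queues() and
 * netif_set_real_num_rx_queues().
 */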
2000
2001 static void bnx2x_set_rx_buf_size(struct bnx2x *bp)
2002 {
2003         int i;
2004
2005         for_each_queue(bp, i) {
2006                 struct bnx2x_fastpath *fp = &bp->fp[i];
2007                 u32 mtu;
2008
2009                 /* Always use a mini-jumbo MTU for the FCoE L2 ring */
2010                 if (IS_FCOE_IDX(i))
2011                         /*
2012                          * Although no IP frames are expected to arrive on
2013                          * this ring, we still want to add an
2014                          * IP_HEADER_ALIGNMENT_PADDING to prevent a buffer
2015                          * overrun attack.
2016                          */
2017                         mtu = BNX2X_FCOE_MINI_JUMBO_MTU;
2018                 else
2019                         mtu = bp->dev->mtu;
2020                 fp->rx_buf_size = BNX2X_FW_RX_ALIGN_START +
2021                                   IP_HEADER_ALIGNMENT_PADDING +
2022                                   ETH_OVREHEAD +
2023                                   mtu +
2024                                   BNX2X_FW_RX_ALIGN_END;
2025                 /* Note: rx_buf_size doesn't take into account NET_SKB_PAD */
2026                 if (fp->rx_buf_size + NET_SKB_PAD <= PAGE_SIZE)
2027                         fp->rx_frag_size = fp->rx_buf_size + NET_SKB_PAD;
2028                 else
2029                         fp->rx_frag_size = 0;
2030         }
2031 }
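
/* Sizing sketch for the function above (editor's summary, not original driver
 * documentation): rx_buf_size is the firmware alignment pads plus
 * IP_HEADER_ALIGNMENT_PADDING plus the Ethernet overhead plus the MTU.  When
 * that total plus NET_SKB_PAD still fits in a single page, rx_frag_size is set
 * so the Rx buffers can presumably be served from the page-fragment allocator;
 * otherwise rx_frag_size stays 0 and a plain kmalloc-style buffer is used
 * (see bnx2x_frag_alloc(), not shown here).
 */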
2032
2033 static int bnx2x_init_rss(struct bnx2x *bp)
2034 {
2035         int i;
2036         u8 num_eth_queues = BNX2X_NUM_ETH_QUEUES(bp);
2037
2038         /* Prepare the initial contents for the indirection table if RSS is
2039          * enabled
2040          */
2041         for (i = 0; i < sizeof(bp->rss_conf_obj.ind_table); i++)
2042                 bp->rss_conf_obj.ind_table[i] =
2043                         bp->fp->cl_id +
2044                         ethtool_rxfh_indir_default(i, num_eth_queues);
2045
2046         /*
2047          * For 57710 and 57711, SEARCHER configuration (rss_keys) is
2048          * per-port, so if explicit configuration is needed, do it only
2049          * for a PMF.
2050          *
2051          * For 57712 and newer on the other hand it's a per-function
2052          * configuration.
2053          */
2054         return bnx2x_config_rss_eth(bp, bp->port.pmf || !CHIP_IS_E1x(bp));
2055 }
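
/* Worked example for the indirection table fill above (illustrative, not from
 * the original source): with 4 ETH queues, ethtool_rxfh_indir_default(i, 4)
 * is simply i % 4, so the table becomes cl_id + 0, cl_id + 1, cl_id + 2,
 * cl_id + 3, cl_id + 0, ... spreading the RSS hash buckets evenly over the
 * client IDs of the ETH queues.
 */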
2056
2057 int bnx2x_rss(struct bnx2x *bp, struct bnx2x_rss_config_obj *rss_obj,
2058               bool config_hash, bool enable)
2059 {
2060         struct bnx2x_config_rss_params params = {NULL};
2061
2062         /* Although RSS is meaningless when there is a single HW queue, we
2063          * still need it enabled in order to have HW Rx hash generated.
2064          *
2065          * if (!is_eth_multi(bp))
2066          *      bp->multi_mode = ETH_RSS_MODE_DISABLED;
2067          */
2068
2069         params.rss_obj = rss_obj;
2070
2071         __set_bit(RAMROD_COMP_WAIT, &params.ramrod_flags);
2072
2073         if (enable) {
2074                 __set_bit(BNX2X_RSS_MODE_REGULAR, &params.rss_flags);
2075
2076                 /* RSS configuration */
2077                 __set_bit(BNX2X_RSS_IPV4, &params.rss_flags);
2078                 __set_bit(BNX2X_RSS_IPV4_TCP, &params.rss_flags);
2079                 __set_bit(BNX2X_RSS_IPV6, &params.rss_flags);
2080                 __set_bit(BNX2X_RSS_IPV6_TCP, &params.rss_flags);
2081                 if (rss_obj->udp_rss_v4)
2082                         __set_bit(BNX2X_RSS_IPV4_UDP, &params.rss_flags);
2083                 if (rss_obj->udp_rss_v6)
2084                         __set_bit(BNX2X_RSS_IPV6_UDP, &params.rss_flags);
2085         } else {
2086                 __set_bit(BNX2X_RSS_MODE_DISABLED, &params.rss_flags);
2087         }
2088
2089         /* Hash bits */
2090         params.rss_result_mask = MULTI_MASK;
2091
2092         memcpy(params.ind_table, rss_obj->ind_table, sizeof(params.ind_table));
2093
2094         if (config_hash) {
2095                 /* RSS keys */
2096                 prandom_bytes(params.rss_key, T_ETH_RSS_KEY * 4);
2097                 __set_bit(BNX2X_RSS_SET_SRCH, &params.rss_flags);
2098         }
2099
2100         if (IS_PF(bp))
2101                 return bnx2x_config_rss(bp, &params);
2102         else
2103                 return bnx2x_vfpf_config_rss(bp, &params);
2104 }
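
/* Usage sketch (hedged; this is how bnx2x_config_rss_eth() above is expected
 * to reach this function, not a new call site):
 *
 *	rc = bnx2x_rss(bp, &bp->rss_conf_obj, true, true);
 *
 * enables regular RSS with IPv4/IPv6 TCP hashing (plus UDP hashing when the
 * udp_rss_v4/udp_rss_v6 bits are set), programs a fresh random key and sends
 * the ramrod either directly (PF) or over the VF-PF channel (VF).
 */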
2105
2106 static int bnx2x_init_hw(struct bnx2x *bp, u32 load_code)
2107 {
2108         struct bnx2x_func_state_params func_params = {NULL};
2109
2110         /* Prepare parameters for function state transitions */
2111         __set_bit(RAMROD_COMP_WAIT, &func_params.ramrod_flags);
2112
2113         func_params.f_obj = &bp->func_obj;
2114         func_params.cmd = BNX2X_F_CMD_HW_INIT;
2115
2116         func_params.params.hw_init.load_phase = load_code;
2117
2118         return bnx2x_func_state_change(bp, &func_params);
2119 }
2120
2121 /*
2122  * Cleans the objects that have internal lists without sending
2123  * ramrods. Should be run when interrupts are disabled.
2124  */
2125 void bnx2x_squeeze_objects(struct bnx2x *bp)
2126 {
2127         int rc;
2128         unsigned long ramrod_flags = 0, vlan_mac_flags = 0;
2129         struct bnx2x_mcast_ramrod_params rparam = {NULL};
2130         struct bnx2x_vlan_mac_obj *mac_obj = &bp->sp_objs->mac_obj;
2131
2132         /***************** Cleanup MACs' object first *************************/
2133
2134         /* Wait for completion of the requested commands */
2135         __set_bit(RAMROD_COMP_WAIT, &ramrod_flags);
2136         /* Perform a dry cleanup */
2137         __set_bit(RAMROD_DRV_CLR_ONLY, &ramrod_flags);
2138
2139         /* Clean ETH primary MAC */
2140         __set_bit(BNX2X_ETH_MAC, &vlan_mac_flags);
2141         rc = mac_obj->delete_all(bp, &bp->sp_objs->mac_obj, &vlan_mac_flags,
2142                                  &ramrod_flags);
2143         if (rc != 0)
2144                 BNX2X_ERR("Failed to clean ETH MACs: %d\n", rc);
2145
2146         /* Cleanup UC list */
2147         vlan_mac_flags = 0;
2148         __set_bit(BNX2X_UC_LIST_MAC, &vlan_mac_flags);
2149         rc = mac_obj->delete_all(bp, mac_obj, &vlan_mac_flags,
2150                                  &ramrod_flags);
2151         if (rc != 0)
2152                 BNX2X_ERR("Failed to clean UC list MACs: %d\n", rc);
2153
2154         /***************** Now clean mcast object *****************************/
2155         rparam.mcast_obj = &bp->mcast_obj;
2156         __set_bit(RAMROD_DRV_CLR_ONLY, &rparam.ramrod_flags);
2157
2158         /* Add a DEL command... - Since we're doing a driver cleanup only,
2159          * we take a lock surrounding both the initial send and the CONTs,
2160          * as we don't want a true completion to disrupt us in the middle.
2161          */
2162         netif_addr_lock_bh(bp->dev);
2163         rc = bnx2x_config_mcast(bp, &rparam, BNX2X_MCAST_CMD_DEL);
2164         if (rc < 0)
2165                 BNX2X_ERR("Failed to add a new DEL command to a multi-cast object: %d\n",
2166                           rc);
2167
2168         /* ...and wait until all pending commands are cleared */
2169         rc = bnx2x_config_mcast(bp, &rparam, BNX2X_MCAST_CMD_CONT);
2170         while (rc != 0) {
2171                 if (rc < 0) {
2172                         BNX2X_ERR("Failed to clean multi-cast object: %d\n",
2173                                   rc);
2174                         netif_addr_unlock_bh(bp->dev);
2175                         return;
2176                 }
2177
2178                 rc = bnx2x_config_mcast(bp, &rparam, BNX2X_MCAST_CMD_CONT);
2179         }
2180         netif_addr_unlock_bh(bp->dev);
2181 }
2182
2183 #ifndef BNX2X_STOP_ON_ERROR
2184 #define LOAD_ERROR_EXIT(bp, label) \
2185         do { \
2186                 (bp)->state = BNX2X_STATE_ERROR; \
2187                 goto label; \
2188         } while (0)
2189
2190 #define LOAD_ERROR_EXIT_CNIC(bp, label) \
2191         do { \
2192                 bp->cnic_loaded = false; \
2193                 goto label; \
2194         } while (0)
2195 #else /*BNX2X_STOP_ON_ERROR*/
2196 #define LOAD_ERROR_EXIT(bp, label) \
2197         do { \
2198                 (bp)->state = BNX2X_STATE_ERROR; \
2199                 (bp)->panic = 1; \
2200                 return -EBUSY; \
2201         } while (0)
2202 #define LOAD_ERROR_EXIT_CNIC(bp, label) \
2203         do { \
2204                 bp->cnic_loaded = false; \
2205                 (bp)->panic = 1; \
2206                 return -EBUSY; \
2207         } while (0)
2208 #endif /*BNX2X_STOP_ON_ERROR*/
2209
2210 static void bnx2x_free_fw_stats_mem(struct bnx2x *bp)
2211 {
2212         BNX2X_PCI_FREE(bp->fw_stats, bp->fw_stats_mapping,
2213                        bp->fw_stats_data_sz + bp->fw_stats_req_sz);
2214         return;
2215 }
2216
2217 static int bnx2x_alloc_fw_stats_mem(struct bnx2x *bp)
2218 {
2219         int num_groups, vf_headroom = 0;
2220         int is_fcoe_stats = NO_FCOE(bp) ? 0 : 1;
2221
2222         /* number of queues for statistics is number of eth queues + FCoE */
2223         u8 num_queue_stats = BNX2X_NUM_ETH_QUEUES(bp) + is_fcoe_stats;
2224
2225         /* Total number of FW statistics requests =
2226          * 1 for port stats + 1 for PF stats + potentially 2 for FCoE (fcoe proper
2227          * and fcoe l2 queue) stats + num of queues (which includes another 1
2228          * for fcoe l2 queue if applicable)
2229          */
2230         bp->fw_stats_num = 2 + is_fcoe_stats + num_queue_stats;
2231
2232         /* vf stats appear in the request list, but their data is allocated by
2233          * the VFs themselves. We don't include them in the bp->fw_stats_num as
2234          * it is used to determine where to place the vf stats queries in the
2235          * request struct
2236          */
2237         if (IS_SRIOV(bp))
2238                 vf_headroom = bnx2x_vf_headroom(bp);
2239
2240         /* Request is built from stats_query_header and an array of
2241          * stats_query_cmd_group each of which contains
2242          * stats_query_cmd_group, each of which contains
2243          * STATS_QUERY_CMD_COUNT rules. The real number of requests is
2244          */
2245         num_groups =
2246                 (((bp->fw_stats_num + vf_headroom) / STATS_QUERY_CMD_COUNT) +
2247                  (((bp->fw_stats_num + vf_headroom) % STATS_QUERY_CMD_COUNT) ?
2248                  1 : 0));
2249
2250         DP(BNX2X_MSG_SP, "stats fw_stats_num %d, vf headroom %d, num_groups %d\n",
2251            bp->fw_stats_num, vf_headroom, num_groups);
2252         bp->fw_stats_req_sz = sizeof(struct stats_query_header) +
2253                 num_groups * sizeof(struct stats_query_cmd_group);
2254
2255         /* Data for statistics requests + stats_counter
2256          * stats_counter holds per-STORM counters that are incremented
2257          * when STORM has finished with the current request.
2258          * Memory for FCoE offloaded statistics is counted anyway,
2259          * even if it will not be sent.
2260          * VF stats are not accounted for here as the data of VF stats is stored
2261          * in memory allocated by the VF, not here.
2262          */
2263         bp->fw_stats_data_sz = sizeof(struct per_port_stats) +
2264                 sizeof(struct per_pf_stats) +
2265                 sizeof(struct fcoe_statistics_params) +
2266                 sizeof(struct per_queue_stats) * num_queue_stats +
2267                 sizeof(struct stats_counter);
2268
2269         bp->fw_stats = BNX2X_PCI_ALLOC(&bp->fw_stats_mapping,
2270                                        bp->fw_stats_data_sz + bp->fw_stats_req_sz);
2271         if (!bp->fw_stats)
2272                 goto alloc_mem_err;
2273
2274         /* Set shortcuts */
2275         bp->fw_stats_req = (struct bnx2x_fw_stats_req *)bp->fw_stats;
2276         bp->fw_stats_req_mapping = bp->fw_stats_mapping;
2277         bp->fw_stats_data = (struct bnx2x_fw_stats_data *)
2278                 ((u8 *)bp->fw_stats + bp->fw_stats_req_sz);
2279         bp->fw_stats_data_mapping = bp->fw_stats_mapping +
2280                 bp->fw_stats_req_sz;
2281
2282         DP(BNX2X_MSG_SP, "statistics request base address set to %x %x\n",
2283            U64_HI(bp->fw_stats_req_mapping),
2284            U64_LO(bp->fw_stats_req_mapping));
2285         DP(BNX2X_MSG_SP, "statistics data base address set to %x %x\n",
2286            U64_HI(bp->fw_stats_data_mapping),
2287            U64_LO(bp->fw_stats_data_mapping));
2288         return 0;
2289
2290 alloc_mem_err:
2291         bnx2x_free_fw_stats_mem(bp);
2292         BNX2X_ERR("Can't allocate FW stats memory\n");
2293         return -ENOMEM;
2294 }
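
/* Worked example of the sizing above (illustrative numbers, not from the
 * original source): a PF with 8 ETH queues and FCoE has num_queue_stats = 9
 * and fw_stats_num = 2 + 1 + 9 = 12 requests.  With no VF headroom this
 * rounds up to num_groups = DIV_ROUND_UP(12, STATS_QUERY_CMD_COUNT) command
 * groups, which determines fw_stats_req_sz; fw_stats_data_sz then adds the
 * per-port, per-PF, FCoE, per-queue and stats_counter blocks.
 */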
2295
2296 /* send load request to mcp and analyze response */
2297 static int bnx2x_nic_load_request(struct bnx2x *bp, u32 *load_code)
2298 {
2299         u32 param;
2300
2301         /* init fw_seq */
2302         bp->fw_seq =
2303                 (SHMEM_RD(bp, func_mb[BP_FW_MB_IDX(bp)].drv_mb_header) &
2304                  DRV_MSG_SEQ_NUMBER_MASK);
2305         BNX2X_DEV_INFO("fw_seq 0x%08x\n", bp->fw_seq);
2306
2307         /* Get current FW pulse sequence */
2308         bp->fw_drv_pulse_wr_seq =
2309                 (SHMEM_RD(bp, func_mb[BP_FW_MB_IDX(bp)].drv_pulse_mb) &
2310                  DRV_PULSE_SEQ_MASK);
2311         BNX2X_DEV_INFO("drv_pulse 0x%x\n", bp->fw_drv_pulse_wr_seq);
2312
2313         param = DRV_MSG_CODE_LOAD_REQ_WITH_LFA;
2314
2315         if (IS_MF_SD(bp) && bnx2x_port_after_undi(bp))
2316                 param |= DRV_MSG_CODE_LOAD_REQ_FORCE_LFA;
2317
2318         /* load request */
2319         (*load_code) = bnx2x_fw_command(bp, DRV_MSG_CODE_LOAD_REQ, param);
2320
2321         /* if mcp fails to respond we must abort */
2322         if (!(*load_code)) {
2323                 BNX2X_ERR("MCP response failure, aborting\n");
2324                 return -EBUSY;
2325         }
2326
2327         /* If mcp refused (e.g. other port is in diagnostic mode) we
2328          * must abort
2329          */
2330         if ((*load_code) == FW_MSG_CODE_DRV_LOAD_REFUSED) {
2331                 BNX2X_ERR("MCP refused load request, aborting\n");
2332                 return -EBUSY;
2333         }
2334         return 0;
2335 }
2336
2337 /* Check whether another PF has already loaded FW to the chip. In
2338  * virtualized environments a PF from another VM may have already
2339  * initialized the device, including loading FW.
2340  */
2341 int bnx2x_compare_fw_ver(struct bnx2x *bp, u32 load_code, bool print_err)
2342 {
2343         /* is another pf loaded on this engine? */
2344         if (load_code != FW_MSG_CODE_DRV_LOAD_COMMON_CHIP &&
2345             load_code != FW_MSG_CODE_DRV_LOAD_COMMON) {
2346                 /* build my FW version dword */
2347                 u32 my_fw = (BCM_5710_FW_MAJOR_VERSION) +
2348                         (BCM_5710_FW_MINOR_VERSION << 8) +
2349                         (BCM_5710_FW_REVISION_VERSION << 16) +
2350                         (BCM_5710_FW_ENGINEERING_VERSION << 24);
2351
2352                 /* read loaded FW from chip */
2353                 u32 loaded_fw = REG_RD(bp, XSEM_REG_PRAM);
2354
2355                 DP(BNX2X_MSG_SP, "loaded fw %x, my fw %x\n",
2356                    loaded_fw, my_fw);
2357
2358                 /* abort nic load if version mismatch */
2359                 if (my_fw != loaded_fw) {
2360                         if (print_err)
2361                                 BNX2X_ERR("bnx2x with FW %x was already loaded which mismatches my %x FW. Aborting\n",
2362                                           loaded_fw, my_fw);
2363                         else
2364                                 BNX2X_DEV_INFO("bnx2x with FW %x was already loaded which mismatches my %x FW, possibly due to MF UNDI\n",
2365                                                loaded_fw, my_fw);
2366                         return -EBUSY;
2367                 }
2368         }
2369         return 0;
2370 }
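
/* Illustrative encoding (hypothetical version numbers): for FW 7.8.19.0 the
 * dword built above is 7 + (8 << 8) + (19 << 16) + (0 << 24) = 0x00130807,
 * which is compared against the value read back from XSEM_REG_PRAM.
 */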
2371
2372 /* returns the "mcp load_code" according to the global load_count array */
2373 static int bnx2x_nic_load_no_mcp(struct bnx2x *bp, int port)
2374 {
2375         int path = BP_PATH(bp);
2376
2377         DP(NETIF_MSG_IFUP, "NO MCP - load counts[%d]      %d, %d, %d\n",
2378            path, bnx2x_load_count[path][0], bnx2x_load_count[path][1],
2379            bnx2x_load_count[path][2]);
2380         bnx2x_load_count[path][0]++;
2381         bnx2x_load_count[path][1 + port]++;
2382         DP(NETIF_MSG_IFUP, "NO MCP - new load counts[%d]  %d, %d, %d\n",
2383            path, bnx2x_load_count[path][0], bnx2x_load_count[path][1],
2384            bnx2x_load_count[path][2]);
2385         if (bnx2x_load_count[path][0] == 1)
2386                 return FW_MSG_CODE_DRV_LOAD_COMMON;
2387         else if (bnx2x_load_count[path][1 + port] == 1)
2388                 return FW_MSG_CODE_DRV_LOAD_PORT;
2389         else
2390                 return FW_MSG_CODE_DRV_LOAD_FUNCTION;
2391 }
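
/* Illustrative scenario (not from the original source): on a dual-port device
 * running without an MCP, the first function to load on a path sees
 * bnx2x_load_count[path][0] == 1 and gets LOAD_COMMON; the first function on
 * the other port then sees bnx2x_load_count[path][1 + port] == 1 and gets
 * LOAD_PORT; any further function on an already initialized port gets
 * LOAD_FUNCTION.
 */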
2392
2393 /* mark PMF if applicable */
2394 static void bnx2x_nic_load_pmf(struct bnx2x *bp, u32 load_code)
2395 {
2396         if ((load_code == FW_MSG_CODE_DRV_LOAD_COMMON) ||
2397             (load_code == FW_MSG_CODE_DRV_LOAD_COMMON_CHIP) ||
2398             (load_code == FW_MSG_CODE_DRV_LOAD_PORT)) {
2399                 bp->port.pmf = 1;
2400                 /* We need the barrier to ensure the ordering between the
2401                  * writing to bp->port.pmf here and reading it from the
2402                  * bnx2x_periodic_task().
2403                  */
2404                 smp_mb();
2405         } else {
2406                 bp->port.pmf = 0;
2407         }
2408
2409         DP(NETIF_MSG_LINK, "pmf %d\n", bp->port.pmf);
2410 }
2411
2412 static void bnx2x_nic_load_afex_dcc(struct bnx2x *bp, int load_code)
2413 {
2414         if (((load_code == FW_MSG_CODE_DRV_LOAD_COMMON) ||
2415              (load_code == FW_MSG_CODE_DRV_LOAD_COMMON_CHIP)) &&
2416             (bp->common.shmem2_base)) {
2417                 if (SHMEM2_HAS(bp, dcc_support))
2418                         SHMEM2_WR(bp, dcc_support,
2419                                   (SHMEM_DCC_SUPPORT_DISABLE_ENABLE_PF_TLV |
2420                                    SHMEM_DCC_SUPPORT_BANDWIDTH_ALLOCATION_TLV));
2421                 if (SHMEM2_HAS(bp, afex_driver_support))
2422                         SHMEM2_WR(bp, afex_driver_support,
2423                                   SHMEM_AFEX_SUPPORTED_VERSION_ONE);
2424         }
2425
2426         /* Set AFEX default VLAN tag to an invalid value */
2427         bp->afex_def_vlan_tag = -1;
2428 }
2429
2430 /**
2431  * bnx2x_bz_fp - zero content of the fastpath structure.
2432  *
2433  * @bp:         driver handle
2434  * @index:      fastpath index to be zeroed
2435  *
2436  * Makes sure the contents of bp->fp[index].napi are kept
2437  * intact.
2438  */
2439 static void bnx2x_bz_fp(struct bnx2x *bp, int index)
2440 {
2441         struct bnx2x_fastpath *fp = &bp->fp[index];
2442         int cos;
2443         struct napi_struct orig_napi = fp->napi;
2444         struct bnx2x_agg_info *orig_tpa_info = fp->tpa_info;
2445
2446         /* bzero bnx2x_fastpath contents */
2447         if (fp->tpa_info)
2448                 memset(fp->tpa_info, 0, ETH_MAX_AGGREGATION_QUEUES_E1H_E2 *
2449                        sizeof(struct bnx2x_agg_info));
2450         memset(fp, 0, sizeof(*fp));
2451
2452         /* Restore the NAPI object as it has been already initialized */
2453         fp->napi = orig_napi;
2454         fp->tpa_info = orig_tpa_info;
2455         fp->bp = bp;
2456         fp->index = index;
2457         if (IS_ETH_FP(fp))
2458                 fp->max_cos = bp->max_cos;
2459         else
2460                 /* Special queues support only one CoS */
2461                 fp->max_cos = 1;
2462
2463         /* Init txdata pointers */
2464         if (IS_FCOE_FP(fp))
2465                 fp->txdata_ptr[0] = &bp->bnx2x_txq[FCOE_TXQ_IDX(bp)];
2466         if (IS_ETH_FP(fp))
2467                 for_each_cos_in_tx_queue(fp, cos)
2468                         fp->txdata_ptr[cos] = &bp->bnx2x_txq[cos *
2469                                 BNX2X_NUM_ETH_QUEUES(bp) + index];
2470
2471         /* Set the TPA flag for each queue. The TPA flag determines the queue's
2472          * minimal size, so it must be set prior to queue memory allocation
2473          */
2474         fp->disable_tpa = !(bp->flags & TPA_ENABLE_FLAG ||
2475                                   (bp->flags & GRO_ENABLE_FLAG &&
2476                                    bnx2x_mtu_allows_gro(bp->dev->mtu)));
2477         if (bp->flags & TPA_ENABLE_FLAG)
2478                 fp->mode = TPA_MODE_LRO;
2479         else if (bp->flags & GRO_ENABLE_FLAG)
2480                 fp->mode = TPA_MODE_GRO;
2481
2482         /* We don't want TPA on an FCoE L2 ring */
2483         if (IS_FCOE_FP(fp))
2484                 fp->disable_tpa = 1;
2485 }
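
/* Example of the resulting TPA/GRO selection (illustrative, not from the
 * original source): with only GRO_ENABLE_FLAG set and an MTU accepted by
 * bnx2x_mtu_allows_gro(), an ETH fastpath ends up with disable_tpa = 0 and
 * fp->mode = TPA_MODE_GRO; the FCoE L2 ring always ends up with
 * disable_tpa = 1 regardless of the flags.
 */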
2486
2487 int bnx2x_load_cnic(struct bnx2x *bp)
2488 {
2489         int i, rc, port = BP_PORT(bp);
2490
2491         DP(NETIF_MSG_IFUP, "Starting CNIC-related load\n");
2492
2493         mutex_init(&bp->cnic_mutex);
2494
2495         if (IS_PF(bp)) {
2496                 rc = bnx2x_alloc_mem_cnic(bp);
2497                 if (rc) {
2498                         BNX2X_ERR("Unable to allocate bp memory for cnic\n");
2499                         LOAD_ERROR_EXIT_CNIC(bp, load_error_cnic0);
2500                 }
2501         }
2502
2503         rc = bnx2x_alloc_fp_mem_cnic(bp);
2504         if (rc) {
2505                 BNX2X_ERR("Unable to allocate memory for cnic fps\n");
2506                 LOAD_ERROR_EXIT_CNIC(bp, load_error_cnic0);
2507         }
2508
2509         /* Update the number of queues with the cnic queues */
2510         rc = bnx2x_set_real_num_queues(bp, 1);
2511         if (rc) {
2512                 BNX2X_ERR("Unable to set real_num_queues including cnic\n");
2513                 LOAD_ERROR_EXIT_CNIC(bp, load_error_cnic0);
2514         }
2515
2516         /* Add all CNIC NAPI objects */
2517         bnx2x_add_all_napi_cnic(bp);
2518         DP(NETIF_MSG_IFUP, "cnic napi added\n");
2519         bnx2x_napi_enable_cnic(bp);
2520
2521         rc = bnx2x_init_hw_func_cnic(bp);
2522         if (rc)
2523                 LOAD_ERROR_EXIT_CNIC(bp, load_error_cnic1);
2524
2525         bnx2x_nic_init_cnic(bp);
2526
2527         if (IS_PF(bp)) {
2528                 /* Enable Timer scan */
2529                 REG_WR(bp, TM_REG_EN_LINEAR0_TIMER + port*4, 1);
2530
2531                 /* setup cnic queues */
2532                 for_each_cnic_queue(bp, i) {
2533                         rc = bnx2x_setup_queue(bp, &bp->fp[i], 0);
2534                         if (rc) {
2535                                 BNX2X_ERR("Queue setup failed\n");
2536                                 LOAD_ERROR_EXIT(bp, load_error_cnic2);
2537                         }
2538                 }
2539         }
2540
2541         /* Initialize Rx filter. */
2542         bnx2x_set_rx_mode_inner(bp);
2543
2544         /* re-read iscsi info */
2545         bnx2x_get_iscsi_info(bp);
2546         bnx2x_setup_cnic_irq_info(bp);
2547         bnx2x_setup_cnic_info(bp);
2548         bp->cnic_loaded = true;
2549         if (bp->state == BNX2X_STATE_OPEN)
2550                 bnx2x_cnic_notify(bp, CNIC_CTL_START_CMD);
2551
2552         DP(NETIF_MSG_IFUP, "Ending successfully CNIC-related load\n");
2553
2554         return 0;
2555
2556 #ifndef BNX2X_STOP_ON_ERROR
2557 load_error_cnic2:
2558         /* Disable Timer scan */
2559         REG_WR(bp, TM_REG_EN_LINEAR0_TIMER + port*4, 0);
2560
2561 load_error_cnic1:
2562         bnx2x_napi_disable_cnic(bp);
2563         /* Update the number of queues without the cnic queues */
2564         if (bnx2x_set_real_num_queues(bp, 0))
2565                 BNX2X_ERR("Unable to set real_num_queues not including cnic\n");
2566 load_error_cnic0:
2567         BNX2X_ERR("CNIC-related load failed\n");
2568         bnx2x_free_fp_mem_cnic(bp);
2569         bnx2x_free_mem_cnic(bp);
2570         return rc;
2571 #endif /* ! BNX2X_STOP_ON_ERROR */
2572 }
2573
2574 /* must be called with rtnl_lock */
2575 int bnx2x_nic_load(struct bnx2x *bp, int load_mode)
2576 {
2577         int port = BP_PORT(bp);
2578         int i, rc = 0, load_code = 0;
2579
2580         DP(NETIF_MSG_IFUP, "Starting NIC load\n");
2581         DP(NETIF_MSG_IFUP,
2582            "CNIC is %s\n", CNIC_ENABLED(bp) ? "enabled" : "disabled");
2583
2584 #ifdef BNX2X_STOP_ON_ERROR
2585         if (unlikely(bp->panic)) {
2586                 BNX2X_ERR("Can't load NIC when there is panic\n");
2587                 return -EPERM;
2588         }
2589 #endif
2590
2591         bp->state = BNX2X_STATE_OPENING_WAIT4_LOAD;
2592
2593         /* zero the structure w/o any lock, before SP handler is initialized */
2594         memset(&bp->last_reported_link, 0, sizeof(bp->last_reported_link));
2595         __set_bit(BNX2X_LINK_REPORT_LINK_DOWN,
2596                 &bp->last_reported_link.link_report_flags);
2597
2598         if (IS_PF(bp))
2599                 /* must be called before memory allocation and HW init */
2600                 bnx2x_ilt_set_info(bp);
2601
2602         /*
2603          * Zero fastpath structures, preserving invariants like napi (which is
2604          * allocated only once), fp index, max_cos and the bp pointer.
2605          * Also set fp->disable_tpa and txdata_ptr.
2606          */
2607         DP(NETIF_MSG_IFUP, "num queues: %d\n", bp->num_queues);
2608         for_each_queue(bp, i)
2609                 bnx2x_bz_fp(bp, i);
2610         memset(bp->bnx2x_txq, 0, (BNX2X_MAX_RSS_COUNT(bp) * BNX2X_MULTI_TX_COS +
2611                                   bp->num_cnic_queues) *
2612                                   sizeof(struct bnx2x_fp_txdata));
2613
2614         bp->fcoe_init = false;
2615
2616         /* Set the receive queues buffer size */
2617         bnx2x_set_rx_buf_size(bp);
2618
2619         if (IS_PF(bp)) {
2620                 rc = bnx2x_alloc_mem(bp);
2621                 if (rc) {
2622                         BNX2X_ERR("Unable to allocate bp memory\n");
2623                         return rc;
2624                 }
2625         }
2626
2627         /* Needs to be done after alloc mem, since it self-adjusts to the amount
2628          * of memory available for RSS queues
2629          */
2630         rc = bnx2x_alloc_fp_mem(bp);
2631         if (rc) {
2632                 BNX2X_ERR("Unable to allocate memory for fps\n");
2633                 LOAD_ERROR_EXIT(bp, load_error0);
2634         }
2635
2636         /* Allocate memory for FW statistics */
2637         if (bnx2x_alloc_fw_stats_mem(bp))
2638                 LOAD_ERROR_EXIT(bp, load_error0);
2639
2640         /* request pf to initialize status blocks */
2641         if (IS_VF(bp)) {
2642                 rc = bnx2x_vfpf_init(bp);
2643                 if (rc)
2644                         LOAD_ERROR_EXIT(bp, load_error0);
2645         }
2646
2647         /* Since bnx2x_alloc_mem() may possibly update
2648          * bp->num_queues, bnx2x_set_real_num_queues() should always
2649          * come after it. At this stage cnic queues are not counted.
2650          */
2651         rc = bnx2x_set_real_num_queues(bp, 0);
2652         if (rc) {
2653                 BNX2X_ERR("Unable to set real_num_queues\n");
2654                 LOAD_ERROR_EXIT(bp, load_error0);
2655         }
2656
2657         /* Configure multi-CoS mappings in the kernel.
2658          * This configuration may be overridden by a multi-class queueing
2659          * discipline or by a DCBX negotiation result.
2660          */
2661         bnx2x_setup_tc(bp->dev, bp->max_cos);
2662
2663         /* Add all NAPI objects */
2664         bnx2x_add_all_napi(bp);
2665         DP(NETIF_MSG_IFUP, "napi added\n");
2666         bnx2x_napi_enable(bp);
2667
2668         if (IS_PF(bp)) {
2669                 /* set pf load just before approaching the MCP */
2670                 bnx2x_set_pf_load(bp);
2671
2672                 /* if mcp exists send load request and analyze response */
2673                 if (!BP_NOMCP(bp)) {
2674                         /* attempt to load pf */
2675                         rc = bnx2x_nic_load_request(bp, &load_code);
2676                         if (rc)
2677                                 LOAD_ERROR_EXIT(bp, load_error1);
2678
2679                         /* what did mcp say? */
2680                         rc = bnx2x_compare_fw_ver(bp, load_code, true);
2681                         if (rc) {
2682                                 bnx2x_fw_command(bp, DRV_MSG_CODE_LOAD_DONE, 0);
2683                                 LOAD_ERROR_EXIT(bp, load_error2);
2684                         }
2685                 } else {
2686                         load_code = bnx2x_nic_load_no_mcp(bp, port);
2687                 }
2688
2689                 /* mark pmf if applicable */
2690                 bnx2x_nic_load_pmf(bp, load_code);
2691
2692                 /* Init Function state controlling object */
2693                 bnx2x__init_func_obj(bp);
2694
2695                 /* Initialize HW */
2696                 rc = bnx2x_init_hw(bp, load_code);
2697                 if (rc) {
2698                         BNX2X_ERR("HW init failed, aborting\n");
2699                         bnx2x_fw_command(bp, DRV_MSG_CODE_LOAD_DONE, 0);
2700                         LOAD_ERROR_EXIT(bp, load_error2);
2701                 }
2702         }
2703
2704         bnx2x_pre_irq_nic_init(bp);
2705
2706         /* Connect to IRQs */
2707         rc = bnx2x_setup_irqs(bp);
2708         if (rc) {
2709                 BNX2X_ERR("setup irqs failed\n");
2710                 if (IS_PF(bp))
2711                         bnx2x_fw_command(bp, DRV_MSG_CODE_LOAD_DONE, 0);
2712                 LOAD_ERROR_EXIT(bp, load_error2);
2713         }
2714
2715         /* Init per-function objects */
2716         if (IS_PF(bp)) {
2717                 /* Setup NIC internals and enable interrupts */
2718                 bnx2x_post_irq_nic_init(bp, load_code);
2719
2720                 bnx2x_init_bp_objs(bp);
2721                 bnx2x_iov_nic_init(bp);
2722
2723                 /* Set AFEX default VLAN tag to an invalid value */
2724                 bp->afex_def_vlan_tag = -1;
2725                 bnx2x_nic_load_afex_dcc(bp, load_code);
2726                 bp->state = BNX2X_STATE_OPENING_WAIT4_PORT;
2727                 rc = bnx2x_func_start(bp);
2728                 if (rc) {
2729                         BNX2X_ERR("Function start failed!\n");
2730                         bnx2x_fw_command(bp, DRV_MSG_CODE_LOAD_DONE, 0);
2731
2732                         LOAD_ERROR_EXIT(bp, load_error3);
2733                 }
2734
2735                 /* Send LOAD_DONE command to MCP */
2736                 if (!BP_NOMCP(bp)) {
2737                         load_code = bnx2x_fw_command(bp,
2738                                                      DRV_MSG_CODE_LOAD_DONE, 0);
2739                         if (!load_code) {
2740                                 BNX2X_ERR("MCP response failure, aborting\n");
2741                                 rc = -EBUSY;
2742                                 LOAD_ERROR_EXIT(bp, load_error3);
2743                         }
2744                 }
2745
2746                 /* initialize FW coalescing state machines in RAM */
2747                 bnx2x_update_coalesce(bp);
2748         }
2749
2750         /* setup the leading queue */
2751         rc = bnx2x_setup_leading(bp);
2752         if (rc) {
2753                 BNX2X_ERR("Setup leading failed!\n");
2754                 LOAD_ERROR_EXIT(bp, load_error3);
2755         }
2756
2757         /* set up the rest of the queues */
2758         for_each_nondefault_eth_queue(bp, i) {
2759                 if (IS_PF(bp))
2760                         rc = bnx2x_setup_queue(bp, &bp->fp[i], false);
2761                 else /* VF */
2762                         rc = bnx2x_vfpf_setup_q(bp, &bp->fp[i], false);
2763                 if (rc) {
2764                         BNX2X_ERR("Queue %d setup failed\n", i);
2765                         LOAD_ERROR_EXIT(bp, load_error3);
2766                 }
2767         }
2768
2769         /* setup rss */
2770         rc = bnx2x_init_rss(bp);
2771         if (rc) {
2772                 BNX2X_ERR("PF RSS init failed\n");
2773                 LOAD_ERROR_EXIT(bp, load_error3);
2774         }
2775
2776         /* Now that Clients are configured we are ready to work */
2777         bp->state = BNX2X_STATE_OPEN;
2778
2779         /* Configure a ucast MAC */
2780         if (IS_PF(bp))
2781                 rc = bnx2x_set_eth_mac(bp, true);
2782         else /* vf */
2783                 rc = bnx2x_vfpf_config_mac(bp, bp->dev->dev_addr, bp->fp->index,
2784                                            true);
2785         if (rc) {
2786                 BNX2X_ERR("Setting Ethernet MAC failed\n");
2787                 LOAD_ERROR_EXIT(bp, load_error3);
2788         }
2789
2790         if (IS_PF(bp) && bp->pending_max) {
2791                 bnx2x_update_max_mf_config(bp, bp->pending_max);
2792                 bp->pending_max = 0;
2793         }
2794
2795         if (bp->port.pmf) {
2796                 rc = bnx2x_initial_phy_init(bp, load_mode);
2797                 if (rc)
2798                         LOAD_ERROR_EXIT(bp, load_error3);
2799         }
2800         bp->link_params.feature_config_flags &= ~FEATURE_CONFIG_BOOT_FROM_SAN;
2801
2802         /* Start fast path */
2803
2804         /* Initialize Rx filter. */
2805         bnx2x_set_rx_mode_inner(bp);
2806
2807         /* Start the Tx */
2808         switch (load_mode) {
2809         case LOAD_NORMAL:
2810                 /* Tx queues should only be re-enabled */
2811                 netif_tx_wake_all_queues(bp->dev);
2812                 break;
2813
2814         case LOAD_OPEN:
2815                 netif_tx_start_all_queues(bp->dev);
2816                 smp_mb__after_atomic();
2817                 break;
2818
2819         case LOAD_DIAG:
2820         case LOAD_LOOPBACK_EXT:
2821                 bp->state = BNX2X_STATE_DIAG;
2822                 break;
2823
2824         default:
2825                 break;
2826         }
2827
2828         if (bp->port.pmf)
2829                 bnx2x_update_drv_flags(bp, 1 << DRV_FLAGS_PORT_MASK, 0);
2830         else
2831                 bnx2x__link_status_update(bp);
2832
2833         /* start the timer */
2834         mod_timer(&bp->timer, jiffies + bp->current_interval);
2835
2836         if (CNIC_ENABLED(bp))
2837                 bnx2x_load_cnic(bp);
2838
2839         if (IS_PF(bp))
2840                 bnx2x_schedule_sp_rtnl(bp, BNX2X_SP_RTNL_GET_DRV_VERSION, 0);
2841
2842         if (IS_PF(bp) && SHMEM2_HAS(bp, drv_capabilities_flag)) {
2843                 /* mark driver is loaded in shmem2 */
2844                 u32 val;
2845                 val = SHMEM2_RD(bp, drv_capabilities_flag[BP_FW_MB_IDX(bp)]);
2846                 SHMEM2_WR(bp, drv_capabilities_flag[BP_FW_MB_IDX(bp)],
2847                           val | DRV_FLAGS_CAPABILITIES_LOADED_SUPPORTED |
2848                           DRV_FLAGS_CAPABILITIES_LOADED_L2);
2849         }
2850
2851         /* Wait for all pending SP commands to complete */
2852         if (IS_PF(bp) && !bnx2x_wait_sp_comp(bp, ~0x0UL)) {
2853                 BNX2X_ERR("Timeout waiting for SP elements to complete\n");
2854                 bnx2x_nic_unload(bp, UNLOAD_CLOSE, false);
2855                 return -EBUSY;
2856         }
2857
2858         /* If PMF - send ADMIN DCBX msg to MFW to initiate DCBX FSM */
2859         if (bp->port.pmf && (bp->state != BNX2X_STATE_DIAG))
2860                 bnx2x_dcbx_init(bp, false);
2861
2862         DP(NETIF_MSG_IFUP, "Ending successfully NIC load\n");
2863
2864         return 0;
2865
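/* Error unwind: the load_error3..load_error0 labels below fall through to
 * one another, releasing IRQs, NAPI objects and driver memory in reverse
 * order of acquisition (only compiled in when BNX2X_STOP_ON_ERROR is not
 * set).
 */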
2866 #ifndef BNX2X_STOP_ON_ERROR
2867 load_error3:
2868         if (IS_PF(bp)) {
2869                 bnx2x_int_disable_sync(bp, 1);
2870
2871                 /* Clean queueable objects */
2872                 bnx2x_squeeze_objects(bp);
2873         }
2874
2875         /* Free SKBs, SGEs, TPA pool and driver internals */
2876         bnx2x_free_skbs(bp);
2877         for_each_rx_queue(bp, i)
2878                 bnx2x_free_rx_sge_range(bp, bp->fp + i, NUM_RX_SGE);
2879
2880         /* Release IRQs */
2881         bnx2x_free_irq(bp);
2882 load_error2:
2883         if (IS_PF(bp) && !BP_NOMCP(bp)) {
2884                 bnx2x_fw_command(bp, DRV_MSG_CODE_UNLOAD_REQ_WOL_MCP, 0);
2885                 bnx2x_fw_command(bp, DRV_MSG_CODE_UNLOAD_DONE, 0);
2886         }
2887
2888         bp->port.pmf = 0;
2889 load_error1:
2890         bnx2x_napi_disable(bp);
2891         bnx2x_del_all_napi(bp);
2892
2893         /* clear pf_load status, as it was already set */
2894         if (IS_PF(bp))
2895                 bnx2x_clear_pf_load(bp);
2896 load_error0:
2897         bnx2x_free_fw_stats_mem(bp);
2898         bnx2x_free_fp_mem(bp);
2899         bnx2x_free_mem(bp);
2900
2901         return rc;
2902 #endif /* ! BNX2X_STOP_ON_ERROR */
2903 }
2904
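/* Wait until the Tx fastpath rings of every queue and CoS have drained;
 * a non-zero return means bnx2x_clean_tx_queue() reported that a ring
 * failed to drain.
 */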
2905 int bnx2x_drain_tx_queues(struct bnx2x *bp)
2906 {
2907         u8 rc = 0, cos, i;
2908
2909         /* Wait until tx fastpath tasks complete */
2910         for_each_tx_queue(bp, i) {
2911                 struct bnx2x_fastpath *fp = &bp->fp[i];
2912
2913                 for_each_cos_in_tx_queue(fp, cos)
2914                         rc = bnx2x_clean_tx_queue(bp, fp->txdata_ptr[cos]);
2915                 if (rc)
2916                         return rc;
2917         }
2918         return 0;
2919 }
2920
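/* Tear-down order: mark the device as closing, stop Tx and the timer,
 * drain the Tx rings, then either notify the PF (VF case) or clean up
 * the chip / send UNLOAD to the MCP, and finally free driver memory and
 * clear the per-function load status.
 */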
2921 /* must be called with rtnl_lock */
2922 int bnx2x_nic_unload(struct bnx2x *bp, int unload_mode, bool keep_link)
2923 {
2924         int i;
2925         bool global = false;
2926
2927         DP(NETIF_MSG_IFUP, "Starting NIC unload\n");
2928
2929         /* mark driver is unloaded in shmem2 */
2930         if (IS_PF(bp) && SHMEM2_HAS(bp, drv_capabilities_flag)) {
2931                 u32 val;
2932                 val = SHMEM2_RD(bp, drv_capabilities_flag[BP_FW_MB_IDX(bp)]);
2933                 SHMEM2_WR(bp, drv_capabilities_flag[BP_FW_MB_IDX(bp)],
2934                           val & ~DRV_FLAGS_CAPABILITIES_LOADED_L2);
2935         }
2936
2937         if (IS_PF(bp) && bp->recovery_state != BNX2X_RECOVERY_DONE &&
2938             (bp->state == BNX2X_STATE_CLOSED ||
2939              bp->state == BNX2X_STATE_ERROR)) {
2940                 /* We can get here if the driver has been unloaded
2941                  * during parity error recovery and is either waiting for a
2942                  * leader to complete or for other functions to unload and
2943                  * then ifdown has been issued. In this case we want to
2944                  * unload and let other functions complete the recovery
2945                  * process.
2946                  */
2947                 bp->recovery_state = BNX2X_RECOVERY_DONE;
2948                 bp->is_leader = 0;
2949                 bnx2x_release_leader_lock(bp);
2950                 smp_mb();
2951
2952                 DP(NETIF_MSG_IFDOWN, "Releasing a leadership...\n");
2953                 BNX2X_ERR("Can't unload in closed or error state\n");
2954                 return -EINVAL;
2955         }
2956
2957         /* Nothing to do during unload if the previous bnx2x_nic_load()
2958          * has not completed successfully - all resources are released.
2959          *
2960          * We can get here only after an unsuccessful ndo_* callback, during
2961          * which the dev->IFF_UP flag is still on.
2962          */
2963         if (bp->state == BNX2X_STATE_CLOSED || bp->state == BNX2X_STATE_ERROR)
2964                 return 0;
2965
2966         /* It's important to set bp->state to a value different from
2967          * BNX2X_STATE_OPEN and only then stop the Tx. Otherwise bnx2x_tx_int()
2968          * may restart the Tx from the NAPI context (see bnx2x_tx_int()).
2969          */
2970         bp->state = BNX2X_STATE_CLOSING_WAIT4_HALT;
2971         smp_mb();
2972
2973         /* indicate to VFs that the PF is going down */
2974         bnx2x_iov_channel_down(bp);
2975
2976         if (CNIC_LOADED(bp))
2977                 bnx2x_cnic_notify(bp, CNIC_CTL_STOP_CMD);
2978
2979         /* Stop Tx */
2980         bnx2x_tx_disable(bp);
2981         netdev_reset_tc(bp->dev);
2982
2983         bp->rx_mode = BNX2X_RX_MODE_NONE;
2984
2985         del_timer_sync(&bp->timer);
2986
2987         if (IS_PF(bp)) {
2988                 /* Set ALWAYS_ALIVE bit in shmem */
2989                 bp->fw_drv_pulse_wr_seq |= DRV_PULSE_ALWAYS_ALIVE;
2990                 bnx2x_drv_pulse(bp);
2991                 bnx2x_stats_handle(bp, STATS_EVENT_STOP);
2992                 bnx2x_save_statistics(bp);
2993         }
2994
2995         /* wait till consumers catch up with producers in all queues */
2996         bnx2x_drain_tx_queues(bp);
2997
2998         /* If VF, indicate to the PF that this function is going down (the PF
2999          * will delete SP elements and clear initializations).
3000          */
3001         if (IS_VF(bp))
3002                 bnx2x_vfpf_close_vf(bp);
3003         else if (unload_mode != UNLOAD_RECOVERY)
3004                 /* if this is a normal/close unload, we need to clean up the chip */
3005                 bnx2x_chip_cleanup(bp, unload_mode, keep_link);
3006         else {
3007                 /* Send the UNLOAD_REQUEST to the MCP */
3008                 bnx2x_send_unload_req(bp, unload_mode);
3009
3010                 /* Prevent transactions to host from the functions on the
3011                  * engine that doesn't reset global blocks in case of global
3012                  * attention once global blocks are reset and gates are opened
3013                  * (the engine whose leader will perform the recovery
3014                  * last).
3015                  */
3016                 if (!CHIP_IS_E1x(bp))
3017                         bnx2x_pf_disable(bp);
3018
3019                 /* Disable HW interrupts, NAPI */
3020                 bnx2x_netif_stop(bp, 1);
3021                 /* Delete all NAPI objects */
3022                 bnx2x_del_all_napi(bp);
3023                 if (CNIC_LOADED(bp))
3024                         bnx2x_del_all_napi_cnic(bp);
3025                 /* Release IRQs */
3026                 bnx2x_free_irq(bp);
3027
3028                 /* Report UNLOAD_DONE to MCP */
3029                 bnx2x_send_unload_done(bp, false);
3030         }
3031
3032         /*
3033          * At this stage no more interrupts will arrive so we may safely clean
3034          * the queueable objects here in case they failed to get cleaned so far.
3035          */
3036         if (IS_PF(bp))
3037                 bnx2x_squeeze_objects(bp);
3038
3039         /* There should be no more pending SP commands at this stage */
3040         bp->sp_state = 0;
3041
3042         bp->port.pmf = 0;
3043
3044         /* clear pending work in rtnl task */
3045         bp->sp_rtnl_state = 0;
3046         smp_mb();
3047
3048         /* Free SKBs, SGEs, TPA pool and driver internals */
3049         bnx2x_free_skbs(bp);
3050         if (CNIC_LOADED(bp))
3051                 bnx2x_free_skbs_cnic(bp);
3052         for_each_rx_queue(bp, i)
3053                 bnx2x_free_rx_sge_range(bp, bp->fp + i, NUM_RX_SGE);
3054
3055         bnx2x_free_fp_mem(bp);
3056         if (CNIC_LOADED(bp))
3057                 bnx2x_free_fp_mem_cnic(bp);
3058
3059         if (IS_PF(bp)) {
3060                 if (CNIC_LOADED(bp))
3061                         bnx2x_free_mem_cnic(bp);
3062         }
3063         bnx2x_free_mem(bp);
3064
3065         bp->state = BNX2X_STATE_CLOSED;
3066         bp->cnic_loaded = false;
3067
3068         /* Clear driver version indication in shmem */
3069         if (IS_PF(bp))
3070                 bnx2x_update_mng_version(bp);
3071
3072         /* Check if there are pending parity attentions. If there are - set
3073          * RECOVERY_IN_PROGRESS.
3074          */
3075         if (IS_PF(bp) && bnx2x_chk_parity_attn(bp, &global, false)) {
3076                 bnx2x_set_reset_in_progress(bp);
3077
3078                 /* Set RESET_IS_GLOBAL if needed */
3079                 if (global)
3080                         bnx2x_set_reset_global(bp);
3081         }
3082
3083         /* The last driver must disable the "close the gate" functionality
3084          * if there is no parity attention or "process kill" pending.
3085          */
3086         if (IS_PF(bp) &&
3087             !bnx2x_clear_pf_load(bp) &&
3088             bnx2x_reset_is_done(bp, BP_PATH(bp)))
3089                 bnx2x_disable_close_the_gate(bp);
3090
3091         DP(NETIF_MSG_IFUP, "Ending NIC unload\n");
3092
3093         return 0;
3094 }
3095
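/* Program the PCI PM control register to move the device between D0 and
 * D3hot; PME is enabled in D3hot only when WoL is configured. Silently
 * succeeds when the device exposes no PM capability.
 */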
3096 int bnx2x_set_power_state(struct bnx2x *bp, pci_power_t state)
3097 {
3098         u16 pmcsr;
3099
3100         /* If there is no power capability, silently succeed */
3101         if (!bp->pdev->pm_cap) {
3102                 BNX2X_DEV_INFO("No power capability. Breaking.\n");
3103                 return 0;
3104         }
3105
3106         pci_read_config_word(bp->pdev, bp->pdev->pm_cap + PCI_PM_CTRL, &pmcsr);
3107
3108         switch (state) {
3109         case PCI_D0:
3110                 pci_write_config_word(bp->pdev, bp->pdev->pm_cap + PCI_PM_CTRL,
3111                                       ((pmcsr & ~PCI_PM_CTRL_STATE_MASK) |
3112                                        PCI_PM_CTRL_PME_STATUS));
3113
3114                 if (pmcsr & PCI_PM_CTRL_STATE_MASK)
3115                         /* delay required during transition out of D3hot */
3116                         msleep(20);
3117                 break;
3118
3119         case PCI_D3hot:
3120                 /* If there are other clients above, don't
3121                    shut down the power */
3122                 if (atomic_read(&bp->pdev->enable_cnt) != 1)
3123                         return 0;
3124                 /* Don't shut down the power for emulation and FPGA */
3125                 if (CHIP_REV_IS_SLOW(bp))
3126                         return 0;
3127
3128                 pmcsr &= ~PCI_PM_CTRL_STATE_MASK;
3129                 pmcsr |= 3;
3130
3131                 if (bp->wol)
3132                         pmcsr |= PCI_PM_CTRL_PME_ENABLE;
3133
3134                 pci_write_config_word(bp->pdev, bp->pdev->pm_cap + PCI_PM_CTRL,
3135                                       pmcsr);
3136
3137                 /* No more memory access after this point until
3138                  * the device is brought back to D0.
3139                  */
3140                 break;
3141
3142         default:
3143                 dev_err(&bp->pdev->dev, "Can't support state = %d\n", state);
3144                 return -EINVAL;
3145         }
3146         return 0;
3147 }
3148
3149 /*
3150  * net_device service functions
3151  */
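/* NAPI poll handler: services Tx completions for every CoS of the
 * fastpath, then Rx up to the remaining budget, and re-enables the
 * status-block interrupt via bnx2x_ack_sb() only when no work is left.
 */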
3152 static int bnx2x_poll(struct napi_struct *napi, int budget)
3153 {
3154         int work_done = 0;
3155         u8 cos;
3156         struct bnx2x_fastpath *fp = container_of(napi, struct bnx2x_fastpath,
3157                                                  napi);
3158         struct bnx2x *bp = fp->bp;
3159
3160         while (1) {
3161 #ifdef BNX2X_STOP_ON_ERROR
3162                 if (unlikely(bp->panic)) {
3163                         napi_complete(napi);
3164                         return 0;
3165                 }
3166 #endif
3167                 if (!bnx2x_fp_lock_napi(fp))
3168                         return work_done;
3169
3170                 for_each_cos_in_tx_queue(fp, cos)
3171                         if (bnx2x_tx_queue_has_work(fp->txdata_ptr[cos]))
3172                                 bnx2x_tx_int(bp, fp->txdata_ptr[cos]);
3173
3174                 if (bnx2x_has_rx_work(fp)) {
3175                         work_done += bnx2x_rx_int(fp, budget - work_done);
3176
3177                         /* must not complete if we consumed full budget */
3178                         if (work_done >= budget) {
3179                                 bnx2x_fp_unlock_napi(fp);
3180                                 break;
3181                         }
3182                 }
3183
3184                 /* Fall out from the NAPI loop if needed */
3185                 if (!bnx2x_fp_unlock_napi(fp) &&
3186                     !(bnx2x_has_rx_work(fp) || bnx2x_has_tx_work(fp))) {
3187
3188                         /* No need to update SB for FCoE L2 ring as long as
3189                          * it's connected to the default SB and the SB
3190                          * has been updated when NAPI was scheduled.
3191                          */
3192                         if (IS_FCOE_FP(fp)) {
3193                                 napi_complete(napi);
3194                                 break;
3195                         }
3196                         bnx2x_update_fpsb_idx(fp);
3197                         /* bnx2x_has_rx_work() reads the status block,
3198                          * thus we need to ensure that status block indices
3199                          * have been actually read (bnx2x_update_fpsb_idx)
3200                          * prior to this check (bnx2x_has_rx_work) so that
3201                          * we won't write the "newer" value of the status block
3202                          * to IGU (if there was a DMA right after
3203                          * bnx2x_has_rx_work and if there is no rmb, the memory
3204                          * reading (bnx2x_update_fpsb_idx) may be postponed
3205                          * to right before bnx2x_ack_sb). In this case there
3206                          * will never be another interrupt until there is
3207                          * another update of the status block, while there
3208                          * is still unhandled work.
3209                          */
3210                         rmb();
3211
3212                         if (!(bnx2x_has_rx_work(fp) || bnx2x_has_tx_work(fp))) {
3213                                 napi_complete(napi);
3214                                 /* Re-enable interrupts */
3215                                 DP(NETIF_MSG_RX_STATUS,
3216                                    "Update index to %d\n", fp->fp_hc_idx);
3217                                 bnx2x_ack_sb(bp, fp->igu_sb_id, USTORM_ID,
3218                                              le16_to_cpu(fp->fp_hc_idx),
3219                                              IGU_INT_ENABLE, 1);
3220                                 break;
3221                         }
3222                 }
3223         }
3224
3225         return work_done;
3226 }
3227
3228 #ifdef CONFIG_NET_RX_BUSY_POLL
3229 /* must be called with local_bh_disable()d */
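/* Busy-poll entry point: bails out while the device is closed, in error
 * state or when TPA/GRO aggregation is enabled, otherwise polls up to 4
 * Rx packets under the fastpath poll lock.
 */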
3230 int bnx2x_low_latency_recv(struct napi_struct *napi)
3231 {
3232         struct bnx2x_fastpath *fp = container_of(napi, struct bnx2x_fastpath,
3233                                                  napi);
3234         struct bnx2x *bp = fp->bp;
3235         int found = 0;
3236
3237         if ((bp->state == BNX2X_STATE_CLOSED) ||
3238             (bp->state == BNX2X_STATE_ERROR) ||
3239             (bp->flags & (TPA_ENABLE_FLAG | GRO_ENABLE_FLAG)))
3240                 return LL_FLUSH_FAILED;
3241
3242         if (!bnx2x_fp_lock_poll(fp))
3243                 return LL_FLUSH_BUSY;
3244
3245         if (bnx2x_has_rx_work(fp))
3246                 found = bnx2x_rx_int(fp, 4);
3247
3248         bnx2x_fp_unlock_poll(fp);
3249
3250         return found;
3251 }
3252 #endif
3253
3254 /* we split the first BD into headers and data BDs
3255  * to ease the pain of our fellow microcode engineers;
3256  * we use one mapping for both BDs
3257  */
3258 static u16 bnx2x_tx_split(struct bnx2x *bp,
3259                           struct bnx2x_fp_txdata *txdata,
3260                           struct sw_tx_bd *tx_buf,
3261                           struct eth_tx_start_bd **tx_bd, u16 hlen,
3262                           u16 bd_prod)
3263 {
3264         struct eth_tx_start_bd *h_tx_bd = *tx_bd;
3265         struct eth_tx_bd *d_tx_bd;
3266         dma_addr_t mapping;
3267         int old_len = le16_to_cpu(h_tx_bd->nbytes);
3268
3269         /* first fix first BD */
3270         h_tx_bd->nbytes = cpu_to_le16(hlen);
3271
3272         DP(NETIF_MSG_TX_QUEUED, "TSO split header size is %d (%x:%x)\n",
3273            h_tx_bd->nbytes, h_tx_bd->addr_hi, h_tx_bd->addr_lo);
3274
3275         /* now get a new data BD
3276          * (after the pbd) and fill it */
3277         bd_prod = TX_BD(NEXT_TX_IDX(bd_prod));
3278         d_tx_bd = &txdata->tx_desc_ring[bd_prod].reg_bd;
3279
3280         mapping = HILO_U64(le32_to_cpu(h_tx_bd->addr_hi),
3281                            le32_to_cpu(h_tx_bd->addr_lo)) + hlen;
3282
3283         d_tx_bd->addr_hi = cpu_to_le32(U64_HI(mapping));
3284         d_tx_bd->addr_lo = cpu_to_le32(U64_LO(mapping));
3285         d_tx_bd->nbytes = cpu_to_le16(old_len - hlen);
3286
3287         /* this marks the BD as one that has no individual mapping */
3288         tx_buf->flags |= BNX2X_TSO_SPLIT_BD;
3289
3290         DP(NETIF_MSG_TX_QUEUED,
3291            "TSO split data size is %d (%x:%x)\n",
3292            d_tx_bd->nbytes, d_tx_bd->addr_hi, d_tx_bd->addr_lo);
3293
3294         /* update tx_bd */
3295         *tx_bd = (struct eth_tx_start_bd *)d_tx_bd;
3296
3297         return bd_prod;
3298 }
3299
3300 #define bswab32(b32) ((__force __le32) swab32((__force __u32) (b32)))
3301 #define bswab16(b16) ((__force __le16) swab16((__force __u16) (b16)))
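/* Adjust a partial checksum that was computed starting 'fix' bytes away
 * from the transport header: add or subtract the checksum of the skipped
 * region and return the result byte-swapped for the FW.
 */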
3302 static __le16 bnx2x_csum_fix(unsigned char *t_header, u16 csum, s8 fix)
3303 {
3304         __sum16 tsum = (__force __sum16) csum;
3305
3306         if (fix > 0)
3307                 tsum = ~csum_fold(csum_sub((__force __wsum) csum,
3308                                   csum_partial(t_header - fix, fix, 0)));
3309
3310         else if (fix < 0)
3311                 tsum = ~csum_fold(csum_add((__force __wsum) csum,
3312                                   csum_partial(t_header, -fix, 0)));
3313
3314         return bswab16(tsum);
3315 }
3316
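/* Classify the skb into XMIT_* flags: plain vs. IPv4/IPv6 checksum
 * offload, TCP, tunnel (encapsulated) variants on non-E1x chips, and the
 * matching GSO flavours.
 */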
3317 static u32 bnx2x_xmit_type(struct bnx2x *bp, struct sk_buff *skb)
3318 {
3319         u32 rc;
3320         __u8 prot = 0;
3321         __be16 protocol;
3322
3323         if (skb->ip_summed != CHECKSUM_PARTIAL)
3324                 return XMIT_PLAIN;
3325
3326         protocol = vlan_get_protocol(skb);
3327         if (protocol == htons(ETH_P_IPV6)) {
3328                 rc = XMIT_CSUM_V6;
3329                 prot = ipv6_hdr(skb)->nexthdr;
3330         } else {
3331                 rc = XMIT_CSUM_V4;
3332                 prot = ip_hdr(skb)->protocol;
3333         }
3334
3335         if (!CHIP_IS_E1x(bp) && skb->encapsulation) {
3336                 if (inner_ip_hdr(skb)->version == 6) {
3337                         rc |= XMIT_CSUM_ENC_V6;
3338                         if (inner_ipv6_hdr(skb)->nexthdr == IPPROTO_TCP)
3339                                 rc |= XMIT_CSUM_TCP;
3340                 } else {
3341                         rc |= XMIT_CSUM_ENC_V4;
3342                         if (inner_ip_hdr(skb)->protocol == IPPROTO_TCP)
3343                                 rc |= XMIT_CSUM_TCP;
3344                 }
3345         }
3346         if (prot == IPPROTO_TCP)
3347                 rc |= XMIT_CSUM_TCP;
3348
3349         if (skb_is_gso(skb)) {
3350                 if (skb_is_gso_v6(skb)) {
3351                         rc |= (XMIT_GSO_V6 | XMIT_CSUM_TCP);
3352                         if (rc & XMIT_CSUM_ENC)
3353                                 rc |= XMIT_GSO_ENC_V6;
3354                 } else {
3355                         rc |= (XMIT_GSO_V4 | XMIT_CSUM_TCP);
3356                         if (rc & XMIT_CSUM_ENC)
3357                                 rc |= XMIT_GSO_ENC_V4;
3358                 }
3359         }
3360
3361         return rc;
3362 }
3363
3364 #if (MAX_SKB_FRAGS >= MAX_FETCH_BD - 3)
3365 /* check if packet requires linearization (packet is too fragmented)
3366    no need to check fragmentation if page size > 8K (there will be no
3367    violation of FW restrictions) */
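/* For LSO skbs the check slides a window of (MAX_FETCH_BD - 3) consecutive
 * BDs over the linear data and the frags; every window must carry at least
 * one MSS worth of data, otherwise the skb has to be linearized. */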
3368 static int bnx2x_pkt_req_lin(struct bnx2x *bp, struct sk_buff *skb,
3369                              u32 xmit_type)
3370 {
3371         int to_copy = 0;
3372         int hlen = 0;
3373         int first_bd_sz = 0;
3374
3375         /* 3 = 1 (for linear data BD) + 2 (for PBD and last BD) */
3376         if (skb_shinfo(skb)->nr_frags >= (MAX_FETCH_BD - 3)) {
3377
3378                 if (xmit_type & XMIT_GSO) {
3379                         unsigned short lso_mss = skb_shinfo(skb)->gso_size;
3380                         /* Check if LSO packet needs to be copied:
3381                            3 = 1 (for headers BD) + 2 (for PBD and last BD) */
3382                         int wnd_size = MAX_FETCH_BD - 3;
3383                         /* Number of windows to check */
3384                         int num_wnds = skb_shinfo(skb)->nr_frags - wnd_size;
3385                         int wnd_idx = 0;
3386                         int frag_idx = 0;
3387                         u32 wnd_sum = 0;
3388
3389                         /* Headers length */
3390                         hlen = (int)(skb_transport_header(skb) - skb->data) +
3391                                 tcp_hdrlen(skb);
3392
3393                         /* Amount of data (w/o headers) on linear part of SKB */
3394                         first_bd_sz = skb_headlen(skb) - hlen;
3395
3396                         wnd_sum  = first_bd_sz;
3397
3398                         /* Calculate the first sum - it's special */
3399                         for (frag_idx = 0; frag_idx < wnd_size - 1; frag_idx++)
3400                                 wnd_sum +=
3401                                         skb_frag_size(&skb_shinfo(skb)->frags[frag_idx]);
3402
3403                         /* If there was data on linear skb data - check it */
3404                         if (first_bd_sz > 0) {
3405                                 if (unlikely(wnd_sum < lso_mss)) {
3406                                         to_copy = 1;
3407                                         goto exit_lbl;
3408                                 }
3409
3410                                 wnd_sum -= first_bd_sz;
3411                         }
3412
3413                         /* Others are easier: run through the frag list and
3414                            check all windows */
3415                         for (wnd_idx = 0; wnd_idx <= num_wnds; wnd_idx++) {
3416                                 wnd_sum +=
3417                           skb_frag_size(&skb_shinfo(skb)->frags[wnd_idx + wnd_size - 1]);
3418
3419                                 if (unlikely(wnd_sum < lso_mss)) {
3420                                         to_copy = 1;
3421                                         break;
3422                                 }
3423                                 wnd_sum -=
3424                                         skb_frag_size(&skb_shinfo(skb)->frags[wnd_idx]);
3425                         }
3426                 } else {
3427                         /* in the non-LSO case a too-fragmented packet should
3428                            always be linearized */
3429                         to_copy = 1;
3430                 }
3431         }
3432
3433 exit_lbl:
3434         if (unlikely(to_copy))
3435                 DP(NETIF_MSG_TX_QUEUED,
3436                    "Linearization IS REQUIRED for %s packet. num_frags %d  hlen %d  first_bd_sz %d\n",
3437                    (xmit_type & XMIT_GSO) ? "LSO" : "non-LSO",
3438                    skb_shinfo(skb)->nr_frags, hlen, first_bd_sz);
3439
3440         return to_copy;
3441 }
3442 #endif
3443
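/* Fill the LSO MSS field of the E2 parsing data and set the
 * IPv6-with-extension-header flag when the relevant IPv6 next header
 * (inner header for encapsulated GSO, outer otherwise) is NEXTHDR_IPV6.
 */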
3444 static void bnx2x_set_pbd_gso_e2(struct sk_buff *skb, u32 *parsing_data,
3445                                  u32 xmit_type)
3446 {
3447         struct ipv6hdr *ipv6;
3448
3449         *parsing_data |= (skb_shinfo(skb)->gso_size <<
3450                               ETH_TX_PARSE_BD_E2_LSO_MSS_SHIFT) &
3451                               ETH_TX_PARSE_BD_E2_LSO_MSS;
3452
3453         if (xmit_type & XMIT_GSO_ENC_V6)
3454                 ipv6 = inner_ipv6_hdr(skb);
3455         else if (xmit_type & XMIT_GSO_V6)
3456                 ipv6 = ipv6_hdr(skb);
3457         else
3458                 ipv6 = NULL;
3459
3460         if (ipv6 && ipv6->nexthdr == NEXTHDR_IPV6)
3461                 *parsing_data |= ETH_TX_PARSE_BD_E2_IPV6_WITH_EXT_HDR;
3462 }
3463
3464 /**
3465  * bnx2x_set_pbd_gso - update PBD in GSO case.
3466  *
3467  * @skb:        packet skb
3468  * @pbd:        parse BD
3469  * @xmit_type:  xmit flags
3470  */
3471 static void bnx2x_set_pbd_gso(struct sk_buff *skb,
3472                               struct eth_tx_parse_bd_e1x *pbd,
3473                               struct eth_tx_start_bd *tx_start_bd,
3474                               u32 xmit_type)
3475 {
3476         pbd->lso_mss = cpu_to_le16(skb_shinfo(skb)->gso_size);
3477         pbd->tcp_send_seq = bswab32(tcp_hdr(skb)->seq);
3478         pbd->tcp_flags = pbd_tcp_flags(tcp_hdr(skb));
3479
3480         if (xmit_type & XMIT_GSO_V4) {
3481                 pbd->ip_id = bswab16(ip_hdr(skb)->id);
3482                 pbd->tcp_pseudo_csum =
3483                         bswab16(~csum_tcpudp_magic(ip_hdr(skb)->saddr,
3484                                                    ip_hdr(skb)->daddr,
3485                                                    0, IPPROTO_TCP, 0));
3486
3487                 /* GSO on 57710/57711 needs FW to calculate IP checksum */
3488                 tx_start_bd->bd_flags.as_bitfield |= ETH_TX_BD_FLAGS_IP_CSUM;
3489         } else {
3490                 pbd->tcp_pseudo_csum =
3491                         bswab16(~csum_ipv6_magic(&ipv6_hdr(skb)->saddr,
3492                                                  &ipv6_hdr(skb)->daddr,
3493                                                  0, IPPROTO_TCP, 0));
3494         }
3495
3496         pbd->global_data |=
3497                 cpu_to_le16(ETH_TX_PARSE_BD_E1X_PSEUDO_CS_WITHOUT_LEN);
3498 }
3499
3500 /**
3501  * bnx2x_set_pbd_csum_enc - update PBD with checksum and return header length
3502  *
3503  * @bp:                 driver handle
3504  * @skb:                packet skb
3505  * @parsing_data:       data to be updated
3506  * @xmit_type:          xmit flags
3507  *
3508  * 57712/578xx related, when skb has encapsulation
3509  */
3510 static u8 bnx2x_set_pbd_csum_enc(struct bnx2x *bp, struct sk_buff *skb,
3511                                  u32 *parsing_data, u32 xmit_type)
3512 {
3513         *parsing_data |=
3514                 ((((u8 *)skb_inner_transport_header(skb) - skb->data) >> 1) <<
3515                 ETH_TX_PARSE_BD_E2_L4_HDR_START_OFFSET_W_SHIFT) &
3516                 ETH_TX_PARSE_BD_E2_L4_HDR_START_OFFSET_W;
3517
3518         if (xmit_type & XMIT_CSUM_TCP) {
3519                 *parsing_data |= ((inner_tcp_hdrlen(skb) / 4) <<
3520                         ETH_TX_PARSE_BD_E2_TCP_HDR_LENGTH_DW_SHIFT) &
3521                         ETH_TX_PARSE_BD_E2_TCP_HDR_LENGTH_DW;
3522
3523                 return skb_inner_transport_header(skb) +
3524                         inner_tcp_hdrlen(skb) - skb->data;
3525         }
3526
3527         /* We support checksum offload for TCP and UDP only.
3528          * No need to pass the UDP header length - it's a constant.
3529          */
3530         return skb_inner_transport_header(skb) +
3531                 sizeof(struct udphdr) - skb->data;
3532 }
3533
3534 /**
3535  * bnx2x_set_pbd_csum_e2 - update PBD with checksum and return header length
3536  *
3537  * @bp:                 driver handle
3538  * @skb:                packet skb
3539  * @parsing_data:       data to be updated
3540  * @xmit_type:          xmit flags
3541  *
3542  * 57712/578xx related
3543  */
3544 static u8 bnx2x_set_pbd_csum_e2(struct bnx2x *bp, struct sk_buff *skb,
3545                                 u32 *parsing_data, u32 xmit_type)
3546 {
3547         *parsing_data |=
3548                 ((((u8 *)skb_transport_header(skb) - skb->data) >> 1) <<
3549                 ETH_TX_PARSE_BD_E2_L4_HDR_START_OFFSET_W_SHIFT) &
3550                 ETH_TX_PARSE_BD_E2_L4_HDR_START_OFFSET_W;
3551
3552         if (xmit_type & XMIT_CSUM_TCP) {
3553                 *parsing_data |= ((tcp_hdrlen(skb) / 4) <<
3554                         ETH_TX_PARSE_BD_E2_TCP_HDR_LENGTH_DW_SHIFT) &
3555                         ETH_TX_PARSE_BD_E2_TCP_HDR_LENGTH_DW;
3556
3557                 return skb_transport_header(skb) + tcp_hdrlen(skb) - skb->data;
3558         }
3559         /* We support checksum offload for TCP and UDP only.
3560          * No need to pass the UDP header length - it's a constant.
3561          */
3562         return skb_transport_header(skb) + sizeof(struct udphdr) - skb->data;
3563 }
3564
3565 /* set FW indication according to inner or outer protocols if tunneled */
3566 static void bnx2x_set_sbd_csum(struct bnx2x *bp, struct sk_buff *skb,
3567                                struct eth_tx_start_bd *tx_start_bd,
3568                                u32 xmit_type)
3569 {
3570         tx_start_bd->bd_flags.as_bitfield |= ETH_TX_BD_FLAGS_L4_CSUM;
3571
3572         if (xmit_type & (XMIT_CSUM_ENC_V6 | XMIT_CSUM_V6))
3573                 tx_start_bd->bd_flags.as_bitfield |= ETH_TX_BD_FLAGS_IPV6;
3574
3575         if (!(xmit_type & XMIT_CSUM_TCP))
3576                 tx_start_bd->bd_flags.as_bitfield |= ETH_TX_BD_FLAGS_IS_UDP;
3577 }
3578
3579 /**
3580  * bnx2x_set_pbd_csum - update PBD with checksum and return header length
3581  *
3582  * @bp:         driver handle
3583  * @skb:        packet skb
3584  * @pbd:        parse BD to be updated
3585  * @xmit_type:  xmit flags
3586  */
3587 static u8 bnx2x_set_pbd_csum(struct bnx2x *bp, struct sk_buff *skb,
3588                              struct eth_tx_parse_bd_e1x *pbd,
3589                              u32 xmit_type)
3590 {
3591         u8 hlen = (skb_network_header(skb) - skb->data) >> 1;
3592
3593         /* for now NS flag is not used in Linux */
3594         pbd->global_data =
3595                 cpu_to_le16(hlen |
3596                             ((skb->protocol == cpu_to_be16(ETH_P_8021Q)) <<
3597                              ETH_TX_PARSE_BD_E1X_LLC_SNAP_EN_SHIFT));
3598
3599         pbd->ip_hlen_w = (skb_transport_header(skb) -
3600                         skb_network_header(skb)) >> 1;
3601
3602         hlen += pbd->ip_hlen_w;
3603
3604         /* We support checksum offload for TCP and UDP only */
3605         if (xmit_type & XMIT_CSUM_TCP)
3606                 hlen += tcp_hdrlen(skb) / 2;
3607         else
3608                 hlen += sizeof(struct udphdr) / 2;
3609
3610         pbd->total_hlen_w = cpu_to_le16(hlen);
3611         hlen = hlen*2;
3612
3613         if (xmit_type & XMIT_CSUM_TCP) {
3614                 pbd->tcp_pseudo_csum = bswab16(tcp_hdr(skb)->check);
3615
3616         } else {
3617                 s8 fix = SKB_CS_OFF(skb); /* signed! */
3618
3619                 DP(NETIF_MSG_TX_QUEUED,
3620                    "hlen %d  fix %d  csum before fix %x\n",
3621                    le16_to_cpu(pbd->total_hlen_w), fix, SKB_CS(skb));
3622
3623                 /* HW bug: fixup the CSUM */
3624                 pbd->tcp_pseudo_csum =
3625                         bnx2x_csum_fix(skb_transport_header(skb),
3626                                        SKB_CS(skb), fix);
3627
3628                 DP(NETIF_MSG_TX_QUEUED, "csum after fix %x\n",
3629                    pbd->tcp_pseudo_csum);
3630         }
3631
3632         return hlen;
3633 }
3634
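/* For tunneled GSO: fill the second parsing BD with the outer-IP-to-payload
 * header length, the outer IPv4 checksum (without the length/frag fields),
 * the inner TCP sequence/flags and pseudo checksum, and mark UDP-based
 * tunnels.
 */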
3635 static void bnx2x_update_pbds_gso_enc(struct sk_buff *skb,
3636                                       struct eth_tx_parse_bd_e2 *pbd_e2,
3637                                       struct eth_tx_parse_2nd_bd *pbd2,
3638                                       u16 *global_data,
3639                                       u32 xmit_type)
3640 {
3641         u16 hlen_w = 0;
3642         u8 outerip_off, outerip_len = 0;
3643
3644         /* from outer IP to transport */
3645         hlen_w = (skb_inner_transport_header(skb) -
3646                   skb_network_header(skb)) >> 1;
3647
3648         /* transport len */
3649         hlen_w += inner_tcp_hdrlen(skb) >> 1;
3650
3651         pbd2->fw_ip_hdr_to_payload_w = hlen_w;
3652
3653         /* outer IP header info */
3654         if (xmit_type & XMIT_CSUM_V4) {
3655                 struct iphdr *iph = ip_hdr(skb);
3656                 u32 csum = (__force u32)(~iph->check) -
3657                            (__force u32)iph->tot_len -
3658                            (__force u32)iph->frag_off;
3659
3660                 pbd2->fw_ip_csum_wo_len_flags_frag =
3661                         bswab16(csum_fold((__force __wsum)csum));
3662         } else {
3663                 pbd2->fw_ip_hdr_to_payload_w =
3664                         hlen_w - ((sizeof(struct ipv6hdr)) >> 1);
3665         }
3666
3667         pbd2->tcp_send_seq = bswab32(inner_tcp_hdr(skb)->seq);
3668
3669         pbd2->tcp_flags = pbd_tcp_flags(inner_tcp_hdr(skb));
3670
3671         if (xmit_type & XMIT_GSO_V4) {
3672                 pbd2->hw_ip_id = bswab16(inner_ip_hdr(skb)->id);
3673
3674                 pbd_e2->data.tunnel_data.pseudo_csum =
3675                         bswab16(~csum_tcpudp_magic(
3676                                         inner_ip_hdr(skb)->saddr,
3677                                         inner_ip_hdr(skb)->daddr,
3678                                         0, IPPROTO_TCP, 0));
3679
3680                 outerip_len = ip_hdr(skb)->ihl << 1;
3681         } else {
3682                 pbd_e2->data.tunnel_data.pseudo_csum =
3683                         bswab16(~csum_ipv6_magic(
3684                                         &inner_ipv6_hdr(skb)->saddr,
3685                                         &inner_ipv6_hdr(skb)->daddr,
3686                                         0, IPPROTO_TCP, 0));
3687         }
3688
3689         outerip_off = (skb_network_header(skb) - skb->data) >> 1;
3690
3691         *global_data |=
3692                 outerip_off |
3693                 (!!(xmit_type & XMIT_CSUM_V6) <<
3694                         ETH_TX_PARSE_2ND_BD_IP_HDR_TYPE_OUTER_SHIFT) |
3695                 (outerip_len <<
3696                         ETH_TX_PARSE_2ND_BD_IP_HDR_LEN_OUTER_W_SHIFT) |
3697                 ((skb->protocol == cpu_to_be16(ETH_P_8021Q)) <<
3698                         ETH_TX_PARSE_2ND_BD_LLC_SNAP_EN_SHIFT);
3699
3700         if (ip_hdr(skb)->protocol == IPPROTO_UDP) {
3701                 SET_FLAG(*global_data, ETH_TX_PARSE_2ND_BD_TUNNEL_UDP_EXIST, 1);
3702                 pbd2->tunnel_udp_hdr_start_w = skb_transport_offset(skb) >> 1;
3703         }
3704 }
3705
3706 /* called with netif_tx_lock
3707  * bnx2x_tx_int() runs without netif_tx_lock unless it needs to call
3708  * netif_wake_queue()
3709  */
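/* BD layout per packet: a start BD, one or two parsing BDs, an optional
 * split-off data BD holding the TSO headers, and one BD per fragment; the
 * doorbell write, after the memory barriers, hands them to the FW.
 */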
3710 netdev_tx_t bnx2x_start_xmit(struct sk_buff *skb, struct net_device *dev)
3711 {
3712         struct bnx2x *bp = netdev_priv(dev);
3713
3714         struct netdev_queue *txq;
3715         struct bnx2x_fp_txdata *txdata;
3716         struct sw_tx_bd *tx_buf;
3717         struct eth_tx_start_bd *tx_start_bd, *first_bd;
3718         struct eth_tx_bd *tx_data_bd, *total_pkt_bd = NULL;
3719         struct eth_tx_parse_bd_e1x *pbd_e1x = NULL;
3720         struct eth_tx_parse_bd_e2 *pbd_e2 = NULL;
3721         struct eth_tx_parse_2nd_bd *pbd2 = NULL;
3722         u32 pbd_e2_parsing_data = 0;
3723         u16 pkt_prod, bd_prod;
3724         int nbd, txq_index;
3725         dma_addr_t mapping;
3726         u32 xmit_type = bnx2x_xmit_type(bp, skb);
3727         int i;
3728         u8 hlen = 0;
3729         __le16 pkt_size = 0;
3730         struct ethhdr *eth;
3731         u8 mac_type = UNICAST_ADDRESS;
3732
3733 #ifdef BNX2X_STOP_ON_ERROR
3734         if (unlikely(bp->panic))
3735                 return NETDEV_TX_BUSY;
3736 #endif
3737
3738         txq_index = skb_get_queue_mapping(skb);
3739         txq = netdev_get_tx_queue(dev, txq_index);
3740
3741         BUG_ON(txq_index >= MAX_ETH_TXQ_IDX(bp) + (CNIC_LOADED(bp) ? 1 : 0));
3742
3743         txdata = &bp->bnx2x_txq[txq_index];
3744
3745         /* enable this debug print to view the transmission queue being used
3746         DP(NETIF_MSG_TX_QUEUED, "indices: txq %d, fp %d, txdata %d\n",
3747            txq_index, fp_index, txdata_index); */
3748
3749         /* enable this debug print to view the transmission details
3750         DP(NETIF_MSG_TX_QUEUED,
3751            "transmitting packet cid %d fp index %d txdata_index %d tx_data ptr %p fp pointer %p\n",
3752            txdata->cid, fp_index, txdata_index, txdata, fp); */
3753
3754         if (unlikely(bnx2x_tx_avail(bp, txdata) <
3755                         skb_shinfo(skb)->nr_frags +
3756                         BDS_PER_TX_PKT +
3757                         NEXT_CNT_PER_TX_PKT(MAX_BDS_PER_TX_PKT))) {
3758                 /* Handle special storage cases separately */
3759                 if (txdata->tx_ring_size == 0) {
3760                         struct bnx2x_eth_q_stats *q_stats =
3761                                 bnx2x_fp_qstats(bp, txdata->parent_fp);
3762                         q_stats->driver_filtered_tx_pkt++;
3763                         dev_kfree_skb(skb);
3764                         return NETDEV_TX_OK;
3765                 }
3766                 bnx2x_fp_qstats(bp, txdata->parent_fp)->driver_xoff++;
3767                 netif_tx_stop_queue(txq);
3768                 BNX2X_ERR("BUG! Tx ring full when queue awake!\n");
3769
3770                 return NETDEV_TX_BUSY;
3771         }
3772
3773         DP(NETIF_MSG_TX_QUEUED,
3774            "queue[%d]: SKB: summed %x  protocol %x protocol(%x,%x) gso type %x  xmit_type %x len %d\n",
3775            txq_index, skb->ip_summed, skb->protocol, ipv6_hdr(skb)->nexthdr,
3776            ip_hdr(skb)->protocol, skb_shinfo(skb)->gso_type, xmit_type,
3777            skb->len);
3778
3779         eth = (struct ethhdr *)skb->data;
3780
3781         /* set flag according to packet type (UNICAST_ADDRESS is default)*/
3782         if (unlikely(is_multicast_ether_addr(eth->h_dest))) {
3783                 if (is_broadcast_ether_addr(eth->h_dest))
3784                         mac_type = BROADCAST_ADDRESS;
3785                 else
3786                         mac_type = MULTICAST_ADDRESS;
3787         }
3788
3789 #if (MAX_SKB_FRAGS >= MAX_FETCH_BD - BDS_PER_TX_PKT)
3790         /* First, check if we need to linearize the skb (due to FW
3791            restrictions). No need to check fragmentation if page size > 8K
3792            (there will be no violation to FW restrictions) */
3793         if (bnx2x_pkt_req_lin(bp, skb, xmit_type)) {
3794                 /* Statistics of linearization */
3795                 bp->lin_cnt++;
3796                 if (skb_linearize(skb) != 0) {
3797                         DP(NETIF_MSG_TX_QUEUED,
3798                            "SKB linearization failed - silently dropping this SKB\n");
3799                         dev_kfree_skb_any(skb);
3800                         return NETDEV_TX_OK;
3801                 }
3802         }
3803 #endif
3804         /* Map skb linear data for DMA */
3805         mapping = dma_map_single(&bp->pdev->dev, skb->data,
3806                                  skb_headlen(skb), DMA_TO_DEVICE);
3807         if (unlikely(dma_mapping_error(&bp->pdev->dev, mapping))) {
3808                 DP(NETIF_MSG_TX_QUEUED,
3809                    "SKB mapping failed - silently dropping this SKB\n");
3810                 dev_kfree_skb_any(skb);
3811                 return NETDEV_TX_OK;
3812         }
3813         /*
3814         Please read carefully. First we use one BD which we mark as start,
3815         then we have a parsing info BD (used for TSO or xsum),
3816         and only then we have the rest of the TSO BDs.
3817         (don't forget to mark the last one as last,
3818         and to unmap only AFTER you write to the BD ...)
3819         And above all, all PBD sizes are in words - NOT DWORDS!
3820         */
3821
3822         /* get current pkt produced now - advance it just before sending packet
3823          * since mapping of pages may fail and cause packet to be dropped
3824          */
3825         pkt_prod = txdata->tx_pkt_prod;
3826         bd_prod = TX_BD(txdata->tx_bd_prod);
3827
3828         /* get a tx_buf and first BD
3829          * tx_start_bd may be changed during SPLIT,
3830          * but first_bd will always stay first
3831          */
3832         tx_buf = &txdata->tx_buf_ring[TX_BD(pkt_prod)];
3833         tx_start_bd = &txdata->tx_desc_ring[bd_prod].start_bd;
3834         first_bd = tx_start_bd;
3835
3836         tx_start_bd->bd_flags.as_bitfield = ETH_TX_BD_FLAGS_START_BD;
3837
3838         /* header nbd: indirectly zero other flags! */
3839         tx_start_bd->general_data = 1 << ETH_TX_START_BD_HDR_NBDS_SHIFT;
3840
3841         /* remember the first BD of the packet */
3842         tx_buf->first_bd = txdata->tx_bd_prod;
3843         tx_buf->skb = skb;
3844         tx_buf->flags = 0;
3845
3846         DP(NETIF_MSG_TX_QUEUED,
3847            "sending pkt %u @%p  next_idx %u  bd %u @%p\n",
3848            pkt_prod, tx_buf, txdata->tx_pkt_prod, bd_prod, tx_start_bd);
3849
3850         if (vlan_tx_tag_present(skb)) {
3851                 tx_start_bd->vlan_or_ethertype =
3852                     cpu_to_le16(vlan_tx_tag_get(skb));
3853                 tx_start_bd->bd_flags.as_bitfield |=
3854                     (X_ETH_OUTBAND_VLAN << ETH_TX_BD_FLAGS_VLAN_MODE_SHIFT);
3855         } else {
3856                 /* when transmitting in a VF, the start BD must hold the ethertype
3857                  * for the FW to enforce it
3858                  */
3859                 if (IS_VF(bp))
3860                         tx_start_bd->vlan_or_ethertype =
3861                                 cpu_to_le16(ntohs(eth->h_proto));
3862                 else
3863                         /* used by FW for packet accounting */
3864                         tx_start_bd->vlan_or_ethertype = cpu_to_le16(pkt_prod);
3865         }
3866
3867         nbd = 2; /* start_bd + pbd + frags (updated when pages are mapped) */
3868
3869         /* turn on parsing and get a BD */
3870         bd_prod = TX_BD(NEXT_TX_IDX(bd_prod));
3871
3872         if (xmit_type & XMIT_CSUM)
3873                 bnx2x_set_sbd_csum(bp, skb, tx_start_bd, xmit_type);
3874
3875         if (!CHIP_IS_E1x(bp)) {
3876                 pbd_e2 = &txdata->tx_desc_ring[bd_prod].parse_bd_e2;
3877                 memset(pbd_e2, 0, sizeof(struct eth_tx_parse_bd_e2));
3878
3879                 if (xmit_type & XMIT_CSUM_ENC) {
3880                         u16 global_data = 0;
3881
3882                         /* Set PBD in enc checksum offload case */
3883                         hlen = bnx2x_set_pbd_csum_enc(bp, skb,
3884                                                       &pbd_e2_parsing_data,
3885                                                       xmit_type);
3886
3887                         /* turn on 2nd parsing and get a BD */
3888                         bd_prod = TX_BD(NEXT_TX_IDX(bd_prod));
3889
3890                         pbd2 = &txdata->tx_desc_ring[bd_prod].parse_2nd_bd;
3891
3892                         memset(pbd2, 0, sizeof(*pbd2));
3893
3894                         pbd_e2->data.tunnel_data.ip_hdr_start_inner_w =
3895                                 (skb_inner_network_header(skb) -
3896                                  skb->data) >> 1;
3897
3898                         if (xmit_type & XMIT_GSO_ENC)
3899                                 bnx2x_update_pbds_gso_enc(skb, pbd_e2, pbd2,
3900                                                           &global_data,
3901                                                           xmit_type);
3902
3903                         pbd2->global_data = cpu_to_le16(global_data);
3904
3905                         /* add additional parsing BD indication to the start BD */
3906                         SET_FLAG(tx_start_bd->general_data,
3907                                  ETH_TX_START_BD_PARSE_NBDS, 1);
3908                         /* set encapsulation flag in start BD */
3909                         SET_FLAG(tx_start_bd->general_data,
3910                                  ETH_TX_START_BD_TUNNEL_EXIST, 1);
3911
3912                         tx_buf->flags |= BNX2X_HAS_SECOND_PBD;
3913
3914                         nbd++;
3915                 } else if (xmit_type & XMIT_CSUM) {
3916                         /* Set PBD in checksum offload case w/o encapsulation */
3917                         hlen = bnx2x_set_pbd_csum_e2(bp, skb,
3918                                                      &pbd_e2_parsing_data,
3919                                                      xmit_type);
3920                 }
3921
3922                 /* Add the macs to the parsing BD if this is a vf or if
3923                  * Tx Switching is enabled.
3924                  */
3925                 if (IS_VF(bp)) {
3926                         /* override GRE parameters in BD */
3927                         bnx2x_set_fw_mac_addr(&pbd_e2->data.mac_addr.src_hi,
3928                                               &pbd_e2->data.mac_addr.src_mid,
3929                                               &pbd_e2->data.mac_addr.src_lo,
3930                                               eth->h_source);
3931
3932                         bnx2x_set_fw_mac_addr(&pbd_e2->data.mac_addr.dst_hi,
3933                                               &pbd_e2->data.mac_addr.dst_mid,
3934                                               &pbd_e2->data.mac_addr.dst_lo,
3935                                               eth->h_dest);
3936                 } else if (bp->flags & TX_SWITCHING) {
3937                         bnx2x_set_fw_mac_addr(&pbd_e2->data.mac_addr.dst_hi,
3938                                               &pbd_e2->data.mac_addr.dst_mid,
3939                                               &pbd_e2->data.mac_addr.dst_lo,
3940                                               eth->h_dest);
3941                 }
3942
3943                 SET_FLAG(pbd_e2_parsing_data,
3944                          ETH_TX_PARSE_BD_E2_ETH_ADDR_TYPE, mac_type);
3945         } else {
3946                 u16 global_data = 0;
3947                 pbd_e1x = &txdata->tx_desc_ring[bd_prod].parse_bd_e1x;
3948                 memset(pbd_e1x, 0, sizeof(struct eth_tx_parse_bd_e1x));
3949                 /* Set PBD in checksum offload case */
3950                 if (xmit_type & XMIT_CSUM)
3951                         hlen = bnx2x_set_pbd_csum(bp, skb, pbd_e1x, xmit_type);
3952
3953                 SET_FLAG(global_data,
3954                          ETH_TX_PARSE_BD_E1X_ETH_ADDR_TYPE, mac_type);
3955                 pbd_e1x->global_data |= cpu_to_le16(global_data);
3956         }
3957
3958         /* Setup the data pointer of the first BD of the packet */
3959         tx_start_bd->addr_hi = cpu_to_le32(U64_HI(mapping));
3960         tx_start_bd->addr_lo = cpu_to_le32(U64_LO(mapping));
3961         tx_start_bd->nbytes = cpu_to_le16(skb_headlen(skb));
3962         pkt_size = tx_start_bd->nbytes;
3963
3964         DP(NETIF_MSG_TX_QUEUED,
3965            "first bd @%p  addr (%x:%x)  nbytes %d  flags %x  vlan %x\n",
3966            tx_start_bd, tx_start_bd->addr_hi, tx_start_bd->addr_lo,
3967            le16_to_cpu(tx_start_bd->nbytes),
3968            tx_start_bd->bd_flags.as_bitfield,
3969            le16_to_cpu(tx_start_bd->vlan_or_ethertype));
3970
3971         if (xmit_type & XMIT_GSO) {
3972
3973                 DP(NETIF_MSG_TX_QUEUED,
3974                    "TSO packet len %d  hlen %d  total len %d  tso size %d\n",
3975                    skb->len, hlen, skb_headlen(skb),
3976                    skb_shinfo(skb)->gso_size);
3977
3978                 tx_start_bd->bd_flags.as_bitfield |= ETH_TX_BD_FLAGS_SW_LSO;
3979
3980                 if (unlikely(skb_headlen(skb) > hlen)) {
3981                         nbd++;
3982                         bd_prod = bnx2x_tx_split(bp, txdata, tx_buf,
3983                                                  &tx_start_bd, hlen,
3984                                                  bd_prod);
3985                 }
3986                 if (!CHIP_IS_E1x(bp))
3987                         bnx2x_set_pbd_gso_e2(skb, &pbd_e2_parsing_data,
3988                                              xmit_type);
3989                 else
3990                         bnx2x_set_pbd_gso(skb, pbd_e1x, first_bd, xmit_type);
3991         }
3992
3993         /* Set the PBD's parsing_data field if not zero
3994          * (for the chips newer than 57711).
3995          */
3996         if (pbd_e2_parsing_data)
3997                 pbd_e2->parsing_data = cpu_to_le32(pbd_e2_parsing_data);
3998
3999         tx_data_bd = (struct eth_tx_bd *)tx_start_bd;
4000
4001         /* Handle fragmented skb */
4002         for (i = 0; i < skb_shinfo(skb)->nr_frags; i++) {
4003                 skb_frag_t *frag = &skb_shinfo(skb)->frags[i];
4004
4005                 mapping = skb_frag_dma_map(&bp->pdev->dev, frag, 0,
4006                                            skb_frag_size(frag), DMA_TO_DEVICE);
4007                 if (unlikely(dma_mapping_error(&bp->pdev->dev, mapping))) {
4008                         unsigned int pkts_compl = 0, bytes_compl = 0;
4009
4010                         DP(NETIF_MSG_TX_QUEUED,
4011                            "Unable to map page - dropping packet...\n");
4012
4013                         /* we need to unmap all buffers already mapped
4014                          * for this SKB;
4015                          * first_bd->nbd needs to be properly updated
4016                          * before the call to bnx2x_free_tx_pkt
4017                          */
4018                         first_bd->nbd = cpu_to_le16(nbd);
4019                         bnx2x_free_tx_pkt(bp, txdata,
4020                                           TX_BD(txdata->tx_pkt_prod),
4021                                           &pkts_compl, &bytes_compl);
4022                         return NETDEV_TX_OK;
4023                 }
4024
4025                 bd_prod = TX_BD(NEXT_TX_IDX(bd_prod));
4026                 tx_data_bd = &txdata->tx_desc_ring[bd_prod].reg_bd;
4027                 if (total_pkt_bd == NULL)
4028                         total_pkt_bd = &txdata->tx_desc_ring[bd_prod].reg_bd;
4029
4030                 tx_data_bd->addr_hi = cpu_to_le32(U64_HI(mapping));
4031                 tx_data_bd->addr_lo = cpu_to_le32(U64_LO(mapping));
4032                 tx_data_bd->nbytes = cpu_to_le16(skb_frag_size(frag));
4033                 le16_add_cpu(&pkt_size, skb_frag_size(frag));
4034                 nbd++;
4035
4036                 DP(NETIF_MSG_TX_QUEUED,
4037                    "frag %d  bd @%p  addr (%x:%x)  nbytes %d\n",
4038                    i, tx_data_bd, tx_data_bd->addr_hi, tx_data_bd->addr_lo,
4039                    le16_to_cpu(tx_data_bd->nbytes));
4040         }
4041
4042         DP(NETIF_MSG_TX_QUEUED, "last bd @%p\n", tx_data_bd);
4043
4044         /* update with actual num BDs */
4045         first_bd->nbd = cpu_to_le16(nbd);
4046
4047         bd_prod = TX_BD(NEXT_TX_IDX(bd_prod));
4048
4049         /* now send a tx doorbell, counting the next-page pointer BD
4050          * if the packet contains or ends with it
4051          */
4052         if (TX_BD_POFF(bd_prod) < nbd)
4053                 nbd++;
4054
4055         /* total_pkt_bytes should be set on the first data BD if
4056          * it's not an LSO packet and there is more than one
4057          * data BD. In this case pkt_size is limited by an MTU value.
4058          * However we prefer to set it for an LSO packet too (while we don't
4059          * have to) in order to save some CPU cycles in the non-LSO
4060          * case, where we care much more about them.
4061          */
4062         if (total_pkt_bd != NULL)
4063                 total_pkt_bd->total_pkt_bytes = pkt_size;
4064
4065         if (pbd_e1x)
4066                 DP(NETIF_MSG_TX_QUEUED,
4067                    "PBD (E1X) @%p  ip_data %x  ip_hlen %u  ip_id %u  lso_mss %u  tcp_flags %x  xsum %x  seq %u  hlen %u\n",
4068                    pbd_e1x, pbd_e1x->global_data, pbd_e1x->ip_hlen_w,
4069                    pbd_e1x->ip_id, pbd_e1x->lso_mss, pbd_e1x->tcp_flags,
4070                    pbd_e1x->tcp_pseudo_csum, pbd_e1x->tcp_send_seq,
4071                     le16_to_cpu(pbd_e1x->total_hlen_w));
4072         if (pbd_e2)
4073                 DP(NETIF_MSG_TX_QUEUED,
4074                    "PBD (E2) @%p  dst %x %x %x src %x %x %x parsing_data %x\n",
4075                    pbd_e2,
4076                    pbd_e2->data.mac_addr.dst_hi,
4077                    pbd_e2->data.mac_addr.dst_mid,
4078                    pbd_e2->data.mac_addr.dst_lo,
4079                    pbd_e2->data.mac_addr.src_hi,
4080                    pbd_e2->data.mac_addr.src_mid,
4081                    pbd_e2->data.mac_addr.src_lo,
4082                    pbd_e2->parsing_data);
4083         DP(NETIF_MSG_TX_QUEUED, "doorbell: nbd %d  bd %u\n", nbd, bd_prod);
4084
4085         netdev_tx_sent_queue(txq, skb->len);
4086
4087         skb_tx_timestamp(skb);
4088
4089         txdata->tx_pkt_prod++;
4090         /*
4091          * Make sure that the BD data is updated before updating the producer
4092          * since FW might read the BD right after the producer is updated.
4093          * This is only applicable for weak-ordered memory model archs such
4094          * as IA-64. The following barrier is also mandatory since the FW
4095          * assumes packets must have BDs.
4096          */
4097         wmb();
4098
4099         txdata->tx_db.data.prod += nbd;
4100         barrier();
4101
4102         DOORBELL(bp, txdata->cid, txdata->tx_db.raw);
4103
4104         mmiowb();
4105
4106         txdata->tx_bd_prod += nbd;
4107
4108         if (unlikely(bnx2x_tx_avail(bp, txdata) < MAX_DESC_PER_TX_PKT)) {
4109                 netif_tx_stop_queue(txq);
4110
4111                 /* paired memory barrier is in bnx2x_tx_int(), we have to keep
4112                  * ordering of set_bit() in netif_tx_stop_queue() and read of
4113                  * fp->bd_tx_cons */
4114                 smp_mb();
4115
4116                 bnx2x_fp_qstats(bp, txdata->parent_fp)->driver_xoff++;
4117                 if (bnx2x_tx_avail(bp, txdata) >= MAX_DESC_PER_TX_PKT)
4118                         netif_tx_wake_queue(txq);
4119         }
4120         txdata->tx_pkt++;
4121
4122         return NETDEV_TX_OK;
4123 }
4124
4125 /**
4126  * bnx2x_setup_tc - routine to configure the net_device for multiple traffic classes
4127  *
4128  * @dev: net device to configure
4129  * @num_tc: number of traffic classes to enable
4130  *
4131  * callback connected to the ndo_setup_tc function pointer
4132  */
4133 int bnx2x_setup_tc(struct net_device *dev, u8 num_tc)
4134 {
4135         int cos, prio, count, offset;
4136         struct bnx2x *bp = netdev_priv(dev);
4137
4138         /* setup tc must be called under rtnl lock */
4139         ASSERT_RTNL();
4140
4141         /* no traffic classes requested. Aborting */
4142         if (!num_tc) {
4143                 netdev_reset_tc(dev);
4144                 return 0;
4145         }
4146
4147         /* requested to support too many traffic classes */
4148         if (num_tc > bp->max_cos) {
4149                 BNX2X_ERR("support for too many traffic classes requested: %d. Max supported is %d\n",
4150                           num_tc, bp->max_cos);
4151                 return -EINVAL;
4152         }
4153
4154         /* declare amount of supported traffic classes */
4155         if (netdev_set_num_tc(dev, num_tc)) {
4156                 BNX2X_ERR("failed to declare %d traffic classes\n", num_tc);
4157                 return -EINVAL;
4158         }
4159
4160         /* configure priority to traffic class mapping */
4161         for (prio = 0; prio < BNX2X_MAX_PRIORITY; prio++) {
4162                 netdev_set_prio_tc_map(dev, prio, bp->prio_to_cos[prio]);
4163                 DP(BNX2X_MSG_SP | NETIF_MSG_IFUP,
4164                    "mapping priority %d to tc %d\n",
4165                    prio, bp->prio_to_cos[prio]);
4166         }
4167
4168         /* Use this configuration to differentiate tc0 from other COSes.
4169            This can be used for ETS or PFC, and saves the effort of setting
4170            up a multi-class queueing discipline or negotiating DCBX with a switch:
4171         netdev_set_prio_tc_map(dev, 0, 0);
4172         DP(BNX2X_MSG_SP, "mapping priority %d to tc %d\n", 0, 0);
4173         for (prio = 1; prio < 16; prio++) {
4174                 netdev_set_prio_tc_map(dev, prio, 1);
4175                 DP(BNX2X_MSG_SP, "mapping priority %d to tc %d\n", prio, 1);
4176         } */
4177
4178         /* configure traffic class to transmission queue mapping */
4179         for (cos = 0; cos < bp->max_cos; cos++) {
4180                 count = BNX2X_NUM_ETH_QUEUES(bp);
4181                 offset = cos * BNX2X_NUM_NON_CNIC_QUEUES(bp);
4182                 netdev_set_tc_queue(dev, cos, count, offset);
4183                 DP(BNX2X_MSG_SP | NETIF_MSG_IFUP,
4184                    "mapping tc %d to offset %d count %d\n",
4185                    cos, offset, count);
4186         }
4187
4188         return 0;
4189 }
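
/* Worked example for the mapping above (hypothetical numbers, nothing read
 * from a device): with 4 ETH queues, no CNIC queue and bp->max_cos == 3, the
 * loop calls netdev_set_tc_queue() as
 *
 *	tc 0 -> offset 0, count 4	(txqs 0..3)
 *	tc 1 -> offset 4, count 4	(txqs 4..7)
 *	tc 2 -> offset 8, count 4	(txqs 8..11)
 *
 * so for a given skb the stack first resolves prio -> tc through the
 * prio_to_cos table programmed above and then picks a txq inside
 * [offset, offset + count) of that tc.
 */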
4190
4191 /* called with rtnl_lock */
4192 int bnx2x_change_mac_addr(struct net_device *dev, void *p)
4193 {
4194         struct sockaddr *addr = p;
4195         struct bnx2x *bp = netdev_priv(dev);
4196         int rc = 0;
4197
4198         if (!bnx2x_is_valid_ether_addr(bp, addr->sa_data)) {
4199                 BNX2X_ERR("Requested MAC address is not valid\n");
4200                 return -EINVAL;
4201         }
4202
4203         if ((IS_MF_STORAGE_SD(bp) || IS_MF_FCOE_AFEX(bp)) &&
4204             !is_zero_ether_addr(addr->sa_data)) {
4205                 BNX2X_ERR("Can't configure non-zero address on iSCSI or FCoE functions in MF-SD mode\n");
4206                 return -EINVAL;
4207         }
4208
4209         if (netif_running(dev)) {
4210                 rc = bnx2x_set_eth_mac(bp, false);
4211                 if (rc)
4212                         return rc;
4213         }
4214
4215         memcpy(dev->dev_addr, addr->sa_data, dev->addr_len);
4216
4217         if (netif_running(dev))
4218                 rc = bnx2x_set_eth_mac(bp, true);
4219
4220         return rc;
4221 }
4222
4223 static void bnx2x_free_fp_mem_at(struct bnx2x *bp, int fp_index)
4224 {
4225         union host_hc_status_block *sb = &bnx2x_fp(bp, fp_index, status_blk);
4226         struct bnx2x_fastpath *fp = &bp->fp[fp_index];
4227         u8 cos;
4228
4229         /* Common */
4230
4231         if (IS_FCOE_IDX(fp_index)) {
4232                 memset(sb, 0, sizeof(union host_hc_status_block));
4233                 fp->status_blk_mapping = 0;
4234         } else {
4235                 /* status blocks */
4236                 if (!CHIP_IS_E1x(bp))
4237                         BNX2X_PCI_FREE(sb->e2_sb,
4238                                        bnx2x_fp(bp, fp_index,
4239                                                 status_blk_mapping),
4240                                        sizeof(struct host_hc_status_block_e2));
4241                 else
4242                         BNX2X_PCI_FREE(sb->e1x_sb,
4243                                        bnx2x_fp(bp, fp_index,
4244                                                 status_blk_mapping),
4245                                        sizeof(struct host_hc_status_block_e1x));
4246         }
4247
4248         /* Rx */
4249         if (!skip_rx_queue(bp, fp_index)) {
4250                 bnx2x_free_rx_bds(fp);
4251
4252                 /* fastpath rx rings: rx_buf rx_desc rx_comp */
4253                 BNX2X_FREE(bnx2x_fp(bp, fp_index, rx_buf_ring));
4254                 BNX2X_PCI_FREE(bnx2x_fp(bp, fp_index, rx_desc_ring),
4255                                bnx2x_fp(bp, fp_index, rx_desc_mapping),
4256                                sizeof(struct eth_rx_bd) * NUM_RX_BD);
4257
4258                 BNX2X_PCI_FREE(bnx2x_fp(bp, fp_index, rx_comp_ring),
4259                                bnx2x_fp(bp, fp_index, rx_comp_mapping),
4260                                sizeof(struct eth_fast_path_rx_cqe) *
4261                                NUM_RCQ_BD);
4262
4263                 /* SGE ring */
4264                 BNX2X_FREE(bnx2x_fp(bp, fp_index, rx_page_ring));
4265                 BNX2X_PCI_FREE(bnx2x_fp(bp, fp_index, rx_sge_ring),
4266                                bnx2x_fp(bp, fp_index, rx_sge_mapping),
4267                                BCM_PAGE_SIZE * NUM_RX_SGE_PAGES);
4268         }
4269
4270         /* Tx */
4271         if (!skip_tx_queue(bp, fp_index)) {
4272                 /* fastpath tx rings: tx_buf tx_desc */
4273                 for_each_cos_in_tx_queue(fp, cos) {
4274                         struct bnx2x_fp_txdata *txdata = fp->txdata_ptr[cos];
4275
4276                         DP(NETIF_MSG_IFDOWN,
4277                            "freeing tx memory of fp %d cos %d cid %d\n",
4278                            fp_index, cos, txdata->cid);
4279
4280                         BNX2X_FREE(txdata->tx_buf_ring);
4281                         BNX2X_PCI_FREE(txdata->tx_desc_ring,
4282                                 txdata->tx_desc_mapping,
4283                                 sizeof(union eth_tx_bd_types) * NUM_TX_BD);
4284                 }
4285         }
4286         /* end of fastpath */
4287 }
4288
4289 static void bnx2x_free_fp_mem_cnic(struct bnx2x *bp)
4290 {
4291         int i;
4292         for_each_cnic_queue(bp, i)
4293                 bnx2x_free_fp_mem_at(bp, i);
4294 }
4295
4296 void bnx2x_free_fp_mem(struct bnx2x *bp)
4297 {
4298         int i;
4299         for_each_eth_queue(bp, i)
4300                 bnx2x_free_fp_mem_at(bp, i);
4301 }
4302
4303 static void set_sb_shortcuts(struct bnx2x *bp, int index)
4304 {
4305         union host_hc_status_block status_blk = bnx2x_fp(bp, index, status_blk);
4306         if (!CHIP_IS_E1x(bp)) {
4307                 bnx2x_fp(bp, index, sb_index_values) =
4308                         (__le16 *)status_blk.e2_sb->sb.index_values;
4309                 bnx2x_fp(bp, index, sb_running_index) =
4310                         (__le16 *)status_blk.e2_sb->sb.running_index;
4311         } else {
4312                 bnx2x_fp(bp, index, sb_index_values) =
4313                         (__le16 *)status_blk.e1x_sb->sb.index_values;
4314                 bnx2x_fp(bp, index, sb_running_index) =
4315                         (__le16 *)status_blk.e1x_sb->sb.running_index;
4316         }
4317 }
4318
4319 /* Returns the number of actually allocated BDs */
4320 static int bnx2x_alloc_rx_bds(struct bnx2x_fastpath *fp,
4321                               int rx_ring_size)
4322 {
4323         struct bnx2x *bp = fp->bp;
4324         u16 ring_prod, cqe_ring_prod;
4325         int i, failure_cnt = 0;
4326
4327         fp->rx_comp_cons = 0;
4328         cqe_ring_prod = ring_prod = 0;
4329
4330         /* This routine is called only during init, so
4331          * fp->eth_q_stats.rx_skb_alloc_failed = 0
4332          */
4333         for (i = 0; i < rx_ring_size; i++) {
4334                 if (bnx2x_alloc_rx_data(bp, fp, ring_prod, GFP_KERNEL) < 0) {
4335                         failure_cnt++;
4336                         continue;
4337                 }
4338                 ring_prod = NEXT_RX_IDX(ring_prod);
4339                 cqe_ring_prod = NEXT_RCQ_IDX(cqe_ring_prod);
4340                 WARN_ON(ring_prod <= (i - failure_cnt));
4341         }
4342
4343         if (failure_cnt)
4344                 BNX2X_ERR("was only able to allocate %d rx skbs on queue[%d]\n",
4345                           i - failure_cnt, fp->index);
4346
4347         fp->rx_bd_prod = ring_prod;
4348         /* Limit the CQE producer by the CQE ring size */
4349         fp->rx_comp_prod = min_t(u16, NUM_RCQ_RINGS*RCQ_DESC_CNT,
4350                                cqe_ring_prod);
4351         fp->rx_pkt = fp->rx_calls = 0;
4352
4353         bnx2x_fp_stats(bp, fp)->eth_q_stats.rx_skb_alloc_failed += failure_cnt;
4354
4355         return i - failure_cnt;
4356 }
4357
4358 static void bnx2x_set_next_page_rx_cq(struct bnx2x_fastpath *fp)
4359 {
4360         int i;
4361
4362         for (i = 1; i <= NUM_RCQ_RINGS; i++) {
4363                 struct eth_rx_cqe_next_page *nextpg;
4364
4365                 nextpg = (struct eth_rx_cqe_next_page *)
4366                         &fp->rx_comp_ring[RCQ_DESC_CNT * i - 1];
4367                 nextpg->addr_hi =
4368                         cpu_to_le32(U64_HI(fp->rx_comp_mapping +
4369                                    BCM_PAGE_SIZE*(i % NUM_RCQ_RINGS)));
4370                 nextpg->addr_lo =
4371                         cpu_to_le32(U64_LO(fp->rx_comp_mapping +
4372                                    BCM_PAGE_SIZE*(i % NUM_RCQ_RINGS)));
4373         }
4374 }
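
/* Worked example for the chaining above (ring count assumed purely for
 * illustration): with NUM_RCQ_RINGS == 8, the last CQE of page 0 becomes a
 * next-page pointer to page 1, page 1 points to page 2, and so on; for
 * i == 8 the (i % NUM_RCQ_RINGS) term wraps the last CQE of page 7 back to
 * page 0, closing the completion ring.
 */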
4375
4376 static int bnx2x_alloc_fp_mem_at(struct bnx2x *bp, int index)
4377 {
4378         union host_hc_status_block *sb;
4379         struct bnx2x_fastpath *fp = &bp->fp[index];
4380         int ring_size = 0;
4381         u8 cos;
4382         int rx_ring_size = 0;
4383
4384         if (!bp->rx_ring_size &&
4385             (IS_MF_STORAGE_SD(bp) || IS_MF_FCOE_AFEX(bp))) {
4386                 rx_ring_size = MIN_RX_SIZE_NONTPA;
4387                 bp->rx_ring_size = rx_ring_size;
4388         } else if (!bp->rx_ring_size) {
4389                 rx_ring_size = MAX_RX_AVAIL/BNX2X_NUM_RX_QUEUES(bp);
4390
4391                 if (CHIP_IS_E3(bp)) {
4392                         u32 cfg = SHMEM_RD(bp,
4393                                            dev_info.port_hw_config[BP_PORT(bp)].
4394                                            default_cfg);
4395
4396                         /* Decrease ring size for 1G functions */
4397                         if ((cfg & PORT_HW_CFG_NET_SERDES_IF_MASK) ==
4398                             PORT_HW_CFG_NET_SERDES_IF_SGMII)
4399                                 rx_ring_size /= 10;
4400                 }
4401
4402                 /* allocate at least the number of buffers required by the FW */
4403                 rx_ring_size = max_t(int, bp->disable_tpa ? MIN_RX_SIZE_NONTPA :
4404                                      MIN_RX_SIZE_TPA, rx_ring_size);
4405
4406                 bp->rx_ring_size = rx_ring_size;
4407         } else /* if rx_ring_size specified - use it */
4408                 rx_ring_size = bp->rx_ring_size;
4409
4410         DP(BNX2X_MSG_SP, "calculated rx_ring_size %d\n", rx_ring_size);
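
        /* Worked sizing example (hypothetical values, nothing read from HW):
         * with 8 RX queues, TPA enabled and no user-set bp->rx_ring_size, the
         * branch above yields rx_ring_size = max(MIN_RX_SIZE_TPA,
         * MAX_RX_AVAIL / 8); an E3 port strapped as 1G SGMII first divides
         * the per-queue estimate by 10 before that clamp is applied.
         */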
4411
4412         /* Common */
4413         sb = &bnx2x_fp(bp, index, status_blk);
4414
4415         if (!IS_FCOE_IDX(index)) {
4416                 /* status blocks */
4417                 if (!CHIP_IS_E1x(bp)) {
4418                         sb->e2_sb = BNX2X_PCI_ALLOC(&bnx2x_fp(bp, index, status_blk_mapping),
4419                                                     sizeof(struct host_hc_status_block_e2));
4420                         if (!sb->e2_sb)
4421                                 goto alloc_mem_err;
4422                 } else {
4423                         sb->e1x_sb = BNX2X_PCI_ALLOC(&bnx2x_fp(bp, index, status_blk_mapping),
4424                                                      sizeof(struct host_hc_status_block_e1x));
4425                         if (!sb->e1x_sb)
4426                                 goto alloc_mem_err;
4427                 }
4428         }
4429
4430         /* FCoE Queue uses Default SB and doesn't ACK the SB, thus no need to
4431          * set shortcuts for it.
4432          */
4433         if (!IS_FCOE_IDX(index))
4434                 set_sb_shortcuts(bp, index);
4435
4436         /* Tx */
4437         if (!skip_tx_queue(bp, index)) {
4438                 /* fastpath tx rings: tx_buf tx_desc */
4439                 for_each_cos_in_tx_queue(fp, cos) {
4440                         struct bnx2x_fp_txdata *txdata = fp->txdata_ptr[cos];
4441
4442                         DP(NETIF_MSG_IFUP,
4443                            "allocating tx memory of fp %d cos %d\n",
4444                            index, cos);
4445
4446                         txdata->tx_buf_ring = kcalloc(NUM_TX_BD,
4447                                                       sizeof(struct sw_tx_bd),
4448                                                       GFP_KERNEL);
4449                         if (!txdata->tx_buf_ring)
4450                                 goto alloc_mem_err;
4451                         txdata->tx_desc_ring = BNX2X_PCI_ALLOC(&txdata->tx_desc_mapping,
4452                                                                sizeof(union eth_tx_bd_types) * NUM_TX_BD);
4453                         if (!txdata->tx_desc_ring)
4454                                 goto alloc_mem_err;
4455                 }
4456         }
4457
4458         /* Rx */
4459         if (!skip_rx_queue(bp, index)) {
4460                 /* fastpath rx rings: rx_buf rx_desc rx_comp */
4461                 bnx2x_fp(bp, index, rx_buf_ring) =
4462                         kcalloc(NUM_RX_BD, sizeof(struct sw_rx_bd), GFP_KERNEL);
4463                 if (!bnx2x_fp(bp, index, rx_buf_ring))
4464                         goto alloc_mem_err;
4465                 bnx2x_fp(bp, index, rx_desc_ring) =
4466                         BNX2X_PCI_ALLOC(&bnx2x_fp(bp, index, rx_desc_mapping),
4467                                         sizeof(struct eth_rx_bd) * NUM_RX_BD);
4468                 if (!bnx2x_fp(bp, index, rx_desc_ring))
4469                         goto alloc_mem_err;
4470
4471                 /* Seed all CQEs by 1s */
4472                 bnx2x_fp(bp, index, rx_comp_ring) =
4473                         BNX2X_PCI_FALLOC(&bnx2x_fp(bp, index, rx_comp_mapping),
4474                                          sizeof(struct eth_fast_path_rx_cqe) * NUM_RCQ_BD);
4475                 if (!bnx2x_fp(bp, index, rx_comp_ring))
4476                         goto alloc_mem_err;
4477
4478                 /* SGE ring */
4479                 bnx2x_fp(bp, index, rx_page_ring) =
4480                         kcalloc(NUM_RX_SGE, sizeof(struct sw_rx_page),
4481                                 GFP_KERNEL);
4482                 if (!bnx2x_fp(bp, index, rx_page_ring))
4483                         goto alloc_mem_err;
4484                 bnx2x_fp(bp, index, rx_sge_ring) =
4485                         BNX2X_PCI_ALLOC(&bnx2x_fp(bp, index, rx_sge_mapping),
4486                                         BCM_PAGE_SIZE * NUM_RX_SGE_PAGES);
4487                 if (!bnx2x_fp(bp, index, rx_sge_ring))
4488                         goto alloc_mem_err;
4489                 /* RX BD ring */
4490                 bnx2x_set_next_page_rx_bd(fp);
4491
4492                 /* CQ ring */
4493                 bnx2x_set_next_page_rx_cq(fp);
4494
4495                 /* BDs */
4496                 ring_size = bnx2x_alloc_rx_bds(fp, rx_ring_size);
4497                 if (ring_size < rx_ring_size)
4498                         goto alloc_mem_err;
4499         }
4500
4501         return 0;
4502
4503 /* handles low memory cases */
4504 alloc_mem_err:
4505         BNX2X_ERR("Unable to allocate full memory for queue %d (size %d)\n",
4506                                                 index, ring_size);
4507         /* FW will drop all packets if the queue is not big enough.
4508          * In that case we disable the queue.
4509          * The minimum size differs for OOO, TPA and non-TPA queues.
4510          */
4511         if (ring_size < (fp->disable_tpa ?
4512                          MIN_RX_SIZE_NONTPA : MIN_RX_SIZE_TPA)) {
4513                 /* release memory allocated for this queue */
4514                 bnx2x_free_fp_mem_at(bp, index);
4515                 return -ENOMEM;
4516         }
4517         return 0;
4518 }
4519
4520 static int bnx2x_alloc_fp_mem_cnic(struct bnx2x *bp)
4521 {
4522         if (!NO_FCOE(bp))
4523                 /* FCoE */
4524                 if (bnx2x_alloc_fp_mem_at(bp, FCOE_IDX(bp)))
4525                         /* we will fail the load process instead of
4526                          * marking NO_FCOE_FLAG
4527                          */
4528                         return -ENOMEM;
4529
4530         return 0;
4531 }
4532
4533 static int bnx2x_alloc_fp_mem(struct bnx2x *bp)
4534 {
4535         int i;
4536
4537         /* 1. Allocate FP for leading - fatal if error
4538          * 2. Allocate RSS - fix number of queues if error
4539          */
4540
4541         /* leading */
4542         if (bnx2x_alloc_fp_mem_at(bp, 0))
4543                 return -ENOMEM;
4544
4545         /* RSS */
4546         for_each_nondefault_eth_queue(bp, i)
4547                 if (bnx2x_alloc_fp_mem_at(bp, i))
4548                         break;
4549
4550         /* handle memory failures */
4551         if (i != BNX2X_NUM_ETH_QUEUES(bp)) {
4552                 int delta = BNX2X_NUM_ETH_QUEUES(bp) - i;
4553
4554                 WARN_ON(delta < 0);
4555                 bnx2x_shrink_eth_fp(bp, delta);
4556                 if (CNIC_SUPPORT(bp))
4557                         /* move non-eth FPs next to the last eth FP;
4558                          * this must be done in the following order:
4559                          * FCOE_IDX < FWD_IDX < OOO_IDX
4560                          */
4561
4562                         /* move the FCoE fp even if NO_FCOE_FLAG is on */
4563                         bnx2x_move_fp(bp, FCOE_IDX(bp), FCOE_IDX(bp) - delta);
4564                 bp->num_ethernet_queues -= delta;
4565                 bp->num_queues = bp->num_ethernet_queues +
4566                                  bp->num_cnic_queues;
4567                 BNX2X_ERR("Adjusted num of queues from %d to %d\n",
4568                           bp->num_queues + delta, bp->num_queues);
4569         }
4570
4571         return 0;
4572 }
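
/* Worked example for the fallback above (queue counts assumed): if 8 RSS
 * queues were requested but allocation first fails at i == 5, then delta == 3,
 * the last three eth fastpaths are dropped and, when CNIC is supported, the
 * FCoE fastpath is moved from FCOE_IDX(bp) to FCOE_IDX(bp) - 3 so that it
 * still sits right after the last surviving eth queue.
 */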
4573
4574 void bnx2x_free_mem_bp(struct bnx2x *bp)
4575 {
4576         int i;
4577
4578         for (i = 0; i < bp->fp_array_size; i++)
4579                 kfree(bp->fp[i].tpa_info);
4580         kfree(bp->fp);
4581         kfree(bp->sp_objs);
4582         kfree(bp->fp_stats);
4583         kfree(bp->bnx2x_txq);
4584         kfree(bp->msix_table);
4585         kfree(bp->ilt);
4586 }
4587
4588 int bnx2x_alloc_mem_bp(struct bnx2x *bp)
4589 {
4590         struct bnx2x_fastpath *fp;
4591         struct msix_entry *tbl;
4592         struct bnx2x_ilt *ilt;
4593         int msix_table_size = 0;
4594         int fp_array_size, txq_array_size;
4595         int i;
4596
4597         /*
4598          * The biggest MSI-X table we might need is the maximum number of
4599          * fastpath IGU SBs plus the default SB (for the PF only).
4600          */
4601         msix_table_size = bp->igu_sb_cnt;
4602         if (IS_PF(bp))
4603                 msix_table_size++;
4604         BNX2X_DEV_INFO("msix_table_size %d\n", msix_table_size);
4605
4606         /* fp array: RSS plus CNIC related L2 queues */
4607         fp_array_size = BNX2X_MAX_RSS_COUNT(bp) + CNIC_SUPPORT(bp);
4608         bp->fp_array_size = fp_array_size;
4609         BNX2X_DEV_INFO("fp_array_size %d\n", bp->fp_array_size);
4610
4611         fp = kcalloc(bp->fp_array_size, sizeof(*fp), GFP_KERNEL);
4612         if (!fp)
4613                 goto alloc_err;
4614         for (i = 0; i < bp->fp_array_size; i++) {
4615                 fp[i].tpa_info =
4616                         kcalloc(ETH_MAX_AGGREGATION_QUEUES_E1H_E2,
4617                                 sizeof(struct bnx2x_agg_info), GFP_KERNEL);
4618                 if (!(fp[i].tpa_info))
4619                         goto alloc_err;
4620         }
4621
4622         bp->fp = fp;
4623
4624         /* allocate sp objs */
4625         bp->sp_objs = kcalloc(bp->fp_array_size, sizeof(struct bnx2x_sp_objs),
4626                               GFP_KERNEL);
4627         if (!bp->sp_objs)
4628                 goto alloc_err;
4629
4630         /* allocate fp_stats */
4631         bp->fp_stats = kcalloc(bp->fp_array_size, sizeof(struct bnx2x_fp_stats),
4632                                GFP_KERNEL);
4633         if (!bp->fp_stats)
4634                 goto alloc_err;
4635
4636         /* Allocate memory for the transmission queues array */
4637         txq_array_size =
4638                 BNX2X_MAX_RSS_COUNT(bp) * BNX2X_MULTI_TX_COS + CNIC_SUPPORT(bp);
4639         BNX2X_DEV_INFO("txq_array_size %d\n", txq_array_size);
4640
4641         bp->bnx2x_txq = kcalloc(txq_array_size, sizeof(struct bnx2x_fp_txdata),
4642                                 GFP_KERNEL);
4643         if (!bp->bnx2x_txq)
4644                 goto alloc_err;
4645
4646         /* msix table */
4647         tbl = kcalloc(msix_table_size, sizeof(*tbl), GFP_KERNEL);
4648         if (!tbl)
4649                 goto alloc_err;
4650         bp->msix_table = tbl;
4651
4652         /* ilt */
4653         ilt = kzalloc(sizeof(*ilt), GFP_KERNEL);
4654         if (!ilt)
4655                 goto alloc_err;
4656         bp->ilt = ilt;
4657
4658         return 0;
4659 alloc_err:
4660         bnx2x_free_mem_bp(bp);
4661         return -ENOMEM;
4662 }
4663
4664 int bnx2x_reload_if_running(struct net_device *dev)
4665 {
4666         struct bnx2x *bp = netdev_priv(dev);
4667
4668         if (unlikely(!netif_running(dev)))
4669                 return 0;
4670
4671         bnx2x_nic_unload(bp, UNLOAD_NORMAL, true);
4672         return bnx2x_nic_load(bp, LOAD_NORMAL);
4673 }
4674
4675 int bnx2x_get_cur_phy_idx(struct bnx2x *bp)
4676 {
4677         u32 sel_phy_idx = 0;
4678         if (bp->link_params.num_phys <= 1)
4679                 return INT_PHY;
4680
4681         if (bp->link_vars.link_up) {
4682                 sel_phy_idx = EXT_PHY1;
4683                 /* In case link is SERDES, check if the EXT_PHY2 is the one */
4684                 if ((bp->link_vars.link_status & LINK_STATUS_SERDES_LINK) &&
4685                     (bp->link_params.phy[EXT_PHY2].supported & SUPPORTED_FIBRE))
4686                         sel_phy_idx = EXT_PHY2;
4687         } else {
4688
4689                 switch (bnx2x_phy_selection(&bp->link_params)) {
4690                 case PORT_HW_CFG_PHY_SELECTION_HARDWARE_DEFAULT:
4691                 case PORT_HW_CFG_PHY_SELECTION_FIRST_PHY:
4692                 case PORT_HW_CFG_PHY_SELECTION_FIRST_PHY_PRIORITY:
4693                        sel_phy_idx = EXT_PHY1;
4694                        break;
4695                 case PORT_HW_CFG_PHY_SELECTION_SECOND_PHY:
4696                 case PORT_HW_CFG_PHY_SELECTION_SECOND_PHY_PRIORITY:
4697                        sel_phy_idx = EXT_PHY2;
4698                        break;
4699                 }
4700         }
4701
4702         return sel_phy_idx;
4703 }
4704 int bnx2x_get_link_cfg_idx(struct bnx2x *bp)
4705 {
4706         u32 sel_phy_idx = bnx2x_get_cur_phy_idx(bp);
4707         /*
4708          * The selected active PHY index is always the post-swap index (when
4709          * PHY swapping is enabled), so when swapping is enabled we need to
4710          * reverse the mapping to get the link-configuration index.
4711          */
4712
4713         if (bp->link_params.multi_phy_config &
4714             PORT_HW_CFG_PHY_SWAPPED_ENABLED) {
4715                 if (sel_phy_idx == EXT_PHY1)
4716                         sel_phy_idx = EXT_PHY2;
4717                 else if (sel_phy_idx == EXT_PHY2)
4718                         sel_phy_idx = EXT_PHY1;
4719         }
4720         return LINK_CONFIG_IDX(sel_phy_idx);
4721 }
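
/* Illustration of the swap handling above: with PHY swapping enabled, an
 * active EXT_PHY1 is configured through the EXT_PHY2 slot and vice versa,
 * while INT_PHY is unaffected; LINK_CONFIG_IDX() then turns the (possibly
 * swapped) PHY index into the index used for the link configuration arrays.
 */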
4722
4723 #ifdef NETDEV_FCOE_WWNN
4724 int bnx2x_fcoe_get_wwn(struct net_device *dev, u64 *wwn, int type)
4725 {
4726         struct bnx2x *bp = netdev_priv(dev);
4727         struct cnic_eth_dev *cp = &bp->cnic_eth_dev;
4728
4729         switch (type) {
4730         case NETDEV_FCOE_WWNN:
4731                 *wwn = HILO_U64(cp->fcoe_wwn_node_name_hi,
4732                                 cp->fcoe_wwn_node_name_lo);
4733                 break;
4734         case NETDEV_FCOE_WWPN:
4735                 *wwn = HILO_U64(cp->fcoe_wwn_port_name_hi,
4736                                 cp->fcoe_wwn_port_name_lo);
4737                 break;
4738         default:
4739                 BNX2X_ERR("Wrong WWN type requested - %d\n", type);
4740                 return -EINVAL;
4741         }
4742
4743         return 0;
4744 }
4745 #endif
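
/* Each WWN above is carried in the cnic_eth_dev as two 32-bit halves;
 * HILO_U64() is assumed to combine them as in the sketch below (illustration
 * only, not compiled):
 *
 *	u64 wwnn = ((u64)cp->fcoe_wwn_node_name_hi << 32) |
 *		   cp->fcoe_wwn_node_name_lo;
 */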
4746
4747 /* called with rtnl_lock */
4748 int bnx2x_change_mtu(struct net_device *dev, int new_mtu)
4749 {
4750         struct bnx2x *bp = netdev_priv(dev);
4751
4752         if (bp->recovery_state != BNX2X_RECOVERY_DONE) {
4753                 BNX2X_ERR("Can't perform change MTU during parity recovery\n");
4754                 return -EAGAIN;
4755         }
4756
4757         if ((new_mtu > ETH_MAX_JUMBO_PACKET_SIZE) ||
4758             ((new_mtu + ETH_HLEN) < ETH_MIN_PACKET_SIZE)) {
4759                 BNX2X_ERR("Can't support requested MTU size\n");
4760                 return -EINVAL;
4761         }
4762
4763         /* This does not race with packet allocation
4764          * because the actual alloc size is
4765          * only updated as part of load
4766          */
4767         dev->mtu = new_mtu;
4768
4769         return bnx2x_reload_if_running(dev);
4770 }
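
/* Range example for the check above (ETH_HLEN comes from <linux/if_ether.h>,
 * the other limits are driver constants): with ETH_HLEN == 14 the accepted
 * MTU range is [ETH_MIN_PACKET_SIZE - 14, ETH_MAX_JUMBO_PACKET_SIZE].
 */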
4771
4772 netdev_features_t bnx2x_fix_features(struct net_device *dev,
4773                                      netdev_features_t features)
4774 {
4775         struct bnx2x *bp = netdev_priv(dev);
4776
4777         /* TPA requires Rx CSUM offloading */
4778         if (!(features & NETIF_F_RXCSUM) || bp->disable_tpa) {
4779                 features &= ~NETIF_F_LRO;
4780                 features &= ~NETIF_F_GRO;
4781         }
4782
4783         return features;
4784 }
4785
4786 int bnx2x_set_features(struct net_device *dev, netdev_features_t features)
4787 {
4788         struct bnx2x *bp = netdev_priv(dev);
4789         u32 flags = bp->flags;
4790         u32 changes;
4791         bool bnx2x_reload = false;
4792
4793         if (features & NETIF_F_LRO)
4794                 flags |= TPA_ENABLE_FLAG;
4795         else
4796                 flags &= ~TPA_ENABLE_FLAG;
4797
4798         if (features & NETIF_F_GRO)
4799                 flags |= GRO_ENABLE_FLAG;
4800         else
4801                 flags &= ~GRO_ENABLE_FLAG;
4802
4803         if (features & NETIF_F_LOOPBACK) {
4804                 if (bp->link_params.loopback_mode != LOOPBACK_BMAC) {
4805                         bp->link_params.loopback_mode = LOOPBACK_BMAC;
4806                         bnx2x_reload = true;
4807                 }
4808         } else {
4809                 if (bp->link_params.loopback_mode != LOOPBACK_NONE) {
4810                         bp->link_params.loopback_mode = LOOPBACK_NONE;
4811                         bnx2x_reload = true;
4812                 }
4813         }
4814
4815         changes = flags ^ bp->flags;
4816
4817         /* if GRO is changed while LRO is enabled, don't force a reload */
4818         if ((changes & GRO_ENABLE_FLAG) && (flags & TPA_ENABLE_FLAG))
4819                 changes &= ~GRO_ENABLE_FLAG;
4820
4821         if (changes)
4822                 bnx2x_reload = true;
4823
4824         bp->flags = flags;
4825
4826         if (bnx2x_reload) {
4827                 if (bp->recovery_state == BNX2X_RECOVERY_DONE)
4828                         return bnx2x_reload_if_running(dev);
4829                 /* else: bnx2x_nic_load() will be called at end of recovery */
4830         }
4831
4832         return 0;
4833 }
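
/* Example of the reload decision above: turning GRO on or off while LRO
 * (TPA) stays enabled only flips GRO_ENABLE_FLAG, which is masked out of
 * 'changes', so no reload happens; toggling LRO itself, or NETIF_F_LOOPBACK,
 * triggers a reload once the device is running and recovery is done.
 */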
4834
4835 void bnx2x_tx_timeout(struct net_device *dev)
4836 {
4837         struct bnx2x *bp = netdev_priv(dev);
4838
4839 #ifdef BNX2X_STOP_ON_ERROR
4840         if (!bp->panic)
4841                 bnx2x_panic();
4842 #endif
4843
4844         /* This allows the netif to be shut down gracefully before resetting */
4845         bnx2x_schedule_sp_rtnl(bp, BNX2X_SP_RTNL_TX_TIMEOUT, 0);
4846 }
4847
4848 int bnx2x_suspend(struct pci_dev *pdev, pm_message_t state)
4849 {
4850         struct net_device *dev = pci_get_drvdata(pdev);
4851         struct bnx2x *bp;
4852
4853         if (!dev) {
4854                 dev_err(&pdev->dev, "BAD net device from bnx2x_init_one\n");
4855                 return -ENODEV;
4856         }
4857         bp = netdev_priv(dev);
4858
4859         rtnl_lock();
4860
4861         pci_save_state(pdev);
4862
4863         if (!netif_running(dev)) {
4864                 rtnl_unlock();
4865                 return 0;
4866         }
4867
4868         netif_device_detach(dev);
4869
4870         bnx2x_nic_unload(bp, UNLOAD_CLOSE, false);
4871
4872         bnx2x_set_power_state(bp, pci_choose_state(pdev, state));
4873
4874         rtnl_unlock();
4875
4876         return 0;
4877 }
4878
4879 int bnx2x_resume(struct pci_dev *pdev)
4880 {
4881         struct net_device *dev = pci_get_drvdata(pdev);
4882         struct bnx2x *bp;
4883         int rc;
4884
4885         if (!dev) {
4886                 dev_err(&pdev->dev, "BAD net device from bnx2x_init_one\n");
4887                 return -ENODEV;
4888         }
4889         bp = netdev_priv(dev);
4890
4891         if (bp->recovery_state != BNX2X_RECOVERY_DONE) {
4892                 BNX2X_ERR("Handling parity error recovery. Try again later\n");
4893                 return -EAGAIN;
4894         }
4895
4896         rtnl_lock();
4897
4898         pci_restore_state(pdev);
4899
4900         if (!netif_running(dev)) {
4901                 rtnl_unlock();
4902                 return 0;
4903         }
4904
4905         bnx2x_set_power_state(bp, PCI_D0);
4906         netif_device_attach(dev);
4907
4908         rc = bnx2x_nic_load(bp, LOAD_OPEN);
4909
4910         rtnl_unlock();
4911
4912         return rc;
4913 }
4914
4915 void bnx2x_set_ctx_validation(struct bnx2x *bp, struct eth_context *cxt,
4916                               u32 cid)
4917 {
4918         if (!cxt) {
4919                 BNX2X_ERR("bad context pointer %p\n", cxt);
4920                 return;
4921         }
4922
4923         /* ustorm cxt validation */
4924         cxt->ustorm_ag_context.cdu_usage =
4925                 CDU_RSRVD_VALUE_TYPE_A(HW_CID(bp, cid),
4926                         CDU_REGION_NUMBER_UCM_AG, ETH_CONNECTION_TYPE);
4927         /* xcontext validation */
4928         cxt->xstorm_ag_context.cdu_reserved =
4929                 CDU_RSRVD_VALUE_TYPE_A(HW_CID(bp, cid),
4930                         CDU_REGION_NUMBER_XCM_AG, ETH_CONNECTION_TYPE);
4931 }
4932
4933 static void storm_memset_hc_timeout(struct bnx2x *bp, u8 port,
4934                                     u8 fw_sb_id, u8 sb_index,
4935                                     u8 ticks)
4936 {
4937         u32 addr = BAR_CSTRORM_INTMEM +
4938                    CSTORM_STATUS_BLOCK_DATA_TIMEOUT_OFFSET(fw_sb_id, sb_index);
4939         REG_WR8(bp, addr, ticks);
4940         DP(NETIF_MSG_IFUP,
4941            "port %x fw_sb_id %d sb_index %d ticks %d\n",
4942            port, fw_sb_id, sb_index, ticks);
4943 }
4944
4945 static void storm_memset_hc_disable(struct bnx2x *bp, u8 port,
4946                                     u16 fw_sb_id, u8 sb_index,
4947                                     u8 disable)
4948 {
4949         u32 enable_flag = disable ? 0 : (1 << HC_INDEX_DATA_HC_ENABLED_SHIFT);
4950         u32 addr = BAR_CSTRORM_INTMEM +
4951                    CSTORM_STATUS_BLOCK_DATA_FLAGS_OFFSET(fw_sb_id, sb_index);
4952         u8 flags = REG_RD8(bp, addr);
4953         /* clear and set */
4954         flags &= ~HC_INDEX_DATA_HC_ENABLED;
4955         flags |= enable_flag;
4956         REG_WR8(bp, addr, flags);
4957         DP(NETIF_MSG_IFUP,
4958            "port %x fw_sb_id %d sb_index %d disable %d\n",
4959            port, fw_sb_id, sb_index, disable);
4960 }
4961
4962 void bnx2x_update_coalesce_sb_index(struct bnx2x *bp, u8 fw_sb_id,
4963                                     u8 sb_index, u8 disable, u16 usec)
4964 {
4965         int port = BP_PORT(bp);
4966         u8 ticks = usec / BNX2X_BTR;
4967
4968         storm_memset_hc_timeout(bp, port, fw_sb_id, sb_index, ticks);
4969
4970         disable = disable ? 1 : (usec ? 0 : 1);
4971         storm_memset_hc_disable(bp, port, fw_sb_id, sb_index, disable);
4972 }
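
/* Worked coalescing example (BNX2X_BTR value assumed for illustration): with
 * BNX2X_BTR == 4, a request of usec == 100 programs ticks == 25 into the
 * status block timeout; usec == 0, or an explicit disable, clears
 * HC_INDEX_DATA_HC_ENABLED for that SB index so coalescing is turned off.
 */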
4973
4974 void bnx2x_schedule_sp_rtnl(struct bnx2x *bp, enum sp_rtnl_flag flag,
4975                             u32 verbose)
4976 {
4977         smp_mb__before_atomic();
4978         set_bit(flag, &bp->sp_rtnl_state);
4979         smp_mb__after_atomic();
4980         DP((BNX2X_MSG_SP | verbose), "Scheduling sp_rtnl task [Flag: %d]\n",
4981            flag);
4982         schedule_delayed_work(&bp->sp_rtnl_task, 0);
4983 }
4984 EXPORT_SYMBOL(bnx2x_schedule_sp_rtnl);