2 * Copyright (C) 2005 - 2013 Emulex
5 * This program is free software; you can redistribute it and/or
6 * modify it under the terms of the GNU General Public License version 2
7 * as published by the Free Software Foundation. The full GNU General
8 * Public License is included in this distribution in the file called COPYING.
10 * Contact Information:
11 * linux-drivers@emulex.com
15 * Costa Mesa, CA 92626
21 #include <linux/pci.h>
22 #include <linux/etherdevice.h>
23 #include <linux/delay.h>
27 #include <linux/if_vlan.h>
28 #include <linux/workqueue.h>
29 #include <linux/interrupt.h>
30 #include <linux/firmware.h>
31 #include <linux/slab.h>
32 #include <linux/u64_stats_sync.h>
37 #define DRV_VER "4.9.134.0u"
38 #define DRV_NAME "be2net"
39 #define BE_NAME "Emulex BladeEngine2"
40 #define BE3_NAME "Emulex BladeEngine3"
41 #define OC_NAME "Emulex OneConnect"
42 #define OC_NAME_BE OC_NAME "(be3)"
43 #define OC_NAME_LANCER OC_NAME "(Lancer)"
44 #define OC_NAME_SH OC_NAME "(Skyhawk)"
45 #define DRV_DESC "Emulex OneConnect 10Gbps NIC Driver"
47 #define BE_VENDOR_ID 0x19a2
48 #define EMULEX_VENDOR_ID 0x10df
49 #define BE_DEVICE_ID1 0x211
50 #define BE_DEVICE_ID2 0x221
51 #define OC_DEVICE_ID1 0x700 /* Device Id for BE2 cards */
52 #define OC_DEVICE_ID2 0x710 /* Device Id for BE3 cards */
53 #define OC_DEVICE_ID3 0xe220 /* Device id for Lancer cards */
54 #define OC_DEVICE_ID4 0xe228 /* Device id for VF in Lancer */
55 #define OC_DEVICE_ID5 0x720 /* Device Id for Skyhawk cards */
56 #define OC_DEVICE_ID6 0x728 /* Device id for VF in SkyHawk */
57 #define OC_SUBSYS_DEVICE_ID1 0xE602
58 #define OC_SUBSYS_DEVICE_ID2 0xE642
59 #define OC_SUBSYS_DEVICE_ID3 0xE612
60 #define OC_SUBSYS_DEVICE_ID4 0xE652
62 static inline char *nic_name(struct pci_dev *pdev)
64 switch (pdev->device) {
71 return OC_NAME_LANCER;
82 /* Number of bytes of an RX frame that are copied to skb->data */
83 #define BE_HDR_LEN ((u16) 64)
84 /* allocate extra space to allow tunneling decapsulation without head reallocation */
85 #define BE_RX_SKB_ALLOC_SIZE (BE_HDR_LEN + 64)
87 #define BE_MAX_JUMBO_FRAME_SIZE 9018
88 #define BE_MIN_MTU 256
90 #define BE_NUM_VLANS_SUPPORTED 64
91 #define BE_UMC_NUM_VLANS_SUPPORTED 15
92 #define BE_MAX_EQD 128u
93 #define BE_MAX_TX_FRAG_COUNT 30
95 #define EVNT_Q_LEN 1024
97 #define TX_CQ_LEN 1024
98 #define RX_Q_LEN 1024 /* Does not support any other value */
99 #define RX_CQ_LEN 1024
100 #define MCC_Q_LEN 128 /* total size not to exceed 8 pages */
101 #define MCC_CQ_LEN 256
103 #define BE2_MAX_RSS_QS 4
104 #define BE3_MAX_RSS_QS 16
105 #define BE3_MAX_TX_QS 16
106 #define BE3_MAX_EVT_QS 16
109 #define MAX_EVT_QS 32
112 #define MAX_ROCE_EQS 5
113 #define MAX_MSIX_VECTORS 32
114 #define MIN_MSIX_VECTORS 1
115 #define BE_TX_BUDGET 256
116 #define BE_NAPI_WEIGHT 64
117 #define MAX_RX_POST BE_NAPI_WEIGHT /* Frags posted at a time */
118 #define RX_FRAGS_REFILL_WM (RX_Q_LEN - MAX_RX_POST)
120 #define MAX_VFS 30 /* Max VFs supported by BE3 FW */
121 #define FW_VER_LEN 32
129 struct be_queue_info {
130 struct be_dma_mem dma_mem;
132 u16 entry_size; /* Size of an element in the queue */
136 atomic_t used; /* Number of valid elements in the queue */
139 static inline u32 MODULO(u16 val, u16 limit)
141 BUG_ON(limit & (limit - 1));
142 return val & (limit - 1);
145 static inline void index_adv(u16 *index, u16 val, u16 limit)
147 *index = MODULO((*index + val), limit);
150 static inline void index_inc(u16 *index, u16 limit)
152 *index = MODULO((*index + 1), limit);
155 static inline void *queue_head_node(struct be_queue_info *q)
157 return q->dma_mem.va + q->head * q->entry_size;
160 static inline void *queue_tail_node(struct be_queue_info *q)
162 return q->dma_mem.va + q->tail * q->entry_size;
165 static inline void *queue_index_node(struct be_queue_info *q, u16 index)
167 return q->dma_mem.va + index * q->entry_size;
170 static inline void queue_head_inc(struct be_queue_info *q)
172 index_inc(&q->head, q->len);
175 static inline void index_dec(u16 *index, u16 limit)
177 *index = MODULO((*index - 1), limit);
180 static inline void queue_tail_inc(struct be_queue_info *q)
182 index_inc(&q->tail, q->len);
186 struct be_queue_info q;
189 /* Adaptive interrupt coalescing (AIC) info */
191 u32 min_eqd; /* in usecs */
192 u32 max_eqd; /* in usecs */
193 u32 eqd; /* configured val when aic is off */
194 u32 cur_eqd; /* in usecs */
196 u8 idx; /* array index */
200 struct napi_struct napi;
201 struct be_adapter *adapter;
202 } ____cacheline_aligned_in_smp;
204 struct be_aic_obj { /* Adaptive interrupt coalescing (AIC) info */
206 u32 min_eqd; /* in usecs */
207 u32 max_eqd; /* in usecs */
208 u32 prev_eqd; /* in usecs */
209 u32 et_eqd; /* configured val when aic is off */
211 u64 rx_pkts_prev; /* Used to calculate RX pps */
212 u64 tx_reqs_prev; /* Used to calculate TX pps */
216 struct be_queue_info q;
217 struct be_queue_info cq;
229 u32 tx_drv_drops; /* pkts dropped by driver */
230 struct u64_stats_sync sync;
231 struct u64_stats_sync sync_compl;
236 struct be_queue_info q;
237 struct be_queue_info cq;
238 /* Remember the skbs that were transmitted */
239 struct sk_buff *sent_skb_list[TX_Q_LEN];
240 struct be_tx_stats stats;
241 } ____cacheline_aligned_in_smp;
243 /* Struct to remember the pages posted for rx frags */
244 struct be_rx_page_info {
246 DEFINE_DMA_UNMAP_ADDR(bus);
254 u32 rx_drops_no_skbs; /* skb allocation errors */
255 u32 rx_drops_no_frags; /* HW has no fetched frags */
256 u32 rx_post_fail; /* page post alloc failures */
259 u32 rx_compl_err; /* completions with err set */
260 struct u64_stats_sync sync;
263 struct be_rx_compl_info {
284 struct be_adapter *adapter;
285 struct be_queue_info q;
286 struct be_queue_info cq;
287 struct be_rx_compl_info rxcp;
288 struct be_rx_page_info page_info_tbl[RX_Q_LEN];
289 struct be_rx_stats stats;
291 bool rx_post_starved; /* Zero rx frags have been posted to BE */
292 } ____cacheline_aligned_in_smp;
294 struct be_drv_stats {
295 u32 be_on_die_temperature;
297 u32 rx_drops_no_pbuf;
298 u32 rx_drops_no_txpb;
299 u32 rx_drops_no_erx_descr;
300 u32 rx_drops_no_tpre_descr;
301 u32 rx_drops_too_many_frags;
302 u32 forwarded_packets;
305 u32 rx_alignment_symbol_errors;
307 u32 rx_priority_pause_frames;
308 u32 rx_control_frames;
309 u32 rx_in_range_errors;
310 u32 rx_out_range_errors;
311 u32 rx_frame_too_long;
312 u32 rx_address_filtered;
313 u32 rx_dropped_too_small;
314 u32 rx_dropped_too_short;
315 u32 rx_dropped_header_too_small;
316 u32 rx_dropped_tcp_length;
318 u32 rx_ip_checksum_errs;
319 u32 rx_tcp_checksum_errs;
320 u32 rx_udp_checksum_errs;
322 u32 tx_priority_pauseframes;
323 u32 tx_controlframes;
324 u32 rxpp_fifo_overflow_drop;
325 u32 rx_input_fifo_overflow_drop;
326 u32 pmem_fifo_overflow_drop;
328 u32 rx_roce_bytes_lsd;
329 u32 rx_roce_bytes_msd;
331 u32 roce_drops_payload_len;
336 unsigned char mac_addr[ETH_ALEN];
349 #define BE_FLAGS_LINK_STATUS_INIT 1
350 #define BE_FLAGS_WORKER_SCHEDULED (1 << 3)
351 #define BE_FLAGS_VLAN_PROMISC (1 << 4)
352 #define BE_FLAGS_NAPI_ENABLED (1 << 9)
353 #define BE_UC_PMAC_COUNT 30
354 #define BE_VF_UC_PMAC_COUNT 2
355 #define BE_FLAGS_QNQ_ASYNC_EVT_RCVD (1 << 11)
357 /* Ethtool set_dump flags */
358 #define LANCER_INITIATE_FW_DUMP 0x1
368 u16 auto_speeds_supported;
369 u16 fixed_speeds_supported;
376 struct be_resources {
377 u16 max_vfs; /* Total VFs "really" supported by FW/HW */
382 u16 max_uc_mac; /* Max UC MACs programmable */
383 u16 max_vlans; /* Number of vlans supported */
389 struct pci_dev *pdev;
390 struct net_device *netdev;
392 u8 __iomem *csr; /* CSR BAR used only for BE2/3 */
393 u8 __iomem *db; /* Door Bell */
395 struct mutex mbox_lock; /* For serializing mbox cmds to BE card */
396 struct be_dma_mem mbox_mem;
397 /* Mbox mem is adjusted to align to 16 bytes. The allocated addr
398 * is stored for freeing purpose */
399 struct be_dma_mem mbox_mem_alloced;
401 struct be_mcc_obj mcc_obj;
402 spinlock_t mcc_lock; /* For serializing mcc cmds to BE card */
403 spinlock_t mcc_cq_lock;
405 u16 cfg_num_qs; /* configured via set-channels */
408 struct be_eq_obj eq_obj[MAX_EVT_QS];
409 struct msix_entry msix_entries[MAX_MSIX_VECTORS];
414 struct be_tx_obj tx_obj[MAX_TX_QS];
418 struct be_rx_obj rx_obj[MAX_RX_QS];
419 u32 big_page_size; /* Compounded page size shared by rx wrbs */
421 struct be_drv_stats drv_stats;
422 struct be_aic_obj aic_obj[MAX_EVT_QS];
424 u8 vlan_tag[VLAN_N_VID];
425 u8 vlan_prio_bmap; /* Available Priority BitMap */
426 u16 recommended_prio; /* Recommended Priority */
427 struct be_dma_mem rx_filter; /* Cmd DMA mem for rx-filter */
429 struct be_dma_mem stats_cmd;
430 /* Work queue used to perform periodic tasks like getting statistics */
431 struct delayed_work work;
434 struct delayed_work func_recovery_work;
437 /* Ethtool knobs and info */
438 char fw_ver[FW_VER_LEN];
439 char fw_on_flash[FW_VER_LEN];
440 int if_handle; /* Used to configure filtering */
441 u32 *pmac_id; /* MAC addr handle used by BE card */
442 u32 beacon_state; /* for set_phys_id */
452 u32 rx_fc; /* Rx flow control */
453 u32 tx_fc; /* Tx flow control */
461 u32 num_msix_roce_vec;
462 struct ocrdma_dev *ocrdma_dev;
463 struct list_head entry;
466 struct completion flash_compl;
468 struct be_resources res; /* resources available for the func */
469 u16 num_vfs; /* Number of VFs provisioned by PF */
471 struct be_vf_cfg *vf_cfg;
479 u32 uc_macs; /* Count of secondary UC MAC programmed */
483 int be_get_temp_freq;
/*
 * SR-IOV helpers.  The adapter argument is parenthesized so that any pointer
 * expression (e.g. &obj or a conditional) can be passed safely; without the
 * parentheses be_physfn(&obj) would expand to !&obj->virtfn.
 */

/* True when the adapter's virtfn flag is clear */
#define be_physfn(adapter)		(!(adapter)->virtfn)

/* True when the adapter's num_vfs count is non-zero */
#define sriov_enabled(adapter)		((adapter)->num_vfs > 0)

/*
 * True on a physical function when either the bare identifier num_vfs (not an
 * adapter member; it must be visible at the point of use) is non-zero or
 * pci_num_vf() reports VFs for the device.
 */
#define sriov_want(adapter)		(be_physfn(adapter) &&	\
				 (num_vfs || pci_num_vf((adapter)->pdev)))
492 #define for_all_vfs(adapter, vf_cfg, i) \
493 for (i = 0, vf_cfg = &adapter->vf_cfg[i]; i < adapter->num_vfs; \
/*
 * Accessors for the per-function resource limits held in adapter->res.
 * The argument is parenthesized so that expressions such as &obj expand
 * correctly; each accessor still yields an lvalue.
 */
#define be_max_vlans(adapter)		((adapter)->res.max_vlans)
#define be_max_uc(adapter)		((adapter)->res.max_uc_mac)
#define be_max_mc(adapter)		((adapter)->res.max_mcast_mac)
#define be_max_vfs(adapter)		((adapter)->res.max_vfs)
#define be_max_rss(adapter)		((adapter)->res.max_rss_qs)
#define be_max_txqs(adapter)		((adapter)->res.max_tx_qs)
#define be_max_prio_txqs(adapter)	((adapter)->res.max_prio_tx_qs)
#define be_max_rxqs(adapter)		((adapter)->res.max_rx_qs)
#define be_max_eqs(adapter)		((adapter)->res.max_evt_qs)
#define be_if_cap_flags(adapter)	((adapter)->res.if_cap_flags)
510 static inline u16 be_max_qs(struct be_adapter *adapter)
512 /* If no RSS, need atleast the one def RXQ */
513 u16 num = max_t(u16, be_max_rss(adapter), 1);
515 num = min(num, be_max_eqs(adapter));
516 return min_t(u16, num, num_online_cpus());
/*
 * Chip-family predicates, decided purely from the PCI device id.
 * The adapter argument is parenthesized so any pointer expression may be
 * passed; note that it is still evaluated more than once.
 */

/* Device id is OC_DEVICE_ID3 or OC_DEVICE_ID4 */
#define lancer_chip(adapter)	((adapter)->pdev->device == OC_DEVICE_ID3 || \
				 (adapter)->pdev->device == OC_DEVICE_ID4)

/* Device id is OC_DEVICE_ID5 or OC_DEVICE_ID6 */
#define skyhawk_chip(adapter)	((adapter)->pdev->device == OC_DEVICE_ID5 || \
				 (adapter)->pdev->device == OC_DEVICE_ID6)

/* Device id is BE_DEVICE_ID2 or OC_DEVICE_ID2 */
#define BE3_chip(adapter)	((adapter)->pdev->device == BE_DEVICE_ID2 || \
				 (adapter)->pdev->device == OC_DEVICE_ID2)

/* Device id is BE_DEVICE_ID1 or OC_DEVICE_ID1 */
#define BE2_chip(adapter)	((adapter)->pdev->device == BE_DEVICE_ID1 || \
				 (adapter)->pdev->device == OC_DEVICE_ID1)

/* Either of the two BE generations */
#define BEx_chip(adapter)	(BE3_chip(adapter) || BE2_chip(adapter))

/* Skyhawk device whose function_mode has the RDMA_ENABLED bit set */
#define be_roce_supported(adapter)	(skyhawk_chip(adapter) && \
		((adapter)->function_mode & RDMA_ENABLED))
536 extern const struct ethtool_ops be_ethtool_ops;
/*
 * Interrupt and per-queue helpers.  Arguments are parenthesized so that
 * expressions such as &obj expand with the intended precedence.
 */

/* True when at least one MSI-X vector is recorded in num_msix_vec */
#define msix_enabled(adapter)		((adapter)->num_msix_vec > 0)
/* num_msix_vec when MSI-X is enabled, otherwise 1 */
#define num_irqs(adapter)		(msix_enabled(adapter) ?	\
						(adapter)->num_msix_vec : 1)
/* Pointer to the stats member embedded in a TX / RX object */
#define tx_stats(txo)			(&(txo)->stats)
#define rx_stats(rxo)			(&(rxo)->stats)

/* The default RXQ is the last RXQ */
#define default_rxo(adpt)		(&(adpt)->rx_obj[(adpt)->num_rx_qs - 1])
547 #define for_all_rx_queues(adapter, rxo, i) \
548 for (i = 0, rxo = &adapter->rx_obj[i]; i < adapter->num_rx_qs; \
551 /* Skip the default non-rss queue (last one)*/
552 #define for_all_rss_queues(adapter, rxo, i) \
553 for (i = 0, rxo = &adapter->rx_obj[i]; i < (adapter->num_rx_qs - 1);\
556 #define for_all_tx_queues(adapter, txo, i) \
557 for (i = 0, txo = &adapter->tx_obj[i]; i < adapter->num_tx_qs; \
560 #define for_all_evt_queues(adapter, eqo, i) \
561 for (i = 0, eqo = &adapter->eq_obj[i]; i < adapter->num_evt_qs; \
/*
 * The event queue object at array index 0 is the one associated with MCC.
 * Arguments are parenthesized so pointer expressions expand correctly.
 */
#define is_mcc_eqo(eqo)			((eqo)->idx == 0)
#define mcc_eqo(adapter)		(&(adapter)->eq_obj[0])
/* Fixed 4K page geometry, independent of the kernel's own page size */
#define PAGE_SHIFT_4K		12
#define PAGE_SIZE_4K		(1 << PAGE_SHIFT_4K)

/*
 * Number of 4K pages touched by a buffer of 'size' bytes that begins at
 * '_address': the offset of the start within its page is added to the
 * length, and the sum is rounded up to whole pages.
 */
#define PAGES_4K_SPANNED(_address, size)				\
	((u32)((((size_t)(_address) % PAGE_SIZE_4K) +			\
		(size) + (PAGE_SIZE_4K - 1)) >> PAGE_SHIFT_4K))
/*
 * Returns bit offset within a DWORD of a bitfield.
 *
 * The value is the member's offset within _struct, modulo 32.  offsetof()
 * replaces the open-coded "address of a member of a null pointer" idiom;
 * it yields the same size_t value without dereferencing a null pointer.
 */
#define AMAP_BIT_OFFSET(_struct, field)					\
		(offsetof(_struct, field) % 32)
579 /* Returns the bit mask of the field that is NOT shifted into location. */
580 static inline u32 amap_mask(u32 bitsize)
582 return (bitsize == 32 ? 0xFFFFFFFF : (1 << bitsize) - 1);
/*
 * Write 'value' into a field of the 32-bit word at ptr + dw_offset words.
 * The field is 'mask' wide (unshifted) and starts 'offset' bits up.
 * NOTE(review): the return-type line of this definition is not visible in
 * this excerpt.
 */
586 amap_set(void *ptr, u32 dw_offset, u32 mask, u32 offset, u32 value)
588 u32 *dw = (u32 *) ptr + dw_offset;
/* Clear the field first so stale bits cannot survive the OR below */
589 *dw &= ~(mask << offset);
/* value is truncated to the field width before being shifted into place */
590 *dw |= (mask & value) << offset;
593 #define AMAP_SET_BITS(_struct, field, ptr, val) \
595 offsetof(_struct, field)/32, \
596 amap_mask(sizeof(((_struct *)0)->field)), \
597 AMAP_BIT_OFFSET(_struct, field), \
600 static inline u32 amap_get(void *ptr, u32 dw_offset, u32 mask, u32 offset)
602 u32 *dw = (u32 *) ptr;
603 return mask & (*(dw + dw_offset) >> offset);
606 #define AMAP_GET_BITS(_struct, field, ptr) \
608 offsetof(_struct, field)/32, \
609 amap_mask(sizeof(((_struct *)0)->field)), \
610 AMAP_BIT_OFFSET(_struct, field))
612 #define be_dws_cpu_to_le(wrb, len) swap_dws(wrb, len)
613 #define be_dws_le_to_cpu(wrb, len) swap_dws(wrb, len)
614 static inline void swap_dws(void *wrb, int len)
620 *dw = cpu_to_le32(*dw);
624 #endif /* __BIG_ENDIAN */
/*
 * Decide whether skb carries TCP by looking at the IP header reached through
 * ip_hdr()/ipv6_hdr().
 * NOTE(review): the declaration of 'val' and the return statement are not
 * visible in this excerpt; presumably val starts at 0 and is returned.
 */
627 static inline u8 is_tcp_pkt(struct sk_buff *skb)
/* The version nibble is read through ip_hdr() for both IPv4 and IPv6 */
631 if (ip_hdr(skb)->version == 4)
632 val = (ip_hdr(skb)->protocol == IPPROTO_TCP);
633 else if (ip_hdr(skb)->version == 6)
/* Only the first next-header value is compared; no extension headers are walked */
634 val = (ipv6_hdr(skb)->nexthdr == NEXTHDR_TCP);
/*
 * Decide whether skb carries UDP by looking at the IP header reached through
 * ip_hdr()/ipv6_hdr().
 * NOTE(review): the declaration of 'val' and the return statement are not
 * visible in this excerpt; presumably val starts at 0 and is returned.
 */
639 static inline u8 is_udp_pkt(struct sk_buff *skb)
/* The version nibble is read through ip_hdr() for both IPv4 and IPv6 */
643 if (ip_hdr(skb)->version == 4)
644 val = (ip_hdr(skb)->protocol == IPPROTO_UDP);
645 else if (ip_hdr(skb)->version == 6)
/* Only the first next-header value is compared; no extension headers are walked */
646 val = (ipv6_hdr(skb)->nexthdr == NEXTHDR_UDP);
651 static inline bool is_ipv4_pkt(struct sk_buff *skb)
653 return skb->protocol == htons(ETH_P_IP) && ip_hdr(skb)->version == 4;
/*
 * Fill 'mac' with an address derived from the adapter's current netdev
 * address: the first three bytes are copied from it and the last three come
 * from a jhash of it.
 * NOTE(review): the declaration of 'addr' is not visible in this excerpt.
 */
656 static inline void be_vf_eth_addr_generate(struct be_adapter *adapter, u8 *mac)
/* Hash all ETH_ALEN bytes of the current address with an initial value of 0 */
660 addr = jhash(adapter->netdev->dev_addr, ETH_ALEN, 0);
/* The low three bytes of the hash become mac[5], mac[4] and mac[3] */
662 mac[5] = (u8)(addr & 0xFF);
663 mac[4] = (u8)((addr >> 8) & 0xFF);
664 mac[3] = (u8)((addr >> 16) & 0xFF);
665 /* Use the OUI from the current MAC address */
666 memcpy(mac, adapter->netdev->dev_addr, 3);
669 static inline bool be_multi_rxq(const struct be_adapter *adapter)
671 return adapter->num_rx_qs > 1;
674 static inline bool be_error(struct be_adapter *adapter)
676 return adapter->eeh_error || adapter->hw_error || adapter->fw_timeout;
679 static inline bool be_hw_error(struct be_adapter *adapter)
681 return adapter->eeh_error || adapter->hw_error;
684 static inline void be_clear_all_error(struct be_adapter *adapter)
686 adapter->eeh_error = false;
687 adapter->hw_error = false;
688 adapter->fw_timeout = false;
/*
 * Decide whether this adapter is excluded from Wake-on-LAN, based on whether
 * it is a physical function and on its PCI subsystem device id.
 * NOTE(review): the return statements are not visible in this excerpt, so
 * the result of each branch cannot be confirmed from here.
 */
691 static inline bool be_is_wol_excluded(struct be_adapter *adapter)
693 struct pci_dev *pdev = adapter->pdev;
/* Functions that are not physical functions take a separate path */
695 if (!be_physfn(adapter))
/* The four listed subsystem ids are handled as a single group */
698 switch (pdev->subsystem_device) {
699 case OC_SUBSYS_DEVICE_ID1:
700 case OC_SUBSYS_DEVICE_ID2:
701 case OC_SUBSYS_DEVICE_ID3:
702 case OC_SUBSYS_DEVICE_ID4:
709 static inline int qnq_async_evt_rcvd(struct be_adapter *adapter)
711 return adapter->flags & BE_FLAGS_QNQ_ASYNC_EVT_RCVD;
714 void be_cq_notify(struct be_adapter *adapter, u16 qid, bool arm,
716 void be_link_status_update(struct be_adapter *adapter, u8 link_status);
717 void be_parse_stats(struct be_adapter *adapter);
718 int be_load_fw(struct be_adapter *adapter, u8 *func);
719 bool be_is_wol_supported(struct be_adapter *adapter);
720 bool be_pause_supported(struct be_adapter *adapter);
721 u32 be_get_fw_log_level(struct be_adapter *adapter);
722 int be_update_queues(struct be_adapter *adapter);
723 int be_poll(struct napi_struct *napi, int budget);
726 * internal function to initialize-cleanup roce device.
728 void be_roce_dev_add(struct be_adapter *);
729 void be_roce_dev_remove(struct be_adapter *);
732 * internal function to open-close roce device during ifup-ifdown.
734 void be_roce_dev_open(struct be_adapter *);
735 void be_roce_dev_close(struct be_adapter *);