2 * Copyright (C) 2005 - 2014 Emulex
5 * This program is free software; you can redistribute it and/or
6 * modify it under the terms of the GNU General Public License version 2
7 * as published by the Free Software Foundation. The full GNU General
8 * Public License is included in this distribution in the file called COPYING.
10 * Contact Information:
11 * linux-drivers@emulex.com
15 * Costa Mesa, CA 92626
21 #include <linux/pci.h>
22 #include <linux/etherdevice.h>
23 #include <linux/delay.h>
27 #include <linux/if_vlan.h>
28 #include <linux/workqueue.h>
29 #include <linux/interrupt.h>
30 #include <linux/firmware.h>
31 #include <linux/slab.h>
32 #include <linux/u64_stats_sync.h>
/*
 * Driver identity strings: version, driver name, description and adapter
 * names. The OC_NAME_* variants are built by string-literal concatenation
 * with OC_NAME, so they expand to e.g. "Emulex OneConnect(be3)" (no space
 * before the parenthesis).
 */
37 #define DRV_VER "10.4u"
38 #define DRV_NAME "be2net"
39 #define BE_NAME "Emulex BladeEngine2"
40 #define BE3_NAME "Emulex BladeEngine3"
41 #define OC_NAME "Emulex OneConnect"
42 #define OC_NAME_BE OC_NAME "(be3)"
43 #define OC_NAME_LANCER OC_NAME "(Lancer)"
44 #define OC_NAME_SH OC_NAME "(Skyhawk)"
45 #define DRV_DESC "Emulex OneConnect NIC Driver"
/*
 * Vendor, device and subsystem-device IDs. The device IDs are compared
 * against adapter->pdev->device by the *_chip() macros in this file.
 */
47 #define BE_VENDOR_ID 0x19a2
48 #define EMULEX_VENDOR_ID 0x10df
49 #define BE_DEVICE_ID1 0x211 /* matched by BE2_chip() */
50 #define BE_DEVICE_ID2 0x221 /* matched by BE3_chip() */
51 #define OC_DEVICE_ID1 0x700 /* Device Id for BE2 cards */
52 #define OC_DEVICE_ID2 0x710 /* Device Id for BE3 cards */
53 #define OC_DEVICE_ID3 0xe220 /* Device id for Lancer cards */
54 #define OC_DEVICE_ID4 0xe228 /* Device id for VF in Lancer */
55 #define OC_DEVICE_ID5 0x720 /* Device Id for Skyhawk cards */
56 #define OC_DEVICE_ID6 0x728 /* Device id for VF in SkyHawk */
/* NOTE(review): users of the subsystem IDs are not visible in this file */
57 #define OC_SUBSYS_DEVICE_ID1 0xE602
58 #define OC_SUBSYS_DEVICE_ID2 0xE642
59 #define OC_SUBSYS_DEVICE_ID3 0xE612
60 #define OC_SUBSYS_DEVICE_ID4 0xE652
62 /* Number of bytes of an RX frame that are copied to skb->data */
63 #define BE_HDR_LEN ((u16) 64)
64 /* Allocate extra space (64 bytes beyond BE_HDR_LEN, i.e. 128 in total) to allow tunneling decapsulation without head reallocation */
65 #define BE_RX_SKB_ALLOC_SIZE (BE_HDR_LEN + 64)
/* Largest supported frame size in bytes */
67 #define BE_MAX_JUMBO_FRAME_SIZE 9018
68 #define BE_MIN_MTU 256
/* Largest MTU: the jumbo frame size minus the Ethernet header and FCS */
69 #define BE_MAX_MTU (BE_MAX_JUMBO_FRAME_SIZE - \
70 (ETH_HLEN + ETH_FCS_LEN))
/* Fixed driver limits */
72 #define BE_NUM_VLANS_SUPPORTED 64
/* NOTE(review): presumably the upper bound for the *_eqd values, which are in usecs -- confirm */
73 #define BE_MAX_EQD 128u
74 #define BE_MAX_TX_FRAG_COUNT 30
/*
 * Queue lengths. RX_Q_LEN also sizes the per-entry page_info_tbl[] array
 * declared in this file. Queue lengths must be powers of two for the
 * MODULO()-based index helpers.
 */
76 #define EVNT_Q_LEN 1024
78 #define TX_CQ_LEN 1024
79 #define RX_Q_LEN 1024 /* Does not support any other value */
80 #define RX_CQ_LEN 1024
81 #define MCC_Q_LEN 128 /* total size not to exceed 8 pages */
82 #define MCC_CQ_LEN 256
/* Per-chip queue-count limits */
84 #define BE2_MAX_RSS_QS 4
85 #define BE3_MAX_RSS_QS 16
86 #define BE3_MAX_TX_QS 16
87 #define BE3_MAX_EVT_QS 16
88 #define BE3_SRIOV_MAX_EVT_QS 8
94 #define MAX_ROCE_EQS 5
/* MAX_MSIX_VECTORS sizes the msix_entries[] array declared in this file */
95 #define MAX_MSIX_VECTORS 32
96 #define MIN_MSIX_VECTORS 1
97 #define BE_NAPI_WEIGHT 64
98 #define MAX_RX_POST BE_NAPI_WEIGHT /* Frags posted at a time */
/* Evaluates to RX_Q_LEN - MAX_RX_POST = 960; NOTE(review): the name suggests a refill watermark, the user is not visible here */
99 #define RX_FRAGS_REFILL_WM (RX_Q_LEN - MAX_RX_POST)
101 #define MAX_VFS 30 /* Max VFs supported by BE3 FW */
/* Size of the fw_ver[] and fw_on_flash[] buffers */
102 #define FW_VER_LEN 32
/* Sizes of the rsstable[]/rss_queue[] and rss_hkey[] arrays respectively */
104 #define RSS_INDIR_TABLE_LEN 128
105 #define RSS_HASH_KEY_LEN 40
113 struct be_queue_info {
114 struct be_dma_mem dma_mem;
116 u16 entry_size; /* Size of an element in the queue */
120 atomic_t used; /* Number of valid elements in the queue */
/*
 * Wrap @val into the range [0, @limit) for a power-of-two @limit by
 * masking with (limit - 1). BUG_ON() fires when @limit has more than one
 * bit set; note that a @limit of 0 passes that check.
 */
123 static inline u32 MODULO(u16 val, u16 limit)
125 BUG_ON(limit & (limit - 1));
126 return val & (limit - 1);
/*
 * Advance *@index by @val entries, wrapping at @limit (must be a power of
 * two, see MODULO()). The sum is truncated to u16 when passed to MODULO().
 */
129 static inline void index_adv(u16 *index, u16 val, u16 limit)
131 *index = MODULO((*index + val), limit);
/* Advance *@index by one entry, wrapping to 0 at @limit (a power of two). */
134 static inline void index_inc(u16 *index, u16 limit)
136 *index = MODULO((*index + 1), limit);
/*
 * Return the address of the entry at the queue's head index:
 * q->dma_mem.va + head * entry_size.
 */
139 static inline void *queue_head_node(struct be_queue_info *q)
141 return q->dma_mem.va + q->head * q->entry_size;
/*
 * Return the address of the entry at the queue's tail index:
 * q->dma_mem.va + tail * entry_size.
 */
144 static inline void *queue_tail_node(struct be_queue_info *q)
146 return q->dma_mem.va + q->tail * q->entry_size;
/*
 * Return the address of entry number @index in the queue:
 * q->dma_mem.va + index * entry_size. @index is not range-checked here.
 */
149 static inline void *queue_index_node(struct be_queue_info *q, u16 index)
151 return q->dma_mem.va + index * q->entry_size;
/* Move the queue's head index forward by one entry, wrapping at q->len. */
154 static inline void queue_head_inc(struct be_queue_info *q)
156 index_inc(&q->head, q->len);
/*
 * Step *@index back by one entry, wrapping at @limit (a power of two).
 * For *@index == 0 the int value -1 converts to 0xFFFF in MODULO()'s u16
 * parameter and is masked to limit - 1.
 */
159 static inline void index_dec(u16 *index, u16 limit)
161 *index = MODULO((*index - 1), limit);
/* Move the queue's tail index forward by one entry, wrapping at q->len. */
164 static inline void queue_tail_inc(struct be_queue_info *q)
166 index_inc(&q->tail, q->len);
170 struct be_queue_info q;
173 /* Adaptive interrupt coalescing (AIC) info */
175 u32 min_eqd; /* in usecs */
176 u32 max_eqd; /* in usecs */
177 u32 eqd; /* configured val when aic is off */
178 u32 cur_eqd; /* in usecs */
180 u8 idx; /* array index */
183 struct napi_struct napi;
184 struct be_adapter *adapter;
186 #ifdef CONFIG_NET_RX_BUSY_POLL
188 #define BE_EQ_NAPI 1 /* napi owns this EQ */
189 #define BE_EQ_POLL 2 /* poll owns this EQ */
190 #define BE_EQ_LOCKED (BE_EQ_NAPI | BE_EQ_POLL)
191 #define BE_EQ_NAPI_YIELD 4 /* napi yielded this EQ */
192 #define BE_EQ_POLL_YIELD 8 /* poll yielded this EQ */
193 #define BE_EQ_YIELD (BE_EQ_NAPI_YIELD | BE_EQ_POLL_YIELD)
194 #define BE_EQ_USER_PEND (BE_EQ_POLL | BE_EQ_POLL_YIELD)
196 spinlock_t lock; /* lock to serialize napi and busy-poll */
197 #endif /* CONFIG_NET_RX_BUSY_POLL */
198 } ____cacheline_aligned_in_smp;
200 struct be_aic_obj { /* Adaptive interrupt coalescing (AIC) info */
202 u32 min_eqd; /* in usecs */
203 u32 max_eqd; /* in usecs */
204 u32 prev_eqd; /* in usecs */
205 u32 et_eqd; /* configured val when aic is off */
207 u64 rx_pkts_prev; /* Used to calculate RX pps */
208 u64 tx_reqs_prev; /* Used to calculate TX pps */
217 struct be_queue_info q;
218 struct be_queue_info cq;
229 u32 tx_drv_drops; /* pkts dropped by driver */
230 /* the error counters are described in be_ethtool.c */
231 u32 tx_hdr_parse_err;
234 u32 tx_spoof_check_err;
236 u32 tx_internal_parity_err;
237 struct u64_stats_sync sync;
238 struct u64_stats_sync sync_compl;
243 struct be_queue_info q;
244 struct be_queue_info cq;
245 /* Remember the skbs that were transmitted */
246 struct sk_buff *sent_skb_list[TX_Q_LEN];
247 struct be_tx_stats stats;
248 u16 pend_wrb_cnt; /* Number of WRBs yet to be given to HW */
249 u16 last_req_wrb_cnt; /* wrb cnt of the last req in the Q */
250 u16 last_req_hdr; /* index of the last req's hdr-wrb */
251 } ____cacheline_aligned_in_smp;
253 /* Struct to remember the pages posted for rx frags */
254 struct be_rx_page_info {
256 /* set to page-addr for last frag of the page & frag-addr otherwise */
257 DEFINE_DMA_UNMAP_ADDR(bus);
259 bool last_frag; /* last frag of the page */
265 u32 rx_drops_no_skbs; /* skb allocation errors */
266 u32 rx_drops_no_frags; /* HW has no fetched frags */
267 u32 rx_post_fail; /* page post alloc failures */
270 u32 rx_compl_err; /* completions with err set */
271 struct u64_stats_sync sync;
274 struct be_rx_compl_info {
295 struct be_adapter *adapter;
296 struct be_queue_info q;
297 struct be_queue_info cq;
298 struct be_rx_compl_info rxcp;
299 struct be_rx_page_info page_info_tbl[RX_Q_LEN];
300 struct be_rx_stats stats;
302 bool rx_post_starved; /* Zero rx frags have been posted to BE */
303 } ____cacheline_aligned_in_smp;
305 struct be_drv_stats {
306 u32 be_on_die_temperature;
309 u32 rx_drops_no_pbuf;
310 u32 rx_drops_no_txpb;
311 u32 rx_drops_no_erx_descr;
312 u32 rx_drops_no_tpre_descr;
313 u32 rx_drops_too_many_frags;
314 u32 forwarded_packets;
317 u32 rx_alignment_symbol_errors;
319 u32 rx_priority_pause_frames;
320 u32 rx_control_frames;
321 u32 rx_in_range_errors;
322 u32 rx_out_range_errors;
323 u32 rx_frame_too_long;
324 u32 rx_address_filtered;
325 u32 rx_dropped_too_small;
326 u32 rx_dropped_too_short;
327 u32 rx_dropped_header_too_small;
328 u32 rx_dropped_tcp_length;
330 u32 rx_ip_checksum_errs;
331 u32 rx_tcp_checksum_errs;
332 u32 rx_udp_checksum_errs;
334 u32 tx_priority_pauseframes;
335 u32 tx_controlframes;
336 u32 rxpp_fifo_overflow_drop;
337 u32 rx_input_fifo_overflow_drop;
338 u32 pmem_fifo_overflow_drop;
340 u32 rx_roce_bytes_lsd;
341 u32 rx_roce_bytes_msd;
343 u32 roce_drops_payload_len;
347 /* A vlan-id of 0xFFFF must be used to clear transparent vlan-tagging */
348 #define BE_RESET_VLAN_TAG_ID 0xFFFF
351 unsigned char mac_addr[ETH_ALEN];
/*
 * Single-bit flag values. sriov_enabled() in this file tests
 * BE_FLAGS_SRIOV_ENABLED against adapter->flags, so these are presumably
 * all bits of that field -- confirm for the others. Bit 0 is not defined
 * in the lines visible here.
 */
364 #define BE_FLAGS_LINK_STATUS_INIT BIT(1)
365 #define BE_FLAGS_SRIOV_ENABLED BIT(2)
366 #define BE_FLAGS_WORKER_SCHEDULED BIT(3)
367 #define BE_FLAGS_VLAN_PROMISC BIT(4)
368 #define BE_FLAGS_MCAST_PROMISC BIT(5)
369 #define BE_FLAGS_NAPI_ENABLED BIT(6)
370 #define BE_FLAGS_QNQ_ASYNC_EVT_RCVD BIT(7)
371 #define BE_FLAGS_VXLAN_OFFLOADS BIT(8)
372 #define BE_FLAGS_SETUP_DONE BIT(9)
374 #define BE_UC_PMAC_COUNT 30
375 #define BE_VF_UC_PMAC_COUNT 2
377 /* Ethtool set_dump flags */
378 #define LANCER_INITIATE_FW_DUMP 0x1
379 #define LANCER_DELETE_FW_DUMP 0x2
389 u16 auto_speeds_supported;
390 u16 fixed_speeds_supported;
397 struct be_resources {
398 u16 max_vfs; /* Total VFs "really" supported by FW/HW */
403 u16 max_uc_mac; /* Max UC MACs programmable */
404 u16 max_vlans; /* Number of vlans supported */
407 u32 vf_if_cap_flags; /* VF if capability flags */
412 u8 rsstable[RSS_INDIR_TABLE_LEN];
413 u8 rss_queue[RSS_INDIR_TABLE_LEN];
414 u8 rss_hkey[RSS_HASH_KEY_LEN];
418 struct pci_dev *pdev;
419 struct net_device *netdev;
421 u8 __iomem *csr; /* CSR BAR used only for BE2/3 */
422 u8 __iomem *db; /* Door Bell */
424 struct mutex mbox_lock; /* For serializing mbox cmds to BE card */
425 struct be_dma_mem mbox_mem;
426 /* Mbox mem is adjusted to align to 16 bytes. The allocated addr
427 * is stored for freeing purpose */
428 struct be_dma_mem mbox_mem_alloced;
430 struct be_mcc_obj mcc_obj;
431 spinlock_t mcc_lock; /* For serializing mcc cmds to BE card */
432 spinlock_t mcc_cq_lock;
434 u16 cfg_num_qs; /* configured via set-channels */
437 struct be_eq_obj eq_obj[MAX_EVT_QS];
438 struct msix_entry msix_entries[MAX_MSIX_VECTORS];
443 struct be_tx_obj tx_obj[MAX_TX_QS];
447 struct be_rx_obj rx_obj[MAX_RX_QS];
448 u32 big_page_size; /* Compounded page size shared by rx wrbs */
450 struct be_drv_stats drv_stats;
451 struct be_aic_obj aic_obj[MAX_EVT_QS];
453 unsigned long vids[BITS_TO_LONGS(VLAN_N_VID)];
454 u8 vlan_prio_bmap; /* Available Priority BitMap */
455 u16 recommended_prio; /* Recommended Priority */
456 struct be_dma_mem rx_filter; /* Cmd DMA mem for rx-filter */
458 struct be_dma_mem stats_cmd;
459 /* Work queue used to perform periodic tasks like getting statistics */
460 struct delayed_work work;
463 struct delayed_work func_recovery_work;
466 /* Ethtool knobs and info */
467 char fw_ver[FW_VER_LEN];
468 char fw_on_flash[FW_VER_LEN];
469 int if_handle; /* Used to configure filtering */
470 u32 *pmac_id; /* MAC addr handle used by BE card */
471 u32 beacon_state; /* for set_phys_id */
482 u32 rx_fc; /* Rx flow control */
483 u32 tx_fc; /* Tx flow control */
490 u32 num_msix_roce_vec;
491 struct ocrdma_dev *ocrdma_dev;
492 struct list_head entry;
495 struct completion et_cmd_compl;
497 struct be_resources pool_res; /* resources available for the port */
498 struct be_resources res; /* resources available for the func */
499 u16 num_vfs; /* Number of VFs provisioned by PF */
501 struct be_vf_cfg *vf_cfg;
507 int vxlan_port_count;
511 u32 uc_macs; /* Count of secondary UC MAC programmed */
515 int be_get_temp_freq;
517 struct rss_info rss_info;
/*
 * be_virtfn() is non-zero when adapter->virtfn is set; be_physfn() is its
 * logical negation. The argument is parenthesized so that any pointer
 * expression (e.g. &obj) can be passed, not just a plain identifier.
 */
#define be_physfn(adapter)	(!(adapter)->virtfn)
#define be_virtfn(adapter)	((adapter)->virtfn)
/*
 * Non-zero when BE_FLAGS_SRIOV_ENABLED is set in adapter->flags.
 * The argument is parenthesized so any pointer expression can be passed.
 */
#define sriov_enabled(adapter)	((adapter)->flags & BE_FLAGS_SRIOV_ENABLED)
525 #define for_all_vfs(adapter, vf_cfg, i) \
526 for (i = 0, vf_cfg = &adapter->vf_cfg[i]; i < adapter->num_vfs; \
/*
 * Accessors for the resource limits stored in the adapter. All of them read
 * adapter->res except be_max_vfs(), which reads adapter->pool_res.
 * The argument is parenthesized so any pointer expression can be passed.
 */
#define be_max_vlans(adapter)		((adapter)->res.max_vlans)
#define be_max_uc(adapter)		((adapter)->res.max_uc_mac)
#define be_max_mc(adapter)		((adapter)->res.max_mcast_mac)
#define be_max_vfs(adapter)		((adapter)->pool_res.max_vfs)
#define be_max_rss(adapter)		((adapter)->res.max_rss_qs)
#define be_max_txqs(adapter)		((adapter)->res.max_tx_qs)
#define be_max_prio_txqs(adapter)	((adapter)->res.max_prio_tx_qs)
#define be_max_rxqs(adapter)		((adapter)->res.max_rx_qs)
#define be_max_eqs(adapter)		((adapter)->res.max_evt_qs)
#define be_if_cap_flags(adapter)	((adapter)->res.if_cap_flags)
/*
 * Upper bound on the number of queues usable by this function:
 * the smallest of max(be_max_rss(adapter), 1), be_max_eqs(adapter) and the
 * number of online CPUs, returned as u16.
 */
543 static inline u16 be_max_qs(struct be_adapter *adapter)
545 /* If no RSS, need at least the one default RXQ */
546 u16 num = max_t(u16, be_max_rss(adapter), 1);
548 num = min(num, be_max_eqs(adapter));
549 return min_t(u16, num, num_online_cpus());
/* Is BE in pvid_tagging mode: non-zero when adapter->pvid is non-zero */
#define be_pvid_tagging_enabled(adapter)	((adapter)->pvid)

/*
 * Is BE in QNQ multi-channel mode: non-zero when QNQ_MODE is set in
 * adapter->function_mode. Arguments are parenthesized so any pointer
 * expression can be passed.
 */
#define be_is_qnq_mode(adapter)		((adapter)->function_mode & QNQ_MODE)
/*
 * Chip-family predicates, decided purely from adapter->pdev->device:
 *   lancer_chip  - OC_DEVICE_ID3 or OC_DEVICE_ID4
 *   skyhawk_chip - OC_DEVICE_ID5 or OC_DEVICE_ID6
 *   BE3_chip     - BE_DEVICE_ID2 or OC_DEVICE_ID2
 *   BE2_chip     - BE_DEVICE_ID1 or OC_DEVICE_ID1
 *   BEx_chip     - BE3_chip or BE2_chip
 * The argument is parenthesized so any pointer expression can be passed;
 * it is evaluated more than once, so it must be free of side effects.
 */
#define lancer_chip(adapter)	((adapter)->pdev->device == OC_DEVICE_ID3 || \
				 (adapter)->pdev->device == OC_DEVICE_ID4)

#define skyhawk_chip(adapter)	((adapter)->pdev->device == OC_DEVICE_ID5 || \
				 (adapter)->pdev->device == OC_DEVICE_ID6)

#define BE3_chip(adapter)	((adapter)->pdev->device == BE_DEVICE_ID2 || \
				 (adapter)->pdev->device == OC_DEVICE_ID2)

#define BE2_chip(adapter)	((adapter)->pdev->device == BE_DEVICE_ID1 || \
				 (adapter)->pdev->device == OC_DEVICE_ID1)

#define BEx_chip(adapter)	(BE3_chip(adapter) || BE2_chip(adapter))

/* RoCE needs a Skyhawk chip with RDMA_ENABLED set in adapter->function_mode */
#define be_roce_supported(adapter)	(skyhawk_chip(adapter) && \
					 ((adapter)->function_mode & RDMA_ENABLED))
575 extern const struct ethtool_ops be_ethtool_ops;
/* True when at least one MSI-X vector is recorded in adapter->num_msix_vec */
#define msix_enabled(adapter)	((adapter)->num_msix_vec > 0)
/* Number of IRQs in use: the MSI-X vector count, or 1 when MSI-X is off */
#define num_irqs(adapter)	(msix_enabled(adapter) ?		\
				 (adapter)->num_msix_vec : 1)
/* Pointers to the stats member embedded in a TX / RX object */
#define tx_stats(txo)		(&(txo)->stats)
#define rx_stats(rxo)		(&(rxo)->stats)
/*
 * The default RXQ is the last RXQ: returns &rx_obj[num_rx_qs - 1].
 * The argument is parenthesized so any pointer expression can be passed;
 * it is evaluated twice.
 */
#define default_rxo(adpt)	(&(adpt)->rx_obj[(adpt)->num_rx_qs - 1])
586 #define for_all_rx_queues(adapter, rxo, i) \
587 for (i = 0, rxo = &adapter->rx_obj[i]; i < adapter->num_rx_qs; \
590 /* Skip the default non-rss queue (last one)*/
591 #define for_all_rss_queues(adapter, rxo, i) \
592 for (i = 0, rxo = &adapter->rx_obj[i]; i < (adapter->num_rx_qs - 1);\
595 #define for_all_tx_queues(adapter, txo, i) \
596 for (i = 0, txo = &adapter->tx_obj[i]; i < adapter->num_tx_qs; \
599 #define for_all_evt_queues(adapter, eqo, i) \
600 for (i = 0, eqo = &adapter->eq_obj[i]; i < adapter->num_evt_qs; \
/*
 * Iterate over the RX objects served by event queue @eqo: starts at index
 * eqo->idx and steps by adapter->num_evt_qs while the index is below
 * adapter->num_rx_qs. @i and @rxo are loop variables supplied by the caller
 * and must be plain lvalues; @adapter and @eqo are parenthesized so any
 * pointer expression can be passed.
 */
#define for_all_rx_queues_on_eq(adapter, eqo, rxo, i)			\
	for (i = (eqo)->idx, rxo = &(adapter)->rx_obj[i];		\
	     i < (adapter)->num_rx_qs;					\
	     i += (adapter)->num_evt_qs, rxo += (adapter)->num_evt_qs)
/*
 * Iterate over the TX objects served by event queue @eqo: starts at index
 * eqo->idx and steps by adapter->num_evt_qs while the index is below
 * adapter->num_tx_qs. @i and @txo are loop variables supplied by the caller
 * and must be plain lvalues; @adapter and @eqo are parenthesized so any
 * pointer expression can be passed.
 */
#define for_all_tx_queues_on_eq(adapter, eqo, txo, i)			\
	for (i = (eqo)->idx, txo = &(adapter)->tx_obj[i];		\
	     i < (adapter)->num_tx_qs;					\
	     i += (adapter)->num_evt_qs, txo += (adapter)->num_evt_qs)
/*
 * The MCC event queue is eq_obj[0]: is_mcc_eqo() tests eqo->idx == 0 and
 * mcc_eqo() returns a pointer to that first entry. Arguments are
 * parenthesized so any pointer expression can be passed.
 */
#define is_mcc_eqo(eqo)		((eqo)->idx == 0)
#define mcc_eqo(adapter)	(&(adapter)->eq_obj[0])
/* 4K page geometry: shift of 12 bits, size 1 << 12 = 4096 bytes */
614 #define PAGE_SHIFT_4K 12
615 #define PAGE_SIZE_4K (1 << PAGE_SHIFT_4K)
617 /* Returns the number of 4K pages spanned by @size bytes of data starting at @_address: (offset within the first page + size), rounded up to whole pages and cast to u32 */
618 #define PAGES_4K_SPANNED(_address, size) \
619 ((u32)((((size_t)(_address) & (PAGE_SIZE_4K - 1)) + \
620 (size) + (PAGE_SIZE_4K - 1)) >> PAGE_SHIFT_4K))
/*
 * Returns bit offset within a DWORD of a bitfield.
 * The member's offset inside @_struct is taken as its bit position, reduced
 * modulo 32. Uses offsetof() (as AMAP_SET_BITS/AMAP_GET_BITS already do)
 * instead of open-coded arithmetic on a null pointer.
 */
#define AMAP_BIT_OFFSET(_struct, field)				\
		(offsetof(_struct, field) % 32)
626 /* Returns the bit mask of the field that is NOT shifted into location. */
627 static inline u32 amap_mask(u32 bitsize)
629 return (bitsize == 32 ? 0xFFFFFFFF : (1 << bitsize) - 1);
/*
 * Store @value into a bit-field of the dword at index @dw_offset from @ptr:
 * the field (@mask << @offset) is cleared first, then (@mask & @value) is
 * OR-ed in at bit position @offset. @mask is the unshifted field mask.
 */
633 amap_set(void *ptr, u32 dw_offset, u32 mask, u32 offset, u32 value)
635 u32 *dw = (u32 *) ptr + dw_offset;
636 *dw &= ~(mask << offset);
637 *dw |= (mask & value) << offset;
640 #define AMAP_SET_BITS(_struct, field, ptr, val) \
642 offsetof(_struct, field)/32, \
643 amap_mask(sizeof(((_struct *)0)->field)), \
644 AMAP_BIT_OFFSET(_struct, field), \
/*
 * Read a bit-field from the dword at index @dw_offset from @ptr: the dword
 * is shifted right by @offset and masked with the unshifted field @mask.
 * Returns the field value.
 */
647 static inline u32 amap_get(void *ptr, u32 dw_offset, u32 mask, u32 offset)
649 u32 *dw = (u32 *) ptr;
650 return mask & (*(dw + dw_offset) >> offset);
653 #define AMAP_GET_BITS(_struct, field, ptr) \
655 offsetof(_struct, field)/32, \
656 amap_mask(sizeof(((_struct *)0)->field)), \
657 AMAP_BIT_OFFSET(_struct, field))
/*
 * Shorthands that fix the layout-struct argument of AMAP_GET_BITS /
 * AMAP_SET_BITS for the v0 and v1 RX completions, the TX completion and
 * the TX header WRB; @field names a member of the respective amap struct.
 */
659 #define GET_RX_COMPL_V0_BITS(field, ptr) \
660 AMAP_GET_BITS(struct amap_eth_rx_compl_v0, field, ptr)
662 #define GET_RX_COMPL_V1_BITS(field, ptr) \
663 AMAP_GET_BITS(struct amap_eth_rx_compl_v1, field, ptr)
665 #define GET_TX_COMPL_BITS(field, ptr) \
666 AMAP_GET_BITS(struct amap_eth_tx_compl, field, ptr)
668 #define SET_TX_WRB_HDR_BITS(field, ptr, val) \
669 AMAP_SET_BITS(struct amap_eth_hdr_wrb, field, ptr, val)
671 #define be_dws_cpu_to_le(wrb, len) swap_dws(wrb, len)
672 #define be_dws_le_to_cpu(wrb, len) swap_dws(wrb, len)
673 static inline void swap_dws(void *wrb, int len)
679 *dw = cpu_to_le32(*dw);
683 #endif /* __BIG_ENDIAN */
/*
 * Map a command status to a return code: any positive status becomes -EIO,
 * zero and negative values are passed through unchanged.
 * The argument is parenthesized so that expressions using low-precedence
 * operators (e.g. "a | b") are handled correctly; it is evaluated twice, so
 * it must be free of side effects.
 */
#define be_cmd_status(status)	((status) > 0 ? -EIO : (status))
688 static inline u8 is_tcp_pkt(struct sk_buff *skb)
692 if (ip_hdr(skb)->version == 4)
693 val = (ip_hdr(skb)->protocol == IPPROTO_TCP);
694 else if (ip_hdr(skb)->version == 6)
695 val = (ipv6_hdr(skb)->nexthdr == NEXTHDR_TCP);
700 static inline u8 is_udp_pkt(struct sk_buff *skb)
704 if (ip_hdr(skb)->version == 4)
705 val = (ip_hdr(skb)->protocol == IPPROTO_UDP);
706 else if (ip_hdr(skb)->version == 6)
707 val = (ipv6_hdr(skb)->nexthdr == NEXTHDR_UDP);
/*
 * True when @skb carries an IPv4 packet: skb->protocol is ETH_P_IP (in
 * network byte order) and the IP header's version field is 4.
 */
712 static inline bool is_ipv4_pkt(struct sk_buff *skb)
714 return skb->protocol == htons(ETH_P_IP) && ip_hdr(skb)->version == 4;
/* True when the adapter has more than one RX queue (num_rx_qs > 1). */
717 static inline bool be_multi_rxq(const struct be_adapter *adapter)
719 return adapter->num_rx_qs > 1;
/*
 * True when any of the adapter's error indications is set:
 * eeh_error, hw_error or fw_timeout.
 */
722 static inline bool be_error(struct be_adapter *adapter)
724 return adapter->eeh_error || adapter->hw_error || adapter->fw_timeout;
/*
 * True when eeh_error or hw_error is set; unlike be_error() this does not
 * consider fw_timeout.
 */
727 static inline bool be_hw_error(struct be_adapter *adapter)
729 return adapter->eeh_error || adapter->hw_error;
/*
 * Reset the three error indications tested by be_error():
 * eeh_error, hw_error and fw_timeout are all set to false.
 */
732 static inline void be_clear_all_error(struct be_adapter *adapter)
734 adapter->eeh_error = false;
735 adapter->hw_error = false;
736 adapter->fw_timeout = false;
739 void be_cq_notify(struct be_adapter *adapter, u16 qid, bool arm,
741 void be_link_status_update(struct be_adapter *adapter, u8 link_status);
742 void be_parse_stats(struct be_adapter *adapter);
743 int be_load_fw(struct be_adapter *adapter, u8 *func);
744 bool be_is_wol_supported(struct be_adapter *adapter);
745 bool be_pause_supported(struct be_adapter *adapter);
746 u32 be_get_fw_log_level(struct be_adapter *adapter);
747 int be_update_queues(struct be_adapter *adapter);
748 int be_poll(struct napi_struct *napi, int budget);
751 * Internal functions to initialize and clean up the RoCE device.
753 void be_roce_dev_add(struct be_adapter *);
754 void be_roce_dev_remove(struct be_adapter *);
757 * Internal functions to open/close the RoCE device during ifup/ifdown.
759 void be_roce_dev_open(struct be_adapter *);
760 void be_roce_dev_close(struct be_adapter *);
761 void be_roce_dev_shutdown(struct be_adapter *);