2 * Copyright (C) 2005 - 2011 Emulex
5 * This program is free software; you can redistribute it and/or
6 * modify it under the terms of the GNU General Public License version 2
7 * as published by the Free Software Foundation. The full GNU General
8 * Public License is included in this distribution in the file called COPYING.
10 * Contact Information:
11 * linux-drivers@emulex.com
15 * Costa Mesa, CA 92626
21 #include <linux/pci.h>
22 #include <linux/etherdevice.h>
23 #include <linux/delay.h>
27 #include <linux/if_vlan.h>
28 #include <linux/workqueue.h>
29 #include <linux/interrupt.h>
30 #include <linux/firmware.h>
31 #include <linux/slab.h>
32 #include <linux/u64_stats_sync.h>
/*
 * Driver identification strings.
 * The OC_NAME_* variants are built by string-literal concatenation with no
 * separating space, so e.g. OC_NAME_BE expands to
 * "Emulex OneConnect 10Gbps NIC(be3)".
 */
37 #define DRV_VER "4.2.248.0u"
38 #define DRV_NAME "be2net"
39 #define BE_NAME "ServerEngines BladeEngine2 10Gbps NIC"
40 #define BE3_NAME "ServerEngines BladeEngine3 10Gbps NIC"
41 #define OC_NAME "Emulex OneConnect 10Gbps NIC"
42 #define OC_NAME_BE OC_NAME "(be3)"
43 #define OC_NAME_LANCER OC_NAME "(Lancer)"
44 #define OC_NAME_SH OC_NAME "(Skyhawk)"
45 #define DRV_DESC "ServerEngines BladeEngine 10Gbps NIC Driver"
47 #define BE_VENDOR_ID 0x19a2
48 #define EMULEX_VENDOR_ID 0x10df
49 #define BE_DEVICE_ID1 0x211
50 #define BE_DEVICE_ID2 0x221
51 #define OC_DEVICE_ID1 0x700 /* Device Id for BE2 cards */
52 #define OC_DEVICE_ID2 0x710 /* Device Id for BE3 cards */
53 #define OC_DEVICE_ID3 0xe220 /* Device id for Lancer cards */
54 #define OC_DEVICE_ID4 0xe228 /* Device id for VF in Lancer */
55 #define OC_DEVICE_ID5 0x720 /* Device Id for Skyhawk cards */
56 #define OC_SUBSYS_DEVICE_ID1 0xE602
57 #define OC_SUBSYS_DEVICE_ID2 0xE642
58 #define OC_SUBSYS_DEVICE_ID3 0xE612
59 #define OC_SUBSYS_DEVICE_ID4 0xE652
61 static inline char *nic_name(struct pci_dev *pdev)
63 switch (pdev->device) {
70 return OC_NAME_LANCER;
80 /* Number of bytes of an RX frame that are copied to skb->data */
81 #define BE_HDR_LEN ((u16) 64)
82 /* allocate extra space to allow tunneling decapsulation without head reallocation */
83 #define BE_RX_SKB_ALLOC_SIZE (BE_HDR_LEN + 64)
85 #define BE_MAX_JUMBO_FRAME_SIZE 9018
86 #define BE_MIN_MTU 256
88 #define BE_NUM_VLANS_SUPPORTED 64
89 #define BE_MAX_EQD 96u
90 #define BE_MAX_TX_FRAG_COUNT 30
92 #define EVNT_Q_LEN 1024
94 #define TX_CQ_LEN 1024
95 #define RX_Q_LEN 1024 /* Does not support any other value */
96 #define RX_CQ_LEN 1024
97 #define MCC_Q_LEN 128 /* total size not to exceed 8 pages */
98 #define MCC_CQ_LEN 256
100 #define BE3_MAX_RSS_QS 8
101 #define BE2_MAX_RSS_QS 4
102 #define MAX_RSS_QS BE3_MAX_RSS_QS
103 #define MAX_RX_QS (MAX_RSS_QS + 1) /* RSS qs + 1 def Rx */
106 #define MAX_ROCE_EQS 5
107 #define MAX_MSIX_VECTORS (MAX_RSS_QS + MAX_ROCE_EQS) /* RSS qs + RoCE */
108 #define BE_TX_BUDGET 256
109 #define BE_NAPI_WEIGHT 64
110 #define MAX_RX_POST BE_NAPI_WEIGHT /* Frags posted at a time */
111 #define RX_FRAGS_REFILL_WM (RX_Q_LEN - MAX_RX_POST)
113 #define FW_VER_LEN 32
121 struct be_queue_info {
122 struct be_dma_mem dma_mem;
124 u16 entry_size; /* Size of an element in the queue */
128 atomic_t used; /* Number of valid elements in the queue */
/*
 * Reduce val modulo limit by masking with (limit - 1).
 * limit is expected to be a power of two: BUG_ON() fires whenever
 * limit & (limit - 1) is non-zero.
 */
131 static inline u32 MODULO(u16 val, u16 limit)
133 BUG_ON(limit & (limit - 1));
134 return val & (limit - 1);
/* Advance *index by val entries, wrapping around at limit via MODULO(). */
137 static inline void index_adv(u16 *index, u16 val, u16 limit)
139 *index = MODULO((*index + val), limit);
/* Advance *index by one entry, wrapping around at limit via MODULO(). */
142 static inline void index_inc(u16 *index, u16 limit)
144 *index = MODULO((*index + 1), limit);
/*
 * Return the address of the entry at the queue's head index:
 * q->dma_mem.va offset by q->head * q->entry_size.
 */
147 static inline void *queue_head_node(struct be_queue_info *q)
149 return q->dma_mem.va + q->head * q->entry_size;
/*
 * Return the address of the entry at the queue's tail index:
 * q->dma_mem.va offset by q->tail * q->entry_size.
 */
152 static inline void *queue_tail_node(struct be_queue_info *q)
154 return q->dma_mem.va + q->tail * q->entry_size;
/*
 * Return the address of the entry at the given index:
 * q->dma_mem.va offset by index * q->entry_size.
 * index is not range-checked against the queue length here.
 */
157 static inline void *queue_index_node(struct be_queue_info *q, u16 index)
159 return q->dma_mem.va + index * q->entry_size;
/* Advance the queue's head index by one entry, wrapping at q->len. */
162 static inline void queue_head_inc(struct be_queue_info *q)
164 index_inc(&q->head, q->len);
/*
 * Step *index back by one entry, wrapping at limit via MODULO().
 * Stepping back from 0 yields limit - 1 for a power-of-two limit, because
 * the int result -1 is truncated to u16 before being masked.
 */
167 static inline void index_dec(u16 *index, u16 limit)
169 *index = MODULO((*index - 1), limit);
/* Advance the queue's tail index by one entry, wrapping at q->len. */
172 static inline void queue_tail_inc(struct be_queue_info *q)
174 index_inc(&q->tail, q->len);
178 struct be_queue_info q;
181 /* Adaptive interrupt coalescing (AIC) info */
183 u32 min_eqd; /* in usecs */
184 u32 max_eqd; /* in usecs */
185 u32 eqd; /* configured val when aic is off */
186 u32 cur_eqd; /* in usecs */
188 u8 idx; /* array index */
190 struct napi_struct napi;
191 struct be_adapter *adapter;
192 } ____cacheline_aligned_in_smp;
195 struct be_queue_info q;
196 struct be_queue_info cq;
208 struct u64_stats_sync sync;
209 struct u64_stats_sync sync_compl;
213 struct be_queue_info q;
214 struct be_queue_info cq;
215 /* Remember the skbs that were transmitted */
216 struct sk_buff *sent_skb_list[TX_Q_LEN];
217 struct be_tx_stats stats;
218 } ____cacheline_aligned_in_smp;
220 /* Struct to remember the pages posted for rx frags */
221 struct be_rx_page_info {
223 DEFINE_DMA_UNMAP_ADDR(bus);
233 u32 rx_drops_no_skbs; /* skb allocation errors */
234 u32 rx_drops_no_frags; /* HW has no fetched frags */
235 u32 rx_post_fail; /* page post alloc failures */
238 u32 rx_compl_err; /* completions with err set */
239 u32 rx_pps; /* pkts per second */
240 struct u64_stats_sync sync;
243 struct be_rx_compl_info {
263 struct be_adapter *adapter;
264 struct be_queue_info q;
265 struct be_queue_info cq;
266 struct be_rx_compl_info rxcp;
267 struct be_rx_page_info page_info_tbl[RX_Q_LEN];
268 struct be_rx_stats stats;
270 bool rx_post_starved; /* Zero rx frags have been posted to BE */
271 } ____cacheline_aligned_in_smp;
273 struct be_drv_stats {
274 u32 be_on_die_temperature;
276 u32 rx_drops_no_pbuf;
277 u32 rx_drops_no_txpb;
278 u32 rx_drops_no_erx_descr;
279 u32 rx_drops_no_tpre_descr;
280 u32 rx_drops_too_many_frags;
281 u32 forwarded_packets;
284 u32 rx_alignment_symbol_errors;
286 u32 rx_priority_pause_frames;
287 u32 rx_control_frames;
288 u32 rx_in_range_errors;
289 u32 rx_out_range_errors;
290 u32 rx_frame_too_long;
291 u32 rx_address_mismatch_drops;
292 u32 rx_dropped_too_small;
293 u32 rx_dropped_too_short;
294 u32 rx_dropped_header_too_small;
295 u32 rx_dropped_tcp_length;
297 u32 rx_ip_checksum_errs;
298 u32 rx_tcp_checksum_errs;
299 u32 rx_udp_checksum_errs;
301 u32 tx_priority_pauseframes;
302 u32 tx_controlframes;
303 u32 rxpp_fifo_overflow_drop;
304 u32 rx_input_fifo_overflow_drop;
305 u32 pmem_fifo_overflow_drop;
310 unsigned char mac_addr[ETH_ALEN];
323 #define BE_FLAGS_LINK_STATUS_INIT 1
324 #define BE_FLAGS_WORKER_SCHEDULED (1 << 3)
325 #define BE_UC_PMAC_COUNT 30
326 #define BE_VF_UC_PMAC_COUNT 2
336 u16 auto_speeds_supported;
337 u16 fixed_speeds_supported;
339 int forced_port_speed;
346 struct pci_dev *pdev;
347 struct net_device *netdev;
350 u8 __iomem *db; /* Door Bell */
352 struct mutex mbox_lock; /* For serializing mbox cmds to BE card */
353 struct be_dma_mem mbox_mem;
354 /* Mbox mem is adjusted to align to 16 bytes. The allocated addr
355 * is stored for freeing purpose */
356 struct be_dma_mem mbox_mem_alloced;
358 struct be_mcc_obj mcc_obj;
359 spinlock_t mcc_lock; /* For serializing mcc cmds to BE card */
360 spinlock_t mcc_cq_lock;
364 struct be_eq_obj eq_obj[MAX_MSIX_VECTORS];
365 struct msix_entry msix_entries[MAX_MSIX_VECTORS];
370 struct be_tx_obj tx_obj[MAX_TX_QS];
374 struct be_rx_obj rx_obj[MAX_RX_QS];
375 u32 big_page_size; /* Compounded page size shared by rx wrbs */
378 struct be_drv_stats drv_stats;
381 u16 max_vlans; /* Number of vlans supported */
382 u8 vlan_tag[VLAN_N_VID];
383 u8 vlan_prio_bmap; /* Available Priority BitMap */
384 u16 recommended_prio; /* Recommended Priority */
385 struct be_dma_mem rx_filter; /* Cmd DMA mem for rx-filter */
387 struct be_dma_mem stats_cmd;
388 /* Work queue used to perform periodic tasks like getting statistics */
389 struct delayed_work work;
392 struct delayed_work func_recovery_work;
394 /* Ethtool knobs and info */
395 char fw_ver[FW_VER_LEN];
396 int if_handle; /* Used to configure filtering */
397 u32 *pmac_id; /* MAC addr handle used by BE card */
398 u32 beacon_state; /* for set_phys_id */
408 u32 rx_fc; /* Rx flow control */
409 u32 tx_fc; /* Tx flow control */
411 u8 generation; /* BladeEngine ASIC generation */
414 u8 __iomem *base; /* Door Bell */
419 u32 num_msix_roce_vec;
420 struct ocrdma_dev *ocrdma_dev;
421 struct list_head entry;
424 struct completion flash_compl;
426 u32 num_vfs; /* Number of VFs provisioned by PF driver */
427 u32 dev_num_vfs; /* Number of VFs supported by HW */
429 struct be_vf_cfg *vf_cfg;
437 u32 max_pmac_cnt; /* Max secondary UC MACs programmable */
438 u32 uc_macs; /* Count of secondary UC MAC programmed */
440 int be_get_temp_freq;
/*
 * Both macros take a pointer to the adapter. The argument is parenthesised so
 * that any pointer expression (e.g. &adapter_obj) expands correctly.
 */
/* True when the adapter's virtfn flag is not set */
#define be_physfn(adapter)		(!(adapter)->virtfn)
/* True when at least one VF has been provisioned (num_vfs > 0) */
#define sriov_enabled(adapter)		((adapter)->num_vfs > 0)
445 #define sriov_want(adapter) (adapter->dev_num_vfs && num_vfs && \
447 #define for_all_vfs(adapter, vf_cfg, i) \
448 for (i = 0, vf_cfg = &adapter->vf_cfg[i]; i < adapter->num_vfs; \
451 /* BladeEngine Generation numbers */
/*
 * True when the adapter's PCI device id is one of the Lancer ids
 * (OC_DEVICE_ID3, or OC_DEVICE_ID4 for a Lancer VF).
 * The argument is parenthesised so any pointer expression may be passed.
 */
#define lancer_chip(adapter)	(((adapter)->pdev->device == OC_DEVICE_ID3) || \
				 ((adapter)->pdev->device == OC_DEVICE_ID4))
/*
 * True when RDMA_ENABLED is set in function_mode and the adapter is either
 * SLI interface type 3 or of the Skyhawk SLI family.
 * The argument is parenthesised so any pointer expression may be passed.
 */
#define be_roce_supported(adapter) \
	(((adapter)->if_type == SLI_INTF_TYPE_3 || \
	  (adapter)->sli_family == SKYHAWK_SLI_FAMILY) && \
	 ((adapter)->function_mode & RDMA_ENABLED))
464 extern const struct ethtool_ops be_ethtool_ops;
/* True when at least one MSI-X vector is in use (num_msix_vec > 0) */
#define msix_enabled(adapter)	((adapter)->num_msix_vec > 0)
/* Number of IRQs in use: num_msix_vec under MSI-X, otherwise a single IRQ */
#define num_irqs(adapter)	(msix_enabled(adapter) ? \
				 (adapter)->num_msix_vec : 1)
469 #define tx_stats(txo) (&(txo)->stats)
470 #define rx_stats(rxo) (&(rxo)->stats)
/*
 * The default RXQ is the last RXQ: yields a pointer to
 * rx_obj[num_rx_qs - 1]. The argument is parenthesised so any pointer
 * expression may be passed; it is evaluated twice.
 */
#define default_rxo(adpt)	(&(adpt)->rx_obj[(adpt)->num_rx_qs - 1])
475 #define for_all_rx_queues(adapter, rxo, i) \
476 for (i = 0, rxo = &adapter->rx_obj[i]; i < adapter->num_rx_qs; \
479 /* Skip the default non-rss queue (last one)*/
480 #define for_all_rss_queues(adapter, rxo, i) \
481 for (i = 0, rxo = &adapter->rx_obj[i]; i < (adapter->num_rx_qs - 1);\
484 #define for_all_tx_queues(adapter, txo, i) \
485 for (i = 0, txo = &adapter->tx_obj[i]; i < adapter->num_tx_qs; \
488 #define for_all_evt_queues(adapter, eqo, i) \
489 for (i = 0, eqo = &adapter->eq_obj[i]; i < adapter->num_evt_qs; \
/* True when the event-queue object is the one at array index 0 */
#define is_mcc_eqo(eqo)		((eqo)->idx == 0)
/* Pointer to the adapter's first event-queue object, eq_obj[0] */
#define mcc_eqo(adapter)	(&(adapter)->eq_obj[0])
/* Fixed 4K page geometry: shift of 12, size 1 << 12 = 4096 bytes */
495 #define PAGE_SHIFT_4K 12
496 #define PAGE_SIZE_4K (1 << PAGE_SHIFT_4K)
498 /* Returns the number of 4K pages spanned by `size` bytes of data starting at `_address`: the offset of _address within its 4K page plus size, rounded up to whole 4K pages */
499 #define PAGES_4K_SPANNED(_address, size) \
500 ((u32)((((size_t)(_address) & (PAGE_SIZE_4K - 1)) + \
501 (size) + (PAGE_SIZE_4K - 1)) >> PAGE_SHIFT_4K))
/*
 * Returns bit offset within a DWORD of a bitfield.
 * The field's offset inside _struct is taken modulo 32. offsetof() is used,
 * as in the other AMAP macros, instead of taking a member address through a
 * null pointer.
 */
#define AMAP_BIT_OFFSET(_struct, field)				\
		(offsetof(_struct, field) % 32)
507 /* Returns the bit mask of the field that is NOT shifted into location. */
508 static inline u32 amap_mask(u32 bitsize)
510 return (bitsize == 32 ? 0xFFFFFFFF : (1 << bitsize) - 1);
514 amap_set(void *ptr, u32 dw_offset, u32 mask, u32 offset, u32 value)
516 u32 *dw = (u32 *) ptr + dw_offset;
517 *dw &= ~(mask << offset);
518 *dw |= (mask & value) << offset;
521 #define AMAP_SET_BITS(_struct, field, ptr, val) \
523 offsetof(_struct, field)/32, \
524 amap_mask(sizeof(((_struct *)0)->field)), \
525 AMAP_BIT_OFFSET(_struct, field), \
/*
 * Read a bitfield: take the 32-bit word at index dw_offset from ptr,
 * shift it right by offset bits and AND the result with mask.
 */
528 static inline u32 amap_get(void *ptr, u32 dw_offset, u32 mask, u32 offset)
530 u32 *dw = (u32 *) ptr;
531 return mask & (*(dw + dw_offset) >> offset);
534 #define AMAP_GET_BITS(_struct, field, ptr) \
536 offsetof(_struct, field)/32, \
537 amap_mask(sizeof(((_struct *)0)->field)), \
538 AMAP_BIT_OFFSET(_struct, field))
540 #define be_dws_cpu_to_le(wrb, len) swap_dws(wrb, len)
541 #define be_dws_le_to_cpu(wrb, len) swap_dws(wrb, len)
542 static inline void swap_dws(void *wrb, int len)
548 *dw = cpu_to_le32(*dw);
552 #endif /* __BIG_ENDIAN */
555 static inline u8 is_tcp_pkt(struct sk_buff *skb)
559 if (ip_hdr(skb)->version == 4)
560 val = (ip_hdr(skb)->protocol == IPPROTO_TCP);
561 else if (ip_hdr(skb)->version == 6)
562 val = (ipv6_hdr(skb)->nexthdr == NEXTHDR_TCP);
567 static inline u8 is_udp_pkt(struct sk_buff *skb)
571 if (ip_hdr(skb)->version == 4)
572 val = (ip_hdr(skb)->protocol == IPPROTO_UDP);
573 else if (ip_hdr(skb)->version == 6)
574 val = (ipv6_hdr(skb)->nexthdr == NEXTHDR_UDP);
/*
 * True when skb->protocol equals ETH_P_IP (compared in network byte order)
 * and the version field of the skb's IP header is 4.
 */
579 static inline bool is_ipv4_pkt(struct sk_buff *skb)
581 return skb->protocol == htons(ETH_P_IP) && ip_hdr(skb)->version == 4;
/*
 * Fill in a 6-byte MAC address in mac[]:
 *  - mac[3..5] take the low 24 bits of a jhash over the netdev's current
 *    dev_addr (mac[5] is the lowest byte, mac[3] is bits 16..23);
 *  - mac[0..2] are copied from the netdev's current dev_addr.
 */
584 static inline void be_vf_eth_addr_generate(struct be_adapter *adapter, u8 *mac)
588 addr = jhash(adapter->netdev->dev_addr, ETH_ALEN, 0);
590 mac[5] = (u8)(addr & 0xFF);
591 mac[4] = (u8)((addr >> 8) & 0xFF);
592 mac[3] = (u8)((addr >> 16) & 0xFF);
593 /* Use the OUI from the current MAC address */
594 memcpy(mac, adapter->netdev->dev_addr, 3);
/* True when the adapter has more than one RX queue (num_rx_qs > 1). */
597 static inline bool be_multi_rxq(const struct be_adapter *adapter)
599 return adapter->num_rx_qs > 1;
/* True when any of eeh_error, hw_error or fw_timeout is set on the adapter. */
602 static inline bool be_error(struct be_adapter *adapter)
604 return adapter->eeh_error || adapter->hw_error || adapter->fw_timeout;
/*
 * True when eeh_error or hw_error is set on the adapter.
 * Unlike be_error(), fw_timeout is not taken into account.
 */
607 static inline bool be_crit_error(struct be_adapter *adapter)
609 return adapter->eeh_error || adapter->hw_error;
/* Reset the adapter's eeh_error, hw_error and fw_timeout flags to false. */
612 static inline void be_clear_all_error(struct be_adapter *adapter)
614 adapter->eeh_error = false;
615 adapter->hw_error = false;
616 adapter->fw_timeout = false;
619 static inline bool be_is_wol_excluded(struct be_adapter *adapter)
621 struct pci_dev *pdev = adapter->pdev;
623 if (!be_physfn(adapter))
626 switch (pdev->subsystem_device) {
627 case OC_SUBSYS_DEVICE_ID1:
628 case OC_SUBSYS_DEVICE_ID2:
629 case OC_SUBSYS_DEVICE_ID3:
630 case OC_SUBSYS_DEVICE_ID4:
/*
 * True when adapter->if_type is SLI_INTF_TYPE_2 or SLI_INTF_TYPE_3.
 * NOTE(review): the trailing "? true : false" is redundant, since the
 * comparison already yields a boolean value.
 */
637 static inline bool be_type_2_3(struct be_adapter *adapter)
639 return (adapter->if_type == SLI_INTF_TYPE_2 ||
640 adapter->if_type == SLI_INTF_TYPE_3) ? true : false;
643 extern void be_cq_notify(struct be_adapter *adapter, u16 qid, bool arm,
645 extern void be_link_status_update(struct be_adapter *adapter, u8 link_status);
646 extern void be_parse_stats(struct be_adapter *adapter);
647 extern int be_load_fw(struct be_adapter *adapter, u8 *func);
648 extern bool be_is_wol_supported(struct be_adapter *adapter);
649 extern bool be_pause_supported(struct be_adapter *adapter);
650 extern u32 be_get_fw_log_level(struct be_adapter *adapter);
653 * internal function to initialize-cleanup roce device.
655 extern void be_roce_dev_add(struct be_adapter *);
656 extern void be_roce_dev_remove(struct be_adapter *);
659 * internal function to open-close roce device during ifup-ifdown.
661 extern void be_roce_dev_open(struct be_adapter *);
662 extern void be_roce_dev_close(struct be_adapter *);