1 /* SPDX-License-Identifier: GPL-2.0 */
2 /* Copyright (c) 2018, Intel Corporation. */
7 #include <linux/types.h>
8 #include <linux/errno.h>
9 #include <linux/kernel.h>
10 #include <linux/module.h>
11 #include <linux/firmware.h>
12 #include <linux/netdevice.h>
13 #include <linux/compiler.h>
14 #include <linux/etherdevice.h>
15 #include <linux/skbuff.h>
16 #include <linux/cpumask.h>
17 #include <linux/rtnetlink.h>
18 #include <linux/if_vlan.h>
19 #include <linux/dma-mapping.h>
20 #include <linux/pci.h>
21 #include <linux/workqueue.h>
22 #include <linux/aer.h>
23 #include <linux/interrupt.h>
24 #include <linux/ethtool.h>
25 #include <linux/timer.h>
26 #include <linux/delay.h>
27 #include <linux/bitmap.h>
28 #include <linux/log2.h>
30 #include <linux/sctp.h>
31 #include <linux/ipv6.h>
32 #include <linux/pkt_sched.h>
33 #include <linux/if_bridge.h>
34 #include <linux/ctype.h>
35 #include <linux/bpf.h>
36 #include <linux/avf/virtchnl.h>
37 #include <net/devlink.h>
39 #include <net/xdp_sock.h>
40 #include <net/geneve.h>
42 #include <net/udp_tunnel.h>
43 #include <net/vxlan.h>
44 #include "ice_devids.h"
48 #include "ice_switch.h"
49 #include "ice_common.h"
50 #include "ice_sched.h"
51 #include "ice_virtchnl_pf.h"
52 #include "ice_sriov.h"
55 extern const char ice_drv_ver[];
57 #define ICE_REQ_DESC_MULTIPLE 32 /* NOTE(review): presumably ring sizes must be a multiple of this - confirm */
58 #define ICE_MIN_NUM_DESC 64 /* equals 2 * ICE_REQ_DESC_MULTIPLE */
59 #define ICE_MAX_NUM_DESC 8160 /* equals 255 * ICE_REQ_DESC_MULTIPLE */
60 #define ICE_DFLT_MIN_RX_DESC 512
61 #define ICE_DFLT_NUM_TX_DESC 256
62 #define ICE_DFLT_NUM_RX_DESC 2048
64 #define ICE_DFLT_TRAFFIC_CLASS BIT(0) /* mask with only bit 0 set */
65 #define ICE_INT_NAME_STR_LEN (IFNAMSIZ + 16) /* sizes ice_q_vector.name[] and the int_name[] buffer in this file */
67 #define ICE_MBXSQ_LEN 64
68 #define ICE_MIN_MSIX 2
69 #define ICE_NO_VSI 0xffff
70 #define ICE_VSI_MAP_CONTIG 0
71 #define ICE_VSI_MAP_SCATTER 1
72 #define ICE_MAX_SCATTER_TXQS 16
73 #define ICE_MAX_SCATTER_RXQS 16
74 #define ICE_Q_WAIT_RETRY_LIMIT 10
75 #define ICE_Q_WAIT_MAX_RETRY (5 * ICE_Q_WAIT_RETRY_LIMIT) /* 5 * 10 = 50 */
76 #define ICE_MAX_LG_RSS_QS 256
77 #define ICE_RES_VALID_BIT 0x8000 /* bit 15 */
78 #define ICE_RES_MISC_VEC_ID (ICE_RES_VALID_BIT - 1) /* 0x7fff: every bit below ICE_RES_VALID_BIT */
79 #define ICE_INVAL_Q_INDEX 0xffff
80 #define ICE_INVAL_VFID 256
82 #define ICE_MAX_RESET_WAIT 20
84 #define ICE_VSIQF_HKEY_ARRAY_SIZE ((VSIQF_HKEY_MAX_INDEX + 1) * 4) /* (number of indices 0..VSIQF_HKEY_MAX_INDEX) * 4; presumably 4 bytes each - confirm */
86 #define ICE_DFLT_NETIF_M (NETIF_MSG_DRV | NETIF_MSG_PROBE | NETIF_MSG_LINK)
88 #define ICE_MAX_MTU (ICE_AQ_SET_MAC_FRAME_SIZE_MAX - ICE_ETH_PKT_HDR_PAD) /* both operands are defined outside this file */
90 #define ICE_UP_TABLE_TRANSLATE(val, i) \
91 (((val) << ICE_AQ_VSI_UP_TABLE_UP##i##_S) & \
92 ICE_AQ_VSI_UP_TABLE_UP##i##_M) /* val shifted left by the UP<i> _S constant, then masked with the UP<i> _M constant; i is token-pasted, so it must be a literal */
94 #define ICE_TX_DESC(R, i) (&(((struct ice_tx_desc *)((R)->desc))[i])) /* address of element i, viewing (R)->desc as an array of struct ice_tx_desc */
95 #define ICE_RX_DESC(R, i) (&(((union ice_32b_rx_flex_desc *)((R)->desc))[i])) /* address of element i, viewing (R)->desc as an array of union ice_32b_rx_flex_desc */
96 #define ICE_TX_CTX_DESC(R, i) (&(((struct ice_tx_ctx_desc *)((R)->desc))[i])) /* address of element i, viewing (R)->desc as an array of struct ice_tx_ctx_desc */
98 /* Loop header that steps i over 0 .. (pf)->num_alloc_vsi - 1; a statement or block must follow, and i is evaluated several times */
99 #define ice_for_each_vsi(pf, i) \
100 for ((i) = 0; (i) < (pf)->num_alloc_vsi; (i)++)
102 /* Loop headers that step i over a VSI's used Tx/Rx rings: 0 .. num_txq - 1 and 0 .. num_rxq - 1 respectively */
103 #define ice_for_each_txq(vsi, i) \
104 for ((i) = 0; (i) < (vsi)->num_txq; (i)++)
106 #define ice_for_each_rxq(vsi, i) \
107 for ((i) = 0; (i) < (vsi)->num_rxq; (i)++)
109 /* Loop headers that step i over every allocated Tx/Rx ring of a VSI, used or not: 0 .. alloc_txq - 1 and 0 .. alloc_rxq - 1 respectively */
110 #define ice_for_each_alloc_txq(vsi, i) \
111 for ((i) = 0; (i) < (vsi)->alloc_txq; (i)++)
113 #define ice_for_each_alloc_rxq(vsi, i) \
114 for ((i) = 0; (i) < (vsi)->alloc_rxq; (i)++)
116 #define ice_for_each_q_vector(vsi, i) \
117 for ((i) = 0; (i) < (vsi)->num_q_vectors; (i)++) /* loop header stepping i over 0 .. (vsi)->num_q_vectors - 1 */
119 #define ICE_UCAST_PROMISC_BITS (ICE_PROMISC_UCAST_TX | ICE_PROMISC_MCAST_TX | \
120 ICE_PROMISC_UCAST_RX | ICE_PROMISC_MCAST_RX) /* NOTE(review): despite the UCAST name this also ORs in the MCAST Tx/Rx bits - confirm this is intended */
122 #define ICE_UCAST_VLAN_PROMISC_BITS (ICE_PROMISC_UCAST_TX | \
123 ICE_PROMISC_MCAST_TX | \
124 ICE_PROMISC_UCAST_RX | \
125 ICE_PROMISC_MCAST_RX | \
126 ICE_PROMISC_VLAN_TX | \
129 #define ICE_MCAST_PROMISC_BITS (ICE_PROMISC_MCAST_TX | ICE_PROMISC_MCAST_RX) /* the multicast promiscuous bit for Tx ORed with the one for Rx */
131 #define ICE_MCAST_VLAN_PROMISC_BITS (ICE_PROMISC_MCAST_TX | \
132 ICE_PROMISC_MCAST_RX | \
133 ICE_PROMISC_VLAN_TX | \
136 #define ice_pf_to_dev(pf) (&((pf)->pdev->dev)) /* address of the dev member of the PF's pci_dev; dereferences (pf)->pdev, so it must be non-NULL */
138 struct ice_txq_meta {
139 u32 q_teid; /* Tx-scheduler element identifier */
140 u16 q_id; /* Entry in VSI's txq_map bitmap */
141 u16 q_handle; /* Relative index of Tx queue within TC */
142 u16 vsi_idx; /* VSI index that Tx queue belongs to */
143 u8 tc; /* TC number that Tx queue belongs to */
154 u8 numtc; /* Total number of enabled TCs */
155 u8 ena_tc; /* Tx map */
156 struct ice_tc_info tc_info[ICE_MAX_TRAFFIC_CLASS];
159 struct ice_res_tracker {
166 struct mutex *qs_mutex; /* will be assigned to &pf->avail_q_mutex */
167 unsigned long *pf_map;
168 unsigned long pf_map_size;
169 unsigned int q_count;
170 unsigned int scatter_count;
178 u16 sw_id; /* switch ID for this switch */
179 u16 bridge_mode; /* VEB/VEPA/Port Virtualizer */
180 struct ice_vsi *dflt_vsi; /* default VSI for this switch */
181 u8 dflt_vsi_ena:1; /* true if above dflt_vsi is enabled */
188 __ICE_PREPARED_FOR_RESET, /* set by driver when prepared */
189 __ICE_RESET_OICR_RECV, /* set by driver after rcv reset OICR */
190 __ICE_DCBNL_DEVRESET, /* set by dcbnl devreset */
191 __ICE_PFR_REQ, /* set by driver and peers */
192 __ICE_CORER_REQ, /* set by driver and peers */
193 __ICE_GLOBR_REQ, /* set by driver and peers */
194 __ICE_CORER_RECV, /* set by OICR handler */
195 __ICE_GLOBR_RECV, /* set by OICR handler */
196 __ICE_EMPR_RECV, /* set by OICR handler */
197 __ICE_SUSPENDED, /* set on module remove path */
198 __ICE_RESET_FAILED, /* set by reset/rebuild */
199 /* When checking for the PF to be in a nominal operating state, the
200 * bits that are grouped at the beginning of the list need to be
201 * checked. Bits occurring before __ICE_STATE_NOMINAL_CHECK_BITS will
202 * be checked. If you need to add a bit into consideration for nominal
203 * operating state, it must be added before
204 * __ICE_STATE_NOMINAL_CHECK_BITS. Do not move this entry's position
205 * without appropriate consideration.
207 __ICE_STATE_NOMINAL_CHECK_BITS,
208 __ICE_ADMINQ_EVENT_PENDING,
209 __ICE_MAILBOXQ_EVENT_PENDING,
210 __ICE_MDD_EVENT_PENDING,
211 __ICE_VFLR_EVENT_PENDING,
212 __ICE_FLTR_OVERFLOW_PROMISC,
217 __ICE_OICR_INTR_DIS, /* Global OICR interrupt disabled */
218 __ICE_MDD_VF_PRINT_PENDING, /* set when an MDD event is handled */
219 __ICE_VF_RESETS_DISABLED, /* disable resets during ice_remove */
220 __ICE_STATE_NBITS /* must be last */
224 ICE_VSI_FLAG_UMAC_FLTR_CHANGED,
225 ICE_VSI_FLAG_MMAC_FLTR_CHANGED,
226 ICE_VSI_FLAG_VLAN_FLTR_CHANGED,
227 ICE_VSI_FLAG_PROMISC_CHANGED,
228 ICE_VSI_FLAG_NBITS /* must be last */
231 /* struct that defines a VSI, associated with a dev */
233 struct net_device *netdev;
234 struct ice_sw *vsw; /* switch this VSI is on */
235 struct ice_pf *back; /* back pointer to PF */
236 struct ice_port_info *port_info; /* back pointer to port_info */
237 struct ice_ring **rx_rings; /* Rx ring array */
238 struct ice_ring **tx_rings; /* Tx ring array */
239 struct ice_q_vector **q_vectors; /* q_vector array */
241 irqreturn_t (*irq_handler)(int irq, void *data);
244 DECLARE_BITMAP(state, __ICE_STATE_NBITS);
245 DECLARE_BITMAP(flags, ICE_VSI_FLAG_NBITS);
246 unsigned int current_netdev_flags;
252 int base_vector; /* IRQ base for OS reserved vectors */
253 enum ice_vsi_type type;
254 u16 vsi_num; /* HW (absolute) index of this VSI */
255 u16 idx; /* software index in pf->vsi[] */
257 s16 vf_id; /* VF ID for SR-IOV VSIs */
259 u16 ethtype; /* Ethernet protocol for pause frame */
262 u16 rss_table_size; /* HW RSS table size */
263 u16 rss_size; /* Allocated RSS queues */
264 u8 *rss_hkey_user; /* User configured hash keys */
265 u8 *rss_lut_user; /* User configured lookup table entries */
266 u8 rss_lut_type; /* used to configure Get/Set RSS LUT AQ call */
271 struct ice_aqc_vsi_props info; /* VSI properties */
274 struct rtnl_link_stats64 net_stats;
275 struct ice_eth_stats eth_stats;
276 struct ice_eth_stats eth_stats_prev;
278 struct list_head tmp_sync_list; /* MAC filters to be synced */
279 struct list_head tmp_unsync_list; /* MAC filters to be unsynced */
282 u8 current_isup:1; /* Sync 'link up' logging */
283 u8 stat_offsets_loaded:1;
287 /* queue information */
288 u8 tx_mapping_mode; /* ICE_VSI_MAP_[CONTIG|SCATTER] */
289 u8 rx_mapping_mode; /* ICE_VSI_MAP_[CONTIG|SCATTER] */
290 u16 *txq_map; /* index in pf->avail_txqs */
291 u16 *rxq_map; /* index in pf->avail_rxqs */
292 u16 alloc_txq; /* Allocated Tx queues */
293 u16 num_txq; /* Used Tx queues */
294 u16 alloc_rxq; /* Allocated Rx queues */
295 u16 num_rxq; /* Used Rx queues */
296 u16 req_txq; /* User requested Tx queues */
297 u16 req_rxq; /* User requested Rx queues */
300 struct ice_tc_cfg tc_cfg;
301 struct bpf_prog *xdp_prog;
302 struct ice_ring **xdp_rings; /* XDP ring array */
303 u16 num_xdp_txq; /* Used XDP queues */
304 u8 xdp_mapping_mode; /* ICE_VSI_MAP_[CONTIG|SCATTER] */
305 struct xdp_umem **xsk_umems;
306 u16 num_xsk_umems_used;
308 } ____cacheline_internodealigned_in_smp;
310 /* struct that defines an interrupt vector: its NAPI context, Rx/Tx ring containers, IRQ affinity and name */
311 struct ice_q_vector {
314 u16 v_idx; /* index in the vsi->q_vectors array. */
316 u8 num_ring_rx; /* total number of Rx rings in vector */
317 u8 num_ring_tx; /* total number of Tx rings in vector */
318 u8 itr_countdown; /* when 0 should adjust adaptive ITR */
319 /* in usecs, need to use ice_intrl_to_usecs_reg() before writing this
320 * value to the device
324 struct napi_struct napi;
326 struct ice_ring_container rx;
327 struct ice_ring_container tx;
329 cpumask_t affinity_mask;
330 struct irq_affinity_notify affinity_notify;
332 char name[ICE_INT_NAME_STR_LEN];
333 } ____cacheline_internodealigned_in_smp;
339 ICE_FLAG_SRIOV_CAPABLE,
340 ICE_FLAG_DCB_CAPABLE,
342 ICE_FLAG_ADV_FEATURES,
343 ICE_FLAG_LINK_DOWN_ON_CLOSE_ENA,
345 ICE_FLAG_FW_LLDP_AGENT,
346 ICE_FLAG_ETHTOOL_CTXT, /* set when ethtool holds RTNL lock */
348 ICE_FLAG_VF_TRUE_PROMISC_ENA,
349 ICE_FLAG_MDD_AUTO_RESET_VF,
350 ICE_PF_FLAGS_NBITS /* must be last */
354 struct pci_dev *pdev;
356 /* devlink port data */
357 struct devlink_port devlink_port;
359 struct devlink_region *nvm_region;
361 /* OS reserved IRQ details */
362 struct msix_entry *msix_entries;
363 struct ice_res_tracker *irq_tracker;
364 /* First MSIX vector used by SR-IOV VFs. Calculated by subtracting the
365 * number of MSIX vectors needed for all SR-IOV VFs from the number of
366 * MSIX vectors allowed on this PF.
368 u16 sriov_base_vector;
370 struct ice_vsi **vsi; /* VSIs created by the driver */
371 struct ice_sw *first_sw; /* first switch created by firmware */
372 /* Virtchnl/SR-IOV config info */
374 int num_alloc_vfs; /* actual number of VFs allocated */
375 u16 num_vfs_supported; /* num VFs supported for this PF */
378 /* used to ratelimit the MDD event logging */
379 unsigned long last_printed_mdd_jiffies;
380 DECLARE_BITMAP(state, __ICE_STATE_NBITS);
381 DECLARE_BITMAP(flags, ICE_PF_FLAGS_NBITS);
382 unsigned long *avail_txqs; /* bitmap to track PF Tx queue usage */
383 unsigned long *avail_rxqs; /* bitmap to track PF Rx queue usage */
384 unsigned long serv_tmr_period;
385 unsigned long serv_tmr_prev;
386 struct timer_list serv_tmr;
387 struct work_struct serv_task;
388 struct mutex avail_q_mutex; /* protects access to avail_[rx|tx]qs */
389 struct mutex sw_mutex; /* lock for protecting VSI alloc flow */
390 struct mutex tc_mutex; /* lock to protect TC changes */
392 u32 hw_csum_rx_error;
393 u32 oicr_idx; /* Other interrupt cause MSIX vector index */
394 u32 num_avail_sw_msix; /* remaining MSIX SW vectors left unclaimed */
395 u16 max_pf_txqs; /* Total Tx queues PF wide */
396 u16 max_pf_rxqs; /* Total Rx queues PF wide */
397 u32 num_lan_msix; /* Total MSIX vectors for base driver */
398 u16 num_lan_tx; /* num LAN Tx queues setup */
399 u16 num_lan_rx; /* num LAN Rx queues setup */
400 u16 next_vsi; /* Next free slot in pf->vsi[] - 0-based! */
402 u16 corer_count; /* Core reset count */
403 u16 globr_count; /* Global reset count */
404 u16 empr_count; /* EMP reset count */
405 u16 pfr_count; /* PF reset count */
407 struct ice_hw_port_stats stats;
408 struct ice_hw_port_stats stats_prev;
410 u8 stat_prev_loaded:1; /* have previous stats been loaded */
413 #endif /* CONFIG_DCB */
414 u32 tx_timeout_count;
415 unsigned long tx_timeout_last_recovery;
416 u32 tx_timeout_recovery_level;
417 char int_name[ICE_INT_NAME_STR_LEN];
421 struct ice_netdev_priv {
426 * ice_irq_dynamic_ena - Enable default interrupt generation settings
427 * @hw: pointer to HW struct
428 * @vsi: pointer to VSI struct, can be NULL
429 * @q_vector: pointer to q_vector, can be NULL
432 ice_irq_dynamic_ena(struct ice_hw *hw, struct ice_vsi *vsi,
433 struct ice_q_vector *q_vector)
435 u32 vector = (vsi && q_vector) ? q_vector->reg_idx :
436 ((struct ice_pf *)hw->back)->oicr_idx;
437 int itr = ICE_ITR_NONE;
440 /* clear the PBA here, as this function is meant to clean out all
441 * previous interrupts and enable the interrupt
443 val = GLINT_DYN_CTL_INTENA_M | GLINT_DYN_CTL_CLEARPBA_M |
444 (itr << GLINT_DYN_CTL_ITR_INDX_S);
446 if (test_bit(__ICE_DOWN, vsi->state))
448 wr32(hw, GLINT_DYN_CTL(vector), val);
452 * ice_netdev_to_pf - Retrieve the PF struct associated with a netdev
453 * @netdev: pointer to the netdev struct
455 static inline struct ice_pf *ice_netdev_to_pf(struct net_device *netdev)
457 struct ice_netdev_priv *np = netdev_priv(netdev);
459 return np->vsi->back;
462 static inline bool ice_is_xdp_ena_vsi(struct ice_vsi *vsi)
464 return !!vsi->xdp_prog;
467 static inline void ice_set_ring_xdp(struct ice_ring *ring)
469 ring->flags |= ICE_TX_FLAGS_RING_XDP;
473 * ice_xsk_umem - get XDP UMEM bound to a ring
474 * @ring: ring to use
476 * Returns a pointer to xdp_umem structure if there is an UMEM present,
479 static inline struct xdp_umem *ice_xsk_umem(struct ice_ring *ring)
481 struct xdp_umem **umems = ring->vsi->xsk_umems;
482 u16 qid = ring->q_index;
484 if (ice_ring_is_xdp(ring))
485 qid -= ring->vsi->num_xdp_txq;
487 if (qid >= ring->vsi->num_xsk_umems || !umems || !umems[qid] ||
488 !ice_is_xdp_ena_vsi(ring->vsi))
495 * ice_get_main_vsi - Get the PF VSI
498 * returns pf->vsi[0], which by definition is the PF VSI
500 static inline struct ice_vsi *ice_get_main_vsi(struct ice_pf *pf)
508 int ice_vsi_setup_tx_rings(struct ice_vsi *vsi);
509 int ice_vsi_setup_rx_rings(struct ice_vsi *vsi);
510 void ice_set_ethtool_ops(struct net_device *netdev);
511 void ice_set_ethtool_safe_mode_ops(struct net_device *netdev);
512 u16 ice_get_avail_txq_count(struct ice_pf *pf);
513 u16 ice_get_avail_rxq_count(struct ice_pf *pf);
514 int ice_vsi_recfg_qs(struct ice_vsi *vsi, int new_rx, int new_tx);
515 void ice_update_vsi_stats(struct ice_vsi *vsi);
516 void ice_update_pf_stats(struct ice_pf *pf);
517 int ice_up(struct ice_vsi *vsi);
518 int ice_down(struct ice_vsi *vsi);
519 int ice_vsi_cfg(struct ice_vsi *vsi);
520 struct ice_vsi *ice_lb_vsi_setup(struct ice_pf *pf, struct ice_port_info *pi);
521 int ice_prepare_xdp_rings(struct ice_vsi *vsi, struct bpf_prog *prog);
522 int ice_destroy_xdp_rings(struct ice_vsi *vsi);
524 ice_xdp_xmit(struct net_device *dev, int n, struct xdp_frame **frames,
526 int ice_set_rss(struct ice_vsi *vsi, u8 *seed, u8 *lut, u16 lut_size);
527 int ice_get_rss(struct ice_vsi *vsi, u8 *seed, u8 *lut, u16 lut_size);
528 void ice_fill_rss_lut(u8 *lut, u16 rss_table_size, u16 rss_size);
529 int ice_schedule_reset(struct ice_pf *pf, enum ice_reset_req reset);
530 void ice_print_link_msg(struct ice_vsi *vsi, bool isup);
531 int ice_open(struct net_device *netdev);
532 int ice_stop(struct net_device *netdev);