1 /* SPDX-License-Identifier: GPL-2.0 */
2 /* Copyright (c) 2018, Intel Corporation. */
7 #include <linux/types.h>
8 #include <linux/errno.h>
9 #include <linux/kernel.h>
10 #include <linux/module.h>
11 #include <linux/firmware.h>
12 #include <linux/netdevice.h>
13 #include <linux/compiler.h>
14 #include <linux/etherdevice.h>
15 #include <linux/skbuff.h>
16 #include <linux/cpumask.h>
17 #include <linux/rtnetlink.h>
18 #include <linux/if_vlan.h>
19 #include <linux/dma-mapping.h>
20 #include <linux/pci.h>
21 #include <linux/workqueue.h>
22 #include <linux/aer.h>
23 #include <linux/interrupt.h>
24 #include <linux/ethtool.h>
25 #include <linux/timer.h>
26 #include <linux/delay.h>
27 #include <linux/bitmap.h>
28 #include <linux/log2.h>
30 #include <linux/sctp.h>
31 #include <linux/ipv6.h>
32 #include <linux/pkt_sched.h>
33 #include <linux/if_bridge.h>
34 #include <linux/ctype.h>
35 #include <linux/bpf.h>
36 #include <linux/avf/virtchnl.h>
38 #include <net/xdp_sock.h>
39 #include "ice_devids.h"
43 #include "ice_switch.h"
44 #include "ice_common.h"
45 #include "ice_sched.h"
46 #include "ice_virtchnl_pf.h"
47 #include "ice_sriov.h"
50 extern const char ice_drv_ver[];
/* Driver-wide scalar limits and defaults. Only relationships that are visible
 * in the definitions themselves are described below.
 */
52 #define ICE_REQ_DESC_MULTIPLE 32
53 #define ICE_MIN_NUM_DESC 64
54 #define ICE_MAX_NUM_DESC 8160
55 #define ICE_DFLT_MIN_RX_DESC 512
56 #define ICE_DFLT_NUM_TX_DESC 256
57 #define ICE_DFLT_NUM_RX_DESC 2048
59 #define ICE_DFLT_TRAFFIC_CLASS BIT(0)
/* IFNAMSIZ plus 16 extra bytes; sizes the name[] and int_name[] character
 * arrays declared further down in this header.
 */
60 #define ICE_INT_NAME_STR_LEN (IFNAMSIZ + 16)
62 #define ICE_MBXSQ_LEN 64
63 #define ICE_MBXRQ_LEN 512
64 #define ICE_MIN_MSIX 2
65 #define ICE_NO_VSI 0xffff
/* NOTE(review): presumably the values stored in the VSI *_mapping_mode
 * fields - confirm against the code that assigns them.
 */
66 #define ICE_VSI_MAP_CONTIG 0
67 #define ICE_VSI_MAP_SCATTER 1
68 #define ICE_MAX_SCATTER_TXQS 16
69 #define ICE_MAX_SCATTER_RXQS 16
70 #define ICE_Q_WAIT_RETRY_LIMIT 10
/* Five times ICE_Q_WAIT_RETRY_LIMIT, i.e. 50 */
71 #define ICE_Q_WAIT_MAX_RETRY (5 * ICE_Q_WAIT_RETRY_LIMIT)
72 #define ICE_MAX_LG_RSS_QS 256
73 #define ICE_MAX_SMALL_RSS_QS 8
74 #define ICE_RES_VALID_BIT 0x8000
/* One below ICE_RES_VALID_BIT, i.e. 0x7fff */
75 #define ICE_RES_MISC_VEC_ID (ICE_RES_VALID_BIT - 1)
76 #define ICE_INVAL_Q_INDEX 0xffff
77 #define ICE_INVAL_VFID 256
79 #define ICE_MAX_RESET_WAIT 20
/* (VSIQF_HKEY_MAX_INDEX + 1) multiplied by 4.
 * NOTE(review): presumably 4 bytes per hash-key register - confirm.
 */
81 #define ICE_VSIQF_HKEY_ARRAY_SIZE ((VSIQF_HKEY_MAX_INDEX + 1) * 4)
83 #define ICE_DFLT_NETIF_M (NETIF_MSG_DRV | NETIF_MSG_PROBE | NETIF_MSG_LINK)
/* ICE_AQ_SET_MAC_FRAME_SIZE_MAX minus ICE_ETH_PKT_HDR_PAD */
85 #define ICE_MAX_MTU (ICE_AQ_SET_MAC_FRAME_SIZE_MAX - ICE_ETH_PKT_HDR_PAD)
/* Position val in field UP<i>: shift it left by ICE_AQ_VSI_UP_TABLE_UP<i>_S
 * and mask the result with ICE_AQ_VSI_UP_TABLE_UP<i>_M. The i argument is
 * token-pasted into those macro names, so it must be written as the literal
 * token; it is not macro-expanded before pasting.
 */
87 #define ICE_UP_TABLE_TRANSLATE(val, i) \
88 (((val) << ICE_AQ_VSI_UP_TABLE_UP##i##_S) & \
89 ICE_AQ_VSI_UP_TABLE_UP##i##_M)
/* Typed descriptor accessors: cast (R)->desc to a pointer to the named
 * descriptor type and yield the address of element i of that array.
 */
91 #define ICE_TX_DESC(R, i) (&(((struct ice_tx_desc *)((R)->desc))[i]))
92 #define ICE_RX_DESC(R, i) (&(((union ice_32b_rx_flex_desc *)((R)->desc))[i]))
93 #define ICE_TX_CTX_DESC(R, i) (&(((struct ice_tx_ctx_desc *)((R)->desc))[i]))
95 /* Loop header over the VSIs of a PF: i runs from 0 up to, but not
 * including, (pf)->num_alloc_vsi. i must be an assignable variable supplied
 * by the caller; the statement following the macro is the loop body.
 */
96 #define ice_for_each_vsi(pf, i) \
97 for ((i) = 0; (i) < (pf)->num_alloc_vsi; (i)++)
99 /* Loop headers over the Tx/Rx rings of a VSI: i runs from 0 up to, but not
 * including, (vsi)->num_txq or (vsi)->num_rxq respectively. i must be an
 * assignable variable supplied by the caller.
 */
100 #define ice_for_each_txq(vsi, i) \
101 for ((i) = 0; (i) < (vsi)->num_txq; (i)++)
103 #define ice_for_each_rxq(vsi, i) \
104 for ((i) = 0; (i) < (vsi)->num_rxq; (i)++)
106 /* Loop headers over every allocated Tx/Rx ring of a VSI, whether used or
 * not: the bound is (vsi)->alloc_txq or (vsi)->alloc_rxq rather than the
 * num_txq/num_rxq counts. i must be an assignable variable supplied by the
 * caller.
 */
107 #define ice_for_each_alloc_txq(vsi, i) \
108 for ((i) = 0; (i) < (vsi)->alloc_txq; (i)++)
110 #define ice_for_each_alloc_rxq(vsi, i) \
111 for ((i) = 0; (i) < (vsi)->alloc_rxq; (i)++)
/* Loop header over the q_vectors of a VSI: i runs from 0 up to, but not
 * including, (vsi)->num_q_vectors. i must be an assignable variable supplied
 * by the caller.
 */
113 #define ice_for_each_q_vector(vsi, i) \
114 for ((i) = 0; (i) < (vsi)->num_q_vectors; (i)++)
/* Promiscuous-mode mask: OR of the unicast Tx/Rx flags. Despite the UCAST
 * name, the multicast Tx/Rx flags are included as well.
 */
116 #define ICE_UCAST_PROMISC_BITS (ICE_PROMISC_UCAST_TX | ICE_PROMISC_MCAST_TX | \
117 ICE_PROMISC_UCAST_RX | ICE_PROMISC_MCAST_RX)
119 #define ICE_UCAST_VLAN_PROMISC_BITS (ICE_PROMISC_UCAST_TX | \
120 ICE_PROMISC_MCAST_TX | \
121 ICE_PROMISC_UCAST_RX | \
122 ICE_PROMISC_MCAST_RX | \
123 ICE_PROMISC_VLAN_TX | \
/* Promiscuous-mode mask: OR of the multicast Tx and Rx flags only */
126 #define ICE_MCAST_PROMISC_BITS (ICE_PROMISC_MCAST_TX | ICE_PROMISC_MCAST_RX)
128 #define ICE_MCAST_VLAN_PROMISC_BITS (ICE_PROMISC_MCAST_TX | \
129 ICE_PROMISC_MCAST_RX | \
130 ICE_PROMISC_VLAN_TX | \
/* Yield the address of the dev member of the PF's PCI device (pf->pdev) */
133 #define ice_pf_to_dev(pf) (&((pf)->pdev->dev))
/* Identifiers describing a single Tx queue: its scheduler element, its
 * position in the owning VSI and the traffic class it belongs to.
 */
135 struct ice_txq_meta {
136 u32 q_teid; /* Tx-scheduler element identifier */
137 u16 q_id; /* Entry in VSI's txq_map array */
138 u16 q_handle; /* Relative index of Tx queue within TC */
139 u16 vsi_idx; /* VSI index that Tx queue belongs to */
140 u8 tc; /* TC number that Tx queue belongs to */
151 u8 numtc; /* Total number of enabled TCs */
152 u8 ena_tc; /* Tx map */
153 struct ice_tc_info tc_info[ICE_MAX_TRAFFIC_CLASS];
156 struct ice_res_tracker {
163 struct mutex *qs_mutex; /* will be assigned to &pf->avail_q_mutex */
164 unsigned long *pf_map;
165 unsigned long pf_map_size;
166 unsigned int q_count;
167 unsigned int scatter_count;
175 u16 sw_id; /* switch ID for this switch */
176 u16 bridge_mode; /* VEB/VEPA/Port Virtualizer */
177 struct ice_vsi *dflt_vsi; /* default VSI for this switch */
178 u8 dflt_vsi_ena:1; /* true if above dflt_vsi is enabled */
185 __ICE_PREPARED_FOR_RESET, /* set by driver when prepared */
186 __ICE_RESET_OICR_RECV, /* set by driver after rcv reset OICR */
187 __ICE_DCBNL_DEVRESET, /* set by dcbnl devreset */
188 __ICE_PFR_REQ, /* set by driver and peers */
189 __ICE_CORER_REQ, /* set by driver and peers */
190 __ICE_GLOBR_REQ, /* set by driver and peers */
191 __ICE_CORER_RECV, /* set by OICR handler */
192 __ICE_GLOBR_RECV, /* set by OICR handler */
193 __ICE_EMPR_RECV, /* set by OICR handler */
194 __ICE_SUSPENDED, /* set on module remove path */
195 __ICE_RESET_FAILED, /* set by reset/rebuild */
196 /* When checking for the PF to be in a nominal operating state, the
197 * bits that are grouped at the beginning of the list need to be
198 * checked. Bits occurring before __ICE_STATE_NOMINAL_CHECK_BITS will
199 * be checked. If you need to add a bit into consideration for nominal
200 * operating state, it must be added before
201 * __ICE_STATE_NOMINAL_CHECK_BITS. Do not move this entry's position
202 * without appropriate consideration.
204 __ICE_STATE_NOMINAL_CHECK_BITS,
205 __ICE_ADMINQ_EVENT_PENDING,
206 __ICE_MAILBOXQ_EVENT_PENDING,
207 __ICE_MDD_EVENT_PENDING,
208 __ICE_VFLR_EVENT_PENDING,
209 __ICE_FLTR_OVERFLOW_PROMISC,
214 __ICE_OICR_INTR_DIS, /* Global OICR interrupt disabled */
215 __ICE_STATE_NBITS /* must be last */
219 ICE_VSI_FLAG_UMAC_FLTR_CHANGED,
220 ICE_VSI_FLAG_MMAC_FLTR_CHANGED,
221 ICE_VSI_FLAG_VLAN_FLTR_CHANGED,
222 ICE_VSI_FLAG_PROMISC_CHANGED,
223 ICE_VSI_FLAG_NBITS /* must be last */
226 /* struct that defines a VSI, associated with a dev */
228 struct net_device *netdev;
229 struct ice_sw *vsw; /* switch this VSI is on */
230 struct ice_pf *back; /* back pointer to PF */
231 struct ice_port_info *port_info; /* back pointer to port_info */
232 struct ice_ring **rx_rings; /* Rx ring array */
233 struct ice_ring **tx_rings; /* Tx ring array */
234 struct ice_q_vector **q_vectors; /* q_vector array */
236 irqreturn_t (*irq_handler)(int irq, void *data);
239 DECLARE_BITMAP(state, __ICE_STATE_NBITS);
240 DECLARE_BITMAP(flags, ICE_VSI_FLAG_NBITS);
241 unsigned int current_netdev_flags;
247 int base_vector; /* IRQ base for OS reserved vectors */
248 enum ice_vsi_type type;
249 u16 vsi_num; /* HW (absolute) index of this VSI */
250 u16 idx; /* software index in pf->vsi[] */
252 s16 vf_id; /* VF ID for SR-IOV VSIs */
254 u16 ethtype; /* Ethernet protocol for pause frame */
257 u16 rss_table_size; /* HW RSS table size */
258 u16 rss_size; /* Allocated RSS queues */
259 u8 *rss_hkey_user; /* User configured hash keys */
260 u8 *rss_lut_user; /* User configured lookup table entries */
261 u8 rss_lut_type; /* used to configure Get/Set RSS LUT AQ call */
266 struct ice_aqc_vsi_props info; /* VSI properties */
269 struct rtnl_link_stats64 net_stats;
270 struct ice_eth_stats eth_stats;
271 struct ice_eth_stats eth_stats_prev;
273 struct list_head tmp_sync_list; /* MAC filters to be synced */
274 struct list_head tmp_unsync_list; /* MAC filters to be unsynced */
277 u8 current_isup:1; /* Sync 'link up' logging */
278 u8 stat_offsets_loaded:1;
282 /* queue information */
283 u8 tx_mapping_mode; /* ICE_VSI_MAP_[CONTIG|SCATTER] */
284 u8 rx_mapping_mode; /* ICE_VSI_MAP_[CONTIG|SCATTER] */
285 u16 *txq_map; /* index in pf->avail_txqs */
286 u16 *rxq_map; /* index in pf->avail_rxqs */
287 u16 alloc_txq; /* Allocated Tx queues */
288 u16 num_txq; /* Used Tx queues */
289 u16 alloc_rxq; /* Allocated Rx queues */
290 u16 num_rxq; /* Used Rx queues */
291 u16 req_txq; /* User requested Tx queues */
292 u16 req_rxq; /* User requested Rx queues */
295 struct ice_tc_cfg tc_cfg;
296 struct bpf_prog *xdp_prog; /* non-NULL is what ice_is_xdp_ena_vsi() tests */
297 struct ice_ring **xdp_rings; /* XDP ring array */
298 u16 num_xdp_txq; /* Used XDP queues */
299 u8 xdp_mapping_mode; /* ICE_VSI_MAP_[CONTIG|SCATTER] */
300 struct xdp_umem **xsk_umems; /* indexed by queue id in ice_xsk_umem() */
301 u16 num_xsk_umems_used;
303 } ____cacheline_internodealigned_in_smp;
305 /* struct that defines an interrupt vector */
306 struct ice_q_vector {
309 u16 v_idx; /* index in the vsi->q_vectors array */
311 u8 num_ring_rx; /* total number of Rx rings in vector */
312 u8 num_ring_tx; /* total number of Tx rings in vector */
313 u8 itr_countdown; /* when 0 should adjust adaptive ITR */
314 /* in usecs, need to use ice_intrl_to_usecs_reg() before writing this
315 * value to the device
319 struct napi_struct napi;
321 struct ice_ring_container rx;
322 struct ice_ring_container tx;
324 cpumask_t affinity_mask;
325 struct irq_affinity_notify affinity_notify;
327 char name[ICE_INT_NAME_STR_LEN];
328 } ____cacheline_internodealigned_in_smp;
334 ICE_FLAG_SRIOV_CAPABLE,
335 ICE_FLAG_DCB_CAPABLE,
337 ICE_FLAG_ADV_FEATURES,
338 ICE_FLAG_LINK_DOWN_ON_CLOSE_ENA,
340 ICE_FLAG_FW_LLDP_AGENT,
341 ICE_FLAG_ETHTOOL_CTXT, /* set when ethtool holds RTNL lock */
343 ICE_PF_FLAGS_NBITS /* must be last */
347 struct pci_dev *pdev;
349 /* OS reserved IRQ details */
350 struct msix_entry *msix_entries;
351 struct ice_res_tracker *irq_tracker;
352 /* First MSIX vector used by SR-IOV VFs. Calculated by subtracting the
353 * number of MSIX vectors needed for all SR-IOV VFs from the number of
354 * MSIX vectors allowed on this PF.
356 u16 sriov_base_vector;
358 struct ice_vsi **vsi; /* VSIs created by the driver */
359 struct ice_sw *first_sw; /* first switch created by firmware */
360 /* Virtchnl/SR-IOV config info */
362 int num_alloc_vfs; /* actual number of VFs allocated */
363 u16 num_vfs_supported; /* num VFs supported for this PF */
364 u16 num_vf_qps; /* num queue pairs per VF */
365 u16 num_vf_msix; /* num vectors per VF */
366 DECLARE_BITMAP(state, __ICE_STATE_NBITS);
367 DECLARE_BITMAP(flags, ICE_PF_FLAGS_NBITS);
368 unsigned long *avail_txqs; /* bitmap to track PF Tx queue usage */
369 unsigned long *avail_rxqs; /* bitmap to track PF Rx queue usage */
370 unsigned long serv_tmr_period;
371 unsigned long serv_tmr_prev;
372 struct timer_list serv_tmr;
373 struct work_struct serv_task;
374 struct mutex avail_q_mutex; /* protects access to avail_[rx|tx]qs */
375 struct mutex sw_mutex; /* lock for protecting VSI alloc flow */
376 struct mutex tc_mutex; /* lock to protect TC changes */
378 u32 hw_csum_rx_error;
379 u32 oicr_idx; /* Other interrupt cause MSIX vector index */
380 u32 num_avail_sw_msix; /* remaining MSIX SW vectors left unclaimed */
381 u16 max_pf_txqs; /* Total Tx queues PF wide */
382 u16 max_pf_rxqs; /* Total Rx queues PF wide */
383 u32 num_lan_msix; /* Total MSIX vectors for base driver */
384 u16 num_lan_tx; /* num LAN Tx queues setup */
385 u16 num_lan_rx; /* num LAN Rx queues setup */
386 u16 next_vsi; /* Next free slot in pf->vsi[] - 0-based! */
388 u16 corer_count; /* Core reset count */
389 u16 globr_count; /* Global reset count */
390 u16 empr_count; /* EMP reset count */
391 u16 pfr_count; /* PF reset count */
393 struct ice_hw_port_stats stats;
394 struct ice_hw_port_stats stats_prev;
396 u8 stat_prev_loaded:1; /* has previous stats been loaded */
399 #endif /* CONFIG_DCB */
400 u32 tx_timeout_count;
401 unsigned long tx_timeout_last_recovery;
402 u32 tx_timeout_recovery_level;
403 char int_name[ICE_INT_NAME_STR_LEN];
407 struct ice_netdev_priv {
412 * ice_irq_dynamic_ena - Enable default interrupt generation settings
413 * @hw: pointer to HW struct
414 * @vsi: pointer to VSI struct, can be NULL
415 * @q_vector: pointer to q_vector, can be NULL
418 ice_irq_dynamic_ena(struct ice_hw *hw, struct ice_vsi *vsi,
419 struct ice_q_vector *q_vector)
421 u32 vector = (vsi && q_vector) ? q_vector->reg_idx :
422 ((struct ice_pf *)hw->back)->oicr_idx;
423 int itr = ICE_ITR_NONE;
426 /* clear the PBA here, as this function is meant to clean out all
427 * previous interrupts and enable the interrupt
429 val = GLINT_DYN_CTL_INTENA_M | GLINT_DYN_CTL_CLEARPBA_M |
430 (itr << GLINT_DYN_CTL_ITR_INDX_S);
432 if (test_bit(__ICE_DOWN, vsi->state))
434 wr32(hw, GLINT_DYN_CTL(vector), val);
438 * ice_netdev_to_pf - Retrieve the PF struct associated with a netdev
439 * @netdev: pointer to the netdev struct
441 static inline struct ice_pf *ice_netdev_to_pf(struct net_device *netdev)
443 struct ice_netdev_priv *np = netdev_priv(netdev);
/* the netdev private data references the VSI, whose back pointer is the PF */
445 return np->vsi->back;
/* Return true when vsi->xdp_prog is non-NULL, false otherwise */
448 static inline bool ice_is_xdp_ena_vsi(struct ice_vsi *vsi)
450 return !!vsi->xdp_prog;
/* Mark a ring as an XDP ring by setting ICE_TX_FLAGS_RING_XDP in ring->flags;
 * other flag bits are left as they were.
 */
453 static inline void ice_set_ring_xdp(struct ice_ring *ring)
455 ring->flags |= ICE_TX_FLAGS_RING_XDP;
459 * ice_xsk_umem - get XDP UMEM bound to a ring
460 * @ring: ring to use
462 * Returns a pointer to xdp_umem structure if there is a UMEM present,
465 static inline struct xdp_umem *ice_xsk_umem(struct ice_ring *ring)
467 struct xdp_umem **umems = ring->vsi->xsk_umems;
468 int qid = ring->q_index;
470 if (ice_ring_is_xdp(ring))
471 qid -= ring->vsi->num_xdp_txq;
473 if (!umems || !umems[qid] || !ice_is_xdp_ena_vsi(ring->vsi))
480 * ice_get_main_vsi - Get the PF VSI
483 * returns pf->vsi[0], which by definition is the PF VSI
485 static inline struct ice_vsi *ice_get_main_vsi(struct ice_pf *pf)
493 int ice_vsi_setup_tx_rings(struct ice_vsi *vsi);
494 int ice_vsi_setup_rx_rings(struct ice_vsi *vsi);
495 void ice_set_ethtool_ops(struct net_device *netdev);
496 void ice_set_ethtool_safe_mode_ops(struct net_device *netdev);
497 u16 ice_get_avail_txq_count(struct ice_pf *pf);
498 u16 ice_get_avail_rxq_count(struct ice_pf *pf);
499 int ice_vsi_recfg_qs(struct ice_vsi *vsi, int new_rx, int new_tx);
500 void ice_update_vsi_stats(struct ice_vsi *vsi);
501 void ice_update_pf_stats(struct ice_pf *pf);
502 int ice_up(struct ice_vsi *vsi);
503 int ice_down(struct ice_vsi *vsi);
504 int ice_vsi_cfg(struct ice_vsi *vsi);
505 struct ice_vsi *ice_lb_vsi_setup(struct ice_pf *pf, struct ice_port_info *pi);
506 int ice_prepare_xdp_rings(struct ice_vsi *vsi, struct bpf_prog *prog);
507 int ice_destroy_xdp_rings(struct ice_vsi *vsi);
509 ice_xdp_xmit(struct net_device *dev, int n, struct xdp_frame **frames,
511 int ice_set_rss(struct ice_vsi *vsi, u8 *seed, u8 *lut, u16 lut_size);
512 int ice_get_rss(struct ice_vsi *vsi, u8 *seed, u8 *lut, u16 lut_size);
513 void ice_fill_rss_lut(u8 *lut, u16 rss_table_size, u16 rss_size);
514 int ice_schedule_reset(struct ice_pf *pf, enum ice_reset_req reset);
515 void ice_print_link_msg(struct ice_vsi *vsi, bool isup);
516 int ice_open(struct net_device *netdev);
517 int ice_stop(struct net_device *netdev);