1 /* SPDX-License-Identifier: GPL-2.0 */
2 /* Copyright (c) 2018, Intel Corporation. */
7 #include <linux/types.h>
8 #include <linux/errno.h>
9 #include <linux/kernel.h>
10 #include <linux/module.h>
11 #include <linux/firmware.h>
12 #include <linux/netdevice.h>
13 #include <linux/compiler.h>
14 #include <linux/etherdevice.h>
15 #include <linux/skbuff.h>
16 #include <linux/cpumask.h>
17 #include <linux/rtnetlink.h>
18 #include <linux/if_vlan.h>
19 #include <linux/dma-mapping.h>
20 #include <linux/pci.h>
21 #include <linux/workqueue.h>
22 #include <linux/aer.h>
23 #include <linux/interrupt.h>
24 #include <linux/ethtool.h>
25 #include <linux/timer.h>
26 #include <linux/delay.h>
27 #include <linux/bitmap.h>
28 #include <linux/log2.h>
30 #include <linux/sctp.h>
31 #include <linux/ipv6.h>
32 #include <linux/pkt_sched.h>
33 #include <linux/if_bridge.h>
34 #include <linux/ctype.h>
35 #include <linux/bpf.h>
36 #include <linux/avf/virtchnl.h>
38 #include <net/xdp_sock.h>
39 #include "ice_devids.h"
43 #include "ice_switch.h"
44 #include "ice_common.h"
45 #include "ice_sched.h"
46 #include "ice_virtchnl_pf.h"
47 #include "ice_sriov.h"
50 extern const char ice_drv_ver[];
/* Descriptor-count multiple, limits and defaults (going by the names; confirm
 * at the users). Both limits are multiples of ICE_REQ_DESC_MULTIPLE:
 * 64 = 2 * 32 and 8160 = 255 * 32.
 */
52 #define ICE_REQ_DESC_MULTIPLE 32
53 #define ICE_MIN_NUM_DESC 64
54 #define ICE_MAX_NUM_DESC 8160
55 #define ICE_DFLT_MIN_RX_DESC 512
56 #define ICE_DFLT_NUM_TX_DESC 256
57 #define ICE_DFLT_NUM_RX_DESC 2048
/* Default traffic class mask: only bit 0 is set */
59 #define ICE_DFLT_TRAFFIC_CLASS BIT(0)
/* Size of the interrupt name buffers in this file: IFNAMSIZ plus 16 bytes */
60 #define ICE_INT_NAME_STR_LEN (IFNAMSIZ + 16)
/* Mailbox send / receive queue lengths (by name; units not shown here) */
62 #define ICE_MBXSQ_LEN 64
63 #define ICE_MBXRQ_LEN 512
64 #define ICE_MIN_MSIX 2
65 #define ICE_NO_VSI 0xffff
66 #define ICE_VSI_MAP_CONTIG 0
67 #define ICE_VSI_MAP_SCATTER 1
68 #define ICE_MAX_SCATTER_TXQS 16
69 #define ICE_MAX_SCATTER_RXQS 16
/* ICE_Q_WAIT_MAX_RETRY evaluates to 5 * 10 = 50 */
70 #define ICE_Q_WAIT_RETRY_LIMIT 10
71 #define ICE_Q_WAIT_MAX_RETRY (5 * ICE_Q_WAIT_RETRY_LIMIT)
72 #define ICE_MAX_LG_RSS_QS 256
73 #define ICE_MAX_SMALL_RSS_QS 8
/* ICE_RES_MISC_VEC_ID evaluates to 0x8000 - 1 = 0x7fff */
74 #define ICE_RES_VALID_BIT 0x8000
75 #define ICE_RES_MISC_VEC_ID (ICE_RES_VALID_BIT - 1)
76 #define ICE_INVAL_Q_INDEX 0xffff
77 #define ICE_INVAL_VFID 256
79 #define ICE_MAX_RESET_WAIT 20
/* (highest HKEY index + 1) * 4; presumably 4 bytes per entry - confirm */
81 #define ICE_VSIQF_HKEY_ARRAY_SIZE ((VSIQF_HKEY_MAX_INDEX + 1) * 4)
/* Default netif message mask: driver, probe and link messages */
83 #define ICE_DFLT_NETIF_M (NETIF_MSG_DRV | NETIF_MSG_PROBE | NETIF_MSG_LINK)
/* Largest MTU: maximum MAC frame size less the Ethernet header padding */
85 #define ICE_MAX_MTU (ICE_AQ_SET_MAC_FRAME_SIZE_MAX - ICE_ETH_PKT_HDR_PAD)
/* Shift val into position with ICE_AQ_VSI_UP_TABLE_UP<i>_S and mask the
 * result with ICE_AQ_VSI_UP_TABLE_UP<i>_M. The argument i is token-pasted
 * into those two names, so it must be a literal token, not an expression.
 */
87 #define ICE_UP_TABLE_TRANSLATE(val, i) \
88 (((val) << ICE_AQ_VSI_UP_TABLE_UP##i##_S) & \
89 ICE_AQ_VSI_UP_TABLE_UP##i##_M)
/* Return a pointer to descriptor i of ring R, treating (R)->desc as an array
 * of the named descriptor type. The index i is not range-checked.
 */
91 #define ICE_TX_DESC(R, i) (&(((struct ice_tx_desc *)((R)->desc))[i]))
92 #define ICE_RX_DESC(R, i) (&(((union ice_32b_rx_flex_desc *)((R)->desc))[i]))
93 #define ICE_TX_CTX_DESC(R, i) (&(((struct ice_tx_ctx_desc *)((R)->desc))[i]))
95 /* Loop header that steps (i) over 0 .. (pf)->num_alloc_vsi - 1, one value
 * per allocated VSI slot of the PF. (i) is evaluated several times, so pass
 * a plain lvalue.
 */
96 #define ice_for_each_vsi(pf, i) \
97 for ((i) = 0; (i) < (pf)->num_alloc_vsi; (i)++)
99 /* Loop headers that step (i) over the Tx or Rx queue indices of a VSI,
 * bounded by (vsi)->num_txq and (vsi)->num_rxq respectively. (i) is
 * evaluated several times, so pass a plain lvalue.
 */
100 #define ice_for_each_txq(vsi, i) \
101 for ((i) = 0; (i) < (vsi)->num_txq; (i)++)
103 #define ice_for_each_rxq(vsi, i) \
104 for ((i) = 0; (i) < (vsi)->num_rxq; (i)++)
106 /* Loop headers that step (i) over every allocated Tx or Rx queue index of
 * a VSI, whether used or not: the bound is (vsi)->alloc_txq or
 * (vsi)->alloc_rxq rather than num_txq / num_rxq.
 */
107 #define ice_for_each_alloc_txq(vsi, i) \
108 for ((i) = 0; (i) < (vsi)->alloc_txq; (i)++)
110 #define ice_for_each_alloc_rxq(vsi, i) \
111 for ((i) = 0; (i) < (vsi)->alloc_rxq; (i)++)
/* Loop header that steps (i) over 0 .. (vsi)->num_q_vectors - 1 */
113 #define ice_for_each_q_vector(vsi, i) \
114 for ((i) = 0; (i) < (vsi)->num_q_vectors; (i)++)
/* Bit mask named for unicast promiscuous mode. As defined it ORs the
 * multicast Tx/Rx bits together with the unicast Tx/Rx bits.
 */
116 #define ICE_UCAST_PROMISC_BITS (ICE_PROMISC_UCAST_TX | ICE_PROMISC_MCAST_TX | \
117 ICE_PROMISC_UCAST_RX | ICE_PROMISC_MCAST_RX)
119 #define ICE_UCAST_VLAN_PROMISC_BITS (ICE_PROMISC_UCAST_TX | \
120 ICE_PROMISC_MCAST_TX | \
121 ICE_PROMISC_UCAST_RX | \
122 ICE_PROMISC_MCAST_RX | \
123 ICE_PROMISC_VLAN_TX | \
126 #define ICE_MCAST_PROMISC_BITS (ICE_PROMISC_MCAST_TX | ICE_PROMISC_MCAST_RX) /* multicast Tx and Rx promiscuous bits */
128 #define ICE_MCAST_VLAN_PROMISC_BITS (ICE_PROMISC_MCAST_TX | \
129 ICE_PROMISC_MCAST_RX | \
130 ICE_PROMISC_VLAN_TX | \
133 #define ice_pf_to_dev(pf) (&((pf)->pdev->dev)) /* address of the dev member of the PF's pci_dev */
135 struct ice_txq_meta {
136 u32 q_teid; /* Tx-scheduler element identifier */
137 u16 q_id; /* Entry in VSI's txq_map bitmap */
138 u16 q_handle; /* Relative index of Tx queue within TC */
139 u16 vsi_idx; /* VSI index that Tx queue belongs to */
140 u8 tc; /* TC number that Tx queue belongs to */
151 u8 numtc; /* Total number of enabled TCs */
152 u8 ena_tc; /* Tx map */
153 struct ice_tc_info tc_info[ICE_MAX_TRAFFIC_CLASS];
156 struct ice_res_tracker {
163 struct mutex *qs_mutex; /* will be assigned to &pf->avail_q_mutex */
164 unsigned long *pf_map;
165 unsigned long pf_map_size;
166 unsigned int q_count;
167 unsigned int scatter_count;
175 u16 sw_id; /* switch ID for this switch */
176 u16 bridge_mode; /* VEB/VEPA/Port Virtualizer */
183 __ICE_PREPARED_FOR_RESET, /* set by driver when prepared */
184 __ICE_RESET_OICR_RECV, /* set by driver after rcv reset OICR */
185 __ICE_DCBNL_DEVRESET, /* set by dcbnl devreset */
186 __ICE_PFR_REQ, /* set by driver and peers */
187 __ICE_CORER_REQ, /* set by driver and peers */
188 __ICE_GLOBR_REQ, /* set by driver and peers */
189 __ICE_CORER_RECV, /* set by OICR handler */
190 __ICE_GLOBR_RECV, /* set by OICR handler */
191 __ICE_EMPR_RECV, /* set by OICR handler */
192 __ICE_SUSPENDED, /* set on module remove path */
193 __ICE_RESET_FAILED, /* set by reset/rebuild */
194 /* When checking for the PF to be in a nominal operating state, the
195 * bits that are grouped at the beginning of the list need to be
196 * checked. Bits occurring before __ICE_STATE_NOMINAL_CHECK_BITS will
197 * be checked. If you need to add a bit into consideration for nominal
198 * operating state, it must be added before
199 * __ICE_STATE_NOMINAL_CHECK_BITS. Do not move this entry's position
200 * without appropriate consideration.
202 __ICE_STATE_NOMINAL_CHECK_BITS,
203 __ICE_ADMINQ_EVENT_PENDING,
204 __ICE_MAILBOXQ_EVENT_PENDING,
205 __ICE_MDD_EVENT_PENDING,
206 __ICE_VFLR_EVENT_PENDING,
207 __ICE_FLTR_OVERFLOW_PROMISC,
212 __ICE_OICR_INTR_DIS, /* Global OICR interrupt disabled */
213 __ICE_STATE_NBITS /* must be last */
217 ICE_VSI_FLAG_UMAC_FLTR_CHANGED,
218 ICE_VSI_FLAG_MMAC_FLTR_CHANGED,
219 ICE_VSI_FLAG_VLAN_FLTR_CHANGED,
220 ICE_VSI_FLAG_PROMISC_CHANGED,
221 ICE_VSI_FLAG_NBITS /* must be last */
224 /* struct that defines a VSI, associated with a dev */
226 struct net_device *netdev;
227 struct ice_sw *vsw; /* switch this VSI is on */
228 struct ice_pf *back; /* back pointer to PF */
229 struct ice_port_info *port_info; /* back pointer to port_info */
230 struct ice_ring **rx_rings; /* Rx ring array */
231 struct ice_ring **tx_rings; /* Tx ring array */
232 struct ice_q_vector **q_vectors; /* q_vector array */
234 irqreturn_t (*irq_handler)(int irq, void *data);
237 DECLARE_BITMAP(state, __ICE_STATE_NBITS);
238 DECLARE_BITMAP(flags, ICE_VSI_FLAG_NBITS);
239 unsigned int current_netdev_flags;
245 int base_vector; /* IRQ base for OS reserved vectors */
246 enum ice_vsi_type type;
247 u16 vsi_num; /* HW (absolute) index of this VSI */
248 u16 idx; /* software index in pf->vsi[] */
250 s16 vf_id; /* VF ID for SR-IOV VSIs */
252 u16 ethtype; /* Ethernet protocol for pause frame */
255 u16 rss_table_size; /* HW RSS table size */
256 u16 rss_size; /* Allocated RSS queues */
257 u8 *rss_hkey_user; /* User configured hash keys */
258 u8 *rss_lut_user; /* User configured lookup table entries */
259 u8 rss_lut_type; /* used to configure Get/Set RSS LUT AQ call */
264 struct ice_aqc_vsi_props info; /* VSI properties */
267 struct rtnl_link_stats64 net_stats;
268 struct ice_eth_stats eth_stats;
269 struct ice_eth_stats eth_stats_prev;
271 struct list_head tmp_sync_list; /* MAC filters to be synced */
272 struct list_head tmp_unsync_list; /* MAC filters to be unsynced */
275 u8 current_isup:1; /* Sync 'link up' logging */
276 u8 stat_offsets_loaded:1;
279 /* queue information */
280 u8 tx_mapping_mode; /* ICE_MAP_MODE_[CONTIG|SCATTER] */
281 u8 rx_mapping_mode; /* ICE_MAP_MODE_[CONTIG|SCATTER] */
282 u16 *txq_map; /* index in pf->avail_txqs */
283 u16 *rxq_map; /* index in pf->avail_rxqs */
284 u16 alloc_txq; /* Allocated Tx queues */
285 u16 num_txq; /* Used Tx queues */
286 u16 alloc_rxq; /* Allocated Rx queues */
287 u16 num_rxq; /* Used Rx queues */
288 u16 req_txq; /* User requested Tx queues */
289 u16 req_rxq; /* User requested Rx queues */
292 struct ice_tc_cfg tc_cfg;
293 struct bpf_prog *xdp_prog;
294 struct ice_ring **xdp_rings; /* XDP ring array */
295 u16 num_xdp_txq; /* Used XDP queues */
296 u8 xdp_mapping_mode; /* ICE_MAP_MODE_[CONTIG|SCATTER] */
297 struct xdp_umem **xsk_umems;
298 u16 num_xsk_umems_used;
300 } ____cacheline_internodealigned_in_smp;
302 /* struct that defines an interrupt vector: its index, Rx/Tx ring counts,
 * NAPI context, Rx and Tx ring containers, IRQ affinity data and name
 * string. The type carries ____cacheline_internodealigned_in_smp.
 */
303 struct ice_q_vector {
306 u16 v_idx; /* index in the vsi->q_vectors array */
308 u8 num_ring_rx; /* total number of Rx rings in vector */
309 u8 num_ring_tx; /* total number of Tx rings in vector */
310 u8 itr_countdown; /* when 0 should adjust adaptive ITR */
311 /* in usecs, need to use ice_intrl_to_usecs_reg() before writing this
312 * value to the device
316 struct napi_struct napi;
318 struct ice_ring_container rx;
319 struct ice_ring_container tx;
321 cpumask_t affinity_mask;
322 struct irq_affinity_notify affinity_notify;
324 char name[ICE_INT_NAME_STR_LEN];
325 } ____cacheline_internodealigned_in_smp;
331 ICE_FLAG_SRIOV_CAPABLE,
332 ICE_FLAG_DCB_CAPABLE,
334 ICE_FLAG_ADV_FEATURES,
335 ICE_FLAG_LINK_DOWN_ON_CLOSE_ENA,
337 ICE_FLAG_FW_LLDP_AGENT,
338 ICE_FLAG_ETHTOOL_CTXT, /* set when ethtool holds RTNL lock */
340 ICE_PF_FLAGS_NBITS /* must be last */
344 struct pci_dev *pdev;
346 /* OS reserved IRQ details */
347 struct msix_entry *msix_entries;
348 struct ice_res_tracker *irq_tracker;
349 /* First MSIX vector used by SR-IOV VFs. Calculated by subtracting the
350 * number of MSIX vectors needed for all SR-IOV VFs from the number of
351 * MSIX vectors allowed on this PF.
353 u16 sriov_base_vector;
355 struct ice_vsi **vsi; /* VSIs created by the driver */
356 struct ice_sw *first_sw; /* first switch created by firmware */
357 /* Virtchnl/SR-IOV config info */
359 int num_alloc_vfs; /* actual number of VFs allocated */
360 u16 num_vfs_supported; /* num VFs supported for this PF */
361 u16 num_vf_qps; /* num queue pairs per VF */
362 u16 num_vf_msix; /* num vectors per VF */
363 DECLARE_BITMAP(state, __ICE_STATE_NBITS);
364 DECLARE_BITMAP(flags, ICE_PF_FLAGS_NBITS);
365 unsigned long *avail_txqs; /* bitmap to track PF Tx queue usage */
366 unsigned long *avail_rxqs; /* bitmap to track PF Rx queue usage */
367 unsigned long serv_tmr_period;
368 unsigned long serv_tmr_prev;
369 struct timer_list serv_tmr;
370 struct work_struct serv_task;
371 struct mutex avail_q_mutex; /* protects access to avail_[rx|tx]qs */
372 struct mutex sw_mutex; /* lock for protecting VSI alloc flow */
373 struct mutex tc_mutex; /* lock to protect TC changes */
375 u32 hw_csum_rx_error;
376 u32 oicr_idx; /* Other interrupt cause MSIX vector index */
377 u32 num_avail_sw_msix; /* remaining MSIX SW vectors left unclaimed */
378 u16 max_pf_txqs; /* Total Tx queues PF wide */
379 u16 max_pf_rxqs; /* Total Rx queues PF wide */
380 u32 num_lan_msix; /* Total MSIX vectors for base driver */
381 u16 num_lan_tx; /* num LAN Tx queues setup */
382 u16 num_lan_rx; /* num LAN Rx queues setup */
383 u16 next_vsi; /* Next free slot in pf->vsi[] - 0-based! */
385 u16 corer_count; /* Core reset count */
386 u16 globr_count; /* Global reset count */
387 u16 empr_count; /* EMP reset count */
388 u16 pfr_count; /* PF reset count */
390 struct ice_hw_port_stats stats;
391 struct ice_hw_port_stats stats_prev;
393 u8 stat_prev_loaded:1; /* has previous stats been loaded */
396 #endif /* CONFIG_DCB */
397 u32 tx_timeout_count;
398 unsigned long tx_timeout_last_recovery;
399 u32 tx_timeout_recovery_level;
400 char int_name[ICE_INT_NAME_STR_LEN];
404 struct ice_netdev_priv {
409 * ice_irq_dynamic_ena - Enable default interrupt generation settings
410 * @hw: pointer to HW struct
411 * @vsi: pointer to VSI struct, can be NULL
412 * @q_vector: pointer to q_vector, can be NULL
415 ice_irq_dynamic_ena(struct ice_hw *hw, struct ice_vsi *vsi,
416 struct ice_q_vector *q_vector)
/* Use the queue vector's register index only when both vsi and q_vector are
 * supplied; otherwise fall back to the PF's OICR vector index.
 */
418 u32 vector = (vsi && q_vector) ? q_vector->reg_idx :
419 ((struct ice_pf *)hw->back)->oicr_idx;
/* ITR index that is shifted into the ITR_INDX field of the value written to
 * GLINT_DYN_CTL below.
 */
420 int itr = ICE_ITR_NONE;
/* NOTE(review): the test_bit(__ICE_DOWN, vsi->state) check further down
 * dereferences vsi, yet @vsi is documented as possibly NULL; confirm that a
 * NULL guard precedes that check in the complete source.
 */
423 /* clear the PBA here, as this function is meant to clean out all
424 * previous interrupts and enable the interrupt
426 val = GLINT_DYN_CTL_INTENA_M | GLINT_DYN_CTL_CLEARPBA_M |
427 (itr << GLINT_DYN_CTL_ITR_INDX_S);
429 if (test_bit(__ICE_DOWN, vsi->state))
431 wr32(hw, GLINT_DYN_CTL(vector), val);
435 * ice_netdev_to_pf - Retrieve the PF struct associated with a netdev
436 * @netdev: pointer to the netdev struct
438 static inline struct ice_pf *ice_netdev_to_pf(struct net_device *netdev)
/* The netdev private area is read as a struct ice_netdev_priv */
440 struct ice_netdev_priv *np = netdev_priv(netdev);
/* Follow the VSI's back pointer to reach the PF; neither np->vsi nor the
 * back pointer is checked for NULL here.
 */
442 return np->vsi->back;
/**
 * ice_is_xdp_ena_vsi - check whether an XDP program is attached to a VSI
 * @vsi: pointer to the VSI to check, must not be NULL
 *
 * Returns true when vsi->xdp_prog is non-NULL, false otherwise.
 */
445 static inline bool ice_is_xdp_ena_vsi(struct ice_vsi *vsi)
447 return !!vsi->xdp_prog;
/**
 * ice_set_ring_xdp - mark a ring as an XDP ring
 * @ring: ring to mark, must not be NULL
 *
 * Sets ICE_TX_FLAGS_RING_XDP in ring->flags; other flag bits are untouched.
 */
450 static inline void ice_set_ring_xdp(struct ice_ring *ring)
452 ring->flags |= ICE_TX_FLAGS_RING_XDP;
456 * ice_xsk_umem - get XDP UMEM bound to a ring
457 * @ring: ring to use
459 * Returns a pointer to xdp_umem structure if there is a UMEM present,
462 static inline struct xdp_umem *ice_xsk_umem(struct ice_ring *ring)
464 struct xdp_umem **umems = ring->vsi->xsk_umems;
465 int qid = ring->q_index;
/* For XDP rings the queue index is reduced by the VSI's XDP Tx queue count
 * before it is used to index the UMEM array.
 */
467 if (ice_ring_is_xdp(ring))
468 qid -= ring->vsi->num_xdp_txq;
/* True when the UMEM array is absent, the slot for qid is empty, or no XDP
 * program is attached to the VSI.
 * NOTE(review): qid is not range-checked before umems[qid] is read; confirm
 * that callers guarantee a valid index.
 */
470 if (!umems || !umems[qid] || !ice_is_xdp_ena_vsi(ring->vsi))
477 * ice_get_main_vsi - Get the PF VSI
480 * returns pf->vsi[0], which by definition is the PF VSI
482 static inline struct ice_vsi *ice_get_main_vsi(struct ice_pf *pf)
490 int ice_vsi_setup_tx_rings(struct ice_vsi *vsi);
491 int ice_vsi_setup_rx_rings(struct ice_vsi *vsi);
492 void ice_set_ethtool_ops(struct net_device *netdev);
493 void ice_set_ethtool_safe_mode_ops(struct net_device *netdev);
494 u16 ice_get_avail_txq_count(struct ice_pf *pf);
495 u16 ice_get_avail_rxq_count(struct ice_pf *pf);
496 int ice_vsi_recfg_qs(struct ice_vsi *vsi, int new_rx, int new_tx);
497 void ice_update_vsi_stats(struct ice_vsi *vsi);
498 void ice_update_pf_stats(struct ice_pf *pf);
499 int ice_up(struct ice_vsi *vsi);
500 int ice_down(struct ice_vsi *vsi);
501 int ice_vsi_cfg(struct ice_vsi *vsi);
502 struct ice_vsi *ice_lb_vsi_setup(struct ice_pf *pf, struct ice_port_info *pi);
503 int ice_prepare_xdp_rings(struct ice_vsi *vsi, struct bpf_prog *prog);
504 int ice_destroy_xdp_rings(struct ice_vsi *vsi);
506 ice_xdp_xmit(struct net_device *dev, int n, struct xdp_frame **frames,
508 int ice_set_rss(struct ice_vsi *vsi, u8 *seed, u8 *lut, u16 lut_size);
509 int ice_get_rss(struct ice_vsi *vsi, u8 *seed, u8 *lut, u16 lut_size);
510 void ice_fill_rss_lut(u8 *lut, u16 rss_table_size, u16 rss_size);
511 int ice_schedule_reset(struct ice_pf *pf, enum ice_reset_req reset);
512 void ice_print_link_msg(struct ice_vsi *vsi, bool isup);
513 int ice_open(struct net_device *netdev);
514 int ice_stop(struct net_device *netdev);