1 /* SPDX-License-Identifier: (GPL-2.0+ OR BSD-3-Clause) */
2 /* Copyright 2014-2016 Freescale Semiconductor Inc.
3 * Copyright 2016-2020 NXP
9 #include <linux/dcbnl.h>
10 #include <linux/netdevice.h>
11 #include <linux/if_vlan.h>
12 #include <linux/fsl/mc.h>
14 #include <soc/fsl/dpaa2-io.h>
15 #include <soc/fsl/dpaa2-fd.h>
19 #include "dpaa2-eth-trace.h"
20 #include "dpaa2-eth-debugfs.h"
21 #include "dpaa2-mac.h"
23 #define DPAA2_WRIOP_VERSION(x, y, z) ((x) << 10 | (y) << 5 | (z) << 0)
25 #define DPAA2_ETH_STORE_SIZE 16
27 /* Maximum number of scatter-gather entries in an ingress frame,
28 * considering the maximum receive frame size is 64K
30 #define DPAA2_ETH_MAX_SG_ENTRIES ((64 * 1024) / DPAA2_ETH_RX_BUF_SIZE)
32 /* Maximum acceptable MTU value. It is in direct relation with the hardware
33 * enforced Max Frame Length (currently 10k).
35 #define DPAA2_ETH_MFL (10 * 1024)
36 #define DPAA2_ETH_MAX_MTU (DPAA2_ETH_MFL - VLAN_ETH_HLEN)
37 /* Convert L3 MTU to L2 MFL */
38 #define DPAA2_ETH_L2_MAX_FRM(mtu) ((mtu) + VLAN_ETH_HLEN)
40 /* Set the taildrop threshold (in bytes) to allow the enqueue of a large
41 * enough number of jumbo frames in the Rx queues (length of the current
42 * frame is not taken into account when making the taildrop decision)
44 #define DPAA2_ETH_FQ_TAILDROP_THRESH (1024 * 1024)
46 /* Maximum number of Tx confirmation frames to be processed
47 * in a single NAPI call
49 #define DPAA2_ETH_TXCONF_PER_NAPI 256
51 /* Buffer qouta per channel. We want to keep in check number of ingress frames
52 * in flight: for small sized frames, congestion group taildrop may kick in
53 * first; for large sizes, Rx FQ taildrop threshold will ensure only a
54 * reasonable number of frames will be pending at any given time.
55 * Ingress frame drop due to buffer pool depletion should be a corner case only
57 #define DPAA2_ETH_NUM_BUFS 1280
58 #define DPAA2_ETH_REFILL_THRESH \
59 (DPAA2_ETH_NUM_BUFS - DPAA2_ETH_BUFS_PER_CMD)
61 /* Congestion group taildrop threshold: number of frames allowed to accumulate
62 * at any moment in a group of Rx queues belonging to the same traffic class.
63 * Choose value such that we don't risk depleting the buffer pool before the
66 #define DPAA2_ETH_CG_TAILDROP_THRESH(priv) \
67 (1024 * dpaa2_eth_queue_count(priv) / dpaa2_eth_tc_count(priv))
69 /* Congestion group notification threshold: when this many frames accumulate
70 * on the Rx queues belonging to the same TC, the MAC is instructed to send
71 * PFC frames for that TC.
72 * When number of pending frames drops below exit threshold transmission of
73 * PFC frames is stopped.
75 #define DPAA2_ETH_CN_THRESH_ENTRY(priv) \
76 (DPAA2_ETH_CG_TAILDROP_THRESH(priv) / 2)
77 #define DPAA2_ETH_CN_THRESH_EXIT(priv) \
78 (DPAA2_ETH_CN_THRESH_ENTRY(priv) * 3 / 4)
80 /* Maximum number of buffers that can be acquired/released through a single
83 #define DPAA2_ETH_BUFS_PER_CMD 7
85 /* Hardware requires alignment for ingress/egress buffer addresses */
86 #define DPAA2_ETH_TX_BUF_ALIGN 64
88 #define DPAA2_ETH_RX_BUF_RAW_SIZE PAGE_SIZE
89 #define DPAA2_ETH_RX_BUF_TAILROOM \
90 SKB_DATA_ALIGN(sizeof(struct skb_shared_info))
91 #define DPAA2_ETH_RX_BUF_SIZE \
92 (DPAA2_ETH_RX_BUF_RAW_SIZE - DPAA2_ETH_RX_BUF_TAILROOM)
94 /* Hardware annotation area in RX/TX buffers */
95 #define DPAA2_ETH_RX_HWA_SIZE 64
96 #define DPAA2_ETH_TX_HWA_SIZE 128
98 /* PTP nominal frequency 1GHz */
99 #define DPAA2_PTP_CLK_PERIOD_NS 1
101 /* Due to a limitation in WRIOP 1.0.0, the RX buffer data must be aligned
102 * to 256B. For newer revisions, the requirement is only for 64B alignment
104 #define DPAA2_ETH_RX_BUF_ALIGN_REV1 256
105 #define DPAA2_ETH_RX_BUF_ALIGN 64
107 /* We are accommodating a skb backpointer and some S/G info
108 * in the frame's software annotation. The hardware
109 * options are either 0 or 64, so we choose the latter.
111 #define DPAA2_ETH_SWA_SIZE 64
113 /* We store different information in the software annotation area of a Tx frame
114 * based on what type of frame it is
116 enum dpaa2_eth_swa_type {
117 DPAA2_ETH_SWA_SINGLE,
122 /* Must keep this struct smaller than DPAA2_ETH_SWA_SIZE */
123 struct dpaa2_eth_swa {
124 enum dpaa2_eth_swa_type type;
131 struct scatterlist *scl;
137 struct xdp_frame *xdpf;
142 /* Annotation valid bits in FD FRC */
143 #define DPAA2_FD_FRC_FASV 0x8000
144 #define DPAA2_FD_FRC_FAEADV 0x4000
145 #define DPAA2_FD_FRC_FAPRV 0x2000
146 #define DPAA2_FD_FRC_FAIADV 0x1000
147 #define DPAA2_FD_FRC_FASWOV 0x0800
148 #define DPAA2_FD_FRC_FAICFDV 0x0400
150 /* Error bits in FD CTRL */
151 #define DPAA2_FD_RX_ERR_MASK (FD_CTRL_SBE | FD_CTRL_FAERR)
152 #define DPAA2_FD_TX_ERR_MASK (FD_CTRL_UFD | \
157 /* Annotation bits in FD CTRL */
158 #define DPAA2_FD_CTRL_ASAL 0x00020000 /* ASAL = 128B */
160 /* Frame annotation status */
168 /* Frame annotation status word is located in the first 8 bytes
169 * of the buffer's hardware annoatation area
171 #define DPAA2_FAS_OFFSET 0
172 #define DPAA2_FAS_SIZE (sizeof(struct dpaa2_fas))
174 /* Timestamp is located in the next 8 bytes of the buffer's
175 * hardware annotation area
177 #define DPAA2_TS_OFFSET 0x8
179 /* Frame annotation egress action descriptor */
180 #define DPAA2_FAEAD_OFFSET 0x58
187 #define DPAA2_FAEAD_A2V 0x20000000
188 #define DPAA2_FAEAD_A4V 0x08000000
189 #define DPAA2_FAEAD_UPDV 0x00001000
190 #define DPAA2_FAEAD_EBDDV 0x00002000
191 #define DPAA2_FAEAD_UPD 0x00000010
193 /* Accessors for the hardware annotation fields that we use */
194 static inline void *dpaa2_get_hwa(void *buf_addr, bool swa)
196 return buf_addr + (swa ? DPAA2_ETH_SWA_SIZE : 0);
199 static inline struct dpaa2_fas *dpaa2_get_fas(void *buf_addr, bool swa)
201 return dpaa2_get_hwa(buf_addr, swa) + DPAA2_FAS_OFFSET;
204 static inline __le64 *dpaa2_get_ts(void *buf_addr, bool swa)
206 return dpaa2_get_hwa(buf_addr, swa) + DPAA2_TS_OFFSET;
209 static inline struct dpaa2_faead *dpaa2_get_faead(void *buf_addr, bool swa)
211 return dpaa2_get_hwa(buf_addr, swa) + DPAA2_FAEAD_OFFSET;
214 /* Error and status bits in the frame annotation status word */
215 /* Debug frame, otherwise supposed to be discarded */
216 #define DPAA2_FAS_DISC 0x80000000
218 #define DPAA2_FAS_MS 0x40000000
219 #define DPAA2_FAS_PTP 0x08000000
220 /* Ethernet multicast frame */
221 #define DPAA2_FAS_MC 0x04000000
222 /* Ethernet broadcast frame */
223 #define DPAA2_FAS_BC 0x02000000
224 #define DPAA2_FAS_KSE 0x00040000
225 #define DPAA2_FAS_EOFHE 0x00020000
226 #define DPAA2_FAS_MNLE 0x00010000
227 #define DPAA2_FAS_TIDE 0x00008000
228 #define DPAA2_FAS_PIEE 0x00004000
229 /* Frame length error */
230 #define DPAA2_FAS_FLE 0x00002000
231 /* Frame physical error */
232 #define DPAA2_FAS_FPE 0x00001000
233 #define DPAA2_FAS_PTE 0x00000080
234 #define DPAA2_FAS_ISP 0x00000040
235 #define DPAA2_FAS_PHE 0x00000020
236 #define DPAA2_FAS_BLE 0x00000010
237 /* L3 csum validation performed */
238 #define DPAA2_FAS_L3CV 0x00000008
240 #define DPAA2_FAS_L3CE 0x00000004
241 /* L4 csum validation performed */
242 #define DPAA2_FAS_L4CV 0x00000002
244 #define DPAA2_FAS_L4CE 0x00000001
245 /* Possible errors on the ingress path */
246 #define DPAA2_FAS_RX_ERR_MASK (DPAA2_FAS_KSE | \
260 /* Time in milliseconds between link state updates */
261 #define DPAA2_ETH_LINK_STATE_REFRESH 1000
263 /* Number of times to retry a frame enqueue before giving up.
264 * Value determined empirically, in order to minimize the number
265 * of frames dropped on Tx
267 #define DPAA2_ETH_ENQUEUE_RETRIES 10
269 /* Number of times to retry DPIO portal operations while waiting
270 * for portal to finish executing current command and become
271 * available. We want to avoid being stuck in a while loop in case
272 * hardware becomes unresponsive, but not give up too easily if
273 * the portal really is busy for valid reasons
275 #define DPAA2_ETH_SWP_BUSY_RETRIES 1000
277 /* Driver statistics, other than those in struct rtnl_link_stats64.
278 * These are usually collected per-CPU and aggregated by ethtool.
280 struct dpaa2_eth_drv_stats {
281 __u64 tx_conf_frames;
288 /* Enqueues retried due to portal busy */
289 __u64 tx_portal_busy;
292 /* Per-FQ statistics */
293 struct dpaa2_eth_fq_stats {
294 /* Number of frames received on this queue */
298 /* Per-channel statistics */
299 struct dpaa2_eth_ch_stats {
300 /* Volatile dequeues retried due to portal busy */
301 __u64 dequeue_portal_busy;
304 /* Number of CDANs; useful to estimate avg NAPI len */
311 /* Must be last, does not show up in ethtool stats */
315 /* Maximum number of queues associated with a DPNI */
316 #define DPAA2_ETH_MAX_TCS 8
317 #define DPAA2_ETH_MAX_RX_QUEUES_PER_TC 16
318 #define DPAA2_ETH_MAX_RX_QUEUES \
319 (DPAA2_ETH_MAX_RX_QUEUES_PER_TC * DPAA2_ETH_MAX_TCS)
320 #define DPAA2_ETH_MAX_TX_QUEUES 16
321 #define DPAA2_ETH_MAX_QUEUES (DPAA2_ETH_MAX_RX_QUEUES + \
322 DPAA2_ETH_MAX_TX_QUEUES)
323 #define DPAA2_ETH_MAX_NETDEV_QUEUES \
324 (DPAA2_ETH_MAX_TX_QUEUES * DPAA2_ETH_MAX_TCS)
326 #define DPAA2_ETH_MAX_DPCONS 16
328 enum dpaa2_eth_fq_type {
333 struct dpaa2_eth_priv;
335 struct dpaa2_eth_xdp_fds {
336 struct dpaa2_fd fds[DEV_MAP_BULK_SIZE];
340 struct dpaa2_eth_fq {
343 u32 tx_fqid[DPAA2_ETH_MAX_TCS];
349 struct dpaa2_eth_channel *channel;
350 enum dpaa2_eth_fq_type type;
352 void (*consume)(struct dpaa2_eth_priv *priv,
353 struct dpaa2_eth_channel *ch,
354 const struct dpaa2_fd *fd,
355 struct dpaa2_eth_fq *fq);
356 struct dpaa2_eth_fq_stats stats;
358 struct dpaa2_eth_xdp_fds xdp_redirect_fds;
359 struct dpaa2_eth_xdp_fds xdp_tx_fds;
362 struct dpaa2_eth_ch_xdp {
363 struct bpf_prog *prog;
364 u64 drop_bufs[DPAA2_ETH_BUFS_PER_CMD];
369 struct dpaa2_eth_channel {
370 struct dpaa2_io_notification_ctx nctx;
371 struct fsl_mc_device *dpcon;
374 struct napi_struct napi;
375 struct dpaa2_io *dpio;
376 struct dpaa2_io_store *store;
377 struct dpaa2_eth_priv *priv;
379 struct dpaa2_eth_ch_stats stats;
380 struct dpaa2_eth_ch_xdp xdp;
381 struct xdp_rxq_info xdp_rxq;
382 struct list_head *rx_list;
385 struct dpaa2_eth_dist_fields {
387 enum net_prot cls_prot;
393 struct dpaa2_eth_cls_rule {
394 struct ethtool_rx_flow_spec fs;
398 /* Driver private data */
399 struct dpaa2_eth_priv {
400 struct net_device *net_dev;
403 struct dpaa2_eth_fq fq[DPAA2_ETH_MAX_QUEUES];
404 int (*enqueue)(struct dpaa2_eth_priv *priv,
405 struct dpaa2_eth_fq *fq,
406 struct dpaa2_fd *fd, u8 prio,
408 int *frames_enqueued);
411 struct dpaa2_eth_channel *channel[DPAA2_ETH_MAX_DPCONS];
413 struct dpni_attr dpni_attrs;
418 struct fsl_mc_device *dpbp_dev;
421 struct iommu_domain *iommu_domain;
423 bool tx_tstamp; /* Tx timestamping enabled */
424 bool rx_tstamp; /* Rx timestamping enabled */
427 struct fsl_mc_io *mc_io;
428 /* Cores which have an affine DPIO/DPCON.
429 * This is the cpu set on which Rx and Tx conf frames are processed
431 struct cpumask dpio_cpumask;
433 /* Standard statistics */
434 struct rtnl_link_stats64 __percpu *percpu_stats;
435 /* Extra stats, in addition to the ones known by the kernel */
436 struct dpaa2_eth_drv_stats __percpu *percpu_extras;
441 struct dpni_link_state link_state;
443 struct task_struct *poll_thread;
445 /* enabled ethtool hashing bits */
448 struct dpaa2_eth_cls_rule *cls_rules;
451 #ifdef CONFIG_FSL_DPAA2_ETH_DCB
455 struct bpf_prog *xdp_prog;
456 #ifdef CONFIG_DEBUG_FS
457 struct dpaa2_debugfs dbg;
460 struct dpaa2_mac *mac;
463 #define DPAA2_RXH_SUPPORTED (RXH_L2DA | RXH_VLAN | RXH_L3_PROTO \
464 | RXH_IP_SRC | RXH_IP_DST | RXH_L4_B_0_1 \
467 /* default Rx hash options, set during probing */
468 #define DPAA2_RXH_DEFAULT (RXH_L3_PROTO | RXH_IP_SRC | RXH_IP_DST | \
469 RXH_L4_B_0_1 | RXH_L4_B_2_3)
471 #define dpaa2_eth_hash_enabled(priv) \
472 ((priv)->dpni_attrs.num_queues > 1)
474 /* Required by struct dpni_rx_tc_dist_cfg::key_cfg_iova */
475 #define DPAA2_CLASSIFIER_DMA_SIZE 256
477 extern const struct ethtool_ops dpaa2_ethtool_ops;
478 extern int dpaa2_phc_index;
480 static inline int dpaa2_eth_cmp_dpni_ver(struct dpaa2_eth_priv *priv,
481 u16 ver_major, u16 ver_minor)
483 if (priv->dpni_ver_major == ver_major)
484 return priv->dpni_ver_minor - ver_minor;
485 return priv->dpni_ver_major - ver_major;
488 /* Minimum firmware version that supports a more flexible API
489 * for configuring the Rx flow hash key
491 #define DPNI_RX_DIST_KEY_VER_MAJOR 7
492 #define DPNI_RX_DIST_KEY_VER_MINOR 5
494 #define dpaa2_eth_has_legacy_dist(priv) \
495 (dpaa2_eth_cmp_dpni_ver((priv), DPNI_RX_DIST_KEY_VER_MAJOR, \
496 DPNI_RX_DIST_KEY_VER_MINOR) < 0)
498 #define dpaa2_eth_fs_enabled(priv) \
499 (!((priv)->dpni_attrs.options & DPNI_OPT_NO_FS))
501 #define dpaa2_eth_fs_mask_enabled(priv) \
502 ((priv)->dpni_attrs.options & DPNI_OPT_HAS_KEY_MASKING)
504 #define dpaa2_eth_fs_count(priv) \
505 ((priv)->dpni_attrs.fs_entries)
507 #define dpaa2_eth_tc_count(priv) \
508 ((priv)->dpni_attrs.num_tcs)
510 /* We have exactly one {Rx, Tx conf} queue per channel */
511 #define dpaa2_eth_queue_count(priv) \
512 ((priv)->num_channels)
514 enum dpaa2_eth_rx_dist {
515 DPAA2_ETH_RX_DIST_HASH,
516 DPAA2_ETH_RX_DIST_CLS
519 /* Unique IDs for the supported Rx classification header fields */
520 #define DPAA2_ETH_DIST_ETHDST BIT(0)
521 #define DPAA2_ETH_DIST_ETHSRC BIT(1)
522 #define DPAA2_ETH_DIST_ETHTYPE BIT(2)
523 #define DPAA2_ETH_DIST_VLAN BIT(3)
524 #define DPAA2_ETH_DIST_IPSRC BIT(4)
525 #define DPAA2_ETH_DIST_IPDST BIT(5)
526 #define DPAA2_ETH_DIST_IPPROTO BIT(6)
527 #define DPAA2_ETH_DIST_L4SRC BIT(7)
528 #define DPAA2_ETH_DIST_L4DST BIT(8)
529 #define DPAA2_ETH_DIST_ALL (~0ULL)
531 #define DPNI_PAUSE_VER_MAJOR 7
532 #define DPNI_PAUSE_VER_MINOR 13
533 #define dpaa2_eth_has_pause_support(priv) \
534 (dpaa2_eth_cmp_dpni_ver((priv), DPNI_PAUSE_VER_MAJOR, \
535 DPNI_PAUSE_VER_MINOR) >= 0)
537 static inline bool dpaa2_eth_tx_pause_enabled(u64 link_options)
539 return !!(link_options & DPNI_LINK_OPT_PAUSE) ^
540 !!(link_options & DPNI_LINK_OPT_ASYM_PAUSE);
543 static inline bool dpaa2_eth_rx_pause_enabled(u64 link_options)
545 return !!(link_options & DPNI_LINK_OPT_PAUSE);
549 unsigned int dpaa2_eth_needed_headroom(struct dpaa2_eth_priv *priv,
552 unsigned int headroom = DPAA2_ETH_SWA_SIZE;
554 /* If we don't have an skb (e.g. XDP buffer), we only need space for
555 * the software annotation area
560 /* For non-linear skbs we have no headroom requirement, as we build a
561 * SG frame with a newly allocated SGT buffer
563 if (skb_is_nonlinear(skb))
566 /* If we have Tx timestamping, need 128B hardware annotation */
567 if (priv->tx_tstamp && skb_shinfo(skb)->tx_flags & SKBTX_HW_TSTAMP)
568 headroom += DPAA2_ETH_TX_HWA_SIZE;
573 /* Extra headroom space requested to hardware, in order to make sure there's
574 * no realloc'ing in forwarding scenarios
576 static inline unsigned int dpaa2_eth_rx_head_room(struct dpaa2_eth_priv *priv)
578 return priv->tx_data_offset - DPAA2_ETH_RX_HWA_SIZE;
581 int dpaa2_eth_set_hash(struct net_device *net_dev, u64 flags);
582 int dpaa2_eth_set_cls(struct net_device *net_dev, u64 key);
583 int dpaa2_eth_cls_key_size(u64 key);
584 int dpaa2_eth_cls_fld_off(int prot, int field);
585 void dpaa2_eth_cls_trim_rule(void *key_mem, u64 fields);
587 extern const struct dcbnl_rtnl_ops dpaa2_eth_dcbnl_ops;
589 #endif /* __DPAA2_H */