1 /* SPDX-License-Identifier: (GPL-2.0+ OR BSD-3-Clause) */ 2 /* Copyright 2014-2016 Freescale Semiconductor Inc. 3 * Copyright 2016-2020 NXP 4 */ 5 6 #ifndef __DPAA2_ETH_H 7 #define __DPAA2_ETH_H 8 9 #include <linux/netdevice.h> 10 #include <linux/if_vlan.h> 11 #include <linux/fsl/mc.h> 12 13 #include <soc/fsl/dpaa2-io.h> 14 #include <soc/fsl/dpaa2-fd.h> 15 #include "dpni.h" 16 #include "dpni-cmd.h" 17 18 #include "dpaa2-eth-trace.h" 19 #include "dpaa2-eth-debugfs.h" 20 #include "dpaa2-mac.h" 21 22 #define DPAA2_WRIOP_VERSION(x, y, z) ((x) << 10 | (y) << 5 | (z) << 0) 23 24 #define DPAA2_ETH_STORE_SIZE 16 25 26 /* Maximum number of scatter-gather entries in an ingress frame, 27 * considering the maximum receive frame size is 64K 28 */ 29 #define DPAA2_ETH_MAX_SG_ENTRIES ((64 * 1024) / DPAA2_ETH_RX_BUF_SIZE) 30 31 /* Maximum acceptable MTU value. It is in direct relation with the hardware 32 * enforced Max Frame Length (currently 10k). 33 */ 34 #define DPAA2_ETH_MFL (10 * 1024) 35 #define DPAA2_ETH_MAX_MTU (DPAA2_ETH_MFL - VLAN_ETH_HLEN) 36 /* Convert L3 MTU to L2 MFL */ 37 #define DPAA2_ETH_L2_MAX_FRM(mtu) ((mtu) + VLAN_ETH_HLEN) 38 39 /* Set the taildrop threshold (in bytes) to allow the enqueue of several jumbo 40 * frames in the Rx queues (length of the current frame is not 41 * taken into account when making the taildrop decision) 42 */ 43 #define DPAA2_ETH_TAILDROP_THRESH (64 * 1024) 44 45 /* Maximum number of Tx confirmation frames to be processed 46 * in a single NAPI call 47 */ 48 #define DPAA2_ETH_TXCONF_PER_NAPI 256 49 50 /* Buffer quota per queue. Must be large enough such that for minimum sized 51 * frames taildrop kicks in before the bpool gets depleted, so we compute 52 * how many 64B frames fit inside the taildrop threshold and add a margin 53 * to accommodate the buffer refill delay. 54 */ 55 #define DPAA2_ETH_MAX_FRAMES_PER_QUEUE (DPAA2_ETH_TAILDROP_THRESH / 64) 56 #define DPAA2_ETH_NUM_BUFS (DPAA2_ETH_MAX_FRAMES_PER_QUEUE + 256) 57 #define DPAA2_ETH_REFILL_THRESH \ 58 (DPAA2_ETH_NUM_BUFS - DPAA2_ETH_BUFS_PER_CMD) 59 60 /* Maximum number of buffers that can be acquired/released through a single 61 * QBMan command 62 */ 63 #define DPAA2_ETH_BUFS_PER_CMD 7 64 65 /* Hardware requires alignment for ingress/egress buffer addresses */ 66 #define DPAA2_ETH_TX_BUF_ALIGN 64 67 68 #define DPAA2_ETH_RX_BUF_RAW_SIZE PAGE_SIZE 69 #define DPAA2_ETH_RX_BUF_TAILROOM \ 70 SKB_DATA_ALIGN(sizeof(struct skb_shared_info)) 71 #define DPAA2_ETH_RX_BUF_SIZE \ 72 (DPAA2_ETH_RX_BUF_RAW_SIZE - DPAA2_ETH_RX_BUF_TAILROOM) 73 74 /* Hardware annotation area in RX/TX buffers */ 75 #define DPAA2_ETH_RX_HWA_SIZE 64 76 #define DPAA2_ETH_TX_HWA_SIZE 128 77 78 /* PTP nominal frequency 1GHz */ 79 #define DPAA2_PTP_CLK_PERIOD_NS 1 80 81 /* Due to a limitation in WRIOP 1.0.0, the RX buffer data must be aligned 82 * to 256B. For newer revisions, the requirement is only for 64B alignment 83 */ 84 #define DPAA2_ETH_RX_BUF_ALIGN_REV1 256 85 #define DPAA2_ETH_RX_BUF_ALIGN 64 86 87 /* We are accommodating a skb backpointer and some S/G info 88 * in the frame's software annotation. The hardware 89 * options are either 0 or 64, so we choose the latter. 90 */ 91 #define DPAA2_ETH_SWA_SIZE 64 92 93 /* We store different information in the software annotation area of a Tx frame 94 * based on what type of frame it is 95 */ 96 enum dpaa2_eth_swa_type { 97 DPAA2_ETH_SWA_SINGLE, 98 DPAA2_ETH_SWA_SG, 99 DPAA2_ETH_SWA_XDP, 100 }; 101 102 /* Must keep this struct smaller than DPAA2_ETH_SWA_SIZE */ 103 struct dpaa2_eth_swa { 104 enum dpaa2_eth_swa_type type; 105 union { 106 struct { 107 struct sk_buff *skb; 108 } single; 109 struct { 110 struct sk_buff *skb; 111 struct scatterlist *scl; 112 int num_sg; 113 int sgt_size; 114 } sg; 115 struct { 116 int dma_size; 117 struct xdp_frame *xdpf; 118 } xdp; 119 }; 120 }; 121 122 /* Annotation valid bits in FD FRC */ 123 #define DPAA2_FD_FRC_FASV 0x8000 124 #define DPAA2_FD_FRC_FAEADV 0x4000 125 #define DPAA2_FD_FRC_FAPRV 0x2000 126 #define DPAA2_FD_FRC_FAIADV 0x1000 127 #define DPAA2_FD_FRC_FASWOV 0x0800 128 #define DPAA2_FD_FRC_FAICFDV 0x0400 129 130 /* Error bits in FD CTRL */ 131 #define DPAA2_FD_RX_ERR_MASK (FD_CTRL_SBE | FD_CTRL_FAERR) 132 #define DPAA2_FD_TX_ERR_MASK (FD_CTRL_UFD | \ 133 FD_CTRL_SBE | \ 134 FD_CTRL_FSE | \ 135 FD_CTRL_FAERR) 136 137 /* Annotation bits in FD CTRL */ 138 #define DPAA2_FD_CTRL_ASAL 0x00020000 /* ASAL = 128B */ 139 140 /* Frame annotation status */ 141 struct dpaa2_fas { 142 u8 reserved; 143 u8 ppid; 144 __le16 ifpid; 145 __le32 status; 146 }; 147 148 /* Frame annotation status word is located in the first 8 bytes 149 * of the buffer's hardware annoatation area 150 */ 151 #define DPAA2_FAS_OFFSET 0 152 #define DPAA2_FAS_SIZE (sizeof(struct dpaa2_fas)) 153 154 /* Timestamp is located in the next 8 bytes of the buffer's 155 * hardware annotation area 156 */ 157 #define DPAA2_TS_OFFSET 0x8 158 159 /* Frame annotation egress action descriptor */ 160 #define DPAA2_FAEAD_OFFSET 0x58 161 162 struct dpaa2_faead { 163 __le32 conf_fqid; 164 __le32 ctrl; 165 }; 166 167 #define DPAA2_FAEAD_A2V 0x20000000 168 #define DPAA2_FAEAD_A4V 0x08000000 169 #define DPAA2_FAEAD_UPDV 0x00001000 170 #define DPAA2_FAEAD_EBDDV 0x00002000 171 #define DPAA2_FAEAD_UPD 0x00000010 172 173 /* Accessors for the hardware annotation fields that we use */ 174 static inline void *dpaa2_get_hwa(void *buf_addr, bool swa) 175 { 176 return buf_addr + (swa ? DPAA2_ETH_SWA_SIZE : 0); 177 } 178 179 static inline struct dpaa2_fas *dpaa2_get_fas(void *buf_addr, bool swa) 180 { 181 return dpaa2_get_hwa(buf_addr, swa) + DPAA2_FAS_OFFSET; 182 } 183 184 static inline __le64 *dpaa2_get_ts(void *buf_addr, bool swa) 185 { 186 return dpaa2_get_hwa(buf_addr, swa) + DPAA2_TS_OFFSET; 187 } 188 189 static inline struct dpaa2_faead *dpaa2_get_faead(void *buf_addr, bool swa) 190 { 191 return dpaa2_get_hwa(buf_addr, swa) + DPAA2_FAEAD_OFFSET; 192 } 193 194 /* Error and status bits in the frame annotation status word */ 195 /* Debug frame, otherwise supposed to be discarded */ 196 #define DPAA2_FAS_DISC 0x80000000 197 /* MACSEC frame */ 198 #define DPAA2_FAS_MS 0x40000000 199 #define DPAA2_FAS_PTP 0x08000000 200 /* Ethernet multicast frame */ 201 #define DPAA2_FAS_MC 0x04000000 202 /* Ethernet broadcast frame */ 203 #define DPAA2_FAS_BC 0x02000000 204 #define DPAA2_FAS_KSE 0x00040000 205 #define DPAA2_FAS_EOFHE 0x00020000 206 #define DPAA2_FAS_MNLE 0x00010000 207 #define DPAA2_FAS_TIDE 0x00008000 208 #define DPAA2_FAS_PIEE 0x00004000 209 /* Frame length error */ 210 #define DPAA2_FAS_FLE 0x00002000 211 /* Frame physical error */ 212 #define DPAA2_FAS_FPE 0x00001000 213 #define DPAA2_FAS_PTE 0x00000080 214 #define DPAA2_FAS_ISP 0x00000040 215 #define DPAA2_FAS_PHE 0x00000020 216 #define DPAA2_FAS_BLE 0x00000010 217 /* L3 csum validation performed */ 218 #define DPAA2_FAS_L3CV 0x00000008 219 /* L3 csum error */ 220 #define DPAA2_FAS_L3CE 0x00000004 221 /* L4 csum validation performed */ 222 #define DPAA2_FAS_L4CV 0x00000002 223 /* L4 csum error */ 224 #define DPAA2_FAS_L4CE 0x00000001 225 /* Possible errors on the ingress path */ 226 #define DPAA2_FAS_RX_ERR_MASK (DPAA2_FAS_KSE | \ 227 DPAA2_FAS_EOFHE | \ 228 DPAA2_FAS_MNLE | \ 229 DPAA2_FAS_TIDE | \ 230 DPAA2_FAS_PIEE | \ 231 DPAA2_FAS_FLE | \ 232 DPAA2_FAS_FPE | \ 233 DPAA2_FAS_PTE | \ 234 DPAA2_FAS_ISP | \ 235 DPAA2_FAS_PHE | \ 236 DPAA2_FAS_BLE | \ 237 DPAA2_FAS_L3CE | \ 238 DPAA2_FAS_L4CE) 239 240 /* Time in milliseconds between link state updates */ 241 #define DPAA2_ETH_LINK_STATE_REFRESH 1000 242 243 /* Number of times to retry a frame enqueue before giving up. 244 * Value determined empirically, in order to minimize the number 245 * of frames dropped on Tx 246 */ 247 #define DPAA2_ETH_ENQUEUE_RETRIES 10 248 249 /* Number of times to retry DPIO portal operations while waiting 250 * for portal to finish executing current command and become 251 * available. We want to avoid being stuck in a while loop in case 252 * hardware becomes unresponsive, but not give up too easily if 253 * the portal really is busy for valid reasons 254 */ 255 #define DPAA2_ETH_SWP_BUSY_RETRIES 1000 256 257 /* Driver statistics, other than those in struct rtnl_link_stats64. 258 * These are usually collected per-CPU and aggregated by ethtool. 259 */ 260 struct dpaa2_eth_drv_stats { 261 __u64 tx_conf_frames; 262 __u64 tx_conf_bytes; 263 __u64 tx_sg_frames; 264 __u64 tx_sg_bytes; 265 __u64 tx_reallocs; 266 __u64 rx_sg_frames; 267 __u64 rx_sg_bytes; 268 /* Enqueues retried due to portal busy */ 269 __u64 tx_portal_busy; 270 }; 271 272 /* Per-FQ statistics */ 273 struct dpaa2_eth_fq_stats { 274 /* Number of frames received on this queue */ 275 __u64 frames; 276 }; 277 278 /* Per-channel statistics */ 279 struct dpaa2_eth_ch_stats { 280 /* Volatile dequeues retried due to portal busy */ 281 __u64 dequeue_portal_busy; 282 /* Pull errors */ 283 __u64 pull_err; 284 /* Number of CDANs; useful to estimate avg NAPI len */ 285 __u64 cdan; 286 /* XDP counters */ 287 __u64 xdp_drop; 288 __u64 xdp_tx; 289 __u64 xdp_tx_err; 290 __u64 xdp_redirect; 291 /* Must be last, does not show up in ethtool stats */ 292 __u64 frames; 293 }; 294 295 /* Maximum number of queues associated with a DPNI */ 296 #define DPAA2_ETH_MAX_TCS 8 297 #define DPAA2_ETH_MAX_RX_QUEUES 16 298 #define DPAA2_ETH_MAX_TX_QUEUES 16 299 #define DPAA2_ETH_MAX_QUEUES (DPAA2_ETH_MAX_RX_QUEUES + \ 300 DPAA2_ETH_MAX_TX_QUEUES) 301 #define DPAA2_ETH_MAX_NETDEV_QUEUES \ 302 (DPAA2_ETH_MAX_TX_QUEUES * DPAA2_ETH_MAX_TCS) 303 304 #define DPAA2_ETH_MAX_DPCONS 16 305 306 enum dpaa2_eth_fq_type { 307 DPAA2_RX_FQ = 0, 308 DPAA2_TX_CONF_FQ, 309 }; 310 311 struct dpaa2_eth_priv; 312 313 struct dpaa2_eth_xdp_fds { 314 struct dpaa2_fd fds[DEV_MAP_BULK_SIZE]; 315 ssize_t num; 316 }; 317 318 struct dpaa2_eth_fq { 319 u32 fqid; 320 u32 tx_qdbin; 321 u32 tx_fqid[DPAA2_ETH_MAX_TCS]; 322 u16 flowid; 323 u8 tc; 324 int target_cpu; 325 u32 dq_frames; 326 u32 dq_bytes; 327 struct dpaa2_eth_channel *channel; 328 enum dpaa2_eth_fq_type type; 329 330 void (*consume)(struct dpaa2_eth_priv *priv, 331 struct dpaa2_eth_channel *ch, 332 const struct dpaa2_fd *fd, 333 struct dpaa2_eth_fq *fq); 334 struct dpaa2_eth_fq_stats stats; 335 336 struct dpaa2_eth_xdp_fds xdp_redirect_fds; 337 }; 338 339 struct dpaa2_eth_ch_xdp { 340 struct bpf_prog *prog; 341 u64 drop_bufs[DPAA2_ETH_BUFS_PER_CMD]; 342 int drop_cnt; 343 unsigned int res; 344 }; 345 346 struct dpaa2_eth_channel { 347 struct dpaa2_io_notification_ctx nctx; 348 struct fsl_mc_device *dpcon; 349 int dpcon_id; 350 int ch_id; 351 struct napi_struct napi; 352 struct dpaa2_io *dpio; 353 struct dpaa2_io_store *store; 354 struct dpaa2_eth_priv *priv; 355 int buf_count; 356 struct dpaa2_eth_ch_stats stats; 357 struct dpaa2_eth_ch_xdp xdp; 358 struct xdp_rxq_info xdp_rxq; 359 struct list_head *rx_list; 360 }; 361 362 struct dpaa2_eth_dist_fields { 363 u64 rxnfc_field; 364 enum net_prot cls_prot; 365 int cls_field; 366 int size; 367 u64 id; 368 }; 369 370 struct dpaa2_eth_cls_rule { 371 struct ethtool_rx_flow_spec fs; 372 u8 in_use; 373 }; 374 375 /* Driver private data */ 376 struct dpaa2_eth_priv { 377 struct net_device *net_dev; 378 379 u8 num_fqs; 380 struct dpaa2_eth_fq fq[DPAA2_ETH_MAX_QUEUES]; 381 int (*enqueue)(struct dpaa2_eth_priv *priv, 382 struct dpaa2_eth_fq *fq, 383 struct dpaa2_fd *fd, u8 prio, 384 u32 num_frames, 385 int *frames_enqueued); 386 387 u8 num_channels; 388 struct dpaa2_eth_channel *channel[DPAA2_ETH_MAX_DPCONS]; 389 390 struct dpni_attr dpni_attrs; 391 u16 dpni_ver_major; 392 u16 dpni_ver_minor; 393 u16 tx_data_offset; 394 395 struct fsl_mc_device *dpbp_dev; 396 u16 rx_buf_size; 397 u16 bpid; 398 struct iommu_domain *iommu_domain; 399 400 bool tx_tstamp; /* Tx timestamping enabled */ 401 bool rx_tstamp; /* Rx timestamping enabled */ 402 403 u16 tx_qdid; 404 struct fsl_mc_io *mc_io; 405 /* Cores which have an affine DPIO/DPCON. 406 * This is the cpu set on which Rx and Tx conf frames are processed 407 */ 408 struct cpumask dpio_cpumask; 409 410 /* Standard statistics */ 411 struct rtnl_link_stats64 __percpu *percpu_stats; 412 /* Extra stats, in addition to the ones known by the kernel */ 413 struct dpaa2_eth_drv_stats __percpu *percpu_extras; 414 415 u16 mc_token; 416 u8 rx_td_enabled; 417 418 struct dpni_link_state link_state; 419 bool do_link_poll; 420 struct task_struct *poll_thread; 421 422 /* enabled ethtool hashing bits */ 423 u64 rx_hash_fields; 424 u64 rx_cls_fields; 425 struct dpaa2_eth_cls_rule *cls_rules; 426 u8 rx_cls_enabled; 427 struct bpf_prog *xdp_prog; 428 #ifdef CONFIG_DEBUG_FS 429 struct dpaa2_debugfs dbg; 430 #endif 431 432 struct dpaa2_mac *mac; 433 }; 434 435 #define DPAA2_RXH_SUPPORTED (RXH_L2DA | RXH_VLAN | RXH_L3_PROTO \ 436 | RXH_IP_SRC | RXH_IP_DST | RXH_L4_B_0_1 \ 437 | RXH_L4_B_2_3) 438 439 /* default Rx hash options, set during probing */ 440 #define DPAA2_RXH_DEFAULT (RXH_L3_PROTO | RXH_IP_SRC | RXH_IP_DST | \ 441 RXH_L4_B_0_1 | RXH_L4_B_2_3) 442 443 #define dpaa2_eth_hash_enabled(priv) \ 444 ((priv)->dpni_attrs.num_queues > 1) 445 446 /* Required by struct dpni_rx_tc_dist_cfg::key_cfg_iova */ 447 #define DPAA2_CLASSIFIER_DMA_SIZE 256 448 449 extern const struct ethtool_ops dpaa2_ethtool_ops; 450 extern int dpaa2_phc_index; 451 452 static inline int dpaa2_eth_cmp_dpni_ver(struct dpaa2_eth_priv *priv, 453 u16 ver_major, u16 ver_minor) 454 { 455 if (priv->dpni_ver_major == ver_major) 456 return priv->dpni_ver_minor - ver_minor; 457 return priv->dpni_ver_major - ver_major; 458 } 459 460 /* Minimum firmware version that supports a more flexible API 461 * for configuring the Rx flow hash key 462 */ 463 #define DPNI_RX_DIST_KEY_VER_MAJOR 7 464 #define DPNI_RX_DIST_KEY_VER_MINOR 5 465 466 #define dpaa2_eth_has_legacy_dist(priv) \ 467 (dpaa2_eth_cmp_dpni_ver((priv), DPNI_RX_DIST_KEY_VER_MAJOR, \ 468 DPNI_RX_DIST_KEY_VER_MINOR) < 0) 469 470 #define dpaa2_eth_fs_enabled(priv) \ 471 (!((priv)->dpni_attrs.options & DPNI_OPT_NO_FS)) 472 473 #define dpaa2_eth_fs_mask_enabled(priv) \ 474 ((priv)->dpni_attrs.options & DPNI_OPT_HAS_KEY_MASKING) 475 476 #define dpaa2_eth_fs_count(priv) \ 477 ((priv)->dpni_attrs.fs_entries) 478 479 #define dpaa2_eth_tc_count(priv) \ 480 ((priv)->dpni_attrs.num_tcs) 481 482 /* We have exactly one {Rx, Tx conf} queue per channel */ 483 #define dpaa2_eth_queue_count(priv) \ 484 ((priv)->num_channels) 485 486 enum dpaa2_eth_rx_dist { 487 DPAA2_ETH_RX_DIST_HASH, 488 DPAA2_ETH_RX_DIST_CLS 489 }; 490 491 /* Unique IDs for the supported Rx classification header fields */ 492 #define DPAA2_ETH_DIST_ETHDST BIT(0) 493 #define DPAA2_ETH_DIST_ETHSRC BIT(1) 494 #define DPAA2_ETH_DIST_ETHTYPE BIT(2) 495 #define DPAA2_ETH_DIST_VLAN BIT(3) 496 #define DPAA2_ETH_DIST_IPSRC BIT(4) 497 #define DPAA2_ETH_DIST_IPDST BIT(5) 498 #define DPAA2_ETH_DIST_IPPROTO BIT(6) 499 #define DPAA2_ETH_DIST_L4SRC BIT(7) 500 #define DPAA2_ETH_DIST_L4DST BIT(8) 501 #define DPAA2_ETH_DIST_ALL (~0ULL) 502 503 #define DPNI_PAUSE_VER_MAJOR 7 504 #define DPNI_PAUSE_VER_MINOR 13 505 #define dpaa2_eth_has_pause_support(priv) \ 506 (dpaa2_eth_cmp_dpni_ver((priv), DPNI_PAUSE_VER_MAJOR, \ 507 DPNI_PAUSE_VER_MINOR) >= 0) 508 509 static inline 510 unsigned int dpaa2_eth_needed_headroom(struct dpaa2_eth_priv *priv, 511 struct sk_buff *skb) 512 { 513 unsigned int headroom = DPAA2_ETH_SWA_SIZE; 514 515 /* If we don't have an skb (e.g. XDP buffer), we only need space for 516 * the software annotation area 517 */ 518 if (!skb) 519 return headroom; 520 521 /* For non-linear skbs we have no headroom requirement, as we build a 522 * SG frame with a newly allocated SGT buffer 523 */ 524 if (skb_is_nonlinear(skb)) 525 return 0; 526 527 /* If we have Tx timestamping, need 128B hardware annotation */ 528 if (priv->tx_tstamp && skb_shinfo(skb)->tx_flags & SKBTX_HW_TSTAMP) 529 headroom += DPAA2_ETH_TX_HWA_SIZE; 530 531 return headroom; 532 } 533 534 /* Extra headroom space requested to hardware, in order to make sure there's 535 * no realloc'ing in forwarding scenarios 536 */ 537 static inline unsigned int dpaa2_eth_rx_head_room(struct dpaa2_eth_priv *priv) 538 { 539 return priv->tx_data_offset - DPAA2_ETH_RX_HWA_SIZE; 540 } 541 542 int dpaa2_eth_set_hash(struct net_device *net_dev, u64 flags); 543 int dpaa2_eth_set_cls(struct net_device *net_dev, u64 key); 544 int dpaa2_eth_cls_key_size(u64 key); 545 int dpaa2_eth_cls_fld_off(int prot, int field); 546 void dpaa2_eth_cls_trim_rule(void *key_mem, u64 fields); 547 548 #endif /* __DPAA2_H */ 549