1 /* 2 * Copyright (C) 2017 Netronome Systems, Inc. 3 * 4 * This software is licensed under the GNU General License Version 2, 5 * June 1991 as shown in the file COPYING in the top-level directory of this 6 * source tree. 7 * 8 * THE COPYRIGHT HOLDERS AND/OR OTHER PARTIES PROVIDE THE PROGRAM "AS IS" 9 * WITHOUT WARRANTY OF ANY KIND, EITHER EXPRESSED OR IMPLIED, INCLUDING, 10 * BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS 11 * FOR A PARTICULAR PURPOSE. THE ENTIRE RISK AS TO THE QUALITY AND PERFORMANCE 12 * OF THE PROGRAM IS WITH YOU. SHOULD THE PROGRAM PROVE DEFECTIVE, YOU ASSUME 13 * THE COST OF ALL NECESSARY SERVICING, REPAIR OR CORRECTION. 14 */ 15 16 #include <linux/debugfs.h> 17 #include <linux/etherdevice.h> 18 #include <linux/ethtool_netlink.h> 19 #include <linux/kernel.h> 20 #include <linux/module.h> 21 #include <linux/netdevice.h> 22 #include <linux/slab.h> 23 #include <net/netdev_queues.h> 24 #include <net/netdev_rx_queue.h> 25 #include <net/page_pool/helpers.h> 26 #include <net/netlink.h> 27 #include <net/net_shaper.h> 28 #include <net/netdev_lock.h> 29 #include <net/pkt_cls.h> 30 #include <net/rtnetlink.h> 31 #include <net/udp_tunnel.h> 32 #include <net/busy_poll.h> 33 34 #include "netdevsim.h" 35 36 MODULE_IMPORT_NS("NETDEV_INTERNAL"); 37 38 #define NSIM_RING_SIZE 256 39 40 static void nsim_start_peer_tx_queue(struct net_device *dev, struct nsim_rq *rq) 41 { 42 struct netdevsim *ns = netdev_priv(dev); 43 struct net_device *peer_dev; 44 struct netdevsim *peer_ns; 45 struct netdev_queue *txq; 46 u16 idx; 47 48 idx = rq->napi.index; 49 rcu_read_lock(); 50 peer_ns = rcu_dereference(ns->peer); 51 if (!peer_ns) 52 goto out; 53 54 /* TX device */ 55 peer_dev = peer_ns->netdev; 56 if (dev->real_num_tx_queues != peer_dev->num_rx_queues) 57 goto out; 58 59 txq = netdev_get_tx_queue(peer_dev, idx); 60 if (!netif_tx_queue_stopped(txq)) 61 goto out; 62 63 netif_tx_wake_queue(txq); 64 out: 65 rcu_read_unlock(); 66 } 67 68 static void nsim_stop_tx_queue(struct net_device *tx_dev, 69 struct net_device *rx_dev, 70 struct nsim_rq *rq, 71 u16 idx) 72 { 73 /* If different queues size, do not stop, since it is not 74 * easy to find which TX queue is mapped here 75 */ 76 if (rx_dev->real_num_tx_queues != tx_dev->num_rx_queues) 77 return; 78 79 /* rq is the queue on the receive side */ 80 netif_subqueue_try_stop(tx_dev, idx, 81 NSIM_RING_SIZE - skb_queue_len(&rq->skb_queue), 82 NSIM_RING_SIZE / 2); 83 } 84 85 static int nsim_napi_rx(struct net_device *tx_dev, struct net_device *rx_dev, 86 struct nsim_rq *rq, struct sk_buff *skb) 87 { 88 if (skb_queue_len(&rq->skb_queue) > NSIM_RING_SIZE) { 89 dev_kfree_skb_any(skb); 90 return NET_RX_DROP; 91 } 92 93 skb_queue_tail(&rq->skb_queue, skb); 94 95 /* Stop the peer TX queue avoiding dropping packets later */ 96 if (skb_queue_len(&rq->skb_queue) >= NSIM_RING_SIZE) 97 nsim_stop_tx_queue(tx_dev, rx_dev, rq, 98 skb_get_queue_mapping(skb)); 99 100 return NET_RX_SUCCESS; 101 } 102 103 static int nsim_forward_skb(struct net_device *tx_dev, 104 struct net_device *rx_dev, 105 struct sk_buff *skb, 106 struct nsim_rq *rq, 107 struct skb_ext *psp_ext) 108 { 109 int ret; 110 111 ret = __dev_forward_skb(rx_dev, skb); 112 if (ret) 113 return ret; 114 115 nsim_psp_handle_ext(skb, psp_ext); 116 117 return nsim_napi_rx(tx_dev, rx_dev, rq, skb); 118 } 119 120 static netdev_tx_t nsim_start_xmit(struct sk_buff *skb, struct net_device *dev) 121 { 122 struct netdevsim *ns = netdev_priv(dev); 123 struct skb_ext *psp_ext = NULL; 124 struct net_device *peer_dev; 125 unsigned int len = skb->len; 126 struct netdevsim *peer_ns; 127 struct netdev_config *cfg; 128 struct nsim_rq *rq; 129 int rxq; 130 int dr; 131 132 rcu_read_lock(); 133 if (!nsim_ipsec_tx(ns, skb)) 134 goto out_drop_any; 135 136 peer_ns = rcu_dereference(ns->peer); 137 if (!peer_ns) 138 goto out_drop_any; 139 140 dr = nsim_do_psp(skb, ns, peer_ns, &psp_ext); 141 if (dr) 142 goto out_drop_free; 143 144 peer_dev = peer_ns->netdev; 145 rxq = skb_get_queue_mapping(skb); 146 if (rxq >= peer_dev->num_rx_queues) 147 rxq = rxq % peer_dev->num_rx_queues; 148 rq = peer_ns->rq[rxq]; 149 150 cfg = peer_dev->cfg; 151 if (skb_is_nonlinear(skb) && 152 (cfg->hds_config != ETHTOOL_TCP_DATA_SPLIT_ENABLED || 153 (cfg->hds_config == ETHTOOL_TCP_DATA_SPLIT_ENABLED && 154 cfg->hds_thresh > len))) 155 skb_linearize(skb); 156 157 skb_tx_timestamp(skb); 158 if (unlikely(nsim_forward_skb(dev, peer_dev, 159 skb, rq, psp_ext) == NET_RX_DROP)) 160 goto out_drop_cnt; 161 162 if (!hrtimer_active(&rq->napi_timer)) 163 hrtimer_start(&rq->napi_timer, us_to_ktime(5), HRTIMER_MODE_REL); 164 165 rcu_read_unlock(); 166 dev_dstats_tx_add(dev, len); 167 return NETDEV_TX_OK; 168 169 out_drop_any: 170 dr = SKB_DROP_REASON_NOT_SPECIFIED; 171 out_drop_free: 172 kfree_skb_reason(skb, dr); 173 out_drop_cnt: 174 rcu_read_unlock(); 175 dev_dstats_tx_dropped(dev); 176 return NETDEV_TX_OK; 177 } 178 179 static void nsim_set_rx_mode(struct net_device *dev) 180 { 181 } 182 183 static int nsim_change_mtu(struct net_device *dev, int new_mtu) 184 { 185 struct netdevsim *ns = netdev_priv(dev); 186 187 if (ns->xdp.prog && !ns->xdp.prog->aux->xdp_has_frags && 188 new_mtu > NSIM_XDP_MAX_MTU) 189 return -EBUSY; 190 191 WRITE_ONCE(dev->mtu, new_mtu); 192 193 return 0; 194 } 195 196 static int 197 nsim_setup_tc_block_cb(enum tc_setup_type type, void *type_data, void *cb_priv) 198 { 199 return nsim_bpf_setup_tc_block_cb(type, type_data, cb_priv); 200 } 201 202 static int nsim_set_vf_mac(struct net_device *dev, int vf, u8 *mac) 203 { 204 struct netdevsim *ns = netdev_priv(dev); 205 struct nsim_dev *nsim_dev = ns->nsim_dev; 206 207 /* Only refuse multicast addresses, zero address can mean unset/any. */ 208 if (vf >= nsim_dev_get_vfs(nsim_dev) || is_multicast_ether_addr(mac)) 209 return -EINVAL; 210 memcpy(nsim_dev->vfconfigs[vf].vf_mac, mac, ETH_ALEN); 211 212 return 0; 213 } 214 215 static int nsim_set_vf_vlan(struct net_device *dev, int vf, 216 u16 vlan, u8 qos, __be16 vlan_proto) 217 { 218 struct netdevsim *ns = netdev_priv(dev); 219 struct nsim_dev *nsim_dev = ns->nsim_dev; 220 221 if (vf >= nsim_dev_get_vfs(nsim_dev) || vlan > 4095 || qos > 7) 222 return -EINVAL; 223 224 nsim_dev->vfconfigs[vf].vlan = vlan; 225 nsim_dev->vfconfigs[vf].qos = qos; 226 nsim_dev->vfconfigs[vf].vlan_proto = vlan_proto; 227 228 return 0; 229 } 230 231 static int nsim_set_vf_rate(struct net_device *dev, int vf, int min, int max) 232 { 233 struct netdevsim *ns = netdev_priv(dev); 234 struct nsim_dev *nsim_dev = ns->nsim_dev; 235 236 if (nsim_esw_mode_is_switchdev(ns->nsim_dev)) { 237 pr_err("Not supported in switchdev mode. Please use devlink API.\n"); 238 return -EOPNOTSUPP; 239 } 240 241 if (vf >= nsim_dev_get_vfs(nsim_dev)) 242 return -EINVAL; 243 244 nsim_dev->vfconfigs[vf].min_tx_rate = min; 245 nsim_dev->vfconfigs[vf].max_tx_rate = max; 246 247 return 0; 248 } 249 250 static int nsim_set_vf_spoofchk(struct net_device *dev, int vf, bool val) 251 { 252 struct netdevsim *ns = netdev_priv(dev); 253 struct nsim_dev *nsim_dev = ns->nsim_dev; 254 255 if (vf >= nsim_dev_get_vfs(nsim_dev)) 256 return -EINVAL; 257 nsim_dev->vfconfigs[vf].spoofchk_enabled = val; 258 259 return 0; 260 } 261 262 static int nsim_set_vf_rss_query_en(struct net_device *dev, int vf, bool val) 263 { 264 struct netdevsim *ns = netdev_priv(dev); 265 struct nsim_dev *nsim_dev = ns->nsim_dev; 266 267 if (vf >= nsim_dev_get_vfs(nsim_dev)) 268 return -EINVAL; 269 nsim_dev->vfconfigs[vf].rss_query_enabled = val; 270 271 return 0; 272 } 273 274 static int nsim_set_vf_trust(struct net_device *dev, int vf, bool val) 275 { 276 struct netdevsim *ns = netdev_priv(dev); 277 struct nsim_dev *nsim_dev = ns->nsim_dev; 278 279 if (vf >= nsim_dev_get_vfs(nsim_dev)) 280 return -EINVAL; 281 nsim_dev->vfconfigs[vf].trusted = val; 282 283 return 0; 284 } 285 286 static int 287 nsim_get_vf_config(struct net_device *dev, int vf, struct ifla_vf_info *ivi) 288 { 289 struct netdevsim *ns = netdev_priv(dev); 290 struct nsim_dev *nsim_dev = ns->nsim_dev; 291 292 if (vf >= nsim_dev_get_vfs(nsim_dev)) 293 return -EINVAL; 294 295 ivi->vf = vf; 296 ivi->linkstate = nsim_dev->vfconfigs[vf].link_state; 297 ivi->min_tx_rate = nsim_dev->vfconfigs[vf].min_tx_rate; 298 ivi->max_tx_rate = nsim_dev->vfconfigs[vf].max_tx_rate; 299 ivi->vlan = nsim_dev->vfconfigs[vf].vlan; 300 ivi->vlan_proto = nsim_dev->vfconfigs[vf].vlan_proto; 301 ivi->qos = nsim_dev->vfconfigs[vf].qos; 302 memcpy(&ivi->mac, nsim_dev->vfconfigs[vf].vf_mac, ETH_ALEN); 303 ivi->spoofchk = nsim_dev->vfconfigs[vf].spoofchk_enabled; 304 ivi->trusted = nsim_dev->vfconfigs[vf].trusted; 305 ivi->rss_query_en = nsim_dev->vfconfigs[vf].rss_query_enabled; 306 307 return 0; 308 } 309 310 static int nsim_set_vf_link_state(struct net_device *dev, int vf, int state) 311 { 312 struct netdevsim *ns = netdev_priv(dev); 313 struct nsim_dev *nsim_dev = ns->nsim_dev; 314 315 if (vf >= nsim_dev_get_vfs(nsim_dev)) 316 return -EINVAL; 317 318 switch (state) { 319 case IFLA_VF_LINK_STATE_AUTO: 320 case IFLA_VF_LINK_STATE_ENABLE: 321 case IFLA_VF_LINK_STATE_DISABLE: 322 break; 323 default: 324 return -EINVAL; 325 } 326 327 nsim_dev->vfconfigs[vf].link_state = state; 328 329 return 0; 330 } 331 332 static void nsim_taprio_stats(struct tc_taprio_qopt_stats *stats) 333 { 334 stats->window_drops = 0; 335 stats->tx_overruns = 0; 336 } 337 338 static int nsim_setup_tc_taprio(struct net_device *dev, 339 struct tc_taprio_qopt_offload *offload) 340 { 341 int err = 0; 342 343 switch (offload->cmd) { 344 case TAPRIO_CMD_REPLACE: 345 case TAPRIO_CMD_DESTROY: 346 break; 347 case TAPRIO_CMD_STATS: 348 nsim_taprio_stats(&offload->stats); 349 break; 350 default: 351 err = -EOPNOTSUPP; 352 } 353 354 return err; 355 } 356 357 static LIST_HEAD(nsim_block_cb_list); 358 359 static int 360 nsim_setup_tc(struct net_device *dev, enum tc_setup_type type, void *type_data) 361 { 362 struct netdevsim *ns = netdev_priv(dev); 363 364 switch (type) { 365 case TC_SETUP_QDISC_TAPRIO: 366 return nsim_setup_tc_taprio(dev, type_data); 367 case TC_SETUP_BLOCK: 368 return flow_block_cb_setup_simple(type_data, 369 &nsim_block_cb_list, 370 nsim_setup_tc_block_cb, 371 ns, ns, true); 372 default: 373 return -EOPNOTSUPP; 374 } 375 } 376 377 static int 378 nsim_set_features(struct net_device *dev, netdev_features_t features) 379 { 380 struct netdevsim *ns = netdev_priv(dev); 381 382 if ((dev->features & NETIF_F_HW_TC) > (features & NETIF_F_HW_TC)) 383 return nsim_bpf_disable_tc(ns); 384 385 return 0; 386 } 387 388 static int nsim_get_iflink(const struct net_device *dev) 389 { 390 struct netdevsim *nsim, *peer; 391 int iflink; 392 393 nsim = netdev_priv(dev); 394 395 rcu_read_lock(); 396 peer = rcu_dereference(nsim->peer); 397 iflink = peer ? READ_ONCE(peer->netdev->ifindex) : 398 READ_ONCE(dev->ifindex); 399 rcu_read_unlock(); 400 401 return iflink; 402 } 403 404 static int nsim_rcv(struct nsim_rq *rq, int budget) 405 { 406 struct net_device *dev = rq->napi.dev; 407 struct bpf_prog *xdp_prog; 408 struct netdevsim *ns; 409 struct sk_buff *skb; 410 unsigned int skblen; 411 int i, ret; 412 413 ns = netdev_priv(dev); 414 xdp_prog = READ_ONCE(ns->xdp.prog); 415 416 for (i = 0; i < budget; i++) { 417 if (skb_queue_empty(&rq->skb_queue)) 418 break; 419 420 skb = skb_dequeue(&rq->skb_queue); 421 422 if (xdp_prog) { 423 /* skb might be freed directly by XDP, save the len */ 424 skblen = skb->len; 425 426 if (skb->ip_summed == CHECKSUM_PARTIAL) 427 skb_checksum_help(skb); 428 ret = do_xdp_generic(xdp_prog, &skb); 429 if (ret != XDP_PASS) { 430 dev_dstats_rx_add(dev, skblen); 431 continue; 432 } 433 } 434 435 /* skb might be discard at netif_receive_skb, save the len */ 436 skblen = skb->len; 437 skb_mark_napi_id(skb, &rq->napi); 438 ret = netif_receive_skb(skb); 439 if (ret == NET_RX_SUCCESS) 440 dev_dstats_rx_add(dev, skblen); 441 else 442 dev_dstats_rx_dropped(dev); 443 } 444 445 nsim_start_peer_tx_queue(dev, rq); 446 return i; 447 } 448 449 static int nsim_poll(struct napi_struct *napi, int budget) 450 { 451 struct nsim_rq *rq = container_of(napi, struct nsim_rq, napi); 452 int done; 453 454 done = nsim_rcv(rq, budget); 455 if (done < budget) 456 napi_complete_done(napi, done); 457 458 return done; 459 } 460 461 static int nsim_create_page_pool(struct page_pool **p, struct napi_struct *napi) 462 { 463 struct page_pool_params params = { 464 .order = 0, 465 .pool_size = NSIM_RING_SIZE, 466 .nid = NUMA_NO_NODE, 467 .dev = &napi->dev->dev, 468 .napi = napi, 469 .dma_dir = DMA_BIDIRECTIONAL, 470 .netdev = napi->dev, 471 }; 472 struct page_pool *pool; 473 474 pool = page_pool_create(¶ms); 475 if (IS_ERR(pool)) 476 return PTR_ERR(pool); 477 478 *p = pool; 479 return 0; 480 } 481 482 static int nsim_init_napi(struct netdevsim *ns) 483 { 484 struct net_device *dev = ns->netdev; 485 struct nsim_rq *rq; 486 int err, i; 487 488 for (i = 0; i < dev->num_rx_queues; i++) { 489 rq = ns->rq[i]; 490 491 netif_napi_add_config_locked(dev, &rq->napi, nsim_poll, i); 492 } 493 494 for (i = 0; i < dev->num_rx_queues; i++) { 495 rq = ns->rq[i]; 496 497 err = nsim_create_page_pool(&rq->page_pool, &rq->napi); 498 if (err) 499 goto err_pp_destroy; 500 } 501 502 return 0; 503 504 err_pp_destroy: 505 while (i--) { 506 page_pool_destroy(ns->rq[i]->page_pool); 507 ns->rq[i]->page_pool = NULL; 508 } 509 510 for (i = 0; i < dev->num_rx_queues; i++) 511 __netif_napi_del_locked(&ns->rq[i]->napi); 512 513 return err; 514 } 515 516 static enum hrtimer_restart nsim_napi_schedule(struct hrtimer *timer) 517 { 518 struct nsim_rq *rq; 519 520 rq = container_of(timer, struct nsim_rq, napi_timer); 521 napi_schedule(&rq->napi); 522 523 return HRTIMER_NORESTART; 524 } 525 526 static void nsim_rq_timer_init(struct nsim_rq *rq) 527 { 528 hrtimer_setup(&rq->napi_timer, nsim_napi_schedule, CLOCK_MONOTONIC, 529 HRTIMER_MODE_REL); 530 } 531 532 static void nsim_enable_napi(struct netdevsim *ns) 533 { 534 struct net_device *dev = ns->netdev; 535 int i; 536 537 for (i = 0; i < dev->num_rx_queues; i++) { 538 struct nsim_rq *rq = ns->rq[i]; 539 540 netif_queue_set_napi(dev, i, NETDEV_QUEUE_TYPE_RX, &rq->napi); 541 napi_enable_locked(&rq->napi); 542 } 543 } 544 545 static int nsim_open(struct net_device *dev) 546 { 547 struct netdevsim *ns = netdev_priv(dev); 548 struct netdevsim *peer; 549 int err; 550 551 netdev_assert_locked(dev); 552 553 err = nsim_init_napi(ns); 554 if (err) 555 return err; 556 557 nsim_enable_napi(ns); 558 559 peer = rtnl_dereference(ns->peer); 560 if (peer && netif_running(peer->netdev)) { 561 netif_carrier_on(dev); 562 netif_carrier_on(peer->netdev); 563 } 564 565 return 0; 566 } 567 568 static void nsim_del_napi(struct netdevsim *ns) 569 { 570 struct net_device *dev = ns->netdev; 571 int i; 572 573 for (i = 0; i < dev->num_rx_queues; i++) { 574 struct nsim_rq *rq = ns->rq[i]; 575 576 napi_disable_locked(&rq->napi); 577 __netif_napi_del_locked(&rq->napi); 578 } 579 synchronize_net(); 580 581 for (i = 0; i < dev->num_rx_queues; i++) { 582 page_pool_destroy(ns->rq[i]->page_pool); 583 ns->rq[i]->page_pool = NULL; 584 } 585 } 586 587 static int nsim_stop(struct net_device *dev) 588 { 589 struct netdevsim *ns = netdev_priv(dev); 590 struct netdevsim *peer; 591 592 netdev_assert_locked(dev); 593 594 netif_carrier_off(dev); 595 peer = rtnl_dereference(ns->peer); 596 if (peer) 597 netif_carrier_off(peer->netdev); 598 599 nsim_del_napi(ns); 600 601 return 0; 602 } 603 604 static int nsim_shaper_set(struct net_shaper_binding *binding, 605 const struct net_shaper *shaper, 606 struct netlink_ext_ack *extack) 607 { 608 return 0; 609 } 610 611 static int nsim_shaper_del(struct net_shaper_binding *binding, 612 const struct net_shaper_handle *handle, 613 struct netlink_ext_ack *extack) 614 { 615 return 0; 616 } 617 618 static int nsim_shaper_group(struct net_shaper_binding *binding, 619 int leaves_count, 620 const struct net_shaper *leaves, 621 const struct net_shaper *root, 622 struct netlink_ext_ack *extack) 623 { 624 return 0; 625 } 626 627 static void nsim_shaper_cap(struct net_shaper_binding *binding, 628 enum net_shaper_scope scope, 629 unsigned long *flags) 630 { 631 *flags = ULONG_MAX; 632 } 633 634 static const struct net_shaper_ops nsim_shaper_ops = { 635 .set = nsim_shaper_set, 636 .delete = nsim_shaper_del, 637 .group = nsim_shaper_group, 638 .capabilities = nsim_shaper_cap, 639 }; 640 641 static const struct net_device_ops nsim_netdev_ops = { 642 .ndo_start_xmit = nsim_start_xmit, 643 .ndo_set_rx_mode = nsim_set_rx_mode, 644 .ndo_set_mac_address = eth_mac_addr, 645 .ndo_validate_addr = eth_validate_addr, 646 .ndo_change_mtu = nsim_change_mtu, 647 .ndo_set_vf_mac = nsim_set_vf_mac, 648 .ndo_set_vf_vlan = nsim_set_vf_vlan, 649 .ndo_set_vf_rate = nsim_set_vf_rate, 650 .ndo_set_vf_spoofchk = nsim_set_vf_spoofchk, 651 .ndo_set_vf_trust = nsim_set_vf_trust, 652 .ndo_get_vf_config = nsim_get_vf_config, 653 .ndo_set_vf_link_state = nsim_set_vf_link_state, 654 .ndo_set_vf_rss_query_en = nsim_set_vf_rss_query_en, 655 .ndo_setup_tc = nsim_setup_tc, 656 .ndo_set_features = nsim_set_features, 657 .ndo_get_iflink = nsim_get_iflink, 658 .ndo_bpf = nsim_bpf, 659 .ndo_open = nsim_open, 660 .ndo_stop = nsim_stop, 661 .net_shaper_ops = &nsim_shaper_ops, 662 }; 663 664 static const struct net_device_ops nsim_vf_netdev_ops = { 665 .ndo_start_xmit = nsim_start_xmit, 666 .ndo_set_rx_mode = nsim_set_rx_mode, 667 .ndo_set_mac_address = eth_mac_addr, 668 .ndo_validate_addr = eth_validate_addr, 669 .ndo_change_mtu = nsim_change_mtu, 670 .ndo_setup_tc = nsim_setup_tc, 671 .ndo_set_features = nsim_set_features, 672 }; 673 674 /* We don't have true per-queue stats, yet, so do some random fakery here. 675 * Only report stuff for queue 0. 676 */ 677 static void nsim_get_queue_stats_rx(struct net_device *dev, int idx, 678 struct netdev_queue_stats_rx *stats) 679 { 680 struct rtnl_link_stats64 rtstats = {}; 681 682 if (!idx) 683 dev_get_stats(dev, &rtstats); 684 685 stats->packets = rtstats.rx_packets - !!rtstats.rx_packets; 686 stats->bytes = rtstats.rx_bytes; 687 } 688 689 static void nsim_get_queue_stats_tx(struct net_device *dev, int idx, 690 struct netdev_queue_stats_tx *stats) 691 { 692 struct rtnl_link_stats64 rtstats = {}; 693 694 if (!idx) 695 dev_get_stats(dev, &rtstats); 696 697 stats->packets = rtstats.tx_packets - !!rtstats.tx_packets; 698 stats->bytes = rtstats.tx_bytes; 699 } 700 701 static void nsim_get_base_stats(struct net_device *dev, 702 struct netdev_queue_stats_rx *rx, 703 struct netdev_queue_stats_tx *tx) 704 { 705 struct rtnl_link_stats64 rtstats = {}; 706 707 dev_get_stats(dev, &rtstats); 708 709 rx->packets = !!rtstats.rx_packets; 710 rx->bytes = 0; 711 tx->packets = !!rtstats.tx_packets; 712 tx->bytes = 0; 713 } 714 715 static const struct netdev_stat_ops nsim_stat_ops = { 716 .get_queue_stats_tx = nsim_get_queue_stats_tx, 717 .get_queue_stats_rx = nsim_get_queue_stats_rx, 718 .get_base_stats = nsim_get_base_stats, 719 }; 720 721 static struct nsim_rq *nsim_queue_alloc(void) 722 { 723 struct nsim_rq *rq; 724 725 rq = kzalloc(sizeof(*rq), GFP_KERNEL_ACCOUNT); 726 if (!rq) 727 return NULL; 728 729 skb_queue_head_init(&rq->skb_queue); 730 nsim_rq_timer_init(rq); 731 return rq; 732 } 733 734 static void nsim_queue_free(struct net_device *dev, struct nsim_rq *rq) 735 { 736 hrtimer_cancel(&rq->napi_timer); 737 738 if (rq->skb_queue.qlen) { 739 local_bh_disable(); 740 dev_dstats_rx_dropped_add(dev, rq->skb_queue.qlen); 741 local_bh_enable(); 742 } 743 744 skb_queue_purge_reason(&rq->skb_queue, SKB_DROP_REASON_QUEUE_PURGE); 745 kfree(rq); 746 } 747 748 /* Queue reset mode is controlled by ns->rq_reset_mode. 749 * - normal - new NAPI new pool (old NAPI enabled when new added) 750 * - mode 1 - allocate new pool (NAPI is only disabled / enabled) 751 * - mode 2 - new NAPI new pool (old NAPI removed before new added) 752 * - mode 3 - new NAPI new pool (old NAPI disabled when new added) 753 */ 754 struct nsim_queue_mem { 755 struct nsim_rq *rq; 756 struct page_pool *pp; 757 }; 758 759 static int 760 nsim_queue_mem_alloc(struct net_device *dev, void *per_queue_mem, int idx) 761 { 762 struct nsim_queue_mem *qmem = per_queue_mem; 763 struct netdevsim *ns = netdev_priv(dev); 764 int err; 765 766 if (ns->rq_reset_mode > 3) 767 return -EINVAL; 768 769 if (ns->rq_reset_mode == 1) { 770 if (!netif_running(ns->netdev)) 771 return -ENETDOWN; 772 return nsim_create_page_pool(&qmem->pp, &ns->rq[idx]->napi); 773 } 774 775 qmem->rq = nsim_queue_alloc(); 776 if (!qmem->rq) 777 return -ENOMEM; 778 779 err = nsim_create_page_pool(&qmem->rq->page_pool, &qmem->rq->napi); 780 if (err) 781 goto err_free; 782 783 if (!ns->rq_reset_mode) 784 netif_napi_add_config_locked(dev, &qmem->rq->napi, nsim_poll, 785 idx); 786 787 return 0; 788 789 err_free: 790 nsim_queue_free(dev, qmem->rq); 791 return err; 792 } 793 794 static void nsim_queue_mem_free(struct net_device *dev, void *per_queue_mem) 795 { 796 struct nsim_queue_mem *qmem = per_queue_mem; 797 struct netdevsim *ns = netdev_priv(dev); 798 799 page_pool_destroy(qmem->pp); 800 if (qmem->rq) { 801 if (!ns->rq_reset_mode) 802 netif_napi_del_locked(&qmem->rq->napi); 803 page_pool_destroy(qmem->rq->page_pool); 804 nsim_queue_free(dev, qmem->rq); 805 } 806 } 807 808 static int 809 nsim_queue_start(struct net_device *dev, void *per_queue_mem, int idx) 810 { 811 struct nsim_queue_mem *qmem = per_queue_mem; 812 struct netdevsim *ns = netdev_priv(dev); 813 814 netdev_assert_locked(dev); 815 816 if (ns->rq_reset_mode == 1) { 817 ns->rq[idx]->page_pool = qmem->pp; 818 napi_enable_locked(&ns->rq[idx]->napi); 819 return 0; 820 } 821 822 /* netif_napi_add()/_del() should normally be called from alloc/free, 823 * here we want to test various call orders. 824 */ 825 if (ns->rq_reset_mode == 2) { 826 netif_napi_del_locked(&ns->rq[idx]->napi); 827 netif_napi_add_config_locked(dev, &qmem->rq->napi, nsim_poll, 828 idx); 829 } else if (ns->rq_reset_mode == 3) { 830 netif_napi_add_config_locked(dev, &qmem->rq->napi, nsim_poll, 831 idx); 832 netif_napi_del_locked(&ns->rq[idx]->napi); 833 } 834 835 ns->rq[idx] = qmem->rq; 836 napi_enable_locked(&ns->rq[idx]->napi); 837 838 return 0; 839 } 840 841 static int nsim_queue_stop(struct net_device *dev, void *per_queue_mem, int idx) 842 { 843 struct nsim_queue_mem *qmem = per_queue_mem; 844 struct netdevsim *ns = netdev_priv(dev); 845 846 netdev_assert_locked(dev); 847 848 napi_disable_locked(&ns->rq[idx]->napi); 849 850 if (ns->rq_reset_mode == 1) { 851 qmem->pp = ns->rq[idx]->page_pool; 852 page_pool_disable_direct_recycling(qmem->pp); 853 } else { 854 qmem->rq = ns->rq[idx]; 855 } 856 857 return 0; 858 } 859 860 static const struct netdev_queue_mgmt_ops nsim_queue_mgmt_ops = { 861 .ndo_queue_mem_size = sizeof(struct nsim_queue_mem), 862 .ndo_queue_mem_alloc = nsim_queue_mem_alloc, 863 .ndo_queue_mem_free = nsim_queue_mem_free, 864 .ndo_queue_start = nsim_queue_start, 865 .ndo_queue_stop = nsim_queue_stop, 866 }; 867 868 static ssize_t 869 nsim_qreset_write(struct file *file, const char __user *data, 870 size_t count, loff_t *ppos) 871 { 872 struct netdevsim *ns = file->private_data; 873 unsigned int queue, mode; 874 char buf[32]; 875 ssize_t ret; 876 877 if (count >= sizeof(buf)) 878 return -EINVAL; 879 if (copy_from_user(buf, data, count)) 880 return -EFAULT; 881 buf[count] = '\0'; 882 883 ret = sscanf(buf, "%u %u", &queue, &mode); 884 if (ret != 2) 885 return -EINVAL; 886 887 netdev_lock(ns->netdev); 888 if (queue >= ns->netdev->real_num_rx_queues) { 889 ret = -EINVAL; 890 goto exit_unlock; 891 } 892 893 ns->rq_reset_mode = mode; 894 ret = netdev_rx_queue_restart(ns->netdev, queue); 895 ns->rq_reset_mode = 0; 896 if (ret) 897 goto exit_unlock; 898 899 ret = count; 900 exit_unlock: 901 netdev_unlock(ns->netdev); 902 return ret; 903 } 904 905 static const struct file_operations nsim_qreset_fops = { 906 .open = simple_open, 907 .write = nsim_qreset_write, 908 .owner = THIS_MODULE, 909 }; 910 911 static ssize_t 912 nsim_pp_hold_read(struct file *file, char __user *data, 913 size_t count, loff_t *ppos) 914 { 915 struct netdevsim *ns = file->private_data; 916 char buf[3] = "n\n"; 917 918 if (ns->page) 919 buf[0] = 'y'; 920 921 return simple_read_from_buffer(data, count, ppos, buf, 2); 922 } 923 924 static ssize_t 925 nsim_pp_hold_write(struct file *file, const char __user *data, 926 size_t count, loff_t *ppos) 927 { 928 struct netdevsim *ns = file->private_data; 929 ssize_t ret; 930 bool val; 931 932 ret = kstrtobool_from_user(data, count, &val); 933 if (ret) 934 return ret; 935 936 rtnl_lock(); 937 ret = count; 938 if (val == !!ns->page) 939 goto exit; 940 941 if (!netif_running(ns->netdev) && val) { 942 ret = -ENETDOWN; 943 } else if (val) { 944 ns->page = page_pool_dev_alloc_pages(ns->rq[0]->page_pool); 945 if (!ns->page) 946 ret = -ENOMEM; 947 } else { 948 page_pool_put_full_page(pp_page_to_nmdesc(ns->page)->pp, 949 ns->page, false); 950 ns->page = NULL; 951 } 952 953 exit: 954 rtnl_unlock(); 955 return ret; 956 } 957 958 static const struct file_operations nsim_pp_hold_fops = { 959 .open = simple_open, 960 .read = nsim_pp_hold_read, 961 .write = nsim_pp_hold_write, 962 .llseek = generic_file_llseek, 963 .owner = THIS_MODULE, 964 }; 965 966 static void nsim_setup(struct net_device *dev) 967 { 968 ether_setup(dev); 969 eth_hw_addr_random(dev); 970 971 dev->flags &= ~IFF_MULTICAST; 972 dev->priv_flags |= IFF_LIVE_ADDR_CHANGE; 973 dev->features |= NETIF_F_HIGHDMA | 974 NETIF_F_SG | 975 NETIF_F_FRAGLIST | 976 NETIF_F_HW_CSUM | 977 NETIF_F_LRO | 978 NETIF_F_TSO; 979 dev->hw_features |= NETIF_F_HW_TC | 980 NETIF_F_SG | 981 NETIF_F_FRAGLIST | 982 NETIF_F_HW_CSUM | 983 NETIF_F_LRO | 984 NETIF_F_TSO; 985 dev->pcpu_stat_type = NETDEV_PCPU_STAT_DSTATS; 986 dev->max_mtu = ETH_MAX_MTU; 987 dev->xdp_features = NETDEV_XDP_ACT_BASIC | NETDEV_XDP_ACT_HW_OFFLOAD; 988 } 989 990 static int nsim_queue_init(struct netdevsim *ns) 991 { 992 struct net_device *dev = ns->netdev; 993 int i; 994 995 ns->rq = kcalloc(dev->num_rx_queues, sizeof(*ns->rq), 996 GFP_KERNEL_ACCOUNT); 997 if (!ns->rq) 998 return -ENOMEM; 999 1000 for (i = 0; i < dev->num_rx_queues; i++) { 1001 ns->rq[i] = nsim_queue_alloc(); 1002 if (!ns->rq[i]) 1003 goto err_free_prev; 1004 } 1005 1006 return 0; 1007 1008 err_free_prev: 1009 while (i--) 1010 kfree(ns->rq[i]); 1011 kfree(ns->rq); 1012 return -ENOMEM; 1013 } 1014 1015 static void nsim_queue_uninit(struct netdevsim *ns) 1016 { 1017 struct net_device *dev = ns->netdev; 1018 int i; 1019 1020 for (i = 0; i < dev->num_rx_queues; i++) 1021 nsim_queue_free(dev, ns->rq[i]); 1022 1023 kfree(ns->rq); 1024 ns->rq = NULL; 1025 } 1026 1027 static int nsim_init_netdevsim(struct netdevsim *ns) 1028 { 1029 struct netdevsim *peer; 1030 struct mock_phc *phc; 1031 int err; 1032 1033 phc = mock_phc_create(&ns->nsim_bus_dev->dev); 1034 if (IS_ERR(phc)) 1035 return PTR_ERR(phc); 1036 1037 ns->phc = phc; 1038 ns->netdev->netdev_ops = &nsim_netdev_ops; 1039 ns->netdev->stat_ops = &nsim_stat_ops; 1040 ns->netdev->queue_mgmt_ops = &nsim_queue_mgmt_ops; 1041 netdev_lockdep_set_classes(ns->netdev); 1042 1043 err = nsim_udp_tunnels_info_create(ns->nsim_dev, ns->netdev); 1044 if (err) 1045 goto err_phc_destroy; 1046 1047 rtnl_lock(); 1048 err = nsim_queue_init(ns); 1049 if (err) 1050 goto err_utn_destroy; 1051 1052 err = nsim_bpf_init(ns); 1053 if (err) 1054 goto err_rq_destroy; 1055 1056 nsim_macsec_init(ns); 1057 nsim_ipsec_init(ns); 1058 1059 err = register_netdevice(ns->netdev); 1060 if (err) 1061 goto err_ipsec_teardown; 1062 rtnl_unlock(); 1063 1064 err = nsim_psp_init(ns); 1065 if (err) 1066 goto err_unregister_netdev; 1067 1068 if (IS_ENABLED(CONFIG_DEBUG_NET)) { 1069 ns->nb.notifier_call = netdev_debug_event; 1070 if (register_netdevice_notifier_dev_net(ns->netdev, &ns->nb, 1071 &ns->nn)) 1072 ns->nb.notifier_call = NULL; 1073 } 1074 1075 return 0; 1076 1077 err_unregister_netdev: 1078 rtnl_lock(); 1079 peer = rtnl_dereference(ns->peer); 1080 if (peer) 1081 RCU_INIT_POINTER(peer->peer, NULL); 1082 RCU_INIT_POINTER(ns->peer, NULL); 1083 unregister_netdevice(ns->netdev); 1084 err_ipsec_teardown: 1085 nsim_ipsec_teardown(ns); 1086 nsim_macsec_teardown(ns); 1087 nsim_bpf_uninit(ns); 1088 err_rq_destroy: 1089 nsim_queue_uninit(ns); 1090 err_utn_destroy: 1091 rtnl_unlock(); 1092 nsim_udp_tunnels_info_destroy(ns->netdev); 1093 err_phc_destroy: 1094 mock_phc_destroy(ns->phc); 1095 return err; 1096 } 1097 1098 static int nsim_init_netdevsim_vf(struct netdevsim *ns) 1099 { 1100 int err; 1101 1102 ns->netdev->netdev_ops = &nsim_vf_netdev_ops; 1103 rtnl_lock(); 1104 err = register_netdevice(ns->netdev); 1105 rtnl_unlock(); 1106 return err; 1107 } 1108 1109 static void nsim_exit_netdevsim(struct netdevsim *ns) 1110 { 1111 nsim_udp_tunnels_info_destroy(ns->netdev); 1112 mock_phc_destroy(ns->phc); 1113 } 1114 1115 struct netdevsim *nsim_create(struct nsim_dev *nsim_dev, 1116 struct nsim_dev_port *nsim_dev_port, 1117 u8 perm_addr[ETH_ALEN]) 1118 { 1119 struct net_device *dev; 1120 struct netdevsim *ns; 1121 int err; 1122 1123 dev = alloc_netdev_mq(sizeof(*ns), "eth%d", NET_NAME_UNKNOWN, nsim_setup, 1124 nsim_dev->nsim_bus_dev->num_queues); 1125 if (!dev) 1126 return ERR_PTR(-ENOMEM); 1127 1128 if (perm_addr) 1129 memcpy(dev->perm_addr, perm_addr, ETH_ALEN); 1130 1131 dev_net_set(dev, nsim_dev_net(nsim_dev)); 1132 ns = netdev_priv(dev); 1133 ns->netdev = dev; 1134 ns->nsim_dev = nsim_dev; 1135 ns->nsim_dev_port = nsim_dev_port; 1136 ns->nsim_bus_dev = nsim_dev->nsim_bus_dev; 1137 SET_NETDEV_DEV(dev, &ns->nsim_bus_dev->dev); 1138 SET_NETDEV_DEVLINK_PORT(dev, &nsim_dev_port->devlink_port); 1139 nsim_ethtool_init(ns); 1140 if (nsim_dev_port_is_pf(nsim_dev_port)) 1141 err = nsim_init_netdevsim(ns); 1142 else 1143 err = nsim_init_netdevsim_vf(ns); 1144 if (err) 1145 goto err_free_netdev; 1146 1147 ns->pp_dfs = debugfs_create_file("pp_hold", 0600, nsim_dev_port->ddir, 1148 ns, &nsim_pp_hold_fops); 1149 ns->qr_dfs = debugfs_create_file("queue_reset", 0200, 1150 nsim_dev_port->ddir, ns, 1151 &nsim_qreset_fops); 1152 return ns; 1153 1154 err_free_netdev: 1155 free_netdev(dev); 1156 return ERR_PTR(err); 1157 } 1158 1159 void nsim_destroy(struct netdevsim *ns) 1160 { 1161 struct net_device *dev = ns->netdev; 1162 struct netdevsim *peer; 1163 1164 debugfs_remove(ns->qr_dfs); 1165 debugfs_remove(ns->pp_dfs); 1166 1167 if (ns->nb.notifier_call) 1168 unregister_netdevice_notifier_dev_net(ns->netdev, &ns->nb, 1169 &ns->nn); 1170 1171 nsim_psp_uninit(ns); 1172 1173 rtnl_lock(); 1174 peer = rtnl_dereference(ns->peer); 1175 if (peer) 1176 RCU_INIT_POINTER(peer->peer, NULL); 1177 RCU_INIT_POINTER(ns->peer, NULL); 1178 unregister_netdevice(dev); 1179 if (nsim_dev_port_is_pf(ns->nsim_dev_port)) { 1180 nsim_macsec_teardown(ns); 1181 nsim_ipsec_teardown(ns); 1182 nsim_bpf_uninit(ns); 1183 nsim_queue_uninit(ns); 1184 } 1185 rtnl_unlock(); 1186 if (nsim_dev_port_is_pf(ns->nsim_dev_port)) 1187 nsim_exit_netdevsim(ns); 1188 1189 /* Put this intentionally late to exercise the orphaning path */ 1190 if (ns->page) { 1191 page_pool_put_full_page(pp_page_to_nmdesc(ns->page)->pp, 1192 ns->page, false); 1193 ns->page = NULL; 1194 } 1195 1196 free_netdev(dev); 1197 } 1198 1199 bool netdev_is_nsim(struct net_device *dev) 1200 { 1201 return dev->netdev_ops == &nsim_netdev_ops; 1202 } 1203 1204 static int nsim_validate(struct nlattr *tb[], struct nlattr *data[], 1205 struct netlink_ext_ack *extack) 1206 { 1207 NL_SET_ERR_MSG_MOD(extack, 1208 "Please use: echo \"[ID] [PORT_COUNT] [NUM_QUEUES]\" > /sys/bus/netdevsim/new_device"); 1209 return -EOPNOTSUPP; 1210 } 1211 1212 static struct rtnl_link_ops nsim_link_ops __read_mostly = { 1213 .kind = DRV_NAME, 1214 .validate = nsim_validate, 1215 }; 1216 1217 static int __init nsim_module_init(void) 1218 { 1219 int err; 1220 1221 err = nsim_dev_init(); 1222 if (err) 1223 return err; 1224 1225 err = nsim_bus_init(); 1226 if (err) 1227 goto err_dev_exit; 1228 1229 err = rtnl_link_register(&nsim_link_ops); 1230 if (err) 1231 goto err_bus_exit; 1232 1233 return 0; 1234 1235 err_bus_exit: 1236 nsim_bus_exit(); 1237 err_dev_exit: 1238 nsim_dev_exit(); 1239 return err; 1240 } 1241 1242 static void __exit nsim_module_exit(void) 1243 { 1244 rtnl_link_unregister(&nsim_link_ops); 1245 nsim_bus_exit(); 1246 nsim_dev_exit(); 1247 } 1248 1249 module_init(nsim_module_init); 1250 module_exit(nsim_module_exit); 1251 MODULE_LICENSE("GPL"); 1252 MODULE_DESCRIPTION("Simulated networking device for testing"); 1253 MODULE_ALIAS_RTNL_LINK(DRV_NAME); 1254