/*
 * Copyright (C) 2017 Netronome Systems, Inc.
 *
 * This software is licensed under the GNU General Public License Version 2,
 * June 1991 as shown in the file COPYING in the top-level directory of this
 * source tree.
 *
 * THE COPYRIGHT HOLDERS AND/OR OTHER PARTIES PROVIDE THE PROGRAM "AS IS"
 * WITHOUT WARRANTY OF ANY KIND, EITHER EXPRESSED OR IMPLIED, INCLUDING,
 * BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
 * FOR A PARTICULAR PURPOSE. THE ENTIRE RISK AS TO THE QUALITY AND PERFORMANCE
 * OF THE PROGRAM IS WITH YOU. SHOULD THE PROGRAM PROVE DEFECTIVE, YOU ASSUME
 * THE COST OF ALL NECESSARY SERVICING, REPAIR OR CORRECTION.
 */

#include <linux/debugfs.h>
#include <linux/etherdevice.h>
#include <linux/ethtool_netlink.h>
#include <linux/kernel.h>
#include <linux/module.h>
#include <linux/netdevice.h>
#include <linux/slab.h>
#include <net/netdev_queues.h>
#include <net/netdev_rx_queue.h>
#include <net/page_pool/helpers.h>
#include <net/netlink.h>
#include <net/net_shaper.h>
#include <net/netdev_lock.h>
#include <net/pkt_cls.h>
#include <net/rtnetlink.h>
#include <net/udp_tunnel.h>
#include <net/busy_poll.h>

#include "netdevsim.h"

MODULE_IMPORT_NS("NETDEV_INTERNAL");

#define NSIM_RING_SIZE 256

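/* Wake the TX queue of the same index on the peer once this RX queue has
 * drained; only done when the queue counts match, so the RX-to-TX queue
 * mapping is unambiguous.
 */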
static void nsim_start_peer_tx_queue(struct net_device *dev, struct nsim_rq *rq)
{
	struct netdevsim *ns = netdev_priv(dev);
	struct net_device *peer_dev;
	struct netdevsim *peer_ns;
	struct netdev_queue *txq;
	u16 idx;

	idx = rq->napi.index;
	rcu_read_lock();
	peer_ns = rcu_dereference(ns->peer);
	if (!peer_ns)
		goto out;

	/* TX device */
	peer_dev = peer_ns->netdev;
	if (dev->real_num_tx_queues != peer_dev->num_rx_queues)
		goto out;

	txq = netdev_get_tx_queue(peer_dev, idx);
	if (!netif_tx_queue_stopped(txq))
		goto out;

	netif_tx_wake_queue(txq);
out:
	rcu_read_unlock();
}

static void nsim_stop_tx_queue(struct net_device *tx_dev,
			       struct net_device *rx_dev,
			       struct nsim_rq *rq,
			       u16 idx)
{
	/* If the queue counts differ, do not stop the TX queue, since it is
	 * not easy to find which TX queue is mapped here.
	 */
	if (rx_dev->real_num_tx_queues != tx_dev->num_rx_queues)
		return;

	/* rq is the queue on the receive side */
	netif_subqueue_try_stop(tx_dev, idx,
				NSIM_RING_SIZE - skb_queue_len(&rq->skb_queue),
				NSIM_RING_SIZE / 2);
}

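/* Emulate receive: queue the skb on the receiving side's ring and apply
 * backpressure by stopping the peer's TX queue once the ring fills up.
 */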
static int nsim_napi_rx(struct net_device *tx_dev, struct net_device *rx_dev,
			struct nsim_rq *rq, struct sk_buff *skb)
{
	if (skb_queue_len(&rq->skb_queue) > NSIM_RING_SIZE) {
		dev_kfree_skb_any(skb);
		return NET_RX_DROP;
	}

	skb_queue_tail(&rq->skb_queue, skb);

	/* Stop the peer TX queue to avoid dropping packets later */
	if (skb_queue_len(&rq->skb_queue) >= NSIM_RING_SIZE)
		nsim_stop_tx_queue(tx_dev, rx_dev, rq,
				   skb_get_queue_mapping(skb));

	return NET_RX_SUCCESS;
}

static int nsim_forward_skb(struct net_device *tx_dev,
			    struct net_device *rx_dev,
			    struct sk_buff *skb,
			    struct nsim_rq *rq,
			    struct skb_ext *psp_ext)
{
	int ret;

	ret = __dev_forward_skb(rx_dev, skb);
	if (ret)
		return ret;

	nsim_psp_handle_ext(skb, psp_ext);

	return nsim_napi_rx(tx_dev, rx_dev, rq, skb);
}

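/* TX path: deliver the skb straight to the peer device's RX queue and
 * kick the peer's NAPI after a short delay via the per-queue hrtimer.
 */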
static netdev_tx_t nsim_start_xmit(struct sk_buff *skb, struct net_device *dev)
{
	struct netdevsim *ns = netdev_priv(dev);
	struct skb_ext *psp_ext = NULL;
	struct net_device *peer_dev;
	unsigned int len = skb->len;
	struct netdevsim *peer_ns;
	struct netdev_config *cfg;
	struct nsim_rq *rq;
	int rxq;
	int dr;

	rcu_read_lock();
	if (!nsim_ipsec_tx(ns, skb))
		goto out_drop_any;

	peer_ns = rcu_dereference(ns->peer);
	if (!peer_ns)
		goto out_drop_any;

	dr = nsim_do_psp(skb, ns, peer_ns, &psp_ext);
	if (dr)
		goto out_drop_free;

	peer_dev = peer_ns->netdev;
	rxq = skb_get_queue_mapping(skb);
	if (rxq >= peer_dev->num_rx_queues)
		rxq = rxq % peer_dev->num_rx_queues;
	rq = peer_ns->rq[rxq];

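	/* Honour the peer's header/data split config: linearize unless HDS
	 * is enabled and the frame is long enough to be split.
	 */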
	cfg = peer_dev->cfg;
	if (skb_is_nonlinear(skb) &&
	    (cfg->hds_config != ETHTOOL_TCP_DATA_SPLIT_ENABLED ||
	     cfg->hds_thresh > len))
		skb_linearize(skb);

	skb_tx_timestamp(skb);
	if (unlikely(nsim_forward_skb(dev, peer_dev,
				      skb, rq, psp_ext) == NET_RX_DROP))
		goto out_drop_cnt;

	if (!hrtimer_active(&rq->napi_timer))
		hrtimer_start(&rq->napi_timer, us_to_ktime(5), HRTIMER_MODE_REL);

	rcu_read_unlock();
	dev_dstats_tx_add(dev, len);
	return NETDEV_TX_OK;

out_drop_any:
	dr = SKB_DROP_REASON_NOT_SPECIFIED;
out_drop_free:
	kfree_skb_reason(skb, dr);
out_drop_cnt:
	rcu_read_unlock();
	dev_dstats_tx_dropped(dev);
	return NETDEV_TX_OK;
}

static void nsim_set_rx_mode(struct net_device *dev)
{
}

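/* Generic XDP without frags support cannot handle frames larger than
 * NSIM_XDP_MAX_MTU, so refuse such MTUs while a non-frags program is
 * attached.
 */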
static int nsim_change_mtu(struct net_device *dev, int new_mtu)
{
	struct netdevsim *ns = netdev_priv(dev);

	if (ns->xdp.prog && !ns->xdp.prog->aux->xdp_has_frags &&
	    new_mtu > NSIM_XDP_MAX_MTU)
		return -EBUSY;

	WRITE_ONCE(dev->mtu, new_mtu);

	return 0;
}

static int
nsim_setup_tc_block_cb(enum tc_setup_type type, void *type_data, void *cb_priv)
{
	return nsim_bpf_setup_tc_block_cb(type, type_data, cb_priv);
}

static int nsim_set_vf_mac(struct net_device *dev, int vf, u8 *mac)
{
	struct netdevsim *ns = netdev_priv(dev);
	struct nsim_dev *nsim_dev = ns->nsim_dev;

	/* Only refuse multicast addresses, zero address can mean unset/any. */
	if (vf >= nsim_dev_get_vfs(nsim_dev) || is_multicast_ether_addr(mac))
		return -EINVAL;
	memcpy(nsim_dev->vfconfigs[vf].vf_mac, mac, ETH_ALEN);

	return 0;
}

static int nsim_set_vf_vlan(struct net_device *dev, int vf,
			    u16 vlan, u8 qos, __be16 vlan_proto)
{
	struct netdevsim *ns = netdev_priv(dev);
	struct nsim_dev *nsim_dev = ns->nsim_dev;

	if (vf >= nsim_dev_get_vfs(nsim_dev) || vlan > 4095 || qos > 7)
		return -EINVAL;

	nsim_dev->vfconfigs[vf].vlan = vlan;
	nsim_dev->vfconfigs[vf].qos = qos;
	nsim_dev->vfconfigs[vf].vlan_proto = vlan_proto;

	return 0;
}

static int nsim_set_vf_rate(struct net_device *dev, int vf, int min, int max)
{
	struct netdevsim *ns = netdev_priv(dev);
	struct nsim_dev *nsim_dev = ns->nsim_dev;

	if (nsim_esw_mode_is_switchdev(ns->nsim_dev)) {
		pr_err("Not supported in switchdev mode. Please use devlink API.\n");
		return -EOPNOTSUPP;
	}

	if (vf >= nsim_dev_get_vfs(nsim_dev))
		return -EINVAL;

	nsim_dev->vfconfigs[vf].min_tx_rate = min;
	nsim_dev->vfconfigs[vf].max_tx_rate = max;

	return 0;
}

static int nsim_set_vf_spoofchk(struct net_device *dev, int vf, bool val)
{
	struct netdevsim *ns = netdev_priv(dev);
	struct nsim_dev *nsim_dev = ns->nsim_dev;

	if (vf >= nsim_dev_get_vfs(nsim_dev))
		return -EINVAL;
	nsim_dev->vfconfigs[vf].spoofchk_enabled = val;

	return 0;
}

static int nsim_set_vf_rss_query_en(struct net_device *dev, int vf, bool val)
{
	struct netdevsim *ns = netdev_priv(dev);
	struct nsim_dev *nsim_dev = ns->nsim_dev;

	if (vf >= nsim_dev_get_vfs(nsim_dev))
		return -EINVAL;
	nsim_dev->vfconfigs[vf].rss_query_enabled = val;

	return 0;
}

static int nsim_set_vf_trust(struct net_device *dev, int vf, bool val)
{
	struct netdevsim *ns = netdev_priv(dev);
	struct nsim_dev *nsim_dev = ns->nsim_dev;

	if (vf >= nsim_dev_get_vfs(nsim_dev))
		return -EINVAL;
	nsim_dev->vfconfigs[vf].trusted = val;

	return 0;
}

static int
nsim_get_vf_config(struct net_device *dev, int vf, struct ifla_vf_info *ivi)
{
	struct netdevsim *ns = netdev_priv(dev);
	struct nsim_dev *nsim_dev = ns->nsim_dev;

	if (vf >= nsim_dev_get_vfs(nsim_dev))
		return -EINVAL;

	ivi->vf = vf;
	ivi->linkstate = nsim_dev->vfconfigs[vf].link_state;
	ivi->min_tx_rate = nsim_dev->vfconfigs[vf].min_tx_rate;
	ivi->max_tx_rate = nsim_dev->vfconfigs[vf].max_tx_rate;
	ivi->vlan = nsim_dev->vfconfigs[vf].vlan;
	ivi->vlan_proto = nsim_dev->vfconfigs[vf].vlan_proto;
	ivi->qos = nsim_dev->vfconfigs[vf].qos;
	memcpy(&ivi->mac, nsim_dev->vfconfigs[vf].vf_mac, ETH_ALEN);
	ivi->spoofchk = nsim_dev->vfconfigs[vf].spoofchk_enabled;
	ivi->trusted = nsim_dev->vfconfigs[vf].trusted;
	ivi->rss_query_en = nsim_dev->vfconfigs[vf].rss_query_enabled;

	return 0;
}

static int nsim_set_vf_link_state(struct net_device *dev, int vf, int state)
{
	struct netdevsim *ns = netdev_priv(dev);
	struct nsim_dev *nsim_dev = ns->nsim_dev;

	if (vf >= nsim_dev_get_vfs(nsim_dev))
		return -EINVAL;

	switch (state) {
	case IFLA_VF_LINK_STATE_AUTO:
	case IFLA_VF_LINK_STATE_ENABLE:
	case IFLA_VF_LINK_STATE_DISABLE:
		break;
	default:
		return -EINVAL;
	}

	nsim_dev->vfconfigs[vf].link_state = state;

	return 0;
}

static void nsim_taprio_stats(struct tc_taprio_qopt_stats *stats)
{
	stats->window_drops = 0;
	stats->tx_overruns = 0;
}

static int nsim_setup_tc_taprio(struct net_device *dev,
				struct tc_taprio_qopt_offload *offload)
{
	int err = 0;

	switch (offload->cmd) {
	case TAPRIO_CMD_REPLACE:
	case TAPRIO_CMD_DESTROY:
		break;
	case TAPRIO_CMD_STATS:
		nsim_taprio_stats(&offload->stats);
		break;
	default:
		err = -EOPNOTSUPP;
	}

	return err;
}

static LIST_HEAD(nsim_block_cb_list);

static int
nsim_setup_tc(struct net_device *dev, enum tc_setup_type type, void *type_data)
{
	struct netdevsim *ns = netdev_priv(dev);

	switch (type) {
	case TC_SETUP_QDISC_TAPRIO:
		return nsim_setup_tc_taprio(dev, type_data);
	case TC_SETUP_BLOCK:
		return flow_block_cb_setup_simple(type_data,
						  &nsim_block_cb_list,
						  nsim_setup_tc_block_cb,
						  ns, ns, true);
	default:
		return -EOPNOTSUPP;
	}
}

static int
nsim_set_features(struct net_device *dev, netdev_features_t features)
{
	struct netdevsim *ns = netdev_priv(dev);

	if ((dev->features & NETIF_F_HW_TC) > (features & NETIF_F_HW_TC))
		return nsim_bpf_disable_tc(ns);

	return 0;
}

static int nsim_get_iflink(const struct net_device *dev)
{
	struct netdevsim *nsim, *peer;
	int iflink;

	nsim = netdev_priv(dev);

	rcu_read_lock();
	peer = rcu_dereference(nsim->peer);
	iflink = peer ? READ_ONCE(peer->netdev->ifindex) :
			READ_ONCE(dev->ifindex);
	rcu_read_unlock();

	return iflink;
}

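/* NAPI receive handler: drain up to @budget skbs from the queue, running
 * them through generic XDP first when a program is attached.
 */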
static int nsim_rcv(struct nsim_rq *rq, int budget)
{
	struct net_device *dev = rq->napi.dev;
	struct bpf_prog *xdp_prog;
	struct netdevsim *ns;
	struct sk_buff *skb;
	unsigned int skblen;
	int i, ret;

	ns = netdev_priv(dev);
	xdp_prog = READ_ONCE(ns->xdp.prog);

	for (i = 0; i < budget; i++) {
		if (skb_queue_empty(&rq->skb_queue))
			break;

		skb = skb_dequeue(&rq->skb_queue);

		if (xdp_prog) {
			/* skb might be freed directly by XDP, save the len */
			skblen = skb->len;

			if (skb->ip_summed == CHECKSUM_PARTIAL)
				skb_checksum_help(skb);
			ret = do_xdp_generic(xdp_prog, &skb);
			if (ret != XDP_PASS) {
				dev_dstats_rx_add(dev, skblen);
				continue;
			}
		}

		/* skb might be discarded by netif_receive_skb, save the len */
		skblen = skb->len;
		skb_mark_napi_id(skb, &rq->napi);
		ret = netif_receive_skb(skb);
		if (ret == NET_RX_SUCCESS)
			dev_dstats_rx_add(dev, skblen);
		else
			dev_dstats_rx_dropped(dev);
	}

	nsim_start_peer_tx_queue(dev, rq);
	return i;
}

static int nsim_poll(struct napi_struct *napi, int budget)
{
	struct nsim_rq *rq = container_of(napi, struct nsim_rq, napi);
	int done;

	done = nsim_rcv(rq, budget);
	if (done < budget)
		napi_complete_done(napi, done);

	return done;
}

static int nsim_create_page_pool(struct page_pool **p, struct napi_struct *napi)
{
	struct page_pool_params params = {
		.order = 0,
		.pool_size = NSIM_RING_SIZE,
		.nid = NUMA_NO_NODE,
		.dev = &napi->dev->dev,
		.napi = napi,
		.dma_dir = DMA_BIDIRECTIONAL,
		.netdev = napi->dev,
	};
	struct page_pool *pool;

	pool = page_pool_create(&params);
	if (IS_ERR(pool))
		return PTR_ERR(pool);

	*p = pool;
	return 0;
}

static int nsim_init_napi(struct netdevsim *ns)
{
	struct net_device *dev = ns->netdev;
	struct nsim_rq *rq;
	int err, i;

	for (i = 0; i < dev->num_rx_queues; i++) {
		rq = ns->rq[i];

		netif_napi_add_config_locked(dev, &rq->napi, nsim_poll, i);
	}

	for (i = 0; i < dev->num_rx_queues; i++) {
		rq = ns->rq[i];

		err = nsim_create_page_pool(&rq->page_pool, &rq->napi);
		if (err)
			goto err_pp_destroy;
	}

	return 0;

err_pp_destroy:
	while (i--) {
		page_pool_destroy(ns->rq[i]->page_pool);
		ns->rq[i]->page_pool = NULL;
	}

	for (i = 0; i < dev->num_rx_queues; i++)
		__netif_napi_del_locked(&ns->rq[i]->napi);

	return err;
}

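/* Expiry handler for the per-queue timer armed in the TX path; it defers
 * NAPI scheduling instead of scheduling straight from ndo_start_xmit.
 */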
static enum hrtimer_restart nsim_napi_schedule(struct hrtimer *timer)
{
	struct nsim_rq *rq;

	rq = container_of(timer, struct nsim_rq, napi_timer);
	napi_schedule(&rq->napi);

	return HRTIMER_NORESTART;
}

static void nsim_rq_timer_init(struct nsim_rq *rq)
{
	hrtimer_setup(&rq->napi_timer, nsim_napi_schedule, CLOCK_MONOTONIC,
		      HRTIMER_MODE_REL);
}

static void nsim_enable_napi(struct netdevsim *ns)
{
	struct net_device *dev = ns->netdev;
	int i;

	for (i = 0; i < dev->num_rx_queues; i++) {
		struct nsim_rq *rq = ns->rq[i];

		netif_queue_set_napi(dev, i, NETDEV_QUEUE_TYPE_RX, &rq->napi);
		napi_enable_locked(&rq->napi);
	}
}

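/* Carrier is reported only while both ends of the pair are running. */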
static int nsim_open(struct net_device *dev)
{
	struct netdevsim *ns = netdev_priv(dev);
	struct netdevsim *peer;
	int err;

	netdev_assert_locked(dev);

	err = nsim_init_napi(ns);
	if (err)
		return err;

	nsim_enable_napi(ns);

	peer = rtnl_dereference(ns->peer);
	if (peer && netif_running(peer->netdev)) {
		netif_carrier_on(dev);
		netif_carrier_on(peer->netdev);
	}

	return 0;
}

static void nsim_del_napi(struct netdevsim *ns)
{
	struct net_device *dev = ns->netdev;
	int i;

	for (i = 0; i < dev->num_rx_queues; i++) {
		struct nsim_rq *rq = ns->rq[i];

		napi_disable_locked(&rq->napi);
		__netif_napi_del_locked(&rq->napi);
	}
	synchronize_net();

	for (i = 0; i < dev->num_rx_queues; i++) {
		page_pool_destroy(ns->rq[i]->page_pool);
		ns->rq[i]->page_pool = NULL;
	}
}

static int nsim_stop(struct net_device *dev)
{
	struct netdevsim *ns = netdev_priv(dev);
	struct netdevsim *peer;

	netdev_assert_locked(dev);

	netif_carrier_off(dev);
	peer = rtnl_dereference(ns->peer);
	if (peer)
		netif_carrier_off(peer->netdev);

	nsim_del_napi(ns);

	return 0;
}

static int nsim_shaper_set(struct net_shaper_binding *binding,
			   const struct net_shaper *shaper,
			   struct netlink_ext_ack *extack)
{
	return 0;
}

static int nsim_shaper_del(struct net_shaper_binding *binding,
			   const struct net_shaper_handle *handle,
			   struct netlink_ext_ack *extack)
{
	return 0;
}

static int nsim_shaper_group(struct net_shaper_binding *binding,
			     int leaves_count,
			     const struct net_shaper *leaves,
			     const struct net_shaper *root,
			     struct netlink_ext_ack *extack)
{
	return 0;
}

static void nsim_shaper_cap(struct net_shaper_binding *binding,
			    enum net_shaper_scope scope,
			    unsigned long *flags)
{
	*flags = ULONG_MAX;
}

static const struct net_shaper_ops nsim_shaper_ops = {
	.set			= nsim_shaper_set,
	.delete			= nsim_shaper_del,
	.group			= nsim_shaper_group,
	.capabilities		= nsim_shaper_cap,
};

static const struct net_device_ops nsim_netdev_ops = {
	.ndo_start_xmit		= nsim_start_xmit,
	.ndo_set_rx_mode	= nsim_set_rx_mode,
	.ndo_set_mac_address	= eth_mac_addr,
	.ndo_validate_addr	= eth_validate_addr,
	.ndo_change_mtu		= nsim_change_mtu,
	.ndo_set_vf_mac		= nsim_set_vf_mac,
	.ndo_set_vf_vlan	= nsim_set_vf_vlan,
	.ndo_set_vf_rate	= nsim_set_vf_rate,
	.ndo_set_vf_spoofchk	= nsim_set_vf_spoofchk,
	.ndo_set_vf_trust	= nsim_set_vf_trust,
	.ndo_get_vf_config	= nsim_get_vf_config,
	.ndo_set_vf_link_state	= nsim_set_vf_link_state,
	.ndo_set_vf_rss_query_en = nsim_set_vf_rss_query_en,
	.ndo_setup_tc		= nsim_setup_tc,
	.ndo_set_features	= nsim_set_features,
	.ndo_get_iflink		= nsim_get_iflink,
	.ndo_bpf		= nsim_bpf,
	.ndo_open		= nsim_open,
	.ndo_stop		= nsim_stop,
	.net_shaper_ops		= &nsim_shaper_ops,
};

static const struct net_device_ops nsim_vf_netdev_ops = {
	.ndo_start_xmit		= nsim_start_xmit,
	.ndo_set_rx_mode	= nsim_set_rx_mode,
	.ndo_set_mac_address	= eth_mac_addr,
	.ndo_validate_addr	= eth_validate_addr,
	.ndo_change_mtu		= nsim_change_mtu,
	.ndo_setup_tc		= nsim_setup_tc,
	.ndo_set_features	= nsim_set_features,
};

/* We don't have true per-queue stats yet, so do some random fakery here.
 * Only report stuff for queue 0.
 */
static void nsim_get_queue_stats_rx(struct net_device *dev, int idx,
				    struct netdev_queue_stats_rx *stats)
{
	struct rtnl_link_stats64 rtstats = {};

	if (!idx)
		dev_get_stats(dev, &rtstats);

	stats->packets = rtstats.rx_packets - !!rtstats.rx_packets;
	stats->bytes = rtstats.rx_bytes;
}

static void nsim_get_queue_stats_tx(struct net_device *dev, int idx,
				    struct netdev_queue_stats_tx *stats)
{
	struct rtnl_link_stats64 rtstats = {};

	if (!idx)
		dev_get_stats(dev, &rtstats);

	stats->packets = rtstats.tx_packets - !!rtstats.tx_packets;
	stats->bytes = rtstats.tx_bytes;
}

static void nsim_get_base_stats(struct net_device *dev,
				struct netdev_queue_stats_rx *rx,
				struct netdev_queue_stats_tx *tx)
{
	struct rtnl_link_stats64 rtstats = {};

	dev_get_stats(dev, &rtstats);

	rx->packets = !!rtstats.rx_packets;
	rx->bytes = 0;
	tx->packets = !!rtstats.tx_packets;
	tx->bytes = 0;
}

static const struct netdev_stat_ops nsim_stat_ops = {
	.get_queue_stats_tx	= nsim_get_queue_stats_tx,
	.get_queue_stats_rx	= nsim_get_queue_stats_rx,
	.get_base_stats		= nsim_get_base_stats,
};

static struct nsim_rq *nsim_queue_alloc(void)
{
	struct nsim_rq *rq;

	rq = kzalloc(sizeof(*rq), GFP_KERNEL_ACCOUNT);
	if (!rq)
		return NULL;

	skb_queue_head_init(&rq->skb_queue);
	nsim_rq_timer_init(rq);
	return rq;
}

static void nsim_queue_free(struct net_device *dev, struct nsim_rq *rq)
{
	hrtimer_cancel(&rq->napi_timer);

	if (rq->skb_queue.qlen) {
		local_bh_disable();
		dev_dstats_rx_dropped_add(dev, rq->skb_queue.qlen);
		local_bh_enable();
	}

	skb_queue_purge_reason(&rq->skb_queue, SKB_DROP_REASON_QUEUE_PURGE);
	kfree(rq);
}

/* Queue reset mode is controlled by ns->rq_reset_mode.
 * - normal - new NAPI new pool (old NAPI enabled when new added)
 * - mode 1 - allocate new pool (NAPI is only disabled / enabled)
 * - mode 2 - new NAPI new pool (old NAPI removed before new added)
 * - mode 3 - new NAPI new pool (old NAPI disabled when new added)
 */
struct nsim_queue_mem {
	struct nsim_rq *rq;
	struct page_pool *pp;
};

static int
nsim_queue_mem_alloc(struct net_device *dev, void *per_queue_mem, int idx)
{
	struct nsim_queue_mem *qmem = per_queue_mem;
	struct netdevsim *ns = netdev_priv(dev);
	int err;

	if (ns->rq_reset_mode > 3)
		return -EINVAL;

	if (ns->rq_reset_mode == 1) {
		if (!netif_running(ns->netdev))
			return -ENETDOWN;
		return nsim_create_page_pool(&qmem->pp, &ns->rq[idx]->napi);
	}

	qmem->rq = nsim_queue_alloc();
	if (!qmem->rq)
		return -ENOMEM;

	err = nsim_create_page_pool(&qmem->rq->page_pool, &qmem->rq->napi);
	if (err)
		goto err_free;

	if (!ns->rq_reset_mode)
		netif_napi_add_config_locked(dev, &qmem->rq->napi, nsim_poll,
					     idx);

	return 0;

err_free:
	nsim_queue_free(dev, qmem->rq);
	return err;
}

static void nsim_queue_mem_free(struct net_device *dev, void *per_queue_mem)
{
	struct nsim_queue_mem *qmem = per_queue_mem;
	struct netdevsim *ns = netdev_priv(dev);

	page_pool_destroy(qmem->pp);
	if (qmem->rq) {
		if (!ns->rq_reset_mode)
			netif_napi_del_locked(&qmem->rq->napi);
		page_pool_destroy(qmem->rq->page_pool);
		nsim_queue_free(dev, qmem->rq);
	}
}

static int
nsim_queue_start(struct net_device *dev, void *per_queue_mem, int idx)
{
	struct nsim_queue_mem *qmem = per_queue_mem;
	struct netdevsim *ns = netdev_priv(dev);

	netdev_assert_locked(dev);

	if (ns->rq_reset_mode == 1) {
		ns->rq[idx]->page_pool = qmem->pp;
		napi_enable_locked(&ns->rq[idx]->napi);
		return 0;
	}

	/* netif_napi_add()/_del() should normally be called from alloc/free,
	 * here we want to test various call orders.
	 */
	if (ns->rq_reset_mode == 2) {
		netif_napi_del_locked(&ns->rq[idx]->napi);
		netif_napi_add_config_locked(dev, &qmem->rq->napi, nsim_poll,
					     idx);
	} else if (ns->rq_reset_mode == 3) {
		netif_napi_add_config_locked(dev, &qmem->rq->napi, nsim_poll,
					     idx);
		netif_napi_del_locked(&ns->rq[idx]->napi);
	}

	ns->rq[idx] = qmem->rq;
	napi_enable_locked(&ns->rq[idx]->napi);

	return 0;
}

static int nsim_queue_stop(struct net_device *dev, void *per_queue_mem, int idx)
{
	struct nsim_queue_mem *qmem = per_queue_mem;
	struct netdevsim *ns = netdev_priv(dev);

	netdev_assert_locked(dev);

	napi_disable_locked(&ns->rq[idx]->napi);

	if (ns->rq_reset_mode == 1) {
		qmem->pp = ns->rq[idx]->page_pool;
		page_pool_disable_direct_recycling(qmem->pp);
	} else {
		qmem->rq = ns->rq[idx];
	}

	return 0;
}

static const struct netdev_queue_mgmt_ops nsim_queue_mgmt_ops = {
	.ndo_queue_mem_size	= sizeof(struct nsim_queue_mem),
	.ndo_queue_mem_alloc	= nsim_queue_mem_alloc,
	.ndo_queue_mem_free	= nsim_queue_mem_free,
	.ndo_queue_start	= nsim_queue_start,
	.ndo_queue_stop		= nsim_queue_stop,
};

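/* debugfs knob: writing "<queue> <mode>" restarts the given RX queue using
 * the requested reset mode (see the mode description above nsim_queue_mem).
 */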
static ssize_t
nsim_qreset_write(struct file *file, const char __user *data,
		  size_t count, loff_t *ppos)
{
	struct netdevsim *ns = file->private_data;
	unsigned int queue, mode;
	char buf[32];
	ssize_t ret;

	if (count >= sizeof(buf))
		return -EINVAL;
	if (copy_from_user(buf, data, count))
		return -EFAULT;
	buf[count] = '\0';

	ret = sscanf(buf, "%u %u", &queue, &mode);
	if (ret != 2)
		return -EINVAL;

	netdev_lock(ns->netdev);
	if (queue >= ns->netdev->real_num_rx_queues) {
		ret = -EINVAL;
		goto exit_unlock;
	}

	ns->rq_reset_mode = mode;
	ret = netdev_rx_queue_restart(ns->netdev, queue);
	ns->rq_reset_mode = 0;
	if (ret)
		goto exit_unlock;

	ret = count;
exit_unlock:
	netdev_unlock(ns->netdev);
	return ret;
}

static const struct file_operations nsim_qreset_fops = {
	.open = simple_open,
	.write = nsim_qreset_write,
	.owner = THIS_MODULE,
};

static ssize_t
nsim_pp_hold_read(struct file *file, char __user *data,
		  size_t count, loff_t *ppos)
{
	struct netdevsim *ns = file->private_data;
	char buf[3] = "n\n";

	if (ns->page)
		buf[0] = 'y';

	return simple_read_from_buffer(data, count, ppos, buf, 2);
}

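/* debugfs knob: holding one page out of queue 0's page_pool lets tests
 * exercise the pool's outstanding-page accounting and orphaning path.
 */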
static ssize_t
nsim_pp_hold_write(struct file *file, const char __user *data,
		   size_t count, loff_t *ppos)
{
	struct netdevsim *ns = file->private_data;
	ssize_t ret;
	bool val;

	ret = kstrtobool_from_user(data, count, &val);
	if (ret)
		return ret;

	rtnl_lock();
	ret = count;
	if (val == !!ns->page)
		goto exit;

	if (!netif_running(ns->netdev) && val) {
		ret = -ENETDOWN;
	} else if (val) {
		ns->page = page_pool_dev_alloc_pages(ns->rq[0]->page_pool);
		if (!ns->page)
			ret = -ENOMEM;
	} else {
		page_pool_put_full_page(pp_page_to_nmdesc(ns->page)->pp,
					ns->page, false);
		ns->page = NULL;
	}

exit:
	rtnl_unlock();
	return ret;
}

static const struct file_operations nsim_pp_hold_fops = {
	.open = simple_open,
	.read = nsim_pp_hold_read,
	.write = nsim_pp_hold_write,
	.llseek = generic_file_llseek,
	.owner = THIS_MODULE,
};

static void nsim_setup(struct net_device *dev)
{
	ether_setup(dev);
	eth_hw_addr_random(dev);

	dev->flags &= ~IFF_MULTICAST;
	dev->priv_flags |= IFF_LIVE_ADDR_CHANGE;
	dev->features |= NETIF_F_HIGHDMA |
			 NETIF_F_SG |
			 NETIF_F_FRAGLIST |
			 NETIF_F_HW_CSUM |
			 NETIF_F_LRO |
			 NETIF_F_TSO;
	dev->hw_features |= NETIF_F_HW_TC |
			    NETIF_F_SG |
			    NETIF_F_FRAGLIST |
			    NETIF_F_HW_CSUM |
			    NETIF_F_LRO |
			    NETIF_F_TSO;
	dev->pcpu_stat_type = NETDEV_PCPU_STAT_DSTATS;
	dev->max_mtu = ETH_MAX_MTU;
	dev->xdp_features = NETDEV_XDP_ACT_BASIC | NETDEV_XDP_ACT_HW_OFFLOAD;
}

static int nsim_queue_init(struct netdevsim *ns)
{
	struct net_device *dev = ns->netdev;
	int i;

	ns->rq = kcalloc(dev->num_rx_queues, sizeof(*ns->rq),
			 GFP_KERNEL_ACCOUNT);
	if (!ns->rq)
		return -ENOMEM;

	for (i = 0; i < dev->num_rx_queues; i++) {
		ns->rq[i] = nsim_queue_alloc();
		if (!ns->rq[i])
			goto err_free_prev;
	}

	return 0;

err_free_prev:
	while (i--)
		kfree(ns->rq[i]);
	kfree(ns->rq);
	return -ENOMEM;
}

static void nsim_queue_uninit(struct netdevsim *ns)
{
	struct net_device *dev = ns->netdev;
	int i;

	for (i = 0; i < dev->num_rx_queues; i++)
		nsim_queue_free(dev, ns->rq[i]);

	kfree(ns->rq);
	ns->rq = NULL;
}

static int nsim_init_netdevsim(struct netdevsim *ns)
{
	struct netdevsim *peer;
	struct mock_phc *phc;
	int err;

	phc = mock_phc_create(&ns->nsim_bus_dev->dev);
	if (IS_ERR(phc))
		return PTR_ERR(phc);

	ns->phc = phc;
	ns->netdev->netdev_ops = &nsim_netdev_ops;
	ns->netdev->stat_ops = &nsim_stat_ops;
	ns->netdev->queue_mgmt_ops = &nsim_queue_mgmt_ops;
	netdev_lockdep_set_classes(ns->netdev);

	err = nsim_udp_tunnels_info_create(ns->nsim_dev, ns->netdev);
	if (err)
		goto err_phc_destroy;

	rtnl_lock();
	err = nsim_queue_init(ns);
	if (err)
		goto err_utn_destroy;

	err = nsim_bpf_init(ns);
	if (err)
		goto err_rq_destroy;

	nsim_macsec_init(ns);
	nsim_ipsec_init(ns);

	err = register_netdevice(ns->netdev);
	if (err)
		goto err_ipsec_teardown;
	rtnl_unlock();

	err = nsim_psp_init(ns);
	if (err)
		goto err_unregister_netdev;

	if (IS_ENABLED(CONFIG_DEBUG_NET)) {
		ns->nb.notifier_call = netdev_debug_event;
		if (register_netdevice_notifier_dev_net(ns->netdev, &ns->nb,
							&ns->nn))
			ns->nb.notifier_call = NULL;
	}

	return 0;

err_unregister_netdev:
	rtnl_lock();
	peer = rtnl_dereference(ns->peer);
	if (peer)
		RCU_INIT_POINTER(peer->peer, NULL);
	RCU_INIT_POINTER(ns->peer, NULL);
	unregister_netdevice(ns->netdev);
err_ipsec_teardown:
	nsim_ipsec_teardown(ns);
	nsim_macsec_teardown(ns);
	nsim_bpf_uninit(ns);
err_rq_destroy:
	nsim_queue_uninit(ns);
err_utn_destroy:
	rtnl_unlock();
	nsim_udp_tunnels_info_destroy(ns->netdev);
err_phc_destroy:
	mock_phc_destroy(ns->phc);
	return err;
}

static int nsim_init_netdevsim_vf(struct netdevsim *ns)
{
	int err;

	ns->netdev->netdev_ops = &nsim_vf_netdev_ops;
	rtnl_lock();
	err = register_netdevice(ns->netdev);
	rtnl_unlock();
	return err;
}

static void nsim_exit_netdevsim(struct netdevsim *ns)
{
	nsim_udp_tunnels_info_destroy(ns->netdev);
	mock_phc_destroy(ns->phc);
}

struct netdevsim *nsim_create(struct nsim_dev *nsim_dev,
			      struct nsim_dev_port *nsim_dev_port,
			      u8 perm_addr[ETH_ALEN])
{
	struct net_device *dev;
	struct netdevsim *ns;
	int err;

	dev = alloc_netdev_mq(sizeof(*ns), "eth%d", NET_NAME_UNKNOWN, nsim_setup,
			      nsim_dev->nsim_bus_dev->num_queues);
	if (!dev)
		return ERR_PTR(-ENOMEM);

	if (perm_addr)
		memcpy(dev->perm_addr, perm_addr, ETH_ALEN);

	dev_net_set(dev, nsim_dev_net(nsim_dev));
	ns = netdev_priv(dev);
	ns->netdev = dev;
	ns->nsim_dev = nsim_dev;
	ns->nsim_dev_port = nsim_dev_port;
	ns->nsim_bus_dev = nsim_dev->nsim_bus_dev;
	SET_NETDEV_DEV(dev, &ns->nsim_bus_dev->dev);
	SET_NETDEV_DEVLINK_PORT(dev, &nsim_dev_port->devlink_port);
	nsim_ethtool_init(ns);
	if (nsim_dev_port_is_pf(nsim_dev_port))
		err = nsim_init_netdevsim(ns);
	else
		err = nsim_init_netdevsim_vf(ns);
	if (err)
		goto err_free_netdev;

	ns->pp_dfs = debugfs_create_file("pp_hold", 0600, nsim_dev_port->ddir,
					 ns, &nsim_pp_hold_fops);
	ns->qr_dfs = debugfs_create_file("queue_reset", 0200,
					 nsim_dev_port->ddir, ns,
					 &nsim_qreset_fops);
	return ns;

err_free_netdev:
	free_netdev(dev);
	return ERR_PTR(err);
}

void nsim_destroy(struct netdevsim *ns)
{
	struct net_device *dev = ns->netdev;
	struct netdevsim *peer;

	debugfs_remove(ns->qr_dfs);
	debugfs_remove(ns->pp_dfs);

	if (ns->nb.notifier_call)
		unregister_netdevice_notifier_dev_net(ns->netdev, &ns->nb,
						      &ns->nn);

	nsim_psp_uninit(ns);

	rtnl_lock();
	peer = rtnl_dereference(ns->peer);
	if (peer)
		RCU_INIT_POINTER(peer->peer, NULL);
	RCU_INIT_POINTER(ns->peer, NULL);
	unregister_netdevice(dev);
	if (nsim_dev_port_is_pf(ns->nsim_dev_port)) {
		nsim_macsec_teardown(ns);
		nsim_ipsec_teardown(ns);
		nsim_bpf_uninit(ns);
		nsim_queue_uninit(ns);
	}
	rtnl_unlock();
	if (nsim_dev_port_is_pf(ns->nsim_dev_port))
		nsim_exit_netdevsim(ns);

	/* Put this intentionally late to exercise the orphaning path */
	if (ns->page) {
		page_pool_put_full_page(pp_page_to_nmdesc(ns->page)->pp,
					ns->page, false);
		ns->page = NULL;
	}

	free_netdev(dev);
}

bool netdev_is_nsim(struct net_device *dev)
{
	return dev->netdev_ops == &nsim_netdev_ops;
}

static int nsim_validate(struct nlattr *tb[], struct nlattr *data[],
			 struct netlink_ext_ack *extack)
{
	NL_SET_ERR_MSG_MOD(extack,
			   "Please use: echo \"[ID] [PORT_COUNT] [NUM_QUEUES]\" > /sys/bus/netdevsim/new_device");
	return -EOPNOTSUPP;
}

static struct rtnl_link_ops nsim_link_ops __read_mostly = {
	.kind		= DRV_NAME,
	.validate	= nsim_validate,
};

static int __init nsim_module_init(void)
{
	int err;

	err = nsim_dev_init();
	if (err)
		return err;

	err = nsim_bus_init();
	if (err)
		goto err_dev_exit;

	err = rtnl_link_register(&nsim_link_ops);
	if (err)
		goto err_bus_exit;

	return 0;

err_bus_exit:
	nsim_bus_exit();
err_dev_exit:
	nsim_dev_exit();
	return err;
}

static void __exit nsim_module_exit(void)
{
	rtnl_link_unregister(&nsim_link_ops);
	nsim_bus_exit();
	nsim_dev_exit();
}

module_init(nsim_module_init);
module_exit(nsim_module_exit);
MODULE_LICENSE("GPL");
MODULE_DESCRIPTION("Simulated networking device for testing");
MODULE_ALIAS_RTNL_LINK(DRV_NAME);