1 /*
2 * Copyright (C) 2017 Netronome Systems, Inc.
3 *
4 * This software is licensed under the GNU General License Version 2,
5 * June 1991 as shown in the file COPYING in the top-level directory of this
6 * source tree.
7 *
8 * THE COPYRIGHT HOLDERS AND/OR OTHER PARTIES PROVIDE THE PROGRAM "AS IS"
9 * WITHOUT WARRANTY OF ANY KIND, EITHER EXPRESSED OR IMPLIED, INCLUDING,
10 * BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
11 * FOR A PARTICULAR PURPOSE. THE ENTIRE RISK AS TO THE QUALITY AND PERFORMANCE
12 * OF THE PROGRAM IS WITH YOU. SHOULD THE PROGRAM PROVE DEFECTIVE, YOU ASSUME
13 * THE COST OF ALL NECESSARY SERVICING, REPAIR OR CORRECTION.
14 */
15
16 #include <linux/debugfs.h>
17 #include <linux/etherdevice.h>
18 #include <linux/ethtool_netlink.h>
19 #include <linux/kernel.h>
20 #include <linux/module.h>
21 #include <linux/netdevice.h>
22 #include <linux/slab.h>
23 #include <net/netdev_queues.h>
24 #include <net/netdev_rx_queue.h>
25 #include <net/page_pool/helpers.h>
26 #include <net/netlink.h>
27 #include <net/net_shaper.h>
28 #include <net/pkt_cls.h>
29 #include <net/rtnetlink.h>
30 #include <net/udp_tunnel.h>
31
32 #include "netdevsim.h"
33
34 MODULE_IMPORT_NS("NETDEV_INTERNAL");
35
/* Used as the per-queue skb backlog limit in nsim_napi_rx() and as the
 * page pool size in nsim_create_page_pool().
 */
#define NSIM_RING_SIZE 256
37
nsim_napi_rx(struct nsim_rq * rq,struct sk_buff * skb)38 static int nsim_napi_rx(struct nsim_rq *rq, struct sk_buff *skb)
39 {
40 if (skb_queue_len(&rq->skb_queue) > NSIM_RING_SIZE) {
41 dev_kfree_skb_any(skb);
42 return NET_RX_DROP;
43 }
44
45 skb_queue_tail(&rq->skb_queue, skb);
46 return NET_RX_SUCCESS;
47 }
48
/* Pass @skb through __dev_forward_skb() for @dev and, if that returns zero,
 * queue it on @rq.
 *
 * Return: the non-zero result of __dev_forward_skb(), otherwise the result
 * of nsim_napi_rx().
 */
static int nsim_forward_skb(struct net_device *dev, struct sk_buff *skb,
			    struct nsim_rq *rq)
{
	int ret;

	ret = __dev_forward_skb(dev, skb);
	if (ret)
		return ret;

	return nsim_napi_rx(rq, skb);
}
54
nsim_start_xmit(struct sk_buff * skb,struct net_device * dev)55 static netdev_tx_t nsim_start_xmit(struct sk_buff *skb, struct net_device *dev)
56 {
57 struct netdevsim *ns = netdev_priv(dev);
58 struct net_device *peer_dev;
59 unsigned int len = skb->len;
60 struct netdevsim *peer_ns;
61 struct netdev_config *cfg;
62 struct nsim_rq *rq;
63 int rxq;
64
65 rcu_read_lock();
66 if (!nsim_ipsec_tx(ns, skb))
67 goto out_drop_free;
68
69 peer_ns = rcu_dereference(ns->peer);
70 if (!peer_ns)
71 goto out_drop_free;
72
73 peer_dev = peer_ns->netdev;
74 rxq = skb_get_queue_mapping(skb);
75 if (rxq >= peer_dev->num_rx_queues)
76 rxq = rxq % peer_dev->num_rx_queues;
77 rq = peer_ns->rq[rxq];
78
79 cfg = peer_dev->cfg;
80 if (skb_is_nonlinear(skb) &&
81 (cfg->hds_config != ETHTOOL_TCP_DATA_SPLIT_ENABLED ||
82 (cfg->hds_config == ETHTOOL_TCP_DATA_SPLIT_ENABLED &&
83 cfg->hds_thresh > len)))
84 skb_linearize(skb);
85
86 skb_tx_timestamp(skb);
87 if (unlikely(nsim_forward_skb(peer_dev, skb, rq) == NET_RX_DROP))
88 goto out_drop_cnt;
89
90 napi_schedule(&rq->napi);
91
92 rcu_read_unlock();
93 u64_stats_update_begin(&ns->syncp);
94 ns->tx_packets++;
95 ns->tx_bytes += len;
96 u64_stats_update_end(&ns->syncp);
97 return NETDEV_TX_OK;
98
99 out_drop_free:
100 dev_kfree_skb(skb);
101 out_drop_cnt:
102 rcu_read_unlock();
103 u64_stats_update_begin(&ns->syncp);
104 ns->tx_dropped++;
105 u64_stats_update_end(&ns->syncp);
106 return NETDEV_TX_OK;
107 }
108
/* ndo_set_rx_mode callback with an empty body: no work is performed. */
static void nsim_set_rx_mode(struct net_device *dev)
{
}
112
nsim_change_mtu(struct net_device * dev,int new_mtu)113 static int nsim_change_mtu(struct net_device *dev, int new_mtu)
114 {
115 struct netdevsim *ns = netdev_priv(dev);
116
117 if (ns->xdp.prog && new_mtu > NSIM_XDP_MAX_MTU)
118 return -EBUSY;
119
120 WRITE_ONCE(dev->mtu, new_mtu);
121
122 return 0;
123 }
124
125 static void
nsim_get_stats64(struct net_device * dev,struct rtnl_link_stats64 * stats)126 nsim_get_stats64(struct net_device *dev, struct rtnl_link_stats64 *stats)
127 {
128 struct netdevsim *ns = netdev_priv(dev);
129 unsigned int start;
130
131 do {
132 start = u64_stats_fetch_begin(&ns->syncp);
133 stats->tx_bytes = ns->tx_bytes;
134 stats->tx_packets = ns->tx_packets;
135 stats->tx_dropped = ns->tx_dropped;
136 } while (u64_stats_fetch_retry(&ns->syncp, start));
137 }
138
/* TC block callback registered by nsim_setup_tc(); forwards all arguments
 * unchanged to nsim_bpf_setup_tc_block_cb() and returns its result.
 */
static int
nsim_setup_tc_block_cb(enum tc_setup_type type, void *type_data, void *cb_priv)
{
	return nsim_bpf_setup_tc_block_cb(type, type_data, cb_priv);
}
144
/* ndo_set_vf_mac: record @mac as the MAC address of VF @vf.
 *
 * Return: 0 on success, -EINVAL if @vf is out of range or @mac is a
 * multicast address.
 */
static int nsim_set_vf_mac(struct net_device *dev, int vf, u8 *mac)
{
	struct netdevsim *ns = netdev_priv(dev);
	struct nsim_dev *nsim_dev = ns->nsim_dev;

	if (vf >= nsim_dev_get_vfs(nsim_dev))
		return -EINVAL;

	/* Only refuse multicast addresses, zero address can mean unset/any. */
	if (is_multicast_ether_addr(mac))
		return -EINVAL;

	memcpy(nsim_dev->vfconfigs[vf].vf_mac, mac, ETH_ALEN);
	return 0;
}
157
/* ndo_set_vf_vlan: record VLAN id, QoS and VLAN protocol for VF @vf.
 *
 * Return: 0 on success, -EINVAL if @vf is out of range, @vlan > 4095 or
 * @qos > 7.
 */
static int nsim_set_vf_vlan(struct net_device *dev, int vf,
			    u16 vlan, u8 qos, __be16 vlan_proto)
{
	struct netdevsim *ns = netdev_priv(dev);
	struct nsim_dev *nsim_dev = ns->nsim_dev;

	if (vf >= nsim_dev_get_vfs(nsim_dev))
		return -EINVAL;
	if (vlan > 4095)
		return -EINVAL;
	if (qos > 7)
		return -EINVAL;

	nsim_dev->vfconfigs[vf].vlan_proto = vlan_proto;
	nsim_dev->vfconfigs[vf].qos = qos;
	nsim_dev->vfconfigs[vf].vlan = vlan;

	return 0;
}
173
nsim_set_vf_rate(struct net_device * dev,int vf,int min,int max)174 static int nsim_set_vf_rate(struct net_device *dev, int vf, int min, int max)
175 {
176 struct netdevsim *ns = netdev_priv(dev);
177 struct nsim_dev *nsim_dev = ns->nsim_dev;
178
179 if (nsim_esw_mode_is_switchdev(ns->nsim_dev)) {
180 pr_err("Not supported in switchdev mode. Please use devlink API.\n");
181 return -EOPNOTSUPP;
182 }
183
184 if (vf >= nsim_dev_get_vfs(nsim_dev))
185 return -EINVAL;
186
187 nsim_dev->vfconfigs[vf].min_tx_rate = min;
188 nsim_dev->vfconfigs[vf].max_tx_rate = max;
189
190 return 0;
191 }
192
/* ndo_set_vf_spoofchk: record the spoof-check setting for VF @vf.
 *
 * Return: 0 on success, -EINVAL if @vf is out of range.
 */
static int nsim_set_vf_spoofchk(struct net_device *dev, int vf, bool val)
{
	struct netdevsim *ns = netdev_priv(dev);
	struct nsim_dev *nsim_dev = ns->nsim_dev;

	if (vf < nsim_dev_get_vfs(nsim_dev)) {
		nsim_dev->vfconfigs[vf].spoofchk_enabled = val;
		return 0;
	}

	return -EINVAL;
}
204
/* ndo_set_vf_rss_query_en: record the RSS query setting for VF @vf.
 *
 * Return: 0 on success, -EINVAL if @vf is out of range.
 */
static int nsim_set_vf_rss_query_en(struct net_device *dev, int vf, bool val)
{
	struct netdevsim *ns = netdev_priv(dev);
	struct nsim_dev *nsim_dev = ns->nsim_dev;

	if (vf < nsim_dev_get_vfs(nsim_dev)) {
		nsim_dev->vfconfigs[vf].rss_query_enabled = val;
		return 0;
	}

	return -EINVAL;
}
216
/* ndo_set_vf_trust: record the trusted flag for VF @vf.
 *
 * Return: 0 on success, -EINVAL if @vf is out of range.
 */
static int nsim_set_vf_trust(struct net_device *dev, int vf, bool val)
{
	struct netdevsim *ns = netdev_priv(dev);
	struct nsim_dev *nsim_dev = ns->nsim_dev;

	if (vf < nsim_dev_get_vfs(nsim_dev)) {
		nsim_dev->vfconfigs[vf].trusted = val;
		return 0;
	}

	return -EINVAL;
}
228
229 static int
nsim_get_vf_config(struct net_device * dev,int vf,struct ifla_vf_info * ivi)230 nsim_get_vf_config(struct net_device *dev, int vf, struct ifla_vf_info *ivi)
231 {
232 struct netdevsim *ns = netdev_priv(dev);
233 struct nsim_dev *nsim_dev = ns->nsim_dev;
234
235 if (vf >= nsim_dev_get_vfs(nsim_dev))
236 return -EINVAL;
237
238 ivi->vf = vf;
239 ivi->linkstate = nsim_dev->vfconfigs[vf].link_state;
240 ivi->min_tx_rate = nsim_dev->vfconfigs[vf].min_tx_rate;
241 ivi->max_tx_rate = nsim_dev->vfconfigs[vf].max_tx_rate;
242 ivi->vlan = nsim_dev->vfconfigs[vf].vlan;
243 ivi->vlan_proto = nsim_dev->vfconfigs[vf].vlan_proto;
244 ivi->qos = nsim_dev->vfconfigs[vf].qos;
245 memcpy(&ivi->mac, nsim_dev->vfconfigs[vf].vf_mac, ETH_ALEN);
246 ivi->spoofchk = nsim_dev->vfconfigs[vf].spoofchk_enabled;
247 ivi->trusted = nsim_dev->vfconfigs[vf].trusted;
248 ivi->rss_query_en = nsim_dev->vfconfigs[vf].rss_query_enabled;
249
250 return 0;
251 }
252
nsim_set_vf_link_state(struct net_device * dev,int vf,int state)253 static int nsim_set_vf_link_state(struct net_device *dev, int vf, int state)
254 {
255 struct netdevsim *ns = netdev_priv(dev);
256 struct nsim_dev *nsim_dev = ns->nsim_dev;
257
258 if (vf >= nsim_dev_get_vfs(nsim_dev))
259 return -EINVAL;
260
261 switch (state) {
262 case IFLA_VF_LINK_STATE_AUTO:
263 case IFLA_VF_LINK_STATE_ENABLE:
264 case IFLA_VF_LINK_STATE_DISABLE:
265 break;
266 default:
267 return -EINVAL;
268 }
269
270 nsim_dev->vfconfigs[vf].link_state = state;
271
272 return 0;
273 }
274
nsim_taprio_stats(struct tc_taprio_qopt_stats * stats)275 static void nsim_taprio_stats(struct tc_taprio_qopt_stats *stats)
276 {
277 stats->window_drops = 0;
278 stats->tx_overruns = 0;
279 }
280
nsim_setup_tc_taprio(struct net_device * dev,struct tc_taprio_qopt_offload * offload)281 static int nsim_setup_tc_taprio(struct net_device *dev,
282 struct tc_taprio_qopt_offload *offload)
283 {
284 int err = 0;
285
286 switch (offload->cmd) {
287 case TAPRIO_CMD_REPLACE:
288 case TAPRIO_CMD_DESTROY:
289 break;
290 case TAPRIO_CMD_STATS:
291 nsim_taprio_stats(&offload->stats);
292 break;
293 default:
294 err = -EOPNOTSUPP;
295 }
296
297 return err;
298 }
299
/* Driver block list handed to flow_block_cb_setup_simple() in
 * nsim_setup_tc().
 */
static LIST_HEAD(nsim_block_cb_list);
301
302 static int
nsim_setup_tc(struct net_device * dev,enum tc_setup_type type,void * type_data)303 nsim_setup_tc(struct net_device *dev, enum tc_setup_type type, void *type_data)
304 {
305 struct netdevsim *ns = netdev_priv(dev);
306
307 switch (type) {
308 case TC_SETUP_QDISC_TAPRIO:
309 return nsim_setup_tc_taprio(dev, type_data);
310 case TC_SETUP_BLOCK:
311 return flow_block_cb_setup_simple(type_data,
312 &nsim_block_cb_list,
313 nsim_setup_tc_block_cb,
314 ns, ns, true);
315 default:
316 return -EOPNOTSUPP;
317 }
318 }
319
320 static int
nsim_set_features(struct net_device * dev,netdev_features_t features)321 nsim_set_features(struct net_device *dev, netdev_features_t features)
322 {
323 struct netdevsim *ns = netdev_priv(dev);
324
325 if ((dev->features & NETIF_F_HW_TC) > (features & NETIF_F_HW_TC))
326 return nsim_bpf_disable_tc(ns);
327
328 return 0;
329 }
330
nsim_get_iflink(const struct net_device * dev)331 static int nsim_get_iflink(const struct net_device *dev)
332 {
333 struct netdevsim *nsim, *peer;
334 int iflink;
335
336 nsim = netdev_priv(dev);
337
338 rcu_read_lock();
339 peer = rcu_dereference(nsim->peer);
340 iflink = peer ? READ_ONCE(peer->netdev->ifindex) :
341 READ_ONCE(dev->ifindex);
342 rcu_read_unlock();
343
344 return iflink;
345 }
346
nsim_rcv(struct nsim_rq * rq,int budget)347 static int nsim_rcv(struct nsim_rq *rq, int budget)
348 {
349 struct sk_buff *skb;
350 int i;
351
352 for (i = 0; i < budget; i++) {
353 if (skb_queue_empty(&rq->skb_queue))
354 break;
355
356 skb = skb_dequeue(&rq->skb_queue);
357 netif_receive_skb(skb);
358 }
359
360 return i;
361 }
362
nsim_poll(struct napi_struct * napi,int budget)363 static int nsim_poll(struct napi_struct *napi, int budget)
364 {
365 struct nsim_rq *rq = container_of(napi, struct nsim_rq, napi);
366 int done;
367
368 done = nsim_rcv(rq, budget);
369 napi_complete(napi);
370
371 return done;
372 }
373
nsim_create_page_pool(struct page_pool ** p,struct napi_struct * napi)374 static int nsim_create_page_pool(struct page_pool **p, struct napi_struct *napi)
375 {
376 struct page_pool_params params = {
377 .order = 0,
378 .pool_size = NSIM_RING_SIZE,
379 .nid = NUMA_NO_NODE,
380 .dev = &napi->dev->dev,
381 .napi = napi,
382 .dma_dir = DMA_BIDIRECTIONAL,
383 .netdev = napi->dev,
384 };
385 struct page_pool *pool;
386
387 pool = page_pool_create(¶ms);
388 if (IS_ERR(pool))
389 return PTR_ERR(pool);
390
391 *p = pool;
392 return 0;
393 }
394
nsim_init_napi(struct netdevsim * ns)395 static int nsim_init_napi(struct netdevsim *ns)
396 {
397 struct net_device *dev = ns->netdev;
398 struct nsim_rq *rq;
399 int err, i;
400
401 for (i = 0; i < dev->num_rx_queues; i++) {
402 rq = ns->rq[i];
403
404 netif_napi_add_config(dev, &rq->napi, nsim_poll, i);
405 }
406
407 for (i = 0; i < dev->num_rx_queues; i++) {
408 rq = ns->rq[i];
409
410 err = nsim_create_page_pool(&rq->page_pool, &rq->napi);
411 if (err)
412 goto err_pp_destroy;
413 }
414
415 return 0;
416
417 err_pp_destroy:
418 while (i--) {
419 page_pool_destroy(ns->rq[i]->page_pool);
420 ns->rq[i]->page_pool = NULL;
421 }
422
423 for (i = 0; i < dev->num_rx_queues; i++)
424 __netif_napi_del(&ns->rq[i]->napi);
425
426 return err;
427 }
428
nsim_enable_napi(struct netdevsim * ns)429 static void nsim_enable_napi(struct netdevsim *ns)
430 {
431 struct net_device *dev = ns->netdev;
432 int i;
433
434 for (i = 0; i < dev->num_rx_queues; i++) {
435 struct nsim_rq *rq = ns->rq[i];
436
437 netif_queue_set_napi(dev, i, NETDEV_QUEUE_TYPE_RX, &rq->napi);
438 napi_enable(&rq->napi);
439 }
440 }
441
/* ndo_open: set up NAPI instances and page pools, then enable NAPI.
 *
 * Return: 0 on success, negative errno from nsim_init_napi().
 */
static int nsim_open(struct net_device *dev)
{
	struct netdevsim *ns = netdev_priv(dev);
	int err = nsim_init_napi(ns);

	if (!err)
		nsim_enable_napi(ns);

	return err;
}
455
nsim_del_napi(struct netdevsim * ns)456 static void nsim_del_napi(struct netdevsim *ns)
457 {
458 struct net_device *dev = ns->netdev;
459 int i;
460
461 for (i = 0; i < dev->num_rx_queues; i++) {
462 struct nsim_rq *rq = ns->rq[i];
463
464 napi_disable(&rq->napi);
465 __netif_napi_del(&rq->napi);
466 }
467 synchronize_net();
468
469 for (i = 0; i < dev->num_rx_queues; i++) {
470 page_pool_destroy(ns->rq[i]->page_pool);
471 ns->rq[i]->page_pool = NULL;
472 }
473 }
474
nsim_stop(struct net_device * dev)475 static int nsim_stop(struct net_device *dev)
476 {
477 struct netdevsim *ns = netdev_priv(dev);
478 struct netdevsim *peer;
479
480 netif_carrier_off(dev);
481 peer = rtnl_dereference(ns->peer);
482 if (peer)
483 netif_carrier_off(peer->netdev);
484
485 nsim_del_napi(ns);
486
487 return 0;
488 }
489
/* net_shaper_ops .set stub: accepts every request and does nothing.
 *
 * Return: always 0.
 */
static int nsim_shaper_set(struct net_shaper_binding *binding,
			   const struct net_shaper *shaper,
			   struct netlink_ext_ack *extack)
{
	return 0;
}
496
/* net_shaper_ops .delete stub: accepts every request and does nothing.
 *
 * Return: always 0.
 */
static int nsim_shaper_del(struct net_shaper_binding *binding,
			   const struct net_shaper_handle *handle,
			   struct netlink_ext_ack *extack)
{
	return 0;
}
503
/* net_shaper_ops .group stub: accepts every request and does nothing.
 *
 * Return: always 0.
 */
static int nsim_shaper_group(struct net_shaper_binding *binding,
			     int leaves_count,
			     const struct net_shaper *leaves,
			     const struct net_shaper *root,
			     struct netlink_ext_ack *extack)
{
	return 0;
}
512
/* net_shaper_ops .capabilities stub: sets every bit of *@flags regardless
 * of @scope.
 */
static void nsim_shaper_cap(struct net_shaper_binding *binding,
			    enum net_shaper_scope scope,
			    unsigned long *flags)
{
	*flags = ULONG_MAX;
}
519
/* Shaper callbacks, all stubs; referenced from nsim_netdev_ops. */
static const struct net_shaper_ops nsim_shaper_ops = {
	.set = nsim_shaper_set,
	.delete = nsim_shaper_del,
	.group = nsim_shaper_group,
	.capabilities = nsim_shaper_cap,
};
526
/* netdev ops installed by nsim_init_netdevsim(), i.e. for PF ports.
 * netdev_is_nsim() identifies netdevsim devices by this table.
 */
static const struct net_device_ops nsim_netdev_ops = {
	.ndo_start_xmit = nsim_start_xmit,
	.ndo_set_rx_mode = nsim_set_rx_mode,
	.ndo_set_mac_address = eth_mac_addr,
	.ndo_validate_addr = eth_validate_addr,
	.ndo_change_mtu = nsim_change_mtu,
	.ndo_get_stats64 = nsim_get_stats64,
	.ndo_set_vf_mac = nsim_set_vf_mac,
	.ndo_set_vf_vlan = nsim_set_vf_vlan,
	.ndo_set_vf_rate = nsim_set_vf_rate,
	.ndo_set_vf_spoofchk = nsim_set_vf_spoofchk,
	.ndo_set_vf_trust = nsim_set_vf_trust,
	.ndo_get_vf_config = nsim_get_vf_config,
	.ndo_set_vf_link_state = nsim_set_vf_link_state,
	.ndo_set_vf_rss_query_en = nsim_set_vf_rss_query_en,
	.ndo_setup_tc = nsim_setup_tc,
	.ndo_set_features = nsim_set_features,
	.ndo_get_iflink = nsim_get_iflink,
	.ndo_bpf = nsim_bpf,
	.ndo_open = nsim_open,
	.ndo_stop = nsim_stop,
	.net_shaper_ops = &nsim_shaper_ops,
};
550
/* Reduced netdev ops installed by nsim_init_netdevsim_vf(): no VF
 * management, open/stop, BPF, iflink or shaper callbacks.
 */
static const struct net_device_ops nsim_vf_netdev_ops = {
	.ndo_start_xmit = nsim_start_xmit,
	.ndo_set_rx_mode = nsim_set_rx_mode,
	.ndo_set_mac_address = eth_mac_addr,
	.ndo_validate_addr = eth_validate_addr,
	.ndo_change_mtu = nsim_change_mtu,
	.ndo_get_stats64 = nsim_get_stats64,
	.ndo_setup_tc = nsim_setup_tc,
	.ndo_set_features = nsim_set_features,
};
561
562 /* We don't have true per-queue stats, yet, so do some random fakery here.
563 * Only report stuff for queue 0.
564 */
nsim_get_queue_stats_rx(struct net_device * dev,int idx,struct netdev_queue_stats_rx * stats)565 static void nsim_get_queue_stats_rx(struct net_device *dev, int idx,
566 struct netdev_queue_stats_rx *stats)
567 {
568 struct rtnl_link_stats64 rtstats = {};
569
570 if (!idx)
571 nsim_get_stats64(dev, &rtstats);
572
573 stats->packets = rtstats.rx_packets - !!rtstats.rx_packets;
574 stats->bytes = rtstats.rx_bytes;
575 }
576
nsim_get_queue_stats_tx(struct net_device * dev,int idx,struct netdev_queue_stats_tx * stats)577 static void nsim_get_queue_stats_tx(struct net_device *dev, int idx,
578 struct netdev_queue_stats_tx *stats)
579 {
580 struct rtnl_link_stats64 rtstats = {};
581
582 if (!idx)
583 nsim_get_stats64(dev, &rtstats);
584
585 stats->packets = rtstats.tx_packets - !!rtstats.tx_packets;
586 stats->bytes = rtstats.tx_bytes;
587 }
588
nsim_get_base_stats(struct net_device * dev,struct netdev_queue_stats_rx * rx,struct netdev_queue_stats_tx * tx)589 static void nsim_get_base_stats(struct net_device *dev,
590 struct netdev_queue_stats_rx *rx,
591 struct netdev_queue_stats_tx *tx)
592 {
593 struct rtnl_link_stats64 rtstats = {};
594
595 nsim_get_stats64(dev, &rtstats);
596
597 rx->packets = !!rtstats.rx_packets;
598 rx->bytes = 0;
599 tx->packets = !!rtstats.tx_packets;
600 tx->bytes = 0;
601 }
602
/* Queue statistics callbacks, installed by nsim_init_netdevsim(). */
static const struct netdev_stat_ops nsim_stat_ops = {
	.get_queue_stats_tx = nsim_get_queue_stats_tx,
	.get_queue_stats_rx = nsim_get_queue_stats_rx,
	.get_base_stats = nsim_get_base_stats,
};
608
nsim_queue_alloc(void)609 static struct nsim_rq *nsim_queue_alloc(void)
610 {
611 struct nsim_rq *rq;
612
613 rq = kzalloc(sizeof(*rq), GFP_KERNEL_ACCOUNT);
614 if (!rq)
615 return NULL;
616
617 skb_queue_head_init(&rq->skb_queue);
618 return rq;
619 }
620
/* Free @rq after purging any skbs still on its backlog (recorded with drop
 * reason SKB_DROP_REASON_QUEUE_PURGE). The page pool is not touched here.
 */
static void nsim_queue_free(struct nsim_rq *rq)
{
	skb_queue_purge_reason(&rq->skb_queue, SKB_DROP_REASON_QUEUE_PURGE);
	kfree(rq);
}
626
/* Queue reset mode is controlled by ns->rq_reset_mode.
 * - normal - new NAPI new pool (old NAPI enabled when new added)
 * - mode 1 - allocate new pool (NAPI is only disabled / enabled)
 * - mode 2 - new NAPI new pool (old NAPI removed before new added)
 * - mode 3 - new NAPI new pool (old NAPI disabled when new added)
 *
 * Per-queue memory exchanged through the queue management callbacks:
 * @rq: whole queue - the replacement allocated by nsim_queue_mem_alloc(),
 *      or the old queue saved by nsim_queue_stop() (all modes except 1)
 * @pp: page pool only - the new pool created by nsim_queue_mem_alloc(), or
 *      the old pool saved by nsim_queue_stop() (mode 1)
 */
struct nsim_queue_mem {
	struct nsim_rq *rq;
	struct page_pool *pp;
};
637
638 static int
nsim_queue_mem_alloc(struct net_device * dev,void * per_queue_mem,int idx)639 nsim_queue_mem_alloc(struct net_device *dev, void *per_queue_mem, int idx)
640 {
641 struct nsim_queue_mem *qmem = per_queue_mem;
642 struct netdevsim *ns = netdev_priv(dev);
643 int err;
644
645 if (ns->rq_reset_mode > 3)
646 return -EINVAL;
647
648 if (ns->rq_reset_mode == 1)
649 return nsim_create_page_pool(&qmem->pp, &ns->rq[idx]->napi);
650
651 qmem->rq = nsim_queue_alloc();
652 if (!qmem->rq)
653 return -ENOMEM;
654
655 err = nsim_create_page_pool(&qmem->rq->page_pool, &qmem->rq->napi);
656 if (err)
657 goto err_free;
658
659 if (!ns->rq_reset_mode)
660 netif_napi_add_config(dev, &qmem->rq->napi, nsim_poll, idx);
661
662 return 0;
663
664 err_free:
665 nsim_queue_free(qmem->rq);
666 return err;
667 }
668
nsim_queue_mem_free(struct net_device * dev,void * per_queue_mem)669 static void nsim_queue_mem_free(struct net_device *dev, void *per_queue_mem)
670 {
671 struct nsim_queue_mem *qmem = per_queue_mem;
672 struct netdevsim *ns = netdev_priv(dev);
673
674 page_pool_destroy(qmem->pp);
675 if (qmem->rq) {
676 if (!ns->rq_reset_mode)
677 netif_napi_del(&qmem->rq->napi);
678 page_pool_destroy(qmem->rq->page_pool);
679 nsim_queue_free(qmem->rq);
680 }
681 }
682
683 static int
nsim_queue_start(struct net_device * dev,void * per_queue_mem,int idx)684 nsim_queue_start(struct net_device *dev, void *per_queue_mem, int idx)
685 {
686 struct nsim_queue_mem *qmem = per_queue_mem;
687 struct netdevsim *ns = netdev_priv(dev);
688
689 if (ns->rq_reset_mode == 1) {
690 ns->rq[idx]->page_pool = qmem->pp;
691 napi_enable(&ns->rq[idx]->napi);
692 return 0;
693 }
694
695 /* netif_napi_add()/_del() should normally be called from alloc/free,
696 * here we want to test various call orders.
697 */
698 if (ns->rq_reset_mode == 2) {
699 netif_napi_del(&ns->rq[idx]->napi);
700 netif_napi_add_config(dev, &qmem->rq->napi, nsim_poll, idx);
701 } else if (ns->rq_reset_mode == 3) {
702 netif_napi_add_config(dev, &qmem->rq->napi, nsim_poll, idx);
703 netif_napi_del(&ns->rq[idx]->napi);
704 }
705
706 ns->rq[idx] = qmem->rq;
707 napi_enable(&ns->rq[idx]->napi);
708
709 return 0;
710 }
711
nsim_queue_stop(struct net_device * dev,void * per_queue_mem,int idx)712 static int nsim_queue_stop(struct net_device *dev, void *per_queue_mem, int idx)
713 {
714 struct nsim_queue_mem *qmem = per_queue_mem;
715 struct netdevsim *ns = netdev_priv(dev);
716
717 napi_disable(&ns->rq[idx]->napi);
718
719 if (ns->rq_reset_mode == 1) {
720 qmem->pp = ns->rq[idx]->page_pool;
721 page_pool_disable_direct_recycling(qmem->pp);
722 } else {
723 qmem->rq = ns->rq[idx];
724 }
725
726 return 0;
727 }
728
/* Queue management callbacks, installed by nsim_init_netdevsim(). The
 * per-queue memory passed to the callbacks is a struct nsim_queue_mem.
 */
static const struct netdev_queue_mgmt_ops nsim_queue_mgmt_ops = {
	.ndo_queue_mem_size = sizeof(struct nsim_queue_mem),
	.ndo_queue_mem_alloc = nsim_queue_mem_alloc,
	.ndo_queue_mem_free = nsim_queue_mem_free,
	.ndo_queue_start = nsim_queue_start,
	.ndo_queue_stop = nsim_queue_stop,
};
736
737 static ssize_t
nsim_qreset_write(struct file * file,const char __user * data,size_t count,loff_t * ppos)738 nsim_qreset_write(struct file *file, const char __user *data,
739 size_t count, loff_t *ppos)
740 {
741 struct netdevsim *ns = file->private_data;
742 unsigned int queue, mode;
743 char buf[32];
744 ssize_t ret;
745
746 if (count >= sizeof(buf))
747 return -EINVAL;
748 if (copy_from_user(buf, data, count))
749 return -EFAULT;
750 buf[count] = '\0';
751
752 ret = sscanf(buf, "%u %u", &queue, &mode);
753 if (ret != 2)
754 return -EINVAL;
755
756 rtnl_lock();
757 if (!netif_running(ns->netdev)) {
758 ret = -ENETDOWN;
759 goto exit_unlock;
760 }
761
762 if (queue >= ns->netdev->real_num_rx_queues) {
763 ret = -EINVAL;
764 goto exit_unlock;
765 }
766
767 ns->rq_reset_mode = mode;
768 ret = netdev_rx_queue_restart(ns->netdev, queue);
769 ns->rq_reset_mode = 0;
770 if (ret)
771 goto exit_unlock;
772
773 ret = count;
774 exit_unlock:
775 rtnl_unlock();
776 return ret;
777 }
778
/* Write-only file operations for the "queue_reset" debugfs file created in
 * nsim_create().
 */
static const struct file_operations nsim_qreset_fops = {
	.open = simple_open,
	.write = nsim_qreset_write,
	.owner = THIS_MODULE,
};
784
785 static ssize_t
nsim_pp_hold_read(struct file * file,char __user * data,size_t count,loff_t * ppos)786 nsim_pp_hold_read(struct file *file, char __user *data,
787 size_t count, loff_t *ppos)
788 {
789 struct netdevsim *ns = file->private_data;
790 char buf[3] = "n\n";
791
792 if (ns->page)
793 buf[0] = 'y';
794
795 return simple_read_from_buffer(data, count, ppos, buf, 2);
796 }
797
798 static ssize_t
nsim_pp_hold_write(struct file * file,const char __user * data,size_t count,loff_t * ppos)799 nsim_pp_hold_write(struct file *file, const char __user *data,
800 size_t count, loff_t *ppos)
801 {
802 struct netdevsim *ns = file->private_data;
803 ssize_t ret;
804 bool val;
805
806 ret = kstrtobool_from_user(data, count, &val);
807 if (ret)
808 return ret;
809
810 rtnl_lock();
811 ret = count;
812 if (val == !!ns->page)
813 goto exit;
814
815 if (!netif_running(ns->netdev) && val) {
816 ret = -ENETDOWN;
817 } else if (val) {
818 ns->page = page_pool_dev_alloc_pages(ns->rq[0]->page_pool);
819 if (!ns->page)
820 ret = -ENOMEM;
821 } else {
822 page_pool_put_full_page(ns->page->pp, ns->page, false);
823 ns->page = NULL;
824 }
825
826 exit:
827 rtnl_unlock();
828 return ret;
829 }
830
/* File operations for the "pp_hold" debugfs file created in nsim_create(). */
static const struct file_operations nsim_pp_hold_fops = {
	.open = simple_open,
	.read = nsim_pp_hold_read,
	.write = nsim_pp_hold_write,
	.llseek = generic_file_llseek,
	.owner = THIS_MODULE,
};
838
nsim_setup(struct net_device * dev)839 static void nsim_setup(struct net_device *dev)
840 {
841 ether_setup(dev);
842 eth_hw_addr_random(dev);
843
844 dev->tx_queue_len = 0;
845 dev->flags &= ~IFF_MULTICAST;
846 dev->priv_flags |= IFF_LIVE_ADDR_CHANGE |
847 IFF_NO_QUEUE;
848 dev->features |= NETIF_F_HIGHDMA |
849 NETIF_F_SG |
850 NETIF_F_FRAGLIST |
851 NETIF_F_HW_CSUM |
852 NETIF_F_TSO;
853 dev->hw_features |= NETIF_F_HW_TC |
854 NETIF_F_SG |
855 NETIF_F_FRAGLIST |
856 NETIF_F_HW_CSUM |
857 NETIF_F_TSO;
858 dev->max_mtu = ETH_MAX_MTU;
859 dev->xdp_features = NETDEV_XDP_ACT_HW_OFFLOAD;
860 }
861
nsim_queue_init(struct netdevsim * ns)862 static int nsim_queue_init(struct netdevsim *ns)
863 {
864 struct net_device *dev = ns->netdev;
865 int i;
866
867 ns->rq = kcalloc(dev->num_rx_queues, sizeof(*ns->rq),
868 GFP_KERNEL_ACCOUNT);
869 if (!ns->rq)
870 return -ENOMEM;
871
872 for (i = 0; i < dev->num_rx_queues; i++) {
873 ns->rq[i] = nsim_queue_alloc();
874 if (!ns->rq[i])
875 goto err_free_prev;
876 }
877
878 return 0;
879
880 err_free_prev:
881 while (i--)
882 kfree(ns->rq[i]);
883 kfree(ns->rq);
884 return -ENOMEM;
885 }
886
nsim_queue_uninit(struct netdevsim * ns)887 static void nsim_queue_uninit(struct netdevsim *ns)
888 {
889 struct net_device *dev = ns->netdev;
890 int i;
891
892 for (i = 0; i < dev->num_rx_queues; i++)
893 nsim_queue_free(ns->rq[i]);
894
895 kfree(ns->rq);
896 ns->rq = NULL;
897 }
898
nsim_init_netdevsim(struct netdevsim * ns)899 static int nsim_init_netdevsim(struct netdevsim *ns)
900 {
901 struct mock_phc *phc;
902 int err;
903
904 phc = mock_phc_create(&ns->nsim_bus_dev->dev);
905 if (IS_ERR(phc))
906 return PTR_ERR(phc);
907
908 ns->phc = phc;
909 ns->netdev->netdev_ops = &nsim_netdev_ops;
910 ns->netdev->stat_ops = &nsim_stat_ops;
911 ns->netdev->queue_mgmt_ops = &nsim_queue_mgmt_ops;
912
913 err = nsim_udp_tunnels_info_create(ns->nsim_dev, ns->netdev);
914 if (err)
915 goto err_phc_destroy;
916
917 rtnl_lock();
918 err = nsim_queue_init(ns);
919 if (err)
920 goto err_utn_destroy;
921
922 err = nsim_bpf_init(ns);
923 if (err)
924 goto err_rq_destroy;
925
926 nsim_macsec_init(ns);
927 nsim_ipsec_init(ns);
928
929 err = register_netdevice(ns->netdev);
930 if (err)
931 goto err_ipsec_teardown;
932 rtnl_unlock();
933 return 0;
934
935 err_ipsec_teardown:
936 nsim_ipsec_teardown(ns);
937 nsim_macsec_teardown(ns);
938 nsim_bpf_uninit(ns);
939 err_rq_destroy:
940 nsim_queue_uninit(ns);
941 err_utn_destroy:
942 rtnl_unlock();
943 nsim_udp_tunnels_info_destroy(ns->netdev);
944 err_phc_destroy:
945 mock_phc_destroy(ns->phc);
946 return err;
947 }
948
nsim_init_netdevsim_vf(struct netdevsim * ns)949 static int nsim_init_netdevsim_vf(struct netdevsim *ns)
950 {
951 int err;
952
953 ns->netdev->netdev_ops = &nsim_vf_netdev_ops;
954 rtnl_lock();
955 err = register_netdevice(ns->netdev);
956 rtnl_unlock();
957 return err;
958 }
959
/* Release the UDP tunnel info and the mock PHC that nsim_init_netdevsim()
 * created. nsim_destroy() calls this for PF ports only.
 */
static void nsim_exit_netdevsim(struct netdevsim *ns)
{
	nsim_udp_tunnels_info_destroy(ns->netdev);
	mock_phc_destroy(ns->phc);
}
965
966 struct netdevsim *
nsim_create(struct nsim_dev * nsim_dev,struct nsim_dev_port * nsim_dev_port)967 nsim_create(struct nsim_dev *nsim_dev, struct nsim_dev_port *nsim_dev_port)
968 {
969 struct net_device *dev;
970 struct netdevsim *ns;
971 int err;
972
973 dev = alloc_netdev_mq(sizeof(*ns), "eth%d", NET_NAME_UNKNOWN, nsim_setup,
974 nsim_dev->nsim_bus_dev->num_queues);
975 if (!dev)
976 return ERR_PTR(-ENOMEM);
977
978 dev_net_set(dev, nsim_dev_net(nsim_dev));
979 ns = netdev_priv(dev);
980 ns->netdev = dev;
981 u64_stats_init(&ns->syncp);
982 ns->nsim_dev = nsim_dev;
983 ns->nsim_dev_port = nsim_dev_port;
984 ns->nsim_bus_dev = nsim_dev->nsim_bus_dev;
985 SET_NETDEV_DEV(dev, &ns->nsim_bus_dev->dev);
986 SET_NETDEV_DEVLINK_PORT(dev, &nsim_dev_port->devlink_port);
987 nsim_ethtool_init(ns);
988 if (nsim_dev_port_is_pf(nsim_dev_port))
989 err = nsim_init_netdevsim(ns);
990 else
991 err = nsim_init_netdevsim_vf(ns);
992 if (err)
993 goto err_free_netdev;
994
995 ns->pp_dfs = debugfs_create_file("pp_hold", 0600, nsim_dev_port->ddir,
996 ns, &nsim_pp_hold_fops);
997 ns->qr_dfs = debugfs_create_file("queue_reset", 0200,
998 nsim_dev_port->ddir, ns,
999 &nsim_qreset_fops);
1000
1001 return ns;
1002
1003 err_free_netdev:
1004 free_netdev(dev);
1005 return ERR_PTR(err);
1006 }
1007
/* Tear down and free a netdevsim instance created by nsim_create().
 *
 * Removes the debugfs files, unlinks the peer (both directions),
 * unregisters the netdev and, for PF ports, undoes the extra state set up
 * by nsim_init_netdevsim(). Any page still held via "pp_hold" is returned
 * to its page pool last, just before the netdev is freed.
 */
void nsim_destroy(struct netdevsim *ns)
{
	struct net_device *dev = ns->netdev;
	struct netdevsim *peer;

	debugfs_remove(ns->qr_dfs);
	debugfs_remove(ns->pp_dfs);

	rtnl_lock();
	/* Break the peer link in both directions before unregistering. */
	peer = rtnl_dereference(ns->peer);
	if (peer)
		RCU_INIT_POINTER(peer->peer, NULL);
	RCU_INIT_POINTER(ns->peer, NULL);
	unregister_netdevice(dev);
	if (nsim_dev_port_is_pf(ns->nsim_dev_port)) {
		nsim_macsec_teardown(ns);
		nsim_ipsec_teardown(ns);
		nsim_bpf_uninit(ns);
		nsim_queue_uninit(ns);
	}
	rtnl_unlock();
	/* UDP tunnel info and PHC are released outside RTNL, mirroring where
	 * nsim_init_netdevsim() sets them up.
	 */
	if (nsim_dev_port_is_pf(ns->nsim_dev_port))
		nsim_exit_netdevsim(ns);

	/* Put this intentionally late to exercise the orphaning path */
	if (ns->page) {
		page_pool_put_full_page(ns->page->pp, ns->page, false);
		ns->page = NULL;
	}

	free_netdev(dev);
}
1040
/* Return true if @dev uses nsim_netdev_ops. Devices set up by
 * nsim_init_netdevsim_vf() use nsim_vf_netdev_ops and therefore report
 * false.
 */
bool netdev_is_nsim(struct net_device *dev)
{
	return dev->netdev_ops == &nsim_netdev_ops;
}
1045
/* rtnl_link_ops validate hook: always fails with -EOPNOTSUPP and sets an
 * extack message pointing at the sysfs new_device interface.
 */
static int nsim_validate(struct nlattr *tb[], struct nlattr *data[],
			 struct netlink_ext_ack *extack)
{
	NL_SET_ERR_MSG_MOD(extack,
			   "Please use: echo \"[ID] [PORT_COUNT] [NUM_QUEUES]\" > /sys/bus/netdevsim/new_device");
	return -EOPNOTSUPP;
}
1053
/* rtnl link ops registered at module init; the only hook is .validate,
 * which rejects every request.
 */
static struct rtnl_link_ops nsim_link_ops __read_mostly = {
	.kind = DRV_NAME,
	.validate = nsim_validate,
};
1058
nsim_module_init(void)1059 static int __init nsim_module_init(void)
1060 {
1061 int err;
1062
1063 err = nsim_dev_init();
1064 if (err)
1065 return err;
1066
1067 err = nsim_bus_init();
1068 if (err)
1069 goto err_dev_exit;
1070
1071 err = rtnl_link_register(&nsim_link_ops);
1072 if (err)
1073 goto err_bus_exit;
1074
1075 return 0;
1076
1077 err_bus_exit:
1078 nsim_bus_exit();
1079 err_dev_exit:
1080 nsim_dev_exit();
1081 return err;
1082 }
1083
/* Module exit: undo nsim_module_init() in reverse order. */
static void __exit nsim_module_exit(void)
{
	rtnl_link_unregister(&nsim_link_ops);
	nsim_bus_exit();
	nsim_dev_exit();
}
1090
/* Module entry/exit points and metadata. */
module_init(nsim_module_init);
module_exit(nsim_module_exit);
MODULE_LICENSE("GPL");
MODULE_DESCRIPTION("Simulated networking device for testing");
MODULE_ALIAS_RTNL_LINK(DRV_NAME);
1096