xref: /linux/drivers/net/netdevsim/netdev.c (revision 07fdad3a93756b872da7b53647715c48d0f4a2d0)
/*
 * Copyright (C) 2017 Netronome Systems, Inc.
 *
 * This software is licensed under the GNU General Public License Version 2,
 * June 1991 as shown in the file COPYING in the top-level directory of this
 * source tree.
 *
 * THE COPYRIGHT HOLDERS AND/OR OTHER PARTIES PROVIDE THE PROGRAM "AS IS"
 * WITHOUT WARRANTY OF ANY KIND, EITHER EXPRESSED OR IMPLIED, INCLUDING,
 * BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
 * FOR A PARTICULAR PURPOSE. THE ENTIRE RISK AS TO THE QUALITY AND PERFORMANCE
 * OF THE PROGRAM IS WITH YOU. SHOULD THE PROGRAM PROVE DEFECTIVE, YOU ASSUME
 * THE COST OF ALL NECESSARY SERVICING, REPAIR OR CORRECTION.
 */

#include <linux/debugfs.h>
#include <linux/etherdevice.h>
#include <linux/ethtool_netlink.h>
#include <linux/kernel.h>
#include <linux/module.h>
#include <linux/netdevice.h>
#include <linux/slab.h>
#include <net/netdev_queues.h>
#include <net/netdev_rx_queue.h>
#include <net/page_pool/helpers.h>
#include <net/netlink.h>
#include <net/net_shaper.h>
#include <net/netdev_lock.h>
#include <net/pkt_cls.h>
#include <net/rtnetlink.h>
#include <net/udp_tunnel.h>
#include <net/busy_poll.h>

#include "netdevsim.h"

MODULE_IMPORT_NS("NETDEV_INTERNAL");

#define NSIM_RING_SIZE		256

static void nsim_start_peer_tx_queue(struct net_device *dev, struct nsim_rq *rq)
{
	struct netdevsim *ns = netdev_priv(dev);
	struct net_device *peer_dev;
	struct netdevsim *peer_ns;
	struct netdev_queue *txq;
	u16 idx;

	idx = rq->napi.index;
	rcu_read_lock();
	peer_ns = rcu_dereference(ns->peer);
	if (!peer_ns)
		goto out;

	/* TX device */
	peer_dev = peer_ns->netdev;
	if (dev->real_num_tx_queues != peer_dev->num_rx_queues)
		goto out;

	txq = netdev_get_tx_queue(peer_dev, idx);
	if (!netif_tx_queue_stopped(txq))
		goto out;

	netif_tx_wake_queue(txq);
out:
	rcu_read_unlock();
}

static void nsim_stop_tx_queue(struct net_device *tx_dev,
			       struct net_device *rx_dev,
			       struct nsim_rq *rq,
			       u16 idx)
{
	/* If the queue counts differ, do not stop the queue: it is not
	 * easy to tell which TX queue this RX queue is mapped to.
	 */
	if (rx_dev->real_num_tx_queues != tx_dev->num_rx_queues)
		return;

	/* rq is the queue on the receive side */
	netif_subqueue_try_stop(tx_dev, idx,
				NSIM_RING_SIZE - skb_queue_len(&rq->skb_queue),
				NSIM_RING_SIZE / 2);
}
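
/* The wake side lives in nsim_start_peer_tx_queue() above, invoked from
 * the peer's NAPI poll (nsim_rcv()) once its skb_queue has drained,
 * mirroring real drivers that restart TX from the completion path.
 */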

static int nsim_napi_rx(struct net_device *tx_dev, struct net_device *rx_dev,
			struct nsim_rq *rq, struct sk_buff *skb)
{
	if (skb_queue_len(&rq->skb_queue) > NSIM_RING_SIZE) {
		dev_kfree_skb_any(skb);
		return NET_RX_DROP;
	}

	skb_queue_tail(&rq->skb_queue, skb);

	/* Stop the peer TX queue to avoid dropping packets later */
	if (skb_queue_len(&rq->skb_queue) >= NSIM_RING_SIZE)
		nsim_stop_tx_queue(tx_dev, rx_dev, rq,
				   skb_get_queue_mapping(skb));

	return NET_RX_SUCCESS;
}

static int nsim_forward_skb(struct net_device *tx_dev,
			    struct net_device *rx_dev,
			    struct sk_buff *skb,
			    struct nsim_rq *rq,
			    struct skb_ext *psp_ext)
{
	int ret;

	ret = __dev_forward_skb(rx_dev, skb);
	if (ret)
		return ret;

	nsim_psp_handle_ext(skb, psp_ext);

	return nsim_napi_rx(tx_dev, rx_dev, rq, skb);
}

static netdev_tx_t nsim_start_xmit(struct sk_buff *skb, struct net_device *dev)
{
	struct netdevsim *ns = netdev_priv(dev);
	struct skb_ext *psp_ext = NULL;
	struct net_device *peer_dev;
	unsigned int len = skb->len;
	struct netdevsim *peer_ns;
	struct netdev_config *cfg;
	struct nsim_rq *rq;
	int rxq;
	int dr;

	rcu_read_lock();
	if (!nsim_ipsec_tx(ns, skb))
		goto out_drop_any;

	peer_ns = rcu_dereference(ns->peer);
	if (!peer_ns)
		goto out_drop_any;

	dr = nsim_do_psp(skb, ns, peer_ns, &psp_ext);
	if (dr)
		goto out_drop_free;

	peer_dev = peer_ns->netdev;
	rxq = skb_get_queue_mapping(skb);
	if (rxq >= peer_dev->num_rx_queues)
		rxq = rxq % peer_dev->num_rx_queues;
	rq = peer_ns->rq[rxq];

	cfg = peer_dev->cfg;
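	/* Emulate header/data split: the skb stays non-linear only when the
	 * peer has TCP data split enabled and the frame is at least
	 * hds_thresh bytes long; otherwise it is linearized, as on a
	 * device without HDS support.
	 */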
	if (skb_is_nonlinear(skb) &&
	    (cfg->hds_config != ETHTOOL_TCP_DATA_SPLIT_ENABLED ||
	     (cfg->hds_config == ETHTOOL_TCP_DATA_SPLIT_ENABLED &&
	      cfg->hds_thresh > len)))
		skb_linearize(skb);

	skb_tx_timestamp(skb);
	if (unlikely(nsim_forward_skb(dev, peer_dev,
				      skb, rq, psp_ext) == NET_RX_DROP))
		goto out_drop_cnt;

	if (!hrtimer_active(&rq->napi_timer))
		hrtimer_start(&rq->napi_timer, us_to_ktime(5), HRTIMER_MODE_REL);

	rcu_read_unlock();
	dev_dstats_tx_add(dev, len);
	return NETDEV_TX_OK;

out_drop_any:
	dr = SKB_DROP_REASON_NOT_SPECIFIED;
out_drop_free:
	kfree_skb_reason(skb, dr);
out_drop_cnt:
	rcu_read_unlock();
	dev_dstats_tx_dropped(dev);
	return NETDEV_TX_OK;
}

static void nsim_set_rx_mode(struct net_device *dev)
{
}

static int nsim_change_mtu(struct net_device *dev, int new_mtu)
{
	struct netdevsim *ns = netdev_priv(dev);

	if (ns->xdp.prog && !ns->xdp.prog->aux->xdp_has_frags &&
	    new_mtu > NSIM_XDP_MAX_MTU)
		return -EBUSY;

	WRITE_ONCE(dev->mtu, new_mtu);

	return 0;
}
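
/* For example (hypothetical device name): with a legacy, non-multi-buf
 * XDP program attached,
 *
 *   ip link set dev $NSIM_DEV mtu 9000
 *
 * fails with -EBUSY once the new MTU exceeds NSIM_XDP_MAX_MTU; detach
 * the program, or use one built with xdp_has_frags, before raising the
 * MTU.
 */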

static int
nsim_setup_tc_block_cb(enum tc_setup_type type, void *type_data, void *cb_priv)
{
	return nsim_bpf_setup_tc_block_cb(type, type_data, cb_priv);
}

static int nsim_set_vf_mac(struct net_device *dev, int vf, u8 *mac)
{
	struct netdevsim *ns = netdev_priv(dev);
	struct nsim_dev *nsim_dev = ns->nsim_dev;

	/* Only refuse multicast addresses, zero address can mean unset/any. */
	if (vf >= nsim_dev_get_vfs(nsim_dev) || is_multicast_ether_addr(mac))
		return -EINVAL;
	memcpy(nsim_dev->vfconfigs[vf].vf_mac, mac, ETH_ALEN);

	return 0;
}

static int nsim_set_vf_vlan(struct net_device *dev, int vf,
			    u16 vlan, u8 qos, __be16 vlan_proto)
{
	struct netdevsim *ns = netdev_priv(dev);
	struct nsim_dev *nsim_dev = ns->nsim_dev;

	if (vf >= nsim_dev_get_vfs(nsim_dev) || vlan > 4095 || qos > 7)
		return -EINVAL;

	nsim_dev->vfconfigs[vf].vlan = vlan;
	nsim_dev->vfconfigs[vf].qos = qos;
	nsim_dev->vfconfigs[vf].vlan_proto = vlan_proto;

	return 0;
}

static int nsim_set_vf_rate(struct net_device *dev, int vf, int min, int max)
{
	struct netdevsim *ns = netdev_priv(dev);
	struct nsim_dev *nsim_dev = ns->nsim_dev;

	if (nsim_esw_mode_is_switchdev(ns->nsim_dev)) {
		pr_err("Not supported in switchdev mode. Please use devlink API.\n");
		return -EOPNOTSUPP;
	}

	if (vf >= nsim_dev_get_vfs(nsim_dev))
		return -EINVAL;

	nsim_dev->vfconfigs[vf].min_tx_rate = min;
	nsim_dev->vfconfigs[vf].max_tx_rate = max;

	return 0;
}

static int nsim_set_vf_spoofchk(struct net_device *dev, int vf, bool val)
{
	struct netdevsim *ns = netdev_priv(dev);
	struct nsim_dev *nsim_dev = ns->nsim_dev;

	if (vf >= nsim_dev_get_vfs(nsim_dev))
		return -EINVAL;
	nsim_dev->vfconfigs[vf].spoofchk_enabled = val;

	return 0;
}

static int nsim_set_vf_rss_query_en(struct net_device *dev, int vf, bool val)
{
	struct netdevsim *ns = netdev_priv(dev);
	struct nsim_dev *nsim_dev = ns->nsim_dev;

	if (vf >= nsim_dev_get_vfs(nsim_dev))
		return -EINVAL;
	nsim_dev->vfconfigs[vf].rss_query_enabled = val;

	return 0;
}

static int nsim_set_vf_trust(struct net_device *dev, int vf, bool val)
{
	struct netdevsim *ns = netdev_priv(dev);
	struct nsim_dev *nsim_dev = ns->nsim_dev;

	if (vf >= nsim_dev_get_vfs(nsim_dev))
		return -EINVAL;
	nsim_dev->vfconfigs[vf].trusted = val;

	return 0;
}

static int
nsim_get_vf_config(struct net_device *dev, int vf, struct ifla_vf_info *ivi)
{
	struct netdevsim *ns = netdev_priv(dev);
	struct nsim_dev *nsim_dev = ns->nsim_dev;

	if (vf >= nsim_dev_get_vfs(nsim_dev))
		return -EINVAL;

	ivi->vf = vf;
	ivi->linkstate = nsim_dev->vfconfigs[vf].link_state;
	ivi->min_tx_rate = nsim_dev->vfconfigs[vf].min_tx_rate;
	ivi->max_tx_rate = nsim_dev->vfconfigs[vf].max_tx_rate;
	ivi->vlan = nsim_dev->vfconfigs[vf].vlan;
	ivi->vlan_proto = nsim_dev->vfconfigs[vf].vlan_proto;
	ivi->qos = nsim_dev->vfconfigs[vf].qos;
	memcpy(&ivi->mac, nsim_dev->vfconfigs[vf].vf_mac, ETH_ALEN);
	ivi->spoofchk = nsim_dev->vfconfigs[vf].spoofchk_enabled;
	ivi->trusted = nsim_dev->vfconfigs[vf].trusted;
	ivi->rss_query_en = nsim_dev->vfconfigs[vf].rss_query_enabled;

	return 0;
}

static int nsim_set_vf_link_state(struct net_device *dev, int vf, int state)
{
	struct netdevsim *ns = netdev_priv(dev);
	struct nsim_dev *nsim_dev = ns->nsim_dev;

	if (vf >= nsim_dev_get_vfs(nsim_dev))
		return -EINVAL;

	switch (state) {
	case IFLA_VF_LINK_STATE_AUTO:
	case IFLA_VF_LINK_STATE_ENABLE:
	case IFLA_VF_LINK_STATE_DISABLE:
		break;
	default:
		return -EINVAL;
	}

	nsim_dev->vfconfigs[vf].link_state = state;

	return 0;
}

static void nsim_taprio_stats(struct tc_taprio_qopt_stats *stats)
{
	stats->window_drops = 0;
	stats->tx_overruns = 0;
}

static int nsim_setup_tc_taprio(struct net_device *dev,
				struct tc_taprio_qopt_offload *offload)
{
	int err = 0;

	switch (offload->cmd) {
	case TAPRIO_CMD_REPLACE:
	case TAPRIO_CMD_DESTROY:
		break;
	case TAPRIO_CMD_STATS:
		nsim_taprio_stats(&offload->stats);
		break;
	default:
		err = -EOPNOTSUPP;
	}

	return err;
}
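
/* A taprio full-offload request reaching this callback can be created
 * with stock iproute2 (sketch; the interface name and schedule are
 * made up):
 *
 *   tc qdisc replace dev $NSIM_DEV parent root handle 100 taprio \
 *           num_tc 2 map 0 1 queues 1@0 1@1 base-time 0 \
 *           sched-entry S 01 100000 sched-entry S 02 100000 \
 *           flags 0x2
 *
 * flags 0x2 requests full offload, which arrives as TAPRIO_CMD_REPLACE.
 */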

static LIST_HEAD(nsim_block_cb_list);

static int
nsim_setup_tc(struct net_device *dev, enum tc_setup_type type, void *type_data)
{
	struct netdevsim *ns = netdev_priv(dev);

	switch (type) {
	case TC_SETUP_QDISC_TAPRIO:
		return nsim_setup_tc_taprio(dev, type_data);
	case TC_SETUP_BLOCK:
		return flow_block_cb_setup_simple(type_data,
						  &nsim_block_cb_list,
						  nsim_setup_tc_block_cb,
						  ns, ns, true);
	default:
		return -EOPNOTSUPP;
	}
}

static int
nsim_set_features(struct net_device *dev, netdev_features_t features)
{
	struct netdevsim *ns = netdev_priv(dev);

	if ((dev->features & NETIF_F_HW_TC) > (features & NETIF_F_HW_TC))
		return nsim_bpf_disable_tc(ns);

	return 0;
}

static int nsim_get_iflink(const struct net_device *dev)
{
	struct netdevsim *nsim, *peer;
	int iflink;

	nsim = netdev_priv(dev);

	rcu_read_lock();
	peer = rcu_dereference(nsim->peer);
	iflink = peer ? READ_ONCE(peer->netdev->ifindex) :
			READ_ONCE(dev->ifindex);
	rcu_read_unlock();

	return iflink;
}

static int nsim_rcv(struct nsim_rq *rq, int budget)
{
	struct net_device *dev = rq->napi.dev;
	struct bpf_prog *xdp_prog;
	struct netdevsim *ns;
	struct sk_buff *skb;
	unsigned int skblen;
	int i, ret;

	ns = netdev_priv(dev);
	xdp_prog = READ_ONCE(ns->xdp.prog);

	for (i = 0; i < budget; i++) {
		if (skb_queue_empty(&rq->skb_queue))
			break;

		skb = skb_dequeue(&rq->skb_queue);

		if (xdp_prog) {
			/* skb might be freed directly by XDP, save the len */
			skblen = skb->len;

			if (skb->ip_summed == CHECKSUM_PARTIAL)
				skb_checksum_help(skb);
			ret = do_xdp_generic(xdp_prog, &skb);
			if (ret != XDP_PASS) {
				dev_dstats_rx_add(dev, skblen);
				continue;
			}
		}

		/* skb might be discarded by netif_receive_skb(), save the len */
		skblen = skb->len;
		skb_mark_napi_id(skb, &rq->napi);
		ret = netif_receive_skb(skb);
		if (ret == NET_RX_SUCCESS)
			dev_dstats_rx_add(dev, skblen);
		else
			dev_dstats_rx_dropped(dev);
	}

	nsim_start_peer_tx_queue(dev, rq);
	return i;
}

static int nsim_poll(struct napi_struct *napi, int budget)
{
	struct nsim_rq *rq = container_of(napi, struct nsim_rq, napi);
	int done;

	done = nsim_rcv(rq, budget);
	if (done < budget)
		napi_complete_done(napi, done);

	return done;
}

static int nsim_create_page_pool(struct page_pool **p, struct napi_struct *napi)
{
	struct page_pool_params params = {
		.order = 0,
		.pool_size = NSIM_RING_SIZE,
		.nid = NUMA_NO_NODE,
		.dev = &napi->dev->dev,
		.napi = napi,
		.dma_dir = DMA_BIDIRECTIONAL,
		.netdev = napi->dev,
	};
	struct page_pool *pool;

	pool = page_pool_create(&params);
	if (IS_ERR(pool))
		return PTR_ERR(pool);

	*p = pool;
	return 0;
}

static int nsim_init_napi(struct netdevsim *ns)
{
	struct net_device *dev = ns->netdev;
	struct nsim_rq *rq;
	int err, i;

	for (i = 0; i < dev->num_rx_queues; i++) {
		rq = ns->rq[i];

		netif_napi_add_config_locked(dev, &rq->napi, nsim_poll, i);
	}

	for (i = 0; i < dev->num_rx_queues; i++) {
		rq = ns->rq[i];

		err = nsim_create_page_pool(&rq->page_pool, &rq->napi);
		if (err)
			goto err_pp_destroy;
	}

	return 0;

err_pp_destroy:
	while (i--) {
		page_pool_destroy(ns->rq[i]->page_pool);
		ns->rq[i]->page_pool = NULL;
	}

	for (i = 0; i < dev->num_rx_queues; i++)
		__netif_napi_del_locked(&ns->rq[i]->napi);

	return err;
}

static enum hrtimer_restart nsim_napi_schedule(struct hrtimer *timer)
{
	struct nsim_rq *rq;

	rq = container_of(timer, struct nsim_rq, napi_timer);
	napi_schedule(&rq->napi);

	return HRTIMER_NORESTART;
}

static void nsim_rq_timer_init(struct nsim_rq *rq)
{
	hrtimer_setup(&rq->napi_timer, nsim_napi_schedule, CLOCK_MONOTONIC,
		      HRTIMER_MODE_REL);
}

static void nsim_enable_napi(struct netdevsim *ns)
{
	struct net_device *dev = ns->netdev;
	int i;

	for (i = 0; i < dev->num_rx_queues; i++) {
		struct nsim_rq *rq = ns->rq[i];

		netif_queue_set_napi(dev, i, NETDEV_QUEUE_TYPE_RX, &rq->napi);
		napi_enable_locked(&rq->napi);
	}
}

static int nsim_open(struct net_device *dev)
{
	struct netdevsim *ns = netdev_priv(dev);
	int err;

	netdev_assert_locked(dev);

	err = nsim_init_napi(ns);
	if (err)
		return err;

	nsim_enable_napi(ns);

	return 0;
}

static void nsim_del_napi(struct netdevsim *ns)
{
	struct net_device *dev = ns->netdev;
	int i;

	for (i = 0; i < dev->num_rx_queues; i++) {
		struct nsim_rq *rq = ns->rq[i];

		napi_disable_locked(&rq->napi);
		__netif_napi_del_locked(&rq->napi);
	}
	synchronize_net();

	for (i = 0; i < dev->num_rx_queues; i++) {
		page_pool_destroy(ns->rq[i]->page_pool);
		ns->rq[i]->page_pool = NULL;
	}
}

static int nsim_stop(struct net_device *dev)
{
	struct netdevsim *ns = netdev_priv(dev);
	struct netdevsim *peer;

	netdev_assert_locked(dev);

	netif_carrier_off(dev);
	peer = rtnl_dereference(ns->peer);
	if (peer)
		netif_carrier_off(peer->netdev);

	nsim_del_napi(ns);

	return 0;
}

static int nsim_shaper_set(struct net_shaper_binding *binding,
			   const struct net_shaper *shaper,
			   struct netlink_ext_ack *extack)
{
	return 0;
}

static int nsim_shaper_del(struct net_shaper_binding *binding,
			   const struct net_shaper_handle *handle,
			   struct netlink_ext_ack *extack)
{
	return 0;
}

static int nsim_shaper_group(struct net_shaper_binding *binding,
			     int leaves_count,
			     const struct net_shaper *leaves,
			     const struct net_shaper *root,
			     struct netlink_ext_ack *extack)
{
	return 0;
}

static void nsim_shaper_cap(struct net_shaper_binding *binding,
			    enum net_shaper_scope scope,
			    unsigned long *flags)
{
	*flags = ULONG_MAX;
}

static const struct net_shaper_ops nsim_shaper_ops = {
	.set			= nsim_shaper_set,
	.delete			= nsim_shaper_del,
	.group			= nsim_shaper_group,
	.capabilities		= nsim_shaper_cap,
};

static const struct net_device_ops nsim_netdev_ops = {
	.ndo_start_xmit		= nsim_start_xmit,
	.ndo_set_rx_mode	= nsim_set_rx_mode,
	.ndo_set_mac_address	= eth_mac_addr,
	.ndo_validate_addr	= eth_validate_addr,
	.ndo_change_mtu		= nsim_change_mtu,
	.ndo_set_vf_mac		= nsim_set_vf_mac,
	.ndo_set_vf_vlan	= nsim_set_vf_vlan,
	.ndo_set_vf_rate	= nsim_set_vf_rate,
	.ndo_set_vf_spoofchk	= nsim_set_vf_spoofchk,
	.ndo_set_vf_trust	= nsim_set_vf_trust,
	.ndo_get_vf_config	= nsim_get_vf_config,
	.ndo_set_vf_link_state	= nsim_set_vf_link_state,
	.ndo_set_vf_rss_query_en = nsim_set_vf_rss_query_en,
	.ndo_setup_tc		= nsim_setup_tc,
	.ndo_set_features	= nsim_set_features,
	.ndo_get_iflink		= nsim_get_iflink,
	.ndo_bpf		= nsim_bpf,
	.ndo_open		= nsim_open,
	.ndo_stop		= nsim_stop,
	.net_shaper_ops		= &nsim_shaper_ops,
};

static const struct net_device_ops nsim_vf_netdev_ops = {
	.ndo_start_xmit		= nsim_start_xmit,
	.ndo_set_rx_mode	= nsim_set_rx_mode,
	.ndo_set_mac_address	= eth_mac_addr,
	.ndo_validate_addr	= eth_validate_addr,
	.ndo_change_mtu		= nsim_change_mtu,
	.ndo_setup_tc		= nsim_setup_tc,
	.ndo_set_features	= nsim_set_features,
};

/* We don't have true per-queue stats yet, so do some random fakery here.
 * Only report stats for queue 0.
 */
static void nsim_get_queue_stats_rx(struct net_device *dev, int idx,
				    struct netdev_queue_stats_rx *stats)
{
	struct rtnl_link_stats64 rtstats = {};

	if (!idx)
		dev_get_stats(dev, &rtstats);

	stats->packets = rtstats.rx_packets - !!rtstats.rx_packets;
	stats->bytes = rtstats.rx_bytes;
}

static void nsim_get_queue_stats_tx(struct net_device *dev, int idx,
				    struct netdev_queue_stats_tx *stats)
{
	struct rtnl_link_stats64 rtstats = {};

	if (!idx)
		dev_get_stats(dev, &rtstats);

	stats->packets = rtstats.tx_packets - !!rtstats.tx_packets;
	stats->bytes = rtstats.tx_bytes;
}

static void nsim_get_base_stats(struct net_device *dev,
				struct netdev_queue_stats_rx *rx,
				struct netdev_queue_stats_tx *tx)
{
	struct rtnl_link_stats64 rtstats = {};

	dev_get_stats(dev, &rtstats);

	rx->packets = !!rtstats.rx_packets;
	rx->bytes = 0;
	tx->packets = !!rtstats.tx_packets;
	tx->bytes = 0;
}
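
/* The "- !!packets" in the queue callbacks pairs with the "!!packets"
 * here: the base op claims at most one packet and queue 0 reports the
 * remainder, so base plus per-queue stats still sum to the device
 * totals while both callbacks get exercised.
 */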

static const struct netdev_stat_ops nsim_stat_ops = {
	.get_queue_stats_tx	= nsim_get_queue_stats_tx,
	.get_queue_stats_rx	= nsim_get_queue_stats_rx,
	.get_base_stats		= nsim_get_base_stats,
};

static struct nsim_rq *nsim_queue_alloc(void)
{
	struct nsim_rq *rq;

	rq = kzalloc(sizeof(*rq), GFP_KERNEL_ACCOUNT);
	if (!rq)
		return NULL;

	skb_queue_head_init(&rq->skb_queue);
	nsim_rq_timer_init(rq);
	return rq;
}

static void nsim_queue_free(struct net_device *dev, struct nsim_rq *rq)
{
	hrtimer_cancel(&rq->napi_timer);

	if (rq->skb_queue.qlen) {
		local_bh_disable();
		dev_dstats_rx_dropped_add(dev, rq->skb_queue.qlen);
		local_bh_enable();
	}

	skb_queue_purge_reason(&rq->skb_queue, SKB_DROP_REASON_QUEUE_PURGE);
	kfree(rq);
}

/* Queue reset mode is controlled by ns->rq_reset_mode.
 * - normal - new NAPI new pool (old NAPI enabled when new added)
 * - mode 1 - allocate new pool (NAPI is only disabled / enabled)
 * - mode 2 - new NAPI new pool (old NAPI removed before new added)
 * - mode 3 - new NAPI new pool (old NAPI disabled when new added)
 */
struct nsim_queue_mem {
	struct nsim_rq *rq;
	struct page_pool *pp;
};

static int
nsim_queue_mem_alloc(struct net_device *dev, void *per_queue_mem, int idx)
{
	struct nsim_queue_mem *qmem = per_queue_mem;
	struct netdevsim *ns = netdev_priv(dev);
	int err;

	if (ns->rq_reset_mode > 3)
		return -EINVAL;

	if (ns->rq_reset_mode == 1) {
		if (!netif_running(ns->netdev))
			return -ENETDOWN;
		return nsim_create_page_pool(&qmem->pp, &ns->rq[idx]->napi);
	}

	qmem->rq = nsim_queue_alloc();
	if (!qmem->rq)
		return -ENOMEM;

	err = nsim_create_page_pool(&qmem->rq->page_pool, &qmem->rq->napi);
	if (err)
		goto err_free;

	if (!ns->rq_reset_mode)
		netif_napi_add_config_locked(dev, &qmem->rq->napi, nsim_poll,
					     idx);

	return 0;

err_free:
	nsim_queue_free(dev, qmem->rq);
	return err;
}

static void nsim_queue_mem_free(struct net_device *dev, void *per_queue_mem)
{
	struct nsim_queue_mem *qmem = per_queue_mem;
	struct netdevsim *ns = netdev_priv(dev);

	page_pool_destroy(qmem->pp);
	if (qmem->rq) {
		if (!ns->rq_reset_mode)
			netif_napi_del_locked(&qmem->rq->napi);
		page_pool_destroy(qmem->rq->page_pool);
		nsim_queue_free(dev, qmem->rq);
	}
}

static int
nsim_queue_start(struct net_device *dev, void *per_queue_mem, int idx)
{
	struct nsim_queue_mem *qmem = per_queue_mem;
	struct netdevsim *ns = netdev_priv(dev);

	netdev_assert_locked(dev);

	if (ns->rq_reset_mode == 1) {
		ns->rq[idx]->page_pool = qmem->pp;
		napi_enable_locked(&ns->rq[idx]->napi);
		return 0;
	}

	/* netif_napi_add()/_del() should normally be called from alloc/free;
	 * here we want to test various call orders.
	 */
	if (ns->rq_reset_mode == 2) {
		netif_napi_del_locked(&ns->rq[idx]->napi);
		netif_napi_add_config_locked(dev, &qmem->rq->napi, nsim_poll,
					     idx);
	} else if (ns->rq_reset_mode == 3) {
		netif_napi_add_config_locked(dev, &qmem->rq->napi, nsim_poll,
					     idx);
		netif_napi_del_locked(&ns->rq[idx]->napi);
	}

	ns->rq[idx] = qmem->rq;
	napi_enable_locked(&ns->rq[idx]->napi);

	return 0;
}

static int nsim_queue_stop(struct net_device *dev, void *per_queue_mem, int idx)
{
	struct nsim_queue_mem *qmem = per_queue_mem;
	struct netdevsim *ns = netdev_priv(dev);

	netdev_assert_locked(dev);

	napi_disable_locked(&ns->rq[idx]->napi);

	if (ns->rq_reset_mode == 1) {
		qmem->pp = ns->rq[idx]->page_pool;
		page_pool_disable_direct_recycling(qmem->pp);
	} else {
		qmem->rq = ns->rq[idx];
	}

	return 0;
}

static const struct netdev_queue_mgmt_ops nsim_queue_mgmt_ops = {
	.ndo_queue_mem_size	= sizeof(struct nsim_queue_mem),
	.ndo_queue_mem_alloc	= nsim_queue_mem_alloc,
	.ndo_queue_mem_free	= nsim_queue_mem_free,
	.ndo_queue_start	= nsim_queue_start,
	.ndo_queue_stop		= nsim_queue_stop,
};

static ssize_t
nsim_qreset_write(struct file *file, const char __user *data,
		  size_t count, loff_t *ppos)
{
	struct netdevsim *ns = file->private_data;
	unsigned int queue, mode;
	char buf[32];
	ssize_t ret;

	if (count >= sizeof(buf))
		return -EINVAL;
	if (copy_from_user(buf, data, count))
		return -EFAULT;
	buf[count] = '\0';

	ret = sscanf(buf, "%u %u", &queue, &mode);
	if (ret != 2)
		return -EINVAL;

	netdev_lock(ns->netdev);
	if (queue >= ns->netdev->real_num_rx_queues) {
		ret = -EINVAL;
		goto exit_unlock;
	}

	ns->rq_reset_mode = mode;
	ret = netdev_rx_queue_restart(ns->netdev, queue);
	ns->rq_reset_mode = 0;
	if (ret)
		goto exit_unlock;

	ret = count;
exit_unlock:
	netdev_unlock(ns->netdev);
	return ret;
}

static const struct file_operations nsim_qreset_fops = {
	.open = simple_open,
	.write = nsim_qreset_write,
	.owner = THIS_MODULE,
};
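
/* Usage sketch (assuming the default netdevsim debugfs layout under
 * /sys/kernel/debug/netdevsim/):
 *
 *   echo "0 2" > /sys/kernel/debug/netdevsim/netdevsim$ID/ports/$PORT/queue_reset
 *
 * restarts RX queue 0 with reset mode 2 (old NAPI removed before the
 * new one is added); mode 0 is the normal path, and modes above 3 are
 * rejected with -EINVAL.
 */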

static ssize_t
nsim_pp_hold_read(struct file *file, char __user *data,
		  size_t count, loff_t *ppos)
{
	struct netdevsim *ns = file->private_data;
	char buf[3] = "n\n";

	if (ns->page)
		buf[0] = 'y';

	return simple_read_from_buffer(data, count, ppos, buf, 2);
}

static ssize_t
nsim_pp_hold_write(struct file *file, const char __user *data,
		   size_t count, loff_t *ppos)
{
	struct netdevsim *ns = file->private_data;
	ssize_t ret;
	bool val;

	ret = kstrtobool_from_user(data, count, &val);
	if (ret)
		return ret;

	rtnl_lock();
	ret = count;
	if (val == !!ns->page)
		goto exit;

	if (!netif_running(ns->netdev) && val) {
		ret = -ENETDOWN;
	} else if (val) {
		ns->page = page_pool_dev_alloc_pages(ns->rq[0]->page_pool);
		if (!ns->page)
			ret = -ENOMEM;
	} else {
		page_pool_put_full_page(pp_page_to_nmdesc(ns->page)->pp,
					ns->page, false);
		ns->page = NULL;
	}

exit:
	rtnl_unlock();
	return ret;
}

static const struct file_operations nsim_pp_hold_fops = {
	.open = simple_open,
	.read = nsim_pp_hold_read,
	.write = nsim_pp_hold_write,
	.llseek = generic_file_llseek,
	.owner = THIS_MODULE,
};
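
/* pp_hold is a leak-test knob. While the device is up,
 *
 *   echo y > /sys/kernel/debug/netdevsim/netdevsim$ID/ports/$PORT/pp_hold
 *
 * (same layout assumption as above) makes the driver hold one page from
 * RX queue 0's page pool, so the pool cannot be torn down cleanly;
 * writing "n", or destroying the device, releases it again.
 */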

static void nsim_setup(struct net_device *dev)
{
	ether_setup(dev);
	eth_hw_addr_random(dev);

	dev->flags &= ~IFF_MULTICAST;
	dev->priv_flags |= IFF_LIVE_ADDR_CHANGE;
	dev->features |= NETIF_F_HIGHDMA |
			 NETIF_F_SG |
			 NETIF_F_FRAGLIST |
			 NETIF_F_HW_CSUM |
			 NETIF_F_LRO |
			 NETIF_F_TSO;
	dev->hw_features |= NETIF_F_HW_TC |
			    NETIF_F_SG |
			    NETIF_F_FRAGLIST |
			    NETIF_F_HW_CSUM |
			    NETIF_F_LRO |
			    NETIF_F_TSO;
	dev->pcpu_stat_type = NETDEV_PCPU_STAT_DSTATS;
	dev->max_mtu = ETH_MAX_MTU;
	dev->xdp_features = NETDEV_XDP_ACT_BASIC | NETDEV_XDP_ACT_HW_OFFLOAD;
}

static int nsim_queue_init(struct netdevsim *ns)
{
	struct net_device *dev = ns->netdev;
	int i;

	ns->rq = kcalloc(dev->num_rx_queues, sizeof(*ns->rq),
			 GFP_KERNEL_ACCOUNT);
	if (!ns->rq)
		return -ENOMEM;

	for (i = 0; i < dev->num_rx_queues; i++) {
		ns->rq[i] = nsim_queue_alloc();
		if (!ns->rq[i])
			goto err_free_prev;
	}

	return 0;

err_free_prev:
	while (i--)
		kfree(ns->rq[i]);
	kfree(ns->rq);
	return -ENOMEM;
}

static void nsim_queue_uninit(struct netdevsim *ns)
{
	struct net_device *dev = ns->netdev;
	int i;

	for (i = 0; i < dev->num_rx_queues; i++)
		nsim_queue_free(dev, ns->rq[i]);

	kfree(ns->rq);
	ns->rq = NULL;
}

static int nsim_init_netdevsim(struct netdevsim *ns)
{
	struct netdevsim *peer;
	struct mock_phc *phc;
	int err;

	phc = mock_phc_create(&ns->nsim_bus_dev->dev);
	if (IS_ERR(phc))
		return PTR_ERR(phc);

	ns->phc = phc;
	ns->netdev->netdev_ops = &nsim_netdev_ops;
	ns->netdev->stat_ops = &nsim_stat_ops;
	ns->netdev->queue_mgmt_ops = &nsim_queue_mgmt_ops;
	netdev_lockdep_set_classes(ns->netdev);

	err = nsim_udp_tunnels_info_create(ns->nsim_dev, ns->netdev);
	if (err)
		goto err_phc_destroy;

	rtnl_lock();
	err = nsim_queue_init(ns);
	if (err)
		goto err_utn_destroy;

	err = nsim_bpf_init(ns);
	if (err)
		goto err_rq_destroy;

	nsim_macsec_init(ns);
	nsim_ipsec_init(ns);

	err = register_netdevice(ns->netdev);
	if (err)
		goto err_ipsec_teardown;
	rtnl_unlock();

	err = nsim_psp_init(ns);
	if (err)
		goto err_unregister_netdev;

	if (IS_ENABLED(CONFIG_DEBUG_NET)) {
		ns->nb.notifier_call = netdev_debug_event;
		if (register_netdevice_notifier_dev_net(ns->netdev, &ns->nb,
							&ns->nn))
			ns->nb.notifier_call = NULL;
	}

	return 0;

err_unregister_netdev:
	rtnl_lock();
	peer = rtnl_dereference(ns->peer);
	if (peer)
		RCU_INIT_POINTER(peer->peer, NULL);
	RCU_INIT_POINTER(ns->peer, NULL);
	unregister_netdevice(ns->netdev);
err_ipsec_teardown:
	nsim_ipsec_teardown(ns);
	nsim_macsec_teardown(ns);
	nsim_bpf_uninit(ns);
err_rq_destroy:
	nsim_queue_uninit(ns);
err_utn_destroy:
	rtnl_unlock();
	nsim_udp_tunnels_info_destroy(ns->netdev);
err_phc_destroy:
	mock_phc_destroy(ns->phc);
	return err;
}

static int nsim_init_netdevsim_vf(struct netdevsim *ns)
{
	int err;

	ns->netdev->netdev_ops = &nsim_vf_netdev_ops;
	rtnl_lock();
	err = register_netdevice(ns->netdev);
	rtnl_unlock();
	return err;
}

static void nsim_exit_netdevsim(struct netdevsim *ns)
{
	nsim_udp_tunnels_info_destroy(ns->netdev);
	mock_phc_destroy(ns->phc);
}

struct netdevsim *nsim_create(struct nsim_dev *nsim_dev,
			      struct nsim_dev_port *nsim_dev_port,
			      u8 perm_addr[ETH_ALEN])
{
	struct net_device *dev;
	struct netdevsim *ns;
	int err;

	dev = alloc_netdev_mq(sizeof(*ns), "eth%d", NET_NAME_UNKNOWN, nsim_setup,
			      nsim_dev->nsim_bus_dev->num_queues);
	if (!dev)
		return ERR_PTR(-ENOMEM);

	if (perm_addr)
		memcpy(dev->perm_addr, perm_addr, ETH_ALEN);

	dev_net_set(dev, nsim_dev_net(nsim_dev));
	ns = netdev_priv(dev);
	ns->netdev = dev;
	ns->nsim_dev = nsim_dev;
	ns->nsim_dev_port = nsim_dev_port;
	ns->nsim_bus_dev = nsim_dev->nsim_bus_dev;
	SET_NETDEV_DEV(dev, &ns->nsim_bus_dev->dev);
	SET_NETDEV_DEVLINK_PORT(dev, &nsim_dev_port->devlink_port);
	nsim_ethtool_init(ns);
	if (nsim_dev_port_is_pf(nsim_dev_port))
		err = nsim_init_netdevsim(ns);
	else
		err = nsim_init_netdevsim_vf(ns);
	if (err)
		goto err_free_netdev;

	ns->pp_dfs = debugfs_create_file("pp_hold", 0600, nsim_dev_port->ddir,
					 ns, &nsim_pp_hold_fops);
	ns->qr_dfs = debugfs_create_file("queue_reset", 0200,
					 nsim_dev_port->ddir, ns,
					 &nsim_qreset_fops);
	return ns;

err_free_netdev:
	free_netdev(dev);
	return ERR_PTR(err);
}

void nsim_destroy(struct netdevsim *ns)
{
	struct net_device *dev = ns->netdev;
	struct netdevsim *peer;

	debugfs_remove(ns->qr_dfs);
	debugfs_remove(ns->pp_dfs);

	if (ns->nb.notifier_call)
		unregister_netdevice_notifier_dev_net(ns->netdev, &ns->nb,
						      &ns->nn);

	nsim_psp_uninit(ns);

	rtnl_lock();
	peer = rtnl_dereference(ns->peer);
	if (peer)
		RCU_INIT_POINTER(peer->peer, NULL);
	RCU_INIT_POINTER(ns->peer, NULL);
	unregister_netdevice(dev);
	if (nsim_dev_port_is_pf(ns->nsim_dev_port)) {
		nsim_macsec_teardown(ns);
		nsim_ipsec_teardown(ns);
		nsim_bpf_uninit(ns);
		nsim_queue_uninit(ns);
	}
	rtnl_unlock();
	if (nsim_dev_port_is_pf(ns->nsim_dev_port))
		nsim_exit_netdevsim(ns);

	/* Put this intentionally late to exercise the orphaning path */
	if (ns->page) {
		page_pool_put_full_page(pp_page_to_nmdesc(ns->page)->pp,
					ns->page, false);
		ns->page = NULL;
	}

	free_netdev(dev);
}

bool netdev_is_nsim(struct net_device *dev)
{
	return dev->netdev_ops == &nsim_netdev_ops;
}

static int nsim_validate(struct nlattr *tb[], struct nlattr *data[],
			 struct netlink_ext_ack *extack)
{
	NL_SET_ERR_MSG_MOD(extack,
			   "Please use: echo \"[ID] [PORT_COUNT] [NUM_QUEUES]\" > /sys/bus/netdevsim/new_device");
	return -EOPNOTSUPP;
}
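
/* As the message says, devices are created via the netdevsim bus, not
 * rtnl. For example, a device with id 10, one port and four queues:
 *
 *   echo "10 1 4" > /sys/bus/netdevsim/new_device
 */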

static struct rtnl_link_ops nsim_link_ops __read_mostly = {
	.kind		= DRV_NAME,
	.validate	= nsim_validate,
};

static int __init nsim_module_init(void)
{
	int err;

	err = nsim_dev_init();
	if (err)
		return err;

	err = nsim_bus_init();
	if (err)
		goto err_dev_exit;

	err = rtnl_link_register(&nsim_link_ops);
	if (err)
		goto err_bus_exit;

	return 0;

err_bus_exit:
	nsim_bus_exit();
err_dev_exit:
	nsim_dev_exit();
	return err;
}

static void __exit nsim_module_exit(void)
{
	rtnl_link_unregister(&nsim_link_ops);
	nsim_bus_exit();
	nsim_dev_exit();
}

module_init(nsim_module_init);
module_exit(nsim_module_exit);
MODULE_LICENSE("GPL");
MODULE_DESCRIPTION("Simulated networking device for testing");
MODULE_ALIAS_RTNL_LINK(DRV_NAME);