2 * Copyright (C) 2017 Netronome Systems, Inc.
4 * This software is licensed under the GNU General License Version 2,
5 * June 1991 as shown in the file COPYING in the top-level directory of this
8 * THE COPYRIGHT HOLDERS AND/OR OTHER PARTIES PROVIDE THE PROGRAM "AS IS"
9 * WITHOUT WARRANTY OF ANY KIND, EITHER EXPRESSED OR IMPLIED, INCLUDING,
10 * BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
11 * FOR A PARTICULAR PURPOSE. THE ENTIRE RISK AS TO THE QUALITY AND PERFORMANCE
12 * OF THE PROGRAM IS WITH YOU. SHOULD THE PROGRAM PROVE DEFECTIVE, YOU ASSUME
13 * THE COST OF ALL NECESSARY SERVICING, REPAIR OR CORRECTION.
16 #include <linux/debugfs.h>
17 #include <linux/etherdevice.h>
18 #include <linux/kernel.h>
19 #include <linux/module.h>
20 #include <linux/netdevice.h>
21 #include <linux/slab.h>
22 #include <net/netdev_queues.h>
23 #include <net/page_pool/helpers.h>
24 #include <net/netlink.h>
25 #include <net/pkt_cls.h>
26 #include <net/rtnetlink.h>
27 #include <net/udp_tunnel.h>
29 #include "netdevsim.h"
/*
 * Ring size shared by the RX path: nsim_napi_rx() compares the per-queue skb
 * backlog against it, and nsim_create_page_pool() uses it as the pool size.
 */
31 #define NSIM_RING_SIZE 256
/*
 * Queue @skb on @rq's skb_queue, from which nsim_rcv() later dequeues it.
 *
 * When the queue already holds more than NSIM_RING_SIZE entries the skb is
 * freed instead of being queued. Otherwise it is appended to the tail and
 * NET_RX_SUCCESS is returned.
 *
 * NOTE(review): the return statement of the overflow branch is elided from
 * this excerpt; presumably NET_RX_DROP (the caller compares against it) -
 * confirm.
 */
33 static int nsim_napi_rx(struct nsim_rq *rq, struct sk_buff *skb)
35 if (skb_queue_len(&rq->skb_queue) > NSIM_RING_SIZE) {
36 dev_kfree_skb_any(skb);
40 skb_queue_tail(&rq->skb_queue, skb);
41 return NET_RX_SUCCESS;
/*
 * Run @skb through __dev_forward_skb() for @dev. A non-zero result is
 * returned unchanged; on zero the skb is handed to nsim_napi_rx() and that
 * function's result is returned (GNU "?:" operator).
 *
 * NOTE(review): the line declaring the rq parameter is elided from this
 * excerpt.
 */
44 static int nsim_forward_skb(struct net_device *dev, struct sk_buff *skb,
47 return __dev_forward_skb(dev, skb) ?: nsim_napi_rx(rq, skb);
/*
 * ndo_start_xmit handler: deliver @skb to the linked peer netdevsim.
 *
 * Visible steps: pass the skb through nsim_ipsec_tx(), look up the RCU
 * protected peer, pick one of the peer's RX queues from the skb's queue
 * mapping, forward the skb to it and schedule that queue's NAPI. Counters
 * are updated inside two u64_stats sections on ns->syncp.
 *
 * NOTE(review): the remaining local declarations, RCU locking, early-exit
 * branches, counter increments and return statements are elided from this
 * excerpt.
 */
50 static netdev_tx_t nsim_start_xmit(struct sk_buff *skb, struct net_device *dev)
52 struct netdevsim *ns = netdev_priv(dev);
53 struct net_device *peer_dev;
/* Length is captured before the skb is handed to the forwarding path. */
54 unsigned int len = skb->len;
55 struct netdevsim *peer_ns;
60 if (!nsim_ipsec_tx(ns, skb))
63 peer_ns = rcu_dereference(ns->peer);
67 peer_dev = peer_ns->netdev;
/* Fold the queue mapping into the range of the peer's RX queues. */
68 rxq = skb_get_queue_mapping(skb);
69 if (rxq >= peer_dev->num_rx_queues)
70 rxq = rxq % peer_dev->num_rx_queues;
71 rq = &peer_ns->rq[rxq];
73 skb_tx_timestamp(skb);
74 if (unlikely(nsim_forward_skb(peer_dev, skb, rq) == NET_RX_DROP))
/* Kick the peer queue's NAPI so nsim_poll() processes the queued skb. */
77 napi_schedule(&rq->napi);
/* NOTE(review): presumably the success-path counters - body elided. */
80 u64_stats_update_begin(&ns->syncp);
83 u64_stats_update_end(&ns->syncp);
/* NOTE(review): presumably the drop-path counter - body elided. */
90 u64_stats_update_begin(&ns->syncp);
92 u64_stats_update_end(&ns->syncp);
/*
 * ndo_set_rx_mode handler referenced by both nsim_netdev_ops and
 * nsim_vf_netdev_ops.
 * NOTE(review): the function body is elided from this excerpt.
 */
96 static void nsim_set_rx_mode(struct net_device *dev)
/*
 * ndo_change_mtu handler: store @new_mtu in dev->mtu.
 *
 * A new MTU above NSIM_XDP_MAX_MTU is special-cased while an XDP program is
 * attached (ns->xdp.prog is set).
 * NOTE(review): the statement taken on that branch and the final return are
 * elided from this excerpt; presumably an error return - confirm.
 */
100 static int nsim_change_mtu(struct net_device *dev, int new_mtu)
102 struct netdevsim *ns = netdev_priv(dev);
104 if (ns->xdp.prog && new_mtu > NSIM_XDP_MAX_MTU)
107 WRITE_ONCE(dev->mtu, new_mtu);
/*
 * ndo_get_stats64 handler: copy the device's TX byte, packet and drop
 * counters into @stats.
 *
 * The copy sits between u64_stats_fetch_begin() and u64_stats_fetch_retry()
 * on ns->syncp and is repeated while the retry check reports a concurrent
 * update.
 *
 * NOTE(review): the return type line, the "start" declaration and the
 * opening of the do/while loop are elided from this excerpt.
 */
113 nsim_get_stats64(struct net_device *dev, struct rtnl_link_stats64 *stats)
115 struct netdevsim *ns = netdev_priv(dev);
119 start = u64_stats_fetch_begin(&ns->syncp);
120 stats->tx_bytes = ns->tx_bytes;
121 stats->tx_packets = ns->tx_packets;
122 stats->tx_dropped = ns->tx_dropped;
123 } while (u64_stats_fetch_retry(&ns->syncp, start));
/*
 * TC block callback registered by nsim_setup_tc(); forwards all three
 * arguments unchanged to nsim_bpf_setup_tc_block_cb() and returns its result.
 */
127 nsim_setup_tc_block_cb(enum tc_setup_type type, void *type_data, void *cb_priv)
129 return nsim_bpf_setup_tc_block_cb(type, type_data, cb_priv);
/*
 * ndo_set_vf_mac handler: copy @mac (ETH_ALEN bytes) into the configuration
 * slot of VF @vf.
 *
 * The copy is guarded by a check that @vf is below nsim_dev_get_vfs() and
 * that @mac is not a multicast address.
 * NOTE(review): the statement executed when the check fails and the final
 * return are elided; presumably an error return - confirm.
 */
132 static int nsim_set_vf_mac(struct net_device *dev, int vf, u8 *mac)
134 struct netdevsim *ns = netdev_priv(dev);
135 struct nsim_dev *nsim_dev = ns->nsim_dev;
137 /* Only refuse multicast addresses, zero address can mean unset/any. */
138 if (vf >= nsim_dev_get_vfs(nsim_dev) || is_multicast_ether_addr(mac))
140 memcpy(nsim_dev->vfconfigs[vf].vf_mac, mac, ETH_ALEN);
/*
 * ndo_set_vf_vlan handler: record @vlan, @qos and @vlan_proto in the
 * configuration slot of VF @vf.
 *
 * The stores are guarded by a check that @vf is below nsim_dev_get_vfs(),
 * @vlan is at most 4095 and @qos is at most 7.
 * NOTE(review): the failure statement and the final return are elided from
 * this excerpt.
 */
145 static int nsim_set_vf_vlan(struct net_device *dev, int vf,
146 u16 vlan, u8 qos, __be16 vlan_proto)
148 struct netdevsim *ns = netdev_priv(dev);
149 struct nsim_dev *nsim_dev = ns->nsim_dev;
151 if (vf >= nsim_dev_get_vfs(nsim_dev) || vlan > 4095 || qos > 7)
154 nsim_dev->vfconfigs[vf].vlan = vlan;
155 nsim_dev->vfconfigs[vf].qos = qos;
156 nsim_dev->vfconfigs[vf].vlan_proto = vlan_proto;
/*
 * ndo_set_vf_rate handler: record @min and @max as the min/max TX rate of
 * VF @vf.
 *
 * In switchdev mode an error is logged pointing the user at the devlink API.
 * Outside that mode the stores are guarded by a check that @vf is below
 * nsim_dev_get_vfs().
 * NOTE(review): the return statements of both guards and the final return
 * are elided from this excerpt.
 */
161 static int nsim_set_vf_rate(struct net_device *dev, int vf, int min, int max)
163 struct netdevsim *ns = netdev_priv(dev);
164 struct nsim_dev *nsim_dev = ns->nsim_dev;
166 if (nsim_esw_mode_is_switchdev(ns->nsim_dev)) {
167 pr_err("Not supported in switchdev mode. Please use devlink API.\n");
171 if (vf >= nsim_dev_get_vfs(nsim_dev))
174 nsim_dev->vfconfigs[vf].min_tx_rate = min;
175 nsim_dev->vfconfigs[vf].max_tx_rate = max;
/*
 * ndo_set_vf_spoofchk handler: store @val as the spoof-check flag of VF @vf.
 * The store is guarded by a check that @vf is below nsim_dev_get_vfs().
 * NOTE(review): the failure statement and the final return are elided.
 */
180 static int nsim_set_vf_spoofchk(struct net_device *dev, int vf, bool val)
182 struct netdevsim *ns = netdev_priv(dev);
183 struct nsim_dev *nsim_dev = ns->nsim_dev;
185 if (vf >= nsim_dev_get_vfs(nsim_dev))
187 nsim_dev->vfconfigs[vf].spoofchk_enabled = val;
/*
 * ndo_set_vf_rss_query_en handler: store @val as the RSS-query flag of
 * VF @vf. The store is guarded by a check that @vf is below
 * nsim_dev_get_vfs().
 * NOTE(review): the failure statement and the final return are elided.
 */
192 static int nsim_set_vf_rss_query_en(struct net_device *dev, int vf, bool val)
194 struct netdevsim *ns = netdev_priv(dev);
195 struct nsim_dev *nsim_dev = ns->nsim_dev;
197 if (vf >= nsim_dev_get_vfs(nsim_dev))
199 nsim_dev->vfconfigs[vf].rss_query_enabled = val;
/*
 * ndo_set_vf_trust handler: store @val as the trusted flag of VF @vf.
 * The store is guarded by a check that @vf is below nsim_dev_get_vfs().
 * NOTE(review): the failure statement and the final return are elided.
 */
204 static int nsim_set_vf_trust(struct net_device *dev, int vf, bool val)
206 struct netdevsim *ns = netdev_priv(dev);
207 struct nsim_dev *nsim_dev = ns->nsim_dev;
209 if (vf >= nsim_dev_get_vfs(nsim_dev))
211 nsim_dev->vfconfigs[vf].trusted = val;
/*
 * ndo_get_vf_config handler: fill @ivi from the stored configuration of
 * VF @vf. This reports the values written by the nsim_set_vf_*() setters:
 * link state, TX rates, VLAN settings, MAC, spoof-check, trust and
 * RSS-query flags.
 *
 * The reads are guarded by a check that @vf is below nsim_dev_get_vfs().
 * NOTE(review): the return type line, the failure statement, lines 223-225
 * and the final return are elided from this excerpt.
 */
217 nsim_get_vf_config(struct net_device *dev, int vf, struct ifla_vf_info *ivi)
219 struct netdevsim *ns = netdev_priv(dev);
220 struct nsim_dev *nsim_dev = ns->nsim_dev;
222 if (vf >= nsim_dev_get_vfs(nsim_dev))
226 ivi->linkstate = nsim_dev->vfconfigs[vf].link_state;
227 ivi->min_tx_rate = nsim_dev->vfconfigs[vf].min_tx_rate;
228 ivi->max_tx_rate = nsim_dev->vfconfigs[vf].max_tx_rate;
229 ivi->vlan = nsim_dev->vfconfigs[vf].vlan;
230 ivi->vlan_proto = nsim_dev->vfconfigs[vf].vlan_proto;
231 ivi->qos = nsim_dev->vfconfigs[vf].qos;
232 memcpy(&ivi->mac, nsim_dev->vfconfigs[vf].vf_mac, ETH_ALEN);
233 ivi->spoofchk = nsim_dev->vfconfigs[vf].spoofchk_enabled;
234 ivi->trusted = nsim_dev->vfconfigs[vf].trusted;
235 ivi->rss_query_en = nsim_dev->vfconfigs[vf].rss_query_enabled;
/*
 * ndo_set_vf_link_state handler: store @state as the link state of VF @vf.
 *
 * The store is guarded by a check that @vf is below nsim_dev_get_vfs(). The
 * three IFLA_VF_LINK_STATE_* case labels list the values handled by the
 * switch.
 * NOTE(review): the switch header, the default branch, the failure statement
 * and the final return are elided; presumably other values are rejected -
 * confirm.
 */
240 static int nsim_set_vf_link_state(struct net_device *dev, int vf, int state)
242 struct netdevsim *ns = netdev_priv(dev);
243 struct nsim_dev *nsim_dev = ns->nsim_dev;
245 if (vf >= nsim_dev_get_vfs(nsim_dev))
249 case IFLA_VF_LINK_STATE_AUTO:
250 case IFLA_VF_LINK_STATE_ENABLE:
251 case IFLA_VF_LINK_STATE_DISABLE:
257 nsim_dev->vfconfigs[vf].link_state = state;
/* Report taprio offload statistics: both counters are set to zero. */
262 static void nsim_taprio_stats(struct tc_taprio_qopt_stats *stats)
264 stats->window_drops = 0;
265 stats->tx_overruns = 0;
/*
 * Handle a taprio qdisc offload request by dispatching on offload->cmd.
 *
 * TAPRIO_CMD_REPLACE and TAPRIO_CMD_DESTROY share one branch with no visible
 * action. TAPRIO_CMD_STATS fills offload->stats through nsim_taprio_stats().
 * NOTE(review): the local declarations, break statements, default branch and
 * return are elided from this excerpt.
 */
268 static int nsim_setup_tc_taprio(struct net_device *dev,
269 struct tc_taprio_qopt_offload *offload)
273 switch (offload->cmd) {
274 case TAPRIO_CMD_REPLACE:
275 case TAPRIO_CMD_DESTROY:
277 case TAPRIO_CMD_STATS:
278 nsim_taprio_stats(&offload->stats);
/*
 * File-scope list head for TC block callbacks.
 * NOTE(review): presumably the driver list passed to
 * flow_block_cb_setup_simple() in nsim_setup_tc(); that argument line is
 * elided from this excerpt - confirm.
 */
287 static LIST_HEAD(nsim_block_cb_list);
/*
 * ndo_setup_tc handler: dispatch a TC offload request by type.
 *
 * TC_SETUP_QDISC_TAPRIO requests go to nsim_setup_tc_taprio(). Another
 * branch registers nsim_setup_tc_block_cb() through
 * flow_block_cb_setup_simple().
 * NOTE(review): the return type line, the switch header, the case label of
 * the block branch, the remaining flow_block_cb_setup_simple() arguments and
 * the default branch are elided from this excerpt.
 */
290 nsim_setup_tc(struct net_device *dev, enum tc_setup_type type, void *type_data)
292 struct netdevsim *ns = netdev_priv(dev);
295 case TC_SETUP_QDISC_TAPRIO:
296 return nsim_setup_tc_taprio(dev, type_data);
298 return flow_block_cb_setup_simple(type_data,
300 nsim_setup_tc_block_cb,
/*
 * ndo_set_features handler.
 *
 * The comparison is true only when NETIF_F_HW_TC is currently set in
 * dev->features and cleared in the requested @features, i.e. when TC offload
 * is being turned off. In that case the result of nsim_bpf_disable_tc() is
 * returned.
 * NOTE(review): the return type line and the fall-through return are elided
 * from this excerpt.
 */
308 nsim_set_features(struct net_device *dev, netdev_features_t features)
310 struct netdevsim *ns = netdev_priv(dev);
312 if ((dev->features & NETIF_F_HW_TC) > (features & NETIF_F_HW_TC))
313 return nsim_bpf_disable_tc(ns);
/*
 * ndo_get_iflink handler: compute the link index for @dev.
 *
 * When a peer is linked, the peer netdev's ifindex is used; otherwise the
 * device's own ifindex is used. The peer pointer is read with
 * rcu_dereference().
 * NOTE(review): the iflink declaration, the RCU read-side lock/unlock and the
 * return statement are elided from this excerpt.
 */
318 static int nsim_get_iflink(const struct net_device *dev)
320 struct netdevsim *nsim, *peer;
323 nsim = netdev_priv(dev);
326 peer = rcu_dereference(nsim->peer);
327 iflink = peer ? READ_ONCE(peer->netdev->ifindex) :
328 READ_ONCE(dev->ifindex);
/*
 * Drain up to @budget skbs from @rq's skb_queue, passing each dequeued skb
 * to netif_receive_skb().
 *
 * NOTE(review): the local declarations, the statement taken when the queue
 * is empty (presumably a break) and the return value (presumably the number
 * of skbs processed) are elided from this excerpt - confirm.
 */
334 static int nsim_rcv(struct nsim_rq *rq, int budget)
339 for (i = 0; i < budget; i++) {
340 if (skb_queue_empty(&rq->skb_queue))
343 skb = skb_dequeue(&rq->skb_queue);
344 netif_receive_skb(skb);
/*
 * NAPI poll callback (registered in nsim_init_napi()). Recovers the owning
 * nsim_rq from @napi and processes up to @budget packets via nsim_rcv().
 *
 * NOTE(review): the "done" declaration, any NAPI completion call and the
 * return statement are elided from this excerpt.
 */
350 static int nsim_poll(struct napi_struct *napi, int budget)
352 struct nsim_rq *rq = container_of(napi, struct nsim_rq, napi);
355 done = nsim_rcv(rq, budget);
/*
 * Create the page pool for @rq and store it in rq->page_pool.
 *
 * The pool holds NSIM_RING_SIZE entries and is bound to the netdev behind
 * the queue's NAPI instance. If page_pool_create() returns an error pointer,
 * the error code is extracted and rq->page_pool is reset to NULL so that no
 * error pointer stays stored in the field.
 *
 * NOTE(review): some initializer fields and the return statements are elided
 * from this excerpt.
 */
361 static int nsim_create_page_pool(struct nsim_rq *rq)
363 struct page_pool_params p = {
365 .pool_size = NSIM_RING_SIZE,
367 .dev = &rq->napi.dev->dev,
369 .dma_dir = DMA_BIDIRECTIONAL,
370 .netdev = rq->napi.dev,
373 rq->page_pool = page_pool_create(&p);
374 if (IS_ERR(rq->page_pool)) {
375 int err = PTR_ERR(rq->page_pool);
377 rq->page_pool = NULL;
/*
 * Set up the RX side of every queue of @ns in two passes: first register a
 * NAPI instance with nsim_poll() as its poll callback, then create a page
 * pool per queue.
 *
 * The trailing statements are the unwind code: page pools are destroyed and
 * their pointers cleared, then every NAPI instance is removed.
 * NOTE(review): the local declarations, the error check after
 * nsim_create_page_pool(), the goto labels, the unwind loop header for the
 * page pools and the return statements are elided from this excerpt.
 */
383 static int nsim_init_napi(struct netdevsim *ns)
385 struct net_device *dev = ns->netdev;
389 for (i = 0; i < dev->num_rx_queues; i++) {
392 netif_napi_add(dev, &rq->napi, nsim_poll);
395 for (i = 0; i < dev->num_rx_queues; i++) {
398 err = nsim_create_page_pool(rq);
407 page_pool_destroy(ns->rq[i].page_pool);
408 ns->rq[i].page_pool = NULL;
411 for (i = 0; i < dev->num_rx_queues; i++)
412 __netif_napi_del(&ns->rq[i].napi);
/*
 * For every RX queue of @ns: associate the queue index with its NAPI
 * instance via netif_queue_set_napi(), then enable that NAPI instance.
 */
417 static void nsim_enable_napi(struct netdevsim *ns)
419 struct net_device *dev = ns->netdev;
422 for (i = 0; i < dev->num_rx_queues; i++) {
423 struct nsim_rq *rq = &ns->rq[i];
425 netif_queue_set_napi(dev, i, NETDEV_QUEUE_TYPE_RX, &rq->napi);
426 napi_enable(&rq->napi);
/*
 * ndo_open handler: initialise NAPI and page pools through nsim_init_napi(),
 * then enable NAPI on all queues.
 *
 * NOTE(review): the err declaration, the error check between the two calls
 * and the return statements are elided from this excerpt.
 */
430 static int nsim_open(struct net_device *dev)
432 struct netdevsim *ns = netdev_priv(dev);
435 err = nsim_init_napi(ns);
439 nsim_enable_napi(ns);
/*
 * Tear down the RX side of every queue of @ns: first disable and remove each
 * NAPI instance, then, in a second pass, destroy each page pool and clear
 * its pointer.
 *
 * NOTE(review): a few lines between the two loops are elided from this
 * excerpt.
 */
444 static void nsim_del_napi(struct netdevsim *ns)
446 struct net_device *dev = ns->netdev;
449 for (i = 0; i < dev->num_rx_queues; i++) {
450 struct nsim_rq *rq = &ns->rq[i];
452 napi_disable(&rq->napi);
453 __netif_napi_del(&rq->napi);
457 for (i = 0; i < dev->num_rx_queues; i++) {
458 page_pool_destroy(ns->rq[i].page_pool);
459 ns->rq[i].page_pool = NULL;
/*
 * ndo_stop handler: drop the carrier on @dev and on the linked peer's
 * netdev. The peer pointer is read with rtnl_dereference().
 *
 * NOTE(review): the NULL check on the peer, any NAPI teardown call and the
 * return statement are elided from this excerpt.
 */
463 static int nsim_stop(struct net_device *dev)
465 struct netdevsim *ns = netdev_priv(dev);
466 struct netdevsim *peer;
468 netif_carrier_off(dev);
469 peer = rtnl_dereference(ns->peer);
471 netif_carrier_off(peer->netdev);
/*
 * Netdev operations installed by nsim_init_netdevsim() (the PF path of
 * nsim_create()). Besides the basic handlers shared with
 * nsim_vf_netdev_ops, this table adds the VF configuration callbacks,
 * iflink reporting and open/stop.
 * netdev_is_nsim() identifies devices by comparing against this table.
 */
478 static const struct net_device_ops nsim_netdev_ops = {
479 .ndo_start_xmit = nsim_start_xmit,
480 .ndo_set_rx_mode = nsim_set_rx_mode,
481 .ndo_set_mac_address = eth_mac_addr,
482 .ndo_validate_addr = eth_validate_addr,
483 .ndo_change_mtu = nsim_change_mtu,
484 .ndo_get_stats64 = nsim_get_stats64,
485 .ndo_set_vf_mac = nsim_set_vf_mac,
486 .ndo_set_vf_vlan = nsim_set_vf_vlan,
487 .ndo_set_vf_rate = nsim_set_vf_rate,
488 .ndo_set_vf_spoofchk = nsim_set_vf_spoofchk,
489 .ndo_set_vf_trust = nsim_set_vf_trust,
490 .ndo_get_vf_config = nsim_get_vf_config,
491 .ndo_set_vf_link_state = nsim_set_vf_link_state,
492 .ndo_set_vf_rss_query_en = nsim_set_vf_rss_query_en,
493 .ndo_setup_tc = nsim_setup_tc,
494 .ndo_set_features = nsim_set_features,
495 .ndo_get_iflink = nsim_get_iflink,
497 .ndo_open = nsim_open,
498 .ndo_stop = nsim_stop,
/*
 * Netdev operations installed by nsim_init_netdevsim_vf() (the non-PF path
 * of nsim_create()). The visible entries are a subset of nsim_netdev_ops,
 * without the VF configuration, iflink and open/stop callbacks.
 */
501 static const struct net_device_ops nsim_vf_netdev_ops = {
502 .ndo_start_xmit = nsim_start_xmit,
503 .ndo_set_rx_mode = nsim_set_rx_mode,
504 .ndo_set_mac_address = eth_mac_addr,
505 .ndo_validate_addr = eth_validate_addr,
506 .ndo_change_mtu = nsim_change_mtu,
507 .ndo_get_stats64 = nsim_get_stats64,
508 .ndo_setup_tc = nsim_setup_tc,
509 .ndo_set_features = nsim_set_features,
512 /* We don't have true per-queue stats, yet, so do some random fakery here.
513 * Only report stuff for queue 0. */
/*
 * Per-queue RX statistics callback (see nsim_stat_ops).
 *
 * Takes the device-wide counters from nsim_get_stats64() and reports the RX
 * packet count minus one when it is non-zero, plus the full RX byte count.
 * The packet held back here is the one nsim_get_base_stats() reports.
 *
 * NOTE(review): the lines between the declaration and the stats call
 * (presumably restricting the report to one queue index) are elided from
 * this excerpt. The visible lines of nsim_get_stats64() fill only tx_*
 * fields.
 */
515 static void nsim_get_queue_stats_rx(struct net_device *dev, int idx,
516 struct netdev_queue_stats_rx *stats)
518 struct rtnl_link_stats64 rtstats = {};
521 nsim_get_stats64(dev, &rtstats);
523 stats->packets = rtstats.rx_packets - !!rtstats.rx_packets;
524 stats->bytes = rtstats.rx_bytes;
/*
 * Per-queue TX statistics callback (see nsim_stat_ops).
 *
 * Takes the device-wide counters from nsim_get_stats64() and reports the TX
 * packet count minus one when it is non-zero, plus the full TX byte count.
 * The packet held back here is the one nsim_get_base_stats() reports.
 *
 * NOTE(review): the lines between the declaration and the stats call
 * (presumably restricting the report to one queue index) are elided from
 * this excerpt.
 */
527 static void nsim_get_queue_stats_tx(struct net_device *dev, int idx,
528 struct netdev_queue_stats_tx *stats)
530 struct rtnl_link_stats64 rtstats = {};
533 nsim_get_stats64(dev, &rtstats);
535 stats->packets = rtstats.tx_packets - !!rtstats.tx_packets;
536 stats->bytes = rtstats.tx_bytes;
/*
 * Base (non per-queue) statistics callback (see nsim_stat_ops).
 *
 * Reports a packet count of 1 in each direction when the device-wide counter
 * for that direction is non-zero, and 0 otherwise. This is the packet that
 * the per-queue callbacks subtract from their own counts.
 *
 * NOTE(review): lines 548 and 550 are elided from this excerpt.
 */
539 static void nsim_get_base_stats(struct net_device *dev,
540 struct netdev_queue_stats_rx *rx,
541 struct netdev_queue_stats_tx *tx)
543 struct rtnl_link_stats64 rtstats = {};
545 nsim_get_stats64(dev, &rtstats);
547 rx->packets = !!rtstats.rx_packets;
549 tx->packets = !!rtstats.tx_packets;
/*
 * Queue statistics operations, installed as netdev->stat_ops by
 * nsim_init_netdevsim().
 */
553 static const struct netdev_stat_ops nsim_stat_ops = {
554 .get_queue_stats_tx = nsim_get_queue_stats_tx,
555 .get_queue_stats_rx = nsim_get_queue_stats_rx,
556 .get_base_stats = nsim_get_base_stats,
/*
 * debugfs read handler for the "pp_hold" file: copy a 2-byte buffer to user
 * space through simple_read_from_buffer().
 *
 * NOTE(review): the return type line and the lines declaring and filling
 * "buf" are elided; presumably the buffer reflects whether ns->page is
 * currently held - confirm.
 */
560 nsim_pp_hold_read(struct file *file, char __user *data,
561 size_t count, loff_t *ppos)
563 struct netdevsim *ns = file->private_data;
569 return simple_read_from_buffer(data, count, ppos, buf, 2);
/*
 * debugfs write handler for the "pp_hold" file.
 *
 * Parses a boolean from user space. The first check compares it with whether
 * a page is currently held in ns->page (no state change is needed when they
 * match). The visible actions are allocating a page from queue 0's page pool
 * into ns->page, and returning the held page to its pool.
 *
 * NOTE(review): the return type line, local declarations, locking, the
 * branch structure selecting between allocate and release, error handling
 * for a device that is not running, and the return statements are elided
 * from this excerpt.
 */
573 nsim_pp_hold_write(struct file *file, const char __user *data,
574 size_t count, loff_t *ppos)
576 struct netdevsim *ns = file->private_data;
580 ret = kstrtobool_from_user(data, count, &val);
586 if (val == !!ns->page)
589 if (!netif_running(ns->netdev) && val) {
592 ns->page = page_pool_dev_alloc_pages(ns->rq[0].page_pool);
596 page_pool_put_full_page(ns->page->pp, ns->page, false);
/*
 * File operations of the "pp_hold" debugfs file created in nsim_create().
 * NOTE(review): one initializer line (606) is elided from this excerpt.
 */
605 static const struct file_operations nsim_pp_hold_fops = {
607 .read = nsim_pp_hold_read,
608 .write = nsim_pp_hold_write,
609 .llseek = generic_file_llseek,
610 .owner = THIS_MODULE,
/*
 * Netdev setup callback passed to alloc_netdev_mq() in nsim_create().
 *
 * Visible effects: assign a random hardware address, set tx_queue_len to 0,
 * clear IFF_MULTICAST, add private and feature flags, advertise
 * NETIF_F_HW_TC as a toggleable hardware feature, allow MTUs up to
 * ETH_MAX_MTU and advertise NETDEV_XDP_ACT_HW_OFFLOAD.
 *
 * NOTE(review): the continuation lines of the priv_flags and features
 * expressions, and a few other lines, are elided from this excerpt.
 */
613 static void nsim_setup(struct net_device *dev)
616 eth_hw_addr_random(dev);
618 dev->tx_queue_len = 0;
619 dev->flags &= ~IFF_MULTICAST;
620 dev->priv_flags |= IFF_LIVE_ADDR_CHANGE |
622 dev->features |= NETIF_F_HIGHDMA |
627 dev->hw_features |= NETIF_F_HW_TC;
628 dev->max_mtu = ETH_MAX_MTU;
629 dev->xdp_features = NETDEV_XDP_ACT_HW_OFFLOAD;
/*
 * Allocate the zero-initialised per-RX-queue state array ns->rq (one entry
 * per dev->num_rx_queues) and initialise each entry's skb queue head.
 *
 * NOTE(review): the allocation failure check and the return statements are
 * elided from this excerpt.
 */
632 static int nsim_queue_init(struct netdevsim *ns)
634 struct net_device *dev = ns->netdev;
637 ns->rq = kvcalloc(dev->num_rx_queues, sizeof(*ns->rq),
638 GFP_KERNEL_ACCOUNT | __GFP_RETRY_MAYFAIL);
642 for (i = 0; i < dev->num_rx_queues; i++)
643 skb_queue_head_init(&ns->rq[i].skb_queue);
/*
 * Purge every RX queue's pending skbs, tagging them with
 * SKB_DROP_REASON_QUEUE_PURGE.
 *
 * NOTE(review): the lines after the loop (presumably freeing ns->rq) are
 * elided from this excerpt - confirm.
 */
648 static void nsim_queue_free(struct netdevsim *ns)
650 struct net_device *dev = ns->netdev;
653 for (i = 0; i < dev->num_rx_queues; i++)
654 skb_queue_purge_reason(&ns->rq[i].skb_queue,
655 SKB_DROP_REASON_QUEUE_PURGE);
/*
 * Initialise and register a PF netdevsim (called from nsim_create() when the
 * port is a PF).
 *
 * Visible order: create the mock PHC, install nsim_netdev_ops and
 * nsim_stat_ops, create the UDP tunnel info, initialise the RX queues,
 * initialise BPF and MACsec support, then register the netdev. The trailing
 * calls are the error unwind path, undoing the steps in reverse order.
 *
 * NOTE(review): the error checks, the storing of "phc" into ns->phc, the
 * IPsec init call, the goto labels, some unwind calls and the return
 * statements are elided from this excerpt.
 */
661 static int nsim_init_netdevsim(struct netdevsim *ns)
663 struct mock_phc *phc;
666 phc = mock_phc_create(&ns->nsim_bus_dev->dev);
671 ns->netdev->netdev_ops = &nsim_netdev_ops;
672 ns->netdev->stat_ops = &nsim_stat_ops;
674 err = nsim_udp_tunnels_info_create(ns->nsim_dev, ns->netdev);
676 goto err_phc_destroy;
679 err = nsim_queue_init(ns);
681 goto err_utn_destroy;
683 err = nsim_bpf_init(ns);
687 nsim_macsec_init(ns);
690 err = register_netdevice(ns->netdev);
692 goto err_ipsec_teardown;
697 nsim_ipsec_teardown(ns);
698 nsim_macsec_teardown(ns);
704 nsim_udp_tunnels_info_destroy(ns->netdev);
706 mock_phc_destroy(ns->phc);
/*
 * Initialise and register a non-PF netdevsim: install nsim_vf_netdev_ops and
 * register the netdev.
 *
 * NOTE(review): the err declaration and the return statement are elided
 * from this excerpt.
 */
710 static int nsim_init_netdevsim_vf(struct netdevsim *ns)
714 ns->netdev->netdev_ops = &nsim_vf_netdev_ops;
716 err = register_netdevice(ns->netdev);
/*
 * Release the PF-only resources of @ns: the UDP tunnel info and the mock
 * PHC. Called from nsim_destroy() for PF ports.
 */
721 static void nsim_exit_netdevsim(struct netdevsim *ns)
723 nsim_udp_tunnels_info_destroy(ns->netdev);
724 mock_phc_destroy(ns->phc);
/*
 * Allocate, initialise and register a netdevsim netdev for @nsim_dev_port.
 *
 * The netdev is allocated with one queue per nsim_bus_dev->num_queues and
 * nsim_setup() as its setup callback; ERR_PTR(-ENOMEM) is returned on the
 * allocation failure path. After wiring up the back-pointers, parent device
 * and devlink port, PF ports go through nsim_init_netdevsim() and all other
 * ports through nsim_init_netdevsim_vf(). Finally the "pp_hold" debugfs file
 * is created under the port's debugfs directory.
 *
 * NOTE(review): the return type line, the err declaration, the allocation
 * NULL check, the error checks, the err_free_netdev unwind code and the
 * success return are elided from this excerpt.
 */
728 nsim_create(struct nsim_dev *nsim_dev, struct nsim_dev_port *nsim_dev_port)
730 struct net_device *dev;
731 struct netdevsim *ns;
734 dev = alloc_netdev_mq(sizeof(*ns), "eth%d", NET_NAME_UNKNOWN, nsim_setup,
735 nsim_dev->nsim_bus_dev->num_queues);
737 return ERR_PTR(-ENOMEM);
739 dev_net_set(dev, nsim_dev_net(nsim_dev));
740 ns = netdev_priv(dev);
742 u64_stats_init(&ns->syncp);
743 ns->nsim_dev = nsim_dev;
744 ns->nsim_dev_port = nsim_dev_port;
745 ns->nsim_bus_dev = nsim_dev->nsim_bus_dev;
746 SET_NETDEV_DEV(dev, &ns->nsim_bus_dev->dev);
747 SET_NETDEV_DEVLINK_PORT(dev, &nsim_dev_port->devlink_port);
748 nsim_ethtool_init(ns);
749 if (nsim_dev_port_is_pf(nsim_dev_port))
750 err = nsim_init_netdevsim(ns);
752 err = nsim_init_netdevsim_vf(ns);
754 goto err_free_netdev;
756 ns->pp_dfs = debugfs_create_file("pp_hold", 0600, nsim_dev_port->ddir,
757 ns, &nsim_pp_hold_fops);
/*
 * Tear down a netdevsim created by nsim_create().
 *
 * Visible order: remove the "pp_hold" debugfs file, unlink the device from
 * its peer in both directions, unregister the netdev, tear down MACsec and
 * IPsec state for PF ports, release the PF-only resources, and finally
 * return any page still held through pp_hold to its page pool.
 *
 * NOTE(review): the RTNL locking, the NULL checks on the peer and on
 * ns->page, the queue cleanup and the freeing of the netdev are elided from
 * this excerpt.
 */
766 void nsim_destroy(struct netdevsim *ns)
768 struct net_device *dev = ns->netdev;
769 struct netdevsim *peer;
771 debugfs_remove(ns->pp_dfs);
774 peer = rtnl_dereference(ns->peer);
776 RCU_INIT_POINTER(peer->peer, NULL);
777 RCU_INIT_POINTER(ns->peer, NULL);
778 unregister_netdevice(dev);
779 if (nsim_dev_port_is_pf(ns->nsim_dev_port)) {
780 nsim_macsec_teardown(ns);
781 nsim_ipsec_teardown(ns);
786 if (nsim_dev_port_is_pf(ns->nsim_dev_port))
787 nsim_exit_netdevsim(ns);
789 /* Put this intentionally late to exercise the orphaning path */
791 page_pool_put_full_page(ns->page->pp, ns->page, false);
/*
 * Return true when @dev uses nsim_netdev_ops, i.e. was set up through
 * nsim_init_netdevsim(). Devices set up with nsim_vf_netdev_ops do not
 * match this comparison.
 */
798 bool netdev_is_nsim(struct net_device *dev)
800 return dev->netdev_ops == &nsim_netdev_ops;
/*
 * rtnl_link_ops validate callback: sets an extack message pointing the user
 * at the sysfs new_device interface.
 *
 * NOTE(review): the return statement is elided; presumably an error code so
 * that creation through rtnetlink is refused - confirm.
 */
803 static int nsim_validate(struct nlattr *tb[], struct nlattr *data[],
804 struct netlink_ext_ack *extack)
806 NL_SET_ERR_MSG_MOD(extack,
807 "Please use: echo \"[ID] [PORT_COUNT] [NUM_QUEUES]\" > /sys/bus/netdevsim/new_device");
/*
 * rtnetlink link operations registered in nsim_module_init(); the only
 * visible callback is nsim_validate().
 * NOTE(review): one initializer line (812) is elided from this excerpt.
 */
811 static struct rtnl_link_ops nsim_link_ops __read_mostly = {
813 .validate = nsim_validate,
/*
 * Module entry point: initialise the device layer, then the bus layer, then
 * register the rtnetlink link ops.
 *
 * NOTE(review): the err declaration, the error checks, the unwind labels
 * and the return statements are elided from this excerpt.
 */
816 static int __init nsim_module_init(void)
820 err = nsim_dev_init();
824 err = nsim_bus_init();
828 err = rtnl_link_register(&nsim_link_ops);
/*
 * Module exit point: unregister the rtnetlink link ops.
 * NOTE(review): the remaining teardown calls (presumably for the bus and
 * device layers) are elided from this excerpt - confirm.
 */
841 static void __exit nsim_module_exit(void)
843 rtnl_link_unregister(&nsim_link_ops);
/* Module registration: entry/exit hooks, license, description and alias. */
848 module_init(nsim_module_init);
849 module_exit(nsim_module_exit);
850 MODULE_LICENSE("GPL");
851 MODULE_DESCRIPTION("Simulated networking device for testing");
852 MODULE_ALIAS_RTNL_LINK(DRV_NAME);