2 * Copyright (C) 2017 Netronome Systems, Inc.
4 * This software is licensed under the GNU General Public License Version 2,
5 * June 1991 as shown in the file COPYING in the top-level directory of this
8 * THE COPYRIGHT HOLDERS AND/OR OTHER PARTIES PROVIDE THE PROGRAM "AS IS"
9 * WITHOUT WARRANTY OF ANY KIND, EITHER EXPRESSED OR IMPLIED, INCLUDING,
10 * BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
11 * FOR A PARTICULAR PURPOSE. THE ENTIRE RISK AS TO THE QUALITY AND PERFORMANCE
12 * OF THE PROGRAM IS WITH YOU. SHOULD THE PROGRAM PROVE DEFECTIVE, YOU ASSUME
13 * THE COST OF ALL NECESSARY SERVICING, REPAIR OR CORRECTION.
16 #include <linux/debugfs.h>
17 #include <linux/etherdevice.h>
18 #include <linux/ethtool_netlink.h>
19 #include <linux/kernel.h>
20 #include <linux/module.h>
21 #include <linux/netdevice.h>
22 #include <linux/slab.h>
23 #include <net/netdev_queues.h>
24 #include <net/netdev_rx_queue.h>
25 #include <net/page_pool/helpers.h>
26 #include <net/netlink.h>
27 #include <net/net_shaper.h>
28 #include <net/netdev_lock.h>
29 #include <net/pkt_cls.h>
30 #include <net/rtnetlink.h>
31 #include <net/udp_tunnel.h>
32 #include <net/busy_poll.h>
34 #include "netdevsim.h"
/* Pull in the NETDEV_INTERNAL symbol namespace for this module. */
36 MODULE_IMPORT_NS("NETDEV_INTERNAL");
/* Used below both as the RX skb backlog limit and as the page pool size. */
38 #define NSIM_RING_SIZE 256
/* Queue @skb on @rq's skb_queue, from which nsim_rcv() later dequeues it.
 * If the queue already holds more than NSIM_RING_SIZE skbs the skb is freed
 * (the return for that path is not visible in this listing); after the
 * enqueue NET_RX_SUCCESS is returned.
 */
40 static int nsim_napi_rx(struct nsim_rq *rq, struct sk_buff *skb)
42 if (skb_queue_len(&rq->skb_queue) > NSIM_RING_SIZE) {
43 dev_kfree_skb_any(skb);
47 skb_queue_tail(&rq->skb_queue, skb);
48 return NET_RX_SUCCESS;
/* Pass @skb through __dev_forward_skb(); a non-zero result is returned as-is,
 * otherwise the skb is handed to nsim_napi_rx() and that result is returned.
 */
51 static int nsim_forward_skb(struct net_device *dev, struct sk_buff *skb,
54 return __dev_forward_skb(dev, skb) ?: nsim_napi_rx(rq, skb);
/* ndo_start_xmit handler (wired up in nsim_netdev_ops and nsim_vf_netdev_ops).
 * Looks up the peer netdevsim, picks one of the peer's RX queues, forwards the
 * skb to it and arms that queue's NAPI timer. Several lines of this function
 * (some declarations, branch bodies, labels and the counter increments) are
 * not visible in this listing.
 */
57 static netdev_tx_t nsim_start_xmit(struct sk_buff *skb, struct net_device *dev)
59 struct netdevsim *ns = netdev_priv(dev);
60 struct net_device *peer_dev;
61 unsigned int len = skb->len;
62 struct netdevsim *peer_ns;
63 struct netdev_config *cfg;
/* The action taken when nsim_ipsec_tx() returns false is not visible here. */
68 if (!nsim_ipsec_tx(ns, skb))
/* ns->peer is read through RCU. */
71 peer_ns = rcu_dereference(ns->peer);
75 peer_dev = peer_ns->netdev;
/* Choose the peer RX queue from the skb's queue mapping, wrapping with a
 * modulo when the mapping is not below the peer's RX queue count.
 */
76 rxq = skb_get_queue_mapping(skb);
77 if (rxq >= peer_dev->num_rx_queues)
78 rxq = rxq % peer_dev->num_rx_queues;
79 rq = peer_ns->rq[rxq];
/* True for a non-linear skb when header-data split is not enabled, or is
 * enabled with hds_thresh larger than the packet length. The statement this
 * condition guards is not visible here.
 */
82 if (skb_is_nonlinear(skb) &&
83 (cfg->hds_config != ETHTOOL_TCP_DATA_SPLIT_ENABLED ||
84 (cfg->hds_config == ETHTOOL_TCP_DATA_SPLIT_ENABLED &&
85 cfg->hds_thresh > len)))
88 skb_tx_timestamp(skb);
/* A NET_RX_DROP result from the forward is treated as the unlikely case. */
89 if (unlikely(nsim_forward_skb(peer_dev, skb, rq) == NET_RX_DROP))
/* Kick the RX side: start a 5us relative timer unless one is already active. */
92 if (!hrtimer_active(&rq->napi_timer))
93 hrtimer_start(&rq->napi_timer, us_to_ktime(5), HRTIMER_MODE_REL);
/* Counter updates are bracketed by u64_stats begin/end on ns->syncp. */
96 u64_stats_update_begin(&ns->syncp);
99 u64_stats_update_end(&ns->syncp);
106 u64_stats_update_begin(&ns->syncp);
108 u64_stats_update_end(&ns->syncp);
/* ndo_set_rx_mode handler; its body is not visible in this listing. */
112 static void nsim_set_rx_mode(struct net_device *dev)
/* ndo_change_mtu handler: store @new_mtu in dev->mtu with WRITE_ONCE().
 * An attached XDP program without frags support combined with a @new_mtu
 * above NSIM_XDP_MAX_MTU is singled out first; the result of that check
 * (presumably an error return) is not visible in this listing.
 */
116 static int nsim_change_mtu(struct net_device *dev, int new_mtu)
118 struct netdevsim *ns = netdev_priv(dev);
120 if (ns->xdp.prog && !ns->xdp.prog->aux->xdp_has_frags &&
121 new_mtu > NSIM_XDP_MAX_MTU)
124 WRITE_ONCE(dev->mtu, new_mtu);
/* ndo_get_stats64 handler: copy the device's tx_bytes, tx_packets and
 * tx_dropped counters into @stats. The reads are repeated until
 * u64_stats_fetch_retry() on ns->syncp reports no retry is needed.
 */
130 nsim_get_stats64(struct net_device *dev, struct rtnl_link_stats64 *stats)
132 struct netdevsim *ns = netdev_priv(dev);
136 start = u64_stats_fetch_begin(&ns->syncp);
137 stats->tx_bytes = ns->tx_bytes;
138 stats->tx_packets = ns->tx_packets;
139 stats->tx_dropped = ns->tx_dropped;
140 } while (u64_stats_fetch_retry(&ns->syncp, start));
/* TC block callback: forwards all arguments to nsim_bpf_setup_tc_block_cb()
 * and returns its result.
 */
144 nsim_setup_tc_block_cb(enum tc_setup_type type, void *type_data, void *cb_priv)
146 return nsim_bpf_setup_tc_block_cb(type, type_data, cb_priv);
/* ndo_set_vf_mac handler: copy @mac (ETH_ALEN bytes) into the config slot of
 * VF @vf. A @vf not below nsim_dev_get_vfs() or a multicast @mac is caught by
 * the check below; its return statement is not visible in this listing.
 */
149 static int nsim_set_vf_mac(struct net_device *dev, int vf, u8 *mac)
151 struct netdevsim *ns = netdev_priv(dev);
152 struct nsim_dev *nsim_dev = ns->nsim_dev;
154 /* Only refuse multicast addresses, zero address can mean unset/any. */
155 if (vf >= nsim_dev_get_vfs(nsim_dev) || is_multicast_ether_addr(mac))
157 memcpy(nsim_dev->vfconfigs[vf].vf_mac, mac, ETH_ALEN);
/* ndo_set_vf_vlan handler: record @vlan, @qos and @vlan_proto for VF @vf.
 * The check below catches a @vf not below nsim_dev_get_vfs(), a @vlan above
 * 4095 or a @qos above 7; its return statement is not visible in this listing.
 */
162 static int nsim_set_vf_vlan(struct net_device *dev, int vf,
163 u16 vlan, u8 qos, __be16 vlan_proto)
165 struct netdevsim *ns = netdev_priv(dev);
166 struct nsim_dev *nsim_dev = ns->nsim_dev;
168 if (vf >= nsim_dev_get_vfs(nsim_dev) || vlan > 4095 || qos > 7)
171 nsim_dev->vfconfigs[vf].vlan = vlan;
172 nsim_dev->vfconfigs[vf].qos = qos;
173 nsim_dev->vfconfigs[vf].vlan_proto = vlan_proto;
/* ndo_set_vf_rate handler: record @min and @max as the TX rates of VF @vf.
 * In switchdev mode an error is logged pointing the user at the devlink API.
 * The return statements of both checks are not visible in this listing.
 */
178 static int nsim_set_vf_rate(struct net_device *dev, int vf, int min, int max)
180 struct netdevsim *ns = netdev_priv(dev);
181 struct nsim_dev *nsim_dev = ns->nsim_dev;
183 if (nsim_esw_mode_is_switchdev(ns->nsim_dev)) {
184 pr_err("Not supported in switchdev mode. Please use devlink API.\n");
/* @vf must be below the number of VFs reported by nsim_dev_get_vfs(). */
188 if (vf >= nsim_dev_get_vfs(nsim_dev))
191 nsim_dev->vfconfigs[vf].min_tx_rate = min;
192 nsim_dev->vfconfigs[vf].max_tx_rate = max;
/* ndo_set_vf_spoofchk handler: store @val as the spoofchk_enabled flag of
 * VF @vf. An out-of-range @vf is caught first (return not visible here).
 */
197 static int nsim_set_vf_spoofchk(struct net_device *dev, int vf, bool val)
199 struct netdevsim *ns = netdev_priv(dev);
200 struct nsim_dev *nsim_dev = ns->nsim_dev;
202 if (vf >= nsim_dev_get_vfs(nsim_dev))
204 nsim_dev->vfconfigs[vf].spoofchk_enabled = val;
/* ndo_set_vf_rss_query_en handler: store @val as the rss_query_enabled flag
 * of VF @vf. An out-of-range @vf is caught first (return not visible here).
 */
209 static int nsim_set_vf_rss_query_en(struct net_device *dev, int vf, bool val)
211 struct netdevsim *ns = netdev_priv(dev);
212 struct nsim_dev *nsim_dev = ns->nsim_dev;
214 if (vf >= nsim_dev_get_vfs(nsim_dev))
216 nsim_dev->vfconfigs[vf].rss_query_enabled = val;
/* ndo_set_vf_trust handler: store @val as the trusted flag of VF @vf.
 * An out-of-range @vf is caught first (return not visible here).
 */
221 static int nsim_set_vf_trust(struct net_device *dev, int vf, bool val)
223 struct netdevsim *ns = netdev_priv(dev);
224 struct nsim_dev *nsim_dev = ns->nsim_dev;
226 if (vf >= nsim_dev_get_vfs(nsim_dev))
228 nsim_dev->vfconfigs[vf].trusted = val;
/* ndo_get_vf_config handler: fill @ivi from the stored configuration of
 * VF @vf (link state, TX rates, VLAN settings, MAC and the boolean flags).
 * An out-of-range @vf is caught first (return not visible in this listing).
 */
234 nsim_get_vf_config(struct net_device *dev, int vf, struct ifla_vf_info *ivi)
236 struct netdevsim *ns = netdev_priv(dev);
237 struct nsim_dev *nsim_dev = ns->nsim_dev;
239 if (vf >= nsim_dev_get_vfs(nsim_dev))
243 ivi->linkstate = nsim_dev->vfconfigs[vf].link_state;
244 ivi->min_tx_rate = nsim_dev->vfconfigs[vf].min_tx_rate;
245 ivi->max_tx_rate = nsim_dev->vfconfigs[vf].max_tx_rate;
246 ivi->vlan = nsim_dev->vfconfigs[vf].vlan;
247 ivi->vlan_proto = nsim_dev->vfconfigs[vf].vlan_proto;
248 ivi->qos = nsim_dev->vfconfigs[vf].qos;
249 memcpy(&ivi->mac, nsim_dev->vfconfigs[vf].vf_mac, ETH_ALEN);
250 ivi->spoofchk = nsim_dev->vfconfigs[vf].spoofchk_enabled;
251 ivi->trusted = nsim_dev->vfconfigs[vf].trusted;
252 ivi->rss_query_en = nsim_dev->vfconfigs[vf].rss_query_enabled;
/* ndo_set_vf_link_state handler: store @state as the link state of VF @vf.
 * An out-of-range @vf is caught first. The switch header, the handling of
 * values other than the three listed cases and the returns are not visible
 * in this listing.
 */
257 static int nsim_set_vf_link_state(struct net_device *dev, int vf, int state)
259 struct netdevsim *ns = netdev_priv(dev);
260 struct nsim_dev *nsim_dev = ns->nsim_dev;
262 if (vf >= nsim_dev_get_vfs(nsim_dev))
/* The three link states that share one case body. */
266 case IFLA_VF_LINK_STATE_AUTO:
267 case IFLA_VF_LINK_STATE_ENABLE:
268 case IFLA_VF_LINK_STATE_DISABLE:
274 nsim_dev->vfconfigs[vf].link_state = state;
/* Report taprio statistics: both window_drops and tx_overruns are set to 0. */
279 static void nsim_taprio_stats(struct tc_taprio_qopt_stats *stats)
281 stats->window_drops = 0;
282 stats->tx_overruns = 0;
/* Handle a taprio offload request by dispatching on offload->cmd.
 * REPLACE and DESTROY share one case body (not visible in this listing);
 * STATS fills offload->stats through nsim_taprio_stats(). The handling of
 * other commands and the return value are not visible either.
 */
285 static int nsim_setup_tc_taprio(struct net_device *dev,
286 struct tc_taprio_qopt_offload *offload)
290 switch (offload->cmd) {
291 case TAPRIO_CMD_REPLACE:
292 case TAPRIO_CMD_DESTROY:
294 case TAPRIO_CMD_STATS:
295 nsim_taprio_stats(&offload->stats);
/* File-scope list head. NOTE(review): presumably the driver's block callback
 * list handed to flow_block_cb_setup_simple() - the use is not visible here.
 */
304 static LIST_HEAD(nsim_block_cb_list);
/* ndo_setup_tc handler: dispatch on the setup type.
 * TC_SETUP_QDISC_TAPRIO goes to nsim_setup_tc_taprio(); another case (its
 * label is not visible in this listing) goes through
 * flow_block_cb_setup_simple() with nsim_setup_tc_block_cb as the callback.
 */
307 nsim_setup_tc(struct net_device *dev, enum tc_setup_type type, void *type_data)
309 struct netdevsim *ns = netdev_priv(dev);
312 case TC_SETUP_QDISC_TAPRIO:
313 return nsim_setup_tc_taprio(dev, type_data);
315 return flow_block_cb_setup_simple(type_data,
317 nsim_setup_tc_block_cb,
/* ndo_set_features handler. When NETIF_F_HW_TC is currently set on the device
 * but absent from the requested @features (i.e. it is being turned off), the
 * result of nsim_bpf_disable_tc() is returned. The return for all other cases
 * is not visible in this listing.
 */
325 nsim_set_features(struct net_device *dev, netdev_features_t features)
327 struct netdevsim *ns = netdev_priv(dev);
329 if ((dev->features & NETIF_F_HW_TC) > (features & NETIF_F_HW_TC))
330 return nsim_bpf_disable_tc(ns);
/* ndo_get_iflink handler: compute iflink as the peer netdev's ifindex when a
 * peer is linked, otherwise as the device's own ifindex. The peer pointer is
 * read with rcu_dereference(); the locking around it and the final return are
 * not visible in this listing.
 */
335 static int nsim_get_iflink(const struct net_device *dev)
337 struct netdevsim *nsim, *peer;
340 nsim = netdev_priv(dev);
343 peer = rcu_dereference(nsim->peer);
344 iflink = peer ? READ_ONCE(peer->netdev->ifindex) :
345 READ_ONCE(dev->ifindex);
/* Deliver queued skbs from @rq to the stack, at most @budget of them.
 * Each skb is dequeued, tagged with the queue's NAPI id and passed to
 * netif_receive_skb(). An empty queue is checked for on every iteration (the
 * statement it guards, and the return value, are not visible in this listing).
 */
351 static int nsim_rcv(struct nsim_rq *rq, int budget)
356 for (i = 0; i < budget; i++) {
357 if (skb_queue_empty(&rq->skb_queue))
360 skb = skb_dequeue(&rq->skb_queue);
361 skb_mark_napi_id(skb, &rq->napi);
362 netif_receive_skb(skb);
/* NAPI poll callback: recover the owning nsim_rq from @napi, process up to
 * @budget skbs with nsim_rcv() and report the work through
 * napi_complete_done(). Any condition guarding the completion call and the
 * return value are not visible in this listing.
 */
368 static int nsim_poll(struct napi_struct *napi, int budget)
370 struct nsim_rq *rq = container_of(napi, struct nsim_rq, napi);
373 done = nsim_rcv(rq, budget);
375 napi_complete_done(napi, done);
/* Create a page pool sized NSIM_RING_SIZE for the device behind @napi, using
 * bidirectional DMA. PTR_ERR() of the pool is returned on the error path.
 * NOTE(review): the remaining initializers, the error check, the store
 * through @p and the success return are not visible in this listing.
 */
380 static int nsim_create_page_pool(struct page_pool **p, struct napi_struct *napi)
382 struct page_pool_params params = {
384 .pool_size = NSIM_RING_SIZE,
386 .dev = &napi->dev->dev,
388 .dma_dir = DMA_BIDIRECTIONAL,
391 struct page_pool *pool;
/* Pass the address of the parameter block declared above. */
393 pool = page_pool_create(&params);
395 return PTR_ERR(pool);
/* Set up NAPI and page pools for every RX queue of @ns's netdev.
 * Error handling labels and the returns are not visible in this listing.
 */
401 static int nsim_init_napi(struct netdevsim *ns)
403 struct net_device *dev = ns->netdev;
/* First pass: register one NAPI instance (nsim_poll) per RX queue. */
407 for (i = 0; i < dev->num_rx_queues; i++) {
410 netif_napi_add_config_locked(dev, &rq->napi, nsim_poll, i);
/* Second pass: create a page pool per RX queue. */
413 for (i = 0; i < dev->num_rx_queues; i++) {
416 err = nsim_create_page_pool(&rq->page_pool, &rq->napi);
/* Unwind: destroy page pools and clear the pointers, then delete the NAPIs. */
425 page_pool_destroy(ns->rq[i]->page_pool);
426 ns->rq[i]->page_pool = NULL;
429 for (i = 0; i < dev->num_rx_queues; i++)
430 __netif_napi_del_locked(&ns->rq[i]->napi);
/* hrtimer callback for an RX queue's napi_timer: schedule the queue's NAPI
 * and do not re-arm the timer.
 */
435 static enum hrtimer_restart nsim_napi_schedule(struct hrtimer *timer)
439 rq = container_of(timer, struct nsim_rq, napi_timer);
440 napi_schedule(&rq->napi);
442 return HRTIMER_NORESTART;
/* Initialise @rq's napi_timer on CLOCK_MONOTONIC with nsim_napi_schedule() as
 * its callback (the remaining hrtimer_setup() argument is not visible here).
 */
445 static void nsim_rq_timer_init(struct nsim_rq *rq)
447 hrtimer_setup(&rq->napi_timer, nsim_napi_schedule, CLOCK_MONOTONIC,
/* For every RX queue: associate the queue with its NAPI instance and enable
 * that NAPI.
 */
451 static void nsim_enable_napi(struct netdevsim *ns)
453 struct net_device *dev = ns->netdev;
456 for (i = 0; i < dev->num_rx_queues; i++) {
457 struct nsim_rq *rq = ns->rq[i];
459 netif_queue_set_napi(dev, i, NETDEV_QUEUE_TYPE_RX, &rq->napi);
460 napi_enable_locked(&rq->napi);
/* ndo_open handler: with the netdev lock asserted held, set up NAPI and page
 * pools via nsim_init_napi() and then enable NAPI on all RX queues. The error
 * check on nsim_init_napi() and the returns are not visible in this listing.
 */
464 static int nsim_open(struct net_device *dev)
466 struct netdevsim *ns = netdev_priv(dev);
469 netdev_assert_locked(dev);
471 err = nsim_init_napi(ns);
475 nsim_enable_napi(ns);
/* Tear down what nsim_init_napi()/nsim_enable_napi() set up: disable and
 * delete the NAPI of every RX queue, then destroy each queue's page pool and
 * clear the pointer.
 */
480 static void nsim_del_napi(struct netdevsim *ns)
482 struct net_device *dev = ns->netdev;
485 for (i = 0; i < dev->num_rx_queues; i++) {
486 struct nsim_rq *rq = ns->rq[i];
488 napi_disable_locked(&rq->napi);
489 __netif_napi_del_locked(&rq->napi);
493 for (i = 0; i < dev->num_rx_queues; i++) {
494 page_pool_destroy(ns->rq[i]->page_pool);
495 ns->rq[i]->page_pool = NULL;
/* ndo_stop handler: with the netdev lock asserted held, drop carrier on this
 * device and on the peer's netdev. The NULL check on the peer, any further
 * teardown and the return are not visible in this listing.
 */
499 static int nsim_stop(struct net_device *dev)
501 struct netdevsim *ns = netdev_priv(dev);
502 struct netdevsim *peer;
504 netdev_assert_locked(dev);
506 netif_carrier_off(dev);
507 peer = rtnl_dereference(ns->peer);
509 netif_carrier_off(peer->netdev);
/* net_shaper_ops .set callback; its body is not visible in this listing. */
516 static int nsim_shaper_set(struct net_shaper_binding *binding,
517 const struct net_shaper *shaper,
518 struct netlink_ext_ack *extack)
/* net_shaper_ops .delete callback; its body is not visible in this listing. */
523 static int nsim_shaper_del(struct net_shaper_binding *binding,
524 const struct net_shaper_handle *handle,
525 struct netlink_ext_ack *extack)
/* net_shaper_ops .group callback; one parameter line and the body are not
 * visible in this listing.
 */
530 static int nsim_shaper_group(struct net_shaper_binding *binding,
532 const struct net_shaper *leaves,
533 const struct net_shaper *root,
534 struct netlink_ext_ack *extack)
/* net_shaper_ops .capabilities callback; its body is not visible in this
 * listing.
 */
539 static void nsim_shaper_cap(struct net_shaper_binding *binding,
540 enum net_shaper_scope scope,
541 unsigned long *flags)
/* Shaper callbacks, referenced from nsim_netdev_ops.net_shaper_ops. */
546 static const struct net_shaper_ops nsim_shaper_ops = {
547 .set = nsim_shaper_set,
548 .delete = nsim_shaper_del,
549 .group = nsim_shaper_group,
550 .capabilities = nsim_shaper_cap,
/* net_device_ops installed by nsim_init_netdevsim(); netdev_is_nsim() also
 * uses this table to recognise such devices. Includes the VF configuration
 * callbacks, open/stop and the shaper ops.
 */
553 static const struct net_device_ops nsim_netdev_ops = {
554 .ndo_start_xmit = nsim_start_xmit,
555 .ndo_set_rx_mode = nsim_set_rx_mode,
556 .ndo_set_mac_address = eth_mac_addr,
557 .ndo_validate_addr = eth_validate_addr,
558 .ndo_change_mtu = nsim_change_mtu,
559 .ndo_get_stats64 = nsim_get_stats64,
560 .ndo_set_vf_mac = nsim_set_vf_mac,
561 .ndo_set_vf_vlan = nsim_set_vf_vlan,
562 .ndo_set_vf_rate = nsim_set_vf_rate,
563 .ndo_set_vf_spoofchk = nsim_set_vf_spoofchk,
564 .ndo_set_vf_trust = nsim_set_vf_trust,
565 .ndo_get_vf_config = nsim_get_vf_config,
566 .ndo_set_vf_link_state = nsim_set_vf_link_state,
567 .ndo_set_vf_rss_query_en = nsim_set_vf_rss_query_en,
568 .ndo_setup_tc = nsim_setup_tc,
569 .ndo_set_features = nsim_set_features,
570 .ndo_get_iflink = nsim_get_iflink,
572 .ndo_open = nsim_open,
573 .ndo_stop = nsim_stop,
574 .net_shaper_ops = &nsim_shaper_ops,
/* Reduced net_device_ops installed by nsim_init_netdevsim_vf(): the entries
 * visible here omit the VF configuration, iflink, open/stop and shaper
 * callbacks present in nsim_netdev_ops.
 */
577 static const struct net_device_ops nsim_vf_netdev_ops = {
578 .ndo_start_xmit = nsim_start_xmit,
579 .ndo_set_rx_mode = nsim_set_rx_mode,
580 .ndo_set_mac_address = eth_mac_addr,
581 .ndo_validate_addr = eth_validate_addr,
582 .ndo_change_mtu = nsim_change_mtu,
583 .ndo_get_stats64 = nsim_get_stats64,
584 .ndo_setup_tc = nsim_setup_tc,
585 .ndo_set_features = nsim_set_features,
588 /* We don't have true per-queue stats, yet, so do some random fakery here.
589 * Only report stuff for queue 0. */
/* Per-queue RX stats callback, derived from the device-wide counters returned
 * by nsim_get_stats64(): packets is the device total minus one when the total
 * is non-zero, bytes is the device total. Any condition on @idx guarding the
 * assignments is not visible in this listing.
 */
591 static void nsim_get_queue_stats_rx(struct net_device *dev, int idx,
592 struct netdev_queue_stats_rx *stats)
594 struct rtnl_link_stats64 rtstats = {};
597 nsim_get_stats64(dev, &rtstats);
599 stats->packets = rtstats.rx_packets - !!rtstats.rx_packets;
600 stats->bytes = rtstats.rx_bytes;
/* Per-queue TX stats callback, derived from the device-wide counters returned
 * by nsim_get_stats64(): packets is the device total minus one when the total
 * is non-zero, bytes is the device total. Any condition on @idx guarding the
 * assignments is not visible in this listing.
 */
603 static void nsim_get_queue_stats_tx(struct net_device *dev, int idx,
604 struct netdev_queue_stats_tx *stats)
606 struct rtnl_link_stats64 rtstats = {};
609 nsim_get_stats64(dev, &rtstats);
611 stats->packets = rtstats.tx_packets - !!rtstats.tx_packets;
612 stats->bytes = rtstats.tx_bytes;
/* Base stats callback: report 1 packet in each direction when the matching
 * device-wide counter is non-zero, 0 otherwise. This is the one packet that
 * the per-queue callbacks subtract from the device total. Other fields set
 * here, if any, are not visible in this listing.
 */
615 static void nsim_get_base_stats(struct net_device *dev,
616 struct netdev_queue_stats_rx *rx,
617 struct netdev_queue_stats_tx *tx)
619 struct rtnl_link_stats64 rtstats = {};
621 nsim_get_stats64(dev, &rtstats);
623 rx->packets = !!rtstats.rx_packets;
625 tx->packets = !!rtstats.tx_packets;
/* Queue statistics callbacks, installed as stat_ops in nsim_init_netdevsim(). */
629 static const struct netdev_stat_ops nsim_stat_ops = {
630 .get_queue_stats_tx = nsim_get_queue_stats_tx,
631 .get_queue_stats_rx = nsim_get_queue_stats_rx,
632 .get_base_stats = nsim_get_base_stats,
/* Allocate a zeroed nsim_rq (GFP_KERNEL_ACCOUNT) and initialise its skb queue
 * and NAPI timer. The allocation-failure check and the return statement are
 * not visible in this listing.
 */
635 static struct nsim_rq *nsim_queue_alloc(void)
639 rq = kzalloc(sizeof(*rq), GFP_KERNEL_ACCOUNT);
643 skb_queue_head_init(&rq->skb_queue);
644 nsim_rq_timer_init(rq);
/* Quiesce @rq before release: cancel its NAPI timer and purge any skbs still
 * queued, tagging them with SKB_DROP_REASON_QUEUE_PURGE. Freeing of @rq
 * itself is not visible in this listing.
 */
648 static void nsim_queue_free(struct nsim_rq *rq)
650 hrtimer_cancel(&rq->napi_timer);
651 skb_queue_purge_reason(&rq->skb_queue, SKB_DROP_REASON_QUEUE_PURGE);
655 /* Queue reset mode is controlled by ns->rq_reset_mode.
656 * - normal - new NAPI new pool (old NAPI enabled when new added)
657 * - mode 1 - allocate new pool (NAPI is only disabled / enabled)
658 * - mode 2 - new NAPI new pool (old NAPI removed before new added)
659 * - mode 3 - new NAPI new pool (old NAPI disabled when new added) */
/* Per-queue scratch memory exchanged between the queue management callbacks;
 * its size is reported through ndo_queue_mem_size. The callbacks also use an
 * rq member whose declaration is not visible in this listing.
 */
661 struct nsim_queue_mem {
/* Page pool handed over in reset mode 1. */
663 struct page_pool *pp;
/* ndo_queue_mem_alloc handler: prepare replacement resources for RX queue
 * @idx in @per_queue_mem. What is allocated depends on ns->rq_reset_mode.
 * The results of the first two checks, the error checks and the final return
 * are not visible in this listing.
 */
667 nsim_queue_mem_alloc(struct net_device *dev, void *per_queue_mem, int idx)
669 struct nsim_queue_mem *qmem = per_queue_mem;
670 struct netdevsim *ns = netdev_priv(dev);
/* Modes above 3 are singled out here. */
673 if (ns->rq_reset_mode > 3)
/* Mode 1: only a new page pool is created, bound to the queue's existing NAPI. */
676 if (ns->rq_reset_mode == 1) {
677 if (!netif_running(ns->netdev))
679 return nsim_create_page_pool(&qmem->pp, &ns->rq[idx]->napi);
/* Other modes: allocate a whole new queue with its own page pool. */
682 qmem->rq = nsim_queue_alloc();
686 err = nsim_create_page_pool(&qmem->rq->page_pool, &qmem->rq->napi);
/* Only mode 0 registers the new NAPI here; modes 2 and 3 register it in
 * nsim_queue_start().
 */
690 if (!ns->rq_reset_mode)
691 netif_napi_add_config_locked(dev, &qmem->rq->napi, nsim_poll,
/* Releases the queue allocated above (presumably the error path). */
697 nsim_queue_free(qmem->rq);
/* ndo_queue_mem_free handler: release what @per_queue_mem holds - the page
 * pool in qmem->pp, and the queue in qmem->rq together with its page pool.
 * In mode 0 the queue's NAPI is deleted as well. Any guards around these
 * calls are not visible in this listing.
 */
701 static void nsim_queue_mem_free(struct net_device *dev, void *per_queue_mem)
703 struct nsim_queue_mem *qmem = per_queue_mem;
704 struct netdevsim *ns = netdev_priv(dev);
706 page_pool_destroy(qmem->pp);
708 if (!ns->rq_reset_mode)
709 netif_napi_del_locked(&qmem->rq->napi);
710 page_pool_destroy(qmem->rq->page_pool);
711 nsim_queue_free(qmem->rq);
/* ndo_queue_start handler: bring RX queue @idx up with the resources prepared
 * in @per_queue_mem, following ns->rq_reset_mode. In modes 2 and 3 the old
 * NAPI is deleted and the new one added here, in opposite orders; finally the
 * new queue is installed in ns->rq[idx] and its NAPI enabled. Some lines
 * (continuation arguments, returns) are not visible in this listing.
 */
716 nsim_queue_start(struct net_device *dev, void *per_queue_mem, int idx)
718 struct nsim_queue_mem *qmem = per_queue_mem;
719 struct netdevsim *ns = netdev_priv(dev);
721 netdev_assert_locked(dev);
/* Mode 1 keeps the existing NAPI: install the new page pool and re-enable it. */
723 if (ns->rq_reset_mode == 1) {
724 ns->rq[idx]->page_pool = qmem->pp;
725 napi_enable_locked(&ns->rq[idx]->napi);
729 /* netif_napi_add()/_del() should normally be called from alloc/free,
730 * here we want to test various call orders.
732 if (ns->rq_reset_mode == 2) {
733 netif_napi_del_locked(&ns->rq[idx]->napi);
734 netif_napi_add_config_locked(dev, &qmem->rq->napi, nsim_poll,
736 } else if (ns->rq_reset_mode == 3) {
737 netif_napi_add_config_locked(dev, &qmem->rq->napi, nsim_poll,
739 netif_napi_del_locked(&ns->rq[idx]->napi);
742 ns->rq[idx] = qmem->rq;
743 napi_enable_locked(&ns->rq[idx]->napi);
/* ndo_queue_stop handler: disable the NAPI of RX queue @idx and hand the
 * resources being replaced back through @per_queue_mem. The return is not
 * visible in this listing.
 */
748 static int nsim_queue_stop(struct net_device *dev, void *per_queue_mem, int idx)
750 struct nsim_queue_mem *qmem = per_queue_mem;
751 struct netdevsim *ns = netdev_priv(dev);
753 netdev_assert_locked(dev);
755 napi_disable_locked(&ns->rq[idx]->napi);
/* Mode 1 hands back only the page pool, with direct recycling disabled. */
757 if (ns->rq_reset_mode == 1) {
758 qmem->pp = ns->rq[idx]->page_pool;
759 page_pool_disable_direct_recycling(qmem->pp);
/* Hand back the queue itself (the enclosing branch is not visible here). */
761 qmem->rq = ns->rq[idx];
/* Queue management callbacks, installed as queue_mgmt_ops in
 * nsim_init_netdevsim(). Per-queue memory is a struct nsim_queue_mem.
 */
767 static const struct netdev_queue_mgmt_ops nsim_queue_mgmt_ops = {
768 .ndo_queue_mem_size = sizeof(struct nsim_queue_mem),
769 .ndo_queue_mem_alloc = nsim_queue_mem_alloc,
770 .ndo_queue_mem_free = nsim_queue_mem_free,
771 .ndo_queue_start = nsim_queue_start,
772 .ndo_queue_stop = nsim_queue_stop,
/* File write handler (nsim_qreset_fops): parse two unsigned integers,
 * "<queue> <mode>", from user space and restart that RX queue with
 * ns->rq_reset_mode temporarily set to <mode>. Error returns, the buffer
 * declaration and the final return are not visible in this listing.
 */
776 nsim_qreset_write(struct file *file, const char __user *data,
777 size_t count, loff_t *ppos)
779 struct netdevsim *ns = file->private_data;
780 unsigned int queue, mode;
/* Writes that would fill buf completely or overflow it are caught here. */
784 if (count >= sizeof(buf))
786 if (copy_from_user(buf, data, count))
790 ret = sscanf(buf, "%u %u", &queue, &mode);
794 netdev_lock(ns->netdev);
/* A queue index not below real_num_rx_queues is caught here. */
795 if (queue >= ns->netdev->real_num_rx_queues) {
/* The mode is in effect only for the duration of the restart. */
800 ns->rq_reset_mode = mode;
801 ret = netdev_rx_queue_restart(ns->netdev, queue);
802 ns->rq_reset_mode = 0;
808 netdev_unlock(ns->netdev);
/* Write-only file operations backed by nsim_qreset_write(); other members,
 * if any, are not visible in this listing.
 */
812 static const struct file_operations nsim_qreset_fops = {
814 .write = nsim_qreset_write,
815 .owner = THIS_MODULE,
/* Read handler for the "pp_hold" debugfs file: return 2 bytes from a local
 * buffer via simple_read_from_buffer(). How the buffer is filled is not
 * visible in this listing.
 */
819 nsim_pp_hold_read(struct file *file, char __user *data,
820 size_t count, loff_t *ppos)
822 struct netdevsim *ns = file->private_data;
828 return simple_read_from_buffer(data, count, ppos, buf, 2);
/* Write handler for the "pp_hold" debugfs file: parse a boolean and either
 * take a page from RX queue 0's page pool into ns->page or give the held page
 * back to its pool. Locking, branch structure, error codes and the return
 * are not visible in this listing.
 */
832 nsim_pp_hold_write(struct file *file, const char __user *data,
833 size_t count, loff_t *ppos)
835 struct netdevsim *ns = file->private_data;
839 ret = kstrtobool_from_user(data, count, &val);
/* Requested state already matches whether a page is currently held. */
845 if (val == !!ns->page)
/* Asking to hold a page while the netdev is not running is caught here. */
848 if (!netif_running(ns->netdev) && val) {
851 ns->page = page_pool_dev_alloc_pages(ns->rq[0]->page_pool);
855 page_pool_put_full_page(ns->page->pp, ns->page, false);
/* File operations for the "pp_hold" debugfs file created in nsim_create(). */
864 static const struct file_operations nsim_pp_hold_fops = {
866 .read = nsim_pp_hold_read,
867 .write = nsim_pp_hold_write,
868 .llseek = generic_file_llseek,
869 .owner = THIS_MODULE,
/* Setup callback passed to alloc_netdev_mq() in nsim_create(): assign a
 * random MAC address, use a zero TX queue length, clear IFF_MULTICAST and set
 * private flags, features, max MTU and XDP features. The continuation lines
 * of the flag/feature assignments are not visible in this listing.
 */
872 static void nsim_setup(struct net_device *dev)
875 eth_hw_addr_random(dev);
877 dev->tx_queue_len = 0;
878 dev->flags &= ~IFF_MULTICAST;
879 dev->priv_flags |= IFF_LIVE_ADDR_CHANGE |
881 dev->features |= NETIF_F_HIGHDMA |
887 dev->hw_features |= NETIF_F_HW_TC |
893 dev->max_mtu = ETH_MAX_MTU;
894 dev->xdp_features = NETDEV_XDP_ACT_HW_OFFLOAD;
/* Allocate the ns->rq pointer array (one slot per RX queue) and populate each
 * slot with nsim_queue_alloc(). Failure handling and the return are not
 * visible in this listing.
 */
897 static int nsim_queue_init(struct netdevsim *ns)
899 struct net_device *dev = ns->netdev;
902 ns->rq = kcalloc(dev->num_rx_queues, sizeof(*ns->rq),
907 for (i = 0; i < dev->num_rx_queues; i++) {
908 ns->rq[i] = nsim_queue_alloc();
/* Release every RX queue with nsim_queue_free(). Freeing of the ns->rq array
 * itself is not visible in this listing.
 */
922 static void nsim_queue_uninit(struct netdevsim *ns)
924 struct net_device *dev = ns->netdev;
927 for (i = 0; i < dev->num_rx_queues; i++)
928 nsim_queue_free(ns->rq[i]);
/* Initialise and register a netdevsim netdev using nsim_netdev_ops (called
 * from nsim_create() for PF ports). Sets up, in order: mock PHC, ops tables,
 * UDP tunnel info, RX queues, BPF, MACsec, then registers the netdev. The
 * tail of the function unwinds these steps; labels, error checks and returns
 * are not all visible in this listing.
 */
934 static int nsim_init_netdevsim(struct netdevsim *ns)
936 struct mock_phc *phc;
939 phc = mock_phc_create(&ns->nsim_bus_dev->dev);
944 ns->netdev->netdev_ops = &nsim_netdev_ops;
945 ns->netdev->stat_ops = &nsim_stat_ops;
946 ns->netdev->queue_mgmt_ops = &nsim_queue_mgmt_ops;
947 netdev_lockdep_set_classes(ns->netdev);
949 err = nsim_udp_tunnels_info_create(ns->nsim_dev, ns->netdev);
951 goto err_phc_destroy;
954 err = nsim_queue_init(ns);
956 goto err_utn_destroy;
958 err = nsim_bpf_init(ns);
962 nsim_macsec_init(ns);
965 err = register_netdevice(ns->netdev);
967 goto err_ipsec_teardown;
/* With CONFIG_DEBUG_NET, attach a per-netdev debug notifier; the callback
 * pointer is cleared again on the path at line 974 so nsim_destroy() can tell
 * whether to unregister it.
 */
970 if (IS_ENABLED(CONFIG_DEBUG_NET)) {
971 ns->nb.notifier_call = netdev_debug_event;
972 if (register_netdevice_notifier_dev_net(ns->netdev, &ns->nb,
974 ns->nb.notifier_call = NULL;
/* Error unwinding, in reverse order of setup. */
980 nsim_ipsec_teardown(ns);
981 nsim_macsec_teardown(ns);
984 nsim_queue_uninit(ns);
987 nsim_udp_tunnels_info_destroy(ns->netdev);
989 mock_phc_destroy(ns->phc);
/* Initialise a netdev with the reduced nsim_vf_netdev_ops table and register
 * it (called from nsim_create() for non-PF ports). The return is not visible
 * in this listing.
 */
993 static int nsim_init_netdevsim_vf(struct netdevsim *ns)
997 ns->netdev->netdev_ops = &nsim_vf_netdev_ops;
999 err = register_netdevice(ns->netdev);
/* Release the UDP tunnel info and the mock PHC created by
 * nsim_init_netdevsim().
 */
1004 static void nsim_exit_netdevsim(struct netdevsim *ns)
1006 nsim_udp_tunnels_info_destroy(ns->netdev);
1007 mock_phc_destroy(ns->phc);
/* Allocate and register a netdevsim netdev for @nsim_dev_port.
 * The netdev is allocated with the bus device's queue count, placed in the
 * nsim_dev's network namespace, linked to its bus device and devlink port,
 * and initialised through the PF or VF path. On success the "pp_hold" and
 * "queue_reset" debugfs files are created under the port's directory.
 * Returns an ERR_PTR() on failure; locking, the success return and the
 * cleanup label bodies are not visible in this listing.
 */
1011 nsim_create(struct nsim_dev *nsim_dev, struct nsim_dev_port *nsim_dev_port)
1013 struct net_device *dev;
1014 struct netdevsim *ns;
1017 dev = alloc_netdev_mq(sizeof(*ns), "eth%d", NET_NAME_UNKNOWN, nsim_setup,
1018 nsim_dev->nsim_bus_dev->num_queues);
1020 return ERR_PTR(-ENOMEM);
1022 dev_net_set(dev, nsim_dev_net(nsim_dev));
1023 ns = netdev_priv(dev);
1025 u64_stats_init(&ns->syncp);
1026 ns->nsim_dev = nsim_dev;
1027 ns->nsim_dev_port = nsim_dev_port;
1028 ns->nsim_bus_dev = nsim_dev->nsim_bus_dev;
1029 SET_NETDEV_DEV(dev, &ns->nsim_bus_dev->dev);
1030 SET_NETDEV_DEVLINK_PORT(dev, &nsim_dev_port->devlink_port);
1031 nsim_ethtool_init(ns);
/* PF ports get the full ops table, other ports the reduced VF one. */
1032 if (nsim_dev_port_is_pf(nsim_dev_port))
1033 err = nsim_init_netdevsim(ns);
1035 err = nsim_init_netdevsim_vf(ns);
1037 goto err_free_netdev;
1039 ns->pp_dfs = debugfs_create_file("pp_hold", 0600, nsim_dev_port->ddir,
1040 ns, &nsim_pp_hold_fops);
1041 ns->qr_dfs = debugfs_create_file("queue_reset", 0200,
1042 nsim_dev_port->ddir, ns,
1049 return ERR_PTR(err);
/* Tear down a netdevsim netdev created by nsim_create(): remove the debugfs
 * files, unregister the debug notifier if one was attached, unlink the peer,
 * unregister the netdev and release the PF-only resources. A page still held
 * in ns->page is given back at the very end. Locking, the NULL checks and the
 * final free are not visible in this listing.
 */
1052 void nsim_destroy(struct netdevsim *ns)
1054 struct net_device *dev = ns->netdev;
1055 struct netdevsim *peer;
1057 debugfs_remove(ns->qr_dfs);
1058 debugfs_remove(ns->pp_dfs);
/* notifier_call is only left non-NULL when the notifier was registered. */
1060 if (ns->nb.notifier_call)
1061 unregister_netdevice_notifier_dev_net(ns->netdev, &ns->nb,
/* Break the link in both directions. */
1065 peer = rtnl_dereference(ns->peer);
1067 RCU_INIT_POINTER(peer->peer, NULL);
1068 RCU_INIT_POINTER(ns->peer, NULL);
1069 unregister_netdevice(dev);
1070 if (nsim_dev_port_is_pf(ns->nsim_dev_port)) {
1071 nsim_macsec_teardown(ns);
1072 nsim_ipsec_teardown(ns);
1073 nsim_bpf_uninit(ns);
1074 nsim_queue_uninit(ns);
1077 if (nsim_dev_port_is_pf(ns->nsim_dev_port))
1078 nsim_exit_netdevsim(ns);
1080 /* Put this intentionally late to exercise the orphaning path */
1082 page_pool_put_full_page(ns->page->pp, ns->page, false);
/* Return true when @dev uses nsim_netdev_ops. Devices set up through
 * nsim_init_netdevsim_vf() use nsim_vf_netdev_ops and therefore do not match.
 */
1089 bool netdev_is_nsim(struct net_device *dev)
1091 return dev->netdev_ops == &nsim_netdev_ops;
/* rtnl_link_ops .validate callback: set an extack message directing the user
 * to the /sys/bus/netdevsim/new_device interface. The return value is not
 * visible in this listing.
 */
1094 static int nsim_validate(struct nlattr *tb[], struct nlattr *data[],
1095 struct netlink_ext_ack *extack)
1097 NL_SET_ERR_MSG_MOD(extack,
1098 "Please use: echo \"[ID] [PORT_COUNT] [NUM_QUEUES]\" > /sys/bus/netdevsim/new_device");
/* rtnl link ops registered at module init; other members besides .validate
 * are not visible in this listing.
 */
1102 static struct rtnl_link_ops nsim_link_ops __read_mostly = {
1104 .validate = nsim_validate,
/* Module init: initialise the nsim device layer, then the bus, then register
 * the rtnl link ops. Error checks, unwinding and the return are not visible
 * in this listing.
 */
1107 static int __init nsim_module_init(void)
1111 err = nsim_dev_init();
1115 err = nsim_bus_init();
1119 err = rtnl_link_register(&nsim_link_ops);
/* Module exit: unregister the rtnl link ops; any further teardown is not
 * visible in this listing.
 */
1132 static void __exit nsim_module_exit(void)
1134 rtnl_link_unregister(&nsim_link_ops);
/* Module entry/exit points and metadata. */
1139 module_init(nsim_module_init);
1140 module_exit(nsim_module_exit);
1141 MODULE_LICENSE("GPL");
1142 MODULE_DESCRIPTION("Simulated networking device for testing");
1143 MODULE_ALIAS_RTNL_LINK(DRV_NAME);