netfilter: nft_flow_offload: use direct xmit if hardware offload is enabled
[linux-block.git] / net / bridge / br_device.c
CommitLineData
2874c5fd 1// SPDX-License-Identifier: GPL-2.0-or-later
1da177e4
LT
2/*
3 * Device handling code
4 * Linux ethernet bridge
5 *
6 * Authors:
7 * Lennert Buytenhek <buytenh@gnu.org>
1da177e4
LT
8 */
9
10#include <linux/kernel.h>
11#include <linux/netdevice.h>
c06ee961 12#include <linux/netpoll.h>
4505a3ef 13#include <linux/etherdevice.h>
edb5e46f 14#include <linux/ethtool.h>
c06ee961 15#include <linux/list.h>
ea2d9b41 16#include <linux/netfilter_bridge.h>
4505a3ef 17
7c0f6ba6 18#include <linux/uaccess.h>
1da177e4
LT
19#include "br_private.h"
20
161f65ba
VY
/* Feature bits shared by the bridge device's features, hw_features and
 * vlan_features masks (see br_dev_setup()).
 */
#define COMMON_FEATURES							\
	(NETIF_F_SG | NETIF_F_FRAGLIST | NETIF_F_HIGHDMA |		\
	 NETIF_F_GSO_MASK | NETIF_F_HW_CSUM)
23
1a4ba64d
PNA
24const struct nf_br_ops __rcu *nf_br_ops __read_mostly;
25EXPORT_SYMBOL_GPL(nf_br_ops);
26
eeaf61d8 27/* net device transmit always called with BH disabled */
6fef4c0c 28netdev_tx_t br_dev_xmit(struct sk_buff *skb, struct net_device *dev)
1da177e4
LT
29{
30 struct net_bridge *br = netdev_priv(dev);
1da177e4 31 struct net_bridge_fdb_entry *dst;
c4fcb78c 32 struct net_bridge_mdb_entry *mdst;
1a4ba64d 33 const struct nf_br_ops *nf_ops;
a580c76d 34 u8 state = BR_STATE_FORWARDING;
31a4562d 35 const unsigned char *dest;
78851988 36 u16 vid = 0;
1da177e4 37
fd65e5a9
NA
38 memset(skb->cb, 0, sizeof(struct br_input_skb_cb));
39
c03307ea 40 rcu_read_lock();
1a4ba64d
PNA
41 nf_ops = rcu_dereference(nf_br_ops);
42 if (nf_ops && nf_ops->br_dev_xmit_hook(skb)) {
c03307ea 43 rcu_read_unlock();
ea2d9b41
BDS
44 return NETDEV_TX_OK;
45 }
ea2d9b41 46
7609ecb2 47 dev_sw_netstats_tx_add(dev, 1, skb->len);
6088a539 48
f1c2eddf 49 br_switchdev_frame_unmark(skb);
14bb4789 50 BR_INPUT_SKB_CB(skb)->brdev = dev;
3c171f49 51 BR_INPUT_SKB_CB(skb)->frag_max_size = 0;
1da177e4 52
459a98ed 53 skb_reset_mac_header(skb);
1da177e4
LT
54 skb_pull(skb, ETH_HLEN);
55
a580c76d 56 if (!br_allowed_ingress(br, br_vlan_group_rcu(br), skb, &vid, &state))
12464bb8
TM
57 goto out;
58
057658cb 59 if (IS_ENABLED(CONFIG_INET) &&
823d81b0
NA
60 (eth_hdr(skb)->h_proto == htons(ETH_P_ARP) ||
61 eth_hdr(skb)->h_proto == htons(ETH_P_RARP)) &&
c69c2cd4 62 br_opt_get(br, BROPT_NEIGH_SUPPRESS_ENABLED)) {
057658cb 63 br_do_proxy_suppress_arp(skb, br, vid, NULL);
ed842fae
RP
64 } else if (IS_ENABLED(CONFIG_IPV6) &&
65 skb->protocol == htons(ETH_P_IPV6) &&
c69c2cd4 66 br_opt_get(br, BROPT_NEIGH_SUPPRESS_ENABLED) &&
ed842fae
RP
67 pskb_may_pull(skb, sizeof(struct ipv6hdr) +
68 sizeof(struct nd_msg)) &&
69 ipv6_hdr(skb)->nexthdr == IPPROTO_ICMPV6) {
70 struct nd_msg *msg, _msg;
71
72 msg = br_is_nd_neigh_msg(skb, &_msg);
73 if (msg)
74 br_do_suppress_nd(skb, br, vid, NULL, msg);
057658cb
RP
75 }
76
31a4562d 77 dest = eth_hdr(skb)->h_dest;
37b090e6 78 if (is_broadcast_ether_addr(dest)) {
8addd5e7 79 br_flood(br, skb, BR_PKT_BROADCAST, false, true);
37b090e6 80 } else if (is_multicast_ether_addr(dest)) {
91d2c34a 81 if (unlikely(netpoll_tx_running(dev))) {
8addd5e7 82 br_flood(br, skb, BR_PKT_MULTICAST, false, true);
91d2c34a
HX
83 goto out;
84 }
06499098 85 if (br_multicast_rcv(br, NULL, skb, vid)) {
6d1d1d39 86 kfree_skb(skb);
c4fcb78c 87 goto out;
6d1d1d39 88 }
c4fcb78c 89
fbca58a2 90 mdst = br_mdb_get(br, skb, vid);
b00589af 91 if ((mdst || BR_INPUT_SKB_CB_MROUTERS_ONLY(skb)) &&
955062b0 92 br_multicast_querier_exists(br, eth_hdr(skb), mdst))
37b090e6 93 br_multicast_flood(mdst, skb, false, true);
c4fcb78c 94 else
8addd5e7 95 br_flood(br, skb, BR_PKT_MULTICAST, false, true);
bfd0aeac 96 } else if ((dst = br_fdb_find_rcu(br, dest, vid)) != NULL) {
37b090e6
NA
97 br_forward(dst->dst, skb, false, true);
98 } else {
8addd5e7 99 br_flood(br, skb, BR_PKT_UNICAST, false, true);
37b090e6 100 }
c4fcb78c 101out:
eeaf61d8 102 rcu_read_unlock();
6ed10654 103 return NETDEV_TX_OK;
1da177e4
LT
104}
105
845e0ebb
CW
106static struct lock_class_key bridge_netdev_addr_lock_key;
107
108static void br_set_lockdep_class(struct net_device *dev)
109{
110 lockdep_set_class(&dev->addr_list_lock, &bridge_netdev_addr_lock_key);
111}
112
bb900b27 113static int br_dev_init(struct net_device *dev)
114{
115 struct net_bridge *br = netdev_priv(dev);
5be5a2df 116 int err;
bb900b27 117
7609ecb2
HK
118 dev->tstats = netdev_alloc_pcpu_stats(struct pcpu_sw_netstats);
119 if (!dev->tstats)
bb900b27 120 return -ENOMEM;
121
eb793583
NA
122 err = br_fdb_hash_init(br);
123 if (err) {
7609ecb2 124 free_percpu(dev->tstats);
eb793583
NA
125 return err;
126 }
127
19e3a9c9
NA
128 err = br_mdb_hash_init(br);
129 if (err) {
7609ecb2 130 free_percpu(dev->tstats);
19e3a9c9
NA
131 br_fdb_hash_fini(br);
132 return err;
133 }
134
5be5a2df 135 err = br_vlan_init(br);
1080ab95 136 if (err) {
7609ecb2 137 free_percpu(dev->tstats);
19e3a9c9 138 br_mdb_hash_fini(br);
eb793583 139 br_fdb_hash_fini(br);
1080ab95
NA
140 return err;
141 }
142
143 err = br_multicast_init_stats(br);
144 if (err) {
7609ecb2 145 free_percpu(dev->tstats);
1080ab95 146 br_vlan_flush(br);
19e3a9c9 147 br_mdb_hash_fini(br);
eb793583 148 br_fdb_hash_fini(br);
1080ab95 149 }
5be5a2df 150
845e0ebb 151 br_set_lockdep_class(dev);
5be5a2df 152 return err;
bb900b27 153}
154
b6fe0440
IS
155static void br_dev_uninit(struct net_device *dev)
156{
157 struct net_bridge *br = netdev_priv(dev);
158
b1b9d366 159 br_multicast_dev_del(br);
b6fe0440
IS
160 br_multicast_uninit_stats(br);
161 br_vlan_flush(br);
19e3a9c9 162 br_mdb_hash_fini(br);
eb793583 163 br_fdb_hash_fini(br);
7609ecb2 164 free_percpu(dev->tstats);
b6fe0440
IS
165}
166
1da177e4
LT
167static int br_dev_open(struct net_device *dev)
168{
81d35307 169 struct net_bridge *br = netdev_priv(dev);
1da177e4 170
c4d27ef9 171 netdev_update_features(dev);
81d35307
SH
172 netif_start_queue(dev);
173 br_stp_enable_bridge(br);
3fe2d7c7 174 br_multicast_open(br);
1da177e4 175
851d0a73
JH
176 if (br_opt_get(br, BROPT_MULTICAST_ENABLED))
177 br_multicast_join_snoopers(br);
178
1da177e4
LT
179 return 0;
180}
181
/* .ndo_set_rx_mode handler: intentionally does nothing. */
static void br_dev_set_multicast_list(struct net_device *dev)
{
	/* nothing to do */
}
185
2796d0c6
VY
186static void br_dev_change_rx_flags(struct net_device *dev, int change)
187{
188 if (change & IFF_PROMISC)
189 br_manage_promisc(netdev_priv(dev));
190}
191
1da177e4
LT
192static int br_dev_stop(struct net_device *dev)
193{
3fe2d7c7
HX
194 struct net_bridge *br = netdev_priv(dev);
195
196 br_stp_disable_bridge(br);
197 br_multicast_stop(br);
1da177e4 198
851d0a73
JH
199 if (br_opt_get(br, BROPT_MULTICAST_ENABLED))
200 br_multicast_leave_snoopers(br);
201
1da177e4
LT
202 netif_stop_queue(dev);
203
204 return 0;
205}
206
207static int br_change_mtu(struct net_device *dev, int new_mtu)
208{
4adf0af6 209 struct net_bridge *br = netdev_priv(dev);
f40aa233 210
1da177e4 211 dev->mtu = new_mtu;
4adf0af6 212
804b854d 213 /* this flag will be cleared if the MTU was automatically adjusted */
3341d917 214 br_opt_toggle(br, BROPT_MTU_SET_BY_USER, true);
34666d46 215#if IS_ENABLED(CONFIG_BRIDGE_NETFILTER)
4adf0af6 216 /* remember the MTU in the rtable for PMTU */
defb3519 217 dst_metric_set(&br->fake_rtable.dst, RTAX_MTU, new_mtu);
4adf0af6
SW
218#endif
219
1da177e4
LT
220 return 0;
221}
222
ffe1d49c 223/* Allow setting mac address to any valid ethernet address. */
4505a3ef
SH
224static int br_set_mac_address(struct net_device *dev, void *p)
225{
226 struct net_bridge *br = netdev_priv(dev);
227 struct sockaddr *addr = p;
ffe1d49c
SH
228
229 if (!is_valid_ether_addr(addr->sa_data))
7ca1e11a 230 return -EADDRNOTAVAIL;
4505a3ef 231
c4b4c421
NA
232 /* dev_set_mac_addr() can be called by a master device on bridge's
233 * NETDEV_UNREGISTER, but since it's being destroyed do nothing
234 */
235 if (dev->reg_state != NETREG_REGISTERED)
236 return -EBUSY;
237
4505a3ef 238 spin_lock_bh(&br->lock);
9a7b6ef9 239 if (!ether_addr_equal(dev->dev_addr, addr->sa_data)) {
a3ebb7ef 240 /* Mac address will be changed in br_stp_change_bridge_id(). */
43598813 241 br_stp_change_bridge_id(br, addr->sa_data);
242 }
4505a3ef
SH
243 spin_unlock_bh(&br->lock);
244
ffe1d49c 245 return 0;
4505a3ef
SH
246}
247
edb5e46f
SH
248static void br_getinfo(struct net_device *dev, struct ethtool_drvinfo *info)
249{
7826d43f
JP
250 strlcpy(info->driver, "bridge", sizeof(info->driver));
251 strlcpy(info->version, BR_VERSION, sizeof(info->version));
252 strlcpy(info->fw_version, "N/A", sizeof(info->fw_version));
253 strlcpy(info->bus_info, "N/A", sizeof(info->bus_info));
edb5e46f
SH
254}
255
542575fe
MS
256static int br_get_link_ksettings(struct net_device *dev,
257 struct ethtool_link_ksettings *cmd)
258{
259 struct net_bridge *br = netdev_priv(dev);
260 struct net_bridge_port *p;
261
262 cmd->base.duplex = DUPLEX_UNKNOWN;
263 cmd->base.port = PORT_OTHER;
264 cmd->base.speed = SPEED_UNKNOWN;
265
266 list_for_each_entry(p, &br->port_list, list) {
267 struct ethtool_link_ksettings ecmd;
268 struct net_device *pdev = p->dev;
269
270 if (!netif_running(pdev) || !netif_oper_up(pdev))
271 continue;
272
273 if (__ethtool_get_link_ksettings(pdev, &ecmd))
274 continue;
275
276 if (ecmd.base.speed == (__u32)SPEED_UNKNOWN)
277 continue;
278
279 if (cmd->base.speed == (__u32)SPEED_UNKNOWN ||
280 cmd->base.speed < ecmd.base.speed)
281 cmd->base.speed = ecmd.base.speed;
282 }
283
284 return 0;
285}
286
c8f44aff
MM
287static netdev_features_t br_fix_features(struct net_device *dev,
288 netdev_features_t features)
edb5e46f
SH
289{
290 struct net_bridge *br = netdev_priv(dev);
291
c4d27ef9 292 return br_features_recompute(br, features);
361ff8a6
JG
293}
294
c06ee961 295#ifdef CONFIG_NET_POLL_CONTROLLER
/* .ndo_poll_controller handler: intentionally does nothing. */
static void br_poll_controller(struct net_device *br_dev)
{
	/* nothing to do */
}
299
91d2c34a 300static void br_netpoll_cleanup(struct net_device *dev)
c06ee961 301{
91d2c34a 302 struct net_bridge *br = netdev_priv(dev);
4e3828c4 303 struct net_bridge_port *p;
c06ee961 304
4e3828c4 305 list_for_each_entry(p, &br->port_list, list)
91d2c34a 306 br_netpoll_disable(p);
c06ee961
WC
307}
308
a8779ec1 309static int __br_netpoll_enable(struct net_bridge_port *p)
dbe17307
CW
310{
311 struct netpoll *np;
312 int err;
313
a8779ec1 314 np = kzalloc(sizeof(*p->np), GFP_KERNEL);
dbe17307
CW
315 if (!np)
316 return -ENOMEM;
317
a8779ec1 318 err = __netpoll_setup(np, p->dev);
dbe17307
CW
319 if (err) {
320 kfree(np);
321 return err;
322 }
323
324 p->np = np;
325 return err;
326}
327
a8779ec1 328int br_netpoll_enable(struct net_bridge_port *p)
dbe17307
CW
329{
330 if (!p->br->dev->npinfo)
331 return 0;
332
a8779ec1 333 return __br_netpoll_enable(p);
dbe17307
CW
334}
335
a8779ec1 336static int br_netpoll_setup(struct net_device *dev, struct netpoll_info *ni)
c06ee961 337{
cfb478da 338 struct net_bridge *br = netdev_priv(dev);
4e3828c4 339 struct net_bridge_port *p;
91d2c34a 340 int err = 0;
c06ee961 341
4e3828c4 342 list_for_each_entry(p, &br->port_list, list) {
91d2c34a
HX
343 if (!p->dev)
344 continue;
a8779ec1 345 err = __br_netpoll_enable(p);
91d2c34a
HX
346 if (err)
347 goto fail;
c06ee961 348 }
91d2c34a
HX
349
350out:
351 return err;
352
353fail:
354 br_netpoll_cleanup(dev);
355 goto out;
c06ee961
WC
356}
357
91d2c34a 358void br_netpoll_disable(struct net_bridge_port *p)
c06ee961 359{
91d2c34a
HX
360 struct netpoll *np = p->np;
361
362 if (!np)
363 return;
364
365 p->np = NULL;
366
c9fbd71f 367 __netpoll_free(np);
c06ee961
WC
368}
369
370#endif
371
33eaf2a6
DA
/* .ndo_add_slave handler: adds @slave_dev as a port of the bridge @dev
 * and returns the result of br_add_if().
 */
static int br_add_slave(struct net_device *dev, struct net_device *slave_dev,
			struct netlink_ext_ack *extack)
{
	struct net_bridge *bridge = netdev_priv(dev);
	int ret;

	ret = br_add_if(bridge, slave_dev, extack);

	return ret;
}
380
/* .ndo_del_slave handler: removes @slave_dev from the bridge @dev and
 * returns the result of br_del_if().
 */
static int br_del_slave(struct net_device *dev, struct net_device *slave_dev)
{
	struct net_bridge *bridge = netdev_priv(dev);
	int ret;

	ret = br_del_if(bridge, slave_dev);

	return ret;
}
387
ec9d16ba
PNA
388static int br_fill_forward_path(struct net_device_path_ctx *ctx,
389 struct net_device_path *path)
390{
391 struct net_bridge_fdb_entry *f;
392 struct net_bridge_port *dst;
393 struct net_bridge *br;
394
395 if (netif_is_bridge_port(ctx->dev))
396 return -1;
397
398 br = netdev_priv(ctx->dev);
bcf2766b
FF
399
400 br_vlan_fill_forward_path_pvid(br, ctx, path);
401
402 f = br_fdb_find_rcu(br, ctx->daddr, path->bridge.vlan_id);
ec9d16ba
PNA
403 if (!f || !f->dst)
404 return -1;
405
406 dst = READ_ONCE(f->dst);
407 if (!dst)
408 return -1;
409
bcf2766b
FF
410 if (br_vlan_fill_forward_path_mode(br, dst, path))
411 return -1;
412
ec9d16ba
PNA
413 path->type = DEV_PATH_BRIDGE;
414 path->dev = dst->br->dev;
415 ctx->dev = dst->dev;
416
bcf2766b
FF
417 switch (path->bridge.vlan_mode) {
418 case DEV_PATH_BR_VLAN_TAG:
419 if (ctx->num_vlans >= ARRAY_SIZE(ctx->vlan))
420 return -ENOSPC;
421 ctx->vlan[ctx->num_vlans].id = path->bridge.vlan_id;
422 ctx->vlan[ctx->num_vlans].proto = path->bridge.vlan_proto;
423 ctx->num_vlans++;
424 break;
425 case DEV_PATH_BR_VLAN_UNTAG:
426 ctx->num_vlans--;
427 break;
428 case DEV_PATH_BR_VLAN_KEEP:
429 break;
430 }
431
ec9d16ba
PNA
432 return 0;
433}
434
a2dbb882 435static const struct ethtool_ops br_ethtool_ops = {
542575fe
MS
436 .get_drvinfo = br_getinfo,
437 .get_link = ethtool_op_get_link,
438 .get_link_ksettings = br_get_link_ksettings,
edb5e46f
SH
439};
440
a2dbb882
SH
441static const struct net_device_ops br_netdev_ops = {
442 .ndo_open = br_dev_open,
443 .ndo_stop = br_dev_stop,
bb900b27 444 .ndo_init = br_dev_init,
b6fe0440 445 .ndo_uninit = br_dev_uninit,
00829823 446 .ndo_start_xmit = br_dev_xmit,
7609ecb2 447 .ndo_get_stats64 = dev_get_tstats64,
00829823 448 .ndo_set_mac_address = br_set_mac_address,
afc4b13d 449 .ndo_set_rx_mode = br_dev_set_multicast_list,
2796d0c6 450 .ndo_change_rx_flags = br_dev_change_rx_flags,
00829823
SH
451 .ndo_change_mtu = br_change_mtu,
452 .ndo_do_ioctl = br_dev_ioctl,
c06ee961 453#ifdef CONFIG_NET_POLL_CONTROLLER
91d2c34a 454 .ndo_netpoll_setup = br_netpoll_setup,
c06ee961
WC
455 .ndo_netpoll_cleanup = br_netpoll_cleanup,
456 .ndo_poll_controller = br_poll_controller,
457#endif
afc6151a
JP
458 .ndo_add_slave = br_add_slave,
459 .ndo_del_slave = br_del_slave,
c4d27ef9 460 .ndo_fix_features = br_fix_features,
77162022
JF
461 .ndo_fdb_add = br_fdb_add,
462 .ndo_fdb_del = br_fdb_delete,
463 .ndo_fdb_dump = br_fdb_dump,
47674562 464 .ndo_fdb_get = br_fdb_get,
e5a55a89
JF
465 .ndo_bridge_getlink = br_getlink,
466 .ndo_bridge_setlink = br_setlink,
407af329 467 .ndo_bridge_dellink = br_dellink,
66780530 468 .ndo_features_check = passthru_features_check,
ec9d16ba 469 .ndo_fill_forward_path = br_fill_forward_path,
a2dbb882
SH
470};
471
bb900b27 472static struct device_type br_type = {
473 .name = "bridge",
474};
475
1da177e4
LT
476void br_dev_setup(struct net_device *dev)
477{
bb900b27 478 struct net_bridge *br = netdev_priv(dev);
479
7ce5d222 480 eth_hw_addr_random(dev);
1da177e4
LT
481 ether_setup(dev);
482
a2dbb882 483 dev->netdev_ops = &br_netdev_ops;
cf124db5 484 dev->needs_free_netdev = true;
7ad24ea4 485 dev->ethtool_ops = &br_ethtool_ops;
bb900b27 486 SET_NETDEV_DEVTYPE(dev, &br_type);
ccecb2a4 487 dev->priv_flags = IFF_EBRIDGE | IFF_NO_QUEUE;
edb5e46f 488
161f65ba 489 dev->features = COMMON_FEATURES | NETIF_F_LLTX | NETIF_F_NETNS_LOCAL |
1c5abb6c
TM
490 NETIF_F_HW_VLAN_CTAG_TX | NETIF_F_HW_VLAN_STAG_TX;
491 dev->hw_features = COMMON_FEATURES | NETIF_F_HW_VLAN_CTAG_TX |
492 NETIF_F_HW_VLAN_STAG_TX;
161f65ba 493 dev->vlan_features = COMMON_FEATURES;
bb900b27 494
495 br->dev = dev;
496 spin_lock_init(&br->lock);
497 INIT_LIST_HEAD(&br->port_list);
eb793583 498 INIT_HLIST_HEAD(&br->fdb_list);
90c628dd 499 INIT_HLIST_HEAD(&br->frame_type_list);
65369933 500#if IS_ENABLED(CONFIG_BRIDGE_MRP)
0169b820 501 INIT_HLIST_HEAD(&br->mrp_list);
f323aa54
HB
502#endif
503#if IS_ENABLED(CONFIG_BRIDGE_CFM)
504 INIT_HLIST_HEAD(&br->mep_list);
65369933 505#endif
bb900b27 506 spin_lock_init(&br->hash_lock);
507
508 br->bridge_id.prio[0] = 0x80;
509 br->bridge_id.prio[1] = 0x00;
510
05428729 511 ether_addr_copy(br->group_addr, eth_stp_addr);
bb900b27 512
bb900b27 513 br->stp_enabled = BR_NO_STP;
515853cc 514 br->group_fwd_mask = BR_GROUPFWD_DEFAULT;
f2808d22 515 br->group_fwd_mask_required = BR_GROUPFWD_DEFAULT;
515853cc 516
bb900b27 517 br->designated_root = br->bridge_id;
518 br->bridge_max_age = br->max_age = 20 * HZ;
519 br->bridge_hello_time = br->hello_time = 2 * HZ;
520 br->bridge_forward_delay = br->forward_delay = 15 * HZ;
34d8acd8 521 br->bridge_ageing_time = br->ageing_time = BR_DEFAULT_AGEING_TIME;
91572088 522 dev->max_mtu = ETH_MAX_MTU;
bb900b27 523
524 br_netfilter_rtable_init(br);
525 br_stp_timer_init(br);
526 br_multicast_init(br);
f7cdee8a 527 INIT_DELAYED_WORK(&br->gc_work, br_fdb_cleanup);
1da177e4 528}