Merge branch 'nf' of git://1984.lsi.us.es/net
[linux-block.git] / net / bridge / br_if.c
CommitLineData
1da177e4
LT
1/*
2 * Userspace interface
3 * Linux ethernet bridge
4 *
5 * Authors:
6 * Lennert Buytenhek <buytenh@gnu.org>
7 *
1da177e4
LT
8 * This program is free software; you can redistribute it and/or
9 * modify it under the terms of the GNU General Public License
10 * as published by the Free Software Foundation; either version
11 * 2 of the License, or (at your option) any later version.
12 */
13
14#include <linux/kernel.h>
15#include <linux/netdevice.h>
c06ee961 16#include <linux/netpoll.h>
1da177e4
LT
17#include <linux/ethtool.h>
18#include <linux/if_arp.h>
19#include <linux/module.h>
20#include <linux/init.h>
21#include <linux/rtnetlink.h>
46f25dff 22#include <linux/if_ether.h>
5a0e3ad6 23#include <linux/slab.h>
1da177e4
LT
24#include <net/sock.h>
25
26#include "br_private.h"
27
28/*
29 * Determine initial path cost based on speed.
30 * using recommendations from 802.1d standard
31 *
61a44b9c 32 * Since driver might sleep need to not be holding any locks.
1da177e4 33 */
4433f420 34static int port_cost(struct net_device *dev)
1da177e4 35{
b4a488d1
SH
36 if (dev->ethtool_ops && dev->ethtool_ops->get_settings) {
37 struct ethtool_cmd ecmd = { .cmd = ETHTOOL_GSET, };
38
25db0338
DD
39 if (!dev_ethtool_get_settings(dev, &ecmd)) {
40 switch (ethtool_cmd_speed(&ecmd)) {
61a44b9c
MW
41 case SPEED_10000:
42 return 2;
b4a488d1
SH
43 case SPEED_1000:
44 return 4;
45 case SPEED_100:
46 return 19;
61a44b9c
MW
47 case SPEED_10:
48 return 100;
49 }
1da177e4
LT
50 }
51 }
52
53 /* Old silly heuristics based on name */
54 if (!strncmp(dev->name, "lec", 3))
55 return 7;
56
57 if (!strncmp(dev->name, "plip", 4))
58 return 2500;
59
60 return 100; /* assume old 10Mbps */
61}
62
4433f420 63
944c794d 64/* Check for port carrier transistions. */
269def7c 65void br_port_carrier_check(struct net_bridge_port *p)
4433f420 66{
269def7c
SH
67 struct net_device *dev = p->dev;
68 struct net_bridge *br = p->br;
6e86b890 69
aa7c6e5f 70 if (netif_running(dev) && netif_carrier_ok(dev))
6e86b890
SH
71 p->path_cost = port_cost(dev);
72
aa7c6e5f 73 if (!netif_running(br->dev))
74 return;
75
76 spin_lock_bh(&br->lock);
77 if (netif_running(dev) && netif_carrier_ok(dev)) {
78 if (p->state == BR_STATE_DISABLED)
79 br_stp_enable_port(p);
80 } else {
81 if (p->state != BR_STATE_DISABLED)
82 br_stp_disable_port(p);
4433f420 83 }
aa7c6e5f 84 spin_unlock_bh(&br->lock);
4433f420
SH
85}
86
bab1deea
SH
87static void release_nbp(struct kobject *kobj)
88{
89 struct net_bridge_port *p
90 = container_of(kobj, struct net_bridge_port, kobj);
91 kfree(p);
92}
93
94static struct kobj_type brport_ktype = {
95#ifdef CONFIG_SYSFS
96 .sysfs_ops = &brport_sysfs_ops,
97#endif
98 .release = release_nbp,
99};
100
1da177e4
LT
101static void destroy_nbp(struct net_bridge_port *p)
102{
103 struct net_device *dev = p->dev;
104
1da177e4
LT
105 p->br = NULL;
106 p->dev = NULL;
107 dev_put(dev);
108
bab1deea 109 kobject_put(&p->kobj);
1da177e4
LT
110}
111
112static void destroy_nbp_rcu(struct rcu_head *head)
113{
114 struct net_bridge_port *p =
115 container_of(head, struct net_bridge_port, rcu);
116 destroy_nbp(p);
117}
118
3f4cfc2d
SH
119/* Delete port(interface) from bridge is done in two steps.
120 * via RCU. First step, marks device as down. That deletes
121 * all the timers and stops new packets from flowing through.
122 *
123 * Final cleanup doesn't occur until after all CPU's finished
124 * processing packets.
125 *
126 * Protected from multiple admin operations by RTNL mutex
127 */
1da177e4
LT
128static void del_nbp(struct net_bridge_port *p)
129{
130 struct net_bridge *br = p->br;
131 struct net_device *dev = p->dev;
132
b3bcb72e 133 sysfs_remove_link(br->ifobj, p->dev->name);
bab1deea 134
1da177e4
LT
135 dev_set_promiscuity(dev, -1);
136
137 spin_lock_bh(&br->lock);
138 br_stp_disable_port(p);
139 spin_unlock_bh(&br->lock);
140
b86c4503
SH
141 br_ifinfo_notify(RTM_DELLINK, p);
142
1a620698 143 br_fdb_delete_by_port(br, p, 1);
1da177e4
LT
144
145 list_del_rcu(&p->list);
146
f350a0a8
JP
147 dev->priv_flags &= ~IFF_BRIDGE_PORT;
148
ab95bfe0 149 netdev_rx_handler_unregister(dev);
6df427fe 150 synchronize_net();
b3f1be4b 151
afc6151a
JP
152 netdev_set_master(dev, NULL);
153
3fe2d7c7
HX
154 br_multicast_del_port(p);
155
125a12cc 156 kobject_uevent(&p->kobj, KOBJ_REMOVE);
bab1deea
SH
157 kobject_del(&p->kobj);
158
91d2c34a
HX
159 br_netpoll_disable(p);
160
1da177e4
LT
161 call_rcu(&p->rcu, destroy_nbp_rcu);
162}
163
164/* called with RTNL */
8c56ba05 165static void del_br(struct net_bridge *br, struct list_head *head)
1da177e4
LT
166{
167 struct net_bridge_port *p, *n;
168
169 list_for_each_entry_safe(p, n, &br->port_list, list) {
1da177e4
LT
170 del_nbp(p);
171 }
172
173 del_timer_sync(&br->gc_timer);
174
175 br_sysfs_delbr(br->dev);
8c56ba05 176 unregister_netdevice_queue(br->dev, head);
1da177e4
LT
177}
178
1da177e4
LT
179/* find an available port number */
180static int find_portno(struct net_bridge *br)
181{
182 int index;
183 struct net_bridge_port *p;
184 unsigned long *inuse;
185
3b781fa1 186 inuse = kcalloc(BITS_TO_LONGS(BR_MAX_PORTS), sizeof(unsigned long),
1da177e4
LT
187 GFP_KERNEL);
188 if (!inuse)
189 return -ENOMEM;
190
1da177e4
LT
191 set_bit(0, inuse); /* zero is reserved */
192 list_for_each_entry(p, &br->port_list, list) {
193 set_bit(p->port_no, inuse);
194 }
195 index = find_first_zero_bit(inuse, BR_MAX_PORTS);
196 kfree(inuse);
197
198 return (index >= BR_MAX_PORTS) ? -EXFULL : index;
199}
200
4433f420 201/* called with RTNL but without bridge lock */
9d6f229f 202static struct net_bridge_port *new_nbp(struct net_bridge *br,
4433f420 203 struct net_device *dev)
1da177e4
LT
204{
205 int index;
206 struct net_bridge_port *p;
9d6f229f 207
1da177e4
LT
208 index = find_portno(br);
209 if (index < 0)
210 return ERR_PTR(index);
211
cee48541 212 p = kzalloc(sizeof(*p), GFP_KERNEL);
1da177e4
LT
213 if (p == NULL)
214 return ERR_PTR(-ENOMEM);
215
1da177e4
LT
216 p->br = br;
217 dev_hold(dev);
218 p->dev = dev;
4433f420 219 p->path_cost = port_cost(dev);
9d6f229f 220 p->priority = 0x8000 >> BR_PORT_BITS;
1da177e4 221 p->port_no = index;
3982d3d2 222 p->flags = 0;
1da177e4
LT
223 br_init_port(p);
224 p->state = BR_STATE_DISABLED;
d32439c0 225 br_stp_port_timer_init(p);
3fe2d7c7 226 br_multicast_add_port(p);
1da177e4
LT
227
228 return p;
229}
230
4aa678ba 231int br_add_bridge(struct net *net, const char *name)
1da177e4
LT
232{
233 struct net_device *dev;
11f3a6bd 234 int res;
1da177e4 235
bb900b27 236 dev = alloc_netdev(sizeof(struct net_bridge), name,
237 br_dev_setup);
238
9d6f229f 239 if (!dev)
1da177e4
LT
240 return -ENOMEM;
241
bb900b27 242 dev_net_set(dev, net);
e340a90e 243
11f3a6bd
ED
244 res = register_netdev(dev);
245 if (res)
246 free_netdev(dev);
247 return res;
1da177e4
LT
248}
249
4aa678ba 250int br_del_bridge(struct net *net, const char *name)
1da177e4
LT
251{
252 struct net_device *dev;
253 int ret = 0;
254
255 rtnl_lock();
4aa678ba 256 dev = __dev_get_by_name(net, name);
9d6f229f 257 if (dev == NULL)
1da177e4
LT
258 ret = -ENXIO; /* Could not find device */
259
260 else if (!(dev->priv_flags & IFF_EBRIDGE)) {
261 /* Attempt to delete non bridge device! */
262 ret = -EPERM;
263 }
264
265 else if (dev->flags & IFF_UP) {
266 /* Not shutdown yet. */
267 ret = -EBUSY;
9d6f229f 268 }
1da177e4 269
9d6f229f 270 else
8c56ba05 271 del_br(netdev_priv(dev), NULL);
1da177e4
LT
272
273 rtnl_unlock();
274 return ret;
275}
276
46f25dff 277/* MTU of the bridge pseudo-device: ETH_DATA_LEN or the minimum of the ports */
1da177e4
LT
278int br_min_mtu(const struct net_bridge *br)
279{
280 const struct net_bridge_port *p;
281 int mtu = 0;
282
283 ASSERT_RTNL();
284
285 if (list_empty(&br->port_list))
46f25dff 286 mtu = ETH_DATA_LEN;
1da177e4
LT
287 else {
288 list_for_each_entry(p, &br->port_list, list) {
289 if (!mtu || p->dev->mtu < mtu)
290 mtu = p->dev->mtu;
291 }
292 }
293 return mtu;
294}
295
81d35307
SH
296/*
297 * Recomputes features using slave's features
298 */
c4d27ef9 299u32 br_features_recompute(struct net_bridge *br, u32 features)
81d35307
SH
300{
301 struct net_bridge_port *p;
c4d27ef9 302 u32 mask;
81d35307 303
b63365a2 304 if (list_empty(&br->port_list))
c4d27ef9 305 return features;
b63365a2 306
c4d27ef9 307 mask = features;
b63365a2 308 features &= ~NETIF_F_ONE_FOR_ALL;
81d35307
SH
309
310 list_for_each_entry(p, &br->port_list, list) {
b63365a2
HX
311 features = netdev_increment_features(features,
312 p->dev->features, mask);
81d35307
SH
313 }
314
c4d27ef9 315 return features;
81d35307
SH
316}
317
1da177e4
LT
318/* called with RTNL */
319int br_add_if(struct net_bridge *br, struct net_device *dev)
320{
321 struct net_bridge_port *p;
322 int err = 0;
edf947f1 323 bool changed_addr;
1da177e4 324
1056bd51
SH
325 /* Don't allow bridging non-ethernet like devices */
326 if ((dev->flags & IFF_LOOPBACK) ||
327 dev->type != ARPHRD_ETHER || dev->addr_len != ETH_ALEN)
1da177e4
LT
328 return -EINVAL;
329
1056bd51 330 /* No bridging of bridges */
00829823 331 if (dev->netdev_ops->ndo_start_xmit == br_dev_xmit)
1da177e4
LT
332 return -ELOOP;
333
1056bd51 334 /* Device is already being bridged */
f350a0a8 335 if (br_port_exists(dev))
1da177e4
LT
336 return -EBUSY;
337
ad4bb6f8
JB
338 /* No bridging devices that dislike that (e.g. wireless) */
339 if (dev->priv_flags & IFF_DONT_BRIDGE)
340 return -EOPNOTSUPP;
341
bab1deea
SH
342 p = new_nbp(br, dev);
343 if (IS_ERR(p))
1da177e4
LT
344 return PTR_ERR(p);
345
bb8ed630
AW
346 call_netdevice_notifiers(NETDEV_JOIN, dev);
347
bc3f9076
WC
348 err = dev_set_promiscuity(dev, 1);
349 if (err)
350 goto put_back;
351
e32cc736
GKH
352 err = kobject_init_and_add(&p->kobj, &brport_ktype, &(dev->dev.kobj),
353 SYSFS_BRIDGE_PORT_ATTR);
bab1deea
SH
354 if (err)
355 goto err0;
1da177e4 356
9d6f229f 357 err = br_fdb_insert(br, p, dev->dev_addr);
bab1deea
SH
358 if (err)
359 goto err1;
1da177e4 360
bab1deea
SH
361 err = br_sysfs_addif(p);
362 if (err)
363 goto err2;
1da177e4 364
91d2c34a
HX
365 if (br_netpoll_info(br) && ((err = br_netpoll_enable(p))))
366 goto err3;
367
afc6151a 368 err = netdev_set_master(dev, br->dev);
ab95bfe0 369 if (err)
f350a0a8
JP
370 goto err3;
371
afc6151a
JP
372 err = netdev_rx_handler_register(dev, br_handle_frame, p);
373 if (err)
374 goto err4;
375
f350a0a8 376 dev->priv_flags |= IFF_BRIDGE_PORT;
ab95bfe0 377
0187bdfb 378 dev_disable_lro(dev);
bab1deea
SH
379
380 list_add_rcu(&p->list, &br->port_list);
381
c4d27ef9
MM
382 netdev_update_features(br->dev);
383
bab1deea 384 spin_lock_bh(&br->lock);
edf947f1 385 changed_addr = br_stp_recalculate_bridge_id(br);
de79059e
AS
386
387 if ((dev->flags & IFF_UP) && netif_carrier_ok(dev) &&
388 (br->dev->flags & IFF_UP))
389 br_stp_enable_port(p);
bab1deea
SH
390 spin_unlock_bh(&br->lock);
391
b86c4503
SH
392 br_ifinfo_notify(RTM_NEWLINK, p);
393
edf947f1 394 if (changed_addr)
56139fc5 395 call_netdevice_notifiers(NETDEV_CHANGEADDR, br->dev);
edf947f1 396
bab1deea 397 dev_set_mtu(br->dev, br_min_mtu(br));
269def7c 398
bab1deea 399 kobject_uevent(&p->kobj, KOBJ_ADD);
1da177e4 400
bab1deea 401 return 0;
afc6151a
JP
402
403err4:
404 netdev_set_master(dev, NULL);
91d2c34a
HX
405err3:
406 sysfs_remove_link(br->ifobj, p->dev->name);
bab1deea 407err2:
1a620698 408 br_fdb_delete_by_port(br, p, 1);
bab1deea 409err1:
c587aea9 410 kobject_put(&p->kobj);
30df94f8 411 p = NULL; /* kobject_put frees */
bab1deea 412err0:
bc3f9076 413 dev_set_promiscuity(dev, -1);
43af8532
VL
414put_back:
415 dev_put(dev);
bc3f9076 416 kfree(p);
1da177e4
LT
417 return err;
418}
419
420/* called with RTNL */
421int br_del_if(struct net_bridge *br, struct net_device *dev)
422{
f350a0a8 423 struct net_bridge_port *p;
9be6dd65 424 bool changed_addr;
f350a0a8 425
ec1e5610 426 p = br_port_get_rtnl(dev);
b5ed54e9 427 if (!p || p->br != br)
1da177e4
LT
428 return -EINVAL;
429
1da177e4
LT
430 del_nbp(p);
431
432 spin_lock_bh(&br->lock);
9be6dd65 433 changed_addr = br_stp_recalculate_bridge_id(br);
1da177e4
LT
434 spin_unlock_bh(&br->lock);
435
9be6dd65
AW
436 if (changed_addr)
437 call_netdevice_notifiers(NETDEV_CHANGEADDR, br->dev);
438
c4d27ef9
MM
439 netdev_update_features(br->dev);
440
1da177e4
LT
441 return 0;
442}
443
2c8c1e72 444void __net_exit br_net_exit(struct net *net)
1da177e4 445{
ab1b2046 446 struct net_device *dev;
8c56ba05 447 LIST_HEAD(list);
1da177e4
LT
448
449 rtnl_lock();
8c56ba05
ED
450 for_each_netdev(net, dev)
451 if (dev->priv_flags & IFF_EBRIDGE)
452 del_br(netdev_priv(dev), &list);
453
454 unregister_netdevice_many(&list);
1da177e4
LT
455 rtnl_unlock();
456
457}