Merge tag 'for-linus' of git://git.kernel.org/pub/scm/linux/kernel/git/dledford/rdma
[linux-2.6-block.git] / net / bridge / br_mdb.c
CommitLineData
ee07c6e7
CW
1#include <linux/err.h>
2#include <linux/igmp.h>
3#include <linux/kernel.h>
4#include <linux/netdevice.h>
5#include <linux/rculist.h>
6#include <linux/skbuff.h>
cfd56754 7#include <linux/if_ether.h>
ee07c6e7
CW
8#include <net/ip.h>
9#include <net/netlink.h>
10#if IS_ENABLED(CONFIG_IPV6)
11#include <net/ipv6.h>
3c3769e6 12#include <net/addrconf.h>
ee07c6e7
CW
13#endif
14
15#include "br_private.h"
16
17static int br_rports_fill_info(struct sk_buff *skb, struct netlink_callback *cb,
18 struct net_device *dev)
19{
20 struct net_bridge *br = netdev_priv(dev);
21 struct net_bridge_port *p;
ee07c6e7
CW
22 struct nlattr *nest;
23
24 if (!br->multicast_router || hlist_empty(&br->router_list))
25 return 0;
26
27 nest = nla_nest_start(skb, MDBA_ROUTER);
28 if (nest == NULL)
29 return -EMSGSIZE;
30
b67bfe0d 31 hlist_for_each_entry_rcu(p, &br->router_list, rlist) {
ee07c6e7
CW
32 if (p && nla_put_u32(skb, MDBA_ROUTER_PORT, p->dev->ifindex))
33 goto fail;
34 }
35
36 nla_nest_end(skb, nest);
37 return 0;
38fail:
39 nla_nest_cancel(skb, nest);
40 return -EMSGSIZE;
41}
42
43static int br_mdb_fill_info(struct sk_buff *skb, struct netlink_callback *cb,
44 struct net_device *dev)
45{
46 struct net_bridge *br = netdev_priv(dev);
47 struct net_bridge_mdb_htable *mdb;
48 struct nlattr *nest, *nest2;
49 int i, err = 0;
50 int idx = 0, s_idx = cb->args[1];
51
52 if (br->multicast_disabled)
53 return 0;
54
55 mdb = rcu_dereference(br->mdb);
56 if (!mdb)
57 return 0;
58
59 nest = nla_nest_start(skb, MDBA_MDB);
60 if (nest == NULL)
61 return -EMSGSIZE;
62
63 for (i = 0; i < mdb->max; i++) {
ee07c6e7 64 struct net_bridge_mdb_entry *mp;
762a3d89 65 struct net_bridge_port_group *p;
66 struct net_bridge_port_group __rcu **pp;
ee07c6e7
CW
67 struct net_bridge_port *port;
68
b67bfe0d 69 hlist_for_each_entry_rcu(mp, &mdb->mhash[i], hlist[mdb->ver]) {
ee07c6e7
CW
70 if (idx < s_idx)
71 goto skip;
72
73 nest2 = nla_nest_start(skb, MDBA_MDB_ENTRY);
74 if (nest2 == NULL) {
75 err = -EMSGSIZE;
76 goto out;
77 }
78
79 for (pp = &mp->ports;
80 (p = rcu_dereference(*pp)) != NULL;
81 pp = &p->next) {
82 port = p->port;
83 if (port) {
84 struct br_mdb_entry e;
c085c499 85 memset(&e, 0, sizeof(e));
ee07c6e7 86 e.ifindex = port->dev->ifindex;
ccb1c31a 87 e.state = p->state;
09d7cf7d
VY
88 if (p->addr.proto == htons(ETH_P_IP))
89 e.addr.u.ip4 = p->addr.u.ip4;
ee07c6e7 90#if IS_ENABLED(CONFIG_IPV6)
09d7cf7d
VY
91 if (p->addr.proto == htons(ETH_P_IPV6))
92 e.addr.u.ip6 = p->addr.u.ip6;
ee07c6e7
CW
93#endif
94 e.addr.proto = p->addr.proto;
95 if (nla_put(skb, MDBA_MDB_ENTRY_INFO, sizeof(e), &e)) {
96 nla_nest_cancel(skb, nest2);
97 err = -EMSGSIZE;
98 goto out;
99 }
100 }
101 }
102 nla_nest_end(skb, nest2);
103 skip:
104 idx++;
105 }
106 }
107
108out:
109 cb->args[1] = idx;
110 nla_nest_end(skb, nest);
111 return err;
112}
113
114static int br_mdb_dump(struct sk_buff *skb, struct netlink_callback *cb)
115{
116 struct net_device *dev;
117 struct net *net = sock_net(skb->sk);
118 struct nlmsghdr *nlh = NULL;
119 int idx = 0, s_idx;
120
121 s_idx = cb->args[0];
122
123 rcu_read_lock();
124
2ce297fc
CW
125 /* In theory this could be wrapped to 0... */
126 cb->seq = net->dev_base_seq + br_mdb_rehash_seq;
ee07c6e7
CW
127
128 for_each_netdev_rcu(net, dev) {
129 if (dev->priv_flags & IFF_EBRIDGE) {
130 struct br_port_msg *bpm;
131
132 if (idx < s_idx)
133 goto skip;
134
135 nlh = nlmsg_put(skb, NETLINK_CB(cb->skb).portid,
136 cb->nlh->nlmsg_seq, RTM_GETMDB,
137 sizeof(*bpm), NLM_F_MULTI);
138 if (nlh == NULL)
139 break;
140
141 bpm = nlmsg_data(nlh);
c085c499 142 memset(bpm, 0, sizeof(*bpm));
ee07c6e7
CW
143 bpm->ifindex = dev->ifindex;
144 if (br_mdb_fill_info(skb, cb, dev) < 0)
145 goto out;
146 if (br_rports_fill_info(skb, cb, dev) < 0)
147 goto out;
148
149 cb->args[1] = 0;
150 nlmsg_end(skb, nlh);
151 skip:
152 idx++;
153 }
154 }
155
156out:
157 if (nlh)
158 nlmsg_end(skb, nlh);
159 rcu_read_unlock();
160 cb->args[0] = idx;
161 return skb->len;
162}
163
37a393bc
CW
164static int nlmsg_populate_mdb_fill(struct sk_buff *skb,
165 struct net_device *dev,
166 struct br_mdb_entry *entry, u32 pid,
167 u32 seq, int type, unsigned int flags)
168{
169 struct nlmsghdr *nlh;
170 struct br_port_msg *bpm;
171 struct nlattr *nest, *nest2;
172
82199679 173 nlh = nlmsg_put(skb, pid, seq, type, sizeof(*bpm), 0);
37a393bc
CW
174 if (!nlh)
175 return -EMSGSIZE;
176
177 bpm = nlmsg_data(nlh);
c085c499 178 memset(bpm, 0, sizeof(*bpm));
37a393bc
CW
179 bpm->family = AF_BRIDGE;
180 bpm->ifindex = dev->ifindex;
181 nest = nla_nest_start(skb, MDBA_MDB);
182 if (nest == NULL)
183 goto cancel;
184 nest2 = nla_nest_start(skb, MDBA_MDB_ENTRY);
185 if (nest2 == NULL)
186 goto end;
187
188 if (nla_put(skb, MDBA_MDB_ENTRY_INFO, sizeof(*entry), entry))
189 goto end;
190
191 nla_nest_end(skb, nest2);
192 nla_nest_end(skb, nest);
053c095a
JB
193 nlmsg_end(skb, nlh);
194 return 0;
37a393bc
CW
195
196end:
197 nla_nest_end(skb, nest);
198cancel:
199 nlmsg_cancel(skb, nlh);
200 return -EMSGSIZE;
201}
202
203static inline size_t rtnl_mdb_nlmsg_size(void)
204{
205 return NLMSG_ALIGN(sizeof(struct br_port_msg))
206 + nla_total_size(sizeof(struct br_mdb_entry));
207}
208
209static void __br_mdb_notify(struct net_device *dev, struct br_mdb_entry *entry,
210 int type)
211{
212 struct net *net = dev_net(dev);
213 struct sk_buff *skb;
214 int err = -ENOBUFS;
215
216 skb = nlmsg_new(rtnl_mdb_nlmsg_size(), GFP_ATOMIC);
217 if (!skb)
218 goto errout;
219
220 err = nlmsg_populate_mdb_fill(skb, dev, entry, 0, 0, type, NTF_SELF);
221 if (err < 0) {
222 kfree_skb(skb);
223 goto errout;
224 }
225
226 rtnl_notify(skb, net, 0, RTNLGRP_MDB, NULL, GFP_ATOMIC);
227 return;
228errout:
229 rtnl_set_sk_err(net, RTNLGRP_MDB, err);
230}
231
232void br_mdb_notify(struct net_device *dev, struct net_bridge_port *port,
233 struct br_ip *group, int type)
234{
235 struct br_mdb_entry entry;
236
c085c499 237 memset(&entry, 0, sizeof(entry));
37a393bc
CW
238 entry.ifindex = port->dev->ifindex;
239 entry.addr.proto = group->proto;
240 entry.addr.u.ip4 = group->u.ip4;
241#if IS_ENABLED(CONFIG_IPV6)
242 entry.addr.u.ip6 = group->u.ip6;
243#endif
244 __br_mdb_notify(dev, &entry, type);
245}
246
cfd56754
CW
247static bool is_valid_mdb_entry(struct br_mdb_entry *entry)
248{
249 if (entry->ifindex == 0)
250 return false;
251
252 if (entry->addr.proto == htons(ETH_P_IP)) {
253 if (!ipv4_is_multicast(entry->addr.u.ip4))
254 return false;
255 if (ipv4_is_local_multicast(entry->addr.u.ip4))
256 return false;
257#if IS_ENABLED(CONFIG_IPV6)
258 } else if (entry->addr.proto == htons(ETH_P_IPV6)) {
3c3769e6 259 if (ipv6_addr_is_ll_all_nodes(&entry->addr.u.ip6))
cfd56754
CW
260 return false;
261#endif
262 } else
263 return false;
ccb1c31a
AW
264 if (entry->state != MDB_PERMANENT && entry->state != MDB_TEMPORARY)
265 return false;
cfd56754
CW
266
267 return true;
268}
269
270static int br_mdb_parse(struct sk_buff *skb, struct nlmsghdr *nlh,
271 struct net_device **pdev, struct br_mdb_entry **pentry)
272{
273 struct net *net = sock_net(skb->sk);
274 struct br_mdb_entry *entry;
275 struct br_port_msg *bpm;
276 struct nlattr *tb[MDBA_SET_ENTRY_MAX+1];
277 struct net_device *dev;
278 int err;
279
12d87251 280 err = nlmsg_parse(nlh, sizeof(*bpm), tb, MDBA_SET_ENTRY_MAX, NULL);
cfd56754
CW
281 if (err < 0)
282 return err;
283
284 bpm = nlmsg_data(nlh);
285 if (bpm->ifindex == 0) {
286 pr_info("PF_BRIDGE: br_mdb_parse() with invalid ifindex\n");
287 return -EINVAL;
288 }
289
290 dev = __dev_get_by_index(net, bpm->ifindex);
291 if (dev == NULL) {
292 pr_info("PF_BRIDGE: br_mdb_parse() with unknown ifindex\n");
293 return -ENODEV;
294 }
295
296 if (!(dev->priv_flags & IFF_EBRIDGE)) {
297 pr_info("PF_BRIDGE: br_mdb_parse() with non-bridge\n");
298 return -EOPNOTSUPP;
299 }
300
301 *pdev = dev;
302
303 if (!tb[MDBA_SET_ENTRY] ||
304 nla_len(tb[MDBA_SET_ENTRY]) != sizeof(struct br_mdb_entry)) {
305 pr_info("PF_BRIDGE: br_mdb_parse() with invalid attr\n");
306 return -EINVAL;
307 }
308
309 entry = nla_data(tb[MDBA_SET_ENTRY]);
310 if (!is_valid_mdb_entry(entry)) {
311 pr_info("PF_BRIDGE: br_mdb_parse() with invalid entry\n");
312 return -EINVAL;
313 }
314
315 *pentry = entry;
316 return 0;
317}
318
319static int br_mdb_add_group(struct net_bridge *br, struct net_bridge_port *port,
ccb1c31a 320 struct br_ip *group, unsigned char state)
cfd56754
CW
321{
322 struct net_bridge_mdb_entry *mp;
323 struct net_bridge_port_group *p;
324 struct net_bridge_port_group __rcu **pp;
325 struct net_bridge_mdb_htable *mdb;
f7e2965d 326 unsigned long now = jiffies;
cfd56754
CW
327 int err;
328
329 mdb = mlock_dereference(br->mdb, br);
330 mp = br_mdb_ip_get(mdb, group);
331 if (!mp) {
332 mp = br_multicast_new_group(br, port, group);
333 err = PTR_ERR(mp);
334 if (IS_ERR(mp))
335 return err;
336 }
337
338 for (pp = &mp->ports;
339 (p = mlock_dereference(*pp, br)) != NULL;
340 pp = &p->next) {
341 if (p->port == port)
342 return -EEXIST;
343 if ((unsigned long)p->port < (unsigned long)port)
344 break;
345 }
346
ccb1c31a 347 p = br_multicast_new_port_group(port, group, *pp, state);
cfd56754
CW
348 if (unlikely(!p))
349 return -ENOMEM;
350 rcu_assign_pointer(*pp, p);
f7e2965d
SA
351 if (state == MDB_TEMPORARY)
352 mod_timer(&p->timer, now + br->multicast_membership_interval);
cfd56754 353
cfd56754
CW
354 return 0;
355}
356
357static int __br_mdb_add(struct net *net, struct net_bridge *br,
358 struct br_mdb_entry *entry)
359{
360 struct br_ip ip;
361 struct net_device *dev;
362 struct net_bridge_port *p;
363 int ret;
364
365 if (!netif_running(br->dev) || br->multicast_disabled)
366 return -EINVAL;
367
368 dev = __dev_get_by_index(net, entry->ifindex);
369 if (!dev)
370 return -ENODEV;
371
372 p = br_port_get_rtnl(dev);
373 if (!p || p->br != br || p->state == BR_STATE_DISABLED)
374 return -EINVAL;
375
f1158b74 376 memset(&ip, 0, sizeof(ip));
cfd56754
CW
377 ip.proto = entry->addr.proto;
378 if (ip.proto == htons(ETH_P_IP))
379 ip.u.ip4 = entry->addr.u.ip4;
380#if IS_ENABLED(CONFIG_IPV6)
381 else
382 ip.u.ip6 = entry->addr.u.ip6;
383#endif
384
385 spin_lock_bh(&br->multicast_lock);
ccb1c31a 386 ret = br_mdb_add_group(br, p, &ip, entry->state);
cfd56754
CW
387 spin_unlock_bh(&br->multicast_lock);
388 return ret;
389}
390
661d2967 391static int br_mdb_add(struct sk_buff *skb, struct nlmsghdr *nlh)
cfd56754
CW
392{
393 struct net *net = sock_net(skb->sk);
394 struct br_mdb_entry *entry;
395 struct net_device *dev;
396 struct net_bridge *br;
397 int err;
398
399 err = br_mdb_parse(skb, nlh, &dev, &entry);
400 if (err < 0)
401 return err;
402
403 br = netdev_priv(dev);
404
405 err = __br_mdb_add(net, br, entry);
406 if (!err)
407 __br_mdb_notify(dev, entry, RTM_NEWMDB);
408 return err;
409}
410
411static int __br_mdb_del(struct net_bridge *br, struct br_mdb_entry *entry)
412{
413 struct net_bridge_mdb_htable *mdb;
414 struct net_bridge_mdb_entry *mp;
415 struct net_bridge_port_group *p;
416 struct net_bridge_port_group __rcu **pp;
417 struct br_ip ip;
418 int err = -EINVAL;
419
420 if (!netif_running(br->dev) || br->multicast_disabled)
421 return -EINVAL;
422
f1158b74 423 memset(&ip, 0, sizeof(ip));
cfd56754 424 ip.proto = entry->addr.proto;
51ed7f3e 425 if (ip.proto == htons(ETH_P_IP))
cfd56754
CW
426 ip.u.ip4 = entry->addr.u.ip4;
427#if IS_ENABLED(CONFIG_IPV6)
51ed7f3e 428 else
cfd56754
CW
429 ip.u.ip6 = entry->addr.u.ip6;
430#endif
431
432 spin_lock_bh(&br->multicast_lock);
433 mdb = mlock_dereference(br->mdb, br);
434
435 mp = br_mdb_ip_get(mdb, &ip);
436 if (!mp)
437 goto unlock;
438
439 for (pp = &mp->ports;
440 (p = mlock_dereference(*pp, br)) != NULL;
441 pp = &p->next) {
442 if (!p->port || p->port->dev->ifindex != entry->ifindex)
443 continue;
444
445 if (p->port->state == BR_STATE_DISABLED)
446 goto unlock;
447
7ae90a4f 448 entry->state = p->state;
cfd56754
CW
449 rcu_assign_pointer(*pp, p->next);
450 hlist_del_init(&p->mglist);
451 del_timer(&p->timer);
452 call_rcu_bh(&p->rcu, br_multicast_free_pg);
453 err = 0;
454
454594f3 455 if (!mp->ports && !mp->mglist &&
cfd56754
CW
456 netif_running(br->dev))
457 mod_timer(&mp->timer, jiffies);
458 break;
459 }
460
461unlock:
462 spin_unlock_bh(&br->multicast_lock);
463 return err;
464}
465
661d2967 466static int br_mdb_del(struct sk_buff *skb, struct nlmsghdr *nlh)
cfd56754
CW
467{
468 struct net_device *dev;
469 struct br_mdb_entry *entry;
470 struct net_bridge *br;
471 int err;
472
473 err = br_mdb_parse(skb, nlh, &dev, &entry);
474 if (err < 0)
475 return err;
476
477 br = netdev_priv(dev);
478
479 err = __br_mdb_del(br, entry);
480 if (!err)
481 __br_mdb_notify(dev, entry, RTM_DELMDB);
482 return err;
483}
484
ee07c6e7
CW
485void br_mdb_init(void)
486{
487 rtnl_register(PF_BRIDGE, RTM_GETMDB, NULL, br_mdb_dump, NULL);
cfd56754
CW
488 rtnl_register(PF_BRIDGE, RTM_NEWMDB, br_mdb_add, NULL, NULL);
489 rtnl_register(PF_BRIDGE, RTM_DELMDB, br_mdb_del, NULL, NULL);
ee07c6e7 490}
63233159
VY
491
492void br_mdb_uninit(void)
493{
494 rtnl_unregister(PF_BRIDGE, RTM_GETMDB);
495 rtnl_unregister(PF_BRIDGE, RTM_NEWMDB);
496 rtnl_unregister(PF_BRIDGE, RTM_DELMDB);
497}