net: ethernet: litex: Add the dependency on HAS_IOMEM
[linux-block.git] / net / ipv6 / ip6mr.c
CommitLineData
2874c5fd 1// SPDX-License-Identifier: GPL-2.0-or-later
7bc570c8
YH
2/*
3 * Linux IPv6 multicast routing support for BSD pim6sd
4 * Based on net/ipv4/ipmr.c.
5 *
6 * (c) 2004 Mickael Hoerdt, <hoerdt@clarinet.u-strasbg.fr>
7 * LSIIT Laboratory, Strasbourg, France
8 * (c) 2004 Jean-Philippe Andriot, <jean-philippe.andriot@6WIND.com>
9 * 6WIND, Paris, France
10 * Copyright (C)2007,2008 USAGI/WIDE Project
11 * YOSHIFUJI Hideaki <yoshfuji@linux-ipv6.org>
7bc570c8
YH
12 */
13
7c0f6ba6 14#include <linux/uaccess.h>
7bc570c8
YH
15#include <linux/types.h>
16#include <linux/sched.h>
17#include <linux/errno.h>
7bc570c8
YH
18#include <linux/mm.h>
19#include <linux/kernel.h>
20#include <linux/fcntl.h>
21#include <linux/stat.h>
22#include <linux/socket.h>
7bc570c8
YH
23#include <linux/inet.h>
24#include <linux/netdevice.h>
25#include <linux/inetdevice.h>
7bc570c8
YH
26#include <linux/proc_fs.h>
27#include <linux/seq_file.h>
7bc570c8 28#include <linux/init.h>
e2d57766 29#include <linux/compat.h>
0eb71a9d 30#include <linux/rhashtable.h>
7bc570c8
YH
31#include <net/protocol.h>
32#include <linux/skbuff.h>
7bc570c8 33#include <net/raw.h>
7bc570c8
YH
34#include <linux/notifier.h>
35#include <linux/if_arp.h>
7bc570c8
YH
36#include <net/checksum.h>
37#include <net/netlink.h>
d1db275d 38#include <net/fib_rules.h>
7bc570c8
YH
39
40#include <net/ipv6.h>
41#include <net/ip6_route.h>
42#include <linux/mroute6.h>
14fb64e1 43#include <linux/pim.h>
7bc570c8
YH
44#include <net/addrconf.h>
45#include <linux/netfilter_ipv6.h>
bc3b2d7f 46#include <linux/export.h>
5d6e430d 47#include <net/ip6_checksum.h>
d67b8c61 48#include <linux/netconf.h>
cb9f1b78 49#include <net/ip_tunnels.h>
7bc570c8 50
69d2c867
GS
51#include <linux/nospec.h>
52
d1db275d
PM
53struct ip6mr_rule {
54 struct fib_rule common;
55};
56
57struct ip6mr_result {
b70432f7 58 struct mr_table *mrt;
d1db275d
PM
59};
60
7bc570c8
YH
61/* Big lock, protecting vif table, mrt cache and mroute socket state.
62 Note that the changes are semaphored via rtnl_lock.
63 */
64
65static DEFINE_RWLOCK(mrt_lock);
66
b70432f7 67/* Multicast router control variables */
7bc570c8 68
7bc570c8
YH
69/* Special spinlock for queue of unresolved entries */
70static DEFINE_SPINLOCK(mfc_unres_lock);
71
72/* We return to original Alan's scheme. Hash table of resolved
73 entries is changed only in process context and protected
74 with weak lock mrt_lock. Queue of unresolved entries is protected
75 with strong spinlock mfc_unres_lock.
76
77 In this case data path is free of exclusive locks at all.
78 */
79
80static struct kmem_cache *mrt_cachep __read_mostly;
81
b70432f7
YM
82static struct mr_table *ip6mr_new_table(struct net *net, u32 id);
83static void ip6mr_free_table(struct mr_table *mrt);
d1db275d 84
b70432f7 85static void ip6_mr_forward(struct net *net, struct mr_table *mrt,
e4a38c0c
PR
86 struct net_device *dev, struct sk_buff *skb,
87 struct mfc6_cache *cache);
b70432f7 88static int ip6mr_cache_report(struct mr_table *mrt, struct sk_buff *pkt,
8229efda 89 mifi_t mifi, int assert);
b70432f7 90static void mr6_netlink_event(struct mr_table *mrt, struct mfc6_cache *mfc,
812e44dd 91 int cmd);
b70432f7 92static void mrt6msg_netlink_event(struct mr_table *mrt, struct sk_buff *pkt);
5b285cac
PM
93static int ip6mr_rtm_dumproute(struct sk_buff *skb,
94 struct netlink_callback *cb);
ca8d4794 95static void mroute_clean_tables(struct mr_table *mrt, int flags);
e99e88a9 96static void ipmr_expire_process(struct timer_list *t);
d1db275d
PM
97
98#ifdef CONFIG_IPV6_MROUTE_MULTIPLE_TABLES
8ffb335e 99#define ip6mr_for_each_table(mrt, net) \
28b380e2 100 list_for_each_entry_rcu(mrt, &net->ipv6.mr6_tables, list, \
b6dd5acd
MB
101 lockdep_rtnl_is_held() || \
102 list_empty(&net->ipv6.mr6_tables))
d1db275d 103
7b0db857
YM
104static struct mr_table *ip6mr_mr_table_iter(struct net *net,
105 struct mr_table *mrt)
106{
107 struct mr_table *ret;
108
109 if (!mrt)
110 ret = list_entry_rcu(net->ipv6.mr6_tables.next,
111 struct mr_table, list);
112 else
113 ret = list_entry_rcu(mrt->list.next,
114 struct mr_table, list);
115
116 if (&ret->list == &net->ipv6.mr6_tables)
117 return NULL;
118 return ret;
119}
120
b70432f7 121static struct mr_table *ip6mr_get_table(struct net *net, u32 id)
d1db275d 122{
b70432f7 123 struct mr_table *mrt;
d1db275d
PM
124
125 ip6mr_for_each_table(mrt, net) {
126 if (mrt->id == id)
127 return mrt;
128 }
129 return NULL;
130}
131
4c9483b2 132static int ip6mr_fib_lookup(struct net *net, struct flowi6 *flp6,
b70432f7 133 struct mr_table **mrt)
d1db275d 134{
d1db275d 135 int err;
95f4a45d
HFS
136 struct ip6mr_result res;
137 struct fib_lookup_arg arg = {
138 .result = &res,
139 .flags = FIB_LOOKUP_NOREF,
140 };
d1db275d 141
e4a38c0c
PR
142 /* update flow if oif or iif point to device enslaved to l3mdev */
143 l3mdev_update_flow(net, flowi6_to_flowi(flp6));
144
4c9483b2
DM
145 err = fib_rules_lookup(net->ipv6.mr6_rules_ops,
146 flowi6_to_flowi(flp6), 0, &arg);
d1db275d
PM
147 if (err < 0)
148 return err;
149 *mrt = res.mrt;
150 return 0;
151}
152
153static int ip6mr_rule_action(struct fib_rule *rule, struct flowi *flp,
154 int flags, struct fib_lookup_arg *arg)
155{
156 struct ip6mr_result *res = arg->result;
b70432f7 157 struct mr_table *mrt;
d1db275d
PM
158
159 switch (rule->action) {
160 case FR_ACT_TO_TBL:
161 break;
162 case FR_ACT_UNREACHABLE:
163 return -ENETUNREACH;
164 case FR_ACT_PROHIBIT:
165 return -EACCES;
166 case FR_ACT_BLACKHOLE:
167 default:
168 return -EINVAL;
169 }
170
e4a38c0c
PR
171 arg->table = fib_rule_get_table(rule, arg);
172
173 mrt = ip6mr_get_table(rule->fr_net, arg->table);
63159f29 174 if (!mrt)
d1db275d
PM
175 return -EAGAIN;
176 res->mrt = mrt;
177 return 0;
178}
179
180static int ip6mr_rule_match(struct fib_rule *rule, struct flowi *flp, int flags)
181{
182 return 1;
183}
184
d1db275d 185static int ip6mr_rule_configure(struct fib_rule *rule, struct sk_buff *skb,
b16fb418
RP
186 struct fib_rule_hdr *frh, struct nlattr **tb,
187 struct netlink_ext_ack *extack)
d1db275d
PM
188{
189 return 0;
190}
191
192static int ip6mr_rule_compare(struct fib_rule *rule, struct fib_rule_hdr *frh,
193 struct nlattr **tb)
194{
195 return 1;
196}
197
198static int ip6mr_rule_fill(struct fib_rule *rule, struct sk_buff *skb,
199 struct fib_rule_hdr *frh)
200{
201 frh->dst_len = 0;
202 frh->src_len = 0;
203 frh->tos = 0;
204 return 0;
205}
206
04a6f82c 207static const struct fib_rules_ops __net_initconst ip6mr_rules_ops_template = {
d1db275d
PM
208 .family = RTNL_FAMILY_IP6MR,
209 .rule_size = sizeof(struct ip6mr_rule),
210 .addr_size = sizeof(struct in6_addr),
211 .action = ip6mr_rule_action,
212 .match = ip6mr_rule_match,
213 .configure = ip6mr_rule_configure,
214 .compare = ip6mr_rule_compare,
d1db275d
PM
215 .fill = ip6mr_rule_fill,
216 .nlgroup = RTNLGRP_IPV6_RULE,
d1db275d
PM
217 .owner = THIS_MODULE,
218};
219
220static int __net_init ip6mr_rules_init(struct net *net)
221{
222 struct fib_rules_ops *ops;
b70432f7 223 struct mr_table *mrt;
d1db275d
PM
224 int err;
225
226 ops = fib_rules_register(&ip6mr_rules_ops_template, net);
227 if (IS_ERR(ops))
228 return PTR_ERR(ops);
229
230 INIT_LIST_HEAD(&net->ipv6.mr6_tables);
231
232 mrt = ip6mr_new_table(net, RT6_TABLE_DFLT);
e783bb00
SD
233 if (IS_ERR(mrt)) {
234 err = PTR_ERR(mrt);
d1db275d
PM
235 goto err1;
236 }
237
238 err = fib_default_rule_add(ops, 0x7fff, RT6_TABLE_DFLT, 0);
239 if (err < 0)
240 goto err2;
241
242 net->ipv6.mr6_rules_ops = ops;
243 return 0;
244
245err2:
f243e5a7 246 ip6mr_free_table(mrt);
d1db275d
PM
247err1:
248 fib_rules_unregister(ops);
249 return err;
250}
251
252static void __net_exit ip6mr_rules_exit(struct net *net)
253{
b70432f7 254 struct mr_table *mrt, *next;
d1db275d 255
905a6f96 256 rtnl_lock();
035320d5
ED
257 list_for_each_entry_safe(mrt, next, &net->ipv6.mr6_tables, list) {
258 list_del(&mrt->list);
d1db275d 259 ip6mr_free_table(mrt);
035320d5 260 }
d1db275d 261 fib_rules_unregister(net->ipv6.mr6_rules_ops);
419df12f 262 rtnl_unlock();
d1db275d 263}
088aa3ee 264
b7a59557
JP
265static int ip6mr_rules_dump(struct net *net, struct notifier_block *nb,
266 struct netlink_ext_ack *extack)
088aa3ee 267{
b7a59557 268 return fib_rules_dump(net, nb, RTNL_FAMILY_IP6MR, extack);
088aa3ee
YM
269}
270
271static unsigned int ip6mr_rules_seq_read(struct net *net)
272{
273 return fib_rules_seq_read(net, RTNL_FAMILY_IP6MR);
274}
d3c07e5b
YM
275
276bool ip6mr_rule_default(const struct fib_rule *rule)
277{
278 return fib_rule_matchall(rule) && rule->action == FR_ACT_TO_TBL &&
279 rule->table == RT6_TABLE_DFLT && !rule->l3mdev;
280}
281EXPORT_SYMBOL(ip6mr_rule_default);
d1db275d
PM
282#else
283#define ip6mr_for_each_table(mrt, net) \
284 for (mrt = net->ipv6.mrt6; mrt; mrt = NULL)
285
7b0db857
YM
286static struct mr_table *ip6mr_mr_table_iter(struct net *net,
287 struct mr_table *mrt)
288{
289 if (!mrt)
290 return net->ipv6.mrt6;
291 return NULL;
292}
293
b70432f7 294static struct mr_table *ip6mr_get_table(struct net *net, u32 id)
d1db275d
PM
295{
296 return net->ipv6.mrt6;
297}
298
4c9483b2 299static int ip6mr_fib_lookup(struct net *net, struct flowi6 *flp6,
b70432f7 300 struct mr_table **mrt)
d1db275d
PM
301{
302 *mrt = net->ipv6.mrt6;
303 return 0;
304}
305
306static int __net_init ip6mr_rules_init(struct net *net)
307{
e783bb00
SD
308 struct mr_table *mrt;
309
310 mrt = ip6mr_new_table(net, RT6_TABLE_DFLT);
311 if (IS_ERR(mrt))
312 return PTR_ERR(mrt);
313 net->ipv6.mrt6 = mrt;
314 return 0;
d1db275d
PM
315}
316
317static void __net_exit ip6mr_rules_exit(struct net *net)
318{
905a6f96 319 rtnl_lock();
d1db275d 320 ip6mr_free_table(net->ipv6.mrt6);
905a6f96
HFS
321 net->ipv6.mrt6 = NULL;
322 rtnl_unlock();
d1db275d 323}
088aa3ee 324
b7a59557
JP
325static int ip6mr_rules_dump(struct net *net, struct notifier_block *nb,
326 struct netlink_ext_ack *extack)
088aa3ee
YM
327{
328 return 0;
329}
330
331static unsigned int ip6mr_rules_seq_read(struct net *net)
332{
333 return 0;
334}
d1db275d
PM
335#endif
336
87c418bf
YM
337static int ip6mr_hash_cmp(struct rhashtable_compare_arg *arg,
338 const void *ptr)
339{
340 const struct mfc6_cache_cmp_arg *cmparg = arg->key;
341 struct mfc6_cache *c = (struct mfc6_cache *)ptr;
342
343 return !ipv6_addr_equal(&c->mf6c_mcastgrp, &cmparg->mf6c_mcastgrp) ||
344 !ipv6_addr_equal(&c->mf6c_origin, &cmparg->mf6c_origin);
345}
346
347static const struct rhashtable_params ip6mr_rht_params = {
494fff56 348 .head_offset = offsetof(struct mr_mfc, mnode),
87c418bf
YM
349 .key_offset = offsetof(struct mfc6_cache, cmparg),
350 .key_len = sizeof(struct mfc6_cache_cmp_arg),
351 .nelem_hint = 3,
87c418bf
YM
352 .obj_cmpfn = ip6mr_hash_cmp,
353 .automatic_shrinking = true,
354};
355
0bbbf0e7
YM
356static void ip6mr_new_table_set(struct mr_table *mrt,
357 struct net *net)
358{
359#ifdef CONFIG_IPV6_MROUTE_MULTIPLE_TABLES
360 list_add_tail_rcu(&mrt->list, &net->ipv6.mr6_tables);
361#endif
362}
363
845c9a7a
YM
364static struct mfc6_cache_cmp_arg ip6mr_mr_table_ops_cmparg_any = {
365 .mf6c_origin = IN6ADDR_ANY_INIT,
366 .mf6c_mcastgrp = IN6ADDR_ANY_INIT,
367};
368
369static struct mr_table_ops ip6mr_mr_table_ops = {
370 .rht_params = &ip6mr_rht_params,
371 .cmparg_any = &ip6mr_mr_table_ops_cmparg_any,
372};
373
b70432f7 374static struct mr_table *ip6mr_new_table(struct net *net, u32 id)
d1db275d 375{
b70432f7 376 struct mr_table *mrt;
d1db275d
PM
377
378 mrt = ip6mr_get_table(net, id);
53b24b8f 379 if (mrt)
d1db275d
PM
380 return mrt;
381
845c9a7a 382 return mr_table_alloc(net, id, &ip6mr_mr_table_ops,
0bbbf0e7 383 ipmr_expire_process, ip6mr_new_table_set);
d1db275d 384}
7bc570c8 385
b70432f7 386static void ip6mr_free_table(struct mr_table *mrt)
d1db275d 387{
7ba0c47c 388 del_timer_sync(&mrt->ipmr_expire_timer);
ca8d4794
CS
389 mroute_clean_tables(mrt, MRT6_FLUSH_MIFS | MRT6_FLUSH_MIFS_STATIC |
390 MRT6_FLUSH_MFC | MRT6_FLUSH_MFC_STATIC);
b70432f7 391 rhltable_destroy(&mrt->mfc_hash);
d1db275d
PM
392 kfree(mrt);
393}
7bc570c8
YH
394
395#ifdef CONFIG_PROC_FS
c8d61968
YM
396/* The /proc interfaces to multicast routing
397 * /proc/ip6_mr_cache /proc/ip6_mr_vif
7bc570c8
YH
398 */
399
7bc570c8
YH
400static void *ip6mr_vif_seq_start(struct seq_file *seq, loff_t *pos)
401 __acquires(mrt_lock)
402{
3feda6b4 403 struct mr_vif_iter *iter = seq->private;
8b90fc7e 404 struct net *net = seq_file_net(seq);
b70432f7 405 struct mr_table *mrt;
d1db275d
PM
406
407 mrt = ip6mr_get_table(net, RT6_TABLE_DFLT);
63159f29 408 if (!mrt)
d1db275d
PM
409 return ERR_PTR(-ENOENT);
410
411 iter->mrt = mrt;
8b90fc7e 412
7bc570c8 413 read_lock(&mrt_lock);
3feda6b4 414 return mr_vif_seq_start(seq, pos);
7bc570c8
YH
415}
416
417static void ip6mr_vif_seq_stop(struct seq_file *seq, void *v)
418 __releases(mrt_lock)
419{
420 read_unlock(&mrt_lock);
421}
422
423static int ip6mr_vif_seq_show(struct seq_file *seq, void *v)
424{
3feda6b4 425 struct mr_vif_iter *iter = seq->private;
b70432f7 426 struct mr_table *mrt = iter->mrt;
8b90fc7e 427
7bc570c8
YH
428 if (v == SEQ_START_TOKEN) {
429 seq_puts(seq,
430 "Interface BytesIn PktsIn BytesOut PktsOut Flags\n");
431 } else {
6853f21f 432 const struct vif_device *vif = v;
7bc570c8
YH
433 const char *name = vif->dev ? vif->dev->name : "none";
434
435 seq_printf(seq,
d430a227 436 "%2td %-10s %8ld %7ld %8ld %7ld %05X\n",
b70432f7 437 vif - mrt->vif_table,
7bc570c8
YH
438 name, vif->bytes_in, vif->pkt_in,
439 vif->bytes_out, vif->pkt_out,
440 vif->flags);
441 }
442 return 0;
443}
444
98147d52 445static const struct seq_operations ip6mr_vif_seq_ops = {
7bc570c8 446 .start = ip6mr_vif_seq_start,
3feda6b4 447 .next = mr_vif_seq_next,
7bc570c8
YH
448 .stop = ip6mr_vif_seq_stop,
449 .show = ip6mr_vif_seq_show,
450};
451
7bc570c8
YH
452static void *ipmr_mfc_seq_start(struct seq_file *seq, loff_t *pos)
453{
8b90fc7e 454 struct net *net = seq_file_net(seq);
b70432f7 455 struct mr_table *mrt;
8b90fc7e 456
d1db275d 457 mrt = ip6mr_get_table(net, RT6_TABLE_DFLT);
63159f29 458 if (!mrt)
d1db275d
PM
459 return ERR_PTR(-ENOENT);
460
c8d61968 461 return mr_mfc_seq_start(seq, pos, mrt, &mfc_unres_lock);
7bc570c8
YH
462}
463
464static int ipmr_mfc_seq_show(struct seq_file *seq, void *v)
465{
466 int n;
467
468 if (v == SEQ_START_TOKEN) {
469 seq_puts(seq,
470 "Group "
471 "Origin "
472 "Iif Pkts Bytes Wrong Oifs\n");
473 } else {
474 const struct mfc6_cache *mfc = v;
c8d61968 475 const struct mr_mfc_iter *it = seq->private;
b70432f7 476 struct mr_table *mrt = it->mrt;
7bc570c8 477
999890b2 478 seq_printf(seq, "%pI6 %pI6 %-3hd",
0c6ce78a 479 &mfc->mf6c_mcastgrp, &mfc->mf6c_origin,
494fff56 480 mfc->_c.mfc_parent);
7bc570c8 481
b70432f7 482 if (it->cache != &mrt->mfc_unres_queue) {
1ea472e2 483 seq_printf(seq, " %8lu %8lu %8lu",
494fff56
YM
484 mfc->_c.mfc_un.res.pkt,
485 mfc->_c.mfc_un.res.bytes,
486 mfc->_c.mfc_un.res.wrong_if);
487 for (n = mfc->_c.mfc_un.res.minvif;
488 n < mfc->_c.mfc_un.res.maxvif; n++) {
b70432f7 489 if (VIF_EXISTS(mrt, n) &&
494fff56 490 mfc->_c.mfc_un.res.ttls[n] < 255)
7bc570c8 491 seq_printf(seq,
494fff56
YM
492 " %2d:%-3d", n,
493 mfc->_c.mfc_un.res.ttls[n]);
7bc570c8 494 }
1ea472e2
BT
495 } else {
496 /* unresolved mfc_caches don't contain
497 * pkt, bytes and wrong_if values
498 */
499 seq_printf(seq, " %8lu %8lu %8lu", 0ul, 0ul, 0ul);
7bc570c8
YH
500 }
501 seq_putc(seq, '\n');
502 }
503 return 0;
504}
505
88e9d34c 506static const struct seq_operations ipmr_mfc_seq_ops = {
7bc570c8 507 .start = ipmr_mfc_seq_start,
c8d61968
YM
508 .next = mr_mfc_seq_next,
509 .stop = mr_mfc_seq_stop,
7bc570c8
YH
510 .show = ipmr_mfc_seq_show,
511};
7bc570c8
YH
512#endif
513
14fb64e1 514#ifdef CONFIG_IPV6_PIMSM_V2
14fb64e1
YH
515
516static int pim6_rcv(struct sk_buff *skb)
517{
518 struct pimreghdr *pim;
519 struct ipv6hdr *encap;
520 struct net_device *reg_dev = NULL;
8229efda 521 struct net *net = dev_net(skb->dev);
b70432f7 522 struct mr_table *mrt;
4c9483b2
DM
523 struct flowi6 fl6 = {
524 .flowi6_iif = skb->dev->ifindex,
525 .flowi6_mark = skb->mark,
d1db275d
PM
526 };
527 int reg_vif_num;
14fb64e1
YH
528
529 if (!pskb_may_pull(skb, sizeof(*pim) + sizeof(*encap)))
530 goto drop;
531
532 pim = (struct pimreghdr *)skb_transport_header(skb);
56245cae 533 if (pim->type != ((PIM_VERSION << 4) | PIM_TYPE_REGISTER) ||
14fb64e1 534 (pim->flags & PIM_NULL_REGISTER) ||
1d6e55f1
TG
535 (csum_ipv6_magic(&ipv6_hdr(skb)->saddr, &ipv6_hdr(skb)->daddr,
536 sizeof(*pim), IPPROTO_PIM,
537 csum_partial((void *)pim, sizeof(*pim), 0)) &&
ec6b486f 538 csum_fold(skb_checksum(skb, 0, skb->len, 0))))
14fb64e1
YH
539 goto drop;
540
541 /* check if the inner packet is destined to mcast group */
542 encap = (struct ipv6hdr *)(skb_transport_header(skb) +
543 sizeof(*pim));
544
545 if (!ipv6_addr_is_multicast(&encap->daddr) ||
546 encap->payload_len == 0 ||
547 ntohs(encap->payload_len) + sizeof(*pim) > skb->len)
548 goto drop;
549
4c9483b2 550 if (ip6mr_fib_lookup(net, &fl6, &mrt) < 0)
d1db275d
PM
551 goto drop;
552 reg_vif_num = mrt->mroute_reg_vif_num;
553
14fb64e1
YH
554 read_lock(&mrt_lock);
555 if (reg_vif_num >= 0)
b70432f7 556 reg_dev = mrt->vif_table[reg_vif_num].dev;
1160dfa1 557 dev_hold(reg_dev);
14fb64e1
YH
558 read_unlock(&mrt_lock);
559
63159f29 560 if (!reg_dev)
14fb64e1
YH
561 goto drop;
562
563 skb->mac_header = skb->network_header;
564 skb_pull(skb, (u8 *)encap - skb->data);
565 skb_reset_network_header(skb);
1d6e55f1 566 skb->protocol = htons(ETH_P_IPV6);
3e49e6d5 567 skb->ip_summed = CHECKSUM_NONE;
d19d56dd 568
ea23192e 569 skb_tunnel_rx(skb, reg_dev, dev_net(reg_dev));
d19d56dd 570
caf586e5 571 netif_rx(skb);
8990f468 572
14fb64e1
YH
573 dev_put(reg_dev);
574 return 0;
575 drop:
576 kfree_skb(skb);
577 return 0;
578}
579
41135cc8 580static const struct inet6_protocol pim6_protocol = {
14fb64e1
YH
581 .handler = pim6_rcv,
582};
583
584/* Service routines creating virtual interfaces: PIMREG */
585
6fef4c0c
SH
586static netdev_tx_t reg_vif_xmit(struct sk_buff *skb,
587 struct net_device *dev)
14fb64e1 588{
8229efda 589 struct net *net = dev_net(dev);
b70432f7 590 struct mr_table *mrt;
4c9483b2
DM
591 struct flowi6 fl6 = {
592 .flowi6_oif = dev->ifindex,
6a662719 593 .flowi6_iif = skb->skb_iif ? : LOOPBACK_IFINDEX,
4c9483b2 594 .flowi6_mark = skb->mark,
d1db275d 595 };
d1db275d 596
cb9f1b78
WB
597 if (!pskb_inet_may_pull(skb))
598 goto tx_err;
599
600 if (ip6mr_fib_lookup(net, &fl6, &mrt) < 0)
601 goto tx_err;
8229efda 602
14fb64e1 603 read_lock(&mrt_lock);
dc58c78c
PE
604 dev->stats.tx_bytes += skb->len;
605 dev->stats.tx_packets++;
6bd52143 606 ip6mr_cache_report(mrt, skb, mrt->mroute_reg_vif_num, MRT6MSG_WHOLEPKT);
14fb64e1
YH
607 read_unlock(&mrt_lock);
608 kfree_skb(skb);
6ed10654 609 return NETDEV_TX_OK;
cb9f1b78
WB
610
611tx_err:
612 dev->stats.tx_errors++;
613 kfree_skb(skb);
614 return NETDEV_TX_OK;
14fb64e1
YH
615}
616
ee9b9596
ND
617static int reg_vif_get_iflink(const struct net_device *dev)
618{
619 return 0;
620}
621
007c3838
SH
622static const struct net_device_ops reg_vif_netdev_ops = {
623 .ndo_start_xmit = reg_vif_xmit,
ee9b9596 624 .ndo_get_iflink = reg_vif_get_iflink,
007c3838
SH
625};
626
14fb64e1
YH
627static void reg_vif_setup(struct net_device *dev)
628{
629 dev->type = ARPHRD_PIMREG;
630 dev->mtu = 1500 - sizeof(struct ipv6hdr) - 8;
631 dev->flags = IFF_NOARP;
007c3838 632 dev->netdev_ops = &reg_vif_netdev_ops;
cf124db5 633 dev->needs_free_netdev = true;
403dbb97 634 dev->features |= NETIF_F_NETNS_LOCAL;
14fb64e1
YH
635}
636
b70432f7 637static struct net_device *ip6mr_reg_vif(struct net *net, struct mr_table *mrt)
14fb64e1
YH
638{
639 struct net_device *dev;
d1db275d
PM
640 char name[IFNAMSIZ];
641
642 if (mrt->id == RT6_TABLE_DFLT)
643 sprintf(name, "pim6reg");
644 else
645 sprintf(name, "pim6reg%u", mrt->id);
14fb64e1 646
c835a677 647 dev = alloc_netdev(0, name, NET_NAME_UNKNOWN, reg_vif_setup);
63159f29 648 if (!dev)
14fb64e1
YH
649 return NULL;
650
8229efda
BT
651 dev_net_set(dev, net);
652
14fb64e1
YH
653 if (register_netdevice(dev)) {
654 free_netdev(dev);
655 return NULL;
656 }
14fb64e1 657
00f54e68 658 if (dev_open(dev, NULL))
14fb64e1
YH
659 goto failure;
660
7af3db78 661 dev_hold(dev);
14fb64e1
YH
662 return dev;
663
664failure:
14fb64e1
YH
665 unregister_netdevice(dev);
666 return NULL;
667}
668#endif
669
088aa3ee
YM
670static int call_ip6mr_vif_entry_notifiers(struct net *net,
671 enum fib_event_type event_type,
672 struct vif_device *vif,
673 mifi_t vif_index, u32 tb_id)
674{
675 return mr_call_vif_notifiers(net, RTNL_FAMILY_IP6MR, event_type,
676 vif, vif_index, tb_id,
677 &net->ipv6.ipmr_seq);
678}
7bc570c8 679
088aa3ee
YM
680static int call_ip6mr_mfc_entry_notifiers(struct net *net,
681 enum fib_event_type event_type,
682 struct mfc6_cache *mfc, u32 tb_id)
683{
684 return mr_call_mfc_notifiers(net, RTNL_FAMILY_IP6MR, event_type,
685 &mfc->_c, tb_id, &net->ipv6.ipmr_seq);
686}
687
688/* Delete a VIF entry */
b70432f7 689static int mif6_delete(struct mr_table *mrt, int vifi, int notify,
723b929c 690 struct list_head *head)
7bc570c8 691{
6853f21f 692 struct vif_device *v;
7bc570c8 693 struct net_device *dev;
1d6e55f1 694 struct inet6_dev *in6_dev;
6bd52143
PM
695
696 if (vifi < 0 || vifi >= mrt->maxvif)
7bc570c8
YH
697 return -EADDRNOTAVAIL;
698
b70432f7 699 v = &mrt->vif_table[vifi];
7bc570c8 700
088aa3ee
YM
701 if (VIF_EXISTS(mrt, vifi))
702 call_ip6mr_vif_entry_notifiers(read_pnet(&mrt->net),
703 FIB_EVENT_VIF_DEL, v, vifi,
704 mrt->id);
705
7bc570c8
YH
706 write_lock_bh(&mrt_lock);
707 dev = v->dev;
708 v->dev = NULL;
709
710 if (!dev) {
711 write_unlock_bh(&mrt_lock);
712 return -EADDRNOTAVAIL;
713 }
714
14fb64e1 715#ifdef CONFIG_IPV6_PIMSM_V2
6bd52143
PM
716 if (vifi == mrt->mroute_reg_vif_num)
717 mrt->mroute_reg_vif_num = -1;
14fb64e1
YH
718#endif
719
6bd52143 720 if (vifi + 1 == mrt->maxvif) {
7bc570c8
YH
721 int tmp;
722 for (tmp = vifi - 1; tmp >= 0; tmp--) {
b70432f7 723 if (VIF_EXISTS(mrt, tmp))
7bc570c8
YH
724 break;
725 }
6bd52143 726 mrt->maxvif = tmp + 1;
7bc570c8
YH
727 }
728
729 write_unlock_bh(&mrt_lock);
730
731 dev_set_allmulti(dev, -1);
732
1d6e55f1 733 in6_dev = __in6_dev_get(dev);
d67b8c61 734 if (in6_dev) {
1d6e55f1 735 in6_dev->cnf.mc_forwarding--;
85b3daad 736 inet6_netconf_notify_devconf(dev_net(dev), RTM_NEWNETCONF,
d67b8c61
ND
737 NETCONFA_MC_FORWARDING,
738 dev->ifindex, &in6_dev->cnf);
739 }
1d6e55f1 740
723b929c 741 if ((v->flags & MIFF_REGISTER) && !notify)
c871e664 742 unregister_netdevice_queue(dev, head);
7bc570c8 743
42120a86 744 dev_put_track(dev, &v->dev_tracker);
7bc570c8
YH
745 return 0;
746}
747
87c418bf 748static inline void ip6mr_cache_free_rcu(struct rcu_head *head)
58701ad4 749{
494fff56 750 struct mr_mfc *c = container_of(head, struct mr_mfc, rcu);
87c418bf 751
494fff56 752 kmem_cache_free(mrt_cachep, (struct mfc6_cache *)c);
58701ad4
BT
753}
754
87c418bf
YM
755static inline void ip6mr_cache_free(struct mfc6_cache *c)
756{
494fff56 757 call_rcu(&c->_c.rcu, ip6mr_cache_free_rcu);
87c418bf
YM
758}
759
7bc570c8
YH
760/* Destroy an unresolved cache entry, killing queued skbs
761 and reporting error to netlink readers.
762 */
763
b70432f7 764static void ip6mr_destroy_unres(struct mr_table *mrt, struct mfc6_cache *c)
7bc570c8 765{
6bd52143 766 struct net *net = read_pnet(&mrt->net);
7bc570c8
YH
767 struct sk_buff *skb;
768
6bd52143 769 atomic_dec(&mrt->cache_resolve_queue_len);
7bc570c8 770
494fff56 771 while ((skb = skb_dequeue(&c->_c.mfc_un.unres.unresolved)) != NULL) {
7bc570c8 772 if (ipv6_hdr(skb)->version == 0) {
af72868b
JB
773 struct nlmsghdr *nlh = skb_pull(skb,
774 sizeof(struct ipv6hdr));
7bc570c8 775 nlh->nlmsg_type = NLMSG_ERROR;
573ce260 776 nlh->nlmsg_len = nlmsg_msg_size(sizeof(struct nlmsgerr));
7bc570c8 777 skb_trim(skb, nlh->nlmsg_len);
573ce260 778 ((struct nlmsgerr *)nlmsg_data(nlh))->error = -ETIMEDOUT;
15e47304 779 rtnl_unicast(skb, net, NETLINK_CB(skb).portid);
7bc570c8
YH
780 } else
781 kfree_skb(skb);
782 }
783
58701ad4 784 ip6mr_cache_free(c);
7bc570c8
YH
785}
786
787
c476efbc 788/* Timer process for all the unresolved queue. */
7bc570c8 789
b70432f7 790static void ipmr_do_expire_process(struct mr_table *mrt)
7bc570c8
YH
791{
792 unsigned long now = jiffies;
793 unsigned long expires = 10 * HZ;
494fff56 794 struct mr_mfc *c, *next;
7bc570c8 795
b70432f7 796 list_for_each_entry_safe(c, next, &mrt->mfc_unres_queue, list) {
7bc570c8
YH
797 if (time_after(c->mfc_un.unres.expires, now)) {
798 /* not yet... */
799 unsigned long interval = c->mfc_un.unres.expires - now;
800 if (interval < expires)
801 expires = interval;
7bc570c8
YH
802 continue;
803 }
804
f30a7784 805 list_del(&c->list);
494fff56
YM
806 mr6_netlink_event(mrt, (struct mfc6_cache *)c, RTM_DELROUTE);
807 ip6mr_destroy_unres(mrt, (struct mfc6_cache *)c);
7bc570c8
YH
808 }
809
b70432f7 810 if (!list_empty(&mrt->mfc_unres_queue))
6bd52143 811 mod_timer(&mrt->ipmr_expire_timer, jiffies + expires);
7bc570c8
YH
812}
813
e99e88a9 814static void ipmr_expire_process(struct timer_list *t)
7bc570c8 815{
b70432f7 816 struct mr_table *mrt = from_timer(mrt, t, ipmr_expire_timer);
c476efbc 817
7bc570c8 818 if (!spin_trylock(&mfc_unres_lock)) {
6bd52143 819 mod_timer(&mrt->ipmr_expire_timer, jiffies + 1);
7bc570c8
YH
820 return;
821 }
822
b70432f7 823 if (!list_empty(&mrt->mfc_unres_queue))
6bd52143 824 ipmr_do_expire_process(mrt);
7bc570c8
YH
825
826 spin_unlock(&mfc_unres_lock);
827}
828
829/* Fill oifs list. It is called under write locked mrt_lock. */
830
b70432f7 831static void ip6mr_update_thresholds(struct mr_table *mrt,
494fff56 832 struct mr_mfc *cache,
b5aa30b1 833 unsigned char *ttls)
7bc570c8
YH
834{
835 int vifi;
836
6ac7eb08 837 cache->mfc_un.res.minvif = MAXMIFS;
7bc570c8 838 cache->mfc_un.res.maxvif = 0;
6ac7eb08 839 memset(cache->mfc_un.res.ttls, 255, MAXMIFS);
7bc570c8 840
6bd52143 841 for (vifi = 0; vifi < mrt->maxvif; vifi++) {
b70432f7 842 if (VIF_EXISTS(mrt, vifi) &&
4e16880c 843 ttls[vifi] && ttls[vifi] < 255) {
7bc570c8
YH
844 cache->mfc_un.res.ttls[vifi] = ttls[vifi];
845 if (cache->mfc_un.res.minvif > vifi)
846 cache->mfc_un.res.minvif = vifi;
847 if (cache->mfc_un.res.maxvif <= vifi)
848 cache->mfc_un.res.maxvif = vifi + 1;
849 }
850 }
90b5ca17 851 cache->mfc_un.res.lastuse = jiffies;
7bc570c8
YH
852}
853
b70432f7 854static int mif6_add(struct net *net, struct mr_table *mrt,
6bd52143 855 struct mif6ctl *vifc, int mrtsock)
7bc570c8
YH
856{
857 int vifi = vifc->mif6c_mifi;
b70432f7 858 struct vif_device *v = &mrt->vif_table[vifi];
7bc570c8 859 struct net_device *dev;
1d6e55f1 860 struct inet6_dev *in6_dev;
5ae7b444 861 int err;
7bc570c8
YH
862
863 /* Is vif busy ? */
b70432f7 864 if (VIF_EXISTS(mrt, vifi))
7bc570c8
YH
865 return -EADDRINUSE;
866
867 switch (vifc->mif6c_flags) {
14fb64e1
YH
868#ifdef CONFIG_IPV6_PIMSM_V2
869 case MIFF_REGISTER:
870 /*
871 * Special Purpose VIF in PIM
872 * All the packets will be sent to the daemon
873 */
6bd52143 874 if (mrt->mroute_reg_vif_num >= 0)
14fb64e1 875 return -EADDRINUSE;
d1db275d 876 dev = ip6mr_reg_vif(net, mrt);
14fb64e1
YH
877 if (!dev)
878 return -ENOBUFS;
5ae7b444
WC
879 err = dev_set_allmulti(dev, 1);
880 if (err) {
881 unregister_netdevice(dev);
7af3db78 882 dev_put(dev);
5ae7b444
WC
883 return err;
884 }
14fb64e1
YH
885 break;
886#endif
7bc570c8 887 case 0:
8229efda 888 dev = dev_get_by_index(net, vifc->mif6c_pifi);
7bc570c8
YH
889 if (!dev)
890 return -EADDRNOTAVAIL;
5ae7b444 891 err = dev_set_allmulti(dev, 1);
7af3db78
WC
892 if (err) {
893 dev_put(dev);
5ae7b444 894 return err;
7af3db78 895 }
7bc570c8
YH
896 break;
897 default:
898 return -EINVAL;
899 }
900
1d6e55f1 901 in6_dev = __in6_dev_get(dev);
d67b8c61 902 if (in6_dev) {
1d6e55f1 903 in6_dev->cnf.mc_forwarding++;
85b3daad 904 inet6_netconf_notify_devconf(dev_net(dev), RTM_NEWNETCONF,
d67b8c61
ND
905 NETCONFA_MC_FORWARDING,
906 dev->ifindex, &in6_dev->cnf);
907 }
1d6e55f1 908
6853f21f
YM
909 /* Fill in the VIF structures */
910 vif_device_init(v, dev, vifc->vifc_rate_limit, vifc->vifc_threshold,
911 vifc->mif6c_flags | (!mrtsock ? VIFF_STATIC : 0),
912 MIFF_REGISTER);
7bc570c8
YH
913
914 /* And finish update writing critical data */
915 write_lock_bh(&mrt_lock);
7bc570c8 916 v->dev = dev;
42120a86 917 netdev_tracker_alloc(dev, &v->dev_tracker, GFP_ATOMIC);
14fb64e1
YH
918#ifdef CONFIG_IPV6_PIMSM_V2
919 if (v->flags & MIFF_REGISTER)
6bd52143 920 mrt->mroute_reg_vif_num = vifi;
14fb64e1 921#endif
6bd52143
PM
922 if (vifi + 1 > mrt->maxvif)
923 mrt->maxvif = vifi + 1;
7bc570c8 924 write_unlock_bh(&mrt_lock);
088aa3ee
YM
925 call_ip6mr_vif_entry_notifiers(net, FIB_EVENT_VIF_ADD,
926 v, vifi, mrt->id);
7bc570c8
YH
927 return 0;
928}
929
b70432f7 930static struct mfc6_cache *ip6mr_cache_find(struct mr_table *mrt,
b71d1d42
ED
931 const struct in6_addr *origin,
932 const struct in6_addr *mcastgrp)
7bc570c8 933{
87c418bf
YM
934 struct mfc6_cache_cmp_arg arg = {
935 .mf6c_origin = *origin,
936 .mf6c_mcastgrp = *mcastgrp,
937 };
87c418bf 938
845c9a7a 939 return mr_mfc_find(mrt, &arg);
660b26dc
ND
940}
941
942/* Look for a (*,G) entry */
b70432f7 943static struct mfc6_cache *ip6mr_cache_find_any(struct mr_table *mrt,
660b26dc
ND
944 struct in6_addr *mcastgrp,
945 mifi_t mifi)
946{
87c418bf
YM
947 struct mfc6_cache_cmp_arg arg = {
948 .mf6c_origin = in6addr_any,
949 .mf6c_mcastgrp = *mcastgrp,
950 };
660b26dc
ND
951
952 if (ipv6_addr_any(mcastgrp))
845c9a7a
YM
953 return mr_mfc_find_any_parent(mrt, mifi);
954 return mr_mfc_find_any(mrt, mifi, &arg);
660b26dc
ND
955}
956
87c418bf
YM
957/* Look for a (S,G,iif) entry if parent != -1 */
958static struct mfc6_cache *
b70432f7 959ip6mr_cache_find_parent(struct mr_table *mrt,
87c418bf
YM
960 const struct in6_addr *origin,
961 const struct in6_addr *mcastgrp,
962 int parent)
963{
964 struct mfc6_cache_cmp_arg arg = {
965 .mf6c_origin = *origin,
966 .mf6c_mcastgrp = *mcastgrp,
967 };
87c418bf 968
845c9a7a 969 return mr_mfc_find_parent(mrt, &arg, parent);
87c418bf
YM
970}
971
845c9a7a 972/* Allocate a multicast cache entry */
b5aa30b1 973static struct mfc6_cache *ip6mr_cache_alloc(void)
7bc570c8 974{
36cbac59 975 struct mfc6_cache *c = kmem_cache_zalloc(mrt_cachep, GFP_KERNEL);
63159f29 976 if (!c)
7bc570c8 977 return NULL;
494fff56
YM
978 c->_c.mfc_un.res.last_assert = jiffies - MFC_ASSERT_THRESH - 1;
979 c->_c.mfc_un.res.minvif = MAXMIFS;
8c13af2a
YM
980 c->_c.free = ip6mr_cache_free_rcu;
981 refcount_set(&c->_c.mfc_un.res.refcount, 1);
7bc570c8
YH
982 return c;
983}
984
b5aa30b1 985static struct mfc6_cache *ip6mr_cache_alloc_unres(void)
7bc570c8 986{
36cbac59 987 struct mfc6_cache *c = kmem_cache_zalloc(mrt_cachep, GFP_ATOMIC);
63159f29 988 if (!c)
7bc570c8 989 return NULL;
494fff56
YM
990 skb_queue_head_init(&c->_c.mfc_un.unres.unresolved);
991 c->_c.mfc_un.unres.expires = jiffies + 10 * HZ;
7bc570c8
YH
992 return c;
993}
994
995/*
996 * A cache entry has gone into a resolved state from queued
997 */
998
b70432f7 999static void ip6mr_cache_resolve(struct net *net, struct mr_table *mrt,
6bd52143 1000 struct mfc6_cache *uc, struct mfc6_cache *c)
7bc570c8
YH
1001{
1002 struct sk_buff *skb;
1003
1004 /*
1005 * Play the pending entries through our router
1006 */
1007
494fff56 1008 while ((skb = __skb_dequeue(&uc->_c.mfc_un.unres.unresolved))) {
7bc570c8 1009 if (ipv6_hdr(skb)->version == 0) {
af72868b
JB
1010 struct nlmsghdr *nlh = skb_pull(skb,
1011 sizeof(struct ipv6hdr));
7bc570c8 1012
7b0db857
YM
1013 if (mr_fill_mroute(mrt, skb, &c->_c,
1014 nlmsg_data(nlh)) > 0) {
549e028d 1015 nlh->nlmsg_len = skb_tail_pointer(skb) - (u8 *)nlh;
7bc570c8
YH
1016 } else {
1017 nlh->nlmsg_type = NLMSG_ERROR;
573ce260 1018 nlh->nlmsg_len = nlmsg_msg_size(sizeof(struct nlmsgerr));
7bc570c8 1019 skb_trim(skb, nlh->nlmsg_len);
573ce260 1020 ((struct nlmsgerr *)nlmsg_data(nlh))->error = -EMSGSIZE;
7bc570c8 1021 }
15e47304 1022 rtnl_unicast(skb, net, NETLINK_CB(skb).portid);
7bc570c8 1023 } else
e4a38c0c 1024 ip6_mr_forward(net, mrt, skb->dev, skb, c);
7bc570c8
YH
1025 }
1026}
1027
1028/*
dd12d15c 1029 * Bounce a cache query up to pim6sd and netlink.
7bc570c8
YH
1030 *
1031 * Called under mrt_lock.
1032 */
1033
b70432f7 1034static int ip6mr_cache_report(struct mr_table *mrt, struct sk_buff *pkt,
6bd52143 1035 mifi_t mifi, int assert)
7bc570c8 1036{
8571ab47 1037 struct sock *mroute6_sk;
7bc570c8
YH
1038 struct sk_buff *skb;
1039 struct mrt6msg *msg;
1040 int ret;
1041
14fb64e1
YH
1042#ifdef CONFIG_IPV6_PIMSM_V2
1043 if (assert == MRT6MSG_WHOLEPKT)
1044 skb = skb_realloc_headroom(pkt, -skb_network_offset(pkt)
1045 +sizeof(*msg));
1046 else
1047#endif
1048 skb = alloc_skb(sizeof(struct ipv6hdr) + sizeof(*msg), GFP_ATOMIC);
7bc570c8
YH
1049
1050 if (!skb)
1051 return -ENOBUFS;
1052
1053 /* I suppose that internal messages
1054 * do not require checksums */
1055
1056 skb->ip_summed = CHECKSUM_UNNECESSARY;
1057
14fb64e1
YH
1058#ifdef CONFIG_IPV6_PIMSM_V2
1059 if (assert == MRT6MSG_WHOLEPKT) {
1060 /* Ugly, but we have no choice with this interface.
1061 Duplicate old header, fix length etc.
1062 And all this only to mangle msg->im6_msgtype and
1063 to set msg->im6_mbz to "mbz" :-)
1064 */
1065 skb_push(skb, -skb_network_offset(pkt));
1066
1067 skb_push(skb, sizeof(*msg));
1068 skb_reset_transport_header(skb);
1069 msg = (struct mrt6msg *)skb_transport_header(skb);
1070 msg->im6_mbz = 0;
1071 msg->im6_msgtype = MRT6MSG_WHOLEPKT;
6bd52143 1072 msg->im6_mif = mrt->mroute_reg_vif_num;
14fb64e1 1073 msg->im6_pad = 0;
4e3fd7a0
AD
1074 msg->im6_src = ipv6_hdr(pkt)->saddr;
1075 msg->im6_dst = ipv6_hdr(pkt)->daddr;
14fb64e1
YH
1076
1077 skb->ip_summed = CHECKSUM_UNNECESSARY;
1078 } else
1079#endif
1080 {
7bc570c8
YH
1081 /*
1082 * Copy the IP header
1083 */
1084
1085 skb_put(skb, sizeof(struct ipv6hdr));
1086 skb_reset_network_header(skb);
1087 skb_copy_to_linear_data(skb, ipv6_hdr(pkt), sizeof(struct ipv6hdr));
1088
1089 /*
1090 * Add our header
1091 */
1092 skb_put(skb, sizeof(*msg));
1093 skb_reset_transport_header(skb);
1094 msg = (struct mrt6msg *)skb_transport_header(skb);
1095
1096 msg->im6_mbz = 0;
1097 msg->im6_msgtype = assert;
6ac7eb08 1098 msg->im6_mif = mifi;
7bc570c8 1099 msg->im6_pad = 0;
4e3fd7a0
AD
1100 msg->im6_src = ipv6_hdr(pkt)->saddr;
1101 msg->im6_dst = ipv6_hdr(pkt)->daddr;
7bc570c8 1102
adf30907 1103 skb_dst_set(skb, dst_clone(skb_dst(pkt)));
7bc570c8 1104 skb->ip_summed = CHECKSUM_UNNECESSARY;
14fb64e1 1105 }
7bc570c8 1106
8571ab47 1107 rcu_read_lock();
b70432f7 1108 mroute6_sk = rcu_dereference(mrt->mroute_sk);
8571ab47
YM
1109 if (!mroute6_sk) {
1110 rcu_read_unlock();
7bc570c8
YH
1111 kfree_skb(skb);
1112 return -EINVAL;
1113 }
1114
dd12d15c
JG
1115 mrt6msg_netlink_event(mrt, skb);
1116
8571ab47
YM
1117 /* Deliver to user space multicast routing algorithms */
1118 ret = sock_queue_rcv_skb(mroute6_sk, skb);
1119 rcu_read_unlock();
bd91b8bf 1120 if (ret < 0) {
e87cc472 1121 net_warn_ratelimited("mroute6: pending queue full, dropping entries\n");
7bc570c8
YH
1122 kfree_skb(skb);
1123 }
1124
1125 return ret;
1126}
1127
494fff56
YM
1128/* Queue a packet for resolution. It gets locked cache entry! */
1129static int ip6mr_cache_unresolved(struct mr_table *mrt, mifi_t mifi,
e4a38c0c 1130 struct sk_buff *skb, struct net_device *dev)
7bc570c8 1131{
494fff56 1132 struct mfc6_cache *c;
f30a7784 1133 bool found = false;
7bc570c8 1134 int err;
7bc570c8
YH
1135
1136 spin_lock_bh(&mfc_unres_lock);
494fff56 1137 list_for_each_entry(c, &mrt->mfc_unres_queue, _c.list) {
c476efbc 1138 if (ipv6_addr_equal(&c->mf6c_mcastgrp, &ipv6_hdr(skb)->daddr) &&
f30a7784
PM
1139 ipv6_addr_equal(&c->mf6c_origin, &ipv6_hdr(skb)->saddr)) {
1140 found = true;
7bc570c8 1141 break;
f30a7784 1142 }
7bc570c8
YH
1143 }
1144
f30a7784 1145 if (!found) {
7bc570c8
YH
1146 /*
1147 * Create a new entry if allowable
1148 */
1149
0079ad8e
HL
1150 c = ip6mr_cache_alloc_unres();
1151 if (!c) {
7bc570c8
YH
1152 spin_unlock_bh(&mfc_unres_lock);
1153
1154 kfree_skb(skb);
1155 return -ENOBUFS;
1156 }
1157
494fff56
YM
1158 /* Fill in the new cache entry */
1159 c->_c.mfc_parent = -1;
7bc570c8
YH
1160 c->mf6c_origin = ipv6_hdr(skb)->saddr;
1161 c->mf6c_mcastgrp = ipv6_hdr(skb)->daddr;
1162
1163 /*
1164 * Reflect first query at pim6sd
1165 */
6bd52143 1166 err = ip6mr_cache_report(mrt, skb, mifi, MRT6MSG_NOCACHE);
8229efda 1167 if (err < 0) {
7bc570c8
YH
1168 /* If the report failed throw the cache entry
1169 out - Brad Parker
1170 */
1171 spin_unlock_bh(&mfc_unres_lock);
1172
58701ad4 1173 ip6mr_cache_free(c);
7bc570c8
YH
1174 kfree_skb(skb);
1175 return err;
1176 }
1177
6bd52143 1178 atomic_inc(&mrt->cache_resolve_queue_len);
494fff56 1179 list_add(&c->_c.list, &mrt->mfc_unres_queue);
812e44dd 1180 mr6_netlink_event(mrt, c, RTM_NEWROUTE);
7bc570c8 1181
6bd52143 1182 ipmr_do_expire_process(mrt);
7bc570c8
YH
1183 }
1184
494fff56
YM
1185 /* See if we can append the packet */
1186 if (c->_c.mfc_un.unres.unresolved.qlen > 3) {
7bc570c8
YH
1187 kfree_skb(skb);
1188 err = -ENOBUFS;
1189 } else {
e4a38c0c
PR
1190 if (dev) {
1191 skb->dev = dev;
1192 skb->skb_iif = dev->ifindex;
1193 }
494fff56 1194 skb_queue_tail(&c->_c.mfc_un.unres.unresolved, skb);
7bc570c8
YH
1195 err = 0;
1196 }
1197
1198 spin_unlock_bh(&mfc_unres_lock);
1199 return err;
1200}
1201
1202/*
1203 * MFC6 cache manipulation by user space
1204 */
1205
b70432f7 1206static int ip6mr_mfc_delete(struct mr_table *mrt, struct mf6cctl *mfc,
660b26dc 1207 int parent)
7bc570c8 1208{
87c418bf 1209 struct mfc6_cache *c;
7bc570c8 1210
87c418bf
YM
1211 /* The entries are added/deleted only under RTNL */
1212 rcu_read_lock();
1213 c = ip6mr_cache_find_parent(mrt, &mfc->mf6cc_origin.sin6_addr,
1214 &mfc->mf6cc_mcastgrp.sin6_addr, parent);
1215 rcu_read_unlock();
1216 if (!c)
1217 return -ENOENT;
494fff56
YM
1218 rhltable_remove(&mrt->mfc_hash, &c->_c.mnode, ip6mr_rht_params);
1219 list_del_rcu(&c->_c.list);
7bc570c8 1220
088aa3ee
YM
1221 call_ip6mr_mfc_entry_notifiers(read_pnet(&mrt->net),
1222 FIB_EVENT_ENTRY_DEL, c, mrt->id);
87c418bf 1223 mr6_netlink_event(mrt, c, RTM_DELROUTE);
8c13af2a 1224 mr_cache_put(&c->_c);
87c418bf 1225 return 0;
7bc570c8
YH
1226}
1227
1228static int ip6mr_device_event(struct notifier_block *this,
1229 unsigned long event, void *ptr)
1230{
351638e7 1231 struct net_device *dev = netdev_notifier_info_to_dev(ptr);
8229efda 1232 struct net *net = dev_net(dev);
b70432f7 1233 struct mr_table *mrt;
6853f21f 1234 struct vif_device *v;
7bc570c8
YH
1235 int ct;
1236
7bc570c8
YH
1237 if (event != NETDEV_UNREGISTER)
1238 return NOTIFY_DONE;
1239
d1db275d 1240 ip6mr_for_each_table(mrt, net) {
b70432f7 1241 v = &mrt->vif_table[0];
d1db275d
PM
1242 for (ct = 0; ct < mrt->maxvif; ct++, v++) {
1243 if (v->dev == dev)
723b929c 1244 mif6_delete(mrt, ct, 1, NULL);
d1db275d 1245 }
7bc570c8 1246 }
c871e664 1247
7bc570c8
YH
1248 return NOTIFY_DONE;
1249}
1250
088aa3ee
YM
1251static unsigned int ip6mr_seq_read(struct net *net)
1252{
1253 ASSERT_RTNL();
1254
1255 return net->ipv6.ipmr_seq + ip6mr_rules_seq_read(net);
1256}
1257
b7a59557
JP
1258static int ip6mr_dump(struct net *net, struct notifier_block *nb,
1259 struct netlink_ext_ack *extack)
088aa3ee
YM
1260{
1261 return mr_dump(net, nb, RTNL_FAMILY_IP6MR, ip6mr_rules_dump,
b7a59557 1262 ip6mr_mr_table_iter, &mrt_lock, extack);
088aa3ee
YM
1263}
1264
7bc570c8
YH
1265static struct notifier_block ip6_mr_notifier = {
1266 .notifier_call = ip6mr_device_event
1267};
1268
088aa3ee
YM
1269static const struct fib_notifier_ops ip6mr_notifier_ops_template = {
1270 .family = RTNL_FAMILY_IP6MR,
1271 .fib_seq_read = ip6mr_seq_read,
1272 .fib_dump = ip6mr_dump,
1273 .owner = THIS_MODULE,
1274};
1275
1276static int __net_init ip6mr_notifier_init(struct net *net)
1277{
1278 struct fib_notifier_ops *ops;
1279
1280 net->ipv6.ipmr_seq = 0;
7bc570c8 1281
088aa3ee
YM
1282 ops = fib_notifier_ops_register(&ip6mr_notifier_ops_template, net);
1283 if (IS_ERR(ops))
1284 return PTR_ERR(ops);
1285
1286 net->ipv6.ip6mr_notifier_ops = ops;
1287
1288 return 0;
1289}
1290
1291static void __net_exit ip6mr_notifier_exit(struct net *net)
1292{
1293 fib_notifier_ops_unregister(net->ipv6.ip6mr_notifier_ops);
1294 net->ipv6.ip6mr_notifier_ops = NULL;
1295}
1296
1297/* Setup for IP multicast routing */
4e16880c
BT
1298static int __net_init ip6mr_net_init(struct net *net)
1299{
d1db275d 1300 int err;
f30a7784 1301
088aa3ee
YM
1302 err = ip6mr_notifier_init(net);
1303 if (err)
1304 return err;
1305
d1db275d
PM
1306 err = ip6mr_rules_init(net);
1307 if (err < 0)
088aa3ee 1308 goto ip6mr_rules_fail;
8b90fc7e
BT
1309
1310#ifdef CONFIG_PROC_FS
1311 err = -ENOMEM;
c3506372
CH
1312 if (!proc_create_net("ip6_mr_vif", 0, net->proc_net, &ip6mr_vif_seq_ops,
1313 sizeof(struct mr_vif_iter)))
8b90fc7e 1314 goto proc_vif_fail;
c3506372
CH
1315 if (!proc_create_net("ip6_mr_cache", 0, net->proc_net, &ipmr_mfc_seq_ops,
1316 sizeof(struct mr_mfc_iter)))
8b90fc7e
BT
1317 goto proc_cache_fail;
1318#endif
6bd52143 1319
4a6258a0
BT
1320 return 0;
1321
8b90fc7e
BT
1322#ifdef CONFIG_PROC_FS
1323proc_cache_fail:
ece31ffd 1324 remove_proc_entry("ip6_mr_vif", net->proc_net);
8b90fc7e 1325proc_vif_fail:
d1db275d 1326 ip6mr_rules_exit(net);
8b90fc7e 1327#endif
088aa3ee
YM
1328ip6mr_rules_fail:
1329 ip6mr_notifier_exit(net);
4e16880c
BT
1330 return err;
1331}
1332
1333static void __net_exit ip6mr_net_exit(struct net *net)
1334{
8b90fc7e 1335#ifdef CONFIG_PROC_FS
ece31ffd
G
1336 remove_proc_entry("ip6_mr_cache", net->proc_net);
1337 remove_proc_entry("ip6_mr_vif", net->proc_net);
8b90fc7e 1338#endif
d1db275d 1339 ip6mr_rules_exit(net);
088aa3ee 1340 ip6mr_notifier_exit(net);
4e16880c
BT
1341}
1342
1343static struct pernet_operations ip6mr_net_ops = {
1344 .init = ip6mr_net_init,
1345 .exit = ip6mr_net_exit,
1346};
1347
623d1a1a 1348int __init ip6_mr_init(void)
7bc570c8 1349{
623d1a1a
WC
1350 int err;
1351
7bc570c8
YH
1352 mrt_cachep = kmem_cache_create("ip6_mrt_cache",
1353 sizeof(struct mfc6_cache),
1354 0, SLAB_HWCACHE_ALIGN,
1355 NULL);
1356 if (!mrt_cachep)
623d1a1a 1357 return -ENOMEM;
7bc570c8 1358
4e16880c
BT
1359 err = register_pernet_subsys(&ip6mr_net_ops);
1360 if (err)
1361 goto reg_pernet_fail;
1362
623d1a1a
WC
1363 err = register_netdevice_notifier(&ip6_mr_notifier);
1364 if (err)
1365 goto reg_notif_fail;
403dbb97
TG
1366#ifdef CONFIG_IPV6_PIMSM_V2
1367 if (inet6_add_protocol(&pim6_protocol, IPPROTO_PIM) < 0) {
f3213831 1368 pr_err("%s: can't add PIM protocol\n", __func__);
403dbb97
TG
1369 err = -EAGAIN;
1370 goto add_proto_fail;
1371 }
1372#endif
a3fde2ad
FW
1373 err = rtnl_register_module(THIS_MODULE, RTNL_FAMILY_IP6MR, RTM_GETROUTE,
1374 NULL, ip6mr_rtm_dumproute, 0);
1375 if (err == 0)
1376 return 0;
1377
403dbb97 1378#ifdef CONFIG_IPV6_PIMSM_V2
a3fde2ad 1379 inet6_del_protocol(&pim6_protocol, IPPROTO_PIM);
403dbb97
TG
1380add_proto_fail:
1381 unregister_netdevice_notifier(&ip6_mr_notifier);
1382#endif
87b30a65 1383reg_notif_fail:
4e16880c
BT
1384 unregister_pernet_subsys(&ip6mr_net_ops);
1385reg_pernet_fail:
87b30a65 1386 kmem_cache_destroy(mrt_cachep);
623d1a1a 1387 return err;
7bc570c8
YH
1388}
1389
623d1a1a
WC
1390void ip6_mr_cleanup(void)
1391{
ffb1388a
DJ
1392 rtnl_unregister(RTNL_FAMILY_IP6MR, RTM_GETROUTE);
1393#ifdef CONFIG_IPV6_PIMSM_V2
1394 inet6_del_protocol(&pim6_protocol, IPPROTO_PIM);
1395#endif
623d1a1a 1396 unregister_netdevice_notifier(&ip6_mr_notifier);
4e16880c 1397 unregister_pernet_subsys(&ip6mr_net_ops);
623d1a1a
WC
1398 kmem_cache_destroy(mrt_cachep);
1399}
7bc570c8 1400
b70432f7 1401static int ip6mr_mfc_add(struct net *net, struct mr_table *mrt,
660b26dc 1402 struct mf6cctl *mfc, int mrtsock, int parent)
7bc570c8 1403{
6ac7eb08 1404 unsigned char ttls[MAXMIFS];
87c418bf 1405 struct mfc6_cache *uc, *c;
494fff56 1406 struct mr_mfc *_uc;
87c418bf
YM
1407 bool found;
1408 int i, err;
7bc570c8 1409
a50436f2
PM
1410 if (mfc->mf6cc_parent >= MAXMIFS)
1411 return -ENFILE;
1412
6ac7eb08
RR
1413 memset(ttls, 255, MAXMIFS);
1414 for (i = 0; i < MAXMIFS; i++) {
7bc570c8
YH
1415 if (IF_ISSET(i, &mfc->mf6cc_ifset))
1416 ttls[i] = 1;
7bc570c8
YH
1417 }
1418
87c418bf
YM
1419 /* The entries are added/deleted only under RTNL */
1420 rcu_read_lock();
1421 c = ip6mr_cache_find_parent(mrt, &mfc->mf6cc_origin.sin6_addr,
1422 &mfc->mf6cc_mcastgrp.sin6_addr, parent);
1423 rcu_read_unlock();
1424 if (c) {
7bc570c8 1425 write_lock_bh(&mrt_lock);
494fff56
YM
1426 c->_c.mfc_parent = mfc->mf6cc_parent;
1427 ip6mr_update_thresholds(mrt, &c->_c, ttls);
7bc570c8 1428 if (!mrtsock)
494fff56 1429 c->_c.mfc_flags |= MFC_STATIC;
7bc570c8 1430 write_unlock_bh(&mrt_lock);
088aa3ee
YM
1431 call_ip6mr_mfc_entry_notifiers(net, FIB_EVENT_ENTRY_REPLACE,
1432 c, mrt->id);
812e44dd 1433 mr6_netlink_event(mrt, c, RTM_NEWROUTE);
7bc570c8
YH
1434 return 0;
1435 }
1436
660b26dc
ND
1437 if (!ipv6_addr_any(&mfc->mf6cc_mcastgrp.sin6_addr) &&
1438 !ipv6_addr_is_multicast(&mfc->mf6cc_mcastgrp.sin6_addr))
7bc570c8
YH
1439 return -EINVAL;
1440
b5aa30b1 1441 c = ip6mr_cache_alloc();
63159f29 1442 if (!c)
7bc570c8
YH
1443 return -ENOMEM;
1444
1445 c->mf6c_origin = mfc->mf6cc_origin.sin6_addr;
1446 c->mf6c_mcastgrp = mfc->mf6cc_mcastgrp.sin6_addr;
494fff56
YM
1447 c->_c.mfc_parent = mfc->mf6cc_parent;
1448 ip6mr_update_thresholds(mrt, &c->_c, ttls);
7bc570c8 1449 if (!mrtsock)
494fff56 1450 c->_c.mfc_flags |= MFC_STATIC;
7bc570c8 1451
494fff56 1452 err = rhltable_insert_key(&mrt->mfc_hash, &c->cmparg, &c->_c.mnode,
87c418bf
YM
1453 ip6mr_rht_params);
1454 if (err) {
1455 pr_err("ip6mr: rhtable insert error %d\n", err);
1456 ip6mr_cache_free(c);
1457 return err;
1458 }
494fff56 1459 list_add_tail_rcu(&c->_c.list, &mrt->mfc_cache_list);
7bc570c8 1460
87c418bf
YM
1461 /* Check to see if we resolved a queued list. If so we
1462 * need to send on the frames and tidy up.
7bc570c8 1463 */
f30a7784 1464 found = false;
7bc570c8 1465 spin_lock_bh(&mfc_unres_lock);
494fff56
YM
1466 list_for_each_entry(_uc, &mrt->mfc_unres_queue, list) {
1467 uc = (struct mfc6_cache *)_uc;
c476efbc 1468 if (ipv6_addr_equal(&uc->mf6c_origin, &c->mf6c_origin) &&
7bc570c8 1469 ipv6_addr_equal(&uc->mf6c_mcastgrp, &c->mf6c_mcastgrp)) {
494fff56 1470 list_del(&_uc->list);
6bd52143 1471 atomic_dec(&mrt->cache_resolve_queue_len);
f30a7784 1472 found = true;
7bc570c8
YH
1473 break;
1474 }
1475 }
b70432f7 1476 if (list_empty(&mrt->mfc_unres_queue))
6bd52143 1477 del_timer(&mrt->ipmr_expire_timer);
7bc570c8
YH
1478 spin_unlock_bh(&mfc_unres_lock);
1479
f30a7784 1480 if (found) {
6bd52143 1481 ip6mr_cache_resolve(net, mrt, uc, c);
58701ad4 1482 ip6mr_cache_free(uc);
7bc570c8 1483 }
088aa3ee
YM
1484 call_ip6mr_mfc_entry_notifiers(net, FIB_EVENT_ENTRY_ADD,
1485 c, mrt->id);
812e44dd 1486 mr6_netlink_event(mrt, c, RTM_NEWROUTE);
7bc570c8
YH
1487 return 0;
1488}
1489
1490/*
1491 * Close the multicast socket, and clear the vif tables etc
1492 */
1493
ca8d4794 1494static void mroute_clean_tables(struct mr_table *mrt, int flags)
7bc570c8 1495{
494fff56 1496 struct mr_mfc *c, *tmp;
c871e664 1497 LIST_HEAD(list);
87c418bf 1498 int i;
7bc570c8 1499
87c418bf 1500 /* Shut down all active vif entries */
ca8d4794
CS
1501 if (flags & (MRT6_FLUSH_MIFS | MRT6_FLUSH_MIFS_STATIC)) {
1502 for (i = 0; i < mrt->maxvif; i++) {
1503 if (((mrt->vif_table[i].flags & VIFF_STATIC) &&
1504 !(flags & MRT6_FLUSH_MIFS_STATIC)) ||
1505 (!(mrt->vif_table[i].flags & VIFF_STATIC) && !(flags & MRT6_FLUSH_MIFS)))
1506 continue;
1507 mif6_delete(mrt, i, 0, &list);
1508 }
1509 unregister_netdevice_many(&list);
7bc570c8
YH
1510 }
1511
87c418bf 1512 /* Wipe the cache */
ca8d4794
CS
1513 if (flags & (MRT6_FLUSH_MFC | MRT6_FLUSH_MFC_STATIC)) {
1514 list_for_each_entry_safe(c, tmp, &mrt->mfc_cache_list, list) {
1515 if (((c->mfc_flags & MFC_STATIC) && !(flags & MRT6_FLUSH_MFC_STATIC)) ||
1516 (!(c->mfc_flags & MFC_STATIC) && !(flags & MRT6_FLUSH_MFC)))
1517 continue;
1518 rhltable_remove(&mrt->mfc_hash, &c->mnode, ip6mr_rht_params);
1519 list_del_rcu(&c->list);
1520 call_ip6mr_mfc_entry_notifiers(read_pnet(&mrt->net),
1521 FIB_EVENT_ENTRY_DEL,
1522 (struct mfc6_cache *)c, mrt->id);
1523 mr6_netlink_event(mrt, (struct mfc6_cache *)c, RTM_DELROUTE);
1524 mr_cache_put(c);
1525 }
7bc570c8
YH
1526 }
1527
ca8d4794
CS
1528 if (flags & MRT6_FLUSH_MFC) {
1529 if (atomic_read(&mrt->cache_resolve_queue_len) != 0) {
1530 spin_lock_bh(&mfc_unres_lock);
1531 list_for_each_entry_safe(c, tmp, &mrt->mfc_unres_queue, list) {
1532 list_del(&c->list);
1533 mr6_netlink_event(mrt, (struct mfc6_cache *)c,
1534 RTM_DELROUTE);
1535 ip6mr_destroy_unres(mrt, (struct mfc6_cache *)c);
1536 }
1537 spin_unlock_bh(&mfc_unres_lock);
7bc570c8 1538 }
7bc570c8
YH
1539 }
1540}
1541
b70432f7 1542static int ip6mr_sk_init(struct mr_table *mrt, struct sock *sk)
7bc570c8
YH
1543{
1544 int err = 0;
8229efda 1545 struct net *net = sock_net(sk);
7bc570c8
YH
1546
1547 rtnl_lock();
1548 write_lock_bh(&mrt_lock);
b70432f7 1549 if (rtnl_dereference(mrt->mroute_sk)) {
7bc570c8 1550 err = -EADDRINUSE;
8571ab47 1551 } else {
b70432f7 1552 rcu_assign_pointer(mrt->mroute_sk, sk);
a366e300 1553 sock_set_flag(sk, SOCK_RCU_FREE);
8571ab47 1554 net->ipv6.devconf_all->mc_forwarding++;
927265bc 1555 }
7bc570c8
YH
1556 write_unlock_bh(&mrt_lock);
1557
927265bc 1558 if (!err)
85b3daad
DA
1559 inet6_netconf_notify_devconf(net, RTM_NEWNETCONF,
1560 NETCONFA_MC_FORWARDING,
927265bc
ED
1561 NETCONFA_IFINDEX_ALL,
1562 net->ipv6.devconf_all);
7bc570c8
YH
1563 rtnl_unlock();
1564
1565 return err;
1566}
1567
1568int ip6mr_sk_done(struct sock *sk)
1569{
d1db275d 1570 int err = -EACCES;
8229efda 1571 struct net *net = sock_net(sk);
b70432f7 1572 struct mr_table *mrt;
7bc570c8 1573
338d182f
FR
1574 if (sk->sk_type != SOCK_RAW ||
1575 inet_sk(sk)->inet_num != IPPROTO_ICMPV6)
1576 return err;
1577
7bc570c8 1578 rtnl_lock();
d1db275d 1579 ip6mr_for_each_table(mrt, net) {
b70432f7 1580 if (sk == rtnl_dereference(mrt->mroute_sk)) {
d1db275d 1581 write_lock_bh(&mrt_lock);
b70432f7 1582 RCU_INIT_POINTER(mrt->mroute_sk, NULL);
a366e300
ED
1583 /* Note that mroute_sk had SOCK_RCU_FREE set,
1584 * so the RCU grace period before sk freeing
1585 * is guaranteed by sk_destruct()
1586 */
d1db275d 1587 net->ipv6.devconf_all->mc_forwarding--;
927265bc 1588 write_unlock_bh(&mrt_lock);
85b3daad 1589 inet6_netconf_notify_devconf(net, RTM_NEWNETCONF,
d67b8c61
ND
1590 NETCONFA_MC_FORWARDING,
1591 NETCONFA_IFINDEX_ALL,
1592 net->ipv6.devconf_all);
7bc570c8 1593
ca8d4794 1594 mroute_clean_tables(mrt, MRT6_FLUSH_MIFS | MRT6_FLUSH_MFC);
d1db275d
PM
1595 err = 0;
1596 break;
1597 }
1598 }
7bc570c8
YH
1599 rtnl_unlock();
1600
1601 return err;
1602}
1603
8571ab47 1604bool mroute6_is_socket(struct net *net, struct sk_buff *skb)
6bd52143 1605{
b70432f7 1606 struct mr_table *mrt;
4c9483b2 1607 struct flowi6 fl6 = {
e374c618 1608 .flowi6_iif = skb->skb_iif ? : LOOPBACK_IFINDEX,
4c9483b2
DM
1609 .flowi6_oif = skb->dev->ifindex,
1610 .flowi6_mark = skb->mark,
d1db275d
PM
1611 };
1612
4c9483b2 1613 if (ip6mr_fib_lookup(net, &fl6, &mrt) < 0)
d1db275d 1614 return NULL;
6bd52143 1615
b70432f7 1616 return rcu_access_pointer(mrt->mroute_sk);
6bd52143 1617}
8571ab47 1618EXPORT_SYMBOL(mroute6_is_socket);
6bd52143 1619
7bc570c8
YH
1620/*
1621 * Socket options and virtual interface manipulation. The whole
1622 * virtual interface system is a complete heap, but unfortunately
1623 * that's how BSD mrouted happens to think. Maybe one day with a proper
1624 * MOSPF/PIM router set up we can clean this up.
1625 */
1626
b43c6153
CH
1627int ip6_mroute_setsockopt(struct sock *sk, int optname, sockptr_t optval,
1628 unsigned int optlen)
7bc570c8 1629{
660b26dc 1630 int ret, parent = 0;
7bc570c8
YH
1631 struct mif6ctl vif;
1632 struct mf6cctl mfc;
1633 mifi_t mifi;
8229efda 1634 struct net *net = sock_net(sk);
b70432f7 1635 struct mr_table *mrt;
d1db275d 1636
99253eb7
XL
1637 if (sk->sk_type != SOCK_RAW ||
1638 inet_sk(sk)->inet_num != IPPROTO_ICMPV6)
1639 return -EOPNOTSUPP;
1640
d1db275d 1641 mrt = ip6mr_get_table(net, raw6_sk(sk)->ip6mr_table ? : RT6_TABLE_DFLT);
63159f29 1642 if (!mrt)
d1db275d 1643 return -ENOENT;
7bc570c8
YH
1644
1645 if (optname != MRT6_INIT) {
b70432f7 1646 if (sk != rcu_access_pointer(mrt->mroute_sk) &&
8571ab47 1647 !ns_capable(net->user_ns, CAP_NET_ADMIN))
7bc570c8
YH
1648 return -EACCES;
1649 }
1650
1651 switch (optname) {
1652 case MRT6_INIT:
7bc570c8
YH
1653 if (optlen < sizeof(int))
1654 return -EINVAL;
1655
6bd52143 1656 return ip6mr_sk_init(mrt, sk);
7bc570c8
YH
1657
1658 case MRT6_DONE:
1659 return ip6mr_sk_done(sk);
1660
1661 case MRT6_ADD_MIF:
1662 if (optlen < sizeof(vif))
1663 return -EINVAL;
b43c6153 1664 if (copy_from_sockptr(&vif, optval, sizeof(vif)))
7bc570c8 1665 return -EFAULT;
6ac7eb08 1666 if (vif.mif6c_mifi >= MAXMIFS)
7bc570c8
YH
1667 return -ENFILE;
1668 rtnl_lock();
8571ab47 1669 ret = mif6_add(net, mrt, &vif,
b70432f7 1670 sk == rtnl_dereference(mrt->mroute_sk));
7bc570c8
YH
1671 rtnl_unlock();
1672 return ret;
1673
1674 case MRT6_DEL_MIF:
1675 if (optlen < sizeof(mifi_t))
1676 return -EINVAL;
b43c6153 1677 if (copy_from_sockptr(&mifi, optval, sizeof(mifi_t)))
7bc570c8
YH
1678 return -EFAULT;
1679 rtnl_lock();
723b929c 1680 ret = mif6_delete(mrt, mifi, 0, NULL);
7bc570c8
YH
1681 rtnl_unlock();
1682 return ret;
1683
1684 /*
1685 * Manipulate the forwarding caches. These live
1686 * in a sort of kernel/user symbiosis.
1687 */
1688 case MRT6_ADD_MFC:
1689 case MRT6_DEL_MFC:
660b26dc 1690 parent = -1;
a8eceea8 1691 fallthrough;
660b26dc
ND
1692 case MRT6_ADD_MFC_PROXY:
1693 case MRT6_DEL_MFC_PROXY:
7bc570c8
YH
1694 if (optlen < sizeof(mfc))
1695 return -EINVAL;
b43c6153 1696 if (copy_from_sockptr(&mfc, optval, sizeof(mfc)))
7bc570c8 1697 return -EFAULT;
660b26dc
ND
1698 if (parent == 0)
1699 parent = mfc.mf6cc_parent;
7bc570c8 1700 rtnl_lock();
660b26dc
ND
1701 if (optname == MRT6_DEL_MFC || optname == MRT6_DEL_MFC_PROXY)
1702 ret = ip6mr_mfc_delete(mrt, &mfc, parent);
7bc570c8 1703 else
660b26dc 1704 ret = ip6mr_mfc_add(net, mrt, &mfc,
8571ab47 1705 sk ==
b70432f7 1706 rtnl_dereference(mrt->mroute_sk),
8571ab47 1707 parent);
7bc570c8
YH
1708 rtnl_unlock();
1709 return ret;
1710
ca8d4794
CS
1711 case MRT6_FLUSH:
1712 {
1713 int flags;
1714
1715 if (optlen != sizeof(flags))
1716 return -EINVAL;
b43c6153 1717 if (copy_from_sockptr(&flags, optval, sizeof(flags)))
ca8d4794
CS
1718 return -EFAULT;
1719 rtnl_lock();
1720 mroute_clean_tables(mrt, flags);
1721 rtnl_unlock();
1722 return 0;
1723 }
1724
14fb64e1
YH
1725 /*
1726 * Control PIM assert (to activate pim will activate assert)
1727 */
1728 case MRT6_ASSERT:
1729 {
1730 int v;
03f52a0a
JP
1731
1732 if (optlen != sizeof(v))
1733 return -EINVAL;
b43c6153 1734 if (copy_from_sockptr(&v, optval, sizeof(v)))
14fb64e1 1735 return -EFAULT;
53d6841d 1736 mrt->mroute_do_assert = v;
14fb64e1
YH
1737 return 0;
1738 }
1739
1740#ifdef CONFIG_IPV6_PIMSM_V2
1741 case MRT6_PIM:
1742 {
a9f83bf3 1743 int v;
03f52a0a
JP
1744
1745 if (optlen != sizeof(v))
1746 return -EINVAL;
b43c6153 1747 if (copy_from_sockptr(&v, optval, sizeof(v)))
14fb64e1
YH
1748 return -EFAULT;
1749 v = !!v;
1750 rtnl_lock();
1751 ret = 0;
6bd52143
PM
1752 if (v != mrt->mroute_do_pim) {
1753 mrt->mroute_do_pim = v;
1754 mrt->mroute_do_assert = v;
14fb64e1
YH
1755 }
1756 rtnl_unlock();
1757 return ret;
1758 }
1759
d1db275d
PM
1760#endif
1761#ifdef CONFIG_IPV6_MROUTE_MULTIPLE_TABLES
1762 case MRT6_TABLE:
1763 {
1764 u32 v;
1765
1766 if (optlen != sizeof(u32))
1767 return -EINVAL;
b43c6153 1768 if (copy_from_sockptr(&v, optval, sizeof(v)))
d1db275d 1769 return -EFAULT;
75356a81
DC
1770 /* "pim6reg%u" should not exceed 16 bytes (IFNAMSIZ) */
1771 if (v != RT_TABLE_DEFAULT && v >= 100000000)
1772 return -EINVAL;
b70432f7 1773 if (sk == rcu_access_pointer(mrt->mroute_sk))
d1db275d
PM
1774 return -EBUSY;
1775
1776 rtnl_lock();
1777 ret = 0;
e783bb00
SD
1778 mrt = ip6mr_new_table(net, v);
1779 if (IS_ERR(mrt))
1780 ret = PTR_ERR(mrt);
848235ed
SD
1781 else
1782 raw6_sk(sk)->ip6mr_table = v;
d1db275d
PM
1783 rtnl_unlock();
1784 return ret;
1785 }
14fb64e1 1786#endif
7bc570c8 1787 /*
7d120c55 1788 * Spurious command, or MRT6_VERSION which you cannot
7bc570c8
YH
1789 * set.
1790 */
1791 default:
1792 return -ENOPROTOOPT;
1793 }
1794}
1795
1796/*
1797 * Getsock opt support for the multicast routing system.
1798 */
1799
1800int ip6_mroute_getsockopt(struct sock *sk, int optname, char __user *optval,
1801 int __user *optlen)
1802{
1803 int olr;
1804 int val;
8229efda 1805 struct net *net = sock_net(sk);
b70432f7 1806 struct mr_table *mrt;
d1db275d 1807
99253eb7
XL
1808 if (sk->sk_type != SOCK_RAW ||
1809 inet_sk(sk)->inet_num != IPPROTO_ICMPV6)
1810 return -EOPNOTSUPP;
1811
d1db275d 1812 mrt = ip6mr_get_table(net, raw6_sk(sk)->ip6mr_table ? : RT6_TABLE_DFLT);
63159f29 1813 if (!mrt)
d1db275d 1814 return -ENOENT;
7bc570c8
YH
1815
1816 switch (optname) {
1817 case MRT6_VERSION:
1818 val = 0x0305;
1819 break;
14fb64e1
YH
1820#ifdef CONFIG_IPV6_PIMSM_V2
1821 case MRT6_PIM:
6bd52143 1822 val = mrt->mroute_do_pim;
14fb64e1
YH
1823 break;
1824#endif
1825 case MRT6_ASSERT:
6bd52143 1826 val = mrt->mroute_do_assert;
14fb64e1 1827 break;
7bc570c8
YH
1828 default:
1829 return -ENOPROTOOPT;
1830 }
1831
1832 if (get_user(olr, optlen))
1833 return -EFAULT;
1834
1835 olr = min_t(int, olr, sizeof(int));
1836 if (olr < 0)
1837 return -EINVAL;
1838
1839 if (put_user(olr, optlen))
1840 return -EFAULT;
1841 if (copy_to_user(optval, &val, olr))
1842 return -EFAULT;
1843 return 0;
1844}
1845
1846/*
1847 * The IP multicast ioctl support routines.
1848 */
1849
1850int ip6mr_ioctl(struct sock *sk, int cmd, void __user *arg)
1851{
1852 struct sioc_sg_req6 sr;
1853 struct sioc_mif_req6 vr;
6853f21f 1854 struct vif_device *vif;
7bc570c8 1855 struct mfc6_cache *c;
8229efda 1856 struct net *net = sock_net(sk);
b70432f7 1857 struct mr_table *mrt;
d1db275d
PM
1858
1859 mrt = ip6mr_get_table(net, raw6_sk(sk)->ip6mr_table ? : RT6_TABLE_DFLT);
63159f29 1860 if (!mrt)
d1db275d 1861 return -ENOENT;
7bc570c8
YH
1862
1863 switch (cmd) {
1864 case SIOCGETMIFCNT_IN6:
1865 if (copy_from_user(&vr, arg, sizeof(vr)))
1866 return -EFAULT;
6bd52143 1867 if (vr.mifi >= mrt->maxvif)
7bc570c8 1868 return -EINVAL;
69d2c867 1869 vr.mifi = array_index_nospec(vr.mifi, mrt->maxvif);
7bc570c8 1870 read_lock(&mrt_lock);
b70432f7
YM
1871 vif = &mrt->vif_table[vr.mifi];
1872 if (VIF_EXISTS(mrt, vr.mifi)) {
7bc570c8
YH
1873 vr.icount = vif->pkt_in;
1874 vr.ocount = vif->pkt_out;
1875 vr.ibytes = vif->bytes_in;
1876 vr.obytes = vif->bytes_out;
1877 read_unlock(&mrt_lock);
1878
1879 if (copy_to_user(arg, &vr, sizeof(vr)))
1880 return -EFAULT;
1881 return 0;
1882 }
1883 read_unlock(&mrt_lock);
1884 return -EADDRNOTAVAIL;
1885 case SIOCGETSGCNT_IN6:
1886 if (copy_from_user(&sr, arg, sizeof(sr)))
1887 return -EFAULT;
1888
87c418bf 1889 rcu_read_lock();
6bd52143 1890 c = ip6mr_cache_find(mrt, &sr.src.sin6_addr, &sr.grp.sin6_addr);
7bc570c8 1891 if (c) {
494fff56
YM
1892 sr.pktcnt = c->_c.mfc_un.res.pkt;
1893 sr.bytecnt = c->_c.mfc_un.res.bytes;
1894 sr.wrong_if = c->_c.mfc_un.res.wrong_if;
87c418bf 1895 rcu_read_unlock();
7bc570c8
YH
1896
1897 if (copy_to_user(arg, &sr, sizeof(sr)))
1898 return -EFAULT;
1899 return 0;
1900 }
87c418bf 1901 rcu_read_unlock();
7bc570c8
YH
1902 return -EADDRNOTAVAIL;
1903 default:
1904 return -ENOIOCTLCMD;
1905 }
1906}
1907
e2d57766
DM
1908#ifdef CONFIG_COMPAT
1909struct compat_sioc_sg_req6 {
1910 struct sockaddr_in6 src;
1911 struct sockaddr_in6 grp;
1912 compat_ulong_t pktcnt;
1913 compat_ulong_t bytecnt;
1914 compat_ulong_t wrong_if;
1915};
1916
1917struct compat_sioc_mif_req6 {
1918 mifi_t mifi;
1919 compat_ulong_t icount;
1920 compat_ulong_t ocount;
1921 compat_ulong_t ibytes;
1922 compat_ulong_t obytes;
1923};
1924
1925int ip6mr_compat_ioctl(struct sock *sk, unsigned int cmd, void __user *arg)
1926{
1927 struct compat_sioc_sg_req6 sr;
1928 struct compat_sioc_mif_req6 vr;
6853f21f 1929 struct vif_device *vif;
e2d57766
DM
1930 struct mfc6_cache *c;
1931 struct net *net = sock_net(sk);
b70432f7 1932 struct mr_table *mrt;
e2d57766
DM
1933
1934 mrt = ip6mr_get_table(net, raw6_sk(sk)->ip6mr_table ? : RT6_TABLE_DFLT);
63159f29 1935 if (!mrt)
e2d57766
DM
1936 return -ENOENT;
1937
1938 switch (cmd) {
1939 case SIOCGETMIFCNT_IN6:
1940 if (copy_from_user(&vr, arg, sizeof(vr)))
1941 return -EFAULT;
1942 if (vr.mifi >= mrt->maxvif)
1943 return -EINVAL;
69d2c867 1944 vr.mifi = array_index_nospec(vr.mifi, mrt->maxvif);
e2d57766 1945 read_lock(&mrt_lock);
b70432f7
YM
1946 vif = &mrt->vif_table[vr.mifi];
1947 if (VIF_EXISTS(mrt, vr.mifi)) {
e2d57766
DM
1948 vr.icount = vif->pkt_in;
1949 vr.ocount = vif->pkt_out;
1950 vr.ibytes = vif->bytes_in;
1951 vr.obytes = vif->bytes_out;
1952 read_unlock(&mrt_lock);
1953
1954 if (copy_to_user(arg, &vr, sizeof(vr)))
1955 return -EFAULT;
1956 return 0;
1957 }
1958 read_unlock(&mrt_lock);
1959 return -EADDRNOTAVAIL;
1960 case SIOCGETSGCNT_IN6:
1961 if (copy_from_user(&sr, arg, sizeof(sr)))
1962 return -EFAULT;
1963
87c418bf 1964 rcu_read_lock();
e2d57766
DM
1965 c = ip6mr_cache_find(mrt, &sr.src.sin6_addr, &sr.grp.sin6_addr);
1966 if (c) {
494fff56
YM
1967 sr.pktcnt = c->_c.mfc_un.res.pkt;
1968 sr.bytecnt = c->_c.mfc_un.res.bytes;
1969 sr.wrong_if = c->_c.mfc_un.res.wrong_if;
87c418bf 1970 rcu_read_unlock();
e2d57766
DM
1971
1972 if (copy_to_user(arg, &sr, sizeof(sr)))
1973 return -EFAULT;
1974 return 0;
1975 }
87c418bf 1976 rcu_read_unlock();
e2d57766
DM
1977 return -EADDRNOTAVAIL;
1978 default:
1979 return -ENOIOCTLCMD;
1980 }
1981}
1982#endif
7bc570c8 1983
0c4b51f0 1984static inline int ip6mr_forward2_finish(struct net *net, struct sock *sk, struct sk_buff *skb)
7bc570c8 1985{
87c11f1d
IS
1986 IP6_INC_STATS(net, ip6_dst_idev(skb_dst(skb)),
1987 IPSTATS_MIB_OUTFORWDATAGRAMS);
1988 IP6_ADD_STATS(net, ip6_dst_idev(skb_dst(skb)),
1989 IPSTATS_MIB_OUTOCTETS, skb->len);
13206b6b 1990 return dst_output(net, sk, skb);
7bc570c8
YH
1991}
1992
1993/*
1994 * Processing handlers for ip6mr_forward
1995 */
1996
b70432f7 1997static int ip6mr_forward2(struct net *net, struct mr_table *mrt,
f5c6dfde 1998 struct sk_buff *skb, int vifi)
7bc570c8
YH
1999{
2000 struct ipv6hdr *ipv6h;
b70432f7 2001 struct vif_device *vif = &mrt->vif_table[vifi];
7bc570c8
YH
2002 struct net_device *dev;
2003 struct dst_entry *dst;
4c9483b2 2004 struct flowi6 fl6;
7bc570c8 2005
63159f29 2006 if (!vif->dev)
7bc570c8
YH
2007 goto out_free;
2008
14fb64e1
YH
2009#ifdef CONFIG_IPV6_PIMSM_V2
2010 if (vif->flags & MIFF_REGISTER) {
2011 vif->pkt_out++;
2012 vif->bytes_out += skb->len;
dc58c78c
PE
2013 vif->dev->stats.tx_bytes += skb->len;
2014 vif->dev->stats.tx_packets++;
6bd52143 2015 ip6mr_cache_report(mrt, skb, vifi, MRT6MSG_WHOLEPKT);
8da73b73 2016 goto out_free;
14fb64e1
YH
2017 }
2018#endif
2019
7bc570c8
YH
2020 ipv6h = ipv6_hdr(skb);
2021
4c9483b2
DM
2022 fl6 = (struct flowi6) {
2023 .flowi6_oif = vif->link,
2024 .daddr = ipv6h->daddr,
7bc570c8
YH
2025 };
2026
4c9483b2 2027 dst = ip6_route_output(net, NULL, &fl6);
5095d64d
RL
2028 if (dst->error) {
2029 dst_release(dst);
7bc570c8 2030 goto out_free;
5095d64d 2031 }
7bc570c8 2032
adf30907
ED
2033 skb_dst_drop(skb);
2034 skb_dst_set(skb, dst);
7bc570c8
YH
2035
2036 /*
2037 * RFC1584 teaches, that DVMRP/PIM router must deliver packets locally
2038 * not only before forwarding, but after forwarding on all output
2039 * interfaces. It is clear, if mrouter runs a multicasting
2040 * program, it should receive packets not depending to what interface
2041 * program is joined.
2042 * If we will not make it, the program will have to join on all
2043 * interfaces. On the other hand, multihoming host (or router, but
2044 * not mrouter) cannot join to more than one interface - it will
2045 * result in receiving multiple packets.
2046 */
2047 dev = vif->dev;
2048 skb->dev = dev;
2049 vif->pkt_out++;
2050 vif->bytes_out += skb->len;
2051
2052 /* We are about to write */
2053 /* XXX: extension headers? */
2054 if (skb_cow(skb, sizeof(*ipv6h) + LL_RESERVED_SPACE(dev)))
2055 goto out_free;
2056
2057 ipv6h = ipv6_hdr(skb);
2058 ipv6h->hop_limit--;
2059
2060 IP6CB(skb)->flags |= IP6SKB_FORWARDED;
2061
29a26a56
EB
2062 return NF_HOOK(NFPROTO_IPV6, NF_INET_FORWARD,
2063 net, NULL, skb, skb->dev, dev,
7bc570c8
YH
2064 ip6mr_forward2_finish);
2065
2066out_free:
2067 kfree_skb(skb);
2068 return 0;
2069}
2070
b70432f7 2071static int ip6mr_find_vif(struct mr_table *mrt, struct net_device *dev)
7bc570c8
YH
2072{
2073 int ct;
6bd52143
PM
2074
2075 for (ct = mrt->maxvif - 1; ct >= 0; ct--) {
b70432f7 2076 if (mrt->vif_table[ct].dev == dev)
7bc570c8
YH
2077 break;
2078 }
2079 return ct;
2080}
2081
b70432f7 2082static void ip6_mr_forward(struct net *net, struct mr_table *mrt,
e4a38c0c
PR
2083 struct net_device *dev, struct sk_buff *skb,
2084 struct mfc6_cache *c)
7bc570c8
YH
2085{
2086 int psend = -1;
2087 int vif, ct;
e4a38c0c 2088 int true_vifi = ip6mr_find_vif(mrt, dev);
7bc570c8 2089
494fff56
YM
2090 vif = c->_c.mfc_parent;
2091 c->_c.mfc_un.res.pkt++;
2092 c->_c.mfc_un.res.bytes += skb->len;
2093 c->_c.mfc_un.res.lastuse = jiffies;
7bc570c8 2094
494fff56 2095 if (ipv6_addr_any(&c->mf6c_origin) && true_vifi >= 0) {
660b26dc
ND
2096 struct mfc6_cache *cache_proxy;
2097
40dc2ca3 2098 /* For an (*,G) entry, we only check that the incoming
660b26dc
ND
2099 * interface is part of the static tree.
2100 */
87c418bf 2101 rcu_read_lock();
845c9a7a 2102 cache_proxy = mr_mfc_find_any_parent(mrt, vif);
660b26dc 2103 if (cache_proxy &&
494fff56 2104 cache_proxy->_c.mfc_un.res.ttls[true_vifi] < 255) {
87c418bf 2105 rcu_read_unlock();
660b26dc 2106 goto forward;
87c418bf
YM
2107 }
2108 rcu_read_unlock();
660b26dc
ND
2109 }
2110
14fb64e1
YH
2111 /*
2112 * Wrong interface: drop packet and (maybe) send PIM assert.
2113 */
e4a38c0c 2114 if (mrt->vif_table[vif].dev != dev) {
494fff56 2115 c->_c.mfc_un.res.wrong_if++;
14fb64e1 2116
6bd52143 2117 if (true_vifi >= 0 && mrt->mroute_do_assert &&
14fb64e1
YH
2118 /* pimsm uses asserts, when switching from RPT to SPT,
2119 so that we cannot check that packet arrived on an oif.
2120 It is bad, but otherwise we would need to move pretty
2121 large chunk of pimd to kernel. Ough... --ANK
2122 */
6bd52143 2123 (mrt->mroute_do_pim ||
494fff56 2124 c->_c.mfc_un.res.ttls[true_vifi] < 255) &&
14fb64e1 2125 time_after(jiffies,
494fff56
YM
2126 c->_c.mfc_un.res.last_assert +
2127 MFC_ASSERT_THRESH)) {
2128 c->_c.mfc_un.res.last_assert = jiffies;
6bd52143 2129 ip6mr_cache_report(mrt, skb, true_vifi, MRT6MSG_WRONGMIF);
14fb64e1
YH
2130 }
2131 goto dont_forward;
2132 }
2133
660b26dc 2134forward:
b70432f7
YM
2135 mrt->vif_table[vif].pkt_in++;
2136 mrt->vif_table[vif].bytes_in += skb->len;
7bc570c8
YH
2137
2138 /*
2139 * Forward the frame
2140 */
494fff56
YM
2141 if (ipv6_addr_any(&c->mf6c_origin) &&
2142 ipv6_addr_any(&c->mf6c_mcastgrp)) {
660b26dc 2143 if (true_vifi >= 0 &&
494fff56 2144 true_vifi != c->_c.mfc_parent &&
660b26dc 2145 ipv6_hdr(skb)->hop_limit >
494fff56 2146 c->_c.mfc_un.res.ttls[c->_c.mfc_parent]) {
660b26dc
ND
2147 /* It's an (*,*) entry and the packet is not coming from
2148 * the upstream: forward the packet to the upstream
2149 * only.
2150 */
494fff56 2151 psend = c->_c.mfc_parent;
660b26dc
ND
2152 goto last_forward;
2153 }
2154 goto dont_forward;
2155 }
494fff56
YM
2156 for (ct = c->_c.mfc_un.res.maxvif - 1;
2157 ct >= c->_c.mfc_un.res.minvif; ct--) {
660b26dc 2158 /* For (*,G) entry, don't forward to the incoming interface */
494fff56
YM
2159 if ((!ipv6_addr_any(&c->mf6c_origin) || ct != true_vifi) &&
2160 ipv6_hdr(skb)->hop_limit > c->_c.mfc_un.res.ttls[ct]) {
7bc570c8
YH
2161 if (psend != -1) {
2162 struct sk_buff *skb2 = skb_clone(skb, GFP_ATOMIC);
2163 if (skb2)
f5c6dfde 2164 ip6mr_forward2(net, mrt, skb2, psend);
7bc570c8
YH
2165 }
2166 psend = ct;
2167 }
2168 }
660b26dc 2169last_forward:
7bc570c8 2170 if (psend != -1) {
f5c6dfde 2171 ip6mr_forward2(net, mrt, skb, psend);
2b52c3ad 2172 return;
7bc570c8
YH
2173 }
2174
14fb64e1 2175dont_forward:
7bc570c8 2176 kfree_skb(skb);
7bc570c8
YH
2177}
2178
2179
2180/*
2181 * Multicast packets for forwarding arrive here
2182 */
2183
2184int ip6_mr_input(struct sk_buff *skb)
2185{
2186 struct mfc6_cache *cache;
8229efda 2187 struct net *net = dev_net(skb->dev);
b70432f7 2188 struct mr_table *mrt;
4c9483b2
DM
2189 struct flowi6 fl6 = {
2190 .flowi6_iif = skb->dev->ifindex,
2191 .flowi6_mark = skb->mark,
d1db275d
PM
2192 };
2193 int err;
e4a38c0c
PR
2194 struct net_device *dev;
2195
2196 /* skb->dev passed in is the master dev for vrfs.
2197 * Get the proper interface that does have a vif associated with it.
2198 */
2199 dev = skb->dev;
2200 if (netif_is_l3_master(skb->dev)) {
2201 dev = dev_get_by_index_rcu(net, IPCB(skb)->iif);
2202 if (!dev) {
2203 kfree_skb(skb);
2204 return -ENODEV;
2205 }
2206 }
d1db275d 2207
4c9483b2 2208 err = ip6mr_fib_lookup(net, &fl6, &mrt);
2015de5f
BG
2209 if (err < 0) {
2210 kfree_skb(skb);
d1db275d 2211 return err;
2015de5f 2212 }
7bc570c8
YH
2213
2214 read_lock(&mrt_lock);
6bd52143 2215 cache = ip6mr_cache_find(mrt,
8229efda 2216 &ipv6_hdr(skb)->saddr, &ipv6_hdr(skb)->daddr);
63159f29 2217 if (!cache) {
e4a38c0c 2218 int vif = ip6mr_find_vif(mrt, dev);
660b26dc
ND
2219
2220 if (vif >= 0)
2221 cache = ip6mr_cache_find_any(mrt,
2222 &ipv6_hdr(skb)->daddr,
2223 vif);
2224 }
7bc570c8
YH
2225
2226 /*
2227 * No usable cache entry
2228 */
63159f29 2229 if (!cache) {
7bc570c8
YH
2230 int vif;
2231
e4a38c0c 2232 vif = ip6mr_find_vif(mrt, dev);
7bc570c8 2233 if (vif >= 0) {
e4a38c0c 2234 int err = ip6mr_cache_unresolved(mrt, vif, skb, dev);
7bc570c8
YH
2235 read_unlock(&mrt_lock);
2236
2237 return err;
2238 }
2239 read_unlock(&mrt_lock);
2240 kfree_skb(skb);
2241 return -ENODEV;
2242 }
2243
e4a38c0c 2244 ip6_mr_forward(net, mrt, dev, skb, cache);
7bc570c8
YH
2245
2246 read_unlock(&mrt_lock);
2247
2248 return 0;
2249}
2250
2cf75070 2251int ip6mr_get_route(struct net *net, struct sk_buff *skb, struct rtmsg *rtm,
fd61c6ba 2252 u32 portid)
7bc570c8
YH
2253{
2254 int err;
b70432f7 2255 struct mr_table *mrt;
7bc570c8 2256 struct mfc6_cache *cache;
adf30907 2257 struct rt6_info *rt = (struct rt6_info *)skb_dst(skb);
7bc570c8 2258
d1db275d 2259 mrt = ip6mr_get_table(net, RT6_TABLE_DFLT);
63159f29 2260 if (!mrt)
d1db275d
PM
2261 return -ENOENT;
2262
7bc570c8 2263 read_lock(&mrt_lock);
6bd52143 2264 cache = ip6mr_cache_find(mrt, &rt->rt6i_src.addr, &rt->rt6i_dst.addr);
660b26dc
ND
2265 if (!cache && skb->dev) {
2266 int vif = ip6mr_find_vif(mrt, skb->dev);
2267
2268 if (vif >= 0)
2269 cache = ip6mr_cache_find_any(mrt, &rt->rt6i_dst.addr,
2270 vif);
2271 }
7bc570c8
YH
2272
2273 if (!cache) {
2274 struct sk_buff *skb2;
2275 struct ipv6hdr *iph;
2276 struct net_device *dev;
2277 int vif;
2278
7bc570c8 2279 dev = skb->dev;
63159f29 2280 if (!dev || (vif = ip6mr_find_vif(mrt, dev)) < 0) {
7bc570c8
YH
2281 read_unlock(&mrt_lock);
2282 return -ENODEV;
2283 }
2284
2285 /* really correct? */
2286 skb2 = alloc_skb(sizeof(struct ipv6hdr), GFP_ATOMIC);
2287 if (!skb2) {
2288 read_unlock(&mrt_lock);
2289 return -ENOMEM;
2290 }
2291
2cf75070 2292 NETLINK_CB(skb2).portid = portid;
7bc570c8
YH
2293 skb_reset_transport_header(skb2);
2294
2295 skb_put(skb2, sizeof(struct ipv6hdr));
2296 skb_reset_network_header(skb2);
2297
2298 iph = ipv6_hdr(skb2);
2299 iph->version = 0;
2300 iph->priority = 0;
2301 iph->flow_lbl[0] = 0;
2302 iph->flow_lbl[1] = 0;
2303 iph->flow_lbl[2] = 0;
2304 iph->payload_len = 0;
2305 iph->nexthdr = IPPROTO_NONE;
2306 iph->hop_limit = 0;
4e3fd7a0
AD
2307 iph->saddr = rt->rt6i_src.addr;
2308 iph->daddr = rt->rt6i_dst.addr;
7bc570c8 2309
e4a38c0c 2310 err = ip6mr_cache_unresolved(mrt, vif, skb2, dev);
7bc570c8
YH
2311 read_unlock(&mrt_lock);
2312
2313 return err;
2314 }
2315
7b0db857 2316 err = mr_fill_mroute(mrt, skb, &cache->_c, rtm);
7bc570c8
YH
2317 read_unlock(&mrt_lock);
2318 return err;
2319}
2320
b70432f7 2321static int ip6mr_fill_mroute(struct mr_table *mrt, struct sk_buff *skb,
f518338b
ND
2322 u32 portid, u32 seq, struct mfc6_cache *c, int cmd,
2323 int flags)
5b285cac
PM
2324{
2325 struct nlmsghdr *nlh;
2326 struct rtmsg *rtm;
1eb99af5 2327 int err;
5b285cac 2328
f518338b 2329 nlh = nlmsg_put(skb, portid, seq, cmd, sizeof(*rtm), flags);
63159f29 2330 if (!nlh)
5b285cac
PM
2331 return -EMSGSIZE;
2332
2333 rtm = nlmsg_data(nlh);
193c1e47 2334 rtm->rtm_family = RTNL_FAMILY_IP6MR;
5b285cac
PM
2335 rtm->rtm_dst_len = 128;
2336 rtm->rtm_src_len = 128;
2337 rtm->rtm_tos = 0;
2338 rtm->rtm_table = mrt->id;
c78679e8
DM
2339 if (nla_put_u32(skb, RTA_TABLE, mrt->id))
2340 goto nla_put_failure;
1eb99af5 2341 rtm->rtm_type = RTN_MULTICAST;
5b285cac 2342 rtm->rtm_scope = RT_SCOPE_UNIVERSE;
494fff56 2343 if (c->_c.mfc_flags & MFC_STATIC)
9a68ac72
ND
2344 rtm->rtm_protocol = RTPROT_STATIC;
2345 else
2346 rtm->rtm_protocol = RTPROT_MROUTED;
5b285cac
PM
2347 rtm->rtm_flags = 0;
2348
930345ea
JB
2349 if (nla_put_in6_addr(skb, RTA_SRC, &c->mf6c_origin) ||
2350 nla_put_in6_addr(skb, RTA_DST, &c->mf6c_mcastgrp))
c78679e8 2351 goto nla_put_failure;
7b0db857 2352 err = mr_fill_mroute(mrt, skb, &c->_c, rtm);
1eb99af5
ND
2353 /* do not break the dump if cache is unresolved */
2354 if (err < 0 && err != -ENOENT)
5b285cac
PM
2355 goto nla_put_failure;
2356
053c095a
JB
2357 nlmsg_end(skb, nlh);
2358 return 0;
5b285cac
PM
2359
2360nla_put_failure:
2361 nlmsg_cancel(skb, nlh);
2362 return -EMSGSIZE;
2363}
2364
7b0db857
YM
2365static int _ip6mr_fill_mroute(struct mr_table *mrt, struct sk_buff *skb,
2366 u32 portid, u32 seq, struct mr_mfc *c,
2367 int cmd, int flags)
2368{
2369 return ip6mr_fill_mroute(mrt, skb, portid, seq, (struct mfc6_cache *)c,
2370 cmd, flags);
2371}
2372
812e44dd
ND
2373static int mr6_msgsize(bool unresolved, int maxvif)
2374{
2375 size_t len =
2376 NLMSG_ALIGN(sizeof(struct rtmsg))
2377 + nla_total_size(4) /* RTA_TABLE */
2378 + nla_total_size(sizeof(struct in6_addr)) /* RTA_SRC */
2379 + nla_total_size(sizeof(struct in6_addr)) /* RTA_DST */
2380 ;
2381
2382 if (!unresolved)
2383 len = len
2384 + nla_total_size(4) /* RTA_IIF */
2385 + nla_total_size(0) /* RTA_MULTIPATH */
2386 + maxvif * NLA_ALIGN(sizeof(struct rtnexthop))
2387 /* RTA_MFC_STATS */
3d6b66c1 2388 + nla_total_size_64bit(sizeof(struct rta_mfc_stats))
812e44dd
ND
2389 ;
2390
2391 return len;
2392}
2393
b70432f7 2394static void mr6_netlink_event(struct mr_table *mrt, struct mfc6_cache *mfc,
812e44dd
ND
2395 int cmd)
2396{
2397 struct net *net = read_pnet(&mrt->net);
2398 struct sk_buff *skb;
2399 int err = -ENOBUFS;
2400
494fff56 2401 skb = nlmsg_new(mr6_msgsize(mfc->_c.mfc_parent >= MAXMIFS, mrt->maxvif),
812e44dd 2402 GFP_ATOMIC);
63159f29 2403 if (!skb)
812e44dd
ND
2404 goto errout;
2405
f518338b 2406 err = ip6mr_fill_mroute(mrt, skb, 0, 0, mfc, cmd, 0);
812e44dd
ND
2407 if (err < 0)
2408 goto errout;
2409
2410 rtnl_notify(skb, net, 0, RTNLGRP_IPV6_MROUTE, NULL, GFP_ATOMIC);
2411 return;
2412
2413errout:
2414 kfree_skb(skb);
2415 if (err < 0)
2416 rtnl_set_sk_err(net, RTNLGRP_IPV6_MROUTE, err);
2417}
2418
dd12d15c
JG
2419static size_t mrt6msg_netlink_msgsize(size_t payloadlen)
2420{
2421 size_t len =
2422 NLMSG_ALIGN(sizeof(struct rtgenmsg))
2423 + nla_total_size(1) /* IP6MRA_CREPORT_MSGTYPE */
2424 + nla_total_size(4) /* IP6MRA_CREPORT_MIF_ID */
2425 /* IP6MRA_CREPORT_SRC_ADDR */
2426 + nla_total_size(sizeof(struct in6_addr))
2427 /* IP6MRA_CREPORT_DST_ADDR */
2428 + nla_total_size(sizeof(struct in6_addr))
2429 /* IP6MRA_CREPORT_PKT */
2430 + nla_total_size(payloadlen)
2431 ;
2432
2433 return len;
2434}
2435
b70432f7 2436static void mrt6msg_netlink_event(struct mr_table *mrt, struct sk_buff *pkt)
dd12d15c
JG
2437{
2438 struct net *net = read_pnet(&mrt->net);
2439 struct nlmsghdr *nlh;
2440 struct rtgenmsg *rtgenm;
2441 struct mrt6msg *msg;
2442 struct sk_buff *skb;
2443 struct nlattr *nla;
2444 int payloadlen;
2445
2446 payloadlen = pkt->len - sizeof(struct mrt6msg);
2447 msg = (struct mrt6msg *)skb_transport_header(pkt);
2448
2449 skb = nlmsg_new(mrt6msg_netlink_msgsize(payloadlen), GFP_ATOMIC);
2450 if (!skb)
2451 goto errout;
2452
2453 nlh = nlmsg_put(skb, 0, 0, RTM_NEWCACHEREPORT,
2454 sizeof(struct rtgenmsg), 0);
2455 if (!nlh)
2456 goto errout;
2457 rtgenm = nlmsg_data(nlh);
2458 rtgenm->rtgen_family = RTNL_FAMILY_IP6MR;
2459 if (nla_put_u8(skb, IP6MRA_CREPORT_MSGTYPE, msg->im6_msgtype) ||
2460 nla_put_u32(skb, IP6MRA_CREPORT_MIF_ID, msg->im6_mif) ||
2461 nla_put_in6_addr(skb, IP6MRA_CREPORT_SRC_ADDR,
2462 &msg->im6_src) ||
2463 nla_put_in6_addr(skb, IP6MRA_CREPORT_DST_ADDR,
2464 &msg->im6_dst))
2465 goto nla_put_failure;
2466
2467 nla = nla_reserve(skb, IP6MRA_CREPORT_PKT, payloadlen);
2468 if (!nla || skb_copy_bits(pkt, sizeof(struct mrt6msg),
2469 nla_data(nla), payloadlen))
2470 goto nla_put_failure;
2471
2472 nlmsg_end(skb, nlh);
2473
2474 rtnl_notify(skb, net, 0, RTNLGRP_IPV6_MROUTE_R, NULL, GFP_ATOMIC);
2475 return;
2476
2477nla_put_failure:
2478 nlmsg_cancel(skb, nlh);
2479errout:
2480 kfree_skb(skb);
2481 rtnl_set_sk_err(net, RTNLGRP_IPV6_MROUTE_R, -ENOBUFS);
2482}
2483
5b285cac
PM
2484static int ip6mr_rtm_dumproute(struct sk_buff *skb, struct netlink_callback *cb)
2485{
e8ba330a 2486 const struct nlmsghdr *nlh = cb->nlh;
4724676d 2487 struct fib_dump_filter filter = {};
cb167893 2488 int err;
e8ba330a
DA
2489
2490 if (cb->strict_check) {
4724676d 2491 err = ip_valid_fib_dump_req(sock_net(skb->sk), nlh,
effe6792 2492 &filter, cb);
e8ba330a
DA
2493 if (err < 0)
2494 return err;
2495 }
2496
cb167893
DA
2497 if (filter.table_id) {
2498 struct mr_table *mrt;
2499
2500 mrt = ip6mr_get_table(sock_net(skb->sk), filter.table_id);
2501 if (!mrt) {
41b4bd98 2502 if (rtnl_msg_family(cb->nlh) != RTNL_FAMILY_IP6MR)
ae677bbb
DA
2503 return skb->len;
2504
cb167893
DA
2505 NL_SET_ERR_MSG_MOD(cb->extack, "MR table does not exist");
2506 return -ENOENT;
2507 }
2508 err = mr_table_dump(mrt, skb, cb, _ip6mr_fill_mroute,
2509 &mfc_unres_lock, &filter);
2510 return skb->len ? : err;
2511 }
2512
7b0db857 2513 return mr_rtm_dumproute(skb, cb, ip6mr_mr_table_iter,
cb167893 2514 _ip6mr_fill_mroute, &mfc_unres_lock, &filter);
5b285cac 2515}