inet: frag: move evictor calls into frag_find function
[linux-2.6-block.git] / net / ieee802154 / reassembly.c
CommitLineData
7240cdec
AA
1/* 6LoWPAN fragment reassembly
2 *
3 *
4 * Authors:
5 * Alexander Aring <aar@pengutronix.de>
6 *
7 * Based on: net/ipv6/reassembly.c
8 *
9 * This program is free software; you can redistribute it and/or
10 * modify it under the terms of the GNU General Public License
11 * as published by the Free Software Foundation; either version
12 * 2 of the License, or (at your option) any later version.
13 */
14
15#define pr_fmt(fmt) "6LoWPAN: " fmt
16
17#include <linux/net.h>
18#include <linux/list.h>
19#include <linux/netdevice.h>
20#include <linux/random.h>
21#include <linux/jhash.h>
22#include <linux/skbuff.h>
23#include <linux/slab.h>
24#include <linux/export.h>
25
26#include <net/ieee802154_netdev.h>
cefc8c8a 27#include <net/6lowpan.h>
7240cdec
AA
28#include <net/ipv6.h>
29#include <net/inet_frag.h>
30
7240cdec
AA
31#include "reassembly.h"
32
a13061ec
PB
33struct lowpan_frag_info {
34 __be16 d_tag;
35 u16 d_size;
36 u8 d_offset;
37};
38
94716d2f 39static struct lowpan_frag_info *lowpan_cb(struct sk_buff *skb)
a13061ec
PB
40{
41 return (struct lowpan_frag_info *)skb->cb;
42}
43
7240cdec
AA
44static struct inet_frags lowpan_frags;
45
46static int lowpan_frag_reasm(struct lowpan_frag_queue *fq,
47 struct sk_buff *prev, struct net_device *dev);
48
4c7f778e 49static unsigned int lowpan_hash_frag(__be16 tag, u16 d_size,
ae531b94
PB
50 const struct ieee802154_addr *saddr,
51 const struct ieee802154_addr *daddr)
7240cdec 52{
7240cdec 53 net_get_random_once(&lowpan_frags.rnd, sizeof(lowpan_frags.rnd));
fb3cfe6e
FW
54 return jhash_3words(ieee802154_addr_hash(saddr),
55 ieee802154_addr_hash(daddr),
56 (__force u32)(tag + (d_size << 16)),
57 lowpan_frags.rnd);
7240cdec
AA
58}
59
36c77782 60static unsigned int lowpan_hashfn(const struct inet_frag_queue *q)
7240cdec 61{
36c77782 62 const struct lowpan_frag_queue *fq;
7240cdec
AA
63
64 fq = container_of(q, struct lowpan_frag_queue, q);
65 return lowpan_hash_frag(fq->tag, fq->d_size, &fq->saddr, &fq->daddr);
66}
67
36c77782 68static bool lowpan_frag_match(const struct inet_frag_queue *q, const void *a)
7240cdec 69{
36c77782
FW
70 const struct lowpan_frag_queue *fq;
71 const struct lowpan_create_arg *arg = a;
7240cdec
AA
72
73 fq = container_of(q, struct lowpan_frag_queue, q);
74 return fq->tag == arg->tag && fq->d_size == arg->d_size &&
ae531b94
PB
75 ieee802154_addr_equal(&fq->saddr, arg->src) &&
76 ieee802154_addr_equal(&fq->daddr, arg->dst);
7240cdec 77}
7240cdec 78
36c77782 79static void lowpan_frag_init(struct inet_frag_queue *q, const void *a)
7240cdec 80{
36c77782 81 const struct lowpan_create_arg *arg = a;
7240cdec 82 struct lowpan_frag_queue *fq;
7240cdec
AA
83
84 fq = container_of(q, struct lowpan_frag_queue, q);
85
86 fq->tag = arg->tag;
87 fq->d_size = arg->d_size;
88 fq->saddr = *arg->src;
89 fq->daddr = *arg->dst;
90}
7240cdec
AA
91
92static void lowpan_frag_expire(unsigned long data)
93{
94 struct frag_queue *fq;
95 struct net *net;
96
97 fq = container_of((struct inet_frag_queue *)data, struct frag_queue, q);
98 net = container_of(fq->q.net, struct net, ieee802154_lowpan.frags);
99
17794326
FW
100 spin_lock(&fq->q.lock);
101
102 if (fq->q.last_in & INET_FRAG_COMPLETE)
103 goto out;
104
105 inet_frag_kill(&fq->q, &lowpan_frags);
106out:
107 spin_unlock(&fq->q.lock);
108 inet_frag_put(&fq->q, &lowpan_frags);
7240cdec
AA
109}
110
111static inline struct lowpan_frag_queue *
a13061ec 112fq_find(struct net *net, const struct lowpan_frag_info *frag_info,
ae531b94
PB
113 const struct ieee802154_addr *src,
114 const struct ieee802154_addr *dst)
7240cdec
AA
115{
116 struct inet_frag_queue *q;
117 struct lowpan_create_arg arg;
118 unsigned int hash;
599018a7
LR
119 struct netns_ieee802154_lowpan *ieee802154_lowpan =
120 net_ieee802154_lowpan(net);
7240cdec
AA
121
122 arg.tag = frag_info->d_tag;
123 arg.d_size = frag_info->d_size;
124 arg.src = src;
125 arg.dst = dst;
126
127 read_lock(&lowpan_frags.lock);
128 hash = lowpan_hash_frag(frag_info->d_tag, frag_info->d_size, src, dst);
129
599018a7 130 q = inet_frag_find(&ieee802154_lowpan->frags,
7240cdec
AA
131 &lowpan_frags, &arg, hash);
132 if (IS_ERR_OR_NULL(q)) {
133 inet_frag_maybe_warn_overflow(q, pr_fmt());
134 return NULL;
135 }
136 return container_of(q, struct lowpan_frag_queue, q);
137}
138
139static int lowpan_frag_queue(struct lowpan_frag_queue *fq,
140 struct sk_buff *skb, const u8 frag_type)
141{
142 struct sk_buff *prev, *next;
143 struct net_device *dev;
144 int end, offset;
145
146 if (fq->q.last_in & INET_FRAG_COMPLETE)
147 goto err;
148
a13061ec
PB
149 offset = lowpan_cb(skb)->d_offset << 3;
150 end = lowpan_cb(skb)->d_size;
7240cdec
AA
151
152 /* Is this the final fragment? */
153 if (offset + skb->len == end) {
154 /* If we already have some bits beyond end
155 * or have different end, the segment is corrupted.
156 */
157 if (end < fq->q.len ||
158 ((fq->q.last_in & INET_FRAG_LAST_IN) && end != fq->q.len))
159 goto err;
160 fq->q.last_in |= INET_FRAG_LAST_IN;
161 fq->q.len = end;
162 } else {
163 if (end > fq->q.len) {
164 /* Some bits beyond end -> corruption. */
165 if (fq->q.last_in & INET_FRAG_LAST_IN)
166 goto err;
167 fq->q.len = end;
168 }
169 }
170
171 /* Find out which fragments are in front and at the back of us
172 * in the chain of fragments so far. We must know where to put
173 * this fragment, right?
174 */
175 prev = fq->q.fragments_tail;
a13061ec 176 if (!prev || lowpan_cb(prev)->d_offset < lowpan_cb(skb)->d_offset) {
7240cdec
AA
177 next = NULL;
178 goto found;
179 }
180 prev = NULL;
181 for (next = fq->q.fragments; next != NULL; next = next->next) {
a13061ec 182 if (lowpan_cb(next)->d_offset >= lowpan_cb(skb)->d_offset)
7240cdec
AA
183 break; /* bingo! */
184 prev = next;
185 }
186
187found:
188 /* Insert this fragment in the chain of fragments. */
189 skb->next = next;
190 if (!next)
191 fq->q.fragments_tail = skb;
192 if (prev)
193 prev->next = skb;
194 else
195 fq->q.fragments = skb;
196
197 dev = skb->dev;
198 if (dev)
199 skb->dev = NULL;
200
201 fq->q.stamp = skb->tstamp;
202 if (frag_type == LOWPAN_DISPATCH_FRAG1) {
203 /* Calculate uncomp. 6lowpan header to estimate full size */
204 fq->q.meat += lowpan_uncompress_size(skb, NULL);
205 fq->q.last_in |= INET_FRAG_FIRST_IN;
206 } else {
207 fq->q.meat += skb->len;
208 }
209 add_frag_mem_limit(&fq->q, skb->truesize);
210
211 if (fq->q.last_in == (INET_FRAG_FIRST_IN | INET_FRAG_LAST_IN) &&
212 fq->q.meat == fq->q.len) {
213 int res;
214 unsigned long orefdst = skb->_skb_refdst;
215
216 skb->_skb_refdst = 0UL;
217 res = lowpan_frag_reasm(fq, prev, dev);
218 skb->_skb_refdst = orefdst;
219 return res;
220 }
221
222 inet_frag_lru_move(&fq->q);
223 return -1;
224err:
225 kfree_skb(skb);
226 return -1;
227}
228
229/* Check if this packet is complete.
230 * Returns NULL on failure by any reason, and pointer
231 * to current nexthdr field in reassembled frame.
232 *
233 * It is called with locked fq, and caller must check that
234 * queue is eligible for reassembly i.e. it is not COMPLETE,
235 * the last and the first frames arrived and all the bits are here.
236 */
237static int lowpan_frag_reasm(struct lowpan_frag_queue *fq, struct sk_buff *prev,
238 struct net_device *dev)
239{
240 struct sk_buff *fp, *head = fq->q.fragments;
241 int sum_truesize;
242
243 inet_frag_kill(&fq->q, &lowpan_frags);
244
245 /* Make the one we just received the head. */
246 if (prev) {
247 head = prev->next;
248 fp = skb_clone(head, GFP_ATOMIC);
249
250 if (!fp)
251 goto out_oom;
252
253 fp->next = head->next;
254 if (!fp->next)
255 fq->q.fragments_tail = fp;
256 prev->next = fp;
257
258 skb_morph(head, fq->q.fragments);
259 head->next = fq->q.fragments->next;
260
261 consume_skb(fq->q.fragments);
262 fq->q.fragments = head;
263 }
264
265 /* Head of list must not be cloned. */
266 if (skb_unclone(head, GFP_ATOMIC))
267 goto out_oom;
268
269 /* If the first fragment is fragmented itself, we split
270 * it to two chunks: the first with data and paged part
271 * and the second, holding only fragments.
272 */
273 if (skb_has_frag_list(head)) {
274 struct sk_buff *clone;
275 int i, plen = 0;
276
277 clone = alloc_skb(0, GFP_ATOMIC);
278 if (!clone)
279 goto out_oom;
280 clone->next = head->next;
281 head->next = clone;
282 skb_shinfo(clone)->frag_list = skb_shinfo(head)->frag_list;
283 skb_frag_list_init(head);
284 for (i = 0; i < skb_shinfo(head)->nr_frags; i++)
285 plen += skb_frag_size(&skb_shinfo(head)->frags[i]);
286 clone->len = head->data_len - plen;
287 clone->data_len = clone->len;
288 head->data_len -= clone->len;
289 head->len -= clone->len;
290 add_frag_mem_limit(&fq->q, clone->truesize);
291 }
292
293 WARN_ON(head == NULL);
294
295 sum_truesize = head->truesize;
296 for (fp = head->next; fp;) {
297 bool headstolen;
298 int delta;
299 struct sk_buff *next = fp->next;
300
301 sum_truesize += fp->truesize;
302 if (skb_try_coalesce(head, fp, &headstolen, &delta)) {
303 kfree_skb_partial(fp, headstolen);
304 } else {
305 if (!skb_shinfo(head)->frag_list)
306 skb_shinfo(head)->frag_list = fp;
307 head->data_len += fp->len;
308 head->len += fp->len;
309 head->truesize += fp->truesize;
310 }
311 fp = next;
312 }
313 sub_frag_mem_limit(&fq->q, sum_truesize);
314
315 head->next = NULL;
316 head->dev = dev;
317 head->tstamp = fq->q.stamp;
318
319 fq->q.fragments = NULL;
320 fq->q.fragments_tail = NULL;
321
322 return 1;
323out_oom:
324 net_dbg_ratelimited("lowpan_frag_reasm: no memory for reassembly\n");
325 return -1;
326}
327
328static int lowpan_get_frag_info(struct sk_buff *skb, const u8 frag_type,
a13061ec 329 struct lowpan_frag_info *frag_info)
7240cdec
AA
330{
331 bool fail;
332 u8 pattern = 0, low = 0;
333
334 fail = lowpan_fetch_skb(skb, &pattern, 1);
335 fail |= lowpan_fetch_skb(skb, &low, 1);
336 frag_info->d_size = (pattern & 7) << 8 | low;
337 fail |= lowpan_fetch_skb(skb, &frag_info->d_tag, 2);
338
339 if (frag_type == LOWPAN_DISPATCH_FRAGN) {
340 fail |= lowpan_fetch_skb(skb, &frag_info->d_offset, 1);
341 } else {
342 skb_reset_network_header(skb);
343 frag_info->d_offset = 0;
344 }
345
346 if (unlikely(fail))
347 return -EIO;
348
349 return 0;
350}
351
352int lowpan_frag_rcv(struct sk_buff *skb, const u8 frag_type)
353{
354 struct lowpan_frag_queue *fq;
355 struct net *net = dev_net(skb->dev);
a13061ec 356 struct lowpan_frag_info *frag_info = lowpan_cb(skb);
ae531b94 357 struct ieee802154_addr source, dest;
599018a7
LR
358 struct netns_ieee802154_lowpan *ieee802154_lowpan =
359 net_ieee802154_lowpan(net);
7240cdec
AA
360 int err;
361
ae531b94
PB
362 source = mac_cb(skb)->source;
363 dest = mac_cb(skb)->dest;
364
7240cdec
AA
365 err = lowpan_get_frag_info(skb, frag_type, frag_info);
366 if (err < 0)
367 goto err;
368
599018a7 369 if (frag_info->d_size > ieee802154_lowpan->max_dsize)
7240cdec
AA
370 goto err;
371
ae531b94 372 fq = fq_find(net, frag_info, &source, &dest);
7240cdec
AA
373 if (fq != NULL) {
374 int ret;
4710d806 375
7240cdec
AA
376 spin_lock(&fq->q.lock);
377 ret = lowpan_frag_queue(fq, skb, frag_type);
378 spin_unlock(&fq->q.lock);
379
380 inet_frag_put(&fq->q, &lowpan_frags);
381 return ret;
382 }
383
384err:
385 kfree_skb(skb);
386 return -1;
387}
388EXPORT_SYMBOL(lowpan_frag_rcv);
389
390#ifdef CONFIG_SYSCTL
391static struct ctl_table lowpan_frags_ns_ctl_table[] = {
392 {
393 .procname = "6lowpanfrag_high_thresh",
394 .data = &init_net.ieee802154_lowpan.frags.high_thresh,
395 .maxlen = sizeof(int),
396 .mode = 0644,
397 .proc_handler = proc_dointvec
398 },
399 {
400 .procname = "6lowpanfrag_low_thresh",
401 .data = &init_net.ieee802154_lowpan.frags.low_thresh,
402 .maxlen = sizeof(int),
403 .mode = 0644,
404 .proc_handler = proc_dointvec
405 },
406 {
407 .procname = "6lowpanfrag_time",
408 .data = &init_net.ieee802154_lowpan.frags.timeout,
409 .maxlen = sizeof(int),
410 .mode = 0644,
411 .proc_handler = proc_dointvec_jiffies,
412 },
413 {
414 .procname = "6lowpanfrag_max_datagram_size",
415 .data = &init_net.ieee802154_lowpan.max_dsize,
416 .maxlen = sizeof(int),
417 .mode = 0644,
418 .proc_handler = proc_dointvec
419 },
420 { }
421};
422
423static struct ctl_table lowpan_frags_ctl_table[] = {
424 {
425 .procname = "6lowpanfrag_secret_interval",
426 .data = &lowpan_frags.secret_interval,
427 .maxlen = sizeof(int),
428 .mode = 0644,
429 .proc_handler = proc_dointvec_jiffies,
430 },
431 { }
432};
433
434static int __net_init lowpan_frags_ns_sysctl_register(struct net *net)
435{
436 struct ctl_table *table;
437 struct ctl_table_header *hdr;
599018a7
LR
438 struct netns_ieee802154_lowpan *ieee802154_lowpan =
439 net_ieee802154_lowpan(net);
7240cdec
AA
440
441 table = lowpan_frags_ns_ctl_table;
442 if (!net_eq(net, &init_net)) {
443 table = kmemdup(table, sizeof(lowpan_frags_ns_ctl_table),
444 GFP_KERNEL);
445 if (table == NULL)
446 goto err_alloc;
447
599018a7
LR
448 table[0].data = &ieee802154_lowpan->frags.high_thresh;
449 table[1].data = &ieee802154_lowpan->frags.low_thresh;
450 table[2].data = &ieee802154_lowpan->frags.timeout;
451 table[3].data = &ieee802154_lowpan->max_dsize;
7240cdec
AA
452
453 /* Don't export sysctls to unprivileged users */
454 if (net->user_ns != &init_user_ns)
455 table[0].procname = NULL;
456 }
457
458 hdr = register_net_sysctl(net, "net/ieee802154/6lowpan", table);
459 if (hdr == NULL)
460 goto err_reg;
461
599018a7 462 ieee802154_lowpan->sysctl.frags_hdr = hdr;
7240cdec
AA
463 return 0;
464
465err_reg:
466 if (!net_eq(net, &init_net))
467 kfree(table);
468err_alloc:
469 return -ENOMEM;
470}
471
472static void __net_exit lowpan_frags_ns_sysctl_unregister(struct net *net)
473{
474 struct ctl_table *table;
599018a7
LR
475 struct netns_ieee802154_lowpan *ieee802154_lowpan =
476 net_ieee802154_lowpan(net);
7240cdec 477
599018a7
LR
478 table = ieee802154_lowpan->sysctl.frags_hdr->ctl_table_arg;
479 unregister_net_sysctl_table(ieee802154_lowpan->sysctl.frags_hdr);
7240cdec
AA
480 if (!net_eq(net, &init_net))
481 kfree(table);
482}
483
484static struct ctl_table_header *lowpan_ctl_header;
485
486static int lowpan_frags_sysctl_register(void)
487{
488 lowpan_ctl_header = register_net_sysctl(&init_net,
489 "net/ieee802154/6lowpan",
490 lowpan_frags_ctl_table);
491 return lowpan_ctl_header == NULL ? -ENOMEM : 0;
492}
493
494static void lowpan_frags_sysctl_unregister(void)
495{
496 unregister_net_sysctl_table(lowpan_ctl_header);
497}
498#else
/* !CONFIG_SYSCTL stub: nothing to register, always reports success. */
static inline int lowpan_frags_ns_sysctl_register(struct net *net)
{
	return 0;
}
503
/* !CONFIG_SYSCTL stub: nothing was registered, so nothing to undo. */
static inline void lowpan_frags_ns_sysctl_unregister(struct net *net)
{
}
507
/* !CONFIG_SYSCTL stub: nothing to register, always reports success. */
static inline int lowpan_frags_sysctl_register(void)
{
	return 0;
}
512
/* !CONFIG_SYSCTL stub: nothing was registered, so nothing to undo. */
static inline void lowpan_frags_sysctl_unregister(void)
{
}
516#endif
517
518static int __net_init lowpan_frags_init_net(struct net *net)
519{
599018a7
LR
520 struct netns_ieee802154_lowpan *ieee802154_lowpan =
521 net_ieee802154_lowpan(net);
7240cdec 522
599018a7
LR
523 ieee802154_lowpan->frags.high_thresh = IPV6_FRAG_HIGH_THRESH;
524 ieee802154_lowpan->frags.low_thresh = IPV6_FRAG_LOW_THRESH;
525 ieee802154_lowpan->frags.timeout = IPV6_FRAG_TIMEOUT;
526 ieee802154_lowpan->max_dsize = 0xFFFF;
527
528 inet_frags_init_net(&ieee802154_lowpan->frags);
7240cdec
AA
529
530 return lowpan_frags_ns_sysctl_register(net);
531}
532
533static void __net_exit lowpan_frags_exit_net(struct net *net)
534{
599018a7
LR
535 struct netns_ieee802154_lowpan *ieee802154_lowpan =
536 net_ieee802154_lowpan(net);
537
7240cdec 538 lowpan_frags_ns_sysctl_unregister(net);
599018a7 539 inet_frags_exit_net(&ieee802154_lowpan->frags, &lowpan_frags);
7240cdec
AA
540}
541
542static struct pernet_operations lowpan_frags_ops = {
543 .init = lowpan_frags_init_net,
544 .exit = lowpan_frags_exit_net,
545};
546
547int __init lowpan_net_frag_init(void)
548{
549 int ret;
550
551 ret = lowpan_frags_sysctl_register();
552 if (ret)
37147652 553 return ret;
7240cdec
AA
554
555 ret = register_pernet_subsys(&lowpan_frags_ops);
556 if (ret)
557 goto err_pernet;
558
559 lowpan_frags.hashfn = lowpan_hashfn;
560 lowpan_frags.constructor = lowpan_frag_init;
561 lowpan_frags.destructor = NULL;
562 lowpan_frags.skb_free = NULL;
563 lowpan_frags.qsize = sizeof(struct frag_queue);
564 lowpan_frags.match = lowpan_frag_match;
565 lowpan_frags.frag_expire = lowpan_frag_expire;
566 lowpan_frags.secret_interval = 10 * 60 * HZ;
567 inet_frags_init(&lowpan_frags);
37147652
AA
568
569 return ret;
7240cdec
AA
570err_pernet:
571 lowpan_frags_sysctl_unregister();
7240cdec
AA
572 return ret;
573}
574
575void lowpan_net_frag_exit(void)
576{
577 inet_frags_fini(&lowpan_frags);
578 lowpan_frags_sysctl_unregister();
579 unregister_pernet_subsys(&lowpan_frags_ops);
580}