Merge branch 'asoc-4.19' into asoc-linus
[linux-2.6-block.git] / net / xfrm / xfrm_input.c
CommitLineData
b2441318 1// SPDX-License-Identifier: GPL-2.0
1da177e4
LT
2/*
3 * xfrm_input.c
4 *
5 * Changes:
6 * YOSHIFUJI Hideaki @USAGI
7 * Split up af-specific portion
a716c119 8 *
1da177e4
LT
9 */
10
acf568ee 11#include <linux/bottom_half.h>
f8c3d0dd 12#include <linux/cache.h>
acf568ee 13#include <linux/interrupt.h>
1da177e4
LT
14#include <linux/slab.h>
15#include <linux/module.h>
716062fd 16#include <linux/netdevice.h>
acf568ee 17#include <linux/percpu.h>
716062fd 18#include <net/dst.h>
1da177e4
LT
19#include <net/ip.h>
20#include <net/xfrm.h>
049f8e2e
AD
21#include <net/ip_tunnels.h>
22#include <net/ip6_tunnel.h>
1da177e4 23
acf568ee
HX
/*
 * Deferred-reinjection context: a tasklet together with the queue of skbs
 * it drains.  One instance exists per CPU (see the DEFINE_PER_CPU below);
 * xfrm_trans_queue() appends to @queue and xfrm_trans_reinject() empties it.
 */
24struct xfrm_trans_tasklet {
25 struct tasklet_struct tasklet;
26 struct sk_buff_head queue;
27};
28
/*
 * Layout laid over skb->cb (via XFRM_TRANS_SKB_CB) while an skb waits on a
 * reinjection queue.  The leading union is sized for the IPv4/IPv6 skb
 * parameter blocks; @finish is the callback xfrm_trans_reinject() invokes.
 * NOTE(review): the union presumably exists so the IP control block already
 * stored at the start of skb->cb is not overwritten -- confirm.
 */
29struct xfrm_trans_cb {
9a3fb9fb
SK
30 union {
31 struct inet_skb_parm h4;
32#if IS_ENABLED(CONFIG_IPV6)
33 struct inet6_skb_parm h6;
34#endif
35 } header;
acf568ee
HX
36 int (*finish)(struct net *net, struct sock *sk, struct sk_buff *skb);
37};
38
/* Reinterpret the start of an skb's control buffer as struct xfrm_trans_cb. */
39#define XFRM_TRANS_SKB_CB(__skb) ((struct xfrm_trans_cb *)&((__skb)->cb[0]))
40
/* Slab cache backing struct sec_path; created in xfrm_input_init(). */
f8c3d0dd 41static struct kmem_cache *secpath_cachep __ro_after_init;
1da177e4 42
/* Serialises writers of xfrm_input_afinfo[]; readers go through RCU. */
2f32b51b 43static DEFINE_SPINLOCK(xfrm_input_afinfo_lock);
/* Registered per-family input handlers, indexed by family (0..AF_INET6). */
960fdfde 44static struct xfrm_input_afinfo const __rcu *xfrm_input_afinfo[AF_INET6 + 1];
2f32b51b 45
1995876a
SK
/*
 * GRO cells attached to a dummy net_device (set up in xfrm_input_init());
 * xfrm_input() hands packets to them with gro_cells_receive().
 */
46static struct gro_cells gro_cells;
47static struct net_device xfrm_napi_dev;
48
acf568ee
HX
/* Per-CPU reinjection tasklet + queue used by xfrm_trans_queue(). */
49static DEFINE_PER_CPU(struct xfrm_trans_tasklet, xfrm_trans_tasklet);
50
960fdfde 51int xfrm_input_register_afinfo(const struct xfrm_input_afinfo *afinfo)
2f32b51b
SK
52{
53 int err = 0;
54
960fdfde 55 if (WARN_ON(afinfo->family >= ARRAY_SIZE(xfrm_input_afinfo)))
2f32b51b 56 return -EAFNOSUPPORT;
960fdfde 57
2f32b51b
SK
58 spin_lock_bh(&xfrm_input_afinfo_lock);
59 if (unlikely(xfrm_input_afinfo[afinfo->family] != NULL))
f31e8d4f 60 err = -EEXIST;
2f32b51b
SK
61 else
62 rcu_assign_pointer(xfrm_input_afinfo[afinfo->family], afinfo);
63 spin_unlock_bh(&xfrm_input_afinfo_lock);
64 return err;
65}
66EXPORT_SYMBOL(xfrm_input_register_afinfo);
67
960fdfde 68int xfrm_input_unregister_afinfo(const struct xfrm_input_afinfo *afinfo)
2f32b51b
SK
69{
70 int err = 0;
71
2f32b51b
SK
72 spin_lock_bh(&xfrm_input_afinfo_lock);
73 if (likely(xfrm_input_afinfo[afinfo->family] != NULL)) {
74 if (unlikely(xfrm_input_afinfo[afinfo->family] != afinfo))
75 err = -EINVAL;
76 else
77 RCU_INIT_POINTER(xfrm_input_afinfo[afinfo->family], NULL);
78 }
79 spin_unlock_bh(&xfrm_input_afinfo_lock);
80 synchronize_rcu();
81 return err;
82}
83EXPORT_SYMBOL(xfrm_input_unregister_afinfo);
84
960fdfde 85static const struct xfrm_input_afinfo *xfrm_input_get_afinfo(unsigned int family)
2f32b51b 86{
960fdfde 87 const struct xfrm_input_afinfo *afinfo;
2f32b51b 88
960fdfde 89 if (WARN_ON_ONCE(family >= ARRAY_SIZE(xfrm_input_afinfo)))
2f32b51b 90 return NULL;
960fdfde 91
2f32b51b
SK
92 rcu_read_lock();
93 afinfo = rcu_dereference(xfrm_input_afinfo[family]);
94 if (unlikely(!afinfo))
95 rcu_read_unlock();
96 return afinfo;
97}
98
2f32b51b
SK
99static int xfrm_rcv_cb(struct sk_buff *skb, unsigned int family, u8 protocol,
100 int err)
101{
102 int ret;
960fdfde 103 const struct xfrm_input_afinfo *afinfo = xfrm_input_get_afinfo(family);
2f32b51b
SK
104
105 if (!afinfo)
106 return -EAFNOSUPPORT;
107
108 ret = afinfo->callback(skb, protocol, err);
960fdfde 109 rcu_read_unlock();
2f32b51b
SK
110
111 return ret;
112}
113
1da177e4
LT
114void __secpath_destroy(struct sec_path *sp)
115{
116 int i;
117 for (i = 0; i < sp->len; i++)
dbe5b4aa 118 xfrm_state_put(sp->xvec[i]);
1da177e4
LT
119 kmem_cache_free(secpath_cachep, sp);
120}
121EXPORT_SYMBOL(__secpath_destroy);
122
123struct sec_path *secpath_dup(struct sec_path *src)
124{
125 struct sec_path *sp;
126
54e6ecb2 127 sp = kmem_cache_alloc(secpath_cachep, GFP_ATOMIC);
1da177e4
LT
128 if (!sp)
129 return NULL;
130
131 sp->len = 0;
54ef207a
SK
132 sp->olen = 0;
133
d77e38e6
SK
134 memset(sp->ovec, 0, sizeof(sp->ovec[XFRM_MAX_OFFLOAD_DEPTH]));
135
1da177e4
LT
136 if (src) {
137 int i;
138
139 memcpy(sp, src, sizeof(*sp));
140 for (i = 0; i < sp->len; i++)
dbe5b4aa 141 xfrm_state_hold(sp->xvec[i]);
1da177e4 142 }
55eabed6 143 refcount_set(&sp->refcnt, 1);
1da177e4
LT
144 return sp;
145}
146EXPORT_SYMBOL(secpath_dup);
147
b0fcee82
SK
148int secpath_set(struct sk_buff *skb)
149{
150 struct sec_path *sp;
151
152 /* Allocate new secpath or COW existing one. */
55eabed6 153 if (!skb->sp || refcount_read(&skb->sp->refcnt) != 1) {
b0fcee82
SK
154 sp = secpath_dup(skb->sp);
155 if (!sp)
156 return -ENOMEM;
157
158 if (skb->sp)
159 secpath_put(skb->sp);
160 skb->sp = sp;
161 }
162 return 0;
163}
164EXPORT_SYMBOL(secpath_set);
165
1da177e4
LT
166/* Fetch spi and seq from ipsec header */
167
6067b2ba 168int xfrm_parse_spi(struct sk_buff *skb, u8 nexthdr, __be32 *spi, __be32 *seq)
1da177e4
LT
169{
170 int offset, offset_seq;
44072500 171 int hlen;
1da177e4
LT
172
173 switch (nexthdr) {
174 case IPPROTO_AH:
44072500 175 hlen = sizeof(struct ip_auth_hdr);
1da177e4
LT
176 offset = offsetof(struct ip_auth_hdr, spi);
177 offset_seq = offsetof(struct ip_auth_hdr, seq_no);
178 break;
179 case IPPROTO_ESP:
44072500 180 hlen = sizeof(struct ip_esp_hdr);
1da177e4
LT
181 offset = offsetof(struct ip_esp_hdr, spi);
182 offset_seq = offsetof(struct ip_esp_hdr, seq_no);
183 break;
184 case IPPROTO_COMP:
185 if (!pskb_may_pull(skb, sizeof(struct ip_comp_hdr)))
186 return -EINVAL;
3e94c2dc 187 *spi = htonl(ntohs(*(__be16 *)(skb_transport_header(skb) + 2)));
1da177e4
LT
188 *seq = 0;
189 return 0;
190 default:
191 return 1;
192 }
193
44072500 194 if (!pskb_may_pull(skb, hlen))
1da177e4
LT
195 return -EINVAL;
196
3e94c2dc
WC
197 *spi = *(__be32 *)(skb_transport_header(skb) + offset);
198 *seq = *(__be32 *)(skb_transport_header(skb) + offset_seq);
1da177e4
LT
199 return 0;
200}
1e295370 201EXPORT_SYMBOL(xfrm_parse_spi);
1da177e4 202
227620e2
HX
203int xfrm_prepare_input(struct xfrm_state *x, struct sk_buff *skb)
204{
df9dcb45 205 struct xfrm_mode *inner_mode = x->inner_mode;
227620e2
HX
206 int err;
207
208 err = x->outer_mode->afinfo->extract_input(x, skb);
209 if (err)
210 return err;
211
df9dcb45
KM
212 if (x->sel.family == AF_UNSPEC) {
213 inner_mode = xfrm_ip2inner_mode(x, XFRM_MODE_SKB_CB(skb)->protocol);
214 if (inner_mode == NULL)
215 return -EAFNOSUPPORT;
216 }
217
218 skb->protocol = inner_mode->afinfo->eth_proto;
219 return inner_mode->input2(x, skb);
227620e2
HX
220}
221EXPORT_SYMBOL(xfrm_prepare_input);
222
716062fd
HX
/*
 * xfrm_input - run an inbound skb through one or more xfrm states.
 * @skb: packet being processed
 * @nexthdr: protocol of the header SPI/seq are parsed from; the variable is
 *           afterwards reused for the return value of the type input handler
 * @spi: SPI to look up; when 0 it is parsed from the packet
 * @encap_type: a non-negative value is compared with the state's encap type;
 *              -1 resumes after asynchronous processing; other negative
 *              values are treated as a GRO call (see the comments below)
 *
 * Returns 0 when the skb was dropped and freed, when it was handed to
 * gro_cells_receive() after tunnel decapsulation, or when the type input
 * handler returned -EINPROGRESS.  Otherwise returns the result of the inner
 * mode's transport_finish().
 *
 * Note that both "lock" and "resume" are labels inside the do/while body
 * and are entered by goto from the encap_type < 0 block.
 */
223int xfrm_input(struct sk_buff *skb, int nexthdr, __be32 spi, int encap_type)
224{
bd235e3c 225 struct net *net = dev_net(skb->dev);
716062fd
HX
226 int err;
227 __be32 seq;
2cd08467 228 __be32 seq_hi;
3328715e 229 struct xfrm_state *x = NULL;
1bf06cd2 230 xfrm_address_t *daddr;
df9dcb45 231 struct xfrm_mode *inner_mode;
049f8e2e 232 u32 mark = skb->mark;
4ce3dbe3 233 unsigned int family = AF_UNSPEC;
716062fd 234 int decaps = 0;
1bf06cd2 235 int async = 0;
7785bba2 236 bool xfrm_gro = false;
d77e38e6
SK
237 bool crypto_done = false;
238 struct xfrm_offload *xo = xfrm_offload(skb);
1bf06cd2 239
/*
 * Negative encap_type: the state is taken from the skb instead of being
 * looked up, and the function jumps into the loop body further down.
 */
1bf06cd2 240 if (encap_type < 0) {
00501121 241 x = xfrm_input_state(skb);
4ce3dbe3
AH
242
243 if (unlikely(x->km.state != XFRM_STATE_VALID)) {
244 if (x->km.state == XFRM_STATE_ACQ)
245 XFRM_INC_STATS(net, LINUX_MIB_XFRMACQUIREERROR);
246 else
247 XFRM_INC_STATS(net,
248 LINUX_MIB_XFRMINSTATEINVALID);
249 goto drop;
250 }
251
3328715e 252 family = x->outer_mode->afinfo->family;
7785bba2
SK
253
254 /* An encap_type of -1 indicates async resumption. */
255 if (encap_type == -1) {
256 async = 1;
257 seq = XFRM_SKB_CB(skb)->seq.input.low;
258 goto resume;
259 }
bcd1f8a4 260
7785bba2
SK
261 /* encap_type < -1 indicates a GRO call. */
262 encap_type = 0;
263 seq = XFRM_SPI_SKB_CB(skb)->seq;
716062fd 264
/*
 * The offload flags report crypto as already done: map a failed status to
 * the matching statistic and drop, otherwise re-read SPI/seq from the packet.
 */
bcd1f8a4
SK
265 if (xo && (xo->flags & CRYPTO_DONE)) {
266 crypto_done = true;
bcd1f8a4
SK
267 family = XFRM_SPI_SKB_CB(skb)->family;
268
269 if (!(xo->status & CRYPTO_SUCCESS)) {
270 if (xo->status &
271 (CRYPTO_TRANSPORT_AH_AUTH_FAILED |
272 CRYPTO_TRANSPORT_ESP_AUTH_FAILED |
273 CRYPTO_TUNNEL_AH_AUTH_FAILED |
274 CRYPTO_TUNNEL_ESP_AUTH_FAILED)) {
275
276 xfrm_audit_state_icvfail(x, skb,
277 x->type->proto);
278 x->stats.integrity_failed++;
279 XFRM_INC_STATS(net, LINUX_MIB_XFRMINSTATEPROTOERROR);
280 goto drop;
281 }
282
47ebcc0b
YK
283 if (xo->status & CRYPTO_INVALID_PROTOCOL) {
284 XFRM_INC_STATS(net, LINUX_MIB_XFRMINSTATEPROTOERROR);
285 goto drop;
286 }
287
bcd1f8a4 288 XFRM_INC_STATS(net, LINUX_MIB_XFRMINBUFFERERROR);
d77e38e6
SK
289 goto drop;
290 }
291
bcd1f8a4
SK
292 if ((err = xfrm_parse_spi(skb, nexthdr, &spi, &seq)) != 0) {
293 XFRM_INC_STATS(net, LINUX_MIB_XFRMINHDRERROR);
294 goto drop;
295 }
d77e38e6
SK
296 }
297
/* State already known: skip the lookup and enter the loop at "lock". */
7785bba2 298 goto lock;
1bf06cd2 299 }
716062fd 300
3328715e
SK
301 family = XFRM_SPI_SKB_CB(skb)->family;
302
049f8e2e 303 /* if tunnel is present override skb->mark value with tunnel i_key */
1625f452
AK
304 switch (family) {
305 case AF_INET:
306 if (XFRM_TUNNEL_SKB_CB(skb)->tunnel.ip4)
049f8e2e 307 mark = be32_to_cpu(XFRM_TUNNEL_SKB_CB(skb)->tunnel.ip4->parms.i_key);
1625f452
AK
308 break;
309 case AF_INET6:
310 if (XFRM_TUNNEL_SKB_CB(skb)->tunnel.ip6)
049f8e2e 311 mark = be32_to_cpu(XFRM_TUNNEL_SKB_CB(skb)->tunnel.ip6->parms.i_key);
1625f452 312 break;
049f8e2e
AD
313 }
314
/* Give the skb a private sec_path to record the states it passes through. */
b0fcee82
SK
315 err = secpath_set(skb);
316 if (err) {
317 XFRM_INC_STATS(net, LINUX_MIB_XFRMINERROR);
318 goto drop;
b2aa5e9d
HX
319 }
320
/* A zero spi argument means "parse SPI and seq from the packet". */
716062fd 321 seq = 0;
0aa64774 322 if (!spi && (err = xfrm_parse_spi(skb, nexthdr, &spi, &seq)) != 0) {
f203b76d 323 secpath_reset(skb);
59c9940e 324 XFRM_INC_STATS(net, LINUX_MIB_XFRMINHDRERROR);
716062fd 325 goto drop;
0aa64774 326 }
716062fd 327
cb79a180
FW
328 daddr = (xfrm_address_t *)(skb_network_header(skb) +
329 XFRM_SPI_SKB_CB(skb)->daddroff);
/*
 * One iteration per transform.  The loop repeats while xfrm_parse_spi() at
 * the bottom returns 0, and is left early by "break" for tunnel mode.
 */
716062fd 330 do {
/* The sec_path has no room for another state. */
0aa64774 331 if (skb->sp->len == XFRM_MAX_DEPTH) {
f203b76d 332 secpath_reset(skb);
59c9940e 333 XFRM_INC_STATS(net, LINUX_MIB_XFRMINBUFFERERROR);
716062fd 334 goto drop;
0aa64774 335 }
716062fd 336
049f8e2e 337 x = xfrm_state_lookup(net, mark, daddr, spi, nexthdr, family);
0aa64774 338 if (x == NULL) {
f203b76d 339 secpath_reset(skb);
59c9940e 340 XFRM_INC_STATS(net, LINUX_MIB_XFRMINNOSTATES);
afeb14b4 341 xfrm_audit_state_notfound(skb, family, spi, seq);
716062fd 342 goto drop;
0aa64774 343 }
716062fd 344
9b42c1f1
SK
345 skb->mark = xfrm_smark_get(skb->mark, x);
346
/* Record the state in the sec_path. */
b2aa5e9d
HX
347 skb->sp->xvec[skb->sp->len++] = x;
348
/*
 * Under x->lock: check state validity, encapsulation type, the replay
 * check hook and expiry.  Any failure drops the packet via drop_unlock.
 */
7785bba2 349lock:
716062fd 350 spin_lock(&x->lock);
4c4d41f2 351
0aa64774 352 if (unlikely(x->km.state != XFRM_STATE_VALID)) {
dc0565ce
LR
353 if (x->km.state == XFRM_STATE_ACQ)
354 XFRM_INC_STATS(net, LINUX_MIB_XFRMACQUIREERROR);
355 else
356 XFRM_INC_STATS(net,
357 LINUX_MIB_XFRMINSTATEINVALID);
716062fd 358 goto drop_unlock;
0aa64774 359 }
716062fd 360
3de77cf2
DM
361 if ((x->encap ? x->encap->encap_type : 0) != encap_type) {
362 XFRM_INC_STATS(net, LINUX_MIB_XFRMINSTATEMISMATCH);
363 goto drop_unlock;
364 }
365
36ae0148 366 if (x->repl->check(x, skb, seq)) {
59c9940e 367 XFRM_INC_STATS(net, LINUX_MIB_XFRMINSTATESEQERROR);
716062fd 368 goto drop_unlock;
0aa64774 369 }
716062fd 370
0aa64774 371 if (xfrm_state_check_expire(x)) {
59c9940e 372 XFRM_INC_STATS(net, LINUX_MIB_XFRMINSTATEEXPIRED);
716062fd 373 goto drop_unlock;
0aa64774 374 }
716062fd 375
0ebea8ef
HX
376 spin_unlock(&x->lock);
377
68c11e98
AD
378 if (xfrm_tunnel_check(skb, x, family)) {
379 XFRM_INC_STATS(net, LINUX_MIB_XFRMINSTATEMODEERROR);
380 goto drop;
381 }
382
2cd08467
SK
383 seq_hi = htonl(xfrm_replay_seqhi(x, seq));
384
/* Stash the sequence number in the cb; the async path reads .low back. */
1ce3644a 385 XFRM_SKB_CB(skb)->seq.input.low = seq;
2cd08467 386 XFRM_SKB_CB(skb)->seq.input.hi = seq_hi;
1bf06cd2 387
3bc07321 388 skb_dst_force(skb);
/* Device reference held across the input handler; released at "resume". */
071d36bf 389 dev_hold(skb->dev);
3bc07321 390
d77e38e6
SK
391 if (crypto_done)
392 nexthdr = x->type_offload->input_tail(x, skb);
393 else
394 nexthdr = x->type->input(x, skb);
0ebea8ef 395
/*
 * The handler went asynchronous.  Processing continues later through the
 * encap_type == -1 path above (see xfrm_input_resume()), which jumps
 * straight to "resume".
 */
1bf06cd2
HX
396 if (nexthdr == -EINPROGRESS)
397 return 0;
1bf06cd2 398resume:
071d36bf 399 dev_put(skb->dev);
400
0ebea8ef 401 spin_lock(&x->lock);
/* A non-positive handler result is an error; -EBADMSG is also audited. */
668dc8af 402 if (nexthdr <= 0) {
9dd3245a
HX
403 if (nexthdr == -EBADMSG) {
404 xfrm_audit_state_icvfail(x, skb,
405 x->type->proto);
668dc8af 406 x->stats.integrity_failed++;
9dd3245a 407 }
59c9940e 408 XFRM_INC_STATS(net, LINUX_MIB_XFRMINSTATEPROTOERROR);
716062fd 409 goto drop_unlock;
668dc8af 410 }
716062fd 411
716062fd
HX
412 /* only the first xfrm gets the encap type */
413 encap_type = 0;
414
/* After async resumption the replay recheck hook is consulted first. */
3b59df46 415 if (async && x->repl->recheck(x, skb, seq)) {
bcf66bf5
SK
416 XFRM_INC_STATS(net, LINUX_MIB_XFRMINSTATESEQERROR);
417 goto drop_unlock;
418 }
419
9fdc4883 420 x->repl->advance(x, seq);
716062fd
HX
421
/* Account the packet against the state's current lifetime counters. */
422 x->curlft.bytes += skb->len;
423 x->curlft.packets++;
424
425 spin_unlock(&x->lock);
426
60d5fcfb
HX
427 XFRM_MODE_SKB_CB(skb)->protocol = nexthdr;
428
df9dcb45
KM
429 inner_mode = x->inner_mode;
430
/* With an AF_UNSPEC selector the inner mode is chosen per protocol. */
431 if (x->sel.family == AF_UNSPEC) {
432 inner_mode = xfrm_ip2inner_mode(x, XFRM_MODE_SKB_CB(skb)->protocol);
cb866e32
SK
433 if (inner_mode == NULL) {
434 XFRM_INC_STATS(net, LINUX_MIB_XFRMINSTATEMODEERROR);
df9dcb45 435 goto drop;
cb866e32 436 }
df9dcb45
KM
437 }
438
439 if (inner_mode->input(x, skb)) {
59c9940e 440 XFRM_INC_STATS(net, LINUX_MIB_XFRMINSTATEMODEERROR);
716062fd 441 goto drop;
0aa64774 442 }
716062fd
HX
443
/* Tunnel-mode state: stop iterating and take the decapsulation exit. */
444 if (x->outer_mode->flags & XFRM_MODE_FLAG_TUNNEL) {
445 decaps = 1;
446 break;
447 }
448
1bf06cd2
HX
449 /*
450 * We need the inner address. However, we only get here for
451 * transport mode so the outer address is identical.
452 */
453 daddr = &x->id.daddr;
2fcb45b6 454 family = x->outer_mode->afinfo->family;
1bf06cd2 455
/*
 * Look for a further transform header: a negative result drops the
 * packet, 0 runs another iteration, a positive result ends the loop.
 */
716062fd 456 err = xfrm_parse_spi(skb, nexthdr, &spi, &seq);
0aa64774 457 if (err < 0) {
59c9940e 458 XFRM_INC_STATS(net, LINUX_MIB_XFRMINHDRERROR);
716062fd 459 goto drop;
0aa64774 460 }
782710e3 461 crypto_done = false;
716062fd
HX
462 } while (!err);
463
/* All transforms done: notify the per-family callback with err == 0. */
3328715e
SK
464 err = xfrm_rcv_cb(skb, family, x->type->proto, 0);
465 if (err)
466 goto drop;
467
716062fd
HX
468 nf_reset(skb);
469
/* Tunnel mode: drop the dst and feed the inner packet to the GRO cells. */
470 if (decaps) {
23e9fcfe
AK
471 if (skb->sp)
472 skb->sp->olen = 0;
adf30907 473 skb_dst_drop(skb);
1995876a 474 gro_cells_receive(&gro_cells, skb);
716062fd
HX
475 return 0;
476 } else {
7785bba2
SK
477 xo = xfrm_offload(skb);
478 if (xo)
479 xfrm_gro = xo->flags & XFRM_GRO;
480
/* transport_finish() is passed a flag that is set for GRO or async packets. */
cfcf99f9 481 err = x->inner_mode->afinfo->transport_finish(skb, xfrm_gro || async);
7785bba2 482 if (xfrm_gro) {
23e9fcfe
AK
483 if (skb->sp)
484 skb->sp->olen = 0;
7785bba2
SK
485 skb_dst_drop(skb);
486 gro_cells_receive(&gro_cells, skb);
487 return err;
488 }
489
490 return err;
716062fd
HX
491 }
492
/*
 * Error exits: drop_unlock releases x->lock first.  Both paths notify the
 * per-family callback with err == -1 and free the skb.
 */
493drop_unlock:
494 spin_unlock(&x->lock);
716062fd 495drop:
3328715e 496 xfrm_rcv_cb(skb, family, x && x->type ? x->type->proto : nexthdr, -1);
716062fd
HX
497 kfree_skb(skb);
498 return 0;
499}
500EXPORT_SYMBOL(xfrm_input);
501
1bf06cd2
HX
/**
 * xfrm_input_resume - continue input processing after an async handler
 * @skb: packet whose processing was suspended
 * @nexthdr: result produced by the asynchronous type input handler
 *
 * Re-enters xfrm_input() with a zero SPI and encap_type == -1, the value
 * xfrm_input() treats as "async resumption".
 *
 * Return: whatever xfrm_input() returns.
 */
int xfrm_input_resume(struct sk_buff *skb, int nexthdr)
{
	const int async_resume = -1;

	return xfrm_input(skb, nexthdr, 0, async_resume);
}
EXPORT_SYMBOL(xfrm_input_resume);
507
acf568ee
HX
508static void xfrm_trans_reinject(unsigned long data)
509{
510 struct xfrm_trans_tasklet *trans = (void *)data;
511 struct sk_buff_head queue;
512 struct sk_buff *skb;
513
514 __skb_queue_head_init(&queue);
515 skb_queue_splice_init(&trans->queue, &queue);
516
517 while ((skb = __skb_dequeue(&queue)))
518 XFRM_TRANS_SKB_CB(skb)->finish(dev_net(skb->dev), NULL, skb);
519}
520
521int xfrm_trans_queue(struct sk_buff *skb,
522 int (*finish)(struct net *, struct sock *,
523 struct sk_buff *))
524{
525 struct xfrm_trans_tasklet *trans;
526
527 trans = this_cpu_ptr(&xfrm_trans_tasklet);
528
529 if (skb_queue_len(&trans->queue) >= netdev_max_backlog)
530 return -ENOBUFS;
531
532 XFRM_TRANS_SKB_CB(skb)->finish = finish;
d16b46e4 533 __skb_queue_tail(&trans->queue, skb);
acf568ee
HX
534 tasklet_schedule(&trans->tasklet);
535 return 0;
536}
537EXPORT_SYMBOL(xfrm_trans_queue);
538
1da177e4
LT
539void __init xfrm_input_init(void)
540{
1995876a 541 int err;
acf568ee 542 int i;
1995876a
SK
543
544 init_dummy_netdev(&xfrm_napi_dev);
545 err = gro_cells_init(&gro_cells, &xfrm_napi_dev);
546 if (err)
547 gro_cells.cells = NULL;
548
1da177e4
LT
549 secpath_cachep = kmem_cache_create("secpath_cache",
550 sizeof(struct sec_path),
e5d679f3 551 0, SLAB_HWCACHE_ALIGN|SLAB_PANIC,
20c2df83 552 NULL);
acf568ee
HX
553
554 for_each_possible_cpu(i) {
555 struct xfrm_trans_tasklet *trans;
556
557 trans = &per_cpu(xfrm_trans_tasklet, i);
558 __skb_queue_head_init(&trans->queue);
559 tasklet_init(&trans->tasklet, xfrm_trans_reinject,
560 (unsigned long)trans);
561 }
1da177e4 562}