Merge tag 'pci-v6.16-fixes-3' of git://git.kernel.org/pub/scm/linux/kernel/git/pci/pci
[linux-block.git] / net / l2tp / l2tp_core.c
CommitLineData
d2912cb1 1// SPDX-License-Identifier: GPL-2.0-only
20dcb110 2/* L2TP core.
fd558d18
JC
3 *
4 * Copyright (c) 2008,2009,2010 Katalix Systems Ltd
5 *
6 * This file contains some code of the original L2TPv2 pppol2tp
7 * driver, which has the following copyright:
8 *
9 * Authors: Martijn van Oosterhout <kleptog@svana.org>
10 * James Chapman (jchapman@katalix.com)
11 * Contributors:
12 * Michal Ostrowski <mostrows@speakeasy.net>
13 * Arnaldo Carvalho de Melo <acme@xconectiva.com.br>
14 * David S. Miller (davem@redhat.com)
fd558d18
JC
15 */
16
a4ca44fa
JP
17#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
18
fd558d18
JC
19#include <linux/module.h>
20#include <linux/string.h>
21#include <linux/list.h>
e02d494d 22#include <linux/rculist.h>
fd558d18
JC
23#include <linux/uaccess.h>
24
25#include <linux/kernel.h>
26#include <linux/spinlock.h>
27#include <linux/kthread.h>
28#include <linux/sched.h>
29#include <linux/slab.h>
30#include <linux/errno.h>
31#include <linux/jiffies.h>
32
33#include <linux/netdevice.h>
34#include <linux/net.h>
35#include <linux/inetdevice.h>
36#include <linux/skbuff.h>
37#include <linux/init.h>
0d76751f 38#include <linux/in.h>
fd558d18
JC
39#include <linux/ip.h>
40#include <linux/udp.h>
0d76751f 41#include <linux/l2tp.h>
fd558d18
JC
42#include <linux/sort.h>
43#include <linux/file.h>
44#include <linux/nsproxy.h>
45#include <net/net_namespace.h>
46#include <net/netns/generic.h>
47#include <net/dst.h>
48#include <net/ip.h>
49#include <net/udp.h>
85644b4d 50#include <net/udp_tunnel.h>
309795f4 51#include <net/inet_common.h>
fd558d18 52#include <net/xfrm.h>
0d76751f 53#include <net/protocol.h>
d2cf3361
BL
54#include <net/inet6_connection_sock.h>
55#include <net/inet_ecn.h>
56#include <net/ip6_route.h>
d499bd2e 57#include <net/ip6_checksum.h>
fd558d18
JC
58
59#include <asm/byteorder.h>
60063497 60#include <linux/atomic.h>
fd558d18
JC
61
62#include "l2tp_core.h"
63
3f117d6f
TP
64#define CREATE_TRACE_POINTS
65#include "trace.h"
66
fd558d18
JC
#define L2TP_DRV_VERSION		"V2.0"

/* L2TP header constants: flag bits carried in the 16-bit flags/version
 * word at the start of an L2TPv2 header.
 */
#define L2TP_HDRFLAG_T			0x8000
#define L2TP_HDRFLAG_L			0x4000
#define L2TP_HDRFLAG_S			0x0800
#define L2TP_HDRFLAG_O			0x0200
#define L2TP_HDRFLAG_P			0x0100

/* Protocol version values and the mask used to extract them */
#define L2TP_HDR_VER_MASK		0x000F
#define L2TP_HDR_VER_2			0x0002
#define L2TP_HDR_VER_3			0x0003

/* L2TPv3 default L2-specific sublayer */
#define L2TP_SLFLAG_S			0x40000000
#define L2TP_SL_SEQ_MASK		0x00ffffff

#define L2TP_HDR_SIZE_MAX		14

/* Default trace flags */
#define L2TP_DEFAULT_DEBUG_FLAGS	0

/* The nesting level used by L2TP must differ from SINGLE_DEPTH_NESTING;
 * the build fails otherwise.
 */
#define L2TP_DEPTH_NESTING		2
#if L2TP_DEPTH_NESTING == SINGLE_DEPTH_NESTING
#error "L2TP requires its own lockdep subclass"
#endif
93
fd558d18
JC
94/* Private data stored for received packets in the skb.
95 */
96struct l2tp_skb_cb {
f7faffa3 97 u32 ns;
fd558d18
JC
98 u16 has_seq;
99 u16 length;
100 unsigned long expires;
101};
102
efcd8c85 103#define L2TP_SKB_CB(skb) ((struct l2tp_skb_cb *)&(skb)->cb[sizeof(struct inet_skb_parm)])
fd558d18 104
f8ccac0e 105static struct workqueue_struct *l2tp_wq;
fd558d18
JC
106
107/* per-net private data for this module */
108static unsigned int l2tp_net_id;
109struct l2tp_net {
c4d48a58
CW
110 /* Lock for write access to l2tp_tunnel_idr */
111 spinlock_t l2tp_tunnel_idr_lock;
112 struct idr l2tp_tunnel_idr;
2a3339f6 113 /* Lock for write access to l2tp_v[23]_session_idr/htable */
aa5e17e1 114 spinlock_t l2tp_session_idr_lock;
2a3339f6 115 struct idr l2tp_v2_session_idr;
aa5e17e1
JC
116 struct idr l2tp_v3_session_idr;
117 struct hlist_head l2tp_v3_session_htable[16];
fd558d18
JC
118};
119
168464c1 120static u32 l2tp_v2_session_key(u16 tunnel_id, u16 session_id)
2a3339f6
JC
121{
122 return ((u32)tunnel_id) << 16 | session_id;
123}
124
168464c1 125static unsigned long l2tp_v3_session_hashkey(struct sock *sk, u32 session_id)
aa5e17e1
JC
126{
127 return ((unsigned long)sk) + session_id;
128}
129
b954f940
PA
130#if IS_ENABLED(CONFIG_IPV6)
131static bool l2tp_sk_is_v6(struct sock *sk)
132{
133 return sk->sk_family == PF_INET6 &&
134 !ipv6_addr_v4mapped(&sk->sk_v6_daddr);
135}
136#endif
fc130840 137
168464c1 138static struct l2tp_net *l2tp_pernet(const struct net *net)
fd558d18 139{
fd558d18
JC
140 return net_generic(net, l2tp_net_id);
141}
142
52016e25 143static void l2tp_tunnel_free(struct l2tp_tunnel *tunnel)
d00fa9ad 144{
29717a4f
JC
145 struct sock *sk = tunnel->sock;
146
6b7bdcd7 147 trace_free_tunnel(tunnel);
29717a4f
JC
148
149 if (sk) {
150 /* Disable udp encapsulation */
151 switch (tunnel->encap) {
152 case L2TP_ENCAPTYPE_UDP:
153 /* No longer an encapsulation socket. See net/ipv4/udp.c */
154 WRITE_ONCE(udp_sk(sk)->encap_type, 0);
155 udp_sk(sk)->encap_rcv = NULL;
156 udp_sk(sk)->encap_destroy = NULL;
157 break;
158 case L2TP_ENCAPTYPE_IP:
159 break;
160 }
161
162 tunnel->sock = NULL;
163 sock_put(sk);
164 }
165
166 kfree_rcu(tunnel, rcu);
d00fa9ad 167}
52016e25
TP
168
169static void l2tp_session_free(struct l2tp_session *session)
170{
6b7bdcd7 171 trace_free_session(session);
45faeff1 172 if (session->tunnel)
abe7a1a7 173 l2tp_tunnel_put(session->tunnel);
d17e8999 174 kfree_rcu(session, rcu);
45faeff1 175}
6b7bdcd7 176
2e7a2806
JC
177struct l2tp_tunnel *l2tp_sk_to_tunnel(const struct sock *sk)
178{
179 const struct net *net = sock_net(sk);
180 unsigned long tunnel_id, tmp;
181 struct l2tp_tunnel *tunnel;
182 struct l2tp_net *pn;
183
184 rcu_read_lock_bh();
185 pn = l2tp_pernet(net);
186 idr_for_each_entry_ul(&pn->l2tp_tunnel_idr, tunnel, tmp, tunnel_id) {
187 if (tunnel &&
188 tunnel->sock == sk &&
189 refcount_inc_not_zero(&tunnel->ref_count)) {
190 rcu_read_unlock_bh();
191 return tunnel;
192 }
193 }
194 rcu_read_unlock_bh();
52016e25 195
2e7a2806 196 return NULL;
52016e25 197}
45faeff1 198EXPORT_SYMBOL_GPL(l2tp_sk_to_tunnel);
52016e25 199
abe7a1a7 200void l2tp_tunnel_put(struct l2tp_tunnel *tunnel)
52016e25
TP
201{
202 if (refcount_dec_and_test(&tunnel->ref_count))
203 l2tp_tunnel_free(tunnel);
204}
abe7a1a7 205EXPORT_SYMBOL_GPL(l2tp_tunnel_put);
52016e25 206
abe7a1a7 207void l2tp_session_put(struct l2tp_session *session)
52016e25
TP
208{
209 if (refcount_dec_and_test(&session->ref_count))
210 l2tp_session_free(session);
211}
abe7a1a7 212EXPORT_SYMBOL_GPL(l2tp_session_put);
d00fa9ad 213
54652eb1
GN
214/* Lookup a tunnel. A new reference is held on the returned tunnel. */
215struct l2tp_tunnel *l2tp_tunnel_get(const struct net *net, u32 tunnel_id)
216{
217 const struct l2tp_net *pn = l2tp_pernet(net);
218 struct l2tp_tunnel *tunnel;
219
220 rcu_read_lock_bh();
c4d48a58
CW
221 tunnel = idr_find(&pn->l2tp_tunnel_idr, tunnel_id);
222 if (tunnel && refcount_inc_not_zero(&tunnel->ref_count)) {
223 rcu_read_unlock_bh();
224 return tunnel;
54652eb1
GN
225 }
226 rcu_read_unlock_bh();
227
228 return NULL;
229}
230EXPORT_SYMBOL_GPL(l2tp_tunnel_get);
231
aa92c1ce
JC
232struct l2tp_tunnel *l2tp_tunnel_get_next(const struct net *net, unsigned long *key)
233{
234 struct l2tp_net *pn = l2tp_pernet(net);
235 struct l2tp_tunnel *tunnel = NULL;
236
237 rcu_read_lock_bh();
238again:
239 tunnel = idr_get_next_ul(&pn->l2tp_tunnel_idr, key);
240 if (tunnel) {
241 if (refcount_inc_not_zero(&tunnel->ref_count)) {
242 rcu_read_unlock_bh();
243 return tunnel;
244 }
245 (*key)++;
246 goto again;
247 }
248 rcu_read_unlock_bh();
249
250 return NULL;
251}
252EXPORT_SYMBOL_GPL(l2tp_tunnel_get_next);
253
aa5e17e1 254struct l2tp_session *l2tp_v3_session_get(const struct net *net, struct sock *sk, u32 session_id)
01e28b92 255{
aa5e17e1 256 const struct l2tp_net *pn = l2tp_pernet(net);
01e28b92
GN
257 struct l2tp_session *session;
258
01e28b92 259 rcu_read_lock_bh();
aa5e17e1
JC
260 session = idr_find(&pn->l2tp_v3_session_idr, session_id);
261 if (session && !hash_hashed(&session->hlist) &&
262 refcount_inc_not_zero(&session->ref_count)) {
263 rcu_read_unlock_bh();
264 return session;
265 }
61b9a047 266
aa5e17e1
JC
267 /* If we get here and session is non-NULL, the session_id
268 * collides with one in another tunnel. If sk is non-NULL,
269 * find the session matching sk.
270 */
271 if (session && sk) {
272 unsigned long key = l2tp_v3_session_hashkey(sk, session->session_id);
273
274 hash_for_each_possible_rcu(pn->l2tp_v3_session_htable, session,
275 hlist, key) {
24256415
JC
276 /* session->tunnel may be NULL if another thread is in
277 * l2tp_session_register and has added an item to
278 * l2tp_v3_session_htable but hasn't yet added the
279 * session to its tunnel's session_list.
280 */
281 struct l2tp_tunnel *tunnel = READ_ONCE(session->tunnel);
282
b0a8deda
JC
283 if (session->session_id == session_id &&
284 tunnel && tunnel->sock == sk &&
aa5e17e1
JC
285 refcount_inc_not_zero(&session->ref_count)) {
286 rcu_read_unlock_bh();
287 return session;
288 }
61b9a047 289 }
aa5e17e1 290 }
01e28b92 291 rcu_read_unlock_bh();
61b9a047
GN
292
293 return NULL;
294}
aa5e17e1 295EXPORT_SYMBOL_GPL(l2tp_v3_session_get);
61b9a047 296
2a3339f6
JC
297struct l2tp_session *l2tp_v2_session_get(const struct net *net, u16 tunnel_id, u16 session_id)
298{
299 u32 session_key = l2tp_v2_session_key(tunnel_id, session_id);
300 const struct l2tp_net *pn = l2tp_pernet(net);
301 struct l2tp_session *session;
302
303 rcu_read_lock_bh();
304 session = idr_find(&pn->l2tp_v2_session_idr, session_key);
305 if (session && refcount_inc_not_zero(&session->ref_count)) {
306 rcu_read_unlock_bh();
307 return session;
308 }
309 rcu_read_unlock_bh();
310
311 return NULL;
312}
313EXPORT_SYMBOL_GPL(l2tp_v2_session_get);
314
5f77c18e
JC
315struct l2tp_session *l2tp_session_get(const struct net *net, struct sock *sk, int pver,
316 u32 tunnel_id, u32 session_id)
317{
318 if (pver == L2TP_HDR_VER_2)
319 return l2tp_v2_session_get(net, tunnel_id, session_id);
320 else
321 return l2tp_v3_session_get(net, sk, session_id);
322}
323EXPORT_SYMBOL_GPL(l2tp_session_get);
324
aa92c1ce
JC
325static struct l2tp_session *l2tp_v2_session_get_next(const struct net *net,
326 u16 tid,
327 unsigned long *key)
328{
329 struct l2tp_net *pn = l2tp_pernet(net);
330 struct l2tp_session *session = NULL;
331
332 /* Start searching within the range of the tid */
333 if (*key == 0)
334 *key = l2tp_v2_session_key(tid, 0);
335
336 rcu_read_lock_bh();
337again:
338 session = idr_get_next_ul(&pn->l2tp_v2_session_idr, key);
339 if (session) {
340 struct l2tp_tunnel *tunnel = READ_ONCE(session->tunnel);
341
342 /* ignore sessions with id 0 as they are internal for pppol2tp */
343 if (session->session_id == 0) {
344 (*key)++;
345 goto again;
346 }
347
510c0732 348 if (tunnel->tunnel_id == tid &&
aa92c1ce
JC
349 refcount_inc_not_zero(&session->ref_count)) {
350 rcu_read_unlock_bh();
351 return session;
352 }
353
354 (*key)++;
355 if (tunnel->tunnel_id == tid)
356 goto again;
357 }
358 rcu_read_unlock_bh();
359
360 return NULL;
361}
362
363static struct l2tp_session *l2tp_v3_session_get_next(const struct net *net,
364 u32 tid, struct sock *sk,
365 unsigned long *key)
366{
367 struct l2tp_net *pn = l2tp_pernet(net);
368 struct l2tp_session *session = NULL;
369
370 rcu_read_lock_bh();
371again:
372 session = idr_get_next_ul(&pn->l2tp_v3_session_idr, key);
373 if (session && !hash_hashed(&session->hlist)) {
374 struct l2tp_tunnel *tunnel = READ_ONCE(session->tunnel);
375
376 if (tunnel && tunnel->tunnel_id == tid &&
377 refcount_inc_not_zero(&session->ref_count)) {
378 rcu_read_unlock_bh();
379 return session;
380 }
381
382 (*key)++;
383 goto again;
384 }
385
386 /* If we get here and session is non-NULL, the IDR entry may be one
387 * where the session_id collides with one in another tunnel. Check
388 * session_htable for a match. There can only be one session of a given
389 * ID per tunnel so we can return as soon as a match is found.
390 */
391 if (session && hash_hashed(&session->hlist)) {
392 unsigned long hkey = l2tp_v3_session_hashkey(sk, session->session_id);
393 u32 sid = session->session_id;
394
395 hash_for_each_possible_rcu(pn->l2tp_v3_session_htable, session,
396 hlist, hkey) {
397 struct l2tp_tunnel *tunnel = READ_ONCE(session->tunnel);
398
399 if (session->session_id == sid &&
400 tunnel && tunnel->tunnel_id == tid &&
401 refcount_inc_not_zero(&session->ref_count)) {
402 rcu_read_unlock_bh();
403 return session;
404 }
405 }
406
407 /* If no match found, the colliding session ID isn't in our
408 * tunnel so try the next session ID.
409 */
410 (*key)++;
411 goto again;
412 }
413
414 rcu_read_unlock_bh();
415
416 return NULL;
417}
418
419struct l2tp_session *l2tp_session_get_next(const struct net *net, struct sock *sk, int pver,
420 u32 tunnel_id, unsigned long *key)
421{
422 if (pver == L2TP_HDR_VER_2)
423 return l2tp_v2_session_get_next(net, tunnel_id, key);
424 else
425 return l2tp_v3_session_get_next(net, tunnel_id, sk, key);
426}
427EXPORT_SYMBOL_GPL(l2tp_session_get_next);
428
309795f4
JC
429/* Lookup a session by interface name.
430 * This is very inefficient but is only used by management interfaces.
431 */
9aaef50c 432struct l2tp_session *l2tp_session_get_by_ifname(const struct net *net,
a4346210 433 const char *ifname)
309795f4
JC
434{
435 struct l2tp_net *pn = l2tp_pernet(net);
d18d3f0a 436 unsigned long tunnel_id, tmp;
309795f4 437 struct l2tp_session *session;
d18d3f0a 438 struct l2tp_tunnel *tunnel;
309795f4 439
e02d494d 440 rcu_read_lock_bh();
d18d3f0a
JC
441 idr_for_each_entry_ul(&pn->l2tp_tunnel_idr, tunnel, tmp, tunnel_id) {
442 if (tunnel) {
443 list_for_each_entry_rcu(session, &tunnel->session_list, list) {
444 if (!strcmp(session->ifname, ifname)) {
abe7a1a7 445 refcount_inc(&session->ref_count);
d18d3f0a
JC
446 rcu_read_unlock_bh();
447
448 return session;
449 }
309795f4
JC
450 }
451 }
452 }
e02d494d 453 rcu_read_unlock_bh();
309795f4
JC
454
455 return NULL;
456}
2777e2ab 457EXPORT_SYMBOL_GPL(l2tp_session_get_by_ifname);
309795f4 458
aa5e17e1
JC
459static void l2tp_session_coll_list_add(struct l2tp_session_coll_list *clist,
460 struct l2tp_session *session)
461{
abe7a1a7 462 refcount_inc(&session->ref_count);
aa5e17e1
JC
463 WARN_ON_ONCE(session->coll_list);
464 session->coll_list = clist;
465 spin_lock(&clist->lock);
466 list_add(&session->clist, &clist->list);
467 spin_unlock(&clist->lock);
468}
469
470static int l2tp_session_collision_add(struct l2tp_net *pn,
471 struct l2tp_session *session1,
472 struct l2tp_session *session2)
473{
474 struct l2tp_session_coll_list *clist;
475
476 lockdep_assert_held(&pn->l2tp_session_idr_lock);
477
478 if (!session2)
479 return -EEXIST;
480
481 /* If existing session is in IP-encap tunnel, refuse new session */
482 if (session2->tunnel->encap == L2TP_ENCAPTYPE_IP)
483 return -EEXIST;
484
485 clist = session2->coll_list;
486 if (!clist) {
487 /* First collision. Allocate list to manage the collided sessions
488 * and add the existing session to the list.
489 */
490 clist = kmalloc(sizeof(*clist), GFP_ATOMIC);
491 if (!clist)
492 return -ENOMEM;
493
494 spin_lock_init(&clist->lock);
495 INIT_LIST_HEAD(&clist->list);
496 refcount_set(&clist->ref_count, 1);
497 l2tp_session_coll_list_add(clist, session2);
498 }
499
500 /* If existing session isn't already in the session hlist, add it. */
501 if (!hash_hashed(&session2->hlist))
89b768ec
JC
502 hash_add_rcu(pn->l2tp_v3_session_htable, &session2->hlist,
503 session2->hlist_key);
aa5e17e1
JC
504
505 /* Add new session to the hlist and collision list */
89b768ec
JC
506 hash_add_rcu(pn->l2tp_v3_session_htable, &session1->hlist,
507 session1->hlist_key);
aa5e17e1
JC
508 refcount_inc(&clist->ref_count);
509 l2tp_session_coll_list_add(clist, session1);
510
511 return 0;
512}
513
514static void l2tp_session_collision_del(struct l2tp_net *pn,
515 struct l2tp_session *session)
516{
517 struct l2tp_session_coll_list *clist = session->coll_list;
518 unsigned long session_key = session->session_id;
519 struct l2tp_session *session2;
520
521 lockdep_assert_held(&pn->l2tp_session_idr_lock);
522
89b768ec 523 hash_del_rcu(&session->hlist);
aa5e17e1
JC
524
525 if (clist) {
526 /* Remove session from its collision list. If there
527 * are other sessions with the same ID, replace this
528 * session's IDR entry with that session, otherwise
529 * remove the IDR entry. If this is the last session,
530 * the collision list data is freed.
531 */
532 spin_lock(&clist->lock);
533 list_del_init(&session->clist);
534 session2 = list_first_entry_or_null(&clist->list, struct l2tp_session, clist);
535 if (session2) {
536 void *old = idr_replace(&pn->l2tp_v3_session_idr, session2, session_key);
537
538 WARN_ON_ONCE(IS_ERR_VALUE(old));
539 } else {
540 void *removed = idr_remove(&pn->l2tp_v3_session_idr, session_key);
541
542 WARN_ON_ONCE(removed != session);
543 }
544 session->coll_list = NULL;
545 spin_unlock(&clist->lock);
546 if (refcount_dec_and_test(&clist->ref_count))
547 kfree(clist);
abe7a1a7 548 l2tp_session_put(session);
aa5e17e1
JC
549 }
550}
551
3953ae7b
GN
552int l2tp_session_register(struct l2tp_session *session,
553 struct l2tp_tunnel *tunnel)
dbdbc73b 554{
aa5e17e1 555 struct l2tp_net *pn = l2tp_pernet(tunnel->l2tp_net);
2146b7dd 556 struct l2tp_session *other_session = NULL;
0aa45570 557 void *old = NULL;
aa5e17e1 558 u32 session_key;
f3c66d4e 559 int err;
dbdbc73b 560
d18d3f0a 561 spin_lock_bh(&tunnel->list_lock);
d587d825
JC
562 spin_lock_bh(&pn->l2tp_session_idr_lock);
563
f3c66d4e
GN
564 if (!tunnel->acpt_newsess) {
565 err = -ENODEV;
d587d825 566 goto out;
f3c66d4e
GN
567 }
568
dbdbc73b 569 if (tunnel->version == L2TP_HDR_VER_3) {
aa5e17e1 570 session_key = session->session_id;
aa5e17e1
JC
571 err = idr_alloc_u32(&pn->l2tp_v3_session_idr, NULL,
572 &session_key, session_key, GFP_ATOMIC);
0d0d9a38 573 /* IP encap expects session IDs to be globally unique, while
aa5e17e1
JC
574 * UDP encap doesn't. This isn't per the RFC, which says that
575 * sessions are identified only by the session ID, but is to
576 * support existing userspace which depends on it.
0d0d9a38 577 */
aa5e17e1 578 if (err == -ENOSPC && tunnel->encap == L2TP_ENCAPTYPE_UDP) {
2146b7dd
JC
579 other_session = idr_find(&pn->l2tp_v3_session_idr,
580 session_key);
581 err = l2tp_session_collision_add(pn, session,
582 other_session);
aa5e17e1 583 }
2a3339f6
JC
584 } else {
585 session_key = l2tp_v2_session_key(tunnel->tunnel_id,
586 session->session_id);
2a3339f6
JC
587 err = idr_alloc_u32(&pn->l2tp_v2_session_idr, NULL,
588 &session_key, session_key, GFP_ATOMIC);
dbdbc73b
GN
589 }
590
2a3339f6
JC
591 if (err) {
592 if (err == -ENOSPC)
593 err = -EEXIST;
d587d825 594 goto out;
2a3339f6 595 }
aa5e17e1 596
abe7a1a7 597 refcount_inc(&tunnel->ref_count);
24256415 598 WRITE_ONCE(session->tunnel, tunnel);
89b768ec 599 list_add_rcu(&session->list, &tunnel->session_list);
dbdbc73b 600
0aa45570 601 /* this makes session available to lockless getters */
2146b7dd
JC
602 if (tunnel->version == L2TP_HDR_VER_3) {
603 if (!other_session)
0aa45570 604 old = idr_replace(&pn->l2tp_v3_session_idr, session, session_key);
2146b7dd 605 } else {
0aa45570 606 old = idr_replace(&pn->l2tp_v2_session_idr, session, session_key);
2146b7dd 607 }
6b7bdcd7 608
0aa45570
JC
609 /* old should be NULL, unless something removed or modified
610 * the IDR entry after our idr_alloc_32 above (which shouldn't
611 * happen).
612 */
613 WARN_ON_ONCE(old);
d587d825
JC
614out:
615 spin_unlock_bh(&pn->l2tp_session_idr_lock);
d18d3f0a 616 spin_unlock_bh(&tunnel->list_lock);
dbdbc73b 617
d587d825
JC
618 if (!err)
619 trace_register_session(session);
620
f3c66d4e 621 return err;
dbdbc73b 622}
3953ae7b 623EXPORT_SYMBOL_GPL(l2tp_session_register);
dbdbc73b 624
fd558d18
JC
625/*****************************************************************************
626 * Receive data handling
627 *****************************************************************************/
628
629/* Queue a skb in order. We come here only if the skb has an L2TP sequence
630 * number.
631 */
632static void l2tp_recv_queue_skb(struct l2tp_session *session, struct sk_buff *skb)
633{
634 struct sk_buff *skbp;
635 struct sk_buff *tmp;
f7faffa3 636 u32 ns = L2TP_SKB_CB(skb)->ns;
fd558d18
JC
637
638 spin_lock_bh(&session->reorder_q.lock);
639 skb_queue_walk_safe(&session->reorder_q, skbp, tmp) {
640 if (L2TP_SKB_CB(skbp)->ns > ns) {
641 __skb_queue_before(&session->reorder_q, skbp, skb);
7b7c0719 642 atomic_long_inc(&session->stats.rx_oos_packets);
fd558d18
JC
643 goto out;
644 }
645 }
646
647 __skb_queue_tail(&session->reorder_q, skb);
648
649out:
650 spin_unlock_bh(&session->reorder_q.lock);
651}
652
653/* Dequeue a single skb.
654 */
655static void l2tp_recv_dequeue_skb(struct l2tp_session *session, struct sk_buff *skb)
656{
657 struct l2tp_tunnel *tunnel = session->tunnel;
658 int length = L2TP_SKB_CB(skb)->length;
659
660 /* We're about to requeue the skb, so return resources
661 * to its current owner (a socket receive buffer).
662 */
663 skb_orphan(skb);
664
7b7c0719
TP
665 atomic_long_inc(&tunnel->stats.rx_packets);
666 atomic_long_add(length, &tunnel->stats.rx_bytes);
667 atomic_long_inc(&session->stats.rx_packets);
668 atomic_long_add(length, &session->stats.rx_bytes);
fd558d18
JC
669
670 if (L2TP_SKB_CB(skb)->has_seq) {
671 /* Bump our Nr */
672 session->nr++;
8a1631d5 673 session->nr &= session->nr_max;
6b7bdcd7 674 trace_session_seqnum_update(session);
fd558d18
JC
675 }
676
677 /* call private receive handler */
0febc7b3 678 if (session->recv_skb)
fd558d18
JC
679 (*session->recv_skb)(session, skb, L2TP_SKB_CB(skb)->length);
680 else
681 kfree_skb(skb);
fd558d18
JC
682}
683
684/* Dequeue skbs from the session's reorder_q, subject to packet order.
685 * Skbs that have been in the queue for too long are simply discarded.
686 */
687static void l2tp_recv_dequeue(struct l2tp_session *session)
688{
689 struct sk_buff *skb;
690 struct sk_buff *tmp;
691
692 /* If the pkt at the head of the queue has the nr that we
693 * expect to send up next, dequeue it and any other
694 * in-sequence packets behind it.
695 */
e2e210c0 696start:
fd558d18
JC
697 spin_lock_bh(&session->reorder_q.lock);
698 skb_queue_walk_safe(&session->reorder_q, skb, tmp) {
6b7bdcd7
TP
699 struct l2tp_skb_cb *cb = L2TP_SKB_CB(skb);
700
701 /* If the packet has been pending on the queue for too long, discard it */
702 if (time_after(jiffies, cb->expires)) {
7b7c0719
TP
703 atomic_long_inc(&session->stats.rx_seq_discards);
704 atomic_long_inc(&session->stats.rx_errors);
6b7bdcd7 705 trace_session_pkt_expired(session, cb->ns);
38d40b3f 706 session->reorder_skip = 1;
fd558d18
JC
707 __skb_unlink(skb, &session->reorder_q);
708 kfree_skb(skb);
fd558d18
JC
709 continue;
710 }
711
6b7bdcd7 712 if (cb->has_seq) {
38d40b3f 713 if (session->reorder_skip) {
38d40b3f 714 session->reorder_skip = 0;
6b7bdcd7
TP
715 session->nr = cb->ns;
716 trace_session_seqnum_reset(session);
38d40b3f 717 }
6b7bdcd7 718 if (cb->ns != session->nr)
fd558d18 719 goto out;
fd558d18
JC
720 }
721 __skb_unlink(skb, &session->reorder_q);
722
723 /* Process the skb. We release the queue lock while we
724 * do so to let other contexts process the queue.
725 */
726 spin_unlock_bh(&session->reorder_q.lock);
727 l2tp_recv_dequeue_skb(session, skb);
e2e210c0 728 goto start;
fd558d18
JC
729 }
730
731out:
732 spin_unlock_bh(&session->reorder_q.lock);
733}
734
8a1631d5
JC
735static int l2tp_seq_check_rx_window(struct l2tp_session *session, u32 nr)
736{
737 u32 nws;
738
739 if (nr >= session->nr)
740 nws = nr - session->nr;
741 else
742 nws = (session->nr_max + 1) - (session->nr - nr);
743
744 return nws < session->nr_window_size;
745}
746
b6dc01a4
JC
747/* If packet has sequence numbers, queue it if acceptable. Returns 0 if
748 * acceptable, else non-zero.
749 */
750static int l2tp_recv_data_seq(struct l2tp_session *session, struct sk_buff *skb)
751{
6b7bdcd7
TP
752 struct l2tp_skb_cb *cb = L2TP_SKB_CB(skb);
753
754 if (!l2tp_seq_check_rx_window(session, cb->ns)) {
8a1631d5
JC
755 /* Packet sequence number is outside allowed window.
756 * Discard it.
757 */
6b7bdcd7 758 trace_session_pkt_outside_rx_window(session, cb->ns);
8a1631d5
JC
759 goto discard;
760 }
761
b6dc01a4
JC
762 if (session->reorder_timeout != 0) {
763 /* Packet reordering enabled. Add skb to session's
764 * reorder queue, in order of ns.
765 */
766 l2tp_recv_queue_skb(session, skb);
a0dbd822
JC
767 goto out;
768 }
769
770 /* Packet reordering disabled. Discard out-of-sequence packets, while
771 * tracking the number if in-sequence packets after the first OOS packet
772 * is seen. After nr_oos_count_max in-sequence packets, reset the
773 * sequence number to re-enable packet reception.
774 */
6b7bdcd7 775 if (cb->ns == session->nr) {
a0dbd822 776 skb_queue_tail(&session->reorder_q, skb);
b6dc01a4 777 } else {
6b7bdcd7 778 u32 nr_oos = cb->ns;
a0dbd822
JC
779 u32 nr_next = (session->nr_oos + 1) & session->nr_max;
780
781 if (nr_oos == nr_next)
782 session->nr_oos_count++;
783 else
784 session->nr_oos_count = 0;
785
786 session->nr_oos = nr_oos;
787 if (session->nr_oos_count > session->nr_oos_count_max) {
788 session->reorder_skip = 1;
a0dbd822
JC
789 }
790 if (!session->reorder_skip) {
b6dc01a4 791 atomic_long_inc(&session->stats.rx_seq_discards);
6b7bdcd7 792 trace_session_pkt_oos(session, cb->ns);
b6dc01a4
JC
793 goto discard;
794 }
795 skb_queue_tail(&session->reorder_q, skb);
796 }
797
a0dbd822 798out:
b6dc01a4
JC
799 return 0;
800
801discard:
802 return 1;
803}
804
f7faffa3
JC
805/* Do receive processing of L2TP data frames. We handle both L2TPv2
806 * and L2TPv3 data frames here.
807 *
808 * L2TPv2 Data Message Header
809 *
810 * 0 1 2 3
811 * 0 1 2 3 4 5 6 7 8 9 0 1 2 3 4 5 6 7 8 9 0 1 2 3 4 5 6 7 8 9 0 1
812 * +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
813 * |T|L|x|x|S|x|O|P|x|x|x|x| Ver | Length (opt) |
814 * +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
815 * | Tunnel ID | Session ID |
816 * +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
817 * | Ns (opt) | Nr (opt) |
818 * +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
819 * | Offset Size (opt) | Offset pad... (opt)
820 * +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
821 *
822 * Data frames are marked by T=0. All other fields are the same as
823 * those in L2TP control frames.
824 *
825 * L2TPv3 Data Message Header
826 *
827 * +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
828 * | L2TP Session Header |
829 * +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
830 * | L2-Specific Sublayer |
831 * +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
832 * | Tunnel Payload ...
833 * +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
834 *
835 * L2TPv3 Session Header Over IP
836 *
837 * 0 1 2 3
838 * 0 1 2 3 4 5 6 7 8 9 0 1 2 3 4 5 6 7 8 9 0 1 2 3 4 5 6 7 8 9 0 1
839 * +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
840 * | Session ID |
841 * +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
842 * | Cookie (optional, maximum 64 bits)...
843 * +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
844 * |
845 * +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
846 *
847 * L2TPv3 L2-Specific Sublayer Format
848 *
849 * 0 1 2 3
850 * 0 1 2 3 4 5 6 7 8 9 0 1 2 3 4 5 6 7 8 9 0 1 2 3 4 5 6 7 8 9 0 1
851 * +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
852 * |x|S|x|x|x|x|x|x| Sequence Number |
853 * +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
854 *
23fe846f
GN
855 * Cookie value and sublayer format are negotiated with the peer when
856 * the session is set up. Unlike L2TPv2, we do not need to parse the
857 * packet header to determine if optional fields are present.
f7faffa3
JC
858 *
859 * Caller must already have parsed the frame and determined that it is
860 * a data (not control) frame before coming here. Fields up to the
861 * session-id have already been parsed and ptr points to the data
862 * after the session-id.
fd558d18 863 */
f7faffa3
JC
864void l2tp_recv_common(struct l2tp_session *session, struct sk_buff *skb,
865 unsigned char *ptr, unsigned char *optr, u16 hdrflags,
2b139e6b 866 int length)
fd558d18 867{
f7faffa3 868 struct l2tp_tunnel *tunnel = session->tunnel;
fd558d18 869 int offset;
fd558d18 870
f7faffa3
JC
871 /* Parse and check optional cookie */
872 if (session->peer_cookie_len > 0) {
873 if (memcmp(ptr, &session->peer_cookie[0], session->peer_cookie_len)) {
3e59e885
MS
874 pr_debug_ratelimited("%s: cookie mismatch (%u/%u). Discarding.\n",
875 tunnel->name, tunnel->tunnel_id,
876 session->session_id);
7b7c0719 877 atomic_long_inc(&session->stats.rx_cookie_discards);
f7faffa3
JC
878 goto discard;
879 }
880 ptr += session->peer_cookie_len;
881 }
882
fd558d18
JC
883 /* Handle the optional sequence numbers. Sequence numbers are
884 * in different places for L2TPv2 and L2TPv3.
885 *
886 * If we are the LAC, enable/disable sequence numbers under
887 * the control of the LNS. If no sequence numbers present but
888 * we were expecting them, discard frame.
889 */
fd558d18 890 L2TP_SKB_CB(skb)->has_seq = 0;
f7faffa3
JC
891 if (tunnel->version == L2TP_HDR_VER_2) {
892 if (hdrflags & L2TP_HDRFLAG_S) {
f7faffa3 893 /* Store L2TP info in the skb */
12923365 894 L2TP_SKB_CB(skb)->ns = ntohs(*(__be16 *)ptr);
f7faffa3 895 L2TP_SKB_CB(skb)->has_seq = 1;
12923365
TP
896 ptr += 2;
897 /* Skip past nr in the header */
898 ptr += 2;
fd558d18 899
f7faffa3
JC
900 }
901 } else if (session->l2specific_type == L2TP_L2SPECTYPE_DEFAULT) {
b71a61cc 902 u32 l2h = ntohl(*(__be32 *)ptr);
f7faffa3
JC
903
904 if (l2h & 0x40000000) {
f7faffa3 905 /* Store L2TP info in the skb */
12923365 906 L2TP_SKB_CB(skb)->ns = l2h & 0x00ffffff;
f7faffa3 907 L2TP_SKB_CB(skb)->has_seq = 1;
f7faffa3 908 }
62e7b6a5 909 ptr += 4;
fd558d18
JC
910 }
911
912 if (L2TP_SKB_CB(skb)->has_seq) {
20dcb110 913 /* Received a packet with sequence numbers. If we're the LAC,
fd558d18
JC
914 * check if we sre sending sequence numbers and if not,
915 * configure it so.
916 */
6c0ec37b 917 if (!session->lns_mode && !session->send_seq) {
6b7bdcd7 918 trace_session_seqnum_lns_enable(session);
3f9b9770 919 session->send_seq = 1;
24256415
JC
920 l2tp_session_set_header_len(session, tunnel->version,
921 tunnel->encap);
fd558d18
JC
922 }
923 } else {
924 /* No sequence numbers.
925 * If user has configured mandatory sequence numbers, discard.
926 */
927 if (session->recv_seq) {
3e59e885
MS
928 pr_debug_ratelimited("%s: recv data has no seq numbers when required. Discarding.\n",
929 session->name);
7b7c0719 930 atomic_long_inc(&session->stats.rx_seq_discards);
fd558d18
JC
931 goto discard;
932 }
933
934 /* If we're the LAC and we're sending sequence numbers, the
935 * LNS has requested that we no longer send sequence numbers.
936 * If we're the LNS and we're sending sequence numbers, the
937 * LAC is broken. Discard the frame.
938 */
6c0ec37b 939 if (!session->lns_mode && session->send_seq) {
6b7bdcd7 940 trace_session_seqnum_lns_disable(session);
fd558d18 941 session->send_seq = 0;
24256415
JC
942 l2tp_session_set_header_len(session, tunnel->version,
943 tunnel->encap);
fd558d18 944 } else if (session->send_seq) {
3e59e885
MS
945 pr_debug_ratelimited("%s: recv data has no seq numbers when required. Discarding.\n",
946 session->name);
7b7c0719 947 atomic_long_inc(&session->stats.rx_seq_discards);
fd558d18
JC
948 goto discard;
949 }
950 }
951
900631ee
JC
952 /* Session data offset is defined only for L2TPv2 and is
953 * indicated by an optional 16-bit value in the header.
f7faffa3
JC
954 */
955 if (tunnel->version == L2TP_HDR_VER_2) {
956 /* If offset bit set, skip it. */
957 if (hdrflags & L2TP_HDRFLAG_O) {
958 offset = ntohs(*(__be16 *)ptr);
959 ptr += 2 + offset;
960 }
900631ee 961 }
fd558d18
JC
962
963 offset = ptr - optr;
964 if (!pskb_may_pull(skb, offset))
965 goto discard;
966
967 __skb_pull(skb, offset);
968
fd558d18
JC
969 /* Prepare skb for adding to the session's reorder_q. Hold
970 * packets for max reorder_timeout or 1 second if not
971 * reordering.
972 */
973 L2TP_SKB_CB(skb)->length = length;
974 L2TP_SKB_CB(skb)->expires = jiffies +
975 (session->reorder_timeout ? session->reorder_timeout : HZ);
976
977 /* Add packet to the session's receive queue. Reordering is done here, if
978 * enabled. Saved L2TP protocol info is stored in skb->cb[].
979 */
980 if (L2TP_SKB_CB(skb)->has_seq) {
b6dc01a4
JC
981 if (l2tp_recv_data_seq(session, skb))
982 goto discard;
fd558d18
JC
983 } else {
984 /* No sequence numbers. Add the skb to the tail of the
985 * reorder queue. This ensures that it will be
986 * delivered after all previous sequenced skbs.
987 */
988 skb_queue_tail(&session->reorder_q, skb);
989 }
990
991 /* Try to dequeue as many skbs from reorder_q as we can. */
992 l2tp_recv_dequeue(session);
993
f7faffa3 994 return;
fd558d18
JC
995
996discard:
7b7c0719 997 atomic_long_inc(&session->stats.rx_errors);
fd558d18 998 kfree_skb(skb);
f7faffa3 999}
ca7885db 1000EXPORT_SYMBOL_GPL(l2tp_recv_common);
f7faffa3 1001
48f72f92
TP
1002/* Drop skbs from the session's reorder_q
1003 */
493048f5 1004static void l2tp_session_queue_purge(struct l2tp_session *session)
48f72f92
TP
1005{
1006 struct sk_buff *skb = NULL;
b71a61cc 1007
48f72f92
TP
1008 while ((skb = skb_dequeue(&session->reorder_q))) {
1009 atomic_long_inc(&session->stats.rx_errors);
1010 kfree_skb(skb);
48f72f92 1011 }
48f72f92 1012}
48f72f92 1013
ff6a2ac2
JC
1014/* UDP encapsulation receive handler. See net/ipv4/udp.c for details. */
1015int l2tp_udp_encap_recv(struct sock *sk, struct sk_buff *skb)
f7faffa3
JC
1016{
1017 struct l2tp_session *session = NULL;
ff6a2ac2
JC
1018 struct l2tp_tunnel *tunnel = NULL;
1019 struct net *net = sock_net(sk);
f7faffa3
JC
1020 unsigned char *ptr, *optr;
1021 u16 hdrflags;
f7faffa3
JC
1022 u16 version;
1023 int length;
1024
aa785f93 1025 /* UDP has verified checksum */
f7faffa3
JC
1026
1027 /* UDP always verifies the packet length. */
1028 __skb_pull(skb, sizeof(struct udphdr));
1029
1030 /* Short packet? */
ff6a2ac2
JC
1031 if (!pskb_may_pull(skb, L2TP_HDR_SIZE_MAX))
1032 goto pass;
f7faffa3 1033
e50e705c 1034 /* Point to L2TP header */
95075150
TP
1035 optr = skb->data;
1036 ptr = skb->data;
e50e705c 1037
f7faffa3 1038 /* Get L2TP header flags */
b71a61cc 1039 hdrflags = ntohs(*(__be16 *)ptr);
f7faffa3 1040
36479805 1041 /* Get protocol version */
f7faffa3 1042 version = hdrflags & L2TP_HDR_VER_MASK;
f7faffa3
JC
1043
1044 /* Get length of L2TP packet */
1045 length = skb->len;
1046
1047 /* If type is control packet, it is handled by userspace. */
12923365 1048 if (hdrflags & L2TP_HDRFLAG_T)
3e59e885 1049 goto pass;
f7faffa3
JC
1050
1051 /* Skip flags */
1052 ptr += 2;
1053
36479805 1054 if (version == L2TP_HDR_VER_2) {
ff6a2ac2
JC
1055 u16 tunnel_id, session_id;
1056
f7faffa3
JC
1057 /* If length is present, skip it */
1058 if (hdrflags & L2TP_HDRFLAG_L)
1059 ptr += 2;
1060
1061 /* Extract tunnel and session ID */
b71a61cc 1062 tunnel_id = ntohs(*(__be16 *)ptr);
f7faffa3 1063 ptr += 2;
b71a61cc 1064 session_id = ntohs(*(__be16 *)ptr);
f7faffa3 1065 ptr += 2;
ff6a2ac2
JC
1066
1067 session = l2tp_v2_session_get(net, tunnel_id, session_id);
f7faffa3 1068 } else {
ff6a2ac2
JC
1069 u32 session_id;
1070
f7faffa3 1071 ptr += 2; /* skip reserved bits */
b71a61cc 1072 session_id = ntohl(*(__be32 *)ptr);
f7faffa3 1073 ptr += 4;
f7faffa3 1074
ff6a2ac2 1075 session = l2tp_v3_session_get(net, sk, session_id);
36479805
ST
1076 }
1077
309795f4 1078 if (!session || !session->recv_skb) {
a4346210 1079 if (session)
abe7a1a7 1080 l2tp_session_put(session);
61b9a047 1081
f7faffa3 1082 /* Not found? Pass to userspace to deal with */
3e59e885 1083 goto pass;
f7faffa3
JC
1084 }
1085
ff6a2ac2
JC
1086 tunnel = session->tunnel;
1087
1088 /* Check protocol version */
1089 if (version != tunnel->version)
1090 goto invalid;
1091
1092 if (version == L2TP_HDR_VER_3 &&
9b6ff7eb 1093 l2tp_v3_ensure_opt_in_linear(session, skb, &ptr, &optr)) {
abe7a1a7 1094 l2tp_session_put(session);
3e59e885 1095 goto invalid;
9b6ff7eb 1096 }
4522a70d 1097
2b139e6b 1098 l2tp_recv_common(session, skb, ptr, optr, hdrflags, length);
abe7a1a7 1099 l2tp_session_put(session);
fd558d18
JC
1100
1101 return 0;
1102
3e59e885
MS
1103invalid:
1104 atomic_long_inc(&tunnel->stats.rx_invalid);
1105
1106pass:
fd558d18
JC
1107 /* Put UDP header back */
1108 __skb_push(skb, sizeof(struct udphdr));
1109
fd558d18
JC
1110 return 1;
1111}
1112EXPORT_SYMBOL_GPL(l2tp_udp_encap_recv);
1113
ff6a2ac2 1114/* UDP encapsulation receive error handler. See net/ipv4/udp.c for details. */
6e828dc6
TP
1115static void l2tp_udp_encap_err_recv(struct sock *sk, struct sk_buff *skb, int err,
1116 __be16 port, u32 info, u8 *payload)
1117{
6e828dc6
TP
1118 sk->sk_err = err;
1119 sk_error_report(sk);
1120
1121 if (ip_hdr(skb)->version == IPVERSION) {
1122 if (inet_test_bit(RECVERR, sk))
1123 return ip_icmp_error(sk, skb, err, port, info, payload);
1124#if IS_ENABLED(CONFIG_IPV6)
1125 } else {
1126 if (inet6_test_bit(RECVERR6, sk))
1127 return ipv6_icmp_error(sk, skb, err, port, info, payload);
1128#endif
1129 }
1130}
1131
fd558d18
JC
1132/************************************************************************
1133 * Transmit handling
1134 ***********************************************************************/
1135
1136/* Build an L2TP header for the session into the buffer provided.
1137 */
f7faffa3 1138static int l2tp_build_l2tpv2_header(struct l2tp_session *session, void *buf)
fd558d18 1139{
f7faffa3 1140 struct l2tp_tunnel *tunnel = session->tunnel;
fd558d18 1141 __be16 *bufp = buf;
f7faffa3 1142 __be16 *optr = buf;
fd558d18
JC
1143 u16 flags = L2TP_HDR_VER_2;
1144 u32 tunnel_id = tunnel->peer_tunnel_id;
1145 u32 session_id = session->peer_session_id;
1146
1147 if (session->send_seq)
1148 flags |= L2TP_HDRFLAG_S;
1149
1150 /* Setup L2TP header. */
1151 *bufp++ = htons(flags);
1152 *bufp++ = htons(tunnel_id);
1153 *bufp++ = htons(session_id);
1154 if (session->send_seq) {
1155 *bufp++ = htons(session->ns);
1156 *bufp++ = 0;
1157 session->ns++;
f7faffa3 1158 session->ns &= 0xffff;
6b7bdcd7 1159 trace_session_seqnum_update(session);
fd558d18 1160 }
f7faffa3
JC
1161
1162 return bufp - optr;
fd558d18
JC
1163}
1164
f7faffa3 1165static int l2tp_build_l2tpv3_header(struct l2tp_session *session, void *buf)
fd558d18 1166{
0d76751f 1167 struct l2tp_tunnel *tunnel = session->tunnel;
f7faffa3
JC
1168 char *bufp = buf;
1169 char *optr = bufp;
f7faffa3 1170
0d76751f
JC
1171 /* Setup L2TP header. The header differs slightly for UDP and
1172 * IP encapsulations. For UDP, there is 4 bytes of flags.
1173 */
1174 if (tunnel->encap == L2TP_ENCAPTYPE_UDP) {
1175 u16 flags = L2TP_HDR_VER_3;
b71a61cc 1176 *((__be16 *)bufp) = htons(flags);
0d76751f 1177 bufp += 2;
b71a61cc 1178 *((__be16 *)bufp) = 0;
0d76751f
JC
1179 bufp += 2;
1180 }
1181
b71a61cc 1182 *((__be32 *)bufp) = htonl(session->peer_session_id);
f7faffa3
JC
1183 bufp += 4;
1184 if (session->cookie_len) {
1185 memcpy(bufp, &session->cookie[0], session->cookie_len);
1186 bufp += session->cookie_len;
1187 }
62e7b6a5
LB
1188 if (session->l2specific_type == L2TP_L2SPECTYPE_DEFAULT) {
1189 u32 l2h = 0;
f7faffa3 1190
62e7b6a5
LB
1191 if (session->send_seq) {
1192 l2h = 0x40000000 | session->ns;
1193 session->ns++;
1194 session->ns &= 0xffffff;
6b7bdcd7 1195 trace_session_seqnum_update(session);
f7faffa3 1196 }
62e7b6a5
LB
1197
1198 *((__be32 *)bufp) = htonl(l2h);
1199 bufp += 4;
f7faffa3 1200 }
fd558d18 1201
f7faffa3 1202 return bufp - optr;
fd558d18 1203}
fd558d18 1204
de68b039
TP
1205/* Queue the packet to IP for output: tunnel socket lock must be held */
1206static int l2tp_xmit_queue(struct l2tp_tunnel *tunnel, struct sk_buff *skb, struct flowi *fl)
fd558d18 1207{
de68b039 1208 int err;
fd558d18 1209
60ff7467 1210 skb->ignore_df = 1;
27d53323 1211 skb_dst_drop(skb);
d2cf3361 1212#if IS_ENABLED(CONFIG_IPV6)
b954f940 1213 if (l2tp_sk_is_v6(tunnel->sock))
de68b039 1214 err = inet6_csk_xmit(tunnel->sock, skb, NULL);
d2cf3361
BL
1215 else
1216#endif
de68b039 1217 err = ip_queue_xmit(tunnel->sock, skb, fl);
fd558d18 1218
de68b039 1219 return err >= 0 ? NET_XMIT_SUCCESS : NET_XMIT_DROP;
fd558d18 1220}
fd558d18 1221
f52e4b27 1222static int l2tp_xmit_core(struct l2tp_session *session, struct sk_buff *skb, unsigned int *len)
fd558d18 1223{
0d76751f 1224 struct l2tp_tunnel *tunnel = session->tunnel;
de68b039 1225 unsigned int data_len = skb->len;
0d76751f 1226 struct sock *sk = tunnel->sock;
de68b039 1227 int headroom, uhlen, udp_len;
b8c84307 1228 int ret = NET_XMIT_SUCCESS;
de68b039
TP
1229 struct inet_sock *inet;
1230 struct udphdr *uh;
fd558d18
JC
1231
1232 /* Check that there's enough headroom in the skb to insert IP,
1233 * UDP and L2TP headers. If not enough, expand it to
1234 * make room. Adjust truesize.
1235 */
de68b039
TP
1236 uhlen = (tunnel->encap == L2TP_ENCAPTYPE_UDP) ? sizeof(*uh) : 0;
1237 headroom = NET_SKB_PAD + sizeof(struct iphdr) + uhlen + session->hdr_len;
835acf5d 1238 if (skb_cow_head(skb, headroom)) {
b8c84307
ED
1239 kfree_skb(skb);
1240 return NET_XMIT_DROP;
835acf5d 1241 }
fd558d18 1242
fd558d18 1243 /* Setup L2TP header */
2dedab6f 1244 if (tunnel->version == L2TP_HDR_VER_2)
efe05278 1245 l2tp_build_l2tpv2_header(session, __skb_push(skb, session->hdr_len));
2dedab6f 1246 else
efe05278 1247 l2tp_build_l2tpv3_header(session, __skb_push(skb, session->hdr_len));
fd558d18 1248
0d76751f 1249 /* Reset skb netfilter state */
fd558d18 1250 memset(&(IPCB(skb)->opt), 0, sizeof(IPCB(skb)->opt));
de68b039 1251 IPCB(skb)->flags &= ~(IPSKB_XFRM_TUNNEL_SIZE | IPSKB_XFRM_TRANSFORMED | IPSKB_REROUTED);
895b5c9f 1252 nf_reset_ct(skb);
fd558d18 1253
86a41ea9
JC
1254 /* L2TP uses its own lockdep subclass to avoid lockdep splats caused by
1255 * nested socket calls on the same lockdep socket class. This can
1256 * happen when data from a user socket is routed over l2tp, which uses
1257 * another userspace socket.
1258 */
1259 spin_lock_nested(&sk->sk_lock.slock, L2TP_DEPTH_NESTING);
1260
6af88da1 1261 if (sock_owned_by_user(sk)) {
b8c84307
ED
1262 kfree_skb(skb);
1263 ret = NET_XMIT_DROP;
6af88da1
DM
1264 goto out_unlock;
1265 }
1266
b954f940
PA
1267 /* The user-space may change the connection status for the user-space
1268 * provided socket at run time: we must check it under the socket lock
1269 */
1270 if (tunnel->fd >= 0 && sk->sk_state != TCP_ESTABLISHED) {
1271 kfree_skb(skb);
1272 ret = NET_XMIT_DROP;
1273 goto out_unlock;
1274 }
1275
f52e4b27
TP
1276 /* Report transmitted length before we add encap header, which keeps
1277 * statistics consistent for both UDP and IP encap tx/rx paths.
1278 */
1279 *len = skb->len;
1280
d9d8da80 1281 inet = inet_sk(sk);
0d76751f
JC
1282 switch (tunnel->encap) {
1283 case L2TP_ENCAPTYPE_UDP:
1284 /* Setup UDP header */
0d76751f
JC
1285 __skb_push(skb, sizeof(*uh));
1286 skb_reset_transport_header(skb);
1287 uh = udp_hdr(skb);
1288 uh->source = inet->inet_sport;
1289 uh->dest = inet->inet_dport;
efe05278 1290 udp_len = uhlen + session->hdr_len + data_len;
0d76751f 1291 uh->len = htons(udp_len);
0d76751f
JC
1292
1293 /* Calculate UDP checksum if configured to do so */
d2cf3361 1294#if IS_ENABLED(CONFIG_IPV6)
b954f940 1295 if (l2tp_sk_is_v6(sk))
77157e19
TH
1296 udp6_set_csum(udp_get_no_check6_tx(sk),
1297 skb, &inet6_sk(sk)->saddr,
1298 &sk->sk_v6_daddr, udp_len);
d2cf3361
BL
1299 else
1300#endif
0864e331
TP
1301 udp_set_csum(sk->sk_no_check_tx, skb, inet->inet_saddr,
1302 inet->inet_daddr, udp_len);
0d76751f
JC
1303 break;
1304
1305 case L2TP_ENCAPTYPE_IP:
1306 break;
fd558d18
JC
1307 }
1308
de68b039
TP
1309 ret = l2tp_xmit_queue(tunnel, skb, &inet->cork.fl);
1310
6af88da1 1311out_unlock:
86a41ea9 1312 spin_unlock(&sk->sk_lock.slock);
fd558d18 1313
b8c84307 1314 return ret;
fd558d18 1315}
de68b039
TP
1316
1317/* If caller requires the skb to have a ppp header, the header must be
1318 * inserted in the skb data before calling this function.
1319 */
1320int l2tp_xmit_skb(struct l2tp_session *session, struct sk_buff *skb)
1321{
f52e4b27 1322 unsigned int len = 0;
de68b039
TP
1323 int ret;
1324
f52e4b27 1325 ret = l2tp_xmit_core(session, skb, &len);
de68b039
TP
1326 if (ret == NET_XMIT_SUCCESS) {
1327 atomic_long_inc(&session->tunnel->stats.tx_packets);
1328 atomic_long_add(len, &session->tunnel->stats.tx_bytes);
1329 atomic_long_inc(&session->stats.tx_packets);
1330 atomic_long_add(len, &session->stats.tx_bytes);
1331 } else {
1332 atomic_long_inc(&session->tunnel->stats.tx_errors);
1333 atomic_long_inc(&session->stats.tx_errors);
1334 }
1335 return ret;
1336}
fd558d18
JC
1337EXPORT_SYMBOL_GPL(l2tp_xmit_skb);
1338
1339/*****************************************************************************
1340 * Tunnel and session create/destroy.
1341 *****************************************************************************/
1342
d18d3f0a 1343/* Remove an l2tp session from l2tp_core's lists. */
b2aecfe8
TP
1344static void l2tp_session_unhash(struct l2tp_session *session)
1345{
1346 struct l2tp_tunnel *tunnel = session->tunnel;
1347
b2aecfe8 1348 if (tunnel) {
2a3339f6
JC
1349 struct l2tp_net *pn = l2tp_pernet(tunnel->l2tp_net);
1350 struct l2tp_session *removed = session;
1351
d18d3f0a 1352 spin_lock_bh(&tunnel->list_lock);
d587d825
JC
1353 spin_lock_bh(&pn->l2tp_session_idr_lock);
1354
1355 /* Remove from the per-tunnel list */
d18d3f0a 1356 list_del_init(&session->list);
b2aecfe8 1357
2a3339f6 1358 /* Remove from per-net IDR */
aa5e17e1 1359 if (tunnel->version == L2TP_HDR_VER_3) {
aa5e17e1
JC
1360 if (hash_hashed(&session->hlist))
1361 l2tp_session_collision_del(pn, session);
1362 else
1363 removed = idr_remove(&pn->l2tp_v3_session_idr,
1364 session->session_id);
2a3339f6
JC
1365 } else {
1366 u32 session_key = l2tp_v2_session_key(tunnel->tunnel_id,
1367 session->session_id);
1368 removed = idr_remove(&pn->l2tp_v2_session_idr,
1369 session_key);
b2aecfe8 1370 }
2a3339f6 1371 WARN_ON_ONCE(removed && removed != session);
d587d825 1372
2a3339f6 1373 spin_unlock_bh(&pn->l2tp_session_idr_lock);
d587d825 1374 spin_unlock_bh(&tunnel->list_lock);
b2aecfe8
TP
1375 }
1376}
1377
fd558d18
JC
1378/* When the tunnel is closed, all the attached sessions need to go too.
1379 */
d08532bb 1380static void l2tp_tunnel_closeall(struct l2tp_tunnel *tunnel)
fd558d18 1381{
fd558d18
JC
1382 struct l2tp_session *session;
1383
d18d3f0a 1384 spin_lock_bh(&tunnel->list_lock);
f3c66d4e 1385 tunnel->acpt_newsess = false;
fc7ec7f5 1386 list_for_each_entry(session, &tunnel->session_list, list)
d18d3f0a 1387 l2tp_session_delete(session);
d18d3f0a 1388 spin_unlock_bh(&tunnel->list_lock);
fd558d18 1389}
fd558d18 1390
/* Tunnel socket destroy hook for UDP encapsulation. If the socket still
 * maps to a tunnel, schedule that tunnel for deletion and release the
 * reference obtained by the lookup.
 */
static void l2tp_udp_encap_destroy(struct sock *sk)
{
	struct l2tp_tunnel *tunnel = l2tp_sk_to_tunnel(sk);

	if (!tunnel)
		return;

	l2tp_tunnel_delete(tunnel);
	l2tp_tunnel_put(tunnel);
}
1402
c4d48a58
CW
1403static void l2tp_tunnel_remove(struct net *net, struct l2tp_tunnel *tunnel)
1404{
1405 struct l2tp_net *pn = l2tp_pernet(net);
1406
1407 spin_lock_bh(&pn->l2tp_tunnel_idr_lock);
1408 idr_remove(&pn->l2tp_tunnel_idr, tunnel->tunnel_id);
1409 spin_unlock_bh(&pn->l2tp_tunnel_idr_lock);
1410}
1411
f8ccac0e
TP
1412/* Workqueue tunnel deletion function */
1413static void l2tp_tunnel_del_work(struct work_struct *work)
1414{
d00fa9ad
JC
1415 struct l2tp_tunnel *tunnel = container_of(work, struct l2tp_tunnel,
1416 del_work);
1417 struct sock *sk = tunnel->sock;
1418 struct socket *sock = sk->sk_socket;
12d656af
RK
1419
1420 l2tp_tunnel_closeall(tunnel);
1421
76a6abdb 1422 /* If the tunnel socket was created within the kernel, use
02d13ed5 1423 * the sk API to release it here.
f8ccac0e 1424 */
76a6abdb 1425 if (tunnel->fd < 0) {
26abe143 1426 if (sock) {
02d13ed5 1427 kernel_sock_shutdown(sock, SHUT_RDWR);
26abe143
EB
1428 sock_release(sock);
1429 }
167eb17e 1430 }
f8ccac0e 1431
c4d48a58 1432 l2tp_tunnel_remove(tunnel->l2tp_net, tunnel);
d00fa9ad 1433 /* drop initial ref */
abe7a1a7 1434 l2tp_tunnel_put(tunnel);
d00fa9ad
JC
1435
1436 /* drop workqueue ref */
abe7a1a7 1437 l2tp_tunnel_put(tunnel);
fd558d18 1438}
fd558d18 1439
789a4a2c
JC
1440/* Create a socket for the tunnel, if one isn't set up by
1441 * userspace. This is used for static tunnels where there is no
1442 * managing L2TP daemon.
167eb17e
TP
1443 *
1444 * Since we don't want these sockets to keep a namespace alive by
1445 * themselves, we drop the socket's namespace refcount after creation.
1446 * These sockets are freed when the namespace exits using the pernet
1447 * exit hook.
789a4a2c 1448 */
167eb17e 1449static int l2tp_tunnel_sock_create(struct net *net,
8ce9825a
TP
1450 u32 tunnel_id,
1451 u32 peer_tunnel_id,
1452 struct l2tp_tunnel_cfg *cfg,
1453 struct socket **sockp)
789a4a2c
JC
1454{
1455 int err = -EINVAL;
167eb17e 1456 struct socket *sock = NULL;
85644b4d 1457 struct udp_port_cfg udp_conf;
789a4a2c
JC
1458
1459 switch (cfg->encap) {
1460 case L2TP_ENCAPTYPE_UDP:
85644b4d
TH
1461 memset(&udp_conf, 0, sizeof(udp_conf));
1462
f9bac8df
CE
1463#if IS_ENABLED(CONFIG_IPV6)
1464 if (cfg->local_ip6 && cfg->peer_ip6) {
85644b4d
TH
1465 udp_conf.family = AF_INET6;
1466 memcpy(&udp_conf.local_ip6, cfg->local_ip6,
1467 sizeof(udp_conf.local_ip6));
1468 memcpy(&udp_conf.peer_ip6, cfg->peer_ip6,
1469 sizeof(udp_conf.peer_ip6));
1470 udp_conf.use_udp6_tx_checksums =
b71a61cc 1471 !cfg->udp6_zero_tx_checksums;
85644b4d 1472 udp_conf.use_udp6_rx_checksums =
b71a61cc 1473 !cfg->udp6_zero_rx_checksums;
f9bac8df
CE
1474 } else
1475#endif
1476 {
85644b4d
TH
1477 udp_conf.family = AF_INET;
1478 udp_conf.local_ip = cfg->local_ip;
1479 udp_conf.peer_ip = cfg->peer_ip;
1480 udp_conf.use_udp_checksums = cfg->use_udp_checksums;
f9bac8df 1481 }
789a4a2c 1482
85644b4d
TH
1483 udp_conf.local_udp_port = htons(cfg->local_udp_port);
1484 udp_conf.peer_udp_port = htons(cfg->peer_udp_port);
1485
1486 err = udp_sock_create(net, &udp_conf, &sock);
1487 if (err < 0)
1488 goto out;
789a4a2c
JC
1489
1490 break;
1491
1492 case L2TP_ENCAPTYPE_IP:
f9bac8df
CE
1493#if IS_ENABLED(CONFIG_IPV6)
1494 if (cfg->local_ip6 && cfg->peer_ip6) {
85644b4d
TH
1495 struct sockaddr_l2tpip6 ip6_addr = {0};
1496
26abe143 1497 err = sock_create_kern(net, AF_INET6, SOCK_DGRAM,
8ce9825a 1498 IPPROTO_L2TP, &sock);
5dac94e1
JC
1499 if (err < 0)
1500 goto out;
789a4a2c 1501
5dac94e1
JC
1502 ip6_addr.l2tp_family = AF_INET6;
1503 memcpy(&ip6_addr.l2tp_addr, cfg->local_ip6,
1504 sizeof(ip6_addr.l2tp_addr));
1505 ip6_addr.l2tp_conn_id = tunnel_id;
b71a61cc 1506 err = kernel_bind(sock, (struct sockaddr *)&ip6_addr,
5dac94e1
JC
1507 sizeof(ip6_addr));
1508 if (err < 0)
1509 goto out;
789a4a2c 1510
5dac94e1
JC
1511 ip6_addr.l2tp_family = AF_INET6;
1512 memcpy(&ip6_addr.l2tp_addr, cfg->peer_ip6,
1513 sizeof(ip6_addr.l2tp_addr));
1514 ip6_addr.l2tp_conn_id = peer_tunnel_id;
1515 err = kernel_connect(sock,
b71a61cc 1516 (struct sockaddr *)&ip6_addr,
5dac94e1
JC
1517 sizeof(ip6_addr), 0);
1518 if (err < 0)
1519 goto out;
1520 } else
1521#endif
1522 {
85644b4d
TH
1523 struct sockaddr_l2tpip ip_addr = {0};
1524
26abe143 1525 err = sock_create_kern(net, AF_INET, SOCK_DGRAM,
8ce9825a 1526 IPPROTO_L2TP, &sock);
5dac94e1
JC
1527 if (err < 0)
1528 goto out;
789a4a2c 1529
5dac94e1
JC
1530 ip_addr.l2tp_family = AF_INET;
1531 ip_addr.l2tp_addr = cfg->local_ip;
1532 ip_addr.l2tp_conn_id = tunnel_id;
b71a61cc 1533 err = kernel_bind(sock, (struct sockaddr *)&ip_addr,
5dac94e1
JC
1534 sizeof(ip_addr));
1535 if (err < 0)
1536 goto out;
1537
1538 ip_addr.l2tp_family = AF_INET;
1539 ip_addr.l2tp_addr = cfg->peer_ip;
1540 ip_addr.l2tp_conn_id = peer_tunnel_id;
b71a61cc 1541 err = kernel_connect(sock, (struct sockaddr *)&ip_addr,
5dac94e1
JC
1542 sizeof(ip_addr), 0);
1543 if (err < 0)
1544 goto out;
1545 }
789a4a2c
JC
1546 break;
1547
1548 default:
1549 goto out;
1550 }
1551
1552out:
167eb17e 1553 *sockp = sock;
6c0ec37b 1554 if (err < 0 && sock) {
167eb17e 1555 kernel_sock_shutdown(sock, SHUT_RDWR);
26abe143 1556 sock_release(sock);
789a4a2c
JC
1557 *sockp = NULL;
1558 }
1559
1560 return err;
1561}
1562
c9ccd4c6 1563int l2tp_tunnel_create(int fd, int version, u32 tunnel_id, u32 peer_tunnel_id,
c0235fb3 1564 struct l2tp_tunnel_cfg *cfg, struct l2tp_tunnel **tunnelp)
fd558d18
JC
1565{
1566 struct l2tp_tunnel *tunnel = NULL;
1567 int err;
0d76751f 1568 enum l2tp_encap_type encap = L2TP_ENCAPTYPE_UDP;
fd558d18 1569
0febc7b3 1570 if (cfg)
0d76751f
JC
1571 encap = cfg->encap;
1572
70c05bfa 1573 tunnel = kzalloc(sizeof(*tunnel), GFP_KERNEL);
0febc7b3 1574 if (!tunnel) {
fd558d18
JC
1575 err = -ENOMEM;
1576 goto err;
1577 }
1578
1579 tunnel->version = version;
1580 tunnel->tunnel_id = tunnel_id;
1581 tunnel->peer_tunnel_id = peer_tunnel_id;
fd558d18 1582
fd558d18 1583 sprintf(&tunnel->name[0], "tunl %u", tunnel_id);
d18d3f0a 1584 spin_lock_init(&tunnel->list_lock);
f3c66d4e 1585 tunnel->acpt_newsess = true;
d18d3f0a 1586 INIT_LIST_HEAD(&tunnel->session_list);
fd558d18 1587
0d76751f 1588 tunnel->encap = encap;
fd558d18 1589
d00fa9ad 1590 refcount_set(&tunnel->ref_count, 1);
d00fa9ad
JC
1591 tunnel->fd = fd;
1592
f8ccac0e
TP
1593 /* Init delete workqueue struct */
1594 INIT_WORK(&tunnel->del_work, l2tp_tunnel_del_work);
1595
fd558d18
JC
1596 err = 0;
1597err:
1598 if (tunnelp)
1599 *tunnelp = tunnel;
1600
fd558d18
JC
1601 return err;
1602}
1603EXPORT_SYMBOL_GPL(l2tp_tunnel_create);
1604
6b9f3423
GN
1605static int l2tp_validate_socket(const struct sock *sk, const struct net *net,
1606 enum l2tp_encap_type encap)
1607{
4a4cd703
JC
1608 struct l2tp_tunnel *tunnel;
1609
6b9f3423
GN
1610 if (!net_eq(sock_net(sk), net))
1611 return -EINVAL;
1612
1613 if (sk->sk_type != SOCK_DGRAM)
1614 return -EPROTONOSUPPORT;
1615
d9a81a22
ED
1616 if (sk->sk_family != PF_INET && sk->sk_family != PF_INET6)
1617 return -EPROTONOSUPPORT;
1618
6b9f3423
GN
1619 if ((encap == L2TP_ENCAPTYPE_UDP && sk->sk_protocol != IPPROTO_UDP) ||
1620 (encap == L2TP_ENCAPTYPE_IP && sk->sk_protocol != IPPROTO_L2TP))
1621 return -EPROTONOSUPPORT;
1622
1461f5a3
CW
1623 if (encap == L2TP_ENCAPTYPE_UDP && sk->sk_user_data)
1624 return -EBUSY;
1625
4a4cd703
JC
1626 tunnel = l2tp_sk_to_tunnel(sk);
1627 if (tunnel) {
abe7a1a7 1628 l2tp_tunnel_put(tunnel);
6b9f3423 1629 return -EBUSY;
4a4cd703 1630 }
6b9f3423
GN
1631
1632 return 0;
1633}
1634
1635int l2tp_tunnel_register(struct l2tp_tunnel *tunnel, struct net *net,
1636 struct l2tp_tunnel_cfg *cfg)
1637{
c4d48a58
CW
1638 struct l2tp_net *pn = l2tp_pernet(net);
1639 u32 tunnel_id = tunnel->tunnel_id;
6b9f3423
GN
1640 struct socket *sock;
1641 struct sock *sk;
1642 int ret;
1643
c4d48a58
CW
1644 spin_lock_bh(&pn->l2tp_tunnel_idr_lock);
1645 ret = idr_alloc_u32(&pn->l2tp_tunnel_idr, NULL, &tunnel_id, tunnel_id,
1646 GFP_ATOMIC);
1647 spin_unlock_bh(&pn->l2tp_tunnel_idr_lock);
1648 if (ret)
1649 return ret == -ENOSPC ? -EEXIST : ret;
1650
6b9f3423
GN
1651 if (tunnel->fd < 0) {
1652 ret = l2tp_tunnel_sock_create(net, tunnel->tunnel_id,
1653 tunnel->peer_tunnel_id, cfg,
1654 &sock);
1655 if (ret < 0)
1656 goto err;
1657 } else {
1658 sock = sockfd_lookup(tunnel->fd, &ret);
1659 if (!sock)
1660 goto err;
6b9f3423
GN
1661 }
1662
b68777d5 1663 sk = sock->sk;
0b2c5972 1664 lock_sock(sk);
af295e85 1665 write_lock_bh(&sk->sk_callback_lock);
b68777d5 1666 ret = l2tp_validate_socket(sk, net, tunnel->encap);
b9fb10d1 1667 if (ret < 0)
af295e85 1668 goto err_inval_sock;
af295e85 1669 write_unlock_bh(&sk->sk_callback_lock);
b68777d5 1670
6b9f3423
GN
1671 if (tunnel->encap == L2TP_ENCAPTYPE_UDP) {
1672 struct udp_tunnel_sock_cfg udp_cfg = {
6b9f3423
GN
1673 .encap_type = UDP_ENCAP_L2TPINUDP,
1674 .encap_rcv = l2tp_udp_encap_recv,
6e828dc6 1675 .encap_err_rcv = l2tp_udp_encap_err_recv,
6b9f3423
GN
1676 .encap_destroy = l2tp_udp_encap_destroy,
1677 };
1678
1679 setup_udp_tunnel_sock(net, sock, &udp_cfg);
6b9f3423
GN
1680 }
1681
6b9f3423 1682 sk->sk_allocation = GFP_ATOMIC;
0b2c5972
CW
1683 release_sock(sk);
1684
1685 sock_hold(sk);
1686 tunnel->sock = sk;
1687 tunnel->l2tp_net = net;
1688
1689 spin_lock_bh(&pn->l2tp_tunnel_idr_lock);
1690 idr_replace(&pn->l2tp_tunnel_idr, tunnel, tunnel->tunnel_id);
1691 spin_unlock_bh(&pn->l2tp_tunnel_idr_lock);
6b9f3423 1692
6b7bdcd7
TP
1693 trace_register_tunnel(tunnel);
1694
6b9f3423
GN
1695 if (tunnel->fd >= 0)
1696 sockfd_put(sock);
1697
1698 return 0;
1699
af295e85
JS
1700err_inval_sock:
1701 write_unlock_bh(&sk->sk_callback_lock);
b9fb10d1 1702 release_sock(sk);
af295e85 1703
f6cd651b
GN
1704 if (tunnel->fd < 0)
1705 sock_release(sock);
1706 else
1707 sockfd_put(sock);
6b9f3423 1708err:
c4d48a58 1709 l2tp_tunnel_remove(net, tunnel);
6b9f3423
GN
1710 return ret;
1711}
1712EXPORT_SYMBOL_GPL(l2tp_tunnel_register);
1713
309795f4
JC
1714/* This function is used by the netlink TUNNEL_DELETE command.
1715 */
62b982ee 1716void l2tp_tunnel_delete(struct l2tp_tunnel *tunnel)
309795f4 1717{
62b982ee 1718 if (!test_and_set_bit(0, &tunnel->dead)) {
6b7bdcd7 1719 trace_delete_tunnel(tunnel);
abe7a1a7 1720 refcount_inc(&tunnel->ref_count);
62b982ee 1721 queue_work(l2tp_wq, &tunnel->del_work);
06a15f51 1722 }
309795f4
JC
1723}
1724EXPORT_SYMBOL_GPL(l2tp_tunnel_delete);
1725
628703f5 1726void l2tp_session_delete(struct l2tp_session *session)
309795f4 1727{
fc7ec7f5
JC
1728 if (!test_and_set_bit(0, &session->dead)) {
1729 trace_delete_session(session);
abe7a1a7 1730 refcount_inc(&session->ref_count);
fc7ec7f5
JC
1731 queue_work(l2tp_wq, &session->del_work);
1732 }
1733}
1734EXPORT_SYMBOL_GPL(l2tp_session_delete);
1735
1736/* Workqueue session deletion function */
1737static void l2tp_session_del_work(struct work_struct *work)
1738{
1739 struct l2tp_session *session = container_of(work, struct l2tp_session,
1740 del_work);
b228a940 1741
b2aecfe8 1742 l2tp_session_unhash(session);
4c6e2fd3 1743 l2tp_session_queue_purge(session);
0febc7b3 1744 if (session->session_close)
309795f4 1745 (*session->session_close)(session);
a4346210 1746
fc7ec7f5 1747 /* drop initial ref */
abe7a1a7 1748 l2tp_session_put(session);
fc7ec7f5
JC
1749
1750 /* drop workqueue ref */
abe7a1a7 1751 l2tp_session_put(session);
309795f4 1752}
309795f4 1753
f7faffa3 1754/* We come here whenever a session's send_seq, cookie_len or
62e7b6a5 1755 * l2specific_type parameters are set.
f7faffa3 1756 */
24256415
JC
1757void l2tp_session_set_header_len(struct l2tp_session *session, int version,
1758 enum l2tp_encap_type encap)
f7faffa3
JC
1759{
1760 if (version == L2TP_HDR_VER_2) {
1761 session->hdr_len = 6;
1762 if (session->send_seq)
1763 session->hdr_len += 4;
1764 } else {
62e7b6a5
LB
1765 session->hdr_len = 4 + session->cookie_len;
1766 session->hdr_len += l2tp_get_l2specific_len(session);
24256415 1767 if (encap == L2TP_ENCAPTYPE_UDP)
0d76751f 1768 session->hdr_len += 4;
f7faffa3 1769 }
f7faffa3 1770}
bb5016ea 1771EXPORT_SYMBOL_GPL(l2tp_session_set_header_len);
f7faffa3 1772
c0235fb3
TP
1773struct l2tp_session *l2tp_session_create(int priv_size, struct l2tp_tunnel *tunnel, u32 session_id,
1774 u32 peer_session_id, struct l2tp_session_cfg *cfg)
fd558d18
JC
1775{
1776 struct l2tp_session *session;
1777
70c05bfa 1778 session = kzalloc(sizeof(*session) + priv_size, GFP_KERNEL);
0febc7b3 1779 if (session) {
fd558d18 1780 session->magic = L2TP_SESSION_MAGIC;
fd558d18
JC
1781
1782 session->session_id = session_id;
1783 session->peer_session_id = peer_session_id;
d301e325 1784 session->nr = 0;
8a1631d5
JC
1785 if (tunnel->version == L2TP_HDR_VER_2)
1786 session->nr_max = 0xffff;
1787 else
1788 session->nr_max = 0xffffff;
1789 session->nr_window_size = session->nr_max / 2;
a0dbd822
JC
1790 session->nr_oos_count_max = 4;
1791
1792 /* Use NR of first received packet */
1793 session->reorder_skip = 1;
fd558d18
JC
1794
1795 sprintf(&session->name[0], "sess %u/%u",
1796 tunnel->tunnel_id, session->session_id);
1797
1798 skb_queue_head_init(&session->reorder_q);
1799
aa5e17e1 1800 session->hlist_key = l2tp_v3_session_hashkey(tunnel->sock, session->session_id);
fd558d18 1801 INIT_HLIST_NODE(&session->hlist);
aa5e17e1 1802 INIT_LIST_HEAD(&session->clist);
d18d3f0a 1803 INIT_LIST_HEAD(&session->list);
fc7ec7f5 1804 INIT_WORK(&session->del_work, l2tp_session_del_work);
fd558d18 1805
fd558d18 1806 if (cfg) {
f7faffa3 1807 session->pwtype = cfg->pw_type;
fd558d18
JC
1808 session->send_seq = cfg->send_seq;
1809 session->recv_seq = cfg->recv_seq;
1810 session->lns_mode = cfg->lns_mode;
f7faffa3 1811 session->reorder_timeout = cfg->reorder_timeout;
f7faffa3 1812 session->l2specific_type = cfg->l2specific_type;
f7faffa3
JC
1813 session->cookie_len = cfg->cookie_len;
1814 memcpy(&session->cookie[0], &cfg->cookie[0], cfg->cookie_len);
1815 session->peer_cookie_len = cfg->peer_cookie_len;
1816 memcpy(&session->peer_cookie[0], &cfg->peer_cookie[0], cfg->peer_cookie_len);
fd558d18
JC
1817 }
1818
24256415 1819 l2tp_session_set_header_len(session, tunnel->version, tunnel->encap);
f7faffa3 1820
9ee369a4
GN
1821 refcount_set(&session->ref_count, 1);
1822
dbdbc73b 1823 return session;
fd558d18
JC
1824 }
1825
dbdbc73b 1826 return ERR_PTR(-ENOMEM);
fd558d18
JC
1827}
1828EXPORT_SYMBOL_GPL(l2tp_session_create);
1829
1830/*****************************************************************************
1831 * Init and cleanup
1832 *****************************************************************************/
1833
1834static __net_init int l2tp_init_net(struct net *net)
1835{
e773aaff 1836 struct l2tp_net *pn = net_generic(net, l2tp_net_id);
fd558d18 1837
c4d48a58
CW
1838 idr_init(&pn->l2tp_tunnel_idr);
1839 spin_lock_init(&pn->l2tp_tunnel_idr_lock);
fd558d18 1840
2a3339f6 1841 idr_init(&pn->l2tp_v2_session_idr);
aa5e17e1
JC
1842 idr_init(&pn->l2tp_v3_session_idr);
1843 spin_lock_init(&pn->l2tp_session_idr_lock);
f7faffa3 1844
fd558d18 1845 return 0;
fd558d18
JC
1846}
1847
5dfa598b 1848static __net_exit void l2tp_pre_exit_net(struct net *net)
167eb17e
TP
1849{
1850 struct l2tp_net *pn = l2tp_pernet(net);
1851 struct l2tp_tunnel *tunnel = NULL;
c4d48a58 1852 unsigned long tunnel_id, tmp;
167eb17e
TP
1853
1854 rcu_read_lock_bh();
c4d48a58
CW
1855 idr_for_each_entry_ul(&pn->l2tp_tunnel_idr, tunnel, tmp, tunnel_id) {
1856 if (tunnel)
1857 l2tp_tunnel_delete(tunnel);
167eb17e
TP
1858 }
1859 rcu_read_unlock_bh();
2f86953e 1860
c1b2e36b 1861 if (l2tp_wq) {
73d33bd0
JC
1862 /* Run all TUNNEL_DELETE work items just queued. */
1863 __flush_workqueue(l2tp_wq);
1864
1865 /* Each TUNNEL_DELETE work item will queue a SESSION_DELETE
1866 * work item for each session in the tunnel. Flush the
1867 * workqueue again to process these.
c1b2e36b
JC
1868 */
1869 __flush_workqueue(l2tp_wq);
c1b2e36b 1870 }
5dfa598b
JC
1871}
1872
/* idr_for_each() callback used at namespace exit to flag a leftover IDR
 * entry. @id is the ID of the entry found in the IDR, @p the entry itself
 * (unused) and @data the name of the IDR being checked.
 *
 * Returns 1, which is non-zero, so only the first leftover entry of an
 * IDR is reported.
 */
static int l2tp_idr_item_unexpected(int id, void *p, void *data)
{
	const char *idr_name = data;

	/* id identifies the leftover IDR entry, not the namespace */
	pr_err("l2tp: %s IDR not empty at net exit (id %d)\n", idr_name, id);
	WARN_ON_ONCE(1);
	return 1;
}
1881
5dfa598b
JC
1882static __net_exit void l2tp_exit_net(struct net *net)
1883{
1884 struct l2tp_net *pn = l2tp_pernet(net);
1e7af3b2 1885
5d066766
JC
1886 /* Our per-net IDRs should be empty. Check that is so, to
1887 * help catch cleanup races or refcnt leaks.
1888 */
1889 idr_for_each(&pn->l2tp_v2_session_idr, l2tp_idr_item_unexpected,
1890 "v2_session");
1891 idr_for_each(&pn->l2tp_v3_session_idr, l2tp_idr_item_unexpected,
1892 "v3_session");
1893 idr_for_each(&pn->l2tp_tunnel_idr, l2tp_idr_item_unexpected,
1894 "tunnel");
1895
2a3339f6 1896 idr_destroy(&pn->l2tp_v2_session_idr);
aa5e17e1 1897 idr_destroy(&pn->l2tp_v3_session_idr);
c4d48a58 1898 idr_destroy(&pn->l2tp_tunnel_idr);
167eb17e
TP
1899}
1900
fd558d18
JC
1901static struct pernet_operations l2tp_net_ops = {
1902 .init = l2tp_init_net,
167eb17e 1903 .exit = l2tp_exit_net,
5dfa598b 1904 .pre_exit = l2tp_pre_exit_net,
fd558d18
JC
1905 .id = &l2tp_net_id,
1906 .size = sizeof(struct l2tp_net),
1907};
1908
1909static int __init l2tp_init(void)
1910{
1911 int rc = 0;
1912
1913 rc = register_pernet_device(&l2tp_net_ops);
1914 if (rc)
1915 goto out;
1916
59ff3eb6 1917 l2tp_wq = alloc_workqueue("l2tp", WQ_UNBOUND, 0);
f8ccac0e
TP
1918 if (!l2tp_wq) {
1919 pr_err("alloc_workqueue failed\n");
67e04c29 1920 unregister_pernet_device(&l2tp_net_ops);
f8ccac0e
TP
1921 rc = -ENOMEM;
1922 goto out;
1923 }
1924
a4ca44fa 1925 pr_info("L2TP core driver, %s\n", L2TP_DRV_VERSION);
fd558d18
JC
1926
1927out:
1928 return rc;
1929}
1930
1931static void __exit l2tp_exit(void)
1932{
1933 unregister_pernet_device(&l2tp_net_ops);
f8ccac0e
TP
1934 if (l2tp_wq) {
1935 destroy_workqueue(l2tp_wq);
1936 l2tp_wq = NULL;
1937 }
fd558d18
JC
1938}
1939
1940module_init(l2tp_init);
1941module_exit(l2tp_exit);
1942
1943MODULE_AUTHOR("James Chapman <jchapman@katalix.com>");
1944MODULE_DESCRIPTION("L2TP core");
1945MODULE_LICENSE("GPL");
1946MODULE_VERSION(L2TP_DRV_VERSION);