Loading...
1// SPDX-License-Identifier: GPL-2.0-or-later
2/* L2TPv3 IP encapsulation support for IPv6
3 *
4 * Copyright (c) 2012 Katalix Systems Ltd
5 */
6
7#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
8
9#include <linux/icmp.h>
10#include <linux/module.h>
11#include <linux/skbuff.h>
12#include <linux/random.h>
13#include <linux/socket.h>
14#include <linux/l2tp.h>
15#include <linux/in.h>
16#include <linux/in6.h>
17#include <net/sock.h>
18#include <net/ip.h>
19#include <net/icmp.h>
20#include <net/udp.h>
21#include <net/inet_common.h>
22#include <net/tcp_states.h>
23#include <net/protocol.h>
24#include <net/xfrm.h>
25#include <net/net_namespace.h>
26#include <net/netns/generic.h>
27
28#include <net/transp_v6.h>
29#include <net/addrconf.h>
30#include <net/ip6_route.h>
31
32#include "l2tp_core.h"
33
34/* per-net private data for this module */
35static unsigned int l2tp_ip6_net_id;
36struct l2tp_ip6_net {
37 rwlock_t l2tp_ip6_lock;
38 struct hlist_head l2tp_ip6_table;
39 struct hlist_head l2tp_ip6_bind_table;
40};
41
42struct l2tp_ip6_sock {
43 /* inet_sock has to be the first member of l2tp_ip6_sock */
44 struct inet_sock inet;
45
46 u32 conn_id;
47 u32 peer_conn_id;
48
49 struct ipv6_pinfo inet6;
50};
51
/* Reinterpret a generic socket as the L2TP/IPv6 socket that contains it. */
static struct l2tp_ip6_sock *l2tp_ip6_sk(const struct sock *sk)
{
	struct l2tp_ip6_sock *lsk = (struct l2tp_ip6_sock *)sk;

	return lsk;
}
56
57static struct l2tp_ip6_net *l2tp_ip6_pernet(const struct net *net)
58{
59 return net_generic(net, l2tp_ip6_net_id);
60}
61
62static struct sock *__l2tp_ip6_bind_lookup(const struct net *net,
63 const struct in6_addr *laddr,
64 const struct in6_addr *raddr,
65 int dif, u32 tunnel_id)
66{
67 struct l2tp_ip6_net *pn = l2tp_ip6_pernet(net);
68 struct sock *sk;
69
70 sk_for_each_bound(sk, &pn->l2tp_ip6_bind_table) {
71 const struct in6_addr *sk_laddr = inet6_rcv_saddr(sk);
72 const struct in6_addr *sk_raddr = &sk->sk_v6_daddr;
73 const struct l2tp_ip6_sock *l2tp = l2tp_ip6_sk(sk);
74 int bound_dev_if;
75
76 if (!net_eq(sock_net(sk), net))
77 continue;
78
79 bound_dev_if = READ_ONCE(sk->sk_bound_dev_if);
80 if (bound_dev_if && dif && bound_dev_if != dif)
81 continue;
82
83 if (sk_laddr && !ipv6_addr_any(sk_laddr) &&
84 !ipv6_addr_any(laddr) && !ipv6_addr_equal(sk_laddr, laddr))
85 continue;
86
87 if (!ipv6_addr_any(sk_raddr) && raddr &&
88 !ipv6_addr_any(raddr) && !ipv6_addr_equal(sk_raddr, raddr))
89 continue;
90
91 if (l2tp->conn_id != tunnel_id)
92 continue;
93
94 goto found;
95 }
96
97 sk = NULL;
98found:
99 return sk;
100}
101
/* When processing receive frames, there are two cases to
 * consider. Data frames consist of a non-zero session-id and an
 * optional cookie. Control frames consist of a regular L2TP header
 * preceded by 32-bits of zeros.
 *
 * L2TPv3 Session Header Over IP
 *
 *  0                   1                   2                   3
 *  0 1 2 3 4 5 6 7 8 9 0 1 2 3 4 5 6 7 8 9 0 1 2 3 4 5 6 7 8 9 0 1
 * +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
 * |                           Session ID                          |
 * +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
 * |               Cookie (optional, maximum 64 bits)...
 * +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
 *                                                                 |
 * +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
 *
 * L2TPv3 Control Message Header Over IP
 *
 *  0                   1                   2                   3
 *  0 1 2 3 4 5 6 7 8 9 0 1 2 3 4 5 6 7 8 9 0 1 2 3 4 5 6 7 8 9 0 1
 * +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
 * |                      (32 bits of zeros)                       |
 * +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
 * |T|L|x|x|S|x|x|x|x|x|x|x|  Ver  |             Length            |
 * +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
 * |                     Control Connection ID                     |
 * +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
 * |               Ns              |               Nr              |
 * +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
 *
 * All control frames are passed to userspace.
 */
135static int l2tp_ip6_recv(struct sk_buff *skb)
136{
137 struct net *net = dev_net(skb->dev);
138 struct l2tp_ip6_net *pn;
139 struct sock *sk;
140 u32 session_id;
141 u32 tunnel_id;
142 unsigned char *ptr, *optr;
143 struct l2tp_session *session;
144 struct l2tp_tunnel *tunnel = NULL;
145 struct ipv6hdr *iph;
146
147 pn = l2tp_ip6_pernet(net);
148
149 if (!pskb_may_pull(skb, 4))
150 goto discard;
151
152 /* Point to L2TP header */
153 optr = skb->data;
154 ptr = skb->data;
155 session_id = ntohl(*((__be32 *)ptr));
156 ptr += 4;
157
158 /* RFC3931: L2TP/IP packets have the first 4 bytes containing
159 * the session_id. If it is 0, the packet is a L2TP control
160 * frame and the session_id value can be discarded.
161 */
162 if (session_id == 0) {
163 __skb_pull(skb, 4);
164 goto pass_up;
165 }
166
167 /* Ok, this is a data packet. Lookup the session. */
168 session = l2tp_v3_session_get(net, NULL, session_id);
169 if (!session)
170 goto discard;
171
172 tunnel = session->tunnel;
173 if (!tunnel)
174 goto discard_sess;
175
176 if (l2tp_v3_ensure_opt_in_linear(session, skb, &ptr, &optr))
177 goto discard_sess;
178
179 l2tp_recv_common(session, skb, ptr, optr, 0, skb->len);
180 l2tp_session_put(session);
181
182 return 0;
183
184pass_up:
185 /* Get the tunnel_id from the L2TP header */
186 if (!pskb_may_pull(skb, 12))
187 goto discard;
188
189 if ((skb->data[0] & 0xc0) != 0xc0)
190 goto discard;
191
192 tunnel_id = ntohl(*(__be32 *)&skb->data[4]);
193 iph = ipv6_hdr(skb);
194
195 read_lock_bh(&pn->l2tp_ip6_lock);
196 sk = __l2tp_ip6_bind_lookup(net, &iph->daddr, &iph->saddr,
197 inet6_iif(skb), tunnel_id);
198 if (!sk) {
199 read_unlock_bh(&pn->l2tp_ip6_lock);
200 goto discard;
201 }
202 sock_hold(sk);
203 read_unlock_bh(&pn->l2tp_ip6_lock);
204
205 if (!xfrm6_policy_check(sk, XFRM_POLICY_IN, skb))
206 goto discard_put;
207
208 nf_reset_ct(skb);
209
210 return sk_receive_skb(sk, skb, 1);
211
212discard_sess:
213 l2tp_session_put(session);
214 goto discard;
215
216discard_put:
217 sock_put(sk);
218
219discard:
220 kfree_skb(skb);
221 return 0;
222}
223
224static int l2tp_ip6_hash(struct sock *sk)
225{
226 struct l2tp_ip6_net *pn = l2tp_ip6_pernet(sock_net(sk));
227
228 if (sk_unhashed(sk)) {
229 write_lock_bh(&pn->l2tp_ip6_lock);
230 sk_add_node(sk, &pn->l2tp_ip6_table);
231 write_unlock_bh(&pn->l2tp_ip6_lock);
232 }
233 return 0;
234}
235
236static void l2tp_ip6_unhash(struct sock *sk)
237{
238 struct l2tp_ip6_net *pn = l2tp_ip6_pernet(sock_net(sk));
239
240 if (sk_unhashed(sk))
241 return;
242 write_lock_bh(&pn->l2tp_ip6_lock);
243 sk_del_node_init(sk);
244 write_unlock_bh(&pn->l2tp_ip6_lock);
245}
246
247static int l2tp_ip6_open(struct sock *sk)
248{
249 /* Prevent autobind. We don't have ports. */
250 inet_sk(sk)->inet_num = IPPROTO_L2TP;
251
252 l2tp_ip6_hash(sk);
253 return 0;
254}
255
256static void l2tp_ip6_close(struct sock *sk, long timeout)
257{
258 struct l2tp_ip6_net *pn = l2tp_ip6_pernet(sock_net(sk));
259
260 write_lock_bh(&pn->l2tp_ip6_lock);
261 hlist_del_init(&sk->sk_bind_node);
262 sk_del_node_init(sk);
263 write_unlock_bh(&pn->l2tp_ip6_lock);
264
265 sk_common_release(sk);
266}
267
/* Destroy hook: flush frames still pending on the socket, then delete
 * the tunnel associated with it, if there is one.
 */
static void l2tp_ip6_destroy_sock(struct sock *sk)
{
	struct l2tp_tunnel *tunnel;

	lock_sock(sk);
	ip6_flush_pending_frames(sk);
	release_sock(sk);

	tunnel = l2tp_sk_to_tunnel(sk);
	if (!tunnel)
		return;

	l2tp_tunnel_delete(tunnel);
	/* NOTE(review): presumably drops a reference obtained by
	 * l2tp_sk_to_tunnel() - confirm against l2tp_core.
	 */
	l2tp_tunnel_put(tunnel);
}
282
283static int l2tp_ip6_bind(struct sock *sk, struct sockaddr *uaddr, int addr_len)
284{
285 struct inet_sock *inet = inet_sk(sk);
286 struct ipv6_pinfo *np = inet6_sk(sk);
287 struct sockaddr_l2tpip6 *addr = (struct sockaddr_l2tpip6 *)uaddr;
288 struct net *net = sock_net(sk);
289 struct l2tp_ip6_net *pn;
290 __be32 v4addr = 0;
291 int bound_dev_if;
292 int addr_type;
293 int err;
294
295 pn = l2tp_ip6_pernet(net);
296
297 if (addr->l2tp_family != AF_INET6)
298 return -EINVAL;
299 if (addr_len < sizeof(*addr))
300 return -EINVAL;
301
302 addr_type = ipv6_addr_type(&addr->l2tp_addr);
303
304 /* l2tp_ip6 sockets are IPv6 only */
305 if (addr_type == IPV6_ADDR_MAPPED)
306 return -EADDRNOTAVAIL;
307
308 /* L2TP is point-point, not multicast */
309 if (addr_type & IPV6_ADDR_MULTICAST)
310 return -EADDRNOTAVAIL;
311
312 lock_sock(sk);
313
314 err = -EINVAL;
315 if (!sock_flag(sk, SOCK_ZAPPED))
316 goto out_unlock;
317
318 if (sk->sk_state != TCP_CLOSE)
319 goto out_unlock;
320
321 bound_dev_if = sk->sk_bound_dev_if;
322
323 /* Check if the address belongs to the host. */
324 rcu_read_lock();
325 if (addr_type != IPV6_ADDR_ANY) {
326 struct net_device *dev = NULL;
327
328 if (addr_type & IPV6_ADDR_LINKLOCAL) {
329 if (addr->l2tp_scope_id)
330 bound_dev_if = addr->l2tp_scope_id;
331
332 /* Binding to link-local address requires an
333 * interface.
334 */
335 if (!bound_dev_if)
336 goto out_unlock_rcu;
337
338 err = -ENODEV;
339 dev = dev_get_by_index_rcu(sock_net(sk), bound_dev_if);
340 if (!dev)
341 goto out_unlock_rcu;
342 }
343
344 /* ipv4 addr of the socket is invalid. Only the
345 * unspecified and mapped address have a v4 equivalent.
346 */
347 v4addr = LOOPBACK4_IPV6;
348 err = -EADDRNOTAVAIL;
349 if (!ipv6_chk_addr(sock_net(sk), &addr->l2tp_addr, dev, 0))
350 goto out_unlock_rcu;
351 }
352 rcu_read_unlock();
353
354 write_lock_bh(&pn->l2tp_ip6_lock);
355 if (__l2tp_ip6_bind_lookup(net, &addr->l2tp_addr, NULL, bound_dev_if,
356 addr->l2tp_conn_id)) {
357 write_unlock_bh(&pn->l2tp_ip6_lock);
358 err = -EADDRINUSE;
359 goto out_unlock;
360 }
361
362 inet->inet_saddr = v4addr;
363 inet->inet_rcv_saddr = v4addr;
364 sk->sk_bound_dev_if = bound_dev_if;
365 sk->sk_v6_rcv_saddr = addr->l2tp_addr;
366 np->saddr = addr->l2tp_addr;
367
368 l2tp_ip6_sk(sk)->conn_id = addr->l2tp_conn_id;
369
370 sk_add_bind_node(sk, &pn->l2tp_ip6_bind_table);
371 sk_del_node_init(sk);
372 write_unlock_bh(&pn->l2tp_ip6_lock);
373
374 sock_reset_flag(sk, SOCK_ZAPPED);
375 release_sock(sk);
376 return 0;
377
378out_unlock_rcu:
379 rcu_read_unlock();
380out_unlock:
381 release_sock(sk);
382
383 return err;
384}
385
386static int l2tp_ip6_connect(struct sock *sk, struct sockaddr *uaddr,
387 int addr_len)
388{
389 struct sockaddr_l2tpip6 *lsa = (struct sockaddr_l2tpip6 *)uaddr;
390 struct sockaddr_in6 *usin = (struct sockaddr_in6 *)uaddr;
391 struct in6_addr *daddr;
392 int addr_type;
393 int rc;
394 struct l2tp_ip6_net *pn;
395
396 if (addr_len < sizeof(*lsa))
397 return -EINVAL;
398
399 if (usin->sin6_family != AF_INET6)
400 return -EINVAL;
401
402 addr_type = ipv6_addr_type(&usin->sin6_addr);
403 if (addr_type & IPV6_ADDR_MULTICAST)
404 return -EINVAL;
405
406 if (addr_type & IPV6_ADDR_MAPPED) {
407 daddr = &usin->sin6_addr;
408 if (ipv4_is_multicast(daddr->s6_addr32[3]))
409 return -EINVAL;
410 }
411
412 lock_sock(sk);
413
414 /* Must bind first - autobinding does not work */
415 if (sock_flag(sk, SOCK_ZAPPED)) {
416 rc = -EINVAL;
417 goto out_sk;
418 }
419
420 rc = __ip6_datagram_connect(sk, uaddr, addr_len);
421 if (rc < 0)
422 goto out_sk;
423
424 l2tp_ip6_sk(sk)->peer_conn_id = lsa->l2tp_conn_id;
425
426 pn = l2tp_ip6_pernet(sock_net(sk));
427 write_lock_bh(&pn->l2tp_ip6_lock);
428 hlist_del_init(&sk->sk_bind_node);
429 sk_add_bind_node(sk, &pn->l2tp_ip6_bind_table);
430 write_unlock_bh(&pn->l2tp_ip6_lock);
431
432out_sk:
433 release_sock(sk);
434
435 return rc;
436}
437
438static int l2tp_ip6_disconnect(struct sock *sk, int flags)
439{
440 if (sock_flag(sk, SOCK_ZAPPED))
441 return 0;
442
443 return __udp_disconnect(sk, flags);
444}
445
446static int l2tp_ip6_getname(struct socket *sock, struct sockaddr *uaddr,
447 int peer)
448{
449 struct sockaddr_l2tpip6 *lsa = (struct sockaddr_l2tpip6 *)uaddr;
450 struct sock *sk = sock->sk;
451 struct ipv6_pinfo *np = inet6_sk(sk);
452 struct l2tp_ip6_sock *lsk = l2tp_ip6_sk(sk);
453
454 lsa->l2tp_family = AF_INET6;
455 lsa->l2tp_flowinfo = 0;
456 lsa->l2tp_scope_id = 0;
457 lsa->l2tp_unused = 0;
458 if (peer) {
459 if (!lsk->peer_conn_id)
460 return -ENOTCONN;
461 lsa->l2tp_conn_id = lsk->peer_conn_id;
462 lsa->l2tp_addr = sk->sk_v6_daddr;
463 if (inet6_test_bit(SNDFLOW, sk))
464 lsa->l2tp_flowinfo = np->flow_label;
465 } else {
466 if (ipv6_addr_any(&sk->sk_v6_rcv_saddr))
467 lsa->l2tp_addr = np->saddr;
468 else
469 lsa->l2tp_addr = sk->sk_v6_rcv_saddr;
470
471 lsa->l2tp_conn_id = lsk->conn_id;
472 }
473 if (ipv6_addr_type(&lsa->l2tp_addr) & IPV6_ADDR_LINKLOCAL)
474 lsa->l2tp_scope_id = READ_ONCE(sk->sk_bound_dev_if);
475 return sizeof(*lsa);
476}
477
478static int l2tp_ip6_backlog_recv(struct sock *sk, struct sk_buff *skb)
479{
480 int rc;
481
482 /* Charge it to the socket, dropping if the queue is full. */
483 rc = sock_queue_rcv_skb(sk, skb);
484 if (rc < 0)
485 goto drop;
486
487 return 0;
488
489drop:
490 IP_INC_STATS(sock_net(sk), IPSTATS_MIB_INDISCARDS);
491 kfree_skb(skb);
492 return -1;
493}
494
495static int l2tp_ip6_push_pending_frames(struct sock *sk)
496{
497 struct sk_buff *skb;
498 __be32 *transhdr = NULL;
499 int err = 0;
500
501 skb = skb_peek(&sk->sk_write_queue);
502 if (!skb)
503 goto out;
504
505 transhdr = (__be32 *)skb_transport_header(skb);
506 *transhdr = 0;
507
508 err = ip6_push_pending_frames(sk);
509
510out:
511 return err;
512}
513
514/* Userspace will call sendmsg() on the tunnel socket to send L2TP
515 * control frames.
516 */
517static int l2tp_ip6_sendmsg(struct sock *sk, struct msghdr *msg, size_t len)
518{
519 struct ipv6_txoptions opt_space;
520 DECLARE_SOCKADDR(struct sockaddr_l2tpip6 *, lsa, msg->msg_name);
521 struct in6_addr *daddr, *final_p, final;
522 struct ipv6_pinfo *np = inet6_sk(sk);
523 struct ipv6_txoptions *opt_to_free = NULL;
524 struct ipv6_txoptions *opt = NULL;
525 struct ip6_flowlabel *flowlabel = NULL;
526 struct dst_entry *dst = NULL;
527 struct flowi6 fl6;
528 struct ipcm6_cookie ipc6;
529 int addr_len = msg->msg_namelen;
530 int transhdrlen = 4; /* zero session-id */
531 int ulen;
532 int err;
533
534 /* Rough check on arithmetic overflow,
535 * better check is made in ip6_append_data().
536 */
537 if (len > INT_MAX - transhdrlen)
538 return -EMSGSIZE;
539
540 /* Mirror BSD error message compatibility */
541 if (msg->msg_flags & MSG_OOB)
542 return -EOPNOTSUPP;
543
544 /* Get and verify the address */
545 memset(&fl6, 0, sizeof(fl6));
546
547 fl6.flowi6_mark = READ_ONCE(sk->sk_mark);
548 fl6.flowi6_uid = sk->sk_uid;
549
550 ipcm6_init(&ipc6);
551
552 if (lsa) {
553 if (addr_len < SIN6_LEN_RFC2133)
554 return -EINVAL;
555
556 if (lsa->l2tp_family && lsa->l2tp_family != AF_INET6)
557 return -EAFNOSUPPORT;
558
559 daddr = &lsa->l2tp_addr;
560 if (inet6_test_bit(SNDFLOW, sk)) {
561 fl6.flowlabel = lsa->l2tp_flowinfo & IPV6_FLOWINFO_MASK;
562 if (fl6.flowlabel & IPV6_FLOWLABEL_MASK) {
563 flowlabel = fl6_sock_lookup(sk, fl6.flowlabel);
564 if (IS_ERR(flowlabel))
565 return -EINVAL;
566 }
567 }
568
569 /* Otherwise it will be difficult to maintain
570 * sk->sk_dst_cache.
571 */
572 if (sk->sk_state == TCP_ESTABLISHED &&
573 ipv6_addr_equal(daddr, &sk->sk_v6_daddr))
574 daddr = &sk->sk_v6_daddr;
575
576 if (addr_len >= sizeof(struct sockaddr_in6) &&
577 lsa->l2tp_scope_id &&
578 ipv6_addr_type(daddr) & IPV6_ADDR_LINKLOCAL)
579 fl6.flowi6_oif = lsa->l2tp_scope_id;
580 } else {
581 if (sk->sk_state != TCP_ESTABLISHED)
582 return -EDESTADDRREQ;
583
584 daddr = &sk->sk_v6_daddr;
585 fl6.flowlabel = np->flow_label;
586 }
587
588 if (fl6.flowi6_oif == 0)
589 fl6.flowi6_oif = READ_ONCE(sk->sk_bound_dev_if);
590
591 if (msg->msg_controllen) {
592 opt = &opt_space;
593 memset(opt, 0, sizeof(struct ipv6_txoptions));
594 opt->tot_len = sizeof(struct ipv6_txoptions);
595 ipc6.opt = opt;
596
597 err = ip6_datagram_send_ctl(sock_net(sk), sk, msg, &fl6, &ipc6);
598 if (err < 0) {
599 fl6_sock_release(flowlabel);
600 return err;
601 }
602 if ((fl6.flowlabel & IPV6_FLOWLABEL_MASK) && !flowlabel) {
603 flowlabel = fl6_sock_lookup(sk, fl6.flowlabel);
604 if (IS_ERR(flowlabel))
605 return -EINVAL;
606 }
607 if (!(opt->opt_nflen | opt->opt_flen))
608 opt = NULL;
609 }
610
611 if (!opt) {
612 opt = txopt_get(np);
613 opt_to_free = opt;
614 }
615 if (flowlabel)
616 opt = fl6_merge_options(&opt_space, flowlabel, opt);
617 opt = ipv6_fixup_options(&opt_space, opt);
618 ipc6.opt = opt;
619
620 fl6.flowi6_proto = sk->sk_protocol;
621 if (!ipv6_addr_any(daddr))
622 fl6.daddr = *daddr;
623 else
624 fl6.daddr.s6_addr[15] = 0x1; /* :: means loopback (BSD'ism) */
625 if (ipv6_addr_any(&fl6.saddr) && !ipv6_addr_any(&np->saddr))
626 fl6.saddr = np->saddr;
627
628 final_p = fl6_update_dst(&fl6, opt, &final);
629
630 if (!fl6.flowi6_oif && ipv6_addr_is_multicast(&fl6.daddr))
631 fl6.flowi6_oif = READ_ONCE(np->mcast_oif);
632 else if (!fl6.flowi6_oif)
633 fl6.flowi6_oif = READ_ONCE(np->ucast_oif);
634
635 security_sk_classify_flow(sk, flowi6_to_flowi_common(&fl6));
636
637 if (ipc6.tclass < 0)
638 ipc6.tclass = np->tclass;
639
640 fl6.flowlabel = ip6_make_flowinfo(ipc6.tclass, fl6.flowlabel);
641
642 dst = ip6_dst_lookup_flow(sock_net(sk), sk, &fl6, final_p);
643 if (IS_ERR(dst)) {
644 err = PTR_ERR(dst);
645 goto out;
646 }
647
648 if (ipc6.hlimit < 0)
649 ipc6.hlimit = ip6_sk_dst_hoplimit(np, &fl6, dst);
650
651 if (ipc6.dontfrag < 0)
652 ipc6.dontfrag = inet6_test_bit(DONTFRAG, sk);
653
654 if (msg->msg_flags & MSG_CONFIRM)
655 goto do_confirm;
656
657back_from_confirm:
658 lock_sock(sk);
659 ulen = len + (skb_queue_empty(&sk->sk_write_queue) ? transhdrlen : 0);
660 err = ip6_append_data(sk, ip_generic_getfrag, msg,
661 ulen, transhdrlen, &ipc6,
662 &fl6, dst_rt6_info(dst),
663 msg->msg_flags);
664 if (err)
665 ip6_flush_pending_frames(sk);
666 else if (!(msg->msg_flags & MSG_MORE))
667 err = l2tp_ip6_push_pending_frames(sk);
668 release_sock(sk);
669done:
670 dst_release(dst);
671out:
672 fl6_sock_release(flowlabel);
673 txopt_put(opt_to_free);
674
675 return err < 0 ? err : len;
676
677do_confirm:
678 if (msg->msg_flags & MSG_PROBE)
679 dst_confirm_neigh(dst, &fl6.daddr);
680 if (!(msg->msg_flags & MSG_PROBE) || len)
681 goto back_from_confirm;
682 err = 0;
683 goto done;
684}
685
686static int l2tp_ip6_recvmsg(struct sock *sk, struct msghdr *msg, size_t len,
687 int flags, int *addr_len)
688{
689 struct ipv6_pinfo *np = inet6_sk(sk);
690 DECLARE_SOCKADDR(struct sockaddr_l2tpip6 *, lsa, msg->msg_name);
691 size_t copied = 0;
692 int err = -EOPNOTSUPP;
693 struct sk_buff *skb;
694
695 if (flags & MSG_OOB)
696 goto out;
697
698 if (flags & MSG_ERRQUEUE)
699 return ipv6_recv_error(sk, msg, len, addr_len);
700
701 skb = skb_recv_datagram(sk, flags, &err);
702 if (!skb)
703 goto out;
704
705 copied = skb->len;
706 if (len < copied) {
707 msg->msg_flags |= MSG_TRUNC;
708 copied = len;
709 }
710
711 err = skb_copy_datagram_msg(skb, 0, msg, copied);
712 if (err)
713 goto done;
714
715 sock_recv_timestamp(msg, sk, skb);
716
717 /* Copy the address. */
718 if (lsa) {
719 lsa->l2tp_family = AF_INET6;
720 lsa->l2tp_unused = 0;
721 lsa->l2tp_addr = ipv6_hdr(skb)->saddr;
722 lsa->l2tp_flowinfo = 0;
723 lsa->l2tp_scope_id = 0;
724 lsa->l2tp_conn_id = 0;
725 if (ipv6_addr_type(&lsa->l2tp_addr) & IPV6_ADDR_LINKLOCAL)
726 lsa->l2tp_scope_id = inet6_iif(skb);
727 *addr_len = sizeof(*lsa);
728 }
729
730 if (np->rxopt.all)
731 ip6_datagram_recv_ctl(sk, msg, skb);
732
733 if (flags & MSG_TRUNC)
734 copied = skb->len;
735done:
736 skb_free_datagram(sk, skb);
737out:
738 return err ? err : copied;
739}
740
741static struct proto l2tp_ip6_prot = {
742 .name = "L2TP/IPv6",
743 .owner = THIS_MODULE,
744 .init = l2tp_ip6_open,
745 .close = l2tp_ip6_close,
746 .bind = l2tp_ip6_bind,
747 .connect = l2tp_ip6_connect,
748 .disconnect = l2tp_ip6_disconnect,
749 .ioctl = l2tp_ioctl,
750 .destroy = l2tp_ip6_destroy_sock,
751 .setsockopt = ipv6_setsockopt,
752 .getsockopt = ipv6_getsockopt,
753 .sendmsg = l2tp_ip6_sendmsg,
754 .recvmsg = l2tp_ip6_recvmsg,
755 .backlog_rcv = l2tp_ip6_backlog_recv,
756 .hash = l2tp_ip6_hash,
757 .unhash = l2tp_ip6_unhash,
758 .obj_size = sizeof(struct l2tp_ip6_sock),
759 .ipv6_pinfo_offset = offsetof(struct l2tp_ip6_sock, inet6),
760};
761
762static const struct proto_ops l2tp_ip6_ops = {
763 .family = PF_INET6,
764 .owner = THIS_MODULE,
765 .release = inet6_release,
766 .bind = inet6_bind,
767 .connect = inet_dgram_connect,
768 .socketpair = sock_no_socketpair,
769 .accept = sock_no_accept,
770 .getname = l2tp_ip6_getname,
771 .poll = datagram_poll,
772 .ioctl = inet6_ioctl,
773 .gettstamp = sock_gettstamp,
774 .listen = sock_no_listen,
775 .shutdown = inet_shutdown,
776 .setsockopt = sock_common_setsockopt,
777 .getsockopt = sock_common_getsockopt,
778 .sendmsg = inet_sendmsg,
779 .recvmsg = sock_common_recvmsg,
780 .mmap = sock_no_mmap,
781#ifdef CONFIG_COMPAT
782 .compat_ioctl = inet6_compat_ioctl,
783#endif
784};
785
786static struct inet_protosw l2tp_ip6_protosw = {
787 .type = SOCK_DGRAM,
788 .protocol = IPPROTO_L2TP,
789 .prot = &l2tp_ip6_prot,
790 .ops = &l2tp_ip6_ops,
791};
792
793static struct inet6_protocol l2tp_ip6_protocol __read_mostly = {
794 .handler = l2tp_ip6_recv,
795};
796
797static __net_init int l2tp_ip6_init_net(struct net *net)
798{
799 struct l2tp_ip6_net *pn = net_generic(net, l2tp_ip6_net_id);
800
801 rwlock_init(&pn->l2tp_ip6_lock);
802 INIT_HLIST_HEAD(&pn->l2tp_ip6_table);
803 INIT_HLIST_HEAD(&pn->l2tp_ip6_bind_table);
804 return 0;
805}
806
807static __net_exit void l2tp_ip6_exit_net(struct net *net)
808{
809 struct l2tp_ip6_net *pn = l2tp_ip6_pernet(net);
810
811 write_lock_bh(&pn->l2tp_ip6_lock);
812 WARN_ON_ONCE(hlist_count_nodes(&pn->l2tp_ip6_table) != 0);
813 WARN_ON_ONCE(hlist_count_nodes(&pn->l2tp_ip6_bind_table) != 0);
814 write_unlock_bh(&pn->l2tp_ip6_lock);
815}
816
817static struct pernet_operations l2tp_ip6_net_ops = {
818 .init = l2tp_ip6_init_net,
819 .exit = l2tp_ip6_exit_net,
820 .id = &l2tp_ip6_net_id,
821 .size = sizeof(struct l2tp_ip6_net),
822};
823
824static int __init l2tp_ip6_init(void)
825{
826 int err;
827
828 pr_info("L2TP IP encapsulation support for IPv6 (L2TPv3)\n");
829
830 err = register_pernet_device(&l2tp_ip6_net_ops);
831 if (err)
832 goto out;
833
834 err = proto_register(&l2tp_ip6_prot, 1);
835 if (err != 0)
836 goto out1;
837
838 err = inet6_add_protocol(&l2tp_ip6_protocol, IPPROTO_L2TP);
839 if (err)
840 goto out2;
841
842 inet6_register_protosw(&l2tp_ip6_protosw);
843 return 0;
844
845out2:
846 proto_unregister(&l2tp_ip6_prot);
847out1:
848 unregister_pernet_device(&l2tp_ip6_net_ops);
849out:
850 return err;
851}
852
853static void __exit l2tp_ip6_exit(void)
854{
855 inet6_unregister_protosw(&l2tp_ip6_protosw);
856 inet6_del_protocol(&l2tp_ip6_protocol, IPPROTO_L2TP);
857 proto_unregister(&l2tp_ip6_prot);
858 unregister_pernet_device(&l2tp_ip6_net_ops);
859}
860
861module_init(l2tp_ip6_init);
862module_exit(l2tp_ip6_exit);
863
864MODULE_LICENSE("GPL");
865MODULE_AUTHOR("Chris Elston <celston@katalix.com>");
866MODULE_DESCRIPTION("L2TP IP encapsulation for IPv6");
867MODULE_VERSION("1.0");
868
869/* Use the values of SOCK_DGRAM (2) as type and IPPROTO_L2TP (115) as protocol,
870 * because __stringify doesn't like enums
871 */
872MODULE_ALIAS_NET_PF_PROTO_TYPE(PF_INET6, 115, 2);
873MODULE_ALIAS_NET_PF_PROTO(PF_INET6, 115);
1/*
2 * L2TPv3 IP encapsulation support for IPv6
3 *
4 * Copyright (c) 2012 Katalix Systems Ltd
5 *
6 * This program is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU General Public License
8 * as published by the Free Software Foundation; either version
9 * 2 of the License, or (at your option) any later version.
10 */
11
12#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
13
14#include <linux/icmp.h>
15#include <linux/module.h>
16#include <linux/skbuff.h>
17#include <linux/random.h>
18#include <linux/socket.h>
19#include <linux/l2tp.h>
20#include <linux/in.h>
21#include <linux/in6.h>
22#include <net/sock.h>
23#include <net/ip.h>
24#include <net/icmp.h>
25#include <net/udp.h>
26#include <net/inet_common.h>
27#include <net/inet_hashtables.h>
28#include <net/tcp_states.h>
29#include <net/protocol.h>
30#include <net/xfrm.h>
31
32#include <net/transp_v6.h>
33#include <net/addrconf.h>
34#include <net/ip6_route.h>
35
36#include "l2tp_core.h"
37
38struct l2tp_ip6_sock {
39 /* inet_sock has to be the first member of l2tp_ip6_sock */
40 struct inet_sock inet;
41
42 u32 conn_id;
43 u32 peer_conn_id;
44
45 /* ipv6_pinfo has to be the last member of l2tp_ip6_sock, see
46 inet6_sk_generic */
47 struct ipv6_pinfo inet6;
48};
49
50static DEFINE_RWLOCK(l2tp_ip6_lock);
51static struct hlist_head l2tp_ip6_table;
52static struct hlist_head l2tp_ip6_bind_table;
53
/* Reinterpret a generic socket as the L2TP/IPv6 socket that contains it. */
static inline struct l2tp_ip6_sock *l2tp_ip6_sk(const struct sock *sk)
{
	struct l2tp_ip6_sock *lsk = (struct l2tp_ip6_sock *)sk;

	return lsk;
}
58
59static struct sock *__l2tp_ip6_bind_lookup(struct net *net,
60 struct in6_addr *laddr,
61 int dif, u32 tunnel_id)
62{
63 struct hlist_node *node;
64 struct sock *sk;
65
66 sk_for_each_bound(sk, node, &l2tp_ip6_bind_table) {
67 struct in6_addr *addr = inet6_rcv_saddr(sk);
68 struct l2tp_ip6_sock *l2tp = l2tp_ip6_sk(sk);
69
70 if (l2tp == NULL)
71 continue;
72
73 if ((l2tp->conn_id == tunnel_id) &&
74 net_eq(sock_net(sk), net) &&
75 !(addr && ipv6_addr_equal(addr, laddr)) &&
76 !(sk->sk_bound_dev_if && sk->sk_bound_dev_if != dif))
77 goto found;
78 }
79
80 sk = NULL;
81found:
82 return sk;
83}
84
85static inline struct sock *l2tp_ip6_bind_lookup(struct net *net,
86 struct in6_addr *laddr,
87 int dif, u32 tunnel_id)
88{
89 struct sock *sk = __l2tp_ip6_bind_lookup(net, laddr, dif, tunnel_id);
90 if (sk)
91 sock_hold(sk);
92
93 return sk;
94}
95
/* When processing receive frames, there are two cases to
 * consider. Data frames consist of a non-zero session-id and an
 * optional cookie. Control frames consist of a regular L2TP header
 * preceded by 32-bits of zeros.
 *
 * L2TPv3 Session Header Over IP
 *
 *  0                   1                   2                   3
 *  0 1 2 3 4 5 6 7 8 9 0 1 2 3 4 5 6 7 8 9 0 1 2 3 4 5 6 7 8 9 0 1
 * +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
 * |                           Session ID                          |
 * +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
 * |               Cookie (optional, maximum 64 bits)...
 * +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
 *                                                                 |
 * +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
 *
 * L2TPv3 Control Message Header Over IP
 *
 *  0                   1                   2                   3
 *  0 1 2 3 4 5 6 7 8 9 0 1 2 3 4 5 6 7 8 9 0 1 2 3 4 5 6 7 8 9 0 1
 * +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
 * |                      (32 bits of zeros)                       |
 * +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
 * |T|L|x|x|S|x|x|x|x|x|x|x|  Ver  |             Length            |
 * +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
 * |                     Control Connection ID                     |
 * +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
 * |               Ns              |               Nr              |
 * +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
 *
 * All control frames are passed to userspace.
 */
129static int l2tp_ip6_recv(struct sk_buff *skb)
130{
131 struct sock *sk;
132 u32 session_id;
133 u32 tunnel_id;
134 unsigned char *ptr, *optr;
135 struct l2tp_session *session;
136 struct l2tp_tunnel *tunnel = NULL;
137 int length;
138
139 /* Point to L2TP header */
140 optr = ptr = skb->data;
141
142 if (!pskb_may_pull(skb, 4))
143 goto discard;
144
145 session_id = ntohl(*((__be32 *) ptr));
146 ptr += 4;
147
148 /* RFC3931: L2TP/IP packets have the first 4 bytes containing
149 * the session_id. If it is 0, the packet is a L2TP control
150 * frame and the session_id value can be discarded.
151 */
152 if (session_id == 0) {
153 __skb_pull(skb, 4);
154 goto pass_up;
155 }
156
157 /* Ok, this is a data packet. Lookup the session. */
158 session = l2tp_session_find(&init_net, NULL, session_id);
159 if (session == NULL)
160 goto discard;
161
162 tunnel = session->tunnel;
163 if (tunnel == NULL)
164 goto discard;
165
166 /* Trace packet contents, if enabled */
167 if (tunnel->debug & L2TP_MSG_DATA) {
168 length = min(32u, skb->len);
169 if (!pskb_may_pull(skb, length))
170 goto discard;
171
172 pr_debug("%s: ip recv\n", tunnel->name);
173 print_hex_dump_bytes("", DUMP_PREFIX_OFFSET, ptr, length);
174 }
175
176 l2tp_recv_common(session, skb, ptr, optr, 0, skb->len,
177 tunnel->recv_payload_hook);
178 return 0;
179
180pass_up:
181 /* Get the tunnel_id from the L2TP header */
182 if (!pskb_may_pull(skb, 12))
183 goto discard;
184
185 if ((skb->data[0] & 0xc0) != 0xc0)
186 goto discard;
187
188 tunnel_id = ntohl(*(__be32 *) &skb->data[4]);
189 tunnel = l2tp_tunnel_find(&init_net, tunnel_id);
190 if (tunnel != NULL)
191 sk = tunnel->sock;
192 else {
193 struct ipv6hdr *iph = ipv6_hdr(skb);
194
195 read_lock_bh(&l2tp_ip6_lock);
196 sk = __l2tp_ip6_bind_lookup(&init_net, &iph->daddr,
197 0, tunnel_id);
198 read_unlock_bh(&l2tp_ip6_lock);
199 }
200
201 if (sk == NULL)
202 goto discard;
203
204 sock_hold(sk);
205
206 if (!xfrm6_policy_check(sk, XFRM_POLICY_IN, skb))
207 goto discard_put;
208
209 nf_reset(skb);
210
211 return sk_receive_skb(sk, skb, 1);
212
213discard_put:
214 sock_put(sk);
215
216discard:
217 kfree_skb(skb);
218 return 0;
219}
220
221static int l2tp_ip6_open(struct sock *sk)
222{
223 /* Prevent autobind. We don't have ports. */
224 inet_sk(sk)->inet_num = IPPROTO_L2TP;
225
226 write_lock_bh(&l2tp_ip6_lock);
227 sk_add_node(sk, &l2tp_ip6_table);
228 write_unlock_bh(&l2tp_ip6_lock);
229
230 return 0;
231}
232
233static void l2tp_ip6_close(struct sock *sk, long timeout)
234{
235 write_lock_bh(&l2tp_ip6_lock);
236 hlist_del_init(&sk->sk_bind_node);
237 sk_del_node_init(sk);
238 write_unlock_bh(&l2tp_ip6_lock);
239
240 sk_common_release(sk);
241}
242
/* Destroy hook: flush frames still pending on the socket under the
 * socket lock, then run the generic IPv6 socket teardown.
 */
static void l2tp_ip6_destroy_sock(struct sock *sk)
{
	lock_sock(sk);
	ip6_flush_pending_frames(sk);
	release_sock(sk);

	inet6_destroy_sock(sk);
}
251
252static int l2tp_ip6_bind(struct sock *sk, struct sockaddr *uaddr, int addr_len)
253{
254 struct inet_sock *inet = inet_sk(sk);
255 struct ipv6_pinfo *np = inet6_sk(sk);
256 struct sockaddr_l2tpip6 *addr = (struct sockaddr_l2tpip6 *) uaddr;
257 __be32 v4addr = 0;
258 int addr_type;
259 int err;
260
261 if (!sock_flag(sk, SOCK_ZAPPED))
262 return -EINVAL;
263 if (addr->l2tp_family != AF_INET6)
264 return -EINVAL;
265 if (addr_len < sizeof(*addr))
266 return -EINVAL;
267
268 addr_type = ipv6_addr_type(&addr->l2tp_addr);
269
270 /* l2tp_ip6 sockets are IPv6 only */
271 if (addr_type == IPV6_ADDR_MAPPED)
272 return -EADDRNOTAVAIL;
273
274 /* L2TP is point-point, not multicast */
275 if (addr_type & IPV6_ADDR_MULTICAST)
276 return -EADDRNOTAVAIL;
277
278 err = -EADDRINUSE;
279 read_lock_bh(&l2tp_ip6_lock);
280 if (__l2tp_ip6_bind_lookup(&init_net, &addr->l2tp_addr,
281 sk->sk_bound_dev_if, addr->l2tp_conn_id))
282 goto out_in_use;
283 read_unlock_bh(&l2tp_ip6_lock);
284
285 lock_sock(sk);
286
287 err = -EINVAL;
288 if (sk->sk_state != TCP_CLOSE)
289 goto out_unlock;
290
291 /* Check if the address belongs to the host. */
292 rcu_read_lock();
293 if (addr_type != IPV6_ADDR_ANY) {
294 struct net_device *dev = NULL;
295
296 if (addr_type & IPV6_ADDR_LINKLOCAL) {
297 if (addr_len >= sizeof(struct sockaddr_in6) &&
298 addr->l2tp_scope_id) {
299 /* Override any existing binding, if another
300 * one is supplied by user.
301 */
302 sk->sk_bound_dev_if = addr->l2tp_scope_id;
303 }
304
305 /* Binding to link-local address requires an
306 interface */
307 if (!sk->sk_bound_dev_if)
308 goto out_unlock_rcu;
309
310 err = -ENODEV;
311 dev = dev_get_by_index_rcu(sock_net(sk),
312 sk->sk_bound_dev_if);
313 if (!dev)
314 goto out_unlock_rcu;
315 }
316
317 /* ipv4 addr of the socket is invalid. Only the
318 * unspecified and mapped address have a v4 equivalent.
319 */
320 v4addr = LOOPBACK4_IPV6;
321 err = -EADDRNOTAVAIL;
322 if (!ipv6_chk_addr(sock_net(sk), &addr->l2tp_addr, dev, 0))
323 goto out_unlock_rcu;
324 }
325 rcu_read_unlock();
326
327 inet->inet_rcv_saddr = inet->inet_saddr = v4addr;
328 np->rcv_saddr = addr->l2tp_addr;
329 np->saddr = addr->l2tp_addr;
330
331 l2tp_ip6_sk(sk)->conn_id = addr->l2tp_conn_id;
332
333 write_lock_bh(&l2tp_ip6_lock);
334 sk_add_bind_node(sk, &l2tp_ip6_bind_table);
335 sk_del_node_init(sk);
336 write_unlock_bh(&l2tp_ip6_lock);
337
338 sock_reset_flag(sk, SOCK_ZAPPED);
339 release_sock(sk);
340 return 0;
341
342out_unlock_rcu:
343 rcu_read_unlock();
344out_unlock:
345 release_sock(sk);
346 return err;
347
348out_in_use:
349 read_unlock_bh(&l2tp_ip6_lock);
350 return err;
351}
352
353static int l2tp_ip6_connect(struct sock *sk, struct sockaddr *uaddr,
354 int addr_len)
355{
356 struct sockaddr_l2tpip6 *lsa = (struct sockaddr_l2tpip6 *) uaddr;
357 struct sockaddr_in6 *usin = (struct sockaddr_in6 *) uaddr;
358 struct in6_addr *daddr;
359 int addr_type;
360 int rc;
361
362 if (sock_flag(sk, SOCK_ZAPPED)) /* Must bind first - autobinding does not work */
363 return -EINVAL;
364
365 if (addr_len < sizeof(*lsa))
366 return -EINVAL;
367
368 addr_type = ipv6_addr_type(&usin->sin6_addr);
369 if (addr_type & IPV6_ADDR_MULTICAST)
370 return -EINVAL;
371
372 if (addr_type & IPV6_ADDR_MAPPED) {
373 daddr = &usin->sin6_addr;
374 if (ipv4_is_multicast(daddr->s6_addr32[3]))
375 return -EINVAL;
376 }
377
378 rc = ip6_datagram_connect(sk, uaddr, addr_len);
379
380 lock_sock(sk);
381
382 l2tp_ip6_sk(sk)->peer_conn_id = lsa->l2tp_conn_id;
383
384 write_lock_bh(&l2tp_ip6_lock);
385 hlist_del_init(&sk->sk_bind_node);
386 sk_add_bind_node(sk, &l2tp_ip6_bind_table);
387 write_unlock_bh(&l2tp_ip6_lock);
388
389 release_sock(sk);
390
391 return rc;
392}
393
394static int l2tp_ip6_disconnect(struct sock *sk, int flags)
395{
396 if (sock_flag(sk, SOCK_ZAPPED))
397 return 0;
398
399 return udp_disconnect(sk, flags);
400}
401
402static int l2tp_ip6_getname(struct socket *sock, struct sockaddr *uaddr,
403 int *uaddr_len, int peer)
404{
405 struct sockaddr_l2tpip6 *lsa = (struct sockaddr_l2tpip6 *)uaddr;
406 struct sock *sk = sock->sk;
407 struct ipv6_pinfo *np = inet6_sk(sk);
408 struct l2tp_ip6_sock *lsk = l2tp_ip6_sk(sk);
409
410 lsa->l2tp_family = AF_INET6;
411 lsa->l2tp_flowinfo = 0;
412 lsa->l2tp_scope_id = 0;
413 lsa->l2tp_unused = 0;
414 if (peer) {
415 if (!lsk->peer_conn_id)
416 return -ENOTCONN;
417 lsa->l2tp_conn_id = lsk->peer_conn_id;
418 lsa->l2tp_addr = np->daddr;
419 if (np->sndflow)
420 lsa->l2tp_flowinfo = np->flow_label;
421 } else {
422 if (ipv6_addr_any(&np->rcv_saddr))
423 lsa->l2tp_addr = np->saddr;
424 else
425 lsa->l2tp_addr = np->rcv_saddr;
426
427 lsa->l2tp_conn_id = lsk->conn_id;
428 }
429 if (ipv6_addr_type(&lsa->l2tp_addr) & IPV6_ADDR_LINKLOCAL)
430 lsa->l2tp_scope_id = sk->sk_bound_dev_if;
431 *uaddr_len = sizeof(*lsa);
432 return 0;
433}
434
435static int l2tp_ip6_backlog_recv(struct sock *sk, struct sk_buff *skb)
436{
437 int rc;
438
439 /* Charge it to the socket, dropping if the queue is full. */
440 rc = sock_queue_rcv_skb(sk, skb);
441 if (rc < 0)
442 goto drop;
443
444 return 0;
445
446drop:
447 IP_INC_STATS(&init_net, IPSTATS_MIB_INDISCARDS);
448 kfree_skb(skb);
449 return -1;
450}
451
452static int l2tp_ip6_push_pending_frames(struct sock *sk)
453{
454 struct sk_buff *skb;
455 __be32 *transhdr = NULL;
456 int err = 0;
457
458 skb = skb_peek(&sk->sk_write_queue);
459 if (skb == NULL)
460 goto out;
461
462 transhdr = (__be32 *)skb_transport_header(skb);
463 *transhdr = 0;
464
465 err = ip6_push_pending_frames(sk);
466
467out:
468 return err;
469}
470
471/* Userspace will call sendmsg() on the tunnel socket to send L2TP
472 * control frames.
473 */
474static int l2tp_ip6_sendmsg(struct kiocb *iocb, struct sock *sk,
475 struct msghdr *msg, size_t len)
476{
477 struct ipv6_txoptions opt_space;
478 struct sockaddr_l2tpip6 *lsa =
479 (struct sockaddr_l2tpip6 *) msg->msg_name;
480 struct in6_addr *daddr, *final_p, final;
481 struct ipv6_pinfo *np = inet6_sk(sk);
482 struct ipv6_txoptions *opt = NULL;
483 struct ip6_flowlabel *flowlabel = NULL;
484 struct dst_entry *dst = NULL;
485 struct flowi6 fl6;
486 int addr_len = msg->msg_namelen;
487 int hlimit = -1;
488 int tclass = -1;
489 int dontfrag = -1;
490 int transhdrlen = 4; /* zero session-id */
491 int ulen = len + transhdrlen;
492 int err;
493
494 /* Rough check on arithmetic overflow,
495 better check is made in ip6_append_data().
496 */
497 if (len > INT_MAX)
498 return -EMSGSIZE;
499
500 /* Mirror BSD error message compatibility */
501 if (msg->msg_flags & MSG_OOB)
502 return -EOPNOTSUPP;
503
504 /*
505 * Get and verify the address.
506 */
507 memset(&fl6, 0, sizeof(fl6));
508
509 fl6.flowi6_mark = sk->sk_mark;
510
511 if (lsa) {
512 if (addr_len < SIN6_LEN_RFC2133)
513 return -EINVAL;
514
515 if (lsa->l2tp_family && lsa->l2tp_family != AF_INET6)
516 return -EAFNOSUPPORT;
517
518 daddr = &lsa->l2tp_addr;
519 if (np->sndflow) {
520 fl6.flowlabel = lsa->l2tp_flowinfo & IPV6_FLOWINFO_MASK;
521 if (fl6.flowlabel&IPV6_FLOWLABEL_MASK) {
522 flowlabel = fl6_sock_lookup(sk, fl6.flowlabel);
523 if (flowlabel == NULL)
524 return -EINVAL;
525 daddr = &flowlabel->dst;
526 }
527 }
528
529 /*
530 * Otherwise it will be difficult to maintain
531 * sk->sk_dst_cache.
532 */
533 if (sk->sk_state == TCP_ESTABLISHED &&
534 ipv6_addr_equal(daddr, &np->daddr))
535 daddr = &np->daddr;
536
537 if (addr_len >= sizeof(struct sockaddr_in6) &&
538 lsa->l2tp_scope_id &&
539 ipv6_addr_type(daddr) & IPV6_ADDR_LINKLOCAL)
540 fl6.flowi6_oif = lsa->l2tp_scope_id;
541 } else {
542 if (sk->sk_state != TCP_ESTABLISHED)
543 return -EDESTADDRREQ;
544
545 daddr = &np->daddr;
546 fl6.flowlabel = np->flow_label;
547 }
548
549 if (fl6.flowi6_oif == 0)
550 fl6.flowi6_oif = sk->sk_bound_dev_if;
551
552 if (msg->msg_controllen) {
553 opt = &opt_space;
554 memset(opt, 0, sizeof(struct ipv6_txoptions));
555 opt->tot_len = sizeof(struct ipv6_txoptions);
556
557 err = datagram_send_ctl(sock_net(sk), sk, msg, &fl6, opt,
558 &hlimit, &tclass, &dontfrag);
559 if (err < 0) {
560 fl6_sock_release(flowlabel);
561 return err;
562 }
563 if ((fl6.flowlabel & IPV6_FLOWLABEL_MASK) && !flowlabel) {
564 flowlabel = fl6_sock_lookup(sk, fl6.flowlabel);
565 if (flowlabel == NULL)
566 return -EINVAL;
567 }
568 if (!(opt->opt_nflen|opt->opt_flen))
569 opt = NULL;
570 }
571
572 if (opt == NULL)
573 opt = np->opt;
574 if (flowlabel)
575 opt = fl6_merge_options(&opt_space, flowlabel, opt);
576 opt = ipv6_fixup_options(&opt_space, opt);
577
578 fl6.flowi6_proto = sk->sk_protocol;
579 if (!ipv6_addr_any(daddr))
580 fl6.daddr = *daddr;
581 else
582 fl6.daddr.s6_addr[15] = 0x1; /* :: means loopback (BSD'ism) */
583 if (ipv6_addr_any(&fl6.saddr) && !ipv6_addr_any(&np->saddr))
584 fl6.saddr = np->saddr;
585
586 final_p = fl6_update_dst(&fl6, opt, &final);
587
588 if (!fl6.flowi6_oif && ipv6_addr_is_multicast(&fl6.daddr))
589 fl6.flowi6_oif = np->mcast_oif;
590 else if (!fl6.flowi6_oif)
591 fl6.flowi6_oif = np->ucast_oif;
592
593 security_sk_classify_flow(sk, flowi6_to_flowi(&fl6));
594
595 dst = ip6_dst_lookup_flow(sk, &fl6, final_p, true);
596 if (IS_ERR(dst)) {
597 err = PTR_ERR(dst);
598 goto out;
599 }
600
601 if (hlimit < 0) {
602 if (ipv6_addr_is_multicast(&fl6.daddr))
603 hlimit = np->mcast_hops;
604 else
605 hlimit = np->hop_limit;
606 if (hlimit < 0)
607 hlimit = ip6_dst_hoplimit(dst);
608 }
609
610 if (tclass < 0)
611 tclass = np->tclass;
612
613 if (dontfrag < 0)
614 dontfrag = np->dontfrag;
615
616 if (msg->msg_flags & MSG_CONFIRM)
617 goto do_confirm;
618
619back_from_confirm:
620 lock_sock(sk);
621 err = ip6_append_data(sk, ip_generic_getfrag, msg->msg_iov,
622 ulen, transhdrlen, hlimit, tclass, opt,
623 &fl6, (struct rt6_info *)dst,
624 msg->msg_flags, dontfrag);
625 if (err)
626 ip6_flush_pending_frames(sk);
627 else if (!(msg->msg_flags & MSG_MORE))
628 err = l2tp_ip6_push_pending_frames(sk);
629 release_sock(sk);
630done:
631 dst_release(dst);
632out:
633 fl6_sock_release(flowlabel);
634
635 return err < 0 ? err : len;
636
637do_confirm:
638 dst_confirm(dst);
639 if (!(msg->msg_flags & MSG_PROBE) || len)
640 goto back_from_confirm;
641 err = 0;
642 goto done;
643}
644
645static int l2tp_ip6_recvmsg(struct kiocb *iocb, struct sock *sk,
646 struct msghdr *msg, size_t len, int noblock,
647 int flags, int *addr_len)
648{
649 struct inet_sock *inet = inet_sk(sk);
650 struct sockaddr_l2tpip6 *lsa = (struct sockaddr_l2tpip6 *)msg->msg_name;
651 size_t copied = 0;
652 int err = -EOPNOTSUPP;
653 struct sk_buff *skb;
654
655 if (flags & MSG_OOB)
656 goto out;
657
658 if (addr_len)
659 *addr_len = sizeof(*lsa);
660
661 if (flags & MSG_ERRQUEUE)
662 return ipv6_recv_error(sk, msg, len);
663
664 skb = skb_recv_datagram(sk, flags, noblock, &err);
665 if (!skb)
666 goto out;
667
668 copied = skb->len;
669 if (len < copied) {
670 msg->msg_flags |= MSG_TRUNC;
671 copied = len;
672 }
673
674 err = skb_copy_datagram_iovec(skb, 0, msg->msg_iov, copied);
675 if (err)
676 goto done;
677
678 sock_recv_timestamp(msg, sk, skb);
679
680 /* Copy the address. */
681 if (lsa) {
682 lsa->l2tp_family = AF_INET6;
683 lsa->l2tp_unused = 0;
684 lsa->l2tp_addr = ipv6_hdr(skb)->saddr;
685 lsa->l2tp_flowinfo = 0;
686 lsa->l2tp_scope_id = 0;
687 if (ipv6_addr_type(&lsa->l2tp_addr) & IPV6_ADDR_LINKLOCAL)
688 lsa->l2tp_scope_id = IP6CB(skb)->iif;
689 }
690
691 if (inet->cmsg_flags)
692 ip_cmsg_recv(msg, skb);
693
694 if (flags & MSG_TRUNC)
695 copied = skb->len;
696done:
697 skb_free_datagram(sk, skb);
698out:
699 return err ? err : copied;
700}
701
702static struct proto l2tp_ip6_prot = {
703 .name = "L2TP/IPv6",
704 .owner = THIS_MODULE,
705 .init = l2tp_ip6_open,
706 .close = l2tp_ip6_close,
707 .bind = l2tp_ip6_bind,
708 .connect = l2tp_ip6_connect,
709 .disconnect = l2tp_ip6_disconnect,
710 .ioctl = udp_ioctl,
711 .destroy = l2tp_ip6_destroy_sock,
712 .setsockopt = ipv6_setsockopt,
713 .getsockopt = ipv6_getsockopt,
714 .sendmsg = l2tp_ip6_sendmsg,
715 .recvmsg = l2tp_ip6_recvmsg,
716 .backlog_rcv = l2tp_ip6_backlog_recv,
717 .hash = inet_hash,
718 .unhash = inet_unhash,
719 .obj_size = sizeof(struct l2tp_ip6_sock),
720#ifdef CONFIG_COMPAT
721 .compat_setsockopt = compat_ipv6_setsockopt,
722 .compat_getsockopt = compat_ipv6_getsockopt,
723#endif
724};
725
726static const struct proto_ops l2tp_ip6_ops = {
727 .family = PF_INET6,
728 .owner = THIS_MODULE,
729 .release = inet6_release,
730 .bind = inet6_bind,
731 .connect = inet_dgram_connect,
732 .socketpair = sock_no_socketpair,
733 .accept = sock_no_accept,
734 .getname = l2tp_ip6_getname,
735 .poll = datagram_poll,
736 .ioctl = inet6_ioctl,
737 .listen = sock_no_listen,
738 .shutdown = inet_shutdown,
739 .setsockopt = sock_common_setsockopt,
740 .getsockopt = sock_common_getsockopt,
741 .sendmsg = inet_sendmsg,
742 .recvmsg = sock_common_recvmsg,
743 .mmap = sock_no_mmap,
744 .sendpage = sock_no_sendpage,
745#ifdef CONFIG_COMPAT
746 .compat_setsockopt = compat_sock_common_setsockopt,
747 .compat_getsockopt = compat_sock_common_getsockopt,
748#endif
749};
750
751static struct inet_protosw l2tp_ip6_protosw = {
752 .type = SOCK_DGRAM,
753 .protocol = IPPROTO_L2TP,
754 .prot = &l2tp_ip6_prot,
755 .ops = &l2tp_ip6_ops,
756 .no_check = 0,
757};
758
759static struct inet6_protocol l2tp_ip6_protocol __read_mostly = {
760 .handler = l2tp_ip6_recv,
761};
762
763static int __init l2tp_ip6_init(void)
764{
765 int err;
766
767 pr_info("L2TP IP encapsulation support for IPv6 (L2TPv3)\n");
768
769 err = proto_register(&l2tp_ip6_prot, 1);
770 if (err != 0)
771 goto out;
772
773 err = inet6_add_protocol(&l2tp_ip6_protocol, IPPROTO_L2TP);
774 if (err)
775 goto out1;
776
777 inet6_register_protosw(&l2tp_ip6_protosw);
778 return 0;
779
780out1:
781 proto_unregister(&l2tp_ip6_prot);
782out:
783 return err;
784}
785
786static void __exit l2tp_ip6_exit(void)
787{
788 inet6_unregister_protosw(&l2tp_ip6_protosw);
789 inet6_del_protocol(&l2tp_ip6_protocol, IPPROTO_L2TP);
790 proto_unregister(&l2tp_ip6_prot);
791}
792
793module_init(l2tp_ip6_init);
794module_exit(l2tp_ip6_exit);
795
796MODULE_LICENSE("GPL");
797MODULE_AUTHOR("Chris Elston <celston@katalix.com>");
798MODULE_DESCRIPTION("L2TP IP encapsulation for IPv6");
799MODULE_VERSION("1.0");
800
/* Use the value of SOCK_DGRAM (2) directly, because __stringify doesn't like
 * enums
 */
804MODULE_ALIAS_NET_PF_PROTO_TYPE(PF_INET6, 2, IPPROTO_L2TP);