Loading...
1// SPDX-License-Identifier: GPL-2.0-only
2/*
3 * Copyright (c) 2008 Patrick McHardy <kaber@trash.net>
4 *
5 * Development of this code funded by Astaro AG (http://www.astaro.com/)
6 */
7
8#include <asm/unaligned.h>
9#include <linux/kernel.h>
10#include <linux/netlink.h>
11#include <linux/netfilter.h>
12#include <linux/netfilter/nf_tables.h>
13#include <linux/sctp.h>
14#include <net/netfilter/nf_tables_core.h>
15#include <net/netfilter/nf_tables.h>
16#include <net/sctp/sctp.h>
17#include <net/tcp.h>
18
19struct nft_exthdr {
20 u8 type;
21 u8 offset;
22 u8 len;
23 u8 op;
24 u8 dreg;
25 u8 sreg;
26 u8 flags;
27};
28
29static unsigned int optlen(const u8 *opt, unsigned int offset)
30{
31 /* Beware zero-length options: make finite progress */
32 if (opt[offset] <= TCPOPT_NOP || opt[offset + 1] == 0)
33 return 1;
34 else
35 return opt[offset + 1];
36}
37
38static void nft_exthdr_ipv6_eval(const struct nft_expr *expr,
39 struct nft_regs *regs,
40 const struct nft_pktinfo *pkt)
41{
42 struct nft_exthdr *priv = nft_expr_priv(expr);
43 u32 *dest = ®s->data[priv->dreg];
44 unsigned int offset = 0;
45 int err;
46
47 if (pkt->skb->protocol != htons(ETH_P_IPV6))
48 goto err;
49
50 err = ipv6_find_hdr(pkt->skb, &offset, priv->type, NULL, NULL);
51 if (priv->flags & NFT_EXTHDR_F_PRESENT) {
52 nft_reg_store8(dest, err >= 0);
53 return;
54 } else if (err < 0) {
55 goto err;
56 }
57 offset += priv->offset;
58
59 dest[priv->len / NFT_REG32_SIZE] = 0;
60 if (skb_copy_bits(pkt->skb, offset, dest, priv->len) < 0)
61 goto err;
62 return;
63err:
64 regs->verdict.code = NFT_BREAK;
65}
66
67/* find the offset to specified option.
68 *
69 * If target header is found, its offset is set in *offset and return option
70 * number. Otherwise, return negative error.
71 *
72 * If the first fragment doesn't contain the End of Options it is considered
73 * invalid.
74 */
75static int ipv4_find_option(struct net *net, struct sk_buff *skb,
76 unsigned int *offset, int target)
77{
78 unsigned char optbuf[sizeof(struct ip_options) + 40];
79 struct ip_options *opt = (struct ip_options *)optbuf;
80 struct iphdr *iph, _iph;
81 unsigned int start;
82 bool found = false;
83 __be32 info;
84 int optlen;
85
86 iph = skb_header_pointer(skb, 0, sizeof(_iph), &_iph);
87 if (!iph)
88 return -EBADMSG;
89 start = sizeof(struct iphdr);
90
91 optlen = iph->ihl * 4 - (int)sizeof(struct iphdr);
92 if (optlen <= 0)
93 return -ENOENT;
94
95 memset(opt, 0, sizeof(struct ip_options));
96 /* Copy the options since __ip_options_compile() modifies
97 * the options.
98 */
99 if (skb_copy_bits(skb, start, opt->__data, optlen))
100 return -EBADMSG;
101 opt->optlen = optlen;
102
103 if (__ip_options_compile(net, opt, NULL, &info))
104 return -EBADMSG;
105
106 switch (target) {
107 case IPOPT_SSRR:
108 case IPOPT_LSRR:
109 if (!opt->srr)
110 break;
111 found = target == IPOPT_SSRR ? opt->is_strictroute :
112 !opt->is_strictroute;
113 if (found)
114 *offset = opt->srr + start;
115 break;
116 case IPOPT_RR:
117 if (!opt->rr)
118 break;
119 *offset = opt->rr + start;
120 found = true;
121 break;
122 case IPOPT_RA:
123 if (!opt->router_alert)
124 break;
125 *offset = opt->router_alert + start;
126 found = true;
127 break;
128 default:
129 return -EOPNOTSUPP;
130 }
131 return found ? target : -ENOENT;
132}
133
134static void nft_exthdr_ipv4_eval(const struct nft_expr *expr,
135 struct nft_regs *regs,
136 const struct nft_pktinfo *pkt)
137{
138 struct nft_exthdr *priv = nft_expr_priv(expr);
139 u32 *dest = ®s->data[priv->dreg];
140 struct sk_buff *skb = pkt->skb;
141 unsigned int offset;
142 int err;
143
144 if (skb->protocol != htons(ETH_P_IP))
145 goto err;
146
147 err = ipv4_find_option(nft_net(pkt), skb, &offset, priv->type);
148 if (priv->flags & NFT_EXTHDR_F_PRESENT) {
149 nft_reg_store8(dest, err >= 0);
150 return;
151 } else if (err < 0) {
152 goto err;
153 }
154 offset += priv->offset;
155
156 dest[priv->len / NFT_REG32_SIZE] = 0;
157 if (skb_copy_bits(pkt->skb, offset, dest, priv->len) < 0)
158 goto err;
159 return;
160err:
161 regs->verdict.code = NFT_BREAK;
162}
163
164static void *
165nft_tcp_header_pointer(const struct nft_pktinfo *pkt,
166 unsigned int len, void *buffer, unsigned int *tcphdr_len)
167{
168 struct tcphdr *tcph;
169
170 if (pkt->tprot != IPPROTO_TCP)
171 return NULL;
172
173 tcph = skb_header_pointer(pkt->skb, nft_thoff(pkt), sizeof(*tcph), buffer);
174 if (!tcph)
175 return NULL;
176
177 *tcphdr_len = __tcp_hdrlen(tcph);
178 if (*tcphdr_len < sizeof(*tcph) || *tcphdr_len > len)
179 return NULL;
180
181 return skb_header_pointer(pkt->skb, nft_thoff(pkt), *tcphdr_len, buffer);
182}
183
184static void nft_exthdr_tcp_eval(const struct nft_expr *expr,
185 struct nft_regs *regs,
186 const struct nft_pktinfo *pkt)
187{
188 u8 buff[sizeof(struct tcphdr) + MAX_TCP_OPTION_SPACE];
189 struct nft_exthdr *priv = nft_expr_priv(expr);
190 unsigned int i, optl, tcphdr_len, offset;
191 u32 *dest = ®s->data[priv->dreg];
192 struct tcphdr *tcph;
193 u8 *opt;
194
195 tcph = nft_tcp_header_pointer(pkt, sizeof(buff), buff, &tcphdr_len);
196 if (!tcph)
197 goto err;
198
199 opt = (u8 *)tcph;
200 for (i = sizeof(*tcph); i < tcphdr_len - 1; i += optl) {
201 optl = optlen(opt, i);
202
203 if (priv->type != opt[i])
204 continue;
205
206 if (i + optl > tcphdr_len || priv->len + priv->offset > optl)
207 goto err;
208
209 offset = i + priv->offset;
210 if (priv->flags & NFT_EXTHDR_F_PRESENT) {
211 *dest = 1;
212 } else {
213 dest[priv->len / NFT_REG32_SIZE] = 0;
214 memcpy(dest, opt + offset, priv->len);
215 }
216
217 return;
218 }
219
220err:
221 if (priv->flags & NFT_EXTHDR_F_PRESENT)
222 *dest = 0;
223 else
224 regs->verdict.code = NFT_BREAK;
225}
226
227static void nft_exthdr_tcp_set_eval(const struct nft_expr *expr,
228 struct nft_regs *regs,
229 const struct nft_pktinfo *pkt)
230{
231 u8 buff[sizeof(struct tcphdr) + MAX_TCP_OPTION_SPACE];
232 struct nft_exthdr *priv = nft_expr_priv(expr);
233 unsigned int i, optl, tcphdr_len, offset;
234 struct tcphdr *tcph;
235 u8 *opt;
236
237 tcph = nft_tcp_header_pointer(pkt, sizeof(buff), buff, &tcphdr_len);
238 if (!tcph)
239 return;
240
241 opt = (u8 *)tcph;
242 for (i = sizeof(*tcph); i < tcphdr_len - 1; i += optl) {
243 union {
244 __be16 v16;
245 __be32 v32;
246 } old, new;
247
248 optl = optlen(opt, i);
249
250 if (priv->type != opt[i])
251 continue;
252
253 if (i + optl > tcphdr_len || priv->len + priv->offset > optl)
254 return;
255
256 if (skb_ensure_writable(pkt->skb,
257 nft_thoff(pkt) + i + priv->len))
258 return;
259
260 tcph = nft_tcp_header_pointer(pkt, sizeof(buff), buff,
261 &tcphdr_len);
262 if (!tcph)
263 return;
264
265 offset = i + priv->offset;
266
267 switch (priv->len) {
268 case 2:
269 old.v16 = get_unaligned((u16 *)(opt + offset));
270 new.v16 = (__force __be16)nft_reg_load16(
271 ®s->data[priv->sreg]);
272
273 switch (priv->type) {
274 case TCPOPT_MSS:
275 /* increase can cause connection to stall */
276 if (ntohs(old.v16) <= ntohs(new.v16))
277 return;
278 break;
279 }
280
281 if (old.v16 == new.v16)
282 return;
283
284 put_unaligned(new.v16, (u16*)(opt + offset));
285 inet_proto_csum_replace2(&tcph->check, pkt->skb,
286 old.v16, new.v16, false);
287 break;
288 case 4:
289 new.v32 = regs->data[priv->sreg];
290 old.v32 = get_unaligned((u32 *)(opt + offset));
291
292 if (old.v32 == new.v32)
293 return;
294
295 put_unaligned(new.v32, (u32*)(opt + offset));
296 inet_proto_csum_replace4(&tcph->check, pkt->skb,
297 old.v32, new.v32, false);
298 break;
299 default:
300 WARN_ON_ONCE(1);
301 break;
302 }
303
304 return;
305 }
306}
307
308static void nft_exthdr_sctp_eval(const struct nft_expr *expr,
309 struct nft_regs *regs,
310 const struct nft_pktinfo *pkt)
311{
312 unsigned int offset = nft_thoff(pkt) + sizeof(struct sctphdr);
313 struct nft_exthdr *priv = nft_expr_priv(expr);
314 u32 *dest = ®s->data[priv->dreg];
315 const struct sctp_chunkhdr *sch;
316 struct sctp_chunkhdr _sch;
317
318 if (pkt->tprot != IPPROTO_SCTP)
319 goto err;
320
321 do {
322 sch = skb_header_pointer(pkt->skb, offset, sizeof(_sch), &_sch);
323 if (!sch || !sch->length)
324 break;
325
326 if (sch->type == priv->type) {
327 if (priv->flags & NFT_EXTHDR_F_PRESENT) {
328 nft_reg_store8(dest, true);
329 return;
330 }
331 if (priv->offset + priv->len > ntohs(sch->length) ||
332 offset + ntohs(sch->length) > pkt->skb->len)
333 break;
334
335 dest[priv->len / NFT_REG32_SIZE] = 0;
336 if (skb_copy_bits(pkt->skb, offset + priv->offset,
337 dest, priv->len) < 0)
338 break;
339 return;
340 }
341 offset += SCTP_PAD4(ntohs(sch->length));
342 } while (offset < pkt->skb->len);
343err:
344 if (priv->flags & NFT_EXTHDR_F_PRESENT)
345 nft_reg_store8(dest, false);
346 else
347 regs->verdict.code = NFT_BREAK;
348}
349
350static const struct nla_policy nft_exthdr_policy[NFTA_EXTHDR_MAX + 1] = {
351 [NFTA_EXTHDR_DREG] = { .type = NLA_U32 },
352 [NFTA_EXTHDR_TYPE] = { .type = NLA_U8 },
353 [NFTA_EXTHDR_OFFSET] = { .type = NLA_U32 },
354 [NFTA_EXTHDR_LEN] = { .type = NLA_U32 },
355 [NFTA_EXTHDR_FLAGS] = { .type = NLA_U32 },
356 [NFTA_EXTHDR_OP] = { .type = NLA_U32 },
357 [NFTA_EXTHDR_SREG] = { .type = NLA_U32 },
358};
359
360static int nft_exthdr_init(const struct nft_ctx *ctx,
361 const struct nft_expr *expr,
362 const struct nlattr * const tb[])
363{
364 struct nft_exthdr *priv = nft_expr_priv(expr);
365 u32 offset, len, flags = 0, op = NFT_EXTHDR_OP_IPV6;
366 int err;
367
368 if (!tb[NFTA_EXTHDR_DREG] ||
369 !tb[NFTA_EXTHDR_TYPE] ||
370 !tb[NFTA_EXTHDR_OFFSET] ||
371 !tb[NFTA_EXTHDR_LEN])
372 return -EINVAL;
373
374 err = nft_parse_u32_check(tb[NFTA_EXTHDR_OFFSET], U8_MAX, &offset);
375 if (err < 0)
376 return err;
377
378 err = nft_parse_u32_check(tb[NFTA_EXTHDR_LEN], U8_MAX, &len);
379 if (err < 0)
380 return err;
381
382 if (tb[NFTA_EXTHDR_FLAGS]) {
383 err = nft_parse_u32_check(tb[NFTA_EXTHDR_FLAGS], U8_MAX, &flags);
384 if (err < 0)
385 return err;
386
387 if (flags & ~NFT_EXTHDR_F_PRESENT)
388 return -EINVAL;
389 }
390
391 if (tb[NFTA_EXTHDR_OP]) {
392 err = nft_parse_u32_check(tb[NFTA_EXTHDR_OP], U8_MAX, &op);
393 if (err < 0)
394 return err;
395 }
396
397 priv->type = nla_get_u8(tb[NFTA_EXTHDR_TYPE]);
398 priv->offset = offset;
399 priv->len = len;
400 priv->flags = flags;
401 priv->op = op;
402
403 return nft_parse_register_store(ctx, tb[NFTA_EXTHDR_DREG],
404 &priv->dreg, NULL, NFT_DATA_VALUE,
405 priv->len);
406}
407
408static int nft_exthdr_tcp_set_init(const struct nft_ctx *ctx,
409 const struct nft_expr *expr,
410 const struct nlattr * const tb[])
411{
412 struct nft_exthdr *priv = nft_expr_priv(expr);
413 u32 offset, len, flags = 0, op = NFT_EXTHDR_OP_IPV6;
414 int err;
415
416 if (!tb[NFTA_EXTHDR_SREG] ||
417 !tb[NFTA_EXTHDR_TYPE] ||
418 !tb[NFTA_EXTHDR_OFFSET] ||
419 !tb[NFTA_EXTHDR_LEN])
420 return -EINVAL;
421
422 if (tb[NFTA_EXTHDR_DREG] || tb[NFTA_EXTHDR_FLAGS])
423 return -EINVAL;
424
425 err = nft_parse_u32_check(tb[NFTA_EXTHDR_OFFSET], U8_MAX, &offset);
426 if (err < 0)
427 return err;
428
429 err = nft_parse_u32_check(tb[NFTA_EXTHDR_LEN], U8_MAX, &len);
430 if (err < 0)
431 return err;
432
433 if (offset < 2)
434 return -EOPNOTSUPP;
435
436 switch (len) {
437 case 2: break;
438 case 4: break;
439 default:
440 return -EOPNOTSUPP;
441 }
442
443 err = nft_parse_u32_check(tb[NFTA_EXTHDR_OP], U8_MAX, &op);
444 if (err < 0)
445 return err;
446
447 priv->type = nla_get_u8(tb[NFTA_EXTHDR_TYPE]);
448 priv->offset = offset;
449 priv->len = len;
450 priv->flags = flags;
451 priv->op = op;
452
453 return nft_parse_register_load(tb[NFTA_EXTHDR_SREG], &priv->sreg,
454 priv->len);
455}
456
457static int nft_exthdr_ipv4_init(const struct nft_ctx *ctx,
458 const struct nft_expr *expr,
459 const struct nlattr * const tb[])
460{
461 struct nft_exthdr *priv = nft_expr_priv(expr);
462 int err = nft_exthdr_init(ctx, expr, tb);
463
464 if (err < 0)
465 return err;
466
467 switch (priv->type) {
468 case IPOPT_SSRR:
469 case IPOPT_LSRR:
470 case IPOPT_RR:
471 case IPOPT_RA:
472 break;
473 default:
474 return -EOPNOTSUPP;
475 }
476 return 0;
477}
478
479static int nft_exthdr_dump_common(struct sk_buff *skb, const struct nft_exthdr *priv)
480{
481 if (nla_put_u8(skb, NFTA_EXTHDR_TYPE, priv->type))
482 goto nla_put_failure;
483 if (nla_put_be32(skb, NFTA_EXTHDR_OFFSET, htonl(priv->offset)))
484 goto nla_put_failure;
485 if (nla_put_be32(skb, NFTA_EXTHDR_LEN, htonl(priv->len)))
486 goto nla_put_failure;
487 if (nla_put_be32(skb, NFTA_EXTHDR_FLAGS, htonl(priv->flags)))
488 goto nla_put_failure;
489 if (nla_put_be32(skb, NFTA_EXTHDR_OP, htonl(priv->op)))
490 goto nla_put_failure;
491 return 0;
492
493nla_put_failure:
494 return -1;
495}
496
497static int nft_exthdr_dump(struct sk_buff *skb, const struct nft_expr *expr)
498{
499 const struct nft_exthdr *priv = nft_expr_priv(expr);
500
501 if (nft_dump_register(skb, NFTA_EXTHDR_DREG, priv->dreg))
502 return -1;
503
504 return nft_exthdr_dump_common(skb, priv);
505}
506
507static int nft_exthdr_dump_set(struct sk_buff *skb, const struct nft_expr *expr)
508{
509 const struct nft_exthdr *priv = nft_expr_priv(expr);
510
511 if (nft_dump_register(skb, NFTA_EXTHDR_SREG, priv->sreg))
512 return -1;
513
514 return nft_exthdr_dump_common(skb, priv);
515}
516
517static const struct nft_expr_ops nft_exthdr_ipv6_ops = {
518 .type = &nft_exthdr_type,
519 .size = NFT_EXPR_SIZE(sizeof(struct nft_exthdr)),
520 .eval = nft_exthdr_ipv6_eval,
521 .init = nft_exthdr_init,
522 .dump = nft_exthdr_dump,
523};
524
525static const struct nft_expr_ops nft_exthdr_ipv4_ops = {
526 .type = &nft_exthdr_type,
527 .size = NFT_EXPR_SIZE(sizeof(struct nft_exthdr)),
528 .eval = nft_exthdr_ipv4_eval,
529 .init = nft_exthdr_ipv4_init,
530 .dump = nft_exthdr_dump,
531};
532
533static const struct nft_expr_ops nft_exthdr_tcp_ops = {
534 .type = &nft_exthdr_type,
535 .size = NFT_EXPR_SIZE(sizeof(struct nft_exthdr)),
536 .eval = nft_exthdr_tcp_eval,
537 .init = nft_exthdr_init,
538 .dump = nft_exthdr_dump,
539};
540
541static const struct nft_expr_ops nft_exthdr_tcp_set_ops = {
542 .type = &nft_exthdr_type,
543 .size = NFT_EXPR_SIZE(sizeof(struct nft_exthdr)),
544 .eval = nft_exthdr_tcp_set_eval,
545 .init = nft_exthdr_tcp_set_init,
546 .dump = nft_exthdr_dump_set,
547};
548
549static const struct nft_expr_ops nft_exthdr_sctp_ops = {
550 .type = &nft_exthdr_type,
551 .size = NFT_EXPR_SIZE(sizeof(struct nft_exthdr)),
552 .eval = nft_exthdr_sctp_eval,
553 .init = nft_exthdr_init,
554 .dump = nft_exthdr_dump,
555};
556
557static const struct nft_expr_ops *
558nft_exthdr_select_ops(const struct nft_ctx *ctx,
559 const struct nlattr * const tb[])
560{
561 u32 op;
562
563 if (!tb[NFTA_EXTHDR_OP])
564 return &nft_exthdr_ipv6_ops;
565
566 if (tb[NFTA_EXTHDR_SREG] && tb[NFTA_EXTHDR_DREG])
567 return ERR_PTR(-EOPNOTSUPP);
568
569 op = ntohl(nla_get_be32(tb[NFTA_EXTHDR_OP]));
570 switch (op) {
571 case NFT_EXTHDR_OP_TCPOPT:
572 if (tb[NFTA_EXTHDR_SREG])
573 return &nft_exthdr_tcp_set_ops;
574 if (tb[NFTA_EXTHDR_DREG])
575 return &nft_exthdr_tcp_ops;
576 break;
577 case NFT_EXTHDR_OP_IPV6:
578 if (tb[NFTA_EXTHDR_DREG])
579 return &nft_exthdr_ipv6_ops;
580 break;
581 case NFT_EXTHDR_OP_IPV4:
582 if (ctx->family != NFPROTO_IPV6) {
583 if (tb[NFTA_EXTHDR_DREG])
584 return &nft_exthdr_ipv4_ops;
585 }
586 break;
587 case NFT_EXTHDR_OP_SCTP:
588 if (tb[NFTA_EXTHDR_DREG])
589 return &nft_exthdr_sctp_ops;
590 break;
591 }
592
593 return ERR_PTR(-EOPNOTSUPP);
594}
595
596struct nft_expr_type nft_exthdr_type __read_mostly = {
597 .name = "exthdr",
598 .select_ops = nft_exthdr_select_ops,
599 .policy = nft_exthdr_policy,
600 .maxattr = NFTA_EXTHDR_MAX,
601 .owner = THIS_MODULE,
602};
1// SPDX-License-Identifier: GPL-2.0-only
2/*
3 * Copyright (c) 2008 Patrick McHardy <kaber@trash.net>
4 *
5 * Development of this code funded by Astaro AG (http://www.astaro.com/)
6 */
7
8#include <asm/unaligned.h>
9#include <linux/kernel.h>
10#include <linux/netlink.h>
11#include <linux/netfilter.h>
12#include <linux/netfilter/nf_tables.h>
13#include <linux/sctp.h>
14#include <net/netfilter/nf_tables_core.h>
15#include <net/netfilter/nf_tables.h>
16#include <net/tcp.h>
17
18struct nft_exthdr {
19 u8 type;
20 u8 offset;
21 u8 len;
22 u8 op;
23 u8 dreg;
24 u8 sreg;
25 u8 flags;
26};
27
28static unsigned int optlen(const u8 *opt, unsigned int offset)
29{
30 /* Beware zero-length options: make finite progress */
31 if (opt[offset] <= TCPOPT_NOP || opt[offset + 1] == 0)
32 return 1;
33 else
34 return opt[offset + 1];
35}
36
37static void nft_exthdr_ipv6_eval(const struct nft_expr *expr,
38 struct nft_regs *regs,
39 const struct nft_pktinfo *pkt)
40{
41 struct nft_exthdr *priv = nft_expr_priv(expr);
42 u32 *dest = ®s->data[priv->dreg];
43 unsigned int offset = 0;
44 int err;
45
46 if (pkt->skb->protocol != htons(ETH_P_IPV6))
47 goto err;
48
49 err = ipv6_find_hdr(pkt->skb, &offset, priv->type, NULL, NULL);
50 if (priv->flags & NFT_EXTHDR_F_PRESENT) {
51 nft_reg_store8(dest, err >= 0);
52 return;
53 } else if (err < 0) {
54 goto err;
55 }
56 offset += priv->offset;
57
58 dest[priv->len / NFT_REG32_SIZE] = 0;
59 if (skb_copy_bits(pkt->skb, offset, dest, priv->len) < 0)
60 goto err;
61 return;
62err:
63 regs->verdict.code = NFT_BREAK;
64}
65
66/* find the offset to specified option.
67 *
68 * If target header is found, its offset is set in *offset and return option
69 * number. Otherwise, return negative error.
70 *
71 * If the first fragment doesn't contain the End of Options it is considered
72 * invalid.
73 */
74static int ipv4_find_option(struct net *net, struct sk_buff *skb,
75 unsigned int *offset, int target)
76{
77 unsigned char optbuf[sizeof(struct ip_options) + 40];
78 struct ip_options *opt = (struct ip_options *)optbuf;
79 struct iphdr *iph, _iph;
80 unsigned int start;
81 bool found = false;
82 __be32 info;
83 int optlen;
84
85 iph = skb_header_pointer(skb, 0, sizeof(_iph), &_iph);
86 if (!iph)
87 return -EBADMSG;
88 start = sizeof(struct iphdr);
89
90 optlen = iph->ihl * 4 - (int)sizeof(struct iphdr);
91 if (optlen <= 0)
92 return -ENOENT;
93
94 memset(opt, 0, sizeof(struct ip_options));
95 /* Copy the options since __ip_options_compile() modifies
96 * the options.
97 */
98 if (skb_copy_bits(skb, start, opt->__data, optlen))
99 return -EBADMSG;
100 opt->optlen = optlen;
101
102 if (__ip_options_compile(net, opt, NULL, &info))
103 return -EBADMSG;
104
105 switch (target) {
106 case IPOPT_SSRR:
107 case IPOPT_LSRR:
108 if (!opt->srr)
109 break;
110 found = target == IPOPT_SSRR ? opt->is_strictroute :
111 !opt->is_strictroute;
112 if (found)
113 *offset = opt->srr + start;
114 break;
115 case IPOPT_RR:
116 if (!opt->rr)
117 break;
118 *offset = opt->rr + start;
119 found = true;
120 break;
121 case IPOPT_RA:
122 if (!opt->router_alert)
123 break;
124 *offset = opt->router_alert + start;
125 found = true;
126 break;
127 default:
128 return -EOPNOTSUPP;
129 }
130 return found ? target : -ENOENT;
131}
132
133static void nft_exthdr_ipv4_eval(const struct nft_expr *expr,
134 struct nft_regs *regs,
135 const struct nft_pktinfo *pkt)
136{
137 struct nft_exthdr *priv = nft_expr_priv(expr);
138 u32 *dest = ®s->data[priv->dreg];
139 struct sk_buff *skb = pkt->skb;
140 unsigned int offset;
141 int err;
142
143 if (skb->protocol != htons(ETH_P_IP))
144 goto err;
145
146 err = ipv4_find_option(nft_net(pkt), skb, &offset, priv->type);
147 if (priv->flags & NFT_EXTHDR_F_PRESENT) {
148 nft_reg_store8(dest, err >= 0);
149 return;
150 } else if (err < 0) {
151 goto err;
152 }
153 offset += priv->offset;
154
155 dest[priv->len / NFT_REG32_SIZE] = 0;
156 if (skb_copy_bits(pkt->skb, offset, dest, priv->len) < 0)
157 goto err;
158 return;
159err:
160 regs->verdict.code = NFT_BREAK;
161}
162
163static void *
164nft_tcp_header_pointer(const struct nft_pktinfo *pkt,
165 unsigned int len, void *buffer, unsigned int *tcphdr_len)
166{
167 struct tcphdr *tcph;
168
169 if (pkt->tprot != IPPROTO_TCP || pkt->fragoff)
170 return NULL;
171
172 tcph = skb_header_pointer(pkt->skb, nft_thoff(pkt), sizeof(*tcph), buffer);
173 if (!tcph)
174 return NULL;
175
176 *tcphdr_len = __tcp_hdrlen(tcph);
177 if (*tcphdr_len < sizeof(*tcph) || *tcphdr_len > len)
178 return NULL;
179
180 return skb_header_pointer(pkt->skb, nft_thoff(pkt), *tcphdr_len, buffer);
181}
182
183static void nft_exthdr_tcp_eval(const struct nft_expr *expr,
184 struct nft_regs *regs,
185 const struct nft_pktinfo *pkt)
186{
187 u8 buff[sizeof(struct tcphdr) + MAX_TCP_OPTION_SPACE];
188 struct nft_exthdr *priv = nft_expr_priv(expr);
189 unsigned int i, optl, tcphdr_len, offset;
190 u32 *dest = ®s->data[priv->dreg];
191 struct tcphdr *tcph;
192 u8 *opt;
193
194 tcph = nft_tcp_header_pointer(pkt, sizeof(buff), buff, &tcphdr_len);
195 if (!tcph)
196 goto err;
197
198 opt = (u8 *)tcph;
199 for (i = sizeof(*tcph); i < tcphdr_len - 1; i += optl) {
200 optl = optlen(opt, i);
201
202 if (priv->type != opt[i])
203 continue;
204
205 if (i + optl > tcphdr_len || priv->len + priv->offset > optl)
206 goto err;
207
208 offset = i + priv->offset;
209 if (priv->flags & NFT_EXTHDR_F_PRESENT) {
210 *dest = 1;
211 } else {
212 dest[priv->len / NFT_REG32_SIZE] = 0;
213 memcpy(dest, opt + offset, priv->len);
214 }
215
216 return;
217 }
218
219err:
220 if (priv->flags & NFT_EXTHDR_F_PRESENT)
221 *dest = 0;
222 else
223 regs->verdict.code = NFT_BREAK;
224}
225
226static void nft_exthdr_tcp_set_eval(const struct nft_expr *expr,
227 struct nft_regs *regs,
228 const struct nft_pktinfo *pkt)
229{
230 u8 buff[sizeof(struct tcphdr) + MAX_TCP_OPTION_SPACE];
231 struct nft_exthdr *priv = nft_expr_priv(expr);
232 unsigned int i, optl, tcphdr_len, offset;
233 struct tcphdr *tcph;
234 u8 *opt;
235
236 tcph = nft_tcp_header_pointer(pkt, sizeof(buff), buff, &tcphdr_len);
237 if (!tcph)
238 goto err;
239
240 opt = (u8 *)tcph;
241 for (i = sizeof(*tcph); i < tcphdr_len - 1; i += optl) {
242 union {
243 __be16 v16;
244 __be32 v32;
245 } old, new;
246
247 optl = optlen(opt, i);
248
249 if (priv->type != opt[i])
250 continue;
251
252 if (i + optl > tcphdr_len || priv->len + priv->offset > optl)
253 goto err;
254
255 if (skb_ensure_writable(pkt->skb,
256 nft_thoff(pkt) + i + priv->len))
257 goto err;
258
259 tcph = nft_tcp_header_pointer(pkt, sizeof(buff), buff,
260 &tcphdr_len);
261 if (!tcph)
262 goto err;
263
264 offset = i + priv->offset;
265
266 switch (priv->len) {
267 case 2:
268 old.v16 = (__force __be16)get_unaligned((u16 *)(opt + offset));
269 new.v16 = (__force __be16)nft_reg_load16(
270 ®s->data[priv->sreg]);
271
272 switch (priv->type) {
273 case TCPOPT_MSS:
274 /* increase can cause connection to stall */
275 if (ntohs(old.v16) <= ntohs(new.v16))
276 return;
277 break;
278 }
279
280 if (old.v16 == new.v16)
281 return;
282
283 put_unaligned(new.v16, (__be16*)(opt + offset));
284 inet_proto_csum_replace2(&tcph->check, pkt->skb,
285 old.v16, new.v16, false);
286 break;
287 case 4:
288 new.v32 = nft_reg_load_be32(®s->data[priv->sreg]);
289 old.v32 = (__force __be32)get_unaligned((u32 *)(opt + offset));
290
291 if (old.v32 == new.v32)
292 return;
293
294 put_unaligned(new.v32, (__be32*)(opt + offset));
295 inet_proto_csum_replace4(&tcph->check, pkt->skb,
296 old.v32, new.v32, false);
297 break;
298 default:
299 WARN_ON_ONCE(1);
300 break;
301 }
302
303 return;
304 }
305 return;
306err:
307 regs->verdict.code = NFT_BREAK;
308}
309
310static void nft_exthdr_tcp_strip_eval(const struct nft_expr *expr,
311 struct nft_regs *regs,
312 const struct nft_pktinfo *pkt)
313{
314 u8 buff[sizeof(struct tcphdr) + MAX_TCP_OPTION_SPACE];
315 struct nft_exthdr *priv = nft_expr_priv(expr);
316 unsigned int i, tcphdr_len, optl;
317 struct tcphdr *tcph;
318 u8 *opt;
319
320 tcph = nft_tcp_header_pointer(pkt, sizeof(buff), buff, &tcphdr_len);
321 if (!tcph)
322 goto err;
323
324 if (skb_ensure_writable(pkt->skb, nft_thoff(pkt) + tcphdr_len))
325 goto drop;
326
327 opt = (u8 *)nft_tcp_header_pointer(pkt, sizeof(buff), buff, &tcphdr_len);
328 if (!opt)
329 goto err;
330 for (i = sizeof(*tcph); i < tcphdr_len - 1; i += optl) {
331 unsigned int j;
332
333 optl = optlen(opt, i);
334 if (priv->type != opt[i])
335 continue;
336
337 if (i + optl > tcphdr_len)
338 goto drop;
339
340 for (j = 0; j < optl; ++j) {
341 u16 n = TCPOPT_NOP;
342 u16 o = opt[i+j];
343
344 if ((i + j) % 2 == 0) {
345 o <<= 8;
346 n <<= 8;
347 }
348 inet_proto_csum_replace2(&tcph->check, pkt->skb, htons(o),
349 htons(n), false);
350 }
351 memset(opt + i, TCPOPT_NOP, optl);
352 return;
353 }
354
355 /* option not found, continue. This allows to do multiple
356 * option removals per rule.
357 */
358 return;
359err:
360 regs->verdict.code = NFT_BREAK;
361 return;
362drop:
363 /* can't remove, no choice but to drop */
364 regs->verdict.code = NF_DROP;
365}
366
367static void nft_exthdr_sctp_eval(const struct nft_expr *expr,
368 struct nft_regs *regs,
369 const struct nft_pktinfo *pkt)
370{
371 unsigned int offset = nft_thoff(pkt) + sizeof(struct sctphdr);
372 struct nft_exthdr *priv = nft_expr_priv(expr);
373 u32 *dest = ®s->data[priv->dreg];
374 const struct sctp_chunkhdr *sch;
375 struct sctp_chunkhdr _sch;
376
377 if (pkt->tprot != IPPROTO_SCTP)
378 goto err;
379
380 do {
381 sch = skb_header_pointer(pkt->skb, offset, sizeof(_sch), &_sch);
382 if (!sch || !sch->length)
383 break;
384
385 if (sch->type == priv->type) {
386 if (priv->flags & NFT_EXTHDR_F_PRESENT) {
387 nft_reg_store8(dest, true);
388 return;
389 }
390 if (priv->offset + priv->len > ntohs(sch->length) ||
391 offset + ntohs(sch->length) > pkt->skb->len)
392 break;
393
394 dest[priv->len / NFT_REG32_SIZE] = 0;
395 if (skb_copy_bits(pkt->skb, offset + priv->offset,
396 dest, priv->len) < 0)
397 break;
398 return;
399 }
400 offset += SCTP_PAD4(ntohs(sch->length));
401 } while (offset < pkt->skb->len);
402err:
403 if (priv->flags & NFT_EXTHDR_F_PRESENT)
404 nft_reg_store8(dest, false);
405 else
406 regs->verdict.code = NFT_BREAK;
407}
408
409static const struct nla_policy nft_exthdr_policy[NFTA_EXTHDR_MAX + 1] = {
410 [NFTA_EXTHDR_DREG] = { .type = NLA_U32 },
411 [NFTA_EXTHDR_TYPE] = { .type = NLA_U8 },
412 [NFTA_EXTHDR_OFFSET] = { .type = NLA_U32 },
413 [NFTA_EXTHDR_LEN] = { .type = NLA_U32 },
414 [NFTA_EXTHDR_FLAGS] = { .type = NLA_U32 },
415 [NFTA_EXTHDR_OP] = { .type = NLA_U32 },
416 [NFTA_EXTHDR_SREG] = { .type = NLA_U32 },
417};
418
419static int nft_exthdr_init(const struct nft_ctx *ctx,
420 const struct nft_expr *expr,
421 const struct nlattr * const tb[])
422{
423 struct nft_exthdr *priv = nft_expr_priv(expr);
424 u32 offset, len, flags = 0, op = NFT_EXTHDR_OP_IPV6;
425 int err;
426
427 if (!tb[NFTA_EXTHDR_DREG] ||
428 !tb[NFTA_EXTHDR_TYPE] ||
429 !tb[NFTA_EXTHDR_OFFSET] ||
430 !tb[NFTA_EXTHDR_LEN])
431 return -EINVAL;
432
433 err = nft_parse_u32_check(tb[NFTA_EXTHDR_OFFSET], U8_MAX, &offset);
434 if (err < 0)
435 return err;
436
437 err = nft_parse_u32_check(tb[NFTA_EXTHDR_LEN], U8_MAX, &len);
438 if (err < 0)
439 return err;
440
441 if (tb[NFTA_EXTHDR_FLAGS]) {
442 err = nft_parse_u32_check(tb[NFTA_EXTHDR_FLAGS], U8_MAX, &flags);
443 if (err < 0)
444 return err;
445
446 if (flags & ~NFT_EXTHDR_F_PRESENT)
447 return -EINVAL;
448 }
449
450 if (tb[NFTA_EXTHDR_OP]) {
451 err = nft_parse_u32_check(tb[NFTA_EXTHDR_OP], U8_MAX, &op);
452 if (err < 0)
453 return err;
454 }
455
456 priv->type = nla_get_u8(tb[NFTA_EXTHDR_TYPE]);
457 priv->offset = offset;
458 priv->len = len;
459 priv->flags = flags;
460 priv->op = op;
461
462 return nft_parse_register_store(ctx, tb[NFTA_EXTHDR_DREG],
463 &priv->dreg, NULL, NFT_DATA_VALUE,
464 priv->len);
465}
466
467static int nft_exthdr_tcp_set_init(const struct nft_ctx *ctx,
468 const struct nft_expr *expr,
469 const struct nlattr * const tb[])
470{
471 struct nft_exthdr *priv = nft_expr_priv(expr);
472 u32 offset, len, flags = 0, op = NFT_EXTHDR_OP_IPV6;
473 int err;
474
475 if (!tb[NFTA_EXTHDR_SREG] ||
476 !tb[NFTA_EXTHDR_TYPE] ||
477 !tb[NFTA_EXTHDR_OFFSET] ||
478 !tb[NFTA_EXTHDR_LEN])
479 return -EINVAL;
480
481 if (tb[NFTA_EXTHDR_DREG] || tb[NFTA_EXTHDR_FLAGS])
482 return -EINVAL;
483
484 err = nft_parse_u32_check(tb[NFTA_EXTHDR_OFFSET], U8_MAX, &offset);
485 if (err < 0)
486 return err;
487
488 err = nft_parse_u32_check(tb[NFTA_EXTHDR_LEN], U8_MAX, &len);
489 if (err < 0)
490 return err;
491
492 if (offset < 2)
493 return -EOPNOTSUPP;
494
495 switch (len) {
496 case 2: break;
497 case 4: break;
498 default:
499 return -EOPNOTSUPP;
500 }
501
502 err = nft_parse_u32_check(tb[NFTA_EXTHDR_OP], U8_MAX, &op);
503 if (err < 0)
504 return err;
505
506 priv->type = nla_get_u8(tb[NFTA_EXTHDR_TYPE]);
507 priv->offset = offset;
508 priv->len = len;
509 priv->flags = flags;
510 priv->op = op;
511
512 return nft_parse_register_load(tb[NFTA_EXTHDR_SREG], &priv->sreg,
513 priv->len);
514}
515
516static int nft_exthdr_tcp_strip_init(const struct nft_ctx *ctx,
517 const struct nft_expr *expr,
518 const struct nlattr * const tb[])
519{
520 struct nft_exthdr *priv = nft_expr_priv(expr);
521
522 if (tb[NFTA_EXTHDR_SREG] ||
523 tb[NFTA_EXTHDR_DREG] ||
524 tb[NFTA_EXTHDR_FLAGS] ||
525 tb[NFTA_EXTHDR_OFFSET] ||
526 tb[NFTA_EXTHDR_LEN])
527 return -EINVAL;
528
529 if (!tb[NFTA_EXTHDR_TYPE])
530 return -EINVAL;
531
532 priv->type = nla_get_u8(tb[NFTA_EXTHDR_TYPE]);
533 priv->op = NFT_EXTHDR_OP_TCPOPT;
534
535 return 0;
536}
537
538static int nft_exthdr_ipv4_init(const struct nft_ctx *ctx,
539 const struct nft_expr *expr,
540 const struct nlattr * const tb[])
541{
542 struct nft_exthdr *priv = nft_expr_priv(expr);
543 int err = nft_exthdr_init(ctx, expr, tb);
544
545 if (err < 0)
546 return err;
547
548 switch (priv->type) {
549 case IPOPT_SSRR:
550 case IPOPT_LSRR:
551 case IPOPT_RR:
552 case IPOPT_RA:
553 break;
554 default:
555 return -EOPNOTSUPP;
556 }
557 return 0;
558}
559
560static int nft_exthdr_dump_common(struct sk_buff *skb, const struct nft_exthdr *priv)
561{
562 if (nla_put_u8(skb, NFTA_EXTHDR_TYPE, priv->type))
563 goto nla_put_failure;
564 if (nla_put_be32(skb, NFTA_EXTHDR_OFFSET, htonl(priv->offset)))
565 goto nla_put_failure;
566 if (nla_put_be32(skb, NFTA_EXTHDR_LEN, htonl(priv->len)))
567 goto nla_put_failure;
568 if (nla_put_be32(skb, NFTA_EXTHDR_FLAGS, htonl(priv->flags)))
569 goto nla_put_failure;
570 if (nla_put_be32(skb, NFTA_EXTHDR_OP, htonl(priv->op)))
571 goto nla_put_failure;
572 return 0;
573
574nla_put_failure:
575 return -1;
576}
577
578static int nft_exthdr_dump(struct sk_buff *skb,
579 const struct nft_expr *expr, bool reset)
580{
581 const struct nft_exthdr *priv = nft_expr_priv(expr);
582
583 if (nft_dump_register(skb, NFTA_EXTHDR_DREG, priv->dreg))
584 return -1;
585
586 return nft_exthdr_dump_common(skb, priv);
587}
588
589static int nft_exthdr_dump_set(struct sk_buff *skb,
590 const struct nft_expr *expr, bool reset)
591{
592 const struct nft_exthdr *priv = nft_expr_priv(expr);
593
594 if (nft_dump_register(skb, NFTA_EXTHDR_SREG, priv->sreg))
595 return -1;
596
597 return nft_exthdr_dump_common(skb, priv);
598}
599
600static int nft_exthdr_dump_strip(struct sk_buff *skb,
601 const struct nft_expr *expr, bool reset)
602{
603 const struct nft_exthdr *priv = nft_expr_priv(expr);
604
605 return nft_exthdr_dump_common(skb, priv);
606}
607
608static bool nft_exthdr_reduce(struct nft_regs_track *track,
609 const struct nft_expr *expr)
610{
611 const struct nft_exthdr *priv = nft_expr_priv(expr);
612 const struct nft_exthdr *exthdr;
613
614 if (!nft_reg_track_cmp(track, expr, priv->dreg)) {
615 nft_reg_track_update(track, expr, priv->dreg, priv->len);
616 return false;
617 }
618
619 exthdr = nft_expr_priv(track->regs[priv->dreg].selector);
620 if (priv->type != exthdr->type ||
621 priv->op != exthdr->op ||
622 priv->flags != exthdr->flags ||
623 priv->offset != exthdr->offset ||
624 priv->len != exthdr->len) {
625 nft_reg_track_update(track, expr, priv->dreg, priv->len);
626 return false;
627 }
628
629 if (!track->regs[priv->dreg].bitwise)
630 return true;
631
632 return nft_expr_reduce_bitwise(track, expr);
633}
634
635static const struct nft_expr_ops nft_exthdr_ipv6_ops = {
636 .type = &nft_exthdr_type,
637 .size = NFT_EXPR_SIZE(sizeof(struct nft_exthdr)),
638 .eval = nft_exthdr_ipv6_eval,
639 .init = nft_exthdr_init,
640 .dump = nft_exthdr_dump,
641 .reduce = nft_exthdr_reduce,
642};
643
644static const struct nft_expr_ops nft_exthdr_ipv4_ops = {
645 .type = &nft_exthdr_type,
646 .size = NFT_EXPR_SIZE(sizeof(struct nft_exthdr)),
647 .eval = nft_exthdr_ipv4_eval,
648 .init = nft_exthdr_ipv4_init,
649 .dump = nft_exthdr_dump,
650 .reduce = nft_exthdr_reduce,
651};
652
653static const struct nft_expr_ops nft_exthdr_tcp_ops = {
654 .type = &nft_exthdr_type,
655 .size = NFT_EXPR_SIZE(sizeof(struct nft_exthdr)),
656 .eval = nft_exthdr_tcp_eval,
657 .init = nft_exthdr_init,
658 .dump = nft_exthdr_dump,
659 .reduce = nft_exthdr_reduce,
660};
661
662static const struct nft_expr_ops nft_exthdr_tcp_set_ops = {
663 .type = &nft_exthdr_type,
664 .size = NFT_EXPR_SIZE(sizeof(struct nft_exthdr)),
665 .eval = nft_exthdr_tcp_set_eval,
666 .init = nft_exthdr_tcp_set_init,
667 .dump = nft_exthdr_dump_set,
668 .reduce = NFT_REDUCE_READONLY,
669};
670
671static const struct nft_expr_ops nft_exthdr_tcp_strip_ops = {
672 .type = &nft_exthdr_type,
673 .size = NFT_EXPR_SIZE(sizeof(struct nft_exthdr)),
674 .eval = nft_exthdr_tcp_strip_eval,
675 .init = nft_exthdr_tcp_strip_init,
676 .dump = nft_exthdr_dump_strip,
677 .reduce = NFT_REDUCE_READONLY,
678};
679
680static const struct nft_expr_ops nft_exthdr_sctp_ops = {
681 .type = &nft_exthdr_type,
682 .size = NFT_EXPR_SIZE(sizeof(struct nft_exthdr)),
683 .eval = nft_exthdr_sctp_eval,
684 .init = nft_exthdr_init,
685 .dump = nft_exthdr_dump,
686 .reduce = nft_exthdr_reduce,
687};
688
689static const struct nft_expr_ops *
690nft_exthdr_select_ops(const struct nft_ctx *ctx,
691 const struct nlattr * const tb[])
692{
693 u32 op;
694
695 if (!tb[NFTA_EXTHDR_OP])
696 return &nft_exthdr_ipv6_ops;
697
698 if (tb[NFTA_EXTHDR_SREG] && tb[NFTA_EXTHDR_DREG])
699 return ERR_PTR(-EOPNOTSUPP);
700
701 op = ntohl(nla_get_be32(tb[NFTA_EXTHDR_OP]));
702 switch (op) {
703 case NFT_EXTHDR_OP_TCPOPT:
704 if (tb[NFTA_EXTHDR_SREG])
705 return &nft_exthdr_tcp_set_ops;
706 if (tb[NFTA_EXTHDR_DREG])
707 return &nft_exthdr_tcp_ops;
708 return &nft_exthdr_tcp_strip_ops;
709 case NFT_EXTHDR_OP_IPV6:
710 if (tb[NFTA_EXTHDR_DREG])
711 return &nft_exthdr_ipv6_ops;
712 break;
713 case NFT_EXTHDR_OP_IPV4:
714 if (ctx->family != NFPROTO_IPV6) {
715 if (tb[NFTA_EXTHDR_DREG])
716 return &nft_exthdr_ipv4_ops;
717 }
718 break;
719 case NFT_EXTHDR_OP_SCTP:
720 if (tb[NFTA_EXTHDR_DREG])
721 return &nft_exthdr_sctp_ops;
722 break;
723 }
724
725 return ERR_PTR(-EOPNOTSUPP);
726}
727
728struct nft_expr_type nft_exthdr_type __read_mostly = {
729 .name = "exthdr",
730 .select_ops = nft_exthdr_select_ops,
731 .policy = nft_exthdr_policy,
732 .maxattr = NFTA_EXTHDR_MAX,
733 .owner = THIS_MODULE,
734};