Loading...
1// SPDX-License-Identifier: GPL-2.0-only
2/*
3 * Copyright (c) 2008-2009 Patrick McHardy <kaber@trash.net>
4 * Copyright (c) 2016 Pablo Neira Ayuso <pablo@netfilter.org>
5 *
6 * Development of this code funded by Astaro AG (http://www.astaro.com/)
7 */
8
9#include <linux/kernel.h>
10#include <linux/if_vlan.h>
11#include <linux/init.h>
12#include <linux/module.h>
13#include <linux/netlink.h>
14#include <linux/netfilter.h>
15#include <linux/netfilter/nf_tables.h>
16#include <net/netfilter/nf_tables_core.h>
17#include <net/netfilter/nf_tables.h>
18#include <net/netfilter/nf_tables_offload.h>
19/* For layer 4 checksum field offset. */
20#include <linux/tcp.h>
21#include <linux/udp.h>
22#include <linux/icmpv6.h>
23#include <linux/ip.h>
24#include <linux/ipv6.h>
25#include <net/sctp/checksum.h>
26
27static bool nft_payload_rebuild_vlan_hdr(const struct sk_buff *skb, int mac_off,
28 struct vlan_ethhdr *veth)
29{
30 if (skb_copy_bits(skb, mac_off, veth, ETH_HLEN))
31 return false;
32
33 veth->h_vlan_proto = skb->vlan_proto;
34 veth->h_vlan_TCI = htons(skb_vlan_tag_get(skb));
35 veth->h_vlan_encapsulated_proto = skb->protocol;
36
37 return true;
38}
39
40/* add vlan header into the user buffer for if tag was removed by offloads */
41static bool
42nft_payload_copy_vlan(u32 *d, const struct sk_buff *skb, u8 offset, u8 len)
43{
44 int mac_off = skb_mac_header(skb) - skb->data;
45 u8 *vlanh, *dst_u8 = (u8 *) d;
46 struct vlan_ethhdr veth;
47 u8 vlan_hlen = 0;
48
49 if ((skb->protocol == htons(ETH_P_8021AD) ||
50 skb->protocol == htons(ETH_P_8021Q)) &&
51 offset >= VLAN_ETH_HLEN && offset < VLAN_ETH_HLEN + VLAN_HLEN)
52 vlan_hlen += VLAN_HLEN;
53
54 vlanh = (u8 *) &veth;
55 if (offset < VLAN_ETH_HLEN + vlan_hlen) {
56 u8 ethlen = len;
57
58 if (vlan_hlen &&
59 skb_copy_bits(skb, mac_off, &veth, VLAN_ETH_HLEN) < 0)
60 return false;
61 else if (!nft_payload_rebuild_vlan_hdr(skb, mac_off, &veth))
62 return false;
63
64 if (offset + len > VLAN_ETH_HLEN + vlan_hlen)
65 ethlen -= offset + len - VLAN_ETH_HLEN + vlan_hlen;
66
67 memcpy(dst_u8, vlanh + offset - vlan_hlen, ethlen);
68
69 len -= ethlen;
70 if (len == 0)
71 return true;
72
73 dst_u8 += ethlen;
74 offset = ETH_HLEN + vlan_hlen;
75 } else {
76 offset -= VLAN_HLEN + vlan_hlen;
77 }
78
79 return skb_copy_bits(skb, offset + mac_off, dst_u8, len) == 0;
80}
81
82void nft_payload_eval(const struct nft_expr *expr,
83 struct nft_regs *regs,
84 const struct nft_pktinfo *pkt)
85{
86 const struct nft_payload *priv = nft_expr_priv(expr);
87 const struct sk_buff *skb = pkt->skb;
88 u32 *dest = ®s->data[priv->dreg];
89 int offset;
90
91 if (priv->len % NFT_REG32_SIZE)
92 dest[priv->len / NFT_REG32_SIZE] = 0;
93
94 switch (priv->base) {
95 case NFT_PAYLOAD_LL_HEADER:
96 if (!skb_mac_header_was_set(skb))
97 goto err;
98
99 if (skb_vlan_tag_present(skb)) {
100 if (!nft_payload_copy_vlan(dest, skb,
101 priv->offset, priv->len))
102 goto err;
103 return;
104 }
105 offset = skb_mac_header(skb) - skb->data;
106 break;
107 case NFT_PAYLOAD_NETWORK_HEADER:
108 offset = skb_network_offset(skb);
109 break;
110 case NFT_PAYLOAD_TRANSPORT_HEADER:
111 if (!pkt->tprot_set)
112 goto err;
113 offset = nft_thoff(pkt);
114 break;
115 default:
116 BUG();
117 }
118 offset += priv->offset;
119
120 if (skb_copy_bits(skb, offset, dest, priv->len) < 0)
121 goto err;
122 return;
123err:
124 regs->verdict.code = NFT_BREAK;
125}
126
127static const struct nla_policy nft_payload_policy[NFTA_PAYLOAD_MAX + 1] = {
128 [NFTA_PAYLOAD_SREG] = { .type = NLA_U32 },
129 [NFTA_PAYLOAD_DREG] = { .type = NLA_U32 },
130 [NFTA_PAYLOAD_BASE] = { .type = NLA_U32 },
131 [NFTA_PAYLOAD_OFFSET] = { .type = NLA_U32 },
132 [NFTA_PAYLOAD_LEN] = { .type = NLA_U32 },
133 [NFTA_PAYLOAD_CSUM_TYPE] = { .type = NLA_U32 },
134 [NFTA_PAYLOAD_CSUM_OFFSET] = { .type = NLA_U32 },
135 [NFTA_PAYLOAD_CSUM_FLAGS] = { .type = NLA_U32 },
136};
137
138static int nft_payload_init(const struct nft_ctx *ctx,
139 const struct nft_expr *expr,
140 const struct nlattr * const tb[])
141{
142 struct nft_payload *priv = nft_expr_priv(expr);
143
144 priv->base = ntohl(nla_get_be32(tb[NFTA_PAYLOAD_BASE]));
145 priv->offset = ntohl(nla_get_be32(tb[NFTA_PAYLOAD_OFFSET]));
146 priv->len = ntohl(nla_get_be32(tb[NFTA_PAYLOAD_LEN]));
147
148 return nft_parse_register_store(ctx, tb[NFTA_PAYLOAD_DREG],
149 &priv->dreg, NULL, NFT_DATA_VALUE,
150 priv->len);
151}
152
153static int nft_payload_dump(struct sk_buff *skb, const struct nft_expr *expr)
154{
155 const struct nft_payload *priv = nft_expr_priv(expr);
156
157 if (nft_dump_register(skb, NFTA_PAYLOAD_DREG, priv->dreg) ||
158 nla_put_be32(skb, NFTA_PAYLOAD_BASE, htonl(priv->base)) ||
159 nla_put_be32(skb, NFTA_PAYLOAD_OFFSET, htonl(priv->offset)) ||
160 nla_put_be32(skb, NFTA_PAYLOAD_LEN, htonl(priv->len)))
161 goto nla_put_failure;
162 return 0;
163
164nla_put_failure:
165 return -1;
166}
167
168static bool nft_payload_offload_mask(struct nft_offload_reg *reg,
169 u32 priv_len, u32 field_len)
170{
171 unsigned int remainder, delta, k;
172 struct nft_data mask = {};
173 __be32 remainder_mask;
174
175 if (priv_len == field_len) {
176 memset(®->mask, 0xff, priv_len);
177 return true;
178 } else if (priv_len > field_len) {
179 return false;
180 }
181
182 memset(&mask, 0xff, field_len);
183 remainder = priv_len % sizeof(u32);
184 if (remainder) {
185 k = priv_len / sizeof(u32);
186 delta = field_len - priv_len;
187 remainder_mask = htonl(~((1 << (delta * BITS_PER_BYTE)) - 1));
188 mask.data[k] = (__force u32)remainder_mask;
189 }
190
191 memcpy(®->mask, &mask, field_len);
192
193 return true;
194}
195
196static int nft_payload_offload_ll(struct nft_offload_ctx *ctx,
197 struct nft_flow_rule *flow,
198 const struct nft_payload *priv)
199{
200 struct nft_offload_reg *reg = &ctx->regs[priv->dreg];
201
202 switch (priv->offset) {
203 case offsetof(struct ethhdr, h_source):
204 if (!nft_payload_offload_mask(reg, priv->len, ETH_ALEN))
205 return -EOPNOTSUPP;
206
207 NFT_OFFLOAD_MATCH(FLOW_DISSECTOR_KEY_ETH_ADDRS, eth_addrs,
208 src, ETH_ALEN, reg);
209 break;
210 case offsetof(struct ethhdr, h_dest):
211 if (!nft_payload_offload_mask(reg, priv->len, ETH_ALEN))
212 return -EOPNOTSUPP;
213
214 NFT_OFFLOAD_MATCH(FLOW_DISSECTOR_KEY_ETH_ADDRS, eth_addrs,
215 dst, ETH_ALEN, reg);
216 break;
217 case offsetof(struct ethhdr, h_proto):
218 if (!nft_payload_offload_mask(reg, priv->len, sizeof(__be16)))
219 return -EOPNOTSUPP;
220
221 NFT_OFFLOAD_MATCH(FLOW_DISSECTOR_KEY_BASIC, basic,
222 n_proto, sizeof(__be16), reg);
223 nft_offload_set_dependency(ctx, NFT_OFFLOAD_DEP_NETWORK);
224 break;
225 case offsetof(struct vlan_ethhdr, h_vlan_TCI):
226 if (!nft_payload_offload_mask(reg, priv->len, sizeof(__be16)))
227 return -EOPNOTSUPP;
228
229 NFT_OFFLOAD_MATCH_FLAGS(FLOW_DISSECTOR_KEY_VLAN, vlan,
230 vlan_tci, sizeof(__be16), reg,
231 NFT_OFFLOAD_F_NETWORK2HOST);
232 break;
233 case offsetof(struct vlan_ethhdr, h_vlan_encapsulated_proto):
234 if (!nft_payload_offload_mask(reg, priv->len, sizeof(__be16)))
235 return -EOPNOTSUPP;
236
237 NFT_OFFLOAD_MATCH(FLOW_DISSECTOR_KEY_VLAN, vlan,
238 vlan_tpid, sizeof(__be16), reg);
239 nft_offload_set_dependency(ctx, NFT_OFFLOAD_DEP_NETWORK);
240 break;
241 case offsetof(struct vlan_ethhdr, h_vlan_TCI) + sizeof(struct vlan_hdr):
242 if (!nft_payload_offload_mask(reg, priv->len, sizeof(__be16)))
243 return -EOPNOTSUPP;
244
245 NFT_OFFLOAD_MATCH_FLAGS(FLOW_DISSECTOR_KEY_CVLAN, cvlan,
246 vlan_tci, sizeof(__be16), reg,
247 NFT_OFFLOAD_F_NETWORK2HOST);
248 break;
249 case offsetof(struct vlan_ethhdr, h_vlan_encapsulated_proto) +
250 sizeof(struct vlan_hdr):
251 if (!nft_payload_offload_mask(reg, priv->len, sizeof(__be16)))
252 return -EOPNOTSUPP;
253
254 NFT_OFFLOAD_MATCH(FLOW_DISSECTOR_KEY_CVLAN, cvlan,
255 vlan_tpid, sizeof(__be16), reg);
256 nft_offload_set_dependency(ctx, NFT_OFFLOAD_DEP_NETWORK);
257 break;
258 default:
259 return -EOPNOTSUPP;
260 }
261
262 return 0;
263}
264
265static int nft_payload_offload_ip(struct nft_offload_ctx *ctx,
266 struct nft_flow_rule *flow,
267 const struct nft_payload *priv)
268{
269 struct nft_offload_reg *reg = &ctx->regs[priv->dreg];
270
271 switch (priv->offset) {
272 case offsetof(struct iphdr, saddr):
273 if (!nft_payload_offload_mask(reg, priv->len,
274 sizeof(struct in_addr)))
275 return -EOPNOTSUPP;
276
277 NFT_OFFLOAD_MATCH(FLOW_DISSECTOR_KEY_IPV4_ADDRS, ipv4, src,
278 sizeof(struct in_addr), reg);
279 nft_flow_rule_set_addr_type(flow, FLOW_DISSECTOR_KEY_IPV4_ADDRS);
280 break;
281 case offsetof(struct iphdr, daddr):
282 if (!nft_payload_offload_mask(reg, priv->len,
283 sizeof(struct in_addr)))
284 return -EOPNOTSUPP;
285
286 NFT_OFFLOAD_MATCH(FLOW_DISSECTOR_KEY_IPV4_ADDRS, ipv4, dst,
287 sizeof(struct in_addr), reg);
288 nft_flow_rule_set_addr_type(flow, FLOW_DISSECTOR_KEY_IPV4_ADDRS);
289 break;
290 case offsetof(struct iphdr, protocol):
291 if (!nft_payload_offload_mask(reg, priv->len, sizeof(__u8)))
292 return -EOPNOTSUPP;
293
294 NFT_OFFLOAD_MATCH(FLOW_DISSECTOR_KEY_BASIC, basic, ip_proto,
295 sizeof(__u8), reg);
296 nft_offload_set_dependency(ctx, NFT_OFFLOAD_DEP_TRANSPORT);
297 break;
298 default:
299 return -EOPNOTSUPP;
300 }
301
302 return 0;
303}
304
305static int nft_payload_offload_ip6(struct nft_offload_ctx *ctx,
306 struct nft_flow_rule *flow,
307 const struct nft_payload *priv)
308{
309 struct nft_offload_reg *reg = &ctx->regs[priv->dreg];
310
311 switch (priv->offset) {
312 case offsetof(struct ipv6hdr, saddr):
313 if (!nft_payload_offload_mask(reg, priv->len,
314 sizeof(struct in6_addr)))
315 return -EOPNOTSUPP;
316
317 NFT_OFFLOAD_MATCH(FLOW_DISSECTOR_KEY_IPV6_ADDRS, ipv6, src,
318 sizeof(struct in6_addr), reg);
319 nft_flow_rule_set_addr_type(flow, FLOW_DISSECTOR_KEY_IPV6_ADDRS);
320 break;
321 case offsetof(struct ipv6hdr, daddr):
322 if (!nft_payload_offload_mask(reg, priv->len,
323 sizeof(struct in6_addr)))
324 return -EOPNOTSUPP;
325
326 NFT_OFFLOAD_MATCH(FLOW_DISSECTOR_KEY_IPV6_ADDRS, ipv6, dst,
327 sizeof(struct in6_addr), reg);
328 nft_flow_rule_set_addr_type(flow, FLOW_DISSECTOR_KEY_IPV6_ADDRS);
329 break;
330 case offsetof(struct ipv6hdr, nexthdr):
331 if (!nft_payload_offload_mask(reg, priv->len, sizeof(__u8)))
332 return -EOPNOTSUPP;
333
334 NFT_OFFLOAD_MATCH(FLOW_DISSECTOR_KEY_BASIC, basic, ip_proto,
335 sizeof(__u8), reg);
336 nft_offload_set_dependency(ctx, NFT_OFFLOAD_DEP_TRANSPORT);
337 break;
338 default:
339 return -EOPNOTSUPP;
340 }
341
342 return 0;
343}
344
345static int nft_payload_offload_nh(struct nft_offload_ctx *ctx,
346 struct nft_flow_rule *flow,
347 const struct nft_payload *priv)
348{
349 int err;
350
351 switch (ctx->dep.l3num) {
352 case htons(ETH_P_IP):
353 err = nft_payload_offload_ip(ctx, flow, priv);
354 break;
355 case htons(ETH_P_IPV6):
356 err = nft_payload_offload_ip6(ctx, flow, priv);
357 break;
358 default:
359 return -EOPNOTSUPP;
360 }
361
362 return err;
363}
364
365static int nft_payload_offload_tcp(struct nft_offload_ctx *ctx,
366 struct nft_flow_rule *flow,
367 const struct nft_payload *priv)
368{
369 struct nft_offload_reg *reg = &ctx->regs[priv->dreg];
370
371 switch (priv->offset) {
372 case offsetof(struct tcphdr, source):
373 if (!nft_payload_offload_mask(reg, priv->len, sizeof(__be16)))
374 return -EOPNOTSUPP;
375
376 NFT_OFFLOAD_MATCH(FLOW_DISSECTOR_KEY_PORTS, tp, src,
377 sizeof(__be16), reg);
378 break;
379 case offsetof(struct tcphdr, dest):
380 if (!nft_payload_offload_mask(reg, priv->len, sizeof(__be16)))
381 return -EOPNOTSUPP;
382
383 NFT_OFFLOAD_MATCH(FLOW_DISSECTOR_KEY_PORTS, tp, dst,
384 sizeof(__be16), reg);
385 break;
386 default:
387 return -EOPNOTSUPP;
388 }
389
390 return 0;
391}
392
393static int nft_payload_offload_udp(struct nft_offload_ctx *ctx,
394 struct nft_flow_rule *flow,
395 const struct nft_payload *priv)
396{
397 struct nft_offload_reg *reg = &ctx->regs[priv->dreg];
398
399 switch (priv->offset) {
400 case offsetof(struct udphdr, source):
401 if (!nft_payload_offload_mask(reg, priv->len, sizeof(__be16)))
402 return -EOPNOTSUPP;
403
404 NFT_OFFLOAD_MATCH(FLOW_DISSECTOR_KEY_PORTS, tp, src,
405 sizeof(__be16), reg);
406 break;
407 case offsetof(struct udphdr, dest):
408 if (!nft_payload_offload_mask(reg, priv->len, sizeof(__be16)))
409 return -EOPNOTSUPP;
410
411 NFT_OFFLOAD_MATCH(FLOW_DISSECTOR_KEY_PORTS, tp, dst,
412 sizeof(__be16), reg);
413 break;
414 default:
415 return -EOPNOTSUPP;
416 }
417
418 return 0;
419}
420
421static int nft_payload_offload_th(struct nft_offload_ctx *ctx,
422 struct nft_flow_rule *flow,
423 const struct nft_payload *priv)
424{
425 int err;
426
427 switch (ctx->dep.protonum) {
428 case IPPROTO_TCP:
429 err = nft_payload_offload_tcp(ctx, flow, priv);
430 break;
431 case IPPROTO_UDP:
432 err = nft_payload_offload_udp(ctx, flow, priv);
433 break;
434 default:
435 return -EOPNOTSUPP;
436 }
437
438 return err;
439}
440
441static int nft_payload_offload(struct nft_offload_ctx *ctx,
442 struct nft_flow_rule *flow,
443 const struct nft_expr *expr)
444{
445 const struct nft_payload *priv = nft_expr_priv(expr);
446 int err;
447
448 switch (priv->base) {
449 case NFT_PAYLOAD_LL_HEADER:
450 err = nft_payload_offload_ll(ctx, flow, priv);
451 break;
452 case NFT_PAYLOAD_NETWORK_HEADER:
453 err = nft_payload_offload_nh(ctx, flow, priv);
454 break;
455 case NFT_PAYLOAD_TRANSPORT_HEADER:
456 err = nft_payload_offload_th(ctx, flow, priv);
457 break;
458 default:
459 err = -EOPNOTSUPP;
460 break;
461 }
462 return err;
463}
464
465static const struct nft_expr_ops nft_payload_ops = {
466 .type = &nft_payload_type,
467 .size = NFT_EXPR_SIZE(sizeof(struct nft_payload)),
468 .eval = nft_payload_eval,
469 .init = nft_payload_init,
470 .dump = nft_payload_dump,
471 .offload = nft_payload_offload,
472};
473
474const struct nft_expr_ops nft_payload_fast_ops = {
475 .type = &nft_payload_type,
476 .size = NFT_EXPR_SIZE(sizeof(struct nft_payload)),
477 .eval = nft_payload_eval,
478 .init = nft_payload_init,
479 .dump = nft_payload_dump,
480 .offload = nft_payload_offload,
481};
482
483static inline void nft_csum_replace(__sum16 *sum, __wsum fsum, __wsum tsum)
484{
485 *sum = csum_fold(csum_add(csum_sub(~csum_unfold(*sum), fsum), tsum));
486 if (*sum == 0)
487 *sum = CSUM_MANGLED_0;
488}
489
490static bool nft_payload_udp_checksum(struct sk_buff *skb, unsigned int thoff)
491{
492 struct udphdr *uh, _uh;
493
494 uh = skb_header_pointer(skb, thoff, sizeof(_uh), &_uh);
495 if (!uh)
496 return false;
497
498 return (__force bool)uh->check;
499}
500
501static int nft_payload_l4csum_offset(const struct nft_pktinfo *pkt,
502 struct sk_buff *skb,
503 unsigned int *l4csum_offset)
504{
505 switch (pkt->tprot) {
506 case IPPROTO_TCP:
507 *l4csum_offset = offsetof(struct tcphdr, check);
508 break;
509 case IPPROTO_UDP:
510 if (!nft_payload_udp_checksum(skb, nft_thoff(pkt)))
511 return -1;
512 fallthrough;
513 case IPPROTO_UDPLITE:
514 *l4csum_offset = offsetof(struct udphdr, check);
515 break;
516 case IPPROTO_ICMPV6:
517 *l4csum_offset = offsetof(struct icmp6hdr, icmp6_cksum);
518 break;
519 default:
520 return -1;
521 }
522
523 *l4csum_offset += nft_thoff(pkt);
524 return 0;
525}
526
527static int nft_payload_csum_sctp(struct sk_buff *skb, int offset)
528{
529 struct sctphdr *sh;
530
531 if (skb_ensure_writable(skb, offset + sizeof(*sh)))
532 return -1;
533
534 sh = (struct sctphdr *)(skb->data + offset);
535 sh->checksum = sctp_compute_cksum(skb, offset);
536 skb->ip_summed = CHECKSUM_UNNECESSARY;
537 return 0;
538}
539
540static int nft_payload_l4csum_update(const struct nft_pktinfo *pkt,
541 struct sk_buff *skb,
542 __wsum fsum, __wsum tsum)
543{
544 int l4csum_offset;
545 __sum16 sum;
546
547 /* If we cannot determine layer 4 checksum offset or this packet doesn't
548 * require layer 4 checksum recalculation, skip this packet.
549 */
550 if (nft_payload_l4csum_offset(pkt, skb, &l4csum_offset) < 0)
551 return 0;
552
553 if (skb_copy_bits(skb, l4csum_offset, &sum, sizeof(sum)) < 0)
554 return -1;
555
556 /* Checksum mangling for an arbitrary amount of bytes, based on
557 * inet_proto_csum_replace*() functions.
558 */
559 if (skb->ip_summed != CHECKSUM_PARTIAL) {
560 nft_csum_replace(&sum, fsum, tsum);
561 if (skb->ip_summed == CHECKSUM_COMPLETE) {
562 skb->csum = ~csum_add(csum_sub(~(skb->csum), fsum),
563 tsum);
564 }
565 } else {
566 sum = ~csum_fold(csum_add(csum_sub(csum_unfold(sum), fsum),
567 tsum));
568 }
569
570 if (skb_ensure_writable(skb, l4csum_offset + sizeof(sum)) ||
571 skb_store_bits(skb, l4csum_offset, &sum, sizeof(sum)) < 0)
572 return -1;
573
574 return 0;
575}
576
577static int nft_payload_csum_inet(struct sk_buff *skb, const u32 *src,
578 __wsum fsum, __wsum tsum, int csum_offset)
579{
580 __sum16 sum;
581
582 if (skb_copy_bits(skb, csum_offset, &sum, sizeof(sum)) < 0)
583 return -1;
584
585 nft_csum_replace(&sum, fsum, tsum);
586 if (skb_ensure_writable(skb, csum_offset + sizeof(sum)) ||
587 skb_store_bits(skb, csum_offset, &sum, sizeof(sum)) < 0)
588 return -1;
589
590 return 0;
591}
592
593static void nft_payload_set_eval(const struct nft_expr *expr,
594 struct nft_regs *regs,
595 const struct nft_pktinfo *pkt)
596{
597 const struct nft_payload_set *priv = nft_expr_priv(expr);
598 struct sk_buff *skb = pkt->skb;
599 const u32 *src = ®s->data[priv->sreg];
600 int offset, csum_offset;
601 __wsum fsum, tsum;
602
603 switch (priv->base) {
604 case NFT_PAYLOAD_LL_HEADER:
605 if (!skb_mac_header_was_set(skb))
606 goto err;
607 offset = skb_mac_header(skb) - skb->data;
608 break;
609 case NFT_PAYLOAD_NETWORK_HEADER:
610 offset = skb_network_offset(skb);
611 break;
612 case NFT_PAYLOAD_TRANSPORT_HEADER:
613 if (!pkt->tprot_set)
614 goto err;
615 offset = nft_thoff(pkt);
616 break;
617 default:
618 BUG();
619 }
620
621 csum_offset = offset + priv->csum_offset;
622 offset += priv->offset;
623
624 if ((priv->csum_type == NFT_PAYLOAD_CSUM_INET || priv->csum_flags) &&
625 (priv->base != NFT_PAYLOAD_TRANSPORT_HEADER ||
626 skb->ip_summed != CHECKSUM_PARTIAL)) {
627 fsum = skb_checksum(skb, offset, priv->len, 0);
628 tsum = csum_partial(src, priv->len, 0);
629
630 if (priv->csum_type == NFT_PAYLOAD_CSUM_INET &&
631 nft_payload_csum_inet(skb, src, fsum, tsum, csum_offset))
632 goto err;
633
634 if (priv->csum_flags &&
635 nft_payload_l4csum_update(pkt, skb, fsum, tsum) < 0)
636 goto err;
637 }
638
639 if (skb_ensure_writable(skb, max(offset + priv->len, 0)) ||
640 skb_store_bits(skb, offset, src, priv->len) < 0)
641 goto err;
642
643 if (priv->csum_type == NFT_PAYLOAD_CSUM_SCTP &&
644 pkt->tprot == IPPROTO_SCTP &&
645 skb->ip_summed != CHECKSUM_PARTIAL) {
646 if (nft_payload_csum_sctp(skb, nft_thoff(pkt)))
647 goto err;
648 }
649
650 return;
651err:
652 regs->verdict.code = NFT_BREAK;
653}
654
655static int nft_payload_set_init(const struct nft_ctx *ctx,
656 const struct nft_expr *expr,
657 const struct nlattr * const tb[])
658{
659 struct nft_payload_set *priv = nft_expr_priv(expr);
660
661 priv->base = ntohl(nla_get_be32(tb[NFTA_PAYLOAD_BASE]));
662 priv->offset = ntohl(nla_get_be32(tb[NFTA_PAYLOAD_OFFSET]));
663 priv->len = ntohl(nla_get_be32(tb[NFTA_PAYLOAD_LEN]));
664
665 if (tb[NFTA_PAYLOAD_CSUM_TYPE])
666 priv->csum_type =
667 ntohl(nla_get_be32(tb[NFTA_PAYLOAD_CSUM_TYPE]));
668 if (tb[NFTA_PAYLOAD_CSUM_OFFSET])
669 priv->csum_offset =
670 ntohl(nla_get_be32(tb[NFTA_PAYLOAD_CSUM_OFFSET]));
671 if (tb[NFTA_PAYLOAD_CSUM_FLAGS]) {
672 u32 flags;
673
674 flags = ntohl(nla_get_be32(tb[NFTA_PAYLOAD_CSUM_FLAGS]));
675 if (flags & ~NFT_PAYLOAD_L4CSUM_PSEUDOHDR)
676 return -EINVAL;
677
678 priv->csum_flags = flags;
679 }
680
681 switch (priv->csum_type) {
682 case NFT_PAYLOAD_CSUM_NONE:
683 case NFT_PAYLOAD_CSUM_INET:
684 break;
685 case NFT_PAYLOAD_CSUM_SCTP:
686 if (priv->base != NFT_PAYLOAD_TRANSPORT_HEADER)
687 return -EINVAL;
688
689 if (priv->csum_offset != offsetof(struct sctphdr, checksum))
690 return -EINVAL;
691 break;
692 default:
693 return -EOPNOTSUPP;
694 }
695
696 return nft_parse_register_load(tb[NFTA_PAYLOAD_SREG], &priv->sreg,
697 priv->len);
698}
699
700static int nft_payload_set_dump(struct sk_buff *skb, const struct nft_expr *expr)
701{
702 const struct nft_payload_set *priv = nft_expr_priv(expr);
703
704 if (nft_dump_register(skb, NFTA_PAYLOAD_SREG, priv->sreg) ||
705 nla_put_be32(skb, NFTA_PAYLOAD_BASE, htonl(priv->base)) ||
706 nla_put_be32(skb, NFTA_PAYLOAD_OFFSET, htonl(priv->offset)) ||
707 nla_put_be32(skb, NFTA_PAYLOAD_LEN, htonl(priv->len)) ||
708 nla_put_be32(skb, NFTA_PAYLOAD_CSUM_TYPE, htonl(priv->csum_type)) ||
709 nla_put_be32(skb, NFTA_PAYLOAD_CSUM_OFFSET,
710 htonl(priv->csum_offset)) ||
711 nla_put_be32(skb, NFTA_PAYLOAD_CSUM_FLAGS, htonl(priv->csum_flags)))
712 goto nla_put_failure;
713 return 0;
714
715nla_put_failure:
716 return -1;
717}
718
719static const struct nft_expr_ops nft_payload_set_ops = {
720 .type = &nft_payload_type,
721 .size = NFT_EXPR_SIZE(sizeof(struct nft_payload_set)),
722 .eval = nft_payload_set_eval,
723 .init = nft_payload_set_init,
724 .dump = nft_payload_set_dump,
725};
726
727static const struct nft_expr_ops *
728nft_payload_select_ops(const struct nft_ctx *ctx,
729 const struct nlattr * const tb[])
730{
731 enum nft_payload_bases base;
732 unsigned int offset, len;
733
734 if (tb[NFTA_PAYLOAD_BASE] == NULL ||
735 tb[NFTA_PAYLOAD_OFFSET] == NULL ||
736 tb[NFTA_PAYLOAD_LEN] == NULL)
737 return ERR_PTR(-EINVAL);
738
739 base = ntohl(nla_get_be32(tb[NFTA_PAYLOAD_BASE]));
740 switch (base) {
741 case NFT_PAYLOAD_LL_HEADER:
742 case NFT_PAYLOAD_NETWORK_HEADER:
743 case NFT_PAYLOAD_TRANSPORT_HEADER:
744 break;
745 default:
746 return ERR_PTR(-EOPNOTSUPP);
747 }
748
749 if (tb[NFTA_PAYLOAD_SREG] != NULL) {
750 if (tb[NFTA_PAYLOAD_DREG] != NULL)
751 return ERR_PTR(-EINVAL);
752 return &nft_payload_set_ops;
753 }
754
755 if (tb[NFTA_PAYLOAD_DREG] == NULL)
756 return ERR_PTR(-EINVAL);
757
758 offset = ntohl(nla_get_be32(tb[NFTA_PAYLOAD_OFFSET]));
759 len = ntohl(nla_get_be32(tb[NFTA_PAYLOAD_LEN]));
760
761 if (len <= 4 && is_power_of_2(len) && IS_ALIGNED(offset, len) &&
762 base != NFT_PAYLOAD_LL_HEADER)
763 return &nft_payload_fast_ops;
764 else
765 return &nft_payload_ops;
766}
767
768struct nft_expr_type nft_payload_type __read_mostly = {
769 .name = "payload",
770 .select_ops = nft_payload_select_ops,
771 .policy = nft_payload_policy,
772 .maxattr = NFTA_PAYLOAD_MAX,
773 .owner = THIS_MODULE,
774};
1// SPDX-License-Identifier: GPL-2.0-only
2/*
3 * Copyright (c) 2008-2009 Patrick McHardy <kaber@trash.net>
4 * Copyright (c) 2016 Pablo Neira Ayuso <pablo@netfilter.org>
5 *
6 * Development of this code funded by Astaro AG (http://www.astaro.com/)
7 */
8
9#include <linux/kernel.h>
10#include <linux/if_vlan.h>
11#include <linux/init.h>
12#include <linux/module.h>
13#include <linux/netlink.h>
14#include <linux/netfilter.h>
15#include <linux/netfilter/nf_tables.h>
16#include <net/netfilter/nf_tables_core.h>
17#include <net/netfilter/nf_tables.h>
18#include <net/netfilter/nf_tables_offload.h>
19/* For layer 4 checksum field offset. */
20#include <linux/tcp.h>
21#include <linux/udp.h>
22#include <net/gre.h>
23#include <linux/icmpv6.h>
24#include <linux/ip.h>
25#include <linux/ipv6.h>
26#include <net/sctp/checksum.h>
27
28static bool nft_payload_rebuild_vlan_hdr(const struct sk_buff *skb, int mac_off,
29 struct vlan_ethhdr *veth)
30{
31 if (skb_copy_bits(skb, mac_off, veth, ETH_HLEN))
32 return false;
33
34 veth->h_vlan_proto = skb->vlan_proto;
35 veth->h_vlan_TCI = htons(skb_vlan_tag_get(skb));
36 veth->h_vlan_encapsulated_proto = skb->protocol;
37
38 return true;
39}
40
41/* add vlan header into the user buffer for if tag was removed by offloads */
42static bool
43nft_payload_copy_vlan(u32 *d, const struct sk_buff *skb, u8 offset, u8 len)
44{
45 int mac_off = skb_mac_header(skb) - skb->data;
46 u8 *vlanh, *dst_u8 = (u8 *) d;
47 struct vlan_ethhdr veth;
48 u8 vlan_hlen = 0;
49
50 if ((skb->protocol == htons(ETH_P_8021AD) ||
51 skb->protocol == htons(ETH_P_8021Q)) &&
52 offset >= VLAN_ETH_HLEN && offset < VLAN_ETH_HLEN + VLAN_HLEN)
53 vlan_hlen += VLAN_HLEN;
54
55 vlanh = (u8 *) &veth;
56 if (offset < VLAN_ETH_HLEN + vlan_hlen) {
57 u8 ethlen = len;
58
59 if (vlan_hlen &&
60 skb_copy_bits(skb, mac_off, &veth, VLAN_ETH_HLEN) < 0)
61 return false;
62 else if (!nft_payload_rebuild_vlan_hdr(skb, mac_off, &veth))
63 return false;
64
65 if (offset + len > VLAN_ETH_HLEN + vlan_hlen)
66 ethlen -= offset + len - VLAN_ETH_HLEN - vlan_hlen;
67
68 memcpy(dst_u8, vlanh + offset - vlan_hlen, ethlen);
69
70 len -= ethlen;
71 if (len == 0)
72 return true;
73
74 dst_u8 += ethlen;
75 offset = ETH_HLEN + vlan_hlen;
76 } else {
77 offset -= VLAN_HLEN + vlan_hlen;
78 }
79
80 return skb_copy_bits(skb, offset + mac_off, dst_u8, len) == 0;
81}
82
83static int __nft_payload_inner_offset(struct nft_pktinfo *pkt)
84{
85 unsigned int thoff = nft_thoff(pkt);
86
87 if (!(pkt->flags & NFT_PKTINFO_L4PROTO) || pkt->fragoff)
88 return -1;
89
90 switch (pkt->tprot) {
91 case IPPROTO_UDP:
92 pkt->inneroff = thoff + sizeof(struct udphdr);
93 break;
94 case IPPROTO_TCP: {
95 struct tcphdr *th, _tcph;
96
97 th = skb_header_pointer(pkt->skb, thoff, sizeof(_tcph), &_tcph);
98 if (!th)
99 return -1;
100
101 pkt->inneroff = thoff + __tcp_hdrlen(th);
102 }
103 break;
104 case IPPROTO_GRE: {
105 u32 offset = sizeof(struct gre_base_hdr);
106 struct gre_base_hdr *gre, _gre;
107 __be16 version;
108
109 gre = skb_header_pointer(pkt->skb, thoff, sizeof(_gre), &_gre);
110 if (!gre)
111 return -1;
112
113 version = gre->flags & GRE_VERSION;
114 switch (version) {
115 case GRE_VERSION_0:
116 if (gre->flags & GRE_ROUTING)
117 return -1;
118
119 if (gre->flags & GRE_CSUM) {
120 offset += sizeof_field(struct gre_full_hdr, csum) +
121 sizeof_field(struct gre_full_hdr, reserved1);
122 }
123 if (gre->flags & GRE_KEY)
124 offset += sizeof_field(struct gre_full_hdr, key);
125
126 if (gre->flags & GRE_SEQ)
127 offset += sizeof_field(struct gre_full_hdr, seq);
128 break;
129 default:
130 return -1;
131 }
132
133 pkt->inneroff = thoff + offset;
134 }
135 break;
136 case IPPROTO_IPIP:
137 pkt->inneroff = thoff;
138 break;
139 default:
140 return -1;
141 }
142
143 pkt->flags |= NFT_PKTINFO_INNER;
144
145 return 0;
146}
147
148int nft_payload_inner_offset(const struct nft_pktinfo *pkt)
149{
150 if (!(pkt->flags & NFT_PKTINFO_INNER) &&
151 __nft_payload_inner_offset((struct nft_pktinfo *)pkt) < 0)
152 return -1;
153
154 return pkt->inneroff;
155}
156
157void nft_payload_eval(const struct nft_expr *expr,
158 struct nft_regs *regs,
159 const struct nft_pktinfo *pkt)
160{
161 const struct nft_payload *priv = nft_expr_priv(expr);
162 const struct sk_buff *skb = pkt->skb;
163 u32 *dest = ®s->data[priv->dreg];
164 int offset;
165
166 if (priv->len % NFT_REG32_SIZE)
167 dest[priv->len / NFT_REG32_SIZE] = 0;
168
169 switch (priv->base) {
170 case NFT_PAYLOAD_LL_HEADER:
171 if (!skb_mac_header_was_set(skb))
172 goto err;
173
174 if (skb_vlan_tag_present(skb)) {
175 if (!nft_payload_copy_vlan(dest, skb,
176 priv->offset, priv->len))
177 goto err;
178 return;
179 }
180 offset = skb_mac_header(skb) - skb->data;
181 break;
182 case NFT_PAYLOAD_NETWORK_HEADER:
183 offset = skb_network_offset(skb);
184 break;
185 case NFT_PAYLOAD_TRANSPORT_HEADER:
186 if (!(pkt->flags & NFT_PKTINFO_L4PROTO) || pkt->fragoff)
187 goto err;
188 offset = nft_thoff(pkt);
189 break;
190 case NFT_PAYLOAD_INNER_HEADER:
191 offset = nft_payload_inner_offset(pkt);
192 if (offset < 0)
193 goto err;
194 break;
195 default:
196 WARN_ON_ONCE(1);
197 goto err;
198 }
199 offset += priv->offset;
200
201 if (skb_copy_bits(skb, offset, dest, priv->len) < 0)
202 goto err;
203 return;
204err:
205 regs->verdict.code = NFT_BREAK;
206}
207
208static const struct nla_policy nft_payload_policy[NFTA_PAYLOAD_MAX + 1] = {
209 [NFTA_PAYLOAD_SREG] = { .type = NLA_U32 },
210 [NFTA_PAYLOAD_DREG] = { .type = NLA_U32 },
211 [NFTA_PAYLOAD_BASE] = { .type = NLA_U32 },
212 [NFTA_PAYLOAD_OFFSET] = NLA_POLICY_MAX(NLA_BE32, 255),
213 [NFTA_PAYLOAD_LEN] = NLA_POLICY_MAX(NLA_BE32, 255),
214 [NFTA_PAYLOAD_CSUM_TYPE] = { .type = NLA_U32 },
215 [NFTA_PAYLOAD_CSUM_OFFSET] = NLA_POLICY_MAX(NLA_BE32, 255),
216 [NFTA_PAYLOAD_CSUM_FLAGS] = { .type = NLA_U32 },
217};
218
219static int nft_payload_init(const struct nft_ctx *ctx,
220 const struct nft_expr *expr,
221 const struct nlattr * const tb[])
222{
223 struct nft_payload *priv = nft_expr_priv(expr);
224
225 priv->base = ntohl(nla_get_be32(tb[NFTA_PAYLOAD_BASE]));
226 priv->offset = ntohl(nla_get_be32(tb[NFTA_PAYLOAD_OFFSET]));
227 priv->len = ntohl(nla_get_be32(tb[NFTA_PAYLOAD_LEN]));
228
229 return nft_parse_register_store(ctx, tb[NFTA_PAYLOAD_DREG],
230 &priv->dreg, NULL, NFT_DATA_VALUE,
231 priv->len);
232}
233
234static int nft_payload_dump(struct sk_buff *skb,
235 const struct nft_expr *expr, bool reset)
236{
237 const struct nft_payload *priv = nft_expr_priv(expr);
238
239 if (nft_dump_register(skb, NFTA_PAYLOAD_DREG, priv->dreg) ||
240 nla_put_be32(skb, NFTA_PAYLOAD_BASE, htonl(priv->base)) ||
241 nla_put_be32(skb, NFTA_PAYLOAD_OFFSET, htonl(priv->offset)) ||
242 nla_put_be32(skb, NFTA_PAYLOAD_LEN, htonl(priv->len)))
243 goto nla_put_failure;
244 return 0;
245
246nla_put_failure:
247 return -1;
248}
249
250static bool nft_payload_reduce(struct nft_regs_track *track,
251 const struct nft_expr *expr)
252{
253 const struct nft_payload *priv = nft_expr_priv(expr);
254 const struct nft_payload *payload;
255
256 if (!nft_reg_track_cmp(track, expr, priv->dreg)) {
257 nft_reg_track_update(track, expr, priv->dreg, priv->len);
258 return false;
259 }
260
261 payload = nft_expr_priv(track->regs[priv->dreg].selector);
262 if (priv->base != payload->base ||
263 priv->offset != payload->offset ||
264 priv->len != payload->len) {
265 nft_reg_track_update(track, expr, priv->dreg, priv->len);
266 return false;
267 }
268
269 if (!track->regs[priv->dreg].bitwise)
270 return true;
271
272 return nft_expr_reduce_bitwise(track, expr);
273}
274
275static bool nft_payload_offload_mask(struct nft_offload_reg *reg,
276 u32 priv_len, u32 field_len)
277{
278 unsigned int remainder, delta, k;
279 struct nft_data mask = {};
280 __be32 remainder_mask;
281
282 if (priv_len == field_len) {
283 memset(®->mask, 0xff, priv_len);
284 return true;
285 } else if (priv_len > field_len) {
286 return false;
287 }
288
289 memset(&mask, 0xff, field_len);
290 remainder = priv_len % sizeof(u32);
291 if (remainder) {
292 k = priv_len / sizeof(u32);
293 delta = field_len - priv_len;
294 remainder_mask = htonl(~((1 << (delta * BITS_PER_BYTE)) - 1));
295 mask.data[k] = (__force u32)remainder_mask;
296 }
297
298 memcpy(®->mask, &mask, field_len);
299
300 return true;
301}
302
303static int nft_payload_offload_ll(struct nft_offload_ctx *ctx,
304 struct nft_flow_rule *flow,
305 const struct nft_payload *priv)
306{
307 struct nft_offload_reg *reg = &ctx->regs[priv->dreg];
308
309 switch (priv->offset) {
310 case offsetof(struct ethhdr, h_source):
311 if (!nft_payload_offload_mask(reg, priv->len, ETH_ALEN))
312 return -EOPNOTSUPP;
313
314 NFT_OFFLOAD_MATCH(FLOW_DISSECTOR_KEY_ETH_ADDRS, eth_addrs,
315 src, ETH_ALEN, reg);
316 break;
317 case offsetof(struct ethhdr, h_dest):
318 if (!nft_payload_offload_mask(reg, priv->len, ETH_ALEN))
319 return -EOPNOTSUPP;
320
321 NFT_OFFLOAD_MATCH(FLOW_DISSECTOR_KEY_ETH_ADDRS, eth_addrs,
322 dst, ETH_ALEN, reg);
323 break;
324 case offsetof(struct ethhdr, h_proto):
325 if (!nft_payload_offload_mask(reg, priv->len, sizeof(__be16)))
326 return -EOPNOTSUPP;
327
328 NFT_OFFLOAD_MATCH(FLOW_DISSECTOR_KEY_BASIC, basic,
329 n_proto, sizeof(__be16), reg);
330 nft_offload_set_dependency(ctx, NFT_OFFLOAD_DEP_NETWORK);
331 break;
332 case offsetof(struct vlan_ethhdr, h_vlan_TCI):
333 if (!nft_payload_offload_mask(reg, priv->len, sizeof(__be16)))
334 return -EOPNOTSUPP;
335
336 NFT_OFFLOAD_MATCH_FLAGS(FLOW_DISSECTOR_KEY_VLAN, vlan,
337 vlan_tci, sizeof(__be16), reg,
338 NFT_OFFLOAD_F_NETWORK2HOST);
339 break;
340 case offsetof(struct vlan_ethhdr, h_vlan_encapsulated_proto):
341 if (!nft_payload_offload_mask(reg, priv->len, sizeof(__be16)))
342 return -EOPNOTSUPP;
343
344 NFT_OFFLOAD_MATCH(FLOW_DISSECTOR_KEY_VLAN, vlan,
345 vlan_tpid, sizeof(__be16), reg);
346 nft_offload_set_dependency(ctx, NFT_OFFLOAD_DEP_NETWORK);
347 break;
348 case offsetof(struct vlan_ethhdr, h_vlan_TCI) + sizeof(struct vlan_hdr):
349 if (!nft_payload_offload_mask(reg, priv->len, sizeof(__be16)))
350 return -EOPNOTSUPP;
351
352 NFT_OFFLOAD_MATCH_FLAGS(FLOW_DISSECTOR_KEY_CVLAN, cvlan,
353 vlan_tci, sizeof(__be16), reg,
354 NFT_OFFLOAD_F_NETWORK2HOST);
355 break;
356 case offsetof(struct vlan_ethhdr, h_vlan_encapsulated_proto) +
357 sizeof(struct vlan_hdr):
358 if (!nft_payload_offload_mask(reg, priv->len, sizeof(__be16)))
359 return -EOPNOTSUPP;
360
361 NFT_OFFLOAD_MATCH(FLOW_DISSECTOR_KEY_CVLAN, cvlan,
362 vlan_tpid, sizeof(__be16), reg);
363 nft_offload_set_dependency(ctx, NFT_OFFLOAD_DEP_NETWORK);
364 break;
365 default:
366 return -EOPNOTSUPP;
367 }
368
369 return 0;
370}
371
372static int nft_payload_offload_ip(struct nft_offload_ctx *ctx,
373 struct nft_flow_rule *flow,
374 const struct nft_payload *priv)
375{
376 struct nft_offload_reg *reg = &ctx->regs[priv->dreg];
377
378 switch (priv->offset) {
379 case offsetof(struct iphdr, saddr):
380 if (!nft_payload_offload_mask(reg, priv->len,
381 sizeof(struct in_addr)))
382 return -EOPNOTSUPP;
383
384 NFT_OFFLOAD_MATCH(FLOW_DISSECTOR_KEY_IPV4_ADDRS, ipv4, src,
385 sizeof(struct in_addr), reg);
386 nft_flow_rule_set_addr_type(flow, FLOW_DISSECTOR_KEY_IPV4_ADDRS);
387 break;
388 case offsetof(struct iphdr, daddr):
389 if (!nft_payload_offload_mask(reg, priv->len,
390 sizeof(struct in_addr)))
391 return -EOPNOTSUPP;
392
393 NFT_OFFLOAD_MATCH(FLOW_DISSECTOR_KEY_IPV4_ADDRS, ipv4, dst,
394 sizeof(struct in_addr), reg);
395 nft_flow_rule_set_addr_type(flow, FLOW_DISSECTOR_KEY_IPV4_ADDRS);
396 break;
397 case offsetof(struct iphdr, protocol):
398 if (!nft_payload_offload_mask(reg, priv->len, sizeof(__u8)))
399 return -EOPNOTSUPP;
400
401 NFT_OFFLOAD_MATCH(FLOW_DISSECTOR_KEY_BASIC, basic, ip_proto,
402 sizeof(__u8), reg);
403 nft_offload_set_dependency(ctx, NFT_OFFLOAD_DEP_TRANSPORT);
404 break;
405 default:
406 return -EOPNOTSUPP;
407 }
408
409 return 0;
410}
411
412static int nft_payload_offload_ip6(struct nft_offload_ctx *ctx,
413 struct nft_flow_rule *flow,
414 const struct nft_payload *priv)
415{
416 struct nft_offload_reg *reg = &ctx->regs[priv->dreg];
417
418 switch (priv->offset) {
419 case offsetof(struct ipv6hdr, saddr):
420 if (!nft_payload_offload_mask(reg, priv->len,
421 sizeof(struct in6_addr)))
422 return -EOPNOTSUPP;
423
424 NFT_OFFLOAD_MATCH(FLOW_DISSECTOR_KEY_IPV6_ADDRS, ipv6, src,
425 sizeof(struct in6_addr), reg);
426 nft_flow_rule_set_addr_type(flow, FLOW_DISSECTOR_KEY_IPV6_ADDRS);
427 break;
428 case offsetof(struct ipv6hdr, daddr):
429 if (!nft_payload_offload_mask(reg, priv->len,
430 sizeof(struct in6_addr)))
431 return -EOPNOTSUPP;
432
433 NFT_OFFLOAD_MATCH(FLOW_DISSECTOR_KEY_IPV6_ADDRS, ipv6, dst,
434 sizeof(struct in6_addr), reg);
435 nft_flow_rule_set_addr_type(flow, FLOW_DISSECTOR_KEY_IPV6_ADDRS);
436 break;
437 case offsetof(struct ipv6hdr, nexthdr):
438 if (!nft_payload_offload_mask(reg, priv->len, sizeof(__u8)))
439 return -EOPNOTSUPP;
440
441 NFT_OFFLOAD_MATCH(FLOW_DISSECTOR_KEY_BASIC, basic, ip_proto,
442 sizeof(__u8), reg);
443 nft_offload_set_dependency(ctx, NFT_OFFLOAD_DEP_TRANSPORT);
444 break;
445 default:
446 return -EOPNOTSUPP;
447 }
448
449 return 0;
450}
451
452static int nft_payload_offload_nh(struct nft_offload_ctx *ctx,
453 struct nft_flow_rule *flow,
454 const struct nft_payload *priv)
455{
456 int err;
457
458 switch (ctx->dep.l3num) {
459 case htons(ETH_P_IP):
460 err = nft_payload_offload_ip(ctx, flow, priv);
461 break;
462 case htons(ETH_P_IPV6):
463 err = nft_payload_offload_ip6(ctx, flow, priv);
464 break;
465 default:
466 return -EOPNOTSUPP;
467 }
468
469 return err;
470}
471
472static int nft_payload_offload_tcp(struct nft_offload_ctx *ctx,
473 struct nft_flow_rule *flow,
474 const struct nft_payload *priv)
475{
476 struct nft_offload_reg *reg = &ctx->regs[priv->dreg];
477
478 switch (priv->offset) {
479 case offsetof(struct tcphdr, source):
480 if (!nft_payload_offload_mask(reg, priv->len, sizeof(__be16)))
481 return -EOPNOTSUPP;
482
483 NFT_OFFLOAD_MATCH(FLOW_DISSECTOR_KEY_PORTS, tp, src,
484 sizeof(__be16), reg);
485 break;
486 case offsetof(struct tcphdr, dest):
487 if (!nft_payload_offload_mask(reg, priv->len, sizeof(__be16)))
488 return -EOPNOTSUPP;
489
490 NFT_OFFLOAD_MATCH(FLOW_DISSECTOR_KEY_PORTS, tp, dst,
491 sizeof(__be16), reg);
492 break;
493 default:
494 return -EOPNOTSUPP;
495 }
496
497 return 0;
498}
499
500static int nft_payload_offload_udp(struct nft_offload_ctx *ctx,
501 struct nft_flow_rule *flow,
502 const struct nft_payload *priv)
503{
504 struct nft_offload_reg *reg = &ctx->regs[priv->dreg];
505
506 switch (priv->offset) {
507 case offsetof(struct udphdr, source):
508 if (!nft_payload_offload_mask(reg, priv->len, sizeof(__be16)))
509 return -EOPNOTSUPP;
510
511 NFT_OFFLOAD_MATCH(FLOW_DISSECTOR_KEY_PORTS, tp, src,
512 sizeof(__be16), reg);
513 break;
514 case offsetof(struct udphdr, dest):
515 if (!nft_payload_offload_mask(reg, priv->len, sizeof(__be16)))
516 return -EOPNOTSUPP;
517
518 NFT_OFFLOAD_MATCH(FLOW_DISSECTOR_KEY_PORTS, tp, dst,
519 sizeof(__be16), reg);
520 break;
521 default:
522 return -EOPNOTSUPP;
523 }
524
525 return 0;
526}
527
528static int nft_payload_offload_th(struct nft_offload_ctx *ctx,
529 struct nft_flow_rule *flow,
530 const struct nft_payload *priv)
531{
532 int err;
533
534 switch (ctx->dep.protonum) {
535 case IPPROTO_TCP:
536 err = nft_payload_offload_tcp(ctx, flow, priv);
537 break;
538 case IPPROTO_UDP:
539 err = nft_payload_offload_udp(ctx, flow, priv);
540 break;
541 default:
542 return -EOPNOTSUPP;
543 }
544
545 return err;
546}
547
548static int nft_payload_offload(struct nft_offload_ctx *ctx,
549 struct nft_flow_rule *flow,
550 const struct nft_expr *expr)
551{
552 const struct nft_payload *priv = nft_expr_priv(expr);
553 int err;
554
555 switch (priv->base) {
556 case NFT_PAYLOAD_LL_HEADER:
557 err = nft_payload_offload_ll(ctx, flow, priv);
558 break;
559 case NFT_PAYLOAD_NETWORK_HEADER:
560 err = nft_payload_offload_nh(ctx, flow, priv);
561 break;
562 case NFT_PAYLOAD_TRANSPORT_HEADER:
563 err = nft_payload_offload_th(ctx, flow, priv);
564 break;
565 default:
566 err = -EOPNOTSUPP;
567 break;
568 }
569 return err;
570}
571
572static const struct nft_expr_ops nft_payload_ops = {
573 .type = &nft_payload_type,
574 .size = NFT_EXPR_SIZE(sizeof(struct nft_payload)),
575 .eval = nft_payload_eval,
576 .init = nft_payload_init,
577 .dump = nft_payload_dump,
578 .reduce = nft_payload_reduce,
579 .offload = nft_payload_offload,
580};
581
582const struct nft_expr_ops nft_payload_fast_ops = {
583 .type = &nft_payload_type,
584 .size = NFT_EXPR_SIZE(sizeof(struct nft_payload)),
585 .eval = nft_payload_eval,
586 .init = nft_payload_init,
587 .dump = nft_payload_dump,
588 .reduce = nft_payload_reduce,
589 .offload = nft_payload_offload,
590};
591
592void nft_payload_inner_eval(const struct nft_expr *expr, struct nft_regs *regs,
593 const struct nft_pktinfo *pkt,
594 struct nft_inner_tun_ctx *tun_ctx)
595{
596 const struct nft_payload *priv = nft_expr_priv(expr);
597 const struct sk_buff *skb = pkt->skb;
598 u32 *dest = ®s->data[priv->dreg];
599 int offset;
600
601 if (priv->len % NFT_REG32_SIZE)
602 dest[priv->len / NFT_REG32_SIZE] = 0;
603
604 switch (priv->base) {
605 case NFT_PAYLOAD_TUN_HEADER:
606 if (!(tun_ctx->flags & NFT_PAYLOAD_CTX_INNER_TUN))
607 goto err;
608
609 offset = tun_ctx->inner_tunoff;
610 break;
611 case NFT_PAYLOAD_LL_HEADER:
612 if (!(tun_ctx->flags & NFT_PAYLOAD_CTX_INNER_LL))
613 goto err;
614
615 offset = tun_ctx->inner_lloff;
616 break;
617 case NFT_PAYLOAD_NETWORK_HEADER:
618 if (!(tun_ctx->flags & NFT_PAYLOAD_CTX_INNER_NH))
619 goto err;
620
621 offset = tun_ctx->inner_nhoff;
622 break;
623 case NFT_PAYLOAD_TRANSPORT_HEADER:
624 if (!(tun_ctx->flags & NFT_PAYLOAD_CTX_INNER_TH))
625 goto err;
626
627 offset = tun_ctx->inner_thoff;
628 break;
629 default:
630 WARN_ON_ONCE(1);
631 goto err;
632 }
633 offset += priv->offset;
634
635 if (skb_copy_bits(skb, offset, dest, priv->len) < 0)
636 goto err;
637
638 return;
639err:
640 regs->verdict.code = NFT_BREAK;
641}
642
643static int nft_payload_inner_init(const struct nft_ctx *ctx,
644 const struct nft_expr *expr,
645 const struct nlattr * const tb[])
646{
647 struct nft_payload *priv = nft_expr_priv(expr);
648 u32 base;
649
650 base = ntohl(nla_get_be32(tb[NFTA_PAYLOAD_BASE]));
651 switch (base) {
652 case NFT_PAYLOAD_TUN_HEADER:
653 case NFT_PAYLOAD_LL_HEADER:
654 case NFT_PAYLOAD_NETWORK_HEADER:
655 case NFT_PAYLOAD_TRANSPORT_HEADER:
656 break;
657 default:
658 return -EOPNOTSUPP;
659 }
660
661 priv->base = base;
662 priv->offset = ntohl(nla_get_be32(tb[NFTA_PAYLOAD_OFFSET]));
663 priv->len = ntohl(nla_get_be32(tb[NFTA_PAYLOAD_LEN]));
664
665 return nft_parse_register_store(ctx, tb[NFTA_PAYLOAD_DREG],
666 &priv->dreg, NULL, NFT_DATA_VALUE,
667 priv->len);
668}
669
670static const struct nft_expr_ops nft_payload_inner_ops = {
671 .type = &nft_payload_type,
672 .size = NFT_EXPR_SIZE(sizeof(struct nft_payload)),
673 .init = nft_payload_inner_init,
674 .dump = nft_payload_dump,
675 /* direct call to nft_payload_inner_eval(). */
676};
677
678static inline void nft_csum_replace(__sum16 *sum, __wsum fsum, __wsum tsum)
679{
680 *sum = csum_fold(csum_add(csum_sub(~csum_unfold(*sum), fsum), tsum));
681 if (*sum == 0)
682 *sum = CSUM_MANGLED_0;
683}
684
685static bool nft_payload_udp_checksum(struct sk_buff *skb, unsigned int thoff)
686{
687 struct udphdr *uh, _uh;
688
689 uh = skb_header_pointer(skb, thoff, sizeof(_uh), &_uh);
690 if (!uh)
691 return false;
692
693 return (__force bool)uh->check;
694}
695
696static int nft_payload_l4csum_offset(const struct nft_pktinfo *pkt,
697 struct sk_buff *skb,
698 unsigned int *l4csum_offset)
699{
700 if (pkt->fragoff)
701 return -1;
702
703 switch (pkt->tprot) {
704 case IPPROTO_TCP:
705 *l4csum_offset = offsetof(struct tcphdr, check);
706 break;
707 case IPPROTO_UDP:
708 if (!nft_payload_udp_checksum(skb, nft_thoff(pkt)))
709 return -1;
710 fallthrough;
711 case IPPROTO_UDPLITE:
712 *l4csum_offset = offsetof(struct udphdr, check);
713 break;
714 case IPPROTO_ICMPV6:
715 *l4csum_offset = offsetof(struct icmp6hdr, icmp6_cksum);
716 break;
717 default:
718 return -1;
719 }
720
721 *l4csum_offset += nft_thoff(pkt);
722 return 0;
723}
724
725static int nft_payload_csum_sctp(struct sk_buff *skb, int offset)
726{
727 struct sctphdr *sh;
728
729 if (skb_ensure_writable(skb, offset + sizeof(*sh)))
730 return -1;
731
732 sh = (struct sctphdr *)(skb->data + offset);
733 sh->checksum = sctp_compute_cksum(skb, offset);
734 skb->ip_summed = CHECKSUM_UNNECESSARY;
735 return 0;
736}
737
738static int nft_payload_l4csum_update(const struct nft_pktinfo *pkt,
739 struct sk_buff *skb,
740 __wsum fsum, __wsum tsum)
741{
742 int l4csum_offset;
743 __sum16 sum;
744
745 /* If we cannot determine layer 4 checksum offset or this packet doesn't
746 * require layer 4 checksum recalculation, skip this packet.
747 */
748 if (nft_payload_l4csum_offset(pkt, skb, &l4csum_offset) < 0)
749 return 0;
750
751 if (skb_copy_bits(skb, l4csum_offset, &sum, sizeof(sum)) < 0)
752 return -1;
753
754 /* Checksum mangling for an arbitrary amount of bytes, based on
755 * inet_proto_csum_replace*() functions.
756 */
757 if (skb->ip_summed != CHECKSUM_PARTIAL) {
758 nft_csum_replace(&sum, fsum, tsum);
759 if (skb->ip_summed == CHECKSUM_COMPLETE) {
760 skb->csum = ~csum_add(csum_sub(~(skb->csum), fsum),
761 tsum);
762 }
763 } else {
764 sum = ~csum_fold(csum_add(csum_sub(csum_unfold(sum), fsum),
765 tsum));
766 }
767
768 if (skb_ensure_writable(skb, l4csum_offset + sizeof(sum)) ||
769 skb_store_bits(skb, l4csum_offset, &sum, sizeof(sum)) < 0)
770 return -1;
771
772 return 0;
773}
774
775static int nft_payload_csum_inet(struct sk_buff *skb, const u32 *src,
776 __wsum fsum, __wsum tsum, int csum_offset)
777{
778 __sum16 sum;
779
780 if (skb_copy_bits(skb, csum_offset, &sum, sizeof(sum)) < 0)
781 return -1;
782
783 nft_csum_replace(&sum, fsum, tsum);
784 if (skb_ensure_writable(skb, csum_offset + sizeof(sum)) ||
785 skb_store_bits(skb, csum_offset, &sum, sizeof(sum)) < 0)
786 return -1;
787
788 return 0;
789}
790
791struct nft_payload_set {
792 enum nft_payload_bases base:8;
793 u8 offset;
794 u8 len;
795 u8 sreg;
796 u8 csum_type;
797 u8 csum_offset;
798 u8 csum_flags;
799};
800
801static void nft_payload_set_eval(const struct nft_expr *expr,
802 struct nft_regs *regs,
803 const struct nft_pktinfo *pkt)
804{
805 const struct nft_payload_set *priv = nft_expr_priv(expr);
806 struct sk_buff *skb = pkt->skb;
807 const u32 *src = ®s->data[priv->sreg];
808 int offset, csum_offset;
809 __wsum fsum, tsum;
810
811 switch (priv->base) {
812 case NFT_PAYLOAD_LL_HEADER:
813 if (!skb_mac_header_was_set(skb))
814 goto err;
815 offset = skb_mac_header(skb) - skb->data;
816 break;
817 case NFT_PAYLOAD_NETWORK_HEADER:
818 offset = skb_network_offset(skb);
819 break;
820 case NFT_PAYLOAD_TRANSPORT_HEADER:
821 if (!(pkt->flags & NFT_PKTINFO_L4PROTO) || pkt->fragoff)
822 goto err;
823 offset = nft_thoff(pkt);
824 break;
825 case NFT_PAYLOAD_INNER_HEADER:
826 offset = nft_payload_inner_offset(pkt);
827 if (offset < 0)
828 goto err;
829 break;
830 default:
831 WARN_ON_ONCE(1);
832 goto err;
833 }
834
835 csum_offset = offset + priv->csum_offset;
836 offset += priv->offset;
837
838 if ((priv->csum_type == NFT_PAYLOAD_CSUM_INET || priv->csum_flags) &&
839 ((priv->base != NFT_PAYLOAD_TRANSPORT_HEADER &&
840 priv->base != NFT_PAYLOAD_INNER_HEADER) ||
841 skb->ip_summed != CHECKSUM_PARTIAL)) {
842 fsum = skb_checksum(skb, offset, priv->len, 0);
843 tsum = csum_partial(src, priv->len, 0);
844
845 if (priv->csum_type == NFT_PAYLOAD_CSUM_INET &&
846 nft_payload_csum_inet(skb, src, fsum, tsum, csum_offset))
847 goto err;
848
849 if (priv->csum_flags &&
850 nft_payload_l4csum_update(pkt, skb, fsum, tsum) < 0)
851 goto err;
852 }
853
854 if (skb_ensure_writable(skb, max(offset + priv->len, 0)) ||
855 skb_store_bits(skb, offset, src, priv->len) < 0)
856 goto err;
857
858 if (priv->csum_type == NFT_PAYLOAD_CSUM_SCTP &&
859 pkt->tprot == IPPROTO_SCTP &&
860 skb->ip_summed != CHECKSUM_PARTIAL) {
861 if (pkt->fragoff == 0 &&
862 nft_payload_csum_sctp(skb, nft_thoff(pkt)))
863 goto err;
864 }
865
866 return;
867err:
868 regs->verdict.code = NFT_BREAK;
869}
870
871static int nft_payload_set_init(const struct nft_ctx *ctx,
872 const struct nft_expr *expr,
873 const struct nlattr * const tb[])
874{
875 struct nft_payload_set *priv = nft_expr_priv(expr);
876 u32 csum_offset, csum_type = NFT_PAYLOAD_CSUM_NONE;
877 int err;
878
879 priv->base = ntohl(nla_get_be32(tb[NFTA_PAYLOAD_BASE]));
880 priv->offset = ntohl(nla_get_be32(tb[NFTA_PAYLOAD_OFFSET]));
881 priv->len = ntohl(nla_get_be32(tb[NFTA_PAYLOAD_LEN]));
882
883 if (tb[NFTA_PAYLOAD_CSUM_TYPE])
884 csum_type = ntohl(nla_get_be32(tb[NFTA_PAYLOAD_CSUM_TYPE]));
885 if (tb[NFTA_PAYLOAD_CSUM_OFFSET]) {
886 err = nft_parse_u32_check(tb[NFTA_PAYLOAD_CSUM_OFFSET], U8_MAX,
887 &csum_offset);
888 if (err < 0)
889 return err;
890
891 priv->csum_offset = csum_offset;
892 }
893 if (tb[NFTA_PAYLOAD_CSUM_FLAGS]) {
894 u32 flags;
895
896 flags = ntohl(nla_get_be32(tb[NFTA_PAYLOAD_CSUM_FLAGS]));
897 if (flags & ~NFT_PAYLOAD_L4CSUM_PSEUDOHDR)
898 return -EINVAL;
899
900 priv->csum_flags = flags;
901 }
902
903 switch (csum_type) {
904 case NFT_PAYLOAD_CSUM_NONE:
905 case NFT_PAYLOAD_CSUM_INET:
906 break;
907 case NFT_PAYLOAD_CSUM_SCTP:
908 if (priv->base != NFT_PAYLOAD_TRANSPORT_HEADER)
909 return -EINVAL;
910
911 if (priv->csum_offset != offsetof(struct sctphdr, checksum))
912 return -EINVAL;
913 break;
914 default:
915 return -EOPNOTSUPP;
916 }
917 priv->csum_type = csum_type;
918
919 return nft_parse_register_load(tb[NFTA_PAYLOAD_SREG], &priv->sreg,
920 priv->len);
921}
922
923static int nft_payload_set_dump(struct sk_buff *skb,
924 const struct nft_expr *expr, bool reset)
925{
926 const struct nft_payload_set *priv = nft_expr_priv(expr);
927
928 if (nft_dump_register(skb, NFTA_PAYLOAD_SREG, priv->sreg) ||
929 nla_put_be32(skb, NFTA_PAYLOAD_BASE, htonl(priv->base)) ||
930 nla_put_be32(skb, NFTA_PAYLOAD_OFFSET, htonl(priv->offset)) ||
931 nla_put_be32(skb, NFTA_PAYLOAD_LEN, htonl(priv->len)) ||
932 nla_put_be32(skb, NFTA_PAYLOAD_CSUM_TYPE, htonl(priv->csum_type)) ||
933 nla_put_be32(skb, NFTA_PAYLOAD_CSUM_OFFSET,
934 htonl(priv->csum_offset)) ||
935 nla_put_be32(skb, NFTA_PAYLOAD_CSUM_FLAGS, htonl(priv->csum_flags)))
936 goto nla_put_failure;
937 return 0;
938
939nla_put_failure:
940 return -1;
941}
942
943static bool nft_payload_set_reduce(struct nft_regs_track *track,
944 const struct nft_expr *expr)
945{
946 int i;
947
948 for (i = 0; i < NFT_REG32_NUM; i++) {
949 if (!track->regs[i].selector)
950 continue;
951
952 if (track->regs[i].selector->ops != &nft_payload_ops &&
953 track->regs[i].selector->ops != &nft_payload_fast_ops)
954 continue;
955
956 __nft_reg_track_cancel(track, i);
957 }
958
959 return false;
960}
961
962static const struct nft_expr_ops nft_payload_set_ops = {
963 .type = &nft_payload_type,
964 .size = NFT_EXPR_SIZE(sizeof(struct nft_payload_set)),
965 .eval = nft_payload_set_eval,
966 .init = nft_payload_set_init,
967 .dump = nft_payload_set_dump,
968 .reduce = nft_payload_set_reduce,
969};
970
971static const struct nft_expr_ops *
972nft_payload_select_ops(const struct nft_ctx *ctx,
973 const struct nlattr * const tb[])
974{
975 enum nft_payload_bases base;
976 unsigned int offset, len;
977 int err;
978
979 if (tb[NFTA_PAYLOAD_BASE] == NULL ||
980 tb[NFTA_PAYLOAD_OFFSET] == NULL ||
981 tb[NFTA_PAYLOAD_LEN] == NULL)
982 return ERR_PTR(-EINVAL);
983
984 base = ntohl(nla_get_be32(tb[NFTA_PAYLOAD_BASE]));
985 switch (base) {
986 case NFT_PAYLOAD_LL_HEADER:
987 case NFT_PAYLOAD_NETWORK_HEADER:
988 case NFT_PAYLOAD_TRANSPORT_HEADER:
989 case NFT_PAYLOAD_INNER_HEADER:
990 break;
991 default:
992 return ERR_PTR(-EOPNOTSUPP);
993 }
994
995 if (tb[NFTA_PAYLOAD_SREG] != NULL) {
996 if (tb[NFTA_PAYLOAD_DREG] != NULL)
997 return ERR_PTR(-EINVAL);
998 return &nft_payload_set_ops;
999 }
1000
1001 if (tb[NFTA_PAYLOAD_DREG] == NULL)
1002 return ERR_PTR(-EINVAL);
1003
1004 err = nft_parse_u32_check(tb[NFTA_PAYLOAD_OFFSET], U8_MAX, &offset);
1005 if (err < 0)
1006 return ERR_PTR(err);
1007
1008 err = nft_parse_u32_check(tb[NFTA_PAYLOAD_LEN], U8_MAX, &len);
1009 if (err < 0)
1010 return ERR_PTR(err);
1011
1012 if (len <= 4 && is_power_of_2(len) && IS_ALIGNED(offset, len) &&
1013 base != NFT_PAYLOAD_LL_HEADER && base != NFT_PAYLOAD_INNER_HEADER)
1014 return &nft_payload_fast_ops;
1015 else
1016 return &nft_payload_ops;
1017}
1018
1019struct nft_expr_type nft_payload_type __read_mostly = {
1020 .name = "payload",
1021 .select_ops = nft_payload_select_ops,
1022 .inner_ops = &nft_payload_inner_ops,
1023 .policy = nft_payload_policy,
1024 .maxattr = NFTA_PAYLOAD_MAX,
1025 .owner = THIS_MODULE,
1026};