Loading...
1// SPDX-License-Identifier: (LGPL-2.1 OR BSD-2-Clause)
2/* Copyright (c) 2018 Facebook */
3
4#include <stdlib.h>
5#include <memory.h>
6#include <unistd.h>
7#include <arpa/inet.h>
8#include <linux/bpf.h>
9#include <linux/if_ether.h>
10#include <linux/pkt_cls.h>
11#include <linux/rtnetlink.h>
12#include <linux/netdev.h>
13#include <sys/socket.h>
14#include <errno.h>
15#include <time.h>
16
17#include "bpf.h"
18#include "libbpf.h"
19#include "libbpf_internal.h"
20#include "nlattr.h"
21
22#ifndef SOL_NETLINK
23#define SOL_NETLINK 270
24#endif
25
26typedef int (*libbpf_dump_nlmsg_t)(void *cookie, void *msg, struct nlattr **tb);
27
28typedef int (*__dump_nlmsg_t)(struct nlmsghdr *nlmsg, libbpf_dump_nlmsg_t,
29 void *cookie);
30
31struct xdp_link_info {
32 __u32 prog_id;
33 __u32 drv_prog_id;
34 __u32 hw_prog_id;
35 __u32 skb_prog_id;
36 __u8 attach_mode;
37};
38
39struct xdp_id_md {
40 int ifindex;
41 __u32 flags;
42 struct xdp_link_info info;
43 __u64 feature_flags;
44};
45
46struct xdp_features_md {
47 int ifindex;
48 __u32 xdp_zc_max_segs;
49 __u64 flags;
50};
51
52static int libbpf_netlink_open(__u32 *nl_pid, int proto)
53{
54 struct sockaddr_nl sa;
55 socklen_t addrlen;
56 int one = 1, ret;
57 int sock;
58
59 memset(&sa, 0, sizeof(sa));
60 sa.nl_family = AF_NETLINK;
61
62 sock = socket(AF_NETLINK, SOCK_RAW | SOCK_CLOEXEC, proto);
63 if (sock < 0)
64 return -errno;
65
66 if (setsockopt(sock, SOL_NETLINK, NETLINK_EXT_ACK,
67 &one, sizeof(one)) < 0) {
68 pr_warn("Netlink error reporting not supported\n");
69 }
70
71 if (bind(sock, (struct sockaddr *)&sa, sizeof(sa)) < 0) {
72 ret = -errno;
73 goto cleanup;
74 }
75
76 addrlen = sizeof(sa);
77 if (getsockname(sock, (struct sockaddr *)&sa, &addrlen) < 0) {
78 ret = -errno;
79 goto cleanup;
80 }
81
82 if (addrlen != sizeof(sa)) {
83 ret = -LIBBPF_ERRNO__INTERNAL;
84 goto cleanup;
85 }
86
87 *nl_pid = sa.nl_pid;
88 return sock;
89
90cleanup:
91 close(sock);
92 return ret;
93}
94
95static void libbpf_netlink_close(int sock)
96{
97 close(sock);
98}
99
100enum {
101 NL_CONT,
102 NL_NEXT,
103 NL_DONE,
104};
105
106static int netlink_recvmsg(int sock, struct msghdr *mhdr, int flags)
107{
108 int len;
109
110 do {
111 len = recvmsg(sock, mhdr, flags);
112 } while (len < 0 && (errno == EINTR || errno == EAGAIN));
113
114 if (len < 0)
115 return -errno;
116 return len;
117}
118
119static int alloc_iov(struct iovec *iov, int len)
120{
121 void *nbuf;
122
123 nbuf = realloc(iov->iov_base, len);
124 if (!nbuf)
125 return -ENOMEM;
126
127 iov->iov_base = nbuf;
128 iov->iov_len = len;
129 return 0;
130}
131
132static int libbpf_netlink_recv(int sock, __u32 nl_pid, int seq,
133 __dump_nlmsg_t _fn, libbpf_dump_nlmsg_t fn,
134 void *cookie)
135{
136 struct iovec iov = {};
137 struct msghdr mhdr = {
138 .msg_iov = &iov,
139 .msg_iovlen = 1,
140 };
141 bool multipart = true;
142 struct nlmsgerr *err;
143 struct nlmsghdr *nh;
144 int len, ret;
145
146 ret = alloc_iov(&iov, 4096);
147 if (ret)
148 goto done;
149
150 while (multipart) {
151start:
152 multipart = false;
153 len = netlink_recvmsg(sock, &mhdr, MSG_PEEK | MSG_TRUNC);
154 if (len < 0) {
155 ret = len;
156 goto done;
157 }
158
159 if (len > iov.iov_len) {
160 ret = alloc_iov(&iov, len);
161 if (ret)
162 goto done;
163 }
164
165 len = netlink_recvmsg(sock, &mhdr, 0);
166 if (len < 0) {
167 ret = len;
168 goto done;
169 }
170
171 if (len == 0)
172 break;
173
174 for (nh = (struct nlmsghdr *)iov.iov_base; NLMSG_OK(nh, len);
175 nh = NLMSG_NEXT(nh, len)) {
176 if (nh->nlmsg_pid != nl_pid) {
177 ret = -LIBBPF_ERRNO__WRNGPID;
178 goto done;
179 }
180 if (nh->nlmsg_seq != seq) {
181 ret = -LIBBPF_ERRNO__INVSEQ;
182 goto done;
183 }
184 if (nh->nlmsg_flags & NLM_F_MULTI)
185 multipart = true;
186 switch (nh->nlmsg_type) {
187 case NLMSG_ERROR:
188 err = (struct nlmsgerr *)NLMSG_DATA(nh);
189 if (!err->error)
190 continue;
191 ret = err->error;
192 libbpf_nla_dump_errormsg(nh);
193 goto done;
194 case NLMSG_DONE:
195 ret = 0;
196 goto done;
197 default:
198 break;
199 }
200 if (_fn) {
201 ret = _fn(nh, fn, cookie);
202 switch (ret) {
203 case NL_CONT:
204 break;
205 case NL_NEXT:
206 goto start;
207 case NL_DONE:
208 ret = 0;
209 goto done;
210 default:
211 goto done;
212 }
213 }
214 }
215 }
216 ret = 0;
217done:
218 free(iov.iov_base);
219 return ret;
220}
221
222static int libbpf_netlink_send_recv(struct libbpf_nla_req *req,
223 int proto, __dump_nlmsg_t parse_msg,
224 libbpf_dump_nlmsg_t parse_attr,
225 void *cookie)
226{
227 __u32 nl_pid = 0;
228 int sock, ret;
229
230 sock = libbpf_netlink_open(&nl_pid, proto);
231 if (sock < 0)
232 return sock;
233
234 req->nh.nlmsg_pid = 0;
235 req->nh.nlmsg_seq = time(NULL);
236
237 if (send(sock, req, req->nh.nlmsg_len, 0) < 0) {
238 ret = -errno;
239 goto out;
240 }
241
242 ret = libbpf_netlink_recv(sock, nl_pid, req->nh.nlmsg_seq,
243 parse_msg, parse_attr, cookie);
244out:
245 libbpf_netlink_close(sock);
246 return ret;
247}
248
249static int parse_genl_family_id(struct nlmsghdr *nh, libbpf_dump_nlmsg_t fn,
250 void *cookie)
251{
252 struct genlmsghdr *gnl = NLMSG_DATA(nh);
253 struct nlattr *na = (struct nlattr *)((void *)gnl + GENL_HDRLEN);
254 struct nlattr *tb[CTRL_ATTR_FAMILY_ID + 1];
255 __u16 *id = cookie;
256
257 libbpf_nla_parse(tb, CTRL_ATTR_FAMILY_ID, na,
258 NLMSG_PAYLOAD(nh, sizeof(*gnl)), NULL);
259 if (!tb[CTRL_ATTR_FAMILY_ID])
260 return NL_CONT;
261
262 *id = libbpf_nla_getattr_u16(tb[CTRL_ATTR_FAMILY_ID]);
263 return NL_DONE;
264}
265
266static int libbpf_netlink_resolve_genl_family_id(const char *name,
267 __u16 len, __u16 *id)
268{
269 struct libbpf_nla_req req = {
270 .nh.nlmsg_len = NLMSG_LENGTH(GENL_HDRLEN),
271 .nh.nlmsg_type = GENL_ID_CTRL,
272 .nh.nlmsg_flags = NLM_F_REQUEST,
273 .gnl.cmd = CTRL_CMD_GETFAMILY,
274 .gnl.version = 2,
275 };
276 int err;
277
278 err = nlattr_add(&req, CTRL_ATTR_FAMILY_NAME, name, len);
279 if (err < 0)
280 return err;
281
282 return libbpf_netlink_send_recv(&req, NETLINK_GENERIC,
283 parse_genl_family_id, NULL, id);
284}
285
286static int __bpf_set_link_xdp_fd_replace(int ifindex, int fd, int old_fd,
287 __u32 flags)
288{
289 struct nlattr *nla;
290 int ret;
291 struct libbpf_nla_req req;
292
293 memset(&req, 0, sizeof(req));
294 req.nh.nlmsg_len = NLMSG_LENGTH(sizeof(struct ifinfomsg));
295 req.nh.nlmsg_flags = NLM_F_REQUEST | NLM_F_ACK;
296 req.nh.nlmsg_type = RTM_SETLINK;
297 req.ifinfo.ifi_family = AF_UNSPEC;
298 req.ifinfo.ifi_index = ifindex;
299
300 nla = nlattr_begin_nested(&req, IFLA_XDP);
301 if (!nla)
302 return -EMSGSIZE;
303 ret = nlattr_add(&req, IFLA_XDP_FD, &fd, sizeof(fd));
304 if (ret < 0)
305 return ret;
306 if (flags) {
307 ret = nlattr_add(&req, IFLA_XDP_FLAGS, &flags, sizeof(flags));
308 if (ret < 0)
309 return ret;
310 }
311 if (flags & XDP_FLAGS_REPLACE) {
312 ret = nlattr_add(&req, IFLA_XDP_EXPECTED_FD, &old_fd,
313 sizeof(old_fd));
314 if (ret < 0)
315 return ret;
316 }
317 nlattr_end_nested(&req, nla);
318
319 return libbpf_netlink_send_recv(&req, NETLINK_ROUTE, NULL, NULL, NULL);
320}
321
322int bpf_xdp_attach(int ifindex, int prog_fd, __u32 flags, const struct bpf_xdp_attach_opts *opts)
323{
324 int old_prog_fd, err;
325
326 if (!OPTS_VALID(opts, bpf_xdp_attach_opts))
327 return libbpf_err(-EINVAL);
328
329 old_prog_fd = OPTS_GET(opts, old_prog_fd, 0);
330 if (old_prog_fd)
331 flags |= XDP_FLAGS_REPLACE;
332 else
333 old_prog_fd = -1;
334
335 err = __bpf_set_link_xdp_fd_replace(ifindex, prog_fd, old_prog_fd, flags);
336 return libbpf_err(err);
337}
338
339int bpf_xdp_detach(int ifindex, __u32 flags, const struct bpf_xdp_attach_opts *opts)
340{
341 return bpf_xdp_attach(ifindex, -1, flags, opts);
342}
343
344static int __dump_link_nlmsg(struct nlmsghdr *nlh,
345 libbpf_dump_nlmsg_t dump_link_nlmsg, void *cookie)
346{
347 struct nlattr *tb[IFLA_MAX + 1], *attr;
348 struct ifinfomsg *ifi = NLMSG_DATA(nlh);
349 int len;
350
351 len = nlh->nlmsg_len - NLMSG_LENGTH(sizeof(*ifi));
352 attr = (struct nlattr *) ((void *) ifi + NLMSG_ALIGN(sizeof(*ifi)));
353
354 if (libbpf_nla_parse(tb, IFLA_MAX, attr, len, NULL) != 0)
355 return -LIBBPF_ERRNO__NLPARSE;
356
357 return dump_link_nlmsg(cookie, ifi, tb);
358}
359
360static int get_xdp_info(void *cookie, void *msg, struct nlattr **tb)
361{
362 struct nlattr *xdp_tb[IFLA_XDP_MAX + 1];
363 struct xdp_id_md *xdp_id = cookie;
364 struct ifinfomsg *ifinfo = msg;
365 int ret;
366
367 if (xdp_id->ifindex && xdp_id->ifindex != ifinfo->ifi_index)
368 return 0;
369
370 if (!tb[IFLA_XDP])
371 return 0;
372
373 ret = libbpf_nla_parse_nested(xdp_tb, IFLA_XDP_MAX, tb[IFLA_XDP], NULL);
374 if (ret)
375 return ret;
376
377 if (!xdp_tb[IFLA_XDP_ATTACHED])
378 return 0;
379
380 xdp_id->info.attach_mode = libbpf_nla_getattr_u8(
381 xdp_tb[IFLA_XDP_ATTACHED]);
382
383 if (xdp_id->info.attach_mode == XDP_ATTACHED_NONE)
384 return 0;
385
386 if (xdp_tb[IFLA_XDP_PROG_ID])
387 xdp_id->info.prog_id = libbpf_nla_getattr_u32(
388 xdp_tb[IFLA_XDP_PROG_ID]);
389
390 if (xdp_tb[IFLA_XDP_SKB_PROG_ID])
391 xdp_id->info.skb_prog_id = libbpf_nla_getattr_u32(
392 xdp_tb[IFLA_XDP_SKB_PROG_ID]);
393
394 if (xdp_tb[IFLA_XDP_DRV_PROG_ID])
395 xdp_id->info.drv_prog_id = libbpf_nla_getattr_u32(
396 xdp_tb[IFLA_XDP_DRV_PROG_ID]);
397
398 if (xdp_tb[IFLA_XDP_HW_PROG_ID])
399 xdp_id->info.hw_prog_id = libbpf_nla_getattr_u32(
400 xdp_tb[IFLA_XDP_HW_PROG_ID]);
401
402 return 0;
403}
404
405static int parse_xdp_features(struct nlmsghdr *nh, libbpf_dump_nlmsg_t fn,
406 void *cookie)
407{
408 struct genlmsghdr *gnl = NLMSG_DATA(nh);
409 struct nlattr *na = (struct nlattr *)((void *)gnl + GENL_HDRLEN);
410 struct nlattr *tb[NETDEV_CMD_MAX + 1];
411 struct xdp_features_md *md = cookie;
412 __u32 ifindex;
413
414 libbpf_nla_parse(tb, NETDEV_CMD_MAX, na,
415 NLMSG_PAYLOAD(nh, sizeof(*gnl)), NULL);
416
417 if (!tb[NETDEV_A_DEV_IFINDEX] || !tb[NETDEV_A_DEV_XDP_FEATURES])
418 return NL_CONT;
419
420 ifindex = libbpf_nla_getattr_u32(tb[NETDEV_A_DEV_IFINDEX]);
421 if (ifindex != md->ifindex)
422 return NL_CONT;
423
424 md->flags = libbpf_nla_getattr_u64(tb[NETDEV_A_DEV_XDP_FEATURES]);
425 if (tb[NETDEV_A_DEV_XDP_ZC_MAX_SEGS])
426 md->xdp_zc_max_segs =
427 libbpf_nla_getattr_u32(tb[NETDEV_A_DEV_XDP_ZC_MAX_SEGS]);
428 return NL_DONE;
429}
430
431int bpf_xdp_query(int ifindex, int xdp_flags, struct bpf_xdp_query_opts *opts)
432{
433 struct libbpf_nla_req req = {
434 .nh.nlmsg_len = NLMSG_LENGTH(sizeof(struct ifinfomsg)),
435 .nh.nlmsg_type = RTM_GETLINK,
436 .nh.nlmsg_flags = NLM_F_DUMP | NLM_F_REQUEST,
437 .ifinfo.ifi_family = AF_PACKET,
438 };
439 struct xdp_id_md xdp_id = {};
440 struct xdp_features_md md = {
441 .ifindex = ifindex,
442 };
443 __u16 id;
444 int err;
445
446 if (!OPTS_VALID(opts, bpf_xdp_query_opts))
447 return libbpf_err(-EINVAL);
448
449 if (xdp_flags & ~XDP_FLAGS_MASK)
450 return libbpf_err(-EINVAL);
451
452 /* Check whether the single {HW,DRV,SKB} mode is set */
453 xdp_flags &= XDP_FLAGS_SKB_MODE | XDP_FLAGS_DRV_MODE | XDP_FLAGS_HW_MODE;
454 if (xdp_flags & (xdp_flags - 1))
455 return libbpf_err(-EINVAL);
456
457 xdp_id.ifindex = ifindex;
458 xdp_id.flags = xdp_flags;
459
460 err = libbpf_netlink_send_recv(&req, NETLINK_ROUTE, __dump_link_nlmsg,
461 get_xdp_info, &xdp_id);
462 if (err)
463 return libbpf_err(err);
464
465 OPTS_SET(opts, prog_id, xdp_id.info.prog_id);
466 OPTS_SET(opts, drv_prog_id, xdp_id.info.drv_prog_id);
467 OPTS_SET(opts, hw_prog_id, xdp_id.info.hw_prog_id);
468 OPTS_SET(opts, skb_prog_id, xdp_id.info.skb_prog_id);
469 OPTS_SET(opts, attach_mode, xdp_id.info.attach_mode);
470
471 if (!OPTS_HAS(opts, feature_flags))
472 return 0;
473
474 err = libbpf_netlink_resolve_genl_family_id("netdev", sizeof("netdev"), &id);
475 if (err < 0) {
476 if (err == -ENOENT) {
477 opts->feature_flags = 0;
478 goto skip_feature_flags;
479 }
480 return libbpf_err(err);
481 }
482
483 memset(&req, 0, sizeof(req));
484 req.nh.nlmsg_len = NLMSG_LENGTH(GENL_HDRLEN);
485 req.nh.nlmsg_flags = NLM_F_REQUEST;
486 req.nh.nlmsg_type = id;
487 req.gnl.cmd = NETDEV_CMD_DEV_GET;
488 req.gnl.version = 2;
489
490 err = nlattr_add(&req, NETDEV_A_DEV_IFINDEX, &ifindex, sizeof(ifindex));
491 if (err < 0)
492 return libbpf_err(err);
493
494 err = libbpf_netlink_send_recv(&req, NETLINK_GENERIC,
495 parse_xdp_features, NULL, &md);
496 if (err)
497 return libbpf_err(err);
498
499 opts->feature_flags = md.flags;
500 opts->xdp_zc_max_segs = md.xdp_zc_max_segs;
501
502skip_feature_flags:
503 return 0;
504}
505
506int bpf_xdp_query_id(int ifindex, int flags, __u32 *prog_id)
507{
508 LIBBPF_OPTS(bpf_xdp_query_opts, opts);
509 int ret;
510
511 ret = bpf_xdp_query(ifindex, flags, &opts);
512 if (ret)
513 return libbpf_err(ret);
514
515 flags &= XDP_FLAGS_MODES;
516
517 if (opts.attach_mode != XDP_ATTACHED_MULTI && !flags)
518 *prog_id = opts.prog_id;
519 else if (flags & XDP_FLAGS_DRV_MODE)
520 *prog_id = opts.drv_prog_id;
521 else if (flags & XDP_FLAGS_HW_MODE)
522 *prog_id = opts.hw_prog_id;
523 else if (flags & XDP_FLAGS_SKB_MODE)
524 *prog_id = opts.skb_prog_id;
525 else
526 *prog_id = 0;
527
528 return 0;
529}
530
531
532typedef int (*qdisc_config_t)(struct libbpf_nla_req *req);
533
534static int clsact_config(struct libbpf_nla_req *req)
535{
536 req->tc.tcm_parent = TC_H_CLSACT;
537 req->tc.tcm_handle = TC_H_MAKE(TC_H_CLSACT, 0);
538
539 return nlattr_add(req, TCA_KIND, "clsact", sizeof("clsact"));
540}
541
542static int attach_point_to_config(struct bpf_tc_hook *hook,
543 qdisc_config_t *config)
544{
545 switch (OPTS_GET(hook, attach_point, 0)) {
546 case BPF_TC_INGRESS:
547 case BPF_TC_EGRESS:
548 case BPF_TC_INGRESS | BPF_TC_EGRESS:
549 if (OPTS_GET(hook, parent, 0))
550 return -EINVAL;
551 *config = &clsact_config;
552 return 0;
553 case BPF_TC_CUSTOM:
554 return -EOPNOTSUPP;
555 default:
556 return -EINVAL;
557 }
558}
559
560static int tc_get_tcm_parent(enum bpf_tc_attach_point attach_point,
561 __u32 *parent)
562{
563 switch (attach_point) {
564 case BPF_TC_INGRESS:
565 case BPF_TC_EGRESS:
566 if (*parent)
567 return -EINVAL;
568 *parent = TC_H_MAKE(TC_H_CLSACT,
569 attach_point == BPF_TC_INGRESS ?
570 TC_H_MIN_INGRESS : TC_H_MIN_EGRESS);
571 break;
572 case BPF_TC_CUSTOM:
573 if (!*parent)
574 return -EINVAL;
575 break;
576 default:
577 return -EINVAL;
578 }
579 return 0;
580}
581
582static int tc_qdisc_modify(struct bpf_tc_hook *hook, int cmd, int flags)
583{
584 qdisc_config_t config;
585 int ret;
586 struct libbpf_nla_req req;
587
588 ret = attach_point_to_config(hook, &config);
589 if (ret < 0)
590 return ret;
591
592 memset(&req, 0, sizeof(req));
593 req.nh.nlmsg_len = NLMSG_LENGTH(sizeof(struct tcmsg));
594 req.nh.nlmsg_flags = NLM_F_REQUEST | NLM_F_ACK | flags;
595 req.nh.nlmsg_type = cmd;
596 req.tc.tcm_family = AF_UNSPEC;
597 req.tc.tcm_ifindex = OPTS_GET(hook, ifindex, 0);
598
599 ret = config(&req);
600 if (ret < 0)
601 return ret;
602
603 return libbpf_netlink_send_recv(&req, NETLINK_ROUTE, NULL, NULL, NULL);
604}
605
606static int tc_qdisc_create_excl(struct bpf_tc_hook *hook)
607{
608 return tc_qdisc_modify(hook, RTM_NEWQDISC, NLM_F_CREATE | NLM_F_EXCL);
609}
610
611static int tc_qdisc_delete(struct bpf_tc_hook *hook)
612{
613 return tc_qdisc_modify(hook, RTM_DELQDISC, 0);
614}
615
616int bpf_tc_hook_create(struct bpf_tc_hook *hook)
617{
618 int ret;
619
620 if (!hook || !OPTS_VALID(hook, bpf_tc_hook) ||
621 OPTS_GET(hook, ifindex, 0) <= 0)
622 return libbpf_err(-EINVAL);
623
624 ret = tc_qdisc_create_excl(hook);
625 return libbpf_err(ret);
626}
627
628static int __bpf_tc_detach(const struct bpf_tc_hook *hook,
629 const struct bpf_tc_opts *opts,
630 const bool flush);
631
632int bpf_tc_hook_destroy(struct bpf_tc_hook *hook)
633{
634 if (!hook || !OPTS_VALID(hook, bpf_tc_hook) ||
635 OPTS_GET(hook, ifindex, 0) <= 0)
636 return libbpf_err(-EINVAL);
637
638 switch (OPTS_GET(hook, attach_point, 0)) {
639 case BPF_TC_INGRESS:
640 case BPF_TC_EGRESS:
641 return libbpf_err(__bpf_tc_detach(hook, NULL, true));
642 case BPF_TC_INGRESS | BPF_TC_EGRESS:
643 return libbpf_err(tc_qdisc_delete(hook));
644 case BPF_TC_CUSTOM:
645 return libbpf_err(-EOPNOTSUPP);
646 default:
647 return libbpf_err(-EINVAL);
648 }
649}
650
651struct bpf_cb_ctx {
652 struct bpf_tc_opts *opts;
653 bool processed;
654};
655
656static int __get_tc_info(void *cookie, struct tcmsg *tc, struct nlattr **tb,
657 bool unicast)
658{
659 struct nlattr *tbb[TCA_BPF_MAX + 1];
660 struct bpf_cb_ctx *info = cookie;
661
662 if (!info || !info->opts)
663 return -EINVAL;
664 if (unicast && info->processed)
665 return -EINVAL;
666 if (!tb[TCA_OPTIONS])
667 return NL_CONT;
668
669 libbpf_nla_parse_nested(tbb, TCA_BPF_MAX, tb[TCA_OPTIONS], NULL);
670 if (!tbb[TCA_BPF_ID])
671 return -EINVAL;
672
673 OPTS_SET(info->opts, prog_id, libbpf_nla_getattr_u32(tbb[TCA_BPF_ID]));
674 OPTS_SET(info->opts, handle, tc->tcm_handle);
675 OPTS_SET(info->opts, priority, TC_H_MAJ(tc->tcm_info) >> 16);
676
677 info->processed = true;
678 return unicast ? NL_NEXT : NL_DONE;
679}
680
681static int get_tc_info(struct nlmsghdr *nh, libbpf_dump_nlmsg_t fn,
682 void *cookie)
683{
684 struct tcmsg *tc = NLMSG_DATA(nh);
685 struct nlattr *tb[TCA_MAX + 1];
686
687 libbpf_nla_parse(tb, TCA_MAX,
688 (struct nlattr *)((void *)tc + NLMSG_ALIGN(sizeof(*tc))),
689 NLMSG_PAYLOAD(nh, sizeof(*tc)), NULL);
690 if (!tb[TCA_KIND])
691 return NL_CONT;
692 return __get_tc_info(cookie, tc, tb, nh->nlmsg_flags & NLM_F_ECHO);
693}
694
695static int tc_add_fd_and_name(struct libbpf_nla_req *req, int fd)
696{
697 struct bpf_prog_info info;
698 __u32 info_len = sizeof(info);
699 char name[256];
700 int len, ret;
701
702 memset(&info, 0, info_len);
703 ret = bpf_prog_get_info_by_fd(fd, &info, &info_len);
704 if (ret < 0)
705 return ret;
706
707 ret = nlattr_add(req, TCA_BPF_FD, &fd, sizeof(fd));
708 if (ret < 0)
709 return ret;
710 len = snprintf(name, sizeof(name), "%s:[%u]", info.name, info.id);
711 if (len < 0)
712 return -errno;
713 if (len >= sizeof(name))
714 return -ENAMETOOLONG;
715 return nlattr_add(req, TCA_BPF_NAME, name, len + 1);
716}
717
718int bpf_tc_attach(const struct bpf_tc_hook *hook, struct bpf_tc_opts *opts)
719{
720 __u32 protocol, bpf_flags, handle, priority, parent, prog_id, flags;
721 int ret, ifindex, attach_point, prog_fd;
722 struct bpf_cb_ctx info = {};
723 struct libbpf_nla_req req;
724 struct nlattr *nla;
725
726 if (!hook || !opts ||
727 !OPTS_VALID(hook, bpf_tc_hook) ||
728 !OPTS_VALID(opts, bpf_tc_opts))
729 return libbpf_err(-EINVAL);
730
731 ifindex = OPTS_GET(hook, ifindex, 0);
732 parent = OPTS_GET(hook, parent, 0);
733 attach_point = OPTS_GET(hook, attach_point, 0);
734
735 handle = OPTS_GET(opts, handle, 0);
736 priority = OPTS_GET(opts, priority, 0);
737 prog_fd = OPTS_GET(opts, prog_fd, 0);
738 prog_id = OPTS_GET(opts, prog_id, 0);
739 flags = OPTS_GET(opts, flags, 0);
740
741 if (ifindex <= 0 || !prog_fd || prog_id)
742 return libbpf_err(-EINVAL);
743 if (priority > UINT16_MAX)
744 return libbpf_err(-EINVAL);
745 if (flags & ~BPF_TC_F_REPLACE)
746 return libbpf_err(-EINVAL);
747
748 flags = (flags & BPF_TC_F_REPLACE) ? NLM_F_REPLACE : NLM_F_EXCL;
749 protocol = ETH_P_ALL;
750
751 memset(&req, 0, sizeof(req));
752 req.nh.nlmsg_len = NLMSG_LENGTH(sizeof(struct tcmsg));
753 req.nh.nlmsg_flags = NLM_F_REQUEST | NLM_F_ACK | NLM_F_CREATE |
754 NLM_F_ECHO | flags;
755 req.nh.nlmsg_type = RTM_NEWTFILTER;
756 req.tc.tcm_family = AF_UNSPEC;
757 req.tc.tcm_ifindex = ifindex;
758 req.tc.tcm_handle = handle;
759 req.tc.tcm_info = TC_H_MAKE(priority << 16, htons(protocol));
760
761 ret = tc_get_tcm_parent(attach_point, &parent);
762 if (ret < 0)
763 return libbpf_err(ret);
764 req.tc.tcm_parent = parent;
765
766 ret = nlattr_add(&req, TCA_KIND, "bpf", sizeof("bpf"));
767 if (ret < 0)
768 return libbpf_err(ret);
769 nla = nlattr_begin_nested(&req, TCA_OPTIONS);
770 if (!nla)
771 return libbpf_err(-EMSGSIZE);
772 ret = tc_add_fd_and_name(&req, prog_fd);
773 if (ret < 0)
774 return libbpf_err(ret);
775 bpf_flags = TCA_BPF_FLAG_ACT_DIRECT;
776 ret = nlattr_add(&req, TCA_BPF_FLAGS, &bpf_flags, sizeof(bpf_flags));
777 if (ret < 0)
778 return libbpf_err(ret);
779 nlattr_end_nested(&req, nla);
780
781 info.opts = opts;
782
783 ret = libbpf_netlink_send_recv(&req, NETLINK_ROUTE, get_tc_info, NULL,
784 &info);
785 if (ret < 0)
786 return libbpf_err(ret);
787 if (!info.processed)
788 return libbpf_err(-ENOENT);
789 return ret;
790}
791
792static int __bpf_tc_detach(const struct bpf_tc_hook *hook,
793 const struct bpf_tc_opts *opts,
794 const bool flush)
795{
796 __u32 protocol = 0, handle, priority, parent, prog_id, flags;
797 int ret, ifindex, attach_point, prog_fd;
798 struct libbpf_nla_req req;
799
800 if (!hook ||
801 !OPTS_VALID(hook, bpf_tc_hook) ||
802 !OPTS_VALID(opts, bpf_tc_opts))
803 return -EINVAL;
804
805 ifindex = OPTS_GET(hook, ifindex, 0);
806 parent = OPTS_GET(hook, parent, 0);
807 attach_point = OPTS_GET(hook, attach_point, 0);
808
809 handle = OPTS_GET(opts, handle, 0);
810 priority = OPTS_GET(opts, priority, 0);
811 prog_fd = OPTS_GET(opts, prog_fd, 0);
812 prog_id = OPTS_GET(opts, prog_id, 0);
813 flags = OPTS_GET(opts, flags, 0);
814
815 if (ifindex <= 0 || flags || prog_fd || prog_id)
816 return -EINVAL;
817 if (priority > UINT16_MAX)
818 return -EINVAL;
819 if (!flush) {
820 if (!handle || !priority)
821 return -EINVAL;
822 protocol = ETH_P_ALL;
823 } else {
824 if (handle || priority)
825 return -EINVAL;
826 }
827
828 memset(&req, 0, sizeof(req));
829 req.nh.nlmsg_len = NLMSG_LENGTH(sizeof(struct tcmsg));
830 req.nh.nlmsg_flags = NLM_F_REQUEST | NLM_F_ACK;
831 req.nh.nlmsg_type = RTM_DELTFILTER;
832 req.tc.tcm_family = AF_UNSPEC;
833 req.tc.tcm_ifindex = ifindex;
834 if (!flush) {
835 req.tc.tcm_handle = handle;
836 req.tc.tcm_info = TC_H_MAKE(priority << 16, htons(protocol));
837 }
838
839 ret = tc_get_tcm_parent(attach_point, &parent);
840 if (ret < 0)
841 return ret;
842 req.tc.tcm_parent = parent;
843
844 if (!flush) {
845 ret = nlattr_add(&req, TCA_KIND, "bpf", sizeof("bpf"));
846 if (ret < 0)
847 return ret;
848 }
849
850 return libbpf_netlink_send_recv(&req, NETLINK_ROUTE, NULL, NULL, NULL);
851}
852
853int bpf_tc_detach(const struct bpf_tc_hook *hook,
854 const struct bpf_tc_opts *opts)
855{
856 int ret;
857
858 if (!opts)
859 return libbpf_err(-EINVAL);
860
861 ret = __bpf_tc_detach(hook, opts, false);
862 return libbpf_err(ret);
863}
864
865int bpf_tc_query(const struct bpf_tc_hook *hook, struct bpf_tc_opts *opts)
866{
867 __u32 protocol, handle, priority, parent, prog_id, flags;
868 int ret, ifindex, attach_point, prog_fd;
869 struct bpf_cb_ctx info = {};
870 struct libbpf_nla_req req;
871
872 if (!hook || !opts ||
873 !OPTS_VALID(hook, bpf_tc_hook) ||
874 !OPTS_VALID(opts, bpf_tc_opts))
875 return libbpf_err(-EINVAL);
876
877 ifindex = OPTS_GET(hook, ifindex, 0);
878 parent = OPTS_GET(hook, parent, 0);
879 attach_point = OPTS_GET(hook, attach_point, 0);
880
881 handle = OPTS_GET(opts, handle, 0);
882 priority = OPTS_GET(opts, priority, 0);
883 prog_fd = OPTS_GET(opts, prog_fd, 0);
884 prog_id = OPTS_GET(opts, prog_id, 0);
885 flags = OPTS_GET(opts, flags, 0);
886
887 if (ifindex <= 0 || flags || prog_fd || prog_id ||
888 !handle || !priority)
889 return libbpf_err(-EINVAL);
890 if (priority > UINT16_MAX)
891 return libbpf_err(-EINVAL);
892
893 protocol = ETH_P_ALL;
894
895 memset(&req, 0, sizeof(req));
896 req.nh.nlmsg_len = NLMSG_LENGTH(sizeof(struct tcmsg));
897 req.nh.nlmsg_flags = NLM_F_REQUEST;
898 req.nh.nlmsg_type = RTM_GETTFILTER;
899 req.tc.tcm_family = AF_UNSPEC;
900 req.tc.tcm_ifindex = ifindex;
901 req.tc.tcm_handle = handle;
902 req.tc.tcm_info = TC_H_MAKE(priority << 16, htons(protocol));
903
904 ret = tc_get_tcm_parent(attach_point, &parent);
905 if (ret < 0)
906 return libbpf_err(ret);
907 req.tc.tcm_parent = parent;
908
909 ret = nlattr_add(&req, TCA_KIND, "bpf", sizeof("bpf"));
910 if (ret < 0)
911 return libbpf_err(ret);
912
913 info.opts = opts;
914
915 ret = libbpf_netlink_send_recv(&req, NETLINK_ROUTE, get_tc_info, NULL,
916 &info);
917 if (ret < 0)
918 return libbpf_err(ret);
919 if (!info.processed)
920 return libbpf_err(-ENOENT);
921 return ret;
922}
1// SPDX-License-Identifier: (LGPL-2.1 OR BSD-2-Clause)
2/* Copyright (c) 2018 Facebook */
3
4#include <stdlib.h>
5#include <memory.h>
6#include <unistd.h>
7#include <arpa/inet.h>
8#include <linux/bpf.h>
9#include <linux/if_ether.h>
10#include <linux/pkt_cls.h>
11#include <linux/rtnetlink.h>
12#include <sys/socket.h>
13#include <errno.h>
14#include <time.h>
15
16#include "bpf.h"
17#include "libbpf.h"
18#include "libbpf_internal.h"
19#include "nlattr.h"
20
21#ifndef SOL_NETLINK
22#define SOL_NETLINK 270
23#endif
24
25typedef int (*libbpf_dump_nlmsg_t)(void *cookie, void *msg, struct nlattr **tb);
26
27typedef int (*__dump_nlmsg_t)(struct nlmsghdr *nlmsg, libbpf_dump_nlmsg_t,
28 void *cookie);
29
30struct xdp_id_md {
31 int ifindex;
32 __u32 flags;
33 struct xdp_link_info info;
34};
35
36static int libbpf_netlink_open(__u32 *nl_pid)
37{
38 struct sockaddr_nl sa;
39 socklen_t addrlen;
40 int one = 1, ret;
41 int sock;
42
43 memset(&sa, 0, sizeof(sa));
44 sa.nl_family = AF_NETLINK;
45
46 sock = socket(AF_NETLINK, SOCK_RAW | SOCK_CLOEXEC, NETLINK_ROUTE);
47 if (sock < 0)
48 return -errno;
49
50 if (setsockopt(sock, SOL_NETLINK, NETLINK_EXT_ACK,
51 &one, sizeof(one)) < 0) {
52 pr_warn("Netlink error reporting not supported\n");
53 }
54
55 if (bind(sock, (struct sockaddr *)&sa, sizeof(sa)) < 0) {
56 ret = -errno;
57 goto cleanup;
58 }
59
60 addrlen = sizeof(sa);
61 if (getsockname(sock, (struct sockaddr *)&sa, &addrlen) < 0) {
62 ret = -errno;
63 goto cleanup;
64 }
65
66 if (addrlen != sizeof(sa)) {
67 ret = -LIBBPF_ERRNO__INTERNAL;
68 goto cleanup;
69 }
70
71 *nl_pid = sa.nl_pid;
72 return sock;
73
74cleanup:
75 close(sock);
76 return ret;
77}
78
79static void libbpf_netlink_close(int sock)
80{
81 close(sock);
82}
83
84enum {
85 NL_CONT,
86 NL_NEXT,
87 NL_DONE,
88};
89
90static int libbpf_netlink_recv(int sock, __u32 nl_pid, int seq,
91 __dump_nlmsg_t _fn, libbpf_dump_nlmsg_t fn,
92 void *cookie)
93{
94 bool multipart = true;
95 struct nlmsgerr *err;
96 struct nlmsghdr *nh;
97 char buf[4096];
98 int len, ret;
99
100 while (multipart) {
101start:
102 multipart = false;
103 len = recv(sock, buf, sizeof(buf), 0);
104 if (len < 0) {
105 ret = -errno;
106 goto done;
107 }
108
109 if (len == 0)
110 break;
111
112 for (nh = (struct nlmsghdr *)buf; NLMSG_OK(nh, len);
113 nh = NLMSG_NEXT(nh, len)) {
114 if (nh->nlmsg_pid != nl_pid) {
115 ret = -LIBBPF_ERRNO__WRNGPID;
116 goto done;
117 }
118 if (nh->nlmsg_seq != seq) {
119 ret = -LIBBPF_ERRNO__INVSEQ;
120 goto done;
121 }
122 if (nh->nlmsg_flags & NLM_F_MULTI)
123 multipart = true;
124 switch (nh->nlmsg_type) {
125 case NLMSG_ERROR:
126 err = (struct nlmsgerr *)NLMSG_DATA(nh);
127 if (!err->error)
128 continue;
129 ret = err->error;
130 libbpf_nla_dump_errormsg(nh);
131 goto done;
132 case NLMSG_DONE:
133 return 0;
134 default:
135 break;
136 }
137 if (_fn) {
138 ret = _fn(nh, fn, cookie);
139 switch (ret) {
140 case NL_CONT:
141 break;
142 case NL_NEXT:
143 goto start;
144 case NL_DONE:
145 return 0;
146 default:
147 return ret;
148 }
149 }
150 }
151 }
152 ret = 0;
153done:
154 return ret;
155}
156
157static int libbpf_netlink_send_recv(struct libbpf_nla_req *req,
158 __dump_nlmsg_t parse_msg,
159 libbpf_dump_nlmsg_t parse_attr,
160 void *cookie)
161{
162 __u32 nl_pid = 0;
163 int sock, ret;
164
165 sock = libbpf_netlink_open(&nl_pid);
166 if (sock < 0)
167 return sock;
168
169 req->nh.nlmsg_pid = 0;
170 req->nh.nlmsg_seq = time(NULL);
171
172 if (send(sock, req, req->nh.nlmsg_len, 0) < 0) {
173 ret = -errno;
174 goto out;
175 }
176
177 ret = libbpf_netlink_recv(sock, nl_pid, req->nh.nlmsg_seq,
178 parse_msg, parse_attr, cookie);
179out:
180 libbpf_netlink_close(sock);
181 return ret;
182}
183
184static int __bpf_set_link_xdp_fd_replace(int ifindex, int fd, int old_fd,
185 __u32 flags)
186{
187 struct nlattr *nla;
188 int ret;
189 struct libbpf_nla_req req;
190
191 memset(&req, 0, sizeof(req));
192 req.nh.nlmsg_len = NLMSG_LENGTH(sizeof(struct ifinfomsg));
193 req.nh.nlmsg_flags = NLM_F_REQUEST | NLM_F_ACK;
194 req.nh.nlmsg_type = RTM_SETLINK;
195 req.ifinfo.ifi_family = AF_UNSPEC;
196 req.ifinfo.ifi_index = ifindex;
197
198 nla = nlattr_begin_nested(&req, IFLA_XDP);
199 if (!nla)
200 return -EMSGSIZE;
201 ret = nlattr_add(&req, IFLA_XDP_FD, &fd, sizeof(fd));
202 if (ret < 0)
203 return ret;
204 if (flags) {
205 ret = nlattr_add(&req, IFLA_XDP_FLAGS, &flags, sizeof(flags));
206 if (ret < 0)
207 return ret;
208 }
209 if (flags & XDP_FLAGS_REPLACE) {
210 ret = nlattr_add(&req, IFLA_XDP_EXPECTED_FD, &old_fd,
211 sizeof(old_fd));
212 if (ret < 0)
213 return ret;
214 }
215 nlattr_end_nested(&req, nla);
216
217 return libbpf_netlink_send_recv(&req, NULL, NULL, NULL);
218}
219
220int bpf_set_link_xdp_fd_opts(int ifindex, int fd, __u32 flags,
221 const struct bpf_xdp_set_link_opts *opts)
222{
223 int old_fd = -1, ret;
224
225 if (!OPTS_VALID(opts, bpf_xdp_set_link_opts))
226 return libbpf_err(-EINVAL);
227
228 if (OPTS_HAS(opts, old_fd)) {
229 old_fd = OPTS_GET(opts, old_fd, -1);
230 flags |= XDP_FLAGS_REPLACE;
231 }
232
233 ret = __bpf_set_link_xdp_fd_replace(ifindex, fd, old_fd, flags);
234 return libbpf_err(ret);
235}
236
237int bpf_set_link_xdp_fd(int ifindex, int fd, __u32 flags)
238{
239 int ret;
240
241 ret = __bpf_set_link_xdp_fd_replace(ifindex, fd, 0, flags);
242 return libbpf_err(ret);
243}
244
245static int __dump_link_nlmsg(struct nlmsghdr *nlh,
246 libbpf_dump_nlmsg_t dump_link_nlmsg, void *cookie)
247{
248 struct nlattr *tb[IFLA_MAX + 1], *attr;
249 struct ifinfomsg *ifi = NLMSG_DATA(nlh);
250 int len;
251
252 len = nlh->nlmsg_len - NLMSG_LENGTH(sizeof(*ifi));
253 attr = (struct nlattr *) ((void *) ifi + NLMSG_ALIGN(sizeof(*ifi)));
254
255 if (libbpf_nla_parse(tb, IFLA_MAX, attr, len, NULL) != 0)
256 return -LIBBPF_ERRNO__NLPARSE;
257
258 return dump_link_nlmsg(cookie, ifi, tb);
259}
260
261static int get_xdp_info(void *cookie, void *msg, struct nlattr **tb)
262{
263 struct nlattr *xdp_tb[IFLA_XDP_MAX + 1];
264 struct xdp_id_md *xdp_id = cookie;
265 struct ifinfomsg *ifinfo = msg;
266 int ret;
267
268 if (xdp_id->ifindex && xdp_id->ifindex != ifinfo->ifi_index)
269 return 0;
270
271 if (!tb[IFLA_XDP])
272 return 0;
273
274 ret = libbpf_nla_parse_nested(xdp_tb, IFLA_XDP_MAX, tb[IFLA_XDP], NULL);
275 if (ret)
276 return ret;
277
278 if (!xdp_tb[IFLA_XDP_ATTACHED])
279 return 0;
280
281 xdp_id->info.attach_mode = libbpf_nla_getattr_u8(
282 xdp_tb[IFLA_XDP_ATTACHED]);
283
284 if (xdp_id->info.attach_mode == XDP_ATTACHED_NONE)
285 return 0;
286
287 if (xdp_tb[IFLA_XDP_PROG_ID])
288 xdp_id->info.prog_id = libbpf_nla_getattr_u32(
289 xdp_tb[IFLA_XDP_PROG_ID]);
290
291 if (xdp_tb[IFLA_XDP_SKB_PROG_ID])
292 xdp_id->info.skb_prog_id = libbpf_nla_getattr_u32(
293 xdp_tb[IFLA_XDP_SKB_PROG_ID]);
294
295 if (xdp_tb[IFLA_XDP_DRV_PROG_ID])
296 xdp_id->info.drv_prog_id = libbpf_nla_getattr_u32(
297 xdp_tb[IFLA_XDP_DRV_PROG_ID]);
298
299 if (xdp_tb[IFLA_XDP_HW_PROG_ID])
300 xdp_id->info.hw_prog_id = libbpf_nla_getattr_u32(
301 xdp_tb[IFLA_XDP_HW_PROG_ID]);
302
303 return 0;
304}
305
306int bpf_get_link_xdp_info(int ifindex, struct xdp_link_info *info,
307 size_t info_size, __u32 flags)
308{
309 struct xdp_id_md xdp_id = {};
310 __u32 mask;
311 int ret;
312 struct libbpf_nla_req req = {
313 .nh.nlmsg_len = NLMSG_LENGTH(sizeof(struct ifinfomsg)),
314 .nh.nlmsg_type = RTM_GETLINK,
315 .nh.nlmsg_flags = NLM_F_DUMP | NLM_F_REQUEST,
316 .ifinfo.ifi_family = AF_PACKET,
317 };
318
319 if (flags & ~XDP_FLAGS_MASK || !info_size)
320 return libbpf_err(-EINVAL);
321
322 /* Check whether the single {HW,DRV,SKB} mode is set */
323 flags &= (XDP_FLAGS_SKB_MODE | XDP_FLAGS_DRV_MODE | XDP_FLAGS_HW_MODE);
324 mask = flags - 1;
325 if (flags && flags & mask)
326 return libbpf_err(-EINVAL);
327
328 xdp_id.ifindex = ifindex;
329 xdp_id.flags = flags;
330
331 ret = libbpf_netlink_send_recv(&req, __dump_link_nlmsg,
332 get_xdp_info, &xdp_id);
333 if (!ret) {
334 size_t sz = min(info_size, sizeof(xdp_id.info));
335
336 memcpy(info, &xdp_id.info, sz);
337 memset((void *) info + sz, 0, info_size - sz);
338 }
339
340 return libbpf_err(ret);
341}
342
343static __u32 get_xdp_id(struct xdp_link_info *info, __u32 flags)
344{
345 flags &= XDP_FLAGS_MODES;
346
347 if (info->attach_mode != XDP_ATTACHED_MULTI && !flags)
348 return info->prog_id;
349 if (flags & XDP_FLAGS_DRV_MODE)
350 return info->drv_prog_id;
351 if (flags & XDP_FLAGS_HW_MODE)
352 return info->hw_prog_id;
353 if (flags & XDP_FLAGS_SKB_MODE)
354 return info->skb_prog_id;
355
356 return 0;
357}
358
359int bpf_get_link_xdp_id(int ifindex, __u32 *prog_id, __u32 flags)
360{
361 struct xdp_link_info info;
362 int ret;
363
364 ret = bpf_get_link_xdp_info(ifindex, &info, sizeof(info), flags);
365 if (!ret)
366 *prog_id = get_xdp_id(&info, flags);
367
368 return libbpf_err(ret);
369}
370
371typedef int (*qdisc_config_t)(struct libbpf_nla_req *req);
372
373static int clsact_config(struct libbpf_nla_req *req)
374{
375 req->tc.tcm_parent = TC_H_CLSACT;
376 req->tc.tcm_handle = TC_H_MAKE(TC_H_CLSACT, 0);
377
378 return nlattr_add(req, TCA_KIND, "clsact", sizeof("clsact"));
379}
380
381static int attach_point_to_config(struct bpf_tc_hook *hook,
382 qdisc_config_t *config)
383{
384 switch (OPTS_GET(hook, attach_point, 0)) {
385 case BPF_TC_INGRESS:
386 case BPF_TC_EGRESS:
387 case BPF_TC_INGRESS | BPF_TC_EGRESS:
388 if (OPTS_GET(hook, parent, 0))
389 return -EINVAL;
390 *config = &clsact_config;
391 return 0;
392 case BPF_TC_CUSTOM:
393 return -EOPNOTSUPP;
394 default:
395 return -EINVAL;
396 }
397}
398
399static int tc_get_tcm_parent(enum bpf_tc_attach_point attach_point,
400 __u32 *parent)
401{
402 switch (attach_point) {
403 case BPF_TC_INGRESS:
404 case BPF_TC_EGRESS:
405 if (*parent)
406 return -EINVAL;
407 *parent = TC_H_MAKE(TC_H_CLSACT,
408 attach_point == BPF_TC_INGRESS ?
409 TC_H_MIN_INGRESS : TC_H_MIN_EGRESS);
410 break;
411 case BPF_TC_CUSTOM:
412 if (!*parent)
413 return -EINVAL;
414 break;
415 default:
416 return -EINVAL;
417 }
418 return 0;
419}
420
421static int tc_qdisc_modify(struct bpf_tc_hook *hook, int cmd, int flags)
422{
423 qdisc_config_t config;
424 int ret;
425 struct libbpf_nla_req req;
426
427 ret = attach_point_to_config(hook, &config);
428 if (ret < 0)
429 return ret;
430
431 memset(&req, 0, sizeof(req));
432 req.nh.nlmsg_len = NLMSG_LENGTH(sizeof(struct tcmsg));
433 req.nh.nlmsg_flags = NLM_F_REQUEST | NLM_F_ACK | flags;
434 req.nh.nlmsg_type = cmd;
435 req.tc.tcm_family = AF_UNSPEC;
436 req.tc.tcm_ifindex = OPTS_GET(hook, ifindex, 0);
437
438 ret = config(&req);
439 if (ret < 0)
440 return ret;
441
442 return libbpf_netlink_send_recv(&req, NULL, NULL, NULL);
443}
444
445static int tc_qdisc_create_excl(struct bpf_tc_hook *hook)
446{
447 return tc_qdisc_modify(hook, RTM_NEWQDISC, NLM_F_CREATE | NLM_F_EXCL);
448}
449
450static int tc_qdisc_delete(struct bpf_tc_hook *hook)
451{
452 return tc_qdisc_modify(hook, RTM_DELQDISC, 0);
453}
454
455int bpf_tc_hook_create(struct bpf_tc_hook *hook)
456{
457 int ret;
458
459 if (!hook || !OPTS_VALID(hook, bpf_tc_hook) ||
460 OPTS_GET(hook, ifindex, 0) <= 0)
461 return libbpf_err(-EINVAL);
462
463 ret = tc_qdisc_create_excl(hook);
464 return libbpf_err(ret);
465}
466
467static int __bpf_tc_detach(const struct bpf_tc_hook *hook,
468 const struct bpf_tc_opts *opts,
469 const bool flush);
470
471int bpf_tc_hook_destroy(struct bpf_tc_hook *hook)
472{
473 if (!hook || !OPTS_VALID(hook, bpf_tc_hook) ||
474 OPTS_GET(hook, ifindex, 0) <= 0)
475 return libbpf_err(-EINVAL);
476
477 switch (OPTS_GET(hook, attach_point, 0)) {
478 case BPF_TC_INGRESS:
479 case BPF_TC_EGRESS:
480 return libbpf_err(__bpf_tc_detach(hook, NULL, true));
481 case BPF_TC_INGRESS | BPF_TC_EGRESS:
482 return libbpf_err(tc_qdisc_delete(hook));
483 case BPF_TC_CUSTOM:
484 return libbpf_err(-EOPNOTSUPP);
485 default:
486 return libbpf_err(-EINVAL);
487 }
488}
489
490struct bpf_cb_ctx {
491 struct bpf_tc_opts *opts;
492 bool processed;
493};
494
495static int __get_tc_info(void *cookie, struct tcmsg *tc, struct nlattr **tb,
496 bool unicast)
497{
498 struct nlattr *tbb[TCA_BPF_MAX + 1];
499 struct bpf_cb_ctx *info = cookie;
500
501 if (!info || !info->opts)
502 return -EINVAL;
503 if (unicast && info->processed)
504 return -EINVAL;
505 if (!tb[TCA_OPTIONS])
506 return NL_CONT;
507
508 libbpf_nla_parse_nested(tbb, TCA_BPF_MAX, tb[TCA_OPTIONS], NULL);
509 if (!tbb[TCA_BPF_ID])
510 return -EINVAL;
511
512 OPTS_SET(info->opts, prog_id, libbpf_nla_getattr_u32(tbb[TCA_BPF_ID]));
513 OPTS_SET(info->opts, handle, tc->tcm_handle);
514 OPTS_SET(info->opts, priority, TC_H_MAJ(tc->tcm_info) >> 16);
515
516 info->processed = true;
517 return unicast ? NL_NEXT : NL_DONE;
518}
519
520static int get_tc_info(struct nlmsghdr *nh, libbpf_dump_nlmsg_t fn,
521 void *cookie)
522{
523 struct tcmsg *tc = NLMSG_DATA(nh);
524 struct nlattr *tb[TCA_MAX + 1];
525
526 libbpf_nla_parse(tb, TCA_MAX,
527 (struct nlattr *)((void *)tc + NLMSG_ALIGN(sizeof(*tc))),
528 NLMSG_PAYLOAD(nh, sizeof(*tc)), NULL);
529 if (!tb[TCA_KIND])
530 return NL_CONT;
531 return __get_tc_info(cookie, tc, tb, nh->nlmsg_flags & NLM_F_ECHO);
532}
533
534static int tc_add_fd_and_name(struct libbpf_nla_req *req, int fd)
535{
536 struct bpf_prog_info info = {};
537 __u32 info_len = sizeof(info);
538 char name[256];
539 int len, ret;
540
541 ret = bpf_obj_get_info_by_fd(fd, &info, &info_len);
542 if (ret < 0)
543 return ret;
544
545 ret = nlattr_add(req, TCA_BPF_FD, &fd, sizeof(fd));
546 if (ret < 0)
547 return ret;
548 len = snprintf(name, sizeof(name), "%s:[%u]", info.name, info.id);
549 if (len < 0)
550 return -errno;
551 if (len >= sizeof(name))
552 return -ENAMETOOLONG;
553 return nlattr_add(req, TCA_BPF_NAME, name, len + 1);
554}
555
556int bpf_tc_attach(const struct bpf_tc_hook *hook, struct bpf_tc_opts *opts)
557{
558 __u32 protocol, bpf_flags, handle, priority, parent, prog_id, flags;
559 int ret, ifindex, attach_point, prog_fd;
560 struct bpf_cb_ctx info = {};
561 struct libbpf_nla_req req;
562 struct nlattr *nla;
563
564 if (!hook || !opts ||
565 !OPTS_VALID(hook, bpf_tc_hook) ||
566 !OPTS_VALID(opts, bpf_tc_opts))
567 return libbpf_err(-EINVAL);
568
569 ifindex = OPTS_GET(hook, ifindex, 0);
570 parent = OPTS_GET(hook, parent, 0);
571 attach_point = OPTS_GET(hook, attach_point, 0);
572
573 handle = OPTS_GET(opts, handle, 0);
574 priority = OPTS_GET(opts, priority, 0);
575 prog_fd = OPTS_GET(opts, prog_fd, 0);
576 prog_id = OPTS_GET(opts, prog_id, 0);
577 flags = OPTS_GET(opts, flags, 0);
578
579 if (ifindex <= 0 || !prog_fd || prog_id)
580 return libbpf_err(-EINVAL);
581 if (priority > UINT16_MAX)
582 return libbpf_err(-EINVAL);
583 if (flags & ~BPF_TC_F_REPLACE)
584 return libbpf_err(-EINVAL);
585
586 flags = (flags & BPF_TC_F_REPLACE) ? NLM_F_REPLACE : NLM_F_EXCL;
587 protocol = ETH_P_ALL;
588
589 memset(&req, 0, sizeof(req));
590 req.nh.nlmsg_len = NLMSG_LENGTH(sizeof(struct tcmsg));
591 req.nh.nlmsg_flags = NLM_F_REQUEST | NLM_F_ACK | NLM_F_CREATE |
592 NLM_F_ECHO | flags;
593 req.nh.nlmsg_type = RTM_NEWTFILTER;
594 req.tc.tcm_family = AF_UNSPEC;
595 req.tc.tcm_ifindex = ifindex;
596 req.tc.tcm_handle = handle;
597 req.tc.tcm_info = TC_H_MAKE(priority << 16, htons(protocol));
598
599 ret = tc_get_tcm_parent(attach_point, &parent);
600 if (ret < 0)
601 return libbpf_err(ret);
602 req.tc.tcm_parent = parent;
603
604 ret = nlattr_add(&req, TCA_KIND, "bpf", sizeof("bpf"));
605 if (ret < 0)
606 return libbpf_err(ret);
607 nla = nlattr_begin_nested(&req, TCA_OPTIONS);
608 if (!nla)
609 return libbpf_err(-EMSGSIZE);
610 ret = tc_add_fd_and_name(&req, prog_fd);
611 if (ret < 0)
612 return libbpf_err(ret);
613 bpf_flags = TCA_BPF_FLAG_ACT_DIRECT;
614 ret = nlattr_add(&req, TCA_BPF_FLAGS, &bpf_flags, sizeof(bpf_flags));
615 if (ret < 0)
616 return libbpf_err(ret);
617 nlattr_end_nested(&req, nla);
618
619 info.opts = opts;
620
621 ret = libbpf_netlink_send_recv(&req, get_tc_info, NULL, &info);
622 if (ret < 0)
623 return libbpf_err(ret);
624 if (!info.processed)
625 return libbpf_err(-ENOENT);
626 return ret;
627}
628
629static int __bpf_tc_detach(const struct bpf_tc_hook *hook,
630 const struct bpf_tc_opts *opts,
631 const bool flush)
632{
633 __u32 protocol = 0, handle, priority, parent, prog_id, flags;
634 int ret, ifindex, attach_point, prog_fd;
635 struct libbpf_nla_req req;
636
637 if (!hook ||
638 !OPTS_VALID(hook, bpf_tc_hook) ||
639 !OPTS_VALID(opts, bpf_tc_opts))
640 return -EINVAL;
641
642 ifindex = OPTS_GET(hook, ifindex, 0);
643 parent = OPTS_GET(hook, parent, 0);
644 attach_point = OPTS_GET(hook, attach_point, 0);
645
646 handle = OPTS_GET(opts, handle, 0);
647 priority = OPTS_GET(opts, priority, 0);
648 prog_fd = OPTS_GET(opts, prog_fd, 0);
649 prog_id = OPTS_GET(opts, prog_id, 0);
650 flags = OPTS_GET(opts, flags, 0);
651
652 if (ifindex <= 0 || flags || prog_fd || prog_id)
653 return -EINVAL;
654 if (priority > UINT16_MAX)
655 return -EINVAL;
656 if (!flush) {
657 if (!handle || !priority)
658 return -EINVAL;
659 protocol = ETH_P_ALL;
660 } else {
661 if (handle || priority)
662 return -EINVAL;
663 }
664
665 memset(&req, 0, sizeof(req));
666 req.nh.nlmsg_len = NLMSG_LENGTH(sizeof(struct tcmsg));
667 req.nh.nlmsg_flags = NLM_F_REQUEST | NLM_F_ACK;
668 req.nh.nlmsg_type = RTM_DELTFILTER;
669 req.tc.tcm_family = AF_UNSPEC;
670 req.tc.tcm_ifindex = ifindex;
671 if (!flush) {
672 req.tc.tcm_handle = handle;
673 req.tc.tcm_info = TC_H_MAKE(priority << 16, htons(protocol));
674 }
675
676 ret = tc_get_tcm_parent(attach_point, &parent);
677 if (ret < 0)
678 return ret;
679 req.tc.tcm_parent = parent;
680
681 if (!flush) {
682 ret = nlattr_add(&req, TCA_KIND, "bpf", sizeof("bpf"));
683 if (ret < 0)
684 return ret;
685 }
686
687 return libbpf_netlink_send_recv(&req, NULL, NULL, NULL);
688}
689
690int bpf_tc_detach(const struct bpf_tc_hook *hook,
691 const struct bpf_tc_opts *opts)
692{
693 int ret;
694
695 if (!opts)
696 return libbpf_err(-EINVAL);
697
698 ret = __bpf_tc_detach(hook, opts, false);
699 return libbpf_err(ret);
700}
701
702int bpf_tc_query(const struct bpf_tc_hook *hook, struct bpf_tc_opts *opts)
703{
704 __u32 protocol, handle, priority, parent, prog_id, flags;
705 int ret, ifindex, attach_point, prog_fd;
706 struct bpf_cb_ctx info = {};
707 struct libbpf_nla_req req;
708
709 if (!hook || !opts ||
710 !OPTS_VALID(hook, bpf_tc_hook) ||
711 !OPTS_VALID(opts, bpf_tc_opts))
712 return libbpf_err(-EINVAL);
713
714 ifindex = OPTS_GET(hook, ifindex, 0);
715 parent = OPTS_GET(hook, parent, 0);
716 attach_point = OPTS_GET(hook, attach_point, 0);
717
718 handle = OPTS_GET(opts, handle, 0);
719 priority = OPTS_GET(opts, priority, 0);
720 prog_fd = OPTS_GET(opts, prog_fd, 0);
721 prog_id = OPTS_GET(opts, prog_id, 0);
722 flags = OPTS_GET(opts, flags, 0);
723
724 if (ifindex <= 0 || flags || prog_fd || prog_id ||
725 !handle || !priority)
726 return libbpf_err(-EINVAL);
727 if (priority > UINT16_MAX)
728 return libbpf_err(-EINVAL);
729
730 protocol = ETH_P_ALL;
731
732 memset(&req, 0, sizeof(req));
733 req.nh.nlmsg_len = NLMSG_LENGTH(sizeof(struct tcmsg));
734 req.nh.nlmsg_flags = NLM_F_REQUEST;
735 req.nh.nlmsg_type = RTM_GETTFILTER;
736 req.tc.tcm_family = AF_UNSPEC;
737 req.tc.tcm_ifindex = ifindex;
738 req.tc.tcm_handle = handle;
739 req.tc.tcm_info = TC_H_MAKE(priority << 16, htons(protocol));
740
741 ret = tc_get_tcm_parent(attach_point, &parent);
742 if (ret < 0)
743 return libbpf_err(ret);
744 req.tc.tcm_parent = parent;
745
746 ret = nlattr_add(&req, TCA_KIND, "bpf", sizeof("bpf"));
747 if (ret < 0)
748 return libbpf_err(ret);
749
750 info.opts = opts;
751
752 ret = libbpf_netlink_send_recv(&req, get_tc_info, NULL, &info);
753 if (ret < 0)
754 return libbpf_err(ret);
755 if (!info.processed)
756 return libbpf_err(-ENOENT);
757 return ret;
758}