1 /* Copyright (c) 2017 Facebook
3 * This program is free software; you can redistribute it and/or
4 * modify it under the terms of version 2 of the GNU General Public
5 * License as published by the Free Software Foundation.
15 #include <linux/types.h>
16 typedef __u16 __sum16;
17 #include <arpa/inet.h>
18 #include <linux/if_ether.h>
19 #include <linux/if_packet.h>
21 #include <linux/ipv6.h>
22 #include <linux/tcp.h>
23 #include <linux/filter.h>
24 #include <linux/perf_event.h>
25 #include <linux/unistd.h>
27 #include <sys/ioctl.h>
29 #include <sys/types.h>
32 #include <linux/bpf.h>
33 #include <linux/err.h>
35 #include <bpf/libbpf.h>
37 #include "test_iptunnel_common.h"
39 #include "bpf_endian.h"
40 #include "bpf_rlimit.h"
41 #include "trace_helpers.h"
43 static int error_cnt, pass_cnt;
/* Consulted by test_bpf_obj_id() when it validates jited_prog_len. */
44 static bool jit_enabled;
/*
 * Length value stored, in network byte order, in iph.tot_len of the IPv4
 * test vector and in iph.payload_len of the IPv6 test vector below. The
 * l4lb/xdp_noinline stats checks multiply it by the iteration count.
 */
46 #define MAGIC_BYTES 123
48 /* ipv4 test vector */
54 .eth.h_proto = __bpf_constant_htons(ETH_P_IP),
57 .iph.tot_len = __bpf_constant_htons(MAGIC_BYTES),
61 /* ipv6 test vector */
67 .eth.h_proto = __bpf_constant_htons(ETH_P_IPV6),
69 .iph.payload_len = __bpf_constant_htons(MAGIC_BYTES),
/*
 * _CHECK() is a statement-expression macro: it normalises `condition` to
 * 0/1 in __ret and prints either "<func>:FAIL:<tag> " or
 * "<func>:PASS:<tag> <duration> nsec". Call sites use it as
 * `if (CHECK(...))` followed by a bail-out, so a true condition is the
 * failure case.
 *
 * CHECK() takes the duration from a local variable named `duration` in the
 * calling scope; CHECK_ATTR() takes it from `tattr.duration` instead.
 */
73 #define _CHECK(condition, tag, duration, format...) ({ \
74 int __ret = !!(condition); \
77 printf("%s:FAIL:%s ", __func__, tag); \
81 printf("%s:PASS:%s %d nsec\n", __func__, tag, duration);\
86 #define CHECK(condition, tag, format...) \
87 _CHECK(condition, tag, duration, format)
88 #define CHECK_ATTR(condition, tag, format...) \
89 _CHECK(condition, tag, tattr.duration, format)
/*
 * Look up the map called `name` in `obj` with
 * bpf_object__find_map_by_name() and return its descriptor via
 * bpf_map__fd(). `test` is only used as the prefix of the
 * "FAIL:map ... not found" message. Callers in this file treat a negative
 * return value as failure.
 */
91 static int bpf_find_map(const char *test, struct bpf_object *obj,
96 map = bpf_object__find_map_by_name(obj, name);
98 printf("%s:FAIL:map '%s' not found\n", test, name);
102 return bpf_map__fd(map);
/*
 * Load ./test_pkt_access.o as a BPF_PROG_TYPE_SCHED_CLS program and run it
 * with bpf_prog_test_run() over pkt_v4 and then pkt_v6, 100000 repetitions
 * each. A run passes only when the call returns 0 and the program's retval
 * is 0. No output buffer is requested (both output arguments are NULL).
 */
105 static void test_pkt_access(void)
107 const char *file = "./test_pkt_access.o";
108 struct bpf_object *obj;
109 __u32 duration, retval;
112 err = bpf_prog_load(file, BPF_PROG_TYPE_SCHED_CLS, &obj, &prog_fd);
118 err = bpf_prog_test_run(prog_fd, 100000, &pkt_v4, sizeof(pkt_v4),
119 NULL, NULL, &retval, &duration);
120 CHECK(err || retval, "ipv4",
121 "err %d errno %d retval %d duration %d\n",
122 err, errno, retval, duration);
124 err = bpf_prog_test_run(prog_fd, 100000, &pkt_v6, sizeof(pkt_v6),
125 NULL, NULL, &retval, &duration);
126 CHECK(err || retval, "ipv6",
127 "err %d errno %d retval %d duration %d\n",
128 err, errno, retval, duration);
129 bpf_object__close(obj);
/*
 * Exercise bpf_prog_test_run_xattr() output-size handling using
 * ./test_pkt_access.o loaded as SCHED_CLS and pkt_v4 as input.
 * Three runs are made, each checked with CHECK_ATTR (which reports
 * tattr.duration).
 *
 * NOTE(review): the "data_size_out" message prints a sizeof value with
 * %lu; %zu is the matching conversion for size_t.
 */
132 static void test_prog_run_xattr(void)
134 const char *file = "./test_pkt_access.o";
135 struct bpf_object *obj;
138 struct bpf_prog_test_run_attr tattr = {
141 .data_size_in = sizeof(pkt_v4),
146 err = bpf_prog_load(file, BPF_PROG_TYPE_SCHED_CLS, &obj,
148 if (CHECK_ATTR(err, "load", "err %d errno %d\n", err, errno))
151 memset(buf, 0, sizeof(buf));
/*
 * Run 1: expected to fail with -1/ENOSPC and retval 0, while
 * data_size_out still reports the full sizeof(pkt_v4).
 */
153 err = bpf_prog_test_run_xattr(&tattr);
154 CHECK_ATTR(err != -1 || errno != ENOSPC || tattr.retval, "run",
155 "err %d errno %d retval %d\n", err, errno, tattr.retval);
157 CHECK_ATTR(tattr.data_size_out != sizeof(pkt_v4), "data_size_out",
158 "incorrect output size, want %lu have %u\n",
159 sizeof(pkt_v4), tattr.data_size_out);
/*
 * buf was zero-filled above, so a non-zero byte at index 5 is reported
 * as the size hint having been ignored.
 */
161 CHECK_ATTR(buf[5] != 0, "overflow",
162 "BPF_PROG_TEST_RUN ignored size hint\n");
/* Run 2: no output buffer at all; must succeed with errno and retval 0. */
164 tattr.data_out = NULL;
165 tattr.data_size_out = 0;
168 err = bpf_prog_test_run_xattr(&tattr);
169 CHECK_ATTR(err || errno || tattr.retval, "run_no_output",
170 "err %d errno %d retval %d\n", err, errno, tattr.retval);
/* Run 3: non-zero data_size_out with a NULL data_out must give -EINVAL. */
172 tattr.data_size_out = 1;
173 err = bpf_prog_test_run_xattr(&tattr);
174 CHECK_ATTR(err != -EINVAL, "run_wrong_size_out", "err %d\n", err);
176 bpf_object__close(obj);
/*
 * Load ./test_xdp.o as BPF_PROG_TYPE_XDP, insert one AF_INET and one
 * AF_INET6 entry (protocol 6) into its "vip2tnl" map, then run the program
 * once on pkt_v4 and once on pkt_v6.
 *
 * Expected results: XDP_TX in both cases; output size 74 with
 * iph->protocol == IPPROTO_IPIP for IPv4, and output size 114 with
 * iph6->nexthdr == IPPROTO_IPV6 for IPv6. iph and iph6 both point into the
 * output buffer immediately after the Ethernet header.
 *
 * The return values of the two bpf_map_update_elem() calls are not checked.
 */
179 static void test_xdp(void)
181 struct vip key4 = {.protocol = 6, .family = AF_INET};
182 struct vip key6 = {.protocol = 6, .family = AF_INET6};
183 struct iptnl_info value4 = {.family = AF_INET};
184 struct iptnl_info value6 = {.family = AF_INET6};
185 const char *file = "./test_xdp.o";
186 struct bpf_object *obj;
188 struct ipv6hdr *iph6 = (void *)buf + sizeof(struct ethhdr);
189 struct iphdr *iph = (void *)buf + sizeof(struct ethhdr);
190 __u32 duration, retval, size;
191 int err, prog_fd, map_fd;
193 err = bpf_prog_load(file, BPF_PROG_TYPE_XDP, &obj, &prog_fd);
199 map_fd = bpf_find_map(__func__, obj, "vip2tnl");
202 bpf_map_update_elem(map_fd, &key4, &value4, 0);
203 bpf_map_update_elem(map_fd, &key6, &value6, 0);
205 err = bpf_prog_test_run(prog_fd, 1, &pkt_v4, sizeof(pkt_v4),
206 buf, &size, &retval, &duration);
208 CHECK(err || retval != XDP_TX || size != 74 ||
209 iph->protocol != IPPROTO_IPIP, "ipv4",
210 "err %d errno %d retval %d size %d\n",
211 err, errno, retval, size);
213 err = bpf_prog_test_run(prog_fd, 1, &pkt_v6, sizeof(pkt_v6),
214 buf, &size, &retval, &duration);
215 CHECK(err || retval != XDP_TX || size != 114 ||
216 iph6->nexthdr != IPPROTO_IPV6, "ipv6",
217 "err %d errno %d retval %d size %d\n",
218 err, errno, retval, size);
220 bpf_object__close(obj);
/*
 * Load ./test_adjust_tail.o as BPF_PROG_TYPE_XDP and run it once per test
 * packet. The IPv4 packet must yield XDP_DROP (the output size is printed
 * but not checked); the IPv6 packet must yield XDP_TX with an output size
 * of 54 bytes.
 */
223 static void test_xdp_adjust_tail(void)
225 const char *file = "./test_adjust_tail.o";
226 struct bpf_object *obj;
228 __u32 duration, retval, size;
231 err = bpf_prog_load(file, BPF_PROG_TYPE_XDP, &obj, &prog_fd);
237 err = bpf_prog_test_run(prog_fd, 1, &pkt_v4, sizeof(pkt_v4),
238 buf, &size, &retval, &duration);
240 CHECK(err || retval != XDP_DROP,
241 "ipv4", "err %d errno %d retval %d size %d\n",
242 err, errno, retval, size);
244 err = bpf_prog_test_run(prog_fd, 1, &pkt_v6, sizeof(pkt_v6),
245 buf, &size, &retval, &duration);
246 CHECK(err || retval != XDP_TX || size != 54,
247 "ipv6", "err %d errno %d retval %d size %d\n",
248 err, errno, retval, size);
249 bpf_object__close(obj);
/*
 * MAGIC_VAL is written as real_def.dst into the "reals" map and later
 * expected as the first 32-bit word of the program's output buffer.
 */
254 #define MAGIC_VAL 0x1234
/*
 * Repeat count passed to bpf_prog_test_run() by the l4lb and xdp_noinline
 * tests; also a factor in their expected byte and packet totals.
 */
255 #define NUM_ITER 100000
/*
 * Load `file` as BPF_PROG_TYPE_SCHED_CLS, seed its "vip_map", "ch_rings"
 * and "reals" maps, then run the program NUM_ITER times on pkt_v4 and on
 * pkt_v6.
 *
 * Each run must return 7 (TC_ACT_REDIRECT per the inline comment), produce
 * 54 bytes (IPv4) or 74 bytes (IPv6) of output, and leave MAGIC_VAL in the
 * first 32-bit word of the output buffer.
 *
 * Afterwards the "stats" entry at key VIP_NUM is read and its elements, one
 * per possible CPU, are summed: bytes must equal MAGIC_BYTES * NUM_ITER * 2
 * and pkts must equal NUM_ITER * 2 (two runs of NUM_ITER packets).
 *
 * The map update/lookup return values are not checked in the lines shown.
 */
258 static void test_l4lb(const char *file)
260 unsigned int nr_cpus = bpf_num_possible_cpus();
261 struct vip key = {.protocol = 6};
265 } value = {.vip_num = VIP_NUM};
266 __u32 stats_key = VIP_NUM;
271 struct real_definition {
277 } real_def = {.dst = MAGIC_VAL};
278 __u32 ch_key = 11, real_num = 3;
279 __u32 duration, retval, size;
280 int err, i, prog_fd, map_fd;
281 __u64 bytes = 0, pkts = 0;
282 struct bpf_object *obj;
284 u32 *magic = (u32 *)buf;
286 err = bpf_prog_load(file, BPF_PROG_TYPE_SCHED_CLS, &obj, &prog_fd);
292 map_fd = bpf_find_map(__func__, obj, "vip_map");
295 bpf_map_update_elem(map_fd, &key, &value, 0);
297 map_fd = bpf_find_map(__func__, obj, "ch_rings");
300 bpf_map_update_elem(map_fd, &ch_key, &real_num, 0);
302 map_fd = bpf_find_map(__func__, obj, "reals");
305 bpf_map_update_elem(map_fd, &real_num, &real_def, 0);
307 err = bpf_prog_test_run(prog_fd, NUM_ITER, &pkt_v4, sizeof(pkt_v4),
308 buf, &size, &retval, &duration);
309 CHECK(err || retval != 7/*TC_ACT_REDIRECT*/ || size != 54 ||
310 *magic != MAGIC_VAL, "ipv4",
311 "err %d errno %d retval %d size %d magic %x\n",
312 err, errno, retval, size, *magic);
314 err = bpf_prog_test_run(prog_fd, NUM_ITER, &pkt_v6, sizeof(pkt_v6),
315 buf, &size, &retval, &duration);
316 CHECK(err || retval != 7/*TC_ACT_REDIRECT*/ || size != 74 ||
317 *magic != MAGIC_VAL, "ipv6",
318 "err %d errno %d retval %d size %d magic %x\n",
319 err, errno, retval, size, *magic);
321 map_fd = bpf_find_map(__func__, obj, "stats");
324 bpf_map_lookup_elem(map_fd, &stats_key, stats);
/* Sum the per-CPU slots into totals for the final comparison. */
325 for (i = 0; i < nr_cpus; i++) {
326 bytes += stats[i].bytes;
327 pkts += stats[i].pkts;
329 if (bytes != MAGIC_BYTES * NUM_ITER * 2 || pkts != NUM_ITER * 2) {
331 printf("test_l4lb:FAIL:stats %lld %lld\n", bytes, pkts);
334 bpf_object__close(obj);
/*
 * Names the two l4lb object files: the regular build and the "noinline"
 * build. Presumably each is handed to test_l4lb(); the calls themselves
 * are not among the lines shown - TODO confirm.
 */
337 static void test_l4lb_all(void)
339 const char *file1 = "./test_l4lb.o";
340 const char *file2 = "./test_l4lb_noinline.o";
/*
 * XDP counterpart of test_l4lb(): load ./test_xdp_noinline.o as
 * BPF_PROG_TYPE_XDP, seed "vip_map", "ch_rings" and "reals", run the
 * program NUM_ITER times on pkt_v4 and pkt_v6, and then verify the summed
 * "stats" counters at key VIP_NUM.
 *
 * Each run must return 1, produce 54 bytes (IPv4) or 74 bytes (IPv6) of
 * output, and leave MAGIC_VAL in the first 32-bit word of the buffer.
 *
 * NOTE(review): the expected retval is the bare literal 1, which is
 * XDP_DROP in the uapi enum xdp_action - confirm that is the intended
 * verdict and consider spelling it symbolically.
 */
346 static void test_xdp_noinline(void)
348 const char *file = "./test_xdp_noinline.o";
349 unsigned int nr_cpus = bpf_num_possible_cpus();
350 struct vip key = {.protocol = 6};
354 } value = {.vip_num = VIP_NUM};
355 __u32 stats_key = VIP_NUM;
360 struct real_definition {
366 } real_def = {.dst = MAGIC_VAL};
367 __u32 ch_key = 11, real_num = 3;
368 __u32 duration, retval, size;
369 int err, i, prog_fd, map_fd;
370 __u64 bytes = 0, pkts = 0;
371 struct bpf_object *obj;
373 u32 *magic = (u32 *)buf;
375 err = bpf_prog_load(file, BPF_PROG_TYPE_XDP, &obj, &prog_fd);
381 map_fd = bpf_find_map(__func__, obj, "vip_map");
384 bpf_map_update_elem(map_fd, &key, &value, 0);
386 map_fd = bpf_find_map(__func__, obj, "ch_rings");
389 bpf_map_update_elem(map_fd, &ch_key, &real_num, 0);
391 map_fd = bpf_find_map(__func__, obj, "reals");
394 bpf_map_update_elem(map_fd, &real_num, &real_def, 0);
396 err = bpf_prog_test_run(prog_fd, NUM_ITER, &pkt_v4, sizeof(pkt_v4),
397 buf, &size, &retval, &duration);
398 CHECK(err || retval != 1 || size != 54 ||
399 *magic != MAGIC_VAL, "ipv4",
400 "err %d errno %d retval %d size %d magic %x\n",
401 err, errno, retval, size, *magic);
403 err = bpf_prog_test_run(prog_fd, NUM_ITER, &pkt_v6, sizeof(pkt_v6),
404 buf, &size, &retval, &duration);
405 CHECK(err || retval != 1 || size != 74 ||
406 *magic != MAGIC_VAL, "ipv6",
407 "err %d errno %d retval %d size %d magic %x\n",
408 err, errno, retval, size, *magic);
410 map_fd = bpf_find_map(__func__, obj, "stats");
413 bpf_map_lookup_elem(map_fd, &stats_key, stats);
/* Sum the per-CPU slots into totals for the final comparison. */
414 for (i = 0; i < nr_cpus; i++) {
415 bytes += stats[i].bytes;
416 pkts += stats[i].pkts;
418 if (bytes != MAGIC_BYTES * NUM_ITER * 2 || pkts != NUM_ITER * 2) {
420 printf("test_xdp_noinline:FAIL:stats %lld %lld\n", bytes, pkts);
423 bpf_object__close(obj);
/*
 * Load-only test: ./test_tcp_estats.o must load as a
 * BPF_PROG_TYPE_TRACEPOINT program. The program is never run here; the
 * CHECK uses an empty tag, so the PASS/FAIL line carries only the function
 * name.
 */
426 static void test_tcp_estats(void)
428 const char *file = "./test_tcp_estats.o";
430 struct bpf_object *obj;
433 err = bpf_prog_load(file, BPF_PROG_TYPE_TRACEPOINT, &obj, &prog_fd);
434 CHECK(err, "", "err %d errno %d\n", err, errno);
440 bpf_object__close(obj);
/*
 * Convert a pointer to the __u64 representation used for pointer-valued
 * fields of the bpf attr/info structures. The intermediate cast to
 * unsigned long avoids a direct pointer-to-wider-integer conversion.
 */
443 static inline __u64 ptr_to_u64(const void *ptr)
445 return (__u64) (unsigned long) ptr;
/*
 * Report whether the BPF JIT is enabled by reading the first character of
 * /proc/sys/net/core/bpf_jit_enable: any character other than '0' counts
 * as enabled. `enabled` stays false when the file cannot be opened or the
 * one-byte read does not succeed.
 *
 * NOTE(review): open() takes (path, flags, mode). Here 0 sits in the flags
 * position and O_RDONLY in the mode position, so the two look swapped. It
 * happens to work because O_RDONLY is 0, but `open(jit_sysctl, O_RDONLY)`
 * states the intent.
 */
448 static bool is_jit_enabled(void)
450 const char *jit_sysctl = "/proc/sys/net/core/bpf_jit_enable";
451 bool enabled = false;
454 sysctl_fd = open(jit_sysctl, 0, O_RDONLY);
455 if (sysctl_fd != -1) {
458 if (read(sysctl_fd, &tmpc, sizeof(tmpc)) == 1)
459 enabled = (tmpc != '0');
/*
 * Exercise the BPF object-id APIs against nr_iters (2) copies of
 * ./test_obj_id.o loaded as BPF_PROG_TYPE_SOCKET_FILTER.
 *
 * Stages, in order:
 *  1. bpf_prog_get_fd_by_id(0) and bpf_map_get_fd_by_id(0) must fail with
 *     ENOENT.
 *  2. For each copy: store array_magic_value at key 0 of "test_map_id",
 *     then validate bpf_obj_get_info_by_fd() for the map and the program
 *     (type, sizes, name, load time, uid, map ids, returned info_len).
 *  3. Walk all program ids with bpf_prog_get_next_id(), match them to the
 *     programs loaded here and compare the freshly queried info with the
 *     info saved in stage 2.
 *  4. Do the same for maps with bpf_map_get_next_id(), also reading back
 *     the magic value.
 * Stages 3 and 4 each expect nr_id_found to end up equal to nr_iters.
 *
 * The info arrays are declared with nr_iters + 1 elements because info_len
 * is deliberately set to twice the struct size before each query.
 */
466 static void test_bpf_obj_id(void)
468 const __u64 array_magic_value = 0xfaceb00c;
469 const __u32 array_key = 0;
470 const int nr_iters = 2;
471 const char *file = "./test_obj_id.o";
472 const char *expected_prog_name = "test_obj_id";
473 const char *expected_map_name = "test_map_id";
474 const __u64 nsec_per_sec = 1000000000;
476 struct bpf_object *objs[nr_iters];
477 int prog_fds[nr_iters], map_fds[nr_iters];
478 /* +1 to test for the info_len returned by kernel */
479 struct bpf_prog_info prog_infos[nr_iters + 1];
480 struct bpf_map_info map_infos[nr_iters + 1];
481 /* Each prog only uses one map. +1 to test nr_map_ids
482 * returned by kernel.
484 __u32 map_ids[nr_iters + 1];
485 char jited_insns[128], xlated_insns[128], zeros[128];
486 __u32 i, next_id, info_len, nr_id_found, duration = 0;
487 struct timespec real_time_ts, boot_time_ts;
490 uid_t my_uid = getuid();
491 time_t now, load_time;
493 err = bpf_prog_get_fd_by_id(0);
494 CHECK(err >= 0 || errno != ENOENT,
495 "get-fd-by-notexist-prog-id", "err %d errno %d\n", err, errno);
497 err = bpf_map_get_fd_by_id(0);
498 CHECK(err >= 0 || errno != ENOENT,
499 "get-fd-by-notexist-map-id", "err %d errno %d\n", err, errno);
501 for (i = 0; i < nr_iters; i++)
504 /* Check bpf_obj_get_info_by_fd() */
505 bzero(zeros, sizeof(zeros));
506 for (i = 0; i < nr_iters; i++) {
508 err = bpf_prog_load(file, BPF_PROG_TYPE_SOCKET_FILTER,
509 &objs[i], &prog_fds[i]);
510 /* test_obj_id.o is a dumb prog. It should never fail
517 /* Insert a magic value to the map */
518 map_fds[i] = bpf_find_map(__func__, objs[i], "test_map_id");
519 assert(map_fds[i] >= 0);
520 err = bpf_map_update_elem(map_fds[i], &array_key,
521 &array_magic_value, 0);
524 /* Check getting map info */
/*
 * Offer twice the struct size; the check below requires the kernel to
 * report exactly sizeof(struct bpf_map_info) back in info_len.
 */
525 info_len = sizeof(struct bpf_map_info) * 2;
526 bzero(&map_infos[i], info_len);
527 err = bpf_obj_get_info_by_fd(map_fds[i], &map_infos[i],
530 map_infos[i].type != BPF_MAP_TYPE_ARRAY ||
531 map_infos[i].key_size != sizeof(__u32) ||
532 map_infos[i].value_size != sizeof(__u64) ||
533 map_infos[i].max_entries != 1 ||
534 map_infos[i].map_flags != 0 ||
535 info_len != sizeof(struct bpf_map_info) ||
536 strcmp((char *)map_infos[i].name, expected_map_name),
538 "err %d errno %d type %d(%d) info_len %u(%Zu) key_size %u value_size %u max_entries %u map_flags %X name %s(%s)\n",
540 map_infos[i].type, BPF_MAP_TYPE_ARRAY,
541 info_len, sizeof(struct bpf_map_info),
542 map_infos[i].key_size,
543 map_infos[i].value_size,
544 map_infos[i].max_entries,
545 map_infos[i].map_flags,
546 map_infos[i].name, expected_map_name))
549 /* Check getting prog info */
550 info_len = sizeof(struct bpf_prog_info) * 2;
551 bzero(&prog_infos[i], info_len);
552 bzero(jited_insns, sizeof(jited_insns));
553 bzero(xlated_insns, sizeof(xlated_insns));
554 prog_infos[i].jited_prog_insns = ptr_to_u64(jited_insns);
555 prog_infos[i].jited_prog_len = sizeof(jited_insns);
556 prog_infos[i].xlated_prog_insns = ptr_to_u64(xlated_insns);
557 prog_infos[i].xlated_prog_len = sizeof(xlated_insns);
558 prog_infos[i].map_ids = ptr_to_u64(map_ids + i);
/* Ask for room for 2 ids; exactly 1 is expected back (checked below). */
559 prog_infos[i].nr_map_ids = 2;
560 err = clock_gettime(CLOCK_REALTIME, &real_time_ts);
562 err = clock_gettime(CLOCK_BOOTTIME, &boot_time_ts);
564 err = bpf_obj_get_info_by_fd(prog_fds[i], &prog_infos[i],
/*
 * prog_infos[i].load_time is in nanoseconds; adding the whole-second
 * offset between CLOCK_REALTIME and CLOCK_BOOTTIME turns it into
 * wall-clock seconds, which must lie within 60 s of `now`.
 */
566 load_time = (real_time_ts.tv_sec - boot_time_ts.tv_sec)
567 + (prog_infos[i].load_time / nsec_per_sec);
569 prog_infos[i].type != BPF_PROG_TYPE_SOCKET_FILTER ||
570 info_len != sizeof(struct bpf_prog_info) ||
571 (jit_enabled && !prog_infos[i].jited_prog_len) ||
573 !memcmp(jited_insns, zeros, sizeof(zeros))) ||
574 !prog_infos[i].xlated_prog_len ||
575 !memcmp(xlated_insns, zeros, sizeof(zeros)) ||
576 load_time < now - 60 || load_time > now + 60 ||
577 prog_infos[i].created_by_uid != my_uid ||
578 prog_infos[i].nr_map_ids != 1 ||
579 *(int *)(long)prog_infos[i].map_ids != map_infos[i].id ||
580 strcmp((char *)prog_infos[i].name, expected_prog_name),
582 "err %d errno %d i %d type %d(%d) info_len %u(%Zu) jit_enabled %d jited_prog_len %u xlated_prog_len %u jited_prog %d xlated_prog %d load_time %lu(%lu) uid %u(%u) nr_map_ids %u(%u) map_id %u(%u) name %s(%s)\n",
584 prog_infos[i].type, BPF_PROG_TYPE_SOCKET_FILTER,
585 info_len, sizeof(struct bpf_prog_info),
587 prog_infos[i].jited_prog_len,
588 prog_infos[i].xlated_prog_len,
589 !!memcmp(jited_insns, zeros, sizeof(zeros)),
590 !!memcmp(xlated_insns, zeros, sizeof(zeros)),
592 prog_infos[i].created_by_uid, my_uid,
593 prog_infos[i].nr_map_ids, 1,
594 *(int *)(long)prog_infos[i].map_ids, map_infos[i].id,
595 prog_infos[i].name, expected_prog_name))
599 /* Check bpf_prog_get_next_id() */
602 while (!bpf_prog_get_next_id(next_id, &next_id)) {
603 struct bpf_prog_info prog_info = {};
607 info_len = sizeof(prog_info);
609 prog_fd = bpf_prog_get_fd_by_id(next_id);
610 if (prog_fd < 0 && errno == ENOENT)
611 /* The bpf_prog is in the dead row */
613 if (CHECK(prog_fd < 0, "get-prog-fd(next_id)",
614 "prog_fd %d next_id %d errno %d\n",
615 prog_fd, next_id, errno))
618 for (i = 0; i < nr_iters; i++)
619 if (prog_infos[i].id == next_id)
628 * prog_info.nr_map_ids = 1
629 * prog_info.map_ids = NULL
631 prog_info.nr_map_ids = 1;
632 err = bpf_obj_get_info_by_fd(prog_fd, &prog_info, &info_len);
633 if (CHECK(!err || errno != EFAULT,
634 "get-prog-fd-bad-nr-map-ids", "err %d errno %d(%d)",
637 bzero(&prog_info, sizeof(prog_info));
638 info_len = sizeof(prog_info);
640 saved_map_id = *(int *)((long)prog_infos[i].map_ids);
641 prog_info.map_ids = prog_infos[i].map_ids;
642 prog_info.nr_map_ids = 2;
643 err = bpf_obj_get_info_by_fd(prog_fd, &prog_info, &info_len);
/*
 * This query supplied no instruction buffers, so clear the pointers saved
 * in stage 2 before the whole-struct memcmp below.
 */
644 prog_infos[i].jited_prog_insns = 0;
645 prog_infos[i].xlated_prog_insns = 0;
646 CHECK(err || info_len != sizeof(struct bpf_prog_info) ||
647 memcmp(&prog_info, &prog_infos[i], info_len) ||
648 *(int *)(long)prog_info.map_ids != saved_map_id,
649 "get-prog-info(next_id->fd)",
650 "err %d errno %d info_len %u(%Zu) memcmp %d map_id %u(%u)\n",
651 err, errno, info_len, sizeof(struct bpf_prog_info),
652 memcmp(&prog_info, &prog_infos[i], info_len),
653 *(int *)(long)prog_info.map_ids, saved_map_id);
656 CHECK(nr_id_found != nr_iters,
657 "check total prog id found by get_next_id",
658 "nr_id_found %u(%u)\n",
659 nr_id_found, nr_iters);
661 /* Check bpf_map_get_next_id() */
664 while (!bpf_map_get_next_id(next_id, &next_id)) {
665 struct bpf_map_info map_info = {};
668 info_len = sizeof(map_info);
670 map_fd = bpf_map_get_fd_by_id(next_id);
671 if (map_fd < 0 && errno == ENOENT)
672 /* The bpf_map is in the dead row */
674 if (CHECK(map_fd < 0, "get-map-fd(next_id)",
675 "map_fd %d next_id %u errno %d\n",
676 map_fd, next_id, errno))
679 for (i = 0; i < nr_iters; i++)
680 if (map_infos[i].id == next_id)
688 err = bpf_map_lookup_elem(map_fd, &array_key, &array_value);
691 err = bpf_obj_get_info_by_fd(map_fd, &map_info, &info_len);
692 CHECK(err || info_len != sizeof(struct bpf_map_info) ||
693 memcmp(&map_info, &map_infos[i], info_len) ||
694 array_value != array_magic_value,
695 "check get-map-info(next_id->fd)",
696 "err %d errno %d info_len %u(%Zu) memcmp %d array_value %llu(%llu)\n",
697 err, errno, info_len, sizeof(struct bpf_map_info),
698 memcmp(&map_info, &map_infos[i], info_len),
699 array_value, array_magic_value);
703 CHECK(nr_id_found != nr_iters,
704 "check total map id found by get_next_id",
705 "nr_id_found %u(%u)\n",
706 nr_id_found, nr_iters);
709 for (i = 0; i < nr_iters; i++)
710 bpf_object__close(objs[i]);
/*
 * Load ./test_pkt_md_access.o as BPF_PROG_TYPE_SCHED_CLS and run it 10
 * times on pkt_v4 with no output buffer. The run passes when the call
 * returns 0 and the program's retval is 0. The CHECK tag is empty.
 */
713 static void test_pkt_md_access(void)
715 const char *file = "./test_pkt_md_access.o";
716 struct bpf_object *obj;
717 __u32 duration, retval;
720 err = bpf_prog_load(file, BPF_PROG_TYPE_SCHED_CLS, &obj, &prog_fd);
726 err = bpf_prog_test_run(prog_fd, 10, &pkt_v4, sizeof(pkt_v4),
727 NULL, NULL, &retval, &duration);
728 CHECK(err || retval, "",
729 "err %d errno %d retval %d duration %d\n",
730 err, errno, retval, duration);
732 bpf_object__close(obj);
/*
 * Validate kernel-side checking of object names. For every entry of
 * tests[] (name, success flag, expected errno) the name is copied into
 * attr.prog_name for a raw BPF_PROG_LOAD syscall and into attr.map_name
 * for a raw BPF_MAP_CREATE syscall.
 *
 * An entry marked successful must yield fd >= 0; any other entry must
 * yield exactly -1 with errno equal to expected_errno.
 *
 * Cases shown: a 15-character name is accepted, while a 16-character name
 * and a name containing '\n' are rejected with EINVAL.
 */
735 static void test_obj_name(void)
743 { "_123456789ABCDE", 1, 0 },
744 { "_123456789ABCDEF", 0, EINVAL },
745 { "_123456789ABCD\n", 0, EINVAL },
747 struct bpf_insn prog[] = {
748 BPF_ALU64_IMM(BPF_MOV, BPF_REG_0, 0),
754 for (i = 0; i < sizeof(tests) / sizeof(tests[0]); i++) {
/* Length including the terminating NUL. */
755 size_t name_len = strlen(tests[i].name) + 1;
760 /* test different attr.prog_name during BPF_PROG_LOAD */
/*
 * Copy at most sizeof(attr.prog_name) bytes, so an over-long name fills
 * the field without a terminating NUL.
 */
761 ncopy = name_len < sizeof(attr.prog_name) ?
762 name_len : sizeof(attr.prog_name);
763 bzero(&attr, sizeof(attr));
764 attr.prog_type = BPF_PROG_TYPE_SCHED_CLS;
766 attr.insns = ptr_to_u64(prog);
767 attr.license = ptr_to_u64("");
768 memcpy(attr.prog_name, tests[i].name, ncopy);
770 fd = syscall(__NR_bpf, BPF_PROG_LOAD, &attr, sizeof(attr));
771 CHECK((tests[i].success && fd < 0) ||
772 (!tests[i].success && fd != -1) ||
773 (!tests[i].success && errno != tests[i].expected_errno),
774 "check-bpf-prog-name",
775 "fd %d(%d) errno %d(%d)\n",
776 fd, tests[i].success, errno, tests[i].expected_errno);
781 /* test different attr.map_name during BPF_MAP_CREATE */
782 ncopy = name_len < sizeof(attr.map_name) ?
783 name_len : sizeof(attr.map_name);
784 bzero(&attr, sizeof(attr));
785 attr.map_type = BPF_MAP_TYPE_ARRAY;
788 attr.max_entries = 1;
790 memcpy(attr.map_name, tests[i].name, ncopy);
791 fd = syscall(__NR_bpf, BPF_MAP_CREATE, &attr, sizeof(attr));
792 CHECK((tests[i].success && fd < 0) ||
793 (!tests[i].success && fd != -1) ||
794 (!tests[i].success && errno != tests[i].expected_errno),
795 "check-bpf-map-name",
796 "fd %d(%d) errno %d(%d)\n",
797 fd, tests[i].success, errno, tests[i].expected_errno);
/*
 * Attach several copies of ./test_tracepoint.o to the sched/sched_switch
 * tracepoint and verify PERF_EVENT_IOC_QUERY_BPF.
 *
 * The tracepoint id is read from debugfs and used as attr.config. For each
 * of the num_progs (3) iterations the program is loaded, its id is saved
 * from bpf_obj_get_info_by_fd(), and a perf event is opened on CPU 0,
 * enabled, and given the program with PERF_EVENT_IOC_SET_BPF.
 *
 * Query checks present in the body:
 *  - zero programs reported before anything is attached;
 *  - a count-only query reporting prog_cnt == 2;
 *  - EFAULT for an invalid query pointer;
 *  - ENOSPC (prog_cnt still 2) when the id array is too small;
 *  - after attaching, prog_cnt == i + 1 and query->ids[] equal to
 *    saved_prog_ids[] in the same order.
 *
 * The final loop walks i back down to 0, disabling each perf event and
 * closing each object.
 */
804 static void test_tp_attach_query(void)
806 const int num_progs = 3;
807 int i, j, bytes, efd, err, prog_fd[num_progs], pmu_fd[num_progs];
808 __u32 duration = 0, info_len, saved_prog_ids[num_progs];
809 const char *file = "./test_tracepoint.o";
810 struct perf_event_query_bpf *query;
811 struct perf_event_attr attr = {};
812 struct bpf_object *obj[num_progs];
813 struct bpf_prog_info prog_info;
816 snprintf(buf, sizeof(buf),
817 "/sys/kernel/debug/tracing/events/sched/sched_switch/id");
818 efd = open(buf, O_RDONLY, 0);
819 if (CHECK(efd < 0, "open", "err %d errno %d\n", efd, errno))
821 bytes = read(efd, buf, sizeof(buf));
823 if (CHECK(bytes <= 0 || bytes >= sizeof(buf),
824 "read", "bytes %d errno %d\n", bytes, errno))
827 attr.config = strtol(buf, NULL, 0);
828 attr.type = PERF_TYPE_TRACEPOINT;
829 attr.sample_type = PERF_SAMPLE_RAW | PERF_SAMPLE_CALLCHAIN;
830 attr.sample_period = 1;
831 attr.wakeup_events = 1;
/*
 * Header plus room for num_progs ids.
 * NOTE(review): the loop starts on the very next source line, so the
 * malloc() result is dereferenced (query->ids_len) without a NULL check.
 */
833 query = malloc(sizeof(*query) + sizeof(__u32) * num_progs);
834 for (i = 0; i < num_progs; i++) {
835 err = bpf_prog_load(file, BPF_PROG_TYPE_TRACEPOINT, &obj[i],
837 if (CHECK(err, "prog_load", "err %d errno %d\n", err, errno))
840 bzero(&prog_info, sizeof(prog_info));
841 prog_info.jited_prog_len = 0;
842 prog_info.xlated_prog_len = 0;
843 prog_info.nr_map_ids = 0;
844 info_len = sizeof(prog_info);
845 err = bpf_obj_get_info_by_fd(prog_fd[i], &prog_info, &info_len);
846 if (CHECK(err, "bpf_obj_get_info_by_fd", "err %d errno %d\n",
849 saved_prog_ids[i] = prog_info.id;
851 pmu_fd[i] = syscall(__NR_perf_event_open, &attr, -1 /* pid */,
852 0 /* cpu 0 */, -1 /* group id */,
854 if (CHECK(pmu_fd[i] < 0, "perf_event_open", "err %d errno %d\n",
857 err = ioctl(pmu_fd[i], PERF_EVENT_IOC_ENABLE, 0);
858 if (CHECK(err, "perf_event_ioc_enable", "err %d errno %d\n",
863 /* check NULL prog array query */
864 query->ids_len = num_progs;
865 err = ioctl(pmu_fd[i], PERF_EVENT_IOC_QUERY_BPF, query);
866 if (CHECK(err || query->prog_cnt != 0,
867 "perf_event_ioc_query_bpf",
868 "err %d errno %d query->prog_cnt %u\n",
869 err, errno, query->prog_cnt))
873 err = ioctl(pmu_fd[i], PERF_EVENT_IOC_SET_BPF, prog_fd[i]);
874 if (CHECK(err, "perf_event_ioc_set_bpf", "err %d errno %d\n",
879 /* try to get # of programs only */
881 err = ioctl(pmu_fd[i], PERF_EVENT_IOC_QUERY_BPF, query);
882 if (CHECK(err || query->prog_cnt != 2,
883 "perf_event_ioc_query_bpf",
884 "err %d errno %d query->prog_cnt %u\n",
885 err, errno, query->prog_cnt))
888 /* try a few negative tests */
889 /* invalid query pointer */
890 err = ioctl(pmu_fd[i], PERF_EVENT_IOC_QUERY_BPF,
891 (struct perf_event_query_bpf *)0x1);
892 if (CHECK(!err || errno != EFAULT,
893 "perf_event_ioc_query_bpf",
894 "err %d errno %d\n", err, errno))
897 /* not enough space */
899 err = ioctl(pmu_fd[i], PERF_EVENT_IOC_QUERY_BPF, query);
900 if (CHECK(!err || errno != ENOSPC || query->prog_cnt != 2,
901 "perf_event_ioc_query_bpf",
902 "err %d errno %d query->prog_cnt %u\n",
903 err, errno, query->prog_cnt))
/* Full query: every program attached so far, in attach order. */
907 query->ids_len = num_progs;
908 err = ioctl(pmu_fd[i], PERF_EVENT_IOC_QUERY_BPF, query);
909 if (CHECK(err || query->prog_cnt != (i + 1),
910 "perf_event_ioc_query_bpf",
911 "err %d errno %d query->prog_cnt %u\n",
912 err, errno, query->prog_cnt))
914 for (j = 0; j < i + 1; j++)
915 if (CHECK(saved_prog_ids[j] != query->ids[j],
916 "perf_event_ioc_query_bpf",
917 "#%d saved_prog_id %x query prog_id %x\n",
918 j, saved_prog_ids[j], query->ids[j]))
/* Tear down in reverse order, starting from the current value of i. */
923 for (; i >= 0; i--) {
925 ioctl(pmu_fd[i], PERF_EVENT_IOC_DISABLE);
929 bpf_object__close(obj[i]);
/*
 * Walk the keys of map1_fd with bpf_map_get_next_key() (starting from a
 * NULL previous key) and look each one up in map2_fd. val_buf is only
 * scratch space for the lookups and is sized for PERF_MAX_STACK_DEPTH
 * struct bpf_stack_build_id entries. Callers treat a non-zero return as a
 * mismatch.
 */
934 static int compare_map_keys(int map1_fd, int map2_fd)
937 char val_buf[PERF_MAX_STACK_DEPTH *
938 sizeof(struct bpf_stack_build_id)];
941 err = bpf_map_get_next_key(map1_fd, NULL, &key);
944 err = bpf_map_lookup_elem(map2_fd, &key, val_buf);
948 while (bpf_map_get_next_key(map1_fd, &key, &next_key) == 0) {
949 err = bpf_map_lookup_elem(map2_fd, &next_key, val_buf);
/*
 * For every key found in smap_fd, fetch the value stored under that key in
 * both smap_fd and amap_fd and compare the two values byte by byte over
 * stack_trace_len bytes. Two heap buffers of stack_trace_len bytes hold the
 * values being compared. Callers treat a non-zero return as a mismatch.
 */
961 static int compare_stack_ips(int smap_fd, int amap_fd, int stack_trace_len)
963 __u32 key, next_key, *cur_key_p, *next_key_p;
964 char *val_buf1, *val_buf2;
967 val_buf1 = malloc(stack_trace_len);
968 val_buf2 = malloc(stack_trace_len);
971 while (bpf_map_get_next_key(smap_fd, cur_key_p, next_key_p) == 0) {
972 err = bpf_map_lookup_elem(smap_fd, next_key_p, val_buf1);
975 err = bpf_map_lookup_elem(amap_fd, next_key_p, val_buf2);
978 for (i = 0; i < stack_trace_len; i++) {
979 if (val_buf1[i] != val_buf2[i]) {
986 next_key_p = &next_key;
/*
 * Attach ./test_stacktrace_map.o (BPF_PROG_TYPE_TRACEPOINT) to the
 * sched/sched_switch tracepoint through a perf event on CPU 0, let it
 * collect stack traces, then stop collection via "control_map" and check
 * that the maps agree:
 *  - every key of "stackid_hmap" exists in "stackmap" and the reverse;
 *  - the values in "stackmap" and "stack_amap" are byte-identical over
 *    PERF_MAX_STACK_DEPTH * sizeof(__u64) bytes.
 * The perf event is disabled and the object closed at the end.
 */
997 static void test_stacktrace_map()
999 int control_map_fd, stackid_hmap_fd, stackmap_fd, stack_amap_fd;
1000 const char *file = "./test_stacktrace_map.o";
1001 int bytes, efd, err, pmu_fd, prog_fd, stack_trace_len;
1002 struct perf_event_attr attr = {};
1003 __u32 key, val, duration = 0;
1004 struct bpf_object *obj;
1007 err = bpf_prog_load(file, BPF_PROG_TYPE_TRACEPOINT, &obj, &prog_fd);
1008 if (CHECK(err, "prog_load", "err %d errno %d\n", err, errno))
1011 /* Get the ID for the sched/sched_switch tracepoint */
1012 snprintf(buf, sizeof(buf),
1013 "/sys/kernel/debug/tracing/events/sched/sched_switch/id");
1014 efd = open(buf, O_RDONLY, 0);
1015 if (CHECK(efd < 0, "open", "err %d errno %d\n", efd, errno))
1018 bytes = read(efd, buf, sizeof(buf));
1020 if (bytes <= 0 || bytes >= sizeof(buf))
1023 /* Open the perf event and attach bpf program */
1024 attr.config = strtol(buf, NULL, 0);
1025 attr.type = PERF_TYPE_TRACEPOINT;
1026 attr.sample_type = PERF_SAMPLE_RAW | PERF_SAMPLE_CALLCHAIN;
1027 attr.sample_period = 1;
1028 attr.wakeup_events = 1;
1029 pmu_fd = syscall(__NR_perf_event_open, &attr, -1 /* pid */,
1030 0 /* cpu 0 */, -1 /* group id */,
1032 if (CHECK(pmu_fd < 0, "perf_event_open", "err %d errno %d\n",
1036 err = ioctl(pmu_fd, PERF_EVENT_IOC_ENABLE, 0);
1040 err = ioctl(pmu_fd, PERF_EVENT_IOC_SET_BPF, prog_fd);
1045 control_map_fd = bpf_find_map(__func__, obj, "control_map");
1046 if (control_map_fd < 0)
1049 stackid_hmap_fd = bpf_find_map(__func__, obj, "stackid_hmap");
1050 if (stackid_hmap_fd < 0)
1053 stackmap_fd = bpf_find_map(__func__, obj, "stackmap");
1054 if (stackmap_fd < 0)
1057 stack_amap_fd = bpf_find_map(__func__, obj, "stack_amap");
1058 if (stack_amap_fd < 0)
1061 /* give some time for bpf program run */
1064 /* disable stack trace collection */
1067 bpf_map_update_elem(control_map_fd, &key, &val, 0);
1069 /* for every element in stackid_hmap, we can find a corresponding one
1070 * in stackmap, and vise versa.
1072 err = compare_map_keys(stackid_hmap_fd, stackmap_fd);
1073 if (CHECK(err, "compare_map_keys stackid_hmap vs. stackmap",
1074 "err %d errno %d\n", err, errno))
1075 goto disable_pmu_noerr;
1077 err = compare_map_keys(stackmap_fd, stackid_hmap_fd);
1078 if (CHECK(err, "compare_map_keys stackmap vs. stackid_hmap",
1079 "err %d errno %d\n", err, errno))
1080 goto disable_pmu_noerr;
1082 stack_trace_len = PERF_MAX_STACK_DEPTH * sizeof(__u64);
1083 err = compare_stack_ips(stackmap_fd, stack_amap_fd, stack_trace_len);
1084 if (CHECK(err, "compare_stack_ips stackmap vs. stack_amap",
1085 "err %d errno %d\n", err, errno))
1086 goto disable_pmu_noerr;
1088 goto disable_pmu_noerr;
1092 ioctl(pmu_fd, PERF_EVENT_IOC_DISABLE);
1095 bpf_object__close(obj);
/*
 * Raw-tracepoint variant of test_stacktrace_map(): the same object file,
 * ./test_stacktrace_map.o, is loaded as BPF_PROG_TYPE_RAW_TRACEPOINT and
 * attached to "sched_switch" with bpf_raw_tracepoint_open() instead of a
 * perf event. After collection is stopped via "control_map", the keys of
 * "stackid_hmap" and "stackmap" are compared in both directions. Unlike
 * the perf-event variant, "stack_amap" is not looked up here.
 */
1098 static void test_stacktrace_map_raw_tp()
1100 int control_map_fd, stackid_hmap_fd, stackmap_fd;
1101 const char *file = "./test_stacktrace_map.o";
1102 int efd, err, prog_fd;
1103 __u32 key, val, duration = 0;
1104 struct bpf_object *obj;
1106 err = bpf_prog_load(file, BPF_PROG_TYPE_RAW_TRACEPOINT, &obj, &prog_fd);
1107 if (CHECK(err, "prog_load raw tp", "err %d errno %d\n", err, errno))
1110 efd = bpf_raw_tracepoint_open("sched_switch", prog_fd);
1111 if (CHECK(efd < 0, "raw_tp_open", "err %d errno %d\n", efd, errno))
1115 control_map_fd = bpf_find_map(__func__, obj, "control_map");
1116 if (control_map_fd < 0)
1119 stackid_hmap_fd = bpf_find_map(__func__, obj, "stackid_hmap");
1120 if (stackid_hmap_fd < 0)
1123 stackmap_fd = bpf_find_map(__func__, obj, "stackmap");
1124 if (stackmap_fd < 0)
1127 /* give some time for bpf program run */
1130 /* disable stack trace collection */
1133 bpf_map_update_elem(control_map_fd, &key, &val, 0);
1135 /* for every element in stackid_hmap, we can find a corresponding one
1136 * in stackmap, and vise versa.
1138 err = compare_map_keys(stackid_hmap_fd, stackmap_fd);
1139 if (CHECK(err, "compare_map_keys stackid_hmap vs. stackmap",
1140 "err %d errno %d\n", err, errno))
1143 err = compare_map_keys(stackmap_fd, stackid_hmap_fd);
1144 if (CHECK(err, "compare_map_keys stackmap vs. stackid_hmap",
1145 "err %d errno %d\n", err, errno))
1148 goto close_prog_noerr;
1152 bpf_object__close(obj);
/*
 * Obtain the "Build ID" line that readelf prints for ./urandom_read: the
 * pipeline is run with popen(), its first output line is read with
 * getline(), and `len` bytes of that line are copied into build_id,
 * followed by a terminating NUL at build_id[len].
 *
 * NOTE(review): getline() stores the allocated buffer capacity in `len`,
 * not the number of characters read (that is its return value), so `len`
 * is not the string length here - confirm what is meant to be copied.
 * NOTE(review): the NUL is written at index `len`; verify that `len` is
 * clamped to at most size - 1 beforehand, otherwise this writes one byte
 * past a `size`-byte buffer.
 */
1155 static int extract_build_id(char *build_id, size_t size)
1161 fp = popen("readelf -n ./urandom_read | grep 'Build ID'", "r");
1165 if (getline(&line, &len, fp) == -1)
1171 memcpy(build_id, line, len);
1172 build_id[len] = '\0';
/*
 * Attach ./test_stacktrace_build_id.o (BPF_PROG_TYPE_TRACEPOINT) to the
 * random/urandom_read tracepoint through a perf event on CPU 0, trigger
 * the tracepoint by running dd on /dev/urandom and ./urandom_read, then
 * stop collection via "control_map" and verify:
 *  - "stackid_hmap" and "stackmap" contain the same keys;
 *  - at least one stack entry in "stackmap" carries a valid build id whose
 *    hex form occurs in the readelf output for ./urandom_read;
 *  - "stackmap" and "stack_amap" values are byte-identical.
 * When no matching build id is found and `retry` is still non-zero, the
 * perf event is disabled, the object closed and a WARN line printed before
 * the test is attempted again.
 *
 * NOTE(review): the four "bpf_find_map ..." CHECKs print `err`, which at
 * that point still holds the result of the preceding ioctl rather than the
 * failing map descriptor.
 */
1179 static void test_stacktrace_build_id(void)
1181 int control_map_fd, stackid_hmap_fd, stackmap_fd, stack_amap_fd;
1182 const char *file = "./test_stacktrace_build_id.o";
1183 int bytes, efd, err, pmu_fd, prog_fd, stack_trace_len;
1184 struct perf_event_attr attr = {};
1185 __u32 key, previous_key, val, duration = 0;
1186 struct bpf_object *obj;
1189 struct bpf_stack_build_id id_offs[PERF_MAX_STACK_DEPTH];
1190 int build_id_matches = 0;
1194 err = bpf_prog_load(file, BPF_PROG_TYPE_TRACEPOINT, &obj, &prog_fd);
1195 if (CHECK(err, "prog_load", "err %d errno %d\n", err, errno))
1198 /* Get the ID for the random/urandom_read tracepoint */
1199 snprintf(buf, sizeof(buf),
1200 "/sys/kernel/debug/tracing/events/random/urandom_read/id");
1201 efd = open(buf, O_RDONLY, 0);
1202 if (CHECK(efd < 0, "open", "err %d errno %d\n", efd, errno))
1205 bytes = read(efd, buf, sizeof(buf));
1207 if (CHECK(bytes <= 0 || bytes >= sizeof(buf),
1208 "read", "bytes %d errno %d\n", bytes, errno))
1211 /* Open the perf event and attach bpf program */
1212 attr.config = strtol(buf, NULL, 0);
1213 attr.type = PERF_TYPE_TRACEPOINT;
1214 attr.sample_type = PERF_SAMPLE_RAW | PERF_SAMPLE_CALLCHAIN;
1215 attr.sample_period = 1;
1216 attr.wakeup_events = 1;
1217 pmu_fd = syscall(__NR_perf_event_open, &attr, -1 /* pid */,
1218 0 /* cpu 0 */, -1 /* group id */,
1220 if (CHECK(pmu_fd < 0, "perf_event_open", "err %d errno %d\n",
1224 err = ioctl(pmu_fd, PERF_EVENT_IOC_ENABLE, 0);
1225 if (CHECK(err, "perf_event_ioc_enable", "err %d errno %d\n",
1229 err = ioctl(pmu_fd, PERF_EVENT_IOC_SET_BPF, prog_fd);
1230 if (CHECK(err, "perf_event_ioc_set_bpf", "err %d errno %d\n",
1235 control_map_fd = bpf_find_map(__func__, obj, "control_map");
1236 if (CHECK(control_map_fd < 0, "bpf_find_map control_map",
1237 "err %d errno %d\n", err, errno))
1240 stackid_hmap_fd = bpf_find_map(__func__, obj, "stackid_hmap");
1241 if (CHECK(stackid_hmap_fd < 0, "bpf_find_map stackid_hmap",
1242 "err %d errno %d\n", err, errno))
1245 stackmap_fd = bpf_find_map(__func__, obj, "stackmap");
1246 if (CHECK(stackmap_fd < 0, "bpf_find_map stackmap", "err %d errno %d\n",
1250 stack_amap_fd = bpf_find_map(__func__, obj, "stack_amap");
1251 if (CHECK(stack_amap_fd < 0, "bpf_find_map stack_amap",
1252 "err %d errno %d\n", err, errno))
1255 assert(system("dd if=/dev/urandom of=/dev/zero count=4 2> /dev/null")
1257 assert(system("./urandom_read") == 0);
1258 /* disable stack trace collection */
1261 bpf_map_update_elem(control_map_fd, &key, &val, 0);
1263 /* for every element in stackid_hmap, we can find a corresponding one
1264 * in stackmap, and vise versa.
1266 err = compare_map_keys(stackid_hmap_fd, stackmap_fd);
1267 if (CHECK(err, "compare_map_keys stackid_hmap vs. stackmap",
1268 "err %d errno %d\n", err, errno))
1271 err = compare_map_keys(stackmap_fd, stackid_hmap_fd);
1272 if (CHECK(err, "compare_map_keys stackmap vs. stackid_hmap",
1273 "err %d errno %d\n", err, errno))
1276 err = extract_build_id(buf, 256);
1278 if (CHECK(err, "get build_id with readelf",
1279 "err %d errno %d\n", err, errno))
1282 err = bpf_map_get_next_key(stackmap_fd, NULL, &key);
1283 if (CHECK(err, "get_next_key from stackmap",
1284 "err %d, errno %d\n", err, errno))
1290 err = bpf_map_lookup_elem(stackmap_fd, &key, id_offs);
1291 if (CHECK(err, "lookup_elem from stackmap",
1292 "err %d, errno %d\n", err, errno))
1294 for (i = 0; i < PERF_MAX_STACK_DEPTH; ++i)
1295 if (id_offs[i].status == BPF_STACK_BUILD_ID_VALID &&
1296 id_offs[i].offset != 0) {
1297 for (j = 0; j < 20; ++j)
1298 sprintf(build_id + 2 * j, "%02x",
1299 id_offs[i].build_id[j] & 0xff);
1300 if (strstr(buf, build_id) != NULL)
1301 build_id_matches = 1;
1304 } while (bpf_map_get_next_key(stackmap_fd, &previous_key, &key) == 0);
1306 /* stack_map_get_build_id_offset() is racy and sometimes can return
1307 * BPF_STACK_BUILD_ID_IP instead of BPF_STACK_BUILD_ID_VALID;
1308 * try it one more time.
1310 if (build_id_matches < 1 && retry--) {
1311 ioctl(pmu_fd, PERF_EVENT_IOC_DISABLE);
1313 bpf_object__close(obj);
1314 printf("%s:WARN:Didn't find expected build ID from the map, retrying\n",
1319 if (CHECK(build_id_matches < 1, "build id match",
1320 "Didn't find expected build ID from the map\n"))
1323 stack_trace_len = PERF_MAX_STACK_DEPTH
1324 * sizeof(struct bpf_stack_build_id);
1325 err = compare_stack_ips(stackmap_fd, stack_amap_fd, stack_trace_len);
1326 CHECK(err, "compare_stack_ips stackmap vs. stack_amap",
1327 "err %d errno %d\n", err, errno);
1330 ioctl(pmu_fd, PERF_EVENT_IOC_DISABLE);
1336 bpf_object__close(obj);
1342 static void test_stacktrace_build_id_nmi(void)
1344 int control_map_fd, stackid_hmap_fd, stackmap_fd, stack_amap_fd;
1345 const char *file = "./test_stacktrace_build_id.o";
1346 int err, pmu_fd, prog_fd;
1347 struct perf_event_attr attr = {
1348 .sample_freq = 5000,
1350 .type = PERF_TYPE_HARDWARE,
1351 .config = PERF_COUNT_HW_CPU_CYCLES,
1353 __u32 key, previous_key, val, duration = 0;
1354 struct bpf_object *obj;
1357 struct bpf_stack_build_id id_offs[PERF_MAX_STACK_DEPTH];
1358 int build_id_matches = 0;
1362 err = bpf_prog_load(file, BPF_PROG_TYPE_PERF_EVENT, &obj, &prog_fd);
1363 if (CHECK(err, "prog_load", "err %d errno %d\n", err, errno))
1366 pmu_fd = syscall(__NR_perf_event_open, &attr, -1 /* pid */,
1367 0 /* cpu 0 */, -1 /* group id */,
1369 if (CHECK(pmu_fd < 0, "perf_event_open",
1370 "err %d errno %d. Does the test host support PERF_COUNT_HW_CPU_CYCLES?\n",
1374 err = ioctl(pmu_fd, PERF_EVENT_IOC_ENABLE, 0);
1375 if (CHECK(err, "perf_event_ioc_enable", "err %d errno %d\n",
1379 err = ioctl(pmu_fd, PERF_EVENT_IOC_SET_BPF, prog_fd);
1380 if (CHECK(err, "perf_event_ioc_set_bpf", "err %d errno %d\n",
1385 control_map_fd = bpf_find_map(__func__, obj, "control_map");
1386 if (CHECK(control_map_fd < 0, "bpf_find_map control_map",
1387 "err %d errno %d\n", err, errno))
1390 stackid_hmap_fd = bpf_find_map(__func__, obj, "stackid_hmap");
1391 if (CHECK(stackid_hmap_fd < 0, "bpf_find_map stackid_hmap",
1392 "err %d errno %d\n", err, errno))
1395 stackmap_fd = bpf_find_map(__func__, obj, "stackmap");
1396 if (CHECK(stackmap_fd < 0, "bpf_find_map stackmap", "err %d errno %d\n",
1400 stack_amap_fd = bpf_find_map(__func__, obj, "stack_amap");
1401 if (CHECK(stack_amap_fd < 0, "bpf_find_map stack_amap",
1402 "err %d errno %d\n", err, errno))
1405 assert(system("dd if=/dev/urandom of=/dev/zero count=4 2> /dev/null")
1407 assert(system("taskset 0x1 ./urandom_read 100000") == 0);
1408 /* disable stack trace collection */
1411 bpf_map_update_elem(control_map_fd, &key, &val, 0);
1413 /* for every element in stackid_hmap, we can find a corresponding one
1414 * in stackmap, and vise versa.
1416 err = compare_map_keys(stackid_hmap_fd, stackmap_fd);
1417 if (CHECK(err, "compare_map_keys stackid_hmap vs. stackmap",
1418 "err %d errno %d\n", err, errno))
1421 err = compare_map_keys(stackmap_fd, stackid_hmap_fd);
1422 if (CHECK(err, "compare_map_keys stackmap vs. stackid_hmap",
1423 "err %d errno %d\n", err, errno))
1426 err = extract_build_id(buf, 256);
1428 if (CHECK(err, "get build_id with readelf",
1429 "err %d errno %d\n", err, errno))
1432 err = bpf_map_get_next_key(stackmap_fd, NULL, &key);
1433 if (CHECK(err, "get_next_key from stackmap",
1434 "err %d, errno %d\n", err, errno))
1440 err = bpf_map_lookup_elem(stackmap_fd, &key, id_offs);
1441 if (CHECK(err, "lookup_elem from stackmap",
1442 "err %d, errno %d\n", err, errno))
1444 for (i = 0; i < PERF_MAX_STACK_DEPTH; ++i)
1445 if (id_offs[i].status == BPF_STACK_BUILD_ID_VALID &&
1446 id_offs[i].offset != 0) {
1447 for (j = 0; j < 20; ++j)
1448 sprintf(build_id + 2 * j, "%02x",
1449 id_offs[i].build_id[j] & 0xff);
1450 if (strstr(buf, build_id) != NULL)
1451 build_id_matches = 1;
1454 } while (bpf_map_get_next_key(stackmap_fd, &previous_key, &key) == 0);
1456 /* stack_map_get_build_id_offset() is racy and sometimes can return
1457 * BPF_STACK_BUILD_ID_IP instead of BPF_STACK_BUILD_ID_VALID;
1458 * try it one more time.
1460 if (build_id_matches < 1 && retry--) {
1461 ioctl(pmu_fd, PERF_EVENT_IOC_DISABLE);
1463 bpf_object__close(obj);
1464 printf("%s:WARN:Didn't find expected build ID from the map, retrying\n",
1469 if (CHECK(build_id_matches < 1, "build id match",
1470 "Didn't find expected build ID from the map\n"))
1474 * We intentionally skip compare_stack_ips(). This is because we
1475 * only support one in_nmi() ips-to-build_id translation per cpu
1476 * at any time, thus stack_amap here will always fallback to
1477 * BPF_STACK_BUILD_ID_IP;
1481 ioctl(pmu_fd, PERF_EVENT_IOC_DISABLE);
1487 bpf_object__close(obj);
1490 #define MAX_CNT_RAWTP 10ull
1491 #define MAX_STACK_RAWTP 100
1492 struct get_stack_trace_t {
1494 int kern_stack_size;
1495 int user_stack_size;
1496 int user_stack_buildid_size;
1497 __u64 kern_stack[MAX_STACK_RAWTP];
1498 __u64 user_stack[MAX_STACK_RAWTP];
1499 struct bpf_stack_build_id user_stack_buildid[MAX_STACK_RAWTP];
1502 static int get_stack_print_output(void *data, int size)
1504 bool good_kern_stack = false, good_user_stack = false;
1505 const char *nonjit_func = "___bpf_prog_run";
1506 struct get_stack_trace_t *e = data;
1513 if (size < sizeof(struct get_stack_trace_t)) {
1514 __u64 *raw_data = data;
1517 num_stack = size / sizeof(__u64);
1518 /* If jit is enabled, we do not have a good way to
1519 * verify the sanity of the kernel stack. So we
1520 * just assume it is good if the stack is not empty.
1521 * This could be improved in the future.
1524 found = num_stack > 0;
1526 for (i = 0; i < num_stack; i++) {
1527 ks = ksym_search(raw_data[i]);
1528 if (strcmp(ks->name, nonjit_func) == 0) {
1535 good_kern_stack = true;
1536 good_user_stack = true;
1539 num_stack = e->kern_stack_size / sizeof(__u64);
1541 good_kern_stack = num_stack > 0;
1543 for (i = 0; i < num_stack; i++) {
1544 ks = ksym_search(e->kern_stack[i]);
1545 if (strcmp(ks->name, nonjit_func) == 0) {
1546 good_kern_stack = true;
1551 if (e->user_stack_size > 0 && e->user_stack_buildid_size > 0)
1552 good_user_stack = true;
1554 if (!good_kern_stack || !good_user_stack)
1555 return LIBBPF_PERF_EVENT_ERROR;
1557 if (cnt == MAX_CNT_RAWTP)
1558 return LIBBPF_PERF_EVENT_DONE;
1560 return LIBBPF_PERF_EVENT_CONT;
1563 static void test_get_stack_raw_tp(void)
1565 const char *file = "./test_get_stack_rawtp.o";
1566 int i, efd, err, prog_fd, pmu_fd, perfmap_fd;
1567 struct perf_event_attr attr = {};
1568 struct timespec tv = {0, 10};
1569 __u32 key = 0, duration = 0;
1570 struct bpf_object *obj;
1572 err = bpf_prog_load(file, BPF_PROG_TYPE_RAW_TRACEPOINT, &obj, &prog_fd);
1573 if (CHECK(err, "prog_load raw tp", "err %d errno %d\n", err, errno))
1576 efd = bpf_raw_tracepoint_open("sys_enter", prog_fd);
1577 if (CHECK(efd < 0, "raw_tp_open", "err %d errno %d\n", efd, errno))
1580 perfmap_fd = bpf_find_map(__func__, obj, "perfmap");
1581 if (CHECK(perfmap_fd < 0, "bpf_find_map", "err %d errno %d\n",
1585 err = load_kallsyms();
1586 if (CHECK(err < 0, "load_kallsyms", "err %d errno %d\n", err, errno))
1589 attr.sample_type = PERF_SAMPLE_RAW;
1590 attr.type = PERF_TYPE_SOFTWARE;
1591 attr.config = PERF_COUNT_SW_BPF_OUTPUT;
1592 pmu_fd = syscall(__NR_perf_event_open, &attr, getpid()/*pid*/, -1/*cpu*/,
1594 if (CHECK(pmu_fd < 0, "perf_event_open", "err %d errno %d\n", pmu_fd,
1598 err = bpf_map_update_elem(perfmap_fd, &key, &pmu_fd, BPF_ANY);
1599 if (CHECK(err < 0, "bpf_map_update_elem", "err %d errno %d\n", err,
1603 err = ioctl(pmu_fd, PERF_EVENT_IOC_ENABLE, 0);
1604 if (CHECK(err < 0, "ioctl PERF_EVENT_IOC_ENABLE", "err %d errno %d\n",
1608 err = perf_event_mmap(pmu_fd);
1609 if (CHECK(err < 0, "perf_event_mmap", "err %d errno %d\n", err, errno))
1612 /* trigger some syscall action */
1613 for (i = 0; i < MAX_CNT_RAWTP; i++)
1614 nanosleep(&tv, NULL);
1616 err = perf_event_poller(pmu_fd, get_stack_print_output);
1617 if (CHECK(err < 0, "perf_event_poller", "err %d errno %d\n", err, errno))
1620 goto close_prog_noerr;
1624 bpf_object__close(obj);
1627 static void test_task_fd_query_rawtp(void)
1629 const char *file = "./test_get_stack_rawtp.o";
1630 __u64 probe_offset, probe_addr;
1631 __u32 len, prog_id, fd_type;
1632 struct bpf_object *obj;
1633 int efd, err, prog_fd;
1637 err = bpf_prog_load(file, BPF_PROG_TYPE_RAW_TRACEPOINT, &obj, &prog_fd);
1638 if (CHECK(err, "prog_load raw tp", "err %d errno %d\n", err, errno))
1641 efd = bpf_raw_tracepoint_open("sys_enter", prog_fd);
1642 if (CHECK(efd < 0, "raw_tp_open", "err %d errno %d\n", efd, errno))
1645 /* query (getpid(), efd) */
1647 err = bpf_task_fd_query(getpid(), efd, 0, buf, &len, &prog_id,
1648 &fd_type, &probe_offset, &probe_addr);
1649 if (CHECK(err < 0, "bpf_task_fd_query", "err %d errno %d\n", err,
1653 err = fd_type == BPF_FD_TYPE_RAW_TRACEPOINT &&
1654 strcmp(buf, "sys_enter") == 0;
1655 if (CHECK(!err, "check_results", "fd_type %d tp_name %s\n",
1661 err = bpf_task_fd_query(getpid(), efd, 0, buf, &len, &prog_id,
1662 &fd_type, &probe_offset, &probe_addr);
1663 if (CHECK(err < 0, "bpf_task_fd_query (len = 0)", "err %d errno %d\n",
1666 err = fd_type == BPF_FD_TYPE_RAW_TRACEPOINT &&
1667 len == strlen("sys_enter");
1668 if (CHECK(!err, "check_results", "fd_type %d len %u\n", fd_type, len))
1671 /* test empty buffer */
1673 err = bpf_task_fd_query(getpid(), efd, 0, 0, &len, &prog_id,
1674 &fd_type, &probe_offset, &probe_addr);
1675 if (CHECK(err < 0, "bpf_task_fd_query (buf = 0)", "err %d errno %d\n",
1678 err = fd_type == BPF_FD_TYPE_RAW_TRACEPOINT &&
1679 len == strlen("sys_enter");
1680 if (CHECK(!err, "check_results", "fd_type %d len %u\n", fd_type, len))
1683 /* test smaller buffer */
1685 err = bpf_task_fd_query(getpid(), efd, 0, buf, &len, &prog_id,
1686 &fd_type, &probe_offset, &probe_addr);
1687 if (CHECK(err >= 0 || errno != ENOSPC, "bpf_task_fd_query (len = 3)",
1688 "err %d errno %d\n", err, errno))
1690 err = fd_type == BPF_FD_TYPE_RAW_TRACEPOINT &&
1691 len == strlen("sys_enter") &&
1692 strcmp(buf, "sy") == 0;
1693 if (CHECK(!err, "check_results", "fd_type %d len %u\n", fd_type, len))
1696 goto close_prog_noerr;
1700 bpf_object__close(obj);
1703 static void test_task_fd_query_tp_core(const char *probe_name,
1704 const char *tp_name)
1706 const char *file = "./test_tracepoint.o";
1707 int err, bytes, efd, prog_fd, pmu_fd;
1708 struct perf_event_attr attr = {};
1709 __u64 probe_offset, probe_addr;
1710 __u32 len, prog_id, fd_type;
1711 struct bpf_object *obj;
1715 err = bpf_prog_load(file, BPF_PROG_TYPE_TRACEPOINT, &obj, &prog_fd);
1716 if (CHECK(err, "bpf_prog_load", "err %d errno %d\n", err, errno))
1719 snprintf(buf, sizeof(buf),
1720 "/sys/kernel/debug/tracing/events/%s/id", probe_name);
1721 efd = open(buf, O_RDONLY, 0);
1722 if (CHECK(efd < 0, "open", "err %d errno %d\n", efd, errno))
1724 bytes = read(efd, buf, sizeof(buf));
1726 if (CHECK(bytes <= 0 || bytes >= sizeof(buf), "read",
1727 "bytes %d errno %d\n", bytes, errno))
1730 attr.config = strtol(buf, NULL, 0);
1731 attr.type = PERF_TYPE_TRACEPOINT;
1732 attr.sample_type = PERF_SAMPLE_RAW;
1733 attr.sample_period = 1;
1734 attr.wakeup_events = 1;
1735 pmu_fd = syscall(__NR_perf_event_open, &attr, -1 /* pid */,
1736 0 /* cpu 0 */, -1 /* group id */,
1738 if (CHECK(err, "perf_event_open", "err %d errno %d\n", err, errno))
1741 err = ioctl(pmu_fd, PERF_EVENT_IOC_ENABLE, 0);
1742 if (CHECK(err, "perf_event_ioc_enable", "err %d errno %d\n", err,
1746 err = ioctl(pmu_fd, PERF_EVENT_IOC_SET_BPF, prog_fd);
1747 if (CHECK(err, "perf_event_ioc_set_bpf", "err %d errno %d\n", err,
1751 /* query (getpid(), pmu_fd) */
1753 err = bpf_task_fd_query(getpid(), pmu_fd, 0, buf, &len, &prog_id,
1754 &fd_type, &probe_offset, &probe_addr);
1755 if (CHECK(err < 0, "bpf_task_fd_query", "err %d errno %d\n", err,
1759 err = (fd_type == BPF_FD_TYPE_TRACEPOINT) && !strcmp(buf, tp_name);
1760 if (CHECK(!err, "check_results", "fd_type %d tp_name %s\n",
1765 goto close_prog_noerr;
1772 bpf_object__close(obj);
/* Run the tracepoint fd-query check for each tracepoint under test. */
static void test_task_fd_query_tp(void)
{
	/* { path below tracing/events, name the query should report } */
	static const struct {
		const char *probe_name;
		const char *tp_name;
	} cases[] = {
		{ "sched/sched_switch", "sched_switch" },
		{ "syscalls/sys_enter_read", "sys_enter_read" },
	};
	size_t idx;

	for (idx = 0; idx < sizeof(cases) / sizeof(cases[0]); idx++)
		test_task_fd_query_tp_core(cases[idx].probe_name,
					   cases[idx].tp_name);
}
1783 static void test_reference_tracking()
1785 const char *file = "./test_sk_lookup_kern.o";
1786 struct bpf_object *obj;
1787 struct bpf_program *prog;
1791 obj = bpf_object__open(file);
1797 bpf_object__for_each_program(prog, obj) {
1800 /* Ignore .text sections */
1801 title = bpf_program__title(prog, false);
1802 if (strstr(title, ".text") != NULL)
1805 bpf_program__set_type(prog, BPF_PROG_TYPE_SCHED_CLS);
1807 /* Expect verifier failure if test name has 'fail' */
1808 if (strstr(title, "fail") != NULL) {
1809 libbpf_set_print(NULL, NULL, NULL);
1810 err = !bpf_program__load(prog, "GPL", 0);
1811 libbpf_set_print(printf, printf, NULL);
1813 err = bpf_program__load(prog, "GPL", 0);
1815 CHECK(err, title, "\n");
1817 bpf_object__close(obj);
1825 static void test_queue_stack_map(int type)
1827 const int MAP_SIZE = 32;
1828 __u32 vals[MAP_SIZE], duration, retval, size, val;
1829 int i, err, prog_fd, map_in_fd, map_out_fd;
1830 char file[32], buf[128];
1831 struct bpf_object *obj;
1832 struct iphdr *iph = (void *)buf + sizeof(struct ethhdr);
1834 /* Fill test values to be used */
1835 for (i = 0; i < MAP_SIZE; i++)
1839 strncpy(file, "./test_queue_map.o", sizeof(file));
1840 else if (type == STACK)
1841 strncpy(file, "./test_stack_map.o", sizeof(file));
1845 err = bpf_prog_load(file, BPF_PROG_TYPE_SCHED_CLS, &obj, &prog_fd);
1851 map_in_fd = bpf_find_map(__func__, obj, "map_in");
1855 map_out_fd = bpf_find_map(__func__, obj, "map_out");
1859 /* Push 32 elements to the input map */
1860 for (i = 0; i < MAP_SIZE; i++) {
1861 err = bpf_map_update_elem(map_in_fd, NULL, &vals[i], 0);
1868 /* The eBPF program pushes iph.saddr in the output map,
1869 * pops the input map and saves this value in iph.daddr
1871 for (i = 0; i < MAP_SIZE; i++) {
1872 if (type == QUEUE) {
1874 pkt_v4.iph.saddr = vals[i] * 5;
1875 } else if (type == STACK) {
1876 val = vals[MAP_SIZE - 1 - i];
1877 pkt_v4.iph.saddr = vals[MAP_SIZE - 1 - i] * 5;
1880 err = bpf_prog_test_run(prog_fd, 1, &pkt_v4, sizeof(pkt_v4),
1881 buf, &size, &retval, &duration);
1882 if (err || retval || size != sizeof(pkt_v4) ||
1887 CHECK(err || retval || size != sizeof(pkt_v4) || iph->daddr != val,
1889 "err %d errno %d retval %d size %d iph->daddr %u\n",
1890 err, errno, retval, size, iph->daddr);
1892 /* Queue is empty, program should return TC_ACT_SHOT */
1893 err = bpf_prog_test_run(prog_fd, 1, &pkt_v4, sizeof(pkt_v4),
1894 buf, &size, &retval, &duration);
1895 CHECK(err || retval != 2 /* TC_ACT_SHOT */|| size != sizeof(pkt_v4),
1896 "check-queue-stack-map-empty",
1897 "err %d errno %d retval %d size %d\n",
1898 err, errno, retval, size);
1900 /* Check that the program pushed elements correctly */
1901 for (i = 0; i < MAP_SIZE; i++) {
1902 err = bpf_map_lookup_and_delete_elem(map_out_fd, NULL, &val);
1903 if (err || val != vals[i] * 5)
1907 CHECK(i != MAP_SIZE && (err || val != vals[i] * 5),
1908 "bpf_map_push_elem", "err %d value %u\n", err, val);
1911 pkt_v4.iph.saddr = 0;
1912 bpf_object__close(obj);
1919 jit_enabled = is_jit_enabled();
1922 test_prog_run_xattr();
1924 test_xdp_adjust_tail();
1926 test_xdp_noinline();
1929 test_pkt_md_access();
1931 test_tp_attach_query();
1932 test_stacktrace_map();
1933 test_stacktrace_build_id();
1934 test_stacktrace_build_id_nmi();
1935 test_stacktrace_map_raw_tp();
1936 test_get_stack_raw_tp();
1937 test_task_fd_query_rawtp();
1938 test_task_fd_query_tp();
1939 test_reference_tracking();
1940 test_queue_stack_map(QUEUE);
1941 test_queue_stack_map(STACK);
1943 printf("Summary: %d PASSED, %d FAILED\n", pass_cnt, error_cnt);
1944 return error_cnt ? EXIT_FAILURE : EXIT_SUCCESS;