1// SPDX-License-Identifier: (GPL-2.0-only OR BSD-2-Clause)
2/* Copyright (c) 2019 Netronome Systems, Inc. */
3
4#include <ctype.h>
5#include <errno.h>
6#include <fcntl.h>
7#include <string.h>
8#include <unistd.h>
9#include <net/if.h>
10#ifdef USE_LIBCAP
11#include <sys/capability.h>
12#endif
13#include <sys/utsname.h>
14#include <sys/vfs.h>
15
16#include <linux/filter.h>
17#include <linux/limits.h>
18
19#include <bpf/bpf.h>
20#include <bpf/libbpf.h>
21#include <zlib.h>
22
23#include "main.h"
24
25#ifndef PROC_SUPER_MAGIC
26# define PROC_SUPER_MAGIC	0x9fa0
27#endif
28
/* Which component the user asked to probe. */
enum probe_component {
	COMPONENT_UNSPEC = 0,	/* no explicit target given */
	COMPONENT_KERNEL = 1,	/* "kernel" keyword */
	COMPONENT_DEVICE = 2,	/* "dev <ifname>" keyword */
};
34
35#define BPF_HELPER_MAKE_ENTRY(name)	[BPF_FUNC_ ## name] = "bpf_" # name
36static const char * const helper_name[] = {
37	__BPF_FUNC_MAPPER(BPF_HELPER_MAKE_ENTRY)
38};
39
40#undef BPF_HELPER_MAKE_ENTRY
41
/* Set by the "full" keyword: also probe helpers skipped by default */
static bool full_mode = false;
#ifdef USE_LIBCAP
/* Set by the "unprivileged" keyword */
static bool run_as_unprivileged = false;
#endif
46
47/* Miscellaneous utility functions */
48
/* Return true when pattern occurs anywhere inside buffer. */
static bool grep(const char *buffer, const char *pattern)
{
	const char *hit = strstr(buffer, pattern);

	return hit != NULL;
}
53
54static bool check_procfs(void)
55{
56	struct statfs st_fs;
57
58	if (statfs("/proc", &st_fs) < 0)
59		return false;
60	if ((unsigned long)st_fs.f_type != PROC_SUPER_MAGIC)
61		return false;
62
63	return true;
64}
65
/* Convert str to upper case in place.
 *
 * At most len bytes are examined; conversion also stops at the first NUL.
 */
static void uppercase(char *str, size_t len)
{
	size_t i;

	/* toupper() is only defined for values representable as unsigned char
	 * (or EOF), so go through unsigned char to avoid passing a negative
	 * value when plain char is signed.
	 */
	for (i = 0; i < len && str[i] != '\0'; i++)
		str[i] = (char)toupper((unsigned char)str[i]);
}
73
74/* Printing utility functions */
75
76static void
77print_bool_feature(const char *feat_name, const char *plain_name,
78		   const char *define_name, bool res, const char *define_prefix)
79{
80	if (json_output)
81		jsonw_bool_field(json_wtr, feat_name, res);
82	else if (define_prefix)
83		printf("#define %s%sHAVE_%s\n", define_prefix,
84		       res ? "" : "NO_", define_name);
85	else
86		printf("%s is %savailable\n", plain_name, res ? "" : "NOT ");
87}
88
89static void print_kernel_option(const char *name, const char *value,
90				const char *define_prefix)
91{
92	char *endptr;
93	int res;
94
95	if (json_output) {
96		if (!value) {
97			jsonw_null_field(json_wtr, name);
98			return;
99		}
100		errno = 0;
101		res = strtol(value, &endptr, 0);
102		if (!errno && *endptr == '\n')
103			jsonw_int_field(json_wtr, name, res);
104		else
105			jsonw_string_field(json_wtr, name, value);
106	} else if (define_prefix) {
107		if (value)
108			printf("#define %s%s %s\n", define_prefix,
109			       name, value);
110		else
111			printf("/* %s%s is not set */\n", define_prefix, name);
112	} else {
113		if (value)
114			printf("%s is set to %s\n", name, value);
115		else
116			printf("%s is not set\n", name);
117	}
118}
119
120static void
121print_start_section(const char *json_title, const char *plain_title,
122		    const char *define_comment, const char *define_prefix)
123{
124	if (json_output) {
125		jsonw_name(json_wtr, json_title);
126		jsonw_start_object(json_wtr);
127	} else if (define_prefix) {
128		printf("%s\n", define_comment);
129	} else {
130		printf("%s\n", plain_title);
131	}
132}
133
134static void print_end_section(void)
135{
136	if (json_output)
137		jsonw_end_object(json_wtr);
138	else
139		printf("\n");
140}
141
142/* Probing functions */
143
144static int get_vendor_id(int ifindex)
145{
146	char ifname[IF_NAMESIZE], path[64], buf[8];
147	ssize_t len;
148	int fd;
149
150	if (!if_indextoname(ifindex, ifname))
151		return -1;
152
153	snprintf(path, sizeof(path), "/sys/class/net/%s/device/vendor", ifname);
154
155	fd = open(path, O_RDONLY | O_CLOEXEC);
156	if (fd < 0)
157		return -1;
158
159	len = read(fd, buf, sizeof(buf));
160	close(fd);
161	if (len < 0)
162		return -1;
163	if (len >= (ssize_t)sizeof(buf))
164		return -1;
165	buf[len] = '\0';
166
167	return strtol(buf, NULL, 0);
168}
169
/* Read a single decimal integer from the first line of the file at path.
 *
 * The line must consist of an integer (as accepted by strtol() in base 10)
 * immediately followed by a newline.
 *
 * Returns the parsed value, or -1 if the file cannot be opened or read, the
 * line holds no digits, has trailing characters, lacks the final newline,
 * overflows a long, or does not fit in the local buffer.
 */
static long read_procfs(const char *path)
{
	/* Ample room for any value that fits in a long, plus the newline.
	 * Using a stack buffer means no failure path can leak memory.
	 */
	char line[64], *endptr;
	FILE *fd;
	long res;

	fd = fopen(path, "r");
	if (!fd)
		return -1;

	if (!fgets(line, sizeof(line), fd)) {
		fclose(fd);
		return -1;
	}
	fclose(fd);

	errno = 0;
	res = strtol(line, &endptr, 10);
	/* endptr == line means no digits were consumed (e.g. a blank line) */
	if (errno || endptr == line || *endptr != '\n')
		return -1;

	return res;
}
194
195static void probe_unprivileged_disabled(void)
196{
197	long res;
198
199	/* No support for C-style ouptut */
200
201	res = read_procfs("/proc/sys/kernel/unprivileged_bpf_disabled");
202	if (json_output) {
203		jsonw_int_field(json_wtr, "unprivileged_bpf_disabled", res);
204	} else {
205		switch (res) {
206		case 0:
207			printf("bpf() syscall for unprivileged users is enabled\n");
208			break;
209		case 1:
210			printf("bpf() syscall restricted to privileged users (without recovery)\n");
211			break;
212		case 2:
213			printf("bpf() syscall restricted to privileged users (admin can change)\n");
214			break;
215		case -1:
216			printf("Unable to retrieve required privileges for bpf() syscall\n");
217			break;
218		default:
219			printf("bpf() syscall restriction has unknown value %ld\n", res);
220		}
221	}
222}
223
224static void probe_jit_enable(void)
225{
226	long res;
227
228	/* No support for C-style ouptut */
229
230	res = read_procfs("/proc/sys/net/core/bpf_jit_enable");
231	if (json_output) {
232		jsonw_int_field(json_wtr, "bpf_jit_enable", res);
233	} else {
234		switch (res) {
235		case 0:
236			printf("JIT compiler is disabled\n");
237			break;
238		case 1:
239			printf("JIT compiler is enabled\n");
240			break;
241		case 2:
242			printf("JIT compiler is enabled with debugging traces in kernel logs\n");
243			break;
244		case -1:
245			printf("Unable to retrieve JIT-compiler status\n");
246			break;
247		default:
248			printf("JIT-compiler status has unknown value %ld\n",
249			       res);
250		}
251	}
252}
253
254static void probe_jit_harden(void)
255{
256	long res;
257
258	/* No support for C-style ouptut */
259
260	res = read_procfs("/proc/sys/net/core/bpf_jit_harden");
261	if (json_output) {
262		jsonw_int_field(json_wtr, "bpf_jit_harden", res);
263	} else {
264		switch (res) {
265		case 0:
266			printf("JIT compiler hardening is disabled\n");
267			break;
268		case 1:
269			printf("JIT compiler hardening is enabled for unprivileged users\n");
270			break;
271		case 2:
272			printf("JIT compiler hardening is enabled for all users\n");
273			break;
274		case -1:
275			printf("Unable to retrieve JIT hardening status\n");
276			break;
277		default:
278			printf("JIT hardening status has unknown value %ld\n",
279			       res);
280		}
281	}
282}
283
284static void probe_jit_kallsyms(void)
285{
286	long res;
287
288	/* No support for C-style ouptut */
289
290	res = read_procfs("/proc/sys/net/core/bpf_jit_kallsyms");
291	if (json_output) {
292		jsonw_int_field(json_wtr, "bpf_jit_kallsyms", res);
293	} else {
294		switch (res) {
295		case 0:
296			printf("JIT compiler kallsyms exports are disabled\n");
297			break;
298		case 1:
299			printf("JIT compiler kallsyms exports are enabled for root\n");
300			break;
301		case -1:
302			printf("Unable to retrieve JIT kallsyms export status\n");
303			break;
304		default:
305			printf("JIT kallsyms exports status has unknown value %ld\n", res);
306		}
307	}
308}
309
310static void probe_jit_limit(void)
311{
312	long res;
313
314	/* No support for C-style ouptut */
315
316	res = read_procfs("/proc/sys/net/core/bpf_jit_limit");
317	if (json_output) {
318		jsonw_int_field(json_wtr, "bpf_jit_limit", res);
319	} else {
320		switch (res) {
321		case -1:
322			printf("Unable to retrieve global memory limit for JIT compiler for unprivileged users\n");
323			break;
324		default:
325			printf("Global memory limit for JIT compiler for unprivileged users is %ld bytes\n", res);
326		}
327	}
328}
329
330static bool read_next_kernel_config_option(gzFile file, char *buf, size_t n,
331					   char **value)
332{
333	char *sep;
334
335	while (gzgets(file, buf, n)) {
336		if (strncmp(buf, "CONFIG_", 7))
337			continue;
338
339		sep = strchr(buf, '=');
340		if (!sep)
341			continue;
342
343		/* Trim ending '\n' */
344		buf[strlen(buf) - 1] = '\0';
345
346		/* Split on '=' and ensure that a value is present. */
347		*sep = '\0';
348		if (!sep[1])
349			continue;
350
351		*value = sep + 1;
352		return true;
353	}
354
355	return false;
356}
357
358static void probe_kernel_image_config(const char *define_prefix)
359{
360	static const struct {
361		const char * const name;
362		bool macro_dump;
363	} options[] = {
364		/* Enable BPF */
365		{ "CONFIG_BPF", },
366		/* Enable bpf() syscall */
367		{ "CONFIG_BPF_SYSCALL", },
368		/* Does selected architecture support eBPF JIT compiler */
369		{ "CONFIG_HAVE_EBPF_JIT", },
370		/* Compile eBPF JIT compiler */
371		{ "CONFIG_BPF_JIT", },
372		/* Avoid compiling eBPF interpreter (use JIT only) */
373		{ "CONFIG_BPF_JIT_ALWAYS_ON", },
374		/* Kernel BTF debug information available */
375		{ "CONFIG_DEBUG_INFO_BTF", },
376		/* Kernel module BTF debug information available */
377		{ "CONFIG_DEBUG_INFO_BTF_MODULES", },
378
379		/* cgroups */
380		{ "CONFIG_CGROUPS", },
381		/* BPF programs attached to cgroups */
382		{ "CONFIG_CGROUP_BPF", },
383		/* bpf_get_cgroup_classid() helper */
384		{ "CONFIG_CGROUP_NET_CLASSID", },
385		/* bpf_skb_{,ancestor_}cgroup_id() helpers */
386		{ "CONFIG_SOCK_CGROUP_DATA", },
387
388		/* Tracing: attach BPF to kprobes, tracepoints, etc. */
389		{ "CONFIG_BPF_EVENTS", },
390		/* Kprobes */
391		{ "CONFIG_KPROBE_EVENTS", },
392		/* Uprobes */
393		{ "CONFIG_UPROBE_EVENTS", },
394		/* Tracepoints */
395		{ "CONFIG_TRACING", },
396		/* Syscall tracepoints */
397		{ "CONFIG_FTRACE_SYSCALLS", },
398		/* bpf_override_return() helper support for selected arch */
399		{ "CONFIG_FUNCTION_ERROR_INJECTION", },
400		/* bpf_override_return() helper */
401		{ "CONFIG_BPF_KPROBE_OVERRIDE", },
402
403		/* Network */
404		{ "CONFIG_NET", },
405		/* AF_XDP sockets */
406		{ "CONFIG_XDP_SOCKETS", },
407		/* BPF_PROG_TYPE_LWT_* and related helpers */
408		{ "CONFIG_LWTUNNEL_BPF", },
409		/* BPF_PROG_TYPE_SCHED_ACT, TC (traffic control) actions */
410		{ "CONFIG_NET_ACT_BPF", },
411		/* BPF_PROG_TYPE_SCHED_CLS, TC filters */
412		{ "CONFIG_NET_CLS_BPF", },
413		/* TC clsact qdisc */
414		{ "CONFIG_NET_CLS_ACT", },
415		/* Ingress filtering with TC */
416		{ "CONFIG_NET_SCH_INGRESS", },
417		/* bpf_skb_get_xfrm_state() helper */
418		{ "CONFIG_XFRM", },
419		/* bpf_get_route_realm() helper */
420		{ "CONFIG_IP_ROUTE_CLASSID", },
421		/* BPF_PROG_TYPE_LWT_SEG6_LOCAL and related helpers */
422		{ "CONFIG_IPV6_SEG6_BPF", },
423		/* BPF_PROG_TYPE_LIRC_MODE2 and related helpers */
424		{ "CONFIG_BPF_LIRC_MODE2", },
425		/* BPF stream parser and BPF socket maps */
426		{ "CONFIG_BPF_STREAM_PARSER", },
427		/* xt_bpf module for passing BPF programs to netfilter  */
428		{ "CONFIG_NETFILTER_XT_MATCH_BPF", },
429
430		/* test_bpf module for BPF tests */
431		{ "CONFIG_TEST_BPF", },
432
433		/* Misc configs useful in BPF C programs */
434		/* jiffies <-> sec conversion for bpf_jiffies64() helper */
435		{ "CONFIG_HZ", true, }
436	};
437	char *values[ARRAY_SIZE(options)] = { };
438	struct utsname utsn;
439	char path[PATH_MAX];
440	gzFile file = NULL;
441	char buf[4096];
442	char *value;
443	size_t i;
444
445	if (!uname(&utsn)) {
446		snprintf(path, sizeof(path), "/boot/config-%s", utsn.release);
447
448		/* gzopen also accepts uncompressed files. */
449		file = gzopen(path, "r");
450	}
451
452	if (!file) {
453		/* Some distributions build with CONFIG_IKCONFIG=y and put the
454		 * config file at /proc/config.gz.
455		 */
456		file = gzopen("/proc/config.gz", "r");
457	}
458	if (!file) {
459		p_info("skipping kernel config, can't open file: %s",
460		       strerror(errno));
461		goto end_parse;
462	}
463	/* Sanity checks */
464	if (!gzgets(file, buf, sizeof(buf)) ||
465	    !gzgets(file, buf, sizeof(buf))) {
466		p_info("skipping kernel config, can't read from file: %s",
467		       strerror(errno));
468		goto end_parse;
469	}
470	if (strcmp(buf, "# Automatically generated file; DO NOT EDIT.\n")) {
471		p_info("skipping kernel config, can't find correct file");
472		goto end_parse;
473	}
474
475	while (read_next_kernel_config_option(file, buf, sizeof(buf), &value)) {
476		for (i = 0; i < ARRAY_SIZE(options); i++) {
477			if ((define_prefix && !options[i].macro_dump) ||
478			    values[i] || strcmp(buf, options[i].name))
479				continue;
480
481			values[i] = strdup(value);
482		}
483	}
484
485	for (i = 0; i < ARRAY_SIZE(options); i++) {
486		if (define_prefix && !options[i].macro_dump)
487			continue;
488		print_kernel_option(options[i].name, values[i], define_prefix);
489		free(values[i]);
490	}
491
492end_parse:
493	if (file)
494		gzclose(file);
495}
496
497static bool probe_bpf_syscall(const char *define_prefix)
498{
499	bool res;
500
501	bpf_prog_load(BPF_PROG_TYPE_UNSPEC, NULL, NULL, NULL, 0, NULL);
502	res = (errno != ENOSYS);
503
504	print_bool_feature("have_bpf_syscall",
505			   "bpf() syscall",
506			   "BPF_SYSCALL",
507			   res, define_prefix);
508
509	return res;
510}
511
512static bool
513probe_prog_load_ifindex(enum bpf_prog_type prog_type,
514			const struct bpf_insn *insns, size_t insns_cnt,
515			char *log_buf, size_t log_buf_sz,
516			__u32 ifindex)
517{
518	LIBBPF_OPTS(bpf_prog_load_opts, opts,
519		    .log_buf = log_buf,
520		    .log_size = log_buf_sz,
521		    .log_level = log_buf ? 1 : 0,
522		    .prog_ifindex = ifindex,
523		   );
524	int fd;
525
526	errno = 0;
527	fd = bpf_prog_load(prog_type, NULL, "GPL", insns, insns_cnt, &opts);
528	if (fd >= 0)
529		close(fd);
530
531	return fd >= 0 && errno != EINVAL && errno != EOPNOTSUPP;
532}
533
534static bool probe_prog_type_ifindex(enum bpf_prog_type prog_type, __u32 ifindex)
535{
536	/* nfp returns -EINVAL on exit(0) with TC offload */
537	struct bpf_insn insns[2] = {
538		BPF_MOV64_IMM(BPF_REG_0, 2),
539		BPF_EXIT_INSN()
540	};
541
542	return probe_prog_load_ifindex(prog_type, insns, ARRAY_SIZE(insns),
543				       NULL, 0, ifindex);
544}
545
546static void
547probe_prog_type(enum bpf_prog_type prog_type, const char *prog_type_str,
548		bool *supported_types, const char *define_prefix, __u32 ifindex)
549{
550	char feat_name[128], plain_desc[128], define_name[128];
551	const char *plain_comment = "eBPF program_type ";
552	size_t maxlen;
553	bool res;
554
555	if (ifindex) {
556		switch (prog_type) {
557		case BPF_PROG_TYPE_SCHED_CLS:
558		case BPF_PROG_TYPE_XDP:
559			break;
560		default:
561			return;
562		}
563
564		res = probe_prog_type_ifindex(prog_type, ifindex);
565	} else {
566		res = libbpf_probe_bpf_prog_type(prog_type, NULL) > 0;
567	}
568
569#ifdef USE_LIBCAP
570	/* Probe may succeed even if program load fails, for unprivileged users
571	 * check that we did not fail because of insufficient permissions
572	 */
573	if (run_as_unprivileged && errno == EPERM)
574		res = false;
575#endif
576
577	supported_types[prog_type] |= res;
578
579	maxlen = sizeof(plain_desc) - strlen(plain_comment) - 1;
580	if (strlen(prog_type_str) > maxlen) {
581		p_info("program type name too long");
582		return;
583	}
584
585	sprintf(feat_name, "have_%s_prog_type", prog_type_str);
586	sprintf(define_name, "%s_prog_type", prog_type_str);
587	uppercase(define_name, sizeof(define_name));
588	sprintf(plain_desc, "%s%s", plain_comment, prog_type_str);
589	print_bool_feature(feat_name, plain_desc, define_name, res,
590			   define_prefix);
591}
592
593static bool probe_map_type_ifindex(enum bpf_map_type map_type, __u32 ifindex)
594{
595	LIBBPF_OPTS(bpf_map_create_opts, opts);
596	int key_size, value_size, max_entries;
597	int fd;
598
599	opts.map_ifindex = ifindex;
600
601	key_size = sizeof(__u32);
602	value_size = sizeof(__u32);
603	max_entries = 1;
604
605	fd = bpf_map_create(map_type, NULL, key_size, value_size, max_entries,
606			    &opts);
607	if (fd >= 0)
608		close(fd);
609
610	return fd >= 0;
611}
612
613static void
614probe_map_type(enum bpf_map_type map_type, char const *map_type_str,
615	       const char *define_prefix, __u32 ifindex)
616{
617	char feat_name[128], plain_desc[128], define_name[128];
618	const char *plain_comment = "eBPF map_type ";
619	size_t maxlen;
620	bool res;
621
622	if (ifindex) {
623		switch (map_type) {
624		case BPF_MAP_TYPE_HASH:
625		case BPF_MAP_TYPE_ARRAY:
626			break;
627		default:
628			return;
629		}
630
631		res = probe_map_type_ifindex(map_type, ifindex);
632	} else {
633		res = libbpf_probe_bpf_map_type(map_type, NULL) > 0;
634	}
635
636	/* Probe result depends on the success of map creation, no additional
637	 * check required for unprivileged users
638	 */
639
640	maxlen = sizeof(plain_desc) - strlen(plain_comment) - 1;
641	if (strlen(map_type_str) > maxlen) {
642		p_info("map type name too long");
643		return;
644	}
645
646	sprintf(feat_name, "have_%s_map_type", map_type_str);
647	sprintf(define_name, "%s_map_type", map_type_str);
648	uppercase(define_name, sizeof(define_name));
649	sprintf(plain_desc, "%s%s", plain_comment, map_type_str);
650	print_bool_feature(feat_name, plain_desc, define_name, res,
651			   define_prefix);
652}
653
654static bool
655probe_helper_ifindex(enum bpf_func_id id, enum bpf_prog_type prog_type,
656		     __u32 ifindex)
657{
658	struct bpf_insn insns[2] = {
659		BPF_EMIT_CALL(id),
660		BPF_EXIT_INSN()
661	};
662	char buf[4096] = {};
663	bool res;
664
665	probe_prog_load_ifindex(prog_type, insns, ARRAY_SIZE(insns), buf,
666				sizeof(buf), ifindex);
667	res = !grep(buf, "invalid func ") && !grep(buf, "unknown func ");
668
669	switch (get_vendor_id(ifindex)) {
670	case 0x19ee: /* Netronome specific */
671		res = res && !grep(buf, "not supported by FW") &&
672			!grep(buf, "unsupported function id");
673		break;
674	default:
675		break;
676	}
677
678	return res;
679}
680
681static bool
682probe_helper_for_progtype(enum bpf_prog_type prog_type, bool supported_type,
683			  const char *define_prefix, unsigned int id,
684			  const char *ptype_name, __u32 ifindex)
685{
686	bool res = false;
687
688	if (supported_type) {
689		if (ifindex)
690			res = probe_helper_ifindex(id, prog_type, ifindex);
691		else
692			res = libbpf_probe_bpf_helper(prog_type, id, NULL) > 0;
693#ifdef USE_LIBCAP
694		/* Probe may succeed even if program load fails, for
695		 * unprivileged users check that we did not fail because of
696		 * insufficient permissions
697		 */
698		if (run_as_unprivileged && errno == EPERM)
699			res = false;
700#endif
701	}
702
703	if (json_output) {
704		if (res)
705			jsonw_string(json_wtr, helper_name[id]);
706	} else if (define_prefix) {
707		printf("#define %sBPF__PROG_TYPE_%s__HELPER_%s %s\n",
708		       define_prefix, ptype_name, helper_name[id],
709		       res ? "1" : "0");
710	} else {
711		if (res)
712			printf("\n\t- %s", helper_name[id]);
713	}
714
715	return res;
716}
717
718static void
719probe_helpers_for_progtype(enum bpf_prog_type prog_type,
720			   const char *prog_type_str, bool supported_type,
721			   const char *define_prefix, __u32 ifindex)
722{
723	char feat_name[128];
724	unsigned int id;
725	bool probe_res = false;
726
727	if (ifindex)
728		/* Only test helpers for offload-able program types */
729		switch (prog_type) {
730		case BPF_PROG_TYPE_SCHED_CLS:
731		case BPF_PROG_TYPE_XDP:
732			break;
733		default:
734			return;
735		}
736
737	if (json_output) {
738		sprintf(feat_name, "%s_available_helpers", prog_type_str);
739		jsonw_name(json_wtr, feat_name);
740		jsonw_start_array(json_wtr);
741	} else if (!define_prefix) {
742		printf("eBPF helpers supported for program type %s:",
743		       prog_type_str);
744	}
745
746	for (id = 1; id < ARRAY_SIZE(helper_name); id++) {
747		/* Skip helper functions which emit dmesg messages when not in
748		 * the full mode.
749		 */
750		switch (id) {
751		case BPF_FUNC_trace_printk:
752		case BPF_FUNC_trace_vprintk:
753		case BPF_FUNC_probe_write_user:
754			if (!full_mode)
755				continue;
756			fallthrough;
757		default:
758			probe_res |= probe_helper_for_progtype(prog_type, supported_type,
759						  define_prefix, id, prog_type_str,
760						  ifindex);
761		}
762	}
763
764	if (json_output)
765		jsonw_end_array(json_wtr);
766	else if (!define_prefix) {
767		printf("\n");
768		if (!probe_res) {
769			if (!supported_type)
770				printf("\tProgram type not supported\n");
771			else
772				printf("\tCould not determine which helpers are available\n");
773		}
774	}
775
776
777}
778
779static void
780probe_misc_feature(struct bpf_insn *insns, size_t len,
781		   const char *define_prefix, __u32 ifindex,
782		   const char *feat_name, const char *plain_name,
783		   const char *define_name)
784{
785	LIBBPF_OPTS(bpf_prog_load_opts, opts,
786		.prog_ifindex = ifindex,
787	);
788	bool res;
789	int fd;
790
791	errno = 0;
792	fd = bpf_prog_load(BPF_PROG_TYPE_SOCKET_FILTER, NULL, "GPL",
793			   insns, len, &opts);
794	res = fd >= 0 || !errno;
795
796	if (fd >= 0)
797		close(fd);
798
799	print_bool_feature(feat_name, plain_name, define_name, res,
800			   define_prefix);
801}
802
803/*
804 * Probe for availability of kernel commit (5.3):
805 *
806 * c04c0d2b968a ("bpf: increase complexity limit and maximum program size")
807 */
808static void probe_large_insn_limit(const char *define_prefix, __u32 ifindex)
809{
810	struct bpf_insn insns[BPF_MAXINSNS + 1];
811	int i;
812
813	for (i = 0; i < BPF_MAXINSNS; i++)
814		insns[i] = BPF_MOV64_IMM(BPF_REG_0, 1);
815	insns[BPF_MAXINSNS] = BPF_EXIT_INSN();
816
817	probe_misc_feature(insns, ARRAY_SIZE(insns),
818			   define_prefix, ifindex,
819			   "have_large_insn_limit",
820			   "Large program size limit",
821			   "LARGE_INSN_LIMIT");
822}
823
824/*
825 * Probe for bounded loop support introduced in commit 2589726d12a1
826 * ("bpf: introduce bounded loops").
827 */
828static void
829probe_bounded_loops(const char *define_prefix, __u32 ifindex)
830{
831	struct bpf_insn insns[4] = {
832		BPF_MOV64_IMM(BPF_REG_0, 10),
833		BPF_ALU64_IMM(BPF_SUB, BPF_REG_0, 1),
834		BPF_JMP_IMM(BPF_JNE, BPF_REG_0, 0, -2),
835		BPF_EXIT_INSN()
836	};
837
838	probe_misc_feature(insns, ARRAY_SIZE(insns),
839			   define_prefix, ifindex,
840			   "have_bounded_loops",
841			   "Bounded loop support",
842			   "BOUNDED_LOOPS");
843}
844
845/*
846 * Probe for the v2 instruction set extension introduced in commit 92b31a9af73b
847 * ("bpf: add BPF_J{LT,LE,SLT,SLE} instructions").
848 */
849static void
850probe_v2_isa_extension(const char *define_prefix, __u32 ifindex)
851{
852	struct bpf_insn insns[4] = {
853		BPF_MOV64_IMM(BPF_REG_0, 0),
854		BPF_JMP_IMM(BPF_JLT, BPF_REG_0, 0, 1),
855		BPF_MOV64_IMM(BPF_REG_0, 1),
856		BPF_EXIT_INSN()
857	};
858
859	probe_misc_feature(insns, ARRAY_SIZE(insns),
860			   define_prefix, ifindex,
861			   "have_v2_isa_extension",
862			   "ISA extension v2",
863			   "V2_ISA_EXTENSION");
864}
865
866/*
867 * Probe for the v3 instruction set extension introduced in commit 092ed0968bb6
868 * ("bpf: verifier support JMP32").
869 */
870static void
871probe_v3_isa_extension(const char *define_prefix, __u32 ifindex)
872{
873	struct bpf_insn insns[4] = {
874		BPF_MOV64_IMM(BPF_REG_0, 0),
875		BPF_JMP32_IMM(BPF_JLT, BPF_REG_0, 0, 1),
876		BPF_MOV64_IMM(BPF_REG_0, 1),
877		BPF_EXIT_INSN()
878	};
879
880	probe_misc_feature(insns, ARRAY_SIZE(insns),
881			   define_prefix, ifindex,
882			   "have_v3_isa_extension",
883			   "ISA extension v3",
884			   "V3_ISA_EXTENSION");
885}
886
887static void
888section_system_config(enum probe_component target, const char *define_prefix)
889{
890	switch (target) {
891	case COMPONENT_KERNEL:
892	case COMPONENT_UNSPEC:
893		print_start_section("system_config",
894				    "Scanning system configuration...",
895				    "/*** Misc kernel config items ***/",
896				    define_prefix);
897		if (!define_prefix) {
898			if (check_procfs()) {
899				probe_unprivileged_disabled();
900				probe_jit_enable();
901				probe_jit_harden();
902				probe_jit_kallsyms();
903				probe_jit_limit();
904			} else {
905				p_info("/* procfs not mounted, skipping related probes */");
906			}
907		}
908		probe_kernel_image_config(define_prefix);
909		print_end_section();
910		break;
911	default:
912		break;
913	}
914}
915
/* Print the "syscall_config" section and return whether the bpf() system
 * call was found to be available.
 */
static bool section_syscall_config(const char *define_prefix)
{
	bool have_syscall;

	print_start_section("syscall_config",
			    "Scanning system call availability...",
			    "/*** System call availability ***/",
			    define_prefix);

	have_syscall = probe_bpf_syscall(define_prefix);

	print_end_section();

	return have_syscall;
}
929
930static void
931section_program_types(bool *supported_types, const char *define_prefix,
932		      __u32 ifindex)
933{
934	unsigned int prog_type = BPF_PROG_TYPE_UNSPEC;
935	const char *prog_type_str;
936
937	print_start_section("program_types",
938			    "Scanning eBPF program types...",
939			    "/*** eBPF program types ***/",
940			    define_prefix);
941
942	while (true) {
943		prog_type++;
944		prog_type_str = libbpf_bpf_prog_type_str(prog_type);
945		/* libbpf will return NULL for variants unknown to it. */
946		if (!prog_type_str)
947			break;
948
949		probe_prog_type(prog_type, prog_type_str, supported_types, define_prefix,
950				ifindex);
951	}
952
953	print_end_section();
954}
955
956static void section_map_types(const char *define_prefix, __u32 ifindex)
957{
958	unsigned int map_type = BPF_MAP_TYPE_UNSPEC;
959	const char *map_type_str;
960
961	print_start_section("map_types",
962			    "Scanning eBPF map types...",
963			    "/*** eBPF map types ***/",
964			    define_prefix);
965
966	while (true) {
967		map_type++;
968		map_type_str = libbpf_bpf_map_type_str(map_type);
969		/* libbpf will return NULL for variants unknown to it. */
970		if (!map_type_str)
971			break;
972
973		probe_map_type(map_type, map_type_str, define_prefix, ifindex);
974	}
975
976	print_end_section();
977}
978
979static void
980section_helpers(bool *supported_types, const char *define_prefix, __u32 ifindex)
981{
982	unsigned int prog_type = BPF_PROG_TYPE_UNSPEC;
983	const char *prog_type_str;
984
985	print_start_section("helpers",
986			    "Scanning eBPF helper functions...",
987			    "/*** eBPF helper functions ***/",
988			    define_prefix);
989
990	if (define_prefix)
991		printf("/*\n"
992		       " * Use %sHAVE_PROG_TYPE_HELPER(prog_type_name, helper_name)\n"
993		       " * to determine if <helper_name> is available for <prog_type_name>,\n"
994		       " * e.g.\n"
995		       " *	#if %sHAVE_PROG_TYPE_HELPER(xdp, bpf_redirect)\n"
996		       " *		// do stuff with this helper\n"
997		       " *	#elif\n"
998		       " *		// use a workaround\n"
999		       " *	#endif\n"
1000		       " */\n"
1001		       "#define %sHAVE_PROG_TYPE_HELPER(prog_type, helper)	\\\n"
1002		       "	%sBPF__PROG_TYPE_ ## prog_type ## __HELPER_ ## helper\n",
1003		       define_prefix, define_prefix, define_prefix,
1004		       define_prefix);
1005	while (true) {
1006		prog_type++;
1007		prog_type_str = libbpf_bpf_prog_type_str(prog_type);
1008		/* libbpf will return NULL for variants unknown to it. */
1009		if (!prog_type_str)
1010			break;
1011
1012		probe_helpers_for_progtype(prog_type, prog_type_str,
1013					   supported_types[prog_type],
1014					   define_prefix,
1015					   ifindex);
1016	}
1017
1018	print_end_section();
1019}
1020
1021static void section_misc(const char *define_prefix, __u32 ifindex)
1022{
1023	print_start_section("misc",
1024			    "Scanning miscellaneous eBPF features...",
1025			    "/*** eBPF misc features ***/",
1026			    define_prefix);
1027	probe_large_insn_limit(define_prefix, ifindex);
1028	probe_bounded_loops(define_prefix, ifindex);
1029	probe_v2_isa_extension(define_prefix, ifindex);
1030	probe_v3_isa_extension(define_prefix, ifindex);
1031	print_end_section();
1032}
1033
#ifdef USE_LIBCAP
/* Initializer for one bpf_caps[] entry: the capability value, an initially
 * cleared "set" flag, and the capability name as a string.
 */
#define capability(c) { c, false, #c }
/* Expands to two printf() arguments for entry i of a: the capability name
 * and a ", " separator when the capability is not set, two empty strings
 * when it is.
 */
#define capability_msg(a, i) a[i].set ? "" : a[i].name, a[i].set ? "" : ", "
#endif

/* Check that the process privileges match the requested probing mode.
 *
 * With libcap: a privileged run needs all the listed capabilities in the
 * effective set (only CAP_SYS_ADMIN when CAP_BPF is not supported); an
 * unprivileged run drops whichever of them are currently effective.
 * Without libcap: the effective user must be root.
 *
 * Returns 0 on success, -1 after reporting an error.
 */
static int handle_perms(void)
{
#ifdef USE_LIBCAP
	struct {
		cap_value_t cap;
		bool set;
		char name[14];	/* strlen("CAP_SYS_ADMIN") + 1 */
	} bpf_caps[] = {
		capability(CAP_SYS_ADMIN),
#ifdef CAP_BPF
		capability(CAP_BPF),
		capability(CAP_NET_ADMIN),
		capability(CAP_PERFMON),
#endif
	};
	cap_value_t held[ARRAY_SIZE(bpf_caps)];
	unsigned int i, nb_held = 0;
	bool sys_admin_only = true;
	cap_flag_value_t flag;
	int ret = -1;
	cap_t caps;

	caps = cap_get_proc();
	if (!caps) {
		p_err("failed to get capabilities for process: %s",
		      strerror(errno));
		return -1;
	}

#ifdef CAP_BPF
	if (CAP_IS_SUPPORTED(CAP_BPF))
		sys_admin_only = false;
#endif

	/* Collect the relevant capabilities currently in the effective set */
	for (i = 0; i < ARRAY_SIZE(bpf_caps); i++) {
		if (cap_get_flag(caps, bpf_caps[i].cap, CAP_EFFECTIVE, &flag)) {
			p_err("bug: failed to retrieve %s status: %s",
			      bpf_caps[i].name, strerror(errno));
			goto out_free;
		}

		if (flag == CAP_SET) {
			bpf_caps[i].set = true;
			held[nb_held++] = bpf_caps[i].cap;
		}

		/* System does not know about CAP_BPF, meaning that
		 * CAP_SYS_ADMIN is the only capability required. We
		 * just checked it, break.
		 */
		if (sys_admin_only)
			break;
	}

	if (!run_as_unprivileged) {
		if (nb_held == ARRAY_SIZE(bpf_caps) ||
		    (sys_admin_only && nb_held)) {
			/* We are all good, exit now */
			ret = 0;
			goto out_free;
		}

		if (sys_admin_only)
			p_err("missing %s, required for full feature probing; run as root or use 'unprivileged'",
			      bpf_caps[0].name);
		else
			p_err("missing %s%s%s%s%s%s%s%srequired for full feature probing; run as root or use 'unprivileged'",
			      capability_msg(bpf_caps, 0),
#ifdef CAP_BPF
			      capability_msg(bpf_caps, 1),
			      capability_msg(bpf_caps, 2),
			      capability_msg(bpf_caps, 3)
#else
				"", "", "", "", "", ""
#endif /* CAP_BPF */
				);
		goto out_free;
	}

	if (!nb_held) {
		/* Unprivileged run with nothing to drop: all good */
		ret = 0;
		goto out_free;
	}

	/* Unprivileged run with capabilities still effective: drop them. */
	if (cap_set_flag(caps, CAP_EFFECTIVE, nb_held, held, CAP_CLEAR)) {
		p_err("bug: failed to clear capabilities: %s", strerror(errno));
		goto out_free;
	}

	if (cap_set_proc(caps)) {
		p_err("failed to drop capabilities: %s", strerror(errno));
		goto out_free;
	}

	ret = 0;

out_free:
	/* Only report a cap_free() failure if nothing else went wrong */
	if (cap_free(caps) && !ret) {
		p_err("failed to clear storage object for capabilities: %s",
		      strerror(errno));
		ret = -1;
	}

	return ret;
#else
	/* Detection assumes user has specific privileges.
	 * We do not use libcap so let's approximate, and restrict usage to
	 * root user only.
	 */
	if (geteuid() != 0) {
		p_err("full feature probing requires root privileges");
		return -1;
	}

	return 0;
#endif /* USE_LIBCAP */
}
1157
1158static int do_probe(int argc, char **argv)
1159{
1160	enum probe_component target = COMPONENT_UNSPEC;
1161	const char *define_prefix = NULL;
1162	bool supported_types[128] = {};
1163	__u32 ifindex = 0;
1164	char *ifname;
1165
1166	set_max_rlimit();
1167
1168	while (argc) {
1169		if (is_prefix(*argv, "kernel")) {
1170			if (target != COMPONENT_UNSPEC) {
1171				p_err("component to probe already specified");
1172				return -1;
1173			}
1174			target = COMPONENT_KERNEL;
1175			NEXT_ARG();
1176		} else if (is_prefix(*argv, "dev")) {
1177			NEXT_ARG();
1178
1179			if (target != COMPONENT_UNSPEC || ifindex) {
1180				p_err("component to probe already specified");
1181				return -1;
1182			}
1183			if (!REQ_ARGS(1))
1184				return -1;
1185
1186			target = COMPONENT_DEVICE;
1187			ifname = GET_ARG();
1188			ifindex = if_nametoindex(ifname);
1189			if (!ifindex) {
1190				p_err("unrecognized netdevice '%s': %s", ifname,
1191				      strerror(errno));
1192				return -1;
1193			}
1194		} else if (is_prefix(*argv, "full")) {
1195			full_mode = true;
1196			NEXT_ARG();
1197		} else if (is_prefix(*argv, "macros") && !define_prefix) {
1198			define_prefix = "";
1199			NEXT_ARG();
1200		} else if (is_prefix(*argv, "prefix")) {
1201			if (!define_prefix) {
1202				p_err("'prefix' argument can only be use after 'macros'");
1203				return -1;
1204			}
1205			if (strcmp(define_prefix, "")) {
1206				p_err("'prefix' already defined");
1207				return -1;
1208			}
1209			NEXT_ARG();
1210
1211			if (!REQ_ARGS(1))
1212				return -1;
1213			define_prefix = GET_ARG();
1214		} else if (is_prefix(*argv, "unprivileged")) {
1215#ifdef USE_LIBCAP
1216			run_as_unprivileged = true;
1217			NEXT_ARG();
1218#else
1219			p_err("unprivileged run not supported, recompile bpftool with libcap");
1220			return -1;
1221#endif
1222		} else {
1223			p_err("expected no more arguments, 'kernel', 'dev', 'macros' or 'prefix', got: '%s'?",
1224			      *argv);
1225			return -1;
1226		}
1227	}
1228
1229	/* Full feature detection requires specific privileges.
1230	 * Let's approximate, and warn if user is not root.
1231	 */
1232	if (handle_perms())
1233		return -1;
1234
1235	if (json_output) {
1236		define_prefix = NULL;
1237		jsonw_start_object(json_wtr);
1238	}
1239
1240	section_system_config(target, define_prefix);
1241	if (!section_syscall_config(define_prefix))
1242		/* bpf() syscall unavailable, don't probe other BPF features */
1243		goto exit_close_json;
1244	section_program_types(supported_types, define_prefix, ifindex);
1245	section_map_types(define_prefix, ifindex);
1246	section_helpers(supported_types, define_prefix, ifindex);
1247	section_misc(define_prefix, ifindex);
1248
1249exit_close_json:
1250	if (json_output)
1251		/* End root object */
1252		jsonw_end_object(json_wtr);
1253
1254	return 0;
1255}
1256
1257static const char *get_helper_name(unsigned int id)
1258{
1259	if (id >= ARRAY_SIZE(helper_name))
1260		return NULL;
1261
1262	return helper_name[id];
1263}
1264
1265static int do_list_builtins(int argc, char **argv)
1266{
1267	const char *(*get_name)(unsigned int id);
1268	unsigned int id = 0;
1269
1270	if (argc < 1)
1271		usage();
1272
1273	if (is_prefix(*argv, "prog_types")) {
1274		get_name = (const char *(*)(unsigned int))libbpf_bpf_prog_type_str;
1275	} else if (is_prefix(*argv, "map_types")) {
1276		get_name = (const char *(*)(unsigned int))libbpf_bpf_map_type_str;
1277	} else if (is_prefix(*argv, "attach_types")) {
1278		get_name = (const char *(*)(unsigned int))libbpf_bpf_attach_type_str;
1279	} else if (is_prefix(*argv, "link_types")) {
1280		get_name = (const char *(*)(unsigned int))libbpf_bpf_link_type_str;
1281	} else if (is_prefix(*argv, "helpers")) {
1282		get_name = get_helper_name;
1283	} else {
1284		p_err("expected 'prog_types', 'map_types', 'attach_types', 'link_types' or 'helpers', got: %s", *argv);
1285		return -1;
1286	}
1287
1288	if (json_output)
1289		jsonw_start_array(json_wtr);	/* root array */
1290
1291	while (true) {
1292		const char *name;
1293
1294		name = get_name(id++);
1295		if (!name)
1296			break;
1297		if (json_output)
1298			jsonw_string(json_wtr, name);
1299		else
1300			printf("%s\n", name);
1301	}
1302
1303	if (json_output)
1304		jsonw_end_array(json_wtr);	/* root array */
1305
1306	return 0;
1307}
1308
1309static int do_help(int argc, char **argv)
1310{
1311	if (json_output) {
1312		jsonw_null(json_wtr);
1313		return 0;
1314	}
1315
1316	fprintf(stderr,
1317		"Usage: %1$s %2$s probe [COMPONENT] [full] [unprivileged] [macros [prefix PREFIX]]\n"
1318		"       %1$s %2$s list_builtins GROUP\n"
1319		"       %1$s %2$s help\n"
1320		"\n"
1321		"       COMPONENT := { kernel | dev NAME }\n"
1322		"       GROUP := { prog_types | map_types | attach_types | link_types | helpers }\n"
1323		"       " HELP_SPEC_OPTIONS " }\n"
1324		"",
1325		bin_name, argv[-2]);
1326
1327	return 0;
1328}
1329
/* Subcommand table handed to cmd_select() by do_feature(): each entry
 * pairs a subcommand keyword with its handler. The trailing zeroed entry
 * presumably marks the end of the table for cmd_select() - confirm
 * against its definition.
 */
static const struct cmd cmds[] = {
	{ "probe",		do_probe },
	{ "list_builtins",	do_list_builtins },
	{ "help",		do_help },
	{ 0 }
};
1336
1337int do_feature(int argc, char **argv)
1338{
1339	return cmd_select(cmds, argc, argv, do_help);
1340}
1341