tools/bpf/bpftool/common.c at master · tjh.dev/kernel

tjh.dev / kernel
Linux kernel mirror (for testing) git.kernel.org/pub/scm/linux/kernel/git/torvalds/linux.git
kernel os linux
kernel / tools / bpf / bpftool / common.c
at master 1303 lines 28 kB view raw
   1// SPDX-License-Identifier: (GPL-2.0-only OR BSD-2-Clause)
   2/* Copyright (C) 2017-2018 Netronome Systems, Inc. */
   3
   4#ifndef _GNU_SOURCE
   5#define _GNU_SOURCE
   6#endif
   7#include <assert.h>
   8#include <ctype.h>
   9#include <errno.h>
  10#include <fcntl.h>
  11#include <ftw.h>
  12#include <libgen.h>
  13#include <mntent.h>
  14#include <stdbool.h>
  15#include <stdio.h>
  16#include <stdlib.h>
  17#include <string.h>
  18#include <unistd.h>
  19#include <net/if.h>
  20#include <sys/mount.h>
  21#include <sys/resource.h>
  22#include <sys/stat.h>
  23#include <sys/vfs.h>
  24#include <sys/utsname.h>
  25
  26#include <linux/filter.h>
  27#include <linux/limits.h>
  28#include <linux/magic.h>
  29#include <linux/unistd.h>
  30
  31#include <bpf/bpf.h>
  32#include <bpf/hashmap.h>
  33#include <bpf/libbpf.h> /* libbpf_num_possible_cpus */
  34#include <bpf/btf.h>
  35#include <zlib.h>
  36
  37#include "main.h"
  38
  39#ifndef BPF_FS_MAGIC
  40#define BPF_FS_MAGIC		0xcafe4a11
  41#endif
  42
  43void p_err(const char *fmt, ...)
  44{
  45	va_list ap;
  46
  47	va_start(ap, fmt);
  48	if (json_output) {
  49		jsonw_start_object(json_wtr);
  50		jsonw_name(json_wtr, "error");
  51		jsonw_vprintf_enquote(json_wtr, fmt, ap);
  52		jsonw_end_object(json_wtr);
  53	} else {
  54		fprintf(stderr, "Error: ");
  55		vfprintf(stderr, fmt, ap);
  56		fprintf(stderr, "\n");
  57	}
  58	va_end(ap);
  59}
  60
  61void p_info(const char *fmt, ...)
  62{
  63	va_list ap;
  64
  65	if (json_output)
  66		return;
  67
  68	va_start(ap, fmt);
  69	vfprintf(stderr, fmt, ap);
  70	fprintf(stderr, "\n");
  71	va_end(ap);
  72}
  73
  74static bool is_bpffs(const char *path)
  75{
  76	struct statfs st_fs;
  77
  78	if (statfs(path, &st_fs) < 0)
  79		return false;
  80
  81	return (unsigned long)st_fs.f_type == BPF_FS_MAGIC;
  82}
  83
  84/* Probe whether kernel switched from memlock-based (RLIMIT_MEMLOCK) to
  85 * memcg-based memory accounting for BPF maps and programs. This was done in
  86 * commit 97306be45fbe ("Merge branch 'switch to memcg-based memory
  87 * accounting'"), in Linux 5.11.
  88 *
  89 * Libbpf also offers to probe for memcg-based accounting vs rlimit, but does
  90 * so by checking for the availability of a given BPF helper and this has
  91 * failed on some kernels with backports in the past, see commit 6b4384ff1088
  92 * ("Revert "bpftool: Use libbpf 1.0 API mode instead of RLIMIT_MEMLOCK"").
  93 * Instead, we can probe by lowering the process-based rlimit to 0, trying to
  94 * load a BPF object, and resetting the rlimit. If the load succeeds then
  95 * memcg-based accounting is supported.
  96 *
  97 * This would be too dangerous to do in the library, because multithreaded
  98 * applications might attempt to load items while the rlimit is at 0. Given
  99 * that bpftool is single-threaded, this is fine to do here.
 100 */
 101static bool known_to_need_rlimit(void)
 102{
 103	struct rlimit rlim_init, rlim_cur_zero = {};
 104	struct bpf_insn insns[] = {
 105		BPF_MOV64_IMM(BPF_REG_0, 0),
 106		BPF_EXIT_INSN(),
 107	};
 108	size_t insn_cnt = ARRAY_SIZE(insns);
 109	union bpf_attr attr;
 110	int prog_fd, err;
 111
 112	memset(&attr, 0, sizeof(attr));
 113	attr.prog_type = BPF_PROG_TYPE_SOCKET_FILTER;
 114	attr.insns = ptr_to_u64(insns);
 115	attr.insn_cnt = insn_cnt;
 116	attr.license = ptr_to_u64("GPL");
 117
 118	if (getrlimit(RLIMIT_MEMLOCK, &rlim_init))
 119		return false;
 120
 121	/* Drop the soft limit to zero. We maintain the hard limit to its
 122	 * current value, because lowering it would be a permanent operation
 123	 * for unprivileged users.
 124	 */
 125	rlim_cur_zero.rlim_max = rlim_init.rlim_max;
 126	if (setrlimit(RLIMIT_MEMLOCK, &rlim_cur_zero))
 127		return false;
 128
 129	/* Do not use bpf_prog_load() from libbpf here, because it calls
 130	 * bump_rlimit_memlock(), interfering with the current probe.
 131	 */
 132	prog_fd = syscall(__NR_bpf, BPF_PROG_LOAD, &attr, sizeof(attr));
 133	err = errno;
 134
 135	/* reset soft rlimit to its initial value */
 136	setrlimit(RLIMIT_MEMLOCK, &rlim_init);
 137
 138	if (prog_fd < 0)
 139		return err == EPERM;
 140
 141	close(prog_fd);
 142	return false;
 143}
 144
 145void set_max_rlimit(void)
 146{
 147	struct rlimit rinf = { RLIM_INFINITY, RLIM_INFINITY };
 148
 149	if (known_to_need_rlimit())
 150		setrlimit(RLIMIT_MEMLOCK, &rinf);
 151}
 152
 153static int
 154mnt_fs(const char *target, const char *type, char *buff, size_t bufflen)
 155{
 156	bool bind_done = false;
 157
 158	while (mount("", target, "none", MS_PRIVATE | MS_REC, NULL)) {
 159		if (errno != EINVAL || bind_done) {
 160			snprintf(buff, bufflen,
 161				 "mount --make-private %s failed: %s",
 162				 target, strerror(errno));
 163			return -1;
 164		}
 165
 166		if (mount(target, target, "none", MS_BIND, NULL)) {
 167			snprintf(buff, bufflen,
 168				 "mount --bind %s %s failed: %s",
 169				 target, target, strerror(errno));
 170			return -1;
 171		}
 172
 173		bind_done = true;
 174	}
 175
 176	if (mount(type, target, type, 0, "mode=0700")) {
 177		snprintf(buff, bufflen, "mount -t %s %s %s failed: %s",
 178			 type, type, target, strerror(errno));
 179		return -1;
 180	}
 181
 182	return 0;
 183}
 184
 185int mount_tracefs(const char *target)
 186{
 187	char err_str[ERR_MAX_LEN];
 188	int err;
 189
 190	err = mnt_fs(target, "tracefs", err_str, ERR_MAX_LEN);
 191	if (err) {
 192		err_str[ERR_MAX_LEN - 1] = '\0';
 193		p_err("can't mount tracefs: %s", err_str);
 194	}
 195
 196	return err;
 197}
 198
 199int open_obj_pinned(const char *path, bool quiet,
 200		    const struct bpf_obj_get_opts *opts)
 201{
 202	char *pname;
 203	int fd = -1;
 204
 205	pname = strdup(path);
 206	if (!pname) {
 207		if (!quiet)
 208			p_err("mem alloc failed");
 209		goto out_ret;
 210	}
 211
 212	fd = bpf_obj_get_opts(pname, opts);
 213	if (fd < 0) {
 214		if (!quiet)
 215			p_err("bpf obj get (%s): %s", pname,
 216			      errno == EACCES && !is_bpffs(dirname(pname)) ?
 217			    "directory not in bpf file system (bpffs)" :
 218			    strerror(errno));
 219		goto out_free;
 220	}
 221
 222out_free:
 223	free(pname);
 224out_ret:
 225	return fd;
 226}
 227
 228int open_obj_pinned_any(const char *path, enum bpf_obj_type exp_type,
 229			const struct bpf_obj_get_opts *opts)
 230{
 231	enum bpf_obj_type type;
 232	int fd;
 233
 234	fd = open_obj_pinned(path, false, opts);
 235	if (fd < 0)
 236		return -1;
 237
 238	type = get_fd_type(fd);
 239	if (type < 0) {
 240		close(fd);
 241		return type;
 242	}
 243	if (type != exp_type) {
 244		p_err("incorrect object type: %s", get_fd_type_name(type));
 245		close(fd);
 246		return -1;
 247	}
 248
 249	return fd;
 250}
 251
 252int create_and_mount_bpffs_dir(const char *dir_name)
 253{
 254	char err_str[ERR_MAX_LEN];
 255	bool dir_exists;
 256	int err = 0;
 257
 258	if (is_bpffs(dir_name))
 259		return err;
 260
 261	dir_exists = access(dir_name, F_OK) == 0;
 262
 263	if (!dir_exists) {
 264		char *temp_name;
 265		char *parent_name;
 266
 267		temp_name = strdup(dir_name);
 268		if (!temp_name) {
 269			p_err("mem alloc failed");
 270			return -1;
 271		}
 272
 273		parent_name = dirname(temp_name);
 274
 275		if (is_bpffs(parent_name)) {
 276			/* nothing to do if already mounted */
 277			free(temp_name);
 278			return err;
 279		}
 280
 281		if (access(parent_name, F_OK) == -1) {
 282			p_err("can't create dir '%s' to pin BPF object: parent dir '%s' doesn't exist",
 283			      dir_name, parent_name);
 284			free(temp_name);
 285			return -1;
 286		}
 287
 288		free(temp_name);
 289	}
 290
 291	if (block_mount) {
 292		p_err("no BPF file system found, not mounting it due to --nomount option");
 293		return -1;
 294	}
 295
 296	if (!dir_exists) {
 297		err = mkdir(dir_name, S_IRWXU);
 298		if (err) {
 299			p_err("failed to create dir '%s': %s", dir_name, strerror(errno));
 300			return err;
 301		}
 302	}
 303
 304	err = mnt_fs(dir_name, "bpf", err_str, ERR_MAX_LEN);
 305	if (err) {
 306		err_str[ERR_MAX_LEN - 1] = '\0';
 307		p_err("can't mount BPF file system on given dir '%s': %s",
 308		      dir_name, err_str);
 309
 310		if (!dir_exists)
 311			rmdir(dir_name);
 312	}
 313
 314	return err;
 315}
 316
 317int mount_bpffs_for_file(const char *file_name)
 318{
 319	char err_str[ERR_MAX_LEN];
 320	char *temp_name;
 321	char *dir;
 322	int err = 0;
 323
 324	if (access(file_name, F_OK) != -1) {
 325		p_err("can't pin BPF object: path '%s' already exists", file_name);
 326		return -1;
 327	}
 328
 329	temp_name = strdup(file_name);
 330	if (!temp_name) {
 331		p_err("mem alloc failed");
 332		return -1;
 333	}
 334
 335	dir = dirname(temp_name);
 336
 337	if (is_bpffs(dir))
 338		/* nothing to do if already mounted */
 339		goto out_free;
 340
 341	if (access(dir, F_OK) == -1) {
 342		p_err("can't pin BPF object: dir '%s' doesn't exist", dir);
 343		err = -1;
 344		goto out_free;
 345	}
 346
 347	if (block_mount) {
 348		p_err("no BPF file system found, not mounting it due to --nomount option");
 349		err = -1;
 350		goto out_free;
 351	}
 352
 353	err = mnt_fs(dir, "bpf", err_str, ERR_MAX_LEN);
 354	if (err) {
 355		err_str[ERR_MAX_LEN - 1] = '\0';
 356		p_err("can't mount BPF file system to pin the object '%s': %s",
 357		      file_name, err_str);
 358	}
 359
 360out_free:
 361	free(temp_name);
 362	return err;
 363}
 364
 365int do_pin_fd(int fd, const char *name)
 366{
 367	int err;
 368
 369	err = mount_bpffs_for_file(name);
 370	if (err)
 371		return err;
 372
 373	err = bpf_obj_pin(fd, name);
 374	if (err)
 375		p_err("can't pin the object (%s): %s", name, strerror(errno));
 376
 377	return err;
 378}
 379
 380int do_pin_any(int argc, char **argv, int (*get_fd)(int *, char ***))
 381{
 382	int err;
 383	int fd;
 384
 385	if (!REQ_ARGS(3))
 386		return -EINVAL;
 387
 388	fd = get_fd(&argc, &argv);
 389	if (fd < 0)
 390		return fd;
 391
 392	err = do_pin_fd(fd, *argv);
 393
 394	close(fd);
 395	return err;
 396}
 397
 398const char *get_fd_type_name(enum bpf_obj_type type)
 399{
 400	static const char * const names[] = {
 401		[BPF_OBJ_UNKNOWN]	= "unknown",
 402		[BPF_OBJ_PROG]		= "prog",
 403		[BPF_OBJ_MAP]		= "map",
 404		[BPF_OBJ_LINK]		= "link",
 405	};
 406
 407	if (type < 0 || type >= ARRAY_SIZE(names) || !names[type])
 408		return names[BPF_OBJ_UNKNOWN];
 409
 410	return names[type];
 411}
 412
 413void get_prog_full_name(const struct bpf_prog_info *prog_info, int prog_fd,
 414			char *name_buff, size_t buff_len)
 415{
 416	const char *prog_name = prog_info->name;
 417	const struct btf_type *func_type;
 418	struct bpf_func_info finfo = {};
 419	struct bpf_prog_info info = {};
 420	__u32 info_len = sizeof(info);
 421	struct btf *prog_btf = NULL;
 422
 423	if (buff_len <= BPF_OBJ_NAME_LEN ||
 424	    strlen(prog_info->name) < BPF_OBJ_NAME_LEN - 1)
 425		goto copy_name;
 426
 427	if (!prog_info->btf_id || prog_info->nr_func_info == 0)
 428		goto copy_name;
 429
 430	info.nr_func_info = 1;
 431	info.func_info_rec_size = prog_info->func_info_rec_size;
 432	if (info.func_info_rec_size > sizeof(finfo))
 433		info.func_info_rec_size = sizeof(finfo);
 434	info.func_info = ptr_to_u64(&finfo);
 435
 436	if (bpf_prog_get_info_by_fd(prog_fd, &info, &info_len))
 437		goto copy_name;
 438
 439	prog_btf = btf__load_from_kernel_by_id(info.btf_id);
 440	if (!prog_btf)
 441		goto copy_name;
 442
 443	func_type = btf__type_by_id(prog_btf, finfo.type_id);
 444	if (!func_type || !btf_is_func(func_type))
 445		goto copy_name;
 446
 447	prog_name = btf__name_by_offset(prog_btf, func_type->name_off);
 448
 449copy_name:
 450	snprintf(name_buff, buff_len, "%s", prog_name);
 451
 452	if (prog_btf)
 453		btf__free(prog_btf);
 454}
 455
 456int get_fd_type(int fd)
 457{
 458	char path[PATH_MAX];
 459	char buf[512];
 460	ssize_t n;
 461
 462	snprintf(path, sizeof(path), "/proc/self/fd/%d", fd);
 463
 464	n = readlink(path, buf, sizeof(buf));
 465	if (n < 0) {
 466		p_err("can't read link type: %s", strerror(errno));
 467		return -1;
 468	}
 469	if (n == sizeof(buf)) {
 470		p_err("can't read link type: path too long!");
 471		return -1;
 472	}
 473	buf[n] = '\0';
 474
 475	if (strstr(buf, "bpf-map"))
 476		return BPF_OBJ_MAP;
 477	else if (strstr(buf, "bpf-prog"))
 478		return BPF_OBJ_PROG;
 479	else if (strstr(buf, "bpf-link"))
 480		return BPF_OBJ_LINK;
 481
 482	return BPF_OBJ_UNKNOWN;
 483}
 484
 485char *get_fdinfo(int fd, const char *key)
 486{
 487	char path[PATH_MAX];
 488	char *line = NULL;
 489	size_t line_n = 0;
 490	ssize_t n;
 491	FILE *fdi;
 492
 493	snprintf(path, sizeof(path), "/proc/self/fdinfo/%d", fd);
 494
 495	fdi = fopen(path, "r");
 496	if (!fdi)
 497		return NULL;
 498
 499	while ((n = getline(&line, &line_n, fdi)) > 0) {
 500		char *value;
 501		int len;
 502
 503		if (!strstr(line, key))
 504			continue;
 505
 506		fclose(fdi);
 507
 508		value = strchr(line, '\t');
 509		if (!value || !value[1]) {
 510			free(line);
 511			return NULL;
 512		}
 513		value++;
 514
 515		len = strlen(value);
 516		memmove(line, value, len);
 517		line[len - 1] = '\0';
 518
 519		return line;
 520	}
 521
 522	free(line);
 523	fclose(fdi);
 524	return NULL;
 525}
 526
 527void print_data_json(uint8_t *data, size_t len)
 528{
 529	unsigned int i;
 530
 531	jsonw_start_array(json_wtr);
 532	for (i = 0; i < len; i++)
 533		jsonw_printf(json_wtr, "%d", data[i]);
 534	jsonw_end_array(json_wtr);
 535}
 536
 537void print_hex_data_json(uint8_t *data, size_t len)
 538{
 539	unsigned int i;
 540
 541	jsonw_start_array(json_wtr);
 542	for (i = 0; i < len; i++)
 543		jsonw_printf(json_wtr, "\"0x%02hhx\"", data[i]);
 544	jsonw_end_array(json_wtr);
 545}
 546
 547/* extra params for nftw cb */
 548static struct hashmap *build_fn_table;
 549static enum bpf_obj_type build_fn_type;
 550
 551static int do_build_table_cb(const char *fpath, const struct stat *sb,
 552			     int typeflag, struct FTW *ftwbuf)
 553{
 554	struct bpf_prog_info pinned_info;
 555	__u32 len = sizeof(pinned_info);
 556	enum bpf_obj_type objtype;
 557	int fd, err = 0;
 558	char *path;
 559
 560	if (typeflag != FTW_F)
 561		goto out_ret;
 562
 563	fd = open_obj_pinned(fpath, true, NULL);
 564	if (fd < 0)
 565		goto out_ret;
 566
 567	objtype = get_fd_type(fd);
 568	if (objtype != build_fn_type)
 569		goto out_close;
 570
 571	memset(&pinned_info, 0, sizeof(pinned_info));
 572	if (bpf_prog_get_info_by_fd(fd, &pinned_info, &len))
 573		goto out_close;
 574
 575	path = strdup(fpath);
 576	if (!path) {
 577		err = -1;
 578		goto out_close;
 579	}
 580
 581	err = hashmap__append(build_fn_table, pinned_info.id, path);
 582	if (err) {
 583		p_err("failed to append entry to hashmap for ID %u, path '%s': %s",
 584		      pinned_info.id, path, strerror(errno));
 585		free(path);
 586		goto out_close;
 587	}
 588
 589out_close:
 590	close(fd);
 591out_ret:
 592	return err;
 593}
 594
 595int build_pinned_obj_table(struct hashmap *tab,
 596			   enum bpf_obj_type type)
 597{
 598	struct mntent *mntent = NULL;
 599	FILE *mntfile = NULL;
 600	int flags = FTW_PHYS;
 601	int nopenfd = 16;
 602	int err = 0;
 603
 604	mntfile = setmntent("/proc/mounts", "r");
 605	if (!mntfile)
 606		return -1;
 607
 608	build_fn_table = tab;
 609	build_fn_type = type;
 610
 611	while ((mntent = getmntent(mntfile))) {
 612		char *path = mntent->mnt_dir;
 613
 614		if (strncmp(mntent->mnt_type, "bpf", 3) != 0)
 615			continue;
 616		err = nftw(path, do_build_table_cb, nopenfd, flags);
 617		if (err)
 618			break;
 619	}
 620	fclose(mntfile);
 621	return err;
 622}
 623
 624void delete_pinned_obj_table(struct hashmap *map)
 625{
 626	struct hashmap_entry *entry;
 627	size_t bkt;
 628
 629	if (!map)
 630		return;
 631
 632	hashmap__for_each_entry(map, entry, bkt)
 633		free(entry->pvalue);
 634
 635	hashmap__free(map);
 636}
 637
 638unsigned int get_page_size(void)
 639{
 640	static int result;
 641
 642	if (!result)
 643		result = getpagesize();
 644	return result;
 645}
 646
 647unsigned int get_possible_cpus(void)
 648{
 649	int cpus = libbpf_num_possible_cpus();
 650
 651	if (cpus < 0) {
 652		p_err("Can't get # of possible cpus: %s", strerror(-cpus));
 653		exit(-1);
 654	}
 655	return cpus;
 656}
 657
 658static char *
 659ifindex_to_name_ns(__u32 ifindex, __u32 ns_dev, __u32 ns_ino, char *buf)
 660{
 661	struct stat st;
 662	int err;
 663
 664	err = stat("/proc/self/ns/net", &st);
 665	if (err) {
 666		p_err("Can't stat /proc/self: %s", strerror(errno));
 667		return NULL;
 668	}
 669
 670	if (st.st_dev != ns_dev || st.st_ino != ns_ino)
 671		return NULL;
 672
 673	return if_indextoname(ifindex, buf);
 674}
 675
 676static int read_sysfs_hex_int(char *path)
 677{
 678	char vendor_id_buf[8];
 679	int len;
 680	int fd;
 681
 682	fd = open(path, O_RDONLY);
 683	if (fd < 0) {
 684		p_err("Can't open %s: %s", path, strerror(errno));
 685		return -1;
 686	}
 687
 688	len = read(fd, vendor_id_buf, sizeof(vendor_id_buf));
 689	close(fd);
 690	if (len < 0) {
 691		p_err("Can't read %s: %s", path, strerror(errno));
 692		return -1;
 693	}
 694	if (len >= (int)sizeof(vendor_id_buf)) {
 695		p_err("Value in %s too long", path);
 696		return -1;
 697	}
 698
 699	vendor_id_buf[len] = 0;
 700
 701	return strtol(vendor_id_buf, NULL, 0);
 702}
 703
 704static int read_sysfs_netdev_hex_int(char *devname, const char *entry_name)
 705{
 706	char full_path[64];
 707
 708	snprintf(full_path, sizeof(full_path), "/sys/class/net/%s/device/%s",
 709		 devname, entry_name);
 710
 711	return read_sysfs_hex_int(full_path);
 712}
 713
 714const char *
 715ifindex_to_arch(__u32 ifindex, __u64 ns_dev, __u64 ns_ino, const char **opt)
 716{
 717	__maybe_unused int device_id;
 718	char devname[IF_NAMESIZE];
 719	int vendor_id;
 720
 721	if (!ifindex_to_name_ns(ifindex, ns_dev, ns_ino, devname)) {
 722		p_err("Can't get net device name for ifindex %u: %s", ifindex,
 723		      strerror(errno));
 724		return NULL;
 725	}
 726
 727	vendor_id = read_sysfs_netdev_hex_int(devname, "vendor");
 728	if (vendor_id < 0) {
 729		p_err("Can't get device vendor id for %s", devname);
 730		return NULL;
 731	}
 732
 733	switch (vendor_id) {
 734#ifdef HAVE_LIBBFD_SUPPORT
 735	case 0x19ee:
 736		device_id = read_sysfs_netdev_hex_int(devname, "device");
 737		if (device_id != 0x4000 &&
 738		    device_id != 0x6000 &&
 739		    device_id != 0x6003)
 740			p_info("Unknown NFP device ID, assuming it is NFP-6xxx arch");
 741		*opt = "ctx4";
 742		return "NFP-6xxx";
 743#endif /* HAVE_LIBBFD_SUPPORT */
 744	/* No NFP support in LLVM, we have no valid triple to return. */
 745	default:
 746		p_err("Can't get arch name for device vendor id 0x%04x",
 747		      (unsigned int)vendor_id);
 748		return NULL;
 749	}
 750}
 751
 752void print_dev_plain(__u32 ifindex, __u64 ns_dev, __u64 ns_inode)
 753{
 754	char name[IF_NAMESIZE];
 755
 756	if (!ifindex)
 757		return;
 758
 759	printf("  offloaded_to ");
 760	if (ifindex_to_name_ns(ifindex, ns_dev, ns_inode, name))
 761		printf("%s", name);
 762	else
 763		printf("ifindex %u ns_dev %llu ns_ino %llu",
 764		       ifindex, ns_dev, ns_inode);
 765}
 766
 767void print_dev_json(__u32 ifindex, __u64 ns_dev, __u64 ns_inode)
 768{
 769	char name[IF_NAMESIZE];
 770
 771	if (!ifindex)
 772		return;
 773
 774	jsonw_name(json_wtr, "dev");
 775	jsonw_start_object(json_wtr);
 776	jsonw_uint_field(json_wtr, "ifindex", ifindex);
 777	jsonw_uint_field(json_wtr, "ns_dev", ns_dev);
 778	jsonw_uint_field(json_wtr, "ns_inode", ns_inode);
 779	if (ifindex_to_name_ns(ifindex, ns_dev, ns_inode, name))
 780		jsonw_string_field(json_wtr, "ifname", name);
 781	jsonw_end_object(json_wtr);
 782}
 783
 784int parse_u32_arg(int *argc, char ***argv, __u32 *val, const char *what)
 785{
 786	char *endptr;
 787
 788	NEXT_ARGP();
 789
 790	if (*val) {
 791		p_err("%s already specified", what);
 792		return -1;
 793	}
 794
 795	*val = strtoul(**argv, &endptr, 0);
 796	if (*endptr) {
 797		p_err("can't parse %s as %s", **argv, what);
 798		return -1;
 799	}
 800	NEXT_ARGP();
 801
 802	return 0;
 803}
 804
 805int __printf(2, 0)
 806print_all_levels(__maybe_unused enum libbpf_print_level level,
 807		 const char *format, va_list args)
 808{
 809	return vfprintf(stderr, format, args);
 810}
 811
 812static int prog_fd_by_nametag(void *nametag, int **fds, bool tag)
 813{
 814	char prog_name[MAX_PROG_FULL_NAME];
 815	unsigned int id = 0;
 816	int fd, nb_fds = 0;
 817	void *tmp;
 818	int err;
 819
 820	while (true) {
 821		struct bpf_prog_info info = {};
 822		__u32 len = sizeof(info);
 823
 824		err = bpf_prog_get_next_id(id, &id);
 825		if (err) {
 826			if (errno != ENOENT) {
 827				p_err("%s", strerror(errno));
 828				goto err_close_fds;
 829			}
 830			return nb_fds;
 831		}
 832
 833		fd = bpf_prog_get_fd_by_id(id);
 834		if (fd < 0) {
 835			p_err("can't get prog by id (%u): %s",
 836			      id, strerror(errno));
 837			goto err_close_fds;
 838		}
 839
 840		err = bpf_prog_get_info_by_fd(fd, &info, &len);
 841		if (err) {
 842			p_err("can't get prog info (%u): %s",
 843			      id, strerror(errno));
 844			goto err_close_fd;
 845		}
 846
 847		if (tag && memcmp(nametag, info.tag, BPF_TAG_SIZE)) {
 848			close(fd);
 849			continue;
 850		}
 851
 852		if (!tag) {
 853			get_prog_full_name(&info, fd, prog_name,
 854					   sizeof(prog_name));
 855			if (strncmp(nametag, prog_name, sizeof(prog_name))) {
 856				close(fd);
 857				continue;
 858			}
 859		}
 860
 861		if (nb_fds > 0) {
 862			tmp = realloc(*fds, (nb_fds + 1) * sizeof(int));
 863			if (!tmp) {
 864				p_err("failed to realloc");
 865				goto err_close_fd;
 866			}
 867			*fds = tmp;
 868		}
 869		(*fds)[nb_fds++] = fd;
 870	}
 871
 872err_close_fd:
 873	close(fd);
 874err_close_fds:
 875	while (--nb_fds >= 0)
 876		close((*fds)[nb_fds]);
 877	return -1;
 878}
 879
 880int prog_parse_fds(int *argc, char ***argv, int **fds)
 881{
 882	if (is_prefix(**argv, "id")) {
 883		unsigned int id;
 884		char *endptr;
 885
 886		NEXT_ARGP();
 887
 888		id = strtoul(**argv, &endptr, 0);
 889		if (*endptr) {
 890			p_err("can't parse %s as ID", **argv);
 891			return -1;
 892		}
 893		NEXT_ARGP();
 894
 895		(*fds)[0] = bpf_prog_get_fd_by_id(id);
 896		if ((*fds)[0] < 0) {
 897			p_err("get by id (%u): %s", id, strerror(errno));
 898			return -1;
 899		}
 900		return 1;
 901	} else if (is_prefix(**argv, "tag")) {
 902		unsigned char tag[BPF_TAG_SIZE];
 903
 904		NEXT_ARGP();
 905
 906		if (sscanf(**argv, BPF_TAG_FMT, tag, tag + 1, tag + 2,
 907			   tag + 3, tag + 4, tag + 5, tag + 6, tag + 7)
 908		    != BPF_TAG_SIZE) {
 909			p_err("can't parse tag");
 910			return -1;
 911		}
 912		NEXT_ARGP();
 913
 914		return prog_fd_by_nametag(tag, fds, true);
 915	} else if (is_prefix(**argv, "name")) {
 916		char *name;
 917
 918		NEXT_ARGP();
 919
 920		name = **argv;
 921		if (strlen(name) > MAX_PROG_FULL_NAME - 1) {
 922			p_err("can't parse name");
 923			return -1;
 924		}
 925		NEXT_ARGP();
 926
 927		return prog_fd_by_nametag(name, fds, false);
 928	} else if (is_prefix(**argv, "pinned")) {
 929		char *path;
 930
 931		NEXT_ARGP();
 932
 933		path = **argv;
 934		NEXT_ARGP();
 935
 936		(*fds)[0] = open_obj_pinned_any(path, BPF_OBJ_PROG, NULL);
 937		if ((*fds)[0] < 0)
 938			return -1;
 939		return 1;
 940	}
 941
 942	p_err("expected 'id', 'tag', 'name' or 'pinned', got: '%s'?", **argv);
 943	return -1;
 944}
 945
 946int prog_parse_fd(int *argc, char ***argv)
 947{
 948	int *fds = NULL;
 949	int nb_fds, fd;
 950
 951	fds = malloc(sizeof(int));
 952	if (!fds) {
 953		p_err("mem alloc failed");
 954		return -1;
 955	}
 956	nb_fds = prog_parse_fds(argc, argv, &fds);
 957	if (nb_fds != 1) {
 958		if (nb_fds > 1) {
 959			p_err("several programs match this handle");
 960			while (nb_fds--)
 961				close(fds[nb_fds]);
 962		}
 963		fd = -1;
 964		goto exit_free;
 965	}
 966
 967	fd = fds[0];
 968exit_free:
 969	free(fds);
 970	return fd;
 971}
 972
 973static int map_fd_by_name(char *name, int **fds,
 974			  const struct bpf_get_fd_by_id_opts *opts)
 975{
 976	unsigned int id = 0;
 977	int fd, nb_fds = 0;
 978	void *tmp;
 979	int err;
 980
 981	while (true) {
 982		LIBBPF_OPTS(bpf_get_fd_by_id_opts, opts_ro);
 983		struct bpf_map_info info = {};
 984		__u32 len = sizeof(info);
 985
 986		err = bpf_map_get_next_id(id, &id);
 987		if (err) {
 988			if (errno != ENOENT) {
 989				p_err("%s", strerror(errno));
 990				goto err_close_fds;
 991			}
 992			return nb_fds;
 993		}
 994
 995		/* Request a read-only fd to query the map info */
 996		opts_ro.open_flags = BPF_F_RDONLY;
 997		fd = bpf_map_get_fd_by_id_opts(id, &opts_ro);
 998		if (fd < 0) {
 999			p_err("can't get map by id (%u): %s",
1000			      id, strerror(errno));
1001			goto err_close_fds;
1002		}
1003
1004		err = bpf_map_get_info_by_fd(fd, &info, &len);
1005		if (err) {
1006			p_err("can't get map info (%u): %s",
1007			      id, strerror(errno));
1008			goto err_close_fd;
1009		}
1010
1011		if (strncmp(name, info.name, BPF_OBJ_NAME_LEN)) {
1012			close(fd);
1013			continue;
1014		}
1015
1016		/* Get an fd with the requested options, if they differ
1017		 * from the read-only options used to get the fd above.
1018		 */
1019		if (memcmp(opts, &opts_ro, sizeof(opts_ro))) {
1020			close(fd);
1021			fd = bpf_map_get_fd_by_id_opts(id, opts);
1022			if (fd < 0) {
1023				p_err("can't get map by id (%u): %s", id,
1024					strerror(errno));
1025				goto err_close_fds;
1026			}
1027		}
1028
1029		if (nb_fds > 0) {
1030			tmp = realloc(*fds, (nb_fds + 1) * sizeof(int));
1031			if (!tmp) {
1032				p_err("failed to realloc");
1033				goto err_close_fd;
1034			}
1035			*fds = tmp;
1036		}
1037		(*fds)[nb_fds++] = fd;
1038	}
1039
1040err_close_fd:
1041	close(fd);
1042err_close_fds:
1043	while (--nb_fds >= 0)
1044		close((*fds)[nb_fds]);
1045	return -1;
1046}
1047
1048int map_parse_fds(int *argc, char ***argv, int **fds, __u32 open_flags)
1049{
1050	LIBBPF_OPTS(bpf_get_fd_by_id_opts, opts);
1051
1052	assert((open_flags & ~BPF_F_RDONLY) == 0);
1053	opts.open_flags = open_flags;
1054
1055	if (is_prefix(**argv, "id")) {
1056		unsigned int id;
1057		char *endptr;
1058
1059		NEXT_ARGP();
1060
1061		id = strtoul(**argv, &endptr, 0);
1062		if (*endptr) {
1063			p_err("can't parse %s as ID", **argv);
1064			return -1;
1065		}
1066		NEXT_ARGP();
1067
1068		(*fds)[0] = bpf_map_get_fd_by_id_opts(id, &opts);
1069		if ((*fds)[0] < 0) {
1070			p_err("get map by id (%u): %s", id, strerror(errno));
1071			return -1;
1072		}
1073		return 1;
1074	} else if (is_prefix(**argv, "name")) {
1075		char *name;
1076
1077		NEXT_ARGP();
1078
1079		name = **argv;
1080		if (strlen(name) > BPF_OBJ_NAME_LEN - 1) {
1081			p_err("can't parse name");
1082			return -1;
1083		}
1084		NEXT_ARGP();
1085
1086		return map_fd_by_name(name, fds, &opts);
1087	} else if (is_prefix(**argv, "pinned")) {
1088		char *path;
1089		LIBBPF_OPTS(bpf_obj_get_opts, get_opts);
1090		get_opts.file_flags = open_flags;
1091
1092		NEXT_ARGP();
1093
1094		path = **argv;
1095		NEXT_ARGP();
1096
1097		(*fds)[0] = open_obj_pinned_any(path, BPF_OBJ_MAP, &get_opts);
1098		if ((*fds)[0] < 0)
1099			return -1;
1100		return 1;
1101	}
1102
1103	p_err("expected 'id', 'name' or 'pinned', got: '%s'?", **argv);
1104	return -1;
1105}
1106
1107int map_parse_fd(int *argc, char ***argv, __u32 open_flags)
1108{
1109	int *fds = NULL;
1110	int nb_fds, fd;
1111
1112	fds = malloc(sizeof(int));
1113	if (!fds) {
1114		p_err("mem alloc failed");
1115		return -1;
1116	}
1117	nb_fds = map_parse_fds(argc, argv, &fds, open_flags);
1118	if (nb_fds != 1) {
1119		if (nb_fds > 1) {
1120			p_err("several maps match this handle");
1121			while (nb_fds--)
1122				close(fds[nb_fds]);
1123		}
1124		fd = -1;
1125		goto exit_free;
1126	}
1127
1128	fd = fds[0];
1129exit_free:
1130	free(fds);
1131	return fd;
1132}
1133
1134int map_parse_fd_and_info(int *argc, char ***argv, struct bpf_map_info *info,
1135			  __u32 *info_len, __u32 open_flags)
1136{
1137	int err;
1138	int fd;
1139
1140	fd = map_parse_fd(argc, argv, open_flags);
1141	if (fd < 0)
1142		return -1;
1143
1144	err = bpf_map_get_info_by_fd(fd, info, info_len);
1145	if (err) {
1146		p_err("can't get map info: %s", strerror(errno));
1147		close(fd);
1148		return err;
1149	}
1150
1151	return fd;
1152}
1153
1154size_t hash_fn_for_key_as_id(long key, void *ctx)
1155{
1156	return key;
1157}
1158
1159bool equal_fn_for_key_as_id(long k1, long k2, void *ctx)
1160{
1161	return k1 == k2;
1162}
1163
1164const char *bpf_attach_type_input_str(enum bpf_attach_type t)
1165{
1166	switch (t) {
1167	case BPF_CGROUP_INET_INGRESS:		return "ingress";
1168	case BPF_CGROUP_INET_EGRESS:		return "egress";
1169	case BPF_CGROUP_INET_SOCK_CREATE:	return "sock_create";
1170	case BPF_CGROUP_INET_SOCK_RELEASE:	return "sock_release";
1171	case BPF_CGROUP_SOCK_OPS:		return "sock_ops";
1172	case BPF_CGROUP_DEVICE:			return "device";
1173	case BPF_CGROUP_INET4_BIND:		return "bind4";
1174	case BPF_CGROUP_INET6_BIND:		return "bind6";
1175	case BPF_CGROUP_INET4_CONNECT:		return "connect4";
1176	case BPF_CGROUP_INET6_CONNECT:		return "connect6";
1177	case BPF_CGROUP_INET4_POST_BIND:	return "post_bind4";
1178	case BPF_CGROUP_INET6_POST_BIND:	return "post_bind6";
1179	case BPF_CGROUP_INET4_GETPEERNAME:	return "getpeername4";
1180	case BPF_CGROUP_INET6_GETPEERNAME:	return "getpeername6";
1181	case BPF_CGROUP_INET4_GETSOCKNAME:	return "getsockname4";
1182	case BPF_CGROUP_INET6_GETSOCKNAME:	return "getsockname6";
1183	case BPF_CGROUP_UDP4_SENDMSG:		return "sendmsg4";
1184	case BPF_CGROUP_UDP6_SENDMSG:		return "sendmsg6";
1185	case BPF_CGROUP_SYSCTL:			return "sysctl";
1186	case BPF_CGROUP_UDP4_RECVMSG:		return "recvmsg4";
1187	case BPF_CGROUP_UDP6_RECVMSG:		return "recvmsg6";
1188	case BPF_CGROUP_GETSOCKOPT:		return "getsockopt";
1189	case BPF_CGROUP_SETSOCKOPT:		return "setsockopt";
1190	case BPF_TRACE_RAW_TP:			return "raw_tp";
1191	case BPF_TRACE_FENTRY:			return "fentry";
1192	case BPF_TRACE_FEXIT:			return "fexit";
1193	case BPF_MODIFY_RETURN:			return "mod_ret";
1194	case BPF_SK_REUSEPORT_SELECT:		return "sk_skb_reuseport_select";
1195	case BPF_SK_REUSEPORT_SELECT_OR_MIGRATE:	return "sk_skb_reuseport_select_or_migrate";
1196	default:	return libbpf_bpf_attach_type_str(t);
1197	}
1198}
1199
1200int pathname_concat(char *buf, int buf_sz, const char *path,
1201		    const char *name)
1202{
1203	int len;
1204
1205	len = snprintf(buf, buf_sz, "%s/%s", path, name);
1206	if (len < 0)
1207		return -EINVAL;
1208	if (len >= buf_sz)
1209		return -ENAMETOOLONG;
1210
1211	return 0;
1212}
1213
1214static bool read_next_kernel_config_option(gzFile file, char *buf, size_t n,
1215					   char **value)
1216{
1217	char *sep;
1218
1219	while (gzgets(file, buf, n)) {
1220		if (strncmp(buf, "CONFIG_", 7))
1221			continue;
1222
1223		sep = strchr(buf, '=');
1224		if (!sep)
1225			continue;
1226
1227		/* Trim ending '\n' */
1228		buf[strlen(buf) - 1] = '\0';
1229
1230		/* Split on '=' and ensure that a value is present. */
1231		*sep = '\0';
1232		if (!sep[1])
1233			continue;
1234
1235		*value = sep + 1;
1236		return true;
1237	}
1238
1239	return false;
1240}
1241
1242int read_kernel_config(const struct kernel_config_option *requested_options,
1243		       size_t num_options, char **out_values,
1244		       const char *define_prefix)
1245{
1246	struct utsname utsn;
1247	char path[PATH_MAX];
1248	gzFile file = NULL;
1249	char buf[4096];
1250	char *value;
1251	size_t i;
1252	int ret = 0;
1253
1254	if (!requested_options || !out_values || num_options == 0)
1255		return -1;
1256
1257	if (!uname(&utsn)) {
1258		snprintf(path, sizeof(path), "/boot/config-%s", utsn.release);
1259
1260		/* gzopen also accepts uncompressed files. */
1261		file = gzopen(path, "r");
1262	}
1263
1264	if (!file) {
1265		/* Some distributions build with CONFIG_IKCONFIG=y and put the
1266		 * config file at /proc/config.gz.
1267		 */
1268		file = gzopen("/proc/config.gz", "r");
1269	}
1270
1271	if (!file) {
1272		p_info("skipping kernel config, can't open file: %s",
1273			strerror(errno));
1274		return -1;
1275	}
1276
1277	if (!gzgets(file, buf, sizeof(buf)) || !gzgets(file, buf, sizeof(buf))) {
1278		p_info("skipping kernel config, can't read from file: %s",
1279			strerror(errno));
1280		ret = -1;
1281		goto end_parse;
1282	}
1283
1284	if (strcmp(buf, "# Automatically generated file; DO NOT EDIT.\n")) {
1285		p_info("skipping kernel config, can't find correct file");
1286		ret = -1;
1287		goto end_parse;
1288	}
1289
1290	while (read_next_kernel_config_option(file, buf, sizeof(buf), &value)) {
1291		for (i = 0; i < num_options; i++) {
1292			if ((define_prefix && !requested_options[i].macro_dump) ||
1293			     out_values[i] || strcmp(buf, requested_options[i].name))
1294				continue;
1295
1296			out_values[i] = strdup(value);
1297		}
1298	}
1299
1300end_parse:
1301	gzclose(file);
1302	return ret;
1303}