mirror of
				https://github.com/torvalds/linux.git
				synced 2025-11-04 10:40:15 +02:00 
			
		
		
		
	Macro PAGE_OFFSET(0xffff880000000000) in sampleip_user.c is inaccurate,
for example, in aarch64 architecture, this value depends on the
CONFIG_ARM64_VA_BITS compilation configuration, this value defaults to 48,
the corresponding PAGE_OFFSET is 0xffff800000000000, if we use the value
defined in sampleip_user.c, then all KSYMs obtained by sampleip are (user)
Symbol error due to PAGE_OFFSET error:
    $ sudo ./sampleip 1
    Sampling at 99 Hertz for 1 seconds. Ctrl-C also ends.
    ADDR                KSYM                             COUNT
    0xffff80000810ceb8  (user)                           1
    0xffffb28ec880      (user)                           1
    0xffff8000080c82b8  (user)                           1
    0xffffb23fed24      (user)                           1
    0xffffb28944fc      (user)                           1
    0xffff8000084628bc  (user)                           1
    0xffffb2a935c0      (user)                           1
    0xffff80000844677c  (user)                           1
    0xffff80000857a3a4  (user)                           1
    ...
A few examples of addresses in the CONFIG_ARM64_VA_BITS=48 environment in
the aarch64 environment:
    $ sudo head /proc/kallsyms
    ffff8000080a0000 T _text
    ffff8000080b0000 t gic_handle_irq
    ffff8000080b0000 T _stext
    ffff8000080b0000 T __irqentry_text_start
    ffff8000080b00b0 t gic_handle_irq
    ffff8000080b0230 t gic_handle_irq
    ffff8000080b03b4 T __irqentry_text_end
    ffff8000080b03b8 T __softirqentry_text_start
    ffff8000080b03c0 T __do_softirq
    ffff8000080b0718 T __entry_text_start
We just need to replace the PAGE_OFFSET with the address _text in
/proc/kallsyms to solve this problem:
    $ sudo ./sampleip 1
    Sampling at 99 Hertz for 1 seconds. Ctrl-C also ends.
    ADDR                KSYM                             COUNT
    0xffffb2892ab0      (user)                           1
    0xffffb2b1edfc      (user)                           1
    0xffff800008462834  __arm64_sys_ppoll                1
    0xffff8000084b87f4  eventfd_read                     1
    0xffffb28e6788      (user)                           1
    0xffff8000081e96d8  rcu_all_qs                       1
    0xffffb2ada878      (user)                           1
    ...
Signed-off-by: Rong Tao <rongtao@cestc.cn>
Link: https://lore.kernel.org/r/tencent_A0E82E0BEE925285F8156D540731DF805F05@qq.com
Signed-off-by: Alexei Starovoitov <ast@kernel.org>
		
	
			
		
			
				
	
	
		
			234 lines
		
	
	
	
		
			5 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			234 lines
		
	
	
	
		
			5 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
// SPDX-License-Identifier: GPL-2.0-only
 | 
						|
/*
 | 
						|
 * sampleip: sample instruction pointer and frequency count in a BPF map.
 | 
						|
 *
 | 
						|
 * Copyright 2016 Netflix, Inc.
 | 
						|
 */
 | 
						|
#include <stdio.h>
 | 
						|
#include <stdlib.h>
 | 
						|
#include <unistd.h>
 | 
						|
#include <errno.h>
 | 
						|
#include <signal.h>
 | 
						|
#include <string.h>
 | 
						|
#include <linux/perf_event.h>
 | 
						|
#include <linux/ptrace.h>
 | 
						|
#include <linux/bpf.h>
 | 
						|
#include <bpf/bpf.h>
 | 
						|
#include <bpf/libbpf.h>
 | 
						|
#include "perf-sys.h"
 | 
						|
#include "trace_helpers.h"
 | 
						|
 | 
						|
#define DEFAULT_FREQ	99
 | 
						|
#define DEFAULT_SECS	5
 | 
						|
#define MAX_IPS		8192
 | 
						|
 | 
						|
static int map_fd;
 | 
						|
static int nr_cpus;
 | 
						|
static long _text_addr;
 | 
						|
 | 
						|
static void usage(void)
 | 
						|
{
 | 
						|
	printf("USAGE: sampleip [-F freq] [duration]\n");
 | 
						|
	printf("       -F freq    # sample frequency (Hertz), default 99\n");
 | 
						|
	printf("       duration   # sampling duration (seconds), default 5\n");
 | 
						|
}
 | 
						|
 | 
						|
static int sampling_start(int freq, struct bpf_program *prog,
 | 
						|
			  struct bpf_link *links[])
 | 
						|
{
 | 
						|
	int i, pmu_fd;
 | 
						|
 | 
						|
	struct perf_event_attr pe_sample_attr = {
 | 
						|
		.type = PERF_TYPE_SOFTWARE,
 | 
						|
		.freq = 1,
 | 
						|
		.sample_period = freq,
 | 
						|
		.config = PERF_COUNT_SW_CPU_CLOCK,
 | 
						|
		.inherit = 1,
 | 
						|
	};
 | 
						|
 | 
						|
	for (i = 0; i < nr_cpus; i++) {
 | 
						|
		pmu_fd = sys_perf_event_open(&pe_sample_attr, -1 /* pid */, i,
 | 
						|
					    -1 /* group_fd */, 0 /* flags */);
 | 
						|
		if (pmu_fd < 0) {
 | 
						|
			fprintf(stderr, "ERROR: Initializing perf sampling\n");
 | 
						|
			return 1;
 | 
						|
		}
 | 
						|
		links[i] = bpf_program__attach_perf_event(prog, pmu_fd);
 | 
						|
		if (libbpf_get_error(links[i])) {
 | 
						|
			fprintf(stderr, "ERROR: Attach perf event\n");
 | 
						|
			links[i] = NULL;
 | 
						|
			close(pmu_fd);
 | 
						|
			return 1;
 | 
						|
		}
 | 
						|
	}
 | 
						|
 | 
						|
	return 0;
 | 
						|
}
 | 
						|
 | 
						|
static void sampling_end(struct bpf_link *links[])
 | 
						|
{
 | 
						|
	int i;
 | 
						|
 | 
						|
	for (i = 0; i < nr_cpus; i++)
 | 
						|
		bpf_link__destroy(links[i]);
 | 
						|
}
 | 
						|
 | 
						|
struct ipcount {
 | 
						|
	__u64 ip;
 | 
						|
	__u32 count;
 | 
						|
};
 | 
						|
 | 
						|
/* used for sorting */
 | 
						|
struct ipcount counts[MAX_IPS];
 | 
						|
 | 
						|
static int count_cmp(const void *p1, const void *p2)
 | 
						|
{
 | 
						|
	return ((struct ipcount *)p1)->count - ((struct ipcount *)p2)->count;
 | 
						|
}
 | 
						|
 | 
						|
static void print_ip_map(int fd)
 | 
						|
{
 | 
						|
	struct ksym *sym;
 | 
						|
	__u64 key, next_key;
 | 
						|
	__u32 value;
 | 
						|
	int i, max;
 | 
						|
 | 
						|
	printf("%-19s %-32s %s\n", "ADDR", "KSYM", "COUNT");
 | 
						|
 | 
						|
	/* fetch IPs and counts */
 | 
						|
	key = 0, i = 0;
 | 
						|
	while (bpf_map_get_next_key(fd, &key, &next_key) == 0) {
 | 
						|
		bpf_map_lookup_elem(fd, &next_key, &value);
 | 
						|
		counts[i].ip = next_key;
 | 
						|
		counts[i++].count = value;
 | 
						|
		key = next_key;
 | 
						|
	}
 | 
						|
	max = i;
 | 
						|
 | 
						|
	/* sort and print */
 | 
						|
	qsort(counts, max, sizeof(struct ipcount), count_cmp);
 | 
						|
	for (i = 0; i < max; i++) {
 | 
						|
		if (counts[i].ip > _text_addr) {
 | 
						|
			sym = ksym_search(counts[i].ip);
 | 
						|
			if (!sym) {
 | 
						|
				printf("ksym not found. Is kallsyms loaded?\n");
 | 
						|
				continue;
 | 
						|
			}
 | 
						|
 | 
						|
			printf("0x%-17llx %-32s %u\n", counts[i].ip, sym->name,
 | 
						|
			       counts[i].count);
 | 
						|
		} else {
 | 
						|
			printf("0x%-17llx %-32s %u\n", counts[i].ip, "(user)",
 | 
						|
			       counts[i].count);
 | 
						|
		}
 | 
						|
	}
 | 
						|
 | 
						|
	if (max == MAX_IPS) {
 | 
						|
		printf("WARNING: IP hash was full (max %d entries); ", max);
 | 
						|
		printf("may have dropped samples\n");
 | 
						|
	}
 | 
						|
}
 | 
						|
 | 
						|
static void int_exit(int sig)
 | 
						|
{
 | 
						|
	printf("\n");
 | 
						|
	print_ip_map(map_fd);
 | 
						|
	exit(0);
 | 
						|
}
 | 
						|
 | 
						|
int main(int argc, char **argv)
 | 
						|
{
 | 
						|
	int opt, freq = DEFAULT_FREQ, secs = DEFAULT_SECS, error = 1;
 | 
						|
	struct bpf_object *obj = NULL;
 | 
						|
	struct bpf_program *prog;
 | 
						|
	struct bpf_link **links;
 | 
						|
	char filename[256];
 | 
						|
 | 
						|
	/* process arguments */
 | 
						|
	while ((opt = getopt(argc, argv, "F:h")) != -1) {
 | 
						|
		switch (opt) {
 | 
						|
		case 'F':
 | 
						|
			freq = atoi(optarg);
 | 
						|
			break;
 | 
						|
		case 'h':
 | 
						|
		default:
 | 
						|
			usage();
 | 
						|
			return 0;
 | 
						|
		}
 | 
						|
	}
 | 
						|
	if (argc - optind == 1)
 | 
						|
		secs = atoi(argv[optind]);
 | 
						|
	if (freq == 0 || secs == 0) {
 | 
						|
		usage();
 | 
						|
		return 1;
 | 
						|
	}
 | 
						|
 | 
						|
	/* initialize kernel symbol translation */
 | 
						|
	if (load_kallsyms()) {
 | 
						|
		fprintf(stderr, "ERROR: loading /proc/kallsyms\n");
 | 
						|
		return 2;
 | 
						|
	}
 | 
						|
 | 
						|
	/* used to determine whether the address is kernel space */
 | 
						|
	_text_addr = ksym_get_addr("_text");
 | 
						|
	if (!_text_addr) {
 | 
						|
		fprintf(stderr, "ERROR: no '_text' in /proc/kallsyms\n");
 | 
						|
		return 3;
 | 
						|
	}
 | 
						|
 | 
						|
	/* create perf FDs for each CPU */
 | 
						|
	nr_cpus = sysconf(_SC_NPROCESSORS_ONLN);
 | 
						|
	links = calloc(nr_cpus, sizeof(struct bpf_link *));
 | 
						|
	if (!links) {
 | 
						|
		fprintf(stderr, "ERROR: malloc of links\n");
 | 
						|
		goto cleanup;
 | 
						|
	}
 | 
						|
 | 
						|
	snprintf(filename, sizeof(filename), "%s_kern.o", argv[0]);
 | 
						|
	obj = bpf_object__open_file(filename, NULL);
 | 
						|
	if (libbpf_get_error(obj)) {
 | 
						|
		fprintf(stderr, "ERROR: opening BPF object file failed\n");
 | 
						|
		obj = NULL;
 | 
						|
		goto cleanup;
 | 
						|
	}
 | 
						|
 | 
						|
	prog = bpf_object__find_program_by_name(obj, "do_sample");
 | 
						|
	if (!prog) {
 | 
						|
		fprintf(stderr, "ERROR: finding a prog in obj file failed\n");
 | 
						|
		goto cleanup;
 | 
						|
	}
 | 
						|
 | 
						|
	/* load BPF program */
 | 
						|
	if (bpf_object__load(obj)) {
 | 
						|
		fprintf(stderr, "ERROR: loading BPF object file failed\n");
 | 
						|
		goto cleanup;
 | 
						|
	}
 | 
						|
 | 
						|
	map_fd = bpf_object__find_map_fd_by_name(obj, "ip_map");
 | 
						|
	if (map_fd < 0) {
 | 
						|
		fprintf(stderr, "ERROR: finding a map in obj file failed\n");
 | 
						|
		goto cleanup;
 | 
						|
	}
 | 
						|
 | 
						|
	signal(SIGINT, int_exit);
 | 
						|
	signal(SIGTERM, int_exit);
 | 
						|
 | 
						|
	/* do sampling */
 | 
						|
	printf("Sampling at %d Hertz for %d seconds. Ctrl-C also ends.\n",
 | 
						|
	       freq, secs);
 | 
						|
	if (sampling_start(freq, prog, links) != 0)
 | 
						|
		goto cleanup;
 | 
						|
 | 
						|
	sleep(secs);
 | 
						|
	error = 0;
 | 
						|
 | 
						|
cleanup:
 | 
						|
	sampling_end(links);
 | 
						|
	/* output sample counts */
 | 
						|
	if (!error)
 | 
						|
		print_ip_map(map_fd);
 | 
						|
 | 
						|
	free(links);
 | 
						|
	bpf_object__close(obj);
 | 
						|
	return error;
 | 
						|
}
 |