mirror of
				https://github.com/torvalds/linux.git
				synced 2025-11-04 02:30:34 +02:00 
			
		
		
		
	The CPU map for a non-core PMU gives a default CPU value for perf_event_open. For core PMUs the CPU map lists all CPUs the evsel may be opened on. If there is more than one core PMU, the CPU maps will list the CPUs for that core PMU, but the user_requested_cpus may contain CPUs that are invalid for the PMU and cause perf_event_open to fail. To avoid this, when propagating the CPU map for core PMUs, intersect it with the CPU map of the PMU (the evsel's "own_cpus"). Add comments to __perf_evlist__propagate_maps to explain its somewhat complex behavior. Fix the related comments for system_wide in struct perf_evsel. Reviewed-by: Kan Liang <kan.liang@linux.intel.com> Signed-off-by: Ian Rogers <irogers@google.com> Cc: Adrian Hunter <adrian.hunter@intel.com> Cc: Alexander Shishkin <alexander.shishkin@linux.intel.com> Cc: Ali Saidi <alisaidi@amazon.com> Cc: Athira Rajeev <atrajeev@linux.vnet.ibm.com> Cc: Dmitrii Dolgov <9erthalion6@gmail.com> Cc: Huacai Chen <chenhuacai@kernel.org> Cc: Ingo Molnar <mingo@redhat.com> Cc: James Clark <james.clark@arm.com> Cc: Jing Zhang <renyu.zj@linux.alibaba.com> Cc: Jiri Olsa <jolsa@kernel.org> Cc: John Garry <john.g.garry@oracle.com> Cc: Kajol Jain <kjain@linux.ibm.com> Cc: Kang Minchul <tegongkang@gmail.com> Cc: Leo Yan <leo.yan@linaro.org> Cc: Madhavan Srinivasan <maddy@linux.ibm.com> Cc: Mark Rutland <mark.rutland@arm.com> Cc: Mike Leach <mike.leach@linaro.org> Cc: Ming Wang <wangming01@loongson.cn> Cc: Namhyung Kim <namhyung@kernel.org> Cc: Peter Zijlstra <peterz@infradead.org> Cc: Ravi Bangoria <ravi.bangoria@amd.com> Cc: Rob Herring <robh@kernel.org> Cc: Sandipan Das <sandipan.das@amd.com> Cc: Sean Christopherson <seanjc@google.com> Cc: Suzuki Poulouse <suzuki.poulose@arm.com> Cc: Thomas Richter <tmricht@linux.ibm.com> Cc: Will Deacon <will@kernel.org> Cc: Xing Zhengjun <zhengjun.xing@linux.intel.com> Cc: coresight@lists.linaro.org Cc: linux-arm-kernel@lists.infradead.org Link: 
https://lore.kernel.org/r/20230527072210.2900565-9-irogers@google.com Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
		
			
				
	
	
		
			91 lines
		
	
	
	
		
			2.8 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			91 lines
		
	
	
	
		
			2.8 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
/* SPDX-License-Identifier: GPL-2.0 */
 | 
						|
#ifndef __LIBPERF_INTERNAL_EVSEL_H
 | 
						|
#define __LIBPERF_INTERNAL_EVSEL_H
 | 
						|
 | 
						|
#include <linux/types.h>
 | 
						|
#include <linux/perf_event.h>
 | 
						|
#include <stdbool.h>
 | 
						|
#include <sys/types.h>
 | 
						|
#include <internal/cpumap.h>
 | 
						|
 | 
						|
/* Forward declarations: this header only holds pointers to these types. */
struct perf_thread_map;
struct xyarray;
 | 
						|
 | 
						|
/*
 | 
						|
 * Per fd, to map back from PERF_SAMPLE_ID to evsel, only used when there are
 | 
						|
 * more than one entry in the evlist.
 | 
						|
 */
 | 
						|
struct perf_sample_id {
 | 
						|
	struct hlist_node	 node;
 | 
						|
	u64			 id;
 | 
						|
	struct perf_evsel	*evsel;
 | 
						|
       /*
 | 
						|
	* 'idx' will be used for AUX area sampling. A sample will have AUX area
 | 
						|
	* data that will be queued for decoding, where there are separate
 | 
						|
	* queues for each CPU (per-cpu tracing) or task (per-thread tracing).
 | 
						|
	* The sample ID can be used to lookup 'idx' which is effectively the
 | 
						|
	* queue number.
 | 
						|
	*/
 | 
						|
	int			 idx;
 | 
						|
	struct perf_cpu		 cpu;
 | 
						|
	pid_t			 tid;
 | 
						|
 | 
						|
	/* Guest machine pid and VCPU, valid only if machine_pid is non-zero */
 | 
						|
	pid_t			 machine_pid;
 | 
						|
	struct perf_cpu		 vcpu;
 | 
						|
 | 
						|
	/* Holds total ID period value for PERF_SAMPLE_READ processing. */
 | 
						|
	u64			 period;
 | 
						|
};
 | 
						|
 | 
						|
struct perf_evsel {
 | 
						|
	struct list_head	 node;
 | 
						|
	struct perf_event_attr	 attr;
 | 
						|
	/** The commonly used cpu map of CPUs the event should be opened upon, etc. */
 | 
						|
	struct perf_cpu_map	*cpus;
 | 
						|
	/**
 | 
						|
	 * The cpu map read from the PMU. For core PMUs this is the list of all
 | 
						|
	 * CPUs the event can be opened upon. For other PMUs this is the default
 | 
						|
	 * cpu map for opening the event on, for example, the first CPU on a
 | 
						|
	 * socket for an uncore event.
 | 
						|
	 */
 | 
						|
	struct perf_cpu_map	*own_cpus;
 | 
						|
	struct perf_thread_map	*threads;
 | 
						|
	struct xyarray		*fd;
 | 
						|
	struct xyarray		*mmap;
 | 
						|
	struct xyarray		*sample_id;
 | 
						|
	u64			*id;
 | 
						|
	u32			 ids;
 | 
						|
	struct perf_evsel	*leader;
 | 
						|
 | 
						|
	/* parse modifier helper */
 | 
						|
	int			 nr_members;
 | 
						|
	/*
 | 
						|
	 * system_wide is for events that need to be on every CPU, irrespective
 | 
						|
	 * of user requested CPUs or threads. Tha main example of this is the
 | 
						|
	 * dummy event. Map propagation will set cpus for this event to all CPUs
 | 
						|
	 * as software PMU events like dummy, have a CPU map that is empty.
 | 
						|
	 */
 | 
						|
	bool			 system_wide;
 | 
						|
	/*
 | 
						|
	 * Some events, for example uncore events, require a CPU.
 | 
						|
	 * i.e. it cannot be the 'any CPU' value of -1.
 | 
						|
	 */
 | 
						|
	bool			 requires_cpu;
 | 
						|
	/** Is the PMU for the event a core one? Effects the handling of own_cpus. */
 | 
						|
	bool			 is_pmu_core;
 | 
						|
	int			 idx;
 | 
						|
};
 | 
						|
 | 
						|
/*
 * Internal evsel helpers; the definitions live outside this header.
 * NOTE(review): the grouping notes below are inferred from the names and
 * signatures only - confirm against the implementation.
 */

/* Initialise 'evsel' from 'attr' and 'idx'. */
void perf_evsel__init(struct perf_evsel *evsel, struct perf_event_attr *attr,
		      int idx);

/* File descriptor storage, sized by ncpus and nthreads. */
int perf_evsel__alloc_fd(struct perf_evsel *evsel, int ncpus, int nthreads);
void perf_evsel__close_fd(struct perf_evsel *evsel);
void perf_evsel__free_fd(struct perf_evsel *evsel);

int perf_evsel__read_size(struct perf_evsel *evsel);
int perf_evsel__apply_filter(struct perf_evsel *evsel, const char *filter);

/* Sample ID storage, sized by ncpus and nthreads. */
int perf_evsel__alloc_id(struct perf_evsel *evsel, int ncpus, int nthreads);
void perf_evsel__free_id(struct perf_evsel *evsel);
 | 
						|
 | 
						|
#endif /* __LIBPERF_INTERNAL_EVSEL_H */
 |