lists.openwall.net   lists  /  announce  owl-users  owl-dev  john-users  john-dev  passwdqc-users  yescrypt  popa3d-users  /  oss-security  kernel-hardening  musl  sabotage  tlsify  passwords  /  crypt-dev  xvendor  /  Bugtraq  Full-Disclosure  linux-kernel  linux-netdev  linux-ext4  linux-hardening  linux-cve-announce  PHC 
Open Source and information security mailing list archives
 
Hash Suite: Windows password security audit tool. GUI, reports in PDF.
[<prev] [next>] [<thread-prev] [thread-next>] [day] [month] [year] [list]
Message-ID: <53C56D55.5020303@intel.com>
Date:	Tue, 15 Jul 2014 21:05:09 +0300
From:	Adrian Hunter <adrian.hunter@...el.com>
To:	Arnaldo Carvalho de Melo <acme@...nel.org>
CC:	Peter Zijlstra <peterz@...radead.org>,
	linux-kernel@...r.kernel.org, David Ahern <dsahern@...il.com>,
	Frederic Weisbecker <fweisbec@...il.com>,
	Jiri Olsa <jolsa@...hat.com>,
	Namhyung Kim <namhyung@...il.com>,
	Paul Mackerras <paulus@...ba.org>,
	Stephane Eranian <eranian@...gle.com>
Subject: Re: [PATCH 34/41] perf evlist: Add 'system_wide' option

On 15/07/2014 6:03 p.m., Arnaldo Carvalho de Melo wrote:
> Em Mon, Jul 14, 2014 at 01:02:58PM +0300, Adrian Hunter escreveu:
>> Add an option to cause a selected event
>> to be opened always without a pid when
>> configured by perf_evsel__config().
>>
>> This is needed when using the sched_switch
>> tracepoint to follow object code execution.
>> sched_switch occurs before the task
>> switch and so it cannot record it in a
>> context limited to that task.  Note
>> that also means that sched_switch is
>> useless when capturing data per-thread,
>> as is the 'context-switches' software
>> event for the same reason.
>
> Clever, but hmm, we need to be judicious when allocating things like the
> pollfd, I think; more below...
>
> ... after going through the whole patch, it's not clear how pollfd usage
> takes into account the fact that some of the evsels don't have
> thread_map->nr entries, but just one; will continue reading...
>
>> Signed-off-by: Adrian Hunter <adrian.hunter@...el.com>
>> ---
>>   tools/perf/util/evlist.c | 45 +++++++++++++++++++++++++++++++++++++--------
>>   tools/perf/util/evsel.c  | 31 ++++++++++++++++++++++++++-----
>>   tools/perf/util/evsel.h  |  1 +
>>   3 files changed, 64 insertions(+), 13 deletions(-)
>>
>> diff --git a/tools/perf/util/evlist.c b/tools/perf/util/evlist.c
>> index 282e83e..c295b7b 100644
>> --- a/tools/perf/util/evlist.c
>> +++ b/tools/perf/util/evlist.c
>> @@ -265,17 +265,27 @@ int perf_evlist__add_newtp(struct perf_evlist *evlist,
>>   	return 0;
>>   }
>>
>> +static int perf_evlist__nr_threads(struct perf_evlist *evlist,
>> +				   struct perf_evsel *evsel)
>> +{
>> +	if (evsel->system_wide)
>> +		return 1;
>> +	else
>> +		return thread_map__nr(evlist->threads);
>> +}
>> +
>>   void perf_evlist__disable(struct perf_evlist *evlist)
>>   {
>>   	int cpu, thread;
>>   	struct perf_evsel *pos;
>>   	int nr_cpus = cpu_map__nr(evlist->cpus);
>> -	int nr_threads = thread_map__nr(evlist->threads);
>> +	int nr_threads;
>>
>>   	for (cpu = 0; cpu < nr_cpus; cpu++) {
>>   		evlist__for_each(evlist, pos) {
>>   			if (!perf_evsel__is_group_leader(pos) || !pos->fd)
>>   				continue;
>> +			nr_threads = perf_evlist__nr_threads(evlist, pos);
>>   			for (thread = 0; thread < nr_threads; thread++)
>>   				ioctl(FD(pos, cpu, thread),
>>   				      PERF_EVENT_IOC_DISABLE, 0);
>> @@ -288,12 +298,13 @@ void perf_evlist__enable(struct perf_evlist *evlist)
>>   	int cpu, thread;
>>   	struct perf_evsel *pos;
>>   	int nr_cpus = cpu_map__nr(evlist->cpus);
>> -	int nr_threads = thread_map__nr(evlist->threads);
>> +	int nr_threads;
>>
>>   	for (cpu = 0; cpu < nr_cpus; cpu++) {
>>   		evlist__for_each(evlist, pos) {
>>   			if (!perf_evsel__is_group_leader(pos) || !pos->fd)
>>   				continue;
>> +			nr_threads = perf_evlist__nr_threads(evlist, pos);
>>   			for (thread = 0; thread < nr_threads; thread++)
>>   				ioctl(FD(pos, cpu, thread),
>>   				      PERF_EVENT_IOC_ENABLE, 0);
>> @@ -305,12 +316,14 @@ int perf_evlist__disable_event(struct perf_evlist *evlist,
>>   			       struct perf_evsel *evsel)
>>   {
>>   	int cpu, thread, err;
>> +	int nr_cpus = cpu_map__nr(evlist->cpus);
>> +	int nr_threads = perf_evlist__nr_threads(evlist, evsel);
>>
>>   	if (!evsel->fd)
>>   		return 0;
>>
>> -	for (cpu = 0; cpu < evlist->cpus->nr; cpu++) {
>> -		for (thread = 0; thread < evlist->threads->nr; thread++) {
>> +	for (cpu = 0; cpu < nr_cpus; cpu++) {
>> +		for (thread = 0; thread < nr_threads; thread++) {
>>   			err = ioctl(FD(evsel, cpu, thread),
>>   				    PERF_EVENT_IOC_DISABLE, 0);
>>   			if (err)
>> @@ -324,12 +337,14 @@ int perf_evlist__enable_event(struct perf_evlist *evlist,
>>   			      struct perf_evsel *evsel)
>>   {
>>   	int cpu, thread, err;
>> +	int nr_cpus = cpu_map__nr(evlist->cpus);
>> +	int nr_threads = perf_evlist__nr_threads(evlist, evsel);
>>
>>   	if (!evsel->fd)
>>   		return -EINVAL;
>>
>> -	for (cpu = 0; cpu < evlist->cpus->nr; cpu++) {
>> -		for (thread = 0; thread < evlist->threads->nr; thread++) {
>> +	for (cpu = 0; cpu < nr_cpus; cpu++) {
>> +		for (thread = 0; thread < nr_threads; thread++) {
>>   			err = ioctl(FD(evsel, cpu, thread),
>>   				    PERF_EVENT_IOC_ENABLE, 0);
>>   			if (err)
>
> All the above seems ok, the threads (x axis) array is flat when syswide, ok.
>
>> @@ -343,7 +358,16 @@ static int perf_evlist__alloc_pollfd(struct perf_evlist *evlist)
>>   {
>>   	int nr_cpus = cpu_map__nr(evlist->cpus);
>>   	int nr_threads = thread_map__nr(evlist->threads);
>> -	int nfds = nr_cpus * nr_threads * evlist->nr_entries;
>> +	int nfds = 0;
>> +	struct perf_evsel *evsel;
>> +
>> +	list_for_each_entry(evsel, &evlist->entries, node) {
>> +		if (evsel->system_wide)
>> +			nfds += nr_cpus;
>> +		else
>> +			nfds += nr_cpus * nr_threads;
>> +	}
>
> But this looks tricky; will look at how evlist->pollfd is used...
>
>> +
>>   	evlist->pollfd = malloc(sizeof(struct pollfd) * nfds);
>>   	return evlist->pollfd != NULL ? 0 : -ENOMEM;
>>   }
>> @@ -636,7 +660,12 @@ static int perf_evlist__mmap_per_evsel(struct perf_evlist *evlist, int idx,
>>   	struct perf_evsel *evsel;
>>
>>   	evlist__for_each(evlist, evsel) {
>> -		int fd = FD(evsel, cpu, thread);
>> +		int fd;
>> +
>> +		if (evsel->system_wide && thread)
>> +			continue;
>
> Discard after thread 0, i.e. the first, ok.
>
>> +
>> +		fd = FD(evsel, cpu, thread);
>>
>>   		if (*output == -1) {
>>   			*output = fd;
>> diff --git a/tools/perf/util/evsel.c b/tools/perf/util/evsel.c
>> index 90f58cd..7540b5f 100644
>> --- a/tools/perf/util/evsel.c
>> +++ b/tools/perf/util/evsel.c
>> @@ -691,6 +691,10 @@ void perf_evsel__config(struct perf_evsel *evsel, struct record_opts *opts)
>>   int perf_evsel__alloc_fd(struct perf_evsel *evsel, int ncpus, int nthreads)
>>   {
>>   	int cpu, thread;
>> +
>> +	if (evsel->system_wide)
>> +		nthreads = 1;
>
> flatten it, ok
>
>> +
>>   	evsel->fd = xyarray__new(ncpus, nthreads, sizeof(int));
>>
>>   	if (evsel->fd) {
>> @@ -709,6 +713,9 @@ static int perf_evsel__run_ioctl(struct perf_evsel *evsel, int ncpus, int nthrea
>>   {
>>   	int cpu, thread;
>>
>> +	if (evsel->system_wide)
>> +		nthreads = 1;
>> +
>
> Ditto.
>
>>   	for (cpu = 0; cpu < ncpus; cpu++) {
>>   		for (thread = 0; thread < nthreads; thread++) {
>>   			int fd = FD(evsel, cpu, thread),
>> @@ -739,6 +746,9 @@ int perf_evsel__enable(struct perf_evsel *evsel, int ncpus, int nthreads)
>>
>>   int perf_evsel__alloc_id(struct perf_evsel *evsel, int ncpus, int nthreads)
>>   {
>> +	if (evsel->system_wide)
>> +		nthreads = 1;
>> +
>>   	evsel->sample_id = xyarray__new(ncpus, nthreads, sizeof(struct perf_sample_id));
>
> These are per evsel, so can be flattened when we get to it;
> evlist->pollfd is per evlist, so it mixes syswide with !syswide, which is why I'm scratching my head at this
> point...

pollfd is not a 2-dimensional array.  It is just a 1-dimensional array.
So it just needs to be the right length.

>
>>   	if (evsel->sample_id == NULL)
>>   		return -ENOMEM;
>> @@ -783,6 +793,9 @@ void perf_evsel__close_fd(struct perf_evsel *evsel, int ncpus, int nthreads)
>>   {
>>   	int cpu, thread;
>>
>> +	if (evsel->system_wide)
>> +		nthreads = 1;
>> +
>>   	for (cpu = 0; cpu < ncpus; cpu++)
>>   		for (thread = 0; thread < nthreads; ++thread) {
>>   			close(FD(evsel, cpu, thread));
>> @@ -871,6 +884,9 @@ int __perf_evsel__read(struct perf_evsel *evsel,
>>   	int cpu, thread;
>>   	struct perf_counts_values *aggr = &evsel->counts->aggr, count;
>>
>> +	if (evsel->system_wide)
>> +		nthreads = 1;
>> +
>>   	aggr->val = aggr->ena = aggr->run = 0;
>>
>>   	for (cpu = 0; cpu < ncpus; cpu++) {
>> @@ -993,13 +1009,18 @@ static size_t perf_event_attr__fprintf(struct perf_event_attr *attr, FILE *fp)
>>   static int __perf_evsel__open(struct perf_evsel *evsel, struct cpu_map *cpus,
>>   			      struct thread_map *threads)
>>   {
>> -	int cpu, thread;
>> +	int cpu, thread, nthreads;
>>   	unsigned long flags = 0;
>>   	int pid = -1, err;
>>   	enum { NO_CHANGE, SET_TO_MAX, INCREASED_MAX } set_rlimit = NO_CHANGE;
>>
>> +	if (evsel->system_wide)
>> +		nthreads = 1;
>> +	else
>> +		nthreads = threads->nr;
>> +
>>   	if (evsel->fd == NULL &&
>> -	    perf_evsel__alloc_fd(evsel, cpus->nr, threads->nr) < 0)
>> +	    perf_evsel__alloc_fd(evsel, cpus->nr, nthreads) < 0)
>>   		return -ENOMEM;
>>
>>   	if (evsel->cgrp) {
>> @@ -1021,10 +1042,10 @@ retry_sample_id:
>>
>>   	for (cpu = 0; cpu < cpus->nr; cpu++) {
>>
>> -		for (thread = 0; thread < threads->nr; thread++) {
>> +		for (thread = 0; thread < nthreads; thread++) {
>>   			int group_fd;
>>
>> -			if (!evsel->cgrp)
>> +			if (!evsel->cgrp && !evsel->system_wide)
>>   				pid = threads->map[thread];
>>
>>   			group_fd = get_group_fd(evsel, cpu, thread);
>> @@ -1094,7 +1115,7 @@ out_close:
>>   			close(FD(evsel, cpu, thread));
>>   			FD(evsel, cpu, thread) = -1;
>>   		}
>> -		thread = threads->nr;
>> +		thread = nthreads;
>>   	} while (--cpu >= 0);
>>   	return err;
>>   }
>> diff --git a/tools/perf/util/evsel.h b/tools/perf/util/evsel.h
>> index d7f93ce..dbb2a0d 100644
>> --- a/tools/perf/util/evsel.h
>> +++ b/tools/perf/util/evsel.h
>> @@ -85,6 +85,7 @@ struct perf_evsel {
>>   	bool 			needs_swap;
>>   	bool			no_aux_samples;
>>   	bool			immediate;
>> +	bool			system_wide;
>>   	/* parse modifier helper */
>>   	int			exclude_GH;
>>   	int			nr_members;
>> --
>> 1.8.3.2
--
To unsubscribe from this list: send the line "unsubscribe linux-kernel" in
the body of a message to majordomo@...r.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html
Please read the FAQ at  http://www.tux.org/lkml/

Powered by blists - more mailing lists

Powered by Openwall GNU/*/Linux Powered by OpenVZ