[<prev] [next>] [<thread-prev] [thread-next>] [day] [month] [year] [list]
Message-ID: <CAM9d7cgrx7vjLtnSt6Y4q+vtok=kSy6V83xe0c6cT6BVY2m-oA@mail.gmail.com>
Date: Mon, 4 Dec 2023 15:39:08 -0800
From: Namhyung Kim <namhyung@...nel.org>
To: Ian Rogers <irogers@...gle.com>
Cc: Peter Zijlstra <peterz@...radead.org>,
Ingo Molnar <mingo@...hat.com>,
Arnaldo Carvalho de Melo <acme@...nel.org>,
Mark Rutland <mark.rutland@....com>,
Alexander Shishkin <alexander.shishkin@...ux.intel.com>,
Jiri Olsa <jolsa@...nel.org>,
Adrian Hunter <adrian.hunter@...el.com>,
Nick Terrell <terrelln@...com>,
Kan Liang <kan.liang@...ux.intel.com>,
Andi Kleen <ak@...ux.intel.com>,
Kajol Jain <kjain@...ux.ibm.com>,
Athira Rajeev <atrajeev@...ux.vnet.ibm.com>,
Huacai Chen <chenhuacai@...nel.org>,
Masami Hiramatsu <mhiramat@...nel.org>,
Vincent Whitchurch <vincent.whitchurch@...s.com>,
"Steinar H. Gunderson" <sesse@...gle.com>,
Liam Howlett <liam.howlett@...cle.com>,
Miguel Ojeda <ojeda@...nel.org>,
Colin Ian King <colin.i.king@...il.com>,
Dmitrii Dolgov <9erthalion6@...il.com>,
Yang Jihong <yangjihong1@...wei.com>,
Ming Wang <wangming01@...ngson.cn>,
James Clark <james.clark@....com>,
K Prateek Nayak <kprateek.nayak@....com>,
Sean Christopherson <seanjc@...gle.com>,
Leo Yan <leo.yan@...aro.org>,
Ravi Bangoria <ravi.bangoria@....com>,
German Gomez <german.gomez@....com>,
Changbin Du <changbin.du@...wei.com>,
Paolo Bonzini <pbonzini@...hat.com>, Li Dong <lidong@...o.com>,
Sandipan Das <sandipan.das@....com>,
liuwenyu <liuwenyu7@...wei.com>, linux-kernel@...r.kernel.org,
linux-perf-users@...r.kernel.org,
Guilherme Amadio <amadio@...too.org>
Subject: Re: [PATCH v5 12/50] perf map: Simplify map_ip/unmap_ip and make map
size smaller
Hi Ian,
On Mon, Nov 27, 2023 at 2:09 PM Ian Rogers <irogers@...gle.com> wrote:
>
> When mapping an IP it is either an identity mapping or a DSO relative
> mapping, so a single bit is required in the struct to identify
> this. The current code uses function pointers, adding 2 pointers per
> map and also pushing the size of a map beyond 1 cache line. Switch to
> using a byte to identify the mapping type (as well as priv and
> erange_warned), to avoid any masking. Change struct map's layout to
> avoid holes.
>
> Before:
> ```
> struct map {
> u64 start; /* 0 8 */
> u64 end; /* 8 8 */
> _Bool erange_warned:1; /* 16: 0 1 */
> _Bool priv:1; /* 16: 1 1 */
>
> /* XXX 6 bits hole, try to pack */
> /* XXX 3 bytes hole, try to pack */
>
> u32 prot; /* 20 4 */
> u64 pgoff; /* 24 8 */
> u64 reloc; /* 32 8 */
> u64 (*map_ip)(const struct map *, u64); /* 40 8 */
> u64 (*unmap_ip)(const struct map *, u64); /* 48 8 */
> struct dso * dso; /* 56 8 */
> /* --- cacheline 1 boundary (64 bytes) --- */
> refcount_t refcnt; /* 64 4 */
> u32 flags; /* 68 4 */
>
> /* size: 72, cachelines: 2, members: 12 */
> /* sum members: 68, holes: 1, sum holes: 3 */
> /* sum bitfield members: 2 bits, bit holes: 1, sum bit holes: 6 bits */
> /* last cacheline: 8 bytes */
> };
> ```
>
> After:
> ```
> struct map {
> u64 start; /* 0 8 */
> u64 end; /* 8 8 */
> u64 pgoff; /* 16 8 */
> u64 reloc; /* 24 8 */
> struct dso * dso; /* 32 8 */
> refcount_t refcnt; /* 40 4 */
> u32 prot; /* 44 4 */
> u32 flags; /* 48 4 */
> enum mapping_type mapping_type:8; /* 52: 0 4 */
>
> /* Bitfield combined with next fields */
>
> _Bool erange_warned; /* 53 1 */
> _Bool priv; /* 54 1 */
>
> /* size: 56, cachelines: 1, members: 11 */
> /* padding: 1 */
> /* last cacheline: 56 bytes */
> };
> ```
Thanks for doing this! I really wanted to clean up the map
code and to make it more intuitive.
>
> Signed-off-by: Ian Rogers <irogers@...gle.com>
Acked-by: Namhyung Kim <namhyung@...nel.org>
A few nitpicks below.
> ---
> tools/perf/util/machine.c | 3 +-
> tools/perf/util/map.c | 20 +--------
> tools/perf/util/map.h | 83 +++++++++++++++++++-----------------
> tools/perf/util/symbol-elf.c | 6 +--
> tools/perf/util/symbol.c | 6 +--
> 5 files changed, 50 insertions(+), 68 deletions(-)
>
> diff --git a/tools/perf/util/machine.c b/tools/perf/util/machine.c
> index be3dab9d5253..b6831a1f909d 100644
> --- a/tools/perf/util/machine.c
> +++ b/tools/perf/util/machine.c
> @@ -1360,8 +1360,7 @@ __machine__create_kernel_maps(struct machine *machine, struct dso *kernel)
> if (machine->vmlinux_map == NULL)
> return -ENOMEM;
>
> - map__set_map_ip(machine->vmlinux_map, identity__map_ip);
> - map__set_unmap_ip(machine->vmlinux_map, identity__map_ip);
> + map__set_mapping_type(machine->vmlinux_map, MAPPING_TYPE__IDENTITY);
> return maps__insert(machine__kernel_maps(machine), machine->vmlinux_map);
> }
>
> diff --git a/tools/perf/util/map.c b/tools/perf/util/map.c
> index f64b83004421..54c67cb7ecef 100644
> --- a/tools/perf/util/map.c
> +++ b/tools/perf/util/map.c
> @@ -109,8 +109,7 @@ void map__init(struct map *map, u64 start, u64 end, u64 pgoff, struct dso *dso)
> map__set_pgoff(map, pgoff);
> map__set_reloc(map, 0);
> map__set_dso(map, dso__get(dso));
> - map__set_map_ip(map, map__dso_map_ip);
> - map__set_unmap_ip(map, map__dso_unmap_ip);
> + map__set_mapping_type(map, MAPPING_TYPE__DSO);
> map__set_erange_warned(map, false);
> refcount_set(map__refcnt(map), 1);
> }
> @@ -172,7 +171,7 @@ struct map *map__new(struct machine *machine, u64 start, u64 len,
> map__init(result, start, start + len, pgoff, dso);
>
> if (anon || no_dso) {
> - map->map_ip = map->unmap_ip = identity__map_ip;
> + map->mapping_type = MAPPING_TYPE__IDENTITY;
>
> /*
> * Set memory without DSO as loaded. All map__find_*
> @@ -630,18 +629,3 @@ struct maps *map__kmaps(struct map *map)
> }
> return kmap->kmaps;
> }
> -
> -u64 map__dso_map_ip(const struct map *map, u64 ip)
> -{
> - return ip - map__start(map) + map__pgoff(map);
> -}
> -
> -u64 map__dso_unmap_ip(const struct map *map, u64 ip)
> -{
> - return ip + map__start(map) - map__pgoff(map);
> -}
> -
> -u64 identity__map_ip(const struct map *map __maybe_unused, u64 ip)
> -{
> - return ip;
> -}
> diff --git a/tools/perf/util/map.h b/tools/perf/util/map.h
> index 1b53d53adc86..3a3b7757da5f 100644
> --- a/tools/perf/util/map.h
> +++ b/tools/perf/util/map.h
> @@ -16,23 +16,25 @@ struct dso;
> struct maps;
> struct machine;
>
> +enum mapping_type {
> + /* map__map_ip/map__unmap_ip are given as offsets in the DSO. */
> + MAPPING_TYPE__DSO,
I slightly prefer __PIC over __DSO, but won't argue. :)
> + /* map__map_ip/map__unmap_ip are just the given ip value. */
> + MAPPING_TYPE__IDENTITY,
> +};
> +
> DECLARE_RC_STRUCT(map) {
> u64 start;
> u64 end;
> - bool erange_warned:1;
> - bool priv:1;
> - u32 prot;
> u64 pgoff;
> u64 reloc;
> -
> - /* ip -> dso rip */
> - u64 (*map_ip)(const struct map *, u64);
> - /* dso rip -> ip */
> - u64 (*unmap_ip)(const struct map *, u64);
> -
> struct dso *dso;
> refcount_t refcnt;
> + u32 prot;
> u32 flags;
> + enum mapping_type mapping_type:8;
> + bool erange_warned;
> + bool priv;
> };
>
> struct kmap;
> @@ -41,38 +43,11 @@ struct kmap *__map__kmap(struct map *map);
> struct kmap *map__kmap(struct map *map);
> struct maps *map__kmaps(struct map *map);
>
> -/* ip -> dso rip */
> -u64 map__dso_map_ip(const struct map *map, u64 ip);
> -/* dso rip -> ip */
> -u64 map__dso_unmap_ip(const struct map *map, u64 ip);
> -/* Returns ip */
> -u64 identity__map_ip(const struct map *map __maybe_unused, u64 ip);
> -
> static inline struct dso *map__dso(const struct map *map)
> {
> return RC_CHK_ACCESS(map)->dso;
> }
>
> -static inline u64 map__map_ip(const struct map *map, u64 ip)
> -{
> - return RC_CHK_ACCESS(map)->map_ip(map, ip);
> -}
> -
> -static inline u64 map__unmap_ip(const struct map *map, u64 ip)
> -{
> - return RC_CHK_ACCESS(map)->unmap_ip(map, ip);
> -}
> -
> -static inline void *map__map_ip_ptr(struct map *map)
> -{
> - return RC_CHK_ACCESS(map)->map_ip;
> -}
> -
> -static inline void* map__unmap_ip_ptr(struct map *map)
> -{
> - return RC_CHK_ACCESS(map)->unmap_ip;
> -}
> -
> static inline u64 map__start(const struct map *map)
> {
> return RC_CHK_ACCESS(map)->start;
> @@ -123,6 +98,34 @@ static inline size_t map__size(const struct map *map)
> return map__end(map) - map__start(map);
> }
>
> +/* ip -> dso rip */
> +static inline u64 map__dso_map_ip(const struct map *map, u64 ip)
> +{
> + return ip - map__start(map) + map__pgoff(map);
> +}
> +
> +/* dso rip -> ip */
> +static inline u64 map__dso_unmap_ip(const struct map *map, u64 ip)
I think it's better to name the parameter 'rip' here, consistent with the
"dso rip -> ip" comment, if possible.
Thanks,
Namhyung
> +{
> + return ip + map__start(map) - map__pgoff(map);
> +}
> +
> +static inline u64 map__map_ip(const struct map *map, u64 ip)
> +{
> + if ((RC_CHK_ACCESS(map)->mapping_type) == MAPPING_TYPE__DSO)
> + return map__dso_map_ip(map, ip);
> + else
> + return ip;
> +}
> +
> +static inline u64 map__unmap_ip(const struct map *map, u64 ip)
> +{
> + if ((RC_CHK_ACCESS(map)->mapping_type) == MAPPING_TYPE__DSO)
> + return map__dso_unmap_ip(map, ip);
> + else
> + return ip;
> +}
> +
> /* rip/ip <-> addr suitable for passing to `objdump --start-address=` */
> u64 map__rip_2objdump(struct map *map, u64 rip);
>
> @@ -294,13 +297,13 @@ static inline void map__set_dso(struct map *map, struct dso *dso)
> RC_CHK_ACCESS(map)->dso = dso;
> }
>
> -static inline void map__set_map_ip(struct map *map, u64 (*map_ip)(const struct map *map, u64 ip))
> +static inline void map__set_mapping_type(struct map *map, enum mapping_type type)
> {
> - RC_CHK_ACCESS(map)->map_ip = map_ip;
> + RC_CHK_ACCESS(map)->mapping_type = type;
> }
>
> -static inline void map__set_unmap_ip(struct map *map, u64 (*unmap_ip)(const struct map *map, u64 rip))
> +static inline enum mapping_type map__mapping_type(struct map *map)
> {
> - RC_CHK_ACCESS(map)->unmap_ip = unmap_ip;
> + return RC_CHK_ACCESS(map)->mapping_type;
> }
> #endif /* __PERF_MAP_H */
> diff --git a/tools/perf/util/symbol-elf.c b/tools/perf/util/symbol-elf.c
> index 9e7eeaf616b8..4b934ed3bfd1 100644
> --- a/tools/perf/util/symbol-elf.c
> +++ b/tools/perf/util/symbol-elf.c
> @@ -1392,8 +1392,7 @@ static int dso__process_kernel_symbol(struct dso *dso, struct map *map,
> map__set_start(map, shdr->sh_addr + ref_reloc(kmap));
> map__set_end(map, map__start(map) + shdr->sh_size);
> map__set_pgoff(map, shdr->sh_offset);
> - map__set_map_ip(map, map__dso_map_ip);
> - map__set_unmap_ip(map, map__dso_unmap_ip);
> + map__set_mapping_type(map, MAPPING_TYPE__DSO);
> /* Ensure maps are correctly ordered */
> if (kmaps) {
> int err;
> @@ -1455,8 +1454,7 @@ static int dso__process_kernel_symbol(struct dso *dso, struct map *map,
> map__set_end(curr_map, map__start(curr_map) + shdr->sh_size);
> map__set_pgoff(curr_map, shdr->sh_offset);
> } else {
> - map__set_map_ip(curr_map, identity__map_ip);
> - map__set_unmap_ip(curr_map, identity__map_ip);
> + map__set_mapping_type(curr_map, MAPPING_TYPE__IDENTITY);
> }
> curr_dso->symtab_type = dso->symtab_type;
> if (maps__insert(kmaps, curr_map))
> diff --git a/tools/perf/util/symbol.c b/tools/perf/util/symbol.c
> index 82cc74b9358e..314c0263bf3c 100644
> --- a/tools/perf/util/symbol.c
> +++ b/tools/perf/util/symbol.c
> @@ -956,8 +956,7 @@ static int maps__split_kallsyms(struct maps *kmaps, struct dso *dso, u64 delta,
> return -1;
> }
>
> - map__set_map_ip(curr_map, identity__map_ip);
> - map__set_unmap_ip(curr_map, identity__map_ip);
> + map__set_mapping_type(curr_map, MAPPING_TYPE__IDENTITY);
> if (maps__insert(kmaps, curr_map)) {
> dso__put(ndso);
> return -1;
> @@ -1475,8 +1474,7 @@ static int dso__load_kcore(struct dso *dso, struct map *map,
> map__set_start(map, map__start(new_map));
> map__set_end(map, map__end(new_map));
> map__set_pgoff(map, map__pgoff(new_map));
> - map__set_map_ip(map, map__map_ip_ptr(new_map));
> - map__set_unmap_ip(map, map__unmap_ip_ptr(new_map));
> + map__set_mapping_type(map, map__mapping_type(new_map));
> /* Ensure maps are correctly ordered */
> map_ref = map__get(map);
> maps__remove(kmaps, map_ref);
> --
> 2.43.0.rc1.413.gea7ed67945-goog
>
Powered by blists - more mailing lists