Commit 74b873e4 authored by Peter Zijlstra

objtool: Optimize find_rela_by_dest_range()

Perf shows there is significant time in find_rela_by_dest(); this is
because we have to iterate the address space per byte, looking for
relocation entries.

Optimize this by reducing the address space granularity.

This reduces objtool on vmlinux.o runtime from 4.8 to 4.4 seconds.
Signed-off-by: Peter Zijlstra (Intel) <peterz@infradead.org>
Reviewed-by: Miroslav Benes <mbenes@suse.cz>
Acked-by: Josh Poimboeuf <jpoimboe@redhat.com>
Link: https://lkml.kernel.org/r/20200324160924.861321325@infradead.org
parent 8887a86e
...@@ -215,7 +215,7 @@ struct symbol *find_symbol_by_name(struct elf *elf, const char *name) ...@@ -215,7 +215,7 @@ struct symbol *find_symbol_by_name(struct elf *elf, const char *name)
struct rela *find_rela_by_dest_range(struct elf *elf, struct section *sec, struct rela *find_rela_by_dest_range(struct elf *elf, struct section *sec,
unsigned long offset, unsigned int len) unsigned long offset, unsigned int len)
{ {
struct rela *rela; struct rela *rela, *r = NULL;
unsigned long o; unsigned long o;
if (!sec->rela) if (!sec->rela)
...@@ -223,12 +223,19 @@ struct rela *find_rela_by_dest_range(struct elf *elf, struct section *sec, ...@@ -223,12 +223,19 @@ struct rela *find_rela_by_dest_range(struct elf *elf, struct section *sec,
sec = sec->rela; sec = sec->rela;
for (o = offset; o < offset + len; o++) { for_offset_range(o, offset, offset + len) {
hash_for_each_possible(elf->rela_hash, rela, hash, hash_for_each_possible(elf->rela_hash, rela, hash,
sec_offset_hash(sec, o)) { sec_offset_hash(sec, o)) {
if (rela->sec == sec && rela->offset == o) if (rela->sec != sec)
return rela; continue;
if (rela->offset >= offset && rela->offset < offset + len) {
if (!r || rela->offset < r->offset)
r = rela;
}
} }
if (r)
return r;
} }
return NULL; return NULL;
......
...@@ -83,9 +83,23 @@ struct elf { ...@@ -83,9 +83,23 @@ struct elf {
DECLARE_HASHTABLE(rela_hash, 20); DECLARE_HASHTABLE(rela_hash, 20);
}; };
#define OFFSET_STRIDE_BITS 4
#define OFFSET_STRIDE (1UL << OFFSET_STRIDE_BITS)
#define OFFSET_STRIDE_MASK (~(OFFSET_STRIDE - 1))
#define for_offset_range(_offset, _start, _end) \
for (_offset = ((_start) & OFFSET_STRIDE_MASK); \
_offset <= ((_end) & OFFSET_STRIDE_MASK); \
_offset += OFFSET_STRIDE)
static inline u32 sec_offset_hash(struct section *sec, unsigned long offset) static inline u32 sec_offset_hash(struct section *sec, unsigned long offset)
{ {
u32 ol = offset, oh = offset >> 32, idx = sec->idx; u32 ol, oh, idx = sec->idx;
offset &= OFFSET_STRIDE_MASK;
ol = offset;
oh = offset >> 32;
__jhash_mix(ol, oh, idx); __jhash_mix(ol, oh, idx);
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment