]> www.infradead.org Git - users/dwmw2/linux.git/commitdiff
objtool: Introduce CFI hash
authorPeter Zijlstra <peterz@infradead.org>
Thu, 24 Jun 2021 09:41:01 +0000 (11:41 +0200)
committerGreg Kroah-Hartman <gregkh@linuxfoundation.org>
Mon, 25 Jul 2022 09:26:22 +0000 (11:26 +0200)
commit 8b946cc38e063f0f7bb67789478c38f6d7d457c9 upstream.

Andi reported that objtool on vmlinux.o consumes more memory than his
system has, leading to horrific performance.

This is in part because we keep a struct instruction for every
instruction in the file in-memory. Shrink struct instruction by
removing the CFI state (which includes full register state) from it
and demand allocating it.

Given most instructions don't actually change CFI state, there's lots
of repetition there, so add a hash table to find previous CFI
instances.

Reduces memory consumption (and runtime) for processing an
x86_64-allyesconfig:

  pre:  4:40.84 real,   143.99 user,    44.18 sys,      30624988 mem
  post: 2:14.61 real,   108.58 user,    25.04 sys,      16396184 mem

Suggested-by: Andi Kleen <andi@firstfloor.org>
Signed-off-by: Peter Zijlstra (Intel) <peterz@infradead.org>
Link: https://lore.kernel.org/r/20210624095147.756759107@infradead.org
Signed-off-by: Thadeu Lima de Souza Cascardo <cascardo@canonical.com>
[bwh: Backported to 5.10:
 - Don't use bswap_if_needed() since we don't have any of the other fixes
   for mixed-endian cross-compilation
 - Since we don't have "objtool: Rewrite hashtable sizing", make
   cfi_hash_alloc() set the number of bits similarly to elf_hash_bits()
 - objtool doesn't have any mcount handling
 - Adjust context]
Signed-off-by: Ben Hutchings <ben@decadent.org.uk>
Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
tools/objtool/arch.h
tools/objtool/arch/x86/decode.c
tools/objtool/cfi.h
tools/objtool/check.c
tools/objtool/check.h
tools/objtool/orc_gen.c

index 8918de4f81898ef6939cfb5d5c7e7a0ee30fcbed..35e3f94413ebd8ddfe882324fef2944ceb22c3a4 100644 (file)
@@ -84,7 +84,7 @@ unsigned long arch_dest_reloc_offset(int addend);
 
 const char *arch_nop_insn(int len);
 
-int arch_decode_hint_reg(struct instruction *insn, u8 sp_reg);
+int arch_decode_hint_reg(u8 sp_reg, int *base);
 
 bool arch_is_retpoline(struct symbol *sym);
 
index 99b47720dce9b6022bea9b1a93ccdbc44daf7c78..5005a4811157b95b849d63568bd382413418918b 100644 (file)
@@ -706,34 +706,32 @@ int arch_rewrite_retpolines(struct objtool_file *file)
        return 0;
 }
 
-int arch_decode_hint_reg(struct instruction *insn, u8 sp_reg)
+int arch_decode_hint_reg(u8 sp_reg, int *base)
 {
-       struct cfi_reg *cfa = &insn->cfi.cfa;
-
        switch (sp_reg) {
        case ORC_REG_UNDEFINED:
-               cfa->base = CFI_UNDEFINED;
+               *base = CFI_UNDEFINED;
                break;
        case ORC_REG_SP:
-               cfa->base = CFI_SP;
+               *base = CFI_SP;
                break;
        case ORC_REG_BP:
-               cfa->base = CFI_BP;
+               *base = CFI_BP;
                break;
        case ORC_REG_SP_INDIRECT:
-               cfa->base = CFI_SP_INDIRECT;
+               *base = CFI_SP_INDIRECT;
                break;
        case ORC_REG_R10:
-               cfa->base = CFI_R10;
+               *base = CFI_R10;
                break;
        case ORC_REG_R13:
-               cfa->base = CFI_R13;
+               *base = CFI_R13;
                break;
        case ORC_REG_DI:
-               cfa->base = CFI_DI;
+               *base = CFI_DI;
                break;
        case ORC_REG_DX:
-               cfa->base = CFI_DX;
+               *base = CFI_DX;
                break;
        default:
                return -1;
index c7c59c6a44eeacaeff9f0338bf6af83d5476e9f0..f579802d7ec241c3f5b931d53bee2b3a6744d6be 100644 (file)
@@ -7,6 +7,7 @@
 #define _OBJTOOL_CFI_H
 
 #include "cfi_regs.h"
+#include <linux/list.h>
 
 #define CFI_UNDEFINED          -1
 #define CFI_CFA                        -2
@@ -24,6 +25,7 @@ struct cfi_init_state {
 };
 
 struct cfi_state {
+       struct hlist_node hash; /* must be first, cficmp() */
        struct cfi_reg regs[CFI_NUM_REGS];
        struct cfi_reg vals[CFI_NUM_REGS];
        struct cfi_reg cfa;
index eb180c78f440cb13454e248f07dbcc6a7180a971..b6c56c7bb8372d210b7502ee806227619582ef83 100644 (file)
@@ -5,6 +5,7 @@
 
 #include <string.h>
 #include <stdlib.h>
+#include <sys/mman.h>
 
 #include "builtin.h"
 #include "cfi.h"
@@ -25,7 +26,11 @@ struct alternative {
        bool skip_orig;
 };
 
-struct cfi_init_state initial_func_cfi;
+static unsigned long nr_cfi, nr_cfi_reused, nr_cfi_cache;
+
+static struct cfi_init_state initial_func_cfi;
+static struct cfi_state init_cfi;
+static struct cfi_state func_cfi;
 
 struct instruction *find_insn(struct objtool_file *file,
                              struct section *sec, unsigned long offset)
@@ -265,6 +270,78 @@ static void init_insn_state(struct insn_state *state, struct section *sec)
                state->noinstr = sec->noinstr;
 }
 
+static struct cfi_state *cfi_alloc(void)
+{
+       struct cfi_state *cfi = calloc(sizeof(struct cfi_state), 1);
+       if (!cfi) {
+               WARN("calloc failed");
+               exit(1);
+       }
+       nr_cfi++;
+       return cfi;
+}
+
+static int cfi_bits;
+static struct hlist_head *cfi_hash;
+
+static inline bool cficmp(struct cfi_state *cfi1, struct cfi_state *cfi2)
+{
+       return memcmp((void *)cfi1 + sizeof(cfi1->hash),
+                     (void *)cfi2 + sizeof(cfi2->hash),
+                     sizeof(struct cfi_state) - sizeof(struct hlist_node));
+}
+
+static inline u32 cfi_key(struct cfi_state *cfi)
+{
+       return jhash((void *)cfi + sizeof(cfi->hash),
+                    sizeof(*cfi) - sizeof(cfi->hash), 0);
+}
+
+static struct cfi_state *cfi_hash_find_or_add(struct cfi_state *cfi)
+{
+       struct hlist_head *head = &cfi_hash[hash_min(cfi_key(cfi), cfi_bits)];
+       struct cfi_state *obj;
+
+       hlist_for_each_entry(obj, head, hash) {
+               if (!cficmp(cfi, obj)) {
+                       nr_cfi_cache++;
+                       return obj;
+               }
+       }
+
+       obj = cfi_alloc();
+       *obj = *cfi;
+       hlist_add_head(&obj->hash, head);
+
+       return obj;
+}
+
+static void cfi_hash_add(struct cfi_state *cfi)
+{
+       struct hlist_head *head = &cfi_hash[hash_min(cfi_key(cfi), cfi_bits)];
+
+       hlist_add_head(&cfi->hash, head);
+}
+
+static void *cfi_hash_alloc(void)
+{
+       cfi_bits = vmlinux ? ELF_HASH_BITS - 3 : 13;
+       cfi_hash = mmap(NULL, sizeof(struct hlist_head) << cfi_bits,
+                       PROT_READ|PROT_WRITE,
+                       MAP_PRIVATE|MAP_ANON, -1, 0);
+       if (cfi_hash == (void *)-1L) {
+               WARN("mmap fail cfi_hash");
+               cfi_hash = NULL;
+       }  else if (stats) {
+               printf("cfi_bits: %d\n", cfi_bits);
+       }
+
+       return cfi_hash;
+}
+
+static unsigned long nr_insns;
+static unsigned long nr_insns_visited;
+
 /*
  * Call the arch-specific instruction decoder for all the instructions and add
  * them to the global instruction list.
@@ -275,7 +352,6 @@ static int decode_instructions(struct objtool_file *file)
        struct symbol *func;
        unsigned long offset;
        struct instruction *insn;
-       unsigned long nr_insns = 0;
        int ret;
 
        for_each_sec(file, sec) {
@@ -301,7 +377,6 @@ static int decode_instructions(struct objtool_file *file)
                        memset(insn, 0, sizeof(*insn));
                        INIT_LIST_HEAD(&insn->alts);
                        INIT_LIST_HEAD(&insn->stack_ops);
-                       init_cfi_state(&insn->cfi);
 
                        insn->sec = sec;
                        insn->offset = offset;
@@ -1077,7 +1152,6 @@ static int handle_group_alt(struct objtool_file *file,
                memset(nop, 0, sizeof(*nop));
                INIT_LIST_HEAD(&nop->alts);
                INIT_LIST_HEAD(&nop->stack_ops);
-               init_cfi_state(&nop->cfi);
 
                nop->sec = special_alt->new_sec;
                nop->offset = special_alt->new_off + special_alt->new_len;
@@ -1454,10 +1528,11 @@ static void set_func_state(struct cfi_state *state)
 
 static int read_unwind_hints(struct objtool_file *file)
 {
+       struct cfi_state cfi = init_cfi;
        struct section *sec, *relocsec;
-       struct reloc *reloc;
        struct unwind_hint *hint;
        struct instruction *insn;
+       struct reloc *reloc;
        int i;
 
        sec = find_section_by_name(file->elf, ".discard.unwind_hints");
@@ -1495,19 +1570,24 @@ static int read_unwind_hints(struct objtool_file *file)
                insn->hint = true;
 
                if (hint->type == UNWIND_HINT_TYPE_FUNC) {
-                       set_func_state(&insn->cfi);
+                       insn->cfi = &func_cfi;
                        continue;
                }
 
-               if (arch_decode_hint_reg(insn, hint->sp_reg)) {
+               if (insn->cfi)
+                       cfi = *(insn->cfi);
+
+               if (arch_decode_hint_reg(hint->sp_reg, &cfi.cfa.base)) {
                        WARN_FUNC("unsupported unwind_hint sp base reg %d",
                                  insn->sec, insn->offset, hint->sp_reg);
                        return -1;
                }
 
-               insn->cfi.cfa.offset = hint->sp_offset;
-               insn->cfi.type = hint->type;
-               insn->cfi.end = hint->end;
+               cfi.cfa.offset = hint->sp_offset;
+               cfi.type = hint->type;
+               cfi.end = hint->end;
+
+               insn->cfi = cfi_hash_find_or_add(&cfi);
        }
 
        return 0;
@@ -2283,13 +2363,18 @@ static int propagate_alt_cfi(struct objtool_file *file, struct instruction *insn
        if (!insn->alt_group)
                return 0;
 
+       if (!insn->cfi) {
+               WARN("CFI missing");
+               return -1;
+       }
+
        alt_cfi = insn->alt_group->cfi;
        group_off = insn->offset - insn->alt_group->first_insn->offset;
 
        if (!alt_cfi[group_off]) {
-               alt_cfi[group_off] = &insn->cfi;
+               alt_cfi[group_off] = insn->cfi;
        } else {
-               if (memcmp(alt_cfi[group_off], &insn->cfi, sizeof(struct cfi_state))) {
+               if (cficmp(alt_cfi[group_off], insn->cfi)) {
                        WARN_FUNC("stack layout conflict in alternatives",
                                  insn->sec, insn->offset);
                        return -1;
@@ -2335,9 +2420,14 @@ static int handle_insn_ops(struct instruction *insn, struct insn_state *state)
 
 static bool insn_cfi_match(struct instruction *insn, struct cfi_state *cfi2)
 {
-       struct cfi_state *cfi1 = &insn->cfi;
+       struct cfi_state *cfi1 = insn->cfi;
        int i;
 
+       if (!cfi1) {
+               WARN("CFI missing");
+               return false;
+       }
+
        if (memcmp(&cfi1->cfa, &cfi2->cfa, sizeof(cfi1->cfa))) {
 
                WARN_FUNC("stack state mismatch: cfa1=%d%+d cfa2=%d%+d",
@@ -2522,7 +2612,7 @@ static int validate_branch(struct objtool_file *file, struct symbol *func,
                           struct instruction *insn, struct insn_state state)
 {
        struct alternative *alt;
-       struct instruction *next_insn;
+       struct instruction *next_insn, *prev_insn = NULL;
        struct section *sec;
        u8 visited;
        int ret;
@@ -2551,15 +2641,25 @@ static int validate_branch(struct objtool_file *file, struct symbol *func,
 
                        if (insn->visited & visited)
                                return 0;
+               } else {
+                       nr_insns_visited++;
                }
 
                if (state.noinstr)
                        state.instr += insn->instr;
 
-               if (insn->hint)
-                       state.cfi = insn->cfi;
-               else
-                       insn->cfi = state.cfi;
+               if (insn->hint) {
+                       state.cfi = *insn->cfi;
+               } else {
+                       /* XXX track if we actually changed state.cfi */
+
+                       if (prev_insn && !cficmp(prev_insn->cfi, &state.cfi)) {
+                               insn->cfi = prev_insn->cfi;
+                               nr_cfi_reused++;
+                       } else {
+                               insn->cfi = cfi_hash_find_or_add(&state.cfi);
+                       }
+               }
 
                insn->visited |= visited;
 
@@ -2709,6 +2809,7 @@ static int validate_branch(struct objtool_file *file, struct symbol *func,
                        return 1;
                }
 
+               prev_insn = insn;
                insn = next_insn;
        }
 
@@ -2964,10 +3065,20 @@ int check(struct objtool_file *file)
        int ret, warnings = 0;
 
        arch_initial_func_cfi_state(&initial_func_cfi);
+       init_cfi_state(&init_cfi);
+       init_cfi_state(&func_cfi);
+       set_func_state(&func_cfi);
+
+       if (!cfi_hash_alloc())
+               goto out;
+
+       cfi_hash_add(&init_cfi);
+       cfi_hash_add(&func_cfi);
 
        ret = decode_sections(file);
        if (ret < 0)
                goto out;
+
        warnings += ret;
 
        if (list_empty(&file->insn_list))
@@ -3011,6 +3122,13 @@ int check(struct objtool_file *file)
                goto out;
        warnings += ret;
 
+       if (stats) {
+               printf("nr_insns_visited: %ld\n", nr_insns_visited);
+               printf("nr_cfi: %ld\n", nr_cfi);
+               printf("nr_cfi_reused: %ld\n", nr_cfi_reused);
+               printf("nr_cfi_cache: %ld\n", nr_cfi_cache);
+       }
+
 out:
        /*
         *  For now, don't fail the kernel build on fatal warnings.  These
index ca3259eebac88102a6708ac4cc77c2fa4a1616e9..508f712deba106cc33bf5ccc2978a50422be733b 100644 (file)
@@ -59,7 +59,7 @@ struct instruction {
        struct list_head alts;
        struct symbol *func;
        struct list_head stack_ops;
-       struct cfi_state cfi;
+       struct cfi_state *cfi;
 };
 
 static inline bool is_static_jump(struct instruction *insn)
index 671f3b296c1ad04c2f8a26f8f84c698cf656547d..812b33ed9f6521922a02ad9e8439a7b6da96898c 100644 (file)
 #include "check.h"
 #include "warn.h"
 
-static int init_orc_entry(struct orc_entry *orc, struct cfi_state *cfi)
+static int init_orc_entry(struct orc_entry *orc, struct cfi_state *cfi,
+                         struct instruction *insn)
 {
-       struct instruction *insn = container_of(cfi, struct instruction, cfi);
        struct cfi_reg *bp = &cfi->regs[CFI_BP];
 
        memset(orc, 0, sizeof(*orc));
 
+       if (!cfi) {
+               orc->end = 0;
+               orc->sp_reg = ORC_REG_UNDEFINED;
+               return 0;
+       }
+
        orc->end = cfi->end;
 
        if (cfi->cfa.base == CFI_UNDEFINED) {
@@ -159,7 +165,7 @@ int orc_create(struct objtool_file *file)
                        int i;
 
                        if (!alt_group) {
-                               if (init_orc_entry(&orc, &insn->cfi))
+                               if (init_orc_entry(&orc, insn->cfi, insn))
                                        return -1;
                                if (!memcmp(&prev_orc, &orc, sizeof(orc)))
                                        continue;
@@ -183,7 +189,8 @@ int orc_create(struct objtool_file *file)
                                struct cfi_state *cfi = alt_group->cfi[i];
                                if (!cfi)
                                        continue;
-                               if (init_orc_entry(&orc, cfi))
+                               /* errors are reported on the original insn */
+                               if (init_orc_entry(&orc, cfi, insn))
                                        return -1;
                                if (!memcmp(&prev_orc, &orc, sizeof(orc)))
                                        continue;