Re: [PATCH v6 15/20] kbuild: implement CONFIG_TRIM_UNUSED_KSYMS without recursion

From: Nick Desaulniers
Date: Thu May 25 2023 - 14:15:18 EST


On Sun, May 21, 2023 at 9:05 AM Masahiro Yamada <masahiroy@xxxxxxxxxx> wrote:
>
> When CONFIG_TRIM_UNUSED_KSYMS is enabled, Kbuild recursively traverses
> the directory tree to determine which EXPORT_SYMBOL to trim. If an
> EXPORT_SYMBOL turns out to be unused by anyone, Kbuild begins the
> second traverse, where some source files are recompiled with their
> EXPORT_SYMBOL() tuned into a no-op.
>
> Linus stated negative opinions about this slowness in commits:
>
> - 5cf0fd591f2e ("Kbuild: disable TRIM_UNUSED_KSYMS option")
> - a555bdd0c58c ("Kbuild: enable TRIM_UNUSED_KSYMS again, with some guarding")
>
> We can do this better now. The final data structures of EXPORT_SYMBOL
> are generated by the modpost stage, so modpost can selectively emit
> KSYMTAB entries that are really used by modules.
>
> Commit f73edc8951b2 ("kbuild: unify two modpost invocations") is another
> ground-work to do this in a one-pass algorithm. With the list of modules,
> modpost sets sym->used if it is used by a module. modpost emits KSYMTAB
> only for symbols with sym->used==true.
>
> BTW, Nicolas explained why the trimming was implemented with recursion:
>
> https://lore.kernel.org/all/2o2rpn97-79nq-p7s2-nq5-8p83391473r@xxxxxxxxxxx/
>
> Actually, we never achieved that level of optimization where the chain
> reaction of trimming comes into play because:
>
> - CONFIG_LTO_CLANG cannot remove any unused symbols
> - CONFIG_LD_DEAD_CODE_DATA_ELIMINATION is enabled only for vmlinux,
> but not modules
>
> If deeper trimming is required, we need to revisit this, but I guess
> that is unlikely to happen.

I think this patch removes the only 2 references to
scripts/gen_autoksyms.sh in the tree. Can or should that be removed as
well?
The rest of the patch LGTM.

>
> Signed-off-by: Masahiro Yamada <masahiroy@xxxxxxxxxx>
> ---
>
> Changes in v5:
> - Clean up more
>
> .gitignore | 1 -
> Makefile | 19 +---------
> include/linux/export.h | 65 +++++----------------------------
> scripts/Makefile.build | 7 ----
> scripts/Makefile.modpost | 7 ++++
> scripts/adjust_autoksyms.sh | 73 -------------------------------------
> scripts/basic/fixdep.c | 3 +-
> scripts/gen_ksymdeps.sh | 30 ---------------
> scripts/mod/modpost.c | 54 ++++++++++++++++++++++++---
> scripts/remove-stale-files | 2 +
> 10 files changed, 70 insertions(+), 191 deletions(-)
> delete mode 100755 scripts/adjust_autoksyms.sh
> delete mode 100755 scripts/gen_ksymdeps.sh
>
> diff --git a/.gitignore b/.gitignore
> index 7f86e0837909..172e3874adfd 100644
> --- a/.gitignore
> +++ b/.gitignore
> @@ -112,7 +112,6 @@ modules.order
> #
> /include/config/
> /include/generated/
> -/include/ksym/
> /arch/*/include/generated/
>
> # stgit generated dirs
> diff --git a/Makefile b/Makefile
> index f836936fb4d8..ffc2c9b632fd 100644
> --- a/Makefile
> +++ b/Makefile
> @@ -1193,28 +1193,13 @@ endif
> export KBUILD_VMLINUX_LIBS
> export KBUILD_LDS := arch/$(SRCARCH)/kernel/vmlinux.lds
>
> -# Recurse until adjust_autoksyms.sh is satisfied
> -PHONY += autoksyms_recursive
> ifdef CONFIG_TRIM_UNUSED_KSYMS
> # For the kernel to actually contain only the needed exported symbols,
> # we have to build modules as well to determine what those symbols are.
> # (this can be evaluated only once include/config/auto.conf has been included)
> KBUILD_MODULES := 1
> -
> -autoksyms_recursive: $(build-dir) modules.order
> - $(Q)$(CONFIG_SHELL) $(srctree)/scripts/adjust_autoksyms.sh \
> - "$(MAKE) -f $(srctree)/Makefile autoksyms_recursive"
> endif
>
> -autoksyms_h := $(if $(CONFIG_TRIM_UNUSED_KSYMS), include/generated/autoksyms.h)
> -
> -quiet_cmd_autoksyms_h = GEN $@
> - cmd_autoksyms_h = mkdir -p $(dir $@); \
> - $(CONFIG_SHELL) $(srctree)/scripts/gen_autoksyms.sh $@
> -
> -$(autoksyms_h):
> - $(call cmd,autoksyms_h)
> -
> # '$(AR) mPi' needs 'T' to workaround the bug of llvm-ar <= 14
> quiet_cmd_ar_vmlinux.a = AR $@
> cmd_ar_vmlinux.a = \
> @@ -1223,7 +1208,7 @@ quiet_cmd_ar_vmlinux.a = AR $@
> $(AR) mPiT $$($(AR) t $@ | sed -n 1p) $@ $$($(AR) t $@ | grep -F -f $(srctree)/scripts/head-object-list.txt)
>
> targets += vmlinux.a
> -vmlinux.a: $(KBUILD_VMLINUX_OBJS) scripts/head-object-list.txt autoksyms_recursive FORCE
> +vmlinux.a: $(KBUILD_VMLINUX_OBJS) scripts/head-object-list.txt FORCE
> $(call if_changed,ar_vmlinux.a)
>
> PHONY += vmlinux_o
> @@ -1279,7 +1264,7 @@ scripts: scripts_basic scripts_dtc
> PHONY += prepare archprepare
>
> archprepare: outputmakefile archheaders archscripts scripts include/config/kernel.release \
> - asm-generic $(version_h) $(autoksyms_h) include/generated/utsrelease.h \
> + asm-generic $(version_h) include/generated/utsrelease.h \
> include/generated/compile.h include/generated/autoconf.h remove-stale-files
>
> prepare0: archprepare
> diff --git a/include/linux/export.h b/include/linux/export.h
> index 32461a01608c..9bf081ff9903 100644
> --- a/include/linux/export.h
> +++ b/include/linux/export.h
> @@ -37,30 +37,13 @@ extern struct module __this_module;
> #define __EXPORT_SYMBOL_REF(sym) .balign 4; .long sym
> #endif
>
> -#define ____EXPORT_SYMBOL(sym, license, ns) \
> +#define ___EXPORT_SYMBOL(sym, license, ns) \
> .section ".export_symbol","a" ; \
> __export_symbol_##license##_##sym: ; \
> .asciz ns ; \
> __EXPORT_SYMBOL_REF(sym) ; \
> .previous
>
> -#ifdef __GENKSYMS__
> -
> -#define ___EXPORT_SYMBOL(sym, sec, ns) __GENKSYMS_EXPORT_SYMBOL(sym)
> -
> -#elif defined(__ASSEMBLY__)
> -
> -#define ___EXPORT_SYMBOL(sym, license, ns) \
> - ____EXPORT_SYMBOL(sym, license, ns)
> -
> -#else
> -
> -#define ___EXPORT_SYMBOL(sym, license, ns) \
> - __ADDRESSABLE(sym) \
> - asm(__stringify(____EXPORT_SYMBOL(sym, license, ns)))
> -
> -#endif
> -
> #if !defined(CONFIG_MODULES) || defined(__DISABLE_EXPORTS)
>
> /*
> @@ -70,50 +53,20 @@ extern struct module __this_module;
> */
> #define __EXPORT_SYMBOL(sym, sec, ns)
>
> -#elif defined(CONFIG_TRIM_UNUSED_KSYMS)
> +#elif defined(__GENKSYMS__)
>
> -#include <generated/autoksyms.h>
> +#define __EXPORT_SYMBOL(sym, sec, ns) __GENKSYMS_EXPORT_SYMBOL(sym)
>
> -/*
> - * For fine grained build dependencies, we want to tell the build system
> - * about each possible exported symbol even if they're not actually exported.
> - * We use a symbol pattern __ksym_marker_<symbol> that the build system filters
> - * from the $(NM) output (see scripts/gen_ksymdeps.sh). These symbols are
> - * discarded in the final link stage.
> - */
> +#elif defined(__ASSEMBLY__)
>
> -#ifdef __ASSEMBLY__
> -
> -#define __ksym_marker(sym) \
> - .section ".discard.ksym","a" ; \
> -__ksym_marker_##sym: ; \
> - .previous
> +#define __EXPORT_SYMBOL(sym, license, ns) \
> + ___EXPORT_SYMBOL(sym, license, ns)
>
> #else
>
> -#define __ksym_marker(sym) \
> - static int __ksym_marker_##sym[0] __section(".discard.ksym") __used
> -
> -#endif
> -
> -#define __EXPORT_SYMBOL(sym, sec, ns) \
> - __ksym_marker(sym); \
> - __cond_export_sym(sym, sec, ns, __is_defined(__KSYM_##sym))
> -#define __cond_export_sym(sym, sec, ns, conf) \
> - ___cond_export_sym(sym, sec, ns, conf)
> -#define ___cond_export_sym(sym, sec, ns, enabled) \
> - __cond_export_sym_##enabled(sym, sec, ns)
> -#define __cond_export_sym_1(sym, sec, ns) ___EXPORT_SYMBOL(sym, sec, ns)
> -
> -#ifdef __GENKSYMS__
> -#define __cond_export_sym_0(sym, sec, ns) __GENKSYMS_EXPORT_SYMBOL(sym)
> -#else
> -#define __cond_export_sym_0(sym, sec, ns) /* nothing */
> -#endif
> -
> -#else
> -
> -#define __EXPORT_SYMBOL(sym, sec, ns) ___EXPORT_SYMBOL(sym, sec, ns)
> +#define __EXPORT_SYMBOL(sym, license, ns) \
> + __ADDRESSABLE(sym) \
> + asm(__stringify(___EXPORT_SYMBOL(sym, license, ns)))
>
> #endif /* CONFIG_MODULES */
>
> diff --git a/scripts/Makefile.build b/scripts/Makefile.build
> index bd4123795299..8154bd962eea 100644
> --- a/scripts/Makefile.build
> +++ b/scripts/Makefile.build
> @@ -215,18 +215,12 @@ is-standard-object = $(if $(filter-out y%, $(OBJECT_FILES_NON_STANDARD_$(basetar
>
> $(obj)/%.o: objtool-enabled = $(if $(is-standard-object),$(if $(delay-objtool),$(is-single-obj-m),y))
>
> -ifdef CONFIG_TRIM_UNUSED_KSYMS
> -cmd_gen_ksymdeps = \
> - $(CONFIG_SHELL) $(srctree)/scripts/gen_ksymdeps.sh $@ >> $(dot-target).cmd
> -endif
> -
> ifneq ($(findstring 1, $(KBUILD_EXTRA_WARN)),)
> cmd_warn_shared_object = $(if $(word 2, $(modname-multi)),$(warning $(kbuild-file): $*.o is added to multiple modules: $(modname-multi)))
> endif
>
> define rule_cc_o_c
> $(call cmd_and_fixdep,cc_o_c)
> - $(call cmd,gen_ksymdeps)
> $(call cmd,checksrc)
> $(call cmd,checkdoc)
> $(call cmd,gen_objtooldep)
> @@ -237,7 +231,6 @@ endef
>
> define rule_as_o_S
> $(call cmd_and_fixdep,as_o_S)
> - $(call cmd,gen_ksymdeps)
> $(call cmd,gen_objtooldep)
> $(call cmd,gen_symversions_S)
> $(call cmd,warn_shared_object)
> diff --git a/scripts/Makefile.modpost b/scripts/Makefile.modpost
> index 0980c58d8afc..1e0b47cbabd9 100644
> --- a/scripts/Makefile.modpost
> +++ b/scripts/Makefile.modpost
> @@ -90,6 +90,13 @@ targets += .vmlinux.objs
> .vmlinux.objs: vmlinux.a $(KBUILD_VMLINUX_LIBS) FORCE
> $(call if_changed,vmlinux_objs)
>
> +ifdef CONFIG_TRIM_UNUSED_KSYMS
> +ksym-wl := $(CONFIG_UNUSED_KSYMS_WHITELIST)
> +ksym-wl := $(if $(filter-out /%, $(ksym-wl)),$(srctree)/)$(ksym-wl)
> +modpost-args += -t $(addprefix -W, $(ksym-wl))
> +modpost-deps += $(ksym-wl)
> +endif
> +
> ifeq ($(wildcard vmlinux.o),)
> missing-input := vmlinux.o
> output-symdump := modules-only.symvers
> diff --git a/scripts/adjust_autoksyms.sh b/scripts/adjust_autoksyms.sh
> deleted file mode 100755
> index f1b5ac818411..000000000000
> --- a/scripts/adjust_autoksyms.sh
> +++ /dev/null
> @@ -1,73 +0,0 @@
> -#!/bin/sh
> -# SPDX-License-Identifier: GPL-2.0-only
> -
> -# Script to update include/generated/autoksyms.h and dependency files
> -#
> -# Copyright: (C) 2016 Linaro Limited
> -# Created by: Nicolas Pitre, January 2016
> -#
> -
> -# Update the include/generated/autoksyms.h file.
> -#
> -# For each symbol being added or removed, the corresponding dependency
> -# file's timestamp is updated to force a rebuild of the affected source
> -# file. All arguments passed to this script are assumed to be a command
> -# to be exec'd to trigger a rebuild of those files.
> -
> -set -e
> -
> -cur_ksyms_file="include/generated/autoksyms.h"
> -new_ksyms_file="include/generated/autoksyms.h.tmpnew"
> -
> -info() {
> - if [ "$quiet" != "silent_" ]; then
> - printf " %-7s %s\n" "$1" "$2"
> - fi
> -}
> -
> -info "CHK" "$cur_ksyms_file"
> -
> -# Use "make V=1" to debug this script.
> -case "$KBUILD_VERBOSE" in
> -*1*)
> - set -x
> - ;;
> -esac
> -
> -# Generate a new symbol list file
> -$CONFIG_SHELL $srctree/scripts/gen_autoksyms.sh --modorder "$new_ksyms_file"
> -
> -# Extract changes between old and new list and touch corresponding
> -# dependency files.
> -changed=$(
> -count=0
> -sort "$cur_ksyms_file" "$new_ksyms_file" | uniq -u |
> -sed -n 's/^#define __KSYM_\(.*\) 1/\1/p' |
> -while read sympath; do
> - if [ -z "$sympath" ]; then continue; fi
> - depfile="include/ksym/${sympath}"
> - mkdir -p "$(dirname "$depfile")"
> - touch "$depfile"
> - # Filesystems with coarse time precision may create timestamps
> - # equal to the one from a file that was very recently built and that
> - # needs to be rebuild. Let's guard against that by making sure our
> - # dep files are always newer than the first file we created here.
> - while [ ! "$depfile" -nt "$new_ksyms_file" ]; do
> - touch "$depfile"
> - done
> - echo $((count += 1))
> -done | tail -1 )
> -changed=${changed:-0}
> -
> -if [ $changed -gt 0 ]; then
> - # Replace the old list with tne new one
> - old=$(grep -c "^#define __KSYM_" "$cur_ksyms_file" || true)
> - new=$(grep -c "^#define __KSYM_" "$new_ksyms_file" || true)
> - info "KSYMS" "symbols: before=$old, after=$new, changed=$changed"
> - info "UPD" "$cur_ksyms_file"
> - mv -f "$new_ksyms_file" "$cur_ksyms_file"
> - # Then trigger a rebuild of affected source files
> - exec $@
> -else
> - rm -f "$new_ksyms_file"
> -fi
> diff --git a/scripts/basic/fixdep.c b/scripts/basic/fixdep.c
> index fa562806c2be..84b6efa849f4 100644
> --- a/scripts/basic/fixdep.c
> +++ b/scripts/basic/fixdep.c
> @@ -246,8 +246,7 @@ static void *read_file(const char *filename)
> /* Ignore certain dependencies */
> static int is_ignored_file(const char *s, int len)
> {
> - return str_ends_with(s, len, "include/generated/autoconf.h") ||
> - str_ends_with(s, len, "include/generated/autoksyms.h");
> + return str_ends_with(s, len, "include/generated/autoconf.h");
> }
>
> /* Do not parse these files */
> diff --git a/scripts/gen_ksymdeps.sh b/scripts/gen_ksymdeps.sh
> deleted file mode 100755
> index 8ee533f33659..000000000000
> --- a/scripts/gen_ksymdeps.sh
> +++ /dev/null
> @@ -1,30 +0,0 @@
> -#!/bin/sh
> -# SPDX-License-Identifier: GPL-2.0
> -
> -set -e
> -
> -# List of exported symbols
> -#
> -# If the object has no symbol, $NM warns 'no symbols'.
> -# Suppress the stderr.
> -# TODO:
> -# Use -q instead of 2>/dev/null when we upgrade the minimum version of
> -# binutils to 2.37, llvm to 13.0.0.
> -ksyms=$($NM $1 2>/dev/null | sed -n 's/.*__ksym_marker_\(.*\)/\1/p')
> -
> -if [ -z "$ksyms" ]; then
> - exit 0
> -fi
> -
> -echo
> -echo "ksymdeps_$1 := \\"
> -
> -for s in $ksyms
> -do
> - printf ' $(wildcard include/ksym/%s) \\\n' "$s"
> -done
> -
> -echo
> -echo "$1: \$(ksymdeps_$1)"
> -echo
> -echo "\$(ksymdeps_$1):"
> diff --git a/scripts/mod/modpost.c b/scripts/mod/modpost.c
> index f14fe9301ae6..516323c3910a 100644
> --- a/scripts/mod/modpost.c
> +++ b/scripts/mod/modpost.c
> @@ -35,6 +35,9 @@ static bool warn_unresolved;
>
> static int sec_mismatch_count;
> static bool sec_mismatch_warn_only = true;
> +/* Trim EXPORT_SYMBOLs that are unused by in-tree modules */
> +static bool trim_unused_exports;
> +
> /* ignore missing files */
> static bool ignore_missing_files;
> /* If set to 1, only warn (instead of error) about missing ns imports */
> @@ -217,6 +220,7 @@ struct symbol {
> bool weak;
> bool is_func;
> bool is_gpl_only; /* exported by EXPORT_SYMBOL_GPL */
> + bool used; /* there exists a user of this symbol */
> char name[];
> };
>
> @@ -1772,6 +1776,7 @@ static void check_exports(struct module *mod)
> continue;
> }
>
> + exp->used = true;
> s->module = exp->module;
> s->crc_valid = exp->crc_valid;
> s->crc = exp->crc;
> @@ -1795,6 +1800,23 @@ static void check_exports(struct module *mod)
> }
> }
>
> +static void handle_white_list_exports(const char *white_list)
> +{
> + char *buf, *p, *name;
> +
> + buf = read_text_file(white_list);
> + p = buf;
> +
> + while ((name = strsep(&p, "\n"))) {
> + struct symbol *sym = find_symbol(name);
> +
> + if (sym)
> + sym->used = true;
> + }
> +
> + free(buf);
> +}
> +
> static void check_modname_len(struct module *mod)
> {
> const char *mod_name;
> @@ -1865,10 +1887,14 @@ static void add_exported_symbols(struct buffer *buf, struct module *mod)
>
> /* generate struct for exported symbols */
> buf_printf(buf, "\n");
> - list_for_each_entry(sym, &mod->exported_symbols, list)
> + list_for_each_entry(sym, &mod->exported_symbols, list) {
> + if (trim_unused_exports && !sym->used)
> + continue;
> +
> buf_printf(buf, "KSYMTAB_%s(%s, \"%s\", \"%s\");\n",
> sym->is_func ? "FUNC" : "DATA", sym->name,
> sym->is_gpl_only ? "_gpl" : "", sym->namespace);
> + }
>
> if (!modversions)
> return;
> @@ -1876,6 +1902,9 @@ static void add_exported_symbols(struct buffer *buf, struct module *mod)
> /* record CRCs for exported symbols */
> buf_printf(buf, "\n");
> list_for_each_entry(sym, &mod->exported_symbols, list) {
> + if (trim_unused_exports && !sym->used)
> + continue;
> +
> if (!sym->crc_valid)
> warn("EXPORT symbol \"%s\" [%s%s] version generation failed, symbol will not be versioned.\n"
> "Is \"%s\" prototyped in <asm/asm-prototypes.h>?\n",
> @@ -2039,9 +2068,6 @@ static void write_mod_c_file(struct module *mod)
> char fname[PATH_MAX];
> int ret;
>
> - check_modname_len(mod);
> - check_exports(mod);
> -
> add_header(&buf, mod);
> add_exported_symbols(&buf, mod);
> add_versions(&buf, mod);
> @@ -2175,12 +2201,13 @@ int main(int argc, char **argv)
> {
> struct module *mod;
> char *missing_namespace_deps = NULL;
> + char *unused_exports_white_list = NULL;
> char *dump_write = NULL, *files_source = NULL;
> int opt;
> LIST_HEAD(dump_lists);
> struct dump_list *dl, *dl2;
>
> - while ((opt = getopt(argc, argv, "ei:mnT:o:awENd:")) != -1) {
> + while ((opt = getopt(argc, argv, "ei:mntT:tW:o:awENd:")) != -1) {
> switch (opt) {
> case 'e':
> external_module = true;
> @@ -2205,6 +2232,12 @@ int main(int argc, char **argv)
> case 'T':
> files_source = optarg;
> break;
> + case 't':
> + trim_unused_exports = true;
> + break;
> + case 'W':
> + unused_exports_white_list = optarg;
> + break;
> case 'w':
> warn_unresolved = true;
> break;
> @@ -2234,6 +2267,17 @@ int main(int argc, char **argv)
> if (files_source)
> read_symbols_from_files(files_source);
>
> + list_for_each_entry(mod, &modules, list) {
> + if (mod->from_dump || mod->is_vmlinux)
> + continue;
> +
> + check_modname_len(mod);
> + check_exports(mod);
> + }
> +
> + if (unused_exports_white_list)
> + handle_white_list_exports(unused_exports_white_list);
> +
> list_for_each_entry(mod, &modules, list) {
> if (mod->from_dump)
> continue;
> diff --git a/scripts/remove-stale-files b/scripts/remove-stale-files
> index 7f432900671a..8502a17d47df 100755
> --- a/scripts/remove-stale-files
> +++ b/scripts/remove-stale-files
> @@ -33,3 +33,5 @@ rm -f rust/target.json
> rm -f scripts/bin2c
>
> rm -f .scmversion
> +
> +rm -rf include/ksym
> --
> 2.39.2
>


--
Thanks,
~Nick Desaulniers