Skip to content

Commit 3f135e5

Browse files
jpoimboeIngo Molnar
authored andcommitted
x86/build: Mostly disable '-maccumulate-outgoing-args'
The GCC '-maccumulate-outgoing-args' flag is enabled for most configs, mostly because of issues which are no longer relevant. For most configs, and with most recent versions of GCC, it's no longer needed. Clarify which cases need it, and only enable it for those cases. Also produce a compile-time error for the ftrace graph + mcount + '-Os' case, which will otherwise cause runtime failures. The main benefit of '-maccumulate-outgoing-args' is that it prevents an ugly prologue for functions which have aligned stacks. But removing the option also has some benefits: more readable argument saves, smaller text size, and (presumably) slightly improved performance. Here are the object size savings for 32-bit and 64-bit defconfig kernels: text data bss dec hex filename 10006710 3543328 1773568 15323606 e9d1d6 vmlinux.x86-32.before 9706358 3547424 1773568 15027350 e54c96 vmlinux.x86-32.after text data bss dec hex filename 10652105 4537576 843776 16033457 f4a6b1 vmlinux.x86-64.before 10639629 4537576 843776 16020981 f475f5 vmlinux.x86-64.after That comes out to a 3% text size improvement on x86-32 and a 0.1% text size improvement on x86-64. Signed-off-by: Josh Poimboeuf <jpoimboe@redhat.com> Cc: Andrew Lutomirski <luto@kernel.org> Cc: Andy Lutomirski <luto@amacapital.net> Cc: Borislav Petkov <bp@alien8.de> Cc: Brian Gerst <brgerst@gmail.com> Cc: Denys Vlasenko <dvlasenk@redhat.com> Cc: Linus Torvalds <torvalds@linux-foundation.org> Cc: Pavel Machek <pavel@ucw.cz> Cc: Peter Zijlstra <peterz@infradead.org> Cc: Steven Rostedt <rostedt@goodmis.org> Cc: Thomas Gleixner <tglx@linutronix.de> Link: http://lkml.kernel.org/r/20170316193133.zrj6gug53766m6nn@treble Signed-off-by: Ingo Molnar <mingo@kernel.org>
1 parent a46f60d commit 3f135e5

File tree

4 files changed

+41
-22
lines changed

4 files changed

+41
-22
lines changed

arch/x86/Makefile

Lines changed: 31 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -120,10 +120,6 @@ else
120120
# -funit-at-a-time shrinks the kernel .text considerably
121121
# unfortunately it makes reading oopses harder.
122122
KBUILD_CFLAGS += $(call cc-option,-funit-at-a-time)
123-
124-
# this works around some issues with generating unwind tables in older gccs
125-
# newer gccs do it by default
126-
KBUILD_CFLAGS += $(call cc-option,-maccumulate-outgoing-args)
127123
endif
128124

129125
ifdef CONFIG_X86_X32
@@ -147,6 +143,37 @@ ifeq ($(CONFIG_KMEMCHECK),y)
147143
KBUILD_CFLAGS += $(call cc-option,-fno-builtin-memcpy)
148144
endif
149145

146+
#
147+
# If the function graph tracer is used with mcount instead of fentry,
148+
# '-maccumulate-outgoing-args' is needed to prevent a GCC bug
149+
# (https://gcc.gnu.org/bugzilla/show_bug.cgi?id=42109)
150+
#
151+
ifdef CONFIG_FUNCTION_GRAPH_TRACER
152+
ifndef CONFIG_HAVE_FENTRY
153+
ACCUMULATE_OUTGOING_ARGS := 1
154+
else
155+
ifeq ($(call cc-option-yn, -mfentry), n)
156+
ACCUMULATE_OUTGOING_ARGS := 1
157+
endif
158+
endif
159+
endif
160+
161+
#
162+
# Jump labels need '-maccumulate-outgoing-args' for gcc < 4.5.2 to prevent a
163+
# GCC bug (https://gcc.gnu.org/bugzilla/show_bug.cgi?id=46226). There's no way
164+
# to test for this bug at compile-time because the test case needs to execute,
165+
# which is a no-go for cross compilers. So check the GCC version instead.
166+
#
167+
ifdef CONFIG_JUMP_LABEL
168+
ifneq ($(ACCUMULATE_OUTGOING_ARGS), 1)
169+
ACCUMULATE_OUTGOING_ARGS = $(call cc-if-fullversion, -lt, 040502, 1)
170+
endif
171+
endif
172+
173+
ifeq ($(ACCUMULATE_OUTGOING_ARGS), 1)
174+
KBUILD_CFLAGS += -maccumulate-outgoing-args
175+
endif
176+
150177
# Stackpointer is addressed different for 32 bit and 64 bit x86
151178
sp-$(CONFIG_X86_32) := esp
152179
sp-$(CONFIG_X86_64) := rsp

arch/x86/Makefile_32.cpu

Lines changed: 0 additions & 18 deletions
Original file line numberDiff line numberDiff line change
@@ -45,24 +45,6 @@ cflags-$(CONFIG_MGEODE_LX) += $(call cc-option,-march=geode,-march=pentium-mmx)
4545
# cpu entries
4646
cflags-$(CONFIG_X86_GENERIC) += $(call tune,generic,$(call tune,i686))
4747

48-
# Work around the pentium-mmx code generator madness of gcc4.4.x which
49-
# does stack alignment by generating horrible code _before_ the mcount
50-
# prologue (push %ebp, mov %esp, %ebp) which breaks the function graph
51-
# tracer assumptions. For i686, generic, core2 this is set by the
52-
# compiler anyway
53-
ifeq ($(CONFIG_FUNCTION_GRAPH_TRACER), y)
54-
ADD_ACCUMULATE_OUTGOING_ARGS := y
55-
endif
56-
57-
# Work around to a bug with asm goto with first implementations of it
58-
# in gcc causing gcc to mess up the push and pop of the stack in some
59-
# uses of asm goto.
60-
ifeq ($(CONFIG_JUMP_LABEL), y)
61-
ADD_ACCUMULATE_OUTGOING_ARGS := y
62-
endif
63-
64-
cflags-$(ADD_ACCUMULATE_OUTGOING_ARGS) += $(call cc-option,-maccumulate-outgoing-args)
65-
6648
# Bug fix for binutils: this option is required in order to keep
6749
# binutils from generating NOPL instructions against our will.
6850
ifneq ($(CONFIG_X86_P6_NOP),y)

arch/x86/kernel/ftrace.c

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -29,6 +29,12 @@
2929
#include <asm/ftrace.h>
3030
#include <asm/nops.h>
3131

32+
#if defined(CONFIG_FUNCTION_GRAPH_TRACER) && \
33+
!defined(CC_USING_FENTRY) && \
34+
!defined(CONFIG_CC_OPTIMIZE_FOR_PERFORMANCE)
35+
# error The following combination is not supported: ((compiler missing -mfentry) || (CONFIG_X86_32 and !CONFIG_DYNAMIC_FTRACE)) && CONFIG_FUNCTION_GRAPH_TRACER && CONFIG_CC_OPTIMIZE_FOR_SIZE
36+
#endif
37+
3238
#ifdef CONFIG_DYNAMIC_FTRACE
3339

3440
int ftrace_arch_code_modify_prepare(void)

scripts/Kbuild.include

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -148,6 +148,10 @@ cc-fullversion = $(shell $(CONFIG_SHELL) \
148148
# Usage: EXTRA_CFLAGS += $(call cc-ifversion, -lt, 0402, -O1)
149149
cc-ifversion = $(shell [ $(cc-version) $(1) $(2) ] && echo $(3) || echo $(4))
150150

151+
# cc-if-fullversion
152+
# Usage: EXTRA_CFLAGS += $(call cc-if-fullversion, -lt, 040502, -O1)
153+
cc-if-fullversion = $(shell [ $(cc-fullversion) $(1) $(2) ] && echo $(3) || echo $(4))
154+
151155
# cc-ldoption
152156
# Usage: ldflags += $(call cc-ldoption, -Wl$(comma)--hash-style=both)
153157
cc-ldoption = $(call try-run,\

0 commit comments

Comments
 (0)