From: Bradley Smith Date: Mon, 13 Oct 2014 10:16:06 +0000 (+0000) Subject: [AArch64] Add workaround for Cortex-A53 erratum (835769) X-Git-Url: https://granicus.if.org/sourcecode?a=commitdiff_plain;h=8af1acab3e5f2e87a3e20c6af3694bdfff361f94;p=clang [AArch64] Add workaround for Cortex-A53 erratum (835769) Some early revisions of the Cortex-A53 have an erratum (835769) whereby it is possible for a 64-bit multiply-accumulate instruction in AArch64 state to generate an incorrect result. The details are quite complex and hard to determine statically, since branches in the code may exist in some circumstances, but all cases end with a memory (load, store, or prefetch) instruction followed immediately by the multiply-accumulate operation. The safest work-around for this issue is to make the compiler avoid emitting multiply-accumulate instructions immediately after memory instructions and the simplest way to do this is to insert a NOP. This patch implements clang options to enable this workaround in the backend. The work-around code generation is not enabled by default. 
git-svn-id: https://llvm.org/svn/llvm-project/cfe/trunk@219604 91177308-0d34-0410-b5e6-96231b3b80d8 --- diff --git a/include/clang/Driver/Options.td b/include/clang/Driver/Options.td index ecccf2929b..df0b7a4b8d 100644 --- a/include/clang/Driver/Options.td +++ b/include/clang/Driver/Options.td @@ -1169,6 +1169,13 @@ def mno_long_calls : Flag<["-"], "mno-long-calls">, Group<m_arm_Features_Group>, def mgeneral_regs_only : Flag<["-"], "mgeneral-regs-only">, Group<m_aarch64_Features_Group>, HelpText<"Generate code which only uses the general purpose registers (AArch64 only)">; +def mfix_cortex_a53_835769 : Flag<["-"], "mfix-cortex-a53-835769">, + Group<m_aarch64_Features_Group>, + HelpText<"Workaround Cortex-A53 erratum 835769 (AArch64 only)">; +def mno_fix_cortex_a53_835769 : Flag<["-"], "mno-fix-cortex-a53-835769">, + Group<m_aarch64_Features_Group>, + HelpText<"Don't workaround Cortex-A53 erratum 835769 (AArch64 only)">; + def mvsx : Flag<["-"], "mvsx">, Group<m_ppc_Features_Group>; def mno_vsx : Flag<["-"], "mno-vsx">, Group<m_ppc_Features_Group>; def mpower8_vector : Flag<["-"], "mpower8-vector">, diff --git a/lib/Driver/Tools.cpp b/lib/Driver/Tools.cpp index 0bbc964838..c0607284e3 100644 --- a/lib/Driver/Tools.cpp +++ b/lib/Driver/Tools.cpp @@ -913,6 +913,15 @@ void Clang::AddAArch64TargetArgs(const ArgList &Args, CmdArgs.push_back("-aarch64-no-strict-align"); } + if (Arg *A = Args.getLastArg(options::OPT_mfix_cortex_a53_835769, + options::OPT_mno_fix_cortex_a53_835769)) { + CmdArgs.push_back("-backend-option"); + if (A->getOption().matches(options::OPT_mfix_cortex_a53_835769)) + CmdArgs.push_back("-aarch64-fix-cortex-a53-835769=1"); + else + CmdArgs.push_back("-aarch64-fix-cortex-a53-835769=0"); + } + // Setting -mno-global-merge disables the codegen global merge pass. Setting // -mglobal-merge has no effect as the pass is enabled by default. 
if (Arg *A = Args.getLastArg(options::OPT_mglobal_merge, diff --git a/test/Driver/aarch64-fix-cortex-a53-835769-cg.c b/test/Driver/aarch64-fix-cortex-a53-835769-cg.c new file mode 100644 index 0000000000..efe60c9aaf --- /dev/null +++ b/test/Driver/aarch64-fix-cortex-a53-835769-cg.c @@ -0,0 +1,19 @@ +// REQUIRES: aarch64-registered-target +// RUN: %clang -O3 -target aarch64-linux-eabi %s -S -o- \ +// RUN: | FileCheck --check-prefix=CHECK-NO --check-prefix=CHECK %s +// RUN: %clang -O3 -target aarch64-linux-eabi -mfix-cortex-a53-835769 %s -S -o- 2>&1 \ +// RUN: | FileCheck --check-prefix=CHECK-YES --check-prefix=CHECK %s +// RUN: %clang -O3 -target aarch64-linux-eabi -mno-fix-cortex-a53-835769 %s -S -o- 2>&1 \ +// RUN: | FileCheck --check-prefix=CHECK-NO --check-prefix=CHECK %s + +#include <stdint.h> + +int64_t f_load_madd_64(int64_t a, int64_t b, int64_t *c) { + int64_t result = a+b*(*c); + return result; +} + +// CHECK: ldr +// CHECK-YES-NEXT: nop +// CHECK-NO-NEXT-NOT: nop +// CHECK-NEXT: madd diff --git a/test/Driver/aarch64-fix-cortex-a53-835769.c b/test/Driver/aarch64-fix-cortex-a53-835769.c new file mode 100644 index 0000000000..379a3238ac --- /dev/null +++ b/test/Driver/aarch64-fix-cortex-a53-835769.c @@ -0,0 +1,9 @@ +// RUN: %clang -target aarch64-linux-eabi %s -### 2>&1 \ +// RUN: | FileCheck --check-prefix=CHECK-DEF %s +// RUN: %clang -target aarch64-linux-eabi -mfix-cortex-a53-835769 %s -### 2>&1 \ +// RUN: | FileCheck --check-prefix=CHECK-YES %s +// RUN: %clang -target aarch64-linux-eabi -mno-fix-cortex-a53-835769 %s -### 2>&1 \ +// RUN: | FileCheck --check-prefix=CHECK-NO %s +// CHECK-DEF-NOT: "-backend-option" "-aarch64-fix-cortex-a53-835769" +// CHECK-YES: "-backend-option" "-aarch64-fix-cortex-a53-835769=1" +// CHECK-NO: "-backend-option" "-aarch64-fix-cortex-a53-835769=0"