[TM] Restore default TargetOptions in TargetMachine::resetTargetOptions.

Summary:
Previously if you had

 * a function with the fast-math-enabled attr, followed by
 * a function without the fast-math attr,

the second function would inherit the first function's fast-math-ness.

This means that mixing fast-math and non-fast-math functions in a module
was completely broken unless you explicitly annotated every
non-fast-math function with "unsafe-fp-math"="false".  This appears to
have been broken since r176986 (March 2013), when the resetTargetOptions
function was introduced.

This patch tests the correct behavior as best we can.  I don't think I
can test FPDenormalMode and NoTrappingFPMath, because they aren't used
in any backends during function lowering.  Surprisingly, I also can't
find any uses at all of LessPreciseFPMAD affecting generated code.

The NVPTX/fast-math.ll test changes are an expected result of fixing
this bug.  When FMA is disabled, we emit add as "add.rn.f32", which
prevents fma combining.  Before this patch, fast-math was enabled in all
functions following the one which explicitly enabled it on itself, so we
were emitting plain "add.f32" where we should have generated
"add.rn.f32".

Reviewers: mkuper

Subscribers: hfinkel, majnemer, jholewinski, nemanjai, llvm-commits

Differential Revision: https://reviews.llvm.org/D28507

git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@291618 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
Justin Lebar 2017-01-10 23:43:04 +00:00
parent 9975cecf1a
commit e9bf848e46
5 changed files with 132 additions and 5 deletions

View File

@ -103,6 +103,7 @@ protected: // Can only create subclasses.
unsigned O0WantsFastISel : 1;
public:
+const TargetOptions DefaultOptions;
mutable TargetOptions Options;
virtual ~TargetMachine();

View File

@ -44,7 +44,7 @@ TargetMachine::TargetMachine(const Target &T, StringRef DataLayoutString,
const TargetOptions &Options)
: TheTarget(T), DL(DataLayoutString), TargetTriple(TT), TargetCPU(CPU),
TargetFS(FS), AsmInfo(nullptr), MRI(nullptr), MII(nullptr), STI(nullptr),
-RequireStructuredCFG(false), Options(Options) {
+RequireStructuredCFG(false), DefaultOptions(Options), Options(Options) {
if (EnableIPRA.getNumOccurrences())
this->Options.EnableIPRA = EnableIPRA;
}
@ -63,14 +63,15 @@ bool TargetMachine::isPositionIndependent() const {
/// \brief Reset the target options based on the function's attributes.
// FIXME: This function needs to go away for a number of reasons:
// a) global state on the TargetMachine is terrible in general,
-// b) there's no default state here to keep,
-// c) these target options should be passed only on the function
+// b) these target options should be passed only on the function
// and not on the TargetMachine (via TargetOptions) at all.
void TargetMachine::resetTargetOptions(const Function &F) const {
#define RESET_OPTION(X, Y) \
do { \
if (F.hasFnAttribute(Y)) \
Options.X = (F.getFnAttribute(Y).getValueAsString() == "true"); \
+else \
+Options.X = DefaultOptions.X; \
} while (0)
RESET_OPTION(LessPreciseFPMADOption, "less-precise-fpmad");
@ -87,6 +88,8 @@ void TargetMachine::resetTargetOptions(const Function &F) const {
Options.FPDenormalMode = FPDenormal::PreserveSign;
else if (Denormal == "positive-zero")
Options.FPDenormalMode = FPDenormal::PositiveZero;
+else
+Options.FPDenormalMode = DefaultOptions.FPDenormalMode;
}
/// Returns the code generation relocation model. The choices are static, PIC,

View File

@ -21,14 +21,14 @@ define float @sqrt_div_fast(float %a, float %b) #0 {
}
; CHECK-LABEL: fadd
-; CHECK: add.f32
+; CHECK: add.rn.f32
define float @fadd(float %a, float %b) {
%t1 = fadd float %a, %b
ret float %t1
}
; CHECK-LABEL: fadd_ftz
-; CHECK: add.ftz.f32
+; CHECK: add.rn.ftz.f32
define float @fadd_ftz(float %a, float %b) #1 {
%t1 = fadd float %a, %b
ret float %t1

View File

@ -0,0 +1,67 @@
; Check that we can enable/disable NoInfsFPMath and NoNaNsInFPMath via function
; attributes. An attribute on one function should not magically apply to the
; next one.
; RUN: llc < %s -mtriple=powerpc64-unknown-unknown -mcpu=pwr7 -mattr=-vsx \
; RUN: | FileCheck %s --check-prefix=CHECK --check-prefix=SAFE
; RUN: llc < %s -mtriple=powerpc64-unknown-unknown -mcpu=pwr7 -mattr=-vsx \
; RUN: -enable-no-infs-fp-math -enable-no-nans-fp-math \
; RUN: | FileCheck %s --check-prefix=CHECK --check-prefix=UNSAFE
; The fcmp+select in these functions should be converted to a fsel instruction
; when both NoInfsFPMath and NoNaNsInFPMath are enabled.
; CHECK-LABEL: default0:
define double @default0(double %a, double %y, double %z) {
entry:
; SAFE-NOT: fsel
; UNSAFE: fsel
%cmp = fcmp ult double %a, 0.000000e+00
%z.y = select i1 %cmp, double %z, double %y
ret double %z.y
}
; CHECK-LABEL: unsafe_math_off:
define double @unsafe_math_off(double %a, double %y, double %z) #0 #2 {
entry:
; SAFE-NOT: fsel
; UNSAFE-NOT: fsel
%cmp = fcmp ult double %a, 0.000000e+00
%z.y = select i1 %cmp, double %z, double %y
ret double %z.y
}
; CHECK-LABEL: default1:
define double @default1(double %a, double %y, double %z) {
; SAFE-NOT: fsel
; UNSAFE: fsel
%cmp = fcmp ult double %a, 0.000000e+00
%z.y = select i1 %cmp, double %z, double %y
ret double %z.y
}
; CHECK-LABEL: unsafe_math_on:
define double @unsafe_math_on(double %a, double %y, double %z) #1 #3 {
entry:
; SAFE-NOT: fsel
; UNSAFE-NOT: fsel
%cmp = fcmp ult double %a, 0.000000e+00
%z.y = select i1 %cmp, double %z, double %y
ret double %z.y
}
; CHECK-LABEL: default2:
define double @default2(double %a, double %y, double %z) {
; SAFE-NOT: fsel
; UNSAFE: fsel
%cmp = fcmp ult double %a, 0.000000e+00
%z.y = select i1 %cmp, double %z, double %y
ret double %z.y
}
attributes #0 = { "no-infs-fp-math"="false" }
attributes #1 = { "no-nans-fp-math"="false" }
attributes #2 = { "no-infs-fp-math"="false" }
attributes #3 = { "no-infs-fp-math"="true" }

View File

@ -0,0 +1,56 @@
; Check that we can enable/disable UnsafeFPMath via function attributes. An
; attribute on one function should not magically apply to the next one.
; RUN: llc < %s -mtriple=x86_64-unknown-unknown \
; RUN: | FileCheck %s --check-prefix=CHECK --check-prefix=SAFE
; RUN: llc < %s -mtriple=x86_64-unknown-unknown -enable-unsafe-fp-math \
; RUN: | FileCheck %s --check-prefix=CHECK --check-prefix=UNSAFE
; The div in these functions should be converted to a mul when unsafe-fp-math
; is enabled.
; CHECK-LABEL: unsafe_fp_math_default0:
define double @unsafe_fp_math_default0(double %x) {
; SAFE: divsd
; UNSAFE: mulsd
%div = fdiv double %x, 2.0
ret double %div
}
; CHECK-LABEL: unsafe_fp_math_off:
define double @unsafe_fp_math_off(double %x) #0 {
; SAFE: divsd
; UNSAFE: divsd
%div = fdiv double %x, 2.0
ret double %div
}
; CHECK-LABEL: unsafe_fp_math_default1:
define double @unsafe_fp_math_default1(double %x) {
; With unsafe math enabled, can change this div to a mul.
; SAFE: divsd
; UNSAFE: mulsd
%div = fdiv double %x, 2.0
ret double %div
}
; CHECK-LABEL: unsafe_fp_math_on:
define double @unsafe_fp_math_on(double %x) #1 {
; SAFE: mulsd
; UNSAFE: mulsd
%div = fdiv double %x, 2.0
ret double %div
}
; CHECK-LABEL: unsafe_fp_math_default2:
define double @unsafe_fp_math_default2(double %x) {
; With unsafe math enabled, can change this div to a mul.
; SAFE: divsd
; UNSAFE: mulsd
%div = fdiv double %x, 2.0
ret double %div
}
attributes #0 = { "unsafe-fp-math"="false" }
attributes #1 = { "unsafe-fp-math"="true" }