[llvm] 156afb2 - AMDGPU: Fix inlining logic for denormals

Matt Arsenault via llvm-commits llvm-commits at lists.llvm.org
Thu Apr 23 12:43:59 PDT 2020


Author: Matt Arsenault
Date: 2020-04-23T15:30:48-04:00
New Revision: 156afb2253eabf0e2d446dafd08e754d7b9f513a

URL: https://github.com/llvm/llvm-project/commit/156afb2253eabf0e2d446dafd08e754d7b9f513a
DIFF: https://github.com/llvm/llvm-project/commit/156afb2253eabf0e2d446dafd08e754d7b9f513a.diff

LOG: AMDGPU: Fix inlining logic for denormals

This was backwards from intended and missing a test. We perhaps should
just ignored the FP mode here, since it shouldn't be legal to mix code
with different default modes in the absence of strictfp.

Added: 
    llvm/test/Transforms/Inline/AMDGPU/inline-denormal-fp-math.ll

Modified: 
    llvm/lib/Target/AMDGPU/Utils/AMDGPUBaseInfo.h

Removed: 
    


################################################################################
diff  --git a/llvm/lib/Target/AMDGPU/Utils/AMDGPUBaseInfo.h b/llvm/lib/Target/AMDGPU/Utils/AMDGPUBaseInfo.h
index 9f1670c52e69..9cca73646ac7 100644
--- a/llvm/lib/Target/AMDGPU/Utils/AMDGPUBaseInfo.h
+++ b/llvm/lib/Target/AMDGPU/Utils/AMDGPUBaseInfo.h
@@ -750,7 +750,7 @@ struct SIModeRegisterDefaults {
   /// Returns true if a flag is compatible if it's enabled in the callee, but
   /// disabled in the caller.
   static bool oneWayCompatible(bool CallerMode, bool CalleeMode) {
-    return CallerMode == CalleeMode || (CallerMode && !CalleeMode);
+    return CallerMode == CalleeMode || (!CallerMode && CalleeMode);
   }
 
   // FIXME: Inlining should be OK for dx10-clamp, since the caller's mode should

diff  --git a/llvm/test/Transforms/Inline/AMDGPU/inline-denormal-fp-math.ll b/llvm/test/Transforms/Inline/AMDGPU/inline-denormal-fp-math.ll
new file mode 100644
index 000000000000..8d2c3d9a6f31
--- /dev/null
+++ b/llvm/test/Transforms/Inline/AMDGPU/inline-denormal-fp-math.ll
@@ -0,0 +1,79 @@
+; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
+; RUN: opt -mtriple=amdgcn-amd-amdhsa -S -inline < %s | FileCheck %s
+; RUN: opt -mtriple=amdgcn-amd-amdhsa -S -passes='cgscc(inline)' < %s | FileCheck %s
+
+define i32 @func_default() #0 {
+; CHECK-LABEL: @func_default(
+; CHECK-NEXT:    ret i32 0
+;
+  ret i32 0
+}
+
+define i32 @func_denormal_fp_math_ieee_ieee() #1 {
+; CHECK-LABEL: @func_denormal_fp_math_ieee_ieee(
+; CHECK-NEXT:    ret i32 0
+;
+  ret i32 0
+}
+
+define i32 @func_denormal_fp_math_flush_flush() #2 {
+; CHECK-LABEL: @func_denormal_fp_math_flush_flush(
+; CHECK-NEXT:    ret i32 0
+;
+  ret i32 0
+}
+
+define i32 @call_func_ieee_ieee_from_flush_flush() #2 {
+; CHECK-LABEL: @call_func_ieee_ieee_from_flush_flush(
+; CHECK-NEXT:    ret i32 0
+;
+  %call = call i32 @func_denormal_fp_math_ieee_ieee()
+  ret i32 %call
+}
+
+define i32 @call_func_flush_flush_from_ieee_ieee() #1 {
+; CHECK-LABEL: @call_func_flush_flush_from_ieee_ieee(
+; CHECK-NEXT:    [[CALL:%.*]] = call i32 @func_denormal_fp_math_flush_flush()
+; CHECK-NEXT:    ret i32 [[CALL]]
+;
+  %call = call i32 @func_denormal_fp_math_flush_flush()
+  ret i32 %call
+}
+
+define i32 @func_denormal_fp_math_flush_ieee() #3 {
+; CHECK-LABEL: @func_denormal_fp_math_flush_ieee(
+; CHECK-NEXT:    ret i32 0
+;
+  ret i32 0
+}
+
+define i32 @func_denormal_fp_math_ieee_flush() #4 {
+; CHECK-LABEL: @func_denormal_fp_math_ieee_flush(
+; CHECK-NEXT:    ret i32 0
+;
+  ret i32 0
+}
+
+define i32 @call_func_flush_ieee_from_ieee_ieee() #1 {
+; CHECK-LABEL: @call_func_flush_ieee_from_ieee_ieee(
+; CHECK-NEXT:    [[CALL:%.*]] = call i32 @func_denormal_fp_math_flush_ieee()
+; CHECK-NEXT:    ret i32 [[CALL]]
+;
+  %call = call i32 @func_denormal_fp_math_flush_ieee()
+  ret i32 %call
+}
+
+define i32 @call_func_ieee_flush_from_ieee_ieee() #1 {
+; CHECK-LABEL: @call_func_ieee_flush_from_ieee_ieee(
+; CHECK-NEXT:    [[CALL:%.*]] = call i32 @func_denormal_fp_math_ieee_flush()
+; CHECK-NEXT:    ret i32 [[CALL]]
+;
+  %call = call i32 @func_denormal_fp_math_ieee_flush()
+  ret i32 %call
+}
+
+attributes #0 = { nounwind }
+attributes #1 = { nounwind "denormal-fp-math"="ieee,ieee" }
+attributes #2 = { nounwind "denormal-fp-math"="preserve-sign,preserve-sign" }
+attributes #3 = { nounwind "denormal-fp-math"="preserve-sign,ieee" }
+attributes #4 = { nounwind "denormal-fp-math"="ieee,preserve-sign" }


        


More information about the llvm-commits mailing list