[PATCH] D43765: [InstSimplify] loosen FMF for sqrt(X) * sqrt(X) --> X
Sanjay Patel via Phabricator via llvm-commits
llvm-commits at lists.llvm.org
Sun Mar 18 07:15:01 PDT 2018
This revision was automatically updated to reflect the committed changes.
Closed by commit rL327796: [InstSimplify] loosen FMF for sqrt(X) * sqrt(X) --> X (authored by spatel).
Changed prior to commit:
https://reviews.llvm.org/D43765?vs=138080&id=138848#toc
Repository:
rL LLVM
https://reviews.llvm.org/D43765
Files:
llvm/trunk/lib/Analysis/InstructionSimplify.cpp
llvm/trunk/test/Transforms/InstSimplify/fast-math.ll
Index: llvm/trunk/test/Transforms/InstSimplify/fast-math.ll
===================================================================
--- llvm/trunk/test/Transforms/InstSimplify/fast-math.ll
+++ llvm/trunk/test/Transforms/InstSimplify/fast-math.ll
@@ -323,16 +323,51 @@
}
; PR21126: http://llvm.org/bugs/show_bug.cgi?id=21126
-; With unsafe/fast math, sqrt(X) * sqrt(X) is just X.
+; With loose math, sqrt(X) * sqrt(X) is just X.
declare double @llvm.sqrt.f64(double)
define double @sqrt_squared(double %f) {
; CHECK-LABEL: @sqrt_squared(
; CHECK-NEXT: ret double [[F:%.*]]
;
%sqrt = call double @llvm.sqrt.f64(double %f)
- %mul = fmul fast double %sqrt, %sqrt
+ %mul = fmul reassoc nnan nsz double %sqrt, %sqrt
+ ret double %mul
+}
+
+; Negative tests for the above transform: we need all 3 of those flags.
+
+define double @sqrt_squared_not_fast_enough1(double %f) {
+; CHECK-LABEL: @sqrt_squared_not_fast_enough1(
+; CHECK-NEXT: [[SQRT:%.*]] = call double @llvm.sqrt.f64(double [[F:%.*]])
+; CHECK-NEXT: [[MUL:%.*]] = fmul nnan nsz double [[SQRT]], [[SQRT]]
+; CHECK-NEXT: ret double [[MUL]]
+;
+ %sqrt = call double @llvm.sqrt.f64(double %f)
+ %mul = fmul nnan nsz double %sqrt, %sqrt
+ ret double %mul
+}
+
+define double @sqrt_squared_not_fast_enough2(double %f) {
+; CHECK-LABEL: @sqrt_squared_not_fast_enough2(
+; CHECK-NEXT: [[SQRT:%.*]] = call double @llvm.sqrt.f64(double [[F:%.*]])
+; CHECK-NEXT: [[MUL:%.*]] = fmul reassoc nnan double [[SQRT]], [[SQRT]]
+; CHECK-NEXT: ret double [[MUL]]
+;
+ %sqrt = call double @llvm.sqrt.f64(double %f)
+ %mul = fmul reassoc nnan double %sqrt, %sqrt
+ ret double %mul
+}
+
+define double @sqrt_squared_not_fast_enough3(double %f) {
+; CHECK-LABEL: @sqrt_squared_not_fast_enough3(
+; CHECK-NEXT: [[SQRT:%.*]] = call double @llvm.sqrt.f64(double [[F:%.*]])
+; CHECK-NEXT: [[MUL:%.*]] = fmul reassoc nsz double [[SQRT]], [[SQRT]]
+; CHECK-NEXT: ret double [[MUL]]
+;
+ %sqrt = call double @llvm.sqrt.f64(double %f)
+ %mul = fmul reassoc nsz double %sqrt, %sqrt
ret double %mul
}
Index: llvm/trunk/lib/Analysis/InstructionSimplify.cpp
===================================================================
--- llvm/trunk/lib/Analysis/InstructionSimplify.cpp
+++ llvm/trunk/lib/Analysis/InstructionSimplify.cpp
@@ -4249,10 +4249,13 @@
if (FMF.noNaNs() && FMF.noSignedZeros() && match(Op1, m_AnyZeroFP()))
return ConstantFP::getNullValue(Op0->getType());
- // sqrt(X) * sqrt(X) --> X
+ // sqrt(X) * sqrt(X) --> X, if we can:
+ // 1. Remove the intermediate rounding (reassociate).
+ // 2. Ignore non-zero negative numbers because sqrt would produce NAN.
+ // 3. Ignore -0.0 because sqrt(-0.0) == -0.0, but -0.0 * -0.0 == 0.0.
Value *X;
- if (FMF.isFast() && Op0 == Op1 &&
- match(Op0, m_Intrinsic<Intrinsic::sqrt>(m_Value(X))))
+ if (Op0 == Op1 && match(Op0, m_Intrinsic<Intrinsic::sqrt>(m_Value(X))) &&
+ FMF.allowReassoc() && FMF.noNaNs() && FMF.noSignedZeros())
return X;
return nullptr;
-------------- next part --------------
A non-text attachment was scrubbed...
Name: D43765.138848.patch
Type: text/x-patch
Size: 3028 bytes
Desc: not available
URL: <http://lists.llvm.org/pipermail/llvm-commits/attachments/20180318/82832659/attachment.bin>
More information about the llvm-commits mailing list