[llvm] [InstCombineCompares] Replace the sqrt in if-condition (PR #91707)

Fri May 10 04:18:52 PDT 2024

================
@@ -0,0 +1,87 @@
+; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
+; RUN: opt < %s -passes=instcombine -S -replace-sqrt-compare-by-square=true | FileCheck %s -check-prefix=OPT-TRUE
+; RUN: opt < %s -passes=instcombine -S | FileCheck %s -check-prefix=OPT-FALSE
+
+define i1 @foo1_fast(float %a, float %b) {
+; OPT-TRUE-LABEL: @foo1_fast(
+; OPT-TRUE-NEXT:    [[FCMP:%.*]] = fcmp fast ogt float %a, %b
+; OPT-TRUE-NEXT:    ret i1 [[FCMP]]
+;
+; OPT-FALSE-LABEL: @foo1_fast(
+; OPT-FALSE-NEXT:    %c = call fast float @llvm.sqrt.f32(float %a)
+; OPT-FALSE-NEXT:    %d = call fast float @llvm.sqrt.f32(float %b)
+; OPT-FALSE-NEXT:    [[FCMP:%.*]] = fcmp fast ogt float %c, %d
+; OPT-FALSE-NEXT:    ret i1 [[FCMP]]
+;
+  %c = call fast float @llvm.sqrt.f32(float %a)
+  %d = call fast float @llvm.sqrt.f32(float %b)
+  %e = fcmp fast ogt float %c, %d
+  ret i1 %e
+}
+
+define i1 @foo2_fast(float %a, float %b) {
+; OPT-TRUE-LABEL: @foo2_fast(
+; OPT-TRUE-NEXT:    [[FMUL:%.*]] = fmul fast float %b, %b
+; OPT-TRUE-NEXT:    [[SIGN:%.*]] = call fast float @llvm.copysign.f32(float [[FMUL]], float %b)
+; OPT-TRUE-NEXT:    [[FCMP:%.*]] = fcmp fast ogt float [[SIGN]], %a
+; OPT-TRUE-NEXT:    ret i1 [[FCMP]]
+;
+; OPT-FALSE-LABEL: @foo2_fast(
+; OPT-FALSE-NEXT:    [[SQRT:%.*]] = call fast float @llvm.sqrt.f32(float %a)
+; OPT-FALSE-NEXT:    [[FCMP:%.*]] = fcmp fast olt float [[SQRT]], %b
+; OPT-FALSE-NEXT:    ret i1 [[FCMP]]
+;
+  %c = call fast float @llvm.sqrt.f32(float %a)
+  %d = fcmp fast ogt float %b, %c
+  ret i1 %d
+}
+
+define i1 @foo3_fast(float %a, float %b) {
+; OPT-TRUE-LABEL: @foo3_fast(
+; OPT-TRUE-NEXT:    [[FMUL:%.*]] = fmul fast float %b, %b
+; OPT-TRUE-NEXT:    [[SIGN:%.*]] = call fast float @llvm.copysign.f32(float [[FMUL]], float %b)
+; OPT-TRUE-NEXT:    [[FCMP:%.*]] = fcmp fast olt float [[SIGN]], %a
+; OPT-TRUE-NEXT:    ret i1 [[FCMP]]
+;
+; OPT-FALSE-LABEL: @foo3_fast(
+; OPT-FALSE-NEXT:    [[SQRT:%.*]] = call fast float @llvm.sqrt.f32(float %a)
+; OPT-FALSE-NEXT:    [[FCMP:%.*]] = fcmp fast ogt float [[SQRT]], %b
+; OPT-FALSE-NEXT:    ret i1 [[FCMP]]
+;
+  %c = call fast float @llvm.sqrt.f32(float %a)
+  %d = fcmp fast ogt float %c, %b
+  ret i1 %d
+}
+
+define i1 @foo1_no_fast(float %a, float %b) {
+; OPT-TRUE-LABEL: @foo1_no_fast(
+; OPT-TRUE:    [[FCMP:%.*]] = fcmp ogt float %c, %d
+; OPT-TRUE-NEXT:    ret i1 [[FCMP]]
+;
+  %c = call float @llvm.sqrt.f32(float %a)
+  %d = call float @llvm.sqrt.f32(float %b)
+  %e = fcmp ogt float %c, %d
----------------
arsenm wrote:

This should be tested with the full range of compare predicates, particularly the unordered ones (e.g. `ugt`, `ult`, `une`).

https://github.com/llvm/llvm-project/pull/91707