[llvm] 0fa1743 - [LICM] Add test for noalias call (NFC)

Nikita Popov via llvm-commits llvm-commits at lists.llvm.org
Thu Jan 6 02:46:39 PST 2022


Author: Nikita Popov
Date: 2022-01-06T11:46:27+01:00
New Revision: 0fa174398bfd7040128340bae03228838ee6082e

URL: https://github.com/llvm/llvm-project/commit/0fa174398bfd7040128340bae03228838ee6082e
DIFF: https://github.com/llvm/llvm-project/commit/0fa174398bfd7040128340bae03228838ee6082e.diff

LOG: [LICM] Add test for noalias call (NFC)

Add a test with a noalias call that is not a known allocation
function.

Added: 
    

Modified: 
    llvm/test/Transforms/LICM/promote-tls.ll

Removed: 
    


################################################################################
diff  --git a/llvm/test/Transforms/LICM/promote-tls.ll b/llvm/test/Transforms/LICM/promote-tls.ll
index abb9d96c3ea09..a0c966eee79a1 100644
--- a/llvm/test/Transforms/LICM/promote-tls.ll
+++ b/llvm/test/Transforms/LICM/promote-tls.ll
@@ -1,5 +1,6 @@
-; RUN: opt -tbaa -basic-aa -licm -S < %s | FileCheck %s
-; RUN: opt -aa-pipeline=tbaa,basic-aa -passes='require<aa>,require<targetir>,require<scalar-evolution>,require<opt-remark-emit>,loop-mssa(licm)' -S %s | FileCheck %s
+; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
+; RUN: opt -licm -S < %s | FileCheck %s
+; RUN: opt -passes='loop-mssa(licm)' -S %s | FileCheck %s
 
 ; If we can prove a local is thread local, we can insert stores during
 ; promotion which wouldn't be legal otherwise.
@@ -12,8 +13,36 @@ target triple = "x86_64-linux-generic"
 declare i8* @malloc(i64)
 
 ; Exercise the TLS case
-; CHECK-LABEL: @test
 define i32* @test(i32 %n) {
+; CHECK-LABEL: @test(
+; CHECK-NEXT:  entry:
+; CHECK-NEXT:    [[MEM:%.*]] = call noalias dereferenceable(16) i8* @malloc(i64 16)
+; CHECK-NEXT:    [[ADDR:%.*]] = bitcast i8* [[MEM]] to i32*
+; CHECK-NEXT:    br label [[FOR_BODY_LR_PH:%.*]]
+; CHECK:       for.body.lr.ph:
+; CHECK-NEXT:    [[ADDR_PROMOTED:%.*]] = load i32, i32* [[ADDR]], align 4
+; CHECK-NEXT:    br label [[FOR_HEADER:%.*]]
+; CHECK:       for.header:
+; CHECK-NEXT:    [[NEW1:%.*]] = phi i32 [ [[ADDR_PROMOTED]], [[FOR_BODY_LR_PH]] ], [ [[NEW:%.*]], [[FOR_BODY:%.*]] ]
+; CHECK-NEXT:    [[I_02:%.*]] = phi i32 [ 0, [[FOR_BODY_LR_PH]] ], [ [[INC:%.*]], [[FOR_BODY]] ]
+; CHECK-NEXT:    [[GUARD:%.*]] = load atomic i8*, i8** @p monotonic, align 8
+; CHECK-NEXT:    [[EXITCMP:%.*]] = icmp eq i8* [[GUARD]], null
+; CHECK-NEXT:    br i1 [[EXITCMP]], label [[FOR_BODY]], label [[EARLY_EXIT:%.*]]
+; CHECK:       early-exit:
+; CHECK-NEXT:    [[NEW1_LCSSA:%.*]] = phi i32 [ [[NEW1]], [[FOR_HEADER]] ]
+; CHECK-NEXT:    store i32 [[NEW1_LCSSA]], i32* [[ADDR]], align 4
+; CHECK-NEXT:    ret i32* null
+; CHECK:       for.body:
+; CHECK-NEXT:    [[NEW]] = add i32 [[NEW1]], 1
+; CHECK-NEXT:    [[INC]] = add nsw i32 [[I_02]], 1
+; CHECK-NEXT:    [[CMP:%.*]] = icmp slt i32 [[INC]], [[N:%.*]]
+; CHECK-NEXT:    br i1 [[CMP]], label [[FOR_HEADER]], label [[FOR_COND_FOR_END_CRIT_EDGE:%.*]]
+; CHECK:       for.cond.for.end_crit_edge:
+; CHECK-NEXT:    [[NEW_LCSSA:%.*]] = phi i32 [ [[NEW]], [[FOR_BODY]] ]
+; CHECK-NEXT:    [[SPLIT:%.*]] = phi i32* [ [[ADDR]], [[FOR_BODY]] ]
+; CHECK-NEXT:    store i32 [[NEW_LCSSA]], i32* [[ADDR]], align 4
+; CHECK-NEXT:    ret i32* null
+;
 entry:
   ;; ignore the required null check for simplicity
   %mem = call dereferenceable(16) noalias i8* @malloc(i64 16)
@@ -21,8 +50,6 @@ entry:
   br label %for.body.lr.ph
 
 for.body.lr.ph:                                   ; preds = %entry
-; CHECK-LABEL: for.body.lr.ph:
-; CHECK-NEXT: %addr.promoted = load i32, i32* %addr, align 4
   br label %for.header
 
 for.header:
@@ -34,8 +61,6 @@ for.header:
   br i1 %exitcmp, label %for.body, label %early-exit
 
 early-exit:
-; CHECK-LABEL: early-exit:
-; CHECK: store i32 %new1.lcssa, i32* %addr, align 4
   ret i32* null
 
 for.body:
@@ -46,23 +71,47 @@ for.body:
   br i1 %cmp, label %for.header, label %for.cond.for.end_crit_edge
 
 for.cond.for.end_crit_edge:                       ; preds = %for.body
-; CHECK-LABEL: for.cond.for.end_crit_edge:
-; CHECK: store i32 %new.lcssa, i32* %addr, align 4
   %split = phi i32* [ %addr, %for.body ]
   ret i32* null
 }
 
 ; Stack allocations can also be thread-local
-; CHECK-LABEL: @test2
 define i32* @test2(i32 %n) {
+; CHECK-LABEL: @test2(
+; CHECK-NEXT:  entry:
+; CHECK-NEXT:    [[MEM:%.*]] = alloca i8, i32 16, align 1
+; CHECK-NEXT:    [[ADDR:%.*]] = bitcast i8* [[MEM]] to i32*
+; CHECK-NEXT:    br label [[FOR_BODY_LR_PH:%.*]]
+; CHECK:       for.body.lr.ph:
+; CHECK-NEXT:    [[ADDR_PROMOTED:%.*]] = load i32, i32* [[ADDR]], align 4
+; CHECK-NEXT:    br label [[FOR_HEADER:%.*]]
+; CHECK:       for.header:
+; CHECK-NEXT:    [[NEW1:%.*]] = phi i32 [ [[ADDR_PROMOTED]], [[FOR_BODY_LR_PH]] ], [ [[NEW:%.*]], [[FOR_BODY:%.*]] ]
+; CHECK-NEXT:    [[I_02:%.*]] = phi i32 [ 0, [[FOR_BODY_LR_PH]] ], [ [[INC:%.*]], [[FOR_BODY]] ]
+; CHECK-NEXT:    [[GUARD:%.*]] = load atomic i8*, i8** @p monotonic, align 8
+; CHECK-NEXT:    [[EXITCMP:%.*]] = icmp eq i8* [[GUARD]], null
+; CHECK-NEXT:    br i1 [[EXITCMP]], label [[FOR_BODY]], label [[EARLY_EXIT:%.*]]
+; CHECK:       early-exit:
+; CHECK-NEXT:    [[NEW1_LCSSA:%.*]] = phi i32 [ [[NEW1]], [[FOR_HEADER]] ]
+; CHECK-NEXT:    store i32 [[NEW1_LCSSA]], i32* [[ADDR]], align 4
+; CHECK-NEXT:    ret i32* null
+; CHECK:       for.body:
+; CHECK-NEXT:    [[NEW]] = add i32 [[NEW1]], 1
+; CHECK-NEXT:    [[INC]] = add nsw i32 [[I_02]], 1
+; CHECK-NEXT:    [[CMP:%.*]] = icmp slt i32 [[INC]], [[N:%.*]]
+; CHECK-NEXT:    br i1 [[CMP]], label [[FOR_HEADER]], label [[FOR_COND_FOR_END_CRIT_EDGE:%.*]]
+; CHECK:       for.cond.for.end_crit_edge:
+; CHECK-NEXT:    [[NEW_LCSSA:%.*]] = phi i32 [ [[NEW]], [[FOR_BODY]] ]
+; CHECK-NEXT:    [[SPLIT:%.*]] = phi i32* [ [[ADDR]], [[FOR_BODY]] ]
+; CHECK-NEXT:    store i32 [[NEW_LCSSA]], i32* [[ADDR]], align 4
+; CHECK-NEXT:    ret i32* null
+;
 entry:
   %mem = alloca i8, i32 16
   %addr = bitcast i8* %mem to i32*
   br label %for.body.lr.ph
 
 for.body.lr.ph:                                   ; preds = %entry
-; CHECK-LABEL: for.body.lr.ph:
-; CHECK-NEXT: %addr.promoted = load i32, i32* %addr, align 4
   br label %for.header
 
 for.header:
@@ -74,8 +123,6 @@ for.header:
   br i1 %exitcmp, label %for.body, label %early-exit
 
 early-exit:
-; CHECK-LABEL: early-exit:
-; CHECK: store i32 %new1.lcssa, i32* %addr, align 4
   ret i32* null
 
 for.body:
@@ -86,20 +133,103 @@ for.body:
   br i1 %cmp, label %for.header, label %for.cond.for.end_crit_edge
 
 for.cond.for.end_crit_edge:                       ; preds = %for.body
-; CHECK-LABEL: for.cond.for.end_crit_edge:
-; CHECK: store i32 %new.lcssa, i32* %addr, align 4
+  %split = phi i32* [ %addr, %for.body ]
+  ret i32* null
+}
+
+declare noalias i8* @custom_malloc(i64)
+
+; Custom allocation function marked via noalias.
+define i32* @test_custom_malloc(i32 %n) {
+; CHECK-LABEL: @test_custom_malloc(
+; CHECK-NEXT:  entry:
+; CHECK-NEXT:    [[MEM:%.*]] = call noalias dereferenceable(16) i8* @custom_malloc(i64 16)
+; CHECK-NEXT:    [[ADDR:%.*]] = bitcast i8* [[MEM]] to i32*
+; CHECK-NEXT:    br label [[FOR_BODY_LR_PH:%.*]]
+; CHECK:       for.body.lr.ph:
+; CHECK-NEXT:    [[ADDR_PROMOTED:%.*]] = load i32, i32* [[ADDR]], align 4
+; CHECK-NEXT:    br label [[FOR_HEADER:%.*]]
+; CHECK:       for.header:
+; CHECK-NEXT:    [[NEW1:%.*]] = phi i32 [ [[ADDR_PROMOTED]], [[FOR_BODY_LR_PH]] ], [ [[NEW:%.*]], [[FOR_BODY:%.*]] ]
+; CHECK-NEXT:    [[I_02:%.*]] = phi i32 [ 0, [[FOR_BODY_LR_PH]] ], [ [[INC:%.*]], [[FOR_BODY]] ]
+; CHECK-NEXT:    [[GUARD:%.*]] = load volatile i8*, i8** @p, align 8
+; CHECK-NEXT:    [[EXITCMP:%.*]] = icmp eq i8* [[GUARD]], null
+; CHECK-NEXT:    br i1 [[EXITCMP]], label [[FOR_BODY]], label [[EARLY_EXIT:%.*]]
+; CHECK:       early-exit:
+; CHECK-NEXT:    ret i32* null
+; CHECK:       for.body:
+; CHECK-NEXT:    [[NEW]] = add i32 [[NEW1]], 1
+; CHECK-NEXT:    store i32 [[NEW]], i32* [[ADDR]], align 4
+; CHECK-NEXT:    [[INC]] = add nsw i32 [[I_02]], 1
+; CHECK-NEXT:    [[CMP:%.*]] = icmp slt i32 [[INC]], [[N:%.*]]
+; CHECK-NEXT:    br i1 [[CMP]], label [[FOR_HEADER]], label [[FOR_COND_FOR_END_CRIT_EDGE:%.*]]
+; CHECK:       for.cond.for.end_crit_edge:
+; CHECK-NEXT:    [[SPLIT:%.*]] = phi i32* [ [[ADDR]], [[FOR_BODY]] ]
+; CHECK-NEXT:    ret i32* null
+;
+entry:
+  %mem = call dereferenceable(16) noalias i8* @custom_malloc(i64 16)
+  %addr = bitcast i8* %mem to i32*
+  br label %for.body.lr.ph
+
+for.body.lr.ph:                                   ; preds = %entry
+  br label %for.header
+
+for.header:
+  %i.02 = phi i32 [ 0, %for.body.lr.ph ], [ %inc, %for.body ]
+  %old = load i32, i32* %addr, align 4
+  ; deliberate impossible to analyze branch
+  %guard = load volatile i8*, i8** @p
+  %exitcmp = icmp eq i8* %guard, null
+  br i1 %exitcmp, label %for.body, label %early-exit
+
+early-exit:
+  ret i32* null
+
+for.body:
+  %new = add i32 %old, 1
+  store i32 %new, i32* %addr, align 4
+  %inc = add nsw i32 %i.02, 1
+  %cmp = icmp slt i32 %inc, %n
+  br i1 %cmp, label %for.header, label %for.cond.for.end_crit_edge
+
+for.cond.for.end_crit_edge:                       ; preds = %for.body
   %split = phi i32* [ %addr, %for.body ]
   ret i32* null
 }
 
 declare i8* @not_malloc(i64)
 
-; Negative test - not TLS
-; CHECK-LABEL: @test_neg
-define i32* @test_neg(i32 %n) {
+; Negative test - not an allocation function.
+define i32* @test_neg_not_malloc(i32 %n) {
+; CHECK-LABEL: @test_neg_not_malloc(
+; CHECK-NEXT:  entry:
+; CHECK-NEXT:    [[MEM:%.*]] = call dereferenceable(16) i8* @not_malloc(i64 16)
+; CHECK-NEXT:    [[ADDR:%.*]] = bitcast i8* [[MEM]] to i32*
+; CHECK-NEXT:    br label [[FOR_BODY_LR_PH:%.*]]
+; CHECK:       for.body.lr.ph:
+; CHECK-NEXT:    br label [[FOR_HEADER:%.*]]
+; CHECK:       for.header:
+; CHECK-NEXT:    [[I_02:%.*]] = phi i32 [ 0, [[FOR_BODY_LR_PH]] ], [ [[INC:%.*]], [[FOR_BODY:%.*]] ]
+; CHECK-NEXT:    [[OLD:%.*]] = load i32, i32* [[ADDR]], align 4
+; CHECK-NEXT:    [[GUARD:%.*]] = load volatile i8*, i8** @p, align 8
+; CHECK-NEXT:    [[EXITCMP:%.*]] = icmp eq i8* [[GUARD]], null
+; CHECK-NEXT:    br i1 [[EXITCMP]], label [[FOR_BODY]], label [[EARLY_EXIT:%.*]]
+; CHECK:       early-exit:
+; CHECK-NEXT:    ret i32* null
+; CHECK:       for.body:
+; CHECK-NEXT:    [[NEW:%.*]] = add i32 [[OLD]], 1
+; CHECK-NEXT:    store i32 [[NEW]], i32* [[ADDR]], align 4
+; CHECK-NEXT:    [[INC]] = add nsw i32 [[I_02]], 1
+; CHECK-NEXT:    [[CMP:%.*]] = icmp slt i32 [[INC]], [[N:%.*]]
+; CHECK-NEXT:    br i1 [[CMP]], label [[FOR_HEADER]], label [[FOR_COND_FOR_END_CRIT_EDGE:%.*]]
+; CHECK:       for.cond.for.end_crit_edge:
+; CHECK-NEXT:    [[SPLIT:%.*]] = phi i32* [ [[ADDR]], [[FOR_BODY]] ]
+; CHECK-NEXT:    ret i32* null
+;
 entry:
   ;; ignore the required null check for simplicity
-  %mem = call dereferenceable(16) noalias i8* @not_malloc(i64 16)
+  %mem = call dereferenceable(16) i8* @not_malloc(i64 16)
   %addr = bitcast i8* %mem to i32*
   br label %for.body.lr.ph
 
@@ -115,13 +245,9 @@ for.header:
   br i1 %exitcmp, label %for.body, label %early-exit
 
 early-exit:
-; CHECK-LABEL: early-exit:
-; CHECK-NOT: store
   ret i32* null
 
 for.body:
-; CHECK-LABEL: for.body:
-; CHECK: store i32 %new, i32* %addr, align 4
   %new = add i32 %old, 1
   store i32 %new, i32* %addr, align 4
   %inc = add nsw i32 %i.02, 1
@@ -129,16 +255,38 @@ for.body:
   br i1 %cmp, label %for.header, label %for.cond.for.end_crit_edge
 
 for.cond.for.end_crit_edge:                       ; preds = %for.body
-; CHECK-LABEL: for.cond.for.end_crit_edge:
-; CHECK-NOT: store
   %split = phi i32* [ %addr, %for.body ]
   ret i32* null
 }
 
 ; Negative test - can't speculate load since branch
 ; may control alignment
-; CHECK-LABEL: @test_neg2
 define i32* @test_neg2(i32 %n) {
+; CHECK-LABEL: @test_neg2(
+; CHECK-NEXT:  entry:
+; CHECK-NEXT:    [[MEM:%.*]] = call noalias dereferenceable(16) i8* @malloc(i64 16)
+; CHECK-NEXT:    [[ADDR:%.*]] = bitcast i8* [[MEM]] to i32*
+; CHECK-NEXT:    br label [[FOR_BODY_LR_PH:%.*]]
+; CHECK:       for.body.lr.ph:
+; CHECK-NEXT:    br label [[FOR_HEADER:%.*]]
+; CHECK:       for.header:
+; CHECK-NEXT:    [[I_02:%.*]] = phi i32 [ 0, [[FOR_BODY_LR_PH]] ], [ [[INC:%.*]], [[FOR_BODY:%.*]] ]
+; CHECK-NEXT:    [[GUARD:%.*]] = load volatile i8*, i8** @p, align 8
+; CHECK-NEXT:    [[EXITCMP:%.*]] = icmp eq i8* [[GUARD]], null
+; CHECK-NEXT:    br i1 [[EXITCMP]], label [[FOR_BODY]], label [[EARLY_EXIT:%.*]]
+; CHECK:       early-exit:
+; CHECK-NEXT:    ret i32* null
+; CHECK:       for.body:
+; CHECK-NEXT:    [[OLD:%.*]] = load i32, i32* [[ADDR]], align 4
+; CHECK-NEXT:    [[NEW:%.*]] = add i32 [[OLD]], 1
+; CHECK-NEXT:    store i32 [[NEW]], i32* [[ADDR]], align 4
+; CHECK-NEXT:    [[INC]] = add nsw i32 [[I_02]], 1
+; CHECK-NEXT:    [[CMP:%.*]] = icmp slt i32 [[INC]], [[N:%.*]]
+; CHECK-NEXT:    br i1 [[CMP]], label [[FOR_HEADER]], label [[FOR_COND_FOR_END_CRIT_EDGE:%.*]]
+; CHECK:       for.cond.for.end_crit_edge:
+; CHECK-NEXT:    [[SPLIT:%.*]] = phi i32* [ [[ADDR]], [[FOR_BODY]] ]
+; CHECK-NEXT:    ret i32* null
+;
 entry:
   ;; ignore the required null check for simplicity
   %mem = call dereferenceable(16) noalias i8* @malloc(i64 16)
@@ -156,13 +304,9 @@ for.header:
   br i1 %exitcmp, label %for.body, label %early-exit
 
 early-exit:
-; CHECK-LABEL: early-exit:
-; CHECK-NOT: store
   ret i32* null
 
 for.body:
-; CHECK-LABEL: for.body:
-; CHECK: store i32 %new, i32* %addr, align 4
   %old = load i32, i32* %addr, align 4
   %new = add i32 %old, 1
   store i32 %new, i32* %addr, align 4
@@ -171,8 +315,6 @@ for.body:
   br i1 %cmp, label %for.header, label %for.cond.for.end_crit_edge
 
 for.cond.for.end_crit_edge:                       ; preds = %for.body
-; CHECK-LABEL: for.cond.for.end_crit_edge:
-; CHECK-NOT: store
   %split = phi i32* [ %addr, %for.body ]
   ret i32* null
 }


        


More information about the llvm-commits mailing list