[llvm] a409fcd - [ARM] Extra test for reverted WLS memset. NFC
David Green via llvm-commits
llvm-commits at lists.llvm.org
Wed May 26 06:54:45 PDT 2021
Author: David Green
Date: 2021-05-26T14:54:36+01:00
New Revision: a409fcddaed9ad4468d781a447fc5a4b3aac90d4
URL: https://github.com/llvm/llvm-project/commit/a409fcddaed9ad4468d781a447fc5a4b3aac90d4
DIFF: https://github.com/llvm/llvm-project/commit/a409fcddaed9ad4468d781a447fc5a4b3aac90d4.diff
LOG: [ARM] Extra test for reverted WLS memset. NFC
Added:
Modified:
llvm/test/CodeGen/Thumb2/mve-memtp-loop.ll
Removed:
################################################################################
diff --git a/llvm/test/CodeGen/Thumb2/mve-memtp-loop.ll b/llvm/test/CodeGen/Thumb2/mve-memtp-loop.ll
index 82f81ec46da4..e64cf92517c3 100644
--- a/llvm/test/CodeGen/Thumb2/mve-memtp-loop.ll
+++ b/llvm/test/CodeGen/Thumb2/mve-memtp-loop.ll
@@ -460,5 +460,93 @@ cleanup:
declare void @other()
+ at arr_56 = external dso_local local_unnamed_addr global [21 x [16 x [11 x i8]]], align 1
+define void @multilooped_exit(i32 %b) {
+; CHECK-LABEL: multilooped_exit:
+; CHECK: @ %bb.0: @ %entry
+; CHECK-NEXT: .save {r4, lr}
+; CHECK-NEXT: push {r4, lr}
+; CHECK-NEXT: cmp r0, #1
+; CHECK-NEXT: it lt
+; CHECK-NEXT: poplt {r4, pc}
+; CHECK-NEXT: .LBB18_1: @ %loop.preheader
+; CHECK-NEXT: mov.w r4, #-1
+; CHECK-NEXT: vmov.i32 q0, #0x0
+; CHECK-NEXT: b .LBB18_3
+; CHECK-NEXT: .LBB18_2: @ %loop
+; CHECK-NEXT: @ in Loop: Header=BB18_3 Depth=1
+; CHECK-NEXT: adds r4, #1
+; CHECK-NEXT: cmp.w r4, #1024
+; CHECK-NEXT: bge .LBB18_11
+; CHECK-NEXT: .LBB18_3: @ %loop
+; CHECK-NEXT: @ =>This Loop Header: Depth=1
+; CHECK-NEXT: @ Child Loop BB18_4 Depth 2
+; CHECK-NEXT: @ Child Loop BB18_6 Depth 2
+; CHECK-NEXT: @ Child Loop BB18_8 Depth 2
+; CHECK-NEXT: @ Child Loop BB18_10 Depth 2
+; CHECK-NEXT: movw r3, :lower16:arr_56
+; CHECK-NEXT: add.w r1, r0, #15
+; CHECK-NEXT: movt r3, :upper16:arr_56
+; CHECK-NEXT: lsr.w r12, r1, #4
+; CHECK-NEXT: mov r2, r3
+; CHECK-NEXT: mov r1, r0
+; CHECK-NEXT: wlstp.8 lr, r1, .LBB18_5
+; CHECK-NEXT: .LBB18_4: @ Parent Loop BB18_3 Depth=1
+; CHECK-NEXT: @ => This Inner Loop Header: Depth=2
+; CHECK-NEXT: vstrb.8 q0, [r2], #16
+; CHECK-NEXT: letp lr, .LBB18_4
+; CHECK-NEXT: .LBB18_5: @ %loop
+; CHECK-NEXT: @ in Loop: Header=BB18_3 Depth=1
+; CHECK-NEXT: mov r2, r3
+; CHECK-NEXT: mov r1, r0
+; CHECK-NEXT: wlstp.8 lr, r1, .LBB18_7
+; CHECK-NEXT: .LBB18_6: @ Parent Loop BB18_3 Depth=1
+; CHECK-NEXT: @ => This Inner Loop Header: Depth=2
+; CHECK-NEXT: vstrb.8 q0, [r2], #16
+; CHECK-NEXT: letp lr, .LBB18_6
+; CHECK-NEXT: .LBB18_7: @ %loop
+; CHECK-NEXT: @ in Loop: Header=BB18_3 Depth=1
+; CHECK-NEXT: mov r2, r3
+; CHECK-NEXT: mov r1, r0
+; CHECK-NEXT: wlstp.8 lr, r1, .LBB18_9
+; CHECK-NEXT: .LBB18_8: @ Parent Loop BB18_3 Depth=1
+; CHECK-NEXT: @ => This Inner Loop Header: Depth=2
+; CHECK-NEXT: vstrb.8 q0, [r2], #16
+; CHECK-NEXT: letp lr, .LBB18_8
+; CHECK-NEXT: .LBB18_9: @ %loop
+; CHECK-NEXT: @ in Loop: Header=BB18_3 Depth=1
+; CHECK-NEXT: mov r1, r0
+; CHECK-NEXT: subs.w lr, r12, #0
+; CHECK-NEXT: beq .LBB18_2
+; CHECK-NEXT: b .LBB18_10
+; CHECK-NEXT: .LBB18_10: @ Parent Loop BB18_3 Depth=1
+; CHECK-NEXT: @ => This Inner Loop Header: Depth=2
+; CHECK-NEXT: vctp.8 r1
+; CHECK-NEXT: subs r1, #16
+; CHECK-NEXT: vpst
+; CHECK-NEXT: vstrbt.8 q0, [r3], #16
+; CHECK-NEXT: subs.w lr, lr, #1
+; CHECK-NEXT: bne .LBB18_10
+; CHECK-NEXT: b .LBB18_2
+; CHECK-NEXT: .LBB18_11: @ %exit
+; CHECK-NEXT: pop {r4, pc}
+entry:
+ %cmp8 = icmp sgt i32 %b, 0
+ br i1 %cmp8, label %loop, label %exit
+
+loop:
+ %p = phi i32 [ 0, %entry ], [ %inc, %loop ]
+ call void @llvm.memset.p0i8.i32(i8* align 1 getelementptr ([21 x [16 x [11 x i8]]], [21 x [16 x [11 x i8]]]* @arr_56, i32 0, i32 0, i32 undef, i32 0), i8 0, i32 %b, i1 false)
+ call void @llvm.memset.p0i8.i32(i8* align 1 getelementptr ([21 x [16 x [11 x i8]]], [21 x [16 x [11 x i8]]]* @arr_56, i32 0, i32 0, i32 undef, i32 0), i8 0, i32 %b, i1 false)
+ call void @llvm.memset.p0i8.i32(i8* align 1 getelementptr ([21 x [16 x [11 x i8]]], [21 x [16 x [11 x i8]]]* @arr_56, i32 0, i32 0, i32 undef, i32 0), i8 0, i32 %b, i1 false)
+ call void @llvm.memset.p0i8.i32(i8* align 1 getelementptr ([21 x [16 x [11 x i8]]], [21 x [16 x [11 x i8]]]* @arr_56, i32 0, i32 0, i32 undef, i32 0), i8 0, i32 %b, i1 false)
+ %inc = add i32 %p, 1
+ %c = icmp slt i32 %p, 1024
+ br i1 %c, label %loop, label %exit
+
+exit:
+ ret void
+}
+
attributes #0 = { noinline optnone }
attributes #1 = { optsize }
More information about the llvm-commits
mailing list