[llvm] f05bce8 - [AMDGPU] Add some missing check prefixes and tweak test
Jay Foad via llvm-commits
llvm-commits at lists.llvm.org
Fri Jul 17 04:59:13 PDT 2020
Author: Jay Foad
Date: 2020-07-17T12:57:47+01:00
New Revision: f05bce86af32d7b5cf1ab28b3abf6ee473bf3ef1
URL: https://github.com/llvm/llvm-project/commit/f05bce86af32d7b5cf1ab28b3abf6ee473bf3ef1
DIFF: https://github.com/llvm/llvm-project/commit/f05bce86af32d7b5cf1ab28b3abf6ee473bf3ef1.diff
LOG: [AMDGPU] Add some missing check prefixes and tweak test
The test needed some extra ALU instructions to prevent it from being
memory bound.
Added:
Modified:
llvm/test/CodeGen/AMDGPU/perfhint.ll
Removed:
################################################################################
diff --git a/llvm/test/CodeGen/AMDGPU/perfhint.ll b/llvm/test/CodeGen/AMDGPU/perfhint.ll
index 375a699e040e..1fef1423ac4f 100644
--- a/llvm/test/CodeGen/AMDGPU/perfhint.ll
+++ b/llvm/test/CodeGen/AMDGPU/perfhint.ll
@@ -30,22 +30,25 @@ bb:
}
; GCN-LABEL: {{^}}test_large_stride:
-; MemoryBound: 0
-; WaveLimiterHint : 1
+; GCN: MemoryBound: 0
+; GCN: WaveLimiterHint : 1
define amdgpu_kernel void @test_large_stride(i32 addrspace(1)* nocapture %arg) {
bb:
%tmp = getelementptr inbounds i32, i32 addrspace(1)* %arg, i64 4096
%tmp1 = load i32, i32 addrspace(1)* %tmp, align 4
+ %mul1 = mul i32 %tmp1, %tmp1
%tmp2 = getelementptr inbounds i32, i32 addrspace(1)* %arg, i64 1
- store i32 %tmp1, i32 addrspace(1)* %tmp2, align 4
+ store i32 %mul1, i32 addrspace(1)* %tmp2, align 4
%tmp3 = getelementptr inbounds i32, i32 addrspace(1)* %arg, i64 8192
%tmp4 = load i32, i32 addrspace(1)* %tmp3, align 4
+ %mul4 = mul i32 %tmp4, %tmp4
%tmp5 = getelementptr inbounds i32, i32 addrspace(1)* %arg, i64 2
- store i32 %tmp4, i32 addrspace(1)* %tmp5, align 4
+ store i32 %mul4, i32 addrspace(1)* %tmp5, align 4
%tmp6 = getelementptr inbounds i32, i32 addrspace(1)* %arg, i64 12288
%tmp7 = load i32, i32 addrspace(1)* %tmp6, align 4
+ %mul7 = mul i32 %tmp7, %tmp7
%tmp8 = getelementptr inbounds i32, i32 addrspace(1)* %arg, i64 3
- store i32 %tmp7, i32 addrspace(1)* %tmp8, align 4
+ store i32 %mul7, i32 addrspace(1)* %tmp8, align 4
ret void
}
More information about the llvm-commits
mailing list