[PATCH] D39951: AMDGPU: Implement computeKnownBitsForTargetNode for mbcnt
Matt Arsenault via Phabricator via llvm-commits
llvm-commits at lists.llvm.org
Sun Nov 12 20:59:25 PST 2017
arsenm created this revision.
Herald added subscribers: t-tye, tpr, dstuttard, yaxunl, nhaehnle, wdng, kzhuravl.
https://reviews.llvm.org/D39951
Files:
lib/Target/AMDGPU/AMDGPUISelLowering.cpp
lib/Target/AMDGPU/AMDGPUSubtarget.h
test/CodeGen/AMDGPU/llvm.amdgcn.mbcnt.ll
Index: test/CodeGen/AMDGPU/llvm.amdgcn.mbcnt.ll
===================================================================
--- test/CodeGen/AMDGPU/llvm.amdgcn.mbcnt.ll
+++ test/CodeGen/AMDGPU/llvm.amdgcn.mbcnt.ll
@@ -14,6 +14,24 @@
ret void
}
+; GCN-LABEL: {{^}}mbcnt_lo_known_bits:
+; GCN: v_mbcnt_lo_u32_b32
+; GCN-NOT: and
+define i32 @mbcnt_lo_known_bits(i32 %x, i32 %y) #0 {
+ %lo = call i32 @llvm.amdgcn.mbcnt.lo(i32 %x, i32 %y)
+ %mask = and i32 %lo, 63
+ ret i32 %mask
+}
+
+; GCN-LABEL: {{^}}mbcnt_hi_known_bits:
+; GCN: v_mbcnt_hi_u32_b32
+; GCN-NOT: and
+define i32 @mbcnt_hi_known_bits(i32 %x, i32 %y) #0 {
+ %hi = call i32 @llvm.amdgcn.mbcnt.hi(i32 %x, i32 %y)
+ %mask = and i32 %hi, 63
+ ret i32 %mask
+}
+
declare i32 @llvm.amdgcn.mbcnt.lo(i32, i32) #0
declare i32 @llvm.amdgcn.mbcnt.hi(i32, i32) #0
declare void @llvm.amdgcn.exp.f32(i32, i32, float, float, float, float, i1, i1) #1
Index: lib/Target/AMDGPU/AMDGPUSubtarget.h
===================================================================
--- lib/Target/AMDGPU/AMDGPUSubtarget.h
+++ lib/Target/AMDGPU/AMDGPUSubtarget.h
@@ -229,6 +229,10 @@
return WavefrontSize;
}
+ unsigned getWavefrontSizeLog2() const {
+ return Log2_32(WavefrontSize);
+ }
+
int getLocalMemorySize() const {
return LocalMemorySize;
}
Index: lib/Target/AMDGPU/AMDGPUISelLowering.cpp
===================================================================
--- lib/Target/AMDGPU/AMDGPUISelLowering.cpp
+++ lib/Target/AMDGPU/AMDGPUISelLowering.cpp
@@ -4067,6 +4067,20 @@
Known.Zero.setHighBits(32 - MaxValBits);
break;
}
+ case ISD::INTRINSIC_WO_CHAIN: {
+ unsigned IID = cast<ConstantSDNode>(Op.getOperand(0))->getZExtValue();
+ switch (IID) {
+ case Intrinsic::amdgcn_mbcnt_lo:
+ case Intrinsic::amdgcn_mbcnt_hi: {
+ // These return at most the wavefront size - 1.
+ unsigned Size = Op.getValueType().getSizeInBits();
+ Known.Zero.setHighBits(Size- Subtarget->getWavefrontSizeLog2());
+ break;
+ }
+ default:
+ break;
+ }
+ }
}
}
-------------- next part --------------
A non-text attachment was scrubbed...
Name: D39951.122609.patch
Type: text/x-patch
Size: 2067 bytes
Desc: not available
URL: <http://lists.llvm.org/pipermail/llvm-commits/attachments/20171113/afac7dfa/attachment.bin>
More information about the llvm-commits
mailing list