[llvm] fc06c8e - AMDGPU: Partially clean up canonicalized predicates in tablegen (#85404)
via llvm-commits
llvm-commits at lists.llvm.org
Fri Mar 15 08:39:22 PDT 2024
Author: Matt Arsenault
Date: 2024-03-15T21:09:18+05:30
New Revision: fc06c8efcbca6951f849b5c30e1c253929100a7c
URL: https://github.com/llvm/llvm-project/commit/fc06c8efcbca6951f849b5c30e1c253929100a7c
DIFF: https://github.com/llvm/llvm-project/commit/fc06c8efcbca6951f849b5c30e1c253929100a7c.diff
LOG: AMDGPU: Partially clean up canonicalized predicates in tablegen (#85404)
This was the easy case. There are more issues with some of the other
is_canonicalized* patterns. First there appears to be a tablegen bug
where the predicate is silently ignored if used as a ComplexPattern
source, and we also probably need a version with an operand.
Added:
Modified:
llvm/lib/Target/AMDGPU/SIInstrInfo.td
llvm/lib/Target/AMDGPU/SIInstructions.td
Removed:
################################################################################
diff --git a/llvm/lib/Target/AMDGPU/SIInstrInfo.td b/llvm/lib/Target/AMDGPU/SIInstrInfo.td
index 835a5a24723154..1694436bad15ce 100644
--- a/llvm/lib/Target/AMDGPU/SIInstrInfo.td
+++ b/llvm/lib/Target/AMDGPU/SIInstrInfo.td
@@ -835,6 +835,19 @@ def fp16_zeros_high_16bits : PatLeaf<(f16 VGPR_32:$src), [{
return fp16SrcZerosHighBits(N->getOpcode());
}]>;
+def is_canonicalized : PatLeaf<(fAny srcvalue:$src), [{
+ const SITargetLowering &Lowering =
+ *static_cast<const SITargetLowering *>(getTargetLowering());
+ return Lowering.isCanonicalized(*CurDAG, SDValue(N, 0));
+}]> {
+ let GISelPredicateCode = [{
+ const SITargetLowering *TLI = static_cast<const SITargetLowering *>(
+ MF.getSubtarget().getTargetLowering());
+ const MachineOperand &Dst = MI.getOperand(0);
+ assert(Dst.isDef());
+ return TLI->isCanonicalized(Dst.getReg(), MF);
+ }];
+}
//===----------------------------------------------------------------------===//
// MUBUF/SMEM Patterns
diff --git a/llvm/lib/Target/AMDGPU/SIInstructions.td b/llvm/lib/Target/AMDGPU/SIInstructions.td
index 3ab788406ecb28..1c942dcefdacea 100644
--- a/llvm/lib/Target/AMDGPU/SIInstructions.td
+++ b/llvm/lib/Target/AMDGPU/SIInstructions.td
@@ -2946,30 +2946,12 @@ def : GCNPat<
// If fcanonicalize's operand is implicitly canonicalized, we only need a copy.
let AddedComplexity = 1000 in {
-def : GCNPat<
- (is_canonicalized_1<fcanonicalize> f16:$src),
- (COPY f16:$src)
->;
-
-def : GCNPat<
- (is_canonicalized_1<fcanonicalize> v2f16:$src),
- (COPY v2f16:$src)
->;
-
-def : GCNPat<
- (is_canonicalized_1<fcanonicalize> f32:$src),
- (COPY f32:$src)
->;
-
-def : GCNPat<
- (is_canonicalized_1<fcanonicalize> v2f32:$src),
- (COPY v2f32:$src)
->;
-
-def : GCNPat<
- (is_canonicalized_1<fcanonicalize> f64:$src),
- (COPY f64:$src)
->;
+foreach vt = [f16, v2f16, f32, v2f32, f64] in {
+ def : GCNPat<
+ (fcanonicalize (vt is_canonicalized:$src)),
+ (COPY vt:$src)
+ >;
+}
}
// Prefer selecting to max when legal, but using mul is always valid.
More information about the llvm-commits
mailing list