[llvm] r352976 - AMDGPU/GlobalISel: Legalize icmp for pointer types
Matt Arsenault via llvm-commits
llvm-commits at lists.llvm.org
Sat Feb 2 15:35:15 PST 2019
Author: arsenm
Date: Sat Feb 2 15:35:15 2019
New Revision: 352976
URL: http://llvm.org/viewvc/llvm-project?rev=352976&view=rev
Log:
AMDGPU/GlobalISel: Legalize icmp for pointer types
Modified:
llvm/trunk/lib/Target/AMDGPU/AMDGPULegalizerInfo.cpp
llvm/trunk/test/CodeGen/AMDGPU/GlobalISel/legalize-icmp.mir
Modified: llvm/trunk/lib/Target/AMDGPU/AMDGPULegalizerInfo.cpp
URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/lib/Target/AMDGPU/AMDGPULegalizerInfo.cpp?rev=352976&r1=352975&r2=352976&view=diff
==============================================================================
--- llvm/trunk/lib/Target/AMDGPU/AMDGPULegalizerInfo.cpp (original)
+++ llvm/trunk/lib/Target/AMDGPU/AMDGPULegalizerInfo.cpp Sat Feb 2 15:35:15 2019
@@ -200,7 +200,16 @@ AMDGPULegalizerInfo::AMDGPULegalizerInfo
setAction({G_BLOCK_ADDR, CodePtr}, Legal);
- getActionDefinitionsBuilder({G_ICMP, G_FCMP})
+ getActionDefinitionsBuilder(G_ICMP)
+ .legalForCartesianProduct(
+ {S1}, {S32, S64, GlobalPtr, LocalPtr, ConstantPtr, PrivatePtr, FlatPtr})
+ .legalFor({{S1, S32}, {S1, S64}})
+ .widenScalarToNextPow2(1)
+ .clampScalar(1, S32, S64)
+ .scalarize(0)
+ .legalIf(all(typeIs(0, S1), isPointer(1)));
+
+ getActionDefinitionsBuilder(G_FCMP)
.legalFor({{S1, S32}, {S1, S64}})
.widenScalarToNextPow2(1)
.clampScalar(1, S32, S64)
Modified: llvm/trunk/test/CodeGen/AMDGPU/GlobalISel/legalize-icmp.mir
URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/test/CodeGen/AMDGPU/GlobalISel/legalize-icmp.mir?rev=352976&r1=352975&r2=352976&view=diff
==============================================================================
--- llvm/trunk/test/CodeGen/AMDGPU/GlobalISel/legalize-icmp.mir (original)
+++ llvm/trunk/test/CodeGen/AMDGPU/GlobalISel/legalize-icmp.mir Sat Feb 2 15:35:15 2019
@@ -164,3 +164,178 @@ body: |
S_NOP 0, implicit %3
...
+
+---
+name: test_icmp_p0
+body: |
+ bb.0.entry:
+ liveins: $vgpr0_vgpr1, $vgpr2_vgpr3
+ ; CHECK-LABEL: name: test_icmp_p0
+ ; CHECK: [[COPY:%[0-9]+]]:_(p0) = COPY $vgpr0_vgpr1
+ ; CHECK: [[COPY1:%[0-9]+]]:_(p0) = COPY $vgpr0_vgpr1
+ ; CHECK: [[ICMP:%[0-9]+]]:_(s1) = G_ICMP intpred(ne), [[COPY]](p0), [[COPY1]]
+ ; CHECK: [[SEXT:%[0-9]+]]:_(s32) = G_SEXT [[ICMP]](s1)
+ ; CHECK: $vgpr0 = COPY [[SEXT]](s32)
+ %0:_(p0) = COPY $vgpr0_vgpr1
+ %1:_(p0) = COPY $vgpr0_vgpr1
+ %2:_(s1) = G_ICMP intpred(ne), %0, %1
+ %3:_(s32) = G_SEXT %2
+ $vgpr0 = COPY %3
+...
+
+---
+name: test_icmp_p1
+body: |
+ bb.0.entry:
+ liveins: $vgpr0_vgpr1, $vgpr2_vgpr3
+ ; CHECK-LABEL: name: test_icmp_p1
+ ; CHECK: [[COPY:%[0-9]+]]:_(p1) = COPY $vgpr0_vgpr1
+ ; CHECK: [[COPY1:%[0-9]+]]:_(p1) = COPY $vgpr0_vgpr1
+ ; CHECK: [[ICMP:%[0-9]+]]:_(s1) = G_ICMP intpred(ne), [[COPY]](p1), [[COPY1]]
+ ; CHECK: [[SEXT:%[0-9]+]]:_(s32) = G_SEXT [[ICMP]](s1)
+ ; CHECK: $vgpr0 = COPY [[SEXT]](s32)
+ %0:_(p1) = COPY $vgpr0_vgpr1
+ %1:_(p1) = COPY $vgpr0_vgpr1
+ %2:_(s1) = G_ICMP intpred(ne), %0, %1
+ %3:_(s32) = G_SEXT %2
+ $vgpr0 = COPY %3
+...
+
+---
+name: test_icmp_p2
+body: |
+ bb.0.entry:
+ liveins: $vgpr0, $vgpr1
+
+ ; CHECK-LABEL: name: test_icmp_p2
+ ; CHECK: [[COPY:%[0-9]+]]:_(p2) = COPY $vgpr0
+ ; CHECK: [[COPY1:%[0-9]+]]:_(p2) = COPY $vgpr1
+ ; CHECK: [[ICMP:%[0-9]+]]:_(s1) = G_ICMP intpred(ne), [[COPY]](p2), [[COPY1]]
+ ; CHECK: [[SEXT:%[0-9]+]]:_(s32) = G_SEXT [[ICMP]](s1)
+ ; CHECK: $vgpr0 = COPY [[SEXT]](s32)
+ %0:_(p2) = COPY $vgpr0
+ %1:_(p2) = COPY $vgpr1
+ %2:_(s1) = G_ICMP intpred(ne), %0, %1
+ %3:_(s32) = G_SEXT %2
+ $vgpr0 = COPY %3
+...
+
+---
+name: test_icmp_p3
+body: |
+ bb.0.entry:
+ liveins: $vgpr0, $vgpr1
+
+ ; CHECK-LABEL: name: test_icmp_p3
+ ; CHECK: [[COPY:%[0-9]+]]:_(p3) = COPY $vgpr0
+ ; CHECK: [[COPY1:%[0-9]+]]:_(p3) = COPY $vgpr1
+ ; CHECK: [[ICMP:%[0-9]+]]:_(s1) = G_ICMP intpred(ne), [[COPY]](p3), [[COPY1]]
+ ; CHECK: [[SEXT:%[0-9]+]]:_(s32) = G_SEXT [[ICMP]](s1)
+ ; CHECK: $vgpr0 = COPY [[SEXT]](s32)
+ %0:_(p3) = COPY $vgpr0
+ %1:_(p3) = COPY $vgpr1
+ %2:_(s1) = G_ICMP intpred(ne), %0, %1
+ %3:_(s32) = G_SEXT %2
+ $vgpr0 = COPY %3
+...
+
+---
+name: test_icmp_p4
+body: |
+ bb.0.entry:
+ liveins: $vgpr0_vgpr1, $vgpr2_vgpr3
+ ; CHECK-LABEL: name: test_icmp_p4
+ ; CHECK: [[COPY:%[0-9]+]]:_(p4) = COPY $vgpr0_vgpr1
+ ; CHECK: [[COPY1:%[0-9]+]]:_(p4) = COPY $vgpr0_vgpr1
+ ; CHECK: [[ICMP:%[0-9]+]]:_(s1) = G_ICMP intpred(ne), [[COPY]](p4), [[COPY1]]
+ ; CHECK: [[SEXT:%[0-9]+]]:_(s32) = G_SEXT [[ICMP]](s1)
+ ; CHECK: $vgpr0 = COPY [[SEXT]](s32)
+ %0:_(p4) = COPY $vgpr0_vgpr1
+ %1:_(p4) = COPY $vgpr0_vgpr1
+ %2:_(s1) = G_ICMP intpred(ne), %0, %1
+ %3:_(s32) = G_SEXT %2
+ $vgpr0 = COPY %3
+...
+
+---
+name: test_icmp_p5
+body: |
+ bb.0.entry:
+ liveins: $vgpr0, $vgpr1
+
+ ; CHECK-LABEL: name: test_icmp_p5
+ ; CHECK: [[COPY:%[0-9]+]]:_(p5) = COPY $vgpr0
+ ; CHECK: [[COPY1:%[0-9]+]]:_(p5) = COPY $vgpr1
+ ; CHECK: [[ICMP:%[0-9]+]]:_(s1) = G_ICMP intpred(ne), [[COPY]](p5), [[COPY1]]
+ ; CHECK: [[SEXT:%[0-9]+]]:_(s32) = G_SEXT [[ICMP]](s1)
+ ; CHECK: $vgpr0 = COPY [[SEXT]](s32)
+ %0:_(p5) = COPY $vgpr0
+ %1:_(p5) = COPY $vgpr1
+ %2:_(s1) = G_ICMP intpred(ne), %0, %1
+ %3:_(s32) = G_SEXT %2
+ $vgpr0 = COPY %3
+...
+
+---
+name: test_icmp_p999
+body: |
+ bb.0.entry:
+ liveins: $vgpr0_vgpr1, $vgpr2_vgpr3
+ ; CHECK-LABEL: name: test_icmp_p999
+ ; CHECK: [[COPY:%[0-9]+]]:_(p999) = COPY $vgpr0_vgpr1
+ ; CHECK: [[COPY1:%[0-9]+]]:_(p999) = COPY $vgpr0_vgpr1
+ ; CHECK: [[ICMP:%[0-9]+]]:_(s1) = G_ICMP intpred(ne), [[COPY]](p999), [[COPY1]]
+ ; CHECK: [[SEXT:%[0-9]+]]:_(s32) = G_SEXT [[ICMP]](s1)
+ ; CHECK: $vgpr0 = COPY [[SEXT]](s32)
+ %0:_(p999) = COPY $vgpr0_vgpr1
+ %1:_(p999) = COPY $vgpr0_vgpr1
+ %2:_(s1) = G_ICMP intpred(ne), %0, %1
+ %3:_(s32) = G_SEXT %2
+ $vgpr0 = COPY %3
+...
+
+---
+name: test_icmp_v2p3
+body: |
+ bb.0.entry:
+ liveins: $vgpr0_vgpr1, $vgpr2_vgpr3
+ ; CHECK-LABEL: name: test_icmp_v2p3
+ ; CHECK: [[COPY:%[0-9]+]]:_(<2 x p3>) = COPY $vgpr0_vgpr1
+ ; CHECK: [[COPY1:%[0-9]+]]:_(<2 x p3>) = COPY $vgpr0_vgpr1
+ ; CHECK: [[UV:%[0-9]+]]:_(p3), [[UV1:%[0-9]+]]:_(p3) = G_UNMERGE_VALUES [[COPY]](<2 x p3>)
+ ; CHECK: [[UV2:%[0-9]+]]:_(p3), [[UV3:%[0-9]+]]:_(p3) = G_UNMERGE_VALUES [[COPY1]](<2 x p3>)
+ ; CHECK: [[ICMP:%[0-9]+]]:_(s1) = G_ICMP intpred(ne), [[UV]](p3), [[UV2]]
+ ; CHECK: [[ICMP1:%[0-9]+]]:_(s1) = G_ICMP intpred(ne), [[UV1]](p3), [[UV3]]
+ ; CHECK: [[SEXT:%[0-9]+]]:_(s32) = G_SEXT [[ICMP]](s1)
+ ; CHECK: [[SEXT1:%[0-9]+]]:_(s32) = G_SEXT [[ICMP1]](s1)
+ ; CHECK: [[BUILD_VECTOR:%[0-9]+]]:_(<2 x s32>) = G_BUILD_VECTOR [[SEXT]](s32), [[SEXT1]](s32)
+ ; CHECK: $vgpr0_vgpr1 = COPY [[BUILD_VECTOR]](<2 x s32>)
+ %0:_(<2 x p3>) = COPY $vgpr0_vgpr1
+ %1:_(<2 x p3>) = COPY $vgpr0_vgpr1
+ %2:_(<2 x s1>) = G_ICMP intpred(ne), %0, %1
+ %3:_(<2 x s32>) = G_SEXT %2
+ $vgpr0_vgpr1 = COPY %3
+...
+
+---
+name: test_icmp_v2p999
+body: |
+ bb.0.entry:
+ liveins: $vgpr0_vgpr1_vgpr2_vgpr3, $vgpr4_vgpr5_vgpr6_vgpr7
+ ; CHECK-LABEL: name: test_icmp_v2p999
+ ; CHECK: [[COPY:%[0-9]+]]:_(<2 x p999>) = COPY $vgpr0_vgpr1_vgpr2_vgpr3
+ ; CHECK: [[COPY1:%[0-9]+]]:_(<2 x p999>) = COPY $vgpr4_vgpr5_vgpr6_vgpr7
+ ; CHECK: [[UV:%[0-9]+]]:_(p999), [[UV1:%[0-9]+]]:_(p999) = G_UNMERGE_VALUES [[COPY]](<2 x p999>)
+ ; CHECK: [[UV2:%[0-9]+]]:_(p999), [[UV3:%[0-9]+]]:_(p999) = G_UNMERGE_VALUES [[COPY1]](<2 x p999>)
+ ; CHECK: [[ICMP:%[0-9]+]]:_(s1) = G_ICMP intpred(ne), [[UV]](p999), [[UV2]]
+ ; CHECK: [[ICMP1:%[0-9]+]]:_(s1) = G_ICMP intpred(ne), [[UV1]](p999), [[UV3]]
+ ; CHECK: [[SEXT:%[0-9]+]]:_(s32) = G_SEXT [[ICMP]](s1)
+ ; CHECK: [[SEXT1:%[0-9]+]]:_(s32) = G_SEXT [[ICMP1]](s1)
+ ; CHECK: [[BUILD_VECTOR:%[0-9]+]]:_(<2 x s32>) = G_BUILD_VECTOR [[SEXT]](s32), [[SEXT1]](s32)
+ ; CHECK: $vgpr0_vgpr1 = COPY [[BUILD_VECTOR]](<2 x s32>)
+ %0:_(<2 x p999>) = COPY $vgpr0_vgpr1_vgpr2_vgpr3
+ %1:_(<2 x p999>) = COPY $vgpr4_vgpr5_vgpr6_vgpr7
+ %2:_(<2 x s1>) = G_ICMP intpred(ne), %0, %1
+ %3:_(<2 x s32>) = G_SEXT %2
+ $vgpr0_vgpr1 = COPY %3
+...
More information about the llvm-commits
mailing list