[llvm] e699c03 - AMDGPU/GlobalISel: Fix import of s_abs_i32 pattern
Matt Arsenault via llvm-commits
llvm-commits at lists.llvm.org
Tue Jan 7 07:41:38 PST 2020
Author: Matt Arsenault
Date: 2020-01-07T10:32:07-05:00
New Revision: e699c03c9be4839f03dcc3a7fa86a44594e80dcf
URL: https://github.com/llvm/llvm-project/commit/e699c03c9be4839f03dcc3a7fa86a44594e80dcf
DIFF: https://github.com/llvm/llvm-project/commit/e699c03c9be4839f03dcc3a7fa86a44594e80dcf.diff
LOG: AMDGPU/GlobalISel: Fix import of s_abs_i32 pattern
Added:
llvm/test/CodeGen/AMDGPU/GlobalISel/inst-select-abs.mir
Modified:
llvm/lib/Target/AMDGPU/SOPInstructions.td
Removed:
################################################################################
diff --git a/llvm/lib/Target/AMDGPU/SOPInstructions.td b/llvm/lib/Target/AMDGPU/SOPInstructions.td
index a89416d2f373..73ba2ae367f7 100644
--- a/llvm/lib/Target/AMDGPU/SOPInstructions.td
+++ b/llvm/lib/Target/AMDGPU/SOPInstructions.td
@@ -1213,7 +1213,7 @@ def : GCNPat <
def : GCNPat <
(i32 (smax i32:$x, (i32 (ineg i32:$x)))),
- (S_ABS_I32 $x)
+ (S_ABS_I32 SReg_32:$x)
>;
def : GCNPat <
diff --git a/llvm/test/CodeGen/AMDGPU/GlobalISel/inst-select-abs.mir b/llvm/test/CodeGen/AMDGPU/GlobalISel/inst-select-abs.mir
new file mode 100644
index 000000000000..a9e1124d1026
--- /dev/null
+++ b/llvm/test/CodeGen/AMDGPU/GlobalISel/inst-select-abs.mir
@@ -0,0 +1,105 @@
+# NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py
+# RUN: llc -march=amdgcn -mcpu=tahiti -run-pass=instruction-select -verify-machineinstrs %s -o - | FileCheck -check-prefix=GFX6 %s
+# RUN: llc -march=amdgcn -mcpu=gfx900 -run-pass=instruction-select -verify-machineinstrs %s -o - | FileCheck -check-prefix=GFX9 %s
+
+---
+name: smax_neg_abs_pattern_s32_ss
+legalized: true
+regBankSelected: true
+tracksRegLiveness: true
+
+body: |
+ bb.0:
+ liveins: $sgpr0
+
+ ; GFX6-LABEL: name: smax_neg_abs_pattern_s32_ss
+ ; GFX6: liveins: $sgpr0
+ ; GFX6: %src0:sreg_32 = COPY $sgpr0
+ ; GFX6: %smax:sreg_32 = S_ABS_I32 %src0, implicit-def $scc
+ ; GFX6: S_ENDPGM 0, implicit %smax
+ ; GFX9-LABEL: name: smax_neg_abs_pattern_s32_ss
+ ; GFX9: liveins: $sgpr0
+ ; GFX9: %src0:sreg_32 = COPY $sgpr0
+ ; GFX9: %smax:sreg_32 = S_ABS_I32 %src0, implicit-def $scc
+ ; GFX9: S_ENDPGM 0, implicit %smax
+ %src0:sgpr(s32) = COPY $sgpr0
+ %zero:sgpr(s32) = G_CONSTANT i32 0
+ %ineg:sgpr(s32) = G_SUB %zero, %src0
+ %smax:sgpr(s32) = G_SMAX %src0, %ineg
+ S_ENDPGM 0, implicit %smax
+...
+
+---
+name: smax_neg_abs_pattern_s32_ss_commute
+legalized: true
+regBankSelected: true
+tracksRegLiveness: true
+
+body: |
+ bb.0:
+ liveins: $sgpr0
+
+ ; GFX6-LABEL: name: smax_neg_abs_pattern_s32_ss_commute
+ ; GFX6: liveins: $sgpr0
+ ; GFX6: %src0:sreg_32 = COPY $sgpr0
+ ; GFX6: %smax:sreg_32 = S_ABS_I32 %src0, implicit-def $scc
+ ; GFX6: S_ENDPGM 0, implicit %smax
+ ; GFX9-LABEL: name: smax_neg_abs_pattern_s32_ss_commute
+ ; GFX9: liveins: $sgpr0
+ ; GFX9: %src0:sreg_32 = COPY $sgpr0
+ ; GFX9: %smax:sreg_32 = S_ABS_I32 %src0, implicit-def $scc
+ ; GFX9: S_ENDPGM 0, implicit %smax
+ %src0:sgpr(s32) = COPY $sgpr0
+ %zero:sgpr(s32) = G_CONSTANT i32 0
+ %ineg:sgpr(s32) = G_SUB %zero, %src0
+ %smax:sgpr(s32) = G_SMAX %ineg, %src0
+ S_ENDPGM 0, implicit %smax
+...
+
+---
+name: smax_neg_abs_pattern_s32_vv
+legalized: true
+regBankSelected: true
+tracksRegLiveness: true
+
+body: |
+ bb.0:
+ liveins: $vgpr0
+
+ ; GFX6-LABEL: name: smax_neg_abs_pattern_s32_vv
+ ; GFX6: liveins: $vgpr0
+ ; GFX6: %src0:vgpr_32 = COPY $vgpr0
+ ; GFX6: %zero:vgpr_32 = V_MOV_B32_e32 0, implicit $exec
+ ; GFX6: %ineg:vgpr_32, dead %4:sreg_64_xexec = V_SUB_I32_e64 %zero, %src0, 0, implicit $exec
+ ; GFX6: %smax:vgpr_32 = V_MAX_I32_e64 %src0, %ineg, implicit $exec
+ ; GFX6: S_ENDPGM 0, implicit %smax
+ ; GFX9-LABEL: name: smax_neg_abs_pattern_s32_vv
+ ; GFX9: liveins: $vgpr0
+ ; GFX9: %src0:vgpr_32 = COPY $vgpr0
+ ; GFX9: %zero:vgpr_32 = V_MOV_B32_e32 0, implicit $exec
+ ; GFX9: %ineg:vgpr_32 = V_SUB_U32_e64 %zero, %src0, 0, implicit $exec
+ ; GFX9: %smax:vgpr_32 = V_MAX_I32_e64 %src0, %ineg, implicit $exec
+ ; GFX9: S_ENDPGM 0, implicit %smax
+ %src0:vgpr(s32) = COPY $vgpr0
+ %zero:vgpr(s32) = G_CONSTANT i32 0
+ %ineg:vgpr(s32) = G_SUB %zero, %src0
+ %smax:vgpr(s32) = G_SMAX %src0, %ineg
+ S_ENDPGM 0, implicit %smax
+...
+
+# FIXME: Violates constant bus restriction
+# ---
+# name: smax_neg_abs_pattern_s32_vs
+# legalized: true
+# regBankSelected: true
+
+# body: |
+# bb.0:
+# liveins: $sgpr0
+
+# %src0:sgpr(s32) = COPY $sgpr0
+# %zero:sgpr(s32) = G_CONSTANT i32 0
+# %ineg:sgpr(s32) = G_SUB %zero, %src0
+# %smax:vgpr(s32) = G_SMAX %src0, %ineg
+# S_ENDPGM 0, implicit %smax
+# ...
More information about the llvm-commits
mailing list