[PATCH] D18247: [DAGCombine] Catch the case where extract_vector_elt can cause an any_ext while processing AND SDNodes
silviu.baranga@arm.com via llvm-commits
llvm-commits at lists.llvm.org
Mon Mar 21 04:48:50 PDT 2016
This revision was automatically updated to reflect the committed changes.
Closed by commit rL263935: [DAGCombine] Catch the case where extract_vector_elt can cause an any_ext… (authored by sbaranga).
Changed prior to commit:
http://reviews.llvm.org/D18247?vs=50950&id=51148#toc
Repository:
rL LLVM
http://reviews.llvm.org/D18247
Files:
llvm/trunk/lib/CodeGen/SelectionDAG/DAGCombiner.cpp
llvm/trunk/test/CodeGen/ARM/dagcombine-anyexttozeroext.ll
Index: llvm/trunk/lib/CodeGen/SelectionDAG/DAGCombiner.cpp
===================================================================
--- llvm/trunk/lib/CodeGen/SelectionDAG/DAGCombiner.cpp
+++ llvm/trunk/lib/CodeGen/SelectionDAG/DAGCombiner.cpp
@@ -3089,6 +3089,7 @@
// the 'X' node here can either be nothing or an extract_vector_elt to catch
// more cases.
if ((N0.getOpcode() == ISD::EXTRACT_VECTOR_ELT &&
+ N0.getValueSizeInBits() == N0.getOperand(0).getScalarValueSizeInBits() &&
N0.getOperand(0).getOpcode() == ISD::LOAD) ||
N0.getOpcode() == ISD::LOAD) {
LoadSDNode *Load = cast<LoadSDNode>( (N0.getOpcode() == ISD::LOAD) ?
Index: llvm/trunk/test/CodeGen/ARM/dagcombine-anyexttozeroext.ll
===================================================================
--- llvm/trunk/test/CodeGen/ARM/dagcombine-anyexttozeroext.ll
+++ llvm/trunk/test/CodeGen/ARM/dagcombine-anyexttozeroext.ll
@@ -19,12 +19,48 @@
ret float %7
}
+; CHECK-LABEL: g:
define float @g(<4 x i16>* nocapture %in) {
; CHECK: vldr
%1 = load <4 x i16>, <4 x i16>* %in
- ; CHECK-NOT: uxth
+
+ ; For now we're generating a vmov.16 and a uxth instruction.
+ ; The uxth is redundant, and we should be able to extend without
+ ; having to generate cross-domain copies. Once we can do this
+ ; we should modify the checks below.
+
+ ; CHECK: uxth
%2 = extractelement <4 x i16> %1, i32 0
; CHECK: vcvt.f32.u32
%3 = uitofp i16 %2 to float
ret float %3
}
+
+; The backend generates for the following code an
+; (and 0xff (i32 extract_vector_elt (zext load <4 x i8> to 4 x i16)))
+;
+; The and is not redundant and cannot be removed. Since
+; extract_vector_elt is doing an implicit any_ext, the and
+; is required to guarantee that the top bits are set to zero.
+
+; Ideally should be a zext from <4 x i8> to <4 x 32>.
+
+; CHECK-LABEL: h:
+; CHECK: vld1.32
+; CHECK: uxtb
+define <4 x i32> @h(<4 x i8> *%in) {
+ %1 = load <4 x i8>, <4 x i8>* %in, align 4
+ %2 = extractelement <4 x i8> %1, i32 0
+ %3 = zext i8 %2 to i32
+ %4 = insertelement <4 x i32> undef, i32 %3, i32 0
+ %5 = extractelement <4 x i8> %1, i32 1
+ %6 = zext i8 %5 to i32
+ %7 = insertelement <4 x i32> %4, i32 %6, i32 1
+ %8 = extractelement <4 x i8> %1, i32 2
+ %9 = zext i8 %8 to i32
+ %10 = insertelement <4 x i32> %7, i32 %9, i32 2
+ %11 = extractelement <4 x i8> %1, i32 3
+ %12 = zext i8 %11 to i32
+ %13 = insertelement <4 x i32> %10, i32 %12, i32 3
+ ret <4 x i32> %13
+}
-------------- next part --------------
A non-text attachment was scrubbed...
Name: D18247.51148.patch
Type: text/x-patch
Size: 2483 bytes
Desc: not available
URL: <http://lists.llvm.org/pipermail/llvm-commits/attachments/20160321/7fb7ac7a/attachment.bin>
More information about the llvm-commits
mailing list