[llvm-commits] [llvm] r104257 - in /llvm/trunk: lib/Target/ARM/ARMISelLowering.cpp test/CodeGen/ARM/2010-05-19-Shuffles.ll

Bob Wilson bob.wilson at apple.com
Thu May 20 11:39:53 PDT 2010


Author: bwilson
Date: Thu May 20 13:39:53 2010
New Revision: 104257

URL: http://llvm.org/viewvc/llvm-project?rev=104257&view=rev
Log:
Handle Neon v2f64 and v2i64 vector shuffles as register copies.
This fixes the remaining issue with pr7167.

Modified:
    llvm/trunk/lib/Target/ARM/ARMISelLowering.cpp
    llvm/trunk/test/CodeGen/ARM/2010-05-19-Shuffles.ll

Modified: llvm/trunk/lib/Target/ARM/ARMISelLowering.cpp
URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/lib/Target/ARM/ARMISelLowering.cpp?rev=104257&r1=104256&r2=104257&view=diff
==============================================================================
--- llvm/trunk/lib/Target/ARM/ARMISelLowering.cpp (original)
+++ llvm/trunk/lib/Target/ARM/ARMISelLowering.cpp Thu May 20 13:39:53 2010
@@ -3022,6 +3022,24 @@
       return GeneratePerfectShuffle(PFEntry, V1, V2, DAG, dl);
   }
 
+  // v2f64 and v2i64 shuffles are just register copies.
+  if (VT == MVT::v2f64 || VT == MVT::v2i64) {
+    // Do the expansion as f64 since i64 is not legal.
+    V1 = DAG.getNode(ISD::BIT_CONVERT, dl, MVT::v2f64, V1);
+    V2 = DAG.getNode(ISD::BIT_CONVERT, dl, MVT::v2f64, V2);
+    SDValue Val = DAG.getUNDEF(MVT::v2f64);
+    for (unsigned i = 0; i < 2; ++i) {
+      if (ShuffleMask[i] < 0)
+        continue;
+      SDValue Elt = DAG.getNode(ISD::EXTRACT_VECTOR_ELT, dl, MVT::f64,
+                                ShuffleMask[i] < 2 ? V1 : V2,
+                                DAG.getConstant(ShuffleMask[i] & 1, MVT::i32));
+      Val = DAG.getNode(ISD::INSERT_VECTOR_ELT, dl, MVT::v2f64, Val,
+                        Elt, DAG.getConstant(i, MVT::i32));
+    }
+    return DAG.getNode(ISD::BIT_CONVERT, dl, VT, Val);
+  }
+
   return SDValue();
 }
 

Modified: llvm/trunk/test/CodeGen/ARM/2010-05-19-Shuffles.ll
URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/test/CodeGen/ARM/2010-05-19-Shuffles.ll?rev=104257&r1=104256&r2=104257&view=diff
==============================================================================
--- llvm/trunk/test/CodeGen/ARM/2010-05-19-Shuffles.ll (original)
+++ llvm/trunk/test/CodeGen/ARM/2010-05-19-Shuffles.ll Thu May 20 13:39:53 2010
@@ -12,3 +12,10 @@
        <8 x i32> <i32 1, i32 2, i32 0, i32 5, i32 3, i32 6, i32 7, i32 4>
   ret <8 x i8> %y
 }
+
+define void @f3(<4 x i64>* %xp) nounwind {
+  %x = load <4 x i64>* %xp
+  %y = shufflevector <4 x i64> %x, <4 x i64> undef, <4 x i32> <i32 0, i32 3, i32 2, i32 1>
+  store <4 x i64> %y, <4 x i64>* %xp
+  ret void
+}





More information about the llvm-commits mailing list