[llvm-commits] CVS: llvm/lib/Target/X86/X86ISelLowering.cpp X86ISelLowering.h X86InstrSSE.td
Evan Cheng
evan.cheng at apple.com
Thu Mar 23 17:18:42 PST 2006
Changes in directory llvm/lib/Target/X86:
X86ISelLowering.cpp updated: 1.124 -> 1.125
X86ISelLowering.h updated: 1.38 -> 1.39
X86InstrSSE.td updated: 1.21 -> 1.22
---
Log message:
Handle more shuffle cases with SHUFP* instructions.
---
Diffs of the changes: (+77 -44)
X86ISelLowering.cpp | 80 ++++++++++++++++++++++++++++++++++------------------
X86ISelLowering.h | 8 ++---
X86InstrSSE.td | 33 +++++++++++++--------
3 files changed, 77 insertions(+), 44 deletions(-)
Index: llvm/lib/Target/X86/X86ISelLowering.cpp
diff -u llvm/lib/Target/X86/X86ISelLowering.cpp:1.124 llvm/lib/Target/X86/X86ISelLowering.cpp:1.125
--- llvm/lib/Target/X86/X86ISelLowering.cpp:1.124 Thu Mar 23 14:26:04 2006
+++ llvm/lib/Target/X86/X86ISelLowering.cpp Thu Mar 23 19:18:28 2006
@@ -1383,12 +1383,42 @@
return false;
// Check if the value doesn't reference the second vector.
+ for (unsigned i = 1, e = N->getNumOperands(); i != e; ++i) {
+ assert(isa<ConstantSDNode>(N->getOperand(i)) &&
+ "Invalid VECTOR_SHUFFLE mask!");
+ if (cast<ConstantSDNode>(N->getOperand(i))->getValue() >= 4) return false;
+ }
+
+ return true;
+}
+
+/// isSHUFPMask - Return true if the specified VECTOR_SHUFFLE operand
+/// specifies a shuffle of elements that is suitable for input to SHUFP*.
+bool X86::isSHUFPMask(SDNode *N) {
+ assert(N->getOpcode() == ISD::BUILD_VECTOR);
+
+ unsigned NumOperands = N->getNumOperands();
+ if (NumOperands != 2 && NumOperands != 4)
+ return false;
+
+ // Each half must refer to only one of the vector.
SDOperand Elt = N->getOperand(0);
assert(isa<ConstantSDNode>(Elt) && "Invalid VECTOR_SHUFFLE mask!");
- for (unsigned i = 0, e = N->getNumOperands(); i != e; ++i) {
+ for (unsigned i = 1; i != NumOperands / 2; ++i) {
assert(isa<ConstantSDNode>(N->getOperand(i)) &&
"Invalid VECTOR_SHUFFLE mask!");
- if (cast<ConstantSDNode>(N->getOperand(i))->getValue() >= 4) return false;
+ if (cast<ConstantSDNode>(N->getOperand(i))->getValue() !=
+ cast<ConstantSDNode>(Elt)->getValue())
+ return false;
+ }
+ Elt = N->getOperand(NumOperands / 2);
+ assert(isa<ConstantSDNode>(Elt) && "Invalid VECTOR_SHUFFLE mask!");
+ for (unsigned i = NumOperands / 2; i != NumOperands; ++i) {
+ assert(isa<ConstantSDNode>(N->getOperand(i)) &&
+ "Invalid VECTOR_SHUFFLE mask!");
+ if (cast<ConstantSDNode>(N->getOperand(i))->getValue() !=
+ cast<ConstantSDNode>(Elt)->getValue())
+ return false;
}
return true;
@@ -1426,30 +1456,10 @@
unsigned Mask = 0;
unsigned i = NumOperands - 1;
do {
- Mask |= cast<ConstantSDNode>(N->getOperand(i))->getValue();
- Mask <<= Shift;
- --i;
- } while (i != 0);
-
- return Mask;
-}
-
-/// getShufflePSHUFDImmediate - Return the appropriate immediate to shuffle
-/// the specified isShuffleMask VECTOR_SHUFFLE mask with PSHUFD instruction.
-unsigned X86::getShufflePSHUFDImmediate(SDNode *N) {
- unsigned NumOperands = N->getNumOperands();
- unsigned Mask = 0;
-
- assert(NumOperands == 4 && "Expect v4f32 / v4i32 vector operand");
-
- unsigned i = NumOperands - 1;
- do {
- uint64_t Val = cast<ConstantSDNode>(N->getOperand(i))->getValue();
- // Second vector operand must be undef. We can have it point to anything
- // we want.
- if (Val >= NumOperands) Val = 0;
+ unsigned Val = cast<ConstantSDNode>(N->getOperand(i))->getValue();
+ if (Val >= NumOperands) Val -= NumOperands;
Mask |= Val;
- Mask <<= 2;
+ Mask <<= Shift;
--i;
} while (i != 0);
@@ -2246,7 +2256,7 @@
return DAG.getNode(ISD::VECTOR_SHUFFLE, VT, V1,
DAG.getNode(ISD::UNDEF, V1.getValueType()),
PermMask);
- } else if (Subtarget->hasSSE2() && X86::isPSHUFDMask(PermMask.Val)) {
+ } else if (X86::isPSHUFDMask(PermMask.Val)) {
if (V2.getOpcode() == ISD::UNDEF)
// Leave the VECTOR_SHUFFLE alone. It matches PSHUFD.
return SDOperand();
@@ -2255,6 +2265,21 @@
return DAG.getNode(ISD::VECTOR_SHUFFLE, VT, V1,
DAG.getNode(ISD::UNDEF, V1.getValueType()),
PermMask);
+ } else if (X86::isSHUFPMask(PermMask.Val)) {
+ unsigned NumElems = PermMask.getNumOperands();
+ SDOperand Elt = PermMask.getOperand(0);
+ if (cast<ConstantSDNode>(Elt)->getValue() >= NumElems) {
+ // Swap the operands and change mask.
+ std::vector<SDOperand> MaskVec;
+ for (unsigned i = NumElems / 2; i != NumElems; ++i)
+ MaskVec.push_back(PermMask.getOperand(i));
+ for (unsigned i = 0; i != NumElems / 2; ++i)
+ MaskVec.push_back(PermMask.getOperand(i));
+ PermMask =
+ DAG.getNode(ISD::BUILD_VECTOR, PermMask.getValueType(), MaskVec);
+ return DAG.getNode(ISD::VECTOR_SHUFFLE, VT, V2, V1, PermMask);
+ }
+ return SDOperand();
}
// TODO.
@@ -2382,5 +2407,6 @@
// Only do shuffles on 128-bit vector types for now.
if (MVT::getSizeInBits(VT) == 64) return false;
return (X86::isSplatMask(Mask.Val) ||
- (Subtarget->hasSSE2() && X86::isPSHUFDMask(Mask.Val)));
+ X86::isPSHUFDMask(Mask.Val) ||
+ X86::isSHUFPMask(Mask.Val));
}
Index: llvm/lib/Target/X86/X86ISelLowering.h
diff -u llvm/lib/Target/X86/X86ISelLowering.h:1.38 llvm/lib/Target/X86/X86ISelLowering.h:1.39
--- llvm/lib/Target/X86/X86ISelLowering.h:1.38 Wed Mar 22 16:07:06 2006
+++ llvm/lib/Target/X86/X86ISelLowering.h Thu Mar 23 19:18:28 2006
@@ -183,6 +183,10 @@
/// specifies a shuffle of elements that is suitable for input to PSHUFD.
bool isPSHUFDMask(SDNode *N);
+ /// isSHUFPMask - Return true if the specified VECTOR_SHUFFLE operand
+ /// specifies a shuffle of elements that is suitable for input to SHUFP*.
+ bool isSHUFPMask(SDNode *N);
+
/// isSplatMask - Return true if the specified VECTOR_SHUFFLE operand
/// specifies a splat of a single element.
bool isSplatMask(SDNode *N);
@@ -191,10 +195,6 @@
/// the specified isShuffleMask VECTOR_SHUFFLE mask with PSHUF* and SHUFP*
/// instructions.
unsigned getShuffleSHUFImmediate(SDNode *N);
-
- /// getShufflePSHUFDImmediate - Return the appropriate immediate to shuffle
- /// the specified isShuffleMask VECTOR_SHUFFLE mask with PSHUFD instruction.
- unsigned getShufflePSHUFDImmediate(SDNode *N);
}
//===----------------------------------------------------------------------===//
Index: llvm/lib/Target/X86/X86InstrSSE.td
diff -u llvm/lib/Target/X86/X86InstrSSE.td:1.21 llvm/lib/Target/X86/X86InstrSSE.td:1.22
--- llvm/lib/Target/X86/X86InstrSSE.td:1.21 Thu Mar 23 01:44:07 2006
+++ llvm/lib/Target/X86/X86InstrSSE.td Thu Mar 23 19:18:28 2006
@@ -51,10 +51,6 @@
return getI8Imm(X86::getShuffleSHUFImmediate(N));
}]>;
-def SHUFFLE_get_pshufd_imm : SDNodeXForm<build_vector, [{
- return getI8Imm(X86::getShufflePSHUFDImmediate(N));
-}]>;
-
def SHUFP_splat_mask : PatLeaf<(build_vector), [{
return X86::isSplatMask(N);
}], SHUFFLE_get_shuf_imm>;
@@ -66,8 +62,11 @@
// Only use PSHUF if it is not a splat.
def PSHUFD_shuffle_mask : PatLeaf<(build_vector), [{
return !X86::isSplatMask(N) && X86::isPSHUFDMask(N);
-}], SHUFFLE_get_pshufd_imm>;
+}], SHUFFLE_get_shuf_imm>;
+def SHUFP_shuffle_mask : PatLeaf<(build_vector), [{
+ return X86::isSHUFPMask(N);
+}], SHUFFLE_get_shuf_imm>;
//===----------------------------------------------------------------------===//
// SSE scalar FP Instructions
@@ -442,10 +441,12 @@
def MOVHPDmr : PDI<0x17, MRMDestMem, (ops f64mem:$dst, VR128:$src),
"movhpd {$src, $dst|$dst, $src}", []>;
-def MOVLHPSrr : PSI<0x16, MRMSrcReg, (ops VR128:$dst, VR128:$src),
- "movlhps {$src, $dst|$dst, $src}", []>;
-def MOVHLPSrr : PSI<0x12, MRMSrcReg, (ops VR128:$dst, VR128:$src),
- "movlhps {$src, $dst|$dst, $src}", []>;
+let isTwoAddress = 1 in {
+def MOVLHPSrr : PSI<0x16, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
+ "movlhps {$src2, $dst|$dst, $src2}", []>;
+def MOVHLPSrr : PSI<0x12, MRMSrcReg, (ops VR128:$dst, VR128:$src1, VR128:$src2),
+ "movlhps {$src2, $dst|$dst, $src2}", []>;
+}
def MOVMSKPSrr : PSI<0x50, MRMSrcReg, (ops R32:$dst, VR128:$src),
"movmskps {$src, $dst|$dst, $src}", []>;
@@ -711,13 +712,19 @@
let isTwoAddress = 1 in {
def SHUFPSrr : PSIi8<0xC6, MRMSrcReg,
(ops VR128:$dst, VR128:$src1, VR128:$src2, i8imm:$src3),
- "shufps {$src3, $src2, $dst|$dst, $src2, $src3}", []>;
+ "shufps {$src3, $src2, $dst|$dst, $src2, $src3}",
+ [(set VR128:$dst, (vector_shuffle
+ (v4f32 VR128:$src1), (v4f32 VR128:$src2),
+ SHUFP_shuffle_mask:$src3))]>;
def SHUFPSrm : PSIi8<0xC6, MRMSrcMem,
(ops VR128:$dst, VR128:$src1, f128mem:$src2, i8imm:$src3),
"shufps {$src3, $src2, $dst|$dst, $src2, $src3}", []>;
def SHUFPDrr : PDIi8<0xC6, MRMSrcReg,
(ops VR128:$dst, VR128:$src1, VR128:$src2, i8imm:$src3),
- "shufpd {$src3, $src2, $dst|$dst, $src2, $src3}", []>;
+ "shufpd {$src3, $src2, $dst|$dst, $src2, $src3}",
+ [(set VR128:$dst, (vector_shuffle
+ (v2f64 VR128:$src1), (v2f64 VR128:$src2),
+ SHUFP_shuffle_mask:$src3))]>;
def SHUFPDrm : PDIi8<0xC6, MRMSrcMem,
(ops VR128:$dst, VR128:$src1, f128mem:$src2, i8imm:$src3),
"shufpd {$src3, $src2, $dst|$dst, $src2, $src3}", []>;
@@ -873,9 +880,9 @@
// Splat v2f64 / v2i64
def : Pat<(vector_shuffle (v2f64 VR128:$src), (undef), MOVLHPS_splat_mask:$sm),
- (v2f64 (MOVLHPSrr VR128:$src))>, Requires<[HasSSE1]>;
+ (v2f64 (MOVLHPSrr VR128:$src, VR128:$src))>, Requires<[HasSSE1]>;
def : Pat<(vector_shuffle (v2i64 VR128:$src), (undef), MOVLHPS_splat_mask:$sm),
- (v2i64 (MOVLHPSrr VR128:$src))>, Requires<[HasSSE1]>;
+ (v2i64 (MOVLHPSrr VR128:$src, VR128:$src))>, Requires<[HasSSE1]>;
// Shuffle v4f32 / v4i32, undef. These should only match if splat cases do not.
def : Pat<(vector_shuffle (v4f32 VR128:$src), (undef), PSHUFD_shuffle_mask:$sm),
More information about the llvm-commits
mailing list