[llvm] 6b7838b - [AIX] Allow safe for 32bit P8 VSX pattern matching

Zarko Todorovski via llvm-commits llvm-commits at lists.llvm.org
Wed Apr 14 05:12:57 PDT 2021


Author: Zarko Todorovski
Date: 2021-04-14T08:12:48-04:00
New Revision: 6b7838b68cc49621f3c92d8603f95e801d10f759

URL: https://github.com/llvm/llvm-project/commit/6b7838b68cc49621f3c92d8603f95e801d10f759
DIFF: https://github.com/llvm/llvm-project/commit/6b7838b68cc49621f3c92d8603f95e801d10f759.diff

LOG: [AIX] Allow safe for 32bit P8 VSX pattern matching

Pull some of the safe for 32bit pattern matching for Pwr8 and above.

Reviewed By: nemanjai

Differential Revision: https://reviews.llvm.org/D97909

Added: 
    llvm/test/CodeGen/PowerPC/aix32-p8-scalar_vector_conversions.ll

Modified: 
    llvm/lib/Target/PowerPC/PPCInstrVSX.td
    llvm/test/CodeGen/PowerPC/cannonicalize-vector-shifts.ll
    llvm/test/CodeGen/PowerPC/p8-scalar_vector_conversions.ll

Removed: 
    


################################################################################
diff  --git a/llvm/lib/Target/PowerPC/PPCInstrVSX.td b/llvm/lib/Target/PowerPC/PPCInstrVSX.td
index 82b5e9af0c12..471ab32f8778 100644
--- a/llvm/lib/Target/PowerPC/PPCInstrVSX.td
+++ b/llvm/lib/Target/PowerPC/PPCInstrVSX.td
@@ -2187,6 +2187,11 @@ def VectorExtractions {
   dag BE_VFLOAT_PERMUTE = (VPERM $S, $S, BE_VFLOAT_PERM_VEC);
   dag BE_VARIABLE_FLOAT = (XSCVSPDPN BE_VFLOAT_PERMUTE);
 
+  //  BE variable float 32-bit version
+  dag BE_32B_VFLOAT_PERM_VEC = (v16i8 (LVSL (i32 ZERO), (RLWINM $Idx, 2, 0, 29)));
+  dag BE_32B_VFLOAT_PERMUTE = (VPERM $S, $S, BE_32B_VFLOAT_PERM_VEC);
+  dag BE_32B_VARIABLE_FLOAT = (XSCVSPDPN BE_32B_VFLOAT_PERMUTE);
+
   /* BE variable double
       Same as the BE doubleword except there is no move.
   */
@@ -2194,6 +2199,14 @@ def VectorExtractions {
                                          (v16i8 (COPY_TO_REGCLASS $S, VRRC)),
                                          BE_VDWORD_PERM_VEC));
   dag BE_VARIABLE_DOUBLE = (COPY_TO_REGCLASS BE_VDOUBLE_PERMUTE, VSRC);
+
+  //  BE variable double 32-bit version
+  dag BE_32B_VDWORD_PERM_VEC = (v16i8 (LVSL (i32 ZERO),
+                                        (RLWINM (ANDI_rec $Idx, 1), 3, 0, 28)));
+  dag BE_32B_VDOUBLE_PERMUTE = (v16i8 (VPERM (v16i8 (COPY_TO_REGCLASS $S, VRRC)),
+                                      (v16i8 (COPY_TO_REGCLASS $S, VRRC)),
+                                      BE_32B_VDWORD_PERM_VEC));
+  dag BE_32B_VARIABLE_DOUBLE = (COPY_TO_REGCLASS BE_32B_VDOUBLE_PERMUTE, VSRC);
 }
 
 def AlignValues {
@@ -2426,6 +2439,7 @@ def MrgWords {
 // [HasVSX, HasOnlySwappingMemOps]
 // [HasVSX, HasOnlySwappingMemOps, IsBigEndian]
 // [HasVSX, HasP8Vector]
+// [HasVSX, HasP8Vector, IsBigEndian]
 // [HasVSX, HasP8Vector, IsBigEndian, IsPPC64]
 // [HasVSX, HasP8Vector, IsLittleEndian]
 // [HasVSX, HasP8Vector, NoP9Vector, IsBigEndian, IsPPC64]
@@ -3147,8 +3161,8 @@ def : Pat<(v16i8 (bitconvert (v16i8 immAllOnesV))),
           (v16i8 (COPY_TO_REGCLASS(XXLEQVOnes), VSRC))>;
 } // HasVSX, HasP8Vector
 
-// Big endian Power8 VSX subtarget.
-let Predicates = [HasVSX, HasP8Vector, IsBigEndian, IsPPC64] in {
+// Any big endian Power8 VSX subtarget.
+let Predicates = [HasVSX, HasP8Vector, IsBigEndian] in {
 def : Pat<DWToSPExtractConv.El0SS1,
           (f32 (XSCVSXDSP (COPY_TO_REGCLASS $S1, VSFRC)))>;
 def : Pat<DWToSPExtractConv.El1SS1,
@@ -3169,8 +3183,6 @@ def : Pat<(f32 (vector_extract v4f32:$S, 2)),
           (f32 (XSCVSPDPN (XXPERMDI $S, $S, 2)))>;
 def : Pat<(f32 (vector_extract v4f32:$S, 3)),
           (f32 (XSCVSPDPN (XXSLDWI $S, $S, 3)))>;
-def : Pat<(f32 (vector_extract v4f32:$S, i64:$Idx)),
-          (f32 VectorExtractions.BE_VARIABLE_FLOAT)>;
 
 def : Pat<(f32 (PPCfcfids (f64 (PPCmtvsra (i32 (extractelt v4i32:$A, 0)))))),
           (f32 (XSCVSPDPN (XVCVSXWSP (XXSPLTW $A, 0))))>;
@@ -3189,6 +3201,18 @@ def : Pat<(f64 (PPCfcfid (f64 (PPCmtvsra (i32 (extractelt v4i32:$A, 2)))))),
 def : Pat<(f64 (PPCfcfid (f64 (PPCmtvsra (i32 (extractelt v4i32:$A, 3)))))),
           (f64 (COPY_TO_REGCLASS (XVCVSXWDP (XXSPLTW $A, 3)), VSFRC))>;
 
+def : Pat<(f32 (vector_extract v4f32:$S, i32:$Idx)),
+          (f32 VectorExtractions.BE_32B_VARIABLE_FLOAT)>;
+
+def : Pat<(f64 (vector_extract v2f64:$S, i32:$Idx)),
+          (f64 VectorExtractions.BE_32B_VARIABLE_DOUBLE)>;
+} // HasVSX, HasP8Vector, IsBigEndian
+
+// Big endian Power8 64Bit VSX subtarget.
+let Predicates = [HasVSX, HasP8Vector, IsBigEndian, IsPPC64] in {
+def : Pat<(f32 (vector_extract v4f32:$S, i64:$Idx)),
+          (f32 VectorExtractions.BE_VARIABLE_FLOAT)>;
+
 // LIWAX - This instruction is used for sign extending i32 -> i64.
 // LIWZX - This instruction will be emitted for i32, f32, and when
 //         zero-extending i32 to i64 (zext i32 -> i64).

diff  --git a/llvm/test/CodeGen/PowerPC/aix32-p8-scalar_vector_conversions.ll b/llvm/test/CodeGen/PowerPC/aix32-p8-scalar_vector_conversions.ll
new file mode 100644
index 000000000000..921c3be960f6
--- /dev/null
+++ b/llvm/test/CodeGen/PowerPC/aix32-p8-scalar_vector_conversions.ll
@@ -0,0 +1,1125 @@
+; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
+; RUN: llc < %s -mtriple=powerpc-ibm-aix-xcoff -verify-machineinstrs \
+; RUN:          -mcpu=pwr8 -vec-extabi | FileCheck %s
+
+; The build[csilf] functions simply test the scalar_to_vector handling with
+; direct moves. This corresponds to the "insertelement" instruction. Subsequent
+; to this, there will be a splat corresponding to the shufflevector.
+
+ at d = common global double 0.000000e+00, align 8
+
+; Function Attrs: norecurse nounwind readnone
+define <16 x i8> @buildc(i8 zeroext %a) {
+; CHECK-LABEL: buildc:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 4, 1, -16
+; CHECK-NEXT:    stb 3, -16(1)
+; CHECK-NEXT:    lxvw4x 34, 0, 4
+; CHECK-NEXT:    vspltb 2, 2, 0
+; CHECK-NEXT:    blr
+entry:
+  %splat.splatinsert = insertelement <16 x i8> undef, i8 %a, i32 0
+  %splat.splat = shufflevector <16 x i8> %splat.splatinsert, <16 x i8> undef, <16 x i32> zeroinitializer
+  ret <16 x i8> %splat.splat
+}
+
+; Function Attrs: norecurse nounwind readnone
+define <8 x i16> @builds(i16 zeroext %a) {
+; CHECK-LABEL: builds:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 4, 1, -16
+; CHECK-NEXT:    sth 3, -16(1)
+; CHECK-NEXT:    lxvw4x 34, 0, 4
+; CHECK-NEXT:    vsplth 2, 2, 0
+; CHECK-NEXT:    blr
+entry:
+  %splat.splatinsert = insertelement <8 x i16> undef, i16 %a, i32 0
+  %splat.splat = shufflevector <8 x i16> %splat.splatinsert, <8 x i16> undef, <8 x i32> zeroinitializer
+  ret <8 x i16> %splat.splat
+}
+
+; Function Attrs: norecurse nounwind readnone
+define <4 x i32> @buildi(i32 zeroext %a) {
+; CHECK-LABEL: buildi:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 4, 1, -16
+; CHECK-NEXT:    stw 3, -16(1)
+; CHECK-NEXT:    lxvw4x 0, 0, 4
+; CHECK-NEXT:    xxspltw 34, 0, 0
+; CHECK-NEXT:    blr
+entry:
+  %splat.splatinsert = insertelement <4 x i32> undef, i32 %a, i32 0
+  %splat.splat = shufflevector <4 x i32> %splat.splatinsert, <4 x i32> undef, <4 x i32> zeroinitializer
+  ret <4 x i32> %splat.splat
+}
+
+; Function Attrs: norecurse nounwind readnone
+define <2 x i64> @buildl(i64 %a) {
+; CHECK-LABEL: buildl:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    stw 4, -16(1)
+; CHECK-NEXT:    stw 3, -32(1)
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    addi 4, 1, -32
+; CHECK-NEXT:    lxvw4x 34, 0, 3
+; CHECK-NEXT:    lxvw4x 35, 0, 4
+; CHECK-NEXT:    vmrghw 2, 3, 2
+; CHECK-NEXT:    xxswapd 0, 34
+; CHECK-NEXT:    xxsldwi 34, 0, 34, 2
+; CHECK-NEXT:    blr
+entry:
+  %splat.splatinsert = insertelement <2 x i64> undef, i64 %a, i32 0
+  %splat.splat = shufflevector <2 x i64> %splat.splatinsert, <2 x i64> undef, <2 x i32> zeroinitializer
+  ret <2 x i64> %splat.splat
+}
+
+; Function Attrs: norecurse nounwind readnone
+define <4 x float> @buildf(float %a) {
+; CHECK-LABEL: buildf:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    xscvdpspn 0, 1
+; CHECK-NEXT:    xxspltw 34, 0, 0
+; CHECK-NEXT:    blr
+entry:
+  %splat.splatinsert = insertelement <4 x float> undef, float %a, i32 0
+  %splat.splat = shufflevector <4 x float> %splat.splatinsert, <4 x float> undef, <4 x i32> zeroinitializer
+  ret <4 x float> %splat.splat
+}
+
+; The optimization to remove stack operations from PPCDAGToDAGISel::Select
+; should still trigger for v2f64, producing an lxvdsx.
+; Function Attrs: norecurse nounwind readonly
+define <2 x double> @buildd() {
+; CHECK-LABEL: buildd:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    lwz 3, L..C0(2)
+; CHECK-NEXT:    lxvdsx 34, 0, 3
+; CHECK-NEXT:    blr
+entry:
+  %0 = load double, double* @d, align 8
+  %splat.splatinsert = insertelement <2 x double> undef, double %0, i32 0
+  %splat.splat = shufflevector <2 x double> %splat.splatinsert, <2 x double> undef, <2 x i32> zeroinitializer
+  ret <2 x double> %splat.splat
+}
+
+; Function Attrs: norecurse nounwind readnone
+define signext i8 @getsc0(<16 x i8> %vsc) {
+; CHECK-LABEL: getsc0:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lbz 3, -16(1)
+; CHECK-NEXT:    extsb 3, 3
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <16 x i8> %vsc, i32 0
+  ret i8 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define signext i8 @getsc1(<16 x i8> %vsc) {
+; CHECK-LABEL: getsc1:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lbz 3, -15(1)
+; CHECK-NEXT:    extsb 3, 3
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <16 x i8> %vsc, i32 1
+  ret i8 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define signext i8 @getsc2(<16 x i8> %vsc) {
+; CHECK-LABEL: getsc2:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lbz 3, -14(1)
+; CHECK-NEXT:    extsb 3, 3
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <16 x i8> %vsc, i32 2
+  ret i8 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define signext i8 @getsc3(<16 x i8> %vsc) {
+; CHECK-LABEL: getsc3:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lbz 3, -13(1)
+; CHECK-NEXT:    extsb 3, 3
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <16 x i8> %vsc, i32 3
+  ret i8 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define signext i8 @getsc4(<16 x i8> %vsc) {
+; CHECK-LABEL: getsc4:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lbz 3, -12(1)
+; CHECK-NEXT:    extsb 3, 3
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <16 x i8> %vsc, i32 4
+  ret i8 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define signext i8 @getsc5(<16 x i8> %vsc) {
+; CHECK-LABEL: getsc5:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lbz 3, -11(1)
+; CHECK-NEXT:    extsb 3, 3
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <16 x i8> %vsc, i32 5
+  ret i8 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define signext i8 @getsc6(<16 x i8> %vsc) {
+; CHECK-LABEL: getsc6:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lbz 3, -10(1)
+; CHECK-NEXT:    extsb 3, 3
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <16 x i8> %vsc, i32 6
+  ret i8 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define signext i8 @getsc7(<16 x i8> %vsc) {
+; CHECK-LABEL: getsc7:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lbz 3, -9(1)
+; CHECK-NEXT:    extsb 3, 3
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <16 x i8> %vsc, i32 7
+  ret i8 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define signext i8 @getsc8(<16 x i8> %vsc) {
+; CHECK-LABEL: getsc8:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lbz 3, -8(1)
+; CHECK-NEXT:    extsb 3, 3
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <16 x i8> %vsc, i32 8
+  ret i8 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define signext i8 @getsc9(<16 x i8> %vsc) {
+; CHECK-LABEL: getsc9:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lbz 3, -7(1)
+; CHECK-NEXT:    extsb 3, 3
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <16 x i8> %vsc, i32 9
+  ret i8 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define signext i8 @getsc10(<16 x i8> %vsc) {
+; CHECK-LABEL: getsc10:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lbz 3, -6(1)
+; CHECK-NEXT:    extsb 3, 3
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <16 x i8> %vsc, i32 10
+  ret i8 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define signext i8 @getsc11(<16 x i8> %vsc) {
+; CHECK-LABEL: getsc11:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lbz 3, -5(1)
+; CHECK-NEXT:    extsb 3, 3
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <16 x i8> %vsc, i32 11
+  ret i8 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define signext i8 @getsc12(<16 x i8> %vsc) {
+; CHECK-LABEL: getsc12:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lbz 3, -4(1)
+; CHECK-NEXT:    extsb 3, 3
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <16 x i8> %vsc, i32 12
+  ret i8 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define signext i8 @getsc13(<16 x i8> %vsc) {
+; CHECK-LABEL: getsc13:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lbz 3, -3(1)
+; CHECK-NEXT:    extsb 3, 3
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <16 x i8> %vsc, i32 13
+  ret i8 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define signext i8 @getsc14(<16 x i8> %vsc) {
+; CHECK-LABEL: getsc14:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lbz 3, -2(1)
+; CHECK-NEXT:    extsb 3, 3
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <16 x i8> %vsc, i32 14
+  ret i8 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define signext i8 @getsc15(<16 x i8> %vsc) {
+; CHECK-LABEL: getsc15:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lbz 3, -1(1)
+; CHECK-NEXT:    extsb 3, 3
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <16 x i8> %vsc, i32 15
+  ret i8 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define zeroext i8 @getuc0(<16 x i8> %vuc) {
+; CHECK-LABEL: getuc0:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lbz 3, -16(1)
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <16 x i8> %vuc, i32 0
+  ret i8 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define zeroext i8 @getuc1(<16 x i8> %vuc) {
+; CHECK-LABEL: getuc1:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lbz 3, -15(1)
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <16 x i8> %vuc, i32 1
+  ret i8 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define zeroext i8 @getuc2(<16 x i8> %vuc) {
+; CHECK-LABEL: getuc2:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lbz 3, -14(1)
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <16 x i8> %vuc, i32 2
+  ret i8 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define zeroext i8 @getuc3(<16 x i8> %vuc) {
+; CHECK-LABEL: getuc3:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lbz 3, -13(1)
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <16 x i8> %vuc, i32 3
+  ret i8 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define zeroext i8 @getuc4(<16 x i8> %vuc) {
+; CHECK-LABEL: getuc4:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lbz 3, -12(1)
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <16 x i8> %vuc, i32 4
+  ret i8 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define zeroext i8 @getuc5(<16 x i8> %vuc) {
+; CHECK-LABEL: getuc5:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lbz 3, -11(1)
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <16 x i8> %vuc, i32 5
+  ret i8 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define zeroext i8 @getuc6(<16 x i8> %vuc) {
+; CHECK-LABEL: getuc6:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lbz 3, -10(1)
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <16 x i8> %vuc, i32 6
+  ret i8 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define zeroext i8 @getuc7(<16 x i8> %vuc) {
+; CHECK-LABEL: getuc7:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lbz 3, -9(1)
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <16 x i8> %vuc, i32 7
+  ret i8 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define zeroext i8 @getuc8(<16 x i8> %vuc) {
+; CHECK-LABEL: getuc8:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lbz 3, -8(1)
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <16 x i8> %vuc, i32 8
+  ret i8 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define zeroext i8 @getuc9(<16 x i8> %vuc) {
+; CHECK-LABEL: getuc9:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lbz 3, -7(1)
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <16 x i8> %vuc, i32 9
+  ret i8 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define zeroext i8 @getuc10(<16 x i8> %vuc) {
+; CHECK-LABEL: getuc10:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lbz 3, -6(1)
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <16 x i8> %vuc, i32 10
+  ret i8 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define zeroext i8 @getuc11(<16 x i8> %vuc) {
+; CHECK-LABEL: getuc11:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lbz 3, -5(1)
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <16 x i8> %vuc, i32 11
+  ret i8 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define zeroext i8 @getuc12(<16 x i8> %vuc) {
+;
+; CHECK-LABEL: getuc12:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lbz 3, -4(1)
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <16 x i8> %vuc, i32 12
+  ret i8 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define zeroext i8 @getuc13(<16 x i8> %vuc) {
+; CHECK-LABEL: getuc13:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lbz 3, -3(1)
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <16 x i8> %vuc, i32 13
+  ret i8 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define zeroext i8 @getuc14(<16 x i8> %vuc) {
+; CHECK-LABEL: getuc14:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lbz 3, -2(1)
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <16 x i8> %vuc, i32 14
+  ret i8 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define zeroext i8 @getuc15(<16 x i8> %vuc) {
+; CHECK-LABEL: getuc15:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lbz 3, -1(1)
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <16 x i8> %vuc, i32 15
+  ret i8 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define signext i8 @getvelsc(<16 x i8> %vsc, i32 signext %i) {
+; CHECK-LABEL: getvelsc:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 4, 1, -16
+; CHECK-NEXT:    clrlwi 3, 3, 28
+; CHECK-NEXT:    stxvw4x 34, 0, 4
+; CHECK-NEXT:    lbzx 3, 4, 3
+; CHECK-NEXT:    extsb 3, 3
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <16 x i8> %vsc, i32 %i
+  ret i8 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define zeroext i8 @getveluc(<16 x i8> %vuc, i32 signext %i) {
+; CHECK-LABEL: getveluc:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 4, 1, -16
+; CHECK-NEXT:    clrlwi 3, 3, 28
+; CHECK-NEXT:    stxvw4x 34, 0, 4
+; CHECK-NEXT:    lbzx 3, 4, 3
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <16 x i8> %vuc, i32 %i
+  ret i8 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define signext i16 @getss0(<8 x i16> %vss) {
+; CHECK-LABEL: getss0:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lha 3, -16(1)
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <8 x i16> %vss, i32 0
+  ret i16 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define signext i16 @getss1(<8 x i16> %vss) {
+; CHECK-LABEL: getss1:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lha 3, -14(1)
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <8 x i16> %vss, i32 1
+  ret i16 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define signext i16 @getss2(<8 x i16> %vss) {
+; CHECK-LABEL: getss2:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lha 3, -12(1)
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <8 x i16> %vss, i32 2
+  ret i16 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define signext i16 @getss3(<8 x i16> %vss) {
+; CHECK-LABEL: getss3:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lha 3, -10(1)
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <8 x i16> %vss, i32 3
+  ret i16 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define signext i16 @getss4(<8 x i16> %vss) {
+; CHECK-LABEL: getss4:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lha 3, -8(1)
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <8 x i16> %vss, i32 4
+  ret i16 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define signext i16 @getss5(<8 x i16> %vss) {
+; CHECK-LABEL: getss5:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lha 3, -6(1)
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <8 x i16> %vss, i32 5
+  ret i16 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define signext i16 @getss6(<8 x i16> %vss) {
+; CHECK-LABEL: getss6:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lha 3, -4(1)
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <8 x i16> %vss, i32 6
+  ret i16 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define signext i16 @getss7(<8 x i16> %vss) {
+; CHECK-LABEL: getss7:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lha 3, -2(1)
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <8 x i16> %vss, i32 7
+  ret i16 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define zeroext i16 @getus0(<8 x i16> %vus) {
+; CHECK-LABEL: getus0:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lhz 3, -16(1)
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <8 x i16> %vus, i32 0
+  ret i16 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define zeroext i16 @getus1(<8 x i16> %vus) {
+; CHECK-LABEL: getus1:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lhz 3, -14(1)
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <8 x i16> %vus, i32 1
+  ret i16 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define zeroext i16 @getus2(<8 x i16> %vus) {
+; CHECK-LABEL: getus2:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lhz 3, -12(1)
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <8 x i16> %vus, i32 2
+  ret i16 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define zeroext i16 @getus3(<8 x i16> %vus) {
+; CHECK-LABEL: getus3:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lhz 3, -10(1)
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <8 x i16> %vus, i32 3
+  ret i16 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define zeroext i16 @getus4(<8 x i16> %vus) {
+; CHECK-LABEL: getus4:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lhz 3, -8(1)
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <8 x i16> %vus, i32 4
+  ret i16 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define zeroext i16 @getus5(<8 x i16> %vus) {
+; CHECK-LABEL: getus5:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lhz 3, -6(1)
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <8 x i16> %vus, i32 5
+  ret i16 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define zeroext i16 @getus6(<8 x i16> %vus) {
+; CHECK-LABEL: getus6:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lhz 3, -4(1)
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <8 x i16> %vus, i32 6
+  ret i16 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define zeroext i16 @getus7(<8 x i16> %vus) {
+; CHECK-LABEL: getus7:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lhz 3, -2(1)
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <8 x i16> %vus, i32 7
+  ret i16 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define signext i16 @getvelss(<8 x i16> %vss, i32 signext %i) {
+; CHECK-LABEL: getvelss:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 4, 1, -16
+; CHECK-NEXT:    rlwinm 3, 3, 1, 28, 30
+; CHECK-NEXT:    stxvw4x 34, 0, 4
+; CHECK-NEXT:    lhax 3, 4, 3
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <8 x i16> %vss, i32 %i
+  ret i16 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define zeroext i16 @getvelus(<8 x i16> %vus, i32 signext %i) {
+; CHECK-LABEL: getvelus:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 4, 1, -16
+; CHECK-NEXT:    rlwinm 3, 3, 1, 28, 30
+; CHECK-NEXT:    stxvw4x 34, 0, 4
+; CHECK-NEXT:    lhzx 3, 4, 3
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <8 x i16> %vus, i32 %i
+  ret i16 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define signext i32 @getsi0(<4 x i32> %vsi) {
+; CHECK-LABEL: getsi0:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lwz 3, -16(1)
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <4 x i32> %vsi, i32 0
+  ret i32 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define signext i32 @getsi1(<4 x i32> %vsi) {
+; CHECK-LABEL: getsi1:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lwz 3, -12(1)
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <4 x i32> %vsi, i32 1
+  ret i32 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define signext i32 @getsi2(<4 x i32> %vsi) {
+; CHECK-LABEL: getsi2:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lwz 3, -8(1)
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <4 x i32> %vsi, i32 2
+  ret i32 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define signext i32 @getsi3(<4 x i32> %vsi) {
+; CHECK-LABEL: getsi3:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lwz 3, -4(1)
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <4 x i32> %vsi, i32 3
+  ret i32 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define zeroext i32 @getui0(<4 x i32> %vui) {
+; CHECK-LABEL: getui0:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lwz 3, -16(1)
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <4 x i32> %vui, i32 0
+  ret i32 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define zeroext i32 @getui1(<4 x i32> %vui) {
+; CHECK-LABEL: getui1:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lwz 3, -12(1)
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <4 x i32> %vui, i32 1
+  ret i32 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define zeroext i32 @getui2(<4 x i32> %vui) {
+; CHECK-LABEL: getui2:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lwz 3, -8(1)
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <4 x i32> %vui, i32 2
+  ret i32 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define zeroext i32 @getui3(<4 x i32> %vui) {
+; CHECK-LABEL: getui3:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lwz 3, -4(1)
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <4 x i32> %vui, i32 3
+  ret i32 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define signext i32 @getvelsi(<4 x i32> %vsi, i32 signext %i) {
+; CHECK-LABEL: getvelsi:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 4, 1, -16
+; CHECK-NEXT:    rlwinm 3, 3, 2, 28, 29
+; CHECK-NEXT:    stxvw4x 34, 0, 4
+; CHECK-NEXT:    lwzx 3, 4, 3
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <4 x i32> %vsi, i32 %i
+  ret i32 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define zeroext i32 @getvelui(<4 x i32> %vui, i32 signext %i) {
+; CHECK-LABEL: getvelui:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 4, 1, -16
+; CHECK-NEXT:    rlwinm 3, 3, 2, 28, 29
+; CHECK-NEXT:    stxvw4x 34, 0, 4
+; CHECK-NEXT:    lwzx 3, 4, 3
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <4 x i32> %vui, i32 %i
+  ret i32 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define i64 @getsl0(<2 x i64> %vsl) {
+; CHECK-LABEL: getsl0:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lwz 3, -16(1)
+; CHECK-NEXT:    lwz 4, -12(1)
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <2 x i64> %vsl, i32 0
+  ret i64 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define i64 @getsl1(<2 x i64> %vsl) {
+; CHECK-LABEL: getsl1:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lwz 3, -8(1)
+; CHECK-NEXT:    lwz 4, -4(1)
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <2 x i64> %vsl, i32 1
+  ret i64 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define i64 @getul0(<2 x i64> %vul) {
+; CHECK-LABEL: getul0:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lwz 3, -16(1)
+; CHECK-NEXT:    lwz 4, -12(1)
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <2 x i64> %vul, i32 0
+  ret i64 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define i64 @getul1(<2 x i64> %vul) {
+; CHECK-LABEL: getul1:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addi 3, 1, -16
+; CHECK-NEXT:    stxvw4x 34, 0, 3
+; CHECK-NEXT:    lwz 3, -8(1)
+; CHECK-NEXT:    lwz 4, -4(1)
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <2 x i64> %vul, i32 1
+  ret i64 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define i64 @getvelsl(<2 x i64> %vsl, i32 signext %i) {
+; CHECK-LABEL: getvelsl:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    add 3, 3, 3
+; CHECK-NEXT:    addi 4, 1, -16
+; CHECK-NEXT:    addi 5, 3, 1
+; CHECK-NEXT:    stxvw4x 34, 0, 4
+; CHECK-NEXT:    rlwinm 3, 3, 2, 28, 29
+; CHECK-NEXT:    rlwinm 5, 5, 2, 28, 29
+; CHECK-NEXT:    lwzx 3, 4, 3
+; CHECK-NEXT:    lwzx 4, 4, 5
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <2 x i64> %vsl, i32 %i
+  ret i64 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define i64 @getvelul(<2 x i64> %vul, i32 signext %i) {
+; CHECK-LABEL: getvelul:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    add 3, 3, 3
+; CHECK-NEXT:    addi 4, 1, -16
+; CHECK-NEXT:    addi 5, 3, 1
+; CHECK-NEXT:    stxvw4x 34, 0, 4
+; CHECK-NEXT:    rlwinm 3, 3, 2, 28, 29
+; CHECK-NEXT:    rlwinm 5, 5, 2, 28, 29
+; CHECK-NEXT:    lwzx 3, 4, 3
+; CHECK-NEXT:    lwzx 4, 4, 5
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <2 x i64> %vul, i32 %i
+  ret i64 %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define float @getf0(<4 x float> %vf) {
+; CHECK-LABEL: getf0:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    xscvspdpn 1, 34
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <4 x float> %vf, i32 0
+  ret float %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define float @getf1(<4 x float> %vf) {
+; CHECK-LABEL: getf1:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    xxsldwi 0, 34, 34, 1
+; CHECK-NEXT:    xscvspdpn 1, 0
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <4 x float> %vf, i32 1
+  ret float %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define float @getf2(<4 x float> %vf) {
+; CHECK-LABEL: getf2:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    xxswapd 0, 34
+; CHECK-NEXT:    xscvspdpn 1, 0
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <4 x float> %vf, i32 2
+  ret float %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define float @getf3(<4 x float> %vf) {
+; CHECK-LABEL: getf3:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    xxsldwi 0, 34, 34, 3
+; CHECK-NEXT:    xscvspdpn 1, 0
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <4 x float> %vf, i32 3
+  ret float %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define float @getvelf(<4 x float> %vf, i32 signext %i) {
+; CHECK-LABEL: getvelf:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    slwi 3, 3, 2
+; CHECK-NEXT:    lvsl 3, 0, 3
+; CHECK-NEXT:    vperm 2, 2, 2, 3
+; CHECK-NEXT:    xscvspdpn 1, 34
+; CHECK-NEXT:    blr
+entry:
+   %vecext = extractelement <4 x float> %vf, i32 %i
+   ret float %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define double @getd0(<2 x double> %vd) {
+; CHECK-LABEL: getd0:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    xxlor 1, 34, 34
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <2 x double> %vd, i32 0
+  ret double %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define double @getd1(<2 x double> %vd) {
+; CHECK-LABEL: getd1:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    xxswapd 1, 34
+; CHECK-NEXT:    # kill: def $f1 killed $f1 killed $vsl1
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <2 x double> %vd, i32 1
+  ret double %vecext
+}
+
+; Function Attrs: norecurse nounwind readnone
+define double @getveld(<2 x double> %vd, i32 signext %i) {
+; CHECK-LABEL: getveld:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    andi. 3, 3, 1
+; CHECK-NEXT:    slwi 3, 3, 3
+; CHECK-NEXT:    lvsl 3, 0, 3
+; CHECK-NEXT:    vperm 2, 2, 2, 3
+; CHECK-NEXT:    xxlor 1, 34, 34
+; CHECK-NEXT:    # kill: def $f1 killed $f1 killed $vsl1
+; CHECK-NEXT:    blr
+entry:
+  %vecext = extractelement <2 x double> %vd, i32 %i
+  ret double %vecext
+}

diff  --git a/llvm/test/CodeGen/PowerPC/cannonicalize-vector-shifts.ll b/llvm/test/CodeGen/PowerPC/cannonicalize-vector-shifts.ll
index 68d4530e81ec..b0fbc16e1b81 100644
--- a/llvm/test/CodeGen/PowerPC/cannonicalize-vector-shifts.ll
+++ b/llvm/test/CodeGen/PowerPC/cannonicalize-vector-shifts.ll
@@ -2,6 +2,12 @@
 ; RUN:   -verify-machineinstrs < %s | FileCheck %s
 ; RUN: llc -mcpu=pwr8 -mtriple=powerpc64-unknown-linux-gnu \
 ; RUN:   -verify-machineinstrs < %s | FileCheck %s
+
+; RUN: llc -mcpu=pwr8 -vec-extabi -mtriple=powerpc64-ibm-aix-xcoff \
+; RUN:   -verify-machineinstrs < %s | FileCheck %s
+; RUN: llc -mcpu=pwr8 -vec-extabi -mtriple=powerpc-ibm-aix-xcoff \
+; RUN:   -verify-machineinstrs < %s | FileCheck %s
+
 define <4 x i32> @test1(<4 x i32> %a) {
 entry:
 ; CHECK-LABEL: test1

diff  --git a/llvm/test/CodeGen/PowerPC/p8-scalar_vector_conversions.ll b/llvm/test/CodeGen/PowerPC/p8-scalar_vector_conversions.ll
index dffa0fb98fc0..1fe63271add4 100644
--- a/llvm/test/CodeGen/PowerPC/p8-scalar_vector_conversions.ll
+++ b/llvm/test/CodeGen/PowerPC/p8-scalar_vector_conversions.ll
@@ -4,6 +4,9 @@
 ; RUN: llc < %s -ppc-vsr-nums-as-vr -mtriple=powerpc64le-unknown-linux-gnu \
 ; RUN:       -verify-machineinstrs -ppc-asm-full-reg-names -mcpu=pwr8 -relocation-model=pic \
 ; RUN:       | FileCheck %s -check-prefix=CHECK-LE
+; RUN: llc < %s -vec-extabi -mtriple=powerpc64-ibm-aix-xcoff \
+; RUN:       -verify-machineinstrs -mcpu=pwr8 \
+; RUN:       | FileCheck %s -check-prefix=CHECK-AIX
 
 ; The build[csilf] functions simply test the scalar_to_vector handling with
 ; direct moves. This corresponds to the "insertelement" instruction. Subsequent
@@ -20,9 +23,14 @@ entry:
 ; CHECK-LABEL: buildc
 ; CHECK: sldi r3, r3, 56
 ; CHECK: mtvsrd v2, r3
+
 ; CHECK-LE-LABEL: buildc
 ; CHECK-LE: mtvsrd v2, r3
 ; CHECK-LE: vspltb v2, v2, 7
+
+; CHECK-AIX-LABEL: buildc:
+; CHECK-AIX: mtvsrd 34, 3
+; CHECK-AIX: vspltb 2, 2, 0
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -34,9 +42,14 @@ entry:
 ; CHECK-LABEL: builds
 ; CHECK: sldi r3, r3, 48
 ; CHECK: mtvsrd v2, r3
+
 ; CHECK-LE-LABEL: builds
 ; CHECK-LE: mtvsrd v2, r3
 ; CHECK-LE: vsplth v2, v2, 3
+
+; CHECK-AIX-LABEL: builds:
+; CHECK-AIX: mtvsrd 34, 3
+; CHECK-AIX: vsplth 2, 2, 0
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -48,9 +61,14 @@ entry:
 ; CHECK-LABEL: buildi
 ; CHECK: mtfprwz f0, r3
 ; CHECK: xxspltw v2, vs0, 1
+
 ; CHECK-LE-LABEL: buildi
 ; CHECK-LE: mtfprwz f0, r3
 ; CHECK-LE: xxspltw v2, vs0, 1
+
+; CHECK-AIX-LABEL: buildi:
+; CHECK-AIX: mtfprwz 0, 3
+; CHECK-AIX: xxspltw 34, 0, 1
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -61,9 +79,14 @@ entry:
   ret <2 x i64> %splat.splat
 ; CHECK-LABEL: buildl
 ; CHECK: mtfprd f0, r3
+
 ; CHECK-LE-LABEL: buildl
 ; CHECK-LE: mtfprd f0, r3
 ; CHECK-LE: xxspltd v2, vs0, 0
+
+; CHECK-AIX-LABEL: buildl:
+; CHECK-AIX: mtfprd 0, 3
+; CHECK-AIX: xxmrghd 34, 0, 0
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -75,9 +98,14 @@ entry:
 ; CHECK-LABEL: buildf
 ; CHECK: xscvdpspn vs0, f1
 ; CHECK: xxspltw v2, vs0, 0
+
 ; CHECK-LE-LABEL: buildf
 ; CHECK-LE: xscvdpspn vs0, f1
 ; CHECK-LE: xxspltw v2, vs0, 0
+
+; CHECK-AIX-LABEL: buildf:
+; CHECK-AIX: xscvdpspn 0, 1
+; CHECK-AIX: xxspltw 34, 0, 0
 }
 
 ; The optimization to remove stack operations from PPCDAGToDAGISel::Select
@@ -92,9 +120,14 @@ entry:
 ; CHECK-LABEL: buildd
 ; CHECK: ld r3, .LC0 at toc@l(r3)
 ; CHECK: lxvdsx v2, 0, r3
+
 ; CHECK-LE-LABEL: buildd
 ; CHECK-LE: ld r3, .LC0 at toc@l(r3)
 ; CHECK-LE: lxvdsx v2, 0, r3
+
+; CHECK-AIX-LABEL: buildd:
+; CHECK-AIX: ld 3, L..C0(2)
+; CHECK-AIX: lxvdsx 34, 0, 3
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -106,10 +139,16 @@ entry:
 ; CHECK: mfvsrd r3, v2
 ; CHECK: rldicl r3, r3, 8, 56
 ; CHECK: extsb r3, r3
+
 ; CHECK-LE-LABEL: @getsc0
 ; CHECK-LE: mffprd r3, f0
 ; CHECK-LE: clrldi r3, r3, 56
 ; CHECK-LE: extsb r3, r3
+
+; CHECK-AIX-LABEL: getsc0:
+; CHECK-AIX: mfvsrd 3, 34
+; CHECK-AIX: rldicl 3, 3, 8, 56
+; CHECK-AIX: extsb 3, 3
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -121,10 +160,16 @@ entry:
 ; CHECK: mfvsrd r3, v2
 ; CHECK: rldicl r3, r3, 16, 56
 ; CHECK: extsb r3, r3
+
 ; CHECK-LE-LABEL: @getsc1
 ; CHECK-LE: mffprd r3, f0
 ; CHECK-LE: rldicl r3, r3, 56, 56
 ; CHECK-LE: extsb r3, r3
+
+; CHECK-AIX-LABEL: getsc1:
+; CHECK-AIX: mfvsrd 3, 34
+; CHECK-AIX: rldicl 3, 3, 16, 56
+; CHECK-AIX: extsb 3, 3
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -136,10 +181,16 @@ entry:
 ; CHECK: mfvsrd r3, v2
 ; CHECK: rldicl r3, r3, 24, 56
 ; CHECK: extsb r3, r3
+
 ; CHECK-LE-LABEL: @getsc2
 ; CHECK-LE: mffprd r3, f0
 ; CHECK-LE: rldicl r3, r3, 48, 56
 ; CHECK-LE: extsb r3, r3
+
+; CHECK-AIX-LABEL: getsc2:
+; CHECK-AIX: mfvsrd 3, 34
+; CHECK-AIX: rldicl 3, 3, 24, 56
+; CHECK-AIX: extsb 3, 3
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -151,10 +202,16 @@ entry:
 ; CHECK: mfvsrd r3, v2
 ; CHECK: rldicl r3, r3, 32, 56
 ; CHECK: extsb r3, r3
+
 ; CHECK-LE-LABEL: @getsc3
 ; CHECK-LE: mffprd r3, f0
 ; CHECK-LE: rldicl r3, r3, 40, 56
 ; CHECK-LE: extsb r3, r3
+
+; CHECK-AIX-LABEL: getsc3:
+; CHECK-AIX: mfvsrd 3, 34
+; CHECK-AIX: rldicl 3, 3, 32, 56
+; CHECK-AIX: extsb 3, 3
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -166,10 +223,16 @@ entry:
 ; CHECK: mfvsrd r3, v2
 ; CHECK: rldicl r3, r3, 40, 56
 ; CHECK: extsb r3, r3
+
 ; CHECK-LE-LABEL: @getsc4
 ; CHECK-LE: mffprd r3, f0
 ; CHECK-LE: rldicl r3, r3, 32, 56
 ; CHECK-LE: extsb r3, r3
+
+; CHECK-AIX-LABEL: getsc4:
+; CHECK-AIX: mfvsrd 3, 34
+; CHECK-AIX: rldicl 3, 3, 40, 56
+; CHECK-AIX: extsb 3, 3
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -181,10 +244,16 @@ entry:
 ; CHECK: mfvsrd r3, v2
 ; CHECK: rldicl r3, r3, 48, 56
 ; CHECK: extsb r3, r3
+
 ; CHECK-LE-LABEL: @getsc5
 ; CHECK-LE: mffprd r3, f0
 ; CHECK-LE: rldicl r3, r3, 24, 56
 ; CHECK-LE: extsb r3, r3
+
+; CHECK-AIX-LABEL: getsc5:
+; CHECK-AIX: mfvsrd 3, 34
+; CHECK-AIX: rldicl 3, 3, 48, 56
+; CHECK-AIX: extsb 3, 3
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -196,10 +265,16 @@ entry:
 ; CHECK: mfvsrd r3, v2
 ; CHECK: rldicl r3, r3, 56, 56
 ; CHECK: extsb r3, r3
+
 ; CHECK-LE-LABEL: @getsc6
 ; CHECK-LE: mffprd r3, f0
 ; CHECK-LE: rldicl r3, r3, 16, 56
 ; CHECK-LE: extsb r3, r3
+
+; CHECK-AIX-LABEL: getsc6:
+; CHECK-AIX: mfvsrd 3, 34
+; CHECK-AIX: rldicl 3, 3, 56, 56
+; CHECK-AIX: extsb 3, 3
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -211,10 +286,16 @@ entry:
 ; CHECK: mfvsrd r3, v2
 ; CHECK: clrldi r3, r3, 56
 ; CHECK: extsb r3, r3
+
 ; CHECK-LE-LABEL: @getsc7
 ; CHECK-LE: mffprd r3, f0
 ; CHECK-LE: rldicl r3, r3, 8, 56
 ; CHECK-LE: extsb r3, r3
+
+; CHECK-AIX-LABEL: getsc7:
+; CHECK-AIX: mfvsrd 3, 34
+; CHECK-AIX: clrldi 3, 3, 56
+; CHECK-AIX: extsb 3, 3
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -226,10 +307,16 @@ entry:
 ; CHECK: mffprd r3, f0
 ; CHECK: rldicl r3, r3, 8, 56
 ; CHECK: extsb r3, r3
+
 ; CHECK-LE-LABEL: @getsc8
 ; CHECK-LE: mfvsrd r3, v2
 ; CHECK-LE: clrldi r3, r3, 56
 ; CHECK-LE: extsb r3, r3
+
+; CHECK-AIX-LABEL: getsc8:
+; CHECK-AIX: mffprd 3, 0
+; CHECK-AIX: rldicl 3, 3, 8, 56
+; CHECK-AIX: extsb 3, 3
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -241,10 +328,16 @@ entry:
 ; CHECK: mffprd r3, f0
 ; CHECK: rldicl r3, r3, 16, 56
 ; CHECK: extsb r3, r3
+
 ; CHECK-LE-LABEL: @getsc9
 ; CHECK-LE: mfvsrd r3, v2
 ; CHECK-LE: rldicl r3, r3, 56, 56
 ; CHECK-LE: extsb r3, r3
+
+; CHECK-AIX-LABEL: getsc9:
+; CHECK-AIX: mffprd 3, 0
+; CHECK-AIX: rldicl 3, 3, 16, 56
+; CHECK-AIX: extsb 3, 3
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -256,10 +349,16 @@ entry:
 ; CHECK: mffprd r3, f0
 ; CHECK: rldicl r3, r3, 24, 56
 ; CHECK: extsb r3, r3
+
 ; CHECK-LE-LABEL: @getsc10
 ; CHECK-LE: mfvsrd r3, v2
 ; CHECK-LE: rldicl r3, r3, 48, 56
 ; CHECK-LE: extsb r3, r3
+
+; CHECK-AIX-LABEL: getsc10:
+; CHECK-AIX: mffprd 3, 0
+; CHECK-AIX: rldicl 3, 3, 24, 56
+; CHECK-AIX: extsb 3, 3
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -271,10 +370,16 @@ entry:
 ; CHECK: mffprd r3, f0
 ; CHECK: rldicl r3, r3, 32, 56
 ; CHECK: extsb r3, r3
+
 ; CHECK-LE-LABEL: @getsc11
 ; CHECK-LE: mfvsrd r3, v2
 ; CHECK-LE: rldicl r3, r3, 40, 56
 ; CHECK-LE: extsb r3, r3
+
+; CHECK-AIX-LABEL: getsc11:
+; CHECK-AIX: mffprd 3, 0
+; CHECK-AIX: rldicl 3, 3, 32, 56
+; CHECK-AIX: extsb 3, 3
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -286,10 +391,16 @@ entry:
 ; CHECK: mffprd r3, f0
 ; CHECK: rldicl r3, r3, 40, 56
 ; CHECK: extsb r3, r3
+
 ; CHECK-LE-LABEL: @getsc12
 ; CHECK-LE: mfvsrd r3, v2
 ; CHECK-LE: rldicl r3, r3, 32, 56
 ; CHECK-LE: extsb r3, r3
+
+; CHECK-AIX-LABEL: getsc12:
+; CHECK-AIX: mffprd 3, 0
+; CHECK-AIX: rldicl 3, 3, 40, 56
+; CHECK-AIX: extsb 3, 3
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -301,10 +412,15 @@ entry:
 ; CHECK: mffprd r3, f0
 ; CHECK: rldicl r3, r3, 48, 56
 ; CHECK: extsb r3, r3
+
 ; CHECK-LE-LABEL: @getsc13
 ; CHECK-LE: mfvsrd r3, v2
 ; CHECK-LE: rldicl r3, r3, 24, 56
 ; CHECK-LE: extsb r3, r3
+
+; CHECK-AIX-LABEL: getsc13:
+; CHECK-AIX: mffprd 3, 0
+; CHECK-AIX: rldicl 3, 3, 48, 56
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -316,10 +432,16 @@ entry:
 ; CHECK: mffprd r3, f0
 ; CHECK: rldicl r3, r3, 56, 56
 ; CHECK: extsb r3, r3
+
 ; CHECK-LE-LABEL: @getsc14
 ; CHECK-LE: mfvsrd r3, v2
 ; CHECK-LE: rldicl r3, r3, 16, 56
 ; CHECK-LE: extsb r3, r3
+
+; CHECK-AIX-LABEL: getsc14:
+; CHECK-AIX: mffprd 3, 0
+; CHECK-AIX: rldicl 3, 3, 56, 56
+; CHECK-AIX: extsb 3, 3
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -331,10 +453,16 @@ entry:
 ; CHECK: mffprd r3, f0
 ; CHECK: clrldi  r3, r3, 56
 ; CHECK: extsb r3, r3
+
 ; CHECK-LE-LABEL: @getsc15
 ; CHECK-LE: mfvsrd r3, v2
 ; CHECK-LE: rldicl r3, r3, 8, 56
 ; CHECK-LE: extsb r3, r3
+
+; CHECK-AIX-LABEL: getsc15:
+; CHECK-AIX: mffprd 3, 0
+; CHECK-AIX: clrldi 3, 3, 56
+; CHECK-AIX: extsb 3, 3
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -345,9 +473,14 @@ entry:
 ; CHECK-LABEL: @getuc0
 ; CHECK: mfvsrd r3, v2
 ; CHECK: rldicl r3, r3, 8, 56
+
 ; CHECK-LE-LABEL: @getuc0
 ; CHECK-LE: mffprd r3, f0
 ; CHECK-LE: clrldi r3, r3, 56
+
+; CHECK-AIX-LABEL: getuc0:
+; CHECK-AIX: mfvsrd 3, 34
+; CHECK-AIX: rldicl 3, 3, 8, 56
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -358,9 +491,14 @@ entry:
 ; CHECK-LABEL: @getuc1
 ; CHECK: mfvsrd r3, v2
 ; CHECK: rldicl r3, r3, 16, 56
+
 ; CHECK-LE-LABEL: @getuc1
 ; CHECK-LE: mffprd r3, f0
 ; CHECK-LE: rldicl r3, r3, 56, 56
+
+; CHECK-AIX-LABEL: getuc1:
+; CHECK-AIX: mfvsrd 3, 34
+; CHECK-AIX: rldicl 3, 3, 16, 56
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -371,9 +509,15 @@ entry:
 ; CHECK-LABEL: @getuc2
 ; CHECK: mfvsrd r3, v2
 ; CHECK: rldicl r3, r3, 24, 56
+
 ; CHECK-LE-LABEL: @getuc2
 ; CHECK-LE: mffprd r3, f0
 ; CHECK-LE: rldicl r3, r3, 48, 56
+
+; CHECK-AIX-LABEL: getuc2:
+; CHECK-AIX mfvsrd 3, 34
+; CHECK-AIX rldicl 3, 3, 24, 56
+; CHECK-AIX clrldi 3, 3, 56
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -384,9 +528,14 @@ entry:
 ; CHECK-LABEL: @getuc3
 ; CHECK: mfvsrd r3, v2
 ; CHECK: rldicl r3, r3, 32, 56
+
 ; CHECK-LE-LABEL: @getuc3
 ; CHECK-LE: mffprd r3, f0
 ; CHECK-LE: rldicl r3, r3, 40, 56
+
+; CHECK-AIX-LABEL: getuc3:
+; CHECK-AIX: mfvsrd 3, 34
+; CHECK-AIX: rldicl 3, 3, 32, 56
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -397,9 +546,14 @@ entry:
 ; CHECK-LABEL: @getuc4
 ; CHECK: mfvsrd r3, v2
 ; CHECK: rldicl r3, r3, 40, 56
+
 ; CHECK-LE-LABEL: @getuc4
 ; CHECK-LE: mffprd r3, f0
 ; CHECK-LE: rldicl r3, r3, 32, 56
+
+; CHECK-AIX-LABEL: getuc4:
+; CHECK-AIX: mfvsrd 3, 34
+; CHECK-AIX: rldicl 3, 3, 40, 56
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -410,9 +564,14 @@ entry:
 ; CHECK-LABEL: @getuc5
 ; CHECK: mfvsrd r3, v2
 ; CHECK: rldicl r3, r3, 48, 56
+
 ; CHECK-LE-LABEL: @getuc5
 ; CHECK-LE: mffprd r3, f0
 ; CHECK-LE: rldicl r3, r3, 24, 56
+
+; CHECK-AIX-LABEL: getuc5:
+; CHECK-AIX: mfvsrd 3, 34
+; CHECK-AIX: rldicl 3, 3, 48, 56
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -423,9 +582,14 @@ entry:
 ; CHECK-LABEL: @getuc6
 ; CHECK: mfvsrd r3, v2
 ; CHECK: rldicl r3, r3, 56, 56
+
 ; CHECK-LE-LABEL: @getuc6
 ; CHECK-LE: mffprd r3, f0
 ; CHECK-LE: rldicl r3, r3, 16, 56
+
+; CHECK-AIX-LABEL: getuc6:
+; CHECK-AIX: mfvsrd 3, 34
+; CHECK-AIX: rldicl 3, 3, 56, 56
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -436,9 +600,14 @@ entry:
 ; CHECK-LABEL: @getuc7
 ; CHECK: mfvsrd r3, v2
 ; CHECK: clrldi   r3, r3, 56
+
 ; CHECK-LE-LABEL: @getuc7
 ; CHECK-LE: mffprd r3, f0
 ; CHECK-LE: rldicl r3, r3, 8, 56
+
+; CHECK-AIX-LABEL: getuc7:
+; CHECK-AIX: mfvsrd 3, 34
+; CHECK-AIX: clrldi 3, 3, 56
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -449,9 +618,14 @@ entry:
 ; CHECK-LABEL: @getuc8
 ; CHECK: mffprd r3, f0
 ; CHECK: rldicl r3, r3, 8, 56
+
 ; CHECK-LE-LABEL: @getuc8
 ; CHECK-LE: mfvsrd r3, v2
 ; CHECK-LE: clrldi r3, r3, 56
+
+; CHECK-AIX-LABEL: getuc8:
+; CHECK-AIX: mffprd 3, 0
+; CHECK-AIX: rldicl 3, 3, 8, 56
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -462,9 +636,14 @@ entry:
 ; CHECK-LABEL: @getuc9
 ; CHECK: mffprd r3, f0
 ; CHECK: rldicl r3, r3, 16, 56
+
 ; CHECK-LE-LABEL: @getuc9
 ; CHECK-LE: mfvsrd r3, v2
 ; CHECK-LE: rldicl r3, r3, 56, 56
+
+; CHECK-AIX-LABEL: getuc9:
+; CHECK-AIX: mffprd 3, 0
+; CHECK-AIX: rldicl 3, 3, 16, 56
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -475,9 +654,14 @@ entry:
 ; CHECK-LABEL: @getuc10
 ; CHECK: mffprd r3, f0
 ; CHECK: rldicl r3, r3, 24, 56
+
 ; CHECK-LE-LABEL: @getuc10
 ; CHECK-LE: mfvsrd r3, v2
 ; CHECK-LE: rldicl r3, r3, 48, 56
+
+; CHECK-AIX-LABEL: getuc10:
+; CHECK-AIX: mffprd 3, 0
+; CHECK-AIX: rldicl 3, 3, 24, 56
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -488,9 +672,14 @@ entry:
 ; CHECK-LABEL: @getuc11
 ; CHECK: mffprd r3, f0
 ; CHECK: rldicl r3, r3, 32, 56
+
 ; CHECK-LE-LABEL: @getuc11
 ; CHECK-LE: mfvsrd r3, v2
 ; CHECK-LE: rldicl r3, r3, 40, 56
+
+; CHECK-AIX-LABEL: getuc11:
+; CHECK-AIX: mffprd 3, 0
+; CHECK-AIX: rldicl 3, 3, 32, 56
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -501,9 +690,14 @@ entry:
 ; CHECK-LABEL: @getuc12
 ; CHECK: mffprd r3, f0
 ; CHECK: rldicl r3, r3, 40, 56
+
 ; CHECK-LE-LABEL: @getuc12
 ; CHECK-LE: mfvsrd r3, v2
 ; CHECK-LE: rldicl r3, r3, 32, 56
+
+; CHECK-AIX-LABEL: getuc12:
+; CHECK-AIX: mffprd 3, 0
+; CHECK-AIX: rldicl 3, 3, 40, 56
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -514,9 +708,14 @@ entry:
 ; CHECK-LABEL: @getuc13
 ; CHECK: mffprd r3, f0
 ; CHECK: rldicl r3, r3, 48, 56
+
 ; CHECK-LE-LABEL: @getuc13
 ; CHECK-LE: mfvsrd r3, v2
 ; CHECK-LE: rldicl r3, r3, 24, 56
+
+; CHECK-AIX-LABEL: getuc13:
+; CHECK-AIX: mffprd 3, 0
+; CHECK-AIX: rldicl 3, 3, 48, 56
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -527,9 +726,14 @@ entry:
 ; CHECK-LABEL: @getuc14
 ; CHECK: mffprd r3, f0
 ; CHECK: rldicl r3, r3, 56, 56
+
 ; CHECK-LE-LABEL: @getuc14
 ; CHECK-LE: mfvsrd r3, v2
 ; CHECK-LE: rldicl r3, r3, 16, 56
+
+; CHECK-AIX-LABEL: getuc14
+; CHECK-AIX: mffprd 3, 0
+; CHECK-AIX: rldicl 3, 3, 56, 56
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -540,9 +744,14 @@ entry:
 ; CHECK-LABEL: @getuc15
 ; CHECK: mffprd r3, f0
 ; CHECK: clrldi   r3, r3, 56
+
 ; CHECK-LE-LABEL: @getuc15
 ; CHECK-LE: mfvsrd r3, v2
 ; CHECK-LE: rldicl r3, r3, 8, 56
+
+; CHECK-AIX-LABEL: getuc15:
+; CHECK-AIX: mffprd 3, 0
+; CHECK-AIX: clrldi 3, 3, 56
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -557,6 +766,7 @@ define signext i8 @getvelsc(<16 x i8> %vsc, i32 signext %i) {
 ; CHECK: mfvsrd r4, v2
 ; CHECK: srd r3, r4, r3
 ; CHECK: extsb r3, r3
+
 ; CHECK-LE-LABEL: @getvelsc
 ; CHECK-LE: li r3, 8
 ; CHECK-LE: andc r3, r3, r5
@@ -568,6 +778,17 @@ define signext i8 @getvelsc(<16 x i8> %vsc, i32 signext %i) {
 ; CHECK-LE: mfvsrd r4, v2
 ; CHECK-LE: srd r3, r4, r3
 ; CHECK-LE: extsb r3, r3
+
+; CHECK-AIX-LABEL: getvelsc:
+; CHECK-AIX: andi. 5, 3, 8
+; CHECK-AIX: li 4, 7
+; CHECK-AIX: lvsl 3, 0, 5
+; CHECK-AIX: andc 3, 4, 3
+; CHECK-AIX: sldi 3, 3, 3
+; CHECK-AIX: vperm 2, 2, 2, 3
+; CHECK-AIX: mfvsrd 4, 34
+; CHECK-AIX: srd 3, 4, 3
+; CHECK-AIX: extsb 3, 3
 entry:
   %vecext = extractelement <16 x i8> %vsc, i32 %i
   ret i8 %vecext
@@ -585,6 +806,7 @@ define zeroext i8 @getveluc(<16 x i8> %vuc, i32 signext %i) {
 ; CHECK: mfvsrd r4, v2
 ; CHECK: srd r3, r4, r3
 ; CHECK: clrldi  r3, r3, 5
+
 ; CHECK-LE-LABEL: @getveluc
 ; CHECK-LE: li r3, 8
 ; CHECK-LE: andc r3, r3, r5
@@ -596,6 +818,17 @@ define zeroext i8 @getveluc(<16 x i8> %vuc, i32 signext %i) {
 ; CHECK-LE: mfvsrd r4, v2
 ; CHECK-LE: srd r3, r4, r3
 ; CHECK-LE: clrldi r3, r3, 56
+
+; CHECK-AIX-LABEL: getveluc:
+; CHECK-AIX: andi. 5, 3, 8
+; CHECK-AIX: li 4, 7
+; CHECK-AIX: lvsl 3, 0, 5
+; CHECK-AIX: andc 3, 4, 3
+; CHECK-AIX: sldi 3, 3, 3
+; CHECK-AIX: vperm 2, 2, 2, 3
+; CHECK-AIX: mfvsrd 4, 34
+; CHECK-AIX: srd 3, 4, 3
+; CHECK-AIX: clrldi 3, 3, 56
 entry:
   %vecext = extractelement <16 x i8> %vuc, i32 %i
   ret i8 %vecext
@@ -610,10 +843,16 @@ entry:
 ; CHECK: mfvsrd r3, v2
 ; CHECK: rldicl r3, r3, 16, 48
 ; CHECK: extsh r3, r3
+
 ; CHECK-LE-LABEL: @getss0
 ; CHECK-LE: mffprd r3, f0
 ; CHECK-LE: clrldi r3, r3, 48
 ; CHECK-LE: extsh r3, r3
+
+; CHECK-AIX-LABEL: getss0:
+; CHECK-AIX: mfvsrd 3, 34
+; CHECK-AIX: rldicl 3, 3, 16, 48
+; CHECK-AIX: extsh 3, 3
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -625,10 +864,16 @@ entry:
 ; CHECK: mfvsrd r3, v2
 ; CHECK: rldicl r3, r3, 32, 48
 ; CHECK: extsh r3, r3
+
 ; CHECK-LE-LABEL: @getss1
 ; CHECK-LE: mffprd r3, f0
 ; CHECK-LE: rldicl r3, r3, 48, 48
 ; CHECK-LE: extsh r3, r3
+
+; CHECK-AIX-LABEL: getss1:
+; CHECK-AIX: mfvsrd 3, 34
+; CHECK-AIX: rldicl 3, 3, 32, 48
+; CHECK-AIX: extsh 3, 3
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -640,10 +885,16 @@ entry:
 ; CHECK: mfvsrd r3, v2
 ; CHECK: rldicl r3, r3, 48, 48
 ; CHECK: extsh r3, r3
+
 ; CHECK-LE-LABEL: @getss2
 ; CHECK-LE: mffprd r3, f0
 ; CHECK-LE: rldicl r3, r3, 32, 48
 ; CHECK-LE: extsh r3, r3
+
+; CHECK-AIX-LABEL: getss2:
+; CHECK-AIX: mfvsrd 3, 34
+; CHECK-AIX: rldicl 3, 3, 48, 48
+; CHECK-AIX: extsh 3, 3
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -655,10 +906,16 @@ entry:
 ; CHECK: mfvsrd r3, v2
 ; CHECK: clrldi r3, r3, 48
 ; CHECK: extsh r3, r3
+
 ; CHECK-LE-LABEL: @getss3
 ; CHECK-LE: mffprd r3, f0
 ; CHECK-LE: rldicl r3, r3, 16, 48
 ; CHECK-LE: extsh r3, r3
+
+; CHECK-AIX-LABEL: getss3:
+; CHECK-AIX: mfvsrd 3, 34
+; CHECK-AIX: clrldi 3, 3, 48
+; CHECK-AIX: extsh 3, 3
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -670,10 +927,16 @@ entry:
 ; CHECK: mffprd r3, f0
 ; CHECK: rldicl r3, r3, 16, 48
 ; CHECK: extsh r3, r3
+
 ; CHECK-LE-LABEL: @getss4
 ; CHECK-LE: mfvsrd r3, v2
 ; CHECK-LE: clrldi r3, r3, 48
 ; CHECK-LE: extsh r3, r3
+
+; CHECK-AIX-LABEL: getss4:
+; CHECK-AIX: mffprd 3, 0
+; CHECK-AIX: rldicl 3, 3, 16, 48
+; CHECK-AIX: extsh 3, 3
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -685,10 +948,16 @@ entry:
 ; CHECK: mffprd r3, f0
 ; CHECK: rldicl r3, r3, 32, 48
 ; CHECK: extsh r3, r3
+
 ; CHECK-LE-LABEL: @getss5
 ; CHECK-LE: mfvsrd r3, v2
 ; CHECK-LE: rldicl r3, r3, 48, 48
 ; CHECK-LE: extsh r3, r3
+
+; CHECK-AIX-LABEL: getss5:
+; CHECK-AIX: mffprd 3, 0
+; CHECK-AIX: rldicl 3, 3, 32, 48
+; CHECK-AIX: extsh 3, 3
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -700,10 +969,16 @@ entry:
 ; CHECK: mffprd r3, f0
 ; CHECK: rldicl r3, r3, 48, 48
 ; CHECK: extsh r3, r3
+
 ; CHECK-LE-LABEL: @getss6
 ; CHECK-LE: mfvsrd r3, v2
 ; CHECK-LE: rldicl r3, r3, 32, 48
 ; CHECK-LE: extsh r3, r3
+
+; CHECK-AIX-LABEL: getss6:
+; CHECK-AIX: mffprd 3, 0
+; CHECK-AIX: rldicl 3, 3, 48, 48
+; CHECK-AIX: extsh 3, 3
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -715,10 +990,16 @@ entry:
 ; CHECK: mffprd r3, f0
 ; CHECK: clrldi  r3, r3, 48
 ; CHECK: extsh r3, r3
+
 ; CHECK-LE-LABEL: @getss7
 ; CHECK-LE: mfvsrd r3, v2
 ; CHECK-LE: rldicl r3, r3, 16, 48
 ; CHECK-LE: extsh r3, r3
+
+; CHECK-AIX-LABEL: getss7:
+; CHECK-AIX: mffprd 3, 0
+; CHECK-AIX: clrldi 3, 3, 48
+; CHECK-AIX: extsh 3, 3
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -729,9 +1010,14 @@ entry:
 ; CHECK-LABEL: @getus0
 ; CHECK: mfvsrd r3, v2
 ; CHECK: rldicl r3, r3, 16, 48
+
 ; CHECK-LE-LABEL: @getus0
 ; CHECK-LE: mffprd r3, f0
 ; CHECK-LE: clrldi r3, r3, 48
+
+; CHECK-AIX-LABEL: getus0:
+; CHECK-AIX: mfvsrd 3, 34
+; CHECK-AIX: rldicl 3, 3, 16, 48
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -742,9 +1028,14 @@ entry:
 ; CHECK-LABEL: @getus1
 ; CHECK: mfvsrd r3, v2
 ; CHECK: rldicl r3, r3, 32, 48
+
 ; CHECK-LE-LABEL: @getus1
 ; CHECK-LE: mffprd r3, f0
 ; CHECK-LE: rldicl r3, r3, 48, 48
+
+; CHECK-AIX-LABEL: getus1:
+; CHECK-AIX: mfvsrd 3, 34
+; CHECK-AIX: rldicl 3, 3, 32, 48
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -755,9 +1046,14 @@ entry:
 ; CHECK-LABEL: @getus2
 ; CHECK: mfvsrd r3, v2
 ; CHECK: rldicl r3, r3, 48, 48
+
 ; CHECK-LE-LABEL: @getus2
 ; CHECK-LE: mffprd r3, f0
 ; CHECK-LE: rldicl r3, r3, 32, 48
+
+; CHECK-AIX-LABEL: getus2:
+; CHECK-AIX: mfvsrd 3, 34
+; CHECK-AIX: rldicl 3, 3, 48, 48
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -768,9 +1064,14 @@ entry:
 ; CHECK-LABEL: @getus3
 ; CHECK: mfvsrd r3, v2
 ; CHECK: clrldi   r3, r3, 48
+
 ; CHECK-LE-LABEL: @getus3
 ; CHECK-LE: mffprd r3, f0
 ; CHECK-LE: rldicl r3, r3, 16, 48
+
+; CHECK-AIX-LABEL: getus3:
+; CHECK-AIX: mfvsrd 3, 34
+; CHECK-AIX: clrldi 3, 3, 48
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -781,9 +1082,14 @@ entry:
 ; CHECK-LABEL: @getus4
 ; CHECK: mffprd r3, f0
 ; CHECK: rldicl r3, r3, 16, 48
+
 ; CHECK-LE-LABEL: @getus4
 ; CHECK-LE: mfvsrd r3, v2
 ; CHECK-LE: clrldi r3, r3, 48
+
+; CHECK-AIX-LABEL: getus4:
+; CHECK-AIX: mffprd 3, 0
+; CHECK-AIX: rldicl 3, 3, 16, 48
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -794,9 +1100,14 @@ entry:
 ; CHECK-LABEL: @getus5
 ; CHECK: mffprd r3, f0
 ; CHECK: rldicl r3, r3, 32, 48
+
 ; CHECK-LE-LABEL: @getus5
 ; CHECK-LE: mfvsrd r3, v2
 ; CHECK-LE: rldicl r3, r3, 48, 48
+
+; CHECK-AIX-LABEL: getus5:
+; CHECK-AIX: mffprd 3, 0
+; CHECK-AIX: rldicl 3, 3, 32, 48
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -807,9 +1118,14 @@ entry:
 ; CHECK-LABEL: @getus6
 ; CHECK: mffprd r3, f0
 ; CHECK: rldicl r3, r3, 48, 48
+
 ; CHECK-LE-LABEL: @getus6
 ; CHECK-LE: mfvsrd r3, v2
 ; CHECK-LE: rldicl r3, r3, 32, 48
+
+; CHECK-AIX-LABEL: getus6:
+; CHECK-AIX: mffprd 3, 0
+; CHECK-AIX: rldicl 3, 3, 48, 48
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -820,9 +1136,14 @@ entry:
 ; CHECK-LABEL: @getus7
 ; CHECK: mffprd r3, f0
 ; CHECK: clrldi   r3, r3, 48
+
 ; CHECK-LE-LABEL: @getus7
 ; CHECK-LE: mfvsrd r3, v2
 ; CHECK-LE: rldicl r3, r3, 16, 48
+
+; CHECK-AIX-LABEL: getus7:
+; CHECK-AIX: mffprd 3, 0
+; CHECK-AIX: clrldi 3, 3, 48
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -838,6 +1159,7 @@ define signext i16 @getvelss(<8 x i16> %vss, i32 signext %i) {
 ; CHECK: mfvsrd r4, v2
 ; CHECK: srd r3, r4, r3
 ; CHECK: extsh r3, r3
+
 ; CHECK-LE-LABEL: @getvelss
 ; CHECK-LE: li r3, 4
 ; CHECK-LE: andc r3, r3, r5
@@ -850,6 +1172,18 @@ define signext i16 @getvelss(<8 x i16> %vss, i32 signext %i) {
 ; CHECK-LE: mfvsrd r4, v2
 ; CHECK-LE: srd r3, r4, r3
 ; CHECK-LE: extsh r3, r3
+
+; CHECK-AIX-LABEL: getvelss:
+; CHECK-AIX: andi. 5, 3, 4
+; CHECK-AIX: li 4, 3
+; CHECK-AIX: sldi 5, 5, 1
+; CHECK-AIX: andc 3, 4, 3
+; CHECK-AIX: lvsl 3, 0, 5
+; CHECK-AIX: sldi 3, 3, 4
+; CHECK-AIX: vperm 2, 2, 2, 3
+; CHECK-AIX: mfvsrd 4, 34
+; CHECK-AIX: srd 3, 4, 3
+; CHECK-AIX: extsh 3, 3
 entry:
   %vecext = extractelement <8 x i16> %vss, i32 %i
   ret i16 %vecext
@@ -868,6 +1202,7 @@ define zeroext i16 @getvelus(<8 x i16> %vus, i32 signext %i) {
 ; CHECK: mfvsrd r4, v2
 ; CHECK: srd r3, r4, r3
 ; CHECK: clrldi  r3, r3, 48
+
 ; CHECK-LE-LABEL: @getvelus
 ; CHECK-LE: li r3, 4
 ; CHECK-LE: andc r3, r3, r5
@@ -880,6 +1215,18 @@ define zeroext i16 @getvelus(<8 x i16> %vus, i32 signext %i) {
 ; CHECK-LE: mfvsrd r4, v2
 ; CHECK-LE: srd r3, r4, r3
 ; CHECK-LE: clrldi r3, r3, 48
+
+; CHECK-AIX-LABEL: getvelus:
+; CHECK-AIX: andi. 5, 3, 4
+; CHECK-AIX: li 4, 3
+; CHECK-AIX: sldi 5, 5, 1
+; CHECK-AIX: andc 3, 4, 3
+; CHECK-AIX: lvsl 3, 0, 5
+; CHECK-AIX: sldi 3, 3, 4
+; CHECK-AIX: vperm 2, 2, 2, 3
+; CHECK-AIX: mfvsrd 4, 34
+; CHECK-AIX: srd 3, 4, 3
+; CHECK-AIX: clrldi 3, 3, 48
 entry:
   %vecext = extractelement <8 x i16> %vus, i32 %i
   ret i16 %vecext
@@ -894,10 +1241,16 @@ entry:
 ; CHECK: xxsldwi vs0, v2, v2, 3
 ; CHECK: mffprwz r3, f0
 ; CHECK: extsw r3, r3
+
 ; CHECK-LE-LABEL: @getsi0
 ; CHECK-LE: xxswapd vs0, v2
 ; CHECK-LE: mffprwz r3, f0
 ; CHECK-LE: extsw r3, r3
+
+; CHECK-AIX-LABEL: getsi0:
+; CHECK-AIX: xxsldwi 0, 34, 34, 3
+; CHECK-AIX: mffprwz 3, 0
+; CHECK-AIX: extsw 3, 3
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -908,10 +1261,15 @@ entry:
 ; CHECK-LABEL: @getsi1
 ; CHECK: mfvsrwz r3, v2
 ; CHECK: extsw r3, r3
+
 ; CHECK-LE-LABEL: @getsi1
 ; CHECK-LE: xxsldwi vs0, v2, v2, 1
 ; CHECK-LE: mffprwz r3, f0
 ; CHECK-LE: extsw r3, r3
+
+; CHECK-AIX-LABEL: getsi1:
+; CHECK-AIX: mfvsrwz 3, 34
+; CHECK-AIX: extsw 3, 3
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -923,9 +1281,15 @@ entry:
 ; CHECK: xxsldwi vs0, v2, v2, 1
 ; CHECK: mffprwz r3, f0
 ; CHECK: extsw r3, r3
+
 ; CHECK-LE-LABEL: @getsi2
 ; CHECK-LE: mfvsrwz r3, v2
 ; CHECK-LE: extsw r3, r3
+
+; CHECK-AIX-LABEL: getsi2:
+; CHECK-AIX: xxsldwi 0, 34, 34, 1
+; CHECK-AIX: mffprwz 3, 0
+; CHECK-AIX: extsw 3, 3
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -937,10 +1301,16 @@ entry:
 ; CHECK: xxswapd vs0, v2
 ; CHECK: mffprwz r3, f0
 ; CHECK: extsw r3, r3
+
 ; CHECK-LE-LABEL: @getsi3
 ; CHECK-LE: xxsldwi vs0, v2, v2, 3
 ; CHECK-LE: mffprwz r3, f0
 ; CHECK-LE: extsw r3, r3
+
+; CHECK-AIX-LABEL: getsi3:
+; CHECK-AIX: xxswapd 0, 34
+; CHECK-AIX: mffprwz 3, 0
+; CHECK-AIX: extsw 3, 3
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -951,9 +1321,14 @@ entry:
 ; CHECK-LABEL: @getui0
 ; CHECK: xxsldwi vs0, v2, v2, 3
 ; CHECK: mffprwz r3, f0
+
 ; CHECK-LE-LABEL: @getui0
 ; CHECK-LE: xxswapd vs0, v2
 ; CHECK-LE: mffprwz r3, f0
+
+; CHECK-AIX-LABEL: getui0:
+; CHECK-AIX: xxsldwi 0, 34, 34, 3
+; CHECK-AIX: mffprwz 3, 0
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -963,9 +1338,13 @@ entry:
   ret i32 %vecext
 ; CHECK-LABEL: @getui1
 ; CHECK: mfvsrwz r3, v2
+
 ; CHECK-LE-LABEL: @getui1
 ; CHECK-LE: xxsldwi vs0, v2, v2, 1
 ; CHECK-LE: mffprwz r3, f0
+
+; CHECK-AIX-LABEL: getui1:
+; CHECK-AIX: mfvsrwz 3, 34
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -976,8 +1355,13 @@ entry:
 ; CHECK-LABEL: @getui2
 ; CHECK: xxsldwi vs0, v2, v2, 1
 ; CHECK: mffprwz r3, f0
+
 ; CHECK-LE-LABEL: @getui2
 ; CHECK-LE: mfvsrwz r3, v2
+
+; CHECK-AIX-LABEL: getui2:
+; CHECK-AIX: xxsldwi 0, 34, 34, 1
+; CHECK-AIX: mffprwz 3, 0
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -988,9 +1372,14 @@ entry:
 ; CHECK-LABEL: @getui3
 ; CHECK: xxswapd vs0, v2
 ; CHECK: mffprwz r3, f0
+
 ; CHECK-LE-LABEL: @getui3
 ; CHECK-LE: xxsldwi vs0, v2, v2, 3
 ; CHECK-LE: mffprwz r3, f0
+
+; CHECK-AIX-LABEL: getui3:
+; CHECK-AIX: xxswapd 0, 34
+; CHECK-AIX: mffprwz 3, 0
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -1000,6 +1389,7 @@ entry:
   ret i32 %vecext
 ; CHECK-LABEL: @getvelsi
 ; CHECK-LE-LABEL: @getvelsi
+; CHECK-AIX-LABEL: getvelsi
 ; FIXME: add check patterns when variable element extraction is implemented
 }
 
@@ -1010,6 +1400,7 @@ entry:
   ret i32 %vecext
 ; CHECK-LABEL: @getvelui
 ; CHECK-LE-LABEL: @getvelui
+; CHECK-AIX-LABEL: getvelui
 ; FIXME: add check patterns when variable element extraction is implemented
 }
 
@@ -1020,9 +1411,13 @@ entry:
   ret i64 %vecext
 ; CHECK-LABEL: @getsl0
 ; CHECK: mfvsrd r3, v2
+
 ; CHECK-LE-LABEL: @getsl0
 ; CHECK-LE: xxswapd vs0, v2
 ; CHECK-LE: mffprd r3, f0
+
+; CHECK-AIX-LABEL: getsl0:
+; CHECK-AIX: mfvsrd 3, 34
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -1033,8 +1428,13 @@ entry:
 ; CHECK-LABEL: @getsl1
 ; CHECK: xxswapd vs0, v2
 ; CHECK: mffprd r3, f0
+
 ; CHECK-LE-LABEL: @getsl1
 ; CHECK-LE: mfvsrd r3, v2
+
+; CHECK-AIX-LABEL: getsl1:
+; CHECK-AIX: xxswapd 0, 34
+; CHECK-AIX: mffprd 3, 0
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -1044,9 +1444,13 @@ entry:
   ret i64 %vecext
 ; CHECK-LABEL: @getul0
 ; CHECK: mfvsrd r3, v2
+
 ; CHECK-LE-LABEL: @getul0
 ; CHECK-LE: xxswapd  vs0, v2
 ; CHECK-LE: mffprd r3, f0
+
+; CHECK-AIX-LABEL: getul0:
+; CHECK-AIX: mfvsrd 3, 34
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -1057,8 +1461,13 @@ entry:
 ; CHECK-LABEL: @getul1
 ; CHECK: xxswapd vs0, v2
 ; CHECK: mffprd r3, f0
+
 ; CHECK-LE-LABEL: @getul1
 ; CHECK-LE: mfvsrd r3, v2
+
+; CHECK-AIX-LABEL: getul1:
+; CHECK-AIX: xxswapd 0, 34
+; CHECK-AIX: mffprd 3, 0
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -1068,6 +1477,7 @@ entry:
   ret i64 %vecext
 ; CHECK-LABEL: @getvelsl
 ; CHECK-LE-LABEL: @getvelsl
+; CHECK-AIX-LABEL: getvelsl:
 ; FIXME: add check patterns when variable element extraction is implemented
 }
 
@@ -1078,6 +1488,7 @@ entry:
   ret i64 %vecext
 ; CHECK-LABEL: @getvelul
 ; CHECK-LE-LABEL: @getvelul
+; CHECK-AIX-LABEL: getvelul
 ; FIXME: add check patterns when variable element extraction is implemented
 }
 
@@ -1088,9 +1499,13 @@ entry:
   ret float %vecext
 ; CHECK-LABEL: @getf0
 ; CHECK: xscvspdpn f1, v2
+
 ; CHECK-LE-LABEL: @getf0
 ; CHECK-LE: xxsldwi vs0, v2, v2, 3
 ; CHECK-LE: xscvspdpn f1, vs0
+
+; CHECK-AIX-LABEL: getf0:
+; CHECK-AIX: xscvspdpn 1, 34
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -1101,9 +1516,14 @@ entry:
 ; CHECK-LABEL: @getf1
 ; CHECK: xxsldwi vs0, v2, v2, 1
 ; CHECK: xscvspdpn f1, vs0
+
 ; CHECK-LE-LABEL: @getf1
 ; CHECK-LE: xxswapd vs0, v2
 ; CHECK-LE: xscvspdpn f1, vs0
+
+; CHECK-AIX-LABEL: getf1:
+; CHECK-AIX: xxsldwi 0, 34, 34, 1
+; CHECK-AIX: xscvspdpn 1, 0
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -1114,9 +1534,14 @@ entry:
 ; CHECK-LABEL: @getf2
 ; CHECK: xxswapd vs0, v2
 ; CHECK: xscvspdpn f1, vs0
+
 ; CHECK-LE-LABEL: @getf2
 ; CHECK-LE: xxsldwi vs0, v2, v2, 1
 ; CHECK-LE: xscvspdpn f1, vs0
+
+; CHECK-AIX-LABEL: getf2:
+; CHECK-AIX: xxswapd 0, 34
+; CHECK-AIX: xscvspdpn 1, 0
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -1127,8 +1552,13 @@ entry:
 ; CHECK-LABEL: @getf3
 ; CHECK: xxsldwi vs0, v2, v2, 3
 ; CHECK: xscvspdpn f1, vs0
+
 ; CHECK-LE-LABEL: @getf3
 ; CHECK-LE: xscvspdpn f1, v2
+
+; CHECK-AIX-LABEL: getf3:
+; CHECK-AIX: xxsldwi 0, 34, 34, 3
+; CHECK-AIX: xscvspdpn 1, 0
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -1138,6 +1568,7 @@ entry:
   ret float %vecext
 ; CHECK-LABEL: @getvelf
 ; CHECK-LE-LABEL: @getvelf
+; CHECK-AIX-LABEL: @getvelf
 ; FIXME: add check patterns when variable element extraction is implemented
 }
 
@@ -1148,8 +1579,12 @@ entry:
   ret double %vecext
 ; CHECK-LABEL: @getd0
 ; CHECK: xxlor f1, v2, v2
+
 ; CHECK-LE-LABEL: @getd0
 ; CHECK-LE: xxswapd vs1, v2
+
+; CHECK-AIX-LABEL: getd0:
+; CHECK-AIXT: xxlor 1, 34, 34
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -1159,8 +1594,12 @@ entry:
   ret double %vecext
 ; CHECK-LABEL: @getd1
 ; CHECK: xxswapd vs1, v2
+
 ; CHECK-LE-LABEL: @getd1
 ; CHECK-LE: xxlor f1, v2, v2
+
+; CHECK-AIX-LABEL: getd1:
+; CHECK-AIX: xxswapd 1, 34
 }
 
 ; Function Attrs: norecurse nounwind readnone
@@ -1170,5 +1609,6 @@ entry:
   ret double %vecext
 ; CHECK-LABEL: @getveld
 ; CHECK-LE-LABEL: @getveld
+; CHECK-AIX-LABEL: @getveld
 ; FIXME: add check patterns when variable element extraction is implemented
 }


        


More information about the llvm-commits mailing list