[llvm] 966ae76 - Run update_llc_test on test/CodeGen/ARM/vmov.ll

John Brawn via llvm-commits llvm-commits at lists.llvm.org
Fri Apr 3 09:37:27 PDT 2020


Author: John Brawn
Date: 2020-04-03T17:36:50+01:00
New Revision: 966ae762229f9d77e6d9f0ab4220e4c2bf5f4fc4

URL: https://github.com/llvm/llvm-project/commit/966ae762229f9d77e6d9f0ab4220e4c2bf5f4fc4
DIFF: https://github.com/llvm/llvm-project/commit/966ae762229f9d77e6d9f0ab4220e4c2bf5f4fc4.diff

LOG: Run update_llc_test on test/CodeGen/ARM/vmov.ll

This is in preparation for D76514

Added: 
    

Modified: 
    llvm/test/CodeGen/ARM/vmov.ll

Removed: 
    


################################################################################
diff  --git a/llvm/test/CodeGen/ARM/vmov.ll b/llvm/test/CodeGen/ARM/vmov.ll
index b1b4f1a940d4..0341448f9a77 100644
--- a/llvm/test/CodeGen/ARM/vmov.ll
+++ b/llvm/test/CodeGen/ARM/vmov.ll
@@ -1,332 +1,745 @@
-; RUN: llc -mtriple=arm-eabi -mattr=+neon %s -o - | FileCheck %s
-
-define <8 x i8> @v_movi8() nounwind {
-;CHECK-LABEL: v_movi8:
-;CHECK: vmov.i8 d{{.*}}, #0x8
+; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
+; RUN: llc -mtriple=arm-eabi -mattr=+neon %s -o - | FileCheck --check-prefixes=CHECK,CHECK-LE %s
+; RUN: llc -mtriple=armeb-eabi -mattr=+neon %s -o - | FileCheck --check-prefixes=CHECK,CHECK-BE %s
+
+define arm_aapcs_vfpcc <8 x i8> @v_movi8() nounwind {
+; CHECK-LE-LABEL: v_movi8:
+; CHECK-LE:       @ %bb.0:
+; CHECK-LE-NEXT:    vmov.i8 d0, #0x8
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: v_movi8:
+; CHECK-BE:       @ %bb.0:
+; CHECK-BE-NEXT:    vmov.i8 d16, #0x8
+; CHECK-BE-NEXT:    vrev64.8 d0, d16
+; CHECK-BE-NEXT:    mov pc, lr
 	ret <8 x i8> < i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8 >
 }
 
-define <4 x i16> @v_movi16a() nounwind {
-;CHECK-LABEL: v_movi16a:
-;CHECK: vmov.i16 d{{.*}}, #0x10
+define arm_aapcs_vfpcc <4 x i16> @v_movi16a() nounwind {
+; CHECK-LE-LABEL: v_movi16a:
+; CHECK-LE:       @ %bb.0:
+; CHECK-LE-NEXT:    vmov.i16 d0, #0x10
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: v_movi16a:
+; CHECK-BE:       @ %bb.0:
+; CHECK-BE-NEXT:    vmov.i16 d16, #0x10
+; CHECK-BE-NEXT:    vrev64.16 d0, d16
+; CHECK-BE-NEXT:    mov pc, lr
 	ret <4 x i16> < i16 16, i16 16, i16 16, i16 16 >
 }
 
-define <4 x i16> @v_movi16b() nounwind {
-;CHECK-LABEL: v_movi16b:
-;CHECK: vmov.i16 d{{.*}}, #0x1000
+define arm_aapcs_vfpcc <4 x i16> @v_movi16b() nounwind {
+; CHECK-LE-LABEL: v_movi16b:
+; CHECK-LE:       @ %bb.0:
+; CHECK-LE-NEXT:    vmov.i16 d0, #0x1000
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: v_movi16b:
+; CHECK-BE:       @ %bb.0:
+; CHECK-BE-NEXT:    vmov.i16 d16, #0x1000
+; CHECK-BE-NEXT:    vrev64.16 d0, d16
+; CHECK-BE-NEXT:    mov pc, lr
 	ret <4 x i16> < i16 4096, i16 4096, i16 4096, i16 4096 >
 }
 
-define <4 x i16> @v_mvni16a() nounwind {
-;CHECK-LABEL: v_mvni16a:
-;CHECK: vmvn.i16 d{{.*}}, #0x10
+define arm_aapcs_vfpcc <4 x i16> @v_mvni16a() nounwind {
+; CHECK-LE-LABEL: v_mvni16a:
+; CHECK-LE:       @ %bb.0:
+; CHECK-LE-NEXT:    vmvn.i16 d0, #0x10
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: v_mvni16a:
+; CHECK-BE:       @ %bb.0:
+; CHECK-BE-NEXT:    vmvn.i16 d16, #0x10
+; CHECK-BE-NEXT:    vrev64.16 d0, d16
+; CHECK-BE-NEXT:    mov pc, lr
 	ret <4 x i16> < i16 65519, i16 65519, i16 65519, i16 65519 >
 }
 
-define <4 x i16> @v_mvni16b() nounwind {
-;CHECK-LABEL: v_mvni16b:
-;CHECK: vmvn.i16 d{{.*}}, #0x1000
+define arm_aapcs_vfpcc <4 x i16> @v_mvni16b() nounwind {
+; CHECK-LE-LABEL: v_mvni16b:
+; CHECK-LE:       @ %bb.0:
+; CHECK-LE-NEXT:    vmvn.i16 d0, #0x1000
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: v_mvni16b:
+; CHECK-BE:       @ %bb.0:
+; CHECK-BE-NEXT:    vmvn.i16 d16, #0x1000
+; CHECK-BE-NEXT:    vrev64.16 d0, d16
+; CHECK-BE-NEXT:    mov pc, lr
 	ret <4 x i16> < i16 61439, i16 61439, i16 61439, i16 61439 >
 }
 
-define <2 x i32> @v_movi32a() nounwind {
-;CHECK-LABEL: v_movi32a:
-;CHECK: vmov.i32 d{{.*}}, #0x20
+define arm_aapcs_vfpcc <2 x i32> @v_movi32a() nounwind {
+; CHECK-LE-LABEL: v_movi32a:
+; CHECK-LE:       @ %bb.0:
+; CHECK-LE-NEXT:    vmov.i32 d0, #0x20
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: v_movi32a:
+; CHECK-BE:       @ %bb.0:
+; CHECK-BE-NEXT:    vmov.i32 d16, #0x20
+; CHECK-BE-NEXT:    vrev64.32 d0, d16
+; CHECK-BE-NEXT:    mov pc, lr
 	ret <2 x i32> < i32 32, i32 32 >
 }
 
-define <2 x i32> @v_movi32b() nounwind {
-;CHECK-LABEL: v_movi32b:
-;CHECK: vmov.i32 d{{.*}}, #0x2000
+define arm_aapcs_vfpcc <2 x i32> @v_movi32b() nounwind {
+; CHECK-LE-LABEL: v_movi32b:
+; CHECK-LE:       @ %bb.0:
+; CHECK-LE-NEXT:    vmov.i32 d0, #0x2000
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: v_movi32b:
+; CHECK-BE:       @ %bb.0:
+; CHECK-BE-NEXT:    vmov.i32 d16, #0x2000
+; CHECK-BE-NEXT:    vrev64.32 d0, d16
+; CHECK-BE-NEXT:    mov pc, lr
 	ret <2 x i32> < i32 8192, i32 8192 >
 }
 
-define <2 x i32> @v_movi32c() nounwind {
-;CHECK-LABEL: v_movi32c:
-;CHECK: vmov.i32 d{{.*}}, #0x200000
+define arm_aapcs_vfpcc <2 x i32> @v_movi32c() nounwind {
+; CHECK-LE-LABEL: v_movi32c:
+; CHECK-LE:       @ %bb.0:
+; CHECK-LE-NEXT:    vmov.i32 d0, #0x200000
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: v_movi32c:
+; CHECK-BE:       @ %bb.0:
+; CHECK-BE-NEXT:    vmov.i32 d16, #0x200000
+; CHECK-BE-NEXT:    vrev64.32 d0, d16
+; CHECK-BE-NEXT:    mov pc, lr
 	ret <2 x i32> < i32 2097152, i32 2097152 >
 }
 
-define <2 x i32> @v_movi32d() nounwind {
-;CHECK-LABEL: v_movi32d:
-;CHECK: vmov.i32 d{{.*}}, #0x20000000
+define arm_aapcs_vfpcc <2 x i32> @v_movi32d() nounwind {
+; CHECK-LE-LABEL: v_movi32d:
+; CHECK-LE:       @ %bb.0:
+; CHECK-LE-NEXT:    vmov.i32 d0, #0x20000000
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: v_movi32d:
+; CHECK-BE:       @ %bb.0:
+; CHECK-BE-NEXT:    vmov.i32 d16, #0x20000000
+; CHECK-BE-NEXT:    vrev64.32 d0, d16
+; CHECK-BE-NEXT:    mov pc, lr
 	ret <2 x i32> < i32 536870912, i32 536870912 >
 }
 
-define <2 x i32> @v_movi32e() nounwind {
-;CHECK-LABEL: v_movi32e:
-;CHECK: vmov.i32 d{{.*}}, #0x20ff
+define arm_aapcs_vfpcc <2 x i32> @v_movi32e() nounwind {
+; CHECK-LE-LABEL: v_movi32e:
+; CHECK-LE:       @ %bb.0:
+; CHECK-LE-NEXT:    vmov.i32 d0, #0x20ff
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: v_movi32e:
+; CHECK-BE:       @ %bb.0:
+; CHECK-BE-NEXT:    vmov.i32 d16, #0x20ff
+; CHECK-BE-NEXT:    vrev64.32 d0, d16
+; CHECK-BE-NEXT:    mov pc, lr
 	ret <2 x i32> < i32 8447, i32 8447 >
 }
 
-define <2 x i32> @v_movi32f() nounwind {
-;CHECK-LABEL: v_movi32f:
-;CHECK: vmov.i32 d{{.*}}, #0x20ffff
+define arm_aapcs_vfpcc <2 x i32> @v_movi32f() nounwind {
+; CHECK-LE-LABEL: v_movi32f:
+; CHECK-LE:       @ %bb.0:
+; CHECK-LE-NEXT:    vmov.i32 d0, #0x20ffff
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: v_movi32f:
+; CHECK-BE:       @ %bb.0:
+; CHECK-BE-NEXT:    vmov.i32 d16, #0x20ffff
+; CHECK-BE-NEXT:    vrev64.32 d0, d16
+; CHECK-BE-NEXT:    mov pc, lr
 	ret <2 x i32> < i32 2162687, i32 2162687 >
 }
 
-define <2 x i32> @v_mvni32a() nounwind {
-;CHECK-LABEL: v_mvni32a:
-;CHECK: vmvn.i32 d{{.*}}, #0x20
+define arm_aapcs_vfpcc <2 x i32> @v_mvni32a() nounwind {
+; CHECK-LE-LABEL: v_mvni32a:
+; CHECK-LE:       @ %bb.0:
+; CHECK-LE-NEXT:    vmvn.i32 d0, #0x20
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: v_mvni32a:
+; CHECK-BE:       @ %bb.0:
+; CHECK-BE-NEXT:    vmvn.i32 d16, #0x20
+; CHECK-BE-NEXT:    vrev64.32 d0, d16
+; CHECK-BE-NEXT:    mov pc, lr
 	ret <2 x i32> < i32 4294967263, i32 4294967263 >
 }
 
-define <2 x i32> @v_mvni32b() nounwind {
-;CHECK-LABEL: v_mvni32b:
-;CHECK: vmvn.i32 d{{.*}}, #0x2000
+define arm_aapcs_vfpcc <2 x i32> @v_mvni32b() nounwind {
+; CHECK-LE-LABEL: v_mvni32b:
+; CHECK-LE:       @ %bb.0:
+; CHECK-LE-NEXT:    vmvn.i32 d0, #0x2000
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: v_mvni32b:
+; CHECK-BE:       @ %bb.0:
+; CHECK-BE-NEXT:    vmvn.i32 d16, #0x2000
+; CHECK-BE-NEXT:    vrev64.32 d0, d16
+; CHECK-BE-NEXT:    mov pc, lr
 	ret <2 x i32> < i32 4294959103, i32 4294959103 >
 }
 
-define <2 x i32> @v_mvni32c() nounwind {
-;CHECK-LABEL: v_mvni32c:
-;CHECK: vmvn.i32 d{{.*}}, #0x200000
+define arm_aapcs_vfpcc <2 x i32> @v_mvni32c() nounwind {
+; CHECK-LE-LABEL: v_mvni32c:
+; CHECK-LE:       @ %bb.0:
+; CHECK-LE-NEXT:    vmvn.i32 d0, #0x200000
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: v_mvni32c:
+; CHECK-BE:       @ %bb.0:
+; CHECK-BE-NEXT:    vmvn.i32 d16, #0x200000
+; CHECK-BE-NEXT:    vrev64.32 d0, d16
+; CHECK-BE-NEXT:    mov pc, lr
 	ret <2 x i32> < i32 4292870143, i32 4292870143 >
 }
 
-define <2 x i32> @v_mvni32d() nounwind {
-;CHECK-LABEL: v_mvni32d:
-;CHECK: vmvn.i32 d{{.*}}, #0x20000000
+define arm_aapcs_vfpcc <2 x i32> @v_mvni32d() nounwind {
+; CHECK-LE-LABEL: v_mvni32d:
+; CHECK-LE:       @ %bb.0:
+; CHECK-LE-NEXT:    vmvn.i32 d0, #0x20000000
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: v_mvni32d:
+; CHECK-BE:       @ %bb.0:
+; CHECK-BE-NEXT:    vmvn.i32 d16, #0x20000000
+; CHECK-BE-NEXT:    vrev64.32 d0, d16
+; CHECK-BE-NEXT:    mov pc, lr
 	ret <2 x i32> < i32 3758096383, i32 3758096383 >
 }
 
-define <2 x i32> @v_mvni32e() nounwind {
-;CHECK-LABEL: v_mvni32e:
-;CHECK: vmvn.i32 d{{.*}}, #0x20ff
+define arm_aapcs_vfpcc <2 x i32> @v_mvni32e() nounwind {
+; CHECK-LE-LABEL: v_mvni32e:
+; CHECK-LE:       @ %bb.0:
+; CHECK-LE-NEXT:    vmvn.i32 d0, #0x20ff
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: v_mvni32e:
+; CHECK-BE:       @ %bb.0:
+; CHECK-BE-NEXT:    vmvn.i32 d16, #0x20ff
+; CHECK-BE-NEXT:    vrev64.32 d0, d16
+; CHECK-BE-NEXT:    mov pc, lr
 	ret <2 x i32> < i32 4294958848, i32 4294958848 >
 }
 
-define <2 x i32> @v_mvni32f() nounwind {
-;CHECK-LABEL: v_mvni32f:
-;CHECK: vmvn.i32 d{{.*}}, #0x20ffff
+define arm_aapcs_vfpcc <2 x i32> @v_mvni32f() nounwind {
+; CHECK-LE-LABEL: v_mvni32f:
+; CHECK-LE:       @ %bb.0:
+; CHECK-LE-NEXT:    vmvn.i32 d0, #0x20ffff
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: v_mvni32f:
+; CHECK-BE:       @ %bb.0:
+; CHECK-BE-NEXT:    vmvn.i32 d16, #0x20ffff
+; CHECK-BE-NEXT:    vrev64.32 d0, d16
+; CHECK-BE-NEXT:    mov pc, lr
 	ret <2 x i32> < i32 4292804608, i32 4292804608 >
 }
 
-define <1 x i64> @v_movi64() nounwind {
-;CHECK-LABEL: v_movi64:
-;CHECK: vmov.i64 d{{.*}}, #0xff0000ff0000ffff
+define arm_aapcs_vfpcc <1 x i64> @v_movi64() nounwind {
+; CHECK-LABEL: v_movi64:
+; CHECK:       @ %bb.0:
+; CHECK-NEXT:    vmov.i64 d0, #0xff0000ff0000ffff
+; CHECK-NEXT:    mov pc, lr
 	ret <1 x i64> < i64 18374687574888349695 >
 }
 
-define <16 x i8> @v_movQi8() nounwind {
-;CHECK-LABEL: v_movQi8:
-;CHECK: vmov.i8 q{{.*}}, #0x8
+define arm_aapcs_vfpcc <16 x i8> @v_movQi8() nounwind {
+; CHECK-LE-LABEL: v_movQi8:
+; CHECK-LE:       @ %bb.0:
+; CHECK-LE-NEXT:    vmov.i8 q0, #0x8
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: v_movQi8:
+; CHECK-BE:       @ %bb.0:
+; CHECK-BE-NEXT:    vmov.i8 q8, #0x8
+; CHECK-BE-NEXT:    vrev64.8 q0, q8
+; CHECK-BE-NEXT:    mov pc, lr
 	ret <16 x i8> < i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8 >
 }
 
-define <8 x i16> @v_movQi16a() nounwind {
-;CHECK-LABEL: v_movQi16a:
-;CHECK: vmov.i16 q{{.*}}, #0x10
+define arm_aapcs_vfpcc <8 x i16> @v_movQi16a() nounwind {
+; CHECK-LE-LABEL: v_movQi16a:
+; CHECK-LE:       @ %bb.0:
+; CHECK-LE-NEXT:    vmov.i16 q0, #0x10
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: v_movQi16a:
+; CHECK-BE:       @ %bb.0:
+; CHECK-BE-NEXT:    vmov.i16 q8, #0x10
+; CHECK-BE-NEXT:    vrev64.16 q0, q8
+; CHECK-BE-NEXT:    mov pc, lr
 	ret <8 x i16> < i16 16, i16 16, i16 16, i16 16, i16 16, i16 16, i16 16, i16 16 >
 }
 
-define <8 x i16> @v_movQi16b() nounwind {
-;CHECK-LABEL: v_movQi16b:
-;CHECK: vmov.i16 q{{.*}}, #0x1000
+define arm_aapcs_vfpcc <8 x i16> @v_movQi16b() nounwind {
+; CHECK-LE-LABEL: v_movQi16b:
+; CHECK-LE:       @ %bb.0:
+; CHECK-LE-NEXT:    vmov.i16 q0, #0x1000
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: v_movQi16b:
+; CHECK-BE:       @ %bb.0:
+; CHECK-BE-NEXT:    vmov.i16 q8, #0x1000
+; CHECK-BE-NEXT:    vrev64.16 q0, q8
+; CHECK-BE-NEXT:    mov pc, lr
 	ret <8 x i16> < i16 4096, i16 4096, i16 4096, i16 4096, i16 4096, i16 4096, i16 4096, i16 4096 >
 }
 
-define <4 x i32> @v_movQi32a() nounwind {
-;CHECK-LABEL: v_movQi32a:
-;CHECK: vmov.i32 q{{.*}}, #0x20
+define arm_aapcs_vfpcc <4 x i32> @v_movQi32a() nounwind {
+; CHECK-LE-LABEL: v_movQi32a:
+; CHECK-LE:       @ %bb.0:
+; CHECK-LE-NEXT:    vmov.i32 q0, #0x20
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: v_movQi32a:
+; CHECK-BE:       @ %bb.0:
+; CHECK-BE-NEXT:    vmov.i32 q8, #0x20
+; CHECK-BE-NEXT:    vrev64.32 q0, q8
+; CHECK-BE-NEXT:    mov pc, lr
 	ret <4 x i32> < i32 32, i32 32, i32 32, i32 32 >
 }
 
-define <4 x i32> @v_movQi32b() nounwind {
-;CHECK-LABEL: v_movQi32b:
-;CHECK: vmov.i32 q{{.*}}, #0x2000
+define arm_aapcs_vfpcc <4 x i32> @v_movQi32b() nounwind {
+; CHECK-LE-LABEL: v_movQi32b:
+; CHECK-LE:       @ %bb.0:
+; CHECK-LE-NEXT:    vmov.i32 q0, #0x2000
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: v_movQi32b:
+; CHECK-BE:       @ %bb.0:
+; CHECK-BE-NEXT:    vmov.i32 q8, #0x2000
+; CHECK-BE-NEXT:    vrev64.32 q0, q8
+; CHECK-BE-NEXT:    mov pc, lr
 	ret <4 x i32> < i32 8192, i32 8192, i32 8192, i32 8192 >
 }
 
-define <4 x i32> @v_movQi32c() nounwind {
-;CHECK-LABEL: v_movQi32c:
-;CHECK: vmov.i32 q{{.*}}, #0x200000
+define arm_aapcs_vfpcc <4 x i32> @v_movQi32c() nounwind {
+; CHECK-LE-LABEL: v_movQi32c:
+; CHECK-LE:       @ %bb.0:
+; CHECK-LE-NEXT:    vmov.i32 q0, #0x200000
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: v_movQi32c:
+; CHECK-BE:       @ %bb.0:
+; CHECK-BE-NEXT:    vmov.i32 q8, #0x200000
+; CHECK-BE-NEXT:    vrev64.32 q0, q8
+; CHECK-BE-NEXT:    mov pc, lr
 	ret <4 x i32> < i32 2097152, i32 2097152, i32 2097152, i32 2097152 >
 }
 
-define <4 x i32> @v_movQi32d() nounwind {
-;CHECK-LABEL: v_movQi32d:
-;CHECK: vmov.i32 q{{.*}}, #0x20000000
+define arm_aapcs_vfpcc <4 x i32> @v_movQi32d() nounwind {
+; CHECK-LE-LABEL: v_movQi32d:
+; CHECK-LE:       @ %bb.0:
+; CHECK-LE-NEXT:    vmov.i32 q0, #0x20000000
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: v_movQi32d:
+; CHECK-BE:       @ %bb.0:
+; CHECK-BE-NEXT:    vmov.i32 q8, #0x20000000
+; CHECK-BE-NEXT:    vrev64.32 q0, q8
+; CHECK-BE-NEXT:    mov pc, lr
 	ret <4 x i32> < i32 536870912, i32 536870912, i32 536870912, i32 536870912 >
 }
 
-define <4 x i32> @v_movQi32e() nounwind {
-;CHECK-LABEL: v_movQi32e:
-;CHECK: vmov.i32 q{{.*}}, #0x20ff
+define arm_aapcs_vfpcc <4 x i32> @v_movQi32e() nounwind {
+; CHECK-LE-LABEL: v_movQi32e:
+; CHECK-LE:       @ %bb.0:
+; CHECK-LE-NEXT:    vmov.i32 q0, #0x20ff
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: v_movQi32e:
+; CHECK-BE:       @ %bb.0:
+; CHECK-BE-NEXT:    vmov.i32 q8, #0x20ff
+; CHECK-BE-NEXT:    vrev64.32 q0, q8
+; CHECK-BE-NEXT:    mov pc, lr
 	ret <4 x i32> < i32 8447, i32 8447, i32 8447, i32 8447 >
 }
 
-define <4 x i32> @v_movQi32f() nounwind {
-;CHECK-LABEL: v_movQi32f:
-;CHECK: vmov.i32 q{{.*}}, #0x20ffff
+define arm_aapcs_vfpcc <4 x i32> @v_movQi32f() nounwind {
+; CHECK-LE-LABEL: v_movQi32f:
+; CHECK-LE:       @ %bb.0:
+; CHECK-LE-NEXT:    vmov.i32 q0, #0x20ffff
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: v_movQi32f:
+; CHECK-BE:       @ %bb.0:
+; CHECK-BE-NEXT:    vmov.i32 q8, #0x20ffff
+; CHECK-BE-NEXT:    vrev64.32 q0, q8
+; CHECK-BE-NEXT:    mov pc, lr
 	ret <4 x i32> < i32 2162687, i32 2162687, i32 2162687, i32 2162687 >
 }
 
-define <2 x i64> @v_movQi64() nounwind {
-;CHECK-LABEL: v_movQi64:
-;CHECK: vmov.i64 q{{.*}}, #0xff0000ff0000ffff
+define arm_aapcs_vfpcc <2 x i64> @v_movQi64() nounwind {
+; CHECK-LE-LABEL: v_movQi64:
+; CHECK-LE:       @ %bb.0:
+; CHECK-LE-NEXT:    vmov.i64 q0, #0xff0000ff0000ffff
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: v_movQi64:
+; CHECK-BE:       @ %bb.0:
+; CHECK-BE-NEXT:    vmov.i64 q0, #0xffffff0000ff
+; CHECK-BE-NEXT:    mov pc, lr
 	ret <2 x i64> < i64 18374687574888349695, i64 18374687574888349695 >
 }
 
 ; Check for correct assembler printing for immediate values.
 %struct.int8x8_t = type { <8 x i8> }
-define void @vdupn128(%struct.int8x8_t* noalias nocapture sret %agg.result) nounwind {
+define arm_aapcs_vfpcc void @vdupn128(%struct.int8x8_t* noalias nocapture sret %agg.result) nounwind {
+; CHECK-LE-LABEL: vdupn128:
+; CHECK-LE:       @ %bb.0: @ %entry
+; CHECK-LE-NEXT:    vmov.i8 d16, #0x80
+; CHECK-LE-NEXT:    vstr d16, [r0]
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: vdupn128:
+; CHECK-BE:       @ %bb.0: @ %entry
+; CHECK-BE-NEXT:    vmov.i8 d16, #0x80
+; CHECK-BE-NEXT:    vrev64.8 d16, d16
+; CHECK-BE-NEXT:    vstr d16, [r0]
+; CHECK-BE-NEXT:    mov pc, lr
 entry:
-;CHECK-LABEL: vdupn128:
-;CHECK: vmov.i8 d{{.*}}, #0x80
   %0 = getelementptr inbounds %struct.int8x8_t, %struct.int8x8_t* %agg.result, i32 0, i32 0 ; <<8 x i8>*> [#uses=1]
   store <8 x i8> <i8 -128, i8 -128, i8 -128, i8 -128, i8 -128, i8 -128, i8 -128, i8 -128>, <8 x i8>* %0, align 8
   ret void
 }
 
-define void @vdupnneg75(%struct.int8x8_t* noalias nocapture sret %agg.result) nounwind {
+define arm_aapcs_vfpcc void @vdupnneg75(%struct.int8x8_t* noalias nocapture sret %agg.result) nounwind {
+; CHECK-LE-LABEL: vdupnneg75:
+; CHECK-LE:       @ %bb.0: @ %entry
+; CHECK-LE-NEXT:    vmov.i8 d16, #0xb5
+; CHECK-LE-NEXT:    vstr d16, [r0]
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: vdupnneg75:
+; CHECK-BE:       @ %bb.0: @ %entry
+; CHECK-BE-NEXT:    vmov.i8 d16, #0xb5
+; CHECK-BE-NEXT:    vrev64.8 d16, d16
+; CHECK-BE-NEXT:    vstr d16, [r0]
+; CHECK-BE-NEXT:    mov pc, lr
 entry:
-;CHECK-LABEL: vdupnneg75:
-;CHECK: vmov.i8 d{{.*}}, #0xb5
   %0 = getelementptr inbounds %struct.int8x8_t, %struct.int8x8_t* %agg.result, i32 0, i32 0 ; <<8 x i8>*> [#uses=1]
   store <8 x i8> <i8 -75, i8 -75, i8 -75, i8 -75, i8 -75, i8 -75, i8 -75, i8 -75>, <8 x i8>* %0, align 8
   ret void
 }
 
-define <8 x i16> @vmovls8(<8 x i8>* %A) nounwind {
-;CHECK-LABEL: vmovls8:
-;CHECK: vmovl.s8
+define arm_aapcs_vfpcc <8 x i16> @vmovls8(<8 x i8>* %A) nounwind {
+; CHECK-LE-LABEL: vmovls8:
+; CHECK-LE:       @ %bb.0:
+; CHECK-LE-NEXT:    vld1.8 {d16}, [r0:64]
+; CHECK-LE-NEXT:    vmovl.s8 q0, d16
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: vmovls8:
+; CHECK-BE:       @ %bb.0:
+; CHECK-BE-NEXT:    vld1.8 {d16}, [r0:64]
+; CHECK-BE-NEXT:    vmovl.s8 q8, d16
+; CHECK-BE-NEXT:    vrev64.16 q0, q8
+; CHECK-BE-NEXT:    mov pc, lr
 	%tmp1 = load <8 x i8>, <8 x i8>* %A
 	%tmp2 = sext <8 x i8> %tmp1 to <8 x i16>
 	ret <8 x i16> %tmp2
 }
 
-define <4 x i32> @vmovls16(<4 x i16>* %A) nounwind {
-;CHECK-LABEL: vmovls16:
-;CHECK: vmovl.s16
+define arm_aapcs_vfpcc <4 x i32> @vmovls16(<4 x i16>* %A) nounwind {
+; CHECK-LE-LABEL: vmovls16:
+; CHECK-LE:       @ %bb.0:
+; CHECK-LE-NEXT:    vld1.16 {d16}, [r0:64]
+; CHECK-LE-NEXT:    vmovl.s16 q0, d16
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: vmovls16:
+; CHECK-BE:       @ %bb.0:
+; CHECK-BE-NEXT:    vld1.16 {d16}, [r0:64]
+; CHECK-BE-NEXT:    vmovl.s16 q8, d16
+; CHECK-BE-NEXT:    vrev64.32 q0, q8
+; CHECK-BE-NEXT:    mov pc, lr
 	%tmp1 = load <4 x i16>, <4 x i16>* %A
 	%tmp2 = sext <4 x i16> %tmp1 to <4 x i32>
 	ret <4 x i32> %tmp2
 }
 
-define <2 x i64> @vmovls32(<2 x i32>* %A) nounwind {
-;CHECK-LABEL: vmovls32:
-;CHECK: vmovl.s32
+define arm_aapcs_vfpcc <2 x i64> @vmovls32(<2 x i32>* %A) nounwind {
+; CHECK-LABEL: vmovls32:
+; CHECK:       @ %bb.0:
+; CHECK-NEXT:    vld1.32 {d16}, [r0:64]
+; CHECK-NEXT:    vmovl.s32 q0, d16
+; CHECK-NEXT:    mov pc, lr
 	%tmp1 = load <2 x i32>, <2 x i32>* %A
 	%tmp2 = sext <2 x i32> %tmp1 to <2 x i64>
 	ret <2 x i64> %tmp2
 }
 
-define <8 x i16> @vmovlu8(<8 x i8>* %A) nounwind {
-;CHECK-LABEL: vmovlu8:
-;CHECK: vmovl.u8
+define arm_aapcs_vfpcc <8 x i16> @vmovlu8(<8 x i8>* %A) nounwind {
+; CHECK-LE-LABEL: vmovlu8:
+; CHECK-LE:       @ %bb.0:
+; CHECK-LE-NEXT:    vld1.8 {d16}, [r0:64]
+; CHECK-LE-NEXT:    vmovl.u8 q0, d16
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: vmovlu8:
+; CHECK-BE:       @ %bb.0:
+; CHECK-BE-NEXT:    vld1.8 {d16}, [r0:64]
+; CHECK-BE-NEXT:    vmovl.u8 q8, d16
+; CHECK-BE-NEXT:    vrev64.16 q0, q8
+; CHECK-BE-NEXT:    mov pc, lr
 	%tmp1 = load <8 x i8>, <8 x i8>* %A
 	%tmp2 = zext <8 x i8> %tmp1 to <8 x i16>
 	ret <8 x i16> %tmp2
 }
 
-define <4 x i32> @vmovlu16(<4 x i16>* %A) nounwind {
-;CHECK-LABEL: vmovlu16:
-;CHECK: vmovl.u16
+define arm_aapcs_vfpcc <4 x i32> @vmovlu16(<4 x i16>* %A) nounwind {
+; CHECK-LE-LABEL: vmovlu16:
+; CHECK-LE:       @ %bb.0:
+; CHECK-LE-NEXT:    vld1.16 {d16}, [r0:64]
+; CHECK-LE-NEXT:    vmovl.u16 q0, d16
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: vmovlu16:
+; CHECK-BE:       @ %bb.0:
+; CHECK-BE-NEXT:    vld1.16 {d16}, [r0:64]
+; CHECK-BE-NEXT:    vmovl.u16 q8, d16
+; CHECK-BE-NEXT:    vrev64.32 q0, q8
+; CHECK-BE-NEXT:    mov pc, lr
 	%tmp1 = load <4 x i16>, <4 x i16>* %A
 	%tmp2 = zext <4 x i16> %tmp1 to <4 x i32>
 	ret <4 x i32> %tmp2
 }
 
-define <2 x i64> @vmovlu32(<2 x i32>* %A) nounwind {
-;CHECK-LABEL: vmovlu32:
-;CHECK: vmovl.u32
+define arm_aapcs_vfpcc <2 x i64> @vmovlu32(<2 x i32>* %A) nounwind {
+; CHECK-LABEL: vmovlu32:
+; CHECK:       @ %bb.0:
+; CHECK-NEXT:    vld1.32 {d16}, [r0:64]
+; CHECK-NEXT:    vmovl.u32 q0, d16
+; CHECK-NEXT:    mov pc, lr
 	%tmp1 = load <2 x i32>, <2 x i32>* %A
 	%tmp2 = zext <2 x i32> %tmp1 to <2 x i64>
 	ret <2 x i64> %tmp2
 }
 
-define <8 x i8> @vmovni16(<8 x i16>* %A) nounwind {
-;CHECK-LABEL: vmovni16:
-;CHECK: vmovn.i16
+define arm_aapcs_vfpcc <8 x i8> @vmovni16(<8 x i16>* %A) nounwind {
+; CHECK-LE-LABEL: vmovni16:
+; CHECK-LE:       @ %bb.0:
+; CHECK-LE-NEXT:    vld1.64 {d16, d17}, [r0]
+; CHECK-LE-NEXT:    vmovn.i16 d0, q8
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: vmovni16:
+; CHECK-BE:       @ %bb.0:
+; CHECK-BE-NEXT:    vld1.64 {d16, d17}, [r0]
+; CHECK-BE-NEXT:    vrev64.16 q8, q8
+; CHECK-BE-NEXT:    vmovn.i16 d16, q8
+; CHECK-BE-NEXT:    vrev64.8 d0, d16
+; CHECK-BE-NEXT:    mov pc, lr
 	%tmp1 = load <8 x i16>, <8 x i16>* %A
 	%tmp2 = trunc <8 x i16> %tmp1 to <8 x i8>
 	ret <8 x i8> %tmp2
 }
 
-define <4 x i16> @vmovni32(<4 x i32>* %A) nounwind {
-;CHECK-LABEL: vmovni32:
-;CHECK: vmovn.i32
+define arm_aapcs_vfpcc <4 x i16> @vmovni32(<4 x i32>* %A) nounwind {
+; CHECK-LE-LABEL: vmovni32:
+; CHECK-LE:       @ %bb.0:
+; CHECK-LE-NEXT:    vld1.64 {d16, d17}, [r0]
+; CHECK-LE-NEXT:    vmovn.i32 d0, q8
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: vmovni32:
+; CHECK-BE:       @ %bb.0:
+; CHECK-BE-NEXT:    vld1.64 {d16, d17}, [r0]
+; CHECK-BE-NEXT:    vrev64.32 q8, q8
+; CHECK-BE-NEXT:    vmovn.i32 d16, q8
+; CHECK-BE-NEXT:    vrev64.16 d0, d16
+; CHECK-BE-NEXT:    mov pc, lr
 	%tmp1 = load <4 x i32>, <4 x i32>* %A
 	%tmp2 = trunc <4 x i32> %tmp1 to <4 x i16>
 	ret <4 x i16> %tmp2
 }
 
-define <2 x i32> @vmovni64(<2 x i64>* %A) nounwind {
-;CHECK-LABEL: vmovni64:
-;CHECK: vmovn.i64
+define arm_aapcs_vfpcc <2 x i32> @vmovni64(<2 x i64>* %A) nounwind {
+; CHECK-LE-LABEL: vmovni64:
+; CHECK-LE:       @ %bb.0:
+; CHECK-LE-NEXT:    vld1.64 {d16, d17}, [r0]
+; CHECK-LE-NEXT:    vmovn.i64 d0, q8
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: vmovni64:
+; CHECK-BE:       @ %bb.0:
+; CHECK-BE-NEXT:    vld1.64 {d16, d17}, [r0]
+; CHECK-BE-NEXT:    vmovn.i64 d16, q8
+; CHECK-BE-NEXT:    vrev64.32 d0, d16
+; CHECK-BE-NEXT:    mov pc, lr
 	%tmp1 = load <2 x i64>, <2 x i64>* %A
 	%tmp2 = trunc <2 x i64> %tmp1 to <2 x i32>
 	ret <2 x i32> %tmp2
 }
 
-define <8 x i8> @vqmovns16(<8 x i16>* %A) nounwind {
-;CHECK-LABEL: vqmovns16:
-;CHECK: vqmovn.s16
+define arm_aapcs_vfpcc <8 x i8> @vqmovns16(<8 x i16>* %A) nounwind {
+; CHECK-LE-LABEL: vqmovns16:
+; CHECK-LE:       @ %bb.0:
+; CHECK-LE-NEXT:    vld1.64 {d16, d17}, [r0]
+; CHECK-LE-NEXT:    vqmovn.s16 d0, q8
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: vqmovns16:
+; CHECK-BE:       @ %bb.0:
+; CHECK-BE-NEXT:    vld1.64 {d16, d17}, [r0]
+; CHECK-BE-NEXT:    vrev64.16 q8, q8
+; CHECK-BE-NEXT:    vqmovn.s16 d16, q8
+; CHECK-BE-NEXT:    vrev64.8 d0, d16
+; CHECK-BE-NEXT:    mov pc, lr
 	%tmp1 = load <8 x i16>, <8 x i16>* %A
 	%tmp2 = call <8 x i8> @llvm.arm.neon.vqmovns.v8i8(<8 x i16> %tmp1)
 	ret <8 x i8> %tmp2
 }
 
-define <4 x i16> @vqmovns32(<4 x i32>* %A) nounwind {
-;CHECK-LABEL: vqmovns32:
-;CHECK: vqmovn.s32
+define arm_aapcs_vfpcc <4 x i16> @vqmovns32(<4 x i32>* %A) nounwind {
+; CHECK-LE-LABEL: vqmovns32:
+; CHECK-LE:       @ %bb.0:
+; CHECK-LE-NEXT:    vld1.64 {d16, d17}, [r0]
+; CHECK-LE-NEXT:    vqmovn.s32 d0, q8
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: vqmovns32:
+; CHECK-BE:       @ %bb.0:
+; CHECK-BE-NEXT:    vld1.64 {d16, d17}, [r0]
+; CHECK-BE-NEXT:    vrev64.32 q8, q8
+; CHECK-BE-NEXT:    vqmovn.s32 d16, q8
+; CHECK-BE-NEXT:    vrev64.16 d0, d16
+; CHECK-BE-NEXT:    mov pc, lr
 	%tmp1 = load <4 x i32>, <4 x i32>* %A
 	%tmp2 = call <4 x i16> @llvm.arm.neon.vqmovns.v4i16(<4 x i32> %tmp1)
 	ret <4 x i16> %tmp2
 }
 
-define <2 x i32> @vqmovns64(<2 x i64>* %A) nounwind {
-;CHECK-LABEL: vqmovns64:
-;CHECK: vqmovn.s64
+define arm_aapcs_vfpcc <2 x i32> @vqmovns64(<2 x i64>* %A) nounwind {
+; CHECK-LE-LABEL: vqmovns64:
+; CHECK-LE:       @ %bb.0:
+; CHECK-LE-NEXT:    vld1.64 {d16, d17}, [r0]
+; CHECK-LE-NEXT:    vqmovn.s64 d0, q8
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: vqmovns64:
+; CHECK-BE:       @ %bb.0:
+; CHECK-BE-NEXT:    vld1.64 {d16, d17}, [r0]
+; CHECK-BE-NEXT:    vqmovn.s64 d16, q8
+; CHECK-BE-NEXT:    vrev64.32 d0, d16
+; CHECK-BE-NEXT:    mov pc, lr
 	%tmp1 = load <2 x i64>, <2 x i64>* %A
 	%tmp2 = call <2 x i32> @llvm.arm.neon.vqmovns.v2i32(<2 x i64> %tmp1)
 	ret <2 x i32> %tmp2
 }
 
-define <8 x i8> @vqmovnu16(<8 x i16>* %A) nounwind {
-;CHECK-LABEL: vqmovnu16:
-;CHECK: vqmovn.u16
+define arm_aapcs_vfpcc <8 x i8> @vqmovnu16(<8 x i16>* %A) nounwind {
+; CHECK-LE-LABEL: vqmovnu16:
+; CHECK-LE:       @ %bb.0:
+; CHECK-LE-NEXT:    vld1.64 {d16, d17}, [r0]
+; CHECK-LE-NEXT:    vqmovn.u16 d0, q8
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: vqmovnu16:
+; CHECK-BE:       @ %bb.0:
+; CHECK-BE-NEXT:    vld1.64 {d16, d17}, [r0]
+; CHECK-BE-NEXT:    vrev64.16 q8, q8
+; CHECK-BE-NEXT:    vqmovn.u16 d16, q8
+; CHECK-BE-NEXT:    vrev64.8 d0, d16
+; CHECK-BE-NEXT:    mov pc, lr
 	%tmp1 = load <8 x i16>, <8 x i16>* %A
 	%tmp2 = call <8 x i8> @llvm.arm.neon.vqmovnu.v8i8(<8 x i16> %tmp1)
 	ret <8 x i8> %tmp2
 }
 
-define <4 x i16> @vqmovnu32(<4 x i32>* %A) nounwind {
-;CHECK-LABEL: vqmovnu32:
-;CHECK: vqmovn.u32
+define arm_aapcs_vfpcc <4 x i16> @vqmovnu32(<4 x i32>* %A) nounwind {
+; CHECK-LE-LABEL: vqmovnu32:
+; CHECK-LE:       @ %bb.0:
+; CHECK-LE-NEXT:    vld1.64 {d16, d17}, [r0]
+; CHECK-LE-NEXT:    vqmovn.u32 d0, q8
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: vqmovnu32:
+; CHECK-BE:       @ %bb.0:
+; CHECK-BE-NEXT:    vld1.64 {d16, d17}, [r0]
+; CHECK-BE-NEXT:    vrev64.32 q8, q8
+; CHECK-BE-NEXT:    vqmovn.u32 d16, q8
+; CHECK-BE-NEXT:    vrev64.16 d0, d16
+; CHECK-BE-NEXT:    mov pc, lr
 	%tmp1 = load <4 x i32>, <4 x i32>* %A
 	%tmp2 = call <4 x i16> @llvm.arm.neon.vqmovnu.v4i16(<4 x i32> %tmp1)
 	ret <4 x i16> %tmp2
 }
 
-define <2 x i32> @vqmovnu64(<2 x i64>* %A) nounwind {
-;CHECK-LABEL: vqmovnu64:
-;CHECK: vqmovn.u64
+define arm_aapcs_vfpcc <2 x i32> @vqmovnu64(<2 x i64>* %A) nounwind {
+; CHECK-LE-LABEL: vqmovnu64:
+; CHECK-LE:       @ %bb.0:
+; CHECK-LE-NEXT:    vld1.64 {d16, d17}, [r0]
+; CHECK-LE-NEXT:    vqmovn.u64 d0, q8
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: vqmovnu64:
+; CHECK-BE:       @ %bb.0:
+; CHECK-BE-NEXT:    vld1.64 {d16, d17}, [r0]
+; CHECK-BE-NEXT:    vqmovn.u64 d16, q8
+; CHECK-BE-NEXT:    vrev64.32 d0, d16
+; CHECK-BE-NEXT:    mov pc, lr
 	%tmp1 = load <2 x i64>, <2 x i64>* %A
 	%tmp2 = call <2 x i32> @llvm.arm.neon.vqmovnu.v2i32(<2 x i64> %tmp1)
 	ret <2 x i32> %tmp2
 }
 
-define <8 x i8> @vqmovuns16(<8 x i16>* %A) nounwind {
-;CHECK-LABEL: vqmovuns16:
-;CHECK: vqmovun.s16
+define arm_aapcs_vfpcc <8 x i8> @vqmovuns16(<8 x i16>* %A) nounwind {
+; CHECK-LE-LABEL: vqmovuns16:
+; CHECK-LE:       @ %bb.0:
+; CHECK-LE-NEXT:    vld1.64 {d16, d17}, [r0]
+; CHECK-LE-NEXT:    vqmovun.s16 d0, q8
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: vqmovuns16:
+; CHECK-BE:       @ %bb.0:
+; CHECK-BE-NEXT:    vld1.64 {d16, d17}, [r0]
+; CHECK-BE-NEXT:    vrev64.16 q8, q8
+; CHECK-BE-NEXT:    vqmovun.s16 d16, q8
+; CHECK-BE-NEXT:    vrev64.8 d0, d16
+; CHECK-BE-NEXT:    mov pc, lr
 	%tmp1 = load <8 x i16>, <8 x i16>* %A
 	%tmp2 = call <8 x i8> @llvm.arm.neon.vqmovnsu.v8i8(<8 x i16> %tmp1)
 	ret <8 x i8> %tmp2
 }
 
-define <4 x i16> @vqmovuns32(<4 x i32>* %A) nounwind {
-;CHECK-LABEL: vqmovuns32:
-;CHECK: vqmovun.s32
+define arm_aapcs_vfpcc <4 x i16> @vqmovuns32(<4 x i32>* %A) nounwind {
+; CHECK-LE-LABEL: vqmovuns32:
+; CHECK-LE:       @ %bb.0:
+; CHECK-LE-NEXT:    vld1.64 {d16, d17}, [r0]
+; CHECK-LE-NEXT:    vqmovun.s32 d0, q8
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: vqmovuns32:
+; CHECK-BE:       @ %bb.0:
+; CHECK-BE-NEXT:    vld1.64 {d16, d17}, [r0]
+; CHECK-BE-NEXT:    vrev64.32 q8, q8
+; CHECK-BE-NEXT:    vqmovun.s32 d16, q8
+; CHECK-BE-NEXT:    vrev64.16 d0, d16
+; CHECK-BE-NEXT:    mov pc, lr
 	%tmp1 = load <4 x i32>, <4 x i32>* %A
 	%tmp2 = call <4 x i16> @llvm.arm.neon.vqmovnsu.v4i16(<4 x i32> %tmp1)
 	ret <4 x i16> %tmp2
 }
 
-define <2 x i32> @vqmovuns64(<2 x i64>* %A) nounwind {
-;CHECK-LABEL: vqmovuns64:
-;CHECK: vqmovun.s64
+define arm_aapcs_vfpcc <2 x i32> @vqmovuns64(<2 x i64>* %A) nounwind {
+; CHECK-LE-LABEL: vqmovuns64:
+; CHECK-LE:       @ %bb.0:
+; CHECK-LE-NEXT:    vld1.64 {d16, d17}, [r0]
+; CHECK-LE-NEXT:    vqmovun.s64 d0, q8
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: vqmovuns64:
+; CHECK-BE:       @ %bb.0:
+; CHECK-BE-NEXT:    vld1.64 {d16, d17}, [r0]
+; CHECK-BE-NEXT:    vqmovun.s64 d16, q8
+; CHECK-BE-NEXT:    vrev64.32 d0, d16
+; CHECK-BE-NEXT:    mov pc, lr
 	%tmp1 = load <2 x i64>, <2 x i64>* %A
 	%tmp2 = call <2 x i32> @llvm.arm.neon.vqmovnsu.v2i32(<2 x i64> %tmp1)
 	ret <2 x i32> %tmp2
@@ -346,8 +759,22 @@ declare <2 x i32> @llvm.arm.neon.vqmovnsu.v2i32(<2 x i64>) nounwind readnone
 
 ; Truncating vector stores are not supported.  The following should not crash.
 ; Radar 8598391.
-define void @noTruncStore(<4 x i32>* %a, <4 x i16>* %b) nounwind {
-;CHECK: vmovn
+define arm_aapcs_vfpcc void @noTruncStore(<4 x i32>* %a, <4 x i16>* %b) nounwind {
+; CHECK-LE-LABEL: noTruncStore:
+; CHECK-LE:       @ %bb.0:
+; CHECK-LE-NEXT:    vld1.64 {d16, d17}, [r0:128]
+; CHECK-LE-NEXT:    vmovn.i32 d16, q8
+; CHECK-LE-NEXT:    vstr d16, [r1]
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: noTruncStore:
+; CHECK-BE:       @ %bb.0:
+; CHECK-BE-NEXT:    vld1.64 {d16, d17}, [r0:128]
+; CHECK-BE-NEXT:    vrev64.32 q8, q8
+; CHECK-BE-NEXT:    vmovn.i32 d16, q8
+; CHECK-BE-NEXT:    vrev64.16 d16, d16
+; CHECK-BE-NEXT:    vstr d16, [r1]
+; CHECK-BE-NEXT:    mov pc, lr
   %tmp1 = load <4 x i32>, <4 x i32>* %a, align 16
   %tmp2 = trunc <4 x i32> %tmp1 to <4 x i16>
   store <4 x i16> %tmp2, <4 x i16>* %b, align 8
@@ -356,26 +783,61 @@ define void @noTruncStore(<4 x i32>* %a, <4 x i16>* %b) nounwind {
 
 ; Use vmov.f32 to materialize f32 immediate splats
 ; rdar://10437054
-define void @v_mov_v2f32(<2 x float>* nocapture %p) nounwind {
+define arm_aapcs_vfpcc void @v_mov_v2f32(<2 x float>* nocapture %p) nounwind {
+; CHECK-LE-LABEL: v_mov_v2f32:
+; CHECK-LE:       @ %bb.0: @ %entry
+; CHECK-LE-NEXT:    vmov.f32 d16, #-1.600000e+01
+; CHECK-LE-NEXT:    vstr d16, [r0]
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: v_mov_v2f32:
+; CHECK-BE:       @ %bb.0: @ %entry
+; CHECK-BE-NEXT:    vmov.f32 d16, #-1.600000e+01
+; CHECK-BE-NEXT:    vrev64.32 d16, d16
+; CHECK-BE-NEXT:    vstr d16, [r0]
+; CHECK-BE-NEXT:    mov pc, lr
 entry:
-;CHECK-LABEL: v_mov_v2f32:
-;CHECK: vmov.f32 d{{.*}}, #-1.600000e+01
   store <2 x float> <float -1.600000e+01, float -1.600000e+01>, <2 x float>* %p, align 4
   ret void
 }
 
-define void @v_mov_v4f32(<4 x float>* nocapture %p) nounwind {
+define arm_aapcs_vfpcc void @v_mov_v4f32(<4 x float>* nocapture %p) nounwind {
+; CHECK-LE-LABEL: v_mov_v4f32:
+; CHECK-LE:       @ %bb.0: @ %entry
+; CHECK-LE-NEXT:    vmov.f32 q8, #3.100000e+01
+; CHECK-LE-NEXT:    vst1.32 {d16, d17}, [r0]
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: v_mov_v4f32:
+; CHECK-BE:       @ %bb.0: @ %entry
+; CHECK-BE-NEXT:    vmov.f32 q8, #3.100000e+01
+; CHECK-BE-NEXT:    vrev64.32 q8, q8
+; CHECK-BE-NEXT:    vstmia r0, {d16, d17}
+; CHECK-BE-NEXT:    mov pc, lr
 entry:
-;CHECK-LABEL: v_mov_v4f32:
-;CHECK: vmov.f32 q{{.*}}, #3.100000e+01
   store <4 x float> <float 3.100000e+01, float 3.100000e+01, float 3.100000e+01, float 3.100000e+01>, <4 x float>* %p, align 4
   ret void
 }
 
-define void @v_mov_v4f32_undef(<4 x float> * nocapture %p) nounwind {
+define arm_aapcs_vfpcc void @v_mov_v4f32_undef(<4 x float> * nocapture %p) nounwind {
+; CHECK-LE-LABEL: v_mov_v4f32_undef:
+; CHECK-LE:       @ %bb.0: @ %entry
+; CHECK-LE-NEXT:    vmov.f32 q8, #1.000000e+00
+; CHECK-LE-NEXT:    vld1.64 {d18, d19}, [r0]
+; CHECK-LE-NEXT:    vadd.f32 q8, q9, q8
+; CHECK-LE-NEXT:    vst1.64 {d16, d17}, [r0]
+; CHECK-LE-NEXT:    mov pc, lr
+;
+; CHECK-BE-LABEL: v_mov_v4f32_undef:
+; CHECK-BE:       @ %bb.0: @ %entry
+; CHECK-BE-NEXT:    vld1.64 {d16, d17}, [r0]
+; CHECK-BE-NEXT:    vmov.f32 q9, #1.000000e+00
+; CHECK-BE-NEXT:    vrev64.32 q8, q8
+; CHECK-BE-NEXT:    vadd.f32 q8, q8, q9
+; CHECK-BE-NEXT:    vrev64.32 q8, q8
+; CHECK-BE-NEXT:    vst1.64 {d16, d17}, [r0]
+; CHECK-BE-NEXT:    mov pc, lr
 entry:
-;CHECK-LABEL: v_mov_v4f32_undef:
-;CHECK: vmov.f32 q{{.*}}, #1.000000e+00
   %a = load <4 x float> , <4 x float> *%p
   %b = fadd <4 x float> %a, <float undef, float 1.0, float 1.0, float 1.0>
   store <4 x float> %b, <4 x float> *%p
@@ -384,10 +846,29 @@ entry:
 
 ; Vector any_extends must be selected as either vmovl.u or vmovl.s.
 ; rdar://10723651
-define void @any_extend(<4 x i1> %x, <4 x i32> %y) nounwind ssp {
+define arm_aapcs_vfpcc void @any_extend(<4 x i1> %x, <4 x i32> %y) nounwind ssp {
+; CHECK-LE-LABEL: any_extend:
+; CHECK-LE:       @ %bb.0: @ %entry
+; CHECK-LE-NEXT:    vmov.i16 d16, #0x1
+; CHECK-LE-NEXT:    vand d16, d0, d16
+; CHECK-LE-NEXT:    vmovl.u16 q8, d16
+; CHECK-LE-NEXT:    vsub.i32 q8, q8, q1
+; CHECK-LE-NEXT:    vmovn.i32 d16, q8
+; CHECK-LE-NEXT:    vst1.16 {d16}, [r0]
+;
+; CHECK-BE-LABEL: any_extend:
+; CHECK-BE:       @ %bb.0: @ %entry
+; CHECK-BE-NEXT:    vmov.i16 d16, #0x1
+; CHECK-BE-NEXT:    vrev64.32 d17, d0
+; CHECK-BE-NEXT:    vrev64.32 q9, q1
+; CHECK-BE-NEXT:    vrev32.16 d16, d16
+; CHECK-BE-NEXT:    vand d16, d17, d16
+; CHECK-BE-NEXT:    vrev32.16 d16, d16
+; CHECK-BE-NEXT:    vmovl.u16 q8, d16
+; CHECK-BE-NEXT:    vsub.i32 q8, q8, q9
+; CHECK-BE-NEXT:    vmovn.i32 d16, q8
+; CHECK-BE-NEXT:    vst1.16 {d16}, [r0]
 entry:
-;CHECK-LABEL: any_extend:
-;CHECK: vmovl
   %and.i186 = zext <4 x i1> %x to <4 x i32>
   %add.i185 = sub <4 x i32> %and.i186, %y
   %sub.i = sub <4 x i32> %add.i185, zeroinitializer


        


More information about the llvm-commits mailing list