[llvm] r318151 - [X86][AVX] Add scheduling test for vmovntdq 256-bit store
Simon Pilgrim via llvm-commits
llvm-commits at lists.llvm.org
Tue Nov 14 06:03:29 PST 2017
Author: rksimon
Date: Tue Nov 14 06:03:29 2017
New Revision: 318151
URL: http://llvm.org/viewvc/llvm-project?rev=318151&view=rev
Log:
[X86][AVX] Add scheduling test for vmovntdq 256-bit store
Needs to use inline asm, as the execution domain will otherwise be changed to float (vmovntps).
Modified:
llvm/trunk/test/CodeGen/X86/avx-schedule.ll
Modified: llvm/trunk/test/CodeGen/X86/avx-schedule.ll
URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/test/CodeGen/X86/avx-schedule.ll?rev=318151&r1=318150&r2=318151&view=diff
==============================================================================
--- llvm/trunk/test/CodeGen/X86/avx-schedule.ll (original)
+++ llvm/trunk/test/CodeGen/X86/avx-schedule.ll Tue Nov 14 06:03:29 2017
@@ -2807,6 +2807,73 @@ define i32 @test_movmskps(<8 x float> %a
}
declare i32 @llvm.x86.avx.movmsk.ps.256(<8 x float>) nounwind readnone
+define void @test_movntdq(<4 x i64> %a0, <4 x i64> *%a1) {
+; GENERIC-LABEL: test_movntdq:
+; GENERIC: # BB#0:
+; GENERIC-NEXT: #APP
+; GENERIC-NEXT: vmovntdq %ymm0, (%rdi) # sched: [5:1.00]
+; GENERIC-NEXT: #NO_APP
+; GENERIC-NEXT: vzeroupper
+; GENERIC-NEXT: retq # sched: [1:1.00]
+;
+; SANDY-LABEL: test_movntdq:
+; SANDY: # BB#0:
+; SANDY-NEXT: #APP
+; SANDY-NEXT: vmovntdq %ymm0, (%rdi) # sched: [5:1.00]
+; SANDY-NEXT: #NO_APP
+; SANDY-NEXT: vzeroupper
+; SANDY-NEXT: retq # sched: [1:1.00]
+;
+; HASWELL-LABEL: test_movntdq:
+; HASWELL: # BB#0:
+; HASWELL-NEXT: #APP
+; HASWELL-NEXT: vmovntdq %ymm0, (%rdi) # sched: [1:1.00]
+; HASWELL-NEXT: #NO_APP
+; HASWELL-NEXT: vzeroupper # sched: [4:1.00]
+; HASWELL-NEXT: retq # sched: [2:1.00]
+;
+; BROADWELL-LABEL: test_movntdq:
+; BROADWELL: # BB#0:
+; BROADWELL-NEXT: #APP
+; BROADWELL-NEXT: vmovntdq %ymm0, (%rdi) # sched: [1:1.00]
+; BROADWELL-NEXT: #NO_APP
+; BROADWELL-NEXT: vzeroupper # sched: [4:1.00]
+; BROADWELL-NEXT: retq # sched: [7:1.00]
+;
+; SKYLAKE-LABEL: test_movntdq:
+; SKYLAKE: # BB#0:
+; SKYLAKE-NEXT: #APP
+; SKYLAKE-NEXT: vmovntdq %ymm0, (%rdi) # sched: [1:1.00]
+; SKYLAKE-NEXT: #NO_APP
+; SKYLAKE-NEXT: vzeroupper # sched: [4:1.00]
+; SKYLAKE-NEXT: retq # sched: [7:1.00]
+;
+; SKX-LABEL: test_movntdq:
+; SKX: # BB#0:
+; SKX-NEXT: #APP
+; SKX-NEXT: vmovntdq %ymm0, (%rdi) # sched: [1:1.00]
+; SKX-NEXT: #NO_APP
+; SKX-NEXT: vzeroupper # sched: [4:1.00]
+; SKX-NEXT: retq # sched: [7:1.00]
+;
+; BTVER2-LABEL: test_movntdq:
+; BTVER2: # BB#0:
+; BTVER2-NEXT: #APP
+; BTVER2-NEXT: vmovntdq %ymm0, (%rdi) # sched: [3:2.00]
+; BTVER2-NEXT: #NO_APP
+; BTVER2-NEXT: retq # sched: [4:1.00]
+;
+; ZNVER1-LABEL: test_movntdq:
+; ZNVER1: # BB#0:
+; ZNVER1-NEXT: #APP
+; ZNVER1-NEXT: vmovntdq %ymm0, (%rdi) # sched: [1:0.50]
+; ZNVER1-NEXT: #NO_APP
+; ZNVER1-NEXT: vzeroupper # sched: [100:?]
+; ZNVER1-NEXT: retq # sched: [1:0.50]
+ call void asm sideeffect "vmovntdq $0, $1", "x,*m"(<4 x i64> %a0, <4 x i64> *%a1)
+ ret void
+}
+
define <4 x double> @test_movntpd(<4 x double> %a0, <4 x double> *%a1) {
; GENERIC-LABEL: test_movntpd:
; GENERIC: # BB#0:
More information about the llvm-commits mailing list