[llvm] r279402 - [CostModel][X86] Split off float arithmetic cost tests
Simon Pilgrim via llvm-commits
llvm-commits at lists.llvm.org
Sun Aug 21 11:34:48 PDT 2016
Author: rksimon
Date: Sun Aug 21 13:34:47 2016
New Revision: 279402
URL: http://llvm.org/viewvc/llvm-project?rev=279402&view=rev
Log:
[CostModel][X86] Split off float arithmetic cost tests
Added:
llvm/trunk/test/Analysis/CostModel/X86/arith-fp.ll
- copied, changed from r279393, llvm/trunk/test/Analysis/CostModel/X86/arith.ll
Modified:
llvm/trunk/test/Analysis/CostModel/X86/arith.ll
Copied: llvm/trunk/test/Analysis/CostModel/X86/arith-fp.ll (from r279393, llvm/trunk/test/Analysis/CostModel/X86/arith.ll)
URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/test/Analysis/CostModel/X86/arith-fp.ll?p2=llvm/trunk/test/Analysis/CostModel/X86/arith-fp.ll&p1=llvm/trunk/test/Analysis/CostModel/X86/arith.ll&r1=279393&r2=279402&rev=279402&view=diff
==============================================================================
--- llvm/trunk/test/Analysis/CostModel/X86/arith.ll (original)
+++ llvm/trunk/test/Analysis/CostModel/X86/arith-fp.ll Sun Aug 21 13:34:47 2016
@@ -8,261 +8,6 @@
target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-s0:64:64-f80:128:128-n8:16:32:64-S128"
target triple = "x86_64-apple-macosx10.8.0"
-; CHECK-LABEL: 'add'
-define i32 @add(i32 %arg) {
- ; SSSE3: cost of 1 {{.*}} %A = add
- ; SSE42: cost of 1 {{.*}} %A = add
- ; AVX: cost of 1 {{.*}} %A = add
- ; AVX2: cost of 1 {{.*}} %A = add
- ; AVX512: cost of 1 {{.*}} %A = add
- %A = add <4 x i32> undef, undef
- ; SSSE3: cost of 2 {{.*}} %B = add
- ; SSE42: cost of 2 {{.*}} %B = add
- ; AVX: cost of 4 {{.*}} %B = add
- ; AVX2: cost of 1 {{.*}} %B = add
- ; AVX512: cost of 1 {{.*}} %B = add
- %B = add <8 x i32> undef, undef
- ; SSSE3: cost of 1 {{.*}} %C = add
- ; SSE42: cost of 1 {{.*}} %C = add
- ; AVX: cost of 1 {{.*}} %C = add
- ; AVX2: cost of 1 {{.*}} %C = add
- ; AVX512: cost of 1 {{.*}} %C = add
- %C = add <2 x i64> undef, undef
- ; SSSE3: cost of 2 {{.*}} %D = add
- ; SSE42: cost of 2 {{.*}} %D = add
- ; AVX: cost of 4 {{.*}} %D = add
- ; AVX2: cost of 1 {{.*}} %D = add
- ; AVX512: cost of 1 {{.*}} %D = add
- %D = add <4 x i64> undef, undef
- ; SSSE3: cost of 4 {{.*}} %E = add
- ; SSE42: cost of 4 {{.*}} %E = add
- ; AVX: cost of 8 {{.*}} %E = add
- ; AVX2: cost of 2 {{.*}} %E = add
- ; AVX512: cost of 1 {{.*}} %E = add
- %E = add <8 x i64> undef, undef
- ; SSSE3: cost of 4 {{.*}} %F = add
- ; SSE42: cost of 4 {{.*}} %F = add
- ; AVX: cost of 8 {{.*}} %F = add
- ; AVX2: cost of 2 {{.*}} %F = add
- ; AVX512: cost of 1 {{.*}} %F = add
- %F = add <16 x i32> undef, undef
- ret i32 undef
-}
-
-; CHECK-LABEL: 'sub'
-define i32 @sub(i32 %arg) {
- ; SSSE3: cost of 1 {{.*}} %A = sub
- ; SSE42: cost of 1 {{.*}} %A = sub
- ; AVX: cost of 1 {{.*}} %A = sub
- ; AVX2: cost of 1 {{.*}} %A = sub
- ; AVX512: cost of 1 {{.*}} %A = sub
- %A = sub <4 x i32> undef, undef
- ; SSSE3: cost of 2 {{.*}} %B = sub
- ; SSE42: cost of 2 {{.*}} %B = sub
- ; AVX: cost of 4 {{.*}} %B = sub
- ; AVX2: cost of 1 {{.*}} %B = sub
- ; AVX512: cost of 1 {{.*}} %B = sub
- %B = sub <8 x i32> undef, undef
- ; SSSE3: cost of 1 {{.*}} %C = sub
- ; SSE42: cost of 1 {{.*}} %C = sub
- ; AVX: cost of 1 {{.*}} %C = sub
- ; AVX2: cost of 1 {{.*}} %C = sub
- ; AVX512: cost of 1 {{.*}} %C = sub
- %C = sub <2 x i64> undef, undef
- ; SSSE3: cost of 2 {{.*}} %D = sub
- ; SSE42: cost of 2 {{.*}} %D = sub
- ; AVX: cost of 4 {{.*}} %D = sub
- ; AVX2: cost of 1 {{.*}} %D = sub
- ; AVX512: cost of 1 {{.*}} %D = sub
- %D = sub <4 x i64> undef, undef
- ; SSSE3: cost of 4 {{.*}} %E = sub
- ; SSE42: cost of 4 {{.*}} %E = sub
- ; AVX: cost of 8 {{.*}} %E = sub
- ; AVX2: cost of 2 {{.*}} %E = sub
- ; AVX512: cost of 1 {{.*}} %E = sub
- %E = sub <8 x i64> undef, undef
- ; SSSE3: cost of 4 {{.*}} %F = sub
- ; SSE42: cost of 4 {{.*}} %F = sub
- ; AVX: cost of 8 {{.*}} %F = sub
- ; AVX2: cost of 2 {{.*}} %F = sub
- ; AVX512: cost of 1 {{.*}} %F = sub
- %F = sub <16 x i32> undef, undef
- ret i32 undef
-}
-
-; CHECK-LABEL: 'or'
-define i32 @or(i32 %arg) {
- ; SSSE3: cost of 1 {{.*}} %A = or
- ; SSE42: cost of 1 {{.*}} %A = or
- ; AVX: cost of 1 {{.*}} %A = or
- ; AVX2: cost of 1 {{.*}} %A = or
- ; AVX512: cost of 1 {{.*}} %A = or
- %A = or <4 x i32> undef, undef
- ; SSSE3: cost of 2 {{.*}} %B = or
- ; SSE42: cost of 2 {{.*}} %B = or
- ; AVX: cost of 1 {{.*}} %B = or
- ; AVX2: cost of 1 {{.*}} %B = or
- ; AVX512: cost of 1 {{.*}} %B = or
- %B = or <8 x i32> undef, undef
- ; SSSE3: cost of 1 {{.*}} %C = or
- ; SSE42: cost of 1 {{.*}} %C = or
- ; AVX: cost of 1 {{.*}} %C = or
- ; AVX2: cost of 1 {{.*}} %C = or
- ; AVX512: cost of 1 {{.*}} %C = or
- %C = or <2 x i64> undef, undef
- ; SSSE3: cost of 2 {{.*}} %D = or
- ; SSE42: cost of 2 {{.*}} %D = or
- ; AVX: cost of 1 {{.*}} %D = or
- ; AVX2: cost of 1 {{.*}} %D = or
- ; AVX512: cost of 1 {{.*}} %D = or
- %D = or <4 x i64> undef, undef
- ; SSSE3: cost of 4 {{.*}} %E = or
- ; SSE42: cost of 4 {{.*}} %E = or
- ; AVX: cost of 2 {{.*}} %E = or
- ; AVX2: cost of 2 {{.*}} %E = or
- ; AVX512: cost of 1 {{.*}} %E = or
- %E = or <8 x i64> undef, undef
- ; SSSE3: cost of 4 {{.*}} %F = or
- ; SSE42: cost of 4 {{.*}} %F = or
- ; AVX: cost of 2 {{.*}} %F = or
- ; AVX2: cost of 2 {{.*}} %F = or
- ; AVX512: cost of 1 {{.*}} %F = or
- %F = or <16 x i32> undef, undef
- ret i32 undef
-}
-
-; CHECK-LABEL: 'xor'
-define i32 @xor(i32 %arg) {
- ; SSSE3: cost of 1 {{.*}} %A = xor
- ; SSE42: cost of 1 {{.*}} %A = xor
- ; AVX: cost of 1 {{.*}} %A = xor
- ; AVX2: cost of 1 {{.*}} %A = xor
- ; AVX512: cost of 1 {{.*}} %A = xor
- %A = xor <4 x i32> undef, undef
- ; SSSE3: cost of 2 {{.*}} %B = xor
- ; SSE42: cost of 2 {{.*}} %B = xor
- ; AVX: cost of 1 {{.*}} %B = xor
- ; AVX2: cost of 1 {{.*}} %B = xor
- ; AVX512: cost of 1 {{.*}} %B = xor
- %B = xor <8 x i32> undef, undef
- ; SSSE3: cost of 1 {{.*}} %C = xor
- ; SSE42: cost of 1 {{.*}} %C = xor
- ; AVX: cost of 1 {{.*}} %C = xor
- ; AVX2: cost of 1 {{.*}} %C = xor
- ; AVX512: cost of 1 {{.*}} %C = xor
- %C = xor <2 x i64> undef, undef
- ; SSSE3: cost of 2 {{.*}} %D = xor
- ; SSE42: cost of 2 {{.*}} %D = xor
- ; AVX: cost of 1 {{.*}} %D = xor
- ; AVX2: cost of 1 {{.*}} %D = xor
- ; AVX512: cost of 1 {{.*}} %D = xor
- %D = xor <4 x i64> undef, undef
- ; SSSE3: cost of 4 {{.*}} %E = xor
- ; SSE42: cost of 4 {{.*}} %E = xor
- ; AVX: cost of 2 {{.*}} %E = xor
- ; AVX2: cost of 2 {{.*}} %E = xor
- ; AVX512: cost of 1 {{.*}} %E = xor
- %E = xor <8 x i64> undef, undef
- ; SSSE3: cost of 4 {{.*}} %F = xor
- ; SSE42: cost of 4 {{.*}} %F = xor
- ; AVX: cost of 2 {{.*}} %F = xor
- ; AVX2: cost of 2 {{.*}} %F = xor
- ; AVX512: cost of 1 {{.*}} %F = xor
- %F = xor <16 x i32> undef, undef
- ret i32 undef
-}
-
-; CHECK-LABEL: 'and'
-define i32 @and(i32 %arg) {
- ; SSSE3: cost of 1 {{.*}} %A = and
- ; SSE42: cost of 1 {{.*}} %A = and
- ; AVX: cost of 1 {{.*}} %A = and
- ; AVX2: cost of 1 {{.*}} %A = and
- ; AVX512: cost of 1 {{.*}} %A = and
- %A = and <4 x i32> undef, undef
- ; SSSE3: cost of 2 {{.*}} %B = and
- ; SSE42: cost of 2 {{.*}} %B = and
- ; AVX: cost of 1 {{.*}} %B = and
- ; AVX2: cost of 1 {{.*}} %B = and
- ; AVX512: cost of 1 {{.*}} %B = and
- %B = and <8 x i32> undef, undef
- ; SSSE3: cost of 1 {{.*}} %C = and
- ; SSE42: cost of 1 {{.*}} %C = and
- ; AVX: cost of 1 {{.*}} %C = and
- ; AVX2: cost of 1 {{.*}} %C = and
- ; AVX512: cost of 1 {{.*}} %C = and
- %C = and <2 x i64> undef, undef
- ; SSSE3: cost of 2 {{.*}} %D = and
- ; SSE42: cost of 2 {{.*}} %D = and
- ; AVX: cost of 1 {{.*}} %D = and
- ; AVX2: cost of 1 {{.*}} %D = and
- ; AVX512: cost of 1 {{.*}} %D = and
- %D = and <4 x i64> undef, undef
- ; SSSE3: cost of 4 {{.*}} %E = and
- ; SSE42: cost of 4 {{.*}} %E = and
- ; AVX: cost of 2 {{.*}} %E = and
- ; AVX2: cost of 2 {{.*}} %E = and
- ; AVX512: cost of 1 {{.*}} %E = and
- %E = and <8 x i64> undef, undef
- ; SSSE3: cost of 4 {{.*}} %F = and
- ; SSE42: cost of 4 {{.*}} %F = and
- ; AVX: cost of 2 {{.*}} %F = and
- ; AVX2: cost of 2 {{.*}} %F = and
- ; AVX512: cost of 1 {{.*}} %F = and
- %F = and <16 x i32> undef, undef
- ret i32 undef
-}
-
-; CHECK-LABEL: 'mul'
-define void @mul() {
- ; A <2 x i32> gets expanded to a <2 x i64> vector.
- ; A <2 x i64> vector multiply is implemented using
- ; 3 PMULUDQ and 2 PADDS and 4 shifts.
- ; SSSE3: cost of 9 {{.*}} %A0 = mul
- ; SSE42: cost of 9 {{.*}} %A0 = mul
- ; AVX: cost of 9 {{.*}} %A0 = mul
- ; AVX2: cost of 9 {{.*}} %A0 = mul
- ; AVX512: cost of 9 {{.*}} %A0 = mul
- %A0 = mul <2 x i32> undef, undef
- ; SSSE3: cost of 6 {{.*}} %A1 = mul
- ; SSE42: cost of 1 {{.*}} %A1 = mul
- ; AVX: cost of 1 {{.*}} %A1 = mul
- ; AVX2: cost of 1 {{.*}} %A1 = mul
- ; AVX512: cost of 1 {{.*}} %A1 = mul
- %A1 = mul <4 x i32> undef, undef
- ; SSSE3: cost of 9 {{.*}} %A2 = mul
- ; SSE42: cost of 9 {{.*}} %A2 = mul
- ; AVX: cost of 9 {{.*}} %A2 = mul
- ; AVX2: cost of 9 {{.*}} %A2 = mul
- ; AVX512: cost of 9 {{.*}} %A2 = mul
- %A2 = mul <2 x i64> undef, undef
- ; SSSE3: cost of 18 {{.*}} %A3 = mul
- ; SSE42: cost of 18 {{.*}} %A3 = mul
- ; AVX: cost of 18 {{.*}} %A3 = mul
- ; AVX2: cost of 9 {{.*}} %A3 = mul
- ; AVX512: cost of 9 {{.*}} %A3 = mul
- %A3 = mul <4 x i64> undef, undef
- ; SSSE3: cost of 12 {{.*}} %A4 = mul
- ; SSE42: cost of 2 {{.*}} %A4 = mul
- ; AVX: cost of 4 {{.*}} %A4 = mul
- ; AVX2: cost of 1 {{.*}} %A4 = mul
- ; AVX512: cost of 1 {{.*}} %A4 = mul
- %A4 = mul <8 x i32> undef, undef
- ; SSSE3: cost of 24 {{.*}} %A5 = mul
- ; SSE42: cost of 4 {{.*}} %A5 = mul
- ; AVX: cost of 8 {{.*}} %A5 = mul
- ; AVX2: cost of 2 {{.*}} %A5 = mul
- ; AVX512: cost of 1 {{.*}} %A5 = mul
- %A5 = mul <16 x i32> undef, undef
- ; SSSE3: cost of 36 {{.*}} %A6 = mul
- ; SSE42: cost of 36 {{.*}} %A6 = mul
- ; AVX: cost of 36 {{.*}} %A6 = mul
- ; AVX2: cost of 18 {{.*}} %A6 = mul
- ; AVX512: cost of 2 {{.*}} %A6 = mul
- %A6 = mul <8 x i64> undef, undef
- ret void
-}
-
; CHECK-LABEL: 'fadd'
define i32 @fadd(i32 %arg) {
; SSSE3: cost of 2 {{.*}} %A = fadd
@@ -477,83 +222,3 @@ define i32 @frem(i32 %arg) {
ret i32 undef
}
-
-; CHECK-LABEL: 'shift'
-define void @shift() {
- ; SSSE3: cost of 10 {{.*}} %A0 = shl
- ; SSE42: cost of 10 {{.*}} %A0 = shl
- ; AVX: cost of 10 {{.*}} %A0 = shl
- ; AVX2: cost of 1 {{.*}} %A0 = shl
- ; AVX512: cost of 1 {{.*}} %A0 = shl
- %A0 = shl <4 x i32> undef, undef
- ; SSSE3: cost of 4 {{.*}} %A1 = shl
- ; SSE42: cost of 4 {{.*}} %A1 = shl
- ; AVX: cost of 4 {{.*}} %A1 = shl
- ; AVX2: cost of 1 {{.*}} %A1 = shl
- ; AVX512: cost of 1 {{.*}} %A1 = shl
- %A1 = shl <2 x i64> undef, undef
- ; SSSE3: cost of 20 {{.*}} %A2 = shl
- ; SSE42: cost of 20 {{.*}} %A2 = shl
- ; AVX: cost of 20 {{.*}} %A2 = shl
- ; AVX2: cost of 1 {{.*}} %A2 = shl
- ; AVX512: cost of 1 {{.*}} %A2 = shl
- %A2 = shl <8 x i32> undef, undef
- ; SSSE3: cost of 8 {{.*}} %A3 = shl
- ; SSE42: cost of 8 {{.*}} %A3 = shl
- ; AVX: cost of 8 {{.*}} %A3 = shl
- ; AVX2: cost of 1 {{.*}} %A3 = shl
- ; AVX512: cost of 1 {{.*}} %A3 = shl
- %A3 = shl <4 x i64> undef, undef
-
- ; SSSE3: cost of 16 {{.*}} %B0 = lshr
- ; SSE42: cost of 16 {{.*}} %B0 = lshr
- ; AVX: cost of 16 {{.*}} %B0 = lshr
- ; AVX2: cost of 1 {{.*}} %B0 = lshr
- ; AVX512: cost of 1 {{.*}} %B0 = lshr
- %B0 = lshr <4 x i32> undef, undef
- ; SSSE3: cost of 4 {{.*}} %B1 = lshr
- ; SSE42: cost of 4 {{.*}} %B1 = lshr
- ; AVX: cost of 4 {{.*}} %B1 = lshr
- ; AVX2: cost of 1 {{.*}} %B1 = lshr
- ; AVX512: cost of 1 {{.*}} %B1 = lshr
- %B1 = lshr <2 x i64> undef, undef
- ; SSSE3: cost of 32 {{.*}} %B2 = lshr
- ; SSE42: cost of 32 {{.*}} %B2 = lshr
- ; AVX: cost of 32 {{.*}} %B2 = lshr
- ; AVX2: cost of 1 {{.*}} %B2 = lshr
- ; AVX512: cost of 1 {{.*}} %B2 = lshr
- %B2 = lshr <8 x i32> undef, undef
- ; SSSE3: cost of 8 {{.*}} %B3 = lshr
- ; SSE42: cost of 8 {{.*}} %B3 = lshr
- ; AVX: cost of 8 {{.*}} %B3 = lshr
- ; AVX2: cost of 1 {{.*}} %B3 = lshr
- ; AVX512: cost of 1 {{.*}} %B3 = lshr
- %B3 = lshr <4 x i64> undef, undef
-
- ; SSSE3: cost of 16 {{.*}} %C0 = ashr
- ; SSE42: cost of 16 {{.*}} %C0 = ashr
- ; AVX: cost of 16 {{.*}} %C0 = ashr
- ; AVX2: cost of 1 {{.*}} %C0 = ashr
- ; AVX512: cost of 1 {{.*}} %C0 = ashr
- %C0 = ashr <4 x i32> undef, undef
- ; SSSE3: cost of 12 {{.*}} %C1 = ashr
- ; SSE42: cost of 12 {{.*}} %C1 = ashr
- ; AVX: cost of 12 {{.*}} %C1 = ashr
- ; AVX2: cost of 4 {{.*}} %C1 = ashr
- ; AVX512: cost of 4 {{.*}} %C1 = ashr
- %C1 = ashr <2 x i64> undef, undef
- ; SSSE3: cost of 32 {{.*}} %C2 = ashr
- ; SSE42: cost of 32 {{.*}} %C2 = ashr
- ; AVX: cost of 32 {{.*}} %C2 = ashr
- ; AVX2: cost of 1 {{.*}} %C2 = ashr
- ; AVX512: cost of 1 {{.*}} %C2 = ashr
- %C2 = ashr <8 x i32> undef, undef
- ; SSSE3: cost of 24 {{.*}} %C3 = ashr
- ; SSE42: cost of 24 {{.*}} %C3 = ashr
- ; AVX: cost of 24 {{.*}} %C3 = ashr
- ; AVX2: cost of 4 {{.*}} %C3 = ashr
- ; AVX512: cost of 4 {{.*}} %C3 = ashr
- %C3 = ashr <4 x i64> undef, undef
-
- ret void
-}
Modified: llvm/trunk/test/Analysis/CostModel/X86/arith.ll
URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/test/Analysis/CostModel/X86/arith.ll?rev=279402&r1=279401&r2=279402&view=diff
==============================================================================
--- llvm/trunk/test/Analysis/CostModel/X86/arith.ll (original)
+++ llvm/trunk/test/Analysis/CostModel/X86/arith.ll Sun Aug 21 13:34:47 2016
@@ -263,221 +263,6 @@ define void @mul() {
ret void
}
-; CHECK-LABEL: 'fadd'
-define i32 @fadd(i32 %arg) {
- ; SSSE3: cost of 2 {{.*}} %A = fadd
- ; SSE42: cost of 2 {{.*}} %A = fadd
- ; AVX: cost of 2 {{.*}} %A = fadd
- ; AVX2: cost of 2 {{.*}} %A = fadd
- ; AVX512: cost of 2 {{.*}} %A = fadd
- %A = fadd <4 x float> undef, undef
- ; SSSE3: cost of 4 {{.*}} %B = fadd
- ; SSE42: cost of 4 {{.*}} %B = fadd
- ; AVX: cost of 2 {{.*}} %B = fadd
- ; AVX2: cost of 2 {{.*}} %B = fadd
- ; AVX512: cost of 2 {{.*}} %B = fadd
- %B = fadd <8 x float> undef, undef
- ; SSSE3: cost of 8 {{.*}} %C = fadd
- ; SSE42: cost of 8 {{.*}} %C = fadd
- ; AVX: cost of 4 {{.*}} %C = fadd
- ; AVX2: cost of 4 {{.*}} %C = fadd
- ; AVX512: cost of 2 {{.*}} %C = fadd
- %C = fadd <16 x float> undef, undef
-
- ; SSSE3: cost of 2 {{.*}} %D = fadd
- ; SSE42: cost of 2 {{.*}} %D = fadd
- ; AVX: cost of 2 {{.*}} %D = fadd
- ; AVX2: cost of 2 {{.*}} %D = fadd
- ; AVX512: cost of 2 {{.*}} %D = fadd
- %D = fadd <2 x double> undef, undef
- ; SSSE3: cost of 4 {{.*}} %E = fadd
- ; SSE42: cost of 4 {{.*}} %E = fadd
- ; AVX: cost of 2 {{.*}} %E = fadd
- ; AVX2: cost of 2 {{.*}} %E = fadd
- ; AVX512: cost of 2 {{.*}} %E = fadd
- %E = fadd <4 x double> undef, undef
- ; SSSE3: cost of 8 {{.*}} %F = fadd
- ; SSE42: cost of 8 {{.*}} %F = fadd
- ; AVX: cost of 4 {{.*}} %F = fadd
- ; AVX2: cost of 4 {{.*}} %F = fadd
- ; AVX512: cost of 2 {{.*}} %F = fadd
- %F = fadd <8 x double> undef, undef
-
- ret i32 undef
-}
-
-; CHECK-LABEL: 'fsub'
-define i32 @fsub(i32 %arg) {
- ; SSSE3: cost of 2 {{.*}} %A = fsub
- ; SSE42: cost of 2 {{.*}} %A = fsub
- ; AVX: cost of 2 {{.*}} %A = fsub
- ; AVX2: cost of 2 {{.*}} %A = fsub
- ; AVX512: cost of 2 {{.*}} %A = fsub
- %A = fsub <4 x float> undef, undef
- ; SSSE3: cost of 4 {{.*}} %B = fsub
- ; SSE42: cost of 4 {{.*}} %B = fsub
- ; AVX: cost of 2 {{.*}} %B = fsub
- ; AVX2: cost of 2 {{.*}} %B = fsub
- ; AVX512: cost of 2 {{.*}} %B = fsub
- %B = fsub <8 x float> undef, undef
- ; SSSE3: cost of 8 {{.*}} %C = fsub
- ; SSE42: cost of 8 {{.*}} %C = fsub
- ; AVX: cost of 4 {{.*}} %C = fsub
- ; AVX2: cost of 4 {{.*}} %C = fsub
- ; AVX512: cost of 2 {{.*}} %C = fsub
- %C = fsub <16 x float> undef, undef
-
- ; SSSE3: cost of 2 {{.*}} %D = fsub
- ; SSE42: cost of 2 {{.*}} %D = fsub
- ; AVX: cost of 2 {{.*}} %D = fsub
- ; AVX2: cost of 2 {{.*}} %D = fsub
- ; AVX512: cost of 2 {{.*}} %D = fsub
- %D = fsub <2 x double> undef, undef
- ; SSSE3: cost of 4 {{.*}} %E = fsub
- ; SSE42: cost of 4 {{.*}} %E = fsub
- ; AVX: cost of 2 {{.*}} %E = fsub
- ; AVX2: cost of 2 {{.*}} %E = fsub
- ; AVX512: cost of 2 {{.*}} %E = fsub
- %E = fsub <4 x double> undef, undef
- ; SSSE3: cost of 8 {{.*}} %F = fsub
- ; SSE42: cost of 8 {{.*}} %F = fsub
- ; AVX: cost of 4 {{.*}} %F = fsub
- ; AVX2: cost of 4 {{.*}} %F = fsub
- ; AVX512: cost of 2 {{.*}} %F = fsub
- %F = fsub <8 x double> undef, undef
-
- ret i32 undef
-}
-
-; CHECK-LABEL: 'fmul'
-define i32 @fmul(i32 %arg) {
- ; SSSE3: cost of 2 {{.*}} %A = fmul
- ; SSE42: cost of 2 {{.*}} %A = fmul
- ; AVX: cost of 2 {{.*}} %A = fmul
- ; AVX2: cost of 2 {{.*}} %A = fmul
- ; AVX512: cost of 2 {{.*}} %A = fmul
- %A = fmul <4 x float> undef, undef
- ; SSSE3: cost of 4 {{.*}} %B = fmul
- ; SSE42: cost of 4 {{.*}} %B = fmul
- ; AVX: cost of 2 {{.*}} %B = fmul
- ; AVX2: cost of 2 {{.*}} %B = fmul
- ; AVX512: cost of 2 {{.*}} %B = fmul
- %B = fmul <8 x float> undef, undef
- ; SSSE3: cost of 8 {{.*}} %C = fmul
- ; SSE42: cost of 8 {{.*}} %C = fmul
- ; AVX: cost of 4 {{.*}} %C = fmul
- ; AVX2: cost of 4 {{.*}} %C = fmul
- ; AVX512: cost of 2 {{.*}} %C = fmul
- %C = fmul <16 x float> undef, undef
-
- ; SSSE3: cost of 2 {{.*}} %D = fmul
- ; SSE42: cost of 2 {{.*}} %D = fmul
- ; AVX: cost of 2 {{.*}} %D = fmul
- ; AVX2: cost of 2 {{.*}} %D = fmul
- ; AVX512: cost of 2 {{.*}} %D = fmul
- %D = fmul <2 x double> undef, undef
- ; SSSE3: cost of 4 {{.*}} %E = fmul
- ; SSE42: cost of 4 {{.*}} %E = fmul
- ; AVX: cost of 2 {{.*}} %E = fmul
- ; AVX2: cost of 2 {{.*}} %E = fmul
- ; AVX512: cost of 2 {{.*}} %E = fmul
- %E = fmul <4 x double> undef, undef
- ; SSSE3: cost of 8 {{.*}} %F = fmul
- ; SSE42: cost of 8 {{.*}} %F = fmul
- ; AVX: cost of 4 {{.*}} %F = fmul
- ; AVX2: cost of 4 {{.*}} %F = fmul
- ; AVX512: cost of 2 {{.*}} %F = fmul
- %F = fmul <8 x double> undef, undef
-
- ret i32 undef
-}
-
-; CHECK-LABEL: 'fdiv'
-define i32 @fdiv(i32 %arg) {
- ; SSSE3: cost of 2 {{.*}} %A = fdiv
- ; SSE42: cost of 2 {{.*}} %A = fdiv
- ; AVX: cost of 2 {{.*}} %A = fdiv
- ; AVX2: cost of 2 {{.*}} %A = fdiv
- ; AVX512: cost of 2 {{.*}} %A = fdiv
- %A = fdiv <4 x float> undef, undef
- ; SSSE3: cost of 4 {{.*}} %B = fdiv
- ; SSE42: cost of 4 {{.*}} %B = fdiv
- ; AVX: cost of 2 {{.*}} %B = fdiv
- ; AVX2: cost of 2 {{.*}} %B = fdiv
- ; AVX512: cost of 2 {{.*}} %B = fdiv
- %B = fdiv <8 x float> undef, undef
- ; SSSE3: cost of 8 {{.*}} %C = fdiv
- ; SSE42: cost of 8 {{.*}} %C = fdiv
- ; AVX: cost of 4 {{.*}} %C = fdiv
- ; AVX2: cost of 4 {{.*}} %C = fdiv
- ; AVX512: cost of 2 {{.*}} %C = fdiv
- %C = fdiv <16 x float> undef, undef
-
- ; SSSE3: cost of 2 {{.*}} %D = fdiv
- ; SSE42: cost of 2 {{.*}} %D = fdiv
- ; AVX: cost of 2 {{.*}} %D = fdiv
- ; AVX2: cost of 2 {{.*}} %D = fdiv
- ; AVX512: cost of 2 {{.*}} %D = fdiv
- %D = fdiv <2 x double> undef, undef
- ; SSSE3: cost of 4 {{.*}} %E = fdiv
- ; SSE42: cost of 4 {{.*}} %E = fdiv
- ; AVX: cost of 2 {{.*}} %E = fdiv
- ; AVX2: cost of 2 {{.*}} %E = fdiv
- ; AVX512: cost of 2 {{.*}} %E = fdiv
- %E = fdiv <4 x double> undef, undef
- ; SSSE3: cost of 8 {{.*}} %F = fdiv
- ; SSE42: cost of 8 {{.*}} %F = fdiv
- ; AVX: cost of 4 {{.*}} %F = fdiv
- ; AVX2: cost of 4 {{.*}} %F = fdiv
- ; AVX512: cost of 2 {{.*}} %F = fdiv
- %F = fdiv <8 x double> undef, undef
-
- ret i32 undef
-}
-
-; CHECK-LABEL: 'frem'
-define i32 @frem(i32 %arg) {
- ; SSSE3: cost of 14 {{.*}} %A = frem
- ; SSE42: cost of 14 {{.*}} %A = frem
- ; AVX: cost of 14 {{.*}} %A = frem
- ; AVX2: cost of 14 {{.*}} %A = frem
- ; AVX512: cost of 14 {{.*}} %A = frem
- %A = frem <4 x float> undef, undef
- ; SSSE3: cost of 28 {{.*}} %B = frem
- ; SSE42: cost of 28 {{.*}} %B = frem
- ; AVX: cost of 30 {{.*}} %B = frem
- ; AVX2: cost of 30 {{.*}} %B = frem
- ; AVX512: cost of 30 {{.*}} %B = frem
- %B = frem <8 x float> undef, undef
- ; SSSE3: cost of 56 {{.*}} %C = frem
- ; SSE42: cost of 56 {{.*}} %C = frem
- ; AVX: cost of 60 {{.*}} %C = frem
- ; AVX2: cost of 60 {{.*}} %C = frem
- ; AVX512: cost of 62 {{.*}} %C = frem
- %C = frem <16 x float> undef, undef
-
- ; SSSE3: cost of 6 {{.*}} %D = frem
- ; SSE42: cost of 6 {{.*}} %D = frem
- ; AVX: cost of 6 {{.*}} %D = frem
- ; AVX2: cost of 6 {{.*}} %D = frem
- ; AVX512: cost of 6 {{.*}} %D = frem
- %D = frem <2 x double> undef, undef
- ; SSSE3: cost of 12 {{.*}} %E = frem
- ; SSE42: cost of 12 {{.*}} %E = frem
- ; AVX: cost of 14 {{.*}} %E = frem
- ; AVX2: cost of 14 {{.*}} %E = frem
- ; AVX512: cost of 14 {{.*}} %E = frem
- %E = frem <4 x double> undef, undef
- ; SSSE3: cost of 24 {{.*}} %F = frem
- ; SSE42: cost of 24 {{.*}} %F = frem
- ; AVX: cost of 28 {{.*}} %F = frem
- ; AVX2: cost of 28 {{.*}} %F = frem
- ; AVX512: cost of 30 {{.*}} %F = frem
- %F = frem <8 x double> undef, undef
-
- ret i32 undef
-}
-
; CHECK-LABEL: 'shift'
define void @shift() {
; SSSE3: cost of 10 {{.*}} %A0 = shl
More information about the llvm-commits
mailing list