[llvm] r336313 - [Power9] Add tests for passing float128 in VSX reg for non-homogenous aggregates

Lei Huang via llvm-commits llvm-commits at lists.llvm.org
Wed Jul 4 23:29:29 PDT 2018


Author: lei
Date: Wed Jul  4 23:29:28 2018
New Revision: 336313

URL: http://llvm.org/viewvc/llvm-project?rev=336313&view=rev
Log:
[Power9] Add tests for passing float128 in VSX reg for non-homogenous aggregates

Add missing testcase for rL336310

Added:
    llvm/trunk/test/CodeGen/PowerPC/f128-aggregates.ll

Added: llvm/trunk/test/CodeGen/PowerPC/f128-aggregates.ll
URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/test/CodeGen/PowerPC/f128-aggregates.ll?rev=336313&view=auto
==============================================================================
--- llvm/trunk/test/CodeGen/PowerPC/f128-aggregates.ll (added)
+++ llvm/trunk/test/CodeGen/PowerPC/f128-aggregates.ll Wed Jul  4 23:29:28 2018
@@ -0,0 +1,206 @@
+; RUN: llc -mcpu=pwr9 -mtriple=powerpc64le-unknown-unknown \
+; RUN:   -enable-ppc-quad-precision -verify-machineinstrs < %s | FileCheck %s
+; RUN: llc -mcpu=pwr9 -mtriple=powerpc64-unknown-unknown \
+; RUN:   -enable-ppc-quad-precision -verify-machineinstrs < %s | FileCheck -check-prefix=CHECK-BE %s
+
+%struct.MixedC = type { i32, %struct.SA, float, [12 x i8] }
+%struct.SA = type { double, fp128, <4 x float> }
+
+; Function Attrs: norecurse nounwind readnone
+define fp128 @testMixedAggregate([3 x i128] %a.coerce) {
+; CHECK-LABEL: testMixedAggregate:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    mtvsrdd 34, 8, 7
+; CHECK-NEXT:    blr
+
+; CHECK-BE-LABEL: testMixedAggregate:
+; CHECK-BE:       mtvsrdd 34, 8, 7
+; CHECK-BE-NEXT:  blr
+entry:
+  %a.coerce.fca.2.extract = extractvalue [3 x i128] %a.coerce, 2
+  %0 = bitcast i128 %a.coerce.fca.2.extract to fp128
+  ret fp128 %0
+}
+
+; Function Attrs: norecurse nounwind readnone
+define fp128 @testMixedAggregate_02([4 x i128] %a.coerce) {
+; CHECK-LABEL: testMixedAggregate_02:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    mtvsrdd 34, 6, 5
+; CHECK-NEXT:    blr
+
+; CHECK-BE-LABEL: testMixedAggregate_02:
+; CHECK-BE:       mtvsrdd 34, 6, 5
+; CHECK-BE-NEXT:  blr
+entry:
+  %a.coerce.fca.1.extract = extractvalue [4 x i128] %a.coerce, 1
+  %0 = bitcast i128 %a.coerce.fca.1.extract to fp128
+  ret fp128 %0
+}
+
+; Function Attrs: norecurse nounwind readnone
+define fp128 @testMixedAggregate_03([4 x i128] %sa.coerce) {
+; CHECK-LABEL: testMixedAggregate_03:
+; CHECK:       # %bb.0: # %entry
+; CHECK-DAG:     mtvsrwa 34, 3
+; CHECK-DAG:     mtvsrdd 35, 6, 5
+; CHECK:         mtvsrd 36, 10
+; CHECK:         xscvsdqp 2, 2
+; CHECK-DAG:     xscvsdqp [[REG:[0-9]+]], 4
+; CHECK-DAG:     xsaddqp 2, 3, 2
+; CHECK:         xsaddqp 2, 2, [[REG]]
+; CHECK-NEXT:    blr
+entry:
+  %sa.coerce.fca.0.extract = extractvalue [4 x i128] %sa.coerce, 0
+  %sa.sroa.0.0.extract.trunc = trunc i128 %sa.coerce.fca.0.extract to i32
+  %sa.coerce.fca.1.extract = extractvalue [4 x i128] %sa.coerce, 1
+  %sa.coerce.fca.3.extract = extractvalue [4 x i128] %sa.coerce, 3
+  %sa.sroa.6.48.extract.shift = lshr i128 %sa.coerce.fca.3.extract, 64
+  %sa.sroa.6.48.extract.trunc = trunc i128 %sa.sroa.6.48.extract.shift to i64
+  %conv = sitofp i32 %sa.sroa.0.0.extract.trunc to fp128
+  %0 = bitcast i128 %sa.coerce.fca.1.extract to fp128
+  %add = fadd fp128 %0, %conv
+  %conv2 = sitofp i64 %sa.sroa.6.48.extract.trunc to fp128
+  %add3 = fadd fp128 %add, %conv2
+  ret fp128 %add3
+}
+
+
+; Function Attrs: norecurse nounwind readonly
+define fp128 @testNestedAggregate(%struct.MixedC* byval nocapture readonly align 16 %a) {
+; CHECK-LABEL: testNestedAggregate:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    std 8, 72(1)
+; CHECK-NEXT:    std 7, 64(1)
+; CHECK-NEXT:    std 10, 88(1)
+; CHECK-NEXT:    std 9, 80(1)
+; CHECK-NEXT:    lxv 34, 64(1)
+; CHECK-NEXT:    std 6, 56(1)
+; CHECK-NEXT:    std 5, 48(1)
+; CHECK-NEXT:    std 4, 40(1)
+; CHECK-NEXT:    std 3, 32(1)
+; CHECK-NEXT:    blr
+
+; CHECK-BE-LABEL: testNestedAggregate:
+; CHECK-BE:       # %bb.0: # %entry
+; CHECK-BE-NEXT:    std 8, 88(1)
+; CHECK-BE-NEXT:    std 7, 80(1)
+; CHECK-BE-NEXT:    std 10, 104(1)
+; CHECK-BE-NEXT:    std 9, 96(1)
+; CHECK-BE-NEXT:    lxv 34, 80(1)
+; CHECK-BE-NEXT:    std 6, 72(1)
+; CHECK-BE-NEXT:    std 5, 64(1)
+; CHECK-BE-NEXT:    std 4, 56(1)
+; CHECK-BE-NEXT:    std 3, 48(1)
+; CHECK-BE-NEXT:    blr
+entry:
+  %c = getelementptr inbounds %struct.MixedC, %struct.MixedC* %a, i64 0, i32 1, i32 1
+  %0 = load fp128, fp128* %c, align 16
+  ret fp128 %0
+}
+
+; Function Attrs: norecurse nounwind readnone
+define fp128 @testUnion_01([1 x i128] %a.coerce) {
+; CHECK-LABEL: testUnion_01:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    mtvsrdd 34, 4, 3
+; CHECK-NEXT:    blr
+
+; CHECK-BE-LABEL: testUnion_01:
+; CHECK-BE:       mtvsrdd 34, 4, 3
+; CHECK-BE-NEXT:  blr
+entry:
+  %a.coerce.fca.0.extract = extractvalue [1 x i128] %a.coerce, 0
+  %0 = bitcast i128 %a.coerce.fca.0.extract to fp128
+  ret fp128 %0
+}
+
+; Function Attrs: norecurse nounwind readnone
+define fp128 @testUnion_02([1 x i128] %a.coerce) {
+; CHECK-LABEL: testUnion_02:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    mtvsrdd 34, 4, 3
+; CHECK-NEXT:    blr
+
+; CHECK-BE-LABEL: testUnion_02:
+; CHECK-BE:       mtvsrdd 34, 4, 3
+; CHECK-BE-NEXT:  blr
+entry:
+  %a.coerce.fca.0.extract = extractvalue [1 x i128] %a.coerce, 0
+  %0 = bitcast i128 %a.coerce.fca.0.extract to fp128
+  ret fp128 %0
+}
+
+; Function Attrs: norecurse nounwind readnone
+define fp128 @testUnion_03([4 x i128] %a.coerce) {
+; CHECK-LABEL: testUnion_03:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    mtvsrdd 34, 8, 7
+; CHECK-NEXT:    blr
+
+; CHECK-BE-LABEL: testUnion_03:
+; CHECK-BE:       mtvsrdd 34, 8, 7
+; CHECK-BE-NEXT:  blr
+entry:
+  %a.coerce.fca.2.extract = extractvalue [4 x i128] %a.coerce, 2
+  %0 = bitcast i128 %a.coerce.fca.2.extract to fp128
+  ret fp128 %0
+}
+
+; Function Attrs: nounwind
+define fp128 @sum_float128(i32 signext %count, ...) {
+; CHECK-LABEL: sum_float128:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    addis 11, 2, .LCPI7_0 at toc@ha
+; CHECK-NEXT:    cmpwi 0, 3, 1
+; CHECK-NEXT:    std 10, 88(1)
+; CHECK-NEXT:    std 9, 80(1)
+; CHECK-NEXT:    std 8, 72(1)
+; CHECK-NEXT:    std 7, 64(1)
+; CHECK-NEXT:    std 6, 56(1)
+; CHECK-NEXT:    std 5, 48(1)
+; CHECK-NEXT:    std 4, 40(1)
+; CHECK-NEXT:    addi 11, 11, .LCPI7_0 at toc@l
+; CHECK-NEXT:    lxvx 34, 0, 11
+; CHECK-NEXT:    bltlr 0
+; CHECK-NEXT:  # %bb.1: # %if.end
+; CHECK-NEXT:    addi 3, 1, 40
+; CHECK-NEXT:    lxvx 35, 0, 3
+; CHECK-NEXT:    xsaddqp 2, 3, 2
+; CHECK-NEXT:    lxv 35, 16(3)
+; CHECK-NEXT:    addi 3, 1, 72
+; CHECK-NEXT:    std 3, -8(1)
+; CHECK-NEXT:    xsaddqp 2, 2, 3
+; CHECK-NEXT:    blr
+entry:
+  %ap = alloca i8*, align 8
+  %0 = bitcast i8** %ap to i8*
+  call void @llvm.lifetime.start.p0i8(i64 8, i8* nonnull %0) #2
+  %cmp = icmp slt i32 %count, 1
+  br i1 %cmp, label %cleanup, label %if.end
+
+if.end:                                           ; preds = %entry
+  call void @llvm.va_start(i8* nonnull %0)
+  %argp.cur = load i8*, i8** %ap, align 8
+  %argp.next = getelementptr inbounds i8, i8* %argp.cur, i64 16
+  %1 = bitcast i8* %argp.cur to fp128*
+  %2 = load fp128, fp128* %1, align 8
+  %add = fadd fp128 %2, 0xL00000000000000000000000000000000
+  %argp.next3 = getelementptr inbounds i8, i8* %argp.cur, i64 32
+  store i8* %argp.next3, i8** %ap, align 8
+  %3 = bitcast i8* %argp.next to fp128*
+  %4 = load fp128, fp128* %3, align 8
+  %add4 = fadd fp128 %add, %4
+  call void @llvm.va_end(i8* nonnull %0)
+  br label %cleanup
+
+cleanup:                                          ; preds = %entry, %if.end
+  %retval.0 = phi fp128 [ %add4, %if.end ], [ 0xL00000000000000000000000000000000, %entry ]
+  call void @llvm.lifetime.end.p0i8(i64 8, i8* nonnull %0) #2
+  ret fp128 %retval.0
+}
+
+declare void @llvm.lifetime.start.p0i8(i64, i8* nocapture) #1
+declare void @llvm.va_start(i8*) #2
+declare void @llvm.va_end(i8*) #2
+declare void @llvm.lifetime.end.p0i8(i64, i8* nocapture) #1




More information about the llvm-commits mailing list