[llvm-branch-commits] [llvm] Hexagon: Add sincos intrinsic test (PR #147474)
via llvm-branch-commits
llvm-branch-commits at lists.llvm.org
Tue Jul 8 01:01:04 PDT 2025
llvmbot wrote:
<!--LLVM PR SUMMARY COMMENT-->
@llvm/pr-subscribers-backend-hexagon
Author: Matt Arsenault (arsenm)
<details>
<summary>Changes</summary>
---
Patch is 44.74 KiB, truncated to 20.00 KiB below, full version: https://github.com/llvm/llvm-project/pull/147474.diff
1 File Affected:
- (added) llvm/test/CodeGen/Hexagon/llvm.sincos.ll (+1487)
``````````diff
diff --git a/llvm/test/CodeGen/Hexagon/llvm.sincos.ll b/llvm/test/CodeGen/Hexagon/llvm.sincos.ll
new file mode 100644
index 0000000000000..f02ac2ca8480f
--- /dev/null
+++ b/llvm/test/CodeGen/Hexagon/llvm.sincos.ll
@@ -0,0 +1,1487 @@
+; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 5
+; RUN: llc -mtriple=hexagon < %s | FileCheck -check-prefix=BASE %s
+; RUN: llc -mtriple=hexagon-unknown-linux-gnu < %s | FileCheck -check-prefix=GNU %s
+; RUN: llc -mtriple=hexagon-unknown-linux-musl < %s | FileCheck -check-prefix=MUSL %s
+
+; Scalar half sincos with both results returned. Per the assertions below, the
+; BASE and MUSL runs extend the input with __extendhfsf2, call sinf and cosf
+; separately, and truncate each result with __truncsfhf2; the GNU run makes a
+; single sincosf call that writes both results to stack slots (r29+#0 and
+; r29+#4) before truncating them.
+define { half, half } @test_sincos_f16(half %a) #0 {
+; BASE-LABEL: test_sincos_f16:
+; BASE: // %bb.0:
+; BASE-NEXT: {
+; BASE-NEXT: call __extendhfsf2
+; BASE-NEXT: memd(r29+#-16) = r17:16
+; BASE-NEXT: allocframe(#8)
+; BASE-NEXT: } // 8-byte Folded Spill
+; BASE-NEXT: {
+; BASE-NEXT: call sinf
+; BASE-NEXT: r16 = r0
+; BASE-NEXT: }
+; BASE-NEXT: {
+; BASE-NEXT: call __truncsfhf2
+; BASE-NEXT: }
+; BASE-NEXT: {
+; BASE-NEXT: call cosf
+; BASE-NEXT: r17 = r0
+; BASE-NEXT: r0 = r16
+; BASE-NEXT: }
+; BASE-NEXT: {
+; BASE-NEXT: call __truncsfhf2
+; BASE-NEXT: }
+; BASE-NEXT: {
+; BASE-NEXT: r1:0 = combine(r0,r17)
+; BASE-NEXT: r17:16 = memd(r29+#0)
+; BASE-NEXT: dealloc_return
+; BASE-NEXT: } // 8-byte Folded Reload
+;
+; GNU-LABEL: test_sincos_f16:
+; GNU: // %bb.0:
+; GNU-NEXT: {
+; GNU-NEXT: call __extendhfsf2
+; GNU-NEXT: memd(r29+#-16) = r17:16
+; GNU-NEXT: allocframe(#16)
+; GNU-NEXT: } // 8-byte Folded Spill
+; GNU-NEXT: {
+; GNU-NEXT: call sincosf
+; GNU-NEXT: r1 = add(r29,#0)
+; GNU-NEXT: r2 = add(r29,#4)
+; GNU-NEXT: }
+; GNU-NEXT: {
+; GNU-NEXT: call __truncsfhf2
+; GNU-NEXT: r0 = memw(r29+#0)
+; GNU-NEXT: }
+; GNU-NEXT: {
+; GNU-NEXT: call __truncsfhf2
+; GNU-NEXT: r16 = r0
+; GNU-NEXT: r0 = memw(r29+#4)
+; GNU-NEXT: }
+; GNU-NEXT: {
+; GNU-NEXT: r1:0 = combine(r0,r16)
+; GNU-NEXT: r17:16 = memd(r29+#8)
+; GNU-NEXT: dealloc_return
+; GNU-NEXT: } // 8-byte Folded Reload
+;
+; MUSL-LABEL: test_sincos_f16:
+; MUSL: // %bb.0:
+; MUSL-NEXT: {
+; MUSL-NEXT: call __extendhfsf2
+; MUSL-NEXT: memd(r29+#-16) = r17:16
+; MUSL-NEXT: allocframe(#8)
+; MUSL-NEXT: } // 8-byte Folded Spill
+; MUSL-NEXT: {
+; MUSL-NEXT: call sinf
+; MUSL-NEXT: r16 = r0
+; MUSL-NEXT: }
+; MUSL-NEXT: {
+; MUSL-NEXT: call __truncsfhf2
+; MUSL-NEXT: }
+; MUSL-NEXT: {
+; MUSL-NEXT: call cosf
+; MUSL-NEXT: r17 = r0
+; MUSL-NEXT: r0 = r16
+; MUSL-NEXT: }
+; MUSL-NEXT: {
+; MUSL-NEXT: call __truncsfhf2
+; MUSL-NEXT: }
+; MUSL-NEXT: {
+; MUSL-NEXT: r1:0 = combine(r0,r17)
+; MUSL-NEXT: r17:16 = memd(r29+#0)
+; MUSL-NEXT: dealloc_return
+; MUSL-NEXT: } // 8-byte Folded Reload
+ %result = call { half, half } @llvm.sincos.f16(half %a)
+ ret { half, half } %result
+}
+
+; Half sincos where only element 0 (the sin result) is extracted and returned.
+; The BASE and MUSL assertions expect just a sinf call between the half/float
+; conversions; the GNU assertions still expect a sincosf call and then load
+; the value to truncate from r29+#0.
+define half @test_sincos_f16_only_use_sin(half %a) #0 {
+; BASE-LABEL: test_sincos_f16_only_use_sin:
+; BASE: // %bb.0:
+; BASE-NEXT: {
+; BASE-NEXT: call __extendhfsf2
+; BASE-NEXT: allocframe(r29,#0):raw
+; BASE-NEXT: }
+; BASE-NEXT: {
+; BASE-NEXT: call sinf
+; BASE-NEXT: }
+; BASE-NEXT: {
+; BASE-NEXT: call __truncsfhf2
+; BASE-NEXT: }
+; BASE-NEXT: {
+; BASE-NEXT: r31:30 = dealloc_return(r30):raw
+; BASE-NEXT: }
+;
+; GNU-LABEL: test_sincos_f16_only_use_sin:
+; GNU: // %bb.0:
+; GNU-NEXT: {
+; GNU-NEXT: call __extendhfsf2
+; GNU-NEXT: allocframe(r29,#8):raw
+; GNU-NEXT: }
+; GNU-NEXT: {
+; GNU-NEXT: call sincosf
+; GNU-NEXT: r1 = add(r29,#0)
+; GNU-NEXT: r2 = add(r29,#4)
+; GNU-NEXT: }
+; GNU-NEXT: {
+; GNU-NEXT: call __truncsfhf2
+; GNU-NEXT: r0 = memw(r29+#0)
+; GNU-NEXT: }
+; GNU-NEXT: {
+; GNU-NEXT: r31:30 = dealloc_return(r30):raw
+; GNU-NEXT: }
+;
+; MUSL-LABEL: test_sincos_f16_only_use_sin:
+; MUSL: // %bb.0:
+; MUSL-NEXT: {
+; MUSL-NEXT: call __extendhfsf2
+; MUSL-NEXT: allocframe(r29,#0):raw
+; MUSL-NEXT: }
+; MUSL-NEXT: {
+; MUSL-NEXT: call sinf
+; MUSL-NEXT: }
+; MUSL-NEXT: {
+; MUSL-NEXT: call __truncsfhf2
+; MUSL-NEXT: }
+; MUSL-NEXT: {
+; MUSL-NEXT: r31:30 = dealloc_return(r30):raw
+; MUSL-NEXT: }
+ %result = call { half, half } @llvm.sincos.f16(half %a)
+ %result.0 = extractvalue { half, half } %result, 0
+ ret half %result.0
+}
+
+; Half sincos where only element 1 (the cos result) is extracted and returned.
+; The BASE and MUSL assertions expect just a cosf call between the half/float
+; conversions; the GNU assertions still expect a sincosf call and then load
+; the value to truncate from r29+#4.
+define half @test_sincos_f16_only_use_cos(half %a) #0 {
+; BASE-LABEL: test_sincos_f16_only_use_cos:
+; BASE: // %bb.0:
+; BASE-NEXT: {
+; BASE-NEXT: call __extendhfsf2
+; BASE-NEXT: allocframe(r29,#0):raw
+; BASE-NEXT: }
+; BASE-NEXT: {
+; BASE-NEXT: call cosf
+; BASE-NEXT: }
+; BASE-NEXT: {
+; BASE-NEXT: call __truncsfhf2
+; BASE-NEXT: }
+; BASE-NEXT: {
+; BASE-NEXT: r31:30 = dealloc_return(r30):raw
+; BASE-NEXT: }
+;
+; GNU-LABEL: test_sincos_f16_only_use_cos:
+; GNU: // %bb.0:
+; GNU-NEXT: {
+; GNU-NEXT: call __extendhfsf2
+; GNU-NEXT: allocframe(r29,#8):raw
+; GNU-NEXT: }
+; GNU-NEXT: {
+; GNU-NEXT: call sincosf
+; GNU-NEXT: r1 = add(r29,#0)
+; GNU-NEXT: r2 = add(r29,#4)
+; GNU-NEXT: }
+; GNU-NEXT: {
+; GNU-NEXT: call __truncsfhf2
+; GNU-NEXT: r0 = memw(r29+#4)
+; GNU-NEXT: }
+; GNU-NEXT: {
+; GNU-NEXT: r31:30 = dealloc_return(r30):raw
+; GNU-NEXT: }
+;
+; MUSL-LABEL: test_sincos_f16_only_use_cos:
+; MUSL: // %bb.0:
+; MUSL-NEXT: {
+; MUSL-NEXT: call __extendhfsf2
+; MUSL-NEXT: allocframe(r29,#0):raw
+; MUSL-NEXT: }
+; MUSL-NEXT: {
+; MUSL-NEXT: call cosf
+; MUSL-NEXT: }
+; MUSL-NEXT: {
+; MUSL-NEXT: call __truncsfhf2
+; MUSL-NEXT: }
+; MUSL-NEXT: {
+; MUSL-NEXT: r31:30 = dealloc_return(r30):raw
+; MUSL-NEXT: }
+ %result = call { half, half } @llvm.sincos.f16(half %a)
+ %result.1 = extractvalue { half, half } %result, 1
+ ret half %result.1
+}
+
+; <2 x half> sincos with both result vectors returned. The BASE and MUSL
+; assertions expect each element to go through __extendhfsf2, separate sinf
+; and cosf calls, and __truncsfhf2; the GNU assertions expect one sincosf call
+; per element with results read back from stack slots. In all three runs the
+; four half results are stored with memh through r16, which is copied from the
+; incoming r0 (presumably the sret pointer; confirm against the Hexagon ABI).
+define { <2 x half>, <2 x half> } @test_sincos_v2f16(<2 x half> %a) #0 {
+; BASE-LABEL: test_sincos_v2f16:
+; BASE: // %bb.0:
+; BASE-NEXT: {
+; BASE-NEXT: r17:16 = combine(r3,r0)
+; BASE-NEXT: r0 = r2
+; BASE-NEXT: memd(r29+#-16) = r17:16
+; BASE-NEXT: allocframe(#24)
+; BASE-NEXT: } // 8-byte Folded Spill
+; BASE-NEXT: {
+; BASE-NEXT: call __extendhfsf2
+; BASE-NEXT: memd(r29+#8) = r19:18
+; BASE-NEXT: memd(r29+#0) = r21:20
+; BASE-NEXT: } // 8-byte Folded Spill
+; BASE-NEXT: {
+; BASE-NEXT: call sinf
+; BASE-NEXT: r18 = r0
+; BASE-NEXT: }
+; BASE-NEXT: {
+; BASE-NEXT: call __truncsfhf2
+; BASE-NEXT: }
+; BASE-NEXT: {
+; BASE-NEXT: call __extendhfsf2
+; BASE-NEXT: r19 = r0
+; BASE-NEXT: r0 = r17
+; BASE-NEXT: }
+; BASE-NEXT: {
+; BASE-NEXT: call sinf
+; BASE-NEXT: r17 = r0
+; BASE-NEXT: }
+; BASE-NEXT: {
+; BASE-NEXT: call __truncsfhf2
+; BASE-NEXT: }
+; BASE-NEXT: {
+; BASE-NEXT: call cosf
+; BASE-NEXT: r20 = r0
+; BASE-NEXT: r0 = r18
+; BASE-NEXT: }
+; BASE-NEXT: {
+; BASE-NEXT: call __truncsfhf2
+; BASE-NEXT: }
+; BASE-NEXT: {
+; BASE-NEXT: call cosf
+; BASE-NEXT: r18 = r0
+; BASE-NEXT: r0 = r17
+; BASE-NEXT: }
+; BASE-NEXT: {
+; BASE-NEXT: call __truncsfhf2
+; BASE-NEXT: }
+; BASE-NEXT: {
+; BASE-NEXT: memh(r16+#6) = r0
+; BASE-NEXT: memh(r16+#4) = r18
+; BASE-NEXT: }
+; BASE-NEXT: {
+; BASE-NEXT: memh(r16+#2) = r20
+; BASE-NEXT: memh(r16+#0) = r19
+; BASE-NEXT: }
+; BASE-NEXT: {
+; BASE-NEXT: r17:16 = memd(r29+#16)
+; BASE-NEXT: r19:18 = memd(r29+#8)
+; BASE-NEXT: } // 8-byte Folded Reload
+; BASE-NEXT: {
+; BASE-NEXT: r21:20 = memd(r29+#0)
+; BASE-NEXT: dealloc_return
+; BASE-NEXT: } // 8-byte Folded Reload
+;
+; GNU-LABEL: test_sincos_v2f16:
+; GNU: // %bb.0:
+; GNU-NEXT: {
+; GNU-NEXT: r17:16 = combine(r3,r0)
+; GNU-NEXT: r0 = r2
+; GNU-NEXT: memd(r29+#-16) = r17:16
+; GNU-NEXT: allocframe(#32)
+; GNU-NEXT: } // 8-byte Folded Spill
+; GNU-NEXT: {
+; GNU-NEXT: call __extendhfsf2
+; GNU-NEXT: memd(r29+#16) = r19:18
+; GNU-NEXT: } // 8-byte Folded Spill
+; GNU-NEXT: {
+; GNU-NEXT: call sincosf
+; GNU-NEXT: r1 = add(r29,#8)
+; GNU-NEXT: r2 = add(r29,#12)
+; GNU-NEXT: }
+; GNU-NEXT: {
+; GNU-NEXT: call __extendhfsf2
+; GNU-NEXT: r0 = r17
+; GNU-NEXT: }
+; GNU-NEXT: {
+; GNU-NEXT: call sincosf
+; GNU-NEXT: r1 = add(r29,#0)
+; GNU-NEXT: r2 = add(r29,#4)
+; GNU-NEXT: }
+; GNU-NEXT: {
+; GNU-NEXT: call __truncsfhf2
+; GNU-NEXT: r0 = memw(r29+#8)
+; GNU-NEXT: }
+; GNU-NEXT: {
+; GNU-NEXT: call __truncsfhf2
+; GNU-NEXT: r17 = r0
+; GNU-NEXT: r0 = memw(r29+#0)
+; GNU-NEXT: }
+; GNU-NEXT: {
+; GNU-NEXT: call __truncsfhf2
+; GNU-NEXT: r18 = r0
+; GNU-NEXT: r0 = memw(r29+#12)
+; GNU-NEXT: }
+; GNU-NEXT: {
+; GNU-NEXT: call __truncsfhf2
+; GNU-NEXT: r19 = r0
+; GNU-NEXT: r0 = memw(r29+#4)
+; GNU-NEXT: }
+; GNU-NEXT: {
+; GNU-NEXT: memh(r16+#6) = r0
+; GNU-NEXT: memh(r16+#4) = r19
+; GNU-NEXT: }
+; GNU-NEXT: {
+; GNU-NEXT: memh(r16+#2) = r18
+; GNU-NEXT: memh(r16+#0) = r17
+; GNU-NEXT: }
+; GNU-NEXT: {
+; GNU-NEXT: r17:16 = memd(r29+#24)
+; GNU-NEXT: r19:18 = memd(r29+#16)
+; GNU-NEXT: } // 8-byte Folded Reload
+; GNU-NEXT: {
+; GNU-NEXT: r31:30 = dealloc_return(r30):raw
+; GNU-NEXT: }
+;
+; MUSL-LABEL: test_sincos_v2f16:
+; MUSL: // %bb.0:
+; MUSL-NEXT: {
+; MUSL-NEXT: r17:16 = combine(r3,r0)
+; MUSL-NEXT: r0 = r2
+; MUSL-NEXT: memd(r29+#-16) = r17:16
+; MUSL-NEXT: allocframe(#24)
+; MUSL-NEXT: } // 8-byte Folded Spill
+; MUSL-NEXT: {
+; MUSL-NEXT: call __extendhfsf2
+; MUSL-NEXT: memd(r29+#8) = r19:18
+; MUSL-NEXT: memd(r29+#0) = r21:20
+; MUSL-NEXT: } // 8-byte Folded Spill
+; MUSL-NEXT: {
+; MUSL-NEXT: call sinf
+; MUSL-NEXT: r18 = r0
+; MUSL-NEXT: }
+; MUSL-NEXT: {
+; MUSL-NEXT: call __truncsfhf2
+; MUSL-NEXT: }
+; MUSL-NEXT: {
+; MUSL-NEXT: call __extendhfsf2
+; MUSL-NEXT: r19 = r0
+; MUSL-NEXT: r0 = r17
+; MUSL-NEXT: }
+; MUSL-NEXT: {
+; MUSL-NEXT: call sinf
+; MUSL-NEXT: r17 = r0
+; MUSL-NEXT: }
+; MUSL-NEXT: {
+; MUSL-NEXT: call __truncsfhf2
+; MUSL-NEXT: }
+; MUSL-NEXT: {
+; MUSL-NEXT: call cosf
+; MUSL-NEXT: r20 = r0
+; MUSL-NEXT: r0 = r18
+; MUSL-NEXT: }
+; MUSL-NEXT: {
+; MUSL-NEXT: call __truncsfhf2
+; MUSL-NEXT: }
+; MUSL-NEXT: {
+; MUSL-NEXT: call cosf
+; MUSL-NEXT: r18 = r0
+; MUSL-NEXT: r0 = r17
+; MUSL-NEXT: }
+; MUSL-NEXT: {
+; MUSL-NEXT: call __truncsfhf2
+; MUSL-NEXT: }
+; MUSL-NEXT: {
+; MUSL-NEXT: memh(r16+#6) = r0
+; MUSL-NEXT: memh(r16+#4) = r18
+; MUSL-NEXT: }
+; MUSL-NEXT: {
+; MUSL-NEXT: memh(r16+#2) = r20
+; MUSL-NEXT: memh(r16+#0) = r19
+; MUSL-NEXT: }
+; MUSL-NEXT: {
+; MUSL-NEXT: r17:16 = memd(r29+#16)
+; MUSL-NEXT: r19:18 = memd(r29+#8)
+; MUSL-NEXT: } // 8-byte Folded Reload
+; MUSL-NEXT: {
+; MUSL-NEXT: r21:20 = memd(r29+#0)
+; MUSL-NEXT: dealloc_return
+; MUSL-NEXT: } // 8-byte Folded Reload
+ %result = call { <2 x half>, <2 x half> } @llvm.sincos.v2f16(<2 x half> %a)
+ ret { <2 x half>, <2 x half> } %result
+}
+
+; Scalar float sincos with both results returned. The BASE and MUSL assertions
+; expect separate sinf and cosf calls whose results are combined into r1:0;
+; the GNU assertions expect a single sincosf call with output pointers at
+; r29+#0 and r29+#4, followed by loads of both results into r0 and r1.
+define { float, float } @test_sincos_f32(float %a) #0 {
+; BASE-LABEL: test_sincos_f32:
+; BASE: // %bb.0:
+; BASE-NEXT: {
+; BASE-NEXT: call sinf
+; BASE-NEXT: r16 = r0
+; BASE-NEXT: memd(r29+#-16) = r17:16
+; BASE-NEXT: allocframe(#8)
+; BASE-NEXT: } // 8-byte Folded Spill
+; BASE-NEXT: {
+; BASE-NEXT: call cosf
+; BASE-NEXT: r17 = r0
+; BASE-NEXT: r0 = r16
+; BASE-NEXT: }
+; BASE-NEXT: {
+; BASE-NEXT: r1:0 = combine(r0,r17)
+; BASE-NEXT: r17:16 = memd(r29+#0)
+; BASE-NEXT: dealloc_return
+; BASE-NEXT: } // 8-byte Folded Reload
+;
+; GNU-LABEL: test_sincos_f32:
+; GNU: // %bb.0:
+; GNU-NEXT: {
+; GNU-NEXT: allocframe(r29,#8):raw
+; GNU-NEXT: }
+; GNU-NEXT: {
+; GNU-NEXT: call sincosf
+; GNU-NEXT: r1 = add(r29,#0)
+; GNU-NEXT: r2 = add(r29,#4)
+; GNU-NEXT: }
+; GNU-NEXT: {
+; GNU-NEXT: r0 = memw(r29+#0)
+; GNU-NEXT: r1 = memw(r29+#4)
+; GNU-NEXT: }
+; GNU-NEXT: {
+; GNU-NEXT: r31:30 = dealloc_return(r30):raw
+; GNU-NEXT: }
+;
+; MUSL-LABEL: test_sincos_f32:
+; MUSL: // %bb.0:
+; MUSL-NEXT: {
+; MUSL-NEXT: call sinf
+; MUSL-NEXT: r16 = r0
+; MUSL-NEXT: memd(r29+#-16) = r17:16
+; MUSL-NEXT: allocframe(#8)
+; MUSL-NEXT: } // 8-byte Folded Spill
+; MUSL-NEXT: {
+; MUSL-NEXT: call cosf
+; MUSL-NEXT: r17 = r0
+; MUSL-NEXT: r0 = r16
+; MUSL-NEXT: }
+; MUSL-NEXT: {
+; MUSL-NEXT: r1:0 = combine(r0,r17)
+; MUSL-NEXT: r17:16 = memd(r29+#0)
+; MUSL-NEXT: dealloc_return
+; MUSL-NEXT: } // 8-byte Folded Reload
+ %result = call { float, float } @llvm.sincos.f32(float %a)
+ ret { float, float } %result
+}
+
+; <2 x float> sincos with both result vectors returned. The BASE and MUSL
+; assertions expect two sinf and two cosf calls, with the results stored via
+; memd through r17 (copied from the incoming r0). The GNU assertions expect two
+; sincosf calls whose output pointers are computed directly from the incoming
+; r0 (offsets #4/#12, then #0/#8); the only stack slot used is the r17:16
+; spill.
+define { <2 x float>, <2 x float> } @test_sincos_v2f32(<2 x float> %a) #0 {
+; BASE-LABEL: test_sincos_v2f32:
+; BASE: // %bb.0:
+; BASE-NEXT: {
+; BASE-NEXT: r17:16 = combine(r0,r2)
+; BASE-NEXT: r0 = r2
+; BASE-NEXT: memd(r29+#-16) = r17:16
+; BASE-NEXT: allocframe(#24)
+; BASE-NEXT: } // 8-byte Folded Spill
+; BASE-NEXT: {
+; BASE-NEXT: call sinf
+; BASE-NEXT: r18 = r3
+; BASE-NEXT: memd(r29+#8) = r19:18
+; BASE-NEXT: memd(r29+#0) = r21:20
+; BASE-NEXT: } // 8-byte Folded Spill
+; BASE-NEXT: {
+; BASE-NEXT: call sinf
+; BASE-NEXT: r19 = r0
+; BASE-NEXT: r0 = r18
+; BASE-NEXT: }
+; BASE-NEXT: {
+; BASE-NEXT: call cosf
+; BASE-NEXT: r20 = r0
+; BASE-NEXT: r0 = r16
+; BASE-NEXT: }
+; BASE-NEXT: {
+; BASE-NEXT: call cosf
+; BASE-NEXT: r16 = r0
+; BASE-NEXT: r0 = r18
+; BASE-NEXT: }
+; BASE-NEXT: {
+; BASE-NEXT: r1:0 = combine(r0,r16)
+; BASE-NEXT: r3:2 = combine(r20,r19)
+; BASE-NEXT: }
+; BASE-NEXT: {
+; BASE-NEXT: memd(r17+#8) = r1:0
+; BASE-NEXT: memd(r17+#0) = r3:2
+; BASE-NEXT: }
+; BASE-NEXT: {
+; BASE-NEXT: r17:16 = memd(r29+#16)
+; BASE-NEXT: r19:18 = memd(r29+#8)
+; BASE-NEXT: } // 8-byte Folded Reload
+; BASE-NEXT: {
+; BASE-NEXT: r21:20 = memd(r29+#0)
+; BASE-NEXT: dealloc_return
+; BASE-NEXT: } // 8-byte Folded Reload
+;
+; GNU-LABEL: test_sincos_v2f32:
+; GNU: // %bb.0:
+; GNU-NEXT: {
+; GNU-NEXT: r17:16 = combine(r0,r2)
+; GNU-NEXT: r1 = add(r0,#4)
+; GNU-NEXT: memd(r29+#-16) = r17:16
+; GNU-NEXT: allocframe(#8)
+; GNU-NEXT: } // 8-byte Folded Spill
+; GNU-NEXT: {
+; GNU-NEXT: call sincosf
+; GNU-NEXT: r2 = add(r0,#12)
+; GNU-NEXT: r0 = r3
+; GNU-NEXT: }
+; GNU-NEXT: {
+; GNU-NEXT: call sincosf
+; GNU-NEXT: r2 = add(r17,#8)
+; GNU-NEXT: r1:0 = combine(r17,r16)
+; GNU-NEXT: }
+; GNU-NEXT: {
+; GNU-NEXT: r17:16 = memd(r29+#0)
+; GNU-NEXT: dealloc_return
+; GNU-NEXT: } // 8-byte Folded Reload
+;
+; MUSL-LABEL: test_sincos_v2f32:
+; MUSL: // %bb.0:
+; MUSL-NEXT: {
+; MUSL-NEXT: r17:16 = combine(r0,r2)
+; MUSL-NEXT: r0 = r2
+; MUSL-NEXT: memd(r29+#-16) = r17:16
+; MUSL-NEXT: allocframe(#24)
+; MUSL-NEXT: } // 8-byte Folded Spill
+; MUSL-NEXT: {
+; MUSL-NEXT: call sinf
+; MUSL-NEXT: r18 = r3
+; MUSL-NEXT: memd(r29+#8) = r19:18
+; MUSL-NEXT: memd(r29+#0) = r21:20
+; MUSL-NEXT: } // 8-byte Folded Spill
+; MUSL-NEXT: {
+; MUSL-NEXT: call sinf
+; MUSL-NEXT: r19 = r0
+; MUSL-NEXT: r0 = r18
+; MUSL-NEXT: }
+; MUSL-NEXT: {
+; MUSL-NEXT: call cosf
+; MUSL-NEXT: r20 = r0
+; MUSL-NEXT: r0 = r16
+; MUSL-NEXT: }
+; MUSL-NEXT: {
+; MUSL-NEXT: call cosf
+; MUSL-NEXT: r16 = r0
+; MUSL-NEXT: r0 = r18
+; MUSL-NEXT: }
+; MUSL-NEXT: {
+; MUSL-NEXT: r1:0 = combine(r0,r16)
+; MUSL-NEXT: r3:2 = combine(r20,r19)
+; MUSL-NEXT: }
+; MUSL-NEXT: {
+; MUSL-NEXT: memd(r17+#8) = r1:0
+; MUSL-NEXT: memd(r17+#0) = r3:2
+; MUSL-NEXT: }
+; MUSL-NEXT: {
+; MUSL-NEXT: r17:16 = memd(r29+#16)
+; MUSL-NEXT: r19:18 = memd(r29+#8)
+; MUSL-NEXT: } // 8-byte Folded Reload
+; MUSL-NEXT: {
+; MUSL-NEXT: r21:20 = memd(r29+#0)
+; MUSL-NEXT: dealloc_return
+; MUSL-NEXT: } // 8-byte Folded Reload
+ %result = call { <2 x float>, <2 x float> } @llvm.sincos.v2f32(<2 x float> %a)
+ ret { <2 x float>, <2 x float> } %result
+}
+
+define { <3 x float>, <3 x float> } @test_sincos_v3f32(<3 x float> %a) #0 {
+; CHECKR2-LABEL: test_sincos_v3f32:
+; CHECKR2: # %bb.0:
+; CHECKR2-NEXT: daddiu $sp, $sp, -48
+; CHECKR2-NEXT: sdc1 $f25, 40($sp) # 8-byte Folded Spill
+; CHECKR2-NEXT: sdc1 $f24, 32($sp) # 8-byte Folded Spill
+; CHECKR2-NEXT: sd $ra, 24($sp) # 8-byte Folded Spill
+; CHECKR2-NEXT: sd $16, 16($sp) # 8-byte Folded Spill
+; CHECKR2-NEXT: mov.s $f24, $f15
+; CHECKR2-NEXT: mov.s $f25, $f14
+; CHECKR2-NEXT: mov.s $f12, $f13
+; CHECKR2-NEXT: move $16, $4
+; CHECKR2-NEXT: daddiu $5, $sp, 4
+; CHECKR2-NEXT: jal sincosf
+; CHECKR2-NEXT: daddiu $6, $sp, 0
+; CHECKR2-NEXT: daddiu $5, $sp, 12
+; CHECKR2-NEXT: daddiu $6, $sp, 8
+; CHECKR2-NEXT: jal sincosf
+; CHECKR2-NEXT: mov.s $f12, $f25
+; CHECKR2-NEXT: daddiu $5, $16, 8
+; CHECKR2-NEXT: daddiu $6, $16, 24
+; CHECKR2-NEXT: jal sincosf
+; CHECKR2-NEXT: mov.s $f12, $f24
+; CHECKR2-NEXT: lwc1 $f0, 0($sp)
+; CHECKR2-NEXT: mfc1 $1, $f0
+; CHECKR2-NEXT: dsll $1, $1, 32
+; CHECKR2-NEXT: lwc1 $f0, 8($sp)
+; CHECKR2-NEXT: mfc1 $2, $f0
+; CHECKR2-NEXT: dext $2, $2, 0, 32
+; CHECKR2-NEXT: or $1, $2, $1
+; CHECKR2-NEXT: lwc1 $f0, 4($sp)
+; CHECKR2-NEXT: mfc1 $2, $f0
+; CHECKR2-NEXT: sd $1, 16($16)
+; CHECKR2-NEXT: dsll $1, $2, 32
+; CHECKR2-NEXT: lwc1 $f0, 12($sp)
+; CHECKR2-NEXT: mfc1 $2, $f0
+; CHECKR2-NEXT: dext $2, $2, 0, 32
+; CHECKR2-NEXT: or $1, $2, $1
+; CHECKR2-NEXT: sd $1, 0($16)
+; CHECKR2-NEXT: ld $16, 16($sp) # 8-byte Folded Reload
+; CHECKR2-NEXT: ld $ra, 24($sp) # 8-byte Folded Reload
+; CHECKR2-NEXT: ldc1 $f24, 32($sp) # 8-byte Folded Reload
+; CHECKR2-NEXT: ldc1 $f25, 40($sp) # 8-byte Folded Reload
+; CHECKR2-NEXT: jr $ra
+; CHECKR2-NEXT: daddiu $sp, $sp, 48
+; BASE-LABEL: test_sincos_v3f32:
+; BASE: // %bb.0:
+; BASE-NEXT: {
+; BASE-NEXT: memd(r29+#-16) = r17:16
+; BASE-NEXT: allocframe(#32)
+; BASE-NEXT: } // 8-byte Folded Spill
+; BASE-NEXT: {
+; BASE-NEXT: r19:18 = combine(r0,r2)
+; BASE-NEXT: r0 = r2
+; BASE-NEXT: memd(r29+#16) = r19:18
+; BASE-NEXT: memd(r29+#8) = r21:20
+; BASE-NEXT: } // 8-byte Folded Spill
+; BASE-NEXT: {
+; BASE-NEXT: call sinf
+; BAS...
[truncated]
``````````
</details>
https://github.com/llvm/llvm-project/pull/147474
More information about the llvm-branch-commits
mailing list