[llvm] 6953e75 - [NFC][AArch64] Precommit vector-fcvt tests

David Sherwood via llvm-commits llvm-commits at lists.llvm.org
Fri Jul 29 01:29:22 PDT 2022


Author: David Sherwood
Date: 2022-07-29T09:29:15+01:00
New Revision: 6953e754c7a887b22c56ce7b0526506e4aa86e7f

URL: https://github.com/llvm/llvm-project/commit/6953e754c7a887b22c56ce7b0526506e4aa86e7f
DIFF: https://github.com/llvm/llvm-project/commit/6953e754c7a887b22c56ce7b0526506e4aa86e7f.diff

LOG: [NFC][AArch64] Precommit vector-fcvt tests

Add tests which show code quality of uitofp and sitofp.

Differential Revision: https://reviews.llvm.org/D130697

Added: 
    llvm/test/CodeGen/AArch64/vector-fcvt.ll

Modified: 
    

Removed: 
    


################################################################################
diff  --git a/llvm/test/CodeGen/AArch64/vector-fcvt.ll b/llvm/test/CodeGen/AArch64/vector-fcvt.ll
new file mode 100644
index 0000000000000..4b7736eb6026d
--- /dev/null
+++ b/llvm/test/CodeGen/AArch64/vector-fcvt.ll
@@ -0,0 +1,594 @@
+; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
+; RUN: llc < %s -mtriple=aarch64-none-eabi | FileCheck %s --check-prefixes=CHECK
+
+; Note: halves are tested in fp16-v8-instructions.ll.
+
+define <4 x float> @sitofp_v4i8_float(<4 x i8> %a) {
+; CHECK-LABEL: sitofp_v4i8_float:
+; CHECK:       // %bb.0:
+; CHECK-NEXT:    shl v0.4h, v0.4h, #8
+; CHECK-NEXT:    sshr v0.4h, v0.4h, #8
+; CHECK-NEXT:    sshll v0.4s, v0.4h, #0
+; CHECK-NEXT:    scvtf v0.4s, v0.4s
+; CHECK-NEXT:    ret
+  %1 = sitofp <4 x i8> %a to <4 x float>
+  ret <4 x float> %1
+}
+
+define <8 x float> @sitofp_v8i8_float(<8 x i8> %a) {
+; CHECK-LABEL: sitofp_v8i8_float:
+; CHECK:       // %bb.0:
+; CHECK-NEXT:    zip1 v1.8b, v0.8b, v0.8b
+; CHECK-NEXT:    zip2 v0.8b, v0.8b, v0.8b
+; CHECK-NEXT:    shl v1.4h, v1.4h, #8
+; CHECK-NEXT:    shl v0.4h, v0.4h, #8
+; CHECK-NEXT:    sshr v1.4h, v1.4h, #8
+; CHECK-NEXT:    sshr v0.4h, v0.4h, #8
+; CHECK-NEXT:    sshll v1.4s, v1.4h, #0
+; CHECK-NEXT:    sshll v2.4s, v0.4h, #0
+; CHECK-NEXT:    scvtf v0.4s, v1.4s
+; CHECK-NEXT:    scvtf v1.4s, v2.4s
+; CHECK-NEXT:    ret
+  %1 = sitofp <8 x i8> %a to <8 x float>
+  ret <8 x float> %1
+}
+
+define <16 x float> @sitofp_v16i8_float(<16 x i8> %a) {
+; CHECK-LABEL: sitofp_v16i8_float:
+; CHECK:       // %bb.0:
+; CHECK-NEXT:    zip1 v1.8b, v0.8b, v0.8b
+; CHECK-NEXT:    zip2 v2.8b, v0.8b, v0.8b
+; CHECK-NEXT:    ext v0.16b, v0.16b, v0.16b, #8
+; CHECK-NEXT:    shl v1.4h, v1.4h, #8
+; CHECK-NEXT:    shl v2.4h, v2.4h, #8
+; CHECK-NEXT:    zip1 v3.8b, v0.8b, v0.8b
+; CHECK-NEXT:    zip2 v0.8b, v0.8b, v0.8b
+; CHECK-NEXT:    sshr v1.4h, v1.4h, #8
+; CHECK-NEXT:    sshr v2.4h, v2.4h, #8
+; CHECK-NEXT:    sshll v1.4s, v1.4h, #0
+; CHECK-NEXT:    shl v3.4h, v3.4h, #8
+; CHECK-NEXT:    shl v0.4h, v0.4h, #8
+; CHECK-NEXT:    sshr v3.4h, v3.4h, #8
+; CHECK-NEXT:    sshr v0.4h, v0.4h, #8
+; CHECK-NEXT:    sshll v2.4s, v2.4h, #0
+; CHECK-NEXT:    sshll v3.4s, v3.4h, #0
+; CHECK-NEXT:    sshll v4.4s, v0.4h, #0
+; CHECK-NEXT:    scvtf v0.4s, v1.4s
+; CHECK-NEXT:    scvtf v1.4s, v2.4s
+; CHECK-NEXT:    scvtf v2.4s, v3.4s
+; CHECK-NEXT:    scvtf v3.4s, v4.4s
+; CHECK-NEXT:    ret
+  %1 = sitofp <16 x i8> %a to <16 x float>
+  ret <16 x float> %1
+}
+
+define <8 x float> @sitofp_i16_float(<8 x i16> %a) {
+; CHECK-LABEL: sitofp_i16_float:
+; CHECK:       // %bb.0:
+; CHECK-NEXT:    sshll2 v1.4s, v0.8h, #0
+; CHECK-NEXT:    sshll v0.4s, v0.4h, #0
+; CHECK-NEXT:    scvtf v1.4s, v1.4s
+; CHECK-NEXT:    scvtf v0.4s, v0.4s
+; CHECK-NEXT:    ret
+  %1 = sitofp <8 x i16> %a to <8 x float>
+  ret <8 x float> %1
+}
+
+define <8 x float> @sitofp_i32_float(<8 x i32> %a) {
+; CHECK-LABEL: sitofp_i32_float:
+; CHECK:       // %bb.0:
+; CHECK-NEXT:    scvtf v0.4s, v0.4s
+; CHECK-NEXT:    scvtf v1.4s, v1.4s
+; CHECK-NEXT:    ret
+  %1 = sitofp <8 x i32> %a to <8 x float>
+  ret <8 x float> %1
+}
+
+define <8 x float> @sitofp_i64_float(<8 x i64> %a) {
+; CHECK-LABEL: sitofp_i64_float:
+; CHECK:       // %bb.0:
+; CHECK-NEXT:    scvtf v2.2d, v2.2d
+; CHECK-NEXT:    scvtf v0.2d, v0.2d
+; CHECK-NEXT:    scvtf v4.2d, v1.2d
+; CHECK-NEXT:    fcvtn v0.2s, v0.2d
+; CHECK-NEXT:    fcvtn v1.2s, v2.2d
+; CHECK-NEXT:    scvtf v2.2d, v3.2d
+; CHECK-NEXT:    fcvtn2 v0.4s, v4.2d
+; CHECK-NEXT:    fcvtn2 v1.4s, v2.2d
+; CHECK-NEXT:    ret
+  %1 = sitofp <8 x i64> %a to <8 x float>
+  ret <8 x float> %1
+}
+
+define <4 x float> @uitofp_v4i8_float(<4 x i8> %a) {
+; CHECK-LABEL: uitofp_v4i8_float:
+; CHECK:       // %bb.0:
+; CHECK-NEXT:    bic v0.4h, #255, lsl #8
+; CHECK-NEXT:    ushll v0.4s, v0.4h, #0
+; CHECK-NEXT:    ucvtf v0.4s, v0.4s
+; CHECK-NEXT:    ret
+  %1 = uitofp <4 x i8> %a to <4 x float>
+  ret <4 x float> %1
+}
+
+define <8 x float> @uitofp_v8i8_float(<8 x i8> %a) {
+; CHECK-LABEL: uitofp_v8i8_float:
+; CHECK:       // %bb.0:
+; CHECK-NEXT:    zip1 v1.8b, v0.8b, v0.8b
+; CHECK-NEXT:    zip2 v0.8b, v0.8b, v0.8b
+; CHECK-NEXT:    bic v1.4h, #255, lsl #8
+; CHECK-NEXT:    bic v0.4h, #255, lsl #8
+; CHECK-NEXT:    ushll v1.4s, v1.4h, #0
+; CHECK-NEXT:    ushll v2.4s, v0.4h, #0
+; CHECK-NEXT:    ucvtf v0.4s, v1.4s
+; CHECK-NEXT:    ucvtf v1.4s, v2.4s
+; CHECK-NEXT:    ret
+  %1 = uitofp <8 x i8> %a to <8 x float>
+  ret <8 x float> %1
+}
+
+define <16 x float> @uitofp_v16i8_float(<16 x i8> %a) {
+; CHECK-LABEL: uitofp_v16i8_float:
+; CHECK:       // %bb.0:
+; CHECK-NEXT:    zip1 v1.8b, v0.8b, v0.8b
+; CHECK-NEXT:    zip2 v2.8b, v0.8b, v0.8b
+; CHECK-NEXT:    ext v0.16b, v0.16b, v0.16b, #8
+; CHECK-NEXT:    bic v1.4h, #255, lsl #8
+; CHECK-NEXT:    bic v2.4h, #255, lsl #8
+; CHECK-NEXT:    zip1 v3.8b, v0.8b, v0.8b
+; CHECK-NEXT:    zip2 v0.8b, v0.8b, v0.8b
+; CHECK-NEXT:    ushll v1.4s, v1.4h, #0
+; CHECK-NEXT:    ushll v2.4s, v2.4h, #0
+; CHECK-NEXT:    bic v3.4h, #255, lsl #8
+; CHECK-NEXT:    bic v0.4h, #255, lsl #8
+; CHECK-NEXT:    ushll v3.4s, v3.4h, #0
+; CHECK-NEXT:    ushll v4.4s, v0.4h, #0
+; CHECK-NEXT:    ucvtf v0.4s, v1.4s
+; CHECK-NEXT:    ucvtf v1.4s, v2.4s
+; CHECK-NEXT:    ucvtf v2.4s, v3.4s
+; CHECK-NEXT:    ucvtf v3.4s, v4.4s
+; CHECK-NEXT:    ret
+  %1 = uitofp <16 x i8> %a to <16 x float>
+  ret <16 x float> %1
+}
+
+define <8 x float> @uitofp_i16_float(<8 x i16> %a) {
+; CHECK-LABEL: uitofp_i16_float:
+; CHECK:       // %bb.0:
+; CHECK-NEXT:    ushll2 v1.4s, v0.8h, #0
+; CHECK-NEXT:    ushll v0.4s, v0.4h, #0
+; CHECK-NEXT:    ucvtf v1.4s, v1.4s
+; CHECK-NEXT:    ucvtf v0.4s, v0.4s
+; CHECK-NEXT:    ret
+  %1 = uitofp <8 x i16> %a to <8 x float>
+  ret <8 x float> %1
+}
+
+define <8 x float> @uitofp_i32_float(<8 x i32> %a) {
+; CHECK-LABEL: uitofp_i32_float:
+; CHECK:       // %bb.0:
+; CHECK-NEXT:    ucvtf v0.4s, v0.4s
+; CHECK-NEXT:    ucvtf v1.4s, v1.4s
+; CHECK-NEXT:    ret
+  %1 = uitofp <8 x i32> %a to <8 x float>
+  ret <8 x float> %1
+}
+
+define <8 x float> @uitofp_i64_float(<8 x i64> %a) {
+; CHECK-LABEL: uitofp_i64_float:
+; CHECK:       // %bb.0:
+; CHECK-NEXT:    ucvtf v2.2d, v2.2d
+; CHECK-NEXT:    ucvtf v0.2d, v0.2d
+; CHECK-NEXT:    ucvtf v4.2d, v1.2d
+; CHECK-NEXT:    fcvtn v0.2s, v0.2d
+; CHECK-NEXT:    fcvtn v1.2s, v2.2d
+; CHECK-NEXT:    ucvtf v2.2d, v3.2d
+; CHECK-NEXT:    fcvtn2 v0.4s, v4.2d
+; CHECK-NEXT:    fcvtn2 v1.4s, v2.2d
+; CHECK-NEXT:    ret
+  %1 = uitofp <8 x i64> %a to <8 x float>
+  ret <8 x float> %1
+}
+
+
+define <4 x double> @sitofp_v4i8_double(<4 x i8> %a) {
+; CHECK-LABEL: sitofp_v4i8_double:
+; CHECK:       // %bb.0:
+; CHECK-NEXT:    // kill: def $d0 killed $d0 def $q0
+; CHECK-NEXT:    umov w8, v0.h[0]
+; CHECK-NEXT:    umov w9, v0.h[2]
+; CHECK-NEXT:    umov w10, v0.h[1]
+; CHECK-NEXT:    fmov s1, w8
+; CHECK-NEXT:    umov w8, v0.h[3]
+; CHECK-NEXT:    fmov s0, w9
+; CHECK-NEXT:    mov v1.s[1], w10
+; CHECK-NEXT:    mov v0.s[1], w8
+; CHECK-NEXT:    shl v1.2s, v1.2s, #24
+; CHECK-NEXT:    shl v0.2s, v0.2s, #24
+; CHECK-NEXT:    sshr v1.2s, v1.2s, #24
+; CHECK-NEXT:    sshr v0.2s, v0.2s, #24
+; CHECK-NEXT:    sshll v1.2d, v1.2s, #0
+; CHECK-NEXT:    sshll v2.2d, v0.2s, #0
+; CHECK-NEXT:    scvtf v0.2d, v1.2d
+; CHECK-NEXT:    scvtf v1.2d, v2.2d
+; CHECK-NEXT:    ret
+  %1 = sitofp <4 x i8> %a to <4 x double>
+  ret <4 x double> %1
+}
+
+define <8 x double> @sitofp_v8i8_double(<8 x i8> %a) {
+; CHECK-LABEL: sitofp_v8i8_double:
+; CHECK:       // %bb.0:
+; CHECK-NEXT:    // kill: def $d0 killed $d0 def $q0
+; CHECK-NEXT:    umov w8, v0.b[0]
+; CHECK-NEXT:    umov w9, v0.b[2]
+; CHECK-NEXT:    umov w10, v0.b[4]
+; CHECK-NEXT:    umov w11, v0.b[6]
+; CHECK-NEXT:    fmov s1, w8
+; CHECK-NEXT:    umov w8, v0.b[1]
+; CHECK-NEXT:    fmov s2, w9
+; CHECK-NEXT:    umov w9, v0.b[3]
+; CHECK-NEXT:    fmov s3, w10
+; CHECK-NEXT:    umov w10, v0.b[5]
+; CHECK-NEXT:    fmov s4, w11
+; CHECK-NEXT:    umov w11, v0.b[7]
+; CHECK-NEXT:    mov v1.s[1], w8
+; CHECK-NEXT:    mov v2.s[1], w9
+; CHECK-NEXT:    mov v3.s[1], w10
+; CHECK-NEXT:    mov v4.s[1], w11
+; CHECK-NEXT:    shl v0.2s, v1.2s, #24
+; CHECK-NEXT:    shl v1.2s, v2.2s, #24
+; CHECK-NEXT:    shl v2.2s, v3.2s, #24
+; CHECK-NEXT:    sshr v0.2s, v0.2s, #24
+; CHECK-NEXT:    shl v3.2s, v4.2s, #24
+; CHECK-NEXT:    sshr v1.2s, v1.2s, #24
+; CHECK-NEXT:    sshr v2.2s, v2.2s, #24
+; CHECK-NEXT:    sshr v3.2s, v3.2s, #24
+; CHECK-NEXT:    sshll v0.2d, v0.2s, #0
+; CHECK-NEXT:    sshll v1.2d, v1.2s, #0
+; CHECK-NEXT:    sshll v2.2d, v2.2s, #0
+; CHECK-NEXT:    sshll v3.2d, v3.2s, #0
+; CHECK-NEXT:    scvtf v0.2d, v0.2d
+; CHECK-NEXT:    scvtf v1.2d, v1.2d
+; CHECK-NEXT:    scvtf v2.2d, v2.2d
+; CHECK-NEXT:    scvtf v3.2d, v3.2d
+; CHECK-NEXT:    ret
+  %1 = sitofp <8 x i8> %a to <8 x double>
+  ret <8 x double> %1
+}
+
+define <16 x double> @sitofp_v16i8_double(<16 x i8> %a) {
+; CHECK-LABEL: sitofp_v16i8_double:
+; CHECK:       // %bb.0:
+; CHECK-NEXT:    umov w8, v0.b[0]
+; CHECK-NEXT:    umov w9, v0.b[1]
+; CHECK-NEXT:    ext v1.16b, v0.16b, v0.16b, #8
+; CHECK-NEXT:    umov w11, v0.b[2]
+; CHECK-NEXT:    fmov s2, w8
+; CHECK-NEXT:    umov w8, v1.b[0]
+; CHECK-NEXT:    umov w10, v1.b[2]
+; CHECK-NEXT:    umov w12, v1.b[1]
+; CHECK-NEXT:    fmov s6, w11
+; CHECK-NEXT:    mov v2.s[1], w9
+; CHECK-NEXT:    umov w9, v1.b[4]
+; CHECK-NEXT:    umov w11, v0.b[5]
+; CHECK-NEXT:    fmov s3, w8
+; CHECK-NEXT:    umov w8, v1.b[3]
+; CHECK-NEXT:    fmov s4, w10
+; CHECK-NEXT:    umov w10, v1.b[5]
+; CHECK-NEXT:    fmov s5, w9
+; CHECK-NEXT:    umov w9, v1.b[6]
+; CHECK-NEXT:    mov v3.s[1], w12
+; CHECK-NEXT:    umov w12, v1.b[7]
+; CHECK-NEXT:    mov v4.s[1], w8
+; CHECK-NEXT:    umov w8, v0.b[4]
+; CHECK-NEXT:    mov v5.s[1], w10
+; CHECK-NEXT:    umov w10, v0.b[6]
+; CHECK-NEXT:    fmov s1, w9
+; CHECK-NEXT:    umov w9, v0.b[3]
+; CHECK-NEXT:    shl v3.2s, v3.2s, #24
+; CHECK-NEXT:    fmov s7, w8
+; CHECK-NEXT:    umov w8, v0.b[7]
+; CHECK-NEXT:    fmov s0, w10
+; CHECK-NEXT:    shl v4.2s, v4.2s, #24
+; CHECK-NEXT:    mov v1.s[1], w12
+; CHECK-NEXT:    shl v5.2s, v5.2s, #24
+; CHECK-NEXT:    mov v6.s[1], w9
+; CHECK-NEXT:    mov v7.s[1], w11
+; CHECK-NEXT:    mov v0.s[1], w8
+; CHECK-NEXT:    shl v1.2s, v1.2s, #24
+; CHECK-NEXT:    shl v2.2s, v2.2s, #24
+; CHECK-NEXT:    shl v6.2s, v6.2s, #24
+; CHECK-NEXT:    shl v7.2s, v7.2s, #24
+; CHECK-NEXT:    sshr v3.2s, v3.2s, #24
+; CHECK-NEXT:    shl v0.2s, v0.2s, #24
+; CHECK-NEXT:    sshr v4.2s, v4.2s, #24
+; CHECK-NEXT:    sshr v5.2s, v5.2s, #24
+; CHECK-NEXT:    sshr v1.2s, v1.2s, #24
+; CHECK-NEXT:    sshr v2.2s, v2.2s, #24
+; CHECK-NEXT:    sshr v6.2s, v6.2s, #24
+; CHECK-NEXT:    sshr v7.2s, v7.2s, #24
+; CHECK-NEXT:    sshr v0.2s, v0.2s, #24
+; CHECK-NEXT:    sshll v16.2d, v3.2s, #0
+; CHECK-NEXT:    sshll v17.2d, v4.2s, #0
+; CHECK-NEXT:    sshll v18.2d, v5.2s, #0
+; CHECK-NEXT:    sshll v19.2d, v1.2s, #0
+; CHECK-NEXT:    sshll v1.2d, v2.2s, #0
+; CHECK-NEXT:    sshll v2.2d, v6.2s, #0
+; CHECK-NEXT:    sshll v3.2d, v7.2s, #0
+; CHECK-NEXT:    sshll v4.2d, v0.2s, #0
+; CHECK-NEXT:    scvtf v0.2d, v1.2d
+; CHECK-NEXT:    scvtf v1.2d, v2.2d
+; CHECK-NEXT:    scvtf v2.2d, v3.2d
+; CHECK-NEXT:    scvtf v3.2d, v4.2d
+; CHECK-NEXT:    scvtf v4.2d, v16.2d
+; CHECK-NEXT:    scvtf v5.2d, v17.2d
+; CHECK-NEXT:    scvtf v6.2d, v18.2d
+; CHECK-NEXT:    scvtf v7.2d, v19.2d
+; CHECK-NEXT:    ret
+  %1 = sitofp <16 x i8> %a to <16 x double>
+  ret <16 x double> %1
+}
+
+define <8 x double> @sitofp_i16_double(<8 x i16> %a) {
+; CHECK-LABEL: sitofp_i16_double:
+; CHECK:       // %bb.0:
+; CHECK-NEXT:    ext v1.16b, v0.16b, v0.16b, #8
+; CHECK-NEXT:    umov w8, v0.h[0]
+; CHECK-NEXT:    umov w9, v0.h[2]
+; CHECK-NEXT:    umov w11, v0.h[1]
+; CHECK-NEXT:    umov w10, v1.h[0]
+; CHECK-NEXT:    umov w12, v1.h[2]
+; CHECK-NEXT:    fmov s2, w8
+; CHECK-NEXT:    umov w8, v0.h[3]
+; CHECK-NEXT:    fmov s0, w9
+; CHECK-NEXT:    umov w9, v1.h[1]
+; CHECK-NEXT:    fmov s3, w10
+; CHECK-NEXT:    umov w10, v1.h[3]
+; CHECK-NEXT:    fmov s1, w12
+; CHECK-NEXT:    mov v0.s[1], w8
+; CHECK-NEXT:    mov v2.s[1], w11
+; CHECK-NEXT:    mov v3.s[1], w9
+; CHECK-NEXT:    mov v1.s[1], w10
+; CHECK-NEXT:    shl v0.2s, v0.2s, #16
+; CHECK-NEXT:    shl v2.2s, v2.2s, #16
+; CHECK-NEXT:    sshr v0.2s, v0.2s, #16
+; CHECK-NEXT:    shl v3.2s, v3.2s, #16
+; CHECK-NEXT:    shl v1.2s, v1.2s, #16
+; CHECK-NEXT:    sshr v2.2s, v2.2s, #16
+; CHECK-NEXT:    sshll v4.2d, v0.2s, #0
+; CHECK-NEXT:    sshr v0.2s, v3.2s, #16
+; CHECK-NEXT:    sshr v1.2s, v1.2s, #16
+; CHECK-NEXT:    sshll v2.2d, v2.2s, #0
+; CHECK-NEXT:    sshll v3.2d, v0.2s, #0
+; CHECK-NEXT:    sshll v5.2d, v1.2s, #0
+; CHECK-NEXT:    scvtf v0.2d, v2.2d
+; CHECK-NEXT:    scvtf v1.2d, v4.2d
+; CHECK-NEXT:    scvtf v2.2d, v3.2d
+; CHECK-NEXT:    scvtf v3.2d, v5.2d
+; CHECK-NEXT:    ret
+  %1 = sitofp <8 x i16> %a to <8 x double>
+  ret <8 x double> %1
+}
+
+define <8 x double> @sitofp_i32_double(<8 x i32> %a) {
+; CHECK-LABEL: sitofp_i32_double:
+; CHECK:       // %bb.0:
+; CHECK-NEXT:    sshll2 v2.2d, v0.4s, #0
+; CHECK-NEXT:    sshll2 v3.2d, v1.4s, #0
+; CHECK-NEXT:    sshll v0.2d, v0.2s, #0
+; CHECK-NEXT:    sshll v4.2d, v1.2s, #0
+; CHECK-NEXT:    scvtf v1.2d, v2.2d
+; CHECK-NEXT:    scvtf v0.2d, v0.2d
+; CHECK-NEXT:    scvtf v3.2d, v3.2d
+; CHECK-NEXT:    scvtf v2.2d, v4.2d
+; CHECK-NEXT:    ret
+  %1 = sitofp <8 x i32> %a to <8 x double>
+  ret <8 x double> %1
+}
+
+define <8 x double> @sitofp_i64_double(<8 x i64> %a) {
+; CHECK-LABEL: sitofp_i64_double:
+; CHECK:       // %bb.0:
+; CHECK-NEXT:    scvtf v0.2d, v0.2d
+; CHECK-NEXT:    scvtf v1.2d, v1.2d
+; CHECK-NEXT:    scvtf v2.2d, v2.2d
+; CHECK-NEXT:    scvtf v3.2d, v3.2d
+; CHECK-NEXT:    ret
+  %1 = sitofp <8 x i64> %a to <8 x double>
+  ret <8 x double> %1
+}
+
+define <4 x double> @uitofp_v4i8_double(<4 x i8> %a) {
+; CHECK-LABEL: uitofp_v4i8_double:
+; CHECK:       // %bb.0:
+; CHECK-NEXT:    // kill: def $d0 killed $d0 def $q0
+; CHECK-NEXT:    umov w8, v0.h[0]
+; CHECK-NEXT:    umov w9, v0.h[2]
+; CHECK-NEXT:    umov w10, v0.h[1]
+; CHECK-NEXT:    movi d1, #0x0000ff000000ff
+; CHECK-NEXT:    fmov s2, w8
+; CHECK-NEXT:    umov w8, v0.h[3]
+; CHECK-NEXT:    fmov s0, w9
+; CHECK-NEXT:    mov v2.s[1], w10
+; CHECK-NEXT:    mov v0.s[1], w8
+; CHECK-NEXT:    and v2.8b, v2.8b, v1.8b
+; CHECK-NEXT:    and v0.8b, v0.8b, v1.8b
+; CHECK-NEXT:    ushll v1.2d, v2.2s, #0
+; CHECK-NEXT:    ushll v2.2d, v0.2s, #0
+; CHECK-NEXT:    ucvtf v0.2d, v1.2d
+; CHECK-NEXT:    ucvtf v1.2d, v2.2d
+; CHECK-NEXT:    ret
+  %1 = uitofp <4 x i8> %a to <4 x double>
+  ret <4 x double> %1
+}
+
+define <8 x double> @uitofp_v8i8_double(<8 x i8> %a) {
+; CHECK-LABEL: uitofp_v8i8_double:
+; CHECK:       // %bb.0:
+; CHECK-NEXT:    // kill: def $d0 killed $d0 def $q0
+; CHECK-NEXT:    umov w8, v0.b[0]
+; CHECK-NEXT:    umov w9, v0.b[2]
+; CHECK-NEXT:    umov w10, v0.b[4]
+; CHECK-NEXT:    umov w11, v0.b[6]
+; CHECK-NEXT:    movi d1, #0x0000ff000000ff
+; CHECK-NEXT:    fmov s2, w8
+; CHECK-NEXT:    umov w8, v0.b[1]
+; CHECK-NEXT:    fmov s3, w9
+; CHECK-NEXT:    umov w9, v0.b[3]
+; CHECK-NEXT:    fmov s4, w10
+; CHECK-NEXT:    umov w10, v0.b[5]
+; CHECK-NEXT:    fmov s5, w11
+; CHECK-NEXT:    umov w11, v0.b[7]
+; CHECK-NEXT:    mov v2.s[1], w8
+; CHECK-NEXT:    mov v3.s[1], w9
+; CHECK-NEXT:    mov v4.s[1], w10
+; CHECK-NEXT:    mov v5.s[1], w11
+; CHECK-NEXT:    and v0.8b, v2.8b, v1.8b
+; CHECK-NEXT:    and v2.8b, v3.8b, v1.8b
+; CHECK-NEXT:    and v3.8b, v4.8b, v1.8b
+; CHECK-NEXT:    and v1.8b, v5.8b, v1.8b
+; CHECK-NEXT:    ushll v0.2d, v0.2s, #0
+; CHECK-NEXT:    ushll v2.2d, v2.2s, #0
+; CHECK-NEXT:    ushll v3.2d, v3.2s, #0
+; CHECK-NEXT:    ushll v4.2d, v1.2s, #0
+; CHECK-NEXT:    ucvtf v0.2d, v0.2d
+; CHECK-NEXT:    ucvtf v1.2d, v2.2d
+; CHECK-NEXT:    ucvtf v2.2d, v3.2d
+; CHECK-NEXT:    ucvtf v3.2d, v4.2d
+; CHECK-NEXT:    ret
+  %1 = uitofp <8 x i8> %a to <8 x double>
+  ret <8 x double> %1
+}
+
+define <16 x double> @uitofp_v16i8_double(<16 x i8> %a) {
+; CHECK-LABEL: uitofp_v16i8_double:
+; CHECK:       // %bb.0:
+; CHECK-NEXT:    ext v3.16b, v0.16b, v0.16b, #8
+; CHECK-NEXT:    umov w11, v0.b[0]
+; CHECK-NEXT:    movi d1, #0x0000ff000000ff
+; CHECK-NEXT:    umov w8, v3.b[0]
+; CHECK-NEXT:    umov w9, v3.b[1]
+; CHECK-NEXT:    umov w10, v3.b[4]
+; CHECK-NEXT:    umov w12, v3.b[3]
+; CHECK-NEXT:    fmov s6, w11
+; CHECK-NEXT:    umov w11, v0.b[3]
+; CHECK-NEXT:    fmov s2, w8
+; CHECK-NEXT:    umov w8, v3.b[2]
+; CHECK-NEXT:    fmov s5, w10
+; CHECK-NEXT:    umov w10, v3.b[7]
+; CHECK-NEXT:    mov v2.s[1], w9
+; CHECK-NEXT:    umov w9, v3.b[6]
+; CHECK-NEXT:    fmov s4, w8
+; CHECK-NEXT:    umov w8, v3.b[5]
+; CHECK-NEXT:    fmov s3, w9
+; CHECK-NEXT:    umov w9, v0.b[2]
+; CHECK-NEXT:    mov v4.s[1], w12
+; CHECK-NEXT:    umov w12, v0.b[6]
+; CHECK-NEXT:    mov v5.s[1], w8
+; CHECK-NEXT:    umov w8, v0.b[4]
+; CHECK-NEXT:    mov v3.s[1], w10
+; CHECK-NEXT:    umov w10, v0.b[1]
+; CHECK-NEXT:    fmov s7, w9
+; CHECK-NEXT:    umov w9, v0.b[5]
+; CHECK-NEXT:    and v2.8b, v2.8b, v1.8b
+; CHECK-NEXT:    fmov s16, w8
+; CHECK-NEXT:    umov w8, v0.b[7]
+; CHECK-NEXT:    fmov s0, w12
+; CHECK-NEXT:    and v4.8b, v4.8b, v1.8b
+; CHECK-NEXT:    mov v6.s[1], w10
+; CHECK-NEXT:    and v5.8b, v5.8b, v1.8b
+; CHECK-NEXT:    mov v7.s[1], w11
+; CHECK-NEXT:    mov v16.s[1], w9
+; CHECK-NEXT:    mov v0.s[1], w8
+; CHECK-NEXT:    and v3.8b, v3.8b, v1.8b
+; CHECK-NEXT:    and v6.8b, v6.8b, v1.8b
+; CHECK-NEXT:    and v7.8b, v7.8b, v1.8b
+; CHECK-NEXT:    and v16.8b, v16.8b, v1.8b
+; CHECK-NEXT:    and v0.8b, v0.8b, v1.8b
+; CHECK-NEXT:    ushll v17.2d, v2.2s, #0
+; CHECK-NEXT:    ushll v18.2d, v4.2s, #0
+; CHECK-NEXT:    ushll v19.2d, v5.2s, #0
+; CHECK-NEXT:    ushll v20.2d, v3.2s, #0
+; CHECK-NEXT:    ushll v1.2d, v6.2s, #0
+; CHECK-NEXT:    ushll v2.2d, v7.2s, #0
+; CHECK-NEXT:    ushll v3.2d, v16.2s, #0
+; CHECK-NEXT:    ushll v4.2d, v0.2s, #0
+; CHECK-NEXT:    ucvtf v0.2d, v1.2d
+; CHECK-NEXT:    ucvtf v1.2d, v2.2d
+; CHECK-NEXT:    ucvtf v2.2d, v3.2d
+; CHECK-NEXT:    ucvtf v3.2d, v4.2d
+; CHECK-NEXT:    ucvtf v4.2d, v17.2d
+; CHECK-NEXT:    ucvtf v5.2d, v18.2d
+; CHECK-NEXT:    ucvtf v6.2d, v19.2d
+; CHECK-NEXT:    ucvtf v7.2d, v20.2d
+; CHECK-NEXT:    ret
+  %1 = uitofp <16 x i8> %a to <16 x double>
+  ret <16 x double> %1
+}
+
+define <8 x double> @uitofp_i16_double(<8 x i16> %a) {
+; CHECK-LABEL: uitofp_i16_double:
+; CHECK:       // %bb.0:
+; CHECK-NEXT:    ext v2.16b, v0.16b, v0.16b, #8
+; CHECK-NEXT:    umov w8, v0.h[0]
+; CHECK-NEXT:    umov w9, v0.h[2]
+; CHECK-NEXT:    umov w11, v0.h[1]
+; CHECK-NEXT:    movi d1, #0x00ffff0000ffff
+; CHECK-NEXT:    umov w10, v2.h[0]
+; CHECK-NEXT:    umov w12, v2.h[2]
+; CHECK-NEXT:    fmov s3, w8
+; CHECK-NEXT:    umov w8, v0.h[3]
+; CHECK-NEXT:    fmov s0, w9
+; CHECK-NEXT:    umov w9, v2.h[1]
+; CHECK-NEXT:    fmov s4, w10
+; CHECK-NEXT:    umov w10, v2.h[3]
+; CHECK-NEXT:    fmov s2, w12
+; CHECK-NEXT:    mov v0.s[1], w8
+; CHECK-NEXT:    mov v3.s[1], w11
+; CHECK-NEXT:    mov v4.s[1], w9
+; CHECK-NEXT:    mov v2.s[1], w10
+; CHECK-NEXT:    and v0.8b, v0.8b, v1.8b
+; CHECK-NEXT:    and v3.8b, v3.8b, v1.8b
+; CHECK-NEXT:    ushll v5.2d, v0.2s, #0
+; CHECK-NEXT:    and v0.8b, v4.8b, v1.8b
+; CHECK-NEXT:    and v1.8b, v2.8b, v1.8b
+; CHECK-NEXT:    ushll v3.2d, v3.2s, #0
+; CHECK-NEXT:    ushll v2.2d, v0.2s, #0
+; CHECK-NEXT:    ushll v4.2d, v1.2s, #0
+; CHECK-NEXT:    ucvtf v0.2d, v3.2d
+; CHECK-NEXT:    ucvtf v1.2d, v5.2d
+; CHECK-NEXT:    ucvtf v2.2d, v2.2d
+; CHECK-NEXT:    ucvtf v3.2d, v4.2d
+; CHECK-NEXT:    ret
+  %1 = uitofp <8 x i16> %a to <8 x double>
+  ret <8 x double> %1
+}
+
+define <8 x double> @uitofp_i32_double(<8 x i32> %a) {
+; CHECK-LABEL: uitofp_i32_double:
+; CHECK:       // %bb.0:
+; CHECK-NEXT:    ushll2 v2.2d, v0.4s, #0
+; CHECK-NEXT:    ushll2 v3.2d, v1.4s, #0
+; CHECK-NEXT:    ushll v0.2d, v0.2s, #0
+; CHECK-NEXT:    ushll v4.2d, v1.2s, #0
+; CHECK-NEXT:    ucvtf v1.2d, v2.2d
+; CHECK-NEXT:    ucvtf v0.2d, v0.2d
+; CHECK-NEXT:    ucvtf v3.2d, v3.2d
+; CHECK-NEXT:    ucvtf v2.2d, v4.2d
+; CHECK-NEXT:    ret
+  %1 = uitofp <8 x i32> %a to <8 x double>
+  ret <8 x double> %1
+}
+
+define <8 x double> @uitofp_i64_double(<8 x i64> %a) {
+; CHECK-LABEL: uitofp_i64_double:
+; CHECK:       // %bb.0:
+; CHECK-NEXT:    ucvtf v0.2d, v0.2d
+; CHECK-NEXT:    ucvtf v1.2d, v1.2d
+; CHECK-NEXT:    ucvtf v2.2d, v2.2d
+; CHECK-NEXT:    ucvtf v3.2d, v3.2d
+; CHECK-NEXT:    ret
+  %1 = uitofp <8 x i64> %a to <8 x double>
+  ret <8 x double> %1
+}


        


More information about the llvm-commits mailing list