[PATCH] D20468: [X86][AVX] Ensure zero-extension of _mm256_extract_epi8 and _mm256_extract_epi16
Simon Pilgrim via cfe-commits
cfe-commits at lists.llvm.org
Sat May 21 14:20:55 PDT 2016
This revision was automatically updated to reflect the committed changes.
Closed by commit rL270330: [X86][AVX] Ensure zero-extension of _mm256_extract_epi8 and _mm256_extract_epi16 (authored by RKSimon).
Changed prior to commit:
http://reviews.llvm.org/D20468?vs=57927&id=58045#toc
Repository:
rL LLVM
http://reviews.llvm.org/D20468
Files:
cfe/trunk/lib/Headers/avxintrin.h
cfe/trunk/test/CodeGen/avx-builtins.c
Index: cfe/trunk/test/CodeGen/avx-builtins.c
===================================================================
--- cfe/trunk/test/CodeGen/avx-builtins.c
+++ cfe/trunk/test/CodeGen/avx-builtins.c
@@ -314,21 +314,19 @@
return _mm256_dp_ps(A, B, 7);
}
-// FIXME: ZEXT instead of SEXT
int test_mm256_extract_epi8(__m256i A) {
// CHECK-LABEL: test_mm256_extract_epi8
// CHECK: and i32 %{{.*}}, 31
// CHECK: extractelement <32 x i8> %{{.*}}, i32 %{{.*}}
- // CHECK: ext i8 %{{.*}} to i32
+ // CHECK: zext i8 %{{.*}} to i32
return _mm256_extract_epi8(A, 32);
}
-// FIXME: ZEXT instead of SEXT
int test_mm256_extract_epi16(__m256i A) {
// CHECK-LABEL: test_mm256_extract_epi16
// CHECK: and i32 %{{.*}}, 15
// CHECK: extractelement <16 x i16> %{{.*}}, i32 %{{.*}}
- // CHECK: ext i16 %{{.*}} to i32
+ // CHECK: zext i16 %{{.*}} to i32
return _mm256_extract_epi16(A, 16);
}
Index: cfe/trunk/lib/Headers/avxintrin.h
===================================================================
--- cfe/trunk/lib/Headers/avxintrin.h
+++ cfe/trunk/lib/Headers/avxintrin.h
@@ -1875,13 +1875,13 @@
/// \param __imm
/// An immediate integer operand with bits [3:0] determining which vector
/// element is extracted and returned.
-/// \returns A 32-bit integer containing the extracted 16 bits of extended
+/// \returns A 32-bit integer containing the extracted 16 bits of zero extended
/// packed data.
static __inline int __DEFAULT_FN_ATTRS
_mm256_extract_epi16(__m256i __a, const int __imm)
{
__v16hi __b = (__v16hi)__a;
- return __b[__imm & 15];
+ return (unsigned short)__b[__imm & 15];
}
/// \brief Takes a [32 x i8] vector and returns the vector element value
@@ -1897,13 +1897,13 @@
/// \param __imm
/// An immediate integer operand with bits [4:0] determining which vector
/// element is extracted and returned.
-/// \returns A 32-bit integer containing the extracted 8 bits of extended packed
-/// data.
+/// \returns A 32-bit integer containing the extracted 8 bits of zero extended
+/// packed data.
static __inline int __DEFAULT_FN_ATTRS
_mm256_extract_epi8(__m256i __a, const int __imm)
{
__v32qi __b = (__v32qi)__a;
- return __b[__imm & 31];
+ return (unsigned char)__b[__imm & 31];
}
#ifdef __x86_64__
-------------- next part --------------
A non-text attachment was scrubbed...
Name: D20468.58045.patch
Type: text/x-patch
Size: 2288 bytes
Desc: not available
URL: <http://lists.llvm.org/pipermail/cfe-commits/attachments/20160521/29b28c81/attachment.bin>
More information about the cfe-commits mailing list