[llvm] 09afe41 - [InstCombine] For vector extract when extract vector and insert value type is the same
Philip Reames via llvm-commits
llvm-commits at lists.llvm.org
Fri Aug 19 07:18:12 PDT 2022
JFYI, raised a correctness concern on the original review.
Philip
On 8/19/22 04:14, Caroline Concatto via llvm-commits wrote:
> Author: Caroline Concatto
> Date: 2022-08-19T12:13:03+01:00
> New Revision: 09afe4155b304c8ab9e90c5699f1c0f10ccd0a7e
>
> URL: https://github.com/llvm/llvm-project/commit/09afe4155b304c8ab9e90c5699f1c0f10ccd0a7e
> DIFF: https://github.com/llvm/llvm-project/commit/09afe4155b304c8ab9e90c5699f1c0f10ccd0a7e.diff
>
> LOG: [InstCombine] For vector extract when extract vector and insert value type is the same
>
> This patch has implements these optimizations:
>
> extract.vector(insert.vector(Vector, Value, Idx), Idx) --> Value
>
> extract.vector(insert.vector(Vector, Value, InsertIndex), ExtractIndex)
> --> extract.vector(Vector, ExtractIndex)
>
> Reviewed By: sdesmalen
>
> Differential Revision: https://reviews.llvm.org/D132137
>
> Added:
> llvm/test/Transforms/InstCombine/opts-tuples-extract-intrinsic.ll
>
> Modified:
> llvm/lib/Transforms/InstCombine/InstCombineCalls.cpp
>
> Removed:
>
>
>
> ################################################################################
> diff --git a/llvm/lib/Transforms/InstCombine/InstCombineCalls.cpp b/llvm/lib/Transforms/InstCombine/InstCombineCalls.cpp
> index 43b8bd41500c0..06db948cafcbf 100644
> --- a/llvm/lib/Transforms/InstCombine/InstCombineCalls.cpp
> +++ b/llvm/lib/Transforms/InstCombine/InstCombineCalls.cpp
> @@ -2409,7 +2409,31 @@ Instruction *InstCombinerImpl::visitCallInst(CallInst &CI) {
> Value *Vec = II->getArgOperand(0);
> Value *Idx = II->getArgOperand(1);
>
> - auto *DstTy = dyn_cast<FixedVectorType>(II->getType());
> + Type *ReturnType = II->getType();
> + // (extract_vector (insert_vector InsertTuple, InsertValue, InsertIdx),
> + // ExtractIdx)
> + unsigned ExtractIdx = cast<ConstantInt>(Idx)->getZExtValue();
> + Value *InsertTuple, *InsertIdx, *InsertValue;
> + if (match(Vec, m_Intrinsic<Intrinsic::vector_insert>(m_Value(InsertTuple),
> + m_Value(InsertValue),
> + m_Value(InsertIdx))) &&
> + InsertValue->getType() == ReturnType) {
> + unsigned Index = cast<ConstantInt>(InsertIdx)->getZExtValue();
> + // Case where we get the same index right after setting it.
> + // extract.vector(insert.vector(InsertTuple, InsertValue, Idx), Idx) -->
> + // InsertValue
> + if (ExtractIdx == Index)
> + return replaceInstUsesWith(CI, InsertValue);
> + // If we are getting a
> diff erent index than what was set in the
> + // insert.vector intrinsic. We can just set the input tuple to the one up
> + // in the chain. extract.vector(insert.vector(InsertTuple, InsertValue,
> + // InsertIndex), ExtractIndex)
> + // --> extract.vector(InsertTuple, ExtractIndex)
> + else
> + return replaceOperand(CI, 0, InsertTuple);
> + }
> +
> + auto *DstTy = dyn_cast<FixedVectorType>(ReturnType);
> auto *VecTy = dyn_cast<FixedVectorType>(Vec->getType());
>
> // Only canonicalize if the the destination vector and Vec are fixed
>
> diff --git a/llvm/test/Transforms/InstCombine/opts-tuples-extract-intrinsic.ll b/llvm/test/Transforms/InstCombine/opts-tuples-extract-intrinsic.ll
> new file mode 100644
> index 0000000000000..4303d963ea886
> --- /dev/null
> +++ b/llvm/test/Transforms/InstCombine/opts-tuples-extract-intrinsic.ll
> @@ -0,0 +1,44 @@
> +; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
> +; RUN: opt -S -passes=instcombine < %s | FileCheck %s
> +
> +; Check that the redundant sequences of extract/insert are eliminated.
> +
> +; extract.vector(insert.vector(Tuple, Value, Idx), Idx) --> Value
> +define <vscale x 16 x i8> @test_extract_insert_same_idx(<vscale x 64 x i8> %v0, <vscale x 16 x i8> %v1) {
> +; CHECK-LABEL: @test_extract_insert_same_idx(
> +; CHECK-NEXT: ret <vscale x 16 x i8> [[V1:%.*]]
> +;
> + %vec.ins = call <vscale x 64 x i8> @llvm.vector.insert.nxv64i8.nxv16i8(<vscale x 64 x i8> %v0, <vscale x 16 x i8> %v1, i64 48)
> + %vec.ext = call <vscale x 16 x i8> @llvm.vector.extract.nxv16i8.nxv64i8(<vscale x 64 x i8> %vec.ins, i64 48)
> + ret <vscale x 16 x i8> %vec.ext
> +}
> +
> +; extract.vector(insert.vector(Vector, Value, InsertIndex), ExtractIndex)
> +; --> extract.vector(Vector, ExtractIndex)
> +define <vscale x 16 x i8> @test_extract_insert_dif_idx(<vscale x 64 x i8> %v0, <vscale x 16 x i8> %v1) {
> +; CHECK-LABEL: @test_extract_insert_dif_idx(
> +; CHECK-NEXT: [[VEC_EXT:%.*]] = call <vscale x 16 x i8> @llvm.vector.extract.nxv16i8.nxv64i8(<vscale x 64 x i8> [[V0:%.*]], i64 0)
> +; CHECK-NEXT: ret <vscale x 16 x i8> [[VEC_EXT]]
> +;
> + %vec.ins = call <vscale x 64 x i8> @llvm.vector.insert.nxv64i8.nxv16i8(<vscale x 64 x i8> %v0, <vscale x 16 x i8> %v1, i64 48)
> + %vec.ext = call <vscale x 16 x i8> @llvm.vector.extract.nxv16i8.nxv64i8(<vscale x 64 x i8> %vec.ins, i64 0)
> + ret <vscale x 16 x i8> %vec.ext
> +}
> +
> +; Negative test
> +; The extracted vector-size != inserted vector-size
> +define <vscale x 32 x i8> @neg_test_extract_insert_same_idx_dif_ret_size(<vscale x 64 x i8> %v0, <vscale x 16 x i8> %v1) {
> +; CHECK-LABEL: @neg_test_extract_insert_same_idx_dif_ret_size(
> +; CHECK-NEXT: [[VEC_INS:%.*]] = call <vscale x 64 x i8> @llvm.vector.insert.nxv64i8.nxv16i8(<vscale x 64 x i8> [[V0:%.*]], <vscale x 16 x i8> [[V1:%.*]], i64 32)
> +; CHECK-NEXT: [[VEC_EXT:%.*]] = call <vscale x 32 x i8> @llvm.vector.extract.nxv32i8.nxv64i8(<vscale x 64 x i8> [[VEC_INS]], i64 32)
> +; CHECK-NEXT: ret <vscale x 32 x i8> [[VEC_EXT]]
> +;
> + %vec.ins = call <vscale x 64 x i8> @llvm.vector.insert.nxv64i8.nxv16i8(<vscale x 64 x i8> %v0, <vscale x 16 x i8> %v1, i64 32)
> + %vec.ext = call <vscale x 32 x i8> @llvm.vector.extract.nxv32i8.nxv64i8(<vscale x 64 x i8> %vec.ins, i64 32)
> + ret <vscale x 32 x i8> %vec.ext
> +}
> +
> +
> +declare <vscale x 64 x i8> @llvm.vector.insert.nxv64i8.nxv16i8(<vscale x 64 x i8>, <vscale x 16 x i8>, i64)
> +declare <vscale x 16 x i8> @llvm.vector.extract.nxv16i8.nxv64i8(<vscale x 64 x i8>, i64)
> +declare <vscale x 32 x i8> @llvm.vector.extract.nxv32i8.nxv64i8(<vscale x 64 x i8>, i64)
>
>
>
> _______________________________________________
> llvm-commits mailing list
> llvm-commits at lists.llvm.org
> https://lists.llvm.org/cgi-bin/mailman/listinfo/llvm-commits
More information about the llvm-commits
mailing list