[llvm] 6526fa3 - [NFC][VectorCombine] Add baseline test coverage for GEP scalarization
Roman Lebedev via llvm-commits
llvm-commits at lists.llvm.org
Thu Oct 7 15:16:19 PDT 2021
Author: Roman Lebedev
Date: 2021-10-08T01:16:08+03:00
New Revision: 6526fa35894f2782abed9d608d91019f98ed397d
URL: https://github.com/llvm/llvm-project/commit/6526fa35894f2782abed9d608d91019f98ed397d
DIFF: https://github.com/llvm/llvm-project/commit/6526fa35894f2782abed9d608d91019f98ed397d.diff
LOG: [NFC][VectorCombine] Add baseline test coverage for GEP scalarization
Added:
llvm/test/Transforms/VectorCombine/X86/scalarize-vector-gep.ll
Modified:
Removed:
################################################################################
diff --git a/llvm/test/Transforms/VectorCombine/X86/scalarize-vector-gep.ll b/llvm/test/Transforms/VectorCombine/X86/scalarize-vector-gep.ll
new file mode 100644
index 0000000000000..24f3e09c4d163
--- /dev/null
+++ b/llvm/test/Transforms/VectorCombine/X86/scalarize-vector-gep.ll
@@ -0,0 +1,825 @@
+; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
+; RUN: opt < %s -vector-combine -S -mtriple=x86_64-- -mattr=SSE2 | FileCheck %s --check-prefixes=CHECK,SSE
+; RUN: opt < %s -vector-combine -S -mtriple=x86_64-- -mattr=AVX2 | FileCheck %s --check-prefixes=CHECK,AVX
+
+target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128"
+
+declare void @use(i64*)
+
+;-------------------------------------------------------------------------------
+
+define void @both_operands_need_extraction.2elts(<2 x i64*> %baseptrs, <2 x i64> %indices) {
+; CHECK-LABEL: @both_operands_need_extraction.2elts(
+; CHECK-NEXT: [[PTRS:%.*]] = getelementptr inbounds i64, <2 x i64*> [[BASEPTRS:%.*]], <2 x i64> [[INDICES:%.*]]
+; CHECK-NEXT: [[PTR_0:%.*]] = extractelement <2 x i64*> [[PTRS]], i64 0
+; CHECK-NEXT: call void @use(i64* [[PTR_0]])
+; CHECK-NEXT: [[PTR_1:%.*]] = extractelement <2 x i64*> [[PTRS]], i64 1
+; CHECK-NEXT: call void @use(i64* [[PTR_1]])
+; CHECK-NEXT: ret void
+;
+ %ptrs = getelementptr inbounds i64, <2 x i64*> %baseptrs, <2 x i64> %indices
+
+ %ptr.0 = extractelement <2 x i64*> %ptrs, i64 0
+ call void @use(i64* %ptr.0)
+
+ %ptr.1 = extractelement <2 x i64*> %ptrs, i64 1
+ call void @use(i64* %ptr.1)
+
+ ret void
+}
+
+define void @both_operands_need_extraction.3elts(<3 x i64*> %baseptrs, <3 x i64> %indices) {
+; CHECK-LABEL: @both_operands_need_extraction.3elts(
+; CHECK-NEXT: [[PTRS:%.*]] = getelementptr inbounds i64, <3 x i64*> [[BASEPTRS:%.*]], <3 x i64> [[INDICES:%.*]]
+; CHECK-NEXT: [[PTR_0:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 0
+; CHECK-NEXT: call void @use(i64* [[PTR_0]])
+; CHECK-NEXT: [[PTR_1:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 1
+; CHECK-NEXT: call void @use(i64* [[PTR_1]])
+; CHECK-NEXT: [[PTR_2:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 2
+; CHECK-NEXT: call void @use(i64* [[PTR_2]])
+; CHECK-NEXT: ret void
+;
+ %ptrs = getelementptr inbounds i64, <3 x i64*> %baseptrs, <3 x i64> %indices
+
+ %ptr.0 = extractelement <3 x i64*> %ptrs, i64 0
+ call void @use(i64* %ptr.0)
+
+ %ptr.1 = extractelement <3 x i64*> %ptrs, i64 1
+ call void @use(i64* %ptr.1)
+
+ %ptr.2 = extractelement <3 x i64*> %ptrs, i64 2
+ call void @use(i64* %ptr.2)
+
+ ret void
+}
+
+define void @both_operands_need_extraction.4elts(<4 x i64*> %baseptrs, <4 x i64> %indices) {
+; CHECK-LABEL: @both_operands_need_extraction.4elts(
+; CHECK-NEXT: [[PTRS:%.*]] = getelementptr inbounds i64, <4 x i64*> [[BASEPTRS:%.*]], <4 x i64> [[INDICES:%.*]]
+; CHECK-NEXT: [[PTR_0:%.*]] = extractelement <4 x i64*> [[PTRS]], i64 0
+; CHECK-NEXT: call void @use(i64* [[PTR_0]])
+; CHECK-NEXT: [[PTR_1:%.*]] = extractelement <4 x i64*> [[PTRS]], i64 1
+; CHECK-NEXT: call void @use(i64* [[PTR_1]])
+; CHECK-NEXT: [[PTR_2:%.*]] = extractelement <4 x i64*> [[PTRS]], i64 2
+; CHECK-NEXT: call void @use(i64* [[PTR_2]])
+; CHECK-NEXT: [[PTR_3:%.*]] = extractelement <4 x i64*> [[PTRS]], i64 3
+; CHECK-NEXT: call void @use(i64* [[PTR_3]])
+; CHECK-NEXT: ret void
+;
+ %ptrs = getelementptr inbounds i64, <4 x i64*> %baseptrs, <4 x i64> %indices
+
+ %ptr.0 = extractelement <4 x i64*> %ptrs, i64 0
+ call void @use(i64* %ptr.0)
+
+ %ptr.1 = extractelement <4 x i64*> %ptrs, i64 1
+ call void @use(i64* %ptr.1)
+
+ %ptr.2 = extractelement <4 x i64*> %ptrs, i64 2
+ call void @use(i64* %ptr.2)
+
+ %ptr.3 = extractelement <4 x i64*> %ptrs, i64 3
+ call void @use(i64* %ptr.3)
+
+ ret void
+}
+
+;-------------------------------------------------------------------------------
+
+define void @indicies_need_extraction.2elts(i64* %baseptr, <2 x i64> %indices) {
+; CHECK-LABEL: @indicies_need_extraction.2elts(
+; CHECK-NEXT: [[PTRS:%.*]] = getelementptr inbounds i64, i64* [[BASEPTR:%.*]], <2 x i64> [[INDICES:%.*]]
+; CHECK-NEXT: [[PTR_0:%.*]] = extractelement <2 x i64*> [[PTRS]], i64 0
+; CHECK-NEXT: call void @use(i64* [[PTR_0]])
+; CHECK-NEXT: [[PTR_1:%.*]] = extractelement <2 x i64*> [[PTRS]], i64 1
+; CHECK-NEXT: call void @use(i64* [[PTR_1]])
+; CHECK-NEXT: ret void
+;
+ %ptrs = getelementptr inbounds i64, i64* %baseptr, <2 x i64> %indices
+
+ %ptr.0 = extractelement <2 x i64*> %ptrs, i64 0
+ call void @use(i64* %ptr.0)
+
+ %ptr.1 = extractelement <2 x i64*> %ptrs, i64 1
+ call void @use(i64* %ptr.1)
+
+ ret void
+}
+
+define void @indicies_need_extraction.3elts(i64* %baseptr, <3 x i64> %indices) {
+; CHECK-LABEL: @indicies_need_extraction.3elts(
+; CHECK-NEXT: [[PTRS:%.*]] = getelementptr inbounds i64, i64* [[BASEPTR:%.*]], <3 x i64> [[INDICES:%.*]]
+; CHECK-NEXT: [[PTR_0:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 0
+; CHECK-NEXT: call void @use(i64* [[PTR_0]])
+; CHECK-NEXT: [[PTR_1:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 1
+; CHECK-NEXT: call void @use(i64* [[PTR_1]])
+; CHECK-NEXT: [[PTR_2:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 2
+; CHECK-NEXT: call void @use(i64* [[PTR_2]])
+; CHECK-NEXT: ret void
+;
+ %ptrs = getelementptr inbounds i64, i64* %baseptr, <3 x i64> %indices
+
+ %ptr.0 = extractelement <3 x i64*> %ptrs, i64 0
+ call void @use(i64* %ptr.0)
+
+ %ptr.1 = extractelement <3 x i64*> %ptrs, i64 1
+ call void @use(i64* %ptr.1)
+
+ %ptr.2 = extractelement <3 x i64*> %ptrs, i64 2
+ call void @use(i64* %ptr.2)
+
+ ret void
+}
+
+define void @indicies_need_extraction.4elts(i64* %baseptr, <4 x i64> %indices) {
+; CHECK-LABEL: @indicies_need_extraction.4elts(
+; CHECK-NEXT: [[PTRS:%.*]] = getelementptr inbounds i64, i64* [[BASEPTR:%.*]], <4 x i64> [[INDICES:%.*]]
+; CHECK-NEXT: [[PTR_0:%.*]] = extractelement <4 x i64*> [[PTRS]], i64 0
+; CHECK-NEXT: call void @use(i64* [[PTR_0]])
+; CHECK-NEXT: [[PTR_1:%.*]] = extractelement <4 x i64*> [[PTRS]], i64 1
+; CHECK-NEXT: call void @use(i64* [[PTR_1]])
+; CHECK-NEXT: [[PTR_2:%.*]] = extractelement <4 x i64*> [[PTRS]], i64 2
+; CHECK-NEXT: call void @use(i64* [[PTR_2]])
+; CHECK-NEXT: [[PTR_3:%.*]] = extractelement <4 x i64*> [[PTRS]], i64 3
+; CHECK-NEXT: call void @use(i64* [[PTR_3]])
+; CHECK-NEXT: ret void
+;
+ %ptrs = getelementptr inbounds i64, i64* %baseptr, <4 x i64> %indices
+
+ %ptr.0 = extractelement <4 x i64*> %ptrs, i64 0
+ call void @use(i64* %ptr.0)
+
+ %ptr.1 = extractelement <4 x i64*> %ptrs, i64 1
+ call void @use(i64* %ptr.1)
+
+ %ptr.2 = extractelement <4 x i64*> %ptrs, i64 2
+ call void @use(i64* %ptr.2)
+
+ %ptr.3 = extractelement <4 x i64*> %ptrs, i64 3
+ call void @use(i64* %ptr.3)
+
+ ret void
+}
+
+;-------------------------------------------------------------------------------
+
+define void @baseptrs_need_extraction.2elts(<2 x i64*> %baseptrs, i64 %indice) {
+; CHECK-LABEL: @baseptrs_need_extraction.2elts(
+; CHECK-NEXT: [[PTRS:%.*]] = getelementptr inbounds i64, <2 x i64*> [[BASEPTRS:%.*]], i64 [[INDICE:%.*]]
+; CHECK-NEXT: [[PTR_0:%.*]] = extractelement <2 x i64*> [[PTRS]], i64 0
+; CHECK-NEXT: call void @use(i64* [[PTR_0]])
+; CHECK-NEXT: [[PTR_1:%.*]] = extractelement <2 x i64*> [[PTRS]], i64 1
+; CHECK-NEXT: call void @use(i64* [[PTR_1]])
+; CHECK-NEXT: ret void
+;
+ %ptrs = getelementptr inbounds i64, <2 x i64*> %baseptrs, i64 %indice
+
+ %ptr.0 = extractelement <2 x i64*> %ptrs, i64 0
+ call void @use(i64* %ptr.0)
+
+ %ptr.1 = extractelement <2 x i64*> %ptrs, i64 1
+ call void @use(i64* %ptr.1)
+
+ ret void
+}
+
+define void @baseptrs_need_extraction.3elts(<3 x i64*> %baseptrs, i64 %indice) {
+; CHECK-LABEL: @baseptrs_need_extraction.3elts(
+; CHECK-NEXT: [[PTRS:%.*]] = getelementptr inbounds i64, <3 x i64*> [[BASEPTRS:%.*]], i64 [[INDICE:%.*]]
+; CHECK-NEXT: [[PTR_0:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 0
+; CHECK-NEXT: call void @use(i64* [[PTR_0]])
+; CHECK-NEXT: [[PTR_1:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 1
+; CHECK-NEXT: call void @use(i64* [[PTR_1]])
+; CHECK-NEXT: [[PTR_2:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 2
+; CHECK-NEXT: call void @use(i64* [[PTR_2]])
+; CHECK-NEXT: ret void
+;
+ %ptrs = getelementptr inbounds i64, <3 x i64*> %baseptrs, i64 %indice
+
+ %ptr.0 = extractelement <3 x i64*> %ptrs, i64 0
+ call void @use(i64* %ptr.0)
+
+ %ptr.1 = extractelement <3 x i64*> %ptrs, i64 1
+ call void @use(i64* %ptr.1)
+
+ %ptr.2 = extractelement <3 x i64*> %ptrs, i64 2
+ call void @use(i64* %ptr.2)
+
+ ret void
+}
+
+define void @baseptrs_need_extraction.4elts(<4 x i64*> %baseptrs, i64 %indice) {
+; CHECK-LABEL: @baseptrs_need_extraction.4elts(
+; CHECK-NEXT: [[PTRS:%.*]] = getelementptr inbounds i64, <4 x i64*> [[BASEPTRS:%.*]], i64 [[INDICE:%.*]]
+; CHECK-NEXT: [[PTR_0:%.*]] = extractelement <4 x i64*> [[PTRS]], i64 0
+; CHECK-NEXT: call void @use(i64* [[PTR_0]])
+; CHECK-NEXT: [[PTR_1:%.*]] = extractelement <4 x i64*> [[PTRS]], i64 1
+; CHECK-NEXT: call void @use(i64* [[PTR_1]])
+; CHECK-NEXT: [[PTR_2:%.*]] = extractelement <4 x i64*> [[PTRS]], i64 2
+; CHECK-NEXT: call void @use(i64* [[PTR_2]])
+; CHECK-NEXT: [[PTR_3:%.*]] = extractelement <4 x i64*> [[PTRS]], i64 3
+; CHECK-NEXT: call void @use(i64* [[PTR_3]])
+; CHECK-NEXT: ret void
+;
+ %ptrs = getelementptr inbounds i64, <4 x i64*> %baseptrs, i64 %indice
+
+ %ptr.0 = extractelement <4 x i64*> %ptrs, i64 0
+ call void @use(i64* %ptr.0)
+
+ %ptr.1 = extractelement <4 x i64*> %ptrs, i64 1
+ call void @use(i64* %ptr.1)
+
+ %ptr.2 = extractelement <4 x i64*> %ptrs, i64 2
+ call void @use(i64* %ptr.2)
+
+ %ptr.3 = extractelement <4 x i64*> %ptrs, i64 3
+ call void @use(i64* %ptr.3)
+
+ ret void
+}
+
+;-------------------------------------------------------------------------------
+
+define void @first_baseptr_is_known.2elts(<2 x i64*> %baseptrs, i64* %second_baseptr, <2 x i64> %indices) {
+; CHECK-LABEL: @first_baseptr_is_known.2elts(
+; CHECK-NEXT: [[BASEPTRS_NEW:%.*]] = insertelement <2 x i64*> [[BASEPTRS:%.*]], i64* [[SECOND_BASEPTR:%.*]], i64 0
+; CHECK-NEXT: [[PTRS:%.*]] = getelementptr inbounds i64, <2 x i64*> [[BASEPTRS_NEW]], <2 x i64> [[INDICES:%.*]]
+; CHECK-NEXT: [[PTR_0:%.*]] = extractelement <2 x i64*> [[PTRS]], i64 0
+; CHECK-NEXT: call void @use(i64* [[PTR_0]])
+; CHECK-NEXT: [[PTR_1:%.*]] = extractelement <2 x i64*> [[PTRS]], i64 1
+; CHECK-NEXT: call void @use(i64* [[PTR_1]])
+; CHECK-NEXT: ret void
+;
+ %baseptrs.new = insertelement <2 x i64*> %baseptrs, i64* %second_baseptr, i64 0
+ %ptrs = getelementptr inbounds i64, <2 x i64*> %baseptrs.new, <2 x i64> %indices
+
+ %ptr.0 = extractelement <2 x i64*> %ptrs, i64 0
+ call void @use(i64* %ptr.0)
+
+ %ptr.1 = extractelement <2 x i64*> %ptrs, i64 1
+ call void @use(i64* %ptr.1)
+
+ ret void
+}
+
+define void @first_indice_is_known.2elts(<2 x i64*> %baseptrs, <2 x i64> %indices, i64 %second_indice) {
+; CHECK-LABEL: @first_indice_is_known.2elts(
+; CHECK-NEXT: [[INDICES_NEW:%.*]] = insertelement <2 x i64> [[INDICES:%.*]], i64 [[SECOND_INDICE:%.*]], i64 0
+; CHECK-NEXT: [[PTRS:%.*]] = getelementptr inbounds i64, <2 x i64*> [[BASEPTRS:%.*]], <2 x i64> [[INDICES_NEW]]
+; CHECK-NEXT: [[PTR_0:%.*]] = extractelement <2 x i64*> [[PTRS]], i64 0
+; CHECK-NEXT: call void @use(i64* [[PTR_0]])
+; CHECK-NEXT: [[PTR_1:%.*]] = extractelement <2 x i64*> [[PTRS]], i64 1
+; CHECK-NEXT: call void @use(i64* [[PTR_1]])
+; CHECK-NEXT: ret void
+;
+ %indices.new = insertelement <2 x i64> %indices, i64 %second_indice, i64 0
+ %ptrs = getelementptr inbounds i64, <2 x i64*> %baseptrs, <2 x i64> %indices.new
+
+ %ptr.0 = extractelement <2 x i64*> %ptrs, i64 0
+ call void @use(i64* %ptr.0)
+
+ %ptr.1 = extractelement <2 x i64*> %ptrs, i64 1
+ call void @use(i64* %ptr.1)
+
+ ret void
+}
+
+define void @first_indice_and_baseptr_are_known.2elts(<2 x i64*> %baseptrs, i64* %second_baseptr, <2 x i64> %indices, i64 %second_indice) {
+; CHECK-LABEL: @first_indice_and_baseptr_are_known.2elts(
+; CHECK-NEXT: [[BASEPTRS_NEW:%.*]] = insertelement <2 x i64*> [[BASEPTRS:%.*]], i64* [[SECOND_BASEPTR:%.*]], i64 0
+; CHECK-NEXT: [[INDICES_NEW:%.*]] = insertelement <2 x i64> [[INDICES:%.*]], i64 [[SECOND_INDICE:%.*]], i64 0
+; CHECK-NEXT: [[PTRS:%.*]] = getelementptr inbounds i64, <2 x i64*> [[BASEPTRS_NEW]], <2 x i64> [[INDICES_NEW]]
+; CHECK-NEXT: [[PTR_0:%.*]] = extractelement <2 x i64*> [[PTRS]], i64 0
+; CHECK-NEXT: call void @use(i64* [[PTR_0]])
+; CHECK-NEXT: [[PTR_1:%.*]] = extractelement <2 x i64*> [[PTRS]], i64 1
+; CHECK-NEXT: call void @use(i64* [[PTR_1]])
+; CHECK-NEXT: ret void
+;
+ %baseptrs.new = insertelement <2 x i64*> %baseptrs, i64* %second_baseptr, i64 0
+ %indices.new = insertelement <2 x i64> %indices, i64 %second_indice, i64 0
+ %ptrs = getelementptr inbounds i64, <2 x i64*> %baseptrs.new, <2 x i64> %indices.new
+
+ %ptr.0 = extractelement <2 x i64*> %ptrs, i64 0
+ call void @use(i64* %ptr.0)
+
+ %ptr.1 = extractelement <2 x i64*> %ptrs, i64 1
+ call void @use(i64* %ptr.1)
+
+ ret void
+}
+
+;-------------------------------------------------------------------------------
+
+define void @first_baseptr_is_known.3elts(<3 x i64*> %baseptrs, i64* %second_baseptr, <3 x i64> %indices) {
+; CHECK-LABEL: @first_baseptr_is_known.3elts(
+; CHECK-NEXT: [[BASEPTRS_NEW:%.*]] = insertelement <3 x i64*> [[BASEPTRS:%.*]], i64* [[SECOND_BASEPTR:%.*]], i64 0
+; CHECK-NEXT: [[PTRS:%.*]] = getelementptr inbounds i64, <3 x i64*> [[BASEPTRS_NEW]], <3 x i64> [[INDICES:%.*]]
+; CHECK-NEXT: [[PTR_0:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 0
+; CHECK-NEXT: call void @use(i64* [[PTR_0]])
+; CHECK-NEXT: [[PTR_1:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 1
+; CHECK-NEXT: call void @use(i64* [[PTR_1]])
+; CHECK-NEXT: [[PTR_2:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 2
+; CHECK-NEXT: call void @use(i64* [[PTR_2]])
+; CHECK-NEXT: ret void
+;
+ %baseptrs.new = insertelement <3 x i64*> %baseptrs, i64* %second_baseptr, i64 0
+ %ptrs = getelementptr inbounds i64, <3 x i64*> %baseptrs.new, <3 x i64> %indices
+
+ %ptr.0 = extractelement <3 x i64*> %ptrs, i64 0
+ call void @use(i64* %ptr.0)
+
+ %ptr.1 = extractelement <3 x i64*> %ptrs, i64 1
+ call void @use(i64* %ptr.1)
+
+ %ptr.2 = extractelement <3 x i64*> %ptrs, i64 2
+ call void @use(i64* %ptr.2)
+
+ ret void
+}
+
+define void @first_indice_is_known.3elts(<3 x i64*> %baseptrs, <3 x i64> %indices, i64 %second_indice) {
+; CHECK-LABEL: @first_indice_is_known.3elts(
+; CHECK-NEXT: [[INDICES_NEW:%.*]] = insertelement <3 x i64> [[INDICES:%.*]], i64 [[SECOND_INDICE:%.*]], i64 0
+; CHECK-NEXT: [[PTRS:%.*]] = getelementptr inbounds i64, <3 x i64*> [[BASEPTRS:%.*]], <3 x i64> [[INDICES_NEW]]
+; CHECK-NEXT: [[PTR_0:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 0
+; CHECK-NEXT: call void @use(i64* [[PTR_0]])
+; CHECK-NEXT: [[PTR_1:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 1
+; CHECK-NEXT: call void @use(i64* [[PTR_1]])
+; CHECK-NEXT: [[PTR_2:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 2
+; CHECK-NEXT: call void @use(i64* [[PTR_2]])
+; CHECK-NEXT: ret void
+;
+ %indices.new = insertelement <3 x i64> %indices, i64 %second_indice, i64 0
+ %ptrs = getelementptr inbounds i64, <3 x i64*> %baseptrs, <3 x i64> %indices.new
+
+ %ptr.0 = extractelement <3 x i64*> %ptrs, i64 0
+ call void @use(i64* %ptr.0)
+
+ %ptr.1 = extractelement <3 x i64*> %ptrs, i64 1
+ call void @use(i64* %ptr.1)
+
+ %ptr.2 = extractelement <3 x i64*> %ptrs, i64 2
+ call void @use(i64* %ptr.2)
+
+ ret void
+}
+
+define void @first_indice_and_baseptr_are_known.3elts(<3 x i64*> %baseptrs, i64* %second_baseptr, <3 x i64> %indices, i64 %second_indice) {
+; CHECK-LABEL: @first_indice_and_baseptr_are_known.3elts(
+; CHECK-NEXT: [[BASEPTRS_NEW:%.*]] = insertelement <3 x i64*> [[BASEPTRS:%.*]], i64* [[SECOND_BASEPTR:%.*]], i64 0
+; CHECK-NEXT: [[INDICES_NEW:%.*]] = insertelement <3 x i64> [[INDICES:%.*]], i64 [[SECOND_INDICE:%.*]], i64 0
+; CHECK-NEXT: [[PTRS:%.*]] = getelementptr inbounds i64, <3 x i64*> [[BASEPTRS_NEW]], <3 x i64> [[INDICES_NEW]]
+; CHECK-NEXT: [[PTR_0:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 0
+; CHECK-NEXT: call void @use(i64* [[PTR_0]])
+; CHECK-NEXT: [[PTR_1:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 1
+; CHECK-NEXT: call void @use(i64* [[PTR_1]])
+; CHECK-NEXT: [[PTR_2:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 2
+; CHECK-NEXT: call void @use(i64* [[PTR_2]])
+; CHECK-NEXT: ret void
+;
+ %baseptrs.new = insertelement <3 x i64*> %baseptrs, i64* %second_baseptr, i64 0
+ %indices.new = insertelement <3 x i64> %indices, i64 %second_indice, i64 0
+ %ptrs = getelementptr inbounds i64, <3 x i64*> %baseptrs.new, <3 x i64> %indices.new
+
+ %ptr.0 = extractelement <3 x i64*> %ptrs, i64 0
+ call void @use(i64* %ptr.0)
+
+ %ptr.1 = extractelement <3 x i64*> %ptrs, i64 1
+ call void @use(i64* %ptr.1)
+
+ %ptr.2 = extractelement <3 x i64*> %ptrs, i64 2
+ call void @use(i64* %ptr.2)
+
+ ret void
+}
+
+;-------------------------------------------------------------------------------
+
+define void @first_two_baseptrs_is_known.3elts(<3 x i64*> %baseptrs, i64* %second_baseptr, i64* %third_baseptr, <3 x i64> %indices) {
+; CHECK-LABEL: @first_two_baseptrs_is_known.3elts(
+; CHECK-NEXT: [[BASEPTRS_NEW_TMP:%.*]] = insertelement <3 x i64*> [[BASEPTRS:%.*]], i64* [[SECOND_BASEPTR:%.*]], i64 0
+; CHECK-NEXT: [[BASEPTRS_NEW:%.*]] = insertelement <3 x i64*> [[BASEPTRS_NEW_TMP]], i64* [[THIRD_BASEPTR:%.*]], i64 1
+; CHECK-NEXT: [[PTRS:%.*]] = getelementptr inbounds i64, <3 x i64*> [[BASEPTRS_NEW]], <3 x i64> [[INDICES:%.*]]
+; CHECK-NEXT: [[PTR_0:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 0
+; CHECK-NEXT: call void @use(i64* [[PTR_0]])
+; CHECK-NEXT: [[PTR_1:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 1
+; CHECK-NEXT: call void @use(i64* [[PTR_1]])
+; CHECK-NEXT: [[PTR_2:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 2
+; CHECK-NEXT: call void @use(i64* [[PTR_2]])
+; CHECK-NEXT: ret void
+;
+ %baseptrs.new.tmp = insertelement <3 x i64*> %baseptrs, i64* %second_baseptr, i64 0
+ %baseptrs.new = insertelement <3 x i64*> %baseptrs.new.tmp, i64* %third_baseptr, i64 1
+ %ptrs = getelementptr inbounds i64, <3 x i64*> %baseptrs.new, <3 x i64> %indices
+
+ %ptr.0 = extractelement <3 x i64*> %ptrs, i64 0
+ call void @use(i64* %ptr.0)
+
+ %ptr.1 = extractelement <3 x i64*> %ptrs, i64 1
+ call void @use(i64* %ptr.1)
+
+ %ptr.2 = extractelement <3 x i64*> %ptrs, i64 2
+ call void @use(i64* %ptr.2)
+
+ ret void
+}
+
+define void @first_two_indices_is_known.3elts(<3 x i64*> %baseptrs, <3 x i64> %indices, i64 %second_indice, i64 %third_indice) {
+; CHECK-LABEL: @first_two_indices_is_known.3elts(
+; CHECK-NEXT: [[INDICES_NEW_TMP:%.*]] = insertelement <3 x i64> [[INDICES:%.*]], i64 [[SECOND_INDICE:%.*]], i64 0
+; CHECK-NEXT: [[INDICES_NEW:%.*]] = insertelement <3 x i64> [[INDICES_NEW_TMP]], i64 [[THIRD_INDICE:%.*]], i64 1
+; CHECK-NEXT: [[PTRS:%.*]] = getelementptr inbounds i64, <3 x i64*> [[BASEPTRS:%.*]], <3 x i64> [[INDICES_NEW]]
+; CHECK-NEXT: [[PTR_0:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 0
+; CHECK-NEXT: call void @use(i64* [[PTR_0]])
+; CHECK-NEXT: [[PTR_1:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 1
+; CHECK-NEXT: call void @use(i64* [[PTR_1]])
+; CHECK-NEXT: [[PTR_2:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 2
+; CHECK-NEXT: call void @use(i64* [[PTR_2]])
+; CHECK-NEXT: ret void
+;
+ %indices.new.tmp = insertelement <3 x i64> %indices, i64 %second_indice, i64 0
+ %indices.new = insertelement <3 x i64> %indices.new.tmp, i64 %third_indice, i64 1
+ %ptrs = getelementptr inbounds i64, <3 x i64*> %baseptrs, <3 x i64> %indices.new
+
+ %ptr.0 = extractelement <3 x i64*> %ptrs, i64 0
+ call void @use(i64* %ptr.0)
+
+ %ptr.1 = extractelement <3 x i64*> %ptrs, i64 1
+ call void @use(i64* %ptr.1)
+
+ %ptr.2 = extractelement <3 x i64*> %ptrs, i64 2
+ call void @use(i64* %ptr.2)
+
+ ret void
+}
+
+define void @first_two_indices_and_first_two_baseptrs_are_known.3elts(<3 x i64*> %baseptrs, i64* %second_baseptr, i64* %third_baseptr, <3 x i64> %indices, i64 %second_indice, i64 %third_indice) {
+; CHECK-LABEL: @first_two_indices_and_first_two_baseptrs_are_known.3elts(
+; CHECK-NEXT: [[BASEPTRS_NEW_TMP:%.*]] = insertelement <3 x i64*> [[BASEPTRS:%.*]], i64* [[SECOND_BASEPTR:%.*]], i64 0
+; CHECK-NEXT: [[BASEPTRS_NEW:%.*]] = insertelement <3 x i64*> [[BASEPTRS_NEW_TMP]], i64* [[THIRD_BASEPTR:%.*]], i64 1
+; CHECK-NEXT: [[INDICES_NEW_TMP:%.*]] = insertelement <3 x i64> [[INDICES:%.*]], i64 [[SECOND_INDICE:%.*]], i64 0
+; CHECK-NEXT: [[INDICES_NEW:%.*]] = insertelement <3 x i64> [[INDICES_NEW_TMP]], i64 [[THIRD_INDICE:%.*]], i64 1
+; CHECK-NEXT: [[PTRS:%.*]] = getelementptr inbounds i64, <3 x i64*> [[BASEPTRS_NEW]], <3 x i64> [[INDICES_NEW]]
+; CHECK-NEXT: [[PTR_0:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 0
+; CHECK-NEXT: call void @use(i64* [[PTR_0]])
+; CHECK-NEXT: [[PTR_1:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 1
+; CHECK-NEXT: call void @use(i64* [[PTR_1]])
+; CHECK-NEXT: [[PTR_2:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 2
+; CHECK-NEXT: call void @use(i64* [[PTR_2]])
+; CHECK-NEXT: ret void
+;
+ %baseptrs.new.tmp = insertelement <3 x i64*> %baseptrs, i64* %second_baseptr, i64 0
+ %baseptrs.new = insertelement <3 x i64*> %baseptrs.new.tmp, i64* %third_baseptr, i64 1
+ %indices.new.tmp = insertelement <3 x i64> %indices, i64 %second_indice, i64 0
+ %indices.new = insertelement <3 x i64> %indices.new.tmp, i64 %third_indice, i64 1
+ %ptrs = getelementptr inbounds i64, <3 x i64*> %baseptrs.new, <3 x i64> %indices.new
+
+ %ptr.0 = extractelement <3 x i64*> %ptrs, i64 0
+ call void @use(i64* %ptr.0)
+
+ %ptr.1 = extractelement <3 x i64*> %ptrs, i64 1
+ call void @use(i64* %ptr.1)
+
+ %ptr.2 = extractelement <3 x i64*> %ptrs, i64 2
+ call void @use(i64* %ptr.2)
+
+ ret void
+}
+
+;-------------------------------------------------------------------------------
+
+define void @first_two_baseptrs_is_knownequal.3elts(<3 x i64*> %baseptrs, i64* %second_baseptr, <3 x i64> %indices) {
+; CHECK-LABEL: @first_two_baseptrs_is_knownequal.3elts(
+; CHECK-NEXT: [[BASEPTRS_NEW_TMP:%.*]] = insertelement <3 x i64*> [[BASEPTRS:%.*]], i64* [[SECOND_BASEPTR:%.*]], i64 0
+; CHECK-NEXT: [[BASEPTRS_NEW:%.*]] = insertelement <3 x i64*> [[BASEPTRS_NEW_TMP]], i64* [[SECOND_BASEPTR]], i64 1
+; CHECK-NEXT: [[PTRS:%.*]] = getelementptr inbounds i64, <3 x i64*> [[BASEPTRS_NEW]], <3 x i64> [[INDICES:%.*]]
+; CHECK-NEXT: [[PTR_0:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 0
+; CHECK-NEXT: call void @use(i64* [[PTR_0]])
+; CHECK-NEXT: [[PTR_1:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 1
+; CHECK-NEXT: call void @use(i64* [[PTR_1]])
+; CHECK-NEXT: [[PTR_2:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 2
+; CHECK-NEXT: call void @use(i64* [[PTR_2]])
+; CHECK-NEXT: ret void
+;
+ %baseptrs.new.tmp = insertelement <3 x i64*> %baseptrs, i64* %second_baseptr, i64 0
+ %baseptrs.new = insertelement <3 x i64*> %baseptrs.new.tmp, i64* %second_baseptr, i64 1
+ %ptrs = getelementptr inbounds i64, <3 x i64*> %baseptrs.new, <3 x i64> %indices
+
+ %ptr.0 = extractelement <3 x i64*> %ptrs, i64 0
+ call void @use(i64* %ptr.0)
+
+ %ptr.1 = extractelement <3 x i64*> %ptrs, i64 1
+ call void @use(i64* %ptr.1)
+
+ %ptr.2 = extractelement <3 x i64*> %ptrs, i64 2
+ call void @use(i64* %ptr.2)
+
+ ret void
+}
+
+define void @first_two_indices_is_knownequal.3elts(<3 x i64*> %baseptrs, <3 x i64> %indices, i64 %second_indice) {
+; CHECK-LABEL: @first_two_indices_is_knownequal.3elts(
+; CHECK-NEXT: [[INDICES_NEW_TMP:%.*]] = insertelement <3 x i64> [[INDICES:%.*]], i64 [[SECOND_INDICE:%.*]], i64 0
+; CHECK-NEXT: [[INDICES_NEW:%.*]] = insertelement <3 x i64> [[INDICES_NEW_TMP]], i64 [[SECOND_INDICE]], i64 1
+; CHECK-NEXT: [[PTRS:%.*]] = getelementptr inbounds i64, <3 x i64*> [[BASEPTRS:%.*]], <3 x i64> [[INDICES_NEW]]
+; CHECK-NEXT: [[PTR_0:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 0
+; CHECK-NEXT: call void @use(i64* [[PTR_0]])
+; CHECK-NEXT: [[PTR_1:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 1
+; CHECK-NEXT: call void @use(i64* [[PTR_1]])
+; CHECK-NEXT: [[PTR_2:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 2
+; CHECK-NEXT: call void @use(i64* [[PTR_2]])
+; CHECK-NEXT: ret void
+;
+ %indices.new.tmp = insertelement <3 x i64> %indices, i64 %second_indice, i64 0
+ %indices.new = insertelement <3 x i64> %indices.new.tmp, i64 %second_indice, i64 1
+ %ptrs = getelementptr inbounds i64, <3 x i64*> %baseptrs, <3 x i64> %indices.new
+
+ %ptr.0 = extractelement <3 x i64*> %ptrs, i64 0
+ call void @use(i64* %ptr.0)
+
+ %ptr.1 = extractelement <3 x i64*> %ptrs, i64 1
+ call void @use(i64* %ptr.1)
+
+ %ptr.2 = extractelement <3 x i64*> %ptrs, i64 2
+ call void @use(i64* %ptr.2)
+
+ ret void
+}
+
+define void @first_two_indices_and_first_two_baseptrs_are_knownequal.3elts(<3 x i64*> %baseptrs, i64* %second_baseptr, <3 x i64> %indices, i64 %second_indice) {
+; CHECK-LABEL: @first_two_indices_and_first_two_baseptrs_are_knownequal.3elts(
+; CHECK-NEXT: [[BASEPTRS_NEW_TMP:%.*]] = insertelement <3 x i64*> [[BASEPTRS:%.*]], i64* [[SECOND_BASEPTR:%.*]], i64 0
+; CHECK-NEXT: [[BASEPTRS_NEW:%.*]] = insertelement <3 x i64*> [[BASEPTRS_NEW_TMP]], i64* [[SECOND_BASEPTR]], i64 1
+; CHECK-NEXT: [[INDICES_NEW_TMP:%.*]] = insertelement <3 x i64> [[INDICES:%.*]], i64 [[SECOND_INDICE:%.*]], i64 0
+; CHECK-NEXT: [[INDICES_NEW:%.*]] = insertelement <3 x i64> [[INDICES_NEW_TMP]], i64 [[SECOND_INDICE]], i64 1
+; CHECK-NEXT: [[PTRS:%.*]] = getelementptr inbounds i64, <3 x i64*> [[BASEPTRS_NEW]], <3 x i64> [[INDICES_NEW]]
+; CHECK-NEXT: [[PTR_0:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 0
+; CHECK-NEXT: call void @use(i64* [[PTR_0]])
+; CHECK-NEXT: [[PTR_1:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 1
+; CHECK-NEXT: call void @use(i64* [[PTR_1]])
+; CHECK-NEXT: [[PTR_2:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 2
+; CHECK-NEXT: call void @use(i64* [[PTR_2]])
+; CHECK-NEXT: ret void
+;
+ %baseptrs.new.tmp = insertelement <3 x i64*> %baseptrs, i64* %second_baseptr, i64 0
+ %baseptrs.new = insertelement <3 x i64*> %baseptrs.new.tmp, i64* %second_baseptr, i64 1
+ %indices.new.tmp = insertelement <3 x i64> %indices, i64 %second_indice, i64 0
+ %indices.new = insertelement <3 x i64> %indices.new.tmp, i64 %second_indice, i64 1
+ %ptrs = getelementptr inbounds i64, <3 x i64*> %baseptrs.new, <3 x i64> %indices.new
+
+ %ptr.0 = extractelement <3 x i64*> %ptrs, i64 0
+ call void @use(i64* %ptr.0)
+
+ %ptr.1 = extractelement <3 x i64*> %ptrs, i64 1
+ call void @use(i64* %ptr.1)
+
+ %ptr.2 = extractelement <3 x i64*> %ptrs, i64 2
+ call void @use(i64* %ptr.2)
+
+ ret void
+}
+
+;-------------------------------------------------------------------------------
+
+define void @first_baseptr_is_known.4elts(<4 x i64*> %baseptrs, i64* %second_baseptr, <4 x i64> %indices) {
+; CHECK-LABEL: @first_baseptr_is_known.4elts(
+; CHECK-NEXT: [[BASEPTRS_NEW:%.*]] = insertelement <4 x i64*> [[BASEPTRS:%.*]], i64* [[SECOND_BASEPTR:%.*]], i64 0
+; CHECK-NEXT: [[PTRS:%.*]] = getelementptr inbounds i64, <4 x i64*> [[BASEPTRS_NEW]], <4 x i64> [[INDICES:%.*]]
+; CHECK-NEXT: [[PTR_0:%.*]] = extractelement <4 x i64*> [[PTRS]], i64 0
+; CHECK-NEXT: call void @use(i64* [[PTR_0]])
+; CHECK-NEXT: [[PTR_1:%.*]] = extractelement <4 x i64*> [[PTRS]], i64 1
+; CHECK-NEXT: call void @use(i64* [[PTR_1]])
+; CHECK-NEXT: [[PTR_2:%.*]] = extractelement <4 x i64*> [[PTRS]], i64 2
+; CHECK-NEXT: call void @use(i64* [[PTR_2]])
+; CHECK-NEXT: [[PTR_3:%.*]] = extractelement <4 x i64*> [[PTRS]], i64 3
+; CHECK-NEXT: call void @use(i64* [[PTR_3]])
+; CHECK-NEXT: ret void
+;
+ %baseptrs.new = insertelement <4 x i64*> %baseptrs, i64* %second_baseptr, i64 0
+ %ptrs = getelementptr inbounds i64, <4 x i64*> %baseptrs.new, <4 x i64> %indices
+
+ %ptr.0 = extractelement <4 x i64*> %ptrs, i64 0
+ call void @use(i64* %ptr.0)
+
+ %ptr.1 = extractelement <4 x i64*> %ptrs, i64 1
+ call void @use(i64* %ptr.1)
+
+ %ptr.2 = extractelement <4 x i64*> %ptrs, i64 2
+ call void @use(i64* %ptr.2)
+
+ %ptr.3 = extractelement <4 x i64*> %ptrs, i64 3
+ call void @use(i64* %ptr.3)
+
+ ret void
+}
+
+define void @first_indice_is_known.4elts(<4 x i64*> %baseptrs, <4 x i64> %indices, i64 %second_indice) {
+; CHECK-LABEL: @first_indice_is_known.4elts(
+; CHECK-NEXT: [[INDICES_NEW:%.*]] = insertelement <4 x i64> [[INDICES:%.*]], i64 [[SECOND_INDICE:%.*]], i64 0
+; CHECK-NEXT: [[PTRS:%.*]] = getelementptr inbounds i64, <4 x i64*> [[BASEPTRS:%.*]], <4 x i64> [[INDICES_NEW]]
+; CHECK-NEXT: [[PTR_0:%.*]] = extractelement <4 x i64*> [[PTRS]], i64 0
+; CHECK-NEXT: call void @use(i64* [[PTR_0]])
+; CHECK-NEXT: [[PTR_1:%.*]] = extractelement <4 x i64*> [[PTRS]], i64 1
+; CHECK-NEXT: call void @use(i64* [[PTR_1]])
+; CHECK-NEXT: [[PTR_2:%.*]] = extractelement <4 x i64*> [[PTRS]], i64 2
+; CHECK-NEXT: call void @use(i64* [[PTR_2]])
+; CHECK-NEXT: [[PTR_3:%.*]] = extractelement <4 x i64*> [[PTRS]], i64 3
+; CHECK-NEXT: call void @use(i64* [[PTR_3]])
+; CHECK-NEXT: ret void
+;
+ %indices.new = insertelement <4 x i64> %indices, i64 %second_indice, i64 0
+ %ptrs = getelementptr inbounds i64, <4 x i64*> %baseptrs, <4 x i64> %indices.new
+
+ %ptr.0 = extractelement <4 x i64*> %ptrs, i64 0
+ call void @use(i64* %ptr.0)
+
+ %ptr.1 = extractelement <4 x i64*> %ptrs, i64 1
+ call void @use(i64* %ptr.1)
+
+ %ptr.2 = extractelement <4 x i64*> %ptrs, i64 2
+ call void @use(i64* %ptr.2)
+
+ %ptr.3 = extractelement <4 x i64*> %ptrs, i64 3
+ call void @use(i64* %ptr.3)
+
+ ret void
+}
+
+define void @first_indice_and_first_baseptr_are_known.4elts(<4 x i64*> %baseptrs, i64* %second_baseptr, <4 x i64> %indices, i64 %second_indice) {
+; CHECK-LABEL: @first_indice_and_first_baseptr_are_known.4elts(
+; CHECK-NEXT: [[BASEPTRS_NEW:%.*]] = insertelement <4 x i64*> [[BASEPTRS:%.*]], i64* [[SECOND_BASEPTR:%.*]], i64 0
+; CHECK-NEXT: [[INDICES_NEW:%.*]] = insertelement <4 x i64> [[INDICES:%.*]], i64 [[SECOND_INDICE:%.*]], i64 0
+; CHECK-NEXT: [[PTRS:%.*]] = getelementptr inbounds i64, <4 x i64*> [[BASEPTRS_NEW]], <4 x i64> [[INDICES_NEW]]
+; CHECK-NEXT: [[PTR_0:%.*]] = extractelement <4 x i64*> [[PTRS]], i64 0
+; CHECK-NEXT: call void @use(i64* [[PTR_0]])
+; CHECK-NEXT: [[PTR_1:%.*]] = extractelement <4 x i64*> [[PTRS]], i64 1
+; CHECK-NEXT: call void @use(i64* [[PTR_1]])
+; CHECK-NEXT: [[PTR_2:%.*]] = extractelement <4 x i64*> [[PTRS]], i64 2
+; CHECK-NEXT: call void @use(i64* [[PTR_2]])
+; CHECK-NEXT: [[PTR_3:%.*]] = extractelement <4 x i64*> [[PTRS]], i64 3
+; CHECK-NEXT: call void @use(i64* [[PTR_3]])
+; CHECK-NEXT: ret void
+;
+ %baseptrs.new = insertelement <4 x i64*> %baseptrs, i64* %second_baseptr, i64 0
+ %indices.new = insertelement <4 x i64> %indices, i64 %second_indice, i64 0
+ %ptrs = getelementptr inbounds i64, <4 x i64*> %baseptrs.new, <4 x i64> %indices.new
+
+ %ptr.0 = extractelement <4 x i64*> %ptrs, i64 0
+ call void @use(i64* %ptr.0)
+
+ %ptr.1 = extractelement <4 x i64*> %ptrs, i64 1
+ call void @use(i64* %ptr.1)
+
+ %ptr.2 = extractelement <4 x i64*> %ptrs, i64 2
+ call void @use(i64* %ptr.2)
+
+ %ptr.3 = extractelement <4 x i64*> %ptrs, i64 3
+ call void @use(i64* %ptr.3)
+
+ ret void
+}
+
+;-------------------------------------------------------------------------------
+
+define void @first_two_baseptrs_is_knownequal.4elts(<3 x i64*> %baseptrs, i64* %second_baseptr, <3 x i64> %indices) {
+; CHECK-LABEL: @first_two_baseptrs_is_knownequal.4elts(
+; CHECK-NEXT: [[BASEPTRS_NEW_TMP:%.*]] = insertelement <3 x i64*> [[BASEPTRS:%.*]], i64* [[SECOND_BASEPTR:%.*]], i64 0
+; CHECK-NEXT: [[BASEPTRS_NEW:%.*]] = insertelement <3 x i64*> [[BASEPTRS_NEW_TMP]], i64* [[SECOND_BASEPTR]], i64 1
+; CHECK-NEXT: [[PTRS:%.*]] = getelementptr inbounds i64, <3 x i64*> [[BASEPTRS_NEW]], <3 x i64> [[INDICES:%.*]]
+; CHECK-NEXT: [[PTR_0:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 0
+; CHECK-NEXT: call void @use(i64* [[PTR_0]])
+; CHECK-NEXT: [[PTR_1:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 1
+; CHECK-NEXT: call void @use(i64* [[PTR_1]])
+; CHECK-NEXT: [[PTR_2:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 2
+; CHECK-NEXT: call void @use(i64* [[PTR_2]])
+; CHECK-NEXT: ret void
+;
+ %baseptrs.new.tmp = insertelement <3 x i64*> %baseptrs, i64* %second_baseptr, i64 0
+ %baseptrs.new = insertelement <3 x i64*> %baseptrs.new.tmp, i64* %second_baseptr, i64 1
+ %ptrs = getelementptr inbounds i64, <3 x i64*> %baseptrs.new, <3 x i64> %indices
+
+ %ptr.0 = extractelement <3 x i64*> %ptrs, i64 0
+ call void @use(i64* %ptr.0)
+
+ %ptr.1 = extractelement <3 x i64*> %ptrs, i64 1
+ call void @use(i64* %ptr.1)
+
+ %ptr.2 = extractelement <3 x i64*> %ptrs, i64 2
+ call void @use(i64* %ptr.2)
+
+ ret void
+}
+
+define void @first_two_indices_is_knownequal.4elts(<3 x i64*> %baseptrs, <3 x i64> %indices, i64 %second_indice) {
+; CHECK-LABEL: @first_two_indices_is_knownequal.4elts(
+; CHECK-NEXT: [[INDICES_NEW_TMP:%.*]] = insertelement <3 x i64> [[INDICES:%.*]], i64 [[SECOND_INDICE:%.*]], i64 0
+; CHECK-NEXT: [[INDICES_NEW:%.*]] = insertelement <3 x i64> [[INDICES_NEW_TMP]], i64 [[SECOND_INDICE]], i64 1
+; CHECK-NEXT: [[PTRS:%.*]] = getelementptr inbounds i64, <3 x i64*> [[BASEPTRS:%.*]], <3 x i64> [[INDICES_NEW]]
+; CHECK-NEXT: [[PTR_0:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 0
+; CHECK-NEXT: call void @use(i64* [[PTR_0]])
+; CHECK-NEXT: [[PTR_1:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 1
+; CHECK-NEXT: call void @use(i64* [[PTR_1]])
+; CHECK-NEXT: [[PTR_2:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 2
+; CHECK-NEXT: call void @use(i64* [[PTR_2]])
+; CHECK-NEXT: ret void
+;
+ %indices.new.tmp = insertelement <3 x i64> %indices, i64 %second_indice, i64 0
+ %indices.new = insertelement <3 x i64> %indices.new.tmp, i64 %second_indice, i64 1
+ %ptrs = getelementptr inbounds i64, <3 x i64*> %baseptrs, <3 x i64> %indices.new
+
+ %ptr.0 = extractelement <3 x i64*> %ptrs, i64 0
+ call void @use(i64* %ptr.0)
+
+ %ptr.1 = extractelement <3 x i64*> %ptrs, i64 1
+ call void @use(i64* %ptr.1)
+
+ %ptr.2 = extractelement <3 x i64*> %ptrs, i64 2
+ call void @use(i64* %ptr.2)
+
+ ret void
+}
+
+define void @first_two_indices_and_first_two_baseptrs_are_knownequal.4elts(<3 x i64*> %baseptrs, i64* %second_baseptr, <3 x i64> %indices, i64 %second_indice) {
+; CHECK-LABEL: @first_two_indices_and_first_two_baseptrs_are_knownequal.4elts(
+; CHECK-NEXT: [[BASEPTRS_NEW_TMP:%.*]] = insertelement <3 x i64*> [[BASEPTRS:%.*]], i64* [[SECOND_BASEPTR:%.*]], i64 0
+; CHECK-NEXT: [[BASEPTRS_NEW:%.*]] = insertelement <3 x i64*> [[BASEPTRS_NEW_TMP]], i64* [[SECOND_BASEPTR]], i64 1
+; CHECK-NEXT: [[INDICES_NEW_TMP:%.*]] = insertelement <3 x i64> [[INDICES:%.*]], i64 [[SECOND_INDICE:%.*]], i64 0
+; CHECK-NEXT: [[INDICES_NEW:%.*]] = insertelement <3 x i64> [[INDICES_NEW_TMP]], i64 [[SECOND_INDICE]], i64 1
+; CHECK-NEXT: [[PTRS:%.*]] = getelementptr inbounds i64, <3 x i64*> [[BASEPTRS_NEW]], <3 x i64> [[INDICES_NEW]]
+; CHECK-NEXT: [[PTR_0:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 0
+; CHECK-NEXT: call void @use(i64* [[PTR_0]])
+; CHECK-NEXT: [[PTR_1:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 1
+; CHECK-NEXT: call void @use(i64* [[PTR_1]])
+; CHECK-NEXT: [[PTR_2:%.*]] = extractelement <3 x i64*> [[PTRS]], i64 2
+; CHECK-NEXT: call void @use(i64* [[PTR_2]])
+; CHECK-NEXT: ret void
+;
+ %baseptrs.new.tmp = insertelement <3 x i64*> %baseptrs, i64* %second_baseptr, i64 0
+ %baseptrs.new = insertelement <3 x i64*> %baseptrs.new.tmp, i64* %second_baseptr, i64 1
+ %indices.new.tmp = insertelement <3 x i64> %indices, i64 %second_indice, i64 0
+ %indices.new = insertelement <3 x i64> %indices.new.tmp, i64 %second_indice, i64 1
+ %ptrs = getelementptr inbounds i64, <3 x i64*> %baseptrs.new, <3 x i64> %indices.new
+
+ %ptr.0 = extractelement <3 x i64*> %ptrs, i64 0
+ call void @use(i64* %ptr.0)
+
+ %ptr.1 = extractelement <3 x i64*> %ptrs, i64 1
+ call void @use(i64* %ptr.1)
+
+ %ptr.2 = extractelement <3 x i64*> %ptrs, i64 2
+ call void @use(i64* %ptr.2)
+
+ ret void
+}
+
+;===============================================================================
+
+define <2 x i64*> @first_indice_and_baseptr_need_extraction.2elts.extrause(<2 x i64*> %baseptrs, i64* %second_baseptr, <2 x i64> %indices, i64 %second_indice) {
+; CHECK-LABEL: @first_indice_and_baseptr_need_extraction.2elts.extrause(
+; CHECK-NEXT: [[BASEPTRS_NEW:%.*]] = insertelement <2 x i64*> [[BASEPTRS:%.*]], i64* [[SECOND_BASEPTR:%.*]], i64 0
+; CHECK-NEXT: [[INDICES_NEW:%.*]] = insertelement <2 x i64> [[INDICES:%.*]], i64 [[SECOND_INDICE:%.*]], i64 0
+; CHECK-NEXT: [[PTRS:%.*]] = getelementptr inbounds i64, <2 x i64*> [[BASEPTRS_NEW]], <2 x i64> [[INDICES_NEW]]
+; CHECK-NEXT: [[PTR_0:%.*]] = extractelement <2 x i64*> [[PTRS]], i64 0
+; CHECK-NEXT: call void @use(i64* [[PTR_0]])
+; CHECK-NEXT: [[PTR_1:%.*]] = extractelement <2 x i64*> [[PTRS]], i64 1
+; CHECK-NEXT: call void @use(i64* [[PTR_1]])
+; CHECK-NEXT: ret <2 x i64*> [[PTRS]]
+;
+ %baseptrs.new = insertelement <2 x i64*> %baseptrs, i64* %second_baseptr, i64 0
+ %indices.new = insertelement <2 x i64> %indices, i64 %second_indice, i64 0
+ %ptrs = getelementptr inbounds i64, <2 x i64*> %baseptrs.new, <2 x i64> %indices.new
+
+ %ptr.0 = extractelement <2 x i64*> %ptrs, i64 0
+ call void @use(i64* %ptr.0)
+
+ %ptr.1 = extractelement <2 x i64*> %ptrs, i64 1
+ call void @use(i64* %ptr.1)
+
+ ret <2 x i64*> %ptrs
+}
+
+define i64* @first_indice_and_baseptr_need_extraction.2elts.variable_extraction(<2 x i64*> %baseptrs, i64* %second_baseptr, <2 x i64> %indices, i64 %second_indice, i64 %variable_extract_idx) {
+; CHECK-LABEL: @first_indice_and_baseptr_need_extraction.2elts.variable_extraction(
+; CHECK-NEXT: [[BASEPTRS_NEW:%.*]] = insertelement <2 x i64*> [[BASEPTRS:%.*]], i64* [[SECOND_BASEPTR:%.*]], i64 0
+; CHECK-NEXT: [[INDICES_NEW:%.*]] = insertelement <2 x i64> [[INDICES:%.*]], i64 [[SECOND_INDICE:%.*]], i64 0
+; CHECK-NEXT: [[PTRS:%.*]] = getelementptr inbounds i64, <2 x i64*> [[BASEPTRS_NEW]], <2 x i64> [[INDICES_NEW]]
+; CHECK-NEXT: [[PTR_0:%.*]] = extractelement <2 x i64*> [[PTRS]], i64 0
+; CHECK-NEXT: call void @use(i64* [[PTR_0]])
+; CHECK-NEXT: [[PTR_1:%.*]] = extractelement <2 x i64*> [[PTRS]], i64 1
+; CHECK-NEXT: call void @use(i64* [[PTR_1]])
+; CHECK-NEXT: [[PTR_VAR:%.*]] = extractelement <2 x i64*> [[PTRS]], i64 [[VARIABLE_EXTRACT_IDX:%.*]]
+; CHECK-NEXT: ret i64* [[PTR_VAR]]
+;
+ %baseptrs.new = insertelement <2 x i64*> %baseptrs, i64* %second_baseptr, i64 0
+ %indices.new = insertelement <2 x i64> %indices, i64 %second_indice, i64 0
+ %ptrs = getelementptr inbounds i64, <2 x i64*> %baseptrs.new, <2 x i64> %indices.new
+
+ %ptr.0 = extractelement <2 x i64*> %ptrs, i64 0
+ call void @use(i64* %ptr.0)
+
+ %ptr.1 = extractelement <2 x i64*> %ptrs, i64 1
+ call void @use(i64* %ptr.1)
+
+ %ptr.var = extractelement <2 x i64*> %ptrs, i64 %variable_extract_idx
+
+ ret i64* %ptr.var
+}
More information about the llvm-commits
mailing list