[llvm-branch-commits] [llvm] AMDGPU: Replace insertelement poison with insertelement undef (PR #130896)

Tue Mar 11 22:48:06 PDT 2025

llvmbot wrote:




@llvm/pr-subscribers-backend-amdgpu

Author: Matt Arsenault (arsenm)

<details>
<summary>Changes</summary>

This is the bulk update with perl, with cases which require additional
update left for later.

---

Patch is 300.54 KiB, truncated to 20.00 KiB below, full version: https://github.com/llvm/llvm-project/pull/130896.diff


136 Files Affected:

- (modified) llvm/test/CodeGen/AMDGPU/add3.ll (+2-2) 
- (modified) llvm/test/CodeGen/AMDGPU/amdpal_scratch_mergedshader.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/any_extend_vector_inreg.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/anyext.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/bf16-conversions.ll (+2-2) 
- (modified) llvm/test/CodeGen/AMDGPU/bfi_nested.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/big_alu.ll (+90-90) 
- (modified) llvm/test/CodeGen/AMDGPU/bug-deadlanes.ll (+2-2) 
- (modified) llvm/test/CodeGen/AMDGPU/bug-v4f64-subvector.ll (+8-8) 
- (modified) llvm/test/CodeGen/AMDGPU/build-vector-insert-elt-infloop.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/build-vector-packed-partial-undef.ll (+12-12) 
- (modified) llvm/test/CodeGen/AMDGPU/build_vector-r600.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/build_vector.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/bypass-div.ll (+2-2) 
- (modified) llvm/test/CodeGen/AMDGPU/chain-hi-to-lo.ll (+15-15) 
- (modified) llvm/test/CodeGen/AMDGPU/coalescer_remat.ll (+2-2) 
- (modified) llvm/test/CodeGen/AMDGPU/collapse-endcf.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/complex-folding.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/cube.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/cvt_f32_ubyte.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/dagcomb-shuffle-vecextend-non2.ll (+2-2) 
- (modified) llvm/test/CodeGen/AMDGPU/dagcombiner-bug-illegal-vec4-int-to-fp.ll (+2-2) 
- (modified) llvm/test/CodeGen/AMDGPU/dead-machine-elim-after-dead-lane.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/debug-value.ll (+4-4) 
- (modified) llvm/test/CodeGen/AMDGPU/debug-value2.ll (+9-9) 
- (modified) llvm/test/CodeGen/AMDGPU/divergence-driven-abs.ll (+4-4) 
- (modified) llvm/test/CodeGen/AMDGPU/divergence-driven-buildvector.ll (+16-16) 
- (modified) llvm/test/CodeGen/AMDGPU/ds-combine-with-dependence.ll (+4-4) 
- (modified) llvm/test/CodeGen/AMDGPU/ds_read2.ll (+5-5) 
- (modified) llvm/test/CodeGen/AMDGPU/ds_read2_superreg.ll (+2-2) 
- (modified) llvm/test/CodeGen/AMDGPU/ds_write2.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/extract-subvector-equal-length.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/extract-vector-elt-build-vector-combine.ll (+3-3) 
- (modified) llvm/test/CodeGen/AMDGPU/fcanonicalize-elimination.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/flat-offset-bug.ll (+4-4) 
- (modified) llvm/test/CodeGen/AMDGPU/floor.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/fmac.sdwa.ll (+3-3) 
- (modified) llvm/test/CodeGen/AMDGPU/fmad-formation-fmul-distribute-denormal-mode.ll (+2-2) 
- (modified) llvm/test/CodeGen/AMDGPU/fmad.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/fmax.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/fmin.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/fneg-combines.f16.ll (+2-2) 
- (modified) llvm/test/CodeGen/AMDGPU/fneg-combines.ll (+2-2) 
- (modified) llvm/test/CodeGen/AMDGPU/fneg-combines.new.ll (+2-2) 
- (modified) llvm/test/CodeGen/AMDGPU/frame-index-elimination.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/function-returns.ll (+2-2) 
- (modified) llvm/test/CodeGen/AMDGPU/global-load-saddr-to-vaddr.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/global-saddr-load.ll (+4-4) 
- (modified) llvm/test/CodeGen/AMDGPU/image-schedule.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/indirect-addressing-si.ll (+4-4) 
- (modified) llvm/test/CodeGen/AMDGPU/input-mods.r600.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/insert_vector_dynelt.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/insert_vector_elt.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/jump-address.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/kcache-fold.ll (+2-2) 
- (modified) llvm/test/CodeGen/AMDGPU/lds-bounds.ll (+4-4) 
- (modified) llvm/test/CodeGen/AMDGPU/lds-dma-waits.ll (+2-2) 
- (modified) llvm/test/CodeGen/AMDGPU/lds-misaligned-bug.ll (+12-12) 
- (modified) llvm/test/CodeGen/AMDGPU/llvm.amdgcn.image.nsa.ll (+4-4) 
- (modified) llvm/test/CodeGen/AMDGPU/llvm.amdgcn.image.sample.d16.dim.ll (+3-3) 
- (modified) llvm/test/CodeGen/AMDGPU/llvm.amdgcn.image.sample.dim.ll (+8-8) 
- (modified) llvm/test/CodeGen/AMDGPU/llvm.amdgcn.intersect_ray.ll (+18-18) 
- (modified) llvm/test/CodeGen/AMDGPU/llvm.amdgcn.udot2.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/llvm.pow.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/llvm.r600.cube.ll (+2-2) 
- (modified) llvm/test/CodeGen/AMDGPU/load-hi16.ll (+50-50) 
- (modified) llvm/test/CodeGen/AMDGPU/load-input-fold.ll (+3-3) 
- (modified) llvm/test/CodeGen/AMDGPU/load-lo16.ll (+9-9) 
- (modified) llvm/test/CodeGen/AMDGPU/loop-live-out-copy-undef-subrange.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/lower-work-group-id-intrinsics-hsa.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/lower-work-group-id-intrinsics-pal.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/mad-mix-hi.ll (+6-6) 
- (modified) llvm/test/CodeGen/AMDGPU/mad_uint24.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/max-literals.ll (+4-4) 
- (modified) llvm/test/CodeGen/AMDGPU/memory_clause.ll (+2-2) 
- (modified) llvm/test/CodeGen/AMDGPU/merge-store-crash.ll (+3-3) 
- (modified) llvm/test/CodeGen/AMDGPU/mfma-loop.ll (+3-3) 
- (modified) llvm/test/CodeGen/AMDGPU/nsa-reassign.ll (+4-4) 
- (modified) llvm/test/CodeGen/AMDGPU/operand-folding.ll (+2-2) 
- (modified) llvm/test/CodeGen/AMDGPU/pack.v2f16.ll (+10-10) 
- (modified) llvm/test/CodeGen/AMDGPU/pack.v2i16.ll (+9-9) 
- (modified) llvm/test/CodeGen/AMDGPU/packed-fp32.ll (+12-12) 
- (modified) llvm/test/CodeGen/AMDGPU/packed-op-sel.ll (+11-11) 
- (modified) llvm/test/CodeGen/AMDGPU/predicate-dp4.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/ps-shader-arg-count.ll (+28-28) 
- (modified) llvm/test/CodeGen/AMDGPU/pv-packing.ll (+2-2) 
- (modified) llvm/test/CodeGen/AMDGPU/pv.ll (+8-8) 
- (modified) llvm/test/CodeGen/AMDGPU/r600-encoding.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/r600-export-fix.ll (+8-8) 
- (modified) llvm/test/CodeGen/AMDGPU/r600-infinite-loop-bug-while-reorganizing-vector.ll (+4-4) 
- (modified) llvm/test/CodeGen/AMDGPU/r600cfg.ll (+5-5) 
- (modified) llvm/test/CodeGen/AMDGPU/reassoc-scalar.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/rv7x0_count3.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/scalar_to_vector.ll (+5-5) 
- (modified) llvm/test/CodeGen/AMDGPU/schedule-fs-loop-nested-if.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/schedule-fs-loop-nested.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/schedule-fs-loop.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/schedule-if-2.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/schedule-if.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/schedule-vs-if-nested-loop-failure.ll (+2-2) 
- (modified) llvm/test/CodeGen/AMDGPU/schedule-vs-if-nested-loop.ll (+2-2) 
- (modified) llvm/test/CodeGen/AMDGPU/scheduler-subrange-crash.ll (+7-7) 
- (modified) llvm/test/CodeGen/AMDGPU/sdwa-peephole.ll (+4-4) 
- (modified) llvm/test/CodeGen/AMDGPU/sgpr-copy-duplicate-operand.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/shared-op-cycle.ll (+2-2) 
- (modified) llvm/test/CodeGen/AMDGPU/si-sgpr-spill.ll (+7-7) 
- (modified) llvm/test/CodeGen/AMDGPU/si-triv-disjoint-mem-access.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/si-vector-hang.ll (+4-4) 
- (modified) llvm/test/CodeGen/AMDGPU/skip-promote-alloca-vector-users.ll (+2-2) 
- (modified) llvm/test/CodeGen/AMDGPU/smfmac_no_agprs.ll (+2-2) 
- (modified) llvm/test/CodeGen/AMDGPU/sminmax.ll (+8-8) 
- (modified) llvm/test/CodeGen/AMDGPU/sminmax.v2i16.ll (+8-8) 
- (modified) llvm/test/CodeGen/AMDGPU/smrd.ll (+3-3) 
- (modified) llvm/test/CodeGen/AMDGPU/spill-vector-superclass.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/split-scalar-i64-add.ll (+5-5) 
- (modified) llvm/test/CodeGen/AMDGPU/splitkit-getsubrangeformask.ll (+16-16) 
- (modified) llvm/test/CodeGen/AMDGPU/sram-ecc-default.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/subreg-coalescer-crash.ll (+7-7) 
- (modified) llvm/test/CodeGen/AMDGPU/subreg-coalescer-undef-use.ll (+2-2) 
- (modified) llvm/test/CodeGen/AMDGPU/subreg-eliminate-dead.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/swizzle-export.ll (+7-7) 
- (modified) llvm/test/CodeGen/AMDGPU/tex-clause-antidep.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/texture-input-merge.ll (+3-3) 
- (modified) llvm/test/CodeGen/AMDGPU/trunc-combine.ll (+4-4) 
- (modified) llvm/test/CodeGen/AMDGPU/undefined-subreg-liverange.ll (+2-2) 
- (modified) llvm/test/CodeGen/AMDGPU/unigine-liveness-crash.ll (+2-2) 
- (modified) llvm/test/CodeGen/AMDGPU/unpack-half.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/v_pack.ll (+4-4) 
- (modified) llvm/test/CodeGen/AMDGPU/v_sat_pk_u8_i16.ll (+4-4) 
- (modified) llvm/test/CodeGen/AMDGPU/vector-legalizer-divergence.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/vector_shuffle.packed.ll (+3-3) 
- (modified) llvm/test/CodeGen/AMDGPU/vgpr-spill-emergency-stack-slot-compute.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/vgpr-spill-emergency-stack-slot.ll (+1-1) 
- (modified) llvm/test/CodeGen/AMDGPU/widen-vselect-and-mask.ll (+8-8) 
- (modified) llvm/test/CodeGen/AMDGPU/wqm-gfx11.ll (+2-2) 
- (modified) llvm/test/CodeGen/AMDGPU/xor3.ll (+2-2) 


``````````diff

diff --git a/llvm/test/CodeGen/AMDGPU/add3.ll b/llvm/test/CodeGen/AMDGPU/add3.ll
index d3f9c2d0fbc54..0d80296bb67b6 100644
--- a/llvm/test/CodeGen/AMDGPU/add3.ll
+++ b/llvm/test/CodeGen/AMDGPU/add3.ll
@@ -181,7 +181,7 @@ define amdgpu_ps <2 x float> @add3_multiuse_outer(i32 %a, i32 %b, i32 %c, i32 %x
   %inner = add i32 %a, %b
   %outer = add i32 %inner, %c
   %x1 = mul i32 %outer, %x
-  %r1 = insertelement <2 x i32> undef, i32 %outer, i32 0
+  %r1 = insertelement <2 x i32> poison, i32 %outer, i32 0
   %r0 = insertelement <2 x i32> %r1, i32 %x1, i32 1
   %bc = bitcast <2 x i32> %r0 to <2 x float>
   ret <2 x float> %bc
@@ -207,7 +207,7 @@ define amdgpu_ps <2 x float> @add3_multiuse_inner(i32 %a, i32 %b, i32 %c) {
 ; GFX10-NEXT:    ; return to shader part epilog
   %inner = add i32 %a, %b
   %outer = add i32 %inner, %c
-  %r1 = insertelement <2 x i32> undef, i32 %inner, i32 0
+  %r1 = insertelement <2 x i32> poison, i32 %inner, i32 0
   %r0 = insertelement <2 x i32> %r1, i32 %outer, i32 1
   %bc = bitcast <2 x i32> %r0 to <2 x float>
   ret <2 x float> %bc
diff --git a/llvm/test/CodeGen/AMDGPU/amdpal_scratch_mergedshader.ll b/llvm/test/CodeGen/AMDGPU/amdpal_scratch_mergedshader.ll
index 2aea4497c12ba..b610fca02f92e 100644
--- a/llvm/test/CodeGen/AMDGPU/amdpal_scratch_mergedshader.ll
+++ b/llvm/test/CodeGen/AMDGPU/amdpal_scratch_mergedshader.ll
@@ -17,7 +17,7 @@ define amdgpu_hs void @_amdgpu_hs_main(i32 inreg %arg, i32 inreg %arg1, i32 inre
 
 .beginls:                                         ; preds = %.entry
   %tmp15 = extractelement <6 x i32> %arg8, i32 3
-  %.0.vec.insert.i = insertelement <2 x i32> undef, i32 %tmp15, i32 0
+  %.0.vec.insert.i = insertelement <2 x i32> poison, i32 %tmp15, i32 0
   %.4.vec.insert.i = shufflevector <2 x i32> %.0.vec.insert.i, <2 x i32> undef, <2 x i32> <i32 0, i32 3>
   %tmp16 = bitcast <2 x i32> %.4.vec.insert.i to i64
   br label %.endls
diff --git a/llvm/test/CodeGen/AMDGPU/any_extend_vector_inreg.ll b/llvm/test/CodeGen/AMDGPU/any_extend_vector_inreg.ll
index 07e39d798f58d..8bcef24c8e23d 100644
--- a/llvm/test/CodeGen/AMDGPU/any_extend_vector_inreg.ll
+++ b/llvm/test/CodeGen/AMDGPU/any_extend_vector_inreg.ll
@@ -36,7 +36,7 @@ bb:
   %tmp21 = getelementptr inbounds <8 x i8>, ptr addrspace(1) %arg, i64 4
   %tmp23 = load <16 x i8>, ptr addrspace(1) %tmp21, align 16
   %tmp24 = extractelement <16 x i8> %tmp23, i64 3
-  %tmp1 = insertelement <16 x i8> undef, i8 %tmp3, i32 2
+  %tmp1 = insertelement <16 x i8> poison, i8 %tmp3, i32 2
   %tmp4 = insertelement <16 x i8> %tmp1, i8 0, i32 3
   %tmp5 = insertelement <16 x i8> %tmp4, i8 0, i32 4
   %tmp7 = insertelement <16 x i8> %tmp5, i8 %tmp6, i32 5
diff --git a/llvm/test/CodeGen/AMDGPU/anyext.ll b/llvm/test/CodeGen/AMDGPU/anyext.ll
index 6e16c90033273..f0aa141e65a5c 100644
--- a/llvm/test/CodeGen/AMDGPU/anyext.ll
+++ b/llvm/test/CodeGen/AMDGPU/anyext.ll
@@ -187,7 +187,7 @@ define amdgpu_kernel void @anyext_v2i16_to_v2i32() #0 {
 ; GFX9-NEXT:    s_endpgm
 bb:
   %tmp = load i16, ptr addrspace(1) undef, align 2
-  %tmp2 = insertelement <2 x i16> undef, i16 %tmp, i32 1
+  %tmp2 = insertelement <2 x i16> poison, i16 %tmp, i32 1
   %tmp4 = and <2 x i16> %tmp2, <i16 -32767, i16 -32767>
   %tmp5 = zext <2 x i16> %tmp4 to <2 x i32>
   %tmp6 = shl nuw <2 x i32> %tmp5, <i32 16, i32 16>
diff --git a/llvm/test/CodeGen/AMDGPU/bf16-conversions.ll b/llvm/test/CodeGen/AMDGPU/bf16-conversions.ll
index 0b5d47df2cc35..4c01e583713a7 100644
--- a/llvm/test/CodeGen/AMDGPU/bf16-conversions.ll
+++ b/llvm/test/CodeGen/AMDGPU/bf16-conversions.ll
@@ -189,7 +189,7 @@ define amdgpu_ps float @fptrunc_f32_f32_to_v2bf16(float %a, float %b) {
 entry:
   %a.cvt = fptrunc float %a to bfloat
   %b.cvt = fptrunc float %b to bfloat
-  %v2.1 = insertelement <2 x bfloat> undef, bfloat %a.cvt, i32 0
+  %v2.1 = insertelement <2 x bfloat> poison, bfloat %a.cvt, i32 0
   %v2.2 = insertelement <2 x bfloat> %v2.1, bfloat %b.cvt, i32 1
   %ret = bitcast <2 x bfloat> %v2.2 to float
   ret float %ret
@@ -226,7 +226,7 @@ entry:
   %a.cvt = fptrunc float %a.neg to bfloat
   %b.abs = call float @llvm.fabs.f32(float %b)
   %b.cvt = fptrunc float %b.abs to bfloat
-  %v2.1 = insertelement <2 x bfloat> undef, bfloat %a.cvt, i32 0
+  %v2.1 = insertelement <2 x bfloat> poison, bfloat %a.cvt, i32 0
   %v2.2 = insertelement <2 x bfloat> %v2.1, bfloat %b.cvt, i32 1
   %ret = bitcast <2 x bfloat> %v2.2 to float
   ret float %ret
diff --git a/llvm/test/CodeGen/AMDGPU/bfi_nested.ll b/llvm/test/CodeGen/AMDGPU/bfi_nested.ll
index 4b38215ebc597..3d52c158a6017 100644
--- a/llvm/test/CodeGen/AMDGPU/bfi_nested.ll
+++ b/llvm/test/CodeGen/AMDGPU/bfi_nested.ll
@@ -297,7 +297,7 @@ define amdgpu_kernel void @v_bfi_dont_applied_for_scalar_ops(ptr addrspace(1) %o
 ; GCN-NEXT:    s_endpgm
   %shift = lshr i32 %b, 16
   %tr = trunc i32 %shift to i16
-  %tmp = insertelement <2 x i16> undef, i16 %a, i32 0
+  %tmp = insertelement <2 x i16> poison, i16 %a, i32 0
   %vec = insertelement <2 x i16> %tmp, i16 %tr, i32 1
   %val = bitcast <2 x i16> %vec to i32
   store i32 %val, ptr addrspace(1) %out, align 4
diff --git a/llvm/test/CodeGen/AMDGPU/big_alu.ll b/llvm/test/CodeGen/AMDGPU/big_alu.ll
index 0daa14a63f21a..b3b6259838341 100644
--- a/llvm/test/CodeGen/AMDGPU/big_alu.ll
+++ b/llvm/test/CodeGen/AMDGPU/big_alu.ll
@@ -90,11 +90,11 @@ main_body:
   br i1 %tmp81, label %IF137, label %ENDIF136
 
 IF137:                                            ; preds = %main_body
-  %tmp82 = insertelement <4 x float> undef, float %tmp30, i32 0
+  %tmp82 = insertelement <4 x float> poison, float %tmp30, i32 0
   %tmp83 = insertelement <4 x float> %tmp82, float %tmp31, i32 1
   %tmp84 = insertelement <4 x float> %tmp83, float %tmp32, i32 2
   %tmp85 = insertelement <4 x float> %tmp84, float 0.000000e+00, i32 3
-  %tmp86 = insertelement <4 x float> undef, float %tmp30, i32 0
+  %tmp86 = insertelement <4 x float> poison, float %tmp30, i32 0
   %tmp87 = insertelement <4 x float> %tmp86, float %tmp31, i32 1
   %tmp88 = insertelement <4 x float> %tmp87, float %tmp32, i32 2
   %tmp89 = insertelement <4 x float> %tmp88, float 0.000000e+00, i32 3
@@ -103,20 +103,20 @@ IF137:                                            ; preds = %main_body
   %tmp92 = fmul float %tmp30, %tmp91
   %tmp93 = fmul float %tmp31, %tmp91
   %tmp94 = fmul float %tmp32, %tmp91
-  %tmp95 = insertelement <4 x float> undef, float %tmp92, i32 0
+  %tmp95 = insertelement <4 x float> poison, float %tmp92, i32 0
   %tmp96 = insertelement <4 x float> %tmp95, float %tmp93, i32 1
   %tmp97 = insertelement <4 x float> %tmp96, float %tmp94, i32 2
   %tmp98 = insertelement <4 x float> %tmp97, float 0.000000e+00, i32 3
-  %tmp99 = insertelement <4 x float> undef, float %tmp37, i32 0
+  %tmp99 = insertelement <4 x float> poison, float %tmp37, i32 0
   %tmp100 = insertelement <4 x float> %tmp99, float %tmp38, i32 1
   %tmp101 = insertelement <4 x float> %tmp100, float %tmp39, i32 2
   %tmp102 = insertelement <4 x float> %tmp101, float 0.000000e+00, i32 3
   %tmp103 = call float @llvm.r600.dot4(<4 x float> %tmp98, <4 x float> %tmp102)
-  %tmp104 = insertelement <4 x float> undef, float %tmp92, i32 0
+  %tmp104 = insertelement <4 x float> poison, float %tmp92, i32 0
   %tmp105 = insertelement <4 x float> %tmp104, float %tmp93, i32 1
   %tmp106 = insertelement <4 x float> %tmp105, float %tmp94, i32 2
   %tmp107 = insertelement <4 x float> %tmp106, float 0.000000e+00, i32 3
-  %tmp108 = insertelement <4 x float> undef, float %tmp40, i32 0
+  %tmp108 = insertelement <4 x float> poison, float %tmp40, i32 0
   %tmp109 = insertelement <4 x float> %tmp108, float %tmp41, i32 1
   %tmp110 = insertelement <4 x float> %tmp109, float %tmp42, i32 2
   %tmp111 = insertelement <4 x float> %tmp110, float 0.000000e+00, i32 3
@@ -124,11 +124,11 @@ IF137:                                            ; preds = %main_body
   %tmp113 = fsub float -0.000000e+00, %tmp92
   %tmp114 = fsub float -0.000000e+00, %tmp93
   %tmp115 = fsub float -0.000000e+00, %tmp94
-  %tmp116 = insertelement <4 x float> undef, float %tmp34, i32 0
+  %tmp116 = insertelement <4 x float> poison, float %tmp34, i32 0
   %tmp117 = insertelement <4 x float> %tmp116, float %tmp35, i32 1
   %tmp118 = insertelement <4 x float> %tmp117, float %tmp36, i32 2
   %tmp119 = insertelement <4 x float> %tmp118, float 0.000000e+00, i32 3
-  %tmp120 = insertelement <4 x float> undef, float %tmp113, i32 0
+  %tmp120 = insertelement <4 x float> poison, float %tmp113, i32 0
   %tmp121 = insertelement <4 x float> %tmp120, float %tmp114, i32 1
   %tmp122 = insertelement <4 x float> %tmp121, float %tmp115, i32 2
   %tmp123 = insertelement <4 x float> %tmp122, float 0.000000e+00, i32 3
@@ -155,7 +155,7 @@ ENDIF136:                                         ; preds = %ENDIF154, %main_bod
   %tmp138 = fmul float %tmp26, 0x3F847AE140000000
   %tmp139 = fmul float %tmp27, 0x3F847AE140000000
   %tmp140 = fmul float %tmp28, 0x3F847AE140000000
-  %tmp141 = insertelement <4 x float> undef, float %tmp138, i32 0
+  %tmp141 = insertelement <4 x float> poison, float %tmp138, i32 0
   %tmp142 = insertelement <4 x float> %tmp141, float %tmp139, i32 1
   %tmp143 = insertelement <4 x float> %tmp142, float %tmp140, i32 2
   %tmp144 = insertelement <4 x float> %tmp143, float 0.000000e+00, i32 3
@@ -163,7 +163,7 @@ ENDIF136:                                         ; preds = %ENDIF154, %main_bod
   %tmp146 = extractelement <4 x float> %tmp144, i32 1
   %tmp147 = extractelement <4 x float> %tmp144, i32 2
   %tmp148 = extractelement <4 x float> %tmp144, i32 3
-  %tmp149 = insertelement <4 x float> undef, float %tmp145, i32 0
+  %tmp149 = insertelement <4 x float> poison, float %tmp145, i32 0
   %tmp150 = insertelement <4 x float> %tmp149, float %tmp146, i32 1
   %tmp151 = insertelement <4 x float> %tmp150, float %tmp147, i32 2
   %tmp152 = insertelement <4 x float> %tmp151, float %tmp148, i32 3
@@ -176,7 +176,7 @@ ENDIF136:                                         ; preds = %ENDIF154, %main_bod
   %tmp159 = fmul float %tmp26, 0x3F45A07B40000000
   %tmp160 = fmul float %tmp27, 0x3F45A07B40000000
   %tmp161 = fmul float %tmp28, 0x3F45A07B40000000
-  %tmp162 = insertelement <4 x float> undef, float %tmp159, i32 0
+  %tmp162 = insertelement <4 x float> poison, float %tmp159, i32 0
   %tmp163 = insertelement <4 x float> %tmp162, float %tmp160, i32 1
   %tmp164 = insertelement <4 x float> %tmp163, float %tmp161, i32 2
   %tmp165 = insertelement <4 x float> %tmp164, float 0.000000e+00, i32 3
@@ -184,7 +184,7 @@ ENDIF136:                                         ; preds = %ENDIF154, %main_bod
   %tmp167 = extractelement <4 x float> %tmp165, i32 1
   %tmp168 = extractelement <4 x float> %tmp165, i32 2
   %tmp169 = extractelement <4 x float> %tmp165, i32 3
-  %tmp170 = insertelement <4 x float> undef, float %tmp166, i32 0
+  %tmp170 = insertelement <4 x float> poison, float %tmp166, i32 0
   %tmp171 = insertelement <4 x float> %tmp170, float %tmp167, i32 1
   %tmp172 = insertelement <4 x float> %tmp171, float %tmp168, i32 2
   %tmp173 = insertelement <4 x float> %tmp172, float %tmp169, i32 3
@@ -251,28 +251,28 @@ ENDIF136:                                         ; preds = %ENDIF154, %main_bod
   %tmp227 = fmul float %clamp.i14, %tmp226
   %tmp228 = fmul float %tmp26, 0x3F368B5CC0000000
   %tmp229 = fmul float %tmp27, 0x3F368B5CC0000000
-  %tmp230 = insertelement <4 x float> undef, float %tmp228, i32 0
+  %tmp230 = insertelement <4 x float> poison, float %tmp228, i32 0
   %tmp231 = insertelement <4 x float> %tmp230, float %tmp229, i32 1
   %tmp232 = insertelement <4 x float> %tmp231, float 0.000000e+00, i32 2
   %tmp233 = insertelement <4 x float> %tmp232, float 0.000000e+00, i32 3
   %tmp234 = extractelement <4 x float> %tmp233, i32 0
   %tmp235 = extractelement <4 x float> %tmp233, i32 1
-  %tmp236 = insertelement <4 x float> undef, float %tmp234, i32 0
+  %tmp236 = insertelement <4 x float> poison, float %tmp234, i32 0
   %tmp237 = insertelement <4 x float> %tmp236, float %tmp235, i32 1
-  %tmp238 = insertelement <4 x float> %tmp237, float undef, i32 2
-  %tmp239 = insertelement <4 x float> %tmp238, float undef, i32 3
+  %tmp238 = insertelement <4 x float> %tmp237, float poison, i32 2
+  %tmp239 = insertelement <4 x float> %tmp238, float poison, i32 3
   %tmp240 = shufflevector <4 x float> %tmp239, <4 x float> %tmp239, <4 x i32> <i32 0, i32 1, i32 2, i32 3>
   %tmp241 = call <4 x float> @llvm.r600.tex(<4 x float> %tmp240, i32 0, i32 0, i32 0, i32 17, i32 1, i32 1, i32 1, i32 1, i32 1)
   %tmp242 = extractelement <4 x float> %tmp241, i32 0
-  %tmp243 = insertelement <4 x float> undef, float %tmp242, i32 0
+  %tmp243 = insertelement <4 x float> poison, float %tmp242, i32 0
   %tmp244 = insertelement <4 x float> %tmp243, float %tmp229, i32 1
   %tmp245 = insertelement <4 x float> %tmp244, float 0.000000e+00, i32 2
   %tmp246 = insertelement <4 x float> %tmp245, float 0.000000e+00, i32 3
   %tmp247 = extractelement <4 x float> %tmp246, i32 0
-  %tmp248 = insertelement <4 x float> undef, float %tmp247, i32 0
-  %tmp249 = insertelement <4 x float> %tmp248, float undef, i32 1
-  %tmp250 = insertelement <4 x float> %tmp249, float undef, i32 2
-  %tmp251 = insertelement <4 x float> %tmp250, float undef, i32 3
+  %tmp248 = insertelement <4 x float> poison, float %tmp247, i32 0
+  %tmp249 = insertelement <4 x float> %tmp248, float poison, i32 1
+  %tmp250 = insertelement <4 x float> %tmp249, float poison, i32 2
+  %tmp251 = insertelement <4 x float> %tmp250, float poison, i32 3
   %tmp252 = shufflevector <4 x float> %tmp251, <4 x float> %tmp251, <4 x i32> <i32 0, i32 1, i32 2, i32 3>
   %tmp253 = call <4 x float> @llvm.r600.tex(<4 x float> %tmp252, i32 0, i32 0, i32 0, i32 18, i32 2, i32 1, i32 1, i32 1, i32 1)
   %tmp254 = extractelement <4 x float> %tmp253, i32 0
@@ -312,16 +312,16 @@ ENDIF136:                                         ; preds = %ENDIF154, %main_bod
   %tmp285 = fmul float %clamp.i8, %tmp284
   %tmp286 = fmul float %tmp26, 0x3F22DFD6A0000000
   %tmp287 = fmul float %tmp27, 0x3F22DFD6A0000000
-  %tmp288 = insertelement <4 x float> undef, float %tmp286, i32 0
+  %tmp288 = insertelement <4 x float> poison, float %tmp286, i32 0
   %tmp289 = insertelement <4 x float> %tmp288, float %tmp287, i32 1
   %tmp290 = insertelement <4 x float> %tmp289, float 0.000000e+00, i32 2
   %tmp291 = insertelement <4 x float> %tmp290, float 0.000000e+00, i32 3
   %tmp292 = extractelement <4 x float> %tmp291, i32 0
   %tmp293 = extractelement <4 x float> %tmp291, i32 1
-  %tmp294 = insertelement <4 x float> undef, float %tmp292, i32 0
+  %tmp294 = insertelement <4 x float> poison, float %tmp292, i32 0
   %tmp295 = insertelement <4 x float> %tmp294, float %tmp293, i32 1
-  %tmp296 = insertelement <4 x float> %tmp295, float undef, i32 2
-  %tmp297 = insertelement <4 x float> %tmp296, float undef, i32 3
+  %tmp296 = insertelement <4 x float> %tmp295, float poison, i32 2
+  %tmp297 = insertelement <4 x float> %tmp296, float poison, i32 3
   %tmp298 = shufflevector <4 x float> %tmp297, <4 x float> %tmp297, <4 x i32> <i32 0, i32 1, i32 2, i32 3>
   %tmp299 = call <4 x float> @llvm.r600.tex(<4 x float> %tmp298, i32 0, i32 0, i32 0, i32 19, i32 3, i32 1, i32 1, i32 1, i32 1)
   %tmp300 = extractelement <4 x float> %tmp299, i32 0
@@ -347,11 +347,11 @@ ENDIF136:                                         ; preds = %ENDIF154, %main_bod
   %tmp320 = fadd float %tmp319, %tmp314
   %tmp321 = fmul float %temp70.0, %tmp36
   %tmp322 = fadd float %tmp321, %tmp316
-  %tmp323 = insertelement <4 x float> undef, float %tmp318, i32 0
+  %tmp323 = insertelement <4 x float> poison, float %tmp318, i32 0
   %tmp324 = insertelement <4 x float> %tmp323, float %tmp320, i32 1
   %tmp325 = insertelement <4 x float> %tmp324, float %tmp322, i32 2
   %tmp326 = insertelement <4 x float> %tmp325, float 0.000000e+00, i32 3
-  %tmp327 = insertelement <4 x float> undef, float %tmp318, i32 0
+  %tmp327 = insertelement <4 x float> poison, float %tmp318, i32 0
   %tmp328 = insertelement <4 x float> %tmp327, float %tmp320, i32 1
   %tmp329 = insertelement <4 x float> %tmp328, float %tmp322, i32 2
   %tmp330 = insertelement <4 x float> %tmp329, float 0.000000e+00, i32 3
@@ -380,11 +380,11 @@ ENDIF136:                                         ; preds = %ENDIF154, %main_bod
   %tmp353 = fsub float -0.000000e+00, %result.i
   %tmp354 = fsub float -0.000000e+00, %tmp347
   %tmp355 = fadd float %tmp353, %tmp354
-  %tmp356 = insertelement <4 x float> undef, float %tmp43, i32 0
+  %tmp356 = insertelement <4 x float> poison, float %tmp43, i32 0
   %tmp357 = insertelement <4 x float> %tmp356, float %tmp44, i32 1
   %tmp358 = insertelement <4 x float> %tmp357, float %tmp45, i32 2
   %tmp359 = insertelement <4 x float> %tmp358, float 0.000000e+00, i32 3
-  %tmp360 = insertelement <4 x float> undef, float %tmp43, i32 0
+  %tmp360 = insertelement <4 x float> poison, float %tmp43, i32 0
   %tmp361 = insertelement <4 x float> %tmp360, float %tmp44, i32 1
   %tmp362 = insertelement <4 x float> %tmp361, float %tmp45, i32 2
   %tmp363 = insertelement <4 x float> %tmp362, float 0.000000e+00, i32 3
@@ -407,11 +407,11 @@ ENDIF136:                                         ; preds = %ENDIF154, %main_bod
   %tmp379 = fsub float -0.000000e+00, %result.i
   %tmp380 = fsub float -0.000000e+00, %tmp347
   %tmp381 = fadd float %tmp379, %tmp380
-  %tmp382 = insertelement <4 x float> undef, float %tmp43, i32 0
+  %tmp382 = insertelement <4 x float> poison, float %tmp43, i32 0
   %tmp383 = insertelement <4 x float> %tmp382, float %tmp44, i32 1
   %tmp384 = insertelement <4 x float> %tmp383, float %tmp45, i32 2
   %tmp385 = insertelement <4 x float> %tmp384, float 0.000000e+00, i32 3
-  %tmp386 = insertelement <4 x float> undef, float %tmp43, i32 0
+  %tmp386 = insertelement <4 x float> poison, float %tmp43, i32 0
   %tmp387 = insertelement <4 x float> %tmp386, float %tmp44, i32 1
   %tmp388 = insertelement <4 x float> %tmp387, float %tmp45, i32 2
   %tmp389 = insertelement <4 x float> %tmp388, float 0.000000e+00, i32 3
@@ -492,16 +492,16 @@ IF140:                                            ; preds = %LOOP
   %tmp422 = fadd float %tmp421, %tmp22
   %tmp423 = fmul float %tmp130, %temp92.0
   %tmp424 = fadd float %tmp423, %tmp23
-  %tmp425 = insertelement <4 x float> undef, float %tmp422, i32 0
+  %tmp425 = insertelement <4 x float> poison, float %tmp422, i32 0
   %tmp426 = insertelement <4 x float> %tmp425, float %tmp424, i32 1
   %tmp427 = insertelement <4 x float> %tmp426, float 0.000000e+00, i32 2
   %tmp428 = insertelement <4 x float> %tmp427, float 0.000000e+00, i32 3
   %tmp429 = extractelement <4 x float> %tmp428, i32 0
   %tmp430 = extractelement <4 x float> %tmp428, i32 1
-  %tmp431 = insertelement <4 x float> undef, float %tmp429, i32 0
+  %tmp431 = insertelement <4 x float> poison, float %tmp429, i32 0
   %tmp432 = insertelement <4 x float> %tmp431, float %tmp430, i32 1
-  %tmp433 = insertelement <4 x float> %tmp432, float undef, i32 2
-  %tmp434 = insertelement <4 x float> %tmp433, float undef, i32 3
+  %tmp433 = insertelement <4 x float> %tmp432, float poison, i32 2
+  %tmp434 = insertelement <4 x float> %tmp433, float poison, i32 3
   %tmp435 = shufflevector <4 x float> %tmp434, <4 x float> %tmp434, <4 x i32> <i32 0, i32 1, i32 2, i32 3>
   %tmp436 = call <4 x float> @llvm.r600.tex(<4 x float> %tmp435, i32 0, i32 0, i32 0, i32 20, i32 4, i32 1, i32 1, i32 1, i32 1)
   %tmp437 = extractelement <4 x float> %tmp436, i32 3
@@ -518,16 +518,16 @@ ENDIF139:                                         ; preds = %LOOP
   %tmp445 = fadd float %tmp444, %tmp22
   %tmp446 = fmul float %tmp130, %tmp443
   %tmp447 = fadd float %tmp446, %tmp23
-  %tmp448 = insertelement <4 x float> undef, float %tmp445, i32 0
+  %tmp448 = insertelement <4 x float> poison, float %tmp445, i32 0
   %tmp449 = insertelement <4 x float> %tmp448, float %tmp447, i32 1
   %tmp450 = insertelement <4 x float> %tmp449, float 0.000000e+00, i32 2
   %tmp451 = insertelement <4 x float> %tmp450, float 0.000000e+00, i32 3
   %tmp452 = extractelement <4 x float> %tmp451, i32 0
   %tmp453 = extractelement <4 x float> %tmp451, i32 1
-  %tmp454 = insertelement <4 x float> undef, float %tmp452, i32 0
+  %tmp454 = insertelement <4 x float> poison, float %tmp452, i32 0
   %tmp455 = insertelement <4 x float> %tmp454, float %tmp453, i32 1
-  %tmp456 = insertelement <4 x float> %tmp455, float undef, i32 2
-  %tmp4...
[truncated]

``````````

</details>


https://github.com/llvm/llvm-project/pull/130896