[llvm] a88f4f1 - AMDGPU: Fix a test typo reading a partially undefined vector
Matt Arsenault via llvm-commits
llvm-commits at lists.llvm.org
Thu Feb 27 05:17:54 PST 2025
Author: Matt Arsenault
Date: 2025-02-27T20:17:20+07:00
New Revision: a88f4f1962b47aa8db49b8687a7f8b9097a3d13b
URL: https://github.com/llvm/llvm-project/commit/a88f4f1962b47aa8db49b8687a7f8b9097a3d13b
DIFF: https://github.com/llvm/llvm-project/commit/a88f4f1962b47aa8db49b8687a7f8b9097a3d13b.diff
LOG: AMDGPU: Fix a test typo reading a partially undefined vector
This avoids a surprising test diff in a future commit that
happens to change which registers are read: the bitcast was reading
%tmp0, whose second element is never defined, instead of %tmp1.
Also migrate from undef to poison.
Added:
Modified:
llvm/test/CodeGen/AMDGPU/acc-ldst.ll
Removed:
################################################################################
diff --git a/llvm/test/CodeGen/AMDGPU/acc-ldst.ll b/llvm/test/CodeGen/AMDGPU/acc-ldst.ll
index be4d6a2c27895..5c484e1e52da8 100644
--- a/llvm/test/CodeGen/AMDGPU/acc-ldst.ll
+++ b/llvm/test/CodeGen/AMDGPU/acc-ldst.ll
@@ -204,7 +204,7 @@ bb:
%tid = call i32 @llvm.amdgcn.workitem.id.x()
%gep = getelementptr inbounds i32, ptr addrspace(1) %arg, i32 %tid
%in.1 = atomicrmw volatile sub ptr addrspace(1) %gep, i32 1 syncscope("agent") seq_cst
- %tmp0 = insertelement <4 x i32> undef, i32 %in.1, i32 0
+ %tmp0 = insertelement <4 x i32> poison, i32 %in.1, i32 0
%tmp1 = insertelement <4 x i32> %tmp0, i32 0, i32 1
%tmp2 = insertelement <4 x i32> %tmp1, i32 0, i32 2
%tmp3 = insertelement <4 x i32> %tmp2, i32 0, i32 3
@@ -227,13 +227,13 @@ bb:
%tid = call i32 @llvm.amdgcn.workitem.id.x()
%gep = getelementptr inbounds i64, ptr addrspace(1) %arg, i32 %tid
%in.1 = atomicrmw volatile sub ptr addrspace(1) %gep, i64 1 syncscope("agent") seq_cst
- %tmp0 = insertelement <2 x i64> undef, i64 %in.1, i32 0
+ %tmp0 = insertelement <2 x i64> poison, i64 %in.1, i32 0
%tmp1 = insertelement <2 x i64> %tmp0, i64 0, i32 1
- %tmp2 = bitcast <2 x i64> %tmp0 to <4 x i32>
+ %tmp2 = bitcast <2 x i64> %tmp1 to <4 x i32>
%mai.1 = tail call <4 x i32> @llvm.amdgcn.mfma.i32.4x4x4i8(i32 1, i32 2, <4 x i32> %tmp2, i32 0, i32 0, i32 0)
%elt.1 = extractelement <4 x i32> %mai.1, i32 0
%elt.2 = extractelement <4 x i32> %mai.1, i32 1
- %v2.1 = insertelement <2 x i32> undef, i32 %elt.1, i32 0
+ %v2.1 = insertelement <2 x i32> poison, i32 %elt.1, i32 0
%v2.2 = insertelement <2 x i32> %v2.1, i32 %elt.2, i32 1
%v2 = bitcast <2 x i32> %v2.2 to i64
%val = atomicrmw volatile add ptr addrspace(1) %gep, i64 %v2 syncscope("agent") seq_cst
More information about the llvm-commits mailing list