[llvm] [X86] Generate `kmov` for masking integers (PR #120593)
Abhishek Kaushik via llvm-commits
llvm-commits at lists.llvm.org
Tue Feb 4 23:13:19 PST 2025
abhishek-kaushik22 wrote:
> @abhishek-kaushik22 Can you confirm if this will fix #72803 please?
Yes, for
```llvm
define void @example(ptr noalias nocapture noundef writeonly sret([8 x i32]) align 4 dereferenceable(32) %_0, ptr noalias nocapture noundef readonly align 4 dereferenceable(32) %a, i64 noundef %m, ptr noalias nocapture noundef readonly align 4 dereferenceable(32) %b) {
start:
%0 = insertelement <8 x i64> poison, i64 %m, i64 0
%1 = shufflevector <8 x i64> %0, <8 x i64> poison, <8 x i32> zeroinitializer
%2 = and <8 x i64> %1, <i64 1, i64 2, i64 4, i64 8, i64 16, i64 32, i64 64, i64 128>
%3 = icmp eq <8 x i64> %2, zeroinitializer
%4 = load <8 x i32>, ptr %b, align 4
%5 = select <8 x i1> %3, <8 x i32> zeroinitializer, <8 x i32> %4
%6 = load <8 x i32>, ptr %a, align 4
%7 = add <8 x i32> %6, %5
store <8 x i32> %7, ptr %_0, align 4
ret void
}
```
this generates
```asm
movq %rdi, %rax
kmovd %edx, %k1
vmovdqu (%rsi), %ymm0
vpaddd (%rcx), %ymm0, %ymm0 {%k1}
vmovdqu %ymm0, (%rdi)
vzeroupper
retq
```
https://github.com/llvm/llvm-project/pull/120593
More information about the llvm-commits
mailing list