[llvm] [MachinePipeliner] Fix loop-carried dependencies analysis (PR #121907)

Ikhlas Ajbar via llvm-commits llvm-commits at lists.llvm.org
Tue Feb 25 10:23:58 PST 2025


iajbar wrote:

@kasuga-fj, please find the testcase.ll bellow.  With this patch, only one loop is pipelined. Thank you.
target triple = "hexagon"

define void @IntegratePerRow(i32 %width, ptr %0, ptr %1) {
entry:
  br label %for.body

for.body:                                         ; preds = %for.body, %entry
  %sIntg3.036 = phi <32 x i32> [ zeroinitializer, %entry ], [ %4, %for.body ]
  %niter = phi i32 [ 0, %entry ], [ %niter.next.1, %for.body ]
  %2 = tail call <32 x i32> @llvm.hexagon.V6.vrdelta.128B(<32 x i32> %sIntg3.036, <32 x i32> zeroinitializer)
  %3 = tail call <32 x i32> @llvm.hexagon.V6.vaddw.128B(<32 x i32> %2, <32 x i32> zeroinitializer)
  %4 = tail call <32 x i32> @llvm.hexagon.V6.vaddw.128B(<32 x i32> %3, <32 x i32> zeroinitializer)
  store <32 x i32> %4, ptr %0, align 128
  store <32 x i32> zeroinitializer, ptr %1, align 128
  %niter.next.1 = add i32 %niter, 1
  %niter.ncmp.1.not = icmp eq i32 %niter, %width
  br i1 %niter.ncmp.1.not, label %for.end.loopexit.unr-lcssa, label %for.body

for.end.loopexit.unr-lcssa:                       ; preds = %for.body
  ret void
}

; Function Attrs: nocallback nofree nosync nounwind willreturn memory(none)
declare <64 x i32> @llvm.hexagon.V6.vshuffvdd.128B(<32 x i32>, <32 x i32>, i32) #0

; Function Attrs: nocallback nofree nosync nounwind willreturn memory(none)
declare <32 x i32> @llvm.hexagon.V6.vrdelta.128B(<32 x i32>, <32 x i32>) #0

; Function Attrs: nocallback nofree nosync nounwind willreturn memory(none)
declare <32 x i32> @llvm.hexagon.V6.hi.128B(<64 x i32>) #0

; Function Attrs: nocallback nofree nosync nounwind willreturn memory(none)
declare <32 x i32> @llvm.hexagon.V6.vaddw.128B(<32 x i32>, <32 x i32>) #0

define void @IntegrateImage(ptr %src, i32 %srcWidth, ptr %dst) {
entry:
  br label %for.body.i

for.body.i:                                       ; preds = %for.body.i, %entry
  %pIn.038.i = phi ptr [ null, %entry ], [ %incdec.ptr.i.1, %for.body.i ]
  %niter = phi i32 [ 0, %entry ], [ %niter.next.1, %for.body.i ]
  %0 = load <32 x i32>, ptr %pIn.038.i, align 128, !noalias !0
  %1 = tail call <64 x i32> @llvm.hexagon.V6.vshuffvdd.128B(<32 x i32> zeroinitializer, <32 x i32> %0, i32 0)
  %2 = tail call <32 x i32> @llvm.hexagon.V6.hi.128B(<64 x i32> %1)
  store <32 x i32> zeroinitializer, ptr %src, align 128, !alias.scope !0
  store <32 x i32> %2, ptr %dst, align 128, !alias.scope !0
  %incdec.ptr.i.1 = getelementptr i8, ptr %pIn.038.i, i32 256
  %niter.next.1 = add i32 %niter, 1
  %niter.ncmp.1.not = icmp eq i32 %niter, %srcWidth
  br i1 %niter.ncmp.1.not, label %IntegratePerRow.exit.loopexit.unr-lcssa, label %for.body.i

IntegratePerRow.exit.loopexit.unr-lcssa:          ; preds = %for.body.i
  ret void
}
uselistorder ptr @llvm.hexagon.V6.vaddw.128B, { 1, 0 }

attributes #0 = { nocallback nofree nosync nounwind willreturn memory(none) }
!0 = !{!1}
!1 = distinct !{!1, !2, !"IntegratePerRow: %dst"}
!2 = distinct !{!2, !"IntegratePerRow"}


https://github.com/llvm/llvm-project/pull/121907


More information about the llvm-commits mailing list