[PATCH] D49720: [ARM] Fix over-alignment in arguments that are HA of 128-bit vectors

Mon Jul 30 01:49:53 PDT 2018

This revision was automatically updated to reflect the committed changes.
Closed by commit rL338233: [ARM] Fix over-alignment in arguments that are HA of 128-bit vectors (authored by petr.pavlu).

Changed prior to commit:
  https://reviews.llvm.org/D49720?vs=157430&id=157928#toc

Repository:
  rL LLVM

https://reviews.llvm.org/D49720

Files:
  llvm/trunk/lib/Target/ARM/ARMCallingConv.h
  llvm/trunk/test/CodeGen/ARM/aggregate-padding.ll


Index: llvm/trunk/lib/Target/ARM/ARMCallingConv.h
===================================================================

--- llvm/trunk/lib/Target/ARM/ARMCallingConv.h
+++ llvm/trunk/lib/Target/ARM/ARMCallingConv.h
@@ -269,14 +269,15 @@
   for (auto Reg : RegList)
     State.AllocateReg(Reg);
 
+  // After the first item has been allocated, the rest are packed as tightly as
+  // possible. (E.g. an incoming i64 would have starting Align of 8, but we'll
+  // be allocating a bunch of i32 slots).
+  unsigned RestAlign = std::min(Align, Size);
+
   for (auto &It : PendingMembers) {
     It.convertToMem(State.AllocateStack(Size, Align));
     State.addLoc(It);
-
-    // After the first item has been allocated, the rest are packed as tightly
-    // as possible. (E.g. an incoming i64 would have starting Align of 8, but
-    // we'll be allocating a bunch of i32 slots).
-    Align = Size;
+    Align = RestAlign;
   }
 
   // All pending members have now been allocated
Index: llvm/trunk/test/CodeGen/ARM/aggregate-padding.ll
===================================================================
--- llvm/trunk/test/CodeGen/ARM/aggregate-padding.ll
+++ llvm/trunk/test/CodeGen/ARM/aggregate-padding.ll
@@ -99,3 +99,19 @@
   %sum = add i16 %val0, %val2
   ret i16 %sum
 }
+
+; [2 x <4 x i32>] should be aligned only on a 64-bit boundary and contiguous.
+; Neither <4 x i32> element should introduce any padding to 128 bits.
+define i32 @test_4xi32_64bit_aligned_and_contiguous([8 x double], float, [2 x <4 x i32>] %arg) nounwind {
+; CHECK-LABEL: test_4xi32_64bit_aligned_and_contiguous:
+; CHECK-DAG: ldr [[VAL0_0:r[0-9]+]], [sp, #8]
+; CHECK-DAG: ldr [[VAL1_0:r[0-9]+]], [sp, #24]
+; CHECK: add r0, [[VAL0_0]], [[VAL1_0]]
+
+  %val0 = extractvalue [2 x <4 x i32>] %arg, 0
+  %val0_0 = extractelement <4 x i32> %val0, i32 0
+  %val1 = extractvalue [2 x <4 x i32>] %arg, 1
+  %val1_0 = extractelement <4 x i32> %val1, i32 0
+  %sum = add i32 %val0_0, %val1_0
+  ret i32 %sum
+}


-------------- next part --------------
A non-text attachment was scrubbed...
Name: D49720.157928.patch
Type: text/x-patch
Size: 1988 bytes
Desc: not available
URL: <http://lists.llvm.org/pipermail/llvm-commits/attachments/20180730/83e41c91/attachment.bin>